{"train_loss": 1.4540659189224243, "global_step": 0, "epoch": 0} {"train_loss": 1.4467453956604004, "global_step": 1, "epoch": 0} {"train_loss": 1.5013054609298706, "global_step": 2, "epoch": 0} {"train_loss": 1.438310146331787, "global_step": 3, "epoch": 0} {"train_loss": 1.472869873046875, "global_step": 4, "epoch": 0} {"train_loss": 1.4412144422531128, "global_step": 5, "epoch": 0} {"train_loss": 1.4227914810180664, "global_step": 6, "epoch": 0} {"train_loss": 1.4502081871032715, "global_step": 7, "epoch": 0} {"train_loss": 1.4349720478057861, "global_step": 8, "epoch": 0} {"train_loss": 1.4494154453277588, "global_step": 9, "epoch": 0} {"train_loss": 1.446377158164978, "global_step": 10, "epoch": 0} {"train_loss": 1.4226880073547363, "global_step": 11, "epoch": 0} {"train_loss": 1.4226690530776978, "global_step": 12, "epoch": 0} {"train_loss": 1.4105441570281982, "global_step": 13, "epoch": 0} {"train_loss": 1.4267042875289917, "global_step": 14, "epoch": 0} {"train_loss": 1.3882628679275513, "global_step": 15, "epoch": 0} {"train_loss": 1.4031932353973389, "global_step": 16, "epoch": 0} {"train_loss": 1.4084110260009766, "global_step": 17, "epoch": 0} {"train_loss": 1.3916505575180054, "global_step": 18, "epoch": 0} {"train_loss": 1.417123556137085, "global_step": 19, "epoch": 0} {"train_loss": 1.3585381507873535, "global_step": 20, "epoch": 0} {"train_loss": 1.3431410789489746, "global_step": 21, "epoch": 0} {"train_loss": 1.3792901039123535, "global_step": 22, "epoch": 0} {"train_loss": 1.3673138618469238, "global_step": 23, "epoch": 0} {"train_loss": 1.3355035781860352, "global_step": 24, "epoch": 0} {"train_loss": 1.3362408876419067, "global_step": 25, "epoch": 0} {"train_loss": 1.3193485736846924, "global_step": 26, "epoch": 0} {"train_loss": 1.2880157232284546, "global_step": 27, "epoch": 0} {"train_loss": 1.2977629899978638, "global_step": 28, "epoch": 0} {"train_loss": 1.2705628871917725, "global_step": 29, "epoch": 0} {"train_loss": 1.2666881084442139, "global_step": 30, "epoch": 0} {"train_loss": 1.2558231353759766, "global_step": 31, "epoch": 0} {"train_loss": 1.2338998317718506, "global_step": 32, "epoch": 0} {"train_loss": 1.2172449827194214, "global_step": 33, "epoch": 0} {"train_loss": 1.221379280090332, "global_step": 34, "epoch": 0} {"train_loss": 1.1715869903564453, "global_step": 35, "epoch": 0} {"train_loss": 1.169663429260254, "global_step": 36, "epoch": 0} {"train_loss": 1.1294398307800293, "global_step": 37, "epoch": 0} {"train_loss": 1.139783263206482, "global_step": 38, "epoch": 0} {"train_loss": 1.0796573162078857, "global_step": 39, "epoch": 0} {"train_loss": 1.0956391096115112, "global_step": 40, "epoch": 0} {"train_loss": 1.3328796312922524, "global_step": 41, "epoch": 0, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.030704983161909942, "train/sim_max_reward_3": 0.12103990487797428, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.5982473441418509, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.0, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.27937153809368176, "test/sim_max_reward_4300004": 0.38877855626331503, "test/sim_max_reward_4300005": 0.23907313396036559, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.045127646075307386, "test/sim_max_reward_4300008": 0.0, "test/sim_max_reward_4300009": 0.007743177188927948, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.43237485407073917, "test/sim_max_reward_4300012": 0.2102399034002108, "test/sim_max_reward_4300013": 0.3223185640591602, "test/sim_max_reward_4300014": 0.09774428935694213, "test/sim_max_reward_4300015": 0.2396881801166403, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.012342010202988205, "test/sim_max_reward_4300018": 0.17074369940582684, "test/sim_max_reward_4300019": 0.1874757479944171, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.18713933905621868, "test/sim_max_reward_4300022": 0.35959116471295516, "test/sim_max_reward_4300023": 0.20575297892733313, "test/sim_max_reward_4300024": 0.0, "test/sim_max_reward_4300025": 0.08847875242732427, "test/sim_max_reward_4300026": 0.050878423390650566, "test/sim_max_reward_4300027": 0.0, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.0, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.2603000335592396, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.2067489459302592, "test/sim_max_reward_4300037": 0.5527122599440878, "test/sim_max_reward_4300038": 0.0, "test/sim_max_reward_4300039": 0.0, "test/sim_max_reward_4300040": 0.09105749141191678, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.2736347319128165, "test/sim_max_reward_4300043": 0.01912165197990456, "test/sim_max_reward_4300044": 0.04345707006804553, "test/sim_max_reward_4300045": 0.0, "test/sim_max_reward_4300046": 0.0, "test/sim_max_reward_4300047": 0.45016269539689346, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.1584114195967193, "test/mean_score": 0.11561351039094114, "val_loss": 11232949.0} {"train_loss": 1.0208582878112793, "global_step": 42, "epoch": 1} {"train_loss": 1.015068769454956, "global_step": 43, "epoch": 1} {"train_loss": 0.9827287793159485, "global_step": 44, "epoch": 1} {"train_loss": 0.9678745269775391, "global_step": 45, "epoch": 1} {"train_loss": 0.9203119874000549, "global_step": 46, "epoch": 1} {"train_loss": 0.8939889669418335, "global_step": 47, "epoch": 1} {"train_loss": 0.8535091280937195, "global_step": 48, "epoch": 1} {"train_loss": 0.849371075630188, "global_step": 49, "epoch": 1} {"train_loss": 0.8297841548919678, "global_step": 50, "epoch": 1} {"train_loss": 0.8643181324005127, "global_step": 51, "epoch": 1} {"train_loss": 0.8258622288703918, "global_step": 52, "epoch": 1} {"train_loss": 0.814349889755249, "global_step": 53, "epoch": 1} {"train_loss": 0.7348862886428833, "global_step": 54, "epoch": 1} {"train_loss": 0.7174451351165771, "global_step": 55, "epoch": 1} {"train_loss": 0.6819474697113037, "global_step": 56, "epoch": 1} {"train_loss": 0.7075159549713135, "global_step": 57, "epoch": 1} {"train_loss": 0.6666371822357178, "global_step": 58, "epoch": 1} {"train_loss": 0.6624457836151123, "global_step": 59, "epoch": 1} {"train_loss": 0.5757495164871216, "global_step": 60, "epoch": 1} {"train_loss": 0.543035626411438, "global_step": 61, "epoch": 1} {"train_loss": 0.5862610340118408, "global_step": 62, "epoch": 1} {"train_loss": 0.5269531607627869, "global_step": 63, "epoch": 1} {"train_loss": 0.5057094097137451, "global_step": 64, "epoch": 1} {"train_loss": 0.4860968589782715, "global_step": 65, "epoch": 1} {"train_loss": 0.42014795541763306, "global_step": 66, "epoch": 1} {"train_loss": 0.47680604457855225, "global_step": 67, "epoch": 1} {"train_loss": 0.4607170820236206, "global_step": 68, "epoch": 1} {"train_loss": 0.40944045782089233, "global_step": 69, "epoch": 1} {"train_loss": 0.398501992225647, "global_step": 70, "epoch": 1} {"train_loss": 0.40619656443595886, "global_step": 71, "epoch": 1} {"train_loss": 0.3920794427394867, "global_step": 72, "epoch": 1} {"train_loss": 0.35808730125427246, "global_step": 73, "epoch": 1} {"train_loss": 0.33238035440444946, "global_step": 74, "epoch": 1} {"train_loss": 0.36293619871139526, "global_step": 75, "epoch": 1} {"train_loss": 0.4291444420814514, "global_step": 76, "epoch": 1} {"train_loss": 0.3553174138069153, "global_step": 77, "epoch": 1} {"train_loss": 0.3719518482685089, "global_step": 78, "epoch": 1} {"train_loss": 0.30507010221481323, "global_step": 79, "epoch": 1} {"train_loss": 0.23480874300003052, "global_step": 80, "epoch": 1} {"train_loss": 0.33622118830680847, "global_step": 81, "epoch": 1} {"train_loss": 0.3048571050167084, "global_step": 82, "epoch": 1} {"train_loss": 0.5918673404625484, "global_step": 83, "epoch": 1, "val_loss": 5938927.0} {"train_loss": 0.22306157648563385, "global_step": 84, "epoch": 2} {"train_loss": 0.28714120388031006, "global_step": 85, "epoch": 2} {"train_loss": 0.25468116998672485, "global_step": 86, "epoch": 2} {"train_loss": 0.25405460596084595, "global_step": 87, "epoch": 2} {"train_loss": 0.280617892742157, "global_step": 88, "epoch": 2} {"train_loss": 0.2113836109638214, "global_step": 89, "epoch": 2} {"train_loss": 0.22265221178531647, "global_step": 90, "epoch": 2} {"train_loss": 0.19046813249588013, "global_step": 91, "epoch": 2} {"train_loss": 0.3090999126434326, "global_step": 92, "epoch": 2} {"train_loss": 0.1845555603504181, "global_step": 93, "epoch": 2} {"train_loss": 0.16842074692249298, "global_step": 94, "epoch": 2} {"train_loss": 0.2336711585521698, "global_step": 95, "epoch": 2} {"train_loss": 0.12927387654781342, "global_step": 96, "epoch": 2} {"train_loss": 0.15663652122020721, "global_step": 97, "epoch": 2} {"train_loss": 0.09308917820453644, "global_step": 98, "epoch": 2} {"train_loss": 0.07111652195453644, "global_step": 99, "epoch": 2} {"train_loss": 0.06545024365186691, "global_step": 100, "epoch": 2} {"train_loss": 0.17648255825042725, "global_step": 101, "epoch": 2} {"train_loss": 0.035631246864795685, "global_step": 102, "epoch": 2} {"train_loss": -0.01318657398223877, "global_step": 103, "epoch": 2} {"train_loss": 0.006441272795200348, "global_step": 104, "epoch": 2} {"train_loss": 0.061115656048059464, "global_step": 105, "epoch": 2} {"train_loss": 0.06397709995508194, "global_step": 106, "epoch": 2} {"train_loss": 0.09266793727874756, "global_step": 107, "epoch": 2} {"train_loss": 0.01328933984041214, "global_step": 108, "epoch": 2} {"train_loss": 0.06658939272165298, "global_step": 109, "epoch": 2} {"train_loss": 0.07439127564430237, "global_step": 110, "epoch": 2} {"train_loss": 0.03880520164966583, "global_step": 111, "epoch": 2} {"train_loss": 0.012480254285037518, "global_step": 112, "epoch": 2} {"train_loss": 0.0709834173321724, "global_step": 113, "epoch": 2} {"train_loss": 0.0031457431614398956, "global_step": 114, "epoch": 2} {"train_loss": -0.002028554677963257, "global_step": 115, "epoch": 2} {"train_loss": 0.0059441253542900085, "global_step": 116, "epoch": 2} {"train_loss": 0.005574056878685951, "global_step": 117, "epoch": 2} {"train_loss": 0.01677727699279785, "global_step": 118, "epoch": 2} {"train_loss": -0.13312464952468872, "global_step": 119, "epoch": 2} {"train_loss": -0.09426446259021759, "global_step": 120, "epoch": 2} {"train_loss": -0.10077901184558868, "global_step": 121, "epoch": 2} {"train_loss": -0.07904971390962601, "global_step": 122, "epoch": 2} {"train_loss": -0.14626061916351318, "global_step": 123, "epoch": 2} {"train_loss": -0.12131902575492859, "global_step": 124, "epoch": 2} {"train_loss": 0.07767133248437728, "global_step": 125, "epoch": 2, "val_loss": 4815260.0} {"train_loss": -0.10519064962863922, "global_step": 126, "epoch": 3} {"train_loss": -0.08981063216924667, "global_step": 127, "epoch": 3} {"train_loss": -0.1813444197177887, "global_step": 128, "epoch": 3} {"train_loss": -0.15331345796585083, "global_step": 129, "epoch": 3} {"train_loss": -0.1684861034154892, "global_step": 130, "epoch": 3} {"train_loss": -0.1494218409061432, "global_step": 131, "epoch": 3} {"train_loss": -0.2122676819562912, "global_step": 132, "epoch": 3} {"train_loss": -0.1420471966266632, "global_step": 133, "epoch": 3} {"train_loss": -0.1610298901796341, "global_step": 134, "epoch": 3} {"train_loss": -0.25715065002441406, "global_step": 135, "epoch": 3} {"train_loss": -0.1929774284362793, "global_step": 136, "epoch": 3} {"train_loss": -0.16662444174289703, "global_step": 137, "epoch": 3} {"train_loss": -0.12424670159816742, "global_step": 138, "epoch": 3} {"train_loss": -0.20516617596149445, "global_step": 139, "epoch": 3} {"train_loss": -0.3039698004722595, "global_step": 140, "epoch": 3} {"train_loss": -0.2842889428138733, "global_step": 141, "epoch": 3} {"train_loss": -0.15718069672584534, "global_step": 142, "epoch": 3} {"train_loss": -0.3200772702693939, "global_step": 143, "epoch": 3} {"train_loss": -0.2188946008682251, "global_step": 144, "epoch": 3} {"train_loss": -0.1792522370815277, "global_step": 145, "epoch": 3} {"train_loss": -0.24467787146568298, "global_step": 146, "epoch": 3} {"train_loss": -0.25486141443252563, "global_step": 147, "epoch": 3} {"train_loss": -0.2823946177959442, "global_step": 148, "epoch": 3} {"train_loss": -0.2732309103012085, "global_step": 149, "epoch": 3} {"train_loss": -0.3746352791786194, "global_step": 150, "epoch": 3} {"train_loss": -0.38104212284088135, "global_step": 151, "epoch": 3} {"train_loss": -0.3348652124404907, "global_step": 152, "epoch": 3} {"train_loss": -0.2951519191265106, "global_step": 153, "epoch": 3} {"train_loss": -0.35190320014953613, "global_step": 154, "epoch": 3} {"train_loss": -0.36508622765541077, "global_step": 155, "epoch": 3} {"train_loss": -0.4201236963272095, "global_step": 156, "epoch": 3} {"train_loss": -0.47223329544067383, "global_step": 157, "epoch": 3} {"train_loss": -0.27746570110321045, "global_step": 158, "epoch": 3} {"train_loss": -0.3210342526435852, "global_step": 159, "epoch": 3} {"train_loss": -0.35707348585128784, "global_step": 160, "epoch": 3} {"train_loss": -0.4061461091041565, "global_step": 161, "epoch": 3} {"train_loss": -0.5174804925918579, "global_step": 162, "epoch": 3} {"train_loss": -0.4136618375778198, "global_step": 163, "epoch": 3} {"train_loss": -0.4389405846595764, "global_step": 164, "epoch": 3} {"train_loss": -0.5324921607971191, "global_step": 165, "epoch": 3} {"train_loss": -0.4302380084991455, "global_step": 166, "epoch": 3} {"train_loss": -0.2842828689941338, "global_step": 167, "epoch": 3, "val_loss": 3853224.5} {"train_loss": -0.5360043048858643, "global_step": 168, "epoch": 4} {"train_loss": -0.4662514328956604, "global_step": 169, "epoch": 4} {"train_loss": -0.5039394497871399, "global_step": 170, "epoch": 4} {"train_loss": -0.43809428811073303, "global_step": 171, "epoch": 4} {"train_loss": -0.5264625549316406, "global_step": 172, "epoch": 4} {"train_loss": -0.44129616022109985, "global_step": 173, "epoch": 4} {"train_loss": -0.4339068830013275, "global_step": 174, "epoch": 4} {"train_loss": -0.46454787254333496, "global_step": 175, "epoch": 4} {"train_loss": -0.49031853675842285, "global_step": 176, "epoch": 4} {"train_loss": -0.5210659503936768, "global_step": 177, "epoch": 4} {"train_loss": -0.5255270004272461, "global_step": 178, "epoch": 4} {"train_loss": -0.5684991478919983, "global_step": 179, "epoch": 4} {"train_loss": -0.5150684118270874, "global_step": 180, "epoch": 4} {"train_loss": -0.5204536318778992, "global_step": 181, "epoch": 4} {"train_loss": -0.607123076915741, "global_step": 182, "epoch": 4} {"train_loss": -0.46359196305274963, "global_step": 183, "epoch": 4} {"train_loss": -0.6431531310081482, "global_step": 184, "epoch": 4} {"train_loss": -0.40077999234199524, "global_step": 185, "epoch": 4} {"train_loss": -0.4919963479042053, "global_step": 186, "epoch": 4} {"train_loss": -0.6038305759429932, "global_step": 187, "epoch": 4} {"train_loss": -0.47980988025665283, "global_step": 188, "epoch": 4} {"train_loss": -0.6136447191238403, "global_step": 189, "epoch": 4} {"train_loss": -0.55631422996521, "global_step": 190, "epoch": 4} {"train_loss": -0.5420609712600708, "global_step": 191, "epoch": 4} {"train_loss": -0.6007013320922852, "global_step": 192, "epoch": 4} {"train_loss": -0.5448952317237854, "global_step": 193, "epoch": 4} {"train_loss": -0.6635226011276245, "global_step": 194, "epoch": 4} {"train_loss": -0.6159459352493286, "global_step": 195, "epoch": 4} {"train_loss": -0.6901183128356934, "global_step": 196, "epoch": 4} {"train_loss": -0.6374943852424622, "global_step": 197, "epoch": 4} {"train_loss": -0.5588765144348145, "global_step": 198, "epoch": 4} {"train_loss": -0.6029942035675049, "global_step": 199, "epoch": 4} {"train_loss": -0.6153543591499329, "global_step": 200, "epoch": 4} {"train_loss": -0.647894561290741, "global_step": 201, "epoch": 4} {"train_loss": -0.7010469436645508, "global_step": 202, "epoch": 4} {"train_loss": -0.613686740398407, "global_step": 203, "epoch": 4} {"train_loss": -0.7155455946922302, "global_step": 204, "epoch": 4} {"train_loss": -0.654948890209198, "global_step": 205, "epoch": 4} {"train_loss": -0.6496022939682007, "global_step": 206, "epoch": 4} {"train_loss": -0.6945359706878662, "global_step": 207, "epoch": 4} {"train_loss": -0.7572752833366394, "global_step": 208, "epoch": 4} {"train_loss": -0.571169546672276, "global_step": 209, "epoch": 4, "val_loss": 3308961.25} {"train_loss": -0.7136316299438477, "global_step": 210, "epoch": 5} {"train_loss": -0.671282947063446, "global_step": 211, "epoch": 5} {"train_loss": -0.7403661012649536, "global_step": 212, "epoch": 5} {"train_loss": -0.7070361375808716, "global_step": 213, "epoch": 5} {"train_loss": -0.7715414762496948, "global_step": 214, "epoch": 5} {"train_loss": -0.7376683950424194, "global_step": 215, "epoch": 5} {"train_loss": -0.6407405138015747, "global_step": 216, "epoch": 5} {"train_loss": -0.849372148513794, "global_step": 217, "epoch": 5} {"train_loss": -0.7007472515106201, "global_step": 218, "epoch": 5} {"train_loss": -0.6487658023834229, "global_step": 219, "epoch": 5} {"train_loss": -0.8206651210784912, "global_step": 220, "epoch": 5} {"train_loss": -0.7927142381668091, "global_step": 221, "epoch": 5} {"train_loss": -0.8031151294708252, "global_step": 222, "epoch": 5} {"train_loss": -0.6937841176986694, "global_step": 223, "epoch": 5} {"train_loss": -0.6992763876914978, "global_step": 224, "epoch": 5} {"train_loss": -0.632790207862854, "global_step": 225, "epoch": 5} {"train_loss": -0.7984310388565063, "global_step": 226, "epoch": 5} {"train_loss": -0.7448620796203613, "global_step": 227, "epoch": 5} {"train_loss": -0.7212517261505127, "global_step": 228, "epoch": 5} {"train_loss": -0.7534048557281494, "global_step": 229, "epoch": 5} {"train_loss": -0.7908241748809814, "global_step": 230, "epoch": 5} {"train_loss": -0.7424228191375732, "global_step": 231, "epoch": 5} {"train_loss": -0.7627503275871277, "global_step": 232, "epoch": 5} {"train_loss": -0.6683834791183472, "global_step": 233, "epoch": 5} {"train_loss": -0.7667509317398071, "global_step": 234, "epoch": 5} {"train_loss": -0.7687947750091553, "global_step": 235, "epoch": 5} {"train_loss": -0.7318363189697266, "global_step": 236, "epoch": 5} {"train_loss": -0.793596088886261, "global_step": 237, "epoch": 5} {"train_loss": -0.794610321521759, "global_step": 238, "epoch": 5} {"train_loss": -0.7707472443580627, "global_step": 239, "epoch": 5} {"train_loss": -0.62339848279953, "global_step": 240, "epoch": 5} {"train_loss": -0.7922433614730835, "global_step": 241, "epoch": 5} {"train_loss": -0.8346412181854248, "global_step": 242, "epoch": 5} {"train_loss": -0.6992638111114502, "global_step": 243, "epoch": 5} {"train_loss": -0.7972555160522461, "global_step": 244, "epoch": 5} {"train_loss": -0.7291396856307983, "global_step": 245, "epoch": 5} {"train_loss": -0.6736106276512146, "global_step": 246, "epoch": 5} {"train_loss": -0.863975465297699, "global_step": 247, "epoch": 5} {"train_loss": -0.836030900478363, "global_step": 248, "epoch": 5} {"train_loss": -0.7345304489135742, "global_step": 249, "epoch": 5} {"train_loss": -0.9274780750274658, "global_step": 250, "epoch": 5} {"train_loss": -0.7514281954084124, "global_step": 251, "epoch": 5, "val_loss": 2878086.75} {"train_loss": -0.8776708841323853, "global_step": 252, "epoch": 6} {"train_loss": -0.7657326459884644, "global_step": 253, "epoch": 6} {"train_loss": -0.8203249573707581, "global_step": 254, "epoch": 6} {"train_loss": -0.871324896812439, "global_step": 255, "epoch": 6} {"train_loss": -0.7214906215667725, "global_step": 256, "epoch": 6} {"train_loss": -0.8425886631011963, "global_step": 257, "epoch": 6} {"train_loss": -0.8298913240432739, "global_step": 258, "epoch": 6} {"train_loss": -0.7082198262214661, "global_step": 259, "epoch": 6} {"train_loss": -0.9047219753265381, "global_step": 260, "epoch": 6} {"train_loss": -0.853540301322937, "global_step": 261, "epoch": 6} {"train_loss": -0.9139492511749268, "global_step": 262, "epoch": 6} {"train_loss": -0.9243578910827637, "global_step": 263, "epoch": 6} {"train_loss": -0.8530220985412598, "global_step": 264, "epoch": 6} {"train_loss": -0.8792333006858826, "global_step": 265, "epoch": 6} {"train_loss": -0.892673671245575, "global_step": 266, "epoch": 6} {"train_loss": -0.9515854716300964, "global_step": 267, "epoch": 6} {"train_loss": -0.8681751489639282, "global_step": 268, "epoch": 6} {"train_loss": -0.9285545349121094, "global_step": 269, "epoch": 6} {"train_loss": -0.9322136640548706, "global_step": 270, "epoch": 6} {"train_loss": -0.9316230416297913, "global_step": 271, "epoch": 6} {"train_loss": -1.060189962387085, "global_step": 272, "epoch": 6} {"train_loss": -0.9967048168182373, "global_step": 273, "epoch": 6} {"train_loss": -0.9121919870376587, "global_step": 274, "epoch": 6} {"train_loss": -1.057435393333435, "global_step": 275, "epoch": 6} {"train_loss": -0.9165706634521484, "global_step": 276, "epoch": 6} {"train_loss": -0.8871102333068848, "global_step": 277, "epoch": 6} {"train_loss": -0.9739199876785278, "global_step": 278, "epoch": 6} {"train_loss": -0.860520601272583, "global_step": 279, "epoch": 6} {"train_loss": -0.8879280090332031, "global_step": 280, "epoch": 6} {"train_loss": -0.8928805589675903, "global_step": 281, "epoch": 6} {"train_loss": -0.9103612899780273, "global_step": 282, "epoch": 6} {"train_loss": -0.9876779913902283, "global_step": 283, "epoch": 6} {"train_loss": -0.8378302454948425, "global_step": 284, "epoch": 6} {"train_loss": -0.8698583841323853, "global_step": 285, "epoch": 6} {"train_loss": -0.9333783388137817, "global_step": 286, "epoch": 6} {"train_loss": -0.9192638397216797, "global_step": 287, "epoch": 6} {"train_loss": -0.9667123556137085, "global_step": 288, "epoch": 6} {"train_loss": -0.9392381310462952, "global_step": 289, "epoch": 6} {"train_loss": -1.0201717615127563, "global_step": 290, "epoch": 6} {"train_loss": -1.1119673252105713, "global_step": 291, "epoch": 6} {"train_loss": -0.9624872803688049, "global_step": 292, "epoch": 6} {"train_loss": -0.9058477651505243, "global_step": 293, "epoch": 6, "val_loss": 2610753.25} {"train_loss": -1.0681235790252686, "global_step": 294, "epoch": 7} {"train_loss": -0.9070056676864624, "global_step": 295, "epoch": 7} {"train_loss": -0.9035718441009521, "global_step": 296, "epoch": 7} {"train_loss": -0.9630419611930847, "global_step": 297, "epoch": 7} {"train_loss": -1.0848912000656128, "global_step": 298, "epoch": 7} {"train_loss": -0.8790398836135864, "global_step": 299, "epoch": 7} {"train_loss": -1.1043205261230469, "global_step": 300, "epoch": 7} {"train_loss": -1.0273535251617432, "global_step": 301, "epoch": 7} {"train_loss": -0.96843421459198, "global_step": 302, "epoch": 7} {"train_loss": -1.0300846099853516, "global_step": 303, "epoch": 7} {"train_loss": -0.9826042652130127, "global_step": 304, "epoch": 7} {"train_loss": -1.0682003498077393, "global_step": 305, "epoch": 7} {"train_loss": -1.0763468742370605, "global_step": 306, "epoch": 7} {"train_loss": -0.9600091576576233, "global_step": 307, "epoch": 7} {"train_loss": -1.011047124862671, "global_step": 308, "epoch": 7} {"train_loss": -0.9943722486495972, "global_step": 309, "epoch": 7} {"train_loss": -1.0284861326217651, "global_step": 310, "epoch": 7} {"train_loss": -1.1991462707519531, "global_step": 311, "epoch": 7} {"train_loss": -1.0355498790740967, "global_step": 312, "epoch": 7} {"train_loss": -0.9969649314880371, "global_step": 313, "epoch": 7} {"train_loss": -0.938249409198761, "global_step": 314, "epoch": 7} {"train_loss": -0.996869683265686, "global_step": 315, "epoch": 7} {"train_loss": -1.1410462856292725, "global_step": 316, "epoch": 7} {"train_loss": -0.9995198249816895, "global_step": 317, "epoch": 7} {"train_loss": -0.961237907409668, "global_step": 318, "epoch": 7} {"train_loss": -1.058931827545166, "global_step": 319, "epoch": 7} {"train_loss": -0.9899581074714661, "global_step": 320, "epoch": 7} {"train_loss": -1.0167008638381958, "global_step": 321, "epoch": 7} {"train_loss": -0.9625723958015442, "global_step": 322, "epoch": 7} {"train_loss": -1.008886694908142, "global_step": 323, "epoch": 7} {"train_loss": -1.0854196548461914, "global_step": 324, "epoch": 7} {"train_loss": -1.0835262537002563, "global_step": 325, "epoch": 7} {"train_loss": -1.1271519660949707, "global_step": 326, "epoch": 7} {"train_loss": -0.9641644954681396, "global_step": 327, "epoch": 7} {"train_loss": -1.1958526372909546, "global_step": 328, "epoch": 7} {"train_loss": -1.0713754892349243, "global_step": 329, "epoch": 7} {"train_loss": -1.0820577144622803, "global_step": 330, "epoch": 7} {"train_loss": -1.0169970989227295, "global_step": 331, "epoch": 7} {"train_loss": -1.0258194208145142, "global_step": 332, "epoch": 7} {"train_loss": -1.1290063858032227, "global_step": 333, "epoch": 7} {"train_loss": -1.1182942390441895, "global_step": 334, "epoch": 7} {"train_loss": -1.0264089646793546, "global_step": 335, "epoch": 7, "val_loss": 2366671.25} {"train_loss": -0.9925836324691772, "global_step": 336, "epoch": 8} {"train_loss": -1.0710923671722412, "global_step": 337, "epoch": 8} {"train_loss": -1.0250303745269775, "global_step": 338, "epoch": 8} {"train_loss": -1.032158613204956, "global_step": 339, "epoch": 8} {"train_loss": -1.1973841190338135, "global_step": 340, "epoch": 8} {"train_loss": -1.1458345651626587, "global_step": 341, "epoch": 8} {"train_loss": -1.068821907043457, "global_step": 342, "epoch": 8} {"train_loss": -1.0537687540054321, "global_step": 343, "epoch": 8} {"train_loss": -1.076400876045227, "global_step": 344, "epoch": 8} {"train_loss": -1.124106764793396, "global_step": 345, "epoch": 8} {"train_loss": -0.9815613031387329, "global_step": 346, "epoch": 8} {"train_loss": -1.1445629596710205, "global_step": 347, "epoch": 8} {"train_loss": -1.2030601501464844, "global_step": 348, "epoch": 8} {"train_loss": -1.1231989860534668, "global_step": 349, "epoch": 8} {"train_loss": -1.066112756729126, "global_step": 350, "epoch": 8} {"train_loss": -1.2070659399032593, "global_step": 351, "epoch": 8} {"train_loss": -1.158046007156372, "global_step": 352, "epoch": 8} {"train_loss": -1.1082749366760254, "global_step": 353, "epoch": 8} {"train_loss": -1.1724414825439453, "global_step": 354, "epoch": 8} {"train_loss": -1.1588571071624756, "global_step": 355, "epoch": 8} {"train_loss": -1.06636381149292, "global_step": 356, "epoch": 8} {"train_loss": -1.1098870038986206, "global_step": 357, "epoch": 8} {"train_loss": -1.1504242420196533, "global_step": 358, "epoch": 8} {"train_loss": -1.17108154296875, "global_step": 359, "epoch": 8} {"train_loss": -1.0463343858718872, "global_step": 360, "epoch": 8} {"train_loss": -1.050464153289795, "global_step": 361, "epoch": 8} {"train_loss": -1.173079252243042, "global_step": 362, "epoch": 8} {"train_loss": -1.306384801864624, "global_step": 363, "epoch": 8} {"train_loss": -1.196860909461975, "global_step": 364, "epoch": 8} {"train_loss": -1.2879102230072021, "global_step": 365, "epoch": 8} {"train_loss": -1.3539347648620605, "global_step": 366, "epoch": 8} {"train_loss": -1.228053331375122, "global_step": 367, "epoch": 8} {"train_loss": -1.1947898864746094, "global_step": 368, "epoch": 8} {"train_loss": -1.1022745370864868, "global_step": 369, "epoch": 8} {"train_loss": -1.1426029205322266, "global_step": 370, "epoch": 8} {"train_loss": -1.2771339416503906, "global_step": 371, "epoch": 8} {"train_loss": -1.378239631652832, "global_step": 372, "epoch": 8} {"train_loss": -1.2131999731063843, "global_step": 373, "epoch": 8} {"train_loss": -1.2024842500686646, "global_step": 374, "epoch": 8} {"train_loss": -1.3731250762939453, "global_step": 375, "epoch": 8} {"train_loss": -1.2089873552322388, "global_step": 376, "epoch": 8} {"train_loss": -1.1545578752245222, "global_step": 377, "epoch": 8, "val_loss": 2179189.75} {"train_loss": -1.0705561637878418, "global_step": 378, "epoch": 9} {"train_loss": -1.2320197820663452, "global_step": 379, "epoch": 9} {"train_loss": -1.2611980438232422, "global_step": 380, "epoch": 9} {"train_loss": -1.3038798570632935, "global_step": 381, "epoch": 9} {"train_loss": -1.2280348539352417, "global_step": 382, "epoch": 9} {"train_loss": -1.1682641506195068, "global_step": 383, "epoch": 9} {"train_loss": -1.4166680574417114, "global_step": 384, "epoch": 9} {"train_loss": -1.3126823902130127, "global_step": 385, "epoch": 9} {"train_loss": -1.322462797164917, "global_step": 386, "epoch": 9} {"train_loss": -1.2673370838165283, "global_step": 387, "epoch": 9} {"train_loss": -1.2119104862213135, "global_step": 388, "epoch": 9} {"train_loss": -1.2318840026855469, "global_step": 389, "epoch": 9} {"train_loss": -1.297996163368225, "global_step": 390, "epoch": 9} {"train_loss": -1.1737221479415894, "global_step": 391, "epoch": 9} {"train_loss": -1.2064300775527954, "global_step": 392, "epoch": 9} {"train_loss": -1.2870938777923584, "global_step": 393, "epoch": 9} {"train_loss": -1.2622560262680054, "global_step": 394, "epoch": 9} {"train_loss": -1.2044024467468262, "global_step": 395, "epoch": 9} {"train_loss": -1.2310144901275635, "global_step": 396, "epoch": 9} {"train_loss": -1.1428585052490234, "global_step": 397, "epoch": 9} {"train_loss": -1.3390827178955078, "global_step": 398, "epoch": 9} {"train_loss": -1.2633143663406372, "global_step": 399, "epoch": 9} {"train_loss": -1.2967708110809326, "global_step": 400, "epoch": 9} {"train_loss": -1.1254571676254272, "global_step": 401, "epoch": 9} {"train_loss": -1.2783732414245605, "global_step": 402, "epoch": 9} {"train_loss": -1.2161865234375, "global_step": 403, "epoch": 9} {"train_loss": -1.3139245510101318, "global_step": 404, "epoch": 9} {"train_loss": -1.3046616315841675, "global_step": 405, "epoch": 9} {"train_loss": -1.3196754455566406, "global_step": 406, "epoch": 9} {"train_loss": -1.2723554372787476, "global_step": 407, "epoch": 9} {"train_loss": -1.3453538417816162, "global_step": 408, "epoch": 9} {"train_loss": -1.2125494480133057, "global_step": 409, "epoch": 9} {"train_loss": -1.2747331857681274, "global_step": 410, "epoch": 9} {"train_loss": -1.3129620552062988, "global_step": 411, "epoch": 9} {"train_loss": -1.258942723274231, "global_step": 412, "epoch": 9} {"train_loss": -1.208476185798645, "global_step": 413, "epoch": 9} {"train_loss": -1.4754117727279663, "global_step": 414, "epoch": 9} {"train_loss": -1.1589123010635376, "global_step": 415, "epoch": 9} {"train_loss": -1.2803003787994385, "global_step": 416, "epoch": 9} {"train_loss": -1.1403826475143433, "global_step": 417, "epoch": 9} {"train_loss": -1.4098429679870605, "global_step": 418, "epoch": 9} {"train_loss": -1.2596579052153087, "global_step": 419, "epoch": 9, "val_loss": 1990184.75} {"train_loss": -1.3051643371582031, "global_step": 420, "epoch": 10} {"train_loss": -1.21370530128479, "global_step": 421, "epoch": 10} {"train_loss": -1.4113961458206177, "global_step": 422, "epoch": 10} {"train_loss": -1.381969690322876, "global_step": 423, "epoch": 10} {"train_loss": -1.4070217609405518, "global_step": 424, "epoch": 10} {"train_loss": -1.4346344470977783, "global_step": 425, "epoch": 10} {"train_loss": -1.2139086723327637, "global_step": 426, "epoch": 10} {"train_loss": -1.2513718605041504, "global_step": 427, "epoch": 10} {"train_loss": -1.2649130821228027, "global_step": 428, "epoch": 10} {"train_loss": -1.332465410232544, "global_step": 429, "epoch": 10} {"train_loss": -1.3139711618423462, "global_step": 430, "epoch": 10} {"train_loss": -1.4609161615371704, "global_step": 431, "epoch": 10} {"train_loss": -1.372430443763733, "global_step": 432, "epoch": 10} {"train_loss": -1.3405905961990356, "global_step": 433, "epoch": 10} {"train_loss": -1.477759599685669, "global_step": 434, "epoch": 10} {"train_loss": -1.387232780456543, "global_step": 435, "epoch": 10} {"train_loss": -1.352647304534912, "global_step": 436, "epoch": 10} {"train_loss": -1.3617935180664062, "global_step": 437, "epoch": 10} {"train_loss": -1.313601016998291, "global_step": 438, "epoch": 10} {"train_loss": -1.3144828081130981, "global_step": 439, "epoch": 10} {"train_loss": -1.3875685930252075, "global_step": 440, "epoch": 10} {"train_loss": -1.3264639377593994, "global_step": 441, "epoch": 10} {"train_loss": -1.3495972156524658, "global_step": 442, "epoch": 10} {"train_loss": -1.5013669729232788, "global_step": 443, "epoch": 10} {"train_loss": -1.3074041604995728, "global_step": 444, "epoch": 10} {"train_loss": -1.4313362836837769, "global_step": 445, "epoch": 10} {"train_loss": -1.4444940090179443, "global_step": 446, "epoch": 10} {"train_loss": -1.3576085567474365, "global_step": 447, "epoch": 10} {"train_loss": -1.3207645416259766, "global_step": 448, "epoch": 10} {"train_loss": -1.3326306343078613, "global_step": 449, "epoch": 10} {"train_loss": -1.459911584854126, "global_step": 450, "epoch": 10} {"train_loss": -1.3362787961959839, "global_step": 451, "epoch": 10} {"train_loss": -1.3802194595336914, "global_step": 452, "epoch": 10} {"train_loss": -1.3731943368911743, "global_step": 453, "epoch": 10} {"train_loss": -1.4423518180847168, "global_step": 454, "epoch": 10} {"train_loss": -1.3905572891235352, "global_step": 455, "epoch": 10} {"train_loss": -1.4583693742752075, "global_step": 456, "epoch": 10} {"train_loss": -1.5819900035858154, "global_step": 457, "epoch": 10} {"train_loss": -1.3591499328613281, "global_step": 458, "epoch": 10} {"train_loss": -1.4098117351531982, "global_step": 459, "epoch": 10} {"train_loss": -1.5014984607696533, "global_step": 460, "epoch": 10} {"train_loss": -1.3724500309853327, "global_step": 461, "epoch": 10, "val_loss": 1853122.125} {"train_loss": -1.4739997386932373, "global_step": 462, "epoch": 11} {"train_loss": -1.4418213367462158, "global_step": 463, "epoch": 11} {"train_loss": -1.3421063423156738, "global_step": 464, "epoch": 11} {"train_loss": -1.4967846870422363, "global_step": 465, "epoch": 11} {"train_loss": -1.4576356410980225, "global_step": 466, "epoch": 11} {"train_loss": -1.3974672555923462, "global_step": 467, "epoch": 11} {"train_loss": -1.4298994541168213, "global_step": 468, "epoch": 11} {"train_loss": -1.4227041006088257, "global_step": 469, "epoch": 11} {"train_loss": -1.3554188013076782, "global_step": 470, "epoch": 11} {"train_loss": -1.347485065460205, "global_step": 471, "epoch": 11} {"train_loss": -1.3884923458099365, "global_step": 472, "epoch": 11} {"train_loss": -1.4471186399459839, "global_step": 473, "epoch": 11} {"train_loss": -1.3852406740188599, "global_step": 474, "epoch": 11} {"train_loss": -1.5178022384643555, "global_step": 475, "epoch": 11} {"train_loss": -1.3831449747085571, "global_step": 476, "epoch": 11} {"train_loss": -1.5205299854278564, "global_step": 477, "epoch": 11} {"train_loss": -1.3362922668457031, "global_step": 478, "epoch": 11} {"train_loss": -1.4745274782180786, "global_step": 479, "epoch": 11} {"train_loss": -1.5571529865264893, "global_step": 480, "epoch": 11} {"train_loss": -1.4094126224517822, "global_step": 481, "epoch": 11} {"train_loss": -1.4696135520935059, "global_step": 482, "epoch": 11} {"train_loss": -1.4960732460021973, "global_step": 483, "epoch": 11} {"train_loss": -1.5177745819091797, "global_step": 484, "epoch": 11} {"train_loss": -1.576391339302063, "global_step": 485, "epoch": 11} {"train_loss": -1.4765312671661377, "global_step": 486, "epoch": 11} {"train_loss": -1.5370246171951294, "global_step": 487, "epoch": 11} {"train_loss": -1.5814836025238037, "global_step": 488, "epoch": 11} {"train_loss": -1.562819004058838, "global_step": 489, "epoch": 11} {"train_loss": -1.4841864109039307, "global_step": 490, "epoch": 11} {"train_loss": -1.4123942852020264, "global_step": 491, "epoch": 11} {"train_loss": -1.5483721494674683, "global_step": 492, "epoch": 11} {"train_loss": -1.5655810832977295, "global_step": 493, "epoch": 11} {"train_loss": -1.5702763795852661, "global_step": 494, "epoch": 11} {"train_loss": -1.4619444608688354, "global_step": 495, "epoch": 11} {"train_loss": -1.5053043365478516, "global_step": 496, "epoch": 11} {"train_loss": -1.3099644184112549, "global_step": 497, "epoch": 11} {"train_loss": -1.4178991317749023, "global_step": 498, "epoch": 11} {"train_loss": -1.4942646026611328, "global_step": 499, "epoch": 11} {"train_loss": -1.588794231414795, "global_step": 500, "epoch": 11} {"train_loss": -1.520461082458496, "global_step": 501, "epoch": 11} {"train_loss": -1.4300651550292969, "global_step": 502, "epoch": 11} {"train_loss": -1.4699548255829584, "global_step": 503, "epoch": 11, "val_loss": 1724765.75} {"train_loss": -1.4838064908981323, "global_step": 504, "epoch": 12} {"train_loss": -1.5761690139770508, "global_step": 505, "epoch": 12} {"train_loss": -1.60178804397583, "global_step": 506, "epoch": 12} {"train_loss": -1.508998155593872, "global_step": 507, "epoch": 12} {"train_loss": -1.5491385459899902, "global_step": 508, "epoch": 12} {"train_loss": -1.475031852722168, "global_step": 509, "epoch": 12} {"train_loss": -1.6695691347122192, "global_step": 510, "epoch": 12} {"train_loss": -1.582472562789917, "global_step": 511, "epoch": 12} {"train_loss": -1.5479868650436401, "global_step": 512, "epoch": 12} {"train_loss": -1.5066263675689697, "global_step": 513, "epoch": 12} {"train_loss": -1.525808334350586, "global_step": 514, "epoch": 12} {"train_loss": -1.5294687747955322, "global_step": 515, "epoch": 12} {"train_loss": -1.5908219814300537, "global_step": 516, "epoch": 12} {"train_loss": -1.559167504310608, "global_step": 517, "epoch": 12} {"train_loss": -1.4305965900421143, "global_step": 518, "epoch": 12} {"train_loss": -1.693107008934021, "global_step": 519, "epoch": 12} {"train_loss": -1.5495431423187256, "global_step": 520, "epoch": 12} {"train_loss": -1.6581398248672485, "global_step": 521, "epoch": 12} {"train_loss": -1.4452321529388428, "global_step": 522, "epoch": 12} {"train_loss": -1.4567331075668335, "global_step": 523, "epoch": 12} {"train_loss": -1.6152522563934326, "global_step": 524, "epoch": 12} {"train_loss": -1.4762977361679077, "global_step": 525, "epoch": 12} {"train_loss": -1.589228868484497, "global_step": 526, "epoch": 12} {"train_loss": -1.4884014129638672, "global_step": 527, "epoch": 12} {"train_loss": -1.6079943180084229, "global_step": 528, "epoch": 12} {"train_loss": -1.5950772762298584, "global_step": 529, "epoch": 12} {"train_loss": -1.4288907051086426, "global_step": 530, "epoch": 12} {"train_loss": -1.5969294309616089, "global_step": 531, "epoch": 12} {"train_loss": -1.5852819681167603, "global_step": 532, "epoch": 12} {"train_loss": -1.5744572877883911, "global_step": 533, "epoch": 12} {"train_loss": -1.6149553060531616, "global_step": 534, "epoch": 12} {"train_loss": -1.649193525314331, "global_step": 535, "epoch": 12} {"train_loss": -1.5697489976882935, "global_step": 536, "epoch": 12} {"train_loss": -1.5199910402297974, "global_step": 537, "epoch": 12} {"train_loss": -1.6575469970703125, "global_step": 538, "epoch": 12} {"train_loss": -1.3711668252944946, "global_step": 539, "epoch": 12} {"train_loss": -1.5355427265167236, "global_step": 540, "epoch": 12} {"train_loss": -1.5756137371063232, "global_step": 541, "epoch": 12} {"train_loss": -1.6449251174926758, "global_step": 542, "epoch": 12} {"train_loss": -1.5321691036224365, "global_step": 543, "epoch": 12} {"train_loss": -1.6105233430862427, "global_step": 544, "epoch": 12} {"train_loss": -1.5555212157113212, "global_step": 545, "epoch": 12, "val_loss": 1599088.625} {"train_loss": -1.6619682312011719, "global_step": 546, "epoch": 13} {"train_loss": -1.6694247722625732, "global_step": 547, "epoch": 13} {"train_loss": -1.6392004489898682, "global_step": 548, "epoch": 13} {"train_loss": -1.6934516429901123, "global_step": 549, "epoch": 13} {"train_loss": -1.529876708984375, "global_step": 550, "epoch": 13} {"train_loss": -1.627023696899414, "global_step": 551, "epoch": 13} {"train_loss": -1.5711965560913086, "global_step": 552, "epoch": 13} {"train_loss": -1.779996395111084, "global_step": 553, "epoch": 13} {"train_loss": -1.4839509725570679, "global_step": 554, "epoch": 13} {"train_loss": -1.7487506866455078, "global_step": 555, "epoch": 13} {"train_loss": -1.7104451656341553, "global_step": 556, "epoch": 13} {"train_loss": -1.7035367488861084, "global_step": 557, "epoch": 13} {"train_loss": -1.5989580154418945, "global_step": 558, "epoch": 13} {"train_loss": -1.623702049255371, "global_step": 559, "epoch": 13} {"train_loss": -1.4296270608901978, "global_step": 560, "epoch": 13} {"train_loss": -1.7396597862243652, "global_step": 561, "epoch": 13} {"train_loss": -1.5696942806243896, "global_step": 562, "epoch": 13} {"train_loss": -1.5709532499313354, "global_step": 563, "epoch": 13} {"train_loss": -1.6869759559631348, "global_step": 564, "epoch": 13} {"train_loss": -1.8204396963119507, "global_step": 565, "epoch": 13} {"train_loss": -1.6468791961669922, "global_step": 566, "epoch": 13} {"train_loss": -1.6941334009170532, "global_step": 567, "epoch": 13} {"train_loss": -1.7840840816497803, "global_step": 568, "epoch": 13} {"train_loss": -1.6145899295806885, "global_step": 569, "epoch": 13} {"train_loss": -1.653458595275879, "global_step": 570, "epoch": 13} {"train_loss": -1.7088122367858887, "global_step": 571, "epoch": 13} {"train_loss": -1.5952085256576538, "global_step": 572, "epoch": 13} {"train_loss": -1.5411171913146973, "global_step": 573, "epoch": 13} {"train_loss": -1.7124030590057373, "global_step": 574, "epoch": 13} {"train_loss": -1.6686975955963135, "global_step": 575, "epoch": 13} {"train_loss": -1.6546859741210938, "global_step": 576, "epoch": 13} {"train_loss": -1.7517188787460327, "global_step": 577, "epoch": 13} {"train_loss": -1.6570384502410889, "global_step": 578, "epoch": 13} {"train_loss": -1.598872184753418, "global_step": 579, "epoch": 13} {"train_loss": -1.5965442657470703, "global_step": 580, "epoch": 13} {"train_loss": -1.5528604984283447, "global_step": 581, "epoch": 13} {"train_loss": -1.5872550010681152, "global_step": 582, "epoch": 13} {"train_loss": -1.6444733142852783, "global_step": 583, "epoch": 13} {"train_loss": -1.6167361736297607, "global_step": 584, "epoch": 13} {"train_loss": -1.5186115503311157, "global_step": 585, "epoch": 13} {"train_loss": -1.6148087978363037, "global_step": 586, "epoch": 13} {"train_loss": -1.641808813526517, "global_step": 587, "epoch": 13, "val_loss": 1501454.75} {"train_loss": -1.734889268875122, "global_step": 588, "epoch": 14} {"train_loss": -1.7024143934249878, "global_step": 589, "epoch": 14} {"train_loss": -1.6773978471755981, "global_step": 590, "epoch": 14} {"train_loss": -1.7304826974868774, "global_step": 591, "epoch": 14} {"train_loss": -1.6240243911743164, "global_step": 592, "epoch": 14} {"train_loss": -1.688915729522705, "global_step": 593, "epoch": 14} {"train_loss": -1.5509425401687622, "global_step": 594, "epoch": 14} {"train_loss": -1.670548439025879, "global_step": 595, "epoch": 14} {"train_loss": -1.6584298610687256, "global_step": 596, "epoch": 14} {"train_loss": -1.7112252712249756, "global_step": 597, "epoch": 14} {"train_loss": -1.7108911275863647, "global_step": 598, "epoch": 14} {"train_loss": -1.803239345550537, "global_step": 599, "epoch": 14} {"train_loss": -1.7471144199371338, "global_step": 600, "epoch": 14} {"train_loss": -1.8138246536254883, "global_step": 601, "epoch": 14} {"train_loss": -1.5694639682769775, "global_step": 602, "epoch": 14} {"train_loss": -1.7850265502929688, "global_step": 603, "epoch": 14} {"train_loss": -1.7085673809051514, "global_step": 604, "epoch": 14} {"train_loss": -1.7104966640472412, "global_step": 605, "epoch": 14} {"train_loss": -1.6849801540374756, "global_step": 606, "epoch": 14} {"train_loss": -1.7434108257293701, "global_step": 607, "epoch": 14} {"train_loss": -1.7137153148651123, "global_step": 608, "epoch": 14} {"train_loss": -1.7369383573532104, "global_step": 609, "epoch": 14} {"train_loss": -1.725365400314331, "global_step": 610, "epoch": 14} {"train_loss": -1.8863046169281006, "global_step": 611, "epoch": 14} {"train_loss": -1.6899197101593018, "global_step": 612, "epoch": 14} {"train_loss": -1.5908676385879517, "global_step": 613, "epoch": 14} {"train_loss": -1.5896928310394287, "global_step": 614, "epoch": 14} {"train_loss": -1.6924126148223877, "global_step": 615, "epoch": 14} {"train_loss": -1.7295169830322266, "global_step": 616, "epoch": 14} {"train_loss": -1.6581041812896729, "global_step": 617, "epoch": 14} {"train_loss": -1.5973283052444458, "global_step": 618, "epoch": 14} {"train_loss": -1.9645516872406006, "global_step": 619, "epoch": 14} {"train_loss": -1.721176266670227, "global_step": 620, "epoch": 14} {"train_loss": -1.7338738441467285, "global_step": 621, "epoch": 14} {"train_loss": -1.936579942703247, "global_step": 622, "epoch": 14} {"train_loss": -1.7109606266021729, "global_step": 623, "epoch": 14} {"train_loss": -1.7009540796279907, "global_step": 624, "epoch": 14} {"train_loss": -1.6119805574417114, "global_step": 625, "epoch": 14} {"train_loss": -1.7319210767745972, "global_step": 626, "epoch": 14} {"train_loss": -1.6687361001968384, "global_step": 627, "epoch": 14} {"train_loss": -1.7695670127868652, "global_step": 628, "epoch": 14} {"train_loss": -1.7138088799658275, "global_step": 629, "epoch": 14, "val_loss": 1421714.375} {"train_loss": -1.7829382419586182, "global_step": 630, "epoch": 15} {"train_loss": -1.763852834701538, "global_step": 631, "epoch": 15} {"train_loss": -1.667877435684204, "global_step": 632, "epoch": 15} {"train_loss": -1.931139588356018, "global_step": 633, "epoch": 15} {"train_loss": -1.990209937095642, "global_step": 634, "epoch": 15} {"train_loss": -1.8464287519454956, "global_step": 635, "epoch": 15} {"train_loss": -1.8388502597808838, "global_step": 636, "epoch": 15} {"train_loss": -1.7182962894439697, "global_step": 637, "epoch": 15} {"train_loss": -1.7715749740600586, "global_step": 638, "epoch": 15} {"train_loss": -1.8246088027954102, "global_step": 639, "epoch": 15} {"train_loss": -1.662508487701416, "global_step": 640, "epoch": 15} {"train_loss": -1.837032437324524, "global_step": 641, "epoch": 15} {"train_loss": -1.8893048763275146, "global_step": 642, "epoch": 15} {"train_loss": -1.9266252517700195, "global_step": 643, "epoch": 15} {"train_loss": -1.8196245431900024, "global_step": 644, "epoch": 15} {"train_loss": -1.822205901145935, "global_step": 645, "epoch": 15} {"train_loss": -1.744624376296997, "global_step": 646, "epoch": 15} {"train_loss": -1.7209402322769165, "global_step": 647, "epoch": 15} {"train_loss": -1.8017849922180176, "global_step": 648, "epoch": 15} {"train_loss": -1.681922435760498, "global_step": 649, "epoch": 15} {"train_loss": -1.7941644191741943, "global_step": 650, "epoch": 15} {"train_loss": -1.7453868389129639, "global_step": 651, "epoch": 15} {"train_loss": -1.6885240077972412, "global_step": 652, "epoch": 15} {"train_loss": -1.8887405395507812, "global_step": 653, "epoch": 15} {"train_loss": -1.6623903512954712, "global_step": 654, "epoch": 15} {"train_loss": -1.982704520225525, "global_step": 655, "epoch": 15} {"train_loss": -1.5221325159072876, "global_step": 656, "epoch": 15} {"train_loss": -1.8143666982650757, "global_step": 657, "epoch": 15} {"train_loss": -1.6474859714508057, "global_step": 658, "epoch": 15} {"train_loss": -1.8010997772216797, "global_step": 659, "epoch": 15} {"train_loss": -1.8387818336486816, "global_step": 660, "epoch": 15} {"train_loss": -1.833807349205017, "global_step": 661, "epoch": 15} {"train_loss": -1.879155158996582, "global_step": 662, "epoch": 15} {"train_loss": -1.792240858078003, "global_step": 663, "epoch": 15} {"train_loss": -1.9247404336929321, "global_step": 664, "epoch": 15} {"train_loss": -1.9640223979949951, "global_step": 665, "epoch": 15} {"train_loss": -1.9904974699020386, "global_step": 666, "epoch": 15} {"train_loss": -1.9589498043060303, "global_step": 667, "epoch": 15} {"train_loss": -1.760956883430481, "global_step": 668, "epoch": 15} {"train_loss": -1.7451956272125244, "global_step": 669, "epoch": 15} {"train_loss": -1.718652606010437, "global_step": 670, "epoch": 15} {"train_loss": -1.8062004503749667, "global_step": 671, "epoch": 15, "val_loss": 1310871.0} {"train_loss": -1.8526146411895752, "global_step": 672, "epoch": 16} {"train_loss": -1.7573400735855103, "global_step": 673, "epoch": 16} {"train_loss": -1.9407203197479248, "global_step": 674, "epoch": 16} {"train_loss": -1.894371509552002, "global_step": 675, "epoch": 16} {"train_loss": -1.8178486824035645, "global_step": 676, "epoch": 16} {"train_loss": -1.7002522945404053, "global_step": 677, "epoch": 16} {"train_loss": -1.8760735988616943, "global_step": 678, "epoch": 16} {"train_loss": -1.9433879852294922, "global_step": 679, "epoch": 16} {"train_loss": -1.8955986499786377, "global_step": 680, "epoch": 16} {"train_loss": -1.8040378093719482, "global_step": 681, "epoch": 16} {"train_loss": -1.9468799829483032, "global_step": 682, "epoch": 16} {"train_loss": -1.8377751111984253, "global_step": 683, "epoch": 16} {"train_loss": -1.8644100427627563, "global_step": 684, "epoch": 16} {"train_loss": -1.86941397190094, "global_step": 685, "epoch": 16} {"train_loss": -1.9476583003997803, "global_step": 686, "epoch": 16} {"train_loss": -1.8671563863754272, "global_step": 687, "epoch": 16} {"train_loss": -1.9089306592941284, "global_step": 688, "epoch": 16} {"train_loss": -2.0693817138671875, "global_step": 689, "epoch": 16} {"train_loss": -1.8082574605941772, "global_step": 690, "epoch": 16} {"train_loss": -1.9241946935653687, "global_step": 691, "epoch": 16} {"train_loss": -1.9478297233581543, "global_step": 692, "epoch": 16} {"train_loss": -1.8778666257858276, "global_step": 693, "epoch": 16} {"train_loss": -1.8833682537078857, "global_step": 694, "epoch": 16} {"train_loss": -1.9186038970947266, "global_step": 695, "epoch": 16} {"train_loss": -1.9296990633010864, "global_step": 696, "epoch": 16} {"train_loss": -2.083757162094116, "global_step": 697, "epoch": 16} {"train_loss": -1.7408089637756348, "global_step": 698, "epoch": 16} {"train_loss": -1.950425148010254, "global_step": 699, "epoch": 16} {"train_loss": -1.9067186117172241, "global_step": 700, "epoch": 16} {"train_loss": -1.9271669387817383, "global_step": 701, "epoch": 16} {"train_loss": -1.8619306087493896, "global_step": 702, "epoch": 16} {"train_loss": -1.8382046222686768, "global_step": 703, "epoch": 16} {"train_loss": -2.0098445415496826, "global_step": 704, "epoch": 16} {"train_loss": -1.8721027374267578, "global_step": 705, "epoch": 16} {"train_loss": -1.9098095893859863, "global_step": 706, "epoch": 16} {"train_loss": -1.882932424545288, "global_step": 707, "epoch": 16} {"train_loss": -1.8552590608596802, "global_step": 708, "epoch": 16} {"train_loss": -1.842915415763855, "global_step": 709, "epoch": 16} {"train_loss": -1.9215008020401, "global_step": 710, "epoch": 16} {"train_loss": -1.7982356548309326, "global_step": 711, "epoch": 16} {"train_loss": -1.8531540632247925, "global_step": 712, "epoch": 16} {"train_loss": -1.8895806244441442, "global_step": 713, "epoch": 16, "val_loss": 1261776.25} {"train_loss": -1.9008110761642456, "global_step": 714, "epoch": 17} {"train_loss": -1.9999150037765503, "global_step": 715, "epoch": 17} {"train_loss": -1.8631720542907715, "global_step": 716, "epoch": 17} {"train_loss": -1.9406119585037231, "global_step": 717, "epoch": 17} {"train_loss": -1.9971213340759277, "global_step": 718, "epoch": 17} {"train_loss": -2.092515468597412, "global_step": 719, "epoch": 17} {"train_loss": -2.043389320373535, "global_step": 720, "epoch": 17} {"train_loss": -2.1280035972595215, "global_step": 721, "epoch": 17} {"train_loss": -1.9358484745025635, "global_step": 722, "epoch": 17} {"train_loss": -1.9946657419204712, "global_step": 723, "epoch": 17} {"train_loss": -2.034946918487549, "global_step": 724, "epoch": 17} {"train_loss": -1.8875935077667236, "global_step": 725, "epoch": 17} {"train_loss": -2.057898759841919, "global_step": 726, "epoch": 17} {"train_loss": -1.9426615238189697, "global_step": 727, "epoch": 17} {"train_loss": -1.9216032028198242, "global_step": 728, "epoch": 17} {"train_loss": -2.063718557357788, "global_step": 729, "epoch": 17} {"train_loss": -2.0148401260375977, "global_step": 730, "epoch": 17} {"train_loss": -1.9404053688049316, "global_step": 731, "epoch": 17} {"train_loss": -1.8830809593200684, "global_step": 732, "epoch": 17} {"train_loss": -2.020738124847412, "global_step": 733, "epoch": 17} {"train_loss": -2.0419821739196777, "global_step": 734, "epoch": 17} {"train_loss": -1.9559104442596436, "global_step": 735, "epoch": 17} {"train_loss": -1.906834363937378, "global_step": 736, "epoch": 17} {"train_loss": -1.9188814163208008, "global_step": 737, "epoch": 17} {"train_loss": -2.0523953437805176, "global_step": 738, "epoch": 17} {"train_loss": -1.8477330207824707, "global_step": 739, "epoch": 17} {"train_loss": -1.9967446327209473, "global_step": 740, "epoch": 17} {"train_loss": -1.8618812561035156, "global_step": 741, "epoch": 17} {"train_loss": -1.934336543083191, "global_step": 742, "epoch": 17} {"train_loss": -1.907344937324524, "global_step": 743, "epoch": 17} {"train_loss": -2.0128378868103027, "global_step": 744, "epoch": 17} {"train_loss": -1.838850975036621, "global_step": 745, "epoch": 17} {"train_loss": -2.003624439239502, "global_step": 746, "epoch": 17} {"train_loss": -2.1754016876220703, "global_step": 747, "epoch": 17} {"train_loss": -1.9464391469955444, "global_step": 748, "epoch": 17} {"train_loss": -1.941394329071045, "global_step": 749, "epoch": 17} {"train_loss": -2.06465482711792, "global_step": 750, "epoch": 17} {"train_loss": -1.9872201681137085, "global_step": 751, "epoch": 17} {"train_loss": -1.833808183670044, "global_step": 752, "epoch": 17} {"train_loss": -1.9360240697860718, "global_step": 753, "epoch": 17} {"train_loss": -1.7972301244735718, "global_step": 754, "epoch": 17} {"train_loss": -1.966151964096796, "global_step": 755, "epoch": 17, "val_loss": 1186264.375} {"train_loss": -1.904386043548584, "global_step": 756, "epoch": 18} {"train_loss": -1.8554408550262451, "global_step": 757, "epoch": 18} {"train_loss": -2.085163116455078, "global_step": 758, "epoch": 18} {"train_loss": -1.7894288301467896, "global_step": 759, "epoch": 18} {"train_loss": -1.8799080848693848, "global_step": 760, "epoch": 18} {"train_loss": -1.8682498931884766, "global_step": 761, "epoch": 18} {"train_loss": -1.9304311275482178, "global_step": 762, "epoch": 18} {"train_loss": -1.8935422897338867, "global_step": 763, "epoch": 18} {"train_loss": -1.9968373775482178, "global_step": 764, "epoch": 18} {"train_loss": -1.7512516975402832, "global_step": 765, "epoch": 18} {"train_loss": -1.8097953796386719, "global_step": 766, "epoch": 18} {"train_loss": -1.7610208988189697, "global_step": 767, "epoch": 18} {"train_loss": -1.9226164817810059, "global_step": 768, "epoch": 18} {"train_loss": -2.0057475566864014, "global_step": 769, "epoch": 18} {"train_loss": -1.9322545528411865, "global_step": 770, "epoch": 18} {"train_loss": -2.040550708770752, "global_step": 771, "epoch": 18} {"train_loss": -2.1061129570007324, "global_step": 772, "epoch": 18} {"train_loss": -1.9693613052368164, "global_step": 773, "epoch": 18} {"train_loss": -1.8946173191070557, "global_step": 774, "epoch": 18} {"train_loss": -1.9503916501998901, "global_step": 775, "epoch": 18} {"train_loss": -1.9375102519989014, "global_step": 776, "epoch": 18} {"train_loss": -1.9825987815856934, "global_step": 777, "epoch": 18} {"train_loss": -2.019195079803467, "global_step": 778, "epoch": 18} {"train_loss": -1.9184238910675049, "global_step": 779, "epoch": 18} {"train_loss": -2.0617775917053223, "global_step": 780, "epoch": 18} {"train_loss": -2.0373728275299072, "global_step": 781, "epoch": 18} {"train_loss": -2.0604701042175293, "global_step": 782, "epoch": 18} {"train_loss": -2.0591492652893066, "global_step": 783, "epoch": 18} {"train_loss": -1.9559311866760254, "global_step": 784, "epoch": 18} {"train_loss": -1.9404804706573486, "global_step": 785, "epoch": 18} {"train_loss": -2.006718158721924, "global_step": 786, "epoch": 18} {"train_loss": -2.1156914234161377, "global_step": 787, "epoch": 18} {"train_loss": -2.096492052078247, "global_step": 788, "epoch": 18} {"train_loss": -1.980408787727356, "global_step": 789, "epoch": 18} {"train_loss": -2.0630321502685547, "global_step": 790, "epoch": 18} {"train_loss": -2.0754542350769043, "global_step": 791, "epoch": 18} {"train_loss": -1.8810126781463623, "global_step": 792, "epoch": 18} {"train_loss": -2.1518006324768066, "global_step": 793, "epoch": 18} {"train_loss": -2.0951478481292725, "global_step": 794, "epoch": 18} {"train_loss": -1.8747565746307373, "global_step": 795, "epoch": 18} {"train_loss": -2.07401704788208, "global_step": 796, "epoch": 18} {"train_loss": -1.9708074700264704, "global_step": 797, "epoch": 18, "val_loss": 1112281.625} {"train_loss": -2.0321333408355713, "global_step": 798, "epoch": 19} {"train_loss": -1.8863165378570557, "global_step": 799, "epoch": 19} {"train_loss": -2.096971273422241, "global_step": 800, "epoch": 19} {"train_loss": -2.0673983097076416, "global_step": 801, "epoch": 19} {"train_loss": -2.1019272804260254, "global_step": 802, "epoch": 19} {"train_loss": -2.038322925567627, "global_step": 803, "epoch": 19} {"train_loss": -2.073436975479126, "global_step": 804, "epoch": 19} {"train_loss": -2.1527414321899414, "global_step": 805, "epoch": 19} {"train_loss": -2.124642848968506, "global_step": 806, "epoch": 19} {"train_loss": -2.103374481201172, "global_step": 807, "epoch": 19} {"train_loss": -1.982078194618225, "global_step": 808, "epoch": 19} {"train_loss": -2.060555934906006, "global_step": 809, "epoch": 19} {"train_loss": -1.8655357360839844, "global_step": 810, "epoch": 19} {"train_loss": -2.0598716735839844, "global_step": 811, "epoch": 19} {"train_loss": -2.0970160961151123, "global_step": 812, "epoch": 19} {"train_loss": -1.9072071313858032, "global_step": 813, "epoch": 19} {"train_loss": -2.1384437084198, "global_step": 814, "epoch": 19} {"train_loss": -2.025407314300537, "global_step": 815, "epoch": 19} {"train_loss": -2.1945924758911133, "global_step": 816, "epoch": 19} {"train_loss": -2.029451847076416, "global_step": 817, "epoch": 19} {"train_loss": -2.045041799545288, "global_step": 818, "epoch": 19} {"train_loss": -1.9578311443328857, "global_step": 819, "epoch": 19} {"train_loss": -2.091040849685669, "global_step": 820, "epoch": 19} {"train_loss": -2.258413314819336, "global_step": 821, "epoch": 19} {"train_loss": -2.0424907207489014, "global_step": 822, "epoch": 19} {"train_loss": -2.1369895935058594, "global_step": 823, "epoch": 19} {"train_loss": -2.0384035110473633, "global_step": 824, "epoch": 19} {"train_loss": -2.108586311340332, "global_step": 825, "epoch": 19} {"train_loss": -2.045525074005127, "global_step": 826, "epoch": 19} {"train_loss": -2.157154083251953, "global_step": 827, "epoch": 19} {"train_loss": -2.0368738174438477, "global_step": 828, "epoch": 19} {"train_loss": -2.1938259601593018, "global_step": 829, "epoch": 19} {"train_loss": -2.1731486320495605, "global_step": 830, "epoch": 19} {"train_loss": -2.1151394844055176, "global_step": 831, "epoch": 19} {"train_loss": -2.143554925918579, "global_step": 832, "epoch": 19} {"train_loss": -2.072518825531006, "global_step": 833, "epoch": 19} {"train_loss": -2.016897678375244, "global_step": 834, "epoch": 19} {"train_loss": -2.1169991493225098, "global_step": 835, "epoch": 19} {"train_loss": -2.185199022293091, "global_step": 836, "epoch": 19} {"train_loss": -2.123000144958496, "global_step": 837, "epoch": 19} {"train_loss": -2.058978319168091, "global_step": 838, "epoch": 19} {"train_loss": -2.0801703532536826, "global_step": 839, "epoch": 19, "val_loss": 1060468.0} {"train_loss": -2.1770360469818115, "global_step": 840, "epoch": 20} {"train_loss": -2.190251350402832, "global_step": 841, "epoch": 20} {"train_loss": -2.1439781188964844, "global_step": 842, "epoch": 20} {"train_loss": -2.171724796295166, "global_step": 843, "epoch": 20} {"train_loss": -2.116283655166626, "global_step": 844, "epoch": 20} {"train_loss": -2.17274808883667, "global_step": 845, "epoch": 20} {"train_loss": -2.0813820362091064, "global_step": 846, "epoch": 20} {"train_loss": -2.209580421447754, "global_step": 847, "epoch": 20} {"train_loss": -2.082855224609375, "global_step": 848, "epoch": 20} {"train_loss": -2.19700288772583, "global_step": 849, "epoch": 20} {"train_loss": -2.205904960632324, "global_step": 850, "epoch": 20} {"train_loss": -2.0469837188720703, "global_step": 851, "epoch": 20} {"train_loss": -2.160947799682617, "global_step": 852, "epoch": 20} {"train_loss": -2.138988494873047, "global_step": 853, "epoch": 20} {"train_loss": -2.1603217124938965, "global_step": 854, "epoch": 20} {"train_loss": -2.043118953704834, "global_step": 855, "epoch": 20} {"train_loss": -2.054535388946533, "global_step": 856, "epoch": 20} {"train_loss": -2.210606098175049, "global_step": 857, "epoch": 20} {"train_loss": -2.066929817199707, "global_step": 858, "epoch": 20} {"train_loss": -2.20046067237854, "global_step": 859, "epoch": 20} {"train_loss": -1.910071849822998, "global_step": 860, "epoch": 20} {"train_loss": -2.1757256984710693, "global_step": 861, "epoch": 20} {"train_loss": -2.040835380554199, "global_step": 862, "epoch": 20} {"train_loss": -2.2154204845428467, "global_step": 863, "epoch": 20} {"train_loss": -2.0484981536865234, "global_step": 864, "epoch": 20} {"train_loss": -2.251418352127075, "global_step": 865, "epoch": 20} {"train_loss": -2.142119884490967, "global_step": 866, "epoch": 20} {"train_loss": -2.031778573989868, "global_step": 867, "epoch": 20} {"train_loss": -2.244199752807617, "global_step": 868, "epoch": 20} {"train_loss": -2.0768566131591797, "global_step": 869, "epoch": 20} {"train_loss": -2.16848087310791, "global_step": 870, "epoch": 20} {"train_loss": -1.9623863697052002, "global_step": 871, "epoch": 20} {"train_loss": -2.314639091491699, "global_step": 872, "epoch": 20} {"train_loss": -1.947317361831665, "global_step": 873, "epoch": 20} {"train_loss": -1.9809843301773071, "global_step": 874, "epoch": 20} {"train_loss": -1.989180088043213, "global_step": 875, "epoch": 20} {"train_loss": -1.9363489151000977, "global_step": 876, "epoch": 20} {"train_loss": -2.0536766052246094, "global_step": 877, "epoch": 20} {"train_loss": -2.056755781173706, "global_step": 878, "epoch": 20} {"train_loss": -2.133925676345825, "global_step": 879, "epoch": 20} {"train_loss": -2.172936201095581, "global_step": 880, "epoch": 20} {"train_loss": -2.116935045946212, "global_step": 881, "epoch": 20, "val_loss": 1033933.4375} {"train_loss": -2.062434673309326, "global_step": 882, "epoch": 21} {"train_loss": -2.139338970184326, "global_step": 883, "epoch": 21} {"train_loss": -2.1221110820770264, "global_step": 884, "epoch": 21} {"train_loss": -2.1045494079589844, "global_step": 885, "epoch": 21} {"train_loss": -2.1516733169555664, "global_step": 886, "epoch": 21} {"train_loss": -2.2689807415008545, "global_step": 887, "epoch": 21} {"train_loss": -2.021331787109375, "global_step": 888, "epoch": 21} {"train_loss": -2.2865917682647705, "global_step": 889, "epoch": 21} {"train_loss": -2.0566189289093018, "global_step": 890, "epoch": 21} {"train_loss": -2.251486301422119, "global_step": 891, "epoch": 21} {"train_loss": -2.003563404083252, "global_step": 892, "epoch": 21} {"train_loss": -2.086181879043579, "global_step": 893, "epoch": 21} {"train_loss": -1.9472705125808716, "global_step": 894, "epoch": 21} {"train_loss": -1.99729585647583, "global_step": 895, "epoch": 21} {"train_loss": -2.1015212535858154, "global_step": 896, "epoch": 21} {"train_loss": -2.123091697692871, "global_step": 897, "epoch": 21} {"train_loss": -2.2197508811950684, "global_step": 898, "epoch": 21} {"train_loss": -2.0334818363189697, "global_step": 899, "epoch": 21} {"train_loss": -2.2811851501464844, "global_step": 900, "epoch": 21} {"train_loss": -1.9557254314422607, "global_step": 901, "epoch": 21} {"train_loss": -2.0247559547424316, "global_step": 902, "epoch": 21} {"train_loss": -2.0279159545898438, "global_step": 903, "epoch": 21} {"train_loss": -2.060438871383667, "global_step": 904, "epoch": 21} {"train_loss": -2.052676200866699, "global_step": 905, "epoch": 21} {"train_loss": -2.201730728149414, "global_step": 906, "epoch": 21} {"train_loss": -2.157034397125244, "global_step": 907, "epoch": 21} {"train_loss": -2.210308313369751, "global_step": 908, "epoch": 21} {"train_loss": -2.2689452171325684, "global_step": 909, "epoch": 21} {"train_loss": -2.189603805541992, "global_step": 910, "epoch": 21} {"train_loss": -2.2164998054504395, "global_step": 911, "epoch": 21} {"train_loss": -2.189964532852173, "global_step": 912, "epoch": 21} {"train_loss": -2.2163867950439453, "global_step": 913, "epoch": 21} {"train_loss": -2.2254276275634766, "global_step": 914, "epoch": 21} {"train_loss": -2.2520248889923096, "global_step": 915, "epoch": 21} {"train_loss": -2.1658058166503906, "global_step": 916, "epoch": 21} {"train_loss": -2.168884754180908, "global_step": 917, "epoch": 21} {"train_loss": -2.314915895462036, "global_step": 918, "epoch": 21} {"train_loss": -2.2661333084106445, "global_step": 919, "epoch": 21} {"train_loss": -2.2849655151367188, "global_step": 920, "epoch": 21} {"train_loss": -2.2171363830566406, "global_step": 921, "epoch": 21} {"train_loss": -2.1760566234588623, "global_step": 922, "epoch": 21} {"train_loss": -2.148452869483403, "global_step": 923, "epoch": 21, "val_loss": 963500.125} {"train_loss": -2.3100812435150146, "global_step": 924, "epoch": 22} {"train_loss": -2.184896469116211, "global_step": 925, "epoch": 22} {"train_loss": -2.3336055278778076, "global_step": 926, "epoch": 22} {"train_loss": -2.0375185012817383, "global_step": 927, "epoch": 22} {"train_loss": -2.240859031677246, "global_step": 928, "epoch": 22} {"train_loss": -2.1984641551971436, "global_step": 929, "epoch": 22} {"train_loss": -2.3304200172424316, "global_step": 930, "epoch": 22} {"train_loss": -2.365267038345337, "global_step": 931, "epoch": 22} {"train_loss": -2.379802703857422, "global_step": 932, "epoch": 22} {"train_loss": -2.3664627075195312, "global_step": 933, "epoch": 22} {"train_loss": -2.2181878089904785, "global_step": 934, "epoch": 22} {"train_loss": -2.2442026138305664, "global_step": 935, "epoch": 22} {"train_loss": -2.1281094551086426, "global_step": 936, "epoch": 22} {"train_loss": -2.1795217990875244, "global_step": 937, "epoch": 22} {"train_loss": -2.2791600227355957, "global_step": 938, "epoch": 22} {"train_loss": -2.1421525478363037, "global_step": 939, "epoch": 22} {"train_loss": -2.189662218093872, "global_step": 940, "epoch": 22} {"train_loss": -1.9114843606948853, "global_step": 941, "epoch": 22} {"train_loss": -2.140137195587158, "global_step": 942, "epoch": 22} {"train_loss": -2.1883304119110107, "global_step": 943, "epoch": 22} {"train_loss": -2.1203160285949707, "global_step": 944, "epoch": 22} {"train_loss": -2.199517250061035, "global_step": 945, "epoch": 22} {"train_loss": -2.2158946990966797, "global_step": 946, "epoch": 22} {"train_loss": -2.2766497135162354, "global_step": 947, "epoch": 22} {"train_loss": -2.2507805824279785, "global_step": 948, "epoch": 22} {"train_loss": -2.1759228706359863, "global_step": 949, "epoch": 22} {"train_loss": -2.207984447479248, "global_step": 950, "epoch": 22} {"train_loss": -2.2463788986206055, "global_step": 951, "epoch": 22} {"train_loss": -2.1867294311523438, "global_step": 952, "epoch": 22} {"train_loss": -2.4253101348876953, "global_step": 953, "epoch": 22} {"train_loss": -2.156601905822754, "global_step": 954, "epoch": 22} {"train_loss": -2.2902467250823975, "global_step": 955, "epoch": 22} {"train_loss": -2.2761316299438477, "global_step": 956, "epoch": 22} {"train_loss": -2.245882272720337, "global_step": 957, "epoch": 22} {"train_loss": -2.1605708599090576, "global_step": 958, "epoch": 22} {"train_loss": -2.289222478866577, "global_step": 959, "epoch": 22} {"train_loss": -2.190854787826538, "global_step": 960, "epoch": 22} {"train_loss": -2.1917848587036133, "global_step": 961, "epoch": 22} {"train_loss": -2.1334309577941895, "global_step": 962, "epoch": 22} {"train_loss": -2.195113182067871, "global_step": 963, "epoch": 22} {"train_loss": -2.3363020420074463, "global_step": 964, "epoch": 22} {"train_loss": -2.2203991327966963, "global_step": 965, "epoch": 22, "val_loss": 918389.4375} {"train_loss": -2.369340419769287, "global_step": 966, "epoch": 23} {"train_loss": -2.218306541442871, "global_step": 967, "epoch": 23} {"train_loss": -2.3720784187316895, "global_step": 968, "epoch": 23} {"train_loss": -2.319791555404663, "global_step": 969, "epoch": 23} {"train_loss": -2.2222089767456055, "global_step": 970, "epoch": 23} {"train_loss": -2.3358802795410156, "global_step": 971, "epoch": 23} {"train_loss": -2.355147361755371, "global_step": 972, "epoch": 23} {"train_loss": -2.384709358215332, "global_step": 973, "epoch": 23} {"train_loss": -2.3946828842163086, "global_step": 974, "epoch": 23} {"train_loss": -2.374612808227539, "global_step": 975, "epoch": 23} {"train_loss": -2.3686389923095703, "global_step": 976, "epoch": 23} {"train_loss": -2.2479910850524902, "global_step": 977, "epoch": 23} {"train_loss": -2.2212471961975098, "global_step": 978, "epoch": 23} {"train_loss": -2.2906382083892822, "global_step": 979, "epoch": 23} {"train_loss": -2.328099250793457, "global_step": 980, "epoch": 23} {"train_loss": -2.2351233959198, "global_step": 981, "epoch": 23} {"train_loss": -2.3332977294921875, "global_step": 982, "epoch": 23} {"train_loss": -2.257948875427246, "global_step": 983, "epoch": 23} {"train_loss": -2.3226585388183594, "global_step": 984, "epoch": 23} {"train_loss": -2.327296257019043, "global_step": 985, "epoch": 23} {"train_loss": -2.2668838500976562, "global_step": 986, "epoch": 23} {"train_loss": -2.4552035331726074, "global_step": 987, "epoch": 23} {"train_loss": -2.2397704124450684, "global_step": 988, "epoch": 23} {"train_loss": -2.2597968578338623, "global_step": 989, "epoch": 23} {"train_loss": -2.170473098754883, "global_step": 990, "epoch": 23} {"train_loss": -2.4634203910827637, "global_step": 991, "epoch": 23} {"train_loss": -2.1451663970947266, "global_step": 992, "epoch": 23} {"train_loss": -2.2542901039123535, "global_step": 993, "epoch": 23} {"train_loss": -2.353344678878784, "global_step": 994, "epoch": 23} {"train_loss": -2.312737464904785, "global_step": 995, "epoch": 23} {"train_loss": -2.2882978916168213, "global_step": 996, "epoch": 23} {"train_loss": -2.2488858699798584, "global_step": 997, "epoch": 23} {"train_loss": -2.279268264770508, "global_step": 998, "epoch": 23} {"train_loss": -2.252368927001953, "global_step": 999, "epoch": 23} {"train_loss": -2.338108539581299, "global_step": 1000, "epoch": 23} {"train_loss": -2.3935275077819824, "global_step": 1001, "epoch": 23} {"train_loss": -2.396358013153076, "global_step": 1002, "epoch": 23} {"train_loss": -2.291851758956909, "global_step": 1003, "epoch": 23} {"train_loss": -2.431415557861328, "global_step": 1004, "epoch": 23} {"train_loss": -2.4134435653686523, "global_step": 1005, "epoch": 23} {"train_loss": -2.2642593383789062, "global_step": 1006, "epoch": 23} {"train_loss": -2.3142535402661277, "global_step": 1007, "epoch": 23, "val_loss": 882852.875} {"train_loss": -2.436336040496826, "global_step": 1008, "epoch": 24} {"train_loss": -2.3128480911254883, "global_step": 1009, "epoch": 24} {"train_loss": -2.458526849746704, "global_step": 1010, "epoch": 24} {"train_loss": -2.355851888656616, "global_step": 1011, "epoch": 24} {"train_loss": -2.411884069442749, "global_step": 1012, "epoch": 24} {"train_loss": -2.1620287895202637, "global_step": 1013, "epoch": 24} {"train_loss": -2.5332441329956055, "global_step": 1014, "epoch": 24} {"train_loss": -2.3935863971710205, "global_step": 1015, "epoch": 24} {"train_loss": -2.3640379905700684, "global_step": 1016, "epoch": 24} {"train_loss": -2.258632183074951, "global_step": 1017, "epoch": 24} {"train_loss": -2.3965201377868652, "global_step": 1018, "epoch": 24} {"train_loss": -2.462709903717041, "global_step": 1019, "epoch": 24} {"train_loss": -2.406872272491455, "global_step": 1020, "epoch": 24} {"train_loss": -2.337249279022217, "global_step": 1021, "epoch": 24} {"train_loss": -2.3402936458587646, "global_step": 1022, "epoch": 24} {"train_loss": -2.282395601272583, "global_step": 1023, "epoch": 24} {"train_loss": -2.4037537574768066, "global_step": 1024, "epoch": 24} {"train_loss": -2.433952808380127, "global_step": 1025, "epoch": 24} {"train_loss": -2.384106159210205, "global_step": 1026, "epoch": 24} {"train_loss": -2.2992162704467773, "global_step": 1027, "epoch": 24} {"train_loss": -2.3151516914367676, "global_step": 1028, "epoch": 24} {"train_loss": -2.338005542755127, "global_step": 1029, "epoch": 24} {"train_loss": -2.177511215209961, "global_step": 1030, "epoch": 24} {"train_loss": -2.3473737239837646, "global_step": 1031, "epoch": 24} {"train_loss": -2.216890335083008, "global_step": 1032, "epoch": 24} {"train_loss": -2.4250926971435547, "global_step": 1033, "epoch": 24} {"train_loss": -2.3817858695983887, "global_step": 1034, "epoch": 24} {"train_loss": -2.245727062225342, "global_step": 1035, "epoch": 24} {"train_loss": -2.4390127658843994, "global_step": 1036, "epoch": 24} {"train_loss": -2.230865955352783, "global_step": 1037, "epoch": 24} {"train_loss": -2.4370522499084473, "global_step": 1038, "epoch": 24} {"train_loss": -2.2791643142700195, "global_step": 1039, "epoch": 24} {"train_loss": -2.444967746734619, "global_step": 1040, "epoch": 24} {"train_loss": -2.315600872039795, "global_step": 1041, "epoch": 24} {"train_loss": -2.458698272705078, "global_step": 1042, "epoch": 24} {"train_loss": -2.1943538188934326, "global_step": 1043, "epoch": 24} {"train_loss": -2.4986069202423096, "global_step": 1044, "epoch": 24} {"train_loss": -2.247040271759033, "global_step": 1045, "epoch": 24} {"train_loss": -2.4456915855407715, "global_step": 1046, "epoch": 24} {"train_loss": -2.286298990249634, "global_step": 1047, "epoch": 24} {"train_loss": -2.4054503440856934, "global_step": 1048, "epoch": 24} {"train_loss": -2.354058782259623, "global_step": 1049, "epoch": 24, "val_loss": 841201.375} {"train_loss": -2.4138665199279785, "global_step": 1050, "epoch": 25} {"train_loss": -2.2769641876220703, "global_step": 1051, "epoch": 25} {"train_loss": -2.4773733615875244, "global_step": 1052, "epoch": 25} {"train_loss": -2.33903169631958, "global_step": 1053, "epoch": 25} {"train_loss": -2.413449764251709, "global_step": 1054, "epoch": 25} {"train_loss": -2.3228724002838135, "global_step": 1055, "epoch": 25} {"train_loss": -2.5124714374542236, "global_step": 1056, "epoch": 25} {"train_loss": -2.3539175987243652, "global_step": 1057, "epoch": 25} {"train_loss": -2.428419828414917, "global_step": 1058, "epoch": 25} {"train_loss": -2.515108108520508, "global_step": 1059, "epoch": 25} {"train_loss": -2.473360776901245, "global_step": 1060, "epoch": 25} {"train_loss": -2.48744535446167, "global_step": 1061, "epoch": 25} {"train_loss": -2.594576835632324, "global_step": 1062, "epoch": 25} {"train_loss": -2.4312734603881836, "global_step": 1063, "epoch": 25} {"train_loss": -2.4177088737487793, "global_step": 1064, "epoch": 25} {"train_loss": -2.366706132888794, "global_step": 1065, "epoch": 25} {"train_loss": -2.3700997829437256, "global_step": 1066, "epoch": 25} {"train_loss": -2.3613121509552, "global_step": 1067, "epoch": 25} {"train_loss": -2.440321445465088, "global_step": 1068, "epoch": 25} {"train_loss": -2.3842005729675293, "global_step": 1069, "epoch": 25} {"train_loss": -2.2623939514160156, "global_step": 1070, "epoch": 25} {"train_loss": -2.457244396209717, "global_step": 1071, "epoch": 25} {"train_loss": -2.364703416824341, "global_step": 1072, "epoch": 25} {"train_loss": -2.32578182220459, "global_step": 1073, "epoch": 25} {"train_loss": -2.3303260803222656, "global_step": 1074, "epoch": 25} {"train_loss": -2.317225456237793, "global_step": 1075, "epoch": 25} {"train_loss": -2.491306781768799, "global_step": 1076, "epoch": 25} {"train_loss": -2.348186492919922, "global_step": 1077, "epoch": 25} {"train_loss": -2.45379638671875, "global_step": 1078, "epoch": 25} {"train_loss": -2.356301784515381, "global_step": 1079, "epoch": 25} {"train_loss": -2.473510980606079, "global_step": 1080, "epoch": 25} {"train_loss": -2.227037191390991, "global_step": 1081, "epoch": 25} {"train_loss": -2.4871318340301514, "global_step": 1082, "epoch": 25} {"train_loss": -2.337210178375244, "global_step": 1083, "epoch": 25} {"train_loss": -2.4437851905822754, "global_step": 1084, "epoch": 25} {"train_loss": -2.3633809089660645, "global_step": 1085, "epoch": 25} {"train_loss": -2.473125457763672, "global_step": 1086, "epoch": 25} {"train_loss": -2.4291844367980957, "global_step": 1087, "epoch": 25} {"train_loss": -2.4269018173217773, "global_step": 1088, "epoch": 25} {"train_loss": -2.4940361976623535, "global_step": 1089, "epoch": 25} {"train_loss": -2.504274606704712, "global_step": 1090, "epoch": 25} {"train_loss": -2.411369039898827, "global_step": 1091, "epoch": 25, "val_loss": 816417.5} {"train_loss": -2.346527099609375, "global_step": 1092, "epoch": 26} {"train_loss": -2.515956163406372, "global_step": 1093, "epoch": 26} {"train_loss": -2.324641704559326, "global_step": 1094, "epoch": 26} {"train_loss": -2.492155075073242, "global_step": 1095, "epoch": 26} {"train_loss": -2.3501510620117188, "global_step": 1096, "epoch": 26} {"train_loss": -2.4467830657958984, "global_step": 1097, "epoch": 26} {"train_loss": -2.4794483184814453, "global_step": 1098, "epoch": 26} {"train_loss": -2.3020949363708496, "global_step": 1099, "epoch": 26} {"train_loss": -2.5538833141326904, "global_step": 1100, "epoch": 26} {"train_loss": -2.406790256500244, "global_step": 1101, "epoch": 26} {"train_loss": -2.557917594909668, "global_step": 1102, "epoch": 26} {"train_loss": -2.43414306640625, "global_step": 1103, "epoch": 26} {"train_loss": -2.4133734703063965, "global_step": 1104, "epoch": 26} {"train_loss": -2.4770753383636475, "global_step": 1105, "epoch": 26} {"train_loss": -2.4473109245300293, "global_step": 1106, "epoch": 26} {"train_loss": -2.4122633934020996, "global_step": 1107, "epoch": 26} {"train_loss": -2.3830065727233887, "global_step": 1108, "epoch": 26} {"train_loss": -2.47689151763916, "global_step": 1109, "epoch": 26} {"train_loss": -2.446589231491089, "global_step": 1110, "epoch": 26} {"train_loss": -2.341031074523926, "global_step": 1111, "epoch": 26} {"train_loss": -2.473994016647339, "global_step": 1112, "epoch": 26} {"train_loss": -2.3588528633117676, "global_step": 1113, "epoch": 26} {"train_loss": -2.4347076416015625, "global_step": 1114, "epoch": 26} {"train_loss": -2.491647243499756, "global_step": 1115, "epoch": 26} {"train_loss": -2.5022428035736084, "global_step": 1116, "epoch": 26} {"train_loss": -2.5492939949035645, "global_step": 1117, "epoch": 26} {"train_loss": -2.536161422729492, "global_step": 1118, "epoch": 26} {"train_loss": -2.5333619117736816, "global_step": 1119, "epoch": 26} {"train_loss": -2.4554877281188965, "global_step": 1120, "epoch": 26} {"train_loss": -2.506748914718628, "global_step": 1121, "epoch": 26} {"train_loss": -2.504232168197632, "global_step": 1122, "epoch": 26} {"train_loss": -2.4341204166412354, "global_step": 1123, "epoch": 26} {"train_loss": -2.3791303634643555, "global_step": 1124, "epoch": 26} {"train_loss": -2.628377914428711, "global_step": 1125, "epoch": 26} {"train_loss": -2.4333837032318115, "global_step": 1126, "epoch": 26} {"train_loss": -2.5701663494110107, "global_step": 1127, "epoch": 26} {"train_loss": -2.4020919799804688, "global_step": 1128, "epoch": 26} {"train_loss": -2.375824213027954, "global_step": 1129, "epoch": 26} {"train_loss": -2.4935197830200195, "global_step": 1130, "epoch": 26} {"train_loss": -2.464421033859253, "global_step": 1131, "epoch": 26} {"train_loss": -2.41355037689209, "global_step": 1132, "epoch": 26} {"train_loss": -2.4550197578611828, "global_step": 1133, "epoch": 26, "val_loss": 767516.25} {"train_loss": -2.5355842113494873, "global_step": 1134, "epoch": 27} {"train_loss": -2.479161262512207, "global_step": 1135, "epoch": 27} {"train_loss": -2.4296624660491943, "global_step": 1136, "epoch": 27} {"train_loss": -2.3795461654663086, "global_step": 1137, "epoch": 27} {"train_loss": -2.5409932136535645, "global_step": 1138, "epoch": 27} {"train_loss": -2.5084781646728516, "global_step": 1139, "epoch": 27} {"train_loss": -2.43967604637146, "global_step": 1140, "epoch": 27} {"train_loss": -2.473419666290283, "global_step": 1141, "epoch": 27} {"train_loss": -2.585259437561035, "global_step": 1142, "epoch": 27} {"train_loss": -2.397266387939453, "global_step": 1143, "epoch": 27} {"train_loss": -2.6269307136535645, "global_step": 1144, "epoch": 27} {"train_loss": -2.471510410308838, "global_step": 1145, "epoch": 27} {"train_loss": -2.570888042449951, "global_step": 1146, "epoch": 27} {"train_loss": -2.243920087814331, "global_step": 1147, "epoch": 27} {"train_loss": -2.5042853355407715, "global_step": 1148, "epoch": 27} {"train_loss": -2.5404515266418457, "global_step": 1149, "epoch": 27} {"train_loss": -2.5095601081848145, "global_step": 1150, "epoch": 27} {"train_loss": -2.4006519317626953, "global_step": 1151, "epoch": 27} {"train_loss": -2.5752036571502686, "global_step": 1152, "epoch": 27} {"train_loss": -2.398693799972534, "global_step": 1153, "epoch": 27} {"train_loss": -2.668489933013916, "global_step": 1154, "epoch": 27} {"train_loss": -2.523627281188965, "global_step": 1155, "epoch": 27} {"train_loss": -2.38222074508667, "global_step": 1156, "epoch": 27} {"train_loss": -2.466034412384033, "global_step": 1157, "epoch": 27} {"train_loss": -2.407200336456299, "global_step": 1158, "epoch": 27} {"train_loss": -2.5839600563049316, "global_step": 1159, "epoch": 27} {"train_loss": -2.3143346309661865, "global_step": 1160, "epoch": 27} {"train_loss": -2.5678744316101074, "global_step": 1161, "epoch": 27} {"train_loss": -2.3498079776763916, "global_step": 1162, "epoch": 27} {"train_loss": -2.4303174018859863, "global_step": 1163, "epoch": 27} {"train_loss": -2.3864328861236572, "global_step": 1164, "epoch": 27} {"train_loss": -2.479536771774292, "global_step": 1165, "epoch": 27} {"train_loss": -2.500507354736328, "global_step": 1166, "epoch": 27} {"train_loss": -2.4808082580566406, "global_step": 1167, "epoch": 27} {"train_loss": -2.3709425926208496, "global_step": 1168, "epoch": 27} {"train_loss": -2.6291861534118652, "global_step": 1169, "epoch": 27} {"train_loss": -2.5455634593963623, "global_step": 1170, "epoch": 27} {"train_loss": -2.458139419555664, "global_step": 1171, "epoch": 27} {"train_loss": -2.448321580886841, "global_step": 1172, "epoch": 27} {"train_loss": -2.459423065185547, "global_step": 1173, "epoch": 27} {"train_loss": -2.5529065132141113, "global_step": 1174, "epoch": 27} {"train_loss": -2.478250060762678, "global_step": 1175, "epoch": 27, "val_loss": 737240.875} {"train_loss": -2.507568359375, "global_step": 1176, "epoch": 28} {"train_loss": -2.455799102783203, "global_step": 1177, "epoch": 28} {"train_loss": -2.596764087677002, "global_step": 1178, "epoch": 28} {"train_loss": -2.5701966285705566, "global_step": 1179, "epoch": 28} {"train_loss": -2.614867925643921, "global_step": 1180, "epoch": 28} {"train_loss": -2.4383432865142822, "global_step": 1181, "epoch": 28} {"train_loss": -2.529268264770508, "global_step": 1182, "epoch": 28} {"train_loss": -2.6247096061706543, "global_step": 1183, "epoch": 28} {"train_loss": -2.553480625152588, "global_step": 1184, "epoch": 28} {"train_loss": -2.5764122009277344, "global_step": 1185, "epoch": 28} {"train_loss": -2.487406015396118, "global_step": 1186, "epoch": 28} {"train_loss": -2.617311477661133, "global_step": 1187, "epoch": 28} {"train_loss": -2.491999626159668, "global_step": 1188, "epoch": 28} {"train_loss": -2.533052444458008, "global_step": 1189, "epoch": 28} {"train_loss": -2.630363941192627, "global_step": 1190, "epoch": 28} {"train_loss": -2.5893807411193848, "global_step": 1191, "epoch": 28} {"train_loss": -2.647826910018921, "global_step": 1192, "epoch": 28} {"train_loss": -2.503068447113037, "global_step": 1193, "epoch": 28} {"train_loss": -2.5776000022888184, "global_step": 1194, "epoch": 28} {"train_loss": -2.5689468383789062, "global_step": 1195, "epoch": 28} {"train_loss": -2.612866163253784, "global_step": 1196, "epoch": 28} {"train_loss": -2.5039525032043457, "global_step": 1197, "epoch": 28} {"train_loss": -2.306307315826416, "global_step": 1198, "epoch": 28} {"train_loss": -2.617246150970459, "global_step": 1199, "epoch": 28} {"train_loss": -2.5878520011901855, "global_step": 1200, "epoch": 28} {"train_loss": -2.3755903244018555, "global_step": 1201, "epoch": 28} {"train_loss": -2.504133939743042, "global_step": 1202, "epoch": 28} {"train_loss": -2.3477001190185547, "global_step": 1203, "epoch": 28} {"train_loss": -2.4611008167266846, "global_step": 1204, "epoch": 28} {"train_loss": -2.498013973236084, "global_step": 1205, "epoch": 28} {"train_loss": -2.4464430809020996, "global_step": 1206, "epoch": 28} {"train_loss": -2.502256393432617, "global_step": 1207, "epoch": 28} {"train_loss": -2.5925674438476562, "global_step": 1208, "epoch": 28} {"train_loss": -2.447636127471924, "global_step": 1209, "epoch": 28} {"train_loss": -2.6408495903015137, "global_step": 1210, "epoch": 28} {"train_loss": -2.5031566619873047, "global_step": 1211, "epoch": 28} {"train_loss": -2.6547369956970215, "global_step": 1212, "epoch": 28} {"train_loss": -2.4844954013824463, "global_step": 1213, "epoch": 28} {"train_loss": -2.590768337249756, "global_step": 1214, "epoch": 28} {"train_loss": -2.586977243423462, "global_step": 1215, "epoch": 28} {"train_loss": -2.518378496170044, "global_step": 1216, "epoch": 28} {"train_loss": -2.535174670673552, "global_step": 1217, "epoch": 28, "val_loss": 717288.6875} {"train_loss": -2.6526718139648438, "global_step": 1218, "epoch": 29} {"train_loss": -2.497915267944336, "global_step": 1219, "epoch": 29} {"train_loss": -2.594374179840088, "global_step": 1220, "epoch": 29} {"train_loss": -2.7192258834838867, "global_step": 1221, "epoch": 29} {"train_loss": -2.4869384765625, "global_step": 1222, "epoch": 29} {"train_loss": -2.500669002532959, "global_step": 1223, "epoch": 29} {"train_loss": -2.452193260192871, "global_step": 1224, "epoch": 29} {"train_loss": -2.4789068698883057, "global_step": 1225, "epoch": 29} {"train_loss": -2.6631155014038086, "global_step": 1226, "epoch": 29} {"train_loss": -2.663064479827881, "global_step": 1227, "epoch": 29} {"train_loss": -2.5063040256500244, "global_step": 1228, "epoch": 29} {"train_loss": -2.650845766067505, "global_step": 1229, "epoch": 29} {"train_loss": -2.531877040863037, "global_step": 1230, "epoch": 29} {"train_loss": -2.541604518890381, "global_step": 1231, "epoch": 29} {"train_loss": -2.684624195098877, "global_step": 1232, "epoch": 29} {"train_loss": -2.553115129470825, "global_step": 1233, "epoch": 29} {"train_loss": -2.5768346786499023, "global_step": 1234, "epoch": 29} {"train_loss": -2.6535086631774902, "global_step": 1235, "epoch": 29} {"train_loss": -2.593857765197754, "global_step": 1236, "epoch": 29} {"train_loss": -2.431250810623169, "global_step": 1237, "epoch": 29} {"train_loss": -2.8070931434631348, "global_step": 1238, "epoch": 29} {"train_loss": -2.5103464126586914, "global_step": 1239, "epoch": 29} {"train_loss": -2.6069912910461426, "global_step": 1240, "epoch": 29} {"train_loss": -2.630202054977417, "global_step": 1241, "epoch": 29} {"train_loss": -2.598813772201538, "global_step": 1242, "epoch": 29} {"train_loss": -2.43656063079834, "global_step": 1243, "epoch": 29} {"train_loss": -2.5692672729492188, "global_step": 1244, "epoch": 29} {"train_loss": -2.4645822048187256, "global_step": 1245, "epoch": 29} {"train_loss": -2.495197057723999, "global_step": 1246, "epoch": 29} {"train_loss": -2.788341999053955, "global_step": 1247, "epoch": 29} {"train_loss": -2.5828514099121094, "global_step": 1248, "epoch": 29} {"train_loss": -2.664306163787842, "global_step": 1249, "epoch": 29} {"train_loss": -2.5735015869140625, "global_step": 1250, "epoch": 29} {"train_loss": -2.657078504562378, "global_step": 1251, "epoch": 29} {"train_loss": -2.595695734024048, "global_step": 1252, "epoch": 29} {"train_loss": -2.660825490951538, "global_step": 1253, "epoch": 29} {"train_loss": -2.6857969760894775, "global_step": 1254, "epoch": 29} {"train_loss": -2.687389850616455, "global_step": 1255, "epoch": 29} {"train_loss": -2.4819908142089844, "global_step": 1256, "epoch": 29} {"train_loss": -2.5631492137908936, "global_step": 1257, "epoch": 29} {"train_loss": -2.7199482917785645, "global_step": 1258, "epoch": 29} {"train_loss": -2.591441063653855, "global_step": 1259, "epoch": 29, "val_loss": 677838.25} {"train_loss": -2.7673423290252686, "global_step": 1260, "epoch": 30} {"train_loss": -2.4676733016967773, "global_step": 1261, "epoch": 30} {"train_loss": -2.6274280548095703, "global_step": 1262, "epoch": 30} {"train_loss": -2.7854650020599365, "global_step": 1263, "epoch": 30} {"train_loss": -2.612056255340576, "global_step": 1264, "epoch": 30} {"train_loss": -2.811765193939209, "global_step": 1265, "epoch": 30} {"train_loss": -2.602170944213867, "global_step": 1266, "epoch": 30} {"train_loss": -2.657526969909668, "global_step": 1267, "epoch": 30} {"train_loss": -2.6475718021392822, "global_step": 1268, "epoch": 30} {"train_loss": -2.664628028869629, "global_step": 1269, "epoch": 30} {"train_loss": -2.834843635559082, "global_step": 1270, "epoch": 30} {"train_loss": -2.67478084564209, "global_step": 1271, "epoch": 30} {"train_loss": -2.7351245880126953, "global_step": 1272, "epoch": 30} {"train_loss": -2.657289743423462, "global_step": 1273, "epoch": 30} {"train_loss": -2.7905831336975098, "global_step": 1274, "epoch": 30} {"train_loss": -2.704697608947754, "global_step": 1275, "epoch": 30} {"train_loss": -2.4743282794952393, "global_step": 1276, "epoch": 30} {"train_loss": -2.60217547416687, "global_step": 1277, "epoch": 30} {"train_loss": -2.615586757659912, "global_step": 1278, "epoch": 30} {"train_loss": -2.6296205520629883, "global_step": 1279, "epoch": 30} {"train_loss": -2.707693099975586, "global_step": 1280, "epoch": 30} {"train_loss": -2.8011889457702637, "global_step": 1281, "epoch": 30} {"train_loss": -2.5715911388397217, "global_step": 1282, "epoch": 30} {"train_loss": -2.7646827697753906, "global_step": 1283, "epoch": 30} {"train_loss": -2.5276119709014893, "global_step": 1284, "epoch": 30} {"train_loss": -2.54056978225708, "global_step": 1285, "epoch": 30} {"train_loss": -2.5040929317474365, "global_step": 1286, "epoch": 30} {"train_loss": -2.641213893890381, "global_step": 1287, "epoch": 30} {"train_loss": -2.6116185188293457, "global_step": 1288, "epoch": 30} {"train_loss": -2.473231554031372, "global_step": 1289, "epoch": 30} {"train_loss": -2.7364962100982666, "global_step": 1290, "epoch": 30} {"train_loss": -2.519531726837158, "global_step": 1291, "epoch": 30} {"train_loss": -2.692964553833008, "global_step": 1292, "epoch": 30} {"train_loss": -2.702096939086914, "global_step": 1293, "epoch": 30} {"train_loss": -2.6449289321899414, "global_step": 1294, "epoch": 30} {"train_loss": -2.5092287063598633, "global_step": 1295, "epoch": 30} {"train_loss": -2.635645866394043, "global_step": 1296, "epoch": 30} {"train_loss": -2.477783441543579, "global_step": 1297, "epoch": 30} {"train_loss": -2.790390968322754, "global_step": 1298, "epoch": 30} {"train_loss": -2.7304553985595703, "global_step": 1299, "epoch": 30} {"train_loss": -2.455821990966797, "global_step": 1300, "epoch": 30} {"train_loss": -2.6446016970134916, "global_step": 1301, "epoch": 30, "val_loss": 660914.0625} {"train_loss": -2.492269992828369, "global_step": 1302, "epoch": 31} {"train_loss": -2.7452144622802734, "global_step": 1303, "epoch": 31} {"train_loss": -2.674008369445801, "global_step": 1304, "epoch": 31} {"train_loss": -2.7233829498291016, "global_step": 1305, "epoch": 31} {"train_loss": -2.70656681060791, "global_step": 1306, "epoch": 31} {"train_loss": -2.6645889282226562, "global_step": 1307, "epoch": 31} {"train_loss": -2.6853888034820557, "global_step": 1308, "epoch": 31} {"train_loss": -2.632336139678955, "global_step": 1309, "epoch": 31} {"train_loss": -2.626406669616699, "global_step": 1310, "epoch": 31} {"train_loss": -2.787921905517578, "global_step": 1311, "epoch": 31} {"train_loss": -2.6609740257263184, "global_step": 1312, "epoch": 31} {"train_loss": -2.739222764968872, "global_step": 1313, "epoch": 31} {"train_loss": -2.853696584701538, "global_step": 1314, "epoch": 31} {"train_loss": -2.858243465423584, "global_step": 1315, "epoch": 31} {"train_loss": -2.7481203079223633, "global_step": 1316, "epoch": 31} {"train_loss": -2.7626726627349854, "global_step": 1317, "epoch": 31} {"train_loss": -2.626189947128296, "global_step": 1318, "epoch": 31} {"train_loss": -2.7578506469726562, "global_step": 1319, "epoch": 31} {"train_loss": -2.67014741897583, "global_step": 1320, "epoch": 31} {"train_loss": -2.510416030883789, "global_step": 1321, "epoch": 31} {"train_loss": -2.7525711059570312, "global_step": 1322, "epoch": 31} {"train_loss": -2.710969924926758, "global_step": 1323, "epoch": 31} {"train_loss": -2.7540957927703857, "global_step": 1324, "epoch": 31} {"train_loss": -2.635082483291626, "global_step": 1325, "epoch": 31} {"train_loss": -2.7437570095062256, "global_step": 1326, "epoch": 31} {"train_loss": -2.777859687805176, "global_step": 1327, "epoch": 31} {"train_loss": -2.8679347038269043, "global_step": 1328, "epoch": 31} {"train_loss": -2.6924266815185547, "global_step": 1329, "epoch": 31} {"train_loss": -2.7521564960479736, "global_step": 1330, "epoch": 31} {"train_loss": -2.6664512157440186, "global_step": 1331, "epoch": 31} {"train_loss": -2.7661705017089844, "global_step": 1332, "epoch": 31} {"train_loss": -2.665283203125, "global_step": 1333, "epoch": 31} {"train_loss": -2.7547879219055176, "global_step": 1334, "epoch": 31} {"train_loss": -2.660271167755127, "global_step": 1335, "epoch": 31} {"train_loss": -2.9177908897399902, "global_step": 1336, "epoch": 31} {"train_loss": -2.6174654960632324, "global_step": 1337, "epoch": 31} {"train_loss": -2.5619397163391113, "global_step": 1338, "epoch": 31} {"train_loss": -2.6394214630126953, "global_step": 1339, "epoch": 31} {"train_loss": -2.7192611694335938, "global_step": 1340, "epoch": 31} {"train_loss": -2.61246919631958, "global_step": 1341, "epoch": 31} {"train_loss": -2.600466251373291, "global_step": 1342, "epoch": 31} {"train_loss": -2.705925385157267, "global_step": 1343, "epoch": 31, "val_loss": 639606.5625} {"train_loss": -2.5782992839813232, "global_step": 1344, "epoch": 32} {"train_loss": -2.713430166244507, "global_step": 1345, "epoch": 32} {"train_loss": -2.4615612030029297, "global_step": 1346, "epoch": 32} {"train_loss": -2.8102126121520996, "global_step": 1347, "epoch": 32} {"train_loss": -2.5399394035339355, "global_step": 1348, "epoch": 32} {"train_loss": -2.6957058906555176, "global_step": 1349, "epoch": 32} {"train_loss": -2.633009910583496, "global_step": 1350, "epoch": 32} {"train_loss": -2.715061664581299, "global_step": 1351, "epoch": 32} {"train_loss": -2.5259242057800293, "global_step": 1352, "epoch": 32} {"train_loss": -2.8003430366516113, "global_step": 1353, "epoch": 32} {"train_loss": -2.7757411003112793, "global_step": 1354, "epoch": 32} {"train_loss": -2.7255401611328125, "global_step": 1355, "epoch": 32} {"train_loss": -2.7425413131713867, "global_step": 1356, "epoch": 32} {"train_loss": -2.8256609439849854, "global_step": 1357, "epoch": 32} {"train_loss": -2.768733024597168, "global_step": 1358, "epoch": 32} {"train_loss": -2.6704530715942383, "global_step": 1359, "epoch": 32} {"train_loss": -2.791883707046509, "global_step": 1360, "epoch": 32} {"train_loss": -2.9065160751342773, "global_step": 1361, "epoch": 32} {"train_loss": -2.7731893062591553, "global_step": 1362, "epoch": 32} {"train_loss": -2.8695950508117676, "global_step": 1363, "epoch": 32} {"train_loss": -2.8638761043548584, "global_step": 1364, "epoch": 32} {"train_loss": -2.7173078060150146, "global_step": 1365, "epoch": 32} {"train_loss": -2.8830080032348633, "global_step": 1366, "epoch": 32} {"train_loss": -2.834393262863159, "global_step": 1367, "epoch": 32} {"train_loss": -2.7199912071228027, "global_step": 1368, "epoch": 32} {"train_loss": -2.726935863494873, "global_step": 1369, "epoch": 32} {"train_loss": -2.6214160919189453, "global_step": 1370, "epoch": 32} {"train_loss": -2.6680891513824463, "global_step": 1371, "epoch": 32} {"train_loss": -2.655282974243164, "global_step": 1372, "epoch": 32} {"train_loss": -2.6306519508361816, "global_step": 1373, "epoch": 32} {"train_loss": -2.810408353805542, "global_step": 1374, "epoch": 32} {"train_loss": -2.7738852500915527, "global_step": 1375, "epoch": 32} {"train_loss": -2.6724905967712402, "global_step": 1376, "epoch": 32} {"train_loss": -2.709242343902588, "global_step": 1377, "epoch": 32} {"train_loss": -2.921505928039551, "global_step": 1378, "epoch": 32} {"train_loss": -2.735586166381836, "global_step": 1379, "epoch": 32} {"train_loss": -2.7625246047973633, "global_step": 1380, "epoch": 32} {"train_loss": -2.7312355041503906, "global_step": 1381, "epoch": 32} {"train_loss": -2.751132011413574, "global_step": 1382, "epoch": 32} {"train_loss": -2.5535171031951904, "global_step": 1383, "epoch": 32} {"train_loss": -2.7321176528930664, "global_step": 1384, "epoch": 32} {"train_loss": -2.717596002987453, "global_step": 1385, "epoch": 32, "val_loss": 601370.5} {"train_loss": -2.6907706260681152, "global_step": 1386, "epoch": 33} {"train_loss": -2.404118061065674, "global_step": 1387, "epoch": 33} {"train_loss": -2.8317174911499023, "global_step": 1388, "epoch": 33} {"train_loss": -2.335580587387085, "global_step": 1389, "epoch": 33} {"train_loss": -2.7172858715057373, "global_step": 1390, "epoch": 33} {"train_loss": -2.45658540725708, "global_step": 1391, "epoch": 33} {"train_loss": -2.7326273918151855, "global_step": 1392, "epoch": 33} {"train_loss": -2.549877166748047, "global_step": 1393, "epoch": 33} {"train_loss": -2.602431058883667, "global_step": 1394, "epoch": 33} {"train_loss": -2.711716890335083, "global_step": 1395, "epoch": 33} {"train_loss": -2.4338765144348145, "global_step": 1396, "epoch": 33} {"train_loss": -2.6415276527404785, "global_step": 1397, "epoch": 33} {"train_loss": -2.5244593620300293, "global_step": 1398, "epoch": 33} {"train_loss": -2.656041383743286, "global_step": 1399, "epoch": 33} {"train_loss": -2.6770200729370117, "global_step": 1400, "epoch": 33} {"train_loss": -2.543821334838867, "global_step": 1401, "epoch": 33} {"train_loss": -2.6725635528564453, "global_step": 1402, "epoch": 33} {"train_loss": -2.5550496578216553, "global_step": 1403, "epoch": 33} {"train_loss": -2.6425421237945557, "global_step": 1404, "epoch": 33} {"train_loss": -2.674609661102295, "global_step": 1405, "epoch": 33} {"train_loss": -2.725126266479492, "global_step": 1406, "epoch": 33} {"train_loss": -2.439911365509033, "global_step": 1407, "epoch": 33} {"train_loss": -2.794693946838379, "global_step": 1408, "epoch": 33} {"train_loss": -2.513648748397827, "global_step": 1409, "epoch": 33} {"train_loss": -2.6763968467712402, "global_step": 1410, "epoch": 33} {"train_loss": -2.6350648403167725, "global_step": 1411, "epoch": 33} {"train_loss": -2.751736640930176, "global_step": 1412, "epoch": 33} {"train_loss": -2.5809175968170166, "global_step": 1413, "epoch": 33} {"train_loss": -2.7031025886535645, "global_step": 1414, "epoch": 33} {"train_loss": -2.701295852661133, "global_step": 1415, "epoch": 33} {"train_loss": -2.748312473297119, "global_step": 1416, "epoch": 33} {"train_loss": -2.72000789642334, "global_step": 1417, "epoch": 33} {"train_loss": -2.7379064559936523, "global_step": 1418, "epoch": 33} {"train_loss": -2.8268160820007324, "global_step": 1419, "epoch": 33} {"train_loss": -2.72589373588562, "global_step": 1420, "epoch": 33} {"train_loss": -2.86458158493042, "global_step": 1421, "epoch": 33} {"train_loss": -2.8260068893432617, "global_step": 1422, "epoch": 33} {"train_loss": -2.7948338985443115, "global_step": 1423, "epoch": 33} {"train_loss": -2.8091936111450195, "global_step": 1424, "epoch": 33} {"train_loss": -2.8492302894592285, "global_step": 1425, "epoch": 33} {"train_loss": -2.722339630126953, "global_step": 1426, "epoch": 33} {"train_loss": -2.670006962049575, "global_step": 1427, "epoch": 33, "val_loss": 576736.875} {"train_loss": -2.7200398445129395, "global_step": 1428, "epoch": 34} {"train_loss": -2.6052520275115967, "global_step": 1429, "epoch": 34} {"train_loss": -2.883086681365967, "global_step": 1430, "epoch": 34} {"train_loss": -2.8482303619384766, "global_step": 1431, "epoch": 34} {"train_loss": -2.7552578449249268, "global_step": 1432, "epoch": 34} {"train_loss": -2.868795394897461, "global_step": 1433, "epoch": 34} {"train_loss": -2.8383660316467285, "global_step": 1434, "epoch": 34} {"train_loss": -2.884788990020752, "global_step": 1435, "epoch": 34} {"train_loss": -2.7942099571228027, "global_step": 1436, "epoch": 34} {"train_loss": -2.8783907890319824, "global_step": 1437, "epoch": 34} {"train_loss": -2.8628859519958496, "global_step": 1438, "epoch": 34} {"train_loss": -2.9630751609802246, "global_step": 1439, "epoch": 34} {"train_loss": -2.6823036670684814, "global_step": 1440, "epoch": 34} {"train_loss": -2.799781560897827, "global_step": 1441, "epoch": 34} {"train_loss": -2.6040472984313965, "global_step": 1442, "epoch": 34} {"train_loss": -2.780841827392578, "global_step": 1443, "epoch": 34} {"train_loss": -2.8136825561523438, "global_step": 1444, "epoch": 34} {"train_loss": -2.7356464862823486, "global_step": 1445, "epoch": 34} {"train_loss": -2.7496774196624756, "global_step": 1446, "epoch": 34} {"train_loss": -2.6701340675354004, "global_step": 1447, "epoch": 34} {"train_loss": -2.8220202922821045, "global_step": 1448, "epoch": 34} {"train_loss": -2.6878561973571777, "global_step": 1449, "epoch": 34} {"train_loss": -2.900521755218506, "global_step": 1450, "epoch": 34} {"train_loss": -2.78237247467041, "global_step": 1451, "epoch": 34} {"train_loss": -2.9282960891723633, "global_step": 1452, "epoch": 34} {"train_loss": -2.747567892074585, "global_step": 1453, "epoch": 34} {"train_loss": -2.867711067199707, "global_step": 1454, "epoch": 34} {"train_loss": -2.8802714347839355, "global_step": 1455, "epoch": 34} {"train_loss": -2.9004769325256348, "global_step": 1456, "epoch": 34} {"train_loss": -2.7804360389709473, "global_step": 1457, "epoch": 34} {"train_loss": -2.900351047515869, "global_step": 1458, "epoch": 34} {"train_loss": -2.825446605682373, "global_step": 1459, "epoch": 34} {"train_loss": -2.89322566986084, "global_step": 1460, "epoch": 34} {"train_loss": -2.8460209369659424, "global_step": 1461, "epoch": 34} {"train_loss": -2.787034511566162, "global_step": 1462, "epoch": 34} {"train_loss": -2.764860153198242, "global_step": 1463, "epoch": 34} {"train_loss": -2.916006088256836, "global_step": 1464, "epoch": 34} {"train_loss": -2.8232226371765137, "global_step": 1465, "epoch": 34} {"train_loss": -2.852719306945801, "global_step": 1466, "epoch": 34} {"train_loss": -2.7999205589294434, "global_step": 1467, "epoch": 34} {"train_loss": -2.81437087059021, "global_step": 1468, "epoch": 34} {"train_loss": -2.8148985022590276, "global_step": 1469, "epoch": 34, "val_loss": 555142.4375} {"train_loss": -2.736189126968384, "global_step": 1470, "epoch": 35} {"train_loss": -2.801342487335205, "global_step": 1471, "epoch": 35} {"train_loss": -2.7538437843322754, "global_step": 1472, "epoch": 35} {"train_loss": -2.8253531455993652, "global_step": 1473, "epoch": 35} {"train_loss": -2.938535690307617, "global_step": 1474, "epoch": 35} {"train_loss": -2.8876450061798096, "global_step": 1475, "epoch": 35} {"train_loss": -2.8090758323669434, "global_step": 1476, "epoch": 35} {"train_loss": -2.907984972000122, "global_step": 1477, "epoch": 35} {"train_loss": -2.804394245147705, "global_step": 1478, "epoch": 35} {"train_loss": -2.8605384826660156, "global_step": 1479, "epoch": 35} {"train_loss": -2.788557529449463, "global_step": 1480, "epoch": 35} {"train_loss": -2.72224760055542, "global_step": 1481, "epoch": 35} {"train_loss": -2.7962441444396973, "global_step": 1482, "epoch": 35} {"train_loss": -2.7934696674346924, "global_step": 1483, "epoch": 35} {"train_loss": -2.6335365772247314, "global_step": 1484, "epoch": 35} {"train_loss": -2.83799409866333, "global_step": 1485, "epoch": 35} {"train_loss": -2.6327054500579834, "global_step": 1486, "epoch": 35} {"train_loss": -2.826474666595459, "global_step": 1487, "epoch": 35} {"train_loss": -2.71537184715271, "global_step": 1488, "epoch": 35} {"train_loss": -2.8857626914978027, "global_step": 1489, "epoch": 35} {"train_loss": -2.6656651496887207, "global_step": 1490, "epoch": 35} {"train_loss": -2.9482338428497314, "global_step": 1491, "epoch": 35} {"train_loss": -2.8101117610931396, "global_step": 1492, "epoch": 35} {"train_loss": -2.954220771789551, "global_step": 1493, "epoch": 35} {"train_loss": -2.84182071685791, "global_step": 1494, "epoch": 35} {"train_loss": -2.835872173309326, "global_step": 1495, "epoch": 35} {"train_loss": -2.7697348594665527, "global_step": 1496, "epoch": 35} {"train_loss": -2.758758068084717, "global_step": 1497, "epoch": 35} {"train_loss": -2.886275291442871, "global_step": 1498, "epoch": 35} {"train_loss": -2.9902236461639404, "global_step": 1499, "epoch": 35} {"train_loss": -3.0058140754699707, "global_step": 1500, "epoch": 35} {"train_loss": -2.826878547668457, "global_step": 1501, "epoch": 35} {"train_loss": -2.711916208267212, "global_step": 1502, "epoch": 35} {"train_loss": -2.8775839805603027, "global_step": 1503, "epoch": 35} {"train_loss": -2.9915528297424316, "global_step": 1504, "epoch": 35} {"train_loss": -2.8019049167633057, "global_step": 1505, "epoch": 35} {"train_loss": -2.846501588821411, "global_step": 1506, "epoch": 35} {"train_loss": -2.769819736480713, "global_step": 1507, "epoch": 35} {"train_loss": -2.8006591796875, "global_step": 1508, "epoch": 35} {"train_loss": -2.7363743782043457, "global_step": 1509, "epoch": 35} {"train_loss": -2.8839685916900635, "global_step": 1510, "epoch": 35} {"train_loss": -2.8172018073853993, "global_step": 1511, "epoch": 35, "val_loss": 537398.25} {"train_loss": -2.8175487518310547, "global_step": 1512, "epoch": 36} {"train_loss": -2.633955955505371, "global_step": 1513, "epoch": 36} {"train_loss": -2.7123827934265137, "global_step": 1514, "epoch": 36} {"train_loss": -2.8094727993011475, "global_step": 1515, "epoch": 36} {"train_loss": -2.8735246658325195, "global_step": 1516, "epoch": 36} {"train_loss": -3.0681686401367188, "global_step": 1517, "epoch": 36} {"train_loss": -2.855442523956299, "global_step": 1518, "epoch": 36} {"train_loss": -2.856266736984253, "global_step": 1519, "epoch": 36} {"train_loss": -2.8882827758789062, "global_step": 1520, "epoch": 36} {"train_loss": -2.996196985244751, "global_step": 1521, "epoch": 36} {"train_loss": -2.716468334197998, "global_step": 1522, "epoch": 36} {"train_loss": -2.865629196166992, "global_step": 1523, "epoch": 36} {"train_loss": -2.642764091491699, "global_step": 1524, "epoch": 36} {"train_loss": -2.929586172103882, "global_step": 1525, "epoch": 36} {"train_loss": -2.6343894004821777, "global_step": 1526, "epoch": 36} {"train_loss": -2.7284352779388428, "global_step": 1527, "epoch": 36} {"train_loss": -2.714691638946533, "global_step": 1528, "epoch": 36} {"train_loss": -2.8361127376556396, "global_step": 1529, "epoch": 36} {"train_loss": -2.605809211730957, "global_step": 1530, "epoch": 36} {"train_loss": -2.8812711238861084, "global_step": 1531, "epoch": 36} {"train_loss": -2.6608242988586426, "global_step": 1532, "epoch": 36} {"train_loss": -2.879624366760254, "global_step": 1533, "epoch": 36} {"train_loss": -2.6818954944610596, "global_step": 1534, "epoch": 36} {"train_loss": -2.9580435752868652, "global_step": 1535, "epoch": 36} {"train_loss": -2.817196846008301, "global_step": 1536, "epoch": 36} {"train_loss": -2.7082107067108154, "global_step": 1537, "epoch": 36} {"train_loss": -2.821913242340088, "global_step": 1538, "epoch": 36} {"train_loss": -2.7069172859191895, "global_step": 1539, "epoch": 36} {"train_loss": -2.879296064376831, "global_step": 1540, "epoch": 36} {"train_loss": -2.7640204429626465, "global_step": 1541, "epoch": 36} {"train_loss": -2.9168953895568848, "global_step": 1542, "epoch": 36} {"train_loss": -2.8298792839050293, "global_step": 1543, "epoch": 36} {"train_loss": -2.910712718963623, "global_step": 1544, "epoch": 36} {"train_loss": -2.8377397060394287, "global_step": 1545, "epoch": 36} {"train_loss": -2.9839460849761963, "global_step": 1546, "epoch": 36} {"train_loss": -2.925462245941162, "global_step": 1547, "epoch": 36} {"train_loss": -2.8927080631256104, "global_step": 1548, "epoch": 36} {"train_loss": -2.8367960453033447, "global_step": 1549, "epoch": 36} {"train_loss": -2.9854049682617188, "global_step": 1550, "epoch": 36} {"train_loss": -2.941084861755371, "global_step": 1551, "epoch": 36} {"train_loss": -2.91802978515625, "global_step": 1552, "epoch": 36} {"train_loss": -2.8302697397413707, "global_step": 1553, "epoch": 36, "val_loss": 512915.625} {"train_loss": -2.816866636276245, "global_step": 1554, "epoch": 37} {"train_loss": -2.9716944694519043, "global_step": 1555, "epoch": 37} {"train_loss": -2.9932143688201904, "global_step": 1556, "epoch": 37} {"train_loss": -2.86604642868042, "global_step": 1557, "epoch": 37} {"train_loss": -2.8328135013580322, "global_step": 1558, "epoch": 37} {"train_loss": -3.017590284347534, "global_step": 1559, "epoch": 37} {"train_loss": -2.9588570594787598, "global_step": 1560, "epoch": 37} {"train_loss": -2.9900622367858887, "global_step": 1561, "epoch": 37} {"train_loss": -2.8224329948425293, "global_step": 1562, "epoch": 37} {"train_loss": -3.046034574508667, "global_step": 1563, "epoch": 37} {"train_loss": -3.0093493461608887, "global_step": 1564, "epoch": 37} {"train_loss": -2.9688448905944824, "global_step": 1565, "epoch": 37} {"train_loss": -2.9395649433135986, "global_step": 1566, "epoch": 37} {"train_loss": -3.0229039192199707, "global_step": 1567, "epoch": 37} {"train_loss": -2.998645782470703, "global_step": 1568, "epoch": 37} {"train_loss": -2.963487386703491, "global_step": 1569, "epoch": 37} {"train_loss": -2.8241031169891357, "global_step": 1570, "epoch": 37} {"train_loss": -2.853759765625, "global_step": 1571, "epoch": 37} {"train_loss": -2.964837074279785, "global_step": 1572, "epoch": 37} {"train_loss": -2.813277006149292, "global_step": 1573, "epoch": 37} {"train_loss": -2.92012095451355, "global_step": 1574, "epoch": 37} {"train_loss": -2.934790849685669, "global_step": 1575, "epoch": 37} {"train_loss": -2.9735374450683594, "global_step": 1576, "epoch": 37} {"train_loss": -2.968588352203369, "global_step": 1577, "epoch": 37} {"train_loss": -2.8000402450561523, "global_step": 1578, "epoch": 37} {"train_loss": -2.9560184478759766, "global_step": 1579, "epoch": 37} {"train_loss": -2.676267623901367, "global_step": 1580, "epoch": 37} {"train_loss": -3.063636302947998, "global_step": 1581, "epoch": 37} {"train_loss": -2.6885323524475098, "global_step": 1582, "epoch": 37} {"train_loss": -2.796813488006592, "global_step": 1583, "epoch": 37} {"train_loss": -2.6787161827087402, "global_step": 1584, "epoch": 37} {"train_loss": -2.9599688053131104, "global_step": 1585, "epoch": 37} {"train_loss": -2.6078174114227295, "global_step": 1586, "epoch": 37} {"train_loss": -2.9874520301818848, "global_step": 1587, "epoch": 37} {"train_loss": -2.937169075012207, "global_step": 1588, "epoch": 37} {"train_loss": -2.957406520843506, "global_step": 1589, "epoch": 37} {"train_loss": -2.7677860260009766, "global_step": 1590, "epoch": 37} {"train_loss": -2.9328274726867676, "global_step": 1591, "epoch": 37} {"train_loss": -2.6848835945129395, "global_step": 1592, "epoch": 37} {"train_loss": -2.938291072845459, "global_step": 1593, "epoch": 37} {"train_loss": -2.8014461994171143, "global_step": 1594, "epoch": 37} {"train_loss": -2.89458167552948, "global_step": 1595, "epoch": 37, "val_loss": 497908.375} {"train_loss": -3.0094964504241943, "global_step": 1596, "epoch": 38} {"train_loss": -2.854606866836548, "global_step": 1597, "epoch": 38} {"train_loss": -3.0082809925079346, "global_step": 1598, "epoch": 38} {"train_loss": -2.8462228775024414, "global_step": 1599, "epoch": 38} {"train_loss": -3.0871634483337402, "global_step": 1600, "epoch": 38} {"train_loss": -2.9025115966796875, "global_step": 1601, "epoch": 38} {"train_loss": -2.85392427444458, "global_step": 1602, "epoch": 38} {"train_loss": -2.978386402130127, "global_step": 1603, "epoch": 38} {"train_loss": -2.9580297470092773, "global_step": 1604, "epoch": 38} {"train_loss": -2.7885634899139404, "global_step": 1605, "epoch": 38} {"train_loss": -2.915377140045166, "global_step": 1606, "epoch": 38} {"train_loss": -2.9158899784088135, "global_step": 1607, "epoch": 38} {"train_loss": -2.914175033569336, "global_step": 1608, "epoch": 38} {"train_loss": -3.0658950805664062, "global_step": 1609, "epoch": 38} {"train_loss": -2.8030967712402344, "global_step": 1610, "epoch": 38} {"train_loss": -2.752084493637085, "global_step": 1611, "epoch": 38} {"train_loss": -2.9762425422668457, "global_step": 1612, "epoch": 38} {"train_loss": -2.8876662254333496, "global_step": 1613, "epoch": 38} {"train_loss": -2.967561721801758, "global_step": 1614, "epoch": 38} {"train_loss": -2.912864923477173, "global_step": 1615, "epoch": 38} {"train_loss": -2.804777145385742, "global_step": 1616, "epoch": 38} {"train_loss": -2.969125270843506, "global_step": 1617, "epoch": 38} {"train_loss": -2.98663592338562, "global_step": 1618, "epoch": 38} {"train_loss": -2.832036018371582, "global_step": 1619, "epoch": 38} {"train_loss": -3.095592975616455, "global_step": 1620, "epoch": 38} {"train_loss": -2.763000726699829, "global_step": 1621, "epoch": 38} {"train_loss": -3.0756986141204834, "global_step": 1622, "epoch": 38} {"train_loss": -2.9765243530273438, "global_step": 1623, "epoch": 38} {"train_loss": -2.954890727996826, "global_step": 1624, "epoch": 38} {"train_loss": -3.0051727294921875, "global_step": 1625, "epoch": 38} {"train_loss": -2.833796739578247, "global_step": 1626, "epoch": 38} {"train_loss": -2.940850019454956, "global_step": 1627, "epoch": 38} {"train_loss": -3.0149264335632324, "global_step": 1628, "epoch": 38} {"train_loss": -2.9813380241394043, "global_step": 1629, "epoch": 38} {"train_loss": -3.044853687286377, "global_step": 1630, "epoch": 38} {"train_loss": -2.943660259246826, "global_step": 1631, "epoch": 38} {"train_loss": -3.005509853363037, "global_step": 1632, "epoch": 38} {"train_loss": -3.113657236099243, "global_step": 1633, "epoch": 38} {"train_loss": -2.995152711868286, "global_step": 1634, "epoch": 38} {"train_loss": -3.034106731414795, "global_step": 1635, "epoch": 38} {"train_loss": -2.991184711456299, "global_step": 1636, "epoch": 38} {"train_loss": -2.9470781769071306, "global_step": 1637, "epoch": 38, "val_loss": 472707.9375} {"train_loss": -3.083122491836548, "global_step": 1638, "epoch": 39} {"train_loss": -3.0072243213653564, "global_step": 1639, "epoch": 39} {"train_loss": -2.931999683380127, "global_step": 1640, "epoch": 39} {"train_loss": -3.0475568771362305, "global_step": 1641, "epoch": 39} {"train_loss": -3.095426559448242, "global_step": 1642, "epoch": 39} {"train_loss": -2.942786693572998, "global_step": 1643, "epoch": 39} {"train_loss": -3.0310912132263184, "global_step": 1644, "epoch": 39} {"train_loss": -2.964125156402588, "global_step": 1645, "epoch": 39} {"train_loss": -2.999302864074707, "global_step": 1646, "epoch": 39} {"train_loss": -2.976449489593506, "global_step": 1647, "epoch": 39} {"train_loss": -3.046945571899414, "global_step": 1648, "epoch": 39} {"train_loss": -3.0800845623016357, "global_step": 1649, "epoch": 39} {"train_loss": -3.0952863693237305, "global_step": 1650, "epoch": 39} {"train_loss": -3.029791831970215, "global_step": 1651, "epoch": 39} {"train_loss": -2.9566471576690674, "global_step": 1652, "epoch": 39} {"train_loss": -2.894325017929077, "global_step": 1653, "epoch": 39} {"train_loss": -3.1791481971740723, "global_step": 1654, "epoch": 39} {"train_loss": -3.0527758598327637, "global_step": 1655, "epoch": 39} {"train_loss": -2.9260661602020264, "global_step": 1656, "epoch": 39} {"train_loss": -2.8213729858398438, "global_step": 1657, "epoch": 39} {"train_loss": -3.0564351081848145, "global_step": 1658, "epoch": 39} {"train_loss": -2.704387664794922, "global_step": 1659, "epoch": 39} {"train_loss": -2.971970796585083, "global_step": 1660, "epoch": 39} {"train_loss": -2.973175525665283, "global_step": 1661, "epoch": 39} {"train_loss": -2.907381772994995, "global_step": 1662, "epoch": 39} {"train_loss": -3.1110029220581055, "global_step": 1663, "epoch": 39} {"train_loss": -2.987992763519287, "global_step": 1664, "epoch": 39} {"train_loss": -2.9537734985351562, "global_step": 1665, "epoch": 39} {"train_loss": -3.04691219329834, "global_step": 1666, "epoch": 39} {"train_loss": -3.106520414352417, "global_step": 1667, "epoch": 39} {"train_loss": -2.946190595626831, "global_step": 1668, "epoch": 39} {"train_loss": -3.0546793937683105, "global_step": 1669, "epoch": 39} {"train_loss": -2.9551103115081787, "global_step": 1670, "epoch": 39} {"train_loss": -2.9558568000793457, "global_step": 1671, "epoch": 39} {"train_loss": -3.122224807739258, "global_step": 1672, "epoch": 39} {"train_loss": -3.0545787811279297, "global_step": 1673, "epoch": 39} {"train_loss": -2.8945324420928955, "global_step": 1674, "epoch": 39} {"train_loss": -3.0709519386291504, "global_step": 1675, "epoch": 39} {"train_loss": -2.957796573638916, "global_step": 1676, "epoch": 39} {"train_loss": -2.9654541015625, "global_step": 1677, "epoch": 39} {"train_loss": -3.1573853492736816, "global_step": 1678, "epoch": 39} {"train_loss": -2.9982240824472335, "global_step": 1679, "epoch": 39, "val_loss": 453631.84375} {"train_loss": -3.081845283508301, "global_step": 1680, "epoch": 40} {"train_loss": -2.939021110534668, "global_step": 1681, "epoch": 40} {"train_loss": -3.042109489440918, "global_step": 1682, "epoch": 40} {"train_loss": -3.036982774734497, "global_step": 1683, "epoch": 40} {"train_loss": -2.972480535507202, "global_step": 1684, "epoch": 40} {"train_loss": -2.9842777252197266, "global_step": 1685, "epoch": 40} {"train_loss": -2.700751304626465, "global_step": 1686, "epoch": 40} {"train_loss": -3.0501816272735596, "global_step": 1687, "epoch": 40} {"train_loss": -2.797531843185425, "global_step": 1688, "epoch": 40} {"train_loss": -3.1492390632629395, "global_step": 1689, "epoch": 40} {"train_loss": -2.824014186859131, "global_step": 1690, "epoch": 40} {"train_loss": -2.910832405090332, "global_step": 1691, "epoch": 40} {"train_loss": -2.99615216255188, "global_step": 1692, "epoch": 40} {"train_loss": -2.9496781826019287, "global_step": 1693, "epoch": 40} {"train_loss": -2.966059923171997, "global_step": 1694, "epoch": 40} {"train_loss": -3.0620198249816895, "global_step": 1695, "epoch": 40} {"train_loss": -3.054239511489868, "global_step": 1696, "epoch": 40} {"train_loss": -2.9701550006866455, "global_step": 1697, "epoch": 40} {"train_loss": -2.9831671714782715, "global_step": 1698, "epoch": 40} {"train_loss": -2.7978415489196777, "global_step": 1699, "epoch": 40} {"train_loss": -3.040767192840576, "global_step": 1700, "epoch": 40} {"train_loss": -2.8311023712158203, "global_step": 1701, "epoch": 40} {"train_loss": -3.1550393104553223, "global_step": 1702, "epoch": 40} {"train_loss": -2.90396785736084, "global_step": 1703, "epoch": 40} {"train_loss": -3.0834460258483887, "global_step": 1704, "epoch": 40} {"train_loss": -2.903299570083618, "global_step": 1705, "epoch": 40} {"train_loss": -2.962244749069214, "global_step": 1706, "epoch": 40} {"train_loss": -2.897886276245117, "global_step": 1707, "epoch": 40} {"train_loss": -3.1080923080444336, "global_step": 1708, "epoch": 40} {"train_loss": -2.9909961223602295, "global_step": 1709, "epoch": 40} {"train_loss": -3.1046206951141357, "global_step": 1710, "epoch": 40} {"train_loss": -3.023386001586914, "global_step": 1711, "epoch": 40} {"train_loss": -3.0434765815734863, "global_step": 1712, "epoch": 40} {"train_loss": -3.105282783508301, "global_step": 1713, "epoch": 40} {"train_loss": -3.065462112426758, "global_step": 1714, "epoch": 40} {"train_loss": -3.1941733360290527, "global_step": 1715, "epoch": 40} {"train_loss": -2.972205638885498, "global_step": 1716, "epoch": 40} {"train_loss": -3.0856246948242188, "global_step": 1717, "epoch": 40} {"train_loss": -3.1244704723358154, "global_step": 1718, "epoch": 40} {"train_loss": -3.1662650108337402, "global_step": 1719, "epoch": 40} {"train_loss": -3.0612645149230957, "global_step": 1720, "epoch": 40} {"train_loss": -3.0012311935424805, "global_step": 1721, "epoch": 40, "val_loss": 435971.09375} {"train_loss": -3.184654712677002, "global_step": 1722, "epoch": 41} {"train_loss": -3.1389148235321045, "global_step": 1723, "epoch": 41} {"train_loss": -3.0023560523986816, "global_step": 1724, "epoch": 41} {"train_loss": -3.1280412673950195, "global_step": 1725, "epoch": 41} {"train_loss": -2.893610954284668, "global_step": 1726, "epoch": 41} {"train_loss": -3.136039972305298, "global_step": 1727, "epoch": 41} {"train_loss": -3.039360523223877, "global_step": 1728, "epoch": 41} {"train_loss": -3.1615538597106934, "global_step": 1729, "epoch": 41} {"train_loss": -3.0457019805908203, "global_step": 1730, "epoch": 41} {"train_loss": -2.941960334777832, "global_step": 1731, "epoch": 41} {"train_loss": -2.888822317123413, "global_step": 1732, "epoch": 41} {"train_loss": -3.0657763481140137, "global_step": 1733, "epoch": 41} {"train_loss": -2.944331645965576, "global_step": 1734, "epoch": 41} {"train_loss": -2.910585880279541, "global_step": 1735, "epoch": 41} {"train_loss": -3.1205430030822754, "global_step": 1736, "epoch": 41} {"train_loss": -3.0155773162841797, "global_step": 1737, "epoch": 41} {"train_loss": -2.998264789581299, "global_step": 1738, "epoch": 41} {"train_loss": -3.161038875579834, "global_step": 1739, "epoch": 41} {"train_loss": -3.164433002471924, "global_step": 1740, "epoch": 41} {"train_loss": -2.820988178253174, "global_step": 1741, "epoch": 41} {"train_loss": -3.0136258602142334, "global_step": 1742, "epoch": 41} {"train_loss": -3.023515224456787, "global_step": 1743, "epoch": 41} {"train_loss": -2.986804246902466, "global_step": 1744, "epoch": 41} {"train_loss": -3.0485472679138184, "global_step": 1745, "epoch": 41} {"train_loss": -3.0739989280700684, "global_step": 1746, "epoch": 41} {"train_loss": -3.0351109504699707, "global_step": 1747, "epoch": 41} {"train_loss": -2.9524624347686768, "global_step": 1748, "epoch": 41} {"train_loss": -3.2277326583862305, "global_step": 1749, "epoch": 41} {"train_loss": -3.028635025024414, "global_step": 1750, "epoch": 41} {"train_loss": -3.0988521575927734, "global_step": 1751, "epoch": 41} {"train_loss": -3.1047606468200684, "global_step": 1752, "epoch": 41} {"train_loss": -3.061779260635376, "global_step": 1753, "epoch": 41} {"train_loss": -3.0220437049865723, "global_step": 1754, "epoch": 41} {"train_loss": -3.224135398864746, "global_step": 1755, "epoch": 41} {"train_loss": -3.1709837913513184, "global_step": 1756, "epoch": 41} {"train_loss": -3.095156192779541, "global_step": 1757, "epoch": 41} {"train_loss": -3.2461071014404297, "global_step": 1758, "epoch": 41} {"train_loss": -3.2518975734710693, "global_step": 1759, "epoch": 41} {"train_loss": -3.168379783630371, "global_step": 1760, "epoch": 41} {"train_loss": -3.210226535797119, "global_step": 1761, "epoch": 41} {"train_loss": -3.0805275440216064, "global_step": 1762, "epoch": 41} {"train_loss": -3.0714027541024342, "global_step": 1763, "epoch": 41, "val_loss": 419723.09375} {"train_loss": -3.140446186065674, "global_step": 1764, "epoch": 42} {"train_loss": -3.0817108154296875, "global_step": 1765, "epoch": 42} {"train_loss": -3.0511770248413086, "global_step": 1766, "epoch": 42} {"train_loss": -3.132859945297241, "global_step": 1767, "epoch": 42} {"train_loss": -3.189444065093994, "global_step": 1768, "epoch": 42} {"train_loss": -3.084317684173584, "global_step": 1769, "epoch": 42} {"train_loss": -3.0849175453186035, "global_step": 1770, "epoch": 42} {"train_loss": -3.1086511611938477, "global_step": 1771, "epoch": 42} {"train_loss": -3.127004623413086, "global_step": 1772, "epoch": 42} {"train_loss": -2.922748565673828, "global_step": 1773, "epoch": 42} {"train_loss": -3.1503310203552246, "global_step": 1774, "epoch": 42} {"train_loss": -3.208488702774048, "global_step": 1775, "epoch": 42} {"train_loss": -3.065323829650879, "global_step": 1776, "epoch": 42} {"train_loss": -3.0090365409851074, "global_step": 1777, "epoch": 42} {"train_loss": -3.1495237350463867, "global_step": 1778, "epoch": 42} {"train_loss": -3.027219295501709, "global_step": 1779, "epoch": 42} {"train_loss": -3.2944955825805664, "global_step": 1780, "epoch": 42} {"train_loss": -3.0642948150634766, "global_step": 1781, "epoch": 42} {"train_loss": -2.945432662963867, "global_step": 1782, "epoch": 42} {"train_loss": -3.1692721843719482, "global_step": 1783, "epoch": 42} {"train_loss": -3.114325523376465, "global_step": 1784, "epoch": 42} {"train_loss": -3.0974340438842773, "global_step": 1785, "epoch": 42} {"train_loss": -3.1670663356781006, "global_step": 1786, "epoch": 42} {"train_loss": -2.9267539978027344, "global_step": 1787, "epoch": 42} {"train_loss": -3.1039271354675293, "global_step": 1788, "epoch": 42} {"train_loss": -2.9807350635528564, "global_step": 1789, "epoch": 42} {"train_loss": -3.185600757598877, "global_step": 1790, "epoch": 42} {"train_loss": -3.1306750774383545, "global_step": 1791, "epoch": 42} {"train_loss": -3.018369436264038, "global_step": 1792, "epoch": 42} {"train_loss": -3.3188581466674805, "global_step": 1793, "epoch": 42} {"train_loss": -3.110990047454834, "global_step": 1794, "epoch": 42} {"train_loss": -3.0759944915771484, "global_step": 1795, "epoch": 42} {"train_loss": -2.928994655609131, "global_step": 1796, "epoch": 42} {"train_loss": -3.2334768772125244, "global_step": 1797, "epoch": 42} {"train_loss": -2.912930727005005, "global_step": 1798, "epoch": 42} {"train_loss": -2.982086658477783, "global_step": 1799, "epoch": 42} {"train_loss": -3.0963873863220215, "global_step": 1800, "epoch": 42} {"train_loss": -3.0804519653320312, "global_step": 1801, "epoch": 42} {"train_loss": -3.0966124534606934, "global_step": 1802, "epoch": 42} {"train_loss": -3.1597328186035156, "global_step": 1803, "epoch": 42} {"train_loss": -3.176647186279297, "global_step": 1804, "epoch": 42} {"train_loss": -3.0952875216801963, "global_step": 1805, "epoch": 42, "val_loss": 401108.9375} {"train_loss": -3.1778557300567627, "global_step": 1806, "epoch": 43} {"train_loss": -3.063671112060547, "global_step": 1807, "epoch": 43} {"train_loss": -2.934272289276123, "global_step": 1808, "epoch": 43} {"train_loss": -3.2275238037109375, "global_step": 1809, "epoch": 43} {"train_loss": -3.084433078765869, "global_step": 1810, "epoch": 43} {"train_loss": -3.2145605087280273, "global_step": 1811, "epoch": 43} {"train_loss": -3.136624813079834, "global_step": 1812, "epoch": 43} {"train_loss": -3.1812124252319336, "global_step": 1813, "epoch": 43} {"train_loss": -3.3042123317718506, "global_step": 1814, "epoch": 43} {"train_loss": -3.1413450241088867, "global_step": 1815, "epoch": 43} {"train_loss": -3.092647075653076, "global_step": 1816, "epoch": 43} {"train_loss": -3.1001076698303223, "global_step": 1817, "epoch": 43} {"train_loss": -3.180850028991699, "global_step": 1818, "epoch": 43} {"train_loss": -3.20031476020813, "global_step": 1819, "epoch": 43} {"train_loss": -3.175015449523926, "global_step": 1820, "epoch": 43} {"train_loss": -3.136354446411133, "global_step": 1821, "epoch": 43} {"train_loss": -3.1293258666992188, "global_step": 1822, "epoch": 43} {"train_loss": -3.0828745365142822, "global_step": 1823, "epoch": 43} {"train_loss": -3.0083329677581787, "global_step": 1824, "epoch": 43} {"train_loss": -2.9748756885528564, "global_step": 1825, "epoch": 43} {"train_loss": -3.325892925262451, "global_step": 1826, "epoch": 43} {"train_loss": -3.1424179077148438, "global_step": 1827, "epoch": 43} {"train_loss": -3.080792188644409, "global_step": 1828, "epoch": 43} {"train_loss": -3.1615633964538574, "global_step": 1829, "epoch": 43} {"train_loss": -3.0810036659240723, "global_step": 1830, "epoch": 43} {"train_loss": -3.0694339275360107, "global_step": 1831, "epoch": 43} {"train_loss": -3.227173328399658, "global_step": 1832, "epoch": 43} {"train_loss": -3.2447285652160645, "global_step": 1833, "epoch": 43} {"train_loss": -3.2422609329223633, "global_step": 1834, "epoch": 43} {"train_loss": -3.112414598464966, "global_step": 1835, "epoch": 43} {"train_loss": -3.255624294281006, "global_step": 1836, "epoch": 43} {"train_loss": -3.230891704559326, "global_step": 1837, "epoch": 43} {"train_loss": -3.1396219730377197, "global_step": 1838, "epoch": 43} {"train_loss": -3.1077003479003906, "global_step": 1839, "epoch": 43} {"train_loss": -3.1609623432159424, "global_step": 1840, "epoch": 43} {"train_loss": -3.1794655323028564, "global_step": 1841, "epoch": 43} {"train_loss": -3.0934157371520996, "global_step": 1842, "epoch": 43} {"train_loss": -3.0811333656311035, "global_step": 1843, "epoch": 43} {"train_loss": -3.1976983547210693, "global_step": 1844, "epoch": 43} {"train_loss": -3.240377902984619, "global_step": 1845, "epoch": 43} {"train_loss": -3.2139992713928223, "global_step": 1846, "epoch": 43} {"train_loss": -3.152130161012922, "global_step": 1847, "epoch": 43, "val_loss": 381000.5625} {"train_loss": -3.275864839553833, "global_step": 1848, "epoch": 44} {"train_loss": -3.1931405067443848, "global_step": 1849, "epoch": 44} {"train_loss": -3.1615917682647705, "global_step": 1850, "epoch": 44} {"train_loss": -3.1551294326782227, "global_step": 1851, "epoch": 44} {"train_loss": -3.2586100101470947, "global_step": 1852, "epoch": 44} {"train_loss": -3.166933059692383, "global_step": 1853, "epoch": 44} {"train_loss": -3.1599481105804443, "global_step": 1854, "epoch": 44} {"train_loss": -3.0570363998413086, "global_step": 1855, "epoch": 44} {"train_loss": -3.007366180419922, "global_step": 1856, "epoch": 44} {"train_loss": -3.139249324798584, "global_step": 1857, "epoch": 44} {"train_loss": -3.1418251991271973, "global_step": 1858, "epoch": 44} {"train_loss": -3.2103705406188965, "global_step": 1859, "epoch": 44} {"train_loss": -3.2136647701263428, "global_step": 1860, "epoch": 44} {"train_loss": -3.0919666290283203, "global_step": 1861, "epoch": 44} {"train_loss": -3.140538454055786, "global_step": 1862, "epoch": 44} {"train_loss": -3.3040664196014404, "global_step": 1863, "epoch": 44} {"train_loss": -3.077486038208008, "global_step": 1864, "epoch": 44} {"train_loss": -3.1531004905700684, "global_step": 1865, "epoch": 44} {"train_loss": -3.1489360332489014, "global_step": 1866, "epoch": 44} {"train_loss": -3.2145559787750244, "global_step": 1867, "epoch": 44} {"train_loss": -3.1462903022766113, "global_step": 1868, "epoch": 44} {"train_loss": -3.2123217582702637, "global_step": 1869, "epoch": 44} {"train_loss": -3.205482006072998, "global_step": 1870, "epoch": 44} {"train_loss": -3.1934032440185547, "global_step": 1871, "epoch": 44} {"train_loss": -3.2879223823547363, "global_step": 1872, "epoch": 44} {"train_loss": -3.1811838150024414, "global_step": 1873, "epoch": 44} {"train_loss": -3.06705641746521, "global_step": 1874, "epoch": 44} {"train_loss": -3.2803874015808105, "global_step": 1875, "epoch": 44} {"train_loss": -2.883932590484619, "global_step": 1876, "epoch": 44} {"train_loss": -3.199359655380249, "global_step": 1877, "epoch": 44} {"train_loss": -3.3105480670928955, "global_step": 1878, "epoch": 44} {"train_loss": -3.2918689250946045, "global_step": 1879, "epoch": 44} {"train_loss": -3.0766453742980957, "global_step": 1880, "epoch": 44} {"train_loss": -3.2173430919647217, "global_step": 1881, "epoch": 44} {"train_loss": -3.138364315032959, "global_step": 1882, "epoch": 44} {"train_loss": -3.1517484188079834, "global_step": 1883, "epoch": 44} {"train_loss": -3.2537012100219727, "global_step": 1884, "epoch": 44} {"train_loss": -3.0372042655944824, "global_step": 1885, "epoch": 44} {"train_loss": -3.2039713859558105, "global_step": 1886, "epoch": 44} {"train_loss": -3.245103597640991, "global_step": 1887, "epoch": 44} {"train_loss": -3.1344521045684814, "global_step": 1888, "epoch": 44} {"train_loss": -3.1720423982256936, "global_step": 1889, "epoch": 44, "val_loss": 373632.96875} {"train_loss": -3.08146333694458, "global_step": 1890, "epoch": 45} {"train_loss": -3.2689194679260254, "global_step": 1891, "epoch": 45} {"train_loss": -3.1635687351226807, "global_step": 1892, "epoch": 45} {"train_loss": -3.0804102420806885, "global_step": 1893, "epoch": 45} {"train_loss": -3.2819504737854004, "global_step": 1894, "epoch": 45} {"train_loss": -3.129685401916504, "global_step": 1895, "epoch": 45} {"train_loss": -3.2391700744628906, "global_step": 1896, "epoch": 45} {"train_loss": -3.147956609725952, "global_step": 1897, "epoch": 45} {"train_loss": -3.2321248054504395, "global_step": 1898, "epoch": 45} {"train_loss": -3.3260154724121094, "global_step": 1899, "epoch": 45} {"train_loss": -3.109464406967163, "global_step": 1900, "epoch": 45} {"train_loss": -3.2266299724578857, "global_step": 1901, "epoch": 45} {"train_loss": -3.1946845054626465, "global_step": 1902, "epoch": 45} {"train_loss": -3.238051176071167, "global_step": 1903, "epoch": 45} {"train_loss": -3.3270318508148193, "global_step": 1904, "epoch": 45} {"train_loss": -3.1975293159484863, "global_step": 1905, "epoch": 45} {"train_loss": -3.117002248764038, "global_step": 1906, "epoch": 45} {"train_loss": -3.30922794342041, "global_step": 1907, "epoch": 45} {"train_loss": -3.3574233055114746, "global_step": 1908, "epoch": 45} {"train_loss": -3.4321718215942383, "global_step": 1909, "epoch": 45} {"train_loss": -3.1877055168151855, "global_step": 1910, "epoch": 45} {"train_loss": -3.2035791873931885, "global_step": 1911, "epoch": 45} {"train_loss": -3.095465660095215, "global_step": 1912, "epoch": 45} {"train_loss": -3.079096555709839, "global_step": 1913, "epoch": 45} {"train_loss": -3.4757556915283203, "global_step": 1914, "epoch": 45} {"train_loss": -3.3075203895568848, "global_step": 1915, "epoch": 45} {"train_loss": -2.9907662868499756, "global_step": 1916, "epoch": 45} {"train_loss": -3.203864574432373, "global_step": 1917, "epoch": 45} {"train_loss": -3.1732840538024902, "global_step": 1918, "epoch": 45} {"train_loss": -3.1246132850646973, "global_step": 1919, "epoch": 45} {"train_loss": -3.1423113346099854, "global_step": 1920, "epoch": 45} {"train_loss": -3.2398910522460938, "global_step": 1921, "epoch": 45} {"train_loss": -3.246428966522217, "global_step": 1922, "epoch": 45} {"train_loss": -3.1103765964508057, "global_step": 1923, "epoch": 45} {"train_loss": -3.35959529876709, "global_step": 1924, "epoch": 45} {"train_loss": -3.0855860710144043, "global_step": 1925, "epoch": 45} {"train_loss": -3.0988311767578125, "global_step": 1926, "epoch": 45} {"train_loss": -3.208556890487671, "global_step": 1927, "epoch": 45} {"train_loss": -2.8629095554351807, "global_step": 1928, "epoch": 45} {"train_loss": -3.224773406982422, "global_step": 1929, "epoch": 45} {"train_loss": -2.9682259559631348, "global_step": 1930, "epoch": 45} {"train_loss": -3.193449542635963, "global_step": 1931, "epoch": 45, "val_loss": 355172.6875} {"train_loss": -3.3014485836029053, "global_step": 1932, "epoch": 46} {"train_loss": -3.095219612121582, "global_step": 1933, "epoch": 46} {"train_loss": -3.1844358444213867, "global_step": 1934, "epoch": 46} {"train_loss": -3.059329032897949, "global_step": 1935, "epoch": 46} {"train_loss": -3.1369967460632324, "global_step": 1936, "epoch": 46} {"train_loss": -2.9455063343048096, "global_step": 1937, "epoch": 46} {"train_loss": -3.05914044380188, "global_step": 1938, "epoch": 46} {"train_loss": -3.1053524017333984, "global_step": 1939, "epoch": 46} {"train_loss": -3.300981283187866, "global_step": 1940, "epoch": 46} {"train_loss": -2.94368314743042, "global_step": 1941, "epoch": 46} {"train_loss": -3.2955760955810547, "global_step": 1942, "epoch": 46} {"train_loss": -3.1785409450531006, "global_step": 1943, "epoch": 46} {"train_loss": -3.2721102237701416, "global_step": 1944, "epoch": 46} {"train_loss": -3.2294106483459473, "global_step": 1945, "epoch": 46} {"train_loss": -3.2509589195251465, "global_step": 1946, "epoch": 46} {"train_loss": -3.172450542449951, "global_step": 1947, "epoch": 46} {"train_loss": -3.2365245819091797, "global_step": 1948, "epoch": 46} {"train_loss": -3.333446502685547, "global_step": 1949, "epoch": 46} {"train_loss": -3.166245222091675, "global_step": 1950, "epoch": 46} {"train_loss": -3.252251625061035, "global_step": 1951, "epoch": 46} {"train_loss": -3.179826259613037, "global_step": 1952, "epoch": 46} {"train_loss": -3.226652145385742, "global_step": 1953, "epoch": 46} {"train_loss": -3.2698888778686523, "global_step": 1954, "epoch": 46} {"train_loss": -3.29392147064209, "global_step": 1955, "epoch": 46} {"train_loss": -3.2152280807495117, "global_step": 1956, "epoch": 46} {"train_loss": -3.159886121749878, "global_step": 1957, "epoch": 46} {"train_loss": -3.28851318359375, "global_step": 1958, "epoch": 46} {"train_loss": -3.17207670211792, "global_step": 1959, "epoch": 46} {"train_loss": -3.223767042160034, "global_step": 1960, "epoch": 46} {"train_loss": -3.446063995361328, "global_step": 1961, "epoch": 46} {"train_loss": -3.3005313873291016, "global_step": 1962, "epoch": 46} {"train_loss": -3.2567272186279297, "global_step": 1963, "epoch": 46} {"train_loss": -3.2412850856781006, "global_step": 1964, "epoch": 46} {"train_loss": -3.2887561321258545, "global_step": 1965, "epoch": 46} {"train_loss": -3.098247766494751, "global_step": 1966, "epoch": 46} {"train_loss": -3.3409924507141113, "global_step": 1967, "epoch": 46} {"train_loss": -3.1396408081054688, "global_step": 1968, "epoch": 46} {"train_loss": -3.267867088317871, "global_step": 1969, "epoch": 46} {"train_loss": -3.3749947547912598, "global_step": 1970, "epoch": 46} {"train_loss": -3.2252206802368164, "global_step": 1971, "epoch": 46} {"train_loss": -3.288304090499878, "global_step": 1972, "epoch": 46} {"train_loss": -3.2146951527822587, "global_step": 1973, "epoch": 46, "val_loss": 346108.25} {"train_loss": -3.085562229156494, "global_step": 1974, "epoch": 47} {"train_loss": -3.3176443576812744, "global_step": 1975, "epoch": 47} {"train_loss": -3.0405454635620117, "global_step": 1976, "epoch": 47} {"train_loss": -3.2475099563598633, "global_step": 1977, "epoch": 47} {"train_loss": -3.0081372261047363, "global_step": 1978, "epoch": 47} {"train_loss": -3.3096814155578613, "global_step": 1979, "epoch": 47} {"train_loss": -3.072937488555908, "global_step": 1980, "epoch": 47} {"train_loss": -3.1812655925750732, "global_step": 1981, "epoch": 47} {"train_loss": -3.3368327617645264, "global_step": 1982, "epoch": 47} {"train_loss": -2.910367965698242, "global_step": 1983, "epoch": 47} {"train_loss": -3.054877519607544, "global_step": 1984, "epoch": 47} {"train_loss": -3.060605764389038, "global_step": 1985, "epoch": 47} {"train_loss": -3.1703507900238037, "global_step": 1986, "epoch": 47} {"train_loss": -3.0985498428344727, "global_step": 1987, "epoch": 47} {"train_loss": -3.244047164916992, "global_step": 1988, "epoch": 47} {"train_loss": -3.109130382537842, "global_step": 1989, "epoch": 47} {"train_loss": -3.299919605255127, "global_step": 1990, "epoch": 47} {"train_loss": -3.154712200164795, "global_step": 1991, "epoch": 47} {"train_loss": -3.191157102584839, "global_step": 1992, "epoch": 47} {"train_loss": -3.262197732925415, "global_step": 1993, "epoch": 47} {"train_loss": -3.211970806121826, "global_step": 1994, "epoch": 47} {"train_loss": -3.3973352909088135, "global_step": 1995, "epoch": 47} {"train_loss": -3.178201675415039, "global_step": 1996, "epoch": 47} {"train_loss": -3.1957879066467285, "global_step": 1997, "epoch": 47} {"train_loss": -3.420945405960083, "global_step": 1998, "epoch": 47} {"train_loss": -3.3744068145751953, "global_step": 1999, "epoch": 47} {"train_loss": -3.2326464653015137, "global_step": 2000, "epoch": 47} {"train_loss": -3.295346260070801, "global_step": 2001, "epoch": 47} {"train_loss": -3.2068660259246826, "global_step": 2002, "epoch": 47} {"train_loss": -3.256328582763672, "global_step": 2003, "epoch": 47} {"train_loss": -3.4017210006713867, "global_step": 2004, "epoch": 47} {"train_loss": -3.276355266571045, "global_step": 2005, "epoch": 47} {"train_loss": -3.3280110359191895, "global_step": 2006, "epoch": 47} {"train_loss": -3.3513684272766113, "global_step": 2007, "epoch": 47} {"train_loss": -3.3848137855529785, "global_step": 2008, "epoch": 47} {"train_loss": -3.340435266494751, "global_step": 2009, "epoch": 47} {"train_loss": -3.289635419845581, "global_step": 2010, "epoch": 47} {"train_loss": -3.3111157417297363, "global_step": 2011, "epoch": 47} {"train_loss": -3.317448139190674, "global_step": 2012, "epoch": 47} {"train_loss": -3.162691116333008, "global_step": 2013, "epoch": 47} {"train_loss": -3.172930955886841, "global_step": 2014, "epoch": 47} {"train_loss": -3.227134335608709, "global_step": 2015, "epoch": 47, "val_loss": 332403.96875} {"train_loss": -3.0686593055725098, "global_step": 2016, "epoch": 48} {"train_loss": -3.3519980907440186, "global_step": 2017, "epoch": 48} {"train_loss": -2.925231456756592, "global_step": 2018, "epoch": 48} {"train_loss": -3.2674267292022705, "global_step": 2019, "epoch": 48} {"train_loss": -3.074972152709961, "global_step": 2020, "epoch": 48} {"train_loss": -3.187011480331421, "global_step": 2021, "epoch": 48} {"train_loss": -3.3570632934570312, "global_step": 2022, "epoch": 48} {"train_loss": -3.070873737335205, "global_step": 2023, "epoch": 48} {"train_loss": -3.2173683643341064, "global_step": 2024, "epoch": 48} {"train_loss": -3.0206308364868164, "global_step": 2025, "epoch": 48} {"train_loss": -3.1274092197418213, "global_step": 2026, "epoch": 48} {"train_loss": -3.1583330631256104, "global_step": 2027, "epoch": 48} {"train_loss": -3.182368516921997, "global_step": 2028, "epoch": 48} {"train_loss": -3.260490894317627, "global_step": 2029, "epoch": 48} {"train_loss": -3.262127161026001, "global_step": 2030, "epoch": 48} {"train_loss": -3.2903146743774414, "global_step": 2031, "epoch": 48} {"train_loss": -3.0715818405151367, "global_step": 2032, "epoch": 48} {"train_loss": -3.3901429176330566, "global_step": 2033, "epoch": 48} {"train_loss": -3.0856003761291504, "global_step": 2034, "epoch": 48} {"train_loss": -3.213906764984131, "global_step": 2035, "epoch": 48} {"train_loss": -3.2354013919830322, "global_step": 2036, "epoch": 48} {"train_loss": -3.0270018577575684, "global_step": 2037, "epoch": 48} {"train_loss": -3.284518241882324, "global_step": 2038, "epoch": 48} {"train_loss": -3.149430274963379, "global_step": 2039, "epoch": 48} {"train_loss": -3.186891555786133, "global_step": 2040, "epoch": 48} {"train_loss": -3.157987594604492, "global_step": 2041, "epoch": 48} {"train_loss": -3.1962292194366455, "global_step": 2042, "epoch": 48} {"train_loss": -3.347386598587036, "global_step": 2043, "epoch": 48} {"train_loss": -3.1693227291107178, "global_step": 2044, "epoch": 48} {"train_loss": -3.1966352462768555, "global_step": 2045, "epoch": 48} {"train_loss": -3.3720479011535645, "global_step": 2046, "epoch": 48} {"train_loss": -3.2724714279174805, "global_step": 2047, "epoch": 48} {"train_loss": -3.2491447925567627, "global_step": 2048, "epoch": 48} {"train_loss": -3.178347110748291, "global_step": 2049, "epoch": 48} {"train_loss": -3.412100315093994, "global_step": 2050, "epoch": 48} {"train_loss": -3.3915398120880127, "global_step": 2051, "epoch": 48} {"train_loss": -3.2476367950439453, "global_step": 2052, "epoch": 48} {"train_loss": -3.376915216445923, "global_step": 2053, "epoch": 48} {"train_loss": -3.431659698486328, "global_step": 2054, "epoch": 48} {"train_loss": -3.329979181289673, "global_step": 2055, "epoch": 48} {"train_loss": -3.1617939472198486, "global_step": 2056, "epoch": 48} {"train_loss": -3.2236562002272833, "global_step": 2057, "epoch": 48, "val_loss": 309156.0} {"train_loss": -3.1250157356262207, "global_step": 2058, "epoch": 49} {"train_loss": -3.316361427307129, "global_step": 2059, "epoch": 49} {"train_loss": -3.459562301635742, "global_step": 2060, "epoch": 49} {"train_loss": -3.371793746948242, "global_step": 2061, "epoch": 49} {"train_loss": -3.2294440269470215, "global_step": 2062, "epoch": 49} {"train_loss": -3.4599149227142334, "global_step": 2063, "epoch": 49} {"train_loss": -3.059357166290283, "global_step": 2064, "epoch": 49} {"train_loss": -3.306253433227539, "global_step": 2065, "epoch": 49} {"train_loss": -3.2759408950805664, "global_step": 2066, "epoch": 49} {"train_loss": -3.2977447509765625, "global_step": 2067, "epoch": 49} {"train_loss": -3.319033622741699, "global_step": 2068, "epoch": 49} {"train_loss": -3.242269992828369, "global_step": 2069, "epoch": 49} {"train_loss": -3.3547565937042236, "global_step": 2070, "epoch": 49} {"train_loss": -3.211615800857544, "global_step": 2071, "epoch": 49} {"train_loss": -3.348017692565918, "global_step": 2072, "epoch": 49} {"train_loss": -3.380642890930176, "global_step": 2073, "epoch": 49} {"train_loss": -3.3580007553100586, "global_step": 2074, "epoch": 49} {"train_loss": -3.2448110580444336, "global_step": 2075, "epoch": 49} {"train_loss": -3.377537727355957, "global_step": 2076, "epoch": 49} {"train_loss": -3.446295738220215, "global_step": 2077, "epoch": 49} {"train_loss": -3.3917481899261475, "global_step": 2078, "epoch": 49} {"train_loss": -3.3589091300964355, "global_step": 2079, "epoch": 49} {"train_loss": -3.4525885581970215, "global_step": 2080, "epoch": 49} {"train_loss": -3.406172275543213, "global_step": 2081, "epoch": 49} {"train_loss": -3.297786235809326, "global_step": 2082, "epoch": 49} {"train_loss": -3.4164724349975586, "global_step": 2083, "epoch": 49} {"train_loss": -3.448136568069458, "global_step": 2084, "epoch": 49} {"train_loss": -3.4768238067626953, "global_step": 2085, "epoch": 49} {"train_loss": -3.3438796997070312, "global_step": 2086, "epoch": 49} {"train_loss": -3.403442859649658, "global_step": 2087, "epoch": 49} {"train_loss": -3.461155891418457, "global_step": 2088, "epoch": 49} {"train_loss": -3.333798408508301, "global_step": 2089, "epoch": 49} {"train_loss": -3.416797637939453, "global_step": 2090, "epoch": 49} {"train_loss": -3.268105983734131, "global_step": 2091, "epoch": 49} {"train_loss": -3.28849196434021, "global_step": 2092, "epoch": 49} {"train_loss": -3.294076919555664, "global_step": 2093, "epoch": 49} {"train_loss": -3.3487844467163086, "global_step": 2094, "epoch": 49} {"train_loss": -3.438164710998535, "global_step": 2095, "epoch": 49} {"train_loss": -3.2274961471557617, "global_step": 2096, "epoch": 49} {"train_loss": -3.297842264175415, "global_step": 2097, "epoch": 49} {"train_loss": -3.427917003631592, "global_step": 2098, "epoch": 49} {"train_loss": -3.3452067318416776, "global_step": 2099, "epoch": 49, "val_loss": 289084.25} {"train_loss": -3.440931797027588, "global_step": 2100, "epoch": 50} {"train_loss": -3.3724164962768555, "global_step": 2101, "epoch": 50} {"train_loss": -3.370025634765625, "global_step": 2102, "epoch": 50} {"train_loss": -3.3907151222229004, "global_step": 2103, "epoch": 50} {"train_loss": -3.3375489711761475, "global_step": 2104, "epoch": 50} {"train_loss": -3.450784683227539, "global_step": 2105, "epoch": 50} {"train_loss": -3.3961238861083984, "global_step": 2106, "epoch": 50} {"train_loss": -3.513162612915039, "global_step": 2107, "epoch": 50} {"train_loss": -3.2384254932403564, "global_step": 2108, "epoch": 50} {"train_loss": -3.2603745460510254, "global_step": 2109, "epoch": 50} {"train_loss": -3.4237723350524902, "global_step": 2110, "epoch": 50} {"train_loss": -3.3510031700134277, "global_step": 2111, "epoch": 50} {"train_loss": -3.416996479034424, "global_step": 2112, "epoch": 50} {"train_loss": -3.3824901580810547, "global_step": 2113, "epoch": 50} {"train_loss": -3.4559130668640137, "global_step": 2114, "epoch": 50} {"train_loss": -3.576908588409424, "global_step": 2115, "epoch": 50} {"train_loss": -3.5354809761047363, "global_step": 2116, "epoch": 50} {"train_loss": -3.468810558319092, "global_step": 2117, "epoch": 50} {"train_loss": -3.3484063148498535, "global_step": 2118, "epoch": 50} {"train_loss": -3.5032155513763428, "global_step": 2119, "epoch": 50} {"train_loss": -3.2957372665405273, "global_step": 2120, "epoch": 50} {"train_loss": -3.293549060821533, "global_step": 2121, "epoch": 50} {"train_loss": -3.3462164402008057, "global_step": 2122, "epoch": 50} {"train_loss": -3.1512157917022705, "global_step": 2123, "epoch": 50} {"train_loss": -3.4151225090026855, "global_step": 2124, "epoch": 50} {"train_loss": -3.3562092781066895, "global_step": 2125, "epoch": 50} {"train_loss": -3.010502815246582, "global_step": 2126, "epoch": 50} {"train_loss": -3.088287115097046, "global_step": 2127, "epoch": 50} {"train_loss": -3.355727434158325, "global_step": 2128, "epoch": 50} {"train_loss": -2.8482186794281006, "global_step": 2129, "epoch": 50} {"train_loss": -2.9453341960906982, "global_step": 2130, "epoch": 50} {"train_loss": -2.47866153717041, "global_step": 2131, "epoch": 50} {"train_loss": -2.8711564540863037, "global_step": 2132, "epoch": 50} {"train_loss": -2.5598151683807373, "global_step": 2133, "epoch": 50} {"train_loss": -2.847799777984619, "global_step": 2134, "epoch": 50} {"train_loss": -2.8073859214782715, "global_step": 2135, "epoch": 50} {"train_loss": -2.7942633628845215, "global_step": 2136, "epoch": 50} {"train_loss": -2.87540864944458, "global_step": 2137, "epoch": 50} {"train_loss": -2.963845729827881, "global_step": 2138, "epoch": 50} {"train_loss": -3.0231781005859375, "global_step": 2139, "epoch": 50} {"train_loss": -3.0701262950897217, "global_step": 2140, "epoch": 50} {"train_loss": -3.2043154466719854, "global_step": 2141, "epoch": 50, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.14325166398039643, "train/sim_max_reward_2": 0.1914733050982292, "train/sim_max_reward_3": 0.14397967142913157, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.22628304730620832, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.0, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.28120237555563865, "test/sim_max_reward_4300004": 0.4477675062535832, "test/sim_max_reward_4300005": 0.4036381391339061, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.045127646075307386, "test/sim_max_reward_4300008": 0.40804262309720407, "test/sim_max_reward_4300009": 0.032425669850822174, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.3231105229852605, "test/sim_max_reward_4300012": 0.25872152142121096, "test/sim_max_reward_4300013": 0.33189700255264337, "test/sim_max_reward_4300014": 0.8411203619233111, "test/sim_max_reward_4300015": 0.22434380981056135, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.13058715121156275, "test/sim_max_reward_4300018": 0.0, "test/sim_max_reward_4300019": 0.18254307829060798, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.3201164962678058, "test/sim_max_reward_4300022": 0.019566254610673364, "test/sim_max_reward_4300023": 0.2057529789273333, "test/sim_max_reward_4300024": 0.0, "test/sim_max_reward_4300025": 0.4820260129846914, "test/sim_max_reward_4300026": 0.050878423390650566, "test/sim_max_reward_4300027": 0.0, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.12451198223229273, "test/sim_max_reward_4300031": 0.0, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.2603000335592396, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.6900478767566082, "test/sim_max_reward_4300038": 0.02050720219077905, "test/sim_max_reward_4300039": 0.0, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.3472692786068953, "test/sim_max_reward_4300043": 0.01912165197990456, "test/sim_max_reward_4300044": 0.5165530837993422, "test/sim_max_reward_4300045": 0.16097352018622602, "test/sim_max_reward_4300046": 0.2390766344897214, "test/sim_max_reward_4300047": 0.506290204025247, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.15079808199845782, "test/mean_score": 0.16862663676746797, "val_loss": 291822.5} {"train_loss": -3.1864371299743652, "global_step": 2142, "epoch": 51} {"train_loss": -3.127845048904419, "global_step": 2143, "epoch": 51} {"train_loss": -3.1741080284118652, "global_step": 2144, "epoch": 51} {"train_loss": -3.1839027404785156, "global_step": 2145, "epoch": 51} {"train_loss": -3.161630868911743, "global_step": 2146, "epoch": 51} {"train_loss": -3.0049126148223877, "global_step": 2147, "epoch": 51} {"train_loss": -3.0863137245178223, "global_step": 2148, "epoch": 51} {"train_loss": -3.126389503479004, "global_step": 2149, "epoch": 51} {"train_loss": -3.1573214530944824, "global_step": 2150, "epoch": 51} {"train_loss": -3.1006526947021484, "global_step": 2151, "epoch": 51} {"train_loss": -3.1987662315368652, "global_step": 2152, "epoch": 51} {"train_loss": -3.0723769664764404, "global_step": 2153, "epoch": 51} {"train_loss": -3.2757606506347656, "global_step": 2154, "epoch": 51} {"train_loss": -3.273916482925415, "global_step": 2155, "epoch": 51} {"train_loss": -3.228074073791504, "global_step": 2156, "epoch": 51} {"train_loss": -3.1972262859344482, "global_step": 2157, "epoch": 51} {"train_loss": -3.314302682876587, "global_step": 2158, "epoch": 51} {"train_loss": -3.3019204139709473, "global_step": 2159, "epoch": 51} {"train_loss": -3.3076696395874023, "global_step": 2160, "epoch": 51} {"train_loss": -3.3701846599578857, "global_step": 2161, "epoch": 51} {"train_loss": -3.3442764282226562, "global_step": 2162, "epoch": 51} {"train_loss": -3.2633578777313232, "global_step": 2163, "epoch": 51} {"train_loss": -3.4022765159606934, "global_step": 2164, "epoch": 51} {"train_loss": -3.3743491172790527, "global_step": 2165, "epoch": 51} {"train_loss": -3.3571085929870605, "global_step": 2166, "epoch": 51} {"train_loss": -3.5042080879211426, "global_step": 2167, "epoch": 51} {"train_loss": -3.4218192100524902, "global_step": 2168, "epoch": 51} {"train_loss": -3.4242944717407227, "global_step": 2169, "epoch": 51} {"train_loss": -3.405120849609375, "global_step": 2170, "epoch": 51} {"train_loss": -3.4018125534057617, "global_step": 2171, "epoch": 51} {"train_loss": -3.293182373046875, "global_step": 2172, "epoch": 51} {"train_loss": -3.508512496948242, "global_step": 2173, "epoch": 51} {"train_loss": -3.5173285007476807, "global_step": 2174, "epoch": 51} {"train_loss": -3.457331418991089, "global_step": 2175, "epoch": 51} {"train_loss": -3.4203145503997803, "global_step": 2176, "epoch": 51} {"train_loss": -3.258105754852295, "global_step": 2177, "epoch": 51} {"train_loss": -3.4311344623565674, "global_step": 2178, "epoch": 51} {"train_loss": -3.487652063369751, "global_step": 2179, "epoch": 51} {"train_loss": -3.3191351890563965, "global_step": 2180, "epoch": 51} {"train_loss": -3.5784571170806885, "global_step": 2181, "epoch": 51} {"train_loss": -3.349874973297119, "global_step": 2182, "epoch": 51} {"train_loss": -3.301377364567348, "global_step": 2183, "epoch": 51, "val_loss": 266260.875} {"train_loss": -3.4460349082946777, "global_step": 2184, "epoch": 52} {"train_loss": -3.5171098709106445, "global_step": 2185, "epoch": 52} {"train_loss": -3.3868680000305176, "global_step": 2186, "epoch": 52} {"train_loss": -3.49307918548584, "global_step": 2187, "epoch": 52} {"train_loss": -3.424093246459961, "global_step": 2188, "epoch": 52} {"train_loss": -3.366884231567383, "global_step": 2189, "epoch": 52} {"train_loss": -3.4498581886291504, "global_step": 2190, "epoch": 52} {"train_loss": -3.5021135807037354, "global_step": 2191, "epoch": 52} {"train_loss": -3.441582202911377, "global_step": 2192, "epoch": 52} {"train_loss": -3.194455623626709, "global_step": 2193, "epoch": 52} {"train_loss": -3.436091899871826, "global_step": 2194, "epoch": 52} {"train_loss": -3.1575398445129395, "global_step": 2195, "epoch": 52} {"train_loss": -3.4068639278411865, "global_step": 2196, "epoch": 52} {"train_loss": -3.184183359146118, "global_step": 2197, "epoch": 52} {"train_loss": -3.3497791290283203, "global_step": 2198, "epoch": 52} {"train_loss": -3.520993232727051, "global_step": 2199, "epoch": 52} {"train_loss": -3.109760046005249, "global_step": 2200, "epoch": 52} {"train_loss": -3.3478193283081055, "global_step": 2201, "epoch": 52} {"train_loss": -3.136021137237549, "global_step": 2202, "epoch": 52} {"train_loss": -3.3235158920288086, "global_step": 2203, "epoch": 52} {"train_loss": -3.2120370864868164, "global_step": 2204, "epoch": 52} {"train_loss": -3.3780696392059326, "global_step": 2205, "epoch": 52} {"train_loss": -3.1962509155273438, "global_step": 2206, "epoch": 52} {"train_loss": -3.462392568588257, "global_step": 2207, "epoch": 52} {"train_loss": -3.0238587856292725, "global_step": 2208, "epoch": 52} {"train_loss": -3.4002301692962646, "global_step": 2209, "epoch": 52} {"train_loss": -2.8831892013549805, "global_step": 2210, "epoch": 52} {"train_loss": -3.5635385513305664, "global_step": 2211, "epoch": 52} {"train_loss": -3.153872489929199, "global_step": 2212, "epoch": 52} {"train_loss": -3.3961904048919678, "global_step": 2213, "epoch": 52} {"train_loss": -3.2854762077331543, "global_step": 2214, "epoch": 52} {"train_loss": -3.329267978668213, "global_step": 2215, "epoch": 52} {"train_loss": -3.3586015701293945, "global_step": 2216, "epoch": 52} {"train_loss": -3.28763484954834, "global_step": 2217, "epoch": 52} {"train_loss": -3.3517913818359375, "global_step": 2218, "epoch": 52} {"train_loss": -3.2836923599243164, "global_step": 2219, "epoch": 52} {"train_loss": -3.393690347671509, "global_step": 2220, "epoch": 52} {"train_loss": -3.2604479789733887, "global_step": 2221, "epoch": 52} {"train_loss": -3.497063159942627, "global_step": 2222, "epoch": 52} {"train_loss": -3.454390525817871, "global_step": 2223, "epoch": 52} {"train_loss": -3.256194591522217, "global_step": 2224, "epoch": 52} {"train_loss": -3.3316701366787864, "global_step": 2225, "epoch": 52, "val_loss": 256007.03125} {"train_loss": -3.5612831115722656, "global_step": 2226, "epoch": 53} {"train_loss": -3.460573196411133, "global_step": 2227, "epoch": 53} {"train_loss": -3.6137351989746094, "global_step": 2228, "epoch": 53} {"train_loss": -3.45044207572937, "global_step": 2229, "epoch": 53} {"train_loss": -3.5280609130859375, "global_step": 2230, "epoch": 53} {"train_loss": -3.3407323360443115, "global_step": 2231, "epoch": 53} {"train_loss": -3.538203477859497, "global_step": 2232, "epoch": 53} {"train_loss": -3.309041976928711, "global_step": 2233, "epoch": 53} {"train_loss": -3.5069596767425537, "global_step": 2234, "epoch": 53} {"train_loss": -3.544401168823242, "global_step": 2235, "epoch": 53} {"train_loss": -3.3456876277923584, "global_step": 2236, "epoch": 53} {"train_loss": -3.4555578231811523, "global_step": 2237, "epoch": 53} {"train_loss": -3.4462878704071045, "global_step": 2238, "epoch": 53} {"train_loss": -3.5733795166015625, "global_step": 2239, "epoch": 53} {"train_loss": -3.4218478202819824, "global_step": 2240, "epoch": 53} {"train_loss": -3.4163665771484375, "global_step": 2241, "epoch": 53} {"train_loss": -3.5805466175079346, "global_step": 2242, "epoch": 53} {"train_loss": -3.320737600326538, "global_step": 2243, "epoch": 53} {"train_loss": -3.4297688007354736, "global_step": 2244, "epoch": 53} {"train_loss": -3.4579477310180664, "global_step": 2245, "epoch": 53} {"train_loss": -3.4474122524261475, "global_step": 2246, "epoch": 53} {"train_loss": -3.5908098220825195, "global_step": 2247, "epoch": 53} {"train_loss": -3.431203842163086, "global_step": 2248, "epoch": 53} {"train_loss": -3.319575786590576, "global_step": 2249, "epoch": 53} {"train_loss": -3.4608325958251953, "global_step": 2250, "epoch": 53} {"train_loss": -3.61771821975708, "global_step": 2251, "epoch": 53} {"train_loss": -3.4578094482421875, "global_step": 2252, "epoch": 53} {"train_loss": -3.496018171310425, "global_step": 2253, "epoch": 53} {"train_loss": -3.33450984954834, "global_step": 2254, "epoch": 53} {"train_loss": -3.4833984375, "global_step": 2255, "epoch": 53} {"train_loss": -3.4709324836730957, "global_step": 2256, "epoch": 53} {"train_loss": -3.5741639137268066, "global_step": 2257, "epoch": 53} {"train_loss": -3.535165786743164, "global_step": 2258, "epoch": 53} {"train_loss": -3.5813920497894287, "global_step": 2259, "epoch": 53} {"train_loss": -3.489820718765259, "global_step": 2260, "epoch": 53} {"train_loss": -3.3415932655334473, "global_step": 2261, "epoch": 53} {"train_loss": -3.609748363494873, "global_step": 2262, "epoch": 53} {"train_loss": -3.5377092361450195, "global_step": 2263, "epoch": 53} {"train_loss": -3.312396764755249, "global_step": 2264, "epoch": 53} {"train_loss": -3.552525520324707, "global_step": 2265, "epoch": 53} {"train_loss": -3.4957220554351807, "global_step": 2266, "epoch": 53} {"train_loss": -3.472453895069304, "global_step": 2267, "epoch": 53, "val_loss": 241668.125} {"train_loss": -3.4509775638580322, "global_step": 2268, "epoch": 54} {"train_loss": -3.4899604320526123, "global_step": 2269, "epoch": 54} {"train_loss": -3.46549654006958, "global_step": 2270, "epoch": 54} {"train_loss": -3.5825977325439453, "global_step": 2271, "epoch": 54} {"train_loss": -3.4969968795776367, "global_step": 2272, "epoch": 54} {"train_loss": -3.4530744552612305, "global_step": 2273, "epoch": 54} {"train_loss": -3.4834699630737305, "global_step": 2274, "epoch": 54} {"train_loss": -3.4702200889587402, "global_step": 2275, "epoch": 54} {"train_loss": -3.476731300354004, "global_step": 2276, "epoch": 54} {"train_loss": -3.5710597038269043, "global_step": 2277, "epoch": 54} {"train_loss": -3.275386333465576, "global_step": 2278, "epoch": 54} {"train_loss": -3.3516604900360107, "global_step": 2279, "epoch": 54} {"train_loss": -3.380258560180664, "global_step": 2280, "epoch": 54} {"train_loss": -3.514490842819214, "global_step": 2281, "epoch": 54} {"train_loss": -3.29290771484375, "global_step": 2282, "epoch": 54} {"train_loss": -3.5622410774230957, "global_step": 2283, "epoch": 54} {"train_loss": -3.543778657913208, "global_step": 2284, "epoch": 54} {"train_loss": -3.476818561553955, "global_step": 2285, "epoch": 54} {"train_loss": -3.564857244491577, "global_step": 2286, "epoch": 54} {"train_loss": -3.5375993251800537, "global_step": 2287, "epoch": 54} {"train_loss": -3.5217292308807373, "global_step": 2288, "epoch": 54} {"train_loss": -3.506371021270752, "global_step": 2289, "epoch": 54} {"train_loss": -3.662297248840332, "global_step": 2290, "epoch": 54} {"train_loss": -3.4647552967071533, "global_step": 2291, "epoch": 54} {"train_loss": -3.6317715644836426, "global_step": 2292, "epoch": 54} {"train_loss": -3.4071059226989746, "global_step": 2293, "epoch": 54} {"train_loss": -3.545048713684082, "global_step": 2294, "epoch": 54} {"train_loss": -3.5702953338623047, "global_step": 2295, "epoch": 54} {"train_loss": -3.6237103939056396, "global_step": 2296, "epoch": 54} {"train_loss": -3.5365066528320312, "global_step": 2297, "epoch": 54} {"train_loss": -3.4851763248443604, "global_step": 2298, "epoch": 54} {"train_loss": -3.65236496925354, "global_step": 2299, "epoch": 54} {"train_loss": -3.4829061031341553, "global_step": 2300, "epoch": 54} {"train_loss": -3.6789231300354004, "global_step": 2301, "epoch": 54} {"train_loss": -3.464930534362793, "global_step": 2302, "epoch": 54} {"train_loss": -3.5339412689208984, "global_step": 2303, "epoch": 54} {"train_loss": -3.556830406188965, "global_step": 2304, "epoch": 54} {"train_loss": -3.5900356769561768, "global_step": 2305, "epoch": 54} {"train_loss": -3.5054216384887695, "global_step": 2306, "epoch": 54} {"train_loss": -3.6003260612487793, "global_step": 2307, "epoch": 54} {"train_loss": -3.4472107887268066, "global_step": 2308, "epoch": 54} {"train_loss": -3.5154696759723483, "global_step": 2309, "epoch": 54, "val_loss": 232458.78125} {"train_loss": -3.577014684677124, "global_step": 2310, "epoch": 55} {"train_loss": -3.517293930053711, "global_step": 2311, "epoch": 55} {"train_loss": -3.3647537231445312, "global_step": 2312, "epoch": 55} {"train_loss": -3.563119888305664, "global_step": 2313, "epoch": 55} {"train_loss": -3.515150547027588, "global_step": 2314, "epoch": 55} {"train_loss": -3.535637378692627, "global_step": 2315, "epoch": 55} {"train_loss": -3.537571907043457, "global_step": 2316, "epoch": 55} {"train_loss": -3.3352341651916504, "global_step": 2317, "epoch": 55} {"train_loss": -3.6177666187286377, "global_step": 2318, "epoch": 55} {"train_loss": -3.761626958847046, "global_step": 2319, "epoch": 55} {"train_loss": -3.3824896812438965, "global_step": 2320, "epoch": 55} {"train_loss": -3.487933874130249, "global_step": 2321, "epoch": 55} {"train_loss": -3.546797275543213, "global_step": 2322, "epoch": 55} {"train_loss": -3.353072166442871, "global_step": 2323, "epoch": 55} {"train_loss": -3.4457600116729736, "global_step": 2324, "epoch": 55} {"train_loss": -3.727132797241211, "global_step": 2325, "epoch": 55} {"train_loss": -3.6241981983184814, "global_step": 2326, "epoch": 55} {"train_loss": -3.420518398284912, "global_step": 2327, "epoch": 55} {"train_loss": -3.5698111057281494, "global_step": 2328, "epoch": 55} {"train_loss": -3.662213087081909, "global_step": 2329, "epoch": 55} {"train_loss": -3.447338104248047, "global_step": 2330, "epoch": 55} {"train_loss": -3.518630027770996, "global_step": 2331, "epoch": 55} {"train_loss": -3.6237735748291016, "global_step": 2332, "epoch": 55} {"train_loss": -3.5298712253570557, "global_step": 2333, "epoch": 55} {"train_loss": -3.385206699371338, "global_step": 2334, "epoch": 55} {"train_loss": -3.5859155654907227, "global_step": 2335, "epoch": 55} {"train_loss": -3.6228156089782715, "global_step": 2336, "epoch": 55} {"train_loss": -3.6698927879333496, "global_step": 2337, "epoch": 55} {"train_loss": -3.7235381603240967, "global_step": 2338, "epoch": 55} {"train_loss": -3.4445743560791016, "global_step": 2339, "epoch": 55} {"train_loss": -3.492008686065674, "global_step": 2340, "epoch": 55} {"train_loss": -3.5121893882751465, "global_step": 2341, "epoch": 55} {"train_loss": -3.527149200439453, "global_step": 2342, "epoch": 55} {"train_loss": -3.557819366455078, "global_step": 2343, "epoch": 55} {"train_loss": -3.632930278778076, "global_step": 2344, "epoch": 55} {"train_loss": -3.4597511291503906, "global_step": 2345, "epoch": 55} {"train_loss": -3.502213478088379, "global_step": 2346, "epoch": 55} {"train_loss": -3.784722328186035, "global_step": 2347, "epoch": 55} {"train_loss": -3.4685497283935547, "global_step": 2348, "epoch": 55} {"train_loss": -3.4759435653686523, "global_step": 2349, "epoch": 55} {"train_loss": -3.5920796394348145, "global_step": 2350, "epoch": 55} {"train_loss": -3.539961440222604, "global_step": 2351, "epoch": 55, "val_loss": 225779.171875} {"train_loss": -3.4197981357574463, "global_step": 2352, "epoch": 56} {"train_loss": -3.4655141830444336, "global_step": 2353, "epoch": 56} {"train_loss": -3.5201728343963623, "global_step": 2354, "epoch": 56} {"train_loss": -3.511244535446167, "global_step": 2355, "epoch": 56} {"train_loss": -3.648383617401123, "global_step": 2356, "epoch": 56} {"train_loss": -3.5202229022979736, "global_step": 2357, "epoch": 56} {"train_loss": -3.6320292949676514, "global_step": 2358, "epoch": 56} {"train_loss": -3.6183671951293945, "global_step": 2359, "epoch": 56} {"train_loss": -3.428563117980957, "global_step": 2360, "epoch": 56} {"train_loss": -3.601747989654541, "global_step": 2361, "epoch": 56} {"train_loss": -3.301470994949341, "global_step": 2362, "epoch": 56} {"train_loss": -3.486938238143921, "global_step": 2363, "epoch": 56} {"train_loss": -3.0362725257873535, "global_step": 2364, "epoch": 56} {"train_loss": -3.232027053833008, "global_step": 2365, "epoch": 56} {"train_loss": -3.0771350860595703, "global_step": 2366, "epoch": 56} {"train_loss": -3.307253122329712, "global_step": 2367, "epoch": 56} {"train_loss": -3.3375403881073, "global_step": 2368, "epoch": 56} {"train_loss": -3.0535268783569336, "global_step": 2369, "epoch": 56} {"train_loss": -3.36606502532959, "global_step": 2370, "epoch": 56} {"train_loss": -3.2715747356414795, "global_step": 2371, "epoch": 56} {"train_loss": -3.518922805786133, "global_step": 2372, "epoch": 56} {"train_loss": -3.355334758758545, "global_step": 2373, "epoch": 56} {"train_loss": -3.5038576126098633, "global_step": 2374, "epoch": 56} {"train_loss": -3.2625222206115723, "global_step": 2375, "epoch": 56} {"train_loss": -3.412966728210449, "global_step": 2376, "epoch": 56} {"train_loss": -3.3438711166381836, "global_step": 2377, "epoch": 56} {"train_loss": -3.413512706756592, "global_step": 2378, "epoch": 56} {"train_loss": -3.5038580894470215, "global_step": 2379, "epoch": 56} {"train_loss": -3.409027576446533, "global_step": 2380, "epoch": 56} {"train_loss": -3.484968900680542, "global_step": 2381, "epoch": 56} {"train_loss": -3.4580583572387695, "global_step": 2382, "epoch": 56} {"train_loss": -3.434572219848633, "global_step": 2383, "epoch": 56} {"train_loss": -3.5644001960754395, "global_step": 2384, "epoch": 56} {"train_loss": -3.5251951217651367, "global_step": 2385, "epoch": 56} {"train_loss": -3.481264114379883, "global_step": 2386, "epoch": 56} {"train_loss": -3.5512218475341797, "global_step": 2387, "epoch": 56} {"train_loss": -3.7443792819976807, "global_step": 2388, "epoch": 56} {"train_loss": -3.561842441558838, "global_step": 2389, "epoch": 56} {"train_loss": -3.6264445781707764, "global_step": 2390, "epoch": 56} {"train_loss": -3.493896007537842, "global_step": 2391, "epoch": 56} {"train_loss": -3.606088876724243, "global_step": 2392, "epoch": 56} {"train_loss": -3.4471200647808256, "global_step": 2393, "epoch": 56, "val_loss": 214778.84375} {"train_loss": -3.568525552749634, "global_step": 2394, "epoch": 57} {"train_loss": -3.633460521697998, "global_step": 2395, "epoch": 57} {"train_loss": -3.5436038970947266, "global_step": 2396, "epoch": 57} {"train_loss": -3.3941903114318848, "global_step": 2397, "epoch": 57} {"train_loss": -3.7886853218078613, "global_step": 2398, "epoch": 57} {"train_loss": -3.6687660217285156, "global_step": 2399, "epoch": 57} {"train_loss": -3.670342445373535, "global_step": 2400, "epoch": 57} {"train_loss": -3.5597188472747803, "global_step": 2401, "epoch": 57} {"train_loss": -3.2858152389526367, "global_step": 2402, "epoch": 57} {"train_loss": -3.7481446266174316, "global_step": 2403, "epoch": 57} {"train_loss": -3.7191014289855957, "global_step": 2404, "epoch": 57} {"train_loss": -3.741650104522705, "global_step": 2405, "epoch": 57} {"train_loss": -3.560117244720459, "global_step": 2406, "epoch": 57} {"train_loss": -3.5069589614868164, "global_step": 2407, "epoch": 57} {"train_loss": -3.5931618213653564, "global_step": 2408, "epoch": 57} {"train_loss": -3.643098831176758, "global_step": 2409, "epoch": 57} {"train_loss": -3.5937681198120117, "global_step": 2410, "epoch": 57} {"train_loss": -3.5705628395080566, "global_step": 2411, "epoch": 57} {"train_loss": -3.530282974243164, "global_step": 2412, "epoch": 57} {"train_loss": -3.4537649154663086, "global_step": 2413, "epoch": 57} {"train_loss": -3.6945300102233887, "global_step": 2414, "epoch": 57} {"train_loss": -3.7597479820251465, "global_step": 2415, "epoch": 57} {"train_loss": -3.6646909713745117, "global_step": 2416, "epoch": 57} {"train_loss": -3.684429883956909, "global_step": 2417, "epoch": 57} {"train_loss": -3.5000572204589844, "global_step": 2418, "epoch": 57} {"train_loss": -3.64121150970459, "global_step": 2419, "epoch": 57} {"train_loss": -3.5907843112945557, "global_step": 2420, "epoch": 57} {"train_loss": -3.4522690773010254, "global_step": 2421, "epoch": 57} {"train_loss": -3.5707411766052246, "global_step": 2422, "epoch": 57} {"train_loss": -3.672635555267334, "global_step": 2423, "epoch": 57} {"train_loss": -3.468745470046997, "global_step": 2424, "epoch": 57} {"train_loss": -3.731149911880493, "global_step": 2425, "epoch": 57} {"train_loss": -3.7381036281585693, "global_step": 2426, "epoch": 57} {"train_loss": -3.52598237991333, "global_step": 2427, "epoch": 57} {"train_loss": -3.662938117980957, "global_step": 2428, "epoch": 57} {"train_loss": -3.560544490814209, "global_step": 2429, "epoch": 57} {"train_loss": -3.5156023502349854, "global_step": 2430, "epoch": 57} {"train_loss": -3.618345260620117, "global_step": 2431, "epoch": 57} {"train_loss": -3.5801992416381836, "global_step": 2432, "epoch": 57} {"train_loss": -3.494316577911377, "global_step": 2433, "epoch": 57} {"train_loss": -3.526848316192627, "global_step": 2434, "epoch": 57} {"train_loss": -3.593373457590739, "global_step": 2435, "epoch": 57, "val_loss": 206627.125} {"train_loss": -3.710160970687866, "global_step": 2436, "epoch": 58} {"train_loss": -3.365880012512207, "global_step": 2437, "epoch": 58} {"train_loss": -3.6116795539855957, "global_step": 2438, "epoch": 58} {"train_loss": -3.5405945777893066, "global_step": 2439, "epoch": 58} {"train_loss": -3.45065975189209, "global_step": 2440, "epoch": 58} {"train_loss": -3.722609758377075, "global_step": 2441, "epoch": 58} {"train_loss": -3.486459970474243, "global_step": 2442, "epoch": 58} {"train_loss": -3.6748900413513184, "global_step": 2443, "epoch": 58} {"train_loss": -3.494050979614258, "global_step": 2444, "epoch": 58} {"train_loss": -3.47269344329834, "global_step": 2445, "epoch": 58} {"train_loss": -3.4865829944610596, "global_step": 2446, "epoch": 58} {"train_loss": -3.4943692684173584, "global_step": 2447, "epoch": 58} {"train_loss": -3.5019655227661133, "global_step": 2448, "epoch": 58} {"train_loss": -3.4996883869171143, "global_step": 2449, "epoch": 58} {"train_loss": -3.5798373222351074, "global_step": 2450, "epoch": 58} {"train_loss": -3.469083309173584, "global_step": 2451, "epoch": 58} {"train_loss": -3.73980712890625, "global_step": 2452, "epoch": 58} {"train_loss": -3.4579153060913086, "global_step": 2453, "epoch": 58} {"train_loss": -3.651110887527466, "global_step": 2454, "epoch": 58} {"train_loss": -3.7429587841033936, "global_step": 2455, "epoch": 58} {"train_loss": -3.5352940559387207, "global_step": 2456, "epoch": 58} {"train_loss": -3.676360607147217, "global_step": 2457, "epoch": 58} {"train_loss": -3.597719192504883, "global_step": 2458, "epoch": 58} {"train_loss": -3.523285150527954, "global_step": 2459, "epoch": 58} {"train_loss": -3.606245279312134, "global_step": 2460, "epoch": 58} {"train_loss": -3.5742106437683105, "global_step": 2461, "epoch": 58} {"train_loss": -3.5267393589019775, "global_step": 2462, "epoch": 58} {"train_loss": -3.646595001220703, "global_step": 2463, "epoch": 58} {"train_loss": -3.487792491912842, "global_step": 2464, "epoch": 58} {"train_loss": -3.6412534713745117, "global_step": 2465, "epoch": 58} {"train_loss": -3.586190700531006, "global_step": 2466, "epoch": 58} {"train_loss": -3.6120429039001465, "global_step": 2467, "epoch": 58} {"train_loss": -3.550042152404785, "global_step": 2468, "epoch": 58} {"train_loss": -3.559255599975586, "global_step": 2469, "epoch": 58} {"train_loss": -3.4341864585876465, "global_step": 2470, "epoch": 58} {"train_loss": -3.5868327617645264, "global_step": 2471, "epoch": 58} {"train_loss": -3.426194190979004, "global_step": 2472, "epoch": 58} {"train_loss": -3.6455278396606445, "global_step": 2473, "epoch": 58} {"train_loss": -3.6467766761779785, "global_step": 2474, "epoch": 58} {"train_loss": -3.5489661693573, "global_step": 2475, "epoch": 58} {"train_loss": -3.6631698608398438, "global_step": 2476, "epoch": 58} {"train_loss": -3.566549227351234, "global_step": 2477, "epoch": 58, "val_loss": 198162.390625} {"train_loss": -3.6513142585754395, "global_step": 2478, "epoch": 59} {"train_loss": -3.5573978424072266, "global_step": 2479, "epoch": 59} {"train_loss": -3.5272274017333984, "global_step": 2480, "epoch": 59} {"train_loss": -3.4841322898864746, "global_step": 2481, "epoch": 59} {"train_loss": -3.421152114868164, "global_step": 2482, "epoch": 59} {"train_loss": -3.6654326915740967, "global_step": 2483, "epoch": 59} {"train_loss": -3.522763729095459, "global_step": 2484, "epoch": 59} {"train_loss": -3.6960439682006836, "global_step": 2485, "epoch": 59} {"train_loss": -3.5691778659820557, "global_step": 2486, "epoch": 59} {"train_loss": -3.659048080444336, "global_step": 2487, "epoch": 59} {"train_loss": -3.697779655456543, "global_step": 2488, "epoch": 59} {"train_loss": -3.5861315727233887, "global_step": 2489, "epoch": 59} {"train_loss": -3.616281032562256, "global_step": 2490, "epoch": 59} {"train_loss": -3.543536424636841, "global_step": 2491, "epoch": 59} {"train_loss": -3.854045867919922, "global_step": 2492, "epoch": 59} {"train_loss": -3.703293800354004, "global_step": 2493, "epoch": 59} {"train_loss": -3.772228956222534, "global_step": 2494, "epoch": 59} {"train_loss": -3.7011892795562744, "global_step": 2495, "epoch": 59} {"train_loss": -3.4293856620788574, "global_step": 2496, "epoch": 59} {"train_loss": -3.647308588027954, "global_step": 2497, "epoch": 59} {"train_loss": -3.7396535873413086, "global_step": 2498, "epoch": 59} {"train_loss": -3.759751796722412, "global_step": 2499, "epoch": 59} {"train_loss": -3.662212610244751, "global_step": 2500, "epoch": 59} {"train_loss": -3.517638683319092, "global_step": 2501, "epoch": 59} {"train_loss": -3.6652421951293945, "global_step": 2502, "epoch": 59} {"train_loss": -3.405730724334717, "global_step": 2503, "epoch": 59} {"train_loss": -3.602720260620117, "global_step": 2504, "epoch": 59} {"train_loss": -3.4301438331604004, "global_step": 2505, "epoch": 59} {"train_loss": -3.6364662647247314, "global_step": 2506, "epoch": 59} {"train_loss": -3.62984299659729, "global_step": 2507, "epoch": 59} {"train_loss": -3.799882411956787, "global_step": 2508, "epoch": 59} {"train_loss": -3.6470131874084473, "global_step": 2509, "epoch": 59} {"train_loss": -3.53971529006958, "global_step": 2510, "epoch": 59} {"train_loss": -3.707789897918701, "global_step": 2511, "epoch": 59} {"train_loss": -3.6861934661865234, "global_step": 2512, "epoch": 59} {"train_loss": -3.7174878120422363, "global_step": 2513, "epoch": 59} {"train_loss": -3.706270694732666, "global_step": 2514, "epoch": 59} {"train_loss": -3.646747589111328, "global_step": 2515, "epoch": 59} {"train_loss": -3.6119296550750732, "global_step": 2516, "epoch": 59} {"train_loss": -3.5525450706481934, "global_step": 2517, "epoch": 59} {"train_loss": -3.709573268890381, "global_step": 2518, "epoch": 59} {"train_loss": -3.633281770206633, "global_step": 2519, "epoch": 59, "val_loss": 198483.875} {"train_loss": -3.3632593154907227, "global_step": 2520, "epoch": 60} {"train_loss": -3.639888286590576, "global_step": 2521, "epoch": 60} {"train_loss": -3.544717311859131, "global_step": 2522, "epoch": 60} {"train_loss": -3.604579448699951, "global_step": 2523, "epoch": 60} {"train_loss": -3.487095832824707, "global_step": 2524, "epoch": 60} {"train_loss": -3.3396458625793457, "global_step": 2525, "epoch": 60} {"train_loss": -3.558539390563965, "global_step": 2526, "epoch": 60} {"train_loss": -3.526365280151367, "global_step": 2527, "epoch": 60} {"train_loss": -3.422886610031128, "global_step": 2528, "epoch": 60} {"train_loss": -3.591306447982788, "global_step": 2529, "epoch": 60} {"train_loss": -3.3033881187438965, "global_step": 2530, "epoch": 60} {"train_loss": -3.526836395263672, "global_step": 2531, "epoch": 60} {"train_loss": -3.2284188270568848, "global_step": 2532, "epoch": 60} {"train_loss": -3.5903704166412354, "global_step": 2533, "epoch": 60} {"train_loss": -3.5685384273529053, "global_step": 2534, "epoch": 60} {"train_loss": -3.7381458282470703, "global_step": 2535, "epoch": 60} {"train_loss": -3.4898781776428223, "global_step": 2536, "epoch": 60} {"train_loss": -3.5320866107940674, "global_step": 2537, "epoch": 60} {"train_loss": -3.451488971710205, "global_step": 2538, "epoch": 60} {"train_loss": -3.5245542526245117, "global_step": 2539, "epoch": 60} {"train_loss": -3.5496826171875, "global_step": 2540, "epoch": 60} {"train_loss": -3.467942714691162, "global_step": 2541, "epoch": 60} {"train_loss": -3.6611621379852295, "global_step": 2542, "epoch": 60} {"train_loss": -3.4667980670928955, "global_step": 2543, "epoch": 60} {"train_loss": -3.599928379058838, "global_step": 2544, "epoch": 60} {"train_loss": -3.577794075012207, "global_step": 2545, "epoch": 60} {"train_loss": -3.6708788871765137, "global_step": 2546, "epoch": 60} {"train_loss": -3.772709608078003, "global_step": 2547, "epoch": 60} {"train_loss": -3.6098427772521973, "global_step": 2548, "epoch": 60} {"train_loss": -3.7227730751037598, "global_step": 2549, "epoch": 60} {"train_loss": -3.740967273712158, "global_step": 2550, "epoch": 60} {"train_loss": -3.662271499633789, "global_step": 2551, "epoch": 60} {"train_loss": -3.656562328338623, "global_step": 2552, "epoch": 60} {"train_loss": -3.901228427886963, "global_step": 2553, "epoch": 60} {"train_loss": -3.8527302742004395, "global_step": 2554, "epoch": 60} {"train_loss": -3.7771952152252197, "global_step": 2555, "epoch": 60} {"train_loss": -3.718843936920166, "global_step": 2556, "epoch": 60} {"train_loss": -3.6954612731933594, "global_step": 2557, "epoch": 60} {"train_loss": -3.7207226753234863, "global_step": 2558, "epoch": 60} {"train_loss": -3.525723934173584, "global_step": 2559, "epoch": 60} {"train_loss": -3.6744351387023926, "global_step": 2560, "epoch": 60} {"train_loss": -3.5885700157710483, "global_step": 2561, "epoch": 60, "val_loss": 189370.390625} {"train_loss": -3.570563793182373, "global_step": 2562, "epoch": 61} {"train_loss": -3.625197649002075, "global_step": 2563, "epoch": 61} {"train_loss": -3.728855609893799, "global_step": 2564, "epoch": 61} {"train_loss": -3.7603001594543457, "global_step": 2565, "epoch": 61} {"train_loss": -3.6216354370117188, "global_step": 2566, "epoch": 61} {"train_loss": -3.635063409805298, "global_step": 2567, "epoch": 61} {"train_loss": -3.7267649173736572, "global_step": 2568, "epoch": 61} {"train_loss": -3.729604959487915, "global_step": 2569, "epoch": 61} {"train_loss": -3.7036681175231934, "global_step": 2570, "epoch": 61} {"train_loss": -3.593834638595581, "global_step": 2571, "epoch": 61} {"train_loss": -3.7975099086761475, "global_step": 2572, "epoch": 61} {"train_loss": -3.686762809753418, "global_step": 2573, "epoch": 61} {"train_loss": -3.711792469024658, "global_step": 2574, "epoch": 61} {"train_loss": -3.795236349105835, "global_step": 2575, "epoch": 61} {"train_loss": -3.719414234161377, "global_step": 2576, "epoch": 61} {"train_loss": -3.7277705669403076, "global_step": 2577, "epoch": 61} {"train_loss": -3.6556835174560547, "global_step": 2578, "epoch": 61} {"train_loss": -3.717283010482788, "global_step": 2579, "epoch": 61} {"train_loss": -3.6583330631256104, "global_step": 2580, "epoch": 61} {"train_loss": -3.795668601989746, "global_step": 2581, "epoch": 61} {"train_loss": -3.568493366241455, "global_step": 2582, "epoch": 61} {"train_loss": -3.755380153656006, "global_step": 2583, "epoch": 61} {"train_loss": -3.7199301719665527, "global_step": 2584, "epoch": 61} {"train_loss": -3.67175555229187, "global_step": 2585, "epoch": 61} {"train_loss": -3.834000825881958, "global_step": 2586, "epoch": 61} {"train_loss": -3.7369513511657715, "global_step": 2587, "epoch": 61} {"train_loss": -3.634026050567627, "global_step": 2588, "epoch": 61} {"train_loss": -3.584352731704712, "global_step": 2589, "epoch": 61} {"train_loss": -3.8164405822753906, "global_step": 2590, "epoch": 61} {"train_loss": -3.7055532932281494, "global_step": 2591, "epoch": 61} {"train_loss": -3.751396417617798, "global_step": 2592, "epoch": 61} {"train_loss": -3.795732021331787, "global_step": 2593, "epoch": 61} {"train_loss": -3.735654354095459, "global_step": 2594, "epoch": 61} {"train_loss": -3.775082588195801, "global_step": 2595, "epoch": 61} {"train_loss": -3.626720905303955, "global_step": 2596, "epoch": 61} {"train_loss": -3.6669726371765137, "global_step": 2597, "epoch": 61} {"train_loss": -3.666632652282715, "global_step": 2598, "epoch": 61} {"train_loss": -3.7867519855499268, "global_step": 2599, "epoch": 61} {"train_loss": -3.865079641342163, "global_step": 2600, "epoch": 61} {"train_loss": -3.9355990886688232, "global_step": 2601, "epoch": 61} {"train_loss": -3.6369662284851074, "global_step": 2602, "epoch": 61} {"train_loss": -3.714344694500878, "global_step": 2603, "epoch": 61, "val_loss": 181849.609375} {"train_loss": -3.8099865913391113, "global_step": 2604, "epoch": 62} {"train_loss": -3.7431111335754395, "global_step": 2605, "epoch": 62} {"train_loss": -3.7158284187316895, "global_step": 2606, "epoch": 62} {"train_loss": -3.6910953521728516, "global_step": 2607, "epoch": 62} {"train_loss": -3.854184627532959, "global_step": 2608, "epoch": 62} {"train_loss": -3.7268495559692383, "global_step": 2609, "epoch": 62} {"train_loss": -3.6226563453674316, "global_step": 2610, "epoch": 62} {"train_loss": -3.585439682006836, "global_step": 2611, "epoch": 62} {"train_loss": -3.865144729614258, "global_step": 2612, "epoch": 62} {"train_loss": -3.561431884765625, "global_step": 2613, "epoch": 62} {"train_loss": -3.65944242477417, "global_step": 2614, "epoch": 62} {"train_loss": -3.8966641426086426, "global_step": 2615, "epoch": 62} {"train_loss": -3.5280728340148926, "global_step": 2616, "epoch": 62} {"train_loss": -3.511401653289795, "global_step": 2617, "epoch": 62} {"train_loss": -3.6432533264160156, "global_step": 2618, "epoch": 62} {"train_loss": -3.7856340408325195, "global_step": 2619, "epoch": 62} {"train_loss": -3.667036533355713, "global_step": 2620, "epoch": 62} {"train_loss": -3.7064051628112793, "global_step": 2621, "epoch": 62} {"train_loss": -3.6724886894226074, "global_step": 2622, "epoch": 62} {"train_loss": -3.4001877307891846, "global_step": 2623, "epoch": 62} {"train_loss": -3.6741907596588135, "global_step": 2624, "epoch": 62} {"train_loss": -3.328265905380249, "global_step": 2625, "epoch": 62} {"train_loss": -3.548118829727173, "global_step": 2626, "epoch": 62} {"train_loss": -3.5225026607513428, "global_step": 2627, "epoch": 62} {"train_loss": -3.449162483215332, "global_step": 2628, "epoch": 62} {"train_loss": -3.687391757965088, "global_step": 2629, "epoch": 62} {"train_loss": -3.5199038982391357, "global_step": 2630, "epoch": 62} {"train_loss": -3.526383876800537, "global_step": 2631, "epoch": 62} {"train_loss": -3.6353812217712402, "global_step": 2632, "epoch": 62} {"train_loss": -3.4978973865509033, "global_step": 2633, "epoch": 62} {"train_loss": -3.6767849922180176, "global_step": 2634, "epoch": 62} {"train_loss": -3.5986223220825195, "global_step": 2635, "epoch": 62} {"train_loss": -3.685614824295044, "global_step": 2636, "epoch": 62} {"train_loss": -3.6545872688293457, "global_step": 2637, "epoch": 62} {"train_loss": -3.5311222076416016, "global_step": 2638, "epoch": 62} {"train_loss": -3.7159957885742188, "global_step": 2639, "epoch": 62} {"train_loss": -3.515291452407837, "global_step": 2640, "epoch": 62} {"train_loss": -3.6896603107452393, "global_step": 2641, "epoch": 62} {"train_loss": -3.499880313873291, "global_step": 2642, "epoch": 62} {"train_loss": -3.779672622680664, "global_step": 2643, "epoch": 62} {"train_loss": -3.6200759410858154, "global_step": 2644, "epoch": 62} {"train_loss": -3.6387411128906977, "global_step": 2645, "epoch": 62, "val_loss": 174359.109375} {"train_loss": -3.711611032485962, "global_step": 2646, "epoch": 63} {"train_loss": -3.770602226257324, "global_step": 2647, "epoch": 63} {"train_loss": -3.762502670288086, "global_step": 2648, "epoch": 63} {"train_loss": -3.734602928161621, "global_step": 2649, "epoch": 63} {"train_loss": -3.694430351257324, "global_step": 2650, "epoch": 63} {"train_loss": -3.8617711067199707, "global_step": 2651, "epoch": 63} {"train_loss": -3.806990146636963, "global_step": 2652, "epoch": 63} {"train_loss": -3.887564182281494, "global_step": 2653, "epoch": 63} {"train_loss": -3.6611080169677734, "global_step": 2654, "epoch": 63} {"train_loss": -3.730832576751709, "global_step": 2655, "epoch": 63} {"train_loss": -3.6933465003967285, "global_step": 2656, "epoch": 63} {"train_loss": -3.7814478874206543, "global_step": 2657, "epoch": 63} {"train_loss": -3.744080066680908, "global_step": 2658, "epoch": 63} {"train_loss": -3.71108078956604, "global_step": 2659, "epoch": 63} {"train_loss": -3.7722930908203125, "global_step": 2660, "epoch": 63} {"train_loss": -3.6855525970458984, "global_step": 2661, "epoch": 63} {"train_loss": -3.7539100646972656, "global_step": 2662, "epoch": 63} {"train_loss": -3.8932759761810303, "global_step": 2663, "epoch": 63} {"train_loss": -3.7092833518981934, "global_step": 2664, "epoch": 63} {"train_loss": -3.6774120330810547, "global_step": 2665, "epoch": 63} {"train_loss": -3.8111352920532227, "global_step": 2666, "epoch": 63} {"train_loss": -3.780385732650757, "global_step": 2667, "epoch": 63} {"train_loss": -3.9686031341552734, "global_step": 2668, "epoch": 63} {"train_loss": -3.8738059997558594, "global_step": 2669, "epoch": 63} {"train_loss": -3.7810604572296143, "global_step": 2670, "epoch": 63} {"train_loss": -3.601750373840332, "global_step": 2671, "epoch": 63} {"train_loss": -3.9346933364868164, "global_step": 2672, "epoch": 63} {"train_loss": -3.889833927154541, "global_step": 2673, "epoch": 63} {"train_loss": -3.644672155380249, "global_step": 2674, "epoch": 63} {"train_loss": -3.7295584678649902, "global_step": 2675, "epoch": 63} {"train_loss": -3.719180107116699, "global_step": 2676, "epoch": 63} {"train_loss": -3.679647922515869, "global_step": 2677, "epoch": 63} {"train_loss": -3.8817930221557617, "global_step": 2678, "epoch": 63} {"train_loss": -3.8785204887390137, "global_step": 2679, "epoch": 63} {"train_loss": -3.8454995155334473, "global_step": 2680, "epoch": 63} {"train_loss": -3.8457367420196533, "global_step": 2681, "epoch": 63} {"train_loss": -3.645228624343872, "global_step": 2682, "epoch": 63} {"train_loss": -3.704163074493408, "global_step": 2683, "epoch": 63} {"train_loss": -3.775301456451416, "global_step": 2684, "epoch": 63} {"train_loss": -3.718470573425293, "global_step": 2685, "epoch": 63} {"train_loss": -3.902689218521118, "global_step": 2686, "epoch": 63} {"train_loss": -3.774067203203837, "global_step": 2687, "epoch": 63, "val_loss": 169138.359375} {"train_loss": -3.8640007972717285, "global_step": 2688, "epoch": 64} {"train_loss": -3.84674072265625, "global_step": 2689, "epoch": 64} {"train_loss": -3.768489360809326, "global_step": 2690, "epoch": 64} {"train_loss": -3.743511915206909, "global_step": 2691, "epoch": 64} {"train_loss": -3.8366446495056152, "global_step": 2692, "epoch": 64} {"train_loss": -3.815605640411377, "global_step": 2693, "epoch": 64} {"train_loss": -3.6448683738708496, "global_step": 2694, "epoch": 64} {"train_loss": -3.875826120376587, "global_step": 2695, "epoch": 64} {"train_loss": -3.7014718055725098, "global_step": 2696, "epoch": 64} {"train_loss": -3.803162097930908, "global_step": 2697, "epoch": 64} {"train_loss": -3.8737213611602783, "global_step": 2698, "epoch": 64} {"train_loss": -3.722714900970459, "global_step": 2699, "epoch": 64} {"train_loss": -3.7435739040374756, "global_step": 2700, "epoch": 64} {"train_loss": -3.7294914722442627, "global_step": 2701, "epoch": 64} {"train_loss": -3.782219171524048, "global_step": 2702, "epoch": 64} {"train_loss": -3.7984399795532227, "global_step": 2703, "epoch": 64} {"train_loss": -3.78727126121521, "global_step": 2704, "epoch": 64} {"train_loss": -3.8192379474639893, "global_step": 2705, "epoch": 64} {"train_loss": -3.733787775039673, "global_step": 2706, "epoch": 64} {"train_loss": -3.601424217224121, "global_step": 2707, "epoch": 64} {"train_loss": -3.6323909759521484, "global_step": 2708, "epoch": 64} {"train_loss": -3.879070281982422, "global_step": 2709, "epoch": 64} {"train_loss": -3.6641435623168945, "global_step": 2710, "epoch": 64} {"train_loss": -3.792754650115967, "global_step": 2711, "epoch": 64} {"train_loss": -3.7852025032043457, "global_step": 2712, "epoch": 64} {"train_loss": -3.572415828704834, "global_step": 2713, "epoch": 64} {"train_loss": -3.695787191390991, "global_step": 2714, "epoch": 64} {"train_loss": -3.8616104125976562, "global_step": 2715, "epoch": 64} {"train_loss": -3.4349236488342285, "global_step": 2716, "epoch": 64} {"train_loss": -3.7539424896240234, "global_step": 2717, "epoch": 64} {"train_loss": -3.546259641647339, "global_step": 2718, "epoch": 64} {"train_loss": -3.63401460647583, "global_step": 2719, "epoch": 64} {"train_loss": -3.649531602859497, "global_step": 2720, "epoch": 64} {"train_loss": -3.6089227199554443, "global_step": 2721, "epoch": 64} {"train_loss": -3.6409566402435303, "global_step": 2722, "epoch": 64} {"train_loss": -3.8065690994262695, "global_step": 2723, "epoch": 64} {"train_loss": -3.548511266708374, "global_step": 2724, "epoch": 64} {"train_loss": -3.5288050174713135, "global_step": 2725, "epoch": 64} {"train_loss": -3.7151174545288086, "global_step": 2726, "epoch": 64} {"train_loss": -3.4871599674224854, "global_step": 2727, "epoch": 64} {"train_loss": -3.8445935249328613, "global_step": 2728, "epoch": 64} {"train_loss": -3.7157204945882163, "global_step": 2729, "epoch": 64, "val_loss": 167790.46875} {"train_loss": -3.8421459197998047, "global_step": 2730, "epoch": 65} {"train_loss": -3.6772258281707764, "global_step": 2731, "epoch": 65} {"train_loss": -3.6939456462860107, "global_step": 2732, "epoch": 65} {"train_loss": -3.6840758323669434, "global_step": 2733, "epoch": 65} {"train_loss": -3.582395076751709, "global_step": 2734, "epoch": 65} {"train_loss": -3.7975878715515137, "global_step": 2735, "epoch": 65} {"train_loss": -3.614680767059326, "global_step": 2736, "epoch": 65} {"train_loss": -3.779939651489258, "global_step": 2737, "epoch": 65} {"train_loss": -3.827777624130249, "global_step": 2738, "epoch": 65} {"train_loss": -3.745319128036499, "global_step": 2739, "epoch": 65} {"train_loss": -3.674403667449951, "global_step": 2740, "epoch": 65} {"train_loss": -3.760457992553711, "global_step": 2741, "epoch": 65} {"train_loss": -3.8576085567474365, "global_step": 2742, "epoch": 65} {"train_loss": -3.722100257873535, "global_step": 2743, "epoch": 65} {"train_loss": -3.6851887702941895, "global_step": 2744, "epoch": 65} {"train_loss": -3.847729444503784, "global_step": 2745, "epoch": 65} {"train_loss": -3.828457832336426, "global_step": 2746, "epoch": 65} {"train_loss": -3.718804359436035, "global_step": 2747, "epoch": 65} {"train_loss": -3.7246997356414795, "global_step": 2748, "epoch": 65} {"train_loss": -3.737485408782959, "global_step": 2749, "epoch": 65} {"train_loss": -3.7679288387298584, "global_step": 2750, "epoch": 65} {"train_loss": -3.8118152618408203, "global_step": 2751, "epoch": 65} {"train_loss": -3.9194793701171875, "global_step": 2752, "epoch": 65} {"train_loss": -3.904526710510254, "global_step": 2753, "epoch": 65} {"train_loss": -3.6986989974975586, "global_step": 2754, "epoch": 65} {"train_loss": -3.6662518978118896, "global_step": 2755, "epoch": 65} {"train_loss": -3.8166439533233643, "global_step": 2756, "epoch": 65} {"train_loss": -3.571120262145996, "global_step": 2757, "epoch": 65} {"train_loss": -3.650068759918213, "global_step": 2758, "epoch": 65} {"train_loss": -3.6556777954101562, "global_step": 2759, "epoch": 65} {"train_loss": -3.9695065021514893, "global_step": 2760, "epoch": 65} {"train_loss": -3.848588228225708, "global_step": 2761, "epoch": 65} {"train_loss": -3.634556531906128, "global_step": 2762, "epoch": 65} {"train_loss": -3.816046714782715, "global_step": 2763, "epoch": 65} {"train_loss": -3.7216527462005615, "global_step": 2764, "epoch": 65} {"train_loss": -3.884420871734619, "global_step": 2765, "epoch": 65} {"train_loss": -3.912968158721924, "global_step": 2766, "epoch": 65} {"train_loss": -3.830869197845459, "global_step": 2767, "epoch": 65} {"train_loss": -3.7281877994537354, "global_step": 2768, "epoch": 65} {"train_loss": -3.8214645385742188, "global_step": 2769, "epoch": 65} {"train_loss": -3.7498040199279785, "global_step": 2770, "epoch": 65} {"train_loss": -3.7617685227167037, "global_step": 2771, "epoch": 65, "val_loss": 162610.5625} {"train_loss": -3.7955129146575928, "global_step": 2772, "epoch": 66} {"train_loss": -3.7692618370056152, "global_step": 2773, "epoch": 66} {"train_loss": -3.8685293197631836, "global_step": 2774, "epoch": 66} {"train_loss": -3.81943416595459, "global_step": 2775, "epoch": 66} {"train_loss": -3.7876241207122803, "global_step": 2776, "epoch": 66} {"train_loss": -3.879901647567749, "global_step": 2777, "epoch": 66} {"train_loss": -3.94529390335083, "global_step": 2778, "epoch": 66} {"train_loss": -3.8905041217803955, "global_step": 2779, "epoch": 66} {"train_loss": -3.771088123321533, "global_step": 2780, "epoch": 66} {"train_loss": -3.7991766929626465, "global_step": 2781, "epoch": 66} {"train_loss": -3.8798422813415527, "global_step": 2782, "epoch": 66} {"train_loss": -3.836850643157959, "global_step": 2783, "epoch": 66} {"train_loss": -3.797638416290283, "global_step": 2784, "epoch": 66} {"train_loss": -3.7829043865203857, "global_step": 2785, "epoch": 66} {"train_loss": -3.8722989559173584, "global_step": 2786, "epoch": 66} {"train_loss": -3.882607936859131, "global_step": 2787, "epoch": 66} {"train_loss": -3.9486160278320312, "global_step": 2788, "epoch": 66} {"train_loss": -3.984675407409668, "global_step": 2789, "epoch": 66} {"train_loss": -3.6998424530029297, "global_step": 2790, "epoch": 66} {"train_loss": -4.125916004180908, "global_step": 2791, "epoch": 66} {"train_loss": -3.894376516342163, "global_step": 2792, "epoch": 66} {"train_loss": -3.8156793117523193, "global_step": 2793, "epoch": 66} {"train_loss": -3.724508762359619, "global_step": 2794, "epoch": 66} {"train_loss": -3.993896484375, "global_step": 2795, "epoch": 66} {"train_loss": -3.788900375366211, "global_step": 2796, "epoch": 66} {"train_loss": -3.740387201309204, "global_step": 2797, "epoch": 66} {"train_loss": -3.9420392513275146, "global_step": 2798, "epoch": 66} {"train_loss": -3.9029035568237305, "global_step": 2799, "epoch": 66} {"train_loss": -3.9369378089904785, "global_step": 2800, "epoch": 66} {"train_loss": -3.711520195007324, "global_step": 2801, "epoch": 66} {"train_loss": -3.8252358436584473, "global_step": 2802, "epoch": 66} {"train_loss": -3.8698363304138184, "global_step": 2803, "epoch": 66} {"train_loss": -3.834146022796631, "global_step": 2804, "epoch": 66} {"train_loss": -3.867905616760254, "global_step": 2805, "epoch": 66} {"train_loss": -3.8043055534362793, "global_step": 2806, "epoch": 66} {"train_loss": -3.8640050888061523, "global_step": 2807, "epoch": 66} {"train_loss": -3.7267022132873535, "global_step": 2808, "epoch": 66} {"train_loss": -3.674516201019287, "global_step": 2809, "epoch": 66} {"train_loss": -3.7132341861724854, "global_step": 2810, "epoch": 66} {"train_loss": -3.6488325595855713, "global_step": 2811, "epoch": 66} {"train_loss": -3.7807974815368652, "global_step": 2812, "epoch": 66} {"train_loss": -3.836963403792608, "global_step": 2813, "epoch": 66, "val_loss": 159173.8125} {"train_loss": -3.7094788551330566, "global_step": 2814, "epoch": 67} {"train_loss": -3.8515851497650146, "global_step": 2815, "epoch": 67} {"train_loss": -3.7918858528137207, "global_step": 2816, "epoch": 67} {"train_loss": -3.923591136932373, "global_step": 2817, "epoch": 67} {"train_loss": -3.951505184173584, "global_step": 2818, "epoch": 67} {"train_loss": -3.8803563117980957, "global_step": 2819, "epoch": 67} {"train_loss": -3.7964792251586914, "global_step": 2820, "epoch": 67} {"train_loss": -3.8957836627960205, "global_step": 2821, "epoch": 67} {"train_loss": -3.681382656097412, "global_step": 2822, "epoch": 67} {"train_loss": -3.897568702697754, "global_step": 2823, "epoch": 67} {"train_loss": -3.8330671787261963, "global_step": 2824, "epoch": 67} {"train_loss": -3.8906350135803223, "global_step": 2825, "epoch": 67} {"train_loss": -3.9557878971099854, "global_step": 2826, "epoch": 67} {"train_loss": -3.957577705383301, "global_step": 2827, "epoch": 67} {"train_loss": -4.002353191375732, "global_step": 2828, "epoch": 67} {"train_loss": -3.798053741455078, "global_step": 2829, "epoch": 67} {"train_loss": -3.7847237586975098, "global_step": 2830, "epoch": 67} {"train_loss": -3.8738746643066406, "global_step": 2831, "epoch": 67} {"train_loss": -3.7532460689544678, "global_step": 2832, "epoch": 67} {"train_loss": -3.8072710037231445, "global_step": 2833, "epoch": 67} {"train_loss": -3.820084571838379, "global_step": 2834, "epoch": 67} {"train_loss": -3.945511817932129, "global_step": 2835, "epoch": 67} {"train_loss": -3.8803133964538574, "global_step": 2836, "epoch": 67} {"train_loss": -3.7580487728118896, "global_step": 2837, "epoch": 67} {"train_loss": -3.7381591796875, "global_step": 2838, "epoch": 67} {"train_loss": -3.9753308296203613, "global_step": 2839, "epoch": 67} {"train_loss": -3.8377723693847656, "global_step": 2840, "epoch": 67} {"train_loss": -3.825641393661499, "global_step": 2841, "epoch": 67} {"train_loss": -3.7447736263275146, "global_step": 2842, "epoch": 67} {"train_loss": -3.97891902923584, "global_step": 2843, "epoch": 67} {"train_loss": -3.909320592880249, "global_step": 2844, "epoch": 67} {"train_loss": -3.8967580795288086, "global_step": 2845, "epoch": 67} {"train_loss": -3.762894630432129, "global_step": 2846, "epoch": 67} {"train_loss": -3.8187255859375, "global_step": 2847, "epoch": 67} {"train_loss": -4.065998077392578, "global_step": 2848, "epoch": 67} {"train_loss": -3.7252368927001953, "global_step": 2849, "epoch": 67} {"train_loss": -3.8499646186828613, "global_step": 2850, "epoch": 67} {"train_loss": -3.865493059158325, "global_step": 2851, "epoch": 67} {"train_loss": -4.024099349975586, "global_step": 2852, "epoch": 67} {"train_loss": -4.035989761352539, "global_step": 2853, "epoch": 67} {"train_loss": -3.825355291366577, "global_step": 2854, "epoch": 67} {"train_loss": -3.863887134052458, "global_step": 2855, "epoch": 67, "val_loss": 152946.0625} {"train_loss": -3.84814190864563, "global_step": 2856, "epoch": 68} {"train_loss": -3.784501075744629, "global_step": 2857, "epoch": 68} {"train_loss": -3.8028769493103027, "global_step": 2858, "epoch": 68} {"train_loss": -3.7986667156219482, "global_step": 2859, "epoch": 68} {"train_loss": -3.9171316623687744, "global_step": 2860, "epoch": 68} {"train_loss": -3.8226613998413086, "global_step": 2861, "epoch": 68} {"train_loss": -3.801727294921875, "global_step": 2862, "epoch": 68} {"train_loss": -3.8503036499023438, "global_step": 2863, "epoch": 68} {"train_loss": -3.7047767639160156, "global_step": 2864, "epoch": 68} {"train_loss": -3.6226162910461426, "global_step": 2865, "epoch": 68} {"train_loss": -3.8832240104675293, "global_step": 2866, "epoch": 68} {"train_loss": -3.900559663772583, "global_step": 2867, "epoch": 68} {"train_loss": -3.606839418411255, "global_step": 2868, "epoch": 68} {"train_loss": -3.9481167793273926, "global_step": 2869, "epoch": 68} {"train_loss": -3.741790294647217, "global_step": 2870, "epoch": 68} {"train_loss": -3.821031093597412, "global_step": 2871, "epoch": 68} {"train_loss": -3.96073055267334, "global_step": 2872, "epoch": 68} {"train_loss": -3.834340810775757, "global_step": 2873, "epoch": 68} {"train_loss": -3.943147659301758, "global_step": 2874, "epoch": 68} {"train_loss": -4.019248008728027, "global_step": 2875, "epoch": 68} {"train_loss": -3.9134254455566406, "global_step": 2876, "epoch": 68} {"train_loss": -3.816106081008911, "global_step": 2877, "epoch": 68} {"train_loss": -4.018333435058594, "global_step": 2878, "epoch": 68} {"train_loss": -3.74168062210083, "global_step": 2879, "epoch": 68} {"train_loss": -3.87977933883667, "global_step": 2880, "epoch": 68} {"train_loss": -3.9786980152130127, "global_step": 2881, "epoch": 68} {"train_loss": -3.740302562713623, "global_step": 2882, "epoch": 68} {"train_loss": -3.8198704719543457, "global_step": 2883, "epoch": 68} {"train_loss": -3.813009262084961, "global_step": 2884, "epoch": 68} {"train_loss": -3.912987232208252, "global_step": 2885, "epoch": 68} {"train_loss": -3.8739354610443115, "global_step": 2886, "epoch": 68} {"train_loss": -3.9588522911071777, "global_step": 2887, "epoch": 68} {"train_loss": -3.9913103580474854, "global_step": 2888, "epoch": 68} {"train_loss": -3.869675397872925, "global_step": 2889, "epoch": 68} {"train_loss": -3.9113290309906006, "global_step": 2890, "epoch": 68} {"train_loss": -3.991209030151367, "global_step": 2891, "epoch": 68} {"train_loss": -3.907172203063965, "global_step": 2892, "epoch": 68} {"train_loss": -3.77738618850708, "global_step": 2893, "epoch": 68} {"train_loss": -3.932487964630127, "global_step": 2894, "epoch": 68} {"train_loss": -3.7726223468780518, "global_step": 2895, "epoch": 68} {"train_loss": -3.9572625160217285, "global_step": 2896, "epoch": 68} {"train_loss": -3.8616485879534768, "global_step": 2897, "epoch": 68, "val_loss": 151793.203125} {"train_loss": -3.8810486793518066, "global_step": 2898, "epoch": 69} {"train_loss": -3.8104586601257324, "global_step": 2899, "epoch": 69} {"train_loss": -3.6903650760650635, "global_step": 2900, "epoch": 69} {"train_loss": -3.975250720977783, "global_step": 2901, "epoch": 69} {"train_loss": -4.000422477722168, "global_step": 2902, "epoch": 69} {"train_loss": -3.893616199493408, "global_step": 2903, "epoch": 69} {"train_loss": -4.001166820526123, "global_step": 2904, "epoch": 69} {"train_loss": -3.9239308834075928, "global_step": 2905, "epoch": 69} {"train_loss": -3.7895240783691406, "global_step": 2906, "epoch": 69} {"train_loss": -3.8964548110961914, "global_step": 2907, "epoch": 69} {"train_loss": -3.9217634201049805, "global_step": 2908, "epoch": 69} {"train_loss": -3.917518138885498, "global_step": 2909, "epoch": 69} {"train_loss": -3.746622323989868, "global_step": 2910, "epoch": 69} {"train_loss": -3.923189163208008, "global_step": 2911, "epoch": 69} {"train_loss": -3.8620641231536865, "global_step": 2912, "epoch": 69} {"train_loss": -3.88305401802063, "global_step": 2913, "epoch": 69} {"train_loss": -3.8418784141540527, "global_step": 2914, "epoch": 69} {"train_loss": -3.911938190460205, "global_step": 2915, "epoch": 69} {"train_loss": -3.8885128498077393, "global_step": 2916, "epoch": 69} {"train_loss": -3.963318347930908, "global_step": 2917, "epoch": 69} {"train_loss": -3.8880767822265625, "global_step": 2918, "epoch": 69} {"train_loss": -3.962324857711792, "global_step": 2919, "epoch": 69} {"train_loss": -4.041823387145996, "global_step": 2920, "epoch": 69} {"train_loss": -3.996612787246704, "global_step": 2921, "epoch": 69} {"train_loss": -3.8654584884643555, "global_step": 2922, "epoch": 69} {"train_loss": -3.970646858215332, "global_step": 2923, "epoch": 69} {"train_loss": -3.726044178009033, "global_step": 2924, "epoch": 69} {"train_loss": -4.084036827087402, "global_step": 2925, "epoch": 69} {"train_loss": -3.804351806640625, "global_step": 2926, "epoch": 69} {"train_loss": -3.8511576652526855, "global_step": 2927, "epoch": 69} {"train_loss": -3.838839054107666, "global_step": 2928, "epoch": 69} {"train_loss": -3.8169426918029785, "global_step": 2929, "epoch": 69} {"train_loss": -3.7198729515075684, "global_step": 2930, "epoch": 69} {"train_loss": -3.7807226181030273, "global_step": 2931, "epoch": 69} {"train_loss": -3.8517227172851562, "global_step": 2932, "epoch": 69} {"train_loss": -3.5718884468078613, "global_step": 2933, "epoch": 69} {"train_loss": -3.964125871658325, "global_step": 2934, "epoch": 69} {"train_loss": -3.520838975906372, "global_step": 2935, "epoch": 69} {"train_loss": -3.914517879486084, "global_step": 2936, "epoch": 69} {"train_loss": -3.4919047355651855, "global_step": 2937, "epoch": 69} {"train_loss": -3.406435489654541, "global_step": 2938, "epoch": 69} {"train_loss": -3.8407208976291476, "global_step": 2939, "epoch": 69, "val_loss": 151398.890625} {"train_loss": -3.7310709953308105, "global_step": 2940, "epoch": 70} {"train_loss": -3.088848114013672, "global_step": 2941, "epoch": 70} {"train_loss": -3.515340805053711, "global_step": 2942, "epoch": 70} {"train_loss": -3.194484233856201, "global_step": 2943, "epoch": 70} {"train_loss": -3.2893524169921875, "global_step": 2944, "epoch": 70} {"train_loss": -3.5573809146881104, "global_step": 2945, "epoch": 70} {"train_loss": -3.3870015144348145, "global_step": 2946, "epoch": 70} {"train_loss": -3.5825283527374268, "global_step": 2947, "epoch": 70} {"train_loss": -3.6316142082214355, "global_step": 2948, "epoch": 70} {"train_loss": -3.6127896308898926, "global_step": 2949, "epoch": 70} {"train_loss": -3.5506131649017334, "global_step": 2950, "epoch": 70} {"train_loss": -3.461005449295044, "global_step": 2951, "epoch": 70} {"train_loss": -3.653512954711914, "global_step": 2952, "epoch": 70} {"train_loss": -3.812376022338867, "global_step": 2953, "epoch": 70} {"train_loss": -3.7891592979431152, "global_step": 2954, "epoch": 70} {"train_loss": -3.7411842346191406, "global_step": 2955, "epoch": 70} {"train_loss": -3.6010501384735107, "global_step": 2956, "epoch": 70} {"train_loss": -3.7923507690429688, "global_step": 2957, "epoch": 70} {"train_loss": -3.8454251289367676, "global_step": 2958, "epoch": 70} {"train_loss": -3.7789576053619385, "global_step": 2959, "epoch": 70} {"train_loss": -3.79856014251709, "global_step": 2960, "epoch": 70} {"train_loss": -3.811607837677002, "global_step": 2961, "epoch": 70} {"train_loss": -3.8726422786712646, "global_step": 2962, "epoch": 70} {"train_loss": -3.8447818756103516, "global_step": 2963, "epoch": 70} {"train_loss": -3.8039698600769043, "global_step": 2964, "epoch": 70} {"train_loss": -3.7685012817382812, "global_step": 2965, "epoch": 70} {"train_loss": -3.854443073272705, "global_step": 2966, "epoch": 70} {"train_loss": -3.9430880546569824, "global_step": 2967, "epoch": 70} {"train_loss": -3.8189566135406494, "global_step": 2968, "epoch": 70} {"train_loss": -3.884549140930176, "global_step": 2969, "epoch": 70} {"train_loss": -3.9415066242218018, "global_step": 2970, "epoch": 70} {"train_loss": -3.8703153133392334, "global_step": 2971, "epoch": 70} {"train_loss": -3.6443610191345215, "global_step": 2972, "epoch": 70} {"train_loss": -3.8685035705566406, "global_step": 2973, "epoch": 70} {"train_loss": -3.9376161098480225, "global_step": 2974, "epoch": 70} {"train_loss": -3.8397889137268066, "global_step": 2975, "epoch": 70} {"train_loss": -4.001499652862549, "global_step": 2976, "epoch": 70} {"train_loss": -3.840686321258545, "global_step": 2977, "epoch": 70} {"train_loss": -3.922597885131836, "global_step": 2978, "epoch": 70} {"train_loss": -3.911548137664795, "global_step": 2979, "epoch": 70} {"train_loss": -3.8447086811065674, "global_step": 2980, "epoch": 70} {"train_loss": -3.7330465770903087, "global_step": 2981, "epoch": 70, "val_loss": 146653.96875} {"train_loss": -3.8042538166046143, "global_step": 2982, "epoch": 71} {"train_loss": -3.8935294151306152, "global_step": 2983, "epoch": 71} {"train_loss": -4.017312049865723, "global_step": 2984, "epoch": 71} {"train_loss": -3.8603150844573975, "global_step": 2985, "epoch": 71} {"train_loss": -3.720025062561035, "global_step": 2986, "epoch": 71} {"train_loss": -3.961489200592041, "global_step": 2987, "epoch": 71} {"train_loss": -3.7058420181274414, "global_step": 2988, "epoch": 71} {"train_loss": -3.8001794815063477, "global_step": 2989, "epoch": 71} {"train_loss": -4.008465766906738, "global_step": 2990, "epoch": 71} {"train_loss": -3.8678698539733887, "global_step": 2991, "epoch": 71} {"train_loss": -3.9617300033569336, "global_step": 2992, "epoch": 71} {"train_loss": -3.8323285579681396, "global_step": 2993, "epoch": 71} {"train_loss": -3.9784364700317383, "global_step": 2994, "epoch": 71} {"train_loss": -4.055634021759033, "global_step": 2995, "epoch": 71} {"train_loss": -3.9127206802368164, "global_step": 2996, "epoch": 71} {"train_loss": -3.7829909324645996, "global_step": 2997, "epoch": 71} {"train_loss": -3.99603271484375, "global_step": 2998, "epoch": 71} {"train_loss": -3.8290770053863525, "global_step": 2999, "epoch": 71} {"train_loss": -3.9003195762634277, "global_step": 3000, "epoch": 71} {"train_loss": -3.9711549282073975, "global_step": 3001, "epoch": 71} {"train_loss": -3.8664727210998535, "global_step": 3002, "epoch": 71} {"train_loss": -3.8070662021636963, "global_step": 3003, "epoch": 71} {"train_loss": -3.950875997543335, "global_step": 3004, "epoch": 71} {"train_loss": -3.946539878845215, "global_step": 3005, "epoch": 71} {"train_loss": -3.918666362762451, "global_step": 3006, "epoch": 71} {"train_loss": -3.93692684173584, "global_step": 3007, "epoch": 71} {"train_loss": -3.9415183067321777, "global_step": 3008, "epoch": 71} {"train_loss": -4.01863431930542, "global_step": 3009, "epoch": 71} {"train_loss": -3.9856321811676025, "global_step": 3010, "epoch": 71} {"train_loss": -4.014001369476318, "global_step": 3011, "epoch": 71} {"train_loss": -3.845062732696533, "global_step": 3012, "epoch": 71} {"train_loss": -3.9885363578796387, "global_step": 3013, "epoch": 71} {"train_loss": -4.006195545196533, "global_step": 3014, "epoch": 71} {"train_loss": -4.116448879241943, "global_step": 3015, "epoch": 71} {"train_loss": -3.8791451454162598, "global_step": 3016, "epoch": 71} {"train_loss": -3.9532787799835205, "global_step": 3017, "epoch": 71} {"train_loss": -4.0487260818481445, "global_step": 3018, "epoch": 71} {"train_loss": -3.9934468269348145, "global_step": 3019, "epoch": 71} {"train_loss": -3.946157932281494, "global_step": 3020, "epoch": 71} {"train_loss": -4.081308364868164, "global_step": 3021, "epoch": 71} {"train_loss": -3.84794282913208, "global_step": 3022, "epoch": 71} {"train_loss": -3.9233109383356, "global_step": 3023, "epoch": 71, "val_loss": 142542.0625} {"train_loss": -3.918929100036621, "global_step": 3024, "epoch": 72} {"train_loss": -3.8802456855773926, "global_step": 3025, "epoch": 72} {"train_loss": -3.740741491317749, "global_step": 3026, "epoch": 72} {"train_loss": -3.9399194717407227, "global_step": 3027, "epoch": 72} {"train_loss": -3.966391086578369, "global_step": 3028, "epoch": 72} {"train_loss": -3.9425392150878906, "global_step": 3029, "epoch": 72} {"train_loss": -3.9965178966522217, "global_step": 3030, "epoch": 72} {"train_loss": -3.9123740196228027, "global_step": 3031, "epoch": 72} {"train_loss": -3.9596199989318848, "global_step": 3032, "epoch": 72} {"train_loss": -3.9129629135131836, "global_step": 3033, "epoch": 72} {"train_loss": -3.988915205001831, "global_step": 3034, "epoch": 72} {"train_loss": -3.886014938354492, "global_step": 3035, "epoch": 72} {"train_loss": -3.7660369873046875, "global_step": 3036, "epoch": 72} {"train_loss": -3.994710922241211, "global_step": 3037, "epoch": 72} {"train_loss": -3.9449219703674316, "global_step": 3038, "epoch": 72} {"train_loss": -3.8341989517211914, "global_step": 3039, "epoch": 72} {"train_loss": -3.8676068782806396, "global_step": 3040, "epoch": 72} {"train_loss": -4.004378795623779, "global_step": 3041, "epoch": 72} {"train_loss": -3.8261616230010986, "global_step": 3042, "epoch": 72} {"train_loss": -4.0329389572143555, "global_step": 3043, "epoch": 72} {"train_loss": -4.010222911834717, "global_step": 3044, "epoch": 72} {"train_loss": -4.052060127258301, "global_step": 3045, "epoch": 72} {"train_loss": -4.040436267852783, "global_step": 3046, "epoch": 72} {"train_loss": -3.990962505340576, "global_step": 3047, "epoch": 72} {"train_loss": -3.9399192333221436, "global_step": 3048, "epoch": 72} {"train_loss": -4.020325660705566, "global_step": 3049, "epoch": 72} {"train_loss": -4.017892837524414, "global_step": 3050, "epoch": 72} {"train_loss": -4.027372360229492, "global_step": 3051, "epoch": 72} {"train_loss": -3.9785408973693848, "global_step": 3052, "epoch": 72} {"train_loss": -4.037896633148193, "global_step": 3053, "epoch": 72} {"train_loss": -3.9397079944610596, "global_step": 3054, "epoch": 72} {"train_loss": -3.9517955780029297, "global_step": 3055, "epoch": 72} {"train_loss": -3.806579113006592, "global_step": 3056, "epoch": 72} {"train_loss": -3.9718103408813477, "global_step": 3057, "epoch": 72} {"train_loss": -4.073381423950195, "global_step": 3058, "epoch": 72} {"train_loss": -4.021886825561523, "global_step": 3059, "epoch": 72} {"train_loss": -3.9118893146514893, "global_step": 3060, "epoch": 72} {"train_loss": -3.833378791809082, "global_step": 3061, "epoch": 72} {"train_loss": -3.9928863048553467, "global_step": 3062, "epoch": 72} {"train_loss": -3.9074325561523438, "global_step": 3063, "epoch": 72} {"train_loss": -4.049799919128418, "global_step": 3064, "epoch": 72} {"train_loss": -3.9503286282221475, "global_step": 3065, "epoch": 72, "val_loss": 139540.671875} {"train_loss": -3.9462573528289795, "global_step": 3066, "epoch": 73} {"train_loss": -3.961530923843384, "global_step": 3067, "epoch": 73} {"train_loss": -3.8954992294311523, "global_step": 3068, "epoch": 73} {"train_loss": -4.125389099121094, "global_step": 3069, "epoch": 73} {"train_loss": -3.9123334884643555, "global_step": 3070, "epoch": 73} {"train_loss": -4.049385070800781, "global_step": 3071, "epoch": 73} {"train_loss": -4.168355941772461, "global_step": 3072, "epoch": 73} {"train_loss": -3.996311664581299, "global_step": 3073, "epoch": 73} {"train_loss": -3.9958386421203613, "global_step": 3074, "epoch": 73} {"train_loss": -4.001124382019043, "global_step": 3075, "epoch": 73} {"train_loss": -4.066054344177246, "global_step": 3076, "epoch": 73} {"train_loss": -4.095099925994873, "global_step": 3077, "epoch": 73} {"train_loss": -3.934711456298828, "global_step": 3078, "epoch": 73} {"train_loss": -3.942584753036499, "global_step": 3079, "epoch": 73} {"train_loss": -3.959249496459961, "global_step": 3080, "epoch": 73} {"train_loss": -4.049349784851074, "global_step": 3081, "epoch": 73} {"train_loss": -3.929511785507202, "global_step": 3082, "epoch": 73} {"train_loss": -3.705585479736328, "global_step": 3083, "epoch": 73} {"train_loss": -3.874837875366211, "global_step": 3084, "epoch": 73} {"train_loss": -3.9533767700195312, "global_step": 3085, "epoch": 73} {"train_loss": -4.042145729064941, "global_step": 3086, "epoch": 73} {"train_loss": -3.907883882522583, "global_step": 3087, "epoch": 73} {"train_loss": -3.9389915466308594, "global_step": 3088, "epoch": 73} {"train_loss": -4.034274101257324, "global_step": 3089, "epoch": 73} {"train_loss": -4.203852653503418, "global_step": 3090, "epoch": 73} {"train_loss": -3.828737735748291, "global_step": 3091, "epoch": 73} {"train_loss": -4.053554058074951, "global_step": 3092, "epoch": 73} {"train_loss": -4.026252746582031, "global_step": 3093, "epoch": 73} {"train_loss": -3.961264133453369, "global_step": 3094, "epoch": 73} {"train_loss": -4.093484401702881, "global_step": 3095, "epoch": 73} {"train_loss": -4.029459476470947, "global_step": 3096, "epoch": 73} {"train_loss": -4.125868797302246, "global_step": 3097, "epoch": 73} {"train_loss": -4.050002098083496, "global_step": 3098, "epoch": 73} {"train_loss": -4.122060775756836, "global_step": 3099, "epoch": 73} {"train_loss": -4.077480316162109, "global_step": 3100, "epoch": 73} {"train_loss": -3.8054306507110596, "global_step": 3101, "epoch": 73} {"train_loss": -3.971651554107666, "global_step": 3102, "epoch": 73} {"train_loss": -3.9867658615112305, "global_step": 3103, "epoch": 73} {"train_loss": -4.008586406707764, "global_step": 3104, "epoch": 73} {"train_loss": -3.989887237548828, "global_step": 3105, "epoch": 73} {"train_loss": -4.042572021484375, "global_step": 3106, "epoch": 73} {"train_loss": -3.992184939838591, "global_step": 3107, "epoch": 73, "val_loss": 135452.578125} {"train_loss": -4.051619529724121, "global_step": 3108, "epoch": 74} {"train_loss": -4.042629718780518, "global_step": 3109, "epoch": 74} {"train_loss": -4.085089683532715, "global_step": 3110, "epoch": 74} {"train_loss": -3.985743761062622, "global_step": 3111, "epoch": 74} {"train_loss": -4.058515548706055, "global_step": 3112, "epoch": 74} {"train_loss": -4.010370254516602, "global_step": 3113, "epoch": 74} {"train_loss": -3.936016082763672, "global_step": 3114, "epoch": 74} {"train_loss": -3.8485045433044434, "global_step": 3115, "epoch": 74} {"train_loss": -3.80403208732605, "global_step": 3116, "epoch": 74} {"train_loss": -3.9634652137756348, "global_step": 3117, "epoch": 74} {"train_loss": -3.9772748947143555, "global_step": 3118, "epoch": 74} {"train_loss": -3.949721097946167, "global_step": 3119, "epoch": 74} {"train_loss": -3.9488182067871094, "global_step": 3120, "epoch": 74} {"train_loss": -3.952275276184082, "global_step": 3121, "epoch": 74} {"train_loss": -3.8977534770965576, "global_step": 3122, "epoch": 74} {"train_loss": -3.7054057121276855, "global_step": 3123, "epoch": 74} {"train_loss": -3.869966506958008, "global_step": 3124, "epoch": 74} {"train_loss": -3.9738922119140625, "global_step": 3125, "epoch": 74} {"train_loss": -4.017066955566406, "global_step": 3126, "epoch": 74} {"train_loss": -3.9480223655700684, "global_step": 3127, "epoch": 74} {"train_loss": -3.852764129638672, "global_step": 3128, "epoch": 74} {"train_loss": -3.987297534942627, "global_step": 3129, "epoch": 74} {"train_loss": -3.9589195251464844, "global_step": 3130, "epoch": 74} {"train_loss": -4.009730339050293, "global_step": 3131, "epoch": 74} {"train_loss": -4.046922206878662, "global_step": 3132, "epoch": 74} {"train_loss": -4.034712791442871, "global_step": 3133, "epoch": 74} {"train_loss": -3.985581398010254, "global_step": 3134, "epoch": 74} {"train_loss": -3.841439962387085, "global_step": 3135, "epoch": 74} {"train_loss": -4.051758766174316, "global_step": 3136, "epoch": 74} {"train_loss": -3.9007530212402344, "global_step": 3137, "epoch": 74} {"train_loss": -3.7715134620666504, "global_step": 3138, "epoch": 74} {"train_loss": -3.967479705810547, "global_step": 3139, "epoch": 74} {"train_loss": -3.677100658416748, "global_step": 3140, "epoch": 74} {"train_loss": -3.873991012573242, "global_step": 3141, "epoch": 74} {"train_loss": -3.8797590732574463, "global_step": 3142, "epoch": 74} {"train_loss": -3.917156934738159, "global_step": 3143, "epoch": 74} {"train_loss": -4.0671844482421875, "global_step": 3144, "epoch": 74} {"train_loss": -3.9635543823242188, "global_step": 3145, "epoch": 74} {"train_loss": -4.013951301574707, "global_step": 3146, "epoch": 74} {"train_loss": -4.014749526977539, "global_step": 3147, "epoch": 74} {"train_loss": -4.055495262145996, "global_step": 3148, "epoch": 74} {"train_loss": -3.949618725549607, "global_step": 3149, "epoch": 74, "val_loss": 133308.03125} {"train_loss": -4.0338029861450195, "global_step": 3150, "epoch": 75} {"train_loss": -3.9961957931518555, "global_step": 3151, "epoch": 75} {"train_loss": -4.074831962585449, "global_step": 3152, "epoch": 75} {"train_loss": -4.006293296813965, "global_step": 3153, "epoch": 75} {"train_loss": -3.919753313064575, "global_step": 3154, "epoch": 75} {"train_loss": -3.993157386779785, "global_step": 3155, "epoch": 75} {"train_loss": -4.2120208740234375, "global_step": 3156, "epoch": 75} {"train_loss": -3.932507038116455, "global_step": 3157, "epoch": 75} {"train_loss": -4.117865562438965, "global_step": 3158, "epoch": 75} {"train_loss": -3.94543194770813, "global_step": 3159, "epoch": 75} {"train_loss": -4.021566867828369, "global_step": 3160, "epoch": 75} {"train_loss": -4.17045783996582, "global_step": 3161, "epoch": 75} {"train_loss": -4.035365104675293, "global_step": 3162, "epoch": 75} {"train_loss": -4.085943222045898, "global_step": 3163, "epoch": 75} {"train_loss": -3.9741413593292236, "global_step": 3164, "epoch": 75} {"train_loss": -3.847297191619873, "global_step": 3165, "epoch": 75} {"train_loss": -3.940390110015869, "global_step": 3166, "epoch": 75} {"train_loss": -3.9782156944274902, "global_step": 3167, "epoch": 75} {"train_loss": -3.912752151489258, "global_step": 3168, "epoch": 75} {"train_loss": -3.7253053188323975, "global_step": 3169, "epoch": 75} {"train_loss": -4.079072952270508, "global_step": 3170, "epoch": 75} {"train_loss": -3.615340232849121, "global_step": 3171, "epoch": 75} {"train_loss": -3.6492719650268555, "global_step": 3172, "epoch": 75} {"train_loss": -3.9802136421203613, "global_step": 3173, "epoch": 75} {"train_loss": -3.916095733642578, "global_step": 3174, "epoch": 75} {"train_loss": -3.897524356842041, "global_step": 3175, "epoch": 75} {"train_loss": -4.017502784729004, "global_step": 3176, "epoch": 75} {"train_loss": -3.8479669094085693, "global_step": 3177, "epoch": 75} {"train_loss": -3.9861092567443848, "global_step": 3178, "epoch": 75} {"train_loss": -3.9308438301086426, "global_step": 3179, "epoch": 75} {"train_loss": -3.8494796752929688, "global_step": 3180, "epoch": 75} {"train_loss": -3.974642753601074, "global_step": 3181, "epoch": 75} {"train_loss": -3.915492534637451, "global_step": 3182, "epoch": 75} {"train_loss": -4.1412858963012695, "global_step": 3183, "epoch": 75} {"train_loss": -3.790132761001587, "global_step": 3184, "epoch": 75} {"train_loss": -4.06717586517334, "global_step": 3185, "epoch": 75} {"train_loss": -3.8583168983459473, "global_step": 3186, "epoch": 75} {"train_loss": -3.980591058731079, "global_step": 3187, "epoch": 75} {"train_loss": -3.9153199195861816, "global_step": 3188, "epoch": 75} {"train_loss": -3.9573006629943848, "global_step": 3189, "epoch": 75} {"train_loss": -3.8125946521759033, "global_step": 3190, "epoch": 75} {"train_loss": -3.9520396902447654, "global_step": 3191, "epoch": 75, "val_loss": 131491.40625} {"train_loss": -4.055720806121826, "global_step": 3192, "epoch": 76} {"train_loss": -3.98148512840271, "global_step": 3193, "epoch": 76} {"train_loss": -3.93198299407959, "global_step": 3194, "epoch": 76} {"train_loss": -3.9142017364501953, "global_step": 3195, "epoch": 76} {"train_loss": -3.966259717941284, "global_step": 3196, "epoch": 76} {"train_loss": -3.9562792778015137, "global_step": 3197, "epoch": 76} {"train_loss": -3.8601160049438477, "global_step": 3198, "epoch": 76} {"train_loss": -3.9194791316986084, "global_step": 3199, "epoch": 76} {"train_loss": -4.041529178619385, "global_step": 3200, "epoch": 76} {"train_loss": -4.075292587280273, "global_step": 3201, "epoch": 76} {"train_loss": -3.9465274810791016, "global_step": 3202, "epoch": 76} {"train_loss": -4.1109395027160645, "global_step": 3203, "epoch": 76} {"train_loss": -3.9290027618408203, "global_step": 3204, "epoch": 76} {"train_loss": -4.070918560028076, "global_step": 3205, "epoch": 76} {"train_loss": -4.164946556091309, "global_step": 3206, "epoch": 76} {"train_loss": -4.070449352264404, "global_step": 3207, "epoch": 76} {"train_loss": -4.205456733703613, "global_step": 3208, "epoch": 76} {"train_loss": -4.075957775115967, "global_step": 3209, "epoch": 76} {"train_loss": -4.027679443359375, "global_step": 3210, "epoch": 76} {"train_loss": -4.113796234130859, "global_step": 3211, "epoch": 76} {"train_loss": -4.150592803955078, "global_step": 3212, "epoch": 76} {"train_loss": -4.094755172729492, "global_step": 3213, "epoch": 76} {"train_loss": -4.214069366455078, "global_step": 3214, "epoch": 76} {"train_loss": -4.058274745941162, "global_step": 3215, "epoch": 76} {"train_loss": -3.97202730178833, "global_step": 3216, "epoch": 76} {"train_loss": -4.039366245269775, "global_step": 3217, "epoch": 76} {"train_loss": -4.087392807006836, "global_step": 3218, "epoch": 76} {"train_loss": -4.320106506347656, "global_step": 3219, "epoch": 76} {"train_loss": -3.9321389198303223, "global_step": 3220, "epoch": 76} {"train_loss": -3.9058609008789062, "global_step": 3221, "epoch": 76} {"train_loss": -3.913559913635254, "global_step": 3222, "epoch": 76} {"train_loss": -4.133917808532715, "global_step": 3223, "epoch": 76} {"train_loss": -4.0879740715026855, "global_step": 3224, "epoch": 76} {"train_loss": -3.666311740875244, "global_step": 3225, "epoch": 76} {"train_loss": -3.936828136444092, "global_step": 3226, "epoch": 76} {"train_loss": -4.234239101409912, "global_step": 3227, "epoch": 76} {"train_loss": -3.918590545654297, "global_step": 3228, "epoch": 76} {"train_loss": -3.9691150188446045, "global_step": 3229, "epoch": 76} {"train_loss": -3.8959076404571533, "global_step": 3230, "epoch": 76} {"train_loss": -4.117583751678467, "global_step": 3231, "epoch": 76} {"train_loss": -3.8129239082336426, "global_step": 3232, "epoch": 76} {"train_loss": -4.014921262150719, "global_step": 3233, "epoch": 76, "val_loss": 129305.8515625} {"train_loss": -4.005208969116211, "global_step": 3234, "epoch": 77} {"train_loss": -3.7904765605926514, "global_step": 3235, "epoch": 77} {"train_loss": -3.9411439895629883, "global_step": 3236, "epoch": 77} {"train_loss": -3.914168357849121, "global_step": 3237, "epoch": 77} {"train_loss": -3.671215057373047, "global_step": 3238, "epoch": 77} {"train_loss": -3.876006603240967, "global_step": 3239, "epoch": 77} {"train_loss": -3.6278223991394043, "global_step": 3240, "epoch": 77} {"train_loss": -4.083389759063721, "global_step": 3241, "epoch": 77} {"train_loss": -3.53647518157959, "global_step": 3242, "epoch": 77} {"train_loss": -4.131684303283691, "global_step": 3243, "epoch": 77} {"train_loss": -3.6264822483062744, "global_step": 3244, "epoch": 77} {"train_loss": -3.907782793045044, "global_step": 3245, "epoch": 77} {"train_loss": -3.7689261436462402, "global_step": 3246, "epoch": 77} {"train_loss": -3.965820789337158, "global_step": 3247, "epoch": 77} {"train_loss": -3.7031025886535645, "global_step": 3248, "epoch": 77} {"train_loss": -4.019801616668701, "global_step": 3249, "epoch": 77} {"train_loss": -3.8751068115234375, "global_step": 3250, "epoch": 77} {"train_loss": -4.152965545654297, "global_step": 3251, "epoch": 77} {"train_loss": -3.8517303466796875, "global_step": 3252, "epoch": 77} {"train_loss": -4.01154899597168, "global_step": 3253, "epoch": 77} {"train_loss": -3.8748972415924072, "global_step": 3254, "epoch": 77} {"train_loss": -3.9087042808532715, "global_step": 3255, "epoch": 77} {"train_loss": -3.9937210083007812, "global_step": 3256, "epoch": 77} {"train_loss": -4.164322853088379, "global_step": 3257, "epoch": 77} {"train_loss": -3.846163034439087, "global_step": 3258, "epoch": 77} {"train_loss": -4.134648323059082, "global_step": 3259, "epoch": 77} {"train_loss": -4.001852035522461, "global_step": 3260, "epoch": 77} {"train_loss": -4.015891075134277, "global_step": 3261, "epoch": 77} {"train_loss": -3.8864569664001465, "global_step": 3262, "epoch": 77} {"train_loss": -3.9724183082580566, "global_step": 3263, "epoch": 77} {"train_loss": -3.9697628021240234, "global_step": 3264, "epoch": 77} {"train_loss": -4.06719970703125, "global_step": 3265, "epoch": 77} {"train_loss": -3.9447669982910156, "global_step": 3266, "epoch": 77} {"train_loss": -4.117793560028076, "global_step": 3267, "epoch": 77} {"train_loss": -3.974233627319336, "global_step": 3268, "epoch": 77} {"train_loss": -4.030791759490967, "global_step": 3269, "epoch": 77} {"train_loss": -4.137136459350586, "global_step": 3270, "epoch": 77} {"train_loss": -4.00092887878418, "global_step": 3271, "epoch": 77} {"train_loss": -4.070132732391357, "global_step": 3272, "epoch": 77} {"train_loss": -4.111991882324219, "global_step": 3273, "epoch": 77} {"train_loss": -3.84537935256958, "global_step": 3274, "epoch": 77} {"train_loss": -3.945784574463254, "global_step": 3275, "epoch": 77, "val_loss": 126824.2109375} {"train_loss": -4.018515110015869, "global_step": 3276, "epoch": 78} {"train_loss": -3.8724498748779297, "global_step": 3277, "epoch": 78} {"train_loss": -4.196440696716309, "global_step": 3278, "epoch": 78} {"train_loss": -3.9150309562683105, "global_step": 3279, "epoch": 78} {"train_loss": -4.029182434082031, "global_step": 3280, "epoch": 78} {"train_loss": -3.935068368911743, "global_step": 3281, "epoch": 78} {"train_loss": -3.930319309234619, "global_step": 3282, "epoch": 78} {"train_loss": -4.061885833740234, "global_step": 3283, "epoch": 78} {"train_loss": -3.993695020675659, "global_step": 3284, "epoch": 78} {"train_loss": -4.162878036499023, "global_step": 3285, "epoch": 78} {"train_loss": -4.1152777671813965, "global_step": 3286, "epoch": 78} {"train_loss": -3.9559152126312256, "global_step": 3287, "epoch": 78} {"train_loss": -4.053289413452148, "global_step": 3288, "epoch": 78} {"train_loss": -4.080019474029541, "global_step": 3289, "epoch": 78} {"train_loss": -4.082671165466309, "global_step": 3290, "epoch": 78} {"train_loss": -4.130497932434082, "global_step": 3291, "epoch": 78} {"train_loss": -4.049857139587402, "global_step": 3292, "epoch": 78} {"train_loss": -3.939230442047119, "global_step": 3293, "epoch": 78} {"train_loss": -4.054421424865723, "global_step": 3294, "epoch": 78} {"train_loss": -4.134000778198242, "global_step": 3295, "epoch": 78} {"train_loss": -4.204388618469238, "global_step": 3296, "epoch": 78} {"train_loss": -4.227297306060791, "global_step": 3297, "epoch": 78} {"train_loss": -4.132565021514893, "global_step": 3298, "epoch": 78} {"train_loss": -4.241996765136719, "global_step": 3299, "epoch": 78} {"train_loss": -3.9646716117858887, "global_step": 3300, "epoch": 78} {"train_loss": -3.975127696990967, "global_step": 3301, "epoch": 78} {"train_loss": -4.095233917236328, "global_step": 3302, "epoch": 78} {"train_loss": -4.200631618499756, "global_step": 3303, "epoch": 78} {"train_loss": -4.056845664978027, "global_step": 3304, "epoch": 78} {"train_loss": -3.9196267127990723, "global_step": 3305, "epoch": 78} {"train_loss": -3.89577579498291, "global_step": 3306, "epoch": 78} {"train_loss": -4.123556137084961, "global_step": 3307, "epoch": 78} {"train_loss": -4.128475189208984, "global_step": 3308, "epoch": 78} {"train_loss": -3.8644919395446777, "global_step": 3309, "epoch": 78} {"train_loss": -3.9316699504852295, "global_step": 3310, "epoch": 78} {"train_loss": -3.908803939819336, "global_step": 3311, "epoch": 78} {"train_loss": -4.219877243041992, "global_step": 3312, "epoch": 78} {"train_loss": -3.92655348777771, "global_step": 3313, "epoch": 78} {"train_loss": -4.10717248916626, "global_step": 3314, "epoch": 78} {"train_loss": -4.0503106117248535, "global_step": 3315, "epoch": 78} {"train_loss": -4.046314239501953, "global_step": 3316, "epoch": 78} {"train_loss": -4.046250553358169, "global_step": 3317, "epoch": 78, "val_loss": 127802.625} {"train_loss": -3.88511061668396, "global_step": 3318, "epoch": 79} {"train_loss": -4.06916618347168, "global_step": 3319, "epoch": 79} {"train_loss": -4.08151388168335, "global_step": 3320, "epoch": 79} {"train_loss": -4.049228668212891, "global_step": 3321, "epoch": 79} {"train_loss": -3.9642066955566406, "global_step": 3322, "epoch": 79} {"train_loss": -4.016162872314453, "global_step": 3323, "epoch": 79} {"train_loss": -3.981778144836426, "global_step": 3324, "epoch": 79} {"train_loss": -3.979215145111084, "global_step": 3325, "epoch": 79} {"train_loss": -4.098331451416016, "global_step": 3326, "epoch": 79} {"train_loss": -4.0843095779418945, "global_step": 3327, "epoch": 79} {"train_loss": -3.9809153079986572, "global_step": 3328, "epoch": 79} {"train_loss": -4.106108665466309, "global_step": 3329, "epoch": 79} {"train_loss": -4.046548366546631, "global_step": 3330, "epoch": 79} {"train_loss": -4.039052486419678, "global_step": 3331, "epoch": 79} {"train_loss": -3.893833875656128, "global_step": 3332, "epoch": 79} {"train_loss": -4.075329780578613, "global_step": 3333, "epoch": 79} {"train_loss": -3.994584560394287, "global_step": 3334, "epoch": 79} {"train_loss": -3.9101200103759766, "global_step": 3335, "epoch": 79} {"train_loss": -4.202027320861816, "global_step": 3336, "epoch": 79} {"train_loss": -3.9114699363708496, "global_step": 3337, "epoch": 79} {"train_loss": -4.0630574226379395, "global_step": 3338, "epoch": 79} {"train_loss": -4.162685394287109, "global_step": 3339, "epoch": 79} {"train_loss": -4.02602481842041, "global_step": 3340, "epoch": 79} {"train_loss": -4.1110124588012695, "global_step": 3341, "epoch": 79} {"train_loss": -3.9242255687713623, "global_step": 3342, "epoch": 79} {"train_loss": -4.249059677124023, "global_step": 3343, "epoch": 79} {"train_loss": -4.113401412963867, "global_step": 3344, "epoch": 79} {"train_loss": -4.146541595458984, "global_step": 3345, "epoch": 79} {"train_loss": -3.988832950592041, "global_step": 3346, "epoch": 79} {"train_loss": -4.30755615234375, "global_step": 3347, "epoch": 79} {"train_loss": -4.104250907897949, "global_step": 3348, "epoch": 79} {"train_loss": -4.195232391357422, "global_step": 3349, "epoch": 79} {"train_loss": -4.228885173797607, "global_step": 3350, "epoch": 79} {"train_loss": -4.157020568847656, "global_step": 3351, "epoch": 79} {"train_loss": -4.077071666717529, "global_step": 3352, "epoch": 79} {"train_loss": -4.227356910705566, "global_step": 3353, "epoch": 79} {"train_loss": -4.208805084228516, "global_step": 3354, "epoch": 79} {"train_loss": -4.229629993438721, "global_step": 3355, "epoch": 79} {"train_loss": -4.02486515045166, "global_step": 3356, "epoch": 79} {"train_loss": -4.029874801635742, "global_step": 3357, "epoch": 79} {"train_loss": -4.199333190917969, "global_step": 3358, "epoch": 79} {"train_loss": -4.074335058530171, "global_step": 3359, "epoch": 79, "val_loss": 123033.9375} {"train_loss": -4.042778968811035, "global_step": 3360, "epoch": 80} {"train_loss": -4.161262512207031, "global_step": 3361, "epoch": 80} {"train_loss": -4.235741138458252, "global_step": 3362, "epoch": 80} {"train_loss": -4.1777191162109375, "global_step": 3363, "epoch": 80} {"train_loss": -4.159646987915039, "global_step": 3364, "epoch": 80} {"train_loss": -4.1283063888549805, "global_step": 3365, "epoch": 80} {"train_loss": -4.076358318328857, "global_step": 3366, "epoch": 80} {"train_loss": -3.9881322383880615, "global_step": 3367, "epoch": 80} {"train_loss": -4.012452125549316, "global_step": 3368, "epoch": 80} {"train_loss": -4.1210126876831055, "global_step": 3369, "epoch": 80} {"train_loss": -4.186110019683838, "global_step": 3370, "epoch": 80} {"train_loss": -4.165016174316406, "global_step": 3371, "epoch": 80} {"train_loss": -4.257584571838379, "global_step": 3372, "epoch": 80} {"train_loss": -4.099391460418701, "global_step": 3373, "epoch": 80} {"train_loss": -4.042693138122559, "global_step": 3374, "epoch": 80} {"train_loss": -3.973447799682617, "global_step": 3375, "epoch": 80} {"train_loss": -4.163621425628662, "global_step": 3376, "epoch": 80} {"train_loss": -4.14268159866333, "global_step": 3377, "epoch": 80} {"train_loss": -4.139629364013672, "global_step": 3378, "epoch": 80} {"train_loss": -4.010841369628906, "global_step": 3379, "epoch": 80} {"train_loss": -4.067901611328125, "global_step": 3380, "epoch": 80} {"train_loss": -3.873246669769287, "global_step": 3381, "epoch": 80} {"train_loss": -3.668912410736084, "global_step": 3382, "epoch": 80} {"train_loss": -3.9030885696411133, "global_step": 3383, "epoch": 80} {"train_loss": -3.6171715259552, "global_step": 3384, "epoch": 80} {"train_loss": -3.9358677864074707, "global_step": 3385, "epoch": 80} {"train_loss": -3.569643497467041, "global_step": 3386, "epoch": 80} {"train_loss": -3.925657272338867, "global_step": 3387, "epoch": 80} {"train_loss": -3.8122565746307373, "global_step": 3388, "epoch": 80} {"train_loss": -3.898871660232544, "global_step": 3389, "epoch": 80} {"train_loss": -3.974421977996826, "global_step": 3390, "epoch": 80} {"train_loss": -3.905322551727295, "global_step": 3391, "epoch": 80} {"train_loss": -3.546724557876587, "global_step": 3392, "epoch": 80} {"train_loss": -3.8906829357147217, "global_step": 3393, "epoch": 80} {"train_loss": -3.8599560260772705, "global_step": 3394, "epoch": 80} {"train_loss": -3.9208035469055176, "global_step": 3395, "epoch": 80} {"train_loss": -4.052665710449219, "global_step": 3396, "epoch": 80} {"train_loss": -3.9484410285949707, "global_step": 3397, "epoch": 80} {"train_loss": -3.9662749767303467, "global_step": 3398, "epoch": 80} {"train_loss": -4.204146862030029, "global_step": 3399, "epoch": 80} {"train_loss": -3.9141852855682373, "global_step": 3400, "epoch": 80} {"train_loss": -3.9915928954169866, "global_step": 3401, "epoch": 80, "val_loss": 122907.875} {"train_loss": -3.9223265647888184, "global_step": 3402, "epoch": 81} {"train_loss": -3.9603748321533203, "global_step": 3403, "epoch": 81} {"train_loss": -3.99210786819458, "global_step": 3404, "epoch": 81} {"train_loss": -3.985623836517334, "global_step": 3405, "epoch": 81} {"train_loss": -3.9892489910125732, "global_step": 3406, "epoch": 81} {"train_loss": -4.0224785804748535, "global_step": 3407, "epoch": 81} {"train_loss": -4.02047061920166, "global_step": 3408, "epoch": 81} {"train_loss": -4.062610626220703, "global_step": 3409, "epoch": 81} {"train_loss": -4.058834075927734, "global_step": 3410, "epoch": 81} {"train_loss": -4.020637512207031, "global_step": 3411, "epoch": 81} {"train_loss": -4.022987365722656, "global_step": 3412, "epoch": 81} {"train_loss": -4.162511825561523, "global_step": 3413, "epoch": 81} {"train_loss": -3.960456371307373, "global_step": 3414, "epoch": 81} {"train_loss": -4.11213493347168, "global_step": 3415, "epoch": 81} {"train_loss": -4.140113830566406, "global_step": 3416, "epoch": 81} {"train_loss": -3.9845948219299316, "global_step": 3417, "epoch": 81} {"train_loss": -4.184126377105713, "global_step": 3418, "epoch": 81} {"train_loss": -4.1973090171813965, "global_step": 3419, "epoch": 81} {"train_loss": -4.2163190841674805, "global_step": 3420, "epoch": 81} {"train_loss": -4.144619941711426, "global_step": 3421, "epoch": 81} {"train_loss": -4.222184658050537, "global_step": 3422, "epoch": 81} {"train_loss": -4.124863624572754, "global_step": 3423, "epoch": 81} {"train_loss": -4.035003662109375, "global_step": 3424, "epoch": 81} {"train_loss": -4.140679359436035, "global_step": 3425, "epoch": 81} {"train_loss": -4.108447074890137, "global_step": 3426, "epoch": 81} {"train_loss": -3.9325859546661377, "global_step": 3427, "epoch": 81} {"train_loss": -4.0430450439453125, "global_step": 3428, "epoch": 81} {"train_loss": -4.217868804931641, "global_step": 3429, "epoch": 81} {"train_loss": -4.132445335388184, "global_step": 3430, "epoch": 81} {"train_loss": -4.095946788787842, "global_step": 3431, "epoch": 81} {"train_loss": -4.2291717529296875, "global_step": 3432, "epoch": 81} {"train_loss": -4.170886993408203, "global_step": 3433, "epoch": 81} {"train_loss": -4.083150863647461, "global_step": 3434, "epoch": 81} {"train_loss": -4.057250499725342, "global_step": 3435, "epoch": 81} {"train_loss": -4.055700778961182, "global_step": 3436, "epoch": 81} {"train_loss": -4.041723251342773, "global_step": 3437, "epoch": 81} {"train_loss": -4.036910057067871, "global_step": 3438, "epoch": 81} {"train_loss": -4.084874153137207, "global_step": 3439, "epoch": 81} {"train_loss": -3.9991159439086914, "global_step": 3440, "epoch": 81} {"train_loss": -4.074037551879883, "global_step": 3441, "epoch": 81} {"train_loss": -4.22701358795166, "global_step": 3442, "epoch": 81} {"train_loss": -4.082397086279733, "global_step": 3443, "epoch": 81, "val_loss": 121414.5546875} {"train_loss": -4.009549617767334, "global_step": 3444, "epoch": 82} {"train_loss": -4.2880048751831055, "global_step": 3445, "epoch": 82} {"train_loss": -4.151558876037598, "global_step": 3446, "epoch": 82} {"train_loss": -4.147979259490967, "global_step": 3447, "epoch": 82} {"train_loss": -4.110997676849365, "global_step": 3448, "epoch": 82} {"train_loss": -4.245325088500977, "global_step": 3449, "epoch": 82} {"train_loss": -4.194520950317383, "global_step": 3450, "epoch": 82} {"train_loss": -4.197735786437988, "global_step": 3451, "epoch": 82} {"train_loss": -4.176000118255615, "global_step": 3452, "epoch": 82} {"train_loss": -4.229892253875732, "global_step": 3453, "epoch": 82} {"train_loss": -4.335641384124756, "global_step": 3454, "epoch": 82} {"train_loss": -4.191712379455566, "global_step": 3455, "epoch": 82} {"train_loss": -4.126180171966553, "global_step": 3456, "epoch": 82} {"train_loss": -4.299287796020508, "global_step": 3457, "epoch": 82} {"train_loss": -4.261994361877441, "global_step": 3458, "epoch": 82} {"train_loss": -4.318987846374512, "global_step": 3459, "epoch": 82} {"train_loss": -4.271952152252197, "global_step": 3460, "epoch": 82} {"train_loss": -4.201053619384766, "global_step": 3461, "epoch": 82} {"train_loss": -4.01927375793457, "global_step": 3462, "epoch": 82} {"train_loss": -3.926802635192871, "global_step": 3463, "epoch": 82} {"train_loss": -4.072063446044922, "global_step": 3464, "epoch": 82} {"train_loss": -4.243454933166504, "global_step": 3465, "epoch": 82} {"train_loss": -3.7109718322753906, "global_step": 3466, "epoch": 82} {"train_loss": -3.5736405849456787, "global_step": 3467, "epoch": 82} {"train_loss": -4.176344394683838, "global_step": 3468, "epoch": 82} {"train_loss": -4.007531642913818, "global_step": 3469, "epoch": 82} {"train_loss": -3.6983225345611572, "global_step": 3470, "epoch": 82} {"train_loss": -4.158333778381348, "global_step": 3471, "epoch": 82} {"train_loss": -4.149573802947998, "global_step": 3472, "epoch": 82} {"train_loss": -3.894286632537842, "global_step": 3473, "epoch": 82} {"train_loss": -4.059409141540527, "global_step": 3474, "epoch": 82} {"train_loss": -3.9610486030578613, "global_step": 3475, "epoch": 82} {"train_loss": -4.005093097686768, "global_step": 3476, "epoch": 82} {"train_loss": -3.9259705543518066, "global_step": 3477, "epoch": 82} {"train_loss": -4.015643119812012, "global_step": 3478, "epoch": 82} {"train_loss": -4.113905906677246, "global_step": 3479, "epoch": 82} {"train_loss": -4.01286506652832, "global_step": 3480, "epoch": 82} {"train_loss": -4.015689849853516, "global_step": 3481, "epoch": 82} {"train_loss": -4.1013031005859375, "global_step": 3482, "epoch": 82} {"train_loss": -3.9613165855407715, "global_step": 3483, "epoch": 82} {"train_loss": -4.200954437255859, "global_step": 3484, "epoch": 82} {"train_loss": -4.088260105678013, "global_step": 3485, "epoch": 82, "val_loss": 121118.5390625} {"train_loss": -4.088737964630127, "global_step": 3486, "epoch": 83} {"train_loss": -4.003265380859375, "global_step": 3487, "epoch": 83} {"train_loss": -4.098137378692627, "global_step": 3488, "epoch": 83} {"train_loss": -4.020280838012695, "global_step": 3489, "epoch": 83} {"train_loss": -4.014884948730469, "global_step": 3490, "epoch": 83} {"train_loss": -3.9730873107910156, "global_step": 3491, "epoch": 83} {"train_loss": -4.238585948944092, "global_step": 3492, "epoch": 83} {"train_loss": -4.17880916595459, "global_step": 3493, "epoch": 83} {"train_loss": -4.1822333335876465, "global_step": 3494, "epoch": 83} {"train_loss": -4.107954025268555, "global_step": 3495, "epoch": 83} {"train_loss": -4.075406074523926, "global_step": 3496, "epoch": 83} {"train_loss": -4.112863540649414, "global_step": 3497, "epoch": 83} {"train_loss": -4.219777584075928, "global_step": 3498, "epoch": 83} {"train_loss": -4.315329074859619, "global_step": 3499, "epoch": 83} {"train_loss": -4.258900165557861, "global_step": 3500, "epoch": 83} {"train_loss": -4.0745849609375, "global_step": 3501, "epoch": 83} {"train_loss": -4.179476737976074, "global_step": 3502, "epoch": 83} {"train_loss": -4.093613624572754, "global_step": 3503, "epoch": 83} {"train_loss": -4.194691181182861, "global_step": 3504, "epoch": 83} {"train_loss": -4.025177478790283, "global_step": 3505, "epoch": 83} {"train_loss": -4.209407806396484, "global_step": 3506, "epoch": 83} {"train_loss": -4.25809383392334, "global_step": 3507, "epoch": 83} {"train_loss": -4.121734619140625, "global_step": 3508, "epoch": 83} {"train_loss": -4.125276565551758, "global_step": 3509, "epoch": 83} {"train_loss": -4.078425884246826, "global_step": 3510, "epoch": 83} {"train_loss": -4.08855676651001, "global_step": 3511, "epoch": 83} {"train_loss": -4.272774696350098, "global_step": 3512, "epoch": 83} {"train_loss": -4.014230251312256, "global_step": 3513, "epoch": 83} {"train_loss": -4.117157459259033, "global_step": 3514, "epoch": 83} {"train_loss": -4.18151330947876, "global_step": 3515, "epoch": 83} {"train_loss": -4.223257064819336, "global_step": 3516, "epoch": 83} {"train_loss": -3.9931788444519043, "global_step": 3517, "epoch": 83} {"train_loss": -4.2058305740356445, "global_step": 3518, "epoch": 83} {"train_loss": -4.19663143157959, "global_step": 3519, "epoch": 83} {"train_loss": -4.153227806091309, "global_step": 3520, "epoch": 83} {"train_loss": -4.189882278442383, "global_step": 3521, "epoch": 83} {"train_loss": -4.044919013977051, "global_step": 3522, "epoch": 83} {"train_loss": -4.26453971862793, "global_step": 3523, "epoch": 83} {"train_loss": -4.320791244506836, "global_step": 3524, "epoch": 83} {"train_loss": -4.110983848571777, "global_step": 3525, "epoch": 83} {"train_loss": -4.18394136428833, "global_step": 3526, "epoch": 83} {"train_loss": -4.144416604723249, "global_step": 3527, "epoch": 83, "val_loss": 117508.0546875} {"train_loss": -4.004143714904785, "global_step": 3528, "epoch": 84} {"train_loss": -4.044919013977051, "global_step": 3529, "epoch": 84} {"train_loss": -4.0918684005737305, "global_step": 3530, "epoch": 84} {"train_loss": -4.06821346282959, "global_step": 3531, "epoch": 84} {"train_loss": -4.112558841705322, "global_step": 3532, "epoch": 84} {"train_loss": -4.064052581787109, "global_step": 3533, "epoch": 84} {"train_loss": -3.8487002849578857, "global_step": 3534, "epoch": 84} {"train_loss": -4.091838836669922, "global_step": 3535, "epoch": 84} {"train_loss": -4.044529914855957, "global_step": 3536, "epoch": 84} {"train_loss": -3.7751355171203613, "global_step": 3537, "epoch": 84} {"train_loss": -3.9321718215942383, "global_step": 3538, "epoch": 84} {"train_loss": -4.009291648864746, "global_step": 3539, "epoch": 84} {"train_loss": -4.195348262786865, "global_step": 3540, "epoch": 84} {"train_loss": -3.827082633972168, "global_step": 3541, "epoch": 84} {"train_loss": -4.263552188873291, "global_step": 3542, "epoch": 84} {"train_loss": -3.853893280029297, "global_step": 3543, "epoch": 84} {"train_loss": -3.979656457901001, "global_step": 3544, "epoch": 84} {"train_loss": -4.117541313171387, "global_step": 3545, "epoch": 84} {"train_loss": -4.051358222961426, "global_step": 3546, "epoch": 84} {"train_loss": -4.024519443511963, "global_step": 3547, "epoch": 84} {"train_loss": -4.0578203201293945, "global_step": 3548, "epoch": 84} {"train_loss": -4.197124004364014, "global_step": 3549, "epoch": 84} {"train_loss": -4.0345354080200195, "global_step": 3550, "epoch": 84} {"train_loss": -4.251463413238525, "global_step": 3551, "epoch": 84} {"train_loss": -3.9070792198181152, "global_step": 3552, "epoch": 84} {"train_loss": -4.203168869018555, "global_step": 3553, "epoch": 84} {"train_loss": -4.120594024658203, "global_step": 3554, "epoch": 84} {"train_loss": -4.250322341918945, "global_step": 3555, "epoch": 84} {"train_loss": -4.253622055053711, "global_step": 3556, "epoch": 84} {"train_loss": -3.993011236190796, "global_step": 3557, "epoch": 84} {"train_loss": -4.176633834838867, "global_step": 3558, "epoch": 84} {"train_loss": -4.035701274871826, "global_step": 3559, "epoch": 84} {"train_loss": -4.154473781585693, "global_step": 3560, "epoch": 84} {"train_loss": -4.115874767303467, "global_step": 3561, "epoch": 84} {"train_loss": -4.266820907592773, "global_step": 3562, "epoch": 84} {"train_loss": -4.048323631286621, "global_step": 3563, "epoch": 84} {"train_loss": -4.149679183959961, "global_step": 3564, "epoch": 84} {"train_loss": -4.214323997497559, "global_step": 3565, "epoch": 84} {"train_loss": -4.184284687042236, "global_step": 3566, "epoch": 84} {"train_loss": -4.231622695922852, "global_step": 3567, "epoch": 84} {"train_loss": -4.363809585571289, "global_step": 3568, "epoch": 84} {"train_loss": -4.09011025088174, "global_step": 3569, "epoch": 84, "val_loss": 113725.0390625} {"train_loss": -4.242971420288086, "global_step": 3570, "epoch": 85} {"train_loss": -4.073326110839844, "global_step": 3571, "epoch": 85} {"train_loss": -4.194702625274658, "global_step": 3572, "epoch": 85} {"train_loss": -4.309661865234375, "global_step": 3573, "epoch": 85} {"train_loss": -4.252180576324463, "global_step": 3574, "epoch": 85} {"train_loss": -4.174397945404053, "global_step": 3575, "epoch": 85} {"train_loss": -4.319876670837402, "global_step": 3576, "epoch": 85} {"train_loss": -4.396097660064697, "global_step": 3577, "epoch": 85} {"train_loss": -4.374841690063477, "global_step": 3578, "epoch": 85} {"train_loss": -4.042810440063477, "global_step": 3579, "epoch": 85} {"train_loss": -4.077533721923828, "global_step": 3580, "epoch": 85} {"train_loss": -4.196812629699707, "global_step": 3581, "epoch": 85} {"train_loss": -4.241095542907715, "global_step": 3582, "epoch": 85} {"train_loss": -4.185697555541992, "global_step": 3583, "epoch": 85} {"train_loss": -4.101305961608887, "global_step": 3584, "epoch": 85} {"train_loss": -4.137448787689209, "global_step": 3585, "epoch": 85} {"train_loss": -4.120995998382568, "global_step": 3586, "epoch": 85} {"train_loss": -3.9374961853027344, "global_step": 3587, "epoch": 85} {"train_loss": -4.280453681945801, "global_step": 3588, "epoch": 85} {"train_loss": -4.263622283935547, "global_step": 3589, "epoch": 85} {"train_loss": -4.149466037750244, "global_step": 3590, "epoch": 85} {"train_loss": -4.041147708892822, "global_step": 3591, "epoch": 85} {"train_loss": -4.095254898071289, "global_step": 3592, "epoch": 85} {"train_loss": -4.128582000732422, "global_step": 3593, "epoch": 85} {"train_loss": -3.9321508407592773, "global_step": 3594, "epoch": 85} {"train_loss": -4.003878593444824, "global_step": 3595, "epoch": 85} {"train_loss": -4.092278480529785, "global_step": 3596, "epoch": 85} {"train_loss": -4.199902534484863, "global_step": 3597, "epoch": 85} {"train_loss": -3.8410239219665527, "global_step": 3598, "epoch": 85} {"train_loss": -4.134471893310547, "global_step": 3599, "epoch": 85} {"train_loss": -3.8148388862609863, "global_step": 3600, "epoch": 85} {"train_loss": -4.231396675109863, "global_step": 3601, "epoch": 85} {"train_loss": -3.9707980155944824, "global_step": 3602, "epoch": 85} {"train_loss": -4.077549934387207, "global_step": 3603, "epoch": 85} {"train_loss": -4.24675989151001, "global_step": 3604, "epoch": 85} {"train_loss": -3.858773708343506, "global_step": 3605, "epoch": 85} {"train_loss": -4.303360939025879, "global_step": 3606, "epoch": 85} {"train_loss": -4.055797576904297, "global_step": 3607, "epoch": 85} {"train_loss": -4.041937351226807, "global_step": 3608, "epoch": 85} {"train_loss": -4.050158977508545, "global_step": 3609, "epoch": 85} {"train_loss": -4.079080581665039, "global_step": 3610, "epoch": 85} {"train_loss": -4.127626430420649, "global_step": 3611, "epoch": 85, "val_loss": 115390.234375} {"train_loss": -4.083653926849365, "global_step": 3612, "epoch": 86} {"train_loss": -4.2052321434021, "global_step": 3613, "epoch": 86} {"train_loss": -4.118218898773193, "global_step": 3614, "epoch": 86} {"train_loss": -4.166308879852295, "global_step": 3615, "epoch": 86} {"train_loss": -4.060685634613037, "global_step": 3616, "epoch": 86} {"train_loss": -4.327180862426758, "global_step": 3617, "epoch": 86} {"train_loss": -4.198378562927246, "global_step": 3618, "epoch": 86} {"train_loss": -4.205873966217041, "global_step": 3619, "epoch": 86} {"train_loss": -4.237709999084473, "global_step": 3620, "epoch": 86} {"train_loss": -4.326092720031738, "global_step": 3621, "epoch": 86} {"train_loss": -4.100170612335205, "global_step": 3622, "epoch": 86} {"train_loss": -4.136590957641602, "global_step": 3623, "epoch": 86} {"train_loss": -4.206975936889648, "global_step": 3624, "epoch": 86} {"train_loss": -4.200862884521484, "global_step": 3625, "epoch": 86} {"train_loss": -4.350135803222656, "global_step": 3626, "epoch": 86} {"train_loss": -4.234236717224121, "global_step": 3627, "epoch": 86} {"train_loss": -4.285525321960449, "global_step": 3628, "epoch": 86} {"train_loss": -4.243767738342285, "global_step": 3629, "epoch": 86} {"train_loss": -4.171991348266602, "global_step": 3630, "epoch": 86} {"train_loss": -4.133817672729492, "global_step": 3631, "epoch": 86} {"train_loss": -4.347952365875244, "global_step": 3632, "epoch": 86} {"train_loss": -4.13232946395874, "global_step": 3633, "epoch": 86} {"train_loss": -4.063222408294678, "global_step": 3634, "epoch": 86} {"train_loss": -4.2162981033325195, "global_step": 3635, "epoch": 86} {"train_loss": -4.185154914855957, "global_step": 3636, "epoch": 86} {"train_loss": -3.946589946746826, "global_step": 3637, "epoch": 86} {"train_loss": -4.231639385223389, "global_step": 3638, "epoch": 86} {"train_loss": -4.087247848510742, "global_step": 3639, "epoch": 86} {"train_loss": -4.1716461181640625, "global_step": 3640, "epoch": 86} {"train_loss": -4.256919860839844, "global_step": 3641, "epoch": 86} {"train_loss": -4.212099075317383, "global_step": 3642, "epoch": 86} {"train_loss": -4.066605567932129, "global_step": 3643, "epoch": 86} {"train_loss": -3.9702653884887695, "global_step": 3644, "epoch": 86} {"train_loss": -4.285882472991943, "global_step": 3645, "epoch": 86} {"train_loss": -4.054748058319092, "global_step": 3646, "epoch": 86} {"train_loss": -3.9774653911590576, "global_step": 3647, "epoch": 86} {"train_loss": -4.173165321350098, "global_step": 3648, "epoch": 86} {"train_loss": -4.0112152099609375, "global_step": 3649, "epoch": 86} {"train_loss": -4.18870210647583, "global_step": 3650, "epoch": 86} {"train_loss": -4.155231952667236, "global_step": 3651, "epoch": 86} {"train_loss": -3.9372963905334473, "global_step": 3652, "epoch": 86} {"train_loss": -4.16373944850195, "global_step": 3653, "epoch": 86, "val_loss": 117386.71875} {"train_loss": -3.902998447418213, "global_step": 3654, "epoch": 87} {"train_loss": -4.1486101150512695, "global_step": 3655, "epoch": 87} {"train_loss": -4.120145797729492, "global_step": 3656, "epoch": 87} {"train_loss": -4.22127628326416, "global_step": 3657, "epoch": 87} {"train_loss": -4.0485920906066895, "global_step": 3658, "epoch": 87} {"train_loss": -4.102316379547119, "global_step": 3659, "epoch": 87} {"train_loss": -4.120450973510742, "global_step": 3660, "epoch": 87} {"train_loss": -4.01906681060791, "global_step": 3661, "epoch": 87} {"train_loss": -4.25344181060791, "global_step": 3662, "epoch": 87} {"train_loss": -4.238483428955078, "global_step": 3663, "epoch": 87} {"train_loss": -4.14384126663208, "global_step": 3664, "epoch": 87} {"train_loss": -4.031007766723633, "global_step": 3665, "epoch": 87} {"train_loss": -4.275166034698486, "global_step": 3666, "epoch": 87} {"train_loss": -4.275578498840332, "global_step": 3667, "epoch": 87} {"train_loss": -4.234218597412109, "global_step": 3668, "epoch": 87} {"train_loss": -4.312310695648193, "global_step": 3669, "epoch": 87} {"train_loss": -4.146848678588867, "global_step": 3670, "epoch": 87} {"train_loss": -4.233620643615723, "global_step": 3671, "epoch": 87} {"train_loss": -4.338469505310059, "global_step": 3672, "epoch": 87} {"train_loss": -4.306880474090576, "global_step": 3673, "epoch": 87} {"train_loss": -4.271281719207764, "global_step": 3674, "epoch": 87} {"train_loss": -4.21500301361084, "global_step": 3675, "epoch": 87} {"train_loss": -4.336297512054443, "global_step": 3676, "epoch": 87} {"train_loss": -4.260793685913086, "global_step": 3677, "epoch": 87} {"train_loss": -4.295997619628906, "global_step": 3678, "epoch": 87} {"train_loss": -4.237254619598389, "global_step": 3679, "epoch": 87} {"train_loss": -4.2846598625183105, "global_step": 3680, "epoch": 87} {"train_loss": -4.466367721557617, "global_step": 3681, "epoch": 87} {"train_loss": -4.216124534606934, "global_step": 3682, "epoch": 87} {"train_loss": -4.1781086921691895, "global_step": 3683, "epoch": 87} {"train_loss": -4.369598865509033, "global_step": 3684, "epoch": 87} {"train_loss": -4.21134614944458, "global_step": 3685, "epoch": 87} {"train_loss": -4.2493720054626465, "global_step": 3686, "epoch": 87} {"train_loss": -4.289040565490723, "global_step": 3687, "epoch": 87} {"train_loss": -4.223165035247803, "global_step": 3688, "epoch": 87} {"train_loss": -4.2484235763549805, "global_step": 3689, "epoch": 87} {"train_loss": -4.266470909118652, "global_step": 3690, "epoch": 87} {"train_loss": -4.268644332885742, "global_step": 3691, "epoch": 87} {"train_loss": -4.180943489074707, "global_step": 3692, "epoch": 87} {"train_loss": -4.206430435180664, "global_step": 3693, "epoch": 87} {"train_loss": -4.261104106903076, "global_step": 3694, "epoch": 87} {"train_loss": -4.221769866489229, "global_step": 3695, "epoch": 87, "val_loss": 111494.890625} {"train_loss": -4.200321197509766, "global_step": 3696, "epoch": 88} {"train_loss": -4.299954414367676, "global_step": 3697, "epoch": 88} {"train_loss": -4.327564239501953, "global_step": 3698, "epoch": 88} {"train_loss": -4.324713230133057, "global_step": 3699, "epoch": 88} {"train_loss": -4.1724090576171875, "global_step": 3700, "epoch": 88} {"train_loss": -4.243809700012207, "global_step": 3701, "epoch": 88} {"train_loss": -4.114330291748047, "global_step": 3702, "epoch": 88} {"train_loss": -4.198948860168457, "global_step": 3703, "epoch": 88} {"train_loss": -4.315244674682617, "global_step": 3704, "epoch": 88} {"train_loss": -4.257821083068848, "global_step": 3705, "epoch": 88} {"train_loss": -4.243643760681152, "global_step": 3706, "epoch": 88} {"train_loss": -4.016218662261963, "global_step": 3707, "epoch": 88} {"train_loss": -4.248241424560547, "global_step": 3708, "epoch": 88} {"train_loss": -4.22257137298584, "global_step": 3709, "epoch": 88} {"train_loss": -4.125796318054199, "global_step": 3710, "epoch": 88} {"train_loss": -4.005178451538086, "global_step": 3711, "epoch": 88} {"train_loss": -4.011730194091797, "global_step": 3712, "epoch": 88} {"train_loss": -4.031352519989014, "global_step": 3713, "epoch": 88} {"train_loss": -4.0996856689453125, "global_step": 3714, "epoch": 88} {"train_loss": -3.9268131256103516, "global_step": 3715, "epoch": 88} {"train_loss": -3.706859588623047, "global_step": 3716, "epoch": 88} {"train_loss": -4.012835502624512, "global_step": 3717, "epoch": 88} {"train_loss": -4.037941932678223, "global_step": 3718, "epoch": 88} {"train_loss": -3.9238126277923584, "global_step": 3719, "epoch": 88} {"train_loss": -4.057394027709961, "global_step": 3720, "epoch": 88} {"train_loss": -4.0366740226745605, "global_step": 3721, "epoch": 88} {"train_loss": -3.912261962890625, "global_step": 3722, "epoch": 88} {"train_loss": -4.1046247482299805, "global_step": 3723, "epoch": 88} {"train_loss": -4.138472557067871, "global_step": 3724, "epoch": 88} {"train_loss": -4.091215133666992, "global_step": 3725, "epoch": 88} {"train_loss": -4.090553283691406, "global_step": 3726, "epoch": 88} {"train_loss": -4.0912346839904785, "global_step": 3727, "epoch": 88} {"train_loss": -4.191659450531006, "global_step": 3728, "epoch": 88} {"train_loss": -4.138134002685547, "global_step": 3729, "epoch": 88} {"train_loss": -4.194051265716553, "global_step": 3730, "epoch": 88} {"train_loss": -4.082611083984375, "global_step": 3731, "epoch": 88} {"train_loss": -3.985133171081543, "global_step": 3732, "epoch": 88} {"train_loss": -4.257486820220947, "global_step": 3733, "epoch": 88} {"train_loss": -4.229720115661621, "global_step": 3734, "epoch": 88} {"train_loss": -3.998117446899414, "global_step": 3735, "epoch": 88} {"train_loss": -3.8359436988830566, "global_step": 3736, "epoch": 88} {"train_loss": -4.114293160892668, "global_step": 3737, "epoch": 88, "val_loss": 113037.0546875} {"train_loss": -4.2128448486328125, "global_step": 3738, "epoch": 89} {"train_loss": -3.945176124572754, "global_step": 3739, "epoch": 89} {"train_loss": -4.056270599365234, "global_step": 3740, "epoch": 89} {"train_loss": -4.095672607421875, "global_step": 3741, "epoch": 89} {"train_loss": -4.145655632019043, "global_step": 3742, "epoch": 89} {"train_loss": -4.143486022949219, "global_step": 3743, "epoch": 89} {"train_loss": -4.159710884094238, "global_step": 3744, "epoch": 89} {"train_loss": -4.179827690124512, "global_step": 3745, "epoch": 89} {"train_loss": -4.11973237991333, "global_step": 3746, "epoch": 89} {"train_loss": -4.104935169219971, "global_step": 3747, "epoch": 89} {"train_loss": -4.205976486206055, "global_step": 3748, "epoch": 89} {"train_loss": -3.963313579559326, "global_step": 3749, "epoch": 89} {"train_loss": -4.217940330505371, "global_step": 3750, "epoch": 89} {"train_loss": -4.264102935791016, "global_step": 3751, "epoch": 89} {"train_loss": -4.196300506591797, "global_step": 3752, "epoch": 89} {"train_loss": -4.291926383972168, "global_step": 3753, "epoch": 89} {"train_loss": -4.059352874755859, "global_step": 3754, "epoch": 89} {"train_loss": -4.124828338623047, "global_step": 3755, "epoch": 89} {"train_loss": -4.208797931671143, "global_step": 3756, "epoch": 89} {"train_loss": -4.030184268951416, "global_step": 3757, "epoch": 89} {"train_loss": -4.081874847412109, "global_step": 3758, "epoch": 89} {"train_loss": -4.150846481323242, "global_step": 3759, "epoch": 89} {"train_loss": -4.064162254333496, "global_step": 3760, "epoch": 89} {"train_loss": -4.134465217590332, "global_step": 3761, "epoch": 89} {"train_loss": -4.223199844360352, "global_step": 3762, "epoch": 89} {"train_loss": -4.193434715270996, "global_step": 3763, "epoch": 89} {"train_loss": -4.262732028961182, "global_step": 3764, "epoch": 89} {"train_loss": -4.283062934875488, "global_step": 3765, "epoch": 89} {"train_loss": -4.233773231506348, "global_step": 3766, "epoch": 89} {"train_loss": -4.223016738891602, "global_step": 3767, "epoch": 89} {"train_loss": -4.090307235717773, "global_step": 3768, "epoch": 89} {"train_loss": -4.147210121154785, "global_step": 3769, "epoch": 89} {"train_loss": -4.2429399490356445, "global_step": 3770, "epoch": 89} {"train_loss": -4.287558555603027, "global_step": 3771, "epoch": 89} {"train_loss": -4.329953193664551, "global_step": 3772, "epoch": 89} {"train_loss": -4.1132493019104, "global_step": 3773, "epoch": 89} {"train_loss": -4.188554763793945, "global_step": 3774, "epoch": 89} {"train_loss": -4.174544334411621, "global_step": 3775, "epoch": 89} {"train_loss": -4.417023658752441, "global_step": 3776, "epoch": 89} {"train_loss": -4.221798896789551, "global_step": 3777, "epoch": 89} {"train_loss": -4.176351547241211, "global_step": 3778, "epoch": 89} {"train_loss": -4.1690385682242255, "global_step": 3779, "epoch": 89, "val_loss": 108893.625} {"train_loss": -4.21893835067749, "global_step": 3780, "epoch": 90} {"train_loss": -3.970099687576294, "global_step": 3781, "epoch": 90} {"train_loss": -4.122230529785156, "global_step": 3782, "epoch": 90} {"train_loss": -4.294824600219727, "global_step": 3783, "epoch": 90} {"train_loss": -4.044323444366455, "global_step": 3784, "epoch": 90} {"train_loss": -4.330765724182129, "global_step": 3785, "epoch": 90} {"train_loss": -4.205466270446777, "global_step": 3786, "epoch": 90} {"train_loss": -4.006680488586426, "global_step": 3787, "epoch": 90} {"train_loss": -4.257233142852783, "global_step": 3788, "epoch": 90} {"train_loss": -4.120196342468262, "global_step": 3789, "epoch": 90} {"train_loss": -4.4612932205200195, "global_step": 3790, "epoch": 90} {"train_loss": -4.3416056632995605, "global_step": 3791, "epoch": 90} {"train_loss": -4.069859981536865, "global_step": 3792, "epoch": 90} {"train_loss": -4.242837429046631, "global_step": 3793, "epoch": 90} {"train_loss": -4.273707389831543, "global_step": 3794, "epoch": 90} {"train_loss": -4.215257167816162, "global_step": 3795, "epoch": 90} {"train_loss": -4.0261430740356445, "global_step": 3796, "epoch": 90} {"train_loss": -4.158124923706055, "global_step": 3797, "epoch": 90} {"train_loss": -4.266427993774414, "global_step": 3798, "epoch": 90} {"train_loss": -4.163433074951172, "global_step": 3799, "epoch": 90} {"train_loss": -4.198366165161133, "global_step": 3800, "epoch": 90} {"train_loss": -4.227794647216797, "global_step": 3801, "epoch": 90} {"train_loss": -4.301856517791748, "global_step": 3802, "epoch": 90} {"train_loss": -4.144284725189209, "global_step": 3803, "epoch": 90} {"train_loss": -4.258435249328613, "global_step": 3804, "epoch": 90} {"train_loss": -4.292438983917236, "global_step": 3805, "epoch": 90} {"train_loss": -4.11876106262207, "global_step": 3806, "epoch": 90} {"train_loss": -4.367005348205566, "global_step": 3807, "epoch": 90} {"train_loss": -4.160221576690674, "global_step": 3808, "epoch": 90} {"train_loss": -4.36993932723999, "global_step": 3809, "epoch": 90} {"train_loss": -4.358487129211426, "global_step": 3810, "epoch": 90} {"train_loss": -4.269241809844971, "global_step": 3811, "epoch": 90} {"train_loss": -4.2430830001831055, "global_step": 3812, "epoch": 90} {"train_loss": -4.217962265014648, "global_step": 3813, "epoch": 90} {"train_loss": -4.106113433837891, "global_step": 3814, "epoch": 90} {"train_loss": -4.263884544372559, "global_step": 3815, "epoch": 90} {"train_loss": -4.052647590637207, "global_step": 3816, "epoch": 90} {"train_loss": -4.384108543395996, "global_step": 3817, "epoch": 90} {"train_loss": -4.212368011474609, "global_step": 3818, "epoch": 90} {"train_loss": -4.068293571472168, "global_step": 3819, "epoch": 90} {"train_loss": -4.4110002517700195, "global_step": 3820, "epoch": 90} {"train_loss": -4.213803115345183, "global_step": 3821, "epoch": 90, "val_loss": 108489.3359375} {"train_loss": -4.169073104858398, "global_step": 3822, "epoch": 91} {"train_loss": -4.183445453643799, "global_step": 3823, "epoch": 91} {"train_loss": -4.379688262939453, "global_step": 3824, "epoch": 91} {"train_loss": -4.1465630531311035, "global_step": 3825, "epoch": 91} {"train_loss": -4.143276214599609, "global_step": 3826, "epoch": 91} {"train_loss": -4.352507591247559, "global_step": 3827, "epoch": 91} {"train_loss": -4.123551368713379, "global_step": 3828, "epoch": 91} {"train_loss": -4.23344612121582, "global_step": 3829, "epoch": 91} {"train_loss": -4.198060035705566, "global_step": 3830, "epoch": 91} {"train_loss": -4.378416061401367, "global_step": 3831, "epoch": 91} {"train_loss": -4.10440731048584, "global_step": 3832, "epoch": 91} {"train_loss": -4.223780155181885, "global_step": 3833, "epoch": 91} {"train_loss": -4.314907073974609, "global_step": 3834, "epoch": 91} {"train_loss": -4.2073163986206055, "global_step": 3835, "epoch": 91} {"train_loss": -4.393608093261719, "global_step": 3836, "epoch": 91} {"train_loss": -4.439778804779053, "global_step": 3837, "epoch": 91} {"train_loss": -4.192183971405029, "global_step": 3838, "epoch": 91} {"train_loss": -4.240531921386719, "global_step": 3839, "epoch": 91} {"train_loss": -4.209702491760254, "global_step": 3840, "epoch": 91} {"train_loss": -4.24069881439209, "global_step": 3841, "epoch": 91} {"train_loss": -4.280315399169922, "global_step": 3842, "epoch": 91} {"train_loss": -4.330987453460693, "global_step": 3843, "epoch": 91} {"train_loss": -4.1814045906066895, "global_step": 3844, "epoch": 91} {"train_loss": -4.093122482299805, "global_step": 3845, "epoch": 91} {"train_loss": -4.450753688812256, "global_step": 3846, "epoch": 91} {"train_loss": -4.357072830200195, "global_step": 3847, "epoch": 91} {"train_loss": -4.248392105102539, "global_step": 3848, "epoch": 91} {"train_loss": -4.144683837890625, "global_step": 3849, "epoch": 91} {"train_loss": -4.305361747741699, "global_step": 3850, "epoch": 91} {"train_loss": -4.311556816101074, "global_step": 3851, "epoch": 91} {"train_loss": -4.380712032318115, "global_step": 3852, "epoch": 91} {"train_loss": -4.464357376098633, "global_step": 3853, "epoch": 91} {"train_loss": -4.354949474334717, "global_step": 3854, "epoch": 91} {"train_loss": -4.346508979797363, "global_step": 3855, "epoch": 91} {"train_loss": -4.379738807678223, "global_step": 3856, "epoch": 91} {"train_loss": -4.256515026092529, "global_step": 3857, "epoch": 91} {"train_loss": -4.285149574279785, "global_step": 3858, "epoch": 91} {"train_loss": -4.499777793884277, "global_step": 3859, "epoch": 91} {"train_loss": -4.4653778076171875, "global_step": 3860, "epoch": 91} {"train_loss": -4.287613868713379, "global_step": 3861, "epoch": 91} {"train_loss": -4.150799751281738, "global_step": 3862, "epoch": 91} {"train_loss": -4.280599355697632, "global_step": 3863, "epoch": 91, "val_loss": 108028.09375} {"train_loss": -4.377792835235596, "global_step": 3864, "epoch": 92} {"train_loss": -4.369494915008545, "global_step": 3865, "epoch": 92} {"train_loss": -4.278529167175293, "global_step": 3866, "epoch": 92} {"train_loss": -4.249490261077881, "global_step": 3867, "epoch": 92} {"train_loss": -4.2862114906311035, "global_step": 3868, "epoch": 92} {"train_loss": -4.50232458114624, "global_step": 3869, "epoch": 92} {"train_loss": -4.20197868347168, "global_step": 3870, "epoch": 92} {"train_loss": -4.4527411460876465, "global_step": 3871, "epoch": 92} {"train_loss": -4.454161643981934, "global_step": 3872, "epoch": 92} {"train_loss": -4.119182586669922, "global_step": 3873, "epoch": 92} {"train_loss": -4.341343402862549, "global_step": 3874, "epoch": 92} {"train_loss": -4.226982116699219, "global_step": 3875, "epoch": 92} {"train_loss": -4.137419700622559, "global_step": 3876, "epoch": 92} {"train_loss": -4.310177803039551, "global_step": 3877, "epoch": 92} {"train_loss": -4.335689067840576, "global_step": 3878, "epoch": 92} {"train_loss": -4.259052276611328, "global_step": 3879, "epoch": 92} {"train_loss": -4.443532466888428, "global_step": 3880, "epoch": 92} {"train_loss": -4.293998718261719, "global_step": 3881, "epoch": 92} {"train_loss": -4.2493391036987305, "global_step": 3882, "epoch": 92} {"train_loss": -4.397047996520996, "global_step": 3883, "epoch": 92} {"train_loss": -4.384646415710449, "global_step": 3884, "epoch": 92} {"train_loss": -4.237829208374023, "global_step": 3885, "epoch": 92} {"train_loss": -4.069411277770996, "global_step": 3886, "epoch": 92} {"train_loss": -4.289689064025879, "global_step": 3887, "epoch": 92} {"train_loss": -4.270334720611572, "global_step": 3888, "epoch": 92} {"train_loss": -4.059386253356934, "global_step": 3889, "epoch": 92} {"train_loss": -4.321773529052734, "global_step": 3890, "epoch": 92} {"train_loss": -4.235384941101074, "global_step": 3891, "epoch": 92} {"train_loss": -4.259454250335693, "global_step": 3892, "epoch": 92} {"train_loss": -4.281335353851318, "global_step": 3893, "epoch": 92} {"train_loss": -4.240717887878418, "global_step": 3894, "epoch": 92} {"train_loss": -4.067890167236328, "global_step": 3895, "epoch": 92} {"train_loss": -4.3623046875, "global_step": 3896, "epoch": 92} {"train_loss": -4.251450061798096, "global_step": 3897, "epoch": 92} {"train_loss": -4.252341270446777, "global_step": 3898, "epoch": 92} {"train_loss": -4.071073055267334, "global_step": 3899, "epoch": 92} {"train_loss": -4.283268451690674, "global_step": 3900, "epoch": 92} {"train_loss": -4.289320945739746, "global_step": 3901, "epoch": 92} {"train_loss": -4.186374187469482, "global_step": 3902, "epoch": 92} {"train_loss": -4.410721778869629, "global_step": 3903, "epoch": 92} {"train_loss": -4.244738578796387, "global_step": 3904, "epoch": 92} {"train_loss": -4.278225660324097, "global_step": 3905, "epoch": 92, "val_loss": 106454.1015625} {"train_loss": -4.326503276824951, "global_step": 3906, "epoch": 93} {"train_loss": -4.261614799499512, "global_step": 3907, "epoch": 93} {"train_loss": -4.267470836639404, "global_step": 3908, "epoch": 93} {"train_loss": -4.280485153198242, "global_step": 3909, "epoch": 93} {"train_loss": -4.257902145385742, "global_step": 3910, "epoch": 93} {"train_loss": -4.400913238525391, "global_step": 3911, "epoch": 93} {"train_loss": -4.0986433029174805, "global_step": 3912, "epoch": 93} {"train_loss": -4.2664570808410645, "global_step": 3913, "epoch": 93} {"train_loss": -4.3535051345825195, "global_step": 3914, "epoch": 93} {"train_loss": -4.209763526916504, "global_step": 3915, "epoch": 93} {"train_loss": -4.251855373382568, "global_step": 3916, "epoch": 93} {"train_loss": -4.357204437255859, "global_step": 3917, "epoch": 93} {"train_loss": -4.307687282562256, "global_step": 3918, "epoch": 93} {"train_loss": -4.369054317474365, "global_step": 3919, "epoch": 93} {"train_loss": -4.293084144592285, "global_step": 3920, "epoch": 93} {"train_loss": -4.327108383178711, "global_step": 3921, "epoch": 93} {"train_loss": -4.04190731048584, "global_step": 3922, "epoch": 93} {"train_loss": -4.176391124725342, "global_step": 3923, "epoch": 93} {"train_loss": -4.376225471496582, "global_step": 3924, "epoch": 93} {"train_loss": -4.268982887268066, "global_step": 3925, "epoch": 93} {"train_loss": -4.262262344360352, "global_step": 3926, "epoch": 93} {"train_loss": -4.3604278564453125, "global_step": 3927, "epoch": 93} {"train_loss": -4.294731140136719, "global_step": 3928, "epoch": 93} {"train_loss": -4.345339298248291, "global_step": 3929, "epoch": 93} {"train_loss": -4.252569198608398, "global_step": 3930, "epoch": 93} {"train_loss": -4.417565822601318, "global_step": 3931, "epoch": 93} {"train_loss": -4.42525577545166, "global_step": 3932, "epoch": 93} {"train_loss": -4.417899131774902, "global_step": 3933, "epoch": 93} {"train_loss": -4.3911261558532715, "global_step": 3934, "epoch": 93} {"train_loss": -4.402803897857666, "global_step": 3935, "epoch": 93} {"train_loss": -4.377458572387695, "global_step": 3936, "epoch": 93} {"train_loss": -4.290599822998047, "global_step": 3937, "epoch": 93} {"train_loss": -4.042975902557373, "global_step": 3938, "epoch": 93} {"train_loss": -4.318930149078369, "global_step": 3939, "epoch": 93} {"train_loss": -3.871377468109131, "global_step": 3940, "epoch": 93} {"train_loss": -4.0754194259643555, "global_step": 3941, "epoch": 93} {"train_loss": -4.132180213928223, "global_step": 3942, "epoch": 93} {"train_loss": -4.166121482849121, "global_step": 3943, "epoch": 93} {"train_loss": -4.093656539916992, "global_step": 3944, "epoch": 93} {"train_loss": -4.080463409423828, "global_step": 3945, "epoch": 93} {"train_loss": -4.457653999328613, "global_step": 3946, "epoch": 93} {"train_loss": -4.269870758056641, "global_step": 3947, "epoch": 93, "val_loss": 108878.125} {"train_loss": -4.377974510192871, "global_step": 3948, "epoch": 94} {"train_loss": -4.2203826904296875, "global_step": 3949, "epoch": 94} {"train_loss": -4.342418670654297, "global_step": 3950, "epoch": 94} {"train_loss": -4.257884979248047, "global_step": 3951, "epoch": 94} {"train_loss": -4.347590446472168, "global_step": 3952, "epoch": 94} {"train_loss": -4.384991645812988, "global_step": 3953, "epoch": 94} {"train_loss": -4.24970817565918, "global_step": 3954, "epoch": 94} {"train_loss": -4.406050682067871, "global_step": 3955, "epoch": 94} {"train_loss": -4.2229766845703125, "global_step": 3956, "epoch": 94} {"train_loss": -4.3951263427734375, "global_step": 3957, "epoch": 94} {"train_loss": -4.464776039123535, "global_step": 3958, "epoch": 94} {"train_loss": -4.367011070251465, "global_step": 3959, "epoch": 94} {"train_loss": -4.213287353515625, "global_step": 3960, "epoch": 94} {"train_loss": -4.349944591522217, "global_step": 3961, "epoch": 94} {"train_loss": -4.156245231628418, "global_step": 3962, "epoch": 94} {"train_loss": -4.387411117553711, "global_step": 3963, "epoch": 94} {"train_loss": -4.186785697937012, "global_step": 3964, "epoch": 94} {"train_loss": -4.33876895904541, "global_step": 3965, "epoch": 94} {"train_loss": -4.228823661804199, "global_step": 3966, "epoch": 94} {"train_loss": -4.239633560180664, "global_step": 3967, "epoch": 94} {"train_loss": -4.255088806152344, "global_step": 3968, "epoch": 94} {"train_loss": -4.212980270385742, "global_step": 3969, "epoch": 94} {"train_loss": -4.331347465515137, "global_step": 3970, "epoch": 94} {"train_loss": -4.328481674194336, "global_step": 3971, "epoch": 94} {"train_loss": -4.4287004470825195, "global_step": 3972, "epoch": 94} {"train_loss": -4.330926895141602, "global_step": 3973, "epoch": 94} {"train_loss": -4.376704216003418, "global_step": 3974, "epoch": 94} {"train_loss": -4.380107879638672, "global_step": 3975, "epoch": 94} {"train_loss": -4.331928253173828, "global_step": 3976, "epoch": 94} {"train_loss": -4.365538120269775, "global_step": 3977, "epoch": 94} {"train_loss": -4.531288146972656, "global_step": 3978, "epoch": 94} {"train_loss": -4.374519348144531, "global_step": 3979, "epoch": 94} {"train_loss": -4.36792516708374, "global_step": 3980, "epoch": 94} {"train_loss": -4.365808486938477, "global_step": 3981, "epoch": 94} {"train_loss": -4.287989616394043, "global_step": 3982, "epoch": 94} {"train_loss": -4.330081939697266, "global_step": 3983, "epoch": 94} {"train_loss": -4.352925777435303, "global_step": 3984, "epoch": 94} {"train_loss": -4.274065971374512, "global_step": 3985, "epoch": 94} {"train_loss": -4.302088260650635, "global_step": 3986, "epoch": 94} {"train_loss": -4.258498191833496, "global_step": 3987, "epoch": 94} {"train_loss": -4.384367942810059, "global_step": 3988, "epoch": 94} {"train_loss": -4.32453483626956, "global_step": 3989, "epoch": 94, "val_loss": 105936.375} {"train_loss": -4.5542802810668945, "global_step": 3990, "epoch": 95} {"train_loss": -4.486364841461182, "global_step": 3991, "epoch": 95} {"train_loss": -4.359927177429199, "global_step": 3992, "epoch": 95} {"train_loss": -4.3956098556518555, "global_step": 3993, "epoch": 95} {"train_loss": -4.304909706115723, "global_step": 3994, "epoch": 95} {"train_loss": -4.474826335906982, "global_step": 3995, "epoch": 95} {"train_loss": -4.310421943664551, "global_step": 3996, "epoch": 95} {"train_loss": -4.368526935577393, "global_step": 3997, "epoch": 95} {"train_loss": -4.2189226150512695, "global_step": 3998, "epoch": 95} {"train_loss": -4.3188323974609375, "global_step": 3999, "epoch": 95} {"train_loss": -4.288152694702148, "global_step": 4000, "epoch": 95} {"train_loss": -4.4024553298950195, "global_step": 4001, "epoch": 95} {"train_loss": -4.41280460357666, "global_step": 4002, "epoch": 95} {"train_loss": -4.288539886474609, "global_step": 4003, "epoch": 95} {"train_loss": -4.26405143737793, "global_step": 4004, "epoch": 95} {"train_loss": -4.140081882476807, "global_step": 4005, "epoch": 95} {"train_loss": -4.452666282653809, "global_step": 4006, "epoch": 95} {"train_loss": -4.446660995483398, "global_step": 4007, "epoch": 95} {"train_loss": -4.334980010986328, "global_step": 4008, "epoch": 95} {"train_loss": -4.37578010559082, "global_step": 4009, "epoch": 95} {"train_loss": -4.352977752685547, "global_step": 4010, "epoch": 95} {"train_loss": -4.46864128112793, "global_step": 4011, "epoch": 95} {"train_loss": -4.304409027099609, "global_step": 4012, "epoch": 95} {"train_loss": -4.3097357749938965, "global_step": 4013, "epoch": 95} {"train_loss": -4.3570756912231445, "global_step": 4014, "epoch": 95} {"train_loss": -4.215737342834473, "global_step": 4015, "epoch": 95} {"train_loss": -4.024299621582031, "global_step": 4016, "epoch": 95} {"train_loss": -4.107201099395752, "global_step": 4017, "epoch": 95} {"train_loss": -4.313023090362549, "global_step": 4018, "epoch": 95} {"train_loss": -4.315899848937988, "global_step": 4019, "epoch": 95} {"train_loss": -3.9318692684173584, "global_step": 4020, "epoch": 95} {"train_loss": -4.289331436157227, "global_step": 4021, "epoch": 95} {"train_loss": -4.076911449432373, "global_step": 4022, "epoch": 95} {"train_loss": -4.15709114074707, "global_step": 4023, "epoch": 95} {"train_loss": -4.372555255889893, "global_step": 4024, "epoch": 95} {"train_loss": -4.333052635192871, "global_step": 4025, "epoch": 95} {"train_loss": -4.359099388122559, "global_step": 4026, "epoch": 95} {"train_loss": -4.145260810852051, "global_step": 4027, "epoch": 95} {"train_loss": -4.3371076583862305, "global_step": 4028, "epoch": 95} {"train_loss": -4.288600444793701, "global_step": 4029, "epoch": 95} {"train_loss": -4.357043743133545, "global_step": 4030, "epoch": 95} {"train_loss": -4.3110533725647695, "global_step": 4031, "epoch": 95, "val_loss": 105847.921875} {"train_loss": -4.259210586547852, "global_step": 4032, "epoch": 96} {"train_loss": -4.255496025085449, "global_step": 4033, "epoch": 96} {"train_loss": -4.28120231628418, "global_step": 4034, "epoch": 96} {"train_loss": -4.330636978149414, "global_step": 4035, "epoch": 96} {"train_loss": -4.299144744873047, "global_step": 4036, "epoch": 96} {"train_loss": -4.3318915367126465, "global_step": 4037, "epoch": 96} {"train_loss": -4.373274326324463, "global_step": 4038, "epoch": 96} {"train_loss": -4.293146133422852, "global_step": 4039, "epoch": 96} {"train_loss": -4.3325958251953125, "global_step": 4040, "epoch": 96} {"train_loss": -4.360112190246582, "global_step": 4041, "epoch": 96} {"train_loss": -4.465605735778809, "global_step": 4042, "epoch": 96} {"train_loss": -4.333346366882324, "global_step": 4043, "epoch": 96} {"train_loss": -4.35887336730957, "global_step": 4044, "epoch": 96} {"train_loss": -4.26629114151001, "global_step": 4045, "epoch": 96} {"train_loss": -4.270151615142822, "global_step": 4046, "epoch": 96} {"train_loss": -4.424321174621582, "global_step": 4047, "epoch": 96} {"train_loss": -4.322566032409668, "global_step": 4048, "epoch": 96} {"train_loss": -4.345454216003418, "global_step": 4049, "epoch": 96} {"train_loss": -4.53252649307251, "global_step": 4050, "epoch": 96} {"train_loss": -4.386484146118164, "global_step": 4051, "epoch": 96} {"train_loss": -4.212035179138184, "global_step": 4052, "epoch": 96} {"train_loss": -4.345876693725586, "global_step": 4053, "epoch": 96} {"train_loss": -4.444817543029785, "global_step": 4054, "epoch": 96} {"train_loss": -4.2968549728393555, "global_step": 4055, "epoch": 96} {"train_loss": -4.371458053588867, "global_step": 4056, "epoch": 96} {"train_loss": -4.335356712341309, "global_step": 4057, "epoch": 96} {"train_loss": -4.3303728103637695, "global_step": 4058, "epoch": 96} {"train_loss": -4.4392194747924805, "global_step": 4059, "epoch": 96} {"train_loss": -4.373908042907715, "global_step": 4060, "epoch": 96} {"train_loss": -4.100491046905518, "global_step": 4061, "epoch": 96} {"train_loss": -4.1412739753723145, "global_step": 4062, "epoch": 96} {"train_loss": -4.202854156494141, "global_step": 4063, "epoch": 96} {"train_loss": -3.76283597946167, "global_step": 4064, "epoch": 96} {"train_loss": -4.2939348220825195, "global_step": 4065, "epoch": 96} {"train_loss": -3.8955867290496826, "global_step": 4066, "epoch": 96} {"train_loss": -3.908289909362793, "global_step": 4067, "epoch": 96} {"train_loss": -4.1831889152526855, "global_step": 4068, "epoch": 96} {"train_loss": -3.9476168155670166, "global_step": 4069, "epoch": 96} {"train_loss": -4.22262716293335, "global_step": 4070, "epoch": 96} {"train_loss": -4.049271583557129, "global_step": 4071, "epoch": 96} {"train_loss": -4.252697467803955, "global_step": 4072, "epoch": 96} {"train_loss": -4.264045522326515, "global_step": 4073, "epoch": 96, "val_loss": 103972.0625} {"train_loss": -4.239791393280029, "global_step": 4074, "epoch": 97} {"train_loss": -4.157487869262695, "global_step": 4075, "epoch": 97} {"train_loss": -4.2092485427856445, "global_step": 4076, "epoch": 97} {"train_loss": -4.28019905090332, "global_step": 4077, "epoch": 97} {"train_loss": -4.182348251342773, "global_step": 4078, "epoch": 97} {"train_loss": -4.301726818084717, "global_step": 4079, "epoch": 97} {"train_loss": -4.258825778961182, "global_step": 4080, "epoch": 97} {"train_loss": -4.141057968139648, "global_step": 4081, "epoch": 97} {"train_loss": -4.325193881988525, "global_step": 4082, "epoch": 97} {"train_loss": -4.331695556640625, "global_step": 4083, "epoch": 97} {"train_loss": -4.247171401977539, "global_step": 4084, "epoch": 97} {"train_loss": -4.291741847991943, "global_step": 4085, "epoch": 97} {"train_loss": -4.334229469299316, "global_step": 4086, "epoch": 97} {"train_loss": -4.29632568359375, "global_step": 4087, "epoch": 97} {"train_loss": -4.263833999633789, "global_step": 4088, "epoch": 97} {"train_loss": -4.337090492248535, "global_step": 4089, "epoch": 97} {"train_loss": -4.370112419128418, "global_step": 4090, "epoch": 97} {"train_loss": -4.298188209533691, "global_step": 4091, "epoch": 97} {"train_loss": -4.417145729064941, "global_step": 4092, "epoch": 97} {"train_loss": -4.483766078948975, "global_step": 4093, "epoch": 97} {"train_loss": -4.361553192138672, "global_step": 4094, "epoch": 97} {"train_loss": -4.423766136169434, "global_step": 4095, "epoch": 97} {"train_loss": -4.436090469360352, "global_step": 4096, "epoch": 97} {"train_loss": -4.213015556335449, "global_step": 4097, "epoch": 97} {"train_loss": -4.099605560302734, "global_step": 4098, "epoch": 97} {"train_loss": -4.230160713195801, "global_step": 4099, "epoch": 97} {"train_loss": -4.3754048347473145, "global_step": 4100, "epoch": 97} {"train_loss": -4.251741886138916, "global_step": 4101, "epoch": 97} {"train_loss": -4.395034313201904, "global_step": 4102, "epoch": 97} {"train_loss": -4.424567699432373, "global_step": 4103, "epoch": 97} {"train_loss": -4.338772773742676, "global_step": 4104, "epoch": 97} {"train_loss": -4.4518280029296875, "global_step": 4105, "epoch": 97} {"train_loss": -4.3106865882873535, "global_step": 4106, "epoch": 97} {"train_loss": -4.528660297393799, "global_step": 4107, "epoch": 97} {"train_loss": -4.33693265914917, "global_step": 4108, "epoch": 97} {"train_loss": -4.4237895011901855, "global_step": 4109, "epoch": 97} {"train_loss": -4.29560661315918, "global_step": 4110, "epoch": 97} {"train_loss": -4.290609359741211, "global_step": 4111, "epoch": 97} {"train_loss": -4.442753791809082, "global_step": 4112, "epoch": 97} {"train_loss": -4.507652282714844, "global_step": 4113, "epoch": 97} {"train_loss": -4.342489719390869, "global_step": 4114, "epoch": 97} {"train_loss": -4.323307752609253, "global_step": 4115, "epoch": 97, "val_loss": 101982.125} {"train_loss": -4.5433430671691895, "global_step": 4116, "epoch": 98} {"train_loss": -4.409080982208252, "global_step": 4117, "epoch": 98} {"train_loss": -4.3066864013671875, "global_step": 4118, "epoch": 98} {"train_loss": -4.467885971069336, "global_step": 4119, "epoch": 98} {"train_loss": -4.361124515533447, "global_step": 4120, "epoch": 98} {"train_loss": -4.426433086395264, "global_step": 4121, "epoch": 98} {"train_loss": -4.490260124206543, "global_step": 4122, "epoch": 98} {"train_loss": -4.366708755493164, "global_step": 4123, "epoch": 98} {"train_loss": -4.3910746574401855, "global_step": 4124, "epoch": 98} {"train_loss": -4.274969100952148, "global_step": 4125, "epoch": 98} {"train_loss": -4.32828950881958, "global_step": 4126, "epoch": 98} {"train_loss": -4.356074333190918, "global_step": 4127, "epoch": 98} {"train_loss": -4.482149124145508, "global_step": 4128, "epoch": 98} {"train_loss": -4.338345527648926, "global_step": 4129, "epoch": 98} {"train_loss": -4.509336471557617, "global_step": 4130, "epoch": 98} {"train_loss": -4.471404552459717, "global_step": 4131, "epoch": 98} {"train_loss": -4.592889785766602, "global_step": 4132, "epoch": 98} {"train_loss": -4.493711471557617, "global_step": 4133, "epoch": 98} {"train_loss": -4.288658142089844, "global_step": 4134, "epoch": 98} {"train_loss": -4.523860931396484, "global_step": 4135, "epoch": 98} {"train_loss": -4.473867416381836, "global_step": 4136, "epoch": 98} {"train_loss": -4.259555339813232, "global_step": 4137, "epoch": 98} {"train_loss": -4.321107864379883, "global_step": 4138, "epoch": 98} {"train_loss": -4.309722900390625, "global_step": 4139, "epoch": 98} {"train_loss": -4.388962745666504, "global_step": 4140, "epoch": 98} {"train_loss": -4.447323322296143, "global_step": 4141, "epoch": 98} {"train_loss": -4.622709274291992, "global_step": 4142, "epoch": 98} {"train_loss": -4.473118782043457, "global_step": 4143, "epoch": 98} {"train_loss": -4.477031707763672, "global_step": 4144, "epoch": 98} {"train_loss": -4.299433708190918, "global_step": 4145, "epoch": 98} {"train_loss": -4.232666015625, "global_step": 4146, "epoch": 98} {"train_loss": -4.149640083312988, "global_step": 4147, "epoch": 98} {"train_loss": -4.1457624435424805, "global_step": 4148, "epoch": 98} {"train_loss": -4.460810661315918, "global_step": 4149, "epoch": 98} {"train_loss": -4.246531963348389, "global_step": 4150, "epoch": 98} {"train_loss": -4.209167957305908, "global_step": 4151, "epoch": 98} {"train_loss": -4.395944595336914, "global_step": 4152, "epoch": 98} {"train_loss": -4.399501800537109, "global_step": 4153, "epoch": 98} {"train_loss": -4.088217258453369, "global_step": 4154, "epoch": 98} {"train_loss": -4.260366439819336, "global_step": 4155, "epoch": 98} {"train_loss": -4.283322334289551, "global_step": 4156, "epoch": 98} {"train_loss": -4.37487318402245, "global_step": 4157, "epoch": 98, "val_loss": 104171.484375} {"train_loss": -4.4655890464782715, "global_step": 4158, "epoch": 99} {"train_loss": -4.4491729736328125, "global_step": 4159, "epoch": 99} {"train_loss": -4.310002326965332, "global_step": 4160, "epoch": 99} {"train_loss": -4.508199691772461, "global_step": 4161, "epoch": 99} {"train_loss": -4.54856538772583, "global_step": 4162, "epoch": 99} {"train_loss": -4.364995956420898, "global_step": 4163, "epoch": 99} {"train_loss": -4.3831892013549805, "global_step": 4164, "epoch": 99} {"train_loss": -4.393047332763672, "global_step": 4165, "epoch": 99} {"train_loss": -4.41124153137207, "global_step": 4166, "epoch": 99} {"train_loss": -4.343052864074707, "global_step": 4167, "epoch": 99} {"train_loss": -4.387577056884766, "global_step": 4168, "epoch": 99} {"train_loss": -4.40582275390625, "global_step": 4169, "epoch": 99} {"train_loss": -4.453916549682617, "global_step": 4170, "epoch": 99} {"train_loss": -4.311498641967773, "global_step": 4171, "epoch": 99} {"train_loss": -4.40647029876709, "global_step": 4172, "epoch": 99} {"train_loss": -4.456331253051758, "global_step": 4173, "epoch": 99} {"train_loss": -4.236246109008789, "global_step": 4174, "epoch": 99} {"train_loss": -4.281262397766113, "global_step": 4175, "epoch": 99} {"train_loss": -4.1392974853515625, "global_step": 4176, "epoch": 99} {"train_loss": -3.8987293243408203, "global_step": 4177, "epoch": 99} {"train_loss": -3.9460554122924805, "global_step": 4178, "epoch": 99} {"train_loss": -4.29028844833374, "global_step": 4179, "epoch": 99} {"train_loss": -4.357115745544434, "global_step": 4180, "epoch": 99} {"train_loss": -4.2281718254089355, "global_step": 4181, "epoch": 99} {"train_loss": -4.143126487731934, "global_step": 4182, "epoch": 99} {"train_loss": -4.323759078979492, "global_step": 4183, "epoch": 99} {"train_loss": -4.299552917480469, "global_step": 4184, "epoch": 99} {"train_loss": -4.304791450500488, "global_step": 4185, "epoch": 99} {"train_loss": -4.14266300201416, "global_step": 4186, "epoch": 99} {"train_loss": -4.249519348144531, "global_step": 4187, "epoch": 99} {"train_loss": -4.200117111206055, "global_step": 4188, "epoch": 99} {"train_loss": -4.235888481140137, "global_step": 4189, "epoch": 99} {"train_loss": -4.171056270599365, "global_step": 4190, "epoch": 99} {"train_loss": -4.114620685577393, "global_step": 4191, "epoch": 99} {"train_loss": -4.331930160522461, "global_step": 4192, "epoch": 99} {"train_loss": -4.392607688903809, "global_step": 4193, "epoch": 99} {"train_loss": -4.279812335968018, "global_step": 4194, "epoch": 99} {"train_loss": -4.376190185546875, "global_step": 4195, "epoch": 99} {"train_loss": -4.438381671905518, "global_step": 4196, "epoch": 99} {"train_loss": -4.32973575592041, "global_step": 4197, "epoch": 99} {"train_loss": -4.377307415008545, "global_step": 4198, "epoch": 99} {"train_loss": -4.312011468978155, "global_step": 4199, "epoch": 99, "val_loss": 101586.96875} {"train_loss": -4.324489593505859, "global_step": 4200, "epoch": 100} {"train_loss": -4.409955978393555, "global_step": 4201, "epoch": 100} {"train_loss": -4.446681976318359, "global_step": 4202, "epoch": 100} {"train_loss": -4.361928939819336, "global_step": 4203, "epoch": 100} {"train_loss": -4.3919677734375, "global_step": 4204, "epoch": 100} {"train_loss": -4.43420934677124, "global_step": 4205, "epoch": 100} {"train_loss": -4.488226413726807, "global_step": 4206, "epoch": 100} {"train_loss": -4.468177795410156, "global_step": 4207, "epoch": 100} {"train_loss": -4.4750213623046875, "global_step": 4208, "epoch": 100} {"train_loss": -4.410764217376709, "global_step": 4209, "epoch": 100} {"train_loss": -4.510424613952637, "global_step": 4210, "epoch": 100} {"train_loss": -4.380716323852539, "global_step": 4211, "epoch": 100} {"train_loss": -4.530901908874512, "global_step": 4212, "epoch": 100} {"train_loss": -4.374459266662598, "global_step": 4213, "epoch": 100} {"train_loss": -4.54814338684082, "global_step": 4214, "epoch": 100} {"train_loss": -4.263364791870117, "global_step": 4215, "epoch": 100} {"train_loss": -4.317501068115234, "global_step": 4216, "epoch": 100} {"train_loss": -4.417766571044922, "global_step": 4217, "epoch": 100} {"train_loss": -4.4268879890441895, "global_step": 4218, "epoch": 100} {"train_loss": -4.493549346923828, "global_step": 4219, "epoch": 100} {"train_loss": -4.301024436950684, "global_step": 4220, "epoch": 100} {"train_loss": -4.430579662322998, "global_step": 4221, "epoch": 100} {"train_loss": -4.342749118804932, "global_step": 4222, "epoch": 100} {"train_loss": -4.028481483459473, "global_step": 4223, "epoch": 100} {"train_loss": -4.189981460571289, "global_step": 4224, "epoch": 100} {"train_loss": -4.376276969909668, "global_step": 4225, "epoch": 100} {"train_loss": -4.387401580810547, "global_step": 4226, "epoch": 100} {"train_loss": -4.273564338684082, "global_step": 4227, "epoch": 100} {"train_loss": -4.468802452087402, "global_step": 4228, "epoch": 100} {"train_loss": -4.350078582763672, "global_step": 4229, "epoch": 100} {"train_loss": -4.373161315917969, "global_step": 4230, "epoch": 100} {"train_loss": -4.267086029052734, "global_step": 4231, "epoch": 100} {"train_loss": -4.428342819213867, "global_step": 4232, "epoch": 100} {"train_loss": -4.4167633056640625, "global_step": 4233, "epoch": 100} {"train_loss": -4.401398658752441, "global_step": 4234, "epoch": 100} {"train_loss": -4.321800231933594, "global_step": 4235, "epoch": 100} {"train_loss": -4.417877197265625, "global_step": 4236, "epoch": 100} {"train_loss": -4.498996734619141, "global_step": 4237, "epoch": 100} {"train_loss": -4.443068504333496, "global_step": 4238, "epoch": 100} {"train_loss": -4.26618766784668, "global_step": 4239, "epoch": 100} {"train_loss": -4.351380348205566, "global_step": 4240, "epoch": 100} {"train_loss": -4.3848241964976, "global_step": 4241, "epoch": 100, "train/sim_max_reward_0": 0.1954521622783382, "train/sim_max_reward_1": 0.0033310335652570145, "train/sim_max_reward_2": 0.27333862530939207, "train/sim_max_reward_3": 0.07533144974326397, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.19361130651752678, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.18595249437928857, "test/sim_max_reward_4300002": 0.4592167704375657, "test/sim_max_reward_4300003": 0.2841017370417513, "test/sim_max_reward_4300004": 0.22985729103897057, "test/sim_max_reward_4300005": 0.2708923028398744, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.4113886304539096, "test/sim_max_reward_4300008": 0.0, "test/sim_max_reward_4300009": 0.00022323700018118755, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.05037829994571917, "test/sim_max_reward_4300012": 0.3266366821019302, "test/sim_max_reward_4300013": 0.40102468770185185, "test/sim_max_reward_4300014": 0.20966916140869507, "test/sim_max_reward_4300015": 0.2406835783390168, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.4292296690712788, "test/sim_max_reward_4300018": 0.0, "test/sim_max_reward_4300019": 0.18480292685684, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.3041463821064192, "test/sim_max_reward_4300022": 0.04201593845211718, "test/sim_max_reward_4300023": 0.3329516950215018, "test/sim_max_reward_4300024": 0.19350814803491512, "test/sim_max_reward_4300025": 0.12397361995963062, "test/sim_max_reward_4300026": 0.2183726183132791, "test/sim_max_reward_4300027": 0.0, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.0016321922435916195, "test/sim_max_reward_4300032": 0.44320458295888465, "test/sim_max_reward_4300033": 0.35234157964137924, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.08503333936424134, "test/sim_max_reward_4300036": 0.19932963306586157, "test/sim_max_reward_4300037": 0.5527122599440878, "test/sim_max_reward_4300038": 0.36815357704816415, "test/sim_max_reward_4300039": 0.4344322671048987, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.27363473191281656, "test/sim_max_reward_4300043": 0.01912165197990456, "test/sim_max_reward_4300044": 0.06625216004612239, "test/sim_max_reward_4300045": 0.11771219793176359, "test/sim_max_reward_4300046": 0.0, "test/sim_max_reward_4300047": 0.13641398180172895, "test/sim_max_reward_4300048": 0.2891328981870391, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.12509464749741792, "test/mean_score": 0.16476265847470445, "val_loss": 103787.6875} {"train_loss": -4.327613830566406, "global_step": 4242, "epoch": 101} {"train_loss": -4.389378547668457, "global_step": 4243, "epoch": 101} {"train_loss": -4.462754249572754, "global_step": 4244, "epoch": 101} {"train_loss": -4.342252731323242, "global_step": 4245, "epoch": 101} {"train_loss": -4.385904312133789, "global_step": 4246, "epoch": 101} {"train_loss": -4.481494903564453, "global_step": 4247, "epoch": 101} {"train_loss": -4.3259196281433105, "global_step": 4248, "epoch": 101} {"train_loss": -4.4087066650390625, "global_step": 4249, "epoch": 101} {"train_loss": -4.325446128845215, "global_step": 4250, "epoch": 101} {"train_loss": -4.508395195007324, "global_step": 4251, "epoch": 101} {"train_loss": -4.404268264770508, "global_step": 4252, "epoch": 101} {"train_loss": -4.390056610107422, "global_step": 4253, "epoch": 101} {"train_loss": -4.554144382476807, "global_step": 4254, "epoch": 101} {"train_loss": -4.691901206970215, "global_step": 4255, "epoch": 101} {"train_loss": -4.358024597167969, "global_step": 4256, "epoch": 101} {"train_loss": -4.411195278167725, "global_step": 4257, "epoch": 101} {"train_loss": -4.34967041015625, "global_step": 4258, "epoch": 101} {"train_loss": -4.410743713378906, "global_step": 4259, "epoch": 101} {"train_loss": -4.294769763946533, "global_step": 4260, "epoch": 101} {"train_loss": -4.242087364196777, "global_step": 4261, "epoch": 101} {"train_loss": -4.3968658447265625, "global_step": 4262, "epoch": 101} {"train_loss": -4.337747097015381, "global_step": 4263, "epoch": 101} {"train_loss": -4.36366605758667, "global_step": 4264, "epoch": 101} {"train_loss": -4.336347579956055, "global_step": 4265, "epoch": 101} {"train_loss": -4.364285945892334, "global_step": 4266, "epoch": 101} {"train_loss": -4.354023456573486, "global_step": 4267, "epoch": 101} {"train_loss": -4.4598517417907715, "global_step": 4268, "epoch": 101} {"train_loss": -4.328821182250977, "global_step": 4269, "epoch": 101} {"train_loss": -4.381322860717773, "global_step": 4270, "epoch": 101} {"train_loss": -4.230249404907227, "global_step": 4271, "epoch": 101} {"train_loss": -4.192391395568848, "global_step": 4272, "epoch": 101} {"train_loss": -4.330163478851318, "global_step": 4273, "epoch": 101} {"train_loss": -4.415774345397949, "global_step": 4274, "epoch": 101} {"train_loss": -4.41454553604126, "global_step": 4275, "epoch": 101} {"train_loss": -4.397867202758789, "global_step": 4276, "epoch": 101} {"train_loss": -4.4678473472595215, "global_step": 4277, "epoch": 101} {"train_loss": -4.43818473815918, "global_step": 4278, "epoch": 101} {"train_loss": -4.322878837585449, "global_step": 4279, "epoch": 101} {"train_loss": -4.228307723999023, "global_step": 4280, "epoch": 101} {"train_loss": -4.124251365661621, "global_step": 4281, "epoch": 101} {"train_loss": -4.0275421142578125, "global_step": 4282, "epoch": 101} {"train_loss": -4.3530376354853315, "global_step": 4283, "epoch": 101, "val_loss": 103259.7734375} {"train_loss": -4.193327903747559, "global_step": 4284, "epoch": 102} {"train_loss": -4.356900215148926, "global_step": 4285, "epoch": 102} {"train_loss": -4.092960357666016, "global_step": 4286, "epoch": 102} {"train_loss": -3.9595065116882324, "global_step": 4287, "epoch": 102} {"train_loss": -4.082286834716797, "global_step": 4288, "epoch": 102} {"train_loss": -4.430990219116211, "global_step": 4289, "epoch": 102} {"train_loss": -4.155689239501953, "global_step": 4290, "epoch": 102} {"train_loss": -4.347350120544434, "global_step": 4291, "epoch": 102} {"train_loss": -4.178997039794922, "global_step": 4292, "epoch": 102} {"train_loss": -4.18804931640625, "global_step": 4293, "epoch": 102} {"train_loss": -4.347486972808838, "global_step": 4294, "epoch": 102} {"train_loss": -4.372389793395996, "global_step": 4295, "epoch": 102} {"train_loss": -4.282351493835449, "global_step": 4296, "epoch": 102} {"train_loss": -4.444779872894287, "global_step": 4297, "epoch": 102} {"train_loss": -4.391190528869629, "global_step": 4298, "epoch": 102} {"train_loss": -4.338386535644531, "global_step": 4299, "epoch": 102} {"train_loss": -4.359535217285156, "global_step": 4300, "epoch": 102} {"train_loss": -4.390794277191162, "global_step": 4301, "epoch": 102} {"train_loss": -4.451043128967285, "global_step": 4302, "epoch": 102} {"train_loss": -4.412495136260986, "global_step": 4303, "epoch": 102} {"train_loss": -4.538887977600098, "global_step": 4304, "epoch": 102} {"train_loss": -4.333285808563232, "global_step": 4305, "epoch": 102} {"train_loss": -4.363585472106934, "global_step": 4306, "epoch": 102} {"train_loss": -4.262955665588379, "global_step": 4307, "epoch": 102} {"train_loss": -4.4019927978515625, "global_step": 4308, "epoch": 102} {"train_loss": -4.386056900024414, "global_step": 4309, "epoch": 102} {"train_loss": -4.2682576179504395, "global_step": 4310, "epoch": 102} {"train_loss": -4.251978397369385, "global_step": 4311, "epoch": 102} {"train_loss": -4.382262229919434, "global_step": 4312, "epoch": 102} {"train_loss": -4.426544189453125, "global_step": 4313, "epoch": 102} {"train_loss": -4.250080585479736, "global_step": 4314, "epoch": 102} {"train_loss": -4.084822177886963, "global_step": 4315, "epoch": 102} {"train_loss": -4.332417011260986, "global_step": 4316, "epoch": 102} {"train_loss": -3.992147445678711, "global_step": 4317, "epoch": 102} {"train_loss": -4.135697841644287, "global_step": 4318, "epoch": 102} {"train_loss": -4.412097454071045, "global_step": 4319, "epoch": 102} {"train_loss": -4.1662211418151855, "global_step": 4320, "epoch": 102} {"train_loss": -4.475639343261719, "global_step": 4321, "epoch": 102} {"train_loss": -4.160555839538574, "global_step": 4322, "epoch": 102} {"train_loss": -4.520565986633301, "global_step": 4323, "epoch": 102} {"train_loss": -4.281479835510254, "global_step": 4324, "epoch": 102} {"train_loss": -4.296572560355777, "global_step": 4325, "epoch": 102, "val_loss": 102396.8359375} {"train_loss": -4.313303470611572, "global_step": 4326, "epoch": 103} {"train_loss": -4.351380348205566, "global_step": 4327, "epoch": 103} {"train_loss": -4.234921455383301, "global_step": 4328, "epoch": 103} {"train_loss": -4.423140525817871, "global_step": 4329, "epoch": 103} {"train_loss": -4.2584638595581055, "global_step": 4330, "epoch": 103} {"train_loss": -4.346408843994141, "global_step": 4331, "epoch": 103} {"train_loss": -4.399864196777344, "global_step": 4332, "epoch": 103} {"train_loss": -4.476316452026367, "global_step": 4333, "epoch": 103} {"train_loss": -4.4477338790893555, "global_step": 4334, "epoch": 103} {"train_loss": -4.452033996582031, "global_step": 4335, "epoch": 103} {"train_loss": -4.477477073669434, "global_step": 4336, "epoch": 103} {"train_loss": -4.4718427658081055, "global_step": 4337, "epoch": 103} {"train_loss": -4.515401840209961, "global_step": 4338, "epoch": 103} {"train_loss": -4.343846797943115, "global_step": 4339, "epoch": 103} {"train_loss": -4.457039833068848, "global_step": 4340, "epoch": 103} {"train_loss": -4.445505142211914, "global_step": 4341, "epoch": 103} {"train_loss": -4.453639030456543, "global_step": 4342, "epoch": 103} {"train_loss": -4.279850482940674, "global_step": 4343, "epoch": 103} {"train_loss": -4.162034034729004, "global_step": 4344, "epoch": 103} {"train_loss": -4.369809150695801, "global_step": 4345, "epoch": 103} {"train_loss": -4.390487194061279, "global_step": 4346, "epoch": 103} {"train_loss": -4.404718399047852, "global_step": 4347, "epoch": 103} {"train_loss": -4.405852317810059, "global_step": 4348, "epoch": 103} {"train_loss": -4.395566463470459, "global_step": 4349, "epoch": 103} {"train_loss": -4.500002384185791, "global_step": 4350, "epoch": 103} {"train_loss": -4.489813327789307, "global_step": 4351, "epoch": 103} {"train_loss": -4.456918716430664, "global_step": 4352, "epoch": 103} {"train_loss": -4.602260589599609, "global_step": 4353, "epoch": 103} {"train_loss": -4.47611141204834, "global_step": 4354, "epoch": 103} {"train_loss": -4.30687141418457, "global_step": 4355, "epoch": 103} {"train_loss": -4.330533027648926, "global_step": 4356, "epoch": 103} {"train_loss": -4.47435998916626, "global_step": 4357, "epoch": 103} {"train_loss": -4.32558536529541, "global_step": 4358, "epoch": 103} {"train_loss": -4.323824882507324, "global_step": 4359, "epoch": 103} {"train_loss": -4.398222923278809, "global_step": 4360, "epoch": 103} {"train_loss": -4.337403774261475, "global_step": 4361, "epoch": 103} {"train_loss": -4.392742156982422, "global_step": 4362, "epoch": 103} {"train_loss": -4.513470649719238, "global_step": 4363, "epoch": 103} {"train_loss": -4.324551582336426, "global_step": 4364, "epoch": 103} {"train_loss": -4.522700786590576, "global_step": 4365, "epoch": 103} {"train_loss": -4.325131416320801, "global_step": 4366, "epoch": 103} {"train_loss": -4.400213911419823, "global_step": 4367, "epoch": 103, "val_loss": 100910.859375} {"train_loss": -4.424874305725098, "global_step": 4368, "epoch": 104} {"train_loss": -4.392755508422852, "global_step": 4369, "epoch": 104} {"train_loss": -4.417875289916992, "global_step": 4370, "epoch": 104} {"train_loss": -4.478583812713623, "global_step": 4371, "epoch": 104} {"train_loss": -4.329449653625488, "global_step": 4372, "epoch": 104} {"train_loss": -4.14759635925293, "global_step": 4373, "epoch": 104} {"train_loss": -4.527848243713379, "global_step": 4374, "epoch": 104} {"train_loss": -4.396234512329102, "global_step": 4375, "epoch": 104} {"train_loss": -4.30355978012085, "global_step": 4376, "epoch": 104} {"train_loss": -4.5115556716918945, "global_step": 4377, "epoch": 104} {"train_loss": -4.48049783706665, "global_step": 4378, "epoch": 104} {"train_loss": -4.40812873840332, "global_step": 4379, "epoch": 104} {"train_loss": -4.54763650894165, "global_step": 4380, "epoch": 104} {"train_loss": -4.3959856033325195, "global_step": 4381, "epoch": 104} {"train_loss": -4.287355422973633, "global_step": 4382, "epoch": 104} {"train_loss": -4.512764930725098, "global_step": 4383, "epoch": 104} {"train_loss": -4.479647159576416, "global_step": 4384, "epoch": 104} {"train_loss": -4.523625373840332, "global_step": 4385, "epoch": 104} {"train_loss": -4.309070110321045, "global_step": 4386, "epoch": 104} {"train_loss": -4.4714202880859375, "global_step": 4387, "epoch": 104} {"train_loss": -4.42352294921875, "global_step": 4388, "epoch": 104} {"train_loss": -4.489134788513184, "global_step": 4389, "epoch": 104} {"train_loss": -4.320087909698486, "global_step": 4390, "epoch": 104} {"train_loss": -4.3355817794799805, "global_step": 4391, "epoch": 104} {"train_loss": -4.297463417053223, "global_step": 4392, "epoch": 104} {"train_loss": -4.485056400299072, "global_step": 4393, "epoch": 104} {"train_loss": -4.507994651794434, "global_step": 4394, "epoch": 104} {"train_loss": -4.485709190368652, "global_step": 4395, "epoch": 104} {"train_loss": -4.424434661865234, "global_step": 4396, "epoch": 104} {"train_loss": -4.496140480041504, "global_step": 4397, "epoch": 104} {"train_loss": -4.448878765106201, "global_step": 4398, "epoch": 104} {"train_loss": -4.400495529174805, "global_step": 4399, "epoch": 104} {"train_loss": -4.441858291625977, "global_step": 4400, "epoch": 104} {"train_loss": -4.400406837463379, "global_step": 4401, "epoch": 104} {"train_loss": -4.624117374420166, "global_step": 4402, "epoch": 104} {"train_loss": -4.6316680908203125, "global_step": 4403, "epoch": 104} {"train_loss": -4.475241184234619, "global_step": 4404, "epoch": 104} {"train_loss": -4.545825481414795, "global_step": 4405, "epoch": 104} {"train_loss": -4.514748573303223, "global_step": 4406, "epoch": 104} {"train_loss": -4.405231475830078, "global_step": 4407, "epoch": 104} {"train_loss": -4.310810089111328, "global_step": 4408, "epoch": 104} {"train_loss": -4.439488365536644, "global_step": 4409, "epoch": 104, "val_loss": 101531.78125} {"train_loss": -4.41489839553833, "global_step": 4410, "epoch": 105} {"train_loss": -4.394721031188965, "global_step": 4411, "epoch": 105} {"train_loss": -4.433131217956543, "global_step": 4412, "epoch": 105} {"train_loss": -4.414164066314697, "global_step": 4413, "epoch": 105} {"train_loss": -4.565228462219238, "global_step": 4414, "epoch": 105} {"train_loss": -4.366408348083496, "global_step": 4415, "epoch": 105} {"train_loss": -4.346386909484863, "global_step": 4416, "epoch": 105} {"train_loss": -4.433513641357422, "global_step": 4417, "epoch": 105} {"train_loss": -4.494258880615234, "global_step": 4418, "epoch": 105} {"train_loss": -4.290610313415527, "global_step": 4419, "epoch": 105} {"train_loss": -4.189452171325684, "global_step": 4420, "epoch": 105} {"train_loss": -4.558793067932129, "global_step": 4421, "epoch": 105} {"train_loss": -4.416886329650879, "global_step": 4422, "epoch": 105} {"train_loss": -4.429553985595703, "global_step": 4423, "epoch": 105} {"train_loss": -4.509375095367432, "global_step": 4424, "epoch": 105} {"train_loss": -4.523638725280762, "global_step": 4425, "epoch": 105} {"train_loss": -4.486427307128906, "global_step": 4426, "epoch": 105} {"train_loss": -4.30553674697876, "global_step": 4427, "epoch": 105} {"train_loss": -4.537137985229492, "global_step": 4428, "epoch": 105} {"train_loss": -4.321181297302246, "global_step": 4429, "epoch": 105} {"train_loss": -4.550753593444824, "global_step": 4430, "epoch": 105} {"train_loss": -4.50925350189209, "global_step": 4431, "epoch": 105} {"train_loss": -4.360348701477051, "global_step": 4432, "epoch": 105} {"train_loss": -4.423732280731201, "global_step": 4433, "epoch": 105} {"train_loss": -4.520114898681641, "global_step": 4434, "epoch": 105} {"train_loss": -4.431350231170654, "global_step": 4435, "epoch": 105} {"train_loss": -4.579995155334473, "global_step": 4436, "epoch": 105} {"train_loss": -4.577475070953369, "global_step": 4437, "epoch": 105} {"train_loss": -4.402859687805176, "global_step": 4438, "epoch": 105} {"train_loss": -4.436222553253174, "global_step": 4439, "epoch": 105} {"train_loss": -4.53681755065918, "global_step": 4440, "epoch": 105} {"train_loss": -4.4717793464660645, "global_step": 4441, "epoch": 105} {"train_loss": -4.572397232055664, "global_step": 4442, "epoch": 105} {"train_loss": -4.600945949554443, "global_step": 4443, "epoch": 105} {"train_loss": -4.358409881591797, "global_step": 4444, "epoch": 105} {"train_loss": -4.410526275634766, "global_step": 4445, "epoch": 105} {"train_loss": -4.430153846740723, "global_step": 4446, "epoch": 105} {"train_loss": -4.382010459899902, "global_step": 4447, "epoch": 105} {"train_loss": -4.525084495544434, "global_step": 4448, "epoch": 105} {"train_loss": -4.5012383460998535, "global_step": 4449, "epoch": 105} {"train_loss": -4.581066131591797, "global_step": 4450, "epoch": 105} {"train_loss": -4.449099324998402, "global_step": 4451, "epoch": 105, "val_loss": 100646.7109375} {"train_loss": -4.313213348388672, "global_step": 4452, "epoch": 106} {"train_loss": -4.50870418548584, "global_step": 4453, "epoch": 106} {"train_loss": -4.436278343200684, "global_step": 4454, "epoch": 106} {"train_loss": -4.477654457092285, "global_step": 4455, "epoch": 106} {"train_loss": -4.4271240234375, "global_step": 4456, "epoch": 106} {"train_loss": -4.5709052085876465, "global_step": 4457, "epoch": 106} {"train_loss": -4.59736967086792, "global_step": 4458, "epoch": 106} {"train_loss": -4.640435218811035, "global_step": 4459, "epoch": 106} {"train_loss": -4.5868377685546875, "global_step": 4460, "epoch": 106} {"train_loss": -4.6047515869140625, "global_step": 4461, "epoch": 106} {"train_loss": -4.484709739685059, "global_step": 4462, "epoch": 106} {"train_loss": -4.495354175567627, "global_step": 4463, "epoch": 106} {"train_loss": -4.683591842651367, "global_step": 4464, "epoch": 106} {"train_loss": -4.547501564025879, "global_step": 4465, "epoch": 106} {"train_loss": -4.447649002075195, "global_step": 4466, "epoch": 106} {"train_loss": -4.47155237197876, "global_step": 4467, "epoch": 106} {"train_loss": -4.532136917114258, "global_step": 4468, "epoch": 106} {"train_loss": -4.533440589904785, "global_step": 4469, "epoch": 106} {"train_loss": -4.528013706207275, "global_step": 4470, "epoch": 106} {"train_loss": -4.361843109130859, "global_step": 4471, "epoch": 106} {"train_loss": -4.1746978759765625, "global_step": 4472, "epoch": 106} {"train_loss": -4.5844597816467285, "global_step": 4473, "epoch": 106} {"train_loss": -4.461912631988525, "global_step": 4474, "epoch": 106} {"train_loss": -4.296693325042725, "global_step": 4475, "epoch": 106} {"train_loss": -4.31120491027832, "global_step": 4476, "epoch": 106} {"train_loss": -4.232356071472168, "global_step": 4477, "epoch": 106} {"train_loss": -4.501102447509766, "global_step": 4478, "epoch": 106} {"train_loss": -4.412630081176758, "global_step": 4479, "epoch": 106} {"train_loss": -4.430727958679199, "global_step": 4480, "epoch": 106} {"train_loss": -4.600260257720947, "global_step": 4481, "epoch": 106} {"train_loss": -4.57215690612793, "global_step": 4482, "epoch": 106} {"train_loss": -4.287898063659668, "global_step": 4483, "epoch": 106} {"train_loss": -4.5391011238098145, "global_step": 4484, "epoch": 106} {"train_loss": -4.439120292663574, "global_step": 4485, "epoch": 106} {"train_loss": -4.269466876983643, "global_step": 4486, "epoch": 106} {"train_loss": -4.4678955078125, "global_step": 4487, "epoch": 106} {"train_loss": -4.40593147277832, "global_step": 4488, "epoch": 106} {"train_loss": -4.439457893371582, "global_step": 4489, "epoch": 106} {"train_loss": -4.53256893157959, "global_step": 4490, "epoch": 106} {"train_loss": -4.330041885375977, "global_step": 4491, "epoch": 106} {"train_loss": -4.354072570800781, "global_step": 4492, "epoch": 106} {"train_loss": -4.463229974110921, "global_step": 4493, "epoch": 106, "val_loss": 101655.4140625} {"train_loss": -4.423089981079102, "global_step": 4494, "epoch": 107} {"train_loss": -4.430614948272705, "global_step": 4495, "epoch": 107} {"train_loss": -4.457422256469727, "global_step": 4496, "epoch": 107} {"train_loss": -4.592082500457764, "global_step": 4497, "epoch": 107} {"train_loss": -4.616016387939453, "global_step": 4498, "epoch": 107} {"train_loss": -4.491438865661621, "global_step": 4499, "epoch": 107} {"train_loss": -4.606897354125977, "global_step": 4500, "epoch": 107} {"train_loss": -4.504807949066162, "global_step": 4501, "epoch": 107} {"train_loss": -4.426360607147217, "global_step": 4502, "epoch": 107} {"train_loss": -4.449702262878418, "global_step": 4503, "epoch": 107} {"train_loss": -4.590290069580078, "global_step": 4504, "epoch": 107} {"train_loss": -4.503374099731445, "global_step": 4505, "epoch": 107} {"train_loss": -4.515642166137695, "global_step": 4506, "epoch": 107} {"train_loss": -4.387610912322998, "global_step": 4507, "epoch": 107} {"train_loss": -4.54497766494751, "global_step": 4508, "epoch": 107} {"train_loss": -4.331501007080078, "global_step": 4509, "epoch": 107} {"train_loss": -4.416053771972656, "global_step": 4510, "epoch": 107} {"train_loss": -4.364455223083496, "global_step": 4511, "epoch": 107} {"train_loss": -4.453332901000977, "global_step": 4512, "epoch": 107} {"train_loss": -4.2980122566223145, "global_step": 4513, "epoch": 107} {"train_loss": -4.295060634613037, "global_step": 4514, "epoch": 107} {"train_loss": -4.4477949142456055, "global_step": 4515, "epoch": 107} {"train_loss": -4.244452476501465, "global_step": 4516, "epoch": 107} {"train_loss": -4.51814079284668, "global_step": 4517, "epoch": 107} {"train_loss": -4.429272651672363, "global_step": 4518, "epoch": 107} {"train_loss": -4.27656364440918, "global_step": 4519, "epoch": 107} {"train_loss": -4.429505348205566, "global_step": 4520, "epoch": 107} {"train_loss": -4.423213958740234, "global_step": 4521, "epoch": 107} {"train_loss": -4.211545467376709, "global_step": 4522, "epoch": 107} {"train_loss": -4.43218469619751, "global_step": 4523, "epoch": 107} {"train_loss": -4.521842956542969, "global_step": 4524, "epoch": 107} {"train_loss": -4.3615031242370605, "global_step": 4525, "epoch": 107} {"train_loss": -4.3511552810668945, "global_step": 4526, "epoch": 107} {"train_loss": -4.592899322509766, "global_step": 4527, "epoch": 107} {"train_loss": -4.5491533279418945, "global_step": 4528, "epoch": 107} {"train_loss": -4.48731803894043, "global_step": 4529, "epoch": 107} {"train_loss": -4.465773582458496, "global_step": 4530, "epoch": 107} {"train_loss": -4.456937789916992, "global_step": 4531, "epoch": 107} {"train_loss": -4.555607795715332, "global_step": 4532, "epoch": 107} {"train_loss": -4.550753116607666, "global_step": 4533, "epoch": 107} {"train_loss": -4.400357246398926, "global_step": 4534, "epoch": 107} {"train_loss": -4.452405838739304, "global_step": 4535, "epoch": 107, "val_loss": 97664.7890625} {"train_loss": -4.592175006866455, "global_step": 4536, "epoch": 108} {"train_loss": -4.311896324157715, "global_step": 4537, "epoch": 108} {"train_loss": -4.547975540161133, "global_step": 4538, "epoch": 108} {"train_loss": -4.5105814933776855, "global_step": 4539, "epoch": 108} {"train_loss": -4.464887619018555, "global_step": 4540, "epoch": 108} {"train_loss": -4.639723777770996, "global_step": 4541, "epoch": 108} {"train_loss": -4.483731269836426, "global_step": 4542, "epoch": 108} {"train_loss": -4.420635223388672, "global_step": 4543, "epoch": 108} {"train_loss": -4.561585426330566, "global_step": 4544, "epoch": 108} {"train_loss": -4.555599689483643, "global_step": 4545, "epoch": 108} {"train_loss": -4.566186904907227, "global_step": 4546, "epoch": 108} {"train_loss": -4.569687843322754, "global_step": 4547, "epoch": 108} {"train_loss": -4.497359275817871, "global_step": 4548, "epoch": 108} {"train_loss": -4.577874183654785, "global_step": 4549, "epoch": 108} {"train_loss": -4.458694934844971, "global_step": 4550, "epoch": 108} {"train_loss": -4.490223407745361, "global_step": 4551, "epoch": 108} {"train_loss": -4.3558268547058105, "global_step": 4552, "epoch": 108} {"train_loss": -4.40207052230835, "global_step": 4553, "epoch": 108} {"train_loss": -4.506142616271973, "global_step": 4554, "epoch": 108} {"train_loss": -4.402682304382324, "global_step": 4555, "epoch": 108} {"train_loss": -4.342893600463867, "global_step": 4556, "epoch": 108} {"train_loss": -4.449325084686279, "global_step": 4557, "epoch": 108} {"train_loss": -4.452691555023193, "global_step": 4558, "epoch": 108} {"train_loss": -4.633014678955078, "global_step": 4559, "epoch": 108} {"train_loss": -4.403693675994873, "global_step": 4560, "epoch": 108} {"train_loss": -4.455238342285156, "global_step": 4561, "epoch": 108} {"train_loss": -4.464042663574219, "global_step": 4562, "epoch": 108} {"train_loss": -4.52538537979126, "global_step": 4563, "epoch": 108} {"train_loss": -4.549725532531738, "global_step": 4564, "epoch": 108} {"train_loss": -4.676224708557129, "global_step": 4565, "epoch": 108} {"train_loss": -4.408734321594238, "global_step": 4566, "epoch": 108} {"train_loss": -4.586809158325195, "global_step": 4567, "epoch": 108} {"train_loss": -4.633963584899902, "global_step": 4568, "epoch": 108} {"train_loss": -4.498215675354004, "global_step": 4569, "epoch": 108} {"train_loss": -4.442394256591797, "global_step": 4570, "epoch": 108} {"train_loss": -4.587937355041504, "global_step": 4571, "epoch": 108} {"train_loss": -4.506773948669434, "global_step": 4572, "epoch": 108} {"train_loss": -4.339370250701904, "global_step": 4573, "epoch": 108} {"train_loss": -4.557272434234619, "global_step": 4574, "epoch": 108} {"train_loss": -4.603310585021973, "global_step": 4575, "epoch": 108} {"train_loss": -4.402294158935547, "global_step": 4576, "epoch": 108} {"train_loss": -4.495210057213193, "global_step": 4577, "epoch": 108, "val_loss": 97219.3203125} {"train_loss": -4.632640361785889, "global_step": 4578, "epoch": 109} {"train_loss": -4.3709869384765625, "global_step": 4579, "epoch": 109} {"train_loss": -4.3359880447387695, "global_step": 4580, "epoch": 109} {"train_loss": -4.421413421630859, "global_step": 4581, "epoch": 109} {"train_loss": -4.397818565368652, "global_step": 4582, "epoch": 109} {"train_loss": -4.317102432250977, "global_step": 4583, "epoch": 109} {"train_loss": -4.548460960388184, "global_step": 4584, "epoch": 109} {"train_loss": -4.471750259399414, "global_step": 4585, "epoch": 109} {"train_loss": -4.344326972961426, "global_step": 4586, "epoch": 109} {"train_loss": -4.2577805519104, "global_step": 4587, "epoch": 109} {"train_loss": -4.235856056213379, "global_step": 4588, "epoch": 109} {"train_loss": -4.575582981109619, "global_step": 4589, "epoch": 109} {"train_loss": -4.182017803192139, "global_step": 4590, "epoch": 109} {"train_loss": -4.302391052246094, "global_step": 4591, "epoch": 109} {"train_loss": -4.447580814361572, "global_step": 4592, "epoch": 109} {"train_loss": -4.456242084503174, "global_step": 4593, "epoch": 109} {"train_loss": -4.230203628540039, "global_step": 4594, "epoch": 109} {"train_loss": -4.531069278717041, "global_step": 4595, "epoch": 109} {"train_loss": -4.362898826599121, "global_step": 4596, "epoch": 109} {"train_loss": -4.361485481262207, "global_step": 4597, "epoch": 109} {"train_loss": -4.390814781188965, "global_step": 4598, "epoch": 109} {"train_loss": -4.348267078399658, "global_step": 4599, "epoch": 109} {"train_loss": -4.453598976135254, "global_step": 4600, "epoch": 109} {"train_loss": -4.406817436218262, "global_step": 4601, "epoch": 109} {"train_loss": -4.405943870544434, "global_step": 4602, "epoch": 109} {"train_loss": -4.425816059112549, "global_step": 4603, "epoch": 109} {"train_loss": -4.532844543457031, "global_step": 4604, "epoch": 109} {"train_loss": -4.531801223754883, "global_step": 4605, "epoch": 109} {"train_loss": -4.538424491882324, "global_step": 4606, "epoch": 109} {"train_loss": -4.58029842376709, "global_step": 4607, "epoch": 109} {"train_loss": -4.484469890594482, "global_step": 4608, "epoch": 109} {"train_loss": -4.541010856628418, "global_step": 4609, "epoch": 109} {"train_loss": -4.531214237213135, "global_step": 4610, "epoch": 109} {"train_loss": -4.430924415588379, "global_step": 4611, "epoch": 109} {"train_loss": -4.50080680847168, "global_step": 4612, "epoch": 109} {"train_loss": -4.547309875488281, "global_step": 4613, "epoch": 109} {"train_loss": -4.457040786743164, "global_step": 4614, "epoch": 109} {"train_loss": -4.539350509643555, "global_step": 4615, "epoch": 109} {"train_loss": -4.51528263092041, "global_step": 4616, "epoch": 109} {"train_loss": -4.635692119598389, "global_step": 4617, "epoch": 109} {"train_loss": -4.682274341583252, "global_step": 4618, "epoch": 109} {"train_loss": -4.452480225335984, "global_step": 4619, "epoch": 109, "val_loss": 96771.609375} {"train_loss": -4.408090114593506, "global_step": 4620, "epoch": 110} {"train_loss": -4.54212760925293, "global_step": 4621, "epoch": 110} {"train_loss": -4.588481903076172, "global_step": 4622, "epoch": 110} {"train_loss": -4.4763641357421875, "global_step": 4623, "epoch": 110} {"train_loss": -4.5179548263549805, "global_step": 4624, "epoch": 110} {"train_loss": -4.663790225982666, "global_step": 4625, "epoch": 110} {"train_loss": -4.584978103637695, "global_step": 4626, "epoch": 110} {"train_loss": -4.514028549194336, "global_step": 4627, "epoch": 110} {"train_loss": -4.636348247528076, "global_step": 4628, "epoch": 110} {"train_loss": -4.515298366546631, "global_step": 4629, "epoch": 110} {"train_loss": -4.4751482009887695, "global_step": 4630, "epoch": 110} {"train_loss": -4.507747173309326, "global_step": 4631, "epoch": 110} {"train_loss": -4.459010601043701, "global_step": 4632, "epoch": 110} {"train_loss": -4.205441951751709, "global_step": 4633, "epoch": 110} {"train_loss": -4.572857856750488, "global_step": 4634, "epoch": 110} {"train_loss": -4.401384353637695, "global_step": 4635, "epoch": 110} {"train_loss": -4.1841511726379395, "global_step": 4636, "epoch": 110} {"train_loss": -4.428757190704346, "global_step": 4637, "epoch": 110} {"train_loss": -4.401878356933594, "global_step": 4638, "epoch": 110} {"train_loss": -4.209280490875244, "global_step": 4639, "epoch": 110} {"train_loss": -4.494495868682861, "global_step": 4640, "epoch": 110} {"train_loss": -4.376458168029785, "global_step": 4641, "epoch": 110} {"train_loss": -4.4732208251953125, "global_step": 4642, "epoch": 110} {"train_loss": -4.3952226638793945, "global_step": 4643, "epoch": 110} {"train_loss": -4.556451320648193, "global_step": 4644, "epoch": 110} {"train_loss": -4.40107536315918, "global_step": 4645, "epoch": 110} {"train_loss": -4.628087520599365, "global_step": 4646, "epoch": 110} {"train_loss": -4.476822853088379, "global_step": 4647, "epoch": 110} {"train_loss": -4.586645603179932, "global_step": 4648, "epoch": 110} {"train_loss": -4.598775386810303, "global_step": 4649, "epoch": 110} {"train_loss": -4.538694381713867, "global_step": 4650, "epoch": 110} {"train_loss": -4.589540481567383, "global_step": 4651, "epoch": 110} {"train_loss": -4.483402729034424, "global_step": 4652, "epoch": 110} {"train_loss": -4.52005672454834, "global_step": 4653, "epoch": 110} {"train_loss": -4.5679931640625, "global_step": 4654, "epoch": 110} {"train_loss": -4.517796039581299, "global_step": 4655, "epoch": 110} {"train_loss": -4.652695178985596, "global_step": 4656, "epoch": 110} {"train_loss": -4.569235801696777, "global_step": 4657, "epoch": 110} {"train_loss": -4.637578010559082, "global_step": 4658, "epoch": 110} {"train_loss": -4.567866325378418, "global_step": 4659, "epoch": 110} {"train_loss": -4.486404895782471, "global_step": 4660, "epoch": 110} {"train_loss": -4.499885422842843, "global_step": 4661, "epoch": 110, "val_loss": 97163.515625} {"train_loss": -4.569916248321533, "global_step": 4662, "epoch": 111} {"train_loss": -4.475472927093506, "global_step": 4663, "epoch": 111} {"train_loss": -4.536690711975098, "global_step": 4664, "epoch": 111} {"train_loss": -4.526793956756592, "global_step": 4665, "epoch": 111} {"train_loss": -4.643550872802734, "global_step": 4666, "epoch": 111} {"train_loss": -4.536655426025391, "global_step": 4667, "epoch": 111} {"train_loss": -4.606280326843262, "global_step": 4668, "epoch": 111} {"train_loss": -4.639266014099121, "global_step": 4669, "epoch": 111} {"train_loss": -4.597685813903809, "global_step": 4670, "epoch": 111} {"train_loss": -4.499050140380859, "global_step": 4671, "epoch": 111} {"train_loss": -4.363779544830322, "global_step": 4672, "epoch": 111} {"train_loss": -4.626983642578125, "global_step": 4673, "epoch": 111} {"train_loss": -4.772066593170166, "global_step": 4674, "epoch": 111} {"train_loss": -4.485168933868408, "global_step": 4675, "epoch": 111} {"train_loss": -4.555474281311035, "global_step": 4676, "epoch": 111} {"train_loss": -4.604454517364502, "global_step": 4677, "epoch": 111} {"train_loss": -4.669246673583984, "global_step": 4678, "epoch": 111} {"train_loss": -4.600153923034668, "global_step": 4679, "epoch": 111} {"train_loss": -4.405452728271484, "global_step": 4680, "epoch": 111} {"train_loss": -4.417573928833008, "global_step": 4681, "epoch": 111} {"train_loss": -4.511301040649414, "global_step": 4682, "epoch": 111} {"train_loss": -4.486313819885254, "global_step": 4683, "epoch": 111} {"train_loss": -4.337216377258301, "global_step": 4684, "epoch": 111} {"train_loss": -4.523815155029297, "global_step": 4685, "epoch": 111} {"train_loss": -4.421807289123535, "global_step": 4686, "epoch": 111} {"train_loss": -4.538919448852539, "global_step": 4687, "epoch": 111} {"train_loss": -4.478519439697266, "global_step": 4688, "epoch": 111} {"train_loss": -4.4895243644714355, "global_step": 4689, "epoch": 111} {"train_loss": -4.703289985656738, "global_step": 4690, "epoch": 111} {"train_loss": -4.443678855895996, "global_step": 4691, "epoch": 111} {"train_loss": -4.328855991363525, "global_step": 4692, "epoch": 111} {"train_loss": -4.476378440856934, "global_step": 4693, "epoch": 111} {"train_loss": -4.495826721191406, "global_step": 4694, "epoch": 111} {"train_loss": -4.296147346496582, "global_step": 4695, "epoch": 111} {"train_loss": -4.292778491973877, "global_step": 4696, "epoch": 111} {"train_loss": -4.550219535827637, "global_step": 4697, "epoch": 111} {"train_loss": -4.212604522705078, "global_step": 4698, "epoch": 111} {"train_loss": -4.522660255432129, "global_step": 4699, "epoch": 111} {"train_loss": -3.9948062896728516, "global_step": 4700, "epoch": 111} {"train_loss": -4.475183963775635, "global_step": 4701, "epoch": 111} {"train_loss": -4.435362815856934, "global_step": 4702, "epoch": 111} {"train_loss": -4.486707426252819, "global_step": 4703, "epoch": 111, "val_loss": 97882.2890625} {"train_loss": -4.323884963989258, "global_step": 4704, "epoch": 112} {"train_loss": -4.091639518737793, "global_step": 4705, "epoch": 112} {"train_loss": -4.510204792022705, "global_step": 4706, "epoch": 112} {"train_loss": -4.294741630554199, "global_step": 4707, "epoch": 112} {"train_loss": -4.261828422546387, "global_step": 4708, "epoch": 112} {"train_loss": -4.5529937744140625, "global_step": 4709, "epoch": 112} {"train_loss": -4.163309097290039, "global_step": 4710, "epoch": 112} {"train_loss": -4.458770751953125, "global_step": 4711, "epoch": 112} {"train_loss": -4.388269901275635, "global_step": 4712, "epoch": 112} {"train_loss": -4.4793853759765625, "global_step": 4713, "epoch": 112} {"train_loss": -4.62216854095459, "global_step": 4714, "epoch": 112} {"train_loss": -4.430695533752441, "global_step": 4715, "epoch": 112} {"train_loss": -4.4712910652160645, "global_step": 4716, "epoch": 112} {"train_loss": -4.298332691192627, "global_step": 4717, "epoch": 112} {"train_loss": -4.393017292022705, "global_step": 4718, "epoch": 112} {"train_loss": -4.447723865509033, "global_step": 4719, "epoch": 112} {"train_loss": -4.482235431671143, "global_step": 4720, "epoch": 112} {"train_loss": -4.514669418334961, "global_step": 4721, "epoch": 112} {"train_loss": -4.526869773864746, "global_step": 4722, "epoch": 112} {"train_loss": -4.469361782073975, "global_step": 4723, "epoch": 112} {"train_loss": -4.5077691078186035, "global_step": 4724, "epoch": 112} {"train_loss": -4.500539779663086, "global_step": 4725, "epoch": 112} {"train_loss": -4.586499214172363, "global_step": 4726, "epoch": 112} {"train_loss": -4.483933448791504, "global_step": 4727, "epoch": 112} {"train_loss": -4.538911819458008, "global_step": 4728, "epoch": 112} {"train_loss": -4.646581172943115, "global_step": 4729, "epoch": 112} {"train_loss": -4.460728645324707, "global_step": 4730, "epoch": 112} {"train_loss": -4.689142227172852, "global_step": 4731, "epoch": 112} {"train_loss": -4.59291934967041, "global_step": 4732, "epoch": 112} {"train_loss": -4.591784954071045, "global_step": 4733, "epoch": 112} {"train_loss": -4.644375801086426, "global_step": 4734, "epoch": 112} {"train_loss": -4.605867385864258, "global_step": 4735, "epoch": 112} {"train_loss": -4.583233833312988, "global_step": 4736, "epoch": 112} {"train_loss": -4.602481365203857, "global_step": 4737, "epoch": 112} {"train_loss": -4.418752670288086, "global_step": 4738, "epoch": 112} {"train_loss": -4.4342360496521, "global_step": 4739, "epoch": 112} {"train_loss": -4.197359085083008, "global_step": 4740, "epoch": 112} {"train_loss": -4.36899471282959, "global_step": 4741, "epoch": 112} {"train_loss": -4.310785293579102, "global_step": 4742, "epoch": 112} {"train_loss": -4.202674388885498, "global_step": 4743, "epoch": 112} {"train_loss": -4.437087535858154, "global_step": 4744, "epoch": 112} {"train_loss": -4.452012641089303, "global_step": 4745, "epoch": 112, "val_loss": 98928.765625} {"train_loss": -4.127904891967773, "global_step": 4746, "epoch": 113} {"train_loss": -4.6769795417785645, "global_step": 4747, "epoch": 113} {"train_loss": -4.240683555603027, "global_step": 4748, "epoch": 113} {"train_loss": -4.419846057891846, "global_step": 4749, "epoch": 113} {"train_loss": -4.563459873199463, "global_step": 4750, "epoch": 113} {"train_loss": -4.48319149017334, "global_step": 4751, "epoch": 113} {"train_loss": -4.50821590423584, "global_step": 4752, "epoch": 113} {"train_loss": -4.365803241729736, "global_step": 4753, "epoch": 113} {"train_loss": -4.573744297027588, "global_step": 4754, "epoch": 113} {"train_loss": -4.535133361816406, "global_step": 4755, "epoch": 113} {"train_loss": -4.403892517089844, "global_step": 4756, "epoch": 113} {"train_loss": -4.552896499633789, "global_step": 4757, "epoch": 113} {"train_loss": -4.470349311828613, "global_step": 4758, "epoch": 113} {"train_loss": -4.542007923126221, "global_step": 4759, "epoch": 113} {"train_loss": -4.475235462188721, "global_step": 4760, "epoch": 113} {"train_loss": -4.656559944152832, "global_step": 4761, "epoch": 113} {"train_loss": -4.430902004241943, "global_step": 4762, "epoch": 113} {"train_loss": -4.578985691070557, "global_step": 4763, "epoch": 113} {"train_loss": -4.465645790100098, "global_step": 4764, "epoch": 113} {"train_loss": -4.632381439208984, "global_step": 4765, "epoch": 113} {"train_loss": -4.534028053283691, "global_step": 4766, "epoch": 113} {"train_loss": -4.581747055053711, "global_step": 4767, "epoch": 113} {"train_loss": -4.6564531326293945, "global_step": 4768, "epoch": 113} {"train_loss": -4.565373420715332, "global_step": 4769, "epoch": 113} {"train_loss": -4.572680950164795, "global_step": 4770, "epoch": 113} {"train_loss": -4.525228500366211, "global_step": 4771, "epoch": 113} {"train_loss": -4.578165054321289, "global_step": 4772, "epoch": 113} {"train_loss": -4.4870781898498535, "global_step": 4773, "epoch": 113} {"train_loss": -4.630847930908203, "global_step": 4774, "epoch": 113} {"train_loss": -4.4653215408325195, "global_step": 4775, "epoch": 113} {"train_loss": -4.436896324157715, "global_step": 4776, "epoch": 113} {"train_loss": -4.632340431213379, "global_step": 4777, "epoch": 113} {"train_loss": -4.618664264678955, "global_step": 4778, "epoch": 113} {"train_loss": -4.6330132484436035, "global_step": 4779, "epoch": 113} {"train_loss": -4.812819957733154, "global_step": 4780, "epoch": 113} {"train_loss": -4.574030876159668, "global_step": 4781, "epoch": 113} {"train_loss": -4.4924516677856445, "global_step": 4782, "epoch": 113} {"train_loss": -4.405342102050781, "global_step": 4783, "epoch": 113} {"train_loss": -4.525142669677734, "global_step": 4784, "epoch": 113} {"train_loss": -4.579397201538086, "global_step": 4785, "epoch": 113} {"train_loss": -4.602563858032227, "global_step": 4786, "epoch": 113} {"train_loss": -4.527939864567348, "global_step": 4787, "epoch": 113, "val_loss": 95272.2890625} {"train_loss": -4.630377292633057, "global_step": 4788, "epoch": 114} {"train_loss": -4.448574066162109, "global_step": 4789, "epoch": 114} {"train_loss": -4.509831428527832, "global_step": 4790, "epoch": 114} {"train_loss": -4.510021209716797, "global_step": 4791, "epoch": 114} {"train_loss": -4.455193519592285, "global_step": 4792, "epoch": 114} {"train_loss": -4.514167785644531, "global_step": 4793, "epoch": 114} {"train_loss": -4.586933135986328, "global_step": 4794, "epoch": 114} {"train_loss": -4.390664100646973, "global_step": 4795, "epoch": 114} {"train_loss": -4.478559494018555, "global_step": 4796, "epoch": 114} {"train_loss": -4.320855617523193, "global_step": 4797, "epoch": 114} {"train_loss": -4.382576942443848, "global_step": 4798, "epoch": 114} {"train_loss": -3.922846794128418, "global_step": 4799, "epoch": 114} {"train_loss": -4.234556674957275, "global_step": 4800, "epoch": 114} {"train_loss": -4.326157569885254, "global_step": 4801, "epoch": 114} {"train_loss": -4.220317840576172, "global_step": 4802, "epoch": 114} {"train_loss": -4.343305587768555, "global_step": 4803, "epoch": 114} {"train_loss": -4.12314510345459, "global_step": 4804, "epoch": 114} {"train_loss": -4.419584274291992, "global_step": 4805, "epoch": 114} {"train_loss": -4.417797088623047, "global_step": 4806, "epoch": 114} {"train_loss": -4.388871669769287, "global_step": 4807, "epoch": 114} {"train_loss": -4.390963554382324, "global_step": 4808, "epoch": 114} {"train_loss": -4.359091281890869, "global_step": 4809, "epoch": 114} {"train_loss": -4.42922830581665, "global_step": 4810, "epoch": 114} {"train_loss": -4.457314491271973, "global_step": 4811, "epoch": 114} {"train_loss": -4.413364410400391, "global_step": 4812, "epoch": 114} {"train_loss": -4.489067077636719, "global_step": 4813, "epoch": 114} {"train_loss": -4.463475227355957, "global_step": 4814, "epoch": 114} {"train_loss": -4.326474189758301, "global_step": 4815, "epoch": 114} {"train_loss": -4.514486312866211, "global_step": 4816, "epoch": 114} {"train_loss": -4.371151924133301, "global_step": 4817, "epoch": 114} {"train_loss": -4.519707202911377, "global_step": 4818, "epoch": 114} {"train_loss": -4.4936017990112305, "global_step": 4819, "epoch": 114} {"train_loss": -4.606164932250977, "global_step": 4820, "epoch": 114} {"train_loss": -4.524481296539307, "global_step": 4821, "epoch": 114} {"train_loss": -4.522391319274902, "global_step": 4822, "epoch": 114} {"train_loss": -4.520669460296631, "global_step": 4823, "epoch": 114} {"train_loss": -4.466472148895264, "global_step": 4824, "epoch": 114} {"train_loss": -4.403639793395996, "global_step": 4825, "epoch": 114} {"train_loss": -4.585221767425537, "global_step": 4826, "epoch": 114} {"train_loss": -4.57537841796875, "global_step": 4827, "epoch": 114} {"train_loss": -4.641738414764404, "global_step": 4828, "epoch": 114} {"train_loss": -4.434069588070824, "global_step": 4829, "epoch": 114, "val_loss": 94133.4609375} {"train_loss": -4.5157060623168945, "global_step": 4830, "epoch": 115} {"train_loss": -4.688999176025391, "global_step": 4831, "epoch": 115} {"train_loss": -4.612148284912109, "global_step": 4832, "epoch": 115} {"train_loss": -4.595415115356445, "global_step": 4833, "epoch": 115} {"train_loss": -4.492897987365723, "global_step": 4834, "epoch": 115} {"train_loss": -4.163564682006836, "global_step": 4835, "epoch": 115} {"train_loss": -4.391996383666992, "global_step": 4836, "epoch": 115} {"train_loss": -4.722132682800293, "global_step": 4837, "epoch": 115} {"train_loss": -4.558896064758301, "global_step": 4838, "epoch": 115} {"train_loss": -4.642657279968262, "global_step": 4839, "epoch": 115} {"train_loss": -4.661349296569824, "global_step": 4840, "epoch": 115} {"train_loss": -4.633965492248535, "global_step": 4841, "epoch": 115} {"train_loss": -4.515232086181641, "global_step": 4842, "epoch": 115} {"train_loss": -4.475986480712891, "global_step": 4843, "epoch": 115} {"train_loss": -4.632474899291992, "global_step": 4844, "epoch": 115} {"train_loss": -4.649139881134033, "global_step": 4845, "epoch": 115} {"train_loss": -4.617828369140625, "global_step": 4846, "epoch": 115} {"train_loss": -4.48588752746582, "global_step": 4847, "epoch": 115} {"train_loss": -4.577157020568848, "global_step": 4848, "epoch": 115} {"train_loss": -4.673540115356445, "global_step": 4849, "epoch": 115} {"train_loss": -4.518708229064941, "global_step": 4850, "epoch": 115} {"train_loss": -4.420172691345215, "global_step": 4851, "epoch": 115} {"train_loss": -4.6348981857299805, "global_step": 4852, "epoch": 115} {"train_loss": -4.593320846557617, "global_step": 4853, "epoch": 115} {"train_loss": -4.52973747253418, "global_step": 4854, "epoch": 115} {"train_loss": -4.613925933837891, "global_step": 4855, "epoch": 115} {"train_loss": -4.6288251876831055, "global_step": 4856, "epoch": 115} {"train_loss": -4.403717041015625, "global_step": 4857, "epoch": 115} {"train_loss": -4.530523300170898, "global_step": 4858, "epoch": 115} {"train_loss": -4.705692768096924, "global_step": 4859, "epoch": 115} {"train_loss": -4.622167110443115, "global_step": 4860, "epoch": 115} {"train_loss": -4.611555099487305, "global_step": 4861, "epoch": 115} {"train_loss": -4.534786701202393, "global_step": 4862, "epoch": 115} {"train_loss": -4.431089878082275, "global_step": 4863, "epoch": 115} {"train_loss": -4.520775318145752, "global_step": 4864, "epoch": 115} {"train_loss": -4.547360897064209, "global_step": 4865, "epoch": 115} {"train_loss": -4.561995506286621, "global_step": 4866, "epoch": 115} {"train_loss": -4.654115676879883, "global_step": 4867, "epoch": 115} {"train_loss": -4.688986778259277, "global_step": 4868, "epoch": 115} {"train_loss": -4.50961971282959, "global_step": 4869, "epoch": 115} {"train_loss": -4.434256076812744, "global_step": 4870, "epoch": 115} {"train_loss": -4.560615312485468, "global_step": 4871, "epoch": 115, "val_loss": 95029.3125} {"train_loss": -4.629632949829102, "global_step": 4872, "epoch": 116} {"train_loss": -4.620009422302246, "global_step": 4873, "epoch": 116} {"train_loss": -4.703878402709961, "global_step": 4874, "epoch": 116} {"train_loss": -4.492286682128906, "global_step": 4875, "epoch": 116} {"train_loss": -4.387566566467285, "global_step": 4876, "epoch": 116} {"train_loss": -4.719486713409424, "global_step": 4877, "epoch": 116} {"train_loss": -4.600427627563477, "global_step": 4878, "epoch": 116} {"train_loss": -4.658124923706055, "global_step": 4879, "epoch": 116} {"train_loss": -4.684360504150391, "global_step": 4880, "epoch": 116} {"train_loss": -4.546859264373779, "global_step": 4881, "epoch": 116} {"train_loss": -4.608221054077148, "global_step": 4882, "epoch": 116} {"train_loss": -4.475597381591797, "global_step": 4883, "epoch": 116} {"train_loss": -4.550357818603516, "global_step": 4884, "epoch": 116} {"train_loss": -4.541292190551758, "global_step": 4885, "epoch": 116} {"train_loss": -4.6220927238464355, "global_step": 4886, "epoch": 116} {"train_loss": -4.644504547119141, "global_step": 4887, "epoch": 116} {"train_loss": -4.678918838500977, "global_step": 4888, "epoch": 116} {"train_loss": -4.535015106201172, "global_step": 4889, "epoch": 116} {"train_loss": -4.606810092926025, "global_step": 4890, "epoch": 116} {"train_loss": -4.657003879547119, "global_step": 4891, "epoch": 116} {"train_loss": -4.767736434936523, "global_step": 4892, "epoch": 116} {"train_loss": -4.609735012054443, "global_step": 4893, "epoch": 116} {"train_loss": -4.5458083152771, "global_step": 4894, "epoch": 116} {"train_loss": -4.433344841003418, "global_step": 4895, "epoch": 116} {"train_loss": -4.500855922698975, "global_step": 4896, "epoch": 116} {"train_loss": -4.580240249633789, "global_step": 4897, "epoch": 116} {"train_loss": -4.629814147949219, "global_step": 4898, "epoch": 116} {"train_loss": -4.562851905822754, "global_step": 4899, "epoch": 116} {"train_loss": -4.4483323097229, "global_step": 4900, "epoch": 116} {"train_loss": -4.626568794250488, "global_step": 4901, "epoch": 116} {"train_loss": -4.486701965332031, "global_step": 4902, "epoch": 116} {"train_loss": -4.624910831451416, "global_step": 4903, "epoch": 116} {"train_loss": -4.596330165863037, "global_step": 4904, "epoch": 116} {"train_loss": -4.367196559906006, "global_step": 4905, "epoch": 116} {"train_loss": -4.578334808349609, "global_step": 4906, "epoch": 116} {"train_loss": -4.710908889770508, "global_step": 4907, "epoch": 116} {"train_loss": -4.670307159423828, "global_step": 4908, "epoch": 116} {"train_loss": -4.359199047088623, "global_step": 4909, "epoch": 116} {"train_loss": -4.530600547790527, "global_step": 4910, "epoch": 116} {"train_loss": -4.6220550537109375, "global_step": 4911, "epoch": 116} {"train_loss": -4.367074012756348, "global_step": 4912, "epoch": 116} {"train_loss": -4.576765355609712, "global_step": 4913, "epoch": 116, "val_loss": 92702.5390625} {"train_loss": -4.746555328369141, "global_step": 4914, "epoch": 117} {"train_loss": -4.700374603271484, "global_step": 4915, "epoch": 117} {"train_loss": -4.766554355621338, "global_step": 4916, "epoch": 117} {"train_loss": -4.660464286804199, "global_step": 4917, "epoch": 117} {"train_loss": -4.505458354949951, "global_step": 4918, "epoch": 117} {"train_loss": -4.533841133117676, "global_step": 4919, "epoch": 117} {"train_loss": -4.674275875091553, "global_step": 4920, "epoch": 117} {"train_loss": -4.685001850128174, "global_step": 4921, "epoch": 117} {"train_loss": -4.523676872253418, "global_step": 4922, "epoch": 117} {"train_loss": -4.538291931152344, "global_step": 4923, "epoch": 117} {"train_loss": -4.684967994689941, "global_step": 4924, "epoch": 117} {"train_loss": -4.606115341186523, "global_step": 4925, "epoch": 117} {"train_loss": -4.579860687255859, "global_step": 4926, "epoch": 117} {"train_loss": -4.684278964996338, "global_step": 4927, "epoch": 117} {"train_loss": -4.681349277496338, "global_step": 4928, "epoch": 117} {"train_loss": -4.632039546966553, "global_step": 4929, "epoch": 117} {"train_loss": -4.676794052124023, "global_step": 4930, "epoch": 117} {"train_loss": -4.7074666023254395, "global_step": 4931, "epoch": 117} {"train_loss": -4.6971635818481445, "global_step": 4932, "epoch": 117} {"train_loss": -4.427347183227539, "global_step": 4933, "epoch": 117} {"train_loss": -4.578649520874023, "global_step": 4934, "epoch": 117} {"train_loss": -4.741350173950195, "global_step": 4935, "epoch": 117} {"train_loss": -4.477072715759277, "global_step": 4936, "epoch": 117} {"train_loss": -4.146089553833008, "global_step": 4937, "epoch": 117} {"train_loss": -4.450301170349121, "global_step": 4938, "epoch": 117} {"train_loss": -4.495322227478027, "global_step": 4939, "epoch": 117} {"train_loss": -4.004718780517578, "global_step": 4940, "epoch": 117} {"train_loss": -4.548396110534668, "global_step": 4941, "epoch": 117} {"train_loss": -4.392004013061523, "global_step": 4942, "epoch": 117} {"train_loss": -4.209453582763672, "global_step": 4943, "epoch": 117} {"train_loss": -4.646866798400879, "global_step": 4944, "epoch": 117} {"train_loss": -4.318180084228516, "global_step": 4945, "epoch": 117} {"train_loss": -4.469635486602783, "global_step": 4946, "epoch": 117} {"train_loss": -4.437057018280029, "global_step": 4947, "epoch": 117} {"train_loss": -4.434327125549316, "global_step": 4948, "epoch": 117} {"train_loss": -4.563292026519775, "global_step": 4949, "epoch": 117} {"train_loss": -4.507568836212158, "global_step": 4950, "epoch": 117} {"train_loss": -4.683694839477539, "global_step": 4951, "epoch": 117} {"train_loss": -4.623356342315674, "global_step": 4952, "epoch": 117} {"train_loss": -4.565332889556885, "global_step": 4953, "epoch": 117} {"train_loss": -4.53945779800415, "global_step": 4954, "epoch": 117} {"train_loss": -4.550187860216413, "global_step": 4955, "epoch": 117, "val_loss": 93799.5625} {"train_loss": -4.540684223175049, "global_step": 4956, "epoch": 118} {"train_loss": -4.58059549331665, "global_step": 4957, "epoch": 118} {"train_loss": -4.701499938964844, "global_step": 4958, "epoch": 118} {"train_loss": -4.680963516235352, "global_step": 4959, "epoch": 118} {"train_loss": -4.616817474365234, "global_step": 4960, "epoch": 118} {"train_loss": -4.689332008361816, "global_step": 4961, "epoch": 118} {"train_loss": -4.6749587059021, "global_step": 4962, "epoch": 118} {"train_loss": -4.707326889038086, "global_step": 4963, "epoch": 118} {"train_loss": -4.655026435852051, "global_step": 4964, "epoch": 118} {"train_loss": -4.537667274475098, "global_step": 4965, "epoch": 118} {"train_loss": -4.647800445556641, "global_step": 4966, "epoch": 118} {"train_loss": -4.767388343811035, "global_step": 4967, "epoch": 118} {"train_loss": -4.573674201965332, "global_step": 4968, "epoch": 118} {"train_loss": -4.57279109954834, "global_step": 4969, "epoch": 118} {"train_loss": -4.581002235412598, "global_step": 4970, "epoch": 118} {"train_loss": -4.76216983795166, "global_step": 4971, "epoch": 118} {"train_loss": -4.696383953094482, "global_step": 4972, "epoch": 118} {"train_loss": -4.461263656616211, "global_step": 4973, "epoch": 118} {"train_loss": -4.485454559326172, "global_step": 4974, "epoch": 118} {"train_loss": -4.736389636993408, "global_step": 4975, "epoch": 118} {"train_loss": -4.5511908531188965, "global_step": 4976, "epoch": 118} {"train_loss": -4.4960126876831055, "global_step": 4977, "epoch": 118} {"train_loss": -4.698785781860352, "global_step": 4978, "epoch": 118} {"train_loss": -4.604902744293213, "global_step": 4979, "epoch": 118} {"train_loss": -4.404841423034668, "global_step": 4980, "epoch": 118} {"train_loss": -4.449036598205566, "global_step": 4981, "epoch": 118} {"train_loss": -4.135810852050781, "global_step": 4982, "epoch": 118} {"train_loss": -4.519387245178223, "global_step": 4983, "epoch": 118} {"train_loss": -3.8910417556762695, "global_step": 4984, "epoch": 118} {"train_loss": -3.912644863128662, "global_step": 4985, "epoch": 118} {"train_loss": -4.558349609375, "global_step": 4986, "epoch": 118} {"train_loss": -3.662492275238037, "global_step": 4987, "epoch": 118} {"train_loss": -4.6155266761779785, "global_step": 4988, "epoch": 118} {"train_loss": -4.148491859436035, "global_step": 4989, "epoch": 118} {"train_loss": -4.034682750701904, "global_step": 4990, "epoch": 118} {"train_loss": -4.177351951599121, "global_step": 4991, "epoch": 118} {"train_loss": -4.17595911026001, "global_step": 4992, "epoch": 118} {"train_loss": -4.5914764404296875, "global_step": 4993, "epoch": 118} {"train_loss": -4.212892055511475, "global_step": 4994, "epoch": 118} {"train_loss": -4.475697040557861, "global_step": 4995, "epoch": 118} {"train_loss": -4.279695510864258, "global_step": 4996, "epoch": 118} {"train_loss": -4.46719977969215, "global_step": 4997, "epoch": 118, "val_loss": 100046.03125} {"train_loss": -4.431203842163086, "global_step": 4998, "epoch": 119} {"train_loss": -4.471364498138428, "global_step": 4999, "epoch": 119} {"train_loss": -4.409241676330566, "global_step": 5000, "epoch": 119} {"train_loss": -4.515749454498291, "global_step": 5001, "epoch": 119} {"train_loss": -4.437743663787842, "global_step": 5002, "epoch": 119} {"train_loss": -4.429539680480957, "global_step": 5003, "epoch": 119} {"train_loss": -4.603317737579346, "global_step": 5004, "epoch": 119} {"train_loss": -4.447985649108887, "global_step": 5005, "epoch": 119} {"train_loss": -4.459895133972168, "global_step": 5006, "epoch": 119} {"train_loss": -4.509985446929932, "global_step": 5007, "epoch": 119} {"train_loss": -4.505989074707031, "global_step": 5008, "epoch": 119} {"train_loss": -4.401337146759033, "global_step": 5009, "epoch": 119} {"train_loss": -4.426022529602051, "global_step": 5010, "epoch": 119} {"train_loss": -3.9083809852600098, "global_step": 5011, "epoch": 119} {"train_loss": -4.08204460144043, "global_step": 5012, "epoch": 119} {"train_loss": -4.478023529052734, "global_step": 5013, "epoch": 119} {"train_loss": -4.513983726501465, "global_step": 5014, "epoch": 119} {"train_loss": -4.350543022155762, "global_step": 5015, "epoch": 119} {"train_loss": -4.273710250854492, "global_step": 5016, "epoch": 119} {"train_loss": -4.44968318939209, "global_step": 5017, "epoch": 119} {"train_loss": -4.584721565246582, "global_step": 5018, "epoch": 119} {"train_loss": -4.544163227081299, "global_step": 5019, "epoch": 119} {"train_loss": -4.527307510375977, "global_step": 5020, "epoch": 119} {"train_loss": -4.55602502822876, "global_step": 5021, "epoch": 119} {"train_loss": -4.651571750640869, "global_step": 5022, "epoch": 119} {"train_loss": -4.6155266761779785, "global_step": 5023, "epoch": 119} {"train_loss": -4.486989498138428, "global_step": 5024, "epoch": 119} {"train_loss": -4.585373878479004, "global_step": 5025, "epoch": 119} {"train_loss": -4.58816385269165, "global_step": 5026, "epoch": 119} {"train_loss": -4.494985580444336, "global_step": 5027, "epoch": 119} {"train_loss": -4.650792121887207, "global_step": 5028, "epoch": 119} {"train_loss": -4.5921220779418945, "global_step": 5029, "epoch": 119} {"train_loss": -4.556570529937744, "global_step": 5030, "epoch": 119} {"train_loss": -4.5903496742248535, "global_step": 5031, "epoch": 119} {"train_loss": -4.681640625, "global_step": 5032, "epoch": 119} {"train_loss": -4.634578227996826, "global_step": 5033, "epoch": 119} {"train_loss": -4.5613555908203125, "global_step": 5034, "epoch": 119} {"train_loss": -4.53197717666626, "global_step": 5035, "epoch": 119} {"train_loss": -4.347378253936768, "global_step": 5036, "epoch": 119} {"train_loss": -4.49276065826416, "global_step": 5037, "epoch": 119} {"train_loss": -4.568514823913574, "global_step": 5038, "epoch": 119} {"train_loss": -4.490772769564674, "global_step": 5039, "epoch": 119, "val_loss": 91369.3046875} {"train_loss": -4.614422798156738, "global_step": 5040, "epoch": 120} {"train_loss": -4.5865373611450195, "global_step": 5041, "epoch": 120} {"train_loss": -4.5377068519592285, "global_step": 5042, "epoch": 120} {"train_loss": -4.610967636108398, "global_step": 5043, "epoch": 120} {"train_loss": -4.630091667175293, "global_step": 5044, "epoch": 120} {"train_loss": -4.517892837524414, "global_step": 5045, "epoch": 120} {"train_loss": -4.570512294769287, "global_step": 5046, "epoch": 120} {"train_loss": -4.782050132751465, "global_step": 5047, "epoch": 120} {"train_loss": -4.520936489105225, "global_step": 5048, "epoch": 120} {"train_loss": -4.723775863647461, "global_step": 5049, "epoch": 120} {"train_loss": -4.636966228485107, "global_step": 5050, "epoch": 120} {"train_loss": -4.566527843475342, "global_step": 5051, "epoch": 120} {"train_loss": -4.660168170928955, "global_step": 5052, "epoch": 120} {"train_loss": -4.62927770614624, "global_step": 5053, "epoch": 120} {"train_loss": -4.801231384277344, "global_step": 5054, "epoch": 120} {"train_loss": -4.436408996582031, "global_step": 5055, "epoch": 120} {"train_loss": -4.231084823608398, "global_step": 5056, "epoch": 120} {"train_loss": -4.5097856521606445, "global_step": 5057, "epoch": 120} {"train_loss": -4.576785087585449, "global_step": 5058, "epoch": 120} {"train_loss": -4.655088424682617, "global_step": 5059, "epoch": 120} {"train_loss": -4.572576522827148, "global_step": 5060, "epoch": 120} {"train_loss": -4.4724650382995605, "global_step": 5061, "epoch": 120} {"train_loss": -4.6313629150390625, "global_step": 5062, "epoch": 120} {"train_loss": -4.647001266479492, "global_step": 5063, "epoch": 120} {"train_loss": -4.537496089935303, "global_step": 5064, "epoch": 120} {"train_loss": -4.640872001647949, "global_step": 5065, "epoch": 120} {"train_loss": -4.654633522033691, "global_step": 5066, "epoch": 120} {"train_loss": -4.5780029296875, "global_step": 5067, "epoch": 120} {"train_loss": -4.5159101486206055, "global_step": 5068, "epoch": 120} {"train_loss": -4.819003105163574, "global_step": 5069, "epoch": 120} {"train_loss": -4.505853652954102, "global_step": 5070, "epoch": 120} {"train_loss": -4.4742817878723145, "global_step": 5071, "epoch": 120} {"train_loss": -4.6146745681762695, "global_step": 5072, "epoch": 120} {"train_loss": -4.593833923339844, "global_step": 5073, "epoch": 120} {"train_loss": -4.624431610107422, "global_step": 5074, "epoch": 120} {"train_loss": -4.523517608642578, "global_step": 5075, "epoch": 120} {"train_loss": -4.498350620269775, "global_step": 5076, "epoch": 120} {"train_loss": -4.638883113861084, "global_step": 5077, "epoch": 120} {"train_loss": -4.735132694244385, "global_step": 5078, "epoch": 120} {"train_loss": -4.737054824829102, "global_step": 5079, "epoch": 120} {"train_loss": -4.668583393096924, "global_step": 5080, "epoch": 120} {"train_loss": -4.598832153138661, "global_step": 5081, "epoch": 120, "val_loss": 90019.7578125} {"train_loss": -4.585835933685303, "global_step": 5082, "epoch": 121} {"train_loss": -4.693968772888184, "global_step": 5083, "epoch": 121} {"train_loss": -4.64476203918457, "global_step": 5084, "epoch": 121} {"train_loss": -4.602793216705322, "global_step": 5085, "epoch": 121} {"train_loss": -4.64576530456543, "global_step": 5086, "epoch": 121} {"train_loss": -4.470575332641602, "global_step": 5087, "epoch": 121} {"train_loss": -4.76154899597168, "global_step": 5088, "epoch": 121} {"train_loss": -4.489120960235596, "global_step": 5089, "epoch": 121} {"train_loss": -4.700953483581543, "global_step": 5090, "epoch": 121} {"train_loss": -4.654275417327881, "global_step": 5091, "epoch": 121} {"train_loss": -4.675078868865967, "global_step": 5092, "epoch": 121} {"train_loss": -4.369138717651367, "global_step": 5093, "epoch": 121} {"train_loss": -4.455659866333008, "global_step": 5094, "epoch": 121} {"train_loss": -4.641924858093262, "global_step": 5095, "epoch": 121} {"train_loss": -4.485178470611572, "global_step": 5096, "epoch": 121} {"train_loss": -4.145313739776611, "global_step": 5097, "epoch": 121} {"train_loss": -4.736823081970215, "global_step": 5098, "epoch": 121} {"train_loss": -4.338157653808594, "global_step": 5099, "epoch": 121} {"train_loss": -4.3364739418029785, "global_step": 5100, "epoch": 121} {"train_loss": -4.555727481842041, "global_step": 5101, "epoch": 121} {"train_loss": -3.886746883392334, "global_step": 5102, "epoch": 121} {"train_loss": -4.58545446395874, "global_step": 5103, "epoch": 121} {"train_loss": -4.157784938812256, "global_step": 5104, "epoch": 121} {"train_loss": -4.692922592163086, "global_step": 5105, "epoch": 121} {"train_loss": -4.186148643493652, "global_step": 5106, "epoch": 121} {"train_loss": -4.530784606933594, "global_step": 5107, "epoch": 121} {"train_loss": -4.257089614868164, "global_step": 5108, "epoch": 121} {"train_loss": -4.625020980834961, "global_step": 5109, "epoch": 121} {"train_loss": -4.3230204582214355, "global_step": 5110, "epoch": 121} {"train_loss": -4.652311325073242, "global_step": 5111, "epoch": 121} {"train_loss": -4.489526271820068, "global_step": 5112, "epoch": 121} {"train_loss": -4.50701379776001, "global_step": 5113, "epoch": 121} {"train_loss": -4.534996032714844, "global_step": 5114, "epoch": 121} {"train_loss": -4.517276287078857, "global_step": 5115, "epoch": 121} {"train_loss": -4.601675987243652, "global_step": 5116, "epoch": 121} {"train_loss": -4.539123058319092, "global_step": 5117, "epoch": 121} {"train_loss": -4.643483638763428, "global_step": 5118, "epoch": 121} {"train_loss": -4.430362701416016, "global_step": 5119, "epoch": 121} {"train_loss": -4.529990196228027, "global_step": 5120, "epoch": 121} {"train_loss": -4.59395694732666, "global_step": 5121, "epoch": 121} {"train_loss": -4.7182512283325195, "global_step": 5122, "epoch": 121} {"train_loss": -4.514818100702195, "global_step": 5123, "epoch": 121, "val_loss": 91411.078125} {"train_loss": -4.618908882141113, "global_step": 5124, "epoch": 122} {"train_loss": -4.381529331207275, "global_step": 5125, "epoch": 122} {"train_loss": -4.615196228027344, "global_step": 5126, "epoch": 122} {"train_loss": -4.400258541107178, "global_step": 5127, "epoch": 122} {"train_loss": -4.5991411209106445, "global_step": 5128, "epoch": 122} {"train_loss": -4.537303447723389, "global_step": 5129, "epoch": 122} {"train_loss": -4.683428764343262, "global_step": 5130, "epoch": 122} {"train_loss": -4.620095252990723, "global_step": 5131, "epoch": 122} {"train_loss": -4.540427207946777, "global_step": 5132, "epoch": 122} {"train_loss": -4.740497589111328, "global_step": 5133, "epoch": 122} {"train_loss": -4.7832794189453125, "global_step": 5134, "epoch": 122} {"train_loss": -4.6347150802612305, "global_step": 5135, "epoch": 122} {"train_loss": -4.550135135650635, "global_step": 5136, "epoch": 122} {"train_loss": -4.439289569854736, "global_step": 5137, "epoch": 122} {"train_loss": -4.654279708862305, "global_step": 5138, "epoch": 122} {"train_loss": -4.739487648010254, "global_step": 5139, "epoch": 122} {"train_loss": -4.4433135986328125, "global_step": 5140, "epoch": 122} {"train_loss": -4.439050197601318, "global_step": 5141, "epoch": 122} {"train_loss": -4.624361515045166, "global_step": 5142, "epoch": 122} {"train_loss": -4.6965460777282715, "global_step": 5143, "epoch": 122} {"train_loss": -4.54283332824707, "global_step": 5144, "epoch": 122} {"train_loss": -4.652781009674072, "global_step": 5145, "epoch": 122} {"train_loss": -4.664910316467285, "global_step": 5146, "epoch": 122} {"train_loss": -4.6176934242248535, "global_step": 5147, "epoch": 122} {"train_loss": -4.518706321716309, "global_step": 5148, "epoch": 122} {"train_loss": -4.634667873382568, "global_step": 5149, "epoch": 122} {"train_loss": -4.458405017852783, "global_step": 5150, "epoch": 122} {"train_loss": -4.821507930755615, "global_step": 5151, "epoch": 122} {"train_loss": -4.540332794189453, "global_step": 5152, "epoch": 122} {"train_loss": -4.560013771057129, "global_step": 5153, "epoch": 122} {"train_loss": -4.607412338256836, "global_step": 5154, "epoch": 122} {"train_loss": -4.716244220733643, "global_step": 5155, "epoch": 122} {"train_loss": -4.5832624435424805, "global_step": 5156, "epoch": 122} {"train_loss": -4.723616600036621, "global_step": 5157, "epoch": 122} {"train_loss": -4.517993450164795, "global_step": 5158, "epoch": 122} {"train_loss": -4.508213043212891, "global_step": 5159, "epoch": 122} {"train_loss": -4.758468151092529, "global_step": 5160, "epoch": 122} {"train_loss": -4.594623565673828, "global_step": 5161, "epoch": 122} {"train_loss": -4.748767852783203, "global_step": 5162, "epoch": 122} {"train_loss": -4.674605846405029, "global_step": 5163, "epoch": 122} {"train_loss": -4.479673862457275, "global_step": 5164, "epoch": 122} {"train_loss": -4.598905563354492, "global_step": 5165, "epoch": 122, "val_loss": 92042.375} {"train_loss": -4.381123065948486, "global_step": 5166, "epoch": 123} {"train_loss": -4.634096622467041, "global_step": 5167, "epoch": 123} {"train_loss": -4.234745979309082, "global_step": 5168, "epoch": 123} {"train_loss": -4.463346481323242, "global_step": 5169, "epoch": 123} {"train_loss": -4.694398880004883, "global_step": 5170, "epoch": 123} {"train_loss": -4.584392547607422, "global_step": 5171, "epoch": 123} {"train_loss": -4.556676864624023, "global_step": 5172, "epoch": 123} {"train_loss": -4.726924896240234, "global_step": 5173, "epoch": 123} {"train_loss": -4.683526039123535, "global_step": 5174, "epoch": 123} {"train_loss": -4.7110819816589355, "global_step": 5175, "epoch": 123} {"train_loss": -4.756342887878418, "global_step": 5176, "epoch": 123} {"train_loss": -4.628406524658203, "global_step": 5177, "epoch": 123} {"train_loss": -4.8164520263671875, "global_step": 5178, "epoch": 123} {"train_loss": -4.715330123901367, "global_step": 5179, "epoch": 123} {"train_loss": -4.748857021331787, "global_step": 5180, "epoch": 123} {"train_loss": -4.6903581619262695, "global_step": 5181, "epoch": 123} {"train_loss": -4.721611976623535, "global_step": 5182, "epoch": 123} {"train_loss": -4.762243270874023, "global_step": 5183, "epoch": 123} {"train_loss": -4.733148574829102, "global_step": 5184, "epoch": 123} {"train_loss": -4.628101348876953, "global_step": 5185, "epoch": 123} {"train_loss": -4.713259696960449, "global_step": 5186, "epoch": 123} {"train_loss": -4.651155471801758, "global_step": 5187, "epoch": 123} {"train_loss": -4.793945789337158, "global_step": 5188, "epoch": 123} {"train_loss": -4.700471878051758, "global_step": 5189, "epoch": 123} {"train_loss": -4.783850193023682, "global_step": 5190, "epoch": 123} {"train_loss": -4.745852470397949, "global_step": 5191, "epoch": 123} {"train_loss": -4.8277812004089355, "global_step": 5192, "epoch": 123} {"train_loss": -4.836391448974609, "global_step": 5193, "epoch": 123} {"train_loss": -4.656579494476318, "global_step": 5194, "epoch": 123} {"train_loss": -4.540463924407959, "global_step": 5195, "epoch": 123} {"train_loss": -4.726241111755371, "global_step": 5196, "epoch": 123} {"train_loss": -4.73099946975708, "global_step": 5197, "epoch": 123} {"train_loss": -4.559426307678223, "global_step": 5198, "epoch": 123} {"train_loss": -4.632543563842773, "global_step": 5199, "epoch": 123} {"train_loss": -4.667300224304199, "global_step": 5200, "epoch": 123} {"train_loss": -4.677289009094238, "global_step": 5201, "epoch": 123} {"train_loss": -4.724433898925781, "global_step": 5202, "epoch": 123} {"train_loss": -4.530196189880371, "global_step": 5203, "epoch": 123} {"train_loss": -4.371269226074219, "global_step": 5204, "epoch": 123} {"train_loss": -4.620826721191406, "global_step": 5205, "epoch": 123} {"train_loss": -4.721320629119873, "global_step": 5206, "epoch": 123} {"train_loss": -4.660858528954642, "global_step": 5207, "epoch": 123, "val_loss": 93991.640625} {"train_loss": -4.267327308654785, "global_step": 5208, "epoch": 124} {"train_loss": -4.606535911560059, "global_step": 5209, "epoch": 124} {"train_loss": -4.722219467163086, "global_step": 5210, "epoch": 124} {"train_loss": -4.279443740844727, "global_step": 5211, "epoch": 124} {"train_loss": -4.621058464050293, "global_step": 5212, "epoch": 124} {"train_loss": -4.508530616760254, "global_step": 5213, "epoch": 124} {"train_loss": -4.489439010620117, "global_step": 5214, "epoch": 124} {"train_loss": -4.780486106872559, "global_step": 5215, "epoch": 124} {"train_loss": -4.494845390319824, "global_step": 5216, "epoch": 124} {"train_loss": -4.592557430267334, "global_step": 5217, "epoch": 124} {"train_loss": -4.699912071228027, "global_step": 5218, "epoch": 124} {"train_loss": -4.572768211364746, "global_step": 5219, "epoch": 124} {"train_loss": -4.702673435211182, "global_step": 5220, "epoch": 124} {"train_loss": -4.543730735778809, "global_step": 5221, "epoch": 124} {"train_loss": -4.700475692749023, "global_step": 5222, "epoch": 124} {"train_loss": -4.610811233520508, "global_step": 5223, "epoch": 124} {"train_loss": -4.634528160095215, "global_step": 5224, "epoch": 124} {"train_loss": -4.700516700744629, "global_step": 5225, "epoch": 124} {"train_loss": -4.581164360046387, "global_step": 5226, "epoch": 124} {"train_loss": -4.7083587646484375, "global_step": 5227, "epoch": 124} {"train_loss": -4.599595069885254, "global_step": 5228, "epoch": 124} {"train_loss": -4.598874568939209, "global_step": 5229, "epoch": 124} {"train_loss": -4.774240493774414, "global_step": 5230, "epoch": 124} {"train_loss": -4.686481475830078, "global_step": 5231, "epoch": 124} {"train_loss": -4.545803546905518, "global_step": 5232, "epoch": 124} {"train_loss": -4.741766929626465, "global_step": 5233, "epoch": 124} {"train_loss": -4.752943992614746, "global_step": 5234, "epoch": 124} {"train_loss": -4.754803657531738, "global_step": 5235, "epoch": 124} {"train_loss": -4.389822959899902, "global_step": 5236, "epoch": 124} {"train_loss": -4.617447853088379, "global_step": 5237, "epoch": 124} {"train_loss": -4.777336120605469, "global_step": 5238, "epoch": 124} {"train_loss": -4.6567487716674805, "global_step": 5239, "epoch": 124} {"train_loss": -4.766575813293457, "global_step": 5240, "epoch": 124} {"train_loss": -4.564976215362549, "global_step": 5241, "epoch": 124} {"train_loss": -4.724996566772461, "global_step": 5242, "epoch": 124} {"train_loss": -4.689691543579102, "global_step": 5243, "epoch": 124} {"train_loss": -4.578307151794434, "global_step": 5244, "epoch": 124} {"train_loss": -4.592436790466309, "global_step": 5245, "epoch": 124} {"train_loss": -4.749096870422363, "global_step": 5246, "epoch": 124} {"train_loss": -4.600236892700195, "global_step": 5247, "epoch": 124} {"train_loss": -4.576589584350586, "global_step": 5248, "epoch": 124} {"train_loss": -4.626011587324596, "global_step": 5249, "epoch": 124, "val_loss": 90063.3203125} {"train_loss": -4.690555572509766, "global_step": 5250, "epoch": 125} {"train_loss": -4.574485778808594, "global_step": 5251, "epoch": 125} {"train_loss": -4.670163154602051, "global_step": 5252, "epoch": 125} {"train_loss": -4.653203010559082, "global_step": 5253, "epoch": 125} {"train_loss": -4.629242897033691, "global_step": 5254, "epoch": 125} {"train_loss": -4.712967872619629, "global_step": 5255, "epoch": 125} {"train_loss": -4.760002613067627, "global_step": 5256, "epoch": 125} {"train_loss": -4.669206142425537, "global_step": 5257, "epoch": 125} {"train_loss": -4.661757946014404, "global_step": 5258, "epoch": 125} {"train_loss": -4.721367359161377, "global_step": 5259, "epoch": 125} {"train_loss": -4.721080780029297, "global_step": 5260, "epoch": 125} {"train_loss": -4.590779781341553, "global_step": 5261, "epoch": 125} {"train_loss": -4.708365440368652, "global_step": 5262, "epoch": 125} {"train_loss": -4.782240867614746, "global_step": 5263, "epoch": 125} {"train_loss": -4.729070663452148, "global_step": 5264, "epoch": 125} {"train_loss": -4.632863521575928, "global_step": 5265, "epoch": 125} {"train_loss": -4.742863655090332, "global_step": 5266, "epoch": 125} {"train_loss": -4.717824459075928, "global_step": 5267, "epoch": 125} {"train_loss": -4.878481864929199, "global_step": 5268, "epoch": 125} {"train_loss": -4.729743480682373, "global_step": 5269, "epoch": 125} {"train_loss": -4.48348331451416, "global_step": 5270, "epoch": 125} {"train_loss": -4.7869343757629395, "global_step": 5271, "epoch": 125} {"train_loss": -4.766291618347168, "global_step": 5272, "epoch": 125} {"train_loss": -4.544486045837402, "global_step": 5273, "epoch": 125} {"train_loss": -4.404284477233887, "global_step": 5274, "epoch": 125} {"train_loss": -4.61054801940918, "global_step": 5275, "epoch": 125} {"train_loss": -4.730454444885254, "global_step": 5276, "epoch": 125} {"train_loss": -4.6478071212768555, "global_step": 5277, "epoch": 125} {"train_loss": -4.730016708374023, "global_step": 5278, "epoch": 125} {"train_loss": -4.672762870788574, "global_step": 5279, "epoch": 125} {"train_loss": -4.714874267578125, "global_step": 5280, "epoch": 125} {"train_loss": -4.65873908996582, "global_step": 5281, "epoch": 125} {"train_loss": -4.681804656982422, "global_step": 5282, "epoch": 125} {"train_loss": -4.842929840087891, "global_step": 5283, "epoch": 125} {"train_loss": -4.814241409301758, "global_step": 5284, "epoch": 125} {"train_loss": -4.735922813415527, "global_step": 5285, "epoch": 125} {"train_loss": -4.747314453125, "global_step": 5286, "epoch": 125} {"train_loss": -4.569115161895752, "global_step": 5287, "epoch": 125} {"train_loss": -4.733428955078125, "global_step": 5288, "epoch": 125} {"train_loss": -4.663897514343262, "global_step": 5289, "epoch": 125} {"train_loss": -4.836226463317871, "global_step": 5290, "epoch": 125} {"train_loss": -4.692147992906117, "global_step": 5291, "epoch": 125, "val_loss": 91543.0390625} {"train_loss": -4.690073013305664, "global_step": 5292, "epoch": 126} {"train_loss": -4.951984882354736, "global_step": 5293, "epoch": 126} {"train_loss": -4.529604911804199, "global_step": 5294, "epoch": 126} {"train_loss": -4.735044956207275, "global_step": 5295, "epoch": 126} {"train_loss": -4.811344146728516, "global_step": 5296, "epoch": 126} {"train_loss": -4.73021936416626, "global_step": 5297, "epoch": 126} {"train_loss": -4.761419296264648, "global_step": 5298, "epoch": 126} {"train_loss": -4.723222732543945, "global_step": 5299, "epoch": 126} {"train_loss": -4.728225231170654, "global_step": 5300, "epoch": 126} {"train_loss": -4.754419326782227, "global_step": 5301, "epoch": 126} {"train_loss": -4.777506351470947, "global_step": 5302, "epoch": 126} {"train_loss": -4.680028438568115, "global_step": 5303, "epoch": 126} {"train_loss": -4.679349899291992, "global_step": 5304, "epoch": 126} {"train_loss": -4.691138744354248, "global_step": 5305, "epoch": 126} {"train_loss": -4.699676990509033, "global_step": 5306, "epoch": 126} {"train_loss": -4.657318115234375, "global_step": 5307, "epoch": 126} {"train_loss": -4.57016134262085, "global_step": 5308, "epoch": 126} {"train_loss": -4.629395484924316, "global_step": 5309, "epoch": 126} {"train_loss": -4.519471168518066, "global_step": 5310, "epoch": 126} {"train_loss": -4.685513496398926, "global_step": 5311, "epoch": 126} {"train_loss": -4.715397834777832, "global_step": 5312, "epoch": 126} {"train_loss": -4.7212300300598145, "global_step": 5313, "epoch": 126} {"train_loss": -4.812251091003418, "global_step": 5314, "epoch": 126} {"train_loss": -4.859820365905762, "global_step": 5315, "epoch": 126} {"train_loss": -4.842035293579102, "global_step": 5316, "epoch": 126} {"train_loss": -4.751223564147949, "global_step": 5317, "epoch": 126} {"train_loss": -4.771628379821777, "global_step": 5318, "epoch": 126} {"train_loss": -4.658167362213135, "global_step": 5319, "epoch": 126} {"train_loss": -4.691885948181152, "global_step": 5320, "epoch": 126} {"train_loss": -4.752820014953613, "global_step": 5321, "epoch": 126} {"train_loss": -4.87666130065918, "global_step": 5322, "epoch": 126} {"train_loss": -4.791540622711182, "global_step": 5323, "epoch": 126} {"train_loss": -4.56797981262207, "global_step": 5324, "epoch": 126} {"train_loss": -4.739805221557617, "global_step": 5325, "epoch": 126} {"train_loss": -4.947793006896973, "global_step": 5326, "epoch": 126} {"train_loss": -4.793290138244629, "global_step": 5327, "epoch": 126} {"train_loss": -4.6433820724487305, "global_step": 5328, "epoch": 126} {"train_loss": -4.742404937744141, "global_step": 5329, "epoch": 126} {"train_loss": -4.62160587310791, "global_step": 5330, "epoch": 126} {"train_loss": -4.530229568481445, "global_step": 5331, "epoch": 126} {"train_loss": -4.681220531463623, "global_step": 5332, "epoch": 126} {"train_loss": -4.718934002376738, "global_step": 5333, "epoch": 126, "val_loss": 90059.9140625} {"train_loss": -4.414231777191162, "global_step": 5334, "epoch": 127} {"train_loss": -4.592830181121826, "global_step": 5335, "epoch": 127} {"train_loss": -4.744927406311035, "global_step": 5336, "epoch": 127} {"train_loss": -4.748676300048828, "global_step": 5337, "epoch": 127} {"train_loss": -4.764182090759277, "global_step": 5338, "epoch": 127} {"train_loss": -4.701174736022949, "global_step": 5339, "epoch": 127} {"train_loss": -4.741934776306152, "global_step": 5340, "epoch": 127} {"train_loss": -4.658324718475342, "global_step": 5341, "epoch": 127} {"train_loss": -4.771961212158203, "global_step": 5342, "epoch": 127} {"train_loss": -4.760290145874023, "global_step": 5343, "epoch": 127} {"train_loss": -4.742517948150635, "global_step": 5344, "epoch": 127} {"train_loss": -4.861711502075195, "global_step": 5345, "epoch": 127} {"train_loss": -4.7458271980285645, "global_step": 5346, "epoch": 127} {"train_loss": -4.692957401275635, "global_step": 5347, "epoch": 127} {"train_loss": -4.622950077056885, "global_step": 5348, "epoch": 127} {"train_loss": -4.737682819366455, "global_step": 5349, "epoch": 127} {"train_loss": -4.795285224914551, "global_step": 5350, "epoch": 127} {"train_loss": -4.761938095092773, "global_step": 5351, "epoch": 127} {"train_loss": -4.547147750854492, "global_step": 5352, "epoch": 127} {"train_loss": -4.454904079437256, "global_step": 5353, "epoch": 127} {"train_loss": -4.781815528869629, "global_step": 5354, "epoch": 127} {"train_loss": -4.4261474609375, "global_step": 5355, "epoch": 127} {"train_loss": -4.400082588195801, "global_step": 5356, "epoch": 127} {"train_loss": -4.710880756378174, "global_step": 5357, "epoch": 127} {"train_loss": -4.549180030822754, "global_step": 5358, "epoch": 127} {"train_loss": -4.476257801055908, "global_step": 5359, "epoch": 127} {"train_loss": -4.650740623474121, "global_step": 5360, "epoch": 127} {"train_loss": -4.62985897064209, "global_step": 5361, "epoch": 127} {"train_loss": -4.717161178588867, "global_step": 5362, "epoch": 127} {"train_loss": -4.75190544128418, "global_step": 5363, "epoch": 127} {"train_loss": -4.497384071350098, "global_step": 5364, "epoch": 127} {"train_loss": -4.590672492980957, "global_step": 5365, "epoch": 127} {"train_loss": -4.7584381103515625, "global_step": 5366, "epoch": 127} {"train_loss": -4.626208305358887, "global_step": 5367, "epoch": 127} {"train_loss": -4.586568832397461, "global_step": 5368, "epoch": 127} {"train_loss": -4.765374660491943, "global_step": 5369, "epoch": 127} {"train_loss": -4.536440849304199, "global_step": 5370, "epoch": 127} {"train_loss": -4.803805351257324, "global_step": 5371, "epoch": 127} {"train_loss": -4.574909210205078, "global_step": 5372, "epoch": 127} {"train_loss": -4.812656402587891, "global_step": 5373, "epoch": 127} {"train_loss": -4.669231414794922, "global_step": 5374, "epoch": 127} {"train_loss": -4.661936589649746, "global_step": 5375, "epoch": 127, "val_loss": 88627.1953125} {"train_loss": -4.852349758148193, "global_step": 5376, "epoch": 128} {"train_loss": -4.4582037925720215, "global_step": 5377, "epoch": 128} {"train_loss": -4.595060348510742, "global_step": 5378, "epoch": 128} {"train_loss": -4.823925495147705, "global_step": 5379, "epoch": 128} {"train_loss": -4.529181480407715, "global_step": 5380, "epoch": 128} {"train_loss": -4.639116287231445, "global_step": 5381, "epoch": 128} {"train_loss": -4.748553276062012, "global_step": 5382, "epoch": 128} {"train_loss": -4.675538063049316, "global_step": 5383, "epoch": 128} {"train_loss": -4.626726150512695, "global_step": 5384, "epoch": 128} {"train_loss": -4.5914459228515625, "global_step": 5385, "epoch": 128} {"train_loss": -4.720054626464844, "global_step": 5386, "epoch": 128} {"train_loss": -4.826172828674316, "global_step": 5387, "epoch": 128} {"train_loss": -4.675661563873291, "global_step": 5388, "epoch": 128} {"train_loss": -4.736420154571533, "global_step": 5389, "epoch": 128} {"train_loss": -4.6149797439575195, "global_step": 5390, "epoch": 128} {"train_loss": -4.575442790985107, "global_step": 5391, "epoch": 128} {"train_loss": -4.876542091369629, "global_step": 5392, "epoch": 128} {"train_loss": -4.7026166915893555, "global_step": 5393, "epoch": 128} {"train_loss": -4.741571426391602, "global_step": 5394, "epoch": 128} {"train_loss": -4.607615947723389, "global_step": 5395, "epoch": 128} {"train_loss": -4.674869537353516, "global_step": 5396, "epoch": 128} {"train_loss": -4.723101615905762, "global_step": 5397, "epoch": 128} {"train_loss": -4.83660888671875, "global_step": 5398, "epoch": 128} {"train_loss": -4.685757637023926, "global_step": 5399, "epoch": 128} {"train_loss": -4.543181419372559, "global_step": 5400, "epoch": 128} {"train_loss": -4.584075927734375, "global_step": 5401, "epoch": 128} {"train_loss": -4.734989166259766, "global_step": 5402, "epoch": 128} {"train_loss": -4.640840530395508, "global_step": 5403, "epoch": 128} {"train_loss": -4.755455017089844, "global_step": 5404, "epoch": 128} {"train_loss": -4.834507942199707, "global_step": 5405, "epoch": 128} {"train_loss": -4.684738636016846, "global_step": 5406, "epoch": 128} {"train_loss": -4.75095272064209, "global_step": 5407, "epoch": 128} {"train_loss": -4.632225036621094, "global_step": 5408, "epoch": 128} {"train_loss": -4.75353479385376, "global_step": 5409, "epoch": 128} {"train_loss": -4.80976676940918, "global_step": 5410, "epoch": 128} {"train_loss": -4.725702285766602, "global_step": 5411, "epoch": 128} {"train_loss": -4.7953290939331055, "global_step": 5412, "epoch": 128} {"train_loss": -4.953350067138672, "global_step": 5413, "epoch": 128} {"train_loss": -4.715051651000977, "global_step": 5414, "epoch": 128} {"train_loss": -4.748230457305908, "global_step": 5415, "epoch": 128} {"train_loss": -4.528786659240723, "global_step": 5416, "epoch": 128} {"train_loss": -4.7033847740718295, "global_step": 5417, "epoch": 128, "val_loss": 86987.0546875} {"train_loss": -4.750710487365723, "global_step": 5418, "epoch": 129} {"train_loss": -4.776946067810059, "global_step": 5419, "epoch": 129} {"train_loss": -4.509946823120117, "global_step": 5420, "epoch": 129} {"train_loss": -4.608684539794922, "global_step": 5421, "epoch": 129} {"train_loss": -4.808816909790039, "global_step": 5422, "epoch": 129} {"train_loss": -4.695415496826172, "global_step": 5423, "epoch": 129} {"train_loss": -4.455092430114746, "global_step": 5424, "epoch": 129} {"train_loss": -4.762425899505615, "global_step": 5425, "epoch": 129} {"train_loss": -4.6593708992004395, "global_step": 5426, "epoch": 129} {"train_loss": -4.5021653175354, "global_step": 5427, "epoch": 129} {"train_loss": -4.77629280090332, "global_step": 5428, "epoch": 129} {"train_loss": -4.849010944366455, "global_step": 5429, "epoch": 129} {"train_loss": -4.6412506103515625, "global_step": 5430, "epoch": 129} {"train_loss": -4.560487747192383, "global_step": 5431, "epoch": 129} {"train_loss": -4.58287239074707, "global_step": 5432, "epoch": 129} {"train_loss": -4.3973283767700195, "global_step": 5433, "epoch": 129} {"train_loss": -4.683148384094238, "global_step": 5434, "epoch": 129} {"train_loss": -4.711507797241211, "global_step": 5435, "epoch": 129} {"train_loss": -4.7265753746032715, "global_step": 5436, "epoch": 129} {"train_loss": -4.712320327758789, "global_step": 5437, "epoch": 129} {"train_loss": -4.675947666168213, "global_step": 5438, "epoch": 129} {"train_loss": -4.7276458740234375, "global_step": 5439, "epoch": 129} {"train_loss": -4.7354841232299805, "global_step": 5440, "epoch": 129} {"train_loss": -4.7754011154174805, "global_step": 5441, "epoch": 129} {"train_loss": -4.744168281555176, "global_step": 5442, "epoch": 129} {"train_loss": -4.7745513916015625, "global_step": 5443, "epoch": 129} {"train_loss": -4.6342058181762695, "global_step": 5444, "epoch": 129} {"train_loss": -4.949123382568359, "global_step": 5445, "epoch": 129} {"train_loss": -4.7288947105407715, "global_step": 5446, "epoch": 129} {"train_loss": -4.799147605895996, "global_step": 5447, "epoch": 129} {"train_loss": -4.727035999298096, "global_step": 5448, "epoch": 129} {"train_loss": -4.640669822692871, "global_step": 5449, "epoch": 129} {"train_loss": -4.640505790710449, "global_step": 5450, "epoch": 129} {"train_loss": -4.729195594787598, "global_step": 5451, "epoch": 129} {"train_loss": -4.566441535949707, "global_step": 5452, "epoch": 129} {"train_loss": -4.433750152587891, "global_step": 5453, "epoch": 129} {"train_loss": -4.6928558349609375, "global_step": 5454, "epoch": 129} {"train_loss": -4.829223155975342, "global_step": 5455, "epoch": 129} {"train_loss": -4.601388931274414, "global_step": 5456, "epoch": 129} {"train_loss": -4.544999122619629, "global_step": 5457, "epoch": 129} {"train_loss": -4.731314182281494, "global_step": 5458, "epoch": 129} {"train_loss": -4.678683587482998, "global_step": 5459, "epoch": 129, "val_loss": 88687.890625} {"train_loss": -4.469564437866211, "global_step": 5460, "epoch": 130} {"train_loss": -4.791948318481445, "global_step": 5461, "epoch": 130} {"train_loss": -4.849541664123535, "global_step": 5462, "epoch": 130} {"train_loss": -4.6443634033203125, "global_step": 5463, "epoch": 130} {"train_loss": -4.785305023193359, "global_step": 5464, "epoch": 130} {"train_loss": -4.662939548492432, "global_step": 5465, "epoch": 130} {"train_loss": -4.685851097106934, "global_step": 5466, "epoch": 130} {"train_loss": -4.771930694580078, "global_step": 5467, "epoch": 130} {"train_loss": -4.616281509399414, "global_step": 5468, "epoch": 130} {"train_loss": -4.802089691162109, "global_step": 5469, "epoch": 130} {"train_loss": -4.749607086181641, "global_step": 5470, "epoch": 130} {"train_loss": -4.616451263427734, "global_step": 5471, "epoch": 130} {"train_loss": -4.640719413757324, "global_step": 5472, "epoch": 130} {"train_loss": -4.653982162475586, "global_step": 5473, "epoch": 130} {"train_loss": -4.647671699523926, "global_step": 5474, "epoch": 130} {"train_loss": -4.830498218536377, "global_step": 5475, "epoch": 130} {"train_loss": -4.840323448181152, "global_step": 5476, "epoch": 130} {"train_loss": -4.672161102294922, "global_step": 5477, "epoch": 130} {"train_loss": -4.698695659637451, "global_step": 5478, "epoch": 130} {"train_loss": -4.698497772216797, "global_step": 5479, "epoch": 130} {"train_loss": -4.724544048309326, "global_step": 5480, "epoch": 130} {"train_loss": -4.874185562133789, "global_step": 5481, "epoch": 130} {"train_loss": -4.914355278015137, "global_step": 5482, "epoch": 130} {"train_loss": -4.803325176239014, "global_step": 5483, "epoch": 130} {"train_loss": -4.787476539611816, "global_step": 5484, "epoch": 130} {"train_loss": -4.683393955230713, "global_step": 5485, "epoch": 130} {"train_loss": -4.809643268585205, "global_step": 5486, "epoch": 130} {"train_loss": -4.722817897796631, "global_step": 5487, "epoch": 130} {"train_loss": -4.83702278137207, "global_step": 5488, "epoch": 130} {"train_loss": -4.817214012145996, "global_step": 5489, "epoch": 130} {"train_loss": -4.83811092376709, "global_step": 5490, "epoch": 130} {"train_loss": -4.864943981170654, "global_step": 5491, "epoch": 130} {"train_loss": -4.591832160949707, "global_step": 5492, "epoch": 130} {"train_loss": -4.186727523803711, "global_step": 5493, "epoch": 130} {"train_loss": -4.711615085601807, "global_step": 5494, "epoch": 130} {"train_loss": -4.3536834716796875, "global_step": 5495, "epoch": 130} {"train_loss": -4.084455490112305, "global_step": 5496, "epoch": 130} {"train_loss": -3.931072950363159, "global_step": 5497, "epoch": 130} {"train_loss": -4.56695556640625, "global_step": 5498, "epoch": 130} {"train_loss": -2.888763427734375, "global_step": 5499, "epoch": 130} {"train_loss": -4.094364643096924, "global_step": 5500, "epoch": 130} {"train_loss": -4.584098083632333, "global_step": 5501, "epoch": 130, "val_loss": 119868.984375} {"train_loss": -2.9785115718841553, "global_step": 5502, "epoch": 131} {"train_loss": -2.8869142532348633, "global_step": 5503, "epoch": 131} {"train_loss": -3.3588905334472656, "global_step": 5504, "epoch": 131} {"train_loss": -3.8405325412750244, "global_step": 5505, "epoch": 131} {"train_loss": -2.277885913848877, "global_step": 5506, "epoch": 131} {"train_loss": -2.78438663482666, "global_step": 5507, "epoch": 131} {"train_loss": -4.031280517578125, "global_step": 5508, "epoch": 131} {"train_loss": -3.146085739135742, "global_step": 5509, "epoch": 131} {"train_loss": -3.757233142852783, "global_step": 5510, "epoch": 131} {"train_loss": -3.744448184967041, "global_step": 5511, "epoch": 131} {"train_loss": -3.883307456970215, "global_step": 5512, "epoch": 131} {"train_loss": -3.715733528137207, "global_step": 5513, "epoch": 131} {"train_loss": -3.998347282409668, "global_step": 5514, "epoch": 131} {"train_loss": -3.9656825065612793, "global_step": 5515, "epoch": 131} {"train_loss": -4.017879962921143, "global_step": 5516, "epoch": 131} {"train_loss": -3.8912317752838135, "global_step": 5517, "epoch": 131} {"train_loss": -3.884054183959961, "global_step": 5518, "epoch": 131} {"train_loss": -3.9666290283203125, "global_step": 5519, "epoch": 131} {"train_loss": -3.9744346141815186, "global_step": 5520, "epoch": 131} {"train_loss": -3.973958969116211, "global_step": 5521, "epoch": 131} {"train_loss": -4.095125198364258, "global_step": 5522, "epoch": 131} {"train_loss": -4.267666339874268, "global_step": 5523, "epoch": 131} {"train_loss": -4.145519256591797, "global_step": 5524, "epoch": 131} {"train_loss": -4.161537170410156, "global_step": 5525, "epoch": 131} {"train_loss": -4.097010135650635, "global_step": 5526, "epoch": 131} {"train_loss": -4.296645164489746, "global_step": 5527, "epoch": 131} {"train_loss": -4.293531894683838, "global_step": 5528, "epoch": 131} {"train_loss": -4.273332595825195, "global_step": 5529, "epoch": 131} {"train_loss": -4.315426826477051, "global_step": 5530, "epoch": 131} {"train_loss": -4.404494285583496, "global_step": 5531, "epoch": 131} {"train_loss": -4.279398441314697, "global_step": 5532, "epoch": 131} {"train_loss": -4.385812759399414, "global_step": 5533, "epoch": 131} {"train_loss": -4.482799530029297, "global_step": 5534, "epoch": 131} {"train_loss": -4.592504501342773, "global_step": 5535, "epoch": 131} {"train_loss": -4.446521759033203, "global_step": 5536, "epoch": 131} {"train_loss": -4.506582260131836, "global_step": 5537, "epoch": 131} {"train_loss": -4.461800575256348, "global_step": 5538, "epoch": 131} {"train_loss": -4.5219268798828125, "global_step": 5539, "epoch": 131} {"train_loss": -4.583782196044922, "global_step": 5540, "epoch": 131} {"train_loss": -4.638874530792236, "global_step": 5541, "epoch": 131} {"train_loss": -4.537854194641113, "global_step": 5542, "epoch": 131} {"train_loss": -4.010843481336321, "global_step": 5543, "epoch": 131, "val_loss": 85984.2265625} {"train_loss": -4.634088516235352, "global_step": 5544, "epoch": 132} {"train_loss": -4.7193450927734375, "global_step": 5545, "epoch": 132} {"train_loss": -4.632480621337891, "global_step": 5546, "epoch": 132} {"train_loss": -4.602738380432129, "global_step": 5547, "epoch": 132} {"train_loss": -4.509621620178223, "global_step": 5548, "epoch": 132} {"train_loss": -4.4931640625, "global_step": 5549, "epoch": 132} {"train_loss": -4.579441547393799, "global_step": 5550, "epoch": 132} {"train_loss": -4.712441444396973, "global_step": 5551, "epoch": 132} {"train_loss": -4.631770133972168, "global_step": 5552, "epoch": 132} {"train_loss": -4.562170028686523, "global_step": 5553, "epoch": 132} {"train_loss": -4.6234540939331055, "global_step": 5554, "epoch": 132} {"train_loss": -4.697352409362793, "global_step": 5555, "epoch": 132} {"train_loss": -4.506164073944092, "global_step": 5556, "epoch": 132} {"train_loss": -4.544698238372803, "global_step": 5557, "epoch": 132} {"train_loss": -4.484842300415039, "global_step": 5558, "epoch": 132} {"train_loss": -4.451986789703369, "global_step": 5559, "epoch": 132} {"train_loss": -4.8641438484191895, "global_step": 5560, "epoch": 132} {"train_loss": -4.568018913269043, "global_step": 5561, "epoch": 132} {"train_loss": -4.440276145935059, "global_step": 5562, "epoch": 132} {"train_loss": -4.513385772705078, "global_step": 5563, "epoch": 132} {"train_loss": -4.621413230895996, "global_step": 5564, "epoch": 132} {"train_loss": -4.533607482910156, "global_step": 5565, "epoch": 132} {"train_loss": -4.617339134216309, "global_step": 5566, "epoch": 132} {"train_loss": -4.604307651519775, "global_step": 5567, "epoch": 132} {"train_loss": -4.7328596115112305, "global_step": 5568, "epoch": 132} {"train_loss": -4.570976257324219, "global_step": 5569, "epoch": 132} {"train_loss": -4.558558940887451, "global_step": 5570, "epoch": 132} {"train_loss": -4.725163459777832, "global_step": 5571, "epoch": 132} {"train_loss": -4.586828708648682, "global_step": 5572, "epoch": 132} {"train_loss": -4.663987159729004, "global_step": 5573, "epoch": 132} {"train_loss": -4.690566062927246, "global_step": 5574, "epoch": 132} {"train_loss": -4.833120822906494, "global_step": 5575, "epoch": 132} {"train_loss": -4.783349990844727, "global_step": 5576, "epoch": 132} {"train_loss": -4.539165496826172, "global_step": 5577, "epoch": 132} {"train_loss": -4.84678840637207, "global_step": 5578, "epoch": 132} {"train_loss": -4.801901817321777, "global_step": 5579, "epoch": 132} {"train_loss": -4.821913242340088, "global_step": 5580, "epoch": 132} {"train_loss": -4.81193733215332, "global_step": 5581, "epoch": 132} {"train_loss": -4.601855754852295, "global_step": 5582, "epoch": 132} {"train_loss": -4.710996627807617, "global_step": 5583, "epoch": 132} {"train_loss": -4.714822292327881, "global_step": 5584, "epoch": 132} {"train_loss": -4.639596939086914, "global_step": 5585, "epoch": 132, "val_loss": 87394.859375} {"train_loss": -4.567239761352539, "global_step": 5586, "epoch": 133} {"train_loss": -4.6823649406433105, "global_step": 5587, "epoch": 133} {"train_loss": -4.7487592697143555, "global_step": 5588, "epoch": 133} {"train_loss": -4.676698684692383, "global_step": 5589, "epoch": 133} {"train_loss": -4.740016460418701, "global_step": 5590, "epoch": 133} {"train_loss": -4.779734134674072, "global_step": 5591, "epoch": 133} {"train_loss": -4.678974151611328, "global_step": 5592, "epoch": 133} {"train_loss": -4.673230171203613, "global_step": 5593, "epoch": 133} {"train_loss": -4.66004753112793, "global_step": 5594, "epoch": 133} {"train_loss": -4.716030120849609, "global_step": 5595, "epoch": 133} {"train_loss": -4.58836555480957, "global_step": 5596, "epoch": 133} {"train_loss": -4.754868507385254, "global_step": 5597, "epoch": 133} {"train_loss": -4.688961029052734, "global_step": 5598, "epoch": 133} {"train_loss": -4.719959735870361, "global_step": 5599, "epoch": 133} {"train_loss": -4.664728164672852, "global_step": 5600, "epoch": 133} {"train_loss": -4.79856538772583, "global_step": 5601, "epoch": 133} {"train_loss": -4.692549705505371, "global_step": 5602, "epoch": 133} {"train_loss": -4.651974678039551, "global_step": 5603, "epoch": 133} {"train_loss": -4.706258773803711, "global_step": 5604, "epoch": 133} {"train_loss": -4.677400588989258, "global_step": 5605, "epoch": 133} {"train_loss": -4.8148603439331055, "global_step": 5606, "epoch": 133} {"train_loss": -4.590373992919922, "global_step": 5607, "epoch": 133} {"train_loss": -4.892505645751953, "global_step": 5608, "epoch": 133} {"train_loss": -4.73153018951416, "global_step": 5609, "epoch": 133} {"train_loss": -4.7689032554626465, "global_step": 5610, "epoch": 133} {"train_loss": -4.697972297668457, "global_step": 5611, "epoch": 133} {"train_loss": -4.645906448364258, "global_step": 5612, "epoch": 133} {"train_loss": -4.7981061935424805, "global_step": 5613, "epoch": 133} {"train_loss": -4.697165489196777, "global_step": 5614, "epoch": 133} {"train_loss": -4.630084991455078, "global_step": 5615, "epoch": 133} {"train_loss": -4.674419403076172, "global_step": 5616, "epoch": 133} {"train_loss": -4.79884672164917, "global_step": 5617, "epoch": 133} {"train_loss": -4.7885026931762695, "global_step": 5618, "epoch": 133} {"train_loss": -4.930063247680664, "global_step": 5619, "epoch": 133} {"train_loss": -4.7772064208984375, "global_step": 5620, "epoch": 133} {"train_loss": -4.739714622497559, "global_step": 5621, "epoch": 133} {"train_loss": -4.76950740814209, "global_step": 5622, "epoch": 133} {"train_loss": -4.844022750854492, "global_step": 5623, "epoch": 133} {"train_loss": -4.854326248168945, "global_step": 5624, "epoch": 133} {"train_loss": -4.659836292266846, "global_step": 5625, "epoch": 133} {"train_loss": -4.688473701477051, "global_step": 5626, "epoch": 133} {"train_loss": -4.720579215458462, "global_step": 5627, "epoch": 133, "val_loss": 86145.6640625} {"train_loss": -4.628791332244873, "global_step": 5628, "epoch": 134} {"train_loss": -4.710819244384766, "global_step": 5629, "epoch": 134} {"train_loss": -4.663311958312988, "global_step": 5630, "epoch": 134} {"train_loss": -4.580106258392334, "global_step": 5631, "epoch": 134} {"train_loss": -4.565115451812744, "global_step": 5632, "epoch": 134} {"train_loss": -4.663863182067871, "global_step": 5633, "epoch": 134} {"train_loss": -4.941544532775879, "global_step": 5634, "epoch": 134} {"train_loss": -4.80879020690918, "global_step": 5635, "epoch": 134} {"train_loss": -4.678150177001953, "global_step": 5636, "epoch": 134} {"train_loss": -4.776654243469238, "global_step": 5637, "epoch": 134} {"train_loss": -4.694324493408203, "global_step": 5638, "epoch": 134} {"train_loss": -4.556975364685059, "global_step": 5639, "epoch": 134} {"train_loss": -4.699785232543945, "global_step": 5640, "epoch": 134} {"train_loss": -4.702157020568848, "global_step": 5641, "epoch": 134} {"train_loss": -4.711256980895996, "global_step": 5642, "epoch": 134} {"train_loss": -4.694055080413818, "global_step": 5643, "epoch": 134} {"train_loss": -4.635643482208252, "global_step": 5644, "epoch": 134} {"train_loss": -4.610308647155762, "global_step": 5645, "epoch": 134} {"train_loss": -4.727669715881348, "global_step": 5646, "epoch": 134} {"train_loss": -4.830321788787842, "global_step": 5647, "epoch": 134} {"train_loss": -4.694873809814453, "global_step": 5648, "epoch": 134} {"train_loss": -4.729936599731445, "global_step": 5649, "epoch": 134} {"train_loss": -4.845497131347656, "global_step": 5650, "epoch": 134} {"train_loss": -4.765317440032959, "global_step": 5651, "epoch": 134} {"train_loss": -4.700782775878906, "global_step": 5652, "epoch": 134} {"train_loss": -4.7524261474609375, "global_step": 5653, "epoch": 134} {"train_loss": -4.897929668426514, "global_step": 5654, "epoch": 134} {"train_loss": -4.738346099853516, "global_step": 5655, "epoch": 134} {"train_loss": -4.668737411499023, "global_step": 5656, "epoch": 134} {"train_loss": -4.608284950256348, "global_step": 5657, "epoch": 134} {"train_loss": -4.843840599060059, "global_step": 5658, "epoch": 134} {"train_loss": -4.734148025512695, "global_step": 5659, "epoch": 134} {"train_loss": -4.641748428344727, "global_step": 5660, "epoch": 134} {"train_loss": -4.646021366119385, "global_step": 5661, "epoch": 134} {"train_loss": -4.8064069747924805, "global_step": 5662, "epoch": 134} {"train_loss": -4.906155586242676, "global_step": 5663, "epoch": 134} {"train_loss": -4.887253761291504, "global_step": 5664, "epoch": 134} {"train_loss": -4.847508907318115, "global_step": 5665, "epoch": 134} {"train_loss": -4.760087013244629, "global_step": 5666, "epoch": 134} {"train_loss": -4.7684221267700195, "global_step": 5667, "epoch": 134} {"train_loss": -4.673158645629883, "global_step": 5668, "epoch": 134} {"train_loss": -4.72390840167091, "global_step": 5669, "epoch": 134, "val_loss": 86135.40625} {"train_loss": -4.842844009399414, "global_step": 5670, "epoch": 135} {"train_loss": -4.568449020385742, "global_step": 5671, "epoch": 135} {"train_loss": -4.688910484313965, "global_step": 5672, "epoch": 135} {"train_loss": -4.889670372009277, "global_step": 5673, "epoch": 135} {"train_loss": -4.8104567527771, "global_step": 5674, "epoch": 135} {"train_loss": -4.703165054321289, "global_step": 5675, "epoch": 135} {"train_loss": -4.700458526611328, "global_step": 5676, "epoch": 135} {"train_loss": -4.73747444152832, "global_step": 5677, "epoch": 135} {"train_loss": -4.793243408203125, "global_step": 5678, "epoch": 135} {"train_loss": -4.8490071296691895, "global_step": 5679, "epoch": 135} {"train_loss": -4.709949493408203, "global_step": 5680, "epoch": 135} {"train_loss": -4.713466644287109, "global_step": 5681, "epoch": 135} {"train_loss": -4.716667175292969, "global_step": 5682, "epoch": 135} {"train_loss": -4.6778974533081055, "global_step": 5683, "epoch": 135} {"train_loss": -4.646581172943115, "global_step": 5684, "epoch": 135} {"train_loss": -4.7280755043029785, "global_step": 5685, "epoch": 135} {"train_loss": -4.679451942443848, "global_step": 5686, "epoch": 135} {"train_loss": -4.705015182495117, "global_step": 5687, "epoch": 135} {"train_loss": -4.868507385253906, "global_step": 5688, "epoch": 135} {"train_loss": -4.701718330383301, "global_step": 5689, "epoch": 135} {"train_loss": -4.531682014465332, "global_step": 5690, "epoch": 135} {"train_loss": -4.755157470703125, "global_step": 5691, "epoch": 135} {"train_loss": -4.684581279754639, "global_step": 5692, "epoch": 135} {"train_loss": -4.945930480957031, "global_step": 5693, "epoch": 135} {"train_loss": -4.866316318511963, "global_step": 5694, "epoch": 135} {"train_loss": -4.5392656326293945, "global_step": 5695, "epoch": 135} {"train_loss": -4.579724311828613, "global_step": 5696, "epoch": 135} {"train_loss": -4.485846519470215, "global_step": 5697, "epoch": 135} {"train_loss": -4.610699653625488, "global_step": 5698, "epoch": 135} {"train_loss": -4.718523025512695, "global_step": 5699, "epoch": 135} {"train_loss": -4.756811618804932, "global_step": 5700, "epoch": 135} {"train_loss": -4.731533527374268, "global_step": 5701, "epoch": 135} {"train_loss": -4.673051834106445, "global_step": 5702, "epoch": 135} {"train_loss": -4.636178970336914, "global_step": 5703, "epoch": 135} {"train_loss": -4.776918411254883, "global_step": 5704, "epoch": 135} {"train_loss": -4.94734001159668, "global_step": 5705, "epoch": 135} {"train_loss": -4.78488302230835, "global_step": 5706, "epoch": 135} {"train_loss": -4.77009391784668, "global_step": 5707, "epoch": 135} {"train_loss": -4.819860458374023, "global_step": 5708, "epoch": 135} {"train_loss": -4.700328350067139, "global_step": 5709, "epoch": 135} {"train_loss": -4.6432366371154785, "global_step": 5710, "epoch": 135} {"train_loss": -4.723558970860073, "global_step": 5711, "epoch": 135, "val_loss": 84593.9140625} {"train_loss": -4.760387897491455, "global_step": 5712, "epoch": 136} {"train_loss": -4.711613655090332, "global_step": 5713, "epoch": 136} {"train_loss": -4.757720947265625, "global_step": 5714, "epoch": 136} {"train_loss": -4.773180961608887, "global_step": 5715, "epoch": 136} {"train_loss": -4.675120830535889, "global_step": 5716, "epoch": 136} {"train_loss": -4.823095798492432, "global_step": 5717, "epoch": 136} {"train_loss": -4.756976127624512, "global_step": 5718, "epoch": 136} {"train_loss": -4.746376037597656, "global_step": 5719, "epoch": 136} {"train_loss": -4.5018391609191895, "global_step": 5720, "epoch": 136} {"train_loss": -4.53339147567749, "global_step": 5721, "epoch": 136} {"train_loss": -4.682058811187744, "global_step": 5722, "epoch": 136} {"train_loss": -4.608321189880371, "global_step": 5723, "epoch": 136} {"train_loss": -4.860713005065918, "global_step": 5724, "epoch": 136} {"train_loss": -4.676451206207275, "global_step": 5725, "epoch": 136} {"train_loss": -4.702164649963379, "global_step": 5726, "epoch": 136} {"train_loss": -4.777469635009766, "global_step": 5727, "epoch": 136} {"train_loss": -4.760514736175537, "global_step": 5728, "epoch": 136} {"train_loss": -4.740784168243408, "global_step": 5729, "epoch": 136} {"train_loss": -4.7980852127075195, "global_step": 5730, "epoch": 136} {"train_loss": -4.825310707092285, "global_step": 5731, "epoch": 136} {"train_loss": -4.840719223022461, "global_step": 5732, "epoch": 136} {"train_loss": -4.7423095703125, "global_step": 5733, "epoch": 136} {"train_loss": -4.622097015380859, "global_step": 5734, "epoch": 136} {"train_loss": -4.777378082275391, "global_step": 5735, "epoch": 136} {"train_loss": -4.557523727416992, "global_step": 5736, "epoch": 136} {"train_loss": -4.662355899810791, "global_step": 5737, "epoch": 136} {"train_loss": -4.798089981079102, "global_step": 5738, "epoch": 136} {"train_loss": -4.7788848876953125, "global_step": 5739, "epoch": 136} {"train_loss": -4.630814552307129, "global_step": 5740, "epoch": 136} {"train_loss": -4.643749713897705, "global_step": 5741, "epoch": 136} {"train_loss": -4.746006488800049, "global_step": 5742, "epoch": 136} {"train_loss": -4.852034568786621, "global_step": 5743, "epoch": 136} {"train_loss": -4.752430438995361, "global_step": 5744, "epoch": 136} {"train_loss": -4.675845146179199, "global_step": 5745, "epoch": 136} {"train_loss": -4.804426193237305, "global_step": 5746, "epoch": 136} {"train_loss": -4.8360724449157715, "global_step": 5747, "epoch": 136} {"train_loss": -4.80526065826416, "global_step": 5748, "epoch": 136} {"train_loss": -4.828752040863037, "global_step": 5749, "epoch": 136} {"train_loss": -4.698920726776123, "global_step": 5750, "epoch": 136} {"train_loss": -4.766115665435791, "global_step": 5751, "epoch": 136} {"train_loss": -4.4179511070251465, "global_step": 5752, "epoch": 136} {"train_loss": -4.7240134761447, "global_step": 5753, "epoch": 136, "val_loss": 84546.8515625} {"train_loss": -4.820610046386719, "global_step": 5754, "epoch": 137} {"train_loss": -4.8204216957092285, "global_step": 5755, "epoch": 137} {"train_loss": -4.512399673461914, "global_step": 5756, "epoch": 137} {"train_loss": -4.885501861572266, "global_step": 5757, "epoch": 137} {"train_loss": -4.747185230255127, "global_step": 5758, "epoch": 137} {"train_loss": -4.677853584289551, "global_step": 5759, "epoch": 137} {"train_loss": -4.736907958984375, "global_step": 5760, "epoch": 137} {"train_loss": -4.845593452453613, "global_step": 5761, "epoch": 137} {"train_loss": -4.797678470611572, "global_step": 5762, "epoch": 137} {"train_loss": -4.72572135925293, "global_step": 5763, "epoch": 137} {"train_loss": -4.534830093383789, "global_step": 5764, "epoch": 137} {"train_loss": -4.796740531921387, "global_step": 5765, "epoch": 137} {"train_loss": -4.759084701538086, "global_step": 5766, "epoch": 137} {"train_loss": -4.770471096038818, "global_step": 5767, "epoch": 137} {"train_loss": -4.624770164489746, "global_step": 5768, "epoch": 137} {"train_loss": -4.87471866607666, "global_step": 5769, "epoch": 137} {"train_loss": -4.858591079711914, "global_step": 5770, "epoch": 137} {"train_loss": -4.685879230499268, "global_step": 5771, "epoch": 137} {"train_loss": -4.778939247131348, "global_step": 5772, "epoch": 137} {"train_loss": -4.661648750305176, "global_step": 5773, "epoch": 137} {"train_loss": -4.742980480194092, "global_step": 5774, "epoch": 137} {"train_loss": -4.736970901489258, "global_step": 5775, "epoch": 137} {"train_loss": -4.767200469970703, "global_step": 5776, "epoch": 137} {"train_loss": -4.834562301635742, "global_step": 5777, "epoch": 137} {"train_loss": -4.779056072235107, "global_step": 5778, "epoch": 137} {"train_loss": -4.768012523651123, "global_step": 5779, "epoch": 137} {"train_loss": -4.655766487121582, "global_step": 5780, "epoch": 137} {"train_loss": -4.656131744384766, "global_step": 5781, "epoch": 137} {"train_loss": -4.59766149520874, "global_step": 5782, "epoch": 137} {"train_loss": -4.705240249633789, "global_step": 5783, "epoch": 137} {"train_loss": -4.851669788360596, "global_step": 5784, "epoch": 137} {"train_loss": -4.806434631347656, "global_step": 5785, "epoch": 137} {"train_loss": -4.598760604858398, "global_step": 5786, "epoch": 137} {"train_loss": -4.706023216247559, "global_step": 5787, "epoch": 137} {"train_loss": -4.64648962020874, "global_step": 5788, "epoch": 137} {"train_loss": -4.7092180252075195, "global_step": 5789, "epoch": 137} {"train_loss": -4.928779602050781, "global_step": 5790, "epoch": 137} {"train_loss": -4.818601131439209, "global_step": 5791, "epoch": 137} {"train_loss": -4.782827377319336, "global_step": 5792, "epoch": 137} {"train_loss": -4.697274208068848, "global_step": 5793, "epoch": 137} {"train_loss": -4.6912336349487305, "global_step": 5794, "epoch": 137} {"train_loss": -4.743300801231747, "global_step": 5795, "epoch": 137, "val_loss": 82845.96875} {"train_loss": -4.781612873077393, "global_step": 5796, "epoch": 138} {"train_loss": -4.634740829467773, "global_step": 5797, "epoch": 138} {"train_loss": -4.59561824798584, "global_step": 5798, "epoch": 138} {"train_loss": -4.81036376953125, "global_step": 5799, "epoch": 138} {"train_loss": -4.91340970993042, "global_step": 5800, "epoch": 138} {"train_loss": -4.797588348388672, "global_step": 5801, "epoch": 138} {"train_loss": -4.781498908996582, "global_step": 5802, "epoch": 138} {"train_loss": -4.7055158615112305, "global_step": 5803, "epoch": 138} {"train_loss": -4.898250579833984, "global_step": 5804, "epoch": 138} {"train_loss": -4.818179130554199, "global_step": 5805, "epoch": 138} {"train_loss": -4.707871437072754, "global_step": 5806, "epoch": 138} {"train_loss": -4.742715835571289, "global_step": 5807, "epoch": 138} {"train_loss": -4.762394428253174, "global_step": 5808, "epoch": 138} {"train_loss": -4.768310070037842, "global_step": 5809, "epoch": 138} {"train_loss": -4.764732360839844, "global_step": 5810, "epoch": 138} {"train_loss": -4.768169403076172, "global_step": 5811, "epoch": 138} {"train_loss": -4.79742431640625, "global_step": 5812, "epoch": 138} {"train_loss": -4.697153091430664, "global_step": 5813, "epoch": 138} {"train_loss": -4.647629737854004, "global_step": 5814, "epoch": 138} {"train_loss": -4.661198616027832, "global_step": 5815, "epoch": 138} {"train_loss": -4.838940143585205, "global_step": 5816, "epoch": 138} {"train_loss": -4.786130428314209, "global_step": 5817, "epoch": 138} {"train_loss": -4.635499000549316, "global_step": 5818, "epoch": 138} {"train_loss": -4.594264984130859, "global_step": 5819, "epoch": 138} {"train_loss": -4.783710479736328, "global_step": 5820, "epoch": 138} {"train_loss": -4.929474353790283, "global_step": 5821, "epoch": 138} {"train_loss": -4.792654514312744, "global_step": 5822, "epoch": 138} {"train_loss": -4.802567481994629, "global_step": 5823, "epoch": 138} {"train_loss": -4.895393371582031, "global_step": 5824, "epoch": 138} {"train_loss": -4.871884346008301, "global_step": 5825, "epoch": 138} {"train_loss": -4.729023456573486, "global_step": 5826, "epoch": 138} {"train_loss": -4.751023292541504, "global_step": 5827, "epoch": 138} {"train_loss": -5.006924152374268, "global_step": 5828, "epoch": 138} {"train_loss": -4.611172676086426, "global_step": 5829, "epoch": 138} {"train_loss": -4.824662208557129, "global_step": 5830, "epoch": 138} {"train_loss": -4.4816575050354, "global_step": 5831, "epoch": 138} {"train_loss": -4.534207344055176, "global_step": 5832, "epoch": 138} {"train_loss": -4.542088508605957, "global_step": 5833, "epoch": 138} {"train_loss": -4.699652671813965, "global_step": 5834, "epoch": 138} {"train_loss": -4.777642250061035, "global_step": 5835, "epoch": 138} {"train_loss": -4.855348587036133, "global_step": 5836, "epoch": 138} {"train_loss": -4.752847943987165, "global_step": 5837, "epoch": 138, "val_loss": 84632.8203125} {"train_loss": -4.713504791259766, "global_step": 5838, "epoch": 139} {"train_loss": -4.56517219543457, "global_step": 5839, "epoch": 139} {"train_loss": -4.832235813140869, "global_step": 5840, "epoch": 139} {"train_loss": -4.796880722045898, "global_step": 5841, "epoch": 139} {"train_loss": -4.703341484069824, "global_step": 5842, "epoch": 139} {"train_loss": -4.54625129699707, "global_step": 5843, "epoch": 139} {"train_loss": -4.679867267608643, "global_step": 5844, "epoch": 139} {"train_loss": -4.690783977508545, "global_step": 5845, "epoch": 139} {"train_loss": -4.8274946212768555, "global_step": 5846, "epoch": 139} {"train_loss": -4.84694766998291, "global_step": 5847, "epoch": 139} {"train_loss": -4.8224029541015625, "global_step": 5848, "epoch": 139} {"train_loss": -4.712051868438721, "global_step": 5849, "epoch": 139} {"train_loss": -4.8265862464904785, "global_step": 5850, "epoch": 139} {"train_loss": -4.838581562042236, "global_step": 5851, "epoch": 139} {"train_loss": -4.758699417114258, "global_step": 5852, "epoch": 139} {"train_loss": -4.665691375732422, "global_step": 5853, "epoch": 139} {"train_loss": -4.657779693603516, "global_step": 5854, "epoch": 139} {"train_loss": -4.87178897857666, "global_step": 5855, "epoch": 139} {"train_loss": -4.745608806610107, "global_step": 5856, "epoch": 139} {"train_loss": -4.607613563537598, "global_step": 5857, "epoch": 139} {"train_loss": -4.7960286140441895, "global_step": 5858, "epoch": 139} {"train_loss": -4.8692827224731445, "global_step": 5859, "epoch": 139} {"train_loss": -4.791897773742676, "global_step": 5860, "epoch": 139} {"train_loss": -4.788963317871094, "global_step": 5861, "epoch": 139} {"train_loss": -4.596156120300293, "global_step": 5862, "epoch": 139} {"train_loss": -4.636893272399902, "global_step": 5863, "epoch": 139} {"train_loss": -4.857510566711426, "global_step": 5864, "epoch": 139} {"train_loss": -4.744361400604248, "global_step": 5865, "epoch": 139} {"train_loss": -4.714352607727051, "global_step": 5866, "epoch": 139} {"train_loss": -4.931733131408691, "global_step": 5867, "epoch": 139} {"train_loss": -4.725476264953613, "global_step": 5868, "epoch": 139} {"train_loss": -4.743953704833984, "global_step": 5869, "epoch": 139} {"train_loss": -4.613973617553711, "global_step": 5870, "epoch": 139} {"train_loss": -4.803275108337402, "global_step": 5871, "epoch": 139} {"train_loss": -4.841551780700684, "global_step": 5872, "epoch": 139} {"train_loss": -4.738308906555176, "global_step": 5873, "epoch": 139} {"train_loss": -4.802398681640625, "global_step": 5874, "epoch": 139} {"train_loss": -4.821462631225586, "global_step": 5875, "epoch": 139} {"train_loss": -4.621850967407227, "global_step": 5876, "epoch": 139} {"train_loss": -4.619877338409424, "global_step": 5877, "epoch": 139} {"train_loss": -4.789949893951416, "global_step": 5878, "epoch": 139} {"train_loss": -4.74384635970706, "global_step": 5879, "epoch": 139, "val_loss": 82566.984375} {"train_loss": -4.735356330871582, "global_step": 5880, "epoch": 140} {"train_loss": -4.76278018951416, "global_step": 5881, "epoch": 140} {"train_loss": -4.6622161865234375, "global_step": 5882, "epoch": 140} {"train_loss": -4.738069534301758, "global_step": 5883, "epoch": 140} {"train_loss": -4.914955139160156, "global_step": 5884, "epoch": 140} {"train_loss": -4.930178642272949, "global_step": 5885, "epoch": 140} {"train_loss": -4.77764368057251, "global_step": 5886, "epoch": 140} {"train_loss": -4.7355194091796875, "global_step": 5887, "epoch": 140} {"train_loss": -4.743565559387207, "global_step": 5888, "epoch": 140} {"train_loss": -4.441230773925781, "global_step": 5889, "epoch": 140} {"train_loss": -4.473546504974365, "global_step": 5890, "epoch": 140} {"train_loss": -4.710729598999023, "global_step": 5891, "epoch": 140} {"train_loss": -4.685366630554199, "global_step": 5892, "epoch": 140} {"train_loss": -4.819021224975586, "global_step": 5893, "epoch": 140} {"train_loss": -4.823640823364258, "global_step": 5894, "epoch": 140} {"train_loss": -4.742231369018555, "global_step": 5895, "epoch": 140} {"train_loss": -4.774372100830078, "global_step": 5896, "epoch": 140} {"train_loss": -4.730145454406738, "global_step": 5897, "epoch": 140} {"train_loss": -4.786355972290039, "global_step": 5898, "epoch": 140} {"train_loss": -4.6806159019470215, "global_step": 5899, "epoch": 140} {"train_loss": -4.798477649688721, "global_step": 5900, "epoch": 140} {"train_loss": -4.844547748565674, "global_step": 5901, "epoch": 140} {"train_loss": -4.604204177856445, "global_step": 5902, "epoch": 140} {"train_loss": -4.972707748413086, "global_step": 5903, "epoch": 140} {"train_loss": -4.794648170471191, "global_step": 5904, "epoch": 140} {"train_loss": -4.520081520080566, "global_step": 5905, "epoch": 140} {"train_loss": -4.673550128936768, "global_step": 5906, "epoch": 140} {"train_loss": -4.820024013519287, "global_step": 5907, "epoch": 140} {"train_loss": -4.567122459411621, "global_step": 5908, "epoch": 140} {"train_loss": -4.590417861938477, "global_step": 5909, "epoch": 140} {"train_loss": -4.78895902633667, "global_step": 5910, "epoch": 140} {"train_loss": -4.560059547424316, "global_step": 5911, "epoch": 140} {"train_loss": -4.687575817108154, "global_step": 5912, "epoch": 140} {"train_loss": -4.783206939697266, "global_step": 5913, "epoch": 140} {"train_loss": -4.725200176239014, "global_step": 5914, "epoch": 140} {"train_loss": -4.398186683654785, "global_step": 5915, "epoch": 140} {"train_loss": -4.819154739379883, "global_step": 5916, "epoch": 140} {"train_loss": -4.664149284362793, "global_step": 5917, "epoch": 140} {"train_loss": -4.711865425109863, "global_step": 5918, "epoch": 140} {"train_loss": -4.771938800811768, "global_step": 5919, "epoch": 140} {"train_loss": -4.770076751708984, "global_step": 5920, "epoch": 140} {"train_loss": -4.723213865643456, "global_step": 5921, "epoch": 140, "val_loss": 81850.234375} {"train_loss": -4.790596008300781, "global_step": 5922, "epoch": 141} {"train_loss": -4.869375228881836, "global_step": 5923, "epoch": 141} {"train_loss": -4.843815803527832, "global_step": 5924, "epoch": 141} {"train_loss": -4.6344499588012695, "global_step": 5925, "epoch": 141} {"train_loss": -4.686858177185059, "global_step": 5926, "epoch": 141} {"train_loss": -4.869306564331055, "global_step": 5927, "epoch": 141} {"train_loss": -4.7954206466674805, "global_step": 5928, "epoch": 141} {"train_loss": -4.635477542877197, "global_step": 5929, "epoch": 141} {"train_loss": -4.759617328643799, "global_step": 5930, "epoch": 141} {"train_loss": -4.823481559753418, "global_step": 5931, "epoch": 141} {"train_loss": -4.779335021972656, "global_step": 5932, "epoch": 141} {"train_loss": -4.656294822692871, "global_step": 5933, "epoch": 141} {"train_loss": -4.780541896820068, "global_step": 5934, "epoch": 141} {"train_loss": -4.804183006286621, "global_step": 5935, "epoch": 141} {"train_loss": -4.912998676300049, "global_step": 5936, "epoch": 141} {"train_loss": -4.816732883453369, "global_step": 5937, "epoch": 141} {"train_loss": -4.865527629852295, "global_step": 5938, "epoch": 141} {"train_loss": -4.770216941833496, "global_step": 5939, "epoch": 141} {"train_loss": -4.872617721557617, "global_step": 5940, "epoch": 141} {"train_loss": -4.678556442260742, "global_step": 5941, "epoch": 141} {"train_loss": -4.922141075134277, "global_step": 5942, "epoch": 141} {"train_loss": -4.727328300476074, "global_step": 5943, "epoch": 141} {"train_loss": -4.75727653503418, "global_step": 5944, "epoch": 141} {"train_loss": -4.699615955352783, "global_step": 5945, "epoch": 141} {"train_loss": -4.692409992218018, "global_step": 5946, "epoch": 141} {"train_loss": -4.643179893493652, "global_step": 5947, "epoch": 141} {"train_loss": -4.597301959991455, "global_step": 5948, "epoch": 141} {"train_loss": -4.7572197914123535, "global_step": 5949, "epoch": 141} {"train_loss": -4.759549617767334, "global_step": 5950, "epoch": 141} {"train_loss": -4.654896259307861, "global_step": 5951, "epoch": 141} {"train_loss": -4.649834632873535, "global_step": 5952, "epoch": 141} {"train_loss": -4.747875690460205, "global_step": 5953, "epoch": 141} {"train_loss": -4.896329402923584, "global_step": 5954, "epoch": 141} {"train_loss": -4.775171279907227, "global_step": 5955, "epoch": 141} {"train_loss": -4.670280456542969, "global_step": 5956, "epoch": 141} {"train_loss": -4.846250534057617, "global_step": 5957, "epoch": 141} {"train_loss": -4.884329795837402, "global_step": 5958, "epoch": 141} {"train_loss": -4.822025299072266, "global_step": 5959, "epoch": 141} {"train_loss": -4.847995758056641, "global_step": 5960, "epoch": 141} {"train_loss": -4.676530838012695, "global_step": 5961, "epoch": 141} {"train_loss": -4.708412170410156, "global_step": 5962, "epoch": 141} {"train_loss": -4.762317157927013, "global_step": 5963, "epoch": 141, "val_loss": 81176.609375} {"train_loss": -4.845753192901611, "global_step": 5964, "epoch": 142} {"train_loss": -4.929925918579102, "global_step": 5965, "epoch": 142} {"train_loss": -4.775263786315918, "global_step": 5966, "epoch": 142} {"train_loss": -4.5285234451293945, "global_step": 5967, "epoch": 142} {"train_loss": -4.568140983581543, "global_step": 5968, "epoch": 142} {"train_loss": -4.947333812713623, "global_step": 5969, "epoch": 142} {"train_loss": -4.824307918548584, "global_step": 5970, "epoch": 142} {"train_loss": -4.79998779296875, "global_step": 5971, "epoch": 142} {"train_loss": -4.770984649658203, "global_step": 5972, "epoch": 142} {"train_loss": -4.7107133865356445, "global_step": 5973, "epoch": 142} {"train_loss": -4.753771781921387, "global_step": 5974, "epoch": 142} {"train_loss": -4.832610130310059, "global_step": 5975, "epoch": 142} {"train_loss": -4.788681983947754, "global_step": 5976, "epoch": 142} {"train_loss": -4.8771562576293945, "global_step": 5977, "epoch": 142} {"train_loss": -4.863764762878418, "global_step": 5978, "epoch": 142} {"train_loss": -4.725405693054199, "global_step": 5979, "epoch": 142} {"train_loss": -4.834604263305664, "global_step": 5980, "epoch": 142} {"train_loss": -4.8623528480529785, "global_step": 5981, "epoch": 142} {"train_loss": -4.761434078216553, "global_step": 5982, "epoch": 142} {"train_loss": -4.87856388092041, "global_step": 5983, "epoch": 142} {"train_loss": -4.812082290649414, "global_step": 5984, "epoch": 142} {"train_loss": -4.845605850219727, "global_step": 5985, "epoch": 142} {"train_loss": -4.774838447570801, "global_step": 5986, "epoch": 142} {"train_loss": -4.614588737487793, "global_step": 5987, "epoch": 142} {"train_loss": -4.867306709289551, "global_step": 5988, "epoch": 142} {"train_loss": -4.676854133605957, "global_step": 5989, "epoch": 142} {"train_loss": -4.866690635681152, "global_step": 5990, "epoch": 142} {"train_loss": -4.780125141143799, "global_step": 5991, "epoch": 142} {"train_loss": -4.884796142578125, "global_step": 5992, "epoch": 142} {"train_loss": -4.9031877517700195, "global_step": 5993, "epoch": 142} {"train_loss": -4.703160762786865, "global_step": 5994, "epoch": 142} {"train_loss": -4.7080302238464355, "global_step": 5995, "epoch": 142} {"train_loss": -4.670291900634766, "global_step": 5996, "epoch": 142} {"train_loss": -4.882829666137695, "global_step": 5997, "epoch": 142} {"train_loss": -4.894386291503906, "global_step": 5998, "epoch": 142} {"train_loss": -4.83028507232666, "global_step": 5999, "epoch": 142} {"train_loss": -4.7113494873046875, "global_step": 6000, "epoch": 142} {"train_loss": -4.74785041809082, "global_step": 6001, "epoch": 142} {"train_loss": -4.664722442626953, "global_step": 6002, "epoch": 142} {"train_loss": -4.73225736618042, "global_step": 6003, "epoch": 142} {"train_loss": -4.79470157623291, "global_step": 6004, "epoch": 142} {"train_loss": -4.788177149636405, "global_step": 6005, "epoch": 142, "val_loss": 81608.7734375} {"train_loss": -4.714960098266602, "global_step": 6006, "epoch": 143} {"train_loss": -4.752346038818359, "global_step": 6007, "epoch": 143} {"train_loss": -4.722207069396973, "global_step": 6008, "epoch": 143} {"train_loss": -4.784268379211426, "global_step": 6009, "epoch": 143} {"train_loss": -4.718250274658203, "global_step": 6010, "epoch": 143} {"train_loss": -4.72699499130249, "global_step": 6011, "epoch": 143} {"train_loss": -4.866603851318359, "global_step": 6012, "epoch": 143} {"train_loss": -4.820096969604492, "global_step": 6013, "epoch": 143} {"train_loss": -4.856842041015625, "global_step": 6014, "epoch": 143} {"train_loss": -4.727146148681641, "global_step": 6015, "epoch": 143} {"train_loss": -4.697299957275391, "global_step": 6016, "epoch": 143} {"train_loss": -4.772109508514404, "global_step": 6017, "epoch": 143} {"train_loss": -4.775692939758301, "global_step": 6018, "epoch": 143} {"train_loss": -4.611881256103516, "global_step": 6019, "epoch": 143} {"train_loss": -4.657071113586426, "global_step": 6020, "epoch": 143} {"train_loss": -4.717850685119629, "global_step": 6021, "epoch": 143} {"train_loss": -4.907548427581787, "global_step": 6022, "epoch": 143} {"train_loss": -4.758622646331787, "global_step": 6023, "epoch": 143} {"train_loss": -4.797090530395508, "global_step": 6024, "epoch": 143} {"train_loss": -4.791070938110352, "global_step": 6025, "epoch": 143} {"train_loss": -4.775130271911621, "global_step": 6026, "epoch": 143} {"train_loss": -4.760863304138184, "global_step": 6027, "epoch": 143} {"train_loss": -4.799180030822754, "global_step": 6028, "epoch": 143} {"train_loss": -4.775650978088379, "global_step": 6029, "epoch": 143} {"train_loss": -4.916386604309082, "global_step": 6030, "epoch": 143} {"train_loss": -4.760079860687256, "global_step": 6031, "epoch": 143} {"train_loss": -4.894657611846924, "global_step": 6032, "epoch": 143} {"train_loss": -4.80470609664917, "global_step": 6033, "epoch": 143} {"train_loss": -4.79974889755249, "global_step": 6034, "epoch": 143} {"train_loss": -4.722831726074219, "global_step": 6035, "epoch": 143} {"train_loss": -4.835165500640869, "global_step": 6036, "epoch": 143} {"train_loss": -4.838409423828125, "global_step": 6037, "epoch": 143} {"train_loss": -4.821228504180908, "global_step": 6038, "epoch": 143} {"train_loss": -4.61000919342041, "global_step": 6039, "epoch": 143} {"train_loss": -4.452903747558594, "global_step": 6040, "epoch": 143} {"train_loss": -4.869288444519043, "global_step": 6041, "epoch": 143} {"train_loss": -4.770958423614502, "global_step": 6042, "epoch": 143} {"train_loss": -4.766711235046387, "global_step": 6043, "epoch": 143} {"train_loss": -4.797942161560059, "global_step": 6044, "epoch": 143} {"train_loss": -4.922264099121094, "global_step": 6045, "epoch": 143} {"train_loss": -4.866637229919434, "global_step": 6046, "epoch": 143} {"train_loss": -4.770302602222988, "global_step": 6047, "epoch": 143, "val_loss": 81137.375} {"train_loss": -4.925651550292969, "global_step": 6048, "epoch": 144} {"train_loss": -4.92258882522583, "global_step": 6049, "epoch": 144} {"train_loss": -4.913224220275879, "global_step": 6050, "epoch": 144} {"train_loss": -4.910510063171387, "global_step": 6051, "epoch": 144} {"train_loss": -4.955450057983398, "global_step": 6052, "epoch": 144} {"train_loss": -4.864534378051758, "global_step": 6053, "epoch": 144} {"train_loss": -4.771092414855957, "global_step": 6054, "epoch": 144} {"train_loss": -4.777178764343262, "global_step": 6055, "epoch": 144} {"train_loss": -4.740516185760498, "global_step": 6056, "epoch": 144} {"train_loss": -4.78166389465332, "global_step": 6057, "epoch": 144} {"train_loss": -4.786235332489014, "global_step": 6058, "epoch": 144} {"train_loss": -4.736201286315918, "global_step": 6059, "epoch": 144} {"train_loss": -4.705310821533203, "global_step": 6060, "epoch": 144} {"train_loss": -4.899181365966797, "global_step": 6061, "epoch": 144} {"train_loss": -4.826408863067627, "global_step": 6062, "epoch": 144} {"train_loss": -4.838808059692383, "global_step": 6063, "epoch": 144} {"train_loss": -4.805096626281738, "global_step": 6064, "epoch": 144} {"train_loss": -4.953751564025879, "global_step": 6065, "epoch": 144} {"train_loss": -4.70411491394043, "global_step": 6066, "epoch": 144} {"train_loss": -4.731680870056152, "global_step": 6067, "epoch": 144} {"train_loss": -4.857551574707031, "global_step": 6068, "epoch": 144} {"train_loss": -4.570191860198975, "global_step": 6069, "epoch": 144} {"train_loss": -4.779207229614258, "global_step": 6070, "epoch": 144} {"train_loss": -4.725688457489014, "global_step": 6071, "epoch": 144} {"train_loss": -4.835179328918457, "global_step": 6072, "epoch": 144} {"train_loss": -4.364749431610107, "global_step": 6073, "epoch": 144} {"train_loss": -4.61925745010376, "global_step": 6074, "epoch": 144} {"train_loss": -4.7736382484436035, "global_step": 6075, "epoch": 144} {"train_loss": -4.7873125076293945, "global_step": 6076, "epoch": 144} {"train_loss": -4.60096549987793, "global_step": 6077, "epoch": 144} {"train_loss": -4.606157302856445, "global_step": 6078, "epoch": 144} {"train_loss": -4.885315895080566, "global_step": 6079, "epoch": 144} {"train_loss": -4.7586894035339355, "global_step": 6080, "epoch": 144} {"train_loss": -4.611294746398926, "global_step": 6081, "epoch": 144} {"train_loss": -4.985111713409424, "global_step": 6082, "epoch": 144} {"train_loss": -4.634410381317139, "global_step": 6083, "epoch": 144} {"train_loss": -4.687530517578125, "global_step": 6084, "epoch": 144} {"train_loss": -4.717119216918945, "global_step": 6085, "epoch": 144} {"train_loss": -4.839293479919434, "global_step": 6086, "epoch": 144} {"train_loss": -4.869688034057617, "global_step": 6087, "epoch": 144} {"train_loss": -4.7935967445373535, "global_step": 6088, "epoch": 144} {"train_loss": -4.775393111365182, "global_step": 6089, "epoch": 144, "val_loss": 80406.390625} {"train_loss": -4.838257789611816, "global_step": 6090, "epoch": 145} {"train_loss": -4.674314022064209, "global_step": 6091, "epoch": 145} {"train_loss": -4.8838300704956055, "global_step": 6092, "epoch": 145} {"train_loss": -4.777994632720947, "global_step": 6093, "epoch": 145} {"train_loss": -4.761180400848389, "global_step": 6094, "epoch": 145} {"train_loss": -4.908778190612793, "global_step": 6095, "epoch": 145} {"train_loss": -4.7876691818237305, "global_step": 6096, "epoch": 145} {"train_loss": -4.871237754821777, "global_step": 6097, "epoch": 145} {"train_loss": -4.8044514656066895, "global_step": 6098, "epoch": 145} {"train_loss": -4.998839378356934, "global_step": 6099, "epoch": 145} {"train_loss": -4.792105674743652, "global_step": 6100, "epoch": 145} {"train_loss": -4.8666253089904785, "global_step": 6101, "epoch": 145} {"train_loss": -4.816560745239258, "global_step": 6102, "epoch": 145} {"train_loss": -4.742708206176758, "global_step": 6103, "epoch": 145} {"train_loss": -4.835352420806885, "global_step": 6104, "epoch": 145} {"train_loss": -4.799992084503174, "global_step": 6105, "epoch": 145} {"train_loss": -4.81845760345459, "global_step": 6106, "epoch": 145} {"train_loss": -4.927285194396973, "global_step": 6107, "epoch": 145} {"train_loss": -4.760329723358154, "global_step": 6108, "epoch": 145} {"train_loss": -4.610363006591797, "global_step": 6109, "epoch": 145} {"train_loss": -4.698526859283447, "global_step": 6110, "epoch": 145} {"train_loss": -4.551619052886963, "global_step": 6111, "epoch": 145} {"train_loss": -4.64786958694458, "global_step": 6112, "epoch": 145} {"train_loss": -4.2570576667785645, "global_step": 6113, "epoch": 145} {"train_loss": -4.795083999633789, "global_step": 6114, "epoch": 145} {"train_loss": -4.963859558105469, "global_step": 6115, "epoch": 145} {"train_loss": -4.448700428009033, "global_step": 6116, "epoch": 145} {"train_loss": -4.810370445251465, "global_step": 6117, "epoch": 145} {"train_loss": -4.584172248840332, "global_step": 6118, "epoch": 145} {"train_loss": -4.4219465255737305, "global_step": 6119, "epoch": 145} {"train_loss": -4.837238311767578, "global_step": 6120, "epoch": 145} {"train_loss": -4.67369270324707, "global_step": 6121, "epoch": 145} {"train_loss": -4.733891487121582, "global_step": 6122, "epoch": 145} {"train_loss": -4.726128101348877, "global_step": 6123, "epoch": 145} {"train_loss": -4.549161911010742, "global_step": 6124, "epoch": 145} {"train_loss": -4.804388999938965, "global_step": 6125, "epoch": 145} {"train_loss": -4.704172134399414, "global_step": 6126, "epoch": 145} {"train_loss": -4.8335676193237305, "global_step": 6127, "epoch": 145} {"train_loss": -4.764001369476318, "global_step": 6128, "epoch": 145} {"train_loss": -4.809889316558838, "global_step": 6129, "epoch": 145} {"train_loss": -4.832123279571533, "global_step": 6130, "epoch": 145} {"train_loss": -4.749154908316476, "global_step": 6131, "epoch": 145, "val_loss": 81007.234375} {"train_loss": -4.844193458557129, "global_step": 6132, "epoch": 146} {"train_loss": -4.77597713470459, "global_step": 6133, "epoch": 146} {"train_loss": -4.709518909454346, "global_step": 6134, "epoch": 146} {"train_loss": -4.793920516967773, "global_step": 6135, "epoch": 146} {"train_loss": -4.826085090637207, "global_step": 6136, "epoch": 146} {"train_loss": -4.8305816650390625, "global_step": 6137, "epoch": 146} {"train_loss": -4.777854919433594, "global_step": 6138, "epoch": 146} {"train_loss": -4.79033899307251, "global_step": 6139, "epoch": 146} {"train_loss": -4.870430946350098, "global_step": 6140, "epoch": 146} {"train_loss": -4.762573719024658, "global_step": 6141, "epoch": 146} {"train_loss": -4.825801849365234, "global_step": 6142, "epoch": 146} {"train_loss": -4.810341835021973, "global_step": 6143, "epoch": 146} {"train_loss": -4.851696014404297, "global_step": 6144, "epoch": 146} {"train_loss": -4.911882400512695, "global_step": 6145, "epoch": 146} {"train_loss": -4.874022483825684, "global_step": 6146, "epoch": 146} {"train_loss": -4.864763259887695, "global_step": 6147, "epoch": 146} {"train_loss": -4.7436723709106445, "global_step": 6148, "epoch": 146} {"train_loss": -4.8170037269592285, "global_step": 6149, "epoch": 146} {"train_loss": -4.8067731857299805, "global_step": 6150, "epoch": 146} {"train_loss": -4.806151390075684, "global_step": 6151, "epoch": 146} {"train_loss": -4.838397979736328, "global_step": 6152, "epoch": 146} {"train_loss": -4.976111888885498, "global_step": 6153, "epoch": 146} {"train_loss": -4.86065673828125, "global_step": 6154, "epoch": 146} {"train_loss": -4.939395427703857, "global_step": 6155, "epoch": 146} {"train_loss": -4.88912296295166, "global_step": 6156, "epoch": 146} {"train_loss": -4.9733757972717285, "global_step": 6157, "epoch": 146} {"train_loss": -4.865784645080566, "global_step": 6158, "epoch": 146} {"train_loss": -4.868165016174316, "global_step": 6159, "epoch": 146} {"train_loss": -4.716022491455078, "global_step": 6160, "epoch": 146} {"train_loss": -4.84028434753418, "global_step": 6161, "epoch": 146} {"train_loss": -4.697798728942871, "global_step": 6162, "epoch": 146} {"train_loss": -4.3381452560424805, "global_step": 6163, "epoch": 146} {"train_loss": -4.880875587463379, "global_step": 6164, "epoch": 146} {"train_loss": -4.7837724685668945, "global_step": 6165, "epoch": 146} {"train_loss": -4.640548229217529, "global_step": 6166, "epoch": 146} {"train_loss": -4.491069793701172, "global_step": 6167, "epoch": 146} {"train_loss": -4.817302703857422, "global_step": 6168, "epoch": 146} {"train_loss": -4.886110305786133, "global_step": 6169, "epoch": 146} {"train_loss": -4.862771034240723, "global_step": 6170, "epoch": 146} {"train_loss": -4.673135280609131, "global_step": 6171, "epoch": 146} {"train_loss": -4.763730049133301, "global_step": 6172, "epoch": 146} {"train_loss": -4.80263226372855, "global_step": 6173, "epoch": 146, "val_loss": 80901.140625} {"train_loss": -4.76976203918457, "global_step": 6174, "epoch": 147} {"train_loss": -4.771471977233887, "global_step": 6175, "epoch": 147} {"train_loss": -4.738382339477539, "global_step": 6176, "epoch": 147} {"train_loss": -4.67126989364624, "global_step": 6177, "epoch": 147} {"train_loss": -4.74724006652832, "global_step": 6178, "epoch": 147} {"train_loss": -4.812496662139893, "global_step": 6179, "epoch": 147} {"train_loss": -4.808365821838379, "global_step": 6180, "epoch": 147} {"train_loss": -4.864764213562012, "global_step": 6181, "epoch": 147} {"train_loss": -4.803084850311279, "global_step": 6182, "epoch": 147} {"train_loss": -4.8026323318481445, "global_step": 6183, "epoch": 147} {"train_loss": -4.834554672241211, "global_step": 6184, "epoch": 147} {"train_loss": -4.711720943450928, "global_step": 6185, "epoch": 147} {"train_loss": -4.7909440994262695, "global_step": 6186, "epoch": 147} {"train_loss": -4.8177313804626465, "global_step": 6187, "epoch": 147} {"train_loss": -4.849786758422852, "global_step": 6188, "epoch": 147} {"train_loss": -4.805866241455078, "global_step": 6189, "epoch": 147} {"train_loss": -4.903003215789795, "global_step": 6190, "epoch": 147} {"train_loss": -4.825608730316162, "global_step": 6191, "epoch": 147} {"train_loss": -4.781503677368164, "global_step": 6192, "epoch": 147} {"train_loss": -4.8777899742126465, "global_step": 6193, "epoch": 147} {"train_loss": -4.782215118408203, "global_step": 6194, "epoch": 147} {"train_loss": -4.817477226257324, "global_step": 6195, "epoch": 147} {"train_loss": -4.907797813415527, "global_step": 6196, "epoch": 147} {"train_loss": -4.780099391937256, "global_step": 6197, "epoch": 147} {"train_loss": -4.940049171447754, "global_step": 6198, "epoch": 147} {"train_loss": -5.001319885253906, "global_step": 6199, "epoch": 147} {"train_loss": -4.938028335571289, "global_step": 6200, "epoch": 147} {"train_loss": -4.909862518310547, "global_step": 6201, "epoch": 147} {"train_loss": -4.716063499450684, "global_step": 6202, "epoch": 147} {"train_loss": -4.946966171264648, "global_step": 6203, "epoch": 147} {"train_loss": -4.566073894500732, "global_step": 6204, "epoch": 147} {"train_loss": -4.765888214111328, "global_step": 6205, "epoch": 147} {"train_loss": -4.922338485717773, "global_step": 6206, "epoch": 147} {"train_loss": -4.758893013000488, "global_step": 6207, "epoch": 147} {"train_loss": -4.443323135375977, "global_step": 6208, "epoch": 147} {"train_loss": -4.686342239379883, "global_step": 6209, "epoch": 147} {"train_loss": -4.8453779220581055, "global_step": 6210, "epoch": 147} {"train_loss": -4.444247245788574, "global_step": 6211, "epoch": 147} {"train_loss": -4.297980308532715, "global_step": 6212, "epoch": 147} {"train_loss": -4.723345756530762, "global_step": 6213, "epoch": 147} {"train_loss": -4.539658546447754, "global_step": 6214, "epoch": 147} {"train_loss": -4.7629972639538, "global_step": 6215, "epoch": 147, "val_loss": 81634.9375} {"train_loss": -4.686185836791992, "global_step": 6216, "epoch": 148} {"train_loss": -4.582438945770264, "global_step": 6217, "epoch": 148} {"train_loss": -4.700298309326172, "global_step": 6218, "epoch": 148} {"train_loss": -4.47708797454834, "global_step": 6219, "epoch": 148} {"train_loss": -4.728915214538574, "global_step": 6220, "epoch": 148} {"train_loss": -4.657263278961182, "global_step": 6221, "epoch": 148} {"train_loss": -4.754268169403076, "global_step": 6222, "epoch": 148} {"train_loss": -4.74964714050293, "global_step": 6223, "epoch": 148} {"train_loss": -4.743583679199219, "global_step": 6224, "epoch": 148} {"train_loss": -4.590315818786621, "global_step": 6225, "epoch": 148} {"train_loss": -4.792342185974121, "global_step": 6226, "epoch": 148} {"train_loss": -4.707766056060791, "global_step": 6227, "epoch": 148} {"train_loss": -4.74611759185791, "global_step": 6228, "epoch": 148} {"train_loss": -4.701103210449219, "global_step": 6229, "epoch": 148} {"train_loss": -4.771913528442383, "global_step": 6230, "epoch": 148} {"train_loss": -4.766231536865234, "global_step": 6231, "epoch": 148} {"train_loss": -4.721746444702148, "global_step": 6232, "epoch": 148} {"train_loss": -4.830049514770508, "global_step": 6233, "epoch": 148} {"train_loss": -4.7406110763549805, "global_step": 6234, "epoch": 148} {"train_loss": -4.798649787902832, "global_step": 6235, "epoch": 148} {"train_loss": -4.707038402557373, "global_step": 6236, "epoch": 148} {"train_loss": -4.770846366882324, "global_step": 6237, "epoch": 148} {"train_loss": -4.828430652618408, "global_step": 6238, "epoch": 148} {"train_loss": -4.955876350402832, "global_step": 6239, "epoch": 148} {"train_loss": -4.752710342407227, "global_step": 6240, "epoch": 148} {"train_loss": -4.735672473907471, "global_step": 6241, "epoch": 148} {"train_loss": -4.793505668640137, "global_step": 6242, "epoch": 148} {"train_loss": -4.923891067504883, "global_step": 6243, "epoch": 148} {"train_loss": -4.851842403411865, "global_step": 6244, "epoch": 148} {"train_loss": -4.83933687210083, "global_step": 6245, "epoch": 148} {"train_loss": -4.794069290161133, "global_step": 6246, "epoch": 148} {"train_loss": -4.895199775695801, "global_step": 6247, "epoch": 148} {"train_loss": -4.7562575340271, "global_step": 6248, "epoch": 148} {"train_loss": -4.954596996307373, "global_step": 6249, "epoch": 148} {"train_loss": -4.719204902648926, "global_step": 6250, "epoch": 148} {"train_loss": -4.858503341674805, "global_step": 6251, "epoch": 148} {"train_loss": -4.824300289154053, "global_step": 6252, "epoch": 148} {"train_loss": -4.827288627624512, "global_step": 6253, "epoch": 148} {"train_loss": -4.725397109985352, "global_step": 6254, "epoch": 148} {"train_loss": -4.746673583984375, "global_step": 6255, "epoch": 148} {"train_loss": -4.866808891296387, "global_step": 6256, "epoch": 148} {"train_loss": -4.760347718284244, "global_step": 6257, "epoch": 148, "val_loss": 79573.0546875} {"train_loss": -4.747324466705322, "global_step": 6258, "epoch": 149} {"train_loss": -4.799404144287109, "global_step": 6259, "epoch": 149} {"train_loss": -4.74277925491333, "global_step": 6260, "epoch": 149} {"train_loss": -4.693647384643555, "global_step": 6261, "epoch": 149} {"train_loss": -4.776013374328613, "global_step": 6262, "epoch": 149} {"train_loss": -4.8293561935424805, "global_step": 6263, "epoch": 149} {"train_loss": -4.827755928039551, "global_step": 6264, "epoch": 149} {"train_loss": -5.089402198791504, "global_step": 6265, "epoch": 149} {"train_loss": -4.804203033447266, "global_step": 6266, "epoch": 149} {"train_loss": -4.723090171813965, "global_step": 6267, "epoch": 149} {"train_loss": -4.9118571281433105, "global_step": 6268, "epoch": 149} {"train_loss": -4.81614875793457, "global_step": 6269, "epoch": 149} {"train_loss": -4.784006118774414, "global_step": 6270, "epoch": 149} {"train_loss": -4.777635097503662, "global_step": 6271, "epoch": 149} {"train_loss": -4.969915390014648, "global_step": 6272, "epoch": 149} {"train_loss": -4.7386980056762695, "global_step": 6273, "epoch": 149} {"train_loss": -4.829283237457275, "global_step": 6274, "epoch": 149} {"train_loss": -4.748154163360596, "global_step": 6275, "epoch": 149} {"train_loss": -4.873633861541748, "global_step": 6276, "epoch": 149} {"train_loss": -4.808000564575195, "global_step": 6277, "epoch": 149} {"train_loss": -4.763219833374023, "global_step": 6278, "epoch": 149} {"train_loss": -4.823847770690918, "global_step": 6279, "epoch": 149} {"train_loss": -4.697169303894043, "global_step": 6280, "epoch": 149} {"train_loss": -4.705473899841309, "global_step": 6281, "epoch": 149} {"train_loss": -4.880924701690674, "global_step": 6282, "epoch": 149} {"train_loss": -5.021151542663574, "global_step": 6283, "epoch": 149} {"train_loss": -4.817760467529297, "global_step": 6284, "epoch": 149} {"train_loss": -4.8957085609436035, "global_step": 6285, "epoch": 149} {"train_loss": -4.894217491149902, "global_step": 6286, "epoch": 149} {"train_loss": -4.831260681152344, "global_step": 6287, "epoch": 149} {"train_loss": -4.954207420349121, "global_step": 6288, "epoch": 149} {"train_loss": -4.886350154876709, "global_step": 6289, "epoch": 149} {"train_loss": -4.74481201171875, "global_step": 6290, "epoch": 149} {"train_loss": -4.846224308013916, "global_step": 6291, "epoch": 149} {"train_loss": -4.962802886962891, "global_step": 6292, "epoch": 149} {"train_loss": -4.947083950042725, "global_step": 6293, "epoch": 149} {"train_loss": -4.8198981285095215, "global_step": 6294, "epoch": 149} {"train_loss": -4.873685836791992, "global_step": 6295, "epoch": 149} {"train_loss": -4.946175575256348, "global_step": 6296, "epoch": 149} {"train_loss": -4.9308271408081055, "global_step": 6297, "epoch": 149} {"train_loss": -4.956693649291992, "global_step": 6298, "epoch": 149} {"train_loss": -4.843724738983881, "global_step": 6299, "epoch": 149, "val_loss": 79045.0078125} {"train_loss": -4.894896030426025, "global_step": 6300, "epoch": 150} {"train_loss": -4.917922496795654, "global_step": 6301, "epoch": 150} {"train_loss": -4.829415798187256, "global_step": 6302, "epoch": 150} {"train_loss": -4.926395416259766, "global_step": 6303, "epoch": 150} {"train_loss": -4.974087715148926, "global_step": 6304, "epoch": 150} {"train_loss": -4.9225311279296875, "global_step": 6305, "epoch": 150} {"train_loss": -4.910079002380371, "global_step": 6306, "epoch": 150} {"train_loss": -4.77663516998291, "global_step": 6307, "epoch": 150} {"train_loss": -4.756912708282471, "global_step": 6308, "epoch": 150} {"train_loss": -4.788710594177246, "global_step": 6309, "epoch": 150} {"train_loss": -4.7787628173828125, "global_step": 6310, "epoch": 150} {"train_loss": -4.885424613952637, "global_step": 6311, "epoch": 150} {"train_loss": -4.865784645080566, "global_step": 6312, "epoch": 150} {"train_loss": -4.851158142089844, "global_step": 6313, "epoch": 150} {"train_loss": -4.6360087394714355, "global_step": 6314, "epoch": 150} {"train_loss": -4.764449119567871, "global_step": 6315, "epoch": 150} {"train_loss": -4.544686794281006, "global_step": 6316, "epoch": 150} {"train_loss": -4.856748104095459, "global_step": 6317, "epoch": 150} {"train_loss": -4.999787330627441, "global_step": 6318, "epoch": 150} {"train_loss": -4.9073486328125, "global_step": 6319, "epoch": 150} {"train_loss": -4.807506084442139, "global_step": 6320, "epoch": 150} {"train_loss": -4.679510116577148, "global_step": 6321, "epoch": 150} {"train_loss": -4.916031360626221, "global_step": 6322, "epoch": 150} {"train_loss": -4.9769439697265625, "global_step": 6323, "epoch": 150} {"train_loss": -4.586430549621582, "global_step": 6324, "epoch": 150} {"train_loss": -4.786182403564453, "global_step": 6325, "epoch": 150} {"train_loss": -4.738241672515869, "global_step": 6326, "epoch": 150} {"train_loss": -4.726871490478516, "global_step": 6327, "epoch": 150} {"train_loss": -4.7564496994018555, "global_step": 6328, "epoch": 150} {"train_loss": -4.86646842956543, "global_step": 6329, "epoch": 150} {"train_loss": -4.6664252281188965, "global_step": 6330, "epoch": 150} {"train_loss": -4.8189287185668945, "global_step": 6331, "epoch": 150} {"train_loss": -4.853914260864258, "global_step": 6332, "epoch": 150} {"train_loss": -4.789870262145996, "global_step": 6333, "epoch": 150} {"train_loss": -4.817934513092041, "global_step": 6334, "epoch": 150} {"train_loss": -4.8350300788879395, "global_step": 6335, "epoch": 150} {"train_loss": -4.438854694366455, "global_step": 6336, "epoch": 150} {"train_loss": -4.740173816680908, "global_step": 6337, "epoch": 150} {"train_loss": -4.767570495605469, "global_step": 6338, "epoch": 150} {"train_loss": -4.720425128936768, "global_step": 6339, "epoch": 150} {"train_loss": -4.812813758850098, "global_step": 6340, "epoch": 150} {"train_loss": -4.801902714229765, "global_step": 6341, "epoch": 150, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.0009951100988861814, "train/sim_max_reward_2": 0.13148977134425843, "train/sim_max_reward_3": 0.011010147606976956, "train/sim_max_reward_4": 0.14992101891632995, "train/sim_max_reward_5": 0.39614133204936186, "test/sim_max_reward_4300000": 0.17883606179011122, "test/sim_max_reward_4300001": 0.17001191176546598, "test/sim_max_reward_4300002": 0.17527410724918904, "test/sim_max_reward_4300003": 0.27937153809368176, "test/sim_max_reward_4300004": 0.5413529726211888, "test/sim_max_reward_4300005": 0.3711075993340984, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.08774228885749182, "test/sim_max_reward_4300008": 0.0, "test/sim_max_reward_4300009": 0.16451156088806596, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.11531517539022802, "test/sim_max_reward_4300012": 0.16123959756641615, "test/sim_max_reward_4300013": 0.3087005263470075, "test/sim_max_reward_4300014": 0.4009787938652654, "test/sim_max_reward_4300015": 0.35143410153512206, "test/sim_max_reward_4300016": 0.03306571180895471, "test/sim_max_reward_4300017": 0.23222753797343584, "test/sim_max_reward_4300018": 0.0, "test/sim_max_reward_4300019": 0.18599451394693686, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.28997522133470477, "test/sim_max_reward_4300022": 0.0014174770924601115, "test/sim_max_reward_4300023": 0.2057529789273333, "test/sim_max_reward_4300024": 0.0, "test/sim_max_reward_4300025": 0.08847875242732427, "test/sim_max_reward_4300026": 0.4769974239949311, "test/sim_max_reward_4300027": 0.1082413334987913, "test/sim_max_reward_4300028": 0.3495077217847826, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.5096957166899363, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.4871904203057197, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.08015844245760208, "test/sim_max_reward_4300036": 0.6735971105556618, "test/sim_max_reward_4300037": 0.5527122599440878, "test/sim_max_reward_4300038": 0.23693476918831427, "test/sim_max_reward_4300039": 0.016130705053474133, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.34076439249111967, "test/sim_max_reward_4300043": 0.3641956961053606, "test/sim_max_reward_4300044": 0.07466210867936685, "test/sim_max_reward_4300045": 0.18183967019105582, "test/sim_max_reward_4300046": 0.28610548185360357, "test/sim_max_reward_4300047": 0.5011704284981949, "test/sim_max_reward_4300048": 0.19984684759664026, "test/sim_max_reward_4300049": 0.1334340438265475, "train/mean_score": 0.14664247943697756, "test/mean_score": 0.2020111063135865, "val_loss": 79252.7890625} {"train_loss": -4.727565765380859, "global_step": 6342, "epoch": 151} {"train_loss": -4.971281051635742, "global_step": 6343, "epoch": 151} {"train_loss": -4.87509822845459, "global_step": 6344, "epoch": 151} {"train_loss": -4.776040077209473, "global_step": 6345, "epoch": 151} {"train_loss": -4.933834075927734, "global_step": 6346, "epoch": 151} {"train_loss": -4.777727127075195, "global_step": 6347, "epoch": 151} {"train_loss": -4.825769424438477, "global_step": 6348, "epoch": 151} {"train_loss": -4.732580184936523, "global_step": 6349, "epoch": 151} {"train_loss": -4.804192066192627, "global_step": 6350, "epoch": 151} {"train_loss": -4.82858943939209, "global_step": 6351, "epoch": 151} {"train_loss": -4.881072044372559, "global_step": 6352, "epoch": 151} {"train_loss": -4.849024295806885, "global_step": 6353, "epoch": 151} {"train_loss": -4.941105365753174, "global_step": 6354, "epoch": 151} {"train_loss": -4.887142658233643, "global_step": 6355, "epoch": 151} {"train_loss": -4.8642191886901855, "global_step": 6356, "epoch": 151} {"train_loss": -4.893582344055176, "global_step": 6357, "epoch": 151} {"train_loss": -4.755658149719238, "global_step": 6358, "epoch": 151} {"train_loss": -4.890105247497559, "global_step": 6359, "epoch": 151} {"train_loss": -4.866422653198242, "global_step": 6360, "epoch": 151} {"train_loss": -4.917451858520508, "global_step": 6361, "epoch": 151} {"train_loss": -4.752476692199707, "global_step": 6362, "epoch": 151} {"train_loss": -4.806914329528809, "global_step": 6363, "epoch": 151} {"train_loss": -4.841104030609131, "global_step": 6364, "epoch": 151} {"train_loss": -4.735197067260742, "global_step": 6365, "epoch": 151} {"train_loss": -4.575625419616699, "global_step": 6366, "epoch": 151} {"train_loss": -4.591338157653809, "global_step": 6367, "epoch": 151} {"train_loss": -4.644765377044678, "global_step": 6368, "epoch": 151} {"train_loss": -4.822638511657715, "global_step": 6369, "epoch": 151} {"train_loss": -4.9047136306762695, "global_step": 6370, "epoch": 151} {"train_loss": -4.78822660446167, "global_step": 6371, "epoch": 151} {"train_loss": -4.800412178039551, "global_step": 6372, "epoch": 151} {"train_loss": -4.8428778648376465, "global_step": 6373, "epoch": 151} {"train_loss": -4.857270240783691, "global_step": 6374, "epoch": 151} {"train_loss": -4.973221778869629, "global_step": 6375, "epoch": 151} {"train_loss": -4.735374450683594, "global_step": 6376, "epoch": 151} {"train_loss": -4.993594169616699, "global_step": 6377, "epoch": 151} {"train_loss": -4.898739814758301, "global_step": 6378, "epoch": 151} {"train_loss": -4.968440055847168, "global_step": 6379, "epoch": 151} {"train_loss": -4.923197269439697, "global_step": 6380, "epoch": 151} {"train_loss": -4.927010536193848, "global_step": 6381, "epoch": 151} {"train_loss": -4.740147113800049, "global_step": 6382, "epoch": 151} {"train_loss": -4.831909043448312, "global_step": 6383, "epoch": 151, "val_loss": 78103.6484375} {"train_loss": -4.886420249938965, "global_step": 6384, "epoch": 152} {"train_loss": -4.722431182861328, "global_step": 6385, "epoch": 152} {"train_loss": -4.743304252624512, "global_step": 6386, "epoch": 152} {"train_loss": -4.9569597244262695, "global_step": 6387, "epoch": 152} {"train_loss": -4.63704776763916, "global_step": 6388, "epoch": 152} {"train_loss": -4.863170623779297, "global_step": 6389, "epoch": 152} {"train_loss": -4.788499355316162, "global_step": 6390, "epoch": 152} {"train_loss": -4.663016319274902, "global_step": 6391, "epoch": 152} {"train_loss": -4.618287086486816, "global_step": 6392, "epoch": 152} {"train_loss": -4.772622108459473, "global_step": 6393, "epoch": 152} {"train_loss": -4.809597492218018, "global_step": 6394, "epoch": 152} {"train_loss": -4.7052903175354, "global_step": 6395, "epoch": 152} {"train_loss": -4.77908992767334, "global_step": 6396, "epoch": 152} {"train_loss": -4.894981861114502, "global_step": 6397, "epoch": 152} {"train_loss": -4.709933757781982, "global_step": 6398, "epoch": 152} {"train_loss": -4.728236198425293, "global_step": 6399, "epoch": 152} {"train_loss": -4.78631591796875, "global_step": 6400, "epoch": 152} {"train_loss": -4.741707801818848, "global_step": 6401, "epoch": 152} {"train_loss": -4.945077896118164, "global_step": 6402, "epoch": 152} {"train_loss": -4.726040840148926, "global_step": 6403, "epoch": 152} {"train_loss": -4.7893171310424805, "global_step": 6404, "epoch": 152} {"train_loss": -4.884787082672119, "global_step": 6405, "epoch": 152} {"train_loss": -4.934344291687012, "global_step": 6406, "epoch": 152} {"train_loss": -4.763182163238525, "global_step": 6407, "epoch": 152} {"train_loss": -4.83025598526001, "global_step": 6408, "epoch": 152} {"train_loss": -4.914013862609863, "global_step": 6409, "epoch": 152} {"train_loss": -4.716609954833984, "global_step": 6410, "epoch": 152} {"train_loss": -4.754362106323242, "global_step": 6411, "epoch": 152} {"train_loss": -4.909872055053711, "global_step": 6412, "epoch": 152} {"train_loss": -4.836164951324463, "global_step": 6413, "epoch": 152} {"train_loss": -4.74600076675415, "global_step": 6414, "epoch": 152} {"train_loss": -4.80585241317749, "global_step": 6415, "epoch": 152} {"train_loss": -4.84294319152832, "global_step": 6416, "epoch": 152} {"train_loss": -4.873126029968262, "global_step": 6417, "epoch": 152} {"train_loss": -4.824952125549316, "global_step": 6418, "epoch": 152} {"train_loss": -4.8164567947387695, "global_step": 6419, "epoch": 152} {"train_loss": -4.931492328643799, "global_step": 6420, "epoch": 152} {"train_loss": -4.6412553787231445, "global_step": 6421, "epoch": 152} {"train_loss": -4.841358661651611, "global_step": 6422, "epoch": 152} {"train_loss": -4.889355659484863, "global_step": 6423, "epoch": 152} {"train_loss": -4.933643341064453, "global_step": 6424, "epoch": 152} {"train_loss": -4.805616287958054, "global_step": 6425, "epoch": 152, "val_loss": 77637.765625} {"train_loss": -4.95175838470459, "global_step": 6426, "epoch": 153} {"train_loss": -4.863945007324219, "global_step": 6427, "epoch": 153} {"train_loss": -4.895336151123047, "global_step": 6428, "epoch": 153} {"train_loss": -4.862186908721924, "global_step": 6429, "epoch": 153} {"train_loss": -5.000394821166992, "global_step": 6430, "epoch": 153} {"train_loss": -4.743405342102051, "global_step": 6431, "epoch": 153} {"train_loss": -4.539114952087402, "global_step": 6432, "epoch": 153} {"train_loss": -4.804390907287598, "global_step": 6433, "epoch": 153} {"train_loss": -4.882523536682129, "global_step": 6434, "epoch": 153} {"train_loss": -4.712211608886719, "global_step": 6435, "epoch": 153} {"train_loss": -4.596624374389648, "global_step": 6436, "epoch": 153} {"train_loss": -4.834039688110352, "global_step": 6437, "epoch": 153} {"train_loss": -4.816431045532227, "global_step": 6438, "epoch": 153} {"train_loss": -4.7159929275512695, "global_step": 6439, "epoch": 153} {"train_loss": -4.763921737670898, "global_step": 6440, "epoch": 153} {"train_loss": -4.6292009353637695, "global_step": 6441, "epoch": 153} {"train_loss": -4.616967678070068, "global_step": 6442, "epoch": 153} {"train_loss": -4.833186149597168, "global_step": 6443, "epoch": 153} {"train_loss": -4.593476295471191, "global_step": 6444, "epoch": 153} {"train_loss": -4.760871410369873, "global_step": 6445, "epoch": 153} {"train_loss": -4.743201732635498, "global_step": 6446, "epoch": 153} {"train_loss": -4.850156784057617, "global_step": 6447, "epoch": 153} {"train_loss": -4.930075645446777, "global_step": 6448, "epoch": 153} {"train_loss": -4.802992820739746, "global_step": 6449, "epoch": 153} {"train_loss": -4.827973365783691, "global_step": 6450, "epoch": 153} {"train_loss": -4.7997589111328125, "global_step": 6451, "epoch": 153} {"train_loss": -4.7175984382629395, "global_step": 6452, "epoch": 153} {"train_loss": -4.829616546630859, "global_step": 6453, "epoch": 153} {"train_loss": -4.948696136474609, "global_step": 6454, "epoch": 153} {"train_loss": -4.8507537841796875, "global_step": 6455, "epoch": 153} {"train_loss": -4.888413429260254, "global_step": 6456, "epoch": 153} {"train_loss": -4.766874313354492, "global_step": 6457, "epoch": 153} {"train_loss": -4.877448558807373, "global_step": 6458, "epoch": 153} {"train_loss": -4.761962413787842, "global_step": 6459, "epoch": 153} {"train_loss": -4.853639602661133, "global_step": 6460, "epoch": 153} {"train_loss": -4.753583908081055, "global_step": 6461, "epoch": 153} {"train_loss": -4.999090194702148, "global_step": 6462, "epoch": 153} {"train_loss": -4.834590911865234, "global_step": 6463, "epoch": 153} {"train_loss": -4.832332134246826, "global_step": 6464, "epoch": 153} {"train_loss": -4.906290531158447, "global_step": 6465, "epoch": 153} {"train_loss": -4.78886079788208, "global_step": 6466, "epoch": 153} {"train_loss": -4.804940439405895, "global_step": 6467, "epoch": 153, "val_loss": 78463.6640625} {"train_loss": -4.765619277954102, "global_step": 6468, "epoch": 154} {"train_loss": -4.871498107910156, "global_step": 6469, "epoch": 154} {"train_loss": -4.921285629272461, "global_step": 6470, "epoch": 154} {"train_loss": -4.683349609375, "global_step": 6471, "epoch": 154} {"train_loss": -4.661548614501953, "global_step": 6472, "epoch": 154} {"train_loss": -4.865597724914551, "global_step": 6473, "epoch": 154} {"train_loss": -4.805947303771973, "global_step": 6474, "epoch": 154} {"train_loss": -4.751213550567627, "global_step": 6475, "epoch": 154} {"train_loss": -4.780021667480469, "global_step": 6476, "epoch": 154} {"train_loss": -4.947065830230713, "global_step": 6477, "epoch": 154} {"train_loss": -4.9380292892456055, "global_step": 6478, "epoch": 154} {"train_loss": -4.771158218383789, "global_step": 6479, "epoch": 154} {"train_loss": -4.851181983947754, "global_step": 6480, "epoch": 154} {"train_loss": -4.777588844299316, "global_step": 6481, "epoch": 154} {"train_loss": -4.700118064880371, "global_step": 6482, "epoch": 154} {"train_loss": -4.782876968383789, "global_step": 6483, "epoch": 154} {"train_loss": -5.099483013153076, "global_step": 6484, "epoch": 154} {"train_loss": -4.836582660675049, "global_step": 6485, "epoch": 154} {"train_loss": -4.774285316467285, "global_step": 6486, "epoch": 154} {"train_loss": -4.927676677703857, "global_step": 6487, "epoch": 154} {"train_loss": -4.825743675231934, "global_step": 6488, "epoch": 154} {"train_loss": -4.8773088455200195, "global_step": 6489, "epoch": 154} {"train_loss": -5.056905269622803, "global_step": 6490, "epoch": 154} {"train_loss": -4.780505180358887, "global_step": 6491, "epoch": 154} {"train_loss": -4.732083320617676, "global_step": 6492, "epoch": 154} {"train_loss": -4.792872905731201, "global_step": 6493, "epoch": 154} {"train_loss": -4.749602317810059, "global_step": 6494, "epoch": 154} {"train_loss": -4.824101448059082, "global_step": 6495, "epoch": 154} {"train_loss": -4.8751301765441895, "global_step": 6496, "epoch": 154} {"train_loss": -4.866318702697754, "global_step": 6497, "epoch": 154} {"train_loss": -4.800127029418945, "global_step": 6498, "epoch": 154} {"train_loss": -4.89990758895874, "global_step": 6499, "epoch": 154} {"train_loss": -4.777702331542969, "global_step": 6500, "epoch": 154} {"train_loss": -4.813195705413818, "global_step": 6501, "epoch": 154} {"train_loss": -4.909792900085449, "global_step": 6502, "epoch": 154} {"train_loss": -4.797229766845703, "global_step": 6503, "epoch": 154} {"train_loss": -4.8244242668151855, "global_step": 6504, "epoch": 154} {"train_loss": -4.830593109130859, "global_step": 6505, "epoch": 154} {"train_loss": -4.873041152954102, "global_step": 6506, "epoch": 154} {"train_loss": -4.864505767822266, "global_step": 6507, "epoch": 154} {"train_loss": -4.868519306182861, "global_step": 6508, "epoch": 154} {"train_loss": -4.83498874164763, "global_step": 6509, "epoch": 154, "val_loss": 77726.453125} {"train_loss": -4.92797327041626, "global_step": 6510, "epoch": 155} {"train_loss": -4.86562442779541, "global_step": 6511, "epoch": 155} {"train_loss": -4.9107465744018555, "global_step": 6512, "epoch": 155} {"train_loss": -4.903409957885742, "global_step": 6513, "epoch": 155} {"train_loss": -4.820835113525391, "global_step": 6514, "epoch": 155} {"train_loss": -4.761503219604492, "global_step": 6515, "epoch": 155} {"train_loss": -4.973738670349121, "global_step": 6516, "epoch": 155} {"train_loss": -4.74873685836792, "global_step": 6517, "epoch": 155} {"train_loss": -4.6368865966796875, "global_step": 6518, "epoch": 155} {"train_loss": -4.8937668800354, "global_step": 6519, "epoch": 155} {"train_loss": -4.994730472564697, "global_step": 6520, "epoch": 155} {"train_loss": -4.852034091949463, "global_step": 6521, "epoch": 155} {"train_loss": -4.811070919036865, "global_step": 6522, "epoch": 155} {"train_loss": -4.945309638977051, "global_step": 6523, "epoch": 155} {"train_loss": -4.9546661376953125, "global_step": 6524, "epoch": 155} {"train_loss": -4.921725273132324, "global_step": 6525, "epoch": 155} {"train_loss": -4.673264503479004, "global_step": 6526, "epoch": 155} {"train_loss": -4.915831089019775, "global_step": 6527, "epoch": 155} {"train_loss": -4.935175895690918, "global_step": 6528, "epoch": 155} {"train_loss": -4.775120258331299, "global_step": 6529, "epoch": 155} {"train_loss": -4.966352939605713, "global_step": 6530, "epoch": 155} {"train_loss": -4.889507293701172, "global_step": 6531, "epoch": 155} {"train_loss": -4.658376693725586, "global_step": 6532, "epoch": 155} {"train_loss": -4.8114237785339355, "global_step": 6533, "epoch": 155} {"train_loss": -5.020589828491211, "global_step": 6534, "epoch": 155} {"train_loss": -4.700193405151367, "global_step": 6535, "epoch": 155} {"train_loss": -4.858997344970703, "global_step": 6536, "epoch": 155} {"train_loss": -4.762879371643066, "global_step": 6537, "epoch": 155} {"train_loss": -4.619179725646973, "global_step": 6538, "epoch": 155} {"train_loss": -4.634069442749023, "global_step": 6539, "epoch": 155} {"train_loss": -4.974853515625, "global_step": 6540, "epoch": 155} {"train_loss": -4.96722412109375, "global_step": 6541, "epoch": 155} {"train_loss": -4.677762985229492, "global_step": 6542, "epoch": 155} {"train_loss": -4.680266857147217, "global_step": 6543, "epoch": 155} {"train_loss": -4.826830863952637, "global_step": 6544, "epoch": 155} {"train_loss": -4.707697868347168, "global_step": 6545, "epoch": 155} {"train_loss": -4.738076210021973, "global_step": 6546, "epoch": 155} {"train_loss": -4.822408676147461, "global_step": 6547, "epoch": 155} {"train_loss": -4.638679027557373, "global_step": 6548, "epoch": 155} {"train_loss": -4.757040023803711, "global_step": 6549, "epoch": 155} {"train_loss": -4.92454719543457, "global_step": 6550, "epoch": 155} {"train_loss": -4.8215667974381216, "global_step": 6551, "epoch": 155, "val_loss": 76739.390625} {"train_loss": -4.898994445800781, "global_step": 6552, "epoch": 156} {"train_loss": -4.800769805908203, "global_step": 6553, "epoch": 156} {"train_loss": -4.8845696449279785, "global_step": 6554, "epoch": 156} {"train_loss": -5.017626762390137, "global_step": 6555, "epoch": 156} {"train_loss": -4.805649757385254, "global_step": 6556, "epoch": 156} {"train_loss": -4.895188331604004, "global_step": 6557, "epoch": 156} {"train_loss": -4.8139142990112305, "global_step": 6558, "epoch": 156} {"train_loss": -4.972158432006836, "global_step": 6559, "epoch": 156} {"train_loss": -4.8658857345581055, "global_step": 6560, "epoch": 156} {"train_loss": -4.793436050415039, "global_step": 6561, "epoch": 156} {"train_loss": -4.8871049880981445, "global_step": 6562, "epoch": 156} {"train_loss": -4.922601699829102, "global_step": 6563, "epoch": 156} {"train_loss": -4.836090564727783, "global_step": 6564, "epoch": 156} {"train_loss": -4.943320274353027, "global_step": 6565, "epoch": 156} {"train_loss": -4.75438117980957, "global_step": 6566, "epoch": 156} {"train_loss": -4.974193096160889, "global_step": 6567, "epoch": 156} {"train_loss": -4.884294509887695, "global_step": 6568, "epoch": 156} {"train_loss": -4.815321922302246, "global_step": 6569, "epoch": 156} {"train_loss": -4.703434944152832, "global_step": 6570, "epoch": 156} {"train_loss": -4.411642074584961, "global_step": 6571, "epoch": 156} {"train_loss": -4.937681198120117, "global_step": 6572, "epoch": 156} {"train_loss": -4.915319919586182, "global_step": 6573, "epoch": 156} {"train_loss": -4.637367248535156, "global_step": 6574, "epoch": 156} {"train_loss": -4.44154167175293, "global_step": 6575, "epoch": 156} {"train_loss": -4.833187580108643, "global_step": 6576, "epoch": 156} {"train_loss": -4.8154497146606445, "global_step": 6577, "epoch": 156} {"train_loss": -4.569611549377441, "global_step": 6578, "epoch": 156} {"train_loss": -4.918138027191162, "global_step": 6579, "epoch": 156} {"train_loss": -4.798036098480225, "global_step": 6580, "epoch": 156} {"train_loss": -4.823922157287598, "global_step": 6581, "epoch": 156} {"train_loss": -4.866826057434082, "global_step": 6582, "epoch": 156} {"train_loss": -4.819897174835205, "global_step": 6583, "epoch": 156} {"train_loss": -4.904989719390869, "global_step": 6584, "epoch": 156} {"train_loss": -4.794443130493164, "global_step": 6585, "epoch": 156} {"train_loss": -4.942088603973389, "global_step": 6586, "epoch": 156} {"train_loss": -4.983469009399414, "global_step": 6587, "epoch": 156} {"train_loss": -4.764361381530762, "global_step": 6588, "epoch": 156} {"train_loss": -4.813063621520996, "global_step": 6589, "epoch": 156} {"train_loss": -4.849264144897461, "global_step": 6590, "epoch": 156} {"train_loss": -4.8481597900390625, "global_step": 6591, "epoch": 156} {"train_loss": -4.8645782470703125, "global_step": 6592, "epoch": 156} {"train_loss": -4.830335276467459, "global_step": 6593, "epoch": 156, "val_loss": 77160.3984375} {"train_loss": -4.846841812133789, "global_step": 6594, "epoch": 157} {"train_loss": -4.831035614013672, "global_step": 6595, "epoch": 157} {"train_loss": -4.7990922927856445, "global_step": 6596, "epoch": 157} {"train_loss": -4.8840484619140625, "global_step": 6597, "epoch": 157} {"train_loss": -4.940360069274902, "global_step": 6598, "epoch": 157} {"train_loss": -4.823124885559082, "global_step": 6599, "epoch": 157} {"train_loss": -4.842979431152344, "global_step": 6600, "epoch": 157} {"train_loss": -5.0514912605285645, "global_step": 6601, "epoch": 157} {"train_loss": -4.933418273925781, "global_step": 6602, "epoch": 157} {"train_loss": -4.606942176818848, "global_step": 6603, "epoch": 157} {"train_loss": -4.881969928741455, "global_step": 6604, "epoch": 157} {"train_loss": -4.906442642211914, "global_step": 6605, "epoch": 157} {"train_loss": -4.8164472579956055, "global_step": 6606, "epoch": 157} {"train_loss": -4.776239395141602, "global_step": 6607, "epoch": 157} {"train_loss": -4.722166061401367, "global_step": 6608, "epoch": 157} {"train_loss": -4.682940483093262, "global_step": 6609, "epoch": 157} {"train_loss": -4.892162322998047, "global_step": 6610, "epoch": 157} {"train_loss": -4.790743350982666, "global_step": 6611, "epoch": 157} {"train_loss": -4.574148654937744, "global_step": 6612, "epoch": 157} {"train_loss": -5.004308700561523, "global_step": 6613, "epoch": 157} {"train_loss": -4.866405963897705, "global_step": 6614, "epoch": 157} {"train_loss": -4.6621246337890625, "global_step": 6615, "epoch": 157} {"train_loss": -4.842504024505615, "global_step": 6616, "epoch": 157} {"train_loss": -4.934003829956055, "global_step": 6617, "epoch": 157} {"train_loss": -4.905280113220215, "global_step": 6618, "epoch": 157} {"train_loss": -4.798791885375977, "global_step": 6619, "epoch": 157} {"train_loss": -4.846047401428223, "global_step": 6620, "epoch": 157} {"train_loss": -5.112990379333496, "global_step": 6621, "epoch": 157} {"train_loss": -4.832643508911133, "global_step": 6622, "epoch": 157} {"train_loss": -4.8160400390625, "global_step": 6623, "epoch": 157} {"train_loss": -4.8122992515563965, "global_step": 6624, "epoch": 157} {"train_loss": -5.001274108886719, "global_step": 6625, "epoch": 157} {"train_loss": -4.652097225189209, "global_step": 6626, "epoch": 157} {"train_loss": -4.825505256652832, "global_step": 6627, "epoch": 157} {"train_loss": -4.9360833168029785, "global_step": 6628, "epoch": 157} {"train_loss": -4.855172157287598, "global_step": 6629, "epoch": 157} {"train_loss": -4.89096736907959, "global_step": 6630, "epoch": 157} {"train_loss": -4.975608825683594, "global_step": 6631, "epoch": 157} {"train_loss": -4.842609405517578, "global_step": 6632, "epoch": 157} {"train_loss": -4.856212615966797, "global_step": 6633, "epoch": 157} {"train_loss": -4.827502250671387, "global_step": 6634, "epoch": 157} {"train_loss": -4.850926614943004, "global_step": 6635, "epoch": 157, "val_loss": 77969.328125} {"train_loss": -4.845728874206543, "global_step": 6636, "epoch": 158} {"train_loss": -4.823493003845215, "global_step": 6637, "epoch": 158} {"train_loss": -4.952526092529297, "global_step": 6638, "epoch": 158} {"train_loss": -4.885646820068359, "global_step": 6639, "epoch": 158} {"train_loss": -5.048883438110352, "global_step": 6640, "epoch": 158} {"train_loss": -4.990181922912598, "global_step": 6641, "epoch": 158} {"train_loss": -4.829000473022461, "global_step": 6642, "epoch": 158} {"train_loss": -4.990729808807373, "global_step": 6643, "epoch": 158} {"train_loss": -4.994028091430664, "global_step": 6644, "epoch": 158} {"train_loss": -5.017941951751709, "global_step": 6645, "epoch": 158} {"train_loss": -4.958744525909424, "global_step": 6646, "epoch": 158} {"train_loss": -4.826634407043457, "global_step": 6647, "epoch": 158} {"train_loss": -4.846904277801514, "global_step": 6648, "epoch": 158} {"train_loss": -5.003907203674316, "global_step": 6649, "epoch": 158} {"train_loss": -4.869140148162842, "global_step": 6650, "epoch": 158} {"train_loss": -4.790401458740234, "global_step": 6651, "epoch": 158} {"train_loss": -4.801949501037598, "global_step": 6652, "epoch": 158} {"train_loss": -4.863434791564941, "global_step": 6653, "epoch": 158} {"train_loss": -4.875863075256348, "global_step": 6654, "epoch": 158} {"train_loss": -4.684352874755859, "global_step": 6655, "epoch": 158} {"train_loss": -4.722538948059082, "global_step": 6656, "epoch": 158} {"train_loss": -4.95944881439209, "global_step": 6657, "epoch": 158} {"train_loss": -4.769296169281006, "global_step": 6658, "epoch": 158} {"train_loss": -4.817824363708496, "global_step": 6659, "epoch": 158} {"train_loss": -4.960866928100586, "global_step": 6660, "epoch": 158} {"train_loss": -4.783875942230225, "global_step": 6661, "epoch": 158} {"train_loss": -4.895282745361328, "global_step": 6662, "epoch": 158} {"train_loss": -4.999282360076904, "global_step": 6663, "epoch": 158} {"train_loss": -4.934159278869629, "global_step": 6664, "epoch": 158} {"train_loss": -4.7395758628845215, "global_step": 6665, "epoch": 158} {"train_loss": -4.819093704223633, "global_step": 6666, "epoch": 158} {"train_loss": -4.961660385131836, "global_step": 6667, "epoch": 158} {"train_loss": -4.919997215270996, "global_step": 6668, "epoch": 158} {"train_loss": -4.763088226318359, "global_step": 6669, "epoch": 158} {"train_loss": -4.877424240112305, "global_step": 6670, "epoch": 158} {"train_loss": -4.938696384429932, "global_step": 6671, "epoch": 158} {"train_loss": -4.880965232849121, "global_step": 6672, "epoch": 158} {"train_loss": -4.730775356292725, "global_step": 6673, "epoch": 158} {"train_loss": -4.850372791290283, "global_step": 6674, "epoch": 158} {"train_loss": -4.8972392082214355, "global_step": 6675, "epoch": 158} {"train_loss": -4.99916934967041, "global_step": 6676, "epoch": 158} {"train_loss": -4.87705533845084, "global_step": 6677, "epoch": 158, "val_loss": 77591.8515625} {"train_loss": -4.796167373657227, "global_step": 6678, "epoch": 159} {"train_loss": -4.886246681213379, "global_step": 6679, "epoch": 159} {"train_loss": -4.849843502044678, "global_step": 6680, "epoch": 159} {"train_loss": -4.791193962097168, "global_step": 6681, "epoch": 159} {"train_loss": -4.907586097717285, "global_step": 6682, "epoch": 159} {"train_loss": -4.694693088531494, "global_step": 6683, "epoch": 159} {"train_loss": -4.934746742248535, "global_step": 6684, "epoch": 159} {"train_loss": -4.783544540405273, "global_step": 6685, "epoch": 159} {"train_loss": -4.8311052322387695, "global_step": 6686, "epoch": 159} {"train_loss": -4.923885822296143, "global_step": 6687, "epoch": 159} {"train_loss": -4.784464359283447, "global_step": 6688, "epoch": 159} {"train_loss": -4.827391147613525, "global_step": 6689, "epoch": 159} {"train_loss": -4.884932994842529, "global_step": 6690, "epoch": 159} {"train_loss": -4.708381175994873, "global_step": 6691, "epoch": 159} {"train_loss": -4.852153778076172, "global_step": 6692, "epoch": 159} {"train_loss": -4.834310531616211, "global_step": 6693, "epoch": 159} {"train_loss": -4.905134201049805, "global_step": 6694, "epoch": 159} {"train_loss": -4.920061111450195, "global_step": 6695, "epoch": 159} {"train_loss": -5.018688201904297, "global_step": 6696, "epoch": 159} {"train_loss": -4.842225074768066, "global_step": 6697, "epoch": 159} {"train_loss": -4.860342025756836, "global_step": 6698, "epoch": 159} {"train_loss": -4.998966217041016, "global_step": 6699, "epoch": 159} {"train_loss": -4.9440999031066895, "global_step": 6700, "epoch": 159} {"train_loss": -4.820667743682861, "global_step": 6701, "epoch": 159} {"train_loss": -4.966842174530029, "global_step": 6702, "epoch": 159} {"train_loss": -4.916745662689209, "global_step": 6703, "epoch": 159} {"train_loss": -4.849512100219727, "global_step": 6704, "epoch": 159} {"train_loss": -4.8149871826171875, "global_step": 6705, "epoch": 159} {"train_loss": -4.788899898529053, "global_step": 6706, "epoch": 159} {"train_loss": -4.723820209503174, "global_step": 6707, "epoch": 159} {"train_loss": -4.984720230102539, "global_step": 6708, "epoch": 159} {"train_loss": -4.820890426635742, "global_step": 6709, "epoch": 159} {"train_loss": -4.991733551025391, "global_step": 6710, "epoch": 159} {"train_loss": -4.939153671264648, "global_step": 6711, "epoch": 159} {"train_loss": -4.892215728759766, "global_step": 6712, "epoch": 159} {"train_loss": -4.713316917419434, "global_step": 6713, "epoch": 159} {"train_loss": -4.755435466766357, "global_step": 6714, "epoch": 159} {"train_loss": -4.921098232269287, "global_step": 6715, "epoch": 159} {"train_loss": -5.027986526489258, "global_step": 6716, "epoch": 159} {"train_loss": -4.639887809753418, "global_step": 6717, "epoch": 159} {"train_loss": -4.841029167175293, "global_step": 6718, "epoch": 159} {"train_loss": -4.859465178989229, "global_step": 6719, "epoch": 159, "val_loss": 76975.0546875} {"train_loss": -4.859878063201904, "global_step": 6720, "epoch": 160} {"train_loss": -4.961388111114502, "global_step": 6721, "epoch": 160} {"train_loss": -4.836559772491455, "global_step": 6722, "epoch": 160} {"train_loss": -4.869964122772217, "global_step": 6723, "epoch": 160} {"train_loss": -4.695822715759277, "global_step": 6724, "epoch": 160} {"train_loss": -4.926554203033447, "global_step": 6725, "epoch": 160} {"train_loss": -4.930207252502441, "global_step": 6726, "epoch": 160} {"train_loss": -4.577392578125, "global_step": 6727, "epoch": 160} {"train_loss": -4.945377826690674, "global_step": 6728, "epoch": 160} {"train_loss": -4.808603286743164, "global_step": 6729, "epoch": 160} {"train_loss": -4.885521411895752, "global_step": 6730, "epoch": 160} {"train_loss": -4.847363471984863, "global_step": 6731, "epoch": 160} {"train_loss": -4.858267784118652, "global_step": 6732, "epoch": 160} {"train_loss": -4.593404293060303, "global_step": 6733, "epoch": 160} {"train_loss": -4.886822700500488, "global_step": 6734, "epoch": 160} {"train_loss": -4.835421562194824, "global_step": 6735, "epoch": 160} {"train_loss": -4.66242790222168, "global_step": 6736, "epoch": 160} {"train_loss": -4.940253257751465, "global_step": 6737, "epoch": 160} {"train_loss": -4.879344940185547, "global_step": 6738, "epoch": 160} {"train_loss": -4.855106353759766, "global_step": 6739, "epoch": 160} {"train_loss": -4.882025241851807, "global_step": 6740, "epoch": 160} {"train_loss": -4.893729209899902, "global_step": 6741, "epoch": 160} {"train_loss": -4.812259674072266, "global_step": 6742, "epoch": 160} {"train_loss": -4.878838539123535, "global_step": 6743, "epoch": 160} {"train_loss": -4.866243362426758, "global_step": 6744, "epoch": 160} {"train_loss": -4.713135719299316, "global_step": 6745, "epoch": 160} {"train_loss": -4.803228378295898, "global_step": 6746, "epoch": 160} {"train_loss": -4.8259968757629395, "global_step": 6747, "epoch": 160} {"train_loss": -4.896699905395508, "global_step": 6748, "epoch": 160} {"train_loss": -4.836822509765625, "global_step": 6749, "epoch": 160} {"train_loss": -4.93681526184082, "global_step": 6750, "epoch": 160} {"train_loss": -4.848644256591797, "global_step": 6751, "epoch": 160} {"train_loss": -4.894105911254883, "global_step": 6752, "epoch": 160} {"train_loss": -4.881328105926514, "global_step": 6753, "epoch": 160} {"train_loss": -4.877435684204102, "global_step": 6754, "epoch": 160} {"train_loss": -4.923003196716309, "global_step": 6755, "epoch": 160} {"train_loss": -5.004978656768799, "global_step": 6756, "epoch": 160} {"train_loss": -4.9998779296875, "global_step": 6757, "epoch": 160} {"train_loss": -4.903677940368652, "global_step": 6758, "epoch": 160} {"train_loss": -4.738789081573486, "global_step": 6759, "epoch": 160} {"train_loss": -4.696467876434326, "global_step": 6760, "epoch": 160} {"train_loss": -4.851152261098226, "global_step": 6761, "epoch": 160, "val_loss": 76396.4296875} {"train_loss": -4.849508762359619, "global_step": 6762, "epoch": 161} {"train_loss": -4.944589614868164, "global_step": 6763, "epoch": 161} {"train_loss": -4.93094539642334, "global_step": 6764, "epoch": 161} {"train_loss": -4.9187164306640625, "global_step": 6765, "epoch": 161} {"train_loss": -4.773413181304932, "global_step": 6766, "epoch": 161} {"train_loss": -4.869865894317627, "global_step": 6767, "epoch": 161} {"train_loss": -4.963094711303711, "global_step": 6768, "epoch": 161} {"train_loss": -4.974100112915039, "global_step": 6769, "epoch": 161} {"train_loss": -4.827759265899658, "global_step": 6770, "epoch": 161} {"train_loss": -5.0011491775512695, "global_step": 6771, "epoch": 161} {"train_loss": -4.918007850646973, "global_step": 6772, "epoch": 161} {"train_loss": -5.015023231506348, "global_step": 6773, "epoch": 161} {"train_loss": -4.873603343963623, "global_step": 6774, "epoch": 161} {"train_loss": -4.73933744430542, "global_step": 6775, "epoch": 161} {"train_loss": -4.583507537841797, "global_step": 6776, "epoch": 161} {"train_loss": -4.935577869415283, "global_step": 6777, "epoch": 161} {"train_loss": -4.869582653045654, "global_step": 6778, "epoch": 161} {"train_loss": -4.968894958496094, "global_step": 6779, "epoch": 161} {"train_loss": -4.726047515869141, "global_step": 6780, "epoch": 161} {"train_loss": -4.928987503051758, "global_step": 6781, "epoch": 161} {"train_loss": -4.879944801330566, "global_step": 6782, "epoch": 161} {"train_loss": -4.96098518371582, "global_step": 6783, "epoch": 161} {"train_loss": -4.915191650390625, "global_step": 6784, "epoch": 161} {"train_loss": -4.81847620010376, "global_step": 6785, "epoch": 161} {"train_loss": -4.912405967712402, "global_step": 6786, "epoch": 161} {"train_loss": -4.938085079193115, "global_step": 6787, "epoch": 161} {"train_loss": -4.8552045822143555, "global_step": 6788, "epoch": 161} {"train_loss": -4.925156593322754, "global_step": 6789, "epoch": 161} {"train_loss": -4.786237716674805, "global_step": 6790, "epoch": 161} {"train_loss": -4.9331254959106445, "global_step": 6791, "epoch": 161} {"train_loss": -4.887149810791016, "global_step": 6792, "epoch": 161} {"train_loss": -4.8861212730407715, "global_step": 6793, "epoch": 161} {"train_loss": -4.995149612426758, "global_step": 6794, "epoch": 161} {"train_loss": -4.790292739868164, "global_step": 6795, "epoch": 161} {"train_loss": -4.911683559417725, "global_step": 6796, "epoch": 161} {"train_loss": -4.8189544677734375, "global_step": 6797, "epoch": 161} {"train_loss": -4.991674423217773, "global_step": 6798, "epoch": 161} {"train_loss": -4.917015075683594, "global_step": 6799, "epoch": 161} {"train_loss": -4.671229362487793, "global_step": 6800, "epoch": 161} {"train_loss": -4.735878944396973, "global_step": 6801, "epoch": 161} {"train_loss": -4.9773173332214355, "global_step": 6802, "epoch": 161} {"train_loss": -4.879910162517002, "global_step": 6803, "epoch": 161, "val_loss": 76634.1015625} {"train_loss": -4.885785102844238, "global_step": 6804, "epoch": 162} {"train_loss": -4.866935729980469, "global_step": 6805, "epoch": 162} {"train_loss": -4.851070880889893, "global_step": 6806, "epoch": 162} {"train_loss": -4.97925329208374, "global_step": 6807, "epoch": 162} {"train_loss": -4.928498268127441, "global_step": 6808, "epoch": 162} {"train_loss": -4.901307106018066, "global_step": 6809, "epoch": 162} {"train_loss": -4.7888288497924805, "global_step": 6810, "epoch": 162} {"train_loss": -4.850860595703125, "global_step": 6811, "epoch": 162} {"train_loss": -4.828742504119873, "global_step": 6812, "epoch": 162} {"train_loss": -4.874081611633301, "global_step": 6813, "epoch": 162} {"train_loss": -4.941697120666504, "global_step": 6814, "epoch": 162} {"train_loss": -5.013587474822998, "global_step": 6815, "epoch": 162} {"train_loss": -4.937557220458984, "global_step": 6816, "epoch": 162} {"train_loss": -4.950156211853027, "global_step": 6817, "epoch": 162} {"train_loss": -5.046194076538086, "global_step": 6818, "epoch": 162} {"train_loss": -4.859131813049316, "global_step": 6819, "epoch": 162} {"train_loss": -4.933635711669922, "global_step": 6820, "epoch": 162} {"train_loss": -4.9550251960754395, "global_step": 6821, "epoch": 162} {"train_loss": -5.000059127807617, "global_step": 6822, "epoch": 162} {"train_loss": -4.802202224731445, "global_step": 6823, "epoch": 162} {"train_loss": -4.764235496520996, "global_step": 6824, "epoch": 162} {"train_loss": -4.732022285461426, "global_step": 6825, "epoch": 162} {"train_loss": -4.931440353393555, "global_step": 6826, "epoch": 162} {"train_loss": -5.01824426651001, "global_step": 6827, "epoch": 162} {"train_loss": -4.805201530456543, "global_step": 6828, "epoch": 162} {"train_loss": -4.793654441833496, "global_step": 6829, "epoch": 162} {"train_loss": -4.7951250076293945, "global_step": 6830, "epoch": 162} {"train_loss": -4.90017032623291, "global_step": 6831, "epoch": 162} {"train_loss": -4.896633148193359, "global_step": 6832, "epoch": 162} {"train_loss": -4.730761528015137, "global_step": 6833, "epoch": 162} {"train_loss": -4.911436557769775, "global_step": 6834, "epoch": 162} {"train_loss": -4.791470527648926, "global_step": 6835, "epoch": 162} {"train_loss": -4.915869235992432, "global_step": 6836, "epoch": 162} {"train_loss": -5.007887840270996, "global_step": 6837, "epoch": 162} {"train_loss": -4.881938934326172, "global_step": 6838, "epoch": 162} {"train_loss": -4.834533214569092, "global_step": 6839, "epoch": 162} {"train_loss": -4.919769287109375, "global_step": 6840, "epoch": 162} {"train_loss": -4.978191375732422, "global_step": 6841, "epoch": 162} {"train_loss": -4.95147705078125, "global_step": 6842, "epoch": 162} {"train_loss": -4.851826190948486, "global_step": 6843, "epoch": 162} {"train_loss": -4.746451377868652, "global_step": 6844, "epoch": 162} {"train_loss": -4.883595546086629, "global_step": 6845, "epoch": 162, "val_loss": 76187.28125} {"train_loss": -5.012225151062012, "global_step": 6846, "epoch": 163} {"train_loss": -4.752204418182373, "global_step": 6847, "epoch": 163} {"train_loss": -4.796710014343262, "global_step": 6848, "epoch": 163} {"train_loss": -4.710765838623047, "global_step": 6849, "epoch": 163} {"train_loss": -4.941064357757568, "global_step": 6850, "epoch": 163} {"train_loss": -4.819118499755859, "global_step": 6851, "epoch": 163} {"train_loss": -4.995790481567383, "global_step": 6852, "epoch": 163} {"train_loss": -4.707058906555176, "global_step": 6853, "epoch": 163} {"train_loss": -4.89426326751709, "global_step": 6854, "epoch": 163} {"train_loss": -4.877956867218018, "global_step": 6855, "epoch": 163} {"train_loss": -4.753269195556641, "global_step": 6856, "epoch": 163} {"train_loss": -4.811383247375488, "global_step": 6857, "epoch": 163} {"train_loss": -4.8952484130859375, "global_step": 6858, "epoch": 163} {"train_loss": -5.007027626037598, "global_step": 6859, "epoch": 163} {"train_loss": -4.794121265411377, "global_step": 6860, "epoch": 163} {"train_loss": -4.877981662750244, "global_step": 6861, "epoch": 163} {"train_loss": -4.785825729370117, "global_step": 6862, "epoch": 163} {"train_loss": -4.984125137329102, "global_step": 6863, "epoch": 163} {"train_loss": -4.917477130889893, "global_step": 6864, "epoch": 163} {"train_loss": -4.9694013595581055, "global_step": 6865, "epoch": 163} {"train_loss": -4.76690149307251, "global_step": 6866, "epoch": 163} {"train_loss": -4.941483020782471, "global_step": 6867, "epoch": 163} {"train_loss": -4.900047302246094, "global_step": 6868, "epoch": 163} {"train_loss": -4.795612812042236, "global_step": 6869, "epoch": 163} {"train_loss": -4.891119956970215, "global_step": 6870, "epoch": 163} {"train_loss": -4.937487602233887, "global_step": 6871, "epoch": 163} {"train_loss": -4.925317764282227, "global_step": 6872, "epoch": 163} {"train_loss": -4.889108657836914, "global_step": 6873, "epoch": 163} {"train_loss": -4.9345808029174805, "global_step": 6874, "epoch": 163} {"train_loss": -4.77360725402832, "global_step": 6875, "epoch": 163} {"train_loss": -4.826259613037109, "global_step": 6876, "epoch": 163} {"train_loss": -4.962081432342529, "global_step": 6877, "epoch": 163} {"train_loss": -5.012025833129883, "global_step": 6878, "epoch": 163} {"train_loss": -4.9010090827941895, "global_step": 6879, "epoch": 163} {"train_loss": -4.864311218261719, "global_step": 6880, "epoch": 163} {"train_loss": -4.919071197509766, "global_step": 6881, "epoch": 163} {"train_loss": -4.946303844451904, "global_step": 6882, "epoch": 163} {"train_loss": -4.920886993408203, "global_step": 6883, "epoch": 163} {"train_loss": -4.953466892242432, "global_step": 6884, "epoch": 163} {"train_loss": -4.953972816467285, "global_step": 6885, "epoch": 163} {"train_loss": -4.947141170501709, "global_step": 6886, "epoch": 163} {"train_loss": -4.880188567297799, "global_step": 6887, "epoch": 163, "val_loss": 75775.21875} {"train_loss": -4.802016735076904, "global_step": 6888, "epoch": 164} {"train_loss": -4.841853141784668, "global_step": 6889, "epoch": 164} {"train_loss": -4.879839897155762, "global_step": 6890, "epoch": 164} {"train_loss": -4.613760948181152, "global_step": 6891, "epoch": 164} {"train_loss": -4.9200005531311035, "global_step": 6892, "epoch": 164} {"train_loss": -4.9273295402526855, "global_step": 6893, "epoch": 164} {"train_loss": -4.719133377075195, "global_step": 6894, "epoch": 164} {"train_loss": -4.354376792907715, "global_step": 6895, "epoch": 164} {"train_loss": -4.938732147216797, "global_step": 6896, "epoch": 164} {"train_loss": -4.598360061645508, "global_step": 6897, "epoch": 164} {"train_loss": -4.553036689758301, "global_step": 6898, "epoch": 164} {"train_loss": -4.97486686706543, "global_step": 6899, "epoch": 164} {"train_loss": -4.440027713775635, "global_step": 6900, "epoch": 164} {"train_loss": -4.886117935180664, "global_step": 6901, "epoch": 164} {"train_loss": -4.697319507598877, "global_step": 6902, "epoch": 164} {"train_loss": -4.605776786804199, "global_step": 6903, "epoch": 164} {"train_loss": -4.749820709228516, "global_step": 6904, "epoch": 164} {"train_loss": -4.811561107635498, "global_step": 6905, "epoch": 164} {"train_loss": -4.855030059814453, "global_step": 6906, "epoch": 164} {"train_loss": -4.815586566925049, "global_step": 6907, "epoch": 164} {"train_loss": -4.984046459197998, "global_step": 6908, "epoch": 164} {"train_loss": -4.799802780151367, "global_step": 6909, "epoch": 164} {"train_loss": -4.728394508361816, "global_step": 6910, "epoch": 164} {"train_loss": -4.893805027008057, "global_step": 6911, "epoch": 164} {"train_loss": -4.849366664886475, "global_step": 6912, "epoch": 164} {"train_loss": -4.870553970336914, "global_step": 6913, "epoch": 164} {"train_loss": -5.0002031326293945, "global_step": 6914, "epoch": 164} {"train_loss": -4.9321746826171875, "global_step": 6915, "epoch": 164} {"train_loss": -4.806999683380127, "global_step": 6916, "epoch": 164} {"train_loss": -4.819867134094238, "global_step": 6917, "epoch": 164} {"train_loss": -4.938604354858398, "global_step": 6918, "epoch": 164} {"train_loss": -4.978554725646973, "global_step": 6919, "epoch": 164} {"train_loss": -4.746404647827148, "global_step": 6920, "epoch": 164} {"train_loss": -4.891260147094727, "global_step": 6921, "epoch": 164} {"train_loss": -4.865822792053223, "global_step": 6922, "epoch": 164} {"train_loss": -4.862117290496826, "global_step": 6923, "epoch": 164} {"train_loss": -4.831145286560059, "global_step": 6924, "epoch": 164} {"train_loss": -4.926337718963623, "global_step": 6925, "epoch": 164} {"train_loss": -4.976381778717041, "global_step": 6926, "epoch": 164} {"train_loss": -4.9370317459106445, "global_step": 6927, "epoch": 164} {"train_loss": -4.791415214538574, "global_step": 6928, "epoch": 164} {"train_loss": -4.818435827891032, "global_step": 6929, "epoch": 164, "val_loss": 75682.671875} {"train_loss": -4.998902320861816, "global_step": 6930, "epoch": 165} {"train_loss": -4.9833083152771, "global_step": 6931, "epoch": 165} {"train_loss": -4.795915603637695, "global_step": 6932, "epoch": 165} {"train_loss": -4.891861438751221, "global_step": 6933, "epoch": 165} {"train_loss": -5.0218024253845215, "global_step": 6934, "epoch": 165} {"train_loss": -5.026012420654297, "global_step": 6935, "epoch": 165} {"train_loss": -4.939960479736328, "global_step": 6936, "epoch": 165} {"train_loss": -4.899248123168945, "global_step": 6937, "epoch": 165} {"train_loss": -4.83695125579834, "global_step": 6938, "epoch": 165} {"train_loss": -5.07745885848999, "global_step": 6939, "epoch": 165} {"train_loss": -4.762465476989746, "global_step": 6940, "epoch": 165} {"train_loss": -4.944723606109619, "global_step": 6941, "epoch": 165} {"train_loss": -4.915666103363037, "global_step": 6942, "epoch": 165} {"train_loss": -4.835955619812012, "global_step": 6943, "epoch": 165} {"train_loss": -5.017011642456055, "global_step": 6944, "epoch": 165} {"train_loss": -4.948090076446533, "global_step": 6945, "epoch": 165} {"train_loss": -5.002632141113281, "global_step": 6946, "epoch": 165} {"train_loss": -4.9759721755981445, "global_step": 6947, "epoch": 165} {"train_loss": -4.9333600997924805, "global_step": 6948, "epoch": 165} {"train_loss": -4.918587684631348, "global_step": 6949, "epoch": 165} {"train_loss": -4.73812198638916, "global_step": 6950, "epoch": 165} {"train_loss": -4.425573348999023, "global_step": 6951, "epoch": 165} {"train_loss": -4.597360610961914, "global_step": 6952, "epoch": 165} {"train_loss": -4.884594917297363, "global_step": 6953, "epoch": 165} {"train_loss": -5.069203853607178, "global_step": 6954, "epoch": 165} {"train_loss": -4.752911567687988, "global_step": 6955, "epoch": 165} {"train_loss": -4.725150108337402, "global_step": 6956, "epoch": 165} {"train_loss": -4.833675384521484, "global_step": 6957, "epoch": 165} {"train_loss": -4.962130069732666, "global_step": 6958, "epoch": 165} {"train_loss": -4.905755996704102, "global_step": 6959, "epoch": 165} {"train_loss": -4.90683650970459, "global_step": 6960, "epoch": 165} {"train_loss": -5.049128532409668, "global_step": 6961, "epoch": 165} {"train_loss": -4.925832748413086, "global_step": 6962, "epoch": 165} {"train_loss": -4.909198760986328, "global_step": 6963, "epoch": 165} {"train_loss": -5.025945663452148, "global_step": 6964, "epoch": 165} {"train_loss": -4.703205108642578, "global_step": 6965, "epoch": 165} {"train_loss": -4.753292083740234, "global_step": 6966, "epoch": 165} {"train_loss": -4.8197550773620605, "global_step": 6967, "epoch": 165} {"train_loss": -4.814640522003174, "global_step": 6968, "epoch": 165} {"train_loss": -4.7513885498046875, "global_step": 6969, "epoch": 165} {"train_loss": -5.00579309463501, "global_step": 6970, "epoch": 165} {"train_loss": -4.884220077877953, "global_step": 6971, "epoch": 165, "val_loss": 77093.734375} {"train_loss": -4.940853595733643, "global_step": 6972, "epoch": 166} {"train_loss": -4.8969621658325195, "global_step": 6973, "epoch": 166} {"train_loss": -4.88353157043457, "global_step": 6974, "epoch": 166} {"train_loss": -4.667003631591797, "global_step": 6975, "epoch": 166} {"train_loss": -4.875108242034912, "global_step": 6976, "epoch": 166} {"train_loss": -4.59064245223999, "global_step": 6977, "epoch": 166} {"train_loss": -4.771344184875488, "global_step": 6978, "epoch": 166} {"train_loss": -4.858329772949219, "global_step": 6979, "epoch": 166} {"train_loss": -4.551207065582275, "global_step": 6980, "epoch": 166} {"train_loss": -4.8716535568237305, "global_step": 6981, "epoch": 166} {"train_loss": -4.516252517700195, "global_step": 6982, "epoch": 166} {"train_loss": -4.915392875671387, "global_step": 6983, "epoch": 166} {"train_loss": -4.739768981933594, "global_step": 6984, "epoch": 166} {"train_loss": -4.558442115783691, "global_step": 6985, "epoch": 166} {"train_loss": -4.589849948883057, "global_step": 6986, "epoch": 166} {"train_loss": -4.796954154968262, "global_step": 6987, "epoch": 166} {"train_loss": -4.81768798828125, "global_step": 6988, "epoch": 166} {"train_loss": -4.52602481842041, "global_step": 6989, "epoch": 166} {"train_loss": -4.786715030670166, "global_step": 6990, "epoch": 166} {"train_loss": -4.788665771484375, "global_step": 6991, "epoch": 166} {"train_loss": -4.914407730102539, "global_step": 6992, "epoch": 166} {"train_loss": -4.824774265289307, "global_step": 6993, "epoch": 166} {"train_loss": -4.726952075958252, "global_step": 6994, "epoch": 166} {"train_loss": -4.771885871887207, "global_step": 6995, "epoch": 166} {"train_loss": -4.866555213928223, "global_step": 6996, "epoch": 166} {"train_loss": -4.705992698669434, "global_step": 6997, "epoch": 166} {"train_loss": -4.861929416656494, "global_step": 6998, "epoch": 166} {"train_loss": -4.7771759033203125, "global_step": 6999, "epoch": 166} {"train_loss": -4.674948692321777, "global_step": 7000, "epoch": 166} {"train_loss": -4.935421466827393, "global_step": 7001, "epoch": 166} {"train_loss": -4.972569942474365, "global_step": 7002, "epoch": 166} {"train_loss": -4.907237529754639, "global_step": 7003, "epoch": 166} {"train_loss": -4.901883602142334, "global_step": 7004, "epoch": 166} {"train_loss": -4.84104585647583, "global_step": 7005, "epoch": 166} {"train_loss": -4.9463887214660645, "global_step": 7006, "epoch": 166} {"train_loss": -4.859067916870117, "global_step": 7007, "epoch": 166} {"train_loss": -4.951839447021484, "global_step": 7008, "epoch": 166} {"train_loss": -4.890030384063721, "global_step": 7009, "epoch": 166} {"train_loss": -4.886148929595947, "global_step": 7010, "epoch": 166} {"train_loss": -4.897950172424316, "global_step": 7011, "epoch": 166} {"train_loss": -4.965949058532715, "global_step": 7012, "epoch": 166} {"train_loss": -4.809705075763521, "global_step": 7013, "epoch": 166, "val_loss": 76143.8125} {"train_loss": -4.894099235534668, "global_step": 7014, "epoch": 167} {"train_loss": -4.813337326049805, "global_step": 7015, "epoch": 167} {"train_loss": -4.945229530334473, "global_step": 7016, "epoch": 167} {"train_loss": -4.861723899841309, "global_step": 7017, "epoch": 167} {"train_loss": -4.737380027770996, "global_step": 7018, "epoch": 167} {"train_loss": -4.97329044342041, "global_step": 7019, "epoch": 167} {"train_loss": -4.976879119873047, "global_step": 7020, "epoch": 167} {"train_loss": -4.932332515716553, "global_step": 7021, "epoch": 167} {"train_loss": -4.951881408691406, "global_step": 7022, "epoch": 167} {"train_loss": -5.0940446853637695, "global_step": 7023, "epoch": 167} {"train_loss": -4.900129795074463, "global_step": 7024, "epoch": 167} {"train_loss": -4.970239162445068, "global_step": 7025, "epoch": 167} {"train_loss": -4.853598117828369, "global_step": 7026, "epoch": 167} {"train_loss": -4.904244422912598, "global_step": 7027, "epoch": 167} {"train_loss": -4.848984241485596, "global_step": 7028, "epoch": 167} {"train_loss": -4.914920330047607, "global_step": 7029, "epoch": 167} {"train_loss": -4.88975191116333, "global_step": 7030, "epoch": 167} {"train_loss": -4.86539888381958, "global_step": 7031, "epoch": 167} {"train_loss": -4.906257629394531, "global_step": 7032, "epoch": 167} {"train_loss": -4.961717128753662, "global_step": 7033, "epoch": 167} {"train_loss": -4.952422142028809, "global_step": 7034, "epoch": 167} {"train_loss": -4.892024993896484, "global_step": 7035, "epoch": 167} {"train_loss": -4.838443756103516, "global_step": 7036, "epoch": 167} {"train_loss": -4.750496864318848, "global_step": 7037, "epoch": 167} {"train_loss": -4.563902854919434, "global_step": 7038, "epoch": 167} {"train_loss": -4.680025577545166, "global_step": 7039, "epoch": 167} {"train_loss": -5.016541481018066, "global_step": 7040, "epoch": 167} {"train_loss": -4.8058037757873535, "global_step": 7041, "epoch": 167} {"train_loss": -4.4424591064453125, "global_step": 7042, "epoch": 167} {"train_loss": -4.917594909667969, "global_step": 7043, "epoch": 167} {"train_loss": -4.652595043182373, "global_step": 7044, "epoch": 167} {"train_loss": -4.557847023010254, "global_step": 7045, "epoch": 167} {"train_loss": -4.845849990844727, "global_step": 7046, "epoch": 167} {"train_loss": -4.444930553436279, "global_step": 7047, "epoch": 167} {"train_loss": -4.906237602233887, "global_step": 7048, "epoch": 167} {"train_loss": -4.499523162841797, "global_step": 7049, "epoch": 167} {"train_loss": -4.904397010803223, "global_step": 7050, "epoch": 167} {"train_loss": -4.717604637145996, "global_step": 7051, "epoch": 167} {"train_loss": -4.912223815917969, "global_step": 7052, "epoch": 167} {"train_loss": -4.6075897216796875, "global_step": 7053, "epoch": 167} {"train_loss": -4.863096237182617, "global_step": 7054, "epoch": 167} {"train_loss": -4.826250871022542, "global_step": 7055, "epoch": 167, "val_loss": 75781.125} {"train_loss": -4.695250034332275, "global_step": 7056, "epoch": 168} {"train_loss": -4.803079128265381, "global_step": 7057, "epoch": 168} {"train_loss": -4.939019203186035, "global_step": 7058, "epoch": 168} {"train_loss": -4.69779634475708, "global_step": 7059, "epoch": 168} {"train_loss": -5.011066436767578, "global_step": 7060, "epoch": 168} {"train_loss": -4.808647632598877, "global_step": 7061, "epoch": 168} {"train_loss": -4.948243141174316, "global_step": 7062, "epoch": 168} {"train_loss": -4.871288299560547, "global_step": 7063, "epoch": 168} {"train_loss": -4.860991477966309, "global_step": 7064, "epoch": 168} {"train_loss": -4.8121747970581055, "global_step": 7065, "epoch": 168} {"train_loss": -4.892897605895996, "global_step": 7066, "epoch": 168} {"train_loss": -4.9323272705078125, "global_step": 7067, "epoch": 168} {"train_loss": -4.869349002838135, "global_step": 7068, "epoch": 168} {"train_loss": -4.867918014526367, "global_step": 7069, "epoch": 168} {"train_loss": -4.8402838706970215, "global_step": 7070, "epoch": 168} {"train_loss": -4.889218330383301, "global_step": 7071, "epoch": 168} {"train_loss": -4.850863456726074, "global_step": 7072, "epoch": 168} {"train_loss": -4.832850456237793, "global_step": 7073, "epoch": 168} {"train_loss": -4.7701311111450195, "global_step": 7074, "epoch": 168} {"train_loss": -4.870208740234375, "global_step": 7075, "epoch": 168} {"train_loss": -4.876991271972656, "global_step": 7076, "epoch": 168} {"train_loss": -4.856419563293457, "global_step": 7077, "epoch": 168} {"train_loss": -4.824300765991211, "global_step": 7078, "epoch": 168} {"train_loss": -4.736893653869629, "global_step": 7079, "epoch": 168} {"train_loss": -4.9247236251831055, "global_step": 7080, "epoch": 168} {"train_loss": -4.927049160003662, "global_step": 7081, "epoch": 168} {"train_loss": -4.844845771789551, "global_step": 7082, "epoch": 168} {"train_loss": -4.799520492553711, "global_step": 7083, "epoch": 168} {"train_loss": -4.840821266174316, "global_step": 7084, "epoch": 168} {"train_loss": -4.776297569274902, "global_step": 7085, "epoch": 168} {"train_loss": -5.020723342895508, "global_step": 7086, "epoch": 168} {"train_loss": -4.88120174407959, "global_step": 7087, "epoch": 168} {"train_loss": -4.854169845581055, "global_step": 7088, "epoch": 168} {"train_loss": -4.932062149047852, "global_step": 7089, "epoch": 168} {"train_loss": -4.757120132446289, "global_step": 7090, "epoch": 168} {"train_loss": -4.784692764282227, "global_step": 7091, "epoch": 168} {"train_loss": -4.8240532875061035, "global_step": 7092, "epoch": 168} {"train_loss": -4.9472246170043945, "global_step": 7093, "epoch": 168} {"train_loss": -4.796182155609131, "global_step": 7094, "epoch": 168} {"train_loss": -4.865145206451416, "global_step": 7095, "epoch": 168} {"train_loss": -4.983736038208008, "global_step": 7096, "epoch": 168} {"train_loss": -4.857897996902466, "global_step": 7097, "epoch": 168, "val_loss": 75310.2421875} {"train_loss": -5.1103620529174805, "global_step": 7098, "epoch": 169} {"train_loss": -4.952522277832031, "global_step": 7099, "epoch": 169} {"train_loss": -5.026623725891113, "global_step": 7100, "epoch": 169} {"train_loss": -4.934109687805176, "global_step": 7101, "epoch": 169} {"train_loss": -4.947994709014893, "global_step": 7102, "epoch": 169} {"train_loss": -4.942680358886719, "global_step": 7103, "epoch": 169} {"train_loss": -4.967430114746094, "global_step": 7104, "epoch": 169} {"train_loss": -5.006715297698975, "global_step": 7105, "epoch": 169} {"train_loss": -4.96997594833374, "global_step": 7106, "epoch": 169} {"train_loss": -4.861270904541016, "global_step": 7107, "epoch": 169} {"train_loss": -4.775033950805664, "global_step": 7108, "epoch": 169} {"train_loss": -4.860287189483643, "global_step": 7109, "epoch": 169} {"train_loss": -5.053092956542969, "global_step": 7110, "epoch": 169} {"train_loss": -4.964162826538086, "global_step": 7111, "epoch": 169} {"train_loss": -4.968677520751953, "global_step": 7112, "epoch": 169} {"train_loss": -4.847777843475342, "global_step": 7113, "epoch": 169} {"train_loss": -4.953322410583496, "global_step": 7114, "epoch": 169} {"train_loss": -4.8540754318237305, "global_step": 7115, "epoch": 169} {"train_loss": -4.744915962219238, "global_step": 7116, "epoch": 169} {"train_loss": -4.910580635070801, "global_step": 7117, "epoch": 169} {"train_loss": -4.8203349113464355, "global_step": 7118, "epoch": 169} {"train_loss": -4.850834846496582, "global_step": 7119, "epoch": 169} {"train_loss": -4.8007965087890625, "global_step": 7120, "epoch": 169} {"train_loss": -4.914595127105713, "global_step": 7121, "epoch": 169} {"train_loss": -4.8685455322265625, "global_step": 7122, "epoch": 169} {"train_loss": -4.911109924316406, "global_step": 7123, "epoch": 169} {"train_loss": -4.915616035461426, "global_step": 7124, "epoch": 169} {"train_loss": -5.040401458740234, "global_step": 7125, "epoch": 169} {"train_loss": -4.960994720458984, "global_step": 7126, "epoch": 169} {"train_loss": -4.891024589538574, "global_step": 7127, "epoch": 169} {"train_loss": -4.9012932777404785, "global_step": 7128, "epoch": 169} {"train_loss": -4.938082695007324, "global_step": 7129, "epoch": 169} {"train_loss": -4.940643787384033, "global_step": 7130, "epoch": 169} {"train_loss": -4.844115257263184, "global_step": 7131, "epoch": 169} {"train_loss": -4.880047798156738, "global_step": 7132, "epoch": 169} {"train_loss": -4.842986106872559, "global_step": 7133, "epoch": 169} {"train_loss": -4.827296257019043, "global_step": 7134, "epoch": 169} {"train_loss": -4.873824596405029, "global_step": 7135, "epoch": 169} {"train_loss": -4.887017250061035, "global_step": 7136, "epoch": 169} {"train_loss": -4.950522422790527, "global_step": 7137, "epoch": 169} {"train_loss": -4.974708080291748, "global_step": 7138, "epoch": 169} {"train_loss": -4.913713739031837, "global_step": 7139, "epoch": 169, "val_loss": 75474.6875} {"train_loss": -4.869407653808594, "global_step": 7140, "epoch": 170} {"train_loss": -4.897509574890137, "global_step": 7141, "epoch": 170} {"train_loss": -4.8201584815979, "global_step": 7142, "epoch": 170} {"train_loss": -4.960383892059326, "global_step": 7143, "epoch": 170} {"train_loss": -4.9969482421875, "global_step": 7144, "epoch": 170} {"train_loss": -4.949215412139893, "global_step": 7145, "epoch": 170} {"train_loss": -4.926225662231445, "global_step": 7146, "epoch": 170} {"train_loss": -4.9520721435546875, "global_step": 7147, "epoch": 170} {"train_loss": -4.899830341339111, "global_step": 7148, "epoch": 170} {"train_loss": -4.97578239440918, "global_step": 7149, "epoch": 170} {"train_loss": -4.892340660095215, "global_step": 7150, "epoch": 170} {"train_loss": -4.844430923461914, "global_step": 7151, "epoch": 170} {"train_loss": -4.989238262176514, "global_step": 7152, "epoch": 170} {"train_loss": -4.802623748779297, "global_step": 7153, "epoch": 170} {"train_loss": -4.742092132568359, "global_step": 7154, "epoch": 170} {"train_loss": -4.9112749099731445, "global_step": 7155, "epoch": 170} {"train_loss": -4.877025127410889, "global_step": 7156, "epoch": 170} {"train_loss": -5.0027031898498535, "global_step": 7157, "epoch": 170} {"train_loss": -4.798389434814453, "global_step": 7158, "epoch": 170} {"train_loss": -4.890734672546387, "global_step": 7159, "epoch": 170} {"train_loss": -4.880306243896484, "global_step": 7160, "epoch": 170} {"train_loss": -4.883479118347168, "global_step": 7161, "epoch": 170} {"train_loss": -4.936795234680176, "global_step": 7162, "epoch": 170} {"train_loss": -4.968111038208008, "global_step": 7163, "epoch": 170} {"train_loss": -4.965266227722168, "global_step": 7164, "epoch": 170} {"train_loss": -4.796817779541016, "global_step": 7165, "epoch": 170} {"train_loss": -4.839058876037598, "global_step": 7166, "epoch": 170} {"train_loss": -5.05449104309082, "global_step": 7167, "epoch": 170} {"train_loss": -4.9334259033203125, "global_step": 7168, "epoch": 170} {"train_loss": -4.922680854797363, "global_step": 7169, "epoch": 170} {"train_loss": -4.925759792327881, "global_step": 7170, "epoch": 170} {"train_loss": -5.064776420593262, "global_step": 7171, "epoch": 170} {"train_loss": -4.877931594848633, "global_step": 7172, "epoch": 170} {"train_loss": -4.982926368713379, "global_step": 7173, "epoch": 170} {"train_loss": -4.930609226226807, "global_step": 7174, "epoch": 170} {"train_loss": -4.966677665710449, "global_step": 7175, "epoch": 170} {"train_loss": -4.851952075958252, "global_step": 7176, "epoch": 170} {"train_loss": -4.958750247955322, "global_step": 7177, "epoch": 170} {"train_loss": -4.907731533050537, "global_step": 7178, "epoch": 170} {"train_loss": -4.83063268661499, "global_step": 7179, "epoch": 170} {"train_loss": -4.970416069030762, "global_step": 7180, "epoch": 170} {"train_loss": -4.915181318918864, "global_step": 7181, "epoch": 170, "val_loss": 75130.859375} {"train_loss": -4.935887336730957, "global_step": 7182, "epoch": 171} {"train_loss": -4.952571868896484, "global_step": 7183, "epoch": 171} {"train_loss": -4.941083908081055, "global_step": 7184, "epoch": 171} {"train_loss": -4.6750288009643555, "global_step": 7185, "epoch": 171} {"train_loss": -4.65589714050293, "global_step": 7186, "epoch": 171} {"train_loss": -4.7387285232543945, "global_step": 7187, "epoch": 171} {"train_loss": -4.8826494216918945, "global_step": 7188, "epoch": 171} {"train_loss": -4.917511940002441, "global_step": 7189, "epoch": 171} {"train_loss": -4.6882476806640625, "global_step": 7190, "epoch": 171} {"train_loss": -4.852138996124268, "global_step": 7191, "epoch": 171} {"train_loss": -5.031105995178223, "global_step": 7192, "epoch": 171} {"train_loss": -4.747389793395996, "global_step": 7193, "epoch": 171} {"train_loss": -4.855502128601074, "global_step": 7194, "epoch": 171} {"train_loss": -4.923090934753418, "global_step": 7195, "epoch": 171} {"train_loss": -4.775542736053467, "global_step": 7196, "epoch": 171} {"train_loss": -4.9045000076293945, "global_step": 7197, "epoch": 171} {"train_loss": -4.942702293395996, "global_step": 7198, "epoch": 171} {"train_loss": -4.8925862312316895, "global_step": 7199, "epoch": 171} {"train_loss": -4.856083869934082, "global_step": 7200, "epoch": 171} {"train_loss": -4.932241916656494, "global_step": 7201, "epoch": 171} {"train_loss": -4.903335094451904, "global_step": 7202, "epoch": 171} {"train_loss": -4.87455940246582, "global_step": 7203, "epoch": 171} {"train_loss": -4.928031921386719, "global_step": 7204, "epoch": 171} {"train_loss": -4.760619163513184, "global_step": 7205, "epoch": 171} {"train_loss": -4.922311782836914, "global_step": 7206, "epoch": 171} {"train_loss": -5.0622663497924805, "global_step": 7207, "epoch": 171} {"train_loss": -4.923338413238525, "global_step": 7208, "epoch": 171} {"train_loss": -4.927807331085205, "global_step": 7209, "epoch": 171} {"train_loss": -4.993966102600098, "global_step": 7210, "epoch": 171} {"train_loss": -4.857935905456543, "global_step": 7211, "epoch": 171} {"train_loss": -4.955600738525391, "global_step": 7212, "epoch": 171} {"train_loss": -4.949936866760254, "global_step": 7213, "epoch": 171} {"train_loss": -4.836660861968994, "global_step": 7214, "epoch": 171} {"train_loss": -4.925628662109375, "global_step": 7215, "epoch": 171} {"train_loss": -5.126272201538086, "global_step": 7216, "epoch": 171} {"train_loss": -4.984166145324707, "global_step": 7217, "epoch": 171} {"train_loss": -4.961747169494629, "global_step": 7218, "epoch": 171} {"train_loss": -4.86558723449707, "global_step": 7219, "epoch": 171} {"train_loss": -4.865729331970215, "global_step": 7220, "epoch": 171} {"train_loss": -4.9205322265625, "global_step": 7221, "epoch": 171} {"train_loss": -5.086383819580078, "global_step": 7222, "epoch": 171} {"train_loss": -4.89597243354434, "global_step": 7223, "epoch": 171, "val_loss": 75690.78125} {"train_loss": -4.856543064117432, "global_step": 7224, "epoch": 172} {"train_loss": -4.852418422698975, "global_step": 7225, "epoch": 172} {"train_loss": -4.858249664306641, "global_step": 7226, "epoch": 172} {"train_loss": -4.866101264953613, "global_step": 7227, "epoch": 172} {"train_loss": -5.063628673553467, "global_step": 7228, "epoch": 172} {"train_loss": -5.115036487579346, "global_step": 7229, "epoch": 172} {"train_loss": -4.945162773132324, "global_step": 7230, "epoch": 172} {"train_loss": -5.028924942016602, "global_step": 7231, "epoch": 172} {"train_loss": -4.921337127685547, "global_step": 7232, "epoch": 172} {"train_loss": -5.035341739654541, "global_step": 7233, "epoch": 172} {"train_loss": -4.8100128173828125, "global_step": 7234, "epoch": 172} {"train_loss": -4.819375038146973, "global_step": 7235, "epoch": 172} {"train_loss": -4.846225738525391, "global_step": 7236, "epoch": 172} {"train_loss": -4.824028968811035, "global_step": 7237, "epoch": 172} {"train_loss": -4.886654853820801, "global_step": 7238, "epoch": 172} {"train_loss": -4.937262535095215, "global_step": 7239, "epoch": 172} {"train_loss": -4.940466403961182, "global_step": 7240, "epoch": 172} {"train_loss": -4.826269149780273, "global_step": 7241, "epoch": 172} {"train_loss": -4.758491039276123, "global_step": 7242, "epoch": 172} {"train_loss": -4.890146732330322, "global_step": 7243, "epoch": 172} {"train_loss": -4.905078887939453, "global_step": 7244, "epoch": 172} {"train_loss": -4.953789234161377, "global_step": 7245, "epoch": 172} {"train_loss": -4.829891681671143, "global_step": 7246, "epoch": 172} {"train_loss": -5.038164138793945, "global_step": 7247, "epoch": 172} {"train_loss": -4.910345077514648, "global_step": 7248, "epoch": 172} {"train_loss": -4.71235466003418, "global_step": 7249, "epoch": 172} {"train_loss": -4.91628360748291, "global_step": 7250, "epoch": 172} {"train_loss": -5.054662704467773, "global_step": 7251, "epoch": 172} {"train_loss": -4.916661739349365, "global_step": 7252, "epoch": 172} {"train_loss": -4.8769025802612305, "global_step": 7253, "epoch": 172} {"train_loss": -5.0061798095703125, "global_step": 7254, "epoch": 172} {"train_loss": -4.90785026550293, "global_step": 7255, "epoch": 172} {"train_loss": -5.013535976409912, "global_step": 7256, "epoch": 172} {"train_loss": -4.926177501678467, "global_step": 7257, "epoch": 172} {"train_loss": -4.923832893371582, "global_step": 7258, "epoch": 172} {"train_loss": -4.951153755187988, "global_step": 7259, "epoch": 172} {"train_loss": -4.967723846435547, "global_step": 7260, "epoch": 172} {"train_loss": -4.9427642822265625, "global_step": 7261, "epoch": 172} {"train_loss": -4.961691379547119, "global_step": 7262, "epoch": 172} {"train_loss": -4.888840198516846, "global_step": 7263, "epoch": 172} {"train_loss": -4.876979827880859, "global_step": 7264, "epoch": 172} {"train_loss": -4.916901736032395, "global_step": 7265, "epoch": 172, "val_loss": 74532.890625} {"train_loss": -5.003892421722412, "global_step": 7266, "epoch": 173} {"train_loss": -4.881208419799805, "global_step": 7267, "epoch": 173} {"train_loss": -4.963621139526367, "global_step": 7268, "epoch": 173} {"train_loss": -4.728132247924805, "global_step": 7269, "epoch": 173} {"train_loss": -4.86257791519165, "global_step": 7270, "epoch": 173} {"train_loss": -4.866457939147949, "global_step": 7271, "epoch": 173} {"train_loss": -4.663692474365234, "global_step": 7272, "epoch": 173} {"train_loss": -4.79332160949707, "global_step": 7273, "epoch": 173} {"train_loss": -4.839715003967285, "global_step": 7274, "epoch": 173} {"train_loss": -4.896945953369141, "global_step": 7275, "epoch": 173} {"train_loss": -4.717939376831055, "global_step": 7276, "epoch": 173} {"train_loss": -4.904356002807617, "global_step": 7277, "epoch": 173} {"train_loss": -4.770893096923828, "global_step": 7278, "epoch": 173} {"train_loss": -5.026517868041992, "global_step": 7279, "epoch": 173} {"train_loss": -5.100469589233398, "global_step": 7280, "epoch": 173} {"train_loss": -4.7396650314331055, "global_step": 7281, "epoch": 173} {"train_loss": -4.829190254211426, "global_step": 7282, "epoch": 173} {"train_loss": -4.972939491271973, "global_step": 7283, "epoch": 173} {"train_loss": -5.034799575805664, "global_step": 7284, "epoch": 173} {"train_loss": -4.771360874176025, "global_step": 7285, "epoch": 173} {"train_loss": -4.9821648597717285, "global_step": 7286, "epoch": 173} {"train_loss": -4.937877655029297, "global_step": 7287, "epoch": 173} {"train_loss": -4.888124465942383, "global_step": 7288, "epoch": 173} {"train_loss": -4.85245418548584, "global_step": 7289, "epoch": 173} {"train_loss": -4.810304164886475, "global_step": 7290, "epoch": 173} {"train_loss": -4.896011829376221, "global_step": 7291, "epoch": 173} {"train_loss": -4.851740837097168, "global_step": 7292, "epoch": 173} {"train_loss": -4.901236534118652, "global_step": 7293, "epoch": 173} {"train_loss": -4.972148418426514, "global_step": 7294, "epoch": 173} {"train_loss": -5.127905368804932, "global_step": 7295, "epoch": 173} {"train_loss": -4.953902721405029, "global_step": 7296, "epoch": 173} {"train_loss": -4.928036212921143, "global_step": 7297, "epoch": 173} {"train_loss": -4.972585678100586, "global_step": 7298, "epoch": 173} {"train_loss": -4.916004657745361, "global_step": 7299, "epoch": 173} {"train_loss": -5.095798492431641, "global_step": 7300, "epoch": 173} {"train_loss": -4.8086042404174805, "global_step": 7301, "epoch": 173} {"train_loss": -4.953325271606445, "global_step": 7302, "epoch": 173} {"train_loss": -5.039916515350342, "global_step": 7303, "epoch": 173} {"train_loss": -4.877180576324463, "global_step": 7304, "epoch": 173} {"train_loss": -4.97908353805542, "global_step": 7305, "epoch": 173} {"train_loss": -4.898934364318848, "global_step": 7306, "epoch": 173} {"train_loss": -4.901192233676002, "global_step": 7307, "epoch": 173, "val_loss": 75324.578125} {"train_loss": -4.916197299957275, "global_step": 7308, "epoch": 174} {"train_loss": -4.984140396118164, "global_step": 7309, "epoch": 174} {"train_loss": -4.999058246612549, "global_step": 7310, "epoch": 174} {"train_loss": -4.915818214416504, "global_step": 7311, "epoch": 174} {"train_loss": -4.991753101348877, "global_step": 7312, "epoch": 174} {"train_loss": -4.850975036621094, "global_step": 7313, "epoch": 174} {"train_loss": -5.006192207336426, "global_step": 7314, "epoch": 174} {"train_loss": -5.073436737060547, "global_step": 7315, "epoch": 174} {"train_loss": -4.845609664916992, "global_step": 7316, "epoch": 174} {"train_loss": -4.940651893615723, "global_step": 7317, "epoch": 174} {"train_loss": -4.963273048400879, "global_step": 7318, "epoch": 174} {"train_loss": -5.066638469696045, "global_step": 7319, "epoch": 174} {"train_loss": -4.9093017578125, "global_step": 7320, "epoch": 174} {"train_loss": -4.866489887237549, "global_step": 7321, "epoch": 174} {"train_loss": -4.973764896392822, "global_step": 7322, "epoch": 174} {"train_loss": -5.015439033508301, "global_step": 7323, "epoch": 174} {"train_loss": -4.782855033874512, "global_step": 7324, "epoch": 174} {"train_loss": -4.9374871253967285, "global_step": 7325, "epoch": 174} {"train_loss": -4.644796371459961, "global_step": 7326, "epoch": 174} {"train_loss": -4.586315631866455, "global_step": 7327, "epoch": 174} {"train_loss": -4.568930625915527, "global_step": 7328, "epoch": 174} {"train_loss": -4.802143573760986, "global_step": 7329, "epoch": 174} {"train_loss": -4.890313148498535, "global_step": 7330, "epoch": 174} {"train_loss": -4.500551700592041, "global_step": 7331, "epoch": 174} {"train_loss": -4.903607368469238, "global_step": 7332, "epoch": 174} {"train_loss": -4.83445930480957, "global_step": 7333, "epoch": 174} {"train_loss": -4.883459568023682, "global_step": 7334, "epoch": 174} {"train_loss": -4.756603240966797, "global_step": 7335, "epoch": 174} {"train_loss": -4.901561737060547, "global_step": 7336, "epoch": 174} {"train_loss": -4.914394378662109, "global_step": 7337, "epoch": 174} {"train_loss": -4.751969814300537, "global_step": 7338, "epoch": 174} {"train_loss": -4.848840236663818, "global_step": 7339, "epoch": 174} {"train_loss": -4.861969947814941, "global_step": 7340, "epoch": 174} {"train_loss": -4.803962707519531, "global_step": 7341, "epoch": 174} {"train_loss": -4.844237804412842, "global_step": 7342, "epoch": 174} {"train_loss": -5.010519504547119, "global_step": 7343, "epoch": 174} {"train_loss": -4.820697784423828, "global_step": 7344, "epoch": 174} {"train_loss": -4.857159614562988, "global_step": 7345, "epoch": 174} {"train_loss": -4.866669654846191, "global_step": 7346, "epoch": 174} {"train_loss": -4.835711479187012, "global_step": 7347, "epoch": 174} {"train_loss": -5.060590744018555, "global_step": 7348, "epoch": 174} {"train_loss": -4.872276669456845, "global_step": 7349, "epoch": 174, "val_loss": 74537.359375} {"train_loss": -4.948971748352051, "global_step": 7350, "epoch": 175} {"train_loss": -4.984838485717773, "global_step": 7351, "epoch": 175} {"train_loss": -4.8606977462768555, "global_step": 7352, "epoch": 175} {"train_loss": -4.92228889465332, "global_step": 7353, "epoch": 175} {"train_loss": -4.962430000305176, "global_step": 7354, "epoch": 175} {"train_loss": -4.975998878479004, "global_step": 7355, "epoch": 175} {"train_loss": -4.961297035217285, "global_step": 7356, "epoch": 175} {"train_loss": -5.008671283721924, "global_step": 7357, "epoch": 175} {"train_loss": -4.994779109954834, "global_step": 7358, "epoch": 175} {"train_loss": -4.9183549880981445, "global_step": 7359, "epoch": 175} {"train_loss": -5.028304100036621, "global_step": 7360, "epoch": 175} {"train_loss": -4.974208831787109, "global_step": 7361, "epoch": 175} {"train_loss": -4.712467193603516, "global_step": 7362, "epoch": 175} {"train_loss": -5.100493431091309, "global_step": 7363, "epoch": 175} {"train_loss": -5.089321136474609, "global_step": 7364, "epoch": 175} {"train_loss": -4.842624664306641, "global_step": 7365, "epoch": 175} {"train_loss": -4.780739784240723, "global_step": 7366, "epoch": 175} {"train_loss": -4.93711519241333, "global_step": 7367, "epoch": 175} {"train_loss": -4.938331127166748, "global_step": 7368, "epoch": 175} {"train_loss": -4.916297435760498, "global_step": 7369, "epoch": 175} {"train_loss": -5.04757833480835, "global_step": 7370, "epoch": 175} {"train_loss": -4.903526306152344, "global_step": 7371, "epoch": 175} {"train_loss": -5.0417799949646, "global_step": 7372, "epoch": 175} {"train_loss": -4.909749507904053, "global_step": 7373, "epoch": 175} {"train_loss": -4.684271812438965, "global_step": 7374, "epoch": 175} {"train_loss": -4.984447479248047, "global_step": 7375, "epoch": 175} {"train_loss": -4.880832672119141, "global_step": 7376, "epoch": 175} {"train_loss": -4.878992557525635, "global_step": 7377, "epoch": 175} {"train_loss": -4.846739768981934, "global_step": 7378, "epoch": 175} {"train_loss": -5.007629871368408, "global_step": 7379, "epoch": 175} {"train_loss": -5.050780296325684, "global_step": 7380, "epoch": 175} {"train_loss": -4.866375923156738, "global_step": 7381, "epoch": 175} {"train_loss": -5.038115501403809, "global_step": 7382, "epoch": 175} {"train_loss": -4.896900653839111, "global_step": 7383, "epoch": 175} {"train_loss": -4.874020576477051, "global_step": 7384, "epoch": 175} {"train_loss": -4.9090070724487305, "global_step": 7385, "epoch": 175} {"train_loss": -5.053485870361328, "global_step": 7386, "epoch": 175} {"train_loss": -4.914214611053467, "global_step": 7387, "epoch": 175} {"train_loss": -4.995920181274414, "global_step": 7388, "epoch": 175} {"train_loss": -4.946931838989258, "global_step": 7389, "epoch": 175} {"train_loss": -5.075848579406738, "global_step": 7390, "epoch": 175} {"train_loss": -4.9449365593138195, "global_step": 7391, "epoch": 175, "val_loss": 74678.421875} {"train_loss": -5.016948223114014, "global_step": 7392, "epoch": 176} {"train_loss": -4.958741188049316, "global_step": 7393, "epoch": 176} {"train_loss": -5.016867160797119, "global_step": 7394, "epoch": 176} {"train_loss": -4.898146629333496, "global_step": 7395, "epoch": 176} {"train_loss": -4.917085647583008, "global_step": 7396, "epoch": 176} {"train_loss": -4.781242370605469, "global_step": 7397, "epoch": 176} {"train_loss": -4.713832378387451, "global_step": 7398, "epoch": 176} {"train_loss": -4.769112586975098, "global_step": 7399, "epoch": 176} {"train_loss": -5.017978668212891, "global_step": 7400, "epoch": 176} {"train_loss": -5.048077583312988, "global_step": 7401, "epoch": 176} {"train_loss": -4.852720737457275, "global_step": 7402, "epoch": 176} {"train_loss": -4.86243200302124, "global_step": 7403, "epoch": 176} {"train_loss": -4.8851213455200195, "global_step": 7404, "epoch": 176} {"train_loss": -4.978588104248047, "global_step": 7405, "epoch": 176} {"train_loss": -4.91242790222168, "global_step": 7406, "epoch": 176} {"train_loss": -5.024519920349121, "global_step": 7407, "epoch": 176} {"train_loss": -4.720276832580566, "global_step": 7408, "epoch": 176} {"train_loss": -5.00838041305542, "global_step": 7409, "epoch": 176} {"train_loss": -4.89027214050293, "global_step": 7410, "epoch": 176} {"train_loss": -4.829827785491943, "global_step": 7411, "epoch": 176} {"train_loss": -4.916171073913574, "global_step": 7412, "epoch": 176} {"train_loss": -4.908409118652344, "global_step": 7413, "epoch": 176} {"train_loss": -4.917525291442871, "global_step": 7414, "epoch": 176} {"train_loss": -4.888047695159912, "global_step": 7415, "epoch": 176} {"train_loss": -4.867793560028076, "global_step": 7416, "epoch": 176} {"train_loss": -4.909732341766357, "global_step": 7417, "epoch": 176} {"train_loss": -4.941668510437012, "global_step": 7418, "epoch": 176} {"train_loss": -4.963181495666504, "global_step": 7419, "epoch": 176} {"train_loss": -4.985892295837402, "global_step": 7420, "epoch": 176} {"train_loss": -4.967944622039795, "global_step": 7421, "epoch": 176} {"train_loss": -4.839413166046143, "global_step": 7422, "epoch": 176} {"train_loss": -5.068079948425293, "global_step": 7423, "epoch": 176} {"train_loss": -4.954556941986084, "global_step": 7424, "epoch": 176} {"train_loss": -5.023455619812012, "global_step": 7425, "epoch": 176} {"train_loss": -4.926285743713379, "global_step": 7426, "epoch": 176} {"train_loss": -4.805225372314453, "global_step": 7427, "epoch": 176} {"train_loss": -4.889010906219482, "global_step": 7428, "epoch": 176} {"train_loss": -4.92861270904541, "global_step": 7429, "epoch": 176} {"train_loss": -4.9532856941223145, "global_step": 7430, "epoch": 176} {"train_loss": -4.769323825836182, "global_step": 7431, "epoch": 176} {"train_loss": -4.920143127441406, "global_step": 7432, "epoch": 176} {"train_loss": -4.914597227459862, "global_step": 7433, "epoch": 176, "val_loss": 75223.796875} {"train_loss": -4.896780014038086, "global_step": 7434, "epoch": 177} {"train_loss": -4.699582099914551, "global_step": 7435, "epoch": 177} {"train_loss": -4.950965881347656, "global_step": 7436, "epoch": 177} {"train_loss": -4.890195846557617, "global_step": 7437, "epoch": 177} {"train_loss": -5.084165096282959, "global_step": 7438, "epoch": 177} {"train_loss": -4.654153823852539, "global_step": 7439, "epoch": 177} {"train_loss": -5.042328834533691, "global_step": 7440, "epoch": 177} {"train_loss": -4.998570919036865, "global_step": 7441, "epoch": 177} {"train_loss": -4.687989234924316, "global_step": 7442, "epoch": 177} {"train_loss": -4.822220802307129, "global_step": 7443, "epoch": 177} {"train_loss": -4.921741485595703, "global_step": 7444, "epoch": 177} {"train_loss": -4.834528923034668, "global_step": 7445, "epoch": 177} {"train_loss": -4.890862941741943, "global_step": 7446, "epoch": 177} {"train_loss": -4.855133056640625, "global_step": 7447, "epoch": 177} {"train_loss": -4.821444511413574, "global_step": 7448, "epoch": 177} {"train_loss": -4.961291790008545, "global_step": 7449, "epoch": 177} {"train_loss": -4.815187454223633, "global_step": 7450, "epoch": 177} {"train_loss": -4.986623764038086, "global_step": 7451, "epoch": 177} {"train_loss": -4.917416095733643, "global_step": 7452, "epoch": 177} {"train_loss": -4.869197845458984, "global_step": 7453, "epoch": 177} {"train_loss": -4.799277305603027, "global_step": 7454, "epoch": 177} {"train_loss": -5.038686752319336, "global_step": 7455, "epoch": 177} {"train_loss": -4.7793426513671875, "global_step": 7456, "epoch": 177} {"train_loss": -4.808889389038086, "global_step": 7457, "epoch": 177} {"train_loss": -4.862015724182129, "global_step": 7458, "epoch": 177} {"train_loss": -4.783542156219482, "global_step": 7459, "epoch": 177} {"train_loss": -4.899147987365723, "global_step": 7460, "epoch": 177} {"train_loss": -5.018598556518555, "global_step": 7461, "epoch": 177} {"train_loss": -4.958902359008789, "global_step": 7462, "epoch": 177} {"train_loss": -4.864847183227539, "global_step": 7463, "epoch": 177} {"train_loss": -4.960705280303955, "global_step": 7464, "epoch": 177} {"train_loss": -4.903122901916504, "global_step": 7465, "epoch": 177} {"train_loss": -4.9874677658081055, "global_step": 7466, "epoch": 177} {"train_loss": -4.8978400230407715, "global_step": 7467, "epoch": 177} {"train_loss": -4.979379177093506, "global_step": 7468, "epoch": 177} {"train_loss": -4.972424030303955, "global_step": 7469, "epoch": 177} {"train_loss": -4.9265265464782715, "global_step": 7470, "epoch": 177} {"train_loss": -4.995777130126953, "global_step": 7471, "epoch": 177} {"train_loss": -5.0185723304748535, "global_step": 7472, "epoch": 177} {"train_loss": -4.909032821655273, "global_step": 7473, "epoch": 177} {"train_loss": -4.897648811340332, "global_step": 7474, "epoch": 177} {"train_loss": -4.899553503308978, "global_step": 7475, "epoch": 177, "val_loss": 74256.109375} {"train_loss": -5.029078483581543, "global_step": 7476, "epoch": 178} {"train_loss": -5.0087971687316895, "global_step": 7477, "epoch": 178} {"train_loss": -4.91740608215332, "global_step": 7478, "epoch": 178} {"train_loss": -4.893340110778809, "global_step": 7479, "epoch": 178} {"train_loss": -4.99741268157959, "global_step": 7480, "epoch": 178} {"train_loss": -5.00578498840332, "global_step": 7481, "epoch": 178} {"train_loss": -4.961739540100098, "global_step": 7482, "epoch": 178} {"train_loss": -4.961721420288086, "global_step": 7483, "epoch": 178} {"train_loss": -4.967093467712402, "global_step": 7484, "epoch": 178} {"train_loss": -4.840034008026123, "global_step": 7485, "epoch": 178} {"train_loss": -4.802868366241455, "global_step": 7486, "epoch": 178} {"train_loss": -4.840450286865234, "global_step": 7487, "epoch": 178} {"train_loss": -4.9014997482299805, "global_step": 7488, "epoch": 178} {"train_loss": -4.864696025848389, "global_step": 7489, "epoch": 178} {"train_loss": -4.912747383117676, "global_step": 7490, "epoch": 178} {"train_loss": -4.787386894226074, "global_step": 7491, "epoch": 178} {"train_loss": -4.736954689025879, "global_step": 7492, "epoch": 178} {"train_loss": -4.97393274307251, "global_step": 7493, "epoch": 178} {"train_loss": -4.849558353424072, "global_step": 7494, "epoch": 178} {"train_loss": -4.828961372375488, "global_step": 7495, "epoch": 178} {"train_loss": -4.824333667755127, "global_step": 7496, "epoch": 178} {"train_loss": -4.976850986480713, "global_step": 7497, "epoch": 178} {"train_loss": -4.931427955627441, "global_step": 7498, "epoch": 178} {"train_loss": -4.77590799331665, "global_step": 7499, "epoch": 178} {"train_loss": -4.9350175857543945, "global_step": 7500, "epoch": 178} {"train_loss": -4.895710468292236, "global_step": 7501, "epoch": 178} {"train_loss": -5.021145820617676, "global_step": 7502, "epoch": 178} {"train_loss": -5.041446685791016, "global_step": 7503, "epoch": 178} {"train_loss": -4.8895440101623535, "global_step": 7504, "epoch": 178} {"train_loss": -4.919712066650391, "global_step": 7505, "epoch": 178} {"train_loss": -4.970733642578125, "global_step": 7506, "epoch": 178} {"train_loss": -4.8801984786987305, "global_step": 7507, "epoch": 178} {"train_loss": -4.814478874206543, "global_step": 7508, "epoch": 178} {"train_loss": -5.076643943786621, "global_step": 7509, "epoch": 178} {"train_loss": -4.8529157638549805, "global_step": 7510, "epoch": 178} {"train_loss": -4.9962077140808105, "global_step": 7511, "epoch": 178} {"train_loss": -4.950726509094238, "global_step": 7512, "epoch": 178} {"train_loss": -5.012630462646484, "global_step": 7513, "epoch": 178} {"train_loss": -4.997833251953125, "global_step": 7514, "epoch": 178} {"train_loss": -4.9999589920043945, "global_step": 7515, "epoch": 178} {"train_loss": -4.938699722290039, "global_step": 7516, "epoch": 178} {"train_loss": -4.918889919916789, "global_step": 7517, "epoch": 178, "val_loss": 74706.0859375} {"train_loss": -4.8753767013549805, "global_step": 7518, "epoch": 179} {"train_loss": -4.985934257507324, "global_step": 7519, "epoch": 179} {"train_loss": -4.883791923522949, "global_step": 7520, "epoch": 179} {"train_loss": -4.959339141845703, "global_step": 7521, "epoch": 179} {"train_loss": -4.779111862182617, "global_step": 7522, "epoch": 179} {"train_loss": -4.9594879150390625, "global_step": 7523, "epoch": 179} {"train_loss": -4.84018611907959, "global_step": 7524, "epoch": 179} {"train_loss": -5.060958385467529, "global_step": 7525, "epoch": 179} {"train_loss": -4.907776355743408, "global_step": 7526, "epoch": 179} {"train_loss": -4.937437534332275, "global_step": 7527, "epoch": 179} {"train_loss": -4.939897537231445, "global_step": 7528, "epoch": 179} {"train_loss": -5.017725467681885, "global_step": 7529, "epoch": 179} {"train_loss": -5.03292989730835, "global_step": 7530, "epoch": 179} {"train_loss": -4.9897565841674805, "global_step": 7531, "epoch": 179} {"train_loss": -4.970456123352051, "global_step": 7532, "epoch": 179} {"train_loss": -5.013241767883301, "global_step": 7533, "epoch": 179} {"train_loss": -5.067929744720459, "global_step": 7534, "epoch": 179} {"train_loss": -4.868326187133789, "global_step": 7535, "epoch": 179} {"train_loss": -5.022356033325195, "global_step": 7536, "epoch": 179} {"train_loss": -4.998128890991211, "global_step": 7537, "epoch": 179} {"train_loss": -4.927360534667969, "global_step": 7538, "epoch": 179} {"train_loss": -4.794191360473633, "global_step": 7539, "epoch": 179} {"train_loss": -4.849124908447266, "global_step": 7540, "epoch": 179} {"train_loss": -4.8177056312561035, "global_step": 7541, "epoch": 179} {"train_loss": -4.946977615356445, "global_step": 7542, "epoch": 179} {"train_loss": -4.694217681884766, "global_step": 7543, "epoch": 179} {"train_loss": -4.87104606628418, "global_step": 7544, "epoch": 179} {"train_loss": -5.033283233642578, "global_step": 7545, "epoch": 179} {"train_loss": -4.839308261871338, "global_step": 7546, "epoch": 179} {"train_loss": -4.853368282318115, "global_step": 7547, "epoch": 179} {"train_loss": -4.863266944885254, "global_step": 7548, "epoch": 179} {"train_loss": -5.058698654174805, "global_step": 7549, "epoch": 179} {"train_loss": -4.958362579345703, "global_step": 7550, "epoch": 179} {"train_loss": -4.780605316162109, "global_step": 7551, "epoch": 179} {"train_loss": -4.8705339431762695, "global_step": 7552, "epoch": 179} {"train_loss": -4.781447410583496, "global_step": 7553, "epoch": 179} {"train_loss": -4.899377822875977, "global_step": 7554, "epoch": 179} {"train_loss": -5.05061149597168, "global_step": 7555, "epoch": 179} {"train_loss": -4.9488091468811035, "global_step": 7556, "epoch": 179} {"train_loss": -4.793127536773682, "global_step": 7557, "epoch": 179} {"train_loss": -4.951979637145996, "global_step": 7558, "epoch": 179} {"train_loss": -4.916914769581386, "global_step": 7559, "epoch": 179, "val_loss": 73785.8046875} {"train_loss": -4.955574035644531, "global_step": 7560, "epoch": 180} {"train_loss": -4.94288969039917, "global_step": 7561, "epoch": 180} {"train_loss": -4.939887046813965, "global_step": 7562, "epoch": 180} {"train_loss": -4.836671352386475, "global_step": 7563, "epoch": 180} {"train_loss": -4.936146259307861, "global_step": 7564, "epoch": 180} {"train_loss": -4.868570327758789, "global_step": 7565, "epoch": 180} {"train_loss": -4.736091613769531, "global_step": 7566, "epoch": 180} {"train_loss": -4.912820816040039, "global_step": 7567, "epoch": 180} {"train_loss": -4.946706771850586, "global_step": 7568, "epoch": 180} {"train_loss": -4.736122131347656, "global_step": 7569, "epoch": 180} {"train_loss": -5.0559916496276855, "global_step": 7570, "epoch": 180} {"train_loss": -4.980358600616455, "global_step": 7571, "epoch": 180} {"train_loss": -4.9780049324035645, "global_step": 7572, "epoch": 180} {"train_loss": -4.937463760375977, "global_step": 7573, "epoch": 180} {"train_loss": -5.061710357666016, "global_step": 7574, "epoch": 180} {"train_loss": -5.015883922576904, "global_step": 7575, "epoch": 180} {"train_loss": -4.944409370422363, "global_step": 7576, "epoch": 180} {"train_loss": -4.9495134353637695, "global_step": 7577, "epoch": 180} {"train_loss": -5.028983116149902, "global_step": 7578, "epoch": 180} {"train_loss": -5.0098490715026855, "global_step": 7579, "epoch": 180} {"train_loss": -4.897939205169678, "global_step": 7580, "epoch": 180} {"train_loss": -4.955630779266357, "global_step": 7581, "epoch": 180} {"train_loss": -4.972018241882324, "global_step": 7582, "epoch": 180} {"train_loss": -5.050797462463379, "global_step": 7583, "epoch": 180} {"train_loss": -4.905163764953613, "global_step": 7584, "epoch": 180} {"train_loss": -4.882383346557617, "global_step": 7585, "epoch": 180} {"train_loss": -4.890033721923828, "global_step": 7586, "epoch": 180} {"train_loss": -4.928532600402832, "global_step": 7587, "epoch": 180} {"train_loss": -5.068572044372559, "global_step": 7588, "epoch": 180} {"train_loss": -4.860311985015869, "global_step": 7589, "epoch": 180} {"train_loss": -4.9478559494018555, "global_step": 7590, "epoch": 180} {"train_loss": -4.942893981933594, "global_step": 7591, "epoch": 180} {"train_loss": -4.984012603759766, "global_step": 7592, "epoch": 180} {"train_loss": -5.006170272827148, "global_step": 7593, "epoch": 180} {"train_loss": -5.02844762802124, "global_step": 7594, "epoch": 180} {"train_loss": -4.92057991027832, "global_step": 7595, "epoch": 180} {"train_loss": -4.72096061706543, "global_step": 7596, "epoch": 180} {"train_loss": -4.890043258666992, "global_step": 7597, "epoch": 180} {"train_loss": -4.973298072814941, "global_step": 7598, "epoch": 180} {"train_loss": -4.89592981338501, "global_step": 7599, "epoch": 180} {"train_loss": -4.734264373779297, "global_step": 7600, "epoch": 180} {"train_loss": -4.931230806169056, "global_step": 7601, "epoch": 180, "val_loss": 74097.6171875} {"train_loss": -4.908878326416016, "global_step": 7602, "epoch": 181} {"train_loss": -4.887785911560059, "global_step": 7603, "epoch": 181} {"train_loss": -4.961249351501465, "global_step": 7604, "epoch": 181} {"train_loss": -4.870541572570801, "global_step": 7605, "epoch": 181} {"train_loss": -4.895493507385254, "global_step": 7606, "epoch": 181} {"train_loss": -4.970739364624023, "global_step": 7607, "epoch": 181} {"train_loss": -4.822405815124512, "global_step": 7608, "epoch": 181} {"train_loss": -4.955521583557129, "global_step": 7609, "epoch": 181} {"train_loss": -5.002889156341553, "global_step": 7610, "epoch": 181} {"train_loss": -4.960593223571777, "global_step": 7611, "epoch": 181} {"train_loss": -4.989624500274658, "global_step": 7612, "epoch": 181} {"train_loss": -4.956056594848633, "global_step": 7613, "epoch": 181} {"train_loss": -4.997092247009277, "global_step": 7614, "epoch": 181} {"train_loss": -5.071234703063965, "global_step": 7615, "epoch": 181} {"train_loss": -5.027477264404297, "global_step": 7616, "epoch": 181} {"train_loss": -4.851744651794434, "global_step": 7617, "epoch": 181} {"train_loss": -4.890883445739746, "global_step": 7618, "epoch": 181} {"train_loss": -4.926784515380859, "global_step": 7619, "epoch": 181} {"train_loss": -4.850383758544922, "global_step": 7620, "epoch": 181} {"train_loss": -4.956900596618652, "global_step": 7621, "epoch": 181} {"train_loss": -5.096798896789551, "global_step": 7622, "epoch": 181} {"train_loss": -5.010370254516602, "global_step": 7623, "epoch": 181} {"train_loss": -4.952028274536133, "global_step": 7624, "epoch": 181} {"train_loss": -4.9239501953125, "global_step": 7625, "epoch": 181} {"train_loss": -5.046148777008057, "global_step": 7626, "epoch": 181} {"train_loss": -5.016236305236816, "global_step": 7627, "epoch": 181} {"train_loss": -4.976184368133545, "global_step": 7628, "epoch": 181} {"train_loss": -4.929682731628418, "global_step": 7629, "epoch": 181} {"train_loss": -5.08002233505249, "global_step": 7630, "epoch": 181} {"train_loss": -5.15675687789917, "global_step": 7631, "epoch": 181} {"train_loss": -5.135125160217285, "global_step": 7632, "epoch": 181} {"train_loss": -5.032196044921875, "global_step": 7633, "epoch": 181} {"train_loss": -4.931678771972656, "global_step": 7634, "epoch": 181} {"train_loss": -4.825831890106201, "global_step": 7635, "epoch": 181} {"train_loss": -5.0724663734436035, "global_step": 7636, "epoch": 181} {"train_loss": -5.016782283782959, "global_step": 7637, "epoch": 181} {"train_loss": -4.776606559753418, "global_step": 7638, "epoch": 181} {"train_loss": -4.70310640335083, "global_step": 7639, "epoch": 181} {"train_loss": -4.8210530281066895, "global_step": 7640, "epoch": 181} {"train_loss": -4.837532997131348, "global_step": 7641, "epoch": 181} {"train_loss": -4.779972076416016, "global_step": 7642, "epoch": 181} {"train_loss": -4.947188161668324, "global_step": 7643, "epoch": 181, "val_loss": 74310.4453125} {"train_loss": -5.041839599609375, "global_step": 7644, "epoch": 182} {"train_loss": -4.759714126586914, "global_step": 7645, "epoch": 182} {"train_loss": -4.869040489196777, "global_step": 7646, "epoch": 182} {"train_loss": -4.958254814147949, "global_step": 7647, "epoch": 182} {"train_loss": -4.929448127746582, "global_step": 7648, "epoch": 182} {"train_loss": -4.878129959106445, "global_step": 7649, "epoch": 182} {"train_loss": -4.929942607879639, "global_step": 7650, "epoch": 182} {"train_loss": -5.036953926086426, "global_step": 7651, "epoch": 182} {"train_loss": -4.8243536949157715, "global_step": 7652, "epoch": 182} {"train_loss": -4.872532844543457, "global_step": 7653, "epoch": 182} {"train_loss": -5.053041458129883, "global_step": 7654, "epoch": 182} {"train_loss": -4.845173358917236, "global_step": 7655, "epoch": 182} {"train_loss": -5.039357662200928, "global_step": 7656, "epoch": 182} {"train_loss": -4.9602460861206055, "global_step": 7657, "epoch": 182} {"train_loss": -5.023089408874512, "global_step": 7658, "epoch": 182} {"train_loss": -4.936533451080322, "global_step": 7659, "epoch": 182} {"train_loss": -4.884471893310547, "global_step": 7660, "epoch": 182} {"train_loss": -4.948668003082275, "global_step": 7661, "epoch": 182} {"train_loss": -4.902858734130859, "global_step": 7662, "epoch": 182} {"train_loss": -4.874294281005859, "global_step": 7663, "epoch": 182} {"train_loss": -4.9037065505981445, "global_step": 7664, "epoch": 182} {"train_loss": -4.936718940734863, "global_step": 7665, "epoch": 182} {"train_loss": -4.894784927368164, "global_step": 7666, "epoch": 182} {"train_loss": -4.9354400634765625, "global_step": 7667, "epoch": 182} {"train_loss": -4.955996990203857, "global_step": 7668, "epoch": 182} {"train_loss": -4.69855260848999, "global_step": 7669, "epoch": 182} {"train_loss": -4.918497085571289, "global_step": 7670, "epoch": 182} {"train_loss": -4.910493850708008, "global_step": 7671, "epoch": 182} {"train_loss": -4.7535319328308105, "global_step": 7672, "epoch": 182} {"train_loss": -4.921623706817627, "global_step": 7673, "epoch": 182} {"train_loss": -4.920295715332031, "global_step": 7674, "epoch": 182} {"train_loss": -4.964069366455078, "global_step": 7675, "epoch": 182} {"train_loss": -4.860337257385254, "global_step": 7676, "epoch": 182} {"train_loss": -4.98834228515625, "global_step": 7677, "epoch": 182} {"train_loss": -4.899540424346924, "global_step": 7678, "epoch": 182} {"train_loss": -4.93330192565918, "global_step": 7679, "epoch": 182} {"train_loss": -4.974386692047119, "global_step": 7680, "epoch": 182} {"train_loss": -4.936287879943848, "global_step": 7681, "epoch": 182} {"train_loss": -4.972237586975098, "global_step": 7682, "epoch": 182} {"train_loss": -5.121148109436035, "global_step": 7683, "epoch": 182} {"train_loss": -4.868902206420898, "global_step": 7684, "epoch": 182} {"train_loss": -4.922178938275292, "global_step": 7685, "epoch": 182, "val_loss": 73513.125} {"train_loss": -5.0069732666015625, "global_step": 7686, "epoch": 183} {"train_loss": -4.933862686157227, "global_step": 7687, "epoch": 183} {"train_loss": -4.89468240737915, "global_step": 7688, "epoch": 183} {"train_loss": -5.079543113708496, "global_step": 7689, "epoch": 183} {"train_loss": -4.979862689971924, "global_step": 7690, "epoch": 183} {"train_loss": -5.06307315826416, "global_step": 7691, "epoch": 183} {"train_loss": -4.971959114074707, "global_step": 7692, "epoch": 183} {"train_loss": -4.950102806091309, "global_step": 7693, "epoch": 183} {"train_loss": -4.903286457061768, "global_step": 7694, "epoch": 183} {"train_loss": -4.993928909301758, "global_step": 7695, "epoch": 183} {"train_loss": -5.063579082489014, "global_step": 7696, "epoch": 183} {"train_loss": -4.966322898864746, "global_step": 7697, "epoch": 183} {"train_loss": -4.900793552398682, "global_step": 7698, "epoch": 183} {"train_loss": -5.041292190551758, "global_step": 7699, "epoch": 183} {"train_loss": -4.924574851989746, "global_step": 7700, "epoch": 183} {"train_loss": -4.953218460083008, "global_step": 7701, "epoch": 183} {"train_loss": -4.901874542236328, "global_step": 7702, "epoch": 183} {"train_loss": -4.945135593414307, "global_step": 7703, "epoch": 183} {"train_loss": -4.899174690246582, "global_step": 7704, "epoch": 183} {"train_loss": -4.926094055175781, "global_step": 7705, "epoch": 183} {"train_loss": -4.895207405090332, "global_step": 7706, "epoch": 183} {"train_loss": -4.756381034851074, "global_step": 7707, "epoch": 183} {"train_loss": -4.9229536056518555, "global_step": 7708, "epoch": 183} {"train_loss": -4.923035621643066, "global_step": 7709, "epoch": 183} {"train_loss": -4.895377159118652, "global_step": 7710, "epoch": 183} {"train_loss": -4.890354156494141, "global_step": 7711, "epoch": 183} {"train_loss": -5.062238693237305, "global_step": 7712, "epoch": 183} {"train_loss": -4.917984962463379, "global_step": 7713, "epoch": 183} {"train_loss": -4.803430080413818, "global_step": 7714, "epoch": 183} {"train_loss": -5.026076793670654, "global_step": 7715, "epoch": 183} {"train_loss": -5.035747528076172, "global_step": 7716, "epoch": 183} {"train_loss": -4.916286945343018, "global_step": 7717, "epoch": 183} {"train_loss": -4.967813491821289, "global_step": 7718, "epoch": 183} {"train_loss": -4.977606773376465, "global_step": 7719, "epoch": 183} {"train_loss": -4.898106575012207, "global_step": 7720, "epoch": 183} {"train_loss": -5.0483503341674805, "global_step": 7721, "epoch": 183} {"train_loss": -5.0261006355285645, "global_step": 7722, "epoch": 183} {"train_loss": -4.933927059173584, "global_step": 7723, "epoch": 183} {"train_loss": -5.006731033325195, "global_step": 7724, "epoch": 183} {"train_loss": -4.9629716873168945, "global_step": 7725, "epoch": 183} {"train_loss": -4.911419868469238, "global_step": 7726, "epoch": 183} {"train_loss": -4.952969664619083, "global_step": 7727, "epoch": 183, "val_loss": 74214.390625} {"train_loss": -4.879549026489258, "global_step": 7728, "epoch": 184} {"train_loss": -4.996711730957031, "global_step": 7729, "epoch": 184} {"train_loss": -5.046424388885498, "global_step": 7730, "epoch": 184} {"train_loss": -4.95201301574707, "global_step": 7731, "epoch": 184} {"train_loss": -4.664181709289551, "global_step": 7732, "epoch": 184} {"train_loss": -4.8603692054748535, "global_step": 7733, "epoch": 184} {"train_loss": -4.813295364379883, "global_step": 7734, "epoch": 184} {"train_loss": -4.876068115234375, "global_step": 7735, "epoch": 184} {"train_loss": -4.692058563232422, "global_step": 7736, "epoch": 184} {"train_loss": -4.896548748016357, "global_step": 7737, "epoch": 184} {"train_loss": -5.028079032897949, "global_step": 7738, "epoch": 184} {"train_loss": -5.0979461669921875, "global_step": 7739, "epoch": 184} {"train_loss": -4.931142807006836, "global_step": 7740, "epoch": 184} {"train_loss": -4.934508323669434, "global_step": 7741, "epoch": 184} {"train_loss": -4.990745544433594, "global_step": 7742, "epoch": 184} {"train_loss": -4.998316764831543, "global_step": 7743, "epoch": 184} {"train_loss": -5.043275833129883, "global_step": 7744, "epoch": 184} {"train_loss": -4.920441627502441, "global_step": 7745, "epoch": 184} {"train_loss": -4.863527774810791, "global_step": 7746, "epoch": 184} {"train_loss": -4.909173965454102, "global_step": 7747, "epoch": 184} {"train_loss": -4.99696159362793, "global_step": 7748, "epoch": 184} {"train_loss": -4.765761375427246, "global_step": 7749, "epoch": 184} {"train_loss": -4.864637851715088, "global_step": 7750, "epoch": 184} {"train_loss": -4.991115093231201, "global_step": 7751, "epoch": 184} {"train_loss": -4.757388591766357, "global_step": 7752, "epoch": 184} {"train_loss": -4.9309892654418945, "global_step": 7753, "epoch": 184} {"train_loss": -4.844287872314453, "global_step": 7754, "epoch": 184} {"train_loss": -4.79174280166626, "global_step": 7755, "epoch": 184} {"train_loss": -5.010666847229004, "global_step": 7756, "epoch": 184} {"train_loss": -4.784927845001221, "global_step": 7757, "epoch": 184} {"train_loss": -4.956094741821289, "global_step": 7758, "epoch": 184} {"train_loss": -4.871291637420654, "global_step": 7759, "epoch": 184} {"train_loss": -4.778559684753418, "global_step": 7760, "epoch": 184} {"train_loss": -4.816771030426025, "global_step": 7761, "epoch": 184} {"train_loss": -4.877875328063965, "global_step": 7762, "epoch": 184} {"train_loss": -4.966192722320557, "global_step": 7763, "epoch": 184} {"train_loss": -4.772128105163574, "global_step": 7764, "epoch": 184} {"train_loss": -5.025510787963867, "global_step": 7765, "epoch": 184} {"train_loss": -4.944846153259277, "global_step": 7766, "epoch": 184} {"train_loss": -5.007076263427734, "global_step": 7767, "epoch": 184} {"train_loss": -4.950979709625244, "global_step": 7768, "epoch": 184} {"train_loss": -4.9039077418191095, "global_step": 7769, "epoch": 184, "val_loss": 73562.234375} {"train_loss": -4.933385848999023, "global_step": 7770, "epoch": 185} {"train_loss": -4.8642377853393555, "global_step": 7771, "epoch": 185} {"train_loss": -4.996249198913574, "global_step": 7772, "epoch": 185} {"train_loss": -5.014690399169922, "global_step": 7773, "epoch": 185} {"train_loss": -4.940828800201416, "global_step": 7774, "epoch": 185} {"train_loss": -4.92710018157959, "global_step": 7775, "epoch": 185} {"train_loss": -4.951443195343018, "global_step": 7776, "epoch": 185} {"train_loss": -4.870003700256348, "global_step": 7777, "epoch": 185} {"train_loss": -4.853895664215088, "global_step": 7778, "epoch": 185} {"train_loss": -4.942996025085449, "global_step": 7779, "epoch": 185} {"train_loss": -5.12764310836792, "global_step": 7780, "epoch": 185} {"train_loss": -5.04163932800293, "global_step": 7781, "epoch": 185} {"train_loss": -5.031689643859863, "global_step": 7782, "epoch": 185} {"train_loss": -4.987311363220215, "global_step": 7783, "epoch": 185} {"train_loss": -5.061446189880371, "global_step": 7784, "epoch": 185} {"train_loss": -4.984745979309082, "global_step": 7785, "epoch": 185} {"train_loss": -4.880825996398926, "global_step": 7786, "epoch": 185} {"train_loss": -4.889129638671875, "global_step": 7787, "epoch": 185} {"train_loss": -5.088104248046875, "global_step": 7788, "epoch": 185} {"train_loss": -5.056031227111816, "global_step": 7789, "epoch": 185} {"train_loss": -4.965910911560059, "global_step": 7790, "epoch": 185} {"train_loss": -4.896676540374756, "global_step": 7791, "epoch": 185} {"train_loss": -4.935194969177246, "global_step": 7792, "epoch": 185} {"train_loss": -4.775815963745117, "global_step": 7793, "epoch": 185} {"train_loss": -4.895654201507568, "global_step": 7794, "epoch": 185} {"train_loss": -5.076084613800049, "global_step": 7795, "epoch": 185} {"train_loss": -4.8086371421813965, "global_step": 7796, "epoch": 185} {"train_loss": -4.976213455200195, "global_step": 7797, "epoch": 185} {"train_loss": -4.9353790283203125, "global_step": 7798, "epoch": 185} {"train_loss": -5.007821083068848, "global_step": 7799, "epoch": 185} {"train_loss": -5.001129150390625, "global_step": 7800, "epoch": 185} {"train_loss": -4.7704362869262695, "global_step": 7801, "epoch": 185} {"train_loss": -5.049213409423828, "global_step": 7802, "epoch": 185} {"train_loss": -4.892704010009766, "global_step": 7803, "epoch": 185} {"train_loss": -5.01495361328125, "global_step": 7804, "epoch": 185} {"train_loss": -4.868899345397949, "global_step": 7805, "epoch": 185} {"train_loss": -5.0393781661987305, "global_step": 7806, "epoch": 185} {"train_loss": -4.965147495269775, "global_step": 7807, "epoch": 185} {"train_loss": -5.026318550109863, "global_step": 7808, "epoch": 185} {"train_loss": -5.100610733032227, "global_step": 7809, "epoch": 185} {"train_loss": -4.982858180999756, "global_step": 7810, "epoch": 185} {"train_loss": -4.960020122073946, "global_step": 7811, "epoch": 185, "val_loss": 74081.90625} {"train_loss": -4.939913749694824, "global_step": 7812, "epoch": 186} {"train_loss": -5.002885341644287, "global_step": 7813, "epoch": 186} {"train_loss": -4.855201721191406, "global_step": 7814, "epoch": 186} {"train_loss": -4.967757225036621, "global_step": 7815, "epoch": 186} {"train_loss": -4.96169376373291, "global_step": 7816, "epoch": 186} {"train_loss": -4.9029645919799805, "global_step": 7817, "epoch": 186} {"train_loss": -5.032957553863525, "global_step": 7818, "epoch": 186} {"train_loss": -5.080816268920898, "global_step": 7819, "epoch": 186} {"train_loss": -4.982082366943359, "global_step": 7820, "epoch": 186} {"train_loss": -4.948868751525879, "global_step": 7821, "epoch": 186} {"train_loss": -5.000144958496094, "global_step": 7822, "epoch": 186} {"train_loss": -5.12397575378418, "global_step": 7823, "epoch": 186} {"train_loss": -4.959628105163574, "global_step": 7824, "epoch": 186} {"train_loss": -4.836385250091553, "global_step": 7825, "epoch": 186} {"train_loss": -4.969034194946289, "global_step": 7826, "epoch": 186} {"train_loss": -4.976280689239502, "global_step": 7827, "epoch": 186} {"train_loss": -5.080711841583252, "global_step": 7828, "epoch": 186} {"train_loss": -5.0074639320373535, "global_step": 7829, "epoch": 186} {"train_loss": -4.657215118408203, "global_step": 7830, "epoch": 186} {"train_loss": -4.8730363845825195, "global_step": 7831, "epoch": 186} {"train_loss": -4.949429512023926, "global_step": 7832, "epoch": 186} {"train_loss": -5.103046417236328, "global_step": 7833, "epoch": 186} {"train_loss": -4.999963283538818, "global_step": 7834, "epoch": 186} {"train_loss": -4.970232963562012, "global_step": 7835, "epoch": 186} {"train_loss": -4.9647932052612305, "global_step": 7836, "epoch": 186} {"train_loss": -4.967120170593262, "global_step": 7837, "epoch": 186} {"train_loss": -5.174612045288086, "global_step": 7838, "epoch": 186} {"train_loss": -4.951512336730957, "global_step": 7839, "epoch": 186} {"train_loss": -4.831782341003418, "global_step": 7840, "epoch": 186} {"train_loss": -5.016902923583984, "global_step": 7841, "epoch": 186} {"train_loss": -4.917452812194824, "global_step": 7842, "epoch": 186} {"train_loss": -4.80535888671875, "global_step": 7843, "epoch": 186} {"train_loss": -4.903827667236328, "global_step": 7844, "epoch": 186} {"train_loss": -5.06474494934082, "global_step": 7845, "epoch": 186} {"train_loss": -5.033634662628174, "global_step": 7846, "epoch": 186} {"train_loss": -5.123142242431641, "global_step": 7847, "epoch": 186} {"train_loss": -4.942873001098633, "global_step": 7848, "epoch": 186} {"train_loss": -4.879426002502441, "global_step": 7849, "epoch": 186} {"train_loss": -4.727096080780029, "global_step": 7850, "epoch": 186} {"train_loss": -4.891325950622559, "global_step": 7851, "epoch": 186} {"train_loss": -4.993285179138184, "global_step": 7852, "epoch": 186} {"train_loss": -4.957248880749657, "global_step": 7853, "epoch": 186, "val_loss": 75896.6953125} {"train_loss": -4.646232604980469, "global_step": 7854, "epoch": 187} {"train_loss": -4.796456336975098, "global_step": 7855, "epoch": 187} {"train_loss": -4.891155242919922, "global_step": 7856, "epoch": 187} {"train_loss": -4.819443702697754, "global_step": 7857, "epoch": 187} {"train_loss": -4.799572944641113, "global_step": 7858, "epoch": 187} {"train_loss": -4.9976654052734375, "global_step": 7859, "epoch": 187} {"train_loss": -4.922289848327637, "global_step": 7860, "epoch": 187} {"train_loss": -4.936046600341797, "global_step": 7861, "epoch": 187} {"train_loss": -4.783590793609619, "global_step": 7862, "epoch": 187} {"train_loss": -4.766596794128418, "global_step": 7863, "epoch": 187} {"train_loss": -5.102199554443359, "global_step": 7864, "epoch": 187} {"train_loss": -4.951044082641602, "global_step": 7865, "epoch": 187} {"train_loss": -4.873870372772217, "global_step": 7866, "epoch": 187} {"train_loss": -4.866434097290039, "global_step": 7867, "epoch": 187} {"train_loss": -4.863519191741943, "global_step": 7868, "epoch": 187} {"train_loss": -4.963497161865234, "global_step": 7869, "epoch": 187} {"train_loss": -5.006702423095703, "global_step": 7870, "epoch": 187} {"train_loss": -4.583800792694092, "global_step": 7871, "epoch": 187} {"train_loss": -4.997989654541016, "global_step": 7872, "epoch": 187} {"train_loss": -4.9334869384765625, "global_step": 7873, "epoch": 187} {"train_loss": -4.562099456787109, "global_step": 7874, "epoch": 187} {"train_loss": -4.867072582244873, "global_step": 7875, "epoch": 187} {"train_loss": -4.393399238586426, "global_step": 7876, "epoch": 187} {"train_loss": -4.99951171875, "global_step": 7877, "epoch": 187} {"train_loss": -4.8325653076171875, "global_step": 7878, "epoch": 187} {"train_loss": -4.631796836853027, "global_step": 7879, "epoch": 187} {"train_loss": -4.956151962280273, "global_step": 7880, "epoch": 187} {"train_loss": -4.618783950805664, "global_step": 7881, "epoch": 187} {"train_loss": -4.858911514282227, "global_step": 7882, "epoch": 187} {"train_loss": -4.696331977844238, "global_step": 7883, "epoch": 187} {"train_loss": -4.918941497802734, "global_step": 7884, "epoch": 187} {"train_loss": -4.764178276062012, "global_step": 7885, "epoch": 187} {"train_loss": -4.92362117767334, "global_step": 7886, "epoch": 187} {"train_loss": -4.888974666595459, "global_step": 7887, "epoch": 187} {"train_loss": -4.788814544677734, "global_step": 7888, "epoch": 187} {"train_loss": -4.835846900939941, "global_step": 7889, "epoch": 187} {"train_loss": -4.955365180969238, "global_step": 7890, "epoch": 187} {"train_loss": -4.887739181518555, "global_step": 7891, "epoch": 187} {"train_loss": -4.894990921020508, "global_step": 7892, "epoch": 187} {"train_loss": -5.011223793029785, "global_step": 7893, "epoch": 187} {"train_loss": -4.958562850952148, "global_step": 7894, "epoch": 187} {"train_loss": -4.850672721862793, "global_step": 7895, "epoch": 187, "val_loss": 73472.984375} {"train_loss": -4.877326011657715, "global_step": 7896, "epoch": 188} {"train_loss": -5.054243564605713, "global_step": 7897, "epoch": 188} {"train_loss": -4.866823673248291, "global_step": 7898, "epoch": 188} {"train_loss": -4.897951126098633, "global_step": 7899, "epoch": 188} {"train_loss": -5.029049873352051, "global_step": 7900, "epoch": 188} {"train_loss": -4.926088809967041, "global_step": 7901, "epoch": 188} {"train_loss": -5.103121757507324, "global_step": 7902, "epoch": 188} {"train_loss": -4.914301872253418, "global_step": 7903, "epoch": 188} {"train_loss": -5.037583351135254, "global_step": 7904, "epoch": 188} {"train_loss": -4.774312973022461, "global_step": 7905, "epoch": 188} {"train_loss": -4.983626365661621, "global_step": 7906, "epoch": 188} {"train_loss": -4.934999465942383, "global_step": 7907, "epoch": 188} {"train_loss": -4.979510307312012, "global_step": 7908, "epoch": 188} {"train_loss": -4.903091907501221, "global_step": 7909, "epoch": 188} {"train_loss": -4.978236675262451, "global_step": 7910, "epoch": 188} {"train_loss": -5.106066703796387, "global_step": 7911, "epoch": 188} {"train_loss": -4.923504829406738, "global_step": 7912, "epoch": 188} {"train_loss": -4.876917839050293, "global_step": 7913, "epoch": 188} {"train_loss": -4.87052583694458, "global_step": 7914, "epoch": 188} {"train_loss": -4.831310272216797, "global_step": 7915, "epoch": 188} {"train_loss": -4.9322309494018555, "global_step": 7916, "epoch": 188} {"train_loss": -4.983578205108643, "global_step": 7917, "epoch": 188} {"train_loss": -5.085021018981934, "global_step": 7918, "epoch": 188} {"train_loss": -4.944836616516113, "global_step": 7919, "epoch": 188} {"train_loss": -4.959272861480713, "global_step": 7920, "epoch": 188} {"train_loss": -4.994279861450195, "global_step": 7921, "epoch": 188} {"train_loss": -4.982724189758301, "global_step": 7922, "epoch": 188} {"train_loss": -5.189915657043457, "global_step": 7923, "epoch": 188} {"train_loss": -5.033603668212891, "global_step": 7924, "epoch": 188} {"train_loss": -4.922074317932129, "global_step": 7925, "epoch": 188} {"train_loss": -4.9285054206848145, "global_step": 7926, "epoch": 188} {"train_loss": -4.893640041351318, "global_step": 7927, "epoch": 188} {"train_loss": -5.055222034454346, "global_step": 7928, "epoch": 188} {"train_loss": -4.969738960266113, "global_step": 7929, "epoch": 188} {"train_loss": -5.0955095291137695, "global_step": 7930, "epoch": 188} {"train_loss": -5.145025253295898, "global_step": 7931, "epoch": 188} {"train_loss": -5.071535110473633, "global_step": 7932, "epoch": 188} {"train_loss": -4.975120544433594, "global_step": 7933, "epoch": 188} {"train_loss": -4.784777641296387, "global_step": 7934, "epoch": 188} {"train_loss": -4.8109235763549805, "global_step": 7935, "epoch": 188} {"train_loss": -4.876723289489746, "global_step": 7936, "epoch": 188} {"train_loss": -4.965260721388317, "global_step": 7937, "epoch": 188, "val_loss": 73346.0546875} {"train_loss": -4.983015537261963, "global_step": 7938, "epoch": 189} {"train_loss": -4.774834632873535, "global_step": 7939, "epoch": 189} {"train_loss": -4.818070411682129, "global_step": 7940, "epoch": 189} {"train_loss": -5.109433174133301, "global_step": 7941, "epoch": 189} {"train_loss": -4.938452243804932, "global_step": 7942, "epoch": 189} {"train_loss": -4.848716735839844, "global_step": 7943, "epoch": 189} {"train_loss": -4.99893856048584, "global_step": 7944, "epoch": 189} {"train_loss": -5.05101203918457, "global_step": 7945, "epoch": 189} {"train_loss": -4.885433673858643, "global_step": 7946, "epoch": 189} {"train_loss": -4.9845099449157715, "global_step": 7947, "epoch": 189} {"train_loss": -5.049030303955078, "global_step": 7948, "epoch": 189} {"train_loss": -4.864530563354492, "global_step": 7949, "epoch": 189} {"train_loss": -4.833587646484375, "global_step": 7950, "epoch": 189} {"train_loss": -4.826946258544922, "global_step": 7951, "epoch": 189} {"train_loss": -4.813792705535889, "global_step": 7952, "epoch": 189} {"train_loss": -4.861928939819336, "global_step": 7953, "epoch": 189} {"train_loss": -4.8908209800720215, "global_step": 7954, "epoch": 189} {"train_loss": -4.832900047302246, "global_step": 7955, "epoch": 189} {"train_loss": -4.890869617462158, "global_step": 7956, "epoch": 189} {"train_loss": -4.77359676361084, "global_step": 7957, "epoch": 189} {"train_loss": -5.0228986740112305, "global_step": 7958, "epoch": 189} {"train_loss": -4.875911712646484, "global_step": 7959, "epoch": 189} {"train_loss": -4.640925407409668, "global_step": 7960, "epoch": 189} {"train_loss": -4.768108367919922, "global_step": 7961, "epoch": 189} {"train_loss": -5.072704315185547, "global_step": 7962, "epoch": 189} {"train_loss": -4.81990909576416, "global_step": 7963, "epoch": 189} {"train_loss": -4.870433330535889, "global_step": 7964, "epoch": 189} {"train_loss": -4.923227310180664, "global_step": 7965, "epoch": 189} {"train_loss": -5.100864410400391, "global_step": 7966, "epoch": 189} {"train_loss": -4.789896011352539, "global_step": 7967, "epoch": 189} {"train_loss": -5.078976154327393, "global_step": 7968, "epoch": 189} {"train_loss": -5.099546432495117, "global_step": 7969, "epoch": 189} {"train_loss": -4.841787815093994, "global_step": 7970, "epoch": 189} {"train_loss": -4.884515762329102, "global_step": 7971, "epoch": 189} {"train_loss": -5.0276947021484375, "global_step": 7972, "epoch": 189} {"train_loss": -4.867626667022705, "global_step": 7973, "epoch": 189} {"train_loss": -4.955759048461914, "global_step": 7974, "epoch": 189} {"train_loss": -5.002504348754883, "global_step": 7975, "epoch": 189} {"train_loss": -4.751114368438721, "global_step": 7976, "epoch": 189} {"train_loss": -4.935407638549805, "global_step": 7977, "epoch": 189} {"train_loss": -4.817950248718262, "global_step": 7978, "epoch": 189} {"train_loss": -4.905754475366502, "global_step": 7979, "epoch": 189, "val_loss": 72982.8671875} {"train_loss": -5.010409355163574, "global_step": 7980, "epoch": 190} {"train_loss": -4.937682151794434, "global_step": 7981, "epoch": 190} {"train_loss": -4.769012928009033, "global_step": 7982, "epoch": 190} {"train_loss": -4.879756927490234, "global_step": 7983, "epoch": 190} {"train_loss": -5.036489009857178, "global_step": 7984, "epoch": 190} {"train_loss": -4.784219741821289, "global_step": 7985, "epoch": 190} {"train_loss": -5.053722381591797, "global_step": 7986, "epoch": 190} {"train_loss": -5.083646774291992, "global_step": 7987, "epoch": 190} {"train_loss": -4.953614234924316, "global_step": 7988, "epoch": 190} {"train_loss": -4.894698619842529, "global_step": 7989, "epoch": 190} {"train_loss": -4.789216995239258, "global_step": 7990, "epoch": 190} {"train_loss": -4.9551920890808105, "global_step": 7991, "epoch": 190} {"train_loss": -4.709494113922119, "global_step": 7992, "epoch": 190} {"train_loss": -5.042636871337891, "global_step": 7993, "epoch": 190} {"train_loss": -5.031828880310059, "global_step": 7994, "epoch": 190} {"train_loss": -4.742731094360352, "global_step": 7995, "epoch": 190} {"train_loss": -4.991633415222168, "global_step": 7996, "epoch": 190} {"train_loss": -5.016384601593018, "global_step": 7997, "epoch": 190} {"train_loss": -4.786486625671387, "global_step": 7998, "epoch": 190} {"train_loss": -4.972517013549805, "global_step": 7999, "epoch": 190} {"train_loss": -4.953188896179199, "global_step": 8000, "epoch": 190} {"train_loss": -4.938373565673828, "global_step": 8001, "epoch": 190} {"train_loss": -4.923807621002197, "global_step": 8002, "epoch": 190} {"train_loss": -4.993721961975098, "global_step": 8003, "epoch": 190} {"train_loss": -4.9829792976379395, "global_step": 8004, "epoch": 190} {"train_loss": -4.889766216278076, "global_step": 8005, "epoch": 190} {"train_loss": -4.918262958526611, "global_step": 8006, "epoch": 190} {"train_loss": -4.9614081382751465, "global_step": 8007, "epoch": 190} {"train_loss": -4.970937728881836, "global_step": 8008, "epoch": 190} {"train_loss": -5.074945449829102, "global_step": 8009, "epoch": 190} {"train_loss": -5.059422016143799, "global_step": 8010, "epoch": 190} {"train_loss": -4.815609455108643, "global_step": 8011, "epoch": 190} {"train_loss": -4.9160614013671875, "global_step": 8012, "epoch": 190} {"train_loss": -5.130673885345459, "global_step": 8013, "epoch": 190} {"train_loss": -5.119054794311523, "global_step": 8014, "epoch": 190} {"train_loss": -4.920217514038086, "global_step": 8015, "epoch": 190} {"train_loss": -4.972368240356445, "global_step": 8016, "epoch": 190} {"train_loss": -5.026267051696777, "global_step": 8017, "epoch": 190} {"train_loss": -4.998990535736084, "global_step": 8018, "epoch": 190} {"train_loss": -4.956621170043945, "global_step": 8019, "epoch": 190} {"train_loss": -4.903112411499023, "global_step": 8020, "epoch": 190} {"train_loss": -4.947436673300607, "global_step": 8021, "epoch": 190, "val_loss": 73252.984375} {"train_loss": -4.890875816345215, "global_step": 8022, "epoch": 191} {"train_loss": -4.8739166259765625, "global_step": 8023, "epoch": 191} {"train_loss": -5.101029396057129, "global_step": 8024, "epoch": 191} {"train_loss": -5.047345161437988, "global_step": 8025, "epoch": 191} {"train_loss": -4.952353000640869, "global_step": 8026, "epoch": 191} {"train_loss": -4.948667049407959, "global_step": 8027, "epoch": 191} {"train_loss": -4.8761091232299805, "global_step": 8028, "epoch": 191} {"train_loss": -4.830691337585449, "global_step": 8029, "epoch": 191} {"train_loss": -4.780290603637695, "global_step": 8030, "epoch": 191} {"train_loss": -4.861399173736572, "global_step": 8031, "epoch": 191} {"train_loss": -5.032100677490234, "global_step": 8032, "epoch": 191} {"train_loss": -5.0695648193359375, "global_step": 8033, "epoch": 191} {"train_loss": -4.993682861328125, "global_step": 8034, "epoch": 191} {"train_loss": -4.987454891204834, "global_step": 8035, "epoch": 191} {"train_loss": -4.951977729797363, "global_step": 8036, "epoch": 191} {"train_loss": -4.941944122314453, "global_step": 8037, "epoch": 191} {"train_loss": -4.94356632232666, "global_step": 8038, "epoch": 191} {"train_loss": -4.973797798156738, "global_step": 8039, "epoch": 191} {"train_loss": -4.965670585632324, "global_step": 8040, "epoch": 191} {"train_loss": -4.894408226013184, "global_step": 8041, "epoch": 191} {"train_loss": -4.931114196777344, "global_step": 8042, "epoch": 191} {"train_loss": -4.817190170288086, "global_step": 8043, "epoch": 191} {"train_loss": -4.935529708862305, "global_step": 8044, "epoch": 191} {"train_loss": -4.974143028259277, "global_step": 8045, "epoch": 191} {"train_loss": -4.8898773193359375, "global_step": 8046, "epoch": 191} {"train_loss": -4.858241081237793, "global_step": 8047, "epoch": 191} {"train_loss": -4.943042278289795, "global_step": 8048, "epoch": 191} {"train_loss": -4.88119649887085, "global_step": 8049, "epoch": 191} {"train_loss": -4.70267391204834, "global_step": 8050, "epoch": 191} {"train_loss": -4.948787689208984, "global_step": 8051, "epoch": 191} {"train_loss": -4.91632080078125, "global_step": 8052, "epoch": 191} {"train_loss": -4.962625503540039, "global_step": 8053, "epoch": 191} {"train_loss": -5.031275272369385, "global_step": 8054, "epoch": 191} {"train_loss": -4.954792022705078, "global_step": 8055, "epoch": 191} {"train_loss": -4.789745330810547, "global_step": 8056, "epoch": 191} {"train_loss": -4.920119762420654, "global_step": 8057, "epoch": 191} {"train_loss": -4.894284248352051, "global_step": 8058, "epoch": 191} {"train_loss": -5.053616523742676, "global_step": 8059, "epoch": 191} {"train_loss": -4.8523125648498535, "global_step": 8060, "epoch": 191} {"train_loss": -4.884614944458008, "global_step": 8061, "epoch": 191} {"train_loss": -4.955095291137695, "global_step": 8062, "epoch": 191} {"train_loss": -4.929801634379795, "global_step": 8063, "epoch": 191, "val_loss": 72871.7109375} {"train_loss": -5.04095458984375, "global_step": 8064, "epoch": 192} {"train_loss": -5.008029937744141, "global_step": 8065, "epoch": 192} {"train_loss": -4.908673286437988, "global_step": 8066, "epoch": 192} {"train_loss": -4.891273498535156, "global_step": 8067, "epoch": 192} {"train_loss": -5.005716323852539, "global_step": 8068, "epoch": 192} {"train_loss": -4.970842361450195, "global_step": 8069, "epoch": 192} {"train_loss": -5.057512283325195, "global_step": 8070, "epoch": 192} {"train_loss": -4.958839416503906, "global_step": 8071, "epoch": 192} {"train_loss": -4.943169593811035, "global_step": 8072, "epoch": 192} {"train_loss": -4.947406768798828, "global_step": 8073, "epoch": 192} {"train_loss": -5.072232723236084, "global_step": 8074, "epoch": 192} {"train_loss": -4.930614948272705, "global_step": 8075, "epoch": 192} {"train_loss": -4.996615409851074, "global_step": 8076, "epoch": 192} {"train_loss": -4.94630241394043, "global_step": 8077, "epoch": 192} {"train_loss": -4.988361358642578, "global_step": 8078, "epoch": 192} {"train_loss": -4.9932861328125, "global_step": 8079, "epoch": 192} {"train_loss": -5.088161468505859, "global_step": 8080, "epoch": 192} {"train_loss": -5.071259021759033, "global_step": 8081, "epoch": 192} {"train_loss": -4.897421836853027, "global_step": 8082, "epoch": 192} {"train_loss": -5.015437602996826, "global_step": 8083, "epoch": 192} {"train_loss": -4.960097312927246, "global_step": 8084, "epoch": 192} {"train_loss": -4.761463165283203, "global_step": 8085, "epoch": 192} {"train_loss": -4.937460899353027, "global_step": 8086, "epoch": 192} {"train_loss": -4.793627738952637, "global_step": 8087, "epoch": 192} {"train_loss": -4.89422607421875, "global_step": 8088, "epoch": 192} {"train_loss": -4.861462116241455, "global_step": 8089, "epoch": 192} {"train_loss": -4.909531116485596, "global_step": 8090, "epoch": 192} {"train_loss": -5.038732528686523, "global_step": 8091, "epoch": 192} {"train_loss": -4.928863525390625, "global_step": 8092, "epoch": 192} {"train_loss": -4.758937835693359, "global_step": 8093, "epoch": 192} {"train_loss": -5.029094696044922, "global_step": 8094, "epoch": 192} {"train_loss": -4.9777350425720215, "global_step": 8095, "epoch": 192} {"train_loss": -4.823114395141602, "global_step": 8096, "epoch": 192} {"train_loss": -4.936391830444336, "global_step": 8097, "epoch": 192} {"train_loss": -4.827497482299805, "global_step": 8098, "epoch": 192} {"train_loss": -4.932744979858398, "global_step": 8099, "epoch": 192} {"train_loss": -4.86174201965332, "global_step": 8100, "epoch": 192} {"train_loss": -4.946233749389648, "global_step": 8101, "epoch": 192} {"train_loss": -4.82633113861084, "global_step": 8102, "epoch": 192} {"train_loss": -4.962751388549805, "global_step": 8103, "epoch": 192} {"train_loss": -4.922413349151611, "global_step": 8104, "epoch": 192} {"train_loss": -4.9452654747735885, "global_step": 8105, "epoch": 192, "val_loss": 73077.328125} {"train_loss": -4.99583625793457, "global_step": 8106, "epoch": 193} {"train_loss": -4.94360876083374, "global_step": 8107, "epoch": 193} {"train_loss": -4.9972968101501465, "global_step": 8108, "epoch": 193} {"train_loss": -4.992861747741699, "global_step": 8109, "epoch": 193} {"train_loss": -5.01492977142334, "global_step": 8110, "epoch": 193} {"train_loss": -4.995261192321777, "global_step": 8111, "epoch": 193} {"train_loss": -4.8568315505981445, "global_step": 8112, "epoch": 193} {"train_loss": -5.032994747161865, "global_step": 8113, "epoch": 193} {"train_loss": -5.030262470245361, "global_step": 8114, "epoch": 193} {"train_loss": -4.898211479187012, "global_step": 8115, "epoch": 193} {"train_loss": -4.911131858825684, "global_step": 8116, "epoch": 193} {"train_loss": -5.039427280426025, "global_step": 8117, "epoch": 193} {"train_loss": -4.96773099899292, "global_step": 8118, "epoch": 193} {"train_loss": -4.98472785949707, "global_step": 8119, "epoch": 193} {"train_loss": -5.041625499725342, "global_step": 8120, "epoch": 193} {"train_loss": -4.789482593536377, "global_step": 8121, "epoch": 193} {"train_loss": -4.8786940574646, "global_step": 8122, "epoch": 193} {"train_loss": -4.985190391540527, "global_step": 8123, "epoch": 193} {"train_loss": -5.015008926391602, "global_step": 8124, "epoch": 193} {"train_loss": -4.855886936187744, "global_step": 8125, "epoch": 193} {"train_loss": -5.115035057067871, "global_step": 8126, "epoch": 193} {"train_loss": -4.822596549987793, "global_step": 8127, "epoch": 193} {"train_loss": -4.895880699157715, "global_step": 8128, "epoch": 193} {"train_loss": -4.835721015930176, "global_step": 8129, "epoch": 193} {"train_loss": -4.976008892059326, "global_step": 8130, "epoch": 193} {"train_loss": -4.926609039306641, "global_step": 8131, "epoch": 193} {"train_loss": -5.05357551574707, "global_step": 8132, "epoch": 193} {"train_loss": -4.963743209838867, "global_step": 8133, "epoch": 193} {"train_loss": -5.081413269042969, "global_step": 8134, "epoch": 193} {"train_loss": -4.8992919921875, "global_step": 8135, "epoch": 193} {"train_loss": -5.069263458251953, "global_step": 8136, "epoch": 193} {"train_loss": -5.018860340118408, "global_step": 8137, "epoch": 193} {"train_loss": -4.655577659606934, "global_step": 8138, "epoch": 193} {"train_loss": -4.994938373565674, "global_step": 8139, "epoch": 193} {"train_loss": -4.899320125579834, "global_step": 8140, "epoch": 193} {"train_loss": -4.915335655212402, "global_step": 8141, "epoch": 193} {"train_loss": -4.787841320037842, "global_step": 8142, "epoch": 193} {"train_loss": -5.133362293243408, "global_step": 8143, "epoch": 193} {"train_loss": -4.996971607208252, "global_step": 8144, "epoch": 193} {"train_loss": -4.977116584777832, "global_step": 8145, "epoch": 193} {"train_loss": -4.953075885772705, "global_step": 8146, "epoch": 193} {"train_loss": -4.9605343114762075, "global_step": 8147, "epoch": 193, "val_loss": 72550.078125} {"train_loss": -5.2061614990234375, "global_step": 8148, "epoch": 194} {"train_loss": -5.001481533050537, "global_step": 8149, "epoch": 194} {"train_loss": -5.038548469543457, "global_step": 8150, "epoch": 194} {"train_loss": -4.951293468475342, "global_step": 8151, "epoch": 194} {"train_loss": -4.96017599105835, "global_step": 8152, "epoch": 194} {"train_loss": -5.000646114349365, "global_step": 8153, "epoch": 194} {"train_loss": -5.040246963500977, "global_step": 8154, "epoch": 194} {"train_loss": -4.870296478271484, "global_step": 8155, "epoch": 194} {"train_loss": -4.981164932250977, "global_step": 8156, "epoch": 194} {"train_loss": -5.038107872009277, "global_step": 8157, "epoch": 194} {"train_loss": -5.00940465927124, "global_step": 8158, "epoch": 194} {"train_loss": -4.649357318878174, "global_step": 8159, "epoch": 194} {"train_loss": -4.957757949829102, "global_step": 8160, "epoch": 194} {"train_loss": -4.838433265686035, "global_step": 8161, "epoch": 194} {"train_loss": -4.937938690185547, "global_step": 8162, "epoch": 194} {"train_loss": -4.736206531524658, "global_step": 8163, "epoch": 194} {"train_loss": -5.04338264465332, "global_step": 8164, "epoch": 194} {"train_loss": -4.944980621337891, "global_step": 8165, "epoch": 194} {"train_loss": -4.919216156005859, "global_step": 8166, "epoch": 194} {"train_loss": -4.924274921417236, "global_step": 8167, "epoch": 194} {"train_loss": -4.9609832763671875, "global_step": 8168, "epoch": 194} {"train_loss": -5.087872505187988, "global_step": 8169, "epoch": 194} {"train_loss": -5.015041828155518, "global_step": 8170, "epoch": 194} {"train_loss": -5.010717391967773, "global_step": 8171, "epoch": 194} {"train_loss": -4.933104991912842, "global_step": 8172, "epoch": 194} {"train_loss": -5.013003349304199, "global_step": 8173, "epoch": 194} {"train_loss": -5.036012649536133, "global_step": 8174, "epoch": 194} {"train_loss": -4.928579807281494, "global_step": 8175, "epoch": 194} {"train_loss": -5.038597583770752, "global_step": 8176, "epoch": 194} {"train_loss": -5.152177333831787, "global_step": 8177, "epoch": 194} {"train_loss": -4.980432987213135, "global_step": 8178, "epoch": 194} {"train_loss": -4.917412757873535, "global_step": 8179, "epoch": 194} {"train_loss": -5.036801338195801, "global_step": 8180, "epoch": 194} {"train_loss": -4.985859394073486, "global_step": 8181, "epoch": 194} {"train_loss": -4.870609283447266, "global_step": 8182, "epoch": 194} {"train_loss": -4.911975860595703, "global_step": 8183, "epoch": 194} {"train_loss": -5.062310218811035, "global_step": 8184, "epoch": 194} {"train_loss": -4.928698539733887, "global_step": 8185, "epoch": 194} {"train_loss": -5.070723533630371, "global_step": 8186, "epoch": 194} {"train_loss": -4.820253849029541, "global_step": 8187, "epoch": 194} {"train_loss": -4.768482685089111, "global_step": 8188, "epoch": 194} {"train_loss": -4.9645194326128275, "global_step": 8189, "epoch": 194, "val_loss": 73281.2734375} {"train_loss": -5.073935508728027, "global_step": 8190, "epoch": 195} {"train_loss": -4.824769973754883, "global_step": 8191, "epoch": 195} {"train_loss": -4.875214099884033, "global_step": 8192, "epoch": 195} {"train_loss": -5.048742771148682, "global_step": 8193, "epoch": 195} {"train_loss": -4.995239734649658, "global_step": 8194, "epoch": 195} {"train_loss": -4.912601470947266, "global_step": 8195, "epoch": 195} {"train_loss": -4.991241455078125, "global_step": 8196, "epoch": 195} {"train_loss": -5.022889137268066, "global_step": 8197, "epoch": 195} {"train_loss": -4.956251621246338, "global_step": 8198, "epoch": 195} {"train_loss": -5.058621883392334, "global_step": 8199, "epoch": 195} {"train_loss": -4.9678449630737305, "global_step": 8200, "epoch": 195} {"train_loss": -5.1566877365112305, "global_step": 8201, "epoch": 195} {"train_loss": -4.940737724304199, "global_step": 8202, "epoch": 195} {"train_loss": -4.980576515197754, "global_step": 8203, "epoch": 195} {"train_loss": -5.0399346351623535, "global_step": 8204, "epoch": 195} {"train_loss": -4.95415735244751, "global_step": 8205, "epoch": 195} {"train_loss": -5.068925380706787, "global_step": 8206, "epoch": 195} {"train_loss": -4.810553550720215, "global_step": 8207, "epoch": 195} {"train_loss": -5.0533905029296875, "global_step": 8208, "epoch": 195} {"train_loss": -5.0411152839660645, "global_step": 8209, "epoch": 195} {"train_loss": -5.063264846801758, "global_step": 8210, "epoch": 195} {"train_loss": -4.82394552230835, "global_step": 8211, "epoch": 195} {"train_loss": -4.8249006271362305, "global_step": 8212, "epoch": 195} {"train_loss": -5.016491889953613, "global_step": 8213, "epoch": 195} {"train_loss": -4.936129093170166, "global_step": 8214, "epoch": 195} {"train_loss": -5.009211540222168, "global_step": 8215, "epoch": 195} {"train_loss": -5.004497528076172, "global_step": 8216, "epoch": 195} {"train_loss": -4.876823425292969, "global_step": 8217, "epoch": 195} {"train_loss": -4.980194091796875, "global_step": 8218, "epoch": 195} {"train_loss": -4.944398403167725, "global_step": 8219, "epoch": 195} {"train_loss": -4.899272918701172, "global_step": 8220, "epoch": 195} {"train_loss": -4.9784088134765625, "global_step": 8221, "epoch": 195} {"train_loss": -5.016631126403809, "global_step": 8222, "epoch": 195} {"train_loss": -5.073193550109863, "global_step": 8223, "epoch": 195} {"train_loss": -5.1017680168151855, "global_step": 8224, "epoch": 195} {"train_loss": -5.038419246673584, "global_step": 8225, "epoch": 195} {"train_loss": -4.78635311126709, "global_step": 8226, "epoch": 195} {"train_loss": -4.855267524719238, "global_step": 8227, "epoch": 195} {"train_loss": -5.074963092803955, "global_step": 8228, "epoch": 195} {"train_loss": -4.913475036621094, "global_step": 8229, "epoch": 195} {"train_loss": -5.106657981872559, "global_step": 8230, "epoch": 195} {"train_loss": -4.975747142519269, "global_step": 8231, "epoch": 195, "val_loss": 72762.6015625} {"train_loss": -4.803317070007324, "global_step": 8232, "epoch": 196} {"train_loss": -5.113080978393555, "global_step": 8233, "epoch": 196} {"train_loss": -4.928686141967773, "global_step": 8234, "epoch": 196} {"train_loss": -4.92075252532959, "global_step": 8235, "epoch": 196} {"train_loss": -4.91689395904541, "global_step": 8236, "epoch": 196} {"train_loss": -5.105512619018555, "global_step": 8237, "epoch": 196} {"train_loss": -4.783775329589844, "global_step": 8238, "epoch": 196} {"train_loss": -4.811090469360352, "global_step": 8239, "epoch": 196} {"train_loss": -5.063675880432129, "global_step": 8240, "epoch": 196} {"train_loss": -4.894016742706299, "global_step": 8241, "epoch": 196} {"train_loss": -4.910853385925293, "global_step": 8242, "epoch": 196} {"train_loss": -5.005050182342529, "global_step": 8243, "epoch": 196} {"train_loss": -4.934159278869629, "global_step": 8244, "epoch": 196} {"train_loss": -4.746459484100342, "global_step": 8245, "epoch": 196} {"train_loss": -4.8958635330200195, "global_step": 8246, "epoch": 196} {"train_loss": -4.992460250854492, "global_step": 8247, "epoch": 196} {"train_loss": -4.878003120422363, "global_step": 8248, "epoch": 196} {"train_loss": -4.833217620849609, "global_step": 8249, "epoch": 196} {"train_loss": -4.810729026794434, "global_step": 8250, "epoch": 196} {"train_loss": -4.912985801696777, "global_step": 8251, "epoch": 196} {"train_loss": -4.987833023071289, "global_step": 8252, "epoch": 196} {"train_loss": -4.952658653259277, "global_step": 8253, "epoch": 196} {"train_loss": -4.919066429138184, "global_step": 8254, "epoch": 196} {"train_loss": -4.943033218383789, "global_step": 8255, "epoch": 196} {"train_loss": -4.966391563415527, "global_step": 8256, "epoch": 196} {"train_loss": -5.071356773376465, "global_step": 8257, "epoch": 196} {"train_loss": -4.9667887687683105, "global_step": 8258, "epoch": 196} {"train_loss": -5.0366597175598145, "global_step": 8259, "epoch": 196} {"train_loss": -4.933999061584473, "global_step": 8260, "epoch": 196} {"train_loss": -4.960184574127197, "global_step": 8261, "epoch": 196} {"train_loss": -4.985136032104492, "global_step": 8262, "epoch": 196} {"train_loss": -4.933475971221924, "global_step": 8263, "epoch": 196} {"train_loss": -4.956298828125, "global_step": 8264, "epoch": 196} {"train_loss": -4.982308387756348, "global_step": 8265, "epoch": 196} {"train_loss": -4.954165458679199, "global_step": 8266, "epoch": 196} {"train_loss": -4.992776870727539, "global_step": 8267, "epoch": 196} {"train_loss": -4.932008743286133, "global_step": 8268, "epoch": 196} {"train_loss": -4.997191429138184, "global_step": 8269, "epoch": 196} {"train_loss": -4.9649200439453125, "global_step": 8270, "epoch": 196} {"train_loss": -5.006208419799805, "global_step": 8271, "epoch": 196} {"train_loss": -4.966517925262451, "global_step": 8272, "epoch": 196} {"train_loss": -4.946935449327741, "global_step": 8273, "epoch": 196, "val_loss": 72592.5234375} {"train_loss": -4.990299701690674, "global_step": 8274, "epoch": 197} {"train_loss": -4.872488021850586, "global_step": 8275, "epoch": 197} {"train_loss": -4.779179573059082, "global_step": 8276, "epoch": 197} {"train_loss": -4.933956623077393, "global_step": 8277, "epoch": 197} {"train_loss": -5.02313756942749, "global_step": 8278, "epoch": 197} {"train_loss": -5.016262054443359, "global_step": 8279, "epoch": 197} {"train_loss": -4.99072790145874, "global_step": 8280, "epoch": 197} {"train_loss": -4.839326858520508, "global_step": 8281, "epoch": 197} {"train_loss": -5.0286760330200195, "global_step": 8282, "epoch": 197} {"train_loss": -4.899136543273926, "global_step": 8283, "epoch": 197} {"train_loss": -4.876249313354492, "global_step": 8284, "epoch": 197} {"train_loss": -4.890707015991211, "global_step": 8285, "epoch": 197} {"train_loss": -4.992485046386719, "global_step": 8286, "epoch": 197} {"train_loss": -4.985659122467041, "global_step": 8287, "epoch": 197} {"train_loss": -4.833989143371582, "global_step": 8288, "epoch": 197} {"train_loss": -4.903756141662598, "global_step": 8289, "epoch": 197} {"train_loss": -4.8680925369262695, "global_step": 8290, "epoch": 197} {"train_loss": -5.149410247802734, "global_step": 8291, "epoch": 197} {"train_loss": -4.900517463684082, "global_step": 8292, "epoch": 197} {"train_loss": -5.017764091491699, "global_step": 8293, "epoch": 197} {"train_loss": -5.114340782165527, "global_step": 8294, "epoch": 197} {"train_loss": -5.035758972167969, "global_step": 8295, "epoch": 197} {"train_loss": -4.732779502868652, "global_step": 8296, "epoch": 197} {"train_loss": -4.8764328956604, "global_step": 8297, "epoch": 197} {"train_loss": -5.040614604949951, "global_step": 8298, "epoch": 197} {"train_loss": -5.034605979919434, "global_step": 8299, "epoch": 197} {"train_loss": -4.992643356323242, "global_step": 8300, "epoch": 197} {"train_loss": -5.0237956047058105, "global_step": 8301, "epoch": 197} {"train_loss": -5.011579513549805, "global_step": 8302, "epoch": 197} {"train_loss": -5.038333892822266, "global_step": 8303, "epoch": 197} {"train_loss": -4.941976070404053, "global_step": 8304, "epoch": 197} {"train_loss": -5.008231163024902, "global_step": 8305, "epoch": 197} {"train_loss": -4.92763614654541, "global_step": 8306, "epoch": 197} {"train_loss": -4.982881546020508, "global_step": 8307, "epoch": 197} {"train_loss": -4.9543256759643555, "global_step": 8308, "epoch": 197} {"train_loss": -5.099043846130371, "global_step": 8309, "epoch": 197} {"train_loss": -4.964087963104248, "global_step": 8310, "epoch": 197} {"train_loss": -4.937737941741943, "global_step": 8311, "epoch": 197} {"train_loss": -5.0735602378845215, "global_step": 8312, "epoch": 197} {"train_loss": -4.990569114685059, "global_step": 8313, "epoch": 197} {"train_loss": -4.863990783691406, "global_step": 8314, "epoch": 197} {"train_loss": -4.964627890359788, "global_step": 8315, "epoch": 197, "val_loss": 72591.96875} {"train_loss": -5.126618385314941, "global_step": 8316, "epoch": 198} {"train_loss": -4.95455265045166, "global_step": 8317, "epoch": 198} {"train_loss": -5.016628265380859, "global_step": 8318, "epoch": 198} {"train_loss": -4.908760070800781, "global_step": 8319, "epoch": 198} {"train_loss": -5.031912803649902, "global_step": 8320, "epoch": 198} {"train_loss": -4.9643354415893555, "global_step": 8321, "epoch": 198} {"train_loss": -4.933401584625244, "global_step": 8322, "epoch": 198} {"train_loss": -5.0829033851623535, "global_step": 8323, "epoch": 198} {"train_loss": -5.057337760925293, "global_step": 8324, "epoch": 198} {"train_loss": -5.121278762817383, "global_step": 8325, "epoch": 198} {"train_loss": -4.894655227661133, "global_step": 8326, "epoch": 198} {"train_loss": -4.991952896118164, "global_step": 8327, "epoch": 198} {"train_loss": -5.070647239685059, "global_step": 8328, "epoch": 198} {"train_loss": -5.145082950592041, "global_step": 8329, "epoch": 198} {"train_loss": -5.073492050170898, "global_step": 8330, "epoch": 198} {"train_loss": -4.886876106262207, "global_step": 8331, "epoch": 198} {"train_loss": -4.914546966552734, "global_step": 8332, "epoch": 198} {"train_loss": -4.88956356048584, "global_step": 8333, "epoch": 198} {"train_loss": -5.076220512390137, "global_step": 8334, "epoch": 198} {"train_loss": -5.016081809997559, "global_step": 8335, "epoch": 198} {"train_loss": -5.0806474685668945, "global_step": 8336, "epoch": 198} {"train_loss": -5.11436128616333, "global_step": 8337, "epoch": 198} {"train_loss": -4.984180927276611, "global_step": 8338, "epoch": 198} {"train_loss": -4.986841678619385, "global_step": 8339, "epoch": 198} {"train_loss": -4.951983451843262, "global_step": 8340, "epoch": 198} {"train_loss": -4.961184501647949, "global_step": 8341, "epoch": 198} {"train_loss": -4.950626373291016, "global_step": 8342, "epoch": 198} {"train_loss": -4.919894218444824, "global_step": 8343, "epoch": 198} {"train_loss": -5.035585403442383, "global_step": 8344, "epoch": 198} {"train_loss": -4.9637274742126465, "global_step": 8345, "epoch": 198} {"train_loss": -4.9816765785217285, "global_step": 8346, "epoch": 198} {"train_loss": -5.054962158203125, "global_step": 8347, "epoch": 198} {"train_loss": -4.927468776702881, "global_step": 8348, "epoch": 198} {"train_loss": -4.958181381225586, "global_step": 8349, "epoch": 198} {"train_loss": -4.905569076538086, "global_step": 8350, "epoch": 198} {"train_loss": -5.111183166503906, "global_step": 8351, "epoch": 198} {"train_loss": -4.98366117477417, "global_step": 8352, "epoch": 198} {"train_loss": -4.794885635375977, "global_step": 8353, "epoch": 198} {"train_loss": -4.8573479652404785, "global_step": 8354, "epoch": 198} {"train_loss": -5.040801048278809, "global_step": 8355, "epoch": 198} {"train_loss": -5.014240264892578, "global_step": 8356, "epoch": 198} {"train_loss": -4.986825818107242, "global_step": 8357, "epoch": 198, "val_loss": 72435.390625} {"train_loss": -5.006387710571289, "global_step": 8358, "epoch": 199} {"train_loss": -4.800266742706299, "global_step": 8359, "epoch": 199} {"train_loss": -4.645273685455322, "global_step": 8360, "epoch": 199} {"train_loss": -4.8981523513793945, "global_step": 8361, "epoch": 199} {"train_loss": -4.877803802490234, "global_step": 8362, "epoch": 199} {"train_loss": -4.736013412475586, "global_step": 8363, "epoch": 199} {"train_loss": -5.0673112869262695, "global_step": 8364, "epoch": 199} {"train_loss": -4.974077224731445, "global_step": 8365, "epoch": 199} {"train_loss": -4.973163604736328, "global_step": 8366, "epoch": 199} {"train_loss": -4.913728713989258, "global_step": 8367, "epoch": 199} {"train_loss": -4.925390720367432, "global_step": 8368, "epoch": 199} {"train_loss": -5.020109176635742, "global_step": 8369, "epoch": 199} {"train_loss": -4.93299674987793, "global_step": 8370, "epoch": 199} {"train_loss": -5.040496826171875, "global_step": 8371, "epoch": 199} {"train_loss": -4.843661308288574, "global_step": 8372, "epoch": 199} {"train_loss": -5.057007312774658, "global_step": 8373, "epoch": 199} {"train_loss": -4.9841508865356445, "global_step": 8374, "epoch": 199} {"train_loss": -4.8639326095581055, "global_step": 8375, "epoch": 199} {"train_loss": -4.908636093139648, "global_step": 8376, "epoch": 199} {"train_loss": -5.102989196777344, "global_step": 8377, "epoch": 199} {"train_loss": -5.140313625335693, "global_step": 8378, "epoch": 199} {"train_loss": -5.017938613891602, "global_step": 8379, "epoch": 199} {"train_loss": -4.910453796386719, "global_step": 8380, "epoch": 199} {"train_loss": -4.885439395904541, "global_step": 8381, "epoch": 199} {"train_loss": -5.056056976318359, "global_step": 8382, "epoch": 199} {"train_loss": -5.040365219116211, "global_step": 8383, "epoch": 199} {"train_loss": -5.047664642333984, "global_step": 8384, "epoch": 199} {"train_loss": -4.991096496582031, "global_step": 8385, "epoch": 199} {"train_loss": -5.03223991394043, "global_step": 8386, "epoch": 199} {"train_loss": -4.855461120605469, "global_step": 8387, "epoch": 199} {"train_loss": -4.775144577026367, "global_step": 8388, "epoch": 199} {"train_loss": -4.881514549255371, "global_step": 8389, "epoch": 199} {"train_loss": -5.03189754486084, "global_step": 8390, "epoch": 199} {"train_loss": -4.989731788635254, "global_step": 8391, "epoch": 199} {"train_loss": -5.092252254486084, "global_step": 8392, "epoch": 199} {"train_loss": -5.055495262145996, "global_step": 8393, "epoch": 199} {"train_loss": -4.914140701293945, "global_step": 8394, "epoch": 199} {"train_loss": -4.976604461669922, "global_step": 8395, "epoch": 199} {"train_loss": -5.024614334106445, "global_step": 8396, "epoch": 199} {"train_loss": -4.951641082763672, "global_step": 8397, "epoch": 199} {"train_loss": -5.218698501586914, "global_step": 8398, "epoch": 199} {"train_loss": -4.963772035780407, "global_step": 8399, "epoch": 199, "val_loss": 72259.53125} {"train_loss": -4.8933563232421875, "global_step": 8400, "epoch": 200} {"train_loss": -5.019372940063477, "global_step": 8401, "epoch": 200} {"train_loss": -5.032995223999023, "global_step": 8402, "epoch": 200} {"train_loss": -5.005776405334473, "global_step": 8403, "epoch": 200} {"train_loss": -4.897678375244141, "global_step": 8404, "epoch": 200} {"train_loss": -4.939923286437988, "global_step": 8405, "epoch": 200} {"train_loss": -5.021270751953125, "global_step": 8406, "epoch": 200} {"train_loss": -5.044591903686523, "global_step": 8407, "epoch": 200} {"train_loss": -5.0324530601501465, "global_step": 8408, "epoch": 200} {"train_loss": -5.055048942565918, "global_step": 8409, "epoch": 200} {"train_loss": -4.780203819274902, "global_step": 8410, "epoch": 200} {"train_loss": -5.037538528442383, "global_step": 8411, "epoch": 200} {"train_loss": -5.05797815322876, "global_step": 8412, "epoch": 200} {"train_loss": -4.887238025665283, "global_step": 8413, "epoch": 200} {"train_loss": -4.875231742858887, "global_step": 8414, "epoch": 200} {"train_loss": -4.993551254272461, "global_step": 8415, "epoch": 200} {"train_loss": -5.058870315551758, "global_step": 8416, "epoch": 200} {"train_loss": -4.883117198944092, "global_step": 8417, "epoch": 200} {"train_loss": -4.986269950866699, "global_step": 8418, "epoch": 200} {"train_loss": -5.031885623931885, "global_step": 8419, "epoch": 200} {"train_loss": -5.016463756561279, "global_step": 8420, "epoch": 200} {"train_loss": -4.765043258666992, "global_step": 8421, "epoch": 200} {"train_loss": -4.819669246673584, "global_step": 8422, "epoch": 200} {"train_loss": -4.97682523727417, "global_step": 8423, "epoch": 200} {"train_loss": -4.900221347808838, "global_step": 8424, "epoch": 200} {"train_loss": -5.076715469360352, "global_step": 8425, "epoch": 200} {"train_loss": -4.9826555252075195, "global_step": 8426, "epoch": 200} {"train_loss": -4.904748439788818, "global_step": 8427, "epoch": 200} {"train_loss": -5.175022125244141, "global_step": 8428, "epoch": 200} {"train_loss": -5.067959308624268, "global_step": 8429, "epoch": 200} {"train_loss": -5.022852420806885, "global_step": 8430, "epoch": 200} {"train_loss": -5.00364351272583, "global_step": 8431, "epoch": 200} {"train_loss": -5.051569938659668, "global_step": 8432, "epoch": 200} {"train_loss": -5.119734764099121, "global_step": 8433, "epoch": 200} {"train_loss": -5.074562072753906, "global_step": 8434, "epoch": 200} {"train_loss": -4.903628349304199, "global_step": 8435, "epoch": 200} {"train_loss": -4.958674430847168, "global_step": 8436, "epoch": 200} {"train_loss": -4.949278354644775, "global_step": 8437, "epoch": 200} {"train_loss": -5.039334297180176, "global_step": 8438, "epoch": 200} {"train_loss": -4.918920993804932, "global_step": 8439, "epoch": 200} {"train_loss": -4.99103307723999, "global_step": 8440, "epoch": 200} {"train_loss": -4.981675534021287, "global_step": 8441, "epoch": 200, "train/sim_max_reward_0": 0.2092088009213681, "train/sim_max_reward_1": 0.00820528720489563, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.0053467998742405525, "train/sim_max_reward_4": 0.16044221599521505, "train/sim_max_reward_5": 0.352824913641803, "test/sim_max_reward_4300000": 0.0015403922763074424, "test/sim_max_reward_4300001": 0.07170434046856054, "test/sim_max_reward_4300002": 0.17574869679010507, "test/sim_max_reward_4300003": 0.35333889108557365, "test/sim_max_reward_4300004": 0.39090244766843846, "test/sim_max_reward_4300005": 0.2573583502111308, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.053710631720728666, "test/sim_max_reward_4300008": 0.15785203442146425, "test/sim_max_reward_4300009": 0.16237717912915545, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.14154918772673358, "test/sim_max_reward_4300012": 0.5318024912485066, "test/sim_max_reward_4300013": 0.40847526318074784, "test/sim_max_reward_4300014": 0.38012690626617684, "test/sim_max_reward_4300015": 0.2581820459986872, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.11169753259719492, "test/sim_max_reward_4300018": 0.10277607634838962, "test/sim_max_reward_4300019": 0.18442011417370335, "test/sim_max_reward_4300020": 0.13426383633139533, "test/sim_max_reward_4300021": 0.057077959485435176, "test/sim_max_reward_4300022": 0.5279280963707574, "test/sim_max_reward_4300023": 0.2528532734025846, "test/sim_max_reward_4300024": 0.3023048669749727, "test/sim_max_reward_4300025": 0.08847875242732427, "test/sim_max_reward_4300026": 0.30414813292820125, "test/sim_max_reward_4300027": 0.0, "test/sim_max_reward_4300028": 0.002225903667142085, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.5440356117061396, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.2603000335592396, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.5529165429060827, "test/sim_max_reward_4300037": 0.6668982857003312, "test/sim_max_reward_4300038": 0.15680151247105614, "test/sim_max_reward_4300039": 0.04056694370744269, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.2736347319128165, "test/sim_max_reward_4300043": 0.4564000917383221, "test/sim_max_reward_4300044": 0.09086622339549981, "test/sim_max_reward_4300045": 0.0, "test/sim_max_reward_4300046": 0.24183250315971014, "test/sim_max_reward_4300047": 0.18538320613299594, "test/sim_max_reward_4300048": 0.3101976338618322, "test/sim_max_reward_4300049": 0.007171156804363759, "train/mean_score": 0.12267133627292039, "test/mean_score": 0.1876886038820981, "val_loss": 74363.828125} {"train_loss": -4.762670516967773, "global_step": 8442, "epoch": 201} {"train_loss": -5.0724639892578125, "global_step": 8443, "epoch": 201} {"train_loss": -5.128618240356445, "global_step": 8444, "epoch": 201} {"train_loss": -5.150773525238037, "global_step": 8445, "epoch": 201} {"train_loss": -5.042275428771973, "global_step": 8446, "epoch": 201} {"train_loss": -5.056711196899414, "global_step": 8447, "epoch": 201} {"train_loss": -4.98085880279541, "global_step": 8448, "epoch": 201} {"train_loss": -5.138912200927734, "global_step": 8449, "epoch": 201} {"train_loss": -5.0555830001831055, "global_step": 8450, "epoch": 201} {"train_loss": -5.016326904296875, "global_step": 8451, "epoch": 201} {"train_loss": -4.973902702331543, "global_step": 8452, "epoch": 201} {"train_loss": -5.0748748779296875, "global_step": 8453, "epoch": 201} {"train_loss": -5.179776668548584, "global_step": 8454, "epoch": 201} {"train_loss": -5.055084705352783, "global_step": 8455, "epoch": 201} {"train_loss": -4.935568332672119, "global_step": 8456, "epoch": 201} {"train_loss": -4.998351573944092, "global_step": 8457, "epoch": 201} {"train_loss": -4.965295791625977, "global_step": 8458, "epoch": 201} {"train_loss": -4.936061859130859, "global_step": 8459, "epoch": 201} {"train_loss": -5.123330593109131, "global_step": 8460, "epoch": 201} {"train_loss": -5.093637466430664, "global_step": 8461, "epoch": 201} {"train_loss": -5.000896453857422, "global_step": 8462, "epoch": 201} {"train_loss": -5.015363693237305, "global_step": 8463, "epoch": 201} {"train_loss": -5.122527122497559, "global_step": 8464, "epoch": 201} {"train_loss": -5.016761779785156, "global_step": 8465, "epoch": 201} {"train_loss": -5.042232036590576, "global_step": 8466, "epoch": 201} {"train_loss": -4.8825883865356445, "global_step": 8467, "epoch": 201} {"train_loss": -5.0692973136901855, "global_step": 8468, "epoch": 201} {"train_loss": -4.913834571838379, "global_step": 8469, "epoch": 201} {"train_loss": -4.910275459289551, "global_step": 8470, "epoch": 201} {"train_loss": -4.955617427825928, "global_step": 8471, "epoch": 201} {"train_loss": -5.029582500457764, "global_step": 8472, "epoch": 201} {"train_loss": -5.042181015014648, "global_step": 8473, "epoch": 201} {"train_loss": -5.002532482147217, "global_step": 8474, "epoch": 201} {"train_loss": -4.879367828369141, "global_step": 8475, "epoch": 201} {"train_loss": -4.852470397949219, "global_step": 8476, "epoch": 201} {"train_loss": -5.054380416870117, "global_step": 8477, "epoch": 201} {"train_loss": -4.896035194396973, "global_step": 8478, "epoch": 201} {"train_loss": -4.81318998336792, "global_step": 8479, "epoch": 201} {"train_loss": -4.953048229217529, "global_step": 8480, "epoch": 201} {"train_loss": -5.069345474243164, "global_step": 8481, "epoch": 201} {"train_loss": -5.005582809448242, "global_step": 8482, "epoch": 201} {"train_loss": -5.001760755266462, "global_step": 8483, "epoch": 201, "val_loss": 72882.2890625} {"train_loss": -4.799830436706543, "global_step": 8484, "epoch": 202} {"train_loss": -4.9527177810668945, "global_step": 8485, "epoch": 202} {"train_loss": -4.989701747894287, "global_step": 8486, "epoch": 202} {"train_loss": -4.619959831237793, "global_step": 8487, "epoch": 202} {"train_loss": -4.920008659362793, "global_step": 8488, "epoch": 202} {"train_loss": -5.056329727172852, "global_step": 8489, "epoch": 202} {"train_loss": -4.648370265960693, "global_step": 8490, "epoch": 202} {"train_loss": -4.812712669372559, "global_step": 8491, "epoch": 202} {"train_loss": -5.03135871887207, "global_step": 8492, "epoch": 202} {"train_loss": -4.913698196411133, "global_step": 8493, "epoch": 202} {"train_loss": -4.990710258483887, "global_step": 8494, "epoch": 202} {"train_loss": -4.819771766662598, "global_step": 8495, "epoch": 202} {"train_loss": -4.912073135375977, "global_step": 8496, "epoch": 202} {"train_loss": -5.000528335571289, "global_step": 8497, "epoch": 202} {"train_loss": -5.069907188415527, "global_step": 8498, "epoch": 202} {"train_loss": -4.834450721740723, "global_step": 8499, "epoch": 202} {"train_loss": -4.941722393035889, "global_step": 8500, "epoch": 202} {"train_loss": -4.918121337890625, "global_step": 8501, "epoch": 202} {"train_loss": -4.957581520080566, "global_step": 8502, "epoch": 202} {"train_loss": -5.038494110107422, "global_step": 8503, "epoch": 202} {"train_loss": -4.993210315704346, "global_step": 8504, "epoch": 202} {"train_loss": -5.103394508361816, "global_step": 8505, "epoch": 202} {"train_loss": -4.93366813659668, "global_step": 8506, "epoch": 202} {"train_loss": -5.029493808746338, "global_step": 8507, "epoch": 202} {"train_loss": -4.966080188751221, "global_step": 8508, "epoch": 202} {"train_loss": -5.136255741119385, "global_step": 8509, "epoch": 202} {"train_loss": -5.031712532043457, "global_step": 8510, "epoch": 202} {"train_loss": -5.011093616485596, "global_step": 8511, "epoch": 202} {"train_loss": -4.970928192138672, "global_step": 8512, "epoch": 202} {"train_loss": -4.983941078186035, "global_step": 8513, "epoch": 202} {"train_loss": -4.949307918548584, "global_step": 8514, "epoch": 202} {"train_loss": -5.072983741760254, "global_step": 8515, "epoch": 202} {"train_loss": -5.113861083984375, "global_step": 8516, "epoch": 202} {"train_loss": -4.909200668334961, "global_step": 8517, "epoch": 202} {"train_loss": -4.915458679199219, "global_step": 8518, "epoch": 202} {"train_loss": -5.140867233276367, "global_step": 8519, "epoch": 202} {"train_loss": -4.89853572845459, "global_step": 8520, "epoch": 202} {"train_loss": -4.844574928283691, "global_step": 8521, "epoch": 202} {"train_loss": -4.7512969970703125, "global_step": 8522, "epoch": 202} {"train_loss": -4.6315178871154785, "global_step": 8523, "epoch": 202} {"train_loss": -4.9897565841674805, "global_step": 8524, "epoch": 202} {"train_loss": -4.938056866327922, "global_step": 8525, "epoch": 202, "val_loss": 74334.7421875} {"train_loss": -4.727683067321777, "global_step": 8526, "epoch": 203} {"train_loss": -4.784740924835205, "global_step": 8527, "epoch": 203} {"train_loss": -5.066133975982666, "global_step": 8528, "epoch": 203} {"train_loss": -4.700936794281006, "global_step": 8529, "epoch": 203} {"train_loss": -5.003788948059082, "global_step": 8530, "epoch": 203} {"train_loss": -4.912938117980957, "global_step": 8531, "epoch": 203} {"train_loss": -4.689105987548828, "global_step": 8532, "epoch": 203} {"train_loss": -5.073117256164551, "global_step": 8533, "epoch": 203} {"train_loss": -4.805142402648926, "global_step": 8534, "epoch": 203} {"train_loss": -4.935761451721191, "global_step": 8535, "epoch": 203} {"train_loss": -4.922208309173584, "global_step": 8536, "epoch": 203} {"train_loss": -4.9725751876831055, "global_step": 8537, "epoch": 203} {"train_loss": -4.922289848327637, "global_step": 8538, "epoch": 203} {"train_loss": -4.8954973220825195, "global_step": 8539, "epoch": 203} {"train_loss": -4.855947971343994, "global_step": 8540, "epoch": 203} {"train_loss": -4.785624027252197, "global_step": 8541, "epoch": 203} {"train_loss": -5.047299385070801, "global_step": 8542, "epoch": 203} {"train_loss": -4.788384914398193, "global_step": 8543, "epoch": 203} {"train_loss": -4.899460315704346, "global_step": 8544, "epoch": 203} {"train_loss": -4.908934116363525, "global_step": 8545, "epoch": 203} {"train_loss": -5.049067497253418, "global_step": 8546, "epoch": 203} {"train_loss": -4.92819881439209, "global_step": 8547, "epoch": 203} {"train_loss": -4.977217197418213, "global_step": 8548, "epoch": 203} {"train_loss": -4.911805152893066, "global_step": 8549, "epoch": 203} {"train_loss": -4.932494163513184, "global_step": 8550, "epoch": 203} {"train_loss": -4.947411060333252, "global_step": 8551, "epoch": 203} {"train_loss": -5.054503440856934, "global_step": 8552, "epoch": 203} {"train_loss": -5.027964115142822, "global_step": 8553, "epoch": 203} {"train_loss": -4.924241065979004, "global_step": 8554, "epoch": 203} {"train_loss": -5.0830841064453125, "global_step": 8555, "epoch": 203} {"train_loss": -4.996517181396484, "global_step": 8556, "epoch": 203} {"train_loss": -4.88118839263916, "global_step": 8557, "epoch": 203} {"train_loss": -4.9216814041137695, "global_step": 8558, "epoch": 203} {"train_loss": -4.985987663269043, "global_step": 8559, "epoch": 203} {"train_loss": -4.986920356750488, "global_step": 8560, "epoch": 203} {"train_loss": -5.013132095336914, "global_step": 8561, "epoch": 203} {"train_loss": -4.949014186859131, "global_step": 8562, "epoch": 203} {"train_loss": -4.964022159576416, "global_step": 8563, "epoch": 203} {"train_loss": -4.8551225662231445, "global_step": 8564, "epoch": 203} {"train_loss": -4.9953765869140625, "global_step": 8565, "epoch": 203} {"train_loss": -5.053739547729492, "global_step": 8566, "epoch": 203} {"train_loss": -4.931838705426171, "global_step": 8567, "epoch": 203, "val_loss": 72251.265625} {"train_loss": -4.939596176147461, "global_step": 8568, "epoch": 204} {"train_loss": -4.9892706871032715, "global_step": 8569, "epoch": 204} {"train_loss": -5.045109748840332, "global_step": 8570, "epoch": 204} {"train_loss": -5.137073516845703, "global_step": 8571, "epoch": 204} {"train_loss": -5.031899929046631, "global_step": 8572, "epoch": 204} {"train_loss": -4.871432304382324, "global_step": 8573, "epoch": 204} {"train_loss": -4.925159931182861, "global_step": 8574, "epoch": 204} {"train_loss": -4.931793212890625, "global_step": 8575, "epoch": 204} {"train_loss": -5.017724990844727, "global_step": 8576, "epoch": 204} {"train_loss": -4.98057746887207, "global_step": 8577, "epoch": 204} {"train_loss": -5.002141952514648, "global_step": 8578, "epoch": 204} {"train_loss": -5.005049705505371, "global_step": 8579, "epoch": 204} {"train_loss": -4.945481300354004, "global_step": 8580, "epoch": 204} {"train_loss": -4.954283714294434, "global_step": 8581, "epoch": 204} {"train_loss": -4.99129581451416, "global_step": 8582, "epoch": 204} {"train_loss": -4.959484100341797, "global_step": 8583, "epoch": 204} {"train_loss": -4.792746543884277, "global_step": 8584, "epoch": 204} {"train_loss": -5.004865646362305, "global_step": 8585, "epoch": 204} {"train_loss": -4.871695518493652, "global_step": 8586, "epoch": 204} {"train_loss": -5.079612731933594, "global_step": 8587, "epoch": 204} {"train_loss": -5.009307384490967, "global_step": 8588, "epoch": 204} {"train_loss": -5.126290321350098, "global_step": 8589, "epoch": 204} {"train_loss": -4.929193019866943, "global_step": 8590, "epoch": 204} {"train_loss": -4.980449199676514, "global_step": 8591, "epoch": 204} {"train_loss": -5.012878894805908, "global_step": 8592, "epoch": 204} {"train_loss": -5.045228958129883, "global_step": 8593, "epoch": 204} {"train_loss": -5.0284013748168945, "global_step": 8594, "epoch": 204} {"train_loss": -5.034409523010254, "global_step": 8595, "epoch": 204} {"train_loss": -5.089848518371582, "global_step": 8596, "epoch": 204} {"train_loss": -5.062492370605469, "global_step": 8597, "epoch": 204} {"train_loss": -4.909157752990723, "global_step": 8598, "epoch": 204} {"train_loss": -4.979204177856445, "global_step": 8599, "epoch": 204} {"train_loss": -4.887216567993164, "global_step": 8600, "epoch": 204} {"train_loss": -4.8479905128479, "global_step": 8601, "epoch": 204} {"train_loss": -4.964299201965332, "global_step": 8602, "epoch": 204} {"train_loss": -4.9832000732421875, "global_step": 8603, "epoch": 204} {"train_loss": -4.984889030456543, "global_step": 8604, "epoch": 204} {"train_loss": -4.782540798187256, "global_step": 8605, "epoch": 204} {"train_loss": -4.84768009185791, "global_step": 8606, "epoch": 204} {"train_loss": -4.8963470458984375, "global_step": 8607, "epoch": 204} {"train_loss": -4.730332374572754, "global_step": 8608, "epoch": 204} {"train_loss": -4.9635670866285055, "global_step": 8609, "epoch": 204, "val_loss": 71989.546875} {"train_loss": -4.987215042114258, "global_step": 8610, "epoch": 205} {"train_loss": -4.729686260223389, "global_step": 8611, "epoch": 205} {"train_loss": -4.892547130584717, "global_step": 8612, "epoch": 205} {"train_loss": -5.029640197753906, "global_step": 8613, "epoch": 205} {"train_loss": -4.947642803192139, "global_step": 8614, "epoch": 205} {"train_loss": -4.9797234535217285, "global_step": 8615, "epoch": 205} {"train_loss": -5.027091979980469, "global_step": 8616, "epoch": 205} {"train_loss": -5.060695648193359, "global_step": 8617, "epoch": 205} {"train_loss": -5.0179338455200195, "global_step": 8618, "epoch": 205} {"train_loss": -5.032921314239502, "global_step": 8619, "epoch": 205} {"train_loss": -5.015726566314697, "global_step": 8620, "epoch": 205} {"train_loss": -4.833386421203613, "global_step": 8621, "epoch": 205} {"train_loss": -4.991680145263672, "global_step": 8622, "epoch": 205} {"train_loss": -5.079993724822998, "global_step": 8623, "epoch": 205} {"train_loss": -4.683509826660156, "global_step": 8624, "epoch": 205} {"train_loss": -4.695441246032715, "global_step": 8625, "epoch": 205} {"train_loss": -4.994080066680908, "global_step": 8626, "epoch": 205} {"train_loss": -4.952030181884766, "global_step": 8627, "epoch": 205} {"train_loss": -4.81925106048584, "global_step": 8628, "epoch": 205} {"train_loss": -4.926434516906738, "global_step": 8629, "epoch": 205} {"train_loss": -4.850327491760254, "global_step": 8630, "epoch": 205} {"train_loss": -4.9557271003723145, "global_step": 8631, "epoch": 205} {"train_loss": -4.862285614013672, "global_step": 8632, "epoch": 205} {"train_loss": -4.974543571472168, "global_step": 8633, "epoch": 205} {"train_loss": -5.0938825607299805, "global_step": 8634, "epoch": 205} {"train_loss": -4.952295303344727, "global_step": 8635, "epoch": 205} {"train_loss": -4.970939636230469, "global_step": 8636, "epoch": 205} {"train_loss": -5.075180530548096, "global_step": 8637, "epoch": 205} {"train_loss": -4.977065086364746, "global_step": 8638, "epoch": 205} {"train_loss": -4.956234931945801, "global_step": 8639, "epoch": 205} {"train_loss": -5.026323318481445, "global_step": 8640, "epoch": 205} {"train_loss": -5.097622871398926, "global_step": 8641, "epoch": 205} {"train_loss": -5.201456069946289, "global_step": 8642, "epoch": 205} {"train_loss": -5.058744430541992, "global_step": 8643, "epoch": 205} {"train_loss": -4.9584784507751465, "global_step": 8644, "epoch": 205} {"train_loss": -5.049393653869629, "global_step": 8645, "epoch": 205} {"train_loss": -5.049201011657715, "global_step": 8646, "epoch": 205} {"train_loss": -4.958370208740234, "global_step": 8647, "epoch": 205} {"train_loss": -5.034013748168945, "global_step": 8648, "epoch": 205} {"train_loss": -4.897253036499023, "global_step": 8649, "epoch": 205} {"train_loss": -4.9771199226379395, "global_step": 8650, "epoch": 205} {"train_loss": -4.967680545080276, "global_step": 8651, "epoch": 205, "val_loss": 72280.9140625} {"train_loss": -4.955214500427246, "global_step": 8652, "epoch": 206} {"train_loss": -5.005911827087402, "global_step": 8653, "epoch": 206} {"train_loss": -5.090520858764648, "global_step": 8654, "epoch": 206} {"train_loss": -5.023896217346191, "global_step": 8655, "epoch": 206} {"train_loss": -5.049555778503418, "global_step": 8656, "epoch": 206} {"train_loss": -5.006404399871826, "global_step": 8657, "epoch": 206} {"train_loss": -4.877419471740723, "global_step": 8658, "epoch": 206} {"train_loss": -4.948869705200195, "global_step": 8659, "epoch": 206} {"train_loss": -4.883687973022461, "global_step": 8660, "epoch": 206} {"train_loss": -4.99057674407959, "global_step": 8661, "epoch": 206} {"train_loss": -5.14183235168457, "global_step": 8662, "epoch": 206} {"train_loss": -5.052993297576904, "global_step": 8663, "epoch": 206} {"train_loss": -5.028876304626465, "global_step": 8664, "epoch": 206} {"train_loss": -5.0368804931640625, "global_step": 8665, "epoch": 206} {"train_loss": -4.992247581481934, "global_step": 8666, "epoch": 206} {"train_loss": -5.138889312744141, "global_step": 8667, "epoch": 206} {"train_loss": -4.910055160522461, "global_step": 8668, "epoch": 206} {"train_loss": -5.036998748779297, "global_step": 8669, "epoch": 206} {"train_loss": -5.020092487335205, "global_step": 8670, "epoch": 206} {"train_loss": -4.9197797775268555, "global_step": 8671, "epoch": 206} {"train_loss": -4.898369789123535, "global_step": 8672, "epoch": 206} {"train_loss": -4.934338569641113, "global_step": 8673, "epoch": 206} {"train_loss": -5.139966011047363, "global_step": 8674, "epoch": 206} {"train_loss": -4.946584701538086, "global_step": 8675, "epoch": 206} {"train_loss": -4.89069128036499, "global_step": 8676, "epoch": 206} {"train_loss": -4.962315559387207, "global_step": 8677, "epoch": 206} {"train_loss": -4.927740573883057, "global_step": 8678, "epoch": 206} {"train_loss": -5.014130592346191, "global_step": 8679, "epoch": 206} {"train_loss": -4.887124061584473, "global_step": 8680, "epoch": 206} {"train_loss": -5.051149368286133, "global_step": 8681, "epoch": 206} {"train_loss": -4.8811774253845215, "global_step": 8682, "epoch": 206} {"train_loss": -5.123151779174805, "global_step": 8683, "epoch": 206} {"train_loss": -5.001936435699463, "global_step": 8684, "epoch": 206} {"train_loss": -5.012248516082764, "global_step": 8685, "epoch": 206} {"train_loss": -4.996175765991211, "global_step": 8686, "epoch": 206} {"train_loss": -4.914775371551514, "global_step": 8687, "epoch": 206} {"train_loss": -5.021078586578369, "global_step": 8688, "epoch": 206} {"train_loss": -5.136772155761719, "global_step": 8689, "epoch": 206} {"train_loss": -5.079685688018799, "global_step": 8690, "epoch": 206} {"train_loss": -4.83380126953125, "global_step": 8691, "epoch": 206} {"train_loss": -4.856070518493652, "global_step": 8692, "epoch": 206} {"train_loss": -4.990082286653065, "global_step": 8693, "epoch": 206, "val_loss": 72363.4453125} {"train_loss": -4.902374744415283, "global_step": 8694, "epoch": 207} {"train_loss": -4.9251909255981445, "global_step": 8695, "epoch": 207} {"train_loss": -5.124260902404785, "global_step": 8696, "epoch": 207} {"train_loss": -5.148294448852539, "global_step": 8697, "epoch": 207} {"train_loss": -4.96299934387207, "global_step": 8698, "epoch": 207} {"train_loss": -5.085318565368652, "global_step": 8699, "epoch": 207} {"train_loss": -4.957155227661133, "global_step": 8700, "epoch": 207} {"train_loss": -4.866433143615723, "global_step": 8701, "epoch": 207} {"train_loss": -5.006035327911377, "global_step": 8702, "epoch": 207} {"train_loss": -4.998203277587891, "global_step": 8703, "epoch": 207} {"train_loss": -4.9380340576171875, "global_step": 8704, "epoch": 207} {"train_loss": -4.984119415283203, "global_step": 8705, "epoch": 207} {"train_loss": -4.931194305419922, "global_step": 8706, "epoch": 207} {"train_loss": -4.865983963012695, "global_step": 8707, "epoch": 207} {"train_loss": -5.052422046661377, "global_step": 8708, "epoch": 207} {"train_loss": -5.047633647918701, "global_step": 8709, "epoch": 207} {"train_loss": -4.984321117401123, "global_step": 8710, "epoch": 207} {"train_loss": -4.925877571105957, "global_step": 8711, "epoch": 207} {"train_loss": -5.151494026184082, "global_step": 8712, "epoch": 207} {"train_loss": -5.0403642654418945, "global_step": 8713, "epoch": 207} {"train_loss": -4.910192966461182, "global_step": 8714, "epoch": 207} {"train_loss": -5.0869035720825195, "global_step": 8715, "epoch": 207} {"train_loss": -5.010683536529541, "global_step": 8716, "epoch": 207} {"train_loss": -4.984506607055664, "global_step": 8717, "epoch": 207} {"train_loss": -4.844332695007324, "global_step": 8718, "epoch": 207} {"train_loss": -4.974542140960693, "global_step": 8719, "epoch": 207} {"train_loss": -4.985696792602539, "global_step": 8720, "epoch": 207} {"train_loss": -4.910300254821777, "global_step": 8721, "epoch": 207} {"train_loss": -4.981931686401367, "global_step": 8722, "epoch": 207} {"train_loss": -5.025095462799072, "global_step": 8723, "epoch": 207} {"train_loss": -5.04988956451416, "global_step": 8724, "epoch": 207} {"train_loss": -4.915505409240723, "global_step": 8725, "epoch": 207} {"train_loss": -4.814388275146484, "global_step": 8726, "epoch": 207} {"train_loss": -4.885499954223633, "global_step": 8727, "epoch": 207} {"train_loss": -5.114210605621338, "global_step": 8728, "epoch": 207} {"train_loss": -5.02801513671875, "global_step": 8729, "epoch": 207} {"train_loss": -5.116693496704102, "global_step": 8730, "epoch": 207} {"train_loss": -4.928361415863037, "global_step": 8731, "epoch": 207} {"train_loss": -5.061866283416748, "global_step": 8732, "epoch": 207} {"train_loss": -5.16651725769043, "global_step": 8733, "epoch": 207} {"train_loss": -5.091853141784668, "global_step": 8734, "epoch": 207} {"train_loss": -4.994328623726254, "global_step": 8735, "epoch": 207, "val_loss": 71950.890625} {"train_loss": -5.029656410217285, "global_step": 8736, "epoch": 208} {"train_loss": -5.022882461547852, "global_step": 8737, "epoch": 208} {"train_loss": -5.031492233276367, "global_step": 8738, "epoch": 208} {"train_loss": -4.828464508056641, "global_step": 8739, "epoch": 208} {"train_loss": -4.847018241882324, "global_step": 8740, "epoch": 208} {"train_loss": -5.083214282989502, "global_step": 8741, "epoch": 208} {"train_loss": -5.063098430633545, "global_step": 8742, "epoch": 208} {"train_loss": -4.893598556518555, "global_step": 8743, "epoch": 208} {"train_loss": -5.002961158752441, "global_step": 8744, "epoch": 208} {"train_loss": -4.8026533126831055, "global_step": 8745, "epoch": 208} {"train_loss": -4.9940690994262695, "global_step": 8746, "epoch": 208} {"train_loss": -4.888259410858154, "global_step": 8747, "epoch": 208} {"train_loss": -4.767669677734375, "global_step": 8748, "epoch": 208} {"train_loss": -5.0536394119262695, "global_step": 8749, "epoch": 208} {"train_loss": -4.993915557861328, "global_step": 8750, "epoch": 208} {"train_loss": -4.8499369621276855, "global_step": 8751, "epoch": 208} {"train_loss": -4.980800628662109, "global_step": 8752, "epoch": 208} {"train_loss": -4.82258415222168, "global_step": 8753, "epoch": 208} {"train_loss": -4.923823833465576, "global_step": 8754, "epoch": 208} {"train_loss": -4.8810577392578125, "global_step": 8755, "epoch": 208} {"train_loss": -4.879631519317627, "global_step": 8756, "epoch": 208} {"train_loss": -4.90801477432251, "global_step": 8757, "epoch": 208} {"train_loss": -5.126235008239746, "global_step": 8758, "epoch": 208} {"train_loss": -4.815247535705566, "global_step": 8759, "epoch": 208} {"train_loss": -4.923061370849609, "global_step": 8760, "epoch": 208} {"train_loss": -4.9463396072387695, "global_step": 8761, "epoch": 208} {"train_loss": -5.035959243774414, "global_step": 8762, "epoch": 208} {"train_loss": -5.00929069519043, "global_step": 8763, "epoch": 208} {"train_loss": -4.955817699432373, "global_step": 8764, "epoch": 208} {"train_loss": -5.01401424407959, "global_step": 8765, "epoch": 208} {"train_loss": -4.952834129333496, "global_step": 8766, "epoch": 208} {"train_loss": -4.782782077789307, "global_step": 8767, "epoch": 208} {"train_loss": -5.067113876342773, "global_step": 8768, "epoch": 208} {"train_loss": -5.008492946624756, "global_step": 8769, "epoch": 208} {"train_loss": -5.087873458862305, "global_step": 8770, "epoch": 208} {"train_loss": -4.999117851257324, "global_step": 8771, "epoch": 208} {"train_loss": -4.864290237426758, "global_step": 8772, "epoch": 208} {"train_loss": -5.068671703338623, "global_step": 8773, "epoch": 208} {"train_loss": -4.9057769775390625, "global_step": 8774, "epoch": 208} {"train_loss": -4.847481727600098, "global_step": 8775, "epoch": 208} {"train_loss": -4.8796467781066895, "global_step": 8776, "epoch": 208} {"train_loss": -4.947030635107131, "global_step": 8777, "epoch": 208, "val_loss": 72657.234375} {"train_loss": -4.982538223266602, "global_step": 8778, "epoch": 209} {"train_loss": -4.841617107391357, "global_step": 8779, "epoch": 209} {"train_loss": -4.867744445800781, "global_step": 8780, "epoch": 209} {"train_loss": -4.944110870361328, "global_step": 8781, "epoch": 209} {"train_loss": -5.082424163818359, "global_step": 8782, "epoch": 209} {"train_loss": -4.9789934158325195, "global_step": 8783, "epoch": 209} {"train_loss": -4.910432815551758, "global_step": 8784, "epoch": 209} {"train_loss": -5.126716613769531, "global_step": 8785, "epoch": 209} {"train_loss": -4.9108357429504395, "global_step": 8786, "epoch": 209} {"train_loss": -4.935574054718018, "global_step": 8787, "epoch": 209} {"train_loss": -4.984121322631836, "global_step": 8788, "epoch": 209} {"train_loss": -4.953858375549316, "global_step": 8789, "epoch": 209} {"train_loss": -4.983035087585449, "global_step": 8790, "epoch": 209} {"train_loss": -5.144417762756348, "global_step": 8791, "epoch": 209} {"train_loss": -5.130537986755371, "global_step": 8792, "epoch": 209} {"train_loss": -4.952852725982666, "global_step": 8793, "epoch": 209} {"train_loss": -4.937051773071289, "global_step": 8794, "epoch": 209} {"train_loss": -5.009678363800049, "global_step": 8795, "epoch": 209} {"train_loss": -5.086029052734375, "global_step": 8796, "epoch": 209} {"train_loss": -5.024919509887695, "global_step": 8797, "epoch": 209} {"train_loss": -5.016049385070801, "global_step": 8798, "epoch": 209} {"train_loss": -4.941781997680664, "global_step": 8799, "epoch": 209} {"train_loss": -5.054096221923828, "global_step": 8800, "epoch": 209} {"train_loss": -4.908593654632568, "global_step": 8801, "epoch": 209} {"train_loss": -4.996215343475342, "global_step": 8802, "epoch": 209} {"train_loss": -5.07705020904541, "global_step": 8803, "epoch": 209} {"train_loss": -4.937736988067627, "global_step": 8804, "epoch": 209} {"train_loss": -4.956061840057373, "global_step": 8805, "epoch": 209} {"train_loss": -4.9572858810424805, "global_step": 8806, "epoch": 209} {"train_loss": -5.049264430999756, "global_step": 8807, "epoch": 209} {"train_loss": -4.742077350616455, "global_step": 8808, "epoch": 209} {"train_loss": -5.091078758239746, "global_step": 8809, "epoch": 209} {"train_loss": -5.154253005981445, "global_step": 8810, "epoch": 209} {"train_loss": -4.818281173706055, "global_step": 8811, "epoch": 209} {"train_loss": -4.802840232849121, "global_step": 8812, "epoch": 209} {"train_loss": -4.995628833770752, "global_step": 8813, "epoch": 209} {"train_loss": -4.924828052520752, "global_step": 8814, "epoch": 209} {"train_loss": -4.988982200622559, "global_step": 8815, "epoch": 209} {"train_loss": -5.109353065490723, "global_step": 8816, "epoch": 209} {"train_loss": -4.842922687530518, "global_step": 8817, "epoch": 209} {"train_loss": -5.013252258300781, "global_step": 8818, "epoch": 209} {"train_loss": -4.980705352056594, "global_step": 8819, "epoch": 209, "val_loss": 72162.7421875} {"train_loss": -4.941436767578125, "global_step": 8820, "epoch": 210} {"train_loss": -5.017281532287598, "global_step": 8821, "epoch": 210} {"train_loss": -5.169004440307617, "global_step": 8822, "epoch": 210} {"train_loss": -5.039872169494629, "global_step": 8823, "epoch": 210} {"train_loss": -5.006134033203125, "global_step": 8824, "epoch": 210} {"train_loss": -5.123418807983398, "global_step": 8825, "epoch": 210} {"train_loss": -5.006312370300293, "global_step": 8826, "epoch": 210} {"train_loss": -4.9571685791015625, "global_step": 8827, "epoch": 210} {"train_loss": -4.947998046875, "global_step": 8828, "epoch": 210} {"train_loss": -4.952062129974365, "global_step": 8829, "epoch": 210} {"train_loss": -4.885106563568115, "global_step": 8830, "epoch": 210} {"train_loss": -5.094346046447754, "global_step": 8831, "epoch": 210} {"train_loss": -5.14674186706543, "global_step": 8832, "epoch": 210} {"train_loss": -4.978271007537842, "global_step": 8833, "epoch": 210} {"train_loss": -4.904049873352051, "global_step": 8834, "epoch": 210} {"train_loss": -5.02584981918335, "global_step": 8835, "epoch": 210} {"train_loss": -5.0159010887146, "global_step": 8836, "epoch": 210} {"train_loss": -4.990331172943115, "global_step": 8837, "epoch": 210} {"train_loss": -4.872516632080078, "global_step": 8838, "epoch": 210} {"train_loss": -5.049708843231201, "global_step": 8839, "epoch": 210} {"train_loss": -5.002232551574707, "global_step": 8840, "epoch": 210} {"train_loss": -4.961948394775391, "global_step": 8841, "epoch": 210} {"train_loss": -4.90022087097168, "global_step": 8842, "epoch": 210} {"train_loss": -5.0010786056518555, "global_step": 8843, "epoch": 210} {"train_loss": -4.964052677154541, "global_step": 8844, "epoch": 210} {"train_loss": -4.967165470123291, "global_step": 8845, "epoch": 210} {"train_loss": -4.879880905151367, "global_step": 8846, "epoch": 210} {"train_loss": -5.081432342529297, "global_step": 8847, "epoch": 210} {"train_loss": -4.946402072906494, "global_step": 8848, "epoch": 210} {"train_loss": -5.044111728668213, "global_step": 8849, "epoch": 210} {"train_loss": -5.089998245239258, "global_step": 8850, "epoch": 210} {"train_loss": -5.030291557312012, "global_step": 8851, "epoch": 210} {"train_loss": -5.074063301086426, "global_step": 8852, "epoch": 210} {"train_loss": -5.054030418395996, "global_step": 8853, "epoch": 210} {"train_loss": -5.051409721374512, "global_step": 8854, "epoch": 210} {"train_loss": -4.951287269592285, "global_step": 8855, "epoch": 210} {"train_loss": -5.013789176940918, "global_step": 8856, "epoch": 210} {"train_loss": -5.035702705383301, "global_step": 8857, "epoch": 210} {"train_loss": -5.068955898284912, "global_step": 8858, "epoch": 210} {"train_loss": -5.008544921875, "global_step": 8859, "epoch": 210} {"train_loss": -4.880702018737793, "global_step": 8860, "epoch": 210} {"train_loss": -5.004495995385306, "global_step": 8861, "epoch": 210, "val_loss": 71302.3203125} {"train_loss": -5.037751197814941, "global_step": 8862, "epoch": 211} {"train_loss": -5.132754802703857, "global_step": 8863, "epoch": 211} {"train_loss": -5.003514289855957, "global_step": 8864, "epoch": 211} {"train_loss": -5.014190673828125, "global_step": 8865, "epoch": 211} {"train_loss": -5.032785415649414, "global_step": 8866, "epoch": 211} {"train_loss": -4.852934837341309, "global_step": 8867, "epoch": 211} {"train_loss": -4.976806640625, "global_step": 8868, "epoch": 211} {"train_loss": -4.931318283081055, "global_step": 8869, "epoch": 211} {"train_loss": -4.878720283508301, "global_step": 8870, "epoch": 211} {"train_loss": -5.076989650726318, "global_step": 8871, "epoch": 211} {"train_loss": -4.911759376525879, "global_step": 8872, "epoch": 211} {"train_loss": -5.1034770011901855, "global_step": 8873, "epoch": 211} {"train_loss": -5.023751735687256, "global_step": 8874, "epoch": 211} {"train_loss": -5.063966751098633, "global_step": 8875, "epoch": 211} {"train_loss": -5.03291654586792, "global_step": 8876, "epoch": 211} {"train_loss": -4.813568115234375, "global_step": 8877, "epoch": 211} {"train_loss": -4.902400970458984, "global_step": 8878, "epoch": 211} {"train_loss": -4.959861755371094, "global_step": 8879, "epoch": 211} {"train_loss": -4.951343536376953, "global_step": 8880, "epoch": 211} {"train_loss": -4.743317604064941, "global_step": 8881, "epoch": 211} {"train_loss": -5.0398759841918945, "global_step": 8882, "epoch": 211} {"train_loss": -4.81221866607666, "global_step": 8883, "epoch": 211} {"train_loss": -4.99647331237793, "global_step": 8884, "epoch": 211} {"train_loss": -5.132555961608887, "global_step": 8885, "epoch": 211} {"train_loss": -4.939646244049072, "global_step": 8886, "epoch": 211} {"train_loss": -4.852418899536133, "global_step": 8887, "epoch": 211} {"train_loss": -5.12175178527832, "global_step": 8888, "epoch": 211} {"train_loss": -5.101903438568115, "global_step": 8889, "epoch": 211} {"train_loss": -5.028646469116211, "global_step": 8890, "epoch": 211} {"train_loss": -5.072488784790039, "global_step": 8891, "epoch": 211} {"train_loss": -5.000668525695801, "global_step": 8892, "epoch": 211} {"train_loss": -5.0205078125, "global_step": 8893, "epoch": 211} {"train_loss": -5.019124984741211, "global_step": 8894, "epoch": 211} {"train_loss": -4.876533508300781, "global_step": 8895, "epoch": 211} {"train_loss": -4.9923095703125, "global_step": 8896, "epoch": 211} {"train_loss": -4.963137626647949, "global_step": 8897, "epoch": 211} {"train_loss": -5.0424652099609375, "global_step": 8898, "epoch": 211} {"train_loss": -5.04099702835083, "global_step": 8899, "epoch": 211} {"train_loss": -5.006543159484863, "global_step": 8900, "epoch": 211} {"train_loss": -5.036499977111816, "global_step": 8901, "epoch": 211} {"train_loss": -4.981935977935791, "global_step": 8902, "epoch": 211} {"train_loss": -4.99070786294483, "global_step": 8903, "epoch": 211, "val_loss": 71575.609375} {"train_loss": -5.066520690917969, "global_step": 8904, "epoch": 212} {"train_loss": -5.125982284545898, "global_step": 8905, "epoch": 212} {"train_loss": -5.046271324157715, "global_step": 8906, "epoch": 212} {"train_loss": -4.903072357177734, "global_step": 8907, "epoch": 212} {"train_loss": -4.907491683959961, "global_step": 8908, "epoch": 212} {"train_loss": -5.026221752166748, "global_step": 8909, "epoch": 212} {"train_loss": -5.051652908325195, "global_step": 8910, "epoch": 212} {"train_loss": -4.9582037925720215, "global_step": 8911, "epoch": 212} {"train_loss": -5.060150146484375, "global_step": 8912, "epoch": 212} {"train_loss": -4.9404096603393555, "global_step": 8913, "epoch": 212} {"train_loss": -4.987393379211426, "global_step": 8914, "epoch": 212} {"train_loss": -4.930408000946045, "global_step": 8915, "epoch": 212} {"train_loss": -5.033013820648193, "global_step": 8916, "epoch": 212} {"train_loss": -4.979388236999512, "global_step": 8917, "epoch": 212} {"train_loss": -5.021574020385742, "global_step": 8918, "epoch": 212} {"train_loss": -4.94771671295166, "global_step": 8919, "epoch": 212} {"train_loss": -4.935951232910156, "global_step": 8920, "epoch": 212} {"train_loss": -5.03764533996582, "global_step": 8921, "epoch": 212} {"train_loss": -5.055559158325195, "global_step": 8922, "epoch": 212} {"train_loss": -5.126277446746826, "global_step": 8923, "epoch": 212} {"train_loss": -4.9001545906066895, "global_step": 8924, "epoch": 212} {"train_loss": -5.072254657745361, "global_step": 8925, "epoch": 212} {"train_loss": -5.103425979614258, "global_step": 8926, "epoch": 212} {"train_loss": -5.056258201599121, "global_step": 8927, "epoch": 212} {"train_loss": -5.004478931427002, "global_step": 8928, "epoch": 212} {"train_loss": -5.092110633850098, "global_step": 8929, "epoch": 212} {"train_loss": -5.092151165008545, "global_step": 8930, "epoch": 212} {"train_loss": -5.097057342529297, "global_step": 8931, "epoch": 212} {"train_loss": -5.179405212402344, "global_step": 8932, "epoch": 212} {"train_loss": -5.043079853057861, "global_step": 8933, "epoch": 212} {"train_loss": -4.969633102416992, "global_step": 8934, "epoch": 212} {"train_loss": -5.018074035644531, "global_step": 8935, "epoch": 212} {"train_loss": -4.948948860168457, "global_step": 8936, "epoch": 212} {"train_loss": -4.8519287109375, "global_step": 8937, "epoch": 212} {"train_loss": -4.922351360321045, "global_step": 8938, "epoch": 212} {"train_loss": -5.0734663009643555, "global_step": 8939, "epoch": 212} {"train_loss": -5.048784255981445, "global_step": 8940, "epoch": 212} {"train_loss": -5.016631126403809, "global_step": 8941, "epoch": 212} {"train_loss": -5.043242454528809, "global_step": 8942, "epoch": 212} {"train_loss": -5.0390706062316895, "global_step": 8943, "epoch": 212} {"train_loss": -5.1604509353637695, "global_step": 8944, "epoch": 212} {"train_loss": -5.017796164467221, "global_step": 8945, "epoch": 212, "val_loss": 71551.3828125} {"train_loss": -4.957901954650879, "global_step": 8946, "epoch": 213} {"train_loss": -5.003411769866943, "global_step": 8947, "epoch": 213} {"train_loss": -5.047049522399902, "global_step": 8948, "epoch": 213} {"train_loss": -4.934877872467041, "global_step": 8949, "epoch": 213} {"train_loss": -4.860948085784912, "global_step": 8950, "epoch": 213} {"train_loss": -4.900754928588867, "global_step": 8951, "epoch": 213} {"train_loss": -5.130659580230713, "global_step": 8952, "epoch": 213} {"train_loss": -5.073171615600586, "global_step": 8953, "epoch": 213} {"train_loss": -5.013711452484131, "global_step": 8954, "epoch": 213} {"train_loss": -5.052530765533447, "global_step": 8955, "epoch": 213} {"train_loss": -4.823624134063721, "global_step": 8956, "epoch": 213} {"train_loss": -4.976736068725586, "global_step": 8957, "epoch": 213} {"train_loss": -4.8518595695495605, "global_step": 8958, "epoch": 213} {"train_loss": -4.687741756439209, "global_step": 8959, "epoch": 213} {"train_loss": -4.987242221832275, "global_step": 8960, "epoch": 213} {"train_loss": -4.810355186462402, "global_step": 8961, "epoch": 213} {"train_loss": -5.044497489929199, "global_step": 8962, "epoch": 213} {"train_loss": -4.974809646606445, "global_step": 8963, "epoch": 213} {"train_loss": -4.930011749267578, "global_step": 8964, "epoch": 213} {"train_loss": -5.013293266296387, "global_step": 8965, "epoch": 213} {"train_loss": -5.029781818389893, "global_step": 8966, "epoch": 213} {"train_loss": -4.93310546875, "global_step": 8967, "epoch": 213} {"train_loss": -4.9140214920043945, "global_step": 8968, "epoch": 213} {"train_loss": -4.9517621994018555, "global_step": 8969, "epoch": 213} {"train_loss": -4.814758777618408, "global_step": 8970, "epoch": 213} {"train_loss": -5.02994441986084, "global_step": 8971, "epoch": 213} {"train_loss": -5.007033348083496, "global_step": 8972, "epoch": 213} {"train_loss": -5.175894260406494, "global_step": 8973, "epoch": 213} {"train_loss": -5.07530403137207, "global_step": 8974, "epoch": 213} {"train_loss": -5.033204555511475, "global_step": 8975, "epoch": 213} {"train_loss": -5.0289177894592285, "global_step": 8976, "epoch": 213} {"train_loss": -4.923239707946777, "global_step": 8977, "epoch": 213} {"train_loss": -5.001978874206543, "global_step": 8978, "epoch": 213} {"train_loss": -4.9530181884765625, "global_step": 8979, "epoch": 213} {"train_loss": -5.016835689544678, "global_step": 8980, "epoch": 213} {"train_loss": -4.943308353424072, "global_step": 8981, "epoch": 213} {"train_loss": -5.0277910232543945, "global_step": 8982, "epoch": 213} {"train_loss": -5.10013484954834, "global_step": 8983, "epoch": 213} {"train_loss": -4.907740116119385, "global_step": 8984, "epoch": 213} {"train_loss": -5.04872989654541, "global_step": 8985, "epoch": 213} {"train_loss": -5.105747699737549, "global_step": 8986, "epoch": 213} {"train_loss": -4.9779349735804965, "global_step": 8987, "epoch": 213, "val_loss": 71759.8515625} {"train_loss": -5.03314208984375, "global_step": 8988, "epoch": 214} {"train_loss": -5.124131679534912, "global_step": 8989, "epoch": 214} {"train_loss": -5.101057052612305, "global_step": 8990, "epoch": 214} {"train_loss": -4.965610027313232, "global_step": 8991, "epoch": 214} {"train_loss": -4.996403694152832, "global_step": 8992, "epoch": 214} {"train_loss": -4.893106460571289, "global_step": 8993, "epoch": 214} {"train_loss": -5.150794982910156, "global_step": 8994, "epoch": 214} {"train_loss": -4.974175453186035, "global_step": 8995, "epoch": 214} {"train_loss": -4.995368003845215, "global_step": 8996, "epoch": 214} {"train_loss": -5.065016269683838, "global_step": 8997, "epoch": 214} {"train_loss": -5.284693717956543, "global_step": 8998, "epoch": 214} {"train_loss": -5.1361799240112305, "global_step": 8999, "epoch": 214} {"train_loss": -4.911334037780762, "global_step": 9000, "epoch": 214} {"train_loss": -5.063478469848633, "global_step": 9001, "epoch": 214} {"train_loss": -5.080201148986816, "global_step": 9002, "epoch": 214} {"train_loss": -5.176666259765625, "global_step": 9003, "epoch": 214} {"train_loss": -4.901784896850586, "global_step": 9004, "epoch": 214} {"train_loss": -4.774934768676758, "global_step": 9005, "epoch": 214} {"train_loss": -5.025661945343018, "global_step": 9006, "epoch": 214} {"train_loss": -5.01041316986084, "global_step": 9007, "epoch": 214} {"train_loss": -4.960205078125, "global_step": 9008, "epoch": 214} {"train_loss": -4.8479814529418945, "global_step": 9009, "epoch": 214} {"train_loss": -4.885985851287842, "global_step": 9010, "epoch": 214} {"train_loss": -4.937484264373779, "global_step": 9011, "epoch": 214} {"train_loss": -4.982398986816406, "global_step": 9012, "epoch": 214} {"train_loss": -4.999457359313965, "global_step": 9013, "epoch": 214} {"train_loss": -4.922947883605957, "global_step": 9014, "epoch": 214} {"train_loss": -5.050107955932617, "global_step": 9015, "epoch": 214} {"train_loss": -5.009088516235352, "global_step": 9016, "epoch": 214} {"train_loss": -4.959973335266113, "global_step": 9017, "epoch": 214} {"train_loss": -4.927111625671387, "global_step": 9018, "epoch": 214} {"train_loss": -5.028358459472656, "global_step": 9019, "epoch": 214} {"train_loss": -4.929244518280029, "global_step": 9020, "epoch": 214} {"train_loss": -4.977118492126465, "global_step": 9021, "epoch": 214} {"train_loss": -4.8625335693359375, "global_step": 9022, "epoch": 214} {"train_loss": -4.796882629394531, "global_step": 9023, "epoch": 214} {"train_loss": -4.8438825607299805, "global_step": 9024, "epoch": 214} {"train_loss": -4.884488582611084, "global_step": 9025, "epoch": 214} {"train_loss": -5.131444931030273, "global_step": 9026, "epoch": 214} {"train_loss": -5.020223140716553, "global_step": 9027, "epoch": 214} {"train_loss": -5.003002166748047, "global_step": 9028, "epoch": 214} {"train_loss": -4.990435668400356, "global_step": 9029, "epoch": 214, "val_loss": 71457.328125} {"train_loss": -5.07673454284668, "global_step": 9030, "epoch": 215} {"train_loss": -5.03564453125, "global_step": 9031, "epoch": 215} {"train_loss": -4.976601600646973, "global_step": 9032, "epoch": 215} {"train_loss": -5.06001091003418, "global_step": 9033, "epoch": 215} {"train_loss": -4.9486083984375, "global_step": 9034, "epoch": 215} {"train_loss": -5.188272476196289, "global_step": 9035, "epoch": 215} {"train_loss": -5.1157050132751465, "global_step": 9036, "epoch": 215} {"train_loss": -4.814352512359619, "global_step": 9037, "epoch": 215} {"train_loss": -5.062891483306885, "global_step": 9038, "epoch": 215} {"train_loss": -4.991724014282227, "global_step": 9039, "epoch": 215} {"train_loss": -4.815293312072754, "global_step": 9040, "epoch": 215} {"train_loss": -4.993434429168701, "global_step": 9041, "epoch": 215} {"train_loss": -5.037178993225098, "global_step": 9042, "epoch": 215} {"train_loss": -5.101131439208984, "global_step": 9043, "epoch": 215} {"train_loss": -5.0525383949279785, "global_step": 9044, "epoch": 215} {"train_loss": -5.000105381011963, "global_step": 9045, "epoch": 215} {"train_loss": -4.955018043518066, "global_step": 9046, "epoch": 215} {"train_loss": -5.079573631286621, "global_step": 9047, "epoch": 215} {"train_loss": -5.0506768226623535, "global_step": 9048, "epoch": 215} {"train_loss": -4.938323974609375, "global_step": 9049, "epoch": 215} {"train_loss": -5.033646583557129, "global_step": 9050, "epoch": 215} {"train_loss": -5.085613250732422, "global_step": 9051, "epoch": 215} {"train_loss": -5.019824981689453, "global_step": 9052, "epoch": 215} {"train_loss": -5.057614326477051, "global_step": 9053, "epoch": 215} {"train_loss": -5.026858329772949, "global_step": 9054, "epoch": 215} {"train_loss": -4.967487335205078, "global_step": 9055, "epoch": 215} {"train_loss": -4.996683120727539, "global_step": 9056, "epoch": 215} {"train_loss": -5.013175964355469, "global_step": 9057, "epoch": 215} {"train_loss": -5.011354446411133, "global_step": 9058, "epoch": 215} {"train_loss": -5.0504560470581055, "global_step": 9059, "epoch": 215} {"train_loss": -5.048044681549072, "global_step": 9060, "epoch": 215} {"train_loss": -4.995274543762207, "global_step": 9061, "epoch": 215} {"train_loss": -4.992650985717773, "global_step": 9062, "epoch": 215} {"train_loss": -4.991985321044922, "global_step": 9063, "epoch": 215} {"train_loss": -5.015102386474609, "global_step": 9064, "epoch": 215} {"train_loss": -5.125760078430176, "global_step": 9065, "epoch": 215} {"train_loss": -5.037884712219238, "global_step": 9066, "epoch": 215} {"train_loss": -5.103412628173828, "global_step": 9067, "epoch": 215} {"train_loss": -5.03082799911499, "global_step": 9068, "epoch": 215} {"train_loss": -4.790833473205566, "global_step": 9069, "epoch": 215} {"train_loss": -5.137183666229248, "global_step": 9070, "epoch": 215} {"train_loss": -5.019028425216675, "global_step": 9071, "epoch": 215, "val_loss": 71243.7421875} {"train_loss": -4.975822448730469, "global_step": 9072, "epoch": 216} {"train_loss": -5.05962610244751, "global_step": 9073, "epoch": 216} {"train_loss": -4.900744915008545, "global_step": 9074, "epoch": 216} {"train_loss": -5.038270473480225, "global_step": 9075, "epoch": 216} {"train_loss": -5.069967269897461, "global_step": 9076, "epoch": 216} {"train_loss": -5.025487899780273, "global_step": 9077, "epoch": 216} {"train_loss": -5.065851211547852, "global_step": 9078, "epoch": 216} {"train_loss": -4.901562690734863, "global_step": 9079, "epoch": 216} {"train_loss": -5.0321760177612305, "global_step": 9080, "epoch": 216} {"train_loss": -5.049999713897705, "global_step": 9081, "epoch": 216} {"train_loss": -4.940268039703369, "global_step": 9082, "epoch": 216} {"train_loss": -4.940810203552246, "global_step": 9083, "epoch": 216} {"train_loss": -4.884834289550781, "global_step": 9084, "epoch": 216} {"train_loss": -5.023797988891602, "global_step": 9085, "epoch": 216} {"train_loss": -5.064098834991455, "global_step": 9086, "epoch": 216} {"train_loss": -5.123559474945068, "global_step": 9087, "epoch": 216} {"train_loss": -4.898690223693848, "global_step": 9088, "epoch": 216} {"train_loss": -4.983214378356934, "global_step": 9089, "epoch": 216} {"train_loss": -4.8520636558532715, "global_step": 9090, "epoch": 216} {"train_loss": -5.06210470199585, "global_step": 9091, "epoch": 216} {"train_loss": -5.086913585662842, "global_step": 9092, "epoch": 216} {"train_loss": -4.945928573608398, "global_step": 9093, "epoch": 216} {"train_loss": -5.022351264953613, "global_step": 9094, "epoch": 216} {"train_loss": -4.9569549560546875, "global_step": 9095, "epoch": 216} {"train_loss": -5.057133197784424, "global_step": 9096, "epoch": 216} {"train_loss": -4.8829665184021, "global_step": 9097, "epoch": 216} {"train_loss": -4.823169708251953, "global_step": 9098, "epoch": 216} {"train_loss": -5.133032321929932, "global_step": 9099, "epoch": 216} {"train_loss": -5.006036758422852, "global_step": 9100, "epoch": 216} {"train_loss": -5.017404556274414, "global_step": 9101, "epoch": 216} {"train_loss": -5.002291679382324, "global_step": 9102, "epoch": 216} {"train_loss": -4.97603178024292, "global_step": 9103, "epoch": 216} {"train_loss": -5.082205772399902, "global_step": 9104, "epoch": 216} {"train_loss": -4.939247131347656, "global_step": 9105, "epoch": 216} {"train_loss": -4.983593463897705, "global_step": 9106, "epoch": 216} {"train_loss": -4.998135566711426, "global_step": 9107, "epoch": 216} {"train_loss": -4.933424472808838, "global_step": 9108, "epoch": 216} {"train_loss": -5.264185905456543, "global_step": 9109, "epoch": 216} {"train_loss": -5.125218391418457, "global_step": 9110, "epoch": 216} {"train_loss": -4.798038959503174, "global_step": 9111, "epoch": 216} {"train_loss": -4.950014591217041, "global_step": 9112, "epoch": 216} {"train_loss": -4.997270470573788, "global_step": 9113, "epoch": 216, "val_loss": 71755.6796875} {"train_loss": -4.968591690063477, "global_step": 9114, "epoch": 217} {"train_loss": -4.974784851074219, "global_step": 9115, "epoch": 217} {"train_loss": -5.020673751831055, "global_step": 9116, "epoch": 217} {"train_loss": -4.989671230316162, "global_step": 9117, "epoch": 217} {"train_loss": -5.0901780128479, "global_step": 9118, "epoch": 217} {"train_loss": -5.022464752197266, "global_step": 9119, "epoch": 217} {"train_loss": -4.995077133178711, "global_step": 9120, "epoch": 217} {"train_loss": -4.896784782409668, "global_step": 9121, "epoch": 217} {"train_loss": -5.138293266296387, "global_step": 9122, "epoch": 217} {"train_loss": -5.066473960876465, "global_step": 9123, "epoch": 217} {"train_loss": -4.974869728088379, "global_step": 9124, "epoch": 217} {"train_loss": -5.083289623260498, "global_step": 9125, "epoch": 217} {"train_loss": -4.978118896484375, "global_step": 9126, "epoch": 217} {"train_loss": -5.064591407775879, "global_step": 9127, "epoch": 217} {"train_loss": -4.962206840515137, "global_step": 9128, "epoch": 217} {"train_loss": -5.076297760009766, "global_step": 9129, "epoch": 217} {"train_loss": -4.912213325500488, "global_step": 9130, "epoch": 217} {"train_loss": -5.059114933013916, "global_step": 9131, "epoch": 217} {"train_loss": -5.013797283172607, "global_step": 9132, "epoch": 217} {"train_loss": -4.875250816345215, "global_step": 9133, "epoch": 217} {"train_loss": -5.032019138336182, "global_step": 9134, "epoch": 217} {"train_loss": -5.026505470275879, "global_step": 9135, "epoch": 217} {"train_loss": -4.75043249130249, "global_step": 9136, "epoch": 217} {"train_loss": -4.8351263999938965, "global_step": 9137, "epoch": 217} {"train_loss": -5.072755336761475, "global_step": 9138, "epoch": 217} {"train_loss": -5.009960651397705, "global_step": 9139, "epoch": 217} {"train_loss": -4.706412315368652, "global_step": 9140, "epoch": 217} {"train_loss": -5.111321449279785, "global_step": 9141, "epoch": 217} {"train_loss": -4.920614242553711, "global_step": 9142, "epoch": 217} {"train_loss": -4.808328628540039, "global_step": 9143, "epoch": 217} {"train_loss": -4.948101043701172, "global_step": 9144, "epoch": 217} {"train_loss": -4.809403419494629, "global_step": 9145, "epoch": 217} {"train_loss": -4.919960021972656, "global_step": 9146, "epoch": 217} {"train_loss": -4.969377517700195, "global_step": 9147, "epoch": 217} {"train_loss": -4.8393449783325195, "global_step": 9148, "epoch": 217} {"train_loss": -4.872422218322754, "global_step": 9149, "epoch": 217} {"train_loss": -5.0458502769470215, "global_step": 9150, "epoch": 217} {"train_loss": -4.978894233703613, "global_step": 9151, "epoch": 217} {"train_loss": -4.975610733032227, "global_step": 9152, "epoch": 217} {"train_loss": -4.846769332885742, "global_step": 9153, "epoch": 217} {"train_loss": -4.947039604187012, "global_step": 9154, "epoch": 217} {"train_loss": -4.967823073977516, "global_step": 9155, "epoch": 217, "val_loss": 71436.78125} {"train_loss": -4.921953201293945, "global_step": 9156, "epoch": 218} {"train_loss": -4.998323440551758, "global_step": 9157, "epoch": 218} {"train_loss": -4.922974109649658, "global_step": 9158, "epoch": 218} {"train_loss": -5.136334419250488, "global_step": 9159, "epoch": 218} {"train_loss": -5.11140251159668, "global_step": 9160, "epoch": 218} {"train_loss": -5.002655029296875, "global_step": 9161, "epoch": 218} {"train_loss": -5.0857768058776855, "global_step": 9162, "epoch": 218} {"train_loss": -5.049934387207031, "global_step": 9163, "epoch": 218} {"train_loss": -4.967041015625, "global_step": 9164, "epoch": 218} {"train_loss": -4.926353454589844, "global_step": 9165, "epoch": 218} {"train_loss": -4.898224830627441, "global_step": 9166, "epoch": 218} {"train_loss": -5.213484287261963, "global_step": 9167, "epoch": 218} {"train_loss": -4.972973823547363, "global_step": 9168, "epoch": 218} {"train_loss": -5.015508651733398, "global_step": 9169, "epoch": 218} {"train_loss": -5.1089558601379395, "global_step": 9170, "epoch": 218} {"train_loss": -4.874809265136719, "global_step": 9171, "epoch": 218} {"train_loss": -4.765810966491699, "global_step": 9172, "epoch": 218} {"train_loss": -5.028189182281494, "global_step": 9173, "epoch": 218} {"train_loss": -5.055461406707764, "global_step": 9174, "epoch": 218} {"train_loss": -4.968457221984863, "global_step": 9175, "epoch": 218} {"train_loss": -5.035734176635742, "global_step": 9176, "epoch": 218} {"train_loss": -5.14101505279541, "global_step": 9177, "epoch": 218} {"train_loss": -4.872946739196777, "global_step": 9178, "epoch": 218} {"train_loss": -5.016977310180664, "global_step": 9179, "epoch": 218} {"train_loss": -5.085992336273193, "global_step": 9180, "epoch": 218} {"train_loss": -5.035956382751465, "global_step": 9181, "epoch": 218} {"train_loss": -4.889102935791016, "global_step": 9182, "epoch": 218} {"train_loss": -5.035637855529785, "global_step": 9183, "epoch": 218} {"train_loss": -4.907873630523682, "global_step": 9184, "epoch": 218} {"train_loss": -5.013948440551758, "global_step": 9185, "epoch": 218} {"train_loss": -5.081597328186035, "global_step": 9186, "epoch": 218} {"train_loss": -4.789289951324463, "global_step": 9187, "epoch": 218} {"train_loss": -4.6320037841796875, "global_step": 9188, "epoch": 218} {"train_loss": -5.038805961608887, "global_step": 9189, "epoch": 218} {"train_loss": -4.8807597160339355, "global_step": 9190, "epoch": 218} {"train_loss": -4.765218734741211, "global_step": 9191, "epoch": 218} {"train_loss": -5.032836437225342, "global_step": 9192, "epoch": 218} {"train_loss": -4.856132984161377, "global_step": 9193, "epoch": 218} {"train_loss": -4.940548419952393, "global_step": 9194, "epoch": 218} {"train_loss": -4.977109432220459, "global_step": 9195, "epoch": 218} {"train_loss": -4.836390972137451, "global_step": 9196, "epoch": 218} {"train_loss": -4.9756246748424715, "global_step": 9197, "epoch": 218, "val_loss": 71160.9140625} {"train_loss": -5.07982063293457, "global_step": 9198, "epoch": 219} {"train_loss": -4.889899253845215, "global_step": 9199, "epoch": 219} {"train_loss": -4.963489532470703, "global_step": 9200, "epoch": 219} {"train_loss": -4.995457649230957, "global_step": 9201, "epoch": 219} {"train_loss": -4.847735404968262, "global_step": 9202, "epoch": 219} {"train_loss": -5.085193157196045, "global_step": 9203, "epoch": 219} {"train_loss": -5.014650344848633, "global_step": 9204, "epoch": 219} {"train_loss": -4.87400484085083, "global_step": 9205, "epoch": 219} {"train_loss": -4.932629585266113, "global_step": 9206, "epoch": 219} {"train_loss": -4.921877384185791, "global_step": 9207, "epoch": 219} {"train_loss": -4.966668605804443, "global_step": 9208, "epoch": 219} {"train_loss": -5.018362522125244, "global_step": 9209, "epoch": 219} {"train_loss": -4.941122055053711, "global_step": 9210, "epoch": 219} {"train_loss": -4.916635513305664, "global_step": 9211, "epoch": 219} {"train_loss": -4.940471649169922, "global_step": 9212, "epoch": 219} {"train_loss": -4.974516868591309, "global_step": 9213, "epoch": 219} {"train_loss": -5.016590118408203, "global_step": 9214, "epoch": 219} {"train_loss": -5.074254989624023, "global_step": 9215, "epoch": 219} {"train_loss": -5.074564456939697, "global_step": 9216, "epoch": 219} {"train_loss": -5.094132423400879, "global_step": 9217, "epoch": 219} {"train_loss": -4.919025421142578, "global_step": 9218, "epoch": 219} {"train_loss": -5.092988014221191, "global_step": 9219, "epoch": 219} {"train_loss": -5.117109298706055, "global_step": 9220, "epoch": 219} {"train_loss": -5.1548051834106445, "global_step": 9221, "epoch": 219} {"train_loss": -5.126923561096191, "global_step": 9222, "epoch": 219} {"train_loss": -4.845687389373779, "global_step": 9223, "epoch": 219} {"train_loss": -5.190942764282227, "global_step": 9224, "epoch": 219} {"train_loss": -4.978132247924805, "global_step": 9225, "epoch": 219} {"train_loss": -4.985753536224365, "global_step": 9226, "epoch": 219} {"train_loss": -5.182898998260498, "global_step": 9227, "epoch": 219} {"train_loss": -4.934945106506348, "global_step": 9228, "epoch": 219} {"train_loss": -4.963564872741699, "global_step": 9229, "epoch": 219} {"train_loss": -5.04276180267334, "global_step": 9230, "epoch": 219} {"train_loss": -4.791682243347168, "global_step": 9231, "epoch": 219} {"train_loss": -5.088414669036865, "global_step": 9232, "epoch": 219} {"train_loss": -5.055700302124023, "global_step": 9233, "epoch": 219} {"train_loss": -4.954841613769531, "global_step": 9234, "epoch": 219} {"train_loss": -4.9108052253723145, "global_step": 9235, "epoch": 219} {"train_loss": -5.021125793457031, "global_step": 9236, "epoch": 219} {"train_loss": -4.937010765075684, "global_step": 9237, "epoch": 219} {"train_loss": -5.050431251525879, "global_step": 9238, "epoch": 219} {"train_loss": -4.997392018636067, "global_step": 9239, "epoch": 219, "val_loss": 71586.3515625} {"train_loss": -5.009951591491699, "global_step": 9240, "epoch": 220} {"train_loss": -4.939873218536377, "global_step": 9241, "epoch": 220} {"train_loss": -4.972261428833008, "global_step": 9242, "epoch": 220} {"train_loss": -5.058262825012207, "global_step": 9243, "epoch": 220} {"train_loss": -4.9565887451171875, "global_step": 9244, "epoch": 220} {"train_loss": -5.136686325073242, "global_step": 9245, "epoch": 220} {"train_loss": -5.067112922668457, "global_step": 9246, "epoch": 220} {"train_loss": -5.005587577819824, "global_step": 9247, "epoch": 220} {"train_loss": -4.980252265930176, "global_step": 9248, "epoch": 220} {"train_loss": -5.029961585998535, "global_step": 9249, "epoch": 220} {"train_loss": -4.947617053985596, "global_step": 9250, "epoch": 220} {"train_loss": -5.058740615844727, "global_step": 9251, "epoch": 220} {"train_loss": -4.97526741027832, "global_step": 9252, "epoch": 220} {"train_loss": -4.8729352951049805, "global_step": 9253, "epoch": 220} {"train_loss": -4.973360061645508, "global_step": 9254, "epoch": 220} {"train_loss": -5.03348445892334, "global_step": 9255, "epoch": 220} {"train_loss": -5.038583755493164, "global_step": 9256, "epoch": 220} {"train_loss": -5.12396240234375, "global_step": 9257, "epoch": 220} {"train_loss": -5.055637359619141, "global_step": 9258, "epoch": 220} {"train_loss": -4.937047004699707, "global_step": 9259, "epoch": 220} {"train_loss": -5.105199337005615, "global_step": 9260, "epoch": 220} {"train_loss": -4.989931106567383, "global_step": 9261, "epoch": 220} {"train_loss": -4.949419021606445, "global_step": 9262, "epoch": 220} {"train_loss": -5.1344757080078125, "global_step": 9263, "epoch": 220} {"train_loss": -5.171597957611084, "global_step": 9264, "epoch": 220} {"train_loss": -4.991612911224365, "global_step": 9265, "epoch": 220} {"train_loss": -4.973381996154785, "global_step": 9266, "epoch": 220} {"train_loss": -5.021881580352783, "global_step": 9267, "epoch": 220} {"train_loss": -5.121997833251953, "global_step": 9268, "epoch": 220} {"train_loss": -5.006187438964844, "global_step": 9269, "epoch": 220} {"train_loss": -5.0304765701293945, "global_step": 9270, "epoch": 220} {"train_loss": -5.057929039001465, "global_step": 9271, "epoch": 220} {"train_loss": -5.104767799377441, "global_step": 9272, "epoch": 220} {"train_loss": -5.007530212402344, "global_step": 9273, "epoch": 220} {"train_loss": -5.1172943115234375, "global_step": 9274, "epoch": 220} {"train_loss": -5.090744495391846, "global_step": 9275, "epoch": 220} {"train_loss": -5.028686046600342, "global_step": 9276, "epoch": 220} {"train_loss": -5.15779447555542, "global_step": 9277, "epoch": 220} {"train_loss": -5.085895538330078, "global_step": 9278, "epoch": 220} {"train_loss": -4.9394731521606445, "global_step": 9279, "epoch": 220} {"train_loss": -4.983246326446533, "global_step": 9280, "epoch": 220} {"train_loss": -5.028430530003139, "global_step": 9281, "epoch": 220, "val_loss": 71129.0234375} {"train_loss": -5.0824174880981445, "global_step": 9282, "epoch": 221} {"train_loss": -5.128413677215576, "global_step": 9283, "epoch": 221} {"train_loss": -4.935039520263672, "global_step": 9284, "epoch": 221} {"train_loss": -4.8579254150390625, "global_step": 9285, "epoch": 221} {"train_loss": -4.937770366668701, "global_step": 9286, "epoch": 221} {"train_loss": -5.054458141326904, "global_step": 9287, "epoch": 221} {"train_loss": -5.135928153991699, "global_step": 9288, "epoch": 221} {"train_loss": -4.961606979370117, "global_step": 9289, "epoch": 221} {"train_loss": -5.068312168121338, "global_step": 9290, "epoch": 221} {"train_loss": -5.138584136962891, "global_step": 9291, "epoch": 221} {"train_loss": -4.930271625518799, "global_step": 9292, "epoch": 221} {"train_loss": -4.947765827178955, "global_step": 9293, "epoch": 221} {"train_loss": -5.05581521987915, "global_step": 9294, "epoch": 221} {"train_loss": -5.055322647094727, "global_step": 9295, "epoch": 221} {"train_loss": -5.048544406890869, "global_step": 9296, "epoch": 221} {"train_loss": -5.10838508605957, "global_step": 9297, "epoch": 221} {"train_loss": -4.947327613830566, "global_step": 9298, "epoch": 221} {"train_loss": -5.015637397766113, "global_step": 9299, "epoch": 221} {"train_loss": -5.081827163696289, "global_step": 9300, "epoch": 221} {"train_loss": -5.039494037628174, "global_step": 9301, "epoch": 221} {"train_loss": -4.938945770263672, "global_step": 9302, "epoch": 221} {"train_loss": -4.905368804931641, "global_step": 9303, "epoch": 221} {"train_loss": -5.1422295570373535, "global_step": 9304, "epoch": 221} {"train_loss": -5.013078689575195, "global_step": 9305, "epoch": 221} {"train_loss": -4.77862024307251, "global_step": 9306, "epoch": 221} {"train_loss": -4.938601493835449, "global_step": 9307, "epoch": 221} {"train_loss": -5.023387908935547, "global_step": 9308, "epoch": 221} {"train_loss": -4.774721622467041, "global_step": 9309, "epoch": 221} {"train_loss": -4.776155471801758, "global_step": 9310, "epoch": 221} {"train_loss": -4.955322742462158, "global_step": 9311, "epoch": 221} {"train_loss": -4.917985439300537, "global_step": 9312, "epoch": 221} {"train_loss": -5.003048419952393, "global_step": 9313, "epoch": 221} {"train_loss": -4.818439960479736, "global_step": 9314, "epoch": 221} {"train_loss": -5.057460784912109, "global_step": 9315, "epoch": 221} {"train_loss": -4.915840148925781, "global_step": 9316, "epoch": 221} {"train_loss": -4.890124320983887, "global_step": 9317, "epoch": 221} {"train_loss": -5.016239643096924, "global_step": 9318, "epoch": 221} {"train_loss": -4.874014377593994, "global_step": 9319, "epoch": 221} {"train_loss": -4.990221977233887, "global_step": 9320, "epoch": 221} {"train_loss": -5.018073558807373, "global_step": 9321, "epoch": 221} {"train_loss": -5.041778564453125, "global_step": 9322, "epoch": 221} {"train_loss": -4.985599631354923, "global_step": 9323, "epoch": 221, "val_loss": 70715.890625} {"train_loss": -5.130123138427734, "global_step": 9324, "epoch": 222} {"train_loss": -4.958489418029785, "global_step": 9325, "epoch": 222} {"train_loss": -5.107974052429199, "global_step": 9326, "epoch": 222} {"train_loss": -4.984114170074463, "global_step": 9327, "epoch": 222} {"train_loss": -4.949383735656738, "global_step": 9328, "epoch": 222} {"train_loss": -5.059321880340576, "global_step": 9329, "epoch": 222} {"train_loss": -5.1308274269104, "global_step": 9330, "epoch": 222} {"train_loss": -5.001711368560791, "global_step": 9331, "epoch": 222} {"train_loss": -4.922219276428223, "global_step": 9332, "epoch": 222} {"train_loss": -5.190264701843262, "global_step": 9333, "epoch": 222} {"train_loss": -5.031248092651367, "global_step": 9334, "epoch": 222} {"train_loss": -5.112790107727051, "global_step": 9335, "epoch": 222} {"train_loss": -4.994593620300293, "global_step": 9336, "epoch": 222} {"train_loss": -5.00913143157959, "global_step": 9337, "epoch": 222} {"train_loss": -5.004874229431152, "global_step": 9338, "epoch": 222} {"train_loss": -5.1042561531066895, "global_step": 9339, "epoch": 222} {"train_loss": -4.9857683181762695, "global_step": 9340, "epoch": 222} {"train_loss": -4.985659599304199, "global_step": 9341, "epoch": 222} {"train_loss": -5.1143622398376465, "global_step": 9342, "epoch": 222} {"train_loss": -5.076644420623779, "global_step": 9343, "epoch": 222} {"train_loss": -5.032927989959717, "global_step": 9344, "epoch": 222} {"train_loss": -5.058957099914551, "global_step": 9345, "epoch": 222} {"train_loss": -4.987013816833496, "global_step": 9346, "epoch": 222} {"train_loss": -4.918242454528809, "global_step": 9347, "epoch": 222} {"train_loss": -4.911427974700928, "global_step": 9348, "epoch": 222} {"train_loss": -4.822753429412842, "global_step": 9349, "epoch": 222} {"train_loss": -5.200272560119629, "global_step": 9350, "epoch": 222} {"train_loss": -5.037721633911133, "global_step": 9351, "epoch": 222} {"train_loss": -4.994258880615234, "global_step": 9352, "epoch": 222} {"train_loss": -5.1129350662231445, "global_step": 9353, "epoch": 222} {"train_loss": -5.089883327484131, "global_step": 9354, "epoch": 222} {"train_loss": -5.10103702545166, "global_step": 9355, "epoch": 222} {"train_loss": -4.978450298309326, "global_step": 9356, "epoch": 222} {"train_loss": -5.004057884216309, "global_step": 9357, "epoch": 222} {"train_loss": -4.985568046569824, "global_step": 9358, "epoch": 222} {"train_loss": -4.898672103881836, "global_step": 9359, "epoch": 222} {"train_loss": -5.0188093185424805, "global_step": 9360, "epoch": 222} {"train_loss": -4.984332084655762, "global_step": 9361, "epoch": 222} {"train_loss": -4.9169697761535645, "global_step": 9362, "epoch": 222} {"train_loss": -5.006361961364746, "global_step": 9363, "epoch": 222} {"train_loss": -5.082311630249023, "global_step": 9364, "epoch": 222} {"train_loss": -5.024456818898519, "global_step": 9365, "epoch": 222, "val_loss": 71516.0703125} {"train_loss": -4.840384483337402, "global_step": 9366, "epoch": 223} {"train_loss": -5.032388210296631, "global_step": 9367, "epoch": 223} {"train_loss": -5.035774230957031, "global_step": 9368, "epoch": 223} {"train_loss": -5.132137775421143, "global_step": 9369, "epoch": 223} {"train_loss": -4.846116542816162, "global_step": 9370, "epoch": 223} {"train_loss": -5.06533145904541, "global_step": 9371, "epoch": 223} {"train_loss": -4.984132289886475, "global_step": 9372, "epoch": 223} {"train_loss": -4.905495643615723, "global_step": 9373, "epoch": 223} {"train_loss": -5.054111003875732, "global_step": 9374, "epoch": 223} {"train_loss": -5.009437561035156, "global_step": 9375, "epoch": 223} {"train_loss": -4.999114513397217, "global_step": 9376, "epoch": 223} {"train_loss": -5.078138828277588, "global_step": 9377, "epoch": 223} {"train_loss": -4.98778772354126, "global_step": 9378, "epoch": 223} {"train_loss": -5.099246025085449, "global_step": 9379, "epoch": 223} {"train_loss": -5.072758674621582, "global_step": 9380, "epoch": 223} {"train_loss": -5.0491485595703125, "global_step": 9381, "epoch": 223} {"train_loss": -5.011438369750977, "global_step": 9382, "epoch": 223} {"train_loss": -5.020951271057129, "global_step": 9383, "epoch": 223} {"train_loss": -5.107181549072266, "global_step": 9384, "epoch": 223} {"train_loss": -5.094822883605957, "global_step": 9385, "epoch": 223} {"train_loss": -4.985923767089844, "global_step": 9386, "epoch": 223} {"train_loss": -5.042233467102051, "global_step": 9387, "epoch": 223} {"train_loss": -4.984036922454834, "global_step": 9388, "epoch": 223} {"train_loss": -4.887197494506836, "global_step": 9389, "epoch": 223} {"train_loss": -5.0906524658203125, "global_step": 9390, "epoch": 223} {"train_loss": -4.975071907043457, "global_step": 9391, "epoch": 223} {"train_loss": -5.04111385345459, "global_step": 9392, "epoch": 223} {"train_loss": -5.013341903686523, "global_step": 9393, "epoch": 223} {"train_loss": -4.920112609863281, "global_step": 9394, "epoch": 223} {"train_loss": -4.954042911529541, "global_step": 9395, "epoch": 223} {"train_loss": -4.946244239807129, "global_step": 9396, "epoch": 223} {"train_loss": -5.041858673095703, "global_step": 9397, "epoch": 223} {"train_loss": -5.098772048950195, "global_step": 9398, "epoch": 223} {"train_loss": -4.992209434509277, "global_step": 9399, "epoch": 223} {"train_loss": -5.043140888214111, "global_step": 9400, "epoch": 223} {"train_loss": -5.092747688293457, "global_step": 9401, "epoch": 223} {"train_loss": -4.9880523681640625, "global_step": 9402, "epoch": 223} {"train_loss": -5.123111724853516, "global_step": 9403, "epoch": 223} {"train_loss": -5.1343584060668945, "global_step": 9404, "epoch": 223} {"train_loss": -4.999799728393555, "global_step": 9405, "epoch": 223} {"train_loss": -5.075232028961182, "global_step": 9406, "epoch": 223} {"train_loss": -5.020852679298038, "global_step": 9407, "epoch": 223, "val_loss": 71338.1796875} {"train_loss": -4.995957374572754, "global_step": 9408, "epoch": 224} {"train_loss": -5.031131744384766, "global_step": 9409, "epoch": 224} {"train_loss": -5.00576114654541, "global_step": 9410, "epoch": 224} {"train_loss": -5.11680793762207, "global_step": 9411, "epoch": 224} {"train_loss": -5.085906982421875, "global_step": 9412, "epoch": 224} {"train_loss": -5.033768653869629, "global_step": 9413, "epoch": 224} {"train_loss": -5.151146411895752, "global_step": 9414, "epoch": 224} {"train_loss": -4.992194175720215, "global_step": 9415, "epoch": 224} {"train_loss": -5.0850372314453125, "global_step": 9416, "epoch": 224} {"train_loss": -5.099865913391113, "global_step": 9417, "epoch": 224} {"train_loss": -5.13918924331665, "global_step": 9418, "epoch": 224} {"train_loss": -5.06203556060791, "global_step": 9419, "epoch": 224} {"train_loss": -4.993617057800293, "global_step": 9420, "epoch": 224} {"train_loss": -4.872315406799316, "global_step": 9421, "epoch": 224} {"train_loss": -5.026557445526123, "global_step": 9422, "epoch": 224} {"train_loss": -5.084907531738281, "global_step": 9423, "epoch": 224} {"train_loss": -4.913592338562012, "global_step": 9424, "epoch": 224} {"train_loss": -5.02841854095459, "global_step": 9425, "epoch": 224} {"train_loss": -4.994659423828125, "global_step": 9426, "epoch": 224} {"train_loss": -4.964818000793457, "global_step": 9427, "epoch": 224} {"train_loss": -4.890165328979492, "global_step": 9428, "epoch": 224} {"train_loss": -5.003181457519531, "global_step": 9429, "epoch": 224} {"train_loss": -4.937777519226074, "global_step": 9430, "epoch": 224} {"train_loss": -4.857983112335205, "global_step": 9431, "epoch": 224} {"train_loss": -5.0530195236206055, "global_step": 9432, "epoch": 224} {"train_loss": -4.96776008605957, "global_step": 9433, "epoch": 224} {"train_loss": -5.067410945892334, "global_step": 9434, "epoch": 224} {"train_loss": -5.064756393432617, "global_step": 9435, "epoch": 224} {"train_loss": -4.862027645111084, "global_step": 9436, "epoch": 224} {"train_loss": -4.914988994598389, "global_step": 9437, "epoch": 224} {"train_loss": -4.894366264343262, "global_step": 9438, "epoch": 224} {"train_loss": -4.814718246459961, "global_step": 9439, "epoch": 224} {"train_loss": -5.089884281158447, "global_step": 9440, "epoch": 224} {"train_loss": -4.86857795715332, "global_step": 9441, "epoch": 224} {"train_loss": -4.8416948318481445, "global_step": 9442, "epoch": 224} {"train_loss": -5.098754405975342, "global_step": 9443, "epoch": 224} {"train_loss": -4.994785308837891, "global_step": 9444, "epoch": 224} {"train_loss": -4.997529983520508, "global_step": 9445, "epoch": 224} {"train_loss": -5.057572364807129, "global_step": 9446, "epoch": 224} {"train_loss": -5.03867244720459, "global_step": 9447, "epoch": 224} {"train_loss": -5.018329620361328, "global_step": 9448, "epoch": 224} {"train_loss": -4.998482420330956, "global_step": 9449, "epoch": 224, "val_loss": 71465.625} {"train_loss": -5.012911319732666, "global_step": 9450, "epoch": 225} {"train_loss": -4.9994635581970215, "global_step": 9451, "epoch": 225} {"train_loss": -5.169682502746582, "global_step": 9452, "epoch": 225} {"train_loss": -5.078108787536621, "global_step": 9453, "epoch": 225} {"train_loss": -4.984180450439453, "global_step": 9454, "epoch": 225} {"train_loss": -5.066372871398926, "global_step": 9455, "epoch": 225} {"train_loss": -4.937899589538574, "global_step": 9456, "epoch": 225} {"train_loss": -5.044246673583984, "global_step": 9457, "epoch": 225} {"train_loss": -5.044107437133789, "global_step": 9458, "epoch": 225} {"train_loss": -5.012022495269775, "global_step": 9459, "epoch": 225} {"train_loss": -5.032503128051758, "global_step": 9460, "epoch": 225} {"train_loss": -5.173593521118164, "global_step": 9461, "epoch": 225} {"train_loss": -4.937533378601074, "global_step": 9462, "epoch": 225} {"train_loss": -5.024654865264893, "global_step": 9463, "epoch": 225} {"train_loss": -5.014705657958984, "global_step": 9464, "epoch": 225} {"train_loss": -4.991045951843262, "global_step": 9465, "epoch": 225} {"train_loss": -5.05526065826416, "global_step": 9466, "epoch": 225} {"train_loss": -5.065485954284668, "global_step": 9467, "epoch": 225} {"train_loss": -5.049487590789795, "global_step": 9468, "epoch": 225} {"train_loss": -4.956889629364014, "global_step": 9469, "epoch": 225} {"train_loss": -5.161324977874756, "global_step": 9470, "epoch": 225} {"train_loss": -5.028459072113037, "global_step": 9471, "epoch": 225} {"train_loss": -4.9645094871521, "global_step": 9472, "epoch": 225} {"train_loss": -5.024534702301025, "global_step": 9473, "epoch": 225} {"train_loss": -5.121046543121338, "global_step": 9474, "epoch": 225} {"train_loss": -5.097268104553223, "global_step": 9475, "epoch": 225} {"train_loss": -4.917304515838623, "global_step": 9476, "epoch": 225} {"train_loss": -5.008251667022705, "global_step": 9477, "epoch": 225} {"train_loss": -4.984329700469971, "global_step": 9478, "epoch": 225} {"train_loss": -5.060219764709473, "global_step": 9479, "epoch": 225} {"train_loss": -4.997010231018066, "global_step": 9480, "epoch": 225} {"train_loss": -5.088174819946289, "global_step": 9481, "epoch": 225} {"train_loss": -5.232914447784424, "global_step": 9482, "epoch": 225} {"train_loss": -5.014070510864258, "global_step": 9483, "epoch": 225} {"train_loss": -5.068921089172363, "global_step": 9484, "epoch": 225} {"train_loss": -4.7117180824279785, "global_step": 9485, "epoch": 225} {"train_loss": -5.132613658905029, "global_step": 9486, "epoch": 225} {"train_loss": -5.148499488830566, "global_step": 9487, "epoch": 225} {"train_loss": -4.979453086853027, "global_step": 9488, "epoch": 225} {"train_loss": -4.7679948806762695, "global_step": 9489, "epoch": 225} {"train_loss": -5.019835472106934, "global_step": 9490, "epoch": 225} {"train_loss": -5.027643691925776, "global_step": 9491, "epoch": 225, "val_loss": 71272.9609375} {"train_loss": -5.019333839416504, "global_step": 9492, "epoch": 226} {"train_loss": -4.956053256988525, "global_step": 9493, "epoch": 226} {"train_loss": -4.984677314758301, "global_step": 9494, "epoch": 226} {"train_loss": -4.887048721313477, "global_step": 9495, "epoch": 226} {"train_loss": -4.998477935791016, "global_step": 9496, "epoch": 226} {"train_loss": -5.043398857116699, "global_step": 9497, "epoch": 226} {"train_loss": -5.055239677429199, "global_step": 9498, "epoch": 226} {"train_loss": -5.029380798339844, "global_step": 9499, "epoch": 226} {"train_loss": -5.106078147888184, "global_step": 9500, "epoch": 226} {"train_loss": -4.827639579772949, "global_step": 9501, "epoch": 226} {"train_loss": -5.055777072906494, "global_step": 9502, "epoch": 226} {"train_loss": -5.001365661621094, "global_step": 9503, "epoch": 226} {"train_loss": -4.704899311065674, "global_step": 9504, "epoch": 226} {"train_loss": -5.010612487792969, "global_step": 9505, "epoch": 226} {"train_loss": -4.8383402824401855, "global_step": 9506, "epoch": 226} {"train_loss": -4.827106952667236, "global_step": 9507, "epoch": 226} {"train_loss": -4.936128616333008, "global_step": 9508, "epoch": 226} {"train_loss": -4.997920036315918, "global_step": 9509, "epoch": 226} {"train_loss": -4.97879695892334, "global_step": 9510, "epoch": 226} {"train_loss": -4.955351829528809, "global_step": 9511, "epoch": 226} {"train_loss": -5.060047149658203, "global_step": 9512, "epoch": 226} {"train_loss": -4.994546413421631, "global_step": 9513, "epoch": 226} {"train_loss": -4.916812896728516, "global_step": 9514, "epoch": 226} {"train_loss": -5.029474258422852, "global_step": 9515, "epoch": 226} {"train_loss": -5.123222827911377, "global_step": 9516, "epoch": 226} {"train_loss": -5.127945899963379, "global_step": 9517, "epoch": 226} {"train_loss": -5.0338850021362305, "global_step": 9518, "epoch": 226} {"train_loss": -4.965821743011475, "global_step": 9519, "epoch": 226} {"train_loss": -5.0836334228515625, "global_step": 9520, "epoch": 226} {"train_loss": -5.0785980224609375, "global_step": 9521, "epoch": 226} {"train_loss": -5.093470096588135, "global_step": 9522, "epoch": 226} {"train_loss": -5.052250862121582, "global_step": 9523, "epoch": 226} {"train_loss": -5.066079616546631, "global_step": 9524, "epoch": 226} {"train_loss": -5.089998245239258, "global_step": 9525, "epoch": 226} {"train_loss": -5.030808448791504, "global_step": 9526, "epoch": 226} {"train_loss": -5.101194381713867, "global_step": 9527, "epoch": 226} {"train_loss": -4.909339904785156, "global_step": 9528, "epoch": 226} {"train_loss": -4.931514739990234, "global_step": 9529, "epoch": 226} {"train_loss": -5.046328544616699, "global_step": 9530, "epoch": 226} {"train_loss": -4.836889266967773, "global_step": 9531, "epoch": 226} {"train_loss": -4.957675457000732, "global_step": 9532, "epoch": 226} {"train_loss": -4.999082099823725, "global_step": 9533, "epoch": 226, "val_loss": 71833.0625} {"train_loss": -4.981103897094727, "global_step": 9534, "epoch": 227} {"train_loss": -5.1428542137146, "global_step": 9535, "epoch": 227} {"train_loss": -5.039070129394531, "global_step": 9536, "epoch": 227} {"train_loss": -5.027188777923584, "global_step": 9537, "epoch": 227} {"train_loss": -4.992847442626953, "global_step": 9538, "epoch": 227} {"train_loss": -5.019074440002441, "global_step": 9539, "epoch": 227} {"train_loss": -5.129015922546387, "global_step": 9540, "epoch": 227} {"train_loss": -5.046156883239746, "global_step": 9541, "epoch": 227} {"train_loss": -4.987737655639648, "global_step": 9542, "epoch": 227} {"train_loss": -4.809431076049805, "global_step": 9543, "epoch": 227} {"train_loss": -4.97330379486084, "global_step": 9544, "epoch": 227} {"train_loss": -5.09796142578125, "global_step": 9545, "epoch": 227} {"train_loss": -5.079623222351074, "global_step": 9546, "epoch": 227} {"train_loss": -5.0075154304504395, "global_step": 9547, "epoch": 227} {"train_loss": -5.167791366577148, "global_step": 9548, "epoch": 227} {"train_loss": -5.147010803222656, "global_step": 9549, "epoch": 227} {"train_loss": -5.160920143127441, "global_step": 9550, "epoch": 227} {"train_loss": -5.084290981292725, "global_step": 9551, "epoch": 227} {"train_loss": -5.0262556076049805, "global_step": 9552, "epoch": 227} {"train_loss": -5.0821309089660645, "global_step": 9553, "epoch": 227} {"train_loss": -5.026787757873535, "global_step": 9554, "epoch": 227} {"train_loss": -5.009354591369629, "global_step": 9555, "epoch": 227} {"train_loss": -5.01132869720459, "global_step": 9556, "epoch": 227} {"train_loss": -4.933948040008545, "global_step": 9557, "epoch": 227} {"train_loss": -5.1565093994140625, "global_step": 9558, "epoch": 227} {"train_loss": -5.0465264320373535, "global_step": 9559, "epoch": 227} {"train_loss": -5.003103256225586, "global_step": 9560, "epoch": 227} {"train_loss": -4.956679344177246, "global_step": 9561, "epoch": 227} {"train_loss": -5.00016975402832, "global_step": 9562, "epoch": 227} {"train_loss": -5.084747314453125, "global_step": 9563, "epoch": 227} {"train_loss": -5.116135597229004, "global_step": 9564, "epoch": 227} {"train_loss": -5.165252685546875, "global_step": 9565, "epoch": 227} {"train_loss": -5.134223937988281, "global_step": 9566, "epoch": 227} {"train_loss": -5.130037784576416, "global_step": 9567, "epoch": 227} {"train_loss": -5.120124816894531, "global_step": 9568, "epoch": 227} {"train_loss": -5.127646446228027, "global_step": 9569, "epoch": 227} {"train_loss": -5.204629421234131, "global_step": 9570, "epoch": 227} {"train_loss": -5.079972267150879, "global_step": 9571, "epoch": 227} {"train_loss": -5.031819820404053, "global_step": 9572, "epoch": 227} {"train_loss": -4.842293739318848, "global_step": 9573, "epoch": 227} {"train_loss": -4.911250114440918, "global_step": 9574, "epoch": 227} {"train_loss": -5.047212827773321, "global_step": 9575, "epoch": 227, "val_loss": 70380.2734375} {"train_loss": -5.0424418449401855, "global_step": 9576, "epoch": 228} {"train_loss": -5.117053031921387, "global_step": 9577, "epoch": 228} {"train_loss": -5.045742034912109, "global_step": 9578, "epoch": 228} {"train_loss": -5.0357513427734375, "global_step": 9579, "epoch": 228} {"train_loss": -5.13668155670166, "global_step": 9580, "epoch": 228} {"train_loss": -4.976126194000244, "global_step": 9581, "epoch": 228} {"train_loss": -5.026658058166504, "global_step": 9582, "epoch": 228} {"train_loss": -5.024833679199219, "global_step": 9583, "epoch": 228} {"train_loss": -5.155951023101807, "global_step": 9584, "epoch": 228} {"train_loss": -4.9581193923950195, "global_step": 9585, "epoch": 228} {"train_loss": -5.122916221618652, "global_step": 9586, "epoch": 228} {"train_loss": -4.939349174499512, "global_step": 9587, "epoch": 228} {"train_loss": -5.1553955078125, "global_step": 9588, "epoch": 228} {"train_loss": -5.009443283081055, "global_step": 9589, "epoch": 228} {"train_loss": -5.134246349334717, "global_step": 9590, "epoch": 228} {"train_loss": -5.148818016052246, "global_step": 9591, "epoch": 228} {"train_loss": -5.042417526245117, "global_step": 9592, "epoch": 228} {"train_loss": -5.161468029022217, "global_step": 9593, "epoch": 228} {"train_loss": -5.043534278869629, "global_step": 9594, "epoch": 228} {"train_loss": -5.204360008239746, "global_step": 9595, "epoch": 228} {"train_loss": -5.076001167297363, "global_step": 9596, "epoch": 228} {"train_loss": -5.131106376647949, "global_step": 9597, "epoch": 228} {"train_loss": -4.756369590759277, "global_step": 9598, "epoch": 228} {"train_loss": -4.981540679931641, "global_step": 9599, "epoch": 228} {"train_loss": -5.000522613525391, "global_step": 9600, "epoch": 228} {"train_loss": -5.0784993171691895, "global_step": 9601, "epoch": 228} {"train_loss": -5.069738388061523, "global_step": 9602, "epoch": 228} {"train_loss": -5.082266807556152, "global_step": 9603, "epoch": 228} {"train_loss": -4.823553085327148, "global_step": 9604, "epoch": 228} {"train_loss": -5.013468265533447, "global_step": 9605, "epoch": 228} {"train_loss": -4.911689758300781, "global_step": 9606, "epoch": 228} {"train_loss": -4.936892509460449, "global_step": 9607, "epoch": 228} {"train_loss": -4.992483139038086, "global_step": 9608, "epoch": 228} {"train_loss": -5.06889533996582, "global_step": 9609, "epoch": 228} {"train_loss": -5.085968494415283, "global_step": 9610, "epoch": 228} {"train_loss": -4.876572132110596, "global_step": 9611, "epoch": 228} {"train_loss": -4.965123176574707, "global_step": 9612, "epoch": 228} {"train_loss": -5.147699356079102, "global_step": 9613, "epoch": 228} {"train_loss": -4.980871677398682, "global_step": 9614, "epoch": 228} {"train_loss": -4.9473066329956055, "global_step": 9615, "epoch": 228} {"train_loss": -5.125510215759277, "global_step": 9616, "epoch": 228} {"train_loss": -5.0348390738169355, "global_step": 9617, "epoch": 228, "val_loss": 70976.671875} {"train_loss": -5.072751045227051, "global_step": 9618, "epoch": 229} {"train_loss": -5.104419708251953, "global_step": 9619, "epoch": 229} {"train_loss": -5.008743762969971, "global_step": 9620, "epoch": 229} {"train_loss": -4.900551795959473, "global_step": 9621, "epoch": 229} {"train_loss": -5.162570953369141, "global_step": 9622, "epoch": 229} {"train_loss": -4.9375081062316895, "global_step": 9623, "epoch": 229} {"train_loss": -4.953495979309082, "global_step": 9624, "epoch": 229} {"train_loss": -4.908340930938721, "global_step": 9625, "epoch": 229} {"train_loss": -5.003906726837158, "global_step": 9626, "epoch": 229} {"train_loss": -4.998013973236084, "global_step": 9627, "epoch": 229} {"train_loss": -4.921412944793701, "global_step": 9628, "epoch": 229} {"train_loss": -4.9901862144470215, "global_step": 9629, "epoch": 229} {"train_loss": -4.997986793518066, "global_step": 9630, "epoch": 229} {"train_loss": -4.95746374130249, "global_step": 9631, "epoch": 229} {"train_loss": -4.909967422485352, "global_step": 9632, "epoch": 229} {"train_loss": -5.1449408531188965, "global_step": 9633, "epoch": 229} {"train_loss": -4.765013694763184, "global_step": 9634, "epoch": 229} {"train_loss": -5.085633277893066, "global_step": 9635, "epoch": 229} {"train_loss": -5.062079429626465, "global_step": 9636, "epoch": 229} {"train_loss": -4.96679162979126, "global_step": 9637, "epoch": 229} {"train_loss": -5.013528823852539, "global_step": 9638, "epoch": 229} {"train_loss": -5.029601573944092, "global_step": 9639, "epoch": 229} {"train_loss": -4.814419746398926, "global_step": 9640, "epoch": 229} {"train_loss": -5.052742004394531, "global_step": 9641, "epoch": 229} {"train_loss": -5.0202836990356445, "global_step": 9642, "epoch": 229} {"train_loss": -5.089375019073486, "global_step": 9643, "epoch": 229} {"train_loss": -4.862154006958008, "global_step": 9644, "epoch": 229} {"train_loss": -4.930906295776367, "global_step": 9645, "epoch": 229} {"train_loss": -5.121731758117676, "global_step": 9646, "epoch": 229} {"train_loss": -5.070834159851074, "global_step": 9647, "epoch": 229} {"train_loss": -5.131769180297852, "global_step": 9648, "epoch": 229} {"train_loss": -4.930437088012695, "global_step": 9649, "epoch": 229} {"train_loss": -5.033114910125732, "global_step": 9650, "epoch": 229} {"train_loss": -5.051906585693359, "global_step": 9651, "epoch": 229} {"train_loss": -5.097090244293213, "global_step": 9652, "epoch": 229} {"train_loss": -5.031381607055664, "global_step": 9653, "epoch": 229} {"train_loss": -5.037722587585449, "global_step": 9654, "epoch": 229} {"train_loss": -5.02100944519043, "global_step": 9655, "epoch": 229} {"train_loss": -5.044127464294434, "global_step": 9656, "epoch": 229} {"train_loss": -5.121868133544922, "global_step": 9657, "epoch": 229} {"train_loss": -5.0465288162231445, "global_step": 9658, "epoch": 229} {"train_loss": -5.009809153420584, "global_step": 9659, "epoch": 229, "val_loss": 71285.7578125} {"train_loss": -5.103609085083008, "global_step": 9660, "epoch": 230} {"train_loss": -4.970305442810059, "global_step": 9661, "epoch": 230} {"train_loss": -5.040067195892334, "global_step": 9662, "epoch": 230} {"train_loss": -4.875439643859863, "global_step": 9663, "epoch": 230} {"train_loss": -5.008823394775391, "global_step": 9664, "epoch": 230} {"train_loss": -4.9212799072265625, "global_step": 9665, "epoch": 230} {"train_loss": -5.102673530578613, "global_step": 9666, "epoch": 230} {"train_loss": -5.1192498207092285, "global_step": 9667, "epoch": 230} {"train_loss": -5.104109764099121, "global_step": 9668, "epoch": 230} {"train_loss": -5.176775932312012, "global_step": 9669, "epoch": 230} {"train_loss": -4.95609188079834, "global_step": 9670, "epoch": 230} {"train_loss": -4.934429168701172, "global_step": 9671, "epoch": 230} {"train_loss": -5.1533203125, "global_step": 9672, "epoch": 230} {"train_loss": -5.082337856292725, "global_step": 9673, "epoch": 230} {"train_loss": -5.004301071166992, "global_step": 9674, "epoch": 230} {"train_loss": -5.13968563079834, "global_step": 9675, "epoch": 230} {"train_loss": -5.027498245239258, "global_step": 9676, "epoch": 230} {"train_loss": -5.084334373474121, "global_step": 9677, "epoch": 230} {"train_loss": -5.082063674926758, "global_step": 9678, "epoch": 230} {"train_loss": -5.080080032348633, "global_step": 9679, "epoch": 230} {"train_loss": -4.949031829833984, "global_step": 9680, "epoch": 230} {"train_loss": -5.032437324523926, "global_step": 9681, "epoch": 230} {"train_loss": -4.965455532073975, "global_step": 9682, "epoch": 230} {"train_loss": -4.990085601806641, "global_step": 9683, "epoch": 230} {"train_loss": -5.1046929359436035, "global_step": 9684, "epoch": 230} {"train_loss": -5.044291973114014, "global_step": 9685, "epoch": 230} {"train_loss": -5.129400253295898, "global_step": 9686, "epoch": 230} {"train_loss": -5.060792922973633, "global_step": 9687, "epoch": 230} {"train_loss": -4.986246109008789, "global_step": 9688, "epoch": 230} {"train_loss": -5.110813617706299, "global_step": 9689, "epoch": 230} {"train_loss": -5.055444717407227, "global_step": 9690, "epoch": 230} {"train_loss": -5.033953666687012, "global_step": 9691, "epoch": 230} {"train_loss": -5.0439982414245605, "global_step": 9692, "epoch": 230} {"train_loss": -5.032747268676758, "global_step": 9693, "epoch": 230} {"train_loss": -5.045409202575684, "global_step": 9694, "epoch": 230} {"train_loss": -5.051905632019043, "global_step": 9695, "epoch": 230} {"train_loss": -4.951678276062012, "global_step": 9696, "epoch": 230} {"train_loss": -5.069388389587402, "global_step": 9697, "epoch": 230} {"train_loss": -5.028722763061523, "global_step": 9698, "epoch": 230} {"train_loss": -5.101502895355225, "global_step": 9699, "epoch": 230} {"train_loss": -4.932156085968018, "global_step": 9700, "epoch": 230} {"train_loss": -5.045278844379244, "global_step": 9701, "epoch": 230, "val_loss": 70613.3046875} {"train_loss": -5.145601272583008, "global_step": 9702, "epoch": 231} {"train_loss": -4.984981060028076, "global_step": 9703, "epoch": 231} {"train_loss": -5.179001808166504, "global_step": 9704, "epoch": 231} {"train_loss": -5.076434135437012, "global_step": 9705, "epoch": 231} {"train_loss": -5.061652183532715, "global_step": 9706, "epoch": 231} {"train_loss": -5.100176811218262, "global_step": 9707, "epoch": 231} {"train_loss": -5.2217512130737305, "global_step": 9708, "epoch": 231} {"train_loss": -5.150992393493652, "global_step": 9709, "epoch": 231} {"train_loss": -4.78607702255249, "global_step": 9710, "epoch": 231} {"train_loss": -4.906053066253662, "global_step": 9711, "epoch": 231} {"train_loss": -5.139873504638672, "global_step": 9712, "epoch": 231} {"train_loss": -4.966897487640381, "global_step": 9713, "epoch": 231} {"train_loss": -4.8277788162231445, "global_step": 9714, "epoch": 231} {"train_loss": -4.963576316833496, "global_step": 9715, "epoch": 231} {"train_loss": -5.061190605163574, "global_step": 9716, "epoch": 231} {"train_loss": -4.946933746337891, "global_step": 9717, "epoch": 231} {"train_loss": -4.943221092224121, "global_step": 9718, "epoch": 231} {"train_loss": -5.1531243324279785, "global_step": 9719, "epoch": 231} {"train_loss": -5.070925235748291, "global_step": 9720, "epoch": 231} {"train_loss": -5.050933837890625, "global_step": 9721, "epoch": 231} {"train_loss": -5.115344047546387, "global_step": 9722, "epoch": 231} {"train_loss": -5.074610710144043, "global_step": 9723, "epoch": 231} {"train_loss": -4.999539375305176, "global_step": 9724, "epoch": 231} {"train_loss": -4.918520927429199, "global_step": 9725, "epoch": 231} {"train_loss": -4.957498550415039, "global_step": 9726, "epoch": 231} {"train_loss": -4.997331142425537, "global_step": 9727, "epoch": 231} {"train_loss": -4.984570503234863, "global_step": 9728, "epoch": 231} {"train_loss": -5.045251846313477, "global_step": 9729, "epoch": 231} {"train_loss": -5.132135391235352, "global_step": 9730, "epoch": 231} {"train_loss": -5.089596748352051, "global_step": 9731, "epoch": 231} {"train_loss": -5.0217061042785645, "global_step": 9732, "epoch": 231} {"train_loss": -4.962015628814697, "global_step": 9733, "epoch": 231} {"train_loss": -5.167532444000244, "global_step": 9734, "epoch": 231} {"train_loss": -5.1003193855285645, "global_step": 9735, "epoch": 231} {"train_loss": -4.935281753540039, "global_step": 9736, "epoch": 231} {"train_loss": -5.018409252166748, "global_step": 9737, "epoch": 231} {"train_loss": -5.028911590576172, "global_step": 9738, "epoch": 231} {"train_loss": -4.901088237762451, "global_step": 9739, "epoch": 231} {"train_loss": -4.942500114440918, "global_step": 9740, "epoch": 231} {"train_loss": -5.040863990783691, "global_step": 9741, "epoch": 231} {"train_loss": -5.238611221313477, "global_step": 9742, "epoch": 231} {"train_loss": -5.035388810294015, "global_step": 9743, "epoch": 231, "val_loss": 71837.265625} {"train_loss": -4.9539031982421875, "global_step": 9744, "epoch": 232} {"train_loss": -4.862971305847168, "global_step": 9745, "epoch": 232} {"train_loss": -5.093563556671143, "global_step": 9746, "epoch": 232} {"train_loss": -5.0142669677734375, "global_step": 9747, "epoch": 232} {"train_loss": -4.974555969238281, "global_step": 9748, "epoch": 232} {"train_loss": -5.030887126922607, "global_step": 9749, "epoch": 232} {"train_loss": -4.95570707321167, "global_step": 9750, "epoch": 232} {"train_loss": -5.055644989013672, "global_step": 9751, "epoch": 232} {"train_loss": -5.003589630126953, "global_step": 9752, "epoch": 232} {"train_loss": -5.031956672668457, "global_step": 9753, "epoch": 232} {"train_loss": -5.196603298187256, "global_step": 9754, "epoch": 232} {"train_loss": -5.144644737243652, "global_step": 9755, "epoch": 232} {"train_loss": -5.020781993865967, "global_step": 9756, "epoch": 232} {"train_loss": -5.090695381164551, "global_step": 9757, "epoch": 232} {"train_loss": -5.205270290374756, "global_step": 9758, "epoch": 232} {"train_loss": -4.903336524963379, "global_step": 9759, "epoch": 232} {"train_loss": -4.985157012939453, "global_step": 9760, "epoch": 232} {"train_loss": -5.03752326965332, "global_step": 9761, "epoch": 232} {"train_loss": -5.162417888641357, "global_step": 9762, "epoch": 232} {"train_loss": -5.023748397827148, "global_step": 9763, "epoch": 232} {"train_loss": -4.96138858795166, "global_step": 9764, "epoch": 232} {"train_loss": -5.04599142074585, "global_step": 9765, "epoch": 232} {"train_loss": -4.960096836090088, "global_step": 9766, "epoch": 232} {"train_loss": -4.997178077697754, "global_step": 9767, "epoch": 232} {"train_loss": -4.83591890335083, "global_step": 9768, "epoch": 232} {"train_loss": -4.978099822998047, "global_step": 9769, "epoch": 232} {"train_loss": -5.055688858032227, "global_step": 9770, "epoch": 232} {"train_loss": -5.002391815185547, "global_step": 9771, "epoch": 232} {"train_loss": -5.096406936645508, "global_step": 9772, "epoch": 232} {"train_loss": -4.982324600219727, "global_step": 9773, "epoch": 232} {"train_loss": -5.158254623413086, "global_step": 9774, "epoch": 232} {"train_loss": -5.015564918518066, "global_step": 9775, "epoch": 232} {"train_loss": -5.032016754150391, "global_step": 9776, "epoch": 232} {"train_loss": -5.024656295776367, "global_step": 9777, "epoch": 232} {"train_loss": -5.016048431396484, "global_step": 9778, "epoch": 232} {"train_loss": -4.957089424133301, "global_step": 9779, "epoch": 232} {"train_loss": -4.982281684875488, "global_step": 9780, "epoch": 232} {"train_loss": -5.130148410797119, "global_step": 9781, "epoch": 232} {"train_loss": -5.0881757736206055, "global_step": 9782, "epoch": 232} {"train_loss": -4.937948226928711, "global_step": 9783, "epoch": 232} {"train_loss": -4.906881332397461, "global_step": 9784, "epoch": 232} {"train_loss": -5.020840576716831, "global_step": 9785, "epoch": 232, "val_loss": 70907.9375} {"train_loss": -5.150723934173584, "global_step": 9786, "epoch": 233} {"train_loss": -5.001851558685303, "global_step": 9787, "epoch": 233} {"train_loss": -5.096705436706543, "global_step": 9788, "epoch": 233} {"train_loss": -4.954663276672363, "global_step": 9789, "epoch": 233} {"train_loss": -5.134603977203369, "global_step": 9790, "epoch": 233} {"train_loss": -5.06842041015625, "global_step": 9791, "epoch": 233} {"train_loss": -5.1314921379089355, "global_step": 9792, "epoch": 233} {"train_loss": -5.103943824768066, "global_step": 9793, "epoch": 233} {"train_loss": -5.104876518249512, "global_step": 9794, "epoch": 233} {"train_loss": -5.093847274780273, "global_step": 9795, "epoch": 233} {"train_loss": -5.088253974914551, "global_step": 9796, "epoch": 233} {"train_loss": -5.038851261138916, "global_step": 9797, "epoch": 233} {"train_loss": -4.9840168952941895, "global_step": 9798, "epoch": 233} {"train_loss": -5.069561958312988, "global_step": 9799, "epoch": 233} {"train_loss": -4.968447685241699, "global_step": 9800, "epoch": 233} {"train_loss": -5.04567813873291, "global_step": 9801, "epoch": 233} {"train_loss": -5.045657157897949, "global_step": 9802, "epoch": 233} {"train_loss": -4.988035202026367, "global_step": 9803, "epoch": 233} {"train_loss": -5.046867370605469, "global_step": 9804, "epoch": 233} {"train_loss": -5.097115516662598, "global_step": 9805, "epoch": 233} {"train_loss": -4.981269836425781, "global_step": 9806, "epoch": 233} {"train_loss": -5.15140438079834, "global_step": 9807, "epoch": 233} {"train_loss": -5.095666885375977, "global_step": 9808, "epoch": 233} {"train_loss": -5.150216102600098, "global_step": 9809, "epoch": 233} {"train_loss": -4.818808555603027, "global_step": 9810, "epoch": 233} {"train_loss": -4.974381446838379, "global_step": 9811, "epoch": 233} {"train_loss": -4.992733478546143, "global_step": 9812, "epoch": 233} {"train_loss": -4.924592971801758, "global_step": 9813, "epoch": 233} {"train_loss": -5.0866289138793945, "global_step": 9814, "epoch": 233} {"train_loss": -5.010209083557129, "global_step": 9815, "epoch": 233} {"train_loss": -5.056606292724609, "global_step": 9816, "epoch": 233} {"train_loss": -5.042341709136963, "global_step": 9817, "epoch": 233} {"train_loss": -4.998606204986572, "global_step": 9818, "epoch": 233} {"train_loss": -4.968709945678711, "global_step": 9819, "epoch": 233} {"train_loss": -5.11552619934082, "global_step": 9820, "epoch": 233} {"train_loss": -5.081170082092285, "global_step": 9821, "epoch": 233} {"train_loss": -5.004927635192871, "global_step": 9822, "epoch": 233} {"train_loss": -5.048060417175293, "global_step": 9823, "epoch": 233} {"train_loss": -5.011444091796875, "global_step": 9824, "epoch": 233} {"train_loss": -5.140042781829834, "global_step": 9825, "epoch": 233} {"train_loss": -5.069632530212402, "global_step": 9826, "epoch": 233} {"train_loss": -5.050394228526524, "global_step": 9827, "epoch": 233, "val_loss": 71068.5859375} {"train_loss": -4.9394731521606445, "global_step": 9828, "epoch": 234} {"train_loss": -5.014634132385254, "global_step": 9829, "epoch": 234} {"train_loss": -5.036638259887695, "global_step": 9830, "epoch": 234} {"train_loss": -4.780457496643066, "global_step": 9831, "epoch": 234} {"train_loss": -4.982004642486572, "global_step": 9832, "epoch": 234} {"train_loss": -5.024575233459473, "global_step": 9833, "epoch": 234} {"train_loss": -5.208672523498535, "global_step": 9834, "epoch": 234} {"train_loss": -5.0056304931640625, "global_step": 9835, "epoch": 234} {"train_loss": -4.836336135864258, "global_step": 9836, "epoch": 234} {"train_loss": -5.051631927490234, "global_step": 9837, "epoch": 234} {"train_loss": -5.001116752624512, "global_step": 9838, "epoch": 234} {"train_loss": -4.832197189331055, "global_step": 9839, "epoch": 234} {"train_loss": -5.001170635223389, "global_step": 9840, "epoch": 234} {"train_loss": -5.026904106140137, "global_step": 9841, "epoch": 234} {"train_loss": -5.163264274597168, "global_step": 9842, "epoch": 234} {"train_loss": -4.839689254760742, "global_step": 9843, "epoch": 234} {"train_loss": -5.068141937255859, "global_step": 9844, "epoch": 234} {"train_loss": -4.772164344787598, "global_step": 9845, "epoch": 234} {"train_loss": -4.84393835067749, "global_step": 9846, "epoch": 234} {"train_loss": -5.132262706756592, "global_step": 9847, "epoch": 234} {"train_loss": -4.959444046020508, "global_step": 9848, "epoch": 234} {"train_loss": -5.08113956451416, "global_step": 9849, "epoch": 234} {"train_loss": -5.143166542053223, "global_step": 9850, "epoch": 234} {"train_loss": -4.840702056884766, "global_step": 9851, "epoch": 234} {"train_loss": -5.16743278503418, "global_step": 9852, "epoch": 234} {"train_loss": -5.227894306182861, "global_step": 9853, "epoch": 234} {"train_loss": -4.98560905456543, "global_step": 9854, "epoch": 234} {"train_loss": -4.973014831542969, "global_step": 9855, "epoch": 234} {"train_loss": -4.9224772453308105, "global_step": 9856, "epoch": 234} {"train_loss": -4.969937324523926, "global_step": 9857, "epoch": 234} {"train_loss": -5.052444934844971, "global_step": 9858, "epoch": 234} {"train_loss": -5.03233003616333, "global_step": 9859, "epoch": 234} {"train_loss": -4.9009504318237305, "global_step": 9860, "epoch": 234} {"train_loss": -4.938706874847412, "global_step": 9861, "epoch": 234} {"train_loss": -5.015449523925781, "global_step": 9862, "epoch": 234} {"train_loss": -4.947253704071045, "global_step": 9863, "epoch": 234} {"train_loss": -5.097797393798828, "global_step": 9864, "epoch": 234} {"train_loss": -4.977861404418945, "global_step": 9865, "epoch": 234} {"train_loss": -4.989879608154297, "global_step": 9866, "epoch": 234} {"train_loss": -5.0257954597473145, "global_step": 9867, "epoch": 234} {"train_loss": -5.123540878295898, "global_step": 9868, "epoch": 234} {"train_loss": -4.996097621463594, "global_step": 9869, "epoch": 234, "val_loss": 70984.0078125} {"train_loss": -5.111177444458008, "global_step": 9870, "epoch": 235} {"train_loss": -5.137949466705322, "global_step": 9871, "epoch": 235} {"train_loss": -5.0785675048828125, "global_step": 9872, "epoch": 235} {"train_loss": -5.107581615447998, "global_step": 9873, "epoch": 235} {"train_loss": -4.97892951965332, "global_step": 9874, "epoch": 235} {"train_loss": -5.063347339630127, "global_step": 9875, "epoch": 235} {"train_loss": -5.1080241203308105, "global_step": 9876, "epoch": 235} {"train_loss": -5.0789008140563965, "global_step": 9877, "epoch": 235} {"train_loss": -5.01173210144043, "global_step": 9878, "epoch": 235} {"train_loss": -5.012843132019043, "global_step": 9879, "epoch": 235} {"train_loss": -4.897721767425537, "global_step": 9880, "epoch": 235} {"train_loss": -5.130635738372803, "global_step": 9881, "epoch": 235} {"train_loss": -5.006097793579102, "global_step": 9882, "epoch": 235} {"train_loss": -4.849632263183594, "global_step": 9883, "epoch": 235} {"train_loss": -4.93995475769043, "global_step": 9884, "epoch": 235} {"train_loss": -5.090583801269531, "global_step": 9885, "epoch": 235} {"train_loss": -4.91793155670166, "global_step": 9886, "epoch": 235} {"train_loss": -4.93086051940918, "global_step": 9887, "epoch": 235} {"train_loss": -5.012295722961426, "global_step": 9888, "epoch": 235} {"train_loss": -4.871499061584473, "global_step": 9889, "epoch": 235} {"train_loss": -5.007944583892822, "global_step": 9890, "epoch": 235} {"train_loss": -5.079653739929199, "global_step": 9891, "epoch": 235} {"train_loss": -4.924095153808594, "global_step": 9892, "epoch": 235} {"train_loss": -4.94283390045166, "global_step": 9893, "epoch": 235} {"train_loss": -5.209532737731934, "global_step": 9894, "epoch": 235} {"train_loss": -5.146093368530273, "global_step": 9895, "epoch": 235} {"train_loss": -5.043949604034424, "global_step": 9896, "epoch": 235} {"train_loss": -5.003939628601074, "global_step": 9897, "epoch": 235} {"train_loss": -5.030008792877197, "global_step": 9898, "epoch": 235} {"train_loss": -5.138176918029785, "global_step": 9899, "epoch": 235} {"train_loss": -4.9507622718811035, "global_step": 9900, "epoch": 235} {"train_loss": -5.0566606521606445, "global_step": 9901, "epoch": 235} {"train_loss": -5.0083160400390625, "global_step": 9902, "epoch": 235} {"train_loss": -5.041094779968262, "global_step": 9903, "epoch": 235} {"train_loss": -5.095790863037109, "global_step": 9904, "epoch": 235} {"train_loss": -4.993231773376465, "global_step": 9905, "epoch": 235} {"train_loss": -4.971362113952637, "global_step": 9906, "epoch": 235} {"train_loss": -4.985333442687988, "global_step": 9907, "epoch": 235} {"train_loss": -4.998831748962402, "global_step": 9908, "epoch": 235} {"train_loss": -5.095128059387207, "global_step": 9909, "epoch": 235} {"train_loss": -4.977461814880371, "global_step": 9910, "epoch": 235} {"train_loss": -5.024996814273653, "global_step": 9911, "epoch": 235, "val_loss": 71258.3125} {"train_loss": -5.103992462158203, "global_step": 9912, "epoch": 236} {"train_loss": -4.961068630218506, "global_step": 9913, "epoch": 236} {"train_loss": -5.074253082275391, "global_step": 9914, "epoch": 236} {"train_loss": -5.141571998596191, "global_step": 9915, "epoch": 236} {"train_loss": -5.102398872375488, "global_step": 9916, "epoch": 236} {"train_loss": -5.004671573638916, "global_step": 9917, "epoch": 236} {"train_loss": -5.104184150695801, "global_step": 9918, "epoch": 236} {"train_loss": -5.082976818084717, "global_step": 9919, "epoch": 236} {"train_loss": -4.931982040405273, "global_step": 9920, "epoch": 236} {"train_loss": -5.110772132873535, "global_step": 9921, "epoch": 236} {"train_loss": -5.174139976501465, "global_step": 9922, "epoch": 236} {"train_loss": -4.952080726623535, "global_step": 9923, "epoch": 236} {"train_loss": -5.037850379943848, "global_step": 9924, "epoch": 236} {"train_loss": -4.951188087463379, "global_step": 9925, "epoch": 236} {"train_loss": -4.9429450035095215, "global_step": 9926, "epoch": 236} {"train_loss": -5.082845687866211, "global_step": 9927, "epoch": 236} {"train_loss": -4.955953121185303, "global_step": 9928, "epoch": 236} {"train_loss": -5.104194641113281, "global_step": 9929, "epoch": 236} {"train_loss": -5.128691673278809, "global_step": 9930, "epoch": 236} {"train_loss": -5.0265326499938965, "global_step": 9931, "epoch": 236} {"train_loss": -4.85023832321167, "global_step": 9932, "epoch": 236} {"train_loss": -5.087624549865723, "global_step": 9933, "epoch": 236} {"train_loss": -5.055526256561279, "global_step": 9934, "epoch": 236} {"train_loss": -4.950797080993652, "global_step": 9935, "epoch": 236} {"train_loss": -4.979561805725098, "global_step": 9936, "epoch": 236} {"train_loss": -5.066919803619385, "global_step": 9937, "epoch": 236} {"train_loss": -5.039831161499023, "global_step": 9938, "epoch": 236} {"train_loss": -5.070437431335449, "global_step": 9939, "epoch": 236} {"train_loss": -5.02412748336792, "global_step": 9940, "epoch": 236} {"train_loss": -5.032946586608887, "global_step": 9941, "epoch": 236} {"train_loss": -4.899500846862793, "global_step": 9942, "epoch": 236} {"train_loss": -5.105327606201172, "global_step": 9943, "epoch": 236} {"train_loss": -4.8929762840271, "global_step": 9944, "epoch": 236} {"train_loss": -4.841543197631836, "global_step": 9945, "epoch": 236} {"train_loss": -4.997425556182861, "global_step": 9946, "epoch": 236} {"train_loss": -4.9627485275268555, "global_step": 9947, "epoch": 236} {"train_loss": -5.041055679321289, "global_step": 9948, "epoch": 236} {"train_loss": -5.041043281555176, "global_step": 9949, "epoch": 236} {"train_loss": -5.123561859130859, "global_step": 9950, "epoch": 236} {"train_loss": -4.802916526794434, "global_step": 9951, "epoch": 236} {"train_loss": -4.927371501922607, "global_step": 9952, "epoch": 236} {"train_loss": -5.020474649610973, "global_step": 9953, "epoch": 236, "val_loss": 73162.6875} {"train_loss": -4.812434196472168, "global_step": 9954, "epoch": 237} {"train_loss": -5.174482345581055, "global_step": 9955, "epoch": 237} {"train_loss": -5.010251998901367, "global_step": 9956, "epoch": 237} {"train_loss": -5.0416998863220215, "global_step": 9957, "epoch": 237} {"train_loss": -4.995307445526123, "global_step": 9958, "epoch": 237} {"train_loss": -4.9175310134887695, "global_step": 9959, "epoch": 237} {"train_loss": -5.090963363647461, "global_step": 9960, "epoch": 237} {"train_loss": -5.052363395690918, "global_step": 9961, "epoch": 237} {"train_loss": -4.911587715148926, "global_step": 9962, "epoch": 237} {"train_loss": -5.064452171325684, "global_step": 9963, "epoch": 237} {"train_loss": -4.882552146911621, "global_step": 9964, "epoch": 237} {"train_loss": -5.0845046043396, "global_step": 9965, "epoch": 237} {"train_loss": -4.906375885009766, "global_step": 9966, "epoch": 237} {"train_loss": -4.912723064422607, "global_step": 9967, "epoch": 237} {"train_loss": -5.032240390777588, "global_step": 9968, "epoch": 237} {"train_loss": -4.956272125244141, "global_step": 9969, "epoch": 237} {"train_loss": -5.201420783996582, "global_step": 9970, "epoch": 237} {"train_loss": -4.8884806632995605, "global_step": 9971, "epoch": 237} {"train_loss": -5.002676010131836, "global_step": 9972, "epoch": 237} {"train_loss": -4.957022190093994, "global_step": 9973, "epoch": 237} {"train_loss": -4.935595512390137, "global_step": 9974, "epoch": 237} {"train_loss": -4.973440170288086, "global_step": 9975, "epoch": 237} {"train_loss": -4.998745441436768, "global_step": 9976, "epoch": 237} {"train_loss": -4.9703569412231445, "global_step": 9977, "epoch": 237} {"train_loss": -4.945429801940918, "global_step": 9978, "epoch": 237} {"train_loss": -5.029698371887207, "global_step": 9979, "epoch": 237} {"train_loss": -5.116275787353516, "global_step": 9980, "epoch": 237} {"train_loss": -5.084637641906738, "global_step": 9981, "epoch": 237} {"train_loss": -5.009469032287598, "global_step": 9982, "epoch": 237} {"train_loss": -5.143978118896484, "global_step": 9983, "epoch": 237} {"train_loss": -5.106369495391846, "global_step": 9984, "epoch": 237} {"train_loss": -5.080849647521973, "global_step": 9985, "epoch": 237} {"train_loss": -5.105062484741211, "global_step": 9986, "epoch": 237} {"train_loss": -5.008388519287109, "global_step": 9987, "epoch": 237} {"train_loss": -4.859705924987793, "global_step": 9988, "epoch": 237} {"train_loss": -4.950898170471191, "global_step": 9989, "epoch": 237} {"train_loss": -5.008803367614746, "global_step": 9990, "epoch": 237} {"train_loss": -5.084150791168213, "global_step": 9991, "epoch": 237} {"train_loss": -4.908367156982422, "global_step": 9992, "epoch": 237} {"train_loss": -4.951601505279541, "global_step": 9993, "epoch": 237} {"train_loss": -5.008247375488281, "global_step": 9994, "epoch": 237} {"train_loss": -4.999573105857486, "global_step": 9995, "epoch": 237, "val_loss": 70635.828125} {"train_loss": -5.003732204437256, "global_step": 9996, "epoch": 238} {"train_loss": -5.010289192199707, "global_step": 9997, "epoch": 238} {"train_loss": -5.003479480743408, "global_step": 9998, "epoch": 238} {"train_loss": -4.893496990203857, "global_step": 9999, "epoch": 238} {"train_loss": -5.026712417602539, "global_step": 10000, "epoch": 238} {"train_loss": -4.943275451660156, "global_step": 10001, "epoch": 238} {"train_loss": -5.003689765930176, "global_step": 10002, "epoch": 238} {"train_loss": -5.001543045043945, "global_step": 10003, "epoch": 238} {"train_loss": -4.954785346984863, "global_step": 10004, "epoch": 238} {"train_loss": -5.1082539558410645, "global_step": 10005, "epoch": 238} {"train_loss": -5.114824295043945, "global_step": 10006, "epoch": 238} {"train_loss": -5.04212760925293, "global_step": 10007, "epoch": 238} {"train_loss": -5.028888702392578, "global_step": 10008, "epoch": 238} {"train_loss": -4.953578948974609, "global_step": 10009, "epoch": 238} {"train_loss": -5.031641483306885, "global_step": 10010, "epoch": 238} {"train_loss": -4.979421138763428, "global_step": 10011, "epoch": 238} {"train_loss": -5.1710991859436035, "global_step": 10012, "epoch": 238} {"train_loss": -5.055458068847656, "global_step": 10013, "epoch": 238} {"train_loss": -5.0042405128479, "global_step": 10014, "epoch": 238} {"train_loss": -5.021252632141113, "global_step": 10015, "epoch": 238} {"train_loss": -5.019320487976074, "global_step": 10016, "epoch": 238} {"train_loss": -5.044435024261475, "global_step": 10017, "epoch": 238} {"train_loss": -5.087140083312988, "global_step": 10018, "epoch": 238} {"train_loss": -5.070559501647949, "global_step": 10019, "epoch": 238} {"train_loss": -5.201770782470703, "global_step": 10020, "epoch": 238} {"train_loss": -5.136835098266602, "global_step": 10021, "epoch": 238} {"train_loss": -5.0861382484436035, "global_step": 10022, "epoch": 238} {"train_loss": -4.963465690612793, "global_step": 10023, "epoch": 238} {"train_loss": -5.1981096267700195, "global_step": 10024, "epoch": 238} {"train_loss": -5.133209228515625, "global_step": 10025, "epoch": 238} {"train_loss": -5.056698799133301, "global_step": 10026, "epoch": 238} {"train_loss": -5.023629188537598, "global_step": 10027, "epoch": 238} {"train_loss": -5.121538162231445, "global_step": 10028, "epoch": 238} {"train_loss": -4.901893615722656, "global_step": 10029, "epoch": 238} {"train_loss": -5.018037796020508, "global_step": 10030, "epoch": 238} {"train_loss": -5.040589809417725, "global_step": 10031, "epoch": 238} {"train_loss": -4.982986927032471, "global_step": 10032, "epoch": 238} {"train_loss": -5.018983364105225, "global_step": 10033, "epoch": 238} {"train_loss": -4.975927352905273, "global_step": 10034, "epoch": 238} {"train_loss": -5.0010175704956055, "global_step": 10035, "epoch": 238} {"train_loss": -5.1044511795043945, "global_step": 10036, "epoch": 238} {"train_loss": -5.03715181350708, "global_step": 10037, "epoch": 238, "val_loss": 71053.8515625} {"train_loss": -5.0846381187438965, "global_step": 10038, "epoch": 239} {"train_loss": -5.004359245300293, "global_step": 10039, "epoch": 239} {"train_loss": -5.089632511138916, "global_step": 10040, "epoch": 239} {"train_loss": -4.977713584899902, "global_step": 10041, "epoch": 239} {"train_loss": -4.912386417388916, "global_step": 10042, "epoch": 239} {"train_loss": -4.927694320678711, "global_step": 10043, "epoch": 239} {"train_loss": -5.088112831115723, "global_step": 10044, "epoch": 239} {"train_loss": -4.995909690856934, "global_step": 10045, "epoch": 239} {"train_loss": -5.10090970993042, "global_step": 10046, "epoch": 239} {"train_loss": -5.128957271575928, "global_step": 10047, "epoch": 239} {"train_loss": -5.0671892166137695, "global_step": 10048, "epoch": 239} {"train_loss": -5.154359817504883, "global_step": 10049, "epoch": 239} {"train_loss": -5.0311102867126465, "global_step": 10050, "epoch": 239} {"train_loss": -5.0829362869262695, "global_step": 10051, "epoch": 239} {"train_loss": -5.0746750831604, "global_step": 10052, "epoch": 239} {"train_loss": -4.9820356369018555, "global_step": 10053, "epoch": 239} {"train_loss": -5.123367786407471, "global_step": 10054, "epoch": 239} {"train_loss": -5.021479606628418, "global_step": 10055, "epoch": 239} {"train_loss": -5.116480827331543, "global_step": 10056, "epoch": 239} {"train_loss": -5.097033500671387, "global_step": 10057, "epoch": 239} {"train_loss": -4.953177452087402, "global_step": 10058, "epoch": 239} {"train_loss": -5.14107608795166, "global_step": 10059, "epoch": 239} {"train_loss": -5.052423000335693, "global_step": 10060, "epoch": 239} {"train_loss": -5.126033782958984, "global_step": 10061, "epoch": 239} {"train_loss": -4.972322940826416, "global_step": 10062, "epoch": 239} {"train_loss": -5.133225917816162, "global_step": 10063, "epoch": 239} {"train_loss": -5.0291900634765625, "global_step": 10064, "epoch": 239} {"train_loss": -5.08475399017334, "global_step": 10065, "epoch": 239} {"train_loss": -5.144811153411865, "global_step": 10066, "epoch": 239} {"train_loss": -4.9884185791015625, "global_step": 10067, "epoch": 239} {"train_loss": -4.895689964294434, "global_step": 10068, "epoch": 239} {"train_loss": -5.043842792510986, "global_step": 10069, "epoch": 239} {"train_loss": -4.982612609863281, "global_step": 10070, "epoch": 239} {"train_loss": -4.988214492797852, "global_step": 10071, "epoch": 239} {"train_loss": -5.1171979904174805, "global_step": 10072, "epoch": 239} {"train_loss": -4.930530071258545, "global_step": 10073, "epoch": 239} {"train_loss": -5.030436038970947, "global_step": 10074, "epoch": 239} {"train_loss": -4.919398784637451, "global_step": 10075, "epoch": 239} {"train_loss": -5.246120452880859, "global_step": 10076, "epoch": 239} {"train_loss": -5.088181972503662, "global_step": 10077, "epoch": 239} {"train_loss": -4.931532382965088, "global_step": 10078, "epoch": 239} {"train_loss": -5.045505296616327, "global_step": 10079, "epoch": 239, "val_loss": 71349.671875} {"train_loss": -5.1114349365234375, "global_step": 10080, "epoch": 240} {"train_loss": -4.919835090637207, "global_step": 10081, "epoch": 240} {"train_loss": -4.93978214263916, "global_step": 10082, "epoch": 240} {"train_loss": -5.13278341293335, "global_step": 10083, "epoch": 240} {"train_loss": -5.045670509338379, "global_step": 10084, "epoch": 240} {"train_loss": -5.190437316894531, "global_step": 10085, "epoch": 240} {"train_loss": -5.060304164886475, "global_step": 10086, "epoch": 240} {"train_loss": -5.112081527709961, "global_step": 10087, "epoch": 240} {"train_loss": -5.0478410720825195, "global_step": 10088, "epoch": 240} {"train_loss": -4.930392265319824, "global_step": 10089, "epoch": 240} {"train_loss": -5.122200965881348, "global_step": 10090, "epoch": 240} {"train_loss": -5.004003524780273, "global_step": 10091, "epoch": 240} {"train_loss": -5.032759666442871, "global_step": 10092, "epoch": 240} {"train_loss": -4.955570220947266, "global_step": 10093, "epoch": 240} {"train_loss": -4.940670013427734, "global_step": 10094, "epoch": 240} {"train_loss": -4.982721328735352, "global_step": 10095, "epoch": 240} {"train_loss": -5.167512893676758, "global_step": 10096, "epoch": 240} {"train_loss": -4.957372188568115, "global_step": 10097, "epoch": 240} {"train_loss": -5.04817533493042, "global_step": 10098, "epoch": 240} {"train_loss": -5.019682884216309, "global_step": 10099, "epoch": 240} {"train_loss": -4.915714740753174, "global_step": 10100, "epoch": 240} {"train_loss": -4.968786239624023, "global_step": 10101, "epoch": 240} {"train_loss": -4.987741470336914, "global_step": 10102, "epoch": 240} {"train_loss": -4.77972412109375, "global_step": 10103, "epoch": 240} {"train_loss": -4.939254283905029, "global_step": 10104, "epoch": 240} {"train_loss": -5.092512130737305, "global_step": 10105, "epoch": 240} {"train_loss": -4.922873020172119, "global_step": 10106, "epoch": 240} {"train_loss": -5.004483222961426, "global_step": 10107, "epoch": 240} {"train_loss": -5.179840564727783, "global_step": 10108, "epoch": 240} {"train_loss": -5.115139484405518, "global_step": 10109, "epoch": 240} {"train_loss": -5.141967296600342, "global_step": 10110, "epoch": 240} {"train_loss": -5.022268295288086, "global_step": 10111, "epoch": 240} {"train_loss": -5.072787284851074, "global_step": 10112, "epoch": 240} {"train_loss": -5.059431076049805, "global_step": 10113, "epoch": 240} {"train_loss": -5.016737937927246, "global_step": 10114, "epoch": 240} {"train_loss": -4.936675071716309, "global_step": 10115, "epoch": 240} {"train_loss": -5.125808238983154, "global_step": 10116, "epoch": 240} {"train_loss": -5.053204536437988, "global_step": 10117, "epoch": 240} {"train_loss": -5.113486289978027, "global_step": 10118, "epoch": 240} {"train_loss": -5.056066513061523, "global_step": 10119, "epoch": 240} {"train_loss": -4.965188980102539, "global_step": 10120, "epoch": 240} {"train_loss": -5.03212004616147, "global_step": 10121, "epoch": 240, "val_loss": 71278.5} {"train_loss": -4.958395957946777, "global_step": 10122, "epoch": 241} {"train_loss": -4.908974647521973, "global_step": 10123, "epoch": 241} {"train_loss": -5.050684928894043, "global_step": 10124, "epoch": 241} {"train_loss": -5.071589469909668, "global_step": 10125, "epoch": 241} {"train_loss": -4.939728736877441, "global_step": 10126, "epoch": 241} {"train_loss": -4.884965419769287, "global_step": 10127, "epoch": 241} {"train_loss": -5.1250481605529785, "global_step": 10128, "epoch": 241} {"train_loss": -4.872699737548828, "global_step": 10129, "epoch": 241} {"train_loss": -5.0412092208862305, "global_step": 10130, "epoch": 241} {"train_loss": -5.038771152496338, "global_step": 10131, "epoch": 241} {"train_loss": -4.945420265197754, "global_step": 10132, "epoch": 241} {"train_loss": -5.190629005432129, "global_step": 10133, "epoch": 241} {"train_loss": -4.969120979309082, "global_step": 10134, "epoch": 241} {"train_loss": -4.868567943572998, "global_step": 10135, "epoch": 241} {"train_loss": -5.063105583190918, "global_step": 10136, "epoch": 241} {"train_loss": -4.923968315124512, "global_step": 10137, "epoch": 241} {"train_loss": -5.033864498138428, "global_step": 10138, "epoch": 241} {"train_loss": -5.079143524169922, "global_step": 10139, "epoch": 241} {"train_loss": -4.946006774902344, "global_step": 10140, "epoch": 241} {"train_loss": -5.020019054412842, "global_step": 10141, "epoch": 241} {"train_loss": -4.996995449066162, "global_step": 10142, "epoch": 241} {"train_loss": -5.0030317306518555, "global_step": 10143, "epoch": 241} {"train_loss": -5.124733924865723, "global_step": 10144, "epoch": 241} {"train_loss": -5.063997745513916, "global_step": 10145, "epoch": 241} {"train_loss": -4.942823886871338, "global_step": 10146, "epoch": 241} {"train_loss": -5.0020341873168945, "global_step": 10147, "epoch": 241} {"train_loss": -5.0250325202941895, "global_step": 10148, "epoch": 241} {"train_loss": -5.175427436828613, "global_step": 10149, "epoch": 241} {"train_loss": -5.004878520965576, "global_step": 10150, "epoch": 241} {"train_loss": -5.107080459594727, "global_step": 10151, "epoch": 241} {"train_loss": -5.082376480102539, "global_step": 10152, "epoch": 241} {"train_loss": -5.103763580322266, "global_step": 10153, "epoch": 241} {"train_loss": -5.10732889175415, "global_step": 10154, "epoch": 241} {"train_loss": -5.013433456420898, "global_step": 10155, "epoch": 241} {"train_loss": -5.112792491912842, "global_step": 10156, "epoch": 241} {"train_loss": -4.955183982849121, "global_step": 10157, "epoch": 241} {"train_loss": -5.013624668121338, "global_step": 10158, "epoch": 241} {"train_loss": -4.822312355041504, "global_step": 10159, "epoch": 241} {"train_loss": -4.909785270690918, "global_step": 10160, "epoch": 241} {"train_loss": -5.100196838378906, "global_step": 10161, "epoch": 241} {"train_loss": -4.948422431945801, "global_step": 10162, "epoch": 241} {"train_loss": -5.013437906901042, "global_step": 10163, "epoch": 241, "val_loss": 70847.1015625} {"train_loss": -5.065412998199463, "global_step": 10164, "epoch": 242} {"train_loss": -5.134148120880127, "global_step": 10165, "epoch": 242} {"train_loss": -5.102993011474609, "global_step": 10166, "epoch": 242} {"train_loss": -5.050002574920654, "global_step": 10167, "epoch": 242} {"train_loss": -5.121363639831543, "global_step": 10168, "epoch": 242} {"train_loss": -4.968049049377441, "global_step": 10169, "epoch": 242} {"train_loss": -5.120144844055176, "global_step": 10170, "epoch": 242} {"train_loss": -5.1178202629089355, "global_step": 10171, "epoch": 242} {"train_loss": -5.210086822509766, "global_step": 10172, "epoch": 242} {"train_loss": -5.08071231842041, "global_step": 10173, "epoch": 242} {"train_loss": -4.973240852355957, "global_step": 10174, "epoch": 242} {"train_loss": -5.030896186828613, "global_step": 10175, "epoch": 242} {"train_loss": -5.059617042541504, "global_step": 10176, "epoch": 242} {"train_loss": -5.120264053344727, "global_step": 10177, "epoch": 242} {"train_loss": -5.154145240783691, "global_step": 10178, "epoch": 242} {"train_loss": -5.04020881652832, "global_step": 10179, "epoch": 242} {"train_loss": -5.019634246826172, "global_step": 10180, "epoch": 242} {"train_loss": -5.1629638671875, "global_step": 10181, "epoch": 242} {"train_loss": -4.986071586608887, "global_step": 10182, "epoch": 242} {"train_loss": -4.9980645179748535, "global_step": 10183, "epoch": 242} {"train_loss": -5.026636123657227, "global_step": 10184, "epoch": 242} {"train_loss": -5.123073577880859, "global_step": 10185, "epoch": 242} {"train_loss": -5.1108269691467285, "global_step": 10186, "epoch": 242} {"train_loss": -4.985361099243164, "global_step": 10187, "epoch": 242} {"train_loss": -5.0993523597717285, "global_step": 10188, "epoch": 242} {"train_loss": -5.140058517456055, "global_step": 10189, "epoch": 242} {"train_loss": -5.138008117675781, "global_step": 10190, "epoch": 242} {"train_loss": -5.101992130279541, "global_step": 10191, "epoch": 242} {"train_loss": -4.998704433441162, "global_step": 10192, "epoch": 242} {"train_loss": -5.051090240478516, "global_step": 10193, "epoch": 242} {"train_loss": -4.96311092376709, "global_step": 10194, "epoch": 242} {"train_loss": -5.192860126495361, "global_step": 10195, "epoch": 242} {"train_loss": -4.98968505859375, "global_step": 10196, "epoch": 242} {"train_loss": -4.8852152824401855, "global_step": 10197, "epoch": 242} {"train_loss": -4.890070915222168, "global_step": 10198, "epoch": 242} {"train_loss": -5.0102434158325195, "global_step": 10199, "epoch": 242} {"train_loss": -4.922396659851074, "global_step": 10200, "epoch": 242} {"train_loss": -5.0114874839782715, "global_step": 10201, "epoch": 242} {"train_loss": -5.155895233154297, "global_step": 10202, "epoch": 242} {"train_loss": -5.032217979431152, "global_step": 10203, "epoch": 242} {"train_loss": -5.137296199798584, "global_step": 10204, "epoch": 242} {"train_loss": -5.057743163335891, "global_step": 10205, "epoch": 242, "val_loss": 71235.46875} {"train_loss": -5.017754554748535, "global_step": 10206, "epoch": 243} {"train_loss": -5.129551887512207, "global_step": 10207, "epoch": 243} {"train_loss": -5.066318511962891, "global_step": 10208, "epoch": 243} {"train_loss": -4.977227210998535, "global_step": 10209, "epoch": 243} {"train_loss": -5.144388198852539, "global_step": 10210, "epoch": 243} {"train_loss": -4.938513278961182, "global_step": 10211, "epoch": 243} {"train_loss": -5.033725738525391, "global_step": 10212, "epoch": 243} {"train_loss": -5.060054779052734, "global_step": 10213, "epoch": 243} {"train_loss": -5.008664131164551, "global_step": 10214, "epoch": 243} {"train_loss": -4.963812828063965, "global_step": 10215, "epoch": 243} {"train_loss": -5.0353684425354, "global_step": 10216, "epoch": 243} {"train_loss": -5.030298233032227, "global_step": 10217, "epoch": 243} {"train_loss": -4.857119560241699, "global_step": 10218, "epoch": 243} {"train_loss": -4.954305648803711, "global_step": 10219, "epoch": 243} {"train_loss": -4.997932434082031, "global_step": 10220, "epoch": 243} {"train_loss": -4.934319496154785, "global_step": 10221, "epoch": 243} {"train_loss": -5.143691062927246, "global_step": 10222, "epoch": 243} {"train_loss": -5.025972843170166, "global_step": 10223, "epoch": 243} {"train_loss": -5.049124717712402, "global_step": 10224, "epoch": 243} {"train_loss": -5.119296550750732, "global_step": 10225, "epoch": 243} {"train_loss": -5.0847249031066895, "global_step": 10226, "epoch": 243} {"train_loss": -5.140719413757324, "global_step": 10227, "epoch": 243} {"train_loss": -5.089602470397949, "global_step": 10228, "epoch": 243} {"train_loss": -5.132826328277588, "global_step": 10229, "epoch": 243} {"train_loss": -4.962601661682129, "global_step": 10230, "epoch": 243} {"train_loss": -5.04620361328125, "global_step": 10231, "epoch": 243} {"train_loss": -5.074620723724365, "global_step": 10232, "epoch": 243} {"train_loss": -5.055211544036865, "global_step": 10233, "epoch": 243} {"train_loss": -5.013113021850586, "global_step": 10234, "epoch": 243} {"train_loss": -5.089203357696533, "global_step": 10235, "epoch": 243} {"train_loss": -5.036701202392578, "global_step": 10236, "epoch": 243} {"train_loss": -5.0248260498046875, "global_step": 10237, "epoch": 243} {"train_loss": -4.990663051605225, "global_step": 10238, "epoch": 243} {"train_loss": -4.9676995277404785, "global_step": 10239, "epoch": 243} {"train_loss": -5.03122615814209, "global_step": 10240, "epoch": 243} {"train_loss": -5.102651596069336, "global_step": 10241, "epoch": 243} {"train_loss": -5.13453483581543, "global_step": 10242, "epoch": 243} {"train_loss": -5.066045761108398, "global_step": 10243, "epoch": 243} {"train_loss": -5.080993175506592, "global_step": 10244, "epoch": 243} {"train_loss": -5.005626678466797, "global_step": 10245, "epoch": 243} {"train_loss": -4.998218536376953, "global_step": 10246, "epoch": 243} {"train_loss": -5.0394325142815, "global_step": 10247, "epoch": 243, "val_loss": 70426.828125} {"train_loss": -5.151932239532471, "global_step": 10248, "epoch": 244} {"train_loss": -5.125060081481934, "global_step": 10249, "epoch": 244} {"train_loss": -5.207706451416016, "global_step": 10250, "epoch": 244} {"train_loss": -4.976666450500488, "global_step": 10251, "epoch": 244} {"train_loss": -5.077241897583008, "global_step": 10252, "epoch": 244} {"train_loss": -5.008990287780762, "global_step": 10253, "epoch": 244} {"train_loss": -5.116119384765625, "global_step": 10254, "epoch": 244} {"train_loss": -4.833286285400391, "global_step": 10255, "epoch": 244} {"train_loss": -5.004035472869873, "global_step": 10256, "epoch": 244} {"train_loss": -5.110344409942627, "global_step": 10257, "epoch": 244} {"train_loss": -5.110713958740234, "global_step": 10258, "epoch": 244} {"train_loss": -4.876060485839844, "global_step": 10259, "epoch": 244} {"train_loss": -4.936324119567871, "global_step": 10260, "epoch": 244} {"train_loss": -5.083022117614746, "global_step": 10261, "epoch": 244} {"train_loss": -4.884208679199219, "global_step": 10262, "epoch": 244} {"train_loss": -4.902997970581055, "global_step": 10263, "epoch": 244} {"train_loss": -4.987425327301025, "global_step": 10264, "epoch": 244} {"train_loss": -5.080511569976807, "global_step": 10265, "epoch": 244} {"train_loss": -5.117098808288574, "global_step": 10266, "epoch": 244} {"train_loss": -5.121041297912598, "global_step": 10267, "epoch": 244} {"train_loss": -5.0333099365234375, "global_step": 10268, "epoch": 244} {"train_loss": -5.015233039855957, "global_step": 10269, "epoch": 244} {"train_loss": -4.9635748863220215, "global_step": 10270, "epoch": 244} {"train_loss": -4.872312545776367, "global_step": 10271, "epoch": 244} {"train_loss": -4.986610412597656, "global_step": 10272, "epoch": 244} {"train_loss": -4.937410354614258, "global_step": 10273, "epoch": 244} {"train_loss": -4.9712324142456055, "global_step": 10274, "epoch": 244} {"train_loss": -5.125619888305664, "global_step": 10275, "epoch": 244} {"train_loss": -5.10578727722168, "global_step": 10276, "epoch": 244} {"train_loss": -5.051836013793945, "global_step": 10277, "epoch": 244} {"train_loss": -4.957610130310059, "global_step": 10278, "epoch": 244} {"train_loss": -4.868025779724121, "global_step": 10279, "epoch": 244} {"train_loss": -4.917422771453857, "global_step": 10280, "epoch": 244} {"train_loss": -5.197532653808594, "global_step": 10281, "epoch": 244} {"train_loss": -5.025881767272949, "global_step": 10282, "epoch": 244} {"train_loss": -5.092121124267578, "global_step": 10283, "epoch": 244} {"train_loss": -4.937554359436035, "global_step": 10284, "epoch": 244} {"train_loss": -5.026473522186279, "global_step": 10285, "epoch": 244} {"train_loss": -5.023792266845703, "global_step": 10286, "epoch": 244} {"train_loss": -5.06593132019043, "global_step": 10287, "epoch": 244} {"train_loss": -5.0185322761535645, "global_step": 10288, "epoch": 244} {"train_loss": -5.022161824362619, "global_step": 10289, "epoch": 244, "val_loss": 70944.0546875} {"train_loss": -5.063158988952637, "global_step": 10290, "epoch": 245} {"train_loss": -5.061497688293457, "global_step": 10291, "epoch": 245} {"train_loss": -5.063873291015625, "global_step": 10292, "epoch": 245} {"train_loss": -5.181084156036377, "global_step": 10293, "epoch": 245} {"train_loss": -5.282814979553223, "global_step": 10294, "epoch": 245} {"train_loss": -5.183426856994629, "global_step": 10295, "epoch": 245} {"train_loss": -5.101827144622803, "global_step": 10296, "epoch": 245} {"train_loss": -5.05666446685791, "global_step": 10297, "epoch": 245} {"train_loss": -4.99941873550415, "global_step": 10298, "epoch": 245} {"train_loss": -4.895877361297607, "global_step": 10299, "epoch": 245} {"train_loss": -5.0378522872924805, "global_step": 10300, "epoch": 245} {"train_loss": -5.066742897033691, "global_step": 10301, "epoch": 245} {"train_loss": -5.0363569259643555, "global_step": 10302, "epoch": 245} {"train_loss": -5.0459394454956055, "global_step": 10303, "epoch": 245} {"train_loss": -4.927233695983887, "global_step": 10304, "epoch": 245} {"train_loss": -4.866046905517578, "global_step": 10305, "epoch": 245} {"train_loss": -5.105085372924805, "global_step": 10306, "epoch": 245} {"train_loss": -4.672336578369141, "global_step": 10307, "epoch": 245} {"train_loss": -4.842514991760254, "global_step": 10308, "epoch": 245} {"train_loss": -4.914340019226074, "global_step": 10309, "epoch": 245} {"train_loss": -4.899861812591553, "global_step": 10310, "epoch": 245} {"train_loss": -5.093438148498535, "global_step": 10311, "epoch": 245} {"train_loss": -5.050221920013428, "global_step": 10312, "epoch": 245} {"train_loss": -5.1138410568237305, "global_step": 10313, "epoch": 245} {"train_loss": -5.10732364654541, "global_step": 10314, "epoch": 245} {"train_loss": -4.996208190917969, "global_step": 10315, "epoch": 245} {"train_loss": -4.895623683929443, "global_step": 10316, "epoch": 245} {"train_loss": -5.033537864685059, "global_step": 10317, "epoch": 245} {"train_loss": -5.00371789932251, "global_step": 10318, "epoch": 245} {"train_loss": -5.027057647705078, "global_step": 10319, "epoch": 245} {"train_loss": -5.0435261726379395, "global_step": 10320, "epoch": 245} {"train_loss": -4.861607551574707, "global_step": 10321, "epoch": 245} {"train_loss": -5.075894832611084, "global_step": 10322, "epoch": 245} {"train_loss": -4.943625450134277, "global_step": 10323, "epoch": 245} {"train_loss": -4.829654216766357, "global_step": 10324, "epoch": 245} {"train_loss": -4.961557388305664, "global_step": 10325, "epoch": 245} {"train_loss": -5.13093376159668, "global_step": 10326, "epoch": 245} {"train_loss": -5.065032958984375, "global_step": 10327, "epoch": 245} {"train_loss": -4.8918657302856445, "global_step": 10328, "epoch": 245} {"train_loss": -4.972586631774902, "global_step": 10329, "epoch": 245} {"train_loss": -5.098211288452148, "global_step": 10330, "epoch": 245} {"train_loss": -5.008354879560924, "global_step": 10331, "epoch": 245, "val_loss": 70679.1015625} {"train_loss": -5.205011367797852, "global_step": 10332, "epoch": 246} {"train_loss": -4.988473415374756, "global_step": 10333, "epoch": 246} {"train_loss": -5.192281723022461, "global_step": 10334, "epoch": 246} {"train_loss": -4.907941818237305, "global_step": 10335, "epoch": 246} {"train_loss": -5.110045909881592, "global_step": 10336, "epoch": 246} {"train_loss": -5.024375915527344, "global_step": 10337, "epoch": 246} {"train_loss": -5.139255523681641, "global_step": 10338, "epoch": 246} {"train_loss": -4.993457794189453, "global_step": 10339, "epoch": 246} {"train_loss": -5.053714275360107, "global_step": 10340, "epoch": 246} {"train_loss": -5.106970310211182, "global_step": 10341, "epoch": 246} {"train_loss": -4.996572971343994, "global_step": 10342, "epoch": 246} {"train_loss": -4.919872283935547, "global_step": 10343, "epoch": 246} {"train_loss": -5.102611064910889, "global_step": 10344, "epoch": 246} {"train_loss": -4.888028621673584, "global_step": 10345, "epoch": 246} {"train_loss": -5.132345199584961, "global_step": 10346, "epoch": 246} {"train_loss": -5.010490417480469, "global_step": 10347, "epoch": 246} {"train_loss": -4.998625755310059, "global_step": 10348, "epoch": 246} {"train_loss": -5.101708889007568, "global_step": 10349, "epoch": 246} {"train_loss": -5.161892890930176, "global_step": 10350, "epoch": 246} {"train_loss": -5.0583295822143555, "global_step": 10351, "epoch": 246} {"train_loss": -4.847377777099609, "global_step": 10352, "epoch": 246} {"train_loss": -5.00766134262085, "global_step": 10353, "epoch": 246} {"train_loss": -4.995619773864746, "global_step": 10354, "epoch": 246} {"train_loss": -5.045607566833496, "global_step": 10355, "epoch": 246} {"train_loss": -4.8837080001831055, "global_step": 10356, "epoch": 246} {"train_loss": -5.0758209228515625, "global_step": 10357, "epoch": 246} {"train_loss": -5.044924736022949, "global_step": 10358, "epoch": 246} {"train_loss": -5.011284351348877, "global_step": 10359, "epoch": 246} {"train_loss": -5.139914035797119, "global_step": 10360, "epoch": 246} {"train_loss": -5.1127214431762695, "global_step": 10361, "epoch": 246} {"train_loss": -5.069847583770752, "global_step": 10362, "epoch": 246} {"train_loss": -5.228395462036133, "global_step": 10363, "epoch": 246} {"train_loss": -5.053576469421387, "global_step": 10364, "epoch": 246} {"train_loss": -5.048409938812256, "global_step": 10365, "epoch": 246} {"train_loss": -5.002190113067627, "global_step": 10366, "epoch": 246} {"train_loss": -4.697620868682861, "global_step": 10367, "epoch": 246} {"train_loss": -5.077632904052734, "global_step": 10368, "epoch": 246} {"train_loss": -5.186168193817139, "global_step": 10369, "epoch": 246} {"train_loss": -5.12012243270874, "global_step": 10370, "epoch": 246} {"train_loss": -5.081374168395996, "global_step": 10371, "epoch": 246} {"train_loss": -5.08104133605957, "global_step": 10372, "epoch": 246} {"train_loss": -5.050605966931298, "global_step": 10373, "epoch": 246, "val_loss": 70415.46875} {"train_loss": -4.979709148406982, "global_step": 10374, "epoch": 247} {"train_loss": -5.042856693267822, "global_step": 10375, "epoch": 247} {"train_loss": -5.1236677169799805, "global_step": 10376, "epoch": 247} {"train_loss": -5.204605579376221, "global_step": 10377, "epoch": 247} {"train_loss": -5.163081645965576, "global_step": 10378, "epoch": 247} {"train_loss": -5.086705684661865, "global_step": 10379, "epoch": 247} {"train_loss": -5.024569511413574, "global_step": 10380, "epoch": 247} {"train_loss": -5.050209045410156, "global_step": 10381, "epoch": 247} {"train_loss": -5.091862678527832, "global_step": 10382, "epoch": 247} {"train_loss": -5.038860321044922, "global_step": 10383, "epoch": 247} {"train_loss": -5.08233642578125, "global_step": 10384, "epoch": 247} {"train_loss": -5.118468284606934, "global_step": 10385, "epoch": 247} {"train_loss": -4.9879231452941895, "global_step": 10386, "epoch": 247} {"train_loss": -4.950878620147705, "global_step": 10387, "epoch": 247} {"train_loss": -5.106036186218262, "global_step": 10388, "epoch": 247} {"train_loss": -5.002135276794434, "global_step": 10389, "epoch": 247} {"train_loss": -4.902328968048096, "global_step": 10390, "epoch": 247} {"train_loss": -4.924835205078125, "global_step": 10391, "epoch": 247} {"train_loss": -5.051412582397461, "global_step": 10392, "epoch": 247} {"train_loss": -5.020860195159912, "global_step": 10393, "epoch": 247} {"train_loss": -5.089362144470215, "global_step": 10394, "epoch": 247} {"train_loss": -5.165999412536621, "global_step": 10395, "epoch": 247} {"train_loss": -5.132050037384033, "global_step": 10396, "epoch": 247} {"train_loss": -5.189185619354248, "global_step": 10397, "epoch": 247} {"train_loss": -5.123011589050293, "global_step": 10398, "epoch": 247} {"train_loss": -5.046469688415527, "global_step": 10399, "epoch": 247} {"train_loss": -5.2126054763793945, "global_step": 10400, "epoch": 247} {"train_loss": -5.111225128173828, "global_step": 10401, "epoch": 247} {"train_loss": -5.0725908279418945, "global_step": 10402, "epoch": 247} {"train_loss": -5.128855228424072, "global_step": 10403, "epoch": 247} {"train_loss": -5.066731929779053, "global_step": 10404, "epoch": 247} {"train_loss": -5.121650695800781, "global_step": 10405, "epoch": 247} {"train_loss": -5.153785705566406, "global_step": 10406, "epoch": 247} {"train_loss": -5.091788291931152, "global_step": 10407, "epoch": 247} {"train_loss": -4.94721794128418, "global_step": 10408, "epoch": 247} {"train_loss": -5.133217811584473, "global_step": 10409, "epoch": 247} {"train_loss": -5.099137783050537, "global_step": 10410, "epoch": 247} {"train_loss": -5.0609564781188965, "global_step": 10411, "epoch": 247} {"train_loss": -5.021612167358398, "global_step": 10412, "epoch": 247} {"train_loss": -5.125515460968018, "global_step": 10413, "epoch": 247} {"train_loss": -5.080200672149658, "global_step": 10414, "epoch": 247} {"train_loss": -5.078507639112926, "global_step": 10415, "epoch": 247, "val_loss": 70705.1015625} {"train_loss": -5.131646633148193, "global_step": 10416, "epoch": 248} {"train_loss": -5.192793369293213, "global_step": 10417, "epoch": 248} {"train_loss": -5.038022041320801, "global_step": 10418, "epoch": 248} {"train_loss": -5.005415439605713, "global_step": 10419, "epoch": 248} {"train_loss": -5.127179145812988, "global_step": 10420, "epoch": 248} {"train_loss": -5.033383846282959, "global_step": 10421, "epoch": 248} {"train_loss": -5.135545253753662, "global_step": 10422, "epoch": 248} {"train_loss": -5.061245441436768, "global_step": 10423, "epoch": 248} {"train_loss": -4.925358772277832, "global_step": 10424, "epoch": 248} {"train_loss": -4.645411491394043, "global_step": 10425, "epoch": 248} {"train_loss": -4.9787492752075195, "global_step": 10426, "epoch": 248} {"train_loss": -4.93080997467041, "global_step": 10427, "epoch": 248} {"train_loss": -4.740786075592041, "global_step": 10428, "epoch": 248} {"train_loss": -5.192183494567871, "global_step": 10429, "epoch": 248} {"train_loss": -4.911958694458008, "global_step": 10430, "epoch": 248} {"train_loss": -4.919765472412109, "global_step": 10431, "epoch": 248} {"train_loss": -4.991538047790527, "global_step": 10432, "epoch": 248} {"train_loss": -4.926151752471924, "global_step": 10433, "epoch": 248} {"train_loss": -5.08250093460083, "global_step": 10434, "epoch": 248} {"train_loss": -4.978858947753906, "global_step": 10435, "epoch": 248} {"train_loss": -5.000050067901611, "global_step": 10436, "epoch": 248} {"train_loss": -5.107223987579346, "global_step": 10437, "epoch": 248} {"train_loss": -5.001408576965332, "global_step": 10438, "epoch": 248} {"train_loss": -5.123403072357178, "global_step": 10439, "epoch": 248} {"train_loss": -5.058603286743164, "global_step": 10440, "epoch": 248} {"train_loss": -5.181879043579102, "global_step": 10441, "epoch": 248} {"train_loss": -5.119283199310303, "global_step": 10442, "epoch": 248} {"train_loss": -4.999101161956787, "global_step": 10443, "epoch": 248} {"train_loss": -5.050524711608887, "global_step": 10444, "epoch": 248} {"train_loss": -5.10875129699707, "global_step": 10445, "epoch": 248} {"train_loss": -5.127317428588867, "global_step": 10446, "epoch": 248} {"train_loss": -5.136130332946777, "global_step": 10447, "epoch": 248} {"train_loss": -5.1833977699279785, "global_step": 10448, "epoch": 248} {"train_loss": -5.054672718048096, "global_step": 10449, "epoch": 248} {"train_loss": -5.103636741638184, "global_step": 10450, "epoch": 248} {"train_loss": -5.091492176055908, "global_step": 10451, "epoch": 248} {"train_loss": -4.859580993652344, "global_step": 10452, "epoch": 248} {"train_loss": -5.049046993255615, "global_step": 10453, "epoch": 248} {"train_loss": -5.143534183502197, "global_step": 10454, "epoch": 248} {"train_loss": -4.842257499694824, "global_step": 10455, "epoch": 248} {"train_loss": -5.1872382164001465, "global_step": 10456, "epoch": 248} {"train_loss": -5.037303572609311, "global_step": 10457, "epoch": 248, "val_loss": 71154.015625} {"train_loss": -4.91973876953125, "global_step": 10458, "epoch": 249} {"train_loss": -5.0819172859191895, "global_step": 10459, "epoch": 249} {"train_loss": -5.022805690765381, "global_step": 10460, "epoch": 249} {"train_loss": -5.1456451416015625, "global_step": 10461, "epoch": 249} {"train_loss": -4.993992328643799, "global_step": 10462, "epoch": 249} {"train_loss": -4.996124267578125, "global_step": 10463, "epoch": 249} {"train_loss": -5.07766056060791, "global_step": 10464, "epoch": 249} {"train_loss": -4.950685024261475, "global_step": 10465, "epoch": 249} {"train_loss": -5.0134077072143555, "global_step": 10466, "epoch": 249} {"train_loss": -5.039235591888428, "global_step": 10467, "epoch": 249} {"train_loss": -5.123510837554932, "global_step": 10468, "epoch": 249} {"train_loss": -5.140420913696289, "global_step": 10469, "epoch": 249} {"train_loss": -4.864035129547119, "global_step": 10470, "epoch": 249} {"train_loss": -4.973899841308594, "global_step": 10471, "epoch": 249} {"train_loss": -5.022783279418945, "global_step": 10472, "epoch": 249} {"train_loss": -4.978166103363037, "global_step": 10473, "epoch": 249} {"train_loss": -5.210129261016846, "global_step": 10474, "epoch": 249} {"train_loss": -5.020175933837891, "global_step": 10475, "epoch": 249} {"train_loss": -4.832176208496094, "global_step": 10476, "epoch": 249} {"train_loss": -5.037136554718018, "global_step": 10477, "epoch": 249} {"train_loss": -5.007115364074707, "global_step": 10478, "epoch": 249} {"train_loss": -5.046394348144531, "global_step": 10479, "epoch": 249} {"train_loss": -5.042867660522461, "global_step": 10480, "epoch": 249} {"train_loss": -4.9397077560424805, "global_step": 10481, "epoch": 249} {"train_loss": -5.029751300811768, "global_step": 10482, "epoch": 249} {"train_loss": -4.947259902954102, "global_step": 10483, "epoch": 249} {"train_loss": -5.029550552368164, "global_step": 10484, "epoch": 249} {"train_loss": -5.009671211242676, "global_step": 10485, "epoch": 249} {"train_loss": -4.939716815948486, "global_step": 10486, "epoch": 249} {"train_loss": -5.01863956451416, "global_step": 10487, "epoch": 249} {"train_loss": -5.1507568359375, "global_step": 10488, "epoch": 249} {"train_loss": -5.025688171386719, "global_step": 10489, "epoch": 249} {"train_loss": -5.078917026519775, "global_step": 10490, "epoch": 249} {"train_loss": -5.075058937072754, "global_step": 10491, "epoch": 249} {"train_loss": -5.102797508239746, "global_step": 10492, "epoch": 249} {"train_loss": -4.984387397766113, "global_step": 10493, "epoch": 249} {"train_loss": -4.893843650817871, "global_step": 10494, "epoch": 249} {"train_loss": -4.999837398529053, "global_step": 10495, "epoch": 249} {"train_loss": -5.057074546813965, "global_step": 10496, "epoch": 249} {"train_loss": -4.954410076141357, "global_step": 10497, "epoch": 249} {"train_loss": -5.015440940856934, "global_step": 10498, "epoch": 249} {"train_loss": -5.018630561374483, "global_step": 10499, "epoch": 249, "val_loss": 71017.6328125} {"train_loss": -4.977858543395996, "global_step": 10500, "epoch": 250} {"train_loss": -4.984460353851318, "global_step": 10501, "epoch": 250} {"train_loss": -5.165711402893066, "global_step": 10502, "epoch": 250} {"train_loss": -5.183821678161621, "global_step": 10503, "epoch": 250} {"train_loss": -5.089992046356201, "global_step": 10504, "epoch": 250} {"train_loss": -5.0047688484191895, "global_step": 10505, "epoch": 250} {"train_loss": -5.14918327331543, "global_step": 10506, "epoch": 250} {"train_loss": -5.063599586486816, "global_step": 10507, "epoch": 250} {"train_loss": -5.060764312744141, "global_step": 10508, "epoch": 250} {"train_loss": -4.923171043395996, "global_step": 10509, "epoch": 250} {"train_loss": -5.093204498291016, "global_step": 10510, "epoch": 250} {"train_loss": -5.003704071044922, "global_step": 10511, "epoch": 250} {"train_loss": -5.134382247924805, "global_step": 10512, "epoch": 250} {"train_loss": -5.064383029937744, "global_step": 10513, "epoch": 250} {"train_loss": -5.097109317779541, "global_step": 10514, "epoch": 250} {"train_loss": -5.203706741333008, "global_step": 10515, "epoch": 250} {"train_loss": -5.0236663818359375, "global_step": 10516, "epoch": 250} {"train_loss": -5.051214218139648, "global_step": 10517, "epoch": 250} {"train_loss": -5.049783706665039, "global_step": 10518, "epoch": 250} {"train_loss": -5.029421329498291, "global_step": 10519, "epoch": 250} {"train_loss": -5.11552619934082, "global_step": 10520, "epoch": 250} {"train_loss": -5.177098274230957, "global_step": 10521, "epoch": 250} {"train_loss": -5.061646461486816, "global_step": 10522, "epoch": 250} {"train_loss": -5.051630020141602, "global_step": 10523, "epoch": 250} {"train_loss": -5.094508171081543, "global_step": 10524, "epoch": 250} {"train_loss": -5.092555999755859, "global_step": 10525, "epoch": 250} {"train_loss": -4.779852390289307, "global_step": 10526, "epoch": 250} {"train_loss": -4.9361891746521, "global_step": 10527, "epoch": 250} {"train_loss": -5.0382561683654785, "global_step": 10528, "epoch": 250} {"train_loss": -4.807140350341797, "global_step": 10529, "epoch": 250} {"train_loss": -4.888049125671387, "global_step": 10530, "epoch": 250} {"train_loss": -5.042610168457031, "global_step": 10531, "epoch": 250} {"train_loss": -5.250932693481445, "global_step": 10532, "epoch": 250} {"train_loss": -4.904389381408691, "global_step": 10533, "epoch": 250} {"train_loss": -5.0851874351501465, "global_step": 10534, "epoch": 250} {"train_loss": -4.993402481079102, "global_step": 10535, "epoch": 250} {"train_loss": -5.044214248657227, "global_step": 10536, "epoch": 250} {"train_loss": -5.0767621994018555, "global_step": 10537, "epoch": 250} {"train_loss": -4.911397933959961, "global_step": 10538, "epoch": 250} {"train_loss": -5.027194023132324, "global_step": 10539, "epoch": 250} {"train_loss": -5.003540992736816, "global_step": 10540, "epoch": 250} {"train_loss": -5.044253099532354, "global_step": 10541, "epoch": 250, "train/sim_max_reward_0": 0.45171215442188084, "train/sim_max_reward_1": 0.09227727667750892, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.027789540685877006, "train/sim_max_reward_4": 0.16827808423824636, "train/sim_max_reward_5": 0.5389366153493004, "test/sim_max_reward_4300000": 0.16052584494130281, "test/sim_max_reward_4300001": 0.11040222298838198, "test/sim_max_reward_4300002": 0.2020777294251233, "test/sim_max_reward_4300003": 0.30672526811954937, "test/sim_max_reward_4300004": 0.8194230191844276, "test/sim_max_reward_4300005": 0.1777831566362923, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.4056907279296584, "test/sim_max_reward_4300008": 0.0, "test/sim_max_reward_4300009": 0.030231373978292127, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.1193775321576803, "test/sim_max_reward_4300012": 0.3895087549213664, "test/sim_max_reward_4300013": 0.40696453060518933, "test/sim_max_reward_4300014": 0.4015574859126985, "test/sim_max_reward_4300015": 0.26217830500475087, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.12840223876894113, "test/sim_max_reward_4300018": 0.0, "test/sim_max_reward_4300019": 0.185046968779379, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.2691145024774011, "test/sim_max_reward_4300022": 0.034310507912677715, "test/sim_max_reward_4300023": 0.2057529789273333, "test/sim_max_reward_4300024": 0.27755674161259575, "test/sim_max_reward_4300025": 0.32296331078070006, "test/sim_max_reward_4300026": 0.671195584967275, "test/sim_max_reward_4300027": 2.1069658945713764e-05, "test/sim_max_reward_4300028": 4.1466577934108704e-05, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.24851642628578416, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.43259806130716233, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.4303571749392499, "test/sim_max_reward_4300037": 0.5527122599440878, "test/sim_max_reward_4300038": 0.24713777349324995, "test/sim_max_reward_4300039": 0.018002034542211644, "test/sim_max_reward_4300040": 0.14926551129157645, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.3207614496330381, "test/sim_max_reward_4300043": 0.30374113293775296, "test/sim_max_reward_4300044": 0.08949017026976878, "test/sim_max_reward_4300045": 0.24015585323382113, "test/sim_max_reward_4300046": 0.06056981559363221, "test/sim_max_reward_4300047": 0.25969494031096396, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.21316561189546893, "test/mean_score": 0.18848872480399698, "val_loss": 71447.390625} {"train_loss": -4.987406253814697, "global_step": 10542, "epoch": 251} {"train_loss": -4.970825672149658, "global_step": 10543, "epoch": 251} {"train_loss": -4.982627868652344, "global_step": 10544, "epoch": 251} {"train_loss": -4.850805282592773, "global_step": 10545, "epoch": 251} {"train_loss": -5.102459907531738, "global_step": 10546, "epoch": 251} {"train_loss": -4.912130832672119, "global_step": 10547, "epoch": 251} {"train_loss": -4.933872222900391, "global_step": 10548, "epoch": 251} {"train_loss": -5.0719523429870605, "global_step": 10549, "epoch": 251} {"train_loss": -4.908623695373535, "global_step": 10550, "epoch": 251} {"train_loss": -4.843038082122803, "global_step": 10551, "epoch": 251} {"train_loss": -5.108658313751221, "global_step": 10552, "epoch": 251} {"train_loss": -4.968325138092041, "global_step": 10553, "epoch": 251} {"train_loss": -5.070335388183594, "global_step": 10554, "epoch": 251} {"train_loss": -5.029542922973633, "global_step": 10555, "epoch": 251} {"train_loss": -4.9933576583862305, "global_step": 10556, "epoch": 251} {"train_loss": -5.055607795715332, "global_step": 10557, "epoch": 251} {"train_loss": -4.809049606323242, "global_step": 10558, "epoch": 251} {"train_loss": -4.9995598793029785, "global_step": 10559, "epoch": 251} {"train_loss": -4.954077243804932, "global_step": 10560, "epoch": 251} {"train_loss": -5.097367286682129, "global_step": 10561, "epoch": 251} {"train_loss": -5.047260284423828, "global_step": 10562, "epoch": 251} {"train_loss": -5.0636491775512695, "global_step": 10563, "epoch": 251} {"train_loss": -5.167695045471191, "global_step": 10564, "epoch": 251} {"train_loss": -5.006763458251953, "global_step": 10565, "epoch": 251} {"train_loss": -5.13676643371582, "global_step": 10566, "epoch": 251} {"train_loss": -5.047593116760254, "global_step": 10567, "epoch": 251} {"train_loss": -5.054244041442871, "global_step": 10568, "epoch": 251} {"train_loss": -5.071497917175293, "global_step": 10569, "epoch": 251} {"train_loss": -5.127787113189697, "global_step": 10570, "epoch": 251} {"train_loss": -5.238311767578125, "global_step": 10571, "epoch": 251} {"train_loss": -5.097560405731201, "global_step": 10572, "epoch": 251} {"train_loss": -5.128528594970703, "global_step": 10573, "epoch": 251} {"train_loss": -5.168983459472656, "global_step": 10574, "epoch": 251} {"train_loss": -5.030557632446289, "global_step": 10575, "epoch": 251} {"train_loss": -4.941578388214111, "global_step": 10576, "epoch": 251} {"train_loss": -5.110755920410156, "global_step": 10577, "epoch": 251} {"train_loss": -5.127786636352539, "global_step": 10578, "epoch": 251} {"train_loss": -4.932347774505615, "global_step": 10579, "epoch": 251} {"train_loss": -5.29958438873291, "global_step": 10580, "epoch": 251} {"train_loss": -4.905633926391602, "global_step": 10581, "epoch": 251} {"train_loss": -5.040292739868164, "global_step": 10582, "epoch": 251} {"train_loss": -5.034292482194447, "global_step": 10583, "epoch": 251, "val_loss": 70199.2734375} {"train_loss": -5.20960807800293, "global_step": 10584, "epoch": 252} {"train_loss": -5.064682483673096, "global_step": 10585, "epoch": 252} {"train_loss": -5.163723468780518, "global_step": 10586, "epoch": 252} {"train_loss": -5.146594524383545, "global_step": 10587, "epoch": 252} {"train_loss": -5.122763156890869, "global_step": 10588, "epoch": 252} {"train_loss": -5.0309648513793945, "global_step": 10589, "epoch": 252} {"train_loss": -5.019437313079834, "global_step": 10590, "epoch": 252} {"train_loss": -5.044365406036377, "global_step": 10591, "epoch": 252} {"train_loss": -4.904761791229248, "global_step": 10592, "epoch": 252} {"train_loss": -5.166114330291748, "global_step": 10593, "epoch": 252} {"train_loss": -5.11448860168457, "global_step": 10594, "epoch": 252} {"train_loss": -4.820984363555908, "global_step": 10595, "epoch": 252} {"train_loss": -5.016363143920898, "global_step": 10596, "epoch": 252} {"train_loss": -5.229259014129639, "global_step": 10597, "epoch": 252} {"train_loss": -5.124085903167725, "global_step": 10598, "epoch": 252} {"train_loss": -4.971449851989746, "global_step": 10599, "epoch": 252} {"train_loss": -5.10626745223999, "global_step": 10600, "epoch": 252} {"train_loss": -5.14255428314209, "global_step": 10601, "epoch": 252} {"train_loss": -5.145153999328613, "global_step": 10602, "epoch": 252} {"train_loss": -5.035953521728516, "global_step": 10603, "epoch": 252} {"train_loss": -5.087379455566406, "global_step": 10604, "epoch": 252} {"train_loss": -4.926453590393066, "global_step": 10605, "epoch": 252} {"train_loss": -4.932952880859375, "global_step": 10606, "epoch": 252} {"train_loss": -5.093241214752197, "global_step": 10607, "epoch": 252} {"train_loss": -5.032952308654785, "global_step": 10608, "epoch": 252} {"train_loss": -4.897541046142578, "global_step": 10609, "epoch": 252} {"train_loss": -4.955704689025879, "global_step": 10610, "epoch": 252} {"train_loss": -4.998891353607178, "global_step": 10611, "epoch": 252} {"train_loss": -4.819819450378418, "global_step": 10612, "epoch": 252} {"train_loss": -4.9731292724609375, "global_step": 10613, "epoch": 252} {"train_loss": -5.12955379486084, "global_step": 10614, "epoch": 252} {"train_loss": -4.9429931640625, "global_step": 10615, "epoch": 252} {"train_loss": -4.984200477600098, "global_step": 10616, "epoch": 252} {"train_loss": -5.113166809082031, "global_step": 10617, "epoch": 252} {"train_loss": -5.092453956604004, "global_step": 10618, "epoch": 252} {"train_loss": -5.125667572021484, "global_step": 10619, "epoch": 252} {"train_loss": -5.201327800750732, "global_step": 10620, "epoch": 252} {"train_loss": -5.12158203125, "global_step": 10621, "epoch": 252} {"train_loss": -5.155653953552246, "global_step": 10622, "epoch": 252} {"train_loss": -5.008550643920898, "global_step": 10623, "epoch": 252} {"train_loss": -5.081653594970703, "global_step": 10624, "epoch": 252} {"train_loss": -5.056866044089908, "global_step": 10625, "epoch": 252, "val_loss": 71715.5390625} {"train_loss": -4.805719375610352, "global_step": 10626, "epoch": 253} {"train_loss": -5.015545845031738, "global_step": 10627, "epoch": 253} {"train_loss": -5.105116367340088, "global_step": 10628, "epoch": 253} {"train_loss": -4.936082363128662, "global_step": 10629, "epoch": 253} {"train_loss": -4.991266250610352, "global_step": 10630, "epoch": 253} {"train_loss": -5.312563419342041, "global_step": 10631, "epoch": 253} {"train_loss": -5.034334659576416, "global_step": 10632, "epoch": 253} {"train_loss": -4.9526519775390625, "global_step": 10633, "epoch": 253} {"train_loss": -5.1837358474731445, "global_step": 10634, "epoch": 253} {"train_loss": -5.168398857116699, "global_step": 10635, "epoch": 253} {"train_loss": -5.134341239929199, "global_step": 10636, "epoch": 253} {"train_loss": -5.036946773529053, "global_step": 10637, "epoch": 253} {"train_loss": -5.09088134765625, "global_step": 10638, "epoch": 253} {"train_loss": -5.011630058288574, "global_step": 10639, "epoch": 253} {"train_loss": -5.0716657638549805, "global_step": 10640, "epoch": 253} {"train_loss": -5.045392036437988, "global_step": 10641, "epoch": 253} {"train_loss": -5.104179382324219, "global_step": 10642, "epoch": 253} {"train_loss": -5.004349708557129, "global_step": 10643, "epoch": 253} {"train_loss": -4.999017715454102, "global_step": 10644, "epoch": 253} {"train_loss": -4.83973503112793, "global_step": 10645, "epoch": 253} {"train_loss": -5.046611309051514, "global_step": 10646, "epoch": 253} {"train_loss": -5.069681167602539, "global_step": 10647, "epoch": 253} {"train_loss": -4.891186714172363, "global_step": 10648, "epoch": 253} {"train_loss": -5.237922668457031, "global_step": 10649, "epoch": 253} {"train_loss": -5.1070380210876465, "global_step": 10650, "epoch": 253} {"train_loss": -5.1220927238464355, "global_step": 10651, "epoch": 253} {"train_loss": -5.121031761169434, "global_step": 10652, "epoch": 253} {"train_loss": -5.086142539978027, "global_step": 10653, "epoch": 253} {"train_loss": -5.023783206939697, "global_step": 10654, "epoch": 253} {"train_loss": -5.084410667419434, "global_step": 10655, "epoch": 253} {"train_loss": -5.111764907836914, "global_step": 10656, "epoch": 253} {"train_loss": -5.134402275085449, "global_step": 10657, "epoch": 253} {"train_loss": -4.992176055908203, "global_step": 10658, "epoch": 253} {"train_loss": -5.055330753326416, "global_step": 10659, "epoch": 253} {"train_loss": -5.029719352722168, "global_step": 10660, "epoch": 253} {"train_loss": -5.043788433074951, "global_step": 10661, "epoch": 253} {"train_loss": -5.178718566894531, "global_step": 10662, "epoch": 253} {"train_loss": -5.254240989685059, "global_step": 10663, "epoch": 253} {"train_loss": -5.049668312072754, "global_step": 10664, "epoch": 253} {"train_loss": -5.125557899475098, "global_step": 10665, "epoch": 253} {"train_loss": -5.04189395904541, "global_step": 10666, "epoch": 253} {"train_loss": -5.065668446677072, "global_step": 10667, "epoch": 253, "val_loss": 70473.3359375} {"train_loss": -5.076660633087158, "global_step": 10668, "epoch": 254} {"train_loss": -4.998095512390137, "global_step": 10669, "epoch": 254} {"train_loss": -5.063055038452148, "global_step": 10670, "epoch": 254} {"train_loss": -5.008735656738281, "global_step": 10671, "epoch": 254} {"train_loss": -5.087440013885498, "global_step": 10672, "epoch": 254} {"train_loss": -5.02390718460083, "global_step": 10673, "epoch": 254} {"train_loss": -5.001600742340088, "global_step": 10674, "epoch": 254} {"train_loss": -5.173128128051758, "global_step": 10675, "epoch": 254} {"train_loss": -5.184177398681641, "global_step": 10676, "epoch": 254} {"train_loss": -5.087512969970703, "global_step": 10677, "epoch": 254} {"train_loss": -5.081594467163086, "global_step": 10678, "epoch": 254} {"train_loss": -5.0154876708984375, "global_step": 10679, "epoch": 254} {"train_loss": -4.883647441864014, "global_step": 10680, "epoch": 254} {"train_loss": -5.20728874206543, "global_step": 10681, "epoch": 254} {"train_loss": -4.9290547370910645, "global_step": 10682, "epoch": 254} {"train_loss": -5.0661211013793945, "global_step": 10683, "epoch": 254} {"train_loss": -5.184247970581055, "global_step": 10684, "epoch": 254} {"train_loss": -5.078418731689453, "global_step": 10685, "epoch": 254} {"train_loss": -5.037421226501465, "global_step": 10686, "epoch": 254} {"train_loss": -5.11285400390625, "global_step": 10687, "epoch": 254} {"train_loss": -5.102272033691406, "global_step": 10688, "epoch": 254} {"train_loss": -5.095483303070068, "global_step": 10689, "epoch": 254} {"train_loss": -5.116814136505127, "global_step": 10690, "epoch": 254} {"train_loss": -4.957240104675293, "global_step": 10691, "epoch": 254} {"train_loss": -4.983872890472412, "global_step": 10692, "epoch": 254} {"train_loss": -5.060542106628418, "global_step": 10693, "epoch": 254} {"train_loss": -5.032215595245361, "global_step": 10694, "epoch": 254} {"train_loss": -5.059850215911865, "global_step": 10695, "epoch": 254} {"train_loss": -5.141584873199463, "global_step": 10696, "epoch": 254} {"train_loss": -4.97015380859375, "global_step": 10697, "epoch": 254} {"train_loss": -5.228309631347656, "global_step": 10698, "epoch": 254} {"train_loss": -4.984463691711426, "global_step": 10699, "epoch": 254} {"train_loss": -5.102766036987305, "global_step": 10700, "epoch": 254} {"train_loss": -5.115416526794434, "global_step": 10701, "epoch": 254} {"train_loss": -5.125672340393066, "global_step": 10702, "epoch": 254} {"train_loss": -5.085161209106445, "global_step": 10703, "epoch": 254} {"train_loss": -4.97474479675293, "global_step": 10704, "epoch": 254} {"train_loss": -4.900927543640137, "global_step": 10705, "epoch": 254} {"train_loss": -5.144892692565918, "global_step": 10706, "epoch": 254} {"train_loss": -5.164494514465332, "global_step": 10707, "epoch": 254} {"train_loss": -5.048938751220703, "global_step": 10708, "epoch": 254} {"train_loss": -5.0666668982732865, "global_step": 10709, "epoch": 254, "val_loss": 70736.234375} {"train_loss": -5.2574357986450195, "global_step": 10710, "epoch": 255} {"train_loss": -4.997976303100586, "global_step": 10711, "epoch": 255} {"train_loss": -5.148022174835205, "global_step": 10712, "epoch": 255} {"train_loss": -5.066875457763672, "global_step": 10713, "epoch": 255} {"train_loss": -5.298776149749756, "global_step": 10714, "epoch": 255} {"train_loss": -5.130166053771973, "global_step": 10715, "epoch": 255} {"train_loss": -5.1058197021484375, "global_step": 10716, "epoch": 255} {"train_loss": -4.943553924560547, "global_step": 10717, "epoch": 255} {"train_loss": -5.172297477722168, "global_step": 10718, "epoch": 255} {"train_loss": -5.072260856628418, "global_step": 10719, "epoch": 255} {"train_loss": -5.0724382400512695, "global_step": 10720, "epoch": 255} {"train_loss": -5.099609375, "global_step": 10721, "epoch": 255} {"train_loss": -5.059579849243164, "global_step": 10722, "epoch": 255} {"train_loss": -5.054055213928223, "global_step": 10723, "epoch": 255} {"train_loss": -5.060836315155029, "global_step": 10724, "epoch": 255} {"train_loss": -4.973306655883789, "global_step": 10725, "epoch": 255} {"train_loss": -5.016814231872559, "global_step": 10726, "epoch": 255} {"train_loss": -5.025212287902832, "global_step": 10727, "epoch": 255} {"train_loss": -4.964511871337891, "global_step": 10728, "epoch": 255} {"train_loss": -4.798709392547607, "global_step": 10729, "epoch": 255} {"train_loss": -4.7974443435668945, "global_step": 10730, "epoch": 255} {"train_loss": -5.079291343688965, "global_step": 10731, "epoch": 255} {"train_loss": -5.054049491882324, "global_step": 10732, "epoch": 255} {"train_loss": -4.995244979858398, "global_step": 10733, "epoch": 255} {"train_loss": -4.655532360076904, "global_step": 10734, "epoch": 255} {"train_loss": -4.989112854003906, "global_step": 10735, "epoch": 255} {"train_loss": -4.789380073547363, "global_step": 10736, "epoch": 255} {"train_loss": -4.997196197509766, "global_step": 10737, "epoch": 255} {"train_loss": -5.135507583618164, "global_step": 10738, "epoch": 255} {"train_loss": -4.921600341796875, "global_step": 10739, "epoch": 255} {"train_loss": -4.968221187591553, "global_step": 10740, "epoch": 255} {"train_loss": -5.129334449768066, "global_step": 10741, "epoch": 255} {"train_loss": -4.864053249359131, "global_step": 10742, "epoch": 255} {"train_loss": -5.136504173278809, "global_step": 10743, "epoch": 255} {"train_loss": -4.935442924499512, "global_step": 10744, "epoch": 255} {"train_loss": -4.92652702331543, "global_step": 10745, "epoch": 255} {"train_loss": -4.902561187744141, "global_step": 10746, "epoch": 255} {"train_loss": -4.899000644683838, "global_step": 10747, "epoch": 255} {"train_loss": -4.95297908782959, "global_step": 10748, "epoch": 255} {"train_loss": -4.99186897277832, "global_step": 10749, "epoch": 255} {"train_loss": -5.156700611114502, "global_step": 10750, "epoch": 255} {"train_loss": -5.011104424794515, "global_step": 10751, "epoch": 255, "val_loss": 71779.7421875} {"train_loss": -4.898739814758301, "global_step": 10752, "epoch": 256} {"train_loss": -4.828458309173584, "global_step": 10753, "epoch": 256} {"train_loss": -5.036972999572754, "global_step": 10754, "epoch": 256} {"train_loss": -4.951469898223877, "global_step": 10755, "epoch": 256} {"train_loss": -4.712931156158447, "global_step": 10756, "epoch": 256} {"train_loss": -5.0301032066345215, "global_step": 10757, "epoch": 256} {"train_loss": -5.010951519012451, "global_step": 10758, "epoch": 256} {"train_loss": -4.801543235778809, "global_step": 10759, "epoch": 256} {"train_loss": -5.044798851013184, "global_step": 10760, "epoch": 256} {"train_loss": -4.8279008865356445, "global_step": 10761, "epoch": 256} {"train_loss": -4.796814918518066, "global_step": 10762, "epoch": 256} {"train_loss": -5.058788776397705, "global_step": 10763, "epoch": 256} {"train_loss": -4.704442024230957, "global_step": 10764, "epoch": 256} {"train_loss": -5.102797508239746, "global_step": 10765, "epoch": 256} {"train_loss": -4.8955583572387695, "global_step": 10766, "epoch": 256} {"train_loss": -4.895941734313965, "global_step": 10767, "epoch": 256} {"train_loss": -4.896515846252441, "global_step": 10768, "epoch": 256} {"train_loss": -4.91340970993042, "global_step": 10769, "epoch": 256} {"train_loss": -5.091164588928223, "global_step": 10770, "epoch": 256} {"train_loss": -4.805846214294434, "global_step": 10771, "epoch": 256} {"train_loss": -5.040947437286377, "global_step": 10772, "epoch": 256} {"train_loss": -5.028900146484375, "global_step": 10773, "epoch": 256} {"train_loss": -5.157835483551025, "global_step": 10774, "epoch": 256} {"train_loss": -4.995730876922607, "global_step": 10775, "epoch": 256} {"train_loss": -5.111319541931152, "global_step": 10776, "epoch": 256} {"train_loss": -5.202493190765381, "global_step": 10777, "epoch": 256} {"train_loss": -4.936570167541504, "global_step": 10778, "epoch": 256} {"train_loss": -5.0268354415893555, "global_step": 10779, "epoch": 256} {"train_loss": -4.985138893127441, "global_step": 10780, "epoch": 256} {"train_loss": -5.1025390625, "global_step": 10781, "epoch": 256} {"train_loss": -5.076381206512451, "global_step": 10782, "epoch": 256} {"train_loss": -5.0606207847595215, "global_step": 10783, "epoch": 256} {"train_loss": -5.002211570739746, "global_step": 10784, "epoch": 256} {"train_loss": -5.065069198608398, "global_step": 10785, "epoch": 256} {"train_loss": -5.05183219909668, "global_step": 10786, "epoch": 256} {"train_loss": -5.139876365661621, "global_step": 10787, "epoch": 256} {"train_loss": -5.030385494232178, "global_step": 10788, "epoch": 256} {"train_loss": -5.07511043548584, "global_step": 10789, "epoch": 256} {"train_loss": -5.015224456787109, "global_step": 10790, "epoch": 256} {"train_loss": -5.059661865234375, "global_step": 10791, "epoch": 256} {"train_loss": -5.068129539489746, "global_step": 10792, "epoch": 256} {"train_loss": -4.991284938085647, "global_step": 10793, "epoch": 256, "val_loss": 71078.078125} {"train_loss": -5.155478000640869, "global_step": 10794, "epoch": 257} {"train_loss": -4.9864501953125, "global_step": 10795, "epoch": 257} {"train_loss": -5.102627754211426, "global_step": 10796, "epoch": 257} {"train_loss": -5.087606906890869, "global_step": 10797, "epoch": 257} {"train_loss": -5.072762489318848, "global_step": 10798, "epoch": 257} {"train_loss": -5.019539833068848, "global_step": 10799, "epoch": 257} {"train_loss": -5.068456649780273, "global_step": 10800, "epoch": 257} {"train_loss": -5.105780601501465, "global_step": 10801, "epoch": 257} {"train_loss": -4.982718467712402, "global_step": 10802, "epoch": 257} {"train_loss": -4.982342720031738, "global_step": 10803, "epoch": 257} {"train_loss": -5.043751239776611, "global_step": 10804, "epoch": 257} {"train_loss": -5.0062785148620605, "global_step": 10805, "epoch": 257} {"train_loss": -4.968993186950684, "global_step": 10806, "epoch": 257} {"train_loss": -5.049561500549316, "global_step": 10807, "epoch": 257} {"train_loss": -5.279373645782471, "global_step": 10808, "epoch": 257} {"train_loss": -5.1625871658325195, "global_step": 10809, "epoch": 257} {"train_loss": -5.093507766723633, "global_step": 10810, "epoch": 257} {"train_loss": -5.105863094329834, "global_step": 10811, "epoch": 257} {"train_loss": -5.206738471984863, "global_step": 10812, "epoch": 257} {"train_loss": -5.140763759613037, "global_step": 10813, "epoch": 257} {"train_loss": -5.0007219314575195, "global_step": 10814, "epoch": 257} {"train_loss": -5.091897964477539, "global_step": 10815, "epoch": 257} {"train_loss": -5.055411338806152, "global_step": 10816, "epoch": 257} {"train_loss": -5.073619842529297, "global_step": 10817, "epoch": 257} {"train_loss": -5.167740821838379, "global_step": 10818, "epoch": 257} {"train_loss": -5.055387496948242, "global_step": 10819, "epoch": 257} {"train_loss": -5.262569427490234, "global_step": 10820, "epoch": 257} {"train_loss": -5.149041175842285, "global_step": 10821, "epoch": 257} {"train_loss": -5.062263488769531, "global_step": 10822, "epoch": 257} {"train_loss": -5.078624725341797, "global_step": 10823, "epoch": 257} {"train_loss": -5.070253849029541, "global_step": 10824, "epoch": 257} {"train_loss": -4.9920759201049805, "global_step": 10825, "epoch": 257} {"train_loss": -5.025587558746338, "global_step": 10826, "epoch": 257} {"train_loss": -5.101868629455566, "global_step": 10827, "epoch": 257} {"train_loss": -5.0025634765625, "global_step": 10828, "epoch": 257} {"train_loss": -4.945478439331055, "global_step": 10829, "epoch": 257} {"train_loss": -4.94478178024292, "global_step": 10830, "epoch": 257} {"train_loss": -5.0649333000183105, "global_step": 10831, "epoch": 257} {"train_loss": -5.0046234130859375, "global_step": 10832, "epoch": 257} {"train_loss": -5.01361083984375, "global_step": 10833, "epoch": 257} {"train_loss": -5.011663913726807, "global_step": 10834, "epoch": 257} {"train_loss": -5.066756169001262, "global_step": 10835, "epoch": 257, "val_loss": 71179.4609375} {"train_loss": -5.0503435134887695, "global_step": 10836, "epoch": 258} {"train_loss": -5.058180809020996, "global_step": 10837, "epoch": 258} {"train_loss": -5.118157386779785, "global_step": 10838, "epoch": 258} {"train_loss": -5.059260845184326, "global_step": 10839, "epoch": 258} {"train_loss": -5.014240741729736, "global_step": 10840, "epoch": 258} {"train_loss": -4.979976654052734, "global_step": 10841, "epoch": 258} {"train_loss": -5.02672004699707, "global_step": 10842, "epoch": 258} {"train_loss": -5.147963523864746, "global_step": 10843, "epoch": 258} {"train_loss": -4.897745132446289, "global_step": 10844, "epoch": 258} {"train_loss": -5.072660446166992, "global_step": 10845, "epoch": 258} {"train_loss": -5.038086891174316, "global_step": 10846, "epoch": 258} {"train_loss": -5.018389701843262, "global_step": 10847, "epoch": 258} {"train_loss": -5.194498062133789, "global_step": 10848, "epoch": 258} {"train_loss": -4.872858047485352, "global_step": 10849, "epoch": 258} {"train_loss": -5.088085174560547, "global_step": 10850, "epoch": 258} {"train_loss": -5.215197563171387, "global_step": 10851, "epoch": 258} {"train_loss": -5.065617561340332, "global_step": 10852, "epoch": 258} {"train_loss": -5.074304103851318, "global_step": 10853, "epoch": 258} {"train_loss": -5.181185722351074, "global_step": 10854, "epoch": 258} {"train_loss": -5.014250755310059, "global_step": 10855, "epoch": 258} {"train_loss": -4.95189094543457, "global_step": 10856, "epoch": 258} {"train_loss": -5.188052177429199, "global_step": 10857, "epoch": 258} {"train_loss": -5.121297359466553, "global_step": 10858, "epoch": 258} {"train_loss": -5.041754722595215, "global_step": 10859, "epoch": 258} {"train_loss": -5.112910270690918, "global_step": 10860, "epoch": 258} {"train_loss": -5.218318939208984, "global_step": 10861, "epoch": 258} {"train_loss": -4.967057228088379, "global_step": 10862, "epoch": 258} {"train_loss": -5.160180568695068, "global_step": 10863, "epoch": 258} {"train_loss": -5.057920455932617, "global_step": 10864, "epoch": 258} {"train_loss": -5.11512565612793, "global_step": 10865, "epoch": 258} {"train_loss": -5.106748580932617, "global_step": 10866, "epoch": 258} {"train_loss": -5.2337141036987305, "global_step": 10867, "epoch": 258} {"train_loss": -5.036894798278809, "global_step": 10868, "epoch": 258} {"train_loss": -5.109773635864258, "global_step": 10869, "epoch": 258} {"train_loss": -5.026678085327148, "global_step": 10870, "epoch": 258} {"train_loss": -5.081677436828613, "global_step": 10871, "epoch": 258} {"train_loss": -5.1924238204956055, "global_step": 10872, "epoch": 258} {"train_loss": -5.084475517272949, "global_step": 10873, "epoch": 258} {"train_loss": -5.071267604827881, "global_step": 10874, "epoch": 258} {"train_loss": -5.127615928649902, "global_step": 10875, "epoch": 258} {"train_loss": -5.059289932250977, "global_step": 10876, "epoch": 258} {"train_loss": -5.0814912886846635, "global_step": 10877, "epoch": 258, "val_loss": 70665.0390625} {"train_loss": -5.029995918273926, "global_step": 10878, "epoch": 259} {"train_loss": -5.150839805603027, "global_step": 10879, "epoch": 259} {"train_loss": -5.05875301361084, "global_step": 10880, "epoch": 259} {"train_loss": -5.049816131591797, "global_step": 10881, "epoch": 259} {"train_loss": -5.015554904937744, "global_step": 10882, "epoch": 259} {"train_loss": -5.043352127075195, "global_step": 10883, "epoch": 259} {"train_loss": -5.171835899353027, "global_step": 10884, "epoch": 259} {"train_loss": -5.089056491851807, "global_step": 10885, "epoch": 259} {"train_loss": -5.178535461425781, "global_step": 10886, "epoch": 259} {"train_loss": -5.1890668869018555, "global_step": 10887, "epoch": 259} {"train_loss": -5.041919708251953, "global_step": 10888, "epoch": 259} {"train_loss": -4.7906365394592285, "global_step": 10889, "epoch": 259} {"train_loss": -5.01265811920166, "global_step": 10890, "epoch": 259} {"train_loss": -4.935173511505127, "global_step": 10891, "epoch": 259} {"train_loss": -4.765761852264404, "global_step": 10892, "epoch": 259} {"train_loss": -5.000772476196289, "global_step": 10893, "epoch": 259} {"train_loss": -4.926517009735107, "global_step": 10894, "epoch": 259} {"train_loss": -4.849268913269043, "global_step": 10895, "epoch": 259} {"train_loss": -5.14096212387085, "global_step": 10896, "epoch": 259} {"train_loss": -4.901366233825684, "global_step": 10897, "epoch": 259} {"train_loss": -4.806077003479004, "global_step": 10898, "epoch": 259} {"train_loss": -5.1491899490356445, "global_step": 10899, "epoch": 259} {"train_loss": -4.7807440757751465, "global_step": 10900, "epoch": 259} {"train_loss": -4.97722053527832, "global_step": 10901, "epoch": 259} {"train_loss": -5.036533355712891, "global_step": 10902, "epoch": 259} {"train_loss": -4.907686233520508, "global_step": 10903, "epoch": 259} {"train_loss": -5.103959083557129, "global_step": 10904, "epoch": 259} {"train_loss": -5.058703422546387, "global_step": 10905, "epoch": 259} {"train_loss": -4.877617835998535, "global_step": 10906, "epoch": 259} {"train_loss": -5.151108264923096, "global_step": 10907, "epoch": 259} {"train_loss": -5.0079874992370605, "global_step": 10908, "epoch": 259} {"train_loss": -5.143296241760254, "global_step": 10909, "epoch": 259} {"train_loss": -4.94365930557251, "global_step": 10910, "epoch": 259} {"train_loss": -5.0540771484375, "global_step": 10911, "epoch": 259} {"train_loss": -5.118213653564453, "global_step": 10912, "epoch": 259} {"train_loss": -5.177772045135498, "global_step": 10913, "epoch": 259} {"train_loss": -5.024455547332764, "global_step": 10914, "epoch": 259} {"train_loss": -5.0285868644714355, "global_step": 10915, "epoch": 259} {"train_loss": -5.018452167510986, "global_step": 10916, "epoch": 259} {"train_loss": -5.088658332824707, "global_step": 10917, "epoch": 259} {"train_loss": -5.133482456207275, "global_step": 10918, "epoch": 259} {"train_loss": -5.023056268692017, "global_step": 10919, "epoch": 259, "val_loss": 70957.2421875} {"train_loss": -5.103326797485352, "global_step": 10920, "epoch": 260} {"train_loss": -5.091724395751953, "global_step": 10921, "epoch": 260} {"train_loss": -5.096854209899902, "global_step": 10922, "epoch": 260} {"train_loss": -5.008028030395508, "global_step": 10923, "epoch": 260} {"train_loss": -5.071186065673828, "global_step": 10924, "epoch": 260} {"train_loss": -5.172364234924316, "global_step": 10925, "epoch": 260} {"train_loss": -4.795395851135254, "global_step": 10926, "epoch": 260} {"train_loss": -4.976332187652588, "global_step": 10927, "epoch": 260} {"train_loss": -5.121829032897949, "global_step": 10928, "epoch": 260} {"train_loss": -4.946846008300781, "global_step": 10929, "epoch": 260} {"train_loss": -4.990866184234619, "global_step": 10930, "epoch": 260} {"train_loss": -5.160552024841309, "global_step": 10931, "epoch": 260} {"train_loss": -5.048542022705078, "global_step": 10932, "epoch": 260} {"train_loss": -4.8677144050598145, "global_step": 10933, "epoch": 260} {"train_loss": -4.982321262359619, "global_step": 10934, "epoch": 260} {"train_loss": -5.189380645751953, "global_step": 10935, "epoch": 260} {"train_loss": -4.840065002441406, "global_step": 10936, "epoch": 260} {"train_loss": -4.985888957977295, "global_step": 10937, "epoch": 260} {"train_loss": -5.140676975250244, "global_step": 10938, "epoch": 260} {"train_loss": -5.049312114715576, "global_step": 10939, "epoch": 260} {"train_loss": -5.148896217346191, "global_step": 10940, "epoch": 260} {"train_loss": -4.991483211517334, "global_step": 10941, "epoch": 260} {"train_loss": -5.192237854003906, "global_step": 10942, "epoch": 260} {"train_loss": -5.006757736206055, "global_step": 10943, "epoch": 260} {"train_loss": -5.009122371673584, "global_step": 10944, "epoch": 260} {"train_loss": -5.201416015625, "global_step": 10945, "epoch": 260} {"train_loss": -5.117120265960693, "global_step": 10946, "epoch": 260} {"train_loss": -5.15615701675415, "global_step": 10947, "epoch": 260} {"train_loss": -5.040445804595947, "global_step": 10948, "epoch": 260} {"train_loss": -5.102752685546875, "global_step": 10949, "epoch": 260} {"train_loss": -5.027659893035889, "global_step": 10950, "epoch": 260} {"train_loss": -5.174310684204102, "global_step": 10951, "epoch": 260} {"train_loss": -4.908026695251465, "global_step": 10952, "epoch": 260} {"train_loss": -5.021168231964111, "global_step": 10953, "epoch": 260} {"train_loss": -5.06766414642334, "global_step": 10954, "epoch": 260} {"train_loss": -5.073167324066162, "global_step": 10955, "epoch": 260} {"train_loss": -5.113405227661133, "global_step": 10956, "epoch": 260} {"train_loss": -5.0845627784729, "global_step": 10957, "epoch": 260} {"train_loss": -5.012263298034668, "global_step": 10958, "epoch": 260} {"train_loss": -5.110082626342773, "global_step": 10959, "epoch": 260} {"train_loss": -5.220694541931152, "global_step": 10960, "epoch": 260} {"train_loss": -5.0630862939925425, "global_step": 10961, "epoch": 260, "val_loss": 70271.5390625} {"train_loss": -5.148744583129883, "global_step": 10962, "epoch": 261} {"train_loss": -5.087160110473633, "global_step": 10963, "epoch": 261} {"train_loss": -5.113649368286133, "global_step": 10964, "epoch": 261} {"train_loss": -5.090899467468262, "global_step": 10965, "epoch": 261} {"train_loss": -5.140283584594727, "global_step": 10966, "epoch": 261} {"train_loss": -5.074837684631348, "global_step": 10967, "epoch": 261} {"train_loss": -5.0969133377075195, "global_step": 10968, "epoch": 261} {"train_loss": -5.029735565185547, "global_step": 10969, "epoch": 261} {"train_loss": -5.062490463256836, "global_step": 10970, "epoch": 261} {"train_loss": -5.140676498413086, "global_step": 10971, "epoch": 261} {"train_loss": -5.263504505157471, "global_step": 10972, "epoch": 261} {"train_loss": -5.014895439147949, "global_step": 10973, "epoch": 261} {"train_loss": -4.948179721832275, "global_step": 10974, "epoch": 261} {"train_loss": -5.068488121032715, "global_step": 10975, "epoch": 261} {"train_loss": -5.025413990020752, "global_step": 10976, "epoch": 261} {"train_loss": -4.953151702880859, "global_step": 10977, "epoch": 261} {"train_loss": -5.160159587860107, "global_step": 10978, "epoch": 261} {"train_loss": -5.013872146606445, "global_step": 10979, "epoch": 261} {"train_loss": -5.099217414855957, "global_step": 10980, "epoch": 261} {"train_loss": -5.1397600173950195, "global_step": 10981, "epoch": 261} {"train_loss": -5.074295520782471, "global_step": 10982, "epoch": 261} {"train_loss": -4.999566078186035, "global_step": 10983, "epoch": 261} {"train_loss": -5.047772407531738, "global_step": 10984, "epoch": 261} {"train_loss": -5.081276893615723, "global_step": 10985, "epoch": 261} {"train_loss": -5.106902599334717, "global_step": 10986, "epoch": 261} {"train_loss": -4.9740190505981445, "global_step": 10987, "epoch": 261} {"train_loss": -5.088068962097168, "global_step": 10988, "epoch": 261} {"train_loss": -5.127819061279297, "global_step": 10989, "epoch": 261} {"train_loss": -5.093055248260498, "global_step": 10990, "epoch": 261} {"train_loss": -5.127470016479492, "global_step": 10991, "epoch": 261} {"train_loss": -5.060450077056885, "global_step": 10992, "epoch": 261} {"train_loss": -5.061841011047363, "global_step": 10993, "epoch": 261} {"train_loss": -5.282729148864746, "global_step": 10994, "epoch": 261} {"train_loss": -5.06646728515625, "global_step": 10995, "epoch": 261} {"train_loss": -5.080838203430176, "global_step": 10996, "epoch": 261} {"train_loss": -4.961076736450195, "global_step": 10997, "epoch": 261} {"train_loss": -5.071444034576416, "global_step": 10998, "epoch": 261} {"train_loss": -4.926470756530762, "global_step": 10999, "epoch": 261} {"train_loss": -5.012368202209473, "global_step": 11000, "epoch": 261} {"train_loss": -4.995346546173096, "global_step": 11001, "epoch": 261} {"train_loss": -4.970833778381348, "global_step": 11002, "epoch": 261} {"train_loss": -5.069818837302072, "global_step": 11003, "epoch": 261, "val_loss": 70256.1875} {"train_loss": -5.066020488739014, "global_step": 11004, "epoch": 262} {"train_loss": -5.054466724395752, "global_step": 11005, "epoch": 262} {"train_loss": -5.098165512084961, "global_step": 11006, "epoch": 262} {"train_loss": -5.038608551025391, "global_step": 11007, "epoch": 262} {"train_loss": -5.123022079467773, "global_step": 11008, "epoch": 262} {"train_loss": -4.98062801361084, "global_step": 11009, "epoch": 262} {"train_loss": -5.043555736541748, "global_step": 11010, "epoch": 262} {"train_loss": -5.03558874130249, "global_step": 11011, "epoch": 262} {"train_loss": -5.050286293029785, "global_step": 11012, "epoch": 262} {"train_loss": -4.991249084472656, "global_step": 11013, "epoch": 262} {"train_loss": -5.056336402893066, "global_step": 11014, "epoch": 262} {"train_loss": -5.087510585784912, "global_step": 11015, "epoch": 262} {"train_loss": -5.11539363861084, "global_step": 11016, "epoch": 262} {"train_loss": -5.072059154510498, "global_step": 11017, "epoch": 262} {"train_loss": -5.130934715270996, "global_step": 11018, "epoch": 262} {"train_loss": -5.113210201263428, "global_step": 11019, "epoch": 262} {"train_loss": -5.168633460998535, "global_step": 11020, "epoch": 262} {"train_loss": -5.078301906585693, "global_step": 11021, "epoch": 262} {"train_loss": -5.166649341583252, "global_step": 11022, "epoch": 262} {"train_loss": -5.111937522888184, "global_step": 11023, "epoch": 262} {"train_loss": -5.0896100997924805, "global_step": 11024, "epoch": 262} {"train_loss": -5.064297676086426, "global_step": 11025, "epoch": 262} {"train_loss": -5.061946868896484, "global_step": 11026, "epoch": 262} {"train_loss": -5.077939033508301, "global_step": 11027, "epoch": 262} {"train_loss": -5.20107364654541, "global_step": 11028, "epoch": 262} {"train_loss": -5.064727783203125, "global_step": 11029, "epoch": 262} {"train_loss": -5.139954566955566, "global_step": 11030, "epoch": 262} {"train_loss": -5.046630382537842, "global_step": 11031, "epoch": 262} {"train_loss": -5.114310264587402, "global_step": 11032, "epoch": 262} {"train_loss": -5.114261627197266, "global_step": 11033, "epoch": 262} {"train_loss": -5.080182075500488, "global_step": 11034, "epoch": 262} {"train_loss": -5.062816619873047, "global_step": 11035, "epoch": 262} {"train_loss": -5.119362831115723, "global_step": 11036, "epoch": 262} {"train_loss": -5.117681503295898, "global_step": 11037, "epoch": 262} {"train_loss": -5.002657413482666, "global_step": 11038, "epoch": 262} {"train_loss": -5.107927322387695, "global_step": 11039, "epoch": 262} {"train_loss": -5.1219258308410645, "global_step": 11040, "epoch": 262} {"train_loss": -5.008142471313477, "global_step": 11041, "epoch": 262} {"train_loss": -5.119426727294922, "global_step": 11042, "epoch": 262} {"train_loss": -5.207599639892578, "global_step": 11043, "epoch": 262} {"train_loss": -5.157644271850586, "global_step": 11044, "epoch": 262} {"train_loss": -5.091643106369745, "global_step": 11045, "epoch": 262, "val_loss": 70518.3515625} {"train_loss": -5.201211929321289, "global_step": 11046, "epoch": 263} {"train_loss": -5.126850605010986, "global_step": 11047, "epoch": 263} {"train_loss": -5.146193027496338, "global_step": 11048, "epoch": 263} {"train_loss": -5.178250312805176, "global_step": 11049, "epoch": 263} {"train_loss": -5.103870868682861, "global_step": 11050, "epoch": 263} {"train_loss": -5.287925720214844, "global_step": 11051, "epoch": 263} {"train_loss": -4.991811752319336, "global_step": 11052, "epoch": 263} {"train_loss": -4.912174224853516, "global_step": 11053, "epoch": 263} {"train_loss": -5.094655513763428, "global_step": 11054, "epoch": 263} {"train_loss": -5.112769603729248, "global_step": 11055, "epoch": 263} {"train_loss": -5.157352447509766, "global_step": 11056, "epoch": 263} {"train_loss": -5.20506477355957, "global_step": 11057, "epoch": 263} {"train_loss": -5.0640177726745605, "global_step": 11058, "epoch": 263} {"train_loss": -5.188007354736328, "global_step": 11059, "epoch": 263} {"train_loss": -5.084361553192139, "global_step": 11060, "epoch": 263} {"train_loss": -5.11900520324707, "global_step": 11061, "epoch": 263} {"train_loss": -4.932827949523926, "global_step": 11062, "epoch": 263} {"train_loss": -5.113527297973633, "global_step": 11063, "epoch": 263} {"train_loss": -5.159505844116211, "global_step": 11064, "epoch": 263} {"train_loss": -5.11577033996582, "global_step": 11065, "epoch": 263} {"train_loss": -5.110601902008057, "global_step": 11066, "epoch": 263} {"train_loss": -5.156618595123291, "global_step": 11067, "epoch": 263} {"train_loss": -5.1192121505737305, "global_step": 11068, "epoch": 263} {"train_loss": -5.129283428192139, "global_step": 11069, "epoch": 263} {"train_loss": -5.077943801879883, "global_step": 11070, "epoch": 263} {"train_loss": -5.097485542297363, "global_step": 11071, "epoch": 263} {"train_loss": -5.142478942871094, "global_step": 11072, "epoch": 263} {"train_loss": -5.133125305175781, "global_step": 11073, "epoch": 263} {"train_loss": -5.215769290924072, "global_step": 11074, "epoch": 263} {"train_loss": -5.1767988204956055, "global_step": 11075, "epoch": 263} {"train_loss": -5.075733661651611, "global_step": 11076, "epoch": 263} {"train_loss": -4.981356620788574, "global_step": 11077, "epoch": 263} {"train_loss": -4.922744274139404, "global_step": 11078, "epoch": 263} {"train_loss": -5.109950065612793, "global_step": 11079, "epoch": 263} {"train_loss": -4.971192836761475, "global_step": 11080, "epoch": 263} {"train_loss": -5.152559757232666, "global_step": 11081, "epoch": 263} {"train_loss": -5.095200061798096, "global_step": 11082, "epoch": 263} {"train_loss": -5.00129508972168, "global_step": 11083, "epoch": 263} {"train_loss": -5.044500827789307, "global_step": 11084, "epoch": 263} {"train_loss": -5.077450752258301, "global_step": 11085, "epoch": 263} {"train_loss": -5.061357021331787, "global_step": 11086, "epoch": 263} {"train_loss": -5.09954123269944, "global_step": 11087, "epoch": 263, "val_loss": 70792.1328125} {"train_loss": -4.933493614196777, "global_step": 11088, "epoch": 264} {"train_loss": -5.07130241394043, "global_step": 11089, "epoch": 264} {"train_loss": -5.149349212646484, "global_step": 11090, "epoch": 264} {"train_loss": -5.105229377746582, "global_step": 11091, "epoch": 264} {"train_loss": -5.163422584533691, "global_step": 11092, "epoch": 264} {"train_loss": -5.0720672607421875, "global_step": 11093, "epoch": 264} {"train_loss": -5.093868255615234, "global_step": 11094, "epoch": 264} {"train_loss": -5.0975799560546875, "global_step": 11095, "epoch": 264} {"train_loss": -4.952971458435059, "global_step": 11096, "epoch": 264} {"train_loss": -5.094758033752441, "global_step": 11097, "epoch": 264} {"train_loss": -5.119367599487305, "global_step": 11098, "epoch": 264} {"train_loss": -4.8832221031188965, "global_step": 11099, "epoch": 264} {"train_loss": -5.093223571777344, "global_step": 11100, "epoch": 264} {"train_loss": -5.089604377746582, "global_step": 11101, "epoch": 264} {"train_loss": -5.1452436447143555, "global_step": 11102, "epoch": 264} {"train_loss": -5.0175395011901855, "global_step": 11103, "epoch": 264} {"train_loss": -5.012522220611572, "global_step": 11104, "epoch": 264} {"train_loss": -5.0408782958984375, "global_step": 11105, "epoch": 264} {"train_loss": -5.238332748413086, "global_step": 11106, "epoch": 264} {"train_loss": -5.12588357925415, "global_step": 11107, "epoch": 264} {"train_loss": -5.042270183563232, "global_step": 11108, "epoch": 264} {"train_loss": -5.127253532409668, "global_step": 11109, "epoch": 264} {"train_loss": -5.040206432342529, "global_step": 11110, "epoch": 264} {"train_loss": -5.090265274047852, "global_step": 11111, "epoch": 264} {"train_loss": -5.133925437927246, "global_step": 11112, "epoch": 264} {"train_loss": -5.135899543762207, "global_step": 11113, "epoch": 264} {"train_loss": -4.991114139556885, "global_step": 11114, "epoch": 264} {"train_loss": -5.076076030731201, "global_step": 11115, "epoch": 264} {"train_loss": -5.265704154968262, "global_step": 11116, "epoch": 264} {"train_loss": -5.0805983543396, "global_step": 11117, "epoch": 264} {"train_loss": -4.962596893310547, "global_step": 11118, "epoch": 264} {"train_loss": -5.090424537658691, "global_step": 11119, "epoch": 264} {"train_loss": -5.114116191864014, "global_step": 11120, "epoch": 264} {"train_loss": -5.051675319671631, "global_step": 11121, "epoch": 264} {"train_loss": -5.166875839233398, "global_step": 11122, "epoch": 264} {"train_loss": -5.017864227294922, "global_step": 11123, "epoch": 264} {"train_loss": -5.036176681518555, "global_step": 11124, "epoch": 264} {"train_loss": -4.987739562988281, "global_step": 11125, "epoch": 264} {"train_loss": -5.132577896118164, "global_step": 11126, "epoch": 264} {"train_loss": -4.88645076751709, "global_step": 11127, "epoch": 264} {"train_loss": -5.071888446807861, "global_step": 11128, "epoch": 264} {"train_loss": -5.073138032640729, "global_step": 11129, "epoch": 264, "val_loss": 70869.3125} {"train_loss": -5.028360366821289, "global_step": 11130, "epoch": 265} {"train_loss": -5.16947078704834, "global_step": 11131, "epoch": 265} {"train_loss": -5.064168453216553, "global_step": 11132, "epoch": 265} {"train_loss": -5.106984615325928, "global_step": 11133, "epoch": 265} {"train_loss": -4.954545974731445, "global_step": 11134, "epoch": 265} {"train_loss": -5.124032974243164, "global_step": 11135, "epoch": 265} {"train_loss": -4.875801086425781, "global_step": 11136, "epoch": 265} {"train_loss": -5.200634956359863, "global_step": 11137, "epoch": 265} {"train_loss": -5.030669212341309, "global_step": 11138, "epoch": 265} {"train_loss": -5.02890682220459, "global_step": 11139, "epoch": 265} {"train_loss": -5.084358215332031, "global_step": 11140, "epoch": 265} {"train_loss": -5.076574325561523, "global_step": 11141, "epoch": 265} {"train_loss": -5.072445869445801, "global_step": 11142, "epoch": 265} {"train_loss": -5.064310073852539, "global_step": 11143, "epoch": 265} {"train_loss": -5.168112754821777, "global_step": 11144, "epoch": 265} {"train_loss": -5.1584296226501465, "global_step": 11145, "epoch": 265} {"train_loss": -5.134652137756348, "global_step": 11146, "epoch": 265} {"train_loss": -5.1681318283081055, "global_step": 11147, "epoch": 265} {"train_loss": -5.170003890991211, "global_step": 11148, "epoch": 265} {"train_loss": -5.109491348266602, "global_step": 11149, "epoch": 265} {"train_loss": -5.1786675453186035, "global_step": 11150, "epoch": 265} {"train_loss": -5.041836738586426, "global_step": 11151, "epoch": 265} {"train_loss": -5.039995193481445, "global_step": 11152, "epoch": 265} {"train_loss": -5.107314109802246, "global_step": 11153, "epoch": 265} {"train_loss": -5.13333797454834, "global_step": 11154, "epoch": 265} {"train_loss": -5.004146575927734, "global_step": 11155, "epoch": 265} {"train_loss": -5.037344932556152, "global_step": 11156, "epoch": 265} {"train_loss": -5.0891547203063965, "global_step": 11157, "epoch": 265} {"train_loss": -5.100678443908691, "global_step": 11158, "epoch": 265} {"train_loss": -4.985990524291992, "global_step": 11159, "epoch": 265} {"train_loss": -5.061436653137207, "global_step": 11160, "epoch": 265} {"train_loss": -5.176802635192871, "global_step": 11161, "epoch": 265} {"train_loss": -5.077934741973877, "global_step": 11162, "epoch": 265} {"train_loss": -4.9196882247924805, "global_step": 11163, "epoch": 265} {"train_loss": -5.032192230224609, "global_step": 11164, "epoch": 265} {"train_loss": -5.140657901763916, "global_step": 11165, "epoch": 265} {"train_loss": -5.064743995666504, "global_step": 11166, "epoch": 265} {"train_loss": -4.929074764251709, "global_step": 11167, "epoch": 265} {"train_loss": -4.985286712646484, "global_step": 11168, "epoch": 265} {"train_loss": -5.10780143737793, "global_step": 11169, "epoch": 265} {"train_loss": -5.078779220581055, "global_step": 11170, "epoch": 265} {"train_loss": -5.071710700080509, "global_step": 11171, "epoch": 265, "val_loss": 72708.2734375} {"train_loss": -4.928635597229004, "global_step": 11172, "epoch": 266} {"train_loss": -4.915963649749756, "global_step": 11173, "epoch": 266} {"train_loss": -5.024428367614746, "global_step": 11174, "epoch": 266} {"train_loss": -4.871950149536133, "global_step": 11175, "epoch": 266} {"train_loss": -5.115283012390137, "global_step": 11176, "epoch": 266} {"train_loss": -4.985142230987549, "global_step": 11177, "epoch": 266} {"train_loss": -5.112489700317383, "global_step": 11178, "epoch": 266} {"train_loss": -5.0538411140441895, "global_step": 11179, "epoch": 266} {"train_loss": -5.069065093994141, "global_step": 11180, "epoch": 266} {"train_loss": -5.066336631774902, "global_step": 11181, "epoch": 266} {"train_loss": -5.043385982513428, "global_step": 11182, "epoch": 266} {"train_loss": -4.879891872406006, "global_step": 11183, "epoch": 266} {"train_loss": -5.1037092208862305, "global_step": 11184, "epoch": 266} {"train_loss": -5.105403900146484, "global_step": 11185, "epoch": 266} {"train_loss": -5.118157863616943, "global_step": 11186, "epoch": 266} {"train_loss": -5.178672790527344, "global_step": 11187, "epoch": 266} {"train_loss": -5.088058948516846, "global_step": 11188, "epoch": 266} {"train_loss": -5.062287330627441, "global_step": 11189, "epoch": 266} {"train_loss": -5.0519938468933105, "global_step": 11190, "epoch": 266} {"train_loss": -5.079318046569824, "global_step": 11191, "epoch": 266} {"train_loss": -5.1047139167785645, "global_step": 11192, "epoch": 266} {"train_loss": -5.0974040031433105, "global_step": 11193, "epoch": 266} {"train_loss": -5.136117935180664, "global_step": 11194, "epoch": 266} {"train_loss": -5.140105724334717, "global_step": 11195, "epoch": 266} {"train_loss": -5.151981353759766, "global_step": 11196, "epoch": 266} {"train_loss": -4.924955368041992, "global_step": 11197, "epoch": 266} {"train_loss": -5.0237321853637695, "global_step": 11198, "epoch": 266} {"train_loss": -5.147814750671387, "global_step": 11199, "epoch": 266} {"train_loss": -5.142597675323486, "global_step": 11200, "epoch": 266} {"train_loss": -5.117433071136475, "global_step": 11201, "epoch": 266} {"train_loss": -4.816308975219727, "global_step": 11202, "epoch": 266} {"train_loss": -5.083539962768555, "global_step": 11203, "epoch": 266} {"train_loss": -5.145773887634277, "global_step": 11204, "epoch": 266} {"train_loss": -4.965912342071533, "global_step": 11205, "epoch": 266} {"train_loss": -4.91435432434082, "global_step": 11206, "epoch": 266} {"train_loss": -5.007112503051758, "global_step": 11207, "epoch": 266} {"train_loss": -5.04171085357666, "global_step": 11208, "epoch": 266} {"train_loss": -4.888129234313965, "global_step": 11209, "epoch": 266} {"train_loss": -5.132403373718262, "global_step": 11210, "epoch": 266} {"train_loss": -5.121921539306641, "global_step": 11211, "epoch": 266} {"train_loss": -5.084733486175537, "global_step": 11212, "epoch": 266} {"train_loss": -5.050463494800386, "global_step": 11213, "epoch": 266, "val_loss": 70930.390625} {"train_loss": -5.078125953674316, "global_step": 11214, "epoch": 267} {"train_loss": -5.163485527038574, "global_step": 11215, "epoch": 267} {"train_loss": -5.133462429046631, "global_step": 11216, "epoch": 267} {"train_loss": -5.063246250152588, "global_step": 11217, "epoch": 267} {"train_loss": -5.104480743408203, "global_step": 11218, "epoch": 267} {"train_loss": -5.055867671966553, "global_step": 11219, "epoch": 267} {"train_loss": -5.138507843017578, "global_step": 11220, "epoch": 267} {"train_loss": -5.040037155151367, "global_step": 11221, "epoch": 267} {"train_loss": -5.126660346984863, "global_step": 11222, "epoch": 267} {"train_loss": -5.056216239929199, "global_step": 11223, "epoch": 267} {"train_loss": -5.129556655883789, "global_step": 11224, "epoch": 267} {"train_loss": -5.138057231903076, "global_step": 11225, "epoch": 267} {"train_loss": -5.224477767944336, "global_step": 11226, "epoch": 267} {"train_loss": -5.142633438110352, "global_step": 11227, "epoch": 267} {"train_loss": -5.127356052398682, "global_step": 11228, "epoch": 267} {"train_loss": -5.24899959564209, "global_step": 11229, "epoch": 267} {"train_loss": -5.1073455810546875, "global_step": 11230, "epoch": 267} {"train_loss": -5.0416035652160645, "global_step": 11231, "epoch": 267} {"train_loss": -5.228066444396973, "global_step": 11232, "epoch": 267} {"train_loss": -5.100449085235596, "global_step": 11233, "epoch": 267} {"train_loss": -4.9525861740112305, "global_step": 11234, "epoch": 267} {"train_loss": -5.129246234893799, "global_step": 11235, "epoch": 267} {"train_loss": -5.027382850646973, "global_step": 11236, "epoch": 267} {"train_loss": -5.063491344451904, "global_step": 11237, "epoch": 267} {"train_loss": -5.138482093811035, "global_step": 11238, "epoch": 267} {"train_loss": -5.1760101318359375, "global_step": 11239, "epoch": 267} {"train_loss": -5.120499610900879, "global_step": 11240, "epoch": 267} {"train_loss": -5.095692157745361, "global_step": 11241, "epoch": 267} {"train_loss": -4.988457202911377, "global_step": 11242, "epoch": 267} {"train_loss": -4.918819427490234, "global_step": 11243, "epoch": 267} {"train_loss": -5.074886322021484, "global_step": 11244, "epoch": 267} {"train_loss": -4.97280216217041, "global_step": 11245, "epoch": 267} {"train_loss": -5.024025917053223, "global_step": 11246, "epoch": 267} {"train_loss": -5.1443939208984375, "global_step": 11247, "epoch": 267} {"train_loss": -4.958662986755371, "global_step": 11248, "epoch": 267} {"train_loss": -5.047751426696777, "global_step": 11249, "epoch": 267} {"train_loss": -5.015724182128906, "global_step": 11250, "epoch": 267} {"train_loss": -4.931276798248291, "global_step": 11251, "epoch": 267} {"train_loss": -5.0473833084106445, "global_step": 11252, "epoch": 267} {"train_loss": -5.097704887390137, "global_step": 11253, "epoch": 267} {"train_loss": -5.072537422180176, "global_step": 11254, "epoch": 267} {"train_loss": -5.08013315427871, "global_step": 11255, "epoch": 267, "val_loss": 70544.6015625} {"train_loss": -5.156612396240234, "global_step": 11256, "epoch": 268} {"train_loss": -4.998329162597656, "global_step": 11257, "epoch": 268} {"train_loss": -4.933011054992676, "global_step": 11258, "epoch": 268} {"train_loss": -4.973827838897705, "global_step": 11259, "epoch": 268} {"train_loss": -5.0936079025268555, "global_step": 11260, "epoch": 268} {"train_loss": -5.151349067687988, "global_step": 11261, "epoch": 268} {"train_loss": -5.197628498077393, "global_step": 11262, "epoch": 268} {"train_loss": -5.131999969482422, "global_step": 11263, "epoch": 268} {"train_loss": -5.002511501312256, "global_step": 11264, "epoch": 268} {"train_loss": -5.021994590759277, "global_step": 11265, "epoch": 268} {"train_loss": -5.139089584350586, "global_step": 11266, "epoch": 268} {"train_loss": -5.174612998962402, "global_step": 11267, "epoch": 268} {"train_loss": -5.025765419006348, "global_step": 11268, "epoch": 268} {"train_loss": -5.026985168457031, "global_step": 11269, "epoch": 268} {"train_loss": -5.005793571472168, "global_step": 11270, "epoch": 268} {"train_loss": -5.066641330718994, "global_step": 11271, "epoch": 268} {"train_loss": -5.063717842102051, "global_step": 11272, "epoch": 268} {"train_loss": -5.057045936584473, "global_step": 11273, "epoch": 268} {"train_loss": -5.058529853820801, "global_step": 11274, "epoch": 268} {"train_loss": -5.149231910705566, "global_step": 11275, "epoch": 268} {"train_loss": -4.98781681060791, "global_step": 11276, "epoch": 268} {"train_loss": -5.048015594482422, "global_step": 11277, "epoch": 268} {"train_loss": -5.044323921203613, "global_step": 11278, "epoch": 268} {"train_loss": -5.1292805671691895, "global_step": 11279, "epoch": 268} {"train_loss": -4.969765663146973, "global_step": 11280, "epoch": 268} {"train_loss": -5.177210330963135, "global_step": 11281, "epoch": 268} {"train_loss": -5.0437750816345215, "global_step": 11282, "epoch": 268} {"train_loss": -5.109458923339844, "global_step": 11283, "epoch": 268} {"train_loss": -5.0621867179870605, "global_step": 11284, "epoch": 268} {"train_loss": -5.061470031738281, "global_step": 11285, "epoch": 268} {"train_loss": -5.142078399658203, "global_step": 11286, "epoch": 268} {"train_loss": -5.0886125564575195, "global_step": 11287, "epoch": 268} {"train_loss": -5.094707489013672, "global_step": 11288, "epoch": 268} {"train_loss": -5.102388381958008, "global_step": 11289, "epoch": 268} {"train_loss": -5.275192737579346, "global_step": 11290, "epoch": 268} {"train_loss": -4.904818058013916, "global_step": 11291, "epoch": 268} {"train_loss": -5.0826945304870605, "global_step": 11292, "epoch": 268} {"train_loss": -5.226785659790039, "global_step": 11293, "epoch": 268} {"train_loss": -5.039839744567871, "global_step": 11294, "epoch": 268} {"train_loss": -4.969764709472656, "global_step": 11295, "epoch": 268} {"train_loss": -5.180919647216797, "global_step": 11296, "epoch": 268} {"train_loss": -5.0764049007779075, "global_step": 11297, "epoch": 268, "val_loss": 70349.4765625} {"train_loss": -5.059819221496582, "global_step": 11298, "epoch": 269} {"train_loss": -5.1086530685424805, "global_step": 11299, "epoch": 269} {"train_loss": -5.079484939575195, "global_step": 11300, "epoch": 269} {"train_loss": -5.003493309020996, "global_step": 11301, "epoch": 269} {"train_loss": -5.2654523849487305, "global_step": 11302, "epoch": 269} {"train_loss": -5.093121528625488, "global_step": 11303, "epoch": 269} {"train_loss": -5.026460647583008, "global_step": 11304, "epoch": 269} {"train_loss": -5.045805931091309, "global_step": 11305, "epoch": 269} {"train_loss": -5.155573844909668, "global_step": 11306, "epoch": 269} {"train_loss": -5.102039337158203, "global_step": 11307, "epoch": 269} {"train_loss": -5.2186279296875, "global_step": 11308, "epoch": 269} {"train_loss": -5.124285697937012, "global_step": 11309, "epoch": 269} {"train_loss": -5.061283111572266, "global_step": 11310, "epoch": 269} {"train_loss": -5.3150224685668945, "global_step": 11311, "epoch": 269} {"train_loss": -5.113957405090332, "global_step": 11312, "epoch": 269} {"train_loss": -5.034376621246338, "global_step": 11313, "epoch": 269} {"train_loss": -5.077861309051514, "global_step": 11314, "epoch": 269} {"train_loss": -5.2119951248168945, "global_step": 11315, "epoch": 269} {"train_loss": -5.027466773986816, "global_step": 11316, "epoch": 269} {"train_loss": -5.06199836730957, "global_step": 11317, "epoch": 269} {"train_loss": -5.193426132202148, "global_step": 11318, "epoch": 269} {"train_loss": -5.216373443603516, "global_step": 11319, "epoch": 269} {"train_loss": -5.100241184234619, "global_step": 11320, "epoch": 269} {"train_loss": -5.145919322967529, "global_step": 11321, "epoch": 269} {"train_loss": -5.084728240966797, "global_step": 11322, "epoch": 269} {"train_loss": -4.975154876708984, "global_step": 11323, "epoch": 269} {"train_loss": -4.93206262588501, "global_step": 11324, "epoch": 269} {"train_loss": -5.089750289916992, "global_step": 11325, "epoch": 269} {"train_loss": -5.083991050720215, "global_step": 11326, "epoch": 269} {"train_loss": -5.133721351623535, "global_step": 11327, "epoch": 269} {"train_loss": -5.017386436462402, "global_step": 11328, "epoch": 269} {"train_loss": -4.981104850769043, "global_step": 11329, "epoch": 269} {"train_loss": -5.015188217163086, "global_step": 11330, "epoch": 269} {"train_loss": -5.114052772521973, "global_step": 11331, "epoch": 269} {"train_loss": -5.072768211364746, "global_step": 11332, "epoch": 269} {"train_loss": -5.113310813903809, "global_step": 11333, "epoch": 269} {"train_loss": -5.11466121673584, "global_step": 11334, "epoch": 269} {"train_loss": -5.126869201660156, "global_step": 11335, "epoch": 269} {"train_loss": -5.186890125274658, "global_step": 11336, "epoch": 269} {"train_loss": -5.0244293212890625, "global_step": 11337, "epoch": 269} {"train_loss": -5.054892539978027, "global_step": 11338, "epoch": 269} {"train_loss": -5.096821251369658, "global_step": 11339, "epoch": 269, "val_loss": 70760.078125} {"train_loss": -5.144812107086182, "global_step": 11340, "epoch": 270} {"train_loss": -5.105617523193359, "global_step": 11341, "epoch": 270} {"train_loss": -4.924154281616211, "global_step": 11342, "epoch": 270} {"train_loss": -5.174691200256348, "global_step": 11343, "epoch": 270} {"train_loss": -5.17540979385376, "global_step": 11344, "epoch": 270} {"train_loss": -5.143511772155762, "global_step": 11345, "epoch": 270} {"train_loss": -5.089818954467773, "global_step": 11346, "epoch": 270} {"train_loss": -5.169288635253906, "global_step": 11347, "epoch": 270} {"train_loss": -5.197038650512695, "global_step": 11348, "epoch": 270} {"train_loss": -5.227713584899902, "global_step": 11349, "epoch": 270} {"train_loss": -5.1683783531188965, "global_step": 11350, "epoch": 270} {"train_loss": -5.165148735046387, "global_step": 11351, "epoch": 270} {"train_loss": -4.982635974884033, "global_step": 11352, "epoch": 270} {"train_loss": -5.095099449157715, "global_step": 11353, "epoch": 270} {"train_loss": -5.117621898651123, "global_step": 11354, "epoch": 270} {"train_loss": -5.1749749183654785, "global_step": 11355, "epoch": 270} {"train_loss": -4.920168876647949, "global_step": 11356, "epoch": 270} {"train_loss": -4.963726043701172, "global_step": 11357, "epoch": 270} {"train_loss": -5.1209716796875, "global_step": 11358, "epoch": 270} {"train_loss": -5.118193626403809, "global_step": 11359, "epoch": 270} {"train_loss": -5.089485168457031, "global_step": 11360, "epoch": 270} {"train_loss": -5.098421096801758, "global_step": 11361, "epoch": 270} {"train_loss": -5.149967193603516, "global_step": 11362, "epoch": 270} {"train_loss": -5.047974586486816, "global_step": 11363, "epoch": 270} {"train_loss": -5.092850685119629, "global_step": 11364, "epoch": 270} {"train_loss": -5.070058822631836, "global_step": 11365, "epoch": 270} {"train_loss": -5.086014270782471, "global_step": 11366, "epoch": 270} {"train_loss": -5.11885929107666, "global_step": 11367, "epoch": 270} {"train_loss": -5.15627384185791, "global_step": 11368, "epoch": 270} {"train_loss": -5.14039421081543, "global_step": 11369, "epoch": 270} {"train_loss": -5.1119232177734375, "global_step": 11370, "epoch": 270} {"train_loss": -5.210217475891113, "global_step": 11371, "epoch": 270} {"train_loss": -5.084364891052246, "global_step": 11372, "epoch": 270} {"train_loss": -5.078409671783447, "global_step": 11373, "epoch": 270} {"train_loss": -5.237261772155762, "global_step": 11374, "epoch": 270} {"train_loss": -5.134741306304932, "global_step": 11375, "epoch": 270} {"train_loss": -5.073123455047607, "global_step": 11376, "epoch": 270} {"train_loss": -5.209785461425781, "global_step": 11377, "epoch": 270} {"train_loss": -5.167815208435059, "global_step": 11378, "epoch": 270} {"train_loss": -5.002058982849121, "global_step": 11379, "epoch": 270} {"train_loss": -5.058811664581299, "global_step": 11380, "epoch": 270} {"train_loss": -5.111275786445255, "global_step": 11381, "epoch": 270, "val_loss": 70674.8046875} {"train_loss": -5.064915657043457, "global_step": 11382, "epoch": 271} {"train_loss": -5.077132225036621, "global_step": 11383, "epoch": 271} {"train_loss": -5.084399223327637, "global_step": 11384, "epoch": 271} {"train_loss": -4.960414886474609, "global_step": 11385, "epoch": 271} {"train_loss": -5.073156356811523, "global_step": 11386, "epoch": 271} {"train_loss": -4.931696891784668, "global_step": 11387, "epoch": 271} {"train_loss": -5.029913902282715, "global_step": 11388, "epoch": 271} {"train_loss": -5.187894821166992, "global_step": 11389, "epoch": 271} {"train_loss": -5.060966491699219, "global_step": 11390, "epoch": 271} {"train_loss": -4.983253479003906, "global_step": 11391, "epoch": 271} {"train_loss": -5.14455509185791, "global_step": 11392, "epoch": 271} {"train_loss": -5.125764846801758, "global_step": 11393, "epoch": 271} {"train_loss": -4.953248023986816, "global_step": 11394, "epoch": 271} {"train_loss": -5.0047149658203125, "global_step": 11395, "epoch": 271} {"train_loss": -5.126622200012207, "global_step": 11396, "epoch": 271} {"train_loss": -4.988458633422852, "global_step": 11397, "epoch": 271} {"train_loss": -5.0769243240356445, "global_step": 11398, "epoch": 271} {"train_loss": -4.949885368347168, "global_step": 11399, "epoch": 271} {"train_loss": -5.047266960144043, "global_step": 11400, "epoch": 271} {"train_loss": -5.093649864196777, "global_step": 11401, "epoch": 271} {"train_loss": -5.071662902832031, "global_step": 11402, "epoch": 271} {"train_loss": -4.967133522033691, "global_step": 11403, "epoch": 271} {"train_loss": -5.0877838134765625, "global_step": 11404, "epoch": 271} {"train_loss": -5.092410564422607, "global_step": 11405, "epoch": 271} {"train_loss": -4.995948791503906, "global_step": 11406, "epoch": 271} {"train_loss": -4.99428653717041, "global_step": 11407, "epoch": 271} {"train_loss": -5.108294486999512, "global_step": 11408, "epoch": 271} {"train_loss": -5.103765964508057, "global_step": 11409, "epoch": 271} {"train_loss": -5.1056742668151855, "global_step": 11410, "epoch": 271} {"train_loss": -5.146550178527832, "global_step": 11411, "epoch": 271} {"train_loss": -4.938898086547852, "global_step": 11412, "epoch": 271} {"train_loss": -4.987282752990723, "global_step": 11413, "epoch": 271} {"train_loss": -5.081131458282471, "global_step": 11414, "epoch": 271} {"train_loss": -5.270603179931641, "global_step": 11415, "epoch": 271} {"train_loss": -5.134991645812988, "global_step": 11416, "epoch": 271} {"train_loss": -5.042695999145508, "global_step": 11417, "epoch": 271} {"train_loss": -5.0770111083984375, "global_step": 11418, "epoch": 271} {"train_loss": -5.124873161315918, "global_step": 11419, "epoch": 271} {"train_loss": -5.077726364135742, "global_step": 11420, "epoch": 271} {"train_loss": -5.141425132751465, "global_step": 11421, "epoch": 271} {"train_loss": -5.147838592529297, "global_step": 11422, "epoch": 271} {"train_loss": -5.0674118882133845, "global_step": 11423, "epoch": 271, "val_loss": 70616.6953125} {"train_loss": -5.177721977233887, "global_step": 11424, "epoch": 272} {"train_loss": -5.094537258148193, "global_step": 11425, "epoch": 272} {"train_loss": -5.163174629211426, "global_step": 11426, "epoch": 272} {"train_loss": -5.03166389465332, "global_step": 11427, "epoch": 272} {"train_loss": -5.036283493041992, "global_step": 11428, "epoch": 272} {"train_loss": -5.070998191833496, "global_step": 11429, "epoch": 272} {"train_loss": -5.038948059082031, "global_step": 11430, "epoch": 272} {"train_loss": -5.025974273681641, "global_step": 11431, "epoch": 272} {"train_loss": -5.205404758453369, "global_step": 11432, "epoch": 272} {"train_loss": -5.042181015014648, "global_step": 11433, "epoch": 272} {"train_loss": -5.026264667510986, "global_step": 11434, "epoch": 272} {"train_loss": -5.215250015258789, "global_step": 11435, "epoch": 272} {"train_loss": -5.013946533203125, "global_step": 11436, "epoch": 272} {"train_loss": -4.8934478759765625, "global_step": 11437, "epoch": 272} {"train_loss": -5.079708099365234, "global_step": 11438, "epoch": 272} {"train_loss": -5.101139068603516, "global_step": 11439, "epoch": 272} {"train_loss": -5.052581310272217, "global_step": 11440, "epoch": 272} {"train_loss": -5.13275671005249, "global_step": 11441, "epoch": 272} {"train_loss": -5.098730564117432, "global_step": 11442, "epoch": 272} {"train_loss": -5.076051235198975, "global_step": 11443, "epoch": 272} {"train_loss": -5.123035430908203, "global_step": 11444, "epoch": 272} {"train_loss": -5.167928695678711, "global_step": 11445, "epoch": 272} {"train_loss": -5.006715297698975, "global_step": 11446, "epoch": 272} {"train_loss": -5.1082634925842285, "global_step": 11447, "epoch": 272} {"train_loss": -5.088145732879639, "global_step": 11448, "epoch": 272} {"train_loss": -5.1579155921936035, "global_step": 11449, "epoch": 272} {"train_loss": -4.941742897033691, "global_step": 11450, "epoch": 272} {"train_loss": -5.0989155769348145, "global_step": 11451, "epoch": 272} {"train_loss": -5.094143867492676, "global_step": 11452, "epoch": 272} {"train_loss": -5.095432758331299, "global_step": 11453, "epoch": 272} {"train_loss": -5.090755939483643, "global_step": 11454, "epoch": 272} {"train_loss": -5.009903907775879, "global_step": 11455, "epoch": 272} {"train_loss": -5.077993392944336, "global_step": 11456, "epoch": 272} {"train_loss": -5.042799949645996, "global_step": 11457, "epoch": 272} {"train_loss": -4.945122718811035, "global_step": 11458, "epoch": 272} {"train_loss": -4.915459156036377, "global_step": 11459, "epoch": 272} {"train_loss": -5.096330165863037, "global_step": 11460, "epoch": 272} {"train_loss": -5.120595932006836, "global_step": 11461, "epoch": 272} {"train_loss": -5.163440704345703, "global_step": 11462, "epoch": 272} {"train_loss": -5.048251152038574, "global_step": 11463, "epoch": 272} {"train_loss": -5.092039585113525, "global_step": 11464, "epoch": 272} {"train_loss": -5.073562656130109, "global_step": 11465, "epoch": 272, "val_loss": 71178.5859375} {"train_loss": -5.053952217102051, "global_step": 11466, "epoch": 273} {"train_loss": -5.164026260375977, "global_step": 11467, "epoch": 273} {"train_loss": -5.250896453857422, "global_step": 11468, "epoch": 273} {"train_loss": -5.100645065307617, "global_step": 11469, "epoch": 273} {"train_loss": -5.093789100646973, "global_step": 11470, "epoch": 273} {"train_loss": -5.079712390899658, "global_step": 11471, "epoch": 273} {"train_loss": -5.069580078125, "global_step": 11472, "epoch": 273} {"train_loss": -5.172121047973633, "global_step": 11473, "epoch": 273} {"train_loss": -5.082159042358398, "global_step": 11474, "epoch": 273} {"train_loss": -5.155589580535889, "global_step": 11475, "epoch": 273} {"train_loss": -5.09388542175293, "global_step": 11476, "epoch": 273} {"train_loss": -5.159825325012207, "global_step": 11477, "epoch": 273} {"train_loss": -5.1046552658081055, "global_step": 11478, "epoch": 273} {"train_loss": -5.037428855895996, "global_step": 11479, "epoch": 273} {"train_loss": -5.135369300842285, "global_step": 11480, "epoch": 273} {"train_loss": -5.224996566772461, "global_step": 11481, "epoch": 273} {"train_loss": -5.232140064239502, "global_step": 11482, "epoch": 273} {"train_loss": -5.095717430114746, "global_step": 11483, "epoch": 273} {"train_loss": -5.134166240692139, "global_step": 11484, "epoch": 273} {"train_loss": -5.096491813659668, "global_step": 11485, "epoch": 273} {"train_loss": -4.9400763511657715, "global_step": 11486, "epoch": 273} {"train_loss": -5.158969879150391, "global_step": 11487, "epoch": 273} {"train_loss": -5.107789039611816, "global_step": 11488, "epoch": 273} {"train_loss": -4.974088668823242, "global_step": 11489, "epoch": 273} {"train_loss": -4.955239772796631, "global_step": 11490, "epoch": 273} {"train_loss": -4.940778732299805, "global_step": 11491, "epoch": 273} {"train_loss": -5.0913496017456055, "global_step": 11492, "epoch": 273} {"train_loss": -5.141213417053223, "global_step": 11493, "epoch": 273} {"train_loss": -4.890293121337891, "global_step": 11494, "epoch": 273} {"train_loss": -4.935177803039551, "global_step": 11495, "epoch": 273} {"train_loss": -5.142627716064453, "global_step": 11496, "epoch": 273} {"train_loss": -4.928089141845703, "global_step": 11497, "epoch": 273} {"train_loss": -5.042506217956543, "global_step": 11498, "epoch": 273} {"train_loss": -4.9832587242126465, "global_step": 11499, "epoch": 273} {"train_loss": -5.0961456298828125, "global_step": 11500, "epoch": 273} {"train_loss": -5.018796920776367, "global_step": 11501, "epoch": 273} {"train_loss": -5.198332786560059, "global_step": 11502, "epoch": 273} {"train_loss": -4.9436726570129395, "global_step": 11503, "epoch": 273} {"train_loss": -5.155195236206055, "global_step": 11504, "epoch": 273} {"train_loss": -5.057358741760254, "global_step": 11505, "epoch": 273} {"train_loss": -5.089512825012207, "global_step": 11506, "epoch": 273} {"train_loss": -5.083408185413906, "global_step": 11507, "epoch": 273, "val_loss": 70956.9765625} {"train_loss": -5.156418800354004, "global_step": 11508, "epoch": 274} {"train_loss": -5.113738059997559, "global_step": 11509, "epoch": 274} {"train_loss": -5.277606964111328, "global_step": 11510, "epoch": 274} {"train_loss": -5.004398345947266, "global_step": 11511, "epoch": 274} {"train_loss": -5.0920796394348145, "global_step": 11512, "epoch": 274} {"train_loss": -5.171483039855957, "global_step": 11513, "epoch": 274} {"train_loss": -5.148603916168213, "global_step": 11514, "epoch": 274} {"train_loss": -5.025474548339844, "global_step": 11515, "epoch": 274} {"train_loss": -5.205007076263428, "global_step": 11516, "epoch": 274} {"train_loss": -5.1147379875183105, "global_step": 11517, "epoch": 274} {"train_loss": -5.088237762451172, "global_step": 11518, "epoch": 274} {"train_loss": -5.063602447509766, "global_step": 11519, "epoch": 274} {"train_loss": -5.0243024826049805, "global_step": 11520, "epoch": 274} {"train_loss": -5.0411057472229, "global_step": 11521, "epoch": 274} {"train_loss": -4.990513324737549, "global_step": 11522, "epoch": 274} {"train_loss": -5.208431243896484, "global_step": 11523, "epoch": 274} {"train_loss": -5.14928674697876, "global_step": 11524, "epoch": 274} {"train_loss": -5.216819763183594, "global_step": 11525, "epoch": 274} {"train_loss": -5.044083595275879, "global_step": 11526, "epoch": 274} {"train_loss": -5.160515785217285, "global_step": 11527, "epoch": 274} {"train_loss": -5.153679370880127, "global_step": 11528, "epoch": 274} {"train_loss": -4.980914115905762, "global_step": 11529, "epoch": 274} {"train_loss": -5.0799994468688965, "global_step": 11530, "epoch": 274} {"train_loss": -5.039941787719727, "global_step": 11531, "epoch": 274} {"train_loss": -5.1622419357299805, "global_step": 11532, "epoch": 274} {"train_loss": -5.174972057342529, "global_step": 11533, "epoch": 274} {"train_loss": -5.083536624908447, "global_step": 11534, "epoch": 274} {"train_loss": -5.007377624511719, "global_step": 11535, "epoch": 274} {"train_loss": -5.038407802581787, "global_step": 11536, "epoch": 274} {"train_loss": -5.0662641525268555, "global_step": 11537, "epoch": 274} {"train_loss": -5.1197686195373535, "global_step": 11538, "epoch": 274} {"train_loss": -5.022992134094238, "global_step": 11539, "epoch": 274} {"train_loss": -5.022911548614502, "global_step": 11540, "epoch": 274} {"train_loss": -5.132761001586914, "global_step": 11541, "epoch": 274} {"train_loss": -5.163200378417969, "global_step": 11542, "epoch": 274} {"train_loss": -5.040164947509766, "global_step": 11543, "epoch": 274} {"train_loss": -5.102909088134766, "global_step": 11544, "epoch": 274} {"train_loss": -5.147489070892334, "global_step": 11545, "epoch": 274} {"train_loss": -5.094979286193848, "global_step": 11546, "epoch": 274} {"train_loss": -5.0432891845703125, "global_step": 11547, "epoch": 274} {"train_loss": -5.096965312957764, "global_step": 11548, "epoch": 274} {"train_loss": -5.101460604440598, "global_step": 11549, "epoch": 274, "val_loss": 70541.5546875} {"train_loss": -4.979545593261719, "global_step": 11550, "epoch": 275} {"train_loss": -5.162283897399902, "global_step": 11551, "epoch": 275} {"train_loss": -5.111979007720947, "global_step": 11552, "epoch": 275} {"train_loss": -5.153273582458496, "global_step": 11553, "epoch": 275} {"train_loss": -5.086353778839111, "global_step": 11554, "epoch": 275} {"train_loss": -5.1319074630737305, "global_step": 11555, "epoch": 275} {"train_loss": -5.127922534942627, "global_step": 11556, "epoch": 275} {"train_loss": -5.1680908203125, "global_step": 11557, "epoch": 275} {"train_loss": -5.182989597320557, "global_step": 11558, "epoch": 275} {"train_loss": -5.082367420196533, "global_step": 11559, "epoch": 275} {"train_loss": -5.041351318359375, "global_step": 11560, "epoch": 275} {"train_loss": -5.169044494628906, "global_step": 11561, "epoch": 275} {"train_loss": -4.973320007324219, "global_step": 11562, "epoch": 275} {"train_loss": -5.085709095001221, "global_step": 11563, "epoch": 275} {"train_loss": -5.081808090209961, "global_step": 11564, "epoch": 275} {"train_loss": -5.143651008605957, "global_step": 11565, "epoch": 275} {"train_loss": -5.189307689666748, "global_step": 11566, "epoch": 275} {"train_loss": -5.095113754272461, "global_step": 11567, "epoch": 275} {"train_loss": -5.009075164794922, "global_step": 11568, "epoch": 275} {"train_loss": -5.15281867980957, "global_step": 11569, "epoch": 275} {"train_loss": -5.151318073272705, "global_step": 11570, "epoch": 275} {"train_loss": -5.176177024841309, "global_step": 11571, "epoch": 275} {"train_loss": -5.0945210456848145, "global_step": 11572, "epoch": 275} {"train_loss": -5.1648054122924805, "global_step": 11573, "epoch": 275} {"train_loss": -5.0274858474731445, "global_step": 11574, "epoch": 275} {"train_loss": -5.138190269470215, "global_step": 11575, "epoch": 275} {"train_loss": -5.02069091796875, "global_step": 11576, "epoch": 275} {"train_loss": -5.163558483123779, "global_step": 11577, "epoch": 275} {"train_loss": -5.033991813659668, "global_step": 11578, "epoch": 275} {"train_loss": -5.028848648071289, "global_step": 11579, "epoch": 275} {"train_loss": -5.073378562927246, "global_step": 11580, "epoch": 275} {"train_loss": -5.1493730545043945, "global_step": 11581, "epoch": 275} {"train_loss": -4.937146186828613, "global_step": 11582, "epoch": 275} {"train_loss": -5.051349639892578, "global_step": 11583, "epoch": 275} {"train_loss": -5.1550140380859375, "global_step": 11584, "epoch": 275} {"train_loss": -5.135691165924072, "global_step": 11585, "epoch": 275} {"train_loss": -4.988260269165039, "global_step": 11586, "epoch": 275} {"train_loss": -5.219657897949219, "global_step": 11587, "epoch": 275} {"train_loss": -4.992427825927734, "global_step": 11588, "epoch": 275} {"train_loss": -4.989563465118408, "global_step": 11589, "epoch": 275} {"train_loss": -5.096424102783203, "global_step": 11590, "epoch": 275} {"train_loss": -5.093929495130267, "global_step": 11591, "epoch": 275, "val_loss": 71324.703125} {"train_loss": -5.1663970947265625, "global_step": 11592, "epoch": 276} {"train_loss": -5.008173942565918, "global_step": 11593, "epoch": 276} {"train_loss": -5.144176483154297, "global_step": 11594, "epoch": 276} {"train_loss": -5.048413276672363, "global_step": 11595, "epoch": 276} {"train_loss": -5.006439208984375, "global_step": 11596, "epoch": 276} {"train_loss": -5.002270221710205, "global_step": 11597, "epoch": 276} {"train_loss": -4.983410358428955, "global_step": 11598, "epoch": 276} {"train_loss": -5.064882278442383, "global_step": 11599, "epoch": 276} {"train_loss": -5.010902404785156, "global_step": 11600, "epoch": 276} {"train_loss": -4.997674942016602, "global_step": 11601, "epoch": 276} {"train_loss": -5.17720890045166, "global_step": 11602, "epoch": 276} {"train_loss": -4.9602179527282715, "global_step": 11603, "epoch": 276} {"train_loss": -5.086864471435547, "global_step": 11604, "epoch": 276} {"train_loss": -5.093967437744141, "global_step": 11605, "epoch": 276} {"train_loss": -5.2853851318359375, "global_step": 11606, "epoch": 276} {"train_loss": -4.971912384033203, "global_step": 11607, "epoch": 276} {"train_loss": -5.029773712158203, "global_step": 11608, "epoch": 276} {"train_loss": -5.091904640197754, "global_step": 11609, "epoch": 276} {"train_loss": -5.0789618492126465, "global_step": 11610, "epoch": 276} {"train_loss": -5.1154398918151855, "global_step": 11611, "epoch": 276} {"train_loss": -5.2114338874816895, "global_step": 11612, "epoch": 276} {"train_loss": -5.151475429534912, "global_step": 11613, "epoch": 276} {"train_loss": -5.111559867858887, "global_step": 11614, "epoch": 276} {"train_loss": -5.184040546417236, "global_step": 11615, "epoch": 276} {"train_loss": -5.082084655761719, "global_step": 11616, "epoch": 276} {"train_loss": -5.154794692993164, "global_step": 11617, "epoch": 276} {"train_loss": -5.132341384887695, "global_step": 11618, "epoch": 276} {"train_loss": -5.19179630279541, "global_step": 11619, "epoch": 276} {"train_loss": -5.195797920227051, "global_step": 11620, "epoch": 276} {"train_loss": -4.958850860595703, "global_step": 11621, "epoch": 276} {"train_loss": -5.1127166748046875, "global_step": 11622, "epoch": 276} {"train_loss": -5.057307720184326, "global_step": 11623, "epoch": 276} {"train_loss": -5.0063066482543945, "global_step": 11624, "epoch": 276} {"train_loss": -5.110983848571777, "global_step": 11625, "epoch": 276} {"train_loss": -5.0999040603637695, "global_step": 11626, "epoch": 276} {"train_loss": -5.0856828689575195, "global_step": 11627, "epoch": 276} {"train_loss": -5.120413303375244, "global_step": 11628, "epoch": 276} {"train_loss": -5.073692798614502, "global_step": 11629, "epoch": 276} {"train_loss": -5.076960563659668, "global_step": 11630, "epoch": 276} {"train_loss": -5.206778526306152, "global_step": 11631, "epoch": 276} {"train_loss": -5.125599384307861, "global_step": 11632, "epoch": 276} {"train_loss": -5.09043010075887, "global_step": 11633, "epoch": 276, "val_loss": 70684.6953125} {"train_loss": -5.159788131713867, "global_step": 11634, "epoch": 277} {"train_loss": -5.120300769805908, "global_step": 11635, "epoch": 277} {"train_loss": -5.147500038146973, "global_step": 11636, "epoch": 277} {"train_loss": -5.139469146728516, "global_step": 11637, "epoch": 277} {"train_loss": -5.136462211608887, "global_step": 11638, "epoch": 277} {"train_loss": -5.154663562774658, "global_step": 11639, "epoch": 277} {"train_loss": -5.000010013580322, "global_step": 11640, "epoch": 277} {"train_loss": -4.939736843109131, "global_step": 11641, "epoch": 277} {"train_loss": -5.282271385192871, "global_step": 11642, "epoch": 277} {"train_loss": -5.247183322906494, "global_step": 11643, "epoch": 277} {"train_loss": -5.071045398712158, "global_step": 11644, "epoch": 277} {"train_loss": -4.911412239074707, "global_step": 11645, "epoch": 277} {"train_loss": -4.9020514488220215, "global_step": 11646, "epoch": 277} {"train_loss": -5.139190673828125, "global_step": 11647, "epoch": 277} {"train_loss": -4.803296089172363, "global_step": 11648, "epoch": 277} {"train_loss": -4.930142402648926, "global_step": 11649, "epoch": 277} {"train_loss": -5.166431427001953, "global_step": 11650, "epoch": 277} {"train_loss": -4.948113918304443, "global_step": 11651, "epoch": 277} {"train_loss": -5.070079326629639, "global_step": 11652, "epoch": 277} {"train_loss": -5.007238388061523, "global_step": 11653, "epoch": 277} {"train_loss": -5.028568267822266, "global_step": 11654, "epoch": 277} {"train_loss": -5.1400628089904785, "global_step": 11655, "epoch": 277} {"train_loss": -5.027419567108154, "global_step": 11656, "epoch": 277} {"train_loss": -4.962217807769775, "global_step": 11657, "epoch": 277} {"train_loss": -5.035586357116699, "global_step": 11658, "epoch": 277} {"train_loss": -5.142664432525635, "global_step": 11659, "epoch": 277} {"train_loss": -5.011374473571777, "global_step": 11660, "epoch": 277} {"train_loss": -5.1699442863464355, "global_step": 11661, "epoch": 277} {"train_loss": -5.198470115661621, "global_step": 11662, "epoch": 277} {"train_loss": -5.342101097106934, "global_step": 11663, "epoch": 277} {"train_loss": -5.075515270233154, "global_step": 11664, "epoch": 277} {"train_loss": -5.158086776733398, "global_step": 11665, "epoch": 277} {"train_loss": -5.163019180297852, "global_step": 11666, "epoch": 277} {"train_loss": -5.041709899902344, "global_step": 11667, "epoch": 277} {"train_loss": -5.113297462463379, "global_step": 11668, "epoch": 277} {"train_loss": -5.124236583709717, "global_step": 11669, "epoch": 277} {"train_loss": -5.055963039398193, "global_step": 11670, "epoch": 277} {"train_loss": -5.164271354675293, "global_step": 11671, "epoch": 277} {"train_loss": -5.155577659606934, "global_step": 11672, "epoch": 277} {"train_loss": -5.100070953369141, "global_step": 11673, "epoch": 277} {"train_loss": -5.062898635864258, "global_step": 11674, "epoch": 277} {"train_loss": -5.085142135620117, "global_step": 11675, "epoch": 277, "val_loss": 70809.859375} {"train_loss": -5.0810441970825195, "global_step": 11676, "epoch": 278} {"train_loss": -5.063576698303223, "global_step": 11677, "epoch": 278} {"train_loss": -5.144003391265869, "global_step": 11678, "epoch": 278} {"train_loss": -5.085700035095215, "global_step": 11679, "epoch": 278} {"train_loss": -5.123566627502441, "global_step": 11680, "epoch": 278} {"train_loss": -5.0635762214660645, "global_step": 11681, "epoch": 278} {"train_loss": -4.970348358154297, "global_step": 11682, "epoch": 278} {"train_loss": -5.070838451385498, "global_step": 11683, "epoch": 278} {"train_loss": -5.235469818115234, "global_step": 11684, "epoch": 278} {"train_loss": -5.250555038452148, "global_step": 11685, "epoch": 278} {"train_loss": -4.908910751342773, "global_step": 11686, "epoch": 278} {"train_loss": -4.927437782287598, "global_step": 11687, "epoch": 278} {"train_loss": -5.213973045349121, "global_step": 11688, "epoch": 278} {"train_loss": -4.981203079223633, "global_step": 11689, "epoch": 278} {"train_loss": -4.9186811447143555, "global_step": 11690, "epoch": 278} {"train_loss": -5.080755710601807, "global_step": 11691, "epoch": 278} {"train_loss": -4.958878517150879, "global_step": 11692, "epoch": 278} {"train_loss": -5.026122093200684, "global_step": 11693, "epoch": 278} {"train_loss": -5.136107921600342, "global_step": 11694, "epoch": 278} {"train_loss": -4.974004745483398, "global_step": 11695, "epoch": 278} {"train_loss": -5.1056108474731445, "global_step": 11696, "epoch": 278} {"train_loss": -5.071475028991699, "global_step": 11697, "epoch": 278} {"train_loss": -4.977929592132568, "global_step": 11698, "epoch": 278} {"train_loss": -4.993149280548096, "global_step": 11699, "epoch": 278} {"train_loss": -5.091655254364014, "global_step": 11700, "epoch": 278} {"train_loss": -4.934615135192871, "global_step": 11701, "epoch": 278} {"train_loss": -5.170438289642334, "global_step": 11702, "epoch": 278} {"train_loss": -4.970986366271973, "global_step": 11703, "epoch": 278} {"train_loss": -5.114956855773926, "global_step": 11704, "epoch": 278} {"train_loss": -5.117537975311279, "global_step": 11705, "epoch": 278} {"train_loss": -4.933382034301758, "global_step": 11706, "epoch": 278} {"train_loss": -5.17691707611084, "global_step": 11707, "epoch": 278} {"train_loss": -5.026803493499756, "global_step": 11708, "epoch": 278} {"train_loss": -5.19029426574707, "global_step": 11709, "epoch": 278} {"train_loss": -4.995989799499512, "global_step": 11710, "epoch": 278} {"train_loss": -4.976045608520508, "global_step": 11711, "epoch": 278} {"train_loss": -5.045692443847656, "global_step": 11712, "epoch": 278} {"train_loss": -5.07990837097168, "global_step": 11713, "epoch": 278} {"train_loss": -5.079398155212402, "global_step": 11714, "epoch": 278} {"train_loss": -5.1447882652282715, "global_step": 11715, "epoch": 278} {"train_loss": -4.968517303466797, "global_step": 11716, "epoch": 278} {"train_loss": -5.061216331663585, "global_step": 11717, "epoch": 278, "val_loss": 71760.6328125} {"train_loss": -5.0646233558654785, "global_step": 11718, "epoch": 279} {"train_loss": -5.031030654907227, "global_step": 11719, "epoch": 279} {"train_loss": -4.867185592651367, "global_step": 11720, "epoch": 279} {"train_loss": -5.168240547180176, "global_step": 11721, "epoch": 279} {"train_loss": -5.15975284576416, "global_step": 11722, "epoch": 279} {"train_loss": -5.128565311431885, "global_step": 11723, "epoch": 279} {"train_loss": -5.228298187255859, "global_step": 11724, "epoch": 279} {"train_loss": -4.94508171081543, "global_step": 11725, "epoch": 279} {"train_loss": -4.821536540985107, "global_step": 11726, "epoch": 279} {"train_loss": -4.984899520874023, "global_step": 11727, "epoch": 279} {"train_loss": -5.071258544921875, "global_step": 11728, "epoch": 279} {"train_loss": -4.861560821533203, "global_step": 11729, "epoch": 279} {"train_loss": -4.978144645690918, "global_step": 11730, "epoch": 279} {"train_loss": -4.951525688171387, "global_step": 11731, "epoch": 279} {"train_loss": -4.947525978088379, "global_step": 11732, "epoch": 279} {"train_loss": -5.104068756103516, "global_step": 11733, "epoch": 279} {"train_loss": -5.0838470458984375, "global_step": 11734, "epoch": 279} {"train_loss": -4.928629398345947, "global_step": 11735, "epoch": 279} {"train_loss": -4.938834190368652, "global_step": 11736, "epoch": 279} {"train_loss": -5.092357635498047, "global_step": 11737, "epoch": 279} {"train_loss": -4.956320285797119, "global_step": 11738, "epoch": 279} {"train_loss": -4.962653160095215, "global_step": 11739, "epoch": 279} {"train_loss": -4.9910993576049805, "global_step": 11740, "epoch": 279} {"train_loss": -5.047199726104736, "global_step": 11741, "epoch": 279} {"train_loss": -4.9688920974731445, "global_step": 11742, "epoch": 279} {"train_loss": -5.131442070007324, "global_step": 11743, "epoch": 279} {"train_loss": -5.223848819732666, "global_step": 11744, "epoch": 279} {"train_loss": -4.975404739379883, "global_step": 11745, "epoch": 279} {"train_loss": -5.035223007202148, "global_step": 11746, "epoch": 279} {"train_loss": -5.076897621154785, "global_step": 11747, "epoch": 279} {"train_loss": -5.044600486755371, "global_step": 11748, "epoch": 279} {"train_loss": -5.025656223297119, "global_step": 11749, "epoch": 279} {"train_loss": -5.199559211730957, "global_step": 11750, "epoch": 279} {"train_loss": -4.997713088989258, "global_step": 11751, "epoch": 279} {"train_loss": -5.010700225830078, "global_step": 11752, "epoch": 279} {"train_loss": -4.94918155670166, "global_step": 11753, "epoch": 279} {"train_loss": -5.086376190185547, "global_step": 11754, "epoch": 279} {"train_loss": -5.1145710945129395, "global_step": 11755, "epoch": 279} {"train_loss": -5.088897705078125, "global_step": 11756, "epoch": 279} {"train_loss": -5.185894966125488, "global_step": 11757, "epoch": 279} {"train_loss": -5.117455959320068, "global_step": 11758, "epoch": 279} {"train_loss": -5.040189901987712, "global_step": 11759, "epoch": 279, "val_loss": 71480.5078125} {"train_loss": -5.042881965637207, "global_step": 11760, "epoch": 280} {"train_loss": -5.004223823547363, "global_step": 11761, "epoch": 280} {"train_loss": -5.079327583312988, "global_step": 11762, "epoch": 280} {"train_loss": -4.939545154571533, "global_step": 11763, "epoch": 280} {"train_loss": -5.0530595779418945, "global_step": 11764, "epoch": 280} {"train_loss": -5.076174259185791, "global_step": 11765, "epoch": 280} {"train_loss": -5.0213117599487305, "global_step": 11766, "epoch": 280} {"train_loss": -5.104741096496582, "global_step": 11767, "epoch": 280} {"train_loss": -5.140764236450195, "global_step": 11768, "epoch": 280} {"train_loss": -4.981581687927246, "global_step": 11769, "epoch": 280} {"train_loss": -5.095851421356201, "global_step": 11770, "epoch": 280} {"train_loss": -5.028135299682617, "global_step": 11771, "epoch": 280} {"train_loss": -5.121816635131836, "global_step": 11772, "epoch": 280} {"train_loss": -5.242521286010742, "global_step": 11773, "epoch": 280} {"train_loss": -5.207272529602051, "global_step": 11774, "epoch": 280} {"train_loss": -5.150854587554932, "global_step": 11775, "epoch": 280} {"train_loss": -5.205597877502441, "global_step": 11776, "epoch": 280} {"train_loss": -5.0395402908325195, "global_step": 11777, "epoch": 280} {"train_loss": -5.2888383865356445, "global_step": 11778, "epoch": 280} {"train_loss": -5.168825149536133, "global_step": 11779, "epoch": 280} {"train_loss": -5.239009380340576, "global_step": 11780, "epoch": 280} {"train_loss": -5.084780216217041, "global_step": 11781, "epoch": 280} {"train_loss": -5.139402389526367, "global_step": 11782, "epoch": 280} {"train_loss": -5.039891242980957, "global_step": 11783, "epoch": 280} {"train_loss": -5.032054901123047, "global_step": 11784, "epoch": 280} {"train_loss": -5.099510192871094, "global_step": 11785, "epoch": 280} {"train_loss": -4.913211822509766, "global_step": 11786, "epoch": 280} {"train_loss": -5.088052272796631, "global_step": 11787, "epoch": 280} {"train_loss": -5.166475296020508, "global_step": 11788, "epoch": 280} {"train_loss": -5.028742790222168, "global_step": 11789, "epoch": 280} {"train_loss": -5.0437493324279785, "global_step": 11790, "epoch": 280} {"train_loss": -4.9965362548828125, "global_step": 11791, "epoch": 280} {"train_loss": -5.039613723754883, "global_step": 11792, "epoch": 280} {"train_loss": -4.937304496765137, "global_step": 11793, "epoch": 280} {"train_loss": -5.189303398132324, "global_step": 11794, "epoch": 280} {"train_loss": -5.001169204711914, "global_step": 11795, "epoch": 280} {"train_loss": -4.935762405395508, "global_step": 11796, "epoch": 280} {"train_loss": -5.193848609924316, "global_step": 11797, "epoch": 280} {"train_loss": -4.828400611877441, "global_step": 11798, "epoch": 280} {"train_loss": -4.900289535522461, "global_step": 11799, "epoch": 280} {"train_loss": -5.09878396987915, "global_step": 11800, "epoch": 280} {"train_loss": -5.064114377612159, "global_step": 11801, "epoch": 280, "val_loss": 70418.4296875} {"train_loss": -5.112848281860352, "global_step": 11802, "epoch": 281} {"train_loss": -4.780107498168945, "global_step": 11803, "epoch": 281} {"train_loss": -4.941579818725586, "global_step": 11804, "epoch": 281} {"train_loss": -5.001744270324707, "global_step": 11805, "epoch": 281} {"train_loss": -4.8964524269104, "global_step": 11806, "epoch": 281} {"train_loss": -4.987022399902344, "global_step": 11807, "epoch": 281} {"train_loss": -4.945857048034668, "global_step": 11808, "epoch": 281} {"train_loss": -5.041134357452393, "global_step": 11809, "epoch": 281} {"train_loss": -4.932336330413818, "global_step": 11810, "epoch": 281} {"train_loss": -5.0137939453125, "global_step": 11811, "epoch": 281} {"train_loss": -4.875475883483887, "global_step": 11812, "epoch": 281} {"train_loss": -5.113974571228027, "global_step": 11813, "epoch": 281} {"train_loss": -4.944156646728516, "global_step": 11814, "epoch": 281} {"train_loss": -5.126006126403809, "global_step": 11815, "epoch": 281} {"train_loss": -5.000052452087402, "global_step": 11816, "epoch": 281} {"train_loss": -5.214588165283203, "global_step": 11817, "epoch": 281} {"train_loss": -5.0604448318481445, "global_step": 11818, "epoch": 281} {"train_loss": -5.206907272338867, "global_step": 11819, "epoch": 281} {"train_loss": -4.925695896148682, "global_step": 11820, "epoch": 281} {"train_loss": -5.067708969116211, "global_step": 11821, "epoch": 281} {"train_loss": -5.097884654998779, "global_step": 11822, "epoch": 281} {"train_loss": -5.043253421783447, "global_step": 11823, "epoch": 281} {"train_loss": -5.10915994644165, "global_step": 11824, "epoch": 281} {"train_loss": -5.076251983642578, "global_step": 11825, "epoch": 281} {"train_loss": -5.122851848602295, "global_step": 11826, "epoch": 281} {"train_loss": -4.983573913574219, "global_step": 11827, "epoch": 281} {"train_loss": -5.093827247619629, "global_step": 11828, "epoch": 281} {"train_loss": -4.871471405029297, "global_step": 11829, "epoch": 281} {"train_loss": -5.00301456451416, "global_step": 11830, "epoch": 281} {"train_loss": -5.1382012367248535, "global_step": 11831, "epoch": 281} {"train_loss": -5.1199469566345215, "global_step": 11832, "epoch": 281} {"train_loss": -5.09988260269165, "global_step": 11833, "epoch": 281} {"train_loss": -5.042441368103027, "global_step": 11834, "epoch": 281} {"train_loss": -5.152400970458984, "global_step": 11835, "epoch": 281} {"train_loss": -5.106427192687988, "global_step": 11836, "epoch": 281} {"train_loss": -4.9085493087768555, "global_step": 11837, "epoch": 281} {"train_loss": -5.149527549743652, "global_step": 11838, "epoch": 281} {"train_loss": -5.070590019226074, "global_step": 11839, "epoch": 281} {"train_loss": -5.15621280670166, "global_step": 11840, "epoch": 281} {"train_loss": -5.097330570220947, "global_step": 11841, "epoch": 281} {"train_loss": -5.098715782165527, "global_step": 11842, "epoch": 281} {"train_loss": -5.0422902674902055, "global_step": 11843, "epoch": 281, "val_loss": 70769.46875} {"train_loss": -5.16253662109375, "global_step": 11844, "epoch": 282} {"train_loss": -5.086430549621582, "global_step": 11845, "epoch": 282} {"train_loss": -5.31027364730835, "global_step": 11846, "epoch": 282} {"train_loss": -5.12104606628418, "global_step": 11847, "epoch": 282} {"train_loss": -5.0192551612854, "global_step": 11848, "epoch": 282} {"train_loss": -4.962104320526123, "global_step": 11849, "epoch": 282} {"train_loss": -5.1873087882995605, "global_step": 11850, "epoch": 282} {"train_loss": -5.152458190917969, "global_step": 11851, "epoch": 282} {"train_loss": -5.236392498016357, "global_step": 11852, "epoch": 282} {"train_loss": -5.1933794021606445, "global_step": 11853, "epoch": 282} {"train_loss": -4.961357116699219, "global_step": 11854, "epoch": 282} {"train_loss": -5.221256732940674, "global_step": 11855, "epoch": 282} {"train_loss": -5.232419967651367, "global_step": 11856, "epoch": 282} {"train_loss": -4.945190906524658, "global_step": 11857, "epoch": 282} {"train_loss": -5.212483882904053, "global_step": 11858, "epoch": 282} {"train_loss": -5.0441389083862305, "global_step": 11859, "epoch": 282} {"train_loss": -5.046517848968506, "global_step": 11860, "epoch": 282} {"train_loss": -4.976105690002441, "global_step": 11861, "epoch": 282} {"train_loss": -5.13862943649292, "global_step": 11862, "epoch": 282} {"train_loss": -5.007109642028809, "global_step": 11863, "epoch": 282} {"train_loss": -5.160589218139648, "global_step": 11864, "epoch": 282} {"train_loss": -5.082632541656494, "global_step": 11865, "epoch": 282} {"train_loss": -5.113898277282715, "global_step": 11866, "epoch": 282} {"train_loss": -5.0166215896606445, "global_step": 11867, "epoch": 282} {"train_loss": -5.090629577636719, "global_step": 11868, "epoch": 282} {"train_loss": -5.140830993652344, "global_step": 11869, "epoch": 282} {"train_loss": -5.063745975494385, "global_step": 11870, "epoch": 282} {"train_loss": -5.097620964050293, "global_step": 11871, "epoch": 282} {"train_loss": -5.01168155670166, "global_step": 11872, "epoch": 282} {"train_loss": -5.113853931427002, "global_step": 11873, "epoch": 282} {"train_loss": -5.171184539794922, "global_step": 11874, "epoch": 282} {"train_loss": -5.08724308013916, "global_step": 11875, "epoch": 282} {"train_loss": -5.054750919342041, "global_step": 11876, "epoch": 282} {"train_loss": -5.036233901977539, "global_step": 11877, "epoch": 282} {"train_loss": -5.19134521484375, "global_step": 11878, "epoch": 282} {"train_loss": -5.224088191986084, "global_step": 11879, "epoch": 282} {"train_loss": -5.248508930206299, "global_step": 11880, "epoch": 282} {"train_loss": -5.130383491516113, "global_step": 11881, "epoch": 282} {"train_loss": -5.09328031539917, "global_step": 11882, "epoch": 282} {"train_loss": -5.133657455444336, "global_step": 11883, "epoch": 282} {"train_loss": -5.0631103515625, "global_step": 11884, "epoch": 282} {"train_loss": -5.108701615106492, "global_step": 11885, "epoch": 282, "val_loss": 70448.859375} {"train_loss": -5.0889739990234375, "global_step": 11886, "epoch": 283} {"train_loss": -5.098372459411621, "global_step": 11887, "epoch": 283} {"train_loss": -5.109810829162598, "global_step": 11888, "epoch": 283} {"train_loss": -5.049908638000488, "global_step": 11889, "epoch": 283} {"train_loss": -5.181039333343506, "global_step": 11890, "epoch": 283} {"train_loss": -5.1063947677612305, "global_step": 11891, "epoch": 283} {"train_loss": -5.114243030548096, "global_step": 11892, "epoch": 283} {"train_loss": -5.2047810554504395, "global_step": 11893, "epoch": 283} {"train_loss": -5.170819282531738, "global_step": 11894, "epoch": 283} {"train_loss": -5.129085540771484, "global_step": 11895, "epoch": 283} {"train_loss": -5.05706262588501, "global_step": 11896, "epoch": 283} {"train_loss": -5.138385772705078, "global_step": 11897, "epoch": 283} {"train_loss": -5.244687557220459, "global_step": 11898, "epoch": 283} {"train_loss": -5.138352394104004, "global_step": 11899, "epoch": 283} {"train_loss": -5.037029266357422, "global_step": 11900, "epoch": 283} {"train_loss": -5.144795894622803, "global_step": 11901, "epoch": 283} {"train_loss": -5.116170883178711, "global_step": 11902, "epoch": 283} {"train_loss": -5.072526931762695, "global_step": 11903, "epoch": 283} {"train_loss": -4.785268783569336, "global_step": 11904, "epoch": 283} {"train_loss": -5.02936315536499, "global_step": 11905, "epoch": 283} {"train_loss": -5.143926620483398, "global_step": 11906, "epoch": 283} {"train_loss": -4.994625091552734, "global_step": 11907, "epoch": 283} {"train_loss": -4.844897270202637, "global_step": 11908, "epoch": 283} {"train_loss": -5.09008264541626, "global_step": 11909, "epoch": 283} {"train_loss": -5.039978981018066, "global_step": 11910, "epoch": 283} {"train_loss": -4.96707010269165, "global_step": 11911, "epoch": 283} {"train_loss": -5.2168965339660645, "global_step": 11912, "epoch": 283} {"train_loss": -5.035440444946289, "global_step": 11913, "epoch": 283} {"train_loss": -4.992948055267334, "global_step": 11914, "epoch": 283} {"train_loss": -5.327770233154297, "global_step": 11915, "epoch": 283} {"train_loss": -4.951866626739502, "global_step": 11916, "epoch": 283} {"train_loss": -4.9320549964904785, "global_step": 11917, "epoch": 283} {"train_loss": -5.040767669677734, "global_step": 11918, "epoch": 283} {"train_loss": -4.865508079528809, "global_step": 11919, "epoch": 283} {"train_loss": -5.008198261260986, "global_step": 11920, "epoch": 283} {"train_loss": -5.061748504638672, "global_step": 11921, "epoch": 283} {"train_loss": -5.112068176269531, "global_step": 11922, "epoch": 283} {"train_loss": -5.0871992111206055, "global_step": 11923, "epoch": 283} {"train_loss": -5.018393516540527, "global_step": 11924, "epoch": 283} {"train_loss": -5.155514240264893, "global_step": 11925, "epoch": 283} {"train_loss": -5.059943675994873, "global_step": 11926, "epoch": 283} {"train_loss": -5.070623375120617, "global_step": 11927, "epoch": 283, "val_loss": 70179.8125} {"train_loss": -5.192165374755859, "global_step": 11928, "epoch": 284} {"train_loss": -5.120612621307373, "global_step": 11929, "epoch": 284} {"train_loss": -5.064202308654785, "global_step": 11930, "epoch": 284} {"train_loss": -5.197976112365723, "global_step": 11931, "epoch": 284} {"train_loss": -5.099178314208984, "global_step": 11932, "epoch": 284} {"train_loss": -5.066938877105713, "global_step": 11933, "epoch": 284} {"train_loss": -5.103716850280762, "global_step": 11934, "epoch": 284} {"train_loss": -4.991729736328125, "global_step": 11935, "epoch": 284} {"train_loss": -5.166021823883057, "global_step": 11936, "epoch": 284} {"train_loss": -5.093274116516113, "global_step": 11937, "epoch": 284} {"train_loss": -5.197324752807617, "global_step": 11938, "epoch": 284} {"train_loss": -5.1689629554748535, "global_step": 11939, "epoch": 284} {"train_loss": -5.104334831237793, "global_step": 11940, "epoch": 284} {"train_loss": -5.319296836853027, "global_step": 11941, "epoch": 284} {"train_loss": -5.122196674346924, "global_step": 11942, "epoch": 284} {"train_loss": -5.141150951385498, "global_step": 11943, "epoch": 284} {"train_loss": -5.114529132843018, "global_step": 11944, "epoch": 284} {"train_loss": -5.103737831115723, "global_step": 11945, "epoch": 284} {"train_loss": -5.166126251220703, "global_step": 11946, "epoch": 284} {"train_loss": -5.095777988433838, "global_step": 11947, "epoch": 284} {"train_loss": -5.160233497619629, "global_step": 11948, "epoch": 284} {"train_loss": -5.187482833862305, "global_step": 11949, "epoch": 284} {"train_loss": -5.037167072296143, "global_step": 11950, "epoch": 284} {"train_loss": -5.042901992797852, "global_step": 11951, "epoch": 284} {"train_loss": -5.012799263000488, "global_step": 11952, "epoch": 284} {"train_loss": -4.971625328063965, "global_step": 11953, "epoch": 284} {"train_loss": -4.934035301208496, "global_step": 11954, "epoch": 284} {"train_loss": -5.175254821777344, "global_step": 11955, "epoch": 284} {"train_loss": -4.990435600280762, "global_step": 11956, "epoch": 284} {"train_loss": -4.840802192687988, "global_step": 11957, "epoch": 284} {"train_loss": -5.103847026824951, "global_step": 11958, "epoch": 284} {"train_loss": -5.10715913772583, "global_step": 11959, "epoch": 284} {"train_loss": -4.939274787902832, "global_step": 11960, "epoch": 284} {"train_loss": -5.0934834480285645, "global_step": 11961, "epoch": 284} {"train_loss": -5.244933128356934, "global_step": 11962, "epoch": 284} {"train_loss": -5.136425018310547, "global_step": 11963, "epoch": 284} {"train_loss": -5.006109714508057, "global_step": 11964, "epoch": 284} {"train_loss": -5.105518341064453, "global_step": 11965, "epoch": 284} {"train_loss": -5.027588844299316, "global_step": 11966, "epoch": 284} {"train_loss": -5.184882640838623, "global_step": 11967, "epoch": 284} {"train_loss": -5.214095115661621, "global_step": 11968, "epoch": 284} {"train_loss": -5.101189136505127, "global_step": 11969, "epoch": 284, "val_loss": 70717.59375} {"train_loss": -5.0958170890808105, "global_step": 11970, "epoch": 285} {"train_loss": -5.071761131286621, "global_step": 11971, "epoch": 285} {"train_loss": -5.107179164886475, "global_step": 11972, "epoch": 285} {"train_loss": -5.099123477935791, "global_step": 11973, "epoch": 285} {"train_loss": -5.193501949310303, "global_step": 11974, "epoch": 285} {"train_loss": -5.118574142456055, "global_step": 11975, "epoch": 285} {"train_loss": -5.036983489990234, "global_step": 11976, "epoch": 285} {"train_loss": -5.1793951988220215, "global_step": 11977, "epoch": 285} {"train_loss": -5.156712055206299, "global_step": 11978, "epoch": 285} {"train_loss": -5.095452308654785, "global_step": 11979, "epoch": 285} {"train_loss": -4.9183244705200195, "global_step": 11980, "epoch": 285} {"train_loss": -5.090623378753662, "global_step": 11981, "epoch": 285} {"train_loss": -5.145242691040039, "global_step": 11982, "epoch": 285} {"train_loss": -5.003411769866943, "global_step": 11983, "epoch": 285} {"train_loss": -5.035514831542969, "global_step": 11984, "epoch": 285} {"train_loss": -5.111511707305908, "global_step": 11985, "epoch": 285} {"train_loss": -4.85933780670166, "global_step": 11986, "epoch": 285} {"train_loss": -5.2179436683654785, "global_step": 11987, "epoch": 285} {"train_loss": -4.991950035095215, "global_step": 11988, "epoch": 285} {"train_loss": -5.013586521148682, "global_step": 11989, "epoch": 285} {"train_loss": -5.036462306976318, "global_step": 11990, "epoch": 285} {"train_loss": -5.046538352966309, "global_step": 11991, "epoch": 285} {"train_loss": -5.071380615234375, "global_step": 11992, "epoch": 285} {"train_loss": -5.116847038269043, "global_step": 11993, "epoch": 285} {"train_loss": -5.17820930480957, "global_step": 11994, "epoch": 285} {"train_loss": -5.11195182800293, "global_step": 11995, "epoch": 285} {"train_loss": -5.046407699584961, "global_step": 11996, "epoch": 285} {"train_loss": -5.1051716804504395, "global_step": 11997, "epoch": 285} {"train_loss": -5.023922920227051, "global_step": 11998, "epoch": 285} {"train_loss": -5.254450798034668, "global_step": 11999, "epoch": 285} {"train_loss": -5.161405563354492, "global_step": 12000, "epoch": 285} {"train_loss": -4.898360252380371, "global_step": 12001, "epoch": 285} {"train_loss": -5.138130187988281, "global_step": 12002, "epoch": 285} {"train_loss": -5.013703346252441, "global_step": 12003, "epoch": 285} {"train_loss": -5.24185848236084, "global_step": 12004, "epoch": 285} {"train_loss": -5.038349628448486, "global_step": 12005, "epoch": 285} {"train_loss": -5.1194987297058105, "global_step": 12006, "epoch": 285} {"train_loss": -5.049984931945801, "global_step": 12007, "epoch": 285} {"train_loss": -5.1436357498168945, "global_step": 12008, "epoch": 285} {"train_loss": -5.170901298522949, "global_step": 12009, "epoch": 285} {"train_loss": -5.14414119720459, "global_step": 12010, "epoch": 285} {"train_loss": -5.092877739951724, "global_step": 12011, "epoch": 285, "val_loss": 71413.7109375} {"train_loss": -4.936614513397217, "global_step": 12012, "epoch": 286} {"train_loss": -5.124246597290039, "global_step": 12013, "epoch": 286} {"train_loss": -5.111846923828125, "global_step": 12014, "epoch": 286} {"train_loss": -5.211940765380859, "global_step": 12015, "epoch": 286} {"train_loss": -5.083536624908447, "global_step": 12016, "epoch": 286} {"train_loss": -5.024498462677002, "global_step": 12017, "epoch": 286} {"train_loss": -5.159341812133789, "global_step": 12018, "epoch": 286} {"train_loss": -5.22953987121582, "global_step": 12019, "epoch": 286} {"train_loss": -5.085527420043945, "global_step": 12020, "epoch": 286} {"train_loss": -5.076667785644531, "global_step": 12021, "epoch": 286} {"train_loss": -5.23538875579834, "global_step": 12022, "epoch": 286} {"train_loss": -5.217266082763672, "global_step": 12023, "epoch": 286} {"train_loss": -5.152703285217285, "global_step": 12024, "epoch": 286} {"train_loss": -5.138988494873047, "global_step": 12025, "epoch": 286} {"train_loss": -5.080256938934326, "global_step": 12026, "epoch": 286} {"train_loss": -5.1054253578186035, "global_step": 12027, "epoch": 286} {"train_loss": -5.226911544799805, "global_step": 12028, "epoch": 286} {"train_loss": -5.09013557434082, "global_step": 12029, "epoch": 286} {"train_loss": -5.071345329284668, "global_step": 12030, "epoch": 286} {"train_loss": -5.143054485321045, "global_step": 12031, "epoch": 286} {"train_loss": -5.07850456237793, "global_step": 12032, "epoch": 286} {"train_loss": -5.166876792907715, "global_step": 12033, "epoch": 286} {"train_loss": -5.07609748840332, "global_step": 12034, "epoch": 286} {"train_loss": -4.985638618469238, "global_step": 12035, "epoch": 286} {"train_loss": -5.160127639770508, "global_step": 12036, "epoch": 286} {"train_loss": -5.145727157592773, "global_step": 12037, "epoch": 286} {"train_loss": -5.053099632263184, "global_step": 12038, "epoch": 286} {"train_loss": -5.095647811889648, "global_step": 12039, "epoch": 286} {"train_loss": -5.165071487426758, "global_step": 12040, "epoch": 286} {"train_loss": -4.962542533874512, "global_step": 12041, "epoch": 286} {"train_loss": -5.0552978515625, "global_step": 12042, "epoch": 286} {"train_loss": -5.068758964538574, "global_step": 12043, "epoch": 286} {"train_loss": -5.082606315612793, "global_step": 12044, "epoch": 286} {"train_loss": -5.038506031036377, "global_step": 12045, "epoch": 286} {"train_loss": -5.039279460906982, "global_step": 12046, "epoch": 286} {"train_loss": -5.02054500579834, "global_step": 12047, "epoch": 286} {"train_loss": -5.093685150146484, "global_step": 12048, "epoch": 286} {"train_loss": -5.150642395019531, "global_step": 12049, "epoch": 286} {"train_loss": -5.082897186279297, "global_step": 12050, "epoch": 286} {"train_loss": -5.085264205932617, "global_step": 12051, "epoch": 286} {"train_loss": -4.998624801635742, "global_step": 12052, "epoch": 286} {"train_loss": -5.100918849309285, "global_step": 12053, "epoch": 286, "val_loss": 71438.4375} {"train_loss": -5.16569709777832, "global_step": 12054, "epoch": 287} {"train_loss": -5.09531831741333, "global_step": 12055, "epoch": 287} {"train_loss": -5.166288375854492, "global_step": 12056, "epoch": 287} {"train_loss": -5.145951747894287, "global_step": 12057, "epoch": 287} {"train_loss": -5.0929155349731445, "global_step": 12058, "epoch": 287} {"train_loss": -5.157806873321533, "global_step": 12059, "epoch": 287} {"train_loss": -5.143731117248535, "global_step": 12060, "epoch": 287} {"train_loss": -5.200812339782715, "global_step": 12061, "epoch": 287} {"train_loss": -5.016474723815918, "global_step": 12062, "epoch": 287} {"train_loss": -5.0619001388549805, "global_step": 12063, "epoch": 287} {"train_loss": -5.150437355041504, "global_step": 12064, "epoch": 287} {"train_loss": -5.129497528076172, "global_step": 12065, "epoch": 287} {"train_loss": -5.142935752868652, "global_step": 12066, "epoch": 287} {"train_loss": -5.025483131408691, "global_step": 12067, "epoch": 287} {"train_loss": -5.1092400550842285, "global_step": 12068, "epoch": 287} {"train_loss": -5.082662582397461, "global_step": 12069, "epoch": 287} {"train_loss": -5.15826940536499, "global_step": 12070, "epoch": 287} {"train_loss": -5.195219039916992, "global_step": 12071, "epoch": 287} {"train_loss": -5.118734359741211, "global_step": 12072, "epoch": 287} {"train_loss": -5.050336837768555, "global_step": 12073, "epoch": 287} {"train_loss": -5.1901421546936035, "global_step": 12074, "epoch": 287} {"train_loss": -5.00301456451416, "global_step": 12075, "epoch": 287} {"train_loss": -5.0055694580078125, "global_step": 12076, "epoch": 287} {"train_loss": -5.164851188659668, "global_step": 12077, "epoch": 287} {"train_loss": -5.042488098144531, "global_step": 12078, "epoch": 287} {"train_loss": -5.107728481292725, "global_step": 12079, "epoch": 287} {"train_loss": -5.006939888000488, "global_step": 12080, "epoch": 287} {"train_loss": -5.1183929443359375, "global_step": 12081, "epoch": 287} {"train_loss": -5.165173530578613, "global_step": 12082, "epoch": 287} {"train_loss": -5.11076021194458, "global_step": 12083, "epoch": 287} {"train_loss": -5.103959083557129, "global_step": 12084, "epoch": 287} {"train_loss": -5.015974998474121, "global_step": 12085, "epoch": 287} {"train_loss": -5.2353010177612305, "global_step": 12086, "epoch": 287} {"train_loss": -5.173572063446045, "global_step": 12087, "epoch": 287} {"train_loss": -5.078680992126465, "global_step": 12088, "epoch": 287} {"train_loss": -5.2140960693359375, "global_step": 12089, "epoch": 287} {"train_loss": -5.208197593688965, "global_step": 12090, "epoch": 287} {"train_loss": -5.059027194976807, "global_step": 12091, "epoch": 287} {"train_loss": -5.083644390106201, "global_step": 12092, "epoch": 287} {"train_loss": -5.011854648590088, "global_step": 12093, "epoch": 287} {"train_loss": -5.202683448791504, "global_step": 12094, "epoch": 287} {"train_loss": -5.115613165355864, "global_step": 12095, "epoch": 287, "val_loss": 71024.6796875} {"train_loss": -5.015539646148682, "global_step": 12096, "epoch": 288} {"train_loss": -5.07797908782959, "global_step": 12097, "epoch": 288} {"train_loss": -5.0053911209106445, "global_step": 12098, "epoch": 288} {"train_loss": -5.059499263763428, "global_step": 12099, "epoch": 288} {"train_loss": -5.1400556564331055, "global_step": 12100, "epoch": 288} {"train_loss": -5.03523588180542, "global_step": 12101, "epoch": 288} {"train_loss": -4.968982696533203, "global_step": 12102, "epoch": 288} {"train_loss": -5.12071418762207, "global_step": 12103, "epoch": 288} {"train_loss": -5.1220197677612305, "global_step": 12104, "epoch": 288} {"train_loss": -5.281399250030518, "global_step": 12105, "epoch": 288} {"train_loss": -5.186059951782227, "global_step": 12106, "epoch": 288} {"train_loss": -5.144195556640625, "global_step": 12107, "epoch": 288} {"train_loss": -5.286886692047119, "global_step": 12108, "epoch": 288} {"train_loss": -5.076745986938477, "global_step": 12109, "epoch": 288} {"train_loss": -5.230252265930176, "global_step": 12110, "epoch": 288} {"train_loss": -5.115530967712402, "global_step": 12111, "epoch": 288} {"train_loss": -5.110786437988281, "global_step": 12112, "epoch": 288} {"train_loss": -5.1122636795043945, "global_step": 12113, "epoch": 288} {"train_loss": -5.106072425842285, "global_step": 12114, "epoch": 288} {"train_loss": -5.114414691925049, "global_step": 12115, "epoch": 288} {"train_loss": -5.293097496032715, "global_step": 12116, "epoch": 288} {"train_loss": -5.083393573760986, "global_step": 12117, "epoch": 288} {"train_loss": -4.952310562133789, "global_step": 12118, "epoch": 288} {"train_loss": -5.0556745529174805, "global_step": 12119, "epoch": 288} {"train_loss": -5.16180419921875, "global_step": 12120, "epoch": 288} {"train_loss": -5.208551406860352, "global_step": 12121, "epoch": 288} {"train_loss": -4.999371528625488, "global_step": 12122, "epoch": 288} {"train_loss": -5.110895156860352, "global_step": 12123, "epoch": 288} {"train_loss": -5.1020660400390625, "global_step": 12124, "epoch": 288} {"train_loss": -5.081110000610352, "global_step": 12125, "epoch": 288} {"train_loss": -5.014006614685059, "global_step": 12126, "epoch": 288} {"train_loss": -5.215635299682617, "global_step": 12127, "epoch": 288} {"train_loss": -5.13075590133667, "global_step": 12128, "epoch": 288} {"train_loss": -4.989808082580566, "global_step": 12129, "epoch": 288} {"train_loss": -4.991161346435547, "global_step": 12130, "epoch": 288} {"train_loss": -5.070548057556152, "global_step": 12131, "epoch": 288} {"train_loss": -5.056109428405762, "global_step": 12132, "epoch": 288} {"train_loss": -5.124837398529053, "global_step": 12133, "epoch": 288} {"train_loss": -5.04047966003418, "global_step": 12134, "epoch": 288} {"train_loss": -5.089991569519043, "global_step": 12135, "epoch": 288} {"train_loss": -5.125014781951904, "global_step": 12136, "epoch": 288} {"train_loss": -5.103596210479736, "global_step": 12137, "epoch": 288, "val_loss": 70469.5625} {"train_loss": -5.127925872802734, "global_step": 12138, "epoch": 289} {"train_loss": -5.082473278045654, "global_step": 12139, "epoch": 289} {"train_loss": -5.302099227905273, "global_step": 12140, "epoch": 289} {"train_loss": -4.999691009521484, "global_step": 12141, "epoch": 289} {"train_loss": -5.223703384399414, "global_step": 12142, "epoch": 289} {"train_loss": -5.182286739349365, "global_step": 12143, "epoch": 289} {"train_loss": -5.135316371917725, "global_step": 12144, "epoch": 289} {"train_loss": -5.163827419281006, "global_step": 12145, "epoch": 289} {"train_loss": -5.077085494995117, "global_step": 12146, "epoch": 289} {"train_loss": -5.0982842445373535, "global_step": 12147, "epoch": 289} {"train_loss": -5.082093238830566, "global_step": 12148, "epoch": 289} {"train_loss": -5.148879051208496, "global_step": 12149, "epoch": 289} {"train_loss": -5.118044853210449, "global_step": 12150, "epoch": 289} {"train_loss": -5.159907341003418, "global_step": 12151, "epoch": 289} {"train_loss": -5.1453351974487305, "global_step": 12152, "epoch": 289} {"train_loss": -5.171228408813477, "global_step": 12153, "epoch": 289} {"train_loss": -5.038909435272217, "global_step": 12154, "epoch": 289} {"train_loss": -5.090506553649902, "global_step": 12155, "epoch": 289} {"train_loss": -5.1387529373168945, "global_step": 12156, "epoch": 289} {"train_loss": -5.140976905822754, "global_step": 12157, "epoch": 289} {"train_loss": -5.021125793457031, "global_step": 12158, "epoch": 289} {"train_loss": -5.048608779907227, "global_step": 12159, "epoch": 289} {"train_loss": -5.198427200317383, "global_step": 12160, "epoch": 289} {"train_loss": -5.198253631591797, "global_step": 12161, "epoch": 289} {"train_loss": -5.063277721405029, "global_step": 12162, "epoch": 289} {"train_loss": -4.986662864685059, "global_step": 12163, "epoch": 289} {"train_loss": -5.187260627746582, "global_step": 12164, "epoch": 289} {"train_loss": -5.0632710456848145, "global_step": 12165, "epoch": 289} {"train_loss": -4.961152076721191, "global_step": 12166, "epoch": 289} {"train_loss": -4.896770477294922, "global_step": 12167, "epoch": 289} {"train_loss": -5.065039157867432, "global_step": 12168, "epoch": 289} {"train_loss": -4.982221603393555, "global_step": 12169, "epoch": 289} {"train_loss": -4.942666053771973, "global_step": 12170, "epoch": 289} {"train_loss": -5.071540832519531, "global_step": 12171, "epoch": 289} {"train_loss": -4.9633283615112305, "global_step": 12172, "epoch": 289} {"train_loss": -5.068743705749512, "global_step": 12173, "epoch": 289} {"train_loss": -5.177709102630615, "global_step": 12174, "epoch": 289} {"train_loss": -5.074532985687256, "global_step": 12175, "epoch": 289} {"train_loss": -5.199904441833496, "global_step": 12176, "epoch": 289} {"train_loss": -4.898177146911621, "global_step": 12177, "epoch": 289} {"train_loss": -4.97991943359375, "global_step": 12178, "epoch": 289} {"train_loss": -5.091712713241577, "global_step": 12179, "epoch": 289, "val_loss": 71750.9453125} {"train_loss": -4.820294380187988, "global_step": 12180, "epoch": 290} {"train_loss": -5.022773742675781, "global_step": 12181, "epoch": 290} {"train_loss": -5.050196647644043, "global_step": 12182, "epoch": 290} {"train_loss": -5.041606903076172, "global_step": 12183, "epoch": 290} {"train_loss": -4.819184303283691, "global_step": 12184, "epoch": 290} {"train_loss": -5.088603496551514, "global_step": 12185, "epoch": 290} {"train_loss": -4.913382053375244, "global_step": 12186, "epoch": 290} {"train_loss": -5.1635894775390625, "global_step": 12187, "epoch": 290} {"train_loss": -5.1146135330200195, "global_step": 12188, "epoch": 290} {"train_loss": -5.096036434173584, "global_step": 12189, "epoch": 290} {"train_loss": -5.2024335861206055, "global_step": 12190, "epoch": 290} {"train_loss": -4.987400531768799, "global_step": 12191, "epoch": 290} {"train_loss": -5.122414588928223, "global_step": 12192, "epoch": 290} {"train_loss": -5.099954605102539, "global_step": 12193, "epoch": 290} {"train_loss": -5.113834381103516, "global_step": 12194, "epoch": 290} {"train_loss": -5.007547378540039, "global_step": 12195, "epoch": 290} {"train_loss": -5.128819465637207, "global_step": 12196, "epoch": 290} {"train_loss": -5.036734580993652, "global_step": 12197, "epoch": 290} {"train_loss": -5.065720081329346, "global_step": 12198, "epoch": 290} {"train_loss": -5.202859878540039, "global_step": 12199, "epoch": 290} {"train_loss": -5.027626991271973, "global_step": 12200, "epoch": 290} {"train_loss": -5.0472822189331055, "global_step": 12201, "epoch": 290} {"train_loss": -5.118303298950195, "global_step": 12202, "epoch": 290} {"train_loss": -4.968677520751953, "global_step": 12203, "epoch": 290} {"train_loss": -5.022568702697754, "global_step": 12204, "epoch": 290} {"train_loss": -5.109529495239258, "global_step": 12205, "epoch": 290} {"train_loss": -5.252805709838867, "global_step": 12206, "epoch": 290} {"train_loss": -5.229907035827637, "global_step": 12207, "epoch": 290} {"train_loss": -5.140182018280029, "global_step": 12208, "epoch": 290} {"train_loss": -5.29386568069458, "global_step": 12209, "epoch": 290} {"train_loss": -5.168167591094971, "global_step": 12210, "epoch": 290} {"train_loss": -5.203387260437012, "global_step": 12211, "epoch": 290} {"train_loss": -5.074686050415039, "global_step": 12212, "epoch": 290} {"train_loss": -5.175846099853516, "global_step": 12213, "epoch": 290} {"train_loss": -5.106840133666992, "global_step": 12214, "epoch": 290} {"train_loss": -5.133994102478027, "global_step": 12215, "epoch": 290} {"train_loss": -5.123434543609619, "global_step": 12216, "epoch": 290} {"train_loss": -5.007816314697266, "global_step": 12217, "epoch": 290} {"train_loss": -5.151760101318359, "global_step": 12218, "epoch": 290} {"train_loss": -5.116795063018799, "global_step": 12219, "epoch": 290} {"train_loss": -5.147426605224609, "global_step": 12220, "epoch": 290} {"train_loss": -5.093639214833577, "global_step": 12221, "epoch": 290, "val_loss": 70638.1640625} {"train_loss": -5.106926441192627, "global_step": 12222, "epoch": 291} {"train_loss": -5.095630168914795, "global_step": 12223, "epoch": 291} {"train_loss": -5.2484846115112305, "global_step": 12224, "epoch": 291} {"train_loss": -5.018467426300049, "global_step": 12225, "epoch": 291} {"train_loss": -5.217877388000488, "global_step": 12226, "epoch": 291} {"train_loss": -5.090009689331055, "global_step": 12227, "epoch": 291} {"train_loss": -5.012688159942627, "global_step": 12228, "epoch": 291} {"train_loss": -5.286249160766602, "global_step": 12229, "epoch": 291} {"train_loss": -5.053787708282471, "global_step": 12230, "epoch": 291} {"train_loss": -5.130054473876953, "global_step": 12231, "epoch": 291} {"train_loss": -5.167435646057129, "global_step": 12232, "epoch": 291} {"train_loss": -5.114889144897461, "global_step": 12233, "epoch": 291} {"train_loss": -5.084847450256348, "global_step": 12234, "epoch": 291} {"train_loss": -5.194303512573242, "global_step": 12235, "epoch": 291} {"train_loss": -5.03215217590332, "global_step": 12236, "epoch": 291} {"train_loss": -5.085173606872559, "global_step": 12237, "epoch": 291} {"train_loss": -5.1623992919921875, "global_step": 12238, "epoch": 291} {"train_loss": -5.093015670776367, "global_step": 12239, "epoch": 291} {"train_loss": -5.090597152709961, "global_step": 12240, "epoch": 291} {"train_loss": -5.116426467895508, "global_step": 12241, "epoch": 291} {"train_loss": -5.091773986816406, "global_step": 12242, "epoch": 291} {"train_loss": -5.0797882080078125, "global_step": 12243, "epoch": 291} {"train_loss": -5.104500770568848, "global_step": 12244, "epoch": 291} {"train_loss": -5.220897197723389, "global_step": 12245, "epoch": 291} {"train_loss": -5.191013336181641, "global_step": 12246, "epoch": 291} {"train_loss": -5.178502082824707, "global_step": 12247, "epoch": 291} {"train_loss": -5.113541603088379, "global_step": 12248, "epoch": 291} {"train_loss": -5.213668346405029, "global_step": 12249, "epoch": 291} {"train_loss": -4.991643905639648, "global_step": 12250, "epoch": 291} {"train_loss": -5.089387893676758, "global_step": 12251, "epoch": 291} {"train_loss": -5.243466377258301, "global_step": 12252, "epoch": 291} {"train_loss": -5.119604110717773, "global_step": 12253, "epoch": 291} {"train_loss": -5.166929244995117, "global_step": 12254, "epoch": 291} {"train_loss": -5.1287336349487305, "global_step": 12255, "epoch": 291} {"train_loss": -5.147724151611328, "global_step": 12256, "epoch": 291} {"train_loss": -5.096290588378906, "global_step": 12257, "epoch": 291} {"train_loss": -5.203412055969238, "global_step": 12258, "epoch": 291} {"train_loss": -5.0692243576049805, "global_step": 12259, "epoch": 291} {"train_loss": -5.166796684265137, "global_step": 12260, "epoch": 291} {"train_loss": -5.059291839599609, "global_step": 12261, "epoch": 291} {"train_loss": -5.228740692138672, "global_step": 12262, "epoch": 291} {"train_loss": -5.132191623960223, "global_step": 12263, "epoch": 291, "val_loss": 70991.0234375} {"train_loss": -5.0652618408203125, "global_step": 12264, "epoch": 292} {"train_loss": -5.117039203643799, "global_step": 12265, "epoch": 292} {"train_loss": -5.188879013061523, "global_step": 12266, "epoch": 292} {"train_loss": -5.018415451049805, "global_step": 12267, "epoch": 292} {"train_loss": -5.0883469581604, "global_step": 12268, "epoch": 292} {"train_loss": -5.151291847229004, "global_step": 12269, "epoch": 292} {"train_loss": -5.170618057250977, "global_step": 12270, "epoch": 292} {"train_loss": -5.248022556304932, "global_step": 12271, "epoch": 292} {"train_loss": -5.102888107299805, "global_step": 12272, "epoch": 292} {"train_loss": -5.166658401489258, "global_step": 12273, "epoch": 292} {"train_loss": -5.152997016906738, "global_step": 12274, "epoch": 292} {"train_loss": -5.1072611808776855, "global_step": 12275, "epoch": 292} {"train_loss": -5.120023250579834, "global_step": 12276, "epoch": 292} {"train_loss": -4.985345363616943, "global_step": 12277, "epoch": 292} {"train_loss": -5.0481791496276855, "global_step": 12278, "epoch": 292} {"train_loss": -5.024469375610352, "global_step": 12279, "epoch": 292} {"train_loss": -5.113407135009766, "global_step": 12280, "epoch": 292} {"train_loss": -4.994813919067383, "global_step": 12281, "epoch": 292} {"train_loss": -5.038819313049316, "global_step": 12282, "epoch": 292} {"train_loss": -5.138516426086426, "global_step": 12283, "epoch": 292} {"train_loss": -4.882734298706055, "global_step": 12284, "epoch": 292} {"train_loss": -5.158123016357422, "global_step": 12285, "epoch": 292} {"train_loss": -5.017097473144531, "global_step": 12286, "epoch": 292} {"train_loss": -4.761463642120361, "global_step": 12287, "epoch": 292} {"train_loss": -5.182348251342773, "global_step": 12288, "epoch": 292} {"train_loss": -5.038049221038818, "global_step": 12289, "epoch": 292} {"train_loss": -4.782792091369629, "global_step": 12290, "epoch": 292} {"train_loss": -5.106429100036621, "global_step": 12291, "epoch": 292} {"train_loss": -4.796130180358887, "global_step": 12292, "epoch": 292} {"train_loss": -4.8471150398254395, "global_step": 12293, "epoch": 292} {"train_loss": -5.0783915519714355, "global_step": 12294, "epoch": 292} {"train_loss": -4.646156311035156, "global_step": 12295, "epoch": 292} {"train_loss": -5.151745796203613, "global_step": 12296, "epoch": 292} {"train_loss": -4.679654121398926, "global_step": 12297, "epoch": 292} {"train_loss": -5.165138244628906, "global_step": 12298, "epoch": 292} {"train_loss": -4.8621673583984375, "global_step": 12299, "epoch": 292} {"train_loss": -5.0217814445495605, "global_step": 12300, "epoch": 292} {"train_loss": -4.900010108947754, "global_step": 12301, "epoch": 292} {"train_loss": -4.926181316375732, "global_step": 12302, "epoch": 292} {"train_loss": -4.8672895431518555, "global_step": 12303, "epoch": 292} {"train_loss": -5.145503997802734, "global_step": 12304, "epoch": 292} {"train_loss": -5.022850956235613, "global_step": 12305, "epoch": 292, "val_loss": 69997.78125} {"train_loss": -5.005739688873291, "global_step": 12306, "epoch": 293} {"train_loss": -4.989406108856201, "global_step": 12307, "epoch": 293} {"train_loss": -5.052742004394531, "global_step": 12308, "epoch": 293} {"train_loss": -4.909978866577148, "global_step": 12309, "epoch": 293} {"train_loss": -5.049041748046875, "global_step": 12310, "epoch": 293} {"train_loss": -5.086598873138428, "global_step": 12311, "epoch": 293} {"train_loss": -5.109095573425293, "global_step": 12312, "epoch": 293} {"train_loss": -5.082056999206543, "global_step": 12313, "epoch": 293} {"train_loss": -5.050888538360596, "global_step": 12314, "epoch": 293} {"train_loss": -5.1529693603515625, "global_step": 12315, "epoch": 293} {"train_loss": -5.170663833618164, "global_step": 12316, "epoch": 293} {"train_loss": -5.150051116943359, "global_step": 12317, "epoch": 293} {"train_loss": -5.115985870361328, "global_step": 12318, "epoch": 293} {"train_loss": -5.084575653076172, "global_step": 12319, "epoch": 293} {"train_loss": -5.021164894104004, "global_step": 12320, "epoch": 293} {"train_loss": -5.144634246826172, "global_step": 12321, "epoch": 293} {"train_loss": -5.0728302001953125, "global_step": 12322, "epoch": 293} {"train_loss": -4.9961934089660645, "global_step": 12323, "epoch": 293} {"train_loss": -5.211974620819092, "global_step": 12324, "epoch": 293} {"train_loss": -5.193332672119141, "global_step": 12325, "epoch": 293} {"train_loss": -4.957083702087402, "global_step": 12326, "epoch": 293} {"train_loss": -5.151662826538086, "global_step": 12327, "epoch": 293} {"train_loss": -5.0995283126831055, "global_step": 12328, "epoch": 293} {"train_loss": -5.173013687133789, "global_step": 12329, "epoch": 293} {"train_loss": -5.172715187072754, "global_step": 12330, "epoch": 293} {"train_loss": -5.070019245147705, "global_step": 12331, "epoch": 293} {"train_loss": -5.156930446624756, "global_step": 12332, "epoch": 293} {"train_loss": -5.280718803405762, "global_step": 12333, "epoch": 293} {"train_loss": -5.032878875732422, "global_step": 12334, "epoch": 293} {"train_loss": -5.0695414543151855, "global_step": 12335, "epoch": 293} {"train_loss": -5.125141143798828, "global_step": 12336, "epoch": 293} {"train_loss": -5.206105709075928, "global_step": 12337, "epoch": 293} {"train_loss": -5.18414306640625, "global_step": 12338, "epoch": 293} {"train_loss": -5.21507453918457, "global_step": 12339, "epoch": 293} {"train_loss": -5.180019378662109, "global_step": 12340, "epoch": 293} {"train_loss": -5.162196636199951, "global_step": 12341, "epoch": 293} {"train_loss": -5.211983680725098, "global_step": 12342, "epoch": 293} {"train_loss": -5.176711082458496, "global_step": 12343, "epoch": 293} {"train_loss": -5.243800640106201, "global_step": 12344, "epoch": 293} {"train_loss": -5.144855499267578, "global_step": 12345, "epoch": 293} {"train_loss": -5.1398468017578125, "global_step": 12346, "epoch": 293} {"train_loss": -5.118659008116949, "global_step": 12347, "epoch": 293, "val_loss": 70558.296875} {"train_loss": -5.245891571044922, "global_step": 12348, "epoch": 294} {"train_loss": -5.287534713745117, "global_step": 12349, "epoch": 294} {"train_loss": -5.158600807189941, "global_step": 12350, "epoch": 294} {"train_loss": -5.2053422927856445, "global_step": 12351, "epoch": 294} {"train_loss": -5.145303726196289, "global_step": 12352, "epoch": 294} {"train_loss": -4.864770889282227, "global_step": 12353, "epoch": 294} {"train_loss": -5.179686069488525, "global_step": 12354, "epoch": 294} {"train_loss": -5.076807975769043, "global_step": 12355, "epoch": 294} {"train_loss": -4.703672409057617, "global_step": 12356, "epoch": 294} {"train_loss": -5.100351333618164, "global_step": 12357, "epoch": 294} {"train_loss": -5.031836032867432, "global_step": 12358, "epoch": 294} {"train_loss": -4.839107513427734, "global_step": 12359, "epoch": 294} {"train_loss": -5.048141002655029, "global_step": 12360, "epoch": 294} {"train_loss": -5.013152122497559, "global_step": 12361, "epoch": 294} {"train_loss": -4.953166484832764, "global_step": 12362, "epoch": 294} {"train_loss": -5.112622261047363, "global_step": 12363, "epoch": 294} {"train_loss": -5.136415004730225, "global_step": 12364, "epoch": 294} {"train_loss": -5.001013278961182, "global_step": 12365, "epoch": 294} {"train_loss": -5.205540180206299, "global_step": 12366, "epoch": 294} {"train_loss": -5.039466857910156, "global_step": 12367, "epoch": 294} {"train_loss": -4.99615478515625, "global_step": 12368, "epoch": 294} {"train_loss": -5.202588081359863, "global_step": 12369, "epoch": 294} {"train_loss": -5.104154586791992, "global_step": 12370, "epoch": 294} {"train_loss": -5.031100749969482, "global_step": 12371, "epoch": 294} {"train_loss": -5.301584243774414, "global_step": 12372, "epoch": 294} {"train_loss": -4.988439559936523, "global_step": 12373, "epoch": 294} {"train_loss": -5.125331401824951, "global_step": 12374, "epoch": 294} {"train_loss": -5.101380348205566, "global_step": 12375, "epoch": 294} {"train_loss": -5.151635646820068, "global_step": 12376, "epoch": 294} {"train_loss": -5.098142623901367, "global_step": 12377, "epoch": 294} {"train_loss": -5.167942047119141, "global_step": 12378, "epoch": 294} {"train_loss": -5.130283355712891, "global_step": 12379, "epoch": 294} {"train_loss": -5.137024402618408, "global_step": 12380, "epoch": 294} {"train_loss": -5.311573028564453, "global_step": 12381, "epoch": 294} {"train_loss": -5.20396614074707, "global_step": 12382, "epoch": 294} {"train_loss": -5.093197345733643, "global_step": 12383, "epoch": 294} {"train_loss": -5.1045026779174805, "global_step": 12384, "epoch": 294} {"train_loss": -5.146328926086426, "global_step": 12385, "epoch": 294} {"train_loss": -5.069348335266113, "global_step": 12386, "epoch": 294} {"train_loss": -5.21207332611084, "global_step": 12387, "epoch": 294} {"train_loss": -5.042179107666016, "global_step": 12388, "epoch": 294} {"train_loss": -5.097882986068726, "global_step": 12389, "epoch": 294, "val_loss": 70591.828125} {"train_loss": -5.109244346618652, "global_step": 12390, "epoch": 295} {"train_loss": -5.206156253814697, "global_step": 12391, "epoch": 295} {"train_loss": -5.086238861083984, "global_step": 12392, "epoch": 295} {"train_loss": -5.032477855682373, "global_step": 12393, "epoch": 295} {"train_loss": -5.074493408203125, "global_step": 12394, "epoch": 295} {"train_loss": -5.182677745819092, "global_step": 12395, "epoch": 295} {"train_loss": -5.139124870300293, "global_step": 12396, "epoch": 295} {"train_loss": -5.143655776977539, "global_step": 12397, "epoch": 295} {"train_loss": -4.932562351226807, "global_step": 12398, "epoch": 295} {"train_loss": -5.149069786071777, "global_step": 12399, "epoch": 295} {"train_loss": -4.945355415344238, "global_step": 12400, "epoch": 295} {"train_loss": -4.975016117095947, "global_step": 12401, "epoch": 295} {"train_loss": -5.096238136291504, "global_step": 12402, "epoch": 295} {"train_loss": -5.1302947998046875, "global_step": 12403, "epoch": 295} {"train_loss": -5.016922473907471, "global_step": 12404, "epoch": 295} {"train_loss": -5.139449119567871, "global_step": 12405, "epoch": 295} {"train_loss": -5.043120384216309, "global_step": 12406, "epoch": 295} {"train_loss": -4.956353187561035, "global_step": 12407, "epoch": 295} {"train_loss": -5.188371658325195, "global_step": 12408, "epoch": 295} {"train_loss": -5.163418769836426, "global_step": 12409, "epoch": 295} {"train_loss": -5.025832653045654, "global_step": 12410, "epoch": 295} {"train_loss": -5.091981410980225, "global_step": 12411, "epoch": 295} {"train_loss": -5.137847900390625, "global_step": 12412, "epoch": 295} {"train_loss": -5.235358715057373, "global_step": 12413, "epoch": 295} {"train_loss": -5.08245849609375, "global_step": 12414, "epoch": 295} {"train_loss": -5.216311454772949, "global_step": 12415, "epoch": 295} {"train_loss": -5.184006690979004, "global_step": 12416, "epoch": 295} {"train_loss": -5.144621849060059, "global_step": 12417, "epoch": 295} {"train_loss": -5.107233047485352, "global_step": 12418, "epoch": 295} {"train_loss": -5.238048553466797, "global_step": 12419, "epoch": 295} {"train_loss": -4.974637985229492, "global_step": 12420, "epoch": 295} {"train_loss": -5.033902168273926, "global_step": 12421, "epoch": 295} {"train_loss": -5.2019500732421875, "global_step": 12422, "epoch": 295} {"train_loss": -5.056755065917969, "global_step": 12423, "epoch": 295} {"train_loss": -5.075435638427734, "global_step": 12424, "epoch": 295} {"train_loss": -5.217299461364746, "global_step": 12425, "epoch": 295} {"train_loss": -5.092554092407227, "global_step": 12426, "epoch": 295} {"train_loss": -5.105138778686523, "global_step": 12427, "epoch": 295} {"train_loss": -4.994492053985596, "global_step": 12428, "epoch": 295} {"train_loss": -5.174726486206055, "global_step": 12429, "epoch": 295} {"train_loss": -5.20182991027832, "global_step": 12430, "epoch": 295} {"train_loss": -5.105554535275414, "global_step": 12431, "epoch": 295, "val_loss": 71205.6328125} {"train_loss": -4.973443031311035, "global_step": 12432, "epoch": 296} {"train_loss": -4.982000827789307, "global_step": 12433, "epoch": 296} {"train_loss": -5.1573615074157715, "global_step": 12434, "epoch": 296} {"train_loss": -5.054738998413086, "global_step": 12435, "epoch": 296} {"train_loss": -5.112454414367676, "global_step": 12436, "epoch": 296} {"train_loss": -5.014790058135986, "global_step": 12437, "epoch": 296} {"train_loss": -5.118849277496338, "global_step": 12438, "epoch": 296} {"train_loss": -5.020146369934082, "global_step": 12439, "epoch": 296} {"train_loss": -5.005422592163086, "global_step": 12440, "epoch": 296} {"train_loss": -5.116174697875977, "global_step": 12441, "epoch": 296} {"train_loss": -4.864020824432373, "global_step": 12442, "epoch": 296} {"train_loss": -5.228427886962891, "global_step": 12443, "epoch": 296} {"train_loss": -5.040844440460205, "global_step": 12444, "epoch": 296} {"train_loss": -5.030205726623535, "global_step": 12445, "epoch": 296} {"train_loss": -5.230759620666504, "global_step": 12446, "epoch": 296} {"train_loss": -5.123328685760498, "global_step": 12447, "epoch": 296} {"train_loss": -4.965912818908691, "global_step": 12448, "epoch": 296} {"train_loss": -5.189275741577148, "global_step": 12449, "epoch": 296} {"train_loss": -5.118934631347656, "global_step": 12450, "epoch": 296} {"train_loss": -5.158592700958252, "global_step": 12451, "epoch": 296} {"train_loss": -5.058064937591553, "global_step": 12452, "epoch": 296} {"train_loss": -5.0631303787231445, "global_step": 12453, "epoch": 296} {"train_loss": -5.079978942871094, "global_step": 12454, "epoch": 296} {"train_loss": -4.979518890380859, "global_step": 12455, "epoch": 296} {"train_loss": -5.180129051208496, "global_step": 12456, "epoch": 296} {"train_loss": -5.242241859436035, "global_step": 12457, "epoch": 296} {"train_loss": -5.0719146728515625, "global_step": 12458, "epoch": 296} {"train_loss": -5.19290828704834, "global_step": 12459, "epoch": 296} {"train_loss": -5.039315223693848, "global_step": 12460, "epoch": 296} {"train_loss": -5.071514129638672, "global_step": 12461, "epoch": 296} {"train_loss": -5.267033100128174, "global_step": 12462, "epoch": 296} {"train_loss": -5.031700134277344, "global_step": 12463, "epoch": 296} {"train_loss": -4.91524600982666, "global_step": 12464, "epoch": 296} {"train_loss": -5.097224235534668, "global_step": 12465, "epoch": 296} {"train_loss": -5.149722099304199, "global_step": 12466, "epoch": 296} {"train_loss": -5.164267063140869, "global_step": 12467, "epoch": 296} {"train_loss": -5.20878791809082, "global_step": 12468, "epoch": 296} {"train_loss": -5.160728931427002, "global_step": 12469, "epoch": 296} {"train_loss": -5.115069389343262, "global_step": 12470, "epoch": 296} {"train_loss": -5.187965393066406, "global_step": 12471, "epoch": 296} {"train_loss": -5.201312065124512, "global_step": 12472, "epoch": 296} {"train_loss": -5.099743230002267, "global_step": 12473, "epoch": 296, "val_loss": 70593.1875} {"train_loss": -4.964354038238525, "global_step": 12474, "epoch": 297} {"train_loss": -5.219209671020508, "global_step": 12475, "epoch": 297} {"train_loss": -5.176661014556885, "global_step": 12476, "epoch": 297} {"train_loss": -5.091047763824463, "global_step": 12477, "epoch": 297} {"train_loss": -5.037675380706787, "global_step": 12478, "epoch": 297} {"train_loss": -5.147761344909668, "global_step": 12479, "epoch": 297} {"train_loss": -5.093158721923828, "global_step": 12480, "epoch": 297} {"train_loss": -5.081271171569824, "global_step": 12481, "epoch": 297} {"train_loss": -5.1582417488098145, "global_step": 12482, "epoch": 297} {"train_loss": -5.1199750900268555, "global_step": 12483, "epoch": 297} {"train_loss": -5.180640697479248, "global_step": 12484, "epoch": 297} {"train_loss": -4.933647632598877, "global_step": 12485, "epoch": 297} {"train_loss": -5.201475143432617, "global_step": 12486, "epoch": 297} {"train_loss": -5.048020839691162, "global_step": 12487, "epoch": 297} {"train_loss": -4.908389091491699, "global_step": 12488, "epoch": 297} {"train_loss": -5.042347431182861, "global_step": 12489, "epoch": 297} {"train_loss": -5.025586128234863, "global_step": 12490, "epoch": 297} {"train_loss": -4.875443935394287, "global_step": 12491, "epoch": 297} {"train_loss": -5.076424598693848, "global_step": 12492, "epoch": 297} {"train_loss": -5.024114608764648, "global_step": 12493, "epoch": 297} {"train_loss": -4.943391799926758, "global_step": 12494, "epoch": 297} {"train_loss": -5.184713363647461, "global_step": 12495, "epoch": 297} {"train_loss": -5.001503944396973, "global_step": 12496, "epoch": 297} {"train_loss": -5.09586238861084, "global_step": 12497, "epoch": 297} {"train_loss": -5.096341133117676, "global_step": 12498, "epoch": 297} {"train_loss": -4.966504096984863, "global_step": 12499, "epoch": 297} {"train_loss": -5.278450965881348, "global_step": 12500, "epoch": 297} {"train_loss": -5.089807033538818, "global_step": 12501, "epoch": 297} {"train_loss": -5.124433517456055, "global_step": 12502, "epoch": 297} {"train_loss": -4.993589401245117, "global_step": 12503, "epoch": 297} {"train_loss": -5.149386405944824, "global_step": 12504, "epoch": 297} {"train_loss": -5.143979072570801, "global_step": 12505, "epoch": 297} {"train_loss": -5.149870872497559, "global_step": 12506, "epoch": 297} {"train_loss": -5.108893394470215, "global_step": 12507, "epoch": 297} {"train_loss": -5.156647682189941, "global_step": 12508, "epoch": 297} {"train_loss": -5.0921149253845215, "global_step": 12509, "epoch": 297} {"train_loss": -5.202572345733643, "global_step": 12510, "epoch": 297} {"train_loss": -5.236445426940918, "global_step": 12511, "epoch": 297} {"train_loss": -5.056199073791504, "global_step": 12512, "epoch": 297} {"train_loss": -5.011933326721191, "global_step": 12513, "epoch": 297} {"train_loss": -5.048671722412109, "global_step": 12514, "epoch": 297} {"train_loss": -5.0887367725372314, "global_step": 12515, "epoch": 297, "val_loss": 70742.5625} {"train_loss": -5.108506202697754, "global_step": 12516, "epoch": 298} {"train_loss": -5.121325492858887, "global_step": 12517, "epoch": 298} {"train_loss": -5.225552082061768, "global_step": 12518, "epoch": 298} {"train_loss": -5.001420021057129, "global_step": 12519, "epoch": 298} {"train_loss": -5.321931838989258, "global_step": 12520, "epoch": 298} {"train_loss": -5.323019027709961, "global_step": 12521, "epoch": 298} {"train_loss": -5.184562683105469, "global_step": 12522, "epoch": 298} {"train_loss": -5.182860374450684, "global_step": 12523, "epoch": 298} {"train_loss": -5.143167972564697, "global_step": 12524, "epoch": 298} {"train_loss": -5.200871467590332, "global_step": 12525, "epoch": 298} {"train_loss": -5.312460422515869, "global_step": 12526, "epoch": 298} {"train_loss": -5.109431266784668, "global_step": 12527, "epoch": 298} {"train_loss": -5.097768783569336, "global_step": 12528, "epoch": 298} {"train_loss": -5.075382232666016, "global_step": 12529, "epoch": 298} {"train_loss": -5.178572654724121, "global_step": 12530, "epoch": 298} {"train_loss": -5.1076555252075195, "global_step": 12531, "epoch": 298} {"train_loss": -5.063624382019043, "global_step": 12532, "epoch": 298} {"train_loss": -5.103524208068848, "global_step": 12533, "epoch": 298} {"train_loss": -5.135091781616211, "global_step": 12534, "epoch": 298} {"train_loss": -5.2295379638671875, "global_step": 12535, "epoch": 298} {"train_loss": -5.058969497680664, "global_step": 12536, "epoch": 298} {"train_loss": -5.118545055389404, "global_step": 12537, "epoch": 298} {"train_loss": -5.128592014312744, "global_step": 12538, "epoch": 298} {"train_loss": -5.248225212097168, "global_step": 12539, "epoch": 298} {"train_loss": -5.1343488693237305, "global_step": 12540, "epoch": 298} {"train_loss": -5.029945373535156, "global_step": 12541, "epoch": 298} {"train_loss": -5.021812438964844, "global_step": 12542, "epoch": 298} {"train_loss": -5.0914530754089355, "global_step": 12543, "epoch": 298} {"train_loss": -5.085672378540039, "global_step": 12544, "epoch": 298} {"train_loss": -4.954550743103027, "global_step": 12545, "epoch": 298} {"train_loss": -5.015212059020996, "global_step": 12546, "epoch": 298} {"train_loss": -5.179363250732422, "global_step": 12547, "epoch": 298} {"train_loss": -5.015776634216309, "global_step": 12548, "epoch": 298} {"train_loss": -4.959722518920898, "global_step": 12549, "epoch": 298} {"train_loss": -4.980195999145508, "global_step": 12550, "epoch": 298} {"train_loss": -5.010765552520752, "global_step": 12551, "epoch": 298} {"train_loss": -5.1342010498046875, "global_step": 12552, "epoch": 298} {"train_loss": -5.156797409057617, "global_step": 12553, "epoch": 298} {"train_loss": -5.054779052734375, "global_step": 12554, "epoch": 298} {"train_loss": -5.065239906311035, "global_step": 12555, "epoch": 298} {"train_loss": -5.0042195320129395, "global_step": 12556, "epoch": 298} {"train_loss": -5.114188307807559, "global_step": 12557, "epoch": 298, "val_loss": 70883.078125} {"train_loss": -5.174897193908691, "global_step": 12558, "epoch": 299} {"train_loss": -5.0454020500183105, "global_step": 12559, "epoch": 299} {"train_loss": -5.067002296447754, "global_step": 12560, "epoch": 299} {"train_loss": -5.019586563110352, "global_step": 12561, "epoch": 299} {"train_loss": -5.088895797729492, "global_step": 12562, "epoch": 299} {"train_loss": -4.935624122619629, "global_step": 12563, "epoch": 299} {"train_loss": -5.131994247436523, "global_step": 12564, "epoch": 299} {"train_loss": -5.061044692993164, "global_step": 12565, "epoch": 299} {"train_loss": -5.094403266906738, "global_step": 12566, "epoch": 299} {"train_loss": -5.171438217163086, "global_step": 12567, "epoch": 299} {"train_loss": -5.287017822265625, "global_step": 12568, "epoch": 299} {"train_loss": -5.119463920593262, "global_step": 12569, "epoch": 299} {"train_loss": -5.0874481201171875, "global_step": 12570, "epoch": 299} {"train_loss": -5.0686259269714355, "global_step": 12571, "epoch": 299} {"train_loss": -5.0360331535339355, "global_step": 12572, "epoch": 299} {"train_loss": -5.219507694244385, "global_step": 12573, "epoch": 299} {"train_loss": -5.069573402404785, "global_step": 12574, "epoch": 299} {"train_loss": -5.227503776550293, "global_step": 12575, "epoch": 299} {"train_loss": -5.062385082244873, "global_step": 12576, "epoch": 299} {"train_loss": -5.151967525482178, "global_step": 12577, "epoch": 299} {"train_loss": -5.054525375366211, "global_step": 12578, "epoch": 299} {"train_loss": -4.935746669769287, "global_step": 12579, "epoch": 299} {"train_loss": -5.123614311218262, "global_step": 12580, "epoch": 299} {"train_loss": -5.138874053955078, "global_step": 12581, "epoch": 299} {"train_loss": -4.938088417053223, "global_step": 12582, "epoch": 299} {"train_loss": -5.0566487312316895, "global_step": 12583, "epoch": 299} {"train_loss": -5.1224822998046875, "global_step": 12584, "epoch": 299} {"train_loss": -5.145359039306641, "global_step": 12585, "epoch": 299} {"train_loss": -5.037773609161377, "global_step": 12586, "epoch": 299} {"train_loss": -5.090580940246582, "global_step": 12587, "epoch": 299} {"train_loss": -4.9663920402526855, "global_step": 12588, "epoch": 299} {"train_loss": -5.172792911529541, "global_step": 12589, "epoch": 299} {"train_loss": -4.979788303375244, "global_step": 12590, "epoch": 299} {"train_loss": -5.1434736251831055, "global_step": 12591, "epoch": 299} {"train_loss": -5.114652633666992, "global_step": 12592, "epoch": 299} {"train_loss": -4.93541145324707, "global_step": 12593, "epoch": 299} {"train_loss": -5.1982245445251465, "global_step": 12594, "epoch": 299} {"train_loss": -5.130125999450684, "global_step": 12595, "epoch": 299} {"train_loss": -5.130260944366455, "global_step": 12596, "epoch": 299} {"train_loss": -5.221983909606934, "global_step": 12597, "epoch": 299} {"train_loss": -5.0961809158325195, "global_step": 12598, "epoch": 299} {"train_loss": -5.093445698420207, "global_step": 12599, "epoch": 299, "val_loss": 70794.515625} {"train_loss": -5.110015869140625, "global_step": 12600, "epoch": 300} {"train_loss": -4.948992729187012, "global_step": 12601, "epoch": 300} {"train_loss": -5.069268703460693, "global_step": 12602, "epoch": 300} {"train_loss": -5.069177150726318, "global_step": 12603, "epoch": 300} {"train_loss": -4.967833518981934, "global_step": 12604, "epoch": 300} {"train_loss": -5.0556488037109375, "global_step": 12605, "epoch": 300} {"train_loss": -5.077737808227539, "global_step": 12606, "epoch": 300} {"train_loss": -5.164634704589844, "global_step": 12607, "epoch": 300} {"train_loss": -5.0238752365112305, "global_step": 12608, "epoch": 300} {"train_loss": -5.290790557861328, "global_step": 12609, "epoch": 300} {"train_loss": -5.193070411682129, "global_step": 12610, "epoch": 300} {"train_loss": -5.050029754638672, "global_step": 12611, "epoch": 300} {"train_loss": -5.218836784362793, "global_step": 12612, "epoch": 300} {"train_loss": -5.273240566253662, "global_step": 12613, "epoch": 300} {"train_loss": -5.183513641357422, "global_step": 12614, "epoch": 300} {"train_loss": -5.1634721755981445, "global_step": 12615, "epoch": 300} {"train_loss": -5.000557899475098, "global_step": 12616, "epoch": 300} {"train_loss": -5.0952582359313965, "global_step": 12617, "epoch": 300} {"train_loss": -5.212552070617676, "global_step": 12618, "epoch": 300} {"train_loss": -5.19219970703125, "global_step": 12619, "epoch": 300} {"train_loss": -5.034724235534668, "global_step": 12620, "epoch": 300} {"train_loss": -5.0798845291137695, "global_step": 12621, "epoch": 300} {"train_loss": -5.092290878295898, "global_step": 12622, "epoch": 300} {"train_loss": -5.317141532897949, "global_step": 12623, "epoch": 300} {"train_loss": -5.215461254119873, "global_step": 12624, "epoch": 300} {"train_loss": -5.027571678161621, "global_step": 12625, "epoch": 300} {"train_loss": -5.113955497741699, "global_step": 12626, "epoch": 300} {"train_loss": -5.037860870361328, "global_step": 12627, "epoch": 300} {"train_loss": -5.169382095336914, "global_step": 12628, "epoch": 300} {"train_loss": -5.20234489440918, "global_step": 12629, "epoch": 300} {"train_loss": -5.100140571594238, "global_step": 12630, "epoch": 300} {"train_loss": -4.997373104095459, "global_step": 12631, "epoch": 300} {"train_loss": -5.184760093688965, "global_step": 12632, "epoch": 300} {"train_loss": -4.958539962768555, "global_step": 12633, "epoch": 300} {"train_loss": -5.057377815246582, "global_step": 12634, "epoch": 300} {"train_loss": -5.309776306152344, "global_step": 12635, "epoch": 300} {"train_loss": -5.149044036865234, "global_step": 12636, "epoch": 300} {"train_loss": -5.075979232788086, "global_step": 12637, "epoch": 300} {"train_loss": -5.187335014343262, "global_step": 12638, "epoch": 300} {"train_loss": -5.171672821044922, "global_step": 12639, "epoch": 300} {"train_loss": -5.241988182067871, "global_step": 12640, "epoch": 300} {"train_loss": -5.128280367170062, "global_step": 12641, "epoch": 300, "train/sim_max_reward_0": 0.3122197639710132, "train/sim_max_reward_1": 0.12407080164302736, "train/sim_max_reward_2": 0.3353378607468339, "train/sim_max_reward_3": 0.1691788967630818, "train/sim_max_reward_4": 0.32060754325222035, "train/sim_max_reward_5": 0.5842578542661259, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.0, "test/sim_max_reward_4300002": 0.39272350392799477, "test/sim_max_reward_4300003": 0.42141342590981223, "test/sim_max_reward_4300004": 0.7045203420489915, "test/sim_max_reward_4300005": 0.2708997502350247, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.4073517620496003, "test/sim_max_reward_4300008": 0.3908217651313845, "test/sim_max_reward_4300009": 0.8159258450000546, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.3211283389473018, "test/sim_max_reward_4300012": 0.37819239325353776, "test/sim_max_reward_4300013": 0.4073185844067948, "test/sim_max_reward_4300014": 0.40489897344037307, "test/sim_max_reward_4300015": 0.2651780245509828, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.4190504084407928, "test/sim_max_reward_4300018": 0.34804843257885776, "test/sim_max_reward_4300019": 0.18530216804968253, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.43264373011416, "test/sim_max_reward_4300022": 0.4631760168662577, "test/sim_max_reward_4300023": 0.5518495455616507, "test/sim_max_reward_4300024": 0.35574308816459127, "test/sim_max_reward_4300025": 0.09373540851361992, "test/sim_max_reward_4300026": 0.5761882071657437, "test/sim_max_reward_4300027": 0.0, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.21823580950557822, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.2603000335592396, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.40082183890926454, "test/sim_max_reward_4300037": 0.647214019362484, "test/sim_max_reward_4300038": 0.5118474275313852, "test/sim_max_reward_4300039": 0.63859631408402, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.5997775904124151, "test/sim_max_reward_4300043": 0.19123131521142075, "test/sim_max_reward_4300044": 0.3766914107273907, "test/sim_max_reward_4300045": 0.13759037425972614, "test/sim_max_reward_4300046": 0.38592035780539863, "test/sim_max_reward_4300047": 0.7176462618680951, "test/sim_max_reward_4300048": 0.2970406831937573, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.3076121201070504, "test/mean_score": 0.2997804630157477, "val_loss": 70641.3828125} {"train_loss": -5.047049522399902, "global_step": 12642, "epoch": 301} {"train_loss": -5.180996894836426, "global_step": 12643, "epoch": 301} {"train_loss": -4.994221210479736, "global_step": 12644, "epoch": 301} {"train_loss": -5.212893486022949, "global_step": 12645, "epoch": 301} {"train_loss": -5.23360538482666, "global_step": 12646, "epoch": 301} {"train_loss": -5.041414260864258, "global_step": 12647, "epoch": 301} {"train_loss": -5.225674152374268, "global_step": 12648, "epoch": 301} {"train_loss": -5.077228546142578, "global_step": 12649, "epoch": 301} {"train_loss": -5.085766792297363, "global_step": 12650, "epoch": 301} {"train_loss": -5.184010028839111, "global_step": 12651, "epoch": 301} {"train_loss": -5.210529327392578, "global_step": 12652, "epoch": 301} {"train_loss": -5.129391670227051, "global_step": 12653, "epoch": 301} {"train_loss": -5.052318096160889, "global_step": 12654, "epoch": 301} {"train_loss": -5.155912399291992, "global_step": 12655, "epoch": 301} {"train_loss": -5.1540446281433105, "global_step": 12656, "epoch": 301} {"train_loss": -5.012350082397461, "global_step": 12657, "epoch": 301} {"train_loss": -5.007948875427246, "global_step": 12658, "epoch": 301} {"train_loss": -5.168447494506836, "global_step": 12659, "epoch": 301} {"train_loss": -5.155729293823242, "global_step": 12660, "epoch": 301} {"train_loss": -5.148800849914551, "global_step": 12661, "epoch": 301} {"train_loss": -4.92567777633667, "global_step": 12662, "epoch": 301} {"train_loss": -5.124238967895508, "global_step": 12663, "epoch": 301} {"train_loss": -5.261716365814209, "global_step": 12664, "epoch": 301} {"train_loss": -5.038549423217773, "global_step": 12665, "epoch": 301} {"train_loss": -5.170722961425781, "global_step": 12666, "epoch": 301} {"train_loss": -5.113191604614258, "global_step": 12667, "epoch": 301} {"train_loss": -5.089317321777344, "global_step": 12668, "epoch": 301} {"train_loss": -5.186515808105469, "global_step": 12669, "epoch": 301} {"train_loss": -5.129647254943848, "global_step": 12670, "epoch": 301} {"train_loss": -5.082571983337402, "global_step": 12671, "epoch": 301} {"train_loss": -5.087501525878906, "global_step": 12672, "epoch": 301} {"train_loss": -5.15297794342041, "global_step": 12673, "epoch": 301} {"train_loss": -5.161559104919434, "global_step": 12674, "epoch": 301} {"train_loss": -5.176050186157227, "global_step": 12675, "epoch": 301} {"train_loss": -5.141075134277344, "global_step": 12676, "epoch": 301} {"train_loss": -5.0060272216796875, "global_step": 12677, "epoch": 301} {"train_loss": -5.227522373199463, "global_step": 12678, "epoch": 301} {"train_loss": -5.1343278884887695, "global_step": 12679, "epoch": 301} {"train_loss": -4.963297367095947, "global_step": 12680, "epoch": 301} {"train_loss": -5.048451900482178, "global_step": 12681, "epoch": 301} {"train_loss": -5.099912643432617, "global_step": 12682, "epoch": 301} {"train_loss": -5.1154608726501465, "global_step": 12683, "epoch": 301, "val_loss": 71094.9609375} {"train_loss": -5.196038246154785, "global_step": 12684, "epoch": 302} {"train_loss": -5.208789825439453, "global_step": 12685, "epoch": 302} {"train_loss": -5.118035316467285, "global_step": 12686, "epoch": 302} {"train_loss": -5.068838596343994, "global_step": 12687, "epoch": 302} {"train_loss": -5.188885688781738, "global_step": 12688, "epoch": 302} {"train_loss": -5.132507801055908, "global_step": 12689, "epoch": 302} {"train_loss": -5.165563583374023, "global_step": 12690, "epoch": 302} {"train_loss": -5.042471408843994, "global_step": 12691, "epoch": 302} {"train_loss": -5.225012302398682, "global_step": 12692, "epoch": 302} {"train_loss": -5.051618576049805, "global_step": 12693, "epoch": 302} {"train_loss": -5.049120903015137, "global_step": 12694, "epoch": 302} {"train_loss": -4.9334516525268555, "global_step": 12695, "epoch": 302} {"train_loss": -5.13409948348999, "global_step": 12696, "epoch": 302} {"train_loss": -4.862185955047607, "global_step": 12697, "epoch": 302} {"train_loss": -5.079929351806641, "global_step": 12698, "epoch": 302} {"train_loss": -5.085047245025635, "global_step": 12699, "epoch": 302} {"train_loss": -4.956796169281006, "global_step": 12700, "epoch": 302} {"train_loss": -5.079833030700684, "global_step": 12701, "epoch": 302} {"train_loss": -5.195078372955322, "global_step": 12702, "epoch": 302} {"train_loss": -4.9141693115234375, "global_step": 12703, "epoch": 302} {"train_loss": -5.0966339111328125, "global_step": 12704, "epoch": 302} {"train_loss": -5.058650493621826, "global_step": 12705, "epoch": 302} {"train_loss": -5.028515338897705, "global_step": 12706, "epoch": 302} {"train_loss": -5.1718549728393555, "global_step": 12707, "epoch": 302} {"train_loss": -5.113377571105957, "global_step": 12708, "epoch": 302} {"train_loss": -5.1641082763671875, "global_step": 12709, "epoch": 302} {"train_loss": -5.246749401092529, "global_step": 12710, "epoch": 302} {"train_loss": -5.108823299407959, "global_step": 12711, "epoch": 302} {"train_loss": -5.051007270812988, "global_step": 12712, "epoch": 302} {"train_loss": -5.11261510848999, "global_step": 12713, "epoch": 302} {"train_loss": -5.216938018798828, "global_step": 12714, "epoch": 302} {"train_loss": -5.013522148132324, "global_step": 12715, "epoch": 302} {"train_loss": -5.130199432373047, "global_step": 12716, "epoch": 302} {"train_loss": -5.051851272583008, "global_step": 12717, "epoch": 302} {"train_loss": -5.051496505737305, "global_step": 12718, "epoch": 302} {"train_loss": -5.1115336418151855, "global_step": 12719, "epoch": 302} {"train_loss": -5.282722473144531, "global_step": 12720, "epoch": 302} {"train_loss": -5.206913471221924, "global_step": 12721, "epoch": 302} {"train_loss": -5.1392903327941895, "global_step": 12722, "epoch": 302} {"train_loss": -5.204516410827637, "global_step": 12723, "epoch": 302} {"train_loss": -5.129795551300049, "global_step": 12724, "epoch": 302} {"train_loss": -5.11170490582784, "global_step": 12725, "epoch": 302, "val_loss": 70731.6171875} {"train_loss": -5.127593994140625, "global_step": 12726, "epoch": 303} {"train_loss": -5.285272121429443, "global_step": 12727, "epoch": 303} {"train_loss": -5.281169414520264, "global_step": 12728, "epoch": 303} {"train_loss": -5.1960625648498535, "global_step": 12729, "epoch": 303} {"train_loss": -5.090179920196533, "global_step": 12730, "epoch": 303} {"train_loss": -5.31422758102417, "global_step": 12731, "epoch": 303} {"train_loss": -5.105693817138672, "global_step": 12732, "epoch": 303} {"train_loss": -5.132505416870117, "global_step": 12733, "epoch": 303} {"train_loss": -5.133452415466309, "global_step": 12734, "epoch": 303} {"train_loss": -5.082038879394531, "global_step": 12735, "epoch": 303} {"train_loss": -5.05290412902832, "global_step": 12736, "epoch": 303} {"train_loss": -5.14804744720459, "global_step": 12737, "epoch": 303} {"train_loss": -5.043027877807617, "global_step": 12738, "epoch": 303} {"train_loss": -5.187677383422852, "global_step": 12739, "epoch": 303} {"train_loss": -5.01036262512207, "global_step": 12740, "epoch": 303} {"train_loss": -5.034589767456055, "global_step": 12741, "epoch": 303} {"train_loss": -5.195775985717773, "global_step": 12742, "epoch": 303} {"train_loss": -4.8184661865234375, "global_step": 12743, "epoch": 303} {"train_loss": -5.110682487487793, "global_step": 12744, "epoch": 303} {"train_loss": -5.161238670349121, "global_step": 12745, "epoch": 303} {"train_loss": -4.973422527313232, "global_step": 12746, "epoch": 303} {"train_loss": -4.997708320617676, "global_step": 12747, "epoch": 303} {"train_loss": -5.120312213897705, "global_step": 12748, "epoch": 303} {"train_loss": -5.017601013183594, "global_step": 12749, "epoch": 303} {"train_loss": -5.1402692794799805, "global_step": 12750, "epoch": 303} {"train_loss": -5.044022560119629, "global_step": 12751, "epoch": 303} {"train_loss": -5.032405853271484, "global_step": 12752, "epoch": 303} {"train_loss": -5.239461898803711, "global_step": 12753, "epoch": 303} {"train_loss": -4.98983907699585, "global_step": 12754, "epoch": 303} {"train_loss": -5.045637130737305, "global_step": 12755, "epoch": 303} {"train_loss": -5.149651527404785, "global_step": 12756, "epoch": 303} {"train_loss": -5.173824310302734, "global_step": 12757, "epoch": 303} {"train_loss": -5.2743096351623535, "global_step": 12758, "epoch": 303} {"train_loss": -4.924365043640137, "global_step": 12759, "epoch": 303} {"train_loss": -5.191217422485352, "global_step": 12760, "epoch": 303} {"train_loss": -4.895872116088867, "global_step": 12761, "epoch": 303} {"train_loss": -5.028323173522949, "global_step": 12762, "epoch": 303} {"train_loss": -5.040932655334473, "global_step": 12763, "epoch": 303} {"train_loss": -5.17405366897583, "global_step": 12764, "epoch": 303} {"train_loss": -5.214069366455078, "global_step": 12765, "epoch": 303} {"train_loss": -5.110480308532715, "global_step": 12766, "epoch": 303} {"train_loss": -5.104366563615345, "global_step": 12767, "epoch": 303, "val_loss": 70655.609375} {"train_loss": -5.113834381103516, "global_step": 12768, "epoch": 304} {"train_loss": -5.205248832702637, "global_step": 12769, "epoch": 304} {"train_loss": -5.1417999267578125, "global_step": 12770, "epoch": 304} {"train_loss": -5.053241729736328, "global_step": 12771, "epoch": 304} {"train_loss": -5.172013282775879, "global_step": 12772, "epoch": 304} {"train_loss": -5.093044281005859, "global_step": 12773, "epoch": 304} {"train_loss": -5.192417144775391, "global_step": 12774, "epoch": 304} {"train_loss": -5.066205024719238, "global_step": 12775, "epoch": 304} {"train_loss": -5.046931266784668, "global_step": 12776, "epoch": 304} {"train_loss": -5.0686726570129395, "global_step": 12777, "epoch": 304} {"train_loss": -5.278352737426758, "global_step": 12778, "epoch": 304} {"train_loss": -5.054624557495117, "global_step": 12779, "epoch": 304} {"train_loss": -5.116206169128418, "global_step": 12780, "epoch": 304} {"train_loss": -5.148005962371826, "global_step": 12781, "epoch": 304} {"train_loss": -5.177180767059326, "global_step": 12782, "epoch": 304} {"train_loss": -5.132221221923828, "global_step": 12783, "epoch": 304} {"train_loss": -5.162891387939453, "global_step": 12784, "epoch": 304} {"train_loss": -5.16614294052124, "global_step": 12785, "epoch": 304} {"train_loss": -5.240286350250244, "global_step": 12786, "epoch": 304} {"train_loss": -5.171143531799316, "global_step": 12787, "epoch": 304} {"train_loss": -5.19465446472168, "global_step": 12788, "epoch": 304} {"train_loss": -5.246977806091309, "global_step": 12789, "epoch": 304} {"train_loss": -5.151782512664795, "global_step": 12790, "epoch": 304} {"train_loss": -5.137470722198486, "global_step": 12791, "epoch": 304} {"train_loss": -5.115347385406494, "global_step": 12792, "epoch": 304} {"train_loss": -5.084619998931885, "global_step": 12793, "epoch": 304} {"train_loss": -5.061535835266113, "global_step": 12794, "epoch": 304} {"train_loss": -5.1744232177734375, "global_step": 12795, "epoch": 304} {"train_loss": -5.210577487945557, "global_step": 12796, "epoch": 304} {"train_loss": -5.141631603240967, "global_step": 12797, "epoch": 304} {"train_loss": -5.065408229827881, "global_step": 12798, "epoch": 304} {"train_loss": -5.231252670288086, "global_step": 12799, "epoch": 304} {"train_loss": -5.073415756225586, "global_step": 12800, "epoch": 304} {"train_loss": -5.014649868011475, "global_step": 12801, "epoch": 304} {"train_loss": -4.967350006103516, "global_step": 12802, "epoch": 304} {"train_loss": -5.153953552246094, "global_step": 12803, "epoch": 304} {"train_loss": -5.127114295959473, "global_step": 12804, "epoch": 304} {"train_loss": -5.083855628967285, "global_step": 12805, "epoch": 304} {"train_loss": -5.081368923187256, "global_step": 12806, "epoch": 304} {"train_loss": -4.998308181762695, "global_step": 12807, "epoch": 304} {"train_loss": -5.133317470550537, "global_step": 12808, "epoch": 304} {"train_loss": -5.127194279716129, "global_step": 12809, "epoch": 304, "val_loss": 70835.1875} {"train_loss": -5.082178115844727, "global_step": 12810, "epoch": 305} {"train_loss": -5.16421365737915, "global_step": 12811, "epoch": 305} {"train_loss": -5.221189498901367, "global_step": 12812, "epoch": 305} {"train_loss": -5.058353424072266, "global_step": 12813, "epoch": 305} {"train_loss": -5.28325080871582, "global_step": 12814, "epoch": 305} {"train_loss": -5.07388973236084, "global_step": 12815, "epoch": 305} {"train_loss": -5.165283203125, "global_step": 12816, "epoch": 305} {"train_loss": -5.126721382141113, "global_step": 12817, "epoch": 305} {"train_loss": -5.214868545532227, "global_step": 12818, "epoch": 305} {"train_loss": -5.238529682159424, "global_step": 12819, "epoch": 305} {"train_loss": -5.240446090698242, "global_step": 12820, "epoch": 305} {"train_loss": -5.102802276611328, "global_step": 12821, "epoch": 305} {"train_loss": -5.239597797393799, "global_step": 12822, "epoch": 305} {"train_loss": -5.216070175170898, "global_step": 12823, "epoch": 305} {"train_loss": -5.171937942504883, "global_step": 12824, "epoch": 305} {"train_loss": -5.120985984802246, "global_step": 12825, "epoch": 305} {"train_loss": -5.2185893058776855, "global_step": 12826, "epoch": 305} {"train_loss": -5.121380805969238, "global_step": 12827, "epoch": 305} {"train_loss": -5.141678333282471, "global_step": 12828, "epoch": 305} {"train_loss": -5.266544342041016, "global_step": 12829, "epoch": 305} {"train_loss": -4.839768409729004, "global_step": 12830, "epoch": 305} {"train_loss": -5.129785537719727, "global_step": 12831, "epoch": 305} {"train_loss": -5.273479461669922, "global_step": 12832, "epoch": 305} {"train_loss": -5.155972003936768, "global_step": 12833, "epoch": 305} {"train_loss": -5.130005836486816, "global_step": 12834, "epoch": 305} {"train_loss": -5.089562892913818, "global_step": 12835, "epoch": 305} {"train_loss": -5.024112701416016, "global_step": 12836, "epoch": 305} {"train_loss": -5.077649116516113, "global_step": 12837, "epoch": 305} {"train_loss": -5.112851142883301, "global_step": 12838, "epoch": 305} {"train_loss": -5.164444446563721, "global_step": 12839, "epoch": 305} {"train_loss": -4.911937713623047, "global_step": 12840, "epoch": 305} {"train_loss": -5.0824737548828125, "global_step": 12841, "epoch": 305} {"train_loss": -5.084750175476074, "global_step": 12842, "epoch": 305} {"train_loss": -5.026633262634277, "global_step": 12843, "epoch": 305} {"train_loss": -5.243300914764404, "global_step": 12844, "epoch": 305} {"train_loss": -5.175152778625488, "global_step": 12845, "epoch": 305} {"train_loss": -5.118904113769531, "global_step": 12846, "epoch": 305} {"train_loss": -4.9029974937438965, "global_step": 12847, "epoch": 305} {"train_loss": -5.120563507080078, "global_step": 12848, "epoch": 305} {"train_loss": -5.009566307067871, "global_step": 12849, "epoch": 305} {"train_loss": -5.218660831451416, "global_step": 12850, "epoch": 305} {"train_loss": -5.130505209877377, "global_step": 12851, "epoch": 305, "val_loss": 70499.9140625} {"train_loss": -5.11019229888916, "global_step": 12852, "epoch": 306} {"train_loss": -5.122749328613281, "global_step": 12853, "epoch": 306} {"train_loss": -5.218278408050537, "global_step": 12854, "epoch": 306} {"train_loss": -5.132145404815674, "global_step": 12855, "epoch": 306} {"train_loss": -5.2285614013671875, "global_step": 12856, "epoch": 306} {"train_loss": -5.094083786010742, "global_step": 12857, "epoch": 306} {"train_loss": -5.099337577819824, "global_step": 12858, "epoch": 306} {"train_loss": -5.202066421508789, "global_step": 12859, "epoch": 306} {"train_loss": -5.0614118576049805, "global_step": 12860, "epoch": 306} {"train_loss": -5.236442565917969, "global_step": 12861, "epoch": 306} {"train_loss": -5.064549922943115, "global_step": 12862, "epoch": 306} {"train_loss": -5.191075801849365, "global_step": 12863, "epoch": 306} {"train_loss": -5.241419315338135, "global_step": 12864, "epoch": 306} {"train_loss": -5.203955173492432, "global_step": 12865, "epoch": 306} {"train_loss": -5.113614082336426, "global_step": 12866, "epoch": 306} {"train_loss": -5.095242500305176, "global_step": 12867, "epoch": 306} {"train_loss": -5.133817672729492, "global_step": 12868, "epoch": 306} {"train_loss": -5.134172439575195, "global_step": 12869, "epoch": 306} {"train_loss": -5.192497730255127, "global_step": 12870, "epoch": 306} {"train_loss": -5.078337669372559, "global_step": 12871, "epoch": 306} {"train_loss": -5.176841735839844, "global_step": 12872, "epoch": 306} {"train_loss": -5.2055253982543945, "global_step": 12873, "epoch": 306} {"train_loss": -5.1430463790893555, "global_step": 12874, "epoch": 306} {"train_loss": -5.128575801849365, "global_step": 12875, "epoch": 306} {"train_loss": -5.164236068725586, "global_step": 12876, "epoch": 306} {"train_loss": -5.0606689453125, "global_step": 12877, "epoch": 306} {"train_loss": -5.118165969848633, "global_step": 12878, "epoch": 306} {"train_loss": -5.057235240936279, "global_step": 12879, "epoch": 306} {"train_loss": -5.1888885498046875, "global_step": 12880, "epoch": 306} {"train_loss": -5.157162666320801, "global_step": 12881, "epoch": 306} {"train_loss": -5.142182350158691, "global_step": 12882, "epoch": 306} {"train_loss": -5.123164176940918, "global_step": 12883, "epoch": 306} {"train_loss": -5.274148941040039, "global_step": 12884, "epoch": 306} {"train_loss": -5.208029747009277, "global_step": 12885, "epoch": 306} {"train_loss": -5.116995811462402, "global_step": 12886, "epoch": 306} {"train_loss": -5.197179794311523, "global_step": 12887, "epoch": 306} {"train_loss": -5.17811393737793, "global_step": 12888, "epoch": 306} {"train_loss": -5.094058036804199, "global_step": 12889, "epoch": 306} {"train_loss": -5.069070816040039, "global_step": 12890, "epoch": 306} {"train_loss": -5.134149074554443, "global_step": 12891, "epoch": 306} {"train_loss": -5.264065742492676, "global_step": 12892, "epoch": 306} {"train_loss": -5.15005654380435, "global_step": 12893, "epoch": 306, "val_loss": 70615.015625} {"train_loss": -5.183622360229492, "global_step": 12894, "epoch": 307} {"train_loss": -5.116518974304199, "global_step": 12895, "epoch": 307} {"train_loss": -5.260606288909912, "global_step": 12896, "epoch": 307} {"train_loss": -5.048187732696533, "global_step": 12897, "epoch": 307} {"train_loss": -5.06534481048584, "global_step": 12898, "epoch": 307} {"train_loss": -5.042620658874512, "global_step": 12899, "epoch": 307} {"train_loss": -5.157726287841797, "global_step": 12900, "epoch": 307} {"train_loss": -5.291496276855469, "global_step": 12901, "epoch": 307} {"train_loss": -5.178752899169922, "global_step": 12902, "epoch": 307} {"train_loss": -5.304515361785889, "global_step": 12903, "epoch": 307} {"train_loss": -5.113487720489502, "global_step": 12904, "epoch": 307} {"train_loss": -5.179976463317871, "global_step": 12905, "epoch": 307} {"train_loss": -5.041445732116699, "global_step": 12906, "epoch": 307} {"train_loss": -5.186927795410156, "global_step": 12907, "epoch": 307} {"train_loss": -5.080249786376953, "global_step": 12908, "epoch": 307} {"train_loss": -5.116082191467285, "global_step": 12909, "epoch": 307} {"train_loss": -5.006735801696777, "global_step": 12910, "epoch": 307} {"train_loss": -5.1653218269348145, "global_step": 12911, "epoch": 307} {"train_loss": -5.06831169128418, "global_step": 12912, "epoch": 307} {"train_loss": -4.945520877838135, "global_step": 12913, "epoch": 307} {"train_loss": -5.153050899505615, "global_step": 12914, "epoch": 307} {"train_loss": -5.113392353057861, "global_step": 12915, "epoch": 307} {"train_loss": -4.944450378417969, "global_step": 12916, "epoch": 307} {"train_loss": -5.105725288391113, "global_step": 12917, "epoch": 307} {"train_loss": -5.078914642333984, "global_step": 12918, "epoch": 307} {"train_loss": -5.0741963386535645, "global_step": 12919, "epoch": 307} {"train_loss": -5.139318466186523, "global_step": 12920, "epoch": 307} {"train_loss": -5.226813316345215, "global_step": 12921, "epoch": 307} {"train_loss": -5.111779689788818, "global_step": 12922, "epoch": 307} {"train_loss": -5.069825172424316, "global_step": 12923, "epoch": 307} {"train_loss": -5.03582763671875, "global_step": 12924, "epoch": 307} {"train_loss": -5.186034679412842, "global_step": 12925, "epoch": 307} {"train_loss": -5.162116527557373, "global_step": 12926, "epoch": 307} {"train_loss": -5.09583854675293, "global_step": 12927, "epoch": 307} {"train_loss": -5.210051536560059, "global_step": 12928, "epoch": 307} {"train_loss": -4.997900009155273, "global_step": 12929, "epoch": 307} {"train_loss": -5.0729475021362305, "global_step": 12930, "epoch": 307} {"train_loss": -5.016241073608398, "global_step": 12931, "epoch": 307} {"train_loss": -5.009726524353027, "global_step": 12932, "epoch": 307} {"train_loss": -5.179405212402344, "global_step": 12933, "epoch": 307} {"train_loss": -5.207472801208496, "global_step": 12934, "epoch": 307} {"train_loss": -5.113191786266508, "global_step": 12935, "epoch": 307, "val_loss": 71145.578125} {"train_loss": -4.996936798095703, "global_step": 12936, "epoch": 308} {"train_loss": -5.18731689453125, "global_step": 12937, "epoch": 308} {"train_loss": -5.070855617523193, "global_step": 12938, "epoch": 308} {"train_loss": -5.111784934997559, "global_step": 12939, "epoch": 308} {"train_loss": -5.143707275390625, "global_step": 12940, "epoch": 308} {"train_loss": -5.014852523803711, "global_step": 12941, "epoch": 308} {"train_loss": -5.134812355041504, "global_step": 12942, "epoch": 308} {"train_loss": -5.08462381362915, "global_step": 12943, "epoch": 308} {"train_loss": -5.222779273986816, "global_step": 12944, "epoch": 308} {"train_loss": -5.13712739944458, "global_step": 12945, "epoch": 308} {"train_loss": -5.186375617980957, "global_step": 12946, "epoch": 308} {"train_loss": -5.154208183288574, "global_step": 12947, "epoch": 308} {"train_loss": -5.233174800872803, "global_step": 12948, "epoch": 308} {"train_loss": -4.973372936248779, "global_step": 12949, "epoch": 308} {"train_loss": -5.0618486404418945, "global_step": 12950, "epoch": 308} {"train_loss": -5.17963981628418, "global_step": 12951, "epoch": 308} {"train_loss": -5.223161697387695, "global_step": 12952, "epoch": 308} {"train_loss": -5.1412129402160645, "global_step": 12953, "epoch": 308} {"train_loss": -5.090763568878174, "global_step": 12954, "epoch": 308} {"train_loss": -5.183587074279785, "global_step": 12955, "epoch": 308} {"train_loss": -5.092864990234375, "global_step": 12956, "epoch": 308} {"train_loss": -5.079148769378662, "global_step": 12957, "epoch": 308} {"train_loss": -5.070744514465332, "global_step": 12958, "epoch": 308} {"train_loss": -5.340301036834717, "global_step": 12959, "epoch": 308} {"train_loss": -5.185497283935547, "global_step": 12960, "epoch": 308} {"train_loss": -5.225724220275879, "global_step": 12961, "epoch": 308} {"train_loss": -4.994009017944336, "global_step": 12962, "epoch": 308} {"train_loss": -5.209484100341797, "global_step": 12963, "epoch": 308} {"train_loss": -5.191329002380371, "global_step": 12964, "epoch": 308} {"train_loss": -5.217484951019287, "global_step": 12965, "epoch": 308} {"train_loss": -5.183978080749512, "global_step": 12966, "epoch": 308} {"train_loss": -5.15473747253418, "global_step": 12967, "epoch": 308} {"train_loss": -5.081912994384766, "global_step": 12968, "epoch": 308} {"train_loss": -5.1489362716674805, "global_step": 12969, "epoch": 308} {"train_loss": -5.16195011138916, "global_step": 12970, "epoch": 308} {"train_loss": -5.0268235206604, "global_step": 12971, "epoch": 308} {"train_loss": -5.159175872802734, "global_step": 12972, "epoch": 308} {"train_loss": -5.212642669677734, "global_step": 12973, "epoch": 308} {"train_loss": -5.158502578735352, "global_step": 12974, "epoch": 308} {"train_loss": -5.1240034103393555, "global_step": 12975, "epoch": 308} {"train_loss": -5.16037130355835, "global_step": 12976, "epoch": 308} {"train_loss": -5.1348502068292525, "global_step": 12977, "epoch": 308, "val_loss": 70694.3203125} {"train_loss": -5.112337112426758, "global_step": 12978, "epoch": 309} {"train_loss": -5.18984317779541, "global_step": 12979, "epoch": 309} {"train_loss": -5.189168930053711, "global_step": 12980, "epoch": 309} {"train_loss": -5.197922706604004, "global_step": 12981, "epoch": 309} {"train_loss": -5.173428058624268, "global_step": 12982, "epoch": 309} {"train_loss": -4.936936378479004, "global_step": 12983, "epoch": 309} {"train_loss": -5.15226936340332, "global_step": 12984, "epoch": 309} {"train_loss": -5.134308338165283, "global_step": 12985, "epoch": 309} {"train_loss": -5.116357326507568, "global_step": 12986, "epoch": 309} {"train_loss": -5.112024307250977, "global_step": 12987, "epoch": 309} {"train_loss": -5.261482238769531, "global_step": 12988, "epoch": 309} {"train_loss": -5.11707878112793, "global_step": 12989, "epoch": 309} {"train_loss": -5.1186981201171875, "global_step": 12990, "epoch": 309} {"train_loss": -5.25290584564209, "global_step": 12991, "epoch": 309} {"train_loss": -5.193426132202148, "global_step": 12992, "epoch": 309} {"train_loss": -5.163434982299805, "global_step": 12993, "epoch": 309} {"train_loss": -5.144342422485352, "global_step": 12994, "epoch": 309} {"train_loss": -5.147974014282227, "global_step": 12995, "epoch": 309} {"train_loss": -5.1802592277526855, "global_step": 12996, "epoch": 309} {"train_loss": -5.104697227478027, "global_step": 12997, "epoch": 309} {"train_loss": -5.206199645996094, "global_step": 12998, "epoch": 309} {"train_loss": -5.211978912353516, "global_step": 12999, "epoch": 309} {"train_loss": -5.171260833740234, "global_step": 13000, "epoch": 309} {"train_loss": -5.229739189147949, "global_step": 13001, "epoch": 309} {"train_loss": -5.113995552062988, "global_step": 13002, "epoch": 309} {"train_loss": -5.077783584594727, "global_step": 13003, "epoch": 309} {"train_loss": -5.068138599395752, "global_step": 13004, "epoch": 309} {"train_loss": -5.211764335632324, "global_step": 13005, "epoch": 309} {"train_loss": -5.138751029968262, "global_step": 13006, "epoch": 309} {"train_loss": -5.260120868682861, "global_step": 13007, "epoch": 309} {"train_loss": -5.228148460388184, "global_step": 13008, "epoch": 309} {"train_loss": -5.108698844909668, "global_step": 13009, "epoch": 309} {"train_loss": -5.27999210357666, "global_step": 13010, "epoch": 309} {"train_loss": -5.223391532897949, "global_step": 13011, "epoch": 309} {"train_loss": -5.159811019897461, "global_step": 13012, "epoch": 309} {"train_loss": -5.265142440795898, "global_step": 13013, "epoch": 309} {"train_loss": -5.036993026733398, "global_step": 13014, "epoch": 309} {"train_loss": -5.136787414550781, "global_step": 13015, "epoch": 309} {"train_loss": -4.9738945960998535, "global_step": 13016, "epoch": 309} {"train_loss": -4.905384063720703, "global_step": 13017, "epoch": 309} {"train_loss": -5.125427722930908, "global_step": 13018, "epoch": 309} {"train_loss": -5.148841789790562, "global_step": 13019, "epoch": 309, "val_loss": 70630.0859375} {"train_loss": -5.171937942504883, "global_step": 13020, "epoch": 310} {"train_loss": -5.195713520050049, "global_step": 13021, "epoch": 310} {"train_loss": -5.068850994110107, "global_step": 13022, "epoch": 310} {"train_loss": -5.156285285949707, "global_step": 13023, "epoch": 310} {"train_loss": -5.020603656768799, "global_step": 13024, "epoch": 310} {"train_loss": -4.9823102951049805, "global_step": 13025, "epoch": 310} {"train_loss": -5.096152305603027, "global_step": 13026, "epoch": 310} {"train_loss": -5.070189952850342, "global_step": 13027, "epoch": 310} {"train_loss": -5.061200141906738, "global_step": 13028, "epoch": 310} {"train_loss": -5.044114589691162, "global_step": 13029, "epoch": 310} {"train_loss": -5.161616325378418, "global_step": 13030, "epoch": 310} {"train_loss": -5.078702926635742, "global_step": 13031, "epoch": 310} {"train_loss": -5.10391902923584, "global_step": 13032, "epoch": 310} {"train_loss": -5.078804969787598, "global_step": 13033, "epoch": 310} {"train_loss": -5.149824142456055, "global_step": 13034, "epoch": 310} {"train_loss": -5.111468315124512, "global_step": 13035, "epoch": 310} {"train_loss": -5.202582359313965, "global_step": 13036, "epoch": 310} {"train_loss": -5.019280433654785, "global_step": 13037, "epoch": 310} {"train_loss": -5.169452667236328, "global_step": 13038, "epoch": 310} {"train_loss": -5.026743412017822, "global_step": 13039, "epoch": 310} {"train_loss": -5.102733612060547, "global_step": 13040, "epoch": 310} {"train_loss": -5.056819438934326, "global_step": 13041, "epoch": 310} {"train_loss": -5.0866804122924805, "global_step": 13042, "epoch": 310} {"train_loss": -4.926012992858887, "global_step": 13043, "epoch": 310} {"train_loss": -5.190394878387451, "global_step": 13044, "epoch": 310} {"train_loss": -5.151853561401367, "global_step": 13045, "epoch": 310} {"train_loss": -5.163286209106445, "global_step": 13046, "epoch": 310} {"train_loss": -5.172798156738281, "global_step": 13047, "epoch": 310} {"train_loss": -5.222306251525879, "global_step": 13048, "epoch": 310} {"train_loss": -5.261155605316162, "global_step": 13049, "epoch": 310} {"train_loss": -5.01440954208374, "global_step": 13050, "epoch": 310} {"train_loss": -5.168055534362793, "global_step": 13051, "epoch": 310} {"train_loss": -5.154766082763672, "global_step": 13052, "epoch": 310} {"train_loss": -4.966709136962891, "global_step": 13053, "epoch": 310} {"train_loss": -5.1783294677734375, "global_step": 13054, "epoch": 310} {"train_loss": -5.223267078399658, "global_step": 13055, "epoch": 310} {"train_loss": -5.092432022094727, "global_step": 13056, "epoch": 310} {"train_loss": -5.038584232330322, "global_step": 13057, "epoch": 310} {"train_loss": -5.152182579040527, "global_step": 13058, "epoch": 310} {"train_loss": -5.103149890899658, "global_step": 13059, "epoch": 310} {"train_loss": -5.132412433624268, "global_step": 13060, "epoch": 310} {"train_loss": -5.1117890902927945, "global_step": 13061, "epoch": 310, "val_loss": 71278.4453125} {"train_loss": -4.946234226226807, "global_step": 13062, "epoch": 311} {"train_loss": -5.231224060058594, "global_step": 13063, "epoch": 311} {"train_loss": -5.039764404296875, "global_step": 13064, "epoch": 311} {"train_loss": -5.146315097808838, "global_step": 13065, "epoch": 311} {"train_loss": -5.151947975158691, "global_step": 13066, "epoch": 311} {"train_loss": -5.027766227722168, "global_step": 13067, "epoch": 311} {"train_loss": -4.942192077636719, "global_step": 13068, "epoch": 311} {"train_loss": -5.138734340667725, "global_step": 13069, "epoch": 311} {"train_loss": -4.931373596191406, "global_step": 13070, "epoch": 311} {"train_loss": -5.281524181365967, "global_step": 13071, "epoch": 311} {"train_loss": -4.950788497924805, "global_step": 13072, "epoch": 311} {"train_loss": -5.101073265075684, "global_step": 13073, "epoch": 311} {"train_loss": -5.079200744628906, "global_step": 13074, "epoch": 311} {"train_loss": -5.104515075683594, "global_step": 13075, "epoch": 311} {"train_loss": -5.004230499267578, "global_step": 13076, "epoch": 311} {"train_loss": -4.8945088386535645, "global_step": 13077, "epoch": 311} {"train_loss": -5.1306304931640625, "global_step": 13078, "epoch": 311} {"train_loss": -5.129515647888184, "global_step": 13079, "epoch": 311} {"train_loss": -4.993609428405762, "global_step": 13080, "epoch": 311} {"train_loss": -5.050957202911377, "global_step": 13081, "epoch": 311} {"train_loss": -5.0277791023254395, "global_step": 13082, "epoch": 311} {"train_loss": -5.2732696533203125, "global_step": 13083, "epoch": 311} {"train_loss": -4.912465572357178, "global_step": 13084, "epoch": 311} {"train_loss": -5.17732048034668, "global_step": 13085, "epoch": 311} {"train_loss": -5.067589282989502, "global_step": 13086, "epoch": 311} {"train_loss": -5.12979793548584, "global_step": 13087, "epoch": 311} {"train_loss": -5.2330427169799805, "global_step": 13088, "epoch": 311} {"train_loss": -4.986787796020508, "global_step": 13089, "epoch": 311} {"train_loss": -5.151187896728516, "global_step": 13090, "epoch": 311} {"train_loss": -5.324294090270996, "global_step": 13091, "epoch": 311} {"train_loss": -5.204982757568359, "global_step": 13092, "epoch": 311} {"train_loss": -5.108340740203857, "global_step": 13093, "epoch": 311} {"train_loss": -5.189982891082764, "global_step": 13094, "epoch": 311} {"train_loss": -5.25518798828125, "global_step": 13095, "epoch": 311} {"train_loss": -5.1204633712768555, "global_step": 13096, "epoch": 311} {"train_loss": -5.222306251525879, "global_step": 13097, "epoch": 311} {"train_loss": -5.185473918914795, "global_step": 13098, "epoch": 311} {"train_loss": -5.230024337768555, "global_step": 13099, "epoch": 311} {"train_loss": -5.1370439529418945, "global_step": 13100, "epoch": 311} {"train_loss": -5.149496078491211, "global_step": 13101, "epoch": 311} {"train_loss": -5.194264888763428, "global_step": 13102, "epoch": 311} {"train_loss": -5.114168723424275, "global_step": 13103, "epoch": 311, "val_loss": 70338.3984375} {"train_loss": -5.02504825592041, "global_step": 13104, "epoch": 312} {"train_loss": -4.993108749389648, "global_step": 13105, "epoch": 312} {"train_loss": -5.167361259460449, "global_step": 13106, "epoch": 312} {"train_loss": -5.153351306915283, "global_step": 13107, "epoch": 312} {"train_loss": -5.1750288009643555, "global_step": 13108, "epoch": 312} {"train_loss": -5.184113502502441, "global_step": 13109, "epoch": 312} {"train_loss": -5.081140518188477, "global_step": 13110, "epoch": 312} {"train_loss": -5.179718971252441, "global_step": 13111, "epoch": 312} {"train_loss": -5.0433549880981445, "global_step": 13112, "epoch": 312} {"train_loss": -5.184934616088867, "global_step": 13113, "epoch": 312} {"train_loss": -5.212774276733398, "global_step": 13114, "epoch": 312} {"train_loss": -5.2060699462890625, "global_step": 13115, "epoch": 312} {"train_loss": -5.015350818634033, "global_step": 13116, "epoch": 312} {"train_loss": -5.115852355957031, "global_step": 13117, "epoch": 312} {"train_loss": -5.022875785827637, "global_step": 13118, "epoch": 312} {"train_loss": -4.934605598449707, "global_step": 13119, "epoch": 312} {"train_loss": -4.9855732917785645, "global_step": 13120, "epoch": 312} {"train_loss": -5.163527011871338, "global_step": 13121, "epoch": 312} {"train_loss": -5.19996452331543, "global_step": 13122, "epoch": 312} {"train_loss": -5.172895431518555, "global_step": 13123, "epoch": 312} {"train_loss": -5.0369486808776855, "global_step": 13124, "epoch": 312} {"train_loss": -5.200175762176514, "global_step": 13125, "epoch": 312} {"train_loss": -5.23415994644165, "global_step": 13126, "epoch": 312} {"train_loss": -5.118294715881348, "global_step": 13127, "epoch": 312} {"train_loss": -5.227148532867432, "global_step": 13128, "epoch": 312} {"train_loss": -5.085733413696289, "global_step": 13129, "epoch": 312} {"train_loss": -5.298084735870361, "global_step": 13130, "epoch": 312} {"train_loss": -5.04101037979126, "global_step": 13131, "epoch": 312} {"train_loss": -5.164865493774414, "global_step": 13132, "epoch": 312} {"train_loss": -5.207846641540527, "global_step": 13133, "epoch": 312} {"train_loss": -5.162188529968262, "global_step": 13134, "epoch": 312} {"train_loss": -5.162644386291504, "global_step": 13135, "epoch": 312} {"train_loss": -5.097178936004639, "global_step": 13136, "epoch": 312} {"train_loss": -5.191264629364014, "global_step": 13137, "epoch": 312} {"train_loss": -5.208681106567383, "global_step": 13138, "epoch": 312} {"train_loss": -5.080719947814941, "global_step": 13139, "epoch": 312} {"train_loss": -5.210811614990234, "global_step": 13140, "epoch": 312} {"train_loss": -5.133890151977539, "global_step": 13141, "epoch": 312} {"train_loss": -5.054669380187988, "global_step": 13142, "epoch": 312} {"train_loss": -5.005161285400391, "global_step": 13143, "epoch": 312} {"train_loss": -5.256224632263184, "global_step": 13144, "epoch": 312} {"train_loss": -5.129488172985258, "global_step": 13145, "epoch": 312, "val_loss": 71408.828125} {"train_loss": -5.035119533538818, "global_step": 13146, "epoch": 313} {"train_loss": -5.187196731567383, "global_step": 13147, "epoch": 313} {"train_loss": -5.115113258361816, "global_step": 13148, "epoch": 313} {"train_loss": -5.091838836669922, "global_step": 13149, "epoch": 313} {"train_loss": -5.131276607513428, "global_step": 13150, "epoch": 313} {"train_loss": -5.220477104187012, "global_step": 13151, "epoch": 313} {"train_loss": -5.0253520011901855, "global_step": 13152, "epoch": 313} {"train_loss": -5.109811782836914, "global_step": 13153, "epoch": 313} {"train_loss": -4.991613388061523, "global_step": 13154, "epoch": 313} {"train_loss": -5.213581562042236, "global_step": 13155, "epoch": 313} {"train_loss": -5.273015022277832, "global_step": 13156, "epoch": 313} {"train_loss": -5.115224838256836, "global_step": 13157, "epoch": 313} {"train_loss": -5.195400238037109, "global_step": 13158, "epoch": 313} {"train_loss": -5.187302589416504, "global_step": 13159, "epoch": 313} {"train_loss": -5.339735984802246, "global_step": 13160, "epoch": 313} {"train_loss": -5.0794677734375, "global_step": 13161, "epoch": 313} {"train_loss": -5.200468063354492, "global_step": 13162, "epoch": 313} {"train_loss": -5.084016799926758, "global_step": 13163, "epoch": 313} {"train_loss": -5.244659900665283, "global_step": 13164, "epoch": 313} {"train_loss": -5.180458068847656, "global_step": 13165, "epoch": 313} {"train_loss": -5.3150224685668945, "global_step": 13166, "epoch": 313} {"train_loss": -5.23322057723999, "global_step": 13167, "epoch": 313} {"train_loss": -5.231278419494629, "global_step": 13168, "epoch": 313} {"train_loss": -5.056711673736572, "global_step": 13169, "epoch": 313} {"train_loss": -5.062557220458984, "global_step": 13170, "epoch": 313} {"train_loss": -4.995833396911621, "global_step": 13171, "epoch": 313} {"train_loss": -5.0628862380981445, "global_step": 13172, "epoch": 313} {"train_loss": -5.2336883544921875, "global_step": 13173, "epoch": 313} {"train_loss": -5.288331985473633, "global_step": 13174, "epoch": 313} {"train_loss": -5.136981010437012, "global_step": 13175, "epoch": 313} {"train_loss": -5.214618682861328, "global_step": 13176, "epoch": 313} {"train_loss": -5.035409450531006, "global_step": 13177, "epoch": 313} {"train_loss": -5.261693954467773, "global_step": 13178, "epoch": 313} {"train_loss": -5.145513534545898, "global_step": 13179, "epoch": 313} {"train_loss": -5.099094390869141, "global_step": 13180, "epoch": 313} {"train_loss": -5.130959510803223, "global_step": 13181, "epoch": 313} {"train_loss": -5.236979961395264, "global_step": 13182, "epoch": 313} {"train_loss": -5.179386615753174, "global_step": 13183, "epoch": 313} {"train_loss": -5.169351577758789, "global_step": 13184, "epoch": 313} {"train_loss": -5.153315544128418, "global_step": 13185, "epoch": 313} {"train_loss": -5.058708190917969, "global_step": 13186, "epoch": 313} {"train_loss": -5.154938731874738, "global_step": 13187, "epoch": 313, "val_loss": 70804.171875} {"train_loss": -5.164568901062012, "global_step": 13188, "epoch": 314} {"train_loss": -5.060517311096191, "global_step": 13189, "epoch": 314} {"train_loss": -5.139636039733887, "global_step": 13190, "epoch": 314} {"train_loss": -5.218256950378418, "global_step": 13191, "epoch": 314} {"train_loss": -5.225475311279297, "global_step": 13192, "epoch": 314} {"train_loss": -5.16165828704834, "global_step": 13193, "epoch": 314} {"train_loss": -5.061153411865234, "global_step": 13194, "epoch": 314} {"train_loss": -5.171912670135498, "global_step": 13195, "epoch": 314} {"train_loss": -5.141305923461914, "global_step": 13196, "epoch": 314} {"train_loss": -5.152369022369385, "global_step": 13197, "epoch": 314} {"train_loss": -5.235945701599121, "global_step": 13198, "epoch": 314} {"train_loss": -5.303055763244629, "global_step": 13199, "epoch": 314} {"train_loss": -5.243464469909668, "global_step": 13200, "epoch": 314} {"train_loss": -5.254388809204102, "global_step": 13201, "epoch": 314} {"train_loss": -5.055577754974365, "global_step": 13202, "epoch": 314} {"train_loss": -5.0154242515563965, "global_step": 13203, "epoch": 314} {"train_loss": -5.147113800048828, "global_step": 13204, "epoch": 314} {"train_loss": -5.280728816986084, "global_step": 13205, "epoch": 314} {"train_loss": -4.973697185516357, "global_step": 13206, "epoch": 314} {"train_loss": -5.037744522094727, "global_step": 13207, "epoch": 314} {"train_loss": -5.094451904296875, "global_step": 13208, "epoch": 314} {"train_loss": -5.095682621002197, "global_step": 13209, "epoch": 314} {"train_loss": -5.102672576904297, "global_step": 13210, "epoch": 314} {"train_loss": -5.125085830688477, "global_step": 13211, "epoch": 314} {"train_loss": -5.140023231506348, "global_step": 13212, "epoch": 314} {"train_loss": -5.132659912109375, "global_step": 13213, "epoch": 314} {"train_loss": -5.275699615478516, "global_step": 13214, "epoch": 314} {"train_loss": -5.281015396118164, "global_step": 13215, "epoch": 314} {"train_loss": -5.192780494689941, "global_step": 13216, "epoch": 314} {"train_loss": -5.125441551208496, "global_step": 13217, "epoch": 314} {"train_loss": -5.263986587524414, "global_step": 13218, "epoch": 314} {"train_loss": -5.200130462646484, "global_step": 13219, "epoch": 314} {"train_loss": -5.232236862182617, "global_step": 13220, "epoch": 314} {"train_loss": -5.136375904083252, "global_step": 13221, "epoch": 314} {"train_loss": -5.20512580871582, "global_step": 13222, "epoch": 314} {"train_loss": -5.194188594818115, "global_step": 13223, "epoch": 314} {"train_loss": -5.134366989135742, "global_step": 13224, "epoch": 314} {"train_loss": -5.193374156951904, "global_step": 13225, "epoch": 314} {"train_loss": -5.087854385375977, "global_step": 13226, "epoch": 314} {"train_loss": -5.209808349609375, "global_step": 13227, "epoch": 314} {"train_loss": -5.172762870788574, "global_step": 13228, "epoch": 314} {"train_loss": -5.157269239425659, "global_step": 13229, "epoch": 314, "val_loss": 70939.984375} {"train_loss": -5.238040924072266, "global_step": 13230, "epoch": 315} {"train_loss": -4.922964096069336, "global_step": 13231, "epoch": 315} {"train_loss": -5.22403621673584, "global_step": 13232, "epoch": 315} {"train_loss": -5.222135543823242, "global_step": 13233, "epoch": 315} {"train_loss": -4.746773719787598, "global_step": 13234, "epoch": 315} {"train_loss": -4.925224304199219, "global_step": 13235, "epoch": 315} {"train_loss": -5.256711959838867, "global_step": 13236, "epoch": 315} {"train_loss": -5.148599147796631, "global_step": 13237, "epoch": 315} {"train_loss": -5.14801549911499, "global_step": 13238, "epoch": 315} {"train_loss": -5.105269908905029, "global_step": 13239, "epoch": 315} {"train_loss": -5.066815376281738, "global_step": 13240, "epoch": 315} {"train_loss": -4.983431816101074, "global_step": 13241, "epoch": 315} {"train_loss": -5.06321907043457, "global_step": 13242, "epoch": 315} {"train_loss": -5.181950569152832, "global_step": 13243, "epoch": 315} {"train_loss": -5.034566879272461, "global_step": 13244, "epoch": 315} {"train_loss": -5.169868469238281, "global_step": 13245, "epoch": 315} {"train_loss": -5.096088409423828, "global_step": 13246, "epoch": 315} {"train_loss": -5.160085201263428, "global_step": 13247, "epoch": 315} {"train_loss": -5.183981418609619, "global_step": 13248, "epoch": 315} {"train_loss": -5.145195007324219, "global_step": 13249, "epoch": 315} {"train_loss": -5.145961284637451, "global_step": 13250, "epoch": 315} {"train_loss": -5.0857930183410645, "global_step": 13251, "epoch": 315} {"train_loss": -5.100987911224365, "global_step": 13252, "epoch": 315} {"train_loss": -5.1457366943359375, "global_step": 13253, "epoch": 315} {"train_loss": -5.176032066345215, "global_step": 13254, "epoch": 315} {"train_loss": -5.066987037658691, "global_step": 13255, "epoch": 315} {"train_loss": -5.212486267089844, "global_step": 13256, "epoch": 315} {"train_loss": -5.277176856994629, "global_step": 13257, "epoch": 315} {"train_loss": -5.189740180969238, "global_step": 13258, "epoch": 315} {"train_loss": -5.184038162231445, "global_step": 13259, "epoch": 315} {"train_loss": -5.184623718261719, "global_step": 13260, "epoch": 315} {"train_loss": -5.071903228759766, "global_step": 13261, "epoch": 315} {"train_loss": -4.928031921386719, "global_step": 13262, "epoch": 315} {"train_loss": -5.070522308349609, "global_step": 13263, "epoch": 315} {"train_loss": -4.886262893676758, "global_step": 13264, "epoch": 315} {"train_loss": -4.947248458862305, "global_step": 13265, "epoch": 315} {"train_loss": -4.963588237762451, "global_step": 13266, "epoch": 315} {"train_loss": -4.923864841461182, "global_step": 13267, "epoch": 315} {"train_loss": -5.0980072021484375, "global_step": 13268, "epoch": 315} {"train_loss": -5.017963409423828, "global_step": 13269, "epoch": 315} {"train_loss": -5.1175432205200195, "global_step": 13270, "epoch": 315} {"train_loss": -5.09231804666065, "global_step": 13271, "epoch": 315, "val_loss": 71302.375} {"train_loss": -5.1290602684021, "global_step": 13272, "epoch": 316} {"train_loss": -5.154277801513672, "global_step": 13273, "epoch": 316} {"train_loss": -5.107607841491699, "global_step": 13274, "epoch": 316} {"train_loss": -5.031623840332031, "global_step": 13275, "epoch": 316} {"train_loss": -5.1221208572387695, "global_step": 13276, "epoch": 316} {"train_loss": -5.084475994110107, "global_step": 13277, "epoch": 316} {"train_loss": -5.135959625244141, "global_step": 13278, "epoch": 316} {"train_loss": -5.141307830810547, "global_step": 13279, "epoch": 316} {"train_loss": -5.114357948303223, "global_step": 13280, "epoch": 316} {"train_loss": -5.154330253601074, "global_step": 13281, "epoch": 316} {"train_loss": -5.136264801025391, "global_step": 13282, "epoch": 316} {"train_loss": -5.0636444091796875, "global_step": 13283, "epoch": 316} {"train_loss": -5.248898029327393, "global_step": 13284, "epoch": 316} {"train_loss": -5.267400741577148, "global_step": 13285, "epoch": 316} {"train_loss": -5.033042907714844, "global_step": 13286, "epoch": 316} {"train_loss": -5.06948184967041, "global_step": 13287, "epoch": 316} {"train_loss": -5.1603827476501465, "global_step": 13288, "epoch": 316} {"train_loss": -5.034261226654053, "global_step": 13289, "epoch": 316} {"train_loss": -5.081120491027832, "global_step": 13290, "epoch": 316} {"train_loss": -5.215279579162598, "global_step": 13291, "epoch": 316} {"train_loss": -4.896152496337891, "global_step": 13292, "epoch": 316} {"train_loss": -5.211183547973633, "global_step": 13293, "epoch": 316} {"train_loss": -5.261362075805664, "global_step": 13294, "epoch": 316} {"train_loss": -5.09212064743042, "global_step": 13295, "epoch": 316} {"train_loss": -5.089759826660156, "global_step": 13296, "epoch": 316} {"train_loss": -5.099793434143066, "global_step": 13297, "epoch": 316} {"train_loss": -5.221810340881348, "global_step": 13298, "epoch": 316} {"train_loss": -5.089326858520508, "global_step": 13299, "epoch": 316} {"train_loss": -5.234442710876465, "global_step": 13300, "epoch": 316} {"train_loss": -5.109775066375732, "global_step": 13301, "epoch": 316} {"train_loss": -5.177918910980225, "global_step": 13302, "epoch": 316} {"train_loss": -5.064455986022949, "global_step": 13303, "epoch": 316} {"train_loss": -5.280682563781738, "global_step": 13304, "epoch": 316} {"train_loss": -5.112856388092041, "global_step": 13305, "epoch": 316} {"train_loss": -5.098687171936035, "global_step": 13306, "epoch": 316} {"train_loss": -5.174063682556152, "global_step": 13307, "epoch": 316} {"train_loss": -5.075863838195801, "global_step": 13308, "epoch": 316} {"train_loss": -5.156520843505859, "global_step": 13309, "epoch": 316} {"train_loss": -5.235664367675781, "global_step": 13310, "epoch": 316} {"train_loss": -5.170891761779785, "global_step": 13311, "epoch": 316} {"train_loss": -5.175797939300537, "global_step": 13312, "epoch": 316} {"train_loss": -5.137523900894892, "global_step": 13313, "epoch": 316, "val_loss": 70661.3046875} {"train_loss": -5.037199974060059, "global_step": 13314, "epoch": 317} {"train_loss": -5.113105773925781, "global_step": 13315, "epoch": 317} {"train_loss": -5.121167182922363, "global_step": 13316, "epoch": 317} {"train_loss": -5.228001594543457, "global_step": 13317, "epoch": 317} {"train_loss": -5.1773881912231445, "global_step": 13318, "epoch": 317} {"train_loss": -5.076725959777832, "global_step": 13319, "epoch": 317} {"train_loss": -5.35422420501709, "global_step": 13320, "epoch": 317} {"train_loss": -5.13754940032959, "global_step": 13321, "epoch": 317} {"train_loss": -5.188682556152344, "global_step": 13322, "epoch": 317} {"train_loss": -5.168004035949707, "global_step": 13323, "epoch": 317} {"train_loss": -5.121822357177734, "global_step": 13324, "epoch": 317} {"train_loss": -5.11690092086792, "global_step": 13325, "epoch": 317} {"train_loss": -5.2046051025390625, "global_step": 13326, "epoch": 317} {"train_loss": -5.239994049072266, "global_step": 13327, "epoch": 317} {"train_loss": -5.138002872467041, "global_step": 13328, "epoch": 317} {"train_loss": -5.256740570068359, "global_step": 13329, "epoch": 317} {"train_loss": -5.139007568359375, "global_step": 13330, "epoch": 317} {"train_loss": -5.166295051574707, "global_step": 13331, "epoch": 317} {"train_loss": -5.249090194702148, "global_step": 13332, "epoch": 317} {"train_loss": -5.079663276672363, "global_step": 13333, "epoch": 317} {"train_loss": -5.142115592956543, "global_step": 13334, "epoch": 317} {"train_loss": -5.176421165466309, "global_step": 13335, "epoch": 317} {"train_loss": -5.244553089141846, "global_step": 13336, "epoch": 317} {"train_loss": -5.099830627441406, "global_step": 13337, "epoch": 317} {"train_loss": -5.066446304321289, "global_step": 13338, "epoch": 317} {"train_loss": -5.2499823570251465, "global_step": 13339, "epoch": 317} {"train_loss": -5.252597332000732, "global_step": 13340, "epoch": 317} {"train_loss": -5.285695552825928, "global_step": 13341, "epoch": 317} {"train_loss": -5.065394401550293, "global_step": 13342, "epoch": 317} {"train_loss": -5.128029823303223, "global_step": 13343, "epoch": 317} {"train_loss": -5.21041202545166, "global_step": 13344, "epoch": 317} {"train_loss": -5.112486839294434, "global_step": 13345, "epoch": 317} {"train_loss": -5.185938835144043, "global_step": 13346, "epoch": 317} {"train_loss": -5.02232551574707, "global_step": 13347, "epoch": 317} {"train_loss": -5.0538530349731445, "global_step": 13348, "epoch": 317} {"train_loss": -5.184625625610352, "global_step": 13349, "epoch": 317} {"train_loss": -5.036319732666016, "global_step": 13350, "epoch": 317} {"train_loss": -5.0268964767456055, "global_step": 13351, "epoch": 317} {"train_loss": -4.894280433654785, "global_step": 13352, "epoch": 317} {"train_loss": -5.023909568786621, "global_step": 13353, "epoch": 317} {"train_loss": -5.249153137207031, "global_step": 13354, "epoch": 317} {"train_loss": -5.145849477677118, "global_step": 13355, "epoch": 317, "val_loss": 70999.671875} {"train_loss": -5.028280258178711, "global_step": 13356, "epoch": 318} {"train_loss": -5.068436622619629, "global_step": 13357, "epoch": 318} {"train_loss": -4.992213726043701, "global_step": 13358, "epoch": 318} {"train_loss": -4.98165225982666, "global_step": 13359, "epoch": 318} {"train_loss": -5.057135581970215, "global_step": 13360, "epoch": 318} {"train_loss": -5.082891464233398, "global_step": 13361, "epoch": 318} {"train_loss": -5.110706329345703, "global_step": 13362, "epoch": 318} {"train_loss": -5.126825332641602, "global_step": 13363, "epoch": 318} {"train_loss": -5.036501884460449, "global_step": 13364, "epoch": 318} {"train_loss": -4.880103588104248, "global_step": 13365, "epoch": 318} {"train_loss": -5.145319938659668, "global_step": 13366, "epoch": 318} {"train_loss": -5.067415714263916, "global_step": 13367, "epoch": 318} {"train_loss": -5.143034934997559, "global_step": 13368, "epoch": 318} {"train_loss": -5.130633354187012, "global_step": 13369, "epoch": 318} {"train_loss": -5.02199649810791, "global_step": 13370, "epoch": 318} {"train_loss": -5.084039688110352, "global_step": 13371, "epoch": 318} {"train_loss": -5.141086101531982, "global_step": 13372, "epoch": 318} {"train_loss": -4.877726078033447, "global_step": 13373, "epoch": 318} {"train_loss": -5.128442764282227, "global_step": 13374, "epoch": 318} {"train_loss": -5.069644927978516, "global_step": 13375, "epoch": 318} {"train_loss": -5.020914077758789, "global_step": 13376, "epoch": 318} {"train_loss": -5.189810752868652, "global_step": 13377, "epoch": 318} {"train_loss": -5.077276229858398, "global_step": 13378, "epoch": 318} {"train_loss": -5.076420307159424, "global_step": 13379, "epoch": 318} {"train_loss": -5.072607040405273, "global_step": 13380, "epoch": 318} {"train_loss": -5.006805419921875, "global_step": 13381, "epoch": 318} {"train_loss": -5.212627410888672, "global_step": 13382, "epoch": 318} {"train_loss": -5.17852783203125, "global_step": 13383, "epoch": 318} {"train_loss": -5.215057849884033, "global_step": 13384, "epoch": 318} {"train_loss": -5.190896034240723, "global_step": 13385, "epoch": 318} {"train_loss": -4.9827704429626465, "global_step": 13386, "epoch": 318} {"train_loss": -5.2058868408203125, "global_step": 13387, "epoch": 318} {"train_loss": -5.232576370239258, "global_step": 13388, "epoch": 318} {"train_loss": -4.9750823974609375, "global_step": 13389, "epoch": 318} {"train_loss": -5.1625494956970215, "global_step": 13390, "epoch": 318} {"train_loss": -5.2415452003479, "global_step": 13391, "epoch": 318} {"train_loss": -5.192068099975586, "global_step": 13392, "epoch": 318} {"train_loss": -5.046179294586182, "global_step": 13393, "epoch": 318} {"train_loss": -5.155825614929199, "global_step": 13394, "epoch": 318} {"train_loss": -5.172457695007324, "global_step": 13395, "epoch": 318} {"train_loss": -5.168992042541504, "global_step": 13396, "epoch": 318} {"train_loss": -5.098833379291353, "global_step": 13397, "epoch": 318, "val_loss": 71060.0703125} {"train_loss": -4.990583419799805, "global_step": 13398, "epoch": 319} {"train_loss": -5.090820789337158, "global_step": 13399, "epoch": 319} {"train_loss": -5.147637367248535, "global_step": 13400, "epoch": 319} {"train_loss": -5.176002025604248, "global_step": 13401, "epoch": 319} {"train_loss": -5.124110221862793, "global_step": 13402, "epoch": 319} {"train_loss": -5.220921993255615, "global_step": 13403, "epoch": 319} {"train_loss": -5.130995750427246, "global_step": 13404, "epoch": 319} {"train_loss": -5.217730522155762, "global_step": 13405, "epoch": 319} {"train_loss": -5.049654006958008, "global_step": 13406, "epoch": 319} {"train_loss": -4.976090431213379, "global_step": 13407, "epoch": 319} {"train_loss": -5.070455551147461, "global_step": 13408, "epoch": 319} {"train_loss": -5.278504371643066, "global_step": 13409, "epoch": 319} {"train_loss": -5.1740922927856445, "global_step": 13410, "epoch": 319} {"train_loss": -5.148001194000244, "global_step": 13411, "epoch": 319} {"train_loss": -5.018796920776367, "global_step": 13412, "epoch": 319} {"train_loss": -5.2322678565979, "global_step": 13413, "epoch": 319} {"train_loss": -5.172986030578613, "global_step": 13414, "epoch": 319} {"train_loss": -5.203367710113525, "global_step": 13415, "epoch": 319} {"train_loss": -5.030355453491211, "global_step": 13416, "epoch": 319} {"train_loss": -5.107226371765137, "global_step": 13417, "epoch": 319} {"train_loss": -5.279233932495117, "global_step": 13418, "epoch": 319} {"train_loss": -5.180608749389648, "global_step": 13419, "epoch": 319} {"train_loss": -4.974327564239502, "global_step": 13420, "epoch": 319} {"train_loss": -5.216412544250488, "global_step": 13421, "epoch": 319} {"train_loss": -4.994546890258789, "global_step": 13422, "epoch": 319} {"train_loss": -5.0158538818359375, "global_step": 13423, "epoch": 319} {"train_loss": -5.156348705291748, "global_step": 13424, "epoch": 319} {"train_loss": -5.056118011474609, "global_step": 13425, "epoch": 319} {"train_loss": -5.115601539611816, "global_step": 13426, "epoch": 319} {"train_loss": -5.0094194412231445, "global_step": 13427, "epoch": 319} {"train_loss": -5.237821578979492, "global_step": 13428, "epoch": 319} {"train_loss": -5.031133651733398, "global_step": 13429, "epoch": 319} {"train_loss": -5.165685176849365, "global_step": 13430, "epoch": 319} {"train_loss": -5.123621940612793, "global_step": 13431, "epoch": 319} {"train_loss": -5.222019195556641, "global_step": 13432, "epoch": 319} {"train_loss": -5.181615352630615, "global_step": 13433, "epoch": 319} {"train_loss": -5.092998504638672, "global_step": 13434, "epoch": 319} {"train_loss": -5.121918678283691, "global_step": 13435, "epoch": 319} {"train_loss": -5.055012226104736, "global_step": 13436, "epoch": 319} {"train_loss": -5.220432281494141, "global_step": 13437, "epoch": 319} {"train_loss": -5.116260528564453, "global_step": 13438, "epoch": 319} {"train_loss": -5.12692437853132, "global_step": 13439, "epoch": 319, "val_loss": 70674.7421875} {"train_loss": -5.009176254272461, "global_step": 13440, "epoch": 320} {"train_loss": -5.170833587646484, "global_step": 13441, "epoch": 320} {"train_loss": -5.188340663909912, "global_step": 13442, "epoch": 320} {"train_loss": -5.077209949493408, "global_step": 13443, "epoch": 320} {"train_loss": -5.1567912101745605, "global_step": 13444, "epoch": 320} {"train_loss": -5.1971940994262695, "global_step": 13445, "epoch": 320} {"train_loss": -5.167575359344482, "global_step": 13446, "epoch": 320} {"train_loss": -4.999383449554443, "global_step": 13447, "epoch": 320} {"train_loss": -5.386500358581543, "global_step": 13448, "epoch": 320} {"train_loss": -5.128317832946777, "global_step": 13449, "epoch": 320} {"train_loss": -5.191766262054443, "global_step": 13450, "epoch": 320} {"train_loss": -5.116162300109863, "global_step": 13451, "epoch": 320} {"train_loss": -5.259773254394531, "global_step": 13452, "epoch": 320} {"train_loss": -5.201043128967285, "global_step": 13453, "epoch": 320} {"train_loss": -5.1462249755859375, "global_step": 13454, "epoch": 320} {"train_loss": -5.058980464935303, "global_step": 13455, "epoch": 320} {"train_loss": -5.060497283935547, "global_step": 13456, "epoch": 320} {"train_loss": -5.027112007141113, "global_step": 13457, "epoch": 320} {"train_loss": -5.1923980712890625, "global_step": 13458, "epoch": 320} {"train_loss": -5.172562122344971, "global_step": 13459, "epoch": 320} {"train_loss": -5.212711334228516, "global_step": 13460, "epoch": 320} {"train_loss": -4.8845038414001465, "global_step": 13461, "epoch": 320} {"train_loss": -5.129800319671631, "global_step": 13462, "epoch": 320} {"train_loss": -5.228823661804199, "global_step": 13463, "epoch": 320} {"train_loss": -4.8746538162231445, "global_step": 13464, "epoch": 320} {"train_loss": -5.14280891418457, "global_step": 13465, "epoch": 320} {"train_loss": -5.170488357543945, "global_step": 13466, "epoch": 320} {"train_loss": -5.100456237792969, "global_step": 13467, "epoch": 320} {"train_loss": -5.089475631713867, "global_step": 13468, "epoch": 320} {"train_loss": -5.093038558959961, "global_step": 13469, "epoch": 320} {"train_loss": -5.187293529510498, "global_step": 13470, "epoch": 320} {"train_loss": -5.137413024902344, "global_step": 13471, "epoch": 320} {"train_loss": -5.057530879974365, "global_step": 13472, "epoch": 320} {"train_loss": -5.229937553405762, "global_step": 13473, "epoch": 320} {"train_loss": -4.994610786437988, "global_step": 13474, "epoch": 320} {"train_loss": -5.066644668579102, "global_step": 13475, "epoch": 320} {"train_loss": -5.12698221206665, "global_step": 13476, "epoch": 320} {"train_loss": -5.180693626403809, "global_step": 13477, "epoch": 320} {"train_loss": -5.125382423400879, "global_step": 13478, "epoch": 320} {"train_loss": -5.152379989624023, "global_step": 13479, "epoch": 320} {"train_loss": -5.0727858543396, "global_step": 13480, "epoch": 320} {"train_loss": -5.124931176503499, "global_step": 13481, "epoch": 320, "val_loss": 70456.734375} {"train_loss": -5.2001566886901855, "global_step": 13482, "epoch": 321} {"train_loss": -5.115026473999023, "global_step": 13483, "epoch": 321} {"train_loss": -5.099837303161621, "global_step": 13484, "epoch": 321} {"train_loss": -5.069591522216797, "global_step": 13485, "epoch": 321} {"train_loss": -5.146052360534668, "global_step": 13486, "epoch": 321} {"train_loss": -5.182823181152344, "global_step": 13487, "epoch": 321} {"train_loss": -5.110994815826416, "global_step": 13488, "epoch": 321} {"train_loss": -5.2340264320373535, "global_step": 13489, "epoch": 321} {"train_loss": -5.145008087158203, "global_step": 13490, "epoch": 321} {"train_loss": -5.081287860870361, "global_step": 13491, "epoch": 321} {"train_loss": -5.074984550476074, "global_step": 13492, "epoch": 321} {"train_loss": -5.083500862121582, "global_step": 13493, "epoch": 321} {"train_loss": -5.1007304191589355, "global_step": 13494, "epoch": 321} {"train_loss": -5.127682209014893, "global_step": 13495, "epoch": 321} {"train_loss": -5.173158645629883, "global_step": 13496, "epoch": 321} {"train_loss": -4.947545051574707, "global_step": 13497, "epoch": 321} {"train_loss": -5.16121244430542, "global_step": 13498, "epoch": 321} {"train_loss": -5.130781173706055, "global_step": 13499, "epoch": 321} {"train_loss": -5.024096488952637, "global_step": 13500, "epoch": 321} {"train_loss": -4.957828998565674, "global_step": 13501, "epoch": 321} {"train_loss": -5.05668830871582, "global_step": 13502, "epoch": 321} {"train_loss": -5.18813419342041, "global_step": 13503, "epoch": 321} {"train_loss": -5.059283256530762, "global_step": 13504, "epoch": 321} {"train_loss": -5.145899772644043, "global_step": 13505, "epoch": 321} {"train_loss": -5.070947170257568, "global_step": 13506, "epoch": 321} {"train_loss": -5.147210597991943, "global_step": 13507, "epoch": 321} {"train_loss": -5.334857940673828, "global_step": 13508, "epoch": 321} {"train_loss": -5.223306179046631, "global_step": 13509, "epoch": 321} {"train_loss": -5.057657241821289, "global_step": 13510, "epoch": 321} {"train_loss": -5.151458740234375, "global_step": 13511, "epoch": 321} {"train_loss": -5.115379333496094, "global_step": 13512, "epoch": 321} {"train_loss": -5.08416748046875, "global_step": 13513, "epoch": 321} {"train_loss": -5.151689529418945, "global_step": 13514, "epoch": 321} {"train_loss": -5.130764484405518, "global_step": 13515, "epoch": 321} {"train_loss": -5.174727439880371, "global_step": 13516, "epoch": 321} {"train_loss": -5.258176803588867, "global_step": 13517, "epoch": 321} {"train_loss": -5.238971710205078, "global_step": 13518, "epoch": 321} {"train_loss": -5.1388349533081055, "global_step": 13519, "epoch": 321} {"train_loss": -5.300400257110596, "global_step": 13520, "epoch": 321} {"train_loss": -5.122746467590332, "global_step": 13521, "epoch": 321} {"train_loss": -5.120272636413574, "global_step": 13522, "epoch": 321} {"train_loss": -5.133466186977568, "global_step": 13523, "epoch": 321, "val_loss": 70322.8984375} {"train_loss": -5.116719722747803, "global_step": 13524, "epoch": 322} {"train_loss": -5.115671157836914, "global_step": 13525, "epoch": 322} {"train_loss": -4.992145538330078, "global_step": 13526, "epoch": 322} {"train_loss": -5.231365203857422, "global_step": 13527, "epoch": 322} {"train_loss": -5.224462509155273, "global_step": 13528, "epoch": 322} {"train_loss": -5.168384552001953, "global_step": 13529, "epoch": 322} {"train_loss": -5.198945999145508, "global_step": 13530, "epoch": 322} {"train_loss": -5.1371684074401855, "global_step": 13531, "epoch": 322} {"train_loss": -5.215920448303223, "global_step": 13532, "epoch": 322} {"train_loss": -5.096671104431152, "global_step": 13533, "epoch": 322} {"train_loss": -5.182559967041016, "global_step": 13534, "epoch": 322} {"train_loss": -5.187797546386719, "global_step": 13535, "epoch": 322} {"train_loss": -5.174777507781982, "global_step": 13536, "epoch": 322} {"train_loss": -5.166744709014893, "global_step": 13537, "epoch": 322} {"train_loss": -5.112100601196289, "global_step": 13538, "epoch": 322} {"train_loss": -5.197517395019531, "global_step": 13539, "epoch": 322} {"train_loss": -5.330256938934326, "global_step": 13540, "epoch": 322} {"train_loss": -5.316888809204102, "global_step": 13541, "epoch": 322} {"train_loss": -5.048285961151123, "global_step": 13542, "epoch": 322} {"train_loss": -5.175240516662598, "global_step": 13543, "epoch": 322} {"train_loss": -5.182931423187256, "global_step": 13544, "epoch": 322} {"train_loss": -5.144838333129883, "global_step": 13545, "epoch": 322} {"train_loss": -5.189121723175049, "global_step": 13546, "epoch": 322} {"train_loss": -5.060091495513916, "global_step": 13547, "epoch": 322} {"train_loss": -5.24440336227417, "global_step": 13548, "epoch": 322} {"train_loss": -5.178350448608398, "global_step": 13549, "epoch": 322} {"train_loss": -5.065887928009033, "global_step": 13550, "epoch": 322} {"train_loss": -5.185776233673096, "global_step": 13551, "epoch": 322} {"train_loss": -5.148638725280762, "global_step": 13552, "epoch": 322} {"train_loss": -5.033932685852051, "global_step": 13553, "epoch": 322} {"train_loss": -5.082457065582275, "global_step": 13554, "epoch": 322} {"train_loss": -5.171431541442871, "global_step": 13555, "epoch": 322} {"train_loss": -5.169802665710449, "global_step": 13556, "epoch": 322} {"train_loss": -5.053291320800781, "global_step": 13557, "epoch": 322} {"train_loss": -4.892148017883301, "global_step": 13558, "epoch": 322} {"train_loss": -5.231505393981934, "global_step": 13559, "epoch": 322} {"train_loss": -5.119117736816406, "global_step": 13560, "epoch": 322} {"train_loss": -4.967463970184326, "global_step": 13561, "epoch": 322} {"train_loss": -5.061150550842285, "global_step": 13562, "epoch": 322} {"train_loss": -5.21073579788208, "global_step": 13563, "epoch": 322} {"train_loss": -5.166162490844727, "global_step": 13564, "epoch": 322} {"train_loss": -5.145602033251808, "global_step": 13565, "epoch": 322, "val_loss": 70877.6640625} {"train_loss": -5.0897674560546875, "global_step": 13566, "epoch": 323} {"train_loss": -5.245800971984863, "global_step": 13567, "epoch": 323} {"train_loss": -5.199066638946533, "global_step": 13568, "epoch": 323} {"train_loss": -5.032188415527344, "global_step": 13569, "epoch": 323} {"train_loss": -5.139690399169922, "global_step": 13570, "epoch": 323} {"train_loss": -5.095376491546631, "global_step": 13571, "epoch": 323} {"train_loss": -5.25754976272583, "global_step": 13572, "epoch": 323} {"train_loss": -5.179764270782471, "global_step": 13573, "epoch": 323} {"train_loss": -4.981749534606934, "global_step": 13574, "epoch": 323} {"train_loss": -5.221587181091309, "global_step": 13575, "epoch": 323} {"train_loss": -5.020954132080078, "global_step": 13576, "epoch": 323} {"train_loss": -5.216976165771484, "global_step": 13577, "epoch": 323} {"train_loss": -5.035950660705566, "global_step": 13578, "epoch": 323} {"train_loss": -5.229136943817139, "global_step": 13579, "epoch": 323} {"train_loss": -5.063774108886719, "global_step": 13580, "epoch": 323} {"train_loss": -5.022278308868408, "global_step": 13581, "epoch": 323} {"train_loss": -5.219425201416016, "global_step": 13582, "epoch": 323} {"train_loss": -5.160341262817383, "global_step": 13583, "epoch": 323} {"train_loss": -5.053022861480713, "global_step": 13584, "epoch": 323} {"train_loss": -5.077085018157959, "global_step": 13585, "epoch": 323} {"train_loss": -5.162947177886963, "global_step": 13586, "epoch": 323} {"train_loss": -5.03558349609375, "global_step": 13587, "epoch": 323} {"train_loss": -5.127955436706543, "global_step": 13588, "epoch": 323} {"train_loss": -5.071454048156738, "global_step": 13589, "epoch": 323} {"train_loss": -5.083424091339111, "global_step": 13590, "epoch": 323} {"train_loss": -5.119937896728516, "global_step": 13591, "epoch": 323} {"train_loss": -4.977947235107422, "global_step": 13592, "epoch": 323} {"train_loss": -5.120216369628906, "global_step": 13593, "epoch": 323} {"train_loss": -5.109590530395508, "global_step": 13594, "epoch": 323} {"train_loss": -5.187614917755127, "global_step": 13595, "epoch": 323} {"train_loss": -5.152309417724609, "global_step": 13596, "epoch": 323} {"train_loss": -5.167448997497559, "global_step": 13597, "epoch": 323} {"train_loss": -5.136626243591309, "global_step": 13598, "epoch": 323} {"train_loss": -5.2186665534973145, "global_step": 13599, "epoch": 323} {"train_loss": -5.097210884094238, "global_step": 13600, "epoch": 323} {"train_loss": -5.208643913269043, "global_step": 13601, "epoch": 323} {"train_loss": -5.149084091186523, "global_step": 13602, "epoch": 323} {"train_loss": -5.140900611877441, "global_step": 13603, "epoch": 323} {"train_loss": -5.319867134094238, "global_step": 13604, "epoch": 323} {"train_loss": -5.0009355545043945, "global_step": 13605, "epoch": 323} {"train_loss": -5.228306293487549, "global_step": 13606, "epoch": 323} {"train_loss": -5.129285017649333, "global_step": 13607, "epoch": 323, "val_loss": 70274.9609375} {"train_loss": -5.132625579833984, "global_step": 13608, "epoch": 324} {"train_loss": -5.1934494972229, "global_step": 13609, "epoch": 324} {"train_loss": -5.248895168304443, "global_step": 13610, "epoch": 324} {"train_loss": -5.136578559875488, "global_step": 13611, "epoch": 324} {"train_loss": -5.114534378051758, "global_step": 13612, "epoch": 324} {"train_loss": -5.23982048034668, "global_step": 13613, "epoch": 324} {"train_loss": -5.1471967697143555, "global_step": 13614, "epoch": 324} {"train_loss": -5.162560939788818, "global_step": 13615, "epoch": 324} {"train_loss": -5.289419174194336, "global_step": 13616, "epoch": 324} {"train_loss": -5.147820472717285, "global_step": 13617, "epoch": 324} {"train_loss": -5.096896171569824, "global_step": 13618, "epoch": 324} {"train_loss": -5.249351501464844, "global_step": 13619, "epoch": 324} {"train_loss": -5.3212480545043945, "global_step": 13620, "epoch": 324} {"train_loss": -5.0935959815979, "global_step": 13621, "epoch": 324} {"train_loss": -5.087440490722656, "global_step": 13622, "epoch": 324} {"train_loss": -5.129640579223633, "global_step": 13623, "epoch": 324} {"train_loss": -5.297760963439941, "global_step": 13624, "epoch": 324} {"train_loss": -5.002942085266113, "global_step": 13625, "epoch": 324} {"train_loss": -5.141498565673828, "global_step": 13626, "epoch": 324} {"train_loss": -5.087340354919434, "global_step": 13627, "epoch": 324} {"train_loss": -5.160331726074219, "global_step": 13628, "epoch": 324} {"train_loss": -5.138969421386719, "global_step": 13629, "epoch": 324} {"train_loss": -5.168363571166992, "global_step": 13630, "epoch": 324} {"train_loss": -4.990453243255615, "global_step": 13631, "epoch": 324} {"train_loss": -5.241501808166504, "global_step": 13632, "epoch": 324} {"train_loss": -5.143054962158203, "global_step": 13633, "epoch": 324} {"train_loss": -5.105649471282959, "global_step": 13634, "epoch": 324} {"train_loss": -5.127923011779785, "global_step": 13635, "epoch": 324} {"train_loss": -5.195260047912598, "global_step": 13636, "epoch": 324} {"train_loss": -5.169435977935791, "global_step": 13637, "epoch": 324} {"train_loss": -5.17832088470459, "global_step": 13638, "epoch": 324} {"train_loss": -4.9854736328125, "global_step": 13639, "epoch": 324} {"train_loss": -5.251428604125977, "global_step": 13640, "epoch": 324} {"train_loss": -5.217800140380859, "global_step": 13641, "epoch": 324} {"train_loss": -5.294220924377441, "global_step": 13642, "epoch": 324} {"train_loss": -5.1326189041137695, "global_step": 13643, "epoch": 324} {"train_loss": -5.0723114013671875, "global_step": 13644, "epoch": 324} {"train_loss": -5.243677139282227, "global_step": 13645, "epoch": 324} {"train_loss": -5.081906795501709, "global_step": 13646, "epoch": 324} {"train_loss": -5.109002590179443, "global_step": 13647, "epoch": 324} {"train_loss": -5.09246301651001, "global_step": 13648, "epoch": 324} {"train_loss": -5.155487083253407, "global_step": 13649, "epoch": 324, "val_loss": 70719.3671875} {"train_loss": -5.197513580322266, "global_step": 13650, "epoch": 325} {"train_loss": -5.025806903839111, "global_step": 13651, "epoch": 325} {"train_loss": -5.184922218322754, "global_step": 13652, "epoch": 325} {"train_loss": -5.118648529052734, "global_step": 13653, "epoch": 325} {"train_loss": -5.174474716186523, "global_step": 13654, "epoch": 325} {"train_loss": -5.000449180603027, "global_step": 13655, "epoch": 325} {"train_loss": -5.255039215087891, "global_step": 13656, "epoch": 325} {"train_loss": -5.075453758239746, "global_step": 13657, "epoch": 325} {"train_loss": -5.007734775543213, "global_step": 13658, "epoch": 325} {"train_loss": -5.122322082519531, "global_step": 13659, "epoch": 325} {"train_loss": -5.191728591918945, "global_step": 13660, "epoch": 325} {"train_loss": -5.047482490539551, "global_step": 13661, "epoch": 325} {"train_loss": -5.169689178466797, "global_step": 13662, "epoch": 325} {"train_loss": -5.089000701904297, "global_step": 13663, "epoch": 325} {"train_loss": -5.353532314300537, "global_step": 13664, "epoch": 325} {"train_loss": -5.2218403816223145, "global_step": 13665, "epoch": 325} {"train_loss": -5.056967735290527, "global_step": 13666, "epoch": 325} {"train_loss": -5.010585308074951, "global_step": 13667, "epoch": 325} {"train_loss": -5.185807228088379, "global_step": 13668, "epoch": 325} {"train_loss": -5.034917831420898, "global_step": 13669, "epoch": 325} {"train_loss": -5.096643447875977, "global_step": 13670, "epoch": 325} {"train_loss": -5.008182048797607, "global_step": 13671, "epoch": 325} {"train_loss": -5.051257610321045, "global_step": 13672, "epoch": 325} {"train_loss": -5.157711982727051, "global_step": 13673, "epoch": 325} {"train_loss": -5.0661821365356445, "global_step": 13674, "epoch": 325} {"train_loss": -5.193470001220703, "global_step": 13675, "epoch": 325} {"train_loss": -5.167170524597168, "global_step": 13676, "epoch": 325} {"train_loss": -5.276321887969971, "global_step": 13677, "epoch": 325} {"train_loss": -5.077133655548096, "global_step": 13678, "epoch": 325} {"train_loss": -5.240008354187012, "global_step": 13679, "epoch": 325} {"train_loss": -5.094141960144043, "global_step": 13680, "epoch": 325} {"train_loss": -5.19086217880249, "global_step": 13681, "epoch": 325} {"train_loss": -5.169649124145508, "global_step": 13682, "epoch": 325} {"train_loss": -5.162230968475342, "global_step": 13683, "epoch": 325} {"train_loss": -5.16734504699707, "global_step": 13684, "epoch": 325} {"train_loss": -5.259387016296387, "global_step": 13685, "epoch": 325} {"train_loss": -5.075207233428955, "global_step": 13686, "epoch": 325} {"train_loss": -5.015635967254639, "global_step": 13687, "epoch": 325} {"train_loss": -5.173765659332275, "global_step": 13688, "epoch": 325} {"train_loss": -4.998804092407227, "global_step": 13689, "epoch": 325} {"train_loss": -5.157958030700684, "global_step": 13690, "epoch": 325} {"train_loss": -5.130878346306937, "global_step": 13691, "epoch": 325, "val_loss": 70857.1875} {"train_loss": -5.102437496185303, "global_step": 13692, "epoch": 326} {"train_loss": -5.172189235687256, "global_step": 13693, "epoch": 326} {"train_loss": -5.073668956756592, "global_step": 13694, "epoch": 326} {"train_loss": -5.023597717285156, "global_step": 13695, "epoch": 326} {"train_loss": -5.001605033874512, "global_step": 13696, "epoch": 326} {"train_loss": -5.275737285614014, "global_step": 13697, "epoch": 326} {"train_loss": -5.099057674407959, "global_step": 13698, "epoch": 326} {"train_loss": -5.061570167541504, "global_step": 13699, "epoch": 326} {"train_loss": -4.993129730224609, "global_step": 13700, "epoch": 326} {"train_loss": -5.292412757873535, "global_step": 13701, "epoch": 326} {"train_loss": -4.96956729888916, "global_step": 13702, "epoch": 326} {"train_loss": -5.030128479003906, "global_step": 13703, "epoch": 326} {"train_loss": -5.116001129150391, "global_step": 13704, "epoch": 326} {"train_loss": -5.251885414123535, "global_step": 13705, "epoch": 326} {"train_loss": -5.146297454833984, "global_step": 13706, "epoch": 326} {"train_loss": -5.177902698516846, "global_step": 13707, "epoch": 326} {"train_loss": -5.212862491607666, "global_step": 13708, "epoch": 326} {"train_loss": -5.065201759338379, "global_step": 13709, "epoch": 326} {"train_loss": -5.143824100494385, "global_step": 13710, "epoch": 326} {"train_loss": -5.210304260253906, "global_step": 13711, "epoch": 326} {"train_loss": -5.103281021118164, "global_step": 13712, "epoch": 326} {"train_loss": -5.1827239990234375, "global_step": 13713, "epoch": 326} {"train_loss": -5.1529083251953125, "global_step": 13714, "epoch": 326} {"train_loss": -5.094366550445557, "global_step": 13715, "epoch": 326} {"train_loss": -5.123286247253418, "global_step": 13716, "epoch": 326} {"train_loss": -5.101006984710693, "global_step": 13717, "epoch": 326} {"train_loss": -5.197222709655762, "global_step": 13718, "epoch": 326} {"train_loss": -5.113164901733398, "global_step": 13719, "epoch": 326} {"train_loss": -5.083341598510742, "global_step": 13720, "epoch": 326} {"train_loss": -5.157275199890137, "global_step": 13721, "epoch": 326} {"train_loss": -5.141844749450684, "global_step": 13722, "epoch": 326} {"train_loss": -5.05935001373291, "global_step": 13723, "epoch": 326} {"train_loss": -5.144095420837402, "global_step": 13724, "epoch": 326} {"train_loss": -5.210620403289795, "global_step": 13725, "epoch": 326} {"train_loss": -5.108794212341309, "global_step": 13726, "epoch": 326} {"train_loss": -5.127354621887207, "global_step": 13727, "epoch": 326} {"train_loss": -5.105393886566162, "global_step": 13728, "epoch": 326} {"train_loss": -5.065117835998535, "global_step": 13729, "epoch": 326} {"train_loss": -5.0283660888671875, "global_step": 13730, "epoch": 326} {"train_loss": -5.1637725830078125, "global_step": 13731, "epoch": 326} {"train_loss": -5.256572246551514, "global_step": 13732, "epoch": 326} {"train_loss": -5.127554223650978, "global_step": 13733, "epoch": 326, "val_loss": 70098.5546875} {"train_loss": -5.173105239868164, "global_step": 13734, "epoch": 327} {"train_loss": -5.173646926879883, "global_step": 13735, "epoch": 327} {"train_loss": -5.0594048500061035, "global_step": 13736, "epoch": 327} {"train_loss": -5.2972412109375, "global_step": 13737, "epoch": 327} {"train_loss": -5.176079750061035, "global_step": 13738, "epoch": 327} {"train_loss": -5.27318000793457, "global_step": 13739, "epoch": 327} {"train_loss": -5.216915130615234, "global_step": 13740, "epoch": 327} {"train_loss": -5.153790473937988, "global_step": 13741, "epoch": 327} {"train_loss": -5.059462547302246, "global_step": 13742, "epoch": 327} {"train_loss": -5.142327308654785, "global_step": 13743, "epoch": 327} {"train_loss": -5.036072731018066, "global_step": 13744, "epoch": 327} {"train_loss": -5.112782955169678, "global_step": 13745, "epoch": 327} {"train_loss": -5.24517822265625, "global_step": 13746, "epoch": 327} {"train_loss": -5.21621561050415, "global_step": 13747, "epoch": 327} {"train_loss": -5.00484037399292, "global_step": 13748, "epoch": 327} {"train_loss": -5.198484420776367, "global_step": 13749, "epoch": 327} {"train_loss": -5.386919021606445, "global_step": 13750, "epoch": 327} {"train_loss": -5.125915050506592, "global_step": 13751, "epoch": 327} {"train_loss": -5.162151336669922, "global_step": 13752, "epoch": 327} {"train_loss": -5.225592613220215, "global_step": 13753, "epoch": 327} {"train_loss": -5.122528076171875, "global_step": 13754, "epoch": 327} {"train_loss": -4.96354341506958, "global_step": 13755, "epoch": 327} {"train_loss": -5.129837989807129, "global_step": 13756, "epoch": 327} {"train_loss": -5.005025863647461, "global_step": 13757, "epoch": 327} {"train_loss": -5.094942092895508, "global_step": 13758, "epoch": 327} {"train_loss": -5.183388710021973, "global_step": 13759, "epoch": 327} {"train_loss": -4.948070526123047, "global_step": 13760, "epoch": 327} {"train_loss": -4.906660079956055, "global_step": 13761, "epoch": 327} {"train_loss": -5.186842441558838, "global_step": 13762, "epoch": 327} {"train_loss": -4.757206916809082, "global_step": 13763, "epoch": 327} {"train_loss": -5.056005001068115, "global_step": 13764, "epoch": 327} {"train_loss": -4.884765625, "global_step": 13765, "epoch": 327} {"train_loss": -5.058326721191406, "global_step": 13766, "epoch": 327} {"train_loss": -4.90629243850708, "global_step": 13767, "epoch": 327} {"train_loss": -5.122991561889648, "global_step": 13768, "epoch": 327} {"train_loss": -5.036809921264648, "global_step": 13769, "epoch": 327} {"train_loss": -5.047553062438965, "global_step": 13770, "epoch": 327} {"train_loss": -5.271234512329102, "global_step": 13771, "epoch": 327} {"train_loss": -5.0246734619140625, "global_step": 13772, "epoch": 327} {"train_loss": -5.133297443389893, "global_step": 13773, "epoch": 327} {"train_loss": -5.020570755004883, "global_step": 13774, "epoch": 327} {"train_loss": -5.101321731294904, "global_step": 13775, "epoch": 327, "val_loss": 71365.3125} {"train_loss": -5.213483810424805, "global_step": 13776, "epoch": 328} {"train_loss": -5.112173080444336, "global_step": 13777, "epoch": 328} {"train_loss": -5.10700798034668, "global_step": 13778, "epoch": 328} {"train_loss": -5.057135581970215, "global_step": 13779, "epoch": 328} {"train_loss": -5.197634696960449, "global_step": 13780, "epoch": 328} {"train_loss": -5.199409484863281, "global_step": 13781, "epoch": 328} {"train_loss": -5.170053005218506, "global_step": 13782, "epoch": 328} {"train_loss": -5.092999458312988, "global_step": 13783, "epoch": 328} {"train_loss": -5.146886825561523, "global_step": 13784, "epoch": 328} {"train_loss": -5.155652046203613, "global_step": 13785, "epoch": 328} {"train_loss": -5.2158732414245605, "global_step": 13786, "epoch": 328} {"train_loss": -5.216035842895508, "global_step": 13787, "epoch": 328} {"train_loss": -5.112728595733643, "global_step": 13788, "epoch": 328} {"train_loss": -5.110698223114014, "global_step": 13789, "epoch": 328} {"train_loss": -5.14274263381958, "global_step": 13790, "epoch": 328} {"train_loss": -5.108420372009277, "global_step": 13791, "epoch": 328} {"train_loss": -5.107921600341797, "global_step": 13792, "epoch": 328} {"train_loss": -5.291459560394287, "global_step": 13793, "epoch": 328} {"train_loss": -5.20566463470459, "global_step": 13794, "epoch": 328} {"train_loss": -5.144182205200195, "global_step": 13795, "epoch": 328} {"train_loss": -5.146175861358643, "global_step": 13796, "epoch": 328} {"train_loss": -5.1954498291015625, "global_step": 13797, "epoch": 328} {"train_loss": -5.20045280456543, "global_step": 13798, "epoch": 328} {"train_loss": -5.236542701721191, "global_step": 13799, "epoch": 328} {"train_loss": -5.2267255783081055, "global_step": 13800, "epoch": 328} {"train_loss": -5.04831600189209, "global_step": 13801, "epoch": 328} {"train_loss": -5.171863555908203, "global_step": 13802, "epoch": 328} {"train_loss": -5.096371650695801, "global_step": 13803, "epoch": 328} {"train_loss": -5.010953903198242, "global_step": 13804, "epoch": 328} {"train_loss": -5.18157958984375, "global_step": 13805, "epoch": 328} {"train_loss": -5.2069196701049805, "global_step": 13806, "epoch": 328} {"train_loss": -5.226898193359375, "global_step": 13807, "epoch": 328} {"train_loss": -5.135301113128662, "global_step": 13808, "epoch": 328} {"train_loss": -5.19827938079834, "global_step": 13809, "epoch": 328} {"train_loss": -5.199167251586914, "global_step": 13810, "epoch": 328} {"train_loss": -5.142256259918213, "global_step": 13811, "epoch": 328} {"train_loss": -5.229946136474609, "global_step": 13812, "epoch": 328} {"train_loss": -5.172567367553711, "global_step": 13813, "epoch": 328} {"train_loss": -5.176631927490234, "global_step": 13814, "epoch": 328} {"train_loss": -5.156726837158203, "global_step": 13815, "epoch": 328} {"train_loss": -5.158522129058838, "global_step": 13816, "epoch": 328} {"train_loss": -5.161850282124111, "global_step": 13817, "epoch": 328, "val_loss": 70004.4140625} {"train_loss": -5.25390625, "global_step": 13818, "epoch": 329} {"train_loss": -5.195585250854492, "global_step": 13819, "epoch": 329} {"train_loss": -5.283579349517822, "global_step": 13820, "epoch": 329} {"train_loss": -5.037939071655273, "global_step": 13821, "epoch": 329} {"train_loss": -5.124525547027588, "global_step": 13822, "epoch": 329} {"train_loss": -5.078860282897949, "global_step": 13823, "epoch": 329} {"train_loss": -5.259688377380371, "global_step": 13824, "epoch": 329} {"train_loss": -5.093128204345703, "global_step": 13825, "epoch": 329} {"train_loss": -5.141054153442383, "global_step": 13826, "epoch": 329} {"train_loss": -5.24867582321167, "global_step": 13827, "epoch": 329} {"train_loss": -5.114821910858154, "global_step": 13828, "epoch": 329} {"train_loss": -5.178373336791992, "global_step": 13829, "epoch": 329} {"train_loss": -5.209221363067627, "global_step": 13830, "epoch": 329} {"train_loss": -5.182060241699219, "global_step": 13831, "epoch": 329} {"train_loss": -5.256387710571289, "global_step": 13832, "epoch": 329} {"train_loss": -5.245001792907715, "global_step": 13833, "epoch": 329} {"train_loss": -5.247615814208984, "global_step": 13834, "epoch": 329} {"train_loss": -5.253701686859131, "global_step": 13835, "epoch": 329} {"train_loss": -5.244832992553711, "global_step": 13836, "epoch": 329} {"train_loss": -5.109746932983398, "global_step": 13837, "epoch": 329} {"train_loss": -5.268310070037842, "global_step": 13838, "epoch": 329} {"train_loss": -5.024519443511963, "global_step": 13839, "epoch": 329} {"train_loss": -5.087041854858398, "global_step": 13840, "epoch": 329} {"train_loss": -5.154306888580322, "global_step": 13841, "epoch": 329} {"train_loss": -5.009761333465576, "global_step": 13842, "epoch": 329} {"train_loss": -5.150874137878418, "global_step": 13843, "epoch": 329} {"train_loss": -5.237698554992676, "global_step": 13844, "epoch": 329} {"train_loss": -5.009570121765137, "global_step": 13845, "epoch": 329} {"train_loss": -5.180129051208496, "global_step": 13846, "epoch": 329} {"train_loss": -5.35628604888916, "global_step": 13847, "epoch": 329} {"train_loss": -5.233754634857178, "global_step": 13848, "epoch": 329} {"train_loss": -5.16726016998291, "global_step": 13849, "epoch": 329} {"train_loss": -5.130037307739258, "global_step": 13850, "epoch": 329} {"train_loss": -5.267724990844727, "global_step": 13851, "epoch": 329} {"train_loss": -5.192184925079346, "global_step": 13852, "epoch": 329} {"train_loss": -5.190879821777344, "global_step": 13853, "epoch": 329} {"train_loss": -5.172541618347168, "global_step": 13854, "epoch": 329} {"train_loss": -5.012683868408203, "global_step": 13855, "epoch": 329} {"train_loss": -5.235593318939209, "global_step": 13856, "epoch": 329} {"train_loss": -5.244115352630615, "global_step": 13857, "epoch": 329} {"train_loss": -5.2690935134887695, "global_step": 13858, "epoch": 329} {"train_loss": -5.178680204209828, "global_step": 13859, "epoch": 329, "val_loss": 70327.3125} {"train_loss": -5.225760459899902, "global_step": 13860, "epoch": 330} {"train_loss": -5.121294021606445, "global_step": 13861, "epoch": 330} {"train_loss": -5.19334602355957, "global_step": 13862, "epoch": 330} {"train_loss": -5.135983943939209, "global_step": 13863, "epoch": 330} {"train_loss": -5.116552352905273, "global_step": 13864, "epoch": 330} {"train_loss": -5.072177886962891, "global_step": 13865, "epoch": 330} {"train_loss": -5.072760581970215, "global_step": 13866, "epoch": 330} {"train_loss": -5.152569770812988, "global_step": 13867, "epoch": 330} {"train_loss": -5.028858184814453, "global_step": 13868, "epoch": 330} {"train_loss": -5.037991523742676, "global_step": 13869, "epoch": 330} {"train_loss": -5.324776649475098, "global_step": 13870, "epoch": 330} {"train_loss": -5.1959147453308105, "global_step": 13871, "epoch": 330} {"train_loss": -4.928167819976807, "global_step": 13872, "epoch": 330} {"train_loss": -5.118010520935059, "global_step": 13873, "epoch": 330} {"train_loss": -5.102001667022705, "global_step": 13874, "epoch": 330} {"train_loss": -5.039811134338379, "global_step": 13875, "epoch": 330} {"train_loss": -5.309587478637695, "global_step": 13876, "epoch": 330} {"train_loss": -5.020066261291504, "global_step": 13877, "epoch": 330} {"train_loss": -5.0900068283081055, "global_step": 13878, "epoch": 330} {"train_loss": -5.207108497619629, "global_step": 13879, "epoch": 330} {"train_loss": -5.156440734863281, "global_step": 13880, "epoch": 330} {"train_loss": -5.02058219909668, "global_step": 13881, "epoch": 330} {"train_loss": -5.131340503692627, "global_step": 13882, "epoch": 330} {"train_loss": -5.166363716125488, "global_step": 13883, "epoch": 330} {"train_loss": -5.212065696716309, "global_step": 13884, "epoch": 330} {"train_loss": -5.239660739898682, "global_step": 13885, "epoch": 330} {"train_loss": -5.223509311676025, "global_step": 13886, "epoch": 330} {"train_loss": -5.218197822570801, "global_step": 13887, "epoch": 330} {"train_loss": -5.253671646118164, "global_step": 13888, "epoch": 330} {"train_loss": -5.150973320007324, "global_step": 13889, "epoch": 330} {"train_loss": -5.124969482421875, "global_step": 13890, "epoch": 330} {"train_loss": -5.0872697830200195, "global_step": 13891, "epoch": 330} {"train_loss": -5.177202224731445, "global_step": 13892, "epoch": 330} {"train_loss": -5.134716987609863, "global_step": 13893, "epoch": 330} {"train_loss": -5.160524368286133, "global_step": 13894, "epoch": 330} {"train_loss": -5.093959808349609, "global_step": 13895, "epoch": 330} {"train_loss": -5.246673107147217, "global_step": 13896, "epoch": 330} {"train_loss": -5.131677627563477, "global_step": 13897, "epoch": 330} {"train_loss": -5.212062835693359, "global_step": 13898, "epoch": 330} {"train_loss": -4.987788200378418, "global_step": 13899, "epoch": 330} {"train_loss": -4.867875576019287, "global_step": 13900, "epoch": 330} {"train_loss": -5.135632639839535, "global_step": 13901, "epoch": 330, "val_loss": 70590.4375} {"train_loss": -5.130077362060547, "global_step": 13902, "epoch": 331} {"train_loss": -5.074423313140869, "global_step": 13903, "epoch": 331} {"train_loss": -5.215060710906982, "global_step": 13904, "epoch": 331} {"train_loss": -5.22271728515625, "global_step": 13905, "epoch": 331} {"train_loss": -5.187450408935547, "global_step": 13906, "epoch": 331} {"train_loss": -5.076664447784424, "global_step": 13907, "epoch": 331} {"train_loss": -5.159831523895264, "global_step": 13908, "epoch": 331} {"train_loss": -5.0713372230529785, "global_step": 13909, "epoch": 331} {"train_loss": -5.2255682945251465, "global_step": 13910, "epoch": 331} {"train_loss": -5.174978733062744, "global_step": 13911, "epoch": 331} {"train_loss": -5.0703582763671875, "global_step": 13912, "epoch": 331} {"train_loss": -5.190876007080078, "global_step": 13913, "epoch": 331} {"train_loss": -5.271320343017578, "global_step": 13914, "epoch": 331} {"train_loss": -5.2047929763793945, "global_step": 13915, "epoch": 331} {"train_loss": -5.157768249511719, "global_step": 13916, "epoch": 331} {"train_loss": -5.211735248565674, "global_step": 13917, "epoch": 331} {"train_loss": -5.174447059631348, "global_step": 13918, "epoch": 331} {"train_loss": -5.017866134643555, "global_step": 13919, "epoch": 331} {"train_loss": -5.108303070068359, "global_step": 13920, "epoch": 331} {"train_loss": -5.195950031280518, "global_step": 13921, "epoch": 331} {"train_loss": -5.187267303466797, "global_step": 13922, "epoch": 331} {"train_loss": -5.268651962280273, "global_step": 13923, "epoch": 331} {"train_loss": -5.247396945953369, "global_step": 13924, "epoch": 331} {"train_loss": -5.106015682220459, "global_step": 13925, "epoch": 331} {"train_loss": -5.0934600830078125, "global_step": 13926, "epoch": 331} {"train_loss": -5.108851909637451, "global_step": 13927, "epoch": 331} {"train_loss": -5.1781907081604, "global_step": 13928, "epoch": 331} {"train_loss": -5.130899429321289, "global_step": 13929, "epoch": 331} {"train_loss": -5.0322065353393555, "global_step": 13930, "epoch": 331} {"train_loss": -5.2290754318237305, "global_step": 13931, "epoch": 331} {"train_loss": -5.133073806762695, "global_step": 13932, "epoch": 331} {"train_loss": -5.122769832611084, "global_step": 13933, "epoch": 331} {"train_loss": -5.303524971008301, "global_step": 13934, "epoch": 331} {"train_loss": -5.139946937561035, "global_step": 13935, "epoch": 331} {"train_loss": -5.0189971923828125, "global_step": 13936, "epoch": 331} {"train_loss": -4.99730110168457, "global_step": 13937, "epoch": 331} {"train_loss": -5.211822032928467, "global_step": 13938, "epoch": 331} {"train_loss": -5.138242721557617, "global_step": 13939, "epoch": 331} {"train_loss": -5.041430473327637, "global_step": 13940, "epoch": 331} {"train_loss": -5.20438289642334, "global_step": 13941, "epoch": 331} {"train_loss": -5.097825050354004, "global_step": 13942, "epoch": 331} {"train_loss": -5.150252603349232, "global_step": 13943, "epoch": 331, "val_loss": 70158.375} {"train_loss": -5.192776679992676, "global_step": 13944, "epoch": 332} {"train_loss": -5.180237770080566, "global_step": 13945, "epoch": 332} {"train_loss": -5.24102258682251, "global_step": 13946, "epoch": 332} {"train_loss": -5.0888214111328125, "global_step": 13947, "epoch": 332} {"train_loss": -5.182149887084961, "global_step": 13948, "epoch": 332} {"train_loss": -5.176158905029297, "global_step": 13949, "epoch": 332} {"train_loss": -5.100846290588379, "global_step": 13950, "epoch": 332} {"train_loss": -5.143226623535156, "global_step": 13951, "epoch": 332} {"train_loss": -5.277451515197754, "global_step": 13952, "epoch": 332} {"train_loss": -5.2393293380737305, "global_step": 13953, "epoch": 332} {"train_loss": -5.1845502853393555, "global_step": 13954, "epoch": 332} {"train_loss": -5.136984825134277, "global_step": 13955, "epoch": 332} {"train_loss": -4.99277400970459, "global_step": 13956, "epoch": 332} {"train_loss": -5.250705718994141, "global_step": 13957, "epoch": 332} {"train_loss": -5.246572494506836, "global_step": 13958, "epoch": 332} {"train_loss": -5.161452293395996, "global_step": 13959, "epoch": 332} {"train_loss": -5.0963239669799805, "global_step": 13960, "epoch": 332} {"train_loss": -5.192233085632324, "global_step": 13961, "epoch": 332} {"train_loss": -5.141129016876221, "global_step": 13962, "epoch": 332} {"train_loss": -5.116260051727295, "global_step": 13963, "epoch": 332} {"train_loss": -5.250053405761719, "global_step": 13964, "epoch": 332} {"train_loss": -5.045393466949463, "global_step": 13965, "epoch": 332} {"train_loss": -5.2008771896362305, "global_step": 13966, "epoch": 332} {"train_loss": -5.000469207763672, "global_step": 13967, "epoch": 332} {"train_loss": -5.191646575927734, "global_step": 13968, "epoch": 332} {"train_loss": -5.0388078689575195, "global_step": 13969, "epoch": 332} {"train_loss": -5.2068376541137695, "global_step": 13970, "epoch": 332} {"train_loss": -5.191579341888428, "global_step": 13971, "epoch": 332} {"train_loss": -5.196671962738037, "global_step": 13972, "epoch": 332} {"train_loss": -5.120743274688721, "global_step": 13973, "epoch": 332} {"train_loss": -5.212984085083008, "global_step": 13974, "epoch": 332} {"train_loss": -5.0859856605529785, "global_step": 13975, "epoch": 332} {"train_loss": -5.291348934173584, "global_step": 13976, "epoch": 332} {"train_loss": -5.0117340087890625, "global_step": 13977, "epoch": 332} {"train_loss": -5.136396408081055, "global_step": 13978, "epoch": 332} {"train_loss": -5.202114105224609, "global_step": 13979, "epoch": 332} {"train_loss": -5.167725563049316, "global_step": 13980, "epoch": 332} {"train_loss": -5.149590969085693, "global_step": 13981, "epoch": 332} {"train_loss": -5.213773727416992, "global_step": 13982, "epoch": 332} {"train_loss": -5.256252288818359, "global_step": 13983, "epoch": 332} {"train_loss": -5.15077018737793, "global_step": 13984, "epoch": 332} {"train_loss": -5.161360331944057, "global_step": 13985, "epoch": 332, "val_loss": 70210.15625} {"train_loss": -5.1148905754089355, "global_step": 13986, "epoch": 333} {"train_loss": -5.2072224617004395, "global_step": 13987, "epoch": 333} {"train_loss": -5.163331508636475, "global_step": 13988, "epoch": 333} {"train_loss": -5.188688278198242, "global_step": 13989, "epoch": 333} {"train_loss": -5.238358020782471, "global_step": 13990, "epoch": 333} {"train_loss": -5.127926826477051, "global_step": 13991, "epoch": 333} {"train_loss": -5.14018440246582, "global_step": 13992, "epoch": 333} {"train_loss": -5.121504783630371, "global_step": 13993, "epoch": 333} {"train_loss": -5.244585990905762, "global_step": 13994, "epoch": 333} {"train_loss": -5.250842094421387, "global_step": 13995, "epoch": 333} {"train_loss": -5.091228008270264, "global_step": 13996, "epoch": 333} {"train_loss": -5.224654674530029, "global_step": 13997, "epoch": 333} {"train_loss": -5.163652420043945, "global_step": 13998, "epoch": 333} {"train_loss": -5.17521858215332, "global_step": 13999, "epoch": 333} {"train_loss": -5.087986946105957, "global_step": 14000, "epoch": 333} {"train_loss": -5.195540428161621, "global_step": 14001, "epoch": 333} {"train_loss": -4.952877044677734, "global_step": 14002, "epoch": 333} {"train_loss": -5.197178840637207, "global_step": 14003, "epoch": 333} {"train_loss": -5.11100435256958, "global_step": 14004, "epoch": 333} {"train_loss": -5.070437431335449, "global_step": 14005, "epoch": 333} {"train_loss": -5.028936862945557, "global_step": 14006, "epoch": 333} {"train_loss": -5.16845703125, "global_step": 14007, "epoch": 333} {"train_loss": -5.135298252105713, "global_step": 14008, "epoch": 333} {"train_loss": -5.108036041259766, "global_step": 14009, "epoch": 333} {"train_loss": -5.062833309173584, "global_step": 14010, "epoch": 333} {"train_loss": -5.250936985015869, "global_step": 14011, "epoch": 333} {"train_loss": -5.291382312774658, "global_step": 14012, "epoch": 333} {"train_loss": -5.005120754241943, "global_step": 14013, "epoch": 333} {"train_loss": -4.992328643798828, "global_step": 14014, "epoch": 333} {"train_loss": -5.198490142822266, "global_step": 14015, "epoch": 333} {"train_loss": -5.238083362579346, "global_step": 14016, "epoch": 333} {"train_loss": -5.112815856933594, "global_step": 14017, "epoch": 333} {"train_loss": -5.058634281158447, "global_step": 14018, "epoch": 333} {"train_loss": -5.210865020751953, "global_step": 14019, "epoch": 333} {"train_loss": -5.17215633392334, "global_step": 14020, "epoch": 333} {"train_loss": -5.208086013793945, "global_step": 14021, "epoch": 333} {"train_loss": -5.021091461181641, "global_step": 14022, "epoch": 333} {"train_loss": -5.0806708335876465, "global_step": 14023, "epoch": 333} {"train_loss": -5.053379535675049, "global_step": 14024, "epoch": 333} {"train_loss": -5.170942306518555, "global_step": 14025, "epoch": 333} {"train_loss": -5.214369773864746, "global_step": 14026, "epoch": 333} {"train_loss": -5.141508295422509, "global_step": 14027, "epoch": 333, "val_loss": 70495.140625} {"train_loss": -5.1845808029174805, "global_step": 14028, "epoch": 334} {"train_loss": -5.374125003814697, "global_step": 14029, "epoch": 334} {"train_loss": -5.2235612869262695, "global_step": 14030, "epoch": 334} {"train_loss": -5.146520614624023, "global_step": 14031, "epoch": 334} {"train_loss": -5.180863380432129, "global_step": 14032, "epoch": 334} {"train_loss": -5.229068756103516, "global_step": 14033, "epoch": 334} {"train_loss": -5.05476713180542, "global_step": 14034, "epoch": 334} {"train_loss": -5.112061500549316, "global_step": 14035, "epoch": 334} {"train_loss": -5.245077133178711, "global_step": 14036, "epoch": 334} {"train_loss": -5.159264087677002, "global_step": 14037, "epoch": 334} {"train_loss": -5.31752872467041, "global_step": 14038, "epoch": 334} {"train_loss": -5.116999626159668, "global_step": 14039, "epoch": 334} {"train_loss": -5.110809326171875, "global_step": 14040, "epoch": 334} {"train_loss": -5.203680038452148, "global_step": 14041, "epoch": 334} {"train_loss": -5.253631114959717, "global_step": 14042, "epoch": 334} {"train_loss": -5.246077537536621, "global_step": 14043, "epoch": 334} {"train_loss": -5.211394309997559, "global_step": 14044, "epoch": 334} {"train_loss": -4.998266220092773, "global_step": 14045, "epoch": 334} {"train_loss": -5.095295429229736, "global_step": 14046, "epoch": 334} {"train_loss": -5.158601760864258, "global_step": 14047, "epoch": 334} {"train_loss": -5.2241034507751465, "global_step": 14048, "epoch": 334} {"train_loss": -5.207975387573242, "global_step": 14049, "epoch": 334} {"train_loss": -5.144721031188965, "global_step": 14050, "epoch": 334} {"train_loss": -5.36409330368042, "global_step": 14051, "epoch": 334} {"train_loss": -5.132116794586182, "global_step": 14052, "epoch": 334} {"train_loss": -5.162482261657715, "global_step": 14053, "epoch": 334} {"train_loss": -5.059312343597412, "global_step": 14054, "epoch": 334} {"train_loss": -5.267510414123535, "global_step": 14055, "epoch": 334} {"train_loss": -5.267117977142334, "global_step": 14056, "epoch": 334} {"train_loss": -5.208094120025635, "global_step": 14057, "epoch": 334} {"train_loss": -5.167023181915283, "global_step": 14058, "epoch": 334} {"train_loss": -5.137785911560059, "global_step": 14059, "epoch": 334} {"train_loss": -5.184117317199707, "global_step": 14060, "epoch": 334} {"train_loss": -5.071348190307617, "global_step": 14061, "epoch": 334} {"train_loss": -5.055577278137207, "global_step": 14062, "epoch": 334} {"train_loss": -5.102962970733643, "global_step": 14063, "epoch": 334} {"train_loss": -4.986822128295898, "global_step": 14064, "epoch": 334} {"train_loss": -5.06801176071167, "global_step": 14065, "epoch": 334} {"train_loss": -5.211586952209473, "global_step": 14066, "epoch": 334} {"train_loss": -5.021144390106201, "global_step": 14067, "epoch": 334} {"train_loss": -4.984291076660156, "global_step": 14068, "epoch": 334} {"train_loss": -5.163720403398786, "global_step": 14069, "epoch": 334, "val_loss": 71392.90625} {"train_loss": -5.037992477416992, "global_step": 14070, "epoch": 335} {"train_loss": -5.106600761413574, "global_step": 14071, "epoch": 335} {"train_loss": -5.151006698608398, "global_step": 14072, "epoch": 335} {"train_loss": -5.087875843048096, "global_step": 14073, "epoch": 335} {"train_loss": -5.087316513061523, "global_step": 14074, "epoch": 335} {"train_loss": -5.109044075012207, "global_step": 14075, "epoch": 335} {"train_loss": -5.256891250610352, "global_step": 14076, "epoch": 335} {"train_loss": -5.140650749206543, "global_step": 14077, "epoch": 335} {"train_loss": -5.177652359008789, "global_step": 14078, "epoch": 335} {"train_loss": -5.193926811218262, "global_step": 14079, "epoch": 335} {"train_loss": -5.1085124015808105, "global_step": 14080, "epoch": 335} {"train_loss": -5.021811485290527, "global_step": 14081, "epoch": 335} {"train_loss": -5.112719535827637, "global_step": 14082, "epoch": 335} {"train_loss": -5.1803812980651855, "global_step": 14083, "epoch": 335} {"train_loss": -5.180744647979736, "global_step": 14084, "epoch": 335} {"train_loss": -5.155424118041992, "global_step": 14085, "epoch": 335} {"train_loss": -5.225279808044434, "global_step": 14086, "epoch": 335} {"train_loss": -5.097504615783691, "global_step": 14087, "epoch": 335} {"train_loss": -5.159883499145508, "global_step": 14088, "epoch": 335} {"train_loss": -5.163670063018799, "global_step": 14089, "epoch": 335} {"train_loss": -5.224851608276367, "global_step": 14090, "epoch": 335} {"train_loss": -5.121173858642578, "global_step": 14091, "epoch": 335} {"train_loss": -5.164862632751465, "global_step": 14092, "epoch": 335} {"train_loss": -5.188624382019043, "global_step": 14093, "epoch": 335} {"train_loss": -5.077646255493164, "global_step": 14094, "epoch": 335} {"train_loss": -5.186589241027832, "global_step": 14095, "epoch": 335} {"train_loss": -5.235618591308594, "global_step": 14096, "epoch": 335} {"train_loss": -5.228095054626465, "global_step": 14097, "epoch": 335} {"train_loss": -5.260417938232422, "global_step": 14098, "epoch": 335} {"train_loss": -5.1796369552612305, "global_step": 14099, "epoch": 335} {"train_loss": -5.181271076202393, "global_step": 14100, "epoch": 335} {"train_loss": -5.199572563171387, "global_step": 14101, "epoch": 335} {"train_loss": -5.203720569610596, "global_step": 14102, "epoch": 335} {"train_loss": -5.182016372680664, "global_step": 14103, "epoch": 335} {"train_loss": -5.10721492767334, "global_step": 14104, "epoch": 335} {"train_loss": -5.184076309204102, "global_step": 14105, "epoch": 335} {"train_loss": -5.185400009155273, "global_step": 14106, "epoch": 335} {"train_loss": -5.3090620040893555, "global_step": 14107, "epoch": 335} {"train_loss": -5.03884220123291, "global_step": 14108, "epoch": 335} {"train_loss": -5.151096343994141, "global_step": 14109, "epoch": 335} {"train_loss": -5.087825775146484, "global_step": 14110, "epoch": 335} {"train_loss": -5.156538804372151, "global_step": 14111, "epoch": 335, "val_loss": 70405.109375} {"train_loss": -5.274126052856445, "global_step": 14112, "epoch": 336} {"train_loss": -5.259394645690918, "global_step": 14113, "epoch": 336} {"train_loss": -5.087607383728027, "global_step": 14114, "epoch": 336} {"train_loss": -5.234792709350586, "global_step": 14115, "epoch": 336} {"train_loss": -5.174718856811523, "global_step": 14116, "epoch": 336} {"train_loss": -5.133838653564453, "global_step": 14117, "epoch": 336} {"train_loss": -5.185930252075195, "global_step": 14118, "epoch": 336} {"train_loss": -5.251900672912598, "global_step": 14119, "epoch": 336} {"train_loss": -5.203427314758301, "global_step": 14120, "epoch": 336} {"train_loss": -5.076071739196777, "global_step": 14121, "epoch": 336} {"train_loss": -5.1404314041137695, "global_step": 14122, "epoch": 336} {"train_loss": -5.349430561065674, "global_step": 14123, "epoch": 336} {"train_loss": -5.3523149490356445, "global_step": 14124, "epoch": 336} {"train_loss": -5.212826251983643, "global_step": 14125, "epoch": 336} {"train_loss": -5.111828327178955, "global_step": 14126, "epoch": 336} {"train_loss": -5.1552734375, "global_step": 14127, "epoch": 336} {"train_loss": -4.907016754150391, "global_step": 14128, "epoch": 336} {"train_loss": -5.079967498779297, "global_step": 14129, "epoch": 336} {"train_loss": -5.11160135269165, "global_step": 14130, "epoch": 336} {"train_loss": -5.175422668457031, "global_step": 14131, "epoch": 336} {"train_loss": -5.118722915649414, "global_step": 14132, "epoch": 336} {"train_loss": -5.186012268066406, "global_step": 14133, "epoch": 336} {"train_loss": -5.166170120239258, "global_step": 14134, "epoch": 336} {"train_loss": -5.160492420196533, "global_step": 14135, "epoch": 336} {"train_loss": -5.218098163604736, "global_step": 14136, "epoch": 336} {"train_loss": -5.211814880371094, "global_step": 14137, "epoch": 336} {"train_loss": -5.192099094390869, "global_step": 14138, "epoch": 336} {"train_loss": -5.129883766174316, "global_step": 14139, "epoch": 336} {"train_loss": -5.091188907623291, "global_step": 14140, "epoch": 336} {"train_loss": -5.254385948181152, "global_step": 14141, "epoch": 336} {"train_loss": -5.126572608947754, "global_step": 14142, "epoch": 336} {"train_loss": -5.248838424682617, "global_step": 14143, "epoch": 336} {"train_loss": -5.14954948425293, "global_step": 14144, "epoch": 336} {"train_loss": -5.077090263366699, "global_step": 14145, "epoch": 336} {"train_loss": -5.2629008293151855, "global_step": 14146, "epoch": 336} {"train_loss": -5.277432918548584, "global_step": 14147, "epoch": 336} {"train_loss": -5.161388397216797, "global_step": 14148, "epoch": 336} {"train_loss": -5.163797855377197, "global_step": 14149, "epoch": 336} {"train_loss": -5.17365026473999, "global_step": 14150, "epoch": 336} {"train_loss": -5.204432487487793, "global_step": 14151, "epoch": 336} {"train_loss": -5.21273136138916, "global_step": 14152, "epoch": 336} {"train_loss": -5.180804070972261, "global_step": 14153, "epoch": 336, "val_loss": 70467.765625} {"train_loss": -5.32915735244751, "global_step": 14154, "epoch": 337} {"train_loss": -5.059500694274902, "global_step": 14155, "epoch": 337} {"train_loss": -5.163804054260254, "global_step": 14156, "epoch": 337} {"train_loss": -5.115880012512207, "global_step": 14157, "epoch": 337} {"train_loss": -5.152456283569336, "global_step": 14158, "epoch": 337} {"train_loss": -5.091046333312988, "global_step": 14159, "epoch": 337} {"train_loss": -5.038479804992676, "global_step": 14160, "epoch": 337} {"train_loss": -5.202901363372803, "global_step": 14161, "epoch": 337} {"train_loss": -5.232208251953125, "global_step": 14162, "epoch": 337} {"train_loss": -5.083118438720703, "global_step": 14163, "epoch": 337} {"train_loss": -5.114729881286621, "global_step": 14164, "epoch": 337} {"train_loss": -5.208310604095459, "global_step": 14165, "epoch": 337} {"train_loss": -5.199688911437988, "global_step": 14166, "epoch": 337} {"train_loss": -5.141860008239746, "global_step": 14167, "epoch": 337} {"train_loss": -5.224484920501709, "global_step": 14168, "epoch": 337} {"train_loss": -5.191537857055664, "global_step": 14169, "epoch": 337} {"train_loss": -5.234680652618408, "global_step": 14170, "epoch": 337} {"train_loss": -5.143146991729736, "global_step": 14171, "epoch": 337} {"train_loss": -5.105197429656982, "global_step": 14172, "epoch": 337} {"train_loss": -5.217907428741455, "global_step": 14173, "epoch": 337} {"train_loss": -5.1809515953063965, "global_step": 14174, "epoch": 337} {"train_loss": -5.282713890075684, "global_step": 14175, "epoch": 337} {"train_loss": -5.184223651885986, "global_step": 14176, "epoch": 337} {"train_loss": -5.233624458312988, "global_step": 14177, "epoch": 337} {"train_loss": -5.1316728591918945, "global_step": 14178, "epoch": 337} {"train_loss": -5.224917411804199, "global_step": 14179, "epoch": 337} {"train_loss": -5.094028472900391, "global_step": 14180, "epoch": 337} {"train_loss": -5.263671875, "global_step": 14181, "epoch": 337} {"train_loss": -5.143564701080322, "global_step": 14182, "epoch": 337} {"train_loss": -5.070620059967041, "global_step": 14183, "epoch": 337} {"train_loss": -4.96095609664917, "global_step": 14184, "epoch": 337} {"train_loss": -5.2340545654296875, "global_step": 14185, "epoch": 337} {"train_loss": -5.18734073638916, "global_step": 14186, "epoch": 337} {"train_loss": -4.97990608215332, "global_step": 14187, "epoch": 337} {"train_loss": -5.187088489532471, "global_step": 14188, "epoch": 337} {"train_loss": -5.115928649902344, "global_step": 14189, "epoch": 337} {"train_loss": -5.118734359741211, "global_step": 14190, "epoch": 337} {"train_loss": -5.077993869781494, "global_step": 14191, "epoch": 337} {"train_loss": -5.086709499359131, "global_step": 14192, "epoch": 337} {"train_loss": -5.22694206237793, "global_step": 14193, "epoch": 337} {"train_loss": -5.106270790100098, "global_step": 14194, "epoch": 337} {"train_loss": -5.154962289901007, "global_step": 14195, "epoch": 337, "val_loss": 70696.3984375} {"train_loss": -5.097194671630859, "global_step": 14196, "epoch": 338} {"train_loss": -5.156150817871094, "global_step": 14197, "epoch": 338} {"train_loss": -5.153341770172119, "global_step": 14198, "epoch": 338} {"train_loss": -5.154554843902588, "global_step": 14199, "epoch": 338} {"train_loss": -5.090648651123047, "global_step": 14200, "epoch": 338} {"train_loss": -5.168666839599609, "global_step": 14201, "epoch": 338} {"train_loss": -5.297882556915283, "global_step": 14202, "epoch": 338} {"train_loss": -4.882741451263428, "global_step": 14203, "epoch": 338} {"train_loss": -5.208318710327148, "global_step": 14204, "epoch": 338} {"train_loss": -5.129266738891602, "global_step": 14205, "epoch": 338} {"train_loss": -5.176600456237793, "global_step": 14206, "epoch": 338} {"train_loss": -5.1170477867126465, "global_step": 14207, "epoch": 338} {"train_loss": -5.232190132141113, "global_step": 14208, "epoch": 338} {"train_loss": -5.207673072814941, "global_step": 14209, "epoch": 338} {"train_loss": -5.235217094421387, "global_step": 14210, "epoch": 338} {"train_loss": -5.172900199890137, "global_step": 14211, "epoch": 338} {"train_loss": -5.181766510009766, "global_step": 14212, "epoch": 338} {"train_loss": -5.061519622802734, "global_step": 14213, "epoch": 338} {"train_loss": -5.2248854637146, "global_step": 14214, "epoch": 338} {"train_loss": -5.20792293548584, "global_step": 14215, "epoch": 338} {"train_loss": -5.138528347015381, "global_step": 14216, "epoch": 338} {"train_loss": -5.141350746154785, "global_step": 14217, "epoch": 338} {"train_loss": -5.255490303039551, "global_step": 14218, "epoch": 338} {"train_loss": -5.128863334655762, "global_step": 14219, "epoch": 338} {"train_loss": -5.112575054168701, "global_step": 14220, "epoch": 338} {"train_loss": -4.888180732727051, "global_step": 14221, "epoch": 338} {"train_loss": -5.11508321762085, "global_step": 14222, "epoch": 338} {"train_loss": -5.069405555725098, "global_step": 14223, "epoch": 338} {"train_loss": -5.051787376403809, "global_step": 14224, "epoch": 338} {"train_loss": -5.15788459777832, "global_step": 14225, "epoch": 338} {"train_loss": -4.982245445251465, "global_step": 14226, "epoch": 338} {"train_loss": -4.881567001342773, "global_step": 14227, "epoch": 338} {"train_loss": -5.164990425109863, "global_step": 14228, "epoch": 338} {"train_loss": -4.972394943237305, "global_step": 14229, "epoch": 338} {"train_loss": -5.155824184417725, "global_step": 14230, "epoch": 338} {"train_loss": -5.193559169769287, "global_step": 14231, "epoch": 338} {"train_loss": -5.029487609863281, "global_step": 14232, "epoch": 338} {"train_loss": -5.089111328125, "global_step": 14233, "epoch": 338} {"train_loss": -5.076995849609375, "global_step": 14234, "epoch": 338} {"train_loss": -5.0091705322265625, "global_step": 14235, "epoch": 338} {"train_loss": -5.11492919921875, "global_step": 14236, "epoch": 338} {"train_loss": -5.119426318577358, "global_step": 14237, "epoch": 338, "val_loss": 70396.515625} {"train_loss": -5.149806022644043, "global_step": 14238, "epoch": 339} {"train_loss": -5.071837425231934, "global_step": 14239, "epoch": 339} {"train_loss": -5.065720558166504, "global_step": 14240, "epoch": 339} {"train_loss": -5.120294094085693, "global_step": 14241, "epoch": 339} {"train_loss": -5.169848442077637, "global_step": 14242, "epoch": 339} {"train_loss": -5.03056001663208, "global_step": 14243, "epoch": 339} {"train_loss": -5.173456192016602, "global_step": 14244, "epoch": 339} {"train_loss": -5.217416763305664, "global_step": 14245, "epoch": 339} {"train_loss": -5.143779277801514, "global_step": 14246, "epoch": 339} {"train_loss": -5.018729209899902, "global_step": 14247, "epoch": 339} {"train_loss": -5.161970138549805, "global_step": 14248, "epoch": 339} {"train_loss": -5.032682418823242, "global_step": 14249, "epoch": 339} {"train_loss": -5.185229778289795, "global_step": 14250, "epoch": 339} {"train_loss": -5.147703170776367, "global_step": 14251, "epoch": 339} {"train_loss": -5.131557464599609, "global_step": 14252, "epoch": 339} {"train_loss": -5.097279071807861, "global_step": 14253, "epoch": 339} {"train_loss": -5.211735248565674, "global_step": 14254, "epoch": 339} {"train_loss": -5.215640544891357, "global_step": 14255, "epoch": 339} {"train_loss": -5.200739860534668, "global_step": 14256, "epoch": 339} {"train_loss": -5.170226573944092, "global_step": 14257, "epoch": 339} {"train_loss": -5.175293922424316, "global_step": 14258, "epoch": 339} {"train_loss": -5.223555564880371, "global_step": 14259, "epoch": 339} {"train_loss": -5.197253704071045, "global_step": 14260, "epoch": 339} {"train_loss": -5.202302932739258, "global_step": 14261, "epoch": 339} {"train_loss": -5.081465721130371, "global_step": 14262, "epoch": 339} {"train_loss": -5.247716426849365, "global_step": 14263, "epoch": 339} {"train_loss": -5.208402633666992, "global_step": 14264, "epoch": 339} {"train_loss": -5.232151031494141, "global_step": 14265, "epoch": 339} {"train_loss": -5.18646240234375, "global_step": 14266, "epoch": 339} {"train_loss": -5.033976078033447, "global_step": 14267, "epoch": 339} {"train_loss": -5.147067070007324, "global_step": 14268, "epoch": 339} {"train_loss": -5.106556415557861, "global_step": 14269, "epoch": 339} {"train_loss": -5.113617420196533, "global_step": 14270, "epoch": 339} {"train_loss": -5.234837055206299, "global_step": 14271, "epoch": 339} {"train_loss": -5.132107257843018, "global_step": 14272, "epoch": 339} {"train_loss": -5.318996906280518, "global_step": 14273, "epoch": 339} {"train_loss": -5.23527193069458, "global_step": 14274, "epoch": 339} {"train_loss": -5.116288185119629, "global_step": 14275, "epoch": 339} {"train_loss": -5.1669793128967285, "global_step": 14276, "epoch": 339} {"train_loss": -5.187501907348633, "global_step": 14277, "epoch": 339} {"train_loss": -5.111695289611816, "global_step": 14278, "epoch": 339} {"train_loss": -5.1563593319484164, "global_step": 14279, "epoch": 339, "val_loss": 70467.2109375} {"train_loss": -5.130172252655029, "global_step": 14280, "epoch": 340} {"train_loss": -5.033843040466309, "global_step": 14281, "epoch": 340} {"train_loss": -5.243119716644287, "global_step": 14282, "epoch": 340} {"train_loss": -5.164836883544922, "global_step": 14283, "epoch": 340} {"train_loss": -5.155262470245361, "global_step": 14284, "epoch": 340} {"train_loss": -5.037088394165039, "global_step": 14285, "epoch": 340} {"train_loss": -5.284862041473389, "global_step": 14286, "epoch": 340} {"train_loss": -5.114587783813477, "global_step": 14287, "epoch": 340} {"train_loss": -5.172682285308838, "global_step": 14288, "epoch": 340} {"train_loss": -5.301909923553467, "global_step": 14289, "epoch": 340} {"train_loss": -5.144191741943359, "global_step": 14290, "epoch": 340} {"train_loss": -5.083171844482422, "global_step": 14291, "epoch": 340} {"train_loss": -5.127791404724121, "global_step": 14292, "epoch": 340} {"train_loss": -5.169974327087402, "global_step": 14293, "epoch": 340} {"train_loss": -5.0812883377075195, "global_step": 14294, "epoch": 340} {"train_loss": -5.140353679656982, "global_step": 14295, "epoch": 340} {"train_loss": -5.238275527954102, "global_step": 14296, "epoch": 340} {"train_loss": -5.102297782897949, "global_step": 14297, "epoch": 340} {"train_loss": -5.132060527801514, "global_step": 14298, "epoch": 340} {"train_loss": -5.122746467590332, "global_step": 14299, "epoch": 340} {"train_loss": -5.054677963256836, "global_step": 14300, "epoch": 340} {"train_loss": -5.0517072677612305, "global_step": 14301, "epoch": 340} {"train_loss": -5.124894142150879, "global_step": 14302, "epoch": 340} {"train_loss": -5.2196431159973145, "global_step": 14303, "epoch": 340} {"train_loss": -5.160303115844727, "global_step": 14304, "epoch": 340} {"train_loss": -5.087628364562988, "global_step": 14305, "epoch": 340} {"train_loss": -5.273545265197754, "global_step": 14306, "epoch": 340} {"train_loss": -5.095089912414551, "global_step": 14307, "epoch": 340} {"train_loss": -5.144888401031494, "global_step": 14308, "epoch": 340} {"train_loss": -4.930550575256348, "global_step": 14309, "epoch": 340} {"train_loss": -5.088065147399902, "global_step": 14310, "epoch": 340} {"train_loss": -5.289798259735107, "global_step": 14311, "epoch": 340} {"train_loss": -4.93197774887085, "global_step": 14312, "epoch": 340} {"train_loss": -5.233304977416992, "global_step": 14313, "epoch": 340} {"train_loss": -5.1233110427856445, "global_step": 14314, "epoch": 340} {"train_loss": -5.033510208129883, "global_step": 14315, "epoch": 340} {"train_loss": -5.201210975646973, "global_step": 14316, "epoch": 340} {"train_loss": -5.083085060119629, "global_step": 14317, "epoch": 340} {"train_loss": -5.114617347717285, "global_step": 14318, "epoch": 340} {"train_loss": -5.16525936126709, "global_step": 14319, "epoch": 340} {"train_loss": -5.065918922424316, "global_step": 14320, "epoch": 340} {"train_loss": -5.131872074944632, "global_step": 14321, "epoch": 340, "val_loss": 71107.171875} {"train_loss": -5.097392559051514, "global_step": 14322, "epoch": 341} {"train_loss": -5.108753681182861, "global_step": 14323, "epoch": 341} {"train_loss": -5.220712661743164, "global_step": 14324, "epoch": 341} {"train_loss": -5.197028636932373, "global_step": 14325, "epoch": 341} {"train_loss": -5.199640274047852, "global_step": 14326, "epoch": 341} {"train_loss": -5.102938652038574, "global_step": 14327, "epoch": 341} {"train_loss": -5.274242401123047, "global_step": 14328, "epoch": 341} {"train_loss": -5.1954121589660645, "global_step": 14329, "epoch": 341} {"train_loss": -5.08561897277832, "global_step": 14330, "epoch": 341} {"train_loss": -5.114115238189697, "global_step": 14331, "epoch": 341} {"train_loss": -5.2229156494140625, "global_step": 14332, "epoch": 341} {"train_loss": -5.26923942565918, "global_step": 14333, "epoch": 341} {"train_loss": -5.277774810791016, "global_step": 14334, "epoch": 341} {"train_loss": -5.042057991027832, "global_step": 14335, "epoch": 341} {"train_loss": -5.1893205642700195, "global_step": 14336, "epoch": 341} {"train_loss": -5.33088493347168, "global_step": 14337, "epoch": 341} {"train_loss": -5.2090959548950195, "global_step": 14338, "epoch": 341} {"train_loss": -5.171871185302734, "global_step": 14339, "epoch": 341} {"train_loss": -4.984658241271973, "global_step": 14340, "epoch": 341} {"train_loss": -5.16135311126709, "global_step": 14341, "epoch": 341} {"train_loss": -5.233639717102051, "global_step": 14342, "epoch": 341} {"train_loss": -5.129184722900391, "global_step": 14343, "epoch": 341} {"train_loss": -5.016086578369141, "global_step": 14344, "epoch": 341} {"train_loss": -5.357382774353027, "global_step": 14345, "epoch": 341} {"train_loss": -5.049862861633301, "global_step": 14346, "epoch": 341} {"train_loss": -5.004500389099121, "global_step": 14347, "epoch": 341} {"train_loss": -5.223291873931885, "global_step": 14348, "epoch": 341} {"train_loss": -5.075298309326172, "global_step": 14349, "epoch": 341} {"train_loss": -5.100175380706787, "global_step": 14350, "epoch": 341} {"train_loss": -5.191324234008789, "global_step": 14351, "epoch": 341} {"train_loss": -5.25083065032959, "global_step": 14352, "epoch": 341} {"train_loss": -5.148263931274414, "global_step": 14353, "epoch": 341} {"train_loss": -5.054103374481201, "global_step": 14354, "epoch": 341} {"train_loss": -5.093844413757324, "global_step": 14355, "epoch": 341} {"train_loss": -4.97916316986084, "global_step": 14356, "epoch": 341} {"train_loss": -5.024609088897705, "global_step": 14357, "epoch": 341} {"train_loss": -5.0069684982299805, "global_step": 14358, "epoch": 341} {"train_loss": -5.166644096374512, "global_step": 14359, "epoch": 341} {"train_loss": -5.179177284240723, "global_step": 14360, "epoch": 341} {"train_loss": -5.128772735595703, "global_step": 14361, "epoch": 341} {"train_loss": -5.220203399658203, "global_step": 14362, "epoch": 341} {"train_loss": -5.147784482865107, "global_step": 14363, "epoch": 341, "val_loss": 70277.375} {"train_loss": -5.1071319580078125, "global_step": 14364, "epoch": 342} {"train_loss": -5.185308933258057, "global_step": 14365, "epoch": 342} {"train_loss": -5.411449432373047, "global_step": 14366, "epoch": 342} {"train_loss": -5.295943737030029, "global_step": 14367, "epoch": 342} {"train_loss": -5.161483287811279, "global_step": 14368, "epoch": 342} {"train_loss": -5.2487077713012695, "global_step": 14369, "epoch": 342} {"train_loss": -5.186521530151367, "global_step": 14370, "epoch": 342} {"train_loss": -5.164986610412598, "global_step": 14371, "epoch": 342} {"train_loss": -5.10245418548584, "global_step": 14372, "epoch": 342} {"train_loss": -5.188533306121826, "global_step": 14373, "epoch": 342} {"train_loss": -5.185429573059082, "global_step": 14374, "epoch": 342} {"train_loss": -5.316281318664551, "global_step": 14375, "epoch": 342} {"train_loss": -5.270960807800293, "global_step": 14376, "epoch": 342} {"train_loss": -5.025084972381592, "global_step": 14377, "epoch": 342} {"train_loss": -5.087569236755371, "global_step": 14378, "epoch": 342} {"train_loss": -5.244420528411865, "global_step": 14379, "epoch": 342} {"train_loss": -5.128793716430664, "global_step": 14380, "epoch": 342} {"train_loss": -5.246631622314453, "global_step": 14381, "epoch": 342} {"train_loss": -5.165044784545898, "global_step": 14382, "epoch": 342} {"train_loss": -5.213043212890625, "global_step": 14383, "epoch": 342} {"train_loss": -4.981801986694336, "global_step": 14384, "epoch": 342} {"train_loss": -5.179430961608887, "global_step": 14385, "epoch": 342} {"train_loss": -5.0963826179504395, "global_step": 14386, "epoch": 342} {"train_loss": -5.162335395812988, "global_step": 14387, "epoch": 342} {"train_loss": -5.095137596130371, "global_step": 14388, "epoch": 342} {"train_loss": -5.027575492858887, "global_step": 14389, "epoch": 342} {"train_loss": -5.192815780639648, "global_step": 14390, "epoch": 342} {"train_loss": -5.160739421844482, "global_step": 14391, "epoch": 342} {"train_loss": -5.128256320953369, "global_step": 14392, "epoch": 342} {"train_loss": -5.242543697357178, "global_step": 14393, "epoch": 342} {"train_loss": -5.148164749145508, "global_step": 14394, "epoch": 342} {"train_loss": -5.232995510101318, "global_step": 14395, "epoch": 342} {"train_loss": -5.285186767578125, "global_step": 14396, "epoch": 342} {"train_loss": -4.993226528167725, "global_step": 14397, "epoch": 342} {"train_loss": -5.132612228393555, "global_step": 14398, "epoch": 342} {"train_loss": -5.156835556030273, "global_step": 14399, "epoch": 342} {"train_loss": -5.220416069030762, "global_step": 14400, "epoch": 342} {"train_loss": -5.04149055480957, "global_step": 14401, "epoch": 342} {"train_loss": -5.105981349945068, "global_step": 14402, "epoch": 342} {"train_loss": -5.125402450561523, "global_step": 14403, "epoch": 342} {"train_loss": -5.228708744049072, "global_step": 14404, "epoch": 342} {"train_loss": -5.166010323024931, "global_step": 14405, "epoch": 342, "val_loss": 71126.546875} {"train_loss": -4.926436424255371, "global_step": 14406, "epoch": 343} {"train_loss": -5.186712265014648, "global_step": 14407, "epoch": 343} {"train_loss": -5.143596172332764, "global_step": 14408, "epoch": 343} {"train_loss": -5.246682167053223, "global_step": 14409, "epoch": 343} {"train_loss": -5.248050689697266, "global_step": 14410, "epoch": 343} {"train_loss": -5.304717540740967, "global_step": 14411, "epoch": 343} {"train_loss": -5.075608253479004, "global_step": 14412, "epoch": 343} {"train_loss": -5.1685895919799805, "global_step": 14413, "epoch": 343} {"train_loss": -5.166039943695068, "global_step": 14414, "epoch": 343} {"train_loss": -5.090892791748047, "global_step": 14415, "epoch": 343} {"train_loss": -5.140858173370361, "global_step": 14416, "epoch": 343} {"train_loss": -5.262407302856445, "global_step": 14417, "epoch": 343} {"train_loss": -5.177101135253906, "global_step": 14418, "epoch": 343} {"train_loss": -5.152638912200928, "global_step": 14419, "epoch": 343} {"train_loss": -5.188753128051758, "global_step": 14420, "epoch": 343} {"train_loss": -5.1570353507995605, "global_step": 14421, "epoch": 343} {"train_loss": -5.172752380371094, "global_step": 14422, "epoch": 343} {"train_loss": -5.136012077331543, "global_step": 14423, "epoch": 343} {"train_loss": -5.115861415863037, "global_step": 14424, "epoch": 343} {"train_loss": -5.213207721710205, "global_step": 14425, "epoch": 343} {"train_loss": -5.223810195922852, "global_step": 14426, "epoch": 343} {"train_loss": -5.214798927307129, "global_step": 14427, "epoch": 343} {"train_loss": -5.23326301574707, "global_step": 14428, "epoch": 343} {"train_loss": -5.20973539352417, "global_step": 14429, "epoch": 343} {"train_loss": -5.11005973815918, "global_step": 14430, "epoch": 343} {"train_loss": -5.1431779861450195, "global_step": 14431, "epoch": 343} {"train_loss": -5.1436052322387695, "global_step": 14432, "epoch": 343} {"train_loss": -5.152378082275391, "global_step": 14433, "epoch": 343} {"train_loss": -5.126501560211182, "global_step": 14434, "epoch": 343} {"train_loss": -5.140364170074463, "global_step": 14435, "epoch": 343} {"train_loss": -5.084745407104492, "global_step": 14436, "epoch": 343} {"train_loss": -5.162842750549316, "global_step": 14437, "epoch": 343} {"train_loss": -5.0853447914123535, "global_step": 14438, "epoch": 343} {"train_loss": -5.227293014526367, "global_step": 14439, "epoch": 343} {"train_loss": -5.2149810791015625, "global_step": 14440, "epoch": 343} {"train_loss": -5.2659454345703125, "global_step": 14441, "epoch": 343} {"train_loss": -5.072833061218262, "global_step": 14442, "epoch": 343} {"train_loss": -5.291193008422852, "global_step": 14443, "epoch": 343} {"train_loss": -5.287234306335449, "global_step": 14444, "epoch": 343} {"train_loss": -5.050099849700928, "global_step": 14445, "epoch": 343} {"train_loss": -5.18842887878418, "global_step": 14446, "epoch": 343} {"train_loss": -5.165903897512527, "global_step": 14447, "epoch": 343, "val_loss": 70959.78125} {"train_loss": -4.992031574249268, "global_step": 14448, "epoch": 344} {"train_loss": -5.231509208679199, "global_step": 14449, "epoch": 344} {"train_loss": -4.826746463775635, "global_step": 14450, "epoch": 344} {"train_loss": -4.900230407714844, "global_step": 14451, "epoch": 344} {"train_loss": -5.017190933227539, "global_step": 14452, "epoch": 344} {"train_loss": -4.923975944519043, "global_step": 14453, "epoch": 344} {"train_loss": -5.178924083709717, "global_step": 14454, "epoch": 344} {"train_loss": -4.989498138427734, "global_step": 14455, "epoch": 344} {"train_loss": -5.197442054748535, "global_step": 14456, "epoch": 344} {"train_loss": -5.132751941680908, "global_step": 14457, "epoch": 344} {"train_loss": -5.128373146057129, "global_step": 14458, "epoch": 344} {"train_loss": -5.192318439483643, "global_step": 14459, "epoch": 344} {"train_loss": -5.065675735473633, "global_step": 14460, "epoch": 344} {"train_loss": -5.113169193267822, "global_step": 14461, "epoch": 344} {"train_loss": -5.109850883483887, "global_step": 14462, "epoch": 344} {"train_loss": -5.154384613037109, "global_step": 14463, "epoch": 344} {"train_loss": -5.218235015869141, "global_step": 14464, "epoch": 344} {"train_loss": -5.11998176574707, "global_step": 14465, "epoch": 344} {"train_loss": -5.168391704559326, "global_step": 14466, "epoch": 344} {"train_loss": -5.04946231842041, "global_step": 14467, "epoch": 344} {"train_loss": -5.158376693725586, "global_step": 14468, "epoch": 344} {"train_loss": -5.0925493240356445, "global_step": 14469, "epoch": 344} {"train_loss": -5.178367614746094, "global_step": 14470, "epoch": 344} {"train_loss": -5.190812587738037, "global_step": 14471, "epoch": 344} {"train_loss": -5.107893943786621, "global_step": 14472, "epoch": 344} {"train_loss": -5.220260143280029, "global_step": 14473, "epoch": 344} {"train_loss": -5.203821182250977, "global_step": 14474, "epoch": 344} {"train_loss": -5.299490928649902, "global_step": 14475, "epoch": 344} {"train_loss": -5.097378730773926, "global_step": 14476, "epoch": 344} {"train_loss": -5.157397270202637, "global_step": 14477, "epoch": 344} {"train_loss": -5.2191667556762695, "global_step": 14478, "epoch": 344} {"train_loss": -5.163389205932617, "global_step": 14479, "epoch": 344} {"train_loss": -5.082867622375488, "global_step": 14480, "epoch": 344} {"train_loss": -5.103392601013184, "global_step": 14481, "epoch": 344} {"train_loss": -5.143006324768066, "global_step": 14482, "epoch": 344} {"train_loss": -5.24229621887207, "global_step": 14483, "epoch": 344} {"train_loss": -5.222255229949951, "global_step": 14484, "epoch": 344} {"train_loss": -5.0984086990356445, "global_step": 14485, "epoch": 344} {"train_loss": -5.259332180023193, "global_step": 14486, "epoch": 344} {"train_loss": -5.130995273590088, "global_step": 14487, "epoch": 344} {"train_loss": -5.245105743408203, "global_step": 14488, "epoch": 344} {"train_loss": -5.1321907724652975, "global_step": 14489, "epoch": 344, "val_loss": 70092.7890625} {"train_loss": -5.36037540435791, "global_step": 14490, "epoch": 345} {"train_loss": -5.113722801208496, "global_step": 14491, "epoch": 345} {"train_loss": -5.149321556091309, "global_step": 14492, "epoch": 345} {"train_loss": -5.154722213745117, "global_step": 14493, "epoch": 345} {"train_loss": -5.135489463806152, "global_step": 14494, "epoch": 345} {"train_loss": -5.2500715255737305, "global_step": 14495, "epoch": 345} {"train_loss": -5.219210147857666, "global_step": 14496, "epoch": 345} {"train_loss": -5.242563247680664, "global_step": 14497, "epoch": 345} {"train_loss": -5.127813339233398, "global_step": 14498, "epoch": 345} {"train_loss": -5.25114631652832, "global_step": 14499, "epoch": 345} {"train_loss": -5.16002082824707, "global_step": 14500, "epoch": 345} {"train_loss": -5.250508785247803, "global_step": 14501, "epoch": 345} {"train_loss": -5.160727024078369, "global_step": 14502, "epoch": 345} {"train_loss": -5.273005485534668, "global_step": 14503, "epoch": 345} {"train_loss": -5.1886887550354, "global_step": 14504, "epoch": 345} {"train_loss": -5.229469299316406, "global_step": 14505, "epoch": 345} {"train_loss": -5.075718879699707, "global_step": 14506, "epoch": 345} {"train_loss": -5.201637268066406, "global_step": 14507, "epoch": 345} {"train_loss": -5.032549858093262, "global_step": 14508, "epoch": 345} {"train_loss": -5.1611738204956055, "global_step": 14509, "epoch": 345} {"train_loss": -5.151233196258545, "global_step": 14510, "epoch": 345} {"train_loss": -5.126435279846191, "global_step": 14511, "epoch": 345} {"train_loss": -5.213994026184082, "global_step": 14512, "epoch": 345} {"train_loss": -5.289119720458984, "global_step": 14513, "epoch": 345} {"train_loss": -5.123342514038086, "global_step": 14514, "epoch": 345} {"train_loss": -5.183322429656982, "global_step": 14515, "epoch": 345} {"train_loss": -5.179604530334473, "global_step": 14516, "epoch": 345} {"train_loss": -5.158334732055664, "global_step": 14517, "epoch": 345} {"train_loss": -5.129061698913574, "global_step": 14518, "epoch": 345} {"train_loss": -5.143582344055176, "global_step": 14519, "epoch": 345} {"train_loss": -5.16957950592041, "global_step": 14520, "epoch": 345} {"train_loss": -5.040016174316406, "global_step": 14521, "epoch": 345} {"train_loss": -5.197467803955078, "global_step": 14522, "epoch": 345} {"train_loss": -5.208826065063477, "global_step": 14523, "epoch": 345} {"train_loss": -5.117339134216309, "global_step": 14524, "epoch": 345} {"train_loss": -5.20955753326416, "global_step": 14525, "epoch": 345} {"train_loss": -5.2219719886779785, "global_step": 14526, "epoch": 345} {"train_loss": -5.144124507904053, "global_step": 14527, "epoch": 345} {"train_loss": -5.141982078552246, "global_step": 14528, "epoch": 345} {"train_loss": -5.067773818969727, "global_step": 14529, "epoch": 345} {"train_loss": -5.038915634155273, "global_step": 14530, "epoch": 345} {"train_loss": -5.169189816429501, "global_step": 14531, "epoch": 345, "val_loss": 70795.0234375} {"train_loss": -5.1431684494018555, "global_step": 14532, "epoch": 346} {"train_loss": -4.95869255065918, "global_step": 14533, "epoch": 346} {"train_loss": -5.170922756195068, "global_step": 14534, "epoch": 346} {"train_loss": -5.195331573486328, "global_step": 14535, "epoch": 346} {"train_loss": -5.072531223297119, "global_step": 14536, "epoch": 346} {"train_loss": -5.167413711547852, "global_step": 14537, "epoch": 346} {"train_loss": -4.968203544616699, "global_step": 14538, "epoch": 346} {"train_loss": -5.101834297180176, "global_step": 14539, "epoch": 346} {"train_loss": -5.282439231872559, "global_step": 14540, "epoch": 346} {"train_loss": -5.068484306335449, "global_step": 14541, "epoch": 346} {"train_loss": -5.096068859100342, "global_step": 14542, "epoch": 346} {"train_loss": -5.364284515380859, "global_step": 14543, "epoch": 346} {"train_loss": -5.226667404174805, "global_step": 14544, "epoch": 346} {"train_loss": -5.267049312591553, "global_step": 14545, "epoch": 346} {"train_loss": -5.117487907409668, "global_step": 14546, "epoch": 346} {"train_loss": -5.1766157150268555, "global_step": 14547, "epoch": 346} {"train_loss": -5.115731716156006, "global_step": 14548, "epoch": 346} {"train_loss": -5.092817783355713, "global_step": 14549, "epoch": 346} {"train_loss": -5.262838363647461, "global_step": 14550, "epoch": 346} {"train_loss": -5.121647834777832, "global_step": 14551, "epoch": 346} {"train_loss": -5.188485145568848, "global_step": 14552, "epoch": 346} {"train_loss": -5.133272647857666, "global_step": 14553, "epoch": 346} {"train_loss": -4.99583625793457, "global_step": 14554, "epoch": 346} {"train_loss": -5.071245193481445, "global_step": 14555, "epoch": 346} {"train_loss": -5.135659217834473, "global_step": 14556, "epoch": 346} {"train_loss": -5.156647682189941, "global_step": 14557, "epoch": 346} {"train_loss": -5.132871627807617, "global_step": 14558, "epoch": 346} {"train_loss": -5.253464221954346, "global_step": 14559, "epoch": 346} {"train_loss": -5.260259628295898, "global_step": 14560, "epoch": 346} {"train_loss": -5.204800128936768, "global_step": 14561, "epoch": 346} {"train_loss": -5.202481269836426, "global_step": 14562, "epoch": 346} {"train_loss": -5.209155082702637, "global_step": 14563, "epoch": 346} {"train_loss": -5.232834815979004, "global_step": 14564, "epoch": 346} {"train_loss": -5.250436782836914, "global_step": 14565, "epoch": 346} {"train_loss": -5.202594757080078, "global_step": 14566, "epoch": 346} {"train_loss": -5.295724391937256, "global_step": 14567, "epoch": 346} {"train_loss": -5.2063446044921875, "global_step": 14568, "epoch": 346} {"train_loss": -5.215609073638916, "global_step": 14569, "epoch": 346} {"train_loss": -5.236810684204102, "global_step": 14570, "epoch": 346} {"train_loss": -5.1337809562683105, "global_step": 14571, "epoch": 346} {"train_loss": -5.201587677001953, "global_step": 14572, "epoch": 346} {"train_loss": -5.167915832428705, "global_step": 14573, "epoch": 346, "val_loss": 69918.3828125} {"train_loss": -5.323604583740234, "global_step": 14574, "epoch": 347} {"train_loss": -5.235595703125, "global_step": 14575, "epoch": 347} {"train_loss": -5.098318099975586, "global_step": 14576, "epoch": 347} {"train_loss": -5.355974197387695, "global_step": 14577, "epoch": 347} {"train_loss": -5.061262130737305, "global_step": 14578, "epoch": 347} {"train_loss": -5.13416862487793, "global_step": 14579, "epoch": 347} {"train_loss": -5.043623924255371, "global_step": 14580, "epoch": 347} {"train_loss": -5.233551025390625, "global_step": 14581, "epoch": 347} {"train_loss": -5.1594743728637695, "global_step": 14582, "epoch": 347} {"train_loss": -4.9055938720703125, "global_step": 14583, "epoch": 347} {"train_loss": -5.374096870422363, "global_step": 14584, "epoch": 347} {"train_loss": -5.175986289978027, "global_step": 14585, "epoch": 347} {"train_loss": -5.228433132171631, "global_step": 14586, "epoch": 347} {"train_loss": -5.173915863037109, "global_step": 14587, "epoch": 347} {"train_loss": -5.304687023162842, "global_step": 14588, "epoch": 347} {"train_loss": -5.134098529815674, "global_step": 14589, "epoch": 347} {"train_loss": -5.134006977081299, "global_step": 14590, "epoch": 347} {"train_loss": -5.280229568481445, "global_step": 14591, "epoch": 347} {"train_loss": -5.159295082092285, "global_step": 14592, "epoch": 347} {"train_loss": -5.216250419616699, "global_step": 14593, "epoch": 347} {"train_loss": -5.1162943840026855, "global_step": 14594, "epoch": 347} {"train_loss": -5.3207783699035645, "global_step": 14595, "epoch": 347} {"train_loss": -5.279187202453613, "global_step": 14596, "epoch": 347} {"train_loss": -5.258004188537598, "global_step": 14597, "epoch": 347} {"train_loss": -5.215102195739746, "global_step": 14598, "epoch": 347} {"train_loss": -5.206606388092041, "global_step": 14599, "epoch": 347} {"train_loss": -5.168243885040283, "global_step": 14600, "epoch": 347} {"train_loss": -5.323242664337158, "global_step": 14601, "epoch": 347} {"train_loss": -5.125085830688477, "global_step": 14602, "epoch": 347} {"train_loss": -5.113140106201172, "global_step": 14603, "epoch": 347} {"train_loss": -5.219066619873047, "global_step": 14604, "epoch": 347} {"train_loss": -5.067930221557617, "global_step": 14605, "epoch": 347} {"train_loss": -5.035462379455566, "global_step": 14606, "epoch": 347} {"train_loss": -5.180213451385498, "global_step": 14607, "epoch": 347} {"train_loss": -5.288527965545654, "global_step": 14608, "epoch": 347} {"train_loss": -5.13849401473999, "global_step": 14609, "epoch": 347} {"train_loss": -5.231477737426758, "global_step": 14610, "epoch": 347} {"train_loss": -5.166893005371094, "global_step": 14611, "epoch": 347} {"train_loss": -5.369012355804443, "global_step": 14612, "epoch": 347} {"train_loss": -5.30673360824585, "global_step": 14613, "epoch": 347} {"train_loss": -5.1650495529174805, "global_step": 14614, "epoch": 347} {"train_loss": -5.192606608072917, "global_step": 14615, "epoch": 347, "val_loss": 69900.1484375} {"train_loss": -5.125800609588623, "global_step": 14616, "epoch": 348} {"train_loss": -5.214349269866943, "global_step": 14617, "epoch": 348} {"train_loss": -5.110435962677002, "global_step": 14618, "epoch": 348} {"train_loss": -5.065185546875, "global_step": 14619, "epoch": 348} {"train_loss": -5.112548828125, "global_step": 14620, "epoch": 348} {"train_loss": -5.178411960601807, "global_step": 14621, "epoch": 348} {"train_loss": -5.100461483001709, "global_step": 14622, "epoch": 348} {"train_loss": -5.066178321838379, "global_step": 14623, "epoch": 348} {"train_loss": -5.10060977935791, "global_step": 14624, "epoch": 348} {"train_loss": -5.341552734375, "global_step": 14625, "epoch": 348} {"train_loss": -4.939502716064453, "global_step": 14626, "epoch": 348} {"train_loss": -4.962588310241699, "global_step": 14627, "epoch": 348} {"train_loss": -5.196817398071289, "global_step": 14628, "epoch": 348} {"train_loss": -5.124479293823242, "global_step": 14629, "epoch": 348} {"train_loss": -5.093540668487549, "global_step": 14630, "epoch": 348} {"train_loss": -5.160832405090332, "global_step": 14631, "epoch": 348} {"train_loss": -5.123884677886963, "global_step": 14632, "epoch": 348} {"train_loss": -5.196422100067139, "global_step": 14633, "epoch": 348} {"train_loss": -5.267444610595703, "global_step": 14634, "epoch": 348} {"train_loss": -5.214756488800049, "global_step": 14635, "epoch": 348} {"train_loss": -5.2140960693359375, "global_step": 14636, "epoch": 348} {"train_loss": -5.2063188552856445, "global_step": 14637, "epoch": 348} {"train_loss": -5.121352195739746, "global_step": 14638, "epoch": 348} {"train_loss": -5.2193284034729, "global_step": 14639, "epoch": 348} {"train_loss": -5.144655227661133, "global_step": 14640, "epoch": 348} {"train_loss": -5.203587532043457, "global_step": 14641, "epoch": 348} {"train_loss": -5.150442600250244, "global_step": 14642, "epoch": 348} {"train_loss": -5.062110900878906, "global_step": 14643, "epoch": 348} {"train_loss": -5.159374237060547, "global_step": 14644, "epoch": 348} {"train_loss": -5.19612979888916, "global_step": 14645, "epoch": 348} {"train_loss": -5.050243377685547, "global_step": 14646, "epoch": 348} {"train_loss": -5.173949718475342, "global_step": 14647, "epoch": 348} {"train_loss": -5.127969264984131, "global_step": 14648, "epoch": 348} {"train_loss": -5.1669464111328125, "global_step": 14649, "epoch": 348} {"train_loss": -5.089631080627441, "global_step": 14650, "epoch": 348} {"train_loss": -5.245861053466797, "global_step": 14651, "epoch": 348} {"train_loss": -5.244050025939941, "global_step": 14652, "epoch": 348} {"train_loss": -5.301584243774414, "global_step": 14653, "epoch": 348} {"train_loss": -5.081085205078125, "global_step": 14654, "epoch": 348} {"train_loss": -5.203084945678711, "global_step": 14655, "epoch": 348} {"train_loss": -5.1975226402282715, "global_step": 14656, "epoch": 348} {"train_loss": -5.153854517709641, "global_step": 14657, "epoch": 348, "val_loss": 70304.4140625} {"train_loss": -5.2261857986450195, "global_step": 14658, "epoch": 349} {"train_loss": -5.319437026977539, "global_step": 14659, "epoch": 349} {"train_loss": -5.245975494384766, "global_step": 14660, "epoch": 349} {"train_loss": -5.28715705871582, "global_step": 14661, "epoch": 349} {"train_loss": -5.202718734741211, "global_step": 14662, "epoch": 349} {"train_loss": -5.1684184074401855, "global_step": 14663, "epoch": 349} {"train_loss": -5.214982032775879, "global_step": 14664, "epoch": 349} {"train_loss": -5.171578407287598, "global_step": 14665, "epoch": 349} {"train_loss": -5.15600061416626, "global_step": 14666, "epoch": 349} {"train_loss": -5.162352561950684, "global_step": 14667, "epoch": 349} {"train_loss": -5.256890296936035, "global_step": 14668, "epoch": 349} {"train_loss": -5.151134014129639, "global_step": 14669, "epoch": 349} {"train_loss": -5.169586181640625, "global_step": 14670, "epoch": 349} {"train_loss": -5.311270713806152, "global_step": 14671, "epoch": 349} {"train_loss": -5.171987533569336, "global_step": 14672, "epoch": 349} {"train_loss": -5.197282791137695, "global_step": 14673, "epoch": 349} {"train_loss": -5.330179214477539, "global_step": 14674, "epoch": 349} {"train_loss": -5.091931343078613, "global_step": 14675, "epoch": 349} {"train_loss": -5.115764141082764, "global_step": 14676, "epoch": 349} {"train_loss": -5.156378746032715, "global_step": 14677, "epoch": 349} {"train_loss": -5.202209949493408, "global_step": 14678, "epoch": 349} {"train_loss": -5.088305473327637, "global_step": 14679, "epoch": 349} {"train_loss": -5.150893211364746, "global_step": 14680, "epoch": 349} {"train_loss": -5.195425510406494, "global_step": 14681, "epoch": 349} {"train_loss": -5.236797332763672, "global_step": 14682, "epoch": 349} {"train_loss": -5.13974666595459, "global_step": 14683, "epoch": 349} {"train_loss": -5.257779598236084, "global_step": 14684, "epoch": 349} {"train_loss": -5.156766414642334, "global_step": 14685, "epoch": 349} {"train_loss": -5.167210102081299, "global_step": 14686, "epoch": 349} {"train_loss": -5.237699031829834, "global_step": 14687, "epoch": 349} {"train_loss": -5.299168586730957, "global_step": 14688, "epoch": 349} {"train_loss": -5.180556774139404, "global_step": 14689, "epoch": 349} {"train_loss": -5.181317329406738, "global_step": 14690, "epoch": 349} {"train_loss": -5.267446517944336, "global_step": 14691, "epoch": 349} {"train_loss": -5.095311641693115, "global_step": 14692, "epoch": 349} {"train_loss": -5.113138198852539, "global_step": 14693, "epoch": 349} {"train_loss": -5.176314353942871, "global_step": 14694, "epoch": 349} {"train_loss": -5.320807933807373, "global_step": 14695, "epoch": 349} {"train_loss": -5.173287391662598, "global_step": 14696, "epoch": 349} {"train_loss": -5.061997413635254, "global_step": 14697, "epoch": 349} {"train_loss": -5.173612117767334, "global_step": 14698, "epoch": 349} {"train_loss": -5.195761930374872, "global_step": 14699, "epoch": 349, "val_loss": 70087.2109375} {"train_loss": -5.268597602844238, "global_step": 14700, "epoch": 350} {"train_loss": -5.112157821655273, "global_step": 14701, "epoch": 350} {"train_loss": -5.112544536590576, "global_step": 14702, "epoch": 350} {"train_loss": -5.16657829284668, "global_step": 14703, "epoch": 350} {"train_loss": -5.21317195892334, "global_step": 14704, "epoch": 350} {"train_loss": -5.121957778930664, "global_step": 14705, "epoch": 350} {"train_loss": -5.170941352844238, "global_step": 14706, "epoch": 350} {"train_loss": -5.125759601593018, "global_step": 14707, "epoch": 350} {"train_loss": -5.073559761047363, "global_step": 14708, "epoch": 350} {"train_loss": -5.080096244812012, "global_step": 14709, "epoch": 350} {"train_loss": -5.246345520019531, "global_step": 14710, "epoch": 350} {"train_loss": -5.1165385246276855, "global_step": 14711, "epoch": 350} {"train_loss": -5.116622447967529, "global_step": 14712, "epoch": 350} {"train_loss": -5.183078765869141, "global_step": 14713, "epoch": 350} {"train_loss": -5.138839244842529, "global_step": 14714, "epoch": 350} {"train_loss": -5.135379314422607, "global_step": 14715, "epoch": 350} {"train_loss": -5.156159400939941, "global_step": 14716, "epoch": 350} {"train_loss": -5.075563430786133, "global_step": 14717, "epoch": 350} {"train_loss": -5.06679630279541, "global_step": 14718, "epoch": 350} {"train_loss": -5.17116117477417, "global_step": 14719, "epoch": 350} {"train_loss": -5.235498428344727, "global_step": 14720, "epoch": 350} {"train_loss": -5.265355110168457, "global_step": 14721, "epoch": 350} {"train_loss": -5.136770725250244, "global_step": 14722, "epoch": 350} {"train_loss": -5.172287464141846, "global_step": 14723, "epoch": 350} {"train_loss": -5.219538688659668, "global_step": 14724, "epoch": 350} {"train_loss": -5.183561325073242, "global_step": 14725, "epoch": 350} {"train_loss": -5.219748497009277, "global_step": 14726, "epoch": 350} {"train_loss": -5.2784342765808105, "global_step": 14727, "epoch": 350} {"train_loss": -5.135367393493652, "global_step": 14728, "epoch": 350} {"train_loss": -5.21144962310791, "global_step": 14729, "epoch": 350} {"train_loss": -5.237617492675781, "global_step": 14730, "epoch": 350} {"train_loss": -5.179262161254883, "global_step": 14731, "epoch": 350} {"train_loss": -5.235023498535156, "global_step": 14732, "epoch": 350} {"train_loss": -5.1836748123168945, "global_step": 14733, "epoch": 350} {"train_loss": -5.168074607849121, "global_step": 14734, "epoch": 350} {"train_loss": -5.34336519241333, "global_step": 14735, "epoch": 350} {"train_loss": -5.082921981811523, "global_step": 14736, "epoch": 350} {"train_loss": -5.323366165161133, "global_step": 14737, "epoch": 350} {"train_loss": -5.236475944519043, "global_step": 14738, "epoch": 350} {"train_loss": -5.067614555358887, "global_step": 14739, "epoch": 350} {"train_loss": -5.250619888305664, "global_step": 14740, "epoch": 350} {"train_loss": -5.17389532497951, "global_step": 14741, "epoch": 350, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.16107820167804537, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.16551695291283075, "train/sim_max_reward_4": 0.3218573070933244, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0707613752114159, "test/sim_max_reward_4300001": 0.0, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.6784170041041857, "test/sim_max_reward_4300004": 0.8274270788242308, "test/sim_max_reward_4300005": 0.40233073027212973, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.630234158558647, "test/sim_max_reward_4300008": 0.4905082568934818, "test/sim_max_reward_4300009": 0.7652713283195672, "test/sim_max_reward_4300010": 0.06545712635023546, "test/sim_max_reward_4300011": 0.6931139418032062, "test/sim_max_reward_4300012": 0.3869132816175258, "test/sim_max_reward_4300013": 0.5045476967777758, "test/sim_max_reward_4300014": 0.4111581021329718, "test/sim_max_reward_4300015": 0.262943226921178, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.4297643195245451, "test/sim_max_reward_4300018": 0.4847906021099302, "test/sim_max_reward_4300019": 0.18529716336539434, "test/sim_max_reward_4300020": 0.01775428007182679, "test/sim_max_reward_4300021": 0.45262441445867374, "test/sim_max_reward_4300022": 3.7006314069507585e-06, "test/sim_max_reward_4300023": 0.3973420978017782, "test/sim_max_reward_4300024": 0.3707748098322852, "test/sim_max_reward_4300025": 0.4407318662614461, "test/sim_max_reward_4300026": 0.501474560178411, "test/sim_max_reward_4300027": 0.09589028854496824, "test/sim_max_reward_4300028": 0.007370499467179962, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.6338990638540211, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.7018638621229896, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.330205544848247, "test/sim_max_reward_4300037": 0.6804975428867411, "test/sim_max_reward_4300038": 0.9787845692616102, "test/sim_max_reward_4300039": 0.8505411920072168, "test/sim_max_reward_4300040": 0.001228810832348408, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.9420240096352743, "test/sim_max_reward_4300043": 0.6743765410469515, "test/sim_max_reward_4300044": 0.6942354009408891, "test/sim_max_reward_4300045": 0.12125946200790035, "test/sim_max_reward_4300046": 0.0, "test/sim_max_reward_4300047": 0.49362826645833, "test/sim_max_reward_4300048": 0.6740717743530844, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.17195578627540667, "test/mean_score": 0.3541627326186178, "val_loss": 69827.578125} {"train_loss": -5.193556785583496, "global_step": 14742, "epoch": 351} {"train_loss": -5.1920576095581055, "global_step": 14743, "epoch": 351} {"train_loss": -5.157349109649658, "global_step": 14744, "epoch": 351} {"train_loss": -5.210833549499512, "global_step": 14745, "epoch": 351} {"train_loss": -5.258399486541748, "global_step": 14746, "epoch": 351} {"train_loss": -5.220552444458008, "global_step": 14747, "epoch": 351} {"train_loss": -5.196995735168457, "global_step": 14748, "epoch": 351} {"train_loss": -5.167224884033203, "global_step": 14749, "epoch": 351} {"train_loss": -5.021195411682129, "global_step": 14750, "epoch": 351} {"train_loss": -5.199744701385498, "global_step": 14751, "epoch": 351} {"train_loss": -5.247618675231934, "global_step": 14752, "epoch": 351} {"train_loss": -5.1491804122924805, "global_step": 14753, "epoch": 351} {"train_loss": -5.084168910980225, "global_step": 14754, "epoch": 351} {"train_loss": -5.264737129211426, "global_step": 14755, "epoch": 351} {"train_loss": -5.209722518920898, "global_step": 14756, "epoch": 351} {"train_loss": -5.1634063720703125, "global_step": 14757, "epoch": 351} {"train_loss": -5.149509429931641, "global_step": 14758, "epoch": 351} {"train_loss": -5.246468544006348, "global_step": 14759, "epoch": 351} {"train_loss": -5.245529651641846, "global_step": 14760, "epoch": 351} {"train_loss": -5.292628765106201, "global_step": 14761, "epoch": 351} {"train_loss": -4.989788055419922, "global_step": 14762, "epoch": 351} {"train_loss": -5.086555480957031, "global_step": 14763, "epoch": 351} {"train_loss": -5.243955612182617, "global_step": 14764, "epoch": 351} {"train_loss": -5.202436923980713, "global_step": 14765, "epoch": 351} {"train_loss": -5.205532550811768, "global_step": 14766, "epoch": 351} {"train_loss": -5.146868705749512, "global_step": 14767, "epoch": 351} {"train_loss": -5.2704973220825195, "global_step": 14768, "epoch": 351} {"train_loss": -5.179469108581543, "global_step": 14769, "epoch": 351} {"train_loss": -5.199296951293945, "global_step": 14770, "epoch": 351} {"train_loss": -5.210603713989258, "global_step": 14771, "epoch": 351} {"train_loss": -5.266151428222656, "global_step": 14772, "epoch": 351} {"train_loss": -5.218585014343262, "global_step": 14773, "epoch": 351} {"train_loss": -5.109709739685059, "global_step": 14774, "epoch": 351} {"train_loss": -5.081040382385254, "global_step": 14775, "epoch": 351} {"train_loss": -5.250316619873047, "global_step": 14776, "epoch": 351} {"train_loss": -5.241635322570801, "global_step": 14777, "epoch": 351} {"train_loss": -5.013829231262207, "global_step": 14778, "epoch": 351} {"train_loss": -4.991363525390625, "global_step": 14779, "epoch": 351} {"train_loss": -5.264375686645508, "global_step": 14780, "epoch": 351} {"train_loss": -5.180366039276123, "global_step": 14781, "epoch": 351} {"train_loss": -5.219881057739258, "global_step": 14782, "epoch": 351} {"train_loss": -5.180153245017642, "global_step": 14783, "epoch": 351, "val_loss": 70020.828125} {"train_loss": -5.105992317199707, "global_step": 14784, "epoch": 352} {"train_loss": -5.228940963745117, "global_step": 14785, "epoch": 352} {"train_loss": -5.270656108856201, "global_step": 14786, "epoch": 352} {"train_loss": -5.201224327087402, "global_step": 14787, "epoch": 352} {"train_loss": -5.215167999267578, "global_step": 14788, "epoch": 352} {"train_loss": -5.18560791015625, "global_step": 14789, "epoch": 352} {"train_loss": -5.2132649421691895, "global_step": 14790, "epoch": 352} {"train_loss": -5.1792097091674805, "global_step": 14791, "epoch": 352} {"train_loss": -5.217036724090576, "global_step": 14792, "epoch": 352} {"train_loss": -5.203625679016113, "global_step": 14793, "epoch": 352} {"train_loss": -5.108072757720947, "global_step": 14794, "epoch": 352} {"train_loss": -5.223578453063965, "global_step": 14795, "epoch": 352} {"train_loss": -5.174664497375488, "global_step": 14796, "epoch": 352} {"train_loss": -5.198681354522705, "global_step": 14797, "epoch": 352} {"train_loss": -5.134010314941406, "global_step": 14798, "epoch": 352} {"train_loss": -5.273272514343262, "global_step": 14799, "epoch": 352} {"train_loss": -5.094160079956055, "global_step": 14800, "epoch": 352} {"train_loss": -5.141834259033203, "global_step": 14801, "epoch": 352} {"train_loss": -5.1726813316345215, "global_step": 14802, "epoch": 352} {"train_loss": -5.100508689880371, "global_step": 14803, "epoch": 352} {"train_loss": -5.27001428604126, "global_step": 14804, "epoch": 352} {"train_loss": -5.244202613830566, "global_step": 14805, "epoch": 352} {"train_loss": -5.1335768699646, "global_step": 14806, "epoch": 352} {"train_loss": -5.294475555419922, "global_step": 14807, "epoch": 352} {"train_loss": -5.24622106552124, "global_step": 14808, "epoch": 352} {"train_loss": -5.083309173583984, "global_step": 14809, "epoch": 352} {"train_loss": -5.246025085449219, "global_step": 14810, "epoch": 352} {"train_loss": -5.1934123039245605, "global_step": 14811, "epoch": 352} {"train_loss": -5.104990482330322, "global_step": 14812, "epoch": 352} {"train_loss": -5.196002006530762, "global_step": 14813, "epoch": 352} {"train_loss": -5.102518081665039, "global_step": 14814, "epoch": 352} {"train_loss": -5.089202404022217, "global_step": 14815, "epoch": 352} {"train_loss": -5.325326919555664, "global_step": 14816, "epoch": 352} {"train_loss": -5.263865947723389, "global_step": 14817, "epoch": 352} {"train_loss": -5.08351993560791, "global_step": 14818, "epoch": 352} {"train_loss": -5.233950138092041, "global_step": 14819, "epoch": 352} {"train_loss": -5.086569786071777, "global_step": 14820, "epoch": 352} {"train_loss": -5.3276166915893555, "global_step": 14821, "epoch": 352} {"train_loss": -5.285182952880859, "global_step": 14822, "epoch": 352} {"train_loss": -5.200092792510986, "global_step": 14823, "epoch": 352} {"train_loss": -5.302741527557373, "global_step": 14824, "epoch": 352} {"train_loss": -5.194919767833891, "global_step": 14825, "epoch": 352, "val_loss": 69773.9609375} {"train_loss": -5.22705078125, "global_step": 14826, "epoch": 353} {"train_loss": -5.195669651031494, "global_step": 14827, "epoch": 353} {"train_loss": -5.1488037109375, "global_step": 14828, "epoch": 353} {"train_loss": -5.075540065765381, "global_step": 14829, "epoch": 353} {"train_loss": -5.306883811950684, "global_step": 14830, "epoch": 353} {"train_loss": -5.256223201751709, "global_step": 14831, "epoch": 353} {"train_loss": -5.114089012145996, "global_step": 14832, "epoch": 353} {"train_loss": -5.256425857543945, "global_step": 14833, "epoch": 353} {"train_loss": -5.2039031982421875, "global_step": 14834, "epoch": 353} {"train_loss": -5.146974563598633, "global_step": 14835, "epoch": 353} {"train_loss": -5.236907958984375, "global_step": 14836, "epoch": 353} {"train_loss": -5.299095153808594, "global_step": 14837, "epoch": 353} {"train_loss": -5.231668472290039, "global_step": 14838, "epoch": 353} {"train_loss": -5.060976028442383, "global_step": 14839, "epoch": 353} {"train_loss": -5.307782173156738, "global_step": 14840, "epoch": 353} {"train_loss": -5.307765007019043, "global_step": 14841, "epoch": 353} {"train_loss": -5.139628887176514, "global_step": 14842, "epoch": 353} {"train_loss": -5.147723197937012, "global_step": 14843, "epoch": 353} {"train_loss": -5.216483116149902, "global_step": 14844, "epoch": 353} {"train_loss": -4.8891801834106445, "global_step": 14845, "epoch": 353} {"train_loss": -5.050699234008789, "global_step": 14846, "epoch": 353} {"train_loss": -5.170880317687988, "global_step": 14847, "epoch": 353} {"train_loss": -5.091094970703125, "global_step": 14848, "epoch": 353} {"train_loss": -5.066021919250488, "global_step": 14849, "epoch": 353} {"train_loss": -5.216585159301758, "global_step": 14850, "epoch": 353} {"train_loss": -5.106107711791992, "global_step": 14851, "epoch": 353} {"train_loss": -5.15931510925293, "global_step": 14852, "epoch": 353} {"train_loss": -5.2536725997924805, "global_step": 14853, "epoch": 353} {"train_loss": -5.220580577850342, "global_step": 14854, "epoch": 353} {"train_loss": -5.264305591583252, "global_step": 14855, "epoch": 353} {"train_loss": -5.212118148803711, "global_step": 14856, "epoch": 353} {"train_loss": -5.358123779296875, "global_step": 14857, "epoch": 353} {"train_loss": -5.049691200256348, "global_step": 14858, "epoch": 353} {"train_loss": -5.251445770263672, "global_step": 14859, "epoch": 353} {"train_loss": -5.151742935180664, "global_step": 14860, "epoch": 353} {"train_loss": -5.29416036605835, "global_step": 14861, "epoch": 353} {"train_loss": -5.221902847290039, "global_step": 14862, "epoch": 353} {"train_loss": -5.2576751708984375, "global_step": 14863, "epoch": 353} {"train_loss": -5.221521377563477, "global_step": 14864, "epoch": 353} {"train_loss": -5.103116989135742, "global_step": 14865, "epoch": 353} {"train_loss": -5.225715637207031, "global_step": 14866, "epoch": 353} {"train_loss": -5.1861537638164705, "global_step": 14867, "epoch": 353, "val_loss": 69786.9375} {"train_loss": -5.2558183670043945, "global_step": 14868, "epoch": 354} {"train_loss": -5.152463436126709, "global_step": 14869, "epoch": 354} {"train_loss": -5.368771076202393, "global_step": 14870, "epoch": 354} {"train_loss": -5.166413307189941, "global_step": 14871, "epoch": 354} {"train_loss": -5.156975269317627, "global_step": 14872, "epoch": 354} {"train_loss": -5.259564399719238, "global_step": 14873, "epoch": 354} {"train_loss": -5.2169036865234375, "global_step": 14874, "epoch": 354} {"train_loss": -5.023645401000977, "global_step": 14875, "epoch": 354} {"train_loss": -5.261313438415527, "global_step": 14876, "epoch": 354} {"train_loss": -5.117055892944336, "global_step": 14877, "epoch": 354} {"train_loss": -5.098049163818359, "global_step": 14878, "epoch": 354} {"train_loss": -5.217523574829102, "global_step": 14879, "epoch": 354} {"train_loss": -5.22176456451416, "global_step": 14880, "epoch": 354} {"train_loss": -5.133685111999512, "global_step": 14881, "epoch": 354} {"train_loss": -5.123729228973389, "global_step": 14882, "epoch": 354} {"train_loss": -5.163504600524902, "global_step": 14883, "epoch": 354} {"train_loss": -5.229952812194824, "global_step": 14884, "epoch": 354} {"train_loss": -5.029879570007324, "global_step": 14885, "epoch": 354} {"train_loss": -5.2319231033325195, "global_step": 14886, "epoch": 354} {"train_loss": -5.326227188110352, "global_step": 14887, "epoch": 354} {"train_loss": -5.117020606994629, "global_step": 14888, "epoch": 354} {"train_loss": -5.116067409515381, "global_step": 14889, "epoch": 354} {"train_loss": -5.220978260040283, "global_step": 14890, "epoch": 354} {"train_loss": -5.2965545654296875, "global_step": 14891, "epoch": 354} {"train_loss": -5.1690802574157715, "global_step": 14892, "epoch": 354} {"train_loss": -5.159706115722656, "global_step": 14893, "epoch": 354} {"train_loss": -5.296899795532227, "global_step": 14894, "epoch": 354} {"train_loss": -5.288610935211182, "global_step": 14895, "epoch": 354} {"train_loss": -5.131134510040283, "global_step": 14896, "epoch": 354} {"train_loss": -5.223386764526367, "global_step": 14897, "epoch": 354} {"train_loss": -5.238424777984619, "global_step": 14898, "epoch": 354} {"train_loss": -5.153707504272461, "global_step": 14899, "epoch": 354} {"train_loss": -5.005215644836426, "global_step": 14900, "epoch": 354} {"train_loss": -5.268060207366943, "global_step": 14901, "epoch": 354} {"train_loss": -5.063641548156738, "global_step": 14902, "epoch": 354} {"train_loss": -5.07029390335083, "global_step": 14903, "epoch": 354} {"train_loss": -5.196966171264648, "global_step": 14904, "epoch": 354} {"train_loss": -5.152295112609863, "global_step": 14905, "epoch": 354} {"train_loss": -5.135895729064941, "global_step": 14906, "epoch": 354} {"train_loss": -5.277949333190918, "global_step": 14907, "epoch": 354} {"train_loss": -5.218416213989258, "global_step": 14908, "epoch": 354} {"train_loss": -5.185560317266555, "global_step": 14909, "epoch": 354, "val_loss": 70052.7109375} {"train_loss": -5.122566223144531, "global_step": 14910, "epoch": 355} {"train_loss": -5.16331672668457, "global_step": 14911, "epoch": 355} {"train_loss": -5.273136138916016, "global_step": 14912, "epoch": 355} {"train_loss": -5.110306262969971, "global_step": 14913, "epoch": 355} {"train_loss": -5.234920501708984, "global_step": 14914, "epoch": 355} {"train_loss": -5.113956451416016, "global_step": 14915, "epoch": 355} {"train_loss": -5.110085487365723, "global_step": 14916, "epoch": 355} {"train_loss": -5.04569149017334, "global_step": 14917, "epoch": 355} {"train_loss": -5.165854454040527, "global_step": 14918, "epoch": 355} {"train_loss": -5.177371501922607, "global_step": 14919, "epoch": 355} {"train_loss": -5.161623001098633, "global_step": 14920, "epoch": 355} {"train_loss": -5.153786659240723, "global_step": 14921, "epoch": 355} {"train_loss": -5.149211883544922, "global_step": 14922, "epoch": 355} {"train_loss": -5.334697723388672, "global_step": 14923, "epoch": 355} {"train_loss": -5.132244110107422, "global_step": 14924, "epoch": 355} {"train_loss": -5.337760925292969, "global_step": 14925, "epoch": 355} {"train_loss": -5.219928741455078, "global_step": 14926, "epoch": 355} {"train_loss": -5.142439365386963, "global_step": 14927, "epoch": 355} {"train_loss": -5.135577201843262, "global_step": 14928, "epoch": 355} {"train_loss": -5.171998977661133, "global_step": 14929, "epoch": 355} {"train_loss": -5.14564323425293, "global_step": 14930, "epoch": 355} {"train_loss": -5.248769760131836, "global_step": 14931, "epoch": 355} {"train_loss": -5.089390277862549, "global_step": 14932, "epoch": 355} {"train_loss": -5.006635665893555, "global_step": 14933, "epoch": 355} {"train_loss": -5.131420135498047, "global_step": 14934, "epoch": 355} {"train_loss": -5.245762825012207, "global_step": 14935, "epoch": 355} {"train_loss": -5.074476718902588, "global_step": 14936, "epoch": 355} {"train_loss": -5.072734832763672, "global_step": 14937, "epoch": 355} {"train_loss": -5.327500343322754, "global_step": 14938, "epoch": 355} {"train_loss": -5.175868988037109, "global_step": 14939, "epoch": 355} {"train_loss": -5.178869247436523, "global_step": 14940, "epoch": 355} {"train_loss": -5.097040176391602, "global_step": 14941, "epoch": 355} {"train_loss": -5.09978723526001, "global_step": 14942, "epoch": 355} {"train_loss": -5.233748912811279, "global_step": 14943, "epoch": 355} {"train_loss": -5.139892578125, "global_step": 14944, "epoch": 355} {"train_loss": -5.160935401916504, "global_step": 14945, "epoch": 355} {"train_loss": -5.000462055206299, "global_step": 14946, "epoch": 355} {"train_loss": -5.305044651031494, "global_step": 14947, "epoch": 355} {"train_loss": -5.1220574378967285, "global_step": 14948, "epoch": 355} {"train_loss": -5.173488616943359, "global_step": 14949, "epoch": 355} {"train_loss": -5.193402290344238, "global_step": 14950, "epoch": 355} {"train_loss": -5.1662711302439375, "global_step": 14951, "epoch": 355, "val_loss": 70350.8828125} {"train_loss": -5.200467109680176, "global_step": 14952, "epoch": 356} {"train_loss": -5.163898468017578, "global_step": 14953, "epoch": 356} {"train_loss": -5.181312561035156, "global_step": 14954, "epoch": 356} {"train_loss": -5.140427589416504, "global_step": 14955, "epoch": 356} {"train_loss": -5.112332820892334, "global_step": 14956, "epoch": 356} {"train_loss": -5.287908554077148, "global_step": 14957, "epoch": 356} {"train_loss": -5.336113929748535, "global_step": 14958, "epoch": 356} {"train_loss": -5.244803428649902, "global_step": 14959, "epoch": 356} {"train_loss": -5.171913146972656, "global_step": 14960, "epoch": 356} {"train_loss": -5.250736236572266, "global_step": 14961, "epoch": 356} {"train_loss": -5.211604118347168, "global_step": 14962, "epoch": 356} {"train_loss": -5.179758548736572, "global_step": 14963, "epoch": 356} {"train_loss": -5.067368984222412, "global_step": 14964, "epoch": 356} {"train_loss": -5.173249244689941, "global_step": 14965, "epoch": 356} {"train_loss": -5.170289993286133, "global_step": 14966, "epoch": 356} {"train_loss": -4.9960618019104, "global_step": 14967, "epoch": 356} {"train_loss": -5.2452921867370605, "global_step": 14968, "epoch": 356} {"train_loss": -5.188070297241211, "global_step": 14969, "epoch": 356} {"train_loss": -5.245685577392578, "global_step": 14970, "epoch": 356} {"train_loss": -5.22594690322876, "global_step": 14971, "epoch": 356} {"train_loss": -5.175304889678955, "global_step": 14972, "epoch": 356} {"train_loss": -5.189939975738525, "global_step": 14973, "epoch": 356} {"train_loss": -5.221963882446289, "global_step": 14974, "epoch": 356} {"train_loss": -5.092890739440918, "global_step": 14975, "epoch": 356} {"train_loss": -5.171974182128906, "global_step": 14976, "epoch": 356} {"train_loss": -5.0936479568481445, "global_step": 14977, "epoch": 356} {"train_loss": -5.112377166748047, "global_step": 14978, "epoch": 356} {"train_loss": -5.1718668937683105, "global_step": 14979, "epoch": 356} {"train_loss": -5.139455795288086, "global_step": 14980, "epoch": 356} {"train_loss": -5.269844055175781, "global_step": 14981, "epoch": 356} {"train_loss": -5.155815124511719, "global_step": 14982, "epoch": 356} {"train_loss": -5.14335823059082, "global_step": 14983, "epoch": 356} {"train_loss": -5.197271823883057, "global_step": 14984, "epoch": 356} {"train_loss": -5.041909694671631, "global_step": 14985, "epoch": 356} {"train_loss": -5.157938003540039, "global_step": 14986, "epoch": 356} {"train_loss": -5.249755859375, "global_step": 14987, "epoch": 356} {"train_loss": -5.069119930267334, "global_step": 14988, "epoch": 356} {"train_loss": -5.129612445831299, "global_step": 14989, "epoch": 356} {"train_loss": -5.244343280792236, "global_step": 14990, "epoch": 356} {"train_loss": -5.201225280761719, "global_step": 14991, "epoch": 356} {"train_loss": -5.210509300231934, "global_step": 14992, "epoch": 356} {"train_loss": -5.179635240918114, "global_step": 14993, "epoch": 356, "val_loss": 69541.9921875} {"train_loss": -5.100635051727295, "global_step": 14994, "epoch": 357} {"train_loss": -5.188877105712891, "global_step": 14995, "epoch": 357} {"train_loss": -5.111846923828125, "global_step": 14996, "epoch": 357} {"train_loss": -5.175278663635254, "global_step": 14997, "epoch": 357} {"train_loss": -5.2316508293151855, "global_step": 14998, "epoch": 357} {"train_loss": -5.262115478515625, "global_step": 14999, "epoch": 357} {"train_loss": -5.251752853393555, "global_step": 15000, "epoch": 357} {"train_loss": -5.365339279174805, "global_step": 15001, "epoch": 357} {"train_loss": -5.1942949295043945, "global_step": 15002, "epoch": 357} {"train_loss": -5.066960334777832, "global_step": 15003, "epoch": 357} {"train_loss": -5.1902546882629395, "global_step": 15004, "epoch": 357} {"train_loss": -5.252774238586426, "global_step": 15005, "epoch": 357} {"train_loss": -5.282144546508789, "global_step": 15006, "epoch": 357} {"train_loss": -5.223306655883789, "global_step": 15007, "epoch": 357} {"train_loss": -5.289316177368164, "global_step": 15008, "epoch": 357} {"train_loss": -5.162113189697266, "global_step": 15009, "epoch": 357} {"train_loss": -5.2335052490234375, "global_step": 15010, "epoch": 357} {"train_loss": -5.222984313964844, "global_step": 15011, "epoch": 357} {"train_loss": -5.323119163513184, "global_step": 15012, "epoch": 357} {"train_loss": -5.215324401855469, "global_step": 15013, "epoch": 357} {"train_loss": -5.056680679321289, "global_step": 15014, "epoch": 357} {"train_loss": -5.181887626647949, "global_step": 15015, "epoch": 357} {"train_loss": -5.174518585205078, "global_step": 15016, "epoch": 357} {"train_loss": -5.292306900024414, "global_step": 15017, "epoch": 357} {"train_loss": -5.265263557434082, "global_step": 15018, "epoch": 357} {"train_loss": -5.3654279708862305, "global_step": 15019, "epoch": 357} {"train_loss": -5.21835470199585, "global_step": 15020, "epoch": 357} {"train_loss": -5.170005798339844, "global_step": 15021, "epoch": 357} {"train_loss": -5.253110885620117, "global_step": 15022, "epoch": 357} {"train_loss": -5.117400646209717, "global_step": 15023, "epoch": 357} {"train_loss": -5.135053634643555, "global_step": 15024, "epoch": 357} {"train_loss": -5.178647994995117, "global_step": 15025, "epoch": 357} {"train_loss": -5.250194549560547, "global_step": 15026, "epoch": 357} {"train_loss": -5.175188064575195, "global_step": 15027, "epoch": 357} {"train_loss": -5.287151336669922, "global_step": 15028, "epoch": 357} {"train_loss": -5.13187313079834, "global_step": 15029, "epoch": 357} {"train_loss": -5.2491655349731445, "global_step": 15030, "epoch": 357} {"train_loss": -5.163602352142334, "global_step": 15031, "epoch": 357} {"train_loss": -5.289464950561523, "global_step": 15032, "epoch": 357} {"train_loss": -5.222438335418701, "global_step": 15033, "epoch": 357} {"train_loss": -5.157978057861328, "global_step": 15034, "epoch": 357} {"train_loss": -5.210408063161941, "global_step": 15035, "epoch": 357, "val_loss": 70021.5078125} {"train_loss": -5.269631385803223, "global_step": 15036, "epoch": 358} {"train_loss": -5.137430191040039, "global_step": 15037, "epoch": 358} {"train_loss": -5.203400611877441, "global_step": 15038, "epoch": 358} {"train_loss": -5.121413230895996, "global_step": 15039, "epoch": 358} {"train_loss": -5.178248882293701, "global_step": 15040, "epoch": 358} {"train_loss": -5.204439163208008, "global_step": 15041, "epoch": 358} {"train_loss": -5.151074409484863, "global_step": 15042, "epoch": 358} {"train_loss": -5.154294967651367, "global_step": 15043, "epoch": 358} {"train_loss": -5.05985164642334, "global_step": 15044, "epoch": 358} {"train_loss": -5.18032169342041, "global_step": 15045, "epoch": 358} {"train_loss": -5.09283971786499, "global_step": 15046, "epoch": 358} {"train_loss": -5.010281562805176, "global_step": 15047, "epoch": 358} {"train_loss": -5.15519905090332, "global_step": 15048, "epoch": 358} {"train_loss": -5.120569229125977, "global_step": 15049, "epoch": 358} {"train_loss": -5.207884311676025, "global_step": 15050, "epoch": 358} {"train_loss": -5.255471229553223, "global_step": 15051, "epoch": 358} {"train_loss": -5.115025043487549, "global_step": 15052, "epoch": 358} {"train_loss": -5.200569152832031, "global_step": 15053, "epoch": 358} {"train_loss": -5.220778942108154, "global_step": 15054, "epoch": 358} {"train_loss": -5.11940860748291, "global_step": 15055, "epoch": 358} {"train_loss": -5.233526229858398, "global_step": 15056, "epoch": 358} {"train_loss": -5.165905952453613, "global_step": 15057, "epoch": 358} {"train_loss": -5.134913444519043, "global_step": 15058, "epoch": 358} {"train_loss": -5.212437629699707, "global_step": 15059, "epoch": 358} {"train_loss": -5.076333045959473, "global_step": 15060, "epoch": 358} {"train_loss": -5.258537292480469, "global_step": 15061, "epoch": 358} {"train_loss": -5.183158874511719, "global_step": 15062, "epoch": 358} {"train_loss": -5.132556915283203, "global_step": 15063, "epoch": 358} {"train_loss": -5.235991477966309, "global_step": 15064, "epoch": 358} {"train_loss": -5.125503063201904, "global_step": 15065, "epoch": 358} {"train_loss": -5.118414878845215, "global_step": 15066, "epoch": 358} {"train_loss": -5.345236301422119, "global_step": 15067, "epoch": 358} {"train_loss": -5.101839065551758, "global_step": 15068, "epoch": 358} {"train_loss": -5.304994106292725, "global_step": 15069, "epoch": 358} {"train_loss": -5.172879219055176, "global_step": 15070, "epoch": 358} {"train_loss": -5.286643028259277, "global_step": 15071, "epoch": 358} {"train_loss": -5.134320259094238, "global_step": 15072, "epoch": 358} {"train_loss": -5.116585731506348, "global_step": 15073, "epoch": 358} {"train_loss": -5.174671173095703, "global_step": 15074, "epoch": 358} {"train_loss": -5.043548583984375, "global_step": 15075, "epoch": 358} {"train_loss": -5.1366190910339355, "global_step": 15076, "epoch": 358} {"train_loss": -5.168561356408255, "global_step": 15077, "epoch": 358, "val_loss": 70194.9140625} {"train_loss": -5.135373115539551, "global_step": 15078, "epoch": 359} {"train_loss": -5.070563793182373, "global_step": 15079, "epoch": 359} {"train_loss": -5.334319114685059, "global_step": 15080, "epoch": 359} {"train_loss": -5.089164733886719, "global_step": 15081, "epoch": 359} {"train_loss": -5.079499244689941, "global_step": 15082, "epoch": 359} {"train_loss": -5.13680362701416, "global_step": 15083, "epoch": 359} {"train_loss": -5.1190185546875, "global_step": 15084, "epoch": 359} {"train_loss": -5.217584133148193, "global_step": 15085, "epoch": 359} {"train_loss": -5.133251190185547, "global_step": 15086, "epoch": 359} {"train_loss": -5.155799865722656, "global_step": 15087, "epoch": 359} {"train_loss": -5.0015974044799805, "global_step": 15088, "epoch": 359} {"train_loss": -5.101351261138916, "global_step": 15089, "epoch": 359} {"train_loss": -5.0958709716796875, "global_step": 15090, "epoch": 359} {"train_loss": -5.297544002532959, "global_step": 15091, "epoch": 359} {"train_loss": -5.1660332679748535, "global_step": 15092, "epoch": 359} {"train_loss": -5.225947380065918, "global_step": 15093, "epoch": 359} {"train_loss": -5.167247772216797, "global_step": 15094, "epoch": 359} {"train_loss": -5.194243907928467, "global_step": 15095, "epoch": 359} {"train_loss": -5.041814804077148, "global_step": 15096, "epoch": 359} {"train_loss": -5.157370567321777, "global_step": 15097, "epoch": 359} {"train_loss": -5.100731372833252, "global_step": 15098, "epoch": 359} {"train_loss": -5.342885971069336, "global_step": 15099, "epoch": 359} {"train_loss": -5.166076183319092, "global_step": 15100, "epoch": 359} {"train_loss": -5.050776958465576, "global_step": 15101, "epoch": 359} {"train_loss": -5.23881721496582, "global_step": 15102, "epoch": 359} {"train_loss": -5.040748596191406, "global_step": 15103, "epoch": 359} {"train_loss": -5.145537376403809, "global_step": 15104, "epoch": 359} {"train_loss": -5.202412128448486, "global_step": 15105, "epoch": 359} {"train_loss": -5.148201942443848, "global_step": 15106, "epoch": 359} {"train_loss": -5.142410755157471, "global_step": 15107, "epoch": 359} {"train_loss": -5.110537528991699, "global_step": 15108, "epoch": 359} {"train_loss": -5.199216842651367, "global_step": 15109, "epoch": 359} {"train_loss": -5.035445690155029, "global_step": 15110, "epoch": 359} {"train_loss": -5.04630184173584, "global_step": 15111, "epoch": 359} {"train_loss": -5.283002853393555, "global_step": 15112, "epoch": 359} {"train_loss": -5.137862205505371, "global_step": 15113, "epoch": 359} {"train_loss": -5.100295066833496, "global_step": 15114, "epoch": 359} {"train_loss": -5.176116943359375, "global_step": 15115, "epoch": 359} {"train_loss": -5.1376543045043945, "global_step": 15116, "epoch": 359} {"train_loss": -5.260702610015869, "global_step": 15117, "epoch": 359} {"train_loss": -5.113495349884033, "global_step": 15118, "epoch": 359} {"train_loss": -5.150721595400856, "global_step": 15119, "epoch": 359, "val_loss": 69948.0859375} {"train_loss": -5.02414083480835, "global_step": 15120, "epoch": 360} {"train_loss": -5.153721809387207, "global_step": 15121, "epoch": 360} {"train_loss": -5.308611869812012, "global_step": 15122, "epoch": 360} {"train_loss": -5.288387298583984, "global_step": 15123, "epoch": 360} {"train_loss": -5.30276346206665, "global_step": 15124, "epoch": 360} {"train_loss": -5.286080360412598, "global_step": 15125, "epoch": 360} {"train_loss": -5.212944984436035, "global_step": 15126, "epoch": 360} {"train_loss": -5.168437957763672, "global_step": 15127, "epoch": 360} {"train_loss": -5.211085796356201, "global_step": 15128, "epoch": 360} {"train_loss": -5.27963924407959, "global_step": 15129, "epoch": 360} {"train_loss": -5.248607635498047, "global_step": 15130, "epoch": 360} {"train_loss": -5.186849594116211, "global_step": 15131, "epoch": 360} {"train_loss": -5.366990089416504, "global_step": 15132, "epoch": 360} {"train_loss": -5.218717575073242, "global_step": 15133, "epoch": 360} {"train_loss": -4.986970901489258, "global_step": 15134, "epoch": 360} {"train_loss": -5.299896240234375, "global_step": 15135, "epoch": 360} {"train_loss": -5.166406631469727, "global_step": 15136, "epoch": 360} {"train_loss": -5.206501007080078, "global_step": 15137, "epoch": 360} {"train_loss": -5.108524322509766, "global_step": 15138, "epoch": 360} {"train_loss": -5.070062637329102, "global_step": 15139, "epoch": 360} {"train_loss": -5.276419639587402, "global_step": 15140, "epoch": 360} {"train_loss": -5.147171974182129, "global_step": 15141, "epoch": 360} {"train_loss": -5.2551703453063965, "global_step": 15142, "epoch": 360} {"train_loss": -5.159452438354492, "global_step": 15143, "epoch": 360} {"train_loss": -5.031500816345215, "global_step": 15144, "epoch": 360} {"train_loss": -5.052159786224365, "global_step": 15145, "epoch": 360} {"train_loss": -5.271425724029541, "global_step": 15146, "epoch": 360} {"train_loss": -5.282548427581787, "global_step": 15147, "epoch": 360} {"train_loss": -5.0908942222595215, "global_step": 15148, "epoch": 360} {"train_loss": -5.212790012359619, "global_step": 15149, "epoch": 360} {"train_loss": -5.2680511474609375, "global_step": 15150, "epoch": 360} {"train_loss": -5.1156511306762695, "global_step": 15151, "epoch": 360} {"train_loss": -5.122191905975342, "global_step": 15152, "epoch": 360} {"train_loss": -5.259259223937988, "global_step": 15153, "epoch": 360} {"train_loss": -5.0868425369262695, "global_step": 15154, "epoch": 360} {"train_loss": -5.125185012817383, "global_step": 15155, "epoch": 360} {"train_loss": -5.0634894371032715, "global_step": 15156, "epoch": 360} {"train_loss": -5.238670349121094, "global_step": 15157, "epoch": 360} {"train_loss": -5.192567825317383, "global_step": 15158, "epoch": 360} {"train_loss": -5.14907169342041, "global_step": 15159, "epoch": 360} {"train_loss": -5.053441047668457, "global_step": 15160, "epoch": 360} {"train_loss": -5.1822987624577115, "global_step": 15161, "epoch": 360, "val_loss": 70292.71875} {"train_loss": -5.24036169052124, "global_step": 15162, "epoch": 361} {"train_loss": -5.301121234893799, "global_step": 15163, "epoch": 361} {"train_loss": -5.120667457580566, "global_step": 15164, "epoch": 361} {"train_loss": -5.246298789978027, "global_step": 15165, "epoch": 361} {"train_loss": -5.141806602478027, "global_step": 15166, "epoch": 361} {"train_loss": -5.072737216949463, "global_step": 15167, "epoch": 361} {"train_loss": -5.2001729011535645, "global_step": 15168, "epoch": 361} {"train_loss": -5.2292609214782715, "global_step": 15169, "epoch": 361} {"train_loss": -5.286388874053955, "global_step": 15170, "epoch": 361} {"train_loss": -5.061666488647461, "global_step": 15171, "epoch": 361} {"train_loss": -5.279933452606201, "global_step": 15172, "epoch": 361} {"train_loss": -5.112990856170654, "global_step": 15173, "epoch": 361} {"train_loss": -5.192949295043945, "global_step": 15174, "epoch": 361} {"train_loss": -5.27657413482666, "global_step": 15175, "epoch": 361} {"train_loss": -4.96146297454834, "global_step": 15176, "epoch": 361} {"train_loss": -4.978772163391113, "global_step": 15177, "epoch": 361} {"train_loss": -5.196655750274658, "global_step": 15178, "epoch": 361} {"train_loss": -5.155909061431885, "global_step": 15179, "epoch": 361} {"train_loss": -5.170238494873047, "global_step": 15180, "epoch": 361} {"train_loss": -4.950596809387207, "global_step": 15181, "epoch": 361} {"train_loss": -5.073502063751221, "global_step": 15182, "epoch": 361} {"train_loss": -5.201847076416016, "global_step": 15183, "epoch": 361} {"train_loss": -5.172913074493408, "global_step": 15184, "epoch": 361} {"train_loss": -4.964419364929199, "global_step": 15185, "epoch": 361} {"train_loss": -5.089234828948975, "global_step": 15186, "epoch": 361} {"train_loss": -5.022749900817871, "global_step": 15187, "epoch": 361} {"train_loss": -5.079008102416992, "global_step": 15188, "epoch": 361} {"train_loss": -5.178272247314453, "global_step": 15189, "epoch": 361} {"train_loss": -5.153553485870361, "global_step": 15190, "epoch": 361} {"train_loss": -5.233772277832031, "global_step": 15191, "epoch": 361} {"train_loss": -5.1162109375, "global_step": 15192, "epoch": 361} {"train_loss": -5.151681423187256, "global_step": 15193, "epoch": 361} {"train_loss": -5.356076240539551, "global_step": 15194, "epoch": 361} {"train_loss": -5.200718402862549, "global_step": 15195, "epoch": 361} {"train_loss": -5.093850612640381, "global_step": 15196, "epoch": 361} {"train_loss": -5.138077735900879, "global_step": 15197, "epoch": 361} {"train_loss": -5.110340595245361, "global_step": 15198, "epoch": 361} {"train_loss": -5.2379655838012695, "global_step": 15199, "epoch": 361} {"train_loss": -5.100987434387207, "global_step": 15200, "epoch": 361} {"train_loss": -5.093329906463623, "global_step": 15201, "epoch": 361} {"train_loss": -5.210790634155273, "global_step": 15202, "epoch": 361} {"train_loss": -5.151819274539039, "global_step": 15203, "epoch": 361, "val_loss": 69639.515625} {"train_loss": -5.154794692993164, "global_step": 15204, "epoch": 362} {"train_loss": -5.357602119445801, "global_step": 15205, "epoch": 362} {"train_loss": -5.19858455657959, "global_step": 15206, "epoch": 362} {"train_loss": -5.163087368011475, "global_step": 15207, "epoch": 362} {"train_loss": -5.282934188842773, "global_step": 15208, "epoch": 362} {"train_loss": -5.152829170227051, "global_step": 15209, "epoch": 362} {"train_loss": -5.109528541564941, "global_step": 15210, "epoch": 362} {"train_loss": -5.19227409362793, "global_step": 15211, "epoch": 362} {"train_loss": -5.33685827255249, "global_step": 15212, "epoch": 362} {"train_loss": -5.128561973571777, "global_step": 15213, "epoch": 362} {"train_loss": -5.180872917175293, "global_step": 15214, "epoch": 362} {"train_loss": -5.266932010650635, "global_step": 15215, "epoch": 362} {"train_loss": -5.055986404418945, "global_step": 15216, "epoch": 362} {"train_loss": -5.141054153442383, "global_step": 15217, "epoch": 362} {"train_loss": -5.150397300720215, "global_step": 15218, "epoch": 362} {"train_loss": -5.06865930557251, "global_step": 15219, "epoch": 362} {"train_loss": -5.246562480926514, "global_step": 15220, "epoch": 362} {"train_loss": -5.178018569946289, "global_step": 15221, "epoch": 362} {"train_loss": -5.169051647186279, "global_step": 15222, "epoch": 362} {"train_loss": -5.072033882141113, "global_step": 15223, "epoch": 362} {"train_loss": -5.302071571350098, "global_step": 15224, "epoch": 362} {"train_loss": -5.123065948486328, "global_step": 15225, "epoch": 362} {"train_loss": -5.173608303070068, "global_step": 15226, "epoch": 362} {"train_loss": -5.268902778625488, "global_step": 15227, "epoch": 362} {"train_loss": -5.120002746582031, "global_step": 15228, "epoch": 362} {"train_loss": -5.192659854888916, "global_step": 15229, "epoch": 362} {"train_loss": -5.021819591522217, "global_step": 15230, "epoch": 362} {"train_loss": -5.0852155685424805, "global_step": 15231, "epoch": 362} {"train_loss": -5.163330078125, "global_step": 15232, "epoch": 362} {"train_loss": -5.13383674621582, "global_step": 15233, "epoch": 362} {"train_loss": -5.294478416442871, "global_step": 15234, "epoch": 362} {"train_loss": -5.124763488769531, "global_step": 15235, "epoch": 362} {"train_loss": -5.133273124694824, "global_step": 15236, "epoch": 362} {"train_loss": -5.263880252838135, "global_step": 15237, "epoch": 362} {"train_loss": -5.193355560302734, "global_step": 15238, "epoch": 362} {"train_loss": -5.1201982498168945, "global_step": 15239, "epoch": 362} {"train_loss": -5.336915493011475, "global_step": 15240, "epoch": 362} {"train_loss": -5.202947616577148, "global_step": 15241, "epoch": 362} {"train_loss": -5.037843704223633, "global_step": 15242, "epoch": 362} {"train_loss": -5.120957374572754, "global_step": 15243, "epoch": 362} {"train_loss": -5.127756595611572, "global_step": 15244, "epoch": 362} {"train_loss": -5.172967150097802, "global_step": 15245, "epoch": 362, "val_loss": 69885.4375} {"train_loss": -5.118741035461426, "global_step": 15246, "epoch": 363} {"train_loss": -5.213430404663086, "global_step": 15247, "epoch": 363} {"train_loss": -5.246481418609619, "global_step": 15248, "epoch": 363} {"train_loss": -5.189269065856934, "global_step": 15249, "epoch": 363} {"train_loss": -5.296759605407715, "global_step": 15250, "epoch": 363} {"train_loss": -5.011512756347656, "global_step": 15251, "epoch": 363} {"train_loss": -5.127126693725586, "global_step": 15252, "epoch": 363} {"train_loss": -5.124670028686523, "global_step": 15253, "epoch": 363} {"train_loss": -5.19657564163208, "global_step": 15254, "epoch": 363} {"train_loss": -5.254158020019531, "global_step": 15255, "epoch": 363} {"train_loss": -4.985762596130371, "global_step": 15256, "epoch": 363} {"train_loss": -5.18171501159668, "global_step": 15257, "epoch": 363} {"train_loss": -5.23882532119751, "global_step": 15258, "epoch": 363} {"train_loss": -5.171675682067871, "global_step": 15259, "epoch": 363} {"train_loss": -5.137582778930664, "global_step": 15260, "epoch": 363} {"train_loss": -5.161229610443115, "global_step": 15261, "epoch": 363} {"train_loss": -5.255676746368408, "global_step": 15262, "epoch": 363} {"train_loss": -5.159854888916016, "global_step": 15263, "epoch": 363} {"train_loss": -5.253963470458984, "global_step": 15264, "epoch": 363} {"train_loss": -5.143640518188477, "global_step": 15265, "epoch": 363} {"train_loss": -5.197870254516602, "global_step": 15266, "epoch": 363} {"train_loss": -5.143420219421387, "global_step": 15267, "epoch": 363} {"train_loss": -5.08458137512207, "global_step": 15268, "epoch": 363} {"train_loss": -5.226763725280762, "global_step": 15269, "epoch": 363} {"train_loss": -5.168147087097168, "global_step": 15270, "epoch": 363} {"train_loss": -5.041624546051025, "global_step": 15271, "epoch": 363} {"train_loss": -5.137066841125488, "global_step": 15272, "epoch": 363} {"train_loss": -5.3463873863220215, "global_step": 15273, "epoch": 363} {"train_loss": -4.9482831954956055, "global_step": 15274, "epoch": 363} {"train_loss": -5.207109451293945, "global_step": 15275, "epoch": 363} {"train_loss": -5.170368194580078, "global_step": 15276, "epoch": 363} {"train_loss": -5.016620635986328, "global_step": 15277, "epoch": 363} {"train_loss": -5.076196670532227, "global_step": 15278, "epoch": 363} {"train_loss": -5.2514328956604, "global_step": 15279, "epoch": 363} {"train_loss": -5.097102165222168, "global_step": 15280, "epoch": 363} {"train_loss": -5.194868087768555, "global_step": 15281, "epoch": 363} {"train_loss": -5.3022236824035645, "global_step": 15282, "epoch": 363} {"train_loss": -5.121111869812012, "global_step": 15283, "epoch": 363} {"train_loss": -5.1578803062438965, "global_step": 15284, "epoch": 363} {"train_loss": -5.334606170654297, "global_step": 15285, "epoch": 363} {"train_loss": -5.111326217651367, "global_step": 15286, "epoch": 363} {"train_loss": -5.165887412570772, "global_step": 15287, "epoch": 363, "val_loss": 69335.75} {"train_loss": -5.0630035400390625, "global_step": 15288, "epoch": 364} {"train_loss": -5.266966819763184, "global_step": 15289, "epoch": 364} {"train_loss": -5.252431392669678, "global_step": 15290, "epoch": 364} {"train_loss": -5.15591287612915, "global_step": 15291, "epoch": 364} {"train_loss": -5.312490463256836, "global_step": 15292, "epoch": 364} {"train_loss": -5.2295403480529785, "global_step": 15293, "epoch": 364} {"train_loss": -5.280646324157715, "global_step": 15294, "epoch": 364} {"train_loss": -5.123495578765869, "global_step": 15295, "epoch": 364} {"train_loss": -5.138603687286377, "global_step": 15296, "epoch": 364} {"train_loss": -5.205638885498047, "global_step": 15297, "epoch": 364} {"train_loss": -5.178226470947266, "global_step": 15298, "epoch": 364} {"train_loss": -5.0648627281188965, "global_step": 15299, "epoch": 364} {"train_loss": -5.183035850524902, "global_step": 15300, "epoch": 364} {"train_loss": -5.194271087646484, "global_step": 15301, "epoch": 364} {"train_loss": -5.197118282318115, "global_step": 15302, "epoch": 364} {"train_loss": -5.296545028686523, "global_step": 15303, "epoch": 364} {"train_loss": -5.109886169433594, "global_step": 15304, "epoch": 364} {"train_loss": -5.224741458892822, "global_step": 15305, "epoch": 364} {"train_loss": -5.188416957855225, "global_step": 15306, "epoch": 364} {"train_loss": -5.294602394104004, "global_step": 15307, "epoch": 364} {"train_loss": -5.174878120422363, "global_step": 15308, "epoch": 364} {"train_loss": -5.133331298828125, "global_step": 15309, "epoch": 364} {"train_loss": -5.221891403198242, "global_step": 15310, "epoch": 364} {"train_loss": -5.189386367797852, "global_step": 15311, "epoch": 364} {"train_loss": -5.298402786254883, "global_step": 15312, "epoch": 364} {"train_loss": -5.038776397705078, "global_step": 15313, "epoch": 364} {"train_loss": -5.2257795333862305, "global_step": 15314, "epoch": 364} {"train_loss": -5.171441078186035, "global_step": 15315, "epoch": 364} {"train_loss": -5.257506370544434, "global_step": 15316, "epoch": 364} {"train_loss": -5.072667598724365, "global_step": 15317, "epoch": 364} {"train_loss": -5.263954162597656, "global_step": 15318, "epoch": 364} {"train_loss": -5.3057050704956055, "global_step": 15319, "epoch": 364} {"train_loss": -5.319799423217773, "global_step": 15320, "epoch": 364} {"train_loss": -5.1673431396484375, "global_step": 15321, "epoch": 364} {"train_loss": -5.212066650390625, "global_step": 15322, "epoch": 364} {"train_loss": -5.257510185241699, "global_step": 15323, "epoch": 364} {"train_loss": -5.0046491622924805, "global_step": 15324, "epoch": 364} {"train_loss": -5.261039733886719, "global_step": 15325, "epoch": 364} {"train_loss": -5.222628593444824, "global_step": 15326, "epoch": 364} {"train_loss": -5.171276092529297, "global_step": 15327, "epoch": 364} {"train_loss": -5.323686122894287, "global_step": 15328, "epoch": 364} {"train_loss": -5.202543292726789, "global_step": 15329, "epoch": 364, "val_loss": 69876.9453125} {"train_loss": -5.202723503112793, "global_step": 15330, "epoch": 365} {"train_loss": -5.202686309814453, "global_step": 15331, "epoch": 365} {"train_loss": -5.219893455505371, "global_step": 15332, "epoch": 365} {"train_loss": -5.3379082679748535, "global_step": 15333, "epoch": 365} {"train_loss": -5.29754114151001, "global_step": 15334, "epoch": 365} {"train_loss": -5.211720943450928, "global_step": 15335, "epoch": 365} {"train_loss": -5.116548538208008, "global_step": 15336, "epoch": 365} {"train_loss": -5.275087356567383, "global_step": 15337, "epoch": 365} {"train_loss": -5.303190231323242, "global_step": 15338, "epoch": 365} {"train_loss": -5.290899276733398, "global_step": 15339, "epoch": 365} {"train_loss": -5.247018814086914, "global_step": 15340, "epoch": 365} {"train_loss": -5.1609039306640625, "global_step": 15341, "epoch": 365} {"train_loss": -5.29833459854126, "global_step": 15342, "epoch": 365} {"train_loss": -5.292991638183594, "global_step": 15343, "epoch": 365} {"train_loss": -5.229804992675781, "global_step": 15344, "epoch": 365} {"train_loss": -5.031396865844727, "global_step": 15345, "epoch": 365} {"train_loss": -5.143443584442139, "global_step": 15346, "epoch": 365} {"train_loss": -5.127008438110352, "global_step": 15347, "epoch": 365} {"train_loss": -5.201554298400879, "global_step": 15348, "epoch": 365} {"train_loss": -5.0763044357299805, "global_step": 15349, "epoch": 365} {"train_loss": -5.013505935668945, "global_step": 15350, "epoch": 365} {"train_loss": -5.227451324462891, "global_step": 15351, "epoch": 365} {"train_loss": -5.085944175720215, "global_step": 15352, "epoch": 365} {"train_loss": -4.934122562408447, "global_step": 15353, "epoch": 365} {"train_loss": -5.147218704223633, "global_step": 15354, "epoch": 365} {"train_loss": -5.0963850021362305, "global_step": 15355, "epoch": 365} {"train_loss": -4.935918807983398, "global_step": 15356, "epoch": 365} {"train_loss": -5.101798057556152, "global_step": 15357, "epoch": 365} {"train_loss": -5.101685523986816, "global_step": 15358, "epoch": 365} {"train_loss": -5.137916088104248, "global_step": 15359, "epoch": 365} {"train_loss": -5.213527679443359, "global_step": 15360, "epoch": 365} {"train_loss": -5.230226516723633, "global_step": 15361, "epoch": 365} {"train_loss": -5.2189178466796875, "global_step": 15362, "epoch": 365} {"train_loss": -5.197101593017578, "global_step": 15363, "epoch": 365} {"train_loss": -5.308056354522705, "global_step": 15364, "epoch": 365} {"train_loss": -5.11737060546875, "global_step": 15365, "epoch": 365} {"train_loss": -5.206930160522461, "global_step": 15366, "epoch": 365} {"train_loss": -5.089232444763184, "global_step": 15367, "epoch": 365} {"train_loss": -5.124351501464844, "global_step": 15368, "epoch": 365} {"train_loss": -5.089571952819824, "global_step": 15369, "epoch": 365} {"train_loss": -5.045897483825684, "global_step": 15370, "epoch": 365} {"train_loss": -5.165932371502831, "global_step": 15371, "epoch": 365, "val_loss": 69508.6796875} {"train_loss": -5.182546615600586, "global_step": 15372, "epoch": 366} {"train_loss": -5.231440544128418, "global_step": 15373, "epoch": 366} {"train_loss": -5.241462230682373, "global_step": 15374, "epoch": 366} {"train_loss": -5.165369510650635, "global_step": 15375, "epoch": 366} {"train_loss": -5.127174377441406, "global_step": 15376, "epoch": 366} {"train_loss": -5.264223098754883, "global_step": 15377, "epoch": 366} {"train_loss": -5.176608085632324, "global_step": 15378, "epoch": 366} {"train_loss": -5.297204971313477, "global_step": 15379, "epoch": 366} {"train_loss": -5.224878311157227, "global_step": 15380, "epoch": 366} {"train_loss": -5.139150619506836, "global_step": 15381, "epoch": 366} {"train_loss": -5.165004730224609, "global_step": 15382, "epoch": 366} {"train_loss": -5.19266414642334, "global_step": 15383, "epoch": 366} {"train_loss": -5.217153549194336, "global_step": 15384, "epoch": 366} {"train_loss": -5.133627891540527, "global_step": 15385, "epoch": 366} {"train_loss": -5.289702415466309, "global_step": 15386, "epoch": 366} {"train_loss": -5.3073930740356445, "global_step": 15387, "epoch": 366} {"train_loss": -5.202197551727295, "global_step": 15388, "epoch": 366} {"train_loss": -5.321711540222168, "global_step": 15389, "epoch": 366} {"train_loss": -5.275776386260986, "global_step": 15390, "epoch": 366} {"train_loss": -5.132353782653809, "global_step": 15391, "epoch": 366} {"train_loss": -5.145759582519531, "global_step": 15392, "epoch": 366} {"train_loss": -5.149724006652832, "global_step": 15393, "epoch": 366} {"train_loss": -5.118481636047363, "global_step": 15394, "epoch": 366} {"train_loss": -5.123352527618408, "global_step": 15395, "epoch": 366} {"train_loss": -5.139822006225586, "global_step": 15396, "epoch": 366} {"train_loss": -5.132457733154297, "global_step": 15397, "epoch": 366} {"train_loss": -5.172239303588867, "global_step": 15398, "epoch": 366} {"train_loss": -5.140552520751953, "global_step": 15399, "epoch": 366} {"train_loss": -5.264756202697754, "global_step": 15400, "epoch": 366} {"train_loss": -5.298249244689941, "global_step": 15401, "epoch": 366} {"train_loss": -5.089540004730225, "global_step": 15402, "epoch": 366} {"train_loss": -5.260990142822266, "global_step": 15403, "epoch": 366} {"train_loss": -5.096776962280273, "global_step": 15404, "epoch": 366} {"train_loss": -5.244580268859863, "global_step": 15405, "epoch": 366} {"train_loss": -5.251031875610352, "global_step": 15406, "epoch": 366} {"train_loss": -5.264298439025879, "global_step": 15407, "epoch": 366} {"train_loss": -5.09170389175415, "global_step": 15408, "epoch": 366} {"train_loss": -5.260855674743652, "global_step": 15409, "epoch": 366} {"train_loss": -5.16534948348999, "global_step": 15410, "epoch": 366} {"train_loss": -5.253438472747803, "global_step": 15411, "epoch": 366} {"train_loss": -5.28092098236084, "global_step": 15412, "epoch": 366} {"train_loss": -5.200699034191313, "global_step": 15413, "epoch": 366, "val_loss": 69545.0625} {"train_loss": -5.124913692474365, "global_step": 15414, "epoch": 367} {"train_loss": -5.26128625869751, "global_step": 15415, "epoch": 367} {"train_loss": -5.193364143371582, "global_step": 15416, "epoch": 367} {"train_loss": -5.1473894119262695, "global_step": 15417, "epoch": 367} {"train_loss": -5.095221996307373, "global_step": 15418, "epoch": 367} {"train_loss": -5.18359375, "global_step": 15419, "epoch": 367} {"train_loss": -5.145586967468262, "global_step": 15420, "epoch": 367} {"train_loss": -5.042661666870117, "global_step": 15421, "epoch": 367} {"train_loss": -5.211773872375488, "global_step": 15422, "epoch": 367} {"train_loss": -5.228663444519043, "global_step": 15423, "epoch": 367} {"train_loss": -5.235593795776367, "global_step": 15424, "epoch": 367} {"train_loss": -5.246630668640137, "global_step": 15425, "epoch": 367} {"train_loss": -5.157546043395996, "global_step": 15426, "epoch": 367} {"train_loss": -5.236078262329102, "global_step": 15427, "epoch": 367} {"train_loss": -5.297572135925293, "global_step": 15428, "epoch": 367} {"train_loss": -5.260661602020264, "global_step": 15429, "epoch": 367} {"train_loss": -5.093393325805664, "global_step": 15430, "epoch": 367} {"train_loss": -5.250178813934326, "global_step": 15431, "epoch": 367} {"train_loss": -5.128823757171631, "global_step": 15432, "epoch": 367} {"train_loss": -5.164901256561279, "global_step": 15433, "epoch": 367} {"train_loss": -5.121457099914551, "global_step": 15434, "epoch": 367} {"train_loss": -5.213171005249023, "global_step": 15435, "epoch": 367} {"train_loss": -5.196717739105225, "global_step": 15436, "epoch": 367} {"train_loss": -5.204679012298584, "global_step": 15437, "epoch": 367} {"train_loss": -5.14908504486084, "global_step": 15438, "epoch": 367} {"train_loss": -5.241176605224609, "global_step": 15439, "epoch": 367} {"train_loss": -5.348362445831299, "global_step": 15440, "epoch": 367} {"train_loss": -5.181241512298584, "global_step": 15441, "epoch": 367} {"train_loss": -5.149112701416016, "global_step": 15442, "epoch": 367} {"train_loss": -5.257777690887451, "global_step": 15443, "epoch": 367} {"train_loss": -5.071846961975098, "global_step": 15444, "epoch": 367} {"train_loss": -5.268193244934082, "global_step": 15445, "epoch": 367} {"train_loss": -5.059048652648926, "global_step": 15446, "epoch": 367} {"train_loss": -5.16762638092041, "global_step": 15447, "epoch": 367} {"train_loss": -5.343517780303955, "global_step": 15448, "epoch": 367} {"train_loss": -5.159594535827637, "global_step": 15449, "epoch": 367} {"train_loss": -5.132478713989258, "global_step": 15450, "epoch": 367} {"train_loss": -5.430316925048828, "global_step": 15451, "epoch": 367} {"train_loss": -5.233736991882324, "global_step": 15452, "epoch": 367} {"train_loss": -5.0921711921691895, "global_step": 15453, "epoch": 367} {"train_loss": -5.234775543212891, "global_step": 15454, "epoch": 367} {"train_loss": -5.197581972394671, "global_step": 15455, "epoch": 367, "val_loss": 70441.5859375} {"train_loss": -5.124688148498535, "global_step": 15456, "epoch": 368} {"train_loss": -5.199840545654297, "global_step": 15457, "epoch": 368} {"train_loss": -5.129489421844482, "global_step": 15458, "epoch": 368} {"train_loss": -5.1474199295043945, "global_step": 15459, "epoch": 368} {"train_loss": -5.308205604553223, "global_step": 15460, "epoch": 368} {"train_loss": -5.311477184295654, "global_step": 15461, "epoch": 368} {"train_loss": -5.180882453918457, "global_step": 15462, "epoch": 368} {"train_loss": -5.193606376647949, "global_step": 15463, "epoch": 368} {"train_loss": -4.948601722717285, "global_step": 15464, "epoch": 368} {"train_loss": -5.293283462524414, "global_step": 15465, "epoch": 368} {"train_loss": -5.196300029754639, "global_step": 15466, "epoch": 368} {"train_loss": -5.124756813049316, "global_step": 15467, "epoch": 368} {"train_loss": -5.266661643981934, "global_step": 15468, "epoch": 368} {"train_loss": -5.064884185791016, "global_step": 15469, "epoch": 368} {"train_loss": -5.2151618003845215, "global_step": 15470, "epoch": 368} {"train_loss": -5.29264497756958, "global_step": 15471, "epoch": 368} {"train_loss": -5.226083755493164, "global_step": 15472, "epoch": 368} {"train_loss": -5.1474103927612305, "global_step": 15473, "epoch": 368} {"train_loss": -5.255982875823975, "global_step": 15474, "epoch": 368} {"train_loss": -5.13065242767334, "global_step": 15475, "epoch": 368} {"train_loss": -5.104382038116455, "global_step": 15476, "epoch": 368} {"train_loss": -5.265030860900879, "global_step": 15477, "epoch": 368} {"train_loss": -5.137125015258789, "global_step": 15478, "epoch": 368} {"train_loss": -5.150337219238281, "global_step": 15479, "epoch": 368} {"train_loss": -5.143059730529785, "global_step": 15480, "epoch": 368} {"train_loss": -5.147607803344727, "global_step": 15481, "epoch": 368} {"train_loss": -5.175446510314941, "global_step": 15482, "epoch": 368} {"train_loss": -5.24348783493042, "global_step": 15483, "epoch": 368} {"train_loss": -5.064145565032959, "global_step": 15484, "epoch": 368} {"train_loss": -5.164448261260986, "global_step": 15485, "epoch": 368} {"train_loss": -5.209600448608398, "global_step": 15486, "epoch": 368} {"train_loss": -5.3416428565979, "global_step": 15487, "epoch": 368} {"train_loss": -5.243688106536865, "global_step": 15488, "epoch": 368} {"train_loss": -5.273114204406738, "global_step": 15489, "epoch": 368} {"train_loss": -5.203621864318848, "global_step": 15490, "epoch": 368} {"train_loss": -5.166043281555176, "global_step": 15491, "epoch": 368} {"train_loss": -5.102703094482422, "global_step": 15492, "epoch": 368} {"train_loss": -5.172170639038086, "global_step": 15493, "epoch": 368} {"train_loss": -5.2213544845581055, "global_step": 15494, "epoch": 368} {"train_loss": -5.099697113037109, "global_step": 15495, "epoch": 368} {"train_loss": -5.275482654571533, "global_step": 15496, "epoch": 368} {"train_loss": -5.183379581996372, "global_step": 15497, "epoch": 368, "val_loss": 70274.375} {"train_loss": -5.017576217651367, "global_step": 15498, "epoch": 369} {"train_loss": -5.34251070022583, "global_step": 15499, "epoch": 369} {"train_loss": -5.047643661499023, "global_step": 15500, "epoch": 369} {"train_loss": -5.005623817443848, "global_step": 15501, "epoch": 369} {"train_loss": -5.329552173614502, "global_step": 15502, "epoch": 369} {"train_loss": -5.0912580490112305, "global_step": 15503, "epoch": 369} {"train_loss": -5.066461563110352, "global_step": 15504, "epoch": 369} {"train_loss": -5.195723056793213, "global_step": 15505, "epoch": 369} {"train_loss": -5.1896796226501465, "global_step": 15506, "epoch": 369} {"train_loss": -5.168344020843506, "global_step": 15507, "epoch": 369} {"train_loss": -5.050515174865723, "global_step": 15508, "epoch": 369} {"train_loss": -5.1087727546691895, "global_step": 15509, "epoch": 369} {"train_loss": -5.272042751312256, "global_step": 15510, "epoch": 369} {"train_loss": -5.122590065002441, "global_step": 15511, "epoch": 369} {"train_loss": -5.284286022186279, "global_step": 15512, "epoch": 369} {"train_loss": -5.193504333496094, "global_step": 15513, "epoch": 369} {"train_loss": -5.187279224395752, "global_step": 15514, "epoch": 369} {"train_loss": -5.208343029022217, "global_step": 15515, "epoch": 369} {"train_loss": -5.309798717498779, "global_step": 15516, "epoch": 369} {"train_loss": -5.2956061363220215, "global_step": 15517, "epoch": 369} {"train_loss": -5.281243324279785, "global_step": 15518, "epoch": 369} {"train_loss": -5.276203155517578, "global_step": 15519, "epoch": 369} {"train_loss": -5.208034992218018, "global_step": 15520, "epoch": 369} {"train_loss": -5.221560955047607, "global_step": 15521, "epoch": 369} {"train_loss": -5.171534538269043, "global_step": 15522, "epoch": 369} {"train_loss": -5.165194511413574, "global_step": 15523, "epoch": 369} {"train_loss": -5.263629913330078, "global_step": 15524, "epoch": 369} {"train_loss": -5.211589813232422, "global_step": 15525, "epoch": 369} {"train_loss": -5.222479820251465, "global_step": 15526, "epoch": 369} {"train_loss": -5.222092151641846, "global_step": 15527, "epoch": 369} {"train_loss": -5.188775062561035, "global_step": 15528, "epoch": 369} {"train_loss": -5.200057506561279, "global_step": 15529, "epoch": 369} {"train_loss": -5.096160888671875, "global_step": 15530, "epoch": 369} {"train_loss": -5.119581699371338, "global_step": 15531, "epoch": 369} {"train_loss": -5.137541770935059, "global_step": 15532, "epoch": 369} {"train_loss": -5.014317512512207, "global_step": 15533, "epoch": 369} {"train_loss": -5.166014194488525, "global_step": 15534, "epoch": 369} {"train_loss": -5.176887035369873, "global_step": 15535, "epoch": 369} {"train_loss": -5.208118438720703, "global_step": 15536, "epoch": 369} {"train_loss": -5.032528877258301, "global_step": 15537, "epoch": 369} {"train_loss": -5.112583637237549, "global_step": 15538, "epoch": 369} {"train_loss": -5.1770516236623125, "global_step": 15539, "epoch": 369, "val_loss": 70086.03125} {"train_loss": -5.1292033195495605, "global_step": 15540, "epoch": 370} {"train_loss": -5.17131233215332, "global_step": 15541, "epoch": 370} {"train_loss": -5.161828994750977, "global_step": 15542, "epoch": 370} {"train_loss": -5.141207218170166, "global_step": 15543, "epoch": 370} {"train_loss": -5.224435806274414, "global_step": 15544, "epoch": 370} {"train_loss": -5.088752746582031, "global_step": 15545, "epoch": 370} {"train_loss": -5.240464210510254, "global_step": 15546, "epoch": 370} {"train_loss": -5.347477436065674, "global_step": 15547, "epoch": 370} {"train_loss": -5.155707359313965, "global_step": 15548, "epoch": 370} {"train_loss": -5.085936546325684, "global_step": 15549, "epoch": 370} {"train_loss": -5.18350887298584, "global_step": 15550, "epoch": 370} {"train_loss": -5.200014114379883, "global_step": 15551, "epoch": 370} {"train_loss": -5.137925148010254, "global_step": 15552, "epoch": 370} {"train_loss": -5.080171585083008, "global_step": 15553, "epoch": 370} {"train_loss": -5.100611686706543, "global_step": 15554, "epoch": 370} {"train_loss": -5.16357421875, "global_step": 15555, "epoch": 370} {"train_loss": -5.181654930114746, "global_step": 15556, "epoch": 370} {"train_loss": -5.132955551147461, "global_step": 15557, "epoch": 370} {"train_loss": -5.188162803649902, "global_step": 15558, "epoch": 370} {"train_loss": -5.319094657897949, "global_step": 15559, "epoch": 370} {"train_loss": -5.06494140625, "global_step": 15560, "epoch": 370} {"train_loss": -5.182447910308838, "global_step": 15561, "epoch": 370} {"train_loss": -5.333407402038574, "global_step": 15562, "epoch": 370} {"train_loss": -5.030544757843018, "global_step": 15563, "epoch": 370} {"train_loss": -5.023453712463379, "global_step": 15564, "epoch": 370} {"train_loss": -5.3123459815979, "global_step": 15565, "epoch": 370} {"train_loss": -4.995021820068359, "global_step": 15566, "epoch": 370} {"train_loss": -5.222524642944336, "global_step": 15567, "epoch": 370} {"train_loss": -5.209162712097168, "global_step": 15568, "epoch": 370} {"train_loss": -4.918857574462891, "global_step": 15569, "epoch": 370} {"train_loss": -5.198423385620117, "global_step": 15570, "epoch": 370} {"train_loss": -5.208105087280273, "global_step": 15571, "epoch": 370} {"train_loss": -4.947784423828125, "global_step": 15572, "epoch": 370} {"train_loss": -5.257922172546387, "global_step": 15573, "epoch": 370} {"train_loss": -5.053455352783203, "global_step": 15574, "epoch": 370} {"train_loss": -5.086789131164551, "global_step": 15575, "epoch": 370} {"train_loss": -5.143685340881348, "global_step": 15576, "epoch": 370} {"train_loss": -5.156803131103516, "global_step": 15577, "epoch": 370} {"train_loss": -5.2353105545043945, "global_step": 15578, "epoch": 370} {"train_loss": -5.116776943206787, "global_step": 15579, "epoch": 370} {"train_loss": -5.110479354858398, "global_step": 15580, "epoch": 370} {"train_loss": -5.152513424555461, "global_step": 15581, "epoch": 370, "val_loss": 69963.390625} {"train_loss": -5.1251020431518555, "global_step": 15582, "epoch": 371} {"train_loss": -5.153940200805664, "global_step": 15583, "epoch": 371} {"train_loss": -5.127877235412598, "global_step": 15584, "epoch": 371} {"train_loss": -5.2819318771362305, "global_step": 15585, "epoch": 371} {"train_loss": -5.072723388671875, "global_step": 15586, "epoch": 371} {"train_loss": -5.210837364196777, "global_step": 15587, "epoch": 371} {"train_loss": -5.167448043823242, "global_step": 15588, "epoch": 371} {"train_loss": -5.154166221618652, "global_step": 15589, "epoch": 371} {"train_loss": -5.184809684753418, "global_step": 15590, "epoch": 371} {"train_loss": -5.214788436889648, "global_step": 15591, "epoch": 371} {"train_loss": -5.232388019561768, "global_step": 15592, "epoch": 371} {"train_loss": -5.30573034286499, "global_step": 15593, "epoch": 371} {"train_loss": -5.147225379943848, "global_step": 15594, "epoch": 371} {"train_loss": -5.212366104125977, "global_step": 15595, "epoch": 371} {"train_loss": -5.158825397491455, "global_step": 15596, "epoch": 371} {"train_loss": -5.083165168762207, "global_step": 15597, "epoch": 371} {"train_loss": -5.234283447265625, "global_step": 15598, "epoch": 371} {"train_loss": -5.253791809082031, "global_step": 15599, "epoch": 371} {"train_loss": -5.248179912567139, "global_step": 15600, "epoch": 371} {"train_loss": -5.039035320281982, "global_step": 15601, "epoch": 371} {"train_loss": -5.162239074707031, "global_step": 15602, "epoch": 371} {"train_loss": -5.250764846801758, "global_step": 15603, "epoch": 371} {"train_loss": -5.2371978759765625, "global_step": 15604, "epoch": 371} {"train_loss": -5.364865779876709, "global_step": 15605, "epoch": 371} {"train_loss": -5.219768524169922, "global_step": 15606, "epoch": 371} {"train_loss": -5.142251014709473, "global_step": 15607, "epoch": 371} {"train_loss": -5.275390625, "global_step": 15608, "epoch": 371} {"train_loss": -5.108725547790527, "global_step": 15609, "epoch": 371} {"train_loss": -5.185732841491699, "global_step": 15610, "epoch": 371} {"train_loss": -5.203834533691406, "global_step": 15611, "epoch": 371} {"train_loss": -5.2223358154296875, "global_step": 15612, "epoch": 371} {"train_loss": -5.187079429626465, "global_step": 15613, "epoch": 371} {"train_loss": -5.0970072746276855, "global_step": 15614, "epoch": 371} {"train_loss": -5.228801727294922, "global_step": 15615, "epoch": 371} {"train_loss": -5.175833702087402, "global_step": 15616, "epoch": 371} {"train_loss": -5.238753318786621, "global_step": 15617, "epoch": 371} {"train_loss": -5.286501884460449, "global_step": 15618, "epoch": 371} {"train_loss": -5.136761665344238, "global_step": 15619, "epoch": 371} {"train_loss": -5.20255184173584, "global_step": 15620, "epoch": 371} {"train_loss": -5.213573932647705, "global_step": 15621, "epoch": 371} {"train_loss": -5.303579330444336, "global_step": 15622, "epoch": 371} {"train_loss": -5.197182712100801, "global_step": 15623, "epoch": 371, "val_loss": 69656.125} {"train_loss": -5.226780414581299, "global_step": 15624, "epoch": 372} {"train_loss": -5.27888298034668, "global_step": 15625, "epoch": 372} {"train_loss": -5.191361427307129, "global_step": 15626, "epoch": 372} {"train_loss": -5.176130294799805, "global_step": 15627, "epoch": 372} {"train_loss": -5.266674041748047, "global_step": 15628, "epoch": 372} {"train_loss": -5.180047035217285, "global_step": 15629, "epoch": 372} {"train_loss": -5.241804122924805, "global_step": 15630, "epoch": 372} {"train_loss": -5.271422386169434, "global_step": 15631, "epoch": 372} {"train_loss": -5.208230972290039, "global_step": 15632, "epoch": 372} {"train_loss": -5.087360382080078, "global_step": 15633, "epoch": 372} {"train_loss": -5.249917984008789, "global_step": 15634, "epoch": 372} {"train_loss": -5.1891279220581055, "global_step": 15635, "epoch": 372} {"train_loss": -5.178414344787598, "global_step": 15636, "epoch": 372} {"train_loss": -5.285484313964844, "global_step": 15637, "epoch": 372} {"train_loss": -5.166386604309082, "global_step": 15638, "epoch": 372} {"train_loss": -5.208027362823486, "global_step": 15639, "epoch": 372} {"train_loss": -5.235037326812744, "global_step": 15640, "epoch": 372} {"train_loss": -5.260720252990723, "global_step": 15641, "epoch": 372} {"train_loss": -5.133417129516602, "global_step": 15642, "epoch": 372} {"train_loss": -5.258369445800781, "global_step": 15643, "epoch": 372} {"train_loss": -5.234090805053711, "global_step": 15644, "epoch": 372} {"train_loss": -5.311746597290039, "global_step": 15645, "epoch": 372} {"train_loss": -5.110580921173096, "global_step": 15646, "epoch": 372} {"train_loss": -5.1739726066589355, "global_step": 15647, "epoch": 372} {"train_loss": -5.297386646270752, "global_step": 15648, "epoch": 372} {"train_loss": -5.3977813720703125, "global_step": 15649, "epoch": 372} {"train_loss": -5.255072593688965, "global_step": 15650, "epoch": 372} {"train_loss": -5.230273723602295, "global_step": 15651, "epoch": 372} {"train_loss": -5.173550605773926, "global_step": 15652, "epoch": 372} {"train_loss": -5.244425296783447, "global_step": 15653, "epoch": 372} {"train_loss": -5.186578750610352, "global_step": 15654, "epoch": 372} {"train_loss": -5.057683944702148, "global_step": 15655, "epoch": 372} {"train_loss": -5.376940727233887, "global_step": 15656, "epoch": 372} {"train_loss": -5.225945472717285, "global_step": 15657, "epoch": 372} {"train_loss": -5.26692008972168, "global_step": 15658, "epoch": 372} {"train_loss": -5.262490272521973, "global_step": 15659, "epoch": 372} {"train_loss": -5.3832244873046875, "global_step": 15660, "epoch": 372} {"train_loss": -5.1632256507873535, "global_step": 15661, "epoch": 372} {"train_loss": -5.213563919067383, "global_step": 15662, "epoch": 372} {"train_loss": -5.100345134735107, "global_step": 15663, "epoch": 372} {"train_loss": -5.304262161254883, "global_step": 15664, "epoch": 372} {"train_loss": -5.221092519306001, "global_step": 15665, "epoch": 372, "val_loss": 69931.6015625} {"train_loss": -5.1758599281311035, "global_step": 15666, "epoch": 373} {"train_loss": -5.166858673095703, "global_step": 15667, "epoch": 373} {"train_loss": -5.309859752655029, "global_step": 15668, "epoch": 373} {"train_loss": -5.206756591796875, "global_step": 15669, "epoch": 373} {"train_loss": -5.11624813079834, "global_step": 15670, "epoch": 373} {"train_loss": -5.204287528991699, "global_step": 15671, "epoch": 373} {"train_loss": -5.250297546386719, "global_step": 15672, "epoch": 373} {"train_loss": -5.309295654296875, "global_step": 15673, "epoch": 373} {"train_loss": -5.281444549560547, "global_step": 15674, "epoch": 373} {"train_loss": -5.183941841125488, "global_step": 15675, "epoch": 373} {"train_loss": -5.163082122802734, "global_step": 15676, "epoch": 373} {"train_loss": -5.162707328796387, "global_step": 15677, "epoch": 373} {"train_loss": -5.239383697509766, "global_step": 15678, "epoch": 373} {"train_loss": -5.2374067306518555, "global_step": 15679, "epoch": 373} {"train_loss": -5.138487815856934, "global_step": 15680, "epoch": 373} {"train_loss": -5.292632102966309, "global_step": 15681, "epoch": 373} {"train_loss": -5.298458099365234, "global_step": 15682, "epoch": 373} {"train_loss": -5.1903300285339355, "global_step": 15683, "epoch": 373} {"train_loss": -5.204596042633057, "global_step": 15684, "epoch": 373} {"train_loss": -5.1349663734436035, "global_step": 15685, "epoch": 373} {"train_loss": -5.183699607849121, "global_step": 15686, "epoch": 373} {"train_loss": -5.2147979736328125, "global_step": 15687, "epoch": 373} {"train_loss": -5.095033645629883, "global_step": 15688, "epoch": 373} {"train_loss": -5.271839618682861, "global_step": 15689, "epoch": 373} {"train_loss": -5.054325103759766, "global_step": 15690, "epoch": 373} {"train_loss": -5.121578216552734, "global_step": 15691, "epoch": 373} {"train_loss": -5.245273113250732, "global_step": 15692, "epoch": 373} {"train_loss": -5.0830793380737305, "global_step": 15693, "epoch": 373} {"train_loss": -5.193629264831543, "global_step": 15694, "epoch": 373} {"train_loss": -5.252468109130859, "global_step": 15695, "epoch": 373} {"train_loss": -5.083010673522949, "global_step": 15696, "epoch": 373} {"train_loss": -5.0815629959106445, "global_step": 15697, "epoch": 373} {"train_loss": -5.149012565612793, "global_step": 15698, "epoch": 373} {"train_loss": -5.169035911560059, "global_step": 15699, "epoch": 373} {"train_loss": -4.964847564697266, "global_step": 15700, "epoch": 373} {"train_loss": -5.2476654052734375, "global_step": 15701, "epoch": 373} {"train_loss": -5.262639999389648, "global_step": 15702, "epoch": 373} {"train_loss": -5.03742790222168, "global_step": 15703, "epoch": 373} {"train_loss": -5.23512601852417, "global_step": 15704, "epoch": 373} {"train_loss": -5.242776870727539, "global_step": 15705, "epoch": 373} {"train_loss": -5.22374153137207, "global_step": 15706, "epoch": 373} {"train_loss": -5.191664218902588, "global_step": 15707, "epoch": 373, "val_loss": 69741.7265625} {"train_loss": -5.182623863220215, "global_step": 15708, "epoch": 374} {"train_loss": -5.130638599395752, "global_step": 15709, "epoch": 374} {"train_loss": -5.291294574737549, "global_step": 15710, "epoch": 374} {"train_loss": -5.233330726623535, "global_step": 15711, "epoch": 374} {"train_loss": -5.081685543060303, "global_step": 15712, "epoch": 374} {"train_loss": -5.174289703369141, "global_step": 15713, "epoch": 374} {"train_loss": -5.2986040115356445, "global_step": 15714, "epoch": 374} {"train_loss": -5.260003089904785, "global_step": 15715, "epoch": 374} {"train_loss": -5.250772476196289, "global_step": 15716, "epoch": 374} {"train_loss": -5.080167770385742, "global_step": 15717, "epoch": 374} {"train_loss": -5.24757719039917, "global_step": 15718, "epoch": 374} {"train_loss": -5.262093544006348, "global_step": 15719, "epoch": 374} {"train_loss": -5.163300514221191, "global_step": 15720, "epoch": 374} {"train_loss": -5.257232189178467, "global_step": 15721, "epoch": 374} {"train_loss": -5.197425842285156, "global_step": 15722, "epoch": 374} {"train_loss": -5.088476181030273, "global_step": 15723, "epoch": 374} {"train_loss": -5.282960414886475, "global_step": 15724, "epoch": 374} {"train_loss": -5.19111442565918, "global_step": 15725, "epoch": 374} {"train_loss": -5.315370559692383, "global_step": 15726, "epoch": 374} {"train_loss": -5.020102024078369, "global_step": 15727, "epoch": 374} {"train_loss": -4.982067108154297, "global_step": 15728, "epoch": 374} {"train_loss": -5.2279558181762695, "global_step": 15729, "epoch": 374} {"train_loss": -5.2277116775512695, "global_step": 15730, "epoch": 374} {"train_loss": -5.157732009887695, "global_step": 15731, "epoch": 374} {"train_loss": -5.316489219665527, "global_step": 15732, "epoch": 374} {"train_loss": -5.2527546882629395, "global_step": 15733, "epoch": 374} {"train_loss": -5.006007194519043, "global_step": 15734, "epoch": 374} {"train_loss": -5.253591537475586, "global_step": 15735, "epoch": 374} {"train_loss": -5.052995681762695, "global_step": 15736, "epoch": 374} {"train_loss": -5.184257507324219, "global_step": 15737, "epoch": 374} {"train_loss": -5.151240348815918, "global_step": 15738, "epoch": 374} {"train_loss": -5.225100994110107, "global_step": 15739, "epoch": 374} {"train_loss": -5.322813034057617, "global_step": 15740, "epoch": 374} {"train_loss": -5.1112236976623535, "global_step": 15741, "epoch": 374} {"train_loss": -5.256531715393066, "global_step": 15742, "epoch": 374} {"train_loss": -5.263864517211914, "global_step": 15743, "epoch": 374} {"train_loss": -5.038273334503174, "global_step": 15744, "epoch": 374} {"train_loss": -5.298322677612305, "global_step": 15745, "epoch": 374} {"train_loss": -5.190607070922852, "global_step": 15746, "epoch": 374} {"train_loss": -5.340576171875, "global_step": 15747, "epoch": 374} {"train_loss": -5.3269195556640625, "global_step": 15748, "epoch": 374} {"train_loss": -5.198141994930449, "global_step": 15749, "epoch": 374, "val_loss": 69629.4140625} {"train_loss": -5.1910719871521, "global_step": 15750, "epoch": 375} {"train_loss": -5.251189708709717, "global_step": 15751, "epoch": 375} {"train_loss": -5.176342964172363, "global_step": 15752, "epoch": 375} {"train_loss": -5.137502670288086, "global_step": 15753, "epoch": 375} {"train_loss": -5.217110633850098, "global_step": 15754, "epoch": 375} {"train_loss": -5.343934059143066, "global_step": 15755, "epoch": 375} {"train_loss": -5.095633506774902, "global_step": 15756, "epoch": 375} {"train_loss": -5.030561447143555, "global_step": 15757, "epoch": 375} {"train_loss": -5.261369228363037, "global_step": 15758, "epoch": 375} {"train_loss": -5.329937934875488, "global_step": 15759, "epoch": 375} {"train_loss": -5.111522674560547, "global_step": 15760, "epoch": 375} {"train_loss": -5.081104278564453, "global_step": 15761, "epoch": 375} {"train_loss": -5.289399147033691, "global_step": 15762, "epoch": 375} {"train_loss": -5.128568649291992, "global_step": 15763, "epoch": 375} {"train_loss": -5.066433429718018, "global_step": 15764, "epoch": 375} {"train_loss": -5.185733795166016, "global_step": 15765, "epoch": 375} {"train_loss": -5.307548522949219, "global_step": 15766, "epoch": 375} {"train_loss": -5.059520244598389, "global_step": 15767, "epoch": 375} {"train_loss": -5.259889602661133, "global_step": 15768, "epoch": 375} {"train_loss": -5.329169750213623, "global_step": 15769, "epoch": 375} {"train_loss": -5.296908378601074, "global_step": 15770, "epoch": 375} {"train_loss": -5.238891124725342, "global_step": 15771, "epoch": 375} {"train_loss": -5.309032440185547, "global_step": 15772, "epoch": 375} {"train_loss": -5.2219390869140625, "global_step": 15773, "epoch": 375} {"train_loss": -5.187681198120117, "global_step": 15774, "epoch": 375} {"train_loss": -5.278844833374023, "global_step": 15775, "epoch": 375} {"train_loss": -5.113681793212891, "global_step": 15776, "epoch": 375} {"train_loss": -5.205362319946289, "global_step": 15777, "epoch": 375} {"train_loss": -5.179096221923828, "global_step": 15778, "epoch": 375} {"train_loss": -5.199132919311523, "global_step": 15779, "epoch": 375} {"train_loss": -5.24263334274292, "global_step": 15780, "epoch": 375} {"train_loss": -5.102667808532715, "global_step": 15781, "epoch": 375} {"train_loss": -5.263615131378174, "global_step": 15782, "epoch": 375} {"train_loss": -5.294323921203613, "global_step": 15783, "epoch": 375} {"train_loss": -5.260973930358887, "global_step": 15784, "epoch": 375} {"train_loss": -5.225829601287842, "global_step": 15785, "epoch": 375} {"train_loss": -5.259549140930176, "global_step": 15786, "epoch": 375} {"train_loss": -5.0796403884887695, "global_step": 15787, "epoch": 375} {"train_loss": -5.302350997924805, "global_step": 15788, "epoch": 375} {"train_loss": -5.195852279663086, "global_step": 15789, "epoch": 375} {"train_loss": -5.235342025756836, "global_step": 15790, "epoch": 375} {"train_loss": -5.207784016927083, "global_step": 15791, "epoch": 375, "val_loss": 69487.75} {"train_loss": -5.353577136993408, "global_step": 15792, "epoch": 376} {"train_loss": -5.15895938873291, "global_step": 15793, "epoch": 376} {"train_loss": -5.042361736297607, "global_step": 15794, "epoch": 376} {"train_loss": -5.263997554779053, "global_step": 15795, "epoch": 376} {"train_loss": -5.070556163787842, "global_step": 15796, "epoch": 376} {"train_loss": -5.301414489746094, "global_step": 15797, "epoch": 376} {"train_loss": -5.211827278137207, "global_step": 15798, "epoch": 376} {"train_loss": -5.21502685546875, "global_step": 15799, "epoch": 376} {"train_loss": -5.180583477020264, "global_step": 15800, "epoch": 376} {"train_loss": -5.286561012268066, "global_step": 15801, "epoch": 376} {"train_loss": -5.239595890045166, "global_step": 15802, "epoch": 376} {"train_loss": -5.106113910675049, "global_step": 15803, "epoch": 376} {"train_loss": -5.312788963317871, "global_step": 15804, "epoch": 376} {"train_loss": -5.173023223876953, "global_step": 15805, "epoch": 376} {"train_loss": -5.295608043670654, "global_step": 15806, "epoch": 376} {"train_loss": -5.160159587860107, "global_step": 15807, "epoch": 376} {"train_loss": -5.176230430603027, "global_step": 15808, "epoch": 376} {"train_loss": -5.0980377197265625, "global_step": 15809, "epoch": 376} {"train_loss": -5.192829608917236, "global_step": 15810, "epoch": 376} {"train_loss": -5.367181777954102, "global_step": 15811, "epoch": 376} {"train_loss": -5.189915657043457, "global_step": 15812, "epoch": 376} {"train_loss": -5.250786781311035, "global_step": 15813, "epoch": 376} {"train_loss": -5.204853057861328, "global_step": 15814, "epoch": 376} {"train_loss": -5.352163314819336, "global_step": 15815, "epoch": 376} {"train_loss": -5.232961654663086, "global_step": 15816, "epoch": 376} {"train_loss": -5.129961013793945, "global_step": 15817, "epoch": 376} {"train_loss": -5.300675868988037, "global_step": 15818, "epoch": 376} {"train_loss": -5.036545276641846, "global_step": 15819, "epoch": 376} {"train_loss": -5.21455717086792, "global_step": 15820, "epoch": 376} {"train_loss": -5.07447624206543, "global_step": 15821, "epoch": 376} {"train_loss": -5.069727897644043, "global_step": 15822, "epoch": 376} {"train_loss": -5.176979064941406, "global_step": 15823, "epoch": 376} {"train_loss": -5.339230060577393, "global_step": 15824, "epoch": 376} {"train_loss": -5.2518720626831055, "global_step": 15825, "epoch": 376} {"train_loss": -5.07999324798584, "global_step": 15826, "epoch": 376} {"train_loss": -5.235955715179443, "global_step": 15827, "epoch": 376} {"train_loss": -5.159899711608887, "global_step": 15828, "epoch": 376} {"train_loss": -5.183876991271973, "global_step": 15829, "epoch": 376} {"train_loss": -5.212244033813477, "global_step": 15830, "epoch": 376} {"train_loss": -5.258542060852051, "global_step": 15831, "epoch": 376} {"train_loss": -5.210689544677734, "global_step": 15832, "epoch": 376} {"train_loss": -5.203906127384731, "global_step": 15833, "epoch": 376, "val_loss": 69291.796875} {"train_loss": -5.268855094909668, "global_step": 15834, "epoch": 377} {"train_loss": -5.043083190917969, "global_step": 15835, "epoch": 377} {"train_loss": -5.194890022277832, "global_step": 15836, "epoch": 377} {"train_loss": -5.144880771636963, "global_step": 15837, "epoch": 377} {"train_loss": -5.125044822692871, "global_step": 15838, "epoch": 377} {"train_loss": -5.121648788452148, "global_step": 15839, "epoch": 377} {"train_loss": -5.079168319702148, "global_step": 15840, "epoch": 377} {"train_loss": -5.0990495681762695, "global_step": 15841, "epoch": 377} {"train_loss": -5.140801429748535, "global_step": 15842, "epoch": 377} {"train_loss": -5.149593830108643, "global_step": 15843, "epoch": 377} {"train_loss": -5.150609970092773, "global_step": 15844, "epoch": 377} {"train_loss": -5.1837334632873535, "global_step": 15845, "epoch": 377} {"train_loss": -5.202301025390625, "global_step": 15846, "epoch": 377} {"train_loss": -5.203717231750488, "global_step": 15847, "epoch": 377} {"train_loss": -5.219877243041992, "global_step": 15848, "epoch": 377} {"train_loss": -5.305763244628906, "global_step": 15849, "epoch": 377} {"train_loss": -5.30156135559082, "global_step": 15850, "epoch": 377} {"train_loss": -5.268078327178955, "global_step": 15851, "epoch": 377} {"train_loss": -5.257585048675537, "global_step": 15852, "epoch": 377} {"train_loss": -5.3251848220825195, "global_step": 15853, "epoch": 377} {"train_loss": -5.1516804695129395, "global_step": 15854, "epoch": 377} {"train_loss": -5.2852888107299805, "global_step": 15855, "epoch": 377} {"train_loss": -5.376019477844238, "global_step": 15856, "epoch": 377} {"train_loss": -5.138767242431641, "global_step": 15857, "epoch": 377} {"train_loss": -5.309694290161133, "global_step": 15858, "epoch": 377} {"train_loss": -5.266263008117676, "global_step": 15859, "epoch": 377} {"train_loss": -5.370598793029785, "global_step": 15860, "epoch": 377} {"train_loss": -5.1871232986450195, "global_step": 15861, "epoch": 377} {"train_loss": -5.169222354888916, "global_step": 15862, "epoch": 377} {"train_loss": -5.2709760665893555, "global_step": 15863, "epoch": 377} {"train_loss": -5.239833831787109, "global_step": 15864, "epoch": 377} {"train_loss": -5.2675299644470215, "global_step": 15865, "epoch": 377} {"train_loss": -5.230923652648926, "global_step": 15866, "epoch": 377} {"train_loss": -5.262238025665283, "global_step": 15867, "epoch": 377} {"train_loss": -5.216835021972656, "global_step": 15868, "epoch": 377} {"train_loss": -5.17891263961792, "global_step": 15869, "epoch": 377} {"train_loss": -5.179178714752197, "global_step": 15870, "epoch": 377} {"train_loss": -5.2296142578125, "global_step": 15871, "epoch": 377} {"train_loss": -5.313765525817871, "global_step": 15872, "epoch": 377} {"train_loss": -5.178592681884766, "global_step": 15873, "epoch": 377} {"train_loss": -5.2808074951171875, "global_step": 15874, "epoch": 377} {"train_loss": -5.216339837937128, "global_step": 15875, "epoch": 377, "val_loss": 69245.0390625} {"train_loss": -5.259346961975098, "global_step": 15876, "epoch": 378} {"train_loss": -5.140254020690918, "global_step": 15877, "epoch": 378} {"train_loss": -5.183576583862305, "global_step": 15878, "epoch": 378} {"train_loss": -5.203524589538574, "global_step": 15879, "epoch": 378} {"train_loss": -5.306629657745361, "global_step": 15880, "epoch": 378} {"train_loss": -5.180282115936279, "global_step": 15881, "epoch": 378} {"train_loss": -5.262749671936035, "global_step": 15882, "epoch": 378} {"train_loss": -5.1603684425354, "global_step": 15883, "epoch": 378} {"train_loss": -5.31817626953125, "global_step": 15884, "epoch": 378} {"train_loss": -5.257783889770508, "global_step": 15885, "epoch": 378} {"train_loss": -5.285384178161621, "global_step": 15886, "epoch": 378} {"train_loss": -5.197754859924316, "global_step": 15887, "epoch": 378} {"train_loss": -5.215376377105713, "global_step": 15888, "epoch": 378} {"train_loss": -5.130873680114746, "global_step": 15889, "epoch": 378} {"train_loss": -5.117258548736572, "global_step": 15890, "epoch": 378} {"train_loss": -5.18774938583374, "global_step": 15891, "epoch": 378} {"train_loss": -5.259735107421875, "global_step": 15892, "epoch": 378} {"train_loss": -5.191492080688477, "global_step": 15893, "epoch": 378} {"train_loss": -5.189438819885254, "global_step": 15894, "epoch": 378} {"train_loss": -5.005396842956543, "global_step": 15895, "epoch": 378} {"train_loss": -5.311857223510742, "global_step": 15896, "epoch": 378} {"train_loss": -5.285370826721191, "global_step": 15897, "epoch": 378} {"train_loss": -5.204675197601318, "global_step": 15898, "epoch": 378} {"train_loss": -5.1064629554748535, "global_step": 15899, "epoch": 378} {"train_loss": -5.2477006912231445, "global_step": 15900, "epoch": 378} {"train_loss": -5.098275661468506, "global_step": 15901, "epoch": 378} {"train_loss": -5.097836971282959, "global_step": 15902, "epoch": 378} {"train_loss": -5.249916076660156, "global_step": 15903, "epoch": 378} {"train_loss": -5.104115009307861, "global_step": 15904, "epoch": 378} {"train_loss": -5.10910701751709, "global_step": 15905, "epoch": 378} {"train_loss": -5.173769950866699, "global_step": 15906, "epoch": 378} {"train_loss": -5.070655822753906, "global_step": 15907, "epoch": 378} {"train_loss": -5.056241035461426, "global_step": 15908, "epoch": 378} {"train_loss": -5.194192886352539, "global_step": 15909, "epoch": 378} {"train_loss": -5.208938121795654, "global_step": 15910, "epoch": 378} {"train_loss": -5.220267295837402, "global_step": 15911, "epoch": 378} {"train_loss": -5.157821178436279, "global_step": 15912, "epoch": 378} {"train_loss": -5.091561794281006, "global_step": 15913, "epoch": 378} {"train_loss": -5.374743938446045, "global_step": 15914, "epoch": 378} {"train_loss": -5.113603591918945, "global_step": 15915, "epoch": 378} {"train_loss": -5.020693778991699, "global_step": 15916, "epoch": 378} {"train_loss": -5.183355308714367, "global_step": 15917, "epoch": 378, "val_loss": 70742.7265625} {"train_loss": -5.111988067626953, "global_step": 15918, "epoch": 379} {"train_loss": -5.03587532043457, "global_step": 15919, "epoch": 379} {"train_loss": -4.891666889190674, "global_step": 15920, "epoch": 379} {"train_loss": -5.04506778717041, "global_step": 15921, "epoch": 379} {"train_loss": -5.06934928894043, "global_step": 15922, "epoch": 379} {"train_loss": -5.077788352966309, "global_step": 15923, "epoch": 379} {"train_loss": -5.1732282638549805, "global_step": 15924, "epoch": 379} {"train_loss": -5.130917072296143, "global_step": 15925, "epoch": 379} {"train_loss": -5.132577896118164, "global_step": 15926, "epoch": 379} {"train_loss": -5.159160614013672, "global_step": 15927, "epoch": 379} {"train_loss": -5.145452499389648, "global_step": 15928, "epoch": 379} {"train_loss": -5.2332658767700195, "global_step": 15929, "epoch": 379} {"train_loss": -5.0721659660339355, "global_step": 15930, "epoch": 379} {"train_loss": -5.290245532989502, "global_step": 15931, "epoch": 379} {"train_loss": -5.0539093017578125, "global_step": 15932, "epoch": 379} {"train_loss": -5.156153678894043, "global_step": 15933, "epoch": 379} {"train_loss": -5.328382968902588, "global_step": 15934, "epoch": 379} {"train_loss": -5.195804595947266, "global_step": 15935, "epoch": 379} {"train_loss": -5.0851640701293945, "global_step": 15936, "epoch": 379} {"train_loss": -5.341365337371826, "global_step": 15937, "epoch": 379} {"train_loss": -5.118570327758789, "global_step": 15938, "epoch": 379} {"train_loss": -5.237890243530273, "global_step": 15939, "epoch": 379} {"train_loss": -5.2515668869018555, "global_step": 15940, "epoch": 379} {"train_loss": -5.0455121994018555, "global_step": 15941, "epoch": 379} {"train_loss": -5.233300685882568, "global_step": 15942, "epoch": 379} {"train_loss": -5.023200035095215, "global_step": 15943, "epoch": 379} {"train_loss": -5.072964668273926, "global_step": 15944, "epoch": 379} {"train_loss": -5.160882949829102, "global_step": 15945, "epoch": 379} {"train_loss": -5.234604358673096, "global_step": 15946, "epoch": 379} {"train_loss": -5.146790504455566, "global_step": 15947, "epoch": 379} {"train_loss": -5.085812091827393, "global_step": 15948, "epoch": 379} {"train_loss": -5.281037330627441, "global_step": 15949, "epoch": 379} {"train_loss": -5.233107566833496, "global_step": 15950, "epoch": 379} {"train_loss": -5.172104835510254, "global_step": 15951, "epoch": 379} {"train_loss": -5.333935737609863, "global_step": 15952, "epoch": 379} {"train_loss": -5.213695049285889, "global_step": 15953, "epoch": 379} {"train_loss": -5.16773796081543, "global_step": 15954, "epoch": 379} {"train_loss": -5.158208847045898, "global_step": 15955, "epoch": 379} {"train_loss": -5.172331809997559, "global_step": 15956, "epoch": 379} {"train_loss": -5.1832475662231445, "global_step": 15957, "epoch": 379} {"train_loss": -5.1205735206604, "global_step": 15958, "epoch": 379} {"train_loss": -5.1551736650012785, "global_step": 15959, "epoch": 379, "val_loss": 69625.921875} {"train_loss": -5.237526893615723, "global_step": 15960, "epoch": 380} {"train_loss": -5.137683868408203, "global_step": 15961, "epoch": 380} {"train_loss": -5.249101161956787, "global_step": 15962, "epoch": 380} {"train_loss": -5.2339630126953125, "global_step": 15963, "epoch": 380} {"train_loss": -5.155827045440674, "global_step": 15964, "epoch": 380} {"train_loss": -5.02135705947876, "global_step": 15965, "epoch": 380} {"train_loss": -5.17730712890625, "global_step": 15966, "epoch": 380} {"train_loss": -5.218816757202148, "global_step": 15967, "epoch": 380} {"train_loss": -5.266787528991699, "global_step": 15968, "epoch": 380} {"train_loss": -5.253024101257324, "global_step": 15969, "epoch": 380} {"train_loss": -5.24078369140625, "global_step": 15970, "epoch": 380} {"train_loss": -5.1104583740234375, "global_step": 15971, "epoch": 380} {"train_loss": -5.1722517013549805, "global_step": 15972, "epoch": 380} {"train_loss": -5.177865982055664, "global_step": 15973, "epoch": 380} {"train_loss": -5.226400852203369, "global_step": 15974, "epoch": 380} {"train_loss": -5.326895236968994, "global_step": 15975, "epoch": 380} {"train_loss": -5.329571723937988, "global_step": 15976, "epoch": 380} {"train_loss": -5.127242088317871, "global_step": 15977, "epoch": 380} {"train_loss": -5.181058406829834, "global_step": 15978, "epoch": 380} {"train_loss": -5.2061872482299805, "global_step": 15979, "epoch": 380} {"train_loss": -5.1538190841674805, "global_step": 15980, "epoch": 380} {"train_loss": -5.244271755218506, "global_step": 15981, "epoch": 380} {"train_loss": -5.328360080718994, "global_step": 15982, "epoch": 380} {"train_loss": -5.199920654296875, "global_step": 15983, "epoch": 380} {"train_loss": -5.194088459014893, "global_step": 15984, "epoch": 380} {"train_loss": -5.222043037414551, "global_step": 15985, "epoch": 380} {"train_loss": -5.2483720779418945, "global_step": 15986, "epoch": 380} {"train_loss": -5.140590190887451, "global_step": 15987, "epoch": 380} {"train_loss": -5.312251567840576, "global_step": 15988, "epoch": 380} {"train_loss": -5.221347808837891, "global_step": 15989, "epoch": 380} {"train_loss": -5.1697916984558105, "global_step": 15990, "epoch": 380} {"train_loss": -5.258307456970215, "global_step": 15991, "epoch": 380} {"train_loss": -5.1841206550598145, "global_step": 15992, "epoch": 380} {"train_loss": -5.194964408874512, "global_step": 15993, "epoch": 380} {"train_loss": -5.209564685821533, "global_step": 15994, "epoch": 380} {"train_loss": -5.371829986572266, "global_step": 15995, "epoch": 380} {"train_loss": -5.2207183837890625, "global_step": 15996, "epoch": 380} {"train_loss": -5.1274027824401855, "global_step": 15997, "epoch": 380} {"train_loss": -5.145599365234375, "global_step": 15998, "epoch": 380} {"train_loss": -5.070965766906738, "global_step": 15999, "epoch": 380} {"train_loss": -5.133519172668457, "global_step": 16000, "epoch": 380} {"train_loss": -5.2027785664512995, "global_step": 16001, "epoch": 380, "val_loss": 70127.671875} {"train_loss": -5.005056858062744, "global_step": 16002, "epoch": 381} {"train_loss": -5.233043670654297, "global_step": 16003, "epoch": 381} {"train_loss": -5.119839668273926, "global_step": 16004, "epoch": 381} {"train_loss": -5.2163987159729, "global_step": 16005, "epoch": 381} {"train_loss": -5.2373151779174805, "global_step": 16006, "epoch": 381} {"train_loss": -5.301853179931641, "global_step": 16007, "epoch": 381} {"train_loss": -5.2413010597229, "global_step": 16008, "epoch": 381} {"train_loss": -5.189841270446777, "global_step": 16009, "epoch": 381} {"train_loss": -5.286541938781738, "global_step": 16010, "epoch": 381} {"train_loss": -5.111136436462402, "global_step": 16011, "epoch": 381} {"train_loss": -5.279268264770508, "global_step": 16012, "epoch": 381} {"train_loss": -5.145233154296875, "global_step": 16013, "epoch": 381} {"train_loss": -5.162890434265137, "global_step": 16014, "epoch": 381} {"train_loss": -5.206171989440918, "global_step": 16015, "epoch": 381} {"train_loss": -5.196321964263916, "global_step": 16016, "epoch": 381} {"train_loss": -5.333462715148926, "global_step": 16017, "epoch": 381} {"train_loss": -5.194413185119629, "global_step": 16018, "epoch": 381} {"train_loss": -5.220338344573975, "global_step": 16019, "epoch": 381} {"train_loss": -5.26288366317749, "global_step": 16020, "epoch": 381} {"train_loss": -5.279277324676514, "global_step": 16021, "epoch": 381} {"train_loss": -5.182111740112305, "global_step": 16022, "epoch": 381} {"train_loss": -5.300278663635254, "global_step": 16023, "epoch": 381} {"train_loss": -5.239297866821289, "global_step": 16024, "epoch": 381} {"train_loss": -5.141468524932861, "global_step": 16025, "epoch": 381} {"train_loss": -5.126086711883545, "global_step": 16026, "epoch": 381} {"train_loss": -5.159760475158691, "global_step": 16027, "epoch": 381} {"train_loss": -5.14658784866333, "global_step": 16028, "epoch": 381} {"train_loss": -5.090861797332764, "global_step": 16029, "epoch": 381} {"train_loss": -5.206888198852539, "global_step": 16030, "epoch": 381} {"train_loss": -5.217665672302246, "global_step": 16031, "epoch": 381} {"train_loss": -5.262157440185547, "global_step": 16032, "epoch": 381} {"train_loss": -5.151861190795898, "global_step": 16033, "epoch": 381} {"train_loss": -5.229483604431152, "global_step": 16034, "epoch": 381} {"train_loss": -5.271660804748535, "global_step": 16035, "epoch": 381} {"train_loss": -5.115734100341797, "global_step": 16036, "epoch": 381} {"train_loss": -5.192836761474609, "global_step": 16037, "epoch": 381} {"train_loss": -5.031529426574707, "global_step": 16038, "epoch": 381} {"train_loss": -5.1987409591674805, "global_step": 16039, "epoch": 381} {"train_loss": -5.141831398010254, "global_step": 16040, "epoch": 381} {"train_loss": -5.097470283508301, "global_step": 16041, "epoch": 381} {"train_loss": -5.192636489868164, "global_step": 16042, "epoch": 381} {"train_loss": -5.189897037687755, "global_step": 16043, "epoch": 381, "val_loss": 69559.0625} {"train_loss": -5.1470947265625, "global_step": 16044, "epoch": 382} {"train_loss": -5.138458251953125, "global_step": 16045, "epoch": 382} {"train_loss": -5.235119819641113, "global_step": 16046, "epoch": 382} {"train_loss": -5.149240493774414, "global_step": 16047, "epoch": 382} {"train_loss": -5.344001293182373, "global_step": 16048, "epoch": 382} {"train_loss": -5.280501365661621, "global_step": 16049, "epoch": 382} {"train_loss": -5.206113815307617, "global_step": 16050, "epoch": 382} {"train_loss": -5.289155960083008, "global_step": 16051, "epoch": 382} {"train_loss": -5.139902591705322, "global_step": 16052, "epoch": 382} {"train_loss": -5.28081750869751, "global_step": 16053, "epoch": 382} {"train_loss": -5.169577598571777, "global_step": 16054, "epoch": 382} {"train_loss": -5.264335632324219, "global_step": 16055, "epoch": 382} {"train_loss": -5.204804420471191, "global_step": 16056, "epoch": 382} {"train_loss": -5.200511455535889, "global_step": 16057, "epoch": 382} {"train_loss": -5.216169834136963, "global_step": 16058, "epoch": 382} {"train_loss": -5.199857234954834, "global_step": 16059, "epoch": 382} {"train_loss": -5.237993240356445, "global_step": 16060, "epoch": 382} {"train_loss": -5.194941997528076, "global_step": 16061, "epoch": 382} {"train_loss": -5.260091781616211, "global_step": 16062, "epoch": 382} {"train_loss": -5.18367862701416, "global_step": 16063, "epoch": 382} {"train_loss": -5.156774997711182, "global_step": 16064, "epoch": 382} {"train_loss": -5.113321304321289, "global_step": 16065, "epoch": 382} {"train_loss": -5.2124528884887695, "global_step": 16066, "epoch": 382} {"train_loss": -5.264284133911133, "global_step": 16067, "epoch": 382} {"train_loss": -5.323916912078857, "global_step": 16068, "epoch": 382} {"train_loss": -5.183294296264648, "global_step": 16069, "epoch": 382} {"train_loss": -5.149112701416016, "global_step": 16070, "epoch": 382} {"train_loss": -5.211327075958252, "global_step": 16071, "epoch": 382} {"train_loss": -5.238402366638184, "global_step": 16072, "epoch": 382} {"train_loss": -5.38095760345459, "global_step": 16073, "epoch": 382} {"train_loss": -5.1792311668396, "global_step": 16074, "epoch": 382} {"train_loss": -5.175248146057129, "global_step": 16075, "epoch": 382} {"train_loss": -5.294247627258301, "global_step": 16076, "epoch": 382} {"train_loss": -5.085036277770996, "global_step": 16077, "epoch": 382} {"train_loss": -5.374242782592773, "global_step": 16078, "epoch": 382} {"train_loss": -5.217639446258545, "global_step": 16079, "epoch": 382} {"train_loss": -5.19992733001709, "global_step": 16080, "epoch": 382} {"train_loss": -5.173841953277588, "global_step": 16081, "epoch": 382} {"train_loss": -5.101733207702637, "global_step": 16082, "epoch": 382} {"train_loss": -5.197793006896973, "global_step": 16083, "epoch": 382} {"train_loss": -5.27994441986084, "global_step": 16084, "epoch": 382} {"train_loss": -5.214710905438378, "global_step": 16085, "epoch": 382, "val_loss": 69704.234375} {"train_loss": -5.139867782592773, "global_step": 16086, "epoch": 383} {"train_loss": -5.138753890991211, "global_step": 16087, "epoch": 383} {"train_loss": -5.3183770179748535, "global_step": 16088, "epoch": 383} {"train_loss": -5.267683982849121, "global_step": 16089, "epoch": 383} {"train_loss": -5.258956432342529, "global_step": 16090, "epoch": 383} {"train_loss": -5.141547203063965, "global_step": 16091, "epoch": 383} {"train_loss": -5.295767307281494, "global_step": 16092, "epoch": 383} {"train_loss": -5.192895412445068, "global_step": 16093, "epoch": 383} {"train_loss": -5.247323989868164, "global_step": 16094, "epoch": 383} {"train_loss": -5.23719596862793, "global_step": 16095, "epoch": 383} {"train_loss": -5.148008823394775, "global_step": 16096, "epoch": 383} {"train_loss": -5.0678887367248535, "global_step": 16097, "epoch": 383} {"train_loss": -5.199879169464111, "global_step": 16098, "epoch": 383} {"train_loss": -5.047197341918945, "global_step": 16099, "epoch": 383} {"train_loss": -5.094815731048584, "global_step": 16100, "epoch": 383} {"train_loss": -5.234030246734619, "global_step": 16101, "epoch": 383} {"train_loss": -5.137054920196533, "global_step": 16102, "epoch": 383} {"train_loss": -5.101133346557617, "global_step": 16103, "epoch": 383} {"train_loss": -5.2329511642456055, "global_step": 16104, "epoch": 383} {"train_loss": -5.073549270629883, "global_step": 16105, "epoch": 383} {"train_loss": -5.1710920333862305, "global_step": 16106, "epoch": 383} {"train_loss": -5.306800842285156, "global_step": 16107, "epoch": 383} {"train_loss": -5.108780860900879, "global_step": 16108, "epoch": 383} {"train_loss": -5.191156387329102, "global_step": 16109, "epoch": 383} {"train_loss": -5.1792216300964355, "global_step": 16110, "epoch": 383} {"train_loss": -5.094531059265137, "global_step": 16111, "epoch": 383} {"train_loss": -5.096358299255371, "global_step": 16112, "epoch": 383} {"train_loss": -5.35878849029541, "global_step": 16113, "epoch": 383} {"train_loss": -5.311203956604004, "global_step": 16114, "epoch": 383} {"train_loss": -5.222991943359375, "global_step": 16115, "epoch": 383} {"train_loss": -5.383088111877441, "global_step": 16116, "epoch": 383} {"train_loss": -5.30715274810791, "global_step": 16117, "epoch": 383} {"train_loss": -5.321249008178711, "global_step": 16118, "epoch": 383} {"train_loss": -5.243114471435547, "global_step": 16119, "epoch": 383} {"train_loss": -5.23279333114624, "global_step": 16120, "epoch": 383} {"train_loss": -5.219134330749512, "global_step": 16121, "epoch": 383} {"train_loss": -5.157894134521484, "global_step": 16122, "epoch": 383} {"train_loss": -5.27239990234375, "global_step": 16123, "epoch": 383} {"train_loss": -5.113876819610596, "global_step": 16124, "epoch": 383} {"train_loss": -5.283725261688232, "global_step": 16125, "epoch": 383} {"train_loss": -5.314255714416504, "global_step": 16126, "epoch": 383} {"train_loss": -5.204901933670044, "global_step": 16127, "epoch": 383, "val_loss": 69593.71875} {"train_loss": -5.251914024353027, "global_step": 16128, "epoch": 384} {"train_loss": -5.209980010986328, "global_step": 16129, "epoch": 384} {"train_loss": -5.115962505340576, "global_step": 16130, "epoch": 384} {"train_loss": -5.151382923126221, "global_step": 16131, "epoch": 384} {"train_loss": -5.174750804901123, "global_step": 16132, "epoch": 384} {"train_loss": -5.222258567810059, "global_step": 16133, "epoch": 384} {"train_loss": -5.093311786651611, "global_step": 16134, "epoch": 384} {"train_loss": -5.232021331787109, "global_step": 16135, "epoch": 384} {"train_loss": -5.267885208129883, "global_step": 16136, "epoch": 384} {"train_loss": -5.191183090209961, "global_step": 16137, "epoch": 384} {"train_loss": -5.276838302612305, "global_step": 16138, "epoch": 384} {"train_loss": -5.238702774047852, "global_step": 16139, "epoch": 384} {"train_loss": -5.33073091506958, "global_step": 16140, "epoch": 384} {"train_loss": -5.210071563720703, "global_step": 16141, "epoch": 384} {"train_loss": -5.356471538543701, "global_step": 16142, "epoch": 384} {"train_loss": -5.247703552246094, "global_step": 16143, "epoch": 384} {"train_loss": -5.353631973266602, "global_step": 16144, "epoch": 384} {"train_loss": -5.366691589355469, "global_step": 16145, "epoch": 384} {"train_loss": -5.180854797363281, "global_step": 16146, "epoch": 384} {"train_loss": -5.23036003112793, "global_step": 16147, "epoch": 384} {"train_loss": -5.252172470092773, "global_step": 16148, "epoch": 384} {"train_loss": -5.310338020324707, "global_step": 16149, "epoch": 384} {"train_loss": -5.221295356750488, "global_step": 16150, "epoch": 384} {"train_loss": -5.207160949707031, "global_step": 16151, "epoch": 384} {"train_loss": -5.225977420806885, "global_step": 16152, "epoch": 384} {"train_loss": -5.268158912658691, "global_step": 16153, "epoch": 384} {"train_loss": -5.195888996124268, "global_step": 16154, "epoch": 384} {"train_loss": -5.23829460144043, "global_step": 16155, "epoch": 384} {"train_loss": -5.174059867858887, "global_step": 16156, "epoch": 384} {"train_loss": -5.162015438079834, "global_step": 16157, "epoch": 384} {"train_loss": -5.301399230957031, "global_step": 16158, "epoch": 384} {"train_loss": -5.16413688659668, "global_step": 16159, "epoch": 384} {"train_loss": -5.10720157623291, "global_step": 16160, "epoch": 384} {"train_loss": -5.394715785980225, "global_step": 16161, "epoch": 384} {"train_loss": -5.145671844482422, "global_step": 16162, "epoch": 384} {"train_loss": -5.119968414306641, "global_step": 16163, "epoch": 384} {"train_loss": -5.29206657409668, "global_step": 16164, "epoch": 384} {"train_loss": -5.241899490356445, "global_step": 16165, "epoch": 384} {"train_loss": -5.092945098876953, "global_step": 16166, "epoch": 384} {"train_loss": -5.2887372970581055, "global_step": 16167, "epoch": 384} {"train_loss": -5.329686164855957, "global_step": 16168, "epoch": 384} {"train_loss": -5.229586658023653, "global_step": 16169, "epoch": 384, "val_loss": 69634.125} {"train_loss": -5.2467041015625, "global_step": 16170, "epoch": 385} {"train_loss": -5.276265621185303, "global_step": 16171, "epoch": 385} {"train_loss": -5.163657188415527, "global_step": 16172, "epoch": 385} {"train_loss": -5.097873210906982, "global_step": 16173, "epoch": 385} {"train_loss": -5.193286895751953, "global_step": 16174, "epoch": 385} {"train_loss": -5.18948221206665, "global_step": 16175, "epoch": 385} {"train_loss": -5.074037551879883, "global_step": 16176, "epoch": 385} {"train_loss": -5.273763656616211, "global_step": 16177, "epoch": 385} {"train_loss": -5.128083229064941, "global_step": 16178, "epoch": 385} {"train_loss": -5.125783920288086, "global_step": 16179, "epoch": 385} {"train_loss": -5.132748603820801, "global_step": 16180, "epoch": 385} {"train_loss": -5.306308746337891, "global_step": 16181, "epoch": 385} {"train_loss": -5.037253379821777, "global_step": 16182, "epoch": 385} {"train_loss": -4.952625751495361, "global_step": 16183, "epoch": 385} {"train_loss": -5.172713756561279, "global_step": 16184, "epoch": 385} {"train_loss": -5.310637474060059, "global_step": 16185, "epoch": 385} {"train_loss": -4.959002494812012, "global_step": 16186, "epoch": 385} {"train_loss": -5.145898818969727, "global_step": 16187, "epoch": 385} {"train_loss": -5.077632904052734, "global_step": 16188, "epoch": 385} {"train_loss": -5.187010288238525, "global_step": 16189, "epoch": 385} {"train_loss": -5.096808433532715, "global_step": 16190, "epoch": 385} {"train_loss": -4.975895881652832, "global_step": 16191, "epoch": 385} {"train_loss": -5.18485164642334, "global_step": 16192, "epoch": 385} {"train_loss": -4.902429103851318, "global_step": 16193, "epoch": 385} {"train_loss": -5.239137172698975, "global_step": 16194, "epoch": 385} {"train_loss": -5.1082844734191895, "global_step": 16195, "epoch": 385} {"train_loss": -5.00971794128418, "global_step": 16196, "epoch": 385} {"train_loss": -5.10869026184082, "global_step": 16197, "epoch": 385} {"train_loss": -5.06232213973999, "global_step": 16198, "epoch": 385} {"train_loss": -5.200700283050537, "global_step": 16199, "epoch": 385} {"train_loss": -5.118138313293457, "global_step": 16200, "epoch": 385} {"train_loss": -5.118542194366455, "global_step": 16201, "epoch": 385} {"train_loss": -5.076943397521973, "global_step": 16202, "epoch": 385} {"train_loss": -5.298369407653809, "global_step": 16203, "epoch": 385} {"train_loss": -5.129648208618164, "global_step": 16204, "epoch": 385} {"train_loss": -5.113736152648926, "global_step": 16205, "epoch": 385} {"train_loss": -5.064863681793213, "global_step": 16206, "epoch": 385} {"train_loss": -5.167609214782715, "global_step": 16207, "epoch": 385} {"train_loss": -5.151096343994141, "global_step": 16208, "epoch": 385} {"train_loss": -5.138691425323486, "global_step": 16209, "epoch": 385} {"train_loss": -5.310137748718262, "global_step": 16210, "epoch": 385} {"train_loss": -5.14030629112607, "global_step": 16211, "epoch": 385, "val_loss": 69426.25} {"train_loss": -5.233454704284668, "global_step": 16212, "epoch": 386} {"train_loss": -5.3129963874816895, "global_step": 16213, "epoch": 386} {"train_loss": -5.216346263885498, "global_step": 16214, "epoch": 386} {"train_loss": -5.249641418457031, "global_step": 16215, "epoch": 386} {"train_loss": -5.203186988830566, "global_step": 16216, "epoch": 386} {"train_loss": -5.264518737792969, "global_step": 16217, "epoch": 386} {"train_loss": -5.263084411621094, "global_step": 16218, "epoch": 386} {"train_loss": -5.237783908843994, "global_step": 16219, "epoch": 386} {"train_loss": -5.272554397583008, "global_step": 16220, "epoch": 386} {"train_loss": -5.148717403411865, "global_step": 16221, "epoch": 386} {"train_loss": -5.157741546630859, "global_step": 16222, "epoch": 386} {"train_loss": -5.147953033447266, "global_step": 16223, "epoch": 386} {"train_loss": -5.229074478149414, "global_step": 16224, "epoch": 386} {"train_loss": -5.199604511260986, "global_step": 16225, "epoch": 386} {"train_loss": -5.294525146484375, "global_step": 16226, "epoch": 386} {"train_loss": -5.081470489501953, "global_step": 16227, "epoch": 386} {"train_loss": -5.2539215087890625, "global_step": 16228, "epoch": 386} {"train_loss": -5.132592678070068, "global_step": 16229, "epoch": 386} {"train_loss": -5.066473484039307, "global_step": 16230, "epoch": 386} {"train_loss": -5.07485818862915, "global_step": 16231, "epoch": 386} {"train_loss": -5.142696380615234, "global_step": 16232, "epoch": 386} {"train_loss": -5.101761341094971, "global_step": 16233, "epoch": 386} {"train_loss": -5.10014533996582, "global_step": 16234, "epoch": 386} {"train_loss": -5.210912704467773, "global_step": 16235, "epoch": 386} {"train_loss": -5.177604675292969, "global_step": 16236, "epoch": 386} {"train_loss": -5.16782283782959, "global_step": 16237, "epoch": 386} {"train_loss": -5.199158668518066, "global_step": 16238, "epoch": 386} {"train_loss": -5.322793960571289, "global_step": 16239, "epoch": 386} {"train_loss": -5.289168834686279, "global_step": 16240, "epoch": 386} {"train_loss": -5.201117992401123, "global_step": 16241, "epoch": 386} {"train_loss": -5.116952896118164, "global_step": 16242, "epoch": 386} {"train_loss": -5.265342712402344, "global_step": 16243, "epoch": 386} {"train_loss": -5.331692218780518, "global_step": 16244, "epoch": 386} {"train_loss": -5.239089012145996, "global_step": 16245, "epoch": 386} {"train_loss": -5.292540550231934, "global_step": 16246, "epoch": 386} {"train_loss": -5.234450817108154, "global_step": 16247, "epoch": 386} {"train_loss": -5.17789363861084, "global_step": 16248, "epoch": 386} {"train_loss": -5.242161750793457, "global_step": 16249, "epoch": 386} {"train_loss": -5.139025688171387, "global_step": 16250, "epoch": 386} {"train_loss": -5.110288619995117, "global_step": 16251, "epoch": 386} {"train_loss": -5.242740631103516, "global_step": 16252, "epoch": 386} {"train_loss": -5.205131144750686, "global_step": 16253, "epoch": 386, "val_loss": 70254.265625} {"train_loss": -5.126812934875488, "global_step": 16254, "epoch": 387} {"train_loss": -5.085864067077637, "global_step": 16255, "epoch": 387} {"train_loss": -5.2192769050598145, "global_step": 16256, "epoch": 387} {"train_loss": -5.163669586181641, "global_step": 16257, "epoch": 387} {"train_loss": -5.240565299987793, "global_step": 16258, "epoch": 387} {"train_loss": -5.241816997528076, "global_step": 16259, "epoch": 387} {"train_loss": -5.034485816955566, "global_step": 16260, "epoch": 387} {"train_loss": -5.194509029388428, "global_step": 16261, "epoch": 387} {"train_loss": -5.191961288452148, "global_step": 16262, "epoch": 387} {"train_loss": -5.124358177185059, "global_step": 16263, "epoch": 387} {"train_loss": -5.196499347686768, "global_step": 16264, "epoch": 387} {"train_loss": -5.3029680252075195, "global_step": 16265, "epoch": 387} {"train_loss": -5.191449165344238, "global_step": 16266, "epoch": 387} {"train_loss": -5.079745292663574, "global_step": 16267, "epoch": 387} {"train_loss": -5.241445541381836, "global_step": 16268, "epoch": 387} {"train_loss": -5.16457986831665, "global_step": 16269, "epoch": 387} {"train_loss": -5.161940574645996, "global_step": 16270, "epoch": 387} {"train_loss": -5.290102005004883, "global_step": 16271, "epoch": 387} {"train_loss": -5.13675594329834, "global_step": 16272, "epoch": 387} {"train_loss": -5.137035369873047, "global_step": 16273, "epoch": 387} {"train_loss": -5.087068557739258, "global_step": 16274, "epoch": 387} {"train_loss": -5.071700572967529, "global_step": 16275, "epoch": 387} {"train_loss": -5.23390531539917, "global_step": 16276, "epoch": 387} {"train_loss": -5.113252639770508, "global_step": 16277, "epoch": 387} {"train_loss": -5.146665573120117, "global_step": 16278, "epoch": 387} {"train_loss": -5.319258689880371, "global_step": 16279, "epoch": 387} {"train_loss": -5.11694860458374, "global_step": 16280, "epoch": 387} {"train_loss": -5.170078277587891, "global_step": 16281, "epoch": 387} {"train_loss": -5.173884391784668, "global_step": 16282, "epoch": 387} {"train_loss": -5.152525901794434, "global_step": 16283, "epoch": 387} {"train_loss": -5.17749547958374, "global_step": 16284, "epoch": 387} {"train_loss": -5.327448844909668, "global_step": 16285, "epoch": 387} {"train_loss": -5.093491077423096, "global_step": 16286, "epoch": 387} {"train_loss": -5.276803493499756, "global_step": 16287, "epoch": 387} {"train_loss": -5.20676326751709, "global_step": 16288, "epoch": 387} {"train_loss": -5.049410820007324, "global_step": 16289, "epoch": 387} {"train_loss": -5.260311603546143, "global_step": 16290, "epoch": 387} {"train_loss": -5.128777503967285, "global_step": 16291, "epoch": 387} {"train_loss": -5.13560676574707, "global_step": 16292, "epoch": 387} {"train_loss": -5.240440368652344, "global_step": 16293, "epoch": 387} {"train_loss": -5.267844200134277, "global_step": 16294, "epoch": 387} {"train_loss": -5.177083163034348, "global_step": 16295, "epoch": 387, "val_loss": 69566.3515625} {"train_loss": -5.237548828125, "global_step": 16296, "epoch": 388} {"train_loss": -5.1210808753967285, "global_step": 16297, "epoch": 388} {"train_loss": -5.30301570892334, "global_step": 16298, "epoch": 388} {"train_loss": -5.271463871002197, "global_step": 16299, "epoch": 388} {"train_loss": -5.171329498291016, "global_step": 16300, "epoch": 388} {"train_loss": -5.116368293762207, "global_step": 16301, "epoch": 388} {"train_loss": -5.437635898590088, "global_step": 16302, "epoch": 388} {"train_loss": -5.21651029586792, "global_step": 16303, "epoch": 388} {"train_loss": -5.333676338195801, "global_step": 16304, "epoch": 388} {"train_loss": -5.290634632110596, "global_step": 16305, "epoch": 388} {"train_loss": -5.209903717041016, "global_step": 16306, "epoch": 388} {"train_loss": -5.2167277336120605, "global_step": 16307, "epoch": 388} {"train_loss": -5.384897232055664, "global_step": 16308, "epoch": 388} {"train_loss": -5.233508110046387, "global_step": 16309, "epoch": 388} {"train_loss": -5.159720420837402, "global_step": 16310, "epoch": 388} {"train_loss": -5.173954486846924, "global_step": 16311, "epoch": 388} {"train_loss": -5.278648376464844, "global_step": 16312, "epoch": 388} {"train_loss": -5.176455974578857, "global_step": 16313, "epoch": 388} {"train_loss": -5.239011764526367, "global_step": 16314, "epoch": 388} {"train_loss": -5.246045112609863, "global_step": 16315, "epoch": 388} {"train_loss": -5.273262977600098, "global_step": 16316, "epoch": 388} {"train_loss": -5.116863250732422, "global_step": 16317, "epoch": 388} {"train_loss": -5.187342166900635, "global_step": 16318, "epoch": 388} {"train_loss": -5.240837097167969, "global_step": 16319, "epoch": 388} {"train_loss": -5.247227191925049, "global_step": 16320, "epoch": 388} {"train_loss": -5.143287658691406, "global_step": 16321, "epoch": 388} {"train_loss": -5.150793552398682, "global_step": 16322, "epoch": 388} {"train_loss": -5.274996757507324, "global_step": 16323, "epoch": 388} {"train_loss": -5.34323263168335, "global_step": 16324, "epoch": 388} {"train_loss": -5.137935161590576, "global_step": 16325, "epoch": 388} {"train_loss": -5.274502277374268, "global_step": 16326, "epoch": 388} {"train_loss": -5.2720232009887695, "global_step": 16327, "epoch": 388} {"train_loss": -5.1756591796875, "global_step": 16328, "epoch": 388} {"train_loss": -5.2870774269104, "global_step": 16329, "epoch": 388} {"train_loss": -5.229378700256348, "global_step": 16330, "epoch": 388} {"train_loss": -5.2910919189453125, "global_step": 16331, "epoch": 388} {"train_loss": -5.226170539855957, "global_step": 16332, "epoch": 388} {"train_loss": -5.1672797203063965, "global_step": 16333, "epoch": 388} {"train_loss": -5.19438362121582, "global_step": 16334, "epoch": 388} {"train_loss": -5.259965896606445, "global_step": 16335, "epoch": 388} {"train_loss": -5.278698921203613, "global_step": 16336, "epoch": 388} {"train_loss": -5.23337595803397, "global_step": 16337, "epoch": 388, "val_loss": 69130.21875} {"train_loss": -5.40835428237915, "global_step": 16338, "epoch": 389} {"train_loss": -5.283207893371582, "global_step": 16339, "epoch": 389} {"train_loss": -5.350950241088867, "global_step": 16340, "epoch": 389} {"train_loss": -5.236800193786621, "global_step": 16341, "epoch": 389} {"train_loss": -5.132810592651367, "global_step": 16342, "epoch": 389} {"train_loss": -5.181643486022949, "global_step": 16343, "epoch": 389} {"train_loss": -5.406057357788086, "global_step": 16344, "epoch": 389} {"train_loss": -5.396327018737793, "global_step": 16345, "epoch": 389} {"train_loss": -5.288405418395996, "global_step": 16346, "epoch": 389} {"train_loss": -5.244189262390137, "global_step": 16347, "epoch": 389} {"train_loss": -5.244349956512451, "global_step": 16348, "epoch": 389} {"train_loss": -5.333596229553223, "global_step": 16349, "epoch": 389} {"train_loss": -5.179616928100586, "global_step": 16350, "epoch": 389} {"train_loss": -5.278197288513184, "global_step": 16351, "epoch": 389} {"train_loss": -5.239072799682617, "global_step": 16352, "epoch": 389} {"train_loss": -5.212798118591309, "global_step": 16353, "epoch": 389} {"train_loss": -5.173431396484375, "global_step": 16354, "epoch": 389} {"train_loss": -5.190456390380859, "global_step": 16355, "epoch": 389} {"train_loss": -5.289226531982422, "global_step": 16356, "epoch": 389} {"train_loss": -5.304285526275635, "global_step": 16357, "epoch": 389} {"train_loss": -5.301685333251953, "global_step": 16358, "epoch": 389} {"train_loss": -5.066170692443848, "global_step": 16359, "epoch": 389} {"train_loss": -5.148989677429199, "global_step": 16360, "epoch": 389} {"train_loss": -5.204055309295654, "global_step": 16361, "epoch": 389} {"train_loss": -5.324056625366211, "global_step": 16362, "epoch": 389} {"train_loss": -5.017325401306152, "global_step": 16363, "epoch": 389} {"train_loss": -5.058302879333496, "global_step": 16364, "epoch": 389} {"train_loss": -5.308960914611816, "global_step": 16365, "epoch": 389} {"train_loss": -5.071937084197998, "global_step": 16366, "epoch": 389} {"train_loss": -5.176888465881348, "global_step": 16367, "epoch": 389} {"train_loss": -5.2649688720703125, "global_step": 16368, "epoch": 389} {"train_loss": -5.1493120193481445, "global_step": 16369, "epoch": 389} {"train_loss": -5.247118949890137, "global_step": 16370, "epoch": 389} {"train_loss": -5.244929313659668, "global_step": 16371, "epoch": 389} {"train_loss": -5.130295276641846, "global_step": 16372, "epoch": 389} {"train_loss": -5.159419059753418, "global_step": 16373, "epoch": 389} {"train_loss": -5.329471588134766, "global_step": 16374, "epoch": 389} {"train_loss": -5.084865093231201, "global_step": 16375, "epoch": 389} {"train_loss": -5.123992919921875, "global_step": 16376, "epoch": 389} {"train_loss": -5.241843223571777, "global_step": 16377, "epoch": 389} {"train_loss": -5.1070780754089355, "global_step": 16378, "epoch": 389} {"train_loss": -5.220326014927456, "global_step": 16379, "epoch": 389, "val_loss": 69223.3515625} {"train_loss": -5.331666946411133, "global_step": 16380, "epoch": 390} {"train_loss": -5.126654148101807, "global_step": 16381, "epoch": 390} {"train_loss": -5.244391441345215, "global_step": 16382, "epoch": 390} {"train_loss": -5.219343185424805, "global_step": 16383, "epoch": 390} {"train_loss": -5.158146858215332, "global_step": 16384, "epoch": 390} {"train_loss": -5.2201762199401855, "global_step": 16385, "epoch": 390} {"train_loss": -5.143485069274902, "global_step": 16386, "epoch": 390} {"train_loss": -5.230948448181152, "global_step": 16387, "epoch": 390} {"train_loss": -5.223562240600586, "global_step": 16388, "epoch": 390} {"train_loss": -5.155796051025391, "global_step": 16389, "epoch": 390} {"train_loss": -5.1779255867004395, "global_step": 16390, "epoch": 390} {"train_loss": -5.111692428588867, "global_step": 16391, "epoch": 390} {"train_loss": -5.22591495513916, "global_step": 16392, "epoch": 390} {"train_loss": -5.137478351593018, "global_step": 16393, "epoch": 390} {"train_loss": -5.144576072692871, "global_step": 16394, "epoch": 390} {"train_loss": -5.292680740356445, "global_step": 16395, "epoch": 390} {"train_loss": -5.125788688659668, "global_step": 16396, "epoch": 390} {"train_loss": -5.2720842361450195, "global_step": 16397, "epoch": 390} {"train_loss": -5.226471900939941, "global_step": 16398, "epoch": 390} {"train_loss": -5.252260684967041, "global_step": 16399, "epoch": 390} {"train_loss": -5.2409162521362305, "global_step": 16400, "epoch": 390} {"train_loss": -5.269905090332031, "global_step": 16401, "epoch": 390} {"train_loss": -5.175207614898682, "global_step": 16402, "epoch": 390} {"train_loss": -5.171035289764404, "global_step": 16403, "epoch": 390} {"train_loss": -5.3087992668151855, "global_step": 16404, "epoch": 390} {"train_loss": -5.142561912536621, "global_step": 16405, "epoch": 390} {"train_loss": -5.20184326171875, "global_step": 16406, "epoch": 390} {"train_loss": -5.087557792663574, "global_step": 16407, "epoch": 390} {"train_loss": -5.042022705078125, "global_step": 16408, "epoch": 390} {"train_loss": -5.25062370300293, "global_step": 16409, "epoch": 390} {"train_loss": -5.239319801330566, "global_step": 16410, "epoch": 390} {"train_loss": -5.241096019744873, "global_step": 16411, "epoch": 390} {"train_loss": -5.284716606140137, "global_step": 16412, "epoch": 390} {"train_loss": -5.1879472732543945, "global_step": 16413, "epoch": 390} {"train_loss": -5.164400100708008, "global_step": 16414, "epoch": 390} {"train_loss": -5.380610942840576, "global_step": 16415, "epoch": 390} {"train_loss": -5.1709885597229, "global_step": 16416, "epoch": 390} {"train_loss": -5.090914726257324, "global_step": 16417, "epoch": 390} {"train_loss": -5.247470855712891, "global_step": 16418, "epoch": 390} {"train_loss": -5.038665771484375, "global_step": 16419, "epoch": 390} {"train_loss": -5.1881914138793945, "global_step": 16420, "epoch": 390} {"train_loss": -5.201206343514579, "global_step": 16421, "epoch": 390, "val_loss": 69061.2421875} {"train_loss": -5.328561782836914, "global_step": 16422, "epoch": 391} {"train_loss": -5.227042198181152, "global_step": 16423, "epoch": 391} {"train_loss": -5.031704902648926, "global_step": 16424, "epoch": 391} {"train_loss": -5.300463676452637, "global_step": 16425, "epoch": 391} {"train_loss": -5.3075337409973145, "global_step": 16426, "epoch": 391} {"train_loss": -5.3265557289123535, "global_step": 16427, "epoch": 391} {"train_loss": -5.111592769622803, "global_step": 16428, "epoch": 391} {"train_loss": -5.182985305786133, "global_step": 16429, "epoch": 391} {"train_loss": -5.279552936553955, "global_step": 16430, "epoch": 391} {"train_loss": -5.2169084548950195, "global_step": 16431, "epoch": 391} {"train_loss": -5.131056785583496, "global_step": 16432, "epoch": 391} {"train_loss": -5.244978427886963, "global_step": 16433, "epoch": 391} {"train_loss": -5.174031734466553, "global_step": 16434, "epoch": 391} {"train_loss": -5.182301998138428, "global_step": 16435, "epoch": 391} {"train_loss": -5.242220878601074, "global_step": 16436, "epoch": 391} {"train_loss": -5.3748321533203125, "global_step": 16437, "epoch": 391} {"train_loss": -5.1931257247924805, "global_step": 16438, "epoch": 391} {"train_loss": -5.348282814025879, "global_step": 16439, "epoch": 391} {"train_loss": -5.072336196899414, "global_step": 16440, "epoch": 391} {"train_loss": -5.0899152755737305, "global_step": 16441, "epoch": 391} {"train_loss": -5.187255859375, "global_step": 16442, "epoch": 391} {"train_loss": -5.244236946105957, "global_step": 16443, "epoch": 391} {"train_loss": -5.076953887939453, "global_step": 16444, "epoch": 391} {"train_loss": -5.175017356872559, "global_step": 16445, "epoch": 391} {"train_loss": -5.095277786254883, "global_step": 16446, "epoch": 391} {"train_loss": -5.160754203796387, "global_step": 16447, "epoch": 391} {"train_loss": -5.134521961212158, "global_step": 16448, "epoch": 391} {"train_loss": -5.208215713500977, "global_step": 16449, "epoch": 391} {"train_loss": -5.18843936920166, "global_step": 16450, "epoch": 391} {"train_loss": -5.158770561218262, "global_step": 16451, "epoch": 391} {"train_loss": -5.169245719909668, "global_step": 16452, "epoch": 391} {"train_loss": -5.365686416625977, "global_step": 16453, "epoch": 391} {"train_loss": -5.11091423034668, "global_step": 16454, "epoch": 391} {"train_loss": -5.2655744552612305, "global_step": 16455, "epoch": 391} {"train_loss": -5.260034084320068, "global_step": 16456, "epoch": 391} {"train_loss": -5.191169738769531, "global_step": 16457, "epoch": 391} {"train_loss": -5.138119697570801, "global_step": 16458, "epoch": 391} {"train_loss": -5.28914737701416, "global_step": 16459, "epoch": 391} {"train_loss": -5.216935157775879, "global_step": 16460, "epoch": 391} {"train_loss": -5.306163311004639, "global_step": 16461, "epoch": 391} {"train_loss": -5.135213851928711, "global_step": 16462, "epoch": 391} {"train_loss": -5.205276091893514, "global_step": 16463, "epoch": 391, "val_loss": 69568.4921875} {"train_loss": -5.242745399475098, "global_step": 16464, "epoch": 392} {"train_loss": -5.284361839294434, "global_step": 16465, "epoch": 392} {"train_loss": -5.181190490722656, "global_step": 16466, "epoch": 392} {"train_loss": -5.143563747406006, "global_step": 16467, "epoch": 392} {"train_loss": -4.988226890563965, "global_step": 16468, "epoch": 392} {"train_loss": -5.025211334228516, "global_step": 16469, "epoch": 392} {"train_loss": -5.159358978271484, "global_step": 16470, "epoch": 392} {"train_loss": -5.18082332611084, "global_step": 16471, "epoch": 392} {"train_loss": -5.179373264312744, "global_step": 16472, "epoch": 392} {"train_loss": -5.17378044128418, "global_step": 16473, "epoch": 392} {"train_loss": -5.178927421569824, "global_step": 16474, "epoch": 392} {"train_loss": -5.149287700653076, "global_step": 16475, "epoch": 392} {"train_loss": -5.186433792114258, "global_step": 16476, "epoch": 392} {"train_loss": -5.202488899230957, "global_step": 16477, "epoch": 392} {"train_loss": -5.138027191162109, "global_step": 16478, "epoch": 392} {"train_loss": -5.220904350280762, "global_step": 16479, "epoch": 392} {"train_loss": -5.1926469802856445, "global_step": 16480, "epoch": 392} {"train_loss": -5.098822593688965, "global_step": 16481, "epoch": 392} {"train_loss": -5.328195095062256, "global_step": 16482, "epoch": 392} {"train_loss": -4.9828267097473145, "global_step": 16483, "epoch": 392} {"train_loss": -5.137444496154785, "global_step": 16484, "epoch": 392} {"train_loss": -5.316375732421875, "global_step": 16485, "epoch": 392} {"train_loss": -5.258021831512451, "global_step": 16486, "epoch": 392} {"train_loss": -5.104317665100098, "global_step": 16487, "epoch": 392} {"train_loss": -5.194058418273926, "global_step": 16488, "epoch": 392} {"train_loss": -5.09150505065918, "global_step": 16489, "epoch": 392} {"train_loss": -5.3510284423828125, "global_step": 16490, "epoch": 392} {"train_loss": -5.112041473388672, "global_step": 16491, "epoch": 392} {"train_loss": -5.058335304260254, "global_step": 16492, "epoch": 392} {"train_loss": -5.293806076049805, "global_step": 16493, "epoch": 392} {"train_loss": -5.302865505218506, "global_step": 16494, "epoch": 392} {"train_loss": -5.092630386352539, "global_step": 16495, "epoch": 392} {"train_loss": -5.225610733032227, "global_step": 16496, "epoch": 392} {"train_loss": -5.198598861694336, "global_step": 16497, "epoch": 392} {"train_loss": -5.210634231567383, "global_step": 16498, "epoch": 392} {"train_loss": -5.220983505249023, "global_step": 16499, "epoch": 392} {"train_loss": -5.174985885620117, "global_step": 16500, "epoch": 392} {"train_loss": -5.2253642082214355, "global_step": 16501, "epoch": 392} {"train_loss": -5.200638294219971, "global_step": 16502, "epoch": 392} {"train_loss": -5.277620315551758, "global_step": 16503, "epoch": 392} {"train_loss": -5.269628524780273, "global_step": 16504, "epoch": 392} {"train_loss": -5.192079941431682, "global_step": 16505, "epoch": 392, "val_loss": 69187.46875} {"train_loss": -5.154857635498047, "global_step": 16506, "epoch": 393} {"train_loss": -5.213353157043457, "global_step": 16507, "epoch": 393} {"train_loss": -5.2338361740112305, "global_step": 16508, "epoch": 393} {"train_loss": -5.292904853820801, "global_step": 16509, "epoch": 393} {"train_loss": -5.1714396476745605, "global_step": 16510, "epoch": 393} {"train_loss": -5.030752182006836, "global_step": 16511, "epoch": 393} {"train_loss": -5.131695747375488, "global_step": 16512, "epoch": 393} {"train_loss": -5.267704486846924, "global_step": 16513, "epoch": 393} {"train_loss": -5.0511627197265625, "global_step": 16514, "epoch": 393} {"train_loss": -5.121058464050293, "global_step": 16515, "epoch": 393} {"train_loss": -5.161025047302246, "global_step": 16516, "epoch": 393} {"train_loss": -5.115808486938477, "global_step": 16517, "epoch": 393} {"train_loss": -5.105649948120117, "global_step": 16518, "epoch": 393} {"train_loss": -5.060506820678711, "global_step": 16519, "epoch": 393} {"train_loss": -5.261442184448242, "global_step": 16520, "epoch": 393} {"train_loss": -5.2215070724487305, "global_step": 16521, "epoch": 393} {"train_loss": -5.06950044631958, "global_step": 16522, "epoch": 393} {"train_loss": -5.1701979637146, "global_step": 16523, "epoch": 393} {"train_loss": -5.046009063720703, "global_step": 16524, "epoch": 393} {"train_loss": -5.1049580574035645, "global_step": 16525, "epoch": 393} {"train_loss": -5.310285568237305, "global_step": 16526, "epoch": 393} {"train_loss": -5.286395072937012, "global_step": 16527, "epoch": 393} {"train_loss": -5.257853984832764, "global_step": 16528, "epoch": 393} {"train_loss": -5.265005588531494, "global_step": 16529, "epoch": 393} {"train_loss": -5.0612263679504395, "global_step": 16530, "epoch": 393} {"train_loss": -5.417686462402344, "global_step": 16531, "epoch": 393} {"train_loss": -5.206093788146973, "global_step": 16532, "epoch": 393} {"train_loss": -5.152617931365967, "global_step": 16533, "epoch": 393} {"train_loss": -5.242020606994629, "global_step": 16534, "epoch": 393} {"train_loss": -5.187730312347412, "global_step": 16535, "epoch": 393} {"train_loss": -5.226282119750977, "global_step": 16536, "epoch": 393} {"train_loss": -5.300777435302734, "global_step": 16537, "epoch": 393} {"train_loss": -5.186201095581055, "global_step": 16538, "epoch": 393} {"train_loss": -5.238816261291504, "global_step": 16539, "epoch": 393} {"train_loss": -5.221243858337402, "global_step": 16540, "epoch": 393} {"train_loss": -5.1931352615356445, "global_step": 16541, "epoch": 393} {"train_loss": -5.1606526374816895, "global_step": 16542, "epoch": 393} {"train_loss": -5.239302635192871, "global_step": 16543, "epoch": 393} {"train_loss": -5.29799222946167, "global_step": 16544, "epoch": 393} {"train_loss": -5.373204708099365, "global_step": 16545, "epoch": 393} {"train_loss": -5.206690788269043, "global_step": 16546, "epoch": 393} {"train_loss": -5.19677946681068, "global_step": 16547, "epoch": 393, "val_loss": 69259.6015625} {"train_loss": -5.201063632965088, "global_step": 16548, "epoch": 394} {"train_loss": -5.351507186889648, "global_step": 16549, "epoch": 394} {"train_loss": -5.272224426269531, "global_step": 16550, "epoch": 394} {"train_loss": -5.19840145111084, "global_step": 16551, "epoch": 394} {"train_loss": -5.288235664367676, "global_step": 16552, "epoch": 394} {"train_loss": -5.187192916870117, "global_step": 16553, "epoch": 394} {"train_loss": -5.201298236846924, "global_step": 16554, "epoch": 394} {"train_loss": -5.262137413024902, "global_step": 16555, "epoch": 394} {"train_loss": -5.153301239013672, "global_step": 16556, "epoch": 394} {"train_loss": -5.266362190246582, "global_step": 16557, "epoch": 394} {"train_loss": -5.047445297241211, "global_step": 16558, "epoch": 394} {"train_loss": -5.084059238433838, "global_step": 16559, "epoch": 394} {"train_loss": -5.2996826171875, "global_step": 16560, "epoch": 394} {"train_loss": -5.148956775665283, "global_step": 16561, "epoch": 394} {"train_loss": -5.149570465087891, "global_step": 16562, "epoch": 394} {"train_loss": -5.208765506744385, "global_step": 16563, "epoch": 394} {"train_loss": -4.994719505310059, "global_step": 16564, "epoch": 394} {"train_loss": -5.263697624206543, "global_step": 16565, "epoch": 394} {"train_loss": -5.15846061706543, "global_step": 16566, "epoch": 394} {"train_loss": -5.335514068603516, "global_step": 16567, "epoch": 394} {"train_loss": -5.122800827026367, "global_step": 16568, "epoch": 394} {"train_loss": -5.234173774719238, "global_step": 16569, "epoch": 394} {"train_loss": -5.231497764587402, "global_step": 16570, "epoch": 394} {"train_loss": -5.091031074523926, "global_step": 16571, "epoch": 394} {"train_loss": -5.414120674133301, "global_step": 16572, "epoch": 394} {"train_loss": -5.148818016052246, "global_step": 16573, "epoch": 394} {"train_loss": -5.383266925811768, "global_step": 16574, "epoch": 394} {"train_loss": -5.207589149475098, "global_step": 16575, "epoch": 394} {"train_loss": -5.2013020515441895, "global_step": 16576, "epoch": 394} {"train_loss": -5.234774589538574, "global_step": 16577, "epoch": 394} {"train_loss": -5.273954391479492, "global_step": 16578, "epoch": 394} {"train_loss": -5.226494789123535, "global_step": 16579, "epoch": 394} {"train_loss": -5.254219055175781, "global_step": 16580, "epoch": 394} {"train_loss": -5.339705467224121, "global_step": 16581, "epoch": 394} {"train_loss": -5.275077819824219, "global_step": 16582, "epoch": 394} {"train_loss": -5.244510173797607, "global_step": 16583, "epoch": 394} {"train_loss": -5.386492729187012, "global_step": 16584, "epoch": 394} {"train_loss": -5.254325866699219, "global_step": 16585, "epoch": 394} {"train_loss": -5.248710632324219, "global_step": 16586, "epoch": 394} {"train_loss": -5.208189964294434, "global_step": 16587, "epoch": 394} {"train_loss": -5.058350563049316, "global_step": 16588, "epoch": 394} {"train_loss": -5.225730123974028, "global_step": 16589, "epoch": 394, "val_loss": 69268.015625} {"train_loss": -5.305791854858398, "global_step": 16590, "epoch": 395} {"train_loss": -5.280852317810059, "global_step": 16591, "epoch": 395} {"train_loss": -5.3189778327941895, "global_step": 16592, "epoch": 395} {"train_loss": -5.177967071533203, "global_step": 16593, "epoch": 395} {"train_loss": -5.206903457641602, "global_step": 16594, "epoch": 395} {"train_loss": -5.199448585510254, "global_step": 16595, "epoch": 395} {"train_loss": -5.261983871459961, "global_step": 16596, "epoch": 395} {"train_loss": -5.282428741455078, "global_step": 16597, "epoch": 395} {"train_loss": -5.25806999206543, "global_step": 16598, "epoch": 395} {"train_loss": -5.23117733001709, "global_step": 16599, "epoch": 395} {"train_loss": -5.228292942047119, "global_step": 16600, "epoch": 395} {"train_loss": -5.147549629211426, "global_step": 16601, "epoch": 395} {"train_loss": -5.344906806945801, "global_step": 16602, "epoch": 395} {"train_loss": -5.130092620849609, "global_step": 16603, "epoch": 395} {"train_loss": -5.195172309875488, "global_step": 16604, "epoch": 395} {"train_loss": -5.249153137207031, "global_step": 16605, "epoch": 395} {"train_loss": -5.330198287963867, "global_step": 16606, "epoch": 395} {"train_loss": -5.179643630981445, "global_step": 16607, "epoch": 395} {"train_loss": -5.11944580078125, "global_step": 16608, "epoch": 395} {"train_loss": -5.0506439208984375, "global_step": 16609, "epoch": 395} {"train_loss": -5.131161689758301, "global_step": 16610, "epoch": 395} {"train_loss": -5.197746276855469, "global_step": 16611, "epoch": 395} {"train_loss": -5.2787981033325195, "global_step": 16612, "epoch": 395} {"train_loss": -5.228424072265625, "global_step": 16613, "epoch": 395} {"train_loss": -5.274641036987305, "global_step": 16614, "epoch": 395} {"train_loss": -5.116824626922607, "global_step": 16615, "epoch": 395} {"train_loss": -5.130468845367432, "global_step": 16616, "epoch": 395} {"train_loss": -5.329738140106201, "global_step": 16617, "epoch": 395} {"train_loss": -5.221151351928711, "global_step": 16618, "epoch": 395} {"train_loss": -5.3173418045043945, "global_step": 16619, "epoch": 395} {"train_loss": -5.400414943695068, "global_step": 16620, "epoch": 395} {"train_loss": -5.167620658874512, "global_step": 16621, "epoch": 395} {"train_loss": -5.23548698425293, "global_step": 16622, "epoch": 395} {"train_loss": -5.237377166748047, "global_step": 16623, "epoch": 395} {"train_loss": -5.122982978820801, "global_step": 16624, "epoch": 395} {"train_loss": -5.134583950042725, "global_step": 16625, "epoch": 395} {"train_loss": -5.307120323181152, "global_step": 16626, "epoch": 395} {"train_loss": -5.173795700073242, "global_step": 16627, "epoch": 395} {"train_loss": -5.291386127471924, "global_step": 16628, "epoch": 395} {"train_loss": -5.233584880828857, "global_step": 16629, "epoch": 395} {"train_loss": -5.220700263977051, "global_step": 16630, "epoch": 395} {"train_loss": -5.223815997441609, "global_step": 16631, "epoch": 395, "val_loss": 69009.4921875} {"train_loss": -5.402378559112549, "global_step": 16632, "epoch": 396} {"train_loss": -5.1032209396362305, "global_step": 16633, "epoch": 396} {"train_loss": -5.271936416625977, "global_step": 16634, "epoch": 396} {"train_loss": -5.346034049987793, "global_step": 16635, "epoch": 396} {"train_loss": -5.270082473754883, "global_step": 16636, "epoch": 396} {"train_loss": -5.2524871826171875, "global_step": 16637, "epoch": 396} {"train_loss": -5.12095832824707, "global_step": 16638, "epoch": 396} {"train_loss": -5.147222518920898, "global_step": 16639, "epoch": 396} {"train_loss": -5.193905830383301, "global_step": 16640, "epoch": 396} {"train_loss": -5.018040657043457, "global_step": 16641, "epoch": 396} {"train_loss": -5.163309097290039, "global_step": 16642, "epoch": 396} {"train_loss": -5.271962642669678, "global_step": 16643, "epoch": 396} {"train_loss": -5.021580696105957, "global_step": 16644, "epoch": 396} {"train_loss": -5.408031463623047, "global_step": 16645, "epoch": 396} {"train_loss": -5.220782279968262, "global_step": 16646, "epoch": 396} {"train_loss": -5.104994297027588, "global_step": 16647, "epoch": 396} {"train_loss": -5.1978840827941895, "global_step": 16648, "epoch": 396} {"train_loss": -5.289127826690674, "global_step": 16649, "epoch": 396} {"train_loss": -5.128810405731201, "global_step": 16650, "epoch": 396} {"train_loss": -5.219056606292725, "global_step": 16651, "epoch": 396} {"train_loss": -5.193621635437012, "global_step": 16652, "epoch": 396} {"train_loss": -5.178865432739258, "global_step": 16653, "epoch": 396} {"train_loss": -5.228372097015381, "global_step": 16654, "epoch": 396} {"train_loss": -5.290250778198242, "global_step": 16655, "epoch": 396} {"train_loss": -5.24893045425415, "global_step": 16656, "epoch": 396} {"train_loss": -5.325445652008057, "global_step": 16657, "epoch": 396} {"train_loss": -5.29034423828125, "global_step": 16658, "epoch": 396} {"train_loss": -5.06278133392334, "global_step": 16659, "epoch": 396} {"train_loss": -5.1630859375, "global_step": 16660, "epoch": 396} {"train_loss": -5.291236877441406, "global_step": 16661, "epoch": 396} {"train_loss": -5.184179306030273, "global_step": 16662, "epoch": 396} {"train_loss": -5.200356483459473, "global_step": 16663, "epoch": 396} {"train_loss": -5.381407737731934, "global_step": 16664, "epoch": 396} {"train_loss": -5.254626750946045, "global_step": 16665, "epoch": 396} {"train_loss": -5.194392204284668, "global_step": 16666, "epoch": 396} {"train_loss": -5.264496803283691, "global_step": 16667, "epoch": 396} {"train_loss": -5.152902603149414, "global_step": 16668, "epoch": 396} {"train_loss": -5.127662658691406, "global_step": 16669, "epoch": 396} {"train_loss": -5.327301502227783, "global_step": 16670, "epoch": 396} {"train_loss": -5.194696426391602, "global_step": 16671, "epoch": 396} {"train_loss": -5.207408905029297, "global_step": 16672, "epoch": 396} {"train_loss": -5.215102400098528, "global_step": 16673, "epoch": 396, "val_loss": 68992.5} {"train_loss": -5.126715183258057, "global_step": 16674, "epoch": 397} {"train_loss": -5.193085670471191, "global_step": 16675, "epoch": 397} {"train_loss": -5.11869478225708, "global_step": 16676, "epoch": 397} {"train_loss": -5.277261734008789, "global_step": 16677, "epoch": 397} {"train_loss": -5.18974494934082, "global_step": 16678, "epoch": 397} {"train_loss": -5.026151657104492, "global_step": 16679, "epoch": 397} {"train_loss": -5.135595321655273, "global_step": 16680, "epoch": 397} {"train_loss": -5.163601875305176, "global_step": 16681, "epoch": 397} {"train_loss": -5.038451671600342, "global_step": 16682, "epoch": 397} {"train_loss": -5.161428451538086, "global_step": 16683, "epoch": 397} {"train_loss": -5.122345447540283, "global_step": 16684, "epoch": 397} {"train_loss": -5.205296039581299, "global_step": 16685, "epoch": 397} {"train_loss": -5.2793498039245605, "global_step": 16686, "epoch": 397} {"train_loss": -5.192121505737305, "global_step": 16687, "epoch": 397} {"train_loss": -5.237098693847656, "global_step": 16688, "epoch": 397} {"train_loss": -5.394139766693115, "global_step": 16689, "epoch": 397} {"train_loss": -5.27651834487915, "global_step": 16690, "epoch": 397} {"train_loss": -5.239228248596191, "global_step": 16691, "epoch": 397} {"train_loss": -5.197693347930908, "global_step": 16692, "epoch": 397} {"train_loss": -5.27922248840332, "global_step": 16693, "epoch": 397} {"train_loss": -5.232381343841553, "global_step": 16694, "epoch": 397} {"train_loss": -5.307074069976807, "global_step": 16695, "epoch": 397} {"train_loss": -5.18817138671875, "global_step": 16696, "epoch": 397} {"train_loss": -5.209999084472656, "global_step": 16697, "epoch": 397} {"train_loss": -5.325976371765137, "global_step": 16698, "epoch": 397} {"train_loss": -5.325555801391602, "global_step": 16699, "epoch": 397} {"train_loss": -5.246159553527832, "global_step": 16700, "epoch": 397} {"train_loss": -5.162267684936523, "global_step": 16701, "epoch": 397} {"train_loss": -5.17344856262207, "global_step": 16702, "epoch": 397} {"train_loss": -5.119019985198975, "global_step": 16703, "epoch": 397} {"train_loss": -5.274652481079102, "global_step": 16704, "epoch": 397} {"train_loss": -5.2550153732299805, "global_step": 16705, "epoch": 397} {"train_loss": -5.131746768951416, "global_step": 16706, "epoch": 397} {"train_loss": -5.0656962394714355, "global_step": 16707, "epoch": 397} {"train_loss": -5.2225847244262695, "global_step": 16708, "epoch": 397} {"train_loss": -5.100218772888184, "global_step": 16709, "epoch": 397} {"train_loss": -5.070561408996582, "global_step": 16710, "epoch": 397} {"train_loss": -5.200990676879883, "global_step": 16711, "epoch": 397} {"train_loss": -4.976140022277832, "global_step": 16712, "epoch": 397} {"train_loss": -5.319076061248779, "global_step": 16713, "epoch": 397} {"train_loss": -5.199860095977783, "global_step": 16714, "epoch": 397} {"train_loss": -5.189933084306263, "global_step": 16715, "epoch": 397, "val_loss": 69154.578125} {"train_loss": -5.180423736572266, "global_step": 16716, "epoch": 398} {"train_loss": -5.105376243591309, "global_step": 16717, "epoch": 398} {"train_loss": -5.2005109786987305, "global_step": 16718, "epoch": 398} {"train_loss": -5.323610782623291, "global_step": 16719, "epoch": 398} {"train_loss": -5.29781436920166, "global_step": 16720, "epoch": 398} {"train_loss": -5.285980701446533, "global_step": 16721, "epoch": 398} {"train_loss": -5.072892189025879, "global_step": 16722, "epoch": 398} {"train_loss": -5.152755260467529, "global_step": 16723, "epoch": 398} {"train_loss": -5.152191162109375, "global_step": 16724, "epoch": 398} {"train_loss": -5.1679792404174805, "global_step": 16725, "epoch": 398} {"train_loss": -5.150996208190918, "global_step": 16726, "epoch": 398} {"train_loss": -5.283712387084961, "global_step": 16727, "epoch": 398} {"train_loss": -5.168094158172607, "global_step": 16728, "epoch": 398} {"train_loss": -5.090217113494873, "global_step": 16729, "epoch": 398} {"train_loss": -5.203555107116699, "global_step": 16730, "epoch": 398} {"train_loss": -5.182618618011475, "global_step": 16731, "epoch": 398} {"train_loss": -5.189206600189209, "global_step": 16732, "epoch": 398} {"train_loss": -5.095372676849365, "global_step": 16733, "epoch": 398} {"train_loss": -5.421594619750977, "global_step": 16734, "epoch": 398} {"train_loss": -5.122024059295654, "global_step": 16735, "epoch": 398} {"train_loss": -5.240942001342773, "global_step": 16736, "epoch": 398} {"train_loss": -5.311432838439941, "global_step": 16737, "epoch": 398} {"train_loss": -5.220828056335449, "global_step": 16738, "epoch": 398} {"train_loss": -5.32979154586792, "global_step": 16739, "epoch": 398} {"train_loss": -5.267244338989258, "global_step": 16740, "epoch": 398} {"train_loss": -5.317389488220215, "global_step": 16741, "epoch": 398} {"train_loss": -5.309643268585205, "global_step": 16742, "epoch": 398} {"train_loss": -5.282082557678223, "global_step": 16743, "epoch": 398} {"train_loss": -5.173226356506348, "global_step": 16744, "epoch": 398} {"train_loss": -5.162757396697998, "global_step": 16745, "epoch": 398} {"train_loss": -5.173069000244141, "global_step": 16746, "epoch": 398} {"train_loss": -5.177599906921387, "global_step": 16747, "epoch": 398} {"train_loss": -5.145625114440918, "global_step": 16748, "epoch": 398} {"train_loss": -5.300407409667969, "global_step": 16749, "epoch": 398} {"train_loss": -5.140913486480713, "global_step": 16750, "epoch": 398} {"train_loss": -5.253109931945801, "global_step": 16751, "epoch": 398} {"train_loss": -5.241805076599121, "global_step": 16752, "epoch": 398} {"train_loss": -5.14793586730957, "global_step": 16753, "epoch": 398} {"train_loss": -5.056494235992432, "global_step": 16754, "epoch": 398} {"train_loss": -5.175479888916016, "global_step": 16755, "epoch": 398} {"train_loss": -5.2076873779296875, "global_step": 16756, "epoch": 398} {"train_loss": -5.202274299803234, "global_step": 16757, "epoch": 398, "val_loss": 69287.8515625} {"train_loss": -5.232550144195557, "global_step": 16758, "epoch": 399} {"train_loss": -5.136697769165039, "global_step": 16759, "epoch": 399} {"train_loss": -5.122832775115967, "global_step": 16760, "epoch": 399} {"train_loss": -5.269070625305176, "global_step": 16761, "epoch": 399} {"train_loss": -5.206544876098633, "global_step": 16762, "epoch": 399} {"train_loss": -5.1621928215026855, "global_step": 16763, "epoch": 399} {"train_loss": -5.195331573486328, "global_step": 16764, "epoch": 399} {"train_loss": -5.1617431640625, "global_step": 16765, "epoch": 399} {"train_loss": -5.125604629516602, "global_step": 16766, "epoch": 399} {"train_loss": -5.231986999511719, "global_step": 16767, "epoch": 399} {"train_loss": -5.186866283416748, "global_step": 16768, "epoch": 399} {"train_loss": -5.043277740478516, "global_step": 16769, "epoch": 399} {"train_loss": -5.242002487182617, "global_step": 16770, "epoch": 399} {"train_loss": -5.1534037590026855, "global_step": 16771, "epoch": 399} {"train_loss": -5.066385269165039, "global_step": 16772, "epoch": 399} {"train_loss": -5.269516468048096, "global_step": 16773, "epoch": 399} {"train_loss": -5.041501998901367, "global_step": 16774, "epoch": 399} {"train_loss": -5.195963382720947, "global_step": 16775, "epoch": 399} {"train_loss": -5.185056686401367, "global_step": 16776, "epoch": 399} {"train_loss": -5.035167694091797, "global_step": 16777, "epoch": 399} {"train_loss": -5.250008583068848, "global_step": 16778, "epoch": 399} {"train_loss": -5.075698375701904, "global_step": 16779, "epoch": 399} {"train_loss": -5.2648515701293945, "global_step": 16780, "epoch": 399} {"train_loss": -5.227415084838867, "global_step": 16781, "epoch": 399} {"train_loss": -5.251729965209961, "global_step": 16782, "epoch": 399} {"train_loss": -5.088824272155762, "global_step": 16783, "epoch": 399} {"train_loss": -5.302987575531006, "global_step": 16784, "epoch": 399} {"train_loss": -5.212867259979248, "global_step": 16785, "epoch": 399} {"train_loss": -5.2536396980285645, "global_step": 16786, "epoch": 399} {"train_loss": -5.324967384338379, "global_step": 16787, "epoch": 399} {"train_loss": -5.1362199783325195, "global_step": 16788, "epoch": 399} {"train_loss": -5.269857883453369, "global_step": 16789, "epoch": 399} {"train_loss": -5.13504695892334, "global_step": 16790, "epoch": 399} {"train_loss": -5.251140594482422, "global_step": 16791, "epoch": 399} {"train_loss": -5.320062637329102, "global_step": 16792, "epoch": 399} {"train_loss": -5.189122200012207, "global_step": 16793, "epoch": 399} {"train_loss": -5.213551998138428, "global_step": 16794, "epoch": 399} {"train_loss": -5.126700401306152, "global_step": 16795, "epoch": 399} {"train_loss": -5.319900989532471, "global_step": 16796, "epoch": 399} {"train_loss": -5.2424116134643555, "global_step": 16797, "epoch": 399} {"train_loss": -5.264559745788574, "global_step": 16798, "epoch": 399} {"train_loss": -5.195561488469441, "global_step": 16799, "epoch": 399, "val_loss": 68827.96875} {"train_loss": -5.341963291168213, "global_step": 16800, "epoch": 400} {"train_loss": -5.284829616546631, "global_step": 16801, "epoch": 400} {"train_loss": -5.143149375915527, "global_step": 16802, "epoch": 400} {"train_loss": -5.294139385223389, "global_step": 16803, "epoch": 400} {"train_loss": -5.317105293273926, "global_step": 16804, "epoch": 400} {"train_loss": -5.198624610900879, "global_step": 16805, "epoch": 400} {"train_loss": -5.0560760498046875, "global_step": 16806, "epoch": 400} {"train_loss": -5.337536811828613, "global_step": 16807, "epoch": 400} {"train_loss": -5.026913642883301, "global_step": 16808, "epoch": 400} {"train_loss": -5.121549606323242, "global_step": 16809, "epoch": 400} {"train_loss": -5.192014694213867, "global_step": 16810, "epoch": 400} {"train_loss": -5.115564346313477, "global_step": 16811, "epoch": 400} {"train_loss": -5.186396598815918, "global_step": 16812, "epoch": 400} {"train_loss": -5.163775444030762, "global_step": 16813, "epoch": 400} {"train_loss": -5.110318660736084, "global_step": 16814, "epoch": 400} {"train_loss": -5.396678924560547, "global_step": 16815, "epoch": 400} {"train_loss": -5.280313491821289, "global_step": 16816, "epoch": 400} {"train_loss": -5.230926513671875, "global_step": 16817, "epoch": 400} {"train_loss": -5.352720260620117, "global_step": 16818, "epoch": 400} {"train_loss": -5.167206764221191, "global_step": 16819, "epoch": 400} {"train_loss": -5.313942909240723, "global_step": 16820, "epoch": 400} {"train_loss": -5.078066825866699, "global_step": 16821, "epoch": 400} {"train_loss": -5.277581691741943, "global_step": 16822, "epoch": 400} {"train_loss": -5.246259689331055, "global_step": 16823, "epoch": 400} {"train_loss": -5.172860622406006, "global_step": 16824, "epoch": 400} {"train_loss": -5.096706390380859, "global_step": 16825, "epoch": 400} {"train_loss": -5.213364601135254, "global_step": 16826, "epoch": 400} {"train_loss": -5.263022422790527, "global_step": 16827, "epoch": 400} {"train_loss": -5.224051475524902, "global_step": 16828, "epoch": 400} {"train_loss": -5.097434043884277, "global_step": 16829, "epoch": 400} {"train_loss": -5.285000801086426, "global_step": 16830, "epoch": 400} {"train_loss": -5.288051605224609, "global_step": 16831, "epoch": 400} {"train_loss": -5.166953086853027, "global_step": 16832, "epoch": 400} {"train_loss": -5.0984787940979, "global_step": 16833, "epoch": 400} {"train_loss": -5.176163673400879, "global_step": 16834, "epoch": 400} {"train_loss": -5.2395477294921875, "global_step": 16835, "epoch": 400} {"train_loss": -5.197338104248047, "global_step": 16836, "epoch": 400} {"train_loss": -5.334901332855225, "global_step": 16837, "epoch": 400} {"train_loss": -5.279884338378906, "global_step": 16838, "epoch": 400} {"train_loss": -5.165219306945801, "global_step": 16839, "epoch": 400} {"train_loss": -5.258380889892578, "global_step": 16840, "epoch": 400} {"train_loss": -5.214954115095592, "global_step": 16841, "epoch": 400, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.17866582207360657, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.13296693985349356, "train/sim_max_reward_4": 0.6872176964437908, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.0, "test/sim_max_reward_4300002": 0.47038990895136795, "test/sim_max_reward_4300003": 0.4057574778773398, "test/sim_max_reward_4300004": 0.5251340656536758, "test/sim_max_reward_4300005": 0.4244552066550228, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.28306890563637555, "test/sim_max_reward_4300008": 0.1939854333389353, "test/sim_max_reward_4300009": 0.08449405830810773, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.13203558975308574, "test/sim_max_reward_4300012": 0.3836963034986307, "test/sim_max_reward_4300013": 0.3735263863250828, "test/sim_max_reward_4300014": 0.42015102681870337, "test/sim_max_reward_4300015": 0.36427290694651815, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.4568383342679663, "test/sim_max_reward_4300018": 0.38574185528962923, "test/sim_max_reward_4300019": 0.17040466261515588, "test/sim_max_reward_4300020": 0.10041001002901379, "test/sim_max_reward_4300021": 0.1837328458411909, "test/sim_max_reward_4300022": 0.04117439532564052, "test/sim_max_reward_4300023": 0.3446043638239847, "test/sim_max_reward_4300024": 0.3300437614133009, "test/sim_max_reward_4300025": 0.08847875242732427, "test/sim_max_reward_4300026": 0.20509367173120643, "test/sim_max_reward_4300027": 0.0, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.10454369721778754, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.47761637808531227, "test/sim_max_reward_4300034": 0.5151422662791116, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.6573651736764728, "test/sim_max_reward_4300038": 0.5830522545943015, "test/sim_max_reward_4300039": 0.47179877468029285, "test/sim_max_reward_4300040": 0.0742514929086571, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7253830801952529, "test/sim_max_reward_4300043": 0.39392039434290654, "test/sim_max_reward_4300044": 0.06334236656334567, "test/sim_max_reward_4300045": 0.0, "test/sim_max_reward_4300046": 0.0, "test/sim_max_reward_4300047": 0.6072605069197713, "test/sim_max_reward_4300048": 0.4940832760862799, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.23035545238985508, "test/mean_score": 0.2383805202757977, "val_loss": 69912.90625} {"train_loss": -5.1530280113220215, "global_step": 16842, "epoch": 401} {"train_loss": -5.283010482788086, "global_step": 16843, "epoch": 401} {"train_loss": -5.15394926071167, "global_step": 16844, "epoch": 401} {"train_loss": -5.23266077041626, "global_step": 16845, "epoch": 401} {"train_loss": -5.3057026863098145, "global_step": 16846, "epoch": 401} {"train_loss": -5.248561859130859, "global_step": 16847, "epoch": 401} {"train_loss": -5.223555564880371, "global_step": 16848, "epoch": 401} {"train_loss": -5.201125144958496, "global_step": 16849, "epoch": 401} {"train_loss": -5.092988967895508, "global_step": 16850, "epoch": 401} {"train_loss": -5.205018997192383, "global_step": 16851, "epoch": 401} {"train_loss": -5.193053722381592, "global_step": 16852, "epoch": 401} {"train_loss": -5.254558086395264, "global_step": 16853, "epoch": 401} {"train_loss": -5.306268692016602, "global_step": 16854, "epoch": 401} {"train_loss": -5.036201477050781, "global_step": 16855, "epoch": 401} {"train_loss": -5.138575553894043, "global_step": 16856, "epoch": 401} {"train_loss": -5.279559135437012, "global_step": 16857, "epoch": 401} {"train_loss": -5.273860454559326, "global_step": 16858, "epoch": 401} {"train_loss": -5.072871685028076, "global_step": 16859, "epoch": 401} {"train_loss": -5.417268753051758, "global_step": 16860, "epoch": 401} {"train_loss": -5.088852882385254, "global_step": 16861, "epoch": 401} {"train_loss": -5.078281879425049, "global_step": 16862, "epoch": 401} {"train_loss": -5.18271541595459, "global_step": 16863, "epoch": 401} {"train_loss": -5.067531585693359, "global_step": 16864, "epoch": 401} {"train_loss": -5.258378028869629, "global_step": 16865, "epoch": 401} {"train_loss": -5.237462997436523, "global_step": 16866, "epoch": 401} {"train_loss": -5.116204738616943, "global_step": 16867, "epoch": 401} {"train_loss": -5.346929550170898, "global_step": 16868, "epoch": 401} {"train_loss": -5.256145477294922, "global_step": 16869, "epoch": 401} {"train_loss": -5.112973213195801, "global_step": 16870, "epoch": 401} {"train_loss": -5.126524925231934, "global_step": 16871, "epoch": 401} {"train_loss": -4.9647393226623535, "global_step": 16872, "epoch": 401} {"train_loss": -5.301263809204102, "global_step": 16873, "epoch": 401} {"train_loss": -5.199784755706787, "global_step": 16874, "epoch": 401} {"train_loss": -5.125434398651123, "global_step": 16875, "epoch": 401} {"train_loss": -5.2797698974609375, "global_step": 16876, "epoch": 401} {"train_loss": -5.162035942077637, "global_step": 16877, "epoch": 401} {"train_loss": -5.253836631774902, "global_step": 16878, "epoch": 401} {"train_loss": -5.317384719848633, "global_step": 16879, "epoch": 401} {"train_loss": -5.1704535484313965, "global_step": 16880, "epoch": 401} {"train_loss": -5.1908063888549805, "global_step": 16881, "epoch": 401} {"train_loss": -5.277456760406494, "global_step": 16882, "epoch": 401} {"train_loss": -5.20250712122236, "global_step": 16883, "epoch": 401, "val_loss": 69600.3359375} {"train_loss": -5.349523544311523, "global_step": 16884, "epoch": 402} {"train_loss": -5.140676498413086, "global_step": 16885, "epoch": 402} {"train_loss": -5.185479640960693, "global_step": 16886, "epoch": 402} {"train_loss": -5.238068580627441, "global_step": 16887, "epoch": 402} {"train_loss": -5.240171432495117, "global_step": 16888, "epoch": 402} {"train_loss": -5.127132415771484, "global_step": 16889, "epoch": 402} {"train_loss": -5.2463579177856445, "global_step": 16890, "epoch": 402} {"train_loss": -5.214938163757324, "global_step": 16891, "epoch": 402} {"train_loss": -5.100014686584473, "global_step": 16892, "epoch": 402} {"train_loss": -5.074872016906738, "global_step": 16893, "epoch": 402} {"train_loss": -5.321430206298828, "global_step": 16894, "epoch": 402} {"train_loss": -5.137342929840088, "global_step": 16895, "epoch": 402} {"train_loss": -5.311129570007324, "global_step": 16896, "epoch": 402} {"train_loss": -5.247675895690918, "global_step": 16897, "epoch": 402} {"train_loss": -5.057238578796387, "global_step": 16898, "epoch": 402} {"train_loss": -5.295521259307861, "global_step": 16899, "epoch": 402} {"train_loss": -5.24884033203125, "global_step": 16900, "epoch": 402} {"train_loss": -5.226017951965332, "global_step": 16901, "epoch": 402} {"train_loss": -5.1455559730529785, "global_step": 16902, "epoch": 402} {"train_loss": -5.073581695556641, "global_step": 16903, "epoch": 402} {"train_loss": -5.231438636779785, "global_step": 16904, "epoch": 402} {"train_loss": -5.150122165679932, "global_step": 16905, "epoch": 402} {"train_loss": -5.139822006225586, "global_step": 16906, "epoch": 402} {"train_loss": -5.2628936767578125, "global_step": 16907, "epoch": 402} {"train_loss": -5.2529683113098145, "global_step": 16908, "epoch": 402} {"train_loss": -5.187167167663574, "global_step": 16909, "epoch": 402} {"train_loss": -5.31535530090332, "global_step": 16910, "epoch": 402} {"train_loss": -5.235779762268066, "global_step": 16911, "epoch": 402} {"train_loss": -5.120828151702881, "global_step": 16912, "epoch": 402} {"train_loss": -5.3987250328063965, "global_step": 16913, "epoch": 402} {"train_loss": -5.209030628204346, "global_step": 16914, "epoch": 402} {"train_loss": -5.197634220123291, "global_step": 16915, "epoch": 402} {"train_loss": -5.387584686279297, "global_step": 16916, "epoch": 402} {"train_loss": -5.315255165100098, "global_step": 16917, "epoch": 402} {"train_loss": -5.271322250366211, "global_step": 16918, "epoch": 402} {"train_loss": -5.328762054443359, "global_step": 16919, "epoch": 402} {"train_loss": -5.253565788269043, "global_step": 16920, "epoch": 402} {"train_loss": -5.213711738586426, "global_step": 16921, "epoch": 402} {"train_loss": -5.21151876449585, "global_step": 16922, "epoch": 402} {"train_loss": -5.184179306030273, "global_step": 16923, "epoch": 402} {"train_loss": -5.189691543579102, "global_step": 16924, "epoch": 402} {"train_loss": -5.220137425831386, "global_step": 16925, "epoch": 402, "val_loss": 68876.1015625} {"train_loss": -5.358527183532715, "global_step": 16926, "epoch": 403} {"train_loss": -5.061286926269531, "global_step": 16927, "epoch": 403} {"train_loss": -5.245007038116455, "global_step": 16928, "epoch": 403} {"train_loss": -5.353789329528809, "global_step": 16929, "epoch": 403} {"train_loss": -5.370065689086914, "global_step": 16930, "epoch": 403} {"train_loss": -5.191083908081055, "global_step": 16931, "epoch": 403} {"train_loss": -5.270731449127197, "global_step": 16932, "epoch": 403} {"train_loss": -5.193758964538574, "global_step": 16933, "epoch": 403} {"train_loss": -5.213050842285156, "global_step": 16934, "epoch": 403} {"train_loss": -5.121920108795166, "global_step": 16935, "epoch": 403} {"train_loss": -5.270286560058594, "global_step": 16936, "epoch": 403} {"train_loss": -5.237452983856201, "global_step": 16937, "epoch": 403} {"train_loss": -5.065953731536865, "global_step": 16938, "epoch": 403} {"train_loss": -5.367511749267578, "global_step": 16939, "epoch": 403} {"train_loss": -5.262031555175781, "global_step": 16940, "epoch": 403} {"train_loss": -5.260199069976807, "global_step": 16941, "epoch": 403} {"train_loss": -5.310177803039551, "global_step": 16942, "epoch": 403} {"train_loss": -5.10039758682251, "global_step": 16943, "epoch": 403} {"train_loss": -5.300715923309326, "global_step": 16944, "epoch": 403} {"train_loss": -5.179673671722412, "global_step": 16945, "epoch": 403} {"train_loss": -5.298940658569336, "global_step": 16946, "epoch": 403} {"train_loss": -5.149324417114258, "global_step": 16947, "epoch": 403} {"train_loss": -5.288378715515137, "global_step": 16948, "epoch": 403} {"train_loss": -5.149764060974121, "global_step": 16949, "epoch": 403} {"train_loss": -5.224429607391357, "global_step": 16950, "epoch": 403} {"train_loss": -5.19672966003418, "global_step": 16951, "epoch": 403} {"train_loss": -5.107882499694824, "global_step": 16952, "epoch": 403} {"train_loss": -5.304904937744141, "global_step": 16953, "epoch": 403} {"train_loss": -5.152020454406738, "global_step": 16954, "epoch": 403} {"train_loss": -5.223649024963379, "global_step": 16955, "epoch": 403} {"train_loss": -5.346717834472656, "global_step": 16956, "epoch": 403} {"train_loss": -5.2423505783081055, "global_step": 16957, "epoch": 403} {"train_loss": -5.175187110900879, "global_step": 16958, "epoch": 403} {"train_loss": -5.221297740936279, "global_step": 16959, "epoch": 403} {"train_loss": -5.216736316680908, "global_step": 16960, "epoch": 403} {"train_loss": -5.170187473297119, "global_step": 16961, "epoch": 403} {"train_loss": -5.109369277954102, "global_step": 16962, "epoch": 403} {"train_loss": -5.190806865692139, "global_step": 16963, "epoch": 403} {"train_loss": -5.24085807800293, "global_step": 16964, "epoch": 403} {"train_loss": -5.178371429443359, "global_step": 16965, "epoch": 403} {"train_loss": -5.351111888885498, "global_step": 16966, "epoch": 403} {"train_loss": -5.2245335805983775, "global_step": 16967, "epoch": 403, "val_loss": 69351.59375} {"train_loss": -5.180618762969971, "global_step": 16968, "epoch": 404} {"train_loss": -5.263446807861328, "global_step": 16969, "epoch": 404} {"train_loss": -5.247315406799316, "global_step": 16970, "epoch": 404} {"train_loss": -5.169893264770508, "global_step": 16971, "epoch": 404} {"train_loss": -5.2541184425354, "global_step": 16972, "epoch": 404} {"train_loss": -5.25393009185791, "global_step": 16973, "epoch": 404} {"train_loss": -5.264621734619141, "global_step": 16974, "epoch": 404} {"train_loss": -5.296277046203613, "global_step": 16975, "epoch": 404} {"train_loss": -5.1698102951049805, "global_step": 16976, "epoch": 404} {"train_loss": -5.370743751525879, "global_step": 16977, "epoch": 404} {"train_loss": -5.304570198059082, "global_step": 16978, "epoch": 404} {"train_loss": -5.324192523956299, "global_step": 16979, "epoch": 404} {"train_loss": -5.4267096519470215, "global_step": 16980, "epoch": 404} {"train_loss": -5.277294158935547, "global_step": 16981, "epoch": 404} {"train_loss": -5.2100677490234375, "global_step": 16982, "epoch": 404} {"train_loss": -5.281899929046631, "global_step": 16983, "epoch": 404} {"train_loss": -5.3340559005737305, "global_step": 16984, "epoch": 404} {"train_loss": -5.248693943023682, "global_step": 16985, "epoch": 404} {"train_loss": -5.2096099853515625, "global_step": 16986, "epoch": 404} {"train_loss": -5.272793769836426, "global_step": 16987, "epoch": 404} {"train_loss": -5.3507843017578125, "global_step": 16988, "epoch": 404} {"train_loss": -5.2649641036987305, "global_step": 16989, "epoch": 404} {"train_loss": -5.2434234619140625, "global_step": 16990, "epoch": 404} {"train_loss": -5.320653915405273, "global_step": 16991, "epoch": 404} {"train_loss": -5.317038536071777, "global_step": 16992, "epoch": 404} {"train_loss": -5.369235038757324, "global_step": 16993, "epoch": 404} {"train_loss": -5.291358947753906, "global_step": 16994, "epoch": 404} {"train_loss": -5.162898063659668, "global_step": 16995, "epoch": 404} {"train_loss": -5.315120697021484, "global_step": 16996, "epoch": 404} {"train_loss": -5.29849910736084, "global_step": 16997, "epoch": 404} {"train_loss": -5.205733776092529, "global_step": 16998, "epoch": 404} {"train_loss": -5.292963981628418, "global_step": 16999, "epoch": 404} {"train_loss": -5.102977275848389, "global_step": 17000, "epoch": 404} {"train_loss": -5.2019524574279785, "global_step": 17001, "epoch": 404} {"train_loss": -5.089400291442871, "global_step": 17002, "epoch": 404} {"train_loss": -5.209312438964844, "global_step": 17003, "epoch": 404} {"train_loss": -5.251186847686768, "global_step": 17004, "epoch": 404} {"train_loss": -5.187978744506836, "global_step": 17005, "epoch": 404} {"train_loss": -5.197604656219482, "global_step": 17006, "epoch": 404} {"train_loss": -5.319089889526367, "global_step": 17007, "epoch": 404} {"train_loss": -5.258077621459961, "global_step": 17008, "epoch": 404} {"train_loss": -5.254832710538592, "global_step": 17009, "epoch": 404, "val_loss": 68580.3359375} {"train_loss": -5.245721817016602, "global_step": 17010, "epoch": 405} {"train_loss": -5.236501216888428, "global_step": 17011, "epoch": 405} {"train_loss": -5.244418144226074, "global_step": 17012, "epoch": 405} {"train_loss": -5.1031084060668945, "global_step": 17013, "epoch": 405} {"train_loss": -5.353834629058838, "global_step": 17014, "epoch": 405} {"train_loss": -5.18395471572876, "global_step": 17015, "epoch": 405} {"train_loss": -4.971460342407227, "global_step": 17016, "epoch": 405} {"train_loss": -5.170337200164795, "global_step": 17017, "epoch": 405} {"train_loss": -5.1663031578063965, "global_step": 17018, "epoch": 405} {"train_loss": -5.141145706176758, "global_step": 17019, "epoch": 405} {"train_loss": -5.189248085021973, "global_step": 17020, "epoch": 405} {"train_loss": -5.230708122253418, "global_step": 17021, "epoch": 405} {"train_loss": -5.244431495666504, "global_step": 17022, "epoch": 405} {"train_loss": -5.139261722564697, "global_step": 17023, "epoch": 405} {"train_loss": -5.204169273376465, "global_step": 17024, "epoch": 405} {"train_loss": -5.16348934173584, "global_step": 17025, "epoch": 405} {"train_loss": -5.239737510681152, "global_step": 17026, "epoch": 405} {"train_loss": -5.279660224914551, "global_step": 17027, "epoch": 405} {"train_loss": -5.340778350830078, "global_step": 17028, "epoch": 405} {"train_loss": -5.375077247619629, "global_step": 17029, "epoch": 405} {"train_loss": -5.2226667404174805, "global_step": 17030, "epoch": 405} {"train_loss": -5.318322658538818, "global_step": 17031, "epoch": 405} {"train_loss": -5.249734878540039, "global_step": 17032, "epoch": 405} {"train_loss": -5.263495445251465, "global_step": 17033, "epoch": 405} {"train_loss": -5.348643779754639, "global_step": 17034, "epoch": 405} {"train_loss": -5.15240478515625, "global_step": 17035, "epoch": 405} {"train_loss": -5.281996250152588, "global_step": 17036, "epoch": 405} {"train_loss": -5.221706867218018, "global_step": 17037, "epoch": 405} {"train_loss": -5.213468551635742, "global_step": 17038, "epoch": 405} {"train_loss": -5.264898300170898, "global_step": 17039, "epoch": 405} {"train_loss": -5.0251641273498535, "global_step": 17040, "epoch": 405} {"train_loss": -5.16538667678833, "global_step": 17041, "epoch": 405} {"train_loss": -5.349897384643555, "global_step": 17042, "epoch": 405} {"train_loss": -5.15861701965332, "global_step": 17043, "epoch": 405} {"train_loss": -5.234546661376953, "global_step": 17044, "epoch": 405} {"train_loss": -5.129614353179932, "global_step": 17045, "epoch": 405} {"train_loss": -5.2183380126953125, "global_step": 17046, "epoch": 405} {"train_loss": -5.03790283203125, "global_step": 17047, "epoch": 405} {"train_loss": -5.313056945800781, "global_step": 17048, "epoch": 405} {"train_loss": -5.3400678634643555, "global_step": 17049, "epoch": 405} {"train_loss": -5.126343727111816, "global_step": 17050, "epoch": 405} {"train_loss": -5.217393931888399, "global_step": 17051, "epoch": 405, "val_loss": 69146.234375} {"train_loss": -5.137598991394043, "global_step": 17052, "epoch": 406} {"train_loss": -5.167410373687744, "global_step": 17053, "epoch": 406} {"train_loss": -5.5409650802612305, "global_step": 17054, "epoch": 406} {"train_loss": -5.294053077697754, "global_step": 17055, "epoch": 406} {"train_loss": -5.228772163391113, "global_step": 17056, "epoch": 406} {"train_loss": -5.195257663726807, "global_step": 17057, "epoch": 406} {"train_loss": -5.094363212585449, "global_step": 17058, "epoch": 406} {"train_loss": -5.1330671310424805, "global_step": 17059, "epoch": 406} {"train_loss": -5.167567253112793, "global_step": 17060, "epoch": 406} {"train_loss": -5.073188781738281, "global_step": 17061, "epoch": 406} {"train_loss": -5.196732521057129, "global_step": 17062, "epoch": 406} {"train_loss": -5.199296474456787, "global_step": 17063, "epoch": 406} {"train_loss": -5.344079971313477, "global_step": 17064, "epoch": 406} {"train_loss": -5.317605972290039, "global_step": 17065, "epoch": 406} {"train_loss": -5.193886756896973, "global_step": 17066, "epoch": 406} {"train_loss": -5.184377670288086, "global_step": 17067, "epoch": 406} {"train_loss": -5.243395805358887, "global_step": 17068, "epoch": 406} {"train_loss": -5.268903732299805, "global_step": 17069, "epoch": 406} {"train_loss": -5.227778434753418, "global_step": 17070, "epoch": 406} {"train_loss": -5.316828727722168, "global_step": 17071, "epoch": 406} {"train_loss": -5.1963300704956055, "global_step": 17072, "epoch": 406} {"train_loss": -5.271697521209717, "global_step": 17073, "epoch": 406} {"train_loss": -5.39026403427124, "global_step": 17074, "epoch": 406} {"train_loss": -5.326410293579102, "global_step": 17075, "epoch": 406} {"train_loss": -5.246293067932129, "global_step": 17076, "epoch": 406} {"train_loss": -5.176606178283691, "global_step": 17077, "epoch": 406} {"train_loss": -5.285715579986572, "global_step": 17078, "epoch": 406} {"train_loss": -5.241238594055176, "global_step": 17079, "epoch": 406} {"train_loss": -5.097554683685303, "global_step": 17080, "epoch": 406} {"train_loss": -5.351509094238281, "global_step": 17081, "epoch": 406} {"train_loss": -5.332000732421875, "global_step": 17082, "epoch": 406} {"train_loss": -5.171830177307129, "global_step": 17083, "epoch": 406} {"train_loss": -5.098237991333008, "global_step": 17084, "epoch": 406} {"train_loss": -5.346600532531738, "global_step": 17085, "epoch": 406} {"train_loss": -5.248430252075195, "global_step": 17086, "epoch": 406} {"train_loss": -5.1887054443359375, "global_step": 17087, "epoch": 406} {"train_loss": -5.295125484466553, "global_step": 17088, "epoch": 406} {"train_loss": -5.291299343109131, "global_step": 17089, "epoch": 406} {"train_loss": -5.095561504364014, "global_step": 17090, "epoch": 406} {"train_loss": -5.210929870605469, "global_step": 17091, "epoch": 406} {"train_loss": -5.188580513000488, "global_step": 17092, "epoch": 406} {"train_loss": -5.232481911068871, "global_step": 17093, "epoch": 406, "val_loss": 69102.0625} {"train_loss": -5.2873640060424805, "global_step": 17094, "epoch": 407} {"train_loss": -5.027918815612793, "global_step": 17095, "epoch": 407} {"train_loss": -5.301329612731934, "global_step": 17096, "epoch": 407} {"train_loss": -5.163731575012207, "global_step": 17097, "epoch": 407} {"train_loss": -5.11012601852417, "global_step": 17098, "epoch": 407} {"train_loss": -5.3928728103637695, "global_step": 17099, "epoch": 407} {"train_loss": -5.358067035675049, "global_step": 17100, "epoch": 407} {"train_loss": -5.189662933349609, "global_step": 17101, "epoch": 407} {"train_loss": -5.341300964355469, "global_step": 17102, "epoch": 407} {"train_loss": -5.205008506774902, "global_step": 17103, "epoch": 407} {"train_loss": -5.253021240234375, "global_step": 17104, "epoch": 407} {"train_loss": -5.138974189758301, "global_step": 17105, "epoch": 407} {"train_loss": -5.33410120010376, "global_step": 17106, "epoch": 407} {"train_loss": -5.375578880310059, "global_step": 17107, "epoch": 407} {"train_loss": -5.176488876342773, "global_step": 17108, "epoch": 407} {"train_loss": -5.38587760925293, "global_step": 17109, "epoch": 407} {"train_loss": -5.161094665527344, "global_step": 17110, "epoch": 407} {"train_loss": -5.180665969848633, "global_step": 17111, "epoch": 407} {"train_loss": -5.320332050323486, "global_step": 17112, "epoch": 407} {"train_loss": -5.270251274108887, "global_step": 17113, "epoch": 407} {"train_loss": -5.103906154632568, "global_step": 17114, "epoch": 407} {"train_loss": -5.2079925537109375, "global_step": 17115, "epoch": 407} {"train_loss": -5.209005832672119, "global_step": 17116, "epoch": 407} {"train_loss": -5.267334461212158, "global_step": 17117, "epoch": 407} {"train_loss": -5.21378231048584, "global_step": 17118, "epoch": 407} {"train_loss": -5.252089500427246, "global_step": 17119, "epoch": 407} {"train_loss": -5.06689977645874, "global_step": 17120, "epoch": 407} {"train_loss": -5.1525373458862305, "global_step": 17121, "epoch": 407} {"train_loss": -5.133954048156738, "global_step": 17122, "epoch": 407} {"train_loss": -4.983747959136963, "global_step": 17123, "epoch": 407} {"train_loss": -5.245058536529541, "global_step": 17124, "epoch": 407} {"train_loss": -5.297347545623779, "global_step": 17125, "epoch": 407} {"train_loss": -5.2605485916137695, "global_step": 17126, "epoch": 407} {"train_loss": -5.137704849243164, "global_step": 17127, "epoch": 407} {"train_loss": -5.232083320617676, "global_step": 17128, "epoch": 407} {"train_loss": -5.32398796081543, "global_step": 17129, "epoch": 407} {"train_loss": -5.284581184387207, "global_step": 17130, "epoch": 407} {"train_loss": -5.181140899658203, "global_step": 17131, "epoch": 407} {"train_loss": -5.229597091674805, "global_step": 17132, "epoch": 407} {"train_loss": -5.278035640716553, "global_step": 17133, "epoch": 407} {"train_loss": -5.318202972412109, "global_step": 17134, "epoch": 407} {"train_loss": -5.230022578012376, "global_step": 17135, "epoch": 407, "val_loss": 68701.71875} {"train_loss": -5.25303840637207, "global_step": 17136, "epoch": 408} {"train_loss": -5.367317199707031, "global_step": 17137, "epoch": 408} {"train_loss": -5.390016555786133, "global_step": 17138, "epoch": 408} {"train_loss": -5.141196250915527, "global_step": 17139, "epoch": 408} {"train_loss": -5.216114521026611, "global_step": 17140, "epoch": 408} {"train_loss": -5.27752685546875, "global_step": 17141, "epoch": 408} {"train_loss": -5.266073226928711, "global_step": 17142, "epoch": 408} {"train_loss": -5.2564873695373535, "global_step": 17143, "epoch": 408} {"train_loss": -5.174189567565918, "global_step": 17144, "epoch": 408} {"train_loss": -5.002951622009277, "global_step": 17145, "epoch": 408} {"train_loss": -5.334990501403809, "global_step": 17146, "epoch": 408} {"train_loss": -5.400263786315918, "global_step": 17147, "epoch": 408} {"train_loss": -5.139176368713379, "global_step": 17148, "epoch": 408} {"train_loss": -5.235605716705322, "global_step": 17149, "epoch": 408} {"train_loss": -5.141261100769043, "global_step": 17150, "epoch": 408} {"train_loss": -5.2324676513671875, "global_step": 17151, "epoch": 408} {"train_loss": -5.227643966674805, "global_step": 17152, "epoch": 408} {"train_loss": -5.245424270629883, "global_step": 17153, "epoch": 408} {"train_loss": -5.233338356018066, "global_step": 17154, "epoch": 408} {"train_loss": -5.314384937286377, "global_step": 17155, "epoch": 408} {"train_loss": -5.203164100646973, "global_step": 17156, "epoch": 408} {"train_loss": -5.289736270904541, "global_step": 17157, "epoch": 408} {"train_loss": -5.183052062988281, "global_step": 17158, "epoch": 408} {"train_loss": -5.189062118530273, "global_step": 17159, "epoch": 408} {"train_loss": -5.285647392272949, "global_step": 17160, "epoch": 408} {"train_loss": -5.370165824890137, "global_step": 17161, "epoch": 408} {"train_loss": -5.2437028884887695, "global_step": 17162, "epoch": 408} {"train_loss": -5.158696174621582, "global_step": 17163, "epoch": 408} {"train_loss": -5.227921485900879, "global_step": 17164, "epoch": 408} {"train_loss": -5.334566593170166, "global_step": 17165, "epoch": 408} {"train_loss": -5.324705123901367, "global_step": 17166, "epoch": 408} {"train_loss": -5.267429828643799, "global_step": 17167, "epoch": 408} {"train_loss": -5.317111968994141, "global_step": 17168, "epoch": 408} {"train_loss": -5.24933385848999, "global_step": 17169, "epoch": 408} {"train_loss": -5.268357276916504, "global_step": 17170, "epoch": 408} {"train_loss": -5.17866849899292, "global_step": 17171, "epoch": 408} {"train_loss": -5.2934722900390625, "global_step": 17172, "epoch": 408} {"train_loss": -5.252820014953613, "global_step": 17173, "epoch": 408} {"train_loss": -5.272395133972168, "global_step": 17174, "epoch": 408} {"train_loss": -5.3101806640625, "global_step": 17175, "epoch": 408} {"train_loss": -5.2936553955078125, "global_step": 17176, "epoch": 408} {"train_loss": -5.25441388856797, "global_step": 17177, "epoch": 408, "val_loss": 68990.296875} {"train_loss": -5.1921539306640625, "global_step": 17178, "epoch": 409} {"train_loss": -5.207100868225098, "global_step": 17179, "epoch": 409} {"train_loss": -5.261031150817871, "global_step": 17180, "epoch": 409} {"train_loss": -5.0918121337890625, "global_step": 17181, "epoch": 409} {"train_loss": -5.149797439575195, "global_step": 17182, "epoch": 409} {"train_loss": -5.078452110290527, "global_step": 17183, "epoch": 409} {"train_loss": -5.245652198791504, "global_step": 17184, "epoch": 409} {"train_loss": -5.2958083152771, "global_step": 17185, "epoch": 409} {"train_loss": -5.320778846740723, "global_step": 17186, "epoch": 409} {"train_loss": -5.250059604644775, "global_step": 17187, "epoch": 409} {"train_loss": -5.148151397705078, "global_step": 17188, "epoch": 409} {"train_loss": -5.188323020935059, "global_step": 17189, "epoch": 409} {"train_loss": -5.341869354248047, "global_step": 17190, "epoch": 409} {"train_loss": -5.241040229797363, "global_step": 17191, "epoch": 409} {"train_loss": -5.165567398071289, "global_step": 17192, "epoch": 409} {"train_loss": -5.281932830810547, "global_step": 17193, "epoch": 409} {"train_loss": -5.221063613891602, "global_step": 17194, "epoch": 409} {"train_loss": -5.1746745109558105, "global_step": 17195, "epoch": 409} {"train_loss": -5.229552268981934, "global_step": 17196, "epoch": 409} {"train_loss": -5.162961959838867, "global_step": 17197, "epoch": 409} {"train_loss": -5.246048927307129, "global_step": 17198, "epoch": 409} {"train_loss": -5.195585250854492, "global_step": 17199, "epoch": 409} {"train_loss": -5.082123756408691, "global_step": 17200, "epoch": 409} {"train_loss": -5.195147514343262, "global_step": 17201, "epoch": 409} {"train_loss": -5.255860805511475, "global_step": 17202, "epoch": 409} {"train_loss": -5.186732292175293, "global_step": 17203, "epoch": 409} {"train_loss": -5.371756553649902, "global_step": 17204, "epoch": 409} {"train_loss": -5.181393623352051, "global_step": 17205, "epoch": 409} {"train_loss": -5.338068962097168, "global_step": 17206, "epoch": 409} {"train_loss": -5.308332443237305, "global_step": 17207, "epoch": 409} {"train_loss": -5.270780563354492, "global_step": 17208, "epoch": 409} {"train_loss": -5.382079124450684, "global_step": 17209, "epoch": 409} {"train_loss": -5.325142860412598, "global_step": 17210, "epoch": 409} {"train_loss": -5.404937744140625, "global_step": 17211, "epoch": 409} {"train_loss": -5.209533214569092, "global_step": 17212, "epoch": 409} {"train_loss": -5.417025566101074, "global_step": 17213, "epoch": 409} {"train_loss": -5.192501068115234, "global_step": 17214, "epoch": 409} {"train_loss": -5.338360786437988, "global_step": 17215, "epoch": 409} {"train_loss": -5.210914134979248, "global_step": 17216, "epoch": 409} {"train_loss": -5.254297256469727, "global_step": 17217, "epoch": 409} {"train_loss": -5.282833099365234, "global_step": 17218, "epoch": 409} {"train_loss": -5.240285566874912, "global_step": 17219, "epoch": 409, "val_loss": 68972.2265625} {"train_loss": -5.183191776275635, "global_step": 17220, "epoch": 410} {"train_loss": -5.228658676147461, "global_step": 17221, "epoch": 410} {"train_loss": -5.275261878967285, "global_step": 17222, "epoch": 410} {"train_loss": -5.300900936126709, "global_step": 17223, "epoch": 410} {"train_loss": -5.233328342437744, "global_step": 17224, "epoch": 410} {"train_loss": -5.209288597106934, "global_step": 17225, "epoch": 410} {"train_loss": -5.274702072143555, "global_step": 17226, "epoch": 410} {"train_loss": -5.202439308166504, "global_step": 17227, "epoch": 410} {"train_loss": -5.1849517822265625, "global_step": 17228, "epoch": 410} {"train_loss": -5.3451995849609375, "global_step": 17229, "epoch": 410} {"train_loss": -5.200594902038574, "global_step": 17230, "epoch": 410} {"train_loss": -5.25286865234375, "global_step": 17231, "epoch": 410} {"train_loss": -5.179435729980469, "global_step": 17232, "epoch": 410} {"train_loss": -5.184553146362305, "global_step": 17233, "epoch": 410} {"train_loss": -5.153098106384277, "global_step": 17234, "epoch": 410} {"train_loss": -5.179198265075684, "global_step": 17235, "epoch": 410} {"train_loss": -5.250080108642578, "global_step": 17236, "epoch": 410} {"train_loss": -5.035721778869629, "global_step": 17237, "epoch": 410} {"train_loss": -5.153682708740234, "global_step": 17238, "epoch": 410} {"train_loss": -5.233609199523926, "global_step": 17239, "epoch": 410} {"train_loss": -5.107244491577148, "global_step": 17240, "epoch": 410} {"train_loss": -5.2754411697387695, "global_step": 17241, "epoch": 410} {"train_loss": -5.104160308837891, "global_step": 17242, "epoch": 410} {"train_loss": -5.3136820793151855, "global_step": 17243, "epoch": 410} {"train_loss": -5.260025501251221, "global_step": 17244, "epoch": 410} {"train_loss": -5.304397106170654, "global_step": 17245, "epoch": 410} {"train_loss": -5.284808158874512, "global_step": 17246, "epoch": 410} {"train_loss": -5.244712829589844, "global_step": 17247, "epoch": 410} {"train_loss": -5.128451824188232, "global_step": 17248, "epoch": 410} {"train_loss": -5.158390045166016, "global_step": 17249, "epoch": 410} {"train_loss": -5.413784980773926, "global_step": 17250, "epoch": 410} {"train_loss": -5.151850700378418, "global_step": 17251, "epoch": 410} {"train_loss": -5.286555290222168, "global_step": 17252, "epoch": 410} {"train_loss": -5.206753730773926, "global_step": 17253, "epoch": 410} {"train_loss": -5.257318019866943, "global_step": 17254, "epoch": 410} {"train_loss": -5.139851093292236, "global_step": 17255, "epoch": 410} {"train_loss": -5.2318549156188965, "global_step": 17256, "epoch": 410} {"train_loss": -5.319244861602783, "global_step": 17257, "epoch": 410} {"train_loss": -5.332955360412598, "global_step": 17258, "epoch": 410} {"train_loss": -5.19893741607666, "global_step": 17259, "epoch": 410} {"train_loss": -5.176604270935059, "global_step": 17260, "epoch": 410} {"train_loss": -5.221230086826143, "global_step": 17261, "epoch": 410, "val_loss": 69345.2890625} {"train_loss": -5.114445686340332, "global_step": 17262, "epoch": 411} {"train_loss": -5.231107234954834, "global_step": 17263, "epoch": 411} {"train_loss": -5.297710418701172, "global_step": 17264, "epoch": 411} {"train_loss": -5.2598557472229, "global_step": 17265, "epoch": 411} {"train_loss": -5.145148277282715, "global_step": 17266, "epoch": 411} {"train_loss": -5.172867298126221, "global_step": 17267, "epoch": 411} {"train_loss": -5.131491661071777, "global_step": 17268, "epoch": 411} {"train_loss": -5.176352500915527, "global_step": 17269, "epoch": 411} {"train_loss": -5.360668182373047, "global_step": 17270, "epoch": 411} {"train_loss": -5.1557698249816895, "global_step": 17271, "epoch": 411} {"train_loss": -5.306488037109375, "global_step": 17272, "epoch": 411} {"train_loss": -5.310990333557129, "global_step": 17273, "epoch": 411} {"train_loss": -5.296591758728027, "global_step": 17274, "epoch": 411} {"train_loss": -5.25614070892334, "global_step": 17275, "epoch": 411} {"train_loss": -5.2467193603515625, "global_step": 17276, "epoch": 411} {"train_loss": -5.213072776794434, "global_step": 17277, "epoch": 411} {"train_loss": -5.281737327575684, "global_step": 17278, "epoch": 411} {"train_loss": -5.249813079833984, "global_step": 17279, "epoch": 411} {"train_loss": -5.2978410720825195, "global_step": 17280, "epoch": 411} {"train_loss": -5.288818836212158, "global_step": 17281, "epoch": 411} {"train_loss": -5.328531265258789, "global_step": 17282, "epoch": 411} {"train_loss": -5.223171234130859, "global_step": 17283, "epoch": 411} {"train_loss": -5.197912693023682, "global_step": 17284, "epoch": 411} {"train_loss": -5.153280258178711, "global_step": 17285, "epoch": 411} {"train_loss": -5.193726539611816, "global_step": 17286, "epoch": 411} {"train_loss": -5.160374641418457, "global_step": 17287, "epoch": 411} {"train_loss": -5.103190898895264, "global_step": 17288, "epoch": 411} {"train_loss": -5.198152542114258, "global_step": 17289, "epoch": 411} {"train_loss": -5.288166522979736, "global_step": 17290, "epoch": 411} {"train_loss": -5.091340065002441, "global_step": 17291, "epoch": 411} {"train_loss": -5.201099395751953, "global_step": 17292, "epoch": 411} {"train_loss": -5.1084489822387695, "global_step": 17293, "epoch": 411} {"train_loss": -5.136136531829834, "global_step": 17294, "epoch": 411} {"train_loss": -5.135409832000732, "global_step": 17295, "epoch": 411} {"train_loss": -5.299769878387451, "global_step": 17296, "epoch": 411} {"train_loss": -5.261016845703125, "global_step": 17297, "epoch": 411} {"train_loss": -5.342890739440918, "global_step": 17298, "epoch": 411} {"train_loss": -5.043342590332031, "global_step": 17299, "epoch": 411} {"train_loss": -5.195655345916748, "global_step": 17300, "epoch": 411} {"train_loss": -5.322739124298096, "global_step": 17301, "epoch": 411} {"train_loss": -5.2351884841918945, "global_step": 17302, "epoch": 411} {"train_loss": -5.2192879517873125, "global_step": 17303, "epoch": 411, "val_loss": 68770.2109375} {"train_loss": -5.343803405761719, "global_step": 17304, "epoch": 412} {"train_loss": -5.333062648773193, "global_step": 17305, "epoch": 412} {"train_loss": -5.338574409484863, "global_step": 17306, "epoch": 412} {"train_loss": -5.234513759613037, "global_step": 17307, "epoch": 412} {"train_loss": -5.291967391967773, "global_step": 17308, "epoch": 412} {"train_loss": -5.159914016723633, "global_step": 17309, "epoch": 412} {"train_loss": -5.316073417663574, "global_step": 17310, "epoch": 412} {"train_loss": -5.165794849395752, "global_step": 17311, "epoch": 412} {"train_loss": -5.341689109802246, "global_step": 17312, "epoch": 412} {"train_loss": -5.161307334899902, "global_step": 17313, "epoch": 412} {"train_loss": -5.168144226074219, "global_step": 17314, "epoch": 412} {"train_loss": -5.37225866317749, "global_step": 17315, "epoch": 412} {"train_loss": -5.0484724044799805, "global_step": 17316, "epoch": 412} {"train_loss": -5.027276992797852, "global_step": 17317, "epoch": 412} {"train_loss": -5.228482723236084, "global_step": 17318, "epoch": 412} {"train_loss": -5.04042911529541, "global_step": 17319, "epoch": 412} {"train_loss": -5.235700607299805, "global_step": 17320, "epoch": 412} {"train_loss": -5.272818088531494, "global_step": 17321, "epoch": 412} {"train_loss": -5.049948692321777, "global_step": 17322, "epoch": 412} {"train_loss": -5.200279712677002, "global_step": 17323, "epoch": 412} {"train_loss": -5.273997783660889, "global_step": 17324, "epoch": 412} {"train_loss": -5.206245422363281, "global_step": 17325, "epoch": 412} {"train_loss": -5.229532718658447, "global_step": 17326, "epoch": 412} {"train_loss": -5.217404842376709, "global_step": 17327, "epoch": 412} {"train_loss": -5.239441871643066, "global_step": 17328, "epoch": 412} {"train_loss": -5.28706693649292, "global_step": 17329, "epoch": 412} {"train_loss": -5.307254791259766, "global_step": 17330, "epoch": 412} {"train_loss": -5.227281093597412, "global_step": 17331, "epoch": 412} {"train_loss": -5.124510288238525, "global_step": 17332, "epoch": 412} {"train_loss": -5.209586143493652, "global_step": 17333, "epoch": 412} {"train_loss": -5.245921611785889, "global_step": 17334, "epoch": 412} {"train_loss": -5.168832778930664, "global_step": 17335, "epoch": 412} {"train_loss": -5.238661289215088, "global_step": 17336, "epoch": 412} {"train_loss": -5.270564556121826, "global_step": 17337, "epoch": 412} {"train_loss": -5.2993364334106445, "global_step": 17338, "epoch": 412} {"train_loss": -5.30596399307251, "global_step": 17339, "epoch": 412} {"train_loss": -5.279218673706055, "global_step": 17340, "epoch": 412} {"train_loss": -5.2098798751831055, "global_step": 17341, "epoch": 412} {"train_loss": -5.347761154174805, "global_step": 17342, "epoch": 412} {"train_loss": -5.189791679382324, "global_step": 17343, "epoch": 412} {"train_loss": -5.265070915222168, "global_step": 17344, "epoch": 412} {"train_loss": -5.229189123426165, "global_step": 17345, "epoch": 412, "val_loss": 68926.9921875} {"train_loss": -5.322607040405273, "global_step": 17346, "epoch": 413} {"train_loss": -5.388963222503662, "global_step": 17347, "epoch": 413} {"train_loss": -5.263850688934326, "global_step": 17348, "epoch": 413} {"train_loss": -5.162739276885986, "global_step": 17349, "epoch": 413} {"train_loss": -5.175229072570801, "global_step": 17350, "epoch": 413} {"train_loss": -5.161478519439697, "global_step": 17351, "epoch": 413} {"train_loss": -5.178986549377441, "global_step": 17352, "epoch": 413} {"train_loss": -5.324038982391357, "global_step": 17353, "epoch": 413} {"train_loss": -5.325594902038574, "global_step": 17354, "epoch": 413} {"train_loss": -5.288138389587402, "global_step": 17355, "epoch": 413} {"train_loss": -5.191126823425293, "global_step": 17356, "epoch": 413} {"train_loss": -5.254875659942627, "global_step": 17357, "epoch": 413} {"train_loss": -5.1069746017456055, "global_step": 17358, "epoch": 413} {"train_loss": -5.204320907592773, "global_step": 17359, "epoch": 413} {"train_loss": -5.098163604736328, "global_step": 17360, "epoch": 413} {"train_loss": -5.314034461975098, "global_step": 17361, "epoch": 413} {"train_loss": -5.241647720336914, "global_step": 17362, "epoch": 413} {"train_loss": -5.031369209289551, "global_step": 17363, "epoch": 413} {"train_loss": -4.989213943481445, "global_step": 17364, "epoch": 413} {"train_loss": -5.35482931137085, "global_step": 17365, "epoch": 413} {"train_loss": -4.892514228820801, "global_step": 17366, "epoch": 413} {"train_loss": -5.268250942230225, "global_step": 17367, "epoch": 413} {"train_loss": -5.243682861328125, "global_step": 17368, "epoch": 413} {"train_loss": -5.160449981689453, "global_step": 17369, "epoch": 413} {"train_loss": -5.202688217163086, "global_step": 17370, "epoch": 413} {"train_loss": -5.158836364746094, "global_step": 17371, "epoch": 413} {"train_loss": -5.0821638107299805, "global_step": 17372, "epoch": 413} {"train_loss": -5.349961280822754, "global_step": 17373, "epoch": 413} {"train_loss": -5.08359432220459, "global_step": 17374, "epoch": 413} {"train_loss": -5.363661289215088, "global_step": 17375, "epoch": 413} {"train_loss": -5.236843109130859, "global_step": 17376, "epoch": 413} {"train_loss": -5.233839511871338, "global_step": 17377, "epoch": 413} {"train_loss": -5.146173477172852, "global_step": 17378, "epoch": 413} {"train_loss": -5.055054664611816, "global_step": 17379, "epoch": 413} {"train_loss": -5.1789398193359375, "global_step": 17380, "epoch": 413} {"train_loss": -5.197965145111084, "global_step": 17381, "epoch": 413} {"train_loss": -5.279420375823975, "global_step": 17382, "epoch": 413} {"train_loss": -5.316727161407471, "global_step": 17383, "epoch": 413} {"train_loss": -5.185771942138672, "global_step": 17384, "epoch": 413} {"train_loss": -5.278843402862549, "global_step": 17385, "epoch": 413} {"train_loss": -5.224714279174805, "global_step": 17386, "epoch": 413} {"train_loss": -5.209410406294323, "global_step": 17387, "epoch": 413, "val_loss": 69129.609375} {"train_loss": -5.249992370605469, "global_step": 17388, "epoch": 414} {"train_loss": -5.231579780578613, "global_step": 17389, "epoch": 414} {"train_loss": -5.246155738830566, "global_step": 17390, "epoch": 414} {"train_loss": -5.208845615386963, "global_step": 17391, "epoch": 414} {"train_loss": -5.367597579956055, "global_step": 17392, "epoch": 414} {"train_loss": -5.472799777984619, "global_step": 17393, "epoch": 414} {"train_loss": -5.189962387084961, "global_step": 17394, "epoch": 414} {"train_loss": -5.180998802185059, "global_step": 17395, "epoch": 414} {"train_loss": -5.302967071533203, "global_step": 17396, "epoch": 414} {"train_loss": -5.272912979125977, "global_step": 17397, "epoch": 414} {"train_loss": -5.0907111167907715, "global_step": 17398, "epoch": 414} {"train_loss": -5.188582420349121, "global_step": 17399, "epoch": 414} {"train_loss": -5.338733673095703, "global_step": 17400, "epoch": 414} {"train_loss": -5.228199005126953, "global_step": 17401, "epoch": 414} {"train_loss": -5.355506896972656, "global_step": 17402, "epoch": 414} {"train_loss": -5.228992462158203, "global_step": 17403, "epoch": 414} {"train_loss": -5.128387451171875, "global_step": 17404, "epoch": 414} {"train_loss": -5.112326622009277, "global_step": 17405, "epoch": 414} {"train_loss": -5.281468391418457, "global_step": 17406, "epoch": 414} {"train_loss": -5.252901077270508, "global_step": 17407, "epoch": 414} {"train_loss": -5.103339195251465, "global_step": 17408, "epoch": 414} {"train_loss": -5.259724140167236, "global_step": 17409, "epoch": 414} {"train_loss": -5.199623107910156, "global_step": 17410, "epoch": 414} {"train_loss": -5.108880043029785, "global_step": 17411, "epoch": 414} {"train_loss": -5.305883407592773, "global_step": 17412, "epoch": 414} {"train_loss": -5.291706085205078, "global_step": 17413, "epoch": 414} {"train_loss": -5.2514967918396, "global_step": 17414, "epoch": 414} {"train_loss": -5.299360275268555, "global_step": 17415, "epoch": 414} {"train_loss": -5.120567321777344, "global_step": 17416, "epoch": 414} {"train_loss": -5.426972389221191, "global_step": 17417, "epoch": 414} {"train_loss": -5.098014831542969, "global_step": 17418, "epoch": 414} {"train_loss": -5.1912007331848145, "global_step": 17419, "epoch": 414} {"train_loss": -5.226003646850586, "global_step": 17420, "epoch": 414} {"train_loss": -5.210814476013184, "global_step": 17421, "epoch": 414} {"train_loss": -5.1861891746521, "global_step": 17422, "epoch": 414} {"train_loss": -5.303540229797363, "global_step": 17423, "epoch": 414} {"train_loss": -5.238689422607422, "global_step": 17424, "epoch": 414} {"train_loss": -5.347555637359619, "global_step": 17425, "epoch": 414} {"train_loss": -5.312827110290527, "global_step": 17426, "epoch": 414} {"train_loss": -5.300826072692871, "global_step": 17427, "epoch": 414} {"train_loss": -5.168663024902344, "global_step": 17428, "epoch": 414} {"train_loss": -5.245237486703055, "global_step": 17429, "epoch": 414, "val_loss": 69078.609375} {"train_loss": -5.276505947113037, "global_step": 17430, "epoch": 415} {"train_loss": -5.032044887542725, "global_step": 17431, "epoch": 415} {"train_loss": -5.251692295074463, "global_step": 17432, "epoch": 415} {"train_loss": -5.215025901794434, "global_step": 17433, "epoch": 415} {"train_loss": -5.225986480712891, "global_step": 17434, "epoch": 415} {"train_loss": -5.279141426086426, "global_step": 17435, "epoch": 415} {"train_loss": -5.119533061981201, "global_step": 17436, "epoch": 415} {"train_loss": -5.2342424392700195, "global_step": 17437, "epoch": 415} {"train_loss": -5.225112438201904, "global_step": 17438, "epoch": 415} {"train_loss": -5.209856033325195, "global_step": 17439, "epoch": 415} {"train_loss": -5.094002723693848, "global_step": 17440, "epoch": 415} {"train_loss": -5.155331134796143, "global_step": 17441, "epoch": 415} {"train_loss": -5.250352382659912, "global_step": 17442, "epoch": 415} {"train_loss": -5.194619178771973, "global_step": 17443, "epoch": 415} {"train_loss": -5.16510009765625, "global_step": 17444, "epoch": 415} {"train_loss": -5.339173316955566, "global_step": 17445, "epoch": 415} {"train_loss": -5.252071380615234, "global_step": 17446, "epoch": 415} {"train_loss": -5.197220802307129, "global_step": 17447, "epoch": 415} {"train_loss": -5.318720817565918, "global_step": 17448, "epoch": 415} {"train_loss": -5.062691688537598, "global_step": 17449, "epoch": 415} {"train_loss": -5.12811279296875, "global_step": 17450, "epoch": 415} {"train_loss": -5.209174156188965, "global_step": 17451, "epoch": 415} {"train_loss": -5.217755317687988, "global_step": 17452, "epoch": 415} {"train_loss": -5.267077445983887, "global_step": 17453, "epoch": 415} {"train_loss": -5.225197792053223, "global_step": 17454, "epoch": 415} {"train_loss": -5.159136772155762, "global_step": 17455, "epoch": 415} {"train_loss": -5.23078727722168, "global_step": 17456, "epoch": 415} {"train_loss": -5.393824577331543, "global_step": 17457, "epoch": 415} {"train_loss": -5.098209857940674, "global_step": 17458, "epoch": 415} {"train_loss": -5.285094738006592, "global_step": 17459, "epoch": 415} {"train_loss": -5.251795768737793, "global_step": 17460, "epoch": 415} {"train_loss": -5.132742881774902, "global_step": 17461, "epoch": 415} {"train_loss": -5.2349138259887695, "global_step": 17462, "epoch": 415} {"train_loss": -5.207219123840332, "global_step": 17463, "epoch": 415} {"train_loss": -4.983242034912109, "global_step": 17464, "epoch": 415} {"train_loss": -5.147365570068359, "global_step": 17465, "epoch": 415} {"train_loss": -5.266166687011719, "global_step": 17466, "epoch": 415} {"train_loss": -5.075806617736816, "global_step": 17467, "epoch": 415} {"train_loss": -5.260663032531738, "global_step": 17468, "epoch": 415} {"train_loss": -5.310559272766113, "global_step": 17469, "epoch": 415} {"train_loss": -5.173617362976074, "global_step": 17470, "epoch": 415} {"train_loss": -5.20725891703651, "global_step": 17471, "epoch": 415, "val_loss": 70063.1953125} {"train_loss": -5.157060146331787, "global_step": 17472, "epoch": 416} {"train_loss": -5.323995590209961, "global_step": 17473, "epoch": 416} {"train_loss": -5.1823015213012695, "global_step": 17474, "epoch": 416} {"train_loss": -5.214768409729004, "global_step": 17475, "epoch": 416} {"train_loss": -5.111085891723633, "global_step": 17476, "epoch": 416} {"train_loss": -5.19956111907959, "global_step": 17477, "epoch": 416} {"train_loss": -5.30446195602417, "global_step": 17478, "epoch": 416} {"train_loss": -5.181580543518066, "global_step": 17479, "epoch": 416} {"train_loss": -5.401460647583008, "global_step": 17480, "epoch": 416} {"train_loss": -5.158016204833984, "global_step": 17481, "epoch": 416} {"train_loss": -5.253052234649658, "global_step": 17482, "epoch": 416} {"train_loss": -5.324740409851074, "global_step": 17483, "epoch": 416} {"train_loss": -5.324960708618164, "global_step": 17484, "epoch": 416} {"train_loss": -5.379026412963867, "global_step": 17485, "epoch": 416} {"train_loss": -5.194651126861572, "global_step": 17486, "epoch": 416} {"train_loss": -5.207270622253418, "global_step": 17487, "epoch": 416} {"train_loss": -5.181540489196777, "global_step": 17488, "epoch": 416} {"train_loss": -4.981778144836426, "global_step": 17489, "epoch": 416} {"train_loss": -5.283841133117676, "global_step": 17490, "epoch": 416} {"train_loss": -5.103606224060059, "global_step": 17491, "epoch": 416} {"train_loss": -5.162021160125732, "global_step": 17492, "epoch": 416} {"train_loss": -5.125008583068848, "global_step": 17493, "epoch": 416} {"train_loss": -5.299448013305664, "global_step": 17494, "epoch": 416} {"train_loss": -5.288227081298828, "global_step": 17495, "epoch": 416} {"train_loss": -5.201574325561523, "global_step": 17496, "epoch": 416} {"train_loss": -5.243862628936768, "global_step": 17497, "epoch": 416} {"train_loss": -5.313918590545654, "global_step": 17498, "epoch": 416} {"train_loss": -5.238340854644775, "global_step": 17499, "epoch": 416} {"train_loss": -5.276476860046387, "global_step": 17500, "epoch": 416} {"train_loss": -5.194929599761963, "global_step": 17501, "epoch": 416} {"train_loss": -5.260319232940674, "global_step": 17502, "epoch": 416} {"train_loss": -5.265529632568359, "global_step": 17503, "epoch": 416} {"train_loss": -5.31406307220459, "global_step": 17504, "epoch": 416} {"train_loss": -5.341131210327148, "global_step": 17505, "epoch": 416} {"train_loss": -5.32133674621582, "global_step": 17506, "epoch": 416} {"train_loss": -5.239288330078125, "global_step": 17507, "epoch": 416} {"train_loss": -5.2675933837890625, "global_step": 17508, "epoch": 416} {"train_loss": -5.23685359954834, "global_step": 17509, "epoch": 416} {"train_loss": -5.329193115234375, "global_step": 17510, "epoch": 416} {"train_loss": -5.335118293762207, "global_step": 17511, "epoch": 416} {"train_loss": -5.192837715148926, "global_step": 17512, "epoch": 416} {"train_loss": -5.239665076846168, "global_step": 17513, "epoch": 416, "val_loss": 68913.9453125} {"train_loss": -5.173345565795898, "global_step": 17514, "epoch": 417} {"train_loss": -5.094821453094482, "global_step": 17515, "epoch": 417} {"train_loss": -5.224606513977051, "global_step": 17516, "epoch": 417} {"train_loss": -5.399835586547852, "global_step": 17517, "epoch": 417} {"train_loss": -5.103039264678955, "global_step": 17518, "epoch": 417} {"train_loss": -5.178915500640869, "global_step": 17519, "epoch": 417} {"train_loss": -5.291192054748535, "global_step": 17520, "epoch": 417} {"train_loss": -5.221105575561523, "global_step": 17521, "epoch": 417} {"train_loss": -5.363303184509277, "global_step": 17522, "epoch": 417} {"train_loss": -5.268835544586182, "global_step": 17523, "epoch": 417} {"train_loss": -5.164064407348633, "global_step": 17524, "epoch": 417} {"train_loss": -5.258221626281738, "global_step": 17525, "epoch": 417} {"train_loss": -5.150324821472168, "global_step": 17526, "epoch": 417} {"train_loss": -5.101110458374023, "global_step": 17527, "epoch": 417} {"train_loss": -5.279375076293945, "global_step": 17528, "epoch": 417} {"train_loss": -5.210062026977539, "global_step": 17529, "epoch": 417} {"train_loss": -5.35076379776001, "global_step": 17530, "epoch": 417} {"train_loss": -5.13999080657959, "global_step": 17531, "epoch": 417} {"train_loss": -5.138232707977295, "global_step": 17532, "epoch": 417} {"train_loss": -5.234011650085449, "global_step": 17533, "epoch": 417} {"train_loss": -5.273932456970215, "global_step": 17534, "epoch": 417} {"train_loss": -5.158360481262207, "global_step": 17535, "epoch": 417} {"train_loss": -5.284726142883301, "global_step": 17536, "epoch": 417} {"train_loss": -5.40385627746582, "global_step": 17537, "epoch": 417} {"train_loss": -5.258742809295654, "global_step": 17538, "epoch": 417} {"train_loss": -5.021128177642822, "global_step": 17539, "epoch": 417} {"train_loss": -5.155956745147705, "global_step": 17540, "epoch": 417} {"train_loss": -5.284292221069336, "global_step": 17541, "epoch": 417} {"train_loss": -5.034523010253906, "global_step": 17542, "epoch": 417} {"train_loss": -4.965861797332764, "global_step": 17543, "epoch": 417} {"train_loss": -5.3969831466674805, "global_step": 17544, "epoch": 417} {"train_loss": -5.19624137878418, "global_step": 17545, "epoch": 417} {"train_loss": -5.218979358673096, "global_step": 17546, "epoch": 417} {"train_loss": -5.271085739135742, "global_step": 17547, "epoch": 417} {"train_loss": -5.232852935791016, "global_step": 17548, "epoch": 417} {"train_loss": -5.085391998291016, "global_step": 17549, "epoch": 417} {"train_loss": -5.2603960037231445, "global_step": 17550, "epoch": 417} {"train_loss": -5.25660514831543, "global_step": 17551, "epoch": 417} {"train_loss": -5.204102039337158, "global_step": 17552, "epoch": 417} {"train_loss": -5.1735429763793945, "global_step": 17553, "epoch": 417} {"train_loss": -5.072759628295898, "global_step": 17554, "epoch": 417} {"train_loss": -5.209492944535755, "global_step": 17555, "epoch": 417, "val_loss": 69230.5234375} {"train_loss": -5.222921848297119, "global_step": 17556, "epoch": 418} {"train_loss": -5.153858184814453, "global_step": 17557, "epoch": 418} {"train_loss": -5.404820919036865, "global_step": 17558, "epoch": 418} {"train_loss": -5.136643409729004, "global_step": 17559, "epoch": 418} {"train_loss": -5.246307849884033, "global_step": 17560, "epoch": 418} {"train_loss": -5.067795276641846, "global_step": 17561, "epoch": 418} {"train_loss": -5.191644668579102, "global_step": 17562, "epoch": 418} {"train_loss": -5.268157482147217, "global_step": 17563, "epoch": 418} {"train_loss": -5.1779351234436035, "global_step": 17564, "epoch": 418} {"train_loss": -5.278839111328125, "global_step": 17565, "epoch": 418} {"train_loss": -5.2233076095581055, "global_step": 17566, "epoch": 418} {"train_loss": -5.193425178527832, "global_step": 17567, "epoch": 418} {"train_loss": -5.199881553649902, "global_step": 17568, "epoch": 418} {"train_loss": -5.2415080070495605, "global_step": 17569, "epoch": 418} {"train_loss": -5.389349937438965, "global_step": 17570, "epoch": 418} {"train_loss": -5.269312858581543, "global_step": 17571, "epoch": 418} {"train_loss": -5.267195701599121, "global_step": 17572, "epoch": 418} {"train_loss": -5.282217979431152, "global_step": 17573, "epoch": 418} {"train_loss": -5.2368903160095215, "global_step": 17574, "epoch": 418} {"train_loss": -5.171252250671387, "global_step": 17575, "epoch": 418} {"train_loss": -5.38570499420166, "global_step": 17576, "epoch": 418} {"train_loss": -5.279665946960449, "global_step": 17577, "epoch": 418} {"train_loss": -5.32919979095459, "global_step": 17578, "epoch": 418} {"train_loss": -5.176785469055176, "global_step": 17579, "epoch": 418} {"train_loss": -5.211451053619385, "global_step": 17580, "epoch": 418} {"train_loss": -5.264682769775391, "global_step": 17581, "epoch": 418} {"train_loss": -5.122661113739014, "global_step": 17582, "epoch": 418} {"train_loss": -5.1944780349731445, "global_step": 17583, "epoch": 418} {"train_loss": -5.267622947692871, "global_step": 17584, "epoch": 418} {"train_loss": -5.309179782867432, "global_step": 17585, "epoch": 418} {"train_loss": -5.229599952697754, "global_step": 17586, "epoch": 418} {"train_loss": -5.244016647338867, "global_step": 17587, "epoch": 418} {"train_loss": -5.230948448181152, "global_step": 17588, "epoch": 418} {"train_loss": -5.112963676452637, "global_step": 17589, "epoch": 418} {"train_loss": -5.2755842208862305, "global_step": 17590, "epoch": 418} {"train_loss": -5.137666702270508, "global_step": 17591, "epoch": 418} {"train_loss": -5.314034938812256, "global_step": 17592, "epoch": 418} {"train_loss": -5.223552703857422, "global_step": 17593, "epoch": 418} {"train_loss": -5.29036808013916, "global_step": 17594, "epoch": 418} {"train_loss": -5.128055572509766, "global_step": 17595, "epoch": 418} {"train_loss": -5.263059139251709, "global_step": 17596, "epoch": 418} {"train_loss": -5.239083256040301, "global_step": 17597, "epoch": 418, "val_loss": 68754.8203125} {"train_loss": -5.246840476989746, "global_step": 17598, "epoch": 419} {"train_loss": -5.289222717285156, "global_step": 17599, "epoch": 419} {"train_loss": -5.25913667678833, "global_step": 17600, "epoch": 419} {"train_loss": -5.243812084197998, "global_step": 17601, "epoch": 419} {"train_loss": -5.278841018676758, "global_step": 17602, "epoch": 419} {"train_loss": -5.36375617980957, "global_step": 17603, "epoch": 419} {"train_loss": -5.245551109313965, "global_step": 17604, "epoch": 419} {"train_loss": -5.332937240600586, "global_step": 17605, "epoch": 419} {"train_loss": -5.3039045333862305, "global_step": 17606, "epoch": 419} {"train_loss": -5.245365619659424, "global_step": 17607, "epoch": 419} {"train_loss": -5.345272064208984, "global_step": 17608, "epoch": 419} {"train_loss": -5.291200637817383, "global_step": 17609, "epoch": 419} {"train_loss": -5.325129508972168, "global_step": 17610, "epoch": 419} {"train_loss": -5.309494495391846, "global_step": 17611, "epoch": 419} {"train_loss": -5.314637184143066, "global_step": 17612, "epoch": 419} {"train_loss": -5.2085490226745605, "global_step": 17613, "epoch": 419} {"train_loss": -5.263855934143066, "global_step": 17614, "epoch": 419} {"train_loss": -5.256325721740723, "global_step": 17615, "epoch": 419} {"train_loss": -5.321032524108887, "global_step": 17616, "epoch": 419} {"train_loss": -5.1567888259887695, "global_step": 17617, "epoch": 419} {"train_loss": -5.160224914550781, "global_step": 17618, "epoch": 419} {"train_loss": -5.311339378356934, "global_step": 17619, "epoch": 419} {"train_loss": -5.1486687660217285, "global_step": 17620, "epoch": 419} {"train_loss": -5.227304458618164, "global_step": 17621, "epoch": 419} {"train_loss": -5.194746494293213, "global_step": 17622, "epoch": 419} {"train_loss": -5.279565811157227, "global_step": 17623, "epoch": 419} {"train_loss": -5.295546531677246, "global_step": 17624, "epoch": 419} {"train_loss": -5.289041042327881, "global_step": 17625, "epoch": 419} {"train_loss": -5.252010345458984, "global_step": 17626, "epoch": 419} {"train_loss": -5.2084479331970215, "global_step": 17627, "epoch": 419} {"train_loss": -5.3567399978637695, "global_step": 17628, "epoch": 419} {"train_loss": -5.231179237365723, "global_step": 17629, "epoch": 419} {"train_loss": -5.166444778442383, "global_step": 17630, "epoch": 419} {"train_loss": -5.234641075134277, "global_step": 17631, "epoch": 419} {"train_loss": -5.327737808227539, "global_step": 17632, "epoch": 419} {"train_loss": -5.214587211608887, "global_step": 17633, "epoch": 419} {"train_loss": -5.288482666015625, "global_step": 17634, "epoch": 419} {"train_loss": -5.306178092956543, "global_step": 17635, "epoch": 419} {"train_loss": -5.277895927429199, "global_step": 17636, "epoch": 419} {"train_loss": -5.293361663818359, "global_step": 17637, "epoch": 419} {"train_loss": -5.18156623840332, "global_step": 17638, "epoch": 419} {"train_loss": -5.261377493540446, "global_step": 17639, "epoch": 419, "val_loss": 68355.4296875} {"train_loss": -5.184881687164307, "global_step": 17640, "epoch": 420} {"train_loss": -5.1075334548950195, "global_step": 17641, "epoch": 420} {"train_loss": -5.312906265258789, "global_step": 17642, "epoch": 420} {"train_loss": -5.2931108474731445, "global_step": 17643, "epoch": 420} {"train_loss": -5.27694034576416, "global_step": 17644, "epoch": 420} {"train_loss": -5.248515605926514, "global_step": 17645, "epoch": 420} {"train_loss": -5.278099060058594, "global_step": 17646, "epoch": 420} {"train_loss": -5.172694683074951, "global_step": 17647, "epoch": 420} {"train_loss": -5.184055328369141, "global_step": 17648, "epoch": 420} {"train_loss": -5.3527631759643555, "global_step": 17649, "epoch": 420} {"train_loss": -5.208787441253662, "global_step": 17650, "epoch": 420} {"train_loss": -5.2045674324035645, "global_step": 17651, "epoch": 420} {"train_loss": -5.167179584503174, "global_step": 17652, "epoch": 420} {"train_loss": -5.370726585388184, "global_step": 17653, "epoch": 420} {"train_loss": -5.158728122711182, "global_step": 17654, "epoch": 420} {"train_loss": -5.209920883178711, "global_step": 17655, "epoch": 420} {"train_loss": -5.314120292663574, "global_step": 17656, "epoch": 420} {"train_loss": -5.326175689697266, "global_step": 17657, "epoch": 420} {"train_loss": -5.10656213760376, "global_step": 17658, "epoch": 420} {"train_loss": -5.292713165283203, "global_step": 17659, "epoch": 420} {"train_loss": -5.284396648406982, "global_step": 17660, "epoch": 420} {"train_loss": -5.20335054397583, "global_step": 17661, "epoch": 420} {"train_loss": -5.23940372467041, "global_step": 17662, "epoch": 420} {"train_loss": -5.214204788208008, "global_step": 17663, "epoch": 420} {"train_loss": -5.275545597076416, "global_step": 17664, "epoch": 420} {"train_loss": -5.362349510192871, "global_step": 17665, "epoch": 420} {"train_loss": -5.219890594482422, "global_step": 17666, "epoch": 420} {"train_loss": -5.12422513961792, "global_step": 17667, "epoch": 420} {"train_loss": -5.261869430541992, "global_step": 17668, "epoch": 420} {"train_loss": -5.28973388671875, "global_step": 17669, "epoch": 420} {"train_loss": -5.324472904205322, "global_step": 17670, "epoch": 420} {"train_loss": -5.175717830657959, "global_step": 17671, "epoch": 420} {"train_loss": -5.305163383483887, "global_step": 17672, "epoch": 420} {"train_loss": -5.335570335388184, "global_step": 17673, "epoch": 420} {"train_loss": -5.204373359680176, "global_step": 17674, "epoch": 420} {"train_loss": -5.10247802734375, "global_step": 17675, "epoch": 420} {"train_loss": -5.321327209472656, "global_step": 17676, "epoch": 420} {"train_loss": -5.190058708190918, "global_step": 17677, "epoch": 420} {"train_loss": -5.081782341003418, "global_step": 17678, "epoch": 420} {"train_loss": -5.279941082000732, "global_step": 17679, "epoch": 420} {"train_loss": -5.346047878265381, "global_step": 17680, "epoch": 420} {"train_loss": -5.240281207220895, "global_step": 17681, "epoch": 420, "val_loss": 68744.984375} {"train_loss": -5.153633117675781, "global_step": 17682, "epoch": 421} {"train_loss": -5.165539741516113, "global_step": 17683, "epoch": 421} {"train_loss": -5.304818153381348, "global_step": 17684, "epoch": 421} {"train_loss": -5.166821002960205, "global_step": 17685, "epoch": 421} {"train_loss": -5.197799205780029, "global_step": 17686, "epoch": 421} {"train_loss": -5.206640243530273, "global_step": 17687, "epoch": 421} {"train_loss": -5.275629043579102, "global_step": 17688, "epoch": 421} {"train_loss": -5.327788352966309, "global_step": 17689, "epoch": 421} {"train_loss": -5.170989036560059, "global_step": 17690, "epoch": 421} {"train_loss": -5.414592742919922, "global_step": 17691, "epoch": 421} {"train_loss": -5.130467891693115, "global_step": 17692, "epoch": 421} {"train_loss": -5.329643249511719, "global_step": 17693, "epoch": 421} {"train_loss": -5.220294952392578, "global_step": 17694, "epoch": 421} {"train_loss": -5.159843444824219, "global_step": 17695, "epoch": 421} {"train_loss": -5.316778182983398, "global_step": 17696, "epoch": 421} {"train_loss": -5.290948867797852, "global_step": 17697, "epoch": 421} {"train_loss": -5.200987815856934, "global_step": 17698, "epoch": 421} {"train_loss": -5.311304569244385, "global_step": 17699, "epoch": 421} {"train_loss": -5.254983425140381, "global_step": 17700, "epoch": 421} {"train_loss": -5.157000541687012, "global_step": 17701, "epoch": 421} {"train_loss": -5.126009941101074, "global_step": 17702, "epoch": 421} {"train_loss": -5.147764682769775, "global_step": 17703, "epoch": 421} {"train_loss": -5.361965179443359, "global_step": 17704, "epoch": 421} {"train_loss": -5.09149169921875, "global_step": 17705, "epoch": 421} {"train_loss": -5.2376604080200195, "global_step": 17706, "epoch": 421} {"train_loss": -5.235518932342529, "global_step": 17707, "epoch": 421} {"train_loss": -5.229593753814697, "global_step": 17708, "epoch": 421} {"train_loss": -5.2189531326293945, "global_step": 17709, "epoch": 421} {"train_loss": -5.33054256439209, "global_step": 17710, "epoch": 421} {"train_loss": -5.13621711730957, "global_step": 17711, "epoch": 421} {"train_loss": -5.223552703857422, "global_step": 17712, "epoch": 421} {"train_loss": -5.296844005584717, "global_step": 17713, "epoch": 421} {"train_loss": -5.352694034576416, "global_step": 17714, "epoch": 421} {"train_loss": -5.071475028991699, "global_step": 17715, "epoch": 421} {"train_loss": -5.222677230834961, "global_step": 17716, "epoch": 421} {"train_loss": -5.288638591766357, "global_step": 17717, "epoch": 421} {"train_loss": -5.2336320877075195, "global_step": 17718, "epoch": 421} {"train_loss": -5.148114204406738, "global_step": 17719, "epoch": 421} {"train_loss": -5.480475425720215, "global_step": 17720, "epoch": 421} {"train_loss": -5.249816417694092, "global_step": 17721, "epoch": 421} {"train_loss": -5.227396488189697, "global_step": 17722, "epoch": 421} {"train_loss": -5.234232459749494, "global_step": 17723, "epoch": 421, "val_loss": 68765.5078125} {"train_loss": -5.219645977020264, "global_step": 17724, "epoch": 422} {"train_loss": -5.093574523925781, "global_step": 17725, "epoch": 422} {"train_loss": -5.281391143798828, "global_step": 17726, "epoch": 422} {"train_loss": -5.2382731437683105, "global_step": 17727, "epoch": 422} {"train_loss": -5.1016459465026855, "global_step": 17728, "epoch": 422} {"train_loss": -5.1860456466674805, "global_step": 17729, "epoch": 422} {"train_loss": -5.2015180587768555, "global_step": 17730, "epoch": 422} {"train_loss": -5.0314106941223145, "global_step": 17731, "epoch": 422} {"train_loss": -5.2791547775268555, "global_step": 17732, "epoch": 422} {"train_loss": -5.092418670654297, "global_step": 17733, "epoch": 422} {"train_loss": -5.2563042640686035, "global_step": 17734, "epoch": 422} {"train_loss": -5.2325544357299805, "global_step": 17735, "epoch": 422} {"train_loss": -5.271590232849121, "global_step": 17736, "epoch": 422} {"train_loss": -5.284133434295654, "global_step": 17737, "epoch": 422} {"train_loss": -5.431605339050293, "global_step": 17738, "epoch": 422} {"train_loss": -5.315243721008301, "global_step": 17739, "epoch": 422} {"train_loss": -5.2227783203125, "global_step": 17740, "epoch": 422} {"train_loss": -5.180166244506836, "global_step": 17741, "epoch": 422} {"train_loss": -5.120298385620117, "global_step": 17742, "epoch": 422} {"train_loss": -5.135436058044434, "global_step": 17743, "epoch": 422} {"train_loss": -5.218963623046875, "global_step": 17744, "epoch": 422} {"train_loss": -5.28171968460083, "global_step": 17745, "epoch": 422} {"train_loss": -5.257147312164307, "global_step": 17746, "epoch": 422} {"train_loss": -5.234396934509277, "global_step": 17747, "epoch": 422} {"train_loss": -5.222063064575195, "global_step": 17748, "epoch": 422} {"train_loss": -5.277763843536377, "global_step": 17749, "epoch": 422} {"train_loss": -5.1173095703125, "global_step": 17750, "epoch": 422} {"train_loss": -5.052371501922607, "global_step": 17751, "epoch": 422} {"train_loss": -5.291573524475098, "global_step": 17752, "epoch": 422} {"train_loss": -5.0401434898376465, "global_step": 17753, "epoch": 422} {"train_loss": -5.155372142791748, "global_step": 17754, "epoch": 422} {"train_loss": -5.189915657043457, "global_step": 17755, "epoch": 422} {"train_loss": -5.091800212860107, "global_step": 17756, "epoch": 422} {"train_loss": -5.186984062194824, "global_step": 17757, "epoch": 422} {"train_loss": -5.233086585998535, "global_step": 17758, "epoch": 422} {"train_loss": -5.075572967529297, "global_step": 17759, "epoch": 422} {"train_loss": -5.240790367126465, "global_step": 17760, "epoch": 422} {"train_loss": -5.145946025848389, "global_step": 17761, "epoch": 422} {"train_loss": -5.131459712982178, "global_step": 17762, "epoch": 422} {"train_loss": -5.268580913543701, "global_step": 17763, "epoch": 422} {"train_loss": -5.074709892272949, "global_step": 17764, "epoch": 422} {"train_loss": -5.196761494591122, "global_step": 17765, "epoch": 422, "val_loss": 69708.28125} {"train_loss": -5.098796367645264, "global_step": 17766, "epoch": 423} {"train_loss": -5.200948238372803, "global_step": 17767, "epoch": 423} {"train_loss": -5.279245376586914, "global_step": 17768, "epoch": 423} {"train_loss": -5.03392219543457, "global_step": 17769, "epoch": 423} {"train_loss": -5.285557270050049, "global_step": 17770, "epoch": 423} {"train_loss": -4.991781711578369, "global_step": 17771, "epoch": 423} {"train_loss": -5.203086853027344, "global_step": 17772, "epoch": 423} {"train_loss": -5.201696395874023, "global_step": 17773, "epoch": 423} {"train_loss": -5.281407356262207, "global_step": 17774, "epoch": 423} {"train_loss": -5.12238883972168, "global_step": 17775, "epoch": 423} {"train_loss": -5.278406143188477, "global_step": 17776, "epoch": 423} {"train_loss": -5.204285621643066, "global_step": 17777, "epoch": 423} {"train_loss": -5.317809104919434, "global_step": 17778, "epoch": 423} {"train_loss": -5.279460430145264, "global_step": 17779, "epoch": 423} {"train_loss": -5.271212577819824, "global_step": 17780, "epoch": 423} {"train_loss": -5.169593334197998, "global_step": 17781, "epoch": 423} {"train_loss": -5.435766220092773, "global_step": 17782, "epoch": 423} {"train_loss": -5.279706001281738, "global_step": 17783, "epoch": 423} {"train_loss": -5.224571228027344, "global_step": 17784, "epoch": 423} {"train_loss": -5.371421813964844, "global_step": 17785, "epoch": 423} {"train_loss": -5.2956953048706055, "global_step": 17786, "epoch": 423} {"train_loss": -5.18511962890625, "global_step": 17787, "epoch": 423} {"train_loss": -5.410527229309082, "global_step": 17788, "epoch": 423} {"train_loss": -5.183651924133301, "global_step": 17789, "epoch": 423} {"train_loss": -5.373088836669922, "global_step": 17790, "epoch": 423} {"train_loss": -5.109685897827148, "global_step": 17791, "epoch": 423} {"train_loss": -5.183486461639404, "global_step": 17792, "epoch": 423} {"train_loss": -5.288161277770996, "global_step": 17793, "epoch": 423} {"train_loss": -5.21944522857666, "global_step": 17794, "epoch": 423} {"train_loss": -5.232853889465332, "global_step": 17795, "epoch": 423} {"train_loss": -5.172134876251221, "global_step": 17796, "epoch": 423} {"train_loss": -5.362522602081299, "global_step": 17797, "epoch": 423} {"train_loss": -5.28526496887207, "global_step": 17798, "epoch": 423} {"train_loss": -5.15797233581543, "global_step": 17799, "epoch": 423} {"train_loss": -5.174975395202637, "global_step": 17800, "epoch": 423} {"train_loss": -5.202659606933594, "global_step": 17801, "epoch": 423} {"train_loss": -5.238253593444824, "global_step": 17802, "epoch": 423} {"train_loss": -5.142792701721191, "global_step": 17803, "epoch": 423} {"train_loss": -5.189817428588867, "global_step": 17804, "epoch": 423} {"train_loss": -5.285152435302734, "global_step": 17805, "epoch": 423} {"train_loss": -5.2629499435424805, "global_step": 17806, "epoch": 423} {"train_loss": -5.232653799511137, "global_step": 17807, "epoch": 423, "val_loss": 68955.9375} {"train_loss": -5.216496467590332, "global_step": 17808, "epoch": 424} {"train_loss": -5.340200424194336, "global_step": 17809, "epoch": 424} {"train_loss": -5.315184593200684, "global_step": 17810, "epoch": 424} {"train_loss": -5.276802062988281, "global_step": 17811, "epoch": 424} {"train_loss": -5.4135870933532715, "global_step": 17812, "epoch": 424} {"train_loss": -5.211793422698975, "global_step": 17813, "epoch": 424} {"train_loss": -5.335652828216553, "global_step": 17814, "epoch": 424} {"train_loss": -5.249260425567627, "global_step": 17815, "epoch": 424} {"train_loss": -5.247344970703125, "global_step": 17816, "epoch": 424} {"train_loss": -5.3845014572143555, "global_step": 17817, "epoch": 424} {"train_loss": -5.238323211669922, "global_step": 17818, "epoch": 424} {"train_loss": -5.212814807891846, "global_step": 17819, "epoch": 424} {"train_loss": -5.391690254211426, "global_step": 17820, "epoch": 424} {"train_loss": -5.373390197753906, "global_step": 17821, "epoch": 424} {"train_loss": -5.2555413246154785, "global_step": 17822, "epoch": 424} {"train_loss": -5.346285820007324, "global_step": 17823, "epoch": 424} {"train_loss": -5.317307472229004, "global_step": 17824, "epoch": 424} {"train_loss": -5.224972724914551, "global_step": 17825, "epoch": 424} {"train_loss": -5.253867149353027, "global_step": 17826, "epoch": 424} {"train_loss": -5.339639186859131, "global_step": 17827, "epoch": 424} {"train_loss": -5.132641792297363, "global_step": 17828, "epoch": 424} {"train_loss": -5.289864540100098, "global_step": 17829, "epoch": 424} {"train_loss": -5.20729923248291, "global_step": 17830, "epoch": 424} {"train_loss": -5.211726188659668, "global_step": 17831, "epoch": 424} {"train_loss": -5.027393341064453, "global_step": 17832, "epoch": 424} {"train_loss": -5.1891889572143555, "global_step": 17833, "epoch": 424} {"train_loss": -5.210197448730469, "global_step": 17834, "epoch": 424} {"train_loss": -5.185260772705078, "global_step": 17835, "epoch": 424} {"train_loss": -5.144103050231934, "global_step": 17836, "epoch": 424} {"train_loss": -5.255771636962891, "global_step": 17837, "epoch": 424} {"train_loss": -5.2100629806518555, "global_step": 17838, "epoch": 424} {"train_loss": -5.229494094848633, "global_step": 17839, "epoch": 424} {"train_loss": -5.2120208740234375, "global_step": 17840, "epoch": 424} {"train_loss": -5.261101722717285, "global_step": 17841, "epoch": 424} {"train_loss": -5.221710681915283, "global_step": 17842, "epoch": 424} {"train_loss": -5.237362861633301, "global_step": 17843, "epoch": 424} {"train_loss": -5.263637542724609, "global_step": 17844, "epoch": 424} {"train_loss": -5.136725425720215, "global_step": 17845, "epoch": 424} {"train_loss": -5.372933387756348, "global_step": 17846, "epoch": 424} {"train_loss": -5.384282112121582, "global_step": 17847, "epoch": 424} {"train_loss": -5.26690673828125, "global_step": 17848, "epoch": 424} {"train_loss": -5.25322083064488, "global_step": 17849, "epoch": 424, "val_loss": 68398.3203125} {"train_loss": -5.356313705444336, "global_step": 17850, "epoch": 425} {"train_loss": -5.059678077697754, "global_step": 17851, "epoch": 425} {"train_loss": -5.15940523147583, "global_step": 17852, "epoch": 425} {"train_loss": -5.25267219543457, "global_step": 17853, "epoch": 425} {"train_loss": -5.237006187438965, "global_step": 17854, "epoch": 425} {"train_loss": -5.188806533813477, "global_step": 17855, "epoch": 425} {"train_loss": -5.098410606384277, "global_step": 17856, "epoch": 425} {"train_loss": -5.208399295806885, "global_step": 17857, "epoch": 425} {"train_loss": -5.306772232055664, "global_step": 17858, "epoch": 425} {"train_loss": -5.1615800857543945, "global_step": 17859, "epoch": 425} {"train_loss": -5.324952125549316, "global_step": 17860, "epoch": 425} {"train_loss": -5.277507305145264, "global_step": 17861, "epoch": 425} {"train_loss": -5.127697944641113, "global_step": 17862, "epoch": 425} {"train_loss": -5.168474197387695, "global_step": 17863, "epoch": 425} {"train_loss": -5.086239814758301, "global_step": 17864, "epoch": 425} {"train_loss": -5.204432010650635, "global_step": 17865, "epoch": 425} {"train_loss": -5.3292741775512695, "global_step": 17866, "epoch": 425} {"train_loss": -5.250937461853027, "global_step": 17867, "epoch": 425} {"train_loss": -5.176335334777832, "global_step": 17868, "epoch": 425} {"train_loss": -5.220206260681152, "global_step": 17869, "epoch": 425} {"train_loss": -5.121021270751953, "global_step": 17870, "epoch": 425} {"train_loss": -5.200493812561035, "global_step": 17871, "epoch": 425} {"train_loss": -5.3038859367370605, "global_step": 17872, "epoch": 425} {"train_loss": -5.298951148986816, "global_step": 17873, "epoch": 425} {"train_loss": -5.355654716491699, "global_step": 17874, "epoch": 425} {"train_loss": -5.2801618576049805, "global_step": 17875, "epoch": 425} {"train_loss": -5.323352813720703, "global_step": 17876, "epoch": 425} {"train_loss": -5.250713348388672, "global_step": 17877, "epoch": 425} {"train_loss": -5.171560287475586, "global_step": 17878, "epoch": 425} {"train_loss": -5.302277565002441, "global_step": 17879, "epoch": 425} {"train_loss": -5.227995872497559, "global_step": 17880, "epoch": 425} {"train_loss": -5.340609550476074, "global_step": 17881, "epoch": 425} {"train_loss": -5.172425270080566, "global_step": 17882, "epoch": 425} {"train_loss": -5.337114334106445, "global_step": 17883, "epoch": 425} {"train_loss": -5.277224540710449, "global_step": 17884, "epoch": 425} {"train_loss": -5.29161262512207, "global_step": 17885, "epoch": 425} {"train_loss": -5.114833354949951, "global_step": 17886, "epoch": 425} {"train_loss": -5.372346878051758, "global_step": 17887, "epoch": 425} {"train_loss": -5.146751403808594, "global_step": 17888, "epoch": 425} {"train_loss": -5.510622501373291, "global_step": 17889, "epoch": 425} {"train_loss": -5.387042999267578, "global_step": 17890, "epoch": 425} {"train_loss": -5.241738784880865, "global_step": 17891, "epoch": 425, "val_loss": 68639.0625} {"train_loss": -5.142946243286133, "global_step": 17892, "epoch": 426} {"train_loss": -5.332319259643555, "global_step": 17893, "epoch": 426} {"train_loss": -5.182708740234375, "global_step": 17894, "epoch": 426} {"train_loss": -5.448441028594971, "global_step": 17895, "epoch": 426} {"train_loss": -5.1026811599731445, "global_step": 17896, "epoch": 426} {"train_loss": -5.17521333694458, "global_step": 17897, "epoch": 426} {"train_loss": -5.335171699523926, "global_step": 17898, "epoch": 426} {"train_loss": -5.1247100830078125, "global_step": 17899, "epoch": 426} {"train_loss": -5.042463779449463, "global_step": 17900, "epoch": 426} {"train_loss": -5.220466613769531, "global_step": 17901, "epoch": 426} {"train_loss": -5.07728385925293, "global_step": 17902, "epoch": 426} {"train_loss": -5.30049467086792, "global_step": 17903, "epoch": 426} {"train_loss": -5.178873062133789, "global_step": 17904, "epoch": 426} {"train_loss": -5.188889980316162, "global_step": 17905, "epoch": 426} {"train_loss": -5.192261695861816, "global_step": 17906, "epoch": 426} {"train_loss": -5.264740943908691, "global_step": 17907, "epoch": 426} {"train_loss": -5.314931392669678, "global_step": 17908, "epoch": 426} {"train_loss": -5.321590423583984, "global_step": 17909, "epoch": 426} {"train_loss": -5.212857246398926, "global_step": 17910, "epoch": 426} {"train_loss": -5.311222553253174, "global_step": 17911, "epoch": 426} {"train_loss": -5.240050792694092, "global_step": 17912, "epoch": 426} {"train_loss": -5.251397132873535, "global_step": 17913, "epoch": 426} {"train_loss": -5.260765552520752, "global_step": 17914, "epoch": 426} {"train_loss": -5.18208122253418, "global_step": 17915, "epoch": 426} {"train_loss": -5.313112258911133, "global_step": 17916, "epoch": 426} {"train_loss": -5.191939353942871, "global_step": 17917, "epoch": 426} {"train_loss": -5.299609184265137, "global_step": 17918, "epoch": 426} {"train_loss": -5.162297248840332, "global_step": 17919, "epoch": 426} {"train_loss": -5.243322372436523, "global_step": 17920, "epoch": 426} {"train_loss": -5.2125115394592285, "global_step": 17921, "epoch": 426} {"train_loss": -5.374919891357422, "global_step": 17922, "epoch": 426} {"train_loss": -5.362714767456055, "global_step": 17923, "epoch": 426} {"train_loss": -5.294066905975342, "global_step": 17924, "epoch": 426} {"train_loss": -5.250009536743164, "global_step": 17925, "epoch": 426} {"train_loss": -5.126330375671387, "global_step": 17926, "epoch": 426} {"train_loss": -5.314836502075195, "global_step": 17927, "epoch": 426} {"train_loss": -5.368361473083496, "global_step": 17928, "epoch": 426} {"train_loss": -5.31797981262207, "global_step": 17929, "epoch": 426} {"train_loss": -5.338388442993164, "global_step": 17930, "epoch": 426} {"train_loss": -5.295577526092529, "global_step": 17931, "epoch": 426} {"train_loss": -5.338388919830322, "global_step": 17932, "epoch": 426} {"train_loss": -5.247106154759725, "global_step": 17933, "epoch": 426, "val_loss": 68948.5234375} {"train_loss": -5.22592830657959, "global_step": 17934, "epoch": 427} {"train_loss": -5.375052452087402, "global_step": 17935, "epoch": 427} {"train_loss": -5.215584754943848, "global_step": 17936, "epoch": 427} {"train_loss": -5.143845558166504, "global_step": 17937, "epoch": 427} {"train_loss": -5.348372459411621, "global_step": 17938, "epoch": 427} {"train_loss": -5.330100059509277, "global_step": 17939, "epoch": 427} {"train_loss": -5.269941329956055, "global_step": 17940, "epoch": 427} {"train_loss": -5.324093818664551, "global_step": 17941, "epoch": 427} {"train_loss": -5.331757545471191, "global_step": 17942, "epoch": 427} {"train_loss": -5.2300286293029785, "global_step": 17943, "epoch": 427} {"train_loss": -5.111264228820801, "global_step": 17944, "epoch": 427} {"train_loss": -5.352023124694824, "global_step": 17945, "epoch": 427} {"train_loss": -5.032461166381836, "global_step": 17946, "epoch": 427} {"train_loss": -5.250605583190918, "global_step": 17947, "epoch": 427} {"train_loss": -5.23883056640625, "global_step": 17948, "epoch": 427} {"train_loss": -5.240694999694824, "global_step": 17949, "epoch": 427} {"train_loss": -5.15012264251709, "global_step": 17950, "epoch": 427} {"train_loss": -5.227940082550049, "global_step": 17951, "epoch": 427} {"train_loss": -5.252898216247559, "global_step": 17952, "epoch": 427} {"train_loss": -5.318882942199707, "global_step": 17953, "epoch": 427} {"train_loss": -5.185067653656006, "global_step": 17954, "epoch": 427} {"train_loss": -5.202825546264648, "global_step": 17955, "epoch": 427} {"train_loss": -5.161541938781738, "global_step": 17956, "epoch": 427} {"train_loss": -5.238862037658691, "global_step": 17957, "epoch": 427} {"train_loss": -5.2009711265563965, "global_step": 17958, "epoch": 427} {"train_loss": -5.130465984344482, "global_step": 17959, "epoch": 427} {"train_loss": -5.369162082672119, "global_step": 17960, "epoch": 427} {"train_loss": -5.2398576736450195, "global_step": 17961, "epoch": 427} {"train_loss": -5.200770854949951, "global_step": 17962, "epoch": 427} {"train_loss": -5.233602523803711, "global_step": 17963, "epoch": 427} {"train_loss": -5.2100934982299805, "global_step": 17964, "epoch": 427} {"train_loss": -5.291954517364502, "global_step": 17965, "epoch": 427} {"train_loss": -5.283577919006348, "global_step": 17966, "epoch": 427} {"train_loss": -5.233379364013672, "global_step": 17967, "epoch": 427} {"train_loss": -5.321150302886963, "global_step": 17968, "epoch": 427} {"train_loss": -5.206724643707275, "global_step": 17969, "epoch": 427} {"train_loss": -5.076594352722168, "global_step": 17970, "epoch": 427} {"train_loss": -5.341381549835205, "global_step": 17971, "epoch": 427} {"train_loss": -5.27775764465332, "global_step": 17972, "epoch": 427} {"train_loss": -5.197976112365723, "global_step": 17973, "epoch": 427} {"train_loss": -5.098884582519531, "global_step": 17974, "epoch": 427} {"train_loss": -5.232967331295922, "global_step": 17975, "epoch": 427, "val_loss": 68446.9375} {"train_loss": -5.40664005279541, "global_step": 17976, "epoch": 428} {"train_loss": -4.924463748931885, "global_step": 17977, "epoch": 428} {"train_loss": -5.180397987365723, "global_step": 17978, "epoch": 428} {"train_loss": -5.037018299102783, "global_step": 17979, "epoch": 428} {"train_loss": -4.997959136962891, "global_step": 17980, "epoch": 428} {"train_loss": -5.2666778564453125, "global_step": 17981, "epoch": 428} {"train_loss": -4.928864479064941, "global_step": 17982, "epoch": 428} {"train_loss": -5.162330627441406, "global_step": 17983, "epoch": 428} {"train_loss": -5.175164699554443, "global_step": 17984, "epoch": 428} {"train_loss": -5.20137882232666, "global_step": 17985, "epoch": 428} {"train_loss": -5.12577486038208, "global_step": 17986, "epoch": 428} {"train_loss": -5.098993301391602, "global_step": 17987, "epoch": 428} {"train_loss": -5.319331645965576, "global_step": 17988, "epoch": 428} {"train_loss": -5.171852111816406, "global_step": 17989, "epoch": 428} {"train_loss": -5.289604187011719, "global_step": 17990, "epoch": 428} {"train_loss": -5.2075605392456055, "global_step": 17991, "epoch": 428} {"train_loss": -5.318554878234863, "global_step": 17992, "epoch": 428} {"train_loss": -5.079866886138916, "global_step": 17993, "epoch": 428} {"train_loss": -5.243649482727051, "global_step": 17994, "epoch": 428} {"train_loss": -5.314065933227539, "global_step": 17995, "epoch": 428} {"train_loss": -5.267959117889404, "global_step": 17996, "epoch": 428} {"train_loss": -5.290496349334717, "global_step": 17997, "epoch": 428} {"train_loss": -5.15703010559082, "global_step": 17998, "epoch": 428} {"train_loss": -5.195023059844971, "global_step": 17999, "epoch": 428} {"train_loss": -5.187746047973633, "global_step": 18000, "epoch": 428} {"train_loss": -5.158055305480957, "global_step": 18001, "epoch": 428} {"train_loss": -5.152830123901367, "global_step": 18002, "epoch": 428} {"train_loss": -5.268047332763672, "global_step": 18003, "epoch": 428} {"train_loss": -5.1600213050842285, "global_step": 18004, "epoch": 428} {"train_loss": -5.254158973693848, "global_step": 18005, "epoch": 428} {"train_loss": -5.227431297302246, "global_step": 18006, "epoch": 428} {"train_loss": -5.130128860473633, "global_step": 18007, "epoch": 428} {"train_loss": -5.250857830047607, "global_step": 18008, "epoch": 428} {"train_loss": -5.2207932472229, "global_step": 18009, "epoch": 428} {"train_loss": -5.211002349853516, "global_step": 18010, "epoch": 428} {"train_loss": -5.444489479064941, "global_step": 18011, "epoch": 428} {"train_loss": -5.298885345458984, "global_step": 18012, "epoch": 428} {"train_loss": -5.258625030517578, "global_step": 18013, "epoch": 428} {"train_loss": -5.290335655212402, "global_step": 18014, "epoch": 428} {"train_loss": -5.358534336090088, "global_step": 18015, "epoch": 428} {"train_loss": -5.265336990356445, "global_step": 18016, "epoch": 428} {"train_loss": -5.209129901159377, "global_step": 18017, "epoch": 428, "val_loss": 68980.1484375} {"train_loss": -5.180127143859863, "global_step": 18018, "epoch": 429} {"train_loss": -5.244109153747559, "global_step": 18019, "epoch": 429} {"train_loss": -5.3525776863098145, "global_step": 18020, "epoch": 429} {"train_loss": -5.152164459228516, "global_step": 18021, "epoch": 429} {"train_loss": -5.261016845703125, "global_step": 18022, "epoch": 429} {"train_loss": -5.351679801940918, "global_step": 18023, "epoch": 429} {"train_loss": -5.255359649658203, "global_step": 18024, "epoch": 429} {"train_loss": -5.254002571105957, "global_step": 18025, "epoch": 429} {"train_loss": -5.288028717041016, "global_step": 18026, "epoch": 429} {"train_loss": -5.146052837371826, "global_step": 18027, "epoch": 429} {"train_loss": -5.286015510559082, "global_step": 18028, "epoch": 429} {"train_loss": -5.15472412109375, "global_step": 18029, "epoch": 429} {"train_loss": -5.317022800445557, "global_step": 18030, "epoch": 429} {"train_loss": -5.417960166931152, "global_step": 18031, "epoch": 429} {"train_loss": -5.2308149337768555, "global_step": 18032, "epoch": 429} {"train_loss": -5.176348686218262, "global_step": 18033, "epoch": 429} {"train_loss": -5.356849193572998, "global_step": 18034, "epoch": 429} {"train_loss": -5.317337512969971, "global_step": 18035, "epoch": 429} {"train_loss": -5.2214460372924805, "global_step": 18036, "epoch": 429} {"train_loss": -5.354147434234619, "global_step": 18037, "epoch": 429} {"train_loss": -5.342555999755859, "global_step": 18038, "epoch": 429} {"train_loss": -5.301662445068359, "global_step": 18039, "epoch": 429} {"train_loss": -5.257514476776123, "global_step": 18040, "epoch": 429} {"train_loss": -5.3911824226379395, "global_step": 18041, "epoch": 429} {"train_loss": -5.222075939178467, "global_step": 18042, "epoch": 429} {"train_loss": -5.360739707946777, "global_step": 18043, "epoch": 429} {"train_loss": -5.310977458953857, "global_step": 18044, "epoch": 429} {"train_loss": -5.1735334396362305, "global_step": 18045, "epoch": 429} {"train_loss": -5.2785468101501465, "global_step": 18046, "epoch": 429} {"train_loss": -5.231700897216797, "global_step": 18047, "epoch": 429} {"train_loss": -5.224178314208984, "global_step": 18048, "epoch": 429} {"train_loss": -5.292693138122559, "global_step": 18049, "epoch": 429} {"train_loss": -5.251896858215332, "global_step": 18050, "epoch": 429} {"train_loss": -5.189263343811035, "global_step": 18051, "epoch": 429} {"train_loss": -5.297505855560303, "global_step": 18052, "epoch": 429} {"train_loss": -5.2342329025268555, "global_step": 18053, "epoch": 429} {"train_loss": -5.229726791381836, "global_step": 18054, "epoch": 429} {"train_loss": -5.327239036560059, "global_step": 18055, "epoch": 429} {"train_loss": -5.334322929382324, "global_step": 18056, "epoch": 429} {"train_loss": -5.35471773147583, "global_step": 18057, "epoch": 429} {"train_loss": -5.310825347900391, "global_step": 18058, "epoch": 429} {"train_loss": -5.272989443370274, "global_step": 18059, "epoch": 429, "val_loss": 68784.1640625} {"train_loss": -5.27482795715332, "global_step": 18060, "epoch": 430} {"train_loss": -5.242611885070801, "global_step": 18061, "epoch": 430} {"train_loss": -5.234935283660889, "global_step": 18062, "epoch": 430} {"train_loss": -5.247551441192627, "global_step": 18063, "epoch": 430} {"train_loss": -5.311873435974121, "global_step": 18064, "epoch": 430} {"train_loss": -5.1983642578125, "global_step": 18065, "epoch": 430} {"train_loss": -5.262856483459473, "global_step": 18066, "epoch": 430} {"train_loss": -5.353021144866943, "global_step": 18067, "epoch": 430} {"train_loss": -5.341170787811279, "global_step": 18068, "epoch": 430} {"train_loss": -5.349438667297363, "global_step": 18069, "epoch": 430} {"train_loss": -5.426374912261963, "global_step": 18070, "epoch": 430} {"train_loss": -5.317990779876709, "global_step": 18071, "epoch": 430} {"train_loss": -5.247702598571777, "global_step": 18072, "epoch": 430} {"train_loss": -5.131248474121094, "global_step": 18073, "epoch": 430} {"train_loss": -5.188892364501953, "global_step": 18074, "epoch": 430} {"train_loss": -5.280630111694336, "global_step": 18075, "epoch": 430} {"train_loss": -5.181656837463379, "global_step": 18076, "epoch": 430} {"train_loss": -5.247829914093018, "global_step": 18077, "epoch": 430} {"train_loss": -5.149603366851807, "global_step": 18078, "epoch": 430} {"train_loss": -5.212009429931641, "global_step": 18079, "epoch": 430} {"train_loss": -5.253671169281006, "global_step": 18080, "epoch": 430} {"train_loss": -4.99600887298584, "global_step": 18081, "epoch": 430} {"train_loss": -5.140627384185791, "global_step": 18082, "epoch": 430} {"train_loss": -5.114359378814697, "global_step": 18083, "epoch": 430} {"train_loss": -5.042093276977539, "global_step": 18084, "epoch": 430} {"train_loss": -5.300440788269043, "global_step": 18085, "epoch": 430} {"train_loss": -5.079106330871582, "global_step": 18086, "epoch": 430} {"train_loss": -5.269142150878906, "global_step": 18087, "epoch": 430} {"train_loss": -5.143819332122803, "global_step": 18088, "epoch": 430} {"train_loss": -5.2703046798706055, "global_step": 18089, "epoch": 430} {"train_loss": -5.224915504455566, "global_step": 18090, "epoch": 430} {"train_loss": -5.209177494049072, "global_step": 18091, "epoch": 430} {"train_loss": -5.182886123657227, "global_step": 18092, "epoch": 430} {"train_loss": -5.302055358886719, "global_step": 18093, "epoch": 430} {"train_loss": -5.1979899406433105, "global_step": 18094, "epoch": 430} {"train_loss": -5.301602363586426, "global_step": 18095, "epoch": 430} {"train_loss": -5.1858906745910645, "global_step": 18096, "epoch": 430} {"train_loss": -5.2955498695373535, "global_step": 18097, "epoch": 430} {"train_loss": -5.233963489532471, "global_step": 18098, "epoch": 430} {"train_loss": -5.247225761413574, "global_step": 18099, "epoch": 430} {"train_loss": -5.319766998291016, "global_step": 18100, "epoch": 430} {"train_loss": -5.2301164127531505, "global_step": 18101, "epoch": 430, "val_loss": 68738.71875} {"train_loss": -5.280713081359863, "global_step": 18102, "epoch": 431} {"train_loss": -5.322443962097168, "global_step": 18103, "epoch": 431} {"train_loss": -5.085422515869141, "global_step": 18104, "epoch": 431} {"train_loss": -5.251345634460449, "global_step": 18105, "epoch": 431} {"train_loss": -5.167051315307617, "global_step": 18106, "epoch": 431} {"train_loss": -5.2263689041137695, "global_step": 18107, "epoch": 431} {"train_loss": -5.285002708435059, "global_step": 18108, "epoch": 431} {"train_loss": -5.466255187988281, "global_step": 18109, "epoch": 431} {"train_loss": -5.285304546356201, "global_step": 18110, "epoch": 431} {"train_loss": -5.2075910568237305, "global_step": 18111, "epoch": 431} {"train_loss": -5.333417892456055, "global_step": 18112, "epoch": 431} {"train_loss": -5.284041404724121, "global_step": 18113, "epoch": 431} {"train_loss": -5.285251617431641, "global_step": 18114, "epoch": 431} {"train_loss": -5.229942321777344, "global_step": 18115, "epoch": 431} {"train_loss": -5.259028911590576, "global_step": 18116, "epoch": 431} {"train_loss": -5.225039005279541, "global_step": 18117, "epoch": 431} {"train_loss": -5.174166679382324, "global_step": 18118, "epoch": 431} {"train_loss": -5.5232696533203125, "global_step": 18119, "epoch": 431} {"train_loss": -5.242345333099365, "global_step": 18120, "epoch": 431} {"train_loss": -5.190494537353516, "global_step": 18121, "epoch": 431} {"train_loss": -5.38795280456543, "global_step": 18122, "epoch": 431} {"train_loss": -5.140969753265381, "global_step": 18123, "epoch": 431} {"train_loss": -5.308114528656006, "global_step": 18124, "epoch": 431} {"train_loss": -5.337241172790527, "global_step": 18125, "epoch": 431} {"train_loss": -5.3799943923950195, "global_step": 18126, "epoch": 431} {"train_loss": -5.30178165435791, "global_step": 18127, "epoch": 431} {"train_loss": -5.119697570800781, "global_step": 18128, "epoch": 431} {"train_loss": -5.2778167724609375, "global_step": 18129, "epoch": 431} {"train_loss": -5.311902046203613, "global_step": 18130, "epoch": 431} {"train_loss": -5.170235633850098, "global_step": 18131, "epoch": 431} {"train_loss": -5.2888994216918945, "global_step": 18132, "epoch": 431} {"train_loss": -5.205423831939697, "global_step": 18133, "epoch": 431} {"train_loss": -5.437908172607422, "global_step": 18134, "epoch": 431} {"train_loss": -5.233919143676758, "global_step": 18135, "epoch": 431} {"train_loss": -5.25786018371582, "global_step": 18136, "epoch": 431} {"train_loss": -5.362333297729492, "global_step": 18137, "epoch": 431} {"train_loss": -5.139519214630127, "global_step": 18138, "epoch": 431} {"train_loss": -5.105856895446777, "global_step": 18139, "epoch": 431} {"train_loss": -5.421611785888672, "global_step": 18140, "epoch": 431} {"train_loss": -5.2974138259887695, "global_step": 18141, "epoch": 431} {"train_loss": -5.266197681427002, "global_step": 18142, "epoch": 431} {"train_loss": -5.270221835091, "global_step": 18143, "epoch": 431, "val_loss": 68304.5078125} {"train_loss": -5.178233623504639, "global_step": 18144, "epoch": 432} {"train_loss": -5.0842461585998535, "global_step": 18145, "epoch": 432} {"train_loss": -5.271903991699219, "global_step": 18146, "epoch": 432} {"train_loss": -5.129096984863281, "global_step": 18147, "epoch": 432} {"train_loss": -5.273097038269043, "global_step": 18148, "epoch": 432} {"train_loss": -5.146916389465332, "global_step": 18149, "epoch": 432} {"train_loss": -5.287961959838867, "global_step": 18150, "epoch": 432} {"train_loss": -5.1487321853637695, "global_step": 18151, "epoch": 432} {"train_loss": -5.2672834396362305, "global_step": 18152, "epoch": 432} {"train_loss": -5.195674419403076, "global_step": 18153, "epoch": 432} {"train_loss": -5.375581741333008, "global_step": 18154, "epoch": 432} {"train_loss": -5.297379493713379, "global_step": 18155, "epoch": 432} {"train_loss": -5.383297920227051, "global_step": 18156, "epoch": 432} {"train_loss": -5.301137924194336, "global_step": 18157, "epoch": 432} {"train_loss": -5.263348579406738, "global_step": 18158, "epoch": 432} {"train_loss": -5.2883477210998535, "global_step": 18159, "epoch": 432} {"train_loss": -5.334344863891602, "global_step": 18160, "epoch": 432} {"train_loss": -5.322827339172363, "global_step": 18161, "epoch": 432} {"train_loss": -5.062438011169434, "global_step": 18162, "epoch": 432} {"train_loss": -5.340039253234863, "global_step": 18163, "epoch": 432} {"train_loss": -5.18751859664917, "global_step": 18164, "epoch": 432} {"train_loss": -5.277318954467773, "global_step": 18165, "epoch": 432} {"train_loss": -5.290188312530518, "global_step": 18166, "epoch": 432} {"train_loss": -5.242770195007324, "global_step": 18167, "epoch": 432} {"train_loss": -5.312744140625, "global_step": 18168, "epoch": 432} {"train_loss": -5.251777172088623, "global_step": 18169, "epoch": 432} {"train_loss": -5.372470378875732, "global_step": 18170, "epoch": 432} {"train_loss": -5.2828497886657715, "global_step": 18171, "epoch": 432} {"train_loss": -5.401524066925049, "global_step": 18172, "epoch": 432} {"train_loss": -5.061452388763428, "global_step": 18173, "epoch": 432} {"train_loss": -5.1785054206848145, "global_step": 18174, "epoch": 432} {"train_loss": -5.321563243865967, "global_step": 18175, "epoch": 432} {"train_loss": -5.104640007019043, "global_step": 18176, "epoch": 432} {"train_loss": -5.40244722366333, "global_step": 18177, "epoch": 432} {"train_loss": -5.284787178039551, "global_step": 18178, "epoch": 432} {"train_loss": -5.329557418823242, "global_step": 18179, "epoch": 432} {"train_loss": -5.187223434448242, "global_step": 18180, "epoch": 432} {"train_loss": -5.275354385375977, "global_step": 18181, "epoch": 432} {"train_loss": -5.4143967628479, "global_step": 18182, "epoch": 432} {"train_loss": -5.164279460906982, "global_step": 18183, "epoch": 432} {"train_loss": -5.373604774475098, "global_step": 18184, "epoch": 432} {"train_loss": -5.260090101332891, "global_step": 18185, "epoch": 432, "val_loss": 68121.359375} {"train_loss": -5.188061714172363, "global_step": 18186, "epoch": 433} {"train_loss": -5.3393964767456055, "global_step": 18187, "epoch": 433} {"train_loss": -5.137457370758057, "global_step": 18188, "epoch": 433} {"train_loss": -5.265966415405273, "global_step": 18189, "epoch": 433} {"train_loss": -5.287785530090332, "global_step": 18190, "epoch": 433} {"train_loss": -5.268000602722168, "global_step": 18191, "epoch": 433} {"train_loss": -5.232442855834961, "global_step": 18192, "epoch": 433} {"train_loss": -5.163234233856201, "global_step": 18193, "epoch": 433} {"train_loss": -5.446761131286621, "global_step": 18194, "epoch": 433} {"train_loss": -5.347946643829346, "global_step": 18195, "epoch": 433} {"train_loss": -5.320412635803223, "global_step": 18196, "epoch": 433} {"train_loss": -5.204975128173828, "global_step": 18197, "epoch": 433} {"train_loss": -5.266358375549316, "global_step": 18198, "epoch": 433} {"train_loss": -5.236697196960449, "global_step": 18199, "epoch": 433} {"train_loss": -5.224610805511475, "global_step": 18200, "epoch": 433} {"train_loss": -5.170762062072754, "global_step": 18201, "epoch": 433} {"train_loss": -5.358822822570801, "global_step": 18202, "epoch": 433} {"train_loss": -5.206352710723877, "global_step": 18203, "epoch": 433} {"train_loss": -5.127546310424805, "global_step": 18204, "epoch": 433} {"train_loss": -5.242273807525635, "global_step": 18205, "epoch": 433} {"train_loss": -5.185946941375732, "global_step": 18206, "epoch": 433} {"train_loss": -5.188808441162109, "global_step": 18207, "epoch": 433} {"train_loss": -5.251477241516113, "global_step": 18208, "epoch": 433} {"train_loss": -5.139242649078369, "global_step": 18209, "epoch": 433} {"train_loss": -5.2970733642578125, "global_step": 18210, "epoch": 433} {"train_loss": -5.199552059173584, "global_step": 18211, "epoch": 433} {"train_loss": -5.236499309539795, "global_step": 18212, "epoch": 433} {"train_loss": -5.414320468902588, "global_step": 18213, "epoch": 433} {"train_loss": -5.353942394256592, "global_step": 18214, "epoch": 433} {"train_loss": -5.200812339782715, "global_step": 18215, "epoch": 433} {"train_loss": -5.253899574279785, "global_step": 18216, "epoch": 433} {"train_loss": -5.28451681137085, "global_step": 18217, "epoch": 433} {"train_loss": -5.198993682861328, "global_step": 18218, "epoch": 433} {"train_loss": -5.425959587097168, "global_step": 18219, "epoch": 433} {"train_loss": -5.205936431884766, "global_step": 18220, "epoch": 433} {"train_loss": -5.255295753479004, "global_step": 18221, "epoch": 433} {"train_loss": -5.233394622802734, "global_step": 18222, "epoch": 433} {"train_loss": -5.2220635414123535, "global_step": 18223, "epoch": 433} {"train_loss": -5.386387825012207, "global_step": 18224, "epoch": 433} {"train_loss": -5.308258056640625, "global_step": 18225, "epoch": 433} {"train_loss": -5.25083589553833, "global_step": 18226, "epoch": 433} {"train_loss": -5.25911249433245, "global_step": 18227, "epoch": 433, "val_loss": 68151.578125} {"train_loss": -5.2417192459106445, "global_step": 18228, "epoch": 434} {"train_loss": -5.2661356925964355, "global_step": 18229, "epoch": 434} {"train_loss": -5.221462249755859, "global_step": 18230, "epoch": 434} {"train_loss": -5.362251281738281, "global_step": 18231, "epoch": 434} {"train_loss": -5.225248336791992, "global_step": 18232, "epoch": 434} {"train_loss": -5.269569396972656, "global_step": 18233, "epoch": 434} {"train_loss": -5.327583312988281, "global_step": 18234, "epoch": 434} {"train_loss": -5.191575050354004, "global_step": 18235, "epoch": 434} {"train_loss": -5.203487396240234, "global_step": 18236, "epoch": 434} {"train_loss": -5.240724563598633, "global_step": 18237, "epoch": 434} {"train_loss": -5.278135776519775, "global_step": 18238, "epoch": 434} {"train_loss": -5.186300277709961, "global_step": 18239, "epoch": 434} {"train_loss": -5.323638439178467, "global_step": 18240, "epoch": 434} {"train_loss": -5.213438034057617, "global_step": 18241, "epoch": 434} {"train_loss": -5.298995018005371, "global_step": 18242, "epoch": 434} {"train_loss": -5.279980659484863, "global_step": 18243, "epoch": 434} {"train_loss": -5.395627498626709, "global_step": 18244, "epoch": 434} {"train_loss": -5.3440399169921875, "global_step": 18245, "epoch": 434} {"train_loss": -5.307497978210449, "global_step": 18246, "epoch": 434} {"train_loss": -5.164527893066406, "global_step": 18247, "epoch": 434} {"train_loss": -5.263370990753174, "global_step": 18248, "epoch": 434} {"train_loss": -5.199225902557373, "global_step": 18249, "epoch": 434} {"train_loss": -5.311607360839844, "global_step": 18250, "epoch": 434} {"train_loss": -5.25214958190918, "global_step": 18251, "epoch": 434} {"train_loss": -5.1789751052856445, "global_step": 18252, "epoch": 434} {"train_loss": -5.294643402099609, "global_step": 18253, "epoch": 434} {"train_loss": -5.3389081954956055, "global_step": 18254, "epoch": 434} {"train_loss": -5.169852256774902, "global_step": 18255, "epoch": 434} {"train_loss": -5.118930816650391, "global_step": 18256, "epoch": 434} {"train_loss": -5.318533420562744, "global_step": 18257, "epoch": 434} {"train_loss": -5.284780502319336, "global_step": 18258, "epoch": 434} {"train_loss": -5.272549152374268, "global_step": 18259, "epoch": 434} {"train_loss": -5.328574180603027, "global_step": 18260, "epoch": 434} {"train_loss": -5.253607273101807, "global_step": 18261, "epoch": 434} {"train_loss": -5.367853164672852, "global_step": 18262, "epoch": 434} {"train_loss": -5.421202659606934, "global_step": 18263, "epoch": 434} {"train_loss": -5.165234088897705, "global_step": 18264, "epoch": 434} {"train_loss": -5.2041730880737305, "global_step": 18265, "epoch": 434} {"train_loss": -5.288257598876953, "global_step": 18266, "epoch": 434} {"train_loss": -5.237495422363281, "global_step": 18267, "epoch": 434} {"train_loss": -5.324389457702637, "global_step": 18268, "epoch": 434} {"train_loss": -5.2647819973173595, "global_step": 18269, "epoch": 434, "val_loss": 68572.703125} {"train_loss": -5.31694221496582, "global_step": 18270, "epoch": 435} {"train_loss": -5.312317848205566, "global_step": 18271, "epoch": 435} {"train_loss": -5.140645980834961, "global_step": 18272, "epoch": 435} {"train_loss": -5.39504861831665, "global_step": 18273, "epoch": 435} {"train_loss": -5.337220668792725, "global_step": 18274, "epoch": 435} {"train_loss": -5.08738899230957, "global_step": 18275, "epoch": 435} {"train_loss": -5.223308563232422, "global_step": 18276, "epoch": 435} {"train_loss": -5.329685211181641, "global_step": 18277, "epoch": 435} {"train_loss": -5.2208099365234375, "global_step": 18278, "epoch": 435} {"train_loss": -5.282412052154541, "global_step": 18279, "epoch": 435} {"train_loss": -5.303910255432129, "global_step": 18280, "epoch": 435} {"train_loss": -5.328772068023682, "global_step": 18281, "epoch": 435} {"train_loss": -5.379079341888428, "global_step": 18282, "epoch": 435} {"train_loss": -5.289471626281738, "global_step": 18283, "epoch": 435} {"train_loss": -5.333837985992432, "global_step": 18284, "epoch": 435} {"train_loss": -5.257458686828613, "global_step": 18285, "epoch": 435} {"train_loss": -5.308740139007568, "global_step": 18286, "epoch": 435} {"train_loss": -5.268756866455078, "global_step": 18287, "epoch": 435} {"train_loss": -5.244524955749512, "global_step": 18288, "epoch": 435} {"train_loss": -5.288370609283447, "global_step": 18289, "epoch": 435} {"train_loss": -5.316508769989014, "global_step": 18290, "epoch": 435} {"train_loss": -5.215689182281494, "global_step": 18291, "epoch": 435} {"train_loss": -5.238482475280762, "global_step": 18292, "epoch": 435} {"train_loss": -5.173542022705078, "global_step": 18293, "epoch": 435} {"train_loss": -5.342844009399414, "global_step": 18294, "epoch": 435} {"train_loss": -5.306015968322754, "global_step": 18295, "epoch": 435} {"train_loss": -5.131230354309082, "global_step": 18296, "epoch": 435} {"train_loss": -5.210688591003418, "global_step": 18297, "epoch": 435} {"train_loss": -5.344769477844238, "global_step": 18298, "epoch": 435} {"train_loss": -5.168723106384277, "global_step": 18299, "epoch": 435} {"train_loss": -5.279475212097168, "global_step": 18300, "epoch": 435} {"train_loss": -5.126429557800293, "global_step": 18301, "epoch": 435} {"train_loss": -5.215937614440918, "global_step": 18302, "epoch": 435} {"train_loss": -5.254018306732178, "global_step": 18303, "epoch": 435} {"train_loss": -5.128671646118164, "global_step": 18304, "epoch": 435} {"train_loss": -5.237488746643066, "global_step": 18305, "epoch": 435} {"train_loss": -5.349740982055664, "global_step": 18306, "epoch": 435} {"train_loss": -5.222491264343262, "global_step": 18307, "epoch": 435} {"train_loss": -5.207948207855225, "global_step": 18308, "epoch": 435} {"train_loss": -5.313902854919434, "global_step": 18309, "epoch": 435} {"train_loss": -5.1061320304870605, "global_step": 18310, "epoch": 435} {"train_loss": -5.2564039457412, "global_step": 18311, "epoch": 435, "val_loss": 68682.421875} {"train_loss": -5.207200050354004, "global_step": 18312, "epoch": 436} {"train_loss": -5.244909286499023, "global_step": 18313, "epoch": 436} {"train_loss": -5.3693084716796875, "global_step": 18314, "epoch": 436} {"train_loss": -5.259941577911377, "global_step": 18315, "epoch": 436} {"train_loss": -5.274094581604004, "global_step": 18316, "epoch": 436} {"train_loss": -5.238667964935303, "global_step": 18317, "epoch": 436} {"train_loss": -5.183872222900391, "global_step": 18318, "epoch": 436} {"train_loss": -5.319141387939453, "global_step": 18319, "epoch": 436} {"train_loss": -5.181314945220947, "global_step": 18320, "epoch": 436} {"train_loss": -5.186140060424805, "global_step": 18321, "epoch": 436} {"train_loss": -5.3935041427612305, "global_step": 18322, "epoch": 436} {"train_loss": -5.292425155639648, "global_step": 18323, "epoch": 436} {"train_loss": -5.283202171325684, "global_step": 18324, "epoch": 436} {"train_loss": -5.243091106414795, "global_step": 18325, "epoch": 436} {"train_loss": -5.364500999450684, "global_step": 18326, "epoch": 436} {"train_loss": -5.215384006500244, "global_step": 18327, "epoch": 436} {"train_loss": -5.41912841796875, "global_step": 18328, "epoch": 436} {"train_loss": -5.303164482116699, "global_step": 18329, "epoch": 436} {"train_loss": -5.358019828796387, "global_step": 18330, "epoch": 436} {"train_loss": -5.348445892333984, "global_step": 18331, "epoch": 436} {"train_loss": -5.345649719238281, "global_step": 18332, "epoch": 436} {"train_loss": -5.128256797790527, "global_step": 18333, "epoch": 436} {"train_loss": -5.256089210510254, "global_step": 18334, "epoch": 436} {"train_loss": -5.430083751678467, "global_step": 18335, "epoch": 436} {"train_loss": -5.212177753448486, "global_step": 18336, "epoch": 436} {"train_loss": -5.053763389587402, "global_step": 18337, "epoch": 436} {"train_loss": -5.257107734680176, "global_step": 18338, "epoch": 436} {"train_loss": -5.283595085144043, "global_step": 18339, "epoch": 436} {"train_loss": -5.179713249206543, "global_step": 18340, "epoch": 436} {"train_loss": -5.137697219848633, "global_step": 18341, "epoch": 436} {"train_loss": -5.285150527954102, "global_step": 18342, "epoch": 436} {"train_loss": -5.275503158569336, "global_step": 18343, "epoch": 436} {"train_loss": -5.278409957885742, "global_step": 18344, "epoch": 436} {"train_loss": -5.236868858337402, "global_step": 18345, "epoch": 436} {"train_loss": -5.21387243270874, "global_step": 18346, "epoch": 436} {"train_loss": -5.3277482986450195, "global_step": 18347, "epoch": 436} {"train_loss": -5.246903419494629, "global_step": 18348, "epoch": 436} {"train_loss": -5.251367092132568, "global_step": 18349, "epoch": 436} {"train_loss": -5.377518653869629, "global_step": 18350, "epoch": 436} {"train_loss": -5.207246780395508, "global_step": 18351, "epoch": 436} {"train_loss": -5.179825782775879, "global_step": 18352, "epoch": 436} {"train_loss": -5.267103444962275, "global_step": 18353, "epoch": 436, "val_loss": 68102.53125} {"train_loss": -5.278907775878906, "global_step": 18354, "epoch": 437} {"train_loss": -5.269285202026367, "global_step": 18355, "epoch": 437} {"train_loss": -5.3069658279418945, "global_step": 18356, "epoch": 437} {"train_loss": -5.389227867126465, "global_step": 18357, "epoch": 437} {"train_loss": -5.2264180183410645, "global_step": 18358, "epoch": 437} {"train_loss": -5.341946601867676, "global_step": 18359, "epoch": 437} {"train_loss": -5.241127014160156, "global_step": 18360, "epoch": 437} {"train_loss": -5.1369452476501465, "global_step": 18361, "epoch": 437} {"train_loss": -5.203077793121338, "global_step": 18362, "epoch": 437} {"train_loss": -5.29628849029541, "global_step": 18363, "epoch": 437} {"train_loss": -5.3372602462768555, "global_step": 18364, "epoch": 437} {"train_loss": -5.255261421203613, "global_step": 18365, "epoch": 437} {"train_loss": -5.4066972732543945, "global_step": 18366, "epoch": 437} {"train_loss": -5.277889251708984, "global_step": 18367, "epoch": 437} {"train_loss": -5.171680927276611, "global_step": 18368, "epoch": 437} {"train_loss": -5.121407985687256, "global_step": 18369, "epoch": 437} {"train_loss": -5.138873100280762, "global_step": 18370, "epoch": 437} {"train_loss": -5.206265926361084, "global_step": 18371, "epoch": 437} {"train_loss": -5.2199931144714355, "global_step": 18372, "epoch": 437} {"train_loss": -5.207827091217041, "global_step": 18373, "epoch": 437} {"train_loss": -5.326847076416016, "global_step": 18374, "epoch": 437} {"train_loss": -5.315263748168945, "global_step": 18375, "epoch": 437} {"train_loss": -5.335554122924805, "global_step": 18376, "epoch": 437} {"train_loss": -5.301372528076172, "global_step": 18377, "epoch": 437} {"train_loss": -5.252324104309082, "global_step": 18378, "epoch": 437} {"train_loss": -5.391756057739258, "global_step": 18379, "epoch": 437} {"train_loss": -5.245800495147705, "global_step": 18380, "epoch": 437} {"train_loss": -5.336031913757324, "global_step": 18381, "epoch": 437} {"train_loss": -5.2805585861206055, "global_step": 18382, "epoch": 437} {"train_loss": -5.203911781311035, "global_step": 18383, "epoch": 437} {"train_loss": -5.244093418121338, "global_step": 18384, "epoch": 437} {"train_loss": -5.364253520965576, "global_step": 18385, "epoch": 437} {"train_loss": -5.177987098693848, "global_step": 18386, "epoch": 437} {"train_loss": -5.06191873550415, "global_step": 18387, "epoch": 437} {"train_loss": -5.0356879234313965, "global_step": 18388, "epoch": 437} {"train_loss": -5.377668380737305, "global_step": 18389, "epoch": 437} {"train_loss": -5.241279602050781, "global_step": 18390, "epoch": 437} {"train_loss": -5.207855701446533, "global_step": 18391, "epoch": 437} {"train_loss": -5.318323612213135, "global_step": 18392, "epoch": 437} {"train_loss": -5.166587829589844, "global_step": 18393, "epoch": 437} {"train_loss": -5.248621940612793, "global_step": 18394, "epoch": 437} {"train_loss": -5.256294715972174, "global_step": 18395, "epoch": 437, "val_loss": 68582.5625} {"train_loss": -5.239490985870361, "global_step": 18396, "epoch": 438} {"train_loss": -5.394491195678711, "global_step": 18397, "epoch": 438} {"train_loss": -5.197141647338867, "global_step": 18398, "epoch": 438} {"train_loss": -5.1991682052612305, "global_step": 18399, "epoch": 438} {"train_loss": -5.163412094116211, "global_step": 18400, "epoch": 438} {"train_loss": -5.135855674743652, "global_step": 18401, "epoch": 438} {"train_loss": -5.2394256591796875, "global_step": 18402, "epoch": 438} {"train_loss": -5.268123626708984, "global_step": 18403, "epoch": 438} {"train_loss": -5.183305740356445, "global_step": 18404, "epoch": 438} {"train_loss": -5.242589950561523, "global_step": 18405, "epoch": 438} {"train_loss": -5.198793411254883, "global_step": 18406, "epoch": 438} {"train_loss": -5.283517837524414, "global_step": 18407, "epoch": 438} {"train_loss": -5.300935745239258, "global_step": 18408, "epoch": 438} {"train_loss": -5.263833522796631, "global_step": 18409, "epoch": 438} {"train_loss": -5.238439559936523, "global_step": 18410, "epoch": 438} {"train_loss": -5.288105487823486, "global_step": 18411, "epoch": 438} {"train_loss": -5.114079475402832, "global_step": 18412, "epoch": 438} {"train_loss": -5.375456809997559, "global_step": 18413, "epoch": 438} {"train_loss": -5.08894157409668, "global_step": 18414, "epoch": 438} {"train_loss": -5.284252166748047, "global_step": 18415, "epoch": 438} {"train_loss": -5.299189567565918, "global_step": 18416, "epoch": 438} {"train_loss": -5.122227668762207, "global_step": 18417, "epoch": 438} {"train_loss": -5.242156505584717, "global_step": 18418, "epoch": 438} {"train_loss": -5.187103271484375, "global_step": 18419, "epoch": 438} {"train_loss": -5.319209098815918, "global_step": 18420, "epoch": 438} {"train_loss": -5.321962833404541, "global_step": 18421, "epoch": 438} {"train_loss": -5.280361175537109, "global_step": 18422, "epoch": 438} {"train_loss": -5.201853275299072, "global_step": 18423, "epoch": 438} {"train_loss": -5.335191249847412, "global_step": 18424, "epoch": 438} {"train_loss": -5.212458610534668, "global_step": 18425, "epoch": 438} {"train_loss": -5.196151256561279, "global_step": 18426, "epoch": 438} {"train_loss": -5.244040489196777, "global_step": 18427, "epoch": 438} {"train_loss": -5.182769775390625, "global_step": 18428, "epoch": 438} {"train_loss": -5.269889831542969, "global_step": 18429, "epoch": 438} {"train_loss": -5.286478519439697, "global_step": 18430, "epoch": 438} {"train_loss": -5.3212890625, "global_step": 18431, "epoch": 438} {"train_loss": -5.139049530029297, "global_step": 18432, "epoch": 438} {"train_loss": -5.313365936279297, "global_step": 18433, "epoch": 438} {"train_loss": -5.132709503173828, "global_step": 18434, "epoch": 438} {"train_loss": -5.390780448913574, "global_step": 18435, "epoch": 438} {"train_loss": -5.108573913574219, "global_step": 18436, "epoch": 438} {"train_loss": -5.235496134985061, "global_step": 18437, "epoch": 438, "val_loss": 68164.875} {"train_loss": -5.215117931365967, "global_step": 18438, "epoch": 439} {"train_loss": -4.984439849853516, "global_step": 18439, "epoch": 439} {"train_loss": -5.278563976287842, "global_step": 18440, "epoch": 439} {"train_loss": -5.260318756103516, "global_step": 18441, "epoch": 439} {"train_loss": -5.134198188781738, "global_step": 18442, "epoch": 439} {"train_loss": -5.002848148345947, "global_step": 18443, "epoch": 439} {"train_loss": -5.364249229431152, "global_step": 18444, "epoch": 439} {"train_loss": -5.189472198486328, "global_step": 18445, "epoch": 439} {"train_loss": -5.22935676574707, "global_step": 18446, "epoch": 439} {"train_loss": -5.303999423980713, "global_step": 18447, "epoch": 439} {"train_loss": -5.200870513916016, "global_step": 18448, "epoch": 439} {"train_loss": -5.223067760467529, "global_step": 18449, "epoch": 439} {"train_loss": -5.347928047180176, "global_step": 18450, "epoch": 439} {"train_loss": -5.22531270980835, "global_step": 18451, "epoch": 439} {"train_loss": -5.148778438568115, "global_step": 18452, "epoch": 439} {"train_loss": -5.202754974365234, "global_step": 18453, "epoch": 439} {"train_loss": -5.121171951293945, "global_step": 18454, "epoch": 439} {"train_loss": -5.332380294799805, "global_step": 18455, "epoch": 439} {"train_loss": -5.223454475402832, "global_step": 18456, "epoch": 439} {"train_loss": -5.097599506378174, "global_step": 18457, "epoch": 439} {"train_loss": -5.348000526428223, "global_step": 18458, "epoch": 439} {"train_loss": -5.263169288635254, "global_step": 18459, "epoch": 439} {"train_loss": -5.183321952819824, "global_step": 18460, "epoch": 439} {"train_loss": -5.363698959350586, "global_step": 18461, "epoch": 439} {"train_loss": -5.236681938171387, "global_step": 18462, "epoch": 439} {"train_loss": -5.352764129638672, "global_step": 18463, "epoch": 439} {"train_loss": -5.309234619140625, "global_step": 18464, "epoch": 439} {"train_loss": -5.380099296569824, "global_step": 18465, "epoch": 439} {"train_loss": -5.227025508880615, "global_step": 18466, "epoch": 439} {"train_loss": -5.320295810699463, "global_step": 18467, "epoch": 439} {"train_loss": -5.143535137176514, "global_step": 18468, "epoch": 439} {"train_loss": -5.3940582275390625, "global_step": 18469, "epoch": 439} {"train_loss": -5.400025844573975, "global_step": 18470, "epoch": 439} {"train_loss": -5.146990776062012, "global_step": 18471, "epoch": 439} {"train_loss": -5.270442962646484, "global_step": 18472, "epoch": 439} {"train_loss": -5.3310441970825195, "global_step": 18473, "epoch": 439} {"train_loss": -5.302159309387207, "global_step": 18474, "epoch": 439} {"train_loss": -5.324979782104492, "global_step": 18475, "epoch": 439} {"train_loss": -5.252169609069824, "global_step": 18476, "epoch": 439} {"train_loss": -5.361432075500488, "global_step": 18477, "epoch": 439} {"train_loss": -5.305459022521973, "global_step": 18478, "epoch": 439} {"train_loss": -5.251154842830839, "global_step": 18479, "epoch": 439, "val_loss": 68505.703125} {"train_loss": -5.293793678283691, "global_step": 18480, "epoch": 440} {"train_loss": -5.316165924072266, "global_step": 18481, "epoch": 440} {"train_loss": -5.304687023162842, "global_step": 18482, "epoch": 440} {"train_loss": -5.281940460205078, "global_step": 18483, "epoch": 440} {"train_loss": -5.265839576721191, "global_step": 18484, "epoch": 440} {"train_loss": -5.477234840393066, "global_step": 18485, "epoch": 440} {"train_loss": -5.115564823150635, "global_step": 18486, "epoch": 440} {"train_loss": -5.157144069671631, "global_step": 18487, "epoch": 440} {"train_loss": -5.247210502624512, "global_step": 18488, "epoch": 440} {"train_loss": -5.255013465881348, "global_step": 18489, "epoch": 440} {"train_loss": -5.0509352684021, "global_step": 18490, "epoch": 440} {"train_loss": -5.246935844421387, "global_step": 18491, "epoch": 440} {"train_loss": -5.3665690422058105, "global_step": 18492, "epoch": 440} {"train_loss": -5.260713577270508, "global_step": 18493, "epoch": 440} {"train_loss": -5.2941694259643555, "global_step": 18494, "epoch": 440} {"train_loss": -5.27349853515625, "global_step": 18495, "epoch": 440} {"train_loss": -5.212574481964111, "global_step": 18496, "epoch": 440} {"train_loss": -5.202435493469238, "global_step": 18497, "epoch": 440} {"train_loss": -5.238129615783691, "global_step": 18498, "epoch": 440} {"train_loss": -5.343010902404785, "global_step": 18499, "epoch": 440} {"train_loss": -5.322385787963867, "global_step": 18500, "epoch": 440} {"train_loss": -5.3103532791137695, "global_step": 18501, "epoch": 440} {"train_loss": -5.327780246734619, "global_step": 18502, "epoch": 440} {"train_loss": -5.29233455657959, "global_step": 18503, "epoch": 440} {"train_loss": -5.290166854858398, "global_step": 18504, "epoch": 440} {"train_loss": -5.278865814208984, "global_step": 18505, "epoch": 440} {"train_loss": -5.090056419372559, "global_step": 18506, "epoch": 440} {"train_loss": -5.294819355010986, "global_step": 18507, "epoch": 440} {"train_loss": -5.225917816162109, "global_step": 18508, "epoch": 440} {"train_loss": -5.302065849304199, "global_step": 18509, "epoch": 440} {"train_loss": -5.277386665344238, "global_step": 18510, "epoch": 440} {"train_loss": -5.196273326873779, "global_step": 18511, "epoch": 440} {"train_loss": -5.308233261108398, "global_step": 18512, "epoch": 440} {"train_loss": -5.238308906555176, "global_step": 18513, "epoch": 440} {"train_loss": -5.115640640258789, "global_step": 18514, "epoch": 440} {"train_loss": -5.131708145141602, "global_step": 18515, "epoch": 440} {"train_loss": -5.2986979484558105, "global_step": 18516, "epoch": 440} {"train_loss": -5.187069892883301, "global_step": 18517, "epoch": 440} {"train_loss": -5.216617107391357, "global_step": 18518, "epoch": 440} {"train_loss": -5.2963433265686035, "global_step": 18519, "epoch": 440} {"train_loss": -5.3059539794921875, "global_step": 18520, "epoch": 440} {"train_loss": -5.254501274653843, "global_step": 18521, "epoch": 440, "val_loss": 68424.703125} {"train_loss": -5.277402400970459, "global_step": 18522, "epoch": 441} {"train_loss": -5.339598655700684, "global_step": 18523, "epoch": 441} {"train_loss": -5.211451530456543, "global_step": 18524, "epoch": 441} {"train_loss": -5.296042442321777, "global_step": 18525, "epoch": 441} {"train_loss": -5.232415199279785, "global_step": 18526, "epoch": 441} {"train_loss": -5.172271251678467, "global_step": 18527, "epoch": 441} {"train_loss": -5.293002128601074, "global_step": 18528, "epoch": 441} {"train_loss": -5.170870304107666, "global_step": 18529, "epoch": 441} {"train_loss": -5.24371337890625, "global_step": 18530, "epoch": 441} {"train_loss": -5.206068992614746, "global_step": 18531, "epoch": 441} {"train_loss": -5.37791633605957, "global_step": 18532, "epoch": 441} {"train_loss": -5.3114519119262695, "global_step": 18533, "epoch": 441} {"train_loss": -5.1034159660339355, "global_step": 18534, "epoch": 441} {"train_loss": -5.452885150909424, "global_step": 18535, "epoch": 441} {"train_loss": -5.29573917388916, "global_step": 18536, "epoch": 441} {"train_loss": -5.405633926391602, "global_step": 18537, "epoch": 441} {"train_loss": -5.36995792388916, "global_step": 18538, "epoch": 441} {"train_loss": -5.2515950202941895, "global_step": 18539, "epoch": 441} {"train_loss": -5.306739807128906, "global_step": 18540, "epoch": 441} {"train_loss": -5.233309745788574, "global_step": 18541, "epoch": 441} {"train_loss": -5.369001388549805, "global_step": 18542, "epoch": 441} {"train_loss": -5.18934440612793, "global_step": 18543, "epoch": 441} {"train_loss": -5.308081150054932, "global_step": 18544, "epoch": 441} {"train_loss": -5.2872819900512695, "global_step": 18545, "epoch": 441} {"train_loss": -5.414615154266357, "global_step": 18546, "epoch": 441} {"train_loss": -5.31258487701416, "global_step": 18547, "epoch": 441} {"train_loss": -5.354111671447754, "global_step": 18548, "epoch": 441} {"train_loss": -5.349399566650391, "global_step": 18549, "epoch": 441} {"train_loss": -5.183127403259277, "global_step": 18550, "epoch": 441} {"train_loss": -5.336874961853027, "global_step": 18551, "epoch": 441} {"train_loss": -5.270997047424316, "global_step": 18552, "epoch": 441} {"train_loss": -5.320745468139648, "global_step": 18553, "epoch": 441} {"train_loss": -5.162112236022949, "global_step": 18554, "epoch": 441} {"train_loss": -5.245171070098877, "global_step": 18555, "epoch": 441} {"train_loss": -5.202548980712891, "global_step": 18556, "epoch": 441} {"train_loss": -5.234997749328613, "global_step": 18557, "epoch": 441} {"train_loss": -5.178516387939453, "global_step": 18558, "epoch": 441} {"train_loss": -5.346790790557861, "global_step": 18559, "epoch": 441} {"train_loss": -5.340518951416016, "global_step": 18560, "epoch": 441} {"train_loss": -5.4342265129089355, "global_step": 18561, "epoch": 441} {"train_loss": -5.242993354797363, "global_step": 18562, "epoch": 441} {"train_loss": -5.280693349384126, "global_step": 18563, "epoch": 441, "val_loss": 67991.09375} {"train_loss": -5.220623970031738, "global_step": 18564, "epoch": 442} {"train_loss": -5.305403232574463, "global_step": 18565, "epoch": 442} {"train_loss": -5.309915065765381, "global_step": 18566, "epoch": 442} {"train_loss": -5.241668701171875, "global_step": 18567, "epoch": 442} {"train_loss": -5.2157135009765625, "global_step": 18568, "epoch": 442} {"train_loss": -5.232635498046875, "global_step": 18569, "epoch": 442} {"train_loss": -5.290996551513672, "global_step": 18570, "epoch": 442} {"train_loss": -5.303289890289307, "global_step": 18571, "epoch": 442} {"train_loss": -5.271904468536377, "global_step": 18572, "epoch": 442} {"train_loss": -5.189715385437012, "global_step": 18573, "epoch": 442} {"train_loss": -5.303094863891602, "global_step": 18574, "epoch": 442} {"train_loss": -5.391301155090332, "global_step": 18575, "epoch": 442} {"train_loss": -5.325583457946777, "global_step": 18576, "epoch": 442} {"train_loss": -5.404815673828125, "global_step": 18577, "epoch": 442} {"train_loss": -5.122771263122559, "global_step": 18578, "epoch": 442} {"train_loss": -5.300256252288818, "global_step": 18579, "epoch": 442} {"train_loss": -5.28138542175293, "global_step": 18580, "epoch": 442} {"train_loss": -5.337885856628418, "global_step": 18581, "epoch": 442} {"train_loss": -5.26923942565918, "global_step": 18582, "epoch": 442} {"train_loss": -5.286992073059082, "global_step": 18583, "epoch": 442} {"train_loss": -5.28231143951416, "global_step": 18584, "epoch": 442} {"train_loss": -5.3426899909973145, "global_step": 18585, "epoch": 442} {"train_loss": -5.262972831726074, "global_step": 18586, "epoch": 442} {"train_loss": -5.290545463562012, "global_step": 18587, "epoch": 442} {"train_loss": -5.191805362701416, "global_step": 18588, "epoch": 442} {"train_loss": -5.208499908447266, "global_step": 18589, "epoch": 442} {"train_loss": -5.2901434898376465, "global_step": 18590, "epoch": 442} {"train_loss": -5.1741251945495605, "global_step": 18591, "epoch": 442} {"train_loss": -5.366423606872559, "global_step": 18592, "epoch": 442} {"train_loss": -5.3451032638549805, "global_step": 18593, "epoch": 442} {"train_loss": -5.177611351013184, "global_step": 18594, "epoch": 442} {"train_loss": -5.3984375, "global_step": 18595, "epoch": 442} {"train_loss": -5.337636947631836, "global_step": 18596, "epoch": 442} {"train_loss": -5.415188789367676, "global_step": 18597, "epoch": 442} {"train_loss": -5.2590837478637695, "global_step": 18598, "epoch": 442} {"train_loss": -5.279438018798828, "global_step": 18599, "epoch": 442} {"train_loss": -5.243159294128418, "global_step": 18600, "epoch": 442} {"train_loss": -5.3673505783081055, "global_step": 18601, "epoch": 442} {"train_loss": -5.2088823318481445, "global_step": 18602, "epoch": 442} {"train_loss": -5.340080738067627, "global_step": 18603, "epoch": 442} {"train_loss": -5.386425971984863, "global_step": 18604, "epoch": 442} {"train_loss": -5.283257132484799, "global_step": 18605, "epoch": 442, "val_loss": 68079.9609375} {"train_loss": -5.296858787536621, "global_step": 18606, "epoch": 443} {"train_loss": -5.317378044128418, "global_step": 18607, "epoch": 443} {"train_loss": -5.313199043273926, "global_step": 18608, "epoch": 443} {"train_loss": -5.3077778816223145, "global_step": 18609, "epoch": 443} {"train_loss": -5.180206775665283, "global_step": 18610, "epoch": 443} {"train_loss": -5.332845687866211, "global_step": 18611, "epoch": 443} {"train_loss": -5.157660961151123, "global_step": 18612, "epoch": 443} {"train_loss": -5.1660332679748535, "global_step": 18613, "epoch": 443} {"train_loss": -5.2865471839904785, "global_step": 18614, "epoch": 443} {"train_loss": -5.25788688659668, "global_step": 18615, "epoch": 443} {"train_loss": -4.981264114379883, "global_step": 18616, "epoch": 443} {"train_loss": -5.338013172149658, "global_step": 18617, "epoch": 443} {"train_loss": -5.176144599914551, "global_step": 18618, "epoch": 443} {"train_loss": -5.10366153717041, "global_step": 18619, "epoch": 443} {"train_loss": -5.2993645668029785, "global_step": 18620, "epoch": 443} {"train_loss": -5.212803840637207, "global_step": 18621, "epoch": 443} {"train_loss": -5.232629776000977, "global_step": 18622, "epoch": 443} {"train_loss": -5.332615375518799, "global_step": 18623, "epoch": 443} {"train_loss": -5.055575847625732, "global_step": 18624, "epoch": 443} {"train_loss": -5.192034721374512, "global_step": 18625, "epoch": 443} {"train_loss": -5.2744598388671875, "global_step": 18626, "epoch": 443} {"train_loss": -5.163968563079834, "global_step": 18627, "epoch": 443} {"train_loss": -5.364418029785156, "global_step": 18628, "epoch": 443} {"train_loss": -5.300260543823242, "global_step": 18629, "epoch": 443} {"train_loss": -5.226423740386963, "global_step": 18630, "epoch": 443} {"train_loss": -5.347843170166016, "global_step": 18631, "epoch": 443} {"train_loss": -5.273067951202393, "global_step": 18632, "epoch": 443} {"train_loss": -5.260280609130859, "global_step": 18633, "epoch": 443} {"train_loss": -5.247895240783691, "global_step": 18634, "epoch": 443} {"train_loss": -5.313289642333984, "global_step": 18635, "epoch": 443} {"train_loss": -5.240789890289307, "global_step": 18636, "epoch": 443} {"train_loss": -5.387948989868164, "global_step": 18637, "epoch": 443} {"train_loss": -5.2467360496521, "global_step": 18638, "epoch": 443} {"train_loss": -5.215914726257324, "global_step": 18639, "epoch": 443} {"train_loss": -5.2660980224609375, "global_step": 18640, "epoch": 443} {"train_loss": -5.390316009521484, "global_step": 18641, "epoch": 443} {"train_loss": -5.323349475860596, "global_step": 18642, "epoch": 443} {"train_loss": -5.296057224273682, "global_step": 18643, "epoch": 443} {"train_loss": -5.274604797363281, "global_step": 18644, "epoch": 443} {"train_loss": -5.406391143798828, "global_step": 18645, "epoch": 443} {"train_loss": -5.205702781677246, "global_step": 18646, "epoch": 443} {"train_loss": -5.25364401226952, "global_step": 18647, "epoch": 443, "val_loss": 68049.234375} {"train_loss": -5.280405521392822, "global_step": 18648, "epoch": 444} {"train_loss": -5.291808605194092, "global_step": 18649, "epoch": 444} {"train_loss": -5.346342086791992, "global_step": 18650, "epoch": 444} {"train_loss": -5.336415767669678, "global_step": 18651, "epoch": 444} {"train_loss": -5.326597213745117, "global_step": 18652, "epoch": 444} {"train_loss": -5.451066017150879, "global_step": 18653, "epoch": 444} {"train_loss": -5.378875732421875, "global_step": 18654, "epoch": 444} {"train_loss": -5.406070709228516, "global_step": 18655, "epoch": 444} {"train_loss": -5.1629533767700195, "global_step": 18656, "epoch": 444} {"train_loss": -5.050322532653809, "global_step": 18657, "epoch": 444} {"train_loss": -5.264686107635498, "global_step": 18658, "epoch": 444} {"train_loss": -5.345654487609863, "global_step": 18659, "epoch": 444} {"train_loss": -5.136685848236084, "global_step": 18660, "epoch": 444} {"train_loss": -5.105629920959473, "global_step": 18661, "epoch": 444} {"train_loss": -5.158449649810791, "global_step": 18662, "epoch": 444} {"train_loss": -5.015835762023926, "global_step": 18663, "epoch": 444} {"train_loss": -5.219814300537109, "global_step": 18664, "epoch": 444} {"train_loss": -5.228283882141113, "global_step": 18665, "epoch": 444} {"train_loss": -5.16279411315918, "global_step": 18666, "epoch": 444} {"train_loss": -5.216188430786133, "global_step": 18667, "epoch": 444} {"train_loss": -5.181492805480957, "global_step": 18668, "epoch": 444} {"train_loss": -5.098985195159912, "global_step": 18669, "epoch": 444} {"train_loss": -5.133768081665039, "global_step": 18670, "epoch": 444} {"train_loss": -5.218105792999268, "global_step": 18671, "epoch": 444} {"train_loss": -5.23189640045166, "global_step": 18672, "epoch": 444} {"train_loss": -5.245197296142578, "global_step": 18673, "epoch": 444} {"train_loss": -5.281253814697266, "global_step": 18674, "epoch": 444} {"train_loss": -5.216396331787109, "global_step": 18675, "epoch": 444} {"train_loss": -5.162369728088379, "global_step": 18676, "epoch": 444} {"train_loss": -5.344394207000732, "global_step": 18677, "epoch": 444} {"train_loss": -5.282366752624512, "global_step": 18678, "epoch": 444} {"train_loss": -5.392200469970703, "global_step": 18679, "epoch": 444} {"train_loss": -5.218644618988037, "global_step": 18680, "epoch": 444} {"train_loss": -5.295008659362793, "global_step": 18681, "epoch": 444} {"train_loss": -5.3471527099609375, "global_step": 18682, "epoch": 444} {"train_loss": -5.176446914672852, "global_step": 18683, "epoch": 444} {"train_loss": -5.286226749420166, "global_step": 18684, "epoch": 444} {"train_loss": -5.3314595222473145, "global_step": 18685, "epoch": 444} {"train_loss": -5.25248908996582, "global_step": 18686, "epoch": 444} {"train_loss": -5.317968368530273, "global_step": 18687, "epoch": 444} {"train_loss": -5.291087627410889, "global_step": 18688, "epoch": 444} {"train_loss": -5.246666658492315, "global_step": 18689, "epoch": 444, "val_loss": 68120.9453125} {"train_loss": -5.24981164932251, "global_step": 18690, "epoch": 445} {"train_loss": -5.285739898681641, "global_step": 18691, "epoch": 445} {"train_loss": -5.304177284240723, "global_step": 18692, "epoch": 445} {"train_loss": -5.44089412689209, "global_step": 18693, "epoch": 445} {"train_loss": -5.317298889160156, "global_step": 18694, "epoch": 445} {"train_loss": -5.250339031219482, "global_step": 18695, "epoch": 445} {"train_loss": -5.229965686798096, "global_step": 18696, "epoch": 445} {"train_loss": -5.255439281463623, "global_step": 18697, "epoch": 445} {"train_loss": -5.236952781677246, "global_step": 18698, "epoch": 445} {"train_loss": -5.300763130187988, "global_step": 18699, "epoch": 445} {"train_loss": -5.217494010925293, "global_step": 18700, "epoch": 445} {"train_loss": -5.281095027923584, "global_step": 18701, "epoch": 445} {"train_loss": -5.285289764404297, "global_step": 18702, "epoch": 445} {"train_loss": -5.100601673126221, "global_step": 18703, "epoch": 445} {"train_loss": -5.2144951820373535, "global_step": 18704, "epoch": 445} {"train_loss": -5.371691703796387, "global_step": 18705, "epoch": 445} {"train_loss": -5.230461597442627, "global_step": 18706, "epoch": 445} {"train_loss": -5.169517517089844, "global_step": 18707, "epoch": 445} {"train_loss": -5.332024574279785, "global_step": 18708, "epoch": 445} {"train_loss": -5.255561351776123, "global_step": 18709, "epoch": 445} {"train_loss": -5.253996849060059, "global_step": 18710, "epoch": 445} {"train_loss": -5.271928310394287, "global_step": 18711, "epoch": 445} {"train_loss": -5.228211402893066, "global_step": 18712, "epoch": 445} {"train_loss": -5.2282562255859375, "global_step": 18713, "epoch": 445} {"train_loss": -5.135282039642334, "global_step": 18714, "epoch": 445} {"train_loss": -5.220541477203369, "global_step": 18715, "epoch": 445} {"train_loss": -5.220065116882324, "global_step": 18716, "epoch": 445} {"train_loss": -5.314855098724365, "global_step": 18717, "epoch": 445} {"train_loss": -5.212209701538086, "global_step": 18718, "epoch": 445} {"train_loss": -5.28160285949707, "global_step": 18719, "epoch": 445} {"train_loss": -5.244731903076172, "global_step": 18720, "epoch": 445} {"train_loss": -5.201752662658691, "global_step": 18721, "epoch": 445} {"train_loss": -5.145650386810303, "global_step": 18722, "epoch": 445} {"train_loss": -5.249424934387207, "global_step": 18723, "epoch": 445} {"train_loss": -5.2729082107543945, "global_step": 18724, "epoch": 445} {"train_loss": -5.277839660644531, "global_step": 18725, "epoch": 445} {"train_loss": -5.275333404541016, "global_step": 18726, "epoch": 445} {"train_loss": -5.31256103515625, "global_step": 18727, "epoch": 445} {"train_loss": -5.311640739440918, "global_step": 18728, "epoch": 445} {"train_loss": -5.259557723999023, "global_step": 18729, "epoch": 445} {"train_loss": -5.299435615539551, "global_step": 18730, "epoch": 445} {"train_loss": -5.257904892876034, "global_step": 18731, "epoch": 445, "val_loss": 68736.328125} {"train_loss": -5.173859596252441, "global_step": 18732, "epoch": 446} {"train_loss": -5.256138801574707, "global_step": 18733, "epoch": 446} {"train_loss": -5.217016220092773, "global_step": 18734, "epoch": 446} {"train_loss": -5.15817928314209, "global_step": 18735, "epoch": 446} {"train_loss": -5.323614120483398, "global_step": 18736, "epoch": 446} {"train_loss": -5.189381122589111, "global_step": 18737, "epoch": 446} {"train_loss": -5.259385108947754, "global_step": 18738, "epoch": 446} {"train_loss": -5.3826003074646, "global_step": 18739, "epoch": 446} {"train_loss": -5.393562316894531, "global_step": 18740, "epoch": 446} {"train_loss": -5.223607540130615, "global_step": 18741, "epoch": 446} {"train_loss": -5.322231292724609, "global_step": 18742, "epoch": 446} {"train_loss": -5.222363471984863, "global_step": 18743, "epoch": 446} {"train_loss": -5.389377593994141, "global_step": 18744, "epoch": 446} {"train_loss": -5.39520263671875, "global_step": 18745, "epoch": 446} {"train_loss": -5.227763652801514, "global_step": 18746, "epoch": 446} {"train_loss": -5.288919925689697, "global_step": 18747, "epoch": 446} {"train_loss": -5.203120708465576, "global_step": 18748, "epoch": 446} {"train_loss": -5.322483539581299, "global_step": 18749, "epoch": 446} {"train_loss": -5.225139617919922, "global_step": 18750, "epoch": 446} {"train_loss": -5.360891342163086, "global_step": 18751, "epoch": 446} {"train_loss": -5.191720962524414, "global_step": 18752, "epoch": 446} {"train_loss": -5.361671447753906, "global_step": 18753, "epoch": 446} {"train_loss": -5.207047939300537, "global_step": 18754, "epoch": 446} {"train_loss": -5.2065582275390625, "global_step": 18755, "epoch": 446} {"train_loss": -5.335293769836426, "global_step": 18756, "epoch": 446} {"train_loss": -5.2659454345703125, "global_step": 18757, "epoch": 446} {"train_loss": -5.242165565490723, "global_step": 18758, "epoch": 446} {"train_loss": -5.267528533935547, "global_step": 18759, "epoch": 446} {"train_loss": -5.353407859802246, "global_step": 18760, "epoch": 446} {"train_loss": -5.194256782531738, "global_step": 18761, "epoch": 446} {"train_loss": -5.196540832519531, "global_step": 18762, "epoch": 446} {"train_loss": -5.255762577056885, "global_step": 18763, "epoch": 446} {"train_loss": -5.291327476501465, "global_step": 18764, "epoch": 446} {"train_loss": -5.28614616394043, "global_step": 18765, "epoch": 446} {"train_loss": -5.0789666175842285, "global_step": 18766, "epoch": 446} {"train_loss": -5.236555576324463, "global_step": 18767, "epoch": 446} {"train_loss": -5.264463901519775, "global_step": 18768, "epoch": 446} {"train_loss": -5.331222057342529, "global_step": 18769, "epoch": 446} {"train_loss": -5.247981071472168, "global_step": 18770, "epoch": 446} {"train_loss": -5.071542739868164, "global_step": 18771, "epoch": 446} {"train_loss": -5.248592376708984, "global_step": 18772, "epoch": 446} {"train_loss": -5.258724292119344, "global_step": 18773, "epoch": 446, "val_loss": 68274.3984375} {"train_loss": -5.278133392333984, "global_step": 18774, "epoch": 447} {"train_loss": -5.3834686279296875, "global_step": 18775, "epoch": 447} {"train_loss": -5.052847385406494, "global_step": 18776, "epoch": 447} {"train_loss": -5.269362449645996, "global_step": 18777, "epoch": 447} {"train_loss": -5.170722961425781, "global_step": 18778, "epoch": 447} {"train_loss": -5.182318687438965, "global_step": 18779, "epoch": 447} {"train_loss": -5.32529354095459, "global_step": 18780, "epoch": 447} {"train_loss": -5.2407145500183105, "global_step": 18781, "epoch": 447} {"train_loss": -5.139740943908691, "global_step": 18782, "epoch": 447} {"train_loss": -5.141165733337402, "global_step": 18783, "epoch": 447} {"train_loss": -5.288417816162109, "global_step": 18784, "epoch": 447} {"train_loss": -5.168279647827148, "global_step": 18785, "epoch": 447} {"train_loss": -5.235504627227783, "global_step": 18786, "epoch": 447} {"train_loss": -5.256485939025879, "global_step": 18787, "epoch": 447} {"train_loss": -5.360910415649414, "global_step": 18788, "epoch": 447} {"train_loss": -5.274129390716553, "global_step": 18789, "epoch": 447} {"train_loss": -5.294858932495117, "global_step": 18790, "epoch": 447} {"train_loss": -5.234719276428223, "global_step": 18791, "epoch": 447} {"train_loss": -5.244982719421387, "global_step": 18792, "epoch": 447} {"train_loss": -5.180216312408447, "global_step": 18793, "epoch": 447} {"train_loss": -5.359122276306152, "global_step": 18794, "epoch": 447} {"train_loss": -5.247225761413574, "global_step": 18795, "epoch": 447} {"train_loss": -5.188732147216797, "global_step": 18796, "epoch": 447} {"train_loss": -5.2705278396606445, "global_step": 18797, "epoch": 447} {"train_loss": -5.19553279876709, "global_step": 18798, "epoch": 447} {"train_loss": -5.121977806091309, "global_step": 18799, "epoch": 447} {"train_loss": -5.055270195007324, "global_step": 18800, "epoch": 447} {"train_loss": -5.092442989349365, "global_step": 18801, "epoch": 447} {"train_loss": -5.2903032302856445, "global_step": 18802, "epoch": 447} {"train_loss": -5.180530548095703, "global_step": 18803, "epoch": 447} {"train_loss": -5.106171607971191, "global_step": 18804, "epoch": 447} {"train_loss": -5.219078063964844, "global_step": 18805, "epoch": 447} {"train_loss": -5.094942092895508, "global_step": 18806, "epoch": 447} {"train_loss": -5.230045318603516, "global_step": 18807, "epoch": 447} {"train_loss": -5.247520446777344, "global_step": 18808, "epoch": 447} {"train_loss": -5.127316474914551, "global_step": 18809, "epoch": 447} {"train_loss": -5.220061779022217, "global_step": 18810, "epoch": 447} {"train_loss": -5.307661056518555, "global_step": 18811, "epoch": 447} {"train_loss": -5.261174201965332, "global_step": 18812, "epoch": 447} {"train_loss": -5.221700668334961, "global_step": 18813, "epoch": 447} {"train_loss": -5.317455291748047, "global_step": 18814, "epoch": 447} {"train_loss": -5.222877014250982, "global_step": 18815, "epoch": 447, "val_loss": 68099.8359375} {"train_loss": -5.2053985595703125, "global_step": 18816, "epoch": 448} {"train_loss": -5.478818416595459, "global_step": 18817, "epoch": 448} {"train_loss": -5.315448760986328, "global_step": 18818, "epoch": 448} {"train_loss": -5.231055736541748, "global_step": 18819, "epoch": 448} {"train_loss": -5.27374267578125, "global_step": 18820, "epoch": 448} {"train_loss": -5.058789253234863, "global_step": 18821, "epoch": 448} {"train_loss": -5.27700138092041, "global_step": 18822, "epoch": 448} {"train_loss": -5.270611763000488, "global_step": 18823, "epoch": 448} {"train_loss": -5.367908477783203, "global_step": 18824, "epoch": 448} {"train_loss": -5.43834924697876, "global_step": 18825, "epoch": 448} {"train_loss": -5.215862274169922, "global_step": 18826, "epoch": 448} {"train_loss": -5.201880931854248, "global_step": 18827, "epoch": 448} {"train_loss": -5.28239631652832, "global_step": 18828, "epoch": 448} {"train_loss": -5.277669429779053, "global_step": 18829, "epoch": 448} {"train_loss": -5.255062103271484, "global_step": 18830, "epoch": 448} {"train_loss": -5.395323276519775, "global_step": 18831, "epoch": 448} {"train_loss": -5.160272121429443, "global_step": 18832, "epoch": 448} {"train_loss": -5.230539321899414, "global_step": 18833, "epoch": 448} {"train_loss": -5.403807640075684, "global_step": 18834, "epoch": 448} {"train_loss": -5.09447717666626, "global_step": 18835, "epoch": 448} {"train_loss": -5.124360084533691, "global_step": 18836, "epoch": 448} {"train_loss": -5.389005661010742, "global_step": 18837, "epoch": 448} {"train_loss": -5.225420951843262, "global_step": 18838, "epoch": 448} {"train_loss": -5.172420501708984, "global_step": 18839, "epoch": 448} {"train_loss": -5.255102157592773, "global_step": 18840, "epoch": 448} {"train_loss": -5.234866142272949, "global_step": 18841, "epoch": 448} {"train_loss": -5.186643600463867, "global_step": 18842, "epoch": 448} {"train_loss": -5.140942573547363, "global_step": 18843, "epoch": 448} {"train_loss": -5.236021518707275, "global_step": 18844, "epoch": 448} {"train_loss": -5.294515609741211, "global_step": 18845, "epoch": 448} {"train_loss": -5.29619026184082, "global_step": 18846, "epoch": 448} {"train_loss": -5.343291282653809, "global_step": 18847, "epoch": 448} {"train_loss": -5.168745994567871, "global_step": 18848, "epoch": 448} {"train_loss": -5.226037979125977, "global_step": 18849, "epoch": 448} {"train_loss": -5.213841915130615, "global_step": 18850, "epoch": 448} {"train_loss": -5.296210289001465, "global_step": 18851, "epoch": 448} {"train_loss": -5.26163387298584, "global_step": 18852, "epoch": 448} {"train_loss": -5.229086399078369, "global_step": 18853, "epoch": 448} {"train_loss": -5.316473007202148, "global_step": 18854, "epoch": 448} {"train_loss": -5.145819664001465, "global_step": 18855, "epoch": 448} {"train_loss": -5.171535015106201, "global_step": 18856, "epoch": 448} {"train_loss": -5.255178394771757, "global_step": 18857, "epoch": 448, "val_loss": 68419.5546875} {"train_loss": -5.135264873504639, "global_step": 18858, "epoch": 449} {"train_loss": -5.202879905700684, "global_step": 18859, "epoch": 449} {"train_loss": -5.395138740539551, "global_step": 18860, "epoch": 449} {"train_loss": -5.356866836547852, "global_step": 18861, "epoch": 449} {"train_loss": -5.3430891036987305, "global_step": 18862, "epoch": 449} {"train_loss": -5.197227478027344, "global_step": 18863, "epoch": 449} {"train_loss": -5.111973762512207, "global_step": 18864, "epoch": 449} {"train_loss": -5.206389427185059, "global_step": 18865, "epoch": 449} {"train_loss": -5.27064847946167, "global_step": 18866, "epoch": 449} {"train_loss": -5.221200466156006, "global_step": 18867, "epoch": 449} {"train_loss": -5.345943927764893, "global_step": 18868, "epoch": 449} {"train_loss": -5.288791656494141, "global_step": 18869, "epoch": 449} {"train_loss": -5.271570205688477, "global_step": 18870, "epoch": 449} {"train_loss": -5.31158971786499, "global_step": 18871, "epoch": 449} {"train_loss": -5.324037075042725, "global_step": 18872, "epoch": 449} {"train_loss": -5.310193061828613, "global_step": 18873, "epoch": 449} {"train_loss": -5.460871696472168, "global_step": 18874, "epoch": 449} {"train_loss": -5.357758522033691, "global_step": 18875, "epoch": 449} {"train_loss": -5.294559478759766, "global_step": 18876, "epoch": 449} {"train_loss": -5.282436370849609, "global_step": 18877, "epoch": 449} {"train_loss": -5.426810264587402, "global_step": 18878, "epoch": 449} {"train_loss": -5.345871925354004, "global_step": 18879, "epoch": 449} {"train_loss": -5.159387588500977, "global_step": 18880, "epoch": 449} {"train_loss": -5.270132064819336, "global_step": 18881, "epoch": 449} {"train_loss": -5.296963214874268, "global_step": 18882, "epoch": 449} {"train_loss": -5.180380821228027, "global_step": 18883, "epoch": 449} {"train_loss": -5.217683792114258, "global_step": 18884, "epoch": 449} {"train_loss": -5.260003089904785, "global_step": 18885, "epoch": 449} {"train_loss": -5.177783966064453, "global_step": 18886, "epoch": 449} {"train_loss": -5.233672618865967, "global_step": 18887, "epoch": 449} {"train_loss": -5.33213996887207, "global_step": 18888, "epoch": 449} {"train_loss": -5.272913455963135, "global_step": 18889, "epoch": 449} {"train_loss": -5.3042378425598145, "global_step": 18890, "epoch": 449} {"train_loss": -5.15723991394043, "global_step": 18891, "epoch": 449} {"train_loss": -5.2858567237854, "global_step": 18892, "epoch": 449} {"train_loss": -5.249624252319336, "global_step": 18893, "epoch": 449} {"train_loss": -5.164043426513672, "global_step": 18894, "epoch": 449} {"train_loss": -5.2508440017700195, "global_step": 18895, "epoch": 449} {"train_loss": -5.272473335266113, "global_step": 18896, "epoch": 449} {"train_loss": -5.208059310913086, "global_step": 18897, "epoch": 449} {"train_loss": -5.376092433929443, "global_step": 18898, "epoch": 449} {"train_loss": -5.2723072710491365, "global_step": 18899, "epoch": 449, "val_loss": 68129.0625} {"train_loss": -5.252586364746094, "global_step": 18900, "epoch": 450} {"train_loss": -5.164820671081543, "global_step": 18901, "epoch": 450} {"train_loss": -5.132417678833008, "global_step": 18902, "epoch": 450} {"train_loss": -5.190389633178711, "global_step": 18903, "epoch": 450} {"train_loss": -5.251182556152344, "global_step": 18904, "epoch": 450} {"train_loss": -5.287347793579102, "global_step": 18905, "epoch": 450} {"train_loss": -5.312128067016602, "global_step": 18906, "epoch": 450} {"train_loss": -5.0460076332092285, "global_step": 18907, "epoch": 450} {"train_loss": -5.392925262451172, "global_step": 18908, "epoch": 450} {"train_loss": -5.373795032501221, "global_step": 18909, "epoch": 450} {"train_loss": -5.333932876586914, "global_step": 18910, "epoch": 450} {"train_loss": -5.243059158325195, "global_step": 18911, "epoch": 450} {"train_loss": -5.344906806945801, "global_step": 18912, "epoch": 450} {"train_loss": -5.3527960777282715, "global_step": 18913, "epoch": 450} {"train_loss": -5.337080955505371, "global_step": 18914, "epoch": 450} {"train_loss": -5.430019855499268, "global_step": 18915, "epoch": 450} {"train_loss": -5.2396345138549805, "global_step": 18916, "epoch": 450} {"train_loss": -5.283834457397461, "global_step": 18917, "epoch": 450} {"train_loss": -5.265597343444824, "global_step": 18918, "epoch": 450} {"train_loss": -5.254558563232422, "global_step": 18919, "epoch": 450} {"train_loss": -5.237022399902344, "global_step": 18920, "epoch": 450} {"train_loss": -5.34881591796875, "global_step": 18921, "epoch": 450} {"train_loss": -5.342678070068359, "global_step": 18922, "epoch": 450} {"train_loss": -5.340569496154785, "global_step": 18923, "epoch": 450} {"train_loss": -5.2397050857543945, "global_step": 18924, "epoch": 450} {"train_loss": -5.05437707901001, "global_step": 18925, "epoch": 450} {"train_loss": -5.11884880065918, "global_step": 18926, "epoch": 450} {"train_loss": -5.354091644287109, "global_step": 18927, "epoch": 450} {"train_loss": -5.182831764221191, "global_step": 18928, "epoch": 450} {"train_loss": -5.175409317016602, "global_step": 18929, "epoch": 450} {"train_loss": -5.252713680267334, "global_step": 18930, "epoch": 450} {"train_loss": -5.31480598449707, "global_step": 18931, "epoch": 450} {"train_loss": -5.2423095703125, "global_step": 18932, "epoch": 450} {"train_loss": -5.346185684204102, "global_step": 18933, "epoch": 450} {"train_loss": -5.431532382965088, "global_step": 18934, "epoch": 450} {"train_loss": -5.178762435913086, "global_step": 18935, "epoch": 450} {"train_loss": -5.2779083251953125, "global_step": 18936, "epoch": 450} {"train_loss": -5.350618362426758, "global_step": 18937, "epoch": 450} {"train_loss": -5.270927429199219, "global_step": 18938, "epoch": 450} {"train_loss": -5.397430896759033, "global_step": 18939, "epoch": 450} {"train_loss": -5.218503475189209, "global_step": 18940, "epoch": 450} {"train_loss": -5.270252852212815, "global_step": 18941, "epoch": 450, "train/sim_max_reward_0": 0.19140185969291962, "train/sim_max_reward_1": 0.03818057007018244, "train/sim_max_reward_2": 0.15136560618071837, "train/sim_max_reward_3": 0.1549121559803521, "train/sim_max_reward_4": 0.298040830122367, "train/sim_max_reward_5": 0.5806250646880464, "test/sim_max_reward_4300000": 0.37539860066426917, "test/sim_max_reward_4300001": 0.11327709552421976, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.27937153809368176, "test/sim_max_reward_4300004": 0.14669857466925312, "test/sim_max_reward_4300005": 0.4265569949493318, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.18883521194361585, "test/sim_max_reward_4300008": 0.42259062261943237, "test/sim_max_reward_4300009": 0.40260928520533823, "test/sim_max_reward_4300010": 0.3704519320599487, "test/sim_max_reward_4300011": 0.27754601573202636, "test/sim_max_reward_4300012": 0.3829803875218628, "test/sim_max_reward_4300013": 0.37930108394783, "test/sim_max_reward_4300014": 0.4031600494677527, "test/sim_max_reward_4300015": 0.265754464364404, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.3469594691935784, "test/sim_max_reward_4300018": 0.0014847533587073602, "test/sim_max_reward_4300019": 0.18559212355227922, "test/sim_max_reward_4300020": 0.07132014387970505, "test/sim_max_reward_4300021": 0.24592966849684234, "test/sim_max_reward_4300022": 0.3436223187657942, "test/sim_max_reward_4300023": 0.31591061215511934, "test/sim_max_reward_4300024": 0.42851611208172335, "test/sim_max_reward_4300025": 0.08926896594497934, "test/sim_max_reward_4300026": 0.472220363215156, "test/sim_max_reward_4300027": 0.272836229996341, "test/sim_max_reward_4300028": 0.18617593168339056, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.24340892104441367, "test/sim_max_reward_4300031": 0.17085448646386833, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.4012453689262033, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.28295660101427333, "test/sim_max_reward_4300037": 0.5527122599440878, "test/sim_max_reward_4300038": 0.3077829756152674, "test/sim_max_reward_4300039": 0.24911456294804254, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.5764476479946988, "test/sim_max_reward_4300043": 0.5831248493137033, "test/sim_max_reward_4300044": 0.06352498797803412, "test/sim_max_reward_4300045": 0.1722033333335087, "test/sim_max_reward_4300046": 0.057935626471608125, "test/sim_max_reward_4300047": 0.5709762221621706, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.18763922875168723, "train/mean_score": 0.23575434778909765, "test/mean_score": 0.2434582860337808, "val_loss": 68437.2890625} {"train_loss": -5.197264194488525, "global_step": 18942, "epoch": 451} {"train_loss": -5.358983993530273, "global_step": 18943, "epoch": 451} {"train_loss": -5.345523357391357, "global_step": 18944, "epoch": 451} {"train_loss": -5.29572057723999, "global_step": 18945, "epoch": 451} {"train_loss": -5.1990203857421875, "global_step": 18946, "epoch": 451} {"train_loss": -5.259754180908203, "global_step": 18947, "epoch": 451} {"train_loss": -5.268405914306641, "global_step": 18948, "epoch": 451} {"train_loss": -5.261940956115723, "global_step": 18949, "epoch": 451} {"train_loss": -5.323145389556885, "global_step": 18950, "epoch": 451} {"train_loss": -5.241264343261719, "global_step": 18951, "epoch": 451} {"train_loss": -5.200504779815674, "global_step": 18952, "epoch": 451} {"train_loss": -5.321290016174316, "global_step": 18953, "epoch": 451} {"train_loss": -5.263594150543213, "global_step": 18954, "epoch": 451} {"train_loss": -5.246271133422852, "global_step": 18955, "epoch": 451} {"train_loss": -5.24588680267334, "global_step": 18956, "epoch": 451} {"train_loss": -5.196512699127197, "global_step": 18957, "epoch": 451} {"train_loss": -5.32555627822876, "global_step": 18958, "epoch": 451} {"train_loss": -5.254138946533203, "global_step": 18959, "epoch": 451} {"train_loss": -5.29189395904541, "global_step": 18960, "epoch": 451} {"train_loss": -5.385200023651123, "global_step": 18961, "epoch": 451} {"train_loss": -5.365243434906006, "global_step": 18962, "epoch": 451} {"train_loss": -5.19499397277832, "global_step": 18963, "epoch": 451} {"train_loss": -5.221329212188721, "global_step": 18964, "epoch": 451} {"train_loss": -5.236432075500488, "global_step": 18965, "epoch": 451} {"train_loss": -5.367704391479492, "global_step": 18966, "epoch": 451} {"train_loss": -5.315900802612305, "global_step": 18967, "epoch": 451} {"train_loss": -5.2855224609375, "global_step": 18968, "epoch": 451} {"train_loss": -5.322428226470947, "global_step": 18969, "epoch": 451} {"train_loss": -5.42274284362793, "global_step": 18970, "epoch": 451} {"train_loss": -5.069765567779541, "global_step": 18971, "epoch": 451} {"train_loss": -5.262408256530762, "global_step": 18972, "epoch": 451} {"train_loss": -5.411843299865723, "global_step": 18973, "epoch": 451} {"train_loss": -5.193633079528809, "global_step": 18974, "epoch": 451} {"train_loss": -5.149463176727295, "global_step": 18975, "epoch": 451} {"train_loss": -5.330905914306641, "global_step": 18976, "epoch": 451} {"train_loss": -5.170856475830078, "global_step": 18977, "epoch": 451} {"train_loss": -5.225958347320557, "global_step": 18978, "epoch": 451} {"train_loss": -5.232458591461182, "global_step": 18979, "epoch": 451} {"train_loss": -5.140227317810059, "global_step": 18980, "epoch": 451} {"train_loss": -5.2509565353393555, "global_step": 18981, "epoch": 451} {"train_loss": -5.229765892028809, "global_step": 18982, "epoch": 451} {"train_loss": -5.266805274145944, "global_step": 18983, "epoch": 451, "val_loss": 68033.8984375} {"train_loss": -5.288280487060547, "global_step": 18984, "epoch": 452} {"train_loss": -5.320097923278809, "global_step": 18985, "epoch": 452} {"train_loss": -5.38121223449707, "global_step": 18986, "epoch": 452} {"train_loss": -5.322113037109375, "global_step": 18987, "epoch": 452} {"train_loss": -5.263399124145508, "global_step": 18988, "epoch": 452} {"train_loss": -5.242406845092773, "global_step": 18989, "epoch": 452} {"train_loss": -5.135109901428223, "global_step": 18990, "epoch": 452} {"train_loss": -5.357631683349609, "global_step": 18991, "epoch": 452} {"train_loss": -5.338286399841309, "global_step": 18992, "epoch": 452} {"train_loss": -5.314404487609863, "global_step": 18993, "epoch": 452} {"train_loss": -5.335296630859375, "global_step": 18994, "epoch": 452} {"train_loss": -5.320138931274414, "global_step": 18995, "epoch": 452} {"train_loss": -5.313076972961426, "global_step": 18996, "epoch": 452} {"train_loss": -5.429189682006836, "global_step": 18997, "epoch": 452} {"train_loss": -5.268477439880371, "global_step": 18998, "epoch": 452} {"train_loss": -5.393180847167969, "global_step": 18999, "epoch": 452} {"train_loss": -5.228623390197754, "global_step": 19000, "epoch": 452} {"train_loss": -5.393579483032227, "global_step": 19001, "epoch": 452} {"train_loss": -5.293182373046875, "global_step": 19002, "epoch": 452} {"train_loss": -5.2234601974487305, "global_step": 19003, "epoch": 452} {"train_loss": -5.377908229827881, "global_step": 19004, "epoch": 452} {"train_loss": -5.188573360443115, "global_step": 19005, "epoch": 452} {"train_loss": -5.334850788116455, "global_step": 19006, "epoch": 452} {"train_loss": -5.227176666259766, "global_step": 19007, "epoch": 452} {"train_loss": -5.343526363372803, "global_step": 19008, "epoch": 452} {"train_loss": -5.2581682205200195, "global_step": 19009, "epoch": 452} {"train_loss": -5.380273342132568, "global_step": 19010, "epoch": 452} {"train_loss": -5.297028541564941, "global_step": 19011, "epoch": 452} {"train_loss": -5.265021800994873, "global_step": 19012, "epoch": 452} {"train_loss": -5.2213568687438965, "global_step": 19013, "epoch": 452} {"train_loss": -5.143231391906738, "global_step": 19014, "epoch": 452} {"train_loss": -5.424211502075195, "global_step": 19015, "epoch": 452} {"train_loss": -5.210182189941406, "global_step": 19016, "epoch": 452} {"train_loss": -5.130558967590332, "global_step": 19017, "epoch": 452} {"train_loss": -5.292652130126953, "global_step": 19018, "epoch": 452} {"train_loss": -5.396932601928711, "global_step": 19019, "epoch": 452} {"train_loss": -5.256823539733887, "global_step": 19020, "epoch": 452} {"train_loss": -5.158184051513672, "global_step": 19021, "epoch": 452} {"train_loss": -5.308082580566406, "global_step": 19022, "epoch": 452} {"train_loss": -5.3071417808532715, "global_step": 19023, "epoch": 452} {"train_loss": -5.248968124389648, "global_step": 19024, "epoch": 452} {"train_loss": -5.291174071175711, "global_step": 19025, "epoch": 452, "val_loss": 67919.1015625} {"train_loss": -5.426872253417969, "global_step": 19026, "epoch": 453} {"train_loss": -5.241646766662598, "global_step": 19027, "epoch": 453} {"train_loss": -5.256085395812988, "global_step": 19028, "epoch": 453} {"train_loss": -5.228279113769531, "global_step": 19029, "epoch": 453} {"train_loss": -5.269218444824219, "global_step": 19030, "epoch": 453} {"train_loss": -5.287867546081543, "global_step": 19031, "epoch": 453} {"train_loss": -5.214607238769531, "global_step": 19032, "epoch": 453} {"train_loss": -5.368419647216797, "global_step": 19033, "epoch": 453} {"train_loss": -5.321995735168457, "global_step": 19034, "epoch": 453} {"train_loss": -5.180569171905518, "global_step": 19035, "epoch": 453} {"train_loss": -5.319604873657227, "global_step": 19036, "epoch": 453} {"train_loss": -5.389161109924316, "global_step": 19037, "epoch": 453} {"train_loss": -5.18981409072876, "global_step": 19038, "epoch": 453} {"train_loss": -5.297285556793213, "global_step": 19039, "epoch": 453} {"train_loss": -5.18147087097168, "global_step": 19040, "epoch": 453} {"train_loss": -5.305070400238037, "global_step": 19041, "epoch": 453} {"train_loss": -5.393303394317627, "global_step": 19042, "epoch": 453} {"train_loss": -5.2532639503479, "global_step": 19043, "epoch": 453} {"train_loss": -5.259953498840332, "global_step": 19044, "epoch": 453} {"train_loss": -5.155575752258301, "global_step": 19045, "epoch": 453} {"train_loss": -5.291775703430176, "global_step": 19046, "epoch": 453} {"train_loss": -5.249987602233887, "global_step": 19047, "epoch": 453} {"train_loss": -5.247806549072266, "global_step": 19048, "epoch": 453} {"train_loss": -5.412225723266602, "global_step": 19049, "epoch": 453} {"train_loss": -5.284526824951172, "global_step": 19050, "epoch": 453} {"train_loss": -5.111609935760498, "global_step": 19051, "epoch": 453} {"train_loss": -5.363761901855469, "global_step": 19052, "epoch": 453} {"train_loss": -5.211176872253418, "global_step": 19053, "epoch": 453} {"train_loss": -5.386529922485352, "global_step": 19054, "epoch": 453} {"train_loss": -5.178830623626709, "global_step": 19055, "epoch": 453} {"train_loss": -5.215877532958984, "global_step": 19056, "epoch": 453} {"train_loss": -5.140700340270996, "global_step": 19057, "epoch": 453} {"train_loss": -5.29704475402832, "global_step": 19058, "epoch": 453} {"train_loss": -5.301640033721924, "global_step": 19059, "epoch": 453} {"train_loss": -5.261692047119141, "global_step": 19060, "epoch": 453} {"train_loss": -5.299338340759277, "global_step": 19061, "epoch": 453} {"train_loss": -5.198486328125, "global_step": 19062, "epoch": 453} {"train_loss": -5.282801628112793, "global_step": 19063, "epoch": 453} {"train_loss": -5.3519511222839355, "global_step": 19064, "epoch": 453} {"train_loss": -5.2982988357543945, "global_step": 19065, "epoch": 453} {"train_loss": -5.421551704406738, "global_step": 19066, "epoch": 453} {"train_loss": -5.279490811484201, "global_step": 19067, "epoch": 453, "val_loss": 68211.375} {"train_loss": -5.315845489501953, "global_step": 19068, "epoch": 454} {"train_loss": -5.260739803314209, "global_step": 19069, "epoch": 454} {"train_loss": -5.351322650909424, "global_step": 19070, "epoch": 454} {"train_loss": -5.364268779754639, "global_step": 19071, "epoch": 454} {"train_loss": -5.174588203430176, "global_step": 19072, "epoch": 454} {"train_loss": -5.366306304931641, "global_step": 19073, "epoch": 454} {"train_loss": -5.3338847160339355, "global_step": 19074, "epoch": 454} {"train_loss": -5.24485969543457, "global_step": 19075, "epoch": 454} {"train_loss": -5.2852396965026855, "global_step": 19076, "epoch": 454} {"train_loss": -5.311740875244141, "global_step": 19077, "epoch": 454} {"train_loss": -5.267519950866699, "global_step": 19078, "epoch": 454} {"train_loss": -5.3605241775512695, "global_step": 19079, "epoch": 454} {"train_loss": -5.391796588897705, "global_step": 19080, "epoch": 454} {"train_loss": -5.104691028594971, "global_step": 19081, "epoch": 454} {"train_loss": -5.251053333282471, "global_step": 19082, "epoch": 454} {"train_loss": -5.225808143615723, "global_step": 19083, "epoch": 454} {"train_loss": -5.327496528625488, "global_step": 19084, "epoch": 454} {"train_loss": -5.1718268394470215, "global_step": 19085, "epoch": 454} {"train_loss": -5.186005592346191, "global_step": 19086, "epoch": 454} {"train_loss": -5.287322044372559, "global_step": 19087, "epoch": 454} {"train_loss": -5.067998886108398, "global_step": 19088, "epoch": 454} {"train_loss": -5.29343318939209, "global_step": 19089, "epoch": 454} {"train_loss": -5.291895866394043, "global_step": 19090, "epoch": 454} {"train_loss": -5.132716178894043, "global_step": 19091, "epoch": 454} {"train_loss": -5.238157749176025, "global_step": 19092, "epoch": 454} {"train_loss": -5.2609076499938965, "global_step": 19093, "epoch": 454} {"train_loss": -5.16419792175293, "global_step": 19094, "epoch": 454} {"train_loss": -5.226236343383789, "global_step": 19095, "epoch": 454} {"train_loss": -5.265320301055908, "global_step": 19096, "epoch": 454} {"train_loss": -5.232778549194336, "global_step": 19097, "epoch": 454} {"train_loss": -5.306201934814453, "global_step": 19098, "epoch": 454} {"train_loss": -5.241218566894531, "global_step": 19099, "epoch": 454} {"train_loss": -5.328095436096191, "global_step": 19100, "epoch": 454} {"train_loss": -5.330185413360596, "global_step": 19101, "epoch": 454} {"train_loss": -5.296182632446289, "global_step": 19102, "epoch": 454} {"train_loss": -5.340419292449951, "global_step": 19103, "epoch": 454} {"train_loss": -5.340672492980957, "global_step": 19104, "epoch": 454} {"train_loss": -5.156830787658691, "global_step": 19105, "epoch": 454} {"train_loss": -5.207264423370361, "global_step": 19106, "epoch": 454} {"train_loss": -5.174081325531006, "global_step": 19107, "epoch": 454} {"train_loss": -5.419759750366211, "global_step": 19108, "epoch": 454} {"train_loss": -5.268809863499233, "global_step": 19109, "epoch": 454, "val_loss": 68141.140625} {"train_loss": -5.292795658111572, "global_step": 19110, "epoch": 455} {"train_loss": -5.349063873291016, "global_step": 19111, "epoch": 455} {"train_loss": -5.276850700378418, "global_step": 19112, "epoch": 455} {"train_loss": -5.428428649902344, "global_step": 19113, "epoch": 455} {"train_loss": -5.376041412353516, "global_step": 19114, "epoch": 455} {"train_loss": -5.108412265777588, "global_step": 19115, "epoch": 455} {"train_loss": -5.411861419677734, "global_step": 19116, "epoch": 455} {"train_loss": -5.2581071853637695, "global_step": 19117, "epoch": 455} {"train_loss": -5.389842510223389, "global_step": 19118, "epoch": 455} {"train_loss": -5.296958923339844, "global_step": 19119, "epoch": 455} {"train_loss": -5.402570724487305, "global_step": 19120, "epoch": 455} {"train_loss": -5.24785852432251, "global_step": 19121, "epoch": 455} {"train_loss": -5.286421298980713, "global_step": 19122, "epoch": 455} {"train_loss": -5.268142223358154, "global_step": 19123, "epoch": 455} {"train_loss": -5.349822521209717, "global_step": 19124, "epoch": 455} {"train_loss": -5.305839538574219, "global_step": 19125, "epoch": 455} {"train_loss": -5.394124507904053, "global_step": 19126, "epoch": 455} {"train_loss": -5.308464527130127, "global_step": 19127, "epoch": 455} {"train_loss": -5.311660289764404, "global_step": 19128, "epoch": 455} {"train_loss": -5.161121845245361, "global_step": 19129, "epoch": 455} {"train_loss": -5.278343200683594, "global_step": 19130, "epoch": 455} {"train_loss": -5.2690582275390625, "global_step": 19131, "epoch": 455} {"train_loss": -5.298029899597168, "global_step": 19132, "epoch": 455} {"train_loss": -5.172423362731934, "global_step": 19133, "epoch": 455} {"train_loss": -5.346541404724121, "global_step": 19134, "epoch": 455} {"train_loss": -5.261407852172852, "global_step": 19135, "epoch": 455} {"train_loss": -5.292015075683594, "global_step": 19136, "epoch": 455} {"train_loss": -5.269972801208496, "global_step": 19137, "epoch": 455} {"train_loss": -5.455143928527832, "global_step": 19138, "epoch": 455} {"train_loss": -5.1889519691467285, "global_step": 19139, "epoch": 455} {"train_loss": -5.215786457061768, "global_step": 19140, "epoch": 455} {"train_loss": -5.202993392944336, "global_step": 19141, "epoch": 455} {"train_loss": -5.158988952636719, "global_step": 19142, "epoch": 455} {"train_loss": -5.397464752197266, "global_step": 19143, "epoch": 455} {"train_loss": -5.32021427154541, "global_step": 19144, "epoch": 455} {"train_loss": -5.1171159744262695, "global_step": 19145, "epoch": 455} {"train_loss": -5.31934118270874, "global_step": 19146, "epoch": 455} {"train_loss": -5.256058692932129, "global_step": 19147, "epoch": 455} {"train_loss": -5.144640922546387, "global_step": 19148, "epoch": 455} {"train_loss": -5.250828742980957, "global_step": 19149, "epoch": 455} {"train_loss": -5.575977325439453, "global_step": 19150, "epoch": 455} {"train_loss": -5.290175437927246, "global_step": 19151, "epoch": 455, "val_loss": 67831.328125} {"train_loss": -5.2848029136657715, "global_step": 19152, "epoch": 456} {"train_loss": -5.306687831878662, "global_step": 19153, "epoch": 456} {"train_loss": -5.095616340637207, "global_step": 19154, "epoch": 456} {"train_loss": -5.375433921813965, "global_step": 19155, "epoch": 456} {"train_loss": -5.343288421630859, "global_step": 19156, "epoch": 456} {"train_loss": -5.188487529754639, "global_step": 19157, "epoch": 456} {"train_loss": -5.315968036651611, "global_step": 19158, "epoch": 456} {"train_loss": -5.221507549285889, "global_step": 19159, "epoch": 456} {"train_loss": -5.290973663330078, "global_step": 19160, "epoch": 456} {"train_loss": -5.336392402648926, "global_step": 19161, "epoch": 456} {"train_loss": -5.313974857330322, "global_step": 19162, "epoch": 456} {"train_loss": -5.335395336151123, "global_step": 19163, "epoch": 456} {"train_loss": -5.336148262023926, "global_step": 19164, "epoch": 456} {"train_loss": -5.350561141967773, "global_step": 19165, "epoch": 456} {"train_loss": -5.368395805358887, "global_step": 19166, "epoch": 456} {"train_loss": -5.206259727478027, "global_step": 19167, "epoch": 456} {"train_loss": -5.2542314529418945, "global_step": 19168, "epoch": 456} {"train_loss": -5.415622711181641, "global_step": 19169, "epoch": 456} {"train_loss": -5.390787124633789, "global_step": 19170, "epoch": 456} {"train_loss": -5.141591548919678, "global_step": 19171, "epoch": 456} {"train_loss": -5.274823188781738, "global_step": 19172, "epoch": 456} {"train_loss": -5.165256500244141, "global_step": 19173, "epoch": 456} {"train_loss": -5.119935989379883, "global_step": 19174, "epoch": 456} {"train_loss": -5.116316318511963, "global_step": 19175, "epoch": 456} {"train_loss": -5.3345441818237305, "global_step": 19176, "epoch": 456} {"train_loss": -5.115185737609863, "global_step": 19177, "epoch": 456} {"train_loss": -5.196735858917236, "global_step": 19178, "epoch": 456} {"train_loss": -5.24751091003418, "global_step": 19179, "epoch": 456} {"train_loss": -5.202474594116211, "global_step": 19180, "epoch": 456} {"train_loss": -5.322144031524658, "global_step": 19181, "epoch": 456} {"train_loss": -5.141383171081543, "global_step": 19182, "epoch": 456} {"train_loss": -5.26052188873291, "global_step": 19183, "epoch": 456} {"train_loss": -5.338268756866455, "global_step": 19184, "epoch": 456} {"train_loss": -5.245703220367432, "global_step": 19185, "epoch": 456} {"train_loss": -5.321754455566406, "global_step": 19186, "epoch": 456} {"train_loss": -5.251704216003418, "global_step": 19187, "epoch": 456} {"train_loss": -5.313292503356934, "global_step": 19188, "epoch": 456} {"train_loss": -5.38800573348999, "global_step": 19189, "epoch": 456} {"train_loss": -5.300052642822266, "global_step": 19190, "epoch": 456} {"train_loss": -5.260443687438965, "global_step": 19191, "epoch": 456} {"train_loss": -5.286712169647217, "global_step": 19192, "epoch": 456} {"train_loss": -5.269717114312308, "global_step": 19193, "epoch": 456, "val_loss": 68059.9921875} {"train_loss": -5.281429290771484, "global_step": 19194, "epoch": 457} {"train_loss": -5.318150043487549, "global_step": 19195, "epoch": 457} {"train_loss": -5.2766804695129395, "global_step": 19196, "epoch": 457} {"train_loss": -5.309601783752441, "global_step": 19197, "epoch": 457} {"train_loss": -5.234038352966309, "global_step": 19198, "epoch": 457} {"train_loss": -5.222970485687256, "global_step": 19199, "epoch": 457} {"train_loss": -5.258233547210693, "global_step": 19200, "epoch": 457} {"train_loss": -5.174221992492676, "global_step": 19201, "epoch": 457} {"train_loss": -5.278608798980713, "global_step": 19202, "epoch": 457} {"train_loss": -5.3693437576293945, "global_step": 19203, "epoch": 457} {"train_loss": -5.191901683807373, "global_step": 19204, "epoch": 457} {"train_loss": -5.229975700378418, "global_step": 19205, "epoch": 457} {"train_loss": -5.2267961502075195, "global_step": 19206, "epoch": 457} {"train_loss": -5.377669334411621, "global_step": 19207, "epoch": 457} {"train_loss": -5.025599956512451, "global_step": 19208, "epoch": 457} {"train_loss": -5.209741592407227, "global_step": 19209, "epoch": 457} {"train_loss": -5.281991958618164, "global_step": 19210, "epoch": 457} {"train_loss": -5.146119117736816, "global_step": 19211, "epoch": 457} {"train_loss": -5.27260684967041, "global_step": 19212, "epoch": 457} {"train_loss": -5.3243303298950195, "global_step": 19213, "epoch": 457} {"train_loss": -5.3381266593933105, "global_step": 19214, "epoch": 457} {"train_loss": -5.082840919494629, "global_step": 19215, "epoch": 457} {"train_loss": -5.231198310852051, "global_step": 19216, "epoch": 457} {"train_loss": -5.252704620361328, "global_step": 19217, "epoch": 457} {"train_loss": -5.321941375732422, "global_step": 19218, "epoch": 457} {"train_loss": -5.410560607910156, "global_step": 19219, "epoch": 457} {"train_loss": -5.235236644744873, "global_step": 19220, "epoch": 457} {"train_loss": -5.26027774810791, "global_step": 19221, "epoch": 457} {"train_loss": -5.257729530334473, "global_step": 19222, "epoch": 457} {"train_loss": -5.381899356842041, "global_step": 19223, "epoch": 457} {"train_loss": -5.349689960479736, "global_step": 19224, "epoch": 457} {"train_loss": -5.342155456542969, "global_step": 19225, "epoch": 457} {"train_loss": -5.300911903381348, "global_step": 19226, "epoch": 457} {"train_loss": -5.222841262817383, "global_step": 19227, "epoch": 457} {"train_loss": -5.213672637939453, "global_step": 19228, "epoch": 457} {"train_loss": -5.205238342285156, "global_step": 19229, "epoch": 457} {"train_loss": -5.381364822387695, "global_step": 19230, "epoch": 457} {"train_loss": -5.222327709197998, "global_step": 19231, "epoch": 457} {"train_loss": -5.317933559417725, "global_step": 19232, "epoch": 457} {"train_loss": -5.18405818939209, "global_step": 19233, "epoch": 457} {"train_loss": -5.218395233154297, "global_step": 19234, "epoch": 457} {"train_loss": -5.2647070089976, "global_step": 19235, "epoch": 457, "val_loss": 68782.875} {"train_loss": -5.057711601257324, "global_step": 19236, "epoch": 458} {"train_loss": -5.351740837097168, "global_step": 19237, "epoch": 458} {"train_loss": -5.297123908996582, "global_step": 19238, "epoch": 458} {"train_loss": -5.180877685546875, "global_step": 19239, "epoch": 458} {"train_loss": -5.234060764312744, "global_step": 19240, "epoch": 458} {"train_loss": -5.1978349685668945, "global_step": 19241, "epoch": 458} {"train_loss": -5.231064319610596, "global_step": 19242, "epoch": 458} {"train_loss": -5.21527099609375, "global_step": 19243, "epoch": 458} {"train_loss": -5.2180891036987305, "global_step": 19244, "epoch": 458} {"train_loss": -5.167158126831055, "global_step": 19245, "epoch": 458} {"train_loss": -5.1834306716918945, "global_step": 19246, "epoch": 458} {"train_loss": -5.135565757751465, "global_step": 19247, "epoch": 458} {"train_loss": -5.15472412109375, "global_step": 19248, "epoch": 458} {"train_loss": -5.23927116394043, "global_step": 19249, "epoch": 458} {"train_loss": -5.065253257751465, "global_step": 19250, "epoch": 458} {"train_loss": -5.222230434417725, "global_step": 19251, "epoch": 458} {"train_loss": -5.285890102386475, "global_step": 19252, "epoch": 458} {"train_loss": -5.169528007507324, "global_step": 19253, "epoch": 458} {"train_loss": -5.200390815734863, "global_step": 19254, "epoch": 458} {"train_loss": -5.344324111938477, "global_step": 19255, "epoch": 458} {"train_loss": -5.343100547790527, "global_step": 19256, "epoch": 458} {"train_loss": -5.154714584350586, "global_step": 19257, "epoch": 458} {"train_loss": -5.4109110832214355, "global_step": 19258, "epoch": 458} {"train_loss": -5.099225997924805, "global_step": 19259, "epoch": 458} {"train_loss": -5.257503509521484, "global_step": 19260, "epoch": 458} {"train_loss": -5.256643772125244, "global_step": 19261, "epoch": 458} {"train_loss": -5.280773162841797, "global_step": 19262, "epoch": 458} {"train_loss": -5.471729278564453, "global_step": 19263, "epoch": 458} {"train_loss": -5.267219066619873, "global_step": 19264, "epoch": 458} {"train_loss": -5.308612823486328, "global_step": 19265, "epoch": 458} {"train_loss": -5.359977722167969, "global_step": 19266, "epoch": 458} {"train_loss": -5.132171630859375, "global_step": 19267, "epoch": 458} {"train_loss": -5.386495113372803, "global_step": 19268, "epoch": 458} {"train_loss": -5.257122993469238, "global_step": 19269, "epoch": 458} {"train_loss": -5.186766147613525, "global_step": 19270, "epoch": 458} {"train_loss": -5.358089447021484, "global_step": 19271, "epoch": 458} {"train_loss": -5.1921844482421875, "global_step": 19272, "epoch": 458} {"train_loss": -5.278320789337158, "global_step": 19273, "epoch": 458} {"train_loss": -5.242404937744141, "global_step": 19274, "epoch": 458} {"train_loss": -5.334637641906738, "global_step": 19275, "epoch": 458} {"train_loss": -5.256153583526611, "global_step": 19276, "epoch": 458} {"train_loss": -5.245475087847028, "global_step": 19277, "epoch": 458, "val_loss": 67873.953125} {"train_loss": -5.266273498535156, "global_step": 19278, "epoch": 459} {"train_loss": -5.228460311889648, "global_step": 19279, "epoch": 459} {"train_loss": -5.298765182495117, "global_step": 19280, "epoch": 459} {"train_loss": -5.365334510803223, "global_step": 19281, "epoch": 459} {"train_loss": -5.2226643562316895, "global_step": 19282, "epoch": 459} {"train_loss": -5.11890172958374, "global_step": 19283, "epoch": 459} {"train_loss": -5.27710485458374, "global_step": 19284, "epoch": 459} {"train_loss": -5.216804504394531, "global_step": 19285, "epoch": 459} {"train_loss": -5.2189435958862305, "global_step": 19286, "epoch": 459} {"train_loss": -5.240784645080566, "global_step": 19287, "epoch": 459} {"train_loss": -5.306851863861084, "global_step": 19288, "epoch": 459} {"train_loss": -5.412107467651367, "global_step": 19289, "epoch": 459} {"train_loss": -5.318501949310303, "global_step": 19290, "epoch": 459} {"train_loss": -5.381204605102539, "global_step": 19291, "epoch": 459} {"train_loss": -5.254208564758301, "global_step": 19292, "epoch": 459} {"train_loss": -5.233165740966797, "global_step": 19293, "epoch": 459} {"train_loss": -5.33640193939209, "global_step": 19294, "epoch": 459} {"train_loss": -5.178587913513184, "global_step": 19295, "epoch": 459} {"train_loss": -5.201482772827148, "global_step": 19296, "epoch": 459} {"train_loss": -5.34890079498291, "global_step": 19297, "epoch": 459} {"train_loss": -5.2740607261657715, "global_step": 19298, "epoch": 459} {"train_loss": -5.237160682678223, "global_step": 19299, "epoch": 459} {"train_loss": -5.0385942459106445, "global_step": 19300, "epoch": 459} {"train_loss": -5.307018756866455, "global_step": 19301, "epoch": 459} {"train_loss": -5.454342842102051, "global_step": 19302, "epoch": 459} {"train_loss": -5.099164009094238, "global_step": 19303, "epoch": 459} {"train_loss": -5.3265275955200195, "global_step": 19304, "epoch": 459} {"train_loss": -5.300936698913574, "global_step": 19305, "epoch": 459} {"train_loss": -5.120683670043945, "global_step": 19306, "epoch": 459} {"train_loss": -5.238464832305908, "global_step": 19307, "epoch": 459} {"train_loss": -5.178359031677246, "global_step": 19308, "epoch": 459} {"train_loss": -5.191621780395508, "global_step": 19309, "epoch": 459} {"train_loss": -5.228357315063477, "global_step": 19310, "epoch": 459} {"train_loss": -5.214661598205566, "global_step": 19311, "epoch": 459} {"train_loss": -5.117494583129883, "global_step": 19312, "epoch": 459} {"train_loss": -5.281582832336426, "global_step": 19313, "epoch": 459} {"train_loss": -5.1032490730285645, "global_step": 19314, "epoch": 459} {"train_loss": -5.311796188354492, "global_step": 19315, "epoch": 459} {"train_loss": -5.270996570587158, "global_step": 19316, "epoch": 459} {"train_loss": -5.191364288330078, "global_step": 19317, "epoch": 459} {"train_loss": -5.251133918762207, "global_step": 19318, "epoch": 459} {"train_loss": -5.245730752036685, "global_step": 19319, "epoch": 459, "val_loss": 68193.1875} {"train_loss": -5.308320999145508, "global_step": 19320, "epoch": 460} {"train_loss": -5.124197959899902, "global_step": 19321, "epoch": 460} {"train_loss": -5.193716049194336, "global_step": 19322, "epoch": 460} {"train_loss": -5.4156599044799805, "global_step": 19323, "epoch": 460} {"train_loss": -5.230475425720215, "global_step": 19324, "epoch": 460} {"train_loss": -5.331738471984863, "global_step": 19325, "epoch": 460} {"train_loss": -5.319565296173096, "global_step": 19326, "epoch": 460} {"train_loss": -5.288502216339111, "global_step": 19327, "epoch": 460} {"train_loss": -5.411327838897705, "global_step": 19328, "epoch": 460} {"train_loss": -5.241843223571777, "global_step": 19329, "epoch": 460} {"train_loss": -5.266049385070801, "global_step": 19330, "epoch": 460} {"train_loss": -5.402588844299316, "global_step": 19331, "epoch": 460} {"train_loss": -5.383138179779053, "global_step": 19332, "epoch": 460} {"train_loss": -5.329951763153076, "global_step": 19333, "epoch": 460} {"train_loss": -5.312222480773926, "global_step": 19334, "epoch": 460} {"train_loss": -5.325389385223389, "global_step": 19335, "epoch": 460} {"train_loss": -5.323663234710693, "global_step": 19336, "epoch": 460} {"train_loss": -5.392995357513428, "global_step": 19337, "epoch": 460} {"train_loss": -5.422272682189941, "global_step": 19338, "epoch": 460} {"train_loss": -5.314305305480957, "global_step": 19339, "epoch": 460} {"train_loss": -5.185976982116699, "global_step": 19340, "epoch": 460} {"train_loss": -5.42380428314209, "global_step": 19341, "epoch": 460} {"train_loss": -5.163699626922607, "global_step": 19342, "epoch": 460} {"train_loss": -5.315868377685547, "global_step": 19343, "epoch": 460} {"train_loss": -5.274471282958984, "global_step": 19344, "epoch": 460} {"train_loss": -5.240581035614014, "global_step": 19345, "epoch": 460} {"train_loss": -5.18822717666626, "global_step": 19346, "epoch": 460} {"train_loss": -5.13322639465332, "global_step": 19347, "epoch": 460} {"train_loss": -5.215200901031494, "global_step": 19348, "epoch": 460} {"train_loss": -5.205192565917969, "global_step": 19349, "epoch": 460} {"train_loss": -5.308943748474121, "global_step": 19350, "epoch": 460} {"train_loss": -5.273219585418701, "global_step": 19351, "epoch": 460} {"train_loss": -5.162519454956055, "global_step": 19352, "epoch": 460} {"train_loss": -5.236844062805176, "global_step": 19353, "epoch": 460} {"train_loss": -5.195279121398926, "global_step": 19354, "epoch": 460} {"train_loss": -5.374917030334473, "global_step": 19355, "epoch": 460} {"train_loss": -5.363487243652344, "global_step": 19356, "epoch": 460} {"train_loss": -5.249644756317139, "global_step": 19357, "epoch": 460} {"train_loss": -5.30940055847168, "global_step": 19358, "epoch": 460} {"train_loss": -5.404366493225098, "global_step": 19359, "epoch": 460} {"train_loss": -5.106534957885742, "global_step": 19360, "epoch": 460} {"train_loss": -5.284424634206863, "global_step": 19361, "epoch": 460, "val_loss": 67870.0} {"train_loss": -5.262521266937256, "global_step": 19362, "epoch": 461} {"train_loss": -5.195847511291504, "global_step": 19363, "epoch": 461} {"train_loss": -5.181967735290527, "global_step": 19364, "epoch": 461} {"train_loss": -5.355096340179443, "global_step": 19365, "epoch": 461} {"train_loss": -5.148025989532471, "global_step": 19366, "epoch": 461} {"train_loss": -5.203017234802246, "global_step": 19367, "epoch": 461} {"train_loss": -5.404568672180176, "global_step": 19368, "epoch": 461} {"train_loss": -5.287336826324463, "global_step": 19369, "epoch": 461} {"train_loss": -5.241010665893555, "global_step": 19370, "epoch": 461} {"train_loss": -5.299378395080566, "global_step": 19371, "epoch": 461} {"train_loss": -5.31257438659668, "global_step": 19372, "epoch": 461} {"train_loss": -5.210062026977539, "global_step": 19373, "epoch": 461} {"train_loss": -5.112072944641113, "global_step": 19374, "epoch": 461} {"train_loss": -5.262208461761475, "global_step": 19375, "epoch": 461} {"train_loss": -5.298801422119141, "global_step": 19376, "epoch": 461} {"train_loss": -5.270113468170166, "global_step": 19377, "epoch": 461} {"train_loss": -5.238614082336426, "global_step": 19378, "epoch": 461} {"train_loss": -5.330819129943848, "global_step": 19379, "epoch": 461} {"train_loss": -5.284488677978516, "global_step": 19380, "epoch": 461} {"train_loss": -5.269445419311523, "global_step": 19381, "epoch": 461} {"train_loss": -5.376257419586182, "global_step": 19382, "epoch": 461} {"train_loss": -5.3491973876953125, "global_step": 19383, "epoch": 461} {"train_loss": -5.363180637359619, "global_step": 19384, "epoch": 461} {"train_loss": -5.358750343322754, "global_step": 19385, "epoch": 461} {"train_loss": -5.248009204864502, "global_step": 19386, "epoch": 461} {"train_loss": -5.126511096954346, "global_step": 19387, "epoch": 461} {"train_loss": -5.298366546630859, "global_step": 19388, "epoch": 461} {"train_loss": -5.3933916091918945, "global_step": 19389, "epoch": 461} {"train_loss": -5.305510520935059, "global_step": 19390, "epoch": 461} {"train_loss": -5.22946834564209, "global_step": 19391, "epoch": 461} {"train_loss": -5.19444465637207, "global_step": 19392, "epoch": 461} {"train_loss": -5.260439872741699, "global_step": 19393, "epoch": 461} {"train_loss": -5.202666759490967, "global_step": 19394, "epoch": 461} {"train_loss": -5.367424964904785, "global_step": 19395, "epoch": 461} {"train_loss": -5.238775253295898, "global_step": 19396, "epoch": 461} {"train_loss": -5.200891971588135, "global_step": 19397, "epoch": 461} {"train_loss": -5.233665466308594, "global_step": 19398, "epoch": 461} {"train_loss": -5.264966011047363, "global_step": 19399, "epoch": 461} {"train_loss": -5.105136871337891, "global_step": 19400, "epoch": 461} {"train_loss": -5.266493797302246, "global_step": 19401, "epoch": 461} {"train_loss": -5.152053356170654, "global_step": 19402, "epoch": 461} {"train_loss": -5.2610435372307185, "global_step": 19403, "epoch": 461, "val_loss": 67812.859375} {"train_loss": -5.115670680999756, "global_step": 19404, "epoch": 462} {"train_loss": -5.289153099060059, "global_step": 19405, "epoch": 462} {"train_loss": -5.16873025894165, "global_step": 19406, "epoch": 462} {"train_loss": -5.2636237144470215, "global_step": 19407, "epoch": 462} {"train_loss": -5.220333099365234, "global_step": 19408, "epoch": 462} {"train_loss": -5.2811713218688965, "global_step": 19409, "epoch": 462} {"train_loss": -5.415292739868164, "global_step": 19410, "epoch": 462} {"train_loss": -5.110634803771973, "global_step": 19411, "epoch": 462} {"train_loss": -5.276561737060547, "global_step": 19412, "epoch": 462} {"train_loss": -5.245762348175049, "global_step": 19413, "epoch": 462} {"train_loss": -5.131762504577637, "global_step": 19414, "epoch": 462} {"train_loss": -5.35210657119751, "global_step": 19415, "epoch": 462} {"train_loss": -5.241096496582031, "global_step": 19416, "epoch": 462} {"train_loss": -5.133853912353516, "global_step": 19417, "epoch": 462} {"train_loss": -5.264125823974609, "global_step": 19418, "epoch": 462} {"train_loss": -5.234269142150879, "global_step": 19419, "epoch": 462} {"train_loss": -5.1856818199157715, "global_step": 19420, "epoch": 462} {"train_loss": -5.4120683670043945, "global_step": 19421, "epoch": 462} {"train_loss": -5.499833106994629, "global_step": 19422, "epoch": 462} {"train_loss": -5.195535659790039, "global_step": 19423, "epoch": 462} {"train_loss": -5.226616859436035, "global_step": 19424, "epoch": 462} {"train_loss": -5.280940055847168, "global_step": 19425, "epoch": 462} {"train_loss": -5.24085807800293, "global_step": 19426, "epoch": 462} {"train_loss": -5.320113182067871, "global_step": 19427, "epoch": 462} {"train_loss": -5.383660316467285, "global_step": 19428, "epoch": 462} {"train_loss": -5.364805698394775, "global_step": 19429, "epoch": 462} {"train_loss": -5.415445804595947, "global_step": 19430, "epoch": 462} {"train_loss": -5.2010345458984375, "global_step": 19431, "epoch": 462} {"train_loss": -5.2546186447143555, "global_step": 19432, "epoch": 462} {"train_loss": -5.354900360107422, "global_step": 19433, "epoch": 462} {"train_loss": -5.319878101348877, "global_step": 19434, "epoch": 462} {"train_loss": -5.480012893676758, "global_step": 19435, "epoch": 462} {"train_loss": -5.281922340393066, "global_step": 19436, "epoch": 462} {"train_loss": -5.354719161987305, "global_step": 19437, "epoch": 462} {"train_loss": -5.282260894775391, "global_step": 19438, "epoch": 462} {"train_loss": -5.306769371032715, "global_step": 19439, "epoch": 462} {"train_loss": -5.451725959777832, "global_step": 19440, "epoch": 462} {"train_loss": -5.254962921142578, "global_step": 19441, "epoch": 462} {"train_loss": -5.2686052322387695, "global_step": 19442, "epoch": 462} {"train_loss": -5.263277053833008, "global_step": 19443, "epoch": 462} {"train_loss": -5.329165458679199, "global_step": 19444, "epoch": 462} {"train_loss": -5.282452787671771, "global_step": 19445, "epoch": 462, "val_loss": 68563.7734375} {"train_loss": -5.198627948760986, "global_step": 19446, "epoch": 463} {"train_loss": -5.156973361968994, "global_step": 19447, "epoch": 463} {"train_loss": -5.127115726470947, "global_step": 19448, "epoch": 463} {"train_loss": -5.257080078125, "global_step": 19449, "epoch": 463} {"train_loss": -5.358282566070557, "global_step": 19450, "epoch": 463} {"train_loss": -5.130784034729004, "global_step": 19451, "epoch": 463} {"train_loss": -5.325902938842773, "global_step": 19452, "epoch": 463} {"train_loss": -5.441411972045898, "global_step": 19453, "epoch": 463} {"train_loss": -5.407553672790527, "global_step": 19454, "epoch": 463} {"train_loss": -5.304234981536865, "global_step": 19455, "epoch": 463} {"train_loss": -5.277454376220703, "global_step": 19456, "epoch": 463} {"train_loss": -5.279726028442383, "global_step": 19457, "epoch": 463} {"train_loss": -5.321372985839844, "global_step": 19458, "epoch": 463} {"train_loss": -5.273963451385498, "global_step": 19459, "epoch": 463} {"train_loss": -5.2033867835998535, "global_step": 19460, "epoch": 463} {"train_loss": -5.2072906494140625, "global_step": 19461, "epoch": 463} {"train_loss": -5.464512825012207, "global_step": 19462, "epoch": 463} {"train_loss": -5.221493721008301, "global_step": 19463, "epoch": 463} {"train_loss": -5.219480514526367, "global_step": 19464, "epoch": 463} {"train_loss": -5.234673500061035, "global_step": 19465, "epoch": 463} {"train_loss": -5.24635124206543, "global_step": 19466, "epoch": 463} {"train_loss": -5.197671890258789, "global_step": 19467, "epoch": 463} {"train_loss": -5.277609348297119, "global_step": 19468, "epoch": 463} {"train_loss": -5.282891273498535, "global_step": 19469, "epoch": 463} {"train_loss": -5.252834320068359, "global_step": 19470, "epoch": 463} {"train_loss": -5.388737201690674, "global_step": 19471, "epoch": 463} {"train_loss": -5.257412433624268, "global_step": 19472, "epoch": 463} {"train_loss": -5.317727088928223, "global_step": 19473, "epoch": 463} {"train_loss": -5.379549980163574, "global_step": 19474, "epoch": 463} {"train_loss": -5.353901386260986, "global_step": 19475, "epoch": 463} {"train_loss": -5.268756866455078, "global_step": 19476, "epoch": 463} {"train_loss": -5.2862348556518555, "global_step": 19477, "epoch": 463} {"train_loss": -5.257072448730469, "global_step": 19478, "epoch": 463} {"train_loss": -5.276890754699707, "global_step": 19479, "epoch": 463} {"train_loss": -5.353150367736816, "global_step": 19480, "epoch": 463} {"train_loss": -5.379264831542969, "global_step": 19481, "epoch": 463} {"train_loss": -5.246850490570068, "global_step": 19482, "epoch": 463} {"train_loss": -5.295548915863037, "global_step": 19483, "epoch": 463} {"train_loss": -5.343658447265625, "global_step": 19484, "epoch": 463} {"train_loss": -5.249667167663574, "global_step": 19485, "epoch": 463} {"train_loss": -5.303288459777832, "global_step": 19486, "epoch": 463} {"train_loss": -5.282735097975958, "global_step": 19487, "epoch": 463, "val_loss": 67810.71875} {"train_loss": -5.445397853851318, "global_step": 19488, "epoch": 464} {"train_loss": -5.349187850952148, "global_step": 19489, "epoch": 464} {"train_loss": -5.3766608238220215, "global_step": 19490, "epoch": 464} {"train_loss": -5.349440574645996, "global_step": 19491, "epoch": 464} {"train_loss": -5.29263162612915, "global_step": 19492, "epoch": 464} {"train_loss": -5.406071186065674, "global_step": 19493, "epoch": 464} {"train_loss": -5.306319713592529, "global_step": 19494, "epoch": 464} {"train_loss": -5.178346633911133, "global_step": 19495, "epoch": 464} {"train_loss": -5.260077476501465, "global_step": 19496, "epoch": 464} {"train_loss": -5.348746299743652, "global_step": 19497, "epoch": 464} {"train_loss": -5.281789779663086, "global_step": 19498, "epoch": 464} {"train_loss": -5.344663619995117, "global_step": 19499, "epoch": 464} {"train_loss": -5.180073261260986, "global_step": 19500, "epoch": 464} {"train_loss": -5.2323760986328125, "global_step": 19501, "epoch": 464} {"train_loss": -5.1423234939575195, "global_step": 19502, "epoch": 464} {"train_loss": -5.156420707702637, "global_step": 19503, "epoch": 464} {"train_loss": -5.378615379333496, "global_step": 19504, "epoch": 464} {"train_loss": -5.2055206298828125, "global_step": 19505, "epoch": 464} {"train_loss": -5.2035627365112305, "global_step": 19506, "epoch": 464} {"train_loss": -5.27182674407959, "global_step": 19507, "epoch": 464} {"train_loss": -5.367469787597656, "global_step": 19508, "epoch": 464} {"train_loss": -5.345236301422119, "global_step": 19509, "epoch": 464} {"train_loss": -5.389311790466309, "global_step": 19510, "epoch": 464} {"train_loss": -5.320651531219482, "global_step": 19511, "epoch": 464} {"train_loss": -5.320981025695801, "global_step": 19512, "epoch": 464} {"train_loss": -5.24050235748291, "global_step": 19513, "epoch": 464} {"train_loss": -5.31356143951416, "global_step": 19514, "epoch": 464} {"train_loss": -5.255892753601074, "global_step": 19515, "epoch": 464} {"train_loss": -5.273584365844727, "global_step": 19516, "epoch": 464} {"train_loss": -5.194399356842041, "global_step": 19517, "epoch": 464} {"train_loss": -5.2526140213012695, "global_step": 19518, "epoch": 464} {"train_loss": -5.247262001037598, "global_step": 19519, "epoch": 464} {"train_loss": -5.236374855041504, "global_step": 19520, "epoch": 464} {"train_loss": -5.246599197387695, "global_step": 19521, "epoch": 464} {"train_loss": -5.2676849365234375, "global_step": 19522, "epoch": 464} {"train_loss": -5.3122944831848145, "global_step": 19523, "epoch": 464} {"train_loss": -5.206218242645264, "global_step": 19524, "epoch": 464} {"train_loss": -5.440306663513184, "global_step": 19525, "epoch": 464} {"train_loss": -5.307088375091553, "global_step": 19526, "epoch": 464} {"train_loss": -5.344414234161377, "global_step": 19527, "epoch": 464} {"train_loss": -5.208003520965576, "global_step": 19528, "epoch": 464} {"train_loss": -5.2891993182046075, "global_step": 19529, "epoch": 464, "val_loss": 67598.3046875} {"train_loss": -5.461493968963623, "global_step": 19530, "epoch": 465} {"train_loss": -5.289801597595215, "global_step": 19531, "epoch": 465} {"train_loss": -5.242956161499023, "global_step": 19532, "epoch": 465} {"train_loss": -5.348665237426758, "global_step": 19533, "epoch": 465} {"train_loss": -5.293126583099365, "global_step": 19534, "epoch": 465} {"train_loss": -5.267786502838135, "global_step": 19535, "epoch": 465} {"train_loss": -5.30938196182251, "global_step": 19536, "epoch": 465} {"train_loss": -5.307713508605957, "global_step": 19537, "epoch": 465} {"train_loss": -5.206249237060547, "global_step": 19538, "epoch": 465} {"train_loss": -5.335972785949707, "global_step": 19539, "epoch": 465} {"train_loss": -5.413336277008057, "global_step": 19540, "epoch": 465} {"train_loss": -5.416120529174805, "global_step": 19541, "epoch": 465} {"train_loss": -5.334726810455322, "global_step": 19542, "epoch": 465} {"train_loss": -5.2446722984313965, "global_step": 19543, "epoch": 465} {"train_loss": -5.283026695251465, "global_step": 19544, "epoch": 465} {"train_loss": -5.403677463531494, "global_step": 19545, "epoch": 465} {"train_loss": -5.159070014953613, "global_step": 19546, "epoch": 465} {"train_loss": -5.1648969650268555, "global_step": 19547, "epoch": 465} {"train_loss": -5.347028732299805, "global_step": 19548, "epoch": 465} {"train_loss": -5.087271213531494, "global_step": 19549, "epoch": 465} {"train_loss": -5.22784423828125, "global_step": 19550, "epoch": 465} {"train_loss": -5.199152946472168, "global_step": 19551, "epoch": 465} {"train_loss": -5.085270881652832, "global_step": 19552, "epoch": 465} {"train_loss": -5.249989032745361, "global_step": 19553, "epoch": 465} {"train_loss": -5.032557964324951, "global_step": 19554, "epoch": 465} {"train_loss": -5.13402795791626, "global_step": 19555, "epoch": 465} {"train_loss": -5.182702541351318, "global_step": 19556, "epoch": 465} {"train_loss": -4.906200408935547, "global_step": 19557, "epoch": 465} {"train_loss": -5.269351005554199, "global_step": 19558, "epoch": 465} {"train_loss": -5.143074989318848, "global_step": 19559, "epoch": 465} {"train_loss": -5.2242889404296875, "global_step": 19560, "epoch": 465} {"train_loss": -5.2061448097229, "global_step": 19561, "epoch": 465} {"train_loss": -5.234586715698242, "global_step": 19562, "epoch": 465} {"train_loss": -5.2570414543151855, "global_step": 19563, "epoch": 465} {"train_loss": -5.327325820922852, "global_step": 19564, "epoch": 465} {"train_loss": -5.269627094268799, "global_step": 19565, "epoch": 465} {"train_loss": -5.226969242095947, "global_step": 19566, "epoch": 465} {"train_loss": -5.291971206665039, "global_step": 19567, "epoch": 465} {"train_loss": -5.413055419921875, "global_step": 19568, "epoch": 465} {"train_loss": -5.3788981437683105, "global_step": 19569, "epoch": 465} {"train_loss": -5.296245574951172, "global_step": 19570, "epoch": 465} {"train_loss": -5.256335247130621, "global_step": 19571, "epoch": 465, "val_loss": 67757.8046875} {"train_loss": -5.328197479248047, "global_step": 19572, "epoch": 466} {"train_loss": -5.213724613189697, "global_step": 19573, "epoch": 466} {"train_loss": -5.215221405029297, "global_step": 19574, "epoch": 466} {"train_loss": -5.3962554931640625, "global_step": 19575, "epoch": 466} {"train_loss": -5.181840896606445, "global_step": 19576, "epoch": 466} {"train_loss": -5.123794078826904, "global_step": 19577, "epoch": 466} {"train_loss": -5.264278411865234, "global_step": 19578, "epoch": 466} {"train_loss": -5.371969223022461, "global_step": 19579, "epoch": 466} {"train_loss": -5.144863128662109, "global_step": 19580, "epoch": 466} {"train_loss": -5.274449348449707, "global_step": 19581, "epoch": 466} {"train_loss": -5.172694206237793, "global_step": 19582, "epoch": 466} {"train_loss": -5.354974746704102, "global_step": 19583, "epoch": 466} {"train_loss": -5.232797145843506, "global_step": 19584, "epoch": 466} {"train_loss": -5.059338092803955, "global_step": 19585, "epoch": 466} {"train_loss": -5.335630416870117, "global_step": 19586, "epoch": 466} {"train_loss": -5.218417644500732, "global_step": 19587, "epoch": 466} {"train_loss": -5.127849578857422, "global_step": 19588, "epoch": 466} {"train_loss": -5.321215629577637, "global_step": 19589, "epoch": 466} {"train_loss": -5.25905704498291, "global_step": 19590, "epoch": 466} {"train_loss": -5.332987308502197, "global_step": 19591, "epoch": 466} {"train_loss": -5.173832416534424, "global_step": 19592, "epoch": 466} {"train_loss": -5.070549011230469, "global_step": 19593, "epoch": 466} {"train_loss": -5.297353744506836, "global_step": 19594, "epoch": 466} {"train_loss": -5.169245719909668, "global_step": 19595, "epoch": 466} {"train_loss": -5.055806636810303, "global_step": 19596, "epoch": 466} {"train_loss": -5.3740997314453125, "global_step": 19597, "epoch": 466} {"train_loss": -5.245706558227539, "global_step": 19598, "epoch": 466} {"train_loss": -5.212244033813477, "global_step": 19599, "epoch": 466} {"train_loss": -5.157619476318359, "global_step": 19600, "epoch": 466} {"train_loss": -5.164305686950684, "global_step": 19601, "epoch": 466} {"train_loss": -5.319302558898926, "global_step": 19602, "epoch": 466} {"train_loss": -5.336471080780029, "global_step": 19603, "epoch": 466} {"train_loss": -5.137667655944824, "global_step": 19604, "epoch": 466} {"train_loss": -5.267398834228516, "global_step": 19605, "epoch": 466} {"train_loss": -5.371228218078613, "global_step": 19606, "epoch": 466} {"train_loss": -5.31449031829834, "global_step": 19607, "epoch": 466} {"train_loss": -5.380522727966309, "global_step": 19608, "epoch": 466} {"train_loss": -5.2700114250183105, "global_step": 19609, "epoch": 466} {"train_loss": -5.2239766120910645, "global_step": 19610, "epoch": 466} {"train_loss": -5.390962600708008, "global_step": 19611, "epoch": 466} {"train_loss": -5.456942558288574, "global_step": 19612, "epoch": 466} {"train_loss": -5.2531477610270185, "global_step": 19613, "epoch": 466, "val_loss": 67518.8984375} {"train_loss": -5.363932132720947, "global_step": 19614, "epoch": 467} {"train_loss": -5.2661590576171875, "global_step": 19615, "epoch": 467} {"train_loss": -5.329990386962891, "global_step": 19616, "epoch": 467} {"train_loss": -5.124807357788086, "global_step": 19617, "epoch": 467} {"train_loss": -5.350510597229004, "global_step": 19618, "epoch": 467} {"train_loss": -5.326303482055664, "global_step": 19619, "epoch": 467} {"train_loss": -5.266346454620361, "global_step": 19620, "epoch": 467} {"train_loss": -5.141024589538574, "global_step": 19621, "epoch": 467} {"train_loss": -5.218193054199219, "global_step": 19622, "epoch": 467} {"train_loss": -5.347314834594727, "global_step": 19623, "epoch": 467} {"train_loss": -5.316373348236084, "global_step": 19624, "epoch": 467} {"train_loss": -5.297844886779785, "global_step": 19625, "epoch": 467} {"train_loss": -5.366837024688721, "global_step": 19626, "epoch": 467} {"train_loss": -5.400538444519043, "global_step": 19627, "epoch": 467} {"train_loss": -5.287410736083984, "global_step": 19628, "epoch": 467} {"train_loss": -5.283486366271973, "global_step": 19629, "epoch": 467} {"train_loss": -5.08234167098999, "global_step": 19630, "epoch": 467} {"train_loss": -5.296889305114746, "global_step": 19631, "epoch": 467} {"train_loss": -5.201115608215332, "global_step": 19632, "epoch": 467} {"train_loss": -5.298422813415527, "global_step": 19633, "epoch": 467} {"train_loss": -5.256103038787842, "global_step": 19634, "epoch": 467} {"train_loss": -5.208491325378418, "global_step": 19635, "epoch": 467} {"train_loss": -5.290683746337891, "global_step": 19636, "epoch": 467} {"train_loss": -5.225489139556885, "global_step": 19637, "epoch": 467} {"train_loss": -5.325714588165283, "global_step": 19638, "epoch": 467} {"train_loss": -5.235660552978516, "global_step": 19639, "epoch": 467} {"train_loss": -5.407098770141602, "global_step": 19640, "epoch": 467} {"train_loss": -5.16943359375, "global_step": 19641, "epoch": 467} {"train_loss": -5.182671070098877, "global_step": 19642, "epoch": 467} {"train_loss": -5.223947525024414, "global_step": 19643, "epoch": 467} {"train_loss": -5.271315574645996, "global_step": 19644, "epoch": 467} {"train_loss": -5.2610368728637695, "global_step": 19645, "epoch": 467} {"train_loss": -5.25742244720459, "global_step": 19646, "epoch": 467} {"train_loss": -5.2795000076293945, "global_step": 19647, "epoch": 467} {"train_loss": -5.17302131652832, "global_step": 19648, "epoch": 467} {"train_loss": -5.293929576873779, "global_step": 19649, "epoch": 467} {"train_loss": -5.277474403381348, "global_step": 19650, "epoch": 467} {"train_loss": -5.195432186126709, "global_step": 19651, "epoch": 467} {"train_loss": -5.290863513946533, "global_step": 19652, "epoch": 467} {"train_loss": -5.258981704711914, "global_step": 19653, "epoch": 467} {"train_loss": -5.155889987945557, "global_step": 19654, "epoch": 467} {"train_loss": -5.262953531174433, "global_step": 19655, "epoch": 467, "val_loss": 68020.0859375} {"train_loss": -5.328464508056641, "global_step": 19656, "epoch": 468} {"train_loss": -5.35170841217041, "global_step": 19657, "epoch": 468} {"train_loss": -5.302148342132568, "global_step": 19658, "epoch": 468} {"train_loss": -5.404512405395508, "global_step": 19659, "epoch": 468} {"train_loss": -5.322321891784668, "global_step": 19660, "epoch": 468} {"train_loss": -5.2574357986450195, "global_step": 19661, "epoch": 468} {"train_loss": -5.241050720214844, "global_step": 19662, "epoch": 468} {"train_loss": -5.326163291931152, "global_step": 19663, "epoch": 468} {"train_loss": -5.284730911254883, "global_step": 19664, "epoch": 468} {"train_loss": -5.123558521270752, "global_step": 19665, "epoch": 468} {"train_loss": -5.2775068283081055, "global_step": 19666, "epoch": 468} {"train_loss": -5.406842231750488, "global_step": 19667, "epoch": 468} {"train_loss": -5.177672386169434, "global_step": 19668, "epoch": 468} {"train_loss": -5.241103649139404, "global_step": 19669, "epoch": 468} {"train_loss": -5.256401538848877, "global_step": 19670, "epoch": 468} {"train_loss": -5.159573554992676, "global_step": 19671, "epoch": 468} {"train_loss": -5.287650108337402, "global_step": 19672, "epoch": 468} {"train_loss": -5.352866172790527, "global_step": 19673, "epoch": 468} {"train_loss": -5.302645683288574, "global_step": 19674, "epoch": 468} {"train_loss": -5.194287300109863, "global_step": 19675, "epoch": 468} {"train_loss": -5.151411056518555, "global_step": 19676, "epoch": 468} {"train_loss": -5.343170166015625, "global_step": 19677, "epoch": 468} {"train_loss": -5.269559383392334, "global_step": 19678, "epoch": 468} {"train_loss": -5.170170783996582, "global_step": 19679, "epoch": 468} {"train_loss": -5.348562240600586, "global_step": 19680, "epoch": 468} {"train_loss": -5.340484619140625, "global_step": 19681, "epoch": 468} {"train_loss": -5.168157577514648, "global_step": 19682, "epoch": 468} {"train_loss": -5.289923667907715, "global_step": 19683, "epoch": 468} {"train_loss": -5.420897483825684, "global_step": 19684, "epoch": 468} {"train_loss": -5.300942897796631, "global_step": 19685, "epoch": 468} {"train_loss": -5.294220924377441, "global_step": 19686, "epoch": 468} {"train_loss": -5.39974308013916, "global_step": 19687, "epoch": 468} {"train_loss": -5.3204026222229, "global_step": 19688, "epoch": 468} {"train_loss": -5.336491107940674, "global_step": 19689, "epoch": 468} {"train_loss": -5.379518032073975, "global_step": 19690, "epoch": 468} {"train_loss": -5.174437522888184, "global_step": 19691, "epoch": 468} {"train_loss": -5.32651948928833, "global_step": 19692, "epoch": 468} {"train_loss": -5.38077449798584, "global_step": 19693, "epoch": 468} {"train_loss": -5.1682586669921875, "global_step": 19694, "epoch": 468} {"train_loss": -5.339828968048096, "global_step": 19695, "epoch": 468} {"train_loss": -5.315179347991943, "global_step": 19696, "epoch": 468} {"train_loss": -5.2891042459578745, "global_step": 19697, "epoch": 468, "val_loss": 67676.5390625} {"train_loss": -5.234777450561523, "global_step": 19698, "epoch": 469} {"train_loss": -5.42563533782959, "global_step": 19699, "epoch": 469} {"train_loss": -5.302206993103027, "global_step": 19700, "epoch": 469} {"train_loss": -5.255623817443848, "global_step": 19701, "epoch": 469} {"train_loss": -5.230342864990234, "global_step": 19702, "epoch": 469} {"train_loss": -5.377948760986328, "global_step": 19703, "epoch": 469} {"train_loss": -5.2718825340271, "global_step": 19704, "epoch": 469} {"train_loss": -5.345282554626465, "global_step": 19705, "epoch": 469} {"train_loss": -5.413620948791504, "global_step": 19706, "epoch": 469} {"train_loss": -5.37737512588501, "global_step": 19707, "epoch": 469} {"train_loss": -5.313201904296875, "global_step": 19708, "epoch": 469} {"train_loss": -5.425204277038574, "global_step": 19709, "epoch": 469} {"train_loss": -5.388064861297607, "global_step": 19710, "epoch": 469} {"train_loss": -5.284282207489014, "global_step": 19711, "epoch": 469} {"train_loss": -5.415814399719238, "global_step": 19712, "epoch": 469} {"train_loss": -5.113049507141113, "global_step": 19713, "epoch": 469} {"train_loss": -5.056285381317139, "global_step": 19714, "epoch": 469} {"train_loss": -5.221799373626709, "global_step": 19715, "epoch": 469} {"train_loss": -5.111472129821777, "global_step": 19716, "epoch": 469} {"train_loss": -5.140861988067627, "global_step": 19717, "epoch": 469} {"train_loss": -5.248791694641113, "global_step": 19718, "epoch": 469} {"train_loss": -5.25776481628418, "global_step": 19719, "epoch": 469} {"train_loss": -4.984298229217529, "global_step": 19720, "epoch": 469} {"train_loss": -5.469515800476074, "global_step": 19721, "epoch": 469} {"train_loss": -5.113926887512207, "global_step": 19722, "epoch": 469} {"train_loss": -5.134424209594727, "global_step": 19723, "epoch": 469} {"train_loss": -5.565866470336914, "global_step": 19724, "epoch": 469} {"train_loss": -5.220383644104004, "global_step": 19725, "epoch": 469} {"train_loss": -5.316638946533203, "global_step": 19726, "epoch": 469} {"train_loss": -5.2970781326293945, "global_step": 19727, "epoch": 469} {"train_loss": -5.140109062194824, "global_step": 19728, "epoch": 469} {"train_loss": -5.274549961090088, "global_step": 19729, "epoch": 469} {"train_loss": -5.355474472045898, "global_step": 19730, "epoch": 469} {"train_loss": -5.273675918579102, "global_step": 19731, "epoch": 469} {"train_loss": -5.22945499420166, "global_step": 19732, "epoch": 469} {"train_loss": -5.1711859703063965, "global_step": 19733, "epoch": 469} {"train_loss": -5.199254989624023, "global_step": 19734, "epoch": 469} {"train_loss": -5.2688093185424805, "global_step": 19735, "epoch": 469} {"train_loss": -5.236541748046875, "global_step": 19736, "epoch": 469} {"train_loss": -5.328814506530762, "global_step": 19737, "epoch": 469} {"train_loss": -5.145843505859375, "global_step": 19738, "epoch": 469} {"train_loss": -5.265794050125849, "global_step": 19739, "epoch": 469, "val_loss": 68384.703125} {"train_loss": -5.165379524230957, "global_step": 19740, "epoch": 470} {"train_loss": -5.2522358894348145, "global_step": 19741, "epoch": 470} {"train_loss": -5.213000297546387, "global_step": 19742, "epoch": 470} {"train_loss": -5.3891096115112305, "global_step": 19743, "epoch": 470} {"train_loss": -5.38693904876709, "global_step": 19744, "epoch": 470} {"train_loss": -5.227181434631348, "global_step": 19745, "epoch": 470} {"train_loss": -5.162798881530762, "global_step": 19746, "epoch": 470} {"train_loss": -5.307981491088867, "global_step": 19747, "epoch": 470} {"train_loss": -5.159201622009277, "global_step": 19748, "epoch": 470} {"train_loss": -5.226059913635254, "global_step": 19749, "epoch": 470} {"train_loss": -5.2168779373168945, "global_step": 19750, "epoch": 470} {"train_loss": -5.285630226135254, "global_step": 19751, "epoch": 470} {"train_loss": -5.409374713897705, "global_step": 19752, "epoch": 470} {"train_loss": -5.2738776206970215, "global_step": 19753, "epoch": 470} {"train_loss": -5.251914024353027, "global_step": 19754, "epoch": 470} {"train_loss": -5.257904529571533, "global_step": 19755, "epoch": 470} {"train_loss": -5.324029445648193, "global_step": 19756, "epoch": 470} {"train_loss": -5.436079978942871, "global_step": 19757, "epoch": 470} {"train_loss": -5.33951473236084, "global_step": 19758, "epoch": 470} {"train_loss": -5.21645450592041, "global_step": 19759, "epoch": 470} {"train_loss": -5.283219337463379, "global_step": 19760, "epoch": 470} {"train_loss": -5.192338943481445, "global_step": 19761, "epoch": 470} {"train_loss": -5.432004928588867, "global_step": 19762, "epoch": 470} {"train_loss": -5.435908317565918, "global_step": 19763, "epoch": 470} {"train_loss": -5.530875205993652, "global_step": 19764, "epoch": 470} {"train_loss": -5.278465270996094, "global_step": 19765, "epoch": 470} {"train_loss": -5.333080291748047, "global_step": 19766, "epoch": 470} {"train_loss": -5.391295433044434, "global_step": 19767, "epoch": 470} {"train_loss": -5.373528003692627, "global_step": 19768, "epoch": 470} {"train_loss": -5.381087303161621, "global_step": 19769, "epoch": 470} {"train_loss": -5.339879989624023, "global_step": 19770, "epoch": 470} {"train_loss": -5.460980415344238, "global_step": 19771, "epoch": 470} {"train_loss": -5.164678573608398, "global_step": 19772, "epoch": 470} {"train_loss": -5.358173370361328, "global_step": 19773, "epoch": 470} {"train_loss": -5.397854804992676, "global_step": 19774, "epoch": 470} {"train_loss": -5.297174453735352, "global_step": 19775, "epoch": 470} {"train_loss": -5.2295637130737305, "global_step": 19776, "epoch": 470} {"train_loss": -5.256828308105469, "global_step": 19777, "epoch": 470} {"train_loss": -5.345438003540039, "global_step": 19778, "epoch": 470} {"train_loss": -5.299811840057373, "global_step": 19779, "epoch": 470} {"train_loss": -5.244431972503662, "global_step": 19780, "epoch": 470} {"train_loss": -5.304658095041911, "global_step": 19781, "epoch": 470, "val_loss": 67825.1484375} {"train_loss": -5.2889227867126465, "global_step": 19782, "epoch": 471} {"train_loss": -5.244383335113525, "global_step": 19783, "epoch": 471} {"train_loss": -5.221158027648926, "global_step": 19784, "epoch": 471} {"train_loss": -5.28782320022583, "global_step": 19785, "epoch": 471} {"train_loss": -5.438549995422363, "global_step": 19786, "epoch": 471} {"train_loss": -5.176800727844238, "global_step": 19787, "epoch": 471} {"train_loss": -5.119246482849121, "global_step": 19788, "epoch": 471} {"train_loss": -5.404694557189941, "global_step": 19789, "epoch": 471} {"train_loss": -5.296368598937988, "global_step": 19790, "epoch": 471} {"train_loss": -5.2598772048950195, "global_step": 19791, "epoch": 471} {"train_loss": -5.371565818786621, "global_step": 19792, "epoch": 471} {"train_loss": -5.162373065948486, "global_step": 19793, "epoch": 471} {"train_loss": -5.312782287597656, "global_step": 19794, "epoch": 471} {"train_loss": -5.2142438888549805, "global_step": 19795, "epoch": 471} {"train_loss": -5.323212146759033, "global_step": 19796, "epoch": 471} {"train_loss": -5.323380470275879, "global_step": 19797, "epoch": 471} {"train_loss": -5.346086025238037, "global_step": 19798, "epoch": 471} {"train_loss": -5.21417236328125, "global_step": 19799, "epoch": 471} {"train_loss": -5.338654518127441, "global_step": 19800, "epoch": 471} {"train_loss": -5.308935165405273, "global_step": 19801, "epoch": 471} {"train_loss": -5.245330810546875, "global_step": 19802, "epoch": 471} {"train_loss": -5.19044303894043, "global_step": 19803, "epoch": 471} {"train_loss": -5.229079246520996, "global_step": 19804, "epoch": 471} {"train_loss": -5.229746341705322, "global_step": 19805, "epoch": 471} {"train_loss": -5.164366245269775, "global_step": 19806, "epoch": 471} {"train_loss": -5.225801467895508, "global_step": 19807, "epoch": 471} {"train_loss": -5.329112529754639, "global_step": 19808, "epoch": 471} {"train_loss": -5.230504035949707, "global_step": 19809, "epoch": 471} {"train_loss": -5.339735984802246, "global_step": 19810, "epoch": 471} {"train_loss": -5.274611949920654, "global_step": 19811, "epoch": 471} {"train_loss": -5.258871078491211, "global_step": 19812, "epoch": 471} {"train_loss": -5.382499694824219, "global_step": 19813, "epoch": 471} {"train_loss": -5.24539852142334, "global_step": 19814, "epoch": 471} {"train_loss": -5.391510009765625, "global_step": 19815, "epoch": 471} {"train_loss": -5.24733304977417, "global_step": 19816, "epoch": 471} {"train_loss": -5.316178798675537, "global_step": 19817, "epoch": 471} {"train_loss": -5.3454203605651855, "global_step": 19818, "epoch": 471} {"train_loss": -5.281749725341797, "global_step": 19819, "epoch": 471} {"train_loss": -5.313462257385254, "global_step": 19820, "epoch": 471} {"train_loss": -5.331954002380371, "global_step": 19821, "epoch": 471} {"train_loss": -5.369729518890381, "global_step": 19822, "epoch": 471} {"train_loss": -5.280288684935797, "global_step": 19823, "epoch": 471, "val_loss": 67738.2734375} {"train_loss": -5.217601776123047, "global_step": 19824, "epoch": 472} {"train_loss": -5.328612804412842, "global_step": 19825, "epoch": 472} {"train_loss": -5.242000579833984, "global_step": 19826, "epoch": 472} {"train_loss": -5.2641754150390625, "global_step": 19827, "epoch": 472} {"train_loss": -5.2740631103515625, "global_step": 19828, "epoch": 472} {"train_loss": -5.253718376159668, "global_step": 19829, "epoch": 472} {"train_loss": -5.233659267425537, "global_step": 19830, "epoch": 472} {"train_loss": -5.2978925704956055, "global_step": 19831, "epoch": 472} {"train_loss": -5.220944404602051, "global_step": 19832, "epoch": 472} {"train_loss": -5.345186233520508, "global_step": 19833, "epoch": 472} {"train_loss": -5.247812271118164, "global_step": 19834, "epoch": 472} {"train_loss": -5.200260162353516, "global_step": 19835, "epoch": 472} {"train_loss": -5.311794281005859, "global_step": 19836, "epoch": 472} {"train_loss": -5.2880120277404785, "global_step": 19837, "epoch": 472} {"train_loss": -5.280966758728027, "global_step": 19838, "epoch": 472} {"train_loss": -5.195356369018555, "global_step": 19839, "epoch": 472} {"train_loss": -5.3197102546691895, "global_step": 19840, "epoch": 472} {"train_loss": -5.403469562530518, "global_step": 19841, "epoch": 472} {"train_loss": -5.380744934082031, "global_step": 19842, "epoch": 472} {"train_loss": -5.200629711151123, "global_step": 19843, "epoch": 472} {"train_loss": -5.302087306976318, "global_step": 19844, "epoch": 472} {"train_loss": -5.24920654296875, "global_step": 19845, "epoch": 472} {"train_loss": -5.297238349914551, "global_step": 19846, "epoch": 472} {"train_loss": -5.208968162536621, "global_step": 19847, "epoch": 472} {"train_loss": -5.296566963195801, "global_step": 19848, "epoch": 472} {"train_loss": -5.258659362792969, "global_step": 19849, "epoch": 472} {"train_loss": -5.155295372009277, "global_step": 19850, "epoch": 472} {"train_loss": -5.230304718017578, "global_step": 19851, "epoch": 472} {"train_loss": -5.409207344055176, "global_step": 19852, "epoch": 472} {"train_loss": -5.259609222412109, "global_step": 19853, "epoch": 472} {"train_loss": -5.377415180206299, "global_step": 19854, "epoch": 472} {"train_loss": -5.326455116271973, "global_step": 19855, "epoch": 472} {"train_loss": -5.16342830657959, "global_step": 19856, "epoch": 472} {"train_loss": -5.236062049865723, "global_step": 19857, "epoch": 472} {"train_loss": -5.34140682220459, "global_step": 19858, "epoch": 472} {"train_loss": -5.412304401397705, "global_step": 19859, "epoch": 472} {"train_loss": -5.381649971008301, "global_step": 19860, "epoch": 472} {"train_loss": -5.234450340270996, "global_step": 19861, "epoch": 472} {"train_loss": -5.441607475280762, "global_step": 19862, "epoch": 472} {"train_loss": -5.308791160583496, "global_step": 19863, "epoch": 472} {"train_loss": -5.140341281890869, "global_step": 19864, "epoch": 472} {"train_loss": -5.283026638485136, "global_step": 19865, "epoch": 472, "val_loss": 67375.921875} {"train_loss": -5.350743770599365, "global_step": 19866, "epoch": 473} {"train_loss": -5.428207874298096, "global_step": 19867, "epoch": 473} {"train_loss": -5.367251396179199, "global_step": 19868, "epoch": 473} {"train_loss": -5.181851387023926, "global_step": 19869, "epoch": 473} {"train_loss": -5.290383338928223, "global_step": 19870, "epoch": 473} {"train_loss": -5.255971908569336, "global_step": 19871, "epoch": 473} {"train_loss": -5.546167373657227, "global_step": 19872, "epoch": 473} {"train_loss": -5.210020065307617, "global_step": 19873, "epoch": 473} {"train_loss": -5.363595008850098, "global_step": 19874, "epoch": 473} {"train_loss": -5.309913635253906, "global_step": 19875, "epoch": 473} {"train_loss": -5.484552383422852, "global_step": 19876, "epoch": 473} {"train_loss": -5.306119441986084, "global_step": 19877, "epoch": 473} {"train_loss": -5.248476028442383, "global_step": 19878, "epoch": 473} {"train_loss": -5.397290229797363, "global_step": 19879, "epoch": 473} {"train_loss": -5.293692588806152, "global_step": 19880, "epoch": 473} {"train_loss": -5.139441013336182, "global_step": 19881, "epoch": 473} {"train_loss": -5.247745513916016, "global_step": 19882, "epoch": 473} {"train_loss": -5.252032279968262, "global_step": 19883, "epoch": 473} {"train_loss": -5.348313808441162, "global_step": 19884, "epoch": 473} {"train_loss": -5.2510576248168945, "global_step": 19885, "epoch": 473} {"train_loss": -5.374432563781738, "global_step": 19886, "epoch": 473} {"train_loss": -5.399108409881592, "global_step": 19887, "epoch": 473} {"train_loss": -5.228419303894043, "global_step": 19888, "epoch": 473} {"train_loss": -5.333650588989258, "global_step": 19889, "epoch": 473} {"train_loss": -5.017273902893066, "global_step": 19890, "epoch": 473} {"train_loss": -5.307802200317383, "global_step": 19891, "epoch": 473} {"train_loss": -5.343446731567383, "global_step": 19892, "epoch": 473} {"train_loss": -5.272574424743652, "global_step": 19893, "epoch": 473} {"train_loss": -5.3026814460754395, "global_step": 19894, "epoch": 473} {"train_loss": -5.270904541015625, "global_step": 19895, "epoch": 473} {"train_loss": -5.3156280517578125, "global_step": 19896, "epoch": 473} {"train_loss": -5.370059490203857, "global_step": 19897, "epoch": 473} {"train_loss": -5.281811237335205, "global_step": 19898, "epoch": 473} {"train_loss": -5.354744911193848, "global_step": 19899, "epoch": 473} {"train_loss": -5.139606475830078, "global_step": 19900, "epoch": 473} {"train_loss": -5.267960548400879, "global_step": 19901, "epoch": 473} {"train_loss": -5.316440105438232, "global_step": 19902, "epoch": 473} {"train_loss": -5.25160026550293, "global_step": 19903, "epoch": 473} {"train_loss": -5.214916706085205, "global_step": 19904, "epoch": 473} {"train_loss": -5.306742191314697, "global_step": 19905, "epoch": 473} {"train_loss": -5.379773139953613, "global_step": 19906, "epoch": 473} {"train_loss": -5.300188064575195, "global_step": 19907, "epoch": 473, "val_loss": 67444.9609375} {"train_loss": -5.354788780212402, "global_step": 19908, "epoch": 474} {"train_loss": -5.323031425476074, "global_step": 19909, "epoch": 474} {"train_loss": -5.446907997131348, "global_step": 19910, "epoch": 474} {"train_loss": -5.311076641082764, "global_step": 19911, "epoch": 474} {"train_loss": -5.3668928146362305, "global_step": 19912, "epoch": 474} {"train_loss": -5.389842510223389, "global_step": 19913, "epoch": 474} {"train_loss": -5.305776119232178, "global_step": 19914, "epoch": 474} {"train_loss": -5.3256754875183105, "global_step": 19915, "epoch": 474} {"train_loss": -5.378769874572754, "global_step": 19916, "epoch": 474} {"train_loss": -5.298769474029541, "global_step": 19917, "epoch": 474} {"train_loss": -5.4173431396484375, "global_step": 19918, "epoch": 474} {"train_loss": -5.417085647583008, "global_step": 19919, "epoch": 474} {"train_loss": -5.437737464904785, "global_step": 19920, "epoch": 474} {"train_loss": -5.21888542175293, "global_step": 19921, "epoch": 474} {"train_loss": -5.266031265258789, "global_step": 19922, "epoch": 474} {"train_loss": -5.300577163696289, "global_step": 19923, "epoch": 474} {"train_loss": -5.347914695739746, "global_step": 19924, "epoch": 474} {"train_loss": -5.222283840179443, "global_step": 19925, "epoch": 474} {"train_loss": -5.370126724243164, "global_step": 19926, "epoch": 474} {"train_loss": -5.378889083862305, "global_step": 19927, "epoch": 474} {"train_loss": -5.409453868865967, "global_step": 19928, "epoch": 474} {"train_loss": -5.3815436363220215, "global_step": 19929, "epoch": 474} {"train_loss": -5.297738075256348, "global_step": 19930, "epoch": 474} {"train_loss": -5.244609832763672, "global_step": 19931, "epoch": 474} {"train_loss": -5.285027980804443, "global_step": 19932, "epoch": 474} {"train_loss": -5.2667646408081055, "global_step": 19933, "epoch": 474} {"train_loss": -5.294631004333496, "global_step": 19934, "epoch": 474} {"train_loss": -5.303590774536133, "global_step": 19935, "epoch": 474} {"train_loss": -5.140875816345215, "global_step": 19936, "epoch": 474} {"train_loss": -5.278982639312744, "global_step": 19937, "epoch": 474} {"train_loss": -5.212831974029541, "global_step": 19938, "epoch": 474} {"train_loss": -5.053998947143555, "global_step": 19939, "epoch": 474} {"train_loss": -5.202516078948975, "global_step": 19940, "epoch": 474} {"train_loss": -5.470180511474609, "global_step": 19941, "epoch": 474} {"train_loss": -5.179765701293945, "global_step": 19942, "epoch": 474} {"train_loss": -5.132715702056885, "global_step": 19943, "epoch": 474} {"train_loss": -5.362643718719482, "global_step": 19944, "epoch": 474} {"train_loss": -5.185826301574707, "global_step": 19945, "epoch": 474} {"train_loss": -5.261746883392334, "global_step": 19946, "epoch": 474} {"train_loss": -5.132201194763184, "global_step": 19947, "epoch": 474} {"train_loss": -5.19169807434082, "global_step": 19948, "epoch": 474} {"train_loss": -5.294784682137625, "global_step": 19949, "epoch": 474, "val_loss": 67527.0078125} {"train_loss": -5.364618301391602, "global_step": 19950, "epoch": 475} {"train_loss": -5.3164873123168945, "global_step": 19951, "epoch": 475} {"train_loss": -5.15821647644043, "global_step": 19952, "epoch": 475} {"train_loss": -5.297674179077148, "global_step": 19953, "epoch": 475} {"train_loss": -5.419057846069336, "global_step": 19954, "epoch": 475} {"train_loss": -5.212368011474609, "global_step": 19955, "epoch": 475} {"train_loss": -5.281881332397461, "global_step": 19956, "epoch": 475} {"train_loss": -5.28638219833374, "global_step": 19957, "epoch": 475} {"train_loss": -5.080600738525391, "global_step": 19958, "epoch": 475} {"train_loss": -5.298398971557617, "global_step": 19959, "epoch": 475} {"train_loss": -5.324126243591309, "global_step": 19960, "epoch": 475} {"train_loss": -5.144880294799805, "global_step": 19961, "epoch": 475} {"train_loss": -5.272189140319824, "global_step": 19962, "epoch": 475} {"train_loss": -5.314739227294922, "global_step": 19963, "epoch": 475} {"train_loss": -5.333477973937988, "global_step": 19964, "epoch": 475} {"train_loss": -5.2952561378479, "global_step": 19965, "epoch": 475} {"train_loss": -5.335760116577148, "global_step": 19966, "epoch": 475} {"train_loss": -5.227807998657227, "global_step": 19967, "epoch": 475} {"train_loss": -5.261146068572998, "global_step": 19968, "epoch": 475} {"train_loss": -5.334743499755859, "global_step": 19969, "epoch": 475} {"train_loss": -5.42808723449707, "global_step": 19970, "epoch": 475} {"train_loss": -5.409184455871582, "global_step": 19971, "epoch": 475} {"train_loss": -5.310965538024902, "global_step": 19972, "epoch": 475} {"train_loss": -5.310208320617676, "global_step": 19973, "epoch": 475} {"train_loss": -5.327936172485352, "global_step": 19974, "epoch": 475} {"train_loss": -5.4201459884643555, "global_step": 19975, "epoch": 475} {"train_loss": -5.500924587249756, "global_step": 19976, "epoch": 475} {"train_loss": -5.3199357986450195, "global_step": 19977, "epoch": 475} {"train_loss": -5.443670749664307, "global_step": 19978, "epoch": 475} {"train_loss": -5.324429512023926, "global_step": 19979, "epoch": 475} {"train_loss": -5.325999736785889, "global_step": 19980, "epoch": 475} {"train_loss": -5.3199920654296875, "global_step": 19981, "epoch": 475} {"train_loss": -5.335880756378174, "global_step": 19982, "epoch": 475} {"train_loss": -5.197394371032715, "global_step": 19983, "epoch": 475} {"train_loss": -5.150940895080566, "global_step": 19984, "epoch": 475} {"train_loss": -5.215909957885742, "global_step": 19985, "epoch": 475} {"train_loss": -5.291225910186768, "global_step": 19986, "epoch": 475} {"train_loss": -5.265825271606445, "global_step": 19987, "epoch": 475} {"train_loss": -5.357790946960449, "global_step": 19988, "epoch": 475} {"train_loss": -5.256232261657715, "global_step": 19989, "epoch": 475} {"train_loss": -5.234164237976074, "global_step": 19990, "epoch": 475} {"train_loss": -5.299974725359962, "global_step": 19991, "epoch": 475, "val_loss": 67264.578125} {"train_loss": -5.28175687789917, "global_step": 19992, "epoch": 476} {"train_loss": -5.387572765350342, "global_step": 19993, "epoch": 476} {"train_loss": -5.274728298187256, "global_step": 19994, "epoch": 476} {"train_loss": -5.191710472106934, "global_step": 19995, "epoch": 476} {"train_loss": -5.242380142211914, "global_step": 19996, "epoch": 476} {"train_loss": -5.2249932289123535, "global_step": 19997, "epoch": 476} {"train_loss": -5.3572468757629395, "global_step": 19998, "epoch": 476} {"train_loss": -5.144378185272217, "global_step": 19999, "epoch": 476} {"train_loss": -5.150349140167236, "global_step": 20000, "epoch": 476} {"train_loss": -5.279543876647949, "global_step": 20001, "epoch": 476} {"train_loss": -5.153480529785156, "global_step": 20002, "epoch": 476} {"train_loss": -5.194536209106445, "global_step": 20003, "epoch": 476} {"train_loss": -5.442587852478027, "global_step": 20004, "epoch": 476} {"train_loss": -5.246567249298096, "global_step": 20005, "epoch": 476} {"train_loss": -5.2195844650268555, "global_step": 20006, "epoch": 476} {"train_loss": -5.372097969055176, "global_step": 20007, "epoch": 476} {"train_loss": -5.38697624206543, "global_step": 20008, "epoch": 476} {"train_loss": -5.357792854309082, "global_step": 20009, "epoch": 476} {"train_loss": -5.237306118011475, "global_step": 20010, "epoch": 476} {"train_loss": -5.339154243469238, "global_step": 20011, "epoch": 476} {"train_loss": -5.358404636383057, "global_step": 20012, "epoch": 476} {"train_loss": -5.288999557495117, "global_step": 20013, "epoch": 476} {"train_loss": -5.324005126953125, "global_step": 20014, "epoch": 476} {"train_loss": -5.351912021636963, "global_step": 20015, "epoch": 476} {"train_loss": -5.268344402313232, "global_step": 20016, "epoch": 476} {"train_loss": -5.40264892578125, "global_step": 20017, "epoch": 476} {"train_loss": -5.383056640625, "global_step": 20018, "epoch": 476} {"train_loss": -5.298216819763184, "global_step": 20019, "epoch": 476} {"train_loss": -5.3362274169921875, "global_step": 20020, "epoch": 476} {"train_loss": -5.295921325683594, "global_step": 20021, "epoch": 476} {"train_loss": -5.234868049621582, "global_step": 20022, "epoch": 476} {"train_loss": -5.317441940307617, "global_step": 20023, "epoch": 476} {"train_loss": -5.230189323425293, "global_step": 20024, "epoch": 476} {"train_loss": -5.320569038391113, "global_step": 20025, "epoch": 476} {"train_loss": -5.338273048400879, "global_step": 20026, "epoch": 476} {"train_loss": -5.343901634216309, "global_step": 20027, "epoch": 476} {"train_loss": -5.1664719581604, "global_step": 20028, "epoch": 476} {"train_loss": -5.049393653869629, "global_step": 20029, "epoch": 476} {"train_loss": -5.25922155380249, "global_step": 20030, "epoch": 476} {"train_loss": -5.355798244476318, "global_step": 20031, "epoch": 476} {"train_loss": -5.107665061950684, "global_step": 20032, "epoch": 476} {"train_loss": -5.27992844581604, "global_step": 20033, "epoch": 476, "val_loss": 67229.0} {"train_loss": -5.350168228149414, "global_step": 20034, "epoch": 477} {"train_loss": -5.3239359855651855, "global_step": 20035, "epoch": 477} {"train_loss": -5.284553527832031, "global_step": 20036, "epoch": 477} {"train_loss": -5.395033836364746, "global_step": 20037, "epoch": 477} {"train_loss": -5.370954513549805, "global_step": 20038, "epoch": 477} {"train_loss": -5.195159912109375, "global_step": 20039, "epoch": 477} {"train_loss": -5.36803674697876, "global_step": 20040, "epoch": 477} {"train_loss": -5.221797466278076, "global_step": 20041, "epoch": 477} {"train_loss": -5.1576738357543945, "global_step": 20042, "epoch": 477} {"train_loss": -5.401012897491455, "global_step": 20043, "epoch": 477} {"train_loss": -5.37300443649292, "global_step": 20044, "epoch": 477} {"train_loss": -5.258066177368164, "global_step": 20045, "epoch": 477} {"train_loss": -5.373541831970215, "global_step": 20046, "epoch": 477} {"train_loss": -5.270940780639648, "global_step": 20047, "epoch": 477} {"train_loss": -5.210442543029785, "global_step": 20048, "epoch": 477} {"train_loss": -5.13413143157959, "global_step": 20049, "epoch": 477} {"train_loss": -5.3515238761901855, "global_step": 20050, "epoch": 477} {"train_loss": -5.284205913543701, "global_step": 20051, "epoch": 477} {"train_loss": -5.24862003326416, "global_step": 20052, "epoch": 477} {"train_loss": -5.3270463943481445, "global_step": 20053, "epoch": 477} {"train_loss": -5.208832263946533, "global_step": 20054, "epoch": 477} {"train_loss": -5.470398902893066, "global_step": 20055, "epoch": 477} {"train_loss": -5.234298229217529, "global_step": 20056, "epoch": 477} {"train_loss": -5.19893741607666, "global_step": 20057, "epoch": 477} {"train_loss": -5.326077938079834, "global_step": 20058, "epoch": 477} {"train_loss": -5.365944862365723, "global_step": 20059, "epoch": 477} {"train_loss": -5.400997161865234, "global_step": 20060, "epoch": 477} {"train_loss": -5.444522857666016, "global_step": 20061, "epoch": 477} {"train_loss": -5.441195487976074, "global_step": 20062, "epoch": 477} {"train_loss": -5.298135280609131, "global_step": 20063, "epoch": 477} {"train_loss": -5.429214954376221, "global_step": 20064, "epoch": 477} {"train_loss": -5.300827980041504, "global_step": 20065, "epoch": 477} {"train_loss": -5.243515968322754, "global_step": 20066, "epoch": 477} {"train_loss": -5.3002777099609375, "global_step": 20067, "epoch": 477} {"train_loss": -5.25759220123291, "global_step": 20068, "epoch": 477} {"train_loss": -5.340620994567871, "global_step": 20069, "epoch": 477} {"train_loss": -5.4243927001953125, "global_step": 20070, "epoch": 477} {"train_loss": -5.21675968170166, "global_step": 20071, "epoch": 477} {"train_loss": -5.160039901733398, "global_step": 20072, "epoch": 477} {"train_loss": -5.239691734313965, "global_step": 20073, "epoch": 477} {"train_loss": -5.177272319793701, "global_step": 20074, "epoch": 477} {"train_loss": -5.300385906582787, "global_step": 20075, "epoch": 477, "val_loss": 67216.4140625} {"train_loss": -5.387845039367676, "global_step": 20076, "epoch": 478} {"train_loss": -5.155787467956543, "global_step": 20077, "epoch": 478} {"train_loss": -5.357538223266602, "global_step": 20078, "epoch": 478} {"train_loss": -5.4232988357543945, "global_step": 20079, "epoch": 478} {"train_loss": -5.222245216369629, "global_step": 20080, "epoch": 478} {"train_loss": -5.271408557891846, "global_step": 20081, "epoch": 478} {"train_loss": -5.419105529785156, "global_step": 20082, "epoch": 478} {"train_loss": -5.345460891723633, "global_step": 20083, "epoch": 478} {"train_loss": -5.378597259521484, "global_step": 20084, "epoch": 478} {"train_loss": -5.288797378540039, "global_step": 20085, "epoch": 478} {"train_loss": -5.4102582931518555, "global_step": 20086, "epoch": 478} {"train_loss": -5.284512519836426, "global_step": 20087, "epoch": 478} {"train_loss": -5.312813758850098, "global_step": 20088, "epoch": 478} {"train_loss": -5.1956658363342285, "global_step": 20089, "epoch": 478} {"train_loss": -5.303172588348389, "global_step": 20090, "epoch": 478} {"train_loss": -5.299005508422852, "global_step": 20091, "epoch": 478} {"train_loss": -5.265976905822754, "global_step": 20092, "epoch": 478} {"train_loss": -5.266840934753418, "global_step": 20093, "epoch": 478} {"train_loss": -5.26242208480835, "global_step": 20094, "epoch": 478} {"train_loss": -5.301250457763672, "global_step": 20095, "epoch": 478} {"train_loss": -5.302342414855957, "global_step": 20096, "epoch": 478} {"train_loss": -5.264465808868408, "global_step": 20097, "epoch": 478} {"train_loss": -5.285726070404053, "global_step": 20098, "epoch": 478} {"train_loss": -5.091470718383789, "global_step": 20099, "epoch": 478} {"train_loss": -5.448532581329346, "global_step": 20100, "epoch": 478} {"train_loss": -5.307919502258301, "global_step": 20101, "epoch": 478} {"train_loss": -5.210176944732666, "global_step": 20102, "epoch": 478} {"train_loss": -5.298393249511719, "global_step": 20103, "epoch": 478} {"train_loss": -5.411209583282471, "global_step": 20104, "epoch": 478} {"train_loss": -5.28856086730957, "global_step": 20105, "epoch": 478} {"train_loss": -5.292397975921631, "global_step": 20106, "epoch": 478} {"train_loss": -5.411282539367676, "global_step": 20107, "epoch": 478} {"train_loss": -5.335173606872559, "global_step": 20108, "epoch": 478} {"train_loss": -5.215029716491699, "global_step": 20109, "epoch": 478} {"train_loss": -5.37397575378418, "global_step": 20110, "epoch": 478} {"train_loss": -5.151509761810303, "global_step": 20111, "epoch": 478} {"train_loss": -5.225581169128418, "global_step": 20112, "epoch": 478} {"train_loss": -5.350746154785156, "global_step": 20113, "epoch": 478} {"train_loss": -5.325898170471191, "global_step": 20114, "epoch": 478} {"train_loss": -5.465399265289307, "global_step": 20115, "epoch": 478} {"train_loss": -5.2375664710998535, "global_step": 20116, "epoch": 478} {"train_loss": -5.300339278720674, "global_step": 20117, "epoch": 478, "val_loss": 67375.5234375} {"train_loss": -5.357038497924805, "global_step": 20118, "epoch": 479} {"train_loss": -5.338402271270752, "global_step": 20119, "epoch": 479} {"train_loss": -5.331556797027588, "global_step": 20120, "epoch": 479} {"train_loss": -5.280341148376465, "global_step": 20121, "epoch": 479} {"train_loss": -5.217388153076172, "global_step": 20122, "epoch": 479} {"train_loss": -5.504537582397461, "global_step": 20123, "epoch": 479} {"train_loss": -5.3572282791137695, "global_step": 20124, "epoch": 479} {"train_loss": -5.282580375671387, "global_step": 20125, "epoch": 479} {"train_loss": -5.233338832855225, "global_step": 20126, "epoch": 479} {"train_loss": -5.5094194412231445, "global_step": 20127, "epoch": 479} {"train_loss": -5.171655654907227, "global_step": 20128, "epoch": 479} {"train_loss": -5.241642951965332, "global_step": 20129, "epoch": 479} {"train_loss": -5.286028861999512, "global_step": 20130, "epoch": 479} {"train_loss": -5.208051681518555, "global_step": 20131, "epoch": 479} {"train_loss": -5.545722961425781, "global_step": 20132, "epoch": 479} {"train_loss": -5.350828170776367, "global_step": 20133, "epoch": 479} {"train_loss": -5.183870315551758, "global_step": 20134, "epoch": 479} {"train_loss": -5.296550750732422, "global_step": 20135, "epoch": 479} {"train_loss": -5.3284783363342285, "global_step": 20136, "epoch": 479} {"train_loss": -5.261048316955566, "global_step": 20137, "epoch": 479} {"train_loss": -5.346729278564453, "global_step": 20138, "epoch": 479} {"train_loss": -5.232290267944336, "global_step": 20139, "epoch": 479} {"train_loss": -5.414558410644531, "global_step": 20140, "epoch": 479} {"train_loss": -5.3631463050842285, "global_step": 20141, "epoch": 479} {"train_loss": -5.29455041885376, "global_step": 20142, "epoch": 479} {"train_loss": -5.322680473327637, "global_step": 20143, "epoch": 479} {"train_loss": -5.269033432006836, "global_step": 20144, "epoch": 479} {"train_loss": -5.287839889526367, "global_step": 20145, "epoch": 479} {"train_loss": -5.451764106750488, "global_step": 20146, "epoch": 479} {"train_loss": -5.459432601928711, "global_step": 20147, "epoch": 479} {"train_loss": -5.182995796203613, "global_step": 20148, "epoch": 479} {"train_loss": -5.335793495178223, "global_step": 20149, "epoch": 479} {"train_loss": -5.24235200881958, "global_step": 20150, "epoch": 479} {"train_loss": -5.149385452270508, "global_step": 20151, "epoch": 479} {"train_loss": -5.3216776847839355, "global_step": 20152, "epoch": 479} {"train_loss": -5.369929313659668, "global_step": 20153, "epoch": 479} {"train_loss": -5.369766712188721, "global_step": 20154, "epoch": 479} {"train_loss": -5.239795684814453, "global_step": 20155, "epoch": 479} {"train_loss": -5.379110336303711, "global_step": 20156, "epoch": 479} {"train_loss": -5.352071285247803, "global_step": 20157, "epoch": 479} {"train_loss": -5.090806007385254, "global_step": 20158, "epoch": 479} {"train_loss": -5.307092155729022, "global_step": 20159, "epoch": 479, "val_loss": 67437.65625} {"train_loss": -5.167325496673584, "global_step": 20160, "epoch": 480} {"train_loss": -5.175357818603516, "global_step": 20161, "epoch": 480} {"train_loss": -5.319513320922852, "global_step": 20162, "epoch": 480} {"train_loss": -5.291492938995361, "global_step": 20163, "epoch": 480} {"train_loss": -5.378594875335693, "global_step": 20164, "epoch": 480} {"train_loss": -5.218692779541016, "global_step": 20165, "epoch": 480} {"train_loss": -5.280093669891357, "global_step": 20166, "epoch": 480} {"train_loss": -5.319750785827637, "global_step": 20167, "epoch": 480} {"train_loss": -5.185042381286621, "global_step": 20168, "epoch": 480} {"train_loss": -5.35839319229126, "global_step": 20169, "epoch": 480} {"train_loss": -5.330382347106934, "global_step": 20170, "epoch": 480} {"train_loss": -5.218024253845215, "global_step": 20171, "epoch": 480} {"train_loss": -5.361407279968262, "global_step": 20172, "epoch": 480} {"train_loss": -5.136141777038574, "global_step": 20173, "epoch": 480} {"train_loss": -5.1230926513671875, "global_step": 20174, "epoch": 480} {"train_loss": -5.3441314697265625, "global_step": 20175, "epoch": 480} {"train_loss": -5.276740074157715, "global_step": 20176, "epoch": 480} {"train_loss": -5.341703414916992, "global_step": 20177, "epoch": 480} {"train_loss": -5.210421085357666, "global_step": 20178, "epoch": 480} {"train_loss": -5.372549533843994, "global_step": 20179, "epoch": 480} {"train_loss": -5.366392612457275, "global_step": 20180, "epoch": 480} {"train_loss": -5.393472671508789, "global_step": 20181, "epoch": 480} {"train_loss": -5.297229766845703, "global_step": 20182, "epoch": 480} {"train_loss": -5.2005934715271, "global_step": 20183, "epoch": 480} {"train_loss": -5.254961967468262, "global_step": 20184, "epoch": 480} {"train_loss": -5.274723529815674, "global_step": 20185, "epoch": 480} {"train_loss": -5.293155670166016, "global_step": 20186, "epoch": 480} {"train_loss": -5.332211494445801, "global_step": 20187, "epoch": 480} {"train_loss": -5.270627498626709, "global_step": 20188, "epoch": 480} {"train_loss": -5.342930316925049, "global_step": 20189, "epoch": 480} {"train_loss": -5.417520046234131, "global_step": 20190, "epoch": 480} {"train_loss": -5.367830276489258, "global_step": 20191, "epoch": 480} {"train_loss": -5.413702011108398, "global_step": 20192, "epoch": 480} {"train_loss": -5.306670188903809, "global_step": 20193, "epoch": 480} {"train_loss": -5.40866231918335, "global_step": 20194, "epoch": 480} {"train_loss": -5.185183048248291, "global_step": 20195, "epoch": 480} {"train_loss": -5.238277435302734, "global_step": 20196, "epoch": 480} {"train_loss": -5.352762699127197, "global_step": 20197, "epoch": 480} {"train_loss": -5.296031475067139, "global_step": 20198, "epoch": 480} {"train_loss": -5.30444860458374, "global_step": 20199, "epoch": 480} {"train_loss": -5.210207939147949, "global_step": 20200, "epoch": 480} {"train_loss": -5.291547627676101, "global_step": 20201, "epoch": 480, "val_loss": 67546.609375} {"train_loss": -5.322904586791992, "global_step": 20202, "epoch": 481} {"train_loss": -5.363616943359375, "global_step": 20203, "epoch": 481} {"train_loss": -5.329303741455078, "global_step": 20204, "epoch": 481} {"train_loss": -5.10093879699707, "global_step": 20205, "epoch": 481} {"train_loss": -5.3484978675842285, "global_step": 20206, "epoch": 481} {"train_loss": -5.379823684692383, "global_step": 20207, "epoch": 481} {"train_loss": -5.353230953216553, "global_step": 20208, "epoch": 481} {"train_loss": -5.309929847717285, "global_step": 20209, "epoch": 481} {"train_loss": -5.35298490524292, "global_step": 20210, "epoch": 481} {"train_loss": -5.358973026275635, "global_step": 20211, "epoch": 481} {"train_loss": -5.220965385437012, "global_step": 20212, "epoch": 481} {"train_loss": -5.322977542877197, "global_step": 20213, "epoch": 481} {"train_loss": -5.280554294586182, "global_step": 20214, "epoch": 481} {"train_loss": -5.353004455566406, "global_step": 20215, "epoch": 481} {"train_loss": -5.460434913635254, "global_step": 20216, "epoch": 481} {"train_loss": -5.155764579772949, "global_step": 20217, "epoch": 481} {"train_loss": -5.322146415710449, "global_step": 20218, "epoch": 481} {"train_loss": -5.180802345275879, "global_step": 20219, "epoch": 481} {"train_loss": -5.377196311950684, "global_step": 20220, "epoch": 481} {"train_loss": -5.350763320922852, "global_step": 20221, "epoch": 481} {"train_loss": -5.326805114746094, "global_step": 20222, "epoch": 481} {"train_loss": -5.1585893630981445, "global_step": 20223, "epoch": 481} {"train_loss": -5.3705153465271, "global_step": 20224, "epoch": 481} {"train_loss": -5.304581642150879, "global_step": 20225, "epoch": 481} {"train_loss": -5.361788749694824, "global_step": 20226, "epoch": 481} {"train_loss": -5.335507392883301, "global_step": 20227, "epoch": 481} {"train_loss": -5.266320705413818, "global_step": 20228, "epoch": 481} {"train_loss": -5.368162155151367, "global_step": 20229, "epoch": 481} {"train_loss": -5.228856086730957, "global_step": 20230, "epoch": 481} {"train_loss": -5.296276569366455, "global_step": 20231, "epoch": 481} {"train_loss": -5.30591344833374, "global_step": 20232, "epoch": 481} {"train_loss": -5.277382850646973, "global_step": 20233, "epoch": 481} {"train_loss": -5.27011775970459, "global_step": 20234, "epoch": 481} {"train_loss": -5.291510581970215, "global_step": 20235, "epoch": 481} {"train_loss": -5.288445949554443, "global_step": 20236, "epoch": 481} {"train_loss": -5.347958564758301, "global_step": 20237, "epoch": 481} {"train_loss": -5.400933265686035, "global_step": 20238, "epoch": 481} {"train_loss": -5.14909553527832, "global_step": 20239, "epoch": 481} {"train_loss": -5.275415420532227, "global_step": 20240, "epoch": 481} {"train_loss": -5.303584098815918, "global_step": 20241, "epoch": 481} {"train_loss": -5.30924654006958, "global_step": 20242, "epoch": 481} {"train_loss": -5.308945599056425, "global_step": 20243, "epoch": 481, "val_loss": 67481.65625} {"train_loss": -5.233817100524902, "global_step": 20244, "epoch": 482} {"train_loss": -5.272865295410156, "global_step": 20245, "epoch": 482} {"train_loss": -5.302375793457031, "global_step": 20246, "epoch": 482} {"train_loss": -5.322622299194336, "global_step": 20247, "epoch": 482} {"train_loss": -5.302684307098389, "global_step": 20248, "epoch": 482} {"train_loss": -5.198207855224609, "global_step": 20249, "epoch": 482} {"train_loss": -5.327434539794922, "global_step": 20250, "epoch": 482} {"train_loss": -5.384753227233887, "global_step": 20251, "epoch": 482} {"train_loss": -5.099739074707031, "global_step": 20252, "epoch": 482} {"train_loss": -5.211916923522949, "global_step": 20253, "epoch": 482} {"train_loss": -5.227195739746094, "global_step": 20254, "epoch": 482} {"train_loss": -5.398486614227295, "global_step": 20255, "epoch": 482} {"train_loss": -5.4322099685668945, "global_step": 20256, "epoch": 482} {"train_loss": -5.269304275512695, "global_step": 20257, "epoch": 482} {"train_loss": -5.417103290557861, "global_step": 20258, "epoch": 482} {"train_loss": -5.247261047363281, "global_step": 20259, "epoch": 482} {"train_loss": -5.357960224151611, "global_step": 20260, "epoch": 482} {"train_loss": -5.333263397216797, "global_step": 20261, "epoch": 482} {"train_loss": -5.228200912475586, "global_step": 20262, "epoch": 482} {"train_loss": -5.226273536682129, "global_step": 20263, "epoch": 482} {"train_loss": -5.4000678062438965, "global_step": 20264, "epoch": 482} {"train_loss": -5.338543891906738, "global_step": 20265, "epoch": 482} {"train_loss": -5.125863075256348, "global_step": 20266, "epoch": 482} {"train_loss": -5.241117477416992, "global_step": 20267, "epoch": 482} {"train_loss": -5.179265022277832, "global_step": 20268, "epoch": 482} {"train_loss": -5.272498607635498, "global_step": 20269, "epoch": 482} {"train_loss": -5.350970268249512, "global_step": 20270, "epoch": 482} {"train_loss": -5.323321342468262, "global_step": 20271, "epoch": 482} {"train_loss": -5.291718482971191, "global_step": 20272, "epoch": 482} {"train_loss": -5.362981796264648, "global_step": 20273, "epoch": 482} {"train_loss": -5.310378074645996, "global_step": 20274, "epoch": 482} {"train_loss": -5.373282432556152, "global_step": 20275, "epoch": 482} {"train_loss": -5.346038818359375, "global_step": 20276, "epoch": 482} {"train_loss": -5.4002685546875, "global_step": 20277, "epoch": 482} {"train_loss": -5.3569231033325195, "global_step": 20278, "epoch": 482} {"train_loss": -5.239596366882324, "global_step": 20279, "epoch": 482} {"train_loss": -5.4650492668151855, "global_step": 20280, "epoch": 482} {"train_loss": -5.365143775939941, "global_step": 20281, "epoch": 482} {"train_loss": -5.272641181945801, "global_step": 20282, "epoch": 482} {"train_loss": -5.346565246582031, "global_step": 20283, "epoch": 482} {"train_loss": -5.348723411560059, "global_step": 20284, "epoch": 482} {"train_loss": -5.307535001209804, "global_step": 20285, "epoch": 482, "val_loss": 67506.8125} {"train_loss": -5.319982528686523, "global_step": 20286, "epoch": 483} {"train_loss": -5.245855808258057, "global_step": 20287, "epoch": 483} {"train_loss": -5.478201866149902, "global_step": 20288, "epoch": 483} {"train_loss": -5.4007039070129395, "global_step": 20289, "epoch": 483} {"train_loss": -5.408446311950684, "global_step": 20290, "epoch": 483} {"train_loss": -5.2127604484558105, "global_step": 20291, "epoch": 483} {"train_loss": -5.302513599395752, "global_step": 20292, "epoch": 483} {"train_loss": -5.2025346755981445, "global_step": 20293, "epoch": 483} {"train_loss": -5.392871379852295, "global_step": 20294, "epoch": 483} {"train_loss": -5.312580108642578, "global_step": 20295, "epoch": 483} {"train_loss": -5.216421127319336, "global_step": 20296, "epoch": 483} {"train_loss": -5.140069961547852, "global_step": 20297, "epoch": 483} {"train_loss": -5.270259380340576, "global_step": 20298, "epoch": 483} {"train_loss": -5.362724304199219, "global_step": 20299, "epoch": 483} {"train_loss": -5.1375274658203125, "global_step": 20300, "epoch": 483} {"train_loss": -5.192925930023193, "global_step": 20301, "epoch": 483} {"train_loss": -5.24739933013916, "global_step": 20302, "epoch": 483} {"train_loss": -5.33443546295166, "global_step": 20303, "epoch": 483} {"train_loss": -5.256260871887207, "global_step": 20304, "epoch": 483} {"train_loss": -5.333498954772949, "global_step": 20305, "epoch": 483} {"train_loss": -5.12807559967041, "global_step": 20306, "epoch": 483} {"train_loss": -5.3536529541015625, "global_step": 20307, "epoch": 483} {"train_loss": -5.349664211273193, "global_step": 20308, "epoch": 483} {"train_loss": -5.269025802612305, "global_step": 20309, "epoch": 483} {"train_loss": -5.322920799255371, "global_step": 20310, "epoch": 483} {"train_loss": -5.352599620819092, "global_step": 20311, "epoch": 483} {"train_loss": -5.3164777755737305, "global_step": 20312, "epoch": 483} {"train_loss": -5.275100231170654, "global_step": 20313, "epoch": 483} {"train_loss": -5.289207935333252, "global_step": 20314, "epoch": 483} {"train_loss": -5.325750827789307, "global_step": 20315, "epoch": 483} {"train_loss": -5.37223482131958, "global_step": 20316, "epoch": 483} {"train_loss": -5.3769755363464355, "global_step": 20317, "epoch": 483} {"train_loss": -5.369804382324219, "global_step": 20318, "epoch": 483} {"train_loss": -5.371657371520996, "global_step": 20319, "epoch": 483} {"train_loss": -5.311790466308594, "global_step": 20320, "epoch": 483} {"train_loss": -5.472069263458252, "global_step": 20321, "epoch": 483} {"train_loss": -5.1879658699035645, "global_step": 20322, "epoch": 483} {"train_loss": -5.336956024169922, "global_step": 20323, "epoch": 483} {"train_loss": -5.419318199157715, "global_step": 20324, "epoch": 483} {"train_loss": -5.160958290100098, "global_step": 20325, "epoch": 483} {"train_loss": -5.030387878417969, "global_step": 20326, "epoch": 483} {"train_loss": -5.2947202410016745, "global_step": 20327, "epoch": 483, "val_loss": 67336.46875} {"train_loss": -5.2116312980651855, "global_step": 20328, "epoch": 484} {"train_loss": -5.229144096374512, "global_step": 20329, "epoch": 484} {"train_loss": -5.208795547485352, "global_step": 20330, "epoch": 484} {"train_loss": -5.3971710205078125, "global_step": 20331, "epoch": 484} {"train_loss": -5.289618968963623, "global_step": 20332, "epoch": 484} {"train_loss": -5.324331283569336, "global_step": 20333, "epoch": 484} {"train_loss": -5.270967960357666, "global_step": 20334, "epoch": 484} {"train_loss": -5.310464859008789, "global_step": 20335, "epoch": 484} {"train_loss": -5.178118705749512, "global_step": 20336, "epoch": 484} {"train_loss": -5.211226940155029, "global_step": 20337, "epoch": 484} {"train_loss": -5.273496627807617, "global_step": 20338, "epoch": 484} {"train_loss": -5.193703651428223, "global_step": 20339, "epoch": 484} {"train_loss": -5.433907508850098, "global_step": 20340, "epoch": 484} {"train_loss": -5.356893062591553, "global_step": 20341, "epoch": 484} {"train_loss": -5.237099647521973, "global_step": 20342, "epoch": 484} {"train_loss": -5.283083438873291, "global_step": 20343, "epoch": 484} {"train_loss": -5.262271404266357, "global_step": 20344, "epoch": 484} {"train_loss": -5.284151077270508, "global_step": 20345, "epoch": 484} {"train_loss": -5.203108310699463, "global_step": 20346, "epoch": 484} {"train_loss": -5.2697529792785645, "global_step": 20347, "epoch": 484} {"train_loss": -5.356633186340332, "global_step": 20348, "epoch": 484} {"train_loss": -5.16461181640625, "global_step": 20349, "epoch": 484} {"train_loss": -5.231481552124023, "global_step": 20350, "epoch": 484} {"train_loss": -5.237821578979492, "global_step": 20351, "epoch": 484} {"train_loss": -5.290706157684326, "global_step": 20352, "epoch": 484} {"train_loss": -5.388628959655762, "global_step": 20353, "epoch": 484} {"train_loss": -5.3159661293029785, "global_step": 20354, "epoch": 484} {"train_loss": -5.281489849090576, "global_step": 20355, "epoch": 484} {"train_loss": -5.267333030700684, "global_step": 20356, "epoch": 484} {"train_loss": -5.265999794006348, "global_step": 20357, "epoch": 484} {"train_loss": -5.4168009757995605, "global_step": 20358, "epoch": 484} {"train_loss": -5.422450065612793, "global_step": 20359, "epoch": 484} {"train_loss": -5.2550458908081055, "global_step": 20360, "epoch": 484} {"train_loss": -5.338836669921875, "global_step": 20361, "epoch": 484} {"train_loss": -5.449182987213135, "global_step": 20362, "epoch": 484} {"train_loss": -5.376601219177246, "global_step": 20363, "epoch": 484} {"train_loss": -5.385885238647461, "global_step": 20364, "epoch": 484} {"train_loss": -5.263738632202148, "global_step": 20365, "epoch": 484} {"train_loss": -5.240733623504639, "global_step": 20366, "epoch": 484} {"train_loss": -5.350179672241211, "global_step": 20367, "epoch": 484} {"train_loss": -5.327267646789551, "global_step": 20368, "epoch": 484} {"train_loss": -5.295868839536395, "global_step": 20369, "epoch": 484, "val_loss": 67208.484375} {"train_loss": -5.263134002685547, "global_step": 20370, "epoch": 485} {"train_loss": -5.359050273895264, "global_step": 20371, "epoch": 485} {"train_loss": -5.341818332672119, "global_step": 20372, "epoch": 485} {"train_loss": -5.346055030822754, "global_step": 20373, "epoch": 485} {"train_loss": -5.345513343811035, "global_step": 20374, "epoch": 485} {"train_loss": -5.369053363800049, "global_step": 20375, "epoch": 485} {"train_loss": -5.365696907043457, "global_step": 20376, "epoch": 485} {"train_loss": -5.1837968826293945, "global_step": 20377, "epoch": 485} {"train_loss": -5.355032920837402, "global_step": 20378, "epoch": 485} {"train_loss": -5.273028373718262, "global_step": 20379, "epoch": 485} {"train_loss": -5.249362945556641, "global_step": 20380, "epoch": 485} {"train_loss": -5.224722385406494, "global_step": 20381, "epoch": 485} {"train_loss": -5.506956100463867, "global_step": 20382, "epoch": 485} {"train_loss": -5.220186710357666, "global_step": 20383, "epoch": 485} {"train_loss": -5.293262958526611, "global_step": 20384, "epoch": 485} {"train_loss": -5.199867248535156, "global_step": 20385, "epoch": 485} {"train_loss": -5.541730880737305, "global_step": 20386, "epoch": 485} {"train_loss": -5.363468170166016, "global_step": 20387, "epoch": 485} {"train_loss": -5.339352607727051, "global_step": 20388, "epoch": 485} {"train_loss": -5.294675827026367, "global_step": 20389, "epoch": 485} {"train_loss": -5.41252326965332, "global_step": 20390, "epoch": 485} {"train_loss": -5.4398651123046875, "global_step": 20391, "epoch": 485} {"train_loss": -5.459606647491455, "global_step": 20392, "epoch": 485} {"train_loss": -5.285648822784424, "global_step": 20393, "epoch": 485} {"train_loss": -5.2782392501831055, "global_step": 20394, "epoch": 485} {"train_loss": -5.337952613830566, "global_step": 20395, "epoch": 485} {"train_loss": -5.183732986450195, "global_step": 20396, "epoch": 485} {"train_loss": -5.332427978515625, "global_step": 20397, "epoch": 485} {"train_loss": -5.221675395965576, "global_step": 20398, "epoch": 485} {"train_loss": -5.2709059715271, "global_step": 20399, "epoch": 485} {"train_loss": -5.337518692016602, "global_step": 20400, "epoch": 485} {"train_loss": -5.290535926818848, "global_step": 20401, "epoch": 485} {"train_loss": -5.421847820281982, "global_step": 20402, "epoch": 485} {"train_loss": -5.267696380615234, "global_step": 20403, "epoch": 485} {"train_loss": -5.324585437774658, "global_step": 20404, "epoch": 485} {"train_loss": -5.31046724319458, "global_step": 20405, "epoch": 485} {"train_loss": -5.261944770812988, "global_step": 20406, "epoch": 485} {"train_loss": -5.316069602966309, "global_step": 20407, "epoch": 485} {"train_loss": -5.296656608581543, "global_step": 20408, "epoch": 485} {"train_loss": -5.268415451049805, "global_step": 20409, "epoch": 485} {"train_loss": -5.325372695922852, "global_step": 20410, "epoch": 485} {"train_loss": -5.319264230274019, "global_step": 20411, "epoch": 485, "val_loss": 67127.9453125} {"train_loss": -5.309761047363281, "global_step": 20412, "epoch": 486} {"train_loss": -5.461299419403076, "global_step": 20413, "epoch": 486} {"train_loss": -5.245328426361084, "global_step": 20414, "epoch": 486} {"train_loss": -5.204428672790527, "global_step": 20415, "epoch": 486} {"train_loss": -5.30572509765625, "global_step": 20416, "epoch": 486} {"train_loss": -5.383203506469727, "global_step": 20417, "epoch": 486} {"train_loss": -5.203283786773682, "global_step": 20418, "epoch": 486} {"train_loss": -5.295134544372559, "global_step": 20419, "epoch": 486} {"train_loss": -5.220534324645996, "global_step": 20420, "epoch": 486} {"train_loss": -5.281452178955078, "global_step": 20421, "epoch": 486} {"train_loss": -5.337052822113037, "global_step": 20422, "epoch": 486} {"train_loss": -5.167019367218018, "global_step": 20423, "epoch": 486} {"train_loss": -5.2567243576049805, "global_step": 20424, "epoch": 486} {"train_loss": -5.267566680908203, "global_step": 20425, "epoch": 486} {"train_loss": -5.3456902503967285, "global_step": 20426, "epoch": 486} {"train_loss": -5.360770225524902, "global_step": 20427, "epoch": 486} {"train_loss": -5.332104682922363, "global_step": 20428, "epoch": 486} {"train_loss": -5.25259256362915, "global_step": 20429, "epoch": 486} {"train_loss": -5.2739996910095215, "global_step": 20430, "epoch": 486} {"train_loss": -5.372715473175049, "global_step": 20431, "epoch": 486} {"train_loss": -5.212651252746582, "global_step": 20432, "epoch": 486} {"train_loss": -5.260720729827881, "global_step": 20433, "epoch": 486} {"train_loss": -5.333787441253662, "global_step": 20434, "epoch": 486} {"train_loss": -5.305359840393066, "global_step": 20435, "epoch": 486} {"train_loss": -5.292126178741455, "global_step": 20436, "epoch": 486} {"train_loss": -5.294149398803711, "global_step": 20437, "epoch": 486} {"train_loss": -5.147719860076904, "global_step": 20438, "epoch": 486} {"train_loss": -5.221531391143799, "global_step": 20439, "epoch": 486} {"train_loss": -5.276722431182861, "global_step": 20440, "epoch": 486} {"train_loss": -5.236628532409668, "global_step": 20441, "epoch": 486} {"train_loss": -5.182550430297852, "global_step": 20442, "epoch": 486} {"train_loss": -5.443347930908203, "global_step": 20443, "epoch": 486} {"train_loss": -5.272402286529541, "global_step": 20444, "epoch": 486} {"train_loss": -5.205937385559082, "global_step": 20445, "epoch": 486} {"train_loss": -5.334075927734375, "global_step": 20446, "epoch": 486} {"train_loss": -5.174769401550293, "global_step": 20447, "epoch": 486} {"train_loss": -5.1694135665893555, "global_step": 20448, "epoch": 486} {"train_loss": -5.260984420776367, "global_step": 20449, "epoch": 486} {"train_loss": -5.209203243255615, "global_step": 20450, "epoch": 486} {"train_loss": -5.209922790527344, "global_step": 20451, "epoch": 486} {"train_loss": -5.351208686828613, "global_step": 20452, "epoch": 486} {"train_loss": -5.275401263009934, "global_step": 20453, "epoch": 486, "val_loss": 67134.4453125} {"train_loss": -5.305506706237793, "global_step": 20454, "epoch": 487} {"train_loss": -5.283418655395508, "global_step": 20455, "epoch": 487} {"train_loss": -5.209565162658691, "global_step": 20456, "epoch": 487} {"train_loss": -5.315552711486816, "global_step": 20457, "epoch": 487} {"train_loss": -5.387531280517578, "global_step": 20458, "epoch": 487} {"train_loss": -5.317661285400391, "global_step": 20459, "epoch": 487} {"train_loss": -5.373377323150635, "global_step": 20460, "epoch": 487} {"train_loss": -5.274285793304443, "global_step": 20461, "epoch": 487} {"train_loss": -5.549540042877197, "global_step": 20462, "epoch": 487} {"train_loss": -5.300281047821045, "global_step": 20463, "epoch": 487} {"train_loss": -5.24757194519043, "global_step": 20464, "epoch": 487} {"train_loss": -5.311008453369141, "global_step": 20465, "epoch": 487} {"train_loss": -5.353125095367432, "global_step": 20466, "epoch": 487} {"train_loss": -5.3213090896606445, "global_step": 20467, "epoch": 487} {"train_loss": -5.370578765869141, "global_step": 20468, "epoch": 487} {"train_loss": -5.348909378051758, "global_step": 20469, "epoch": 487} {"train_loss": -5.225734233856201, "global_step": 20470, "epoch": 487} {"train_loss": -5.2525200843811035, "global_step": 20471, "epoch": 487} {"train_loss": -5.210209846496582, "global_step": 20472, "epoch": 487} {"train_loss": -5.2431640625, "global_step": 20473, "epoch": 487} {"train_loss": -5.2905378341674805, "global_step": 20474, "epoch": 487} {"train_loss": -5.263133525848389, "global_step": 20475, "epoch": 487} {"train_loss": -5.211545944213867, "global_step": 20476, "epoch": 487} {"train_loss": -5.321948528289795, "global_step": 20477, "epoch": 487} {"train_loss": -5.475386142730713, "global_step": 20478, "epoch": 487} {"train_loss": -5.3731842041015625, "global_step": 20479, "epoch": 487} {"train_loss": -5.333194732666016, "global_step": 20480, "epoch": 487} {"train_loss": -5.455948829650879, "global_step": 20481, "epoch": 487} {"train_loss": -5.2698822021484375, "global_step": 20482, "epoch": 487} {"train_loss": -5.312685966491699, "global_step": 20483, "epoch": 487} {"train_loss": -5.362519264221191, "global_step": 20484, "epoch": 487} {"train_loss": -5.285259246826172, "global_step": 20485, "epoch": 487} {"train_loss": -5.269600868225098, "global_step": 20486, "epoch": 487} {"train_loss": -5.254776477813721, "global_step": 20487, "epoch": 487} {"train_loss": -5.390092849731445, "global_step": 20488, "epoch": 487} {"train_loss": -5.297465801239014, "global_step": 20489, "epoch": 487} {"train_loss": -5.226574897766113, "global_step": 20490, "epoch": 487} {"train_loss": -5.301093101501465, "global_step": 20491, "epoch": 487} {"train_loss": -5.312969207763672, "global_step": 20492, "epoch": 487} {"train_loss": -5.192468166351318, "global_step": 20493, "epoch": 487} {"train_loss": -5.140806674957275, "global_step": 20494, "epoch": 487} {"train_loss": -5.30664815221514, "global_step": 20495, "epoch": 487, "val_loss": 67108.03125} {"train_loss": -5.234148025512695, "global_step": 20496, "epoch": 488} {"train_loss": -5.2544145584106445, "global_step": 20497, "epoch": 488} {"train_loss": -5.216666221618652, "global_step": 20498, "epoch": 488} {"train_loss": -5.27487850189209, "global_step": 20499, "epoch": 488} {"train_loss": -5.156478404998779, "global_step": 20500, "epoch": 488} {"train_loss": -5.402667999267578, "global_step": 20501, "epoch": 488} {"train_loss": -5.295888900756836, "global_step": 20502, "epoch": 488} {"train_loss": -5.304990291595459, "global_step": 20503, "epoch": 488} {"train_loss": -5.1728315353393555, "global_step": 20504, "epoch": 488} {"train_loss": -5.429446220397949, "global_step": 20505, "epoch": 488} {"train_loss": -5.223873615264893, "global_step": 20506, "epoch": 488} {"train_loss": -5.182910919189453, "global_step": 20507, "epoch": 488} {"train_loss": -5.4019269943237305, "global_step": 20508, "epoch": 488} {"train_loss": -5.094337463378906, "global_step": 20509, "epoch": 488} {"train_loss": -5.31800651550293, "global_step": 20510, "epoch": 488} {"train_loss": -5.278100490570068, "global_step": 20511, "epoch": 488} {"train_loss": -5.376483917236328, "global_step": 20512, "epoch": 488} {"train_loss": -5.140105724334717, "global_step": 20513, "epoch": 488} {"train_loss": -5.331700801849365, "global_step": 20514, "epoch": 488} {"train_loss": -5.284464359283447, "global_step": 20515, "epoch": 488} {"train_loss": -5.245073318481445, "global_step": 20516, "epoch": 488} {"train_loss": -5.288582801818848, "global_step": 20517, "epoch": 488} {"train_loss": -5.383779048919678, "global_step": 20518, "epoch": 488} {"train_loss": -5.320188522338867, "global_step": 20519, "epoch": 488} {"train_loss": -5.227516174316406, "global_step": 20520, "epoch": 488} {"train_loss": -5.335697174072266, "global_step": 20521, "epoch": 488} {"train_loss": -5.272418022155762, "global_step": 20522, "epoch": 488} {"train_loss": -5.191798210144043, "global_step": 20523, "epoch": 488} {"train_loss": -5.301713466644287, "global_step": 20524, "epoch": 488} {"train_loss": -5.266170024871826, "global_step": 20525, "epoch": 488} {"train_loss": -5.2181549072265625, "global_step": 20526, "epoch": 488} {"train_loss": -5.314803123474121, "global_step": 20527, "epoch": 488} {"train_loss": -5.311502456665039, "global_step": 20528, "epoch": 488} {"train_loss": -5.44690465927124, "global_step": 20529, "epoch": 488} {"train_loss": -5.244163513183594, "global_step": 20530, "epoch": 488} {"train_loss": -5.332934379577637, "global_step": 20531, "epoch": 488} {"train_loss": -5.252566337585449, "global_step": 20532, "epoch": 488} {"train_loss": -5.26456356048584, "global_step": 20533, "epoch": 488} {"train_loss": -5.377538204193115, "global_step": 20534, "epoch": 488} {"train_loss": -5.2979631423950195, "global_step": 20535, "epoch": 488} {"train_loss": -5.321501731872559, "global_step": 20536, "epoch": 488} {"train_loss": -5.2817447412581675, "global_step": 20537, "epoch": 488, "val_loss": 67128.234375} {"train_loss": -5.387473106384277, "global_step": 20538, "epoch": 489} {"train_loss": -5.363128662109375, "global_step": 20539, "epoch": 489} {"train_loss": -5.404311180114746, "global_step": 20540, "epoch": 489} {"train_loss": -5.353339672088623, "global_step": 20541, "epoch": 489} {"train_loss": -5.300694465637207, "global_step": 20542, "epoch": 489} {"train_loss": -5.295642852783203, "global_step": 20543, "epoch": 489} {"train_loss": -5.2010297775268555, "global_step": 20544, "epoch": 489} {"train_loss": -5.23447322845459, "global_step": 20545, "epoch": 489} {"train_loss": -5.328907012939453, "global_step": 20546, "epoch": 489} {"train_loss": -5.358205795288086, "global_step": 20547, "epoch": 489} {"train_loss": -5.063695907592773, "global_step": 20548, "epoch": 489} {"train_loss": -5.252562522888184, "global_step": 20549, "epoch": 489} {"train_loss": -5.443708419799805, "global_step": 20550, "epoch": 489} {"train_loss": -5.23367977142334, "global_step": 20551, "epoch": 489} {"train_loss": -5.1743550300598145, "global_step": 20552, "epoch": 489} {"train_loss": -5.3711628913879395, "global_step": 20553, "epoch": 489} {"train_loss": -5.207357406616211, "global_step": 20554, "epoch": 489} {"train_loss": -5.168320655822754, "global_step": 20555, "epoch": 489} {"train_loss": -5.241184711456299, "global_step": 20556, "epoch": 489} {"train_loss": -5.23923397064209, "global_step": 20557, "epoch": 489} {"train_loss": -5.2232208251953125, "global_step": 20558, "epoch": 489} {"train_loss": -5.11348819732666, "global_step": 20559, "epoch": 489} {"train_loss": -5.231474876403809, "global_step": 20560, "epoch": 489} {"train_loss": -5.18474006652832, "global_step": 20561, "epoch": 489} {"train_loss": -5.234807968139648, "global_step": 20562, "epoch": 489} {"train_loss": -5.233705997467041, "global_step": 20563, "epoch": 489} {"train_loss": -5.23879337310791, "global_step": 20564, "epoch": 489} {"train_loss": -5.060851097106934, "global_step": 20565, "epoch": 489} {"train_loss": -5.421142101287842, "global_step": 20566, "epoch": 489} {"train_loss": -5.211026191711426, "global_step": 20567, "epoch": 489} {"train_loss": -5.330607891082764, "global_step": 20568, "epoch": 489} {"train_loss": -5.389575004577637, "global_step": 20569, "epoch": 489} {"train_loss": -5.292881488800049, "global_step": 20570, "epoch": 489} {"train_loss": -5.205709457397461, "global_step": 20571, "epoch": 489} {"train_loss": -5.318330764770508, "global_step": 20572, "epoch": 489} {"train_loss": -5.324568748474121, "global_step": 20573, "epoch": 489} {"train_loss": -5.319153785705566, "global_step": 20574, "epoch": 489} {"train_loss": -5.316554069519043, "global_step": 20575, "epoch": 489} {"train_loss": -5.327110290527344, "global_step": 20576, "epoch": 489} {"train_loss": -5.450459003448486, "global_step": 20577, "epoch": 489} {"train_loss": -5.271378517150879, "global_step": 20578, "epoch": 489} {"train_loss": -5.276650110880534, "global_step": 20579, "epoch": 489, "val_loss": 67685.0078125} {"train_loss": -5.409008979797363, "global_step": 20580, "epoch": 490} {"train_loss": -5.384307384490967, "global_step": 20581, "epoch": 490} {"train_loss": -5.308392524719238, "global_step": 20582, "epoch": 490} {"train_loss": -5.408286094665527, "global_step": 20583, "epoch": 490} {"train_loss": -5.038389205932617, "global_step": 20584, "epoch": 490} {"train_loss": -5.194528579711914, "global_step": 20585, "epoch": 490} {"train_loss": -5.290767669677734, "global_step": 20586, "epoch": 490} {"train_loss": -5.335289001464844, "global_step": 20587, "epoch": 490} {"train_loss": -5.26816463470459, "global_step": 20588, "epoch": 490} {"train_loss": -5.3642897605896, "global_step": 20589, "epoch": 490} {"train_loss": -5.395942687988281, "global_step": 20590, "epoch": 490} {"train_loss": -5.365448474884033, "global_step": 20591, "epoch": 490} {"train_loss": -5.417200088500977, "global_step": 20592, "epoch": 490} {"train_loss": -5.406778812408447, "global_step": 20593, "epoch": 490} {"train_loss": -5.30683708190918, "global_step": 20594, "epoch": 490} {"train_loss": -5.374011993408203, "global_step": 20595, "epoch": 490} {"train_loss": -5.332675933837891, "global_step": 20596, "epoch": 490} {"train_loss": -5.353682041168213, "global_step": 20597, "epoch": 490} {"train_loss": -5.25190544128418, "global_step": 20598, "epoch": 490} {"train_loss": -5.263955116271973, "global_step": 20599, "epoch": 490} {"train_loss": -5.302319049835205, "global_step": 20600, "epoch": 490} {"train_loss": -5.217561721801758, "global_step": 20601, "epoch": 490} {"train_loss": -5.261198997497559, "global_step": 20602, "epoch": 490} {"train_loss": -5.281299591064453, "global_step": 20603, "epoch": 490} {"train_loss": -5.3441901206970215, "global_step": 20604, "epoch": 490} {"train_loss": -5.364737510681152, "global_step": 20605, "epoch": 490} {"train_loss": -5.240604877471924, "global_step": 20606, "epoch": 490} {"train_loss": -5.400173187255859, "global_step": 20607, "epoch": 490} {"train_loss": -5.3533935546875, "global_step": 20608, "epoch": 490} {"train_loss": -5.250646591186523, "global_step": 20609, "epoch": 490} {"train_loss": -5.191823959350586, "global_step": 20610, "epoch": 490} {"train_loss": -5.134681224822998, "global_step": 20611, "epoch": 490} {"train_loss": -5.411331653594971, "global_step": 20612, "epoch": 490} {"train_loss": -5.323188304901123, "global_step": 20613, "epoch": 490} {"train_loss": -5.31203556060791, "global_step": 20614, "epoch": 490} {"train_loss": -5.36170768737793, "global_step": 20615, "epoch": 490} {"train_loss": -5.1772356033325195, "global_step": 20616, "epoch": 490} {"train_loss": -5.296032905578613, "global_step": 20617, "epoch": 490} {"train_loss": -5.281145095825195, "global_step": 20618, "epoch": 490} {"train_loss": -5.311306953430176, "global_step": 20619, "epoch": 490} {"train_loss": -5.340939998626709, "global_step": 20620, "epoch": 490} {"train_loss": -5.306848105930147, "global_step": 20621, "epoch": 490, "val_loss": 67103.9609375} {"train_loss": -5.369053840637207, "global_step": 20622, "epoch": 491} {"train_loss": -5.3298444747924805, "global_step": 20623, "epoch": 491} {"train_loss": -5.29447078704834, "global_step": 20624, "epoch": 491} {"train_loss": -5.364414215087891, "global_step": 20625, "epoch": 491} {"train_loss": -5.204023838043213, "global_step": 20626, "epoch": 491} {"train_loss": -5.274456024169922, "global_step": 20627, "epoch": 491} {"train_loss": -5.4021196365356445, "global_step": 20628, "epoch": 491} {"train_loss": -5.220839023590088, "global_step": 20629, "epoch": 491} {"train_loss": -5.217845916748047, "global_step": 20630, "epoch": 491} {"train_loss": -5.442564487457275, "global_step": 20631, "epoch": 491} {"train_loss": -5.345514297485352, "global_step": 20632, "epoch": 491} {"train_loss": -5.323548316955566, "global_step": 20633, "epoch": 491} {"train_loss": -5.2274298667907715, "global_step": 20634, "epoch": 491} {"train_loss": -5.222182273864746, "global_step": 20635, "epoch": 491} {"train_loss": -5.182159423828125, "global_step": 20636, "epoch": 491} {"train_loss": -5.175653457641602, "global_step": 20637, "epoch": 491} {"train_loss": -5.310230255126953, "global_step": 20638, "epoch": 491} {"train_loss": -5.287940502166748, "global_step": 20639, "epoch": 491} {"train_loss": -5.390041351318359, "global_step": 20640, "epoch": 491} {"train_loss": -5.250587463378906, "global_step": 20641, "epoch": 491} {"train_loss": -5.154111862182617, "global_step": 20642, "epoch": 491} {"train_loss": -5.266763687133789, "global_step": 20643, "epoch": 491} {"train_loss": -5.342333793640137, "global_step": 20644, "epoch": 491} {"train_loss": -5.3306803703308105, "global_step": 20645, "epoch": 491} {"train_loss": -5.323487281799316, "global_step": 20646, "epoch": 491} {"train_loss": -5.248008728027344, "global_step": 20647, "epoch": 491} {"train_loss": -5.2712082862854, "global_step": 20648, "epoch": 491} {"train_loss": -5.250552177429199, "global_step": 20649, "epoch": 491} {"train_loss": -5.097533226013184, "global_step": 20650, "epoch": 491} {"train_loss": -5.261160850524902, "global_step": 20651, "epoch": 491} {"train_loss": -5.244067192077637, "global_step": 20652, "epoch": 491} {"train_loss": -5.228517055511475, "global_step": 20653, "epoch": 491} {"train_loss": -5.16804313659668, "global_step": 20654, "epoch": 491} {"train_loss": -5.203995704650879, "global_step": 20655, "epoch": 491} {"train_loss": -5.249544143676758, "global_step": 20656, "epoch": 491} {"train_loss": -5.183832168579102, "global_step": 20657, "epoch": 491} {"train_loss": -5.362448692321777, "global_step": 20658, "epoch": 491} {"train_loss": -5.382320404052734, "global_step": 20659, "epoch": 491} {"train_loss": -5.23975133895874, "global_step": 20660, "epoch": 491} {"train_loss": -5.388209342956543, "global_step": 20661, "epoch": 491} {"train_loss": -5.272439956665039, "global_step": 20662, "epoch": 491} {"train_loss": -5.2768074217296785, "global_step": 20663, "epoch": 491, "val_loss": 67367.234375} {"train_loss": -5.4083170890808105, "global_step": 20664, "epoch": 492} {"train_loss": -5.1749186515808105, "global_step": 20665, "epoch": 492} {"train_loss": -5.382063865661621, "global_step": 20666, "epoch": 492} {"train_loss": -5.30488395690918, "global_step": 20667, "epoch": 492} {"train_loss": -5.278109550476074, "global_step": 20668, "epoch": 492} {"train_loss": -5.380399703979492, "global_step": 20669, "epoch": 492} {"train_loss": -5.292392730712891, "global_step": 20670, "epoch": 492} {"train_loss": -5.151267051696777, "global_step": 20671, "epoch": 492} {"train_loss": -5.254804611206055, "global_step": 20672, "epoch": 492} {"train_loss": -5.263116836547852, "global_step": 20673, "epoch": 492} {"train_loss": -5.136021614074707, "global_step": 20674, "epoch": 492} {"train_loss": -5.348087310791016, "global_step": 20675, "epoch": 492} {"train_loss": -5.151302337646484, "global_step": 20676, "epoch": 492} {"train_loss": -4.988497734069824, "global_step": 20677, "epoch": 492} {"train_loss": -5.418824672698975, "global_step": 20678, "epoch": 492} {"train_loss": -5.1970319747924805, "global_step": 20679, "epoch": 492} {"train_loss": -5.311745643615723, "global_step": 20680, "epoch": 492} {"train_loss": -5.3028082847595215, "global_step": 20681, "epoch": 492} {"train_loss": -5.253795623779297, "global_step": 20682, "epoch": 492} {"train_loss": -5.301361083984375, "global_step": 20683, "epoch": 492} {"train_loss": -5.229828834533691, "global_step": 20684, "epoch": 492} {"train_loss": -5.313439846038818, "global_step": 20685, "epoch": 492} {"train_loss": -5.174422264099121, "global_step": 20686, "epoch": 492} {"train_loss": -5.292597770690918, "global_step": 20687, "epoch": 492} {"train_loss": -5.297117233276367, "global_step": 20688, "epoch": 492} {"train_loss": -5.257609844207764, "global_step": 20689, "epoch": 492} {"train_loss": -5.280473232269287, "global_step": 20690, "epoch": 492} {"train_loss": -5.318034648895264, "global_step": 20691, "epoch": 492} {"train_loss": -5.322597503662109, "global_step": 20692, "epoch": 492} {"train_loss": -5.324708938598633, "global_step": 20693, "epoch": 492} {"train_loss": -5.276881694793701, "global_step": 20694, "epoch": 492} {"train_loss": -5.228093147277832, "global_step": 20695, "epoch": 492} {"train_loss": -5.296065330505371, "global_step": 20696, "epoch": 492} {"train_loss": -5.065321922302246, "global_step": 20697, "epoch": 492} {"train_loss": -5.234624862670898, "global_step": 20698, "epoch": 492} {"train_loss": -5.386366844177246, "global_step": 20699, "epoch": 492} {"train_loss": -5.2336201667785645, "global_step": 20700, "epoch": 492} {"train_loss": -5.156981468200684, "global_step": 20701, "epoch": 492} {"train_loss": -5.2965087890625, "global_step": 20702, "epoch": 492} {"train_loss": -5.221116542816162, "global_step": 20703, "epoch": 492} {"train_loss": -5.291121482849121, "global_step": 20704, "epoch": 492} {"train_loss": -5.265545879091535, "global_step": 20705, "epoch": 492, "val_loss": 67101.0546875} {"train_loss": -5.173311233520508, "global_step": 20706, "epoch": 493} {"train_loss": -5.175654411315918, "global_step": 20707, "epoch": 493} {"train_loss": -5.227581977844238, "global_step": 20708, "epoch": 493} {"train_loss": -5.394146919250488, "global_step": 20709, "epoch": 493} {"train_loss": -5.366547584533691, "global_step": 20710, "epoch": 493} {"train_loss": -5.387778282165527, "global_step": 20711, "epoch": 493} {"train_loss": -5.414723873138428, "global_step": 20712, "epoch": 493} {"train_loss": -5.407049179077148, "global_step": 20713, "epoch": 493} {"train_loss": -5.393913269042969, "global_step": 20714, "epoch": 493} {"train_loss": -5.354829788208008, "global_step": 20715, "epoch": 493} {"train_loss": -5.35115909576416, "global_step": 20716, "epoch": 493} {"train_loss": -5.305088043212891, "global_step": 20717, "epoch": 493} {"train_loss": -5.3108229637146, "global_step": 20718, "epoch": 493} {"train_loss": -5.399677276611328, "global_step": 20719, "epoch": 493} {"train_loss": -5.221615314483643, "global_step": 20720, "epoch": 493} {"train_loss": -5.303004264831543, "global_step": 20721, "epoch": 493} {"train_loss": -5.356283187866211, "global_step": 20722, "epoch": 493} {"train_loss": -5.2863569259643555, "global_step": 20723, "epoch": 493} {"train_loss": -5.24083137512207, "global_step": 20724, "epoch": 493} {"train_loss": -5.391792297363281, "global_step": 20725, "epoch": 493} {"train_loss": -5.331547737121582, "global_step": 20726, "epoch": 493} {"train_loss": -5.47653341293335, "global_step": 20727, "epoch": 493} {"train_loss": -5.5133819580078125, "global_step": 20728, "epoch": 493} {"train_loss": -5.290818691253662, "global_step": 20729, "epoch": 493} {"train_loss": -5.160670280456543, "global_step": 20730, "epoch": 493} {"train_loss": -5.278380870819092, "global_step": 20731, "epoch": 493} {"train_loss": -5.316074371337891, "global_step": 20732, "epoch": 493} {"train_loss": -5.2425031661987305, "global_step": 20733, "epoch": 493} {"train_loss": -5.3430070877075195, "global_step": 20734, "epoch": 493} {"train_loss": -5.183382034301758, "global_step": 20735, "epoch": 493} {"train_loss": -5.1890740394592285, "global_step": 20736, "epoch": 493} {"train_loss": -5.369341850280762, "global_step": 20737, "epoch": 493} {"train_loss": -5.128108978271484, "global_step": 20738, "epoch": 493} {"train_loss": -5.275141716003418, "global_step": 20739, "epoch": 493} {"train_loss": -5.406679153442383, "global_step": 20740, "epoch": 493} {"train_loss": -5.378111362457275, "global_step": 20741, "epoch": 493} {"train_loss": -5.345941543579102, "global_step": 20742, "epoch": 493} {"train_loss": -5.42584228515625, "global_step": 20743, "epoch": 493} {"train_loss": -5.272363662719727, "global_step": 20744, "epoch": 493} {"train_loss": -5.251741409301758, "global_step": 20745, "epoch": 493} {"train_loss": -5.312451362609863, "global_step": 20746, "epoch": 493} {"train_loss": -5.313213053203764, "global_step": 20747, "epoch": 493, "val_loss": 67225.125} {"train_loss": -5.366072654724121, "global_step": 20748, "epoch": 494} {"train_loss": -5.339053153991699, "global_step": 20749, "epoch": 494} {"train_loss": -5.459164142608643, "global_step": 20750, "epoch": 494} {"train_loss": -5.279609680175781, "global_step": 20751, "epoch": 494} {"train_loss": -5.285780429840088, "global_step": 20752, "epoch": 494} {"train_loss": -5.354846954345703, "global_step": 20753, "epoch": 494} {"train_loss": -5.239313125610352, "global_step": 20754, "epoch": 494} {"train_loss": -5.277397632598877, "global_step": 20755, "epoch": 494} {"train_loss": -5.367800235748291, "global_step": 20756, "epoch": 494} {"train_loss": -5.382752418518066, "global_step": 20757, "epoch": 494} {"train_loss": -5.268820762634277, "global_step": 20758, "epoch": 494} {"train_loss": -5.323838710784912, "global_step": 20759, "epoch": 494} {"train_loss": -5.234077453613281, "global_step": 20760, "epoch": 494} {"train_loss": -5.324527740478516, "global_step": 20761, "epoch": 494} {"train_loss": -5.270739555358887, "global_step": 20762, "epoch": 494} {"train_loss": -5.338669776916504, "global_step": 20763, "epoch": 494} {"train_loss": -5.302415370941162, "global_step": 20764, "epoch": 494} {"train_loss": -5.190186023712158, "global_step": 20765, "epoch": 494} {"train_loss": -5.3634819984436035, "global_step": 20766, "epoch": 494} {"train_loss": -5.186427116394043, "global_step": 20767, "epoch": 494} {"train_loss": -5.307819843292236, "global_step": 20768, "epoch": 494} {"train_loss": -5.434333801269531, "global_step": 20769, "epoch": 494} {"train_loss": -5.294528007507324, "global_step": 20770, "epoch": 494} {"train_loss": -5.333340644836426, "global_step": 20771, "epoch": 494} {"train_loss": -5.273870468139648, "global_step": 20772, "epoch": 494} {"train_loss": -5.275632858276367, "global_step": 20773, "epoch": 494} {"train_loss": -5.26439094543457, "global_step": 20774, "epoch": 494} {"train_loss": -5.378058910369873, "global_step": 20775, "epoch": 494} {"train_loss": -5.300410270690918, "global_step": 20776, "epoch": 494} {"train_loss": -5.457887172698975, "global_step": 20777, "epoch": 494} {"train_loss": -5.179818153381348, "global_step": 20778, "epoch": 494} {"train_loss": -5.214478492736816, "global_step": 20779, "epoch": 494} {"train_loss": -5.5212883949279785, "global_step": 20780, "epoch": 494} {"train_loss": -5.286007404327393, "global_step": 20781, "epoch": 494} {"train_loss": -5.218462944030762, "global_step": 20782, "epoch": 494} {"train_loss": -5.359694004058838, "global_step": 20783, "epoch": 494} {"train_loss": -5.353679656982422, "global_step": 20784, "epoch": 494} {"train_loss": -5.244426727294922, "global_step": 20785, "epoch": 494} {"train_loss": -5.215179443359375, "global_step": 20786, "epoch": 494} {"train_loss": -5.085672378540039, "global_step": 20787, "epoch": 494} {"train_loss": -5.31434440612793, "global_step": 20788, "epoch": 494} {"train_loss": -5.300574030194964, "global_step": 20789, "epoch": 494, "val_loss": 67895.171875} {"train_loss": -5.249788284301758, "global_step": 20790, "epoch": 495} {"train_loss": -5.369187355041504, "global_step": 20791, "epoch": 495} {"train_loss": -5.237833023071289, "global_step": 20792, "epoch": 495} {"train_loss": -5.342873573303223, "global_step": 20793, "epoch": 495} {"train_loss": -5.185556888580322, "global_step": 20794, "epoch": 495} {"train_loss": -5.32696533203125, "global_step": 20795, "epoch": 495} {"train_loss": -5.293199062347412, "global_step": 20796, "epoch": 495} {"train_loss": -5.090608596801758, "global_step": 20797, "epoch": 495} {"train_loss": -5.4628729820251465, "global_step": 20798, "epoch": 495} {"train_loss": -5.358642578125, "global_step": 20799, "epoch": 495} {"train_loss": -5.2455549240112305, "global_step": 20800, "epoch": 495} {"train_loss": -5.261362075805664, "global_step": 20801, "epoch": 495} {"train_loss": -5.208596229553223, "global_step": 20802, "epoch": 495} {"train_loss": -5.366499900817871, "global_step": 20803, "epoch": 495} {"train_loss": -5.357476711273193, "global_step": 20804, "epoch": 495} {"train_loss": -5.309456825256348, "global_step": 20805, "epoch": 495} {"train_loss": -5.352912902832031, "global_step": 20806, "epoch": 495} {"train_loss": -5.3108720779418945, "global_step": 20807, "epoch": 495} {"train_loss": -5.14907169342041, "global_step": 20808, "epoch": 495} {"train_loss": -5.382499694824219, "global_step": 20809, "epoch": 495} {"train_loss": -5.201193809509277, "global_step": 20810, "epoch": 495} {"train_loss": -5.418854713439941, "global_step": 20811, "epoch": 495} {"train_loss": -5.30533504486084, "global_step": 20812, "epoch": 495} {"train_loss": -5.442147731781006, "global_step": 20813, "epoch": 495} {"train_loss": -5.1411452293396, "global_step": 20814, "epoch": 495} {"train_loss": -5.295638084411621, "global_step": 20815, "epoch": 495} {"train_loss": -5.370552062988281, "global_step": 20816, "epoch": 495} {"train_loss": -5.077805519104004, "global_step": 20817, "epoch": 495} {"train_loss": -5.293776035308838, "global_step": 20818, "epoch": 495} {"train_loss": -5.338081359863281, "global_step": 20819, "epoch": 495} {"train_loss": -5.2114715576171875, "global_step": 20820, "epoch": 495} {"train_loss": -5.39207124710083, "global_step": 20821, "epoch": 495} {"train_loss": -5.249939918518066, "global_step": 20822, "epoch": 495} {"train_loss": -5.318064212799072, "global_step": 20823, "epoch": 495} {"train_loss": -5.3152174949646, "global_step": 20824, "epoch": 495} {"train_loss": -5.233685493469238, "global_step": 20825, "epoch": 495} {"train_loss": -5.38343620300293, "global_step": 20826, "epoch": 495} {"train_loss": -5.248790740966797, "global_step": 20827, "epoch": 495} {"train_loss": -5.2506279945373535, "global_step": 20828, "epoch": 495} {"train_loss": -5.374711036682129, "global_step": 20829, "epoch": 495} {"train_loss": -5.187312126159668, "global_step": 20830, "epoch": 495} {"train_loss": -5.291996887751988, "global_step": 20831, "epoch": 495, "val_loss": 67456.9453125} {"train_loss": -5.2360029220581055, "global_step": 20832, "epoch": 496} {"train_loss": -5.486782073974609, "global_step": 20833, "epoch": 496} {"train_loss": -5.319316864013672, "global_step": 20834, "epoch": 496} {"train_loss": -5.383782386779785, "global_step": 20835, "epoch": 496} {"train_loss": -5.313297748565674, "global_step": 20836, "epoch": 496} {"train_loss": -5.387089729309082, "global_step": 20837, "epoch": 496} {"train_loss": -5.40140438079834, "global_step": 20838, "epoch": 496} {"train_loss": -5.222334861755371, "global_step": 20839, "epoch": 496} {"train_loss": -5.216235637664795, "global_step": 20840, "epoch": 496} {"train_loss": -5.189003944396973, "global_step": 20841, "epoch": 496} {"train_loss": -5.256186485290527, "global_step": 20842, "epoch": 496} {"train_loss": -5.249157905578613, "global_step": 20843, "epoch": 496} {"train_loss": -5.313055038452148, "global_step": 20844, "epoch": 496} {"train_loss": -5.228760719299316, "global_step": 20845, "epoch": 496} {"train_loss": -5.264482021331787, "global_step": 20846, "epoch": 496} {"train_loss": -5.316025733947754, "global_step": 20847, "epoch": 496} {"train_loss": -5.201982498168945, "global_step": 20848, "epoch": 496} {"train_loss": -5.195228576660156, "global_step": 20849, "epoch": 496} {"train_loss": -5.320931434631348, "global_step": 20850, "epoch": 496} {"train_loss": -5.188035488128662, "global_step": 20851, "epoch": 496} {"train_loss": -5.115357398986816, "global_step": 20852, "epoch": 496} {"train_loss": -5.162196159362793, "global_step": 20853, "epoch": 496} {"train_loss": -5.1319260597229, "global_step": 20854, "epoch": 496} {"train_loss": -5.298346042633057, "global_step": 20855, "epoch": 496} {"train_loss": -5.140905857086182, "global_step": 20856, "epoch": 496} {"train_loss": -5.052468776702881, "global_step": 20857, "epoch": 496} {"train_loss": -5.287176132202148, "global_step": 20858, "epoch": 496} {"train_loss": -5.226661682128906, "global_step": 20859, "epoch": 496} {"train_loss": -5.314146041870117, "global_step": 20860, "epoch": 496} {"train_loss": -5.211670875549316, "global_step": 20861, "epoch": 496} {"train_loss": -5.4381208419799805, "global_step": 20862, "epoch": 496} {"train_loss": -5.2632155418396, "global_step": 20863, "epoch": 496} {"train_loss": -5.298389434814453, "global_step": 20864, "epoch": 496} {"train_loss": -5.320347309112549, "global_step": 20865, "epoch": 496} {"train_loss": -5.2350006103515625, "global_step": 20866, "epoch": 496} {"train_loss": -5.326350212097168, "global_step": 20867, "epoch": 496} {"train_loss": -5.161772727966309, "global_step": 20868, "epoch": 496} {"train_loss": -5.171573638916016, "global_step": 20869, "epoch": 496} {"train_loss": -5.300177097320557, "global_step": 20870, "epoch": 496} {"train_loss": -5.221693992614746, "global_step": 20871, "epoch": 496} {"train_loss": -5.403475761413574, "global_step": 20872, "epoch": 496} {"train_loss": -5.262006260099865, "global_step": 20873, "epoch": 496, "val_loss": 67194.5859375} {"train_loss": -5.400659561157227, "global_step": 20874, "epoch": 497} {"train_loss": -5.2829179763793945, "global_step": 20875, "epoch": 497} {"train_loss": -5.306686878204346, "global_step": 20876, "epoch": 497} {"train_loss": -5.255646228790283, "global_step": 20877, "epoch": 497} {"train_loss": -5.364438056945801, "global_step": 20878, "epoch": 497} {"train_loss": -5.172277450561523, "global_step": 20879, "epoch": 497} {"train_loss": -5.2967119216918945, "global_step": 20880, "epoch": 497} {"train_loss": -5.260753154754639, "global_step": 20881, "epoch": 497} {"train_loss": -5.319235324859619, "global_step": 20882, "epoch": 497} {"train_loss": -5.337977409362793, "global_step": 20883, "epoch": 497} {"train_loss": -5.321751594543457, "global_step": 20884, "epoch": 497} {"train_loss": -5.286032676696777, "global_step": 20885, "epoch": 497} {"train_loss": -5.297921180725098, "global_step": 20886, "epoch": 497} {"train_loss": -5.432607650756836, "global_step": 20887, "epoch": 497} {"train_loss": -5.310312747955322, "global_step": 20888, "epoch": 497} {"train_loss": -5.255890369415283, "global_step": 20889, "epoch": 497} {"train_loss": -5.334867000579834, "global_step": 20890, "epoch": 497} {"train_loss": -5.232614040374756, "global_step": 20891, "epoch": 497} {"train_loss": -5.279388904571533, "global_step": 20892, "epoch": 497} {"train_loss": -5.275190353393555, "global_step": 20893, "epoch": 497} {"train_loss": -5.1843791007995605, "global_step": 20894, "epoch": 497} {"train_loss": -5.386127948760986, "global_step": 20895, "epoch": 497} {"train_loss": -5.276041030883789, "global_step": 20896, "epoch": 497} {"train_loss": -5.328958511352539, "global_step": 20897, "epoch": 497} {"train_loss": -5.39008092880249, "global_step": 20898, "epoch": 497} {"train_loss": -5.271786212921143, "global_step": 20899, "epoch": 497} {"train_loss": -5.368309020996094, "global_step": 20900, "epoch": 497} {"train_loss": -5.436176300048828, "global_step": 20901, "epoch": 497} {"train_loss": -5.409326553344727, "global_step": 20902, "epoch": 497} {"train_loss": -5.3423004150390625, "global_step": 20903, "epoch": 497} {"train_loss": -5.267443656921387, "global_step": 20904, "epoch": 497} {"train_loss": -5.420365810394287, "global_step": 20905, "epoch": 497} {"train_loss": -5.212077617645264, "global_step": 20906, "epoch": 497} {"train_loss": -5.437811851501465, "global_step": 20907, "epoch": 497} {"train_loss": -5.217410087585449, "global_step": 20908, "epoch": 497} {"train_loss": -5.340461730957031, "global_step": 20909, "epoch": 497} {"train_loss": -5.312971591949463, "global_step": 20910, "epoch": 497} {"train_loss": -5.4052886962890625, "global_step": 20911, "epoch": 497} {"train_loss": -5.2931742668151855, "global_step": 20912, "epoch": 497} {"train_loss": -5.240512847900391, "global_step": 20913, "epoch": 497} {"train_loss": -5.343306541442871, "global_step": 20914, "epoch": 497} {"train_loss": -5.3116584391821, "global_step": 20915, "epoch": 497, "val_loss": 66842.2890625} {"train_loss": -5.4319047927856445, "global_step": 20916, "epoch": 498} {"train_loss": -5.428768634796143, "global_step": 20917, "epoch": 498} {"train_loss": -5.237061500549316, "global_step": 20918, "epoch": 498} {"train_loss": -5.298896789550781, "global_step": 20919, "epoch": 498} {"train_loss": -5.239023208618164, "global_step": 20920, "epoch": 498} {"train_loss": -5.307908535003662, "global_step": 20921, "epoch": 498} {"train_loss": -5.275939464569092, "global_step": 20922, "epoch": 498} {"train_loss": -5.339957237243652, "global_step": 20923, "epoch": 498} {"train_loss": -5.207439422607422, "global_step": 20924, "epoch": 498} {"train_loss": -5.27228307723999, "global_step": 20925, "epoch": 498} {"train_loss": -5.4434614181518555, "global_step": 20926, "epoch": 498} {"train_loss": -5.365126609802246, "global_step": 20927, "epoch": 498} {"train_loss": -5.242625713348389, "global_step": 20928, "epoch": 498} {"train_loss": -5.382841110229492, "global_step": 20929, "epoch": 498} {"train_loss": -5.3725385665893555, "global_step": 20930, "epoch": 498} {"train_loss": -5.168735504150391, "global_step": 20931, "epoch": 498} {"train_loss": -5.254082679748535, "global_step": 20932, "epoch": 498} {"train_loss": -5.405617713928223, "global_step": 20933, "epoch": 498} {"train_loss": -5.333688735961914, "global_step": 20934, "epoch": 498} {"train_loss": -5.157475471496582, "global_step": 20935, "epoch": 498} {"train_loss": -5.284619331359863, "global_step": 20936, "epoch": 498} {"train_loss": -5.330849647521973, "global_step": 20937, "epoch": 498} {"train_loss": -5.326907157897949, "global_step": 20938, "epoch": 498} {"train_loss": -5.283285617828369, "global_step": 20939, "epoch": 498} {"train_loss": -5.339699745178223, "global_step": 20940, "epoch": 498} {"train_loss": -5.204703330993652, "global_step": 20941, "epoch": 498} {"train_loss": -5.364701271057129, "global_step": 20942, "epoch": 498} {"train_loss": -5.337647438049316, "global_step": 20943, "epoch": 498} {"train_loss": -5.33216667175293, "global_step": 20944, "epoch": 498} {"train_loss": -5.229464530944824, "global_step": 20945, "epoch": 498} {"train_loss": -5.208773136138916, "global_step": 20946, "epoch": 498} {"train_loss": -5.460002899169922, "global_step": 20947, "epoch": 498} {"train_loss": -5.247514724731445, "global_step": 20948, "epoch": 498} {"train_loss": -5.299346923828125, "global_step": 20949, "epoch": 498} {"train_loss": -5.351132392883301, "global_step": 20950, "epoch": 498} {"train_loss": -5.28477668762207, "global_step": 20951, "epoch": 498} {"train_loss": -5.344781875610352, "global_step": 20952, "epoch": 498} {"train_loss": -5.224061012268066, "global_step": 20953, "epoch": 498} {"train_loss": -5.244709491729736, "global_step": 20954, "epoch": 498} {"train_loss": -5.440374851226807, "global_step": 20955, "epoch": 498} {"train_loss": -5.323097229003906, "global_step": 20956, "epoch": 498} {"train_loss": -5.307889359337943, "global_step": 20957, "epoch": 498, "val_loss": 66902.8984375} {"train_loss": -5.330410003662109, "global_step": 20958, "epoch": 499} {"train_loss": -5.276389122009277, "global_step": 20959, "epoch": 499} {"train_loss": -5.276748180389404, "global_step": 20960, "epoch": 499} {"train_loss": -5.198105335235596, "global_step": 20961, "epoch": 499} {"train_loss": -5.310847282409668, "global_step": 20962, "epoch": 499} {"train_loss": -5.4288330078125, "global_step": 20963, "epoch": 499} {"train_loss": -5.317684650421143, "global_step": 20964, "epoch": 499} {"train_loss": -5.168272018432617, "global_step": 20965, "epoch": 499} {"train_loss": -5.35677433013916, "global_step": 20966, "epoch": 499} {"train_loss": -5.267292022705078, "global_step": 20967, "epoch": 499} {"train_loss": -5.235566139221191, "global_step": 20968, "epoch": 499} {"train_loss": -5.2735443115234375, "global_step": 20969, "epoch": 499} {"train_loss": -5.281497001647949, "global_step": 20970, "epoch": 499} {"train_loss": -5.401935577392578, "global_step": 20971, "epoch": 499} {"train_loss": -5.2033586502075195, "global_step": 20972, "epoch": 499} {"train_loss": -5.150909423828125, "global_step": 20973, "epoch": 499} {"train_loss": -5.299816131591797, "global_step": 20974, "epoch": 499} {"train_loss": -5.317296981811523, "global_step": 20975, "epoch": 499} {"train_loss": -5.347936630249023, "global_step": 20976, "epoch": 499} {"train_loss": -5.349277496337891, "global_step": 20977, "epoch": 499} {"train_loss": -5.362198352813721, "global_step": 20978, "epoch": 499} {"train_loss": -5.281410217285156, "global_step": 20979, "epoch": 499} {"train_loss": -5.33326530456543, "global_step": 20980, "epoch": 499} {"train_loss": -5.319927215576172, "global_step": 20981, "epoch": 499} {"train_loss": -5.41472864151001, "global_step": 20982, "epoch": 499} {"train_loss": -5.369167327880859, "global_step": 20983, "epoch": 499} {"train_loss": -5.41940450668335, "global_step": 20984, "epoch": 499} {"train_loss": -5.233105182647705, "global_step": 20985, "epoch": 499} {"train_loss": -5.284329891204834, "global_step": 20986, "epoch": 499} {"train_loss": -5.307758331298828, "global_step": 20987, "epoch": 499} {"train_loss": -5.322004318237305, "global_step": 20988, "epoch": 499} {"train_loss": -5.325181484222412, "global_step": 20989, "epoch": 499} {"train_loss": -5.378048896789551, "global_step": 20990, "epoch": 499} {"train_loss": -5.375980377197266, "global_step": 20991, "epoch": 499} {"train_loss": -5.39920711517334, "global_step": 20992, "epoch": 499} {"train_loss": -5.356379508972168, "global_step": 20993, "epoch": 499} {"train_loss": -5.355574131011963, "global_step": 20994, "epoch": 499} {"train_loss": -5.230579853057861, "global_step": 20995, "epoch": 499} {"train_loss": -5.159406661987305, "global_step": 20996, "epoch": 499} {"train_loss": -5.428411483764648, "global_step": 20997, "epoch": 499} {"train_loss": -5.170121669769287, "global_step": 20998, "epoch": 499} {"train_loss": -5.307705652146113, "global_step": 20999, "epoch": 499, "val_loss": 67080.984375} {"train_loss": -5.331371784210205, "global_step": 21000, "epoch": 500} {"train_loss": -5.2363080978393555, "global_step": 21001, "epoch": 500} {"train_loss": -5.310425758361816, "global_step": 21002, "epoch": 500} {"train_loss": -5.424187660217285, "global_step": 21003, "epoch": 500} {"train_loss": -5.308692932128906, "global_step": 21004, "epoch": 500} {"train_loss": -5.366043567657471, "global_step": 21005, "epoch": 500} {"train_loss": -5.389789581298828, "global_step": 21006, "epoch": 500} {"train_loss": -5.332728385925293, "global_step": 21007, "epoch": 500} {"train_loss": -5.340630531311035, "global_step": 21008, "epoch": 500} {"train_loss": -5.260605812072754, "global_step": 21009, "epoch": 500} {"train_loss": -5.419934272766113, "global_step": 21010, "epoch": 500} {"train_loss": -5.262588977813721, "global_step": 21011, "epoch": 500} {"train_loss": -5.348041534423828, "global_step": 21012, "epoch": 500} {"train_loss": -5.396764755249023, "global_step": 21013, "epoch": 500} {"train_loss": -5.376534461975098, "global_step": 21014, "epoch": 500} {"train_loss": -5.481306552886963, "global_step": 21015, "epoch": 500} {"train_loss": -5.462913513183594, "global_step": 21016, "epoch": 500} {"train_loss": -5.323432445526123, "global_step": 21017, "epoch": 500} {"train_loss": -5.290177345275879, "global_step": 21018, "epoch": 500} {"train_loss": -5.260663032531738, "global_step": 21019, "epoch": 500} {"train_loss": -5.299720764160156, "global_step": 21020, "epoch": 500} {"train_loss": -5.308631896972656, "global_step": 21021, "epoch": 500} {"train_loss": -5.397695541381836, "global_step": 21022, "epoch": 500} {"train_loss": -5.301621437072754, "global_step": 21023, "epoch": 500} {"train_loss": -5.285678863525391, "global_step": 21024, "epoch": 500} {"train_loss": -5.331531524658203, "global_step": 21025, "epoch": 500} {"train_loss": -5.345159530639648, "global_step": 21026, "epoch": 500} {"train_loss": -5.387352466583252, "global_step": 21027, "epoch": 500} {"train_loss": -5.287448883056641, "global_step": 21028, "epoch": 500} {"train_loss": -5.341161727905273, "global_step": 21029, "epoch": 500} {"train_loss": -5.258315563201904, "global_step": 21030, "epoch": 500} {"train_loss": -5.2725396156311035, "global_step": 21031, "epoch": 500} {"train_loss": -5.239711284637451, "global_step": 21032, "epoch": 500} {"train_loss": -5.4905900955200195, "global_step": 21033, "epoch": 500} {"train_loss": -5.297798156738281, "global_step": 21034, "epoch": 500} {"train_loss": -5.40226936340332, "global_step": 21035, "epoch": 500} {"train_loss": -5.327829360961914, "global_step": 21036, "epoch": 500} {"train_loss": -5.2772722244262695, "global_step": 21037, "epoch": 500} {"train_loss": -5.284865379333496, "global_step": 21038, "epoch": 500} {"train_loss": -5.365166664123535, "global_step": 21039, "epoch": 500} {"train_loss": -5.291179180145264, "global_step": 21040, "epoch": 500} {"train_loss": -5.3343387217748734, "global_step": 21041, "epoch": 500, "train/sim_max_reward_0": 0.2642767483248173, "train/sim_max_reward_1": 0.19592010807995655, "train/sim_max_reward_2": 0.24924698154527047, "train/sim_max_reward_3": 0.15704750979817161, "train/sim_max_reward_4": 0.5807642890044791, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.3411849943719029, "test/sim_max_reward_4300001": 0.0, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.8533484233660239, "test/sim_max_reward_4300004": 0.334902754188734, "test/sim_max_reward_4300005": 0.34956154040241694, "test/sim_max_reward_4300006": 0.11955412694195634, "test/sim_max_reward_4300007": 0.045127646075307386, "test/sim_max_reward_4300008": 0.44729847955176655, "test/sim_max_reward_4300009": 0.43942067977849075, "test/sim_max_reward_4300010": 0.39221693775397776, "test/sim_max_reward_4300011": 0.4069063244122624, "test/sim_max_reward_4300012": 0.16123959756641615, "test/sim_max_reward_4300013": 0.32831378206508116, "test/sim_max_reward_4300014": 0.8761417056033923, "test/sim_max_reward_4300015": 0.22434380981056135, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.28996073114420845, "test/sim_max_reward_4300018": 0.8124186733898142, "test/sim_max_reward_4300019": 0.18564181011739253, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.32833121247453534, "test/sim_max_reward_4300022": 0.03735053514621588, "test/sim_max_reward_4300023": 0.20575297892733313, "test/sim_max_reward_4300024": 0.47421495396739016, "test/sim_max_reward_4300025": 0.08847875242732427, "test/sim_max_reward_4300026": 0.050878423390650566, "test/sim_max_reward_4300027": 0.012710212659616702, "test/sim_max_reward_4300028": 0.023687706799202367, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.5024396762423783, "test/sim_max_reward_4300031": 0.4079008440017574, "test/sim_max_reward_4300032": 0.49908701833519914, "test/sim_max_reward_4300033": 0.5153683895530069, "test/sim_max_reward_4300034": 0.2292727570600145, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.20061665546987054, "test/sim_max_reward_4300037": 0.9822634985708856, "test/sim_max_reward_4300038": 0.6611404295610479, "test/sim_max_reward_4300039": 0.07052801797089818, "test/sim_max_reward_4300040": 0.4755516874445597, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.377535275025676, "test/sim_max_reward_4300043": 0.49957098270252454, "test/sim_max_reward_4300044": 0.22156664887348643, "test/sim_max_reward_4300045": 0.16225724695577334, "test/sim_max_reward_4300046": 0.44566036797943637, "test/sim_max_reward_4300047": 0.3106058478003593, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.2733733993524804, "test/mean_score": 0.29128777004740164, "val_loss": 67099.3984375} {"train_loss": -5.363334655761719, "global_step": 21042, "epoch": 501} {"train_loss": -5.298250198364258, "global_step": 21043, "epoch": 501} {"train_loss": -5.28658390045166, "global_step": 21044, "epoch": 501} {"train_loss": -5.303162574768066, "global_step": 21045, "epoch": 501} {"train_loss": -5.4228057861328125, "global_step": 21046, "epoch": 501} {"train_loss": -5.2393574714660645, "global_step": 21047, "epoch": 501} {"train_loss": -5.34199333190918, "global_step": 21048, "epoch": 501} {"train_loss": -5.3822431564331055, "global_step": 21049, "epoch": 501} {"train_loss": -5.313704013824463, "global_step": 21050, "epoch": 501} {"train_loss": -5.417276382446289, "global_step": 21051, "epoch": 501} {"train_loss": -5.205238342285156, "global_step": 21052, "epoch": 501} {"train_loss": -5.321963310241699, "global_step": 21053, "epoch": 501} {"train_loss": -5.048413276672363, "global_step": 21054, "epoch": 501} {"train_loss": -5.417035102844238, "global_step": 21055, "epoch": 501} {"train_loss": -5.302240371704102, "global_step": 21056, "epoch": 501} {"train_loss": -5.206854820251465, "global_step": 21057, "epoch": 501} {"train_loss": -5.375116348266602, "global_step": 21058, "epoch": 501} {"train_loss": -5.307699680328369, "global_step": 21059, "epoch": 501} {"train_loss": -5.239945411682129, "global_step": 21060, "epoch": 501} {"train_loss": -5.350046634674072, "global_step": 21061, "epoch": 501} {"train_loss": -5.141279220581055, "global_step": 21062, "epoch": 501} {"train_loss": -5.346071243286133, "global_step": 21063, "epoch": 501} {"train_loss": -5.218459129333496, "global_step": 21064, "epoch": 501} {"train_loss": -5.242463111877441, "global_step": 21065, "epoch": 501} {"train_loss": -5.479238510131836, "global_step": 21066, "epoch": 501} {"train_loss": -5.358551025390625, "global_step": 21067, "epoch": 501} {"train_loss": -5.375833511352539, "global_step": 21068, "epoch": 501} {"train_loss": -5.267908573150635, "global_step": 21069, "epoch": 501} {"train_loss": -5.366208076477051, "global_step": 21070, "epoch": 501} {"train_loss": -5.326893329620361, "global_step": 21071, "epoch": 501} {"train_loss": -5.373283386230469, "global_step": 21072, "epoch": 501} {"train_loss": -5.338366508483887, "global_step": 21073, "epoch": 501} {"train_loss": -5.254633903503418, "global_step": 21074, "epoch": 501} {"train_loss": -5.270221710205078, "global_step": 21075, "epoch": 501} {"train_loss": -5.364802360534668, "global_step": 21076, "epoch": 501} {"train_loss": -5.331332683563232, "global_step": 21077, "epoch": 501} {"train_loss": -5.375008583068848, "global_step": 21078, "epoch": 501} {"train_loss": -5.2442193031311035, "global_step": 21079, "epoch": 501} {"train_loss": -5.371517181396484, "global_step": 21080, "epoch": 501} {"train_loss": -5.460238456726074, "global_step": 21081, "epoch": 501} {"train_loss": -5.337823390960693, "global_step": 21082, "epoch": 501} {"train_loss": -5.317928870519002, "global_step": 21083, "epoch": 501, "val_loss": 67323.96875} {"train_loss": -5.367926597595215, "global_step": 21084, "epoch": 502} {"train_loss": -5.296983242034912, "global_step": 21085, "epoch": 502} {"train_loss": -5.301225662231445, "global_step": 21086, "epoch": 502} {"train_loss": -5.241390228271484, "global_step": 21087, "epoch": 502} {"train_loss": -5.176796913146973, "global_step": 21088, "epoch": 502} {"train_loss": -5.213590145111084, "global_step": 21089, "epoch": 502} {"train_loss": -5.355827808380127, "global_step": 21090, "epoch": 502} {"train_loss": -5.365927696228027, "global_step": 21091, "epoch": 502} {"train_loss": -5.364132881164551, "global_step": 21092, "epoch": 502} {"train_loss": -5.280568599700928, "global_step": 21093, "epoch": 502} {"train_loss": -5.26753044128418, "global_step": 21094, "epoch": 502} {"train_loss": -5.329022407531738, "global_step": 21095, "epoch": 502} {"train_loss": -5.2768096923828125, "global_step": 21096, "epoch": 502} {"train_loss": -5.342110633850098, "global_step": 21097, "epoch": 502} {"train_loss": -5.2731475830078125, "global_step": 21098, "epoch": 502} {"train_loss": -5.229680061340332, "global_step": 21099, "epoch": 502} {"train_loss": -5.23742151260376, "global_step": 21100, "epoch": 502} {"train_loss": -5.388002395629883, "global_step": 21101, "epoch": 502} {"train_loss": -5.259096145629883, "global_step": 21102, "epoch": 502} {"train_loss": -5.4041948318481445, "global_step": 21103, "epoch": 502} {"train_loss": -5.349977493286133, "global_step": 21104, "epoch": 502} {"train_loss": -5.35228157043457, "global_step": 21105, "epoch": 502} {"train_loss": -5.202898025512695, "global_step": 21106, "epoch": 502} {"train_loss": -5.331420421600342, "global_step": 21107, "epoch": 502} {"train_loss": -5.160920143127441, "global_step": 21108, "epoch": 502} {"train_loss": -5.332978248596191, "global_step": 21109, "epoch": 502} {"train_loss": -5.360863208770752, "global_step": 21110, "epoch": 502} {"train_loss": -5.375089168548584, "global_step": 21111, "epoch": 502} {"train_loss": -5.333716869354248, "global_step": 21112, "epoch": 502} {"train_loss": -5.2921223640441895, "global_step": 21113, "epoch": 502} {"train_loss": -5.275996208190918, "global_step": 21114, "epoch": 502} {"train_loss": -5.323731422424316, "global_step": 21115, "epoch": 502} {"train_loss": -5.313297271728516, "global_step": 21116, "epoch": 502} {"train_loss": -5.306394577026367, "global_step": 21117, "epoch": 502} {"train_loss": -5.365504741668701, "global_step": 21118, "epoch": 502} {"train_loss": -5.20886754989624, "global_step": 21119, "epoch": 502} {"train_loss": -5.351364612579346, "global_step": 21120, "epoch": 502} {"train_loss": -5.305567741394043, "global_step": 21121, "epoch": 502} {"train_loss": -5.299690246582031, "global_step": 21122, "epoch": 502} {"train_loss": -5.354787826538086, "global_step": 21123, "epoch": 502} {"train_loss": -5.26648473739624, "global_step": 21124, "epoch": 502} {"train_loss": -5.304254395621164, "global_step": 21125, "epoch": 502, "val_loss": 67057.390625} {"train_loss": -5.4271559715271, "global_step": 21126, "epoch": 503} {"train_loss": -5.330879211425781, "global_step": 21127, "epoch": 503} {"train_loss": -5.408082962036133, "global_step": 21128, "epoch": 503} {"train_loss": -5.433116912841797, "global_step": 21129, "epoch": 503} {"train_loss": -5.411274433135986, "global_step": 21130, "epoch": 503} {"train_loss": -5.353351593017578, "global_step": 21131, "epoch": 503} {"train_loss": -5.329730033874512, "global_step": 21132, "epoch": 503} {"train_loss": -5.313425540924072, "global_step": 21133, "epoch": 503} {"train_loss": -5.231270790100098, "global_step": 21134, "epoch": 503} {"train_loss": -5.129340648651123, "global_step": 21135, "epoch": 503} {"train_loss": -5.193058967590332, "global_step": 21136, "epoch": 503} {"train_loss": -5.231201171875, "global_step": 21137, "epoch": 503} {"train_loss": -5.280074119567871, "global_step": 21138, "epoch": 503} {"train_loss": -5.327481269836426, "global_step": 21139, "epoch": 503} {"train_loss": -5.235316753387451, "global_step": 21140, "epoch": 503} {"train_loss": -5.391623020172119, "global_step": 21141, "epoch": 503} {"train_loss": -5.287358283996582, "global_step": 21142, "epoch": 503} {"train_loss": -5.2748236656188965, "global_step": 21143, "epoch": 503} {"train_loss": -5.3469157218933105, "global_step": 21144, "epoch": 503} {"train_loss": -5.295169353485107, "global_step": 21145, "epoch": 503} {"train_loss": -5.434502601623535, "global_step": 21146, "epoch": 503} {"train_loss": -5.38603401184082, "global_step": 21147, "epoch": 503} {"train_loss": -5.313726425170898, "global_step": 21148, "epoch": 503} {"train_loss": -5.3343353271484375, "global_step": 21149, "epoch": 503} {"train_loss": -5.316773414611816, "global_step": 21150, "epoch": 503} {"train_loss": -5.278350830078125, "global_step": 21151, "epoch": 503} {"train_loss": -5.356908321380615, "global_step": 21152, "epoch": 503} {"train_loss": -5.3091230392456055, "global_step": 21153, "epoch": 503} {"train_loss": -5.350569725036621, "global_step": 21154, "epoch": 503} {"train_loss": -5.490504741668701, "global_step": 21155, "epoch": 503} {"train_loss": -5.367433071136475, "global_step": 21156, "epoch": 503} {"train_loss": -5.349283218383789, "global_step": 21157, "epoch": 503} {"train_loss": -5.342897415161133, "global_step": 21158, "epoch": 503} {"train_loss": -5.37458610534668, "global_step": 21159, "epoch": 503} {"train_loss": -5.43173360824585, "global_step": 21160, "epoch": 503} {"train_loss": -5.242259979248047, "global_step": 21161, "epoch": 503} {"train_loss": -5.204578399658203, "global_step": 21162, "epoch": 503} {"train_loss": -5.3538994789123535, "global_step": 21163, "epoch": 503} {"train_loss": -5.418663501739502, "global_step": 21164, "epoch": 503} {"train_loss": -5.213863849639893, "global_step": 21165, "epoch": 503} {"train_loss": -5.216567039489746, "global_step": 21166, "epoch": 503} {"train_loss": -5.3225294181278775, "global_step": 21167, "epoch": 503, "val_loss": 66793.921875} {"train_loss": -5.398558139801025, "global_step": 21168, "epoch": 504} {"train_loss": -5.35689640045166, "global_step": 21169, "epoch": 504} {"train_loss": -5.362388610839844, "global_step": 21170, "epoch": 504} {"train_loss": -5.465916633605957, "global_step": 21171, "epoch": 504} {"train_loss": -5.233122825622559, "global_step": 21172, "epoch": 504} {"train_loss": -5.258444786071777, "global_step": 21173, "epoch": 504} {"train_loss": -5.434321403503418, "global_step": 21174, "epoch": 504} {"train_loss": -5.336745262145996, "global_step": 21175, "epoch": 504} {"train_loss": -5.289116382598877, "global_step": 21176, "epoch": 504} {"train_loss": -5.240605354309082, "global_step": 21177, "epoch": 504} {"train_loss": -5.326273441314697, "global_step": 21178, "epoch": 504} {"train_loss": -5.41658353805542, "global_step": 21179, "epoch": 504} {"train_loss": -5.371233940124512, "global_step": 21180, "epoch": 504} {"train_loss": -5.3702392578125, "global_step": 21181, "epoch": 504} {"train_loss": -5.3812174797058105, "global_step": 21182, "epoch": 504} {"train_loss": -5.2862443923950195, "global_step": 21183, "epoch": 504} {"train_loss": -5.186644554138184, "global_step": 21184, "epoch": 504} {"train_loss": -5.308142185211182, "global_step": 21185, "epoch": 504} {"train_loss": -5.379207611083984, "global_step": 21186, "epoch": 504} {"train_loss": -5.353364944458008, "global_step": 21187, "epoch": 504} {"train_loss": -5.399086952209473, "global_step": 21188, "epoch": 504} {"train_loss": -5.377416610717773, "global_step": 21189, "epoch": 504} {"train_loss": -5.404516696929932, "global_step": 21190, "epoch": 504} {"train_loss": -5.314319133758545, "global_step": 21191, "epoch": 504} {"train_loss": -5.391326904296875, "global_step": 21192, "epoch": 504} {"train_loss": -5.344221115112305, "global_step": 21193, "epoch": 504} {"train_loss": -5.238354682922363, "global_step": 21194, "epoch": 504} {"train_loss": -5.352266311645508, "global_step": 21195, "epoch": 504} {"train_loss": -5.321393013000488, "global_step": 21196, "epoch": 504} {"train_loss": -5.37153434753418, "global_step": 21197, "epoch": 504} {"train_loss": -5.259364128112793, "global_step": 21198, "epoch": 504} {"train_loss": -5.207433223724365, "global_step": 21199, "epoch": 504} {"train_loss": -5.454366683959961, "global_step": 21200, "epoch": 504} {"train_loss": -5.376965522766113, "global_step": 21201, "epoch": 504} {"train_loss": -5.27006721496582, "global_step": 21202, "epoch": 504} {"train_loss": -5.247384071350098, "global_step": 21203, "epoch": 504} {"train_loss": -5.237949371337891, "global_step": 21204, "epoch": 504} {"train_loss": -5.368182182312012, "global_step": 21205, "epoch": 504} {"train_loss": -5.137845039367676, "global_step": 21206, "epoch": 504} {"train_loss": -5.322304725646973, "global_step": 21207, "epoch": 504} {"train_loss": -5.333089828491211, "global_step": 21208, "epoch": 504} {"train_loss": -5.326584645680019, "global_step": 21209, "epoch": 504, "val_loss": 67304.0} {"train_loss": -5.191706657409668, "global_step": 21210, "epoch": 505} {"train_loss": -5.5277581214904785, "global_step": 21211, "epoch": 505} {"train_loss": -5.228774547576904, "global_step": 21212, "epoch": 505} {"train_loss": -5.3158769607543945, "global_step": 21213, "epoch": 505} {"train_loss": -5.339291095733643, "global_step": 21214, "epoch": 505} {"train_loss": -5.140198707580566, "global_step": 21215, "epoch": 505} {"train_loss": -5.334087371826172, "global_step": 21216, "epoch": 505} {"train_loss": -5.2469801902771, "global_step": 21217, "epoch": 505} {"train_loss": -5.386441230773926, "global_step": 21218, "epoch": 505} {"train_loss": -5.368181228637695, "global_step": 21219, "epoch": 505} {"train_loss": -5.348170280456543, "global_step": 21220, "epoch": 505} {"train_loss": -5.342424392700195, "global_step": 21221, "epoch": 505} {"train_loss": -5.40657901763916, "global_step": 21222, "epoch": 505} {"train_loss": -5.352486610412598, "global_step": 21223, "epoch": 505} {"train_loss": -5.256972312927246, "global_step": 21224, "epoch": 505} {"train_loss": -5.235172748565674, "global_step": 21225, "epoch": 505} {"train_loss": -5.283392429351807, "global_step": 21226, "epoch": 505} {"train_loss": -5.264596939086914, "global_step": 21227, "epoch": 505} {"train_loss": -5.523734092712402, "global_step": 21228, "epoch": 505} {"train_loss": -5.44988489151001, "global_step": 21229, "epoch": 505} {"train_loss": -5.337155818939209, "global_step": 21230, "epoch": 505} {"train_loss": -5.360047340393066, "global_step": 21231, "epoch": 505} {"train_loss": -5.229106903076172, "global_step": 21232, "epoch": 505} {"train_loss": -5.3190202713012695, "global_step": 21233, "epoch": 505} {"train_loss": -5.40535306930542, "global_step": 21234, "epoch": 505} {"train_loss": -5.397159576416016, "global_step": 21235, "epoch": 505} {"train_loss": -5.347572326660156, "global_step": 21236, "epoch": 505} {"train_loss": -5.43037223815918, "global_step": 21237, "epoch": 505} {"train_loss": -5.284815788269043, "global_step": 21238, "epoch": 505} {"train_loss": -5.352475166320801, "global_step": 21239, "epoch": 505} {"train_loss": -5.2279157638549805, "global_step": 21240, "epoch": 505} {"train_loss": -5.387317657470703, "global_step": 21241, "epoch": 505} {"train_loss": -5.313767433166504, "global_step": 21242, "epoch": 505} {"train_loss": -5.3416643142700195, "global_step": 21243, "epoch": 505} {"train_loss": -5.234196662902832, "global_step": 21244, "epoch": 505} {"train_loss": -5.320628643035889, "global_step": 21245, "epoch": 505} {"train_loss": -5.25260066986084, "global_step": 21246, "epoch": 505} {"train_loss": -5.292985916137695, "global_step": 21247, "epoch": 505} {"train_loss": -5.3380913734436035, "global_step": 21248, "epoch": 505} {"train_loss": -5.24935245513916, "global_step": 21249, "epoch": 505} {"train_loss": -5.175681114196777, "global_step": 21250, "epoch": 505} {"train_loss": -5.319380612600417, "global_step": 21251, "epoch": 505, "val_loss": 66839.71875} {"train_loss": -5.317985534667969, "global_step": 21252, "epoch": 506} {"train_loss": -5.31987190246582, "global_step": 21253, "epoch": 506} {"train_loss": -5.328582763671875, "global_step": 21254, "epoch": 506} {"train_loss": -5.327958106994629, "global_step": 21255, "epoch": 506} {"train_loss": -5.211297988891602, "global_step": 21256, "epoch": 506} {"train_loss": -5.370014190673828, "global_step": 21257, "epoch": 506} {"train_loss": -5.489535331726074, "global_step": 21258, "epoch": 506} {"train_loss": -5.205471038818359, "global_step": 21259, "epoch": 506} {"train_loss": -5.092294692993164, "global_step": 21260, "epoch": 506} {"train_loss": -5.185783386230469, "global_step": 21261, "epoch": 506} {"train_loss": -5.337969779968262, "global_step": 21262, "epoch": 506} {"train_loss": -5.312648773193359, "global_step": 21263, "epoch": 506} {"train_loss": -5.185000419616699, "global_step": 21264, "epoch": 506} {"train_loss": -5.394819259643555, "global_step": 21265, "epoch": 506} {"train_loss": -5.203402042388916, "global_step": 21266, "epoch": 506} {"train_loss": -5.340431213378906, "global_step": 21267, "epoch": 506} {"train_loss": -5.388200283050537, "global_step": 21268, "epoch": 506} {"train_loss": -5.365985870361328, "global_step": 21269, "epoch": 506} {"train_loss": -5.376359939575195, "global_step": 21270, "epoch": 506} {"train_loss": -5.326416969299316, "global_step": 21271, "epoch": 506} {"train_loss": -5.407819747924805, "global_step": 21272, "epoch": 506} {"train_loss": -5.209646224975586, "global_step": 21273, "epoch": 506} {"train_loss": -5.381109237670898, "global_step": 21274, "epoch": 506} {"train_loss": -5.4568071365356445, "global_step": 21275, "epoch": 506} {"train_loss": -5.112260818481445, "global_step": 21276, "epoch": 506} {"train_loss": -5.302424430847168, "global_step": 21277, "epoch": 506} {"train_loss": -5.346144199371338, "global_step": 21278, "epoch": 506} {"train_loss": -5.241829872131348, "global_step": 21279, "epoch": 506} {"train_loss": -5.182474136352539, "global_step": 21280, "epoch": 506} {"train_loss": -5.304222106933594, "global_step": 21281, "epoch": 506} {"train_loss": -5.2701826095581055, "global_step": 21282, "epoch": 506} {"train_loss": -5.290341377258301, "global_step": 21283, "epoch": 506} {"train_loss": -5.3504180908203125, "global_step": 21284, "epoch": 506} {"train_loss": -5.302988052368164, "global_step": 21285, "epoch": 506} {"train_loss": -5.422873020172119, "global_step": 21286, "epoch": 506} {"train_loss": -5.290989398956299, "global_step": 21287, "epoch": 506} {"train_loss": -5.377346515655518, "global_step": 21288, "epoch": 506} {"train_loss": -5.300477027893066, "global_step": 21289, "epoch": 506} {"train_loss": -5.377133369445801, "global_step": 21290, "epoch": 506} {"train_loss": -5.319295406341553, "global_step": 21291, "epoch": 506} {"train_loss": -5.208978176116943, "global_step": 21292, "epoch": 506} {"train_loss": -5.312022311346872, "global_step": 21293, "epoch": 506, "val_loss": 67176.8984375} {"train_loss": -5.382172107696533, "global_step": 21294, "epoch": 507} {"train_loss": -5.326230525970459, "global_step": 21295, "epoch": 507} {"train_loss": -5.166779518127441, "global_step": 21296, "epoch": 507} {"train_loss": -5.474386215209961, "global_step": 21297, "epoch": 507} {"train_loss": -5.346400260925293, "global_step": 21298, "epoch": 507} {"train_loss": -5.165392875671387, "global_step": 21299, "epoch": 507} {"train_loss": -5.265542984008789, "global_step": 21300, "epoch": 507} {"train_loss": -5.27203893661499, "global_step": 21301, "epoch": 507} {"train_loss": -5.248730659484863, "global_step": 21302, "epoch": 507} {"train_loss": -5.298007965087891, "global_step": 21303, "epoch": 507} {"train_loss": -5.366079330444336, "global_step": 21304, "epoch": 507} {"train_loss": -5.365682601928711, "global_step": 21305, "epoch": 507} {"train_loss": -5.325615406036377, "global_step": 21306, "epoch": 507} {"train_loss": -5.292356491088867, "global_step": 21307, "epoch": 507} {"train_loss": -5.355388164520264, "global_step": 21308, "epoch": 507} {"train_loss": -5.338897705078125, "global_step": 21309, "epoch": 507} {"train_loss": -5.282674312591553, "global_step": 21310, "epoch": 507} {"train_loss": -5.1985602378845215, "global_step": 21311, "epoch": 507} {"train_loss": -5.202272415161133, "global_step": 21312, "epoch": 507} {"train_loss": -5.221221923828125, "global_step": 21313, "epoch": 507} {"train_loss": -5.341439247131348, "global_step": 21314, "epoch": 507} {"train_loss": -5.407788276672363, "global_step": 21315, "epoch": 507} {"train_loss": -5.218778133392334, "global_step": 21316, "epoch": 507} {"train_loss": -5.296750545501709, "global_step": 21317, "epoch": 507} {"train_loss": -5.372517108917236, "global_step": 21318, "epoch": 507} {"train_loss": -5.4120941162109375, "global_step": 21319, "epoch": 507} {"train_loss": -5.295980453491211, "global_step": 21320, "epoch": 507} {"train_loss": -5.246827125549316, "global_step": 21321, "epoch": 507} {"train_loss": -5.270984172821045, "global_step": 21322, "epoch": 507} {"train_loss": -5.439377784729004, "global_step": 21323, "epoch": 507} {"train_loss": -5.309052467346191, "global_step": 21324, "epoch": 507} {"train_loss": -5.237485408782959, "global_step": 21325, "epoch": 507} {"train_loss": -5.376847267150879, "global_step": 21326, "epoch": 507} {"train_loss": -5.230847358703613, "global_step": 21327, "epoch": 507} {"train_loss": -5.184026718139648, "global_step": 21328, "epoch": 507} {"train_loss": -5.498147964477539, "global_step": 21329, "epoch": 507} {"train_loss": -5.227717399597168, "global_step": 21330, "epoch": 507} {"train_loss": -5.333941459655762, "global_step": 21331, "epoch": 507} {"train_loss": -5.325348377227783, "global_step": 21332, "epoch": 507} {"train_loss": -5.305948257446289, "global_step": 21333, "epoch": 507} {"train_loss": -5.249471664428711, "global_step": 21334, "epoch": 507} {"train_loss": -5.304663397016979, "global_step": 21335, "epoch": 507, "val_loss": 66891.3515625} {"train_loss": -5.2274675369262695, "global_step": 21336, "epoch": 508} {"train_loss": -5.290353298187256, "global_step": 21337, "epoch": 508} {"train_loss": -5.374023914337158, "global_step": 21338, "epoch": 508} {"train_loss": -5.270718574523926, "global_step": 21339, "epoch": 508} {"train_loss": -5.4199676513671875, "global_step": 21340, "epoch": 508} {"train_loss": -5.3800764083862305, "global_step": 21341, "epoch": 508} {"train_loss": -5.292085647583008, "global_step": 21342, "epoch": 508} {"train_loss": -5.320910930633545, "global_step": 21343, "epoch": 508} {"train_loss": -5.280016899108887, "global_step": 21344, "epoch": 508} {"train_loss": -5.269255638122559, "global_step": 21345, "epoch": 508} {"train_loss": -5.219203948974609, "global_step": 21346, "epoch": 508} {"train_loss": -5.200918197631836, "global_step": 21347, "epoch": 508} {"train_loss": -5.237797737121582, "global_step": 21348, "epoch": 508} {"train_loss": -5.376307964324951, "global_step": 21349, "epoch": 508} {"train_loss": -5.30092716217041, "global_step": 21350, "epoch": 508} {"train_loss": -5.229736804962158, "global_step": 21351, "epoch": 508} {"train_loss": -5.364856243133545, "global_step": 21352, "epoch": 508} {"train_loss": -5.313839912414551, "global_step": 21353, "epoch": 508} {"train_loss": -5.2108540534973145, "global_step": 21354, "epoch": 508} {"train_loss": -5.232698440551758, "global_step": 21355, "epoch": 508} {"train_loss": -5.280823707580566, "global_step": 21356, "epoch": 508} {"train_loss": -5.281788349151611, "global_step": 21357, "epoch": 508} {"train_loss": -5.146869659423828, "global_step": 21358, "epoch": 508} {"train_loss": -5.307504177093506, "global_step": 21359, "epoch": 508} {"train_loss": -5.344269275665283, "global_step": 21360, "epoch": 508} {"train_loss": -5.207023620605469, "global_step": 21361, "epoch": 508} {"train_loss": -5.3940606117248535, "global_step": 21362, "epoch": 508} {"train_loss": -5.298466682434082, "global_step": 21363, "epoch": 508} {"train_loss": -5.305375099182129, "global_step": 21364, "epoch": 508} {"train_loss": -5.347624778747559, "global_step": 21365, "epoch": 508} {"train_loss": -5.229435443878174, "global_step": 21366, "epoch": 508} {"train_loss": -5.286124229431152, "global_step": 21367, "epoch": 508} {"train_loss": -5.292330741882324, "global_step": 21368, "epoch": 508} {"train_loss": -5.123135566711426, "global_step": 21369, "epoch": 508} {"train_loss": -5.358982563018799, "global_step": 21370, "epoch": 508} {"train_loss": -5.299431800842285, "global_step": 21371, "epoch": 508} {"train_loss": -5.150700569152832, "global_step": 21372, "epoch": 508} {"train_loss": -5.257145404815674, "global_step": 21373, "epoch": 508} {"train_loss": -5.233869552612305, "global_step": 21374, "epoch": 508} {"train_loss": -5.20186185836792, "global_step": 21375, "epoch": 508} {"train_loss": -5.187939643859863, "global_step": 21376, "epoch": 508} {"train_loss": -5.2770238263266425, "global_step": 21377, "epoch": 508, "val_loss": 67088.28125} {"train_loss": -5.217236042022705, "global_step": 21378, "epoch": 509} {"train_loss": -5.185591220855713, "global_step": 21379, "epoch": 509} {"train_loss": -5.380483627319336, "global_step": 21380, "epoch": 509} {"train_loss": -5.155806064605713, "global_step": 21381, "epoch": 509} {"train_loss": -5.391218185424805, "global_step": 21382, "epoch": 509} {"train_loss": -5.293745994567871, "global_step": 21383, "epoch": 509} {"train_loss": -5.347745418548584, "global_step": 21384, "epoch": 509} {"train_loss": -5.392544746398926, "global_step": 21385, "epoch": 509} {"train_loss": -5.33927059173584, "global_step": 21386, "epoch": 509} {"train_loss": -5.452299118041992, "global_step": 21387, "epoch": 509} {"train_loss": -5.29061222076416, "global_step": 21388, "epoch": 509} {"train_loss": -5.264758110046387, "global_step": 21389, "epoch": 509} {"train_loss": -5.365556716918945, "global_step": 21390, "epoch": 509} {"train_loss": -5.295295715332031, "global_step": 21391, "epoch": 509} {"train_loss": -5.349638938903809, "global_step": 21392, "epoch": 509} {"train_loss": -5.3242669105529785, "global_step": 21393, "epoch": 509} {"train_loss": -5.248257637023926, "global_step": 21394, "epoch": 509} {"train_loss": -5.315549850463867, "global_step": 21395, "epoch": 509} {"train_loss": -5.39241886138916, "global_step": 21396, "epoch": 509} {"train_loss": -5.276196479797363, "global_step": 21397, "epoch": 509} {"train_loss": -5.306491851806641, "global_step": 21398, "epoch": 509} {"train_loss": -5.19449520111084, "global_step": 21399, "epoch": 509} {"train_loss": -5.316944599151611, "global_step": 21400, "epoch": 509} {"train_loss": -5.373252868652344, "global_step": 21401, "epoch": 509} {"train_loss": -5.316744804382324, "global_step": 21402, "epoch": 509} {"train_loss": -5.315517902374268, "global_step": 21403, "epoch": 509} {"train_loss": -5.354715347290039, "global_step": 21404, "epoch": 509} {"train_loss": -5.241843223571777, "global_step": 21405, "epoch": 509} {"train_loss": -5.321521759033203, "global_step": 21406, "epoch": 509} {"train_loss": -5.38129997253418, "global_step": 21407, "epoch": 509} {"train_loss": -5.2560529708862305, "global_step": 21408, "epoch": 509} {"train_loss": -5.401906490325928, "global_step": 21409, "epoch": 509} {"train_loss": -5.294261932373047, "global_step": 21410, "epoch": 509} {"train_loss": -5.263689994812012, "global_step": 21411, "epoch": 509} {"train_loss": -5.369554042816162, "global_step": 21412, "epoch": 509} {"train_loss": -5.319149017333984, "global_step": 21413, "epoch": 509} {"train_loss": -5.198545455932617, "global_step": 21414, "epoch": 509} {"train_loss": -5.2929887771606445, "global_step": 21415, "epoch": 509} {"train_loss": -5.203641414642334, "global_step": 21416, "epoch": 509} {"train_loss": -5.236218452453613, "global_step": 21417, "epoch": 509} {"train_loss": -5.295716285705566, "global_step": 21418, "epoch": 509} {"train_loss": -5.3044507049378895, "global_step": 21419, "epoch": 509, "val_loss": 67316.640625} {"train_loss": -5.357046127319336, "global_step": 21420, "epoch": 510} {"train_loss": -5.432478904724121, "global_step": 21421, "epoch": 510} {"train_loss": -5.2408061027526855, "global_step": 21422, "epoch": 510} {"train_loss": -5.3240966796875, "global_step": 21423, "epoch": 510} {"train_loss": -5.279886245727539, "global_step": 21424, "epoch": 510} {"train_loss": -5.223613739013672, "global_step": 21425, "epoch": 510} {"train_loss": -5.3852715492248535, "global_step": 21426, "epoch": 510} {"train_loss": -5.313508033752441, "global_step": 21427, "epoch": 510} {"train_loss": -5.389744758605957, "global_step": 21428, "epoch": 510} {"train_loss": -5.154870986938477, "global_step": 21429, "epoch": 510} {"train_loss": -5.2511677742004395, "global_step": 21430, "epoch": 510} {"train_loss": -5.368007183074951, "global_step": 21431, "epoch": 510} {"train_loss": -5.371168613433838, "global_step": 21432, "epoch": 510} {"train_loss": -5.33646297454834, "global_step": 21433, "epoch": 510} {"train_loss": -5.2902913093566895, "global_step": 21434, "epoch": 510} {"train_loss": -5.350480079650879, "global_step": 21435, "epoch": 510} {"train_loss": -5.34495735168457, "global_step": 21436, "epoch": 510} {"train_loss": -5.382274150848389, "global_step": 21437, "epoch": 510} {"train_loss": -5.234658241271973, "global_step": 21438, "epoch": 510} {"train_loss": -5.3019914627075195, "global_step": 21439, "epoch": 510} {"train_loss": -5.3848981857299805, "global_step": 21440, "epoch": 510} {"train_loss": -5.3719916343688965, "global_step": 21441, "epoch": 510} {"train_loss": -5.291638374328613, "global_step": 21442, "epoch": 510} {"train_loss": -5.387150764465332, "global_step": 21443, "epoch": 510} {"train_loss": -5.4178361892700195, "global_step": 21444, "epoch": 510} {"train_loss": -5.2773332595825195, "global_step": 21445, "epoch": 510} {"train_loss": -5.390712738037109, "global_step": 21446, "epoch": 510} {"train_loss": -5.2397685050964355, "global_step": 21447, "epoch": 510} {"train_loss": -5.353883266448975, "global_step": 21448, "epoch": 510} {"train_loss": -5.142769813537598, "global_step": 21449, "epoch": 510} {"train_loss": -5.202743053436279, "global_step": 21450, "epoch": 510} {"train_loss": -5.2767767906188965, "global_step": 21451, "epoch": 510} {"train_loss": -5.2416486740112305, "global_step": 21452, "epoch": 510} {"train_loss": -5.243471145629883, "global_step": 21453, "epoch": 510} {"train_loss": -5.384791374206543, "global_step": 21454, "epoch": 510} {"train_loss": -5.214774131774902, "global_step": 21455, "epoch": 510} {"train_loss": -5.372870445251465, "global_step": 21456, "epoch": 510} {"train_loss": -5.257176876068115, "global_step": 21457, "epoch": 510} {"train_loss": -5.319814205169678, "global_step": 21458, "epoch": 510} {"train_loss": -5.133034706115723, "global_step": 21459, "epoch": 510} {"train_loss": -5.335695266723633, "global_step": 21460, "epoch": 510} {"train_loss": -5.307181392397199, "global_step": 21461, "epoch": 510, "val_loss": 67737.4921875} {"train_loss": -5.139326095581055, "global_step": 21462, "epoch": 511} {"train_loss": -5.40250301361084, "global_step": 21463, "epoch": 511} {"train_loss": -5.30356502532959, "global_step": 21464, "epoch": 511} {"train_loss": -5.268272399902344, "global_step": 21465, "epoch": 511} {"train_loss": -5.268487930297852, "global_step": 21466, "epoch": 511} {"train_loss": -5.443254470825195, "global_step": 21467, "epoch": 511} {"train_loss": -5.165138244628906, "global_step": 21468, "epoch": 511} {"train_loss": -5.259089469909668, "global_step": 21469, "epoch": 511} {"train_loss": -5.243633270263672, "global_step": 21470, "epoch": 511} {"train_loss": -5.363515853881836, "global_step": 21471, "epoch": 511} {"train_loss": -5.2689971923828125, "global_step": 21472, "epoch": 511} {"train_loss": -5.251893997192383, "global_step": 21473, "epoch": 511} {"train_loss": -5.403855323791504, "global_step": 21474, "epoch": 511} {"train_loss": -5.3622283935546875, "global_step": 21475, "epoch": 511} {"train_loss": -5.354131698608398, "global_step": 21476, "epoch": 511} {"train_loss": -5.4497175216674805, "global_step": 21477, "epoch": 511} {"train_loss": -5.383957862854004, "global_step": 21478, "epoch": 511} {"train_loss": -5.448533058166504, "global_step": 21479, "epoch": 511} {"train_loss": -5.39682149887085, "global_step": 21480, "epoch": 511} {"train_loss": -5.410822868347168, "global_step": 21481, "epoch": 511} {"train_loss": -5.450596809387207, "global_step": 21482, "epoch": 511} {"train_loss": -5.322203159332275, "global_step": 21483, "epoch": 511} {"train_loss": -5.325408458709717, "global_step": 21484, "epoch": 511} {"train_loss": -5.138639450073242, "global_step": 21485, "epoch": 511} {"train_loss": -5.434569358825684, "global_step": 21486, "epoch": 511} {"train_loss": -5.298064231872559, "global_step": 21487, "epoch": 511} {"train_loss": -5.353883266448975, "global_step": 21488, "epoch": 511} {"train_loss": -5.237137794494629, "global_step": 21489, "epoch": 511} {"train_loss": -5.297863960266113, "global_step": 21490, "epoch": 511} {"train_loss": -5.325486183166504, "global_step": 21491, "epoch": 511} {"train_loss": -5.270851135253906, "global_step": 21492, "epoch": 511} {"train_loss": -5.417288780212402, "global_step": 21493, "epoch": 511} {"train_loss": -5.4012250900268555, "global_step": 21494, "epoch": 511} {"train_loss": -5.425624847412109, "global_step": 21495, "epoch": 511} {"train_loss": -5.386480331420898, "global_step": 21496, "epoch": 511} {"train_loss": -5.432769775390625, "global_step": 21497, "epoch": 511} {"train_loss": -5.319169998168945, "global_step": 21498, "epoch": 511} {"train_loss": -5.363028526306152, "global_step": 21499, "epoch": 511} {"train_loss": -5.188488006591797, "global_step": 21500, "epoch": 511} {"train_loss": -5.379159927368164, "global_step": 21501, "epoch": 511} {"train_loss": -5.39445161819458, "global_step": 21502, "epoch": 511} {"train_loss": -5.333657253356207, "global_step": 21503, "epoch": 511, "val_loss": 67053.59375} {"train_loss": -5.382530212402344, "global_step": 21504, "epoch": 512} {"train_loss": -5.375432968139648, "global_step": 21505, "epoch": 512} {"train_loss": -5.251782417297363, "global_step": 21506, "epoch": 512} {"train_loss": -5.362046241760254, "global_step": 21507, "epoch": 512} {"train_loss": -5.452624320983887, "global_step": 21508, "epoch": 512} {"train_loss": -5.201961517333984, "global_step": 21509, "epoch": 512} {"train_loss": -5.321555137634277, "global_step": 21510, "epoch": 512} {"train_loss": -5.3141350746154785, "global_step": 21511, "epoch": 512} {"train_loss": -5.234350204467773, "global_step": 21512, "epoch": 512} {"train_loss": -5.290354251861572, "global_step": 21513, "epoch": 512} {"train_loss": -5.378964900970459, "global_step": 21514, "epoch": 512} {"train_loss": -5.394582748413086, "global_step": 21515, "epoch": 512} {"train_loss": -5.332087516784668, "global_step": 21516, "epoch": 512} {"train_loss": -5.341485977172852, "global_step": 21517, "epoch": 512} {"train_loss": -5.358495712280273, "global_step": 21518, "epoch": 512} {"train_loss": -5.284897327423096, "global_step": 21519, "epoch": 512} {"train_loss": -5.251346588134766, "global_step": 21520, "epoch": 512} {"train_loss": -5.417069435119629, "global_step": 21521, "epoch": 512} {"train_loss": -5.390603542327881, "global_step": 21522, "epoch": 512} {"train_loss": -5.29329776763916, "global_step": 21523, "epoch": 512} {"train_loss": -5.267007350921631, "global_step": 21524, "epoch": 512} {"train_loss": -5.397306442260742, "global_step": 21525, "epoch": 512} {"train_loss": -5.324330806732178, "global_step": 21526, "epoch": 512} {"train_loss": -5.3263115882873535, "global_step": 21527, "epoch": 512} {"train_loss": -5.332597732543945, "global_step": 21528, "epoch": 512} {"train_loss": -5.337098121643066, "global_step": 21529, "epoch": 512} {"train_loss": -5.351835250854492, "global_step": 21530, "epoch": 512} {"train_loss": -5.309718132019043, "global_step": 21531, "epoch": 512} {"train_loss": -5.326468467712402, "global_step": 21532, "epoch": 512} {"train_loss": -5.406556129455566, "global_step": 21533, "epoch": 512} {"train_loss": -5.250225067138672, "global_step": 21534, "epoch": 512} {"train_loss": -5.209847450256348, "global_step": 21535, "epoch": 512} {"train_loss": -5.342618942260742, "global_step": 21536, "epoch": 512} {"train_loss": -5.222341060638428, "global_step": 21537, "epoch": 512} {"train_loss": -5.453512191772461, "global_step": 21538, "epoch": 512} {"train_loss": -5.427633762359619, "global_step": 21539, "epoch": 512} {"train_loss": -5.211690425872803, "global_step": 21540, "epoch": 512} {"train_loss": -5.33232307434082, "global_step": 21541, "epoch": 512} {"train_loss": -5.372678279876709, "global_step": 21542, "epoch": 512} {"train_loss": -5.243962287902832, "global_step": 21543, "epoch": 512} {"train_loss": -5.310075759887695, "global_step": 21544, "epoch": 512} {"train_loss": -5.326495136533465, "global_step": 21545, "epoch": 512, "val_loss": 67063.90625} {"train_loss": -5.393730163574219, "global_step": 21546, "epoch": 513} {"train_loss": -5.2843523025512695, "global_step": 21547, "epoch": 513} {"train_loss": -5.270266532897949, "global_step": 21548, "epoch": 513} {"train_loss": -5.3654890060424805, "global_step": 21549, "epoch": 513} {"train_loss": -5.26312255859375, "global_step": 21550, "epoch": 513} {"train_loss": -5.260001182556152, "global_step": 21551, "epoch": 513} {"train_loss": -5.363617897033691, "global_step": 21552, "epoch": 513} {"train_loss": -5.239013671875, "global_step": 21553, "epoch": 513} {"train_loss": -5.360426902770996, "global_step": 21554, "epoch": 513} {"train_loss": -5.386814117431641, "global_step": 21555, "epoch": 513} {"train_loss": -5.186582565307617, "global_step": 21556, "epoch": 513} {"train_loss": -5.360055923461914, "global_step": 21557, "epoch": 513} {"train_loss": -5.331250190734863, "global_step": 21558, "epoch": 513} {"train_loss": -5.340647220611572, "global_step": 21559, "epoch": 513} {"train_loss": -5.4298176765441895, "global_step": 21560, "epoch": 513} {"train_loss": -5.361011505126953, "global_step": 21561, "epoch": 513} {"train_loss": -5.369096755981445, "global_step": 21562, "epoch": 513} {"train_loss": -5.486821174621582, "global_step": 21563, "epoch": 513} {"train_loss": -5.299569129943848, "global_step": 21564, "epoch": 513} {"train_loss": -5.429156303405762, "global_step": 21565, "epoch": 513} {"train_loss": -5.281345367431641, "global_step": 21566, "epoch": 513} {"train_loss": -5.279214382171631, "global_step": 21567, "epoch": 513} {"train_loss": -5.379264831542969, "global_step": 21568, "epoch": 513} {"train_loss": -5.403642177581787, "global_step": 21569, "epoch": 513} {"train_loss": -5.368647575378418, "global_step": 21570, "epoch": 513} {"train_loss": -5.232706546783447, "global_step": 21571, "epoch": 513} {"train_loss": -5.239114761352539, "global_step": 21572, "epoch": 513} {"train_loss": -5.280618190765381, "global_step": 21573, "epoch": 513} {"train_loss": -5.269078731536865, "global_step": 21574, "epoch": 513} {"train_loss": -5.1249494552612305, "global_step": 21575, "epoch": 513} {"train_loss": -5.374246597290039, "global_step": 21576, "epoch": 513} {"train_loss": -5.333012580871582, "global_step": 21577, "epoch": 513} {"train_loss": -5.267149448394775, "global_step": 21578, "epoch": 513} {"train_loss": -5.292755603790283, "global_step": 21579, "epoch": 513} {"train_loss": -5.331192970275879, "global_step": 21580, "epoch": 513} {"train_loss": -5.1700439453125, "global_step": 21581, "epoch": 513} {"train_loss": -5.3100738525390625, "global_step": 21582, "epoch": 513} {"train_loss": -5.226352691650391, "global_step": 21583, "epoch": 513} {"train_loss": -5.284359931945801, "global_step": 21584, "epoch": 513} {"train_loss": -5.4479660987854, "global_step": 21585, "epoch": 513} {"train_loss": -5.325584411621094, "global_step": 21586, "epoch": 513} {"train_loss": -5.3190078508286245, "global_step": 21587, "epoch": 513, "val_loss": 66757.5078125} {"train_loss": -5.320630073547363, "global_step": 21588, "epoch": 514} {"train_loss": -5.248415946960449, "global_step": 21589, "epoch": 514} {"train_loss": -5.260039329528809, "global_step": 21590, "epoch": 514} {"train_loss": -5.244772911071777, "global_step": 21591, "epoch": 514} {"train_loss": -5.28704833984375, "global_step": 21592, "epoch": 514} {"train_loss": -5.3348164558410645, "global_step": 21593, "epoch": 514} {"train_loss": -5.309642791748047, "global_step": 21594, "epoch": 514} {"train_loss": -5.356579303741455, "global_step": 21595, "epoch": 514} {"train_loss": -5.473040580749512, "global_step": 21596, "epoch": 514} {"train_loss": -5.311446189880371, "global_step": 21597, "epoch": 514} {"train_loss": -5.253381729125977, "global_step": 21598, "epoch": 514} {"train_loss": -5.301851749420166, "global_step": 21599, "epoch": 514} {"train_loss": -5.56793212890625, "global_step": 21600, "epoch": 514} {"train_loss": -5.3877034187316895, "global_step": 21601, "epoch": 514} {"train_loss": -5.475008010864258, "global_step": 21602, "epoch": 514} {"train_loss": -5.43563175201416, "global_step": 21603, "epoch": 514} {"train_loss": -5.328665733337402, "global_step": 21604, "epoch": 514} {"train_loss": -5.459866523742676, "global_step": 21605, "epoch": 514} {"train_loss": -5.456623077392578, "global_step": 21606, "epoch": 514} {"train_loss": -5.315138816833496, "global_step": 21607, "epoch": 514} {"train_loss": -5.356322288513184, "global_step": 21608, "epoch": 514} {"train_loss": -5.401201248168945, "global_step": 21609, "epoch": 514} {"train_loss": -5.343422889709473, "global_step": 21610, "epoch": 514} {"train_loss": -5.207796096801758, "global_step": 21611, "epoch": 514} {"train_loss": -5.273787498474121, "global_step": 21612, "epoch": 514} {"train_loss": -5.406185626983643, "global_step": 21613, "epoch": 514} {"train_loss": -5.249279975891113, "global_step": 21614, "epoch": 514} {"train_loss": -5.144492149353027, "global_step": 21615, "epoch": 514} {"train_loss": -5.24796199798584, "global_step": 21616, "epoch": 514} {"train_loss": -5.231511116027832, "global_step": 21617, "epoch": 514} {"train_loss": -5.202428817749023, "global_step": 21618, "epoch": 514} {"train_loss": -5.374179840087891, "global_step": 21619, "epoch": 514} {"train_loss": -5.295657634735107, "global_step": 21620, "epoch": 514} {"train_loss": -5.251165390014648, "global_step": 21621, "epoch": 514} {"train_loss": -5.311992168426514, "global_step": 21622, "epoch": 514} {"train_loss": -5.308793067932129, "global_step": 21623, "epoch": 514} {"train_loss": -5.239658355712891, "global_step": 21624, "epoch": 514} {"train_loss": -5.417669296264648, "global_step": 21625, "epoch": 514} {"train_loss": -5.4605937004089355, "global_step": 21626, "epoch": 514} {"train_loss": -5.249677658081055, "global_step": 21627, "epoch": 514} {"train_loss": -5.426169395446777, "global_step": 21628, "epoch": 514} {"train_loss": -5.332748640151251, "global_step": 21629, "epoch": 514, "val_loss": 66684.5859375} {"train_loss": -5.364423751831055, "global_step": 21630, "epoch": 515} {"train_loss": -5.399376392364502, "global_step": 21631, "epoch": 515} {"train_loss": -5.438359260559082, "global_step": 21632, "epoch": 515} {"train_loss": -5.354598045349121, "global_step": 21633, "epoch": 515} {"train_loss": -5.371991157531738, "global_step": 21634, "epoch": 515} {"train_loss": -5.314579010009766, "global_step": 21635, "epoch": 515} {"train_loss": -5.299092769622803, "global_step": 21636, "epoch": 515} {"train_loss": -5.214177131652832, "global_step": 21637, "epoch": 515} {"train_loss": -5.26105260848999, "global_step": 21638, "epoch": 515} {"train_loss": -5.340770244598389, "global_step": 21639, "epoch": 515} {"train_loss": -5.326084136962891, "global_step": 21640, "epoch": 515} {"train_loss": -5.355982780456543, "global_step": 21641, "epoch": 515} {"train_loss": -5.396206855773926, "global_step": 21642, "epoch": 515} {"train_loss": -5.1354875564575195, "global_step": 21643, "epoch": 515} {"train_loss": -5.373443603515625, "global_step": 21644, "epoch": 515} {"train_loss": -5.374545097351074, "global_step": 21645, "epoch": 515} {"train_loss": -5.305666446685791, "global_step": 21646, "epoch": 515} {"train_loss": -5.187465667724609, "global_step": 21647, "epoch": 515} {"train_loss": -5.348661422729492, "global_step": 21648, "epoch": 515} {"train_loss": -5.287092685699463, "global_step": 21649, "epoch": 515} {"train_loss": -5.301347732543945, "global_step": 21650, "epoch": 515} {"train_loss": -5.3887434005737305, "global_step": 21651, "epoch": 515} {"train_loss": -5.2471513748168945, "global_step": 21652, "epoch": 515} {"train_loss": -5.168048858642578, "global_step": 21653, "epoch": 515} {"train_loss": -5.45156717300415, "global_step": 21654, "epoch": 515} {"train_loss": -5.2265543937683105, "global_step": 21655, "epoch": 515} {"train_loss": -5.324544906616211, "global_step": 21656, "epoch": 515} {"train_loss": -5.323772430419922, "global_step": 21657, "epoch": 515} {"train_loss": -5.273227214813232, "global_step": 21658, "epoch": 515} {"train_loss": -5.329509735107422, "global_step": 21659, "epoch": 515} {"train_loss": -5.348193168640137, "global_step": 21660, "epoch": 515} {"train_loss": -5.2445220947265625, "global_step": 21661, "epoch": 515} {"train_loss": -5.200506210327148, "global_step": 21662, "epoch": 515} {"train_loss": -5.332785129547119, "global_step": 21663, "epoch": 515} {"train_loss": -5.256706237792969, "global_step": 21664, "epoch": 515} {"train_loss": -5.29594087600708, "global_step": 21665, "epoch": 515} {"train_loss": -5.19843864440918, "global_step": 21666, "epoch": 515} {"train_loss": -5.323775291442871, "global_step": 21667, "epoch": 515} {"train_loss": -5.433821678161621, "global_step": 21668, "epoch": 515} {"train_loss": -5.373686790466309, "global_step": 21669, "epoch": 515} {"train_loss": -5.197305679321289, "global_step": 21670, "epoch": 515} {"train_loss": -5.312756549744379, "global_step": 21671, "epoch": 515, "val_loss": 66922.3359375} {"train_loss": -5.255091667175293, "global_step": 21672, "epoch": 516} {"train_loss": -5.352579593658447, "global_step": 21673, "epoch": 516} {"train_loss": -5.438624858856201, "global_step": 21674, "epoch": 516} {"train_loss": -5.346567153930664, "global_step": 21675, "epoch": 516} {"train_loss": -5.479152202606201, "global_step": 21676, "epoch": 516} {"train_loss": -5.298239231109619, "global_step": 21677, "epoch": 516} {"train_loss": -5.355983734130859, "global_step": 21678, "epoch": 516} {"train_loss": -5.394908428192139, "global_step": 21679, "epoch": 516} {"train_loss": -5.3670654296875, "global_step": 21680, "epoch": 516} {"train_loss": -5.521188735961914, "global_step": 21681, "epoch": 516} {"train_loss": -5.429044723510742, "global_step": 21682, "epoch": 516} {"train_loss": -5.389759063720703, "global_step": 21683, "epoch": 516} {"train_loss": -5.321829795837402, "global_step": 21684, "epoch": 516} {"train_loss": -5.41541862487793, "global_step": 21685, "epoch": 516} {"train_loss": -5.353908061981201, "global_step": 21686, "epoch": 516} {"train_loss": -5.2154951095581055, "global_step": 21687, "epoch": 516} {"train_loss": -5.21382474899292, "global_step": 21688, "epoch": 516} {"train_loss": -5.327640533447266, "global_step": 21689, "epoch": 516} {"train_loss": -5.454684257507324, "global_step": 21690, "epoch": 516} {"train_loss": -5.28398323059082, "global_step": 21691, "epoch": 516} {"train_loss": -5.312971115112305, "global_step": 21692, "epoch": 516} {"train_loss": -5.30349588394165, "global_step": 21693, "epoch": 516} {"train_loss": -5.286597728729248, "global_step": 21694, "epoch": 516} {"train_loss": -5.2635297775268555, "global_step": 21695, "epoch": 516} {"train_loss": -5.321272373199463, "global_step": 21696, "epoch": 516} {"train_loss": -5.276954650878906, "global_step": 21697, "epoch": 516} {"train_loss": -5.274003028869629, "global_step": 21698, "epoch": 516} {"train_loss": -5.395933151245117, "global_step": 21699, "epoch": 516} {"train_loss": -5.304497718811035, "global_step": 21700, "epoch": 516} {"train_loss": -5.354405403137207, "global_step": 21701, "epoch": 516} {"train_loss": -5.406467914581299, "global_step": 21702, "epoch": 516} {"train_loss": -5.391729831695557, "global_step": 21703, "epoch": 516} {"train_loss": -5.4905548095703125, "global_step": 21704, "epoch": 516} {"train_loss": -5.384482383728027, "global_step": 21705, "epoch": 516} {"train_loss": -5.397696495056152, "global_step": 21706, "epoch": 516} {"train_loss": -5.302683353424072, "global_step": 21707, "epoch": 516} {"train_loss": -5.253055095672607, "global_step": 21708, "epoch": 516} {"train_loss": -5.347041606903076, "global_step": 21709, "epoch": 516} {"train_loss": -5.365212440490723, "global_step": 21710, "epoch": 516} {"train_loss": -5.267256259918213, "global_step": 21711, "epoch": 516} {"train_loss": -5.356701850891113, "global_step": 21712, "epoch": 516} {"train_loss": -5.3489376817430765, "global_step": 21713, "epoch": 516, "val_loss": 66654.0} {"train_loss": -5.371420383453369, "global_step": 21714, "epoch": 517} {"train_loss": -5.263287544250488, "global_step": 21715, "epoch": 517} {"train_loss": -5.27852725982666, "global_step": 21716, "epoch": 517} {"train_loss": -5.270712852478027, "global_step": 21717, "epoch": 517} {"train_loss": -5.130281448364258, "global_step": 21718, "epoch": 517} {"train_loss": -5.3399505615234375, "global_step": 21719, "epoch": 517} {"train_loss": -5.414880752563477, "global_step": 21720, "epoch": 517} {"train_loss": -5.286931991577148, "global_step": 21721, "epoch": 517} {"train_loss": -5.243309020996094, "global_step": 21722, "epoch": 517} {"train_loss": -5.378536701202393, "global_step": 21723, "epoch": 517} {"train_loss": -5.135868072509766, "global_step": 21724, "epoch": 517} {"train_loss": -5.37489128112793, "global_step": 21725, "epoch": 517} {"train_loss": -5.288684368133545, "global_step": 21726, "epoch": 517} {"train_loss": -5.294856071472168, "global_step": 21727, "epoch": 517} {"train_loss": -5.27580451965332, "global_step": 21728, "epoch": 517} {"train_loss": -5.357779026031494, "global_step": 21729, "epoch": 517} {"train_loss": -5.3578386306762695, "global_step": 21730, "epoch": 517} {"train_loss": -5.200073719024658, "global_step": 21731, "epoch": 517} {"train_loss": -5.2779011726379395, "global_step": 21732, "epoch": 517} {"train_loss": -5.357163429260254, "global_step": 21733, "epoch": 517} {"train_loss": -5.273324012756348, "global_step": 21734, "epoch": 517} {"train_loss": -5.389334201812744, "global_step": 21735, "epoch": 517} {"train_loss": -5.443787574768066, "global_step": 21736, "epoch": 517} {"train_loss": -5.267200946807861, "global_step": 21737, "epoch": 517} {"train_loss": -5.311864376068115, "global_step": 21738, "epoch": 517} {"train_loss": -5.391467571258545, "global_step": 21739, "epoch": 517} {"train_loss": -5.345391273498535, "global_step": 21740, "epoch": 517} {"train_loss": -5.458623886108398, "global_step": 21741, "epoch": 517} {"train_loss": -5.375588417053223, "global_step": 21742, "epoch": 517} {"train_loss": -5.314384937286377, "global_step": 21743, "epoch": 517} {"train_loss": -5.349026679992676, "global_step": 21744, "epoch": 517} {"train_loss": -5.315014839172363, "global_step": 21745, "epoch": 517} {"train_loss": -5.141537189483643, "global_step": 21746, "epoch": 517} {"train_loss": -5.4022345542907715, "global_step": 21747, "epoch": 517} {"train_loss": -5.350050926208496, "global_step": 21748, "epoch": 517} {"train_loss": -5.2461628913879395, "global_step": 21749, "epoch": 517} {"train_loss": -5.215326309204102, "global_step": 21750, "epoch": 517} {"train_loss": -5.315000534057617, "global_step": 21751, "epoch": 517} {"train_loss": -5.39655876159668, "global_step": 21752, "epoch": 517} {"train_loss": -5.359679222106934, "global_step": 21753, "epoch": 517} {"train_loss": -5.230642318725586, "global_step": 21754, "epoch": 517} {"train_loss": -5.313101382482619, "global_step": 21755, "epoch": 517, "val_loss": 66657.6875} {"train_loss": -5.3251543045043945, "global_step": 21756, "epoch": 518} {"train_loss": -5.288668632507324, "global_step": 21757, "epoch": 518} {"train_loss": -5.323119163513184, "global_step": 21758, "epoch": 518} {"train_loss": -5.397843360900879, "global_step": 21759, "epoch": 518} {"train_loss": -5.312094211578369, "global_step": 21760, "epoch": 518} {"train_loss": -5.304006576538086, "global_step": 21761, "epoch": 518} {"train_loss": -5.475461959838867, "global_step": 21762, "epoch": 518} {"train_loss": -5.3933210372924805, "global_step": 21763, "epoch": 518} {"train_loss": -5.377866744995117, "global_step": 21764, "epoch": 518} {"train_loss": -5.265807151794434, "global_step": 21765, "epoch": 518} {"train_loss": -5.419201374053955, "global_step": 21766, "epoch": 518} {"train_loss": -5.374538421630859, "global_step": 21767, "epoch": 518} {"train_loss": -5.305828094482422, "global_step": 21768, "epoch": 518} {"train_loss": -5.272678375244141, "global_step": 21769, "epoch": 518} {"train_loss": -5.410816192626953, "global_step": 21770, "epoch": 518} {"train_loss": -5.459568023681641, "global_step": 21771, "epoch": 518} {"train_loss": -5.402675151824951, "global_step": 21772, "epoch": 518} {"train_loss": -5.315510272979736, "global_step": 21773, "epoch": 518} {"train_loss": -5.29091739654541, "global_step": 21774, "epoch": 518} {"train_loss": -5.389194488525391, "global_step": 21775, "epoch": 518} {"train_loss": -5.319658279418945, "global_step": 21776, "epoch": 518} {"train_loss": -5.393423557281494, "global_step": 21777, "epoch": 518} {"train_loss": -5.318097114562988, "global_step": 21778, "epoch": 518} {"train_loss": -5.446009635925293, "global_step": 21779, "epoch": 518} {"train_loss": -5.395847320556641, "global_step": 21780, "epoch": 518} {"train_loss": -5.263197898864746, "global_step": 21781, "epoch": 518} {"train_loss": -5.175991535186768, "global_step": 21782, "epoch": 518} {"train_loss": -5.33785343170166, "global_step": 21783, "epoch": 518} {"train_loss": -5.310997486114502, "global_step": 21784, "epoch": 518} {"train_loss": -5.358800888061523, "global_step": 21785, "epoch": 518} {"train_loss": -5.306012153625488, "global_step": 21786, "epoch": 518} {"train_loss": -5.302960395812988, "global_step": 21787, "epoch": 518} {"train_loss": -5.273784160614014, "global_step": 21788, "epoch": 518} {"train_loss": -5.341958045959473, "global_step": 21789, "epoch": 518} {"train_loss": -5.217228889465332, "global_step": 21790, "epoch": 518} {"train_loss": -5.334288597106934, "global_step": 21791, "epoch": 518} {"train_loss": -5.043560028076172, "global_step": 21792, "epoch": 518} {"train_loss": -5.319382667541504, "global_step": 21793, "epoch": 518} {"train_loss": -5.273281574249268, "global_step": 21794, "epoch": 518} {"train_loss": -5.183953285217285, "global_step": 21795, "epoch": 518} {"train_loss": -5.234821319580078, "global_step": 21796, "epoch": 518} {"train_loss": -5.322595323835101, "global_step": 21797, "epoch": 518, "val_loss": 67961.9453125} {"train_loss": -5.168658256530762, "global_step": 21798, "epoch": 519} {"train_loss": -5.338712692260742, "global_step": 21799, "epoch": 519} {"train_loss": -5.276517868041992, "global_step": 21800, "epoch": 519} {"train_loss": -5.2621660232543945, "global_step": 21801, "epoch": 519} {"train_loss": -5.300714492797852, "global_step": 21802, "epoch": 519} {"train_loss": -5.20845890045166, "global_step": 21803, "epoch": 519} {"train_loss": -5.292814254760742, "global_step": 21804, "epoch": 519} {"train_loss": -5.371187686920166, "global_step": 21805, "epoch": 519} {"train_loss": -5.1920576095581055, "global_step": 21806, "epoch": 519} {"train_loss": -5.316762924194336, "global_step": 21807, "epoch": 519} {"train_loss": -5.200767517089844, "global_step": 21808, "epoch": 519} {"train_loss": -5.403704643249512, "global_step": 21809, "epoch": 519} {"train_loss": -5.400579452514648, "global_step": 21810, "epoch": 519} {"train_loss": -5.149711608886719, "global_step": 21811, "epoch": 519} {"train_loss": -5.3640336990356445, "global_step": 21812, "epoch": 519} {"train_loss": -5.125410079956055, "global_step": 21813, "epoch": 519} {"train_loss": -5.158947944641113, "global_step": 21814, "epoch": 519} {"train_loss": -5.216161727905273, "global_step": 21815, "epoch": 519} {"train_loss": -5.282963752746582, "global_step": 21816, "epoch": 519} {"train_loss": -5.205092906951904, "global_step": 21817, "epoch": 519} {"train_loss": -5.354725360870361, "global_step": 21818, "epoch": 519} {"train_loss": -5.384616851806641, "global_step": 21819, "epoch": 519} {"train_loss": -5.284167289733887, "global_step": 21820, "epoch": 519} {"train_loss": -5.240354061126709, "global_step": 21821, "epoch": 519} {"train_loss": -5.387720584869385, "global_step": 21822, "epoch": 519} {"train_loss": -5.332669734954834, "global_step": 21823, "epoch": 519} {"train_loss": -5.336601257324219, "global_step": 21824, "epoch": 519} {"train_loss": -5.334753036499023, "global_step": 21825, "epoch": 519} {"train_loss": -5.185394287109375, "global_step": 21826, "epoch": 519} {"train_loss": -5.237826824188232, "global_step": 21827, "epoch": 519} {"train_loss": -5.336663246154785, "global_step": 21828, "epoch": 519} {"train_loss": -5.244670867919922, "global_step": 21829, "epoch": 519} {"train_loss": -5.368710517883301, "global_step": 21830, "epoch": 519} {"train_loss": -5.152601718902588, "global_step": 21831, "epoch": 519} {"train_loss": -5.426150321960449, "global_step": 21832, "epoch": 519} {"train_loss": -5.069610595703125, "global_step": 21833, "epoch": 519} {"train_loss": -5.201889991760254, "global_step": 21834, "epoch": 519} {"train_loss": -5.262969017028809, "global_step": 21835, "epoch": 519} {"train_loss": -5.1217474937438965, "global_step": 21836, "epoch": 519} {"train_loss": -5.449141025543213, "global_step": 21837, "epoch": 519} {"train_loss": -5.3345208168029785, "global_step": 21838, "epoch": 519} {"train_loss": -5.276312192281087, "global_step": 21839, "epoch": 519, "val_loss": 66555.7890625} {"train_loss": -5.192020416259766, "global_step": 21840, "epoch": 520} {"train_loss": -5.233377933502197, "global_step": 21841, "epoch": 520} {"train_loss": -5.371321678161621, "global_step": 21842, "epoch": 520} {"train_loss": -5.288253307342529, "global_step": 21843, "epoch": 520} {"train_loss": -5.358400344848633, "global_step": 21844, "epoch": 520} {"train_loss": -5.4670844078063965, "global_step": 21845, "epoch": 520} {"train_loss": -5.164546966552734, "global_step": 21846, "epoch": 520} {"train_loss": -5.275995254516602, "global_step": 21847, "epoch": 520} {"train_loss": -5.387392997741699, "global_step": 21848, "epoch": 520} {"train_loss": -5.425985336303711, "global_step": 21849, "epoch": 520} {"train_loss": -5.340280532836914, "global_step": 21850, "epoch": 520} {"train_loss": -5.28813362121582, "global_step": 21851, "epoch": 520} {"train_loss": -5.340314865112305, "global_step": 21852, "epoch": 520} {"train_loss": -5.33582067489624, "global_step": 21853, "epoch": 520} {"train_loss": -5.449960708618164, "global_step": 21854, "epoch": 520} {"train_loss": -5.380661964416504, "global_step": 21855, "epoch": 520} {"train_loss": -5.2502946853637695, "global_step": 21856, "epoch": 520} {"train_loss": -5.343315124511719, "global_step": 21857, "epoch": 520} {"train_loss": -5.305254936218262, "global_step": 21858, "epoch": 520} {"train_loss": -5.310206413269043, "global_step": 21859, "epoch": 520} {"train_loss": -5.2486724853515625, "global_step": 21860, "epoch": 520} {"train_loss": -5.4229888916015625, "global_step": 21861, "epoch": 520} {"train_loss": -5.178194046020508, "global_step": 21862, "epoch": 520} {"train_loss": -5.367250442504883, "global_step": 21863, "epoch": 520} {"train_loss": -5.245718002319336, "global_step": 21864, "epoch": 520} {"train_loss": -5.374513626098633, "global_step": 21865, "epoch": 520} {"train_loss": -5.33804988861084, "global_step": 21866, "epoch": 520} {"train_loss": -5.391408920288086, "global_step": 21867, "epoch": 520} {"train_loss": -5.289576053619385, "global_step": 21868, "epoch": 520} {"train_loss": -5.259007453918457, "global_step": 21869, "epoch": 520} {"train_loss": -5.316320896148682, "global_step": 21870, "epoch": 520} {"train_loss": -5.351311683654785, "global_step": 21871, "epoch": 520} {"train_loss": -5.2507524490356445, "global_step": 21872, "epoch": 520} {"train_loss": -5.222625732421875, "global_step": 21873, "epoch": 520} {"train_loss": -5.37973165512085, "global_step": 21874, "epoch": 520} {"train_loss": -5.284424781799316, "global_step": 21875, "epoch": 520} {"train_loss": -5.230347156524658, "global_step": 21876, "epoch": 520} {"train_loss": -5.4791951179504395, "global_step": 21877, "epoch": 520} {"train_loss": -5.336980819702148, "global_step": 21878, "epoch": 520} {"train_loss": -5.312425136566162, "global_step": 21879, "epoch": 520} {"train_loss": -5.297817230224609, "global_step": 21880, "epoch": 520} {"train_loss": -5.319171440033686, "global_step": 21881, "epoch": 520, "val_loss": 66652.203125} {"train_loss": -5.306677341461182, "global_step": 21882, "epoch": 521} {"train_loss": -5.364317417144775, "global_step": 21883, "epoch": 521} {"train_loss": -5.290128231048584, "global_step": 21884, "epoch": 521} {"train_loss": -5.176580429077148, "global_step": 21885, "epoch": 521} {"train_loss": -5.292909145355225, "global_step": 21886, "epoch": 521} {"train_loss": -5.23311710357666, "global_step": 21887, "epoch": 521} {"train_loss": -5.303850173950195, "global_step": 21888, "epoch": 521} {"train_loss": -5.40936803817749, "global_step": 21889, "epoch": 521} {"train_loss": -5.232179641723633, "global_step": 21890, "epoch": 521} {"train_loss": -5.312248229980469, "global_step": 21891, "epoch": 521} {"train_loss": -5.094623565673828, "global_step": 21892, "epoch": 521} {"train_loss": -5.298504829406738, "global_step": 21893, "epoch": 521} {"train_loss": -5.223830223083496, "global_step": 21894, "epoch": 521} {"train_loss": -5.315461158752441, "global_step": 21895, "epoch": 521} {"train_loss": -5.349453926086426, "global_step": 21896, "epoch": 521} {"train_loss": -5.238983631134033, "global_step": 21897, "epoch": 521} {"train_loss": -5.3698410987854, "global_step": 21898, "epoch": 521} {"train_loss": -5.243465423583984, "global_step": 21899, "epoch": 521} {"train_loss": -5.374077796936035, "global_step": 21900, "epoch": 521} {"train_loss": -5.326239585876465, "global_step": 21901, "epoch": 521} {"train_loss": -5.31514835357666, "global_step": 21902, "epoch": 521} {"train_loss": -5.430424213409424, "global_step": 21903, "epoch": 521} {"train_loss": -5.289670944213867, "global_step": 21904, "epoch": 521} {"train_loss": -5.264344215393066, "global_step": 21905, "epoch": 521} {"train_loss": -5.253882884979248, "global_step": 21906, "epoch": 521} {"train_loss": -5.340940475463867, "global_step": 21907, "epoch": 521} {"train_loss": -5.355710506439209, "global_step": 21908, "epoch": 521} {"train_loss": -5.193213939666748, "global_step": 21909, "epoch": 521} {"train_loss": -5.3649115562438965, "global_step": 21910, "epoch": 521} {"train_loss": -5.3202009201049805, "global_step": 21911, "epoch": 521} {"train_loss": -5.289560317993164, "global_step": 21912, "epoch": 521} {"train_loss": -5.354571342468262, "global_step": 21913, "epoch": 521} {"train_loss": -5.40696382522583, "global_step": 21914, "epoch": 521} {"train_loss": -5.288010597229004, "global_step": 21915, "epoch": 521} {"train_loss": -5.241254806518555, "global_step": 21916, "epoch": 521} {"train_loss": -5.288890838623047, "global_step": 21917, "epoch": 521} {"train_loss": -5.219118595123291, "global_step": 21918, "epoch": 521} {"train_loss": -5.282678604125977, "global_step": 21919, "epoch": 521} {"train_loss": -5.398290634155273, "global_step": 21920, "epoch": 521} {"train_loss": -5.279794692993164, "global_step": 21921, "epoch": 521} {"train_loss": -5.270524024963379, "global_step": 21922, "epoch": 521} {"train_loss": -5.29876496678307, "global_step": 21923, "epoch": 521, "val_loss": 66432.71875} {"train_loss": -5.3002166748046875, "global_step": 21924, "epoch": 522} {"train_loss": -5.311163902282715, "global_step": 21925, "epoch": 522} {"train_loss": -5.279234409332275, "global_step": 21926, "epoch": 522} {"train_loss": -5.1280598640441895, "global_step": 21927, "epoch": 522} {"train_loss": -5.178391456604004, "global_step": 21928, "epoch": 522} {"train_loss": -5.2840576171875, "global_step": 21929, "epoch": 522} {"train_loss": -5.43011474609375, "global_step": 21930, "epoch": 522} {"train_loss": -5.457723140716553, "global_step": 21931, "epoch": 522} {"train_loss": -5.343072414398193, "global_step": 21932, "epoch": 522} {"train_loss": -5.4112701416015625, "global_step": 21933, "epoch": 522} {"train_loss": -5.33726692199707, "global_step": 21934, "epoch": 522} {"train_loss": -5.372042655944824, "global_step": 21935, "epoch": 522} {"train_loss": -5.446804046630859, "global_step": 21936, "epoch": 522} {"train_loss": -5.3670196533203125, "global_step": 21937, "epoch": 522} {"train_loss": -5.4466376304626465, "global_step": 21938, "epoch": 522} {"train_loss": -5.499027729034424, "global_step": 21939, "epoch": 522} {"train_loss": -5.384034156799316, "global_step": 21940, "epoch": 522} {"train_loss": -5.375299453735352, "global_step": 21941, "epoch": 522} {"train_loss": -5.367966651916504, "global_step": 21942, "epoch": 522} {"train_loss": -5.438128471374512, "global_step": 21943, "epoch": 522} {"train_loss": -5.446761131286621, "global_step": 21944, "epoch": 522} {"train_loss": -5.25360107421875, "global_step": 21945, "epoch": 522} {"train_loss": -5.304635047912598, "global_step": 21946, "epoch": 522} {"train_loss": -5.405971527099609, "global_step": 21947, "epoch": 522} {"train_loss": -5.4820051193237305, "global_step": 21948, "epoch": 522} {"train_loss": -5.235102653503418, "global_step": 21949, "epoch": 522} {"train_loss": -5.373104572296143, "global_step": 21950, "epoch": 522} {"train_loss": -5.339629650115967, "global_step": 21951, "epoch": 522} {"train_loss": -5.358230113983154, "global_step": 21952, "epoch": 522} {"train_loss": -5.296682357788086, "global_step": 21953, "epoch": 522} {"train_loss": -5.323905944824219, "global_step": 21954, "epoch": 522} {"train_loss": -5.449099063873291, "global_step": 21955, "epoch": 522} {"train_loss": -5.186397075653076, "global_step": 21956, "epoch": 522} {"train_loss": -5.357850074768066, "global_step": 21957, "epoch": 522} {"train_loss": -5.337719917297363, "global_step": 21958, "epoch": 522} {"train_loss": -5.306041240692139, "global_step": 21959, "epoch": 522} {"train_loss": -5.4162750244140625, "global_step": 21960, "epoch": 522} {"train_loss": -5.404541492462158, "global_step": 21961, "epoch": 522} {"train_loss": -5.3069634437561035, "global_step": 21962, "epoch": 522} {"train_loss": -5.2805562019348145, "global_step": 21963, "epoch": 522} {"train_loss": -5.3217267990112305, "global_step": 21964, "epoch": 522} {"train_loss": -5.348557597114926, "global_step": 21965, "epoch": 522, "val_loss": 66674.7734375} {"train_loss": -5.25352668762207, "global_step": 21966, "epoch": 523} {"train_loss": -5.313838958740234, "global_step": 21967, "epoch": 523} {"train_loss": -5.396467208862305, "global_step": 21968, "epoch": 523} {"train_loss": -5.413416862487793, "global_step": 21969, "epoch": 523} {"train_loss": -5.276479721069336, "global_step": 21970, "epoch": 523} {"train_loss": -5.3857927322387695, "global_step": 21971, "epoch": 523} {"train_loss": -5.481426239013672, "global_step": 21972, "epoch": 523} {"train_loss": -5.299467086791992, "global_step": 21973, "epoch": 523} {"train_loss": -5.33648681640625, "global_step": 21974, "epoch": 523} {"train_loss": -5.370356559753418, "global_step": 21975, "epoch": 523} {"train_loss": -5.358572959899902, "global_step": 21976, "epoch": 523} {"train_loss": -5.14012336730957, "global_step": 21977, "epoch": 523} {"train_loss": -5.527575492858887, "global_step": 21978, "epoch": 523} {"train_loss": -5.2866363525390625, "global_step": 21979, "epoch": 523} {"train_loss": -5.333428382873535, "global_step": 21980, "epoch": 523} {"train_loss": -5.3309478759765625, "global_step": 21981, "epoch": 523} {"train_loss": -5.364166736602783, "global_step": 21982, "epoch": 523} {"train_loss": -5.197339057922363, "global_step": 21983, "epoch": 523} {"train_loss": -5.482224464416504, "global_step": 21984, "epoch": 523} {"train_loss": -5.494219779968262, "global_step": 21985, "epoch": 523} {"train_loss": -5.494895935058594, "global_step": 21986, "epoch": 523} {"train_loss": -5.438910007476807, "global_step": 21987, "epoch": 523} {"train_loss": -5.433107376098633, "global_step": 21988, "epoch": 523} {"train_loss": -5.26967716217041, "global_step": 21989, "epoch": 523} {"train_loss": -5.197981834411621, "global_step": 21990, "epoch": 523} {"train_loss": -5.411012649536133, "global_step": 21991, "epoch": 523} {"train_loss": -5.37470817565918, "global_step": 21992, "epoch": 523} {"train_loss": -5.2445831298828125, "global_step": 21993, "epoch": 523} {"train_loss": -5.31549596786499, "global_step": 21994, "epoch": 523} {"train_loss": -5.352395534515381, "global_step": 21995, "epoch": 523} {"train_loss": -5.333683013916016, "global_step": 21996, "epoch": 523} {"train_loss": -5.397027969360352, "global_step": 21997, "epoch": 523} {"train_loss": -5.305294990539551, "global_step": 21998, "epoch": 523} {"train_loss": -5.283679962158203, "global_step": 21999, "epoch": 523} {"train_loss": -5.324897289276123, "global_step": 22000, "epoch": 523} {"train_loss": -5.26450252532959, "global_step": 22001, "epoch": 523} {"train_loss": -5.341778755187988, "global_step": 22002, "epoch": 523} {"train_loss": -5.4137983322143555, "global_step": 22003, "epoch": 523} {"train_loss": -5.268263816833496, "global_step": 22004, "epoch": 523} {"train_loss": -5.3118815422058105, "global_step": 22005, "epoch": 523} {"train_loss": -5.32620096206665, "global_step": 22006, "epoch": 523} {"train_loss": -5.345217931838262, "global_step": 22007, "epoch": 523, "val_loss": 66699.8671875} {"train_loss": -5.29918098449707, "global_step": 22008, "epoch": 524} {"train_loss": -5.378090858459473, "global_step": 22009, "epoch": 524} {"train_loss": -5.2963714599609375, "global_step": 22010, "epoch": 524} {"train_loss": -5.292618274688721, "global_step": 22011, "epoch": 524} {"train_loss": -5.335390090942383, "global_step": 22012, "epoch": 524} {"train_loss": -5.355678558349609, "global_step": 22013, "epoch": 524} {"train_loss": -5.344521522521973, "global_step": 22014, "epoch": 524} {"train_loss": -5.236556053161621, "global_step": 22015, "epoch": 524} {"train_loss": -5.394526481628418, "global_step": 22016, "epoch": 524} {"train_loss": -5.252618789672852, "global_step": 22017, "epoch": 524} {"train_loss": -5.156367778778076, "global_step": 22018, "epoch": 524} {"train_loss": -5.257291793823242, "global_step": 22019, "epoch": 524} {"train_loss": -5.361066818237305, "global_step": 22020, "epoch": 524} {"train_loss": -5.271200180053711, "global_step": 22021, "epoch": 524} {"train_loss": -5.276196479797363, "global_step": 22022, "epoch": 524} {"train_loss": -5.281847953796387, "global_step": 22023, "epoch": 524} {"train_loss": -5.404914379119873, "global_step": 22024, "epoch": 524} {"train_loss": -5.189934730529785, "global_step": 22025, "epoch": 524} {"train_loss": -5.483467102050781, "global_step": 22026, "epoch": 524} {"train_loss": -5.175899505615234, "global_step": 22027, "epoch": 524} {"train_loss": -5.235243797302246, "global_step": 22028, "epoch": 524} {"train_loss": -5.411402225494385, "global_step": 22029, "epoch": 524} {"train_loss": -5.298285961151123, "global_step": 22030, "epoch": 524} {"train_loss": -5.358245849609375, "global_step": 22031, "epoch": 524} {"train_loss": -5.255954742431641, "global_step": 22032, "epoch": 524} {"train_loss": -5.399495601654053, "global_step": 22033, "epoch": 524} {"train_loss": -5.33640193939209, "global_step": 22034, "epoch": 524} {"train_loss": -5.335535049438477, "global_step": 22035, "epoch": 524} {"train_loss": -5.392111778259277, "global_step": 22036, "epoch": 524} {"train_loss": -5.208832263946533, "global_step": 22037, "epoch": 524} {"train_loss": -5.303097724914551, "global_step": 22038, "epoch": 524} {"train_loss": -5.304432392120361, "global_step": 22039, "epoch": 524} {"train_loss": -5.381321907043457, "global_step": 22040, "epoch": 524} {"train_loss": -5.277929306030273, "global_step": 22041, "epoch": 524} {"train_loss": -5.314623832702637, "global_step": 22042, "epoch": 524} {"train_loss": -5.39985990524292, "global_step": 22043, "epoch": 524} {"train_loss": -5.440799713134766, "global_step": 22044, "epoch": 524} {"train_loss": -5.320798873901367, "global_step": 22045, "epoch": 524} {"train_loss": -5.246487617492676, "global_step": 22046, "epoch": 524} {"train_loss": -5.379731178283691, "global_step": 22047, "epoch": 524} {"train_loss": -5.202192783355713, "global_step": 22048, "epoch": 524} {"train_loss": -5.310641334170387, "global_step": 22049, "epoch": 524, "val_loss": 66757.2421875} {"train_loss": -5.402219295501709, "global_step": 22050, "epoch": 525} {"train_loss": -5.15403938293457, "global_step": 22051, "epoch": 525} {"train_loss": -5.291630744934082, "global_step": 22052, "epoch": 525} {"train_loss": -5.244351387023926, "global_step": 22053, "epoch": 525} {"train_loss": -5.381292343139648, "global_step": 22054, "epoch": 525} {"train_loss": -5.209435939788818, "global_step": 22055, "epoch": 525} {"train_loss": -5.268928527832031, "global_step": 22056, "epoch": 525} {"train_loss": -5.151277542114258, "global_step": 22057, "epoch": 525} {"train_loss": -5.30170202255249, "global_step": 22058, "epoch": 525} {"train_loss": -5.291006088256836, "global_step": 22059, "epoch": 525} {"train_loss": -5.336860656738281, "global_step": 22060, "epoch": 525} {"train_loss": -5.473575592041016, "global_step": 22061, "epoch": 525} {"train_loss": -5.402694225311279, "global_step": 22062, "epoch": 525} {"train_loss": -5.30903434753418, "global_step": 22063, "epoch": 525} {"train_loss": -5.24924898147583, "global_step": 22064, "epoch": 525} {"train_loss": -5.3819146156311035, "global_step": 22065, "epoch": 525} {"train_loss": -5.497672080993652, "global_step": 22066, "epoch": 525} {"train_loss": -5.431915283203125, "global_step": 22067, "epoch": 525} {"train_loss": -5.349111080169678, "global_step": 22068, "epoch": 525} {"train_loss": -5.38899040222168, "global_step": 22069, "epoch": 525} {"train_loss": -5.451385498046875, "global_step": 22070, "epoch": 525} {"train_loss": -5.2603678703308105, "global_step": 22071, "epoch": 525} {"train_loss": -5.368001937866211, "global_step": 22072, "epoch": 525} {"train_loss": -5.381922721862793, "global_step": 22073, "epoch": 525} {"train_loss": -5.263647079467773, "global_step": 22074, "epoch": 525} {"train_loss": -5.186481475830078, "global_step": 22075, "epoch": 525} {"train_loss": -5.419562816619873, "global_step": 22076, "epoch": 525} {"train_loss": -5.155341625213623, "global_step": 22077, "epoch": 525} {"train_loss": -5.285623550415039, "global_step": 22078, "epoch": 525} {"train_loss": -5.27093505859375, "global_step": 22079, "epoch": 525} {"train_loss": -5.075028896331787, "global_step": 22080, "epoch": 525} {"train_loss": -5.201451301574707, "global_step": 22081, "epoch": 525} {"train_loss": -5.399356365203857, "global_step": 22082, "epoch": 525} {"train_loss": -5.311446666717529, "global_step": 22083, "epoch": 525} {"train_loss": -5.220203399658203, "global_step": 22084, "epoch": 525} {"train_loss": -5.359677314758301, "global_step": 22085, "epoch": 525} {"train_loss": -5.370534896850586, "global_step": 22086, "epoch": 525} {"train_loss": -5.2379069328308105, "global_step": 22087, "epoch": 525} {"train_loss": -5.3056488037109375, "global_step": 22088, "epoch": 525} {"train_loss": -5.348199844360352, "global_step": 22089, "epoch": 525} {"train_loss": -5.2471394538879395, "global_step": 22090, "epoch": 525} {"train_loss": -5.3079212847210115, "global_step": 22091, "epoch": 525, "val_loss": 66859.4296875} {"train_loss": -5.292322158813477, "global_step": 22092, "epoch": 526} {"train_loss": -5.385401248931885, "global_step": 22093, "epoch": 526} {"train_loss": -5.343244552612305, "global_step": 22094, "epoch": 526} {"train_loss": -5.31450080871582, "global_step": 22095, "epoch": 526} {"train_loss": -5.439696788787842, "global_step": 22096, "epoch": 526} {"train_loss": -5.386096000671387, "global_step": 22097, "epoch": 526} {"train_loss": -5.26269006729126, "global_step": 22098, "epoch": 526} {"train_loss": -5.4199066162109375, "global_step": 22099, "epoch": 526} {"train_loss": -5.265921115875244, "global_step": 22100, "epoch": 526} {"train_loss": -5.367443084716797, "global_step": 22101, "epoch": 526} {"train_loss": -5.369353294372559, "global_step": 22102, "epoch": 526} {"train_loss": -5.270874500274658, "global_step": 22103, "epoch": 526} {"train_loss": -5.3306379318237305, "global_step": 22104, "epoch": 526} {"train_loss": -5.285508155822754, "global_step": 22105, "epoch": 526} {"train_loss": -5.333135604858398, "global_step": 22106, "epoch": 526} {"train_loss": -5.3808393478393555, "global_step": 22107, "epoch": 526} {"train_loss": -5.325493812561035, "global_step": 22108, "epoch": 526} {"train_loss": -5.2444868087768555, "global_step": 22109, "epoch": 526} {"train_loss": -5.308629512786865, "global_step": 22110, "epoch": 526} {"train_loss": -5.320319652557373, "global_step": 22111, "epoch": 526} {"train_loss": -5.164432525634766, "global_step": 22112, "epoch": 526} {"train_loss": -5.390295028686523, "global_step": 22113, "epoch": 526} {"train_loss": -5.176364421844482, "global_step": 22114, "epoch": 526} {"train_loss": -5.334794044494629, "global_step": 22115, "epoch": 526} {"train_loss": -5.341294765472412, "global_step": 22116, "epoch": 526} {"train_loss": -5.127032279968262, "global_step": 22117, "epoch": 526} {"train_loss": -5.240818977355957, "global_step": 22118, "epoch": 526} {"train_loss": -5.100748062133789, "global_step": 22119, "epoch": 526} {"train_loss": -5.234490394592285, "global_step": 22120, "epoch": 526} {"train_loss": -5.204714775085449, "global_step": 22121, "epoch": 526} {"train_loss": -5.234855651855469, "global_step": 22122, "epoch": 526} {"train_loss": -5.325709342956543, "global_step": 22123, "epoch": 526} {"train_loss": -5.314770221710205, "global_step": 22124, "epoch": 526} {"train_loss": -5.3130998611450195, "global_step": 22125, "epoch": 526} {"train_loss": -5.237672805786133, "global_step": 22126, "epoch": 526} {"train_loss": -5.374362945556641, "global_step": 22127, "epoch": 526} {"train_loss": -5.239283084869385, "global_step": 22128, "epoch": 526} {"train_loss": -5.271302223205566, "global_step": 22129, "epoch": 526} {"train_loss": -5.411513328552246, "global_step": 22130, "epoch": 526} {"train_loss": -5.190058708190918, "global_step": 22131, "epoch": 526} {"train_loss": -5.18752384185791, "global_step": 22132, "epoch": 526} {"train_loss": -5.293962478637695, "global_step": 22133, "epoch": 526, "val_loss": 66526.0390625} {"train_loss": -5.428382873535156, "global_step": 22134, "epoch": 527} {"train_loss": -5.309826850891113, "global_step": 22135, "epoch": 527} {"train_loss": -5.351717948913574, "global_step": 22136, "epoch": 527} {"train_loss": -5.4523115158081055, "global_step": 22137, "epoch": 527} {"train_loss": -5.336749076843262, "global_step": 22138, "epoch": 527} {"train_loss": -5.364087104797363, "global_step": 22139, "epoch": 527} {"train_loss": -5.2641191482543945, "global_step": 22140, "epoch": 527} {"train_loss": -5.405130386352539, "global_step": 22141, "epoch": 527} {"train_loss": -5.413338661193848, "global_step": 22142, "epoch": 527} {"train_loss": -5.3332014083862305, "global_step": 22143, "epoch": 527} {"train_loss": -5.292580604553223, "global_step": 22144, "epoch": 527} {"train_loss": -5.327447891235352, "global_step": 22145, "epoch": 527} {"train_loss": -5.357897758483887, "global_step": 22146, "epoch": 527} {"train_loss": -5.3640546798706055, "global_step": 22147, "epoch": 527} {"train_loss": -5.172336578369141, "global_step": 22148, "epoch": 527} {"train_loss": -5.368501663208008, "global_step": 22149, "epoch": 527} {"train_loss": -5.301243782043457, "global_step": 22150, "epoch": 527} {"train_loss": -5.151001930236816, "global_step": 22151, "epoch": 527} {"train_loss": -5.422699451446533, "global_step": 22152, "epoch": 527} {"train_loss": -5.315346717834473, "global_step": 22153, "epoch": 527} {"train_loss": -5.25184965133667, "global_step": 22154, "epoch": 527} {"train_loss": -5.338352203369141, "global_step": 22155, "epoch": 527} {"train_loss": -5.420221328735352, "global_step": 22156, "epoch": 527} {"train_loss": -5.299814224243164, "global_step": 22157, "epoch": 527} {"train_loss": -5.158670425415039, "global_step": 22158, "epoch": 527} {"train_loss": -5.221726417541504, "global_step": 22159, "epoch": 527} {"train_loss": -5.377880096435547, "global_step": 22160, "epoch": 527} {"train_loss": -5.240633964538574, "global_step": 22161, "epoch": 527} {"train_loss": -5.401452541351318, "global_step": 22162, "epoch": 527} {"train_loss": -5.303656578063965, "global_step": 22163, "epoch": 527} {"train_loss": -5.30839729309082, "global_step": 22164, "epoch": 527} {"train_loss": -5.364048480987549, "global_step": 22165, "epoch": 527} {"train_loss": -5.35796594619751, "global_step": 22166, "epoch": 527} {"train_loss": -5.41396427154541, "global_step": 22167, "epoch": 527} {"train_loss": -5.3467254638671875, "global_step": 22168, "epoch": 527} {"train_loss": -5.332829475402832, "global_step": 22169, "epoch": 527} {"train_loss": -5.487645149230957, "global_step": 22170, "epoch": 527} {"train_loss": -5.1621270179748535, "global_step": 22171, "epoch": 527} {"train_loss": -5.367780685424805, "global_step": 22172, "epoch": 527} {"train_loss": -5.436838150024414, "global_step": 22173, "epoch": 527} {"train_loss": -5.332896709442139, "global_step": 22174, "epoch": 527} {"train_loss": -5.331236748468308, "global_step": 22175, "epoch": 527, "val_loss": 66265.296875} {"train_loss": -5.301098346710205, "global_step": 22176, "epoch": 528} {"train_loss": -5.37440299987793, "global_step": 22177, "epoch": 528} {"train_loss": -5.319329261779785, "global_step": 22178, "epoch": 528} {"train_loss": -5.259537220001221, "global_step": 22179, "epoch": 528} {"train_loss": -5.314813137054443, "global_step": 22180, "epoch": 528} {"train_loss": -5.10114860534668, "global_step": 22181, "epoch": 528} {"train_loss": -5.250136375427246, "global_step": 22182, "epoch": 528} {"train_loss": -5.367280006408691, "global_step": 22183, "epoch": 528} {"train_loss": -5.2832183837890625, "global_step": 22184, "epoch": 528} {"train_loss": -5.248327255249023, "global_step": 22185, "epoch": 528} {"train_loss": -5.305086135864258, "global_step": 22186, "epoch": 528} {"train_loss": -5.429701328277588, "global_step": 22187, "epoch": 528} {"train_loss": -5.304673194885254, "global_step": 22188, "epoch": 528} {"train_loss": -5.4117326736450195, "global_step": 22189, "epoch": 528} {"train_loss": -5.420066833496094, "global_step": 22190, "epoch": 528} {"train_loss": -5.322168350219727, "global_step": 22191, "epoch": 528} {"train_loss": -5.316524505615234, "global_step": 22192, "epoch": 528} {"train_loss": -5.265944480895996, "global_step": 22193, "epoch": 528} {"train_loss": -5.339530944824219, "global_step": 22194, "epoch": 528} {"train_loss": -5.404144763946533, "global_step": 22195, "epoch": 528} {"train_loss": -5.351316452026367, "global_step": 22196, "epoch": 528} {"train_loss": -5.243453025817871, "global_step": 22197, "epoch": 528} {"train_loss": -5.273789405822754, "global_step": 22198, "epoch": 528} {"train_loss": -5.310036659240723, "global_step": 22199, "epoch": 528} {"train_loss": -5.28515100479126, "global_step": 22200, "epoch": 528} {"train_loss": -5.282650947570801, "global_step": 22201, "epoch": 528} {"train_loss": -5.266374588012695, "global_step": 22202, "epoch": 528} {"train_loss": -5.392819404602051, "global_step": 22203, "epoch": 528} {"train_loss": -5.252209186553955, "global_step": 22204, "epoch": 528} {"train_loss": -5.467528343200684, "global_step": 22205, "epoch": 528} {"train_loss": -5.3610920906066895, "global_step": 22206, "epoch": 528} {"train_loss": -5.461248874664307, "global_step": 22207, "epoch": 528} {"train_loss": -5.241912364959717, "global_step": 22208, "epoch": 528} {"train_loss": -5.3257293701171875, "global_step": 22209, "epoch": 528} {"train_loss": -5.37727165222168, "global_step": 22210, "epoch": 528} {"train_loss": -5.291089057922363, "global_step": 22211, "epoch": 528} {"train_loss": -5.366689682006836, "global_step": 22212, "epoch": 528} {"train_loss": -5.344290256500244, "global_step": 22213, "epoch": 528} {"train_loss": -5.445357322692871, "global_step": 22214, "epoch": 528} {"train_loss": -5.44600772857666, "global_step": 22215, "epoch": 528} {"train_loss": -5.332901477813721, "global_step": 22216, "epoch": 528} {"train_loss": -5.328937280745733, "global_step": 22217, "epoch": 528, "val_loss": 66620.3359375} {"train_loss": -5.436210632324219, "global_step": 22218, "epoch": 529} {"train_loss": -5.328117847442627, "global_step": 22219, "epoch": 529} {"train_loss": -5.319328308105469, "global_step": 22220, "epoch": 529} {"train_loss": -5.301136016845703, "global_step": 22221, "epoch": 529} {"train_loss": -5.27171516418457, "global_step": 22222, "epoch": 529} {"train_loss": -5.234385013580322, "global_step": 22223, "epoch": 529} {"train_loss": -5.42223596572876, "global_step": 22224, "epoch": 529} {"train_loss": -5.370058059692383, "global_step": 22225, "epoch": 529} {"train_loss": -5.3833208084106445, "global_step": 22226, "epoch": 529} {"train_loss": -5.490273475646973, "global_step": 22227, "epoch": 529} {"train_loss": -5.354177474975586, "global_step": 22228, "epoch": 529} {"train_loss": -5.382424831390381, "global_step": 22229, "epoch": 529} {"train_loss": -5.294064998626709, "global_step": 22230, "epoch": 529} {"train_loss": -5.21571683883667, "global_step": 22231, "epoch": 529} {"train_loss": -5.4659881591796875, "global_step": 22232, "epoch": 529} {"train_loss": -5.295886516571045, "global_step": 22233, "epoch": 529} {"train_loss": -5.212257385253906, "global_step": 22234, "epoch": 529} {"train_loss": -5.386056900024414, "global_step": 22235, "epoch": 529} {"train_loss": -5.3353729248046875, "global_step": 22236, "epoch": 529} {"train_loss": -5.307511806488037, "global_step": 22237, "epoch": 529} {"train_loss": -5.281052589416504, "global_step": 22238, "epoch": 529} {"train_loss": -5.16656494140625, "global_step": 22239, "epoch": 529} {"train_loss": -5.338410377502441, "global_step": 22240, "epoch": 529} {"train_loss": -5.367923736572266, "global_step": 22241, "epoch": 529} {"train_loss": -5.355679512023926, "global_step": 22242, "epoch": 529} {"train_loss": -5.434145927429199, "global_step": 22243, "epoch": 529} {"train_loss": -5.353940486907959, "global_step": 22244, "epoch": 529} {"train_loss": -5.332701206207275, "global_step": 22245, "epoch": 529} {"train_loss": -5.269782066345215, "global_step": 22246, "epoch": 529} {"train_loss": -5.313852310180664, "global_step": 22247, "epoch": 529} {"train_loss": -5.284374237060547, "global_step": 22248, "epoch": 529} {"train_loss": -5.301662445068359, "global_step": 22249, "epoch": 529} {"train_loss": -5.203164100646973, "global_step": 22250, "epoch": 529} {"train_loss": -5.353640556335449, "global_step": 22251, "epoch": 529} {"train_loss": -5.240984916687012, "global_step": 22252, "epoch": 529} {"train_loss": -5.286399841308594, "global_step": 22253, "epoch": 529} {"train_loss": -5.270847320556641, "global_step": 22254, "epoch": 529} {"train_loss": -5.266855716705322, "global_step": 22255, "epoch": 529} {"train_loss": -5.422536849975586, "global_step": 22256, "epoch": 529} {"train_loss": -5.251081943511963, "global_step": 22257, "epoch": 529} {"train_loss": -5.264988899230957, "global_step": 22258, "epoch": 529} {"train_loss": -5.322876260394142, "global_step": 22259, "epoch": 529, "val_loss": 66497.3671875} {"train_loss": -5.402679443359375, "global_step": 22260, "epoch": 530} {"train_loss": -5.245383262634277, "global_step": 22261, "epoch": 530} {"train_loss": -5.360311508178711, "global_step": 22262, "epoch": 530} {"train_loss": -5.368167400360107, "global_step": 22263, "epoch": 530} {"train_loss": -5.400519371032715, "global_step": 22264, "epoch": 530} {"train_loss": -5.2313032150268555, "global_step": 22265, "epoch": 530} {"train_loss": -5.212017059326172, "global_step": 22266, "epoch": 530} {"train_loss": -5.263608932495117, "global_step": 22267, "epoch": 530} {"train_loss": -5.456250190734863, "global_step": 22268, "epoch": 530} {"train_loss": -5.282495498657227, "global_step": 22269, "epoch": 530} {"train_loss": -5.403120994567871, "global_step": 22270, "epoch": 530} {"train_loss": -5.25329065322876, "global_step": 22271, "epoch": 530} {"train_loss": -5.461236953735352, "global_step": 22272, "epoch": 530} {"train_loss": -5.33908748626709, "global_step": 22273, "epoch": 530} {"train_loss": -5.447488307952881, "global_step": 22274, "epoch": 530} {"train_loss": -5.455338954925537, "global_step": 22275, "epoch": 530} {"train_loss": -5.354480266571045, "global_step": 22276, "epoch": 530} {"train_loss": -5.352965831756592, "global_step": 22277, "epoch": 530} {"train_loss": -5.391228199005127, "global_step": 22278, "epoch": 530} {"train_loss": -5.355090141296387, "global_step": 22279, "epoch": 530} {"train_loss": -5.419068813323975, "global_step": 22280, "epoch": 530} {"train_loss": -5.380380630493164, "global_step": 22281, "epoch": 530} {"train_loss": -5.415773391723633, "global_step": 22282, "epoch": 530} {"train_loss": -5.167895317077637, "global_step": 22283, "epoch": 530} {"train_loss": -5.16769552230835, "global_step": 22284, "epoch": 530} {"train_loss": -5.361690998077393, "global_step": 22285, "epoch": 530} {"train_loss": -5.248308181762695, "global_step": 22286, "epoch": 530} {"train_loss": -5.377738952636719, "global_step": 22287, "epoch": 530} {"train_loss": -5.301619529724121, "global_step": 22288, "epoch": 530} {"train_loss": -5.332394599914551, "global_step": 22289, "epoch": 530} {"train_loss": -5.429854393005371, "global_step": 22290, "epoch": 530} {"train_loss": -5.301905155181885, "global_step": 22291, "epoch": 530} {"train_loss": -5.401613712310791, "global_step": 22292, "epoch": 530} {"train_loss": -5.1995439529418945, "global_step": 22293, "epoch": 530} {"train_loss": -5.417638778686523, "global_step": 22294, "epoch": 530} {"train_loss": -5.245030403137207, "global_step": 22295, "epoch": 530} {"train_loss": -5.3397536277771, "global_step": 22296, "epoch": 530} {"train_loss": -5.329113960266113, "global_step": 22297, "epoch": 530} {"train_loss": -5.295042037963867, "global_step": 22298, "epoch": 530} {"train_loss": -5.207090854644775, "global_step": 22299, "epoch": 530} {"train_loss": -5.19918155670166, "global_step": 22300, "epoch": 530} {"train_loss": -5.3294999940054755, "global_step": 22301, "epoch": 530, "val_loss": 67225.625} {"train_loss": -5.2362060546875, "global_step": 22302, "epoch": 531} {"train_loss": -5.218006610870361, "global_step": 22303, "epoch": 531} {"train_loss": -5.340803623199463, "global_step": 22304, "epoch": 531} {"train_loss": -5.382425308227539, "global_step": 22305, "epoch": 531} {"train_loss": -5.22652530670166, "global_step": 22306, "epoch": 531} {"train_loss": -5.216587066650391, "global_step": 22307, "epoch": 531} {"train_loss": -5.243642330169678, "global_step": 22308, "epoch": 531} {"train_loss": -5.210108757019043, "global_step": 22309, "epoch": 531} {"train_loss": -5.307003021240234, "global_step": 22310, "epoch": 531} {"train_loss": -5.372457504272461, "global_step": 22311, "epoch": 531} {"train_loss": -5.282933235168457, "global_step": 22312, "epoch": 531} {"train_loss": -5.323245048522949, "global_step": 22313, "epoch": 531} {"train_loss": -5.329638481140137, "global_step": 22314, "epoch": 531} {"train_loss": -5.356748104095459, "global_step": 22315, "epoch": 531} {"train_loss": -5.268637180328369, "global_step": 22316, "epoch": 531} {"train_loss": -5.363319396972656, "global_step": 22317, "epoch": 531} {"train_loss": -5.302491188049316, "global_step": 22318, "epoch": 531} {"train_loss": -5.388121604919434, "global_step": 22319, "epoch": 531} {"train_loss": -5.325984001159668, "global_step": 22320, "epoch": 531} {"train_loss": -5.415168762207031, "global_step": 22321, "epoch": 531} {"train_loss": -5.287209510803223, "global_step": 22322, "epoch": 531} {"train_loss": -5.425087928771973, "global_step": 22323, "epoch": 531} {"train_loss": -5.345007419586182, "global_step": 22324, "epoch": 531} {"train_loss": -5.406196117401123, "global_step": 22325, "epoch": 531} {"train_loss": -5.370227813720703, "global_step": 22326, "epoch": 531} {"train_loss": -5.306683540344238, "global_step": 22327, "epoch": 531} {"train_loss": -5.251598834991455, "global_step": 22328, "epoch": 531} {"train_loss": -5.337429523468018, "global_step": 22329, "epoch": 531} {"train_loss": -5.460063457489014, "global_step": 22330, "epoch": 531} {"train_loss": -5.486362457275391, "global_step": 22331, "epoch": 531} {"train_loss": -5.351215839385986, "global_step": 22332, "epoch": 531} {"train_loss": -5.341135025024414, "global_step": 22333, "epoch": 531} {"train_loss": -5.352219581604004, "global_step": 22334, "epoch": 531} {"train_loss": -5.372361183166504, "global_step": 22335, "epoch": 531} {"train_loss": -5.322486877441406, "global_step": 22336, "epoch": 531} {"train_loss": -5.333378791809082, "global_step": 22337, "epoch": 531} {"train_loss": -5.368803024291992, "global_step": 22338, "epoch": 531} {"train_loss": -5.445293426513672, "global_step": 22339, "epoch": 531} {"train_loss": -5.305779457092285, "global_step": 22340, "epoch": 531} {"train_loss": -5.395934104919434, "global_step": 22341, "epoch": 531} {"train_loss": -5.238564491271973, "global_step": 22342, "epoch": 531} {"train_loss": -5.337039050601778, "global_step": 22343, "epoch": 531, "val_loss": 66320.1640625} {"train_loss": -5.389464378356934, "global_step": 22344, "epoch": 532} {"train_loss": -5.251962661743164, "global_step": 22345, "epoch": 532} {"train_loss": -5.346240043640137, "global_step": 22346, "epoch": 532} {"train_loss": -5.517978668212891, "global_step": 22347, "epoch": 532} {"train_loss": -5.412152290344238, "global_step": 22348, "epoch": 532} {"train_loss": -5.389664173126221, "global_step": 22349, "epoch": 532} {"train_loss": -5.297567367553711, "global_step": 22350, "epoch": 532} {"train_loss": -5.3996992111206055, "global_step": 22351, "epoch": 532} {"train_loss": -5.542111396789551, "global_step": 22352, "epoch": 532} {"train_loss": -5.261897087097168, "global_step": 22353, "epoch": 532} {"train_loss": -5.418758869171143, "global_step": 22354, "epoch": 532} {"train_loss": -5.322315216064453, "global_step": 22355, "epoch": 532} {"train_loss": -5.359962463378906, "global_step": 22356, "epoch": 532} {"train_loss": -5.366502285003662, "global_step": 22357, "epoch": 532} {"train_loss": -5.410713195800781, "global_step": 22358, "epoch": 532} {"train_loss": -5.3220109939575195, "global_step": 22359, "epoch": 532} {"train_loss": -5.375307083129883, "global_step": 22360, "epoch": 532} {"train_loss": -5.300280570983887, "global_step": 22361, "epoch": 532} {"train_loss": -5.428118705749512, "global_step": 22362, "epoch": 532} {"train_loss": -5.436161518096924, "global_step": 22363, "epoch": 532} {"train_loss": -5.415600299835205, "global_step": 22364, "epoch": 532} {"train_loss": -5.392376899719238, "global_step": 22365, "epoch": 532} {"train_loss": -5.286351203918457, "global_step": 22366, "epoch": 532} {"train_loss": -5.338505744934082, "global_step": 22367, "epoch": 532} {"train_loss": -5.318059921264648, "global_step": 22368, "epoch": 532} {"train_loss": -5.3707990646362305, "global_step": 22369, "epoch": 532} {"train_loss": -5.342801570892334, "global_step": 22370, "epoch": 532} {"train_loss": -5.335056304931641, "global_step": 22371, "epoch": 532} {"train_loss": -5.407271385192871, "global_step": 22372, "epoch": 532} {"train_loss": -5.333303928375244, "global_step": 22373, "epoch": 532} {"train_loss": -5.4408040046691895, "global_step": 22374, "epoch": 532} {"train_loss": -5.388582706451416, "global_step": 22375, "epoch": 532} {"train_loss": -5.397540092468262, "global_step": 22376, "epoch": 532} {"train_loss": -5.490633487701416, "global_step": 22377, "epoch": 532} {"train_loss": -5.3265790939331055, "global_step": 22378, "epoch": 532} {"train_loss": -5.2548394203186035, "global_step": 22379, "epoch": 532} {"train_loss": -5.3119401931762695, "global_step": 22380, "epoch": 532} {"train_loss": -5.300383567810059, "global_step": 22381, "epoch": 532} {"train_loss": -5.317076683044434, "global_step": 22382, "epoch": 532} {"train_loss": -5.3201398849487305, "global_step": 22383, "epoch": 532} {"train_loss": -5.424180507659912, "global_step": 22384, "epoch": 532} {"train_loss": -5.368560915901547, "global_step": 22385, "epoch": 532, "val_loss": 66441.2421875} {"train_loss": -5.315661430358887, "global_step": 22386, "epoch": 533} {"train_loss": -5.172675132751465, "global_step": 22387, "epoch": 533} {"train_loss": -5.231428146362305, "global_step": 22388, "epoch": 533} {"train_loss": -5.288731575012207, "global_step": 22389, "epoch": 533} {"train_loss": -5.375264644622803, "global_step": 22390, "epoch": 533} {"train_loss": -5.289363384246826, "global_step": 22391, "epoch": 533} {"train_loss": -5.557966232299805, "global_step": 22392, "epoch": 533} {"train_loss": -5.47381591796875, "global_step": 22393, "epoch": 533} {"train_loss": -5.375374794006348, "global_step": 22394, "epoch": 533} {"train_loss": -5.437942981719971, "global_step": 22395, "epoch": 533} {"train_loss": -5.385225296020508, "global_step": 22396, "epoch": 533} {"train_loss": -5.182231903076172, "global_step": 22397, "epoch": 533} {"train_loss": -5.231388568878174, "global_step": 22398, "epoch": 533} {"train_loss": -5.42505407333374, "global_step": 22399, "epoch": 533} {"train_loss": -5.387768745422363, "global_step": 22400, "epoch": 533} {"train_loss": -5.300442695617676, "global_step": 22401, "epoch": 533} {"train_loss": -5.246093273162842, "global_step": 22402, "epoch": 533} {"train_loss": -5.401327610015869, "global_step": 22403, "epoch": 533} {"train_loss": -5.328092575073242, "global_step": 22404, "epoch": 533} {"train_loss": -5.270816326141357, "global_step": 22405, "epoch": 533} {"train_loss": -5.308349132537842, "global_step": 22406, "epoch": 533} {"train_loss": -5.365320682525635, "global_step": 22407, "epoch": 533} {"train_loss": -5.396457672119141, "global_step": 22408, "epoch": 533} {"train_loss": -5.235376834869385, "global_step": 22409, "epoch": 533} {"train_loss": -5.290783405303955, "global_step": 22410, "epoch": 533} {"train_loss": -5.201517105102539, "global_step": 22411, "epoch": 533} {"train_loss": -5.4315104484558105, "global_step": 22412, "epoch": 533} {"train_loss": -5.278017044067383, "global_step": 22413, "epoch": 533} {"train_loss": -5.246010780334473, "global_step": 22414, "epoch": 533} {"train_loss": -5.289013385772705, "global_step": 22415, "epoch": 533} {"train_loss": -5.3396711349487305, "global_step": 22416, "epoch": 533} {"train_loss": -5.359188079833984, "global_step": 22417, "epoch": 533} {"train_loss": -5.227547645568848, "global_step": 22418, "epoch": 533} {"train_loss": -5.318336009979248, "global_step": 22419, "epoch": 533} {"train_loss": -5.498926639556885, "global_step": 22420, "epoch": 533} {"train_loss": -5.2215471267700195, "global_step": 22421, "epoch": 533} {"train_loss": -5.491561412811279, "global_step": 22422, "epoch": 533} {"train_loss": -5.431427001953125, "global_step": 22423, "epoch": 533} {"train_loss": -5.26448917388916, "global_step": 22424, "epoch": 533} {"train_loss": -5.386111259460449, "global_step": 22425, "epoch": 533} {"train_loss": -5.404760360717773, "global_step": 22426, "epoch": 533} {"train_loss": -5.331935178665888, "global_step": 22427, "epoch": 533, "val_loss": 66178.984375} {"train_loss": -5.2643585205078125, "global_step": 22428, "epoch": 534} {"train_loss": -5.438558578491211, "global_step": 22429, "epoch": 534} {"train_loss": -5.328111171722412, "global_step": 22430, "epoch": 534} {"train_loss": -5.251717567443848, "global_step": 22431, "epoch": 534} {"train_loss": -5.304385662078857, "global_step": 22432, "epoch": 534} {"train_loss": -5.32054328918457, "global_step": 22433, "epoch": 534} {"train_loss": -5.148471832275391, "global_step": 22434, "epoch": 534} {"train_loss": -5.424142837524414, "global_step": 22435, "epoch": 534} {"train_loss": -5.248434066772461, "global_step": 22436, "epoch": 534} {"train_loss": -5.209166526794434, "global_step": 22437, "epoch": 534} {"train_loss": -5.366859436035156, "global_step": 22438, "epoch": 534} {"train_loss": -5.303102493286133, "global_step": 22439, "epoch": 534} {"train_loss": -5.311158180236816, "global_step": 22440, "epoch": 534} {"train_loss": -5.32703161239624, "global_step": 22441, "epoch": 534} {"train_loss": -5.251980781555176, "global_step": 22442, "epoch": 534} {"train_loss": -5.266890525817871, "global_step": 22443, "epoch": 534} {"train_loss": -5.306005477905273, "global_step": 22444, "epoch": 534} {"train_loss": -5.299023628234863, "global_step": 22445, "epoch": 534} {"train_loss": -5.4439239501953125, "global_step": 22446, "epoch": 534} {"train_loss": -5.257413864135742, "global_step": 22447, "epoch": 534} {"train_loss": -5.314676284790039, "global_step": 22448, "epoch": 534} {"train_loss": -5.392849922180176, "global_step": 22449, "epoch": 534} {"train_loss": -5.341869354248047, "global_step": 22450, "epoch": 534} {"train_loss": -5.420228958129883, "global_step": 22451, "epoch": 534} {"train_loss": -5.346371650695801, "global_step": 22452, "epoch": 534} {"train_loss": -5.357611656188965, "global_step": 22453, "epoch": 534} {"train_loss": -5.3930511474609375, "global_step": 22454, "epoch": 534} {"train_loss": -5.450716018676758, "global_step": 22455, "epoch": 534} {"train_loss": -5.3127546310424805, "global_step": 22456, "epoch": 534} {"train_loss": -5.421439170837402, "global_step": 22457, "epoch": 534} {"train_loss": -5.374242782592773, "global_step": 22458, "epoch": 534} {"train_loss": -5.424648284912109, "global_step": 22459, "epoch": 534} {"train_loss": -5.286601543426514, "global_step": 22460, "epoch": 534} {"train_loss": -5.392363548278809, "global_step": 22461, "epoch": 534} {"train_loss": -5.3856353759765625, "global_step": 22462, "epoch": 534} {"train_loss": -5.441058158874512, "global_step": 22463, "epoch": 534} {"train_loss": -5.326910018920898, "global_step": 22464, "epoch": 534} {"train_loss": -5.322512149810791, "global_step": 22465, "epoch": 534} {"train_loss": -5.367775917053223, "global_step": 22466, "epoch": 534} {"train_loss": -5.289096832275391, "global_step": 22467, "epoch": 534} {"train_loss": -5.228646278381348, "global_step": 22468, "epoch": 534} {"train_loss": -5.336025385629563, "global_step": 22469, "epoch": 534, "val_loss": 66980.5078125} {"train_loss": -5.201691627502441, "global_step": 22470, "epoch": 535} {"train_loss": -5.097333908081055, "global_step": 22471, "epoch": 535} {"train_loss": -5.380167484283447, "global_step": 22472, "epoch": 535} {"train_loss": -5.14491605758667, "global_step": 22473, "epoch": 535} {"train_loss": -5.2413330078125, "global_step": 22474, "epoch": 535} {"train_loss": -5.5116095542907715, "global_step": 22475, "epoch": 535} {"train_loss": -5.324590682983398, "global_step": 22476, "epoch": 535} {"train_loss": -5.358218193054199, "global_step": 22477, "epoch": 535} {"train_loss": -5.416298866271973, "global_step": 22478, "epoch": 535} {"train_loss": -5.365166187286377, "global_step": 22479, "epoch": 535} {"train_loss": -5.173396587371826, "global_step": 22480, "epoch": 535} {"train_loss": -5.3841118812561035, "global_step": 22481, "epoch": 535} {"train_loss": -5.371232032775879, "global_step": 22482, "epoch": 535} {"train_loss": -5.346125602722168, "global_step": 22483, "epoch": 535} {"train_loss": -5.350560188293457, "global_step": 22484, "epoch": 535} {"train_loss": -5.246894836425781, "global_step": 22485, "epoch": 535} {"train_loss": -5.461094379425049, "global_step": 22486, "epoch": 535} {"train_loss": -5.1992902755737305, "global_step": 22487, "epoch": 535} {"train_loss": -5.34788703918457, "global_step": 22488, "epoch": 535} {"train_loss": -5.418215751647949, "global_step": 22489, "epoch": 535} {"train_loss": -5.32017183303833, "global_step": 22490, "epoch": 535} {"train_loss": -5.370223045349121, "global_step": 22491, "epoch": 535} {"train_loss": -5.376038551330566, "global_step": 22492, "epoch": 535} {"train_loss": -5.276206016540527, "global_step": 22493, "epoch": 535} {"train_loss": -5.325145721435547, "global_step": 22494, "epoch": 535} {"train_loss": -5.369101524353027, "global_step": 22495, "epoch": 535} {"train_loss": -5.388962745666504, "global_step": 22496, "epoch": 535} {"train_loss": -5.30246639251709, "global_step": 22497, "epoch": 535} {"train_loss": -5.329327583312988, "global_step": 22498, "epoch": 535} {"train_loss": -5.407573699951172, "global_step": 22499, "epoch": 535} {"train_loss": -5.187108993530273, "global_step": 22500, "epoch": 535} {"train_loss": -5.288199424743652, "global_step": 22501, "epoch": 535} {"train_loss": -5.385641574859619, "global_step": 22502, "epoch": 535} {"train_loss": -5.282507419586182, "global_step": 22503, "epoch": 535} {"train_loss": -5.358536720275879, "global_step": 22504, "epoch": 535} {"train_loss": -5.254034042358398, "global_step": 22505, "epoch": 535} {"train_loss": -5.406333923339844, "global_step": 22506, "epoch": 535} {"train_loss": -5.322999000549316, "global_step": 22507, "epoch": 535} {"train_loss": -5.2768049240112305, "global_step": 22508, "epoch": 535} {"train_loss": -5.298301696777344, "global_step": 22509, "epoch": 535} {"train_loss": -5.345667839050293, "global_step": 22510, "epoch": 535} {"train_loss": -5.32128229595366, "global_step": 22511, "epoch": 535, "val_loss": 66344.2890625} {"train_loss": -5.440980911254883, "global_step": 22512, "epoch": 536} {"train_loss": -5.444606304168701, "global_step": 22513, "epoch": 536} {"train_loss": -5.287858486175537, "global_step": 22514, "epoch": 536} {"train_loss": -5.363886833190918, "global_step": 22515, "epoch": 536} {"train_loss": -5.486860275268555, "global_step": 22516, "epoch": 536} {"train_loss": -5.374515056610107, "global_step": 22517, "epoch": 536} {"train_loss": -5.338404655456543, "global_step": 22518, "epoch": 536} {"train_loss": -5.304585933685303, "global_step": 22519, "epoch": 536} {"train_loss": -5.376010894775391, "global_step": 22520, "epoch": 536} {"train_loss": -5.120418548583984, "global_step": 22521, "epoch": 536} {"train_loss": -5.293259143829346, "global_step": 22522, "epoch": 536} {"train_loss": -5.506935119628906, "global_step": 22523, "epoch": 536} {"train_loss": -5.368898391723633, "global_step": 22524, "epoch": 536} {"train_loss": -5.282320976257324, "global_step": 22525, "epoch": 536} {"train_loss": -5.459780693054199, "global_step": 22526, "epoch": 536} {"train_loss": -5.39324426651001, "global_step": 22527, "epoch": 536} {"train_loss": -5.482787609100342, "global_step": 22528, "epoch": 536} {"train_loss": -5.411595344543457, "global_step": 22529, "epoch": 536} {"train_loss": -5.2558417320251465, "global_step": 22530, "epoch": 536} {"train_loss": -5.381906986236572, "global_step": 22531, "epoch": 536} {"train_loss": -5.1881489753723145, "global_step": 22532, "epoch": 536} {"train_loss": -5.298437118530273, "global_step": 22533, "epoch": 536} {"train_loss": -5.43654727935791, "global_step": 22534, "epoch": 536} {"train_loss": -5.346927642822266, "global_step": 22535, "epoch": 536} {"train_loss": -5.423638343811035, "global_step": 22536, "epoch": 536} {"train_loss": -5.338716506958008, "global_step": 22537, "epoch": 536} {"train_loss": -5.231268882751465, "global_step": 22538, "epoch": 536} {"train_loss": -5.470134258270264, "global_step": 22539, "epoch": 536} {"train_loss": -5.244345664978027, "global_step": 22540, "epoch": 536} {"train_loss": -5.30451774597168, "global_step": 22541, "epoch": 536} {"train_loss": -5.52272891998291, "global_step": 22542, "epoch": 536} {"train_loss": -5.267691612243652, "global_step": 22543, "epoch": 536} {"train_loss": -5.3182268142700195, "global_step": 22544, "epoch": 536} {"train_loss": -5.307387351989746, "global_step": 22545, "epoch": 536} {"train_loss": -5.34445858001709, "global_step": 22546, "epoch": 536} {"train_loss": -5.355700492858887, "global_step": 22547, "epoch": 536} {"train_loss": -5.355930328369141, "global_step": 22548, "epoch": 536} {"train_loss": -5.25560998916626, "global_step": 22549, "epoch": 536} {"train_loss": -5.160802841186523, "global_step": 22550, "epoch": 536} {"train_loss": -5.507917404174805, "global_step": 22551, "epoch": 536} {"train_loss": -5.33300256729126, "global_step": 22552, "epoch": 536} {"train_loss": -5.351288295927501, "global_step": 22553, "epoch": 536, "val_loss": 66206.46875} {"train_loss": -5.367029666900635, "global_step": 22554, "epoch": 537} {"train_loss": -5.299768447875977, "global_step": 22555, "epoch": 537} {"train_loss": -5.368036270141602, "global_step": 22556, "epoch": 537} {"train_loss": -5.446006774902344, "global_step": 22557, "epoch": 537} {"train_loss": -5.286860942840576, "global_step": 22558, "epoch": 537} {"train_loss": -5.387117385864258, "global_step": 22559, "epoch": 537} {"train_loss": -5.449669361114502, "global_step": 22560, "epoch": 537} {"train_loss": -5.409173011779785, "global_step": 22561, "epoch": 537} {"train_loss": -5.313934326171875, "global_step": 22562, "epoch": 537} {"train_loss": -5.267718315124512, "global_step": 22563, "epoch": 537} {"train_loss": -5.414251327514648, "global_step": 22564, "epoch": 537} {"train_loss": -5.335676670074463, "global_step": 22565, "epoch": 537} {"train_loss": -5.373430252075195, "global_step": 22566, "epoch": 537} {"train_loss": -5.336004257202148, "global_step": 22567, "epoch": 537} {"train_loss": -5.364089012145996, "global_step": 22568, "epoch": 537} {"train_loss": -5.447912216186523, "global_step": 22569, "epoch": 537} {"train_loss": -5.330594062805176, "global_step": 22570, "epoch": 537} {"train_loss": -5.445232391357422, "global_step": 22571, "epoch": 537} {"train_loss": -5.404942989349365, "global_step": 22572, "epoch": 537} {"train_loss": -5.46199369430542, "global_step": 22573, "epoch": 537} {"train_loss": -5.453479290008545, "global_step": 22574, "epoch": 537} {"train_loss": -5.2709550857543945, "global_step": 22575, "epoch": 537} {"train_loss": -5.248788356781006, "global_step": 22576, "epoch": 537} {"train_loss": -5.271012783050537, "global_step": 22577, "epoch": 537} {"train_loss": -5.368032455444336, "global_step": 22578, "epoch": 537} {"train_loss": -5.412286758422852, "global_step": 22579, "epoch": 537} {"train_loss": -5.424614906311035, "global_step": 22580, "epoch": 537} {"train_loss": -5.3746442794799805, "global_step": 22581, "epoch": 537} {"train_loss": -5.342650413513184, "global_step": 22582, "epoch": 537} {"train_loss": -5.322081089019775, "global_step": 22583, "epoch": 537} {"train_loss": -5.344768524169922, "global_step": 22584, "epoch": 537} {"train_loss": -5.308625221252441, "global_step": 22585, "epoch": 537} {"train_loss": -5.282464981079102, "global_step": 22586, "epoch": 537} {"train_loss": -5.41520357131958, "global_step": 22587, "epoch": 537} {"train_loss": -5.360556602478027, "global_step": 22588, "epoch": 537} {"train_loss": -5.39469051361084, "global_step": 22589, "epoch": 537} {"train_loss": -5.522073745727539, "global_step": 22590, "epoch": 537} {"train_loss": -5.261565208435059, "global_step": 22591, "epoch": 537} {"train_loss": -5.275000095367432, "global_step": 22592, "epoch": 537} {"train_loss": -5.4471354484558105, "global_step": 22593, "epoch": 537} {"train_loss": -5.289405822753906, "global_step": 22594, "epoch": 537} {"train_loss": -5.361752510070801, "global_step": 22595, "epoch": 537, "val_loss": 66179.3515625} {"train_loss": -5.455705642700195, "global_step": 22596, "epoch": 538} {"train_loss": -5.344383239746094, "global_step": 22597, "epoch": 538} {"train_loss": -5.347273349761963, "global_step": 22598, "epoch": 538} {"train_loss": -5.374471664428711, "global_step": 22599, "epoch": 538} {"train_loss": -5.394585132598877, "global_step": 22600, "epoch": 538} {"train_loss": -5.418832778930664, "global_step": 22601, "epoch": 538} {"train_loss": -5.451105117797852, "global_step": 22602, "epoch": 538} {"train_loss": -5.359438419342041, "global_step": 22603, "epoch": 538} {"train_loss": -5.3078131675720215, "global_step": 22604, "epoch": 538} {"train_loss": -5.269753932952881, "global_step": 22605, "epoch": 538} {"train_loss": -5.360581398010254, "global_step": 22606, "epoch": 538} {"train_loss": -5.360927104949951, "global_step": 22607, "epoch": 538} {"train_loss": -5.198129653930664, "global_step": 22608, "epoch": 538} {"train_loss": -5.28690242767334, "global_step": 22609, "epoch": 538} {"train_loss": -5.341063499450684, "global_step": 22610, "epoch": 538} {"train_loss": -5.280511856079102, "global_step": 22611, "epoch": 538} {"train_loss": -5.186247825622559, "global_step": 22612, "epoch": 538} {"train_loss": -5.372993469238281, "global_step": 22613, "epoch": 538} {"train_loss": -5.247437477111816, "global_step": 22614, "epoch": 538} {"train_loss": -5.289083003997803, "global_step": 22615, "epoch": 538} {"train_loss": -5.371919631958008, "global_step": 22616, "epoch": 538} {"train_loss": -5.362100601196289, "global_step": 22617, "epoch": 538} {"train_loss": -5.303516387939453, "global_step": 22618, "epoch": 538} {"train_loss": -5.310909748077393, "global_step": 22619, "epoch": 538} {"train_loss": -5.411943435668945, "global_step": 22620, "epoch": 538} {"train_loss": -5.272091865539551, "global_step": 22621, "epoch": 538} {"train_loss": -5.3436126708984375, "global_step": 22622, "epoch": 538} {"train_loss": -5.426558494567871, "global_step": 22623, "epoch": 538} {"train_loss": -5.40537166595459, "global_step": 22624, "epoch": 538} {"train_loss": -5.390955924987793, "global_step": 22625, "epoch": 538} {"train_loss": -5.318437099456787, "global_step": 22626, "epoch": 538} {"train_loss": -5.191465377807617, "global_step": 22627, "epoch": 538} {"train_loss": -5.460600852966309, "global_step": 22628, "epoch": 538} {"train_loss": -5.317250728607178, "global_step": 22629, "epoch": 538} {"train_loss": -5.396597862243652, "global_step": 22630, "epoch": 538} {"train_loss": -5.466200828552246, "global_step": 22631, "epoch": 538} {"train_loss": -5.393318176269531, "global_step": 22632, "epoch": 538} {"train_loss": -5.24336051940918, "global_step": 22633, "epoch": 538} {"train_loss": -5.336504936218262, "global_step": 22634, "epoch": 538} {"train_loss": -5.311383247375488, "global_step": 22635, "epoch": 538} {"train_loss": -5.354820728302002, "global_step": 22636, "epoch": 538} {"train_loss": -5.3400726318359375, "global_step": 22637, "epoch": 538, "val_loss": 66049.421875} {"train_loss": -5.413468837738037, "global_step": 22638, "epoch": 539} {"train_loss": -5.400432109832764, "global_step": 22639, "epoch": 539} {"train_loss": -5.161746501922607, "global_step": 22640, "epoch": 539} {"train_loss": -5.3376054763793945, "global_step": 22641, "epoch": 539} {"train_loss": -5.419357776641846, "global_step": 22642, "epoch": 539} {"train_loss": -5.174570083618164, "global_step": 22643, "epoch": 539} {"train_loss": -5.368646144866943, "global_step": 22644, "epoch": 539} {"train_loss": -5.401268482208252, "global_step": 22645, "epoch": 539} {"train_loss": -5.3258957862854, "global_step": 22646, "epoch": 539} {"train_loss": -5.2337164878845215, "global_step": 22647, "epoch": 539} {"train_loss": -5.351574420928955, "global_step": 22648, "epoch": 539} {"train_loss": -5.36618709564209, "global_step": 22649, "epoch": 539} {"train_loss": -5.247341156005859, "global_step": 22650, "epoch": 539} {"train_loss": -5.3470587730407715, "global_step": 22651, "epoch": 539} {"train_loss": -5.288698196411133, "global_step": 22652, "epoch": 539} {"train_loss": -5.357240676879883, "global_step": 22653, "epoch": 539} {"train_loss": -5.228630065917969, "global_step": 22654, "epoch": 539} {"train_loss": -5.311104774475098, "global_step": 22655, "epoch": 539} {"train_loss": -5.3181843757629395, "global_step": 22656, "epoch": 539} {"train_loss": -5.3495025634765625, "global_step": 22657, "epoch": 539} {"train_loss": -5.337838649749756, "global_step": 22658, "epoch": 539} {"train_loss": -5.377274513244629, "global_step": 22659, "epoch": 539} {"train_loss": -5.409987449645996, "global_step": 22660, "epoch": 539} {"train_loss": -5.3875250816345215, "global_step": 22661, "epoch": 539} {"train_loss": -5.356681823730469, "global_step": 22662, "epoch": 539} {"train_loss": -5.267232418060303, "global_step": 22663, "epoch": 539} {"train_loss": -5.429412841796875, "global_step": 22664, "epoch": 539} {"train_loss": -5.332121849060059, "global_step": 22665, "epoch": 539} {"train_loss": -5.266944885253906, "global_step": 22666, "epoch": 539} {"train_loss": -5.373132705688477, "global_step": 22667, "epoch": 539} {"train_loss": -5.285261154174805, "global_step": 22668, "epoch": 539} {"train_loss": -5.280560493469238, "global_step": 22669, "epoch": 539} {"train_loss": -5.291991233825684, "global_step": 22670, "epoch": 539} {"train_loss": -5.307783126831055, "global_step": 22671, "epoch": 539} {"train_loss": -5.207295894622803, "global_step": 22672, "epoch": 539} {"train_loss": -5.421261310577393, "global_step": 22673, "epoch": 539} {"train_loss": -5.321563720703125, "global_step": 22674, "epoch": 539} {"train_loss": -5.25730037689209, "global_step": 22675, "epoch": 539} {"train_loss": -5.404356002807617, "global_step": 22676, "epoch": 539} {"train_loss": -5.360716819763184, "global_step": 22677, "epoch": 539} {"train_loss": -5.235548496246338, "global_step": 22678, "epoch": 539} {"train_loss": -5.3225053037915915, "global_step": 22679, "epoch": 539, "val_loss": 66485.453125} {"train_loss": -5.288410186767578, "global_step": 22680, "epoch": 540} {"train_loss": -5.333564281463623, "global_step": 22681, "epoch": 540} {"train_loss": -5.320775032043457, "global_step": 22682, "epoch": 540} {"train_loss": -5.308597564697266, "global_step": 22683, "epoch": 540} {"train_loss": -5.240999698638916, "global_step": 22684, "epoch": 540} {"train_loss": -5.329397201538086, "global_step": 22685, "epoch": 540} {"train_loss": -5.284818172454834, "global_step": 22686, "epoch": 540} {"train_loss": -5.187575340270996, "global_step": 22687, "epoch": 540} {"train_loss": -5.382566928863525, "global_step": 22688, "epoch": 540} {"train_loss": -5.405111312866211, "global_step": 22689, "epoch": 540} {"train_loss": -5.328122138977051, "global_step": 22690, "epoch": 540} {"train_loss": -5.362950325012207, "global_step": 22691, "epoch": 540} {"train_loss": -5.325568199157715, "global_step": 22692, "epoch": 540} {"train_loss": -5.3574018478393555, "global_step": 22693, "epoch": 540} {"train_loss": -5.456833362579346, "global_step": 22694, "epoch": 540} {"train_loss": -5.3092041015625, "global_step": 22695, "epoch": 540} {"train_loss": -5.433296203613281, "global_step": 22696, "epoch": 540} {"train_loss": -5.349701881408691, "global_step": 22697, "epoch": 540} {"train_loss": -5.441181182861328, "global_step": 22698, "epoch": 540} {"train_loss": -5.285804748535156, "global_step": 22699, "epoch": 540} {"train_loss": -5.295413494110107, "global_step": 22700, "epoch": 540} {"train_loss": -5.383781909942627, "global_step": 22701, "epoch": 540} {"train_loss": -5.314181327819824, "global_step": 22702, "epoch": 540} {"train_loss": -5.150407314300537, "global_step": 22703, "epoch": 540} {"train_loss": -5.370340347290039, "global_step": 22704, "epoch": 540} {"train_loss": -5.283994197845459, "global_step": 22705, "epoch": 540} {"train_loss": -5.153609752655029, "global_step": 22706, "epoch": 540} {"train_loss": -5.28435754776001, "global_step": 22707, "epoch": 540} {"train_loss": -5.300225257873535, "global_step": 22708, "epoch": 540} {"train_loss": -5.303627014160156, "global_step": 22709, "epoch": 540} {"train_loss": -5.385809898376465, "global_step": 22710, "epoch": 540} {"train_loss": -5.193462371826172, "global_step": 22711, "epoch": 540} {"train_loss": -5.376910209655762, "global_step": 22712, "epoch": 540} {"train_loss": -5.401029586791992, "global_step": 22713, "epoch": 540} {"train_loss": -5.224519729614258, "global_step": 22714, "epoch": 540} {"train_loss": -5.452798366546631, "global_step": 22715, "epoch": 540} {"train_loss": -5.308371543884277, "global_step": 22716, "epoch": 540} {"train_loss": -5.324636459350586, "global_step": 22717, "epoch": 540} {"train_loss": -5.377636432647705, "global_step": 22718, "epoch": 540} {"train_loss": -5.323427200317383, "global_step": 22719, "epoch": 540} {"train_loss": -5.4180755615234375, "global_step": 22720, "epoch": 540} {"train_loss": -5.322953190122332, "global_step": 22721, "epoch": 540, "val_loss": 66814.6953125} {"train_loss": -5.28762149810791, "global_step": 22722, "epoch": 541} {"train_loss": -5.346222400665283, "global_step": 22723, "epoch": 541} {"train_loss": -5.503986358642578, "global_step": 22724, "epoch": 541} {"train_loss": -5.183249473571777, "global_step": 22725, "epoch": 541} {"train_loss": -5.341455459594727, "global_step": 22726, "epoch": 541} {"train_loss": -5.336956024169922, "global_step": 22727, "epoch": 541} {"train_loss": -5.276296615600586, "global_step": 22728, "epoch": 541} {"train_loss": -5.302488327026367, "global_step": 22729, "epoch": 541} {"train_loss": -5.215081214904785, "global_step": 22730, "epoch": 541} {"train_loss": -5.2754011154174805, "global_step": 22731, "epoch": 541} {"train_loss": -5.434134483337402, "global_step": 22732, "epoch": 541} {"train_loss": -5.300416469573975, "global_step": 22733, "epoch": 541} {"train_loss": -5.326579570770264, "global_step": 22734, "epoch": 541} {"train_loss": -5.350441932678223, "global_step": 22735, "epoch": 541} {"train_loss": -5.459184646606445, "global_step": 22736, "epoch": 541} {"train_loss": -5.2800493240356445, "global_step": 22737, "epoch": 541} {"train_loss": -5.365311145782471, "global_step": 22738, "epoch": 541} {"train_loss": -5.43327522277832, "global_step": 22739, "epoch": 541} {"train_loss": -5.181897163391113, "global_step": 22740, "epoch": 541} {"train_loss": -5.338075637817383, "global_step": 22741, "epoch": 541} {"train_loss": -5.386574745178223, "global_step": 22742, "epoch": 541} {"train_loss": -5.419463157653809, "global_step": 22743, "epoch": 541} {"train_loss": -5.410900115966797, "global_step": 22744, "epoch": 541} {"train_loss": -5.361246109008789, "global_step": 22745, "epoch": 541} {"train_loss": -5.438838481903076, "global_step": 22746, "epoch": 541} {"train_loss": -5.3123979568481445, "global_step": 22747, "epoch": 541} {"train_loss": -5.307300090789795, "global_step": 22748, "epoch": 541} {"train_loss": -5.506990432739258, "global_step": 22749, "epoch": 541} {"train_loss": -5.357393264770508, "global_step": 22750, "epoch": 541} {"train_loss": -5.277983665466309, "global_step": 22751, "epoch": 541} {"train_loss": -5.330648422241211, "global_step": 22752, "epoch": 541} {"train_loss": -5.399364471435547, "global_step": 22753, "epoch": 541} {"train_loss": -5.175258636474609, "global_step": 22754, "epoch": 541} {"train_loss": -5.1444091796875, "global_step": 22755, "epoch": 541} {"train_loss": -5.517836570739746, "global_step": 22756, "epoch": 541} {"train_loss": -5.249792098999023, "global_step": 22757, "epoch": 541} {"train_loss": -5.249325752258301, "global_step": 22758, "epoch": 541} {"train_loss": -5.378929138183594, "global_step": 22759, "epoch": 541} {"train_loss": -5.305501461029053, "global_step": 22760, "epoch": 541} {"train_loss": -5.194843292236328, "global_step": 22761, "epoch": 541} {"train_loss": -5.415535926818848, "global_step": 22762, "epoch": 541} {"train_loss": -5.334755704516456, "global_step": 22763, "epoch": 541, "val_loss": 66699.84375} {"train_loss": -5.325301170349121, "global_step": 22764, "epoch": 542} {"train_loss": -5.397936820983887, "global_step": 22765, "epoch": 542} {"train_loss": -5.302105903625488, "global_step": 22766, "epoch": 542} {"train_loss": -5.384746551513672, "global_step": 22767, "epoch": 542} {"train_loss": -5.3880205154418945, "global_step": 22768, "epoch": 542} {"train_loss": -5.284360408782959, "global_step": 22769, "epoch": 542} {"train_loss": -5.371167182922363, "global_step": 22770, "epoch": 542} {"train_loss": -5.2429962158203125, "global_step": 22771, "epoch": 542} {"train_loss": -5.418416976928711, "global_step": 22772, "epoch": 542} {"train_loss": -5.196015357971191, "global_step": 22773, "epoch": 542} {"train_loss": -5.389898777008057, "global_step": 22774, "epoch": 542} {"train_loss": -5.295176982879639, "global_step": 22775, "epoch": 542} {"train_loss": -5.326243877410889, "global_step": 22776, "epoch": 542} {"train_loss": -5.342462539672852, "global_step": 22777, "epoch": 542} {"train_loss": -5.387822151184082, "global_step": 22778, "epoch": 542} {"train_loss": -5.335777759552002, "global_step": 22779, "epoch": 542} {"train_loss": -5.347252368927002, "global_step": 22780, "epoch": 542} {"train_loss": -5.352339744567871, "global_step": 22781, "epoch": 542} {"train_loss": -5.387411117553711, "global_step": 22782, "epoch": 542} {"train_loss": -5.45669412612915, "global_step": 22783, "epoch": 542} {"train_loss": -5.281416893005371, "global_step": 22784, "epoch": 542} {"train_loss": -5.153974533081055, "global_step": 22785, "epoch": 542} {"train_loss": -5.429229736328125, "global_step": 22786, "epoch": 542} {"train_loss": -5.399713516235352, "global_step": 22787, "epoch": 542} {"train_loss": -5.256299018859863, "global_step": 22788, "epoch": 542} {"train_loss": -5.249672889709473, "global_step": 22789, "epoch": 542} {"train_loss": -5.458714485168457, "global_step": 22790, "epoch": 542} {"train_loss": -5.305056095123291, "global_step": 22791, "epoch": 542} {"train_loss": -5.40377140045166, "global_step": 22792, "epoch": 542} {"train_loss": -5.354606628417969, "global_step": 22793, "epoch": 542} {"train_loss": -5.369601249694824, "global_step": 22794, "epoch": 542} {"train_loss": -5.334042549133301, "global_step": 22795, "epoch": 542} {"train_loss": -5.374998092651367, "global_step": 22796, "epoch": 542} {"train_loss": -5.307629585266113, "global_step": 22797, "epoch": 542} {"train_loss": -5.313851833343506, "global_step": 22798, "epoch": 542} {"train_loss": -5.279080390930176, "global_step": 22799, "epoch": 542} {"train_loss": -5.270421981811523, "global_step": 22800, "epoch": 542} {"train_loss": -5.379096031188965, "global_step": 22801, "epoch": 542} {"train_loss": -5.32127571105957, "global_step": 22802, "epoch": 542} {"train_loss": -5.230222702026367, "global_step": 22803, "epoch": 542} {"train_loss": -5.373263835906982, "global_step": 22804, "epoch": 542} {"train_loss": -5.337096373240153, "global_step": 22805, "epoch": 542, "val_loss": 66542.2734375} {"train_loss": -5.247827053070068, "global_step": 22806, "epoch": 543} {"train_loss": -5.389500617980957, "global_step": 22807, "epoch": 543} {"train_loss": -5.1564717292785645, "global_step": 22808, "epoch": 543} {"train_loss": -5.424059867858887, "global_step": 22809, "epoch": 543} {"train_loss": -5.362970352172852, "global_step": 22810, "epoch": 543} {"train_loss": -5.404059410095215, "global_step": 22811, "epoch": 543} {"train_loss": -5.364192008972168, "global_step": 22812, "epoch": 543} {"train_loss": -5.381916046142578, "global_step": 22813, "epoch": 543} {"train_loss": -5.290915489196777, "global_step": 22814, "epoch": 543} {"train_loss": -5.416085243225098, "global_step": 22815, "epoch": 543} {"train_loss": -5.375738620758057, "global_step": 22816, "epoch": 543} {"train_loss": -5.400241374969482, "global_step": 22817, "epoch": 543} {"train_loss": -5.30143404006958, "global_step": 22818, "epoch": 543} {"train_loss": -5.281791687011719, "global_step": 22819, "epoch": 543} {"train_loss": -5.342307090759277, "global_step": 22820, "epoch": 543} {"train_loss": -5.370595455169678, "global_step": 22821, "epoch": 543} {"train_loss": -5.4388108253479, "global_step": 22822, "epoch": 543} {"train_loss": -5.177781105041504, "global_step": 22823, "epoch": 543} {"train_loss": -5.36361026763916, "global_step": 22824, "epoch": 543} {"train_loss": -5.400657653808594, "global_step": 22825, "epoch": 543} {"train_loss": -5.36391019821167, "global_step": 22826, "epoch": 543} {"train_loss": -5.345682144165039, "global_step": 22827, "epoch": 543} {"train_loss": -5.407783508300781, "global_step": 22828, "epoch": 543} {"train_loss": -5.327579021453857, "global_step": 22829, "epoch": 543} {"train_loss": -5.360491752624512, "global_step": 22830, "epoch": 543} {"train_loss": -5.3995361328125, "global_step": 22831, "epoch": 543} {"train_loss": -5.361773490905762, "global_step": 22832, "epoch": 543} {"train_loss": -5.31606388092041, "global_step": 22833, "epoch": 543} {"train_loss": -5.341775894165039, "global_step": 22834, "epoch": 543} {"train_loss": -5.314265251159668, "global_step": 22835, "epoch": 543} {"train_loss": -5.39951753616333, "global_step": 22836, "epoch": 543} {"train_loss": -5.374355792999268, "global_step": 22837, "epoch": 543} {"train_loss": -5.265924453735352, "global_step": 22838, "epoch": 543} {"train_loss": -5.348719596862793, "global_step": 22839, "epoch": 543} {"train_loss": -5.497454643249512, "global_step": 22840, "epoch": 543} {"train_loss": -5.359172821044922, "global_step": 22841, "epoch": 543} {"train_loss": -5.46304988861084, "global_step": 22842, "epoch": 543} {"train_loss": -5.489319801330566, "global_step": 22843, "epoch": 543} {"train_loss": -5.446793556213379, "global_step": 22844, "epoch": 543} {"train_loss": -5.563236236572266, "global_step": 22845, "epoch": 543} {"train_loss": -5.275400161743164, "global_step": 22846, "epoch": 543} {"train_loss": -5.363839580899193, "global_step": 22847, "epoch": 543, "val_loss": 66294.015625} {"train_loss": -5.310343265533447, "global_step": 22848, "epoch": 544} {"train_loss": -5.486242294311523, "global_step": 22849, "epoch": 544} {"train_loss": -5.441370964050293, "global_step": 22850, "epoch": 544} {"train_loss": -5.320723533630371, "global_step": 22851, "epoch": 544} {"train_loss": -5.283700942993164, "global_step": 22852, "epoch": 544} {"train_loss": -5.2916412353515625, "global_step": 22853, "epoch": 544} {"train_loss": -5.272220611572266, "global_step": 22854, "epoch": 544} {"train_loss": -5.274903297424316, "global_step": 22855, "epoch": 544} {"train_loss": -5.3023505210876465, "global_step": 22856, "epoch": 544} {"train_loss": -5.319156169891357, "global_step": 22857, "epoch": 544} {"train_loss": -5.296124458312988, "global_step": 22858, "epoch": 544} {"train_loss": -5.35992956161499, "global_step": 22859, "epoch": 544} {"train_loss": -5.452155590057373, "global_step": 22860, "epoch": 544} {"train_loss": -5.315079689025879, "global_step": 22861, "epoch": 544} {"train_loss": -5.279951572418213, "global_step": 22862, "epoch": 544} {"train_loss": -5.377579689025879, "global_step": 22863, "epoch": 544} {"train_loss": -5.390005111694336, "global_step": 22864, "epoch": 544} {"train_loss": -5.298969745635986, "global_step": 22865, "epoch": 544} {"train_loss": -5.421289443969727, "global_step": 22866, "epoch": 544} {"train_loss": -5.39968729019165, "global_step": 22867, "epoch": 544} {"train_loss": -5.343550682067871, "global_step": 22868, "epoch": 544} {"train_loss": -5.252218723297119, "global_step": 22869, "epoch": 544} {"train_loss": -5.280374526977539, "global_step": 22870, "epoch": 544} {"train_loss": -5.320295810699463, "global_step": 22871, "epoch": 544} {"train_loss": -5.228486061096191, "global_step": 22872, "epoch": 544} {"train_loss": -5.123260021209717, "global_step": 22873, "epoch": 544} {"train_loss": -5.283847808837891, "global_step": 22874, "epoch": 544} {"train_loss": -5.12443208694458, "global_step": 22875, "epoch": 544} {"train_loss": -5.2975006103515625, "global_step": 22876, "epoch": 544} {"train_loss": -5.367067337036133, "global_step": 22877, "epoch": 544} {"train_loss": -5.3198561668396, "global_step": 22878, "epoch": 544} {"train_loss": -5.292040824890137, "global_step": 22879, "epoch": 544} {"train_loss": -5.4109086990356445, "global_step": 22880, "epoch": 544} {"train_loss": -5.312270164489746, "global_step": 22881, "epoch": 544} {"train_loss": -5.4306254386901855, "global_step": 22882, "epoch": 544} {"train_loss": -5.326994895935059, "global_step": 22883, "epoch": 544} {"train_loss": -5.312704086303711, "global_step": 22884, "epoch": 544} {"train_loss": -5.490909576416016, "global_step": 22885, "epoch": 544} {"train_loss": -5.323188781738281, "global_step": 22886, "epoch": 544} {"train_loss": -5.398968696594238, "global_step": 22887, "epoch": 544} {"train_loss": -5.211730480194092, "global_step": 22888, "epoch": 544} {"train_loss": -5.326798393612816, "global_step": 22889, "epoch": 544, "val_loss": 66116.2265625} {"train_loss": -5.397292137145996, "global_step": 22890, "epoch": 545} {"train_loss": -5.441139221191406, "global_step": 22891, "epoch": 545} {"train_loss": -5.39267635345459, "global_step": 22892, "epoch": 545} {"train_loss": -5.361113548278809, "global_step": 22893, "epoch": 545} {"train_loss": -5.419529438018799, "global_step": 22894, "epoch": 545} {"train_loss": -5.470721244812012, "global_step": 22895, "epoch": 545} {"train_loss": -5.268056392669678, "global_step": 22896, "epoch": 545} {"train_loss": -5.383151054382324, "global_step": 22897, "epoch": 545} {"train_loss": -5.326160430908203, "global_step": 22898, "epoch": 545} {"train_loss": -5.315868854522705, "global_step": 22899, "epoch": 545} {"train_loss": -5.530766487121582, "global_step": 22900, "epoch": 545} {"train_loss": -5.360536575317383, "global_step": 22901, "epoch": 545} {"train_loss": -5.3445234298706055, "global_step": 22902, "epoch": 545} {"train_loss": -5.140004634857178, "global_step": 22903, "epoch": 545} {"train_loss": -5.321364402770996, "global_step": 22904, "epoch": 545} {"train_loss": -5.333229064941406, "global_step": 22905, "epoch": 545} {"train_loss": -5.39663553237915, "global_step": 22906, "epoch": 545} {"train_loss": -5.430887222290039, "global_step": 22907, "epoch": 545} {"train_loss": -5.3203535079956055, "global_step": 22908, "epoch": 545} {"train_loss": -5.435429573059082, "global_step": 22909, "epoch": 545} {"train_loss": -5.274557590484619, "global_step": 22910, "epoch": 545} {"train_loss": -5.310544490814209, "global_step": 22911, "epoch": 545} {"train_loss": -5.31081485748291, "global_step": 22912, "epoch": 545} {"train_loss": -5.252274513244629, "global_step": 22913, "epoch": 545} {"train_loss": -5.2407073974609375, "global_step": 22914, "epoch": 545} {"train_loss": -5.413868427276611, "global_step": 22915, "epoch": 545} {"train_loss": -5.367218017578125, "global_step": 22916, "epoch": 545} {"train_loss": -5.358577728271484, "global_step": 22917, "epoch": 545} {"train_loss": -5.304726600646973, "global_step": 22918, "epoch": 545} {"train_loss": -5.354683876037598, "global_step": 22919, "epoch": 545} {"train_loss": -5.375021934509277, "global_step": 22920, "epoch": 545} {"train_loss": -5.219318866729736, "global_step": 22921, "epoch": 545} {"train_loss": -5.298863410949707, "global_step": 22922, "epoch": 545} {"train_loss": -5.47585391998291, "global_step": 22923, "epoch": 545} {"train_loss": -5.313057899475098, "global_step": 22924, "epoch": 545} {"train_loss": -5.190778732299805, "global_step": 22925, "epoch": 545} {"train_loss": -5.395071029663086, "global_step": 22926, "epoch": 545} {"train_loss": -5.313398838043213, "global_step": 22927, "epoch": 545} {"train_loss": -5.261666297912598, "global_step": 22928, "epoch": 545} {"train_loss": -5.31069278717041, "global_step": 22929, "epoch": 545} {"train_loss": -5.354722023010254, "global_step": 22930, "epoch": 545} {"train_loss": -5.33828634307498, "global_step": 22931, "epoch": 545, "val_loss": 66083.71875} {"train_loss": -5.272705554962158, "global_step": 22932, "epoch": 546} {"train_loss": -5.22567081451416, "global_step": 22933, "epoch": 546} {"train_loss": -5.346981048583984, "global_step": 22934, "epoch": 546} {"train_loss": -5.183230400085449, "global_step": 22935, "epoch": 546} {"train_loss": -5.320656776428223, "global_step": 22936, "epoch": 546} {"train_loss": -5.2365922927856445, "global_step": 22937, "epoch": 546} {"train_loss": -5.419767379760742, "global_step": 22938, "epoch": 546} {"train_loss": -5.161128520965576, "global_step": 22939, "epoch": 546} {"train_loss": -5.234993934631348, "global_step": 22940, "epoch": 546} {"train_loss": -5.344460487365723, "global_step": 22941, "epoch": 546} {"train_loss": -5.309880256652832, "global_step": 22942, "epoch": 546} {"train_loss": -5.300634384155273, "global_step": 22943, "epoch": 546} {"train_loss": -5.401611328125, "global_step": 22944, "epoch": 546} {"train_loss": -5.447333335876465, "global_step": 22945, "epoch": 546} {"train_loss": -5.270482063293457, "global_step": 22946, "epoch": 546} {"train_loss": -5.286508560180664, "global_step": 22947, "epoch": 546} {"train_loss": -5.391618251800537, "global_step": 22948, "epoch": 546} {"train_loss": -5.23878288269043, "global_step": 22949, "epoch": 546} {"train_loss": -5.300213813781738, "global_step": 22950, "epoch": 546} {"train_loss": -5.415897846221924, "global_step": 22951, "epoch": 546} {"train_loss": -5.277613639831543, "global_step": 22952, "epoch": 546} {"train_loss": -5.386646747589111, "global_step": 22953, "epoch": 546} {"train_loss": -5.283721923828125, "global_step": 22954, "epoch": 546} {"train_loss": -5.427236557006836, "global_step": 22955, "epoch": 546} {"train_loss": -5.298344135284424, "global_step": 22956, "epoch": 546} {"train_loss": -5.293635368347168, "global_step": 22957, "epoch": 546} {"train_loss": -5.34262752532959, "global_step": 22958, "epoch": 546} {"train_loss": -5.324366569519043, "global_step": 22959, "epoch": 546} {"train_loss": -5.300195693969727, "global_step": 22960, "epoch": 546} {"train_loss": -5.295027732849121, "global_step": 22961, "epoch": 546} {"train_loss": -5.285297870635986, "global_step": 22962, "epoch": 546} {"train_loss": -5.426786422729492, "global_step": 22963, "epoch": 546} {"train_loss": -5.364818572998047, "global_step": 22964, "epoch": 546} {"train_loss": -5.218142986297607, "global_step": 22965, "epoch": 546} {"train_loss": -5.420328140258789, "global_step": 22966, "epoch": 546} {"train_loss": -5.461403846740723, "global_step": 22967, "epoch": 546} {"train_loss": -5.412186145782471, "global_step": 22968, "epoch": 546} {"train_loss": -5.331028461456299, "global_step": 22969, "epoch": 546} {"train_loss": -5.362797260284424, "global_step": 22970, "epoch": 546} {"train_loss": -5.3025102615356445, "global_step": 22971, "epoch": 546} {"train_loss": -5.4902262687683105, "global_step": 22972, "epoch": 546} {"train_loss": -5.330146358126686, "global_step": 22973, "epoch": 546, "val_loss": 66330.453125} {"train_loss": -5.458068370819092, "global_step": 22974, "epoch": 547} {"train_loss": -5.4357500076293945, "global_step": 22975, "epoch": 547} {"train_loss": -5.262386322021484, "global_step": 22976, "epoch": 547} {"train_loss": -5.309737682342529, "global_step": 22977, "epoch": 547} {"train_loss": -5.33736515045166, "global_step": 22978, "epoch": 547} {"train_loss": -5.383244514465332, "global_step": 22979, "epoch": 547} {"train_loss": -5.204183578491211, "global_step": 22980, "epoch": 547} {"train_loss": -5.312027454376221, "global_step": 22981, "epoch": 547} {"train_loss": -5.44720458984375, "global_step": 22982, "epoch": 547} {"train_loss": -5.264827728271484, "global_step": 22983, "epoch": 547} {"train_loss": -5.314484596252441, "global_step": 22984, "epoch": 547} {"train_loss": -5.2057576179504395, "global_step": 22985, "epoch": 547} {"train_loss": -5.36107063293457, "global_step": 22986, "epoch": 547} {"train_loss": -5.323624610900879, "global_step": 22987, "epoch": 547} {"train_loss": -5.468326568603516, "global_step": 22988, "epoch": 547} {"train_loss": -5.167392730712891, "global_step": 22989, "epoch": 547} {"train_loss": -5.208216667175293, "global_step": 22990, "epoch": 547} {"train_loss": -5.28008508682251, "global_step": 22991, "epoch": 547} {"train_loss": -5.26387357711792, "global_step": 22992, "epoch": 547} {"train_loss": -5.2296552658081055, "global_step": 22993, "epoch": 547} {"train_loss": -5.210073947906494, "global_step": 22994, "epoch": 547} {"train_loss": -5.340301513671875, "global_step": 22995, "epoch": 547} {"train_loss": -5.452306270599365, "global_step": 22996, "epoch": 547} {"train_loss": -5.355252742767334, "global_step": 22997, "epoch": 547} {"train_loss": -5.202786445617676, "global_step": 22998, "epoch": 547} {"train_loss": -5.239811420440674, "global_step": 22999, "epoch": 547} {"train_loss": -5.338863372802734, "global_step": 23000, "epoch": 547} {"train_loss": -5.28231954574585, "global_step": 23001, "epoch": 547} {"train_loss": -5.376428127288818, "global_step": 23002, "epoch": 547} {"train_loss": -5.232748985290527, "global_step": 23003, "epoch": 547} {"train_loss": -5.319911003112793, "global_step": 23004, "epoch": 547} {"train_loss": -5.317055702209473, "global_step": 23005, "epoch": 547} {"train_loss": -5.41451358795166, "global_step": 23006, "epoch": 547} {"train_loss": -5.2433271408081055, "global_step": 23007, "epoch": 547} {"train_loss": -5.410857677459717, "global_step": 23008, "epoch": 547} {"train_loss": -5.3174896240234375, "global_step": 23009, "epoch": 547} {"train_loss": -5.351326942443848, "global_step": 23010, "epoch": 547} {"train_loss": -5.494190692901611, "global_step": 23011, "epoch": 547} {"train_loss": -5.4419450759887695, "global_step": 23012, "epoch": 547} {"train_loss": -5.367666244506836, "global_step": 23013, "epoch": 547} {"train_loss": -5.425347328186035, "global_step": 23014, "epoch": 547} {"train_loss": -5.328319878805251, "global_step": 23015, "epoch": 547, "val_loss": 66861.671875} {"train_loss": -5.275551795959473, "global_step": 23016, "epoch": 548} {"train_loss": -5.385897159576416, "global_step": 23017, "epoch": 548} {"train_loss": -5.326776504516602, "global_step": 23018, "epoch": 548} {"train_loss": -5.232128143310547, "global_step": 23019, "epoch": 548} {"train_loss": -5.215344429016113, "global_step": 23020, "epoch": 548} {"train_loss": -5.271755695343018, "global_step": 23021, "epoch": 548} {"train_loss": -5.4271650314331055, "global_step": 23022, "epoch": 548} {"train_loss": -5.426609039306641, "global_step": 23023, "epoch": 548} {"train_loss": -5.359626770019531, "global_step": 23024, "epoch": 548} {"train_loss": -5.147296905517578, "global_step": 23025, "epoch": 548} {"train_loss": -5.440456390380859, "global_step": 23026, "epoch": 548} {"train_loss": -5.2841057777404785, "global_step": 23027, "epoch": 548} {"train_loss": -5.281750202178955, "global_step": 23028, "epoch": 548} {"train_loss": -5.360905647277832, "global_step": 23029, "epoch": 548} {"train_loss": -5.443046569824219, "global_step": 23030, "epoch": 548} {"train_loss": -5.420345306396484, "global_step": 23031, "epoch": 548} {"train_loss": -5.256253242492676, "global_step": 23032, "epoch": 548} {"train_loss": -5.42244815826416, "global_step": 23033, "epoch": 548} {"train_loss": -5.325922966003418, "global_step": 23034, "epoch": 548} {"train_loss": -5.340527534484863, "global_step": 23035, "epoch": 548} {"train_loss": -5.607476711273193, "global_step": 23036, "epoch": 548} {"train_loss": -5.448361396789551, "global_step": 23037, "epoch": 548} {"train_loss": -5.353195667266846, "global_step": 23038, "epoch": 548} {"train_loss": -5.263733386993408, "global_step": 23039, "epoch": 548} {"train_loss": -5.387302398681641, "global_step": 23040, "epoch": 548} {"train_loss": -5.406669616699219, "global_step": 23041, "epoch": 548} {"train_loss": -5.381450176239014, "global_step": 23042, "epoch": 548} {"train_loss": -5.323644638061523, "global_step": 23043, "epoch": 548} {"train_loss": -5.27786922454834, "global_step": 23044, "epoch": 548} {"train_loss": -5.363845348358154, "global_step": 23045, "epoch": 548} {"train_loss": -5.44422721862793, "global_step": 23046, "epoch": 548} {"train_loss": -5.251862525939941, "global_step": 23047, "epoch": 548} {"train_loss": -5.289605140686035, "global_step": 23048, "epoch": 548} {"train_loss": -5.399328231811523, "global_step": 23049, "epoch": 548} {"train_loss": -5.3956475257873535, "global_step": 23050, "epoch": 548} {"train_loss": -5.371448040008545, "global_step": 23051, "epoch": 548} {"train_loss": -5.330127239227295, "global_step": 23052, "epoch": 548} {"train_loss": -5.318572521209717, "global_step": 23053, "epoch": 548} {"train_loss": -5.324594497680664, "global_step": 23054, "epoch": 548} {"train_loss": -5.505147457122803, "global_step": 23055, "epoch": 548} {"train_loss": -5.3188676834106445, "global_step": 23056, "epoch": 548} {"train_loss": -5.351189772288005, "global_step": 23057, "epoch": 548, "val_loss": 65742.3203125} {"train_loss": -5.507442474365234, "global_step": 23058, "epoch": 549} {"train_loss": -5.303434371948242, "global_step": 23059, "epoch": 549} {"train_loss": -5.480278015136719, "global_step": 23060, "epoch": 549} {"train_loss": -5.433627128601074, "global_step": 23061, "epoch": 549} {"train_loss": -5.244352340698242, "global_step": 23062, "epoch": 549} {"train_loss": -5.287900447845459, "global_step": 23063, "epoch": 549} {"train_loss": -5.085049629211426, "global_step": 23064, "epoch": 549} {"train_loss": -5.354746341705322, "global_step": 23065, "epoch": 549} {"train_loss": -5.247443675994873, "global_step": 23066, "epoch": 549} {"train_loss": -5.298915863037109, "global_step": 23067, "epoch": 549} {"train_loss": -5.216534614562988, "global_step": 23068, "epoch": 549} {"train_loss": -5.3599958419799805, "global_step": 23069, "epoch": 549} {"train_loss": -5.287264823913574, "global_step": 23070, "epoch": 549} {"train_loss": -5.285479545593262, "global_step": 23071, "epoch": 549} {"train_loss": -5.266087532043457, "global_step": 23072, "epoch": 549} {"train_loss": -5.260500907897949, "global_step": 23073, "epoch": 549} {"train_loss": -5.449753284454346, "global_step": 23074, "epoch": 549} {"train_loss": -5.241735935211182, "global_step": 23075, "epoch": 549} {"train_loss": -5.3934526443481445, "global_step": 23076, "epoch": 549} {"train_loss": -5.245646953582764, "global_step": 23077, "epoch": 549} {"train_loss": -5.381473541259766, "global_step": 23078, "epoch": 549} {"train_loss": -5.326986789703369, "global_step": 23079, "epoch": 549} {"train_loss": -5.201382637023926, "global_step": 23080, "epoch": 549} {"train_loss": -5.387571334838867, "global_step": 23081, "epoch": 549} {"train_loss": -5.368913650512695, "global_step": 23082, "epoch": 549} {"train_loss": -5.261746406555176, "global_step": 23083, "epoch": 549} {"train_loss": -5.249145030975342, "global_step": 23084, "epoch": 549} {"train_loss": -5.336495399475098, "global_step": 23085, "epoch": 549} {"train_loss": -5.334054946899414, "global_step": 23086, "epoch": 549} {"train_loss": -5.267429351806641, "global_step": 23087, "epoch": 549} {"train_loss": -5.294209003448486, "global_step": 23088, "epoch": 549} {"train_loss": -5.373744010925293, "global_step": 23089, "epoch": 549} {"train_loss": -5.2920966148376465, "global_step": 23090, "epoch": 549} {"train_loss": -5.501262187957764, "global_step": 23091, "epoch": 549} {"train_loss": -5.380058288574219, "global_step": 23092, "epoch": 549} {"train_loss": -5.305751323699951, "global_step": 23093, "epoch": 549} {"train_loss": -5.318305015563965, "global_step": 23094, "epoch": 549} {"train_loss": -5.3448991775512695, "global_step": 23095, "epoch": 549} {"train_loss": -5.329896926879883, "global_step": 23096, "epoch": 549} {"train_loss": -5.235465049743652, "global_step": 23097, "epoch": 549} {"train_loss": -5.375894546508789, "global_step": 23098, "epoch": 549} {"train_loss": -5.3217022986639115, "global_step": 23099, "epoch": 549, "val_loss": 66087.984375} {"train_loss": -5.286470413208008, "global_step": 23100, "epoch": 550} {"train_loss": -5.187281131744385, "global_step": 23101, "epoch": 550} {"train_loss": -5.36555290222168, "global_step": 23102, "epoch": 550} {"train_loss": -5.277320861816406, "global_step": 23103, "epoch": 550} {"train_loss": -5.329836845397949, "global_step": 23104, "epoch": 550} {"train_loss": -5.430861473083496, "global_step": 23105, "epoch": 550} {"train_loss": -5.285589694976807, "global_step": 23106, "epoch": 550} {"train_loss": -5.162354469299316, "global_step": 23107, "epoch": 550} {"train_loss": -5.314615726470947, "global_step": 23108, "epoch": 550} {"train_loss": -5.197384357452393, "global_step": 23109, "epoch": 550} {"train_loss": -5.199954509735107, "global_step": 23110, "epoch": 550} {"train_loss": -5.299180030822754, "global_step": 23111, "epoch": 550} {"train_loss": -5.199879169464111, "global_step": 23112, "epoch": 550} {"train_loss": -5.295751571655273, "global_step": 23113, "epoch": 550} {"train_loss": -5.334016799926758, "global_step": 23114, "epoch": 550} {"train_loss": -5.197804927825928, "global_step": 23115, "epoch": 550} {"train_loss": -5.38239860534668, "global_step": 23116, "epoch": 550} {"train_loss": -5.194478511810303, "global_step": 23117, "epoch": 550} {"train_loss": -5.263424873352051, "global_step": 23118, "epoch": 550} {"train_loss": -5.2397661209106445, "global_step": 23119, "epoch": 550} {"train_loss": -5.412628173828125, "global_step": 23120, "epoch": 550} {"train_loss": -5.3175530433654785, "global_step": 23121, "epoch": 550} {"train_loss": -5.370701789855957, "global_step": 23122, "epoch": 550} {"train_loss": -5.1786627769470215, "global_step": 23123, "epoch": 550} {"train_loss": -5.274754524230957, "global_step": 23124, "epoch": 550} {"train_loss": -5.4022088050842285, "global_step": 23125, "epoch": 550} {"train_loss": -5.28369140625, "global_step": 23126, "epoch": 550} {"train_loss": -5.2884650230407715, "global_step": 23127, "epoch": 550} {"train_loss": -5.221898555755615, "global_step": 23128, "epoch": 550} {"train_loss": -5.461174964904785, "global_step": 23129, "epoch": 550} {"train_loss": -5.46840763092041, "global_step": 23130, "epoch": 550} {"train_loss": -5.170103073120117, "global_step": 23131, "epoch": 550} {"train_loss": -5.328217029571533, "global_step": 23132, "epoch": 550} {"train_loss": -5.473904132843018, "global_step": 23133, "epoch": 550} {"train_loss": -5.157575607299805, "global_step": 23134, "epoch": 550} {"train_loss": -5.401371002197266, "global_step": 23135, "epoch": 550} {"train_loss": -5.330726146697998, "global_step": 23136, "epoch": 550} {"train_loss": -5.3287224769592285, "global_step": 23137, "epoch": 550} {"train_loss": -5.277649879455566, "global_step": 23138, "epoch": 550} {"train_loss": -5.361277103424072, "global_step": 23139, "epoch": 550} {"train_loss": -5.386629104614258, "global_step": 23140, "epoch": 550} {"train_loss": -5.303874697004046, "global_step": 23141, "epoch": 550, "train/sim_max_reward_0": 0.3242187732536867, "train/sim_max_reward_1": 0.2539109829969636, "train/sim_max_reward_2": 0.12107727543753007, "train/sim_max_reward_3": 0.20560200581998833, "train/sim_max_reward_4": 0.28014560695573903, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.0, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.27937153809368176, "test/sim_max_reward_4300004": 0.12898200459825743, "test/sim_max_reward_4300005": 0.6579870489806159, "test/sim_max_reward_4300006": 0.017356841766926354, "test/sim_max_reward_4300007": 0.045127646075307386, "test/sim_max_reward_4300008": 0.7872920567839088, "test/sim_max_reward_4300009": 0.5585037248074946, "test/sim_max_reward_4300010": 0.1644747105253395, "test/sim_max_reward_4300011": 0.3441929812777999, "test/sim_max_reward_4300012": 0.6880630555370679, "test/sim_max_reward_4300013": 0.3309570131974975, "test/sim_max_reward_4300014": 0.7302918971457923, "test/sim_max_reward_4300015": 0.22434380981056135, "test/sim_max_reward_4300016": 0.43991770777672473, "test/sim_max_reward_4300017": 0.19979935123743434, "test/sim_max_reward_4300018": 0.6299354269911813, "test/sim_max_reward_4300019": 0.18561635007374946, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.43809573863447443, "test/sim_max_reward_4300022": 0.21771512263947854, "test/sim_max_reward_4300023": 0.2057529789273333, "test/sim_max_reward_4300024": 0.15667214530015655, "test/sim_max_reward_4300025": 0.3226153832150274, "test/sim_max_reward_4300026": 0.6471065999039903, "test/sim_max_reward_4300027": 0.6072571712246848, "test/sim_max_reward_4300028": 0.000462342666379851, "test/sim_max_reward_4300029": 0.4158118436429497, "test/sim_max_reward_4300030": 0.6294738224285802, "test/sim_max_reward_4300031": 0.0, "test/sim_max_reward_4300032": 0.575792945019948, "test/sim_max_reward_4300033": 0.31060138928363556, "test/sim_max_reward_4300034": 0.3496052249838678, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.7117570740252275, "test/sim_max_reward_4300038": 0.5443205837934887, "test/sim_max_reward_4300039": 0.8182690531307566, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.1468798120308548, "test/sim_max_reward_4300042": 0.3237743702534597, "test/sim_max_reward_4300043": 0.10852054139245296, "test/sim_max_reward_4300044": 0.8341078274237755, "test/sim_max_reward_4300045": 0.27572507192470974, "test/sim_max_reward_4300046": 0.0, "test/sim_max_reward_4300047": 0.08948637990958103, "test/sim_max_reward_4300048": 0.019976638649722385, "test/sim_max_reward_4300049": 0.4509461320553569, "train/mean_score": 0.22965656730434916, "test/mean_score": 0.31972339678387895, "val_loss": 66176.875} {"train_loss": -5.330634117126465, "global_step": 23142, "epoch": 551} {"train_loss": -5.246528625488281, "global_step": 23143, "epoch": 551} {"train_loss": -5.353592872619629, "global_step": 23144, "epoch": 551} {"train_loss": -5.362874507904053, "global_step": 23145, "epoch": 551} {"train_loss": -5.468254566192627, "global_step": 23146, "epoch": 551} {"train_loss": -5.4442033767700195, "global_step": 23147, "epoch": 551} {"train_loss": -5.372773170471191, "global_step": 23148, "epoch": 551} {"train_loss": -5.307528495788574, "global_step": 23149, "epoch": 551} {"train_loss": -5.3352437019348145, "global_step": 23150, "epoch": 551} {"train_loss": -5.3249688148498535, "global_step": 23151, "epoch": 551} {"train_loss": -5.301102638244629, "global_step": 23152, "epoch": 551} {"train_loss": -5.302147388458252, "global_step": 23153, "epoch": 551} {"train_loss": -5.364381790161133, "global_step": 23154, "epoch": 551} {"train_loss": -5.369123935699463, "global_step": 23155, "epoch": 551} {"train_loss": -5.381618022918701, "global_step": 23156, "epoch": 551} {"train_loss": -5.3157548904418945, "global_step": 23157, "epoch": 551} {"train_loss": -5.380588531494141, "global_step": 23158, "epoch": 551} {"train_loss": -5.25830078125, "global_step": 23159, "epoch": 551} {"train_loss": -5.384194850921631, "global_step": 23160, "epoch": 551} {"train_loss": -5.293696880340576, "global_step": 23161, "epoch": 551} {"train_loss": -5.347447872161865, "global_step": 23162, "epoch": 551} {"train_loss": -5.431681156158447, "global_step": 23163, "epoch": 551} {"train_loss": -5.336414337158203, "global_step": 23164, "epoch": 551} {"train_loss": -5.358712196350098, "global_step": 23165, "epoch": 551} {"train_loss": -5.387673854827881, "global_step": 23166, "epoch": 551} {"train_loss": -5.314659118652344, "global_step": 23167, "epoch": 551} {"train_loss": -5.426191329956055, "global_step": 23168, "epoch": 551} {"train_loss": -5.44643497467041, "global_step": 23169, "epoch": 551} {"train_loss": -5.172266006469727, "global_step": 23170, "epoch": 551} {"train_loss": -5.342659950256348, "global_step": 23171, "epoch": 551} {"train_loss": -5.371574401855469, "global_step": 23172, "epoch": 551} {"train_loss": -5.356238842010498, "global_step": 23173, "epoch": 551} {"train_loss": -5.168961048126221, "global_step": 23174, "epoch": 551} {"train_loss": -5.288718223571777, "global_step": 23175, "epoch": 551} {"train_loss": -5.262495040893555, "global_step": 23176, "epoch": 551} {"train_loss": -5.145041465759277, "global_step": 23177, "epoch": 551} {"train_loss": -5.2173051834106445, "global_step": 23178, "epoch": 551} {"train_loss": -5.219513893127441, "global_step": 23179, "epoch": 551} {"train_loss": -5.246741771697998, "global_step": 23180, "epoch": 551} {"train_loss": -5.4147257804870605, "global_step": 23181, "epoch": 551} {"train_loss": -5.203790664672852, "global_step": 23182, "epoch": 551} {"train_loss": -5.322839998063587, "global_step": 23183, "epoch": 551, "val_loss": 66718.6015625} {"train_loss": -5.354025363922119, "global_step": 23184, "epoch": 552} {"train_loss": -5.176161766052246, "global_step": 23185, "epoch": 552} {"train_loss": -5.365731716156006, "global_step": 23186, "epoch": 552} {"train_loss": -5.125787734985352, "global_step": 23187, "epoch": 552} {"train_loss": -5.37337589263916, "global_step": 23188, "epoch": 552} {"train_loss": -5.346994876861572, "global_step": 23189, "epoch": 552} {"train_loss": -5.247540473937988, "global_step": 23190, "epoch": 552} {"train_loss": -5.435196876525879, "global_step": 23191, "epoch": 552} {"train_loss": -5.284041404724121, "global_step": 23192, "epoch": 552} {"train_loss": -5.13801383972168, "global_step": 23193, "epoch": 552} {"train_loss": -5.2146124839782715, "global_step": 23194, "epoch": 552} {"train_loss": -5.347002983093262, "global_step": 23195, "epoch": 552} {"train_loss": -5.1821184158325195, "global_step": 23196, "epoch": 552} {"train_loss": -5.3833723068237305, "global_step": 23197, "epoch": 552} {"train_loss": -5.318985939025879, "global_step": 23198, "epoch": 552} {"train_loss": -5.26200008392334, "global_step": 23199, "epoch": 552} {"train_loss": -5.287570953369141, "global_step": 23200, "epoch": 552} {"train_loss": -5.211377143859863, "global_step": 23201, "epoch": 552} {"train_loss": -5.373323440551758, "global_step": 23202, "epoch": 552} {"train_loss": -5.307489395141602, "global_step": 23203, "epoch": 552} {"train_loss": -5.341096878051758, "global_step": 23204, "epoch": 552} {"train_loss": -5.325007915496826, "global_step": 23205, "epoch": 552} {"train_loss": -5.40372371673584, "global_step": 23206, "epoch": 552} {"train_loss": -5.372509956359863, "global_step": 23207, "epoch": 552} {"train_loss": -5.262331008911133, "global_step": 23208, "epoch": 552} {"train_loss": -5.485511302947998, "global_step": 23209, "epoch": 552} {"train_loss": -5.2674736976623535, "global_step": 23210, "epoch": 552} {"train_loss": -5.347543716430664, "global_step": 23211, "epoch": 552} {"train_loss": -5.463222026824951, "global_step": 23212, "epoch": 552} {"train_loss": -5.213567733764648, "global_step": 23213, "epoch": 552} {"train_loss": -5.380038261413574, "global_step": 23214, "epoch": 552} {"train_loss": -5.3394083976745605, "global_step": 23215, "epoch": 552} {"train_loss": -5.304346561431885, "global_step": 23216, "epoch": 552} {"train_loss": -5.4111008644104, "global_step": 23217, "epoch": 552} {"train_loss": -5.344588279724121, "global_step": 23218, "epoch": 552} {"train_loss": -5.390027046203613, "global_step": 23219, "epoch": 552} {"train_loss": -5.466987609863281, "global_step": 23220, "epoch": 552} {"train_loss": -5.255516052246094, "global_step": 23221, "epoch": 552} {"train_loss": -5.4440460205078125, "global_step": 23222, "epoch": 552} {"train_loss": -5.445334434509277, "global_step": 23223, "epoch": 552} {"train_loss": -5.325450897216797, "global_step": 23224, "epoch": 552} {"train_loss": -5.326773677553449, "global_step": 23225, "epoch": 552, "val_loss": 66420.59375} {"train_loss": -5.350688934326172, "global_step": 23226, "epoch": 553} {"train_loss": -5.268617630004883, "global_step": 23227, "epoch": 553} {"train_loss": -5.451617240905762, "global_step": 23228, "epoch": 553} {"train_loss": -5.388973712921143, "global_step": 23229, "epoch": 553} {"train_loss": -5.365010738372803, "global_step": 23230, "epoch": 553} {"train_loss": -5.36517333984375, "global_step": 23231, "epoch": 553} {"train_loss": -5.513428211212158, "global_step": 23232, "epoch": 553} {"train_loss": -5.284763336181641, "global_step": 23233, "epoch": 553} {"train_loss": -5.376766681671143, "global_step": 23234, "epoch": 553} {"train_loss": -5.4293646812438965, "global_step": 23235, "epoch": 553} {"train_loss": -5.3816118240356445, "global_step": 23236, "epoch": 553} {"train_loss": -5.216558933258057, "global_step": 23237, "epoch": 553} {"train_loss": -5.32661771774292, "global_step": 23238, "epoch": 553} {"train_loss": -5.355191230773926, "global_step": 23239, "epoch": 553} {"train_loss": -5.259453773498535, "global_step": 23240, "epoch": 553} {"train_loss": -5.321305274963379, "global_step": 23241, "epoch": 553} {"train_loss": -5.27625846862793, "global_step": 23242, "epoch": 553} {"train_loss": -5.290987491607666, "global_step": 23243, "epoch": 553} {"train_loss": -5.254665374755859, "global_step": 23244, "epoch": 553} {"train_loss": -5.214662551879883, "global_step": 23245, "epoch": 553} {"train_loss": -5.260542869567871, "global_step": 23246, "epoch": 553} {"train_loss": -5.212491989135742, "global_step": 23247, "epoch": 553} {"train_loss": -5.194501876831055, "global_step": 23248, "epoch": 553} {"train_loss": -5.407972812652588, "global_step": 23249, "epoch": 553} {"train_loss": -5.156922817230225, "global_step": 23250, "epoch": 553} {"train_loss": -5.311641693115234, "global_step": 23251, "epoch": 553} {"train_loss": -5.344579696655273, "global_step": 23252, "epoch": 553} {"train_loss": -5.29774284362793, "global_step": 23253, "epoch": 553} {"train_loss": -5.465908527374268, "global_step": 23254, "epoch": 553} {"train_loss": -5.260279178619385, "global_step": 23255, "epoch": 553} {"train_loss": -5.440826416015625, "global_step": 23256, "epoch": 553} {"train_loss": -5.235585689544678, "global_step": 23257, "epoch": 553} {"train_loss": -5.353403568267822, "global_step": 23258, "epoch": 553} {"train_loss": -5.369890213012695, "global_step": 23259, "epoch": 553} {"train_loss": -5.32138729095459, "global_step": 23260, "epoch": 553} {"train_loss": -5.329807281494141, "global_step": 23261, "epoch": 553} {"train_loss": -5.358724117279053, "global_step": 23262, "epoch": 553} {"train_loss": -5.410378932952881, "global_step": 23263, "epoch": 553} {"train_loss": -5.460243225097656, "global_step": 23264, "epoch": 553} {"train_loss": -5.331159591674805, "global_step": 23265, "epoch": 553} {"train_loss": -5.3739728927612305, "global_step": 23266, "epoch": 553} {"train_loss": -5.329096078872681, "global_step": 23267, "epoch": 553, "val_loss": 66051.3359375} {"train_loss": -5.4115190505981445, "global_step": 23268, "epoch": 554} {"train_loss": -5.40372371673584, "global_step": 23269, "epoch": 554} {"train_loss": -5.377734184265137, "global_step": 23270, "epoch": 554} {"train_loss": -5.332943916320801, "global_step": 23271, "epoch": 554} {"train_loss": -5.297203063964844, "global_step": 23272, "epoch": 554} {"train_loss": -5.288922309875488, "global_step": 23273, "epoch": 554} {"train_loss": -5.460001468658447, "global_step": 23274, "epoch": 554} {"train_loss": -5.220619201660156, "global_step": 23275, "epoch": 554} {"train_loss": -5.340334892272949, "global_step": 23276, "epoch": 554} {"train_loss": -5.501980304718018, "global_step": 23277, "epoch": 554} {"train_loss": -5.114989280700684, "global_step": 23278, "epoch": 554} {"train_loss": -5.39546537399292, "global_step": 23279, "epoch": 554} {"train_loss": -5.266356945037842, "global_step": 23280, "epoch": 554} {"train_loss": -5.14445686340332, "global_step": 23281, "epoch": 554} {"train_loss": -5.36917781829834, "global_step": 23282, "epoch": 554} {"train_loss": -5.24415397644043, "global_step": 23283, "epoch": 554} {"train_loss": -5.354123115539551, "global_step": 23284, "epoch": 554} {"train_loss": -5.340437412261963, "global_step": 23285, "epoch": 554} {"train_loss": -5.262197017669678, "global_step": 23286, "epoch": 554} {"train_loss": -5.290970802307129, "global_step": 23287, "epoch": 554} {"train_loss": -5.351005554199219, "global_step": 23288, "epoch": 554} {"train_loss": -5.22089958190918, "global_step": 23289, "epoch": 554} {"train_loss": -5.438523292541504, "global_step": 23290, "epoch": 554} {"train_loss": -5.336115837097168, "global_step": 23291, "epoch": 554} {"train_loss": -5.339010238647461, "global_step": 23292, "epoch": 554} {"train_loss": -5.277454376220703, "global_step": 23293, "epoch": 554} {"train_loss": -5.139644145965576, "global_step": 23294, "epoch": 554} {"train_loss": -5.265734672546387, "global_step": 23295, "epoch": 554} {"train_loss": -5.309784889221191, "global_step": 23296, "epoch": 554} {"train_loss": -5.314446449279785, "global_step": 23297, "epoch": 554} {"train_loss": -5.337222099304199, "global_step": 23298, "epoch": 554} {"train_loss": -5.479044437408447, "global_step": 23299, "epoch": 554} {"train_loss": -5.301601409912109, "global_step": 23300, "epoch": 554} {"train_loss": -5.326449394226074, "global_step": 23301, "epoch": 554} {"train_loss": -5.472897529602051, "global_step": 23302, "epoch": 554} {"train_loss": -5.412361145019531, "global_step": 23303, "epoch": 554} {"train_loss": -5.368032455444336, "global_step": 23304, "epoch": 554} {"train_loss": -5.364455699920654, "global_step": 23305, "epoch": 554} {"train_loss": -5.316665172576904, "global_step": 23306, "epoch": 554} {"train_loss": -5.333583831787109, "global_step": 23307, "epoch": 554} {"train_loss": -5.349607944488525, "global_step": 23308, "epoch": 554} {"train_loss": -5.326034863789876, "global_step": 23309, "epoch": 554, "val_loss": 65811.578125} {"train_loss": -5.41977596282959, "global_step": 23310, "epoch": 555} {"train_loss": -5.375221252441406, "global_step": 23311, "epoch": 555} {"train_loss": -5.319473743438721, "global_step": 23312, "epoch": 555} {"train_loss": -5.4186015129089355, "global_step": 23313, "epoch": 555} {"train_loss": -5.311647891998291, "global_step": 23314, "epoch": 555} {"train_loss": -5.195404052734375, "global_step": 23315, "epoch": 555} {"train_loss": -5.473545551300049, "global_step": 23316, "epoch": 555} {"train_loss": -5.35213565826416, "global_step": 23317, "epoch": 555} {"train_loss": -5.491093635559082, "global_step": 23318, "epoch": 555} {"train_loss": -5.480618953704834, "global_step": 23319, "epoch": 555} {"train_loss": -5.379067420959473, "global_step": 23320, "epoch": 555} {"train_loss": -5.323000907897949, "global_step": 23321, "epoch": 555} {"train_loss": -5.256232738494873, "global_step": 23322, "epoch": 555} {"train_loss": -5.436755180358887, "global_step": 23323, "epoch": 555} {"train_loss": -5.333867073059082, "global_step": 23324, "epoch": 555} {"train_loss": -5.272228240966797, "global_step": 23325, "epoch": 555} {"train_loss": -5.34402322769165, "global_step": 23326, "epoch": 555} {"train_loss": -5.439626216888428, "global_step": 23327, "epoch": 555} {"train_loss": -5.423971652984619, "global_step": 23328, "epoch": 555} {"train_loss": -5.323602676391602, "global_step": 23329, "epoch": 555} {"train_loss": -5.249438762664795, "global_step": 23330, "epoch": 555} {"train_loss": -5.369724750518799, "global_step": 23331, "epoch": 555} {"train_loss": -5.43510627746582, "global_step": 23332, "epoch": 555} {"train_loss": -5.4690093994140625, "global_step": 23333, "epoch": 555} {"train_loss": -5.297074317932129, "global_step": 23334, "epoch": 555} {"train_loss": -5.2843170166015625, "global_step": 23335, "epoch": 555} {"train_loss": -5.362551689147949, "global_step": 23336, "epoch": 555} {"train_loss": -5.249462127685547, "global_step": 23337, "epoch": 555} {"train_loss": -5.385249137878418, "global_step": 23338, "epoch": 555} {"train_loss": -5.292983055114746, "global_step": 23339, "epoch": 555} {"train_loss": -5.316519737243652, "global_step": 23340, "epoch": 555} {"train_loss": -5.367468357086182, "global_step": 23341, "epoch": 555} {"train_loss": -5.492709636688232, "global_step": 23342, "epoch": 555} {"train_loss": -5.23558235168457, "global_step": 23343, "epoch": 555} {"train_loss": -5.373419284820557, "global_step": 23344, "epoch": 555} {"train_loss": -5.299242973327637, "global_step": 23345, "epoch": 555} {"train_loss": -5.308346748352051, "global_step": 23346, "epoch": 555} {"train_loss": -5.424924850463867, "global_step": 23347, "epoch": 555} {"train_loss": -5.31886100769043, "global_step": 23348, "epoch": 555} {"train_loss": -5.344668388366699, "global_step": 23349, "epoch": 555} {"train_loss": -5.428504943847656, "global_step": 23350, "epoch": 555} {"train_loss": -5.357745919908796, "global_step": 23351, "epoch": 555, "val_loss": 65888.4453125} {"train_loss": -5.3257365226745605, "global_step": 23352, "epoch": 556} {"train_loss": -5.4432549476623535, "global_step": 23353, "epoch": 556} {"train_loss": -5.344587326049805, "global_step": 23354, "epoch": 556} {"train_loss": -5.396141529083252, "global_step": 23355, "epoch": 556} {"train_loss": -5.429849147796631, "global_step": 23356, "epoch": 556} {"train_loss": -5.430129051208496, "global_step": 23357, "epoch": 556} {"train_loss": -5.456378936767578, "global_step": 23358, "epoch": 556} {"train_loss": -5.3612213134765625, "global_step": 23359, "epoch": 556} {"train_loss": -5.424723148345947, "global_step": 23360, "epoch": 556} {"train_loss": -5.324697971343994, "global_step": 23361, "epoch": 556} {"train_loss": -5.314274787902832, "global_step": 23362, "epoch": 556} {"train_loss": -5.429150581359863, "global_step": 23363, "epoch": 556} {"train_loss": -5.41349458694458, "global_step": 23364, "epoch": 556} {"train_loss": -5.390913963317871, "global_step": 23365, "epoch": 556} {"train_loss": -5.35257625579834, "global_step": 23366, "epoch": 556} {"train_loss": -5.348788261413574, "global_step": 23367, "epoch": 556} {"train_loss": -5.39586067199707, "global_step": 23368, "epoch": 556} {"train_loss": -5.345920562744141, "global_step": 23369, "epoch": 556} {"train_loss": -5.372653007507324, "global_step": 23370, "epoch": 556} {"train_loss": -5.308187961578369, "global_step": 23371, "epoch": 556} {"train_loss": -5.296730995178223, "global_step": 23372, "epoch": 556} {"train_loss": -5.259038925170898, "global_step": 23373, "epoch": 556} {"train_loss": -5.409832000732422, "global_step": 23374, "epoch": 556} {"train_loss": -5.360179901123047, "global_step": 23375, "epoch": 556} {"train_loss": -5.363306045532227, "global_step": 23376, "epoch": 556} {"train_loss": -5.4699811935424805, "global_step": 23377, "epoch": 556} {"train_loss": -5.398371696472168, "global_step": 23378, "epoch": 556} {"train_loss": -5.43261194229126, "global_step": 23379, "epoch": 556} {"train_loss": -5.445367813110352, "global_step": 23380, "epoch": 556} {"train_loss": -5.424957752227783, "global_step": 23381, "epoch": 556} {"train_loss": -5.386955261230469, "global_step": 23382, "epoch": 556} {"train_loss": -5.286769866943359, "global_step": 23383, "epoch": 556} {"train_loss": -5.245428085327148, "global_step": 23384, "epoch": 556} {"train_loss": -5.401567459106445, "global_step": 23385, "epoch": 556} {"train_loss": -5.405725002288818, "global_step": 23386, "epoch": 556} {"train_loss": -5.404019355773926, "global_step": 23387, "epoch": 556} {"train_loss": -5.384484767913818, "global_step": 23388, "epoch": 556} {"train_loss": -5.4756855964660645, "global_step": 23389, "epoch": 556} {"train_loss": -5.540587425231934, "global_step": 23390, "epoch": 556} {"train_loss": -5.307775497436523, "global_step": 23391, "epoch": 556} {"train_loss": -5.361567497253418, "global_step": 23392, "epoch": 556} {"train_loss": -5.382125865845453, "global_step": 23393, "epoch": 556, "val_loss": 65793.328125} {"train_loss": -5.465576648712158, "global_step": 23394, "epoch": 557} {"train_loss": -5.4228973388671875, "global_step": 23395, "epoch": 557} {"train_loss": -5.3909149169921875, "global_step": 23396, "epoch": 557} {"train_loss": -5.516437530517578, "global_step": 23397, "epoch": 557} {"train_loss": -5.379880428314209, "global_step": 23398, "epoch": 557} {"train_loss": -5.383974075317383, "global_step": 23399, "epoch": 557} {"train_loss": -5.43031120300293, "global_step": 23400, "epoch": 557} {"train_loss": -5.39525032043457, "global_step": 23401, "epoch": 557} {"train_loss": -5.555083751678467, "global_step": 23402, "epoch": 557} {"train_loss": -5.365372657775879, "global_step": 23403, "epoch": 557} {"train_loss": -5.34053897857666, "global_step": 23404, "epoch": 557} {"train_loss": -5.34705114364624, "global_step": 23405, "epoch": 557} {"train_loss": -5.371686935424805, "global_step": 23406, "epoch": 557} {"train_loss": -5.570865154266357, "global_step": 23407, "epoch": 557} {"train_loss": -5.469086647033691, "global_step": 23408, "epoch": 557} {"train_loss": -5.389682769775391, "global_step": 23409, "epoch": 557} {"train_loss": -5.429693222045898, "global_step": 23410, "epoch": 557} {"train_loss": -5.362671852111816, "global_step": 23411, "epoch": 557} {"train_loss": -5.371741771697998, "global_step": 23412, "epoch": 557} {"train_loss": -5.250516891479492, "global_step": 23413, "epoch": 557} {"train_loss": -5.3704514503479, "global_step": 23414, "epoch": 557} {"train_loss": -5.245510101318359, "global_step": 23415, "epoch": 557} {"train_loss": -5.337926387786865, "global_step": 23416, "epoch": 557} {"train_loss": -5.411102771759033, "global_step": 23417, "epoch": 557} {"train_loss": -5.214723587036133, "global_step": 23418, "epoch": 557} {"train_loss": -5.330730438232422, "global_step": 23419, "epoch": 557} {"train_loss": -5.299887180328369, "global_step": 23420, "epoch": 557} {"train_loss": -5.367893218994141, "global_step": 23421, "epoch": 557} {"train_loss": -5.502594947814941, "global_step": 23422, "epoch": 557} {"train_loss": -5.350878715515137, "global_step": 23423, "epoch": 557} {"train_loss": -5.4924821853637695, "global_step": 23424, "epoch": 557} {"train_loss": -5.432790756225586, "global_step": 23425, "epoch": 557} {"train_loss": -5.424593925476074, "global_step": 23426, "epoch": 557} {"train_loss": -5.3158416748046875, "global_step": 23427, "epoch": 557} {"train_loss": -5.4423017501831055, "global_step": 23428, "epoch": 557} {"train_loss": -5.410669326782227, "global_step": 23429, "epoch": 557} {"train_loss": -5.301564693450928, "global_step": 23430, "epoch": 557} {"train_loss": -5.2174248695373535, "global_step": 23431, "epoch": 557} {"train_loss": -5.445595741271973, "global_step": 23432, "epoch": 557} {"train_loss": -5.390286922454834, "global_step": 23433, "epoch": 557} {"train_loss": -5.222891807556152, "global_step": 23434, "epoch": 557} {"train_loss": -5.381722450256348, "global_step": 23435, "epoch": 557, "val_loss": 65916.125} {"train_loss": -5.285064697265625, "global_step": 23436, "epoch": 558} {"train_loss": -5.332640647888184, "global_step": 23437, "epoch": 558} {"train_loss": -5.3268327713012695, "global_step": 23438, "epoch": 558} {"train_loss": -5.32181978225708, "global_step": 23439, "epoch": 558} {"train_loss": -5.422398567199707, "global_step": 23440, "epoch": 558} {"train_loss": -5.206827163696289, "global_step": 23441, "epoch": 558} {"train_loss": -5.451572895050049, "global_step": 23442, "epoch": 558} {"train_loss": -5.320470809936523, "global_step": 23443, "epoch": 558} {"train_loss": -5.501204490661621, "global_step": 23444, "epoch": 558} {"train_loss": -5.300129413604736, "global_step": 23445, "epoch": 558} {"train_loss": -5.368583679199219, "global_step": 23446, "epoch": 558} {"train_loss": -5.419374465942383, "global_step": 23447, "epoch": 558} {"train_loss": -5.4361419677734375, "global_step": 23448, "epoch": 558} {"train_loss": -5.462127685546875, "global_step": 23449, "epoch": 558} {"train_loss": -5.264423370361328, "global_step": 23450, "epoch": 558} {"train_loss": -5.252557754516602, "global_step": 23451, "epoch": 558} {"train_loss": -5.46278190612793, "global_step": 23452, "epoch": 558} {"train_loss": -5.335495948791504, "global_step": 23453, "epoch": 558} {"train_loss": -5.337329864501953, "global_step": 23454, "epoch": 558} {"train_loss": -5.410439491271973, "global_step": 23455, "epoch": 558} {"train_loss": -5.378148078918457, "global_step": 23456, "epoch": 558} {"train_loss": -5.3480000495910645, "global_step": 23457, "epoch": 558} {"train_loss": -5.382917404174805, "global_step": 23458, "epoch": 558} {"train_loss": -5.4007368087768555, "global_step": 23459, "epoch": 558} {"train_loss": -5.407092094421387, "global_step": 23460, "epoch": 558} {"train_loss": -5.413308143615723, "global_step": 23461, "epoch": 558} {"train_loss": -5.354245185852051, "global_step": 23462, "epoch": 558} {"train_loss": -5.364928722381592, "global_step": 23463, "epoch": 558} {"train_loss": -5.400731086730957, "global_step": 23464, "epoch": 558} {"train_loss": -5.370901107788086, "global_step": 23465, "epoch": 558} {"train_loss": -5.35363245010376, "global_step": 23466, "epoch": 558} {"train_loss": -5.2869439125061035, "global_step": 23467, "epoch": 558} {"train_loss": -5.274575233459473, "global_step": 23468, "epoch": 558} {"train_loss": -5.2889299392700195, "global_step": 23469, "epoch": 558} {"train_loss": -5.369991302490234, "global_step": 23470, "epoch": 558} {"train_loss": -5.390759468078613, "global_step": 23471, "epoch": 558} {"train_loss": -5.351973533630371, "global_step": 23472, "epoch": 558} {"train_loss": -5.3351545333862305, "global_step": 23473, "epoch": 558} {"train_loss": -5.359461784362793, "global_step": 23474, "epoch": 558} {"train_loss": -5.194035530090332, "global_step": 23475, "epoch": 558} {"train_loss": -5.393383979797363, "global_step": 23476, "epoch": 558} {"train_loss": -5.359487385976882, "global_step": 23477, "epoch": 558, "val_loss": 65903.890625} {"train_loss": -5.440971374511719, "global_step": 23478, "epoch": 559} {"train_loss": -5.325924396514893, "global_step": 23479, "epoch": 559} {"train_loss": -5.520295143127441, "global_step": 23480, "epoch": 559} {"train_loss": -5.372890949249268, "global_step": 23481, "epoch": 559} {"train_loss": -5.300021648406982, "global_step": 23482, "epoch": 559} {"train_loss": -5.438322067260742, "global_step": 23483, "epoch": 559} {"train_loss": -5.416790008544922, "global_step": 23484, "epoch": 559} {"train_loss": -5.417115211486816, "global_step": 23485, "epoch": 559} {"train_loss": -5.357457160949707, "global_step": 23486, "epoch": 559} {"train_loss": -5.208624362945557, "global_step": 23487, "epoch": 559} {"train_loss": -5.50553560256958, "global_step": 23488, "epoch": 559} {"train_loss": -5.432498931884766, "global_step": 23489, "epoch": 559} {"train_loss": -5.313261032104492, "global_step": 23490, "epoch": 559} {"train_loss": -5.4490647315979, "global_step": 23491, "epoch": 559} {"train_loss": -5.395676612854004, "global_step": 23492, "epoch": 559} {"train_loss": -5.2962775230407715, "global_step": 23493, "epoch": 559} {"train_loss": -5.374958038330078, "global_step": 23494, "epoch": 559} {"train_loss": -5.352696418762207, "global_step": 23495, "epoch": 559} {"train_loss": -5.474918365478516, "global_step": 23496, "epoch": 559} {"train_loss": -5.337340354919434, "global_step": 23497, "epoch": 559} {"train_loss": -5.307613372802734, "global_step": 23498, "epoch": 559} {"train_loss": -5.278896808624268, "global_step": 23499, "epoch": 559} {"train_loss": -5.382236957550049, "global_step": 23500, "epoch": 559} {"train_loss": -5.511700630187988, "global_step": 23501, "epoch": 559} {"train_loss": -5.463801383972168, "global_step": 23502, "epoch": 559} {"train_loss": -5.257932186126709, "global_step": 23503, "epoch": 559} {"train_loss": -5.312989234924316, "global_step": 23504, "epoch": 559} {"train_loss": -5.359724521636963, "global_step": 23505, "epoch": 559} {"train_loss": -5.425246238708496, "global_step": 23506, "epoch": 559} {"train_loss": -5.251729488372803, "global_step": 23507, "epoch": 559} {"train_loss": -5.228397846221924, "global_step": 23508, "epoch": 559} {"train_loss": -5.371518135070801, "global_step": 23509, "epoch": 559} {"train_loss": -5.286899566650391, "global_step": 23510, "epoch": 559} {"train_loss": -5.434496879577637, "global_step": 23511, "epoch": 559} {"train_loss": -5.314504146575928, "global_step": 23512, "epoch": 559} {"train_loss": -5.283665180206299, "global_step": 23513, "epoch": 559} {"train_loss": -5.266824245452881, "global_step": 23514, "epoch": 559} {"train_loss": -5.207238674163818, "global_step": 23515, "epoch": 559} {"train_loss": -5.355740547180176, "global_step": 23516, "epoch": 559} {"train_loss": -5.263209342956543, "global_step": 23517, "epoch": 559} {"train_loss": -5.2917399406433105, "global_step": 23518, "epoch": 559} {"train_loss": -5.357289893286569, "global_step": 23519, "epoch": 559, "val_loss": 66480.8359375} {"train_loss": -5.249613285064697, "global_step": 23520, "epoch": 560} {"train_loss": -5.420103549957275, "global_step": 23521, "epoch": 560} {"train_loss": -5.447231769561768, "global_step": 23522, "epoch": 560} {"train_loss": -5.354792594909668, "global_step": 23523, "epoch": 560} {"train_loss": -5.381655693054199, "global_step": 23524, "epoch": 560} {"train_loss": -5.345493316650391, "global_step": 23525, "epoch": 560} {"train_loss": -5.432866096496582, "global_step": 23526, "epoch": 560} {"train_loss": -5.228459358215332, "global_step": 23527, "epoch": 560} {"train_loss": -5.414667129516602, "global_step": 23528, "epoch": 560} {"train_loss": -5.409251689910889, "global_step": 23529, "epoch": 560} {"train_loss": -5.190295696258545, "global_step": 23530, "epoch": 560} {"train_loss": -5.28099250793457, "global_step": 23531, "epoch": 560} {"train_loss": -5.365131378173828, "global_step": 23532, "epoch": 560} {"train_loss": -5.288311958312988, "global_step": 23533, "epoch": 560} {"train_loss": -5.287845611572266, "global_step": 23534, "epoch": 560} {"train_loss": -5.46897029876709, "global_step": 23535, "epoch": 560} {"train_loss": -5.404855251312256, "global_step": 23536, "epoch": 560} {"train_loss": -5.217271327972412, "global_step": 23537, "epoch": 560} {"train_loss": -5.466073989868164, "global_step": 23538, "epoch": 560} {"train_loss": -5.438796043395996, "global_step": 23539, "epoch": 560} {"train_loss": -5.42005729675293, "global_step": 23540, "epoch": 560} {"train_loss": -5.329413414001465, "global_step": 23541, "epoch": 560} {"train_loss": -5.298974514007568, "global_step": 23542, "epoch": 560} {"train_loss": -5.370754241943359, "global_step": 23543, "epoch": 560} {"train_loss": -5.4062395095825195, "global_step": 23544, "epoch": 560} {"train_loss": -5.440943717956543, "global_step": 23545, "epoch": 560} {"train_loss": -5.34626579284668, "global_step": 23546, "epoch": 560} {"train_loss": -5.290840148925781, "global_step": 23547, "epoch": 560} {"train_loss": -5.291512489318848, "global_step": 23548, "epoch": 560} {"train_loss": -5.565279960632324, "global_step": 23549, "epoch": 560} {"train_loss": -5.275765419006348, "global_step": 23550, "epoch": 560} {"train_loss": -5.239385604858398, "global_step": 23551, "epoch": 560} {"train_loss": -5.390368461608887, "global_step": 23552, "epoch": 560} {"train_loss": -5.223579406738281, "global_step": 23553, "epoch": 560} {"train_loss": -5.2155914306640625, "global_step": 23554, "epoch": 560} {"train_loss": -5.292885780334473, "global_step": 23555, "epoch": 560} {"train_loss": -5.277275085449219, "global_step": 23556, "epoch": 560} {"train_loss": -5.313686370849609, "global_step": 23557, "epoch": 560} {"train_loss": -5.278004169464111, "global_step": 23558, "epoch": 560} {"train_loss": -5.406668663024902, "global_step": 23559, "epoch": 560} {"train_loss": -5.2585978507995605, "global_step": 23560, "epoch": 560} {"train_loss": -5.343781686964489, "global_step": 23561, "epoch": 560, "val_loss": 65956.921875} {"train_loss": -5.324384689331055, "global_step": 23562, "epoch": 561} {"train_loss": -5.254262924194336, "global_step": 23563, "epoch": 561} {"train_loss": -5.358308792114258, "global_step": 23564, "epoch": 561} {"train_loss": -5.4500532150268555, "global_step": 23565, "epoch": 561} {"train_loss": -5.3927202224731445, "global_step": 23566, "epoch": 561} {"train_loss": -5.395071029663086, "global_step": 23567, "epoch": 561} {"train_loss": -5.3506364822387695, "global_step": 23568, "epoch": 561} {"train_loss": -5.297572135925293, "global_step": 23569, "epoch": 561} {"train_loss": -5.249151706695557, "global_step": 23570, "epoch": 561} {"train_loss": -5.3983917236328125, "global_step": 23571, "epoch": 561} {"train_loss": -5.300332546234131, "global_step": 23572, "epoch": 561} {"train_loss": -5.362342357635498, "global_step": 23573, "epoch": 561} {"train_loss": -5.230973243713379, "global_step": 23574, "epoch": 561} {"train_loss": -5.324089050292969, "global_step": 23575, "epoch": 561} {"train_loss": -5.388487815856934, "global_step": 23576, "epoch": 561} {"train_loss": -5.392612934112549, "global_step": 23577, "epoch": 561} {"train_loss": -5.269461631774902, "global_step": 23578, "epoch": 561} {"train_loss": -5.327640533447266, "global_step": 23579, "epoch": 561} {"train_loss": -5.459002494812012, "global_step": 23580, "epoch": 561} {"train_loss": -5.4215850830078125, "global_step": 23581, "epoch": 561} {"train_loss": -5.205082416534424, "global_step": 23582, "epoch": 561} {"train_loss": -5.4147047996521, "global_step": 23583, "epoch": 561} {"train_loss": -5.347893714904785, "global_step": 23584, "epoch": 561} {"train_loss": -5.250436305999756, "global_step": 23585, "epoch": 561} {"train_loss": -5.279874801635742, "global_step": 23586, "epoch": 561} {"train_loss": -5.366682529449463, "global_step": 23587, "epoch": 561} {"train_loss": -5.374881744384766, "global_step": 23588, "epoch": 561} {"train_loss": -5.361090660095215, "global_step": 23589, "epoch": 561} {"train_loss": -5.2418060302734375, "global_step": 23590, "epoch": 561} {"train_loss": -5.492502212524414, "global_step": 23591, "epoch": 561} {"train_loss": -5.382391929626465, "global_step": 23592, "epoch": 561} {"train_loss": -5.3910064697265625, "global_step": 23593, "epoch": 561} {"train_loss": -5.3598151206970215, "global_step": 23594, "epoch": 561} {"train_loss": -5.442160606384277, "global_step": 23595, "epoch": 561} {"train_loss": -5.274986267089844, "global_step": 23596, "epoch": 561} {"train_loss": -5.286867141723633, "global_step": 23597, "epoch": 561} {"train_loss": -5.39296817779541, "global_step": 23598, "epoch": 561} {"train_loss": -5.433632850646973, "global_step": 23599, "epoch": 561} {"train_loss": -5.575350761413574, "global_step": 23600, "epoch": 561} {"train_loss": -5.330346584320068, "global_step": 23601, "epoch": 561} {"train_loss": -5.377250671386719, "global_step": 23602, "epoch": 561} {"train_loss": -5.355104650769915, "global_step": 23603, "epoch": 561, "val_loss": 65887.8515625} {"train_loss": -5.371543884277344, "global_step": 23604, "epoch": 562} {"train_loss": -5.244297504425049, "global_step": 23605, "epoch": 562} {"train_loss": -5.3734211921691895, "global_step": 23606, "epoch": 562} {"train_loss": -5.379543781280518, "global_step": 23607, "epoch": 562} {"train_loss": -5.342275142669678, "global_step": 23608, "epoch": 562} {"train_loss": -5.46135139465332, "global_step": 23609, "epoch": 562} {"train_loss": -5.452980995178223, "global_step": 23610, "epoch": 562} {"train_loss": -5.413589000701904, "global_step": 23611, "epoch": 562} {"train_loss": -5.299781799316406, "global_step": 23612, "epoch": 562} {"train_loss": -5.393922328948975, "global_step": 23613, "epoch": 562} {"train_loss": -5.283153533935547, "global_step": 23614, "epoch": 562} {"train_loss": -5.1746625900268555, "global_step": 23615, "epoch": 562} {"train_loss": -5.307936191558838, "global_step": 23616, "epoch": 562} {"train_loss": -5.423561096191406, "global_step": 23617, "epoch": 562} {"train_loss": -5.330887794494629, "global_step": 23618, "epoch": 562} {"train_loss": -5.193610191345215, "global_step": 23619, "epoch": 562} {"train_loss": -5.359463691711426, "global_step": 23620, "epoch": 562} {"train_loss": -5.2695441246032715, "global_step": 23621, "epoch": 562} {"train_loss": -5.422791481018066, "global_step": 23622, "epoch": 562} {"train_loss": -5.204852104187012, "global_step": 23623, "epoch": 562} {"train_loss": -5.280388832092285, "global_step": 23624, "epoch": 562} {"train_loss": -5.327643871307373, "global_step": 23625, "epoch": 562} {"train_loss": -5.300223350524902, "global_step": 23626, "epoch": 562} {"train_loss": -5.258309364318848, "global_step": 23627, "epoch": 562} {"train_loss": -5.399955749511719, "global_step": 23628, "epoch": 562} {"train_loss": -5.24603271484375, "global_step": 23629, "epoch": 562} {"train_loss": -5.353376865386963, "global_step": 23630, "epoch": 562} {"train_loss": -5.495771884918213, "global_step": 23631, "epoch": 562} {"train_loss": -5.313808917999268, "global_step": 23632, "epoch": 562} {"train_loss": -5.486443519592285, "global_step": 23633, "epoch": 562} {"train_loss": -5.393977165222168, "global_step": 23634, "epoch": 562} {"train_loss": -5.457709312438965, "global_step": 23635, "epoch": 562} {"train_loss": -5.298982620239258, "global_step": 23636, "epoch": 562} {"train_loss": -5.32620906829834, "global_step": 23637, "epoch": 562} {"train_loss": -5.386795997619629, "global_step": 23638, "epoch": 562} {"train_loss": -5.345909118652344, "global_step": 23639, "epoch": 562} {"train_loss": -5.362425804138184, "global_step": 23640, "epoch": 562} {"train_loss": -5.40999698638916, "global_step": 23641, "epoch": 562} {"train_loss": -5.595191955566406, "global_step": 23642, "epoch": 562} {"train_loss": -5.457423210144043, "global_step": 23643, "epoch": 562} {"train_loss": -5.376784324645996, "global_step": 23644, "epoch": 562} {"train_loss": -5.359975848879133, "global_step": 23645, "epoch": 562, "val_loss": 65484.5078125} {"train_loss": -5.44797945022583, "global_step": 23646, "epoch": 563} {"train_loss": -5.4934916496276855, "global_step": 23647, "epoch": 563} {"train_loss": -5.379385948181152, "global_step": 23648, "epoch": 563} {"train_loss": -5.455613136291504, "global_step": 23649, "epoch": 563} {"train_loss": -5.40838098526001, "global_step": 23650, "epoch": 563} {"train_loss": -5.435790061950684, "global_step": 23651, "epoch": 563} {"train_loss": -5.4100022315979, "global_step": 23652, "epoch": 563} {"train_loss": -5.4626994132995605, "global_step": 23653, "epoch": 563} {"train_loss": -5.372189044952393, "global_step": 23654, "epoch": 563} {"train_loss": -5.387458801269531, "global_step": 23655, "epoch": 563} {"train_loss": -5.455438137054443, "global_step": 23656, "epoch": 563} {"train_loss": -5.310595512390137, "global_step": 23657, "epoch": 563} {"train_loss": -5.3664350509643555, "global_step": 23658, "epoch": 563} {"train_loss": -5.4659576416015625, "global_step": 23659, "epoch": 563} {"train_loss": -5.345315933227539, "global_step": 23660, "epoch": 563} {"train_loss": -5.3205060958862305, "global_step": 23661, "epoch": 563} {"train_loss": -5.299408912658691, "global_step": 23662, "epoch": 563} {"train_loss": -5.257113456726074, "global_step": 23663, "epoch": 563} {"train_loss": -5.429620265960693, "global_step": 23664, "epoch": 563} {"train_loss": -5.385033130645752, "global_step": 23665, "epoch": 563} {"train_loss": -5.289967060089111, "global_step": 23666, "epoch": 563} {"train_loss": -5.3053178787231445, "global_step": 23667, "epoch": 563} {"train_loss": -5.341301918029785, "global_step": 23668, "epoch": 563} {"train_loss": -5.3635382652282715, "global_step": 23669, "epoch": 563} {"train_loss": -5.2917304039001465, "global_step": 23670, "epoch": 563} {"train_loss": -5.451070785522461, "global_step": 23671, "epoch": 563} {"train_loss": -5.276309013366699, "global_step": 23672, "epoch": 563} {"train_loss": -5.2478227615356445, "global_step": 23673, "epoch": 563} {"train_loss": -5.412814140319824, "global_step": 23674, "epoch": 563} {"train_loss": -5.421966552734375, "global_step": 23675, "epoch": 563} {"train_loss": -5.408111572265625, "global_step": 23676, "epoch": 563} {"train_loss": -5.2728118896484375, "global_step": 23677, "epoch": 563} {"train_loss": -5.303590774536133, "global_step": 23678, "epoch": 563} {"train_loss": -5.349230766296387, "global_step": 23679, "epoch": 563} {"train_loss": -5.441472053527832, "global_step": 23680, "epoch": 563} {"train_loss": -5.254775047302246, "global_step": 23681, "epoch": 563} {"train_loss": -5.360579967498779, "global_step": 23682, "epoch": 563} {"train_loss": -5.407320976257324, "global_step": 23683, "epoch": 563} {"train_loss": -5.305378437042236, "global_step": 23684, "epoch": 563} {"train_loss": -5.40503454208374, "global_step": 23685, "epoch": 563} {"train_loss": -5.301694869995117, "global_step": 23686, "epoch": 563} {"train_loss": -5.368906986145746, "global_step": 23687, "epoch": 563, "val_loss": 65772.9453125} {"train_loss": -5.547435760498047, "global_step": 23688, "epoch": 564} {"train_loss": -5.37650203704834, "global_step": 23689, "epoch": 564} {"train_loss": -5.39315128326416, "global_step": 23690, "epoch": 564} {"train_loss": -5.424723148345947, "global_step": 23691, "epoch": 564} {"train_loss": -5.305673122406006, "global_step": 23692, "epoch": 564} {"train_loss": -5.352892875671387, "global_step": 23693, "epoch": 564} {"train_loss": -5.376164436340332, "global_step": 23694, "epoch": 564} {"train_loss": -5.206447601318359, "global_step": 23695, "epoch": 564} {"train_loss": -5.423867225646973, "global_step": 23696, "epoch": 564} {"train_loss": -5.376315116882324, "global_step": 23697, "epoch": 564} {"train_loss": -5.2939558029174805, "global_step": 23698, "epoch": 564} {"train_loss": -5.566318511962891, "global_step": 23699, "epoch": 564} {"train_loss": -5.355950832366943, "global_step": 23700, "epoch": 564} {"train_loss": -5.364422798156738, "global_step": 23701, "epoch": 564} {"train_loss": -5.364562034606934, "global_step": 23702, "epoch": 564} {"train_loss": -5.347064971923828, "global_step": 23703, "epoch": 564} {"train_loss": -5.428589820861816, "global_step": 23704, "epoch": 564} {"train_loss": -5.472203254699707, "global_step": 23705, "epoch": 564} {"train_loss": -5.349194526672363, "global_step": 23706, "epoch": 564} {"train_loss": -5.433386325836182, "global_step": 23707, "epoch": 564} {"train_loss": -5.443262100219727, "global_step": 23708, "epoch": 564} {"train_loss": -5.369784355163574, "global_step": 23709, "epoch": 564} {"train_loss": -5.414383888244629, "global_step": 23710, "epoch": 564} {"train_loss": -5.332857608795166, "global_step": 23711, "epoch": 564} {"train_loss": -5.512331962585449, "global_step": 23712, "epoch": 564} {"train_loss": -5.395854949951172, "global_step": 23713, "epoch": 564} {"train_loss": -5.302305221557617, "global_step": 23714, "epoch": 564} {"train_loss": -5.190647125244141, "global_step": 23715, "epoch": 564} {"train_loss": -5.2596516609191895, "global_step": 23716, "epoch": 564} {"train_loss": -5.3240509033203125, "global_step": 23717, "epoch": 564} {"train_loss": -5.415143966674805, "global_step": 23718, "epoch": 564} {"train_loss": -5.3844828605651855, "global_step": 23719, "epoch": 564} {"train_loss": -5.338569641113281, "global_step": 23720, "epoch": 564} {"train_loss": -5.329604148864746, "global_step": 23721, "epoch": 564} {"train_loss": -5.271297931671143, "global_step": 23722, "epoch": 564} {"train_loss": -5.390394687652588, "global_step": 23723, "epoch": 564} {"train_loss": -5.332547187805176, "global_step": 23724, "epoch": 564} {"train_loss": -5.3919477462768555, "global_step": 23725, "epoch": 564} {"train_loss": -5.341303825378418, "global_step": 23726, "epoch": 564} {"train_loss": -5.361036777496338, "global_step": 23727, "epoch": 564} {"train_loss": -5.294997215270996, "global_step": 23728, "epoch": 564} {"train_loss": -5.368986254646664, "global_step": 23729, "epoch": 564, "val_loss": 66207.421875} {"train_loss": -5.288181304931641, "global_step": 23730, "epoch": 565} {"train_loss": -5.265159606933594, "global_step": 23731, "epoch": 565} {"train_loss": -5.44571590423584, "global_step": 23732, "epoch": 565} {"train_loss": -5.364826679229736, "global_step": 23733, "epoch": 565} {"train_loss": -5.3910136222839355, "global_step": 23734, "epoch": 565} {"train_loss": -5.42845344543457, "global_step": 23735, "epoch": 565} {"train_loss": -5.464142799377441, "global_step": 23736, "epoch": 565} {"train_loss": -5.529568195343018, "global_step": 23737, "epoch": 565} {"train_loss": -5.409843921661377, "global_step": 23738, "epoch": 565} {"train_loss": -5.463201522827148, "global_step": 23739, "epoch": 565} {"train_loss": -5.383868217468262, "global_step": 23740, "epoch": 565} {"train_loss": -5.3774333000183105, "global_step": 23741, "epoch": 565} {"train_loss": -5.466936111450195, "global_step": 23742, "epoch": 565} {"train_loss": -5.391282081604004, "global_step": 23743, "epoch": 565} {"train_loss": -5.37122917175293, "global_step": 23744, "epoch": 565} {"train_loss": -5.34108304977417, "global_step": 23745, "epoch": 565} {"train_loss": -5.384167194366455, "global_step": 23746, "epoch": 565} {"train_loss": -5.349525451660156, "global_step": 23747, "epoch": 565} {"train_loss": -5.277237892150879, "global_step": 23748, "epoch": 565} {"train_loss": -5.304518222808838, "global_step": 23749, "epoch": 565} {"train_loss": -5.195633411407471, "global_step": 23750, "epoch": 565} {"train_loss": -5.278665542602539, "global_step": 23751, "epoch": 565} {"train_loss": -5.152885437011719, "global_step": 23752, "epoch": 565} {"train_loss": -5.306329250335693, "global_step": 23753, "epoch": 565} {"train_loss": -5.333797931671143, "global_step": 23754, "epoch": 565} {"train_loss": -5.339286804199219, "global_step": 23755, "epoch": 565} {"train_loss": -5.323295593261719, "global_step": 23756, "epoch": 565} {"train_loss": -5.402144908905029, "global_step": 23757, "epoch": 565} {"train_loss": -5.394007205963135, "global_step": 23758, "epoch": 565} {"train_loss": -5.242909908294678, "global_step": 23759, "epoch": 565} {"train_loss": -5.421731948852539, "global_step": 23760, "epoch": 565} {"train_loss": -5.398298740386963, "global_step": 23761, "epoch": 565} {"train_loss": -5.44306755065918, "global_step": 23762, "epoch": 565} {"train_loss": -5.4142961502075195, "global_step": 23763, "epoch": 565} {"train_loss": -5.455935955047607, "global_step": 23764, "epoch": 565} {"train_loss": -5.373063564300537, "global_step": 23765, "epoch": 565} {"train_loss": -5.4489030838012695, "global_step": 23766, "epoch": 565} {"train_loss": -5.384366035461426, "global_step": 23767, "epoch": 565} {"train_loss": -5.2532877922058105, "global_step": 23768, "epoch": 565} {"train_loss": -5.2653608322143555, "global_step": 23769, "epoch": 565} {"train_loss": -5.273847579956055, "global_step": 23770, "epoch": 565} {"train_loss": -5.360259873526437, "global_step": 23771, "epoch": 565, "val_loss": 65631.234375} {"train_loss": -5.331930160522461, "global_step": 23772, "epoch": 566} {"train_loss": -5.406181335449219, "global_step": 23773, "epoch": 566} {"train_loss": -5.31595516204834, "global_step": 23774, "epoch": 566} {"train_loss": -5.424956798553467, "global_step": 23775, "epoch": 566} {"train_loss": -5.302855014801025, "global_step": 23776, "epoch": 566} {"train_loss": -5.176314830780029, "global_step": 23777, "epoch": 566} {"train_loss": -5.410003185272217, "global_step": 23778, "epoch": 566} {"train_loss": -5.473447799682617, "global_step": 23779, "epoch": 566} {"train_loss": -5.2747368812561035, "global_step": 23780, "epoch": 566} {"train_loss": -5.284454345703125, "global_step": 23781, "epoch": 566} {"train_loss": -5.419053077697754, "global_step": 23782, "epoch": 566} {"train_loss": -5.306469440460205, "global_step": 23783, "epoch": 566} {"train_loss": -5.402165412902832, "global_step": 23784, "epoch": 566} {"train_loss": -5.4923248291015625, "global_step": 23785, "epoch": 566} {"train_loss": -5.425512790679932, "global_step": 23786, "epoch": 566} {"train_loss": -5.364291667938232, "global_step": 23787, "epoch": 566} {"train_loss": -5.272777557373047, "global_step": 23788, "epoch": 566} {"train_loss": -5.407488822937012, "global_step": 23789, "epoch": 566} {"train_loss": -5.431282043457031, "global_step": 23790, "epoch": 566} {"train_loss": -5.4862380027771, "global_step": 23791, "epoch": 566} {"train_loss": -5.492624759674072, "global_step": 23792, "epoch": 566} {"train_loss": -5.370587348937988, "global_step": 23793, "epoch": 566} {"train_loss": -5.267951965332031, "global_step": 23794, "epoch": 566} {"train_loss": -5.365928649902344, "global_step": 23795, "epoch": 566} {"train_loss": -5.281381607055664, "global_step": 23796, "epoch": 566} {"train_loss": -5.410364151000977, "global_step": 23797, "epoch": 566} {"train_loss": -5.406203269958496, "global_step": 23798, "epoch": 566} {"train_loss": -5.228787422180176, "global_step": 23799, "epoch": 566} {"train_loss": -5.4420599937438965, "global_step": 23800, "epoch": 566} {"train_loss": -5.524381160736084, "global_step": 23801, "epoch": 566} {"train_loss": -5.399928092956543, "global_step": 23802, "epoch": 566} {"train_loss": -5.165143013000488, "global_step": 23803, "epoch": 566} {"train_loss": -5.407585144042969, "global_step": 23804, "epoch": 566} {"train_loss": -5.415571212768555, "global_step": 23805, "epoch": 566} {"train_loss": -5.3133368492126465, "global_step": 23806, "epoch": 566} {"train_loss": -5.277833938598633, "global_step": 23807, "epoch": 566} {"train_loss": -5.325599670410156, "global_step": 23808, "epoch": 566} {"train_loss": -5.2411651611328125, "global_step": 23809, "epoch": 566} {"train_loss": -5.460201740264893, "global_step": 23810, "epoch": 566} {"train_loss": -5.316088676452637, "global_step": 23811, "epoch": 566} {"train_loss": -5.3885908126831055, "global_step": 23812, "epoch": 566} {"train_loss": -5.366482587087722, "global_step": 23813, "epoch": 566, "val_loss": 66058.390625} {"train_loss": -5.180086612701416, "global_step": 23814, "epoch": 567} {"train_loss": -5.3682026863098145, "global_step": 23815, "epoch": 567} {"train_loss": -5.354637145996094, "global_step": 23816, "epoch": 567} {"train_loss": -5.306894302368164, "global_step": 23817, "epoch": 567} {"train_loss": -5.45150899887085, "global_step": 23818, "epoch": 567} {"train_loss": -5.153936386108398, "global_step": 23819, "epoch": 567} {"train_loss": -5.352579593658447, "global_step": 23820, "epoch": 567} {"train_loss": -5.25398588180542, "global_step": 23821, "epoch": 567} {"train_loss": -5.423700332641602, "global_step": 23822, "epoch": 567} {"train_loss": -5.4146647453308105, "global_step": 23823, "epoch": 567} {"train_loss": -5.471831321716309, "global_step": 23824, "epoch": 567} {"train_loss": -5.210940361022949, "global_step": 23825, "epoch": 567} {"train_loss": -5.236593246459961, "global_step": 23826, "epoch": 567} {"train_loss": -5.432426452636719, "global_step": 23827, "epoch": 567} {"train_loss": -5.2864789962768555, "global_step": 23828, "epoch": 567} {"train_loss": -5.357454776763916, "global_step": 23829, "epoch": 567} {"train_loss": -5.28334903717041, "global_step": 23830, "epoch": 567} {"train_loss": -5.322271347045898, "global_step": 23831, "epoch": 567} {"train_loss": -5.420360565185547, "global_step": 23832, "epoch": 567} {"train_loss": -5.347988128662109, "global_step": 23833, "epoch": 567} {"train_loss": -5.235227584838867, "global_step": 23834, "epoch": 567} {"train_loss": -5.420688629150391, "global_step": 23835, "epoch": 567} {"train_loss": -5.463078022003174, "global_step": 23836, "epoch": 567} {"train_loss": -5.287494659423828, "global_step": 23837, "epoch": 567} {"train_loss": -5.381965637207031, "global_step": 23838, "epoch": 567} {"train_loss": -5.239246368408203, "global_step": 23839, "epoch": 567} {"train_loss": -5.322509765625, "global_step": 23840, "epoch": 567} {"train_loss": -5.485107421875, "global_step": 23841, "epoch": 567} {"train_loss": -5.309327125549316, "global_step": 23842, "epoch": 567} {"train_loss": -5.245944023132324, "global_step": 23843, "epoch": 567} {"train_loss": -5.377046585083008, "global_step": 23844, "epoch": 567} {"train_loss": -5.247102737426758, "global_step": 23845, "epoch": 567} {"train_loss": -5.420087814331055, "global_step": 23846, "epoch": 567} {"train_loss": -5.2903900146484375, "global_step": 23847, "epoch": 567} {"train_loss": -5.297292232513428, "global_step": 23848, "epoch": 567} {"train_loss": -5.356801986694336, "global_step": 23849, "epoch": 567} {"train_loss": -5.478153228759766, "global_step": 23850, "epoch": 567} {"train_loss": -5.2224202156066895, "global_step": 23851, "epoch": 567} {"train_loss": -5.380006790161133, "global_step": 23852, "epoch": 567} {"train_loss": -5.180874824523926, "global_step": 23853, "epoch": 567} {"train_loss": -5.349632263183594, "global_step": 23854, "epoch": 567} {"train_loss": -5.330213455926804, "global_step": 23855, "epoch": 567, "val_loss": 66070.4921875} {"train_loss": -5.280295372009277, "global_step": 23856, "epoch": 568} {"train_loss": -5.460526466369629, "global_step": 23857, "epoch": 568} {"train_loss": -5.50412130355835, "global_step": 23858, "epoch": 568} {"train_loss": -5.308961391448975, "global_step": 23859, "epoch": 568} {"train_loss": -5.421494007110596, "global_step": 23860, "epoch": 568} {"train_loss": -5.257447242736816, "global_step": 23861, "epoch": 568} {"train_loss": -5.301339149475098, "global_step": 23862, "epoch": 568} {"train_loss": -5.385025501251221, "global_step": 23863, "epoch": 568} {"train_loss": -5.290226936340332, "global_step": 23864, "epoch": 568} {"train_loss": -5.272697925567627, "global_step": 23865, "epoch": 568} {"train_loss": -5.332858085632324, "global_step": 23866, "epoch": 568} {"train_loss": -5.350369453430176, "global_step": 23867, "epoch": 568} {"train_loss": -5.232907295227051, "global_step": 23868, "epoch": 568} {"train_loss": -5.423947334289551, "global_step": 23869, "epoch": 568} {"train_loss": -5.398591995239258, "global_step": 23870, "epoch": 568} {"train_loss": -5.360567092895508, "global_step": 23871, "epoch": 568} {"train_loss": -5.2944512367248535, "global_step": 23872, "epoch": 568} {"train_loss": -5.358711242675781, "global_step": 23873, "epoch": 568} {"train_loss": -5.359853744506836, "global_step": 23874, "epoch": 568} {"train_loss": -5.440280437469482, "global_step": 23875, "epoch": 568} {"train_loss": -5.432976245880127, "global_step": 23876, "epoch": 568} {"train_loss": -5.2879743576049805, "global_step": 23877, "epoch": 568} {"train_loss": -5.324404716491699, "global_step": 23878, "epoch": 568} {"train_loss": -5.468626022338867, "global_step": 23879, "epoch": 568} {"train_loss": -5.375119209289551, "global_step": 23880, "epoch": 568} {"train_loss": -5.3741912841796875, "global_step": 23881, "epoch": 568} {"train_loss": -5.3824920654296875, "global_step": 23882, "epoch": 568} {"train_loss": -5.3694353103637695, "global_step": 23883, "epoch": 568} {"train_loss": -5.331300735473633, "global_step": 23884, "epoch": 568} {"train_loss": -5.43856143951416, "global_step": 23885, "epoch": 568} {"train_loss": -5.3587236404418945, "global_step": 23886, "epoch": 568} {"train_loss": -5.434642791748047, "global_step": 23887, "epoch": 568} {"train_loss": -5.417540073394775, "global_step": 23888, "epoch": 568} {"train_loss": -5.242679595947266, "global_step": 23889, "epoch": 568} {"train_loss": -5.383993148803711, "global_step": 23890, "epoch": 568} {"train_loss": -5.375283241271973, "global_step": 23891, "epoch": 568} {"train_loss": -5.391475677490234, "global_step": 23892, "epoch": 568} {"train_loss": -5.200344085693359, "global_step": 23893, "epoch": 568} {"train_loss": -5.440669536590576, "global_step": 23894, "epoch": 568} {"train_loss": -5.274572849273682, "global_step": 23895, "epoch": 568} {"train_loss": -5.425004005432129, "global_step": 23896, "epoch": 568} {"train_loss": -5.3579377219790505, "global_step": 23897, "epoch": 568, "val_loss": 65576.5390625} {"train_loss": -5.451739311218262, "global_step": 23898, "epoch": 569} {"train_loss": -5.522651672363281, "global_step": 23899, "epoch": 569} {"train_loss": -5.467248916625977, "global_step": 23900, "epoch": 569} {"train_loss": -5.507355213165283, "global_step": 23901, "epoch": 569} {"train_loss": -5.425244331359863, "global_step": 23902, "epoch": 569} {"train_loss": -5.2787909507751465, "global_step": 23903, "epoch": 569} {"train_loss": -5.306373596191406, "global_step": 23904, "epoch": 569} {"train_loss": -5.236007213592529, "global_step": 23905, "epoch": 569} {"train_loss": -5.369370937347412, "global_step": 23906, "epoch": 569} {"train_loss": -5.426434516906738, "global_step": 23907, "epoch": 569} {"train_loss": -5.276460647583008, "global_step": 23908, "epoch": 569} {"train_loss": -5.354556083679199, "global_step": 23909, "epoch": 569} {"train_loss": -5.435268402099609, "global_step": 23910, "epoch": 569} {"train_loss": -5.338722229003906, "global_step": 23911, "epoch": 569} {"train_loss": -5.365830421447754, "global_step": 23912, "epoch": 569} {"train_loss": -5.317349433898926, "global_step": 23913, "epoch": 569} {"train_loss": -5.355526924133301, "global_step": 23914, "epoch": 569} {"train_loss": -5.354890823364258, "global_step": 23915, "epoch": 569} {"train_loss": -5.305911540985107, "global_step": 23916, "epoch": 569} {"train_loss": -5.3241472244262695, "global_step": 23917, "epoch": 569} {"train_loss": -5.548163414001465, "global_step": 23918, "epoch": 569} {"train_loss": -5.247440814971924, "global_step": 23919, "epoch": 569} {"train_loss": -5.349860668182373, "global_step": 23920, "epoch": 569} {"train_loss": -5.314732551574707, "global_step": 23921, "epoch": 569} {"train_loss": -5.238142013549805, "global_step": 23922, "epoch": 569} {"train_loss": -5.331564903259277, "global_step": 23923, "epoch": 569} {"train_loss": -5.2793288230896, "global_step": 23924, "epoch": 569} {"train_loss": -5.454026222229004, "global_step": 23925, "epoch": 569} {"train_loss": -5.362753391265869, "global_step": 23926, "epoch": 569} {"train_loss": -5.514305591583252, "global_step": 23927, "epoch": 569} {"train_loss": -5.383401870727539, "global_step": 23928, "epoch": 569} {"train_loss": -5.419172763824463, "global_step": 23929, "epoch": 569} {"train_loss": -5.5171003341674805, "global_step": 23930, "epoch": 569} {"train_loss": -5.425739765167236, "global_step": 23931, "epoch": 569} {"train_loss": -5.23527717590332, "global_step": 23932, "epoch": 569} {"train_loss": -5.358611106872559, "global_step": 23933, "epoch": 569} {"train_loss": -5.329582691192627, "global_step": 23934, "epoch": 569} {"train_loss": -5.240234375, "global_step": 23935, "epoch": 569} {"train_loss": -5.447971343994141, "global_step": 23936, "epoch": 569} {"train_loss": -5.331815719604492, "global_step": 23937, "epoch": 569} {"train_loss": -5.3049187660217285, "global_step": 23938, "epoch": 569} {"train_loss": -5.364827349072411, "global_step": 23939, "epoch": 569, "val_loss": 65496.00390625} {"train_loss": -5.372748851776123, "global_step": 23940, "epoch": 570} {"train_loss": -5.383350849151611, "global_step": 23941, "epoch": 570} {"train_loss": -5.502641201019287, "global_step": 23942, "epoch": 570} {"train_loss": -5.360101222991943, "global_step": 23943, "epoch": 570} {"train_loss": -5.379256725311279, "global_step": 23944, "epoch": 570} {"train_loss": -5.368133544921875, "global_step": 23945, "epoch": 570} {"train_loss": -5.4822821617126465, "global_step": 23946, "epoch": 570} {"train_loss": -5.49839973449707, "global_step": 23947, "epoch": 570} {"train_loss": -5.436224937438965, "global_step": 23948, "epoch": 570} {"train_loss": -5.392909049987793, "global_step": 23949, "epoch": 570} {"train_loss": -5.199108123779297, "global_step": 23950, "epoch": 570} {"train_loss": -5.393967628479004, "global_step": 23951, "epoch": 570} {"train_loss": -5.184326171875, "global_step": 23952, "epoch": 570} {"train_loss": -5.297800540924072, "global_step": 23953, "epoch": 570} {"train_loss": -5.325956344604492, "global_step": 23954, "epoch": 570} {"train_loss": -5.393946647644043, "global_step": 23955, "epoch": 570} {"train_loss": -5.289100646972656, "global_step": 23956, "epoch": 570} {"train_loss": -5.466220378875732, "global_step": 23957, "epoch": 570} {"train_loss": -5.351519584655762, "global_step": 23958, "epoch": 570} {"train_loss": -5.310730934143066, "global_step": 23959, "epoch": 570} {"train_loss": -5.381285667419434, "global_step": 23960, "epoch": 570} {"train_loss": -5.314295768737793, "global_step": 23961, "epoch": 570} {"train_loss": -5.271087646484375, "global_step": 23962, "epoch": 570} {"train_loss": -5.439695358276367, "global_step": 23963, "epoch": 570} {"train_loss": -5.528136730194092, "global_step": 23964, "epoch": 570} {"train_loss": -5.480442047119141, "global_step": 23965, "epoch": 570} {"train_loss": -5.286592960357666, "global_step": 23966, "epoch": 570} {"train_loss": -5.433055877685547, "global_step": 23967, "epoch": 570} {"train_loss": -5.359127521514893, "global_step": 23968, "epoch": 570} {"train_loss": -5.33730411529541, "global_step": 23969, "epoch": 570} {"train_loss": -5.34915828704834, "global_step": 23970, "epoch": 570} {"train_loss": -5.3397016525268555, "global_step": 23971, "epoch": 570} {"train_loss": -5.205689907073975, "global_step": 23972, "epoch": 570} {"train_loss": -5.347879886627197, "global_step": 23973, "epoch": 570} {"train_loss": -5.4749627113342285, "global_step": 23974, "epoch": 570} {"train_loss": -5.458308696746826, "global_step": 23975, "epoch": 570} {"train_loss": -5.46561336517334, "global_step": 23976, "epoch": 570} {"train_loss": -5.447347640991211, "global_step": 23977, "epoch": 570} {"train_loss": -5.338879585266113, "global_step": 23978, "epoch": 570} {"train_loss": -5.415188789367676, "global_step": 23979, "epoch": 570} {"train_loss": -5.286070823669434, "global_step": 23980, "epoch": 570} {"train_loss": -5.373654070354643, "global_step": 23981, "epoch": 570, "val_loss": 66103.65625} {"train_loss": -5.285683631896973, "global_step": 23982, "epoch": 571} {"train_loss": -5.358261585235596, "global_step": 23983, "epoch": 571} {"train_loss": -5.277830123901367, "global_step": 23984, "epoch": 571} {"train_loss": -5.3230881690979, "global_step": 23985, "epoch": 571} {"train_loss": -5.24399995803833, "global_step": 23986, "epoch": 571} {"train_loss": -5.415474891662598, "global_step": 23987, "epoch": 571} {"train_loss": -5.34298849105835, "global_step": 23988, "epoch": 571} {"train_loss": -5.227227210998535, "global_step": 23989, "epoch": 571} {"train_loss": -5.402010917663574, "global_step": 23990, "epoch": 571} {"train_loss": -5.396664619445801, "global_step": 23991, "epoch": 571} {"train_loss": -5.370823860168457, "global_step": 23992, "epoch": 571} {"train_loss": -5.418475151062012, "global_step": 23993, "epoch": 571} {"train_loss": -5.445036888122559, "global_step": 23994, "epoch": 571} {"train_loss": -5.299330711364746, "global_step": 23995, "epoch": 571} {"train_loss": -5.42531681060791, "global_step": 23996, "epoch": 571} {"train_loss": -5.4156494140625, "global_step": 23997, "epoch": 571} {"train_loss": -5.249497413635254, "global_step": 23998, "epoch": 571} {"train_loss": -5.426675319671631, "global_step": 23999, "epoch": 571} {"train_loss": -5.418328285217285, "global_step": 24000, "epoch": 571} {"train_loss": -5.431670188903809, "global_step": 24001, "epoch": 571} {"train_loss": -5.166856288909912, "global_step": 24002, "epoch": 571} {"train_loss": -5.265939235687256, "global_step": 24003, "epoch": 571} {"train_loss": -5.442397117614746, "global_step": 24004, "epoch": 571} {"train_loss": -5.332427978515625, "global_step": 24005, "epoch": 571} {"train_loss": -5.261041641235352, "global_step": 24006, "epoch": 571} {"train_loss": -5.3744964599609375, "global_step": 24007, "epoch": 571} {"train_loss": -5.295665740966797, "global_step": 24008, "epoch": 571} {"train_loss": -5.2364935874938965, "global_step": 24009, "epoch": 571} {"train_loss": -5.200725078582764, "global_step": 24010, "epoch": 571} {"train_loss": -5.4074883460998535, "global_step": 24011, "epoch": 571} {"train_loss": -5.298680305480957, "global_step": 24012, "epoch": 571} {"train_loss": -5.325910568237305, "global_step": 24013, "epoch": 571} {"train_loss": -5.388073921203613, "global_step": 24014, "epoch": 571} {"train_loss": -5.150364875793457, "global_step": 24015, "epoch": 571} {"train_loss": -5.411411285400391, "global_step": 24016, "epoch": 571} {"train_loss": -5.290133476257324, "global_step": 24017, "epoch": 571} {"train_loss": -5.3250017166137695, "global_step": 24018, "epoch": 571} {"train_loss": -5.1881890296936035, "global_step": 24019, "epoch": 571} {"train_loss": -5.277742862701416, "global_step": 24020, "epoch": 571} {"train_loss": -5.341063499450684, "global_step": 24021, "epoch": 571} {"train_loss": -5.404630661010742, "global_step": 24022, "epoch": 571} {"train_loss": -5.333007142657325, "global_step": 24023, "epoch": 571, "val_loss": 65651.8515625} {"train_loss": -5.3611531257629395, "global_step": 24024, "epoch": 572} {"train_loss": -5.386641025543213, "global_step": 24025, "epoch": 572} {"train_loss": -5.339766025543213, "global_step": 24026, "epoch": 572} {"train_loss": -5.445652008056641, "global_step": 24027, "epoch": 572} {"train_loss": -5.316621780395508, "global_step": 24028, "epoch": 572} {"train_loss": -5.197887897491455, "global_step": 24029, "epoch": 572} {"train_loss": -5.202633857727051, "global_step": 24030, "epoch": 572} {"train_loss": -5.374446868896484, "global_step": 24031, "epoch": 572} {"train_loss": -5.338748455047607, "global_step": 24032, "epoch": 572} {"train_loss": -5.248480796813965, "global_step": 24033, "epoch": 572} {"train_loss": -5.476768970489502, "global_step": 24034, "epoch": 572} {"train_loss": -5.362419128417969, "global_step": 24035, "epoch": 572} {"train_loss": -5.365963935852051, "global_step": 24036, "epoch": 572} {"train_loss": -5.438493728637695, "global_step": 24037, "epoch": 572} {"train_loss": -5.449800968170166, "global_step": 24038, "epoch": 572} {"train_loss": -5.379993438720703, "global_step": 24039, "epoch": 572} {"train_loss": -5.237281799316406, "global_step": 24040, "epoch": 572} {"train_loss": -5.403102874755859, "global_step": 24041, "epoch": 572} {"train_loss": -5.281905174255371, "global_step": 24042, "epoch": 572} {"train_loss": -5.234316349029541, "global_step": 24043, "epoch": 572} {"train_loss": -5.604061126708984, "global_step": 24044, "epoch": 572} {"train_loss": -5.270669937133789, "global_step": 24045, "epoch": 572} {"train_loss": -5.3550333976745605, "global_step": 24046, "epoch": 572} {"train_loss": -5.306617736816406, "global_step": 24047, "epoch": 572} {"train_loss": -5.34869384765625, "global_step": 24048, "epoch": 572} {"train_loss": -5.370876312255859, "global_step": 24049, "epoch": 572} {"train_loss": -5.431790828704834, "global_step": 24050, "epoch": 572} {"train_loss": -5.271978378295898, "global_step": 24051, "epoch": 572} {"train_loss": -5.316794395446777, "global_step": 24052, "epoch": 572} {"train_loss": -5.444045543670654, "global_step": 24053, "epoch": 572} {"train_loss": -5.399712085723877, "global_step": 24054, "epoch": 572} {"train_loss": -5.344569683074951, "global_step": 24055, "epoch": 572} {"train_loss": -5.118655681610107, "global_step": 24056, "epoch": 572} {"train_loss": -5.525198936462402, "global_step": 24057, "epoch": 572} {"train_loss": -5.410541534423828, "global_step": 24058, "epoch": 572} {"train_loss": -5.343044281005859, "global_step": 24059, "epoch": 572} {"train_loss": -5.412631988525391, "global_step": 24060, "epoch": 572} {"train_loss": -5.437397480010986, "global_step": 24061, "epoch": 572} {"train_loss": -5.311676979064941, "global_step": 24062, "epoch": 572} {"train_loss": -5.480410099029541, "global_step": 24063, "epoch": 572} {"train_loss": -5.432183265686035, "global_step": 24064, "epoch": 572} {"train_loss": -5.359110014779227, "global_step": 24065, "epoch": 572, "val_loss": 65647.8984375} {"train_loss": -5.313403129577637, "global_step": 24066, "epoch": 573} {"train_loss": -5.473725318908691, "global_step": 24067, "epoch": 573} {"train_loss": -5.215187072753906, "global_step": 24068, "epoch": 573} {"train_loss": -5.434906005859375, "global_step": 24069, "epoch": 573} {"train_loss": -5.320503234863281, "global_step": 24070, "epoch": 573} {"train_loss": -5.095502853393555, "global_step": 24071, "epoch": 573} {"train_loss": -5.283267974853516, "global_step": 24072, "epoch": 573} {"train_loss": -5.141487121582031, "global_step": 24073, "epoch": 573} {"train_loss": -5.376167297363281, "global_step": 24074, "epoch": 573} {"train_loss": -5.316710472106934, "global_step": 24075, "epoch": 573} {"train_loss": -5.348553657531738, "global_step": 24076, "epoch": 573} {"train_loss": -5.406252384185791, "global_step": 24077, "epoch": 573} {"train_loss": -5.3109517097473145, "global_step": 24078, "epoch": 573} {"train_loss": -5.505777359008789, "global_step": 24079, "epoch": 573} {"train_loss": -5.330826759338379, "global_step": 24080, "epoch": 573} {"train_loss": -5.2242937088012695, "global_step": 24081, "epoch": 573} {"train_loss": -5.266010284423828, "global_step": 24082, "epoch": 573} {"train_loss": -5.443246841430664, "global_step": 24083, "epoch": 573} {"train_loss": -5.414558410644531, "global_step": 24084, "epoch": 573} {"train_loss": -5.340207099914551, "global_step": 24085, "epoch": 573} {"train_loss": -5.391602516174316, "global_step": 24086, "epoch": 573} {"train_loss": -5.319685459136963, "global_step": 24087, "epoch": 573} {"train_loss": -5.366162300109863, "global_step": 24088, "epoch": 573} {"train_loss": -5.340751647949219, "global_step": 24089, "epoch": 573} {"train_loss": -5.3315839767456055, "global_step": 24090, "epoch": 573} {"train_loss": -5.277122497558594, "global_step": 24091, "epoch": 573} {"train_loss": -5.405857563018799, "global_step": 24092, "epoch": 573} {"train_loss": -5.371621608734131, "global_step": 24093, "epoch": 573} {"train_loss": -5.357728958129883, "global_step": 24094, "epoch": 573} {"train_loss": -5.43238639831543, "global_step": 24095, "epoch": 573} {"train_loss": -5.238560676574707, "global_step": 24096, "epoch": 573} {"train_loss": -5.318463325500488, "global_step": 24097, "epoch": 573} {"train_loss": -5.323851585388184, "global_step": 24098, "epoch": 573} {"train_loss": -5.3219404220581055, "global_step": 24099, "epoch": 573} {"train_loss": -5.290157794952393, "global_step": 24100, "epoch": 573} {"train_loss": -5.356180667877197, "global_step": 24101, "epoch": 573} {"train_loss": -5.385746955871582, "global_step": 24102, "epoch": 573} {"train_loss": -5.4869384765625, "global_step": 24103, "epoch": 573} {"train_loss": -5.370606422424316, "global_step": 24104, "epoch": 573} {"train_loss": -5.403719902038574, "global_step": 24105, "epoch": 573} {"train_loss": -5.341858863830566, "global_step": 24106, "epoch": 573} {"train_loss": -5.340442453111921, "global_step": 24107, "epoch": 573, "val_loss": 65522.56640625} {"train_loss": -5.437692642211914, "global_step": 24108, "epoch": 574} {"train_loss": -5.35670804977417, "global_step": 24109, "epoch": 574} {"train_loss": -5.432323932647705, "global_step": 24110, "epoch": 574} {"train_loss": -5.311217784881592, "global_step": 24111, "epoch": 574} {"train_loss": -5.390229225158691, "global_step": 24112, "epoch": 574} {"train_loss": -5.389472484588623, "global_step": 24113, "epoch": 574} {"train_loss": -5.414283275604248, "global_step": 24114, "epoch": 574} {"train_loss": -5.51883602142334, "global_step": 24115, "epoch": 574} {"train_loss": -5.444340229034424, "global_step": 24116, "epoch": 574} {"train_loss": -5.264440059661865, "global_step": 24117, "epoch": 574} {"train_loss": -5.4154510498046875, "global_step": 24118, "epoch": 574} {"train_loss": -5.441545009613037, "global_step": 24119, "epoch": 574} {"train_loss": -5.3686089515686035, "global_step": 24120, "epoch": 574} {"train_loss": -5.293168067932129, "global_step": 24121, "epoch": 574} {"train_loss": -5.312221527099609, "global_step": 24122, "epoch": 574} {"train_loss": -5.296965599060059, "global_step": 24123, "epoch": 574} {"train_loss": -5.372838973999023, "global_step": 24124, "epoch": 574} {"train_loss": -5.39996337890625, "global_step": 24125, "epoch": 574} {"train_loss": -5.391000270843506, "global_step": 24126, "epoch": 574} {"train_loss": -5.462515830993652, "global_step": 24127, "epoch": 574} {"train_loss": -5.386253356933594, "global_step": 24128, "epoch": 574} {"train_loss": -5.33741569519043, "global_step": 24129, "epoch": 574} {"train_loss": -5.22160530090332, "global_step": 24130, "epoch": 574} {"train_loss": -5.298026084899902, "global_step": 24131, "epoch": 574} {"train_loss": -5.420315742492676, "global_step": 24132, "epoch": 574} {"train_loss": -5.391365051269531, "global_step": 24133, "epoch": 574} {"train_loss": -5.486571788787842, "global_step": 24134, "epoch": 574} {"train_loss": -5.468780517578125, "global_step": 24135, "epoch": 574} {"train_loss": -5.502675533294678, "global_step": 24136, "epoch": 574} {"train_loss": -5.446813583374023, "global_step": 24137, "epoch": 574} {"train_loss": -5.185525894165039, "global_step": 24138, "epoch": 574} {"train_loss": -5.2444305419921875, "global_step": 24139, "epoch": 574} {"train_loss": -5.402636528015137, "global_step": 24140, "epoch": 574} {"train_loss": -5.496295928955078, "global_step": 24141, "epoch": 574} {"train_loss": -5.334474563598633, "global_step": 24142, "epoch": 574} {"train_loss": -5.428000450134277, "global_step": 24143, "epoch": 574} {"train_loss": -5.364360809326172, "global_step": 24144, "epoch": 574} {"train_loss": -5.45745849609375, "global_step": 24145, "epoch": 574} {"train_loss": -5.431561470031738, "global_step": 24146, "epoch": 574} {"train_loss": -5.383312225341797, "global_step": 24147, "epoch": 574} {"train_loss": -5.36252498626709, "global_step": 24148, "epoch": 574} {"train_loss": -5.386281285967145, "global_step": 24149, "epoch": 574, "val_loss": 65532.015625} {"train_loss": -5.325521469116211, "global_step": 24150, "epoch": 575} {"train_loss": -5.34791898727417, "global_step": 24151, "epoch": 575} {"train_loss": -5.463846206665039, "global_step": 24152, "epoch": 575} {"train_loss": -5.421023368835449, "global_step": 24153, "epoch": 575} {"train_loss": -5.318019866943359, "global_step": 24154, "epoch": 575} {"train_loss": -5.385354042053223, "global_step": 24155, "epoch": 575} {"train_loss": -5.4298577308654785, "global_step": 24156, "epoch": 575} {"train_loss": -5.402667999267578, "global_step": 24157, "epoch": 575} {"train_loss": -5.377154350280762, "global_step": 24158, "epoch": 575} {"train_loss": -5.377192497253418, "global_step": 24159, "epoch": 575} {"train_loss": -5.398326396942139, "global_step": 24160, "epoch": 575} {"train_loss": -5.453342437744141, "global_step": 24161, "epoch": 575} {"train_loss": -5.424571990966797, "global_step": 24162, "epoch": 575} {"train_loss": -5.374279022216797, "global_step": 24163, "epoch": 575} {"train_loss": -5.300844192504883, "global_step": 24164, "epoch": 575} {"train_loss": -5.3159942626953125, "global_step": 24165, "epoch": 575} {"train_loss": -5.391473293304443, "global_step": 24166, "epoch": 575} {"train_loss": -5.373819828033447, "global_step": 24167, "epoch": 575} {"train_loss": -5.308905601501465, "global_step": 24168, "epoch": 575} {"train_loss": -5.426717281341553, "global_step": 24169, "epoch": 575} {"train_loss": -5.395317554473877, "global_step": 24170, "epoch": 575} {"train_loss": -5.466973304748535, "global_step": 24171, "epoch": 575} {"train_loss": -5.3349714279174805, "global_step": 24172, "epoch": 575} {"train_loss": -5.408829689025879, "global_step": 24173, "epoch": 575} {"train_loss": -5.415801525115967, "global_step": 24174, "epoch": 575} {"train_loss": -5.483238220214844, "global_step": 24175, "epoch": 575} {"train_loss": -5.29218864440918, "global_step": 24176, "epoch": 575} {"train_loss": -5.292224407196045, "global_step": 24177, "epoch": 575} {"train_loss": -5.310911178588867, "global_step": 24178, "epoch": 575} {"train_loss": -5.109146595001221, "global_step": 24179, "epoch": 575} {"train_loss": -5.3832855224609375, "global_step": 24180, "epoch": 575} {"train_loss": -5.360937118530273, "global_step": 24181, "epoch": 575} {"train_loss": -5.181614875793457, "global_step": 24182, "epoch": 575} {"train_loss": -5.315774917602539, "global_step": 24183, "epoch": 575} {"train_loss": -5.271917343139648, "global_step": 24184, "epoch": 575} {"train_loss": -5.235655784606934, "global_step": 24185, "epoch": 575} {"train_loss": -5.405642509460449, "global_step": 24186, "epoch": 575} {"train_loss": -5.391380310058594, "global_step": 24187, "epoch": 575} {"train_loss": -5.362654685974121, "global_step": 24188, "epoch": 575} {"train_loss": -5.440003395080566, "global_step": 24189, "epoch": 575} {"train_loss": -5.332244873046875, "global_step": 24190, "epoch": 575} {"train_loss": -5.362380152656918, "global_step": 24191, "epoch": 575, "val_loss": 65687.4296875} {"train_loss": -5.293052673339844, "global_step": 24192, "epoch": 576} {"train_loss": -5.414731979370117, "global_step": 24193, "epoch": 576} {"train_loss": -5.361136436462402, "global_step": 24194, "epoch": 576} {"train_loss": -5.438821792602539, "global_step": 24195, "epoch": 576} {"train_loss": -5.446906089782715, "global_step": 24196, "epoch": 576} {"train_loss": -5.358267307281494, "global_step": 24197, "epoch": 576} {"train_loss": -5.3267598152160645, "global_step": 24198, "epoch": 576} {"train_loss": -5.36391019821167, "global_step": 24199, "epoch": 576} {"train_loss": -5.466239929199219, "global_step": 24200, "epoch": 576} {"train_loss": -5.3712921142578125, "global_step": 24201, "epoch": 576} {"train_loss": -5.470011234283447, "global_step": 24202, "epoch": 576} {"train_loss": -5.273475646972656, "global_step": 24203, "epoch": 576} {"train_loss": -5.467376708984375, "global_step": 24204, "epoch": 576} {"train_loss": -5.29272985458374, "global_step": 24205, "epoch": 576} {"train_loss": -5.460990905761719, "global_step": 24206, "epoch": 576} {"train_loss": -5.50474214553833, "global_step": 24207, "epoch": 576} {"train_loss": -5.495928764343262, "global_step": 24208, "epoch": 576} {"train_loss": -5.375115394592285, "global_step": 24209, "epoch": 576} {"train_loss": -5.287692070007324, "global_step": 24210, "epoch": 576} {"train_loss": -5.408524990081787, "global_step": 24211, "epoch": 576} {"train_loss": -5.346538543701172, "global_step": 24212, "epoch": 576} {"train_loss": -5.280437469482422, "global_step": 24213, "epoch": 576} {"train_loss": -5.279514312744141, "global_step": 24214, "epoch": 576} {"train_loss": -5.426614761352539, "global_step": 24215, "epoch": 576} {"train_loss": -5.261434555053711, "global_step": 24216, "epoch": 576} {"train_loss": -5.312823295593262, "global_step": 24217, "epoch": 576} {"train_loss": -5.332989692687988, "global_step": 24218, "epoch": 576} {"train_loss": -5.469830513000488, "global_step": 24219, "epoch": 576} {"train_loss": -5.370825290679932, "global_step": 24220, "epoch": 576} {"train_loss": -5.3426194190979, "global_step": 24221, "epoch": 576} {"train_loss": -5.407894134521484, "global_step": 24222, "epoch": 576} {"train_loss": -5.386782169342041, "global_step": 24223, "epoch": 576} {"train_loss": -5.331591606140137, "global_step": 24224, "epoch": 576} {"train_loss": -5.233250141143799, "global_step": 24225, "epoch": 576} {"train_loss": -5.377485752105713, "global_step": 24226, "epoch": 576} {"train_loss": -5.370021820068359, "global_step": 24227, "epoch": 576} {"train_loss": -5.328841209411621, "global_step": 24228, "epoch": 576} {"train_loss": -5.381265640258789, "global_step": 24229, "epoch": 576} {"train_loss": -5.217740058898926, "global_step": 24230, "epoch": 576} {"train_loss": -5.475874900817871, "global_step": 24231, "epoch": 576} {"train_loss": -5.446646690368652, "global_step": 24232, "epoch": 576} {"train_loss": -5.370874688738868, "global_step": 24233, "epoch": 576, "val_loss": 65778.859375} {"train_loss": -5.44744873046875, "global_step": 24234, "epoch": 577} {"train_loss": -5.279552936553955, "global_step": 24235, "epoch": 577} {"train_loss": -5.377381324768066, "global_step": 24236, "epoch": 577} {"train_loss": -5.488956451416016, "global_step": 24237, "epoch": 577} {"train_loss": -5.392026901245117, "global_step": 24238, "epoch": 577} {"train_loss": -5.360072135925293, "global_step": 24239, "epoch": 577} {"train_loss": -5.33122444152832, "global_step": 24240, "epoch": 577} {"train_loss": -5.323454856872559, "global_step": 24241, "epoch": 577} {"train_loss": -5.441773414611816, "global_step": 24242, "epoch": 577} {"train_loss": -5.2992048263549805, "global_step": 24243, "epoch": 577} {"train_loss": -5.433485984802246, "global_step": 24244, "epoch": 577} {"train_loss": -5.470627784729004, "global_step": 24245, "epoch": 577} {"train_loss": -5.452790260314941, "global_step": 24246, "epoch": 577} {"train_loss": -5.374849319458008, "global_step": 24247, "epoch": 577} {"train_loss": -5.401557922363281, "global_step": 24248, "epoch": 577} {"train_loss": -5.293668746948242, "global_step": 24249, "epoch": 577} {"train_loss": -5.311567306518555, "global_step": 24250, "epoch": 577} {"train_loss": -5.3116631507873535, "global_step": 24251, "epoch": 577} {"train_loss": -5.4547553062438965, "global_step": 24252, "epoch": 577} {"train_loss": -5.411694049835205, "global_step": 24253, "epoch": 577} {"train_loss": -5.268550395965576, "global_step": 24254, "epoch": 577} {"train_loss": -5.359286308288574, "global_step": 24255, "epoch": 577} {"train_loss": -5.391590118408203, "global_step": 24256, "epoch": 577} {"train_loss": -5.2562150955200195, "global_step": 24257, "epoch": 577} {"train_loss": -5.374616622924805, "global_step": 24258, "epoch": 577} {"train_loss": -5.461970329284668, "global_step": 24259, "epoch": 577} {"train_loss": -5.223940372467041, "global_step": 24260, "epoch": 577} {"train_loss": -5.334436416625977, "global_step": 24261, "epoch": 577} {"train_loss": -5.371166229248047, "global_step": 24262, "epoch": 577} {"train_loss": -5.373956203460693, "global_step": 24263, "epoch": 577} {"train_loss": -5.278395652770996, "global_step": 24264, "epoch": 577} {"train_loss": -5.370347023010254, "global_step": 24265, "epoch": 577} {"train_loss": -5.446621894836426, "global_step": 24266, "epoch": 577} {"train_loss": -5.268476486206055, "global_step": 24267, "epoch": 577} {"train_loss": -5.290378570556641, "global_step": 24268, "epoch": 577} {"train_loss": -5.342231750488281, "global_step": 24269, "epoch": 577} {"train_loss": -5.404717445373535, "global_step": 24270, "epoch": 577} {"train_loss": -5.406294822692871, "global_step": 24271, "epoch": 577} {"train_loss": -5.380616664886475, "global_step": 24272, "epoch": 577} {"train_loss": -5.407642841339111, "global_step": 24273, "epoch": 577} {"train_loss": -5.356112957000732, "global_step": 24274, "epoch": 577} {"train_loss": -5.368422417413621, "global_step": 24275, "epoch": 577, "val_loss": 65690.265625} {"train_loss": -5.405328750610352, "global_step": 24276, "epoch": 578} {"train_loss": -5.3109307289123535, "global_step": 24277, "epoch": 578} {"train_loss": -5.303737163543701, "global_step": 24278, "epoch": 578} {"train_loss": -5.520641326904297, "global_step": 24279, "epoch": 578} {"train_loss": -5.470651626586914, "global_step": 24280, "epoch": 578} {"train_loss": -5.200846195220947, "global_step": 24281, "epoch": 578} {"train_loss": -5.455487251281738, "global_step": 24282, "epoch": 578} {"train_loss": -5.40393590927124, "global_step": 24283, "epoch": 578} {"train_loss": -5.19306755065918, "global_step": 24284, "epoch": 578} {"train_loss": -5.374404430389404, "global_step": 24285, "epoch": 578} {"train_loss": -5.265748977661133, "global_step": 24286, "epoch": 578} {"train_loss": -5.28823709487915, "global_step": 24287, "epoch": 578} {"train_loss": -5.366522789001465, "global_step": 24288, "epoch": 578} {"train_loss": -5.404173851013184, "global_step": 24289, "epoch": 578} {"train_loss": -5.252395153045654, "global_step": 24290, "epoch": 578} {"train_loss": -5.431441307067871, "global_step": 24291, "epoch": 578} {"train_loss": -5.245487213134766, "global_step": 24292, "epoch": 578} {"train_loss": -5.298015594482422, "global_step": 24293, "epoch": 578} {"train_loss": -5.348947048187256, "global_step": 24294, "epoch": 578} {"train_loss": -5.390851974487305, "global_step": 24295, "epoch": 578} {"train_loss": -5.280917644500732, "global_step": 24296, "epoch": 578} {"train_loss": -5.312276363372803, "global_step": 24297, "epoch": 578} {"train_loss": -5.341196060180664, "global_step": 24298, "epoch": 578} {"train_loss": -5.401174068450928, "global_step": 24299, "epoch": 578} {"train_loss": -5.3254289627075195, "global_step": 24300, "epoch": 578} {"train_loss": -5.290397644042969, "global_step": 24301, "epoch": 578} {"train_loss": -5.239258289337158, "global_step": 24302, "epoch": 578} {"train_loss": -5.44752311706543, "global_step": 24303, "epoch": 578} {"train_loss": -5.131189346313477, "global_step": 24304, "epoch": 578} {"train_loss": -5.221175193786621, "global_step": 24305, "epoch": 578} {"train_loss": -5.429959297180176, "global_step": 24306, "epoch": 578} {"train_loss": -5.2532958984375, "global_step": 24307, "epoch": 578} {"train_loss": -5.215141773223877, "global_step": 24308, "epoch": 578} {"train_loss": -5.286009788513184, "global_step": 24309, "epoch": 578} {"train_loss": -5.302618980407715, "global_step": 24310, "epoch": 578} {"train_loss": -5.269820213317871, "global_step": 24311, "epoch": 578} {"train_loss": -5.241516590118408, "global_step": 24312, "epoch": 578} {"train_loss": -5.268439292907715, "global_step": 24313, "epoch": 578} {"train_loss": -5.306028366088867, "global_step": 24314, "epoch": 578} {"train_loss": -5.374994277954102, "global_step": 24315, "epoch": 578} {"train_loss": -5.222862243652344, "global_step": 24316, "epoch": 578} {"train_loss": -5.3172285216195245, "global_step": 24317, "epoch": 578, "val_loss": 66070.3515625} {"train_loss": -5.355518341064453, "global_step": 24318, "epoch": 579} {"train_loss": -5.43377685546875, "global_step": 24319, "epoch": 579} {"train_loss": -5.329475402832031, "global_step": 24320, "epoch": 579} {"train_loss": -5.414355278015137, "global_step": 24321, "epoch": 579} {"train_loss": -5.456869125366211, "global_step": 24322, "epoch": 579} {"train_loss": -5.4362077713012695, "global_step": 24323, "epoch": 579} {"train_loss": -5.321107864379883, "global_step": 24324, "epoch": 579} {"train_loss": -5.280462741851807, "global_step": 24325, "epoch": 579} {"train_loss": -5.382840156555176, "global_step": 24326, "epoch": 579} {"train_loss": -5.42326545715332, "global_step": 24327, "epoch": 579} {"train_loss": -5.3958845138549805, "global_step": 24328, "epoch": 579} {"train_loss": -5.459672451019287, "global_step": 24329, "epoch": 579} {"train_loss": -5.251214981079102, "global_step": 24330, "epoch": 579} {"train_loss": -5.316612243652344, "global_step": 24331, "epoch": 579} {"train_loss": -5.231288909912109, "global_step": 24332, "epoch": 579} {"train_loss": -5.302498817443848, "global_step": 24333, "epoch": 579} {"train_loss": -5.333817005157471, "global_step": 24334, "epoch": 579} {"train_loss": -5.279900074005127, "global_step": 24335, "epoch": 579} {"train_loss": -5.355433464050293, "global_step": 24336, "epoch": 579} {"train_loss": -5.201257705688477, "global_step": 24337, "epoch": 579} {"train_loss": -5.233614921569824, "global_step": 24338, "epoch": 579} {"train_loss": -5.4527387619018555, "global_step": 24339, "epoch": 579} {"train_loss": -5.469413757324219, "global_step": 24340, "epoch": 579} {"train_loss": -5.334700107574463, "global_step": 24341, "epoch": 579} {"train_loss": -5.461655139923096, "global_step": 24342, "epoch": 579} {"train_loss": -5.416467666625977, "global_step": 24343, "epoch": 579} {"train_loss": -5.46807861328125, "global_step": 24344, "epoch": 579} {"train_loss": -5.303125381469727, "global_step": 24345, "epoch": 579} {"train_loss": -5.246858596801758, "global_step": 24346, "epoch": 579} {"train_loss": -5.227242469787598, "global_step": 24347, "epoch": 579} {"train_loss": -5.357407569885254, "global_step": 24348, "epoch": 579} {"train_loss": -5.278708457946777, "global_step": 24349, "epoch": 579} {"train_loss": -5.244430065155029, "global_step": 24350, "epoch": 579} {"train_loss": -5.358344078063965, "global_step": 24351, "epoch": 579} {"train_loss": -5.327658653259277, "global_step": 24352, "epoch": 579} {"train_loss": -5.372647285461426, "global_step": 24353, "epoch": 579} {"train_loss": -5.314698219299316, "global_step": 24354, "epoch": 579} {"train_loss": -5.459685325622559, "global_step": 24355, "epoch": 579} {"train_loss": -5.409126281738281, "global_step": 24356, "epoch": 579} {"train_loss": -5.384025573730469, "global_step": 24357, "epoch": 579} {"train_loss": -5.216186046600342, "global_step": 24358, "epoch": 579} {"train_loss": -5.3486705507550925, "global_step": 24359, "epoch": 579, "val_loss": 65459.39453125} {"train_loss": -5.32004451751709, "global_step": 24360, "epoch": 580} {"train_loss": -5.3228960037231445, "global_step": 24361, "epoch": 580} {"train_loss": -5.371535301208496, "global_step": 24362, "epoch": 580} {"train_loss": -5.306416034698486, "global_step": 24363, "epoch": 580} {"train_loss": -5.3634514808654785, "global_step": 24364, "epoch": 580} {"train_loss": -5.360926151275635, "global_step": 24365, "epoch": 580} {"train_loss": -5.296554088592529, "global_step": 24366, "epoch": 580} {"train_loss": -5.435912132263184, "global_step": 24367, "epoch": 580} {"train_loss": -5.273711204528809, "global_step": 24368, "epoch": 580} {"train_loss": -5.293865203857422, "global_step": 24369, "epoch": 580} {"train_loss": -5.401558876037598, "global_step": 24370, "epoch": 580} {"train_loss": -5.397089004516602, "global_step": 24371, "epoch": 580} {"train_loss": -5.307875633239746, "global_step": 24372, "epoch": 580} {"train_loss": -5.3425493240356445, "global_step": 24373, "epoch": 580} {"train_loss": -5.4029459953308105, "global_step": 24374, "epoch": 580} {"train_loss": -5.44392204284668, "global_step": 24375, "epoch": 580} {"train_loss": -5.438993453979492, "global_step": 24376, "epoch": 580} {"train_loss": -5.420904636383057, "global_step": 24377, "epoch": 580} {"train_loss": -5.35934591293335, "global_step": 24378, "epoch": 580} {"train_loss": -5.455662250518799, "global_step": 24379, "epoch": 580} {"train_loss": -5.334836959838867, "global_step": 24380, "epoch": 580} {"train_loss": -5.283839225769043, "global_step": 24381, "epoch": 580} {"train_loss": -5.340302467346191, "global_step": 24382, "epoch": 580} {"train_loss": -5.465710639953613, "global_step": 24383, "epoch": 580} {"train_loss": -5.241273880004883, "global_step": 24384, "epoch": 580} {"train_loss": -5.201974868774414, "global_step": 24385, "epoch": 580} {"train_loss": -5.39712381362915, "global_step": 24386, "epoch": 580} {"train_loss": -5.37151575088501, "global_step": 24387, "epoch": 580} {"train_loss": -5.363128662109375, "global_step": 24388, "epoch": 580} {"train_loss": -5.357298851013184, "global_step": 24389, "epoch": 580} {"train_loss": -5.382864952087402, "global_step": 24390, "epoch": 580} {"train_loss": -5.311827182769775, "global_step": 24391, "epoch": 580} {"train_loss": -5.357037544250488, "global_step": 24392, "epoch": 580} {"train_loss": -5.466313362121582, "global_step": 24393, "epoch": 580} {"train_loss": -5.394631385803223, "global_step": 24394, "epoch": 580} {"train_loss": -5.531240463256836, "global_step": 24395, "epoch": 580} {"train_loss": -5.403611183166504, "global_step": 24396, "epoch": 580} {"train_loss": -5.333805561065674, "global_step": 24397, "epoch": 580} {"train_loss": -5.338216781616211, "global_step": 24398, "epoch": 580} {"train_loss": -5.484902858734131, "global_step": 24399, "epoch": 580} {"train_loss": -5.302380561828613, "global_step": 24400, "epoch": 580} {"train_loss": -5.367697238922119, "global_step": 24401, "epoch": 580, "val_loss": 65600.15625} {"train_loss": -5.284537315368652, "global_step": 24402, "epoch": 581} {"train_loss": -5.215484619140625, "global_step": 24403, "epoch": 581} {"train_loss": -5.428318023681641, "global_step": 24404, "epoch": 581} {"train_loss": -5.377324104309082, "global_step": 24405, "epoch": 581} {"train_loss": -5.402009963989258, "global_step": 24406, "epoch": 581} {"train_loss": -5.3630523681640625, "global_step": 24407, "epoch": 581} {"train_loss": -5.451240062713623, "global_step": 24408, "epoch": 581} {"train_loss": -5.339646339416504, "global_step": 24409, "epoch": 581} {"train_loss": -5.440185070037842, "global_step": 24410, "epoch": 581} {"train_loss": -5.437549114227295, "global_step": 24411, "epoch": 581} {"train_loss": -5.255431175231934, "global_step": 24412, "epoch": 581} {"train_loss": -5.523460388183594, "global_step": 24413, "epoch": 581} {"train_loss": -5.233526229858398, "global_step": 24414, "epoch": 581} {"train_loss": -5.383222579956055, "global_step": 24415, "epoch": 581} {"train_loss": -5.4738383293151855, "global_step": 24416, "epoch": 581} {"train_loss": -5.4315290451049805, "global_step": 24417, "epoch": 581} {"train_loss": -5.43819522857666, "global_step": 24418, "epoch": 581} {"train_loss": -5.560437202453613, "global_step": 24419, "epoch": 581} {"train_loss": -5.292078018188477, "global_step": 24420, "epoch": 581} {"train_loss": -5.455794334411621, "global_step": 24421, "epoch": 581} {"train_loss": -5.442903518676758, "global_step": 24422, "epoch": 581} {"train_loss": -5.380090236663818, "global_step": 24423, "epoch": 581} {"train_loss": -5.4645891189575195, "global_step": 24424, "epoch": 581} {"train_loss": -5.424560546875, "global_step": 24425, "epoch": 581} {"train_loss": -5.342101097106934, "global_step": 24426, "epoch": 581} {"train_loss": -5.2817463874816895, "global_step": 24427, "epoch": 581} {"train_loss": -5.436801910400391, "global_step": 24428, "epoch": 581} {"train_loss": -5.548151969909668, "global_step": 24429, "epoch": 581} {"train_loss": -5.276808261871338, "global_step": 24430, "epoch": 581} {"train_loss": -5.422789096832275, "global_step": 24431, "epoch": 581} {"train_loss": -5.386078834533691, "global_step": 24432, "epoch": 581} {"train_loss": -5.268919467926025, "global_step": 24433, "epoch": 581} {"train_loss": -5.39184045791626, "global_step": 24434, "epoch": 581} {"train_loss": -5.326129913330078, "global_step": 24435, "epoch": 581} {"train_loss": -5.372163772583008, "global_step": 24436, "epoch": 581} {"train_loss": -5.368030071258545, "global_step": 24437, "epoch": 581} {"train_loss": -5.277793884277344, "global_step": 24438, "epoch": 581} {"train_loss": -5.385682582855225, "global_step": 24439, "epoch": 581} {"train_loss": -5.424088954925537, "global_step": 24440, "epoch": 581} {"train_loss": -5.30012321472168, "global_step": 24441, "epoch": 581} {"train_loss": -5.339988708496094, "global_step": 24442, "epoch": 581} {"train_loss": -5.381187200546265, "global_step": 24443, "epoch": 581, "val_loss": 65551.28125} {"train_loss": -5.322730541229248, "global_step": 24444, "epoch": 582} {"train_loss": -5.305480003356934, "global_step": 24445, "epoch": 582} {"train_loss": -5.290329456329346, "global_step": 24446, "epoch": 582} {"train_loss": -5.291647911071777, "global_step": 24447, "epoch": 582} {"train_loss": -5.455275535583496, "global_step": 24448, "epoch": 582} {"train_loss": -5.4931182861328125, "global_step": 24449, "epoch": 582} {"train_loss": -5.407919883728027, "global_step": 24450, "epoch": 582} {"train_loss": -5.442912578582764, "global_step": 24451, "epoch": 582} {"train_loss": -5.466578483581543, "global_step": 24452, "epoch": 582} {"train_loss": -5.246119976043701, "global_step": 24453, "epoch": 582} {"train_loss": -5.448909759521484, "global_step": 24454, "epoch": 582} {"train_loss": -5.473575115203857, "global_step": 24455, "epoch": 582} {"train_loss": -5.255693435668945, "global_step": 24456, "epoch": 582} {"train_loss": -5.3750152587890625, "global_step": 24457, "epoch": 582} {"train_loss": -5.28568172454834, "global_step": 24458, "epoch": 582} {"train_loss": -5.452261924743652, "global_step": 24459, "epoch": 582} {"train_loss": -5.394516944885254, "global_step": 24460, "epoch": 582} {"train_loss": -5.399471282958984, "global_step": 24461, "epoch": 582} {"train_loss": -5.341000556945801, "global_step": 24462, "epoch": 582} {"train_loss": -5.434445858001709, "global_step": 24463, "epoch": 582} {"train_loss": -5.30376672744751, "global_step": 24464, "epoch": 582} {"train_loss": -5.385618209838867, "global_step": 24465, "epoch": 582} {"train_loss": -5.398151397705078, "global_step": 24466, "epoch": 582} {"train_loss": -5.229565620422363, "global_step": 24467, "epoch": 582} {"train_loss": -5.3708319664001465, "global_step": 24468, "epoch": 582} {"train_loss": -5.286593437194824, "global_step": 24469, "epoch": 582} {"train_loss": -5.3266825675964355, "global_step": 24470, "epoch": 582} {"train_loss": -5.301764011383057, "global_step": 24471, "epoch": 582} {"train_loss": -5.303321838378906, "global_step": 24472, "epoch": 582} {"train_loss": -5.357080459594727, "global_step": 24473, "epoch": 582} {"train_loss": -5.388227462768555, "global_step": 24474, "epoch": 582} {"train_loss": -5.228476524353027, "global_step": 24475, "epoch": 582} {"train_loss": -5.467225074768066, "global_step": 24476, "epoch": 582} {"train_loss": -5.2764058113098145, "global_step": 24477, "epoch": 582} {"train_loss": -5.487764358520508, "global_step": 24478, "epoch": 582} {"train_loss": -5.3257036209106445, "global_step": 24479, "epoch": 582} {"train_loss": -5.305723190307617, "global_step": 24480, "epoch": 582} {"train_loss": -5.35984468460083, "global_step": 24481, "epoch": 582} {"train_loss": -5.288937568664551, "global_step": 24482, "epoch": 582} {"train_loss": -5.356891632080078, "global_step": 24483, "epoch": 582} {"train_loss": -5.500011444091797, "global_step": 24484, "epoch": 582} {"train_loss": -5.361239228929792, "global_step": 24485, "epoch": 582, "val_loss": 65712.4453125} {"train_loss": -5.2232561111450195, "global_step": 24486, "epoch": 583} {"train_loss": -5.425937652587891, "global_step": 24487, "epoch": 583} {"train_loss": -5.212387561798096, "global_step": 24488, "epoch": 583} {"train_loss": -5.421655654907227, "global_step": 24489, "epoch": 583} {"train_loss": -5.313416481018066, "global_step": 24490, "epoch": 583} {"train_loss": -5.327692031860352, "global_step": 24491, "epoch": 583} {"train_loss": -5.353584289550781, "global_step": 24492, "epoch": 583} {"train_loss": -5.2740020751953125, "global_step": 24493, "epoch": 583} {"train_loss": -5.323638916015625, "global_step": 24494, "epoch": 583} {"train_loss": -5.438379764556885, "global_step": 24495, "epoch": 583} {"train_loss": -5.267332553863525, "global_step": 24496, "epoch": 583} {"train_loss": -5.2523603439331055, "global_step": 24497, "epoch": 583} {"train_loss": -5.196615219116211, "global_step": 24498, "epoch": 583} {"train_loss": -5.427742004394531, "global_step": 24499, "epoch": 583} {"train_loss": -5.387434482574463, "global_step": 24500, "epoch": 583} {"train_loss": -5.3856635093688965, "global_step": 24501, "epoch": 583} {"train_loss": -5.463674545288086, "global_step": 24502, "epoch": 583} {"train_loss": -5.399613380432129, "global_step": 24503, "epoch": 583} {"train_loss": -5.315851211547852, "global_step": 24504, "epoch": 583} {"train_loss": -5.423973083496094, "global_step": 24505, "epoch": 583} {"train_loss": -5.376462936401367, "global_step": 24506, "epoch": 583} {"train_loss": -5.058351993560791, "global_step": 24507, "epoch": 583} {"train_loss": -5.357572555541992, "global_step": 24508, "epoch": 583} {"train_loss": -5.3433146476745605, "global_step": 24509, "epoch": 583} {"train_loss": -5.423900127410889, "global_step": 24510, "epoch": 583} {"train_loss": -5.295130729675293, "global_step": 24511, "epoch": 583} {"train_loss": -5.2959489822387695, "global_step": 24512, "epoch": 583} {"train_loss": -5.343445301055908, "global_step": 24513, "epoch": 583} {"train_loss": -5.378098964691162, "global_step": 24514, "epoch": 583} {"train_loss": -5.440210342407227, "global_step": 24515, "epoch": 583} {"train_loss": -5.398376941680908, "global_step": 24516, "epoch": 583} {"train_loss": -5.4712934494018555, "global_step": 24517, "epoch": 583} {"train_loss": -5.537824630737305, "global_step": 24518, "epoch": 583} {"train_loss": -5.281065464019775, "global_step": 24519, "epoch": 583} {"train_loss": -5.4645538330078125, "global_step": 24520, "epoch": 583} {"train_loss": -5.35571813583374, "global_step": 24521, "epoch": 583} {"train_loss": -5.2899017333984375, "global_step": 24522, "epoch": 583} {"train_loss": -5.348484039306641, "global_step": 24523, "epoch": 583} {"train_loss": -5.309004306793213, "global_step": 24524, "epoch": 583} {"train_loss": -5.379754066467285, "global_step": 24525, "epoch": 583} {"train_loss": -5.360396385192871, "global_step": 24526, "epoch": 583} {"train_loss": -5.35128649075826, "global_step": 24527, "epoch": 583, "val_loss": 65595.453125} {"train_loss": -5.282311916351318, "global_step": 24528, "epoch": 584} {"train_loss": -5.3884172439575195, "global_step": 24529, "epoch": 584} {"train_loss": -5.354870319366455, "global_step": 24530, "epoch": 584} {"train_loss": -5.3038177490234375, "global_step": 24531, "epoch": 584} {"train_loss": -5.306161403656006, "global_step": 24532, "epoch": 584} {"train_loss": -5.468230247497559, "global_step": 24533, "epoch": 584} {"train_loss": -5.556187629699707, "global_step": 24534, "epoch": 584} {"train_loss": -5.34953498840332, "global_step": 24535, "epoch": 584} {"train_loss": -5.3920464515686035, "global_step": 24536, "epoch": 584} {"train_loss": -5.316831588745117, "global_step": 24537, "epoch": 584} {"train_loss": -5.3941450119018555, "global_step": 24538, "epoch": 584} {"train_loss": -5.382462501525879, "global_step": 24539, "epoch": 584} {"train_loss": -5.454109191894531, "global_step": 24540, "epoch": 584} {"train_loss": -5.3403639793396, "global_step": 24541, "epoch": 584} {"train_loss": -5.2945051193237305, "global_step": 24542, "epoch": 584} {"train_loss": -5.335330009460449, "global_step": 24543, "epoch": 584} {"train_loss": -5.438362121582031, "global_step": 24544, "epoch": 584} {"train_loss": -5.5520830154418945, "global_step": 24545, "epoch": 584} {"train_loss": -5.314591407775879, "global_step": 24546, "epoch": 584} {"train_loss": -5.413420677185059, "global_step": 24547, "epoch": 584} {"train_loss": -5.395191669464111, "global_step": 24548, "epoch": 584} {"train_loss": -5.462535381317139, "global_step": 24549, "epoch": 584} {"train_loss": -5.491415977478027, "global_step": 24550, "epoch": 584} {"train_loss": -5.197576522827148, "global_step": 24551, "epoch": 584} {"train_loss": -5.27891731262207, "global_step": 24552, "epoch": 584} {"train_loss": -5.34465217590332, "global_step": 24553, "epoch": 584} {"train_loss": -5.307268142700195, "global_step": 24554, "epoch": 584} {"train_loss": -5.335039138793945, "global_step": 24555, "epoch": 584} {"train_loss": -5.368387222290039, "global_step": 24556, "epoch": 584} {"train_loss": -5.4257121086120605, "global_step": 24557, "epoch": 584} {"train_loss": -5.4439897537231445, "global_step": 24558, "epoch": 584} {"train_loss": -5.312044143676758, "global_step": 24559, "epoch": 584} {"train_loss": -5.327790260314941, "global_step": 24560, "epoch": 584} {"train_loss": -5.422918319702148, "global_step": 24561, "epoch": 584} {"train_loss": -5.319115161895752, "global_step": 24562, "epoch": 584} {"train_loss": -5.341091632843018, "global_step": 24563, "epoch": 584} {"train_loss": -5.27170467376709, "global_step": 24564, "epoch": 584} {"train_loss": -5.361075401306152, "global_step": 24565, "epoch": 584} {"train_loss": -5.247792720794678, "global_step": 24566, "epoch": 584} {"train_loss": -5.426447868347168, "global_step": 24567, "epoch": 584} {"train_loss": -5.349218845367432, "global_step": 24568, "epoch": 584} {"train_loss": -5.37040680930728, "global_step": 24569, "epoch": 584, "val_loss": 65520.2109375} {"train_loss": -5.511300563812256, "global_step": 24570, "epoch": 585} {"train_loss": -5.291689395904541, "global_step": 24571, "epoch": 585} {"train_loss": -5.313105583190918, "global_step": 24572, "epoch": 585} {"train_loss": -5.441865921020508, "global_step": 24573, "epoch": 585} {"train_loss": -5.508279800415039, "global_step": 24574, "epoch": 585} {"train_loss": -5.333085536956787, "global_step": 24575, "epoch": 585} {"train_loss": -5.4917731285095215, "global_step": 24576, "epoch": 585} {"train_loss": -5.271878719329834, "global_step": 24577, "epoch": 585} {"train_loss": -5.542876243591309, "global_step": 24578, "epoch": 585} {"train_loss": -5.240395545959473, "global_step": 24579, "epoch": 585} {"train_loss": -5.313074111938477, "global_step": 24580, "epoch": 585} {"train_loss": -5.408923149108887, "global_step": 24581, "epoch": 585} {"train_loss": -5.338205814361572, "global_step": 24582, "epoch": 585} {"train_loss": -5.229376316070557, "global_step": 24583, "epoch": 585} {"train_loss": -5.534731864929199, "global_step": 24584, "epoch": 585} {"train_loss": -5.410959243774414, "global_step": 24585, "epoch": 585} {"train_loss": -5.2053914070129395, "global_step": 24586, "epoch": 585} {"train_loss": -5.427254676818848, "global_step": 24587, "epoch": 585} {"train_loss": -5.254515647888184, "global_step": 24588, "epoch": 585} {"train_loss": -5.278955459594727, "global_step": 24589, "epoch": 585} {"train_loss": -5.444348335266113, "global_step": 24590, "epoch": 585} {"train_loss": -5.24334716796875, "global_step": 24591, "epoch": 585} {"train_loss": -5.328962802886963, "global_step": 24592, "epoch": 585} {"train_loss": -5.340239524841309, "global_step": 24593, "epoch": 585} {"train_loss": -5.239737510681152, "global_step": 24594, "epoch": 585} {"train_loss": -5.414206504821777, "global_step": 24595, "epoch": 585} {"train_loss": -5.358419418334961, "global_step": 24596, "epoch": 585} {"train_loss": -5.444565296173096, "global_step": 24597, "epoch": 585} {"train_loss": -5.477494239807129, "global_step": 24598, "epoch": 585} {"train_loss": -5.3900980949401855, "global_step": 24599, "epoch": 585} {"train_loss": -5.279045104980469, "global_step": 24600, "epoch": 585} {"train_loss": -5.308241844177246, "global_step": 24601, "epoch": 585} {"train_loss": -5.270517349243164, "global_step": 24602, "epoch": 585} {"train_loss": -5.368508338928223, "global_step": 24603, "epoch": 585} {"train_loss": -5.387935638427734, "global_step": 24604, "epoch": 585} {"train_loss": -5.355633735656738, "global_step": 24605, "epoch": 585} {"train_loss": -5.2906389236450195, "global_step": 24606, "epoch": 585} {"train_loss": -5.296961784362793, "global_step": 24607, "epoch": 585} {"train_loss": -5.432041168212891, "global_step": 24608, "epoch": 585} {"train_loss": -5.357242584228516, "global_step": 24609, "epoch": 585} {"train_loss": -5.320755481719971, "global_step": 24610, "epoch": 585} {"train_loss": -5.356902894519624, "global_step": 24611, "epoch": 585, "val_loss": 65118.8828125} {"train_loss": -5.317074775695801, "global_step": 24612, "epoch": 586} {"train_loss": -5.457675457000732, "global_step": 24613, "epoch": 586} {"train_loss": -5.367404460906982, "global_step": 24614, "epoch": 586} {"train_loss": -5.450371742248535, "global_step": 24615, "epoch": 586} {"train_loss": -5.4047722816467285, "global_step": 24616, "epoch": 586} {"train_loss": -5.443243026733398, "global_step": 24617, "epoch": 586} {"train_loss": -5.3238983154296875, "global_step": 24618, "epoch": 586} {"train_loss": -5.362985134124756, "global_step": 24619, "epoch": 586} {"train_loss": -5.3832855224609375, "global_step": 24620, "epoch": 586} {"train_loss": -5.419325828552246, "global_step": 24621, "epoch": 586} {"train_loss": -5.310554504394531, "global_step": 24622, "epoch": 586} {"train_loss": -5.369130611419678, "global_step": 24623, "epoch": 586} {"train_loss": -5.460171699523926, "global_step": 24624, "epoch": 586} {"train_loss": -5.3057379722595215, "global_step": 24625, "epoch": 586} {"train_loss": -5.439899921417236, "global_step": 24626, "epoch": 586} {"train_loss": -5.311140060424805, "global_step": 24627, "epoch": 586} {"train_loss": -5.45078706741333, "global_step": 24628, "epoch": 586} {"train_loss": -5.431612014770508, "global_step": 24629, "epoch": 586} {"train_loss": -5.525811195373535, "global_step": 24630, "epoch": 586} {"train_loss": -5.366498947143555, "global_step": 24631, "epoch": 586} {"train_loss": -5.42118501663208, "global_step": 24632, "epoch": 586} {"train_loss": -5.329801559448242, "global_step": 24633, "epoch": 586} {"train_loss": -5.444222450256348, "global_step": 24634, "epoch": 586} {"train_loss": -5.3867902755737305, "global_step": 24635, "epoch": 586} {"train_loss": -5.373069763183594, "global_step": 24636, "epoch": 586} {"train_loss": -5.551677703857422, "global_step": 24637, "epoch": 586} {"train_loss": -5.363075256347656, "global_step": 24638, "epoch": 586} {"train_loss": -5.395684719085693, "global_step": 24639, "epoch": 586} {"train_loss": -5.333925247192383, "global_step": 24640, "epoch": 586} {"train_loss": -5.335371971130371, "global_step": 24641, "epoch": 586} {"train_loss": -5.351456642150879, "global_step": 24642, "epoch": 586} {"train_loss": -5.43325138092041, "global_step": 24643, "epoch": 586} {"train_loss": -5.440638065338135, "global_step": 24644, "epoch": 586} {"train_loss": -5.403766632080078, "global_step": 24645, "epoch": 586} {"train_loss": -5.307498931884766, "global_step": 24646, "epoch": 586} {"train_loss": -5.387112140655518, "global_step": 24647, "epoch": 586} {"train_loss": -5.354758262634277, "global_step": 24648, "epoch": 586} {"train_loss": -5.577885150909424, "global_step": 24649, "epoch": 586} {"train_loss": -5.388856887817383, "global_step": 24650, "epoch": 586} {"train_loss": -5.510072231292725, "global_step": 24651, "epoch": 586} {"train_loss": -5.360172748565674, "global_step": 24652, "epoch": 586} {"train_loss": -5.39923003741673, "global_step": 24653, "epoch": 586, "val_loss": 65814.8203125} {"train_loss": -5.34005069732666, "global_step": 24654, "epoch": 587} {"train_loss": -5.48173189163208, "global_step": 24655, "epoch": 587} {"train_loss": -5.427910327911377, "global_step": 24656, "epoch": 587} {"train_loss": -5.455633163452148, "global_step": 24657, "epoch": 587} {"train_loss": -5.394230842590332, "global_step": 24658, "epoch": 587} {"train_loss": -5.335888862609863, "global_step": 24659, "epoch": 587} {"train_loss": -5.408641815185547, "global_step": 24660, "epoch": 587} {"train_loss": -5.37988805770874, "global_step": 24661, "epoch": 587} {"train_loss": -5.145003318786621, "global_step": 24662, "epoch": 587} {"train_loss": -5.383183479309082, "global_step": 24663, "epoch": 587} {"train_loss": -5.378561496734619, "global_step": 24664, "epoch": 587} {"train_loss": -5.177422523498535, "global_step": 24665, "epoch": 587} {"train_loss": -5.38771390914917, "global_step": 24666, "epoch": 587} {"train_loss": -5.463127136230469, "global_step": 24667, "epoch": 587} {"train_loss": -5.153017997741699, "global_step": 24668, "epoch": 587} {"train_loss": -5.305891513824463, "global_step": 24669, "epoch": 587} {"train_loss": -5.516707897186279, "global_step": 24670, "epoch": 587} {"train_loss": -5.122172832489014, "global_step": 24671, "epoch": 587} {"train_loss": -5.2849650382995605, "global_step": 24672, "epoch": 587} {"train_loss": -5.342959403991699, "global_step": 24673, "epoch": 587} {"train_loss": -5.312150955200195, "global_step": 24674, "epoch": 587} {"train_loss": -5.370766639709473, "global_step": 24675, "epoch": 587} {"train_loss": -5.603763580322266, "global_step": 24676, "epoch": 587} {"train_loss": -5.424138069152832, "global_step": 24677, "epoch": 587} {"train_loss": -5.460938453674316, "global_step": 24678, "epoch": 587} {"train_loss": -5.348967552185059, "global_step": 24679, "epoch": 587} {"train_loss": -5.339371681213379, "global_step": 24680, "epoch": 587} {"train_loss": -5.491615295410156, "global_step": 24681, "epoch": 587} {"train_loss": -5.285754203796387, "global_step": 24682, "epoch": 587} {"train_loss": -5.381886959075928, "global_step": 24683, "epoch": 587} {"train_loss": -5.323564529418945, "global_step": 24684, "epoch": 587} {"train_loss": -5.325921058654785, "global_step": 24685, "epoch": 587} {"train_loss": -5.438776016235352, "global_step": 24686, "epoch": 587} {"train_loss": -5.4877119064331055, "global_step": 24687, "epoch": 587} {"train_loss": -5.347474098205566, "global_step": 24688, "epoch": 587} {"train_loss": -5.432672500610352, "global_step": 24689, "epoch": 587} {"train_loss": -5.43610143661499, "global_step": 24690, "epoch": 587} {"train_loss": -5.331818580627441, "global_step": 24691, "epoch": 587} {"train_loss": -5.439120769500732, "global_step": 24692, "epoch": 587} {"train_loss": -5.490292549133301, "global_step": 24693, "epoch": 587} {"train_loss": -5.323237419128418, "global_step": 24694, "epoch": 587} {"train_loss": -5.373118661698841, "global_step": 24695, "epoch": 587, "val_loss": 65126.13671875} {"train_loss": -5.337589263916016, "global_step": 24696, "epoch": 588} {"train_loss": -5.443450927734375, "global_step": 24697, "epoch": 588} {"train_loss": -5.359559059143066, "global_step": 24698, "epoch": 588} {"train_loss": -5.243136405944824, "global_step": 24699, "epoch": 588} {"train_loss": -5.375550746917725, "global_step": 24700, "epoch": 588} {"train_loss": -5.382773399353027, "global_step": 24701, "epoch": 588} {"train_loss": -5.304485321044922, "global_step": 24702, "epoch": 588} {"train_loss": -5.425233840942383, "global_step": 24703, "epoch": 588} {"train_loss": -5.404857635498047, "global_step": 24704, "epoch": 588} {"train_loss": -5.392608165740967, "global_step": 24705, "epoch": 588} {"train_loss": -5.460586071014404, "global_step": 24706, "epoch": 588} {"train_loss": -5.390021324157715, "global_step": 24707, "epoch": 588} {"train_loss": -5.392669677734375, "global_step": 24708, "epoch": 588} {"train_loss": -5.372766494750977, "global_step": 24709, "epoch": 588} {"train_loss": -5.292172431945801, "global_step": 24710, "epoch": 588} {"train_loss": -5.470228672027588, "global_step": 24711, "epoch": 588} {"train_loss": -5.281519889831543, "global_step": 24712, "epoch": 588} {"train_loss": -5.284859657287598, "global_step": 24713, "epoch": 588} {"train_loss": -5.360726833343506, "global_step": 24714, "epoch": 588} {"train_loss": -5.397744655609131, "global_step": 24715, "epoch": 588} {"train_loss": -5.36867618560791, "global_step": 24716, "epoch": 588} {"train_loss": -5.334741592407227, "global_step": 24717, "epoch": 588} {"train_loss": -5.371567249298096, "global_step": 24718, "epoch": 588} {"train_loss": -5.352168560028076, "global_step": 24719, "epoch": 588} {"train_loss": -5.411767959594727, "global_step": 24720, "epoch": 588} {"train_loss": -5.273571014404297, "global_step": 24721, "epoch": 588} {"train_loss": -5.450230598449707, "global_step": 24722, "epoch": 588} {"train_loss": -5.262375831604004, "global_step": 24723, "epoch": 588} {"train_loss": -5.459163665771484, "global_step": 24724, "epoch": 588} {"train_loss": -5.493618488311768, "global_step": 24725, "epoch": 588} {"train_loss": -5.490009307861328, "global_step": 24726, "epoch": 588} {"train_loss": -5.357939720153809, "global_step": 24727, "epoch": 588} {"train_loss": -5.416266441345215, "global_step": 24728, "epoch": 588} {"train_loss": -5.445477485656738, "global_step": 24729, "epoch": 588} {"train_loss": -5.4644551277160645, "global_step": 24730, "epoch": 588} {"train_loss": -5.396491527557373, "global_step": 24731, "epoch": 588} {"train_loss": -5.393157958984375, "global_step": 24732, "epoch": 588} {"train_loss": -5.575107574462891, "global_step": 24733, "epoch": 588} {"train_loss": -5.476127624511719, "global_step": 24734, "epoch": 588} {"train_loss": -5.4362030029296875, "global_step": 24735, "epoch": 588} {"train_loss": -5.379131317138672, "global_step": 24736, "epoch": 588} {"train_loss": -5.3910939920516245, "global_step": 24737, "epoch": 588, "val_loss": 65619.234375} {"train_loss": -5.363638401031494, "global_step": 24738, "epoch": 589} {"train_loss": -5.4064860343933105, "global_step": 24739, "epoch": 589} {"train_loss": -5.309268474578857, "global_step": 24740, "epoch": 589} {"train_loss": -5.4573493003845215, "global_step": 24741, "epoch": 589} {"train_loss": -5.240069389343262, "global_step": 24742, "epoch": 589} {"train_loss": -5.433595657348633, "global_step": 24743, "epoch": 589} {"train_loss": -5.22657585144043, "global_step": 24744, "epoch": 589} {"train_loss": -5.276777744293213, "global_step": 24745, "epoch": 589} {"train_loss": -5.4192728996276855, "global_step": 24746, "epoch": 589} {"train_loss": -5.4102582931518555, "global_step": 24747, "epoch": 589} {"train_loss": -5.264562606811523, "global_step": 24748, "epoch": 589} {"train_loss": -5.442527770996094, "global_step": 24749, "epoch": 589} {"train_loss": -5.369534492492676, "global_step": 24750, "epoch": 589} {"train_loss": -5.264364719390869, "global_step": 24751, "epoch": 589} {"train_loss": -5.338635444641113, "global_step": 24752, "epoch": 589} {"train_loss": -5.3918328285217285, "global_step": 24753, "epoch": 589} {"train_loss": -5.270650863647461, "global_step": 24754, "epoch": 589} {"train_loss": -5.302420139312744, "global_step": 24755, "epoch": 589} {"train_loss": -5.416712760925293, "global_step": 24756, "epoch": 589} {"train_loss": -5.493352890014648, "global_step": 24757, "epoch": 589} {"train_loss": -5.3966875076293945, "global_step": 24758, "epoch": 589} {"train_loss": -5.454096794128418, "global_step": 24759, "epoch": 589} {"train_loss": -5.279228210449219, "global_step": 24760, "epoch": 589} {"train_loss": -5.275085926055908, "global_step": 24761, "epoch": 589} {"train_loss": -5.420082092285156, "global_step": 24762, "epoch": 589} {"train_loss": -5.303432464599609, "global_step": 24763, "epoch": 589} {"train_loss": -5.426307678222656, "global_step": 24764, "epoch": 589} {"train_loss": -5.421550750732422, "global_step": 24765, "epoch": 589} {"train_loss": -5.275733947753906, "global_step": 24766, "epoch": 589} {"train_loss": -5.383691310882568, "global_step": 24767, "epoch": 589} {"train_loss": -5.422654151916504, "global_step": 24768, "epoch": 589} {"train_loss": -5.292370319366455, "global_step": 24769, "epoch": 589} {"train_loss": -5.432768821716309, "global_step": 24770, "epoch": 589} {"train_loss": -5.397958755493164, "global_step": 24771, "epoch": 589} {"train_loss": -5.436931610107422, "global_step": 24772, "epoch": 589} {"train_loss": -5.468652725219727, "global_step": 24773, "epoch": 589} {"train_loss": -5.341762542724609, "global_step": 24774, "epoch": 589} {"train_loss": -5.324704647064209, "global_step": 24775, "epoch": 589} {"train_loss": -5.436802864074707, "global_step": 24776, "epoch": 589} {"train_loss": -5.4549360275268555, "global_step": 24777, "epoch": 589} {"train_loss": -5.289522647857666, "global_step": 24778, "epoch": 589} {"train_loss": -5.369834241412935, "global_step": 24779, "epoch": 589, "val_loss": 65297.109375} {"train_loss": -5.376614570617676, "global_step": 24780, "epoch": 590} {"train_loss": -5.369967937469482, "global_step": 24781, "epoch": 590} {"train_loss": -5.376412391662598, "global_step": 24782, "epoch": 590} {"train_loss": -5.345484733581543, "global_step": 24783, "epoch": 590} {"train_loss": -5.3965911865234375, "global_step": 24784, "epoch": 590} {"train_loss": -5.430952072143555, "global_step": 24785, "epoch": 590} {"train_loss": -5.517470359802246, "global_step": 24786, "epoch": 590} {"train_loss": -5.297704696655273, "global_step": 24787, "epoch": 590} {"train_loss": -5.482017993927002, "global_step": 24788, "epoch": 590} {"train_loss": -5.315352916717529, "global_step": 24789, "epoch": 590} {"train_loss": -5.341422080993652, "global_step": 24790, "epoch": 590} {"train_loss": -5.357369422912598, "global_step": 24791, "epoch": 590} {"train_loss": -5.404925346374512, "global_step": 24792, "epoch": 590} {"train_loss": -5.297418594360352, "global_step": 24793, "epoch": 590} {"train_loss": -5.315613746643066, "global_step": 24794, "epoch": 590} {"train_loss": -5.330527305603027, "global_step": 24795, "epoch": 590} {"train_loss": -5.229816436767578, "global_step": 24796, "epoch": 590} {"train_loss": -5.427622318267822, "global_step": 24797, "epoch": 590} {"train_loss": -5.375397682189941, "global_step": 24798, "epoch": 590} {"train_loss": -5.26539421081543, "global_step": 24799, "epoch": 590} {"train_loss": -5.452538013458252, "global_step": 24800, "epoch": 590} {"train_loss": -5.329771995544434, "global_step": 24801, "epoch": 590} {"train_loss": -5.349996089935303, "global_step": 24802, "epoch": 590} {"train_loss": -5.465769290924072, "global_step": 24803, "epoch": 590} {"train_loss": -5.374107360839844, "global_step": 24804, "epoch": 590} {"train_loss": -5.391340255737305, "global_step": 24805, "epoch": 590} {"train_loss": -5.4756927490234375, "global_step": 24806, "epoch": 590} {"train_loss": -5.3383636474609375, "global_step": 24807, "epoch": 590} {"train_loss": -5.368350982666016, "global_step": 24808, "epoch": 590} {"train_loss": -5.373973846435547, "global_step": 24809, "epoch": 590} {"train_loss": -5.483651161193848, "global_step": 24810, "epoch": 590} {"train_loss": -5.4237470626831055, "global_step": 24811, "epoch": 590} {"train_loss": -5.297901630401611, "global_step": 24812, "epoch": 590} {"train_loss": -5.389902591705322, "global_step": 24813, "epoch": 590} {"train_loss": -5.352735996246338, "global_step": 24814, "epoch": 590} {"train_loss": -5.375277042388916, "global_step": 24815, "epoch": 590} {"train_loss": -5.328298091888428, "global_step": 24816, "epoch": 590} {"train_loss": -5.410191535949707, "global_step": 24817, "epoch": 590} {"train_loss": -5.501147747039795, "global_step": 24818, "epoch": 590} {"train_loss": -5.298409461975098, "global_step": 24819, "epoch": 590} {"train_loss": -5.472333908081055, "global_step": 24820, "epoch": 590} {"train_loss": -5.3764366535913375, "global_step": 24821, "epoch": 590, "val_loss": 65293.90625} {"train_loss": -5.403643608093262, "global_step": 24822, "epoch": 591} {"train_loss": -5.293636322021484, "global_step": 24823, "epoch": 591} {"train_loss": -5.342977523803711, "global_step": 24824, "epoch": 591} {"train_loss": -5.5504150390625, "global_step": 24825, "epoch": 591} {"train_loss": -5.352787017822266, "global_step": 24826, "epoch": 591} {"train_loss": -5.2189483642578125, "global_step": 24827, "epoch": 591} {"train_loss": -5.488404273986816, "global_step": 24828, "epoch": 591} {"train_loss": -5.332553863525391, "global_step": 24829, "epoch": 591} {"train_loss": -5.5200958251953125, "global_step": 24830, "epoch": 591} {"train_loss": -5.410855770111084, "global_step": 24831, "epoch": 591} {"train_loss": -5.354174613952637, "global_step": 24832, "epoch": 591} {"train_loss": -5.3675689697265625, "global_step": 24833, "epoch": 591} {"train_loss": -5.410953998565674, "global_step": 24834, "epoch": 591} {"train_loss": -5.385856628417969, "global_step": 24835, "epoch": 591} {"train_loss": -5.386501312255859, "global_step": 24836, "epoch": 591} {"train_loss": -5.482985496520996, "global_step": 24837, "epoch": 591} {"train_loss": -5.436136245727539, "global_step": 24838, "epoch": 591} {"train_loss": -5.451002597808838, "global_step": 24839, "epoch": 591} {"train_loss": -5.337888717651367, "global_step": 24840, "epoch": 591} {"train_loss": -5.448325157165527, "global_step": 24841, "epoch": 591} {"train_loss": -5.362854957580566, "global_step": 24842, "epoch": 591} {"train_loss": -5.373037338256836, "global_step": 24843, "epoch": 591} {"train_loss": -5.4906768798828125, "global_step": 24844, "epoch": 591} {"train_loss": -5.412215232849121, "global_step": 24845, "epoch": 591} {"train_loss": -5.415461540222168, "global_step": 24846, "epoch": 591} {"train_loss": -5.324483394622803, "global_step": 24847, "epoch": 591} {"train_loss": -5.408748149871826, "global_step": 24848, "epoch": 591} {"train_loss": -5.401721477508545, "global_step": 24849, "epoch": 591} {"train_loss": -5.417629718780518, "global_step": 24850, "epoch": 591} {"train_loss": -5.386570930480957, "global_step": 24851, "epoch": 591} {"train_loss": -5.461702346801758, "global_step": 24852, "epoch": 591} {"train_loss": -5.406874179840088, "global_step": 24853, "epoch": 591} {"train_loss": -5.408007621765137, "global_step": 24854, "epoch": 591} {"train_loss": -5.3920159339904785, "global_step": 24855, "epoch": 591} {"train_loss": -5.483678817749023, "global_step": 24856, "epoch": 591} {"train_loss": -5.2090253829956055, "global_step": 24857, "epoch": 591} {"train_loss": -5.232370376586914, "global_step": 24858, "epoch": 591} {"train_loss": -5.584981918334961, "global_step": 24859, "epoch": 591} {"train_loss": -5.424759864807129, "global_step": 24860, "epoch": 591} {"train_loss": -5.343737602233887, "global_step": 24861, "epoch": 591} {"train_loss": -5.448999404907227, "global_step": 24862, "epoch": 591} {"train_loss": -5.398774022147769, "global_step": 24863, "epoch": 591, "val_loss": 65441.49609375} {"train_loss": -5.399267196655273, "global_step": 24864, "epoch": 592} {"train_loss": -5.323783874511719, "global_step": 24865, "epoch": 592} {"train_loss": -5.46077823638916, "global_step": 24866, "epoch": 592} {"train_loss": -5.350779056549072, "global_step": 24867, "epoch": 592} {"train_loss": -5.302333831787109, "global_step": 24868, "epoch": 592} {"train_loss": -5.482259750366211, "global_step": 24869, "epoch": 592} {"train_loss": -5.466882705688477, "global_step": 24870, "epoch": 592} {"train_loss": -5.3235273361206055, "global_step": 24871, "epoch": 592} {"train_loss": -5.391246795654297, "global_step": 24872, "epoch": 592} {"train_loss": -5.496647834777832, "global_step": 24873, "epoch": 592} {"train_loss": -5.389067649841309, "global_step": 24874, "epoch": 592} {"train_loss": -5.333192825317383, "global_step": 24875, "epoch": 592} {"train_loss": -5.2815260887146, "global_step": 24876, "epoch": 592} {"train_loss": -5.481025695800781, "global_step": 24877, "epoch": 592} {"train_loss": -5.385290145874023, "global_step": 24878, "epoch": 592} {"train_loss": -5.451655864715576, "global_step": 24879, "epoch": 592} {"train_loss": -5.29828405380249, "global_step": 24880, "epoch": 592} {"train_loss": -5.404937744140625, "global_step": 24881, "epoch": 592} {"train_loss": -5.312393665313721, "global_step": 24882, "epoch": 592} {"train_loss": -5.3317060470581055, "global_step": 24883, "epoch": 592} {"train_loss": -5.343804836273193, "global_step": 24884, "epoch": 592} {"train_loss": -5.421354293823242, "global_step": 24885, "epoch": 592} {"train_loss": -5.446376800537109, "global_step": 24886, "epoch": 592} {"train_loss": -5.269817352294922, "global_step": 24887, "epoch": 592} {"train_loss": -5.432611465454102, "global_step": 24888, "epoch": 592} {"train_loss": -5.412756443023682, "global_step": 24889, "epoch": 592} {"train_loss": -5.385188102722168, "global_step": 24890, "epoch": 592} {"train_loss": -5.3595781326293945, "global_step": 24891, "epoch": 592} {"train_loss": -5.493875503540039, "global_step": 24892, "epoch": 592} {"train_loss": -5.407270908355713, "global_step": 24893, "epoch": 592} {"train_loss": -5.3907670974731445, "global_step": 24894, "epoch": 592} {"train_loss": -5.524137496948242, "global_step": 24895, "epoch": 592} {"train_loss": -5.39002799987793, "global_step": 24896, "epoch": 592} {"train_loss": -5.4636125564575195, "global_step": 24897, "epoch": 592} {"train_loss": -5.4188032150268555, "global_step": 24898, "epoch": 592} {"train_loss": -5.417633056640625, "global_step": 24899, "epoch": 592} {"train_loss": -5.396676063537598, "global_step": 24900, "epoch": 592} {"train_loss": -5.309350967407227, "global_step": 24901, "epoch": 592} {"train_loss": -5.350835800170898, "global_step": 24902, "epoch": 592} {"train_loss": -5.367300033569336, "global_step": 24903, "epoch": 592} {"train_loss": -5.482661247253418, "global_step": 24904, "epoch": 592} {"train_loss": -5.391742763065157, "global_step": 24905, "epoch": 592, "val_loss": 65488.2421875} {"train_loss": -5.4306230545043945, "global_step": 24906, "epoch": 593} {"train_loss": -5.392820358276367, "global_step": 24907, "epoch": 593} {"train_loss": -5.444818496704102, "global_step": 24908, "epoch": 593} {"train_loss": -5.453739643096924, "global_step": 24909, "epoch": 593} {"train_loss": -5.2762322425842285, "global_step": 24910, "epoch": 593} {"train_loss": -5.423442363739014, "global_step": 24911, "epoch": 593} {"train_loss": -5.505951881408691, "global_step": 24912, "epoch": 593} {"train_loss": -5.364741325378418, "global_step": 24913, "epoch": 593} {"train_loss": -5.388080596923828, "global_step": 24914, "epoch": 593} {"train_loss": -5.373963356018066, "global_step": 24915, "epoch": 593} {"train_loss": -5.468336582183838, "global_step": 24916, "epoch": 593} {"train_loss": -5.436293125152588, "global_step": 24917, "epoch": 593} {"train_loss": -5.362430572509766, "global_step": 24918, "epoch": 593} {"train_loss": -5.415207862854004, "global_step": 24919, "epoch": 593} {"train_loss": -5.439031600952148, "global_step": 24920, "epoch": 593} {"train_loss": -5.525294303894043, "global_step": 24921, "epoch": 593} {"train_loss": -5.471196174621582, "global_step": 24922, "epoch": 593} {"train_loss": -5.3018646240234375, "global_step": 24923, "epoch": 593} {"train_loss": -5.437708377838135, "global_step": 24924, "epoch": 593} {"train_loss": -5.352882385253906, "global_step": 24925, "epoch": 593} {"train_loss": -5.356382369995117, "global_step": 24926, "epoch": 593} {"train_loss": -5.40401029586792, "global_step": 24927, "epoch": 593} {"train_loss": -5.3377275466918945, "global_step": 24928, "epoch": 593} {"train_loss": -5.268615245819092, "global_step": 24929, "epoch": 593} {"train_loss": -5.453753471374512, "global_step": 24930, "epoch": 593} {"train_loss": -5.342979431152344, "global_step": 24931, "epoch": 593} {"train_loss": -5.406269073486328, "global_step": 24932, "epoch": 593} {"train_loss": -5.440052509307861, "global_step": 24933, "epoch": 593} {"train_loss": -5.2962541580200195, "global_step": 24934, "epoch": 593} {"train_loss": -5.354413986206055, "global_step": 24935, "epoch": 593} {"train_loss": -5.442479133605957, "global_step": 24936, "epoch": 593} {"train_loss": -5.373889446258545, "global_step": 24937, "epoch": 593} {"train_loss": -5.35695743560791, "global_step": 24938, "epoch": 593} {"train_loss": -5.509735107421875, "global_step": 24939, "epoch": 593} {"train_loss": -5.280213356018066, "global_step": 24940, "epoch": 593} {"train_loss": -5.370894432067871, "global_step": 24941, "epoch": 593} {"train_loss": -5.332634449005127, "global_step": 24942, "epoch": 593} {"train_loss": -5.292685508728027, "global_step": 24943, "epoch": 593} {"train_loss": -5.371647834777832, "global_step": 24944, "epoch": 593} {"train_loss": -5.458674907684326, "global_step": 24945, "epoch": 593} {"train_loss": -5.332736015319824, "global_step": 24946, "epoch": 593} {"train_loss": -5.388924485161191, "global_step": 24947, "epoch": 593, "val_loss": 65031.9296875} {"train_loss": -5.443556785583496, "global_step": 24948, "epoch": 594} {"train_loss": -5.370135307312012, "global_step": 24949, "epoch": 594} {"train_loss": -5.311831951141357, "global_step": 24950, "epoch": 594} {"train_loss": -5.37816858291626, "global_step": 24951, "epoch": 594} {"train_loss": -5.4796833992004395, "global_step": 24952, "epoch": 594} {"train_loss": -5.374746322631836, "global_step": 24953, "epoch": 594} {"train_loss": -5.37537145614624, "global_step": 24954, "epoch": 594} {"train_loss": -5.274406909942627, "global_step": 24955, "epoch": 594} {"train_loss": -5.400975227355957, "global_step": 24956, "epoch": 594} {"train_loss": -5.432397842407227, "global_step": 24957, "epoch": 594} {"train_loss": -5.414692401885986, "global_step": 24958, "epoch": 594} {"train_loss": -5.386115074157715, "global_step": 24959, "epoch": 594} {"train_loss": -5.393193244934082, "global_step": 24960, "epoch": 594} {"train_loss": -5.432247161865234, "global_step": 24961, "epoch": 594} {"train_loss": -5.523841381072998, "global_step": 24962, "epoch": 594} {"train_loss": -5.34304141998291, "global_step": 24963, "epoch": 594} {"train_loss": -5.355179786682129, "global_step": 24964, "epoch": 594} {"train_loss": -5.377317428588867, "global_step": 24965, "epoch": 594} {"train_loss": -5.40676736831665, "global_step": 24966, "epoch": 594} {"train_loss": -5.46649169921875, "global_step": 24967, "epoch": 594} {"train_loss": -5.298801422119141, "global_step": 24968, "epoch": 594} {"train_loss": -5.250452041625977, "global_step": 24969, "epoch": 594} {"train_loss": -5.541072845458984, "global_step": 24970, "epoch": 594} {"train_loss": -5.370917320251465, "global_step": 24971, "epoch": 594} {"train_loss": -5.348203659057617, "global_step": 24972, "epoch": 594} {"train_loss": -5.426027297973633, "global_step": 24973, "epoch": 594} {"train_loss": -5.2896270751953125, "global_step": 24974, "epoch": 594} {"train_loss": -5.4776177406311035, "global_step": 24975, "epoch": 594} {"train_loss": -5.233110427856445, "global_step": 24976, "epoch": 594} {"train_loss": -5.271507263183594, "global_step": 24977, "epoch": 594} {"train_loss": -5.503766059875488, "global_step": 24978, "epoch": 594} {"train_loss": -5.299602031707764, "global_step": 24979, "epoch": 594} {"train_loss": -5.418523788452148, "global_step": 24980, "epoch": 594} {"train_loss": -5.500724792480469, "global_step": 24981, "epoch": 594} {"train_loss": -5.127717971801758, "global_step": 24982, "epoch": 594} {"train_loss": -5.3133673667907715, "global_step": 24983, "epoch": 594} {"train_loss": -5.493612766265869, "global_step": 24984, "epoch": 594} {"train_loss": -5.284215927124023, "global_step": 24985, "epoch": 594} {"train_loss": -5.450415134429932, "global_step": 24986, "epoch": 594} {"train_loss": -5.460198402404785, "global_step": 24987, "epoch": 594} {"train_loss": -5.4067583084106445, "global_step": 24988, "epoch": 594} {"train_loss": -5.385703983761015, "global_step": 24989, "epoch": 594, "val_loss": 64949.90625} {"train_loss": -5.438632965087891, "global_step": 24990, "epoch": 595} {"train_loss": -5.477771759033203, "global_step": 24991, "epoch": 595} {"train_loss": -5.3876190185546875, "global_step": 24992, "epoch": 595} {"train_loss": -5.494643688201904, "global_step": 24993, "epoch": 595} {"train_loss": -5.48787784576416, "global_step": 24994, "epoch": 595} {"train_loss": -5.241192817687988, "global_step": 24995, "epoch": 595} {"train_loss": -5.540602684020996, "global_step": 24996, "epoch": 595} {"train_loss": -5.252957820892334, "global_step": 24997, "epoch": 595} {"train_loss": -5.341653823852539, "global_step": 24998, "epoch": 595} {"train_loss": -5.39240026473999, "global_step": 24999, "epoch": 595} {"train_loss": -5.353342056274414, "global_step": 25000, "epoch": 595} {"train_loss": -5.357672214508057, "global_step": 25001, "epoch": 595} {"train_loss": -5.29556941986084, "global_step": 25002, "epoch": 595} {"train_loss": -5.332252025604248, "global_step": 25003, "epoch": 595} {"train_loss": -5.217492580413818, "global_step": 25004, "epoch": 595} {"train_loss": -5.226773262023926, "global_step": 25005, "epoch": 595} {"train_loss": -5.395051956176758, "global_step": 25006, "epoch": 595} {"train_loss": -5.227651596069336, "global_step": 25007, "epoch": 595} {"train_loss": -5.353323936462402, "global_step": 25008, "epoch": 595} {"train_loss": -5.384681701660156, "global_step": 25009, "epoch": 595} {"train_loss": -5.458396911621094, "global_step": 25010, "epoch": 595} {"train_loss": -5.374353408813477, "global_step": 25011, "epoch": 595} {"train_loss": -5.459047317504883, "global_step": 25012, "epoch": 595} {"train_loss": -5.456396102905273, "global_step": 25013, "epoch": 595} {"train_loss": -5.326581954956055, "global_step": 25014, "epoch": 595} {"train_loss": -5.386512279510498, "global_step": 25015, "epoch": 595} {"train_loss": -5.332400321960449, "global_step": 25016, "epoch": 595} {"train_loss": -5.359945774078369, "global_step": 25017, "epoch": 595} {"train_loss": -5.3815999031066895, "global_step": 25018, "epoch": 595} {"train_loss": -5.399026870727539, "global_step": 25019, "epoch": 595} {"train_loss": -5.453439235687256, "global_step": 25020, "epoch": 595} {"train_loss": -5.430657386779785, "global_step": 25021, "epoch": 595} {"train_loss": -5.5213727951049805, "global_step": 25022, "epoch": 595} {"train_loss": -5.47080135345459, "global_step": 25023, "epoch": 595} {"train_loss": -5.427857398986816, "global_step": 25024, "epoch": 595} {"train_loss": -5.47145414352417, "global_step": 25025, "epoch": 595} {"train_loss": -5.436993598937988, "global_step": 25026, "epoch": 595} {"train_loss": -5.321377754211426, "global_step": 25027, "epoch": 595} {"train_loss": -5.270796775817871, "global_step": 25028, "epoch": 595} {"train_loss": -5.50836706161499, "global_step": 25029, "epoch": 595} {"train_loss": -5.406139850616455, "global_step": 25030, "epoch": 595} {"train_loss": -5.385746626626878, "global_step": 25031, "epoch": 595, "val_loss": 65315.046875} {"train_loss": -5.439957618713379, "global_step": 25032, "epoch": 596} {"train_loss": -5.370175361633301, "global_step": 25033, "epoch": 596} {"train_loss": -5.3319411277771, "global_step": 25034, "epoch": 596} {"train_loss": -5.381100654602051, "global_step": 25035, "epoch": 596} {"train_loss": -5.375625133514404, "global_step": 25036, "epoch": 596} {"train_loss": -5.454066753387451, "global_step": 25037, "epoch": 596} {"train_loss": -5.507706642150879, "global_step": 25038, "epoch": 596} {"train_loss": -5.402420997619629, "global_step": 25039, "epoch": 596} {"train_loss": -5.430754661560059, "global_step": 25040, "epoch": 596} {"train_loss": -5.573633193969727, "global_step": 25041, "epoch": 596} {"train_loss": -5.339433670043945, "global_step": 25042, "epoch": 596} {"train_loss": -5.414059638977051, "global_step": 25043, "epoch": 596} {"train_loss": -5.343084335327148, "global_step": 25044, "epoch": 596} {"train_loss": -5.346853256225586, "global_step": 25045, "epoch": 596} {"train_loss": -5.480985164642334, "global_step": 25046, "epoch": 596} {"train_loss": -5.4759202003479, "global_step": 25047, "epoch": 596} {"train_loss": -5.490197658538818, "global_step": 25048, "epoch": 596} {"train_loss": -5.402276039123535, "global_step": 25049, "epoch": 596} {"train_loss": -5.477687835693359, "global_step": 25050, "epoch": 596} {"train_loss": -5.364819049835205, "global_step": 25051, "epoch": 596} {"train_loss": -5.312856197357178, "global_step": 25052, "epoch": 596} {"train_loss": -5.464860916137695, "global_step": 25053, "epoch": 596} {"train_loss": -5.386948108673096, "global_step": 25054, "epoch": 596} {"train_loss": -5.335309982299805, "global_step": 25055, "epoch": 596} {"train_loss": -5.332237720489502, "global_step": 25056, "epoch": 596} {"train_loss": -5.3903398513793945, "global_step": 25057, "epoch": 596} {"train_loss": -5.345938682556152, "global_step": 25058, "epoch": 596} {"train_loss": -5.319038391113281, "global_step": 25059, "epoch": 596} {"train_loss": -5.458209037780762, "global_step": 25060, "epoch": 596} {"train_loss": -5.391513824462891, "global_step": 25061, "epoch": 596} {"train_loss": -5.338505744934082, "global_step": 25062, "epoch": 596} {"train_loss": -5.354514122009277, "global_step": 25063, "epoch": 596} {"train_loss": -5.382332801818848, "global_step": 25064, "epoch": 596} {"train_loss": -5.340077877044678, "global_step": 25065, "epoch": 596} {"train_loss": -5.421864032745361, "global_step": 25066, "epoch": 596} {"train_loss": -5.435712814331055, "global_step": 25067, "epoch": 596} {"train_loss": -5.355784893035889, "global_step": 25068, "epoch": 596} {"train_loss": -5.36531925201416, "global_step": 25069, "epoch": 596} {"train_loss": -5.395413875579834, "global_step": 25070, "epoch": 596} {"train_loss": -5.393826961517334, "global_step": 25071, "epoch": 596} {"train_loss": -5.242785453796387, "global_step": 25072, "epoch": 596} {"train_loss": -5.393467630658831, "global_step": 25073, "epoch": 596, "val_loss": 65298.0859375} {"train_loss": -5.448221206665039, "global_step": 25074, "epoch": 597} {"train_loss": -5.39246940612793, "global_step": 25075, "epoch": 597} {"train_loss": -5.444079399108887, "global_step": 25076, "epoch": 597} {"train_loss": -5.489336013793945, "global_step": 25077, "epoch": 597} {"train_loss": -5.298288345336914, "global_step": 25078, "epoch": 597} {"train_loss": -5.377748489379883, "global_step": 25079, "epoch": 597} {"train_loss": -5.345488548278809, "global_step": 25080, "epoch": 597} {"train_loss": -5.390833854675293, "global_step": 25081, "epoch": 597} {"train_loss": -5.442956447601318, "global_step": 25082, "epoch": 597} {"train_loss": -5.366750717163086, "global_step": 25083, "epoch": 597} {"train_loss": -5.258275985717773, "global_step": 25084, "epoch": 597} {"train_loss": -5.355252265930176, "global_step": 25085, "epoch": 597} {"train_loss": -5.346752643585205, "global_step": 25086, "epoch": 597} {"train_loss": -5.359318256378174, "global_step": 25087, "epoch": 597} {"train_loss": -5.320323944091797, "global_step": 25088, "epoch": 597} {"train_loss": -5.334698677062988, "global_step": 25089, "epoch": 597} {"train_loss": -5.321794509887695, "global_step": 25090, "epoch": 597} {"train_loss": -5.409830093383789, "global_step": 25091, "epoch": 597} {"train_loss": -5.540769100189209, "global_step": 25092, "epoch": 597} {"train_loss": -5.409167289733887, "global_step": 25093, "epoch": 597} {"train_loss": -5.400991439819336, "global_step": 25094, "epoch": 597} {"train_loss": -5.335031032562256, "global_step": 25095, "epoch": 597} {"train_loss": -5.372102737426758, "global_step": 25096, "epoch": 597} {"train_loss": -5.3554911613464355, "global_step": 25097, "epoch": 597} {"train_loss": -5.425188064575195, "global_step": 25098, "epoch": 597} {"train_loss": -5.416224479675293, "global_step": 25099, "epoch": 597} {"train_loss": -5.372230529785156, "global_step": 25100, "epoch": 597} {"train_loss": -5.4417724609375, "global_step": 25101, "epoch": 597} {"train_loss": -5.4299187660217285, "global_step": 25102, "epoch": 597} {"train_loss": -5.383085250854492, "global_step": 25103, "epoch": 597} {"train_loss": -5.330589294433594, "global_step": 25104, "epoch": 597} {"train_loss": -5.457291603088379, "global_step": 25105, "epoch": 597} {"train_loss": -5.389958381652832, "global_step": 25106, "epoch": 597} {"train_loss": -5.393718719482422, "global_step": 25107, "epoch": 597} {"train_loss": -5.3926496505737305, "global_step": 25108, "epoch": 597} {"train_loss": -5.455086708068848, "global_step": 25109, "epoch": 597} {"train_loss": -5.264708518981934, "global_step": 25110, "epoch": 597} {"train_loss": -5.329695224761963, "global_step": 25111, "epoch": 597} {"train_loss": -5.45197868347168, "global_step": 25112, "epoch": 597} {"train_loss": -5.461315155029297, "global_step": 25113, "epoch": 597} {"train_loss": -5.305593967437744, "global_step": 25114, "epoch": 597} {"train_loss": -5.384549345288958, "global_step": 25115, "epoch": 597, "val_loss": 65320.96875} {"train_loss": -5.393985748291016, "global_step": 25116, "epoch": 598} {"train_loss": -5.362803936004639, "global_step": 25117, "epoch": 598} {"train_loss": -5.37393856048584, "global_step": 25118, "epoch": 598} {"train_loss": -5.458412170410156, "global_step": 25119, "epoch": 598} {"train_loss": -5.392631530761719, "global_step": 25120, "epoch": 598} {"train_loss": -5.326262950897217, "global_step": 25121, "epoch": 598} {"train_loss": -5.4039506912231445, "global_step": 25122, "epoch": 598} {"train_loss": -5.217271327972412, "global_step": 25123, "epoch": 598} {"train_loss": -5.389499664306641, "global_step": 25124, "epoch": 598} {"train_loss": -5.40800142288208, "global_step": 25125, "epoch": 598} {"train_loss": -5.288248062133789, "global_step": 25126, "epoch": 598} {"train_loss": -5.401772975921631, "global_step": 25127, "epoch": 598} {"train_loss": -5.320704460144043, "global_step": 25128, "epoch": 598} {"train_loss": -5.3511643409729, "global_step": 25129, "epoch": 598} {"train_loss": -5.255939483642578, "global_step": 25130, "epoch": 598} {"train_loss": -5.383540153503418, "global_step": 25131, "epoch": 598} {"train_loss": -5.468639373779297, "global_step": 25132, "epoch": 598} {"train_loss": -5.4453125, "global_step": 25133, "epoch": 598} {"train_loss": -5.350358009338379, "global_step": 25134, "epoch": 598} {"train_loss": -5.285794258117676, "global_step": 25135, "epoch": 598} {"train_loss": -5.3201985359191895, "global_step": 25136, "epoch": 598} {"train_loss": -5.240095615386963, "global_step": 25137, "epoch": 598} {"train_loss": -5.369860649108887, "global_step": 25138, "epoch": 598} {"train_loss": -5.428566932678223, "global_step": 25139, "epoch": 598} {"train_loss": -5.344260215759277, "global_step": 25140, "epoch": 598} {"train_loss": -5.538806915283203, "global_step": 25141, "epoch": 598} {"train_loss": -5.377823829650879, "global_step": 25142, "epoch": 598} {"train_loss": -5.332754135131836, "global_step": 25143, "epoch": 598} {"train_loss": -5.4387898445129395, "global_step": 25144, "epoch": 598} {"train_loss": -5.411136627197266, "global_step": 25145, "epoch": 598} {"train_loss": -5.307650566101074, "global_step": 25146, "epoch": 598} {"train_loss": -5.496342658996582, "global_step": 25147, "epoch": 598} {"train_loss": -5.460429668426514, "global_step": 25148, "epoch": 598} {"train_loss": -5.340904235839844, "global_step": 25149, "epoch": 598} {"train_loss": -5.399623870849609, "global_step": 25150, "epoch": 598} {"train_loss": -5.29573917388916, "global_step": 25151, "epoch": 598} {"train_loss": -5.348468780517578, "global_step": 25152, "epoch": 598} {"train_loss": -5.566363334655762, "global_step": 25153, "epoch": 598} {"train_loss": -5.396934509277344, "global_step": 25154, "epoch": 598} {"train_loss": -5.135709762573242, "global_step": 25155, "epoch": 598} {"train_loss": -5.384166240692139, "global_step": 25156, "epoch": 598} {"train_loss": -5.3714723359970815, "global_step": 25157, "epoch": 598, "val_loss": 65611.1328125} {"train_loss": -5.346518516540527, "global_step": 25158, "epoch": 599} {"train_loss": -5.3712592124938965, "global_step": 25159, "epoch": 599} {"train_loss": -5.393329620361328, "global_step": 25160, "epoch": 599} {"train_loss": -5.323192596435547, "global_step": 25161, "epoch": 599} {"train_loss": -5.277700424194336, "global_step": 25162, "epoch": 599} {"train_loss": -5.438638210296631, "global_step": 25163, "epoch": 599} {"train_loss": -5.2935075759887695, "global_step": 25164, "epoch": 599} {"train_loss": -5.2985520362854, "global_step": 25165, "epoch": 599} {"train_loss": -5.450343132019043, "global_step": 25166, "epoch": 599} {"train_loss": -5.260595321655273, "global_step": 25167, "epoch": 599} {"train_loss": -5.482337474822998, "global_step": 25168, "epoch": 599} {"train_loss": -5.405309677124023, "global_step": 25169, "epoch": 599} {"train_loss": -5.222684860229492, "global_step": 25170, "epoch": 599} {"train_loss": -5.357610702514648, "global_step": 25171, "epoch": 599} {"train_loss": -5.295726299285889, "global_step": 25172, "epoch": 599} {"train_loss": -5.241695404052734, "global_step": 25173, "epoch": 599} {"train_loss": -5.4717864990234375, "global_step": 25174, "epoch": 599} {"train_loss": -5.3458638191223145, "global_step": 25175, "epoch": 599} {"train_loss": -5.371001243591309, "global_step": 25176, "epoch": 599} {"train_loss": -5.407741069793701, "global_step": 25177, "epoch": 599} {"train_loss": -5.274528503417969, "global_step": 25178, "epoch": 599} {"train_loss": -5.388154029846191, "global_step": 25179, "epoch": 599} {"train_loss": -5.425724983215332, "global_step": 25180, "epoch": 599} {"train_loss": -5.326543807983398, "global_step": 25181, "epoch": 599} {"train_loss": -5.485300064086914, "global_step": 25182, "epoch": 599} {"train_loss": -5.338515758514404, "global_step": 25183, "epoch": 599} {"train_loss": -5.472916603088379, "global_step": 25184, "epoch": 599} {"train_loss": -5.366970062255859, "global_step": 25185, "epoch": 599} {"train_loss": -5.257174968719482, "global_step": 25186, "epoch": 599} {"train_loss": -5.321789741516113, "global_step": 25187, "epoch": 599} {"train_loss": -5.417647838592529, "global_step": 25188, "epoch": 599} {"train_loss": -5.464613437652588, "global_step": 25189, "epoch": 599} {"train_loss": -5.4378275871276855, "global_step": 25190, "epoch": 599} {"train_loss": -5.415426254272461, "global_step": 25191, "epoch": 599} {"train_loss": -5.382602691650391, "global_step": 25192, "epoch": 599} {"train_loss": -5.476739883422852, "global_step": 25193, "epoch": 599} {"train_loss": -5.476106643676758, "global_step": 25194, "epoch": 599} {"train_loss": -5.38188362121582, "global_step": 25195, "epoch": 599} {"train_loss": -5.195083141326904, "global_step": 25196, "epoch": 599} {"train_loss": -5.464835166931152, "global_step": 25197, "epoch": 599} {"train_loss": -5.45310640335083, "global_step": 25198, "epoch": 599} {"train_loss": -5.373130014964512, "global_step": 25199, "epoch": 599, "val_loss": 65065.6171875} {"train_loss": -5.413696765899658, "global_step": 25200, "epoch": 600} {"train_loss": -5.451338768005371, "global_step": 25201, "epoch": 600} {"train_loss": -5.333981513977051, "global_step": 25202, "epoch": 600} {"train_loss": -5.303159713745117, "global_step": 25203, "epoch": 600} {"train_loss": -5.33134651184082, "global_step": 25204, "epoch": 600} {"train_loss": -5.490067958831787, "global_step": 25205, "epoch": 600} {"train_loss": -5.1974005699157715, "global_step": 25206, "epoch": 600} {"train_loss": -5.385358810424805, "global_step": 25207, "epoch": 600} {"train_loss": -5.3679656982421875, "global_step": 25208, "epoch": 600} {"train_loss": -5.451727390289307, "global_step": 25209, "epoch": 600} {"train_loss": -5.304543495178223, "global_step": 25210, "epoch": 600} {"train_loss": -5.379421710968018, "global_step": 25211, "epoch": 600} {"train_loss": -5.415279865264893, "global_step": 25212, "epoch": 600} {"train_loss": -5.422544479370117, "global_step": 25213, "epoch": 600} {"train_loss": -5.4682207107543945, "global_step": 25214, "epoch": 600} {"train_loss": -5.422924995422363, "global_step": 25215, "epoch": 600} {"train_loss": -5.445830821990967, "global_step": 25216, "epoch": 600} {"train_loss": -5.301542282104492, "global_step": 25217, "epoch": 600} {"train_loss": -5.420994758605957, "global_step": 25218, "epoch": 600} {"train_loss": -5.230807304382324, "global_step": 25219, "epoch": 600} {"train_loss": -5.304708480834961, "global_step": 25220, "epoch": 600} {"train_loss": -5.401474952697754, "global_step": 25221, "epoch": 600} {"train_loss": -5.333095550537109, "global_step": 25222, "epoch": 600} {"train_loss": -5.377572059631348, "global_step": 25223, "epoch": 600} {"train_loss": -5.278465270996094, "global_step": 25224, "epoch": 600} {"train_loss": -5.460547924041748, "global_step": 25225, "epoch": 600} {"train_loss": -5.325013637542725, "global_step": 25226, "epoch": 600} {"train_loss": -5.524785041809082, "global_step": 25227, "epoch": 600} {"train_loss": -5.334977149963379, "global_step": 25228, "epoch": 600} {"train_loss": -5.408445358276367, "global_step": 25229, "epoch": 600} {"train_loss": -5.412641525268555, "global_step": 25230, "epoch": 600} {"train_loss": -5.446098804473877, "global_step": 25231, "epoch": 600} {"train_loss": -5.341062068939209, "global_step": 25232, "epoch": 600} {"train_loss": -5.388012886047363, "global_step": 25233, "epoch": 600} {"train_loss": -5.384023666381836, "global_step": 25234, "epoch": 600} {"train_loss": -5.394367218017578, "global_step": 25235, "epoch": 600} {"train_loss": -5.406092643737793, "global_step": 25236, "epoch": 600} {"train_loss": -5.448153018951416, "global_step": 25237, "epoch": 600} {"train_loss": -5.485603332519531, "global_step": 25238, "epoch": 600} {"train_loss": -5.363873481750488, "global_step": 25239, "epoch": 600} {"train_loss": -5.556374549865723, "global_step": 25240, "epoch": 600} {"train_loss": -5.387241840362549, "global_step": 25241, "epoch": 600, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.23234839850895042, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.14566561068743653, "train/sim_max_reward_4": 0.0472806455854592, "train/sim_max_reward_5": 0.4870812819909495, "test/sim_max_reward_4300000": 0.20952128681682083, "test/sim_max_reward_4300001": 0.3414635810108589, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.42667235271950005, "test/sim_max_reward_4300004": 0.08564831313439639, "test/sim_max_reward_4300005": 0.4457659830534889, "test/sim_max_reward_4300006": 0.2671279399955025, "test/sim_max_reward_4300007": 0.3810722783098511, "test/sim_max_reward_4300008": 0.4158651562365626, "test/sim_max_reward_4300009": 0.45032311599025426, "test/sim_max_reward_4300010": 0.012790151159028287, "test/sim_max_reward_4300011": 0.2865233768428725, "test/sim_max_reward_4300012": 0.38983451812117087, "test/sim_max_reward_4300013": 0.5634564070231727, "test/sim_max_reward_4300014": 0.40111585410789957, "test/sim_max_reward_4300015": 0.26615142642428413, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.4165445322446399, "test/sim_max_reward_4300018": 0.3440544603876045, "test/sim_max_reward_4300019": 0.18524323211101573, "test/sim_max_reward_4300020": 0.059741756166619635, "test/sim_max_reward_4300021": 0.17556854544280004, "test/sim_max_reward_4300022": 0.12682108415468402, "test/sim_max_reward_4300023": 0.3660484948700527, "test/sim_max_reward_4300024": 0.47430025213920096, "test/sim_max_reward_4300025": 0.09442110783698536, "test/sim_max_reward_4300026": 0.5342922330650152, "test/sim_max_reward_4300027": 0.03946913744235638, "test/sim_max_reward_4300028": 0.026974730536877958, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.9440931529184703, "test/sim_max_reward_4300031": 0.2167692816599736, "test/sim_max_reward_4300032": 0.18458231414965443, "test/sim_max_reward_4300033": 0.7199481281860552, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.5527122599440878, "test/sim_max_reward_4300038": 0.5932316996586897, "test/sim_max_reward_4300039": 0.41631604660833355, "test/sim_max_reward_4300040": 0.3998001335281375, "test/sim_max_reward_4300041": 0.13586536415100345, "test/sim_max_reward_4300042": 0.708075137983155, "test/sim_max_reward_4300043": 0.35561926098744434, "test/sim_max_reward_4300044": 0.055933065647975115, "test/sim_max_reward_4300045": 0.16817884575198255, "test/sim_max_reward_4300046": 0.14295381522378137, "test/sim_max_reward_4300047": 0.5316196189634935, "test/sim_max_reward_4300048": 0.18167654118760912, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.18377890556314128, "test/mean_score": 0.2893483291189615, "val_loss": 65717.1640625} {"train_loss": -5.281525611877441, "global_step": 25242, "epoch": 601} {"train_loss": -5.404746055603027, "global_step": 25243, "epoch": 601} {"train_loss": -5.4040021896362305, "global_step": 25244, "epoch": 601} {"train_loss": -5.400548934936523, "global_step": 25245, "epoch": 601} {"train_loss": -5.408206939697266, "global_step": 25246, "epoch": 601} {"train_loss": -5.4102630615234375, "global_step": 25247, "epoch": 601} {"train_loss": -5.397669315338135, "global_step": 25248, "epoch": 601} {"train_loss": -5.521718978881836, "global_step": 25249, "epoch": 601} {"train_loss": -5.446120738983154, "global_step": 25250, "epoch": 601} {"train_loss": -5.410114288330078, "global_step": 25251, "epoch": 601} {"train_loss": -5.397397994995117, "global_step": 25252, "epoch": 601} {"train_loss": -5.400879383087158, "global_step": 25253, "epoch": 601} {"train_loss": -5.446130275726318, "global_step": 25254, "epoch": 601} {"train_loss": -5.192250728607178, "global_step": 25255, "epoch": 601} {"train_loss": -5.467432022094727, "global_step": 25256, "epoch": 601} {"train_loss": -5.345577239990234, "global_step": 25257, "epoch": 601} {"train_loss": -5.398693561553955, "global_step": 25258, "epoch": 601} {"train_loss": -5.423572063446045, "global_step": 25259, "epoch": 601} {"train_loss": -5.373595237731934, "global_step": 25260, "epoch": 601} {"train_loss": -5.358676910400391, "global_step": 25261, "epoch": 601} {"train_loss": -5.535853385925293, "global_step": 25262, "epoch": 601} {"train_loss": -5.375833511352539, "global_step": 25263, "epoch": 601} {"train_loss": -5.235593795776367, "global_step": 25264, "epoch": 601} {"train_loss": -5.496194839477539, "global_step": 25265, "epoch": 601} {"train_loss": -5.42221212387085, "global_step": 25266, "epoch": 601} {"train_loss": -5.262319564819336, "global_step": 25267, "epoch": 601} {"train_loss": -5.467006683349609, "global_step": 25268, "epoch": 601} {"train_loss": -5.332342147827148, "global_step": 25269, "epoch": 601} {"train_loss": -5.351621150970459, "global_step": 25270, "epoch": 601} {"train_loss": -5.3784966468811035, "global_step": 25271, "epoch": 601} {"train_loss": -5.500988960266113, "global_step": 25272, "epoch": 601} {"train_loss": -5.3025336265563965, "global_step": 25273, "epoch": 601} {"train_loss": -5.369022369384766, "global_step": 25274, "epoch": 601} {"train_loss": -5.3615288734436035, "global_step": 25275, "epoch": 601} {"train_loss": -5.333978652954102, "global_step": 25276, "epoch": 601} {"train_loss": -5.187704563140869, "global_step": 25277, "epoch": 601} {"train_loss": -5.422981262207031, "global_step": 25278, "epoch": 601} {"train_loss": -5.442300796508789, "global_step": 25279, "epoch": 601} {"train_loss": -5.202047348022461, "global_step": 25280, "epoch": 601} {"train_loss": -5.443305492401123, "global_step": 25281, "epoch": 601} {"train_loss": -5.27360200881958, "global_step": 25282, "epoch": 601} {"train_loss": -5.373075235457647, "global_step": 25283, "epoch": 601, "val_loss": 65164.18359375} {"train_loss": -5.384796142578125, "global_step": 25284, "epoch": 602} {"train_loss": -5.241642951965332, "global_step": 25285, "epoch": 602} {"train_loss": -5.330625534057617, "global_step": 25286, "epoch": 602} {"train_loss": -5.348578453063965, "global_step": 25287, "epoch": 602} {"train_loss": -5.3285675048828125, "global_step": 25288, "epoch": 602} {"train_loss": -5.471199035644531, "global_step": 25289, "epoch": 602} {"train_loss": -5.2853102684021, "global_step": 25290, "epoch": 602} {"train_loss": -5.506281852722168, "global_step": 25291, "epoch": 602} {"train_loss": -5.33847713470459, "global_step": 25292, "epoch": 602} {"train_loss": -5.4323930740356445, "global_step": 25293, "epoch": 602} {"train_loss": -5.37823486328125, "global_step": 25294, "epoch": 602} {"train_loss": -5.3326311111450195, "global_step": 25295, "epoch": 602} {"train_loss": -5.420108795166016, "global_step": 25296, "epoch": 602} {"train_loss": -5.391921043395996, "global_step": 25297, "epoch": 602} {"train_loss": -5.282069206237793, "global_step": 25298, "epoch": 602} {"train_loss": -5.223959922790527, "global_step": 25299, "epoch": 602} {"train_loss": -5.21015739440918, "global_step": 25300, "epoch": 602} {"train_loss": -5.367762088775635, "global_step": 25301, "epoch": 602} {"train_loss": -5.226038455963135, "global_step": 25302, "epoch": 602} {"train_loss": -5.19687032699585, "global_step": 25303, "epoch": 602} {"train_loss": -5.346304416656494, "global_step": 25304, "epoch": 602} {"train_loss": -5.291609764099121, "global_step": 25305, "epoch": 602} {"train_loss": -5.3773298263549805, "global_step": 25306, "epoch": 602} {"train_loss": -5.455014705657959, "global_step": 25307, "epoch": 602} {"train_loss": -5.256841659545898, "global_step": 25308, "epoch": 602} {"train_loss": -5.482211589813232, "global_step": 25309, "epoch": 602} {"train_loss": -5.443454742431641, "global_step": 25310, "epoch": 602} {"train_loss": -5.406102180480957, "global_step": 25311, "epoch": 602} {"train_loss": -5.456056118011475, "global_step": 25312, "epoch": 602} {"train_loss": -5.470177173614502, "global_step": 25313, "epoch": 602} {"train_loss": -5.264760971069336, "global_step": 25314, "epoch": 602} {"train_loss": -5.4280548095703125, "global_step": 25315, "epoch": 602} {"train_loss": -5.3601179122924805, "global_step": 25316, "epoch": 602} {"train_loss": -5.5113067626953125, "global_step": 25317, "epoch": 602} {"train_loss": -5.459267616271973, "global_step": 25318, "epoch": 602} {"train_loss": -5.396877288818359, "global_step": 25319, "epoch": 602} {"train_loss": -5.422224044799805, "global_step": 25320, "epoch": 602} {"train_loss": -5.439376354217529, "global_step": 25321, "epoch": 602} {"train_loss": -5.390875339508057, "global_step": 25322, "epoch": 602} {"train_loss": -5.446636199951172, "global_step": 25323, "epoch": 602} {"train_loss": -5.332985877990723, "global_step": 25324, "epoch": 602} {"train_loss": -5.368973766054426, "global_step": 25325, "epoch": 602, "val_loss": 65124.01953125} {"train_loss": -5.42288064956665, "global_step": 25326, "epoch": 603} {"train_loss": -5.340780735015869, "global_step": 25327, "epoch": 603} {"train_loss": -5.410066604614258, "global_step": 25328, "epoch": 603} {"train_loss": -5.5481767654418945, "global_step": 25329, "epoch": 603} {"train_loss": -5.407248020172119, "global_step": 25330, "epoch": 603} {"train_loss": -5.419955730438232, "global_step": 25331, "epoch": 603} {"train_loss": -5.2691850662231445, "global_step": 25332, "epoch": 603} {"train_loss": -5.3311567306518555, "global_step": 25333, "epoch": 603} {"train_loss": -5.492615699768066, "global_step": 25334, "epoch": 603} {"train_loss": -5.455831527709961, "global_step": 25335, "epoch": 603} {"train_loss": -5.395506858825684, "global_step": 25336, "epoch": 603} {"train_loss": -5.462087631225586, "global_step": 25337, "epoch": 603} {"train_loss": -5.3949785232543945, "global_step": 25338, "epoch": 603} {"train_loss": -5.417129993438721, "global_step": 25339, "epoch": 603} {"train_loss": -5.380273818969727, "global_step": 25340, "epoch": 603} {"train_loss": -5.383246421813965, "global_step": 25341, "epoch": 603} {"train_loss": -5.330565452575684, "global_step": 25342, "epoch": 603} {"train_loss": -5.307309150695801, "global_step": 25343, "epoch": 603} {"train_loss": -5.379980087280273, "global_step": 25344, "epoch": 603} {"train_loss": -5.448047637939453, "global_step": 25345, "epoch": 603} {"train_loss": -5.417354106903076, "global_step": 25346, "epoch": 603} {"train_loss": -5.465471267700195, "global_step": 25347, "epoch": 603} {"train_loss": -5.43797492980957, "global_step": 25348, "epoch": 603} {"train_loss": -5.526933670043945, "global_step": 25349, "epoch": 603} {"train_loss": -5.485982894897461, "global_step": 25350, "epoch": 603} {"train_loss": -5.414264678955078, "global_step": 25351, "epoch": 603} {"train_loss": -5.335747718811035, "global_step": 25352, "epoch": 603} {"train_loss": -5.5876593589782715, "global_step": 25353, "epoch": 603} {"train_loss": -5.457357883453369, "global_step": 25354, "epoch": 603} {"train_loss": -5.364986419677734, "global_step": 25355, "epoch": 603} {"train_loss": -5.295053958892822, "global_step": 25356, "epoch": 603} {"train_loss": -5.462071418762207, "global_step": 25357, "epoch": 603} {"train_loss": -5.447975158691406, "global_step": 25358, "epoch": 603} {"train_loss": -5.358380317687988, "global_step": 25359, "epoch": 603} {"train_loss": -5.339599132537842, "global_step": 25360, "epoch": 603} {"train_loss": -5.239712715148926, "global_step": 25361, "epoch": 603} {"train_loss": -5.347506999969482, "global_step": 25362, "epoch": 603} {"train_loss": -5.4689435958862305, "global_step": 25363, "epoch": 603} {"train_loss": -5.369312286376953, "global_step": 25364, "epoch": 603} {"train_loss": -5.436392307281494, "global_step": 25365, "epoch": 603} {"train_loss": -5.44611930847168, "global_step": 25366, "epoch": 603} {"train_loss": -5.406703460784185, "global_step": 25367, "epoch": 603, "val_loss": 65109.1796875} {"train_loss": -5.497407913208008, "global_step": 25368, "epoch": 604} {"train_loss": -5.3080010414123535, "global_step": 25369, "epoch": 604} {"train_loss": -5.396261215209961, "global_step": 25370, "epoch": 604} {"train_loss": -5.466958045959473, "global_step": 25371, "epoch": 604} {"train_loss": -5.448774814605713, "global_step": 25372, "epoch": 604} {"train_loss": -5.312543869018555, "global_step": 25373, "epoch": 604} {"train_loss": -5.4947099685668945, "global_step": 25374, "epoch": 604} {"train_loss": -5.383975982666016, "global_step": 25375, "epoch": 604} {"train_loss": -5.472512722015381, "global_step": 25376, "epoch": 604} {"train_loss": -5.4289350509643555, "global_step": 25377, "epoch": 604} {"train_loss": -5.470709800720215, "global_step": 25378, "epoch": 604} {"train_loss": -5.411894798278809, "global_step": 25379, "epoch": 604} {"train_loss": -5.336475372314453, "global_step": 25380, "epoch": 604} {"train_loss": -5.4704084396362305, "global_step": 25381, "epoch": 604} {"train_loss": -5.415806770324707, "global_step": 25382, "epoch": 604} {"train_loss": -5.466034889221191, "global_step": 25383, "epoch": 604} {"train_loss": -5.363180160522461, "global_step": 25384, "epoch": 604} {"train_loss": -5.375993251800537, "global_step": 25385, "epoch": 604} {"train_loss": -5.457313060760498, "global_step": 25386, "epoch": 604} {"train_loss": -5.400301456451416, "global_step": 25387, "epoch": 604} {"train_loss": -5.239978790283203, "global_step": 25388, "epoch": 604} {"train_loss": -5.264781951904297, "global_step": 25389, "epoch": 604} {"train_loss": -5.3266096115112305, "global_step": 25390, "epoch": 604} {"train_loss": -5.377915382385254, "global_step": 25391, "epoch": 604} {"train_loss": -5.410801887512207, "global_step": 25392, "epoch": 604} {"train_loss": -5.502330303192139, "global_step": 25393, "epoch": 604} {"train_loss": -5.22735595703125, "global_step": 25394, "epoch": 604} {"train_loss": -5.270402431488037, "global_step": 25395, "epoch": 604} {"train_loss": -5.414776802062988, "global_step": 25396, "epoch": 604} {"train_loss": -5.2820658683776855, "global_step": 25397, "epoch": 604} {"train_loss": -5.331804275512695, "global_step": 25398, "epoch": 604} {"train_loss": -5.458030700683594, "global_step": 25399, "epoch": 604} {"train_loss": -5.480452060699463, "global_step": 25400, "epoch": 604} {"train_loss": -5.317971229553223, "global_step": 25401, "epoch": 604} {"train_loss": -5.406065940856934, "global_step": 25402, "epoch": 604} {"train_loss": -5.409704208374023, "global_step": 25403, "epoch": 604} {"train_loss": -5.442972183227539, "global_step": 25404, "epoch": 604} {"train_loss": -5.36688232421875, "global_step": 25405, "epoch": 604} {"train_loss": -5.243738174438477, "global_step": 25406, "epoch": 604} {"train_loss": -5.3363447189331055, "global_step": 25407, "epoch": 604} {"train_loss": -5.313858985900879, "global_step": 25408, "epoch": 604} {"train_loss": -5.384695064453852, "global_step": 25409, "epoch": 604, "val_loss": 65130.54296875} {"train_loss": -5.491922378540039, "global_step": 25410, "epoch": 605} {"train_loss": -5.38375186920166, "global_step": 25411, "epoch": 605} {"train_loss": -5.472866058349609, "global_step": 25412, "epoch": 605} {"train_loss": -5.502097129821777, "global_step": 25413, "epoch": 605} {"train_loss": -5.343301773071289, "global_step": 25414, "epoch": 605} {"train_loss": -5.3032708168029785, "global_step": 25415, "epoch": 605} {"train_loss": -5.496332168579102, "global_step": 25416, "epoch": 605} {"train_loss": -5.332440376281738, "global_step": 25417, "epoch": 605} {"train_loss": -5.328639507293701, "global_step": 25418, "epoch": 605} {"train_loss": -5.451537132263184, "global_step": 25419, "epoch": 605} {"train_loss": -5.401297569274902, "global_step": 25420, "epoch": 605} {"train_loss": -5.267041206359863, "global_step": 25421, "epoch": 605} {"train_loss": -5.32715368270874, "global_step": 25422, "epoch": 605} {"train_loss": -5.29295015335083, "global_step": 25423, "epoch": 605} {"train_loss": -5.3750786781311035, "global_step": 25424, "epoch": 605} {"train_loss": -5.385784149169922, "global_step": 25425, "epoch": 605} {"train_loss": -5.2036027908325195, "global_step": 25426, "epoch": 605} {"train_loss": -5.450718879699707, "global_step": 25427, "epoch": 605} {"train_loss": -5.461709499359131, "global_step": 25428, "epoch": 605} {"train_loss": -5.172325611114502, "global_step": 25429, "epoch": 605} {"train_loss": -5.370480537414551, "global_step": 25430, "epoch": 605} {"train_loss": -5.1429901123046875, "global_step": 25431, "epoch": 605} {"train_loss": -5.441538333892822, "global_step": 25432, "epoch": 605} {"train_loss": -5.479311466217041, "global_step": 25433, "epoch": 605} {"train_loss": -5.325186729431152, "global_step": 25434, "epoch": 605} {"train_loss": -5.432467937469482, "global_step": 25435, "epoch": 605} {"train_loss": -5.405769348144531, "global_step": 25436, "epoch": 605} {"train_loss": -5.400269508361816, "global_step": 25437, "epoch": 605} {"train_loss": -5.340658187866211, "global_step": 25438, "epoch": 605} {"train_loss": -5.507671356201172, "global_step": 25439, "epoch": 605} {"train_loss": -5.384310722351074, "global_step": 25440, "epoch": 605} {"train_loss": -5.532847881317139, "global_step": 25441, "epoch": 605} {"train_loss": -5.409089088439941, "global_step": 25442, "epoch": 605} {"train_loss": -5.420666217803955, "global_step": 25443, "epoch": 605} {"train_loss": -5.555327892303467, "global_step": 25444, "epoch": 605} {"train_loss": -5.396867752075195, "global_step": 25445, "epoch": 605} {"train_loss": -5.430593013763428, "global_step": 25446, "epoch": 605} {"train_loss": -5.5745625495910645, "global_step": 25447, "epoch": 605} {"train_loss": -5.291073799133301, "global_step": 25448, "epoch": 605} {"train_loss": -5.3318071365356445, "global_step": 25449, "epoch": 605} {"train_loss": -5.317851543426514, "global_step": 25450, "epoch": 605} {"train_loss": -5.389180047171457, "global_step": 25451, "epoch": 605, "val_loss": 64803.25} {"train_loss": -5.426427364349365, "global_step": 25452, "epoch": 606} {"train_loss": -5.477601051330566, "global_step": 25453, "epoch": 606} {"train_loss": -5.542036056518555, "global_step": 25454, "epoch": 606} {"train_loss": -5.4997382164001465, "global_step": 25455, "epoch": 606} {"train_loss": -5.478615760803223, "global_step": 25456, "epoch": 606} {"train_loss": -5.459396839141846, "global_step": 25457, "epoch": 606} {"train_loss": -5.339709281921387, "global_step": 25458, "epoch": 606} {"train_loss": -5.425865173339844, "global_step": 25459, "epoch": 606} {"train_loss": -5.428908348083496, "global_step": 25460, "epoch": 606} {"train_loss": -5.451836585998535, "global_step": 25461, "epoch": 606} {"train_loss": -5.4118757247924805, "global_step": 25462, "epoch": 606} {"train_loss": -5.452937126159668, "global_step": 25463, "epoch": 606} {"train_loss": -5.453184127807617, "global_step": 25464, "epoch": 606} {"train_loss": -5.387867450714111, "global_step": 25465, "epoch": 606} {"train_loss": -5.29673957824707, "global_step": 25466, "epoch": 606} {"train_loss": -5.414887428283691, "global_step": 25467, "epoch": 606} {"train_loss": -5.484000205993652, "global_step": 25468, "epoch": 606} {"train_loss": -5.372222900390625, "global_step": 25469, "epoch": 606} {"train_loss": -5.282900810241699, "global_step": 25470, "epoch": 606} {"train_loss": -5.366257667541504, "global_step": 25471, "epoch": 606} {"train_loss": -5.367763042449951, "global_step": 25472, "epoch": 606} {"train_loss": -5.239548683166504, "global_step": 25473, "epoch": 606} {"train_loss": -5.4565019607543945, "global_step": 25474, "epoch": 606} {"train_loss": -5.268337726593018, "global_step": 25475, "epoch": 606} {"train_loss": -5.295808792114258, "global_step": 25476, "epoch": 606} {"train_loss": -5.42588472366333, "global_step": 25477, "epoch": 606} {"train_loss": -5.320528030395508, "global_step": 25478, "epoch": 606} {"train_loss": -5.30360221862793, "global_step": 25479, "epoch": 606} {"train_loss": -5.500975608825684, "global_step": 25480, "epoch": 606} {"train_loss": -5.438602447509766, "global_step": 25481, "epoch": 606} {"train_loss": -5.254358291625977, "global_step": 25482, "epoch": 606} {"train_loss": -5.429681777954102, "global_step": 25483, "epoch": 606} {"train_loss": -5.34459114074707, "global_step": 25484, "epoch": 606} {"train_loss": -5.371004581451416, "global_step": 25485, "epoch": 606} {"train_loss": -5.3870768547058105, "global_step": 25486, "epoch": 606} {"train_loss": -5.4249420166015625, "global_step": 25487, "epoch": 606} {"train_loss": -5.495409965515137, "global_step": 25488, "epoch": 606} {"train_loss": -5.423858165740967, "global_step": 25489, "epoch": 606} {"train_loss": -5.372566223144531, "global_step": 25490, "epoch": 606} {"train_loss": -5.353604316711426, "global_step": 25491, "epoch": 606} {"train_loss": -5.438274383544922, "global_step": 25492, "epoch": 606} {"train_loss": -5.401581957226708, "global_step": 25493, "epoch": 606, "val_loss": 65643.5546875} {"train_loss": -5.33931827545166, "global_step": 25494, "epoch": 607} {"train_loss": -5.343581676483154, "global_step": 25495, "epoch": 607} {"train_loss": -5.445377349853516, "global_step": 25496, "epoch": 607} {"train_loss": -5.404012203216553, "global_step": 25497, "epoch": 607} {"train_loss": -5.382358074188232, "global_step": 25498, "epoch": 607} {"train_loss": -5.371672630310059, "global_step": 25499, "epoch": 607} {"train_loss": -5.352248668670654, "global_step": 25500, "epoch": 607} {"train_loss": -5.361054420471191, "global_step": 25501, "epoch": 607} {"train_loss": -5.426348686218262, "global_step": 25502, "epoch": 607} {"train_loss": -5.533612251281738, "global_step": 25503, "epoch": 607} {"train_loss": -5.441816329956055, "global_step": 25504, "epoch": 607} {"train_loss": -5.508179664611816, "global_step": 25505, "epoch": 607} {"train_loss": -5.462779521942139, "global_step": 25506, "epoch": 607} {"train_loss": -5.4431867599487305, "global_step": 25507, "epoch": 607} {"train_loss": -5.497684001922607, "global_step": 25508, "epoch": 607} {"train_loss": -5.435705661773682, "global_step": 25509, "epoch": 607} {"train_loss": -5.402656078338623, "global_step": 25510, "epoch": 607} {"train_loss": -5.320516586303711, "global_step": 25511, "epoch": 607} {"train_loss": -5.587386131286621, "global_step": 25512, "epoch": 607} {"train_loss": -5.278209209442139, "global_step": 25513, "epoch": 607} {"train_loss": -5.260894775390625, "global_step": 25514, "epoch": 607} {"train_loss": -5.361738204956055, "global_step": 25515, "epoch": 607} {"train_loss": -5.431803226470947, "global_step": 25516, "epoch": 607} {"train_loss": -5.313760757446289, "global_step": 25517, "epoch": 607} {"train_loss": -5.350351333618164, "global_step": 25518, "epoch": 607} {"train_loss": -5.442697525024414, "global_step": 25519, "epoch": 607} {"train_loss": -5.496680736541748, "global_step": 25520, "epoch": 607} {"train_loss": -5.483813285827637, "global_step": 25521, "epoch": 607} {"train_loss": -5.36490535736084, "global_step": 25522, "epoch": 607} {"train_loss": -5.3842573165893555, "global_step": 25523, "epoch": 607} {"train_loss": -5.161435127258301, "global_step": 25524, "epoch": 607} {"train_loss": -5.327489852905273, "global_step": 25525, "epoch": 607} {"train_loss": -5.39799165725708, "global_step": 25526, "epoch": 607} {"train_loss": -5.260038375854492, "global_step": 25527, "epoch": 607} {"train_loss": -5.338743209838867, "global_step": 25528, "epoch": 607} {"train_loss": -5.403860092163086, "global_step": 25529, "epoch": 607} {"train_loss": -5.192779541015625, "global_step": 25530, "epoch": 607} {"train_loss": -5.294520378112793, "global_step": 25531, "epoch": 607} {"train_loss": -5.373199462890625, "global_step": 25532, "epoch": 607} {"train_loss": -5.236230850219727, "global_step": 25533, "epoch": 607} {"train_loss": -5.362919807434082, "global_step": 25534, "epoch": 607} {"train_loss": -5.377273423331125, "global_step": 25535, "epoch": 607, "val_loss": 64752.359375} {"train_loss": -5.475147247314453, "global_step": 25536, "epoch": 608} {"train_loss": -5.365011215209961, "global_step": 25537, "epoch": 608} {"train_loss": -5.347410202026367, "global_step": 25538, "epoch": 608} {"train_loss": -5.342349052429199, "global_step": 25539, "epoch": 608} {"train_loss": -5.300776481628418, "global_step": 25540, "epoch": 608} {"train_loss": -5.4393205642700195, "global_step": 25541, "epoch": 608} {"train_loss": -5.381101608276367, "global_step": 25542, "epoch": 608} {"train_loss": -5.427938461303711, "global_step": 25543, "epoch": 608} {"train_loss": -5.347438335418701, "global_step": 25544, "epoch": 608} {"train_loss": -5.373557090759277, "global_step": 25545, "epoch": 608} {"train_loss": -5.466988563537598, "global_step": 25546, "epoch": 608} {"train_loss": -5.330709457397461, "global_step": 25547, "epoch": 608} {"train_loss": -5.3501715660095215, "global_step": 25548, "epoch": 608} {"train_loss": -5.4592156410217285, "global_step": 25549, "epoch": 608} {"train_loss": -5.445062637329102, "global_step": 25550, "epoch": 608} {"train_loss": -5.317387580871582, "global_step": 25551, "epoch": 608} {"train_loss": -5.31016731262207, "global_step": 25552, "epoch": 608} {"train_loss": -5.396252632141113, "global_step": 25553, "epoch": 608} {"train_loss": -5.309707164764404, "global_step": 25554, "epoch": 608} {"train_loss": -5.335501670837402, "global_step": 25555, "epoch": 608} {"train_loss": -5.332590103149414, "global_step": 25556, "epoch": 608} {"train_loss": -5.36798095703125, "global_step": 25557, "epoch": 608} {"train_loss": -5.348780632019043, "global_step": 25558, "epoch": 608} {"train_loss": -5.3780059814453125, "global_step": 25559, "epoch": 608} {"train_loss": -5.436458587646484, "global_step": 25560, "epoch": 608} {"train_loss": -5.313197135925293, "global_step": 25561, "epoch": 608} {"train_loss": -5.403505802154541, "global_step": 25562, "epoch": 608} {"train_loss": -5.465904235839844, "global_step": 25563, "epoch": 608} {"train_loss": -5.428955554962158, "global_step": 25564, "epoch": 608} {"train_loss": -5.376469612121582, "global_step": 25565, "epoch": 608} {"train_loss": -5.379169940948486, "global_step": 25566, "epoch": 608} {"train_loss": -5.521557807922363, "global_step": 25567, "epoch": 608} {"train_loss": -5.431568622589111, "global_step": 25568, "epoch": 608} {"train_loss": -5.535485744476318, "global_step": 25569, "epoch": 608} {"train_loss": -5.5609211921691895, "global_step": 25570, "epoch": 608} {"train_loss": -5.646969795227051, "global_step": 25571, "epoch": 608} {"train_loss": -5.500911712646484, "global_step": 25572, "epoch": 608} {"train_loss": -5.459149360656738, "global_step": 25573, "epoch": 608} {"train_loss": -5.447058200836182, "global_step": 25574, "epoch": 608} {"train_loss": -5.32002592086792, "global_step": 25575, "epoch": 608} {"train_loss": -5.3175048828125, "global_step": 25576, "epoch": 608} {"train_loss": -5.399470703942435, "global_step": 25577, "epoch": 608, "val_loss": 65078.40234375} {"train_loss": -5.528632164001465, "global_step": 25578, "epoch": 609} {"train_loss": -5.216611385345459, "global_step": 25579, "epoch": 609} {"train_loss": -5.450557708740234, "global_step": 25580, "epoch": 609} {"train_loss": -5.218881607055664, "global_step": 25581, "epoch": 609} {"train_loss": -5.401714324951172, "global_step": 25582, "epoch": 609} {"train_loss": -5.504169464111328, "global_step": 25583, "epoch": 609} {"train_loss": -5.441425800323486, "global_step": 25584, "epoch": 609} {"train_loss": -5.342482089996338, "global_step": 25585, "epoch": 609} {"train_loss": -5.393510341644287, "global_step": 25586, "epoch": 609} {"train_loss": -5.445282936096191, "global_step": 25587, "epoch": 609} {"train_loss": -5.392693042755127, "global_step": 25588, "epoch": 609} {"train_loss": -5.393802642822266, "global_step": 25589, "epoch": 609} {"train_loss": -5.424323081970215, "global_step": 25590, "epoch": 609} {"train_loss": -5.527987480163574, "global_step": 25591, "epoch": 609} {"train_loss": -5.432826995849609, "global_step": 25592, "epoch": 609} {"train_loss": -5.303900718688965, "global_step": 25593, "epoch": 609} {"train_loss": -5.363955497741699, "global_step": 25594, "epoch": 609} {"train_loss": -5.216346740722656, "global_step": 25595, "epoch": 609} {"train_loss": -5.347631454467773, "global_step": 25596, "epoch": 609} {"train_loss": -5.495429039001465, "global_step": 25597, "epoch": 609} {"train_loss": -5.397086143493652, "global_step": 25598, "epoch": 609} {"train_loss": -5.446820259094238, "global_step": 25599, "epoch": 609} {"train_loss": -5.433979034423828, "global_step": 25600, "epoch": 609} {"train_loss": -5.3943891525268555, "global_step": 25601, "epoch": 609} {"train_loss": -5.375271320343018, "global_step": 25602, "epoch": 609} {"train_loss": -5.398898601531982, "global_step": 25603, "epoch": 609} {"train_loss": -5.411925315856934, "global_step": 25604, "epoch": 609} {"train_loss": -5.426096439361572, "global_step": 25605, "epoch": 609} {"train_loss": -5.470261573791504, "global_step": 25606, "epoch": 609} {"train_loss": -5.358014106750488, "global_step": 25607, "epoch": 609} {"train_loss": -5.375890731811523, "global_step": 25608, "epoch": 609} {"train_loss": -5.339911460876465, "global_step": 25609, "epoch": 609} {"train_loss": -5.371246814727783, "global_step": 25610, "epoch": 609} {"train_loss": -5.4841814041137695, "global_step": 25611, "epoch": 609} {"train_loss": -5.437039852142334, "global_step": 25612, "epoch": 609} {"train_loss": -5.388699054718018, "global_step": 25613, "epoch": 609} {"train_loss": -5.35997200012207, "global_step": 25614, "epoch": 609} {"train_loss": -5.4526567459106445, "global_step": 25615, "epoch": 609} {"train_loss": -5.304777145385742, "global_step": 25616, "epoch": 609} {"train_loss": -5.393561840057373, "global_step": 25617, "epoch": 609} {"train_loss": -5.264017581939697, "global_step": 25618, "epoch": 609} {"train_loss": -5.396575553076608, "global_step": 25619, "epoch": 609, "val_loss": 64766.46875} {"train_loss": -5.343674659729004, "global_step": 25620, "epoch": 610} {"train_loss": -5.446822166442871, "global_step": 25621, "epoch": 610} {"train_loss": -5.323990821838379, "global_step": 25622, "epoch": 610} {"train_loss": -5.467596054077148, "global_step": 25623, "epoch": 610} {"train_loss": -5.522618293762207, "global_step": 25624, "epoch": 610} {"train_loss": -5.269536018371582, "global_step": 25625, "epoch": 610} {"train_loss": -5.482786178588867, "global_step": 25626, "epoch": 610} {"train_loss": -5.348398208618164, "global_step": 25627, "epoch": 610} {"train_loss": -5.166446685791016, "global_step": 25628, "epoch": 610} {"train_loss": -5.369235038757324, "global_step": 25629, "epoch": 610} {"train_loss": -5.406129360198975, "global_step": 25630, "epoch": 610} {"train_loss": -5.451566696166992, "global_step": 25631, "epoch": 610} {"train_loss": -5.5127363204956055, "global_step": 25632, "epoch": 610} {"train_loss": -5.292868137359619, "global_step": 25633, "epoch": 610} {"train_loss": -5.354547023773193, "global_step": 25634, "epoch": 610} {"train_loss": -5.38297700881958, "global_step": 25635, "epoch": 610} {"train_loss": -5.337538719177246, "global_step": 25636, "epoch": 610} {"train_loss": -5.414254188537598, "global_step": 25637, "epoch": 610} {"train_loss": -5.392650127410889, "global_step": 25638, "epoch": 610} {"train_loss": -5.304984092712402, "global_step": 25639, "epoch": 610} {"train_loss": -5.394546985626221, "global_step": 25640, "epoch": 610} {"train_loss": -5.376778602600098, "global_step": 25641, "epoch": 610} {"train_loss": -5.368990421295166, "global_step": 25642, "epoch": 610} {"train_loss": -5.402059555053711, "global_step": 25643, "epoch": 610} {"train_loss": -5.424388885498047, "global_step": 25644, "epoch": 610} {"train_loss": -5.375011444091797, "global_step": 25645, "epoch": 610} {"train_loss": -5.337551593780518, "global_step": 25646, "epoch": 610} {"train_loss": -5.274923324584961, "global_step": 25647, "epoch": 610} {"train_loss": -5.424386024475098, "global_step": 25648, "epoch": 610} {"train_loss": -5.321688175201416, "global_step": 25649, "epoch": 610} {"train_loss": -5.313318729400635, "global_step": 25650, "epoch": 610} {"train_loss": -5.2922515869140625, "global_step": 25651, "epoch": 610} {"train_loss": -5.29723596572876, "global_step": 25652, "epoch": 610} {"train_loss": -5.497293472290039, "global_step": 25653, "epoch": 610} {"train_loss": -5.251927375793457, "global_step": 25654, "epoch": 610} {"train_loss": -5.364585876464844, "global_step": 25655, "epoch": 610} {"train_loss": -5.356098175048828, "global_step": 25656, "epoch": 610} {"train_loss": -5.521924018859863, "global_step": 25657, "epoch": 610} {"train_loss": -5.429561614990234, "global_step": 25658, "epoch": 610} {"train_loss": -5.491499423980713, "global_step": 25659, "epoch": 610} {"train_loss": -5.243008136749268, "global_step": 25660, "epoch": 610} {"train_loss": -5.373528707595098, "global_step": 25661, "epoch": 610, "val_loss": 65145.1875} {"train_loss": -5.294022560119629, "global_step": 25662, "epoch": 611} {"train_loss": -5.486777305603027, "global_step": 25663, "epoch": 611} {"train_loss": -5.395429611206055, "global_step": 25664, "epoch": 611} {"train_loss": -5.493271827697754, "global_step": 25665, "epoch": 611} {"train_loss": -5.4018731117248535, "global_step": 25666, "epoch": 611} {"train_loss": -5.469531059265137, "global_step": 25667, "epoch": 611} {"train_loss": -5.370968341827393, "global_step": 25668, "epoch": 611} {"train_loss": -5.562605381011963, "global_step": 25669, "epoch": 611} {"train_loss": -5.453662395477295, "global_step": 25670, "epoch": 611} {"train_loss": -5.347076416015625, "global_step": 25671, "epoch": 611} {"train_loss": -5.596759796142578, "global_step": 25672, "epoch": 611} {"train_loss": -5.415760040283203, "global_step": 25673, "epoch": 611} {"train_loss": -5.3595356941223145, "global_step": 25674, "epoch": 611} {"train_loss": -5.389233589172363, "global_step": 25675, "epoch": 611} {"train_loss": -5.455636024475098, "global_step": 25676, "epoch": 611} {"train_loss": -5.552984714508057, "global_step": 25677, "epoch": 611} {"train_loss": -5.326427936553955, "global_step": 25678, "epoch": 611} {"train_loss": -5.2394585609436035, "global_step": 25679, "epoch": 611} {"train_loss": -5.367674350738525, "global_step": 25680, "epoch": 611} {"train_loss": -5.377204895019531, "global_step": 25681, "epoch": 611} {"train_loss": -5.387450218200684, "global_step": 25682, "epoch": 611} {"train_loss": -5.3436174392700195, "global_step": 25683, "epoch": 611} {"train_loss": -5.374202728271484, "global_step": 25684, "epoch": 611} {"train_loss": -5.392292499542236, "global_step": 25685, "epoch": 611} {"train_loss": -5.359743595123291, "global_step": 25686, "epoch": 611} {"train_loss": -5.333993911743164, "global_step": 25687, "epoch": 611} {"train_loss": -5.213584899902344, "global_step": 25688, "epoch": 611} {"train_loss": -5.514041900634766, "global_step": 25689, "epoch": 611} {"train_loss": -5.372835159301758, "global_step": 25690, "epoch": 611} {"train_loss": -5.315153121948242, "global_step": 25691, "epoch": 611} {"train_loss": -5.431779861450195, "global_step": 25692, "epoch": 611} {"train_loss": -5.295827865600586, "global_step": 25693, "epoch": 611} {"train_loss": -5.370174407958984, "global_step": 25694, "epoch": 611} {"train_loss": -5.459052085876465, "global_step": 25695, "epoch": 611} {"train_loss": -5.276607036590576, "global_step": 25696, "epoch": 611} {"train_loss": -5.2701215744018555, "global_step": 25697, "epoch": 611} {"train_loss": -5.379939556121826, "global_step": 25698, "epoch": 611} {"train_loss": -5.310826301574707, "global_step": 25699, "epoch": 611} {"train_loss": -5.246671676635742, "global_step": 25700, "epoch": 611} {"train_loss": -5.355684280395508, "global_step": 25701, "epoch": 611} {"train_loss": -5.3952956199646, "global_step": 25702, "epoch": 611} {"train_loss": -5.382012594313848, "global_step": 25703, "epoch": 611, "val_loss": 65262.8671875} {"train_loss": -5.414597511291504, "global_step": 25704, "epoch": 612} {"train_loss": -5.376457214355469, "global_step": 25705, "epoch": 612} {"train_loss": -5.387508869171143, "global_step": 25706, "epoch": 612} {"train_loss": -5.362504005432129, "global_step": 25707, "epoch": 612} {"train_loss": -5.452291011810303, "global_step": 25708, "epoch": 612} {"train_loss": -5.393076419830322, "global_step": 25709, "epoch": 612} {"train_loss": -5.3775200843811035, "global_step": 25710, "epoch": 612} {"train_loss": -5.411631107330322, "global_step": 25711, "epoch": 612} {"train_loss": -5.508715629577637, "global_step": 25712, "epoch": 612} {"train_loss": -5.349597454071045, "global_step": 25713, "epoch": 612} {"train_loss": -5.417044162750244, "global_step": 25714, "epoch": 612} {"train_loss": -5.338495254516602, "global_step": 25715, "epoch": 612} {"train_loss": -5.314009189605713, "global_step": 25716, "epoch": 612} {"train_loss": -5.3809943199157715, "global_step": 25717, "epoch": 612} {"train_loss": -5.4523797035217285, "global_step": 25718, "epoch": 612} {"train_loss": -5.344552993774414, "global_step": 25719, "epoch": 612} {"train_loss": -5.249240875244141, "global_step": 25720, "epoch": 612} {"train_loss": -5.275877475738525, "global_step": 25721, "epoch": 612} {"train_loss": -5.449296951293945, "global_step": 25722, "epoch": 612} {"train_loss": -5.2768378257751465, "global_step": 25723, "epoch": 612} {"train_loss": -5.436636924743652, "global_step": 25724, "epoch": 612} {"train_loss": -5.463853359222412, "global_step": 25725, "epoch": 612} {"train_loss": -5.225444793701172, "global_step": 25726, "epoch": 612} {"train_loss": -5.427058219909668, "global_step": 25727, "epoch": 612} {"train_loss": -5.448051452636719, "global_step": 25728, "epoch": 612} {"train_loss": -5.434497356414795, "global_step": 25729, "epoch": 612} {"train_loss": -5.300311088562012, "global_step": 25730, "epoch": 612} {"train_loss": -5.460421085357666, "global_step": 25731, "epoch": 612} {"train_loss": -5.468939781188965, "global_step": 25732, "epoch": 612} {"train_loss": -5.502352714538574, "global_step": 25733, "epoch": 612} {"train_loss": -5.450990676879883, "global_step": 25734, "epoch": 612} {"train_loss": -5.42999267578125, "global_step": 25735, "epoch": 612} {"train_loss": -5.4850873947143555, "global_step": 25736, "epoch": 612} {"train_loss": -5.458608150482178, "global_step": 25737, "epoch": 612} {"train_loss": -5.528431415557861, "global_step": 25738, "epoch": 612} {"train_loss": -5.306406497955322, "global_step": 25739, "epoch": 612} {"train_loss": -5.39015007019043, "global_step": 25740, "epoch": 612} {"train_loss": -5.424000263214111, "global_step": 25741, "epoch": 612} {"train_loss": -5.34603214263916, "global_step": 25742, "epoch": 612} {"train_loss": -5.3360066413879395, "global_step": 25743, "epoch": 612} {"train_loss": -5.578638076782227, "global_step": 25744, "epoch": 612} {"train_loss": -5.401211284455799, "global_step": 25745, "epoch": 612, "val_loss": 65161.80078125} {"train_loss": -5.266550064086914, "global_step": 25746, "epoch": 613} {"train_loss": -5.349596977233887, "global_step": 25747, "epoch": 613} {"train_loss": -5.388894081115723, "global_step": 25748, "epoch": 613} {"train_loss": -5.120368957519531, "global_step": 25749, "epoch": 613} {"train_loss": -5.317177772521973, "global_step": 25750, "epoch": 613} {"train_loss": -5.36028528213501, "global_step": 25751, "epoch": 613} {"train_loss": -5.36769962310791, "global_step": 25752, "epoch": 613} {"train_loss": -5.3758931159973145, "global_step": 25753, "epoch": 613} {"train_loss": -5.310791015625, "global_step": 25754, "epoch": 613} {"train_loss": -5.346984386444092, "global_step": 25755, "epoch": 613} {"train_loss": -5.3609771728515625, "global_step": 25756, "epoch": 613} {"train_loss": -5.381382465362549, "global_step": 25757, "epoch": 613} {"train_loss": -5.337967872619629, "global_step": 25758, "epoch": 613} {"train_loss": -5.366001129150391, "global_step": 25759, "epoch": 613} {"train_loss": -5.4432854652404785, "global_step": 25760, "epoch": 613} {"train_loss": -5.267200469970703, "global_step": 25761, "epoch": 613} {"train_loss": -5.268063545227051, "global_step": 25762, "epoch": 613} {"train_loss": -5.472536563873291, "global_step": 25763, "epoch": 613} {"train_loss": -5.429886817932129, "global_step": 25764, "epoch": 613} {"train_loss": -5.496420860290527, "global_step": 25765, "epoch": 613} {"train_loss": -5.398803234100342, "global_step": 25766, "epoch": 613} {"train_loss": -5.541656970977783, "global_step": 25767, "epoch": 613} {"train_loss": -5.392797470092773, "global_step": 25768, "epoch": 613} {"train_loss": -5.342032432556152, "global_step": 25769, "epoch": 613} {"train_loss": -5.278051376342773, "global_step": 25770, "epoch": 613} {"train_loss": -5.393077850341797, "global_step": 25771, "epoch": 613} {"train_loss": -5.4123687744140625, "global_step": 25772, "epoch": 613} {"train_loss": -5.348470687866211, "global_step": 25773, "epoch": 613} {"train_loss": -5.531826019287109, "global_step": 25774, "epoch": 613} {"train_loss": -5.526625633239746, "global_step": 25775, "epoch": 613} {"train_loss": -5.389763355255127, "global_step": 25776, "epoch": 613} {"train_loss": -5.446450710296631, "global_step": 25777, "epoch": 613} {"train_loss": -5.48317813873291, "global_step": 25778, "epoch": 613} {"train_loss": -5.354346752166748, "global_step": 25779, "epoch": 613} {"train_loss": -5.346247673034668, "global_step": 25780, "epoch": 613} {"train_loss": -5.483549118041992, "global_step": 25781, "epoch": 613} {"train_loss": -5.4148712158203125, "global_step": 25782, "epoch": 613} {"train_loss": -5.45709228515625, "global_step": 25783, "epoch": 613} {"train_loss": -5.349072456359863, "global_step": 25784, "epoch": 613} {"train_loss": -5.318521499633789, "global_step": 25785, "epoch": 613} {"train_loss": -5.472927570343018, "global_step": 25786, "epoch": 613} {"train_loss": -5.382656665075393, "global_step": 25787, "epoch": 613, "val_loss": 64819.74609375} {"train_loss": -5.363739013671875, "global_step": 25788, "epoch": 614} {"train_loss": -5.410220146179199, "global_step": 25789, "epoch": 614} {"train_loss": -5.469203948974609, "global_step": 25790, "epoch": 614} {"train_loss": -5.268524646759033, "global_step": 25791, "epoch": 614} {"train_loss": -5.4071502685546875, "global_step": 25792, "epoch": 614} {"train_loss": -5.434408664703369, "global_step": 25793, "epoch": 614} {"train_loss": -5.2216620445251465, "global_step": 25794, "epoch": 614} {"train_loss": -5.528875350952148, "global_step": 25795, "epoch": 614} {"train_loss": -5.38860559463501, "global_step": 25796, "epoch": 614} {"train_loss": -5.354740619659424, "global_step": 25797, "epoch": 614} {"train_loss": -5.438652038574219, "global_step": 25798, "epoch": 614} {"train_loss": -5.50206995010376, "global_step": 25799, "epoch": 614} {"train_loss": -5.462158203125, "global_step": 25800, "epoch": 614} {"train_loss": -5.4992475509643555, "global_step": 25801, "epoch": 614} {"train_loss": -5.505383491516113, "global_step": 25802, "epoch": 614} {"train_loss": -5.406042098999023, "global_step": 25803, "epoch": 614} {"train_loss": -5.432253360748291, "global_step": 25804, "epoch": 614} {"train_loss": -5.5644636154174805, "global_step": 25805, "epoch": 614} {"train_loss": -5.44251823425293, "global_step": 25806, "epoch": 614} {"train_loss": -5.405344009399414, "global_step": 25807, "epoch": 614} {"train_loss": -5.484000205993652, "global_step": 25808, "epoch": 614} {"train_loss": -5.319624900817871, "global_step": 25809, "epoch": 614} {"train_loss": -5.455546855926514, "global_step": 25810, "epoch": 614} {"train_loss": -5.3875346183776855, "global_step": 25811, "epoch": 614} {"train_loss": -5.286080837249756, "global_step": 25812, "epoch": 614} {"train_loss": -5.248631954193115, "global_step": 25813, "epoch": 614} {"train_loss": -5.448112964630127, "global_step": 25814, "epoch": 614} {"train_loss": -5.277477741241455, "global_step": 25815, "epoch": 614} {"train_loss": -5.291367053985596, "global_step": 25816, "epoch": 614} {"train_loss": -5.422668933868408, "global_step": 25817, "epoch": 614} {"train_loss": -5.42379093170166, "global_step": 25818, "epoch": 614} {"train_loss": -5.278396129608154, "global_step": 25819, "epoch": 614} {"train_loss": -5.49345588684082, "global_step": 25820, "epoch": 614} {"train_loss": -5.291837692260742, "global_step": 25821, "epoch": 614} {"train_loss": -5.457643032073975, "global_step": 25822, "epoch": 614} {"train_loss": -5.461834907531738, "global_step": 25823, "epoch": 614} {"train_loss": -5.249287128448486, "global_step": 25824, "epoch": 614} {"train_loss": -5.481546401977539, "global_step": 25825, "epoch": 614} {"train_loss": -5.386415481567383, "global_step": 25826, "epoch": 614} {"train_loss": -5.305605888366699, "global_step": 25827, "epoch": 614} {"train_loss": -5.380243301391602, "global_step": 25828, "epoch": 614} {"train_loss": -5.400512173062279, "global_step": 25829, "epoch": 614, "val_loss": 65001.609375} {"train_loss": -5.33732795715332, "global_step": 25830, "epoch": 615} {"train_loss": -5.497923851013184, "global_step": 25831, "epoch": 615} {"train_loss": -5.44349479675293, "global_step": 25832, "epoch": 615} {"train_loss": -5.3305983543396, "global_step": 25833, "epoch": 615} {"train_loss": -5.466811656951904, "global_step": 25834, "epoch": 615} {"train_loss": -5.377511024475098, "global_step": 25835, "epoch": 615} {"train_loss": -5.239223480224609, "global_step": 25836, "epoch": 615} {"train_loss": -5.484866142272949, "global_step": 25837, "epoch": 615} {"train_loss": -5.420729160308838, "global_step": 25838, "epoch": 615} {"train_loss": -5.450976848602295, "global_step": 25839, "epoch": 615} {"train_loss": -5.398324012756348, "global_step": 25840, "epoch": 615} {"train_loss": -5.515862464904785, "global_step": 25841, "epoch": 615} {"train_loss": -5.28537130355835, "global_step": 25842, "epoch": 615} {"train_loss": -5.442153453826904, "global_step": 25843, "epoch": 615} {"train_loss": -5.450921058654785, "global_step": 25844, "epoch": 615} {"train_loss": -5.312255859375, "global_step": 25845, "epoch": 615} {"train_loss": -5.416735649108887, "global_step": 25846, "epoch": 615} {"train_loss": -5.421543121337891, "global_step": 25847, "epoch": 615} {"train_loss": -5.42240047454834, "global_step": 25848, "epoch": 615} {"train_loss": -5.57064151763916, "global_step": 25849, "epoch": 615} {"train_loss": -5.3400959968566895, "global_step": 25850, "epoch": 615} {"train_loss": -5.479430198669434, "global_step": 25851, "epoch": 615} {"train_loss": -5.558779239654541, "global_step": 25852, "epoch": 615} {"train_loss": -5.353891849517822, "global_step": 25853, "epoch": 615} {"train_loss": -5.2943315505981445, "global_step": 25854, "epoch": 615} {"train_loss": -5.41053581237793, "global_step": 25855, "epoch": 615} {"train_loss": -5.394458770751953, "global_step": 25856, "epoch": 615} {"train_loss": -5.395454406738281, "global_step": 25857, "epoch": 615} {"train_loss": -5.167520523071289, "global_step": 25858, "epoch": 615} {"train_loss": -5.262036323547363, "global_step": 25859, "epoch": 615} {"train_loss": -5.459504127502441, "global_step": 25860, "epoch": 615} {"train_loss": -5.428844928741455, "global_step": 25861, "epoch": 615} {"train_loss": -5.401120662689209, "global_step": 25862, "epoch": 615} {"train_loss": -5.351621150970459, "global_step": 25863, "epoch": 615} {"train_loss": -5.38694429397583, "global_step": 25864, "epoch": 615} {"train_loss": -5.27376651763916, "global_step": 25865, "epoch": 615} {"train_loss": -5.526233673095703, "global_step": 25866, "epoch": 615} {"train_loss": -5.378899574279785, "global_step": 25867, "epoch": 615} {"train_loss": -5.3149895668029785, "global_step": 25868, "epoch": 615} {"train_loss": -5.566744804382324, "global_step": 25869, "epoch": 615} {"train_loss": -5.53133487701416, "global_step": 25870, "epoch": 615} {"train_loss": -5.404524803161621, "global_step": 25871, "epoch": 615, "val_loss": 65254.33203125} {"train_loss": -5.239394187927246, "global_step": 25872, "epoch": 616} {"train_loss": -5.476819038391113, "global_step": 25873, "epoch": 616} {"train_loss": -5.492810249328613, "global_step": 25874, "epoch": 616} {"train_loss": -5.2432861328125, "global_step": 25875, "epoch": 616} {"train_loss": -5.439277648925781, "global_step": 25876, "epoch": 616} {"train_loss": -5.522982120513916, "global_step": 25877, "epoch": 616} {"train_loss": -5.29808235168457, "global_step": 25878, "epoch": 616} {"train_loss": -5.422138214111328, "global_step": 25879, "epoch": 616} {"train_loss": -5.417063236236572, "global_step": 25880, "epoch": 616} {"train_loss": -5.407151222229004, "global_step": 25881, "epoch": 616} {"train_loss": -5.493856430053711, "global_step": 25882, "epoch": 616} {"train_loss": -5.306221008300781, "global_step": 25883, "epoch": 616} {"train_loss": -5.32396125793457, "global_step": 25884, "epoch": 616} {"train_loss": -5.317734718322754, "global_step": 25885, "epoch": 616} {"train_loss": -5.365373611450195, "global_step": 25886, "epoch": 616} {"train_loss": -5.436842918395996, "global_step": 25887, "epoch": 616} {"train_loss": -5.522777557373047, "global_step": 25888, "epoch": 616} {"train_loss": -5.365030765533447, "global_step": 25889, "epoch": 616} {"train_loss": -5.387680530548096, "global_step": 25890, "epoch": 616} {"train_loss": -5.424294471740723, "global_step": 25891, "epoch": 616} {"train_loss": -5.329117774963379, "global_step": 25892, "epoch": 616} {"train_loss": -5.163778305053711, "global_step": 25893, "epoch": 616} {"train_loss": -5.509012699127197, "global_step": 25894, "epoch": 616} {"train_loss": -5.259878635406494, "global_step": 25895, "epoch": 616} {"train_loss": -5.486825466156006, "global_step": 25896, "epoch": 616} {"train_loss": -5.372204780578613, "global_step": 25897, "epoch": 616} {"train_loss": -5.328110218048096, "global_step": 25898, "epoch": 616} {"train_loss": -5.478818416595459, "global_step": 25899, "epoch": 616} {"train_loss": -5.4307861328125, "global_step": 25900, "epoch": 616} {"train_loss": -5.515837669372559, "global_step": 25901, "epoch": 616} {"train_loss": -5.535337924957275, "global_step": 25902, "epoch": 616} {"train_loss": -5.325042724609375, "global_step": 25903, "epoch": 616} {"train_loss": -5.3495893478393555, "global_step": 25904, "epoch": 616} {"train_loss": -5.415464401245117, "global_step": 25905, "epoch": 616} {"train_loss": -5.346235752105713, "global_step": 25906, "epoch": 616} {"train_loss": -5.462250232696533, "global_step": 25907, "epoch": 616} {"train_loss": -5.441061019897461, "global_step": 25908, "epoch": 616} {"train_loss": -5.356119632720947, "global_step": 25909, "epoch": 616} {"train_loss": -5.461435794830322, "global_step": 25910, "epoch": 616} {"train_loss": -5.489123821258545, "global_step": 25911, "epoch": 616} {"train_loss": -5.412166595458984, "global_step": 25912, "epoch": 616} {"train_loss": -5.396944034667242, "global_step": 25913, "epoch": 616, "val_loss": 64942.2265625} {"train_loss": -5.517731189727783, "global_step": 25914, "epoch": 617} {"train_loss": -5.3256402015686035, "global_step": 25915, "epoch": 617} {"train_loss": -5.319047927856445, "global_step": 25916, "epoch": 617} {"train_loss": -5.463280200958252, "global_step": 25917, "epoch": 617} {"train_loss": -5.364426136016846, "global_step": 25918, "epoch": 617} {"train_loss": -5.318243503570557, "global_step": 25919, "epoch": 617} {"train_loss": -5.358964920043945, "global_step": 25920, "epoch": 617} {"train_loss": -5.457000255584717, "global_step": 25921, "epoch": 617} {"train_loss": -5.300243854522705, "global_step": 25922, "epoch": 617} {"train_loss": -5.398865699768066, "global_step": 25923, "epoch": 617} {"train_loss": -5.475481986999512, "global_step": 25924, "epoch": 617} {"train_loss": -5.5324625968933105, "global_step": 25925, "epoch": 617} {"train_loss": -5.4683074951171875, "global_step": 25926, "epoch": 617} {"train_loss": -5.4589338302612305, "global_step": 25927, "epoch": 617} {"train_loss": -5.361507415771484, "global_step": 25928, "epoch": 617} {"train_loss": -5.362674713134766, "global_step": 25929, "epoch": 617} {"train_loss": -5.459555149078369, "global_step": 25930, "epoch": 617} {"train_loss": -5.409905433654785, "global_step": 25931, "epoch": 617} {"train_loss": -5.499740123748779, "global_step": 25932, "epoch": 617} {"train_loss": -5.376783847808838, "global_step": 25933, "epoch": 617} {"train_loss": -5.500631809234619, "global_step": 25934, "epoch": 617} {"train_loss": -5.403675556182861, "global_step": 25935, "epoch": 617} {"train_loss": -5.3870368003845215, "global_step": 25936, "epoch": 617} {"train_loss": -5.37341833114624, "global_step": 25937, "epoch": 617} {"train_loss": -5.3900675773620605, "global_step": 25938, "epoch": 617} {"train_loss": -5.443326473236084, "global_step": 25939, "epoch": 617} {"train_loss": -5.239348888397217, "global_step": 25940, "epoch": 617} {"train_loss": -5.528021335601807, "global_step": 25941, "epoch": 617} {"train_loss": -5.406104564666748, "global_step": 25942, "epoch": 617} {"train_loss": -5.469603538513184, "global_step": 25943, "epoch": 617} {"train_loss": -5.413793563842773, "global_step": 25944, "epoch": 617} {"train_loss": -5.287837028503418, "global_step": 25945, "epoch": 617} {"train_loss": -5.456364631652832, "global_step": 25946, "epoch": 617} {"train_loss": -5.41810417175293, "global_step": 25947, "epoch": 617} {"train_loss": -5.327851295471191, "global_step": 25948, "epoch": 617} {"train_loss": -5.276012420654297, "global_step": 25949, "epoch": 617} {"train_loss": -5.35395622253418, "global_step": 25950, "epoch": 617} {"train_loss": -5.234138488769531, "global_step": 25951, "epoch": 617} {"train_loss": -5.374354362487793, "global_step": 25952, "epoch": 617} {"train_loss": -5.24276065826416, "global_step": 25953, "epoch": 617} {"train_loss": -5.400680065155029, "global_step": 25954, "epoch": 617} {"train_loss": -5.394634700956798, "global_step": 25955, "epoch": 617, "val_loss": 65735.3671875} {"train_loss": -5.390401363372803, "global_step": 25956, "epoch": 618} {"train_loss": -5.4272847175598145, "global_step": 25957, "epoch": 618} {"train_loss": -5.26725959777832, "global_step": 25958, "epoch": 618} {"train_loss": -5.21140193939209, "global_step": 25959, "epoch": 618} {"train_loss": -5.43906307220459, "global_step": 25960, "epoch": 618} {"train_loss": -5.2540602684021, "global_step": 25961, "epoch": 618} {"train_loss": -5.34832763671875, "global_step": 25962, "epoch": 618} {"train_loss": -5.469252109527588, "global_step": 25963, "epoch": 618} {"train_loss": -5.384821891784668, "global_step": 25964, "epoch": 618} {"train_loss": -5.479377746582031, "global_step": 25965, "epoch": 618} {"train_loss": -5.349565029144287, "global_step": 25966, "epoch": 618} {"train_loss": -5.3462910652160645, "global_step": 25967, "epoch": 618} {"train_loss": -5.387316703796387, "global_step": 25968, "epoch": 618} {"train_loss": -5.351489543914795, "global_step": 25969, "epoch": 618} {"train_loss": -5.424065589904785, "global_step": 25970, "epoch": 618} {"train_loss": -5.471956253051758, "global_step": 25971, "epoch": 618} {"train_loss": -5.460812568664551, "global_step": 25972, "epoch": 618} {"train_loss": -5.40714168548584, "global_step": 25973, "epoch": 618} {"train_loss": -5.383790969848633, "global_step": 25974, "epoch": 618} {"train_loss": -5.4186811447143555, "global_step": 25975, "epoch": 618} {"train_loss": -5.456573963165283, "global_step": 25976, "epoch": 618} {"train_loss": -5.265138626098633, "global_step": 25977, "epoch": 618} {"train_loss": -5.456311225891113, "global_step": 25978, "epoch": 618} {"train_loss": -5.16396427154541, "global_step": 25979, "epoch": 618} {"train_loss": -5.3813252449035645, "global_step": 25980, "epoch": 618} {"train_loss": -5.44614315032959, "global_step": 25981, "epoch": 618} {"train_loss": -5.276556968688965, "global_step": 25982, "epoch": 618} {"train_loss": -5.392165184020996, "global_step": 25983, "epoch": 618} {"train_loss": -5.502407550811768, "global_step": 25984, "epoch": 618} {"train_loss": -5.522690773010254, "global_step": 25985, "epoch": 618} {"train_loss": -5.4334845542907715, "global_step": 25986, "epoch": 618} {"train_loss": -5.399112701416016, "global_step": 25987, "epoch": 618} {"train_loss": -5.373334884643555, "global_step": 25988, "epoch": 618} {"train_loss": -5.446158409118652, "global_step": 25989, "epoch": 618} {"train_loss": -5.486325263977051, "global_step": 25990, "epoch": 618} {"train_loss": -5.506621360778809, "global_step": 25991, "epoch": 618} {"train_loss": -5.487300395965576, "global_step": 25992, "epoch": 618} {"train_loss": -5.388114929199219, "global_step": 25993, "epoch": 618} {"train_loss": -5.370292663574219, "global_step": 25994, "epoch": 618} {"train_loss": -5.271721839904785, "global_step": 25995, "epoch": 618} {"train_loss": -5.259059429168701, "global_step": 25996, "epoch": 618} {"train_loss": -5.391019991465977, "global_step": 25997, "epoch": 618, "val_loss": 65589.0625} {"train_loss": -5.329956531524658, "global_step": 25998, "epoch": 619} {"train_loss": -5.457923889160156, "global_step": 25999, "epoch": 619} {"train_loss": -5.417624473571777, "global_step": 26000, "epoch": 619} {"train_loss": -5.3988189697265625, "global_step": 26001, "epoch": 619} {"train_loss": -5.464301109313965, "global_step": 26002, "epoch": 619} {"train_loss": -5.461907386779785, "global_step": 26003, "epoch": 619} {"train_loss": -5.439251899719238, "global_step": 26004, "epoch": 619} {"train_loss": -5.452023506164551, "global_step": 26005, "epoch": 619} {"train_loss": -5.393976211547852, "global_step": 26006, "epoch": 619} {"train_loss": -5.424620628356934, "global_step": 26007, "epoch": 619} {"train_loss": -5.412958145141602, "global_step": 26008, "epoch": 619} {"train_loss": -5.415839672088623, "global_step": 26009, "epoch": 619} {"train_loss": -5.395404815673828, "global_step": 26010, "epoch": 619} {"train_loss": -5.286054611206055, "global_step": 26011, "epoch": 619} {"train_loss": -5.2854108810424805, "global_step": 26012, "epoch": 619} {"train_loss": -5.271117210388184, "global_step": 26013, "epoch": 619} {"train_loss": -5.314840316772461, "global_step": 26014, "epoch": 619} {"train_loss": -5.302812576293945, "global_step": 26015, "epoch": 619} {"train_loss": -5.387451648712158, "global_step": 26016, "epoch": 619} {"train_loss": -5.479204177856445, "global_step": 26017, "epoch": 619} {"train_loss": -5.4870405197143555, "global_step": 26018, "epoch": 619} {"train_loss": -5.404788017272949, "global_step": 26019, "epoch": 619} {"train_loss": -5.337686061859131, "global_step": 26020, "epoch": 619} {"train_loss": -5.278838157653809, "global_step": 26021, "epoch": 619} {"train_loss": -5.455205917358398, "global_step": 26022, "epoch": 619} {"train_loss": -5.26961612701416, "global_step": 26023, "epoch": 619} {"train_loss": -5.487198829650879, "global_step": 26024, "epoch": 619} {"train_loss": -5.32130765914917, "global_step": 26025, "epoch": 619} {"train_loss": -5.415895462036133, "global_step": 26026, "epoch": 619} {"train_loss": -5.4061737060546875, "global_step": 26027, "epoch": 619} {"train_loss": -5.428788661956787, "global_step": 26028, "epoch": 619} {"train_loss": -5.3402910232543945, "global_step": 26029, "epoch": 619} {"train_loss": -5.496264934539795, "global_step": 26030, "epoch": 619} {"train_loss": -5.496894359588623, "global_step": 26031, "epoch": 619} {"train_loss": -5.360210418701172, "global_step": 26032, "epoch": 619} {"train_loss": -5.353497505187988, "global_step": 26033, "epoch": 619} {"train_loss": -5.595602035522461, "global_step": 26034, "epoch": 619} {"train_loss": -5.477485656738281, "global_step": 26035, "epoch": 619} {"train_loss": -5.44877815246582, "global_step": 26036, "epoch": 619} {"train_loss": -5.32509708404541, "global_step": 26037, "epoch": 619} {"train_loss": -5.393082618713379, "global_step": 26038, "epoch": 619} {"train_loss": -5.397475617272513, "global_step": 26039, "epoch": 619, "val_loss": 64511.52734375} {"train_loss": -5.379927635192871, "global_step": 26040, "epoch": 620} {"train_loss": -5.4370598793029785, "global_step": 26041, "epoch": 620} {"train_loss": -5.363198280334473, "global_step": 26042, "epoch": 620} {"train_loss": -5.426607131958008, "global_step": 26043, "epoch": 620} {"train_loss": -5.4147162437438965, "global_step": 26044, "epoch": 620} {"train_loss": -5.341083526611328, "global_step": 26045, "epoch": 620} {"train_loss": -5.310994625091553, "global_step": 26046, "epoch": 620} {"train_loss": -5.482836723327637, "global_step": 26047, "epoch": 620} {"train_loss": -5.263774871826172, "global_step": 26048, "epoch": 620} {"train_loss": -5.3993940353393555, "global_step": 26049, "epoch": 620} {"train_loss": -5.338972091674805, "global_step": 26050, "epoch": 620} {"train_loss": -5.405125617980957, "global_step": 26051, "epoch": 620} {"train_loss": -5.471381187438965, "global_step": 26052, "epoch": 620} {"train_loss": -5.308250427246094, "global_step": 26053, "epoch": 620} {"train_loss": -5.386889457702637, "global_step": 26054, "epoch": 620} {"train_loss": -5.432299613952637, "global_step": 26055, "epoch": 620} {"train_loss": -5.366253852844238, "global_step": 26056, "epoch": 620} {"train_loss": -5.376528739929199, "global_step": 26057, "epoch": 620} {"train_loss": -5.492960453033447, "global_step": 26058, "epoch": 620} {"train_loss": -5.427977561950684, "global_step": 26059, "epoch": 620} {"train_loss": -5.473268032073975, "global_step": 26060, "epoch": 620} {"train_loss": -5.422852993011475, "global_step": 26061, "epoch": 620} {"train_loss": -5.448259353637695, "global_step": 26062, "epoch": 620} {"train_loss": -5.463980674743652, "global_step": 26063, "epoch": 620} {"train_loss": -5.479681968688965, "global_step": 26064, "epoch": 620} {"train_loss": -5.520486831665039, "global_step": 26065, "epoch": 620} {"train_loss": -5.363931655883789, "global_step": 26066, "epoch": 620} {"train_loss": -5.330945014953613, "global_step": 26067, "epoch": 620} {"train_loss": -5.406922340393066, "global_step": 26068, "epoch": 620} {"train_loss": -5.415937900543213, "global_step": 26069, "epoch": 620} {"train_loss": -5.3985748291015625, "global_step": 26070, "epoch": 620} {"train_loss": -5.473690509796143, "global_step": 26071, "epoch": 620} {"train_loss": -5.417564392089844, "global_step": 26072, "epoch": 620} {"train_loss": -5.357492446899414, "global_step": 26073, "epoch": 620} {"train_loss": -5.325996398925781, "global_step": 26074, "epoch": 620} {"train_loss": -5.5436272621154785, "global_step": 26075, "epoch": 620} {"train_loss": -5.4899396896362305, "global_step": 26076, "epoch": 620} {"train_loss": -5.472372531890869, "global_step": 26077, "epoch": 620} {"train_loss": -5.430161952972412, "global_step": 26078, "epoch": 620} {"train_loss": -5.493992805480957, "global_step": 26079, "epoch": 620} {"train_loss": -5.616069793701172, "global_step": 26080, "epoch": 620} {"train_loss": -5.417066267558506, "global_step": 26081, "epoch": 620, "val_loss": 64975.09375} {"train_loss": -5.4601030349731445, "global_step": 26082, "epoch": 621} {"train_loss": -5.422060012817383, "global_step": 26083, "epoch": 621} {"train_loss": -5.417834758758545, "global_step": 26084, "epoch": 621} {"train_loss": -5.378532409667969, "global_step": 26085, "epoch": 621} {"train_loss": -5.548576831817627, "global_step": 26086, "epoch": 621} {"train_loss": -5.448602676391602, "global_step": 26087, "epoch": 621} {"train_loss": -5.476298809051514, "global_step": 26088, "epoch": 621} {"train_loss": -5.401906967163086, "global_step": 26089, "epoch": 621} {"train_loss": -5.3857035636901855, "global_step": 26090, "epoch": 621} {"train_loss": -5.383116245269775, "global_step": 26091, "epoch": 621} {"train_loss": -5.529900550842285, "global_step": 26092, "epoch": 621} {"train_loss": -5.3503522872924805, "global_step": 26093, "epoch": 621} {"train_loss": -5.349692344665527, "global_step": 26094, "epoch": 621} {"train_loss": -5.484038829803467, "global_step": 26095, "epoch": 621} {"train_loss": -5.353306770324707, "global_step": 26096, "epoch": 621} {"train_loss": -5.399415493011475, "global_step": 26097, "epoch": 621} {"train_loss": -5.397336959838867, "global_step": 26098, "epoch": 621} {"train_loss": -5.491744518280029, "global_step": 26099, "epoch": 621} {"train_loss": -5.316476821899414, "global_step": 26100, "epoch": 621} {"train_loss": -5.306271553039551, "global_step": 26101, "epoch": 621} {"train_loss": -5.317048072814941, "global_step": 26102, "epoch": 621} {"train_loss": -5.209766387939453, "global_step": 26103, "epoch": 621} {"train_loss": -5.3867998123168945, "global_step": 26104, "epoch": 621} {"train_loss": -5.243805408477783, "global_step": 26105, "epoch": 621} {"train_loss": -5.183060169219971, "global_step": 26106, "epoch": 621} {"train_loss": -5.3183722496032715, "global_step": 26107, "epoch": 621} {"train_loss": -5.147457122802734, "global_step": 26108, "epoch": 621} {"train_loss": -5.232774257659912, "global_step": 26109, "epoch": 621} {"train_loss": -5.27488899230957, "global_step": 26110, "epoch": 621} {"train_loss": -5.294519424438477, "global_step": 26111, "epoch": 621} {"train_loss": -5.256330966949463, "global_step": 26112, "epoch": 621} {"train_loss": -5.336237907409668, "global_step": 26113, "epoch": 621} {"train_loss": -5.360703945159912, "global_step": 26114, "epoch": 621} {"train_loss": -5.4826178550720215, "global_step": 26115, "epoch": 621} {"train_loss": -5.418113708496094, "global_step": 26116, "epoch": 621} {"train_loss": -5.441452503204346, "global_step": 26117, "epoch": 621} {"train_loss": -5.376283645629883, "global_step": 26118, "epoch": 621} {"train_loss": -5.333711624145508, "global_step": 26119, "epoch": 621} {"train_loss": -5.367714881896973, "global_step": 26120, "epoch": 621} {"train_loss": -5.4601335525512695, "global_step": 26121, "epoch": 621} {"train_loss": -5.221555709838867, "global_step": 26122, "epoch": 621} {"train_loss": -5.368631953284854, "global_step": 26123, "epoch": 621, "val_loss": 64767.2578125} {"train_loss": -5.442318916320801, "global_step": 26124, "epoch": 622} {"train_loss": -5.269949913024902, "global_step": 26125, "epoch": 622} {"train_loss": -5.303732872009277, "global_step": 26126, "epoch": 622} {"train_loss": -5.419521331787109, "global_step": 26127, "epoch": 622} {"train_loss": -5.5361785888671875, "global_step": 26128, "epoch": 622} {"train_loss": -5.412255764007568, "global_step": 26129, "epoch": 622} {"train_loss": -5.451329708099365, "global_step": 26130, "epoch": 622} {"train_loss": -5.366070747375488, "global_step": 26131, "epoch": 622} {"train_loss": -5.3927812576293945, "global_step": 26132, "epoch": 622} {"train_loss": -5.472329616546631, "global_step": 26133, "epoch": 622} {"train_loss": -5.476625919342041, "global_step": 26134, "epoch": 622} {"train_loss": -5.333971977233887, "global_step": 26135, "epoch": 622} {"train_loss": -5.561479568481445, "global_step": 26136, "epoch": 622} {"train_loss": -5.422795295715332, "global_step": 26137, "epoch": 622} {"train_loss": -5.447612285614014, "global_step": 26138, "epoch": 622} {"train_loss": -5.402584075927734, "global_step": 26139, "epoch": 622} {"train_loss": -5.456012725830078, "global_step": 26140, "epoch": 622} {"train_loss": -5.553274154663086, "global_step": 26141, "epoch": 622} {"train_loss": -5.375923156738281, "global_step": 26142, "epoch": 622} {"train_loss": -5.348735809326172, "global_step": 26143, "epoch": 622} {"train_loss": -5.38267183303833, "global_step": 26144, "epoch": 622} {"train_loss": -5.45598030090332, "global_step": 26145, "epoch": 622} {"train_loss": -5.3013715744018555, "global_step": 26146, "epoch": 622} {"train_loss": -5.38718843460083, "global_step": 26147, "epoch": 622} {"train_loss": -5.440492630004883, "global_step": 26148, "epoch": 622} {"train_loss": -5.365241050720215, "global_step": 26149, "epoch": 622} {"train_loss": -5.2516279220581055, "global_step": 26150, "epoch": 622} {"train_loss": -5.365187644958496, "global_step": 26151, "epoch": 622} {"train_loss": -5.429640769958496, "global_step": 26152, "epoch": 622} {"train_loss": -5.200164794921875, "global_step": 26153, "epoch": 622} {"train_loss": -5.324820041656494, "global_step": 26154, "epoch": 622} {"train_loss": -5.195714950561523, "global_step": 26155, "epoch": 622} {"train_loss": -5.048974990844727, "global_step": 26156, "epoch": 622} {"train_loss": -5.331241130828857, "global_step": 26157, "epoch": 622} {"train_loss": -5.250162601470947, "global_step": 26158, "epoch": 622} {"train_loss": -5.282374382019043, "global_step": 26159, "epoch": 622} {"train_loss": -5.314335346221924, "global_step": 26160, "epoch": 622} {"train_loss": -5.325607776641846, "global_step": 26161, "epoch": 622} {"train_loss": -5.41732120513916, "global_step": 26162, "epoch": 622} {"train_loss": -5.458162307739258, "global_step": 26163, "epoch": 622} {"train_loss": -5.254655838012695, "global_step": 26164, "epoch": 622} {"train_loss": -5.372775100526356, "global_step": 26165, "epoch": 622, "val_loss": 64866.9609375} {"train_loss": -5.495244979858398, "global_step": 26166, "epoch": 623} {"train_loss": -5.397129058837891, "global_step": 26167, "epoch": 623} {"train_loss": -5.267845153808594, "global_step": 26168, "epoch": 623} {"train_loss": -5.4323225021362305, "global_step": 26169, "epoch": 623} {"train_loss": -5.362096786499023, "global_step": 26170, "epoch": 623} {"train_loss": -5.2980451583862305, "global_step": 26171, "epoch": 623} {"train_loss": -5.4571990966796875, "global_step": 26172, "epoch": 623} {"train_loss": -5.415813446044922, "global_step": 26173, "epoch": 623} {"train_loss": -5.3783278465271, "global_step": 26174, "epoch": 623} {"train_loss": -5.532047271728516, "global_step": 26175, "epoch": 623} {"train_loss": -5.461504936218262, "global_step": 26176, "epoch": 623} {"train_loss": -5.473499298095703, "global_step": 26177, "epoch": 623} {"train_loss": -5.34119987487793, "global_step": 26178, "epoch": 623} {"train_loss": -5.34440803527832, "global_step": 26179, "epoch": 623} {"train_loss": -5.574225425720215, "global_step": 26180, "epoch": 623} {"train_loss": -5.40450382232666, "global_step": 26181, "epoch": 623} {"train_loss": -5.497311115264893, "global_step": 26182, "epoch": 623} {"train_loss": -5.394538879394531, "global_step": 26183, "epoch": 623} {"train_loss": -5.3522868156433105, "global_step": 26184, "epoch": 623} {"train_loss": -5.298623085021973, "global_step": 26185, "epoch": 623} {"train_loss": -5.42629337310791, "global_step": 26186, "epoch": 623} {"train_loss": -5.234550476074219, "global_step": 26187, "epoch": 623} {"train_loss": -5.31180477142334, "global_step": 26188, "epoch": 623} {"train_loss": -5.502494812011719, "global_step": 26189, "epoch": 623} {"train_loss": -5.4134063720703125, "global_step": 26190, "epoch": 623} {"train_loss": -5.371521472930908, "global_step": 26191, "epoch": 623} {"train_loss": -5.299480438232422, "global_step": 26192, "epoch": 623} {"train_loss": -5.362705707550049, "global_step": 26193, "epoch": 623} {"train_loss": -5.122992038726807, "global_step": 26194, "epoch": 623} {"train_loss": -5.377975940704346, "global_step": 26195, "epoch": 623} {"train_loss": -5.283254623413086, "global_step": 26196, "epoch": 623} {"train_loss": -5.270792007446289, "global_step": 26197, "epoch": 623} {"train_loss": -5.338046073913574, "global_step": 26198, "epoch": 623} {"train_loss": -5.317602157592773, "global_step": 26199, "epoch": 623} {"train_loss": -5.379457473754883, "global_step": 26200, "epoch": 623} {"train_loss": -5.3661088943481445, "global_step": 26201, "epoch": 623} {"train_loss": -5.290518283843994, "global_step": 26202, "epoch": 623} {"train_loss": -5.440875053405762, "global_step": 26203, "epoch": 623} {"train_loss": -5.292224407196045, "global_step": 26204, "epoch": 623} {"train_loss": -5.355681896209717, "global_step": 26205, "epoch": 623} {"train_loss": -5.476891994476318, "global_step": 26206, "epoch": 623} {"train_loss": -5.374711059388661, "global_step": 26207, "epoch": 623, "val_loss": 64623.140625} {"train_loss": -5.354146957397461, "global_step": 26208, "epoch": 624} {"train_loss": -5.489284992218018, "global_step": 26209, "epoch": 624} {"train_loss": -5.461620330810547, "global_step": 26210, "epoch": 624} {"train_loss": -5.425241470336914, "global_step": 26211, "epoch": 624} {"train_loss": -5.204767227172852, "global_step": 26212, "epoch": 624} {"train_loss": -5.542149543762207, "global_step": 26213, "epoch": 624} {"train_loss": -5.4815263748168945, "global_step": 26214, "epoch": 624} {"train_loss": -5.4478325843811035, "global_step": 26215, "epoch": 624} {"train_loss": -5.40308141708374, "global_step": 26216, "epoch": 624} {"train_loss": -5.443181991577148, "global_step": 26217, "epoch": 624} {"train_loss": -5.387012958526611, "global_step": 26218, "epoch": 624} {"train_loss": -5.434279918670654, "global_step": 26219, "epoch": 624} {"train_loss": -5.416214942932129, "global_step": 26220, "epoch": 624} {"train_loss": -5.4302215576171875, "global_step": 26221, "epoch": 624} {"train_loss": -5.521461009979248, "global_step": 26222, "epoch": 624} {"train_loss": -5.396334648132324, "global_step": 26223, "epoch": 624} {"train_loss": -5.368599891662598, "global_step": 26224, "epoch": 624} {"train_loss": -5.5335283279418945, "global_step": 26225, "epoch": 624} {"train_loss": -5.373526096343994, "global_step": 26226, "epoch": 624} {"train_loss": -5.46665096282959, "global_step": 26227, "epoch": 624} {"train_loss": -5.374020099639893, "global_step": 26228, "epoch": 624} {"train_loss": -5.413201332092285, "global_step": 26229, "epoch": 624} {"train_loss": -5.448239326477051, "global_step": 26230, "epoch": 624} {"train_loss": -5.571114540100098, "global_step": 26231, "epoch": 624} {"train_loss": -5.481592655181885, "global_step": 26232, "epoch": 624} {"train_loss": -5.445979118347168, "global_step": 26233, "epoch": 624} {"train_loss": -5.48510217666626, "global_step": 26234, "epoch": 624} {"train_loss": -5.375920295715332, "global_step": 26235, "epoch": 624} {"train_loss": -5.448336601257324, "global_step": 26236, "epoch": 624} {"train_loss": -5.469385147094727, "global_step": 26237, "epoch": 624} {"train_loss": -5.284296035766602, "global_step": 26238, "epoch": 624} {"train_loss": -5.421754837036133, "global_step": 26239, "epoch": 624} {"train_loss": -5.401601791381836, "global_step": 26240, "epoch": 624} {"train_loss": -5.275920391082764, "global_step": 26241, "epoch": 624} {"train_loss": -5.319029808044434, "global_step": 26242, "epoch": 624} {"train_loss": -5.250187873840332, "global_step": 26243, "epoch": 624} {"train_loss": -5.442756175994873, "global_step": 26244, "epoch": 624} {"train_loss": -5.313451290130615, "global_step": 26245, "epoch": 624} {"train_loss": -5.404529094696045, "global_step": 26246, "epoch": 624} {"train_loss": -5.343619346618652, "global_step": 26247, "epoch": 624} {"train_loss": -5.4377031326293945, "global_step": 26248, "epoch": 624} {"train_loss": -5.414831104732695, "global_step": 26249, "epoch": 624, "val_loss": 64858.0234375} {"train_loss": -5.577204704284668, "global_step": 26250, "epoch": 625} {"train_loss": -5.389675617218018, "global_step": 26251, "epoch": 625} {"train_loss": -5.413220405578613, "global_step": 26252, "epoch": 625} {"train_loss": -5.6042938232421875, "global_step": 26253, "epoch": 625} {"train_loss": -5.352687358856201, "global_step": 26254, "epoch": 625} {"train_loss": -5.408940315246582, "global_step": 26255, "epoch": 625} {"train_loss": -5.535216808319092, "global_step": 26256, "epoch": 625} {"train_loss": -5.455639839172363, "global_step": 26257, "epoch": 625} {"train_loss": -5.4141106605529785, "global_step": 26258, "epoch": 625} {"train_loss": -5.47631311416626, "global_step": 26259, "epoch": 625} {"train_loss": -5.42471981048584, "global_step": 26260, "epoch": 625} {"train_loss": -5.479426383972168, "global_step": 26261, "epoch": 625} {"train_loss": -5.309425354003906, "global_step": 26262, "epoch": 625} {"train_loss": -5.445311546325684, "global_step": 26263, "epoch": 625} {"train_loss": -5.3531646728515625, "global_step": 26264, "epoch": 625} {"train_loss": -5.428978443145752, "global_step": 26265, "epoch": 625} {"train_loss": -5.25843620300293, "global_step": 26266, "epoch": 625} {"train_loss": -5.576001167297363, "global_step": 26267, "epoch": 625} {"train_loss": -5.384270668029785, "global_step": 26268, "epoch": 625} {"train_loss": -5.368010520935059, "global_step": 26269, "epoch": 625} {"train_loss": -5.434556007385254, "global_step": 26270, "epoch": 625} {"train_loss": -5.432503700256348, "global_step": 26271, "epoch": 625} {"train_loss": -5.420342445373535, "global_step": 26272, "epoch": 625} {"train_loss": -5.38466739654541, "global_step": 26273, "epoch": 625} {"train_loss": -5.4651288986206055, "global_step": 26274, "epoch": 625} {"train_loss": -5.479706764221191, "global_step": 26275, "epoch": 625} {"train_loss": -5.44500732421875, "global_step": 26276, "epoch": 625} {"train_loss": -5.3095550537109375, "global_step": 26277, "epoch": 625} {"train_loss": -5.260540962219238, "global_step": 26278, "epoch": 625} {"train_loss": -5.404605865478516, "global_step": 26279, "epoch": 625} {"train_loss": -5.402385234832764, "global_step": 26280, "epoch": 625} {"train_loss": -5.374656677246094, "global_step": 26281, "epoch": 625} {"train_loss": -5.4006667137146, "global_step": 26282, "epoch": 625} {"train_loss": -5.404035568237305, "global_step": 26283, "epoch": 625} {"train_loss": -5.415853500366211, "global_step": 26284, "epoch": 625} {"train_loss": -5.456462383270264, "global_step": 26285, "epoch": 625} {"train_loss": -5.449057102203369, "global_step": 26286, "epoch": 625} {"train_loss": -5.472212791442871, "global_step": 26287, "epoch": 625} {"train_loss": -5.507855415344238, "global_step": 26288, "epoch": 625} {"train_loss": -5.35970401763916, "global_step": 26289, "epoch": 625} {"train_loss": -5.428090572357178, "global_step": 26290, "epoch": 625} {"train_loss": -5.4234877768017, "global_step": 26291, "epoch": 625, "val_loss": 64596.390625} {"train_loss": -5.402587413787842, "global_step": 26292, "epoch": 626} {"train_loss": -5.437771797180176, "global_step": 26293, "epoch": 626} {"train_loss": -5.246622085571289, "global_step": 26294, "epoch": 626} {"train_loss": -5.356756210327148, "global_step": 26295, "epoch": 626} {"train_loss": -5.417895317077637, "global_step": 26296, "epoch": 626} {"train_loss": -5.222033977508545, "global_step": 26297, "epoch": 626} {"train_loss": -5.488693714141846, "global_step": 26298, "epoch": 626} {"train_loss": -5.368144989013672, "global_step": 26299, "epoch": 626} {"train_loss": -5.467506408691406, "global_step": 26300, "epoch": 626} {"train_loss": -5.43316650390625, "global_step": 26301, "epoch": 626} {"train_loss": -5.463863372802734, "global_step": 26302, "epoch": 626} {"train_loss": -5.440530300140381, "global_step": 26303, "epoch": 626} {"train_loss": -5.461482048034668, "global_step": 26304, "epoch": 626} {"train_loss": -5.481295108795166, "global_step": 26305, "epoch": 626} {"train_loss": -5.617397785186768, "global_step": 26306, "epoch": 626} {"train_loss": -5.431756019592285, "global_step": 26307, "epoch": 626} {"train_loss": -5.444854259490967, "global_step": 26308, "epoch": 626} {"train_loss": -5.501001834869385, "global_step": 26309, "epoch": 626} {"train_loss": -5.201520919799805, "global_step": 26310, "epoch": 626} {"train_loss": -5.395089149475098, "global_step": 26311, "epoch": 626} {"train_loss": -5.3614182472229, "global_step": 26312, "epoch": 626} {"train_loss": -5.355007171630859, "global_step": 26313, "epoch": 626} {"train_loss": -5.362970352172852, "global_step": 26314, "epoch": 626} {"train_loss": -5.3557538986206055, "global_step": 26315, "epoch": 626} {"train_loss": -5.534403324127197, "global_step": 26316, "epoch": 626} {"train_loss": -5.262751579284668, "global_step": 26317, "epoch": 626} {"train_loss": -5.283989429473877, "global_step": 26318, "epoch": 626} {"train_loss": -5.394963264465332, "global_step": 26319, "epoch": 626} {"train_loss": -5.321033954620361, "global_step": 26320, "epoch": 626} {"train_loss": -5.39111328125, "global_step": 26321, "epoch": 626} {"train_loss": -5.494625568389893, "global_step": 26322, "epoch": 626} {"train_loss": -5.331645488739014, "global_step": 26323, "epoch": 626} {"train_loss": -5.311408996582031, "global_step": 26324, "epoch": 626} {"train_loss": -5.485564231872559, "global_step": 26325, "epoch": 626} {"train_loss": -5.339550018310547, "global_step": 26326, "epoch": 626} {"train_loss": -5.315769672393799, "global_step": 26327, "epoch": 626} {"train_loss": -5.415606498718262, "global_step": 26328, "epoch": 626} {"train_loss": -5.355986595153809, "global_step": 26329, "epoch": 626} {"train_loss": -5.306873321533203, "global_step": 26330, "epoch": 626} {"train_loss": -5.334829807281494, "global_step": 26331, "epoch": 626} {"train_loss": -5.434357166290283, "global_step": 26332, "epoch": 626} {"train_loss": -5.392475434712002, "global_step": 26333, "epoch": 626, "val_loss": 65208.1875} {"train_loss": -5.291977405548096, "global_step": 26334, "epoch": 627} {"train_loss": -5.384010314941406, "global_step": 26335, "epoch": 627} {"train_loss": -5.430751323699951, "global_step": 26336, "epoch": 627} {"train_loss": -5.342779159545898, "global_step": 26337, "epoch": 627} {"train_loss": -5.350518703460693, "global_step": 26338, "epoch": 627} {"train_loss": -5.412616729736328, "global_step": 26339, "epoch": 627} {"train_loss": -5.467832565307617, "global_step": 26340, "epoch": 627} {"train_loss": -5.251307487487793, "global_step": 26341, "epoch": 627} {"train_loss": -5.360012054443359, "global_step": 26342, "epoch": 627} {"train_loss": -5.401718616485596, "global_step": 26343, "epoch": 627} {"train_loss": -5.375497817993164, "global_step": 26344, "epoch": 627} {"train_loss": -5.315428733825684, "global_step": 26345, "epoch": 627} {"train_loss": -5.317502498626709, "global_step": 26346, "epoch": 627} {"train_loss": -5.373501777648926, "global_step": 26347, "epoch": 627} {"train_loss": -5.391592025756836, "global_step": 26348, "epoch": 627} {"train_loss": -5.444099426269531, "global_step": 26349, "epoch": 627} {"train_loss": -5.553472518920898, "global_step": 26350, "epoch": 627} {"train_loss": -5.364612579345703, "global_step": 26351, "epoch": 627} {"train_loss": -5.33637809753418, "global_step": 26352, "epoch": 627} {"train_loss": -5.354635238647461, "global_step": 26353, "epoch": 627} {"train_loss": -5.443410873413086, "global_step": 26354, "epoch": 627} {"train_loss": -5.367857456207275, "global_step": 26355, "epoch": 627} {"train_loss": -5.4082932472229, "global_step": 26356, "epoch": 627} {"train_loss": -5.402439117431641, "global_step": 26357, "epoch": 627} {"train_loss": -5.537755966186523, "global_step": 26358, "epoch": 627} {"train_loss": -5.422004699707031, "global_step": 26359, "epoch": 627} {"train_loss": -5.447826385498047, "global_step": 26360, "epoch": 627} {"train_loss": -5.395915985107422, "global_step": 26361, "epoch": 627} {"train_loss": -5.456992149353027, "global_step": 26362, "epoch": 627} {"train_loss": -5.502549648284912, "global_step": 26363, "epoch": 627} {"train_loss": -5.4657793045043945, "global_step": 26364, "epoch": 627} {"train_loss": -5.449469089508057, "global_step": 26365, "epoch": 627} {"train_loss": -5.369288921356201, "global_step": 26366, "epoch": 627} {"train_loss": -5.335201263427734, "global_step": 26367, "epoch": 627} {"train_loss": -5.424656391143799, "global_step": 26368, "epoch": 627} {"train_loss": -5.4047136306762695, "global_step": 26369, "epoch": 627} {"train_loss": -5.374162673950195, "global_step": 26370, "epoch": 627} {"train_loss": -5.32692813873291, "global_step": 26371, "epoch": 627} {"train_loss": -5.441819190979004, "global_step": 26372, "epoch": 627} {"train_loss": -5.444586753845215, "global_step": 26373, "epoch": 627} {"train_loss": -5.343559265136719, "global_step": 26374, "epoch": 627} {"train_loss": -5.398737839290074, "global_step": 26375, "epoch": 627, "val_loss": 65215.796875} {"train_loss": -5.338207244873047, "global_step": 26376, "epoch": 628} {"train_loss": -5.345088005065918, "global_step": 26377, "epoch": 628} {"train_loss": -5.334497451782227, "global_step": 26378, "epoch": 628} {"train_loss": -5.2211198806762695, "global_step": 26379, "epoch": 628} {"train_loss": -5.467196464538574, "global_step": 26380, "epoch": 628} {"train_loss": -5.226900100708008, "global_step": 26381, "epoch": 628} {"train_loss": -5.25844669342041, "global_step": 26382, "epoch": 628} {"train_loss": -5.208244323730469, "global_step": 26383, "epoch": 628} {"train_loss": -5.3359222412109375, "global_step": 26384, "epoch": 628} {"train_loss": -5.288921356201172, "global_step": 26385, "epoch": 628} {"train_loss": -5.4277167320251465, "global_step": 26386, "epoch": 628} {"train_loss": -5.49985408782959, "global_step": 26387, "epoch": 628} {"train_loss": -5.48246955871582, "global_step": 26388, "epoch": 628} {"train_loss": -5.258048057556152, "global_step": 26389, "epoch": 628} {"train_loss": -5.531103134155273, "global_step": 26390, "epoch": 628} {"train_loss": -5.254676818847656, "global_step": 26391, "epoch": 628} {"train_loss": -5.419817924499512, "global_step": 26392, "epoch": 628} {"train_loss": -5.463930606842041, "global_step": 26393, "epoch": 628} {"train_loss": -5.332990646362305, "global_step": 26394, "epoch": 628} {"train_loss": -5.486314296722412, "global_step": 26395, "epoch": 628} {"train_loss": -5.290632724761963, "global_step": 26396, "epoch": 628} {"train_loss": -5.367891311645508, "global_step": 26397, "epoch": 628} {"train_loss": -5.253273010253906, "global_step": 26398, "epoch": 628} {"train_loss": -5.455350875854492, "global_step": 26399, "epoch": 628} {"train_loss": -5.292325496673584, "global_step": 26400, "epoch": 628} {"train_loss": -5.401400089263916, "global_step": 26401, "epoch": 628} {"train_loss": -5.379372596740723, "global_step": 26402, "epoch": 628} {"train_loss": -5.375940799713135, "global_step": 26403, "epoch": 628} {"train_loss": -5.456781387329102, "global_step": 26404, "epoch": 628} {"train_loss": -5.493094444274902, "global_step": 26405, "epoch": 628} {"train_loss": -5.457701206207275, "global_step": 26406, "epoch": 628} {"train_loss": -5.335731029510498, "global_step": 26407, "epoch": 628} {"train_loss": -5.319077968597412, "global_step": 26408, "epoch": 628} {"train_loss": -5.420615196228027, "global_step": 26409, "epoch": 628} {"train_loss": -5.599056243896484, "global_step": 26410, "epoch": 628} {"train_loss": -5.457425117492676, "global_step": 26411, "epoch": 628} {"train_loss": -5.488064289093018, "global_step": 26412, "epoch": 628} {"train_loss": -5.574565887451172, "global_step": 26413, "epoch": 628} {"train_loss": -5.460154056549072, "global_step": 26414, "epoch": 628} {"train_loss": -5.385117530822754, "global_step": 26415, "epoch": 628} {"train_loss": -5.3743438720703125, "global_step": 26416, "epoch": 628} {"train_loss": -5.3891578288305375, "global_step": 26417, "epoch": 628, "val_loss": 64528.234375} {"train_loss": -5.466272830963135, "global_step": 26418, "epoch": 629} {"train_loss": -5.550895690917969, "global_step": 26419, "epoch": 629} {"train_loss": -5.517124176025391, "global_step": 26420, "epoch": 629} {"train_loss": -5.4704060554504395, "global_step": 26421, "epoch": 629} {"train_loss": -5.41987419128418, "global_step": 26422, "epoch": 629} {"train_loss": -5.3767991065979, "global_step": 26423, "epoch": 629} {"train_loss": -5.370248317718506, "global_step": 26424, "epoch": 629} {"train_loss": -5.322046756744385, "global_step": 26425, "epoch": 629} {"train_loss": -5.301419258117676, "global_step": 26426, "epoch": 629} {"train_loss": -5.423676490783691, "global_step": 26427, "epoch": 629} {"train_loss": -5.446202278137207, "global_step": 26428, "epoch": 629} {"train_loss": -5.211620807647705, "global_step": 26429, "epoch": 629} {"train_loss": -5.4627532958984375, "global_step": 26430, "epoch": 629} {"train_loss": -5.378572463989258, "global_step": 26431, "epoch": 629} {"train_loss": -5.455388069152832, "global_step": 26432, "epoch": 629} {"train_loss": -5.410529136657715, "global_step": 26433, "epoch": 629} {"train_loss": -5.490373134613037, "global_step": 26434, "epoch": 629} {"train_loss": -5.266016006469727, "global_step": 26435, "epoch": 629} {"train_loss": -5.2877960205078125, "global_step": 26436, "epoch": 629} {"train_loss": -5.406205654144287, "global_step": 26437, "epoch": 629} {"train_loss": -5.384230613708496, "global_step": 26438, "epoch": 629} {"train_loss": -5.4447245597839355, "global_step": 26439, "epoch": 629} {"train_loss": -5.383007049560547, "global_step": 26440, "epoch": 629} {"train_loss": -5.195213794708252, "global_step": 26441, "epoch": 629} {"train_loss": -5.301725387573242, "global_step": 26442, "epoch": 629} {"train_loss": -5.436805248260498, "global_step": 26443, "epoch": 629} {"train_loss": -5.4511637687683105, "global_step": 26444, "epoch": 629} {"train_loss": -5.444133758544922, "global_step": 26445, "epoch": 629} {"train_loss": -5.391793251037598, "global_step": 26446, "epoch": 629} {"train_loss": -5.422451019287109, "global_step": 26447, "epoch": 629} {"train_loss": -5.501494407653809, "global_step": 26448, "epoch": 629} {"train_loss": -5.408334255218506, "global_step": 26449, "epoch": 629} {"train_loss": -5.400343894958496, "global_step": 26450, "epoch": 629} {"train_loss": -5.423041343688965, "global_step": 26451, "epoch": 629} {"train_loss": -5.425416469573975, "global_step": 26452, "epoch": 629} {"train_loss": -5.368792533874512, "global_step": 26453, "epoch": 629} {"train_loss": -5.511534214019775, "global_step": 26454, "epoch": 629} {"train_loss": -5.391109943389893, "global_step": 26455, "epoch": 629} {"train_loss": -5.558562278747559, "global_step": 26456, "epoch": 629} {"train_loss": -5.372081756591797, "global_step": 26457, "epoch": 629} {"train_loss": -5.536472320556641, "global_step": 26458, "epoch": 629} {"train_loss": -5.410906144550869, "global_step": 26459, "epoch": 629, "val_loss": 64612.984375} {"train_loss": -5.445331573486328, "global_step": 26460, "epoch": 630} {"train_loss": -5.17136287689209, "global_step": 26461, "epoch": 630} {"train_loss": -5.332162857055664, "global_step": 26462, "epoch": 630} {"train_loss": -5.362972259521484, "global_step": 26463, "epoch": 630} {"train_loss": -5.338254928588867, "global_step": 26464, "epoch": 630} {"train_loss": -5.373302936553955, "global_step": 26465, "epoch": 630} {"train_loss": -5.450478553771973, "global_step": 26466, "epoch": 630} {"train_loss": -5.517358779907227, "global_step": 26467, "epoch": 630} {"train_loss": -5.523088455200195, "global_step": 26468, "epoch": 630} {"train_loss": -5.413123607635498, "global_step": 26469, "epoch": 630} {"train_loss": -5.346072196960449, "global_step": 26470, "epoch": 630} {"train_loss": -5.324121475219727, "global_step": 26471, "epoch": 630} {"train_loss": -5.536764144897461, "global_step": 26472, "epoch": 630} {"train_loss": -5.49354362487793, "global_step": 26473, "epoch": 630} {"train_loss": -5.398264408111572, "global_step": 26474, "epoch": 630} {"train_loss": -5.295351982116699, "global_step": 26475, "epoch": 630} {"train_loss": -5.408159255981445, "global_step": 26476, "epoch": 630} {"train_loss": -5.511984825134277, "global_step": 26477, "epoch": 630} {"train_loss": -5.546975612640381, "global_step": 26478, "epoch": 630} {"train_loss": -5.517453670501709, "global_step": 26479, "epoch": 630} {"train_loss": -5.420228004455566, "global_step": 26480, "epoch": 630} {"train_loss": -5.3724212646484375, "global_step": 26481, "epoch": 630} {"train_loss": -5.495175361633301, "global_step": 26482, "epoch": 630} {"train_loss": -5.4115095138549805, "global_step": 26483, "epoch": 630} {"train_loss": -5.314548015594482, "global_step": 26484, "epoch": 630} {"train_loss": -5.502645015716553, "global_step": 26485, "epoch": 630} {"train_loss": -5.4715070724487305, "global_step": 26486, "epoch": 630} {"train_loss": -5.504514694213867, "global_step": 26487, "epoch": 630} {"train_loss": -5.390527725219727, "global_step": 26488, "epoch": 630} {"train_loss": -5.4622392654418945, "global_step": 26489, "epoch": 630} {"train_loss": -5.378405570983887, "global_step": 26490, "epoch": 630} {"train_loss": -5.356245517730713, "global_step": 26491, "epoch": 630} {"train_loss": -5.351945877075195, "global_step": 26492, "epoch": 630} {"train_loss": -5.521542549133301, "global_step": 26493, "epoch": 630} {"train_loss": -5.433711051940918, "global_step": 26494, "epoch": 630} {"train_loss": -5.391383171081543, "global_step": 26495, "epoch": 630} {"train_loss": -5.424503326416016, "global_step": 26496, "epoch": 630} {"train_loss": -5.270864486694336, "global_step": 26497, "epoch": 630} {"train_loss": -5.4321160316467285, "global_step": 26498, "epoch": 630} {"train_loss": -5.503921031951904, "global_step": 26499, "epoch": 630} {"train_loss": -5.211080074310303, "global_step": 26500, "epoch": 630} {"train_loss": -5.41332889738537, "global_step": 26501, "epoch": 630, "val_loss": 64914.30078125} {"train_loss": -5.321166515350342, "global_step": 26502, "epoch": 631} {"train_loss": -5.275025367736816, "global_step": 26503, "epoch": 631} {"train_loss": -5.445207118988037, "global_step": 26504, "epoch": 631} {"train_loss": -5.288363456726074, "global_step": 26505, "epoch": 631} {"train_loss": -5.374464988708496, "global_step": 26506, "epoch": 631} {"train_loss": -5.53317403793335, "global_step": 26507, "epoch": 631} {"train_loss": -5.418373107910156, "global_step": 26508, "epoch": 631} {"train_loss": -5.409540176391602, "global_step": 26509, "epoch": 631} {"train_loss": -5.334469795227051, "global_step": 26510, "epoch": 631} {"train_loss": -5.5049214363098145, "global_step": 26511, "epoch": 631} {"train_loss": -5.418045520782471, "global_step": 26512, "epoch": 631} {"train_loss": -5.432352542877197, "global_step": 26513, "epoch": 631} {"train_loss": -5.380756378173828, "global_step": 26514, "epoch": 631} {"train_loss": -5.471575736999512, "global_step": 26515, "epoch": 631} {"train_loss": -5.261054992675781, "global_step": 26516, "epoch": 631} {"train_loss": -5.3657732009887695, "global_step": 26517, "epoch": 631} {"train_loss": -5.537308216094971, "global_step": 26518, "epoch": 631} {"train_loss": -5.360320568084717, "global_step": 26519, "epoch": 631} {"train_loss": -5.339465618133545, "global_step": 26520, "epoch": 631} {"train_loss": -5.42871618270874, "global_step": 26521, "epoch": 631} {"train_loss": -5.515511512756348, "global_step": 26522, "epoch": 631} {"train_loss": -5.41017484664917, "global_step": 26523, "epoch": 631} {"train_loss": -5.434340476989746, "global_step": 26524, "epoch": 631} {"train_loss": -5.45487642288208, "global_step": 26525, "epoch": 631} {"train_loss": -5.368121147155762, "global_step": 26526, "epoch": 631} {"train_loss": -5.4088873863220215, "global_step": 26527, "epoch": 631} {"train_loss": -5.3618011474609375, "global_step": 26528, "epoch": 631} {"train_loss": -5.3389177322387695, "global_step": 26529, "epoch": 631} {"train_loss": -5.372762203216553, "global_step": 26530, "epoch": 631} {"train_loss": -5.484515190124512, "global_step": 26531, "epoch": 631} {"train_loss": -5.595728397369385, "global_step": 26532, "epoch": 631} {"train_loss": -5.410865783691406, "global_step": 26533, "epoch": 631} {"train_loss": -5.587339401245117, "global_step": 26534, "epoch": 631} {"train_loss": -5.369050979614258, "global_step": 26535, "epoch": 631} {"train_loss": -5.41200065612793, "global_step": 26536, "epoch": 631} {"train_loss": -5.422460556030273, "global_step": 26537, "epoch": 631} {"train_loss": -5.437478065490723, "global_step": 26538, "epoch": 631} {"train_loss": -5.507325649261475, "global_step": 26539, "epoch": 631} {"train_loss": -5.420498371124268, "global_step": 26540, "epoch": 631} {"train_loss": -5.420427322387695, "global_step": 26541, "epoch": 631} {"train_loss": -5.330036163330078, "global_step": 26542, "epoch": 631} {"train_loss": -5.413890861329579, "global_step": 26543, "epoch": 631, "val_loss": 64561.2265625} {"train_loss": -5.473886966705322, "global_step": 26544, "epoch": 632} {"train_loss": -5.490265369415283, "global_step": 26545, "epoch": 632} {"train_loss": -5.38352108001709, "global_step": 26546, "epoch": 632} {"train_loss": -5.385936737060547, "global_step": 26547, "epoch": 632} {"train_loss": -5.334719657897949, "global_step": 26548, "epoch": 632} {"train_loss": -5.453290939331055, "global_step": 26549, "epoch": 632} {"train_loss": -5.45472526550293, "global_step": 26550, "epoch": 632} {"train_loss": -5.533221244812012, "global_step": 26551, "epoch": 632} {"train_loss": -5.38333797454834, "global_step": 26552, "epoch": 632} {"train_loss": -5.537723541259766, "global_step": 26553, "epoch": 632} {"train_loss": -5.453824520111084, "global_step": 26554, "epoch": 632} {"train_loss": -5.418886184692383, "global_step": 26555, "epoch": 632} {"train_loss": -5.4163947105407715, "global_step": 26556, "epoch": 632} {"train_loss": -5.374100685119629, "global_step": 26557, "epoch": 632} {"train_loss": -5.5628437995910645, "global_step": 26558, "epoch": 632} {"train_loss": -5.364275932312012, "global_step": 26559, "epoch": 632} {"train_loss": -5.450646877288818, "global_step": 26560, "epoch": 632} {"train_loss": -5.417167663574219, "global_step": 26561, "epoch": 632} {"train_loss": -5.378298759460449, "global_step": 26562, "epoch": 632} {"train_loss": -5.2017316818237305, "global_step": 26563, "epoch": 632} {"train_loss": -5.33107852935791, "global_step": 26564, "epoch": 632} {"train_loss": -5.393350601196289, "global_step": 26565, "epoch": 632} {"train_loss": -5.342901229858398, "global_step": 26566, "epoch": 632} {"train_loss": -5.3707594871521, "global_step": 26567, "epoch": 632} {"train_loss": -5.441030025482178, "global_step": 26568, "epoch": 632} {"train_loss": -5.366622447967529, "global_step": 26569, "epoch": 632} {"train_loss": -5.45518684387207, "global_step": 26570, "epoch": 632} {"train_loss": -5.433807849884033, "global_step": 26571, "epoch": 632} {"train_loss": -5.48222541809082, "global_step": 26572, "epoch": 632} {"train_loss": -5.352481842041016, "global_step": 26573, "epoch": 632} {"train_loss": -5.4805450439453125, "global_step": 26574, "epoch": 632} {"train_loss": -5.447759628295898, "global_step": 26575, "epoch": 632} {"train_loss": -5.442073822021484, "global_step": 26576, "epoch": 632} {"train_loss": -5.3148345947265625, "global_step": 26577, "epoch": 632} {"train_loss": -5.457602024078369, "global_step": 26578, "epoch": 632} {"train_loss": -5.413364410400391, "global_step": 26579, "epoch": 632} {"train_loss": -5.456391334533691, "global_step": 26580, "epoch": 632} {"train_loss": -5.450153350830078, "global_step": 26581, "epoch": 632} {"train_loss": -5.376672744750977, "global_step": 26582, "epoch": 632} {"train_loss": -5.3476176261901855, "global_step": 26583, "epoch": 632} {"train_loss": -5.376688003540039, "global_step": 26584, "epoch": 632} {"train_loss": -5.414388543083554, "global_step": 26585, "epoch": 632, "val_loss": 64773.41015625} {"train_loss": -5.4195356369018555, "global_step": 26586, "epoch": 633} {"train_loss": -5.464442253112793, "global_step": 26587, "epoch": 633} {"train_loss": -5.3077073097229, "global_step": 26588, "epoch": 633} {"train_loss": -5.471189498901367, "global_step": 26589, "epoch": 633} {"train_loss": -5.350553512573242, "global_step": 26590, "epoch": 633} {"train_loss": -5.298189163208008, "global_step": 26591, "epoch": 633} {"train_loss": -5.496587753295898, "global_step": 26592, "epoch": 633} {"train_loss": -5.360946178436279, "global_step": 26593, "epoch": 633} {"train_loss": -5.485813140869141, "global_step": 26594, "epoch": 633} {"train_loss": -5.501830101013184, "global_step": 26595, "epoch": 633} {"train_loss": -5.341554641723633, "global_step": 26596, "epoch": 633} {"train_loss": -5.359832286834717, "global_step": 26597, "epoch": 633} {"train_loss": -5.480717658996582, "global_step": 26598, "epoch": 633} {"train_loss": -5.3956990242004395, "global_step": 26599, "epoch": 633} {"train_loss": -5.457201957702637, "global_step": 26600, "epoch": 633} {"train_loss": -5.494128704071045, "global_step": 26601, "epoch": 633} {"train_loss": -5.522614479064941, "global_step": 26602, "epoch": 633} {"train_loss": -5.3748555183410645, "global_step": 26603, "epoch": 633} {"train_loss": -5.479233264923096, "global_step": 26604, "epoch": 633} {"train_loss": -5.406749725341797, "global_step": 26605, "epoch": 633} {"train_loss": -5.456175327301025, "global_step": 26606, "epoch": 633} {"train_loss": -5.438717842102051, "global_step": 26607, "epoch": 633} {"train_loss": -5.404253959655762, "global_step": 26608, "epoch": 633} {"train_loss": -5.370232105255127, "global_step": 26609, "epoch": 633} {"train_loss": -5.426032066345215, "global_step": 26610, "epoch": 633} {"train_loss": -5.338451385498047, "global_step": 26611, "epoch": 633} {"train_loss": -5.3643903732299805, "global_step": 26612, "epoch": 633} {"train_loss": -5.41711950302124, "global_step": 26613, "epoch": 633} {"train_loss": -5.381199836730957, "global_step": 26614, "epoch": 633} {"train_loss": -5.424450874328613, "global_step": 26615, "epoch": 633} {"train_loss": -5.495530128479004, "global_step": 26616, "epoch": 633} {"train_loss": -5.425906658172607, "global_step": 26617, "epoch": 633} {"train_loss": -5.425359725952148, "global_step": 26618, "epoch": 633} {"train_loss": -5.337040424346924, "global_step": 26619, "epoch": 633} {"train_loss": -5.392208099365234, "global_step": 26620, "epoch": 633} {"train_loss": -5.384408950805664, "global_step": 26621, "epoch": 633} {"train_loss": -5.5217695236206055, "global_step": 26622, "epoch": 633} {"train_loss": -5.421521186828613, "global_step": 26623, "epoch": 633} {"train_loss": -5.302567481994629, "global_step": 26624, "epoch": 633} {"train_loss": -5.396399974822998, "global_step": 26625, "epoch": 633} {"train_loss": -5.489951133728027, "global_step": 26626, "epoch": 633} {"train_loss": -5.415841465904599, "global_step": 26627, "epoch": 633, "val_loss": 64479.0} {"train_loss": -5.462176322937012, "global_step": 26628, "epoch": 634} {"train_loss": -5.405651092529297, "global_step": 26629, "epoch": 634} {"train_loss": -5.402116298675537, "global_step": 26630, "epoch": 634} {"train_loss": -5.387337684631348, "global_step": 26631, "epoch": 634} {"train_loss": -5.449517250061035, "global_step": 26632, "epoch": 634} {"train_loss": -5.408417701721191, "global_step": 26633, "epoch": 634} {"train_loss": -5.437167644500732, "global_step": 26634, "epoch": 634} {"train_loss": -5.385983943939209, "global_step": 26635, "epoch": 634} {"train_loss": -5.492918968200684, "global_step": 26636, "epoch": 634} {"train_loss": -5.3767852783203125, "global_step": 26637, "epoch": 634} {"train_loss": -5.496872901916504, "global_step": 26638, "epoch": 634} {"train_loss": -5.4146013259887695, "global_step": 26639, "epoch": 634} {"train_loss": -5.516181468963623, "global_step": 26640, "epoch": 634} {"train_loss": -5.443916320800781, "global_step": 26641, "epoch": 634} {"train_loss": -5.346988201141357, "global_step": 26642, "epoch": 634} {"train_loss": -5.419058799743652, "global_step": 26643, "epoch": 634} {"train_loss": -5.5067291259765625, "global_step": 26644, "epoch": 634} {"train_loss": -5.430810928344727, "global_step": 26645, "epoch": 634} {"train_loss": -5.4825663566589355, "global_step": 26646, "epoch": 634} {"train_loss": -5.501941680908203, "global_step": 26647, "epoch": 634} {"train_loss": -5.314842224121094, "global_step": 26648, "epoch": 634} {"train_loss": -5.3776092529296875, "global_step": 26649, "epoch": 634} {"train_loss": -5.342717170715332, "global_step": 26650, "epoch": 634} {"train_loss": -5.47531270980835, "global_step": 26651, "epoch": 634} {"train_loss": -5.365320205688477, "global_step": 26652, "epoch": 634} {"train_loss": -5.422595500946045, "global_step": 26653, "epoch": 634} {"train_loss": -5.536691665649414, "global_step": 26654, "epoch": 634} {"train_loss": -5.33660888671875, "global_step": 26655, "epoch": 634} {"train_loss": -5.400573253631592, "global_step": 26656, "epoch": 634} {"train_loss": -5.353890419006348, "global_step": 26657, "epoch": 634} {"train_loss": -5.459102153778076, "global_step": 26658, "epoch": 634} {"train_loss": -5.4219770431518555, "global_step": 26659, "epoch": 634} {"train_loss": -5.451855659484863, "global_step": 26660, "epoch": 634} {"train_loss": -5.523736000061035, "global_step": 26661, "epoch": 634} {"train_loss": -5.421610355377197, "global_step": 26662, "epoch": 634} {"train_loss": -5.394710540771484, "global_step": 26663, "epoch": 634} {"train_loss": -5.510858535766602, "global_step": 26664, "epoch": 634} {"train_loss": -5.455799102783203, "global_step": 26665, "epoch": 634} {"train_loss": -5.2902374267578125, "global_step": 26666, "epoch": 634} {"train_loss": -5.385686874389648, "global_step": 26667, "epoch": 634} {"train_loss": -5.588984489440918, "global_step": 26668, "epoch": 634} {"train_loss": -5.427863484337216, "global_step": 26669, "epoch": 634, "val_loss": 64348.84375} {"train_loss": -5.329789638519287, "global_step": 26670, "epoch": 635} {"train_loss": -5.5119805335998535, "global_step": 26671, "epoch": 635} {"train_loss": -5.411962509155273, "global_step": 26672, "epoch": 635} {"train_loss": -5.311726093292236, "global_step": 26673, "epoch": 635} {"train_loss": -5.323980331420898, "global_step": 26674, "epoch": 635} {"train_loss": -5.376514911651611, "global_step": 26675, "epoch": 635} {"train_loss": -5.3933515548706055, "global_step": 26676, "epoch": 635} {"train_loss": -5.152047634124756, "global_step": 26677, "epoch": 635} {"train_loss": -5.354942798614502, "global_step": 26678, "epoch": 635} {"train_loss": -5.377009391784668, "global_step": 26679, "epoch": 635} {"train_loss": -5.2930684089660645, "global_step": 26680, "epoch": 635} {"train_loss": -5.4499969482421875, "global_step": 26681, "epoch": 635} {"train_loss": -5.5367512702941895, "global_step": 26682, "epoch": 635} {"train_loss": -5.342161178588867, "global_step": 26683, "epoch": 635} {"train_loss": -5.322632789611816, "global_step": 26684, "epoch": 635} {"train_loss": -5.456606864929199, "global_step": 26685, "epoch": 635} {"train_loss": -5.410892963409424, "global_step": 26686, "epoch": 635} {"train_loss": -5.32871150970459, "global_step": 26687, "epoch": 635} {"train_loss": -5.301830291748047, "global_step": 26688, "epoch": 635} {"train_loss": -5.419847011566162, "global_step": 26689, "epoch": 635} {"train_loss": -5.326225757598877, "global_step": 26690, "epoch": 635} {"train_loss": -5.3801093101501465, "global_step": 26691, "epoch": 635} {"train_loss": -5.381707191467285, "global_step": 26692, "epoch": 635} {"train_loss": -5.465244293212891, "global_step": 26693, "epoch": 635} {"train_loss": -5.386643886566162, "global_step": 26694, "epoch": 635} {"train_loss": -5.26944637298584, "global_step": 26695, "epoch": 635} {"train_loss": -5.339202404022217, "global_step": 26696, "epoch": 635} {"train_loss": -5.570068359375, "global_step": 26697, "epoch": 635} {"train_loss": -5.349875450134277, "global_step": 26698, "epoch": 635} {"train_loss": -5.482822418212891, "global_step": 26699, "epoch": 635} {"train_loss": -5.334768295288086, "global_step": 26700, "epoch": 635} {"train_loss": -5.432481288909912, "global_step": 26701, "epoch": 635} {"train_loss": -5.4145002365112305, "global_step": 26702, "epoch": 635} {"train_loss": -5.488764762878418, "global_step": 26703, "epoch": 635} {"train_loss": -5.452386379241943, "global_step": 26704, "epoch": 635} {"train_loss": -5.4188151359558105, "global_step": 26705, "epoch": 635} {"train_loss": -5.404848575592041, "global_step": 26706, "epoch": 635} {"train_loss": -5.446366310119629, "global_step": 26707, "epoch": 635} {"train_loss": -5.482303619384766, "global_step": 26708, "epoch": 635} {"train_loss": -5.320654392242432, "global_step": 26709, "epoch": 635} {"train_loss": -5.360138893127441, "global_step": 26710, "epoch": 635} {"train_loss": -5.387990894771757, "global_step": 26711, "epoch": 635, "val_loss": 64506.45703125} {"train_loss": -5.348260879516602, "global_step": 26712, "epoch": 636} {"train_loss": -5.454237937927246, "global_step": 26713, "epoch": 636} {"train_loss": -5.346527099609375, "global_step": 26714, "epoch": 636} {"train_loss": -5.380949974060059, "global_step": 26715, "epoch": 636} {"train_loss": -5.319695949554443, "global_step": 26716, "epoch": 636} {"train_loss": -5.381628036499023, "global_step": 26717, "epoch": 636} {"train_loss": -5.628751754760742, "global_step": 26718, "epoch": 636} {"train_loss": -5.327995777130127, "global_step": 26719, "epoch": 636} {"train_loss": -5.284914016723633, "global_step": 26720, "epoch": 636} {"train_loss": -5.478904724121094, "global_step": 26721, "epoch": 636} {"train_loss": -5.426551342010498, "global_step": 26722, "epoch": 636} {"train_loss": -5.608451843261719, "global_step": 26723, "epoch": 636} {"train_loss": -5.517751216888428, "global_step": 26724, "epoch": 636} {"train_loss": -5.417847633361816, "global_step": 26725, "epoch": 636} {"train_loss": -5.480104923248291, "global_step": 26726, "epoch": 636} {"train_loss": -5.435777187347412, "global_step": 26727, "epoch": 636} {"train_loss": -5.454141616821289, "global_step": 26728, "epoch": 636} {"train_loss": -5.364238739013672, "global_step": 26729, "epoch": 636} {"train_loss": -5.617865562438965, "global_step": 26730, "epoch": 636} {"train_loss": -5.327521800994873, "global_step": 26731, "epoch": 636} {"train_loss": -5.556052207946777, "global_step": 26732, "epoch": 636} {"train_loss": -5.409348487854004, "global_step": 26733, "epoch": 636} {"train_loss": -5.439722061157227, "global_step": 26734, "epoch": 636} {"train_loss": -5.43095588684082, "global_step": 26735, "epoch": 636} {"train_loss": -5.5352325439453125, "global_step": 26736, "epoch": 636} {"train_loss": -5.451042652130127, "global_step": 26737, "epoch": 636} {"train_loss": -5.380537509918213, "global_step": 26738, "epoch": 636} {"train_loss": -5.415809154510498, "global_step": 26739, "epoch": 636} {"train_loss": -5.544126510620117, "global_step": 26740, "epoch": 636} {"train_loss": -5.412785530090332, "global_step": 26741, "epoch": 636} {"train_loss": -5.514591693878174, "global_step": 26742, "epoch": 636} {"train_loss": -5.306934356689453, "global_step": 26743, "epoch": 636} {"train_loss": -5.3622307777404785, "global_step": 26744, "epoch": 636} {"train_loss": -5.5280022621154785, "global_step": 26745, "epoch": 636} {"train_loss": -5.4529924392700195, "global_step": 26746, "epoch": 636} {"train_loss": -5.373935699462891, "global_step": 26747, "epoch": 636} {"train_loss": -5.4183349609375, "global_step": 26748, "epoch": 636} {"train_loss": -5.371659278869629, "global_step": 26749, "epoch": 636} {"train_loss": -5.398584365844727, "global_step": 26750, "epoch": 636} {"train_loss": -5.4121575355529785, "global_step": 26751, "epoch": 636} {"train_loss": -5.510588645935059, "global_step": 26752, "epoch": 636} {"train_loss": -5.435746476763771, "global_step": 26753, "epoch": 636, "val_loss": 64757.54296875} {"train_loss": -5.370258808135986, "global_step": 26754, "epoch": 637} {"train_loss": -5.414222717285156, "global_step": 26755, "epoch": 637} {"train_loss": -5.403807163238525, "global_step": 26756, "epoch": 637} {"train_loss": -5.384942054748535, "global_step": 26757, "epoch": 637} {"train_loss": -5.530757427215576, "global_step": 26758, "epoch": 637} {"train_loss": -5.386193752288818, "global_step": 26759, "epoch": 637} {"train_loss": -5.379697322845459, "global_step": 26760, "epoch": 637} {"train_loss": -5.402769088745117, "global_step": 26761, "epoch": 637} {"train_loss": -5.367463111877441, "global_step": 26762, "epoch": 637} {"train_loss": -5.3812150955200195, "global_step": 26763, "epoch": 637} {"train_loss": -5.466093063354492, "global_step": 26764, "epoch": 637} {"train_loss": -5.575041770935059, "global_step": 26765, "epoch": 637} {"train_loss": -5.5109477043151855, "global_step": 26766, "epoch": 637} {"train_loss": -5.489799499511719, "global_step": 26767, "epoch": 637} {"train_loss": -5.392729759216309, "global_step": 26768, "epoch": 637} {"train_loss": -5.417559623718262, "global_step": 26769, "epoch": 637} {"train_loss": -5.379965305328369, "global_step": 26770, "epoch": 637} {"train_loss": -5.446332931518555, "global_step": 26771, "epoch": 637} {"train_loss": -5.36708927154541, "global_step": 26772, "epoch": 637} {"train_loss": -5.447997093200684, "global_step": 26773, "epoch": 637} {"train_loss": -5.494743347167969, "global_step": 26774, "epoch": 637} {"train_loss": -5.39803409576416, "global_step": 26775, "epoch": 637} {"train_loss": -5.366770267486572, "global_step": 26776, "epoch": 637} {"train_loss": -5.208168983459473, "global_step": 26777, "epoch": 637} {"train_loss": -5.415216445922852, "global_step": 26778, "epoch": 637} {"train_loss": -5.311153411865234, "global_step": 26779, "epoch": 637} {"train_loss": -5.378724098205566, "global_step": 26780, "epoch": 637} {"train_loss": -5.442765235900879, "global_step": 26781, "epoch": 637} {"train_loss": -5.430074214935303, "global_step": 26782, "epoch": 637} {"train_loss": -5.34617805480957, "global_step": 26783, "epoch": 637} {"train_loss": -5.319087982177734, "global_step": 26784, "epoch": 637} {"train_loss": -5.374137878417969, "global_step": 26785, "epoch": 637} {"train_loss": -5.49003791809082, "global_step": 26786, "epoch": 637} {"train_loss": -5.433743953704834, "global_step": 26787, "epoch": 637} {"train_loss": -5.494542121887207, "global_step": 26788, "epoch": 637} {"train_loss": -5.316580772399902, "global_step": 26789, "epoch": 637} {"train_loss": -5.426944732666016, "global_step": 26790, "epoch": 637} {"train_loss": -5.5298662185668945, "global_step": 26791, "epoch": 637} {"train_loss": -5.363470077514648, "global_step": 26792, "epoch": 637} {"train_loss": -5.408127307891846, "global_step": 26793, "epoch": 637} {"train_loss": -5.499189853668213, "global_step": 26794, "epoch": 637} {"train_loss": -5.412221238726661, "global_step": 26795, "epoch": 637, "val_loss": 64507.20703125} {"train_loss": -5.388652801513672, "global_step": 26796, "epoch": 638} {"train_loss": -5.404486656188965, "global_step": 26797, "epoch": 638} {"train_loss": -5.433293342590332, "global_step": 26798, "epoch": 638} {"train_loss": -5.425586700439453, "global_step": 26799, "epoch": 638} {"train_loss": -5.448563098907471, "global_step": 26800, "epoch": 638} {"train_loss": -5.361427307128906, "global_step": 26801, "epoch": 638} {"train_loss": -5.370645523071289, "global_step": 26802, "epoch": 638} {"train_loss": -5.501055717468262, "global_step": 26803, "epoch": 638} {"train_loss": -5.3773274421691895, "global_step": 26804, "epoch": 638} {"train_loss": -5.3390374183654785, "global_step": 26805, "epoch": 638} {"train_loss": -5.437426567077637, "global_step": 26806, "epoch": 638} {"train_loss": -5.307596206665039, "global_step": 26807, "epoch": 638} {"train_loss": -5.411308288574219, "global_step": 26808, "epoch": 638} {"train_loss": -5.469635009765625, "global_step": 26809, "epoch": 638} {"train_loss": -5.428758144378662, "global_step": 26810, "epoch": 638} {"train_loss": -5.480086326599121, "global_step": 26811, "epoch": 638} {"train_loss": -5.443876266479492, "global_step": 26812, "epoch": 638} {"train_loss": -5.509152412414551, "global_step": 26813, "epoch": 638} {"train_loss": -5.392975807189941, "global_step": 26814, "epoch": 638} {"train_loss": -5.315996170043945, "global_step": 26815, "epoch": 638} {"train_loss": -5.353463172912598, "global_step": 26816, "epoch": 638} {"train_loss": -5.341522216796875, "global_step": 26817, "epoch": 638} {"train_loss": -5.407919883728027, "global_step": 26818, "epoch": 638} {"train_loss": -5.420819282531738, "global_step": 26819, "epoch": 638} {"train_loss": -5.396300315856934, "global_step": 26820, "epoch": 638} {"train_loss": -5.398014068603516, "global_step": 26821, "epoch": 638} {"train_loss": -5.374228477478027, "global_step": 26822, "epoch": 638} {"train_loss": -5.310885906219482, "global_step": 26823, "epoch": 638} {"train_loss": -5.461713790893555, "global_step": 26824, "epoch": 638} {"train_loss": -5.431903839111328, "global_step": 26825, "epoch": 638} {"train_loss": -5.26255989074707, "global_step": 26826, "epoch": 638} {"train_loss": -5.469574928283691, "global_step": 26827, "epoch": 638} {"train_loss": -5.258308410644531, "global_step": 26828, "epoch": 638} {"train_loss": -5.473847389221191, "global_step": 26829, "epoch": 638} {"train_loss": -5.291205406188965, "global_step": 26830, "epoch": 638} {"train_loss": -5.383841037750244, "global_step": 26831, "epoch": 638} {"train_loss": -5.443162441253662, "global_step": 26832, "epoch": 638} {"train_loss": -5.4782490730285645, "global_step": 26833, "epoch": 638} {"train_loss": -5.437252044677734, "global_step": 26834, "epoch": 638} {"train_loss": -5.261186122894287, "global_step": 26835, "epoch": 638} {"train_loss": -5.382193565368652, "global_step": 26836, "epoch": 638} {"train_loss": -5.398008619035993, "global_step": 26837, "epoch": 638, "val_loss": 64320.83984375} {"train_loss": -5.3489837646484375, "global_step": 26838, "epoch": 639} {"train_loss": -5.425248622894287, "global_step": 26839, "epoch": 639} {"train_loss": -5.3655686378479, "global_step": 26840, "epoch": 639} {"train_loss": -5.545497417449951, "global_step": 26841, "epoch": 639} {"train_loss": -5.3991475105285645, "global_step": 26842, "epoch": 639} {"train_loss": -5.27899694442749, "global_step": 26843, "epoch": 639} {"train_loss": -5.4104509353637695, "global_step": 26844, "epoch": 639} {"train_loss": -5.290739059448242, "global_step": 26845, "epoch": 639} {"train_loss": -5.554591178894043, "global_step": 26846, "epoch": 639} {"train_loss": -5.281210899353027, "global_step": 26847, "epoch": 639} {"train_loss": -5.37790584564209, "global_step": 26848, "epoch": 639} {"train_loss": -5.418922424316406, "global_step": 26849, "epoch": 639} {"train_loss": -5.255007743835449, "global_step": 26850, "epoch": 639} {"train_loss": -5.280273914337158, "global_step": 26851, "epoch": 639} {"train_loss": -5.484640121459961, "global_step": 26852, "epoch": 639} {"train_loss": -5.115218162536621, "global_step": 26853, "epoch": 639} {"train_loss": -5.51820182800293, "global_step": 26854, "epoch": 639} {"train_loss": -5.469917297363281, "global_step": 26855, "epoch": 639} {"train_loss": -5.376267910003662, "global_step": 26856, "epoch": 639} {"train_loss": -5.417295932769775, "global_step": 26857, "epoch": 639} {"train_loss": -5.3271002769470215, "global_step": 26858, "epoch": 639} {"train_loss": -5.32684326171875, "global_step": 26859, "epoch": 639} {"train_loss": -5.329423904418945, "global_step": 26860, "epoch": 639} {"train_loss": -5.254636764526367, "global_step": 26861, "epoch": 639} {"train_loss": -5.238577842712402, "global_step": 26862, "epoch": 639} {"train_loss": -5.387054443359375, "global_step": 26863, "epoch": 639} {"train_loss": -5.329061508178711, "global_step": 26864, "epoch": 639} {"train_loss": -5.182601451873779, "global_step": 26865, "epoch": 639} {"train_loss": -5.416638374328613, "global_step": 26866, "epoch": 639} {"train_loss": -5.294959545135498, "global_step": 26867, "epoch": 639} {"train_loss": -5.270916938781738, "global_step": 26868, "epoch": 639} {"train_loss": -5.227804660797119, "global_step": 26869, "epoch": 639} {"train_loss": -5.434966087341309, "global_step": 26870, "epoch": 639} {"train_loss": -5.161239147186279, "global_step": 26871, "epoch": 639} {"train_loss": -5.499402046203613, "global_step": 26872, "epoch": 639} {"train_loss": -5.320725440979004, "global_step": 26873, "epoch": 639} {"train_loss": -5.414355278015137, "global_step": 26874, "epoch": 639} {"train_loss": -5.363349914550781, "global_step": 26875, "epoch": 639} {"train_loss": -5.329771995544434, "global_step": 26876, "epoch": 639} {"train_loss": -5.283782005310059, "global_step": 26877, "epoch": 639} {"train_loss": -5.346534729003906, "global_step": 26878, "epoch": 639} {"train_loss": -5.348431780224755, "global_step": 26879, "epoch": 639, "val_loss": 64745.9921875} {"train_loss": -5.336138725280762, "global_step": 26880, "epoch": 640} {"train_loss": -5.433460712432861, "global_step": 26881, "epoch": 640} {"train_loss": -5.4259114265441895, "global_step": 26882, "epoch": 640} {"train_loss": -5.463435649871826, "global_step": 26883, "epoch": 640} {"train_loss": -5.3853912353515625, "global_step": 26884, "epoch": 640} {"train_loss": -5.46225118637085, "global_step": 26885, "epoch": 640} {"train_loss": -5.482893943786621, "global_step": 26886, "epoch": 640} {"train_loss": -5.342198371887207, "global_step": 26887, "epoch": 640} {"train_loss": -5.3497314453125, "global_step": 26888, "epoch": 640} {"train_loss": -5.448373317718506, "global_step": 26889, "epoch": 640} {"train_loss": -5.46091365814209, "global_step": 26890, "epoch": 640} {"train_loss": -5.421479225158691, "global_step": 26891, "epoch": 640} {"train_loss": -5.462191104888916, "global_step": 26892, "epoch": 640} {"train_loss": -5.325356483459473, "global_step": 26893, "epoch": 640} {"train_loss": -5.417745113372803, "global_step": 26894, "epoch": 640} {"train_loss": -5.500960350036621, "global_step": 26895, "epoch": 640} {"train_loss": -5.473278045654297, "global_step": 26896, "epoch": 640} {"train_loss": -5.534836769104004, "global_step": 26897, "epoch": 640} {"train_loss": -5.413119316101074, "global_step": 26898, "epoch": 640} {"train_loss": -5.252874374389648, "global_step": 26899, "epoch": 640} {"train_loss": -5.545536994934082, "global_step": 26900, "epoch": 640} {"train_loss": -5.262587547302246, "global_step": 26901, "epoch": 640} {"train_loss": -5.27639102935791, "global_step": 26902, "epoch": 640} {"train_loss": -5.360729217529297, "global_step": 26903, "epoch": 640} {"train_loss": -5.52626895904541, "global_step": 26904, "epoch": 640} {"train_loss": -5.399928569793701, "global_step": 26905, "epoch": 640} {"train_loss": -5.433361053466797, "global_step": 26906, "epoch": 640} {"train_loss": -5.330511093139648, "global_step": 26907, "epoch": 640} {"train_loss": -5.285590171813965, "global_step": 26908, "epoch": 640} {"train_loss": -5.377814769744873, "global_step": 26909, "epoch": 640} {"train_loss": -5.386341094970703, "global_step": 26910, "epoch": 640} {"train_loss": -5.32114839553833, "global_step": 26911, "epoch": 640} {"train_loss": -5.305372714996338, "global_step": 26912, "epoch": 640} {"train_loss": -5.417693138122559, "global_step": 26913, "epoch": 640} {"train_loss": -5.364862442016602, "global_step": 26914, "epoch": 640} {"train_loss": -5.3232221603393555, "global_step": 26915, "epoch": 640} {"train_loss": -5.353203773498535, "global_step": 26916, "epoch": 640} {"train_loss": -5.5508012771606445, "global_step": 26917, "epoch": 640} {"train_loss": -5.422581672668457, "global_step": 26918, "epoch": 640} {"train_loss": -5.297848224639893, "global_step": 26919, "epoch": 640} {"train_loss": -5.329940319061279, "global_step": 26920, "epoch": 640} {"train_loss": -5.3941356000446135, "global_step": 26921, "epoch": 640, "val_loss": 64537.62109375} {"train_loss": -5.506971836090088, "global_step": 26922, "epoch": 641} {"train_loss": -5.491436004638672, "global_step": 26923, "epoch": 641} {"train_loss": -5.299417972564697, "global_step": 26924, "epoch": 641} {"train_loss": -5.390516757965088, "global_step": 26925, "epoch": 641} {"train_loss": -5.381682395935059, "global_step": 26926, "epoch": 641} {"train_loss": -5.361172676086426, "global_step": 26927, "epoch": 641} {"train_loss": -5.519407272338867, "global_step": 26928, "epoch": 641} {"train_loss": -5.353328704833984, "global_step": 26929, "epoch": 641} {"train_loss": -5.376840114593506, "global_step": 26930, "epoch": 641} {"train_loss": -5.580176830291748, "global_step": 26931, "epoch": 641} {"train_loss": -5.360102653503418, "global_step": 26932, "epoch": 641} {"train_loss": -5.43215274810791, "global_step": 26933, "epoch": 641} {"train_loss": -5.506508827209473, "global_step": 26934, "epoch": 641} {"train_loss": -5.4537458419799805, "global_step": 26935, "epoch": 641} {"train_loss": -5.437572479248047, "global_step": 26936, "epoch": 641} {"train_loss": -5.292735576629639, "global_step": 26937, "epoch": 641} {"train_loss": -5.45377254486084, "global_step": 26938, "epoch": 641} {"train_loss": -5.362293243408203, "global_step": 26939, "epoch": 641} {"train_loss": -5.347842216491699, "global_step": 26940, "epoch": 641} {"train_loss": -5.47330379486084, "global_step": 26941, "epoch": 641} {"train_loss": -5.354846477508545, "global_step": 26942, "epoch": 641} {"train_loss": -5.474924087524414, "global_step": 26943, "epoch": 641} {"train_loss": -5.407156467437744, "global_step": 26944, "epoch": 641} {"train_loss": -5.428328514099121, "global_step": 26945, "epoch": 641} {"train_loss": -5.334729194641113, "global_step": 26946, "epoch": 641} {"train_loss": -5.452972888946533, "global_step": 26947, "epoch": 641} {"train_loss": -5.404705047607422, "global_step": 26948, "epoch": 641} {"train_loss": -5.514988899230957, "global_step": 26949, "epoch": 641} {"train_loss": -5.337521553039551, "global_step": 26950, "epoch": 641} {"train_loss": -5.403724193572998, "global_step": 26951, "epoch": 641} {"train_loss": -5.391075611114502, "global_step": 26952, "epoch": 641} {"train_loss": -5.424413681030273, "global_step": 26953, "epoch": 641} {"train_loss": -5.385952949523926, "global_step": 26954, "epoch": 641} {"train_loss": -5.350344657897949, "global_step": 26955, "epoch": 641} {"train_loss": -5.286951541900635, "global_step": 26956, "epoch": 641} {"train_loss": -5.444461822509766, "global_step": 26957, "epoch": 641} {"train_loss": -5.349216938018799, "global_step": 26958, "epoch": 641} {"train_loss": -5.232964992523193, "global_step": 26959, "epoch": 641} {"train_loss": -5.293877601623535, "global_step": 26960, "epoch": 641} {"train_loss": -5.388432502746582, "global_step": 26961, "epoch": 641} {"train_loss": -5.215794563293457, "global_step": 26962, "epoch": 641} {"train_loss": -5.398546173459008, "global_step": 26963, "epoch": 641, "val_loss": 65505.0859375} {"train_loss": -5.246070861816406, "global_step": 26964, "epoch": 642} {"train_loss": -5.2350640296936035, "global_step": 26965, "epoch": 642} {"train_loss": -5.479292869567871, "global_step": 26966, "epoch": 642} {"train_loss": -5.188936233520508, "global_step": 26967, "epoch": 642} {"train_loss": -5.248266220092773, "global_step": 26968, "epoch": 642} {"train_loss": -5.306509971618652, "global_step": 26969, "epoch": 642} {"train_loss": -5.28571891784668, "global_step": 26970, "epoch": 642} {"train_loss": -5.284534454345703, "global_step": 26971, "epoch": 642} {"train_loss": -5.352799415588379, "global_step": 26972, "epoch": 642} {"train_loss": -5.284518241882324, "global_step": 26973, "epoch": 642} {"train_loss": -5.359375, "global_step": 26974, "epoch": 642} {"train_loss": -5.426728248596191, "global_step": 26975, "epoch": 642} {"train_loss": -5.350813865661621, "global_step": 26976, "epoch": 642} {"train_loss": -5.359090805053711, "global_step": 26977, "epoch": 642} {"train_loss": -5.500735759735107, "global_step": 26978, "epoch": 642} {"train_loss": -5.468462944030762, "global_step": 26979, "epoch": 642} {"train_loss": -5.3287248611450195, "global_step": 26980, "epoch": 642} {"train_loss": -5.4104509353637695, "global_step": 26981, "epoch": 642} {"train_loss": -5.526881217956543, "global_step": 26982, "epoch": 642} {"train_loss": -5.330992698669434, "global_step": 26983, "epoch": 642} {"train_loss": -5.459291458129883, "global_step": 26984, "epoch": 642} {"train_loss": -5.505536079406738, "global_step": 26985, "epoch": 642} {"train_loss": -5.30957555770874, "global_step": 26986, "epoch": 642} {"train_loss": -5.400634288787842, "global_step": 26987, "epoch": 642} {"train_loss": -5.336550712585449, "global_step": 26988, "epoch": 642} {"train_loss": -5.346383571624756, "global_step": 26989, "epoch": 642} {"train_loss": -5.3714447021484375, "global_step": 26990, "epoch": 642} {"train_loss": -5.3431901931762695, "global_step": 26991, "epoch": 642} {"train_loss": -5.400415420532227, "global_step": 26992, "epoch": 642} {"train_loss": -5.284255027770996, "global_step": 26993, "epoch": 642} {"train_loss": -5.290374279022217, "global_step": 26994, "epoch": 642} {"train_loss": -5.435851097106934, "global_step": 26995, "epoch": 642} {"train_loss": -5.213691234588623, "global_step": 26996, "epoch": 642} {"train_loss": -5.397677421569824, "global_step": 26997, "epoch": 642} {"train_loss": -5.405369758605957, "global_step": 26998, "epoch": 642} {"train_loss": -5.34190034866333, "global_step": 26999, "epoch": 642} {"train_loss": -5.385533332824707, "global_step": 27000, "epoch": 642} {"train_loss": -5.405641555786133, "global_step": 27001, "epoch": 642} {"train_loss": -5.623055458068848, "global_step": 27002, "epoch": 642} {"train_loss": -5.320505619049072, "global_step": 27003, "epoch": 642} {"train_loss": -5.434481143951416, "global_step": 27004, "epoch": 642} {"train_loss": -5.366284676960537, "global_step": 27005, "epoch": 642, "val_loss": 64532.95703125} {"train_loss": -5.292820930480957, "global_step": 27006, "epoch": 643} {"train_loss": -5.302084922790527, "global_step": 27007, "epoch": 643} {"train_loss": -5.386768341064453, "global_step": 27008, "epoch": 643} {"train_loss": -5.469079971313477, "global_step": 27009, "epoch": 643} {"train_loss": -5.3587446212768555, "global_step": 27010, "epoch": 643} {"train_loss": -5.4641008377075195, "global_step": 27011, "epoch": 643} {"train_loss": -5.403357028961182, "global_step": 27012, "epoch": 643} {"train_loss": -5.462172031402588, "global_step": 27013, "epoch": 643} {"train_loss": -5.286645889282227, "global_step": 27014, "epoch": 643} {"train_loss": -5.408426284790039, "global_step": 27015, "epoch": 643} {"train_loss": -5.455624580383301, "global_step": 27016, "epoch": 643} {"train_loss": -5.372048377990723, "global_step": 27017, "epoch": 643} {"train_loss": -5.348025321960449, "global_step": 27018, "epoch": 643} {"train_loss": -5.410035133361816, "global_step": 27019, "epoch": 643} {"train_loss": -5.360474586486816, "global_step": 27020, "epoch": 643} {"train_loss": -5.390506267547607, "global_step": 27021, "epoch": 643} {"train_loss": -5.417623519897461, "global_step": 27022, "epoch": 643} {"train_loss": -5.407411575317383, "global_step": 27023, "epoch": 643} {"train_loss": -5.423598766326904, "global_step": 27024, "epoch": 643} {"train_loss": -5.487483501434326, "global_step": 27025, "epoch": 643} {"train_loss": -5.551599979400635, "global_step": 27026, "epoch": 643} {"train_loss": -5.568032264709473, "global_step": 27027, "epoch": 643} {"train_loss": -5.416591644287109, "global_step": 27028, "epoch": 643} {"train_loss": -5.471231460571289, "global_step": 27029, "epoch": 643} {"train_loss": -5.458990097045898, "global_step": 27030, "epoch": 643} {"train_loss": -5.457592010498047, "global_step": 27031, "epoch": 643} {"train_loss": -5.426477432250977, "global_step": 27032, "epoch": 643} {"train_loss": -5.448214530944824, "global_step": 27033, "epoch": 643} {"train_loss": -5.427947998046875, "global_step": 27034, "epoch": 643} {"train_loss": -5.481776237487793, "global_step": 27035, "epoch": 643} {"train_loss": -5.522086143493652, "global_step": 27036, "epoch": 643} {"train_loss": -5.48716926574707, "global_step": 27037, "epoch": 643} {"train_loss": -5.245976448059082, "global_step": 27038, "epoch": 643} {"train_loss": -5.513571739196777, "global_step": 27039, "epoch": 643} {"train_loss": -5.408201217651367, "global_step": 27040, "epoch": 643} {"train_loss": -5.372483253479004, "global_step": 27041, "epoch": 643} {"train_loss": -5.458832740783691, "global_step": 27042, "epoch": 643} {"train_loss": -5.139032363891602, "global_step": 27043, "epoch": 643} {"train_loss": -5.3950347900390625, "global_step": 27044, "epoch": 643} {"train_loss": -5.355384826660156, "global_step": 27045, "epoch": 643} {"train_loss": -5.34902811050415, "global_step": 27046, "epoch": 643} {"train_loss": -5.41243330637614, "global_step": 27047, "epoch": 643, "val_loss": 64446.62109375} {"train_loss": -5.424959182739258, "global_step": 27048, "epoch": 644} {"train_loss": -5.374194145202637, "global_step": 27049, "epoch": 644} {"train_loss": -5.523874282836914, "global_step": 27050, "epoch": 644} {"train_loss": -5.303592681884766, "global_step": 27051, "epoch": 644} {"train_loss": -5.389978408813477, "global_step": 27052, "epoch": 644} {"train_loss": -5.34121561050415, "global_step": 27053, "epoch": 644} {"train_loss": -5.425940990447998, "global_step": 27054, "epoch": 644} {"train_loss": -5.3820695877075195, "global_step": 27055, "epoch": 644} {"train_loss": -5.389239311218262, "global_step": 27056, "epoch": 644} {"train_loss": -5.476726055145264, "global_step": 27057, "epoch": 644} {"train_loss": -5.480212211608887, "global_step": 27058, "epoch": 644} {"train_loss": -5.429877758026123, "global_step": 27059, "epoch": 644} {"train_loss": -5.4054155349731445, "global_step": 27060, "epoch": 644} {"train_loss": -5.433325290679932, "global_step": 27061, "epoch": 644} {"train_loss": -5.389639854431152, "global_step": 27062, "epoch": 644} {"train_loss": -5.504018783569336, "global_step": 27063, "epoch": 644} {"train_loss": -5.446398735046387, "global_step": 27064, "epoch": 644} {"train_loss": -5.513720512390137, "global_step": 27065, "epoch": 644} {"train_loss": -5.440251350402832, "global_step": 27066, "epoch": 644} {"train_loss": -5.226577281951904, "global_step": 27067, "epoch": 644} {"train_loss": -5.419291973114014, "global_step": 27068, "epoch": 644} {"train_loss": -5.5099897384643555, "global_step": 27069, "epoch": 644} {"train_loss": -5.446010112762451, "global_step": 27070, "epoch": 644} {"train_loss": -5.394486427307129, "global_step": 27071, "epoch": 644} {"train_loss": -5.435672283172607, "global_step": 27072, "epoch": 644} {"train_loss": -5.3699750900268555, "global_step": 27073, "epoch": 644} {"train_loss": -5.346912384033203, "global_step": 27074, "epoch": 644} {"train_loss": -5.408596515655518, "global_step": 27075, "epoch": 644} {"train_loss": -5.447261333465576, "global_step": 27076, "epoch": 644} {"train_loss": -5.36386251449585, "global_step": 27077, "epoch": 644} {"train_loss": -5.390614032745361, "global_step": 27078, "epoch": 644} {"train_loss": -5.3055806159973145, "global_step": 27079, "epoch": 644} {"train_loss": -5.366350173950195, "global_step": 27080, "epoch": 644} {"train_loss": -5.457718849182129, "global_step": 27081, "epoch": 644} {"train_loss": -5.304393768310547, "global_step": 27082, "epoch": 644} {"train_loss": -5.322293281555176, "global_step": 27083, "epoch": 644} {"train_loss": -5.342201232910156, "global_step": 27084, "epoch": 644} {"train_loss": -5.513119697570801, "global_step": 27085, "epoch": 644} {"train_loss": -5.484666347503662, "global_step": 27086, "epoch": 644} {"train_loss": -5.462135314941406, "global_step": 27087, "epoch": 644} {"train_loss": -5.446131229400635, "global_step": 27088, "epoch": 644} {"train_loss": -5.41245759101141, "global_step": 27089, "epoch": 644, "val_loss": 64462.58984375} {"train_loss": -5.385695457458496, "global_step": 27090, "epoch": 645} {"train_loss": -5.438733100891113, "global_step": 27091, "epoch": 645} {"train_loss": -5.481447219848633, "global_step": 27092, "epoch": 645} {"train_loss": -5.410463809967041, "global_step": 27093, "epoch": 645} {"train_loss": -5.3892035484313965, "global_step": 27094, "epoch": 645} {"train_loss": -5.431593894958496, "global_step": 27095, "epoch": 645} {"train_loss": -5.422936916351318, "global_step": 27096, "epoch": 645} {"train_loss": -5.317424774169922, "global_step": 27097, "epoch": 645} {"train_loss": -5.278008460998535, "global_step": 27098, "epoch": 645} {"train_loss": -5.4386396408081055, "global_step": 27099, "epoch": 645} {"train_loss": -5.423196792602539, "global_step": 27100, "epoch": 645} {"train_loss": -5.525477409362793, "global_step": 27101, "epoch": 645} {"train_loss": -5.453173637390137, "global_step": 27102, "epoch": 645} {"train_loss": -5.4264397621154785, "global_step": 27103, "epoch": 645} {"train_loss": -5.384430408477783, "global_step": 27104, "epoch": 645} {"train_loss": -5.423275947570801, "global_step": 27105, "epoch": 645} {"train_loss": -5.532229900360107, "global_step": 27106, "epoch": 645} {"train_loss": -5.405697345733643, "global_step": 27107, "epoch": 645} {"train_loss": -5.429259300231934, "global_step": 27108, "epoch": 645} {"train_loss": -5.4600725173950195, "global_step": 27109, "epoch": 645} {"train_loss": -5.5275373458862305, "global_step": 27110, "epoch": 645} {"train_loss": -5.3321075439453125, "global_step": 27111, "epoch": 645} {"train_loss": -5.417404651641846, "global_step": 27112, "epoch": 645} {"train_loss": -5.470882415771484, "global_step": 27113, "epoch": 645} {"train_loss": -5.454246520996094, "global_step": 27114, "epoch": 645} {"train_loss": -5.400460243225098, "global_step": 27115, "epoch": 645} {"train_loss": -5.402271270751953, "global_step": 27116, "epoch": 645} {"train_loss": -5.362236976623535, "global_step": 27117, "epoch": 645} {"train_loss": -5.327150344848633, "global_step": 27118, "epoch": 645} {"train_loss": -5.452483177185059, "global_step": 27119, "epoch": 645} {"train_loss": -5.357464790344238, "global_step": 27120, "epoch": 645} {"train_loss": -5.432484149932861, "global_step": 27121, "epoch": 645} {"train_loss": -5.425689697265625, "global_step": 27122, "epoch": 645} {"train_loss": -5.469485282897949, "global_step": 27123, "epoch": 645} {"train_loss": -5.480197906494141, "global_step": 27124, "epoch": 645} {"train_loss": -5.441685676574707, "global_step": 27125, "epoch": 645} {"train_loss": -5.322673320770264, "global_step": 27126, "epoch": 645} {"train_loss": -5.376255512237549, "global_step": 27127, "epoch": 645} {"train_loss": -5.430559158325195, "global_step": 27128, "epoch": 645} {"train_loss": -5.4207763671875, "global_step": 27129, "epoch": 645} {"train_loss": -5.378649711608887, "global_step": 27130, "epoch": 645} {"train_loss": -5.41537340482076, "global_step": 27131, "epoch": 645, "val_loss": 64028.84765625} {"train_loss": -5.424252510070801, "global_step": 27132, "epoch": 646} {"train_loss": -5.51999568939209, "global_step": 27133, "epoch": 646} {"train_loss": -5.346566200256348, "global_step": 27134, "epoch": 646} {"train_loss": -5.407736301422119, "global_step": 27135, "epoch": 646} {"train_loss": -5.438330173492432, "global_step": 27136, "epoch": 646} {"train_loss": -5.335536003112793, "global_step": 27137, "epoch": 646} {"train_loss": -5.472836017608643, "global_step": 27138, "epoch": 646} {"train_loss": -5.435632705688477, "global_step": 27139, "epoch": 646} {"train_loss": -5.362083435058594, "global_step": 27140, "epoch": 646} {"train_loss": -5.50531530380249, "global_step": 27141, "epoch": 646} {"train_loss": -5.521862506866455, "global_step": 27142, "epoch": 646} {"train_loss": -5.4609222412109375, "global_step": 27143, "epoch": 646} {"train_loss": -5.470208168029785, "global_step": 27144, "epoch": 646} {"train_loss": -5.490992546081543, "global_step": 27145, "epoch": 646} {"train_loss": -5.390450477600098, "global_step": 27146, "epoch": 646} {"train_loss": -5.513154983520508, "global_step": 27147, "epoch": 646} {"train_loss": -5.297480583190918, "global_step": 27148, "epoch": 646} {"train_loss": -5.4729905128479, "global_step": 27149, "epoch": 646} {"train_loss": -5.438661575317383, "global_step": 27150, "epoch": 646} {"train_loss": -5.3802714347839355, "global_step": 27151, "epoch": 646} {"train_loss": -5.406564712524414, "global_step": 27152, "epoch": 646} {"train_loss": -5.37865686416626, "global_step": 27153, "epoch": 646} {"train_loss": -5.370797157287598, "global_step": 27154, "epoch": 646} {"train_loss": -5.346122741699219, "global_step": 27155, "epoch": 646} {"train_loss": -5.259462356567383, "global_step": 27156, "epoch": 646} {"train_loss": -5.385458946228027, "global_step": 27157, "epoch": 646} {"train_loss": -5.346090316772461, "global_step": 27158, "epoch": 646} {"train_loss": -5.541918754577637, "global_step": 27159, "epoch": 646} {"train_loss": -5.353476524353027, "global_step": 27160, "epoch": 646} {"train_loss": -5.483100891113281, "global_step": 27161, "epoch": 646} {"train_loss": -5.473414421081543, "global_step": 27162, "epoch": 646} {"train_loss": -5.3304009437561035, "global_step": 27163, "epoch": 646} {"train_loss": -5.332358360290527, "global_step": 27164, "epoch": 646} {"train_loss": -5.392061710357666, "global_step": 27165, "epoch": 646} {"train_loss": -5.220093250274658, "global_step": 27166, "epoch": 646} {"train_loss": -5.394763946533203, "global_step": 27167, "epoch": 646} {"train_loss": -5.341337203979492, "global_step": 27168, "epoch": 646} {"train_loss": -5.318811893463135, "global_step": 27169, "epoch": 646} {"train_loss": -5.469937801361084, "global_step": 27170, "epoch": 646} {"train_loss": -5.385417938232422, "global_step": 27171, "epoch": 646} {"train_loss": -5.4446516036987305, "global_step": 27172, "epoch": 646} {"train_loss": -5.40452097711109, "global_step": 27173, "epoch": 646, "val_loss": 64073.52734375} {"train_loss": -5.521724700927734, "global_step": 27174, "epoch": 647} {"train_loss": -5.354247093200684, "global_step": 27175, "epoch": 647} {"train_loss": -5.428271770477295, "global_step": 27176, "epoch": 647} {"train_loss": -5.5013604164123535, "global_step": 27177, "epoch": 647} {"train_loss": -5.421048164367676, "global_step": 27178, "epoch": 647} {"train_loss": -5.361649036407471, "global_step": 27179, "epoch": 647} {"train_loss": -5.491898536682129, "global_step": 27180, "epoch": 647} {"train_loss": -5.3531293869018555, "global_step": 27181, "epoch": 647} {"train_loss": -5.451957702636719, "global_step": 27182, "epoch": 647} {"train_loss": -5.397034168243408, "global_step": 27183, "epoch": 647} {"train_loss": -5.384981155395508, "global_step": 27184, "epoch": 647} {"train_loss": -5.4296135902404785, "global_step": 27185, "epoch": 647} {"train_loss": -5.310516834259033, "global_step": 27186, "epoch": 647} {"train_loss": -5.475095748901367, "global_step": 27187, "epoch": 647} {"train_loss": -5.401952743530273, "global_step": 27188, "epoch": 647} {"train_loss": -5.446345806121826, "global_step": 27189, "epoch": 647} {"train_loss": -5.3081889152526855, "global_step": 27190, "epoch": 647} {"train_loss": -5.493695259094238, "global_step": 27191, "epoch": 647} {"train_loss": -5.365914821624756, "global_step": 27192, "epoch": 647} {"train_loss": -5.415946960449219, "global_step": 27193, "epoch": 647} {"train_loss": -5.4630022048950195, "global_step": 27194, "epoch": 647} {"train_loss": -5.496814727783203, "global_step": 27195, "epoch": 647} {"train_loss": -5.415258407592773, "global_step": 27196, "epoch": 647} {"train_loss": -5.387617111206055, "global_step": 27197, "epoch": 647} {"train_loss": -5.343514442443848, "global_step": 27198, "epoch": 647} {"train_loss": -5.397529125213623, "global_step": 27199, "epoch": 647} {"train_loss": -5.392487049102783, "global_step": 27200, "epoch": 647} {"train_loss": -5.337469577789307, "global_step": 27201, "epoch": 647} {"train_loss": -5.474225044250488, "global_step": 27202, "epoch": 647} {"train_loss": -5.492297649383545, "global_step": 27203, "epoch": 647} {"train_loss": -5.3360676765441895, "global_step": 27204, "epoch": 647} {"train_loss": -5.2971601486206055, "global_step": 27205, "epoch": 647} {"train_loss": -5.405066967010498, "global_step": 27206, "epoch": 647} {"train_loss": -5.529723167419434, "global_step": 27207, "epoch": 647} {"train_loss": -5.234776496887207, "global_step": 27208, "epoch": 647} {"train_loss": -5.451906681060791, "global_step": 27209, "epoch": 647} {"train_loss": -5.347747325897217, "global_step": 27210, "epoch": 647} {"train_loss": -5.517664432525635, "global_step": 27211, "epoch": 647} {"train_loss": -5.461241722106934, "global_step": 27212, "epoch": 647} {"train_loss": -5.442882061004639, "global_step": 27213, "epoch": 647} {"train_loss": -5.469422340393066, "global_step": 27214, "epoch": 647} {"train_loss": -5.415646598452613, "global_step": 27215, "epoch": 647, "val_loss": 64323.5078125} {"train_loss": -5.503060340881348, "global_step": 27216, "epoch": 648} {"train_loss": -5.49090576171875, "global_step": 27217, "epoch": 648} {"train_loss": -5.420848369598389, "global_step": 27218, "epoch": 648} {"train_loss": -5.359021186828613, "global_step": 27219, "epoch": 648} {"train_loss": -5.416081428527832, "global_step": 27220, "epoch": 648} {"train_loss": -5.595132827758789, "global_step": 27221, "epoch": 648} {"train_loss": -5.319484710693359, "global_step": 27222, "epoch": 648} {"train_loss": -5.475245475769043, "global_step": 27223, "epoch": 648} {"train_loss": -5.349750518798828, "global_step": 27224, "epoch": 648} {"train_loss": -5.380259990692139, "global_step": 27225, "epoch": 648} {"train_loss": -5.527240753173828, "global_step": 27226, "epoch": 648} {"train_loss": -5.42212438583374, "global_step": 27227, "epoch": 648} {"train_loss": -5.495611667633057, "global_step": 27228, "epoch": 648} {"train_loss": -5.465044021606445, "global_step": 27229, "epoch": 648} {"train_loss": -5.536497116088867, "global_step": 27230, "epoch": 648} {"train_loss": -5.511010646820068, "global_step": 27231, "epoch": 648} {"train_loss": -5.388556480407715, "global_step": 27232, "epoch": 648} {"train_loss": -5.508284091949463, "global_step": 27233, "epoch": 648} {"train_loss": -5.454805374145508, "global_step": 27234, "epoch": 648} {"train_loss": -5.411899089813232, "global_step": 27235, "epoch": 648} {"train_loss": -5.419749736785889, "global_step": 27236, "epoch": 648} {"train_loss": -5.398403167724609, "global_step": 27237, "epoch": 648} {"train_loss": -5.420304298400879, "global_step": 27238, "epoch": 648} {"train_loss": -5.417287826538086, "global_step": 27239, "epoch": 648} {"train_loss": -5.450658321380615, "global_step": 27240, "epoch": 648} {"train_loss": -5.451510906219482, "global_step": 27241, "epoch": 648} {"train_loss": -5.424320220947266, "global_step": 27242, "epoch": 648} {"train_loss": -5.431620121002197, "global_step": 27243, "epoch": 648} {"train_loss": -5.238313674926758, "global_step": 27244, "epoch": 648} {"train_loss": -5.412883281707764, "global_step": 27245, "epoch": 648} {"train_loss": -5.387524604797363, "global_step": 27246, "epoch": 648} {"train_loss": -5.428058624267578, "global_step": 27247, "epoch": 648} {"train_loss": -5.411708831787109, "global_step": 27248, "epoch": 648} {"train_loss": -5.390536785125732, "global_step": 27249, "epoch": 648} {"train_loss": -5.4553704261779785, "global_step": 27250, "epoch": 648} {"train_loss": -5.479798316955566, "global_step": 27251, "epoch": 648} {"train_loss": -5.508766174316406, "global_step": 27252, "epoch": 648} {"train_loss": -5.416735649108887, "global_step": 27253, "epoch": 648} {"train_loss": -5.380772590637207, "global_step": 27254, "epoch": 648} {"train_loss": -5.33112907409668, "global_step": 27255, "epoch": 648} {"train_loss": -5.510856628417969, "global_step": 27256, "epoch": 648} {"train_loss": -5.435100805191767, "global_step": 27257, "epoch": 648, "val_loss": 64396.9140625} {"train_loss": -5.379018783569336, "global_step": 27258, "epoch": 649} {"train_loss": -5.520820617675781, "global_step": 27259, "epoch": 649} {"train_loss": -5.377496719360352, "global_step": 27260, "epoch": 649} {"train_loss": -5.404356956481934, "global_step": 27261, "epoch": 649} {"train_loss": -5.4180402755737305, "global_step": 27262, "epoch": 649} {"train_loss": -5.320120811462402, "global_step": 27263, "epoch": 649} {"train_loss": -5.411591529846191, "global_step": 27264, "epoch": 649} {"train_loss": -5.4401164054870605, "global_step": 27265, "epoch": 649} {"train_loss": -5.435671806335449, "global_step": 27266, "epoch": 649} {"train_loss": -5.367252349853516, "global_step": 27267, "epoch": 649} {"train_loss": -5.484504699707031, "global_step": 27268, "epoch": 649} {"train_loss": -5.302862644195557, "global_step": 27269, "epoch": 649} {"train_loss": -5.485735893249512, "global_step": 27270, "epoch": 649} {"train_loss": -5.4421892166137695, "global_step": 27271, "epoch": 649} {"train_loss": -5.483060836791992, "global_step": 27272, "epoch": 649} {"train_loss": -5.4071526527404785, "global_step": 27273, "epoch": 649} {"train_loss": -5.445958614349365, "global_step": 27274, "epoch": 649} {"train_loss": -5.47819185256958, "global_step": 27275, "epoch": 649} {"train_loss": -5.529789924621582, "global_step": 27276, "epoch": 649} {"train_loss": -5.315910339355469, "global_step": 27277, "epoch": 649} {"train_loss": -5.4967145919799805, "global_step": 27278, "epoch": 649} {"train_loss": -5.403695583343506, "global_step": 27279, "epoch": 649} {"train_loss": -5.521130084991455, "global_step": 27280, "epoch": 649} {"train_loss": -5.456845283508301, "global_step": 27281, "epoch": 649} {"train_loss": -5.4061737060546875, "global_step": 27282, "epoch": 649} {"train_loss": -5.325338363647461, "global_step": 27283, "epoch": 649} {"train_loss": -5.565982341766357, "global_step": 27284, "epoch": 649} {"train_loss": -5.480801105499268, "global_step": 27285, "epoch": 649} {"train_loss": -5.435601234436035, "global_step": 27286, "epoch": 649} {"train_loss": -5.392140865325928, "global_step": 27287, "epoch": 649} {"train_loss": -5.48643159866333, "global_step": 27288, "epoch": 649} {"train_loss": -5.465217113494873, "global_step": 27289, "epoch": 649} {"train_loss": -5.403545379638672, "global_step": 27290, "epoch": 649} {"train_loss": -5.52632999420166, "global_step": 27291, "epoch": 649} {"train_loss": -5.455364227294922, "global_step": 27292, "epoch": 649} {"train_loss": -5.538846969604492, "global_step": 27293, "epoch": 649} {"train_loss": -5.3447771072387695, "global_step": 27294, "epoch": 649} {"train_loss": -5.425346374511719, "global_step": 27295, "epoch": 649} {"train_loss": -5.535090446472168, "global_step": 27296, "epoch": 649} {"train_loss": -5.322703838348389, "global_step": 27297, "epoch": 649} {"train_loss": -5.456838607788086, "global_step": 27298, "epoch": 649} {"train_loss": -5.43552607581729, "global_step": 27299, "epoch": 649, "val_loss": 64462.71875} {"train_loss": -5.358326435089111, "global_step": 27300, "epoch": 650} {"train_loss": -5.435535430908203, "global_step": 27301, "epoch": 650} {"train_loss": -5.438445091247559, "global_step": 27302, "epoch": 650} {"train_loss": -5.335305213928223, "global_step": 27303, "epoch": 650} {"train_loss": -5.517596244812012, "global_step": 27304, "epoch": 650} {"train_loss": -5.46104097366333, "global_step": 27305, "epoch": 650} {"train_loss": -5.435386657714844, "global_step": 27306, "epoch": 650} {"train_loss": -5.461867332458496, "global_step": 27307, "epoch": 650} {"train_loss": -5.56264591217041, "global_step": 27308, "epoch": 650} {"train_loss": -5.446239948272705, "global_step": 27309, "epoch": 650} {"train_loss": -5.437534809112549, "global_step": 27310, "epoch": 650} {"train_loss": -5.239659309387207, "global_step": 27311, "epoch": 650} {"train_loss": -5.461799144744873, "global_step": 27312, "epoch": 650} {"train_loss": -5.40848445892334, "global_step": 27313, "epoch": 650} {"train_loss": -5.363168716430664, "global_step": 27314, "epoch": 650} {"train_loss": -5.39923095703125, "global_step": 27315, "epoch": 650} {"train_loss": -5.330863952636719, "global_step": 27316, "epoch": 650} {"train_loss": -5.3211822509765625, "global_step": 27317, "epoch": 650} {"train_loss": -5.542332172393799, "global_step": 27318, "epoch": 650} {"train_loss": -5.372628688812256, "global_step": 27319, "epoch": 650} {"train_loss": -5.524505615234375, "global_step": 27320, "epoch": 650} {"train_loss": -5.406304359436035, "global_step": 27321, "epoch": 650} {"train_loss": -5.241194725036621, "global_step": 27322, "epoch": 650} {"train_loss": -5.468080043792725, "global_step": 27323, "epoch": 650} {"train_loss": -5.333045959472656, "global_step": 27324, "epoch": 650} {"train_loss": -5.407819747924805, "global_step": 27325, "epoch": 650} {"train_loss": -5.360538005828857, "global_step": 27326, "epoch": 650} {"train_loss": -5.6231865882873535, "global_step": 27327, "epoch": 650} {"train_loss": -5.51884126663208, "global_step": 27328, "epoch": 650} {"train_loss": -5.40909481048584, "global_step": 27329, "epoch": 650} {"train_loss": -5.3714599609375, "global_step": 27330, "epoch": 650} {"train_loss": -5.338973045349121, "global_step": 27331, "epoch": 650} {"train_loss": -5.465649604797363, "global_step": 27332, "epoch": 650} {"train_loss": -5.388299942016602, "global_step": 27333, "epoch": 650} {"train_loss": -5.316934108734131, "global_step": 27334, "epoch": 650} {"train_loss": -5.427681922912598, "global_step": 27335, "epoch": 650} {"train_loss": -5.424893856048584, "global_step": 27336, "epoch": 650} {"train_loss": -5.355693817138672, "global_step": 27337, "epoch": 650} {"train_loss": -5.449173927307129, "global_step": 27338, "epoch": 650} {"train_loss": -5.300197601318359, "global_step": 27339, "epoch": 650} {"train_loss": -5.391905784606934, "global_step": 27340, "epoch": 650} {"train_loss": -5.411004441125052, "global_step": 27341, "epoch": 650, "train/sim_max_reward_0": 0.19065661455283497, "train/sim_max_reward_1": 0.21343409950570252, "train/sim_max_reward_2": 0.878314705819023, "train/sim_max_reward_3": 0.13927883287754148, "train/sim_max_reward_4": 0.7238478740353048, "train/sim_max_reward_5": 0.5702769830773149, "test/sim_max_reward_4300000": 0.8248057950982214, "test/sim_max_reward_4300001": 0.4052302867857222, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.5901417888227468, "test/sim_max_reward_4300004": 0.03686095384827931, "test/sim_max_reward_4300005": 0.4195597726560397, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.04984133841500196, "test/sim_max_reward_4300008": 0.41868532214081444, "test/sim_max_reward_4300009": 0.5536080099700202, "test/sim_max_reward_4300010": 0.17825873362314268, "test/sim_max_reward_4300011": 0.3461088780969491, "test/sim_max_reward_4300012": 0.38375575147981106, "test/sim_max_reward_4300013": 0.4336696594049678, "test/sim_max_reward_4300014": 0.5627704390960542, "test/sim_max_reward_4300015": 0.22434380981056135, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.409767673178003, "test/sim_max_reward_4300018": 0.615888855898312, "test/sim_max_reward_4300019": 0.1847953758832184, "test/sim_max_reward_4300020": 0.11191576601800068, "test/sim_max_reward_4300021": 0.04121036281522732, "test/sim_max_reward_4300022": 0.07478519069348595, "test/sim_max_reward_4300023": 0.33613171648875206, "test/sim_max_reward_4300024": 0.41500805474283126, "test/sim_max_reward_4300025": 0.09051605050742449, "test/sim_max_reward_4300026": 0.05146617344268851, "test/sim_max_reward_4300027": 0.18207958318175615, "test/sim_max_reward_4300028": 0.058834814787470296, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.4372403122296674, "test/sim_max_reward_4300031": 0.10612891995760429, "test/sim_max_reward_4300032": 0.5574235576191312, "test/sim_max_reward_4300033": 0.38445867361033176, "test/sim_max_reward_4300034": 0.11821777950830155, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.6623912107939115, "test/sim_max_reward_4300038": 0.5656112066476927, "test/sim_max_reward_4300039": 0.3692226976332519, "test/sim_max_reward_4300040": 0.4256312145799289, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7232415264877333, "test/sim_max_reward_4300043": 0.1364339804899307, "test/sim_max_reward_4300044": 0.06276195934133298, "test/sim_max_reward_4300045": 0.039317777054417906, "test/sim_max_reward_4300046": 0.19858329124495888, "test/sim_max_reward_4300047": 0.13990825225435058, "test/sim_max_reward_4300048": 0.2953492483413508, "test/sim_max_reward_4300049": 0.19478615864007645, "train/mean_score": 0.4526348516446203, "test/mean_score": 0.2757995681074838, "val_loss": 64219.95703125} {"train_loss": -5.522549629211426, "global_step": 27342, "epoch": 651} {"train_loss": -5.509221076965332, "global_step": 27343, "epoch": 651} {"train_loss": -5.363663673400879, "global_step": 27344, "epoch": 651} {"train_loss": -5.414593696594238, "global_step": 27345, "epoch": 651} {"train_loss": -5.442401885986328, "global_step": 27346, "epoch": 651} {"train_loss": -5.505527496337891, "global_step": 27347, "epoch": 651} {"train_loss": -5.525751113891602, "global_step": 27348, "epoch": 651} {"train_loss": -5.452592849731445, "global_step": 27349, "epoch": 651} {"train_loss": -5.370617866516113, "global_step": 27350, "epoch": 651} {"train_loss": -5.511174201965332, "global_step": 27351, "epoch": 651} {"train_loss": -5.51671028137207, "global_step": 27352, "epoch": 651} {"train_loss": -5.326576232910156, "global_step": 27353, "epoch": 651} {"train_loss": -5.430842399597168, "global_step": 27354, "epoch": 651} {"train_loss": -5.504620552062988, "global_step": 27355, "epoch": 651} {"train_loss": -5.4235992431640625, "global_step": 27356, "epoch": 651} {"train_loss": -5.511074066162109, "global_step": 27357, "epoch": 651} {"train_loss": -5.453069686889648, "global_step": 27358, "epoch": 651} {"train_loss": -5.424210548400879, "global_step": 27359, "epoch": 651} {"train_loss": -5.4770989418029785, "global_step": 27360, "epoch": 651} {"train_loss": -5.3706254959106445, "global_step": 27361, "epoch": 651} {"train_loss": -5.415687561035156, "global_step": 27362, "epoch": 651} {"train_loss": -5.517993927001953, "global_step": 27363, "epoch": 651} {"train_loss": -5.5569658279418945, "global_step": 27364, "epoch": 651} {"train_loss": -5.548037528991699, "global_step": 27365, "epoch": 651} {"train_loss": -5.434650421142578, "global_step": 27366, "epoch": 651} {"train_loss": -5.431125164031982, "global_step": 27367, "epoch": 651} {"train_loss": -5.334591865539551, "global_step": 27368, "epoch": 651} {"train_loss": -5.503990173339844, "global_step": 27369, "epoch": 651} {"train_loss": -5.4695234298706055, "global_step": 27370, "epoch": 651} {"train_loss": -5.556339263916016, "global_step": 27371, "epoch": 651} {"train_loss": -5.3720855712890625, "global_step": 27372, "epoch": 651} {"train_loss": -5.473165035247803, "global_step": 27373, "epoch": 651} {"train_loss": -5.349061489105225, "global_step": 27374, "epoch": 651} {"train_loss": -5.452267169952393, "global_step": 27375, "epoch": 651} {"train_loss": -5.397839546203613, "global_step": 27376, "epoch": 651} {"train_loss": -5.3952836990356445, "global_step": 27377, "epoch": 651} {"train_loss": -5.404260635375977, "global_step": 27378, "epoch": 651} {"train_loss": -5.483579635620117, "global_step": 27379, "epoch": 651} {"train_loss": -5.409336090087891, "global_step": 27380, "epoch": 651} {"train_loss": -5.311491012573242, "global_step": 27381, "epoch": 651} {"train_loss": -5.36701774597168, "global_step": 27382, "epoch": 651} {"train_loss": -5.444890147163754, "global_step": 27383, "epoch": 651, "val_loss": 64030.30078125} {"train_loss": -5.414163589477539, "global_step": 27384, "epoch": 652} {"train_loss": -5.412496566772461, "global_step": 27385, "epoch": 652} {"train_loss": -5.4813313484191895, "global_step": 27386, "epoch": 652} {"train_loss": -5.309370994567871, "global_step": 27387, "epoch": 652} {"train_loss": -5.566208839416504, "global_step": 27388, "epoch": 652} {"train_loss": -5.425498008728027, "global_step": 27389, "epoch": 652} {"train_loss": -5.518766403198242, "global_step": 27390, "epoch": 652} {"train_loss": -5.398942947387695, "global_step": 27391, "epoch": 652} {"train_loss": -5.333654403686523, "global_step": 27392, "epoch": 652} {"train_loss": -5.481820106506348, "global_step": 27393, "epoch": 652} {"train_loss": -5.364327907562256, "global_step": 27394, "epoch": 652} {"train_loss": -5.458274841308594, "global_step": 27395, "epoch": 652} {"train_loss": -5.506010055541992, "global_step": 27396, "epoch": 652} {"train_loss": -5.343278884887695, "global_step": 27397, "epoch": 652} {"train_loss": -5.408132553100586, "global_step": 27398, "epoch": 652} {"train_loss": -5.444280624389648, "global_step": 27399, "epoch": 652} {"train_loss": -5.519272804260254, "global_step": 27400, "epoch": 652} {"train_loss": -5.451863765716553, "global_step": 27401, "epoch": 652} {"train_loss": -5.460353374481201, "global_step": 27402, "epoch": 652} {"train_loss": -5.29757833480835, "global_step": 27403, "epoch": 652} {"train_loss": -5.442039966583252, "global_step": 27404, "epoch": 652} {"train_loss": -5.406054496765137, "global_step": 27405, "epoch": 652} {"train_loss": -5.416647911071777, "global_step": 27406, "epoch": 652} {"train_loss": -5.423107147216797, "global_step": 27407, "epoch": 652} {"train_loss": -5.403694152832031, "global_step": 27408, "epoch": 652} {"train_loss": -5.389240264892578, "global_step": 27409, "epoch": 652} {"train_loss": -5.456582069396973, "global_step": 27410, "epoch": 652} {"train_loss": -5.432753562927246, "global_step": 27411, "epoch": 652} {"train_loss": -5.386538028717041, "global_step": 27412, "epoch": 652} {"train_loss": -5.343664169311523, "global_step": 27413, "epoch": 652} {"train_loss": -5.57405424118042, "global_step": 27414, "epoch": 652} {"train_loss": -5.367880344390869, "global_step": 27415, "epoch": 652} {"train_loss": -5.446415901184082, "global_step": 27416, "epoch": 652} {"train_loss": -5.371598243713379, "global_step": 27417, "epoch": 652} {"train_loss": -5.310690879821777, "global_step": 27418, "epoch": 652} {"train_loss": -5.344257354736328, "global_step": 27419, "epoch": 652} {"train_loss": -5.469927787780762, "global_step": 27420, "epoch": 652} {"train_loss": -5.384153366088867, "global_step": 27421, "epoch": 652} {"train_loss": -5.5179009437561035, "global_step": 27422, "epoch": 652} {"train_loss": -5.33702278137207, "global_step": 27423, "epoch": 652} {"train_loss": -5.466679573059082, "global_step": 27424, "epoch": 652} {"train_loss": -5.418706734975179, "global_step": 27425, "epoch": 652, "val_loss": 64477.12890625} {"train_loss": -5.411218643188477, "global_step": 27426, "epoch": 653} {"train_loss": -5.61204719543457, "global_step": 27427, "epoch": 653} {"train_loss": -5.327841758728027, "global_step": 27428, "epoch": 653} {"train_loss": -5.4029951095581055, "global_step": 27429, "epoch": 653} {"train_loss": -5.430984020233154, "global_step": 27430, "epoch": 653} {"train_loss": -5.4703898429870605, "global_step": 27431, "epoch": 653} {"train_loss": -5.51963996887207, "global_step": 27432, "epoch": 653} {"train_loss": -5.471430778503418, "global_step": 27433, "epoch": 653} {"train_loss": -5.445857048034668, "global_step": 27434, "epoch": 653} {"train_loss": -5.476508140563965, "global_step": 27435, "epoch": 653} {"train_loss": -5.513790607452393, "global_step": 27436, "epoch": 653} {"train_loss": -5.465667724609375, "global_step": 27437, "epoch": 653} {"train_loss": -5.43876838684082, "global_step": 27438, "epoch": 653} {"train_loss": -5.373979091644287, "global_step": 27439, "epoch": 653} {"train_loss": -5.453758716583252, "global_step": 27440, "epoch": 653} {"train_loss": -5.381024360656738, "global_step": 27441, "epoch": 653} {"train_loss": -5.525430202484131, "global_step": 27442, "epoch": 653} {"train_loss": -5.551597595214844, "global_step": 27443, "epoch": 653} {"train_loss": -5.544791221618652, "global_step": 27444, "epoch": 653} {"train_loss": -5.309161186218262, "global_step": 27445, "epoch": 653} {"train_loss": -5.372120380401611, "global_step": 27446, "epoch": 653} {"train_loss": -5.471424579620361, "global_step": 27447, "epoch": 653} {"train_loss": -5.415410041809082, "global_step": 27448, "epoch": 653} {"train_loss": -5.302153587341309, "global_step": 27449, "epoch": 653} {"train_loss": -5.5491533279418945, "global_step": 27450, "epoch": 653} {"train_loss": -5.360593795776367, "global_step": 27451, "epoch": 653} {"train_loss": -5.372462749481201, "global_step": 27452, "epoch": 653} {"train_loss": -5.456116199493408, "global_step": 27453, "epoch": 653} {"train_loss": -5.33359432220459, "global_step": 27454, "epoch": 653} {"train_loss": -5.2879638671875, "global_step": 27455, "epoch": 653} {"train_loss": -5.364980697631836, "global_step": 27456, "epoch": 653} {"train_loss": -5.390604019165039, "global_step": 27457, "epoch": 653} {"train_loss": -5.442328453063965, "global_step": 27458, "epoch": 653} {"train_loss": -5.353705406188965, "global_step": 27459, "epoch": 653} {"train_loss": -5.30689811706543, "global_step": 27460, "epoch": 653} {"train_loss": -5.481351852416992, "global_step": 27461, "epoch": 653} {"train_loss": -5.403354644775391, "global_step": 27462, "epoch": 653} {"train_loss": -5.556880950927734, "global_step": 27463, "epoch": 653} {"train_loss": -5.498712062835693, "global_step": 27464, "epoch": 653} {"train_loss": -5.43184232711792, "global_step": 27465, "epoch": 653} {"train_loss": -5.5340399742126465, "global_step": 27466, "epoch": 653} {"train_loss": -5.436262573514666, "global_step": 27467, "epoch": 653, "val_loss": 64111.25390625} {"train_loss": -5.498646259307861, "global_step": 27468, "epoch": 654} {"train_loss": -5.462177753448486, "global_step": 27469, "epoch": 654} {"train_loss": -5.515707015991211, "global_step": 27470, "epoch": 654} {"train_loss": -5.6041259765625, "global_step": 27471, "epoch": 654} {"train_loss": -5.396965026855469, "global_step": 27472, "epoch": 654} {"train_loss": -5.4945855140686035, "global_step": 27473, "epoch": 654} {"train_loss": -5.519674777984619, "global_step": 27474, "epoch": 654} {"train_loss": -5.458813667297363, "global_step": 27475, "epoch": 654} {"train_loss": -5.588434219360352, "global_step": 27476, "epoch": 654} {"train_loss": -5.427937984466553, "global_step": 27477, "epoch": 654} {"train_loss": -5.520867347717285, "global_step": 27478, "epoch": 654} {"train_loss": -5.440147876739502, "global_step": 27479, "epoch": 654} {"train_loss": -5.4167280197143555, "global_step": 27480, "epoch": 654} {"train_loss": -5.317292213439941, "global_step": 27481, "epoch": 654} {"train_loss": -5.41693115234375, "global_step": 27482, "epoch": 654} {"train_loss": -5.310585021972656, "global_step": 27483, "epoch": 654} {"train_loss": -5.441092491149902, "global_step": 27484, "epoch": 654} {"train_loss": -5.534168243408203, "global_step": 27485, "epoch": 654} {"train_loss": -5.277677059173584, "global_step": 27486, "epoch": 654} {"train_loss": -5.436944007873535, "global_step": 27487, "epoch": 654} {"train_loss": -5.2150421142578125, "global_step": 27488, "epoch": 654} {"train_loss": -5.363848686218262, "global_step": 27489, "epoch": 654} {"train_loss": -5.495492935180664, "global_step": 27490, "epoch": 654} {"train_loss": -5.313302993774414, "global_step": 27491, "epoch": 654} {"train_loss": -5.458384037017822, "global_step": 27492, "epoch": 654} {"train_loss": -5.570408821105957, "global_step": 27493, "epoch": 654} {"train_loss": -5.485069274902344, "global_step": 27494, "epoch": 654} {"train_loss": -5.392488479614258, "global_step": 27495, "epoch": 654} {"train_loss": -5.507602691650391, "global_step": 27496, "epoch": 654} {"train_loss": -5.516119003295898, "global_step": 27497, "epoch": 654} {"train_loss": -5.397281646728516, "global_step": 27498, "epoch": 654} {"train_loss": -5.413801193237305, "global_step": 27499, "epoch": 654} {"train_loss": -5.412088394165039, "global_step": 27500, "epoch": 654} {"train_loss": -5.388692378997803, "global_step": 27501, "epoch": 654} {"train_loss": -5.471471786499023, "global_step": 27502, "epoch": 654} {"train_loss": -5.3273749351501465, "global_step": 27503, "epoch": 654} {"train_loss": -5.215887069702148, "global_step": 27504, "epoch": 654} {"train_loss": -5.591269493103027, "global_step": 27505, "epoch": 654} {"train_loss": -5.143121719360352, "global_step": 27506, "epoch": 654} {"train_loss": -5.28304386138916, "global_step": 27507, "epoch": 654} {"train_loss": -5.409698963165283, "global_step": 27508, "epoch": 654} {"train_loss": -5.4188057127453035, "global_step": 27509, "epoch": 654, "val_loss": 64453.77734375} {"train_loss": -5.377306938171387, "global_step": 27510, "epoch": 655} {"train_loss": -5.1181793212890625, "global_step": 27511, "epoch": 655} {"train_loss": -5.2355241775512695, "global_step": 27512, "epoch": 655} {"train_loss": -5.33875846862793, "global_step": 27513, "epoch": 655} {"train_loss": -5.043712615966797, "global_step": 27514, "epoch": 655} {"train_loss": -5.4271392822265625, "global_step": 27515, "epoch": 655} {"train_loss": -5.082925796508789, "global_step": 27516, "epoch": 655} {"train_loss": -5.444810390472412, "global_step": 27517, "epoch": 655} {"train_loss": -5.238916873931885, "global_step": 27518, "epoch": 655} {"train_loss": -5.260596752166748, "global_step": 27519, "epoch": 655} {"train_loss": -5.344162464141846, "global_step": 27520, "epoch": 655} {"train_loss": -5.15233039855957, "global_step": 27521, "epoch": 655} {"train_loss": -5.226057529449463, "global_step": 27522, "epoch": 655} {"train_loss": -5.390564918518066, "global_step": 27523, "epoch": 655} {"train_loss": -5.268718242645264, "global_step": 27524, "epoch": 655} {"train_loss": -5.403537750244141, "global_step": 27525, "epoch": 655} {"train_loss": -5.432701110839844, "global_step": 27526, "epoch": 655} {"train_loss": -5.449860572814941, "global_step": 27527, "epoch": 655} {"train_loss": -5.375064373016357, "global_step": 27528, "epoch": 655} {"train_loss": -5.42839241027832, "global_step": 27529, "epoch": 655} {"train_loss": -5.318022727966309, "global_step": 27530, "epoch": 655} {"train_loss": -5.448935508728027, "global_step": 27531, "epoch": 655} {"train_loss": -5.345770359039307, "global_step": 27532, "epoch": 655} {"train_loss": -5.435540676116943, "global_step": 27533, "epoch": 655} {"train_loss": -5.388091087341309, "global_step": 27534, "epoch": 655} {"train_loss": -5.328821659088135, "global_step": 27535, "epoch": 655} {"train_loss": -5.442238807678223, "global_step": 27536, "epoch": 655} {"train_loss": -5.488998889923096, "global_step": 27537, "epoch": 655} {"train_loss": -5.468330383300781, "global_step": 27538, "epoch": 655} {"train_loss": -5.382478713989258, "global_step": 27539, "epoch": 655} {"train_loss": -5.491571426391602, "global_step": 27540, "epoch": 655} {"train_loss": -5.441238880157471, "global_step": 27541, "epoch": 655} {"train_loss": -5.375737190246582, "global_step": 27542, "epoch": 655} {"train_loss": -5.426421165466309, "global_step": 27543, "epoch": 655} {"train_loss": -5.528604507446289, "global_step": 27544, "epoch": 655} {"train_loss": -5.381784439086914, "global_step": 27545, "epoch": 655} {"train_loss": -5.461779594421387, "global_step": 27546, "epoch": 655} {"train_loss": -5.399736404418945, "global_step": 27547, "epoch": 655} {"train_loss": -5.535276412963867, "global_step": 27548, "epoch": 655} {"train_loss": -5.468688011169434, "global_step": 27549, "epoch": 655} {"train_loss": -5.449461460113525, "global_step": 27550, "epoch": 655} {"train_loss": -5.367098104386103, "global_step": 27551, "epoch": 655, "val_loss": 64289.31640625} {"train_loss": -5.457868576049805, "global_step": 27552, "epoch": 656} {"train_loss": -5.4791412353515625, "global_step": 27553, "epoch": 656} {"train_loss": -5.3125901222229, "global_step": 27554, "epoch": 656} {"train_loss": -5.463047504425049, "global_step": 27555, "epoch": 656} {"train_loss": -5.505964756011963, "global_step": 27556, "epoch": 656} {"train_loss": -5.303654193878174, "global_step": 27557, "epoch": 656} {"train_loss": -5.489365100860596, "global_step": 27558, "epoch": 656} {"train_loss": -5.429632663726807, "global_step": 27559, "epoch": 656} {"train_loss": -5.403543472290039, "global_step": 27560, "epoch": 656} {"train_loss": -5.370522975921631, "global_step": 27561, "epoch": 656} {"train_loss": -5.470243453979492, "global_step": 27562, "epoch": 656} {"train_loss": -5.491675853729248, "global_step": 27563, "epoch": 656} {"train_loss": -5.4762163162231445, "global_step": 27564, "epoch": 656} {"train_loss": -5.471404075622559, "global_step": 27565, "epoch": 656} {"train_loss": -5.413154125213623, "global_step": 27566, "epoch": 656} {"train_loss": -5.4793381690979, "global_step": 27567, "epoch": 656} {"train_loss": -5.324416160583496, "global_step": 27568, "epoch": 656} {"train_loss": -5.4735870361328125, "global_step": 27569, "epoch": 656} {"train_loss": -5.513444423675537, "global_step": 27570, "epoch": 656} {"train_loss": -5.465959548950195, "global_step": 27571, "epoch": 656} {"train_loss": -5.534392356872559, "global_step": 27572, "epoch": 656} {"train_loss": -5.503625869750977, "global_step": 27573, "epoch": 656} {"train_loss": -5.315887451171875, "global_step": 27574, "epoch": 656} {"train_loss": -5.428860664367676, "global_step": 27575, "epoch": 656} {"train_loss": -5.547679424285889, "global_step": 27576, "epoch": 656} {"train_loss": -5.38417387008667, "global_step": 27577, "epoch": 656} {"train_loss": -5.222867488861084, "global_step": 27578, "epoch": 656} {"train_loss": -5.2549943923950195, "global_step": 27579, "epoch": 656} {"train_loss": -5.496128082275391, "global_step": 27580, "epoch": 656} {"train_loss": -5.328322410583496, "global_step": 27581, "epoch": 656} {"train_loss": -5.401442527770996, "global_step": 27582, "epoch": 656} {"train_loss": -5.537667274475098, "global_step": 27583, "epoch": 656} {"train_loss": -5.524816513061523, "global_step": 27584, "epoch": 656} {"train_loss": -5.444924354553223, "global_step": 27585, "epoch": 656} {"train_loss": -5.332298278808594, "global_step": 27586, "epoch": 656} {"train_loss": -5.498307704925537, "global_step": 27587, "epoch": 656} {"train_loss": -5.202981948852539, "global_step": 27588, "epoch": 656} {"train_loss": -5.339656829833984, "global_step": 27589, "epoch": 656} {"train_loss": -5.456387519836426, "global_step": 27590, "epoch": 656} {"train_loss": -5.328249931335449, "global_step": 27591, "epoch": 656} {"train_loss": -5.427944183349609, "global_step": 27592, "epoch": 656} {"train_loss": -5.424485263370332, "global_step": 27593, "epoch": 656, "val_loss": 64846.51953125} {"train_loss": -5.33544921875, "global_step": 27594, "epoch": 657} {"train_loss": -5.372364044189453, "global_step": 27595, "epoch": 657} {"train_loss": -5.454143524169922, "global_step": 27596, "epoch": 657} {"train_loss": -5.383815288543701, "global_step": 27597, "epoch": 657} {"train_loss": -5.310527801513672, "global_step": 27598, "epoch": 657} {"train_loss": -5.47041654586792, "global_step": 27599, "epoch": 657} {"train_loss": -5.472734451293945, "global_step": 27600, "epoch": 657} {"train_loss": -5.467868328094482, "global_step": 27601, "epoch": 657} {"train_loss": -5.443764686584473, "global_step": 27602, "epoch": 657} {"train_loss": -5.412391662597656, "global_step": 27603, "epoch": 657} {"train_loss": -5.3981828689575195, "global_step": 27604, "epoch": 657} {"train_loss": -5.364350318908691, "global_step": 27605, "epoch": 657} {"train_loss": -5.459484577178955, "global_step": 27606, "epoch": 657} {"train_loss": -5.392744541168213, "global_step": 27607, "epoch": 657} {"train_loss": -5.334501266479492, "global_step": 27608, "epoch": 657} {"train_loss": -5.492465972900391, "global_step": 27609, "epoch": 657} {"train_loss": -5.493555068969727, "global_step": 27610, "epoch": 657} {"train_loss": -5.356174468994141, "global_step": 27611, "epoch": 657} {"train_loss": -5.3531270027160645, "global_step": 27612, "epoch": 657} {"train_loss": -5.466691017150879, "global_step": 27613, "epoch": 657} {"train_loss": -5.483002185821533, "global_step": 27614, "epoch": 657} {"train_loss": -5.600505828857422, "global_step": 27615, "epoch": 657} {"train_loss": -5.511807441711426, "global_step": 27616, "epoch": 657} {"train_loss": -5.474137306213379, "global_step": 27617, "epoch": 657} {"train_loss": -5.444637298583984, "global_step": 27618, "epoch": 657} {"train_loss": -5.509958267211914, "global_step": 27619, "epoch": 657} {"train_loss": -5.377995491027832, "global_step": 27620, "epoch": 657} {"train_loss": -5.457950592041016, "global_step": 27621, "epoch": 657} {"train_loss": -5.451276779174805, "global_step": 27622, "epoch": 657} {"train_loss": -5.477171897888184, "global_step": 27623, "epoch": 657} {"train_loss": -5.390929698944092, "global_step": 27624, "epoch": 657} {"train_loss": -5.461682319641113, "global_step": 27625, "epoch": 657} {"train_loss": -5.318246841430664, "global_step": 27626, "epoch": 657} {"train_loss": -5.27066707611084, "global_step": 27627, "epoch": 657} {"train_loss": -5.3872599601745605, "global_step": 27628, "epoch": 657} {"train_loss": -5.195352554321289, "global_step": 27629, "epoch": 657} {"train_loss": -5.3647332191467285, "global_step": 27630, "epoch": 657} {"train_loss": -5.450875282287598, "global_step": 27631, "epoch": 657} {"train_loss": -5.203159332275391, "global_step": 27632, "epoch": 657} {"train_loss": -5.384406566619873, "global_step": 27633, "epoch": 657} {"train_loss": -5.288079261779785, "global_step": 27634, "epoch": 657} {"train_loss": -5.408521391096569, "global_step": 27635, "epoch": 657, "val_loss": 64007.58984375} {"train_loss": -5.498684406280518, "global_step": 27636, "epoch": 658} {"train_loss": -5.417825698852539, "global_step": 27637, "epoch": 658} {"train_loss": -5.404337406158447, "global_step": 27638, "epoch": 658} {"train_loss": -5.36965274810791, "global_step": 27639, "epoch": 658} {"train_loss": -5.470785617828369, "global_step": 27640, "epoch": 658} {"train_loss": -5.369314193725586, "global_step": 27641, "epoch": 658} {"train_loss": -5.446697235107422, "global_step": 27642, "epoch": 658} {"train_loss": -5.419211387634277, "global_step": 27643, "epoch": 658} {"train_loss": -5.515877723693848, "global_step": 27644, "epoch": 658} {"train_loss": -5.499817371368408, "global_step": 27645, "epoch": 658} {"train_loss": -5.392996788024902, "global_step": 27646, "epoch": 658} {"train_loss": -5.420327186584473, "global_step": 27647, "epoch": 658} {"train_loss": -5.360930442810059, "global_step": 27648, "epoch": 658} {"train_loss": -5.517909526824951, "global_step": 27649, "epoch": 658} {"train_loss": -5.346717834472656, "global_step": 27650, "epoch": 658} {"train_loss": -5.361131191253662, "global_step": 27651, "epoch": 658} {"train_loss": -5.379755973815918, "global_step": 27652, "epoch": 658} {"train_loss": -5.4470367431640625, "global_step": 27653, "epoch": 658} {"train_loss": -5.370016098022461, "global_step": 27654, "epoch": 658} {"train_loss": -5.4272966384887695, "global_step": 27655, "epoch": 658} {"train_loss": -5.443212032318115, "global_step": 27656, "epoch": 658} {"train_loss": -5.405299186706543, "global_step": 27657, "epoch": 658} {"train_loss": -5.391295433044434, "global_step": 27658, "epoch": 658} {"train_loss": -5.472504138946533, "global_step": 27659, "epoch": 658} {"train_loss": -5.574113845825195, "global_step": 27660, "epoch": 658} {"train_loss": -5.431641578674316, "global_step": 27661, "epoch": 658} {"train_loss": -5.4034423828125, "global_step": 27662, "epoch": 658} {"train_loss": -5.4958696365356445, "global_step": 27663, "epoch": 658} {"train_loss": -5.498279571533203, "global_step": 27664, "epoch": 658} {"train_loss": -5.41565465927124, "global_step": 27665, "epoch": 658} {"train_loss": -5.489629745483398, "global_step": 27666, "epoch": 658} {"train_loss": -5.425481796264648, "global_step": 27667, "epoch": 658} {"train_loss": -5.402883052825928, "global_step": 27668, "epoch": 658} {"train_loss": -5.484683513641357, "global_step": 27669, "epoch": 658} {"train_loss": -5.428544044494629, "global_step": 27670, "epoch": 658} {"train_loss": -5.470859527587891, "global_step": 27671, "epoch": 658} {"train_loss": -5.530153751373291, "global_step": 27672, "epoch": 658} {"train_loss": -5.3789191246032715, "global_step": 27673, "epoch": 658} {"train_loss": -5.29039192199707, "global_step": 27674, "epoch": 658} {"train_loss": -5.4922332763671875, "global_step": 27675, "epoch": 658} {"train_loss": -5.307437896728516, "global_step": 27676, "epoch": 658} {"train_loss": -5.431063288734073, "global_step": 27677, "epoch": 658, "val_loss": 64475.34765625} {"train_loss": -5.480351448059082, "global_step": 27678, "epoch": 659} {"train_loss": -5.418588638305664, "global_step": 27679, "epoch": 659} {"train_loss": -5.36545467376709, "global_step": 27680, "epoch": 659} {"train_loss": -5.4929046630859375, "global_step": 27681, "epoch": 659} {"train_loss": -5.308185577392578, "global_step": 27682, "epoch": 659} {"train_loss": -5.622079849243164, "global_step": 27683, "epoch": 659} {"train_loss": -5.363616943359375, "global_step": 27684, "epoch": 659} {"train_loss": -5.421509265899658, "global_step": 27685, "epoch": 659} {"train_loss": -5.345314979553223, "global_step": 27686, "epoch": 659} {"train_loss": -5.521683216094971, "global_step": 27687, "epoch": 659} {"train_loss": -5.378486633300781, "global_step": 27688, "epoch": 659} {"train_loss": -5.40250301361084, "global_step": 27689, "epoch": 659} {"train_loss": -5.400547027587891, "global_step": 27690, "epoch": 659} {"train_loss": -5.437700271606445, "global_step": 27691, "epoch": 659} {"train_loss": -5.369731426239014, "global_step": 27692, "epoch": 659} {"train_loss": -5.37033224105835, "global_step": 27693, "epoch": 659} {"train_loss": -5.393603324890137, "global_step": 27694, "epoch": 659} {"train_loss": -5.290868759155273, "global_step": 27695, "epoch": 659} {"train_loss": -5.37872314453125, "global_step": 27696, "epoch": 659} {"train_loss": -5.543280601501465, "global_step": 27697, "epoch": 659} {"train_loss": -5.554252624511719, "global_step": 27698, "epoch": 659} {"train_loss": -5.4784345626831055, "global_step": 27699, "epoch": 659} {"train_loss": -5.49594783782959, "global_step": 27700, "epoch": 659} {"train_loss": -5.483100891113281, "global_step": 27701, "epoch": 659} {"train_loss": -5.446028232574463, "global_step": 27702, "epoch": 659} {"train_loss": -5.423500061035156, "global_step": 27703, "epoch": 659} {"train_loss": -5.399320602416992, "global_step": 27704, "epoch": 659} {"train_loss": -5.346324920654297, "global_step": 27705, "epoch": 659} {"train_loss": -5.4742045402526855, "global_step": 27706, "epoch": 659} {"train_loss": -5.398334980010986, "global_step": 27707, "epoch": 659} {"train_loss": -5.40737247467041, "global_step": 27708, "epoch": 659} {"train_loss": -5.46562385559082, "global_step": 27709, "epoch": 659} {"train_loss": -5.530294418334961, "global_step": 27710, "epoch": 659} {"train_loss": -5.3947553634643555, "global_step": 27711, "epoch": 659} {"train_loss": -5.435113906860352, "global_step": 27712, "epoch": 659} {"train_loss": -5.689708709716797, "global_step": 27713, "epoch": 659} {"train_loss": -5.424916744232178, "global_step": 27714, "epoch": 659} {"train_loss": -5.490811347961426, "global_step": 27715, "epoch": 659} {"train_loss": -5.396895408630371, "global_step": 27716, "epoch": 659} {"train_loss": -5.481631755828857, "global_step": 27717, "epoch": 659} {"train_loss": -5.370238304138184, "global_step": 27718, "epoch": 659} {"train_loss": -5.433801980245681, "global_step": 27719, "epoch": 659, "val_loss": 64335.515625} {"train_loss": -5.386938095092773, "global_step": 27720, "epoch": 660} {"train_loss": -5.393299579620361, "global_step": 27721, "epoch": 660} {"train_loss": -5.430473327636719, "global_step": 27722, "epoch": 660} {"train_loss": -5.347380638122559, "global_step": 27723, "epoch": 660} {"train_loss": -5.395044803619385, "global_step": 27724, "epoch": 660} {"train_loss": -5.4047136306762695, "global_step": 27725, "epoch": 660} {"train_loss": -5.3069047927856445, "global_step": 27726, "epoch": 660} {"train_loss": -5.457187175750732, "global_step": 27727, "epoch": 660} {"train_loss": -5.2627363204956055, "global_step": 27728, "epoch": 660} {"train_loss": -5.484745025634766, "global_step": 27729, "epoch": 660} {"train_loss": -5.4921979904174805, "global_step": 27730, "epoch": 660} {"train_loss": -5.379672050476074, "global_step": 27731, "epoch": 660} {"train_loss": -5.390204906463623, "global_step": 27732, "epoch": 660} {"train_loss": -5.426333427429199, "global_step": 27733, "epoch": 660} {"train_loss": -5.433063507080078, "global_step": 27734, "epoch": 660} {"train_loss": -5.444726943969727, "global_step": 27735, "epoch": 660} {"train_loss": -5.385073661804199, "global_step": 27736, "epoch": 660} {"train_loss": -5.4191131591796875, "global_step": 27737, "epoch": 660} {"train_loss": -5.3608622550964355, "global_step": 27738, "epoch": 660} {"train_loss": -5.43435001373291, "global_step": 27739, "epoch": 660} {"train_loss": -5.419375419616699, "global_step": 27740, "epoch": 660} {"train_loss": -5.382388591766357, "global_step": 27741, "epoch": 660} {"train_loss": -5.368206977844238, "global_step": 27742, "epoch": 660} {"train_loss": -5.407327651977539, "global_step": 27743, "epoch": 660} {"train_loss": -5.355541229248047, "global_step": 27744, "epoch": 660} {"train_loss": -5.474961280822754, "global_step": 27745, "epoch": 660} {"train_loss": -5.486153602600098, "global_step": 27746, "epoch": 660} {"train_loss": -5.481386184692383, "global_step": 27747, "epoch": 660} {"train_loss": -5.5153913497924805, "global_step": 27748, "epoch": 660} {"train_loss": -5.587252140045166, "global_step": 27749, "epoch": 660} {"train_loss": -5.444851398468018, "global_step": 27750, "epoch": 660} {"train_loss": -5.3912506103515625, "global_step": 27751, "epoch": 660} {"train_loss": -5.543668746948242, "global_step": 27752, "epoch": 660} {"train_loss": -5.41297721862793, "global_step": 27753, "epoch": 660} {"train_loss": -5.471579551696777, "global_step": 27754, "epoch": 660} {"train_loss": -5.420570373535156, "global_step": 27755, "epoch": 660} {"train_loss": -5.397867202758789, "global_step": 27756, "epoch": 660} {"train_loss": -5.337406635284424, "global_step": 27757, "epoch": 660} {"train_loss": -5.505408763885498, "global_step": 27758, "epoch": 660} {"train_loss": -5.5028157234191895, "global_step": 27759, "epoch": 660} {"train_loss": -5.605014324188232, "global_step": 27760, "epoch": 660} {"train_loss": -5.429563022795177, "global_step": 27761, "epoch": 660, "val_loss": 64314.52734375} {"train_loss": -5.441680431365967, "global_step": 27762, "epoch": 661} {"train_loss": -5.362579345703125, "global_step": 27763, "epoch": 661} {"train_loss": -5.477851867675781, "global_step": 27764, "epoch": 661} {"train_loss": -5.496196746826172, "global_step": 27765, "epoch": 661} {"train_loss": -5.350595474243164, "global_step": 27766, "epoch": 661} {"train_loss": -5.375266075134277, "global_step": 27767, "epoch": 661} {"train_loss": -5.504180908203125, "global_step": 27768, "epoch": 661} {"train_loss": -5.3963942527771, "global_step": 27769, "epoch": 661} {"train_loss": -5.330437660217285, "global_step": 27770, "epoch": 661} {"train_loss": -5.475222110748291, "global_step": 27771, "epoch": 661} {"train_loss": -5.319636344909668, "global_step": 27772, "epoch": 661} {"train_loss": -5.420555114746094, "global_step": 27773, "epoch": 661} {"train_loss": -5.341619491577148, "global_step": 27774, "epoch": 661} {"train_loss": -5.34379768371582, "global_step": 27775, "epoch": 661} {"train_loss": -5.423043251037598, "global_step": 27776, "epoch": 661} {"train_loss": -5.351323127746582, "global_step": 27777, "epoch": 661} {"train_loss": -5.476980686187744, "global_step": 27778, "epoch": 661} {"train_loss": -5.482434272766113, "global_step": 27779, "epoch": 661} {"train_loss": -5.404019832611084, "global_step": 27780, "epoch": 661} {"train_loss": -5.459663391113281, "global_step": 27781, "epoch": 661} {"train_loss": -5.445184707641602, "global_step": 27782, "epoch": 661} {"train_loss": -5.320174694061279, "global_step": 27783, "epoch": 661} {"train_loss": -5.555300712585449, "global_step": 27784, "epoch": 661} {"train_loss": -5.510800361633301, "global_step": 27785, "epoch": 661} {"train_loss": -5.3586530685424805, "global_step": 27786, "epoch": 661} {"train_loss": -5.483147621154785, "global_step": 27787, "epoch": 661} {"train_loss": -5.595564842224121, "global_step": 27788, "epoch": 661} {"train_loss": -5.325229167938232, "global_step": 27789, "epoch": 661} {"train_loss": -5.492592811584473, "global_step": 27790, "epoch": 661} {"train_loss": -5.430102825164795, "global_step": 27791, "epoch": 661} {"train_loss": -5.502552032470703, "global_step": 27792, "epoch": 661} {"train_loss": -5.318324089050293, "global_step": 27793, "epoch": 661} {"train_loss": -5.351330757141113, "global_step": 27794, "epoch": 661} {"train_loss": -5.481666564941406, "global_step": 27795, "epoch": 661} {"train_loss": -5.417791366577148, "global_step": 27796, "epoch": 661} {"train_loss": -5.4180803298950195, "global_step": 27797, "epoch": 661} {"train_loss": -5.388924598693848, "global_step": 27798, "epoch": 661} {"train_loss": -5.39251708984375, "global_step": 27799, "epoch": 661} {"train_loss": -5.479507923126221, "global_step": 27800, "epoch": 661} {"train_loss": -5.498290061950684, "global_step": 27801, "epoch": 661} {"train_loss": -5.375892162322998, "global_step": 27802, "epoch": 661} {"train_loss": -5.4250471364884145, "global_step": 27803, "epoch": 661, "val_loss": 63973.3046875} {"train_loss": -5.438085079193115, "global_step": 27804, "epoch": 662} {"train_loss": -5.331057548522949, "global_step": 27805, "epoch": 662} {"train_loss": -5.341999530792236, "global_step": 27806, "epoch": 662} {"train_loss": -5.381816387176514, "global_step": 27807, "epoch": 662} {"train_loss": -5.355745315551758, "global_step": 27808, "epoch": 662} {"train_loss": -5.3715996742248535, "global_step": 27809, "epoch": 662} {"train_loss": -5.47654914855957, "global_step": 27810, "epoch": 662} {"train_loss": -5.280328750610352, "global_step": 27811, "epoch": 662} {"train_loss": -5.401655197143555, "global_step": 27812, "epoch": 662} {"train_loss": -5.441232681274414, "global_step": 27813, "epoch": 662} {"train_loss": -5.468343734741211, "global_step": 27814, "epoch": 662} {"train_loss": -5.463356018066406, "global_step": 27815, "epoch": 662} {"train_loss": -5.600902557373047, "global_step": 27816, "epoch": 662} {"train_loss": -5.484837532043457, "global_step": 27817, "epoch": 662} {"train_loss": -5.439057350158691, "global_step": 27818, "epoch": 662} {"train_loss": -5.440632343292236, "global_step": 27819, "epoch": 662} {"train_loss": -5.435655117034912, "global_step": 27820, "epoch": 662} {"train_loss": -5.378931999206543, "global_step": 27821, "epoch": 662} {"train_loss": -5.317120552062988, "global_step": 27822, "epoch": 662} {"train_loss": -5.413596153259277, "global_step": 27823, "epoch": 662} {"train_loss": -5.516098976135254, "global_step": 27824, "epoch": 662} {"train_loss": -5.369110584259033, "global_step": 27825, "epoch": 662} {"train_loss": -5.446384429931641, "global_step": 27826, "epoch": 662} {"train_loss": -5.516522407531738, "global_step": 27827, "epoch": 662} {"train_loss": -5.430237770080566, "global_step": 27828, "epoch": 662} {"train_loss": -5.445838451385498, "global_step": 27829, "epoch": 662} {"train_loss": -5.538008689880371, "global_step": 27830, "epoch": 662} {"train_loss": -5.499636173248291, "global_step": 27831, "epoch": 662} {"train_loss": -5.409196376800537, "global_step": 27832, "epoch": 662} {"train_loss": -5.511255741119385, "global_step": 27833, "epoch": 662} {"train_loss": -5.466193675994873, "global_step": 27834, "epoch": 662} {"train_loss": -5.368600845336914, "global_step": 27835, "epoch": 662} {"train_loss": -5.461284637451172, "global_step": 27836, "epoch": 662} {"train_loss": -5.480004787445068, "global_step": 27837, "epoch": 662} {"train_loss": -5.518684387207031, "global_step": 27838, "epoch": 662} {"train_loss": -5.479594707489014, "global_step": 27839, "epoch": 662} {"train_loss": -5.382904052734375, "global_step": 27840, "epoch": 662} {"train_loss": -5.487921237945557, "global_step": 27841, "epoch": 662} {"train_loss": -5.445684432983398, "global_step": 27842, "epoch": 662} {"train_loss": -5.538531303405762, "global_step": 27843, "epoch": 662} {"train_loss": -5.427498817443848, "global_step": 27844, "epoch": 662} {"train_loss": -5.4412281059083485, "global_step": 27845, "epoch": 662, "val_loss": 64060.8046875} {"train_loss": -5.390224456787109, "global_step": 27846, "epoch": 663} {"train_loss": -5.545378684997559, "global_step": 27847, "epoch": 663} {"train_loss": -5.481706619262695, "global_step": 27848, "epoch": 663} {"train_loss": -5.431652545928955, "global_step": 27849, "epoch": 663} {"train_loss": -5.47590446472168, "global_step": 27850, "epoch": 663} {"train_loss": -5.525580406188965, "global_step": 27851, "epoch": 663} {"train_loss": -5.5649518966674805, "global_step": 27852, "epoch": 663} {"train_loss": -5.359842777252197, "global_step": 27853, "epoch": 663} {"train_loss": -5.372702598571777, "global_step": 27854, "epoch": 663} {"train_loss": -5.31058931350708, "global_step": 27855, "epoch": 663} {"train_loss": -5.3488593101501465, "global_step": 27856, "epoch": 663} {"train_loss": -5.548684597015381, "global_step": 27857, "epoch": 663} {"train_loss": -5.4005126953125, "global_step": 27858, "epoch": 663} {"train_loss": -5.40654182434082, "global_step": 27859, "epoch": 663} {"train_loss": -5.604000091552734, "global_step": 27860, "epoch": 663} {"train_loss": -5.622941493988037, "global_step": 27861, "epoch": 663} {"train_loss": -5.534159183502197, "global_step": 27862, "epoch": 663} {"train_loss": -5.44817590713501, "global_step": 27863, "epoch": 663} {"train_loss": -5.474964141845703, "global_step": 27864, "epoch": 663} {"train_loss": -5.372858047485352, "global_step": 27865, "epoch": 663} {"train_loss": -5.439242362976074, "global_step": 27866, "epoch": 663} {"train_loss": -5.431352615356445, "global_step": 27867, "epoch": 663} {"train_loss": -5.390902042388916, "global_step": 27868, "epoch": 663} {"train_loss": -5.338686943054199, "global_step": 27869, "epoch": 663} {"train_loss": -5.303163051605225, "global_step": 27870, "epoch": 663} {"train_loss": -5.380642890930176, "global_step": 27871, "epoch": 663} {"train_loss": -5.362522602081299, "global_step": 27872, "epoch": 663} {"train_loss": -5.40617036819458, "global_step": 27873, "epoch": 663} {"train_loss": -5.287813663482666, "global_step": 27874, "epoch": 663} {"train_loss": -5.40709114074707, "global_step": 27875, "epoch": 663} {"train_loss": -5.470632076263428, "global_step": 27876, "epoch": 663} {"train_loss": -5.407752990722656, "global_step": 27877, "epoch": 663} {"train_loss": -5.404877662658691, "global_step": 27878, "epoch": 663} {"train_loss": -5.333308219909668, "global_step": 27879, "epoch": 663} {"train_loss": -5.378166675567627, "global_step": 27880, "epoch": 663} {"train_loss": -5.416923999786377, "global_step": 27881, "epoch": 663} {"train_loss": -5.328496932983398, "global_step": 27882, "epoch": 663} {"train_loss": -5.5352888107299805, "global_step": 27883, "epoch": 663} {"train_loss": -5.525705337524414, "global_step": 27884, "epoch": 663} {"train_loss": -5.488741874694824, "global_step": 27885, "epoch": 663} {"train_loss": -5.499073028564453, "global_step": 27886, "epoch": 663} {"train_loss": -5.433594556081863, "global_step": 27887, "epoch": 663, "val_loss": 63855.0} {"train_loss": -5.413452625274658, "global_step": 27888, "epoch": 664} {"train_loss": -5.381792068481445, "global_step": 27889, "epoch": 664} {"train_loss": -5.592413425445557, "global_step": 27890, "epoch": 664} {"train_loss": -5.4984049797058105, "global_step": 27891, "epoch": 664} {"train_loss": -5.579132080078125, "global_step": 27892, "epoch": 664} {"train_loss": -5.580943584442139, "global_step": 27893, "epoch": 664} {"train_loss": -5.4505438804626465, "global_step": 27894, "epoch": 664} {"train_loss": -5.5204620361328125, "global_step": 27895, "epoch": 664} {"train_loss": -5.350364685058594, "global_step": 27896, "epoch": 664} {"train_loss": -5.3473920822143555, "global_step": 27897, "epoch": 664} {"train_loss": -5.483415126800537, "global_step": 27898, "epoch": 664} {"train_loss": -5.470937728881836, "global_step": 27899, "epoch": 664} {"train_loss": -5.443917751312256, "global_step": 27900, "epoch": 664} {"train_loss": -5.413368225097656, "global_step": 27901, "epoch": 664} {"train_loss": -5.522536277770996, "global_step": 27902, "epoch": 664} {"train_loss": -5.446696758270264, "global_step": 27903, "epoch": 664} {"train_loss": -5.483654022216797, "global_step": 27904, "epoch": 664} {"train_loss": -5.322847366333008, "global_step": 27905, "epoch": 664} {"train_loss": -5.405856132507324, "global_step": 27906, "epoch": 664} {"train_loss": -5.4609174728393555, "global_step": 27907, "epoch": 664} {"train_loss": -5.526846885681152, "global_step": 27908, "epoch": 664} {"train_loss": -5.349861145019531, "global_step": 27909, "epoch": 664} {"train_loss": -5.52762508392334, "global_step": 27910, "epoch": 664} {"train_loss": -5.509054183959961, "global_step": 27911, "epoch": 664} {"train_loss": -5.369078636169434, "global_step": 27912, "epoch": 664} {"train_loss": -5.489936828613281, "global_step": 27913, "epoch": 664} {"train_loss": -5.45549201965332, "global_step": 27914, "epoch": 664} {"train_loss": -5.487043380737305, "global_step": 27915, "epoch": 664} {"train_loss": -5.443000793457031, "global_step": 27916, "epoch": 664} {"train_loss": -5.46993350982666, "global_step": 27917, "epoch": 664} {"train_loss": -5.36273193359375, "global_step": 27918, "epoch": 664} {"train_loss": -5.387113094329834, "global_step": 27919, "epoch": 664} {"train_loss": -5.400017738342285, "global_step": 27920, "epoch": 664} {"train_loss": -5.427063941955566, "global_step": 27921, "epoch": 664} {"train_loss": -5.464548587799072, "global_step": 27922, "epoch": 664} {"train_loss": -5.467545032501221, "global_step": 27923, "epoch": 664} {"train_loss": -5.451143264770508, "global_step": 27924, "epoch": 664} {"train_loss": -5.376791000366211, "global_step": 27925, "epoch": 664} {"train_loss": -5.54707670211792, "global_step": 27926, "epoch": 664} {"train_loss": -5.436375617980957, "global_step": 27927, "epoch": 664} {"train_loss": -5.382100582122803, "global_step": 27928, "epoch": 664} {"train_loss": -5.450332914079938, "global_step": 27929, "epoch": 664, "val_loss": 63892.17578125} {"train_loss": -5.487318515777588, "global_step": 27930, "epoch": 665} {"train_loss": -5.396306037902832, "global_step": 27931, "epoch": 665} {"train_loss": -5.529048919677734, "global_step": 27932, "epoch": 665} {"train_loss": -5.397711753845215, "global_step": 27933, "epoch": 665} {"train_loss": -5.468715667724609, "global_step": 27934, "epoch": 665} {"train_loss": -5.513025760650635, "global_step": 27935, "epoch": 665} {"train_loss": -5.4392619132995605, "global_step": 27936, "epoch": 665} {"train_loss": -5.451233386993408, "global_step": 27937, "epoch": 665} {"train_loss": -5.342001914978027, "global_step": 27938, "epoch": 665} {"train_loss": -5.279941558837891, "global_step": 27939, "epoch": 665} {"train_loss": -5.519828796386719, "global_step": 27940, "epoch": 665} {"train_loss": -5.3114776611328125, "global_step": 27941, "epoch": 665} {"train_loss": -5.4189863204956055, "global_step": 27942, "epoch": 665} {"train_loss": -5.4416608810424805, "global_step": 27943, "epoch": 665} {"train_loss": -5.3841352462768555, "global_step": 27944, "epoch": 665} {"train_loss": -5.366977691650391, "global_step": 27945, "epoch": 665} {"train_loss": -5.446324348449707, "global_step": 27946, "epoch": 665} {"train_loss": -5.266107559204102, "global_step": 27947, "epoch": 665} {"train_loss": -5.56007719039917, "global_step": 27948, "epoch": 665} {"train_loss": -5.3575663566589355, "global_step": 27949, "epoch": 665} {"train_loss": -5.463863372802734, "global_step": 27950, "epoch": 665} {"train_loss": -5.425527095794678, "global_step": 27951, "epoch": 665} {"train_loss": -5.370950698852539, "global_step": 27952, "epoch": 665} {"train_loss": -5.345210075378418, "global_step": 27953, "epoch": 665} {"train_loss": -5.442286491394043, "global_step": 27954, "epoch": 665} {"train_loss": -5.419517517089844, "global_step": 27955, "epoch": 665} {"train_loss": -5.396059036254883, "global_step": 27956, "epoch": 665} {"train_loss": -5.33555793762207, "global_step": 27957, "epoch": 665} {"train_loss": -5.538192272186279, "global_step": 27958, "epoch": 665} {"train_loss": -5.41861629486084, "global_step": 27959, "epoch": 665} {"train_loss": -5.406813621520996, "global_step": 27960, "epoch": 665} {"train_loss": -5.507043361663818, "global_step": 27961, "epoch": 665} {"train_loss": -5.429586887359619, "global_step": 27962, "epoch": 665} {"train_loss": -5.391366958618164, "global_step": 27963, "epoch": 665} {"train_loss": -5.3781657218933105, "global_step": 27964, "epoch": 665} {"train_loss": -5.304389476776123, "global_step": 27965, "epoch": 665} {"train_loss": -5.515313148498535, "global_step": 27966, "epoch": 665} {"train_loss": -5.384117126464844, "global_step": 27967, "epoch": 665} {"train_loss": -5.429093360900879, "global_step": 27968, "epoch": 665} {"train_loss": -5.340323448181152, "global_step": 27969, "epoch": 665} {"train_loss": -5.342382431030273, "global_step": 27970, "epoch": 665} {"train_loss": -5.413308620452881, "global_step": 27971, "epoch": 665, "val_loss": 63914.0703125} {"train_loss": -5.5149149894714355, "global_step": 27972, "epoch": 666} {"train_loss": -5.5679216384887695, "global_step": 27973, "epoch": 666} {"train_loss": -5.375199794769287, "global_step": 27974, "epoch": 666} {"train_loss": -5.471278190612793, "global_step": 27975, "epoch": 666} {"train_loss": -5.623804092407227, "global_step": 27976, "epoch": 666} {"train_loss": -5.537932395935059, "global_step": 27977, "epoch": 666} {"train_loss": -5.4002580642700195, "global_step": 27978, "epoch": 666} {"train_loss": -5.527923583984375, "global_step": 27979, "epoch": 666} {"train_loss": -5.413142204284668, "global_step": 27980, "epoch": 666} {"train_loss": -5.348614692687988, "global_step": 27981, "epoch": 666} {"train_loss": -5.406755447387695, "global_step": 27982, "epoch": 666} {"train_loss": -5.428885459899902, "global_step": 27983, "epoch": 666} {"train_loss": -5.631991386413574, "global_step": 27984, "epoch": 666} {"train_loss": -5.4241228103637695, "global_step": 27985, "epoch": 666} {"train_loss": -5.439191818237305, "global_step": 27986, "epoch": 666} {"train_loss": -5.48012638092041, "global_step": 27987, "epoch": 666} {"train_loss": -5.5703349113464355, "global_step": 27988, "epoch": 666} {"train_loss": -5.246432781219482, "global_step": 27989, "epoch": 666} {"train_loss": -5.420848846435547, "global_step": 27990, "epoch": 666} {"train_loss": -5.52427864074707, "global_step": 27991, "epoch": 666} {"train_loss": -5.371522426605225, "global_step": 27992, "epoch": 666} {"train_loss": -5.430865287780762, "global_step": 27993, "epoch": 666} {"train_loss": -5.442661285400391, "global_step": 27994, "epoch": 666} {"train_loss": -5.440609455108643, "global_step": 27995, "epoch": 666} {"train_loss": -5.384272575378418, "global_step": 27996, "epoch": 666} {"train_loss": -5.421375274658203, "global_step": 27997, "epoch": 666} {"train_loss": -5.391255855560303, "global_step": 27998, "epoch": 666} {"train_loss": -5.3339738845825195, "global_step": 27999, "epoch": 666} {"train_loss": -5.425076961517334, "global_step": 28000, "epoch": 666} {"train_loss": -5.248344898223877, "global_step": 28001, "epoch": 666} {"train_loss": -5.5917277336120605, "global_step": 28002, "epoch": 666} {"train_loss": -5.270175457000732, "global_step": 28003, "epoch": 666} {"train_loss": -5.367331027984619, "global_step": 28004, "epoch": 666} {"train_loss": -5.377124786376953, "global_step": 28005, "epoch": 666} {"train_loss": -5.278305530548096, "global_step": 28006, "epoch": 666} {"train_loss": -5.42337703704834, "global_step": 28007, "epoch": 666} {"train_loss": -5.391789436340332, "global_step": 28008, "epoch": 666} {"train_loss": -5.3982930183410645, "global_step": 28009, "epoch": 666} {"train_loss": -5.435883522033691, "global_step": 28010, "epoch": 666} {"train_loss": -5.357850551605225, "global_step": 28011, "epoch": 666} {"train_loss": -5.596720218658447, "global_step": 28012, "epoch": 666} {"train_loss": -5.430918841134934, "global_step": 28013, "epoch": 666, "val_loss": 64201.7265625} {"train_loss": -5.526947975158691, "global_step": 28014, "epoch": 667} {"train_loss": -5.351218223571777, "global_step": 28015, "epoch": 667} {"train_loss": -5.36849308013916, "global_step": 28016, "epoch": 667} {"train_loss": -5.481082916259766, "global_step": 28017, "epoch": 667} {"train_loss": -5.427177429199219, "global_step": 28018, "epoch": 667} {"train_loss": -5.425333499908447, "global_step": 28019, "epoch": 667} {"train_loss": -5.471329689025879, "global_step": 28020, "epoch": 667} {"train_loss": -5.3831682205200195, "global_step": 28021, "epoch": 667} {"train_loss": -5.3086066246032715, "global_step": 28022, "epoch": 667} {"train_loss": -5.379190921783447, "global_step": 28023, "epoch": 667} {"train_loss": -5.476421356201172, "global_step": 28024, "epoch": 667} {"train_loss": -5.345720291137695, "global_step": 28025, "epoch": 667} {"train_loss": -5.498678684234619, "global_step": 28026, "epoch": 667} {"train_loss": -5.410768508911133, "global_step": 28027, "epoch": 667} {"train_loss": -5.520417213439941, "global_step": 28028, "epoch": 667} {"train_loss": -5.384991645812988, "global_step": 28029, "epoch": 667} {"train_loss": -5.503691673278809, "global_step": 28030, "epoch": 667} {"train_loss": -5.466425895690918, "global_step": 28031, "epoch": 667} {"train_loss": -5.356546401977539, "global_step": 28032, "epoch": 667} {"train_loss": -5.508350372314453, "global_step": 28033, "epoch": 667} {"train_loss": -5.494945049285889, "global_step": 28034, "epoch": 667} {"train_loss": -5.3919148445129395, "global_step": 28035, "epoch": 667} {"train_loss": -5.386001110076904, "global_step": 28036, "epoch": 667} {"train_loss": -5.51146125793457, "global_step": 28037, "epoch": 667} {"train_loss": -5.4811601638793945, "global_step": 28038, "epoch": 667} {"train_loss": -5.407711029052734, "global_step": 28039, "epoch": 667} {"train_loss": -5.411515235900879, "global_step": 28040, "epoch": 667} {"train_loss": -5.462568759918213, "global_step": 28041, "epoch": 667} {"train_loss": -5.4389142990112305, "global_step": 28042, "epoch": 667} {"train_loss": -5.506734848022461, "global_step": 28043, "epoch": 667} {"train_loss": -5.4871320724487305, "global_step": 28044, "epoch": 667} {"train_loss": -5.5276899337768555, "global_step": 28045, "epoch": 667} {"train_loss": -5.516657829284668, "global_step": 28046, "epoch": 667} {"train_loss": -5.486767292022705, "global_step": 28047, "epoch": 667} {"train_loss": -5.570313453674316, "global_step": 28048, "epoch": 667} {"train_loss": -5.453993320465088, "global_step": 28049, "epoch": 667} {"train_loss": -5.585927963256836, "global_step": 28050, "epoch": 667} {"train_loss": -5.44220495223999, "global_step": 28051, "epoch": 667} {"train_loss": -5.468776702880859, "global_step": 28052, "epoch": 667} {"train_loss": -5.362492561340332, "global_step": 28053, "epoch": 667} {"train_loss": -5.354007720947266, "global_step": 28054, "epoch": 667} {"train_loss": -5.446208794911702, "global_step": 28055, "epoch": 667, "val_loss": 64292.95703125} {"train_loss": -5.482605457305908, "global_step": 28056, "epoch": 668} {"train_loss": -5.447370529174805, "global_step": 28057, "epoch": 668} {"train_loss": -5.613915920257568, "global_step": 28058, "epoch": 668} {"train_loss": -5.241517543792725, "global_step": 28059, "epoch": 668} {"train_loss": -5.494831562042236, "global_step": 28060, "epoch": 668} {"train_loss": -5.385073184967041, "global_step": 28061, "epoch": 668} {"train_loss": -5.410647392272949, "global_step": 28062, "epoch": 668} {"train_loss": -5.494941711425781, "global_step": 28063, "epoch": 668} {"train_loss": -5.355246543884277, "global_step": 28064, "epoch": 668} {"train_loss": -5.344548225402832, "global_step": 28065, "epoch": 668} {"train_loss": -5.432663917541504, "global_step": 28066, "epoch": 668} {"train_loss": -5.487321853637695, "global_step": 28067, "epoch": 668} {"train_loss": -5.399989604949951, "global_step": 28068, "epoch": 668} {"train_loss": -5.4264068603515625, "global_step": 28069, "epoch": 668} {"train_loss": -5.528048515319824, "global_step": 28070, "epoch": 668} {"train_loss": -5.495128154754639, "global_step": 28071, "epoch": 668} {"train_loss": -5.48731803894043, "global_step": 28072, "epoch": 668} {"train_loss": -5.407841205596924, "global_step": 28073, "epoch": 668} {"train_loss": -5.3368730545043945, "global_step": 28074, "epoch": 668} {"train_loss": -5.454617500305176, "global_step": 28075, "epoch": 668} {"train_loss": -5.307211875915527, "global_step": 28076, "epoch": 668} {"train_loss": -5.389736175537109, "global_step": 28077, "epoch": 668} {"train_loss": -5.575002193450928, "global_step": 28078, "epoch": 668} {"train_loss": -5.387094974517822, "global_step": 28079, "epoch": 668} {"train_loss": -5.534390449523926, "global_step": 28080, "epoch": 668} {"train_loss": -5.470900535583496, "global_step": 28081, "epoch": 668} {"train_loss": -5.461529731750488, "global_step": 28082, "epoch": 668} {"train_loss": -5.514599800109863, "global_step": 28083, "epoch": 668} {"train_loss": -5.532057762145996, "global_step": 28084, "epoch": 668} {"train_loss": -5.516811370849609, "global_step": 28085, "epoch": 668} {"train_loss": -5.30472993850708, "global_step": 28086, "epoch": 668} {"train_loss": -5.404747009277344, "global_step": 28087, "epoch": 668} {"train_loss": -5.355554580688477, "global_step": 28088, "epoch": 668} {"train_loss": -5.330350875854492, "global_step": 28089, "epoch": 668} {"train_loss": -5.310337543487549, "global_step": 28090, "epoch": 668} {"train_loss": -5.401032447814941, "global_step": 28091, "epoch": 668} {"train_loss": -5.465025901794434, "global_step": 28092, "epoch": 668} {"train_loss": -5.467887878417969, "global_step": 28093, "epoch": 668} {"train_loss": -5.376533508300781, "global_step": 28094, "epoch": 668} {"train_loss": -5.366303443908691, "global_step": 28095, "epoch": 668} {"train_loss": -5.525386333465576, "global_step": 28096, "epoch": 668} {"train_loss": -5.431065593447004, "global_step": 28097, "epoch": 668, "val_loss": 64289.546875} {"train_loss": -5.444136619567871, "global_step": 28098, "epoch": 669} {"train_loss": -5.4664459228515625, "global_step": 28099, "epoch": 669} {"train_loss": -5.4274797439575195, "global_step": 28100, "epoch": 669} {"train_loss": -5.418063640594482, "global_step": 28101, "epoch": 669} {"train_loss": -5.51910924911499, "global_step": 28102, "epoch": 669} {"train_loss": -5.418181419372559, "global_step": 28103, "epoch": 669} {"train_loss": -5.402678489685059, "global_step": 28104, "epoch": 669} {"train_loss": -5.581892013549805, "global_step": 28105, "epoch": 669} {"train_loss": -5.352394104003906, "global_step": 28106, "epoch": 669} {"train_loss": -5.339546203613281, "global_step": 28107, "epoch": 669} {"train_loss": -5.5857834815979, "global_step": 28108, "epoch": 669} {"train_loss": -5.354043483734131, "global_step": 28109, "epoch": 669} {"train_loss": -5.4760847091674805, "global_step": 28110, "epoch": 669} {"train_loss": -5.3273515701293945, "global_step": 28111, "epoch": 669} {"train_loss": -5.411218166351318, "global_step": 28112, "epoch": 669} {"train_loss": -5.491806983947754, "global_step": 28113, "epoch": 669} {"train_loss": -5.270224571228027, "global_step": 28114, "epoch": 669} {"train_loss": -5.44166374206543, "global_step": 28115, "epoch": 669} {"train_loss": -5.465337753295898, "global_step": 28116, "epoch": 669} {"train_loss": -5.320571422576904, "global_step": 28117, "epoch": 669} {"train_loss": -5.489079475402832, "global_step": 28118, "epoch": 669} {"train_loss": -5.316943645477295, "global_step": 28119, "epoch": 669} {"train_loss": -5.46259069442749, "global_step": 28120, "epoch": 669} {"train_loss": -5.393826961517334, "global_step": 28121, "epoch": 669} {"train_loss": -5.357431411743164, "global_step": 28122, "epoch": 669} {"train_loss": -5.440524578094482, "global_step": 28123, "epoch": 669} {"train_loss": -5.375773906707764, "global_step": 28124, "epoch": 669} {"train_loss": -5.442159175872803, "global_step": 28125, "epoch": 669} {"train_loss": -5.409224510192871, "global_step": 28126, "epoch": 669} {"train_loss": -5.360699653625488, "global_step": 28127, "epoch": 669} {"train_loss": -5.391756057739258, "global_step": 28128, "epoch": 669} {"train_loss": -5.432372093200684, "global_step": 28129, "epoch": 669} {"train_loss": -5.346584320068359, "global_step": 28130, "epoch": 669} {"train_loss": -5.4111480712890625, "global_step": 28131, "epoch": 669} {"train_loss": -5.5130181312561035, "global_step": 28132, "epoch": 669} {"train_loss": -5.496129989624023, "global_step": 28133, "epoch": 669} {"train_loss": -5.513632297515869, "global_step": 28134, "epoch": 669} {"train_loss": -5.348905086517334, "global_step": 28135, "epoch": 669} {"train_loss": -5.60498571395874, "global_step": 28136, "epoch": 669} {"train_loss": -5.391222953796387, "global_step": 28137, "epoch": 669} {"train_loss": -5.456758499145508, "global_step": 28138, "epoch": 669} {"train_loss": -5.425941421872094, "global_step": 28139, "epoch": 669, "val_loss": 63845.5625} {"train_loss": -5.459277153015137, "global_step": 28140, "epoch": 670} {"train_loss": -5.413415431976318, "global_step": 28141, "epoch": 670} {"train_loss": -5.482385635375977, "global_step": 28142, "epoch": 670} {"train_loss": -5.50221061706543, "global_step": 28143, "epoch": 670} {"train_loss": -5.391458034515381, "global_step": 28144, "epoch": 670} {"train_loss": -5.4159746170043945, "global_step": 28145, "epoch": 670} {"train_loss": -5.405235290527344, "global_step": 28146, "epoch": 670} {"train_loss": -5.637187957763672, "global_step": 28147, "epoch": 670} {"train_loss": -5.496951103210449, "global_step": 28148, "epoch": 670} {"train_loss": -5.469959259033203, "global_step": 28149, "epoch": 670} {"train_loss": -5.4459123611450195, "global_step": 28150, "epoch": 670} {"train_loss": -5.371007919311523, "global_step": 28151, "epoch": 670} {"train_loss": -5.530119895935059, "global_step": 28152, "epoch": 670} {"train_loss": -5.419321060180664, "global_step": 28153, "epoch": 670} {"train_loss": -5.383934020996094, "global_step": 28154, "epoch": 670} {"train_loss": -5.444479465484619, "global_step": 28155, "epoch": 670} {"train_loss": -5.379883289337158, "global_step": 28156, "epoch": 670} {"train_loss": -5.484149932861328, "global_step": 28157, "epoch": 670} {"train_loss": -5.374396324157715, "global_step": 28158, "epoch": 670} {"train_loss": -5.377022743225098, "global_step": 28159, "epoch": 670} {"train_loss": -5.413644790649414, "global_step": 28160, "epoch": 670} {"train_loss": -5.447845458984375, "global_step": 28161, "epoch": 670} {"train_loss": -5.45388126373291, "global_step": 28162, "epoch": 670} {"train_loss": -5.3629326820373535, "global_step": 28163, "epoch": 670} {"train_loss": -5.488551139831543, "global_step": 28164, "epoch": 670} {"train_loss": -5.485784530639648, "global_step": 28165, "epoch": 670} {"train_loss": -5.39993953704834, "global_step": 28166, "epoch": 670} {"train_loss": -5.503833770751953, "global_step": 28167, "epoch": 670} {"train_loss": -5.435103416442871, "global_step": 28168, "epoch": 670} {"train_loss": -5.316780090332031, "global_step": 28169, "epoch": 670} {"train_loss": -5.535412788391113, "global_step": 28170, "epoch": 670} {"train_loss": -5.219743251800537, "global_step": 28171, "epoch": 670} {"train_loss": -5.497319221496582, "global_step": 28172, "epoch": 670} {"train_loss": -5.603731155395508, "global_step": 28173, "epoch": 670} {"train_loss": -5.402090549468994, "global_step": 28174, "epoch": 670} {"train_loss": -5.4001569747924805, "global_step": 28175, "epoch": 670} {"train_loss": -5.319297790527344, "global_step": 28176, "epoch": 670} {"train_loss": -5.485152721405029, "global_step": 28177, "epoch": 670} {"train_loss": -5.484929084777832, "global_step": 28178, "epoch": 670} {"train_loss": -5.437170028686523, "global_step": 28179, "epoch": 670} {"train_loss": -5.56950569152832, "global_step": 28180, "epoch": 670} {"train_loss": -5.441682395480928, "global_step": 28181, "epoch": 670, "val_loss": 63985.09765625} {"train_loss": -5.472440719604492, "global_step": 28182, "epoch": 671} {"train_loss": -5.544919490814209, "global_step": 28183, "epoch": 671} {"train_loss": -5.439850330352783, "global_step": 28184, "epoch": 671} {"train_loss": -5.399049758911133, "global_step": 28185, "epoch": 671} {"train_loss": -5.553191661834717, "global_step": 28186, "epoch": 671} {"train_loss": -5.450522422790527, "global_step": 28187, "epoch": 671} {"train_loss": -5.297910213470459, "global_step": 28188, "epoch": 671} {"train_loss": -5.41180419921875, "global_step": 28189, "epoch": 671} {"train_loss": -5.4207682609558105, "global_step": 28190, "epoch": 671} {"train_loss": -5.391529083251953, "global_step": 28191, "epoch": 671} {"train_loss": -5.388714790344238, "global_step": 28192, "epoch": 671} {"train_loss": -5.339376926422119, "global_step": 28193, "epoch": 671} {"train_loss": -5.408449172973633, "global_step": 28194, "epoch": 671} {"train_loss": -5.555553436279297, "global_step": 28195, "epoch": 671} {"train_loss": -5.503339767456055, "global_step": 28196, "epoch": 671} {"train_loss": -5.354227542877197, "global_step": 28197, "epoch": 671} {"train_loss": -5.453921318054199, "global_step": 28198, "epoch": 671} {"train_loss": -5.4015727043151855, "global_step": 28199, "epoch": 671} {"train_loss": -5.438532829284668, "global_step": 28200, "epoch": 671} {"train_loss": -5.477081775665283, "global_step": 28201, "epoch": 671} {"train_loss": -5.245680332183838, "global_step": 28202, "epoch": 671} {"train_loss": -5.491028308868408, "global_step": 28203, "epoch": 671} {"train_loss": -5.392901420593262, "global_step": 28204, "epoch": 671} {"train_loss": -5.432186603546143, "global_step": 28205, "epoch": 671} {"train_loss": -5.389993667602539, "global_step": 28206, "epoch": 671} {"train_loss": -5.399696350097656, "global_step": 28207, "epoch": 671} {"train_loss": -5.529479503631592, "global_step": 28208, "epoch": 671} {"train_loss": -5.409420013427734, "global_step": 28209, "epoch": 671} {"train_loss": -5.382662296295166, "global_step": 28210, "epoch": 671} {"train_loss": -5.458375453948975, "global_step": 28211, "epoch": 671} {"train_loss": -5.472248554229736, "global_step": 28212, "epoch": 671} {"train_loss": -5.4887800216674805, "global_step": 28213, "epoch": 671} {"train_loss": -5.547794342041016, "global_step": 28214, "epoch": 671} {"train_loss": -5.56281042098999, "global_step": 28215, "epoch": 671} {"train_loss": -5.302091121673584, "global_step": 28216, "epoch": 671} {"train_loss": -5.483744144439697, "global_step": 28217, "epoch": 671} {"train_loss": -5.508499622344971, "global_step": 28218, "epoch": 671} {"train_loss": -5.442031383514404, "global_step": 28219, "epoch": 671} {"train_loss": -5.532248020172119, "global_step": 28220, "epoch": 671} {"train_loss": -5.477877616882324, "global_step": 28221, "epoch": 671} {"train_loss": -5.4880690574646, "global_step": 28222, "epoch": 671} {"train_loss": -5.44015866234189, "global_step": 28223, "epoch": 671, "val_loss": 63839.04296875} {"train_loss": -5.5192766189575195, "global_step": 28224, "epoch": 672} {"train_loss": -5.471258163452148, "global_step": 28225, "epoch": 672} {"train_loss": -5.362969875335693, "global_step": 28226, "epoch": 672} {"train_loss": -5.396345138549805, "global_step": 28227, "epoch": 672} {"train_loss": -5.362720489501953, "global_step": 28228, "epoch": 672} {"train_loss": -5.382198333740234, "global_step": 28229, "epoch": 672} {"train_loss": -5.362723350524902, "global_step": 28230, "epoch": 672} {"train_loss": -5.433958053588867, "global_step": 28231, "epoch": 672} {"train_loss": -5.461508750915527, "global_step": 28232, "epoch": 672} {"train_loss": -5.5464324951171875, "global_step": 28233, "epoch": 672} {"train_loss": -5.4397687911987305, "global_step": 28234, "epoch": 672} {"train_loss": -5.399287223815918, "global_step": 28235, "epoch": 672} {"train_loss": -5.41194486618042, "global_step": 28236, "epoch": 672} {"train_loss": -5.498978614807129, "global_step": 28237, "epoch": 672} {"train_loss": -5.455384731292725, "global_step": 28238, "epoch": 672} {"train_loss": -5.402176856994629, "global_step": 28239, "epoch": 672} {"train_loss": -5.517322540283203, "global_step": 28240, "epoch": 672} {"train_loss": -5.3581085205078125, "global_step": 28241, "epoch": 672} {"train_loss": -5.424264430999756, "global_step": 28242, "epoch": 672} {"train_loss": -5.37161111831665, "global_step": 28243, "epoch": 672} {"train_loss": -5.355551719665527, "global_step": 28244, "epoch": 672} {"train_loss": -5.404581069946289, "global_step": 28245, "epoch": 672} {"train_loss": -5.437971115112305, "global_step": 28246, "epoch": 672} {"train_loss": -5.3398637771606445, "global_step": 28247, "epoch": 672} {"train_loss": -5.418673038482666, "global_step": 28248, "epoch": 672} {"train_loss": -5.435849189758301, "global_step": 28249, "epoch": 672} {"train_loss": -5.39643669128418, "global_step": 28250, "epoch": 672} {"train_loss": -5.456746578216553, "global_step": 28251, "epoch": 672} {"train_loss": -5.478096961975098, "global_step": 28252, "epoch": 672} {"train_loss": -5.424670219421387, "global_step": 28253, "epoch": 672} {"train_loss": -5.375789642333984, "global_step": 28254, "epoch": 672} {"train_loss": -5.416747093200684, "global_step": 28255, "epoch": 672} {"train_loss": -5.373767375946045, "global_step": 28256, "epoch": 672} {"train_loss": -5.406034469604492, "global_step": 28257, "epoch": 672} {"train_loss": -5.47928524017334, "global_step": 28258, "epoch": 672} {"train_loss": -5.406583786010742, "global_step": 28259, "epoch": 672} {"train_loss": -5.429143905639648, "global_step": 28260, "epoch": 672} {"train_loss": -5.450218200683594, "global_step": 28261, "epoch": 672} {"train_loss": -5.309945106506348, "global_step": 28262, "epoch": 672} {"train_loss": -5.422347068786621, "global_step": 28263, "epoch": 672} {"train_loss": -5.506012916564941, "global_step": 28264, "epoch": 672} {"train_loss": -5.419450214930943, "global_step": 28265, "epoch": 672, "val_loss": 64042.33984375} {"train_loss": -5.471322059631348, "global_step": 28266, "epoch": 673} {"train_loss": -5.400057315826416, "global_step": 28267, "epoch": 673} {"train_loss": -5.390459060668945, "global_step": 28268, "epoch": 673} {"train_loss": -5.415404796600342, "global_step": 28269, "epoch": 673} {"train_loss": -5.366689682006836, "global_step": 28270, "epoch": 673} {"train_loss": -5.33608341217041, "global_step": 28271, "epoch": 673} {"train_loss": -5.4629058837890625, "global_step": 28272, "epoch": 673} {"train_loss": -5.415461540222168, "global_step": 28273, "epoch": 673} {"train_loss": -5.417929649353027, "global_step": 28274, "epoch": 673} {"train_loss": -5.420022010803223, "global_step": 28275, "epoch": 673} {"train_loss": -5.4779276847839355, "global_step": 28276, "epoch": 673} {"train_loss": -5.419914245605469, "global_step": 28277, "epoch": 673} {"train_loss": -5.447438716888428, "global_step": 28278, "epoch": 673} {"train_loss": -5.346892356872559, "global_step": 28279, "epoch": 673} {"train_loss": -5.5181660652160645, "global_step": 28280, "epoch": 673} {"train_loss": -5.5092315673828125, "global_step": 28281, "epoch": 673} {"train_loss": -5.452765464782715, "global_step": 28282, "epoch": 673} {"train_loss": -5.426542282104492, "global_step": 28283, "epoch": 673} {"train_loss": -5.4804277420043945, "global_step": 28284, "epoch": 673} {"train_loss": -5.469366073608398, "global_step": 28285, "epoch": 673} {"train_loss": -5.425030708312988, "global_step": 28286, "epoch": 673} {"train_loss": -5.516866683959961, "global_step": 28287, "epoch": 673} {"train_loss": -5.454158306121826, "global_step": 28288, "epoch": 673} {"train_loss": -5.433523178100586, "global_step": 28289, "epoch": 673} {"train_loss": -5.531318664550781, "global_step": 28290, "epoch": 673} {"train_loss": -5.48051643371582, "global_step": 28291, "epoch": 673} {"train_loss": -5.432271957397461, "global_step": 28292, "epoch": 673} {"train_loss": -5.30825138092041, "global_step": 28293, "epoch": 673} {"train_loss": -5.395510673522949, "global_step": 28294, "epoch": 673} {"train_loss": -5.550897598266602, "global_step": 28295, "epoch": 673} {"train_loss": -5.437849998474121, "global_step": 28296, "epoch": 673} {"train_loss": -5.4882049560546875, "global_step": 28297, "epoch": 673} {"train_loss": -5.462949752807617, "global_step": 28298, "epoch": 673} {"train_loss": -5.402463912963867, "global_step": 28299, "epoch": 673} {"train_loss": -5.423825263977051, "global_step": 28300, "epoch": 673} {"train_loss": -5.481747627258301, "global_step": 28301, "epoch": 673} {"train_loss": -5.518746376037598, "global_step": 28302, "epoch": 673} {"train_loss": -5.319760322570801, "global_step": 28303, "epoch": 673} {"train_loss": -5.422638416290283, "global_step": 28304, "epoch": 673} {"train_loss": -5.431088447570801, "global_step": 28305, "epoch": 673} {"train_loss": -5.57049560546875, "global_step": 28306, "epoch": 673} {"train_loss": -5.441700526646206, "global_step": 28307, "epoch": 673, "val_loss": 63831.9140625} {"train_loss": -5.49542760848999, "global_step": 28308, "epoch": 674} {"train_loss": -5.510785102844238, "global_step": 28309, "epoch": 674} {"train_loss": -5.433584213256836, "global_step": 28310, "epoch": 674} {"train_loss": -5.57131290435791, "global_step": 28311, "epoch": 674} {"train_loss": -5.413117408752441, "global_step": 28312, "epoch": 674} {"train_loss": -5.631318092346191, "global_step": 28313, "epoch": 674} {"train_loss": -5.471604347229004, "global_step": 28314, "epoch": 674} {"train_loss": -5.422255516052246, "global_step": 28315, "epoch": 674} {"train_loss": -5.527609825134277, "global_step": 28316, "epoch": 674} {"train_loss": -5.347932815551758, "global_step": 28317, "epoch": 674} {"train_loss": -5.403825283050537, "global_step": 28318, "epoch": 674} {"train_loss": -5.411750793457031, "global_step": 28319, "epoch": 674} {"train_loss": -5.380334854125977, "global_step": 28320, "epoch": 674} {"train_loss": -5.409417629241943, "global_step": 28321, "epoch": 674} {"train_loss": -5.338900566101074, "global_step": 28322, "epoch": 674} {"train_loss": -5.409592628479004, "global_step": 28323, "epoch": 674} {"train_loss": -5.299448013305664, "global_step": 28324, "epoch": 674} {"train_loss": -5.410000801086426, "global_step": 28325, "epoch": 674} {"train_loss": -5.526450157165527, "global_step": 28326, "epoch": 674} {"train_loss": -5.4141058921813965, "global_step": 28327, "epoch": 674} {"train_loss": -5.423496246337891, "global_step": 28328, "epoch": 674} {"train_loss": -5.5888261795043945, "global_step": 28329, "epoch": 674} {"train_loss": -5.460951805114746, "global_step": 28330, "epoch": 674} {"train_loss": -5.389336109161377, "global_step": 28331, "epoch": 674} {"train_loss": -5.470847129821777, "global_step": 28332, "epoch": 674} {"train_loss": -5.477995872497559, "global_step": 28333, "epoch": 674} {"train_loss": -5.484469413757324, "global_step": 28334, "epoch": 674} {"train_loss": -5.517079830169678, "global_step": 28335, "epoch": 674} {"train_loss": -5.527199745178223, "global_step": 28336, "epoch": 674} {"train_loss": -5.515822410583496, "global_step": 28337, "epoch": 674} {"train_loss": -5.412058353424072, "global_step": 28338, "epoch": 674} {"train_loss": -5.403120040893555, "global_step": 28339, "epoch": 674} {"train_loss": -5.470232963562012, "global_step": 28340, "epoch": 674} {"train_loss": -5.359801769256592, "global_step": 28341, "epoch": 674} {"train_loss": -5.325339317321777, "global_step": 28342, "epoch": 674} {"train_loss": -5.519335746765137, "global_step": 28343, "epoch": 674} {"train_loss": -5.412811756134033, "global_step": 28344, "epoch": 674} {"train_loss": -5.397953987121582, "global_step": 28345, "epoch": 674} {"train_loss": -5.45155668258667, "global_step": 28346, "epoch": 674} {"train_loss": -5.530072212219238, "global_step": 28347, "epoch": 674} {"train_loss": -5.375205993652344, "global_step": 28348, "epoch": 674} {"train_loss": -5.445430914560954, "global_step": 28349, "epoch": 674, "val_loss": 63921.14453125} {"train_loss": -5.3374481201171875, "global_step": 28350, "epoch": 675} {"train_loss": -5.4798736572265625, "global_step": 28351, "epoch": 675} {"train_loss": -5.437009334564209, "global_step": 28352, "epoch": 675} {"train_loss": -5.375374794006348, "global_step": 28353, "epoch": 675} {"train_loss": -5.626716613769531, "global_step": 28354, "epoch": 675} {"train_loss": -5.542649269104004, "global_step": 28355, "epoch": 675} {"train_loss": -5.484063148498535, "global_step": 28356, "epoch": 675} {"train_loss": -5.372552394866943, "global_step": 28357, "epoch": 675} {"train_loss": -5.436190128326416, "global_step": 28358, "epoch": 675} {"train_loss": -5.364188194274902, "global_step": 28359, "epoch": 675} {"train_loss": -5.4954047203063965, "global_step": 28360, "epoch": 675} {"train_loss": -5.512240409851074, "global_step": 28361, "epoch": 675} {"train_loss": -5.441996097564697, "global_step": 28362, "epoch": 675} {"train_loss": -5.468382358551025, "global_step": 28363, "epoch": 675} {"train_loss": -5.418407440185547, "global_step": 28364, "epoch": 675} {"train_loss": -5.4940571784973145, "global_step": 28365, "epoch": 675} {"train_loss": -5.403196811676025, "global_step": 28366, "epoch": 675} {"train_loss": -5.508813381195068, "global_step": 28367, "epoch": 675} {"train_loss": -5.437240123748779, "global_step": 28368, "epoch": 675} {"train_loss": -5.411029815673828, "global_step": 28369, "epoch": 675} {"train_loss": -5.558279037475586, "global_step": 28370, "epoch": 675} {"train_loss": -5.492133617401123, "global_step": 28371, "epoch": 675} {"train_loss": -5.618009090423584, "global_step": 28372, "epoch": 675} {"train_loss": -5.354553699493408, "global_step": 28373, "epoch": 675} {"train_loss": -5.412173748016357, "global_step": 28374, "epoch": 675} {"train_loss": -5.375572204589844, "global_step": 28375, "epoch": 675} {"train_loss": -5.218229293823242, "global_step": 28376, "epoch": 675} {"train_loss": -5.560946941375732, "global_step": 28377, "epoch": 675} {"train_loss": -5.412448883056641, "global_step": 28378, "epoch": 675} {"train_loss": -5.22453498840332, "global_step": 28379, "epoch": 675} {"train_loss": -5.3681511878967285, "global_step": 28380, "epoch": 675} {"train_loss": -5.438704967498779, "global_step": 28381, "epoch": 675} {"train_loss": -5.221784591674805, "global_step": 28382, "epoch": 675} {"train_loss": -5.521737098693848, "global_step": 28383, "epoch": 675} {"train_loss": -5.36521053314209, "global_step": 28384, "epoch": 675} {"train_loss": -5.405992031097412, "global_step": 28385, "epoch": 675} {"train_loss": -5.236064910888672, "global_step": 28386, "epoch": 675} {"train_loss": -5.413209438323975, "global_step": 28387, "epoch": 675} {"train_loss": -5.474465847015381, "global_step": 28388, "epoch": 675} {"train_loss": -5.373367786407471, "global_step": 28389, "epoch": 675} {"train_loss": -5.458892345428467, "global_step": 28390, "epoch": 675} {"train_loss": -5.428222826548985, "global_step": 28391, "epoch": 675, "val_loss": 64463.72265625} {"train_loss": -5.37546443939209, "global_step": 28392, "epoch": 676} {"train_loss": -5.364070892333984, "global_step": 28393, "epoch": 676} {"train_loss": -5.285321235656738, "global_step": 28394, "epoch": 676} {"train_loss": -5.592288494110107, "global_step": 28395, "epoch": 676} {"train_loss": -5.38895320892334, "global_step": 28396, "epoch": 676} {"train_loss": -5.39398193359375, "global_step": 28397, "epoch": 676} {"train_loss": -5.484270095825195, "global_step": 28398, "epoch": 676} {"train_loss": -5.346909999847412, "global_step": 28399, "epoch": 676} {"train_loss": -5.543520927429199, "global_step": 28400, "epoch": 676} {"train_loss": -5.486855506896973, "global_step": 28401, "epoch": 676} {"train_loss": -5.223085880279541, "global_step": 28402, "epoch": 676} {"train_loss": -5.457214832305908, "global_step": 28403, "epoch": 676} {"train_loss": -5.437419891357422, "global_step": 28404, "epoch": 676} {"train_loss": -5.28138542175293, "global_step": 28405, "epoch": 676} {"train_loss": -5.412139892578125, "global_step": 28406, "epoch": 676} {"train_loss": -5.338892936706543, "global_step": 28407, "epoch": 676} {"train_loss": -5.338476181030273, "global_step": 28408, "epoch": 676} {"train_loss": -5.414301872253418, "global_step": 28409, "epoch": 676} {"train_loss": -5.363964080810547, "global_step": 28410, "epoch": 676} {"train_loss": -5.336784362792969, "global_step": 28411, "epoch": 676} {"train_loss": -5.456169128417969, "global_step": 28412, "epoch": 676} {"train_loss": -5.149179458618164, "global_step": 28413, "epoch": 676} {"train_loss": -5.33104133605957, "global_step": 28414, "epoch": 676} {"train_loss": -5.397401809692383, "global_step": 28415, "epoch": 676} {"train_loss": -5.237840175628662, "global_step": 28416, "epoch": 676} {"train_loss": -5.494169235229492, "global_step": 28417, "epoch": 676} {"train_loss": -5.4885101318359375, "global_step": 28418, "epoch": 676} {"train_loss": -5.413175106048584, "global_step": 28419, "epoch": 676} {"train_loss": -5.393642425537109, "global_step": 28420, "epoch": 676} {"train_loss": -5.3860063552856445, "global_step": 28421, "epoch": 676} {"train_loss": -5.473031044006348, "global_step": 28422, "epoch": 676} {"train_loss": -5.3506269454956055, "global_step": 28423, "epoch": 676} {"train_loss": -5.386575222015381, "global_step": 28424, "epoch": 676} {"train_loss": -5.34756326675415, "global_step": 28425, "epoch": 676} {"train_loss": -5.312894344329834, "global_step": 28426, "epoch": 676} {"train_loss": -5.51816463470459, "global_step": 28427, "epoch": 676} {"train_loss": -5.453749656677246, "global_step": 28428, "epoch": 676} {"train_loss": -5.565652847290039, "global_step": 28429, "epoch": 676} {"train_loss": -5.380971908569336, "global_step": 28430, "epoch": 676} {"train_loss": -5.428224086761475, "global_step": 28431, "epoch": 676} {"train_loss": -5.367295742034912, "global_step": 28432, "epoch": 676} {"train_loss": -5.3968433652605325, "global_step": 28433, "epoch": 676, "val_loss": 63555.98046875} {"train_loss": -5.569003582000732, "global_step": 28434, "epoch": 677} {"train_loss": -5.450979232788086, "global_step": 28435, "epoch": 677} {"train_loss": -5.476722240447998, "global_step": 28436, "epoch": 677} {"train_loss": -5.496372222900391, "global_step": 28437, "epoch": 677} {"train_loss": -5.468782424926758, "global_step": 28438, "epoch": 677} {"train_loss": -5.161920070648193, "global_step": 28439, "epoch": 677} {"train_loss": -5.510959148406982, "global_step": 28440, "epoch": 677} {"train_loss": -5.530799865722656, "global_step": 28441, "epoch": 677} {"train_loss": -5.365601539611816, "global_step": 28442, "epoch": 677} {"train_loss": -5.554116249084473, "global_step": 28443, "epoch": 677} {"train_loss": -5.294079303741455, "global_step": 28444, "epoch": 677} {"train_loss": -5.481942176818848, "global_step": 28445, "epoch": 677} {"train_loss": -5.445394992828369, "global_step": 28446, "epoch": 677} {"train_loss": -5.278149604797363, "global_step": 28447, "epoch": 677} {"train_loss": -5.373780727386475, "global_step": 28448, "epoch": 677} {"train_loss": -5.565158843994141, "global_step": 28449, "epoch": 677} {"train_loss": -5.4558563232421875, "global_step": 28450, "epoch": 677} {"train_loss": -5.535244464874268, "global_step": 28451, "epoch": 677} {"train_loss": -5.5324530601501465, "global_step": 28452, "epoch": 677} {"train_loss": -5.575200080871582, "global_step": 28453, "epoch": 677} {"train_loss": -5.411147594451904, "global_step": 28454, "epoch": 677} {"train_loss": -5.423632621765137, "global_step": 28455, "epoch": 677} {"train_loss": -5.438492774963379, "global_step": 28456, "epoch": 677} {"train_loss": -5.534812927246094, "global_step": 28457, "epoch": 677} {"train_loss": -5.568595886230469, "global_step": 28458, "epoch": 677} {"train_loss": -5.52567195892334, "global_step": 28459, "epoch": 677} {"train_loss": -5.4436750411987305, "global_step": 28460, "epoch": 677} {"train_loss": -5.466839790344238, "global_step": 28461, "epoch": 677} {"train_loss": -5.488977909088135, "global_step": 28462, "epoch": 677} {"train_loss": -5.4859161376953125, "global_step": 28463, "epoch": 677} {"train_loss": -5.376224994659424, "global_step": 28464, "epoch": 677} {"train_loss": -5.410252571105957, "global_step": 28465, "epoch": 677} {"train_loss": -5.359638690948486, "global_step": 28466, "epoch": 677} {"train_loss": -5.50358772277832, "global_step": 28467, "epoch": 677} {"train_loss": -5.355008125305176, "global_step": 28468, "epoch": 677} {"train_loss": -5.455146789550781, "global_step": 28469, "epoch": 677} {"train_loss": -5.418489456176758, "global_step": 28470, "epoch": 677} {"train_loss": -5.505358695983887, "global_step": 28471, "epoch": 677} {"train_loss": -5.5666399002075195, "global_step": 28472, "epoch": 677} {"train_loss": -5.461061477661133, "global_step": 28473, "epoch": 677} {"train_loss": -5.5187249183654785, "global_step": 28474, "epoch": 677} {"train_loss": -5.457796051388695, "global_step": 28475, "epoch": 677, "val_loss": 63707.2890625} {"train_loss": -5.526211261749268, "global_step": 28476, "epoch": 678} {"train_loss": -5.525767803192139, "global_step": 28477, "epoch": 678} {"train_loss": -5.595587253570557, "global_step": 28478, "epoch": 678} {"train_loss": -5.435203552246094, "global_step": 28479, "epoch": 678} {"train_loss": -5.441730976104736, "global_step": 28480, "epoch": 678} {"train_loss": -5.392555236816406, "global_step": 28481, "epoch": 678} {"train_loss": -5.463761329650879, "global_step": 28482, "epoch": 678} {"train_loss": -5.285764694213867, "global_step": 28483, "epoch": 678} {"train_loss": -5.313477516174316, "global_step": 28484, "epoch": 678} {"train_loss": -5.521241664886475, "global_step": 28485, "epoch": 678} {"train_loss": -5.437858581542969, "global_step": 28486, "epoch": 678} {"train_loss": -5.467019081115723, "global_step": 28487, "epoch": 678} {"train_loss": -5.512388229370117, "global_step": 28488, "epoch": 678} {"train_loss": -5.287720680236816, "global_step": 28489, "epoch": 678} {"train_loss": -5.594940662384033, "global_step": 28490, "epoch": 678} {"train_loss": -5.389366149902344, "global_step": 28491, "epoch": 678} {"train_loss": -5.643173694610596, "global_step": 28492, "epoch": 678} {"train_loss": -5.412869453430176, "global_step": 28493, "epoch": 678} {"train_loss": -5.374303817749023, "global_step": 28494, "epoch": 678} {"train_loss": -5.411199569702148, "global_step": 28495, "epoch": 678} {"train_loss": -5.494622707366943, "global_step": 28496, "epoch": 678} {"train_loss": -5.507619380950928, "global_step": 28497, "epoch": 678} {"train_loss": -5.377384185791016, "global_step": 28498, "epoch": 678} {"train_loss": -5.4909467697143555, "global_step": 28499, "epoch": 678} {"train_loss": -5.445126533508301, "global_step": 28500, "epoch": 678} {"train_loss": -5.472780227661133, "global_step": 28501, "epoch": 678} {"train_loss": -5.4328742027282715, "global_step": 28502, "epoch": 678} {"train_loss": -5.430548667907715, "global_step": 28503, "epoch": 678} {"train_loss": -5.476958751678467, "global_step": 28504, "epoch": 678} {"train_loss": -5.499902248382568, "global_step": 28505, "epoch": 678} {"train_loss": -5.421236991882324, "global_step": 28506, "epoch": 678} {"train_loss": -5.375617980957031, "global_step": 28507, "epoch": 678} {"train_loss": -5.354475021362305, "global_step": 28508, "epoch": 678} {"train_loss": -5.4469709396362305, "global_step": 28509, "epoch": 678} {"train_loss": -5.576557636260986, "global_step": 28510, "epoch": 678} {"train_loss": -5.497529983520508, "global_step": 28511, "epoch": 678} {"train_loss": -5.357551097869873, "global_step": 28512, "epoch": 678} {"train_loss": -5.446648597717285, "global_step": 28513, "epoch": 678} {"train_loss": -5.501736640930176, "global_step": 28514, "epoch": 678} {"train_loss": -5.473544120788574, "global_step": 28515, "epoch": 678} {"train_loss": -5.4426589012146, "global_step": 28516, "epoch": 678} {"train_loss": -5.454043785730998, "global_step": 28517, "epoch": 678, "val_loss": 63717.515625} {"train_loss": -5.445599555969238, "global_step": 28518, "epoch": 679} {"train_loss": -5.433527946472168, "global_step": 28519, "epoch": 679} {"train_loss": -5.482049942016602, "global_step": 28520, "epoch": 679} {"train_loss": -5.461793422698975, "global_step": 28521, "epoch": 679} {"train_loss": -5.472831726074219, "global_step": 28522, "epoch": 679} {"train_loss": -5.5342302322387695, "global_step": 28523, "epoch": 679} {"train_loss": -5.555635452270508, "global_step": 28524, "epoch": 679} {"train_loss": -5.523130893707275, "global_step": 28525, "epoch": 679} {"train_loss": -5.512949466705322, "global_step": 28526, "epoch": 679} {"train_loss": -5.524762153625488, "global_step": 28527, "epoch": 679} {"train_loss": -5.426671981811523, "global_step": 28528, "epoch": 679} {"train_loss": -5.556941032409668, "global_step": 28529, "epoch": 679} {"train_loss": -5.4025115966796875, "global_step": 28530, "epoch": 679} {"train_loss": -5.4944562911987305, "global_step": 28531, "epoch": 679} {"train_loss": -5.485555648803711, "global_step": 28532, "epoch": 679} {"train_loss": -5.486193656921387, "global_step": 28533, "epoch": 679} {"train_loss": -5.515972137451172, "global_step": 28534, "epoch": 679} {"train_loss": -5.426015853881836, "global_step": 28535, "epoch": 679} {"train_loss": -5.592177391052246, "global_step": 28536, "epoch": 679} {"train_loss": -5.430037498474121, "global_step": 28537, "epoch": 679} {"train_loss": -5.332779884338379, "global_step": 28538, "epoch": 679} {"train_loss": -5.428377151489258, "global_step": 28539, "epoch": 679} {"train_loss": -5.559183120727539, "global_step": 28540, "epoch": 679} {"train_loss": -5.525196075439453, "global_step": 28541, "epoch": 679} {"train_loss": -5.423135280609131, "global_step": 28542, "epoch": 679} {"train_loss": -5.507504940032959, "global_step": 28543, "epoch": 679} {"train_loss": -5.606281757354736, "global_step": 28544, "epoch": 679} {"train_loss": -5.454468727111816, "global_step": 28545, "epoch": 679} {"train_loss": -5.37773323059082, "global_step": 28546, "epoch": 679} {"train_loss": -5.324650287628174, "global_step": 28547, "epoch": 679} {"train_loss": -5.481074810028076, "global_step": 28548, "epoch": 679} {"train_loss": -5.3794169425964355, "global_step": 28549, "epoch": 679} {"train_loss": -5.3927083015441895, "global_step": 28550, "epoch": 679} {"train_loss": -5.462265968322754, "global_step": 28551, "epoch": 679} {"train_loss": -5.408224105834961, "global_step": 28552, "epoch": 679} {"train_loss": -5.45482063293457, "global_step": 28553, "epoch": 679} {"train_loss": -5.440389156341553, "global_step": 28554, "epoch": 679} {"train_loss": -5.456225395202637, "global_step": 28555, "epoch": 679} {"train_loss": -5.4720611572265625, "global_step": 28556, "epoch": 679} {"train_loss": -5.4729719161987305, "global_step": 28557, "epoch": 679} {"train_loss": -5.445094108581543, "global_step": 28558, "epoch": 679} {"train_loss": -5.466764574959164, "global_step": 28559, "epoch": 679, "val_loss": 64096.85546875} {"train_loss": -5.306214332580566, "global_step": 28560, "epoch": 680} {"train_loss": -5.455672264099121, "global_step": 28561, "epoch": 680} {"train_loss": -5.353032112121582, "global_step": 28562, "epoch": 680} {"train_loss": -5.223234176635742, "global_step": 28563, "epoch": 680} {"train_loss": -5.5189619064331055, "global_step": 28564, "epoch": 680} {"train_loss": -5.345991611480713, "global_step": 28565, "epoch": 680} {"train_loss": -5.288463592529297, "global_step": 28566, "epoch": 680} {"train_loss": -5.431860446929932, "global_step": 28567, "epoch": 680} {"train_loss": -5.43916130065918, "global_step": 28568, "epoch": 680} {"train_loss": -5.358221054077148, "global_step": 28569, "epoch": 680} {"train_loss": -5.368283271789551, "global_step": 28570, "epoch": 680} {"train_loss": -5.385776519775391, "global_step": 28571, "epoch": 680} {"train_loss": -5.3180036544799805, "global_step": 28572, "epoch": 680} {"train_loss": -5.400777816772461, "global_step": 28573, "epoch": 680} {"train_loss": -5.412118911743164, "global_step": 28574, "epoch": 680} {"train_loss": -5.421621322631836, "global_step": 28575, "epoch": 680} {"train_loss": -5.38279914855957, "global_step": 28576, "epoch": 680} {"train_loss": -5.407650947570801, "global_step": 28577, "epoch": 680} {"train_loss": -5.407999515533447, "global_step": 28578, "epoch": 680} {"train_loss": -5.4465131759643555, "global_step": 28579, "epoch": 680} {"train_loss": -5.495204925537109, "global_step": 28580, "epoch": 680} {"train_loss": -5.318392276763916, "global_step": 28581, "epoch": 680} {"train_loss": -5.575388431549072, "global_step": 28582, "epoch": 680} {"train_loss": -5.502391815185547, "global_step": 28583, "epoch": 680} {"train_loss": -5.533175945281982, "global_step": 28584, "epoch": 680} {"train_loss": -5.4562668800354, "global_step": 28585, "epoch": 680} {"train_loss": -5.470769882202148, "global_step": 28586, "epoch": 680} {"train_loss": -5.5031561851501465, "global_step": 28587, "epoch": 680} {"train_loss": -5.489007949829102, "global_step": 28588, "epoch": 680} {"train_loss": -5.36337947845459, "global_step": 28589, "epoch": 680} {"train_loss": -5.618374824523926, "global_step": 28590, "epoch": 680} {"train_loss": -5.448622226715088, "global_step": 28591, "epoch": 680} {"train_loss": -5.490120887756348, "global_step": 28592, "epoch": 680} {"train_loss": -5.409786701202393, "global_step": 28593, "epoch": 680} {"train_loss": -5.339850902557373, "global_step": 28594, "epoch": 680} {"train_loss": -5.394439220428467, "global_step": 28595, "epoch": 680} {"train_loss": -5.498762130737305, "global_step": 28596, "epoch": 680} {"train_loss": -5.559685707092285, "global_step": 28597, "epoch": 680} {"train_loss": -5.504853248596191, "global_step": 28598, "epoch": 680} {"train_loss": -5.591451644897461, "global_step": 28599, "epoch": 680} {"train_loss": -5.473431587219238, "global_step": 28600, "epoch": 680} {"train_loss": -5.43274280003139, "global_step": 28601, "epoch": 680, "val_loss": 63512.953125} {"train_loss": -5.520697593688965, "global_step": 28602, "epoch": 681} {"train_loss": -5.562910556793213, "global_step": 28603, "epoch": 681} {"train_loss": -5.517089366912842, "global_step": 28604, "epoch": 681} {"train_loss": -5.521602630615234, "global_step": 28605, "epoch": 681} {"train_loss": -5.591046333312988, "global_step": 28606, "epoch": 681} {"train_loss": -5.46733283996582, "global_step": 28607, "epoch": 681} {"train_loss": -5.465630531311035, "global_step": 28608, "epoch": 681} {"train_loss": -5.383973121643066, "global_step": 28609, "epoch": 681} {"train_loss": -5.422959327697754, "global_step": 28610, "epoch": 681} {"train_loss": -5.387057781219482, "global_step": 28611, "epoch": 681} {"train_loss": -5.4403076171875, "global_step": 28612, "epoch": 681} {"train_loss": -5.659995079040527, "global_step": 28613, "epoch": 681} {"train_loss": -5.374961853027344, "global_step": 28614, "epoch": 681} {"train_loss": -5.488807201385498, "global_step": 28615, "epoch": 681} {"train_loss": -5.381699085235596, "global_step": 28616, "epoch": 681} {"train_loss": -5.70308780670166, "global_step": 28617, "epoch": 681} {"train_loss": -5.4219794273376465, "global_step": 28618, "epoch": 681} {"train_loss": -5.418645858764648, "global_step": 28619, "epoch": 681} {"train_loss": -5.560820579528809, "global_step": 28620, "epoch": 681} {"train_loss": -5.323397159576416, "global_step": 28621, "epoch": 681} {"train_loss": -5.464487075805664, "global_step": 28622, "epoch": 681} {"train_loss": -5.514034271240234, "global_step": 28623, "epoch": 681} {"train_loss": -5.548338890075684, "global_step": 28624, "epoch": 681} {"train_loss": -5.4998345375061035, "global_step": 28625, "epoch": 681} {"train_loss": -5.501591205596924, "global_step": 28626, "epoch": 681} {"train_loss": -5.45871639251709, "global_step": 28627, "epoch": 681} {"train_loss": -5.424261569976807, "global_step": 28628, "epoch": 681} {"train_loss": -5.403586387634277, "global_step": 28629, "epoch": 681} {"train_loss": -5.371153354644775, "global_step": 28630, "epoch": 681} {"train_loss": -5.426371097564697, "global_step": 28631, "epoch": 681} {"train_loss": -5.457228183746338, "global_step": 28632, "epoch": 681} {"train_loss": -5.4431657791137695, "global_step": 28633, "epoch": 681} {"train_loss": -5.383554458618164, "global_step": 28634, "epoch": 681} {"train_loss": -5.467511177062988, "global_step": 28635, "epoch": 681} {"train_loss": -5.476632118225098, "global_step": 28636, "epoch": 681} {"train_loss": -5.262627124786377, "global_step": 28637, "epoch": 681} {"train_loss": -5.491880893707275, "global_step": 28638, "epoch": 681} {"train_loss": -5.337629795074463, "global_step": 28639, "epoch": 681} {"train_loss": -5.2718400955200195, "global_step": 28640, "epoch": 681} {"train_loss": -5.482831954956055, "global_step": 28641, "epoch": 681} {"train_loss": -5.392541885375977, "global_step": 28642, "epoch": 681} {"train_loss": -5.454176403227306, "global_step": 28643, "epoch": 681, "val_loss": 63798.43359375} {"train_loss": -5.429403305053711, "global_step": 28644, "epoch": 682} {"train_loss": -5.507768630981445, "global_step": 28645, "epoch": 682} {"train_loss": -5.396476745605469, "global_step": 28646, "epoch": 682} {"train_loss": -5.504654884338379, "global_step": 28647, "epoch": 682} {"train_loss": -5.441378593444824, "global_step": 28648, "epoch": 682} {"train_loss": -5.36529541015625, "global_step": 28649, "epoch": 682} {"train_loss": -5.457832336425781, "global_step": 28650, "epoch": 682} {"train_loss": -5.455324172973633, "global_step": 28651, "epoch": 682} {"train_loss": -5.357895851135254, "global_step": 28652, "epoch": 682} {"train_loss": -5.451784133911133, "global_step": 28653, "epoch": 682} {"train_loss": -5.338407516479492, "global_step": 28654, "epoch": 682} {"train_loss": -5.547778129577637, "global_step": 28655, "epoch": 682} {"train_loss": -5.296162128448486, "global_step": 28656, "epoch": 682} {"train_loss": -5.378458499908447, "global_step": 28657, "epoch": 682} {"train_loss": -5.459826469421387, "global_step": 28658, "epoch": 682} {"train_loss": -5.319675445556641, "global_step": 28659, "epoch": 682} {"train_loss": -5.339242935180664, "global_step": 28660, "epoch": 682} {"train_loss": -5.4179487228393555, "global_step": 28661, "epoch": 682} {"train_loss": -5.280032157897949, "global_step": 28662, "epoch": 682} {"train_loss": -5.457897186279297, "global_step": 28663, "epoch": 682} {"train_loss": -5.385644912719727, "global_step": 28664, "epoch": 682} {"train_loss": -5.413949012756348, "global_step": 28665, "epoch": 682} {"train_loss": -5.55023193359375, "global_step": 28666, "epoch": 682} {"train_loss": -5.396556377410889, "global_step": 28667, "epoch": 682} {"train_loss": -5.474018096923828, "global_step": 28668, "epoch": 682} {"train_loss": -5.464023590087891, "global_step": 28669, "epoch": 682} {"train_loss": -5.450140953063965, "global_step": 28670, "epoch": 682} {"train_loss": -5.599671363830566, "global_step": 28671, "epoch": 682} {"train_loss": -5.380789279937744, "global_step": 28672, "epoch": 682} {"train_loss": -5.287304878234863, "global_step": 28673, "epoch": 682} {"train_loss": -5.459887504577637, "global_step": 28674, "epoch": 682} {"train_loss": -5.340946674346924, "global_step": 28675, "epoch": 682} {"train_loss": -5.451509952545166, "global_step": 28676, "epoch": 682} {"train_loss": -5.402657985687256, "global_step": 28677, "epoch": 682} {"train_loss": -5.380560398101807, "global_step": 28678, "epoch": 682} {"train_loss": -5.430308818817139, "global_step": 28679, "epoch": 682} {"train_loss": -5.363550662994385, "global_step": 28680, "epoch": 682} {"train_loss": -5.584756851196289, "global_step": 28681, "epoch": 682} {"train_loss": -5.448873043060303, "global_step": 28682, "epoch": 682} {"train_loss": -5.387939453125, "global_step": 28683, "epoch": 682} {"train_loss": -5.574240684509277, "global_step": 28684, "epoch": 682} {"train_loss": -5.424807446343558, "global_step": 28685, "epoch": 682, "val_loss": 63926.78125} {"train_loss": -5.442793369293213, "global_step": 28686, "epoch": 683} {"train_loss": -5.466698169708252, "global_step": 28687, "epoch": 683} {"train_loss": -5.546403408050537, "global_step": 28688, "epoch": 683} {"train_loss": -5.422172546386719, "global_step": 28689, "epoch": 683} {"train_loss": -5.5514421463012695, "global_step": 28690, "epoch": 683} {"train_loss": -5.429987907409668, "global_step": 28691, "epoch": 683} {"train_loss": -5.469012260437012, "global_step": 28692, "epoch": 683} {"train_loss": -5.36613130569458, "global_step": 28693, "epoch": 683} {"train_loss": -5.4693145751953125, "global_step": 28694, "epoch": 683} {"train_loss": -5.413120746612549, "global_step": 28695, "epoch": 683} {"train_loss": -5.50714111328125, "global_step": 28696, "epoch": 683} {"train_loss": -5.416814804077148, "global_step": 28697, "epoch": 683} {"train_loss": -5.435471534729004, "global_step": 28698, "epoch": 683} {"train_loss": -5.536220550537109, "global_step": 28699, "epoch": 683} {"train_loss": -5.369641304016113, "global_step": 28700, "epoch": 683} {"train_loss": -5.563767910003662, "global_step": 28701, "epoch": 683} {"train_loss": -5.525234699249268, "global_step": 28702, "epoch": 683} {"train_loss": -5.5801591873168945, "global_step": 28703, "epoch": 683} {"train_loss": -5.434959411621094, "global_step": 28704, "epoch": 683} {"train_loss": -5.303953647613525, "global_step": 28705, "epoch": 683} {"train_loss": -5.338085174560547, "global_step": 28706, "epoch": 683} {"train_loss": -5.578116416931152, "global_step": 28707, "epoch": 683} {"train_loss": -5.4166669845581055, "global_step": 28708, "epoch": 683} {"train_loss": -5.413650989532471, "global_step": 28709, "epoch": 683} {"train_loss": -5.463283538818359, "global_step": 28710, "epoch": 683} {"train_loss": -5.390811920166016, "global_step": 28711, "epoch": 683} {"train_loss": -5.465465545654297, "global_step": 28712, "epoch": 683} {"train_loss": -5.363489627838135, "global_step": 28713, "epoch": 683} {"train_loss": -5.466105937957764, "global_step": 28714, "epoch": 683} {"train_loss": -5.335014820098877, "global_step": 28715, "epoch": 683} {"train_loss": -5.442622184753418, "global_step": 28716, "epoch": 683} {"train_loss": -5.522422790527344, "global_step": 28717, "epoch": 683} {"train_loss": -5.39345121383667, "global_step": 28718, "epoch": 683} {"train_loss": -5.539331436157227, "global_step": 28719, "epoch": 683} {"train_loss": -5.542634010314941, "global_step": 28720, "epoch": 683} {"train_loss": -5.438224792480469, "global_step": 28721, "epoch": 683} {"train_loss": -5.3670196533203125, "global_step": 28722, "epoch": 683} {"train_loss": -5.419070720672607, "global_step": 28723, "epoch": 683} {"train_loss": -5.3943047523498535, "global_step": 28724, "epoch": 683} {"train_loss": -5.407188415527344, "global_step": 28725, "epoch": 683} {"train_loss": -5.408761024475098, "global_step": 28726, "epoch": 683} {"train_loss": -5.445314679827009, "global_step": 28727, "epoch": 683, "val_loss": 63957.37890625} {"train_loss": -5.367191314697266, "global_step": 28728, "epoch": 684} {"train_loss": -5.419193267822266, "global_step": 28729, "epoch": 684} {"train_loss": -5.3912153244018555, "global_step": 28730, "epoch": 684} {"train_loss": -5.4789276123046875, "global_step": 28731, "epoch": 684} {"train_loss": -5.447385787963867, "global_step": 28732, "epoch": 684} {"train_loss": -5.507735252380371, "global_step": 28733, "epoch": 684} {"train_loss": -5.464776039123535, "global_step": 28734, "epoch": 684} {"train_loss": -5.394305229187012, "global_step": 28735, "epoch": 684} {"train_loss": -5.545313835144043, "global_step": 28736, "epoch": 684} {"train_loss": -5.50139045715332, "global_step": 28737, "epoch": 684} {"train_loss": -5.428454399108887, "global_step": 28738, "epoch": 684} {"train_loss": -5.511202812194824, "global_step": 28739, "epoch": 684} {"train_loss": -5.4162397384643555, "global_step": 28740, "epoch": 684} {"train_loss": -5.409583568572998, "global_step": 28741, "epoch": 684} {"train_loss": -5.518061637878418, "global_step": 28742, "epoch": 684} {"train_loss": -5.556720733642578, "global_step": 28743, "epoch": 684} {"train_loss": -5.4031267166137695, "global_step": 28744, "epoch": 684} {"train_loss": -5.361196994781494, "global_step": 28745, "epoch": 684} {"train_loss": -5.422399044036865, "global_step": 28746, "epoch": 684} {"train_loss": -5.532073497772217, "global_step": 28747, "epoch": 684} {"train_loss": -5.39980411529541, "global_step": 28748, "epoch": 684} {"train_loss": -5.2996320724487305, "global_step": 28749, "epoch": 684} {"train_loss": -5.384378433227539, "global_step": 28750, "epoch": 684} {"train_loss": -5.466242790222168, "global_step": 28751, "epoch": 684} {"train_loss": -5.391379356384277, "global_step": 28752, "epoch": 684} {"train_loss": -5.545853614807129, "global_step": 28753, "epoch": 684} {"train_loss": -5.3810882568359375, "global_step": 28754, "epoch": 684} {"train_loss": -5.387742042541504, "global_step": 28755, "epoch": 684} {"train_loss": -5.421573638916016, "global_step": 28756, "epoch": 684} {"train_loss": -5.360411167144775, "global_step": 28757, "epoch": 684} {"train_loss": -5.497480392456055, "global_step": 28758, "epoch": 684} {"train_loss": -5.4747443199157715, "global_step": 28759, "epoch": 684} {"train_loss": -5.345824241638184, "global_step": 28760, "epoch": 684} {"train_loss": -5.396592617034912, "global_step": 28761, "epoch": 684} {"train_loss": -5.51059627532959, "global_step": 28762, "epoch": 684} {"train_loss": -5.459441184997559, "global_step": 28763, "epoch": 684} {"train_loss": -5.461856842041016, "global_step": 28764, "epoch": 684} {"train_loss": -5.462695598602295, "global_step": 28765, "epoch": 684} {"train_loss": -5.387186527252197, "global_step": 28766, "epoch": 684} {"train_loss": -5.462876319885254, "global_step": 28767, "epoch": 684} {"train_loss": -5.4033966064453125, "global_step": 28768, "epoch": 684} {"train_loss": -5.4392933050791425, "global_step": 28769, "epoch": 684, "val_loss": 63648.26953125} {"train_loss": -5.456240653991699, "global_step": 28770, "epoch": 685} {"train_loss": -5.3287272453308105, "global_step": 28771, "epoch": 685} {"train_loss": -5.482290267944336, "global_step": 28772, "epoch": 685} {"train_loss": -5.477851867675781, "global_step": 28773, "epoch": 685} {"train_loss": -5.507316589355469, "global_step": 28774, "epoch": 685} {"train_loss": -5.467827320098877, "global_step": 28775, "epoch": 685} {"train_loss": -5.515868186950684, "global_step": 28776, "epoch": 685} {"train_loss": -5.36986780166626, "global_step": 28777, "epoch": 685} {"train_loss": -5.493978500366211, "global_step": 28778, "epoch": 685} {"train_loss": -5.502690315246582, "global_step": 28779, "epoch": 685} {"train_loss": -5.405106067657471, "global_step": 28780, "epoch": 685} {"train_loss": -5.470135688781738, "global_step": 28781, "epoch": 685} {"train_loss": -5.477684497833252, "global_step": 28782, "epoch": 685} {"train_loss": -5.50149393081665, "global_step": 28783, "epoch": 685} {"train_loss": -5.485279083251953, "global_step": 28784, "epoch": 685} {"train_loss": -5.31906270980835, "global_step": 28785, "epoch": 685} {"train_loss": -5.552222728729248, "global_step": 28786, "epoch": 685} {"train_loss": -5.428318023681641, "global_step": 28787, "epoch": 685} {"train_loss": -5.593193054199219, "global_step": 28788, "epoch": 685} {"train_loss": -5.546056747436523, "global_step": 28789, "epoch": 685} {"train_loss": -5.361783027648926, "global_step": 28790, "epoch": 685} {"train_loss": -5.567244529724121, "global_step": 28791, "epoch": 685} {"train_loss": -5.464550971984863, "global_step": 28792, "epoch": 685} {"train_loss": -5.450213432312012, "global_step": 28793, "epoch": 685} {"train_loss": -5.449626445770264, "global_step": 28794, "epoch": 685} {"train_loss": -5.572301864624023, "global_step": 28795, "epoch": 685} {"train_loss": -5.595048904418945, "global_step": 28796, "epoch": 685} {"train_loss": -5.356833457946777, "global_step": 28797, "epoch": 685} {"train_loss": -5.406078338623047, "global_step": 28798, "epoch": 685} {"train_loss": -5.417762756347656, "global_step": 28799, "epoch": 685} {"train_loss": -5.482997417449951, "global_step": 28800, "epoch": 685} {"train_loss": -5.405657768249512, "global_step": 28801, "epoch": 685} {"train_loss": -5.432842254638672, "global_step": 28802, "epoch": 685} {"train_loss": -5.482782363891602, "global_step": 28803, "epoch": 685} {"train_loss": -5.391801357269287, "global_step": 28804, "epoch": 685} {"train_loss": -5.58772087097168, "global_step": 28805, "epoch": 685} {"train_loss": -5.236118316650391, "global_step": 28806, "epoch": 685} {"train_loss": -5.452536582946777, "global_step": 28807, "epoch": 685} {"train_loss": -5.419217586517334, "global_step": 28808, "epoch": 685} {"train_loss": -5.481184959411621, "global_step": 28809, "epoch": 685} {"train_loss": -5.388193130493164, "global_step": 28810, "epoch": 685} {"train_loss": -5.456007083257039, "global_step": 28811, "epoch": 685, "val_loss": 63513.1328125} {"train_loss": -5.49167013168335, "global_step": 28812, "epoch": 686} {"train_loss": -5.423346519470215, "global_step": 28813, "epoch": 686} {"train_loss": -5.465910911560059, "global_step": 28814, "epoch": 686} {"train_loss": -5.545598030090332, "global_step": 28815, "epoch": 686} {"train_loss": -5.489813804626465, "global_step": 28816, "epoch": 686} {"train_loss": -5.54960823059082, "global_step": 28817, "epoch": 686} {"train_loss": -5.5259857177734375, "global_step": 28818, "epoch": 686} {"train_loss": -5.51218318939209, "global_step": 28819, "epoch": 686} {"train_loss": -5.4742207527160645, "global_step": 28820, "epoch": 686} {"train_loss": -5.494768142700195, "global_step": 28821, "epoch": 686} {"train_loss": -5.461206436157227, "global_step": 28822, "epoch": 686} {"train_loss": -5.315522193908691, "global_step": 28823, "epoch": 686} {"train_loss": -5.498273849487305, "global_step": 28824, "epoch": 686} {"train_loss": -5.387164115905762, "global_step": 28825, "epoch": 686} {"train_loss": -5.473694324493408, "global_step": 28826, "epoch": 686} {"train_loss": -5.50492000579834, "global_step": 28827, "epoch": 686} {"train_loss": -5.326613426208496, "global_step": 28828, "epoch": 686} {"train_loss": -5.415134429931641, "global_step": 28829, "epoch": 686} {"train_loss": -5.420366287231445, "global_step": 28830, "epoch": 686} {"train_loss": -5.605456352233887, "global_step": 28831, "epoch": 686} {"train_loss": -5.416057586669922, "global_step": 28832, "epoch": 686} {"train_loss": -5.352581024169922, "global_step": 28833, "epoch": 686} {"train_loss": -5.518153190612793, "global_step": 28834, "epoch": 686} {"train_loss": -5.440160751342773, "global_step": 28835, "epoch": 686} {"train_loss": -5.498568534851074, "global_step": 28836, "epoch": 686} {"train_loss": -5.495756149291992, "global_step": 28837, "epoch": 686} {"train_loss": -5.521811485290527, "global_step": 28838, "epoch": 686} {"train_loss": -5.517468452453613, "global_step": 28839, "epoch": 686} {"train_loss": -5.4357147216796875, "global_step": 28840, "epoch": 686} {"train_loss": -5.398756504058838, "global_step": 28841, "epoch": 686} {"train_loss": -5.301937580108643, "global_step": 28842, "epoch": 686} {"train_loss": -5.387155532836914, "global_step": 28843, "epoch": 686} {"train_loss": -5.526922225952148, "global_step": 28844, "epoch": 686} {"train_loss": -5.36791467666626, "global_step": 28845, "epoch": 686} {"train_loss": -5.310214519500732, "global_step": 28846, "epoch": 686} {"train_loss": -5.566376686096191, "global_step": 28847, "epoch": 686} {"train_loss": -5.3303375244140625, "global_step": 28848, "epoch": 686} {"train_loss": -5.438920021057129, "global_step": 28849, "epoch": 686} {"train_loss": -5.372049808502197, "global_step": 28850, "epoch": 686} {"train_loss": -5.266023635864258, "global_step": 28851, "epoch": 686} {"train_loss": -5.395820140838623, "global_step": 28852, "epoch": 686} {"train_loss": -5.439216625122797, "global_step": 28853, "epoch": 686, "val_loss": 63502.32421875} {"train_loss": -5.470522403717041, "global_step": 28854, "epoch": 687} {"train_loss": -5.287521839141846, "global_step": 28855, "epoch": 687} {"train_loss": -5.364599227905273, "global_step": 28856, "epoch": 687} {"train_loss": -5.450552940368652, "global_step": 28857, "epoch": 687} {"train_loss": -5.420875549316406, "global_step": 28858, "epoch": 687} {"train_loss": -5.4651079177856445, "global_step": 28859, "epoch": 687} {"train_loss": -5.489264488220215, "global_step": 28860, "epoch": 687} {"train_loss": -5.377076625823975, "global_step": 28861, "epoch": 687} {"train_loss": -5.490085601806641, "global_step": 28862, "epoch": 687} {"train_loss": -5.387446403503418, "global_step": 28863, "epoch": 687} {"train_loss": -5.456128120422363, "global_step": 28864, "epoch": 687} {"train_loss": -5.414203643798828, "global_step": 28865, "epoch": 687} {"train_loss": -5.388720512390137, "global_step": 28866, "epoch": 687} {"train_loss": -5.343022346496582, "global_step": 28867, "epoch": 687} {"train_loss": -5.5347065925598145, "global_step": 28868, "epoch": 687} {"train_loss": -5.394529342651367, "global_step": 28869, "epoch": 687} {"train_loss": -5.473525047302246, "global_step": 28870, "epoch": 687} {"train_loss": -5.564939975738525, "global_step": 28871, "epoch": 687} {"train_loss": -5.436189651489258, "global_step": 28872, "epoch": 687} {"train_loss": -5.235230445861816, "global_step": 28873, "epoch": 687} {"train_loss": -5.491756916046143, "global_step": 28874, "epoch": 687} {"train_loss": -5.4671831130981445, "global_step": 28875, "epoch": 687} {"train_loss": -5.522998332977295, "global_step": 28876, "epoch": 687} {"train_loss": -5.443437576293945, "global_step": 28877, "epoch": 687} {"train_loss": -5.445539474487305, "global_step": 28878, "epoch": 687} {"train_loss": -5.408590316772461, "global_step": 28879, "epoch": 687} {"train_loss": -5.638763427734375, "global_step": 28880, "epoch": 687} {"train_loss": -5.4944987297058105, "global_step": 28881, "epoch": 687} {"train_loss": -5.489610195159912, "global_step": 28882, "epoch": 687} {"train_loss": -5.4481000900268555, "global_step": 28883, "epoch": 687} {"train_loss": -5.350873947143555, "global_step": 28884, "epoch": 687} {"train_loss": -5.405004501342773, "global_step": 28885, "epoch": 687} {"train_loss": -5.387655258178711, "global_step": 28886, "epoch": 687} {"train_loss": -5.403940677642822, "global_step": 28887, "epoch": 687} {"train_loss": -5.395463943481445, "global_step": 28888, "epoch": 687} {"train_loss": -5.392453193664551, "global_step": 28889, "epoch": 687} {"train_loss": -5.453920364379883, "global_step": 28890, "epoch": 687} {"train_loss": -5.286921501159668, "global_step": 28891, "epoch": 687} {"train_loss": -5.482558250427246, "global_step": 28892, "epoch": 687} {"train_loss": -5.423595905303955, "global_step": 28893, "epoch": 687} {"train_loss": -5.430803298950195, "global_step": 28894, "epoch": 687} {"train_loss": -5.434563035056705, "global_step": 28895, "epoch": 687, "val_loss": 63597.3203125} {"train_loss": -5.325923919677734, "global_step": 28896, "epoch": 688} {"train_loss": -5.5950517654418945, "global_step": 28897, "epoch": 688} {"train_loss": -5.416959762573242, "global_step": 28898, "epoch": 688} {"train_loss": -5.461287498474121, "global_step": 28899, "epoch": 688} {"train_loss": -5.55099630355835, "global_step": 28900, "epoch": 688} {"train_loss": -5.5391845703125, "global_step": 28901, "epoch": 688} {"train_loss": -5.583597660064697, "global_step": 28902, "epoch": 688} {"train_loss": -5.500388145446777, "global_step": 28903, "epoch": 688} {"train_loss": -5.3646721839904785, "global_step": 28904, "epoch": 688} {"train_loss": -5.523247718811035, "global_step": 28905, "epoch": 688} {"train_loss": -5.492116451263428, "global_step": 28906, "epoch": 688} {"train_loss": -5.317713737487793, "global_step": 28907, "epoch": 688} {"train_loss": -5.353357315063477, "global_step": 28908, "epoch": 688} {"train_loss": -5.509032249450684, "global_step": 28909, "epoch": 688} {"train_loss": -5.387508392333984, "global_step": 28910, "epoch": 688} {"train_loss": -5.518794059753418, "global_step": 28911, "epoch": 688} {"train_loss": -5.409734725952148, "global_step": 28912, "epoch": 688} {"train_loss": -5.428371429443359, "global_step": 28913, "epoch": 688} {"train_loss": -5.359949588775635, "global_step": 28914, "epoch": 688} {"train_loss": -5.464779853820801, "global_step": 28915, "epoch": 688} {"train_loss": -5.504056930541992, "global_step": 28916, "epoch": 688} {"train_loss": -5.415024280548096, "global_step": 28917, "epoch": 688} {"train_loss": -5.407538414001465, "global_step": 28918, "epoch": 688} {"train_loss": -5.401890754699707, "global_step": 28919, "epoch": 688} {"train_loss": -5.361794471740723, "global_step": 28920, "epoch": 688} {"train_loss": -5.428184509277344, "global_step": 28921, "epoch": 688} {"train_loss": -5.451365947723389, "global_step": 28922, "epoch": 688} {"train_loss": -5.326129913330078, "global_step": 28923, "epoch": 688} {"train_loss": -5.405205726623535, "global_step": 28924, "epoch": 688} {"train_loss": -5.56159782409668, "global_step": 28925, "epoch": 688} {"train_loss": -5.399565696716309, "global_step": 28926, "epoch": 688} {"train_loss": -5.429073333740234, "global_step": 28927, "epoch": 688} {"train_loss": -5.527457237243652, "global_step": 28928, "epoch": 688} {"train_loss": -5.341070652008057, "global_step": 28929, "epoch": 688} {"train_loss": -5.397636413574219, "global_step": 28930, "epoch": 688} {"train_loss": -5.446476459503174, "global_step": 28931, "epoch": 688} {"train_loss": -5.383940696716309, "global_step": 28932, "epoch": 688} {"train_loss": -5.456941604614258, "global_step": 28933, "epoch": 688} {"train_loss": -5.389684200286865, "global_step": 28934, "epoch": 688} {"train_loss": -5.509178161621094, "global_step": 28935, "epoch": 688} {"train_loss": -5.46467399597168, "global_step": 28936, "epoch": 688} {"train_loss": -5.43924465633574, "global_step": 28937, "epoch": 688, "val_loss": 63890.015625} {"train_loss": -5.441497802734375, "global_step": 28938, "epoch": 689} {"train_loss": -5.414948463439941, "global_step": 28939, "epoch": 689} {"train_loss": -5.517002105712891, "global_step": 28940, "epoch": 689} {"train_loss": -5.4106364250183105, "global_step": 28941, "epoch": 689} {"train_loss": -5.499355316162109, "global_step": 28942, "epoch": 689} {"train_loss": -5.42225456237793, "global_step": 28943, "epoch": 689} {"train_loss": -5.426593780517578, "global_step": 28944, "epoch": 689} {"train_loss": -5.336101531982422, "global_step": 28945, "epoch": 689} {"train_loss": -5.503885269165039, "global_step": 28946, "epoch": 689} {"train_loss": -5.492415428161621, "global_step": 28947, "epoch": 689} {"train_loss": -5.324582576751709, "global_step": 28948, "epoch": 689} {"train_loss": -5.389786720275879, "global_step": 28949, "epoch": 689} {"train_loss": -5.524757385253906, "global_step": 28950, "epoch": 689} {"train_loss": -5.444332599639893, "global_step": 28951, "epoch": 689} {"train_loss": -5.357671737670898, "global_step": 28952, "epoch": 689} {"train_loss": -5.537201881408691, "global_step": 28953, "epoch": 689} {"train_loss": -5.417299270629883, "global_step": 28954, "epoch": 689} {"train_loss": -5.556695938110352, "global_step": 28955, "epoch": 689} {"train_loss": -5.48213005065918, "global_step": 28956, "epoch": 689} {"train_loss": -5.551450729370117, "global_step": 28957, "epoch": 689} {"train_loss": -5.381457328796387, "global_step": 28958, "epoch": 689} {"train_loss": -5.429777145385742, "global_step": 28959, "epoch": 689} {"train_loss": -5.411266326904297, "global_step": 28960, "epoch": 689} {"train_loss": -5.410526275634766, "global_step": 28961, "epoch": 689} {"train_loss": -5.398766040802002, "global_step": 28962, "epoch": 689} {"train_loss": -5.508557319641113, "global_step": 28963, "epoch": 689} {"train_loss": -5.436661243438721, "global_step": 28964, "epoch": 689} {"train_loss": -5.400059700012207, "global_step": 28965, "epoch": 689} {"train_loss": -5.491667747497559, "global_step": 28966, "epoch": 689} {"train_loss": -5.442745208740234, "global_step": 28967, "epoch": 689} {"train_loss": -5.459708213806152, "global_step": 28968, "epoch": 689} {"train_loss": -5.3973846435546875, "global_step": 28969, "epoch": 689} {"train_loss": -5.442720413208008, "global_step": 28970, "epoch": 689} {"train_loss": -5.4354448318481445, "global_step": 28971, "epoch": 689} {"train_loss": -5.436559200286865, "global_step": 28972, "epoch": 689} {"train_loss": -5.407649993896484, "global_step": 28973, "epoch": 689} {"train_loss": -5.546980857849121, "global_step": 28974, "epoch": 689} {"train_loss": -5.45719051361084, "global_step": 28975, "epoch": 689} {"train_loss": -5.438554763793945, "global_step": 28976, "epoch": 689} {"train_loss": -5.548699855804443, "global_step": 28977, "epoch": 689} {"train_loss": -5.510586738586426, "global_step": 28978, "epoch": 689} {"train_loss": -5.451343320664906, "global_step": 28979, "epoch": 689, "val_loss": 63947.390625} {"train_loss": -5.447863578796387, "global_step": 28980, "epoch": 690} {"train_loss": -5.437648296356201, "global_step": 28981, "epoch": 690} {"train_loss": -5.528225898742676, "global_step": 28982, "epoch": 690} {"train_loss": -5.307926177978516, "global_step": 28983, "epoch": 690} {"train_loss": -5.421652793884277, "global_step": 28984, "epoch": 690} {"train_loss": -5.422189712524414, "global_step": 28985, "epoch": 690} {"train_loss": -5.480937957763672, "global_step": 28986, "epoch": 690} {"train_loss": -5.4496235847473145, "global_step": 28987, "epoch": 690} {"train_loss": -5.3991312980651855, "global_step": 28988, "epoch": 690} {"train_loss": -5.505266189575195, "global_step": 28989, "epoch": 690} {"train_loss": -5.352568626403809, "global_step": 28990, "epoch": 690} {"train_loss": -5.418128490447998, "global_step": 28991, "epoch": 690} {"train_loss": -5.375545978546143, "global_step": 28992, "epoch": 690} {"train_loss": -5.34566593170166, "global_step": 28993, "epoch": 690} {"train_loss": -5.50177001953125, "global_step": 28994, "epoch": 690} {"train_loss": -5.549013137817383, "global_step": 28995, "epoch": 690} {"train_loss": -5.5332794189453125, "global_step": 28996, "epoch": 690} {"train_loss": -5.570082187652588, "global_step": 28997, "epoch": 690} {"train_loss": -5.5161943435668945, "global_step": 28998, "epoch": 690} {"train_loss": -5.595732688903809, "global_step": 28999, "epoch": 690} {"train_loss": -5.460399627685547, "global_step": 29000, "epoch": 690} {"train_loss": -5.343392372131348, "global_step": 29001, "epoch": 690} {"train_loss": -5.489797592163086, "global_step": 29002, "epoch": 690} {"train_loss": -5.451336860656738, "global_step": 29003, "epoch": 690} {"train_loss": -5.4798784255981445, "global_step": 29004, "epoch": 690} {"train_loss": -5.407436370849609, "global_step": 29005, "epoch": 690} {"train_loss": -5.371781349182129, "global_step": 29006, "epoch": 690} {"train_loss": -5.521250247955322, "global_step": 29007, "epoch": 690} {"train_loss": -5.570771217346191, "global_step": 29008, "epoch": 690} {"train_loss": -5.535083293914795, "global_step": 29009, "epoch": 690} {"train_loss": -5.35012149810791, "global_step": 29010, "epoch": 690} {"train_loss": -5.301551818847656, "global_step": 29011, "epoch": 690} {"train_loss": -5.4888715744018555, "global_step": 29012, "epoch": 690} {"train_loss": -5.506490707397461, "global_step": 29013, "epoch": 690} {"train_loss": -5.467075347900391, "global_step": 29014, "epoch": 690} {"train_loss": -5.478955268859863, "global_step": 29015, "epoch": 690} {"train_loss": -5.423474311828613, "global_step": 29016, "epoch": 690} {"train_loss": -5.517607688903809, "global_step": 29017, "epoch": 690} {"train_loss": -5.465147495269775, "global_step": 29018, "epoch": 690} {"train_loss": -5.3941240310668945, "global_step": 29019, "epoch": 690} {"train_loss": -5.436363220214844, "global_step": 29020, "epoch": 690} {"train_loss": -5.45344572975522, "global_step": 29021, "epoch": 690, "val_loss": 63908.734375} {"train_loss": -5.5512566566467285, "global_step": 29022, "epoch": 691} {"train_loss": -5.408028602600098, "global_step": 29023, "epoch": 691} {"train_loss": -5.204328536987305, "global_step": 29024, "epoch": 691} {"train_loss": -5.397424221038818, "global_step": 29025, "epoch": 691} {"train_loss": -5.433205604553223, "global_step": 29026, "epoch": 691} {"train_loss": -5.492149353027344, "global_step": 29027, "epoch": 691} {"train_loss": -5.53035831451416, "global_step": 29028, "epoch": 691} {"train_loss": -5.400113105773926, "global_step": 29029, "epoch": 691} {"train_loss": -5.532255172729492, "global_step": 29030, "epoch": 691} {"train_loss": -5.500377178192139, "global_step": 29031, "epoch": 691} {"train_loss": -5.349123954772949, "global_step": 29032, "epoch": 691} {"train_loss": -5.420886039733887, "global_step": 29033, "epoch": 691} {"train_loss": -5.382328987121582, "global_step": 29034, "epoch": 691} {"train_loss": -5.373903751373291, "global_step": 29035, "epoch": 691} {"train_loss": -5.49497652053833, "global_step": 29036, "epoch": 691} {"train_loss": -5.363358497619629, "global_step": 29037, "epoch": 691} {"train_loss": -5.362200736999512, "global_step": 29038, "epoch": 691} {"train_loss": -5.486118316650391, "global_step": 29039, "epoch": 691} {"train_loss": -5.490695476531982, "global_step": 29040, "epoch": 691} {"train_loss": -5.509181022644043, "global_step": 29041, "epoch": 691} {"train_loss": -5.446281433105469, "global_step": 29042, "epoch": 691} {"train_loss": -5.41243839263916, "global_step": 29043, "epoch": 691} {"train_loss": -5.399391174316406, "global_step": 29044, "epoch": 691} {"train_loss": -5.445821285247803, "global_step": 29045, "epoch": 691} {"train_loss": -5.526785373687744, "global_step": 29046, "epoch": 691} {"train_loss": -5.372222900390625, "global_step": 29047, "epoch": 691} {"train_loss": -5.429959297180176, "global_step": 29048, "epoch": 691} {"train_loss": -5.440371513366699, "global_step": 29049, "epoch": 691} {"train_loss": -5.450781345367432, "global_step": 29050, "epoch": 691} {"train_loss": -5.511100769042969, "global_step": 29051, "epoch": 691} {"train_loss": -5.36423397064209, "global_step": 29052, "epoch": 691} {"train_loss": -5.443586826324463, "global_step": 29053, "epoch": 691} {"train_loss": -5.448813438415527, "global_step": 29054, "epoch": 691} {"train_loss": -5.4233198165893555, "global_step": 29055, "epoch": 691} {"train_loss": -5.3578996658325195, "global_step": 29056, "epoch": 691} {"train_loss": -5.386508941650391, "global_step": 29057, "epoch": 691} {"train_loss": -5.489935874938965, "global_step": 29058, "epoch": 691} {"train_loss": -5.390020847320557, "global_step": 29059, "epoch": 691} {"train_loss": -5.350773811340332, "global_step": 29060, "epoch": 691} {"train_loss": -5.456508159637451, "global_step": 29061, "epoch": 691} {"train_loss": -5.458452224731445, "global_step": 29062, "epoch": 691} {"train_loss": -5.433911766324725, "global_step": 29063, "epoch": 691, "val_loss": 63463.73046875} {"train_loss": -5.37630558013916, "global_step": 29064, "epoch": 692} {"train_loss": -5.440117359161377, "global_step": 29065, "epoch": 692} {"train_loss": -5.46988582611084, "global_step": 29066, "epoch": 692} {"train_loss": -5.575442314147949, "global_step": 29067, "epoch": 692} {"train_loss": -5.384436130523682, "global_step": 29068, "epoch": 692} {"train_loss": -5.484188079833984, "global_step": 29069, "epoch": 692} {"train_loss": -5.322284698486328, "global_step": 29070, "epoch": 692} {"train_loss": -5.378699779510498, "global_step": 29071, "epoch": 692} {"train_loss": -5.370430946350098, "global_step": 29072, "epoch": 692} {"train_loss": -5.418406963348389, "global_step": 29073, "epoch": 692} {"train_loss": -5.475481986999512, "global_step": 29074, "epoch": 692} {"train_loss": -5.420040130615234, "global_step": 29075, "epoch": 692} {"train_loss": -5.443799018859863, "global_step": 29076, "epoch": 692} {"train_loss": -5.504855155944824, "global_step": 29077, "epoch": 692} {"train_loss": -5.4391865730285645, "global_step": 29078, "epoch": 692} {"train_loss": -5.352407455444336, "global_step": 29079, "epoch": 692} {"train_loss": -5.46528434753418, "global_step": 29080, "epoch": 692} {"train_loss": -5.459807872772217, "global_step": 29081, "epoch": 692} {"train_loss": -5.5022807121276855, "global_step": 29082, "epoch": 692} {"train_loss": -5.538538932800293, "global_step": 29083, "epoch": 692} {"train_loss": -5.454497337341309, "global_step": 29084, "epoch": 692} {"train_loss": -5.501109600067139, "global_step": 29085, "epoch": 692} {"train_loss": -5.481389999389648, "global_step": 29086, "epoch": 692} {"train_loss": -5.506622314453125, "global_step": 29087, "epoch": 692} {"train_loss": -5.57450532913208, "global_step": 29088, "epoch": 692} {"train_loss": -5.562775135040283, "global_step": 29089, "epoch": 692} {"train_loss": -5.313205242156982, "global_step": 29090, "epoch": 692} {"train_loss": -5.5167555809021, "global_step": 29091, "epoch": 692} {"train_loss": -5.433655738830566, "global_step": 29092, "epoch": 692} {"train_loss": -5.380005359649658, "global_step": 29093, "epoch": 692} {"train_loss": -5.481420993804932, "global_step": 29094, "epoch": 692} {"train_loss": -5.334768295288086, "global_step": 29095, "epoch": 692} {"train_loss": -5.4371657371521, "global_step": 29096, "epoch": 692} {"train_loss": -5.546104431152344, "global_step": 29097, "epoch": 692} {"train_loss": -5.494894981384277, "global_step": 29098, "epoch": 692} {"train_loss": -5.505039215087891, "global_step": 29099, "epoch": 692} {"train_loss": -5.507032871246338, "global_step": 29100, "epoch": 692} {"train_loss": -5.529980659484863, "global_step": 29101, "epoch": 692} {"train_loss": -5.425493240356445, "global_step": 29102, "epoch": 692} {"train_loss": -5.514765739440918, "global_step": 29103, "epoch": 692} {"train_loss": -5.4467058181762695, "global_step": 29104, "epoch": 692} {"train_loss": -5.456171149299259, "global_step": 29105, "epoch": 692, "val_loss": 63727.83984375} {"train_loss": -5.596447944641113, "global_step": 29106, "epoch": 693} {"train_loss": -5.509675025939941, "global_step": 29107, "epoch": 693} {"train_loss": -5.44464111328125, "global_step": 29108, "epoch": 693} {"train_loss": -5.3047614097595215, "global_step": 29109, "epoch": 693} {"train_loss": -5.536618232727051, "global_step": 29110, "epoch": 693} {"train_loss": -5.382111549377441, "global_step": 29111, "epoch": 693} {"train_loss": -5.442079544067383, "global_step": 29112, "epoch": 693} {"train_loss": -5.553396224975586, "global_step": 29113, "epoch": 693} {"train_loss": -5.3710618019104, "global_step": 29114, "epoch": 693} {"train_loss": -5.4847917556762695, "global_step": 29115, "epoch": 693} {"train_loss": -5.412570953369141, "global_step": 29116, "epoch": 693} {"train_loss": -5.519129276275635, "global_step": 29117, "epoch": 693} {"train_loss": -5.362261772155762, "global_step": 29118, "epoch": 693} {"train_loss": -5.468472003936768, "global_step": 29119, "epoch": 693} {"train_loss": -5.394937515258789, "global_step": 29120, "epoch": 693} {"train_loss": -5.481631278991699, "global_step": 29121, "epoch": 693} {"train_loss": -5.578347682952881, "global_step": 29122, "epoch": 693} {"train_loss": -5.47036075592041, "global_step": 29123, "epoch": 693} {"train_loss": -5.483224868774414, "global_step": 29124, "epoch": 693} {"train_loss": -5.500814914703369, "global_step": 29125, "epoch": 693} {"train_loss": -5.474720001220703, "global_step": 29126, "epoch": 693} {"train_loss": -5.390488624572754, "global_step": 29127, "epoch": 693} {"train_loss": -5.473753452301025, "global_step": 29128, "epoch": 693} {"train_loss": -5.520453929901123, "global_step": 29129, "epoch": 693} {"train_loss": -5.392416954040527, "global_step": 29130, "epoch": 693} {"train_loss": -5.490388870239258, "global_step": 29131, "epoch": 693} {"train_loss": -5.533262252807617, "global_step": 29132, "epoch": 693} {"train_loss": -5.508242607116699, "global_step": 29133, "epoch": 693} {"train_loss": -5.5531463623046875, "global_step": 29134, "epoch": 693} {"train_loss": -5.417664527893066, "global_step": 29135, "epoch": 693} {"train_loss": -5.504796981811523, "global_step": 29136, "epoch": 693} {"train_loss": -5.503820419311523, "global_step": 29137, "epoch": 693} {"train_loss": -5.317339897155762, "global_step": 29138, "epoch": 693} {"train_loss": -5.363781929016113, "global_step": 29139, "epoch": 693} {"train_loss": -5.477790832519531, "global_step": 29140, "epoch": 693} {"train_loss": -5.321303844451904, "global_step": 29141, "epoch": 693} {"train_loss": -5.549653053283691, "global_step": 29142, "epoch": 693} {"train_loss": -5.43582820892334, "global_step": 29143, "epoch": 693} {"train_loss": -5.508523941040039, "global_step": 29144, "epoch": 693} {"train_loss": -5.512040615081787, "global_step": 29145, "epoch": 693} {"train_loss": -5.616446018218994, "global_step": 29146, "epoch": 693} {"train_loss": -5.4705372878483365, "global_step": 29147, "epoch": 693, "val_loss": 63307.33984375} {"train_loss": -5.524290084838867, "global_step": 29148, "epoch": 694} {"train_loss": -5.5106706619262695, "global_step": 29149, "epoch": 694} {"train_loss": -5.500907897949219, "global_step": 29150, "epoch": 694} {"train_loss": -5.5614142417907715, "global_step": 29151, "epoch": 694} {"train_loss": -5.5211286544799805, "global_step": 29152, "epoch": 694} {"train_loss": -5.535242557525635, "global_step": 29153, "epoch": 694} {"train_loss": -5.471473217010498, "global_step": 29154, "epoch": 694} {"train_loss": -5.57228946685791, "global_step": 29155, "epoch": 694} {"train_loss": -5.571920871734619, "global_step": 29156, "epoch": 694} {"train_loss": -5.378364086151123, "global_step": 29157, "epoch": 694} {"train_loss": -5.413415908813477, "global_step": 29158, "epoch": 694} {"train_loss": -5.4477386474609375, "global_step": 29159, "epoch": 694} {"train_loss": -5.506286144256592, "global_step": 29160, "epoch": 694} {"train_loss": -5.370292663574219, "global_step": 29161, "epoch": 694} {"train_loss": -5.381531715393066, "global_step": 29162, "epoch": 694} {"train_loss": -5.507334232330322, "global_step": 29163, "epoch": 694} {"train_loss": -5.564748287200928, "global_step": 29164, "epoch": 694} {"train_loss": -5.542895317077637, "global_step": 29165, "epoch": 694} {"train_loss": -5.46895694732666, "global_step": 29166, "epoch": 694} {"train_loss": -5.5544633865356445, "global_step": 29167, "epoch": 694} {"train_loss": -5.4179158210754395, "global_step": 29168, "epoch": 694} {"train_loss": -5.486603736877441, "global_step": 29169, "epoch": 694} {"train_loss": -5.459603309631348, "global_step": 29170, "epoch": 694} {"train_loss": -5.428805351257324, "global_step": 29171, "epoch": 694} {"train_loss": -5.512011528015137, "global_step": 29172, "epoch": 694} {"train_loss": -5.426483631134033, "global_step": 29173, "epoch": 694} {"train_loss": -5.514553070068359, "global_step": 29174, "epoch": 694} {"train_loss": -5.520174980163574, "global_step": 29175, "epoch": 694} {"train_loss": -5.530299186706543, "global_step": 29176, "epoch": 694} {"train_loss": -5.559405326843262, "global_step": 29177, "epoch": 694} {"train_loss": -5.500528335571289, "global_step": 29178, "epoch": 694} {"train_loss": -5.302905559539795, "global_step": 29179, "epoch": 694} {"train_loss": -5.323904991149902, "global_step": 29180, "epoch": 694} {"train_loss": -5.482305526733398, "global_step": 29181, "epoch": 694} {"train_loss": -5.340603828430176, "global_step": 29182, "epoch": 694} {"train_loss": -5.401111602783203, "global_step": 29183, "epoch": 694} {"train_loss": -5.598903656005859, "global_step": 29184, "epoch": 694} {"train_loss": -5.4448065757751465, "global_step": 29185, "epoch": 694} {"train_loss": -5.4440083503723145, "global_step": 29186, "epoch": 694} {"train_loss": -5.465994834899902, "global_step": 29187, "epoch": 694} {"train_loss": -5.379537582397461, "global_step": 29188, "epoch": 694} {"train_loss": -5.472422202428182, "global_step": 29189, "epoch": 694, "val_loss": 63673.25} {"train_loss": -5.430397033691406, "global_step": 29190, "epoch": 695} {"train_loss": -5.528165340423584, "global_step": 29191, "epoch": 695} {"train_loss": -5.288473129272461, "global_step": 29192, "epoch": 695} {"train_loss": -5.551850318908691, "global_step": 29193, "epoch": 695} {"train_loss": -5.342278480529785, "global_step": 29194, "epoch": 695} {"train_loss": -5.471635818481445, "global_step": 29195, "epoch": 695} {"train_loss": -5.470357418060303, "global_step": 29196, "epoch": 695} {"train_loss": -5.365545272827148, "global_step": 29197, "epoch": 695} {"train_loss": -5.594759464263916, "global_step": 29198, "epoch": 695} {"train_loss": -5.533405780792236, "global_step": 29199, "epoch": 695} {"train_loss": -5.359240531921387, "global_step": 29200, "epoch": 695} {"train_loss": -5.436344146728516, "global_step": 29201, "epoch": 695} {"train_loss": -5.256223678588867, "global_step": 29202, "epoch": 695} {"train_loss": -5.273747444152832, "global_step": 29203, "epoch": 695} {"train_loss": -5.463944435119629, "global_step": 29204, "epoch": 695} {"train_loss": -5.463479518890381, "global_step": 29205, "epoch": 695} {"train_loss": -5.330347537994385, "global_step": 29206, "epoch": 695} {"train_loss": -5.6226487159729, "global_step": 29207, "epoch": 695} {"train_loss": -5.331165790557861, "global_step": 29208, "epoch": 695} {"train_loss": -5.513853073120117, "global_step": 29209, "epoch": 695} {"train_loss": -5.419349193572998, "global_step": 29210, "epoch": 695} {"train_loss": -5.454965114593506, "global_step": 29211, "epoch": 695} {"train_loss": -5.6095499992370605, "global_step": 29212, "epoch": 695} {"train_loss": -5.337975978851318, "global_step": 29213, "epoch": 695} {"train_loss": -5.462780475616455, "global_step": 29214, "epoch": 695} {"train_loss": -5.376767635345459, "global_step": 29215, "epoch": 695} {"train_loss": -5.39604377746582, "global_step": 29216, "epoch": 695} {"train_loss": -5.404587745666504, "global_step": 29217, "epoch": 695} {"train_loss": -5.5084075927734375, "global_step": 29218, "epoch": 695} {"train_loss": -5.358578681945801, "global_step": 29219, "epoch": 695} {"train_loss": -5.490597724914551, "global_step": 29220, "epoch": 695} {"train_loss": -5.481388568878174, "global_step": 29221, "epoch": 695} {"train_loss": -5.425993919372559, "global_step": 29222, "epoch": 695} {"train_loss": -5.519128322601318, "global_step": 29223, "epoch": 695} {"train_loss": -5.489843368530273, "global_step": 29224, "epoch": 695} {"train_loss": -5.562933444976807, "global_step": 29225, "epoch": 695} {"train_loss": -5.465176582336426, "global_step": 29226, "epoch": 695} {"train_loss": -5.427834510803223, "global_step": 29227, "epoch": 695} {"train_loss": -5.445889472961426, "global_step": 29228, "epoch": 695} {"train_loss": -5.398052215576172, "global_step": 29229, "epoch": 695} {"train_loss": -5.606239318847656, "global_step": 29230, "epoch": 695} {"train_loss": -5.444812922250657, "global_step": 29231, "epoch": 695, "val_loss": 63725.97265625} {"train_loss": -5.5191802978515625, "global_step": 29232, "epoch": 696} {"train_loss": -5.441549301147461, "global_step": 29233, "epoch": 696} {"train_loss": -5.509343147277832, "global_step": 29234, "epoch": 696} {"train_loss": -5.606505393981934, "global_step": 29235, "epoch": 696} {"train_loss": -5.450496196746826, "global_step": 29236, "epoch": 696} {"train_loss": -5.485084056854248, "global_step": 29237, "epoch": 696} {"train_loss": -5.430350303649902, "global_step": 29238, "epoch": 696} {"train_loss": -5.517794132232666, "global_step": 29239, "epoch": 696} {"train_loss": -5.6115522384643555, "global_step": 29240, "epoch": 696} {"train_loss": -5.4147114753723145, "global_step": 29241, "epoch": 696} {"train_loss": -5.476149559020996, "global_step": 29242, "epoch": 696} {"train_loss": -5.4238128662109375, "global_step": 29243, "epoch": 696} {"train_loss": -5.460563659667969, "global_step": 29244, "epoch": 696} {"train_loss": -5.466978073120117, "global_step": 29245, "epoch": 696} {"train_loss": -5.313243389129639, "global_step": 29246, "epoch": 696} {"train_loss": -5.304619789123535, "global_step": 29247, "epoch": 696} {"train_loss": -5.512529373168945, "global_step": 29248, "epoch": 696} {"train_loss": -5.4321513175964355, "global_step": 29249, "epoch": 696} {"train_loss": -5.417328834533691, "global_step": 29250, "epoch": 696} {"train_loss": -5.4416913986206055, "global_step": 29251, "epoch": 696} {"train_loss": -5.434873580932617, "global_step": 29252, "epoch": 696} {"train_loss": -5.490010738372803, "global_step": 29253, "epoch": 696} {"train_loss": -5.4176740646362305, "global_step": 29254, "epoch": 696} {"train_loss": -5.593222618103027, "global_step": 29255, "epoch": 696} {"train_loss": -5.4373297691345215, "global_step": 29256, "epoch": 696} {"train_loss": -5.366746425628662, "global_step": 29257, "epoch": 696} {"train_loss": -5.645811080932617, "global_step": 29258, "epoch": 696} {"train_loss": -5.257194519042969, "global_step": 29259, "epoch": 696} {"train_loss": -5.45054292678833, "global_step": 29260, "epoch": 696} {"train_loss": -5.613554000854492, "global_step": 29261, "epoch": 696} {"train_loss": -5.484866142272949, "global_step": 29262, "epoch": 696} {"train_loss": -5.423454284667969, "global_step": 29263, "epoch": 696} {"train_loss": -5.463257789611816, "global_step": 29264, "epoch": 696} {"train_loss": -5.418451309204102, "global_step": 29265, "epoch": 696} {"train_loss": -5.374586582183838, "global_step": 29266, "epoch": 696} {"train_loss": -5.527769565582275, "global_step": 29267, "epoch": 696} {"train_loss": -5.5698347091674805, "global_step": 29268, "epoch": 696} {"train_loss": -5.608160495758057, "global_step": 29269, "epoch": 696} {"train_loss": -5.439831733703613, "global_step": 29270, "epoch": 696} {"train_loss": -5.5293684005737305, "global_step": 29271, "epoch": 696} {"train_loss": -5.465756893157959, "global_step": 29272, "epoch": 696} {"train_loss": -5.466874031793504, "global_step": 29273, "epoch": 696, "val_loss": 63835.75} {"train_loss": -5.6166534423828125, "global_step": 29274, "epoch": 697} {"train_loss": -5.587822914123535, "global_step": 29275, "epoch": 697} {"train_loss": -5.4455461502075195, "global_step": 29276, "epoch": 697} {"train_loss": -5.4371819496154785, "global_step": 29277, "epoch": 697} {"train_loss": -5.45099401473999, "global_step": 29278, "epoch": 697} {"train_loss": -5.390966415405273, "global_step": 29279, "epoch": 697} {"train_loss": -5.561505317687988, "global_step": 29280, "epoch": 697} {"train_loss": -5.525075912475586, "global_step": 29281, "epoch": 697} {"train_loss": -5.380343437194824, "global_step": 29282, "epoch": 697} {"train_loss": -5.42597770690918, "global_step": 29283, "epoch": 697} {"train_loss": -5.516120910644531, "global_step": 29284, "epoch": 697} {"train_loss": -5.460651397705078, "global_step": 29285, "epoch": 697} {"train_loss": -5.452179908752441, "global_step": 29286, "epoch": 697} {"train_loss": -5.489749908447266, "global_step": 29287, "epoch": 697} {"train_loss": -5.5235185623168945, "global_step": 29288, "epoch": 697} {"train_loss": -5.510068893432617, "global_step": 29289, "epoch": 697} {"train_loss": -5.458144664764404, "global_step": 29290, "epoch": 697} {"train_loss": -5.378167629241943, "global_step": 29291, "epoch": 697} {"train_loss": -5.470525741577148, "global_step": 29292, "epoch": 697} {"train_loss": -5.462085723876953, "global_step": 29293, "epoch": 697} {"train_loss": -5.5111165046691895, "global_step": 29294, "epoch": 697} {"train_loss": -5.410557746887207, "global_step": 29295, "epoch": 697} {"train_loss": -5.393754959106445, "global_step": 29296, "epoch": 697} {"train_loss": -5.482497215270996, "global_step": 29297, "epoch": 697} {"train_loss": -5.458686351776123, "global_step": 29298, "epoch": 697} {"train_loss": -5.529057502746582, "global_step": 29299, "epoch": 697} {"train_loss": -5.413448810577393, "global_step": 29300, "epoch": 697} {"train_loss": -5.485170364379883, "global_step": 29301, "epoch": 697} {"train_loss": -5.5289306640625, "global_step": 29302, "epoch": 697} {"train_loss": -5.480930328369141, "global_step": 29303, "epoch": 697} {"train_loss": -5.4063615798950195, "global_step": 29304, "epoch": 697} {"train_loss": -5.466705322265625, "global_step": 29305, "epoch": 697} {"train_loss": -5.515907287597656, "global_step": 29306, "epoch": 697} {"train_loss": -5.351517677307129, "global_step": 29307, "epoch": 697} {"train_loss": -5.520564079284668, "global_step": 29308, "epoch": 697} {"train_loss": -5.4742431640625, "global_step": 29309, "epoch": 697} {"train_loss": -5.502342224121094, "global_step": 29310, "epoch": 697} {"train_loss": -5.283673286437988, "global_step": 29311, "epoch": 697} {"train_loss": -5.457065105438232, "global_step": 29312, "epoch": 697} {"train_loss": -5.401464462280273, "global_step": 29313, "epoch": 697} {"train_loss": -5.364750862121582, "global_step": 29314, "epoch": 697} {"train_loss": -5.458598193668184, "global_step": 29315, "epoch": 697, "val_loss": 64089.09375} {"train_loss": -5.3851752281188965, "global_step": 29316, "epoch": 698} {"train_loss": -5.387186050415039, "global_step": 29317, "epoch": 698} {"train_loss": -5.484816551208496, "global_step": 29318, "epoch": 698} {"train_loss": -5.448068141937256, "global_step": 29319, "epoch": 698} {"train_loss": -5.354893207550049, "global_step": 29320, "epoch": 698} {"train_loss": -5.4708967208862305, "global_step": 29321, "epoch": 698} {"train_loss": -5.388781547546387, "global_step": 29322, "epoch": 698} {"train_loss": -5.430882453918457, "global_step": 29323, "epoch": 698} {"train_loss": -5.343527317047119, "global_step": 29324, "epoch": 698} {"train_loss": -5.235163688659668, "global_step": 29325, "epoch": 698} {"train_loss": -5.566194534301758, "global_step": 29326, "epoch": 698} {"train_loss": -5.471212387084961, "global_step": 29327, "epoch": 698} {"train_loss": -5.533636093139648, "global_step": 29328, "epoch": 698} {"train_loss": -5.393424987792969, "global_step": 29329, "epoch": 698} {"train_loss": -5.3803253173828125, "global_step": 29330, "epoch": 698} {"train_loss": -5.448834419250488, "global_step": 29331, "epoch": 698} {"train_loss": -5.4762349128723145, "global_step": 29332, "epoch": 698} {"train_loss": -5.539910793304443, "global_step": 29333, "epoch": 698} {"train_loss": -5.452864170074463, "global_step": 29334, "epoch": 698} {"train_loss": -5.527355194091797, "global_step": 29335, "epoch": 698} {"train_loss": -5.536929130554199, "global_step": 29336, "epoch": 698} {"train_loss": -5.345671653747559, "global_step": 29337, "epoch": 698} {"train_loss": -5.50615930557251, "global_step": 29338, "epoch": 698} {"train_loss": -5.396781921386719, "global_step": 29339, "epoch": 698} {"train_loss": -5.339085578918457, "global_step": 29340, "epoch": 698} {"train_loss": -5.33696985244751, "global_step": 29341, "epoch": 698} {"train_loss": -5.444573879241943, "global_step": 29342, "epoch": 698} {"train_loss": -5.545861721038818, "global_step": 29343, "epoch": 698} {"train_loss": -5.440432071685791, "global_step": 29344, "epoch": 698} {"train_loss": -5.410586833953857, "global_step": 29345, "epoch": 698} {"train_loss": -5.473443031311035, "global_step": 29346, "epoch": 698} {"train_loss": -5.433342933654785, "global_step": 29347, "epoch": 698} {"train_loss": -5.430735111236572, "global_step": 29348, "epoch": 698} {"train_loss": -5.379454612731934, "global_step": 29349, "epoch": 698} {"train_loss": -5.540571212768555, "global_step": 29350, "epoch": 698} {"train_loss": -5.530742168426514, "global_step": 29351, "epoch": 698} {"train_loss": -5.545388221740723, "global_step": 29352, "epoch": 698} {"train_loss": -5.562424182891846, "global_step": 29353, "epoch": 698} {"train_loss": -5.4755964279174805, "global_step": 29354, "epoch": 698} {"train_loss": -5.476555824279785, "global_step": 29355, "epoch": 698} {"train_loss": -5.429741382598877, "global_step": 29356, "epoch": 698} {"train_loss": -5.444428670974005, "global_step": 29357, "epoch": 698, "val_loss": 63850.015625} {"train_loss": -5.493112564086914, "global_step": 29358, "epoch": 699} {"train_loss": -5.425260543823242, "global_step": 29359, "epoch": 699} {"train_loss": -5.4149394035339355, "global_step": 29360, "epoch": 699} {"train_loss": -5.477330684661865, "global_step": 29361, "epoch": 699} {"train_loss": -5.325655460357666, "global_step": 29362, "epoch": 699} {"train_loss": -5.391797065734863, "global_step": 29363, "epoch": 699} {"train_loss": -5.491857051849365, "global_step": 29364, "epoch": 699} {"train_loss": -5.512337684631348, "global_step": 29365, "epoch": 699} {"train_loss": -5.26151180267334, "global_step": 29366, "epoch": 699} {"train_loss": -5.582674980163574, "global_step": 29367, "epoch": 699} {"train_loss": -5.543549537658691, "global_step": 29368, "epoch": 699} {"train_loss": -5.447610855102539, "global_step": 29369, "epoch": 699} {"train_loss": -5.575498104095459, "global_step": 29370, "epoch": 699} {"train_loss": -5.468099594116211, "global_step": 29371, "epoch": 699} {"train_loss": -5.391180515289307, "global_step": 29372, "epoch": 699} {"train_loss": -5.525008201599121, "global_step": 29373, "epoch": 699} {"train_loss": -5.516247749328613, "global_step": 29374, "epoch": 699} {"train_loss": -5.385945796966553, "global_step": 29375, "epoch": 699} {"train_loss": -5.478527545928955, "global_step": 29376, "epoch": 699} {"train_loss": -5.397769451141357, "global_step": 29377, "epoch": 699} {"train_loss": -5.405390739440918, "global_step": 29378, "epoch": 699} {"train_loss": -5.509629249572754, "global_step": 29379, "epoch": 699} {"train_loss": -5.3940958976745605, "global_step": 29380, "epoch": 699} {"train_loss": -5.458400249481201, "global_step": 29381, "epoch": 699} {"train_loss": -5.517562389373779, "global_step": 29382, "epoch": 699} {"train_loss": -5.375950813293457, "global_step": 29383, "epoch": 699} {"train_loss": -5.562702178955078, "global_step": 29384, "epoch": 699} {"train_loss": -5.420031547546387, "global_step": 29385, "epoch": 699} {"train_loss": -5.409549713134766, "global_step": 29386, "epoch": 699} {"train_loss": -5.4884772300720215, "global_step": 29387, "epoch": 699} {"train_loss": -5.5472235679626465, "global_step": 29388, "epoch": 699} {"train_loss": -5.413840293884277, "global_step": 29389, "epoch": 699} {"train_loss": -5.455460071563721, "global_step": 29390, "epoch": 699} {"train_loss": -5.544192790985107, "global_step": 29391, "epoch": 699} {"train_loss": -5.554558277130127, "global_step": 29392, "epoch": 699} {"train_loss": -5.5594892501831055, "global_step": 29393, "epoch": 699} {"train_loss": -5.342580795288086, "global_step": 29394, "epoch": 699} {"train_loss": -5.4861650466918945, "global_step": 29395, "epoch": 699} {"train_loss": -5.406550884246826, "global_step": 29396, "epoch": 699} {"train_loss": -5.474360942840576, "global_step": 29397, "epoch": 699} {"train_loss": -5.4209394454956055, "global_step": 29398, "epoch": 699} {"train_loss": -5.457854429880778, "global_step": 29399, "epoch": 699, "val_loss": 63975.23046875} {"train_loss": -5.284977912902832, "global_step": 29400, "epoch": 700} {"train_loss": -5.501501560211182, "global_step": 29401, "epoch": 700} {"train_loss": -5.484449863433838, "global_step": 29402, "epoch": 700} {"train_loss": -5.3301849365234375, "global_step": 29403, "epoch": 700} {"train_loss": -5.520320415496826, "global_step": 29404, "epoch": 700} {"train_loss": -5.416777610778809, "global_step": 29405, "epoch": 700} {"train_loss": -5.324491500854492, "global_step": 29406, "epoch": 700} {"train_loss": -5.478268146514893, "global_step": 29407, "epoch": 700} {"train_loss": -5.431035995483398, "global_step": 29408, "epoch": 700} {"train_loss": -5.482524871826172, "global_step": 29409, "epoch": 700} {"train_loss": -5.407390594482422, "global_step": 29410, "epoch": 700} {"train_loss": -5.512042045593262, "global_step": 29411, "epoch": 700} {"train_loss": -5.469432353973389, "global_step": 29412, "epoch": 700} {"train_loss": -5.4008588790893555, "global_step": 29413, "epoch": 700} {"train_loss": -5.4678473472595215, "global_step": 29414, "epoch": 700} {"train_loss": -5.477633476257324, "global_step": 29415, "epoch": 700} {"train_loss": -5.472733497619629, "global_step": 29416, "epoch": 700} {"train_loss": -5.52659273147583, "global_step": 29417, "epoch": 700} {"train_loss": -5.524443626403809, "global_step": 29418, "epoch": 700} {"train_loss": -5.577641487121582, "global_step": 29419, "epoch": 700} {"train_loss": -5.3717122077941895, "global_step": 29420, "epoch": 700} {"train_loss": -5.423065662384033, "global_step": 29421, "epoch": 700} {"train_loss": -5.536918640136719, "global_step": 29422, "epoch": 700} {"train_loss": -5.377246856689453, "global_step": 29423, "epoch": 700} {"train_loss": -5.479988098144531, "global_step": 29424, "epoch": 700} {"train_loss": -5.405107498168945, "global_step": 29425, "epoch": 700} {"train_loss": -5.375948905944824, "global_step": 29426, "epoch": 700} {"train_loss": -5.4563679695129395, "global_step": 29427, "epoch": 700} {"train_loss": -5.3210225105285645, "global_step": 29428, "epoch": 700} {"train_loss": -5.479285717010498, "global_step": 29429, "epoch": 700} {"train_loss": -5.480673313140869, "global_step": 29430, "epoch": 700} {"train_loss": -5.470861911773682, "global_step": 29431, "epoch": 700} {"train_loss": -5.383144855499268, "global_step": 29432, "epoch": 700} {"train_loss": -5.491653919219971, "global_step": 29433, "epoch": 700} {"train_loss": -5.469334602355957, "global_step": 29434, "epoch": 700} {"train_loss": -5.482691764831543, "global_step": 29435, "epoch": 700} {"train_loss": -5.496420383453369, "global_step": 29436, "epoch": 700} {"train_loss": -5.545406341552734, "global_step": 29437, "epoch": 700} {"train_loss": -5.334010124206543, "global_step": 29438, "epoch": 700} {"train_loss": -5.500653266906738, "global_step": 29439, "epoch": 700} {"train_loss": -5.584098815917969, "global_step": 29440, "epoch": 700} {"train_loss": -5.454535257248652, "global_step": 29441, "epoch": 700, "train/sim_max_reward_0": 0.5795489323713581, "train/sim_max_reward_1": 0.21074763419040607, "train/sim_max_reward_2": 0.14284055500467788, "train/sim_max_reward_3": 0.3071681267826772, "train/sim_max_reward_4": 0.926051713869228, "train/sim_max_reward_5": 0.8860273774176226, "test/sim_max_reward_4300000": 0.25424063916200723, "test/sim_max_reward_4300001": 0.2833187041885098, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.5264872973053449, "test/sim_max_reward_4300004": 0.11491224159273251, "test/sim_max_reward_4300005": 0.48763197282505183, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.04552410958929821, "test/sim_max_reward_4300008": 0.8853586698834075, "test/sim_max_reward_4300009": 0.6472593311508767, "test/sim_max_reward_4300010": 0.4701129908615904, "test/sim_max_reward_4300011": 0.8494218958923001, "test/sim_max_reward_4300012": 0.9300514646966673, "test/sim_max_reward_4300013": 0.3944953224944173, "test/sim_max_reward_4300014": 0.47248113524104957, "test/sim_max_reward_4300015": 0.24797638775528857, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.4079586268930027, "test/sim_max_reward_4300018": 0.6057748981286153, "test/sim_max_reward_4300019": 0.18586157527147085, "test/sim_max_reward_4300020": 0.02999079805574855, "test/sim_max_reward_4300021": 0.46241127623215306, "test/sim_max_reward_4300022": 0.23185730490412743, "test/sim_max_reward_4300023": 0.34242371234903624, "test/sim_max_reward_4300024": 0.4906902071564744, "test/sim_max_reward_4300025": 0.16195769313964947, "test/sim_max_reward_4300026": 0.19098110225497242, "test/sim_max_reward_4300027": 0.0019207765700590752, "test/sim_max_reward_4300028": 0.0020832658135955338, "test/sim_max_reward_4300029": 0.20758208064773978, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.00814537682613156, "test/sim_max_reward_4300032": 0.5888282949517171, "test/sim_max_reward_4300033": 0.40336445955922406, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8114469093923745, "test/sim_max_reward_4300038": 0.49022241173342446, "test/sim_max_reward_4300039": 0.5006973148783394, "test/sim_max_reward_4300040": 0.2493320331731271, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.6731947824285102, "test/sim_max_reward_4300043": 0.21024745172708037, "test/sim_max_reward_4300044": 0.04345707006804553, "test/sim_max_reward_4300045": 0.1763579764115077, "test/sim_max_reward_4300046": 0.02831479959922337, "test/sim_max_reward_4300047": 0.5860054314758356, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.5087307232726617, "test/mean_score": 0.30147220548668885, "val_loss": 63441.83984375} {"train_loss": -5.55928897857666, "global_step": 29442, "epoch": 701} {"train_loss": -5.419286251068115, "global_step": 29443, "epoch": 701} {"train_loss": -5.384671211242676, "global_step": 29444, "epoch": 701} {"train_loss": -5.4579925537109375, "global_step": 29445, "epoch": 701} {"train_loss": -5.470407009124756, "global_step": 29446, "epoch": 701} {"train_loss": -5.505449295043945, "global_step": 29447, "epoch": 701} {"train_loss": -5.403786659240723, "global_step": 29448, "epoch": 701} {"train_loss": -5.413874626159668, "global_step": 29449, "epoch": 701} {"train_loss": -5.461555004119873, "global_step": 29450, "epoch": 701} {"train_loss": -5.346960067749023, "global_step": 29451, "epoch": 701} {"train_loss": -5.3037848472595215, "global_step": 29452, "epoch": 701} {"train_loss": -5.503654479980469, "global_step": 29453, "epoch": 701} {"train_loss": -5.447748184204102, "global_step": 29454, "epoch": 701} {"train_loss": -5.366013050079346, "global_step": 29455, "epoch": 701} {"train_loss": -5.465461730957031, "global_step": 29456, "epoch": 701} {"train_loss": -5.4862260818481445, "global_step": 29457, "epoch": 701} {"train_loss": -5.372533321380615, "global_step": 29458, "epoch": 701} {"train_loss": -5.410891056060791, "global_step": 29459, "epoch": 701} {"train_loss": -5.509212493896484, "global_step": 29460, "epoch": 701} {"train_loss": -5.412434101104736, "global_step": 29461, "epoch": 701} {"train_loss": -5.345490455627441, "global_step": 29462, "epoch": 701} {"train_loss": -5.464250564575195, "global_step": 29463, "epoch": 701} {"train_loss": -5.395475387573242, "global_step": 29464, "epoch": 701} {"train_loss": -5.6139936447143555, "global_step": 29465, "epoch": 701} {"train_loss": -5.42616081237793, "global_step": 29466, "epoch": 701} {"train_loss": -5.469783306121826, "global_step": 29467, "epoch": 701} {"train_loss": -5.456345558166504, "global_step": 29468, "epoch": 701} {"train_loss": -5.440704822540283, "global_step": 29469, "epoch": 701} {"train_loss": -5.481492042541504, "global_step": 29470, "epoch": 701} {"train_loss": -5.477324962615967, "global_step": 29471, "epoch": 701} {"train_loss": -5.522261619567871, "global_step": 29472, "epoch": 701} {"train_loss": -5.537515163421631, "global_step": 29473, "epoch": 701} {"train_loss": -5.435186386108398, "global_step": 29474, "epoch": 701} {"train_loss": -5.550310134887695, "global_step": 29475, "epoch": 701} {"train_loss": -5.403592109680176, "global_step": 29476, "epoch": 701} {"train_loss": -5.489931583404541, "global_step": 29477, "epoch": 701} {"train_loss": -5.47524356842041, "global_step": 29478, "epoch": 701} {"train_loss": -5.48008918762207, "global_step": 29479, "epoch": 701} {"train_loss": -5.523263454437256, "global_step": 29480, "epoch": 701} {"train_loss": -5.447164535522461, "global_step": 29481, "epoch": 701} {"train_loss": -5.518926620483398, "global_step": 29482, "epoch": 701} {"train_loss": -5.453971192950294, "global_step": 29483, "epoch": 701, "val_loss": 63442.33984375} {"train_loss": -5.3943376541137695, "global_step": 29484, "epoch": 702} {"train_loss": -5.359694004058838, "global_step": 29485, "epoch": 702} {"train_loss": -5.412618637084961, "global_step": 29486, "epoch": 702} {"train_loss": -5.532124996185303, "global_step": 29487, "epoch": 702} {"train_loss": -5.5886688232421875, "global_step": 29488, "epoch": 702} {"train_loss": -5.571563243865967, "global_step": 29489, "epoch": 702} {"train_loss": -5.497910976409912, "global_step": 29490, "epoch": 702} {"train_loss": -5.484488010406494, "global_step": 29491, "epoch": 702} {"train_loss": -5.467533111572266, "global_step": 29492, "epoch": 702} {"train_loss": -5.421416282653809, "global_step": 29493, "epoch": 702} {"train_loss": -5.385804176330566, "global_step": 29494, "epoch": 702} {"train_loss": -5.308829307556152, "global_step": 29495, "epoch": 702} {"train_loss": -5.476299285888672, "global_step": 29496, "epoch": 702} {"train_loss": -5.546947002410889, "global_step": 29497, "epoch": 702} {"train_loss": -5.4665703773498535, "global_step": 29498, "epoch": 702} {"train_loss": -5.556540012359619, "global_step": 29499, "epoch": 702} {"train_loss": -5.41729736328125, "global_step": 29500, "epoch": 702} {"train_loss": -5.416181564331055, "global_step": 29501, "epoch": 702} {"train_loss": -5.430636405944824, "global_step": 29502, "epoch": 702} {"train_loss": -5.456202030181885, "global_step": 29503, "epoch": 702} {"train_loss": -5.352461814880371, "global_step": 29504, "epoch": 702} {"train_loss": -5.451669692993164, "global_step": 29505, "epoch": 702} {"train_loss": -5.476232051849365, "global_step": 29506, "epoch": 702} {"train_loss": -5.428711414337158, "global_step": 29507, "epoch": 702} {"train_loss": -5.497218132019043, "global_step": 29508, "epoch": 702} {"train_loss": -5.446468353271484, "global_step": 29509, "epoch": 702} {"train_loss": -5.52320671081543, "global_step": 29510, "epoch": 702} {"train_loss": -5.527681350708008, "global_step": 29511, "epoch": 702} {"train_loss": -5.517430782318115, "global_step": 29512, "epoch": 702} {"train_loss": -5.385676860809326, "global_step": 29513, "epoch": 702} {"train_loss": -5.457228660583496, "global_step": 29514, "epoch": 702} {"train_loss": -5.466036796569824, "global_step": 29515, "epoch": 702} {"train_loss": -5.477290630340576, "global_step": 29516, "epoch": 702} {"train_loss": -5.510504722595215, "global_step": 29517, "epoch": 702} {"train_loss": -5.457123279571533, "global_step": 29518, "epoch": 702} {"train_loss": -5.542562484741211, "global_step": 29519, "epoch": 702} {"train_loss": -5.453620910644531, "global_step": 29520, "epoch": 702} {"train_loss": -5.490650177001953, "global_step": 29521, "epoch": 702} {"train_loss": -5.375077247619629, "global_step": 29522, "epoch": 702} {"train_loss": -5.393206596374512, "global_step": 29523, "epoch": 702} {"train_loss": -5.451434135437012, "global_step": 29524, "epoch": 702} {"train_loss": -5.461422863460722, "global_step": 29525, "epoch": 702, "val_loss": 63579.6328125} {"train_loss": -5.468473434448242, "global_step": 29526, "epoch": 703} {"train_loss": -5.498166084289551, "global_step": 29527, "epoch": 703} {"train_loss": -5.521056175231934, "global_step": 29528, "epoch": 703} {"train_loss": -5.441648483276367, "global_step": 29529, "epoch": 703} {"train_loss": -5.4842209815979, "global_step": 29530, "epoch": 703} {"train_loss": -5.484869003295898, "global_step": 29531, "epoch": 703} {"train_loss": -5.314094543457031, "global_step": 29532, "epoch": 703} {"train_loss": -5.518707752227783, "global_step": 29533, "epoch": 703} {"train_loss": -5.396533966064453, "global_step": 29534, "epoch": 703} {"train_loss": -5.599872589111328, "global_step": 29535, "epoch": 703} {"train_loss": -5.370616912841797, "global_step": 29536, "epoch": 703} {"train_loss": -5.458374977111816, "global_step": 29537, "epoch": 703} {"train_loss": -5.549855709075928, "global_step": 29538, "epoch": 703} {"train_loss": -5.397912979125977, "global_step": 29539, "epoch": 703} {"train_loss": -5.495025634765625, "global_step": 29540, "epoch": 703} {"train_loss": -5.531936168670654, "global_step": 29541, "epoch": 703} {"train_loss": -5.470862865447998, "global_step": 29542, "epoch": 703} {"train_loss": -5.5749921798706055, "global_step": 29543, "epoch": 703} {"train_loss": -5.514822006225586, "global_step": 29544, "epoch": 703} {"train_loss": -5.506656646728516, "global_step": 29545, "epoch": 703} {"train_loss": -5.394172191619873, "global_step": 29546, "epoch": 703} {"train_loss": -5.482829570770264, "global_step": 29547, "epoch": 703} {"train_loss": -5.549343109130859, "global_step": 29548, "epoch": 703} {"train_loss": -5.529488563537598, "global_step": 29549, "epoch": 703} {"train_loss": -5.454946517944336, "global_step": 29550, "epoch": 703} {"train_loss": -5.554482460021973, "global_step": 29551, "epoch": 703} {"train_loss": -5.4735002517700195, "global_step": 29552, "epoch": 703} {"train_loss": -5.281359672546387, "global_step": 29553, "epoch": 703} {"train_loss": -5.5259552001953125, "global_step": 29554, "epoch": 703} {"train_loss": -5.5115556716918945, "global_step": 29555, "epoch": 703} {"train_loss": -5.277116298675537, "global_step": 29556, "epoch": 703} {"train_loss": -5.552396774291992, "global_step": 29557, "epoch": 703} {"train_loss": -5.511573314666748, "global_step": 29558, "epoch": 703} {"train_loss": -5.318748474121094, "global_step": 29559, "epoch": 703} {"train_loss": -5.5305585861206055, "global_step": 29560, "epoch": 703} {"train_loss": -5.36822509765625, "global_step": 29561, "epoch": 703} {"train_loss": -5.42222785949707, "global_step": 29562, "epoch": 703} {"train_loss": -5.425543785095215, "global_step": 29563, "epoch": 703} {"train_loss": -5.222120761871338, "global_step": 29564, "epoch": 703} {"train_loss": -5.579894542694092, "global_step": 29565, "epoch": 703} {"train_loss": -5.394269943237305, "global_step": 29566, "epoch": 703} {"train_loss": -5.462381737572806, "global_step": 29567, "epoch": 703, "val_loss": 63353.38671875} {"train_loss": -5.466634750366211, "global_step": 29568, "epoch": 704} {"train_loss": -5.4685845375061035, "global_step": 29569, "epoch": 704} {"train_loss": -5.461939811706543, "global_step": 29570, "epoch": 704} {"train_loss": -5.5040082931518555, "global_step": 29571, "epoch": 704} {"train_loss": -5.398825645446777, "global_step": 29572, "epoch": 704} {"train_loss": -5.357511520385742, "global_step": 29573, "epoch": 704} {"train_loss": -5.428971290588379, "global_step": 29574, "epoch": 704} {"train_loss": -5.446368217468262, "global_step": 29575, "epoch": 704} {"train_loss": -5.535297393798828, "global_step": 29576, "epoch": 704} {"train_loss": -5.4589009284973145, "global_step": 29577, "epoch": 704} {"train_loss": -5.459427356719971, "global_step": 29578, "epoch": 704} {"train_loss": -5.419244766235352, "global_step": 29579, "epoch": 704} {"train_loss": -5.424806594848633, "global_step": 29580, "epoch": 704} {"train_loss": -5.4817633628845215, "global_step": 29581, "epoch": 704} {"train_loss": -5.462661266326904, "global_step": 29582, "epoch": 704} {"train_loss": -5.352499961853027, "global_step": 29583, "epoch": 704} {"train_loss": -5.4242963790893555, "global_step": 29584, "epoch": 704} {"train_loss": -5.568658828735352, "global_step": 29585, "epoch": 704} {"train_loss": -5.512042999267578, "global_step": 29586, "epoch": 704} {"train_loss": -5.505572319030762, "global_step": 29587, "epoch": 704} {"train_loss": -5.430893898010254, "global_step": 29588, "epoch": 704} {"train_loss": -5.516478538513184, "global_step": 29589, "epoch": 704} {"train_loss": -5.54004430770874, "global_step": 29590, "epoch": 704} {"train_loss": -5.531614780426025, "global_step": 29591, "epoch": 704} {"train_loss": -5.441588401794434, "global_step": 29592, "epoch": 704} {"train_loss": -5.375213623046875, "global_step": 29593, "epoch": 704} {"train_loss": -5.489162921905518, "global_step": 29594, "epoch": 704} {"train_loss": -5.362771987915039, "global_step": 29595, "epoch": 704} {"train_loss": -5.459573745727539, "global_step": 29596, "epoch": 704} {"train_loss": -5.467350006103516, "global_step": 29597, "epoch": 704} {"train_loss": -5.42182731628418, "global_step": 29598, "epoch": 704} {"train_loss": -5.513645648956299, "global_step": 29599, "epoch": 704} {"train_loss": -5.4385223388671875, "global_step": 29600, "epoch": 704} {"train_loss": -5.461394309997559, "global_step": 29601, "epoch": 704} {"train_loss": -5.581716060638428, "global_step": 29602, "epoch": 704} {"train_loss": -5.6802873611450195, "global_step": 29603, "epoch": 704} {"train_loss": -5.4380035400390625, "global_step": 29604, "epoch": 704} {"train_loss": -5.536953926086426, "global_step": 29605, "epoch": 704} {"train_loss": -5.519815444946289, "global_step": 29606, "epoch": 704} {"train_loss": -5.576452255249023, "global_step": 29607, "epoch": 704} {"train_loss": -5.533731460571289, "global_step": 29608, "epoch": 704} {"train_loss": -5.474956149146671, "global_step": 29609, "epoch": 704, "val_loss": 63616.05078125} {"train_loss": -5.522076606750488, "global_step": 29610, "epoch": 705} {"train_loss": -5.551321029663086, "global_step": 29611, "epoch": 705} {"train_loss": -5.39796781539917, "global_step": 29612, "epoch": 705} {"train_loss": -5.498462200164795, "global_step": 29613, "epoch": 705} {"train_loss": -5.4381866455078125, "global_step": 29614, "epoch": 705} {"train_loss": -5.498093605041504, "global_step": 29615, "epoch": 705} {"train_loss": -5.502038955688477, "global_step": 29616, "epoch": 705} {"train_loss": -5.31932258605957, "global_step": 29617, "epoch": 705} {"train_loss": -5.4099836349487305, "global_step": 29618, "epoch": 705} {"train_loss": -5.443005561828613, "global_step": 29619, "epoch": 705} {"train_loss": -5.3990936279296875, "global_step": 29620, "epoch": 705} {"train_loss": -5.471741676330566, "global_step": 29621, "epoch": 705} {"train_loss": -5.51975154876709, "global_step": 29622, "epoch": 705} {"train_loss": -5.395229816436768, "global_step": 29623, "epoch": 705} {"train_loss": -5.483595848083496, "global_step": 29624, "epoch": 705} {"train_loss": -5.506171226501465, "global_step": 29625, "epoch": 705} {"train_loss": -5.374600410461426, "global_step": 29626, "epoch": 705} {"train_loss": -5.413468360900879, "global_step": 29627, "epoch": 705} {"train_loss": -5.407871246337891, "global_step": 29628, "epoch": 705} {"train_loss": -5.577700138092041, "global_step": 29629, "epoch": 705} {"train_loss": -5.564062118530273, "global_step": 29630, "epoch": 705} {"train_loss": -5.437339782714844, "global_step": 29631, "epoch": 705} {"train_loss": -5.457317352294922, "global_step": 29632, "epoch": 705} {"train_loss": -5.366870880126953, "global_step": 29633, "epoch": 705} {"train_loss": -5.413614273071289, "global_step": 29634, "epoch": 705} {"train_loss": -5.426302909851074, "global_step": 29635, "epoch": 705} {"train_loss": -5.39088249206543, "global_step": 29636, "epoch": 705} {"train_loss": -5.457930564880371, "global_step": 29637, "epoch": 705} {"train_loss": -5.4073333740234375, "global_step": 29638, "epoch": 705} {"train_loss": -5.559205055236816, "global_step": 29639, "epoch": 705} {"train_loss": -5.582680702209473, "global_step": 29640, "epoch": 705} {"train_loss": -5.533506393432617, "global_step": 29641, "epoch": 705} {"train_loss": -5.4583539962768555, "global_step": 29642, "epoch": 705} {"train_loss": -5.487010955810547, "global_step": 29643, "epoch": 705} {"train_loss": -5.499792098999023, "global_step": 29644, "epoch": 705} {"train_loss": -5.450049877166748, "global_step": 29645, "epoch": 705} {"train_loss": -5.448875427246094, "global_step": 29646, "epoch": 705} {"train_loss": -5.436264991760254, "global_step": 29647, "epoch": 705} {"train_loss": -5.391087532043457, "global_step": 29648, "epoch": 705} {"train_loss": -5.531444072723389, "global_step": 29649, "epoch": 705} {"train_loss": -5.450239181518555, "global_step": 29650, "epoch": 705} {"train_loss": -5.462471507844471, "global_step": 29651, "epoch": 705, "val_loss": 63172.015625} {"train_loss": -5.418668746948242, "global_step": 29652, "epoch": 706} {"train_loss": -5.486660480499268, "global_step": 29653, "epoch": 706} {"train_loss": -5.5996809005737305, "global_step": 29654, "epoch": 706} {"train_loss": -5.591277599334717, "global_step": 29655, "epoch": 706} {"train_loss": -5.460531234741211, "global_step": 29656, "epoch": 706} {"train_loss": -5.515627861022949, "global_step": 29657, "epoch": 706} {"train_loss": -5.446981906890869, "global_step": 29658, "epoch": 706} {"train_loss": -5.428757667541504, "global_step": 29659, "epoch": 706} {"train_loss": -5.474115371704102, "global_step": 29660, "epoch": 706} {"train_loss": -5.541930198669434, "global_step": 29661, "epoch": 706} {"train_loss": -5.350202560424805, "global_step": 29662, "epoch": 706} {"train_loss": -5.475231170654297, "global_step": 29663, "epoch": 706} {"train_loss": -5.59321403503418, "global_step": 29664, "epoch": 706} {"train_loss": -5.635268211364746, "global_step": 29665, "epoch": 706} {"train_loss": -5.572765350341797, "global_step": 29666, "epoch": 706} {"train_loss": -5.287509918212891, "global_step": 29667, "epoch": 706} {"train_loss": -5.436954021453857, "global_step": 29668, "epoch": 706} {"train_loss": -5.5177788734436035, "global_step": 29669, "epoch": 706} {"train_loss": -5.306561470031738, "global_step": 29670, "epoch": 706} {"train_loss": -5.521564960479736, "global_step": 29671, "epoch": 706} {"train_loss": -5.465692520141602, "global_step": 29672, "epoch": 706} {"train_loss": -5.451632976531982, "global_step": 29673, "epoch": 706} {"train_loss": -5.458376407623291, "global_step": 29674, "epoch": 706} {"train_loss": -5.526611328125, "global_step": 29675, "epoch": 706} {"train_loss": -5.506165504455566, "global_step": 29676, "epoch": 706} {"train_loss": -5.454438209533691, "global_step": 29677, "epoch": 706} {"train_loss": -5.568150997161865, "global_step": 29678, "epoch": 706} {"train_loss": -5.566245079040527, "global_step": 29679, "epoch": 706} {"train_loss": -5.411841869354248, "global_step": 29680, "epoch": 706} {"train_loss": -5.29794979095459, "global_step": 29681, "epoch": 706} {"train_loss": -5.491055011749268, "global_step": 29682, "epoch": 706} {"train_loss": -5.324826240539551, "global_step": 29683, "epoch": 706} {"train_loss": -5.434347152709961, "global_step": 29684, "epoch": 706} {"train_loss": -5.573945045471191, "global_step": 29685, "epoch": 706} {"train_loss": -5.426832675933838, "global_step": 29686, "epoch": 706} {"train_loss": -5.4269561767578125, "global_step": 29687, "epoch": 706} {"train_loss": -5.3626389503479, "global_step": 29688, "epoch": 706} {"train_loss": -5.429028511047363, "global_step": 29689, "epoch": 706} {"train_loss": -5.450845718383789, "global_step": 29690, "epoch": 706} {"train_loss": -5.543432235717773, "global_step": 29691, "epoch": 706} {"train_loss": -5.322265625, "global_step": 29692, "epoch": 706} {"train_loss": -5.465801976975941, "global_step": 29693, "epoch": 706, "val_loss": 63605.2578125} {"train_loss": -5.3889641761779785, "global_step": 29694, "epoch": 707} {"train_loss": -5.516353607177734, "global_step": 29695, "epoch": 707} {"train_loss": -5.464173316955566, "global_step": 29696, "epoch": 707} {"train_loss": -5.465290546417236, "global_step": 29697, "epoch": 707} {"train_loss": -5.416598796844482, "global_step": 29698, "epoch": 707} {"train_loss": -5.521960735321045, "global_step": 29699, "epoch": 707} {"train_loss": -5.476430892944336, "global_step": 29700, "epoch": 707} {"train_loss": -5.374577522277832, "global_step": 29701, "epoch": 707} {"train_loss": -5.536708831787109, "global_step": 29702, "epoch": 707} {"train_loss": -5.3710174560546875, "global_step": 29703, "epoch": 707} {"train_loss": -5.445954322814941, "global_step": 29704, "epoch": 707} {"train_loss": -5.366449356079102, "global_step": 29705, "epoch": 707} {"train_loss": -5.333006858825684, "global_step": 29706, "epoch": 707} {"train_loss": -5.513106822967529, "global_step": 29707, "epoch": 707} {"train_loss": -5.295013427734375, "global_step": 29708, "epoch": 707} {"train_loss": -5.541186332702637, "global_step": 29709, "epoch": 707} {"train_loss": -5.470907688140869, "global_step": 29710, "epoch": 707} {"train_loss": -5.452147483825684, "global_step": 29711, "epoch": 707} {"train_loss": -5.4516682624816895, "global_step": 29712, "epoch": 707} {"train_loss": -5.575653076171875, "global_step": 29713, "epoch": 707} {"train_loss": -5.423413276672363, "global_step": 29714, "epoch": 707} {"train_loss": -5.492462158203125, "global_step": 29715, "epoch": 707} {"train_loss": -5.314530372619629, "global_step": 29716, "epoch": 707} {"train_loss": -5.537844181060791, "global_step": 29717, "epoch": 707} {"train_loss": -5.378777503967285, "global_step": 29718, "epoch": 707} {"train_loss": -5.446712970733643, "global_step": 29719, "epoch": 707} {"train_loss": -5.467912673950195, "global_step": 29720, "epoch": 707} {"train_loss": -5.607074737548828, "global_step": 29721, "epoch": 707} {"train_loss": -5.43857479095459, "global_step": 29722, "epoch": 707} {"train_loss": -5.536886215209961, "global_step": 29723, "epoch": 707} {"train_loss": -5.464964866638184, "global_step": 29724, "epoch": 707} {"train_loss": -5.458204746246338, "global_step": 29725, "epoch": 707} {"train_loss": -5.412644863128662, "global_step": 29726, "epoch": 707} {"train_loss": -5.511155128479004, "global_step": 29727, "epoch": 707} {"train_loss": -5.562460422515869, "global_step": 29728, "epoch": 707} {"train_loss": -5.411367416381836, "global_step": 29729, "epoch": 707} {"train_loss": -5.41909122467041, "global_step": 29730, "epoch": 707} {"train_loss": -5.492362022399902, "global_step": 29731, "epoch": 707} {"train_loss": -5.463033199310303, "global_step": 29732, "epoch": 707} {"train_loss": -5.296308517456055, "global_step": 29733, "epoch": 707} {"train_loss": -5.3694047927856445, "global_step": 29734, "epoch": 707} {"train_loss": -5.449411596570696, "global_step": 29735, "epoch": 707, "val_loss": 63956.66015625} {"train_loss": -5.41280460357666, "global_step": 29736, "epoch": 708} {"train_loss": -5.4474101066589355, "global_step": 29737, "epoch": 708} {"train_loss": -5.383234024047852, "global_step": 29738, "epoch": 708} {"train_loss": -5.326539993286133, "global_step": 29739, "epoch": 708} {"train_loss": -5.505185127258301, "global_step": 29740, "epoch": 708} {"train_loss": -5.282832622528076, "global_step": 29741, "epoch": 708} {"train_loss": -5.467341899871826, "global_step": 29742, "epoch": 708} {"train_loss": -5.43106746673584, "global_step": 29743, "epoch": 708} {"train_loss": -5.270103931427002, "global_step": 29744, "epoch": 708} {"train_loss": -5.4404497146606445, "global_step": 29745, "epoch": 708} {"train_loss": -5.443061828613281, "global_step": 29746, "epoch": 708} {"train_loss": -5.354939937591553, "global_step": 29747, "epoch": 708} {"train_loss": -5.349180221557617, "global_step": 29748, "epoch": 708} {"train_loss": -5.620673656463623, "global_step": 29749, "epoch": 708} {"train_loss": -5.452064514160156, "global_step": 29750, "epoch": 708} {"train_loss": -5.446992874145508, "global_step": 29751, "epoch": 708} {"train_loss": -5.365989685058594, "global_step": 29752, "epoch": 708} {"train_loss": -5.584691047668457, "global_step": 29753, "epoch": 708} {"train_loss": -5.384964942932129, "global_step": 29754, "epoch": 708} {"train_loss": -5.509634017944336, "global_step": 29755, "epoch": 708} {"train_loss": -5.49675178527832, "global_step": 29756, "epoch": 708} {"train_loss": -5.461707592010498, "global_step": 29757, "epoch": 708} {"train_loss": -5.667796611785889, "global_step": 29758, "epoch": 708} {"train_loss": -5.4862871170043945, "global_step": 29759, "epoch": 708} {"train_loss": -5.411859035491943, "global_step": 29760, "epoch": 708} {"train_loss": -5.415444374084473, "global_step": 29761, "epoch": 708} {"train_loss": -5.471996307373047, "global_step": 29762, "epoch": 708} {"train_loss": -5.511859893798828, "global_step": 29763, "epoch": 708} {"train_loss": -5.447839736938477, "global_step": 29764, "epoch": 708} {"train_loss": -5.494907855987549, "global_step": 29765, "epoch": 708} {"train_loss": -5.373973369598389, "global_step": 29766, "epoch": 708} {"train_loss": -5.354429721832275, "global_step": 29767, "epoch": 708} {"train_loss": -5.340724945068359, "global_step": 29768, "epoch": 708} {"train_loss": -5.425141334533691, "global_step": 29769, "epoch": 708} {"train_loss": -5.37741231918335, "global_step": 29770, "epoch": 708} {"train_loss": -5.531719207763672, "global_step": 29771, "epoch": 708} {"train_loss": -5.411415100097656, "global_step": 29772, "epoch": 708} {"train_loss": -5.386702060699463, "global_step": 29773, "epoch": 708} {"train_loss": -5.389359474182129, "global_step": 29774, "epoch": 708} {"train_loss": -5.498104095458984, "global_step": 29775, "epoch": 708} {"train_loss": -5.463244438171387, "global_step": 29776, "epoch": 708} {"train_loss": -5.436998662494478, "global_step": 29777, "epoch": 708, "val_loss": 63724.0546875} {"train_loss": -5.5045013427734375, "global_step": 29778, "epoch": 709} {"train_loss": -5.452933311462402, "global_step": 29779, "epoch": 709} {"train_loss": -5.373344421386719, "global_step": 29780, "epoch": 709} {"train_loss": -5.510458469390869, "global_step": 29781, "epoch": 709} {"train_loss": -5.5626726150512695, "global_step": 29782, "epoch": 709} {"train_loss": -5.358565330505371, "global_step": 29783, "epoch": 709} {"train_loss": -5.349064826965332, "global_step": 29784, "epoch": 709} {"train_loss": -5.529236793518066, "global_step": 29785, "epoch": 709} {"train_loss": -5.335946559906006, "global_step": 29786, "epoch": 709} {"train_loss": -5.475772857666016, "global_step": 29787, "epoch": 709} {"train_loss": -5.529650688171387, "global_step": 29788, "epoch": 709} {"train_loss": -5.283267021179199, "global_step": 29789, "epoch": 709} {"train_loss": -5.507073402404785, "global_step": 29790, "epoch": 709} {"train_loss": -5.335821628570557, "global_step": 29791, "epoch": 709} {"train_loss": -5.37368106842041, "global_step": 29792, "epoch": 709} {"train_loss": -5.397162914276123, "global_step": 29793, "epoch": 709} {"train_loss": -5.365322113037109, "global_step": 29794, "epoch": 709} {"train_loss": -5.472746849060059, "global_step": 29795, "epoch": 709} {"train_loss": -5.3421831130981445, "global_step": 29796, "epoch": 709} {"train_loss": -5.439031600952148, "global_step": 29797, "epoch": 709} {"train_loss": -5.3707146644592285, "global_step": 29798, "epoch": 709} {"train_loss": -5.4156575202941895, "global_step": 29799, "epoch": 709} {"train_loss": -5.291168689727783, "global_step": 29800, "epoch": 709} {"train_loss": -5.4521918296813965, "global_step": 29801, "epoch": 709} {"train_loss": -5.419833183288574, "global_step": 29802, "epoch": 709} {"train_loss": -5.337878227233887, "global_step": 29803, "epoch": 709} {"train_loss": -5.413494110107422, "global_step": 29804, "epoch": 709} {"train_loss": -5.288363933563232, "global_step": 29805, "epoch": 709} {"train_loss": -5.454145908355713, "global_step": 29806, "epoch": 709} {"train_loss": -5.260242462158203, "global_step": 29807, "epoch": 709} {"train_loss": -5.434174537658691, "global_step": 29808, "epoch": 709} {"train_loss": -5.571135520935059, "global_step": 29809, "epoch": 709} {"train_loss": -5.492712497711182, "global_step": 29810, "epoch": 709} {"train_loss": -5.480484485626221, "global_step": 29811, "epoch": 709} {"train_loss": -5.340768814086914, "global_step": 29812, "epoch": 709} {"train_loss": -5.256053924560547, "global_step": 29813, "epoch": 709} {"train_loss": -5.51450777053833, "global_step": 29814, "epoch": 709} {"train_loss": -5.399971961975098, "global_step": 29815, "epoch": 709} {"train_loss": -5.376317977905273, "global_step": 29816, "epoch": 709} {"train_loss": -5.361823081970215, "global_step": 29817, "epoch": 709} {"train_loss": -5.299107074737549, "global_step": 29818, "epoch": 709} {"train_loss": -5.409365858350482, "global_step": 29819, "epoch": 709, "val_loss": 63738.32421875} {"train_loss": -5.502685546875, "global_step": 29820, "epoch": 710} {"train_loss": -5.259950637817383, "global_step": 29821, "epoch": 710} {"train_loss": -5.529661178588867, "global_step": 29822, "epoch": 710} {"train_loss": -5.410719871520996, "global_step": 29823, "epoch": 710} {"train_loss": -5.38994836807251, "global_step": 29824, "epoch": 710} {"train_loss": -5.35658597946167, "global_step": 29825, "epoch": 710} {"train_loss": -5.435288429260254, "global_step": 29826, "epoch": 710} {"train_loss": -5.412628173828125, "global_step": 29827, "epoch": 710} {"train_loss": -5.39872932434082, "global_step": 29828, "epoch": 710} {"train_loss": -5.394561767578125, "global_step": 29829, "epoch": 710} {"train_loss": -5.613173961639404, "global_step": 29830, "epoch": 710} {"train_loss": -5.404719829559326, "global_step": 29831, "epoch": 710} {"train_loss": -5.455328464508057, "global_step": 29832, "epoch": 710} {"train_loss": -5.512831687927246, "global_step": 29833, "epoch": 710} {"train_loss": -5.356076240539551, "global_step": 29834, "epoch": 710} {"train_loss": -5.431031703948975, "global_step": 29835, "epoch": 710} {"train_loss": -5.443394184112549, "global_step": 29836, "epoch": 710} {"train_loss": -5.463509559631348, "global_step": 29837, "epoch": 710} {"train_loss": -5.448050498962402, "global_step": 29838, "epoch": 710} {"train_loss": -5.3259100914001465, "global_step": 29839, "epoch": 710} {"train_loss": -5.547999382019043, "global_step": 29840, "epoch": 710} {"train_loss": -5.372333526611328, "global_step": 29841, "epoch": 710} {"train_loss": -5.491667747497559, "global_step": 29842, "epoch": 710} {"train_loss": -5.526357650756836, "global_step": 29843, "epoch": 710} {"train_loss": -5.476051330566406, "global_step": 29844, "epoch": 710} {"train_loss": -5.383774757385254, "global_step": 29845, "epoch": 710} {"train_loss": -5.549088478088379, "global_step": 29846, "epoch": 710} {"train_loss": -5.348291397094727, "global_step": 29847, "epoch": 710} {"train_loss": -5.508941650390625, "global_step": 29848, "epoch": 710} {"train_loss": -5.452695846557617, "global_step": 29849, "epoch": 710} {"train_loss": -5.356869697570801, "global_step": 29850, "epoch": 710} {"train_loss": -5.511447906494141, "global_step": 29851, "epoch": 710} {"train_loss": -5.47737979888916, "global_step": 29852, "epoch": 710} {"train_loss": -5.533127784729004, "global_step": 29853, "epoch": 710} {"train_loss": -5.400495529174805, "global_step": 29854, "epoch": 710} {"train_loss": -5.456412315368652, "global_step": 29855, "epoch": 710} {"train_loss": -5.479043483734131, "global_step": 29856, "epoch": 710} {"train_loss": -5.529759407043457, "global_step": 29857, "epoch": 710} {"train_loss": -5.409419059753418, "global_step": 29858, "epoch": 710} {"train_loss": -5.478710174560547, "global_step": 29859, "epoch": 710} {"train_loss": -5.471868515014648, "global_step": 29860, "epoch": 710} {"train_loss": -5.4457262470608665, "global_step": 29861, "epoch": 710, "val_loss": 63280.1953125} {"train_loss": -5.49957275390625, "global_step": 29862, "epoch": 711} {"train_loss": -5.488556861877441, "global_step": 29863, "epoch": 711} {"train_loss": -5.444195747375488, "global_step": 29864, "epoch": 711} {"train_loss": -5.505311012268066, "global_step": 29865, "epoch": 711} {"train_loss": -5.363529682159424, "global_step": 29866, "epoch": 711} {"train_loss": -5.449437141418457, "global_step": 29867, "epoch": 711} {"train_loss": -5.40789794921875, "global_step": 29868, "epoch": 711} {"train_loss": -5.400389194488525, "global_step": 29869, "epoch": 711} {"train_loss": -5.362601280212402, "global_step": 29870, "epoch": 711} {"train_loss": -5.524214744567871, "global_step": 29871, "epoch": 711} {"train_loss": -5.402631759643555, "global_step": 29872, "epoch": 711} {"train_loss": -5.521562576293945, "global_step": 29873, "epoch": 711} {"train_loss": -5.381096363067627, "global_step": 29874, "epoch": 711} {"train_loss": -5.432134628295898, "global_step": 29875, "epoch": 711} {"train_loss": -5.467312812805176, "global_step": 29876, "epoch": 711} {"train_loss": -5.429696083068848, "global_step": 29877, "epoch": 711} {"train_loss": -5.47086763381958, "global_step": 29878, "epoch": 711} {"train_loss": -5.3637285232543945, "global_step": 29879, "epoch": 711} {"train_loss": -5.449074745178223, "global_step": 29880, "epoch": 711} {"train_loss": -5.361383438110352, "global_step": 29881, "epoch": 711} {"train_loss": -5.440131187438965, "global_step": 29882, "epoch": 711} {"train_loss": -5.454159736633301, "global_step": 29883, "epoch": 711} {"train_loss": -5.431639671325684, "global_step": 29884, "epoch": 711} {"train_loss": -5.569332122802734, "global_step": 29885, "epoch": 711} {"train_loss": -5.377270698547363, "global_step": 29886, "epoch": 711} {"train_loss": -5.481551170349121, "global_step": 29887, "epoch": 711} {"train_loss": -5.567346096038818, "global_step": 29888, "epoch": 711} {"train_loss": -5.447653770446777, "global_step": 29889, "epoch": 711} {"train_loss": -5.571732521057129, "global_step": 29890, "epoch": 711} {"train_loss": -5.451565742492676, "global_step": 29891, "epoch": 711} {"train_loss": -5.414167881011963, "global_step": 29892, "epoch": 711} {"train_loss": -5.518786430358887, "global_step": 29893, "epoch": 711} {"train_loss": -5.499255180358887, "global_step": 29894, "epoch": 711} {"train_loss": -5.4710307121276855, "global_step": 29895, "epoch": 711} {"train_loss": -5.6011457443237305, "global_step": 29896, "epoch": 711} {"train_loss": -5.577820777893066, "global_step": 29897, "epoch": 711} {"train_loss": -5.481095790863037, "global_step": 29898, "epoch": 711} {"train_loss": -5.523528099060059, "global_step": 29899, "epoch": 711} {"train_loss": -5.604569911956787, "global_step": 29900, "epoch": 711} {"train_loss": -5.468427658081055, "global_step": 29901, "epoch": 711} {"train_loss": -5.464293479919434, "global_step": 29902, "epoch": 711} {"train_loss": -5.465331236521403, "global_step": 29903, "epoch": 711, "val_loss": 63160.14453125} {"train_loss": -5.503403186798096, "global_step": 29904, "epoch": 712} {"train_loss": -5.494482040405273, "global_step": 29905, "epoch": 712} {"train_loss": -5.431570529937744, "global_step": 29906, "epoch": 712} {"train_loss": -5.514250755310059, "global_step": 29907, "epoch": 712} {"train_loss": -5.497052192687988, "global_step": 29908, "epoch": 712} {"train_loss": -5.498258113861084, "global_step": 29909, "epoch": 712} {"train_loss": -5.535377502441406, "global_step": 29910, "epoch": 712} {"train_loss": -5.667906761169434, "global_step": 29911, "epoch": 712} {"train_loss": -5.5829548835754395, "global_step": 29912, "epoch": 712} {"train_loss": -5.479689598083496, "global_step": 29913, "epoch": 712} {"train_loss": -5.323781967163086, "global_step": 29914, "epoch": 712} {"train_loss": -5.542899131774902, "global_step": 29915, "epoch": 712} {"train_loss": -5.342523574829102, "global_step": 29916, "epoch": 712} {"train_loss": -5.375885963439941, "global_step": 29917, "epoch": 712} {"train_loss": -5.605137825012207, "global_step": 29918, "epoch": 712} {"train_loss": -5.463913440704346, "global_step": 29919, "epoch": 712} {"train_loss": -5.432997703552246, "global_step": 29920, "epoch": 712} {"train_loss": -5.462495803833008, "global_step": 29921, "epoch": 712} {"train_loss": -5.465479850769043, "global_step": 29922, "epoch": 712} {"train_loss": -5.523784160614014, "global_step": 29923, "epoch": 712} {"train_loss": -5.513004302978516, "global_step": 29924, "epoch": 712} {"train_loss": -5.443578720092773, "global_step": 29925, "epoch": 712} {"train_loss": -5.4444098472595215, "global_step": 29926, "epoch": 712} {"train_loss": -5.457897186279297, "global_step": 29927, "epoch": 712} {"train_loss": -5.469808578491211, "global_step": 29928, "epoch": 712} {"train_loss": -5.479172706604004, "global_step": 29929, "epoch": 712} {"train_loss": -5.5041656494140625, "global_step": 29930, "epoch": 712} {"train_loss": -5.471598148345947, "global_step": 29931, "epoch": 712} {"train_loss": -5.504103660583496, "global_step": 29932, "epoch": 712} {"train_loss": -5.595150947570801, "global_step": 29933, "epoch": 712} {"train_loss": -5.456726551055908, "global_step": 29934, "epoch": 712} {"train_loss": -5.377248287200928, "global_step": 29935, "epoch": 712} {"train_loss": -5.580638885498047, "global_step": 29936, "epoch": 712} {"train_loss": -5.39245080947876, "global_step": 29937, "epoch": 712} {"train_loss": -5.4630889892578125, "global_step": 29938, "epoch": 712} {"train_loss": -5.458396911621094, "global_step": 29939, "epoch": 712} {"train_loss": -5.3510518074035645, "global_step": 29940, "epoch": 712} {"train_loss": -5.533079624176025, "global_step": 29941, "epoch": 712} {"train_loss": -5.412971496582031, "global_step": 29942, "epoch": 712} {"train_loss": -5.2314839363098145, "global_step": 29943, "epoch": 712} {"train_loss": -5.388605117797852, "global_step": 29944, "epoch": 712} {"train_loss": -5.466566562652588, "global_step": 29945, "epoch": 712, "val_loss": 63614.81640625} {"train_loss": -5.362551689147949, "global_step": 29946, "epoch": 713} {"train_loss": -5.381661415100098, "global_step": 29947, "epoch": 713} {"train_loss": -5.49881649017334, "global_step": 29948, "epoch": 713} {"train_loss": -5.402898788452148, "global_step": 29949, "epoch": 713} {"train_loss": -5.581705093383789, "global_step": 29950, "epoch": 713} {"train_loss": -5.555626392364502, "global_step": 29951, "epoch": 713} {"train_loss": -5.3895649909973145, "global_step": 29952, "epoch": 713} {"train_loss": -5.5815839767456055, "global_step": 29953, "epoch": 713} {"train_loss": -5.366730690002441, "global_step": 29954, "epoch": 713} {"train_loss": -5.586915969848633, "global_step": 29955, "epoch": 713} {"train_loss": -5.4958953857421875, "global_step": 29956, "epoch": 713} {"train_loss": -5.501461982727051, "global_step": 29957, "epoch": 713} {"train_loss": -5.448541164398193, "global_step": 29958, "epoch": 713} {"train_loss": -5.366792678833008, "global_step": 29959, "epoch": 713} {"train_loss": -5.4578399658203125, "global_step": 29960, "epoch": 713} {"train_loss": -5.493507385253906, "global_step": 29961, "epoch": 713} {"train_loss": -5.5321431159973145, "global_step": 29962, "epoch": 713} {"train_loss": -5.494848251342773, "global_step": 29963, "epoch": 713} {"train_loss": -5.530499458312988, "global_step": 29964, "epoch": 713} {"train_loss": -5.576655387878418, "global_step": 29965, "epoch": 713} {"train_loss": -5.497690200805664, "global_step": 29966, "epoch": 713} {"train_loss": -5.53019905090332, "global_step": 29967, "epoch": 713} {"train_loss": -5.431140899658203, "global_step": 29968, "epoch": 713} {"train_loss": -5.640749454498291, "global_step": 29969, "epoch": 713} {"train_loss": -5.480551719665527, "global_step": 29970, "epoch": 713} {"train_loss": -5.506436347961426, "global_step": 29971, "epoch": 713} {"train_loss": -5.410701751708984, "global_step": 29972, "epoch": 713} {"train_loss": -5.5773725509643555, "global_step": 29973, "epoch": 713} {"train_loss": -5.505668640136719, "global_step": 29974, "epoch": 713} {"train_loss": -5.567728042602539, "global_step": 29975, "epoch": 713} {"train_loss": -5.472034931182861, "global_step": 29976, "epoch": 713} {"train_loss": -5.381730556488037, "global_step": 29977, "epoch": 713} {"train_loss": -5.568307876586914, "global_step": 29978, "epoch": 713} {"train_loss": -5.406545639038086, "global_step": 29979, "epoch": 713} {"train_loss": -5.305005073547363, "global_step": 29980, "epoch": 713} {"train_loss": -5.45325231552124, "global_step": 29981, "epoch": 713} {"train_loss": -5.477746963500977, "global_step": 29982, "epoch": 713} {"train_loss": -5.3429179191589355, "global_step": 29983, "epoch": 713} {"train_loss": -5.315197467803955, "global_step": 29984, "epoch": 713} {"train_loss": -5.473998069763184, "global_step": 29985, "epoch": 713} {"train_loss": -5.2612504959106445, "global_step": 29986, "epoch": 713} {"train_loss": -5.466205472037906, "global_step": 29987, "epoch": 713, "val_loss": 63715.66015625} {"train_loss": -5.418661594390869, "global_step": 29988, "epoch": 714} {"train_loss": -5.486575126647949, "global_step": 29989, "epoch": 714} {"train_loss": -5.363466262817383, "global_step": 29990, "epoch": 714} {"train_loss": -5.433332443237305, "global_step": 29991, "epoch": 714} {"train_loss": -5.293084621429443, "global_step": 29992, "epoch": 714} {"train_loss": -5.5610504150390625, "global_step": 29993, "epoch": 714} {"train_loss": -5.5341010093688965, "global_step": 29994, "epoch": 714} {"train_loss": -5.416655540466309, "global_step": 29995, "epoch": 714} {"train_loss": -5.493544578552246, "global_step": 29996, "epoch": 714} {"train_loss": -5.47735595703125, "global_step": 29997, "epoch": 714} {"train_loss": -5.478140830993652, "global_step": 29998, "epoch": 714} {"train_loss": -5.614433288574219, "global_step": 29999, "epoch": 714} {"train_loss": -5.464128494262695, "global_step": 30000, "epoch": 714} {"train_loss": -5.461451530456543, "global_step": 30001, "epoch": 714} {"train_loss": -5.373263359069824, "global_step": 30002, "epoch": 714} {"train_loss": -5.719929218292236, "global_step": 30003, "epoch": 714} {"train_loss": -5.482190132141113, "global_step": 30004, "epoch": 714} {"train_loss": -5.541989803314209, "global_step": 30005, "epoch": 714} {"train_loss": -5.4678120613098145, "global_step": 30006, "epoch": 714} {"train_loss": -5.396905899047852, "global_step": 30007, "epoch": 714} {"train_loss": -5.482025623321533, "global_step": 30008, "epoch": 714} {"train_loss": -5.444977760314941, "global_step": 30009, "epoch": 714} {"train_loss": -5.440451145172119, "global_step": 30010, "epoch": 714} {"train_loss": -5.547191143035889, "global_step": 30011, "epoch": 714} {"train_loss": -5.516773700714111, "global_step": 30012, "epoch": 714} {"train_loss": -5.537069320678711, "global_step": 30013, "epoch": 714} {"train_loss": -5.456576347351074, "global_step": 30014, "epoch": 714} {"train_loss": -5.531966209411621, "global_step": 30015, "epoch": 714} {"train_loss": -5.439308166503906, "global_step": 30016, "epoch": 714} {"train_loss": -5.652309417724609, "global_step": 30017, "epoch": 714} {"train_loss": -5.338740348815918, "global_step": 30018, "epoch": 714} {"train_loss": -5.428600311279297, "global_step": 30019, "epoch": 714} {"train_loss": -5.5474066734313965, "global_step": 30020, "epoch": 714} {"train_loss": -5.580685138702393, "global_step": 30021, "epoch": 714} {"train_loss": -5.554582595825195, "global_step": 30022, "epoch": 714} {"train_loss": -5.390338897705078, "global_step": 30023, "epoch": 714} {"train_loss": -5.385237693786621, "global_step": 30024, "epoch": 714} {"train_loss": -5.54193639755249, "global_step": 30025, "epoch": 714} {"train_loss": -5.536255836486816, "global_step": 30026, "epoch": 714} {"train_loss": -5.455707550048828, "global_step": 30027, "epoch": 714} {"train_loss": -5.444666862487793, "global_step": 30028, "epoch": 714} {"train_loss": -5.480924924214681, "global_step": 30029, "epoch": 714, "val_loss": 63050.79296875} {"train_loss": -5.4049763679504395, "global_step": 30030, "epoch": 715} {"train_loss": -5.4928388595581055, "global_step": 30031, "epoch": 715} {"train_loss": -5.622659683227539, "global_step": 30032, "epoch": 715} {"train_loss": -5.403860092163086, "global_step": 30033, "epoch": 715} {"train_loss": -5.412997722625732, "global_step": 30034, "epoch": 715} {"train_loss": -5.432281494140625, "global_step": 30035, "epoch": 715} {"train_loss": -5.4545440673828125, "global_step": 30036, "epoch": 715} {"train_loss": -5.45888090133667, "global_step": 30037, "epoch": 715} {"train_loss": -5.558167457580566, "global_step": 30038, "epoch": 715} {"train_loss": -5.392886161804199, "global_step": 30039, "epoch": 715} {"train_loss": -5.538990020751953, "global_step": 30040, "epoch": 715} {"train_loss": -5.498106002807617, "global_step": 30041, "epoch": 715} {"train_loss": -5.369414329528809, "global_step": 30042, "epoch": 715} {"train_loss": -5.43779993057251, "global_step": 30043, "epoch": 715} {"train_loss": -5.488550186157227, "global_step": 30044, "epoch": 715} {"train_loss": -5.346421241760254, "global_step": 30045, "epoch": 715} {"train_loss": -5.548216342926025, "global_step": 30046, "epoch": 715} {"train_loss": -5.554495811462402, "global_step": 30047, "epoch": 715} {"train_loss": -5.500027656555176, "global_step": 30048, "epoch": 715} {"train_loss": -5.520893573760986, "global_step": 30049, "epoch": 715} {"train_loss": -5.52149772644043, "global_step": 30050, "epoch": 715} {"train_loss": -5.439670085906982, "global_step": 30051, "epoch": 715} {"train_loss": -5.493303298950195, "global_step": 30052, "epoch": 715} {"train_loss": -5.507740020751953, "global_step": 30053, "epoch": 715} {"train_loss": -5.614723205566406, "global_step": 30054, "epoch": 715} {"train_loss": -5.497923851013184, "global_step": 30055, "epoch": 715} {"train_loss": -5.4383955001831055, "global_step": 30056, "epoch": 715} {"train_loss": -5.43736457824707, "global_step": 30057, "epoch": 715} {"train_loss": -5.406074523925781, "global_step": 30058, "epoch": 715} {"train_loss": -5.525179862976074, "global_step": 30059, "epoch": 715} {"train_loss": -5.542978286743164, "global_step": 30060, "epoch": 715} {"train_loss": -5.509963035583496, "global_step": 30061, "epoch": 715} {"train_loss": -5.32943868637085, "global_step": 30062, "epoch": 715} {"train_loss": -5.432724952697754, "global_step": 30063, "epoch": 715} {"train_loss": -5.540308475494385, "global_step": 30064, "epoch": 715} {"train_loss": -5.308036804199219, "global_step": 30065, "epoch": 715} {"train_loss": -5.518862724304199, "global_step": 30066, "epoch": 715} {"train_loss": -5.338885307312012, "global_step": 30067, "epoch": 715} {"train_loss": -5.451955795288086, "global_step": 30068, "epoch": 715} {"train_loss": -5.396392822265625, "global_step": 30069, "epoch": 715} {"train_loss": -5.315624237060547, "global_step": 30070, "epoch": 715} {"train_loss": -5.465169066474552, "global_step": 30071, "epoch": 715, "val_loss": 63346.08203125} {"train_loss": -5.350541114807129, "global_step": 30072, "epoch": 716} {"train_loss": -5.520120620727539, "global_step": 30073, "epoch": 716} {"train_loss": -5.454877853393555, "global_step": 30074, "epoch": 716} {"train_loss": -5.463009834289551, "global_step": 30075, "epoch": 716} {"train_loss": -5.463796615600586, "global_step": 30076, "epoch": 716} {"train_loss": -5.489101409912109, "global_step": 30077, "epoch": 716} {"train_loss": -5.5861735343933105, "global_step": 30078, "epoch": 716} {"train_loss": -5.536287307739258, "global_step": 30079, "epoch": 716} {"train_loss": -5.409163475036621, "global_step": 30080, "epoch": 716} {"train_loss": -5.442633152008057, "global_step": 30081, "epoch": 716} {"train_loss": -5.382449150085449, "global_step": 30082, "epoch": 716} {"train_loss": -5.534953594207764, "global_step": 30083, "epoch": 716} {"train_loss": -5.53590202331543, "global_step": 30084, "epoch": 716} {"train_loss": -5.5329389572143555, "global_step": 30085, "epoch": 716} {"train_loss": -5.303734302520752, "global_step": 30086, "epoch": 716} {"train_loss": -5.481149196624756, "global_step": 30087, "epoch": 716} {"train_loss": -5.434288024902344, "global_step": 30088, "epoch": 716} {"train_loss": -5.383754730224609, "global_step": 30089, "epoch": 716} {"train_loss": -5.480567932128906, "global_step": 30090, "epoch": 716} {"train_loss": -5.4657745361328125, "global_step": 30091, "epoch": 716} {"train_loss": -5.5246124267578125, "global_step": 30092, "epoch": 716} {"train_loss": -5.442227363586426, "global_step": 30093, "epoch": 716} {"train_loss": -5.435583114624023, "global_step": 30094, "epoch": 716} {"train_loss": -5.415626525878906, "global_step": 30095, "epoch": 716} {"train_loss": -5.560160160064697, "global_step": 30096, "epoch": 716} {"train_loss": -5.419787406921387, "global_step": 30097, "epoch": 716} {"train_loss": -5.459587097167969, "global_step": 30098, "epoch": 716} {"train_loss": -5.337891578674316, "global_step": 30099, "epoch": 716} {"train_loss": -5.383745193481445, "global_step": 30100, "epoch": 716} {"train_loss": -5.369234085083008, "global_step": 30101, "epoch": 716} {"train_loss": -5.477421760559082, "global_step": 30102, "epoch": 716} {"train_loss": -5.34412956237793, "global_step": 30103, "epoch": 716} {"train_loss": -5.55417537689209, "global_step": 30104, "epoch": 716} {"train_loss": -5.715639114379883, "global_step": 30105, "epoch": 716} {"train_loss": -5.420583724975586, "global_step": 30106, "epoch": 716} {"train_loss": -5.424996376037598, "global_step": 30107, "epoch": 716} {"train_loss": -5.470714569091797, "global_step": 30108, "epoch": 716} {"train_loss": -5.448464393615723, "global_step": 30109, "epoch": 716} {"train_loss": -5.461467742919922, "global_step": 30110, "epoch": 716} {"train_loss": -5.456942081451416, "global_step": 30111, "epoch": 716} {"train_loss": -5.503173828125, "global_step": 30112, "epoch": 716} {"train_loss": -5.463692040670486, "global_step": 30113, "epoch": 716, "val_loss": 63202.6796875} {"train_loss": -5.690082550048828, "global_step": 30114, "epoch": 717} {"train_loss": -5.485516548156738, "global_step": 30115, "epoch": 717} {"train_loss": -5.538375377655029, "global_step": 30116, "epoch": 717} {"train_loss": -5.424965858459473, "global_step": 30117, "epoch": 717} {"train_loss": -5.462858200073242, "global_step": 30118, "epoch": 717} {"train_loss": -5.573626518249512, "global_step": 30119, "epoch": 717} {"train_loss": -5.390442848205566, "global_step": 30120, "epoch": 717} {"train_loss": -5.55518102645874, "global_step": 30121, "epoch": 717} {"train_loss": -5.63146448135376, "global_step": 30122, "epoch": 717} {"train_loss": -5.552537441253662, "global_step": 30123, "epoch": 717} {"train_loss": -5.481175422668457, "global_step": 30124, "epoch": 717} {"train_loss": -5.4387526512146, "global_step": 30125, "epoch": 717} {"train_loss": -5.598438262939453, "global_step": 30126, "epoch": 717} {"train_loss": -5.445830345153809, "global_step": 30127, "epoch": 717} {"train_loss": -5.421949863433838, "global_step": 30128, "epoch": 717} {"train_loss": -5.619879722595215, "global_step": 30129, "epoch": 717} {"train_loss": -5.459486961364746, "global_step": 30130, "epoch": 717} {"train_loss": -5.4779462814331055, "global_step": 30131, "epoch": 717} {"train_loss": -5.418357849121094, "global_step": 30132, "epoch": 717} {"train_loss": -5.442856788635254, "global_step": 30133, "epoch": 717} {"train_loss": -5.476076602935791, "global_step": 30134, "epoch": 717} {"train_loss": -5.4241132736206055, "global_step": 30135, "epoch": 717} {"train_loss": -5.551913261413574, "global_step": 30136, "epoch": 717} {"train_loss": -5.465800762176514, "global_step": 30137, "epoch": 717} {"train_loss": -5.524538516998291, "global_step": 30138, "epoch": 717} {"train_loss": -5.4047088623046875, "global_step": 30139, "epoch": 717} {"train_loss": -5.514782905578613, "global_step": 30140, "epoch": 717} {"train_loss": -5.495020389556885, "global_step": 30141, "epoch": 717} {"train_loss": -5.519867420196533, "global_step": 30142, "epoch": 717} {"train_loss": -5.501217842102051, "global_step": 30143, "epoch": 717} {"train_loss": -5.514006614685059, "global_step": 30144, "epoch": 717} {"train_loss": -5.380220413208008, "global_step": 30145, "epoch": 717} {"train_loss": -5.490447044372559, "global_step": 30146, "epoch": 717} {"train_loss": -5.588868618011475, "global_step": 30147, "epoch": 717} {"train_loss": -5.451746940612793, "global_step": 30148, "epoch": 717} {"train_loss": -5.592860221862793, "global_step": 30149, "epoch": 717} {"train_loss": -5.497978210449219, "global_step": 30150, "epoch": 717} {"train_loss": -5.5385236740112305, "global_step": 30151, "epoch": 717} {"train_loss": -5.386353969573975, "global_step": 30152, "epoch": 717} {"train_loss": -5.5462188720703125, "global_step": 30153, "epoch": 717} {"train_loss": -5.4344024658203125, "global_step": 30154, "epoch": 717} {"train_loss": -5.498978489921207, "global_step": 30155, "epoch": 717, "val_loss": 63532.38671875} {"train_loss": -5.491979122161865, "global_step": 30156, "epoch": 718} {"train_loss": -5.566141128540039, "global_step": 30157, "epoch": 718} {"train_loss": -5.490466117858887, "global_step": 30158, "epoch": 718} {"train_loss": -5.45882511138916, "global_step": 30159, "epoch": 718} {"train_loss": -5.471757888793945, "global_step": 30160, "epoch": 718} {"train_loss": -5.521509170532227, "global_step": 30161, "epoch": 718} {"train_loss": -5.54753303527832, "global_step": 30162, "epoch": 718} {"train_loss": -5.582131385803223, "global_step": 30163, "epoch": 718} {"train_loss": -5.490914821624756, "global_step": 30164, "epoch": 718} {"train_loss": -5.526227951049805, "global_step": 30165, "epoch": 718} {"train_loss": -5.563758850097656, "global_step": 30166, "epoch": 718} {"train_loss": -5.446471691131592, "global_step": 30167, "epoch": 718} {"train_loss": -5.550310134887695, "global_step": 30168, "epoch": 718} {"train_loss": -5.236047744750977, "global_step": 30169, "epoch": 718} {"train_loss": -5.443537712097168, "global_step": 30170, "epoch": 718} {"train_loss": -5.413420677185059, "global_step": 30171, "epoch": 718} {"train_loss": -5.37647008895874, "global_step": 30172, "epoch": 718} {"train_loss": -5.378664016723633, "global_step": 30173, "epoch": 718} {"train_loss": -5.467013835906982, "global_step": 30174, "epoch": 718} {"train_loss": -5.272550582885742, "global_step": 30175, "epoch": 718} {"train_loss": -5.449535369873047, "global_step": 30176, "epoch": 718} {"train_loss": -5.4581475257873535, "global_step": 30177, "epoch": 718} {"train_loss": -5.4384613037109375, "global_step": 30178, "epoch": 718} {"train_loss": -5.519960880279541, "global_step": 30179, "epoch": 718} {"train_loss": -5.439714431762695, "global_step": 30180, "epoch": 718} {"train_loss": -5.508876323699951, "global_step": 30181, "epoch": 718} {"train_loss": -5.485605239868164, "global_step": 30182, "epoch": 718} {"train_loss": -5.3812255859375, "global_step": 30183, "epoch": 718} {"train_loss": -5.544100761413574, "global_step": 30184, "epoch": 718} {"train_loss": -5.489956855773926, "global_step": 30185, "epoch": 718} {"train_loss": -5.446056365966797, "global_step": 30186, "epoch": 718} {"train_loss": -5.495237350463867, "global_step": 30187, "epoch": 718} {"train_loss": -5.468890190124512, "global_step": 30188, "epoch": 718} {"train_loss": -5.420631408691406, "global_step": 30189, "epoch": 718} {"train_loss": -5.343646049499512, "global_step": 30190, "epoch": 718} {"train_loss": -5.380270957946777, "global_step": 30191, "epoch": 718} {"train_loss": -5.485124588012695, "global_step": 30192, "epoch": 718} {"train_loss": -5.380002975463867, "global_step": 30193, "epoch": 718} {"train_loss": -5.457612037658691, "global_step": 30194, "epoch": 718} {"train_loss": -5.40585470199585, "global_step": 30195, "epoch": 718} {"train_loss": -5.317381858825684, "global_step": 30196, "epoch": 718} {"train_loss": -5.453542675290789, "global_step": 30197, "epoch": 718, "val_loss": 63364.0} {"train_loss": -5.483464241027832, "global_step": 30198, "epoch": 719} {"train_loss": -5.454286575317383, "global_step": 30199, "epoch": 719} {"train_loss": -5.450006484985352, "global_step": 30200, "epoch": 719} {"train_loss": -5.491477012634277, "global_step": 30201, "epoch": 719} {"train_loss": -5.506552696228027, "global_step": 30202, "epoch": 719} {"train_loss": -5.641228199005127, "global_step": 30203, "epoch": 719} {"train_loss": -5.425378799438477, "global_step": 30204, "epoch": 719} {"train_loss": -5.583984375, "global_step": 30205, "epoch": 719} {"train_loss": -5.644029140472412, "global_step": 30206, "epoch": 719} {"train_loss": -5.359476089477539, "global_step": 30207, "epoch": 719} {"train_loss": -5.393085956573486, "global_step": 30208, "epoch": 719} {"train_loss": -5.553452968597412, "global_step": 30209, "epoch": 719} {"train_loss": -5.345431327819824, "global_step": 30210, "epoch": 719} {"train_loss": -5.42720890045166, "global_step": 30211, "epoch": 719} {"train_loss": -5.459437370300293, "global_step": 30212, "epoch": 719} {"train_loss": -5.378255844116211, "global_step": 30213, "epoch": 719} {"train_loss": -5.485400199890137, "global_step": 30214, "epoch": 719} {"train_loss": -5.400735855102539, "global_step": 30215, "epoch": 719} {"train_loss": -5.452381610870361, "global_step": 30216, "epoch": 719} {"train_loss": -5.431909561157227, "global_step": 30217, "epoch": 719} {"train_loss": -5.375905513763428, "global_step": 30218, "epoch": 719} {"train_loss": -5.375268936157227, "global_step": 30219, "epoch": 719} {"train_loss": -5.385268211364746, "global_step": 30220, "epoch": 719} {"train_loss": -5.443485260009766, "global_step": 30221, "epoch": 719} {"train_loss": -5.341424942016602, "global_step": 30222, "epoch": 719} {"train_loss": -5.379002571105957, "global_step": 30223, "epoch": 719} {"train_loss": -5.469783306121826, "global_step": 30224, "epoch": 719} {"train_loss": -5.359112739562988, "global_step": 30225, "epoch": 719} {"train_loss": -5.572344779968262, "global_step": 30226, "epoch": 719} {"train_loss": -5.553084373474121, "global_step": 30227, "epoch": 719} {"train_loss": -5.402167320251465, "global_step": 30228, "epoch": 719} {"train_loss": -5.4227800369262695, "global_step": 30229, "epoch": 719} {"train_loss": -5.444883346557617, "global_step": 30230, "epoch": 719} {"train_loss": -5.492664337158203, "global_step": 30231, "epoch": 719} {"train_loss": -5.4958977699279785, "global_step": 30232, "epoch": 719} {"train_loss": -5.548566818237305, "global_step": 30233, "epoch": 719} {"train_loss": -5.536388397216797, "global_step": 30234, "epoch": 719} {"train_loss": -5.527456283569336, "global_step": 30235, "epoch": 719} {"train_loss": -5.5007758140563965, "global_step": 30236, "epoch": 719} {"train_loss": -5.477343559265137, "global_step": 30237, "epoch": 719} {"train_loss": -5.570395469665527, "global_step": 30238, "epoch": 719} {"train_loss": -5.461824383054461, "global_step": 30239, "epoch": 719, "val_loss": 63600.88671875} {"train_loss": -5.530068874359131, "global_step": 30240, "epoch": 720} {"train_loss": -5.538023471832275, "global_step": 30241, "epoch": 720} {"train_loss": -5.532068729400635, "global_step": 30242, "epoch": 720} {"train_loss": -5.515617847442627, "global_step": 30243, "epoch": 720} {"train_loss": -5.537392616271973, "global_step": 30244, "epoch": 720} {"train_loss": -5.383683204650879, "global_step": 30245, "epoch": 720} {"train_loss": -5.439492225646973, "global_step": 30246, "epoch": 720} {"train_loss": -5.438230037689209, "global_step": 30247, "epoch": 720} {"train_loss": -5.3991594314575195, "global_step": 30248, "epoch": 720} {"train_loss": -5.405282020568848, "global_step": 30249, "epoch": 720} {"train_loss": -5.472524642944336, "global_step": 30250, "epoch": 720} {"train_loss": -5.416305065155029, "global_step": 30251, "epoch": 720} {"train_loss": -5.518590927124023, "global_step": 30252, "epoch": 720} {"train_loss": -5.447732925415039, "global_step": 30253, "epoch": 720} {"train_loss": -5.4452362060546875, "global_step": 30254, "epoch": 720} {"train_loss": -5.4428277015686035, "global_step": 30255, "epoch": 720} {"train_loss": -5.4387311935424805, "global_step": 30256, "epoch": 720} {"train_loss": -5.552310943603516, "global_step": 30257, "epoch": 720} {"train_loss": -5.436967849731445, "global_step": 30258, "epoch": 720} {"train_loss": -5.547980308532715, "global_step": 30259, "epoch": 720} {"train_loss": -5.430258750915527, "global_step": 30260, "epoch": 720} {"train_loss": -5.59459924697876, "global_step": 30261, "epoch": 720} {"train_loss": -5.456503868103027, "global_step": 30262, "epoch": 720} {"train_loss": -5.504334449768066, "global_step": 30263, "epoch": 720} {"train_loss": -5.47852897644043, "global_step": 30264, "epoch": 720} {"train_loss": -5.409330368041992, "global_step": 30265, "epoch": 720} {"train_loss": -5.431380748748779, "global_step": 30266, "epoch": 720} {"train_loss": -5.416799545288086, "global_step": 30267, "epoch": 720} {"train_loss": -5.434203147888184, "global_step": 30268, "epoch": 720} {"train_loss": -5.421201705932617, "global_step": 30269, "epoch": 720} {"train_loss": -5.473005294799805, "global_step": 30270, "epoch": 720} {"train_loss": -5.400619983673096, "global_step": 30271, "epoch": 720} {"train_loss": -5.479576110839844, "global_step": 30272, "epoch": 720} {"train_loss": -5.516960144042969, "global_step": 30273, "epoch": 720} {"train_loss": -5.410370826721191, "global_step": 30274, "epoch": 720} {"train_loss": -5.437936305999756, "global_step": 30275, "epoch": 720} {"train_loss": -5.598237037658691, "global_step": 30276, "epoch": 720} {"train_loss": -5.413789749145508, "global_step": 30277, "epoch": 720} {"train_loss": -5.376919746398926, "global_step": 30278, "epoch": 720} {"train_loss": -5.522462368011475, "global_step": 30279, "epoch": 720} {"train_loss": -5.484174728393555, "global_step": 30280, "epoch": 720} {"train_loss": -5.466789938154674, "global_step": 30281, "epoch": 720, "val_loss": 63123.29296875} {"train_loss": -5.416104316711426, "global_step": 30282, "epoch": 721} {"train_loss": -5.452263355255127, "global_step": 30283, "epoch": 721} {"train_loss": -5.355478763580322, "global_step": 30284, "epoch": 721} {"train_loss": -5.408363342285156, "global_step": 30285, "epoch": 721} {"train_loss": -5.458608627319336, "global_step": 30286, "epoch": 721} {"train_loss": -5.445716381072998, "global_step": 30287, "epoch": 721} {"train_loss": -5.5884857177734375, "global_step": 30288, "epoch": 721} {"train_loss": -5.408947944641113, "global_step": 30289, "epoch": 721} {"train_loss": -5.602273941040039, "global_step": 30290, "epoch": 721} {"train_loss": -5.578127861022949, "global_step": 30291, "epoch": 721} {"train_loss": -5.583992004394531, "global_step": 30292, "epoch": 721} {"train_loss": -5.420414924621582, "global_step": 30293, "epoch": 721} {"train_loss": -5.574624061584473, "global_step": 30294, "epoch": 721} {"train_loss": -5.624220371246338, "global_step": 30295, "epoch": 721} {"train_loss": -5.413487911224365, "global_step": 30296, "epoch": 721} {"train_loss": -5.5269951820373535, "global_step": 30297, "epoch": 721} {"train_loss": -5.446783065795898, "global_step": 30298, "epoch": 721} {"train_loss": -5.409228801727295, "global_step": 30299, "epoch": 721} {"train_loss": -5.518180847167969, "global_step": 30300, "epoch": 721} {"train_loss": -5.487124919891357, "global_step": 30301, "epoch": 721} {"train_loss": -5.422089576721191, "global_step": 30302, "epoch": 721} {"train_loss": -5.33709716796875, "global_step": 30303, "epoch": 721} {"train_loss": -5.508792877197266, "global_step": 30304, "epoch": 721} {"train_loss": -5.483577728271484, "global_step": 30305, "epoch": 721} {"train_loss": -5.345554828643799, "global_step": 30306, "epoch": 721} {"train_loss": -5.513050079345703, "global_step": 30307, "epoch": 721} {"train_loss": -5.387316703796387, "global_step": 30308, "epoch": 721} {"train_loss": -5.523138999938965, "global_step": 30309, "epoch": 721} {"train_loss": -5.41356897354126, "global_step": 30310, "epoch": 721} {"train_loss": -5.473165035247803, "global_step": 30311, "epoch": 721} {"train_loss": -5.6075873374938965, "global_step": 30312, "epoch": 721} {"train_loss": -5.500865936279297, "global_step": 30313, "epoch": 721} {"train_loss": -5.5198893547058105, "global_step": 30314, "epoch": 721} {"train_loss": -5.527510643005371, "global_step": 30315, "epoch": 721} {"train_loss": -5.515895366668701, "global_step": 30316, "epoch": 721} {"train_loss": -5.512779235839844, "global_step": 30317, "epoch": 721} {"train_loss": -5.4684367179870605, "global_step": 30318, "epoch": 721} {"train_loss": -5.442261695861816, "global_step": 30319, "epoch": 721} {"train_loss": -5.42708158493042, "global_step": 30320, "epoch": 721} {"train_loss": -5.353192329406738, "global_step": 30321, "epoch": 721} {"train_loss": -5.3508687019348145, "global_step": 30322, "epoch": 721} {"train_loss": -5.473479566119966, "global_step": 30323, "epoch": 721, "val_loss": 63102.4140625} {"train_loss": -5.559391975402832, "global_step": 30324, "epoch": 722} {"train_loss": -5.512155532836914, "global_step": 30325, "epoch": 722} {"train_loss": -5.547568321228027, "global_step": 30326, "epoch": 722} {"train_loss": -5.503243446350098, "global_step": 30327, "epoch": 722} {"train_loss": -5.42629337310791, "global_step": 30328, "epoch": 722} {"train_loss": -5.416253089904785, "global_step": 30329, "epoch": 722} {"train_loss": -5.491030216217041, "global_step": 30330, "epoch": 722} {"train_loss": -5.496993541717529, "global_step": 30331, "epoch": 722} {"train_loss": -5.353724002838135, "global_step": 30332, "epoch": 722} {"train_loss": -5.5067973136901855, "global_step": 30333, "epoch": 722} {"train_loss": -5.424267768859863, "global_step": 30334, "epoch": 722} {"train_loss": -5.440421104431152, "global_step": 30335, "epoch": 722} {"train_loss": -5.489053249359131, "global_step": 30336, "epoch": 722} {"train_loss": -5.387901782989502, "global_step": 30337, "epoch": 722} {"train_loss": -5.561750411987305, "global_step": 30338, "epoch": 722} {"train_loss": -5.578522682189941, "global_step": 30339, "epoch": 722} {"train_loss": -5.446169853210449, "global_step": 30340, "epoch": 722} {"train_loss": -5.47324275970459, "global_step": 30341, "epoch": 722} {"train_loss": -5.431182861328125, "global_step": 30342, "epoch": 722} {"train_loss": -5.574132919311523, "global_step": 30343, "epoch": 722} {"train_loss": -5.495575904846191, "global_step": 30344, "epoch": 722} {"train_loss": -5.625890731811523, "global_step": 30345, "epoch": 722} {"train_loss": -5.535313606262207, "global_step": 30346, "epoch": 722} {"train_loss": -5.506793975830078, "global_step": 30347, "epoch": 722} {"train_loss": -5.369895935058594, "global_step": 30348, "epoch": 722} {"train_loss": -5.526826858520508, "global_step": 30349, "epoch": 722} {"train_loss": -5.5311784744262695, "global_step": 30350, "epoch": 722} {"train_loss": -5.555237293243408, "global_step": 30351, "epoch": 722} {"train_loss": -5.505429267883301, "global_step": 30352, "epoch": 722} {"train_loss": -5.36981201171875, "global_step": 30353, "epoch": 722} {"train_loss": -5.54379415512085, "global_step": 30354, "epoch": 722} {"train_loss": -5.342561721801758, "global_step": 30355, "epoch": 722} {"train_loss": -5.456579208374023, "global_step": 30356, "epoch": 722} {"train_loss": -5.522707939147949, "global_step": 30357, "epoch": 722} {"train_loss": -5.530332088470459, "global_step": 30358, "epoch": 722} {"train_loss": -5.436328887939453, "global_step": 30359, "epoch": 722} {"train_loss": -5.550429344177246, "global_step": 30360, "epoch": 722} {"train_loss": -5.448749542236328, "global_step": 30361, "epoch": 722} {"train_loss": -5.501121520996094, "global_step": 30362, "epoch": 722} {"train_loss": -5.515483856201172, "global_step": 30363, "epoch": 722} {"train_loss": -5.520049571990967, "global_step": 30364, "epoch": 722} {"train_loss": -5.490740696589152, "global_step": 30365, "epoch": 722, "val_loss": 63099.2578125} {"train_loss": -5.469880104064941, "global_step": 30366, "epoch": 723} {"train_loss": -5.525388717651367, "global_step": 30367, "epoch": 723} {"train_loss": -5.5260210037231445, "global_step": 30368, "epoch": 723} {"train_loss": -5.623841285705566, "global_step": 30369, "epoch": 723} {"train_loss": -5.507442474365234, "global_step": 30370, "epoch": 723} {"train_loss": -5.614459991455078, "global_step": 30371, "epoch": 723} {"train_loss": -5.489027976989746, "global_step": 30372, "epoch": 723} {"train_loss": -5.593703269958496, "global_step": 30373, "epoch": 723} {"train_loss": -5.5596208572387695, "global_step": 30374, "epoch": 723} {"train_loss": -5.489645004272461, "global_step": 30375, "epoch": 723} {"train_loss": -5.526185512542725, "global_step": 30376, "epoch": 723} {"train_loss": -5.571243762969971, "global_step": 30377, "epoch": 723} {"train_loss": -5.48359489440918, "global_step": 30378, "epoch": 723} {"train_loss": -5.331657886505127, "global_step": 30379, "epoch": 723} {"train_loss": -5.476741790771484, "global_step": 30380, "epoch": 723} {"train_loss": -5.577725887298584, "global_step": 30381, "epoch": 723} {"train_loss": -5.514736175537109, "global_step": 30382, "epoch": 723} {"train_loss": -5.469796180725098, "global_step": 30383, "epoch": 723} {"train_loss": -5.522956848144531, "global_step": 30384, "epoch": 723} {"train_loss": -5.493888854980469, "global_step": 30385, "epoch": 723} {"train_loss": -5.359377861022949, "global_step": 30386, "epoch": 723} {"train_loss": -5.416825294494629, "global_step": 30387, "epoch": 723} {"train_loss": -5.495817184448242, "global_step": 30388, "epoch": 723} {"train_loss": -5.406551361083984, "global_step": 30389, "epoch": 723} {"train_loss": -5.322580337524414, "global_step": 30390, "epoch": 723} {"train_loss": -5.401729583740234, "global_step": 30391, "epoch": 723} {"train_loss": -5.450260639190674, "global_step": 30392, "epoch": 723} {"train_loss": -5.450262069702148, "global_step": 30393, "epoch": 723} {"train_loss": -5.497623443603516, "global_step": 30394, "epoch": 723} {"train_loss": -5.483131408691406, "global_step": 30395, "epoch": 723} {"train_loss": -5.43679141998291, "global_step": 30396, "epoch": 723} {"train_loss": -5.521114349365234, "global_step": 30397, "epoch": 723} {"train_loss": -5.410945415496826, "global_step": 30398, "epoch": 723} {"train_loss": -5.6573286056518555, "global_step": 30399, "epoch": 723} {"train_loss": -5.397592544555664, "global_step": 30400, "epoch": 723} {"train_loss": -5.44760799407959, "global_step": 30401, "epoch": 723} {"train_loss": -5.51320219039917, "global_step": 30402, "epoch": 723} {"train_loss": -5.5339202880859375, "global_step": 30403, "epoch": 723} {"train_loss": -5.53220272064209, "global_step": 30404, "epoch": 723} {"train_loss": -5.5527238845825195, "global_step": 30405, "epoch": 723} {"train_loss": -5.54218864440918, "global_step": 30406, "epoch": 723} {"train_loss": -5.491322233563378, "global_step": 30407, "epoch": 723, "val_loss": 63387.984375} {"train_loss": -5.499537467956543, "global_step": 30408, "epoch": 724} {"train_loss": -5.539289474487305, "global_step": 30409, "epoch": 724} {"train_loss": -5.442813873291016, "global_step": 30410, "epoch": 724} {"train_loss": -5.514163970947266, "global_step": 30411, "epoch": 724} {"train_loss": -5.463052749633789, "global_step": 30412, "epoch": 724} {"train_loss": -5.552352428436279, "global_step": 30413, "epoch": 724} {"train_loss": -5.489992141723633, "global_step": 30414, "epoch": 724} {"train_loss": -5.565889358520508, "global_step": 30415, "epoch": 724} {"train_loss": -5.525449752807617, "global_step": 30416, "epoch": 724} {"train_loss": -5.547076225280762, "global_step": 30417, "epoch": 724} {"train_loss": -5.410686492919922, "global_step": 30418, "epoch": 724} {"train_loss": -5.573577880859375, "global_step": 30419, "epoch": 724} {"train_loss": -5.568934440612793, "global_step": 30420, "epoch": 724} {"train_loss": -5.316123962402344, "global_step": 30421, "epoch": 724} {"train_loss": -5.439610481262207, "global_step": 30422, "epoch": 724} {"train_loss": -5.617892742156982, "global_step": 30423, "epoch": 724} {"train_loss": -5.598889350891113, "global_step": 30424, "epoch": 724} {"train_loss": -5.432342529296875, "global_step": 30425, "epoch": 724} {"train_loss": -5.484712600708008, "global_step": 30426, "epoch": 724} {"train_loss": -5.555953025817871, "global_step": 30427, "epoch": 724} {"train_loss": -5.3943352699279785, "global_step": 30428, "epoch": 724} {"train_loss": -5.512953758239746, "global_step": 30429, "epoch": 724} {"train_loss": -5.500998497009277, "global_step": 30430, "epoch": 724} {"train_loss": -5.391828536987305, "global_step": 30431, "epoch": 724} {"train_loss": -5.540024757385254, "global_step": 30432, "epoch": 724} {"train_loss": -5.511192321777344, "global_step": 30433, "epoch": 724} {"train_loss": -5.3687214851379395, "global_step": 30434, "epoch": 724} {"train_loss": -5.554347515106201, "global_step": 30435, "epoch": 724} {"train_loss": -5.330047607421875, "global_step": 30436, "epoch": 724} {"train_loss": -5.534458160400391, "global_step": 30437, "epoch": 724} {"train_loss": -5.485422134399414, "global_step": 30438, "epoch": 724} {"train_loss": -5.359636306762695, "global_step": 30439, "epoch": 724} {"train_loss": -5.364475250244141, "global_step": 30440, "epoch": 724} {"train_loss": -5.325130462646484, "global_step": 30441, "epoch": 724} {"train_loss": -5.439120292663574, "global_step": 30442, "epoch": 724} {"train_loss": -5.398443222045898, "global_step": 30443, "epoch": 724} {"train_loss": -5.50076961517334, "global_step": 30444, "epoch": 724} {"train_loss": -5.538216590881348, "global_step": 30445, "epoch": 724} {"train_loss": -5.375336170196533, "global_step": 30446, "epoch": 724} {"train_loss": -5.455997943878174, "global_step": 30447, "epoch": 724} {"train_loss": -5.429161071777344, "global_step": 30448, "epoch": 724} {"train_loss": -5.473777123859951, "global_step": 30449, "epoch": 724, "val_loss": 63399.7421875} {"train_loss": -5.625887870788574, "global_step": 30450, "epoch": 725} {"train_loss": -5.4653778076171875, "global_step": 30451, "epoch": 725} {"train_loss": -5.493275165557861, "global_step": 30452, "epoch": 725} {"train_loss": -5.361148834228516, "global_step": 30453, "epoch": 725} {"train_loss": -5.537264347076416, "global_step": 30454, "epoch": 725} {"train_loss": -5.433168411254883, "global_step": 30455, "epoch": 725} {"train_loss": -5.431277275085449, "global_step": 30456, "epoch": 725} {"train_loss": -5.4526777267456055, "global_step": 30457, "epoch": 725} {"train_loss": -5.420461177825928, "global_step": 30458, "epoch": 725} {"train_loss": -5.483410835266113, "global_step": 30459, "epoch": 725} {"train_loss": -5.517607688903809, "global_step": 30460, "epoch": 725} {"train_loss": -5.385526657104492, "global_step": 30461, "epoch": 725} {"train_loss": -5.54895544052124, "global_step": 30462, "epoch": 725} {"train_loss": -5.473649024963379, "global_step": 30463, "epoch": 725} {"train_loss": -5.416513442993164, "global_step": 30464, "epoch": 725} {"train_loss": -5.585453033447266, "global_step": 30465, "epoch": 725} {"train_loss": -5.504940986633301, "global_step": 30466, "epoch": 725} {"train_loss": -5.531078815460205, "global_step": 30467, "epoch": 725} {"train_loss": -5.431540012359619, "global_step": 30468, "epoch": 725} {"train_loss": -5.449804782867432, "global_step": 30469, "epoch": 725} {"train_loss": -5.474450588226318, "global_step": 30470, "epoch": 725} {"train_loss": -5.519600868225098, "global_step": 30471, "epoch": 725} {"train_loss": -5.435572624206543, "global_step": 30472, "epoch": 725} {"train_loss": -5.493579864501953, "global_step": 30473, "epoch": 725} {"train_loss": -5.367332458496094, "global_step": 30474, "epoch": 725} {"train_loss": -5.482619285583496, "global_step": 30475, "epoch": 725} {"train_loss": -5.486822128295898, "global_step": 30476, "epoch": 725} {"train_loss": -5.3356499671936035, "global_step": 30477, "epoch": 725} {"train_loss": -5.463974952697754, "global_step": 30478, "epoch": 725} {"train_loss": -5.378026008605957, "global_step": 30479, "epoch": 725} {"train_loss": -5.554885387420654, "global_step": 30480, "epoch": 725} {"train_loss": -5.403825759887695, "global_step": 30481, "epoch": 725} {"train_loss": -5.44734001159668, "global_step": 30482, "epoch": 725} {"train_loss": -5.466582298278809, "global_step": 30483, "epoch": 725} {"train_loss": -5.457924842834473, "global_step": 30484, "epoch": 725} {"train_loss": -5.552671432495117, "global_step": 30485, "epoch": 725} {"train_loss": -5.372733116149902, "global_step": 30486, "epoch": 725} {"train_loss": -5.495443344116211, "global_step": 30487, "epoch": 725} {"train_loss": -5.4800872802734375, "global_step": 30488, "epoch": 725} {"train_loss": -5.439386367797852, "global_step": 30489, "epoch": 725} {"train_loss": -5.379063129425049, "global_step": 30490, "epoch": 725} {"train_loss": -5.460933446884155, "global_step": 30491, "epoch": 725, "val_loss": 63135.77734375} {"train_loss": -5.488410949707031, "global_step": 30492, "epoch": 726} {"train_loss": -5.498353004455566, "global_step": 30493, "epoch": 726} {"train_loss": -5.442396640777588, "global_step": 30494, "epoch": 726} {"train_loss": -5.554859161376953, "global_step": 30495, "epoch": 726} {"train_loss": -5.474572658538818, "global_step": 30496, "epoch": 726} {"train_loss": -5.5049147605896, "global_step": 30497, "epoch": 726} {"train_loss": -5.562248229980469, "global_step": 30498, "epoch": 726} {"train_loss": -5.330151557922363, "global_step": 30499, "epoch": 726} {"train_loss": -5.476073265075684, "global_step": 30500, "epoch": 726} {"train_loss": -5.382544040679932, "global_step": 30501, "epoch": 726} {"train_loss": -5.452702522277832, "global_step": 30502, "epoch": 726} {"train_loss": -5.641664505004883, "global_step": 30503, "epoch": 726} {"train_loss": -5.452695846557617, "global_step": 30504, "epoch": 726} {"train_loss": -5.413719177246094, "global_step": 30505, "epoch": 726} {"train_loss": -5.443157196044922, "global_step": 30506, "epoch": 726} {"train_loss": -5.629549026489258, "global_step": 30507, "epoch": 726} {"train_loss": -5.414235591888428, "global_step": 30508, "epoch": 726} {"train_loss": -5.445542335510254, "global_step": 30509, "epoch": 726} {"train_loss": -5.4059038162231445, "global_step": 30510, "epoch": 726} {"train_loss": -5.403110027313232, "global_step": 30511, "epoch": 726} {"train_loss": -5.421384811401367, "global_step": 30512, "epoch": 726} {"train_loss": -5.446319103240967, "global_step": 30513, "epoch": 726} {"train_loss": -5.372697353363037, "global_step": 30514, "epoch": 726} {"train_loss": -5.446422576904297, "global_step": 30515, "epoch": 726} {"train_loss": -5.414899826049805, "global_step": 30516, "epoch": 726} {"train_loss": -5.479828834533691, "global_step": 30517, "epoch": 726} {"train_loss": -5.532985687255859, "global_step": 30518, "epoch": 726} {"train_loss": -5.377803802490234, "global_step": 30519, "epoch": 726} {"train_loss": -5.541886329650879, "global_step": 30520, "epoch": 726} {"train_loss": -5.3968963623046875, "global_step": 30521, "epoch": 726} {"train_loss": -5.318173408508301, "global_step": 30522, "epoch": 726} {"train_loss": -5.536186218261719, "global_step": 30523, "epoch": 726} {"train_loss": -5.4818854331970215, "global_step": 30524, "epoch": 726} {"train_loss": -5.4027814865112305, "global_step": 30525, "epoch": 726} {"train_loss": -5.381511211395264, "global_step": 30526, "epoch": 726} {"train_loss": -5.579598426818848, "global_step": 30527, "epoch": 726} {"train_loss": -5.511519432067871, "global_step": 30528, "epoch": 726} {"train_loss": -5.355642318725586, "global_step": 30529, "epoch": 726} {"train_loss": -5.532540798187256, "global_step": 30530, "epoch": 726} {"train_loss": -5.3829345703125, "global_step": 30531, "epoch": 726} {"train_loss": -5.478729248046875, "global_step": 30532, "epoch": 726} {"train_loss": -5.456742706752959, "global_step": 30533, "epoch": 726, "val_loss": 63240.37890625} {"train_loss": -5.411155700683594, "global_step": 30534, "epoch": 727} {"train_loss": -5.516570091247559, "global_step": 30535, "epoch": 727} {"train_loss": -5.52860164642334, "global_step": 30536, "epoch": 727} {"train_loss": -5.6117634773254395, "global_step": 30537, "epoch": 727} {"train_loss": -5.4150190353393555, "global_step": 30538, "epoch": 727} {"train_loss": -5.518354415893555, "global_step": 30539, "epoch": 727} {"train_loss": -5.25960636138916, "global_step": 30540, "epoch": 727} {"train_loss": -5.5194220542907715, "global_step": 30541, "epoch": 727} {"train_loss": -5.583475112915039, "global_step": 30542, "epoch": 727} {"train_loss": -5.537746429443359, "global_step": 30543, "epoch": 727} {"train_loss": -5.462083339691162, "global_step": 30544, "epoch": 727} {"train_loss": -5.479892730712891, "global_step": 30545, "epoch": 727} {"train_loss": -5.427058219909668, "global_step": 30546, "epoch": 727} {"train_loss": -5.63962984085083, "global_step": 30547, "epoch": 727} {"train_loss": -5.472934722900391, "global_step": 30548, "epoch": 727} {"train_loss": -5.568853855133057, "global_step": 30549, "epoch": 727} {"train_loss": -5.428667068481445, "global_step": 30550, "epoch": 727} {"train_loss": -5.408663272857666, "global_step": 30551, "epoch": 727} {"train_loss": -5.455050945281982, "global_step": 30552, "epoch": 727} {"train_loss": -5.51981258392334, "global_step": 30553, "epoch": 727} {"train_loss": -5.386754989624023, "global_step": 30554, "epoch": 727} {"train_loss": -5.500931739807129, "global_step": 30555, "epoch": 727} {"train_loss": -5.493769645690918, "global_step": 30556, "epoch": 727} {"train_loss": -5.460838794708252, "global_step": 30557, "epoch": 727} {"train_loss": -5.55897855758667, "global_step": 30558, "epoch": 727} {"train_loss": -5.523810386657715, "global_step": 30559, "epoch": 727} {"train_loss": -5.542688846588135, "global_step": 30560, "epoch": 727} {"train_loss": -5.481054306030273, "global_step": 30561, "epoch": 727} {"train_loss": -5.5950164794921875, "global_step": 30562, "epoch": 727} {"train_loss": -5.536961555480957, "global_step": 30563, "epoch": 727} {"train_loss": -5.440431594848633, "global_step": 30564, "epoch": 727} {"train_loss": -5.504161834716797, "global_step": 30565, "epoch": 727} {"train_loss": -5.452654838562012, "global_step": 30566, "epoch": 727} {"train_loss": -5.491458892822266, "global_step": 30567, "epoch": 727} {"train_loss": -5.572896957397461, "global_step": 30568, "epoch": 727} {"train_loss": -5.459205627441406, "global_step": 30569, "epoch": 727} {"train_loss": -5.562368869781494, "global_step": 30570, "epoch": 727} {"train_loss": -5.484493255615234, "global_step": 30571, "epoch": 727} {"train_loss": -5.46595573425293, "global_step": 30572, "epoch": 727} {"train_loss": -5.561811923980713, "global_step": 30573, "epoch": 727} {"train_loss": -5.548442840576172, "global_step": 30574, "epoch": 727} {"train_loss": -5.493758587610154, "global_step": 30575, "epoch": 727, "val_loss": 63195.6171875} {"train_loss": -5.593779563903809, "global_step": 30576, "epoch": 728} {"train_loss": -5.281306266784668, "global_step": 30577, "epoch": 728} {"train_loss": -5.442019462585449, "global_step": 30578, "epoch": 728} {"train_loss": -5.51913595199585, "global_step": 30579, "epoch": 728} {"train_loss": -5.490606307983398, "global_step": 30580, "epoch": 728} {"train_loss": -5.431445121765137, "global_step": 30581, "epoch": 728} {"train_loss": -5.496360778808594, "global_step": 30582, "epoch": 728} {"train_loss": -5.521729469299316, "global_step": 30583, "epoch": 728} {"train_loss": -5.520963191986084, "global_step": 30584, "epoch": 728} {"train_loss": -5.5523681640625, "global_step": 30585, "epoch": 728} {"train_loss": -5.565280914306641, "global_step": 30586, "epoch": 728} {"train_loss": -5.42078971862793, "global_step": 30587, "epoch": 728} {"train_loss": -5.491568565368652, "global_step": 30588, "epoch": 728} {"train_loss": -5.628963470458984, "global_step": 30589, "epoch": 728} {"train_loss": -5.37067174911499, "global_step": 30590, "epoch": 728} {"train_loss": -5.366607666015625, "global_step": 30591, "epoch": 728} {"train_loss": -5.407610893249512, "global_step": 30592, "epoch": 728} {"train_loss": -5.339023113250732, "global_step": 30593, "epoch": 728} {"train_loss": -5.426659107208252, "global_step": 30594, "epoch": 728} {"train_loss": -5.46048641204834, "global_step": 30595, "epoch": 728} {"train_loss": -5.420269966125488, "global_step": 30596, "epoch": 728} {"train_loss": -5.543503761291504, "global_step": 30597, "epoch": 728} {"train_loss": -5.441885471343994, "global_step": 30598, "epoch": 728} {"train_loss": -5.398540496826172, "global_step": 30599, "epoch": 728} {"train_loss": -5.498927593231201, "global_step": 30600, "epoch": 728} {"train_loss": -5.338864326477051, "global_step": 30601, "epoch": 728} {"train_loss": -5.5507683753967285, "global_step": 30602, "epoch": 728} {"train_loss": -5.437054634094238, "global_step": 30603, "epoch": 728} {"train_loss": -5.516800880432129, "global_step": 30604, "epoch": 728} {"train_loss": -5.513298034667969, "global_step": 30605, "epoch": 728} {"train_loss": -5.5226545333862305, "global_step": 30606, "epoch": 728} {"train_loss": -5.509097099304199, "global_step": 30607, "epoch": 728} {"train_loss": -5.469200134277344, "global_step": 30608, "epoch": 728} {"train_loss": -5.603341102600098, "global_step": 30609, "epoch": 728} {"train_loss": -5.363247394561768, "global_step": 30610, "epoch": 728} {"train_loss": -5.518928527832031, "global_step": 30611, "epoch": 728} {"train_loss": -5.570306777954102, "global_step": 30612, "epoch": 728} {"train_loss": -5.407474517822266, "global_step": 30613, "epoch": 728} {"train_loss": -5.478416919708252, "global_step": 30614, "epoch": 728} {"train_loss": -5.40717887878418, "global_step": 30615, "epoch": 728} {"train_loss": -5.460527420043945, "global_step": 30616, "epoch": 728} {"train_loss": -5.4729180335998535, "global_step": 30617, "epoch": 728, "val_loss": 63012.64453125} {"train_loss": -5.4483466148376465, "global_step": 30618, "epoch": 729} {"train_loss": -5.467939376831055, "global_step": 30619, "epoch": 729} {"train_loss": -5.6378889083862305, "global_step": 30620, "epoch": 729} {"train_loss": -5.698282241821289, "global_step": 30621, "epoch": 729} {"train_loss": -5.419983863830566, "global_step": 30622, "epoch": 729} {"train_loss": -5.497586250305176, "global_step": 30623, "epoch": 729} {"train_loss": -5.519346237182617, "global_step": 30624, "epoch": 729} {"train_loss": -5.334554672241211, "global_step": 30625, "epoch": 729} {"train_loss": -5.470084190368652, "global_step": 30626, "epoch": 729} {"train_loss": -5.420458793640137, "global_step": 30627, "epoch": 729} {"train_loss": -5.371330738067627, "global_step": 30628, "epoch": 729} {"train_loss": -5.449668884277344, "global_step": 30629, "epoch": 729} {"train_loss": -5.363112926483154, "global_step": 30630, "epoch": 729} {"train_loss": -5.4961395263671875, "global_step": 30631, "epoch": 729} {"train_loss": -5.592660427093506, "global_step": 30632, "epoch": 729} {"train_loss": -5.4419145584106445, "global_step": 30633, "epoch": 729} {"train_loss": -5.544015407562256, "global_step": 30634, "epoch": 729} {"train_loss": -5.397028923034668, "global_step": 30635, "epoch": 729} {"train_loss": -5.430995941162109, "global_step": 30636, "epoch": 729} {"train_loss": -5.552038192749023, "global_step": 30637, "epoch": 729} {"train_loss": -5.569891929626465, "global_step": 30638, "epoch": 729} {"train_loss": -5.548591613769531, "global_step": 30639, "epoch": 729} {"train_loss": -5.466004371643066, "global_step": 30640, "epoch": 729} {"train_loss": -5.3661603927612305, "global_step": 30641, "epoch": 729} {"train_loss": -5.51760721206665, "global_step": 30642, "epoch": 729} {"train_loss": -5.487486362457275, "global_step": 30643, "epoch": 729} {"train_loss": -5.3696393966674805, "global_step": 30644, "epoch": 729} {"train_loss": -5.509101867675781, "global_step": 30645, "epoch": 729} {"train_loss": -5.477316856384277, "global_step": 30646, "epoch": 729} {"train_loss": -5.527723789215088, "global_step": 30647, "epoch": 729} {"train_loss": -5.492383003234863, "global_step": 30648, "epoch": 729} {"train_loss": -5.494046688079834, "global_step": 30649, "epoch": 729} {"train_loss": -5.476839065551758, "global_step": 30650, "epoch": 729} {"train_loss": -5.531881809234619, "global_step": 30651, "epoch": 729} {"train_loss": -5.497896194458008, "global_step": 30652, "epoch": 729} {"train_loss": -5.487859725952148, "global_step": 30653, "epoch": 729} {"train_loss": -5.519735336303711, "global_step": 30654, "epoch": 729} {"train_loss": -5.465426445007324, "global_step": 30655, "epoch": 729} {"train_loss": -5.502189636230469, "global_step": 30656, "epoch": 729} {"train_loss": -5.535458087921143, "global_step": 30657, "epoch": 729} {"train_loss": -5.464235305786133, "global_step": 30658, "epoch": 729} {"train_loss": -5.484329916182018, "global_step": 30659, "epoch": 729, "val_loss": 63457.0703125} {"train_loss": -5.4840545654296875, "global_step": 30660, "epoch": 730} {"train_loss": -5.514399528503418, "global_step": 30661, "epoch": 730} {"train_loss": -5.4393510818481445, "global_step": 30662, "epoch": 730} {"train_loss": -5.546331882476807, "global_step": 30663, "epoch": 730} {"train_loss": -5.537647724151611, "global_step": 30664, "epoch": 730} {"train_loss": -5.480504035949707, "global_step": 30665, "epoch": 730} {"train_loss": -5.501569747924805, "global_step": 30666, "epoch": 730} {"train_loss": -5.455148696899414, "global_step": 30667, "epoch": 730} {"train_loss": -5.488779067993164, "global_step": 30668, "epoch": 730} {"train_loss": -5.387134552001953, "global_step": 30669, "epoch": 730} {"train_loss": -5.348838806152344, "global_step": 30670, "epoch": 730} {"train_loss": -5.513967514038086, "global_step": 30671, "epoch": 730} {"train_loss": -5.526797294616699, "global_step": 30672, "epoch": 730} {"train_loss": -5.602335453033447, "global_step": 30673, "epoch": 730} {"train_loss": -5.56338357925415, "global_step": 30674, "epoch": 730} {"train_loss": -5.5365495681762695, "global_step": 30675, "epoch": 730} {"train_loss": -5.533659934997559, "global_step": 30676, "epoch": 730} {"train_loss": -5.457104206085205, "global_step": 30677, "epoch": 730} {"train_loss": -5.585017681121826, "global_step": 30678, "epoch": 730} {"train_loss": -5.548434734344482, "global_step": 30679, "epoch": 730} {"train_loss": -5.554972171783447, "global_step": 30680, "epoch": 730} {"train_loss": -5.593387603759766, "global_step": 30681, "epoch": 730} {"train_loss": -5.4364776611328125, "global_step": 30682, "epoch": 730} {"train_loss": -5.402486801147461, "global_step": 30683, "epoch": 730} {"train_loss": -5.500662326812744, "global_step": 30684, "epoch": 730} {"train_loss": -5.592299461364746, "global_step": 30685, "epoch": 730} {"train_loss": -5.593109130859375, "global_step": 30686, "epoch": 730} {"train_loss": -5.4586968421936035, "global_step": 30687, "epoch": 730} {"train_loss": -5.574902534484863, "global_step": 30688, "epoch": 730} {"train_loss": -5.491410255432129, "global_step": 30689, "epoch": 730} {"train_loss": -5.566957473754883, "global_step": 30690, "epoch": 730} {"train_loss": -5.446386337280273, "global_step": 30691, "epoch": 730} {"train_loss": -5.476770877838135, "global_step": 30692, "epoch": 730} {"train_loss": -5.368408203125, "global_step": 30693, "epoch": 730} {"train_loss": -5.421603202819824, "global_step": 30694, "epoch": 730} {"train_loss": -5.474055290222168, "global_step": 30695, "epoch": 730} {"train_loss": -5.457219123840332, "global_step": 30696, "epoch": 730} {"train_loss": -5.308590888977051, "global_step": 30697, "epoch": 730} {"train_loss": -5.5358734130859375, "global_step": 30698, "epoch": 730} {"train_loss": -5.424693584442139, "global_step": 30699, "epoch": 730} {"train_loss": -5.421019554138184, "global_step": 30700, "epoch": 730} {"train_loss": -5.488965295609974, "global_step": 30701, "epoch": 730, "val_loss": 63247.42578125} {"train_loss": -5.408352375030518, "global_step": 30702, "epoch": 731} {"train_loss": -5.493961334228516, "global_step": 30703, "epoch": 731} {"train_loss": -5.389715194702148, "global_step": 30704, "epoch": 731} {"train_loss": -5.495875358581543, "global_step": 30705, "epoch": 731} {"train_loss": -5.5893025398254395, "global_step": 30706, "epoch": 731} {"train_loss": -5.4952168464660645, "global_step": 30707, "epoch": 731} {"train_loss": -5.674756050109863, "global_step": 30708, "epoch": 731} {"train_loss": -5.435359001159668, "global_step": 30709, "epoch": 731} {"train_loss": -5.361556053161621, "global_step": 30710, "epoch": 731} {"train_loss": -5.507973670959473, "global_step": 30711, "epoch": 731} {"train_loss": -5.551083087921143, "global_step": 30712, "epoch": 731} {"train_loss": -5.40080451965332, "global_step": 30713, "epoch": 731} {"train_loss": -5.442202091217041, "global_step": 30714, "epoch": 731} {"train_loss": -5.510000228881836, "global_step": 30715, "epoch": 731} {"train_loss": -5.519241809844971, "global_step": 30716, "epoch": 731} {"train_loss": -5.496515274047852, "global_step": 30717, "epoch": 731} {"train_loss": -5.443730354309082, "global_step": 30718, "epoch": 731} {"train_loss": -5.484311580657959, "global_step": 30719, "epoch": 731} {"train_loss": -5.40495491027832, "global_step": 30720, "epoch": 731} {"train_loss": -5.469449996948242, "global_step": 30721, "epoch": 731} {"train_loss": -5.391106605529785, "global_step": 30722, "epoch": 731} {"train_loss": -5.372003555297852, "global_step": 30723, "epoch": 731} {"train_loss": -5.5973801612854, "global_step": 30724, "epoch": 731} {"train_loss": -5.426077365875244, "global_step": 30725, "epoch": 731} {"train_loss": -5.553610801696777, "global_step": 30726, "epoch": 731} {"train_loss": -5.562697410583496, "global_step": 30727, "epoch": 731} {"train_loss": -5.49725341796875, "global_step": 30728, "epoch": 731} {"train_loss": -5.482710838317871, "global_step": 30729, "epoch": 731} {"train_loss": -5.4329633712768555, "global_step": 30730, "epoch": 731} {"train_loss": -5.496697425842285, "global_step": 30731, "epoch": 731} {"train_loss": -5.431319236755371, "global_step": 30732, "epoch": 731} {"train_loss": -5.4351115226745605, "global_step": 30733, "epoch": 731} {"train_loss": -5.45759916305542, "global_step": 30734, "epoch": 731} {"train_loss": -5.574995040893555, "global_step": 30735, "epoch": 731} {"train_loss": -5.465221405029297, "global_step": 30736, "epoch": 731} {"train_loss": -5.656569480895996, "global_step": 30737, "epoch": 731} {"train_loss": -5.461944580078125, "global_step": 30738, "epoch": 731} {"train_loss": -5.4638471603393555, "global_step": 30739, "epoch": 731} {"train_loss": -5.452094078063965, "global_step": 30740, "epoch": 731} {"train_loss": -5.547853946685791, "global_step": 30741, "epoch": 731} {"train_loss": -5.539783477783203, "global_step": 30742, "epoch": 731} {"train_loss": -5.4858113924662275, "global_step": 30743, "epoch": 731, "val_loss": 63635.2734375} {"train_loss": -5.427206993103027, "global_step": 30744, "epoch": 732} {"train_loss": -5.401017189025879, "global_step": 30745, "epoch": 732} {"train_loss": -5.489816665649414, "global_step": 30746, "epoch": 732} {"train_loss": -5.50648307800293, "global_step": 30747, "epoch": 732} {"train_loss": -5.497003555297852, "global_step": 30748, "epoch": 732} {"train_loss": -5.474200248718262, "global_step": 30749, "epoch": 732} {"train_loss": -5.357295989990234, "global_step": 30750, "epoch": 732} {"train_loss": -5.467766761779785, "global_step": 30751, "epoch": 732} {"train_loss": -5.513982772827148, "global_step": 30752, "epoch": 732} {"train_loss": -5.501354217529297, "global_step": 30753, "epoch": 732} {"train_loss": -5.580144882202148, "global_step": 30754, "epoch": 732} {"train_loss": -5.410350322723389, "global_step": 30755, "epoch": 732} {"train_loss": -5.566732406616211, "global_step": 30756, "epoch": 732} {"train_loss": -5.485315322875977, "global_step": 30757, "epoch": 732} {"train_loss": -5.5161871910095215, "global_step": 30758, "epoch": 732} {"train_loss": -5.5192551612854, "global_step": 30759, "epoch": 732} {"train_loss": -5.446077346801758, "global_step": 30760, "epoch": 732} {"train_loss": -5.474879741668701, "global_step": 30761, "epoch": 732} {"train_loss": -5.395040035247803, "global_step": 30762, "epoch": 732} {"train_loss": -5.483976364135742, "global_step": 30763, "epoch": 732} {"train_loss": -5.371715545654297, "global_step": 30764, "epoch": 732} {"train_loss": -5.401029109954834, "global_step": 30765, "epoch": 732} {"train_loss": -5.480281829833984, "global_step": 30766, "epoch": 732} {"train_loss": -5.449082851409912, "global_step": 30767, "epoch": 732} {"train_loss": -5.550498962402344, "global_step": 30768, "epoch": 732} {"train_loss": -5.624199867248535, "global_step": 30769, "epoch": 732} {"train_loss": -5.302496910095215, "global_step": 30770, "epoch": 732} {"train_loss": -5.384528160095215, "global_step": 30771, "epoch": 732} {"train_loss": -5.3644609451293945, "global_step": 30772, "epoch": 732} {"train_loss": -5.4568939208984375, "global_step": 30773, "epoch": 732} {"train_loss": -5.541922569274902, "global_step": 30774, "epoch": 732} {"train_loss": -5.497808456420898, "global_step": 30775, "epoch": 732} {"train_loss": -5.620257377624512, "global_step": 30776, "epoch": 732} {"train_loss": -5.5040388107299805, "global_step": 30777, "epoch": 732} {"train_loss": -5.546331405639648, "global_step": 30778, "epoch": 732} {"train_loss": -5.486627578735352, "global_step": 30779, "epoch": 732} {"train_loss": -5.627645492553711, "global_step": 30780, "epoch": 732} {"train_loss": -5.604307174682617, "global_step": 30781, "epoch": 732} {"train_loss": -5.455660820007324, "global_step": 30782, "epoch": 732} {"train_loss": -5.467947959899902, "global_step": 30783, "epoch": 732} {"train_loss": -5.534458160400391, "global_step": 30784, "epoch": 732} {"train_loss": -5.4830854052589055, "global_step": 30785, "epoch": 732, "val_loss": 63167.3203125} {"train_loss": -5.4904327392578125, "global_step": 30786, "epoch": 733} {"train_loss": -5.544078350067139, "global_step": 30787, "epoch": 733} {"train_loss": -5.582981109619141, "global_step": 30788, "epoch": 733} {"train_loss": -5.496877193450928, "global_step": 30789, "epoch": 733} {"train_loss": -5.5100836753845215, "global_step": 30790, "epoch": 733} {"train_loss": -5.433957099914551, "global_step": 30791, "epoch": 733} {"train_loss": -5.626073837280273, "global_step": 30792, "epoch": 733} {"train_loss": -5.449538707733154, "global_step": 30793, "epoch": 733} {"train_loss": -5.539252758026123, "global_step": 30794, "epoch": 733} {"train_loss": -5.472538948059082, "global_step": 30795, "epoch": 733} {"train_loss": -5.448882102966309, "global_step": 30796, "epoch": 733} {"train_loss": -5.540943145751953, "global_step": 30797, "epoch": 733} {"train_loss": -5.523035526275635, "global_step": 30798, "epoch": 733} {"train_loss": -5.379088401794434, "global_step": 30799, "epoch": 733} {"train_loss": -5.517792701721191, "global_step": 30800, "epoch": 733} {"train_loss": -5.579854488372803, "global_step": 30801, "epoch": 733} {"train_loss": -5.525128364562988, "global_step": 30802, "epoch": 733} {"train_loss": -5.499820709228516, "global_step": 30803, "epoch": 733} {"train_loss": -5.444873809814453, "global_step": 30804, "epoch": 733} {"train_loss": -5.488265514373779, "global_step": 30805, "epoch": 733} {"train_loss": -5.288980960845947, "global_step": 30806, "epoch": 733} {"train_loss": -5.440025329589844, "global_step": 30807, "epoch": 733} {"train_loss": -5.449284553527832, "global_step": 30808, "epoch": 733} {"train_loss": -5.422845363616943, "global_step": 30809, "epoch": 733} {"train_loss": -5.565101146697998, "global_step": 30810, "epoch": 733} {"train_loss": -5.565164089202881, "global_step": 30811, "epoch": 733} {"train_loss": -5.4817070960998535, "global_step": 30812, "epoch": 733} {"train_loss": -5.466817855834961, "global_step": 30813, "epoch": 733} {"train_loss": -5.450884819030762, "global_step": 30814, "epoch": 733} {"train_loss": -5.471266746520996, "global_step": 30815, "epoch": 733} {"train_loss": -5.498837471008301, "global_step": 30816, "epoch": 733} {"train_loss": -5.336399555206299, "global_step": 30817, "epoch": 733} {"train_loss": -5.540009021759033, "global_step": 30818, "epoch": 733} {"train_loss": -5.487604141235352, "global_step": 30819, "epoch": 733} {"train_loss": -5.453859329223633, "global_step": 30820, "epoch": 733} {"train_loss": -5.43674898147583, "global_step": 30821, "epoch": 733} {"train_loss": -5.464815616607666, "global_step": 30822, "epoch": 733} {"train_loss": -5.439599990844727, "global_step": 30823, "epoch": 733} {"train_loss": -5.44529914855957, "global_step": 30824, "epoch": 733} {"train_loss": -5.3687849044799805, "global_step": 30825, "epoch": 733} {"train_loss": -5.543214797973633, "global_step": 30826, "epoch": 733} {"train_loss": -5.4786833467937655, "global_step": 30827, "epoch": 733, "val_loss": 63565.5078125} {"train_loss": -5.532650947570801, "global_step": 30828, "epoch": 734} {"train_loss": -5.618054389953613, "global_step": 30829, "epoch": 734} {"train_loss": -5.489199638366699, "global_step": 30830, "epoch": 734} {"train_loss": -5.441483497619629, "global_step": 30831, "epoch": 734} {"train_loss": -5.537015914916992, "global_step": 30832, "epoch": 734} {"train_loss": -5.664276123046875, "global_step": 30833, "epoch": 734} {"train_loss": -5.476158142089844, "global_step": 30834, "epoch": 734} {"train_loss": -5.3871307373046875, "global_step": 30835, "epoch": 734} {"train_loss": -5.402932167053223, "global_step": 30836, "epoch": 734} {"train_loss": -5.5189008712768555, "global_step": 30837, "epoch": 734} {"train_loss": -5.5571441650390625, "global_step": 30838, "epoch": 734} {"train_loss": -5.451104164123535, "global_step": 30839, "epoch": 734} {"train_loss": -5.434812545776367, "global_step": 30840, "epoch": 734} {"train_loss": -5.584668159484863, "global_step": 30841, "epoch": 734} {"train_loss": -5.545868873596191, "global_step": 30842, "epoch": 734} {"train_loss": -5.552421569824219, "global_step": 30843, "epoch": 734} {"train_loss": -5.487451076507568, "global_step": 30844, "epoch": 734} {"train_loss": -5.432738304138184, "global_step": 30845, "epoch": 734} {"train_loss": -5.392285346984863, "global_step": 30846, "epoch": 734} {"train_loss": -5.505795478820801, "global_step": 30847, "epoch": 734} {"train_loss": -5.470013618469238, "global_step": 30848, "epoch": 734} {"train_loss": -5.559383392333984, "global_step": 30849, "epoch": 734} {"train_loss": -5.555472373962402, "global_step": 30850, "epoch": 734} {"train_loss": -5.4041643142700195, "global_step": 30851, "epoch": 734} {"train_loss": -5.446432113647461, "global_step": 30852, "epoch": 734} {"train_loss": -5.46657133102417, "global_step": 30853, "epoch": 734} {"train_loss": -5.536113262176514, "global_step": 30854, "epoch": 734} {"train_loss": -5.652778625488281, "global_step": 30855, "epoch": 734} {"train_loss": -5.466350078582764, "global_step": 30856, "epoch": 734} {"train_loss": -5.498848915100098, "global_step": 30857, "epoch": 734} {"train_loss": -5.396481513977051, "global_step": 30858, "epoch": 734} {"train_loss": -5.581554412841797, "global_step": 30859, "epoch": 734} {"train_loss": -5.579491138458252, "global_step": 30860, "epoch": 734} {"train_loss": -5.591106414794922, "global_step": 30861, "epoch": 734} {"train_loss": -5.541600227355957, "global_step": 30862, "epoch": 734} {"train_loss": -5.507329940795898, "global_step": 30863, "epoch": 734} {"train_loss": -5.594888210296631, "global_step": 30864, "epoch": 734} {"train_loss": -5.572545051574707, "global_step": 30865, "epoch": 734} {"train_loss": -5.5295867919921875, "global_step": 30866, "epoch": 734} {"train_loss": -5.458636283874512, "global_step": 30867, "epoch": 734} {"train_loss": -5.4528093338012695, "global_step": 30868, "epoch": 734} {"train_loss": -5.513328881490798, "global_step": 30869, "epoch": 734, "val_loss": 63211.08203125} {"train_loss": -5.445682048797607, "global_step": 30870, "epoch": 735} {"train_loss": -5.5228729248046875, "global_step": 30871, "epoch": 735} {"train_loss": -5.467740535736084, "global_step": 30872, "epoch": 735} {"train_loss": -5.517749786376953, "global_step": 30873, "epoch": 735} {"train_loss": -5.4832258224487305, "global_step": 30874, "epoch": 735} {"train_loss": -5.594706058502197, "global_step": 30875, "epoch": 735} {"train_loss": -5.521306991577148, "global_step": 30876, "epoch": 735} {"train_loss": -5.356368064880371, "global_step": 30877, "epoch": 735} {"train_loss": -5.5602850914001465, "global_step": 30878, "epoch": 735} {"train_loss": -5.509665012359619, "global_step": 30879, "epoch": 735} {"train_loss": -5.412632465362549, "global_step": 30880, "epoch": 735} {"train_loss": -5.426598072052002, "global_step": 30881, "epoch": 735} {"train_loss": -5.476598739624023, "global_step": 30882, "epoch": 735} {"train_loss": -5.557327747344971, "global_step": 30883, "epoch": 735} {"train_loss": -5.487144470214844, "global_step": 30884, "epoch": 735} {"train_loss": -5.591437816619873, "global_step": 30885, "epoch": 735} {"train_loss": -5.567190170288086, "global_step": 30886, "epoch": 735} {"train_loss": -5.540763854980469, "global_step": 30887, "epoch": 735} {"train_loss": -5.585501670837402, "global_step": 30888, "epoch": 735} {"train_loss": -5.440518856048584, "global_step": 30889, "epoch": 735} {"train_loss": -5.513557434082031, "global_step": 30890, "epoch": 735} {"train_loss": -5.5875043869018555, "global_step": 30891, "epoch": 735} {"train_loss": -5.354950428009033, "global_step": 30892, "epoch": 735} {"train_loss": -5.423994064331055, "global_step": 30893, "epoch": 735} {"train_loss": -5.529801845550537, "global_step": 30894, "epoch": 735} {"train_loss": -5.418938636779785, "global_step": 30895, "epoch": 735} {"train_loss": -5.4826531410217285, "global_step": 30896, "epoch": 735} {"train_loss": -5.564309597015381, "global_step": 30897, "epoch": 735} {"train_loss": -5.613435745239258, "global_step": 30898, "epoch": 735} {"train_loss": -5.435956954956055, "global_step": 30899, "epoch": 735} {"train_loss": -5.395838260650635, "global_step": 30900, "epoch": 735} {"train_loss": -5.503118515014648, "global_step": 30901, "epoch": 735} {"train_loss": -5.490002632141113, "global_step": 30902, "epoch": 735} {"train_loss": -5.505063533782959, "global_step": 30903, "epoch": 735} {"train_loss": -5.523046493530273, "global_step": 30904, "epoch": 735} {"train_loss": -5.506425857543945, "global_step": 30905, "epoch": 735} {"train_loss": -5.539475917816162, "global_step": 30906, "epoch": 735} {"train_loss": -5.492274761199951, "global_step": 30907, "epoch": 735} {"train_loss": -5.482392311096191, "global_step": 30908, "epoch": 735} {"train_loss": -5.536374092102051, "global_step": 30909, "epoch": 735} {"train_loss": -5.4583048820495605, "global_step": 30910, "epoch": 735} {"train_loss": -5.49835163071042, "global_step": 30911, "epoch": 735, "val_loss": 63608.1953125} {"train_loss": -5.439996242523193, "global_step": 30912, "epoch": 736} {"train_loss": -5.221616744995117, "global_step": 30913, "epoch": 736} {"train_loss": -5.465084075927734, "global_step": 30914, "epoch": 736} {"train_loss": -5.423885822296143, "global_step": 30915, "epoch": 736} {"train_loss": -5.310997486114502, "global_step": 30916, "epoch": 736} {"train_loss": -5.4105377197265625, "global_step": 30917, "epoch": 736} {"train_loss": -5.406467914581299, "global_step": 30918, "epoch": 736} {"train_loss": -5.454094409942627, "global_step": 30919, "epoch": 736} {"train_loss": -5.473062992095947, "global_step": 30920, "epoch": 736} {"train_loss": -5.494972229003906, "global_step": 30921, "epoch": 736} {"train_loss": -5.39735221862793, "global_step": 30922, "epoch": 736} {"train_loss": -5.507956027984619, "global_step": 30923, "epoch": 736} {"train_loss": -5.464775085449219, "global_step": 30924, "epoch": 736} {"train_loss": -5.497439861297607, "global_step": 30925, "epoch": 736} {"train_loss": -5.466131210327148, "global_step": 30926, "epoch": 736} {"train_loss": -5.425329208374023, "global_step": 30927, "epoch": 736} {"train_loss": -5.411324501037598, "global_step": 30928, "epoch": 736} {"train_loss": -5.520187854766846, "global_step": 30929, "epoch": 736} {"train_loss": -5.479848861694336, "global_step": 30930, "epoch": 736} {"train_loss": -5.523655891418457, "global_step": 30931, "epoch": 736} {"train_loss": -5.493547439575195, "global_step": 30932, "epoch": 736} {"train_loss": -5.353943824768066, "global_step": 30933, "epoch": 736} {"train_loss": -5.44399356842041, "global_step": 30934, "epoch": 736} {"train_loss": -5.428829193115234, "global_step": 30935, "epoch": 736} {"train_loss": -5.45805549621582, "global_step": 30936, "epoch": 736} {"train_loss": -5.6047587394714355, "global_step": 30937, "epoch": 736} {"train_loss": -5.5874128341674805, "global_step": 30938, "epoch": 736} {"train_loss": -5.397505283355713, "global_step": 30939, "epoch": 736} {"train_loss": -5.485886573791504, "global_step": 30940, "epoch": 736} {"train_loss": -5.586797714233398, "global_step": 30941, "epoch": 736} {"train_loss": -5.513679504394531, "global_step": 30942, "epoch": 736} {"train_loss": -5.470237731933594, "global_step": 30943, "epoch": 736} {"train_loss": -5.521761417388916, "global_step": 30944, "epoch": 736} {"train_loss": -5.504149436950684, "global_step": 30945, "epoch": 736} {"train_loss": -5.450335502624512, "global_step": 30946, "epoch": 736} {"train_loss": -5.501687049865723, "global_step": 30947, "epoch": 736} {"train_loss": -5.469730377197266, "global_step": 30948, "epoch": 736} {"train_loss": -5.404803276062012, "global_step": 30949, "epoch": 736} {"train_loss": -5.36787223815918, "global_step": 30950, "epoch": 736} {"train_loss": -5.27561092376709, "global_step": 30951, "epoch": 736} {"train_loss": -5.472970008850098, "global_step": 30952, "epoch": 736} {"train_loss": -5.455032076154437, "global_step": 30953, "epoch": 736, "val_loss": 63273.90234375} {"train_loss": -5.4604172706604, "global_step": 30954, "epoch": 737} {"train_loss": -5.53930139541626, "global_step": 30955, "epoch": 737} {"train_loss": -5.405228614807129, "global_step": 30956, "epoch": 737} {"train_loss": -5.474499702453613, "global_step": 30957, "epoch": 737} {"train_loss": -5.4052324295043945, "global_step": 30958, "epoch": 737} {"train_loss": -5.5772857666015625, "global_step": 30959, "epoch": 737} {"train_loss": -5.386646270751953, "global_step": 30960, "epoch": 737} {"train_loss": -5.433239936828613, "global_step": 30961, "epoch": 737} {"train_loss": -5.552584648132324, "global_step": 30962, "epoch": 737} {"train_loss": -5.321476459503174, "global_step": 30963, "epoch": 737} {"train_loss": -5.3563690185546875, "global_step": 30964, "epoch": 737} {"train_loss": -5.631919860839844, "global_step": 30965, "epoch": 737} {"train_loss": -5.46555233001709, "global_step": 30966, "epoch": 737} {"train_loss": -5.566393852233887, "global_step": 30967, "epoch": 737} {"train_loss": -5.421887397766113, "global_step": 30968, "epoch": 737} {"train_loss": -5.543915748596191, "global_step": 30969, "epoch": 737} {"train_loss": -5.560074806213379, "global_step": 30970, "epoch": 737} {"train_loss": -5.581380844116211, "global_step": 30971, "epoch": 737} {"train_loss": -5.457409381866455, "global_step": 30972, "epoch": 737} {"train_loss": -5.459246635437012, "global_step": 30973, "epoch": 737} {"train_loss": -5.480844497680664, "global_step": 30974, "epoch": 737} {"train_loss": -5.529360771179199, "global_step": 30975, "epoch": 737} {"train_loss": -5.456026077270508, "global_step": 30976, "epoch": 737} {"train_loss": -5.498188018798828, "global_step": 30977, "epoch": 737} {"train_loss": -5.3644609451293945, "global_step": 30978, "epoch": 737} {"train_loss": -5.391646385192871, "global_step": 30979, "epoch": 737} {"train_loss": -5.4843645095825195, "global_step": 30980, "epoch": 737} {"train_loss": -5.37115478515625, "global_step": 30981, "epoch": 737} {"train_loss": -5.445834159851074, "global_step": 30982, "epoch": 737} {"train_loss": -5.4146728515625, "global_step": 30983, "epoch": 737} {"train_loss": -5.387221336364746, "global_step": 30984, "epoch": 737} {"train_loss": -5.374894142150879, "global_step": 30985, "epoch": 737} {"train_loss": -5.631648063659668, "global_step": 30986, "epoch": 737} {"train_loss": -5.379836559295654, "global_step": 30987, "epoch": 737} {"train_loss": -5.343865394592285, "global_step": 30988, "epoch": 737} {"train_loss": -5.499297618865967, "global_step": 30989, "epoch": 737} {"train_loss": -5.264815330505371, "global_step": 30990, "epoch": 737} {"train_loss": -5.5724592208862305, "global_step": 30991, "epoch": 737} {"train_loss": -5.360698223114014, "global_step": 30992, "epoch": 737} {"train_loss": -5.328001976013184, "global_step": 30993, "epoch": 737} {"train_loss": -5.4289679527282715, "global_step": 30994, "epoch": 737} {"train_loss": -5.451245330628895, "global_step": 30995, "epoch": 737, "val_loss": 63191.65625} {"train_loss": -5.431605339050293, "global_step": 30996, "epoch": 738} {"train_loss": -5.380939483642578, "global_step": 30997, "epoch": 738} {"train_loss": -5.611513614654541, "global_step": 30998, "epoch": 738} {"train_loss": -5.511232376098633, "global_step": 30999, "epoch": 738} {"train_loss": -5.470144271850586, "global_step": 31000, "epoch": 738} {"train_loss": -5.4128923416137695, "global_step": 31001, "epoch": 738} {"train_loss": -5.540752410888672, "global_step": 31002, "epoch": 738} {"train_loss": -5.4106011390686035, "global_step": 31003, "epoch": 738} {"train_loss": -5.4607439041137695, "global_step": 31004, "epoch": 738} {"train_loss": -5.548163414001465, "global_step": 31005, "epoch": 738} {"train_loss": -5.414699554443359, "global_step": 31006, "epoch": 738} {"train_loss": -5.466145038604736, "global_step": 31007, "epoch": 738} {"train_loss": -5.456625938415527, "global_step": 31008, "epoch": 738} {"train_loss": -5.363608360290527, "global_step": 31009, "epoch": 738} {"train_loss": -5.245304584503174, "global_step": 31010, "epoch": 738} {"train_loss": -5.555437088012695, "global_step": 31011, "epoch": 738} {"train_loss": -5.351016044616699, "global_step": 31012, "epoch": 738} {"train_loss": -5.4707112312316895, "global_step": 31013, "epoch": 738} {"train_loss": -5.48898983001709, "global_step": 31014, "epoch": 738} {"train_loss": -5.47536563873291, "global_step": 31015, "epoch": 738} {"train_loss": -5.574728012084961, "global_step": 31016, "epoch": 738} {"train_loss": -5.570378303527832, "global_step": 31017, "epoch": 738} {"train_loss": -5.490281105041504, "global_step": 31018, "epoch": 738} {"train_loss": -5.493473052978516, "global_step": 31019, "epoch": 738} {"train_loss": -5.474352836608887, "global_step": 31020, "epoch": 738} {"train_loss": -5.464300632476807, "global_step": 31021, "epoch": 738} {"train_loss": -5.505913734436035, "global_step": 31022, "epoch": 738} {"train_loss": -5.469321250915527, "global_step": 31023, "epoch": 738} {"train_loss": -5.544116020202637, "global_step": 31024, "epoch": 738} {"train_loss": -5.433233261108398, "global_step": 31025, "epoch": 738} {"train_loss": -5.536561012268066, "global_step": 31026, "epoch": 738} {"train_loss": -5.542111396789551, "global_step": 31027, "epoch": 738} {"train_loss": -5.389708995819092, "global_step": 31028, "epoch": 738} {"train_loss": -5.6325554847717285, "global_step": 31029, "epoch": 738} {"train_loss": -5.398015022277832, "global_step": 31030, "epoch": 738} {"train_loss": -5.551984786987305, "global_step": 31031, "epoch": 738} {"train_loss": -5.468877792358398, "global_step": 31032, "epoch": 738} {"train_loss": -5.49111270904541, "global_step": 31033, "epoch": 738} {"train_loss": -5.5376458168029785, "global_step": 31034, "epoch": 738} {"train_loss": -5.496641635894775, "global_step": 31035, "epoch": 738} {"train_loss": -5.529831886291504, "global_step": 31036, "epoch": 738} {"train_loss": -5.4763228098551435, "global_step": 31037, "epoch": 738, "val_loss": 62809.7578125} {"train_loss": -5.5398454666137695, "global_step": 31038, "epoch": 739} {"train_loss": -5.570525646209717, "global_step": 31039, "epoch": 739} {"train_loss": -5.480066299438477, "global_step": 31040, "epoch": 739} {"train_loss": -5.518209934234619, "global_step": 31041, "epoch": 739} {"train_loss": -5.557008743286133, "global_step": 31042, "epoch": 739} {"train_loss": -5.468283176422119, "global_step": 31043, "epoch": 739} {"train_loss": -5.4341044425964355, "global_step": 31044, "epoch": 739} {"train_loss": -5.427942276000977, "global_step": 31045, "epoch": 739} {"train_loss": -5.493964195251465, "global_step": 31046, "epoch": 739} {"train_loss": -5.383574485778809, "global_step": 31047, "epoch": 739} {"train_loss": -5.469335556030273, "global_step": 31048, "epoch": 739} {"train_loss": -5.3917131423950195, "global_step": 31049, "epoch": 739} {"train_loss": -5.494219779968262, "global_step": 31050, "epoch": 739} {"train_loss": -5.422104835510254, "global_step": 31051, "epoch": 739} {"train_loss": -5.527647972106934, "global_step": 31052, "epoch": 739} {"train_loss": -5.562126159667969, "global_step": 31053, "epoch": 739} {"train_loss": -5.344522953033447, "global_step": 31054, "epoch": 739} {"train_loss": -5.487532615661621, "global_step": 31055, "epoch": 739} {"train_loss": -5.633731365203857, "global_step": 31056, "epoch": 739} {"train_loss": -5.453707218170166, "global_step": 31057, "epoch": 739} {"train_loss": -5.522499084472656, "global_step": 31058, "epoch": 739} {"train_loss": -5.553173065185547, "global_step": 31059, "epoch": 739} {"train_loss": -5.496744155883789, "global_step": 31060, "epoch": 739} {"train_loss": -5.533019065856934, "global_step": 31061, "epoch": 739} {"train_loss": -5.376835823059082, "global_step": 31062, "epoch": 739} {"train_loss": -5.342951774597168, "global_step": 31063, "epoch": 739} {"train_loss": -5.631256580352783, "global_step": 31064, "epoch": 739} {"train_loss": -5.548723220825195, "global_step": 31065, "epoch": 739} {"train_loss": -5.539165496826172, "global_step": 31066, "epoch": 739} {"train_loss": -5.482535362243652, "global_step": 31067, "epoch": 739} {"train_loss": -5.428079128265381, "global_step": 31068, "epoch": 739} {"train_loss": -5.474966049194336, "global_step": 31069, "epoch": 739} {"train_loss": -5.618839740753174, "global_step": 31070, "epoch": 739} {"train_loss": -5.39383602142334, "global_step": 31071, "epoch": 739} {"train_loss": -5.344761848449707, "global_step": 31072, "epoch": 739} {"train_loss": -5.368401527404785, "global_step": 31073, "epoch": 739} {"train_loss": -5.416826248168945, "global_step": 31074, "epoch": 739} {"train_loss": -5.564242839813232, "global_step": 31075, "epoch": 739} {"train_loss": -5.50880241394043, "global_step": 31076, "epoch": 739} {"train_loss": -5.4780073165893555, "global_step": 31077, "epoch": 739} {"train_loss": -5.460861682891846, "global_step": 31078, "epoch": 739} {"train_loss": -5.480687754494803, "global_step": 31079, "epoch": 739, "val_loss": 63203.609375} {"train_loss": -5.5624494552612305, "global_step": 31080, "epoch": 740} {"train_loss": -5.310907363891602, "global_step": 31081, "epoch": 740} {"train_loss": -5.5484466552734375, "global_step": 31082, "epoch": 740} {"train_loss": -5.359712600708008, "global_step": 31083, "epoch": 740} {"train_loss": -5.57496976852417, "global_step": 31084, "epoch": 740} {"train_loss": -5.386829376220703, "global_step": 31085, "epoch": 740} {"train_loss": -5.482181549072266, "global_step": 31086, "epoch": 740} {"train_loss": -5.422264099121094, "global_step": 31087, "epoch": 740} {"train_loss": -5.384415626525879, "global_step": 31088, "epoch": 740} {"train_loss": -5.546919822692871, "global_step": 31089, "epoch": 740} {"train_loss": -5.411284446716309, "global_step": 31090, "epoch": 740} {"train_loss": -5.527348518371582, "global_step": 31091, "epoch": 740} {"train_loss": -5.5460615158081055, "global_step": 31092, "epoch": 740} {"train_loss": -5.397554397583008, "global_step": 31093, "epoch": 740} {"train_loss": -5.523358345031738, "global_step": 31094, "epoch": 740} {"train_loss": -5.641940116882324, "global_step": 31095, "epoch": 740} {"train_loss": -5.443729877471924, "global_step": 31096, "epoch": 740} {"train_loss": -5.338939666748047, "global_step": 31097, "epoch": 740} {"train_loss": -5.35292911529541, "global_step": 31098, "epoch": 740} {"train_loss": -5.4485979080200195, "global_step": 31099, "epoch": 740} {"train_loss": -5.434051513671875, "global_step": 31100, "epoch": 740} {"train_loss": -5.392894744873047, "global_step": 31101, "epoch": 740} {"train_loss": -5.497231960296631, "global_step": 31102, "epoch": 740} {"train_loss": -5.450336456298828, "global_step": 31103, "epoch": 740} {"train_loss": -5.320050239562988, "global_step": 31104, "epoch": 740} {"train_loss": -5.477539539337158, "global_step": 31105, "epoch": 740} {"train_loss": -5.450534820556641, "global_step": 31106, "epoch": 740} {"train_loss": -5.4314961433410645, "global_step": 31107, "epoch": 740} {"train_loss": -5.554317474365234, "global_step": 31108, "epoch": 740} {"train_loss": -5.5537943840026855, "global_step": 31109, "epoch": 740} {"train_loss": -5.469498157501221, "global_step": 31110, "epoch": 740} {"train_loss": -5.493609428405762, "global_step": 31111, "epoch": 740} {"train_loss": -5.424602508544922, "global_step": 31112, "epoch": 740} {"train_loss": -5.441436767578125, "global_step": 31113, "epoch": 740} {"train_loss": -5.583846092224121, "global_step": 31114, "epoch": 740} {"train_loss": -5.490398406982422, "global_step": 31115, "epoch": 740} {"train_loss": -5.463238716125488, "global_step": 31116, "epoch": 740} {"train_loss": -5.398426532745361, "global_step": 31117, "epoch": 740} {"train_loss": -5.469162940979004, "global_step": 31118, "epoch": 740} {"train_loss": -5.441646575927734, "global_step": 31119, "epoch": 740} {"train_loss": -5.482999801635742, "global_step": 31120, "epoch": 740} {"train_loss": -5.4633631479172475, "global_step": 31121, "epoch": 740, "val_loss": 63155.0859375} {"train_loss": -5.513211250305176, "global_step": 31122, "epoch": 741} {"train_loss": -5.583916187286377, "global_step": 31123, "epoch": 741} {"train_loss": -5.491655349731445, "global_step": 31124, "epoch": 741} {"train_loss": -5.46464729309082, "global_step": 31125, "epoch": 741} {"train_loss": -5.496007919311523, "global_step": 31126, "epoch": 741} {"train_loss": -5.51346492767334, "global_step": 31127, "epoch": 741} {"train_loss": -5.4366044998168945, "global_step": 31128, "epoch": 741} {"train_loss": -5.508936882019043, "global_step": 31129, "epoch": 741} {"train_loss": -5.428427696228027, "global_step": 31130, "epoch": 741} {"train_loss": -5.414236068725586, "global_step": 31131, "epoch": 741} {"train_loss": -5.633941650390625, "global_step": 31132, "epoch": 741} {"train_loss": -5.373471260070801, "global_step": 31133, "epoch": 741} {"train_loss": -5.370993614196777, "global_step": 31134, "epoch": 741} {"train_loss": -5.495126247406006, "global_step": 31135, "epoch": 741} {"train_loss": -5.5166497230529785, "global_step": 31136, "epoch": 741} {"train_loss": -5.396766662597656, "global_step": 31137, "epoch": 741} {"train_loss": -5.3945136070251465, "global_step": 31138, "epoch": 741} {"train_loss": -5.467077255249023, "global_step": 31139, "epoch": 741} {"train_loss": -5.558541774749756, "global_step": 31140, "epoch": 741} {"train_loss": -5.651078224182129, "global_step": 31141, "epoch": 741} {"train_loss": -5.512892723083496, "global_step": 31142, "epoch": 741} {"train_loss": -5.492988109588623, "global_step": 31143, "epoch": 741} {"train_loss": -5.392848968505859, "global_step": 31144, "epoch": 741} {"train_loss": -5.451850414276123, "global_step": 31145, "epoch": 741} {"train_loss": -5.504752159118652, "global_step": 31146, "epoch": 741} {"train_loss": -5.488685607910156, "global_step": 31147, "epoch": 741} {"train_loss": -5.577925682067871, "global_step": 31148, "epoch": 741} {"train_loss": -5.704445838928223, "global_step": 31149, "epoch": 741} {"train_loss": -5.461832046508789, "global_step": 31150, "epoch": 741} {"train_loss": -5.501931190490723, "global_step": 31151, "epoch": 741} {"train_loss": -5.556552886962891, "global_step": 31152, "epoch": 741} {"train_loss": -5.43936824798584, "global_step": 31153, "epoch": 741} {"train_loss": -5.422203063964844, "global_step": 31154, "epoch": 741} {"train_loss": -5.3896331787109375, "global_step": 31155, "epoch": 741} {"train_loss": -5.646710395812988, "global_step": 31156, "epoch": 741} {"train_loss": -5.334619045257568, "global_step": 31157, "epoch": 741} {"train_loss": -5.5477519035339355, "global_step": 31158, "epoch": 741} {"train_loss": -5.448779106140137, "global_step": 31159, "epoch": 741} {"train_loss": -5.497320175170898, "global_step": 31160, "epoch": 741} {"train_loss": -5.550751686096191, "global_step": 31161, "epoch": 741} {"train_loss": -5.462218284606934, "global_step": 31162, "epoch": 741} {"train_loss": -5.490353516169956, "global_step": 31163, "epoch": 741, "val_loss": 63103.0390625} {"train_loss": -5.5276198387146, "global_step": 31164, "epoch": 742} {"train_loss": -5.562212944030762, "global_step": 31165, "epoch": 742} {"train_loss": -5.530178070068359, "global_step": 31166, "epoch": 742} {"train_loss": -5.447822093963623, "global_step": 31167, "epoch": 742} {"train_loss": -5.636143684387207, "global_step": 31168, "epoch": 742} {"train_loss": -5.44894552230835, "global_step": 31169, "epoch": 742} {"train_loss": -5.380368232727051, "global_step": 31170, "epoch": 742} {"train_loss": -5.474998474121094, "global_step": 31171, "epoch": 742} {"train_loss": -5.476646423339844, "global_step": 31172, "epoch": 742} {"train_loss": -5.491439342498779, "global_step": 31173, "epoch": 742} {"train_loss": -5.583714008331299, "global_step": 31174, "epoch": 742} {"train_loss": -5.498108863830566, "global_step": 31175, "epoch": 742} {"train_loss": -5.468966484069824, "global_step": 31176, "epoch": 742} {"train_loss": -5.502997398376465, "global_step": 31177, "epoch": 742} {"train_loss": -5.481128692626953, "global_step": 31178, "epoch": 742} {"train_loss": -5.429233074188232, "global_step": 31179, "epoch": 742} {"train_loss": -5.55126953125, "global_step": 31180, "epoch": 742} {"train_loss": -5.458613395690918, "global_step": 31181, "epoch": 742} {"train_loss": -5.501806259155273, "global_step": 31182, "epoch": 742} {"train_loss": -5.525440216064453, "global_step": 31183, "epoch": 742} {"train_loss": -5.4774651527404785, "global_step": 31184, "epoch": 742} {"train_loss": -5.43864631652832, "global_step": 31185, "epoch": 742} {"train_loss": -5.467146873474121, "global_step": 31186, "epoch": 742} {"train_loss": -5.528716087341309, "global_step": 31187, "epoch": 742} {"train_loss": -5.299468994140625, "global_step": 31188, "epoch": 742} {"train_loss": -5.396455764770508, "global_step": 31189, "epoch": 742} {"train_loss": -5.554666996002197, "global_step": 31190, "epoch": 742} {"train_loss": -5.303071975708008, "global_step": 31191, "epoch": 742} {"train_loss": -5.499905586242676, "global_step": 31192, "epoch": 742} {"train_loss": -5.542863845825195, "global_step": 31193, "epoch": 742} {"train_loss": -5.529878616333008, "global_step": 31194, "epoch": 742} {"train_loss": -5.4178619384765625, "global_step": 31195, "epoch": 742} {"train_loss": -5.500986099243164, "global_step": 31196, "epoch": 742} {"train_loss": -5.416566371917725, "global_step": 31197, "epoch": 742} {"train_loss": -5.440786838531494, "global_step": 31198, "epoch": 742} {"train_loss": -5.329753875732422, "global_step": 31199, "epoch": 742} {"train_loss": -5.550233840942383, "global_step": 31200, "epoch": 742} {"train_loss": -5.4946513175964355, "global_step": 31201, "epoch": 742} {"train_loss": -5.587635040283203, "global_step": 31202, "epoch": 742} {"train_loss": -5.5827741622924805, "global_step": 31203, "epoch": 742} {"train_loss": -5.58078145980835, "global_step": 31204, "epoch": 742} {"train_loss": -5.488214946928478, "global_step": 31205, "epoch": 742, "val_loss": 63205.74609375} {"train_loss": -5.495351791381836, "global_step": 31206, "epoch": 743} {"train_loss": -5.412895202636719, "global_step": 31207, "epoch": 743} {"train_loss": -5.4931559562683105, "global_step": 31208, "epoch": 743} {"train_loss": -5.404862403869629, "global_step": 31209, "epoch": 743} {"train_loss": -5.4630022048950195, "global_step": 31210, "epoch": 743} {"train_loss": -5.508459568023682, "global_step": 31211, "epoch": 743} {"train_loss": -5.5217437744140625, "global_step": 31212, "epoch": 743} {"train_loss": -5.4497761726379395, "global_step": 31213, "epoch": 743} {"train_loss": -5.493587970733643, "global_step": 31214, "epoch": 743} {"train_loss": -5.576203346252441, "global_step": 31215, "epoch": 743} {"train_loss": -5.432364463806152, "global_step": 31216, "epoch": 743} {"train_loss": -5.673644065856934, "global_step": 31217, "epoch": 743} {"train_loss": -5.6658735275268555, "global_step": 31218, "epoch": 743} {"train_loss": -5.564990520477295, "global_step": 31219, "epoch": 743} {"train_loss": -5.57305908203125, "global_step": 31220, "epoch": 743} {"train_loss": -5.493938446044922, "global_step": 31221, "epoch": 743} {"train_loss": -5.479544639587402, "global_step": 31222, "epoch": 743} {"train_loss": -5.442398548126221, "global_step": 31223, "epoch": 743} {"train_loss": -5.5268025398254395, "global_step": 31224, "epoch": 743} {"train_loss": -5.4188079833984375, "global_step": 31225, "epoch": 743} {"train_loss": -5.431324481964111, "global_step": 31226, "epoch": 743} {"train_loss": -5.614757061004639, "global_step": 31227, "epoch": 743} {"train_loss": -5.47872257232666, "global_step": 31228, "epoch": 743} {"train_loss": -5.570423126220703, "global_step": 31229, "epoch": 743} {"train_loss": -5.64603328704834, "global_step": 31230, "epoch": 743} {"train_loss": -5.478422164916992, "global_step": 31231, "epoch": 743} {"train_loss": -5.574613571166992, "global_step": 31232, "epoch": 743} {"train_loss": -5.384120941162109, "global_step": 31233, "epoch": 743} {"train_loss": -5.554841995239258, "global_step": 31234, "epoch": 743} {"train_loss": -5.611285209655762, "global_step": 31235, "epoch": 743} {"train_loss": -5.365537643432617, "global_step": 31236, "epoch": 743} {"train_loss": -5.550853729248047, "global_step": 31237, "epoch": 743} {"train_loss": -5.437228202819824, "global_step": 31238, "epoch": 743} {"train_loss": -5.5941667556762695, "global_step": 31239, "epoch": 743} {"train_loss": -5.453464031219482, "global_step": 31240, "epoch": 743} {"train_loss": -5.446348190307617, "global_step": 31241, "epoch": 743} {"train_loss": -5.413269996643066, "global_step": 31242, "epoch": 743} {"train_loss": -5.549973964691162, "global_step": 31243, "epoch": 743} {"train_loss": -5.545426368713379, "global_step": 31244, "epoch": 743} {"train_loss": -5.517498970031738, "global_step": 31245, "epoch": 743} {"train_loss": -5.554450988769531, "global_step": 31246, "epoch": 743} {"train_loss": -5.511964377902803, "global_step": 31247, "epoch": 743, "val_loss": 63111.4609375} {"train_loss": -5.428319931030273, "global_step": 31248, "epoch": 744} {"train_loss": -5.569362640380859, "global_step": 31249, "epoch": 744} {"train_loss": -5.622857093811035, "global_step": 31250, "epoch": 744} {"train_loss": -5.479288101196289, "global_step": 31251, "epoch": 744} {"train_loss": -5.453797340393066, "global_step": 31252, "epoch": 744} {"train_loss": -5.451970100402832, "global_step": 31253, "epoch": 744} {"train_loss": -5.543919563293457, "global_step": 31254, "epoch": 744} {"train_loss": -5.381758689880371, "global_step": 31255, "epoch": 744} {"train_loss": -5.480547904968262, "global_step": 31256, "epoch": 744} {"train_loss": -5.4841508865356445, "global_step": 31257, "epoch": 744} {"train_loss": -5.451355457305908, "global_step": 31258, "epoch": 744} {"train_loss": -5.631258964538574, "global_step": 31259, "epoch": 744} {"train_loss": -5.503699779510498, "global_step": 31260, "epoch": 744} {"train_loss": -5.558091163635254, "global_step": 31261, "epoch": 744} {"train_loss": -5.500532150268555, "global_step": 31262, "epoch": 744} {"train_loss": -5.44767427444458, "global_step": 31263, "epoch": 744} {"train_loss": -5.469612121582031, "global_step": 31264, "epoch": 744} {"train_loss": -5.458721160888672, "global_step": 31265, "epoch": 744} {"train_loss": -5.545320510864258, "global_step": 31266, "epoch": 744} {"train_loss": -5.524442672729492, "global_step": 31267, "epoch": 744} {"train_loss": -5.496661186218262, "global_step": 31268, "epoch": 744} {"train_loss": -5.652753829956055, "global_step": 31269, "epoch": 744} {"train_loss": -5.517096519470215, "global_step": 31270, "epoch": 744} {"train_loss": -5.467774391174316, "global_step": 31271, "epoch": 744} {"train_loss": -5.540865421295166, "global_step": 31272, "epoch": 744} {"train_loss": -5.585459232330322, "global_step": 31273, "epoch": 744} {"train_loss": -5.420722961425781, "global_step": 31274, "epoch": 744} {"train_loss": -5.450445175170898, "global_step": 31275, "epoch": 744} {"train_loss": -5.457322120666504, "global_step": 31276, "epoch": 744} {"train_loss": -5.516979217529297, "global_step": 31277, "epoch": 744} {"train_loss": -5.510756015777588, "global_step": 31278, "epoch": 744} {"train_loss": -5.532225608825684, "global_step": 31279, "epoch": 744} {"train_loss": -5.420177459716797, "global_step": 31280, "epoch": 744} {"train_loss": -5.480246543884277, "global_step": 31281, "epoch": 744} {"train_loss": -5.377554893493652, "global_step": 31282, "epoch": 744} {"train_loss": -5.447053909301758, "global_step": 31283, "epoch": 744} {"train_loss": -5.464130401611328, "global_step": 31284, "epoch": 744} {"train_loss": -5.4587883949279785, "global_step": 31285, "epoch": 744} {"train_loss": -5.597214221954346, "global_step": 31286, "epoch": 744} {"train_loss": -5.47072696685791, "global_step": 31287, "epoch": 744} {"train_loss": -5.489996910095215, "global_step": 31288, "epoch": 744} {"train_loss": -5.493869327363514, "global_step": 31289, "epoch": 744, "val_loss": 63537.74609375} {"train_loss": -5.416593551635742, "global_step": 31290, "epoch": 745} {"train_loss": -5.4944610595703125, "global_step": 31291, "epoch": 745} {"train_loss": -5.501655578613281, "global_step": 31292, "epoch": 745} {"train_loss": -5.47660493850708, "global_step": 31293, "epoch": 745} {"train_loss": -5.493474960327148, "global_step": 31294, "epoch": 745} {"train_loss": -5.495547294616699, "global_step": 31295, "epoch": 745} {"train_loss": -5.5907745361328125, "global_step": 31296, "epoch": 745} {"train_loss": -5.413289546966553, "global_step": 31297, "epoch": 745} {"train_loss": -5.499820709228516, "global_step": 31298, "epoch": 745} {"train_loss": -5.446272850036621, "global_step": 31299, "epoch": 745} {"train_loss": -5.638367652893066, "global_step": 31300, "epoch": 745} {"train_loss": -5.559698104858398, "global_step": 31301, "epoch": 745} {"train_loss": -5.669002056121826, "global_step": 31302, "epoch": 745} {"train_loss": -5.551183700561523, "global_step": 31303, "epoch": 745} {"train_loss": -5.607520580291748, "global_step": 31304, "epoch": 745} {"train_loss": -5.395481109619141, "global_step": 31305, "epoch": 745} {"train_loss": -5.357290267944336, "global_step": 31306, "epoch": 745} {"train_loss": -5.429430961608887, "global_step": 31307, "epoch": 745} {"train_loss": -5.562699317932129, "global_step": 31308, "epoch": 745} {"train_loss": -5.493749618530273, "global_step": 31309, "epoch": 745} {"train_loss": -5.561223030090332, "global_step": 31310, "epoch": 745} {"train_loss": -5.436546325683594, "global_step": 31311, "epoch": 745} {"train_loss": -5.5075225830078125, "global_step": 31312, "epoch": 745} {"train_loss": -5.417903423309326, "global_step": 31313, "epoch": 745} {"train_loss": -5.58931827545166, "global_step": 31314, "epoch": 745} {"train_loss": -5.419842720031738, "global_step": 31315, "epoch": 745} {"train_loss": -5.510335922241211, "global_step": 31316, "epoch": 745} {"train_loss": -5.440271377563477, "global_step": 31317, "epoch": 745} {"train_loss": -5.5501203536987305, "global_step": 31318, "epoch": 745} {"train_loss": -5.415128707885742, "global_step": 31319, "epoch": 745} {"train_loss": -5.466927528381348, "global_step": 31320, "epoch": 745} {"train_loss": -5.536441802978516, "global_step": 31321, "epoch": 745} {"train_loss": -5.456376075744629, "global_step": 31322, "epoch": 745} {"train_loss": -5.356015205383301, "global_step": 31323, "epoch": 745} {"train_loss": -5.490562438964844, "global_step": 31324, "epoch": 745} {"train_loss": -5.479979991912842, "global_step": 31325, "epoch": 745} {"train_loss": -5.422722339630127, "global_step": 31326, "epoch": 745} {"train_loss": -5.439993858337402, "global_step": 31327, "epoch": 745} {"train_loss": -5.579949378967285, "global_step": 31328, "epoch": 745} {"train_loss": -5.517172813415527, "global_step": 31329, "epoch": 745} {"train_loss": -5.531282901763916, "global_step": 31330, "epoch": 745} {"train_loss": -5.492213408152263, "global_step": 31331, "epoch": 745, "val_loss": 63167.2421875} {"train_loss": -5.490029335021973, "global_step": 31332, "epoch": 746} {"train_loss": -5.3977556228637695, "global_step": 31333, "epoch": 746} {"train_loss": -5.4254655838012695, "global_step": 31334, "epoch": 746} {"train_loss": -5.4696197509765625, "global_step": 31335, "epoch": 746} {"train_loss": -5.551607131958008, "global_step": 31336, "epoch": 746} {"train_loss": -5.468601226806641, "global_step": 31337, "epoch": 746} {"train_loss": -5.445156097412109, "global_step": 31338, "epoch": 746} {"train_loss": -5.562246322631836, "global_step": 31339, "epoch": 746} {"train_loss": -5.418878555297852, "global_step": 31340, "epoch": 746} {"train_loss": -5.493846893310547, "global_step": 31341, "epoch": 746} {"train_loss": -5.373297691345215, "global_step": 31342, "epoch": 746} {"train_loss": -5.401607036590576, "global_step": 31343, "epoch": 746} {"train_loss": -5.4834136962890625, "global_step": 31344, "epoch": 746} {"train_loss": -5.377877712249756, "global_step": 31345, "epoch": 746} {"train_loss": -5.375680446624756, "global_step": 31346, "epoch": 746} {"train_loss": -5.557806968688965, "global_step": 31347, "epoch": 746} {"train_loss": -5.607743263244629, "global_step": 31348, "epoch": 746} {"train_loss": -5.452394485473633, "global_step": 31349, "epoch": 746} {"train_loss": -5.535994052886963, "global_step": 31350, "epoch": 746} {"train_loss": -5.464078903198242, "global_step": 31351, "epoch": 746} {"train_loss": -5.46024227142334, "global_step": 31352, "epoch": 746} {"train_loss": -5.374190807342529, "global_step": 31353, "epoch": 746} {"train_loss": -5.418222904205322, "global_step": 31354, "epoch": 746} {"train_loss": -5.412126064300537, "global_step": 31355, "epoch": 746} {"train_loss": -5.532215595245361, "global_step": 31356, "epoch": 746} {"train_loss": -5.503835201263428, "global_step": 31357, "epoch": 746} {"train_loss": -5.375387668609619, "global_step": 31358, "epoch": 746} {"train_loss": -5.449435234069824, "global_step": 31359, "epoch": 746} {"train_loss": -5.412877559661865, "global_step": 31360, "epoch": 746} {"train_loss": -5.478035926818848, "global_step": 31361, "epoch": 746} {"train_loss": -5.453861713409424, "global_step": 31362, "epoch": 746} {"train_loss": -5.5523786544799805, "global_step": 31363, "epoch": 746} {"train_loss": -5.444531440734863, "global_step": 31364, "epoch": 746} {"train_loss": -5.34185791015625, "global_step": 31365, "epoch": 746} {"train_loss": -5.445735454559326, "global_step": 31366, "epoch": 746} {"train_loss": -5.511288642883301, "global_step": 31367, "epoch": 746} {"train_loss": -5.48812198638916, "global_step": 31368, "epoch": 746} {"train_loss": -5.512096405029297, "global_step": 31369, "epoch": 746} {"train_loss": -5.549880504608154, "global_step": 31370, "epoch": 746} {"train_loss": -5.437353610992432, "global_step": 31371, "epoch": 746} {"train_loss": -5.513802528381348, "global_step": 31372, "epoch": 746} {"train_loss": -5.464924596604847, "global_step": 31373, "epoch": 746, "val_loss": 63203.19921875} {"train_loss": -5.4721221923828125, "global_step": 31374, "epoch": 747} {"train_loss": -5.649281978607178, "global_step": 31375, "epoch": 747} {"train_loss": -5.565135955810547, "global_step": 31376, "epoch": 747} {"train_loss": -5.594240188598633, "global_step": 31377, "epoch": 747} {"train_loss": -5.539969444274902, "global_step": 31378, "epoch": 747} {"train_loss": -5.46782112121582, "global_step": 31379, "epoch": 747} {"train_loss": -5.451289653778076, "global_step": 31380, "epoch": 747} {"train_loss": -5.517444610595703, "global_step": 31381, "epoch": 747} {"train_loss": -5.521681785583496, "global_step": 31382, "epoch": 747} {"train_loss": -5.549770355224609, "global_step": 31383, "epoch": 747} {"train_loss": -5.461615562438965, "global_step": 31384, "epoch": 747} {"train_loss": -5.547371864318848, "global_step": 31385, "epoch": 747} {"train_loss": -5.535682201385498, "global_step": 31386, "epoch": 747} {"train_loss": -5.630996227264404, "global_step": 31387, "epoch": 747} {"train_loss": -5.492153167724609, "global_step": 31388, "epoch": 747} {"train_loss": -5.47984504699707, "global_step": 31389, "epoch": 747} {"train_loss": -5.548061847686768, "global_step": 31390, "epoch": 747} {"train_loss": -5.470104217529297, "global_step": 31391, "epoch": 747} {"train_loss": -5.59104585647583, "global_step": 31392, "epoch": 747} {"train_loss": -5.531851291656494, "global_step": 31393, "epoch": 747} {"train_loss": -5.443197727203369, "global_step": 31394, "epoch": 747} {"train_loss": -5.531195640563965, "global_step": 31395, "epoch": 747} {"train_loss": -5.644992351531982, "global_step": 31396, "epoch": 747} {"train_loss": -5.748350143432617, "global_step": 31397, "epoch": 747} {"train_loss": -5.651092529296875, "global_step": 31398, "epoch": 747} {"train_loss": -5.460240364074707, "global_step": 31399, "epoch": 747} {"train_loss": -5.362508773803711, "global_step": 31400, "epoch": 747} {"train_loss": -5.574591636657715, "global_step": 31401, "epoch": 747} {"train_loss": -5.500117301940918, "global_step": 31402, "epoch": 747} {"train_loss": -5.465304374694824, "global_step": 31403, "epoch": 747} {"train_loss": -5.398314476013184, "global_step": 31404, "epoch": 747} {"train_loss": -5.461348533630371, "global_step": 31405, "epoch": 747} {"train_loss": -5.659354209899902, "global_step": 31406, "epoch": 747} {"train_loss": -5.454278945922852, "global_step": 31407, "epoch": 747} {"train_loss": -5.293667793273926, "global_step": 31408, "epoch": 747} {"train_loss": -5.543490886688232, "global_step": 31409, "epoch": 747} {"train_loss": -5.568394660949707, "global_step": 31410, "epoch": 747} {"train_loss": -5.518182754516602, "global_step": 31411, "epoch": 747} {"train_loss": -5.4450883865356445, "global_step": 31412, "epoch": 747} {"train_loss": -5.390023231506348, "global_step": 31413, "epoch": 747} {"train_loss": -5.410650253295898, "global_step": 31414, "epoch": 747} {"train_loss": -5.513746148064023, "global_step": 31415, "epoch": 747, "val_loss": 63236.48046875} {"train_loss": -5.438146591186523, "global_step": 31416, "epoch": 748} {"train_loss": -5.368243217468262, "global_step": 31417, "epoch": 748} {"train_loss": -5.503875732421875, "global_step": 31418, "epoch": 748} {"train_loss": -5.447023391723633, "global_step": 31419, "epoch": 748} {"train_loss": -5.497360706329346, "global_step": 31420, "epoch": 748} {"train_loss": -5.561281681060791, "global_step": 31421, "epoch": 748} {"train_loss": -5.400393962860107, "global_step": 31422, "epoch": 748} {"train_loss": -5.400824546813965, "global_step": 31423, "epoch": 748} {"train_loss": -5.500282287597656, "global_step": 31424, "epoch": 748} {"train_loss": -5.589648246765137, "global_step": 31425, "epoch": 748} {"train_loss": -5.381870269775391, "global_step": 31426, "epoch": 748} {"train_loss": -5.416874408721924, "global_step": 31427, "epoch": 748} {"train_loss": -5.500100135803223, "global_step": 31428, "epoch": 748} {"train_loss": -5.446324825286865, "global_step": 31429, "epoch": 748} {"train_loss": -5.516049385070801, "global_step": 31430, "epoch": 748} {"train_loss": -5.576229095458984, "global_step": 31431, "epoch": 748} {"train_loss": -5.464909553527832, "global_step": 31432, "epoch": 748} {"train_loss": -5.499292373657227, "global_step": 31433, "epoch": 748} {"train_loss": -5.625820159912109, "global_step": 31434, "epoch": 748} {"train_loss": -5.441263675689697, "global_step": 31435, "epoch": 748} {"train_loss": -5.4013285636901855, "global_step": 31436, "epoch": 748} {"train_loss": -5.4876275062561035, "global_step": 31437, "epoch": 748} {"train_loss": -5.447509288787842, "global_step": 31438, "epoch": 748} {"train_loss": -5.562121391296387, "global_step": 31439, "epoch": 748} {"train_loss": -5.5050201416015625, "global_step": 31440, "epoch": 748} {"train_loss": -5.513740062713623, "global_step": 31441, "epoch": 748} {"train_loss": -5.313385009765625, "global_step": 31442, "epoch": 748} {"train_loss": -5.5662641525268555, "global_step": 31443, "epoch": 748} {"train_loss": -5.500387191772461, "global_step": 31444, "epoch": 748} {"train_loss": -5.491122245788574, "global_step": 31445, "epoch": 748} {"train_loss": -5.485516548156738, "global_step": 31446, "epoch": 748} {"train_loss": -5.517833709716797, "global_step": 31447, "epoch": 748} {"train_loss": -5.4918622970581055, "global_step": 31448, "epoch": 748} {"train_loss": -5.359379291534424, "global_step": 31449, "epoch": 748} {"train_loss": -5.558899879455566, "global_step": 31450, "epoch": 748} {"train_loss": -5.537160396575928, "global_step": 31451, "epoch": 748} {"train_loss": -5.505589962005615, "global_step": 31452, "epoch": 748} {"train_loss": -5.433047294616699, "global_step": 31453, "epoch": 748} {"train_loss": -5.446139335632324, "global_step": 31454, "epoch": 748} {"train_loss": -5.571677207946777, "global_step": 31455, "epoch": 748} {"train_loss": -5.5494561195373535, "global_step": 31456, "epoch": 748} {"train_loss": -5.483567726044428, "global_step": 31457, "epoch": 748, "val_loss": 62918.3203125} {"train_loss": -5.5928192138671875, "global_step": 31458, "epoch": 749} {"train_loss": -5.388323783874512, "global_step": 31459, "epoch": 749} {"train_loss": -5.427107334136963, "global_step": 31460, "epoch": 749} {"train_loss": -5.495186805725098, "global_step": 31461, "epoch": 749} {"train_loss": -5.4475789070129395, "global_step": 31462, "epoch": 749} {"train_loss": -5.491013526916504, "global_step": 31463, "epoch": 749} {"train_loss": -5.377724647521973, "global_step": 31464, "epoch": 749} {"train_loss": -5.526810646057129, "global_step": 31465, "epoch": 749} {"train_loss": -5.444344997406006, "global_step": 31466, "epoch": 749} {"train_loss": -5.554378032684326, "global_step": 31467, "epoch": 749} {"train_loss": -5.599825859069824, "global_step": 31468, "epoch": 749} {"train_loss": -5.510977268218994, "global_step": 31469, "epoch": 749} {"train_loss": -5.559626579284668, "global_step": 31470, "epoch": 749} {"train_loss": -5.460940361022949, "global_step": 31471, "epoch": 749} {"train_loss": -5.544704914093018, "global_step": 31472, "epoch": 749} {"train_loss": -5.595942497253418, "global_step": 31473, "epoch": 749} {"train_loss": -5.44856071472168, "global_step": 31474, "epoch": 749} {"train_loss": -5.567607879638672, "global_step": 31475, "epoch": 749} {"train_loss": -5.5326385498046875, "global_step": 31476, "epoch": 749} {"train_loss": -5.4959516525268555, "global_step": 31477, "epoch": 749} {"train_loss": -5.491004943847656, "global_step": 31478, "epoch": 749} {"train_loss": -5.538380146026611, "global_step": 31479, "epoch": 749} {"train_loss": -5.529533386230469, "global_step": 31480, "epoch": 749} {"train_loss": -5.428257942199707, "global_step": 31481, "epoch": 749} {"train_loss": -5.622253894805908, "global_step": 31482, "epoch": 749} {"train_loss": -5.451951503753662, "global_step": 31483, "epoch": 749} {"train_loss": -5.421972274780273, "global_step": 31484, "epoch": 749} {"train_loss": -5.636327266693115, "global_step": 31485, "epoch": 749} {"train_loss": -5.531716346740723, "global_step": 31486, "epoch": 749} {"train_loss": -5.471889495849609, "global_step": 31487, "epoch": 749} {"train_loss": -5.473484039306641, "global_step": 31488, "epoch": 749} {"train_loss": -5.495016098022461, "global_step": 31489, "epoch": 749} {"train_loss": -5.541924476623535, "global_step": 31490, "epoch": 749} {"train_loss": -5.5034565925598145, "global_step": 31491, "epoch": 749} {"train_loss": -5.451328754425049, "global_step": 31492, "epoch": 749} {"train_loss": -5.483464241027832, "global_step": 31493, "epoch": 749} {"train_loss": -5.522263526916504, "global_step": 31494, "epoch": 749} {"train_loss": -5.440920829772949, "global_step": 31495, "epoch": 749} {"train_loss": -5.473585605621338, "global_step": 31496, "epoch": 749} {"train_loss": -5.585532188415527, "global_step": 31497, "epoch": 749} {"train_loss": -5.493478775024414, "global_step": 31498, "epoch": 749} {"train_loss": -5.503390607379732, "global_step": 31499, "epoch": 749, "val_loss": 63117.2109375} {"train_loss": -5.454595565795898, "global_step": 31500, "epoch": 750} {"train_loss": -5.525235176086426, "global_step": 31501, "epoch": 750} {"train_loss": -5.681081295013428, "global_step": 31502, "epoch": 750} {"train_loss": -5.5480475425720215, "global_step": 31503, "epoch": 750} {"train_loss": -5.535495281219482, "global_step": 31504, "epoch": 750} {"train_loss": -5.49812126159668, "global_step": 31505, "epoch": 750} {"train_loss": -5.6648335456848145, "global_step": 31506, "epoch": 750} {"train_loss": -5.471807479858398, "global_step": 31507, "epoch": 750} {"train_loss": -5.510760307312012, "global_step": 31508, "epoch": 750} {"train_loss": -5.52314567565918, "global_step": 31509, "epoch": 750} {"train_loss": -5.530390739440918, "global_step": 31510, "epoch": 750} {"train_loss": -5.449109077453613, "global_step": 31511, "epoch": 750} {"train_loss": -5.533063888549805, "global_step": 31512, "epoch": 750} {"train_loss": -5.312432289123535, "global_step": 31513, "epoch": 750} {"train_loss": -5.56163215637207, "global_step": 31514, "epoch": 750} {"train_loss": -5.637345314025879, "global_step": 31515, "epoch": 750} {"train_loss": -5.424768924713135, "global_step": 31516, "epoch": 750} {"train_loss": -5.470824718475342, "global_step": 31517, "epoch": 750} {"train_loss": -5.561062335968018, "global_step": 31518, "epoch": 750} {"train_loss": -5.393068313598633, "global_step": 31519, "epoch": 750} {"train_loss": -5.543117523193359, "global_step": 31520, "epoch": 750} {"train_loss": -5.430330753326416, "global_step": 31521, "epoch": 750} {"train_loss": -5.440254211425781, "global_step": 31522, "epoch": 750} {"train_loss": -5.533366680145264, "global_step": 31523, "epoch": 750} {"train_loss": -5.366024017333984, "global_step": 31524, "epoch": 750} {"train_loss": -5.552285194396973, "global_step": 31525, "epoch": 750} {"train_loss": -5.587608814239502, "global_step": 31526, "epoch": 750} {"train_loss": -5.464931964874268, "global_step": 31527, "epoch": 750} {"train_loss": -5.469300746917725, "global_step": 31528, "epoch": 750} {"train_loss": -5.496491432189941, "global_step": 31529, "epoch": 750} {"train_loss": -5.3564958572387695, "global_step": 31530, "epoch": 750} {"train_loss": -5.366528034210205, "global_step": 31531, "epoch": 750} {"train_loss": -5.354953289031982, "global_step": 31532, "epoch": 750} {"train_loss": -5.434819221496582, "global_step": 31533, "epoch": 750} {"train_loss": -5.479081153869629, "global_step": 31534, "epoch": 750} {"train_loss": -5.371400833129883, "global_step": 31535, "epoch": 750} {"train_loss": -5.4951276779174805, "global_step": 31536, "epoch": 750} {"train_loss": -5.511224746704102, "global_step": 31537, "epoch": 750} {"train_loss": -5.468151569366455, "global_step": 31538, "epoch": 750} {"train_loss": -5.526921272277832, "global_step": 31539, "epoch": 750} {"train_loss": -5.301765441894531, "global_step": 31540, "epoch": 750} {"train_loss": -5.482643570218768, "global_step": 31541, "epoch": 750, "train/sim_max_reward_0": 0.8809573467898018, "train/sim_max_reward_1": 0.14863934342159105, "train/sim_max_reward_2": 0.5411916746483602, "train/sim_max_reward_3": 0.892167601669008, "train/sim_max_reward_4": 0.7935159150998655, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8160055404571143, "test/sim_max_reward_4300001": 0.24971282056142935, "test/sim_max_reward_4300002": 0.267820414540632, "test/sim_max_reward_4300003": 0.6751558468752268, "test/sim_max_reward_4300004": 0.8697734380512371, "test/sim_max_reward_4300005": 0.7592209471449161, "test/sim_max_reward_4300006": 0.055826380543584124, "test/sim_max_reward_4300007": 0.5884362107237022, "test/sim_max_reward_4300008": 0.7272277693993555, "test/sim_max_reward_4300009": 0.9934153448495056, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.2829632760526362, "test/sim_max_reward_4300012": 0.5904210052389676, "test/sim_max_reward_4300013": 0.803343353636351, "test/sim_max_reward_4300014": 0.6152281935491363, "test/sim_max_reward_4300015": 0.2458551979564409, "test/sim_max_reward_4300016": 0.5906477675227892, "test/sim_max_reward_4300017": 0.44941210562292766, "test/sim_max_reward_4300018": 0.5350869041994226, "test/sim_max_reward_4300019": 0.1857141960684877, "test/sim_max_reward_4300020": 0.05389271990249906, "test/sim_max_reward_4300021": 0.28965873612481835, "test/sim_max_reward_4300022": 0.1742072945878765, "test/sim_max_reward_4300023": 0.20575297892733313, "test/sim_max_reward_4300024": 0.48432012049327106, "test/sim_max_reward_4300025": 0.34009477423889395, "test/sim_max_reward_4300026": 0.17802640095713912, "test/sim_max_reward_4300027": 0.28158186438129246, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.016860943807830632, "test/sim_max_reward_4300032": 0.6079917613763934, "test/sim_max_reward_4300033": 0.9758107173733679, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.20630684269213323, "test/sim_max_reward_4300037": 0.5744988257398995, "test/sim_max_reward_4300038": 0.4919486326751865, "test/sim_max_reward_4300039": 0.6295531394917484, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.6919721150542972, "test/sim_max_reward_4300043": 0.16797433890990868, "test/sim_max_reward_4300044": 0.3975957136627618, "test/sim_max_reward_4300045": 0.18597519411576105, "test/sim_max_reward_4300046": 0.3009065931910665, "test/sim_max_reward_4300047": 0.12783368899292635, "test/sim_max_reward_4300048": 0.31592437409773055, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.5749094401651357, "test/mean_score": 0.3599990896757599, "val_loss": 62922.4921875} {"train_loss": -5.595640659332275, "global_step": 31542, "epoch": 751} {"train_loss": -5.496779441833496, "global_step": 31543, "epoch": 751} {"train_loss": -5.426609992980957, "global_step": 31544, "epoch": 751} {"train_loss": -5.540379524230957, "global_step": 31545, "epoch": 751} {"train_loss": -5.49597692489624, "global_step": 31546, "epoch": 751} {"train_loss": -5.381191253662109, "global_step": 31547, "epoch": 751} {"train_loss": -5.597336769104004, "global_step": 31548, "epoch": 751} {"train_loss": -5.517192840576172, "global_step": 31549, "epoch": 751} {"train_loss": -5.407131195068359, "global_step": 31550, "epoch": 751} {"train_loss": -5.464910507202148, "global_step": 31551, "epoch": 751} {"train_loss": -5.513336181640625, "global_step": 31552, "epoch": 751} {"train_loss": -5.473697662353516, "global_step": 31553, "epoch": 751} {"train_loss": -5.542376518249512, "global_step": 31554, "epoch": 751} {"train_loss": -5.535201549530029, "global_step": 31555, "epoch": 751} {"train_loss": -5.450566291809082, "global_step": 31556, "epoch": 751} {"train_loss": -5.577340126037598, "global_step": 31557, "epoch": 751} {"train_loss": -5.459861755371094, "global_step": 31558, "epoch": 751} {"train_loss": -5.288601875305176, "global_step": 31559, "epoch": 751} {"train_loss": -5.588662624359131, "global_step": 31560, "epoch": 751} {"train_loss": -5.529333591461182, "global_step": 31561, "epoch": 751} {"train_loss": -5.523460388183594, "global_step": 31562, "epoch": 751} {"train_loss": -5.571916103363037, "global_step": 31563, "epoch": 751} {"train_loss": -5.555852890014648, "global_step": 31564, "epoch": 751} {"train_loss": -5.471012115478516, "global_step": 31565, "epoch": 751} {"train_loss": -5.523615837097168, "global_step": 31566, "epoch": 751} {"train_loss": -5.427772521972656, "global_step": 31567, "epoch": 751} {"train_loss": -5.442922115325928, "global_step": 31568, "epoch": 751} {"train_loss": -5.425516128540039, "global_step": 31569, "epoch": 751} {"train_loss": -5.462027072906494, "global_step": 31570, "epoch": 751} {"train_loss": -5.4112677574157715, "global_step": 31571, "epoch": 751} {"train_loss": -5.566436767578125, "global_step": 31572, "epoch": 751} {"train_loss": -5.380794525146484, "global_step": 31573, "epoch": 751} {"train_loss": -5.558249473571777, "global_step": 31574, "epoch": 751} {"train_loss": -5.47322940826416, "global_step": 31575, "epoch": 751} {"train_loss": -5.47089147567749, "global_step": 31576, "epoch": 751} {"train_loss": -5.427421569824219, "global_step": 31577, "epoch": 751} {"train_loss": -5.599921226501465, "global_step": 31578, "epoch": 751} {"train_loss": -5.484986305236816, "global_step": 31579, "epoch": 751} {"train_loss": -5.518367767333984, "global_step": 31580, "epoch": 751} {"train_loss": -5.4232988357543945, "global_step": 31581, "epoch": 751} {"train_loss": -5.449593544006348, "global_step": 31582, "epoch": 751} {"train_loss": -5.48718904313587, "global_step": 31583, "epoch": 751, "val_loss": 63057.33203125} {"train_loss": -5.423462867736816, "global_step": 31584, "epoch": 752} {"train_loss": -5.594599723815918, "global_step": 31585, "epoch": 752} {"train_loss": -5.515931606292725, "global_step": 31586, "epoch": 752} {"train_loss": -5.4763336181640625, "global_step": 31587, "epoch": 752} {"train_loss": -5.510566711425781, "global_step": 31588, "epoch": 752} {"train_loss": -5.580566883087158, "global_step": 31589, "epoch": 752} {"train_loss": -5.423730850219727, "global_step": 31590, "epoch": 752} {"train_loss": -5.519299030303955, "global_step": 31591, "epoch": 752} {"train_loss": -5.52556848526001, "global_step": 31592, "epoch": 752} {"train_loss": -5.5450639724731445, "global_step": 31593, "epoch": 752} {"train_loss": -5.526663303375244, "global_step": 31594, "epoch": 752} {"train_loss": -5.490077018737793, "global_step": 31595, "epoch": 752} {"train_loss": -5.546703338623047, "global_step": 31596, "epoch": 752} {"train_loss": -5.471282958984375, "global_step": 31597, "epoch": 752} {"train_loss": -5.4458818435668945, "global_step": 31598, "epoch": 752} {"train_loss": -5.532258033752441, "global_step": 31599, "epoch": 752} {"train_loss": -5.5192742347717285, "global_step": 31600, "epoch": 752} {"train_loss": -5.503988742828369, "global_step": 31601, "epoch": 752} {"train_loss": -5.563654899597168, "global_step": 31602, "epoch": 752} {"train_loss": -5.457314968109131, "global_step": 31603, "epoch": 752} {"train_loss": -5.498910903930664, "global_step": 31604, "epoch": 752} {"train_loss": -5.502861976623535, "global_step": 31605, "epoch": 752} {"train_loss": -5.595266819000244, "global_step": 31606, "epoch": 752} {"train_loss": -5.452653884887695, "global_step": 31607, "epoch": 752} {"train_loss": -5.484630584716797, "global_step": 31608, "epoch": 752} {"train_loss": -5.556499481201172, "global_step": 31609, "epoch": 752} {"train_loss": -5.468526363372803, "global_step": 31610, "epoch": 752} {"train_loss": -5.506819725036621, "global_step": 31611, "epoch": 752} {"train_loss": -5.408662796020508, "global_step": 31612, "epoch": 752} {"train_loss": -5.614830017089844, "global_step": 31613, "epoch": 752} {"train_loss": -5.478394031524658, "global_step": 31614, "epoch": 752} {"train_loss": -5.506441116333008, "global_step": 31615, "epoch": 752} {"train_loss": -5.415009498596191, "global_step": 31616, "epoch": 752} {"train_loss": -5.450168609619141, "global_step": 31617, "epoch": 752} {"train_loss": -5.674671649932861, "global_step": 31618, "epoch": 752} {"train_loss": -5.408697128295898, "global_step": 31619, "epoch": 752} {"train_loss": -5.449749946594238, "global_step": 31620, "epoch": 752} {"train_loss": -5.38027811050415, "global_step": 31621, "epoch": 752} {"train_loss": -5.444597244262695, "global_step": 31622, "epoch": 752} {"train_loss": -5.489987373352051, "global_step": 31623, "epoch": 752} {"train_loss": -5.543927192687988, "global_step": 31624, "epoch": 752} {"train_loss": -5.500240927650815, "global_step": 31625, "epoch": 752, "val_loss": 63038.51953125} {"train_loss": -5.538207530975342, "global_step": 31626, "epoch": 753} {"train_loss": -5.5841264724731445, "global_step": 31627, "epoch": 753} {"train_loss": -5.585205554962158, "global_step": 31628, "epoch": 753} {"train_loss": -5.575783729553223, "global_step": 31629, "epoch": 753} {"train_loss": -5.532613277435303, "global_step": 31630, "epoch": 753} {"train_loss": -5.612337112426758, "global_step": 31631, "epoch": 753} {"train_loss": -5.476522445678711, "global_step": 31632, "epoch": 753} {"train_loss": -5.4604997634887695, "global_step": 31633, "epoch": 753} {"train_loss": -5.5139875411987305, "global_step": 31634, "epoch": 753} {"train_loss": -5.405948638916016, "global_step": 31635, "epoch": 753} {"train_loss": -5.365838050842285, "global_step": 31636, "epoch": 753} {"train_loss": -5.549038410186768, "global_step": 31637, "epoch": 753} {"train_loss": -5.52195930480957, "global_step": 31638, "epoch": 753} {"train_loss": -5.483336925506592, "global_step": 31639, "epoch": 753} {"train_loss": -5.291529178619385, "global_step": 31640, "epoch": 753} {"train_loss": -5.559443473815918, "global_step": 31641, "epoch": 753} {"train_loss": -5.401510238647461, "global_step": 31642, "epoch": 753} {"train_loss": -5.560094833374023, "global_step": 31643, "epoch": 753} {"train_loss": -5.551204681396484, "global_step": 31644, "epoch": 753} {"train_loss": -5.477879047393799, "global_step": 31645, "epoch": 753} {"train_loss": -5.684889793395996, "global_step": 31646, "epoch": 753} {"train_loss": -5.494146347045898, "global_step": 31647, "epoch": 753} {"train_loss": -5.636726379394531, "global_step": 31648, "epoch": 753} {"train_loss": -5.396303653717041, "global_step": 31649, "epoch": 753} {"train_loss": -5.602365970611572, "global_step": 31650, "epoch": 753} {"train_loss": -5.430156707763672, "global_step": 31651, "epoch": 753} {"train_loss": -5.350466251373291, "global_step": 31652, "epoch": 753} {"train_loss": -5.451756477355957, "global_step": 31653, "epoch": 753} {"train_loss": -5.548393249511719, "global_step": 31654, "epoch": 753} {"train_loss": -5.480253219604492, "global_step": 31655, "epoch": 753} {"train_loss": -5.590903282165527, "global_step": 31656, "epoch": 753} {"train_loss": -5.508960247039795, "global_step": 31657, "epoch": 753} {"train_loss": -5.451216697692871, "global_step": 31658, "epoch": 753} {"train_loss": -5.534640312194824, "global_step": 31659, "epoch": 753} {"train_loss": -5.643957138061523, "global_step": 31660, "epoch": 753} {"train_loss": -5.496831893920898, "global_step": 31661, "epoch": 753} {"train_loss": -5.493350028991699, "global_step": 31662, "epoch": 753} {"train_loss": -5.578578948974609, "global_step": 31663, "epoch": 753} {"train_loss": -5.577191352844238, "global_step": 31664, "epoch": 753} {"train_loss": -5.522464275360107, "global_step": 31665, "epoch": 753} {"train_loss": -5.406833648681641, "global_step": 31666, "epoch": 753} {"train_loss": -5.511345182146345, "global_step": 31667, "epoch": 753, "val_loss": 62910.9453125} {"train_loss": -5.568614482879639, "global_step": 31668, "epoch": 754} {"train_loss": -5.436154365539551, "global_step": 31669, "epoch": 754} {"train_loss": -5.431794166564941, "global_step": 31670, "epoch": 754} {"train_loss": -5.59033203125, "global_step": 31671, "epoch": 754} {"train_loss": -5.518958568572998, "global_step": 31672, "epoch": 754} {"train_loss": -5.496918201446533, "global_step": 31673, "epoch": 754} {"train_loss": -5.543123722076416, "global_step": 31674, "epoch": 754} {"train_loss": -5.318076133728027, "global_step": 31675, "epoch": 754} {"train_loss": -5.608248710632324, "global_step": 31676, "epoch": 754} {"train_loss": -5.542219161987305, "global_step": 31677, "epoch": 754} {"train_loss": -5.540137767791748, "global_step": 31678, "epoch": 754} {"train_loss": -5.550594329833984, "global_step": 31679, "epoch": 754} {"train_loss": -5.5123138427734375, "global_step": 31680, "epoch": 754} {"train_loss": -5.447870254516602, "global_step": 31681, "epoch": 754} {"train_loss": -5.503909111022949, "global_step": 31682, "epoch": 754} {"train_loss": -5.7043375968933105, "global_step": 31683, "epoch": 754} {"train_loss": -5.594372749328613, "global_step": 31684, "epoch": 754} {"train_loss": -5.59552001953125, "global_step": 31685, "epoch": 754} {"train_loss": -5.418543815612793, "global_step": 31686, "epoch": 754} {"train_loss": -5.360426902770996, "global_step": 31687, "epoch": 754} {"train_loss": -5.412708759307861, "global_step": 31688, "epoch": 754} {"train_loss": -5.40488338470459, "global_step": 31689, "epoch": 754} {"train_loss": -5.4769673347473145, "global_step": 31690, "epoch": 754} {"train_loss": -5.523688316345215, "global_step": 31691, "epoch": 754} {"train_loss": -5.313486099243164, "global_step": 31692, "epoch": 754} {"train_loss": -5.381200313568115, "global_step": 31693, "epoch": 754} {"train_loss": -5.550025939941406, "global_step": 31694, "epoch": 754} {"train_loss": -5.419099807739258, "global_step": 31695, "epoch": 754} {"train_loss": -5.492432594299316, "global_step": 31696, "epoch": 754} {"train_loss": -5.419785976409912, "global_step": 31697, "epoch": 754} {"train_loss": -5.4709625244140625, "global_step": 31698, "epoch": 754} {"train_loss": -5.463323593139648, "global_step": 31699, "epoch": 754} {"train_loss": -5.583363056182861, "global_step": 31700, "epoch": 754} {"train_loss": -5.590474605560303, "global_step": 31701, "epoch": 754} {"train_loss": -5.513565540313721, "global_step": 31702, "epoch": 754} {"train_loss": -5.454524040222168, "global_step": 31703, "epoch": 754} {"train_loss": -5.4789323806762695, "global_step": 31704, "epoch": 754} {"train_loss": -5.416496276855469, "global_step": 31705, "epoch": 754} {"train_loss": -5.566194534301758, "global_step": 31706, "epoch": 754} {"train_loss": -5.490419387817383, "global_step": 31707, "epoch": 754} {"train_loss": -5.748118877410889, "global_step": 31708, "epoch": 754} {"train_loss": -5.494435957499912, "global_step": 31709, "epoch": 754, "val_loss": 62740.04296875} {"train_loss": -5.682611465454102, "global_step": 31710, "epoch": 755} {"train_loss": -5.49343204498291, "global_step": 31711, "epoch": 755} {"train_loss": -5.386770248413086, "global_step": 31712, "epoch": 755} {"train_loss": -5.39604377746582, "global_step": 31713, "epoch": 755} {"train_loss": -5.505703926086426, "global_step": 31714, "epoch": 755} {"train_loss": -5.479621887207031, "global_step": 31715, "epoch": 755} {"train_loss": -5.567187309265137, "global_step": 31716, "epoch": 755} {"train_loss": -5.470446586608887, "global_step": 31717, "epoch": 755} {"train_loss": -5.587843894958496, "global_step": 31718, "epoch": 755} {"train_loss": -5.609350681304932, "global_step": 31719, "epoch": 755} {"train_loss": -5.6248860359191895, "global_step": 31720, "epoch": 755} {"train_loss": -5.4453301429748535, "global_step": 31721, "epoch": 755} {"train_loss": -5.548261642456055, "global_step": 31722, "epoch": 755} {"train_loss": -5.457409381866455, "global_step": 31723, "epoch": 755} {"train_loss": -5.489418983459473, "global_step": 31724, "epoch": 755} {"train_loss": -5.545119285583496, "global_step": 31725, "epoch": 755} {"train_loss": -5.623706817626953, "global_step": 31726, "epoch": 755} {"train_loss": -5.487438678741455, "global_step": 31727, "epoch": 755} {"train_loss": -5.438005447387695, "global_step": 31728, "epoch": 755} {"train_loss": -5.499053955078125, "global_step": 31729, "epoch": 755} {"train_loss": -5.334364414215088, "global_step": 31730, "epoch": 755} {"train_loss": -5.53377103805542, "global_step": 31731, "epoch": 755} {"train_loss": -5.496331214904785, "global_step": 31732, "epoch": 755} {"train_loss": -5.487043857574463, "global_step": 31733, "epoch": 755} {"train_loss": -5.60701322555542, "global_step": 31734, "epoch": 755} {"train_loss": -5.604197978973389, "global_step": 31735, "epoch": 755} {"train_loss": -5.443304061889648, "global_step": 31736, "epoch": 755} {"train_loss": -5.4577860832214355, "global_step": 31737, "epoch": 755} {"train_loss": -5.613170623779297, "global_step": 31738, "epoch": 755} {"train_loss": -5.494653701782227, "global_step": 31739, "epoch": 755} {"train_loss": -5.415996551513672, "global_step": 31740, "epoch": 755} {"train_loss": -5.596308708190918, "global_step": 31741, "epoch": 755} {"train_loss": -5.512800693511963, "global_step": 31742, "epoch": 755} {"train_loss": -5.400859832763672, "global_step": 31743, "epoch": 755} {"train_loss": -5.503233909606934, "global_step": 31744, "epoch": 755} {"train_loss": -5.438478469848633, "global_step": 31745, "epoch": 755} {"train_loss": -5.506058692932129, "global_step": 31746, "epoch": 755} {"train_loss": -5.4606709480285645, "global_step": 31747, "epoch": 755} {"train_loss": -5.420159816741943, "global_step": 31748, "epoch": 755} {"train_loss": -5.567182540893555, "global_step": 31749, "epoch": 755} {"train_loss": -5.481768608093262, "global_step": 31750, "epoch": 755} {"train_loss": -5.506340480986095, "global_step": 31751, "epoch": 755, "val_loss": 62898.984375} {"train_loss": -5.567194938659668, "global_step": 31752, "epoch": 756} {"train_loss": -5.5253987312316895, "global_step": 31753, "epoch": 756} {"train_loss": -5.643712043762207, "global_step": 31754, "epoch": 756} {"train_loss": -5.4814605712890625, "global_step": 31755, "epoch": 756} {"train_loss": -5.587902545928955, "global_step": 31756, "epoch": 756} {"train_loss": -5.623965263366699, "global_step": 31757, "epoch": 756} {"train_loss": -5.382266044616699, "global_step": 31758, "epoch": 756} {"train_loss": -5.508525371551514, "global_step": 31759, "epoch": 756} {"train_loss": -5.523989677429199, "global_step": 31760, "epoch": 756} {"train_loss": -5.46158504486084, "global_step": 31761, "epoch": 756} {"train_loss": -5.479172706604004, "global_step": 31762, "epoch": 756} {"train_loss": -5.243227958679199, "global_step": 31763, "epoch": 756} {"train_loss": -5.502419948577881, "global_step": 31764, "epoch": 756} {"train_loss": -5.510634422302246, "global_step": 31765, "epoch": 756} {"train_loss": -5.4694132804870605, "global_step": 31766, "epoch": 756} {"train_loss": -5.5381622314453125, "global_step": 31767, "epoch": 756} {"train_loss": -5.364863395690918, "global_step": 31768, "epoch": 756} {"train_loss": -5.509489059448242, "global_step": 31769, "epoch": 756} {"train_loss": -5.500434398651123, "global_step": 31770, "epoch": 756} {"train_loss": -5.523641109466553, "global_step": 31771, "epoch": 756} {"train_loss": -5.609516143798828, "global_step": 31772, "epoch": 756} {"train_loss": -5.4548726081848145, "global_step": 31773, "epoch": 756} {"train_loss": -5.448713302612305, "global_step": 31774, "epoch": 756} {"train_loss": -5.492671012878418, "global_step": 31775, "epoch": 756} {"train_loss": -5.618562698364258, "global_step": 31776, "epoch": 756} {"train_loss": -5.597415924072266, "global_step": 31777, "epoch": 756} {"train_loss": -5.62773323059082, "global_step": 31778, "epoch": 756} {"train_loss": -5.657467842102051, "global_step": 31779, "epoch": 756} {"train_loss": -5.420637130737305, "global_step": 31780, "epoch": 756} {"train_loss": -5.491262435913086, "global_step": 31781, "epoch": 756} {"train_loss": -5.500782012939453, "global_step": 31782, "epoch": 756} {"train_loss": -5.63505220413208, "global_step": 31783, "epoch": 756} {"train_loss": -5.6238861083984375, "global_step": 31784, "epoch": 756} {"train_loss": -5.637951850891113, "global_step": 31785, "epoch": 756} {"train_loss": -5.3967814445495605, "global_step": 31786, "epoch": 756} {"train_loss": -5.508722305297852, "global_step": 31787, "epoch": 756} {"train_loss": -5.458055019378662, "global_step": 31788, "epoch": 756} {"train_loss": -5.387537002563477, "global_step": 31789, "epoch": 756} {"train_loss": -5.4769978523254395, "global_step": 31790, "epoch": 756} {"train_loss": -5.469510078430176, "global_step": 31791, "epoch": 756} {"train_loss": -5.613653182983398, "global_step": 31792, "epoch": 756} {"train_loss": -5.513156345912388, "global_step": 31793, "epoch": 756, "val_loss": 62909.6640625} {"train_loss": -5.467351913452148, "global_step": 31794, "epoch": 757} {"train_loss": -5.448428153991699, "global_step": 31795, "epoch": 757} {"train_loss": -5.577897548675537, "global_step": 31796, "epoch": 757} {"train_loss": -5.540257453918457, "global_step": 31797, "epoch": 757} {"train_loss": -5.638859748840332, "global_step": 31798, "epoch": 757} {"train_loss": -5.41008186340332, "global_step": 31799, "epoch": 757} {"train_loss": -5.450814247131348, "global_step": 31800, "epoch": 757} {"train_loss": -5.475172519683838, "global_step": 31801, "epoch": 757} {"train_loss": -5.381961822509766, "global_step": 31802, "epoch": 757} {"train_loss": -5.594087600708008, "global_step": 31803, "epoch": 757} {"train_loss": -5.426810264587402, "global_step": 31804, "epoch": 757} {"train_loss": -5.540940761566162, "global_step": 31805, "epoch": 757} {"train_loss": -5.4342145919799805, "global_step": 31806, "epoch": 757} {"train_loss": -5.408818244934082, "global_step": 31807, "epoch": 757} {"train_loss": -5.423048973083496, "global_step": 31808, "epoch": 757} {"train_loss": -5.3398847579956055, "global_step": 31809, "epoch": 757} {"train_loss": -5.423046112060547, "global_step": 31810, "epoch": 757} {"train_loss": -5.5089006423950195, "global_step": 31811, "epoch": 757} {"train_loss": -5.598525047302246, "global_step": 31812, "epoch": 757} {"train_loss": -5.472926139831543, "global_step": 31813, "epoch": 757} {"train_loss": -5.527395725250244, "global_step": 31814, "epoch": 757} {"train_loss": -5.412510395050049, "global_step": 31815, "epoch": 757} {"train_loss": -5.632811546325684, "global_step": 31816, "epoch": 757} {"train_loss": -5.502730846405029, "global_step": 31817, "epoch": 757} {"train_loss": -5.540800094604492, "global_step": 31818, "epoch": 757} {"train_loss": -5.488909721374512, "global_step": 31819, "epoch": 757} {"train_loss": -5.587921142578125, "global_step": 31820, "epoch": 757} {"train_loss": -5.513559341430664, "global_step": 31821, "epoch": 757} {"train_loss": -5.473696708679199, "global_step": 31822, "epoch": 757} {"train_loss": -5.521923065185547, "global_step": 31823, "epoch": 757} {"train_loss": -5.529818534851074, "global_step": 31824, "epoch": 757} {"train_loss": -5.446396350860596, "global_step": 31825, "epoch": 757} {"train_loss": -5.510072708129883, "global_step": 31826, "epoch": 757} {"train_loss": -5.524769306182861, "global_step": 31827, "epoch": 757} {"train_loss": -5.624449729919434, "global_step": 31828, "epoch": 757} {"train_loss": -5.542497634887695, "global_step": 31829, "epoch": 757} {"train_loss": -5.570128440856934, "global_step": 31830, "epoch": 757} {"train_loss": -5.5532708168029785, "global_step": 31831, "epoch": 757} {"train_loss": -5.521231651306152, "global_step": 31832, "epoch": 757} {"train_loss": -5.451623439788818, "global_step": 31833, "epoch": 757} {"train_loss": -5.536108493804932, "global_step": 31834, "epoch": 757} {"train_loss": -5.501167933146159, "global_step": 31835, "epoch": 757, "val_loss": 62782.2578125} {"train_loss": -5.594393730163574, "global_step": 31836, "epoch": 758} {"train_loss": -5.620966911315918, "global_step": 31837, "epoch": 758} {"train_loss": -5.297061920166016, "global_step": 31838, "epoch": 758} {"train_loss": -5.566570281982422, "global_step": 31839, "epoch": 758} {"train_loss": -5.460928440093994, "global_step": 31840, "epoch": 758} {"train_loss": -5.417985916137695, "global_step": 31841, "epoch": 758} {"train_loss": -5.681282997131348, "global_step": 31842, "epoch": 758} {"train_loss": -5.284261703491211, "global_step": 31843, "epoch": 758} {"train_loss": -5.413196563720703, "global_step": 31844, "epoch": 758} {"train_loss": -5.5643744468688965, "global_step": 31845, "epoch": 758} {"train_loss": -5.346205711364746, "global_step": 31846, "epoch": 758} {"train_loss": -5.5440354347229, "global_step": 31847, "epoch": 758} {"train_loss": -5.450952529907227, "global_step": 31848, "epoch": 758} {"train_loss": -5.311773300170898, "global_step": 31849, "epoch": 758} {"train_loss": -5.386910438537598, "global_step": 31850, "epoch": 758} {"train_loss": -5.462586879730225, "global_step": 31851, "epoch": 758} {"train_loss": -5.383957862854004, "global_step": 31852, "epoch": 758} {"train_loss": -5.438867568969727, "global_step": 31853, "epoch": 758} {"train_loss": -5.540315628051758, "global_step": 31854, "epoch": 758} {"train_loss": -5.309394359588623, "global_step": 31855, "epoch": 758} {"train_loss": -5.454638481140137, "global_step": 31856, "epoch": 758} {"train_loss": -5.413561820983887, "global_step": 31857, "epoch": 758} {"train_loss": -5.545652389526367, "global_step": 31858, "epoch": 758} {"train_loss": -5.502495288848877, "global_step": 31859, "epoch": 758} {"train_loss": -5.427107810974121, "global_step": 31860, "epoch": 758} {"train_loss": -5.445925712585449, "global_step": 31861, "epoch": 758} {"train_loss": -5.457980155944824, "global_step": 31862, "epoch": 758} {"train_loss": -5.404355049133301, "global_step": 31863, "epoch": 758} {"train_loss": -5.60988712310791, "global_step": 31864, "epoch": 758} {"train_loss": -5.471059322357178, "global_step": 31865, "epoch": 758} {"train_loss": -5.463008880615234, "global_step": 31866, "epoch": 758} {"train_loss": -5.560234069824219, "global_step": 31867, "epoch": 758} {"train_loss": -5.463332176208496, "global_step": 31868, "epoch": 758} {"train_loss": -5.543143272399902, "global_step": 31869, "epoch": 758} {"train_loss": -5.488372325897217, "global_step": 31870, "epoch": 758} {"train_loss": -5.4521484375, "global_step": 31871, "epoch": 758} {"train_loss": -5.488753318786621, "global_step": 31872, "epoch": 758} {"train_loss": -5.485678672790527, "global_step": 31873, "epoch": 758} {"train_loss": -5.501775741577148, "global_step": 31874, "epoch": 758} {"train_loss": -5.653225421905518, "global_step": 31875, "epoch": 758} {"train_loss": -5.422410011291504, "global_step": 31876, "epoch": 758} {"train_loss": -5.473703475225539, "global_step": 31877, "epoch": 758, "val_loss": 63000.484375} {"train_loss": -5.545389652252197, "global_step": 31878, "epoch": 759} {"train_loss": -5.422968864440918, "global_step": 31879, "epoch": 759} {"train_loss": -5.550797462463379, "global_step": 31880, "epoch": 759} {"train_loss": -5.561186790466309, "global_step": 31881, "epoch": 759} {"train_loss": -5.40201473236084, "global_step": 31882, "epoch": 759} {"train_loss": -5.474071979522705, "global_step": 31883, "epoch": 759} {"train_loss": -5.464763641357422, "global_step": 31884, "epoch": 759} {"train_loss": -5.612025737762451, "global_step": 31885, "epoch": 759} {"train_loss": -5.495417594909668, "global_step": 31886, "epoch": 759} {"train_loss": -5.485813617706299, "global_step": 31887, "epoch": 759} {"train_loss": -5.558040618896484, "global_step": 31888, "epoch": 759} {"train_loss": -5.606350898742676, "global_step": 31889, "epoch": 759} {"train_loss": -5.5728583335876465, "global_step": 31890, "epoch": 759} {"train_loss": -5.537205219268799, "global_step": 31891, "epoch": 759} {"train_loss": -5.470256805419922, "global_step": 31892, "epoch": 759} {"train_loss": -5.357887268066406, "global_step": 31893, "epoch": 759} {"train_loss": -5.558156967163086, "global_step": 31894, "epoch": 759} {"train_loss": -5.561919689178467, "global_step": 31895, "epoch": 759} {"train_loss": -5.3698625564575195, "global_step": 31896, "epoch": 759} {"train_loss": -5.497276782989502, "global_step": 31897, "epoch": 759} {"train_loss": -5.585962295532227, "global_step": 31898, "epoch": 759} {"train_loss": -5.554845333099365, "global_step": 31899, "epoch": 759} {"train_loss": -5.480255603790283, "global_step": 31900, "epoch": 759} {"train_loss": -5.491396903991699, "global_step": 31901, "epoch": 759} {"train_loss": -5.400208473205566, "global_step": 31902, "epoch": 759} {"train_loss": -5.390083312988281, "global_step": 31903, "epoch": 759} {"train_loss": -5.574898719787598, "global_step": 31904, "epoch": 759} {"train_loss": -5.379876136779785, "global_step": 31905, "epoch": 759} {"train_loss": -5.62690544128418, "global_step": 31906, "epoch": 759} {"train_loss": -5.571983337402344, "global_step": 31907, "epoch": 759} {"train_loss": -5.458423614501953, "global_step": 31908, "epoch": 759} {"train_loss": -5.51613187789917, "global_step": 31909, "epoch": 759} {"train_loss": -5.435756683349609, "global_step": 31910, "epoch": 759} {"train_loss": -5.348816871643066, "global_step": 31911, "epoch": 759} {"train_loss": -5.470606803894043, "global_step": 31912, "epoch": 759} {"train_loss": -5.490495681762695, "global_step": 31913, "epoch": 759} {"train_loss": -5.530004978179932, "global_step": 31914, "epoch": 759} {"train_loss": -5.264515399932861, "global_step": 31915, "epoch": 759} {"train_loss": -5.603333473205566, "global_step": 31916, "epoch": 759} {"train_loss": -5.50123929977417, "global_step": 31917, "epoch": 759} {"train_loss": -5.612713813781738, "global_step": 31918, "epoch": 759} {"train_loss": -5.497427202406383, "global_step": 31919, "epoch": 759, "val_loss": 63172.21875} {"train_loss": -5.555802345275879, "global_step": 31920, "epoch": 760} {"train_loss": -5.393628120422363, "global_step": 31921, "epoch": 760} {"train_loss": -5.594302654266357, "global_step": 31922, "epoch": 760} {"train_loss": -5.578322410583496, "global_step": 31923, "epoch": 760} {"train_loss": -5.559382915496826, "global_step": 31924, "epoch": 760} {"train_loss": -5.508547782897949, "global_step": 31925, "epoch": 760} {"train_loss": -5.548785209655762, "global_step": 31926, "epoch": 760} {"train_loss": -5.564205169677734, "global_step": 31927, "epoch": 760} {"train_loss": -5.4022417068481445, "global_step": 31928, "epoch": 760} {"train_loss": -5.490067481994629, "global_step": 31929, "epoch": 760} {"train_loss": -5.446364879608154, "global_step": 31930, "epoch": 760} {"train_loss": -5.546381950378418, "global_step": 31931, "epoch": 760} {"train_loss": -5.6173014640808105, "global_step": 31932, "epoch": 760} {"train_loss": -5.489193916320801, "global_step": 31933, "epoch": 760} {"train_loss": -5.574359893798828, "global_step": 31934, "epoch": 760} {"train_loss": -5.512301445007324, "global_step": 31935, "epoch": 760} {"train_loss": -5.548699378967285, "global_step": 31936, "epoch": 760} {"train_loss": -5.513213634490967, "global_step": 31937, "epoch": 760} {"train_loss": -5.512530326843262, "global_step": 31938, "epoch": 760} {"train_loss": -5.58095645904541, "global_step": 31939, "epoch": 760} {"train_loss": -5.510188579559326, "global_step": 31940, "epoch": 760} {"train_loss": -5.4215898513793945, "global_step": 31941, "epoch": 760} {"train_loss": -5.445978164672852, "global_step": 31942, "epoch": 760} {"train_loss": -5.587950229644775, "global_step": 31943, "epoch": 760} {"train_loss": -5.524864196777344, "global_step": 31944, "epoch": 760} {"train_loss": -5.398314476013184, "global_step": 31945, "epoch": 760} {"train_loss": -5.386053562164307, "global_step": 31946, "epoch": 760} {"train_loss": -5.490236282348633, "global_step": 31947, "epoch": 760} {"train_loss": -5.4371867179870605, "global_step": 31948, "epoch": 760} {"train_loss": -5.375000953674316, "global_step": 31949, "epoch": 760} {"train_loss": -5.451298713684082, "global_step": 31950, "epoch": 760} {"train_loss": -5.381413459777832, "global_step": 31951, "epoch": 760} {"train_loss": -5.50386905670166, "global_step": 31952, "epoch": 760} {"train_loss": -5.365893840789795, "global_step": 31953, "epoch": 760} {"train_loss": -5.473376274108887, "global_step": 31954, "epoch": 760} {"train_loss": -5.499934196472168, "global_step": 31955, "epoch": 760} {"train_loss": -5.270469665527344, "global_step": 31956, "epoch": 760} {"train_loss": -5.569558143615723, "global_step": 31957, "epoch": 760} {"train_loss": -5.433730602264404, "global_step": 31958, "epoch": 760} {"train_loss": -5.540161609649658, "global_step": 31959, "epoch": 760} {"train_loss": -5.554412841796875, "global_step": 31960, "epoch": 760} {"train_loss": -5.490423281987508, "global_step": 31961, "epoch": 760, "val_loss": 62901.7734375} {"train_loss": -5.479462623596191, "global_step": 31962, "epoch": 761} {"train_loss": -5.551254749298096, "global_step": 31963, "epoch": 761} {"train_loss": -5.570008277893066, "global_step": 31964, "epoch": 761} {"train_loss": -5.496278285980225, "global_step": 31965, "epoch": 761} {"train_loss": -5.550682544708252, "global_step": 31966, "epoch": 761} {"train_loss": -5.610248565673828, "global_step": 31967, "epoch": 761} {"train_loss": -5.569563865661621, "global_step": 31968, "epoch": 761} {"train_loss": -5.47674560546875, "global_step": 31969, "epoch": 761} {"train_loss": -5.497381687164307, "global_step": 31970, "epoch": 761} {"train_loss": -5.547228813171387, "global_step": 31971, "epoch": 761} {"train_loss": -5.503561496734619, "global_step": 31972, "epoch": 761} {"train_loss": -5.481022357940674, "global_step": 31973, "epoch": 761} {"train_loss": -5.565823554992676, "global_step": 31974, "epoch": 761} {"train_loss": -5.474119186401367, "global_step": 31975, "epoch": 761} {"train_loss": -5.529437065124512, "global_step": 31976, "epoch": 761} {"train_loss": -5.5562896728515625, "global_step": 31977, "epoch": 761} {"train_loss": -5.26485538482666, "global_step": 31978, "epoch": 761} {"train_loss": -5.5522379875183105, "global_step": 31979, "epoch": 761} {"train_loss": -5.406633377075195, "global_step": 31980, "epoch": 761} {"train_loss": -5.446142673492432, "global_step": 31981, "epoch": 761} {"train_loss": -5.529975891113281, "global_step": 31982, "epoch": 761} {"train_loss": -5.43480110168457, "global_step": 31983, "epoch": 761} {"train_loss": -5.545802116394043, "global_step": 31984, "epoch": 761} {"train_loss": -5.397362232208252, "global_step": 31985, "epoch": 761} {"train_loss": -5.498381614685059, "global_step": 31986, "epoch": 761} {"train_loss": -5.506719589233398, "global_step": 31987, "epoch": 761} {"train_loss": -5.4724626541137695, "global_step": 31988, "epoch": 761} {"train_loss": -5.5713396072387695, "global_step": 31989, "epoch": 761} {"train_loss": -5.643792629241943, "global_step": 31990, "epoch": 761} {"train_loss": -5.404635429382324, "global_step": 31991, "epoch": 761} {"train_loss": -5.463067531585693, "global_step": 31992, "epoch": 761} {"train_loss": -5.464204788208008, "global_step": 31993, "epoch": 761} {"train_loss": -5.546823501586914, "global_step": 31994, "epoch": 761} {"train_loss": -5.489307403564453, "global_step": 31995, "epoch": 761} {"train_loss": -5.468671798706055, "global_step": 31996, "epoch": 761} {"train_loss": -5.444972038269043, "global_step": 31997, "epoch": 761} {"train_loss": -5.60556173324585, "global_step": 31998, "epoch": 761} {"train_loss": -5.424185752868652, "global_step": 31999, "epoch": 761} {"train_loss": -5.528077125549316, "global_step": 32000, "epoch": 761} {"train_loss": -5.415839672088623, "global_step": 32001, "epoch": 761} {"train_loss": -5.532196998596191, "global_step": 32002, "epoch": 761} {"train_loss": -5.503772474470592, "global_step": 32003, "epoch": 761, "val_loss": 62889.84765625} {"train_loss": -5.384337902069092, "global_step": 32004, "epoch": 762} {"train_loss": -5.662487983703613, "global_step": 32005, "epoch": 762} {"train_loss": -5.5239644050598145, "global_step": 32006, "epoch": 762} {"train_loss": -5.4807448387146, "global_step": 32007, "epoch": 762} {"train_loss": -5.570163249969482, "global_step": 32008, "epoch": 762} {"train_loss": -5.544399738311768, "global_step": 32009, "epoch": 762} {"train_loss": -5.525629043579102, "global_step": 32010, "epoch": 762} {"train_loss": -5.5740509033203125, "global_step": 32011, "epoch": 762} {"train_loss": -5.605325698852539, "global_step": 32012, "epoch": 762} {"train_loss": -5.471829414367676, "global_step": 32013, "epoch": 762} {"train_loss": -5.382409572601318, "global_step": 32014, "epoch": 762} {"train_loss": -5.653451919555664, "global_step": 32015, "epoch": 762} {"train_loss": -5.564212799072266, "global_step": 32016, "epoch": 762} {"train_loss": -5.546265602111816, "global_step": 32017, "epoch": 762} {"train_loss": -5.527424335479736, "global_step": 32018, "epoch": 762} {"train_loss": -5.449633598327637, "global_step": 32019, "epoch": 762} {"train_loss": -5.534745216369629, "global_step": 32020, "epoch": 762} {"train_loss": -5.523284912109375, "global_step": 32021, "epoch": 762} {"train_loss": -5.522705078125, "global_step": 32022, "epoch": 762} {"train_loss": -5.438889026641846, "global_step": 32023, "epoch": 762} {"train_loss": -5.50508975982666, "global_step": 32024, "epoch": 762} {"train_loss": -5.425270080566406, "global_step": 32025, "epoch": 762} {"train_loss": -5.435972690582275, "global_step": 32026, "epoch": 762} {"train_loss": -5.48518705368042, "global_step": 32027, "epoch": 762} {"train_loss": -5.2434282302856445, "global_step": 32028, "epoch": 762} {"train_loss": -5.458418369293213, "global_step": 32029, "epoch": 762} {"train_loss": -5.456482887268066, "global_step": 32030, "epoch": 762} {"train_loss": -5.403285980224609, "global_step": 32031, "epoch": 762} {"train_loss": -5.564999103546143, "global_step": 32032, "epoch": 762} {"train_loss": -5.430824279785156, "global_step": 32033, "epoch": 762} {"train_loss": -5.439684867858887, "global_step": 32034, "epoch": 762} {"train_loss": -5.591269493103027, "global_step": 32035, "epoch": 762} {"train_loss": -5.505797863006592, "global_step": 32036, "epoch": 762} {"train_loss": -5.557738304138184, "global_step": 32037, "epoch": 762} {"train_loss": -5.479514122009277, "global_step": 32038, "epoch": 762} {"train_loss": -5.441511154174805, "global_step": 32039, "epoch": 762} {"train_loss": -5.518332004547119, "global_step": 32040, "epoch": 762} {"train_loss": -5.431095123291016, "global_step": 32041, "epoch": 762} {"train_loss": -5.510807037353516, "global_step": 32042, "epoch": 762} {"train_loss": -5.558293342590332, "global_step": 32043, "epoch": 762} {"train_loss": -5.451938152313232, "global_step": 32044, "epoch": 762} {"train_loss": -5.498300461542039, "global_step": 32045, "epoch": 762, "val_loss": 62829.6640625} {"train_loss": -5.516084671020508, "global_step": 32046, "epoch": 763} {"train_loss": -5.55027961730957, "global_step": 32047, "epoch": 763} {"train_loss": -5.450644493103027, "global_step": 32048, "epoch": 763} {"train_loss": -5.545223712921143, "global_step": 32049, "epoch": 763} {"train_loss": -5.440210819244385, "global_step": 32050, "epoch": 763} {"train_loss": -5.446329116821289, "global_step": 32051, "epoch": 763} {"train_loss": -5.50201416015625, "global_step": 32052, "epoch": 763} {"train_loss": -5.533106327056885, "global_step": 32053, "epoch": 763} {"train_loss": -5.413234233856201, "global_step": 32054, "epoch": 763} {"train_loss": -5.445843696594238, "global_step": 32055, "epoch": 763} {"train_loss": -5.535297393798828, "global_step": 32056, "epoch": 763} {"train_loss": -5.556589126586914, "global_step": 32057, "epoch": 763} {"train_loss": -5.467948913574219, "global_step": 32058, "epoch": 763} {"train_loss": -5.5378007888793945, "global_step": 32059, "epoch": 763} {"train_loss": -5.508291244506836, "global_step": 32060, "epoch": 763} {"train_loss": -5.463773727416992, "global_step": 32061, "epoch": 763} {"train_loss": -5.480113983154297, "global_step": 32062, "epoch": 763} {"train_loss": -5.5342183113098145, "global_step": 32063, "epoch": 763} {"train_loss": -5.374744892120361, "global_step": 32064, "epoch": 763} {"train_loss": -5.481196403503418, "global_step": 32065, "epoch": 763} {"train_loss": -5.5833845138549805, "global_step": 32066, "epoch": 763} {"train_loss": -5.3396077156066895, "global_step": 32067, "epoch": 763} {"train_loss": -5.478403568267822, "global_step": 32068, "epoch": 763} {"train_loss": -5.476215839385986, "global_step": 32069, "epoch": 763} {"train_loss": -5.4066667556762695, "global_step": 32070, "epoch": 763} {"train_loss": -5.421193599700928, "global_step": 32071, "epoch": 763} {"train_loss": -5.49196195602417, "global_step": 32072, "epoch": 763} {"train_loss": -5.49808406829834, "global_step": 32073, "epoch": 763} {"train_loss": -5.613715171813965, "global_step": 32074, "epoch": 763} {"train_loss": -5.645877838134766, "global_step": 32075, "epoch": 763} {"train_loss": -5.6322431564331055, "global_step": 32076, "epoch": 763} {"train_loss": -5.495621681213379, "global_step": 32077, "epoch": 763} {"train_loss": -5.515111446380615, "global_step": 32078, "epoch": 763} {"train_loss": -5.464969158172607, "global_step": 32079, "epoch": 763} {"train_loss": -5.496586799621582, "global_step": 32080, "epoch": 763} {"train_loss": -5.558328628540039, "global_step": 32081, "epoch": 763} {"train_loss": -5.5729899406433105, "global_step": 32082, "epoch": 763} {"train_loss": -5.663609027862549, "global_step": 32083, "epoch": 763} {"train_loss": -5.518638610839844, "global_step": 32084, "epoch": 763} {"train_loss": -5.464969635009766, "global_step": 32085, "epoch": 763} {"train_loss": -5.6039605140686035, "global_step": 32086, "epoch": 763} {"train_loss": -5.503438438688006, "global_step": 32087, "epoch": 763, "val_loss": 62849.1953125} {"train_loss": -5.563875198364258, "global_step": 32088, "epoch": 764} {"train_loss": -5.602673053741455, "global_step": 32089, "epoch": 764} {"train_loss": -5.598550319671631, "global_step": 32090, "epoch": 764} {"train_loss": -5.658648490905762, "global_step": 32091, "epoch": 764} {"train_loss": -5.532408714294434, "global_step": 32092, "epoch": 764} {"train_loss": -5.490744113922119, "global_step": 32093, "epoch": 764} {"train_loss": -5.576305389404297, "global_step": 32094, "epoch": 764} {"train_loss": -5.405149936676025, "global_step": 32095, "epoch": 764} {"train_loss": -5.51484489440918, "global_step": 32096, "epoch": 764} {"train_loss": -5.460062026977539, "global_step": 32097, "epoch": 764} {"train_loss": -5.512458801269531, "global_step": 32098, "epoch": 764} {"train_loss": -5.548929214477539, "global_step": 32099, "epoch": 764} {"train_loss": -5.562914848327637, "global_step": 32100, "epoch": 764} {"train_loss": -5.403660774230957, "global_step": 32101, "epoch": 764} {"train_loss": -5.447924613952637, "global_step": 32102, "epoch": 764} {"train_loss": -5.315780162811279, "global_step": 32103, "epoch": 764} {"train_loss": -5.598148345947266, "global_step": 32104, "epoch": 764} {"train_loss": -5.387503623962402, "global_step": 32105, "epoch": 764} {"train_loss": -5.380481243133545, "global_step": 32106, "epoch": 764} {"train_loss": -5.4533891677856445, "global_step": 32107, "epoch": 764} {"train_loss": -5.455531120300293, "global_step": 32108, "epoch": 764} {"train_loss": -5.4555983543396, "global_step": 32109, "epoch": 764} {"train_loss": -5.467012882232666, "global_step": 32110, "epoch": 764} {"train_loss": -5.497527122497559, "global_step": 32111, "epoch": 764} {"train_loss": -5.422073841094971, "global_step": 32112, "epoch": 764} {"train_loss": -5.40674352645874, "global_step": 32113, "epoch": 764} {"train_loss": -5.404397964477539, "global_step": 32114, "epoch": 764} {"train_loss": -5.539826393127441, "global_step": 32115, "epoch": 764} {"train_loss": -5.4414753913879395, "global_step": 32116, "epoch": 764} {"train_loss": -5.49422550201416, "global_step": 32117, "epoch": 764} {"train_loss": -5.323790073394775, "global_step": 32118, "epoch": 764} {"train_loss": -5.485999584197998, "global_step": 32119, "epoch": 764} {"train_loss": -5.357386112213135, "global_step": 32120, "epoch": 764} {"train_loss": -5.578305721282959, "global_step": 32121, "epoch": 764} {"train_loss": -5.4479875564575195, "global_step": 32122, "epoch": 764} {"train_loss": -5.431249141693115, "global_step": 32123, "epoch": 764} {"train_loss": -5.509720802307129, "global_step": 32124, "epoch": 764} {"train_loss": -5.37520694732666, "global_step": 32125, "epoch": 764} {"train_loss": -5.509264945983887, "global_step": 32126, "epoch": 764} {"train_loss": -5.4651198387146, "global_step": 32127, "epoch": 764} {"train_loss": -5.457577705383301, "global_step": 32128, "epoch": 764} {"train_loss": -5.477083319709415, "global_step": 32129, "epoch": 764, "val_loss": 62983.92578125} {"train_loss": -5.398369789123535, "global_step": 32130, "epoch": 765} {"train_loss": -5.472259998321533, "global_step": 32131, "epoch": 765} {"train_loss": -5.427580833435059, "global_step": 32132, "epoch": 765} {"train_loss": -5.610470294952393, "global_step": 32133, "epoch": 765} {"train_loss": -5.412696838378906, "global_step": 32134, "epoch": 765} {"train_loss": -5.482393741607666, "global_step": 32135, "epoch": 765} {"train_loss": -5.431474685668945, "global_step": 32136, "epoch": 765} {"train_loss": -5.473040580749512, "global_step": 32137, "epoch": 765} {"train_loss": -5.5274553298950195, "global_step": 32138, "epoch": 765} {"train_loss": -5.520130157470703, "global_step": 32139, "epoch": 765} {"train_loss": -5.691437721252441, "global_step": 32140, "epoch": 765} {"train_loss": -5.506482124328613, "global_step": 32141, "epoch": 765} {"train_loss": -5.416596412658691, "global_step": 32142, "epoch": 765} {"train_loss": -5.593998908996582, "global_step": 32143, "epoch": 765} {"train_loss": -5.682430267333984, "global_step": 32144, "epoch": 765} {"train_loss": -5.40445613861084, "global_step": 32145, "epoch": 765} {"train_loss": -5.413320541381836, "global_step": 32146, "epoch": 765} {"train_loss": -5.515103816986084, "global_step": 32147, "epoch": 765} {"train_loss": -5.523392200469971, "global_step": 32148, "epoch": 765} {"train_loss": -5.557552814483643, "global_step": 32149, "epoch": 765} {"train_loss": -5.430456161499023, "global_step": 32150, "epoch": 765} {"train_loss": -5.556451797485352, "global_step": 32151, "epoch": 765} {"train_loss": -5.469935417175293, "global_step": 32152, "epoch": 765} {"train_loss": -5.551792621612549, "global_step": 32153, "epoch": 765} {"train_loss": -5.547579765319824, "global_step": 32154, "epoch": 765} {"train_loss": -5.550883769989014, "global_step": 32155, "epoch": 765} {"train_loss": -5.471346855163574, "global_step": 32156, "epoch": 765} {"train_loss": -5.530455112457275, "global_step": 32157, "epoch": 765} {"train_loss": -5.609199523925781, "global_step": 32158, "epoch": 765} {"train_loss": -5.402531623840332, "global_step": 32159, "epoch": 765} {"train_loss": -5.518255710601807, "global_step": 32160, "epoch": 765} {"train_loss": -5.622247219085693, "global_step": 32161, "epoch": 765} {"train_loss": -5.42582893371582, "global_step": 32162, "epoch": 765} {"train_loss": -5.6537065505981445, "global_step": 32163, "epoch": 765} {"train_loss": -5.525524139404297, "global_step": 32164, "epoch": 765} {"train_loss": -5.425258636474609, "global_step": 32165, "epoch": 765} {"train_loss": -5.587307929992676, "global_step": 32166, "epoch": 765} {"train_loss": -5.445286750793457, "global_step": 32167, "epoch": 765} {"train_loss": -5.452373027801514, "global_step": 32168, "epoch": 765} {"train_loss": -5.52851676940918, "global_step": 32169, "epoch": 765} {"train_loss": -5.498385429382324, "global_step": 32170, "epoch": 765} {"train_loss": -5.509585494086856, "global_step": 32171, "epoch": 765, "val_loss": 62712.8203125} {"train_loss": -5.682954788208008, "global_step": 32172, "epoch": 766} {"train_loss": -5.445916175842285, "global_step": 32173, "epoch": 766} {"train_loss": -5.536396026611328, "global_step": 32174, "epoch": 766} {"train_loss": -5.529217720031738, "global_step": 32175, "epoch": 766} {"train_loss": -5.545863628387451, "global_step": 32176, "epoch": 766} {"train_loss": -5.467496395111084, "global_step": 32177, "epoch": 766} {"train_loss": -5.53703498840332, "global_step": 32178, "epoch": 766} {"train_loss": -5.440180778503418, "global_step": 32179, "epoch": 766} {"train_loss": -5.484429359436035, "global_step": 32180, "epoch": 766} {"train_loss": -5.366467475891113, "global_step": 32181, "epoch": 766} {"train_loss": -5.520798683166504, "global_step": 32182, "epoch": 766} {"train_loss": -5.49329948425293, "global_step": 32183, "epoch": 766} {"train_loss": -5.528786659240723, "global_step": 32184, "epoch": 766} {"train_loss": -5.368981838226318, "global_step": 32185, "epoch": 766} {"train_loss": -5.464529514312744, "global_step": 32186, "epoch": 766} {"train_loss": -5.361510276794434, "global_step": 32187, "epoch": 766} {"train_loss": -5.419832229614258, "global_step": 32188, "epoch": 766} {"train_loss": -5.559689521789551, "global_step": 32189, "epoch": 766} {"train_loss": -5.435702323913574, "global_step": 32190, "epoch": 766} {"train_loss": -5.518069744110107, "global_step": 32191, "epoch": 766} {"train_loss": -5.530399322509766, "global_step": 32192, "epoch": 766} {"train_loss": -5.398532867431641, "global_step": 32193, "epoch": 766} {"train_loss": -5.5808820724487305, "global_step": 32194, "epoch": 766} {"train_loss": -5.502198696136475, "global_step": 32195, "epoch": 766} {"train_loss": -5.575822830200195, "global_step": 32196, "epoch": 766} {"train_loss": -5.570776462554932, "global_step": 32197, "epoch": 766} {"train_loss": -5.560196876525879, "global_step": 32198, "epoch": 766} {"train_loss": -5.538225173950195, "global_step": 32199, "epoch": 766} {"train_loss": -5.512270450592041, "global_step": 32200, "epoch": 766} {"train_loss": -5.538727760314941, "global_step": 32201, "epoch": 766} {"train_loss": -5.665040016174316, "global_step": 32202, "epoch": 766} {"train_loss": -5.581282615661621, "global_step": 32203, "epoch": 766} {"train_loss": -5.565642833709717, "global_step": 32204, "epoch": 766} {"train_loss": -5.4762468338012695, "global_step": 32205, "epoch": 766} {"train_loss": -5.609408378601074, "global_step": 32206, "epoch": 766} {"train_loss": -5.431000709533691, "global_step": 32207, "epoch": 766} {"train_loss": -5.458725929260254, "global_step": 32208, "epoch": 766} {"train_loss": -5.577685832977295, "global_step": 32209, "epoch": 766} {"train_loss": -5.6219940185546875, "global_step": 32210, "epoch": 766} {"train_loss": -5.447028160095215, "global_step": 32211, "epoch": 766} {"train_loss": -5.453728199005127, "global_step": 32212, "epoch": 766} {"train_loss": -5.511183920360747, "global_step": 32213, "epoch": 766, "val_loss": 62753.3125} {"train_loss": -5.492820739746094, "global_step": 32214, "epoch": 767} {"train_loss": -5.500828266143799, "global_step": 32215, "epoch": 767} {"train_loss": -5.582777976989746, "global_step": 32216, "epoch": 767} {"train_loss": -5.550408840179443, "global_step": 32217, "epoch": 767} {"train_loss": -5.500556945800781, "global_step": 32218, "epoch": 767} {"train_loss": -5.5763654708862305, "global_step": 32219, "epoch": 767} {"train_loss": -5.3960161209106445, "global_step": 32220, "epoch": 767} {"train_loss": -5.509518623352051, "global_step": 32221, "epoch": 767} {"train_loss": -5.372955322265625, "global_step": 32222, "epoch": 767} {"train_loss": -5.489351272583008, "global_step": 32223, "epoch": 767} {"train_loss": -5.377657890319824, "global_step": 32224, "epoch": 767} {"train_loss": -5.45979642868042, "global_step": 32225, "epoch": 767} {"train_loss": -5.5612006187438965, "global_step": 32226, "epoch": 767} {"train_loss": -5.515009880065918, "global_step": 32227, "epoch": 767} {"train_loss": -5.436866760253906, "global_step": 32228, "epoch": 767} {"train_loss": -5.426057815551758, "global_step": 32229, "epoch": 767} {"train_loss": -5.445014953613281, "global_step": 32230, "epoch": 767} {"train_loss": -5.554605484008789, "global_step": 32231, "epoch": 767} {"train_loss": -5.4407806396484375, "global_step": 32232, "epoch": 767} {"train_loss": -5.6911773681640625, "global_step": 32233, "epoch": 767} {"train_loss": -5.424737453460693, "global_step": 32234, "epoch": 767} {"train_loss": -5.546886444091797, "global_step": 32235, "epoch": 767} {"train_loss": -5.5639142990112305, "global_step": 32236, "epoch": 767} {"train_loss": -5.446678638458252, "global_step": 32237, "epoch": 767} {"train_loss": -5.550042152404785, "global_step": 32238, "epoch": 767} {"train_loss": -5.556365966796875, "global_step": 32239, "epoch": 767} {"train_loss": -5.4698991775512695, "global_step": 32240, "epoch": 767} {"train_loss": -5.415862560272217, "global_step": 32241, "epoch": 767} {"train_loss": -5.5191426277160645, "global_step": 32242, "epoch": 767} {"train_loss": -5.508353233337402, "global_step": 32243, "epoch": 767} {"train_loss": -5.562174320220947, "global_step": 32244, "epoch": 767} {"train_loss": -5.419466018676758, "global_step": 32245, "epoch": 767} {"train_loss": -5.423595428466797, "global_step": 32246, "epoch": 767} {"train_loss": -5.531529426574707, "global_step": 32247, "epoch": 767} {"train_loss": -5.539720058441162, "global_step": 32248, "epoch": 767} {"train_loss": -5.371339797973633, "global_step": 32249, "epoch": 767} {"train_loss": -5.4762163162231445, "global_step": 32250, "epoch": 767} {"train_loss": -5.640186309814453, "global_step": 32251, "epoch": 767} {"train_loss": -5.411290168762207, "global_step": 32252, "epoch": 767} {"train_loss": -5.460484504699707, "global_step": 32253, "epoch": 767} {"train_loss": -5.36712646484375, "global_step": 32254, "epoch": 767} {"train_loss": -5.488568601154146, "global_step": 32255, "epoch": 767, "val_loss": 62954.31640625} {"train_loss": -5.552987575531006, "global_step": 32256, "epoch": 768} {"train_loss": -5.387438774108887, "global_step": 32257, "epoch": 768} {"train_loss": -5.507998466491699, "global_step": 32258, "epoch": 768} {"train_loss": -5.529784202575684, "global_step": 32259, "epoch": 768} {"train_loss": -5.350019931793213, "global_step": 32260, "epoch": 768} {"train_loss": -5.541069030761719, "global_step": 32261, "epoch": 768} {"train_loss": -5.384674072265625, "global_step": 32262, "epoch": 768} {"train_loss": -5.584249496459961, "global_step": 32263, "epoch": 768} {"train_loss": -5.530160427093506, "global_step": 32264, "epoch": 768} {"train_loss": -5.523776054382324, "global_step": 32265, "epoch": 768} {"train_loss": -5.514335632324219, "global_step": 32266, "epoch": 768} {"train_loss": -5.542967796325684, "global_step": 32267, "epoch": 768} {"train_loss": -5.564738750457764, "global_step": 32268, "epoch": 768} {"train_loss": -5.471588134765625, "global_step": 32269, "epoch": 768} {"train_loss": -5.569958209991455, "global_step": 32270, "epoch": 768} {"train_loss": -5.641518592834473, "global_step": 32271, "epoch": 768} {"train_loss": -5.477272033691406, "global_step": 32272, "epoch": 768} {"train_loss": -5.405986785888672, "global_step": 32273, "epoch": 768} {"train_loss": -5.519695281982422, "global_step": 32274, "epoch": 768} {"train_loss": -5.45914888381958, "global_step": 32275, "epoch": 768} {"train_loss": -5.539101600646973, "global_step": 32276, "epoch": 768} {"train_loss": -5.532548427581787, "global_step": 32277, "epoch": 768} {"train_loss": -5.484959602355957, "global_step": 32278, "epoch": 768} {"train_loss": -5.558157920837402, "global_step": 32279, "epoch": 768} {"train_loss": -5.519980430603027, "global_step": 32280, "epoch": 768} {"train_loss": -5.564652442932129, "global_step": 32281, "epoch": 768} {"train_loss": -5.549579620361328, "global_step": 32282, "epoch": 768} {"train_loss": -5.534848213195801, "global_step": 32283, "epoch": 768} {"train_loss": -5.503303050994873, "global_step": 32284, "epoch": 768} {"train_loss": -5.574297904968262, "global_step": 32285, "epoch": 768} {"train_loss": -5.457209587097168, "global_step": 32286, "epoch": 768} {"train_loss": -5.611806869506836, "global_step": 32287, "epoch": 768} {"train_loss": -5.5949602127075195, "global_step": 32288, "epoch": 768} {"train_loss": -5.4534149169921875, "global_step": 32289, "epoch": 768} {"train_loss": -5.574281215667725, "global_step": 32290, "epoch": 768} {"train_loss": -5.398082733154297, "global_step": 32291, "epoch": 768} {"train_loss": -5.514191150665283, "global_step": 32292, "epoch": 768} {"train_loss": -5.510533332824707, "global_step": 32293, "epoch": 768} {"train_loss": -5.426862716674805, "global_step": 32294, "epoch": 768} {"train_loss": -5.710670471191406, "global_step": 32295, "epoch": 768} {"train_loss": -5.553631782531738, "global_step": 32296, "epoch": 768} {"train_loss": -5.519358169464838, "global_step": 32297, "epoch": 768, "val_loss": 62851.3671875} {"train_loss": -5.546568870544434, "global_step": 32298, "epoch": 769} {"train_loss": -5.569547653198242, "global_step": 32299, "epoch": 769} {"train_loss": -5.471117973327637, "global_step": 32300, "epoch": 769} {"train_loss": -5.473194599151611, "global_step": 32301, "epoch": 769} {"train_loss": -5.5580596923828125, "global_step": 32302, "epoch": 769} {"train_loss": -5.419819355010986, "global_step": 32303, "epoch": 769} {"train_loss": -5.438052177429199, "global_step": 32304, "epoch": 769} {"train_loss": -5.555412769317627, "global_step": 32305, "epoch": 769} {"train_loss": -5.454171180725098, "global_step": 32306, "epoch": 769} {"train_loss": -5.656184673309326, "global_step": 32307, "epoch": 769} {"train_loss": -5.631115913391113, "global_step": 32308, "epoch": 769} {"train_loss": -5.4619221687316895, "global_step": 32309, "epoch": 769} {"train_loss": -5.445533752441406, "global_step": 32310, "epoch": 769} {"train_loss": -5.471538543701172, "global_step": 32311, "epoch": 769} {"train_loss": -5.3964643478393555, "global_step": 32312, "epoch": 769} {"train_loss": -5.5035810470581055, "global_step": 32313, "epoch": 769} {"train_loss": -5.509547233581543, "global_step": 32314, "epoch": 769} {"train_loss": -5.438802719116211, "global_step": 32315, "epoch": 769} {"train_loss": -5.509990215301514, "global_step": 32316, "epoch": 769} {"train_loss": -5.529114723205566, "global_step": 32317, "epoch": 769} {"train_loss": -5.432254791259766, "global_step": 32318, "epoch": 769} {"train_loss": -5.471856117248535, "global_step": 32319, "epoch": 769} {"train_loss": -5.53902530670166, "global_step": 32320, "epoch": 769} {"train_loss": -5.4643120765686035, "global_step": 32321, "epoch": 769} {"train_loss": -5.606400966644287, "global_step": 32322, "epoch": 769} {"train_loss": -5.59455680847168, "global_step": 32323, "epoch": 769} {"train_loss": -5.417399883270264, "global_step": 32324, "epoch": 769} {"train_loss": -5.550717353820801, "global_step": 32325, "epoch": 769} {"train_loss": -5.4945478439331055, "global_step": 32326, "epoch": 769} {"train_loss": -5.402673721313477, "global_step": 32327, "epoch": 769} {"train_loss": -5.511356830596924, "global_step": 32328, "epoch": 769} {"train_loss": -5.390352725982666, "global_step": 32329, "epoch": 769} {"train_loss": -5.490218639373779, "global_step": 32330, "epoch": 769} {"train_loss": -5.411365509033203, "global_step": 32331, "epoch": 769} {"train_loss": -5.484063625335693, "global_step": 32332, "epoch": 769} {"train_loss": -5.464908599853516, "global_step": 32333, "epoch": 769} {"train_loss": -5.63713264465332, "global_step": 32334, "epoch": 769} {"train_loss": -5.464406490325928, "global_step": 32335, "epoch": 769} {"train_loss": -5.380040168762207, "global_step": 32336, "epoch": 769} {"train_loss": -5.516176223754883, "global_step": 32337, "epoch": 769} {"train_loss": -5.574035167694092, "global_step": 32338, "epoch": 769} {"train_loss": -5.4969093799591064, "global_step": 32339, "epoch": 769, "val_loss": 63204.75} {"train_loss": -5.484058380126953, "global_step": 32340, "epoch": 770} {"train_loss": -5.398232460021973, "global_step": 32341, "epoch": 770} {"train_loss": -5.629308700561523, "global_step": 32342, "epoch": 770} {"train_loss": -5.6218671798706055, "global_step": 32343, "epoch": 770} {"train_loss": -5.482403755187988, "global_step": 32344, "epoch": 770} {"train_loss": -5.434210777282715, "global_step": 32345, "epoch": 770} {"train_loss": -5.429110527038574, "global_step": 32346, "epoch": 770} {"train_loss": -5.444007873535156, "global_step": 32347, "epoch": 770} {"train_loss": -5.380776882171631, "global_step": 32348, "epoch": 770} {"train_loss": -5.444936275482178, "global_step": 32349, "epoch": 770} {"train_loss": -5.5829668045043945, "global_step": 32350, "epoch": 770} {"train_loss": -5.3311052322387695, "global_step": 32351, "epoch": 770} {"train_loss": -5.580263614654541, "global_step": 32352, "epoch": 770} {"train_loss": -5.424798011779785, "global_step": 32353, "epoch": 770} {"train_loss": -5.482193946838379, "global_step": 32354, "epoch": 770} {"train_loss": -5.455409049987793, "global_step": 32355, "epoch": 770} {"train_loss": -5.4470295906066895, "global_step": 32356, "epoch": 770} {"train_loss": -5.582839012145996, "global_step": 32357, "epoch": 770} {"train_loss": -5.5492401123046875, "global_step": 32358, "epoch": 770} {"train_loss": -5.54168701171875, "global_step": 32359, "epoch": 770} {"train_loss": -5.5850348472595215, "global_step": 32360, "epoch": 770} {"train_loss": -5.620548725128174, "global_step": 32361, "epoch": 770} {"train_loss": -5.457573890686035, "global_step": 32362, "epoch": 770} {"train_loss": -5.487540245056152, "global_step": 32363, "epoch": 770} {"train_loss": -5.689664363861084, "global_step": 32364, "epoch": 770} {"train_loss": -5.598973751068115, "global_step": 32365, "epoch": 770} {"train_loss": -5.512018203735352, "global_step": 32366, "epoch": 770} {"train_loss": -5.568149566650391, "global_step": 32367, "epoch": 770} {"train_loss": -5.486172676086426, "global_step": 32368, "epoch": 770} {"train_loss": -5.538496971130371, "global_step": 32369, "epoch": 770} {"train_loss": -5.575433731079102, "global_step": 32370, "epoch": 770} {"train_loss": -5.464958190917969, "global_step": 32371, "epoch": 770} {"train_loss": -5.6703338623046875, "global_step": 32372, "epoch": 770} {"train_loss": -5.620186805725098, "global_step": 32373, "epoch": 770} {"train_loss": -5.538002967834473, "global_step": 32374, "epoch": 770} {"train_loss": -5.579875946044922, "global_step": 32375, "epoch": 770} {"train_loss": -5.568528175354004, "global_step": 32376, "epoch": 770} {"train_loss": -5.3979692459106445, "global_step": 32377, "epoch": 770} {"train_loss": -5.586050987243652, "global_step": 32378, "epoch": 770} {"train_loss": -5.3982343673706055, "global_step": 32379, "epoch": 770} {"train_loss": -5.406146049499512, "global_step": 32380, "epoch": 770} {"train_loss": -5.511592104321434, "global_step": 32381, "epoch": 770, "val_loss": 62978.9453125} {"train_loss": -5.586749076843262, "global_step": 32382, "epoch": 771} {"train_loss": -5.554173469543457, "global_step": 32383, "epoch": 771} {"train_loss": -5.540392875671387, "global_step": 32384, "epoch": 771} {"train_loss": -5.455814361572266, "global_step": 32385, "epoch": 771} {"train_loss": -5.485379219055176, "global_step": 32386, "epoch": 771} {"train_loss": -5.438558578491211, "global_step": 32387, "epoch": 771} {"train_loss": -5.406946182250977, "global_step": 32388, "epoch": 771} {"train_loss": -5.402829170227051, "global_step": 32389, "epoch": 771} {"train_loss": -5.506621360778809, "global_step": 32390, "epoch": 771} {"train_loss": -5.594486236572266, "global_step": 32391, "epoch": 771} {"train_loss": -5.753787040710449, "global_step": 32392, "epoch": 771} {"train_loss": -5.5525288581848145, "global_step": 32393, "epoch": 771} {"train_loss": -5.638349533081055, "global_step": 32394, "epoch": 771} {"train_loss": -5.487878322601318, "global_step": 32395, "epoch": 771} {"train_loss": -5.379847526550293, "global_step": 32396, "epoch": 771} {"train_loss": -5.677905559539795, "global_step": 32397, "epoch": 771} {"train_loss": -5.710643768310547, "global_step": 32398, "epoch": 771} {"train_loss": -5.499728202819824, "global_step": 32399, "epoch": 771} {"train_loss": -5.4632039070129395, "global_step": 32400, "epoch": 771} {"train_loss": -5.417552471160889, "global_step": 32401, "epoch": 771} {"train_loss": -5.539205551147461, "global_step": 32402, "epoch": 771} {"train_loss": -5.569893836975098, "global_step": 32403, "epoch": 771} {"train_loss": -5.533576011657715, "global_step": 32404, "epoch": 771} {"train_loss": -5.487703800201416, "global_step": 32405, "epoch": 771} {"train_loss": -5.449128150939941, "global_step": 32406, "epoch": 771} {"train_loss": -5.298050403594971, "global_step": 32407, "epoch": 771} {"train_loss": -5.529687881469727, "global_step": 32408, "epoch": 771} {"train_loss": -5.4262471199035645, "global_step": 32409, "epoch": 771} {"train_loss": -5.525676727294922, "global_step": 32410, "epoch": 771} {"train_loss": -5.651905059814453, "global_step": 32411, "epoch": 771} {"train_loss": -5.418434143066406, "global_step": 32412, "epoch": 771} {"train_loss": -5.539475440979004, "global_step": 32413, "epoch": 771} {"train_loss": -5.482490062713623, "global_step": 32414, "epoch": 771} {"train_loss": -5.5214385986328125, "global_step": 32415, "epoch": 771} {"train_loss": -5.5128679275512695, "global_step": 32416, "epoch": 771} {"train_loss": -5.502407073974609, "global_step": 32417, "epoch": 771} {"train_loss": -5.636384010314941, "global_step": 32418, "epoch": 771} {"train_loss": -5.4646406173706055, "global_step": 32419, "epoch": 771} {"train_loss": -5.523148536682129, "global_step": 32420, "epoch": 771} {"train_loss": -5.505829811096191, "global_step": 32421, "epoch": 771} {"train_loss": -5.521634101867676, "global_step": 32422, "epoch": 771} {"train_loss": -5.518441313789005, "global_step": 32423, "epoch": 771, "val_loss": 63035.36328125} {"train_loss": -5.510030746459961, "global_step": 32424, "epoch": 772} {"train_loss": -5.465576648712158, "global_step": 32425, "epoch": 772} {"train_loss": -5.506635665893555, "global_step": 32426, "epoch": 772} {"train_loss": -5.4110260009765625, "global_step": 32427, "epoch": 772} {"train_loss": -5.623772621154785, "global_step": 32428, "epoch": 772} {"train_loss": -5.644048690795898, "global_step": 32429, "epoch": 772} {"train_loss": -5.40630578994751, "global_step": 32430, "epoch": 772} {"train_loss": -5.570091247558594, "global_step": 32431, "epoch": 772} {"train_loss": -5.605110168457031, "global_step": 32432, "epoch": 772} {"train_loss": -5.618753433227539, "global_step": 32433, "epoch": 772} {"train_loss": -5.480087757110596, "global_step": 32434, "epoch": 772} {"train_loss": -5.647964954376221, "global_step": 32435, "epoch": 772} {"train_loss": -5.497829437255859, "global_step": 32436, "epoch": 772} {"train_loss": -5.629943370819092, "global_step": 32437, "epoch": 772} {"train_loss": -5.375088691711426, "global_step": 32438, "epoch": 772} {"train_loss": -5.535892486572266, "global_step": 32439, "epoch": 772} {"train_loss": -5.485600471496582, "global_step": 32440, "epoch": 772} {"train_loss": -5.516716957092285, "global_step": 32441, "epoch": 772} {"train_loss": -5.596774101257324, "global_step": 32442, "epoch": 772} {"train_loss": -5.4889631271362305, "global_step": 32443, "epoch": 772} {"train_loss": -5.616629600524902, "global_step": 32444, "epoch": 772} {"train_loss": -5.650227069854736, "global_step": 32445, "epoch": 772} {"train_loss": -5.4401044845581055, "global_step": 32446, "epoch": 772} {"train_loss": -5.5634918212890625, "global_step": 32447, "epoch": 772} {"train_loss": -5.547855854034424, "global_step": 32448, "epoch": 772} {"train_loss": -5.467423439025879, "global_step": 32449, "epoch": 772} {"train_loss": -5.52346134185791, "global_step": 32450, "epoch": 772} {"train_loss": -5.531399250030518, "global_step": 32451, "epoch": 772} {"train_loss": -5.54934024810791, "global_step": 32452, "epoch": 772} {"train_loss": -5.433671474456787, "global_step": 32453, "epoch": 772} {"train_loss": -5.475738525390625, "global_step": 32454, "epoch": 772} {"train_loss": -5.478819847106934, "global_step": 32455, "epoch": 772} {"train_loss": -5.494547367095947, "global_step": 32456, "epoch": 772} {"train_loss": -5.506495952606201, "global_step": 32457, "epoch": 772} {"train_loss": -5.526034832000732, "global_step": 32458, "epoch": 772} {"train_loss": -5.5609893798828125, "global_step": 32459, "epoch": 772} {"train_loss": -5.471277713775635, "global_step": 32460, "epoch": 772} {"train_loss": -5.500068187713623, "global_step": 32461, "epoch": 772} {"train_loss": -5.562455654144287, "global_step": 32462, "epoch": 772} {"train_loss": -5.468681335449219, "global_step": 32463, "epoch": 772} {"train_loss": -5.607366561889648, "global_step": 32464, "epoch": 772} {"train_loss": -5.525592803955078, "global_step": 32465, "epoch": 772, "val_loss": 62910.38671875} {"train_loss": -5.569921970367432, "global_step": 32466, "epoch": 773} {"train_loss": -5.62859582901001, "global_step": 32467, "epoch": 773} {"train_loss": -5.566773414611816, "global_step": 32468, "epoch": 773} {"train_loss": -5.470834732055664, "global_step": 32469, "epoch": 773} {"train_loss": -5.378653526306152, "global_step": 32470, "epoch": 773} {"train_loss": -5.536938667297363, "global_step": 32471, "epoch": 773} {"train_loss": -5.559451103210449, "global_step": 32472, "epoch": 773} {"train_loss": -5.419236183166504, "global_step": 32473, "epoch": 773} {"train_loss": -5.525712490081787, "global_step": 32474, "epoch": 773} {"train_loss": -5.63162899017334, "global_step": 32475, "epoch": 773} {"train_loss": -5.405777454376221, "global_step": 32476, "epoch": 773} {"train_loss": -5.438429355621338, "global_step": 32477, "epoch": 773} {"train_loss": -5.443665504455566, "global_step": 32478, "epoch": 773} {"train_loss": -5.446704864501953, "global_step": 32479, "epoch": 773} {"train_loss": -5.430713176727295, "global_step": 32480, "epoch": 773} {"train_loss": -5.378567218780518, "global_step": 32481, "epoch": 773} {"train_loss": -5.480493545532227, "global_step": 32482, "epoch": 773} {"train_loss": -5.450954437255859, "global_step": 32483, "epoch": 773} {"train_loss": -5.371849060058594, "global_step": 32484, "epoch": 773} {"train_loss": -5.4683966636657715, "global_step": 32485, "epoch": 773} {"train_loss": -5.4802398681640625, "global_step": 32486, "epoch": 773} {"train_loss": -5.434762954711914, "global_step": 32487, "epoch": 773} {"train_loss": -5.679805755615234, "global_step": 32488, "epoch": 773} {"train_loss": -5.488587379455566, "global_step": 32489, "epoch": 773} {"train_loss": -5.579648971557617, "global_step": 32490, "epoch": 773} {"train_loss": -5.499843120574951, "global_step": 32491, "epoch": 773} {"train_loss": -5.506701469421387, "global_step": 32492, "epoch": 773} {"train_loss": -5.419325351715088, "global_step": 32493, "epoch": 773} {"train_loss": -5.478902816772461, "global_step": 32494, "epoch": 773} {"train_loss": -5.612232208251953, "global_step": 32495, "epoch": 773} {"train_loss": -5.554614543914795, "global_step": 32496, "epoch": 773} {"train_loss": -5.567926406860352, "global_step": 32497, "epoch": 773} {"train_loss": -5.427697658538818, "global_step": 32498, "epoch": 773} {"train_loss": -5.435867786407471, "global_step": 32499, "epoch": 773} {"train_loss": -5.499856948852539, "global_step": 32500, "epoch": 773} {"train_loss": -5.550174713134766, "global_step": 32501, "epoch": 773} {"train_loss": -5.52454948425293, "global_step": 32502, "epoch": 773} {"train_loss": -5.52171516418457, "global_step": 32503, "epoch": 773} {"train_loss": -5.480806350708008, "global_step": 32504, "epoch": 773} {"train_loss": -5.711711883544922, "global_step": 32505, "epoch": 773} {"train_loss": -5.6007080078125, "global_step": 32506, "epoch": 773} {"train_loss": -5.502923511323475, "global_step": 32507, "epoch": 773, "val_loss": 62890.609375} {"train_loss": -5.462055206298828, "global_step": 32508, "epoch": 774} {"train_loss": -5.45005989074707, "global_step": 32509, "epoch": 774} {"train_loss": -5.541972637176514, "global_step": 32510, "epoch": 774} {"train_loss": -5.459556579589844, "global_step": 32511, "epoch": 774} {"train_loss": -5.4230194091796875, "global_step": 32512, "epoch": 774} {"train_loss": -5.468221664428711, "global_step": 32513, "epoch": 774} {"train_loss": -5.569493293762207, "global_step": 32514, "epoch": 774} {"train_loss": -5.674107074737549, "global_step": 32515, "epoch": 774} {"train_loss": -5.559152126312256, "global_step": 32516, "epoch": 774} {"train_loss": -5.470756530761719, "global_step": 32517, "epoch": 774} {"train_loss": -5.540244102478027, "global_step": 32518, "epoch": 774} {"train_loss": -5.6619873046875, "global_step": 32519, "epoch": 774} {"train_loss": -5.578977584838867, "global_step": 32520, "epoch": 774} {"train_loss": -5.378289222717285, "global_step": 32521, "epoch": 774} {"train_loss": -5.634683132171631, "global_step": 32522, "epoch": 774} {"train_loss": -5.5062456130981445, "global_step": 32523, "epoch": 774} {"train_loss": -5.508494853973389, "global_step": 32524, "epoch": 774} {"train_loss": -5.397503852844238, "global_step": 32525, "epoch": 774} {"train_loss": -5.403414249420166, "global_step": 32526, "epoch": 774} {"train_loss": -5.576173305511475, "global_step": 32527, "epoch": 774} {"train_loss": -5.5374908447265625, "global_step": 32528, "epoch": 774} {"train_loss": -5.608373165130615, "global_step": 32529, "epoch": 774} {"train_loss": -5.404444694519043, "global_step": 32530, "epoch": 774} {"train_loss": -5.709864616394043, "global_step": 32531, "epoch": 774} {"train_loss": -5.434859752655029, "global_step": 32532, "epoch": 774} {"train_loss": -5.557798385620117, "global_step": 32533, "epoch": 774} {"train_loss": -5.613961219787598, "global_step": 32534, "epoch": 774} {"train_loss": -5.584236145019531, "global_step": 32535, "epoch": 774} {"train_loss": -5.631908893585205, "global_step": 32536, "epoch": 774} {"train_loss": -5.6730475425720215, "global_step": 32537, "epoch": 774} {"train_loss": -5.519173622131348, "global_step": 32538, "epoch": 774} {"train_loss": -5.58089542388916, "global_step": 32539, "epoch": 774} {"train_loss": -5.528390884399414, "global_step": 32540, "epoch": 774} {"train_loss": -5.500494480133057, "global_step": 32541, "epoch": 774} {"train_loss": -5.574763298034668, "global_step": 32542, "epoch": 774} {"train_loss": -5.463367938995361, "global_step": 32543, "epoch": 774} {"train_loss": -5.492661952972412, "global_step": 32544, "epoch": 774} {"train_loss": -5.638394355773926, "global_step": 32545, "epoch": 774} {"train_loss": -5.484706878662109, "global_step": 32546, "epoch": 774} {"train_loss": -5.533298492431641, "global_step": 32547, "epoch": 774} {"train_loss": -5.5142436027526855, "global_step": 32548, "epoch": 774} {"train_loss": -5.530110120773315, "global_step": 32549, "epoch": 774, "val_loss": 63061.99609375} {"train_loss": -5.504126071929932, "global_step": 32550, "epoch": 775} {"train_loss": -5.532118320465088, "global_step": 32551, "epoch": 775} {"train_loss": -5.291552543640137, "global_step": 32552, "epoch": 775} {"train_loss": -5.463142395019531, "global_step": 32553, "epoch": 775} {"train_loss": -5.467616081237793, "global_step": 32554, "epoch": 775} {"train_loss": -5.500246047973633, "global_step": 32555, "epoch": 775} {"train_loss": -5.614360809326172, "global_step": 32556, "epoch": 775} {"train_loss": -5.492129325866699, "global_step": 32557, "epoch": 775} {"train_loss": -5.537596702575684, "global_step": 32558, "epoch": 775} {"train_loss": -5.439890384674072, "global_step": 32559, "epoch": 775} {"train_loss": -5.51492977142334, "global_step": 32560, "epoch": 775} {"train_loss": -5.496152877807617, "global_step": 32561, "epoch": 775} {"train_loss": -5.5205254554748535, "global_step": 32562, "epoch": 775} {"train_loss": -5.522436141967773, "global_step": 32563, "epoch": 775} {"train_loss": -5.508535861968994, "global_step": 32564, "epoch": 775} {"train_loss": -5.553121566772461, "global_step": 32565, "epoch": 775} {"train_loss": -5.331812381744385, "global_step": 32566, "epoch": 775} {"train_loss": -5.57242488861084, "global_step": 32567, "epoch": 775} {"train_loss": -5.504973411560059, "global_step": 32568, "epoch": 775} {"train_loss": -5.419316291809082, "global_step": 32569, "epoch": 775} {"train_loss": -5.362821578979492, "global_step": 32570, "epoch": 775} {"train_loss": -5.557843208312988, "global_step": 32571, "epoch": 775} {"train_loss": -5.506003379821777, "global_step": 32572, "epoch": 775} {"train_loss": -5.501584053039551, "global_step": 32573, "epoch": 775} {"train_loss": -5.487644195556641, "global_step": 32574, "epoch": 775} {"train_loss": -5.388305187225342, "global_step": 32575, "epoch": 775} {"train_loss": -5.644867420196533, "global_step": 32576, "epoch": 775} {"train_loss": -5.432674407958984, "global_step": 32577, "epoch": 775} {"train_loss": -5.588756084442139, "global_step": 32578, "epoch": 775} {"train_loss": -5.536424160003662, "global_step": 32579, "epoch": 775} {"train_loss": -5.535635948181152, "global_step": 32580, "epoch": 775} {"train_loss": -5.486257553100586, "global_step": 32581, "epoch": 775} {"train_loss": -5.553167343139648, "global_step": 32582, "epoch": 775} {"train_loss": -5.472067356109619, "global_step": 32583, "epoch": 775} {"train_loss": -5.540557861328125, "global_step": 32584, "epoch": 775} {"train_loss": -5.638426780700684, "global_step": 32585, "epoch": 775} {"train_loss": -5.4560956954956055, "global_step": 32586, "epoch": 775} {"train_loss": -5.601840019226074, "global_step": 32587, "epoch": 775} {"train_loss": -5.537110805511475, "global_step": 32588, "epoch": 775} {"train_loss": -5.420358657836914, "global_step": 32589, "epoch": 775} {"train_loss": -5.632533073425293, "global_step": 32590, "epoch": 775} {"train_loss": -5.505598942438762, "global_step": 32591, "epoch": 775, "val_loss": 62892.3125} {"train_loss": -5.4357428550720215, "global_step": 32592, "epoch": 776} {"train_loss": -5.464759349822998, "global_step": 32593, "epoch": 776} {"train_loss": -5.364214897155762, "global_step": 32594, "epoch": 776} {"train_loss": -5.527259349822998, "global_step": 32595, "epoch": 776} {"train_loss": -5.508035182952881, "global_step": 32596, "epoch": 776} {"train_loss": -5.362495422363281, "global_step": 32597, "epoch": 776} {"train_loss": -5.4695963859558105, "global_step": 32598, "epoch": 776} {"train_loss": -5.485396385192871, "global_step": 32599, "epoch": 776} {"train_loss": -5.57049560546875, "global_step": 32600, "epoch": 776} {"train_loss": -5.511073112487793, "global_step": 32601, "epoch": 776} {"train_loss": -5.479207992553711, "global_step": 32602, "epoch": 776} {"train_loss": -5.393536567687988, "global_step": 32603, "epoch": 776} {"train_loss": -5.510585784912109, "global_step": 32604, "epoch": 776} {"train_loss": -5.702369689941406, "global_step": 32605, "epoch": 776} {"train_loss": -5.456063270568848, "global_step": 32606, "epoch": 776} {"train_loss": -5.528980255126953, "global_step": 32607, "epoch": 776} {"train_loss": -5.421025276184082, "global_step": 32608, "epoch": 776} {"train_loss": -5.536925792694092, "global_step": 32609, "epoch": 776} {"train_loss": -5.543344497680664, "global_step": 32610, "epoch": 776} {"train_loss": -5.449390411376953, "global_step": 32611, "epoch": 776} {"train_loss": -5.600925922393799, "global_step": 32612, "epoch": 776} {"train_loss": -5.561656951904297, "global_step": 32613, "epoch": 776} {"train_loss": -5.479521751403809, "global_step": 32614, "epoch": 776} {"train_loss": -5.604918479919434, "global_step": 32615, "epoch": 776} {"train_loss": -5.494874954223633, "global_step": 32616, "epoch": 776} {"train_loss": -5.5388689041137695, "global_step": 32617, "epoch": 776} {"train_loss": -5.639718055725098, "global_step": 32618, "epoch": 776} {"train_loss": -5.460278511047363, "global_step": 32619, "epoch": 776} {"train_loss": -5.433744430541992, "global_step": 32620, "epoch": 776} {"train_loss": -5.562561988830566, "global_step": 32621, "epoch": 776} {"train_loss": -5.489423751831055, "global_step": 32622, "epoch": 776} {"train_loss": -5.435766220092773, "global_step": 32623, "epoch": 776} {"train_loss": -5.596576690673828, "global_step": 32624, "epoch": 776} {"train_loss": -5.5853590965271, "global_step": 32625, "epoch": 776} {"train_loss": -5.636857986450195, "global_step": 32626, "epoch": 776} {"train_loss": -5.577144622802734, "global_step": 32627, "epoch": 776} {"train_loss": -5.450418472290039, "global_step": 32628, "epoch": 776} {"train_loss": -5.616735935211182, "global_step": 32629, "epoch": 776} {"train_loss": -5.493496894836426, "global_step": 32630, "epoch": 776} {"train_loss": -5.5490336418151855, "global_step": 32631, "epoch": 776} {"train_loss": -5.504242897033691, "global_step": 32632, "epoch": 776} {"train_loss": -5.513510011491322, "global_step": 32633, "epoch": 776, "val_loss": 63096.65234375} {"train_loss": -5.6567535400390625, "global_step": 32634, "epoch": 777} {"train_loss": -5.513577938079834, "global_step": 32635, "epoch": 777} {"train_loss": -5.481338024139404, "global_step": 32636, "epoch": 777} {"train_loss": -5.446026802062988, "global_step": 32637, "epoch": 777} {"train_loss": -5.419246673583984, "global_step": 32638, "epoch": 777} {"train_loss": -5.564565181732178, "global_step": 32639, "epoch": 777} {"train_loss": -5.422782897949219, "global_step": 32640, "epoch": 777} {"train_loss": -5.459038257598877, "global_step": 32641, "epoch": 777} {"train_loss": -5.495495796203613, "global_step": 32642, "epoch": 777} {"train_loss": -5.522489547729492, "global_step": 32643, "epoch": 777} {"train_loss": -5.512822151184082, "global_step": 32644, "epoch": 777} {"train_loss": -5.640296936035156, "global_step": 32645, "epoch": 777} {"train_loss": -5.358644008636475, "global_step": 32646, "epoch": 777} {"train_loss": -5.462813377380371, "global_step": 32647, "epoch": 777} {"train_loss": -5.527270317077637, "global_step": 32648, "epoch": 777} {"train_loss": -5.434844970703125, "global_step": 32649, "epoch": 777} {"train_loss": -5.555389881134033, "global_step": 32650, "epoch": 777} {"train_loss": -5.444443702697754, "global_step": 32651, "epoch": 777} {"train_loss": -5.390995979309082, "global_step": 32652, "epoch": 777} {"train_loss": -5.454463958740234, "global_step": 32653, "epoch": 777} {"train_loss": -5.3978071212768555, "global_step": 32654, "epoch": 777} {"train_loss": -5.596278190612793, "global_step": 32655, "epoch": 777} {"train_loss": -5.555612564086914, "global_step": 32656, "epoch": 777} {"train_loss": -5.582422256469727, "global_step": 32657, "epoch": 777} {"train_loss": -5.606470584869385, "global_step": 32658, "epoch": 777} {"train_loss": -5.354251384735107, "global_step": 32659, "epoch": 777} {"train_loss": -5.5261454582214355, "global_step": 32660, "epoch": 777} {"train_loss": -5.601894378662109, "global_step": 32661, "epoch": 777} {"train_loss": -5.555499076843262, "global_step": 32662, "epoch": 777} {"train_loss": -5.550175189971924, "global_step": 32663, "epoch": 777} {"train_loss": -5.580695152282715, "global_step": 32664, "epoch": 777} {"train_loss": -5.535642147064209, "global_step": 32665, "epoch": 777} {"train_loss": -5.439963340759277, "global_step": 32666, "epoch": 777} {"train_loss": -5.610053062438965, "global_step": 32667, "epoch": 777} {"train_loss": -5.6333112716674805, "global_step": 32668, "epoch": 777} {"train_loss": -5.613759994506836, "global_step": 32669, "epoch": 777} {"train_loss": -5.53023624420166, "global_step": 32670, "epoch": 777} {"train_loss": -5.453900337219238, "global_step": 32671, "epoch": 777} {"train_loss": -5.533963203430176, "global_step": 32672, "epoch": 777} {"train_loss": -5.409670352935791, "global_step": 32673, "epoch": 777} {"train_loss": -5.533028602600098, "global_step": 32674, "epoch": 777} {"train_loss": -5.510871705554781, "global_step": 32675, "epoch": 777, "val_loss": 63073.26953125} {"train_loss": -5.439400672912598, "global_step": 32676, "epoch": 778} {"train_loss": -5.616015434265137, "global_step": 32677, "epoch": 778} {"train_loss": -5.476885795593262, "global_step": 32678, "epoch": 778} {"train_loss": -5.473770618438721, "global_step": 32679, "epoch": 778} {"train_loss": -5.436321258544922, "global_step": 32680, "epoch": 778} {"train_loss": -5.573659896850586, "global_step": 32681, "epoch": 778} {"train_loss": -5.5067138671875, "global_step": 32682, "epoch": 778} {"train_loss": -5.582034587860107, "global_step": 32683, "epoch": 778} {"train_loss": -5.644096374511719, "global_step": 32684, "epoch": 778} {"train_loss": -5.355039596557617, "global_step": 32685, "epoch": 778} {"train_loss": -5.4018073081970215, "global_step": 32686, "epoch": 778} {"train_loss": -5.438011646270752, "global_step": 32687, "epoch": 778} {"train_loss": -5.391892433166504, "global_step": 32688, "epoch": 778} {"train_loss": -5.4988627433776855, "global_step": 32689, "epoch": 778} {"train_loss": -5.452798843383789, "global_step": 32690, "epoch": 778} {"train_loss": -5.350414276123047, "global_step": 32691, "epoch": 778} {"train_loss": -5.600869178771973, "global_step": 32692, "epoch": 778} {"train_loss": -5.435461044311523, "global_step": 32693, "epoch": 778} {"train_loss": -5.476968288421631, "global_step": 32694, "epoch": 778} {"train_loss": -5.458953857421875, "global_step": 32695, "epoch": 778} {"train_loss": -5.295188903808594, "global_step": 32696, "epoch": 778} {"train_loss": -5.64202880859375, "global_step": 32697, "epoch": 778} {"train_loss": -5.5118513107299805, "global_step": 32698, "epoch": 778} {"train_loss": -5.5029401779174805, "global_step": 32699, "epoch": 778} {"train_loss": -5.537819862365723, "global_step": 32700, "epoch": 778} {"train_loss": -5.502073287963867, "global_step": 32701, "epoch": 778} {"train_loss": -5.445240020751953, "global_step": 32702, "epoch": 778} {"train_loss": -5.513718128204346, "global_step": 32703, "epoch": 778} {"train_loss": -5.6013593673706055, "global_step": 32704, "epoch": 778} {"train_loss": -5.56069278717041, "global_step": 32705, "epoch": 778} {"train_loss": -5.442540168762207, "global_step": 32706, "epoch": 778} {"train_loss": -5.596671104431152, "global_step": 32707, "epoch": 778} {"train_loss": -5.475341796875, "global_step": 32708, "epoch": 778} {"train_loss": -5.402059078216553, "global_step": 32709, "epoch": 778} {"train_loss": -5.614323139190674, "global_step": 32710, "epoch": 778} {"train_loss": -5.490659713745117, "global_step": 32711, "epoch": 778} {"train_loss": -5.454204559326172, "global_step": 32712, "epoch": 778} {"train_loss": -5.434168815612793, "global_step": 32713, "epoch": 778} {"train_loss": -5.584342956542969, "global_step": 32714, "epoch": 778} {"train_loss": -5.471026420593262, "global_step": 32715, "epoch": 778} {"train_loss": -5.478293418884277, "global_step": 32716, "epoch": 778} {"train_loss": -5.4927581037793844, "global_step": 32717, "epoch": 778, "val_loss": 63692.77734375} {"train_loss": -5.2719807624816895, "global_step": 32718, "epoch": 779} {"train_loss": -5.442269325256348, "global_step": 32719, "epoch": 779} {"train_loss": -5.501200199127197, "global_step": 32720, "epoch": 779} {"train_loss": -5.405148029327393, "global_step": 32721, "epoch": 779} {"train_loss": -5.5688886642456055, "global_step": 32722, "epoch": 779} {"train_loss": -5.530788421630859, "global_step": 32723, "epoch": 779} {"train_loss": -5.4794111251831055, "global_step": 32724, "epoch": 779} {"train_loss": -5.366527557373047, "global_step": 32725, "epoch": 779} {"train_loss": -5.422508716583252, "global_step": 32726, "epoch": 779} {"train_loss": -5.4983062744140625, "global_step": 32727, "epoch": 779} {"train_loss": -5.418676376342773, "global_step": 32728, "epoch": 779} {"train_loss": -5.575589656829834, "global_step": 32729, "epoch": 779} {"train_loss": -5.492063045501709, "global_step": 32730, "epoch": 779} {"train_loss": -5.509427547454834, "global_step": 32731, "epoch": 779} {"train_loss": -5.405355453491211, "global_step": 32732, "epoch": 779} {"train_loss": -5.591158866882324, "global_step": 32733, "epoch": 779} {"train_loss": -5.444174766540527, "global_step": 32734, "epoch": 779} {"train_loss": -5.454705715179443, "global_step": 32735, "epoch": 779} {"train_loss": -5.562405586242676, "global_step": 32736, "epoch": 779} {"train_loss": -5.518765449523926, "global_step": 32737, "epoch": 779} {"train_loss": -5.495939254760742, "global_step": 32738, "epoch": 779} {"train_loss": -5.380260944366455, "global_step": 32739, "epoch": 779} {"train_loss": -5.539092063903809, "global_step": 32740, "epoch": 779} {"train_loss": -5.59909725189209, "global_step": 32741, "epoch": 779} {"train_loss": -5.540890693664551, "global_step": 32742, "epoch": 779} {"train_loss": -5.575549602508545, "global_step": 32743, "epoch": 779} {"train_loss": -5.5463056564331055, "global_step": 32744, "epoch": 779} {"train_loss": -5.496181011199951, "global_step": 32745, "epoch": 779} {"train_loss": -5.475734710693359, "global_step": 32746, "epoch": 779} {"train_loss": -5.500431060791016, "global_step": 32747, "epoch": 779} {"train_loss": -5.435149192810059, "global_step": 32748, "epoch": 779} {"train_loss": -5.454231262207031, "global_step": 32749, "epoch": 779} {"train_loss": -5.545929908752441, "global_step": 32750, "epoch": 779} {"train_loss": -5.388815402984619, "global_step": 32751, "epoch": 779} {"train_loss": -5.436701774597168, "global_step": 32752, "epoch": 779} {"train_loss": -5.590629577636719, "global_step": 32753, "epoch": 779} {"train_loss": -5.449253082275391, "global_step": 32754, "epoch": 779} {"train_loss": -5.398722171783447, "global_step": 32755, "epoch": 779} {"train_loss": -5.590748310089111, "global_step": 32756, "epoch": 779} {"train_loss": -5.660738945007324, "global_step": 32757, "epoch": 779} {"train_loss": -5.560086250305176, "global_step": 32758, "epoch": 779} {"train_loss": -5.488995109285627, "global_step": 32759, "epoch": 779, "val_loss": 62998.52734375} {"train_loss": -5.454073905944824, "global_step": 32760, "epoch": 780} {"train_loss": -5.561983585357666, "global_step": 32761, "epoch": 780} {"train_loss": -5.475454330444336, "global_step": 32762, "epoch": 780} {"train_loss": -5.5785112380981445, "global_step": 32763, "epoch": 780} {"train_loss": -5.579395294189453, "global_step": 32764, "epoch": 780} {"train_loss": -5.535335540771484, "global_step": 32765, "epoch": 780} {"train_loss": -5.404347896575928, "global_step": 32766, "epoch": 780} {"train_loss": -5.475359916687012, "global_step": 32767, "epoch": 780} {"train_loss": -5.60693359375, "global_step": 32768, "epoch": 780} {"train_loss": -5.503044128417969, "global_step": 32769, "epoch": 780} {"train_loss": -5.421750068664551, "global_step": 32770, "epoch": 780} {"train_loss": -5.508967876434326, "global_step": 32771, "epoch": 780} {"train_loss": -5.541990280151367, "global_step": 32772, "epoch": 780} {"train_loss": -5.616389751434326, "global_step": 32773, "epoch": 780} {"train_loss": -5.648637771606445, "global_step": 32774, "epoch": 780} {"train_loss": -5.536844253540039, "global_step": 32775, "epoch": 780} {"train_loss": -5.595081329345703, "global_step": 32776, "epoch": 780} {"train_loss": -5.461205959320068, "global_step": 32777, "epoch": 780} {"train_loss": -5.517148971557617, "global_step": 32778, "epoch": 780} {"train_loss": -5.561635971069336, "global_step": 32779, "epoch": 780} {"train_loss": -5.724740028381348, "global_step": 32780, "epoch": 780} {"train_loss": -5.609165668487549, "global_step": 32781, "epoch": 780} {"train_loss": -5.557894706726074, "global_step": 32782, "epoch": 780} {"train_loss": -5.398051738739014, "global_step": 32783, "epoch": 780} {"train_loss": -5.479887008666992, "global_step": 32784, "epoch": 780} {"train_loss": -5.541045665740967, "global_step": 32785, "epoch": 780} {"train_loss": -5.656169891357422, "global_step": 32786, "epoch": 780} {"train_loss": -5.480930328369141, "global_step": 32787, "epoch": 780} {"train_loss": -5.57881498336792, "global_step": 32788, "epoch": 780} {"train_loss": -5.697248458862305, "global_step": 32789, "epoch": 780} {"train_loss": -5.491721153259277, "global_step": 32790, "epoch": 780} {"train_loss": -5.465890884399414, "global_step": 32791, "epoch": 780} {"train_loss": -5.600989818572998, "global_step": 32792, "epoch": 780} {"train_loss": -5.512432098388672, "global_step": 32793, "epoch": 780} {"train_loss": -5.461036205291748, "global_step": 32794, "epoch": 780} {"train_loss": -5.588326454162598, "global_step": 32795, "epoch": 780} {"train_loss": -5.598763465881348, "global_step": 32796, "epoch": 780} {"train_loss": -5.442364692687988, "global_step": 32797, "epoch": 780} {"train_loss": -5.48426628112793, "global_step": 32798, "epoch": 780} {"train_loss": -5.50943660736084, "global_step": 32799, "epoch": 780} {"train_loss": -5.5315022468566895, "global_step": 32800, "epoch": 780} {"train_loss": -5.537661949793498, "global_step": 32801, "epoch": 780, "val_loss": 62558.06640625} {"train_loss": -5.502693176269531, "global_step": 32802, "epoch": 781} {"train_loss": -5.458409309387207, "global_step": 32803, "epoch": 781} {"train_loss": -5.441122055053711, "global_step": 32804, "epoch": 781} {"train_loss": -5.605186462402344, "global_step": 32805, "epoch": 781} {"train_loss": -5.579285621643066, "global_step": 32806, "epoch": 781} {"train_loss": -5.404117584228516, "global_step": 32807, "epoch": 781} {"train_loss": -5.4661865234375, "global_step": 32808, "epoch": 781} {"train_loss": -5.569867134094238, "global_step": 32809, "epoch": 781} {"train_loss": -5.610528469085693, "global_step": 32810, "epoch": 781} {"train_loss": -5.579017639160156, "global_step": 32811, "epoch": 781} {"train_loss": -5.5429182052612305, "global_step": 32812, "epoch": 781} {"train_loss": -5.5161542892456055, "global_step": 32813, "epoch": 781} {"train_loss": -5.562945365905762, "global_step": 32814, "epoch": 781} {"train_loss": -5.549221515655518, "global_step": 32815, "epoch": 781} {"train_loss": -5.562678813934326, "global_step": 32816, "epoch": 781} {"train_loss": -5.48146915435791, "global_step": 32817, "epoch": 781} {"train_loss": -5.5851922035217285, "global_step": 32818, "epoch": 781} {"train_loss": -5.5377631187438965, "global_step": 32819, "epoch": 781} {"train_loss": -5.505892753601074, "global_step": 32820, "epoch": 781} {"train_loss": -5.485175609588623, "global_step": 32821, "epoch": 781} {"train_loss": -5.559425354003906, "global_step": 32822, "epoch": 781} {"train_loss": -5.659419536590576, "global_step": 32823, "epoch": 781} {"train_loss": -5.496372222900391, "global_step": 32824, "epoch": 781} {"train_loss": -5.435192108154297, "global_step": 32825, "epoch": 781} {"train_loss": -5.55172061920166, "global_step": 32826, "epoch": 781} {"train_loss": -5.595662593841553, "global_step": 32827, "epoch": 781} {"train_loss": -5.434126853942871, "global_step": 32828, "epoch": 781} {"train_loss": -5.498391628265381, "global_step": 32829, "epoch": 781} {"train_loss": -5.5434136390686035, "global_step": 32830, "epoch": 781} {"train_loss": -5.563472270965576, "global_step": 32831, "epoch": 781} {"train_loss": -5.451685905456543, "global_step": 32832, "epoch": 781} {"train_loss": -5.577288627624512, "global_step": 32833, "epoch": 781} {"train_loss": -5.520454406738281, "global_step": 32834, "epoch": 781} {"train_loss": -5.452906608581543, "global_step": 32835, "epoch": 781} {"train_loss": -5.567086696624756, "global_step": 32836, "epoch": 781} {"train_loss": -5.503256797790527, "global_step": 32837, "epoch": 781} {"train_loss": -5.440828323364258, "global_step": 32838, "epoch": 781} {"train_loss": -5.468398094177246, "global_step": 32839, "epoch": 781} {"train_loss": -5.33676815032959, "global_step": 32840, "epoch": 781} {"train_loss": -5.480010986328125, "global_step": 32841, "epoch": 781} {"train_loss": -5.528068542480469, "global_step": 32842, "epoch": 781} {"train_loss": -5.5142365637279696, "global_step": 32843, "epoch": 781, "val_loss": 62981.4609375} {"train_loss": -5.4094367027282715, "global_step": 32844, "epoch": 782} {"train_loss": -5.4519805908203125, "global_step": 32845, "epoch": 782} {"train_loss": -5.3487443923950195, "global_step": 32846, "epoch": 782} {"train_loss": -5.515000820159912, "global_step": 32847, "epoch": 782} {"train_loss": -5.399655818939209, "global_step": 32848, "epoch": 782} {"train_loss": -5.545557022094727, "global_step": 32849, "epoch": 782} {"train_loss": -5.438786506652832, "global_step": 32850, "epoch": 782} {"train_loss": -5.395795822143555, "global_step": 32851, "epoch": 782} {"train_loss": -5.51315975189209, "global_step": 32852, "epoch": 782} {"train_loss": -5.333677291870117, "global_step": 32853, "epoch": 782} {"train_loss": -5.5004143714904785, "global_step": 32854, "epoch": 782} {"train_loss": -5.444715976715088, "global_step": 32855, "epoch": 782} {"train_loss": -5.630678653717041, "global_step": 32856, "epoch": 782} {"train_loss": -5.5728020668029785, "global_step": 32857, "epoch": 782} {"train_loss": -5.460760116577148, "global_step": 32858, "epoch": 782} {"train_loss": -5.647772789001465, "global_step": 32859, "epoch": 782} {"train_loss": -5.543221473693848, "global_step": 32860, "epoch": 782} {"train_loss": -5.433742523193359, "global_step": 32861, "epoch": 782} {"train_loss": -5.475542068481445, "global_step": 32862, "epoch": 782} {"train_loss": -5.408168792724609, "global_step": 32863, "epoch": 782} {"train_loss": -5.545183181762695, "global_step": 32864, "epoch": 782} {"train_loss": -5.434730529785156, "global_step": 32865, "epoch": 782} {"train_loss": -5.494693756103516, "global_step": 32866, "epoch": 782} {"train_loss": -5.545683860778809, "global_step": 32867, "epoch": 782} {"train_loss": -5.538193702697754, "global_step": 32868, "epoch": 782} {"train_loss": -5.4767351150512695, "global_step": 32869, "epoch": 782} {"train_loss": -5.539954662322998, "global_step": 32870, "epoch": 782} {"train_loss": -5.486459255218506, "global_step": 32871, "epoch": 782} {"train_loss": -5.590915679931641, "global_step": 32872, "epoch": 782} {"train_loss": -5.513547897338867, "global_step": 32873, "epoch": 782} {"train_loss": -5.584378242492676, "global_step": 32874, "epoch": 782} {"train_loss": -5.511709690093994, "global_step": 32875, "epoch": 782} {"train_loss": -5.507251739501953, "global_step": 32876, "epoch": 782} {"train_loss": -5.529301643371582, "global_step": 32877, "epoch": 782} {"train_loss": -5.539522171020508, "global_step": 32878, "epoch": 782} {"train_loss": -5.3979902267456055, "global_step": 32879, "epoch": 782} {"train_loss": -5.470049858093262, "global_step": 32880, "epoch": 782} {"train_loss": -5.518338203430176, "global_step": 32881, "epoch": 782} {"train_loss": -5.509568214416504, "global_step": 32882, "epoch": 782} {"train_loss": -5.557499885559082, "global_step": 32883, "epoch": 782} {"train_loss": -5.463698863983154, "global_step": 32884, "epoch": 782} {"train_loss": -5.491355998175485, "global_step": 32885, "epoch": 782, "val_loss": 62374.5546875} {"train_loss": -5.503508567810059, "global_step": 32886, "epoch": 783} {"train_loss": -5.473492622375488, "global_step": 32887, "epoch": 783} {"train_loss": -5.61695671081543, "global_step": 32888, "epoch": 783} {"train_loss": -5.583272933959961, "global_step": 32889, "epoch": 783} {"train_loss": -5.533540725708008, "global_step": 32890, "epoch": 783} {"train_loss": -5.490854263305664, "global_step": 32891, "epoch": 783} {"train_loss": -5.582939147949219, "global_step": 32892, "epoch": 783} {"train_loss": -5.570197105407715, "global_step": 32893, "epoch": 783} {"train_loss": -5.509037017822266, "global_step": 32894, "epoch": 783} {"train_loss": -5.539233207702637, "global_step": 32895, "epoch": 783} {"train_loss": -5.607604026794434, "global_step": 32896, "epoch": 783} {"train_loss": -5.614336013793945, "global_step": 32897, "epoch": 783} {"train_loss": -5.492907524108887, "global_step": 32898, "epoch": 783} {"train_loss": -5.526787757873535, "global_step": 32899, "epoch": 783} {"train_loss": -5.5337677001953125, "global_step": 32900, "epoch": 783} {"train_loss": -5.61677360534668, "global_step": 32901, "epoch": 783} {"train_loss": -5.416263103485107, "global_step": 32902, "epoch": 783} {"train_loss": -5.557111740112305, "global_step": 32903, "epoch": 783} {"train_loss": -5.5499982833862305, "global_step": 32904, "epoch": 783} {"train_loss": -5.5240678787231445, "global_step": 32905, "epoch": 783} {"train_loss": -5.509033203125, "global_step": 32906, "epoch": 783} {"train_loss": -5.522211074829102, "global_step": 32907, "epoch": 783} {"train_loss": -5.439258098602295, "global_step": 32908, "epoch": 783} {"train_loss": -5.448417663574219, "global_step": 32909, "epoch": 783} {"train_loss": -5.530710220336914, "global_step": 32910, "epoch": 783} {"train_loss": -5.4755964279174805, "global_step": 32911, "epoch": 783} {"train_loss": -5.482921600341797, "global_step": 32912, "epoch": 783} {"train_loss": -5.472038745880127, "global_step": 32913, "epoch": 783} {"train_loss": -5.476651191711426, "global_step": 32914, "epoch": 783} {"train_loss": -5.488927364349365, "global_step": 32915, "epoch": 783} {"train_loss": -5.522157669067383, "global_step": 32916, "epoch": 783} {"train_loss": -5.507391929626465, "global_step": 32917, "epoch": 783} {"train_loss": -5.527976036071777, "global_step": 32918, "epoch": 783} {"train_loss": -5.622130393981934, "global_step": 32919, "epoch": 783} {"train_loss": -5.390434265136719, "global_step": 32920, "epoch": 783} {"train_loss": -5.511804580688477, "global_step": 32921, "epoch": 783} {"train_loss": -5.491621017456055, "global_step": 32922, "epoch": 783} {"train_loss": -5.583489418029785, "global_step": 32923, "epoch": 783} {"train_loss": -5.366472244262695, "global_step": 32924, "epoch": 783} {"train_loss": -5.511337757110596, "global_step": 32925, "epoch": 783} {"train_loss": -5.53195858001709, "global_step": 32926, "epoch": 783} {"train_loss": -5.52262114343189, "global_step": 32927, "epoch": 783, "val_loss": 62783.58984375} {"train_loss": -5.6513776779174805, "global_step": 32928, "epoch": 784} {"train_loss": -5.431565761566162, "global_step": 32929, "epoch": 784} {"train_loss": -5.568894386291504, "global_step": 32930, "epoch": 784} {"train_loss": -5.470095157623291, "global_step": 32931, "epoch": 784} {"train_loss": -5.4871368408203125, "global_step": 32932, "epoch": 784} {"train_loss": -5.447334289550781, "global_step": 32933, "epoch": 784} {"train_loss": -5.619253158569336, "global_step": 32934, "epoch": 784} {"train_loss": -5.550027370452881, "global_step": 32935, "epoch": 784} {"train_loss": -5.563149452209473, "global_step": 32936, "epoch": 784} {"train_loss": -5.592369556427002, "global_step": 32937, "epoch": 784} {"train_loss": -5.496338844299316, "global_step": 32938, "epoch": 784} {"train_loss": -5.488034248352051, "global_step": 32939, "epoch": 784} {"train_loss": -5.5653276443481445, "global_step": 32940, "epoch": 784} {"train_loss": -5.59206485748291, "global_step": 32941, "epoch": 784} {"train_loss": -5.462864875793457, "global_step": 32942, "epoch": 784} {"train_loss": -5.474832534790039, "global_step": 32943, "epoch": 784} {"train_loss": -5.603835105895996, "global_step": 32944, "epoch": 784} {"train_loss": -5.641560077667236, "global_step": 32945, "epoch": 784} {"train_loss": -5.512568473815918, "global_step": 32946, "epoch": 784} {"train_loss": -5.623680114746094, "global_step": 32947, "epoch": 784} {"train_loss": -5.454590797424316, "global_step": 32948, "epoch": 784} {"train_loss": -5.616161346435547, "global_step": 32949, "epoch": 784} {"train_loss": -5.467663764953613, "global_step": 32950, "epoch": 784} {"train_loss": -5.560455322265625, "global_step": 32951, "epoch": 784} {"train_loss": -5.580223083496094, "global_step": 32952, "epoch": 784} {"train_loss": -5.588201522827148, "global_step": 32953, "epoch": 784} {"train_loss": -5.49488639831543, "global_step": 32954, "epoch": 784} {"train_loss": -5.5062479972839355, "global_step": 32955, "epoch": 784} {"train_loss": -5.617682456970215, "global_step": 32956, "epoch": 784} {"train_loss": -5.516299247741699, "global_step": 32957, "epoch": 784} {"train_loss": -5.319957256317139, "global_step": 32958, "epoch": 784} {"train_loss": -5.598980903625488, "global_step": 32959, "epoch": 784} {"train_loss": -5.495790958404541, "global_step": 32960, "epoch": 784} {"train_loss": -5.398014545440674, "global_step": 32961, "epoch": 784} {"train_loss": -5.409255027770996, "global_step": 32962, "epoch": 784} {"train_loss": -5.439847946166992, "global_step": 32963, "epoch": 784} {"train_loss": -5.570061683654785, "global_step": 32964, "epoch": 784} {"train_loss": -5.493749618530273, "global_step": 32965, "epoch": 784} {"train_loss": -5.488544464111328, "global_step": 32966, "epoch": 784} {"train_loss": -5.499328136444092, "global_step": 32967, "epoch": 784} {"train_loss": -5.506938457489014, "global_step": 32968, "epoch": 784} {"train_loss": -5.526234115873065, "global_step": 32969, "epoch": 784, "val_loss": 62921.59375} {"train_loss": -5.4102654457092285, "global_step": 32970, "epoch": 785} {"train_loss": -5.534962177276611, "global_step": 32971, "epoch": 785} {"train_loss": -5.4676833152771, "global_step": 32972, "epoch": 785} {"train_loss": -5.484374046325684, "global_step": 32973, "epoch": 785} {"train_loss": -5.646576881408691, "global_step": 32974, "epoch": 785} {"train_loss": -5.402392387390137, "global_step": 32975, "epoch": 785} {"train_loss": -5.430663108825684, "global_step": 32976, "epoch": 785} {"train_loss": -5.508657932281494, "global_step": 32977, "epoch": 785} {"train_loss": -5.531008720397949, "global_step": 32978, "epoch": 785} {"train_loss": -5.388387203216553, "global_step": 32979, "epoch": 785} {"train_loss": -5.468648910522461, "global_step": 32980, "epoch": 785} {"train_loss": -5.3322272300720215, "global_step": 32981, "epoch": 785} {"train_loss": -5.37379789352417, "global_step": 32982, "epoch": 785} {"train_loss": -5.470558166503906, "global_step": 32983, "epoch": 785} {"train_loss": -5.395964622497559, "global_step": 32984, "epoch": 785} {"train_loss": -5.477762222290039, "global_step": 32985, "epoch": 785} {"train_loss": -5.467705726623535, "global_step": 32986, "epoch": 785} {"train_loss": -5.457929611206055, "global_step": 32987, "epoch": 785} {"train_loss": -5.414557456970215, "global_step": 32988, "epoch": 785} {"train_loss": -5.467065811157227, "global_step": 32989, "epoch": 785} {"train_loss": -5.513736724853516, "global_step": 32990, "epoch": 785} {"train_loss": -5.601354598999023, "global_step": 32991, "epoch": 785} {"train_loss": -5.582537651062012, "global_step": 32992, "epoch": 785} {"train_loss": -5.535798072814941, "global_step": 32993, "epoch": 785} {"train_loss": -5.513372421264648, "global_step": 32994, "epoch": 785} {"train_loss": -5.436425685882568, "global_step": 32995, "epoch": 785} {"train_loss": -5.621101379394531, "global_step": 32996, "epoch": 785} {"train_loss": -5.474841117858887, "global_step": 32997, "epoch": 785} {"train_loss": -5.534113883972168, "global_step": 32998, "epoch": 785} {"train_loss": -5.607609748840332, "global_step": 32999, "epoch": 785} {"train_loss": -5.3666672706604, "global_step": 33000, "epoch": 785} {"train_loss": -5.598223686218262, "global_step": 33001, "epoch": 785} {"train_loss": -5.353086471557617, "global_step": 33002, "epoch": 785} {"train_loss": -5.594277381896973, "global_step": 33003, "epoch": 785} {"train_loss": -5.40403938293457, "global_step": 33004, "epoch": 785} {"train_loss": -5.430606842041016, "global_step": 33005, "epoch": 785} {"train_loss": -5.486981391906738, "global_step": 33006, "epoch": 785} {"train_loss": -5.326593399047852, "global_step": 33007, "epoch": 785} {"train_loss": -5.48073673248291, "global_step": 33008, "epoch": 785} {"train_loss": -5.380017280578613, "global_step": 33009, "epoch": 785} {"train_loss": -5.627763748168945, "global_step": 33010, "epoch": 785} {"train_loss": -5.4756319636390325, "global_step": 33011, "epoch": 785, "val_loss": 62948.2578125} {"train_loss": -5.420195579528809, "global_step": 33012, "epoch": 786} {"train_loss": -5.350427627563477, "global_step": 33013, "epoch": 786} {"train_loss": -5.430078029632568, "global_step": 33014, "epoch": 786} {"train_loss": -5.417664527893066, "global_step": 33015, "epoch": 786} {"train_loss": -5.425146102905273, "global_step": 33016, "epoch": 786} {"train_loss": -5.555874824523926, "global_step": 33017, "epoch": 786} {"train_loss": -5.586227893829346, "global_step": 33018, "epoch": 786} {"train_loss": -5.5398406982421875, "global_step": 33019, "epoch": 786} {"train_loss": -5.5840654373168945, "global_step": 33020, "epoch": 786} {"train_loss": -5.6243062019348145, "global_step": 33021, "epoch": 786} {"train_loss": -5.500967979431152, "global_step": 33022, "epoch": 786} {"train_loss": -5.553899765014648, "global_step": 33023, "epoch": 786} {"train_loss": -5.4608869552612305, "global_step": 33024, "epoch": 786} {"train_loss": -5.614043235778809, "global_step": 33025, "epoch": 786} {"train_loss": -5.460208892822266, "global_step": 33026, "epoch": 786} {"train_loss": -5.464395523071289, "global_step": 33027, "epoch": 786} {"train_loss": -5.669873237609863, "global_step": 33028, "epoch": 786} {"train_loss": -5.527146339416504, "global_step": 33029, "epoch": 786} {"train_loss": -5.496101379394531, "global_step": 33030, "epoch": 786} {"train_loss": -5.327784538269043, "global_step": 33031, "epoch": 786} {"train_loss": -5.432696342468262, "global_step": 33032, "epoch": 786} {"train_loss": -5.437010288238525, "global_step": 33033, "epoch": 786} {"train_loss": -5.4151082038879395, "global_step": 33034, "epoch": 786} {"train_loss": -5.360157489776611, "global_step": 33035, "epoch": 786} {"train_loss": -5.297358512878418, "global_step": 33036, "epoch": 786} {"train_loss": -5.487224578857422, "global_step": 33037, "epoch": 786} {"train_loss": -5.500712871551514, "global_step": 33038, "epoch": 786} {"train_loss": -5.315195083618164, "global_step": 33039, "epoch": 786} {"train_loss": -5.502161502838135, "global_step": 33040, "epoch": 786} {"train_loss": -5.354290008544922, "global_step": 33041, "epoch": 786} {"train_loss": -5.539958953857422, "global_step": 33042, "epoch": 786} {"train_loss": -5.42903470993042, "global_step": 33043, "epoch": 786} {"train_loss": -5.610203742980957, "global_step": 33044, "epoch": 786} {"train_loss": -5.387681484222412, "global_step": 33045, "epoch": 786} {"train_loss": -5.5390424728393555, "global_step": 33046, "epoch": 786} {"train_loss": -5.420199394226074, "global_step": 33047, "epoch": 786} {"train_loss": -5.454704284667969, "global_step": 33048, "epoch": 786} {"train_loss": -5.30118989944458, "global_step": 33049, "epoch": 786} {"train_loss": -5.555501461029053, "global_step": 33050, "epoch": 786} {"train_loss": -5.399986743927002, "global_step": 33051, "epoch": 786} {"train_loss": -5.582418441772461, "global_step": 33052, "epoch": 786} {"train_loss": -5.471064204261417, "global_step": 33053, "epoch": 786, "val_loss": 62612.6640625} {"train_loss": -5.621397972106934, "global_step": 33054, "epoch": 787} {"train_loss": -5.547004699707031, "global_step": 33055, "epoch": 787} {"train_loss": -5.445094585418701, "global_step": 33056, "epoch": 787} {"train_loss": -5.517281532287598, "global_step": 33057, "epoch": 787} {"train_loss": -5.483606338500977, "global_step": 33058, "epoch": 787} {"train_loss": -5.520909309387207, "global_step": 33059, "epoch": 787} {"train_loss": -5.526764392852783, "global_step": 33060, "epoch": 787} {"train_loss": -5.6158246994018555, "global_step": 33061, "epoch": 787} {"train_loss": -5.46724271774292, "global_step": 33062, "epoch": 787} {"train_loss": -5.5657477378845215, "global_step": 33063, "epoch": 787} {"train_loss": -5.613554000854492, "global_step": 33064, "epoch": 787} {"train_loss": -5.4709272384643555, "global_step": 33065, "epoch": 787} {"train_loss": -5.629101753234863, "global_step": 33066, "epoch": 787} {"train_loss": -5.423279762268066, "global_step": 33067, "epoch": 787} {"train_loss": -5.514484405517578, "global_step": 33068, "epoch": 787} {"train_loss": -5.613251686096191, "global_step": 33069, "epoch": 787} {"train_loss": -5.39219856262207, "global_step": 33070, "epoch": 787} {"train_loss": -5.456754684448242, "global_step": 33071, "epoch": 787} {"train_loss": -5.532474517822266, "global_step": 33072, "epoch": 787} {"train_loss": -5.551994323730469, "global_step": 33073, "epoch": 787} {"train_loss": -5.495502471923828, "global_step": 33074, "epoch": 787} {"train_loss": -5.615399360656738, "global_step": 33075, "epoch": 787} {"train_loss": -5.521808624267578, "global_step": 33076, "epoch": 787} {"train_loss": -5.437828063964844, "global_step": 33077, "epoch": 787} {"train_loss": -5.454897880554199, "global_step": 33078, "epoch": 787} {"train_loss": -5.528194427490234, "global_step": 33079, "epoch": 787} {"train_loss": -5.5184125900268555, "global_step": 33080, "epoch": 787} {"train_loss": -5.46580696105957, "global_step": 33081, "epoch": 787} {"train_loss": -5.49281120300293, "global_step": 33082, "epoch": 787} {"train_loss": -5.576286315917969, "global_step": 33083, "epoch": 787} {"train_loss": -5.426009178161621, "global_step": 33084, "epoch": 787} {"train_loss": -5.584411144256592, "global_step": 33085, "epoch": 787} {"train_loss": -5.531711578369141, "global_step": 33086, "epoch": 787} {"train_loss": -5.549269676208496, "global_step": 33087, "epoch": 787} {"train_loss": -5.460142135620117, "global_step": 33088, "epoch": 787} {"train_loss": -5.496529579162598, "global_step": 33089, "epoch": 787} {"train_loss": -5.395472526550293, "global_step": 33090, "epoch": 787} {"train_loss": -5.549100875854492, "global_step": 33091, "epoch": 787} {"train_loss": -5.549074172973633, "global_step": 33092, "epoch": 787} {"train_loss": -5.468694686889648, "global_step": 33093, "epoch": 787} {"train_loss": -5.575296401977539, "global_step": 33094, "epoch": 787} {"train_loss": -5.515532334645589, "global_step": 33095, "epoch": 787, "val_loss": 62553.1796875} {"train_loss": -5.533710479736328, "global_step": 33096, "epoch": 788} {"train_loss": -5.514496803283691, "global_step": 33097, "epoch": 788} {"train_loss": -5.5471601486206055, "global_step": 33098, "epoch": 788} {"train_loss": -5.5837225914001465, "global_step": 33099, "epoch": 788} {"train_loss": -5.521069526672363, "global_step": 33100, "epoch": 788} {"train_loss": -5.489490985870361, "global_step": 33101, "epoch": 788} {"train_loss": -5.469453811645508, "global_step": 33102, "epoch": 788} {"train_loss": -5.559970378875732, "global_step": 33103, "epoch": 788} {"train_loss": -5.482340335845947, "global_step": 33104, "epoch": 788} {"train_loss": -5.369220733642578, "global_step": 33105, "epoch": 788} {"train_loss": -5.6080169677734375, "global_step": 33106, "epoch": 788} {"train_loss": -5.4426069259643555, "global_step": 33107, "epoch": 788} {"train_loss": -5.579600811004639, "global_step": 33108, "epoch": 788} {"train_loss": -5.479977607727051, "global_step": 33109, "epoch": 788} {"train_loss": -5.542364120483398, "global_step": 33110, "epoch": 788} {"train_loss": -5.6027727127075195, "global_step": 33111, "epoch": 788} {"train_loss": -5.603814125061035, "global_step": 33112, "epoch": 788} {"train_loss": -5.483869552612305, "global_step": 33113, "epoch": 788} {"train_loss": -5.492901802062988, "global_step": 33114, "epoch": 788} {"train_loss": -5.609250068664551, "global_step": 33115, "epoch": 788} {"train_loss": -5.499792098999023, "global_step": 33116, "epoch": 788} {"train_loss": -5.541934013366699, "global_step": 33117, "epoch": 788} {"train_loss": -5.49448299407959, "global_step": 33118, "epoch": 788} {"train_loss": -5.445110321044922, "global_step": 33119, "epoch": 788} {"train_loss": -5.596217632293701, "global_step": 33120, "epoch": 788} {"train_loss": -5.580903053283691, "global_step": 33121, "epoch": 788} {"train_loss": -5.673842430114746, "global_step": 33122, "epoch": 788} {"train_loss": -5.561328887939453, "global_step": 33123, "epoch": 788} {"train_loss": -5.492212295532227, "global_step": 33124, "epoch": 788} {"train_loss": -5.540048599243164, "global_step": 33125, "epoch": 788} {"train_loss": -5.561521053314209, "global_step": 33126, "epoch": 788} {"train_loss": -5.532102584838867, "global_step": 33127, "epoch": 788} {"train_loss": -5.578683853149414, "global_step": 33128, "epoch": 788} {"train_loss": -5.5322065353393555, "global_step": 33129, "epoch": 788} {"train_loss": -5.458869934082031, "global_step": 33130, "epoch": 788} {"train_loss": -5.638463020324707, "global_step": 33131, "epoch": 788} {"train_loss": -5.454374313354492, "global_step": 33132, "epoch": 788} {"train_loss": -5.583571434020996, "global_step": 33133, "epoch": 788} {"train_loss": -5.634922027587891, "global_step": 33134, "epoch": 788} {"train_loss": -5.49971866607666, "global_step": 33135, "epoch": 788} {"train_loss": -5.502517223358154, "global_step": 33136, "epoch": 788} {"train_loss": -5.5336122285752065, "global_step": 33137, "epoch": 788, "val_loss": 62664.734375} {"train_loss": -5.640152931213379, "global_step": 33138, "epoch": 789} {"train_loss": -5.566306114196777, "global_step": 33139, "epoch": 789} {"train_loss": -5.492159843444824, "global_step": 33140, "epoch": 789} {"train_loss": -5.365617752075195, "global_step": 33141, "epoch": 789} {"train_loss": -5.525470733642578, "global_step": 33142, "epoch": 789} {"train_loss": -5.574074745178223, "global_step": 33143, "epoch": 789} {"train_loss": -5.544641017913818, "global_step": 33144, "epoch": 789} {"train_loss": -5.529464244842529, "global_step": 33145, "epoch": 789} {"train_loss": -5.606061935424805, "global_step": 33146, "epoch": 789} {"train_loss": -5.517974853515625, "global_step": 33147, "epoch": 789} {"train_loss": -5.386263847351074, "global_step": 33148, "epoch": 789} {"train_loss": -5.542457580566406, "global_step": 33149, "epoch": 789} {"train_loss": -5.551727294921875, "global_step": 33150, "epoch": 789} {"train_loss": -5.547563076019287, "global_step": 33151, "epoch": 789} {"train_loss": -5.557627201080322, "global_step": 33152, "epoch": 789} {"train_loss": -5.5848283767700195, "global_step": 33153, "epoch": 789} {"train_loss": -5.5679097175598145, "global_step": 33154, "epoch": 789} {"train_loss": -5.601557731628418, "global_step": 33155, "epoch": 789} {"train_loss": -5.587061882019043, "global_step": 33156, "epoch": 789} {"train_loss": -5.469610691070557, "global_step": 33157, "epoch": 789} {"train_loss": -5.532525062561035, "global_step": 33158, "epoch": 789} {"train_loss": -5.463530540466309, "global_step": 33159, "epoch": 789} {"train_loss": -5.497846603393555, "global_step": 33160, "epoch": 789} {"train_loss": -5.485330581665039, "global_step": 33161, "epoch": 789} {"train_loss": -5.488350868225098, "global_step": 33162, "epoch": 789} {"train_loss": -5.599206924438477, "global_step": 33163, "epoch": 789} {"train_loss": -5.51018762588501, "global_step": 33164, "epoch": 789} {"train_loss": -5.502405643463135, "global_step": 33165, "epoch": 789} {"train_loss": -5.403587818145752, "global_step": 33166, "epoch": 789} {"train_loss": -5.426064968109131, "global_step": 33167, "epoch": 789} {"train_loss": -5.535844326019287, "global_step": 33168, "epoch": 789} {"train_loss": -5.489698886871338, "global_step": 33169, "epoch": 789} {"train_loss": -5.422894477844238, "global_step": 33170, "epoch": 789} {"train_loss": -5.553474426269531, "global_step": 33171, "epoch": 789} {"train_loss": -5.342092037200928, "global_step": 33172, "epoch": 789} {"train_loss": -5.538083553314209, "global_step": 33173, "epoch": 789} {"train_loss": -5.371636867523193, "global_step": 33174, "epoch": 789} {"train_loss": -5.413361549377441, "global_step": 33175, "epoch": 789} {"train_loss": -5.515315055847168, "global_step": 33176, "epoch": 789} {"train_loss": -5.391626358032227, "global_step": 33177, "epoch": 789} {"train_loss": -5.423664093017578, "global_step": 33178, "epoch": 789} {"train_loss": -5.500453483490717, "global_step": 33179, "epoch": 789, "val_loss": 62917.7265625} {"train_loss": -5.532196044921875, "global_step": 33180, "epoch": 790} {"train_loss": -5.4794511795043945, "global_step": 33181, "epoch": 790} {"train_loss": -5.498003005981445, "global_step": 33182, "epoch": 790} {"train_loss": -5.496820449829102, "global_step": 33183, "epoch": 790} {"train_loss": -5.425706386566162, "global_step": 33184, "epoch": 790} {"train_loss": -5.575402736663818, "global_step": 33185, "epoch": 790} {"train_loss": -5.514711380004883, "global_step": 33186, "epoch": 790} {"train_loss": -5.474366664886475, "global_step": 33187, "epoch": 790} {"train_loss": -5.579261779785156, "global_step": 33188, "epoch": 790} {"train_loss": -5.4458112716674805, "global_step": 33189, "epoch": 790} {"train_loss": -5.497523307800293, "global_step": 33190, "epoch": 790} {"train_loss": -5.662139892578125, "global_step": 33191, "epoch": 790} {"train_loss": -5.442263603210449, "global_step": 33192, "epoch": 790} {"train_loss": -5.624908447265625, "global_step": 33193, "epoch": 790} {"train_loss": -5.558500289916992, "global_step": 33194, "epoch": 790} {"train_loss": -5.520611763000488, "global_step": 33195, "epoch": 790} {"train_loss": -5.598174571990967, "global_step": 33196, "epoch": 790} {"train_loss": -5.531039237976074, "global_step": 33197, "epoch": 790} {"train_loss": -5.434393882751465, "global_step": 33198, "epoch": 790} {"train_loss": -5.5739617347717285, "global_step": 33199, "epoch": 790} {"train_loss": -5.525236129760742, "global_step": 33200, "epoch": 790} {"train_loss": -5.471074104309082, "global_step": 33201, "epoch": 790} {"train_loss": -5.488104820251465, "global_step": 33202, "epoch": 790} {"train_loss": -5.530963897705078, "global_step": 33203, "epoch": 790} {"train_loss": -5.527261734008789, "global_step": 33204, "epoch": 790} {"train_loss": -5.528872013092041, "global_step": 33205, "epoch": 790} {"train_loss": -5.637468338012695, "global_step": 33206, "epoch": 790} {"train_loss": -5.556028366088867, "global_step": 33207, "epoch": 790} {"train_loss": -5.6178178787231445, "global_step": 33208, "epoch": 790} {"train_loss": -5.517552375793457, "global_step": 33209, "epoch": 790} {"train_loss": -5.646251678466797, "global_step": 33210, "epoch": 790} {"train_loss": -5.471922874450684, "global_step": 33211, "epoch": 790} {"train_loss": -5.533071041107178, "global_step": 33212, "epoch": 790} {"train_loss": -5.616198539733887, "global_step": 33213, "epoch": 790} {"train_loss": -5.521718978881836, "global_step": 33214, "epoch": 790} {"train_loss": -5.492880821228027, "global_step": 33215, "epoch": 790} {"train_loss": -5.390484809875488, "global_step": 33216, "epoch": 790} {"train_loss": -5.467690944671631, "global_step": 33217, "epoch": 790} {"train_loss": -5.435061931610107, "global_step": 33218, "epoch": 790} {"train_loss": -5.491868019104004, "global_step": 33219, "epoch": 790} {"train_loss": -5.626653671264648, "global_step": 33220, "epoch": 790} {"train_loss": -5.525355793180919, "global_step": 33221, "epoch": 790, "val_loss": 63110.00390625} {"train_loss": -5.530943870544434, "global_step": 33222, "epoch": 791} {"train_loss": -5.580909252166748, "global_step": 33223, "epoch": 791} {"train_loss": -5.432340621948242, "global_step": 33224, "epoch": 791} {"train_loss": -5.573756217956543, "global_step": 33225, "epoch": 791} {"train_loss": -5.55222225189209, "global_step": 33226, "epoch": 791} {"train_loss": -5.48292350769043, "global_step": 33227, "epoch": 791} {"train_loss": -5.591680526733398, "global_step": 33228, "epoch": 791} {"train_loss": -5.521940231323242, "global_step": 33229, "epoch": 791} {"train_loss": -5.456621170043945, "global_step": 33230, "epoch": 791} {"train_loss": -5.622100830078125, "global_step": 33231, "epoch": 791} {"train_loss": -5.460829734802246, "global_step": 33232, "epoch": 791} {"train_loss": -5.501079559326172, "global_step": 33233, "epoch": 791} {"train_loss": -5.554439544677734, "global_step": 33234, "epoch": 791} {"train_loss": -5.666671276092529, "global_step": 33235, "epoch": 791} {"train_loss": -5.560657501220703, "global_step": 33236, "epoch": 791} {"train_loss": -5.672767639160156, "global_step": 33237, "epoch": 791} {"train_loss": -5.484467506408691, "global_step": 33238, "epoch": 791} {"train_loss": -5.583588600158691, "global_step": 33239, "epoch": 791} {"train_loss": -5.468932151794434, "global_step": 33240, "epoch": 791} {"train_loss": -5.4559550285339355, "global_step": 33241, "epoch": 791} {"train_loss": -5.405942916870117, "global_step": 33242, "epoch": 791} {"train_loss": -5.497236251831055, "global_step": 33243, "epoch": 791} {"train_loss": -5.493139266967773, "global_step": 33244, "epoch": 791} {"train_loss": -5.522601127624512, "global_step": 33245, "epoch": 791} {"train_loss": -5.49659538269043, "global_step": 33246, "epoch": 791} {"train_loss": -5.546570777893066, "global_step": 33247, "epoch": 791} {"train_loss": -5.503560543060303, "global_step": 33248, "epoch": 791} {"train_loss": -5.6212005615234375, "global_step": 33249, "epoch": 791} {"train_loss": -5.461673736572266, "global_step": 33250, "epoch": 791} {"train_loss": -5.512558937072754, "global_step": 33251, "epoch": 791} {"train_loss": -5.570541858673096, "global_step": 33252, "epoch": 791} {"train_loss": -5.442843437194824, "global_step": 33253, "epoch": 791} {"train_loss": -5.414885520935059, "global_step": 33254, "epoch": 791} {"train_loss": -5.471726417541504, "global_step": 33255, "epoch": 791} {"train_loss": -5.513172149658203, "global_step": 33256, "epoch": 791} {"train_loss": -5.598584175109863, "global_step": 33257, "epoch": 791} {"train_loss": -5.662609100341797, "global_step": 33258, "epoch": 791} {"train_loss": -5.569056034088135, "global_step": 33259, "epoch": 791} {"train_loss": -5.575407028198242, "global_step": 33260, "epoch": 791} {"train_loss": -5.611077308654785, "global_step": 33261, "epoch": 791} {"train_loss": -5.666040420532227, "global_step": 33262, "epoch": 791} {"train_loss": -5.529915809631348, "global_step": 33263, "epoch": 791, "val_loss": 62813.27734375} {"train_loss": -5.565732955932617, "global_step": 33264, "epoch": 792} {"train_loss": -5.511917591094971, "global_step": 33265, "epoch": 792} {"train_loss": -5.4114580154418945, "global_step": 33266, "epoch": 792} {"train_loss": -5.531430244445801, "global_step": 33267, "epoch": 792} {"train_loss": -5.520811557769775, "global_step": 33268, "epoch": 792} {"train_loss": -5.503264427185059, "global_step": 33269, "epoch": 792} {"train_loss": -5.498107433319092, "global_step": 33270, "epoch": 792} {"train_loss": -5.437869071960449, "global_step": 33271, "epoch": 792} {"train_loss": -5.483829975128174, "global_step": 33272, "epoch": 792} {"train_loss": -5.5985894203186035, "global_step": 33273, "epoch": 792} {"train_loss": -5.465530872344971, "global_step": 33274, "epoch": 792} {"train_loss": -5.626977443695068, "global_step": 33275, "epoch": 792} {"train_loss": -5.602614402770996, "global_step": 33276, "epoch": 792} {"train_loss": -5.424882888793945, "global_step": 33277, "epoch": 792} {"train_loss": -5.64496374130249, "global_step": 33278, "epoch": 792} {"train_loss": -5.493807792663574, "global_step": 33279, "epoch": 792} {"train_loss": -5.582834243774414, "global_step": 33280, "epoch": 792} {"train_loss": -5.559612274169922, "global_step": 33281, "epoch": 792} {"train_loss": -5.5648345947265625, "global_step": 33282, "epoch": 792} {"train_loss": -5.616050720214844, "global_step": 33283, "epoch": 792} {"train_loss": -5.655591011047363, "global_step": 33284, "epoch": 792} {"train_loss": -5.404794216156006, "global_step": 33285, "epoch": 792} {"train_loss": -5.5090837478637695, "global_step": 33286, "epoch": 792} {"train_loss": -5.660240173339844, "global_step": 33287, "epoch": 792} {"train_loss": -5.6639604568481445, "global_step": 33288, "epoch": 792} {"train_loss": -5.548275470733643, "global_step": 33289, "epoch": 792} {"train_loss": -5.535466194152832, "global_step": 33290, "epoch": 792} {"train_loss": -5.3997392654418945, "global_step": 33291, "epoch": 792} {"train_loss": -5.672884941101074, "global_step": 33292, "epoch": 792} {"train_loss": -5.382595062255859, "global_step": 33293, "epoch": 792} {"train_loss": -5.4996657371521, "global_step": 33294, "epoch": 792} {"train_loss": -5.533385753631592, "global_step": 33295, "epoch": 792} {"train_loss": -5.5303850173950195, "global_step": 33296, "epoch": 792} {"train_loss": -5.403360843658447, "global_step": 33297, "epoch": 792} {"train_loss": -5.648687362670898, "global_step": 33298, "epoch": 792} {"train_loss": -5.396823883056641, "global_step": 33299, "epoch": 792} {"train_loss": -5.594881534576416, "global_step": 33300, "epoch": 792} {"train_loss": -5.484631061553955, "global_step": 33301, "epoch": 792} {"train_loss": -5.392406463623047, "global_step": 33302, "epoch": 792} {"train_loss": -5.532235145568848, "global_step": 33303, "epoch": 792} {"train_loss": -5.456148147583008, "global_step": 33304, "epoch": 792} {"train_loss": -5.528033937726702, "global_step": 33305, "epoch": 792, "val_loss": 62412.16796875} {"train_loss": -5.529187202453613, "global_step": 33306, "epoch": 793} {"train_loss": -5.642021179199219, "global_step": 33307, "epoch": 793} {"train_loss": -5.5221099853515625, "global_step": 33308, "epoch": 793} {"train_loss": -5.407393455505371, "global_step": 33309, "epoch": 793} {"train_loss": -5.400953769683838, "global_step": 33310, "epoch": 793} {"train_loss": -5.631157875061035, "global_step": 33311, "epoch": 793} {"train_loss": -5.453433036804199, "global_step": 33312, "epoch": 793} {"train_loss": -5.49527645111084, "global_step": 33313, "epoch": 793} {"train_loss": -5.655818462371826, "global_step": 33314, "epoch": 793} {"train_loss": -5.557708263397217, "global_step": 33315, "epoch": 793} {"train_loss": -5.479154586791992, "global_step": 33316, "epoch": 793} {"train_loss": -5.574516296386719, "global_step": 33317, "epoch": 793} {"train_loss": -5.544925689697266, "global_step": 33318, "epoch": 793} {"train_loss": -5.636900901794434, "global_step": 33319, "epoch": 793} {"train_loss": -5.459860324859619, "global_step": 33320, "epoch": 793} {"train_loss": -5.623624801635742, "global_step": 33321, "epoch": 793} {"train_loss": -5.567106246948242, "global_step": 33322, "epoch": 793} {"train_loss": -5.587851524353027, "global_step": 33323, "epoch": 793} {"train_loss": -5.56123161315918, "global_step": 33324, "epoch": 793} {"train_loss": -5.363719463348389, "global_step": 33325, "epoch": 793} {"train_loss": -5.487029075622559, "global_step": 33326, "epoch": 793} {"train_loss": -5.520569801330566, "global_step": 33327, "epoch": 793} {"train_loss": -5.544066905975342, "global_step": 33328, "epoch": 793} {"train_loss": -5.555485725402832, "global_step": 33329, "epoch": 793} {"train_loss": -5.481295585632324, "global_step": 33330, "epoch": 793} {"train_loss": -5.357885837554932, "global_step": 33331, "epoch": 793} {"train_loss": -5.683509349822998, "global_step": 33332, "epoch": 793} {"train_loss": -5.501890182495117, "global_step": 33333, "epoch": 793} {"train_loss": -5.649500846862793, "global_step": 33334, "epoch": 793} {"train_loss": -5.573009490966797, "global_step": 33335, "epoch": 793} {"train_loss": -5.6021318435668945, "global_step": 33336, "epoch": 793} {"train_loss": -5.613621711730957, "global_step": 33337, "epoch": 793} {"train_loss": -5.570451736450195, "global_step": 33338, "epoch": 793} {"train_loss": -5.508266925811768, "global_step": 33339, "epoch": 793} {"train_loss": -5.629176139831543, "global_step": 33340, "epoch": 793} {"train_loss": -5.507469654083252, "global_step": 33341, "epoch": 793} {"train_loss": -5.589242935180664, "global_step": 33342, "epoch": 793} {"train_loss": -5.491148471832275, "global_step": 33343, "epoch": 793} {"train_loss": -5.513857841491699, "global_step": 33344, "epoch": 793} {"train_loss": -5.4943695068359375, "global_step": 33345, "epoch": 793} {"train_loss": -5.442153453826904, "global_step": 33346, "epoch": 793} {"train_loss": -5.539435761315482, "global_step": 33347, "epoch": 793, "val_loss": 62611.41015625} {"train_loss": -5.543271541595459, "global_step": 33348, "epoch": 794} {"train_loss": -5.385625839233398, "global_step": 33349, "epoch": 794} {"train_loss": -5.444736003875732, "global_step": 33350, "epoch": 794} {"train_loss": -5.534767150878906, "global_step": 33351, "epoch": 794} {"train_loss": -5.4132819175720215, "global_step": 33352, "epoch": 794} {"train_loss": -5.555364608764648, "global_step": 33353, "epoch": 794} {"train_loss": -5.369227886199951, "global_step": 33354, "epoch": 794} {"train_loss": -5.483678340911865, "global_step": 33355, "epoch": 794} {"train_loss": -5.545331001281738, "global_step": 33356, "epoch": 794} {"train_loss": -5.444491863250732, "global_step": 33357, "epoch": 794} {"train_loss": -5.643390655517578, "global_step": 33358, "epoch": 794} {"train_loss": -5.5346784591674805, "global_step": 33359, "epoch": 794} {"train_loss": -5.569622993469238, "global_step": 33360, "epoch": 794} {"train_loss": -5.485196113586426, "global_step": 33361, "epoch": 794} {"train_loss": -5.50368595123291, "global_step": 33362, "epoch": 794} {"train_loss": -5.454461574554443, "global_step": 33363, "epoch": 794} {"train_loss": -5.4116339683532715, "global_step": 33364, "epoch": 794} {"train_loss": -5.463050365447998, "global_step": 33365, "epoch": 794} {"train_loss": -5.491430282592773, "global_step": 33366, "epoch": 794} {"train_loss": -5.418483734130859, "global_step": 33367, "epoch": 794} {"train_loss": -5.602404594421387, "global_step": 33368, "epoch": 794} {"train_loss": -5.4760332107543945, "global_step": 33369, "epoch": 794} {"train_loss": -5.517151355743408, "global_step": 33370, "epoch": 794} {"train_loss": -5.466497421264648, "global_step": 33371, "epoch": 794} {"train_loss": -5.571080207824707, "global_step": 33372, "epoch": 794} {"train_loss": -5.563786506652832, "global_step": 33373, "epoch": 794} {"train_loss": -5.553349494934082, "global_step": 33374, "epoch": 794} {"train_loss": -5.460453033447266, "global_step": 33375, "epoch": 794} {"train_loss": -5.473060607910156, "global_step": 33376, "epoch": 794} {"train_loss": -5.44549560546875, "global_step": 33377, "epoch": 794} {"train_loss": -5.506803512573242, "global_step": 33378, "epoch": 794} {"train_loss": -5.589756011962891, "global_step": 33379, "epoch": 794} {"train_loss": -5.613203048706055, "global_step": 33380, "epoch": 794} {"train_loss": -5.513775825500488, "global_step": 33381, "epoch": 794} {"train_loss": -5.681882858276367, "global_step": 33382, "epoch": 794} {"train_loss": -5.627388000488281, "global_step": 33383, "epoch": 794} {"train_loss": -5.547365188598633, "global_step": 33384, "epoch": 794} {"train_loss": -5.544282913208008, "global_step": 33385, "epoch": 794} {"train_loss": -5.622932434082031, "global_step": 33386, "epoch": 794} {"train_loss": -5.588274955749512, "global_step": 33387, "epoch": 794} {"train_loss": -5.581552028656006, "global_step": 33388, "epoch": 794} {"train_loss": -5.520856119337536, "global_step": 33389, "epoch": 794, "val_loss": 62627.359375} {"train_loss": -5.3842453956604, "global_step": 33390, "epoch": 795} {"train_loss": -5.691736221313477, "global_step": 33391, "epoch": 795} {"train_loss": -5.526884078979492, "global_step": 33392, "epoch": 795} {"train_loss": -5.543037414550781, "global_step": 33393, "epoch": 795} {"train_loss": -5.626230716705322, "global_step": 33394, "epoch": 795} {"train_loss": -5.605951309204102, "global_step": 33395, "epoch": 795} {"train_loss": -5.571372985839844, "global_step": 33396, "epoch": 795} {"train_loss": -5.537013053894043, "global_step": 33397, "epoch": 795} {"train_loss": -5.64127254486084, "global_step": 33398, "epoch": 795} {"train_loss": -5.5615010261535645, "global_step": 33399, "epoch": 795} {"train_loss": -5.42451286315918, "global_step": 33400, "epoch": 795} {"train_loss": -5.721019268035889, "global_step": 33401, "epoch": 795} {"train_loss": -5.658885955810547, "global_step": 33402, "epoch": 795} {"train_loss": -5.559023380279541, "global_step": 33403, "epoch": 795} {"train_loss": -5.61223030090332, "global_step": 33404, "epoch": 795} {"train_loss": -5.472519874572754, "global_step": 33405, "epoch": 795} {"train_loss": -5.433207988739014, "global_step": 33406, "epoch": 795} {"train_loss": -5.561524391174316, "global_step": 33407, "epoch": 795} {"train_loss": -5.583015441894531, "global_step": 33408, "epoch": 795} {"train_loss": -5.420068264007568, "global_step": 33409, "epoch": 795} {"train_loss": -5.568987846374512, "global_step": 33410, "epoch": 795} {"train_loss": -5.539244651794434, "global_step": 33411, "epoch": 795} {"train_loss": -5.530977249145508, "global_step": 33412, "epoch": 795} {"train_loss": -5.523451805114746, "global_step": 33413, "epoch": 795} {"train_loss": -5.62402868270874, "global_step": 33414, "epoch": 795} {"train_loss": -5.439191818237305, "global_step": 33415, "epoch": 795} {"train_loss": -5.469364166259766, "global_step": 33416, "epoch": 795} {"train_loss": -5.564831733703613, "global_step": 33417, "epoch": 795} {"train_loss": -5.413703918457031, "global_step": 33418, "epoch": 795} {"train_loss": -5.49594783782959, "global_step": 33419, "epoch": 795} {"train_loss": -5.506953239440918, "global_step": 33420, "epoch": 795} {"train_loss": -5.443357467651367, "global_step": 33421, "epoch": 795} {"train_loss": -5.5747222900390625, "global_step": 33422, "epoch": 795} {"train_loss": -5.551912307739258, "global_step": 33423, "epoch": 795} {"train_loss": -5.568478584289551, "global_step": 33424, "epoch": 795} {"train_loss": -5.522930145263672, "global_step": 33425, "epoch": 795} {"train_loss": -5.568769454956055, "global_step": 33426, "epoch": 795} {"train_loss": -5.646628379821777, "global_step": 33427, "epoch": 795} {"train_loss": -5.48441743850708, "global_step": 33428, "epoch": 795} {"train_loss": -5.299459457397461, "global_step": 33429, "epoch": 795} {"train_loss": -5.4600934982299805, "global_step": 33430, "epoch": 795} {"train_loss": -5.5316585926782516, "global_step": 33431, "epoch": 795, "val_loss": 62943.36328125} {"train_loss": -5.524271488189697, "global_step": 33432, "epoch": 796} {"train_loss": -5.597644329071045, "global_step": 33433, "epoch": 796} {"train_loss": -5.516927242279053, "global_step": 33434, "epoch": 796} {"train_loss": -5.517511367797852, "global_step": 33435, "epoch": 796} {"train_loss": -5.628434181213379, "global_step": 33436, "epoch": 796} {"train_loss": -5.489433288574219, "global_step": 33437, "epoch": 796} {"train_loss": -5.640891075134277, "global_step": 33438, "epoch": 796} {"train_loss": -5.5958452224731445, "global_step": 33439, "epoch": 796} {"train_loss": -5.4523515701293945, "global_step": 33440, "epoch": 796} {"train_loss": -5.429934501647949, "global_step": 33441, "epoch": 796} {"train_loss": -5.47309684753418, "global_step": 33442, "epoch": 796} {"train_loss": -5.452062129974365, "global_step": 33443, "epoch": 796} {"train_loss": -5.441619396209717, "global_step": 33444, "epoch": 796} {"train_loss": -5.511290550231934, "global_step": 33445, "epoch": 796} {"train_loss": -5.377658367156982, "global_step": 33446, "epoch": 796} {"train_loss": -5.478529930114746, "global_step": 33447, "epoch": 796} {"train_loss": -5.440182209014893, "global_step": 33448, "epoch": 796} {"train_loss": -5.569727420806885, "global_step": 33449, "epoch": 796} {"train_loss": -5.526782989501953, "global_step": 33450, "epoch": 796} {"train_loss": -5.604748725891113, "global_step": 33451, "epoch": 796} {"train_loss": -5.519728660583496, "global_step": 33452, "epoch": 796} {"train_loss": -5.4195146560668945, "global_step": 33453, "epoch": 796} {"train_loss": -5.470273971557617, "global_step": 33454, "epoch": 796} {"train_loss": -5.504192352294922, "global_step": 33455, "epoch": 796} {"train_loss": -5.644969940185547, "global_step": 33456, "epoch": 796} {"train_loss": -5.584314346313477, "global_step": 33457, "epoch": 796} {"train_loss": -5.498450756072998, "global_step": 33458, "epoch": 796} {"train_loss": -5.4952168464660645, "global_step": 33459, "epoch": 796} {"train_loss": -5.488142967224121, "global_step": 33460, "epoch": 796} {"train_loss": -5.568338394165039, "global_step": 33461, "epoch": 796} {"train_loss": -5.544580459594727, "global_step": 33462, "epoch": 796} {"train_loss": -5.56866455078125, "global_step": 33463, "epoch": 796} {"train_loss": -5.482577323913574, "global_step": 33464, "epoch": 796} {"train_loss": -5.620984077453613, "global_step": 33465, "epoch": 796} {"train_loss": -5.636759281158447, "global_step": 33466, "epoch": 796} {"train_loss": -5.5077972412109375, "global_step": 33467, "epoch": 796} {"train_loss": -5.580801963806152, "global_step": 33468, "epoch": 796} {"train_loss": -5.572053909301758, "global_step": 33469, "epoch": 796} {"train_loss": -5.4624834060668945, "global_step": 33470, "epoch": 796} {"train_loss": -5.582408905029297, "global_step": 33471, "epoch": 796} {"train_loss": -5.565291404724121, "global_step": 33472, "epoch": 796} {"train_loss": -5.5277626514434814, "global_step": 33473, "epoch": 796, "val_loss": 62526.3125} {"train_loss": -5.536253929138184, "global_step": 33474, "epoch": 797} {"train_loss": -5.537288665771484, "global_step": 33475, "epoch": 797} {"train_loss": -5.438602447509766, "global_step": 33476, "epoch": 797} {"train_loss": -5.6238532066345215, "global_step": 33477, "epoch": 797} {"train_loss": -5.524535179138184, "global_step": 33478, "epoch": 797} {"train_loss": -5.4753570556640625, "global_step": 33479, "epoch": 797} {"train_loss": -5.4981689453125, "global_step": 33480, "epoch": 797} {"train_loss": -5.489354133605957, "global_step": 33481, "epoch": 797} {"train_loss": -5.669227600097656, "global_step": 33482, "epoch": 797} {"train_loss": -5.432727813720703, "global_step": 33483, "epoch": 797} {"train_loss": -5.492048263549805, "global_step": 33484, "epoch": 797} {"train_loss": -5.485335350036621, "global_step": 33485, "epoch": 797} {"train_loss": -5.600961685180664, "global_step": 33486, "epoch": 797} {"train_loss": -5.4736785888671875, "global_step": 33487, "epoch": 797} {"train_loss": -5.7278923988342285, "global_step": 33488, "epoch": 797} {"train_loss": -5.614599704742432, "global_step": 33489, "epoch": 797} {"train_loss": -5.536828994750977, "global_step": 33490, "epoch": 797} {"train_loss": -5.511228561401367, "global_step": 33491, "epoch": 797} {"train_loss": -5.630352973937988, "global_step": 33492, "epoch": 797} {"train_loss": -5.4088134765625, "global_step": 33493, "epoch": 797} {"train_loss": -5.573216438293457, "global_step": 33494, "epoch": 797} {"train_loss": -5.682875633239746, "global_step": 33495, "epoch": 797} {"train_loss": -5.472966194152832, "global_step": 33496, "epoch": 797} {"train_loss": -5.567877292633057, "global_step": 33497, "epoch": 797} {"train_loss": -5.456244945526123, "global_step": 33498, "epoch": 797} {"train_loss": -5.64713191986084, "global_step": 33499, "epoch": 797} {"train_loss": -5.523192882537842, "global_step": 33500, "epoch": 797} {"train_loss": -5.479788780212402, "global_step": 33501, "epoch": 797} {"train_loss": -5.573379993438721, "global_step": 33502, "epoch": 797} {"train_loss": -5.480062484741211, "global_step": 33503, "epoch": 797} {"train_loss": -5.38564395904541, "global_step": 33504, "epoch": 797} {"train_loss": -5.509681224822998, "global_step": 33505, "epoch": 797} {"train_loss": -5.5433125495910645, "global_step": 33506, "epoch": 797} {"train_loss": -5.415092945098877, "global_step": 33507, "epoch": 797} {"train_loss": -5.44774055480957, "global_step": 33508, "epoch": 797} {"train_loss": -5.518250465393066, "global_step": 33509, "epoch": 797} {"train_loss": -5.627712726593018, "global_step": 33510, "epoch": 797} {"train_loss": -5.514899253845215, "global_step": 33511, "epoch": 797} {"train_loss": -5.520598888397217, "global_step": 33512, "epoch": 797} {"train_loss": -5.713402271270752, "global_step": 33513, "epoch": 797} {"train_loss": -5.549727439880371, "global_step": 33514, "epoch": 797} {"train_loss": -5.534878322056362, "global_step": 33515, "epoch": 797, "val_loss": 62456.36328125} {"train_loss": -5.679258823394775, "global_step": 33516, "epoch": 798} {"train_loss": -5.531000137329102, "global_step": 33517, "epoch": 798} {"train_loss": -5.511375427246094, "global_step": 33518, "epoch": 798} {"train_loss": -5.546871185302734, "global_step": 33519, "epoch": 798} {"train_loss": -5.4871110916137695, "global_step": 33520, "epoch": 798} {"train_loss": -5.533949851989746, "global_step": 33521, "epoch": 798} {"train_loss": -5.560531139373779, "global_step": 33522, "epoch": 798} {"train_loss": -5.392831325531006, "global_step": 33523, "epoch": 798} {"train_loss": -5.594595909118652, "global_step": 33524, "epoch": 798} {"train_loss": -5.584552764892578, "global_step": 33525, "epoch": 798} {"train_loss": -5.519248962402344, "global_step": 33526, "epoch": 798} {"train_loss": -5.552490234375, "global_step": 33527, "epoch": 798} {"train_loss": -5.629577159881592, "global_step": 33528, "epoch": 798} {"train_loss": -5.618809700012207, "global_step": 33529, "epoch": 798} {"train_loss": -5.561336040496826, "global_step": 33530, "epoch": 798} {"train_loss": -5.548379898071289, "global_step": 33531, "epoch": 798} {"train_loss": -5.578671932220459, "global_step": 33532, "epoch": 798} {"train_loss": -5.6192731857299805, "global_step": 33533, "epoch": 798} {"train_loss": -5.4352641105651855, "global_step": 33534, "epoch": 798} {"train_loss": -5.652557373046875, "global_step": 33535, "epoch": 798} {"train_loss": -5.346190452575684, "global_step": 33536, "epoch": 798} {"train_loss": -5.527035713195801, "global_step": 33537, "epoch": 798} {"train_loss": -5.6722025871276855, "global_step": 33538, "epoch": 798} {"train_loss": -5.450564384460449, "global_step": 33539, "epoch": 798} {"train_loss": -5.502540588378906, "global_step": 33540, "epoch": 798} {"train_loss": -5.571714401245117, "global_step": 33541, "epoch": 798} {"train_loss": -5.52774715423584, "global_step": 33542, "epoch": 798} {"train_loss": -5.627399444580078, "global_step": 33543, "epoch": 798} {"train_loss": -5.519247055053711, "global_step": 33544, "epoch": 798} {"train_loss": -5.580506801605225, "global_step": 33545, "epoch": 798} {"train_loss": -5.552060604095459, "global_step": 33546, "epoch": 798} {"train_loss": -5.5613555908203125, "global_step": 33547, "epoch": 798} {"train_loss": -5.436976432800293, "global_step": 33548, "epoch": 798} {"train_loss": -5.545109272003174, "global_step": 33549, "epoch": 798} {"train_loss": -5.533792972564697, "global_step": 33550, "epoch": 798} {"train_loss": -5.680930137634277, "global_step": 33551, "epoch": 798} {"train_loss": -5.5414276123046875, "global_step": 33552, "epoch": 798} {"train_loss": -5.66701602935791, "global_step": 33553, "epoch": 798} {"train_loss": -5.598412036895752, "global_step": 33554, "epoch": 798} {"train_loss": -5.503637313842773, "global_step": 33555, "epoch": 798} {"train_loss": -5.58768367767334, "global_step": 33556, "epoch": 798} {"train_loss": -5.554527328127906, "global_step": 33557, "epoch": 798, "val_loss": 62727.25} {"train_loss": -5.474018096923828, "global_step": 33558, "epoch": 799} {"train_loss": -5.488804817199707, "global_step": 33559, "epoch": 799} {"train_loss": -5.630315780639648, "global_step": 33560, "epoch": 799} {"train_loss": -5.527435302734375, "global_step": 33561, "epoch": 799} {"train_loss": -5.513197898864746, "global_step": 33562, "epoch": 799} {"train_loss": -5.627478122711182, "global_step": 33563, "epoch": 799} {"train_loss": -5.548602104187012, "global_step": 33564, "epoch": 799} {"train_loss": -5.5084004402160645, "global_step": 33565, "epoch": 799} {"train_loss": -5.474942207336426, "global_step": 33566, "epoch": 799} {"train_loss": -5.482097148895264, "global_step": 33567, "epoch": 799} {"train_loss": -5.530154228210449, "global_step": 33568, "epoch": 799} {"train_loss": -5.602965354919434, "global_step": 33569, "epoch": 799} {"train_loss": -5.489473819732666, "global_step": 33570, "epoch": 799} {"train_loss": -5.548653602600098, "global_step": 33571, "epoch": 799} {"train_loss": -5.561463356018066, "global_step": 33572, "epoch": 799} {"train_loss": -5.463295936584473, "global_step": 33573, "epoch": 799} {"train_loss": -5.530275821685791, "global_step": 33574, "epoch": 799} {"train_loss": -5.583375453948975, "global_step": 33575, "epoch": 799} {"train_loss": -5.574058532714844, "global_step": 33576, "epoch": 799} {"train_loss": -5.545920372009277, "global_step": 33577, "epoch": 799} {"train_loss": -5.552706718444824, "global_step": 33578, "epoch": 799} {"train_loss": -5.528468132019043, "global_step": 33579, "epoch": 799} {"train_loss": -5.492408752441406, "global_step": 33580, "epoch": 799} {"train_loss": -5.684144020080566, "global_step": 33581, "epoch": 799} {"train_loss": -5.544127941131592, "global_step": 33582, "epoch": 799} {"train_loss": -5.536995887756348, "global_step": 33583, "epoch": 799} {"train_loss": -5.508886337280273, "global_step": 33584, "epoch": 799} {"train_loss": -5.581854820251465, "global_step": 33585, "epoch": 799} {"train_loss": -5.545880317687988, "global_step": 33586, "epoch": 799} {"train_loss": -5.4545111656188965, "global_step": 33587, "epoch": 799} {"train_loss": -5.531374931335449, "global_step": 33588, "epoch": 799} {"train_loss": -5.572731018066406, "global_step": 33589, "epoch": 799} {"train_loss": -5.673623085021973, "global_step": 33590, "epoch": 799} {"train_loss": -5.574113845825195, "global_step": 33591, "epoch": 799} {"train_loss": -5.574273109436035, "global_step": 33592, "epoch": 799} {"train_loss": -5.463080406188965, "global_step": 33593, "epoch": 799} {"train_loss": -5.464908123016357, "global_step": 33594, "epoch": 799} {"train_loss": -5.4682111740112305, "global_step": 33595, "epoch": 799} {"train_loss": -5.491631031036377, "global_step": 33596, "epoch": 799} {"train_loss": -5.466195106506348, "global_step": 33597, "epoch": 799} {"train_loss": -5.5305328369140625, "global_step": 33598, "epoch": 799} {"train_loss": -5.5344598179771785, "global_step": 33599, "epoch": 799, "val_loss": 62781.5234375} {"train_loss": -5.4587626457214355, "global_step": 33600, "epoch": 800} {"train_loss": -5.565308570861816, "global_step": 33601, "epoch": 800} {"train_loss": -5.536074161529541, "global_step": 33602, "epoch": 800} {"train_loss": -5.494533538818359, "global_step": 33603, "epoch": 800} {"train_loss": -5.479465484619141, "global_step": 33604, "epoch": 800} {"train_loss": -5.57256555557251, "global_step": 33605, "epoch": 800} {"train_loss": -5.536799907684326, "global_step": 33606, "epoch": 800} {"train_loss": -5.42353630065918, "global_step": 33607, "epoch": 800} {"train_loss": -5.535539627075195, "global_step": 33608, "epoch": 800} {"train_loss": -5.529335975646973, "global_step": 33609, "epoch": 800} {"train_loss": -5.585587501525879, "global_step": 33610, "epoch": 800} {"train_loss": -5.50470495223999, "global_step": 33611, "epoch": 800} {"train_loss": -5.664244651794434, "global_step": 33612, "epoch": 800} {"train_loss": -5.593972206115723, "global_step": 33613, "epoch": 800} {"train_loss": -5.585957050323486, "global_step": 33614, "epoch": 800} {"train_loss": -5.492697715759277, "global_step": 33615, "epoch": 800} {"train_loss": -5.509152412414551, "global_step": 33616, "epoch": 800} {"train_loss": -5.660302639007568, "global_step": 33617, "epoch": 800} {"train_loss": -5.417262077331543, "global_step": 33618, "epoch": 800} {"train_loss": -5.344342231750488, "global_step": 33619, "epoch": 800} {"train_loss": -5.562584400177002, "global_step": 33620, "epoch": 800} {"train_loss": -5.3105621337890625, "global_step": 33621, "epoch": 800} {"train_loss": -5.302278518676758, "global_step": 33622, "epoch": 800} {"train_loss": -5.605883598327637, "global_step": 33623, "epoch": 800} {"train_loss": -5.436308860778809, "global_step": 33624, "epoch": 800} {"train_loss": -5.549842834472656, "global_step": 33625, "epoch": 800} {"train_loss": -5.417412757873535, "global_step": 33626, "epoch": 800} {"train_loss": -5.454017639160156, "global_step": 33627, "epoch": 800} {"train_loss": -5.498281002044678, "global_step": 33628, "epoch": 800} {"train_loss": -5.4177751541137695, "global_step": 33629, "epoch": 800} {"train_loss": -5.452192306518555, "global_step": 33630, "epoch": 800} {"train_loss": -5.5402984619140625, "global_step": 33631, "epoch": 800} {"train_loss": -5.582768440246582, "global_step": 33632, "epoch": 800} {"train_loss": -5.596674919128418, "global_step": 33633, "epoch": 800} {"train_loss": -5.39405632019043, "global_step": 33634, "epoch": 800} {"train_loss": -5.525079727172852, "global_step": 33635, "epoch": 800} {"train_loss": -5.643983840942383, "global_step": 33636, "epoch": 800} {"train_loss": -5.490171909332275, "global_step": 33637, "epoch": 800} {"train_loss": -5.47957181930542, "global_step": 33638, "epoch": 800} {"train_loss": -5.657343864440918, "global_step": 33639, "epoch": 800} {"train_loss": -5.542417049407959, "global_step": 33640, "epoch": 800} {"train_loss": -5.511689821879069, "global_step": 33641, "epoch": 800, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.15876566240153964, "train/sim_max_reward_2": 0.8468098547160496, "train/sim_max_reward_3": 0.44419860215614676, "train/sim_max_reward_4": 0.5716892428689433, "train/sim_max_reward_5": 0.5554135647638916, "test/sim_max_reward_4300000": 0.6920836209670878, "test/sim_max_reward_4300001": 0.21297798392493852, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.488364411534757, "test/sim_max_reward_4300004": 0.1836873671187524, "test/sim_max_reward_4300005": 0.8135765077962267, "test/sim_max_reward_4300006": 0.15345251388302827, "test/sim_max_reward_4300007": 0.11108468494450646, "test/sim_max_reward_4300008": 0.24854348736638632, "test/sim_max_reward_4300009": 0.3963009479848965, "test/sim_max_reward_4300010": 0.0935457820905869, "test/sim_max_reward_4300011": 0.9497969293080769, "test/sim_max_reward_4300012": 0.4155566431995979, "test/sim_max_reward_4300013": 0.6909258296593697, "test/sim_max_reward_4300014": 0.9170090731445997, "test/sim_max_reward_4300015": 0.22434380981056135, "test/sim_max_reward_4300016": 0.48881699704158327, "test/sim_max_reward_4300017": 0.3949931435264752, "test/sim_max_reward_4300018": 0.5686911536651782, "test/sim_max_reward_4300019": 0.2673702402303409, "test/sim_max_reward_4300020": 0.14688705615174333, "test/sim_max_reward_4300021": 0.4830148230796257, "test/sim_max_reward_4300022": 0.18771616794897295, "test/sim_max_reward_4300023": 0.3984347314294953, "test/sim_max_reward_4300024": 0.051293508089026635, "test/sim_max_reward_4300025": 0.5628224323953439, "test/sim_max_reward_4300026": 0.24633989273506918, "test/sim_max_reward_4300027": 0.3227115042215418, "test/sim_max_reward_4300028": 0.8885300669684868, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.3341109314162276, "test/sim_max_reward_4300031": 0.48694165508679765, "test/sim_max_reward_4300032": 0.5670670603941244, "test/sim_max_reward_4300033": 0.39996836076483194, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.6535188820005793, "test/sim_max_reward_4300038": 0.0, "test/sim_max_reward_4300039": 0.0, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.20495070567680057, "test/sim_max_reward_4300042": 0.9268043409444181, "test/sim_max_reward_4300043": 0.19939451641555786, "test/sim_max_reward_4300044": 0.05181251721881018, "test/sim_max_reward_4300045": 0.41042987230149675, "test/sim_max_reward_4300046": 0.33914129435474094, "test/sim_max_reward_4300047": 0.3426615308056475, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.5430408487261817, "train/mean_score": 0.46119573725210383, "test/mean_score": 0.34863888616754374, "val_loss": 62700.07421875} {"train_loss": -5.535312652587891, "global_step": 33642, "epoch": 801} {"train_loss": -5.633387565612793, "global_step": 33643, "epoch": 801} {"train_loss": -5.58420991897583, "global_step": 33644, "epoch": 801} {"train_loss": -5.607118606567383, "global_step": 33645, "epoch": 801} {"train_loss": -5.604038238525391, "global_step": 33646, "epoch": 801} {"train_loss": -5.496456146240234, "global_step": 33647, "epoch": 801} {"train_loss": -5.581177711486816, "global_step": 33648, "epoch": 801} {"train_loss": -5.652981758117676, "global_step": 33649, "epoch": 801} {"train_loss": -5.6354899406433105, "global_step": 33650, "epoch": 801} {"train_loss": -5.641605854034424, "global_step": 33651, "epoch": 801} {"train_loss": -5.567101001739502, "global_step": 33652, "epoch": 801} {"train_loss": -5.485050201416016, "global_step": 33653, "epoch": 801} {"train_loss": -5.443760395050049, "global_step": 33654, "epoch": 801} {"train_loss": -5.571027755737305, "global_step": 33655, "epoch": 801} {"train_loss": -5.506430149078369, "global_step": 33656, "epoch": 801} {"train_loss": -5.619631767272949, "global_step": 33657, "epoch": 801} {"train_loss": -5.497331619262695, "global_step": 33658, "epoch": 801} {"train_loss": -5.635982513427734, "global_step": 33659, "epoch": 801} {"train_loss": -5.480797290802002, "global_step": 33660, "epoch": 801} {"train_loss": -5.649543762207031, "global_step": 33661, "epoch": 801} {"train_loss": -5.538183689117432, "global_step": 33662, "epoch": 801} {"train_loss": -5.669597148895264, "global_step": 33663, "epoch": 801} {"train_loss": -5.433085918426514, "global_step": 33664, "epoch": 801} {"train_loss": -5.554763317108154, "global_step": 33665, "epoch": 801} {"train_loss": -5.520195484161377, "global_step": 33666, "epoch": 801} {"train_loss": -5.464994430541992, "global_step": 33667, "epoch": 801} {"train_loss": -5.531786918640137, "global_step": 33668, "epoch": 801} {"train_loss": -5.586675643920898, "global_step": 33669, "epoch": 801} {"train_loss": -5.527285099029541, "global_step": 33670, "epoch": 801} {"train_loss": -5.6355485916137695, "global_step": 33671, "epoch": 801} {"train_loss": -5.56723690032959, "global_step": 33672, "epoch": 801} {"train_loss": -5.61970329284668, "global_step": 33673, "epoch": 801} {"train_loss": -5.511983871459961, "global_step": 33674, "epoch": 801} {"train_loss": -5.666610240936279, "global_step": 33675, "epoch": 801} {"train_loss": -5.509044647216797, "global_step": 33676, "epoch": 801} {"train_loss": -5.4355878829956055, "global_step": 33677, "epoch": 801} {"train_loss": -5.479485511779785, "global_step": 33678, "epoch": 801} {"train_loss": -5.509922027587891, "global_step": 33679, "epoch": 801} {"train_loss": -5.590751647949219, "global_step": 33680, "epoch": 801} {"train_loss": -5.491551399230957, "global_step": 33681, "epoch": 801} {"train_loss": -5.604304790496826, "global_step": 33682, "epoch": 801} {"train_loss": -5.557298353740147, "global_step": 33683, "epoch": 801, "val_loss": 62371.14453125} {"train_loss": -5.4938507080078125, "global_step": 33684, "epoch": 802} {"train_loss": -5.533492088317871, "global_step": 33685, "epoch": 802} {"train_loss": -5.614883899688721, "global_step": 33686, "epoch": 802} {"train_loss": -5.608572006225586, "global_step": 33687, "epoch": 802} {"train_loss": -5.455914497375488, "global_step": 33688, "epoch": 802} {"train_loss": -5.504240036010742, "global_step": 33689, "epoch": 802} {"train_loss": -5.633413314819336, "global_step": 33690, "epoch": 802} {"train_loss": -5.543373107910156, "global_step": 33691, "epoch": 802} {"train_loss": -5.643115043640137, "global_step": 33692, "epoch": 802} {"train_loss": -5.480199813842773, "global_step": 33693, "epoch": 802} {"train_loss": -5.469831466674805, "global_step": 33694, "epoch": 802} {"train_loss": -5.608713626861572, "global_step": 33695, "epoch": 802} {"train_loss": -5.571246147155762, "global_step": 33696, "epoch": 802} {"train_loss": -5.63235330581665, "global_step": 33697, "epoch": 802} {"train_loss": -5.515589714050293, "global_step": 33698, "epoch": 802} {"train_loss": -5.613173007965088, "global_step": 33699, "epoch": 802} {"train_loss": -5.533481597900391, "global_step": 33700, "epoch": 802} {"train_loss": -5.51240873336792, "global_step": 33701, "epoch": 802} {"train_loss": -5.576605796813965, "global_step": 33702, "epoch": 802} {"train_loss": -5.539942264556885, "global_step": 33703, "epoch": 802} {"train_loss": -5.623151779174805, "global_step": 33704, "epoch": 802} {"train_loss": -5.627104759216309, "global_step": 33705, "epoch": 802} {"train_loss": -5.502407073974609, "global_step": 33706, "epoch": 802} {"train_loss": -5.54535436630249, "global_step": 33707, "epoch": 802} {"train_loss": -5.550327777862549, "global_step": 33708, "epoch": 802} {"train_loss": -5.674197673797607, "global_step": 33709, "epoch": 802} {"train_loss": -5.491560935974121, "global_step": 33710, "epoch": 802} {"train_loss": -5.590310096740723, "global_step": 33711, "epoch": 802} {"train_loss": -5.445191383361816, "global_step": 33712, "epoch": 802} {"train_loss": -5.4422407150268555, "global_step": 33713, "epoch": 802} {"train_loss": -5.5024871826171875, "global_step": 33714, "epoch": 802} {"train_loss": -5.555424690246582, "global_step": 33715, "epoch": 802} {"train_loss": -5.556070327758789, "global_step": 33716, "epoch": 802} {"train_loss": -5.455174446105957, "global_step": 33717, "epoch": 802} {"train_loss": -5.350037574768066, "global_step": 33718, "epoch": 802} {"train_loss": -5.532846450805664, "global_step": 33719, "epoch": 802} {"train_loss": -5.442083358764648, "global_step": 33720, "epoch": 802} {"train_loss": -5.478673458099365, "global_step": 33721, "epoch": 802} {"train_loss": -5.558826923370361, "global_step": 33722, "epoch": 802} {"train_loss": -5.442541122436523, "global_step": 33723, "epoch": 802} {"train_loss": -5.459251403808594, "global_step": 33724, "epoch": 802} {"train_loss": -5.536820264089675, "global_step": 33725, "epoch": 802, "val_loss": 62691.58984375} {"train_loss": -5.53800106048584, "global_step": 33726, "epoch": 803} {"train_loss": -5.672493934631348, "global_step": 33727, "epoch": 803} {"train_loss": -5.49014949798584, "global_step": 33728, "epoch": 803} {"train_loss": -5.525611400604248, "global_step": 33729, "epoch": 803} {"train_loss": -5.478593349456787, "global_step": 33730, "epoch": 803} {"train_loss": -5.538673400878906, "global_step": 33731, "epoch": 803} {"train_loss": -5.625572681427002, "global_step": 33732, "epoch": 803} {"train_loss": -5.581219673156738, "global_step": 33733, "epoch": 803} {"train_loss": -5.488363265991211, "global_step": 33734, "epoch": 803} {"train_loss": -5.6475300788879395, "global_step": 33735, "epoch": 803} {"train_loss": -5.516430377960205, "global_step": 33736, "epoch": 803} {"train_loss": -5.560956001281738, "global_step": 33737, "epoch": 803} {"train_loss": -5.486810207366943, "global_step": 33738, "epoch": 803} {"train_loss": -5.535621643066406, "global_step": 33739, "epoch": 803} {"train_loss": -5.4240851402282715, "global_step": 33740, "epoch": 803} {"train_loss": -5.470956802368164, "global_step": 33741, "epoch": 803} {"train_loss": -5.594409465789795, "global_step": 33742, "epoch": 803} {"train_loss": -5.605652332305908, "global_step": 33743, "epoch": 803} {"train_loss": -5.538025379180908, "global_step": 33744, "epoch": 803} {"train_loss": -5.477383613586426, "global_step": 33745, "epoch": 803} {"train_loss": -5.542806148529053, "global_step": 33746, "epoch": 803} {"train_loss": -5.360940456390381, "global_step": 33747, "epoch": 803} {"train_loss": -5.593990325927734, "global_step": 33748, "epoch": 803} {"train_loss": -5.549400329589844, "global_step": 33749, "epoch": 803} {"train_loss": -5.5349578857421875, "global_step": 33750, "epoch": 803} {"train_loss": -5.571164131164551, "global_step": 33751, "epoch": 803} {"train_loss": -5.558688163757324, "global_step": 33752, "epoch": 803} {"train_loss": -5.400152206420898, "global_step": 33753, "epoch": 803} {"train_loss": -5.536565780639648, "global_step": 33754, "epoch": 803} {"train_loss": -5.539265155792236, "global_step": 33755, "epoch": 803} {"train_loss": -5.522563457489014, "global_step": 33756, "epoch": 803} {"train_loss": -5.496377468109131, "global_step": 33757, "epoch": 803} {"train_loss": -5.514345169067383, "global_step": 33758, "epoch": 803} {"train_loss": -5.647002220153809, "global_step": 33759, "epoch": 803} {"train_loss": -5.477441310882568, "global_step": 33760, "epoch": 803} {"train_loss": -5.518111228942871, "global_step": 33761, "epoch": 803} {"train_loss": -5.429109573364258, "global_step": 33762, "epoch": 803} {"train_loss": -5.581199645996094, "global_step": 33763, "epoch": 803} {"train_loss": -5.526104927062988, "global_step": 33764, "epoch": 803} {"train_loss": -5.54399299621582, "global_step": 33765, "epoch": 803} {"train_loss": -5.562380313873291, "global_step": 33766, "epoch": 803} {"train_loss": -5.530468259538923, "global_step": 33767, "epoch": 803, "val_loss": 62659.15625} {"train_loss": -5.590819358825684, "global_step": 33768, "epoch": 804} {"train_loss": -5.560650825500488, "global_step": 33769, "epoch": 804} {"train_loss": -5.670167922973633, "global_step": 33770, "epoch": 804} {"train_loss": -5.62220573425293, "global_step": 33771, "epoch": 804} {"train_loss": -5.592204570770264, "global_step": 33772, "epoch": 804} {"train_loss": -5.471480369567871, "global_step": 33773, "epoch": 804} {"train_loss": -5.627096176147461, "global_step": 33774, "epoch": 804} {"train_loss": -5.575567245483398, "global_step": 33775, "epoch": 804} {"train_loss": -5.50593900680542, "global_step": 33776, "epoch": 804} {"train_loss": -5.560479164123535, "global_step": 33777, "epoch": 804} {"train_loss": -5.474593162536621, "global_step": 33778, "epoch": 804} {"train_loss": -5.607355117797852, "global_step": 33779, "epoch": 804} {"train_loss": -5.555694580078125, "global_step": 33780, "epoch": 804} {"train_loss": -5.563180923461914, "global_step": 33781, "epoch": 804} {"train_loss": -5.5600666999816895, "global_step": 33782, "epoch": 804} {"train_loss": -5.592625141143799, "global_step": 33783, "epoch": 804} {"train_loss": -5.472461700439453, "global_step": 33784, "epoch": 804} {"train_loss": -5.594047546386719, "global_step": 33785, "epoch": 804} {"train_loss": -5.523617744445801, "global_step": 33786, "epoch": 804} {"train_loss": -5.5269975662231445, "global_step": 33787, "epoch": 804} {"train_loss": -5.601498603820801, "global_step": 33788, "epoch": 804} {"train_loss": -5.4384541511535645, "global_step": 33789, "epoch": 804} {"train_loss": -5.3864312171936035, "global_step": 33790, "epoch": 804} {"train_loss": -5.350444793701172, "global_step": 33791, "epoch": 804} {"train_loss": -5.515416145324707, "global_step": 33792, "epoch": 804} {"train_loss": -5.336191177368164, "global_step": 33793, "epoch": 804} {"train_loss": -5.5875244140625, "global_step": 33794, "epoch": 804} {"train_loss": -5.60585880279541, "global_step": 33795, "epoch": 804} {"train_loss": -5.516990661621094, "global_step": 33796, "epoch": 804} {"train_loss": -5.556136608123779, "global_step": 33797, "epoch": 804} {"train_loss": -5.4632487297058105, "global_step": 33798, "epoch": 804} {"train_loss": -5.61982536315918, "global_step": 33799, "epoch": 804} {"train_loss": -5.4792985916137695, "global_step": 33800, "epoch": 804} {"train_loss": -5.443302154541016, "global_step": 33801, "epoch": 804} {"train_loss": -5.650487899780273, "global_step": 33802, "epoch": 804} {"train_loss": -5.504957675933838, "global_step": 33803, "epoch": 804} {"train_loss": -5.568454742431641, "global_step": 33804, "epoch": 804} {"train_loss": -5.535335540771484, "global_step": 33805, "epoch": 804} {"train_loss": -5.4853010177612305, "global_step": 33806, "epoch": 804} {"train_loss": -5.609317779541016, "global_step": 33807, "epoch": 804} {"train_loss": -5.5731706619262695, "global_step": 33808, "epoch": 804} {"train_loss": -5.537830920446487, "global_step": 33809, "epoch": 804, "val_loss": 62670.08984375} {"train_loss": -5.557595252990723, "global_step": 33810, "epoch": 805} {"train_loss": -5.43595027923584, "global_step": 33811, "epoch": 805} {"train_loss": -5.577197074890137, "global_step": 33812, "epoch": 805} {"train_loss": -5.492151737213135, "global_step": 33813, "epoch": 805} {"train_loss": -5.422019958496094, "global_step": 33814, "epoch": 805} {"train_loss": -5.477818965911865, "global_step": 33815, "epoch": 805} {"train_loss": -5.556776523590088, "global_step": 33816, "epoch": 805} {"train_loss": -5.510631561279297, "global_step": 33817, "epoch": 805} {"train_loss": -5.5564727783203125, "global_step": 33818, "epoch": 805} {"train_loss": -5.634138107299805, "global_step": 33819, "epoch": 805} {"train_loss": -5.5475969314575195, "global_step": 33820, "epoch": 805} {"train_loss": -5.513042449951172, "global_step": 33821, "epoch": 805} {"train_loss": -5.662418365478516, "global_step": 33822, "epoch": 805} {"train_loss": -5.568211555480957, "global_step": 33823, "epoch": 805} {"train_loss": -5.571967601776123, "global_step": 33824, "epoch": 805} {"train_loss": -5.618350982666016, "global_step": 33825, "epoch": 805} {"train_loss": -5.545672416687012, "global_step": 33826, "epoch": 805} {"train_loss": -5.612392425537109, "global_step": 33827, "epoch": 805} {"train_loss": -5.462876319885254, "global_step": 33828, "epoch": 805} {"train_loss": -5.47304630279541, "global_step": 33829, "epoch": 805} {"train_loss": -5.5867204666137695, "global_step": 33830, "epoch": 805} {"train_loss": -5.526150226593018, "global_step": 33831, "epoch": 805} {"train_loss": -5.660954475402832, "global_step": 33832, "epoch": 805} {"train_loss": -5.47709846496582, "global_step": 33833, "epoch": 805} {"train_loss": -5.547325134277344, "global_step": 33834, "epoch": 805} {"train_loss": -5.4827680587768555, "global_step": 33835, "epoch": 805} {"train_loss": -5.509284973144531, "global_step": 33836, "epoch": 805} {"train_loss": -5.589799880981445, "global_step": 33837, "epoch": 805} {"train_loss": -5.554229736328125, "global_step": 33838, "epoch": 805} {"train_loss": -5.602436065673828, "global_step": 33839, "epoch": 805} {"train_loss": -5.544826030731201, "global_step": 33840, "epoch": 805} {"train_loss": -5.551865577697754, "global_step": 33841, "epoch": 805} {"train_loss": -5.515773296356201, "global_step": 33842, "epoch": 805} {"train_loss": -5.41326904296875, "global_step": 33843, "epoch": 805} {"train_loss": -5.5749359130859375, "global_step": 33844, "epoch": 805} {"train_loss": -5.555639266967773, "global_step": 33845, "epoch": 805} {"train_loss": -5.5111918449401855, "global_step": 33846, "epoch": 805} {"train_loss": -5.522007942199707, "global_step": 33847, "epoch": 805} {"train_loss": -5.526252269744873, "global_step": 33848, "epoch": 805} {"train_loss": -5.623084545135498, "global_step": 33849, "epoch": 805} {"train_loss": -5.68636417388916, "global_step": 33850, "epoch": 805} {"train_loss": -5.546086141041347, "global_step": 33851, "epoch": 805, "val_loss": 62465.203125} {"train_loss": -5.590538024902344, "global_step": 33852, "epoch": 806} {"train_loss": -5.713429927825928, "global_step": 33853, "epoch": 806} {"train_loss": -5.557249069213867, "global_step": 33854, "epoch": 806} {"train_loss": -5.408515930175781, "global_step": 33855, "epoch": 806} {"train_loss": -5.601992130279541, "global_step": 33856, "epoch": 806} {"train_loss": -5.407038688659668, "global_step": 33857, "epoch": 806} {"train_loss": -5.5508599281311035, "global_step": 33858, "epoch": 806} {"train_loss": -5.598175525665283, "global_step": 33859, "epoch": 806} {"train_loss": -5.596820831298828, "global_step": 33860, "epoch": 806} {"train_loss": -5.550368309020996, "global_step": 33861, "epoch": 806} {"train_loss": -5.4446001052856445, "global_step": 33862, "epoch": 806} {"train_loss": -5.608457565307617, "global_step": 33863, "epoch": 806} {"train_loss": -5.4784040451049805, "global_step": 33864, "epoch": 806} {"train_loss": -5.630431175231934, "global_step": 33865, "epoch": 806} {"train_loss": -5.495902061462402, "global_step": 33866, "epoch": 806} {"train_loss": -5.547991752624512, "global_step": 33867, "epoch": 806} {"train_loss": -5.5180511474609375, "global_step": 33868, "epoch": 806} {"train_loss": -5.541172027587891, "global_step": 33869, "epoch": 806} {"train_loss": -5.487072944641113, "global_step": 33870, "epoch": 806} {"train_loss": -5.58085823059082, "global_step": 33871, "epoch": 806} {"train_loss": -5.563247203826904, "global_step": 33872, "epoch": 806} {"train_loss": -5.560082912445068, "global_step": 33873, "epoch": 806} {"train_loss": -5.6150994300842285, "global_step": 33874, "epoch": 806} {"train_loss": -5.753152847290039, "global_step": 33875, "epoch": 806} {"train_loss": -5.522796630859375, "global_step": 33876, "epoch": 806} {"train_loss": -5.432631492614746, "global_step": 33877, "epoch": 806} {"train_loss": -5.616873741149902, "global_step": 33878, "epoch": 806} {"train_loss": -5.578619956970215, "global_step": 33879, "epoch": 806} {"train_loss": -5.541555881500244, "global_step": 33880, "epoch": 806} {"train_loss": -5.497034072875977, "global_step": 33881, "epoch": 806} {"train_loss": -5.628509044647217, "global_step": 33882, "epoch": 806} {"train_loss": -5.557685852050781, "global_step": 33883, "epoch": 806} {"train_loss": -5.575882911682129, "global_step": 33884, "epoch": 806} {"train_loss": -5.505427360534668, "global_step": 33885, "epoch": 806} {"train_loss": -5.612673282623291, "global_step": 33886, "epoch": 806} {"train_loss": -5.5364556312561035, "global_step": 33887, "epoch": 806} {"train_loss": -5.614645957946777, "global_step": 33888, "epoch": 806} {"train_loss": -5.573307991027832, "global_step": 33889, "epoch": 806} {"train_loss": -5.540716171264648, "global_step": 33890, "epoch": 806} {"train_loss": -5.530825138092041, "global_step": 33891, "epoch": 806} {"train_loss": -5.562991142272949, "global_step": 33892, "epoch": 806} {"train_loss": -5.554985818408785, "global_step": 33893, "epoch": 806, "val_loss": 62912.8671875} {"train_loss": -5.476445198059082, "global_step": 33894, "epoch": 807} {"train_loss": -5.556758880615234, "global_step": 33895, "epoch": 807} {"train_loss": -5.491791725158691, "global_step": 33896, "epoch": 807} {"train_loss": -5.458512306213379, "global_step": 33897, "epoch": 807} {"train_loss": -5.441102981567383, "global_step": 33898, "epoch": 807} {"train_loss": -5.480619430541992, "global_step": 33899, "epoch": 807} {"train_loss": -5.408822059631348, "global_step": 33900, "epoch": 807} {"train_loss": -5.517786026000977, "global_step": 33901, "epoch": 807} {"train_loss": -5.444510459899902, "global_step": 33902, "epoch": 807} {"train_loss": -5.481633186340332, "global_step": 33903, "epoch": 807} {"train_loss": -5.655300617218018, "global_step": 33904, "epoch": 807} {"train_loss": -5.422546863555908, "global_step": 33905, "epoch": 807} {"train_loss": -5.511136531829834, "global_step": 33906, "epoch": 807} {"train_loss": -5.595769882202148, "global_step": 33907, "epoch": 807} {"train_loss": -5.331157684326172, "global_step": 33908, "epoch": 807} {"train_loss": -5.457045078277588, "global_step": 33909, "epoch": 807} {"train_loss": -5.464595794677734, "global_step": 33910, "epoch": 807} {"train_loss": -5.4496660232543945, "global_step": 33911, "epoch": 807} {"train_loss": -5.4918437004089355, "global_step": 33912, "epoch": 807} {"train_loss": -5.468314170837402, "global_step": 33913, "epoch": 807} {"train_loss": -5.501007556915283, "global_step": 33914, "epoch": 807} {"train_loss": -5.414637565612793, "global_step": 33915, "epoch": 807} {"train_loss": -5.493807792663574, "global_step": 33916, "epoch": 807} {"train_loss": -5.598979949951172, "global_step": 33917, "epoch": 807} {"train_loss": -5.398606300354004, "global_step": 33918, "epoch": 807} {"train_loss": -5.572890281677246, "global_step": 33919, "epoch": 807} {"train_loss": -5.585995674133301, "global_step": 33920, "epoch": 807} {"train_loss": -5.59475040435791, "global_step": 33921, "epoch": 807} {"train_loss": -5.633189678192139, "global_step": 33922, "epoch": 807} {"train_loss": -5.560286521911621, "global_step": 33923, "epoch": 807} {"train_loss": -5.568493843078613, "global_step": 33924, "epoch": 807} {"train_loss": -5.515216827392578, "global_step": 33925, "epoch": 807} {"train_loss": -5.607724189758301, "global_step": 33926, "epoch": 807} {"train_loss": -5.577417373657227, "global_step": 33927, "epoch": 807} {"train_loss": -5.4807000160217285, "global_step": 33928, "epoch": 807} {"train_loss": -5.503806114196777, "global_step": 33929, "epoch": 807} {"train_loss": -5.6271257400512695, "global_step": 33930, "epoch": 807} {"train_loss": -5.534152984619141, "global_step": 33931, "epoch": 807} {"train_loss": -5.419417381286621, "global_step": 33932, "epoch": 807} {"train_loss": -5.612058639526367, "global_step": 33933, "epoch": 807} {"train_loss": -5.366336822509766, "global_step": 33934, "epoch": 807} {"train_loss": -5.505098569960821, "global_step": 33935, "epoch": 807, "val_loss": 62618.9375} {"train_loss": -5.5238752365112305, "global_step": 33936, "epoch": 808} {"train_loss": -5.527895927429199, "global_step": 33937, "epoch": 808} {"train_loss": -5.49822998046875, "global_step": 33938, "epoch": 808} {"train_loss": -5.521461486816406, "global_step": 33939, "epoch": 808} {"train_loss": -5.6763505935668945, "global_step": 33940, "epoch": 808} {"train_loss": -5.519073009490967, "global_step": 33941, "epoch": 808} {"train_loss": -5.513893127441406, "global_step": 33942, "epoch": 808} {"train_loss": -5.58762264251709, "global_step": 33943, "epoch": 808} {"train_loss": -5.47597599029541, "global_step": 33944, "epoch": 808} {"train_loss": -5.53276252746582, "global_step": 33945, "epoch": 808} {"train_loss": -5.452307224273682, "global_step": 33946, "epoch": 808} {"train_loss": -5.523621559143066, "global_step": 33947, "epoch": 808} {"train_loss": -5.49008846282959, "global_step": 33948, "epoch": 808} {"train_loss": -5.496352672576904, "global_step": 33949, "epoch": 808} {"train_loss": -5.539392471313477, "global_step": 33950, "epoch": 808} {"train_loss": -5.549039840698242, "global_step": 33951, "epoch": 808} {"train_loss": -5.404719352722168, "global_step": 33952, "epoch": 808} {"train_loss": -5.458703517913818, "global_step": 33953, "epoch": 808} {"train_loss": -5.531414031982422, "global_step": 33954, "epoch": 808} {"train_loss": -5.577883720397949, "global_step": 33955, "epoch": 808} {"train_loss": -5.529656410217285, "global_step": 33956, "epoch": 808} {"train_loss": -5.561326503753662, "global_step": 33957, "epoch": 808} {"train_loss": -5.400111198425293, "global_step": 33958, "epoch": 808} {"train_loss": -5.49311637878418, "global_step": 33959, "epoch": 808} {"train_loss": -5.505904674530029, "global_step": 33960, "epoch": 808} {"train_loss": -5.470893859863281, "global_step": 33961, "epoch": 808} {"train_loss": -5.4269561767578125, "global_step": 33962, "epoch": 808} {"train_loss": -5.4472856521606445, "global_step": 33963, "epoch": 808} {"train_loss": -5.577246189117432, "global_step": 33964, "epoch": 808} {"train_loss": -5.467241287231445, "global_step": 33965, "epoch": 808} {"train_loss": -5.551939010620117, "global_step": 33966, "epoch": 808} {"train_loss": -5.529938697814941, "global_step": 33967, "epoch": 808} {"train_loss": -5.3351335525512695, "global_step": 33968, "epoch": 808} {"train_loss": -5.497568130493164, "global_step": 33969, "epoch": 808} {"train_loss": -5.2735161781311035, "global_step": 33970, "epoch": 808} {"train_loss": -5.553470134735107, "global_step": 33971, "epoch": 808} {"train_loss": -5.462974548339844, "global_step": 33972, "epoch": 808} {"train_loss": -5.3711371421813965, "global_step": 33973, "epoch": 808} {"train_loss": -5.513072967529297, "global_step": 33974, "epoch": 808} {"train_loss": -5.5184760093688965, "global_step": 33975, "epoch": 808} {"train_loss": -5.484192371368408, "global_step": 33976, "epoch": 808} {"train_loss": -5.498955340612502, "global_step": 33977, "epoch": 808, "val_loss": 62729.41015625} {"train_loss": -5.46117639541626, "global_step": 33978, "epoch": 809} {"train_loss": -5.476423263549805, "global_step": 33979, "epoch": 809} {"train_loss": -5.392827987670898, "global_step": 33980, "epoch": 809} {"train_loss": -5.583197593688965, "global_step": 33981, "epoch": 809} {"train_loss": -5.526975631713867, "global_step": 33982, "epoch": 809} {"train_loss": -5.415189743041992, "global_step": 33983, "epoch": 809} {"train_loss": -5.481932163238525, "global_step": 33984, "epoch": 809} {"train_loss": -5.493697166442871, "global_step": 33985, "epoch": 809} {"train_loss": -5.542573928833008, "global_step": 33986, "epoch": 809} {"train_loss": -5.623928070068359, "global_step": 33987, "epoch": 809} {"train_loss": -5.560877799987793, "global_step": 33988, "epoch": 809} {"train_loss": -5.480968475341797, "global_step": 33989, "epoch": 809} {"train_loss": -5.582805633544922, "global_step": 33990, "epoch": 809} {"train_loss": -5.447218894958496, "global_step": 33991, "epoch": 809} {"train_loss": -5.516854286193848, "global_step": 33992, "epoch": 809} {"train_loss": -5.520960807800293, "global_step": 33993, "epoch": 809} {"train_loss": -5.628246307373047, "global_step": 33994, "epoch": 809} {"train_loss": -5.4925761222839355, "global_step": 33995, "epoch": 809} {"train_loss": -5.586637496948242, "global_step": 33996, "epoch": 809} {"train_loss": -5.466341018676758, "global_step": 33997, "epoch": 809} {"train_loss": -5.634096622467041, "global_step": 33998, "epoch": 809} {"train_loss": -5.569969177246094, "global_step": 33999, "epoch": 809} {"train_loss": -5.597438812255859, "global_step": 34000, "epoch": 809} {"train_loss": -5.641365051269531, "global_step": 34001, "epoch": 809} {"train_loss": -5.441376686096191, "global_step": 34002, "epoch": 809} {"train_loss": -5.607102394104004, "global_step": 34003, "epoch": 809} {"train_loss": -5.5972747802734375, "global_step": 34004, "epoch": 809} {"train_loss": -5.601459503173828, "global_step": 34005, "epoch": 809} {"train_loss": -5.612297058105469, "global_step": 34006, "epoch": 809} {"train_loss": -5.587614059448242, "global_step": 34007, "epoch": 809} {"train_loss": -5.684650421142578, "global_step": 34008, "epoch": 809} {"train_loss": -5.584680557250977, "global_step": 34009, "epoch": 809} {"train_loss": -5.432799339294434, "global_step": 34010, "epoch": 809} {"train_loss": -5.577957630157471, "global_step": 34011, "epoch": 809} {"train_loss": -5.517346382141113, "global_step": 34012, "epoch": 809} {"train_loss": -5.468427658081055, "global_step": 34013, "epoch": 809} {"train_loss": -5.431984901428223, "global_step": 34014, "epoch": 809} {"train_loss": -5.569550514221191, "global_step": 34015, "epoch": 809} {"train_loss": -5.638623237609863, "global_step": 34016, "epoch": 809} {"train_loss": -5.479930877685547, "global_step": 34017, "epoch": 809} {"train_loss": -5.577169418334961, "global_step": 34018, "epoch": 809} {"train_loss": -5.542971066066197, "global_step": 34019, "epoch": 809, "val_loss": 63044.390625} {"train_loss": -5.3908233642578125, "global_step": 34020, "epoch": 810} {"train_loss": -5.649911880493164, "global_step": 34021, "epoch": 810} {"train_loss": -5.460793495178223, "global_step": 34022, "epoch": 810} {"train_loss": -5.458272457122803, "global_step": 34023, "epoch": 810} {"train_loss": -5.543519020080566, "global_step": 34024, "epoch": 810} {"train_loss": -5.54831075668335, "global_step": 34025, "epoch": 810} {"train_loss": -5.429372787475586, "global_step": 34026, "epoch": 810} {"train_loss": -5.6447672843933105, "global_step": 34027, "epoch": 810} {"train_loss": -5.665739059448242, "global_step": 34028, "epoch": 810} {"train_loss": -5.644613265991211, "global_step": 34029, "epoch": 810} {"train_loss": -5.558022499084473, "global_step": 34030, "epoch": 810} {"train_loss": -5.543784141540527, "global_step": 34031, "epoch": 810} {"train_loss": -5.503905773162842, "global_step": 34032, "epoch": 810} {"train_loss": -5.457886695861816, "global_step": 34033, "epoch": 810} {"train_loss": -5.582450866699219, "global_step": 34034, "epoch": 810} {"train_loss": -5.684005260467529, "global_step": 34035, "epoch": 810} {"train_loss": -5.487034797668457, "global_step": 34036, "epoch": 810} {"train_loss": -5.6639404296875, "global_step": 34037, "epoch": 810} {"train_loss": -5.497910022735596, "global_step": 34038, "epoch": 810} {"train_loss": -5.484001636505127, "global_step": 34039, "epoch": 810} {"train_loss": -5.514029026031494, "global_step": 34040, "epoch": 810} {"train_loss": -5.716105937957764, "global_step": 34041, "epoch": 810} {"train_loss": -5.53999662399292, "global_step": 34042, "epoch": 810} {"train_loss": -5.604419708251953, "global_step": 34043, "epoch": 810} {"train_loss": -5.582942962646484, "global_step": 34044, "epoch": 810} {"train_loss": -5.5395121574401855, "global_step": 34045, "epoch": 810} {"train_loss": -5.414991855621338, "global_step": 34046, "epoch": 810} {"train_loss": -5.583791732788086, "global_step": 34047, "epoch": 810} {"train_loss": -5.4966254234313965, "global_step": 34048, "epoch": 810} {"train_loss": -5.546259880065918, "global_step": 34049, "epoch": 810} {"train_loss": -5.441429615020752, "global_step": 34050, "epoch": 810} {"train_loss": -5.52700138092041, "global_step": 34051, "epoch": 810} {"train_loss": -5.51154088973999, "global_step": 34052, "epoch": 810} {"train_loss": -5.604131698608398, "global_step": 34053, "epoch": 810} {"train_loss": -5.480339050292969, "global_step": 34054, "epoch": 810} {"train_loss": -5.6449174880981445, "global_step": 34055, "epoch": 810} {"train_loss": -5.533566474914551, "global_step": 34056, "epoch": 810} {"train_loss": -5.628398418426514, "global_step": 34057, "epoch": 810} {"train_loss": -5.4911627769470215, "global_step": 34058, "epoch": 810} {"train_loss": -5.519142150878906, "global_step": 34059, "epoch": 810} {"train_loss": -5.48801326751709, "global_step": 34060, "epoch": 810} {"train_loss": -5.548586096082415, "global_step": 34061, "epoch": 810, "val_loss": 62701.36328125} {"train_loss": -5.5151166915893555, "global_step": 34062, "epoch": 811} {"train_loss": -5.6025848388671875, "global_step": 34063, "epoch": 811} {"train_loss": -5.527745723724365, "global_step": 34064, "epoch": 811} {"train_loss": -5.643063545227051, "global_step": 34065, "epoch": 811} {"train_loss": -5.5223894119262695, "global_step": 34066, "epoch": 811} {"train_loss": -5.56053352355957, "global_step": 34067, "epoch": 811} {"train_loss": -5.508026123046875, "global_step": 34068, "epoch": 811} {"train_loss": -5.577510833740234, "global_step": 34069, "epoch": 811} {"train_loss": -5.573670387268066, "global_step": 34070, "epoch": 811} {"train_loss": -5.468570709228516, "global_step": 34071, "epoch": 811} {"train_loss": -5.7036848068237305, "global_step": 34072, "epoch": 811} {"train_loss": -5.579145908355713, "global_step": 34073, "epoch": 811} {"train_loss": -5.493773460388184, "global_step": 34074, "epoch": 811} {"train_loss": -5.600202560424805, "global_step": 34075, "epoch": 811} {"train_loss": -5.538928985595703, "global_step": 34076, "epoch": 811} {"train_loss": -5.599501132965088, "global_step": 34077, "epoch": 811} {"train_loss": -5.6188883781433105, "global_step": 34078, "epoch": 811} {"train_loss": -5.564268112182617, "global_step": 34079, "epoch": 811} {"train_loss": -5.5216474533081055, "global_step": 34080, "epoch": 811} {"train_loss": -5.573019027709961, "global_step": 34081, "epoch": 811} {"train_loss": -5.465083122253418, "global_step": 34082, "epoch": 811} {"train_loss": -5.59991979598999, "global_step": 34083, "epoch": 811} {"train_loss": -5.450693130493164, "global_step": 34084, "epoch": 811} {"train_loss": -5.45817756652832, "global_step": 34085, "epoch": 811} {"train_loss": -5.585561752319336, "global_step": 34086, "epoch": 811} {"train_loss": -5.610767364501953, "global_step": 34087, "epoch": 811} {"train_loss": -5.356689453125, "global_step": 34088, "epoch": 811} {"train_loss": -5.557925701141357, "global_step": 34089, "epoch": 811} {"train_loss": -5.5051069259643555, "global_step": 34090, "epoch": 811} {"train_loss": -5.532350540161133, "global_step": 34091, "epoch": 811} {"train_loss": -5.682077407836914, "global_step": 34092, "epoch": 811} {"train_loss": -5.468236923217773, "global_step": 34093, "epoch": 811} {"train_loss": -5.402019500732422, "global_step": 34094, "epoch": 811} {"train_loss": -5.582276344299316, "global_step": 34095, "epoch": 811} {"train_loss": -5.564223289489746, "global_step": 34096, "epoch": 811} {"train_loss": -5.487408638000488, "global_step": 34097, "epoch": 811} {"train_loss": -5.623841285705566, "global_step": 34098, "epoch": 811} {"train_loss": -5.560101509094238, "global_step": 34099, "epoch": 811} {"train_loss": -5.563950061798096, "global_step": 34100, "epoch": 811} {"train_loss": -5.598446369171143, "global_step": 34101, "epoch": 811} {"train_loss": -5.468172550201416, "global_step": 34102, "epoch": 811} {"train_loss": -5.547654049737113, "global_step": 34103, "epoch": 811, "val_loss": 62988.15234375} {"train_loss": -5.478076934814453, "global_step": 34104, "epoch": 812} {"train_loss": -5.550076961517334, "global_step": 34105, "epoch": 812} {"train_loss": -5.5442023277282715, "global_step": 34106, "epoch": 812} {"train_loss": -5.47205114364624, "global_step": 34107, "epoch": 812} {"train_loss": -5.64206600189209, "global_step": 34108, "epoch": 812} {"train_loss": -5.501246929168701, "global_step": 34109, "epoch": 812} {"train_loss": -5.46626091003418, "global_step": 34110, "epoch": 812} {"train_loss": -5.554781913757324, "global_step": 34111, "epoch": 812} {"train_loss": -5.657872676849365, "global_step": 34112, "epoch": 812} {"train_loss": -5.619201183319092, "global_step": 34113, "epoch": 812} {"train_loss": -5.532319068908691, "global_step": 34114, "epoch": 812} {"train_loss": -5.517531871795654, "global_step": 34115, "epoch": 812} {"train_loss": -5.480245590209961, "global_step": 34116, "epoch": 812} {"train_loss": -5.448916435241699, "global_step": 34117, "epoch": 812} {"train_loss": -5.417986869812012, "global_step": 34118, "epoch": 812} {"train_loss": -5.514804840087891, "global_step": 34119, "epoch": 812} {"train_loss": -5.4972028732299805, "global_step": 34120, "epoch": 812} {"train_loss": -5.392357349395752, "global_step": 34121, "epoch": 812} {"train_loss": -5.559981822967529, "global_step": 34122, "epoch": 812} {"train_loss": -5.394722938537598, "global_step": 34123, "epoch": 812} {"train_loss": -5.590938091278076, "global_step": 34124, "epoch": 812} {"train_loss": -5.374954700469971, "global_step": 34125, "epoch": 812} {"train_loss": -5.6385698318481445, "global_step": 34126, "epoch": 812} {"train_loss": -5.49245023727417, "global_step": 34127, "epoch": 812} {"train_loss": -5.531693458557129, "global_step": 34128, "epoch": 812} {"train_loss": -5.5438313484191895, "global_step": 34129, "epoch": 812} {"train_loss": -5.3592143058776855, "global_step": 34130, "epoch": 812} {"train_loss": -5.6438493728637695, "global_step": 34131, "epoch": 812} {"train_loss": -5.590959548950195, "global_step": 34132, "epoch": 812} {"train_loss": -5.657973289489746, "global_step": 34133, "epoch": 812} {"train_loss": -5.48409366607666, "global_step": 34134, "epoch": 812} {"train_loss": -5.522893905639648, "global_step": 34135, "epoch": 812} {"train_loss": -5.50958251953125, "global_step": 34136, "epoch": 812} {"train_loss": -5.56407356262207, "global_step": 34137, "epoch": 812} {"train_loss": -5.441187381744385, "global_step": 34138, "epoch": 812} {"train_loss": -5.505161762237549, "global_step": 34139, "epoch": 812} {"train_loss": -5.4217529296875, "global_step": 34140, "epoch": 812} {"train_loss": -5.442443370819092, "global_step": 34141, "epoch": 812} {"train_loss": -5.566583156585693, "global_step": 34142, "epoch": 812} {"train_loss": -5.34893798828125, "global_step": 34143, "epoch": 812} {"train_loss": -5.489350318908691, "global_step": 34144, "epoch": 812} {"train_loss": -5.510104133969262, "global_step": 34145, "epoch": 812, "val_loss": 63303.7265625} {"train_loss": -5.35325813293457, "global_step": 34146, "epoch": 813} {"train_loss": -5.588701248168945, "global_step": 34147, "epoch": 813} {"train_loss": -5.40794038772583, "global_step": 34148, "epoch": 813} {"train_loss": -5.587289810180664, "global_step": 34149, "epoch": 813} {"train_loss": -5.440227508544922, "global_step": 34150, "epoch": 813} {"train_loss": -5.477503299713135, "global_step": 34151, "epoch": 813} {"train_loss": -5.629499912261963, "global_step": 34152, "epoch": 813} {"train_loss": -5.413580417633057, "global_step": 34153, "epoch": 813} {"train_loss": -5.482962608337402, "global_step": 34154, "epoch": 813} {"train_loss": -5.545462608337402, "global_step": 34155, "epoch": 813} {"train_loss": -5.578341484069824, "global_step": 34156, "epoch": 813} {"train_loss": -5.558168411254883, "global_step": 34157, "epoch": 813} {"train_loss": -5.604482650756836, "global_step": 34158, "epoch": 813} {"train_loss": -5.643271446228027, "global_step": 34159, "epoch": 813} {"train_loss": -5.666838645935059, "global_step": 34160, "epoch": 813} {"train_loss": -5.527379512786865, "global_step": 34161, "epoch": 813} {"train_loss": -5.5054612159729, "global_step": 34162, "epoch": 813} {"train_loss": -5.539032936096191, "global_step": 34163, "epoch": 813} {"train_loss": -5.4960103034973145, "global_step": 34164, "epoch": 813} {"train_loss": -5.592259407043457, "global_step": 34165, "epoch": 813} {"train_loss": -5.562893867492676, "global_step": 34166, "epoch": 813} {"train_loss": -5.517210006713867, "global_step": 34167, "epoch": 813} {"train_loss": -5.470688819885254, "global_step": 34168, "epoch": 813} {"train_loss": -5.511043071746826, "global_step": 34169, "epoch": 813} {"train_loss": -5.5015974044799805, "global_step": 34170, "epoch": 813} {"train_loss": -5.660778999328613, "global_step": 34171, "epoch": 813} {"train_loss": -5.571608543395996, "global_step": 34172, "epoch": 813} {"train_loss": -5.44753360748291, "global_step": 34173, "epoch": 813} {"train_loss": -5.642397880554199, "global_step": 34174, "epoch": 813} {"train_loss": -5.461607933044434, "global_step": 34175, "epoch": 813} {"train_loss": -5.523889064788818, "global_step": 34176, "epoch": 813} {"train_loss": -5.558398246765137, "global_step": 34177, "epoch": 813} {"train_loss": -5.491184234619141, "global_step": 34178, "epoch": 813} {"train_loss": -5.524936676025391, "global_step": 34179, "epoch": 813} {"train_loss": -5.510134696960449, "global_step": 34180, "epoch": 813} {"train_loss": -5.58589506149292, "global_step": 34181, "epoch": 813} {"train_loss": -5.60495662689209, "global_step": 34182, "epoch": 813} {"train_loss": -5.63413143157959, "global_step": 34183, "epoch": 813} {"train_loss": -5.44766092300415, "global_step": 34184, "epoch": 813} {"train_loss": -5.592744827270508, "global_step": 34185, "epoch": 813} {"train_loss": -5.6195831298828125, "global_step": 34186, "epoch": 813} {"train_loss": -5.540902205875942, "global_step": 34187, "epoch": 813, "val_loss": 62743.44921875} {"train_loss": -5.479160308837891, "global_step": 34188, "epoch": 814} {"train_loss": -5.5271992683410645, "global_step": 34189, "epoch": 814} {"train_loss": -5.457529067993164, "global_step": 34190, "epoch": 814} {"train_loss": -5.30107307434082, "global_step": 34191, "epoch": 814} {"train_loss": -5.477912425994873, "global_step": 34192, "epoch": 814} {"train_loss": -5.413766384124756, "global_step": 34193, "epoch": 814} {"train_loss": -5.466930389404297, "global_step": 34194, "epoch": 814} {"train_loss": -5.716226577758789, "global_step": 34195, "epoch": 814} {"train_loss": -5.3727827072143555, "global_step": 34196, "epoch": 814} {"train_loss": -5.423254013061523, "global_step": 34197, "epoch": 814} {"train_loss": -5.625033378601074, "global_step": 34198, "epoch": 814} {"train_loss": -5.366158485412598, "global_step": 34199, "epoch": 814} {"train_loss": -5.570615291595459, "global_step": 34200, "epoch": 814} {"train_loss": -5.566854953765869, "global_step": 34201, "epoch": 814} {"train_loss": -5.587242603302002, "global_step": 34202, "epoch": 814} {"train_loss": -5.480670928955078, "global_step": 34203, "epoch": 814} {"train_loss": -5.509520530700684, "global_step": 34204, "epoch": 814} {"train_loss": -5.64372444152832, "global_step": 34205, "epoch": 814} {"train_loss": -5.557476997375488, "global_step": 34206, "epoch": 814} {"train_loss": -5.521042346954346, "global_step": 34207, "epoch": 814} {"train_loss": -5.428195953369141, "global_step": 34208, "epoch": 814} {"train_loss": -5.633112907409668, "global_step": 34209, "epoch": 814} {"train_loss": -5.463558197021484, "global_step": 34210, "epoch": 814} {"train_loss": -5.516972064971924, "global_step": 34211, "epoch": 814} {"train_loss": -5.70832633972168, "global_step": 34212, "epoch": 814} {"train_loss": -5.343791484832764, "global_step": 34213, "epoch": 814} {"train_loss": -5.566409587860107, "global_step": 34214, "epoch": 814} {"train_loss": -5.508415699005127, "global_step": 34215, "epoch": 814} {"train_loss": -5.582569122314453, "global_step": 34216, "epoch": 814} {"train_loss": -5.563910484313965, "global_step": 34217, "epoch": 814} {"train_loss": -5.496707439422607, "global_step": 34218, "epoch": 814} {"train_loss": -5.60236120223999, "global_step": 34219, "epoch": 814} {"train_loss": -5.410503387451172, "global_step": 34220, "epoch": 814} {"train_loss": -5.500619888305664, "global_step": 34221, "epoch": 814} {"train_loss": -5.474604606628418, "global_step": 34222, "epoch": 814} {"train_loss": -5.622941017150879, "global_step": 34223, "epoch": 814} {"train_loss": -5.574864387512207, "global_step": 34224, "epoch": 814} {"train_loss": -5.554450035095215, "global_step": 34225, "epoch": 814} {"train_loss": -5.531242847442627, "global_step": 34226, "epoch": 814} {"train_loss": -5.395995140075684, "global_step": 34227, "epoch": 814} {"train_loss": -5.57240104675293, "global_step": 34228, "epoch": 814} {"train_loss": -5.516961472375052, "global_step": 34229, "epoch": 814, "val_loss": 62823.79296875} {"train_loss": -5.50924015045166, "global_step": 34230, "epoch": 815} {"train_loss": -5.540175437927246, "global_step": 34231, "epoch": 815} {"train_loss": -5.527020454406738, "global_step": 34232, "epoch": 815} {"train_loss": -5.587532997131348, "global_step": 34233, "epoch": 815} {"train_loss": -5.635201454162598, "global_step": 34234, "epoch": 815} {"train_loss": -5.549481391906738, "global_step": 34235, "epoch": 815} {"train_loss": -5.452585697174072, "global_step": 34236, "epoch": 815} {"train_loss": -5.548252105712891, "global_step": 34237, "epoch": 815} {"train_loss": -5.51576042175293, "global_step": 34238, "epoch": 815} {"train_loss": -5.568174362182617, "global_step": 34239, "epoch": 815} {"train_loss": -5.536492347717285, "global_step": 34240, "epoch": 815} {"train_loss": -5.431330680847168, "global_step": 34241, "epoch": 815} {"train_loss": -5.515610694885254, "global_step": 34242, "epoch": 815} {"train_loss": -5.629596710205078, "global_step": 34243, "epoch": 815} {"train_loss": -5.5392069816589355, "global_step": 34244, "epoch": 815} {"train_loss": -5.416706085205078, "global_step": 34245, "epoch": 815} {"train_loss": -5.424843788146973, "global_step": 34246, "epoch": 815} {"train_loss": -5.442074298858643, "global_step": 34247, "epoch": 815} {"train_loss": -5.620141983032227, "global_step": 34248, "epoch": 815} {"train_loss": -5.605581283569336, "global_step": 34249, "epoch": 815} {"train_loss": -5.42473030090332, "global_step": 34250, "epoch": 815} {"train_loss": -5.44028377532959, "global_step": 34251, "epoch": 815} {"train_loss": -5.572781562805176, "global_step": 34252, "epoch": 815} {"train_loss": -5.478165626525879, "global_step": 34253, "epoch": 815} {"train_loss": -5.555595397949219, "global_step": 34254, "epoch": 815} {"train_loss": -5.610439777374268, "global_step": 34255, "epoch": 815} {"train_loss": -5.633363723754883, "global_step": 34256, "epoch": 815} {"train_loss": -5.7093305587768555, "global_step": 34257, "epoch": 815} {"train_loss": -5.493308067321777, "global_step": 34258, "epoch": 815} {"train_loss": -5.558680534362793, "global_step": 34259, "epoch": 815} {"train_loss": -5.547957420349121, "global_step": 34260, "epoch": 815} {"train_loss": -5.648061752319336, "global_step": 34261, "epoch": 815} {"train_loss": -5.570557117462158, "global_step": 34262, "epoch": 815} {"train_loss": -5.473855972290039, "global_step": 34263, "epoch": 815} {"train_loss": -5.599449157714844, "global_step": 34264, "epoch": 815} {"train_loss": -5.612992763519287, "global_step": 34265, "epoch": 815} {"train_loss": -5.646390438079834, "global_step": 34266, "epoch": 815} {"train_loss": -5.655041217803955, "global_step": 34267, "epoch": 815} {"train_loss": -5.565075874328613, "global_step": 34268, "epoch": 815} {"train_loss": -5.5598907470703125, "global_step": 34269, "epoch": 815} {"train_loss": -5.4704742431640625, "global_step": 34270, "epoch": 815} {"train_loss": -5.545438777832758, "global_step": 34271, "epoch": 815, "val_loss": 62088.09375} {"train_loss": -5.544733047485352, "global_step": 34272, "epoch": 816} {"train_loss": -5.643954277038574, "global_step": 34273, "epoch": 816} {"train_loss": -5.515947341918945, "global_step": 34274, "epoch": 816} {"train_loss": -5.566140174865723, "global_step": 34275, "epoch": 816} {"train_loss": -5.63284969329834, "global_step": 34276, "epoch": 816} {"train_loss": -5.555746555328369, "global_step": 34277, "epoch": 816} {"train_loss": -5.561911106109619, "global_step": 34278, "epoch": 816} {"train_loss": -5.568490028381348, "global_step": 34279, "epoch": 816} {"train_loss": -5.658172607421875, "global_step": 34280, "epoch": 816} {"train_loss": -5.61789608001709, "global_step": 34281, "epoch": 816} {"train_loss": -5.66218900680542, "global_step": 34282, "epoch": 816} {"train_loss": -5.618475914001465, "global_step": 34283, "epoch": 816} {"train_loss": -5.668429374694824, "global_step": 34284, "epoch": 816} {"train_loss": -5.545989036560059, "global_step": 34285, "epoch": 816} {"train_loss": -5.426434516906738, "global_step": 34286, "epoch": 816} {"train_loss": -5.562796592712402, "global_step": 34287, "epoch": 816} {"train_loss": -5.643601417541504, "global_step": 34288, "epoch": 816} {"train_loss": -5.511911869049072, "global_step": 34289, "epoch": 816} {"train_loss": -5.652816295623779, "global_step": 34290, "epoch": 816} {"train_loss": -5.529991626739502, "global_step": 34291, "epoch": 816} {"train_loss": -5.415629863739014, "global_step": 34292, "epoch": 816} {"train_loss": -5.504005432128906, "global_step": 34293, "epoch": 816} {"train_loss": -5.397442817687988, "global_step": 34294, "epoch": 816} {"train_loss": -5.570981025695801, "global_step": 34295, "epoch": 816} {"train_loss": -5.66286563873291, "global_step": 34296, "epoch": 816} {"train_loss": -5.518555641174316, "global_step": 34297, "epoch": 816} {"train_loss": -5.465716361999512, "global_step": 34298, "epoch": 816} {"train_loss": -5.478488922119141, "global_step": 34299, "epoch": 816} {"train_loss": -5.47763204574585, "global_step": 34300, "epoch": 816} {"train_loss": -5.545322418212891, "global_step": 34301, "epoch": 816} {"train_loss": -5.501091957092285, "global_step": 34302, "epoch": 816} {"train_loss": -5.676910877227783, "global_step": 34303, "epoch": 816} {"train_loss": -5.521122932434082, "global_step": 34304, "epoch": 816} {"train_loss": -5.593137741088867, "global_step": 34305, "epoch": 816} {"train_loss": -5.542742729187012, "global_step": 34306, "epoch": 816} {"train_loss": -5.580986976623535, "global_step": 34307, "epoch": 816} {"train_loss": -5.666258811950684, "global_step": 34308, "epoch": 816} {"train_loss": -5.5845136642456055, "global_step": 34309, "epoch": 816} {"train_loss": -5.551522254943848, "global_step": 34310, "epoch": 816} {"train_loss": -5.560858249664307, "global_step": 34311, "epoch": 816} {"train_loss": -5.653202056884766, "global_step": 34312, "epoch": 816} {"train_loss": -5.563910665966215, "global_step": 34313, "epoch": 816, "val_loss": 62566.3828125} {"train_loss": -5.605555057525635, "global_step": 34314, "epoch": 817} {"train_loss": -5.576966285705566, "global_step": 34315, "epoch": 817} {"train_loss": -5.622331619262695, "global_step": 34316, "epoch": 817} {"train_loss": -5.691261291503906, "global_step": 34317, "epoch": 817} {"train_loss": -5.568894386291504, "global_step": 34318, "epoch": 817} {"train_loss": -5.654205799102783, "global_step": 34319, "epoch": 817} {"train_loss": -5.467055797576904, "global_step": 34320, "epoch": 817} {"train_loss": -5.571207523345947, "global_step": 34321, "epoch": 817} {"train_loss": -5.388694763183594, "global_step": 34322, "epoch": 817} {"train_loss": -5.513161659240723, "global_step": 34323, "epoch": 817} {"train_loss": -5.4795684814453125, "global_step": 34324, "epoch": 817} {"train_loss": -5.470602035522461, "global_step": 34325, "epoch": 817} {"train_loss": -5.4905924797058105, "global_step": 34326, "epoch": 817} {"train_loss": -5.458745002746582, "global_step": 34327, "epoch": 817} {"train_loss": -5.605369567871094, "global_step": 34328, "epoch": 817} {"train_loss": -5.447729110717773, "global_step": 34329, "epoch": 817} {"train_loss": -5.617247581481934, "global_step": 34330, "epoch": 817} {"train_loss": -5.564745903015137, "global_step": 34331, "epoch": 817} {"train_loss": -5.428259372711182, "global_step": 34332, "epoch": 817} {"train_loss": -5.490508079528809, "global_step": 34333, "epoch": 817} {"train_loss": -5.429769515991211, "global_step": 34334, "epoch": 817} {"train_loss": -5.491999626159668, "global_step": 34335, "epoch": 817} {"train_loss": -5.5680694580078125, "global_step": 34336, "epoch": 817} {"train_loss": -5.529151439666748, "global_step": 34337, "epoch": 817} {"train_loss": -5.51518440246582, "global_step": 34338, "epoch": 817} {"train_loss": -5.414130210876465, "global_step": 34339, "epoch": 817} {"train_loss": -5.5598273277282715, "global_step": 34340, "epoch": 817} {"train_loss": -5.559774875640869, "global_step": 34341, "epoch": 817} {"train_loss": -5.477026462554932, "global_step": 34342, "epoch": 817} {"train_loss": -5.537630558013916, "global_step": 34343, "epoch": 817} {"train_loss": -5.621843338012695, "global_step": 34344, "epoch": 817} {"train_loss": -5.4754767417907715, "global_step": 34345, "epoch": 817} {"train_loss": -5.61276912689209, "global_step": 34346, "epoch": 817} {"train_loss": -5.471498489379883, "global_step": 34347, "epoch": 817} {"train_loss": -5.551074504852295, "global_step": 34348, "epoch": 817} {"train_loss": -5.525615215301514, "global_step": 34349, "epoch": 817} {"train_loss": -5.594969749450684, "global_step": 34350, "epoch": 817} {"train_loss": -5.4781036376953125, "global_step": 34351, "epoch": 817} {"train_loss": -5.537384510040283, "global_step": 34352, "epoch": 817} {"train_loss": -5.506988525390625, "global_step": 34353, "epoch": 817} {"train_loss": -5.513664722442627, "global_step": 34354, "epoch": 817} {"train_loss": -5.527472257614136, "global_step": 34355, "epoch": 817, "val_loss": 62678.3203125} {"train_loss": -5.417146682739258, "global_step": 34356, "epoch": 818} {"train_loss": -5.6263813972473145, "global_step": 34357, "epoch": 818} {"train_loss": -5.412385940551758, "global_step": 34358, "epoch": 818} {"train_loss": -5.524874210357666, "global_step": 34359, "epoch": 818} {"train_loss": -5.591956615447998, "global_step": 34360, "epoch": 818} {"train_loss": -5.50100564956665, "global_step": 34361, "epoch": 818} {"train_loss": -5.447995185852051, "global_step": 34362, "epoch": 818} {"train_loss": -5.47629451751709, "global_step": 34363, "epoch": 818} {"train_loss": -5.484356880187988, "global_step": 34364, "epoch": 818} {"train_loss": -5.503904342651367, "global_step": 34365, "epoch": 818} {"train_loss": -5.558903694152832, "global_step": 34366, "epoch": 818} {"train_loss": -5.6098222732543945, "global_step": 34367, "epoch": 818} {"train_loss": -5.534157752990723, "global_step": 34368, "epoch": 818} {"train_loss": -5.486786842346191, "global_step": 34369, "epoch": 818} {"train_loss": -5.623256683349609, "global_step": 34370, "epoch": 818} {"train_loss": -5.59052848815918, "global_step": 34371, "epoch": 818} {"train_loss": -5.557517051696777, "global_step": 34372, "epoch": 818} {"train_loss": -5.553194522857666, "global_step": 34373, "epoch": 818} {"train_loss": -5.410295486450195, "global_step": 34374, "epoch": 818} {"train_loss": -5.63194465637207, "global_step": 34375, "epoch": 818} {"train_loss": -5.463290214538574, "global_step": 34376, "epoch": 818} {"train_loss": -5.512567520141602, "global_step": 34377, "epoch": 818} {"train_loss": -5.528937339782715, "global_step": 34378, "epoch": 818} {"train_loss": -5.50870943069458, "global_step": 34379, "epoch": 818} {"train_loss": -5.451767921447754, "global_step": 34380, "epoch": 818} {"train_loss": -5.585444450378418, "global_step": 34381, "epoch": 818} {"train_loss": -5.454051971435547, "global_step": 34382, "epoch": 818} {"train_loss": -5.669240951538086, "global_step": 34383, "epoch": 818} {"train_loss": -5.5237274169921875, "global_step": 34384, "epoch": 818} {"train_loss": -5.669615268707275, "global_step": 34385, "epoch": 818} {"train_loss": -5.556914806365967, "global_step": 34386, "epoch": 818} {"train_loss": -5.523364067077637, "global_step": 34387, "epoch": 818} {"train_loss": -5.518968105316162, "global_step": 34388, "epoch": 818} {"train_loss": -5.439146995544434, "global_step": 34389, "epoch": 818} {"train_loss": -5.563523292541504, "global_step": 34390, "epoch": 818} {"train_loss": -5.418817520141602, "global_step": 34391, "epoch": 818} {"train_loss": -5.556602954864502, "global_step": 34392, "epoch": 818} {"train_loss": -5.5353922843933105, "global_step": 34393, "epoch": 818} {"train_loss": -5.536183834075928, "global_step": 34394, "epoch": 818} {"train_loss": -5.670895099639893, "global_step": 34395, "epoch": 818} {"train_loss": -5.526837348937988, "global_step": 34396, "epoch": 818} {"train_loss": -5.529352721713838, "global_step": 34397, "epoch": 818, "val_loss": 62431.0859375} {"train_loss": -5.421056747436523, "global_step": 34398, "epoch": 819} {"train_loss": -5.60067892074585, "global_step": 34399, "epoch": 819} {"train_loss": -5.5734453201293945, "global_step": 34400, "epoch": 819} {"train_loss": -5.542409896850586, "global_step": 34401, "epoch": 819} {"train_loss": -5.713905334472656, "global_step": 34402, "epoch": 819} {"train_loss": -5.586235523223877, "global_step": 34403, "epoch": 819} {"train_loss": -5.525273323059082, "global_step": 34404, "epoch": 819} {"train_loss": -5.718565940856934, "global_step": 34405, "epoch": 819} {"train_loss": -5.6417436599731445, "global_step": 34406, "epoch": 819} {"train_loss": -5.41886043548584, "global_step": 34407, "epoch": 819} {"train_loss": -5.5740461349487305, "global_step": 34408, "epoch": 819} {"train_loss": -5.553605079650879, "global_step": 34409, "epoch": 819} {"train_loss": -5.560098648071289, "global_step": 34410, "epoch": 819} {"train_loss": -5.640647888183594, "global_step": 34411, "epoch": 819} {"train_loss": -5.6657633781433105, "global_step": 34412, "epoch": 819} {"train_loss": -5.537910461425781, "global_step": 34413, "epoch": 819} {"train_loss": -5.668684959411621, "global_step": 34414, "epoch": 819} {"train_loss": -5.566008567810059, "global_step": 34415, "epoch": 819} {"train_loss": -5.590083122253418, "global_step": 34416, "epoch": 819} {"train_loss": -5.639060020446777, "global_step": 34417, "epoch": 819} {"train_loss": -5.677618026733398, "global_step": 34418, "epoch": 819} {"train_loss": -5.521818161010742, "global_step": 34419, "epoch": 819} {"train_loss": -5.60776948928833, "global_step": 34420, "epoch": 819} {"train_loss": -5.498393535614014, "global_step": 34421, "epoch": 819} {"train_loss": -5.470869064331055, "global_step": 34422, "epoch": 819} {"train_loss": -5.540290832519531, "global_step": 34423, "epoch": 819} {"train_loss": -5.628435134887695, "global_step": 34424, "epoch": 819} {"train_loss": -5.514785289764404, "global_step": 34425, "epoch": 819} {"train_loss": -5.684232711791992, "global_step": 34426, "epoch": 819} {"train_loss": -5.4386701583862305, "global_step": 34427, "epoch": 819} {"train_loss": -5.586330413818359, "global_step": 34428, "epoch": 819} {"train_loss": -5.441163063049316, "global_step": 34429, "epoch": 819} {"train_loss": -5.518777847290039, "global_step": 34430, "epoch": 819} {"train_loss": -5.671032428741455, "global_step": 34431, "epoch": 819} {"train_loss": -5.49307918548584, "global_step": 34432, "epoch": 819} {"train_loss": -5.4436798095703125, "global_step": 34433, "epoch": 819} {"train_loss": -5.465288162231445, "global_step": 34434, "epoch": 819} {"train_loss": -5.515595436096191, "global_step": 34435, "epoch": 819} {"train_loss": -5.635861396789551, "global_step": 34436, "epoch": 819} {"train_loss": -5.391582489013672, "global_step": 34437, "epoch": 819} {"train_loss": -5.569314956665039, "global_step": 34438, "epoch": 819} {"train_loss": -5.564321972074962, "global_step": 34439, "epoch": 819, "val_loss": 62442.61328125} {"train_loss": -5.656289100646973, "global_step": 34440, "epoch": 820} {"train_loss": -5.593891143798828, "global_step": 34441, "epoch": 820} {"train_loss": -5.451905727386475, "global_step": 34442, "epoch": 820} {"train_loss": -5.511007785797119, "global_step": 34443, "epoch": 820} {"train_loss": -5.491861343383789, "global_step": 34444, "epoch": 820} {"train_loss": -5.551791191101074, "global_step": 34445, "epoch": 820} {"train_loss": -5.5836992263793945, "global_step": 34446, "epoch": 820} {"train_loss": -5.595468997955322, "global_step": 34447, "epoch": 820} {"train_loss": -5.454780578613281, "global_step": 34448, "epoch": 820} {"train_loss": -5.603981018066406, "global_step": 34449, "epoch": 820} {"train_loss": -5.52736759185791, "global_step": 34450, "epoch": 820} {"train_loss": -5.535392761230469, "global_step": 34451, "epoch": 820} {"train_loss": -5.474522113800049, "global_step": 34452, "epoch": 820} {"train_loss": -5.484556198120117, "global_step": 34453, "epoch": 820} {"train_loss": -5.59565544128418, "global_step": 34454, "epoch": 820} {"train_loss": -5.540804862976074, "global_step": 34455, "epoch": 820} {"train_loss": -5.554944038391113, "global_step": 34456, "epoch": 820} {"train_loss": -5.705331802368164, "global_step": 34457, "epoch": 820} {"train_loss": -5.572293281555176, "global_step": 34458, "epoch": 820} {"train_loss": -5.518517017364502, "global_step": 34459, "epoch": 820} {"train_loss": -5.448747634887695, "global_step": 34460, "epoch": 820} {"train_loss": -5.528277397155762, "global_step": 34461, "epoch": 820} {"train_loss": -5.5721282958984375, "global_step": 34462, "epoch": 820} {"train_loss": -5.599487781524658, "global_step": 34463, "epoch": 820} {"train_loss": -5.602007865905762, "global_step": 34464, "epoch": 820} {"train_loss": -5.6736650466918945, "global_step": 34465, "epoch": 820} {"train_loss": -5.5781965255737305, "global_step": 34466, "epoch": 820} {"train_loss": -5.585906028747559, "global_step": 34467, "epoch": 820} {"train_loss": -5.641904830932617, "global_step": 34468, "epoch": 820} {"train_loss": -5.576696395874023, "global_step": 34469, "epoch": 820} {"train_loss": -5.65079402923584, "global_step": 34470, "epoch": 820} {"train_loss": -5.559455871582031, "global_step": 34471, "epoch": 820} {"train_loss": -5.609047889709473, "global_step": 34472, "epoch": 820} {"train_loss": -5.699939727783203, "global_step": 34473, "epoch": 820} {"train_loss": -5.593091011047363, "global_step": 34474, "epoch": 820} {"train_loss": -5.5836567878723145, "global_step": 34475, "epoch": 820} {"train_loss": -5.708324909210205, "global_step": 34476, "epoch": 820} {"train_loss": -5.575791358947754, "global_step": 34477, "epoch": 820} {"train_loss": -5.478165626525879, "global_step": 34478, "epoch": 820} {"train_loss": -5.373276710510254, "global_step": 34479, "epoch": 820} {"train_loss": -5.5067949295043945, "global_step": 34480, "epoch": 820} {"train_loss": -5.5645003999982565, "global_step": 34481, "epoch": 820, "val_loss": 62248.06640625} {"train_loss": -5.53285026550293, "global_step": 34482, "epoch": 821} {"train_loss": -5.569420337677002, "global_step": 34483, "epoch": 821} {"train_loss": -5.557615756988525, "global_step": 34484, "epoch": 821} {"train_loss": -5.588641166687012, "global_step": 34485, "epoch": 821} {"train_loss": -5.508405685424805, "global_step": 34486, "epoch": 821} {"train_loss": -5.428336143493652, "global_step": 34487, "epoch": 821} {"train_loss": -5.589897155761719, "global_step": 34488, "epoch": 821} {"train_loss": -5.6357221603393555, "global_step": 34489, "epoch": 821} {"train_loss": -5.613607406616211, "global_step": 34490, "epoch": 821} {"train_loss": -5.424517631530762, "global_step": 34491, "epoch": 821} {"train_loss": -5.623478889465332, "global_step": 34492, "epoch": 821} {"train_loss": -5.430447101593018, "global_step": 34493, "epoch": 821} {"train_loss": -5.580883026123047, "global_step": 34494, "epoch": 821} {"train_loss": -5.626165390014648, "global_step": 34495, "epoch": 821} {"train_loss": -5.527252197265625, "global_step": 34496, "epoch": 821} {"train_loss": -5.442081451416016, "global_step": 34497, "epoch": 821} {"train_loss": -5.557308673858643, "global_step": 34498, "epoch": 821} {"train_loss": -5.587767601013184, "global_step": 34499, "epoch": 821} {"train_loss": -5.55381965637207, "global_step": 34500, "epoch": 821} {"train_loss": -5.606056213378906, "global_step": 34501, "epoch": 821} {"train_loss": -5.473238468170166, "global_step": 34502, "epoch": 821} {"train_loss": -5.595521926879883, "global_step": 34503, "epoch": 821} {"train_loss": -5.605802536010742, "global_step": 34504, "epoch": 821} {"train_loss": -5.58858585357666, "global_step": 34505, "epoch": 821} {"train_loss": -5.55178689956665, "global_step": 34506, "epoch": 821} {"train_loss": -5.476288795471191, "global_step": 34507, "epoch": 821} {"train_loss": -5.5698652267456055, "global_step": 34508, "epoch": 821} {"train_loss": -5.492923736572266, "global_step": 34509, "epoch": 821} {"train_loss": -5.503560543060303, "global_step": 34510, "epoch": 821} {"train_loss": -5.606071472167969, "global_step": 34511, "epoch": 821} {"train_loss": -5.694544792175293, "global_step": 34512, "epoch": 821} {"train_loss": -5.633033752441406, "global_step": 34513, "epoch": 821} {"train_loss": -5.60725212097168, "global_step": 34514, "epoch": 821} {"train_loss": -5.568624973297119, "global_step": 34515, "epoch": 821} {"train_loss": -5.543959617614746, "global_step": 34516, "epoch": 821} {"train_loss": -5.543450832366943, "global_step": 34517, "epoch": 821} {"train_loss": -5.625818252563477, "global_step": 34518, "epoch": 821} {"train_loss": -5.692228317260742, "global_step": 34519, "epoch": 821} {"train_loss": -5.645964622497559, "global_step": 34520, "epoch": 821} {"train_loss": -5.427957534790039, "global_step": 34521, "epoch": 821} {"train_loss": -5.61135196685791, "global_step": 34522, "epoch": 821} {"train_loss": -5.561934266771589, "global_step": 34523, "epoch": 821, "val_loss": 62344.5} {"train_loss": -5.522505760192871, "global_step": 34524, "epoch": 822} {"train_loss": -5.528934478759766, "global_step": 34525, "epoch": 822} {"train_loss": -5.576019287109375, "global_step": 34526, "epoch": 822} {"train_loss": -5.6525139808654785, "global_step": 34527, "epoch": 822} {"train_loss": -5.518412113189697, "global_step": 34528, "epoch": 822} {"train_loss": -5.674061298370361, "global_step": 34529, "epoch": 822} {"train_loss": -5.6243181228637695, "global_step": 34530, "epoch": 822} {"train_loss": -5.520532131195068, "global_step": 34531, "epoch": 822} {"train_loss": -5.644542217254639, "global_step": 34532, "epoch": 822} {"train_loss": -5.555733680725098, "global_step": 34533, "epoch": 822} {"train_loss": -5.53884220123291, "global_step": 34534, "epoch": 822} {"train_loss": -5.669432163238525, "global_step": 34535, "epoch": 822} {"train_loss": -5.644175052642822, "global_step": 34536, "epoch": 822} {"train_loss": -5.473204612731934, "global_step": 34537, "epoch": 822} {"train_loss": -5.554131507873535, "global_step": 34538, "epoch": 822} {"train_loss": -5.550824165344238, "global_step": 34539, "epoch": 822} {"train_loss": -5.500093460083008, "global_step": 34540, "epoch": 822} {"train_loss": -5.6138916015625, "global_step": 34541, "epoch": 822} {"train_loss": -5.607040882110596, "global_step": 34542, "epoch": 822} {"train_loss": -5.529115676879883, "global_step": 34543, "epoch": 822} {"train_loss": -5.568628311157227, "global_step": 34544, "epoch": 822} {"train_loss": -5.493060111999512, "global_step": 34545, "epoch": 822} {"train_loss": -5.655731201171875, "global_step": 34546, "epoch": 822} {"train_loss": -5.651089668273926, "global_step": 34547, "epoch": 822} {"train_loss": -5.594840049743652, "global_step": 34548, "epoch": 822} {"train_loss": -5.40286922454834, "global_step": 34549, "epoch": 822} {"train_loss": -5.539661407470703, "global_step": 34550, "epoch": 822} {"train_loss": -5.481729507446289, "global_step": 34551, "epoch": 822} {"train_loss": -5.560458660125732, "global_step": 34552, "epoch": 822} {"train_loss": -5.512406349182129, "global_step": 34553, "epoch": 822} {"train_loss": -5.561744689941406, "global_step": 34554, "epoch": 822} {"train_loss": -5.600646495819092, "global_step": 34555, "epoch": 822} {"train_loss": -5.543321132659912, "global_step": 34556, "epoch": 822} {"train_loss": -5.584869384765625, "global_step": 34557, "epoch": 822} {"train_loss": -5.564906597137451, "global_step": 34558, "epoch": 822} {"train_loss": -5.482956886291504, "global_step": 34559, "epoch": 822} {"train_loss": -5.585849761962891, "global_step": 34560, "epoch": 822} {"train_loss": -5.448304176330566, "global_step": 34561, "epoch": 822} {"train_loss": -5.669221878051758, "global_step": 34562, "epoch": 822} {"train_loss": -5.601741790771484, "global_step": 34563, "epoch": 822} {"train_loss": -5.5933942794799805, "global_step": 34564, "epoch": 822} {"train_loss": -5.567741780054002, "global_step": 34565, "epoch": 822, "val_loss": 62588.37109375} {"train_loss": -5.489785194396973, "global_step": 34566, "epoch": 823} {"train_loss": -5.633916854858398, "global_step": 34567, "epoch": 823} {"train_loss": -5.5723114013671875, "global_step": 34568, "epoch": 823} {"train_loss": -5.444097518920898, "global_step": 34569, "epoch": 823} {"train_loss": -5.518515586853027, "global_step": 34570, "epoch": 823} {"train_loss": -5.5687336921691895, "global_step": 34571, "epoch": 823} {"train_loss": -5.578857421875, "global_step": 34572, "epoch": 823} {"train_loss": -5.668792724609375, "global_step": 34573, "epoch": 823} {"train_loss": -5.518835067749023, "global_step": 34574, "epoch": 823} {"train_loss": -5.7039666175842285, "global_step": 34575, "epoch": 823} {"train_loss": -5.72159481048584, "global_step": 34576, "epoch": 823} {"train_loss": -5.493605613708496, "global_step": 34577, "epoch": 823} {"train_loss": -5.51537561416626, "global_step": 34578, "epoch": 823} {"train_loss": -5.591722011566162, "global_step": 34579, "epoch": 823} {"train_loss": -5.466573715209961, "global_step": 34580, "epoch": 823} {"train_loss": -5.404699325561523, "global_step": 34581, "epoch": 823} {"train_loss": -5.577214241027832, "global_step": 34582, "epoch": 823} {"train_loss": -5.444311618804932, "global_step": 34583, "epoch": 823} {"train_loss": -5.563838958740234, "global_step": 34584, "epoch": 823} {"train_loss": -5.531546115875244, "global_step": 34585, "epoch": 823} {"train_loss": -5.530617713928223, "global_step": 34586, "epoch": 823} {"train_loss": -5.676538467407227, "global_step": 34587, "epoch": 823} {"train_loss": -5.581840515136719, "global_step": 34588, "epoch": 823} {"train_loss": -5.608649253845215, "global_step": 34589, "epoch": 823} {"train_loss": -5.613245010375977, "global_step": 34590, "epoch": 823} {"train_loss": -5.679579734802246, "global_step": 34591, "epoch": 823} {"train_loss": -5.582245349884033, "global_step": 34592, "epoch": 823} {"train_loss": -5.58453369140625, "global_step": 34593, "epoch": 823} {"train_loss": -5.502150058746338, "global_step": 34594, "epoch": 823} {"train_loss": -5.57581901550293, "global_step": 34595, "epoch": 823} {"train_loss": -5.72838020324707, "global_step": 34596, "epoch": 823} {"train_loss": -5.647405624389648, "global_step": 34597, "epoch": 823} {"train_loss": -5.469222068786621, "global_step": 34598, "epoch": 823} {"train_loss": -5.546814441680908, "global_step": 34599, "epoch": 823} {"train_loss": -5.669402122497559, "global_step": 34600, "epoch": 823} {"train_loss": -5.473248481750488, "global_step": 34601, "epoch": 823} {"train_loss": -5.4990315437316895, "global_step": 34602, "epoch": 823} {"train_loss": -5.599727630615234, "global_step": 34603, "epoch": 823} {"train_loss": -5.658997058868408, "global_step": 34604, "epoch": 823} {"train_loss": -5.553468704223633, "global_step": 34605, "epoch": 823} {"train_loss": -5.542530059814453, "global_step": 34606, "epoch": 823} {"train_loss": -5.5673552467709495, "global_step": 34607, "epoch": 823, "val_loss": 62352.40234375} {"train_loss": -5.562808990478516, "global_step": 34608, "epoch": 824} {"train_loss": -5.459963321685791, "global_step": 34609, "epoch": 824} {"train_loss": -5.541446208953857, "global_step": 34610, "epoch": 824} {"train_loss": -5.613353729248047, "global_step": 34611, "epoch": 824} {"train_loss": -5.57684326171875, "global_step": 34612, "epoch": 824} {"train_loss": -5.5370025634765625, "global_step": 34613, "epoch": 824} {"train_loss": -5.574821472167969, "global_step": 34614, "epoch": 824} {"train_loss": -5.514151573181152, "global_step": 34615, "epoch": 824} {"train_loss": -5.575216293334961, "global_step": 34616, "epoch": 824} {"train_loss": -5.553838729858398, "global_step": 34617, "epoch": 824} {"train_loss": -5.594965934753418, "global_step": 34618, "epoch": 824} {"train_loss": -5.603559494018555, "global_step": 34619, "epoch": 824} {"train_loss": -5.7309184074401855, "global_step": 34620, "epoch": 824} {"train_loss": -5.6476240158081055, "global_step": 34621, "epoch": 824} {"train_loss": -5.473637580871582, "global_step": 34622, "epoch": 824} {"train_loss": -5.5200514793396, "global_step": 34623, "epoch": 824} {"train_loss": -5.441225051879883, "global_step": 34624, "epoch": 824} {"train_loss": -5.548283576965332, "global_step": 34625, "epoch": 824} {"train_loss": -5.591163635253906, "global_step": 34626, "epoch": 824} {"train_loss": -5.4037580490112305, "global_step": 34627, "epoch": 824} {"train_loss": -5.604380130767822, "global_step": 34628, "epoch": 824} {"train_loss": -5.504885673522949, "global_step": 34629, "epoch": 824} {"train_loss": -5.542819023132324, "global_step": 34630, "epoch": 824} {"train_loss": -5.572144985198975, "global_step": 34631, "epoch": 824} {"train_loss": -5.609182357788086, "global_step": 34632, "epoch": 824} {"train_loss": -5.493613243103027, "global_step": 34633, "epoch": 824} {"train_loss": -5.5090179443359375, "global_step": 34634, "epoch": 824} {"train_loss": -5.51774787902832, "global_step": 34635, "epoch": 824} {"train_loss": -5.495710849761963, "global_step": 34636, "epoch": 824} {"train_loss": -5.564314842224121, "global_step": 34637, "epoch": 824} {"train_loss": -5.607658386230469, "global_step": 34638, "epoch": 824} {"train_loss": -5.623824119567871, "global_step": 34639, "epoch": 824} {"train_loss": -5.646481513977051, "global_step": 34640, "epoch": 824} {"train_loss": -5.643772125244141, "global_step": 34641, "epoch": 824} {"train_loss": -5.589474678039551, "global_step": 34642, "epoch": 824} {"train_loss": -5.444487571716309, "global_step": 34643, "epoch": 824} {"train_loss": -5.631617546081543, "global_step": 34644, "epoch": 824} {"train_loss": -5.707695007324219, "global_step": 34645, "epoch": 824} {"train_loss": -5.422994613647461, "global_step": 34646, "epoch": 824} {"train_loss": -5.432453155517578, "global_step": 34647, "epoch": 824} {"train_loss": -5.705589294433594, "global_step": 34648, "epoch": 824} {"train_loss": -5.558568602516537, "global_step": 34649, "epoch": 824, "val_loss": 62487.5703125} {"train_loss": -5.688469886779785, "global_step": 34650, "epoch": 825} {"train_loss": -5.572369575500488, "global_step": 34651, "epoch": 825} {"train_loss": -5.355827331542969, "global_step": 34652, "epoch": 825} {"train_loss": -5.557043075561523, "global_step": 34653, "epoch": 825} {"train_loss": -5.514437675476074, "global_step": 34654, "epoch": 825} {"train_loss": -5.477892875671387, "global_step": 34655, "epoch": 825} {"train_loss": -5.623176574707031, "global_step": 34656, "epoch": 825} {"train_loss": -5.595964431762695, "global_step": 34657, "epoch": 825} {"train_loss": -5.427036285400391, "global_step": 34658, "epoch": 825} {"train_loss": -5.619403839111328, "global_step": 34659, "epoch": 825} {"train_loss": -5.468236446380615, "global_step": 34660, "epoch": 825} {"train_loss": -5.644287109375, "global_step": 34661, "epoch": 825} {"train_loss": -5.5159711837768555, "global_step": 34662, "epoch": 825} {"train_loss": -5.487016201019287, "global_step": 34663, "epoch": 825} {"train_loss": -5.602975368499756, "global_step": 34664, "epoch": 825} {"train_loss": -5.632725715637207, "global_step": 34665, "epoch": 825} {"train_loss": -5.614426612854004, "global_step": 34666, "epoch": 825} {"train_loss": -5.566720962524414, "global_step": 34667, "epoch": 825} {"train_loss": -5.478785991668701, "global_step": 34668, "epoch": 825} {"train_loss": -5.478674411773682, "global_step": 34669, "epoch": 825} {"train_loss": -5.5674309730529785, "global_step": 34670, "epoch": 825} {"train_loss": -5.5427350997924805, "global_step": 34671, "epoch": 825} {"train_loss": -5.478461265563965, "global_step": 34672, "epoch": 825} {"train_loss": -5.48497200012207, "global_step": 34673, "epoch": 825} {"train_loss": -5.588704586029053, "global_step": 34674, "epoch": 825} {"train_loss": -5.604190826416016, "global_step": 34675, "epoch": 825} {"train_loss": -5.591151237487793, "global_step": 34676, "epoch": 825} {"train_loss": -5.569611549377441, "global_step": 34677, "epoch": 825} {"train_loss": -5.661470413208008, "global_step": 34678, "epoch": 825} {"train_loss": -5.606649398803711, "global_step": 34679, "epoch": 825} {"train_loss": -5.593923568725586, "global_step": 34680, "epoch": 825} {"train_loss": -5.547938346862793, "global_step": 34681, "epoch": 825} {"train_loss": -5.406732082366943, "global_step": 34682, "epoch": 825} {"train_loss": -5.616590976715088, "global_step": 34683, "epoch": 825} {"train_loss": -5.623298168182373, "global_step": 34684, "epoch": 825} {"train_loss": -5.612322807312012, "global_step": 34685, "epoch": 825} {"train_loss": -5.456730365753174, "global_step": 34686, "epoch": 825} {"train_loss": -5.508538722991943, "global_step": 34687, "epoch": 825} {"train_loss": -5.490846157073975, "global_step": 34688, "epoch": 825} {"train_loss": -5.315577507019043, "global_step": 34689, "epoch": 825} {"train_loss": -5.529474258422852, "global_step": 34690, "epoch": 825} {"train_loss": -5.543406679516747, "global_step": 34691, "epoch": 825, "val_loss": 63108.2421875} {"train_loss": -5.44399356842041, "global_step": 34692, "epoch": 826} {"train_loss": -5.5831499099731445, "global_step": 34693, "epoch": 826} {"train_loss": -5.584314346313477, "global_step": 34694, "epoch": 826} {"train_loss": -5.504508018493652, "global_step": 34695, "epoch": 826} {"train_loss": -5.516788005828857, "global_step": 34696, "epoch": 826} {"train_loss": -5.450386047363281, "global_step": 34697, "epoch": 826} {"train_loss": -5.652680397033691, "global_step": 34698, "epoch": 826} {"train_loss": -5.448294639587402, "global_step": 34699, "epoch": 826} {"train_loss": -5.626672744750977, "global_step": 34700, "epoch": 826} {"train_loss": -5.516395568847656, "global_step": 34701, "epoch": 826} {"train_loss": -5.263421535491943, "global_step": 34702, "epoch": 826} {"train_loss": -5.592723846435547, "global_step": 34703, "epoch": 826} {"train_loss": -5.502896785736084, "global_step": 34704, "epoch": 826} {"train_loss": -5.410423278808594, "global_step": 34705, "epoch": 826} {"train_loss": -5.369146347045898, "global_step": 34706, "epoch": 826} {"train_loss": -5.403267860412598, "global_step": 34707, "epoch": 826} {"train_loss": -5.450789451599121, "global_step": 34708, "epoch": 826} {"train_loss": -5.390749931335449, "global_step": 34709, "epoch": 826} {"train_loss": -5.480576515197754, "global_step": 34710, "epoch": 826} {"train_loss": -5.317861080169678, "global_step": 34711, "epoch": 826} {"train_loss": -5.439576148986816, "global_step": 34712, "epoch": 826} {"train_loss": -5.325065612792969, "global_step": 34713, "epoch": 826} {"train_loss": -5.444469451904297, "global_step": 34714, "epoch": 826} {"train_loss": -5.523308753967285, "global_step": 34715, "epoch": 826} {"train_loss": -5.533656120300293, "global_step": 34716, "epoch": 826} {"train_loss": -5.469200134277344, "global_step": 34717, "epoch": 826} {"train_loss": -5.491487503051758, "global_step": 34718, "epoch": 826} {"train_loss": -5.45488166809082, "global_step": 34719, "epoch": 826} {"train_loss": -5.690863609313965, "global_step": 34720, "epoch": 826} {"train_loss": -5.458166122436523, "global_step": 34721, "epoch": 826} {"train_loss": -5.517430782318115, "global_step": 34722, "epoch": 826} {"train_loss": -5.402982711791992, "global_step": 34723, "epoch": 826} {"train_loss": -5.442176818847656, "global_step": 34724, "epoch": 826} {"train_loss": -5.6234893798828125, "global_step": 34725, "epoch": 826} {"train_loss": -5.469413757324219, "global_step": 34726, "epoch": 826} {"train_loss": -5.6251139640808105, "global_step": 34727, "epoch": 826} {"train_loss": -5.440674781799316, "global_step": 34728, "epoch": 826} {"train_loss": -5.470272064208984, "global_step": 34729, "epoch": 826} {"train_loss": -5.573541164398193, "global_step": 34730, "epoch": 826} {"train_loss": -5.49246072769165, "global_step": 34731, "epoch": 826} {"train_loss": -5.5306196212768555, "global_step": 34732, "epoch": 826} {"train_loss": -5.4855392546880815, "global_step": 34733, "epoch": 826, "val_loss": 62515.2265625} {"train_loss": -5.440654754638672, "global_step": 34734, "epoch": 827} {"train_loss": -5.538912296295166, "global_step": 34735, "epoch": 827} {"train_loss": -5.571115493774414, "global_step": 34736, "epoch": 827} {"train_loss": -5.717343807220459, "global_step": 34737, "epoch": 827} {"train_loss": -5.4255475997924805, "global_step": 34738, "epoch": 827} {"train_loss": -5.5877790451049805, "global_step": 34739, "epoch": 827} {"train_loss": -5.475007057189941, "global_step": 34740, "epoch": 827} {"train_loss": -5.479636192321777, "global_step": 34741, "epoch": 827} {"train_loss": -5.368936538696289, "global_step": 34742, "epoch": 827} {"train_loss": -5.544124603271484, "global_step": 34743, "epoch": 827} {"train_loss": -5.579676628112793, "global_step": 34744, "epoch": 827} {"train_loss": -5.585151195526123, "global_step": 34745, "epoch": 827} {"train_loss": -5.668543815612793, "global_step": 34746, "epoch": 827} {"train_loss": -5.501710414886475, "global_step": 34747, "epoch": 827} {"train_loss": -5.630124092102051, "global_step": 34748, "epoch": 827} {"train_loss": -5.634537696838379, "global_step": 34749, "epoch": 827} {"train_loss": -5.559366226196289, "global_step": 34750, "epoch": 827} {"train_loss": -5.493831157684326, "global_step": 34751, "epoch": 827} {"train_loss": -5.6998701095581055, "global_step": 34752, "epoch": 827} {"train_loss": -5.391890525817871, "global_step": 34753, "epoch": 827} {"train_loss": -5.5890398025512695, "global_step": 34754, "epoch": 827} {"train_loss": -5.654263496398926, "global_step": 34755, "epoch": 827} {"train_loss": -5.482275009155273, "global_step": 34756, "epoch": 827} {"train_loss": -5.575587272644043, "global_step": 34757, "epoch": 827} {"train_loss": -5.486502170562744, "global_step": 34758, "epoch": 827} {"train_loss": -5.542661666870117, "global_step": 34759, "epoch": 827} {"train_loss": -5.5563812255859375, "global_step": 34760, "epoch": 827} {"train_loss": -5.612178325653076, "global_step": 34761, "epoch": 827} {"train_loss": -5.603882789611816, "global_step": 34762, "epoch": 827} {"train_loss": -5.387500286102295, "global_step": 34763, "epoch": 827} {"train_loss": -5.594078540802002, "global_step": 34764, "epoch": 827} {"train_loss": -5.536428451538086, "global_step": 34765, "epoch": 827} {"train_loss": -5.544913291931152, "global_step": 34766, "epoch": 827} {"train_loss": -5.504141330718994, "global_step": 34767, "epoch": 827} {"train_loss": -5.547737121582031, "global_step": 34768, "epoch": 827} {"train_loss": -5.539007186889648, "global_step": 34769, "epoch": 827} {"train_loss": -5.454993724822998, "global_step": 34770, "epoch": 827} {"train_loss": -5.460116863250732, "global_step": 34771, "epoch": 827} {"train_loss": -5.569511413574219, "global_step": 34772, "epoch": 827} {"train_loss": -5.582767486572266, "global_step": 34773, "epoch": 827} {"train_loss": -5.533740997314453, "global_step": 34774, "epoch": 827} {"train_loss": -5.543113958267939, "global_step": 34775, "epoch": 827, "val_loss": 62309.57421875} {"train_loss": -5.531386375427246, "global_step": 34776, "epoch": 828} {"train_loss": -5.618462562561035, "global_step": 34777, "epoch": 828} {"train_loss": -5.589842796325684, "global_step": 34778, "epoch": 828} {"train_loss": -5.485356330871582, "global_step": 34779, "epoch": 828} {"train_loss": -5.609374046325684, "global_step": 34780, "epoch": 828} {"train_loss": -5.523066520690918, "global_step": 34781, "epoch": 828} {"train_loss": -5.484622955322266, "global_step": 34782, "epoch": 828} {"train_loss": -5.394976615905762, "global_step": 34783, "epoch": 828} {"train_loss": -5.4081621170043945, "global_step": 34784, "epoch": 828} {"train_loss": -5.602095603942871, "global_step": 34785, "epoch": 828} {"train_loss": -5.512875080108643, "global_step": 34786, "epoch": 828} {"train_loss": -5.583722114562988, "global_step": 34787, "epoch": 828} {"train_loss": -5.654256343841553, "global_step": 34788, "epoch": 828} {"train_loss": -5.773357391357422, "global_step": 34789, "epoch": 828} {"train_loss": -5.555076599121094, "global_step": 34790, "epoch": 828} {"train_loss": -5.489289283752441, "global_step": 34791, "epoch": 828} {"train_loss": -5.593545436859131, "global_step": 34792, "epoch": 828} {"train_loss": -5.5660223960876465, "global_step": 34793, "epoch": 828} {"train_loss": -5.579250812530518, "global_step": 34794, "epoch": 828} {"train_loss": -5.65056848526001, "global_step": 34795, "epoch": 828} {"train_loss": -5.550683498382568, "global_step": 34796, "epoch": 828} {"train_loss": -5.611035346984863, "global_step": 34797, "epoch": 828} {"train_loss": -5.504091739654541, "global_step": 34798, "epoch": 828} {"train_loss": -5.57490873336792, "global_step": 34799, "epoch": 828} {"train_loss": -5.476077079772949, "global_step": 34800, "epoch": 828} {"train_loss": -5.50645637512207, "global_step": 34801, "epoch": 828} {"train_loss": -5.658365249633789, "global_step": 34802, "epoch": 828} {"train_loss": -5.574331283569336, "global_step": 34803, "epoch": 828} {"train_loss": -5.683250427246094, "global_step": 34804, "epoch": 828} {"train_loss": -5.515987396240234, "global_step": 34805, "epoch": 828} {"train_loss": -5.627890586853027, "global_step": 34806, "epoch": 828} {"train_loss": -5.608880043029785, "global_step": 34807, "epoch": 828} {"train_loss": -5.500178813934326, "global_step": 34808, "epoch": 828} {"train_loss": -5.426819801330566, "global_step": 34809, "epoch": 828} {"train_loss": -5.541562080383301, "global_step": 34810, "epoch": 828} {"train_loss": -5.479560852050781, "global_step": 34811, "epoch": 828} {"train_loss": -5.44501256942749, "global_step": 34812, "epoch": 828} {"train_loss": -5.4866228103637695, "global_step": 34813, "epoch": 828} {"train_loss": -5.505519866943359, "global_step": 34814, "epoch": 828} {"train_loss": -5.48435640335083, "global_step": 34815, "epoch": 828} {"train_loss": -5.582014083862305, "global_step": 34816, "epoch": 828} {"train_loss": -5.5512296585809615, "global_step": 34817, "epoch": 828, "val_loss": 62419.5234375} {"train_loss": -5.445466041564941, "global_step": 34818, "epoch": 829} {"train_loss": -5.585821151733398, "global_step": 34819, "epoch": 829} {"train_loss": -5.597599506378174, "global_step": 34820, "epoch": 829} {"train_loss": -5.629181385040283, "global_step": 34821, "epoch": 829} {"train_loss": -5.590512275695801, "global_step": 34822, "epoch": 829} {"train_loss": -5.526336669921875, "global_step": 34823, "epoch": 829} {"train_loss": -5.6502156257629395, "global_step": 34824, "epoch": 829} {"train_loss": -5.698398590087891, "global_step": 34825, "epoch": 829} {"train_loss": -5.661468505859375, "global_step": 34826, "epoch": 829} {"train_loss": -5.570834159851074, "global_step": 34827, "epoch": 829} {"train_loss": -5.5576372146606445, "global_step": 34828, "epoch": 829} {"train_loss": -5.477682113647461, "global_step": 34829, "epoch": 829} {"train_loss": -5.542863845825195, "global_step": 34830, "epoch": 829} {"train_loss": -5.566351890563965, "global_step": 34831, "epoch": 829} {"train_loss": -5.597128868103027, "global_step": 34832, "epoch": 829} {"train_loss": -5.502453804016113, "global_step": 34833, "epoch": 829} {"train_loss": -5.658387660980225, "global_step": 34834, "epoch": 829} {"train_loss": -5.477199554443359, "global_step": 34835, "epoch": 829} {"train_loss": -5.460554599761963, "global_step": 34836, "epoch": 829} {"train_loss": -5.5249176025390625, "global_step": 34837, "epoch": 829} {"train_loss": -5.499791145324707, "global_step": 34838, "epoch": 829} {"train_loss": -5.508718013763428, "global_step": 34839, "epoch": 829} {"train_loss": -5.5171918869018555, "global_step": 34840, "epoch": 829} {"train_loss": -5.448647975921631, "global_step": 34841, "epoch": 829} {"train_loss": -5.594022750854492, "global_step": 34842, "epoch": 829} {"train_loss": -5.561507701873779, "global_step": 34843, "epoch": 829} {"train_loss": -5.484077453613281, "global_step": 34844, "epoch": 829} {"train_loss": -5.559062957763672, "global_step": 34845, "epoch": 829} {"train_loss": -5.630897521972656, "global_step": 34846, "epoch": 829} {"train_loss": -5.553503513336182, "global_step": 34847, "epoch": 829} {"train_loss": -5.68227481842041, "global_step": 34848, "epoch": 829} {"train_loss": -5.528132438659668, "global_step": 34849, "epoch": 829} {"train_loss": -5.439826488494873, "global_step": 34850, "epoch": 829} {"train_loss": -5.475671768188477, "global_step": 34851, "epoch": 829} {"train_loss": -5.4058637619018555, "global_step": 34852, "epoch": 829} {"train_loss": -5.64887809753418, "global_step": 34853, "epoch": 829} {"train_loss": -5.561281681060791, "global_step": 34854, "epoch": 829} {"train_loss": -5.451590061187744, "global_step": 34855, "epoch": 829} {"train_loss": -5.500079154968262, "global_step": 34856, "epoch": 829} {"train_loss": -5.490457534790039, "global_step": 34857, "epoch": 829} {"train_loss": -5.564276695251465, "global_step": 34858, "epoch": 829} {"train_loss": -5.545979817708333, "global_step": 34859, "epoch": 829, "val_loss": 62656.859375} {"train_loss": -5.614384174346924, "global_step": 34860, "epoch": 830} {"train_loss": -5.521393775939941, "global_step": 34861, "epoch": 830} {"train_loss": -5.636282920837402, "global_step": 34862, "epoch": 830} {"train_loss": -5.415055751800537, "global_step": 34863, "epoch": 830} {"train_loss": -5.406230926513672, "global_step": 34864, "epoch": 830} {"train_loss": -5.606770992279053, "global_step": 34865, "epoch": 830} {"train_loss": -5.683080196380615, "global_step": 34866, "epoch": 830} {"train_loss": -5.458381652832031, "global_step": 34867, "epoch": 830} {"train_loss": -5.467574119567871, "global_step": 34868, "epoch": 830} {"train_loss": -5.673892974853516, "global_step": 34869, "epoch": 830} {"train_loss": -5.5104756355285645, "global_step": 34870, "epoch": 830} {"train_loss": -5.669096946716309, "global_step": 34871, "epoch": 830} {"train_loss": -5.559046745300293, "global_step": 34872, "epoch": 830} {"train_loss": -5.494303226470947, "global_step": 34873, "epoch": 830} {"train_loss": -5.594257354736328, "global_step": 34874, "epoch": 830} {"train_loss": -5.629489898681641, "global_step": 34875, "epoch": 830} {"train_loss": -5.565115928649902, "global_step": 34876, "epoch": 830} {"train_loss": -5.548850059509277, "global_step": 34877, "epoch": 830} {"train_loss": -5.521925926208496, "global_step": 34878, "epoch": 830} {"train_loss": -5.658197402954102, "global_step": 34879, "epoch": 830} {"train_loss": -5.534028053283691, "global_step": 34880, "epoch": 830} {"train_loss": -5.529942989349365, "global_step": 34881, "epoch": 830} {"train_loss": -5.768183708190918, "global_step": 34882, "epoch": 830} {"train_loss": -5.581609725952148, "global_step": 34883, "epoch": 830} {"train_loss": -5.5874528884887695, "global_step": 34884, "epoch": 830} {"train_loss": -5.528822898864746, "global_step": 34885, "epoch": 830} {"train_loss": -5.383625030517578, "global_step": 34886, "epoch": 830} {"train_loss": -5.540862560272217, "global_step": 34887, "epoch": 830} {"train_loss": -5.695945739746094, "global_step": 34888, "epoch": 830} {"train_loss": -5.557252883911133, "global_step": 34889, "epoch": 830} {"train_loss": -5.5384674072265625, "global_step": 34890, "epoch": 830} {"train_loss": -5.598143100738525, "global_step": 34891, "epoch": 830} {"train_loss": -5.516454219818115, "global_step": 34892, "epoch": 830} {"train_loss": -5.7001237869262695, "global_step": 34893, "epoch": 830} {"train_loss": -5.495074272155762, "global_step": 34894, "epoch": 830} {"train_loss": -5.6382598876953125, "global_step": 34895, "epoch": 830} {"train_loss": -5.5649566650390625, "global_step": 34896, "epoch": 830} {"train_loss": -5.56852912902832, "global_step": 34897, "epoch": 830} {"train_loss": -5.578579425811768, "global_step": 34898, "epoch": 830} {"train_loss": -5.458161354064941, "global_step": 34899, "epoch": 830} {"train_loss": -5.510891437530518, "global_step": 34900, "epoch": 830} {"train_loss": -5.565228518985567, "global_step": 34901, "epoch": 830, "val_loss": 62509.9296875} {"train_loss": -5.606727600097656, "global_step": 34902, "epoch": 831} {"train_loss": -5.587076187133789, "global_step": 34903, "epoch": 831} {"train_loss": -5.526182174682617, "global_step": 34904, "epoch": 831} {"train_loss": -5.618703842163086, "global_step": 34905, "epoch": 831} {"train_loss": -5.544539451599121, "global_step": 34906, "epoch": 831} {"train_loss": -5.608994483947754, "global_step": 34907, "epoch": 831} {"train_loss": -5.483279228210449, "global_step": 34908, "epoch": 831} {"train_loss": -5.49305534362793, "global_step": 34909, "epoch": 831} {"train_loss": -5.459272384643555, "global_step": 34910, "epoch": 831} {"train_loss": -5.651585578918457, "global_step": 34911, "epoch": 831} {"train_loss": -5.564383506774902, "global_step": 34912, "epoch": 831} {"train_loss": -5.621130466461182, "global_step": 34913, "epoch": 831} {"train_loss": -5.642477035522461, "global_step": 34914, "epoch": 831} {"train_loss": -5.3911662101745605, "global_step": 34915, "epoch": 831} {"train_loss": -5.529414176940918, "global_step": 34916, "epoch": 831} {"train_loss": -5.635435104370117, "global_step": 34917, "epoch": 831} {"train_loss": -5.5477142333984375, "global_step": 34918, "epoch": 831} {"train_loss": -5.7047576904296875, "global_step": 34919, "epoch": 831} {"train_loss": -5.536649703979492, "global_step": 34920, "epoch": 831} {"train_loss": -5.616821765899658, "global_step": 34921, "epoch": 831} {"train_loss": -5.4727888107299805, "global_step": 34922, "epoch": 831} {"train_loss": -5.600773811340332, "global_step": 34923, "epoch": 831} {"train_loss": -5.649937152862549, "global_step": 34924, "epoch": 831} {"train_loss": -5.593930244445801, "global_step": 34925, "epoch": 831} {"train_loss": -5.56102180480957, "global_step": 34926, "epoch": 831} {"train_loss": -5.503952980041504, "global_step": 34927, "epoch": 831} {"train_loss": -5.60132360458374, "global_step": 34928, "epoch": 831} {"train_loss": -5.563742637634277, "global_step": 34929, "epoch": 831} {"train_loss": -5.74031925201416, "global_step": 34930, "epoch": 831} {"train_loss": -5.500622749328613, "global_step": 34931, "epoch": 831} {"train_loss": -5.573369026184082, "global_step": 34932, "epoch": 831} {"train_loss": -5.4861345291137695, "global_step": 34933, "epoch": 831} {"train_loss": -5.56967830657959, "global_step": 34934, "epoch": 831} {"train_loss": -5.507009506225586, "global_step": 34935, "epoch": 831} {"train_loss": -5.601102352142334, "global_step": 34936, "epoch": 831} {"train_loss": -5.542889595031738, "global_step": 34937, "epoch": 831} {"train_loss": -5.620813369750977, "global_step": 34938, "epoch": 831} {"train_loss": -5.732941627502441, "global_step": 34939, "epoch": 831} {"train_loss": -5.4880266189575195, "global_step": 34940, "epoch": 831} {"train_loss": -5.639989852905273, "global_step": 34941, "epoch": 831} {"train_loss": -5.486702919006348, "global_step": 34942, "epoch": 831} {"train_loss": -5.568254096167428, "global_step": 34943, "epoch": 831, "val_loss": 62570.0546875} {"train_loss": -5.603067874908447, "global_step": 34944, "epoch": 832} {"train_loss": -5.608465194702148, "global_step": 34945, "epoch": 832} {"train_loss": -5.457795143127441, "global_step": 34946, "epoch": 832} {"train_loss": -5.56117057800293, "global_step": 34947, "epoch": 832} {"train_loss": -5.4839324951171875, "global_step": 34948, "epoch": 832} {"train_loss": -5.2328338623046875, "global_step": 34949, "epoch": 832} {"train_loss": -5.612154960632324, "global_step": 34950, "epoch": 832} {"train_loss": -5.5605058670043945, "global_step": 34951, "epoch": 832} {"train_loss": -5.359805107116699, "global_step": 34952, "epoch": 832} {"train_loss": -5.493677139282227, "global_step": 34953, "epoch": 832} {"train_loss": -5.434126377105713, "global_step": 34954, "epoch": 832} {"train_loss": -5.495221138000488, "global_step": 34955, "epoch": 832} {"train_loss": -5.434295654296875, "global_step": 34956, "epoch": 832} {"train_loss": -5.562084197998047, "global_step": 34957, "epoch": 832} {"train_loss": -5.4949822425842285, "global_step": 34958, "epoch": 832} {"train_loss": -5.4162397384643555, "global_step": 34959, "epoch": 832} {"train_loss": -5.437649726867676, "global_step": 34960, "epoch": 832} {"train_loss": -5.580484867095947, "global_step": 34961, "epoch": 832} {"train_loss": -5.678836822509766, "global_step": 34962, "epoch": 832} {"train_loss": -5.573389053344727, "global_step": 34963, "epoch": 832} {"train_loss": -5.512067794799805, "global_step": 34964, "epoch": 832} {"train_loss": -5.477462291717529, "global_step": 34965, "epoch": 832} {"train_loss": -5.786718368530273, "global_step": 34966, "epoch": 832} {"train_loss": -5.593132019042969, "global_step": 34967, "epoch": 832} {"train_loss": -5.616503715515137, "global_step": 34968, "epoch": 832} {"train_loss": -5.527289390563965, "global_step": 34969, "epoch": 832} {"train_loss": -5.578330993652344, "global_step": 34970, "epoch": 832} {"train_loss": -5.621347427368164, "global_step": 34971, "epoch": 832} {"train_loss": -5.589475631713867, "global_step": 34972, "epoch": 832} {"train_loss": -5.604249000549316, "global_step": 34973, "epoch": 832} {"train_loss": -5.416993141174316, "global_step": 34974, "epoch": 832} {"train_loss": -5.512241363525391, "global_step": 34975, "epoch": 832} {"train_loss": -5.540415287017822, "global_step": 34976, "epoch": 832} {"train_loss": -5.633421897888184, "global_step": 34977, "epoch": 832} {"train_loss": -5.3114447593688965, "global_step": 34978, "epoch": 832} {"train_loss": -5.565779685974121, "global_step": 34979, "epoch": 832} {"train_loss": -5.423121929168701, "global_step": 34980, "epoch": 832} {"train_loss": -5.458728790283203, "global_step": 34981, "epoch": 832} {"train_loss": -5.494805335998535, "global_step": 34982, "epoch": 832} {"train_loss": -5.59052848815918, "global_step": 34983, "epoch": 832} {"train_loss": -5.59700870513916, "global_step": 34984, "epoch": 832} {"train_loss": -5.52750453494844, "global_step": 34985, "epoch": 832, "val_loss": 62520.26953125} {"train_loss": -5.443382263183594, "global_step": 34986, "epoch": 833} {"train_loss": -5.643702507019043, "global_step": 34987, "epoch": 833} {"train_loss": -5.44814395904541, "global_step": 34988, "epoch": 833} {"train_loss": -5.525263786315918, "global_step": 34989, "epoch": 833} {"train_loss": -5.527012825012207, "global_step": 34990, "epoch": 833} {"train_loss": -5.601367473602295, "global_step": 34991, "epoch": 833} {"train_loss": -5.514577388763428, "global_step": 34992, "epoch": 833} {"train_loss": -5.5570173263549805, "global_step": 34993, "epoch": 833} {"train_loss": -5.6360554695129395, "global_step": 34994, "epoch": 833} {"train_loss": -5.381360054016113, "global_step": 34995, "epoch": 833} {"train_loss": -5.495746612548828, "global_step": 34996, "epoch": 833} {"train_loss": -5.498690128326416, "global_step": 34997, "epoch": 833} {"train_loss": -5.633650779724121, "global_step": 34998, "epoch": 833} {"train_loss": -5.487117767333984, "global_step": 34999, "epoch": 833} {"train_loss": -5.503961563110352, "global_step": 35000, "epoch": 833} {"train_loss": -5.5839948654174805, "global_step": 35001, "epoch": 833} {"train_loss": -5.605401992797852, "global_step": 35002, "epoch": 833} {"train_loss": -5.4878716468811035, "global_step": 35003, "epoch": 833} {"train_loss": -5.554263114929199, "global_step": 35004, "epoch": 833} {"train_loss": -5.483803749084473, "global_step": 35005, "epoch": 833} {"train_loss": -5.430093765258789, "global_step": 35006, "epoch": 833} {"train_loss": -5.43146276473999, "global_step": 35007, "epoch": 833} {"train_loss": -5.550301551818848, "global_step": 35008, "epoch": 833} {"train_loss": -5.422247409820557, "global_step": 35009, "epoch": 833} {"train_loss": -5.4935407638549805, "global_step": 35010, "epoch": 833} {"train_loss": -5.511965751647949, "global_step": 35011, "epoch": 833} {"train_loss": -5.506773948669434, "global_step": 35012, "epoch": 833} {"train_loss": -5.619275093078613, "global_step": 35013, "epoch": 833} {"train_loss": -5.6219072341918945, "global_step": 35014, "epoch": 833} {"train_loss": -5.502172470092773, "global_step": 35015, "epoch": 833} {"train_loss": -5.473913192749023, "global_step": 35016, "epoch": 833} {"train_loss": -5.663290977478027, "global_step": 35017, "epoch": 833} {"train_loss": -5.5901899337768555, "global_step": 35018, "epoch": 833} {"train_loss": -5.701218605041504, "global_step": 35019, "epoch": 833} {"train_loss": -5.5388288497924805, "global_step": 35020, "epoch": 833} {"train_loss": -5.695832252502441, "global_step": 35021, "epoch": 833} {"train_loss": -5.653565406799316, "global_step": 35022, "epoch": 833} {"train_loss": -5.630061149597168, "global_step": 35023, "epoch": 833} {"train_loss": -5.599641799926758, "global_step": 35024, "epoch": 833} {"train_loss": -5.635887145996094, "global_step": 35025, "epoch": 833} {"train_loss": -5.638412952423096, "global_step": 35026, "epoch": 833} {"train_loss": -5.548820768083845, "global_step": 35027, "epoch": 833, "val_loss": 62480.74609375} {"train_loss": -5.534094333648682, "global_step": 35028, "epoch": 834} {"train_loss": -5.589179992675781, "global_step": 35029, "epoch": 834} {"train_loss": -5.505410671234131, "global_step": 35030, "epoch": 834} {"train_loss": -5.569242477416992, "global_step": 35031, "epoch": 834} {"train_loss": -5.5939412117004395, "global_step": 35032, "epoch": 834} {"train_loss": -5.543389320373535, "global_step": 35033, "epoch": 834} {"train_loss": -5.509843826293945, "global_step": 35034, "epoch": 834} {"train_loss": -5.698538780212402, "global_step": 35035, "epoch": 834} {"train_loss": -5.645170211791992, "global_step": 35036, "epoch": 834} {"train_loss": -5.751341342926025, "global_step": 35037, "epoch": 834} {"train_loss": -5.523097038269043, "global_step": 35038, "epoch": 834} {"train_loss": -5.5196638107299805, "global_step": 35039, "epoch": 834} {"train_loss": -5.555486679077148, "global_step": 35040, "epoch": 834} {"train_loss": -5.516515731811523, "global_step": 35041, "epoch": 834} {"train_loss": -5.521857261657715, "global_step": 35042, "epoch": 834} {"train_loss": -5.573749542236328, "global_step": 35043, "epoch": 834} {"train_loss": -5.483392715454102, "global_step": 35044, "epoch": 834} {"train_loss": -5.503182411193848, "global_step": 35045, "epoch": 834} {"train_loss": -5.564851760864258, "global_step": 35046, "epoch": 834} {"train_loss": -5.423454284667969, "global_step": 35047, "epoch": 834} {"train_loss": -5.612068176269531, "global_step": 35048, "epoch": 834} {"train_loss": -5.542716026306152, "global_step": 35049, "epoch": 834} {"train_loss": -5.668763160705566, "global_step": 35050, "epoch": 834} {"train_loss": -5.587235450744629, "global_step": 35051, "epoch": 834} {"train_loss": -5.570135593414307, "global_step": 35052, "epoch": 834} {"train_loss": -5.636237144470215, "global_step": 35053, "epoch": 834} {"train_loss": -5.594572067260742, "global_step": 35054, "epoch": 834} {"train_loss": -5.504861354827881, "global_step": 35055, "epoch": 834} {"train_loss": -5.42186164855957, "global_step": 35056, "epoch": 834} {"train_loss": -5.557557106018066, "global_step": 35057, "epoch": 834} {"train_loss": -5.433891773223877, "global_step": 35058, "epoch": 834} {"train_loss": -5.507440090179443, "global_step": 35059, "epoch": 834} {"train_loss": -5.574944496154785, "global_step": 35060, "epoch": 834} {"train_loss": -5.661476135253906, "global_step": 35061, "epoch": 834} {"train_loss": -5.5876617431640625, "global_step": 35062, "epoch": 834} {"train_loss": -5.604805946350098, "global_step": 35063, "epoch": 834} {"train_loss": -5.469818115234375, "global_step": 35064, "epoch": 834} {"train_loss": -5.528843879699707, "global_step": 35065, "epoch": 834} {"train_loss": -5.487869739532471, "global_step": 35066, "epoch": 834} {"train_loss": -5.616799354553223, "global_step": 35067, "epoch": 834} {"train_loss": -5.614829063415527, "global_step": 35068, "epoch": 834} {"train_loss": -5.558267797742571, "global_step": 35069, "epoch": 834, "val_loss": 62724.84765625} {"train_loss": -5.654639720916748, "global_step": 35070, "epoch": 835} {"train_loss": -5.548586368560791, "global_step": 35071, "epoch": 835} {"train_loss": -5.554191589355469, "global_step": 35072, "epoch": 835} {"train_loss": -5.649684429168701, "global_step": 35073, "epoch": 835} {"train_loss": -5.683182239532471, "global_step": 35074, "epoch": 835} {"train_loss": -5.614395618438721, "global_step": 35075, "epoch": 835} {"train_loss": -5.508749961853027, "global_step": 35076, "epoch": 835} {"train_loss": -5.4689435958862305, "global_step": 35077, "epoch": 835} {"train_loss": -5.519381523132324, "global_step": 35078, "epoch": 835} {"train_loss": -5.47083044052124, "global_step": 35079, "epoch": 835} {"train_loss": -5.572743892669678, "global_step": 35080, "epoch": 835} {"train_loss": -5.545357704162598, "global_step": 35081, "epoch": 835} {"train_loss": -5.674807548522949, "global_step": 35082, "epoch": 835} {"train_loss": -5.587166786193848, "global_step": 35083, "epoch": 835} {"train_loss": -5.509868621826172, "global_step": 35084, "epoch": 835} {"train_loss": -5.605986595153809, "global_step": 35085, "epoch": 835} {"train_loss": -5.455526351928711, "global_step": 35086, "epoch": 835} {"train_loss": -5.5731401443481445, "global_step": 35087, "epoch": 835} {"train_loss": -5.514449119567871, "global_step": 35088, "epoch": 835} {"train_loss": -5.501415729522705, "global_step": 35089, "epoch": 835} {"train_loss": -5.600553512573242, "global_step": 35090, "epoch": 835} {"train_loss": -5.604816436767578, "global_step": 35091, "epoch": 835} {"train_loss": -5.600907325744629, "global_step": 35092, "epoch": 835} {"train_loss": -5.533478736877441, "global_step": 35093, "epoch": 835} {"train_loss": -5.460799694061279, "global_step": 35094, "epoch": 835} {"train_loss": -5.627643585205078, "global_step": 35095, "epoch": 835} {"train_loss": -5.3985161781311035, "global_step": 35096, "epoch": 835} {"train_loss": -5.398955345153809, "global_step": 35097, "epoch": 835} {"train_loss": -5.586899757385254, "global_step": 35098, "epoch": 835} {"train_loss": -5.4213409423828125, "global_step": 35099, "epoch": 835} {"train_loss": -5.533651351928711, "global_step": 35100, "epoch": 835} {"train_loss": -5.558697700500488, "global_step": 35101, "epoch": 835} {"train_loss": -5.4148993492126465, "global_step": 35102, "epoch": 835} {"train_loss": -5.442435264587402, "global_step": 35103, "epoch": 835} {"train_loss": -5.565258026123047, "global_step": 35104, "epoch": 835} {"train_loss": -5.572871208190918, "global_step": 35105, "epoch": 835} {"train_loss": -5.5826616287231445, "global_step": 35106, "epoch": 835} {"train_loss": -5.319263458251953, "global_step": 35107, "epoch": 835} {"train_loss": -5.505369186401367, "global_step": 35108, "epoch": 835} {"train_loss": -5.5164899826049805, "global_step": 35109, "epoch": 835} {"train_loss": -5.559739112854004, "global_step": 35110, "epoch": 835} {"train_loss": -5.5328642300197055, "global_step": 35111, "epoch": 835, "val_loss": 62372.2734375} {"train_loss": -5.555294036865234, "global_step": 35112, "epoch": 836} {"train_loss": -5.493918418884277, "global_step": 35113, "epoch": 836} {"train_loss": -5.624232769012451, "global_step": 35114, "epoch": 836} {"train_loss": -5.444340705871582, "global_step": 35115, "epoch": 836} {"train_loss": -5.528755187988281, "global_step": 35116, "epoch": 836} {"train_loss": -5.59128475189209, "global_step": 35117, "epoch": 836} {"train_loss": -5.466446399688721, "global_step": 35118, "epoch": 836} {"train_loss": -5.605210304260254, "global_step": 35119, "epoch": 836} {"train_loss": -5.494011878967285, "global_step": 35120, "epoch": 836} {"train_loss": -5.666776657104492, "global_step": 35121, "epoch": 836} {"train_loss": -5.485128402709961, "global_step": 35122, "epoch": 836} {"train_loss": -5.585247039794922, "global_step": 35123, "epoch": 836} {"train_loss": -5.586387634277344, "global_step": 35124, "epoch": 836} {"train_loss": -5.496618747711182, "global_step": 35125, "epoch": 836} {"train_loss": -5.694052696228027, "global_step": 35126, "epoch": 836} {"train_loss": -5.479860305786133, "global_step": 35127, "epoch": 836} {"train_loss": -5.568902969360352, "global_step": 35128, "epoch": 836} {"train_loss": -5.5692877769470215, "global_step": 35129, "epoch": 836} {"train_loss": -5.5351762771606445, "global_step": 35130, "epoch": 836} {"train_loss": -5.523526191711426, "global_step": 35131, "epoch": 836} {"train_loss": -5.578092098236084, "global_step": 35132, "epoch": 836} {"train_loss": -5.352176666259766, "global_step": 35133, "epoch": 836} {"train_loss": -5.398338317871094, "global_step": 35134, "epoch": 836} {"train_loss": -5.494433879852295, "global_step": 35135, "epoch": 836} {"train_loss": -5.440263748168945, "global_step": 35136, "epoch": 836} {"train_loss": -5.3768310546875, "global_step": 35137, "epoch": 836} {"train_loss": -5.576535224914551, "global_step": 35138, "epoch": 836} {"train_loss": -5.616061210632324, "global_step": 35139, "epoch": 836} {"train_loss": -5.447930812835693, "global_step": 35140, "epoch": 836} {"train_loss": -5.5432586669921875, "global_step": 35141, "epoch": 836} {"train_loss": -5.516874313354492, "global_step": 35142, "epoch": 836} {"train_loss": -5.528664588928223, "global_step": 35143, "epoch": 836} {"train_loss": -5.622149467468262, "global_step": 35144, "epoch": 836} {"train_loss": -5.50106954574585, "global_step": 35145, "epoch": 836} {"train_loss": -5.497007369995117, "global_step": 35146, "epoch": 836} {"train_loss": -5.531819820404053, "global_step": 35147, "epoch": 836} {"train_loss": -5.537474632263184, "global_step": 35148, "epoch": 836} {"train_loss": -5.5513787269592285, "global_step": 35149, "epoch": 836} {"train_loss": -5.616549491882324, "global_step": 35150, "epoch": 836} {"train_loss": -5.452375411987305, "global_step": 35151, "epoch": 836} {"train_loss": -5.461907386779785, "global_step": 35152, "epoch": 836} {"train_loss": -5.5276658421471, "global_step": 35153, "epoch": 836, "val_loss": 62355.37890625} {"train_loss": -5.612326622009277, "global_step": 35154, "epoch": 837} {"train_loss": -5.543716907501221, "global_step": 35155, "epoch": 837} {"train_loss": -5.300482273101807, "global_step": 35156, "epoch": 837} {"train_loss": -5.53253173828125, "global_step": 35157, "epoch": 837} {"train_loss": -5.592141151428223, "global_step": 35158, "epoch": 837} {"train_loss": -5.575629234313965, "global_step": 35159, "epoch": 837} {"train_loss": -5.620111465454102, "global_step": 35160, "epoch": 837} {"train_loss": -5.641745090484619, "global_step": 35161, "epoch": 837} {"train_loss": -5.484321594238281, "global_step": 35162, "epoch": 837} {"train_loss": -5.485949993133545, "global_step": 35163, "epoch": 837} {"train_loss": -5.521728515625, "global_step": 35164, "epoch": 837} {"train_loss": -5.537216663360596, "global_step": 35165, "epoch": 837} {"train_loss": -5.661401748657227, "global_step": 35166, "epoch": 837} {"train_loss": -5.65207052230835, "global_step": 35167, "epoch": 837} {"train_loss": -5.503109931945801, "global_step": 35168, "epoch": 837} {"train_loss": -5.6426591873168945, "global_step": 35169, "epoch": 837} {"train_loss": -5.623776435852051, "global_step": 35170, "epoch": 837} {"train_loss": -5.56405782699585, "global_step": 35171, "epoch": 837} {"train_loss": -5.6272759437561035, "global_step": 35172, "epoch": 837} {"train_loss": -5.584133625030518, "global_step": 35173, "epoch": 837} {"train_loss": -5.409831523895264, "global_step": 35174, "epoch": 837} {"train_loss": -5.645726203918457, "global_step": 35175, "epoch": 837} {"train_loss": -5.3965911865234375, "global_step": 35176, "epoch": 837} {"train_loss": -5.535482883453369, "global_step": 35177, "epoch": 837} {"train_loss": -5.526780128479004, "global_step": 35178, "epoch": 837} {"train_loss": -5.7250261306762695, "global_step": 35179, "epoch": 837} {"train_loss": -5.60954475402832, "global_step": 35180, "epoch": 837} {"train_loss": -5.618134021759033, "global_step": 35181, "epoch": 837} {"train_loss": -5.572775840759277, "global_step": 35182, "epoch": 837} {"train_loss": -5.618195533752441, "global_step": 35183, "epoch": 837} {"train_loss": -5.4306745529174805, "global_step": 35184, "epoch": 837} {"train_loss": -5.5120849609375, "global_step": 35185, "epoch": 837} {"train_loss": -5.409927845001221, "global_step": 35186, "epoch": 837} {"train_loss": -5.703697204589844, "global_step": 35187, "epoch": 837} {"train_loss": -5.643934726715088, "global_step": 35188, "epoch": 837} {"train_loss": -5.56500244140625, "global_step": 35189, "epoch": 837} {"train_loss": -5.609014511108398, "global_step": 35190, "epoch": 837} {"train_loss": -5.382174968719482, "global_step": 35191, "epoch": 837} {"train_loss": -5.553615570068359, "global_step": 35192, "epoch": 837} {"train_loss": -5.6042938232421875, "global_step": 35193, "epoch": 837} {"train_loss": -5.607946395874023, "global_step": 35194, "epoch": 837} {"train_loss": -5.560183513732183, "global_step": 35195, "epoch": 837, "val_loss": 62251.859375} {"train_loss": -5.5379414558410645, "global_step": 35196, "epoch": 838} {"train_loss": -5.556525230407715, "global_step": 35197, "epoch": 838} {"train_loss": -5.6280412673950195, "global_step": 35198, "epoch": 838} {"train_loss": -5.6375732421875, "global_step": 35199, "epoch": 838} {"train_loss": -5.556272506713867, "global_step": 35200, "epoch": 838} {"train_loss": -5.46366024017334, "global_step": 35201, "epoch": 838} {"train_loss": -5.660928726196289, "global_step": 35202, "epoch": 838} {"train_loss": -5.6059889793396, "global_step": 35203, "epoch": 838} {"train_loss": -5.4844279289245605, "global_step": 35204, "epoch": 838} {"train_loss": -5.551696300506592, "global_step": 35205, "epoch": 838} {"train_loss": -5.649998188018799, "global_step": 35206, "epoch": 838} {"train_loss": -5.6011857986450195, "global_step": 35207, "epoch": 838} {"train_loss": -5.532610893249512, "global_step": 35208, "epoch": 838} {"train_loss": -5.526042938232422, "global_step": 35209, "epoch": 838} {"train_loss": -5.518299102783203, "global_step": 35210, "epoch": 838} {"train_loss": -5.665550231933594, "global_step": 35211, "epoch": 838} {"train_loss": -5.654780387878418, "global_step": 35212, "epoch": 838} {"train_loss": -5.52130126953125, "global_step": 35213, "epoch": 838} {"train_loss": -5.5863800048828125, "global_step": 35214, "epoch": 838} {"train_loss": -5.718092918395996, "global_step": 35215, "epoch": 838} {"train_loss": -5.533734321594238, "global_step": 35216, "epoch": 838} {"train_loss": -5.615882873535156, "global_step": 35217, "epoch": 838} {"train_loss": -5.624667167663574, "global_step": 35218, "epoch": 838} {"train_loss": -5.589677810668945, "global_step": 35219, "epoch": 838} {"train_loss": -5.5988569259643555, "global_step": 35220, "epoch": 838} {"train_loss": -5.50764274597168, "global_step": 35221, "epoch": 838} {"train_loss": -5.555523872375488, "global_step": 35222, "epoch": 838} {"train_loss": -5.621254920959473, "global_step": 35223, "epoch": 838} {"train_loss": -5.417508125305176, "global_step": 35224, "epoch": 838} {"train_loss": -5.612733364105225, "global_step": 35225, "epoch": 838} {"train_loss": -5.405791759490967, "global_step": 35226, "epoch": 838} {"train_loss": -5.498437404632568, "global_step": 35227, "epoch": 838} {"train_loss": -5.590012550354004, "global_step": 35228, "epoch": 838} {"train_loss": -5.538244247436523, "global_step": 35229, "epoch": 838} {"train_loss": -5.634868621826172, "global_step": 35230, "epoch": 838} {"train_loss": -5.517239093780518, "global_step": 35231, "epoch": 838} {"train_loss": -5.442468643188477, "global_step": 35232, "epoch": 838} {"train_loss": -5.503446578979492, "global_step": 35233, "epoch": 838} {"train_loss": -5.522120952606201, "global_step": 35234, "epoch": 838} {"train_loss": -5.706340789794922, "global_step": 35235, "epoch": 838} {"train_loss": -5.677431583404541, "global_step": 35236, "epoch": 838} {"train_loss": -5.573956046785627, "global_step": 35237, "epoch": 838, "val_loss": 62596.890625} {"train_loss": -5.53693151473999, "global_step": 35238, "epoch": 839} {"train_loss": -5.600864887237549, "global_step": 35239, "epoch": 839} {"train_loss": -5.682852745056152, "global_step": 35240, "epoch": 839} {"train_loss": -5.4068450927734375, "global_step": 35241, "epoch": 839} {"train_loss": -5.602336883544922, "global_step": 35242, "epoch": 839} {"train_loss": -5.6969499588012695, "global_step": 35243, "epoch": 839} {"train_loss": -5.531688690185547, "global_step": 35244, "epoch": 839} {"train_loss": -5.452375411987305, "global_step": 35245, "epoch": 839} {"train_loss": -5.600559234619141, "global_step": 35246, "epoch": 839} {"train_loss": -5.504762649536133, "global_step": 35247, "epoch": 839} {"train_loss": -5.479686260223389, "global_step": 35248, "epoch": 839} {"train_loss": -5.356749057769775, "global_step": 35249, "epoch": 839} {"train_loss": -5.626339912414551, "global_step": 35250, "epoch": 839} {"train_loss": -5.432230472564697, "global_step": 35251, "epoch": 839} {"train_loss": -5.538850784301758, "global_step": 35252, "epoch": 839} {"train_loss": -5.397141456604004, "global_step": 35253, "epoch": 839} {"train_loss": -5.607598304748535, "global_step": 35254, "epoch": 839} {"train_loss": -5.572368621826172, "global_step": 35255, "epoch": 839} {"train_loss": -5.439199447631836, "global_step": 35256, "epoch": 839} {"train_loss": -5.548753261566162, "global_step": 35257, "epoch": 839} {"train_loss": -5.433039665222168, "global_step": 35258, "epoch": 839} {"train_loss": -5.44865608215332, "global_step": 35259, "epoch": 839} {"train_loss": -5.428223609924316, "global_step": 35260, "epoch": 839} {"train_loss": -5.510153770446777, "global_step": 35261, "epoch": 839} {"train_loss": -5.493400573730469, "global_step": 35262, "epoch": 839} {"train_loss": -5.525881767272949, "global_step": 35263, "epoch": 839} {"train_loss": -5.487520217895508, "global_step": 35264, "epoch": 839} {"train_loss": -5.511680603027344, "global_step": 35265, "epoch": 839} {"train_loss": -5.477551460266113, "global_step": 35266, "epoch": 839} {"train_loss": -5.474843978881836, "global_step": 35267, "epoch": 839} {"train_loss": -5.519021987915039, "global_step": 35268, "epoch": 839} {"train_loss": -5.488068103790283, "global_step": 35269, "epoch": 839} {"train_loss": -5.521027565002441, "global_step": 35270, "epoch": 839} {"train_loss": -5.616961479187012, "global_step": 35271, "epoch": 839} {"train_loss": -5.495922088623047, "global_step": 35272, "epoch": 839} {"train_loss": -5.660560607910156, "global_step": 35273, "epoch": 839} {"train_loss": -5.547328948974609, "global_step": 35274, "epoch": 839} {"train_loss": -5.559911727905273, "global_step": 35275, "epoch": 839} {"train_loss": -5.433518409729004, "global_step": 35276, "epoch": 839} {"train_loss": -5.598925590515137, "global_step": 35277, "epoch": 839} {"train_loss": -5.475936412811279, "global_step": 35278, "epoch": 839} {"train_loss": -5.524220943450928, "global_step": 35279, "epoch": 839, "val_loss": 62338.42578125} {"train_loss": -5.4607954025268555, "global_step": 35280, "epoch": 840} {"train_loss": -5.5565571784973145, "global_step": 35281, "epoch": 840} {"train_loss": -5.505664825439453, "global_step": 35282, "epoch": 840} {"train_loss": -5.563019752502441, "global_step": 35283, "epoch": 840} {"train_loss": -5.632205486297607, "global_step": 35284, "epoch": 840} {"train_loss": -5.526735305786133, "global_step": 35285, "epoch": 840} {"train_loss": -5.474936008453369, "global_step": 35286, "epoch": 840} {"train_loss": -5.648625373840332, "global_step": 35287, "epoch": 840} {"train_loss": -5.5613579750061035, "global_step": 35288, "epoch": 840} {"train_loss": -5.5866851806640625, "global_step": 35289, "epoch": 840} {"train_loss": -5.672277927398682, "global_step": 35290, "epoch": 840} {"train_loss": -5.538629531860352, "global_step": 35291, "epoch": 840} {"train_loss": -5.525899887084961, "global_step": 35292, "epoch": 840} {"train_loss": -5.601278781890869, "global_step": 35293, "epoch": 840} {"train_loss": -5.637136936187744, "global_step": 35294, "epoch": 840} {"train_loss": -5.651724815368652, "global_step": 35295, "epoch": 840} {"train_loss": -5.593231678009033, "global_step": 35296, "epoch": 840} {"train_loss": -5.549332618713379, "global_step": 35297, "epoch": 840} {"train_loss": -5.605356693267822, "global_step": 35298, "epoch": 840} {"train_loss": -5.65421199798584, "global_step": 35299, "epoch": 840} {"train_loss": -5.633654594421387, "global_step": 35300, "epoch": 840} {"train_loss": -5.653477668762207, "global_step": 35301, "epoch": 840} {"train_loss": -5.590742588043213, "global_step": 35302, "epoch": 840} {"train_loss": -5.5695061683654785, "global_step": 35303, "epoch": 840} {"train_loss": -5.578226089477539, "global_step": 35304, "epoch": 840} {"train_loss": -5.4801483154296875, "global_step": 35305, "epoch": 840} {"train_loss": -5.498335838317871, "global_step": 35306, "epoch": 840} {"train_loss": -5.592947006225586, "global_step": 35307, "epoch": 840} {"train_loss": -5.53812313079834, "global_step": 35308, "epoch": 840} {"train_loss": -5.48343563079834, "global_step": 35309, "epoch": 840} {"train_loss": -5.525239944458008, "global_step": 35310, "epoch": 840} {"train_loss": -5.515160083770752, "global_step": 35311, "epoch": 840} {"train_loss": -5.636723518371582, "global_step": 35312, "epoch": 840} {"train_loss": -5.643918991088867, "global_step": 35313, "epoch": 840} {"train_loss": -5.583338737487793, "global_step": 35314, "epoch": 840} {"train_loss": -5.541887283325195, "global_step": 35315, "epoch": 840} {"train_loss": -5.573615550994873, "global_step": 35316, "epoch": 840} {"train_loss": -5.542340278625488, "global_step": 35317, "epoch": 840} {"train_loss": -5.543042182922363, "global_step": 35318, "epoch": 840} {"train_loss": -5.521886825561523, "global_step": 35319, "epoch": 840} {"train_loss": -5.576706886291504, "global_step": 35320, "epoch": 840} {"train_loss": -5.571709133329845, "global_step": 35321, "epoch": 840, "val_loss": 62472.265625} {"train_loss": -5.591473579406738, "global_step": 35322, "epoch": 841} {"train_loss": -5.497133255004883, "global_step": 35323, "epoch": 841} {"train_loss": -5.607255935668945, "global_step": 35324, "epoch": 841} {"train_loss": -5.643880844116211, "global_step": 35325, "epoch": 841} {"train_loss": -5.600481986999512, "global_step": 35326, "epoch": 841} {"train_loss": -5.5076093673706055, "global_step": 35327, "epoch": 841} {"train_loss": -5.341695785522461, "global_step": 35328, "epoch": 841} {"train_loss": -5.610448837280273, "global_step": 35329, "epoch": 841} {"train_loss": -5.5691680908203125, "global_step": 35330, "epoch": 841} {"train_loss": -5.517844200134277, "global_step": 35331, "epoch": 841} {"train_loss": -5.532028675079346, "global_step": 35332, "epoch": 841} {"train_loss": -5.589489459991455, "global_step": 35333, "epoch": 841} {"train_loss": -5.611012935638428, "global_step": 35334, "epoch": 841} {"train_loss": -5.638263702392578, "global_step": 35335, "epoch": 841} {"train_loss": -5.605203628540039, "global_step": 35336, "epoch": 841} {"train_loss": -5.56593132019043, "global_step": 35337, "epoch": 841} {"train_loss": -5.611069202423096, "global_step": 35338, "epoch": 841} {"train_loss": -5.578173637390137, "global_step": 35339, "epoch": 841} {"train_loss": -5.619312286376953, "global_step": 35340, "epoch": 841} {"train_loss": -5.572526931762695, "global_step": 35341, "epoch": 841} {"train_loss": -5.670190334320068, "global_step": 35342, "epoch": 841} {"train_loss": -5.649924278259277, "global_step": 35343, "epoch": 841} {"train_loss": -5.6001081466674805, "global_step": 35344, "epoch": 841} {"train_loss": -5.537980556488037, "global_step": 35345, "epoch": 841} {"train_loss": -5.63809061050415, "global_step": 35346, "epoch": 841} {"train_loss": -5.578911781311035, "global_step": 35347, "epoch": 841} {"train_loss": -5.7258806228637695, "global_step": 35348, "epoch": 841} {"train_loss": -5.541996002197266, "global_step": 35349, "epoch": 841} {"train_loss": -5.669363021850586, "global_step": 35350, "epoch": 841} {"train_loss": -5.590904235839844, "global_step": 35351, "epoch": 841} {"train_loss": -5.4859771728515625, "global_step": 35352, "epoch": 841} {"train_loss": -5.548647880554199, "global_step": 35353, "epoch": 841} {"train_loss": -5.562066078186035, "global_step": 35354, "epoch": 841} {"train_loss": -5.4121599197387695, "global_step": 35355, "epoch": 841} {"train_loss": -5.509600639343262, "global_step": 35356, "epoch": 841} {"train_loss": -5.581780433654785, "global_step": 35357, "epoch": 841} {"train_loss": -5.541597366333008, "global_step": 35358, "epoch": 841} {"train_loss": -5.43257999420166, "global_step": 35359, "epoch": 841} {"train_loss": -5.385041236877441, "global_step": 35360, "epoch": 841} {"train_loss": -5.505118370056152, "global_step": 35361, "epoch": 841} {"train_loss": -5.55831241607666, "global_step": 35362, "epoch": 841} {"train_loss": -5.563200280779884, "global_step": 35363, "epoch": 841, "val_loss": 62312.84375} {"train_loss": -5.6084160804748535, "global_step": 35364, "epoch": 842} {"train_loss": -5.667020797729492, "global_step": 35365, "epoch": 842} {"train_loss": -5.438688278198242, "global_step": 35366, "epoch": 842} {"train_loss": -5.564304351806641, "global_step": 35367, "epoch": 842} {"train_loss": -5.56492805480957, "global_step": 35368, "epoch": 842} {"train_loss": -5.488330364227295, "global_step": 35369, "epoch": 842} {"train_loss": -5.52915620803833, "global_step": 35370, "epoch": 842} {"train_loss": -5.586119651794434, "global_step": 35371, "epoch": 842} {"train_loss": -5.601741790771484, "global_step": 35372, "epoch": 842} {"train_loss": -5.5185227394104, "global_step": 35373, "epoch": 842} {"train_loss": -5.559995174407959, "global_step": 35374, "epoch": 842} {"train_loss": -5.427172660827637, "global_step": 35375, "epoch": 842} {"train_loss": -5.4987711906433105, "global_step": 35376, "epoch": 842} {"train_loss": -5.54806661605835, "global_step": 35377, "epoch": 842} {"train_loss": -5.483578681945801, "global_step": 35378, "epoch": 842} {"train_loss": -5.404434680938721, "global_step": 35379, "epoch": 842} {"train_loss": -5.566849708557129, "global_step": 35380, "epoch": 842} {"train_loss": -5.468432426452637, "global_step": 35381, "epoch": 842} {"train_loss": -5.475602149963379, "global_step": 35382, "epoch": 842} {"train_loss": -5.500392913818359, "global_step": 35383, "epoch": 842} {"train_loss": -5.619403839111328, "global_step": 35384, "epoch": 842} {"train_loss": -5.552422046661377, "global_step": 35385, "epoch": 842} {"train_loss": -5.5611066818237305, "global_step": 35386, "epoch": 842} {"train_loss": -5.501762390136719, "global_step": 35387, "epoch": 842} {"train_loss": -5.631063461303711, "global_step": 35388, "epoch": 842} {"train_loss": -5.526302337646484, "global_step": 35389, "epoch": 842} {"train_loss": -5.510473728179932, "global_step": 35390, "epoch": 842} {"train_loss": -5.633769989013672, "global_step": 35391, "epoch": 842} {"train_loss": -5.691349029541016, "global_step": 35392, "epoch": 842} {"train_loss": -5.642055988311768, "global_step": 35393, "epoch": 842} {"train_loss": -5.545306205749512, "global_step": 35394, "epoch": 842} {"train_loss": -5.569300651550293, "global_step": 35395, "epoch": 842} {"train_loss": -5.533936500549316, "global_step": 35396, "epoch": 842} {"train_loss": -5.493146896362305, "global_step": 35397, "epoch": 842} {"train_loss": -5.4803314208984375, "global_step": 35398, "epoch": 842} {"train_loss": -5.649916648864746, "global_step": 35399, "epoch": 842} {"train_loss": -5.601078033447266, "global_step": 35400, "epoch": 842} {"train_loss": -5.5140461921691895, "global_step": 35401, "epoch": 842} {"train_loss": -5.763205528259277, "global_step": 35402, "epoch": 842} {"train_loss": -5.577990531921387, "global_step": 35403, "epoch": 842} {"train_loss": -5.521268844604492, "global_step": 35404, "epoch": 842} {"train_loss": -5.5531575452713735, "global_step": 35405, "epoch": 842, "val_loss": 62539.1875} {"train_loss": -5.52371883392334, "global_step": 35406, "epoch": 843} {"train_loss": -5.537349700927734, "global_step": 35407, "epoch": 843} {"train_loss": -5.541868209838867, "global_step": 35408, "epoch": 843} {"train_loss": -5.520308017730713, "global_step": 35409, "epoch": 843} {"train_loss": -5.538999557495117, "global_step": 35410, "epoch": 843} {"train_loss": -5.564250946044922, "global_step": 35411, "epoch": 843} {"train_loss": -5.573843002319336, "global_step": 35412, "epoch": 843} {"train_loss": -5.434601783752441, "global_step": 35413, "epoch": 843} {"train_loss": -5.437004089355469, "global_step": 35414, "epoch": 843} {"train_loss": -5.6480207443237305, "global_step": 35415, "epoch": 843} {"train_loss": -5.575288772583008, "global_step": 35416, "epoch": 843} {"train_loss": -5.42424201965332, "global_step": 35417, "epoch": 843} {"train_loss": -5.618704795837402, "global_step": 35418, "epoch": 843} {"train_loss": -5.573056221008301, "global_step": 35419, "epoch": 843} {"train_loss": -5.479645252227783, "global_step": 35420, "epoch": 843} {"train_loss": -5.563720703125, "global_step": 35421, "epoch": 843} {"train_loss": -5.637622833251953, "global_step": 35422, "epoch": 843} {"train_loss": -5.564876079559326, "global_step": 35423, "epoch": 843} {"train_loss": -5.5924072265625, "global_step": 35424, "epoch": 843} {"train_loss": -5.41708517074585, "global_step": 35425, "epoch": 843} {"train_loss": -5.591909408569336, "global_step": 35426, "epoch": 843} {"train_loss": -5.55629301071167, "global_step": 35427, "epoch": 843} {"train_loss": -5.462882041931152, "global_step": 35428, "epoch": 843} {"train_loss": -5.5456132888793945, "global_step": 35429, "epoch": 843} {"train_loss": -5.545063018798828, "global_step": 35430, "epoch": 843} {"train_loss": -5.550872802734375, "global_step": 35431, "epoch": 843} {"train_loss": -5.672560214996338, "global_step": 35432, "epoch": 843} {"train_loss": -5.403308391571045, "global_step": 35433, "epoch": 843} {"train_loss": -5.599649429321289, "global_step": 35434, "epoch": 843} {"train_loss": -5.585622787475586, "global_step": 35435, "epoch": 843} {"train_loss": -5.561280727386475, "global_step": 35436, "epoch": 843} {"train_loss": -5.581394195556641, "global_step": 35437, "epoch": 843} {"train_loss": -5.645505905151367, "global_step": 35438, "epoch": 843} {"train_loss": -5.556948661804199, "global_step": 35439, "epoch": 843} {"train_loss": -5.652090549468994, "global_step": 35440, "epoch": 843} {"train_loss": -5.479299068450928, "global_step": 35441, "epoch": 843} {"train_loss": -5.620710372924805, "global_step": 35442, "epoch": 843} {"train_loss": -5.567953109741211, "global_step": 35443, "epoch": 843} {"train_loss": -5.612592697143555, "global_step": 35444, "epoch": 843} {"train_loss": -5.553750991821289, "global_step": 35445, "epoch": 843} {"train_loss": -5.464076995849609, "global_step": 35446, "epoch": 843} {"train_loss": -5.552590869721913, "global_step": 35447, "epoch": 843, "val_loss": 62368.55078125} {"train_loss": -5.466914176940918, "global_step": 35448, "epoch": 844} {"train_loss": -5.479001045227051, "global_step": 35449, "epoch": 844} {"train_loss": -5.6735382080078125, "global_step": 35450, "epoch": 844} {"train_loss": -5.647337436676025, "global_step": 35451, "epoch": 844} {"train_loss": -5.47825813293457, "global_step": 35452, "epoch": 844} {"train_loss": -5.651219367980957, "global_step": 35453, "epoch": 844} {"train_loss": -5.466976642608643, "global_step": 35454, "epoch": 844} {"train_loss": -5.42710018157959, "global_step": 35455, "epoch": 844} {"train_loss": -5.664098262786865, "global_step": 35456, "epoch": 844} {"train_loss": -5.665022850036621, "global_step": 35457, "epoch": 844} {"train_loss": -5.561800003051758, "global_step": 35458, "epoch": 844} {"train_loss": -5.656762599945068, "global_step": 35459, "epoch": 844} {"train_loss": -5.6388983726501465, "global_step": 35460, "epoch": 844} {"train_loss": -5.600610733032227, "global_step": 35461, "epoch": 844} {"train_loss": -5.649892330169678, "global_step": 35462, "epoch": 844} {"train_loss": -5.626775741577148, "global_step": 35463, "epoch": 844} {"train_loss": -5.537763595581055, "global_step": 35464, "epoch": 844} {"train_loss": -5.56901216506958, "global_step": 35465, "epoch": 844} {"train_loss": -5.64386510848999, "global_step": 35466, "epoch": 844} {"train_loss": -5.465085983276367, "global_step": 35467, "epoch": 844} {"train_loss": -5.557449817657471, "global_step": 35468, "epoch": 844} {"train_loss": -5.46358585357666, "global_step": 35469, "epoch": 844} {"train_loss": -5.572136878967285, "global_step": 35470, "epoch": 844} {"train_loss": -5.6011247634887695, "global_step": 35471, "epoch": 844} {"train_loss": -5.479372978210449, "global_step": 35472, "epoch": 844} {"train_loss": -5.430444717407227, "global_step": 35473, "epoch": 844} {"train_loss": -5.487468719482422, "global_step": 35474, "epoch": 844} {"train_loss": -5.512153148651123, "global_step": 35475, "epoch": 844} {"train_loss": -5.491800785064697, "global_step": 35476, "epoch": 844} {"train_loss": -5.471081256866455, "global_step": 35477, "epoch": 844} {"train_loss": -5.394766807556152, "global_step": 35478, "epoch": 844} {"train_loss": -5.773266792297363, "global_step": 35479, "epoch": 844} {"train_loss": -5.664122581481934, "global_step": 35480, "epoch": 844} {"train_loss": -5.543615818023682, "global_step": 35481, "epoch": 844} {"train_loss": -5.656825065612793, "global_step": 35482, "epoch": 844} {"train_loss": -5.531111717224121, "global_step": 35483, "epoch": 844} {"train_loss": -5.526232719421387, "global_step": 35484, "epoch": 844} {"train_loss": -5.535731792449951, "global_step": 35485, "epoch": 844} {"train_loss": -5.602579116821289, "global_step": 35486, "epoch": 844} {"train_loss": -5.48857307434082, "global_step": 35487, "epoch": 844} {"train_loss": -5.6494903564453125, "global_step": 35488, "epoch": 844} {"train_loss": -5.561949377968197, "global_step": 35489, "epoch": 844, "val_loss": 62412.97265625} {"train_loss": -5.530204772949219, "global_step": 35490, "epoch": 845} {"train_loss": -5.632806777954102, "global_step": 35491, "epoch": 845} {"train_loss": -5.646693706512451, "global_step": 35492, "epoch": 845} {"train_loss": -5.572371006011963, "global_step": 35493, "epoch": 845} {"train_loss": -5.6644673347473145, "global_step": 35494, "epoch": 845} {"train_loss": -5.611061096191406, "global_step": 35495, "epoch": 845} {"train_loss": -5.59956169128418, "global_step": 35496, "epoch": 845} {"train_loss": -5.595880031585693, "global_step": 35497, "epoch": 845} {"train_loss": -5.448610305786133, "global_step": 35498, "epoch": 845} {"train_loss": -5.5694427490234375, "global_step": 35499, "epoch": 845} {"train_loss": -5.740339756011963, "global_step": 35500, "epoch": 845} {"train_loss": -5.618402481079102, "global_step": 35501, "epoch": 845} {"train_loss": -5.552629470825195, "global_step": 35502, "epoch": 845} {"train_loss": -5.455132961273193, "global_step": 35503, "epoch": 845} {"train_loss": -5.689023971557617, "global_step": 35504, "epoch": 845} {"train_loss": -5.576983451843262, "global_step": 35505, "epoch": 845} {"train_loss": -5.707557678222656, "global_step": 35506, "epoch": 845} {"train_loss": -5.547092437744141, "global_step": 35507, "epoch": 845} {"train_loss": -5.563333511352539, "global_step": 35508, "epoch": 845} {"train_loss": -5.620143890380859, "global_step": 35509, "epoch": 845} {"train_loss": -5.618250846862793, "global_step": 35510, "epoch": 845} {"train_loss": -5.551056861877441, "global_step": 35511, "epoch": 845} {"train_loss": -5.474551677703857, "global_step": 35512, "epoch": 845} {"train_loss": -5.478094100952148, "global_step": 35513, "epoch": 845} {"train_loss": -5.488314151763916, "global_step": 35514, "epoch": 845} {"train_loss": -5.509091377258301, "global_step": 35515, "epoch": 845} {"train_loss": -5.446966648101807, "global_step": 35516, "epoch": 845} {"train_loss": -5.470720291137695, "global_step": 35517, "epoch": 845} {"train_loss": -5.583652496337891, "global_step": 35518, "epoch": 845} {"train_loss": -5.384101390838623, "global_step": 35519, "epoch": 845} {"train_loss": -5.554884910583496, "global_step": 35520, "epoch": 845} {"train_loss": -5.465023040771484, "global_step": 35521, "epoch": 845} {"train_loss": -5.523441314697266, "global_step": 35522, "epoch": 845} {"train_loss": -5.550366401672363, "global_step": 35523, "epoch": 845} {"train_loss": -5.402459621429443, "global_step": 35524, "epoch": 845} {"train_loss": -5.496436595916748, "global_step": 35525, "epoch": 845} {"train_loss": -5.46581506729126, "global_step": 35526, "epoch": 845} {"train_loss": -5.574397087097168, "global_step": 35527, "epoch": 845} {"train_loss": -5.516815185546875, "global_step": 35528, "epoch": 845} {"train_loss": -5.476376056671143, "global_step": 35529, "epoch": 845} {"train_loss": -5.544835090637207, "global_step": 35530, "epoch": 845} {"train_loss": -5.54696189789545, "global_step": 35531, "epoch": 845, "val_loss": 62630.1171875} {"train_loss": -5.619367599487305, "global_step": 35532, "epoch": 846} {"train_loss": -5.538690567016602, "global_step": 35533, "epoch": 846} {"train_loss": -5.517129898071289, "global_step": 35534, "epoch": 846} {"train_loss": -5.586454391479492, "global_step": 35535, "epoch": 846} {"train_loss": -5.483311653137207, "global_step": 35536, "epoch": 846} {"train_loss": -5.676212310791016, "global_step": 35537, "epoch": 846} {"train_loss": -5.51278829574585, "global_step": 35538, "epoch": 846} {"train_loss": -5.640827178955078, "global_step": 35539, "epoch": 846} {"train_loss": -5.463119983673096, "global_step": 35540, "epoch": 846} {"train_loss": -5.58529806137085, "global_step": 35541, "epoch": 846} {"train_loss": -5.663335800170898, "global_step": 35542, "epoch": 846} {"train_loss": -5.620786666870117, "global_step": 35543, "epoch": 846} {"train_loss": -5.585880279541016, "global_step": 35544, "epoch": 846} {"train_loss": -5.585297584533691, "global_step": 35545, "epoch": 846} {"train_loss": -5.640205383300781, "global_step": 35546, "epoch": 846} {"train_loss": -5.503145217895508, "global_step": 35547, "epoch": 846} {"train_loss": -5.5275654792785645, "global_step": 35548, "epoch": 846} {"train_loss": -5.646768569946289, "global_step": 35549, "epoch": 846} {"train_loss": -5.344182014465332, "global_step": 35550, "epoch": 846} {"train_loss": -5.482324600219727, "global_step": 35551, "epoch": 846} {"train_loss": -5.502119064331055, "global_step": 35552, "epoch": 846} {"train_loss": -5.537076950073242, "global_step": 35553, "epoch": 846} {"train_loss": -5.553241729736328, "global_step": 35554, "epoch": 846} {"train_loss": -5.566118240356445, "global_step": 35555, "epoch": 846} {"train_loss": -5.584024906158447, "global_step": 35556, "epoch": 846} {"train_loss": -5.535807132720947, "global_step": 35557, "epoch": 846} {"train_loss": -5.652006149291992, "global_step": 35558, "epoch": 846} {"train_loss": -5.527393341064453, "global_step": 35559, "epoch": 846} {"train_loss": -5.602602958679199, "global_step": 35560, "epoch": 846} {"train_loss": -5.565953731536865, "global_step": 35561, "epoch": 846} {"train_loss": -5.538902282714844, "global_step": 35562, "epoch": 846} {"train_loss": -5.4644694328308105, "global_step": 35563, "epoch": 846} {"train_loss": -5.564355850219727, "global_step": 35564, "epoch": 846} {"train_loss": -5.484196662902832, "global_step": 35565, "epoch": 846} {"train_loss": -5.575118064880371, "global_step": 35566, "epoch": 846} {"train_loss": -5.574845314025879, "global_step": 35567, "epoch": 846} {"train_loss": -5.633052825927734, "global_step": 35568, "epoch": 846} {"train_loss": -5.693523406982422, "global_step": 35569, "epoch": 846} {"train_loss": -5.550045013427734, "global_step": 35570, "epoch": 846} {"train_loss": -5.623087406158447, "global_step": 35571, "epoch": 846} {"train_loss": -5.7191996574401855, "global_step": 35572, "epoch": 846} {"train_loss": -5.568127087184361, "global_step": 35573, "epoch": 846, "val_loss": 62285.046875} {"train_loss": -5.617481231689453, "global_step": 35574, "epoch": 847} {"train_loss": -5.559669494628906, "global_step": 35575, "epoch": 847} {"train_loss": -5.552915096282959, "global_step": 35576, "epoch": 847} {"train_loss": -5.506871700286865, "global_step": 35577, "epoch": 847} {"train_loss": -5.5648016929626465, "global_step": 35578, "epoch": 847} {"train_loss": -5.583118438720703, "global_step": 35579, "epoch": 847} {"train_loss": -5.4550557136535645, "global_step": 35580, "epoch": 847} {"train_loss": -5.483121871948242, "global_step": 35581, "epoch": 847} {"train_loss": -5.457364559173584, "global_step": 35582, "epoch": 847} {"train_loss": -5.541658401489258, "global_step": 35583, "epoch": 847} {"train_loss": -5.584890842437744, "global_step": 35584, "epoch": 847} {"train_loss": -5.621535301208496, "global_step": 35585, "epoch": 847} {"train_loss": -5.444319725036621, "global_step": 35586, "epoch": 847} {"train_loss": -5.614355087280273, "global_step": 35587, "epoch": 847} {"train_loss": -5.690270900726318, "global_step": 35588, "epoch": 847} {"train_loss": -5.6158013343811035, "global_step": 35589, "epoch": 847} {"train_loss": -5.6666765213012695, "global_step": 35590, "epoch": 847} {"train_loss": -5.475675106048584, "global_step": 35591, "epoch": 847} {"train_loss": -5.5726728439331055, "global_step": 35592, "epoch": 847} {"train_loss": -5.510754108428955, "global_step": 35593, "epoch": 847} {"train_loss": -5.49811315536499, "global_step": 35594, "epoch": 847} {"train_loss": -5.619838714599609, "global_step": 35595, "epoch": 847} {"train_loss": -5.6275739669799805, "global_step": 35596, "epoch": 847} {"train_loss": -5.617256164550781, "global_step": 35597, "epoch": 847} {"train_loss": -5.597377777099609, "global_step": 35598, "epoch": 847} {"train_loss": -5.526451587677002, "global_step": 35599, "epoch": 847} {"train_loss": -5.805206775665283, "global_step": 35600, "epoch": 847} {"train_loss": -5.6558685302734375, "global_step": 35601, "epoch": 847} {"train_loss": -5.445351600646973, "global_step": 35602, "epoch": 847} {"train_loss": -5.636664390563965, "global_step": 35603, "epoch": 847} {"train_loss": -5.6174774169921875, "global_step": 35604, "epoch": 847} {"train_loss": -5.42533016204834, "global_step": 35605, "epoch": 847} {"train_loss": -5.550548553466797, "global_step": 35606, "epoch": 847} {"train_loss": -5.623533248901367, "global_step": 35607, "epoch": 847} {"train_loss": -5.375565052032471, "global_step": 35608, "epoch": 847} {"train_loss": -5.56186580657959, "global_step": 35609, "epoch": 847} {"train_loss": -5.598608493804932, "global_step": 35610, "epoch": 847} {"train_loss": -5.546731948852539, "global_step": 35611, "epoch": 847} {"train_loss": -5.4485931396484375, "global_step": 35612, "epoch": 847} {"train_loss": -5.489634990692139, "global_step": 35613, "epoch": 847} {"train_loss": -5.5096659660339355, "global_step": 35614, "epoch": 847} {"train_loss": -5.5615408307030085, "global_step": 35615, "epoch": 847, "val_loss": 62335.265625} {"train_loss": -5.5062150955200195, "global_step": 35616, "epoch": 848} {"train_loss": -5.449604034423828, "global_step": 35617, "epoch": 848} {"train_loss": -5.576508522033691, "global_step": 35618, "epoch": 848} {"train_loss": -5.471304893493652, "global_step": 35619, "epoch": 848} {"train_loss": -5.585797309875488, "global_step": 35620, "epoch": 848} {"train_loss": -5.427526473999023, "global_step": 35621, "epoch": 848} {"train_loss": -5.554215431213379, "global_step": 35622, "epoch": 848} {"train_loss": -5.592084884643555, "global_step": 35623, "epoch": 848} {"train_loss": -5.689434051513672, "global_step": 35624, "epoch": 848} {"train_loss": -5.572376251220703, "global_step": 35625, "epoch": 848} {"train_loss": -5.637434959411621, "global_step": 35626, "epoch": 848} {"train_loss": -5.510969161987305, "global_step": 35627, "epoch": 848} {"train_loss": -5.497493743896484, "global_step": 35628, "epoch": 848} {"train_loss": -5.497150421142578, "global_step": 35629, "epoch": 848} {"train_loss": -5.500940322875977, "global_step": 35630, "epoch": 848} {"train_loss": -5.472448825836182, "global_step": 35631, "epoch": 848} {"train_loss": -5.528233051300049, "global_step": 35632, "epoch": 848} {"train_loss": -5.656679153442383, "global_step": 35633, "epoch": 848} {"train_loss": -5.478427410125732, "global_step": 35634, "epoch": 848} {"train_loss": -5.647701740264893, "global_step": 35635, "epoch": 848} {"train_loss": -5.576430320739746, "global_step": 35636, "epoch": 848} {"train_loss": -5.598677158355713, "global_step": 35637, "epoch": 848} {"train_loss": -5.611301898956299, "global_step": 35638, "epoch": 848} {"train_loss": -5.74368143081665, "global_step": 35639, "epoch": 848} {"train_loss": -5.602387428283691, "global_step": 35640, "epoch": 848} {"train_loss": -5.708045959472656, "global_step": 35641, "epoch": 848} {"train_loss": -5.57829475402832, "global_step": 35642, "epoch": 848} {"train_loss": -5.590651988983154, "global_step": 35643, "epoch": 848} {"train_loss": -5.538762092590332, "global_step": 35644, "epoch": 848} {"train_loss": -5.47019624710083, "global_step": 35645, "epoch": 848} {"train_loss": -5.508462905883789, "global_step": 35646, "epoch": 848} {"train_loss": -5.565910816192627, "global_step": 35647, "epoch": 848} {"train_loss": -5.557609558105469, "global_step": 35648, "epoch": 848} {"train_loss": -5.573526859283447, "global_step": 35649, "epoch": 848} {"train_loss": -5.554780006408691, "global_step": 35650, "epoch": 848} {"train_loss": -5.482359409332275, "global_step": 35651, "epoch": 848} {"train_loss": -5.618938446044922, "global_step": 35652, "epoch": 848} {"train_loss": -5.6752424240112305, "global_step": 35653, "epoch": 848} {"train_loss": -5.661850929260254, "global_step": 35654, "epoch": 848} {"train_loss": -5.578422546386719, "global_step": 35655, "epoch": 848} {"train_loss": -5.579573154449463, "global_step": 35656, "epoch": 848} {"train_loss": -5.567364851633708, "global_step": 35657, "epoch": 848, "val_loss": 62390.8828125} {"train_loss": -5.683799743652344, "global_step": 35658, "epoch": 849} {"train_loss": -5.599581718444824, "global_step": 35659, "epoch": 849} {"train_loss": -5.5736236572265625, "global_step": 35660, "epoch": 849} {"train_loss": -5.569869518280029, "global_step": 35661, "epoch": 849} {"train_loss": -5.4966230392456055, "global_step": 35662, "epoch": 849} {"train_loss": -5.411558151245117, "global_step": 35663, "epoch": 849} {"train_loss": -5.49768590927124, "global_step": 35664, "epoch": 849} {"train_loss": -5.504025936126709, "global_step": 35665, "epoch": 849} {"train_loss": -5.446796417236328, "global_step": 35666, "epoch": 849} {"train_loss": -5.66457462310791, "global_step": 35667, "epoch": 849} {"train_loss": -5.596550464630127, "global_step": 35668, "epoch": 849} {"train_loss": -5.52805233001709, "global_step": 35669, "epoch": 849} {"train_loss": -5.728346824645996, "global_step": 35670, "epoch": 849} {"train_loss": -5.66057014465332, "global_step": 35671, "epoch": 849} {"train_loss": -5.515936851501465, "global_step": 35672, "epoch": 849} {"train_loss": -5.557662010192871, "global_step": 35673, "epoch": 849} {"train_loss": -5.746701717376709, "global_step": 35674, "epoch": 849} {"train_loss": -5.549416542053223, "global_step": 35675, "epoch": 849} {"train_loss": -5.50851583480835, "global_step": 35676, "epoch": 849} {"train_loss": -5.5522942543029785, "global_step": 35677, "epoch": 849} {"train_loss": -5.597165584564209, "global_step": 35678, "epoch": 849} {"train_loss": -5.450718402862549, "global_step": 35679, "epoch": 849} {"train_loss": -5.69677734375, "global_step": 35680, "epoch": 849} {"train_loss": -5.418497562408447, "global_step": 35681, "epoch": 849} {"train_loss": -5.400350570678711, "global_step": 35682, "epoch": 849} {"train_loss": -5.469064235687256, "global_step": 35683, "epoch": 849} {"train_loss": -5.418473243713379, "global_step": 35684, "epoch": 849} {"train_loss": -5.571776866912842, "global_step": 35685, "epoch": 849} {"train_loss": -5.532784461975098, "global_step": 35686, "epoch": 849} {"train_loss": -5.426522731781006, "global_step": 35687, "epoch": 849} {"train_loss": -5.613804817199707, "global_step": 35688, "epoch": 849} {"train_loss": -5.388280868530273, "global_step": 35689, "epoch": 849} {"train_loss": -5.628883361816406, "global_step": 35690, "epoch": 849} {"train_loss": -5.507970809936523, "global_step": 35691, "epoch": 849} {"train_loss": -5.5505781173706055, "global_step": 35692, "epoch": 849} {"train_loss": -5.590821743011475, "global_step": 35693, "epoch": 849} {"train_loss": -5.5803937911987305, "global_step": 35694, "epoch": 849} {"train_loss": -5.531150817871094, "global_step": 35695, "epoch": 849} {"train_loss": -5.443731307983398, "global_step": 35696, "epoch": 849} {"train_loss": -5.542072772979736, "global_step": 35697, "epoch": 849} {"train_loss": -5.611645221710205, "global_step": 35698, "epoch": 849} {"train_loss": -5.547359682264782, "global_step": 35699, "epoch": 849, "val_loss": 62437.93359375} {"train_loss": -5.57296085357666, "global_step": 35700, "epoch": 850} {"train_loss": -5.576206207275391, "global_step": 35701, "epoch": 850} {"train_loss": -5.675858497619629, "global_step": 35702, "epoch": 850} {"train_loss": -5.5594072341918945, "global_step": 35703, "epoch": 850} {"train_loss": -5.519650459289551, "global_step": 35704, "epoch": 850} {"train_loss": -5.609860420227051, "global_step": 35705, "epoch": 850} {"train_loss": -5.543521881103516, "global_step": 35706, "epoch": 850} {"train_loss": -5.522453308105469, "global_step": 35707, "epoch": 850} {"train_loss": -5.463688850402832, "global_step": 35708, "epoch": 850} {"train_loss": -5.486212253570557, "global_step": 35709, "epoch": 850} {"train_loss": -5.525200843811035, "global_step": 35710, "epoch": 850} {"train_loss": -5.5468292236328125, "global_step": 35711, "epoch": 850} {"train_loss": -5.626291275024414, "global_step": 35712, "epoch": 850} {"train_loss": -5.456570625305176, "global_step": 35713, "epoch": 850} {"train_loss": -5.540164470672607, "global_step": 35714, "epoch": 850} {"train_loss": -5.616541862487793, "global_step": 35715, "epoch": 850} {"train_loss": -5.505751609802246, "global_step": 35716, "epoch": 850} {"train_loss": -5.512444496154785, "global_step": 35717, "epoch": 850} {"train_loss": -5.644621849060059, "global_step": 35718, "epoch": 850} {"train_loss": -5.573858737945557, "global_step": 35719, "epoch": 850} {"train_loss": -5.704407691955566, "global_step": 35720, "epoch": 850} {"train_loss": -5.568913459777832, "global_step": 35721, "epoch": 850} {"train_loss": -5.53856086730957, "global_step": 35722, "epoch": 850} {"train_loss": -5.545422554016113, "global_step": 35723, "epoch": 850} {"train_loss": -5.510951995849609, "global_step": 35724, "epoch": 850} {"train_loss": -5.648845672607422, "global_step": 35725, "epoch": 850} {"train_loss": -5.5683794021606445, "global_step": 35726, "epoch": 850} {"train_loss": -5.477055549621582, "global_step": 35727, "epoch": 850} {"train_loss": -5.6101603507995605, "global_step": 35728, "epoch": 850} {"train_loss": -5.519346237182617, "global_step": 35729, "epoch": 850} {"train_loss": -5.409216403961182, "global_step": 35730, "epoch": 850} {"train_loss": -5.60333251953125, "global_step": 35731, "epoch": 850} {"train_loss": -5.490156173706055, "global_step": 35732, "epoch": 850} {"train_loss": -5.461818218231201, "global_step": 35733, "epoch": 850} {"train_loss": -5.4898576736450195, "global_step": 35734, "epoch": 850} {"train_loss": -5.531933784484863, "global_step": 35735, "epoch": 850} {"train_loss": -5.412400245666504, "global_step": 35736, "epoch": 850} {"train_loss": -5.472863674163818, "global_step": 35737, "epoch": 850} {"train_loss": -5.300346374511719, "global_step": 35738, "epoch": 850} {"train_loss": -5.59050989151001, "global_step": 35739, "epoch": 850} {"train_loss": -5.418631553649902, "global_step": 35740, "epoch": 850} {"train_loss": -5.5388420422871905, "global_step": 35741, "epoch": 850, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.18332603675350218, "train/sim_max_reward_2": 0.11607944687054993, "train/sim_max_reward_3": 0.17749851761672272, "train/sim_max_reward_4": 0.3193247535782358, "train/sim_max_reward_5": 0.512299923614995, "test/sim_max_reward_4300000": 0.34939060514721193, "test/sim_max_reward_4300001": 0.3511806753215328, "test/sim_max_reward_4300002": 0.17763190228676132, "test/sim_max_reward_4300003": 0.7103163147517162, "test/sim_max_reward_4300004": 1.0, "test/sim_max_reward_4300005": 0.4369026570216892, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.25558140681094005, "test/sim_max_reward_4300008": 0.5168103577053378, "test/sim_max_reward_4300009": 0.7744867701525379, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.3098539596714524, "test/sim_max_reward_4300012": 0.887033743043216, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 0.9045994847841181, "test/sim_max_reward_4300015": 0.2581940040118648, "test/sim_max_reward_4300016": 0.4253677419951281, "test/sim_max_reward_4300017": 0.667557770093271, "test/sim_max_reward_4300018": 0.7162801002662745, "test/sim_max_reward_4300019": 0.18534865074803783, "test/sim_max_reward_4300020": 0.29705871845869186, "test/sim_max_reward_4300021": 0.7688201133513091, "test/sim_max_reward_4300022": 0.31469404593055955, "test/sim_max_reward_4300023": 0.45622066130639344, "test/sim_max_reward_4300024": 0.4313127964395651, "test/sim_max_reward_4300025": 0.6956866253789671, "test/sim_max_reward_4300026": 0.1467977713052626, "test/sim_max_reward_4300027": 0.007008402939615648, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.40428788387904574, "test/sim_max_reward_4300031": 0.16931727596817542, "test/sim_max_reward_4300032": 0.4659827348408965, "test/sim_max_reward_4300033": 0.6230492956271594, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.7038217181292584, "test/sim_max_reward_4300038": 0.0, "test/sim_max_reward_4300039": 0.511730056511877, "test/sim_max_reward_4300040": 0.4143029478506269, "test/sim_max_reward_4300041": 0.1860714493097263, "test/sim_max_reward_4300042": 0.6845238831015091, "test/sim_max_reward_4300043": 0.28031526697425363, "test/sim_max_reward_4300044": 0.2713607740649884, "test/sim_max_reward_4300045": 0.646389345649399, "test/sim_max_reward_4300046": 0.12937319258808422, "test/sim_max_reward_4300047": 0.09005287383320744, "test/sim_max_reward_4300048": 0.42040490964105837, "test/sim_max_reward_4300049": 0.03568824403420864, "train/mean_score": 0.2498043625066763, "test/mean_score": 0.38560002492976814, "val_loss": 62901.16015625} {"train_loss": -5.501876354217529, "global_step": 35742, "epoch": 851} {"train_loss": -5.49660062789917, "global_step": 35743, "epoch": 851} {"train_loss": -5.630465984344482, "global_step": 35744, "epoch": 851} {"train_loss": -5.509550094604492, "global_step": 35745, "epoch": 851} {"train_loss": -5.626220703125, "global_step": 35746, "epoch": 851} {"train_loss": -5.564306259155273, "global_step": 35747, "epoch": 851} {"train_loss": -5.506540298461914, "global_step": 35748, "epoch": 851} {"train_loss": -5.558084011077881, "global_step": 35749, "epoch": 851} {"train_loss": -5.46027135848999, "global_step": 35750, "epoch": 851} {"train_loss": -5.444343090057373, "global_step": 35751, "epoch": 851} {"train_loss": -5.41689395904541, "global_step": 35752, "epoch": 851} {"train_loss": -5.567081451416016, "global_step": 35753, "epoch": 851} {"train_loss": -5.6235151290893555, "global_step": 35754, "epoch": 851} {"train_loss": -5.613983154296875, "global_step": 35755, "epoch": 851} {"train_loss": -5.51995849609375, "global_step": 35756, "epoch": 851} {"train_loss": -5.606163024902344, "global_step": 35757, "epoch": 851} {"train_loss": -5.504595756530762, "global_step": 35758, "epoch": 851} {"train_loss": -5.624146461486816, "global_step": 35759, "epoch": 851} {"train_loss": -5.549996376037598, "global_step": 35760, "epoch": 851} {"train_loss": -5.536375522613525, "global_step": 35761, "epoch": 851} {"train_loss": -5.585510730743408, "global_step": 35762, "epoch": 851} {"train_loss": -5.637289047241211, "global_step": 35763, "epoch": 851} {"train_loss": -5.458356857299805, "global_step": 35764, "epoch": 851} {"train_loss": -5.524666786193848, "global_step": 35765, "epoch": 851} {"train_loss": -5.579174041748047, "global_step": 35766, "epoch": 851} {"train_loss": -5.4098615646362305, "global_step": 35767, "epoch": 851} {"train_loss": -5.5274152755737305, "global_step": 35768, "epoch": 851} {"train_loss": -5.505227088928223, "global_step": 35769, "epoch": 851} {"train_loss": -5.4433674812316895, "global_step": 35770, "epoch": 851} {"train_loss": -5.5157670974731445, "global_step": 35771, "epoch": 851} {"train_loss": -5.572419166564941, "global_step": 35772, "epoch": 851} {"train_loss": -5.474937915802002, "global_step": 35773, "epoch": 851} {"train_loss": -5.5030059814453125, "global_step": 35774, "epoch": 851} {"train_loss": -5.449592590332031, "global_step": 35775, "epoch": 851} {"train_loss": -5.661639213562012, "global_step": 35776, "epoch": 851} {"train_loss": -5.609180450439453, "global_step": 35777, "epoch": 851} {"train_loss": -5.413232803344727, "global_step": 35778, "epoch": 851} {"train_loss": -5.605697154998779, "global_step": 35779, "epoch": 851} {"train_loss": -5.532322883605957, "global_step": 35780, "epoch": 851} {"train_loss": -5.512755393981934, "global_step": 35781, "epoch": 851} {"train_loss": -5.648464202880859, "global_step": 35782, "epoch": 851} {"train_loss": -5.540149473008656, "global_step": 35783, "epoch": 851, "val_loss": 62523.19921875} {"train_loss": -5.550273895263672, "global_step": 35784, "epoch": 852} {"train_loss": -5.517600059509277, "global_step": 35785, "epoch": 852} {"train_loss": -5.763428211212158, "global_step": 35786, "epoch": 852} {"train_loss": -5.5107316970825195, "global_step": 35787, "epoch": 852} {"train_loss": -5.5611958503723145, "global_step": 35788, "epoch": 852} {"train_loss": -5.590994358062744, "global_step": 35789, "epoch": 852} {"train_loss": -5.569599151611328, "global_step": 35790, "epoch": 852} {"train_loss": -5.672794342041016, "global_step": 35791, "epoch": 852} {"train_loss": -5.606172561645508, "global_step": 35792, "epoch": 852} {"train_loss": -5.611591815948486, "global_step": 35793, "epoch": 852} {"train_loss": -5.570732116699219, "global_step": 35794, "epoch": 852} {"train_loss": -5.532506942749023, "global_step": 35795, "epoch": 852} {"train_loss": -5.4209465980529785, "global_step": 35796, "epoch": 852} {"train_loss": -5.675625324249268, "global_step": 35797, "epoch": 852} {"train_loss": -5.505379676818848, "global_step": 35798, "epoch": 852} {"train_loss": -5.606542587280273, "global_step": 35799, "epoch": 852} {"train_loss": -5.517431735992432, "global_step": 35800, "epoch": 852} {"train_loss": -5.5112199783325195, "global_step": 35801, "epoch": 852} {"train_loss": -5.574361801147461, "global_step": 35802, "epoch": 852} {"train_loss": -5.597117900848389, "global_step": 35803, "epoch": 852} {"train_loss": -5.444944858551025, "global_step": 35804, "epoch": 852} {"train_loss": -5.524720191955566, "global_step": 35805, "epoch": 852} {"train_loss": -5.575584411621094, "global_step": 35806, "epoch": 852} {"train_loss": -5.533363342285156, "global_step": 35807, "epoch": 852} {"train_loss": -5.61522102355957, "global_step": 35808, "epoch": 852} {"train_loss": -5.621859550476074, "global_step": 35809, "epoch": 852} {"train_loss": -5.667516708374023, "global_step": 35810, "epoch": 852} {"train_loss": -5.545415878295898, "global_step": 35811, "epoch": 852} {"train_loss": -5.54599142074585, "global_step": 35812, "epoch": 852} {"train_loss": -5.622344493865967, "global_step": 35813, "epoch": 852} {"train_loss": -5.598532199859619, "global_step": 35814, "epoch": 852} {"train_loss": -5.582516670227051, "global_step": 35815, "epoch": 852} {"train_loss": -5.532075881958008, "global_step": 35816, "epoch": 852} {"train_loss": -5.56764554977417, "global_step": 35817, "epoch": 852} {"train_loss": -5.611454010009766, "global_step": 35818, "epoch": 852} {"train_loss": -5.628255367279053, "global_step": 35819, "epoch": 852} {"train_loss": -5.587535858154297, "global_step": 35820, "epoch": 852} {"train_loss": -5.385534286499023, "global_step": 35821, "epoch": 852} {"train_loss": -5.700901985168457, "global_step": 35822, "epoch": 852} {"train_loss": -5.592792987823486, "global_step": 35823, "epoch": 852} {"train_loss": -5.646716117858887, "global_step": 35824, "epoch": 852} {"train_loss": -5.575101534525554, "global_step": 35825, "epoch": 852, "val_loss": 62364.22265625} {"train_loss": -5.594958305358887, "global_step": 35826, "epoch": 853} {"train_loss": -5.502000331878662, "global_step": 35827, "epoch": 853} {"train_loss": -5.598432540893555, "global_step": 35828, "epoch": 853} {"train_loss": -5.5723090171813965, "global_step": 35829, "epoch": 853} {"train_loss": -5.647801399230957, "global_step": 35830, "epoch": 853} {"train_loss": -5.634515762329102, "global_step": 35831, "epoch": 853} {"train_loss": -5.511784076690674, "global_step": 35832, "epoch": 853} {"train_loss": -5.641599655151367, "global_step": 35833, "epoch": 853} {"train_loss": -5.504868984222412, "global_step": 35834, "epoch": 853} {"train_loss": -5.685027122497559, "global_step": 35835, "epoch": 853} {"train_loss": -5.620460510253906, "global_step": 35836, "epoch": 853} {"train_loss": -5.6142425537109375, "global_step": 35837, "epoch": 853} {"train_loss": -5.690257549285889, "global_step": 35838, "epoch": 853} {"train_loss": -5.543753623962402, "global_step": 35839, "epoch": 853} {"train_loss": -5.619068145751953, "global_step": 35840, "epoch": 853} {"train_loss": -5.575343132019043, "global_step": 35841, "epoch": 853} {"train_loss": -5.63798713684082, "global_step": 35842, "epoch": 853} {"train_loss": -5.575080871582031, "global_step": 35843, "epoch": 853} {"train_loss": -5.519769191741943, "global_step": 35844, "epoch": 853} {"train_loss": -5.478343963623047, "global_step": 35845, "epoch": 853} {"train_loss": -5.491557598114014, "global_step": 35846, "epoch": 853} {"train_loss": -5.529041290283203, "global_step": 35847, "epoch": 853} {"train_loss": -5.649431228637695, "global_step": 35848, "epoch": 853} {"train_loss": -5.583788871765137, "global_step": 35849, "epoch": 853} {"train_loss": -5.604316711425781, "global_step": 35850, "epoch": 853} {"train_loss": -5.514747142791748, "global_step": 35851, "epoch": 853} {"train_loss": -5.458864688873291, "global_step": 35852, "epoch": 853} {"train_loss": -5.540622711181641, "global_step": 35853, "epoch": 853} {"train_loss": -5.508114337921143, "global_step": 35854, "epoch": 853} {"train_loss": -5.502723217010498, "global_step": 35855, "epoch": 853} {"train_loss": -5.561722755432129, "global_step": 35856, "epoch": 853} {"train_loss": -5.618593215942383, "global_step": 35857, "epoch": 853} {"train_loss": -5.569055557250977, "global_step": 35858, "epoch": 853} {"train_loss": -5.496107578277588, "global_step": 35859, "epoch": 853} {"train_loss": -5.644440650939941, "global_step": 35860, "epoch": 853} {"train_loss": -5.6848835945129395, "global_step": 35861, "epoch": 853} {"train_loss": -5.6067585945129395, "global_step": 35862, "epoch": 853} {"train_loss": -5.708982467651367, "global_step": 35863, "epoch": 853} {"train_loss": -5.622945308685303, "global_step": 35864, "epoch": 853} {"train_loss": -5.5650482177734375, "global_step": 35865, "epoch": 853} {"train_loss": -5.58340311050415, "global_step": 35866, "epoch": 853} {"train_loss": -5.579798448653448, "global_step": 35867, "epoch": 853, "val_loss": 63025.5546875} {"train_loss": -5.47646427154541, "global_step": 35868, "epoch": 854} {"train_loss": -5.53116512298584, "global_step": 35869, "epoch": 854} {"train_loss": -5.452162742614746, "global_step": 35870, "epoch": 854} {"train_loss": -5.460649490356445, "global_step": 35871, "epoch": 854} {"train_loss": -5.508142471313477, "global_step": 35872, "epoch": 854} {"train_loss": -5.672970771789551, "global_step": 35873, "epoch": 854} {"train_loss": -5.378037929534912, "global_step": 35874, "epoch": 854} {"train_loss": -5.576373100280762, "global_step": 35875, "epoch": 854} {"train_loss": -5.545539855957031, "global_step": 35876, "epoch": 854} {"train_loss": -5.456406116485596, "global_step": 35877, "epoch": 854} {"train_loss": -5.611563682556152, "global_step": 35878, "epoch": 854} {"train_loss": -5.573136806488037, "global_step": 35879, "epoch": 854} {"train_loss": -5.509271144866943, "global_step": 35880, "epoch": 854} {"train_loss": -5.5289692878723145, "global_step": 35881, "epoch": 854} {"train_loss": -5.456895351409912, "global_step": 35882, "epoch": 854} {"train_loss": -5.590007781982422, "global_step": 35883, "epoch": 854} {"train_loss": -5.586930274963379, "global_step": 35884, "epoch": 854} {"train_loss": -5.552267074584961, "global_step": 35885, "epoch": 854} {"train_loss": -5.554708480834961, "global_step": 35886, "epoch": 854} {"train_loss": -5.472246170043945, "global_step": 35887, "epoch": 854} {"train_loss": -5.579615592956543, "global_step": 35888, "epoch": 854} {"train_loss": -5.751997947692871, "global_step": 35889, "epoch": 854} {"train_loss": -5.485307216644287, "global_step": 35890, "epoch": 854} {"train_loss": -5.593505859375, "global_step": 35891, "epoch": 854} {"train_loss": -5.603154182434082, "global_step": 35892, "epoch": 854} {"train_loss": -5.656323432922363, "global_step": 35893, "epoch": 854} {"train_loss": -5.601210117340088, "global_step": 35894, "epoch": 854} {"train_loss": -5.524928092956543, "global_step": 35895, "epoch": 854} {"train_loss": -5.524206161499023, "global_step": 35896, "epoch": 854} {"train_loss": -5.656241416931152, "global_step": 35897, "epoch": 854} {"train_loss": -5.6111578941345215, "global_step": 35898, "epoch": 854} {"train_loss": -5.57297420501709, "global_step": 35899, "epoch": 854} {"train_loss": -5.493854522705078, "global_step": 35900, "epoch": 854} {"train_loss": -5.541568756103516, "global_step": 35901, "epoch": 854} {"train_loss": -5.558166027069092, "global_step": 35902, "epoch": 854} {"train_loss": -5.697772026062012, "global_step": 35903, "epoch": 854} {"train_loss": -5.577771186828613, "global_step": 35904, "epoch": 854} {"train_loss": -5.538571834564209, "global_step": 35905, "epoch": 854} {"train_loss": -5.755884170532227, "global_step": 35906, "epoch": 854} {"train_loss": -5.409276485443115, "global_step": 35907, "epoch": 854} {"train_loss": -5.669169902801514, "global_step": 35908, "epoch": 854} {"train_loss": -5.559901282900856, "global_step": 35909, "epoch": 854, "val_loss": 62520.6875} {"train_loss": -5.495062828063965, "global_step": 35910, "epoch": 855} {"train_loss": -5.504693984985352, "global_step": 35911, "epoch": 855} {"train_loss": -5.479034423828125, "global_step": 35912, "epoch": 855} {"train_loss": -5.461103439331055, "global_step": 35913, "epoch": 855} {"train_loss": -5.5637640953063965, "global_step": 35914, "epoch": 855} {"train_loss": -5.441141128540039, "global_step": 35915, "epoch": 855} {"train_loss": -5.527204990386963, "global_step": 35916, "epoch": 855} {"train_loss": -5.578225135803223, "global_step": 35917, "epoch": 855} {"train_loss": -5.505863189697266, "global_step": 35918, "epoch": 855} {"train_loss": -5.396925926208496, "global_step": 35919, "epoch": 855} {"train_loss": -5.69660758972168, "global_step": 35920, "epoch": 855} {"train_loss": -5.566229820251465, "global_step": 35921, "epoch": 855} {"train_loss": -5.457083225250244, "global_step": 35922, "epoch": 855} {"train_loss": -5.617290496826172, "global_step": 35923, "epoch": 855} {"train_loss": -5.462792873382568, "global_step": 35924, "epoch": 855} {"train_loss": -5.568299770355225, "global_step": 35925, "epoch": 855} {"train_loss": -5.623170375823975, "global_step": 35926, "epoch": 855} {"train_loss": -5.5547685623168945, "global_step": 35927, "epoch": 855} {"train_loss": -5.664000511169434, "global_step": 35928, "epoch": 855} {"train_loss": -5.51140022277832, "global_step": 35929, "epoch": 855} {"train_loss": -5.620510101318359, "global_step": 35930, "epoch": 855} {"train_loss": -5.529536724090576, "global_step": 35931, "epoch": 855} {"train_loss": -5.6125359535217285, "global_step": 35932, "epoch": 855} {"train_loss": -5.412484169006348, "global_step": 35933, "epoch": 855} {"train_loss": -5.39959192276001, "global_step": 35934, "epoch": 855} {"train_loss": -5.601973533630371, "global_step": 35935, "epoch": 855} {"train_loss": -5.526291847229004, "global_step": 35936, "epoch": 855} {"train_loss": -5.692798614501953, "global_step": 35937, "epoch": 855} {"train_loss": -5.619663715362549, "global_step": 35938, "epoch": 855} {"train_loss": -5.506567001342773, "global_step": 35939, "epoch": 855} {"train_loss": -5.448552131652832, "global_step": 35940, "epoch": 855} {"train_loss": -5.507887840270996, "global_step": 35941, "epoch": 855} {"train_loss": -5.555697441101074, "global_step": 35942, "epoch": 855} {"train_loss": -5.3892822265625, "global_step": 35943, "epoch": 855} {"train_loss": -5.576486587524414, "global_step": 35944, "epoch": 855} {"train_loss": -5.591405391693115, "global_step": 35945, "epoch": 855} {"train_loss": -5.487817764282227, "global_step": 35946, "epoch": 855} {"train_loss": -5.697630882263184, "global_step": 35947, "epoch": 855} {"train_loss": -5.673733711242676, "global_step": 35948, "epoch": 855} {"train_loss": -5.439142227172852, "global_step": 35949, "epoch": 855} {"train_loss": -5.626003265380859, "global_step": 35950, "epoch": 855} {"train_loss": -5.542836007617769, "global_step": 35951, "epoch": 855, "val_loss": 62556.4140625} {"train_loss": -5.482487201690674, "global_step": 35952, "epoch": 856} {"train_loss": -5.519062042236328, "global_step": 35953, "epoch": 856} {"train_loss": -5.486963272094727, "global_step": 35954, "epoch": 856} {"train_loss": -5.437005996704102, "global_step": 35955, "epoch": 856} {"train_loss": -5.3619771003723145, "global_step": 35956, "epoch": 856} {"train_loss": -5.569159030914307, "global_step": 35957, "epoch": 856} {"train_loss": -5.404843330383301, "global_step": 35958, "epoch": 856} {"train_loss": -5.555928707122803, "global_step": 35959, "epoch": 856} {"train_loss": -5.53426456451416, "global_step": 35960, "epoch": 856} {"train_loss": -5.373287677764893, "global_step": 35961, "epoch": 856} {"train_loss": -5.568879127502441, "global_step": 35962, "epoch": 856} {"train_loss": -5.582433700561523, "global_step": 35963, "epoch": 856} {"train_loss": -5.494453430175781, "global_step": 35964, "epoch": 856} {"train_loss": -5.705191612243652, "global_step": 35965, "epoch": 856} {"train_loss": -5.50730562210083, "global_step": 35966, "epoch": 856} {"train_loss": -5.411533355712891, "global_step": 35967, "epoch": 856} {"train_loss": -5.550079822540283, "global_step": 35968, "epoch": 856} {"train_loss": -5.449847221374512, "global_step": 35969, "epoch": 856} {"train_loss": -5.607328414916992, "global_step": 35970, "epoch": 856} {"train_loss": -5.536798477172852, "global_step": 35971, "epoch": 856} {"train_loss": -5.600923538208008, "global_step": 35972, "epoch": 856} {"train_loss": -5.551253318786621, "global_step": 35973, "epoch": 856} {"train_loss": -5.519807815551758, "global_step": 35974, "epoch": 856} {"train_loss": -5.51981782913208, "global_step": 35975, "epoch": 856} {"train_loss": -5.561287879943848, "global_step": 35976, "epoch": 856} {"train_loss": -5.516137599945068, "global_step": 35977, "epoch": 856} {"train_loss": -5.5814948081970215, "global_step": 35978, "epoch": 856} {"train_loss": -5.5672688484191895, "global_step": 35979, "epoch": 856} {"train_loss": -5.615011692047119, "global_step": 35980, "epoch": 856} {"train_loss": -5.562582969665527, "global_step": 35981, "epoch": 856} {"train_loss": -5.516358852386475, "global_step": 35982, "epoch": 856} {"train_loss": -5.477810382843018, "global_step": 35983, "epoch": 856} {"train_loss": -5.572240829467773, "global_step": 35984, "epoch": 856} {"train_loss": -5.5354156494140625, "global_step": 35985, "epoch": 856} {"train_loss": -5.636045932769775, "global_step": 35986, "epoch": 856} {"train_loss": -5.534529685974121, "global_step": 35987, "epoch": 856} {"train_loss": -5.572977066040039, "global_step": 35988, "epoch": 856} {"train_loss": -5.494476318359375, "global_step": 35989, "epoch": 856} {"train_loss": -5.5229926109313965, "global_step": 35990, "epoch": 856} {"train_loss": -5.565065383911133, "global_step": 35991, "epoch": 856} {"train_loss": -5.537261009216309, "global_step": 35992, "epoch": 856} {"train_loss": -5.526105846677508, "global_step": 35993, "epoch": 856, "val_loss": 62293.22265625} {"train_loss": -5.505559921264648, "global_step": 35994, "epoch": 857} {"train_loss": -5.4332075119018555, "global_step": 35995, "epoch": 857} {"train_loss": -5.7989935874938965, "global_step": 35996, "epoch": 857} {"train_loss": -5.433940887451172, "global_step": 35997, "epoch": 857} {"train_loss": -5.398509502410889, "global_step": 35998, "epoch": 857} {"train_loss": -5.434761047363281, "global_step": 35999, "epoch": 857} {"train_loss": -5.482282638549805, "global_step": 36000, "epoch": 857} {"train_loss": -5.409717559814453, "global_step": 36001, "epoch": 857} {"train_loss": -5.605879783630371, "global_step": 36002, "epoch": 857} {"train_loss": -5.5588788986206055, "global_step": 36003, "epoch": 857} {"train_loss": -5.35341739654541, "global_step": 36004, "epoch": 857} {"train_loss": -5.550528526306152, "global_step": 36005, "epoch": 857} {"train_loss": -5.5670952796936035, "global_step": 36006, "epoch": 857} {"train_loss": -5.558097839355469, "global_step": 36007, "epoch": 857} {"train_loss": -5.635739803314209, "global_step": 36008, "epoch": 857} {"train_loss": -5.371822834014893, "global_step": 36009, "epoch": 857} {"train_loss": -5.631755828857422, "global_step": 36010, "epoch": 857} {"train_loss": -5.622500419616699, "global_step": 36011, "epoch": 857} {"train_loss": -5.610743522644043, "global_step": 36012, "epoch": 857} {"train_loss": -5.4972333908081055, "global_step": 36013, "epoch": 857} {"train_loss": -5.489253044128418, "global_step": 36014, "epoch": 857} {"train_loss": -5.648090362548828, "global_step": 36015, "epoch": 857} {"train_loss": -5.662118434906006, "global_step": 36016, "epoch": 857} {"train_loss": -5.49308967590332, "global_step": 36017, "epoch": 857} {"train_loss": -5.606345176696777, "global_step": 36018, "epoch": 857} {"train_loss": -5.5863752365112305, "global_step": 36019, "epoch": 857} {"train_loss": -5.626156806945801, "global_step": 36020, "epoch": 857} {"train_loss": -5.570488452911377, "global_step": 36021, "epoch": 857} {"train_loss": -5.5948405265808105, "global_step": 36022, "epoch": 857} {"train_loss": -5.694844722747803, "global_step": 36023, "epoch": 857} {"train_loss": -5.521967887878418, "global_step": 36024, "epoch": 857} {"train_loss": -5.503198623657227, "global_step": 36025, "epoch": 857} {"train_loss": -5.602763652801514, "global_step": 36026, "epoch": 857} {"train_loss": -5.635791301727295, "global_step": 36027, "epoch": 857} {"train_loss": -5.439695358276367, "global_step": 36028, "epoch": 857} {"train_loss": -5.532287120819092, "global_step": 36029, "epoch": 857} {"train_loss": -5.48803186416626, "global_step": 36030, "epoch": 857} {"train_loss": -5.518052101135254, "global_step": 36031, "epoch": 857} {"train_loss": -5.670732498168945, "global_step": 36032, "epoch": 857} {"train_loss": -5.531564712524414, "global_step": 36033, "epoch": 857} {"train_loss": -5.45474910736084, "global_step": 36034, "epoch": 857} {"train_loss": -5.543793349038987, "global_step": 36035, "epoch": 857, "val_loss": 62508.1875} {"train_loss": -5.6430511474609375, "global_step": 36036, "epoch": 858} {"train_loss": -5.547208786010742, "global_step": 36037, "epoch": 858} {"train_loss": -5.458723068237305, "global_step": 36038, "epoch": 858} {"train_loss": -5.577853202819824, "global_step": 36039, "epoch": 858} {"train_loss": -5.573112487792969, "global_step": 36040, "epoch": 858} {"train_loss": -5.5487236976623535, "global_step": 36041, "epoch": 858} {"train_loss": -5.622260093688965, "global_step": 36042, "epoch": 858} {"train_loss": -5.60544490814209, "global_step": 36043, "epoch": 858} {"train_loss": -5.591900825500488, "global_step": 36044, "epoch": 858} {"train_loss": -5.601156711578369, "global_step": 36045, "epoch": 858} {"train_loss": -5.4467315673828125, "global_step": 36046, "epoch": 858} {"train_loss": -5.6202192306518555, "global_step": 36047, "epoch": 858} {"train_loss": -5.638377666473389, "global_step": 36048, "epoch": 858} {"train_loss": -5.568670272827148, "global_step": 36049, "epoch": 858} {"train_loss": -5.670594215393066, "global_step": 36050, "epoch": 858} {"train_loss": -5.4879584312438965, "global_step": 36051, "epoch": 858} {"train_loss": -5.528074264526367, "global_step": 36052, "epoch": 858} {"train_loss": -5.52557373046875, "global_step": 36053, "epoch": 858} {"train_loss": -5.529921531677246, "global_step": 36054, "epoch": 858} {"train_loss": -5.528188705444336, "global_step": 36055, "epoch": 858} {"train_loss": -5.607303142547607, "global_step": 36056, "epoch": 858} {"train_loss": -5.430315971374512, "global_step": 36057, "epoch": 858} {"train_loss": -5.69281005859375, "global_step": 36058, "epoch": 858} {"train_loss": -5.648820877075195, "global_step": 36059, "epoch": 858} {"train_loss": -5.68086051940918, "global_step": 36060, "epoch": 858} {"train_loss": -5.527878761291504, "global_step": 36061, "epoch": 858} {"train_loss": -5.621854305267334, "global_step": 36062, "epoch": 858} {"train_loss": -5.7062602043151855, "global_step": 36063, "epoch": 858} {"train_loss": -5.6992645263671875, "global_step": 36064, "epoch": 858} {"train_loss": -5.6641845703125, "global_step": 36065, "epoch": 858} {"train_loss": -5.616735458374023, "global_step": 36066, "epoch": 858} {"train_loss": -5.615909099578857, "global_step": 36067, "epoch": 858} {"train_loss": -5.545204162597656, "global_step": 36068, "epoch": 858} {"train_loss": -5.54139518737793, "global_step": 36069, "epoch": 858} {"train_loss": -5.55800724029541, "global_step": 36070, "epoch": 858} {"train_loss": -5.571085453033447, "global_step": 36071, "epoch": 858} {"train_loss": -5.614279747009277, "global_step": 36072, "epoch": 858} {"train_loss": -5.676115989685059, "global_step": 36073, "epoch": 858} {"train_loss": -5.558407783508301, "global_step": 36074, "epoch": 858} {"train_loss": -5.538300514221191, "global_step": 36075, "epoch": 858} {"train_loss": -5.4615068435668945, "global_step": 36076, "epoch": 858} {"train_loss": -5.5836030188060946, "global_step": 36077, "epoch": 858, "val_loss": 62426.91796875} {"train_loss": -5.68171501159668, "global_step": 36078, "epoch": 859} {"train_loss": -5.5914201736450195, "global_step": 36079, "epoch": 859} {"train_loss": -5.594873905181885, "global_step": 36080, "epoch": 859} {"train_loss": -5.506217002868652, "global_step": 36081, "epoch": 859} {"train_loss": -5.583168029785156, "global_step": 36082, "epoch": 859} {"train_loss": -5.5246171951293945, "global_step": 36083, "epoch": 859} {"train_loss": -5.616982460021973, "global_step": 36084, "epoch": 859} {"train_loss": -5.641417026519775, "global_step": 36085, "epoch": 859} {"train_loss": -5.51777458190918, "global_step": 36086, "epoch": 859} {"train_loss": -5.617927551269531, "global_step": 36087, "epoch": 859} {"train_loss": -5.592438697814941, "global_step": 36088, "epoch": 859} {"train_loss": -5.57682466506958, "global_step": 36089, "epoch": 859} {"train_loss": -5.570605278015137, "global_step": 36090, "epoch": 859} {"train_loss": -5.644491195678711, "global_step": 36091, "epoch": 859} {"train_loss": -5.631276607513428, "global_step": 36092, "epoch": 859} {"train_loss": -5.607726097106934, "global_step": 36093, "epoch": 859} {"train_loss": -5.6742448806762695, "global_step": 36094, "epoch": 859} {"train_loss": -5.667147636413574, "global_step": 36095, "epoch": 859} {"train_loss": -5.526881217956543, "global_step": 36096, "epoch": 859} {"train_loss": -5.720800399780273, "global_step": 36097, "epoch": 859} {"train_loss": -5.559228897094727, "global_step": 36098, "epoch": 859} {"train_loss": -5.580475330352783, "global_step": 36099, "epoch": 859} {"train_loss": -5.589325428009033, "global_step": 36100, "epoch": 859} {"train_loss": -5.633575439453125, "global_step": 36101, "epoch": 859} {"train_loss": -5.5023193359375, "global_step": 36102, "epoch": 859} {"train_loss": -5.479423522949219, "global_step": 36103, "epoch": 859} {"train_loss": -5.474950790405273, "global_step": 36104, "epoch": 859} {"train_loss": -5.5811238288879395, "global_step": 36105, "epoch": 859} {"train_loss": -5.7871198654174805, "global_step": 36106, "epoch": 859} {"train_loss": -5.5174102783203125, "global_step": 36107, "epoch": 859} {"train_loss": -5.627106666564941, "global_step": 36108, "epoch": 859} {"train_loss": -5.508150100708008, "global_step": 36109, "epoch": 859} {"train_loss": -5.59760046005249, "global_step": 36110, "epoch": 859} {"train_loss": -5.56389045715332, "global_step": 36111, "epoch": 859} {"train_loss": -5.629733085632324, "global_step": 36112, "epoch": 859} {"train_loss": -5.4486894607543945, "global_step": 36113, "epoch": 859} {"train_loss": -5.600152969360352, "global_step": 36114, "epoch": 859} {"train_loss": -5.611294746398926, "global_step": 36115, "epoch": 859} {"train_loss": -5.559698104858398, "global_step": 36116, "epoch": 859} {"train_loss": -5.6041741371154785, "global_step": 36117, "epoch": 859} {"train_loss": -5.650701522827148, "global_step": 36118, "epoch": 859} {"train_loss": -5.590398198082333, "global_step": 36119, "epoch": 859, "val_loss": 62368.33203125} {"train_loss": -5.5140275955200195, "global_step": 36120, "epoch": 860} {"train_loss": -5.664170265197754, "global_step": 36121, "epoch": 860} {"train_loss": -5.49577522277832, "global_step": 36122, "epoch": 860} {"train_loss": -5.558127403259277, "global_step": 36123, "epoch": 860} {"train_loss": -5.547033309936523, "global_step": 36124, "epoch": 860} {"train_loss": -5.5872697830200195, "global_step": 36125, "epoch": 860} {"train_loss": -5.602579593658447, "global_step": 36126, "epoch": 860} {"train_loss": -5.535874843597412, "global_step": 36127, "epoch": 860} {"train_loss": -5.466280937194824, "global_step": 36128, "epoch": 860} {"train_loss": -5.603819847106934, "global_step": 36129, "epoch": 860} {"train_loss": -5.572583198547363, "global_step": 36130, "epoch": 860} {"train_loss": -5.5085344314575195, "global_step": 36131, "epoch": 860} {"train_loss": -5.394193172454834, "global_step": 36132, "epoch": 860} {"train_loss": -5.609441757202148, "global_step": 36133, "epoch": 860} {"train_loss": -5.5760087966918945, "global_step": 36134, "epoch": 860} {"train_loss": -5.559859275817871, "global_step": 36135, "epoch": 860} {"train_loss": -5.634875297546387, "global_step": 36136, "epoch": 860} {"train_loss": -5.365741729736328, "global_step": 36137, "epoch": 860} {"train_loss": -5.557096481323242, "global_step": 36138, "epoch": 860} {"train_loss": -5.646246910095215, "global_step": 36139, "epoch": 860} {"train_loss": -5.608879566192627, "global_step": 36140, "epoch": 860} {"train_loss": -5.534886360168457, "global_step": 36141, "epoch": 860} {"train_loss": -5.609330177307129, "global_step": 36142, "epoch": 860} {"train_loss": -5.690007209777832, "global_step": 36143, "epoch": 860} {"train_loss": -5.572849750518799, "global_step": 36144, "epoch": 860} {"train_loss": -5.599428653717041, "global_step": 36145, "epoch": 860} {"train_loss": -5.55466890335083, "global_step": 36146, "epoch": 860} {"train_loss": -5.628620147705078, "global_step": 36147, "epoch": 860} {"train_loss": -5.579106330871582, "global_step": 36148, "epoch": 860} {"train_loss": -5.475557327270508, "global_step": 36149, "epoch": 860} {"train_loss": -5.638124465942383, "global_step": 36150, "epoch": 860} {"train_loss": -5.782410144805908, "global_step": 36151, "epoch": 860} {"train_loss": -5.634807586669922, "global_step": 36152, "epoch": 860} {"train_loss": -5.665524482727051, "global_step": 36153, "epoch": 860} {"train_loss": -5.498231887817383, "global_step": 36154, "epoch": 860} {"train_loss": -5.502471923828125, "global_step": 36155, "epoch": 860} {"train_loss": -5.609920501708984, "global_step": 36156, "epoch": 860} {"train_loss": -5.572083950042725, "global_step": 36157, "epoch": 860} {"train_loss": -5.740708351135254, "global_step": 36158, "epoch": 860} {"train_loss": -5.607564449310303, "global_step": 36159, "epoch": 860} {"train_loss": -5.69793176651001, "global_step": 36160, "epoch": 860} {"train_loss": -5.581019049599057, "global_step": 36161, "epoch": 860, "val_loss": 62125.66015625} {"train_loss": -5.661165714263916, "global_step": 36162, "epoch": 861} {"train_loss": -5.638288974761963, "global_step": 36163, "epoch": 861} {"train_loss": -5.579174041748047, "global_step": 36164, "epoch": 861} {"train_loss": -5.577258586883545, "global_step": 36165, "epoch": 861} {"train_loss": -5.684167861938477, "global_step": 36166, "epoch": 861} {"train_loss": -5.492886066436768, "global_step": 36167, "epoch": 861} {"train_loss": -5.708813190460205, "global_step": 36168, "epoch": 861} {"train_loss": -5.54833459854126, "global_step": 36169, "epoch": 861} {"train_loss": -5.5980072021484375, "global_step": 36170, "epoch": 861} {"train_loss": -5.440306186676025, "global_step": 36171, "epoch": 861} {"train_loss": -5.530900955200195, "global_step": 36172, "epoch": 861} {"train_loss": -5.465260028839111, "global_step": 36173, "epoch": 861} {"train_loss": -5.668355464935303, "global_step": 36174, "epoch": 861} {"train_loss": -5.744717597961426, "global_step": 36175, "epoch": 861} {"train_loss": -5.584981918334961, "global_step": 36176, "epoch": 861} {"train_loss": -5.649959564208984, "global_step": 36177, "epoch": 861} {"train_loss": -5.4396772384643555, "global_step": 36178, "epoch": 861} {"train_loss": -5.656750679016113, "global_step": 36179, "epoch": 861} {"train_loss": -5.668569564819336, "global_step": 36180, "epoch": 861} {"train_loss": -5.566433906555176, "global_step": 36181, "epoch": 861} {"train_loss": -5.696811676025391, "global_step": 36182, "epoch": 861} {"train_loss": -5.606093406677246, "global_step": 36183, "epoch": 861} {"train_loss": -5.634433746337891, "global_step": 36184, "epoch": 861} {"train_loss": -5.632493019104004, "global_step": 36185, "epoch": 861} {"train_loss": -5.583253860473633, "global_step": 36186, "epoch": 861} {"train_loss": -5.63997220993042, "global_step": 36187, "epoch": 861} {"train_loss": -5.5995965003967285, "global_step": 36188, "epoch": 861} {"train_loss": -5.5918354988098145, "global_step": 36189, "epoch": 861} {"train_loss": -5.605611801147461, "global_step": 36190, "epoch": 861} {"train_loss": -5.6561994552612305, "global_step": 36191, "epoch": 861} {"train_loss": -5.540826797485352, "global_step": 36192, "epoch": 861} {"train_loss": -5.595032691955566, "global_step": 36193, "epoch": 861} {"train_loss": -5.435029983520508, "global_step": 36194, "epoch": 861} {"train_loss": -5.540258407592773, "global_step": 36195, "epoch": 861} {"train_loss": -5.46572208404541, "global_step": 36196, "epoch": 861} {"train_loss": -5.54278039932251, "global_step": 36197, "epoch": 861} {"train_loss": -5.507219314575195, "global_step": 36198, "epoch": 861} {"train_loss": -5.615736961364746, "global_step": 36199, "epoch": 861} {"train_loss": -5.568955421447754, "global_step": 36200, "epoch": 861} {"train_loss": -5.6268310546875, "global_step": 36201, "epoch": 861} {"train_loss": -5.456376552581787, "global_step": 36202, "epoch": 861} {"train_loss": -5.584880896977016, "global_step": 36203, "epoch": 861, "val_loss": 62551.58984375} {"train_loss": -5.540025234222412, "global_step": 36204, "epoch": 862} {"train_loss": -5.40129280090332, "global_step": 36205, "epoch": 862} {"train_loss": -5.774280548095703, "global_step": 36206, "epoch": 862} {"train_loss": -5.4701080322265625, "global_step": 36207, "epoch": 862} {"train_loss": -5.637860298156738, "global_step": 36208, "epoch": 862} {"train_loss": -5.535411834716797, "global_step": 36209, "epoch": 862} {"train_loss": -5.585892677307129, "global_step": 36210, "epoch": 862} {"train_loss": -5.536066055297852, "global_step": 36211, "epoch": 862} {"train_loss": -5.617135047912598, "global_step": 36212, "epoch": 862} {"train_loss": -5.517174243927002, "global_step": 36213, "epoch": 862} {"train_loss": -5.4075493812561035, "global_step": 36214, "epoch": 862} {"train_loss": -5.476612091064453, "global_step": 36215, "epoch": 862} {"train_loss": -5.561341285705566, "global_step": 36216, "epoch": 862} {"train_loss": -5.636270523071289, "global_step": 36217, "epoch": 862} {"train_loss": -5.534416675567627, "global_step": 36218, "epoch": 862} {"train_loss": -5.570509433746338, "global_step": 36219, "epoch": 862} {"train_loss": -5.571717262268066, "global_step": 36220, "epoch": 862} {"train_loss": -5.512208461761475, "global_step": 36221, "epoch": 862} {"train_loss": -5.635490417480469, "global_step": 36222, "epoch": 862} {"train_loss": -5.524378776550293, "global_step": 36223, "epoch": 862} {"train_loss": -5.555459499359131, "global_step": 36224, "epoch": 862} {"train_loss": -5.471908092498779, "global_step": 36225, "epoch": 862} {"train_loss": -5.627231597900391, "global_step": 36226, "epoch": 862} {"train_loss": -5.639254570007324, "global_step": 36227, "epoch": 862} {"train_loss": -5.672146797180176, "global_step": 36228, "epoch": 862} {"train_loss": -5.654244422912598, "global_step": 36229, "epoch": 862} {"train_loss": -5.5877580642700195, "global_step": 36230, "epoch": 862} {"train_loss": -5.476792812347412, "global_step": 36231, "epoch": 862} {"train_loss": -5.5428056716918945, "global_step": 36232, "epoch": 862} {"train_loss": -5.654140472412109, "global_step": 36233, "epoch": 862} {"train_loss": -5.553064823150635, "global_step": 36234, "epoch": 862} {"train_loss": -5.663148880004883, "global_step": 36235, "epoch": 862} {"train_loss": -5.467279434204102, "global_step": 36236, "epoch": 862} {"train_loss": -5.396533966064453, "global_step": 36237, "epoch": 862} {"train_loss": -5.422194480895996, "global_step": 36238, "epoch": 862} {"train_loss": -5.615939140319824, "global_step": 36239, "epoch": 862} {"train_loss": -5.529166221618652, "global_step": 36240, "epoch": 862} {"train_loss": -5.586209297180176, "global_step": 36241, "epoch": 862} {"train_loss": -5.679038047790527, "global_step": 36242, "epoch": 862} {"train_loss": -5.602104187011719, "global_step": 36243, "epoch": 862} {"train_loss": -5.531954765319824, "global_step": 36244, "epoch": 862} {"train_loss": -5.56159648441133, "global_step": 36245, "epoch": 862, "val_loss": 62774.4765625} {"train_loss": -5.49183464050293, "global_step": 36246, "epoch": 863} {"train_loss": -5.562499046325684, "global_step": 36247, "epoch": 863} {"train_loss": -5.713719367980957, "global_step": 36248, "epoch": 863} {"train_loss": -5.522698402404785, "global_step": 36249, "epoch": 863} {"train_loss": -5.514768123626709, "global_step": 36250, "epoch": 863} {"train_loss": -5.495425224304199, "global_step": 36251, "epoch": 863} {"train_loss": -5.626034736633301, "global_step": 36252, "epoch": 863} {"train_loss": -5.49189567565918, "global_step": 36253, "epoch": 863} {"train_loss": -5.549259185791016, "global_step": 36254, "epoch": 863} {"train_loss": -5.501593589782715, "global_step": 36255, "epoch": 863} {"train_loss": -5.512611389160156, "global_step": 36256, "epoch": 863} {"train_loss": -5.483776569366455, "global_step": 36257, "epoch": 863} {"train_loss": -5.542788982391357, "global_step": 36258, "epoch": 863} {"train_loss": -5.651247024536133, "global_step": 36259, "epoch": 863} {"train_loss": -5.544587135314941, "global_step": 36260, "epoch": 863} {"train_loss": -5.4112467765808105, "global_step": 36261, "epoch": 863} {"train_loss": -5.618569850921631, "global_step": 36262, "epoch": 863} {"train_loss": -5.412275314331055, "global_step": 36263, "epoch": 863} {"train_loss": -5.55871057510376, "global_step": 36264, "epoch": 863} {"train_loss": -5.589961528778076, "global_step": 36265, "epoch": 863} {"train_loss": -5.578384876251221, "global_step": 36266, "epoch": 863} {"train_loss": -5.58766508102417, "global_step": 36267, "epoch": 863} {"train_loss": -5.559267044067383, "global_step": 36268, "epoch": 863} {"train_loss": -5.69704532623291, "global_step": 36269, "epoch": 863} {"train_loss": -5.526013374328613, "global_step": 36270, "epoch": 863} {"train_loss": -5.579373359680176, "global_step": 36271, "epoch": 863} {"train_loss": -5.527262210845947, "global_step": 36272, "epoch": 863} {"train_loss": -5.539361953735352, "global_step": 36273, "epoch": 863} {"train_loss": -5.492923736572266, "global_step": 36274, "epoch": 863} {"train_loss": -5.539600849151611, "global_step": 36275, "epoch": 863} {"train_loss": -5.619202613830566, "global_step": 36276, "epoch": 863} {"train_loss": -5.488421440124512, "global_step": 36277, "epoch": 863} {"train_loss": -5.5039472579956055, "global_step": 36278, "epoch": 863} {"train_loss": -5.646205902099609, "global_step": 36279, "epoch": 863} {"train_loss": -5.5308942794799805, "global_step": 36280, "epoch": 863} {"train_loss": -5.539582252502441, "global_step": 36281, "epoch": 863} {"train_loss": -5.581174850463867, "global_step": 36282, "epoch": 863} {"train_loss": -5.650308609008789, "global_step": 36283, "epoch": 863} {"train_loss": -5.525630950927734, "global_step": 36284, "epoch": 863} {"train_loss": -5.664968967437744, "global_step": 36285, "epoch": 863} {"train_loss": -5.628688335418701, "global_step": 36286, "epoch": 863} {"train_loss": -5.555206185295468, "global_step": 36287, "epoch": 863, "val_loss": 62340.5234375} {"train_loss": -5.636165142059326, "global_step": 36288, "epoch": 864} {"train_loss": -5.566780090332031, "global_step": 36289, "epoch": 864} {"train_loss": -5.675782203674316, "global_step": 36290, "epoch": 864} {"train_loss": -5.483046054840088, "global_step": 36291, "epoch": 864} {"train_loss": -5.588453769683838, "global_step": 36292, "epoch": 864} {"train_loss": -5.5174760818481445, "global_step": 36293, "epoch": 864} {"train_loss": -5.495332717895508, "global_step": 36294, "epoch": 864} {"train_loss": -5.510875225067139, "global_step": 36295, "epoch": 864} {"train_loss": -5.507960319519043, "global_step": 36296, "epoch": 864} {"train_loss": -5.564915657043457, "global_step": 36297, "epoch": 864} {"train_loss": -5.551094055175781, "global_step": 36298, "epoch": 864} {"train_loss": -5.626313209533691, "global_step": 36299, "epoch": 864} {"train_loss": -5.597982883453369, "global_step": 36300, "epoch": 864} {"train_loss": -5.66977596282959, "global_step": 36301, "epoch": 864} {"train_loss": -5.620780944824219, "global_step": 36302, "epoch": 864} {"train_loss": -5.6258225440979, "global_step": 36303, "epoch": 864} {"train_loss": -5.522439956665039, "global_step": 36304, "epoch": 864} {"train_loss": -5.557544708251953, "global_step": 36305, "epoch": 864} {"train_loss": -5.64805269241333, "global_step": 36306, "epoch": 864} {"train_loss": -5.692637920379639, "global_step": 36307, "epoch": 864} {"train_loss": -5.674201965332031, "global_step": 36308, "epoch": 864} {"train_loss": -5.51461124420166, "global_step": 36309, "epoch": 864} {"train_loss": -5.532331466674805, "global_step": 36310, "epoch": 864} {"train_loss": -5.60847282409668, "global_step": 36311, "epoch": 864} {"train_loss": -5.635878562927246, "global_step": 36312, "epoch": 864} {"train_loss": -5.6251702308654785, "global_step": 36313, "epoch": 864} {"train_loss": -5.6043901443481445, "global_step": 36314, "epoch": 864} {"train_loss": -5.427734851837158, "global_step": 36315, "epoch": 864} {"train_loss": -5.455931663513184, "global_step": 36316, "epoch": 864} {"train_loss": -5.6812567710876465, "global_step": 36317, "epoch": 864} {"train_loss": -5.489068984985352, "global_step": 36318, "epoch": 864} {"train_loss": -5.461367607116699, "global_step": 36319, "epoch": 864} {"train_loss": -5.5362958908081055, "global_step": 36320, "epoch": 864} {"train_loss": -5.50645637512207, "global_step": 36321, "epoch": 864} {"train_loss": -5.525907516479492, "global_step": 36322, "epoch": 864} {"train_loss": -5.536758899688721, "global_step": 36323, "epoch": 864} {"train_loss": -5.445878982543945, "global_step": 36324, "epoch": 864} {"train_loss": -5.6084794998168945, "global_step": 36325, "epoch": 864} {"train_loss": -5.516289710998535, "global_step": 36326, "epoch": 864} {"train_loss": -5.505096435546875, "global_step": 36327, "epoch": 864} {"train_loss": -5.550485610961914, "global_step": 36328, "epoch": 864} {"train_loss": -5.564159223011562, "global_step": 36329, "epoch": 864, "val_loss": 62870.82421875} {"train_loss": -5.583195686340332, "global_step": 36330, "epoch": 865} {"train_loss": -5.6513566970825195, "global_step": 36331, "epoch": 865} {"train_loss": -5.481563568115234, "global_step": 36332, "epoch": 865} {"train_loss": -5.536805152893066, "global_step": 36333, "epoch": 865} {"train_loss": -5.648186683654785, "global_step": 36334, "epoch": 865} {"train_loss": -5.540897369384766, "global_step": 36335, "epoch": 865} {"train_loss": -5.575279235839844, "global_step": 36336, "epoch": 865} {"train_loss": -5.529732704162598, "global_step": 36337, "epoch": 865} {"train_loss": -5.588142395019531, "global_step": 36338, "epoch": 865} {"train_loss": -5.636224746704102, "global_step": 36339, "epoch": 865} {"train_loss": -5.558213710784912, "global_step": 36340, "epoch": 865} {"train_loss": -5.5315961837768555, "global_step": 36341, "epoch": 865} {"train_loss": -5.61391544342041, "global_step": 36342, "epoch": 865} {"train_loss": -5.624969959259033, "global_step": 36343, "epoch": 865} {"train_loss": -5.566132068634033, "global_step": 36344, "epoch": 865} {"train_loss": -5.627277374267578, "global_step": 36345, "epoch": 865} {"train_loss": -5.594265937805176, "global_step": 36346, "epoch": 865} {"train_loss": -5.600237846374512, "global_step": 36347, "epoch": 865} {"train_loss": -5.67310905456543, "global_step": 36348, "epoch": 865} {"train_loss": -5.59959077835083, "global_step": 36349, "epoch": 865} {"train_loss": -5.598110198974609, "global_step": 36350, "epoch": 865} {"train_loss": -5.55954647064209, "global_step": 36351, "epoch": 865} {"train_loss": -5.671281814575195, "global_step": 36352, "epoch": 865} {"train_loss": -5.537336349487305, "global_step": 36353, "epoch": 865} {"train_loss": -5.66453742980957, "global_step": 36354, "epoch": 865} {"train_loss": -5.612695693969727, "global_step": 36355, "epoch": 865} {"train_loss": -5.549073696136475, "global_step": 36356, "epoch": 865} {"train_loss": -5.586592197418213, "global_step": 36357, "epoch": 865} {"train_loss": -5.633145332336426, "global_step": 36358, "epoch": 865} {"train_loss": -5.614794731140137, "global_step": 36359, "epoch": 865} {"train_loss": -5.53270149230957, "global_step": 36360, "epoch": 865} {"train_loss": -5.479109764099121, "global_step": 36361, "epoch": 865} {"train_loss": -5.475297927856445, "global_step": 36362, "epoch": 865} {"train_loss": -5.506852149963379, "global_step": 36363, "epoch": 865} {"train_loss": -5.661144733428955, "global_step": 36364, "epoch": 865} {"train_loss": -5.562355995178223, "global_step": 36365, "epoch": 865} {"train_loss": -5.708371162414551, "global_step": 36366, "epoch": 865} {"train_loss": -5.609411716461182, "global_step": 36367, "epoch": 865} {"train_loss": -5.644052505493164, "global_step": 36368, "epoch": 865} {"train_loss": -5.556541442871094, "global_step": 36369, "epoch": 865} {"train_loss": -5.607196807861328, "global_step": 36370, "epoch": 865} {"train_loss": -5.590321688424973, "global_step": 36371, "epoch": 865, "val_loss": 62179.4453125} {"train_loss": -5.6602325439453125, "global_step": 36372, "epoch": 866} {"train_loss": -5.675699234008789, "global_step": 36373, "epoch": 866} {"train_loss": -5.5268235206604, "global_step": 36374, "epoch": 866} {"train_loss": -5.67981481552124, "global_step": 36375, "epoch": 866} {"train_loss": -5.51814603805542, "global_step": 36376, "epoch": 866} {"train_loss": -5.551085472106934, "global_step": 36377, "epoch": 866} {"train_loss": -5.659523963928223, "global_step": 36378, "epoch": 866} {"train_loss": -5.674433708190918, "global_step": 36379, "epoch": 866} {"train_loss": -5.685556411743164, "global_step": 36380, "epoch": 866} {"train_loss": -5.676673412322998, "global_step": 36381, "epoch": 866} {"train_loss": -5.613536834716797, "global_step": 36382, "epoch": 866} {"train_loss": -5.583253383636475, "global_step": 36383, "epoch": 866} {"train_loss": -5.562262058258057, "global_step": 36384, "epoch": 866} {"train_loss": -5.632134437561035, "global_step": 36385, "epoch": 866} {"train_loss": -5.605996131896973, "global_step": 36386, "epoch": 866} {"train_loss": -5.548645496368408, "global_step": 36387, "epoch": 866} {"train_loss": -5.420482635498047, "global_step": 36388, "epoch": 866} {"train_loss": -5.551461219787598, "global_step": 36389, "epoch": 866} {"train_loss": -5.569908618927002, "global_step": 36390, "epoch": 866} {"train_loss": -5.616496562957764, "global_step": 36391, "epoch": 866} {"train_loss": -5.632192611694336, "global_step": 36392, "epoch": 866} {"train_loss": -5.570556640625, "global_step": 36393, "epoch": 866} {"train_loss": -5.647873401641846, "global_step": 36394, "epoch": 866} {"train_loss": -5.483608245849609, "global_step": 36395, "epoch": 866} {"train_loss": -5.597062110900879, "global_step": 36396, "epoch": 866} {"train_loss": -5.4839701652526855, "global_step": 36397, "epoch": 866} {"train_loss": -5.513711929321289, "global_step": 36398, "epoch": 866} {"train_loss": -5.595855236053467, "global_step": 36399, "epoch": 866} {"train_loss": -5.652684211730957, "global_step": 36400, "epoch": 866} {"train_loss": -5.696737766265869, "global_step": 36401, "epoch": 866} {"train_loss": -5.613927841186523, "global_step": 36402, "epoch": 866} {"train_loss": -5.6447248458862305, "global_step": 36403, "epoch": 866} {"train_loss": -5.598780155181885, "global_step": 36404, "epoch": 866} {"train_loss": -5.559676647186279, "global_step": 36405, "epoch": 866} {"train_loss": -5.64163875579834, "global_step": 36406, "epoch": 866} {"train_loss": -5.469916343688965, "global_step": 36407, "epoch": 866} {"train_loss": -5.57981014251709, "global_step": 36408, "epoch": 866} {"train_loss": -5.539077281951904, "global_step": 36409, "epoch": 866} {"train_loss": -5.658069610595703, "global_step": 36410, "epoch": 866} {"train_loss": -5.507270812988281, "global_step": 36411, "epoch": 866} {"train_loss": -5.3256025314331055, "global_step": 36412, "epoch": 866} {"train_loss": -5.584493671144758, "global_step": 36413, "epoch": 866, "val_loss": 62153.8203125} {"train_loss": -5.5733323097229, "global_step": 36414, "epoch": 867} {"train_loss": -5.629042625427246, "global_step": 36415, "epoch": 867} {"train_loss": -5.5508952140808105, "global_step": 36416, "epoch": 867} {"train_loss": -5.618371486663818, "global_step": 36417, "epoch": 867} {"train_loss": -5.504030227661133, "global_step": 36418, "epoch": 867} {"train_loss": -5.56190299987793, "global_step": 36419, "epoch": 867} {"train_loss": -5.516026973724365, "global_step": 36420, "epoch": 867} {"train_loss": -5.440996170043945, "global_step": 36421, "epoch": 867} {"train_loss": -5.537095069885254, "global_step": 36422, "epoch": 867} {"train_loss": -5.5295562744140625, "global_step": 36423, "epoch": 867} {"train_loss": -5.519345283508301, "global_step": 36424, "epoch": 867} {"train_loss": -5.580010414123535, "global_step": 36425, "epoch": 867} {"train_loss": -5.707709789276123, "global_step": 36426, "epoch": 867} {"train_loss": -5.652599334716797, "global_step": 36427, "epoch": 867} {"train_loss": -5.749250888824463, "global_step": 36428, "epoch": 867} {"train_loss": -5.613297462463379, "global_step": 36429, "epoch": 867} {"train_loss": -5.651507377624512, "global_step": 36430, "epoch": 867} {"train_loss": -5.4718170166015625, "global_step": 36431, "epoch": 867} {"train_loss": -5.574853897094727, "global_step": 36432, "epoch": 867} {"train_loss": -5.38325309753418, "global_step": 36433, "epoch": 867} {"train_loss": -5.317584991455078, "global_step": 36434, "epoch": 867} {"train_loss": -5.649552345275879, "global_step": 36435, "epoch": 867} {"train_loss": -5.531180381774902, "global_step": 36436, "epoch": 867} {"train_loss": -5.554465293884277, "global_step": 36437, "epoch": 867} {"train_loss": -5.667089462280273, "global_step": 36438, "epoch": 867} {"train_loss": -5.554094314575195, "global_step": 36439, "epoch": 867} {"train_loss": -5.568167686462402, "global_step": 36440, "epoch": 867} {"train_loss": -5.621443271636963, "global_step": 36441, "epoch": 867} {"train_loss": -5.506970405578613, "global_step": 36442, "epoch": 867} {"train_loss": -5.505542755126953, "global_step": 36443, "epoch": 867} {"train_loss": -5.447361469268799, "global_step": 36444, "epoch": 867} {"train_loss": -5.611940383911133, "global_step": 36445, "epoch": 867} {"train_loss": -5.626804351806641, "global_step": 36446, "epoch": 867} {"train_loss": -5.415979385375977, "global_step": 36447, "epoch": 867} {"train_loss": -5.655741214752197, "global_step": 36448, "epoch": 867} {"train_loss": -5.589249610900879, "global_step": 36449, "epoch": 867} {"train_loss": -5.381124019622803, "global_step": 36450, "epoch": 867} {"train_loss": -5.56016731262207, "global_step": 36451, "epoch": 867} {"train_loss": -5.572068214416504, "global_step": 36452, "epoch": 867} {"train_loss": -5.539441108703613, "global_step": 36453, "epoch": 867} {"train_loss": -5.59428596496582, "global_step": 36454, "epoch": 867} {"train_loss": -5.556712547938029, "global_step": 36455, "epoch": 867, "val_loss": 62345.3125} {"train_loss": -5.543450832366943, "global_step": 36456, "epoch": 868} {"train_loss": -5.660076141357422, "global_step": 36457, "epoch": 868} {"train_loss": -5.529031276702881, "global_step": 36458, "epoch": 868} {"train_loss": -5.557933807373047, "global_step": 36459, "epoch": 868} {"train_loss": -5.633020401000977, "global_step": 36460, "epoch": 868} {"train_loss": -5.576353073120117, "global_step": 36461, "epoch": 868} {"train_loss": -5.57365608215332, "global_step": 36462, "epoch": 868} {"train_loss": -5.584786415100098, "global_step": 36463, "epoch": 868} {"train_loss": -5.503928184509277, "global_step": 36464, "epoch": 868} {"train_loss": -5.611837387084961, "global_step": 36465, "epoch": 868} {"train_loss": -5.5834856033325195, "global_step": 36466, "epoch": 868} {"train_loss": -5.677708625793457, "global_step": 36467, "epoch": 868} {"train_loss": -5.682085037231445, "global_step": 36468, "epoch": 868} {"train_loss": -5.579132080078125, "global_step": 36469, "epoch": 868} {"train_loss": -5.651388645172119, "global_step": 36470, "epoch": 868} {"train_loss": -5.528629779815674, "global_step": 36471, "epoch": 868} {"train_loss": -5.647214889526367, "global_step": 36472, "epoch": 868} {"train_loss": -5.55081844329834, "global_step": 36473, "epoch": 868} {"train_loss": -5.5636820793151855, "global_step": 36474, "epoch": 868} {"train_loss": -5.630160808563232, "global_step": 36475, "epoch": 868} {"train_loss": -5.629053115844727, "global_step": 36476, "epoch": 868} {"train_loss": -5.5066399574279785, "global_step": 36477, "epoch": 868} {"train_loss": -5.4700188636779785, "global_step": 36478, "epoch": 868} {"train_loss": -5.537429332733154, "global_step": 36479, "epoch": 868} {"train_loss": -5.642096996307373, "global_step": 36480, "epoch": 868} {"train_loss": -5.547450542449951, "global_step": 36481, "epoch": 868} {"train_loss": -5.642950534820557, "global_step": 36482, "epoch": 868} {"train_loss": -5.531496524810791, "global_step": 36483, "epoch": 868} {"train_loss": -5.630136013031006, "global_step": 36484, "epoch": 868} {"train_loss": -5.520280361175537, "global_step": 36485, "epoch": 868} {"train_loss": -5.532525062561035, "global_step": 36486, "epoch": 868} {"train_loss": -5.598085403442383, "global_step": 36487, "epoch": 868} {"train_loss": -5.565361022949219, "global_step": 36488, "epoch": 868} {"train_loss": -5.61142635345459, "global_step": 36489, "epoch": 868} {"train_loss": -5.723897457122803, "global_step": 36490, "epoch": 868} {"train_loss": -5.440361976623535, "global_step": 36491, "epoch": 868} {"train_loss": -5.686284065246582, "global_step": 36492, "epoch": 868} {"train_loss": -5.514732837677002, "global_step": 36493, "epoch": 868} {"train_loss": -5.44091796875, "global_step": 36494, "epoch": 868} {"train_loss": -5.636234760284424, "global_step": 36495, "epoch": 868} {"train_loss": -5.627538681030273, "global_step": 36496, "epoch": 868} {"train_loss": -5.584912572588239, "global_step": 36497, "epoch": 868, "val_loss": 62612.7265625} {"train_loss": -5.609740257263184, "global_step": 36498, "epoch": 869} {"train_loss": -5.453383922576904, "global_step": 36499, "epoch": 869} {"train_loss": -5.601473808288574, "global_step": 36500, "epoch": 869} {"train_loss": -5.641256332397461, "global_step": 36501, "epoch": 869} {"train_loss": -5.522125720977783, "global_step": 36502, "epoch": 869} {"train_loss": -5.558905601501465, "global_step": 36503, "epoch": 869} {"train_loss": -5.576913356781006, "global_step": 36504, "epoch": 869} {"train_loss": -5.571686744689941, "global_step": 36505, "epoch": 869} {"train_loss": -5.642847061157227, "global_step": 36506, "epoch": 869} {"train_loss": -5.6125898361206055, "global_step": 36507, "epoch": 869} {"train_loss": -5.433812618255615, "global_step": 36508, "epoch": 869} {"train_loss": -5.597137928009033, "global_step": 36509, "epoch": 869} {"train_loss": -5.568986892700195, "global_step": 36510, "epoch": 869} {"train_loss": -5.4578046798706055, "global_step": 36511, "epoch": 869} {"train_loss": -5.711394786834717, "global_step": 36512, "epoch": 869} {"train_loss": -5.5880584716796875, "global_step": 36513, "epoch": 869} {"train_loss": -5.5251970291137695, "global_step": 36514, "epoch": 869} {"train_loss": -5.523367404937744, "global_step": 36515, "epoch": 869} {"train_loss": -5.501401424407959, "global_step": 36516, "epoch": 869} {"train_loss": -5.653846263885498, "global_step": 36517, "epoch": 869} {"train_loss": -5.638609886169434, "global_step": 36518, "epoch": 869} {"train_loss": -5.433385848999023, "global_step": 36519, "epoch": 869} {"train_loss": -5.52178955078125, "global_step": 36520, "epoch": 869} {"train_loss": -5.633801460266113, "global_step": 36521, "epoch": 869} {"train_loss": -5.537632942199707, "global_step": 36522, "epoch": 869} {"train_loss": -5.713266372680664, "global_step": 36523, "epoch": 869} {"train_loss": -5.491415023803711, "global_step": 36524, "epoch": 869} {"train_loss": -5.541175842285156, "global_step": 36525, "epoch": 869} {"train_loss": -5.720044136047363, "global_step": 36526, "epoch": 869} {"train_loss": -5.65171480178833, "global_step": 36527, "epoch": 869} {"train_loss": -5.503220558166504, "global_step": 36528, "epoch": 869} {"train_loss": -5.58040714263916, "global_step": 36529, "epoch": 869} {"train_loss": -5.492725372314453, "global_step": 36530, "epoch": 869} {"train_loss": -5.4983744621276855, "global_step": 36531, "epoch": 869} {"train_loss": -5.6977715492248535, "global_step": 36532, "epoch": 869} {"train_loss": -5.420801162719727, "global_step": 36533, "epoch": 869} {"train_loss": -5.578129291534424, "global_step": 36534, "epoch": 869} {"train_loss": -5.422769546508789, "global_step": 36535, "epoch": 869} {"train_loss": -5.635396957397461, "global_step": 36536, "epoch": 869} {"train_loss": -5.48642635345459, "global_step": 36537, "epoch": 869} {"train_loss": -5.5639753341674805, "global_step": 36538, "epoch": 869} {"train_loss": -5.563153153374081, "global_step": 36539, "epoch": 869, "val_loss": 62199.0} {"train_loss": -5.571574687957764, "global_step": 36540, "epoch": 870} {"train_loss": -5.613173961639404, "global_step": 36541, "epoch": 870} {"train_loss": -5.601963996887207, "global_step": 36542, "epoch": 870} {"train_loss": -5.634427070617676, "global_step": 36543, "epoch": 870} {"train_loss": -5.567681312561035, "global_step": 36544, "epoch": 870} {"train_loss": -5.499485015869141, "global_step": 36545, "epoch": 870} {"train_loss": -5.658749103546143, "global_step": 36546, "epoch": 870} {"train_loss": -5.49395751953125, "global_step": 36547, "epoch": 870} {"train_loss": -5.663918972015381, "global_step": 36548, "epoch": 870} {"train_loss": -5.51101016998291, "global_step": 36549, "epoch": 870} {"train_loss": -5.612581253051758, "global_step": 36550, "epoch": 870} {"train_loss": -5.481093406677246, "global_step": 36551, "epoch": 870} {"train_loss": -5.3748345375061035, "global_step": 36552, "epoch": 870} {"train_loss": -5.4930572509765625, "global_step": 36553, "epoch": 870} {"train_loss": -5.559698104858398, "global_step": 36554, "epoch": 870} {"train_loss": -5.45637321472168, "global_step": 36555, "epoch": 870} {"train_loss": -5.542984485626221, "global_step": 36556, "epoch": 870} {"train_loss": -5.48356819152832, "global_step": 36557, "epoch": 870} {"train_loss": -5.514508247375488, "global_step": 36558, "epoch": 870} {"train_loss": -5.599613189697266, "global_step": 36559, "epoch": 870} {"train_loss": -5.5034966468811035, "global_step": 36560, "epoch": 870} {"train_loss": -5.535962104797363, "global_step": 36561, "epoch": 870} {"train_loss": -5.5703349113464355, "global_step": 36562, "epoch": 870} {"train_loss": -5.487483501434326, "global_step": 36563, "epoch": 870} {"train_loss": -5.659970283508301, "global_step": 36564, "epoch": 870} {"train_loss": -5.562802314758301, "global_step": 36565, "epoch": 870} {"train_loss": -5.456777572631836, "global_step": 36566, "epoch": 870} {"train_loss": -5.6065874099731445, "global_step": 36567, "epoch": 870} {"train_loss": -5.57415771484375, "global_step": 36568, "epoch": 870} {"train_loss": -5.440634250640869, "global_step": 36569, "epoch": 870} {"train_loss": -5.6453351974487305, "global_step": 36570, "epoch": 870} {"train_loss": -5.573938369750977, "global_step": 36571, "epoch": 870} {"train_loss": -5.5581817626953125, "global_step": 36572, "epoch": 870} {"train_loss": -5.587743759155273, "global_step": 36573, "epoch": 870} {"train_loss": -5.6416015625, "global_step": 36574, "epoch": 870} {"train_loss": -5.597841262817383, "global_step": 36575, "epoch": 870} {"train_loss": -5.766174793243408, "global_step": 36576, "epoch": 870} {"train_loss": -5.5154547691345215, "global_step": 36577, "epoch": 870} {"train_loss": -5.545910358428955, "global_step": 36578, "epoch": 870} {"train_loss": -5.557017803192139, "global_step": 36579, "epoch": 870} {"train_loss": -5.543129920959473, "global_step": 36580, "epoch": 870} {"train_loss": -5.561378115699405, "global_step": 36581, "epoch": 870, "val_loss": 62398.42578125} {"train_loss": -5.657627582550049, "global_step": 36582, "epoch": 871} {"train_loss": -5.566442966461182, "global_step": 36583, "epoch": 871} {"train_loss": -5.557705879211426, "global_step": 36584, "epoch": 871} {"train_loss": -5.576172351837158, "global_step": 36585, "epoch": 871} {"train_loss": -5.422058582305908, "global_step": 36586, "epoch": 871} {"train_loss": -5.682150840759277, "global_step": 36587, "epoch": 871} {"train_loss": -5.614770889282227, "global_step": 36588, "epoch": 871} {"train_loss": -5.518748760223389, "global_step": 36589, "epoch": 871} {"train_loss": -5.564797401428223, "global_step": 36590, "epoch": 871} {"train_loss": -5.568340301513672, "global_step": 36591, "epoch": 871} {"train_loss": -5.575605392456055, "global_step": 36592, "epoch": 871} {"train_loss": -5.483218193054199, "global_step": 36593, "epoch": 871} {"train_loss": -5.571305274963379, "global_step": 36594, "epoch": 871} {"train_loss": -5.556272506713867, "global_step": 36595, "epoch": 871} {"train_loss": -5.58889102935791, "global_step": 36596, "epoch": 871} {"train_loss": -5.594256401062012, "global_step": 36597, "epoch": 871} {"train_loss": -5.556407928466797, "global_step": 36598, "epoch": 871} {"train_loss": -5.687191963195801, "global_step": 36599, "epoch": 871} {"train_loss": -5.673281669616699, "global_step": 36600, "epoch": 871} {"train_loss": -5.489928245544434, "global_step": 36601, "epoch": 871} {"train_loss": -5.695584297180176, "global_step": 36602, "epoch": 871} {"train_loss": -5.680505275726318, "global_step": 36603, "epoch": 871} {"train_loss": -5.504571437835693, "global_step": 36604, "epoch": 871} {"train_loss": -5.593469619750977, "global_step": 36605, "epoch": 871} {"train_loss": -5.668526649475098, "global_step": 36606, "epoch": 871} {"train_loss": -5.531159400939941, "global_step": 36607, "epoch": 871} {"train_loss": -5.554885387420654, "global_step": 36608, "epoch": 871} {"train_loss": -5.483336925506592, "global_step": 36609, "epoch": 871} {"train_loss": -5.5355634689331055, "global_step": 36610, "epoch": 871} {"train_loss": -5.57958984375, "global_step": 36611, "epoch": 871} {"train_loss": -5.587396144866943, "global_step": 36612, "epoch": 871} {"train_loss": -5.6043620109558105, "global_step": 36613, "epoch": 871} {"train_loss": -5.602384567260742, "global_step": 36614, "epoch": 871} {"train_loss": -5.372269153594971, "global_step": 36615, "epoch": 871} {"train_loss": -5.641914367675781, "global_step": 36616, "epoch": 871} {"train_loss": -5.519913196563721, "global_step": 36617, "epoch": 871} {"train_loss": -5.629349231719971, "global_step": 36618, "epoch": 871} {"train_loss": -5.735326766967773, "global_step": 36619, "epoch": 871} {"train_loss": -5.379650592803955, "global_step": 36620, "epoch": 871} {"train_loss": -5.507472515106201, "global_step": 36621, "epoch": 871} {"train_loss": -5.588089466094971, "global_step": 36622, "epoch": 871} {"train_loss": -5.569882461002895, "global_step": 36623, "epoch": 871, "val_loss": 62475.39453125} {"train_loss": -5.503994941711426, "global_step": 36624, "epoch": 872} {"train_loss": -5.501935005187988, "global_step": 36625, "epoch": 872} {"train_loss": -5.553902626037598, "global_step": 36626, "epoch": 872} {"train_loss": -5.614083290100098, "global_step": 36627, "epoch": 872} {"train_loss": -5.321139812469482, "global_step": 36628, "epoch": 872} {"train_loss": -5.585995197296143, "global_step": 36629, "epoch": 872} {"train_loss": -5.446598529815674, "global_step": 36630, "epoch": 872} {"train_loss": -5.4889960289001465, "global_step": 36631, "epoch": 872} {"train_loss": -5.589382171630859, "global_step": 36632, "epoch": 872} {"train_loss": -5.464794635772705, "global_step": 36633, "epoch": 872} {"train_loss": -5.575759410858154, "global_step": 36634, "epoch": 872} {"train_loss": -5.479352951049805, "global_step": 36635, "epoch": 872} {"train_loss": -5.593133926391602, "global_step": 36636, "epoch": 872} {"train_loss": -5.413790702819824, "global_step": 36637, "epoch": 872} {"train_loss": -5.624258518218994, "global_step": 36638, "epoch": 872} {"train_loss": -5.549304962158203, "global_step": 36639, "epoch": 872} {"train_loss": -5.586124420166016, "global_step": 36640, "epoch": 872} {"train_loss": -5.523091793060303, "global_step": 36641, "epoch": 872} {"train_loss": -5.593609809875488, "global_step": 36642, "epoch": 872} {"train_loss": -5.5045671463012695, "global_step": 36643, "epoch": 872} {"train_loss": -5.63345193862915, "global_step": 36644, "epoch": 872} {"train_loss": -5.632878303527832, "global_step": 36645, "epoch": 872} {"train_loss": -5.469432353973389, "global_step": 36646, "epoch": 872} {"train_loss": -5.600465774536133, "global_step": 36647, "epoch": 872} {"train_loss": -5.604924201965332, "global_step": 36648, "epoch": 872} {"train_loss": -5.608712196350098, "global_step": 36649, "epoch": 872} {"train_loss": -5.669124126434326, "global_step": 36650, "epoch": 872} {"train_loss": -5.583985328674316, "global_step": 36651, "epoch": 872} {"train_loss": -5.623281955718994, "global_step": 36652, "epoch": 872} {"train_loss": -5.666202545166016, "global_step": 36653, "epoch": 872} {"train_loss": -5.50654411315918, "global_step": 36654, "epoch": 872} {"train_loss": -5.637637615203857, "global_step": 36655, "epoch": 872} {"train_loss": -5.5728840827941895, "global_step": 36656, "epoch": 872} {"train_loss": -5.584536075592041, "global_step": 36657, "epoch": 872} {"train_loss": -5.568089962005615, "global_step": 36658, "epoch": 872} {"train_loss": -5.608255386352539, "global_step": 36659, "epoch": 872} {"train_loss": -5.728309154510498, "global_step": 36660, "epoch": 872} {"train_loss": -5.748091697692871, "global_step": 36661, "epoch": 872} {"train_loss": -5.653557777404785, "global_step": 36662, "epoch": 872} {"train_loss": -5.597576141357422, "global_step": 36663, "epoch": 872} {"train_loss": -5.54927921295166, "global_step": 36664, "epoch": 872} {"train_loss": -5.571664605821882, "global_step": 36665, "epoch": 872, "val_loss": 62183.8125} {"train_loss": -5.657465934753418, "global_step": 36666, "epoch": 873} {"train_loss": -5.615913391113281, "global_step": 36667, "epoch": 873} {"train_loss": -5.535689353942871, "global_step": 36668, "epoch": 873} {"train_loss": -5.58114767074585, "global_step": 36669, "epoch": 873} {"train_loss": -5.7259745597839355, "global_step": 36670, "epoch": 873} {"train_loss": -5.60498571395874, "global_step": 36671, "epoch": 873} {"train_loss": -5.511425018310547, "global_step": 36672, "epoch": 873} {"train_loss": -5.558638572692871, "global_step": 36673, "epoch": 873} {"train_loss": -5.6208367347717285, "global_step": 36674, "epoch": 873} {"train_loss": -5.502737045288086, "global_step": 36675, "epoch": 873} {"train_loss": -5.689393997192383, "global_step": 36676, "epoch": 873} {"train_loss": -5.592806816101074, "global_step": 36677, "epoch": 873} {"train_loss": -5.62105131149292, "global_step": 36678, "epoch": 873} {"train_loss": -5.57511568069458, "global_step": 36679, "epoch": 873} {"train_loss": -5.628123760223389, "global_step": 36680, "epoch": 873} {"train_loss": -5.517945289611816, "global_step": 36681, "epoch": 873} {"train_loss": -5.575655937194824, "global_step": 36682, "epoch": 873} {"train_loss": -5.5629682540893555, "global_step": 36683, "epoch": 873} {"train_loss": -5.55953311920166, "global_step": 36684, "epoch": 873} {"train_loss": -5.504408836364746, "global_step": 36685, "epoch": 873} {"train_loss": -5.599787712097168, "global_step": 36686, "epoch": 873} {"train_loss": -5.528024673461914, "global_step": 36687, "epoch": 873} {"train_loss": -5.491880416870117, "global_step": 36688, "epoch": 873} {"train_loss": -5.605171203613281, "global_step": 36689, "epoch": 873} {"train_loss": -5.580597877502441, "global_step": 36690, "epoch": 873} {"train_loss": -5.6602559089660645, "global_step": 36691, "epoch": 873} {"train_loss": -5.5108747482299805, "global_step": 36692, "epoch": 873} {"train_loss": -5.455999851226807, "global_step": 36693, "epoch": 873} {"train_loss": -5.703963756561279, "global_step": 36694, "epoch": 873} {"train_loss": -5.576480388641357, "global_step": 36695, "epoch": 873} {"train_loss": -5.548427104949951, "global_step": 36696, "epoch": 873} {"train_loss": -5.6726484298706055, "global_step": 36697, "epoch": 873} {"train_loss": -5.494148254394531, "global_step": 36698, "epoch": 873} {"train_loss": -5.645110607147217, "global_step": 36699, "epoch": 873} {"train_loss": -5.606781005859375, "global_step": 36700, "epoch": 873} {"train_loss": -5.580341339111328, "global_step": 36701, "epoch": 873} {"train_loss": -5.478257179260254, "global_step": 36702, "epoch": 873} {"train_loss": -5.5055646896362305, "global_step": 36703, "epoch": 873} {"train_loss": -5.603499889373779, "global_step": 36704, "epoch": 873} {"train_loss": -5.6196088790893555, "global_step": 36705, "epoch": 873} {"train_loss": -5.601661205291748, "global_step": 36706, "epoch": 873} {"train_loss": -5.580249729610625, "global_step": 36707, "epoch": 873, "val_loss": 62039.2578125} {"train_loss": -5.6037397384643555, "global_step": 36708, "epoch": 874} {"train_loss": -5.535869598388672, "global_step": 36709, "epoch": 874} {"train_loss": -5.674343109130859, "global_step": 36710, "epoch": 874} {"train_loss": -5.660277366638184, "global_step": 36711, "epoch": 874} {"train_loss": -5.574906349182129, "global_step": 36712, "epoch": 874} {"train_loss": -5.557485580444336, "global_step": 36713, "epoch": 874} {"train_loss": -5.532341957092285, "global_step": 36714, "epoch": 874} {"train_loss": -5.528650283813477, "global_step": 36715, "epoch": 874} {"train_loss": -5.528022766113281, "global_step": 36716, "epoch": 874} {"train_loss": -5.634499549865723, "global_step": 36717, "epoch": 874} {"train_loss": -5.539938926696777, "global_step": 36718, "epoch": 874} {"train_loss": -5.549167633056641, "global_step": 36719, "epoch": 874} {"train_loss": -5.558229446411133, "global_step": 36720, "epoch": 874} {"train_loss": -5.473616600036621, "global_step": 36721, "epoch": 874} {"train_loss": -5.593069076538086, "global_step": 36722, "epoch": 874} {"train_loss": -5.602817535400391, "global_step": 36723, "epoch": 874} {"train_loss": -5.501588821411133, "global_step": 36724, "epoch": 874} {"train_loss": -5.456577777862549, "global_step": 36725, "epoch": 874} {"train_loss": -5.4987568855285645, "global_step": 36726, "epoch": 874} {"train_loss": -5.59324312210083, "global_step": 36727, "epoch": 874} {"train_loss": -5.673032760620117, "global_step": 36728, "epoch": 874} {"train_loss": -5.540362358093262, "global_step": 36729, "epoch": 874} {"train_loss": -5.625279426574707, "global_step": 36730, "epoch": 874} {"train_loss": -5.588387966156006, "global_step": 36731, "epoch": 874} {"train_loss": -5.603046417236328, "global_step": 36732, "epoch": 874} {"train_loss": -5.588348865509033, "global_step": 36733, "epoch": 874} {"train_loss": -5.688824653625488, "global_step": 36734, "epoch": 874} {"train_loss": -5.654391765594482, "global_step": 36735, "epoch": 874} {"train_loss": -5.567968368530273, "global_step": 36736, "epoch": 874} {"train_loss": -5.557855606079102, "global_step": 36737, "epoch": 874} {"train_loss": -5.5473527908325195, "global_step": 36738, "epoch": 874} {"train_loss": -5.55573844909668, "global_step": 36739, "epoch": 874} {"train_loss": -5.480156898498535, "global_step": 36740, "epoch": 874} {"train_loss": -5.597085952758789, "global_step": 36741, "epoch": 874} {"train_loss": -5.534809112548828, "global_step": 36742, "epoch": 874} {"train_loss": -5.608393669128418, "global_step": 36743, "epoch": 874} {"train_loss": -5.5946736335754395, "global_step": 36744, "epoch": 874} {"train_loss": -5.541760444641113, "global_step": 36745, "epoch": 874} {"train_loss": -5.636055946350098, "global_step": 36746, "epoch": 874} {"train_loss": -5.575967311859131, "global_step": 36747, "epoch": 874} {"train_loss": -5.576292037963867, "global_step": 36748, "epoch": 874} {"train_loss": -5.576492320923578, "global_step": 36749, "epoch": 874, "val_loss": 61949.13671875} {"train_loss": -5.700730800628662, "global_step": 36750, "epoch": 875} {"train_loss": -5.608380317687988, "global_step": 36751, "epoch": 875} {"train_loss": -5.6811604499816895, "global_step": 36752, "epoch": 875} {"train_loss": -5.678223609924316, "global_step": 36753, "epoch": 875} {"train_loss": -5.565489768981934, "global_step": 36754, "epoch": 875} {"train_loss": -5.615793228149414, "global_step": 36755, "epoch": 875} {"train_loss": -5.613917827606201, "global_step": 36756, "epoch": 875} {"train_loss": -5.6251349449157715, "global_step": 36757, "epoch": 875} {"train_loss": -5.7296247482299805, "global_step": 36758, "epoch": 875} {"train_loss": -5.57567024230957, "global_step": 36759, "epoch": 875} {"train_loss": -5.663290977478027, "global_step": 36760, "epoch": 875} {"train_loss": -5.669776439666748, "global_step": 36761, "epoch": 875} {"train_loss": -5.4695024490356445, "global_step": 36762, "epoch": 875} {"train_loss": -5.644869804382324, "global_step": 36763, "epoch": 875} {"train_loss": -5.558838844299316, "global_step": 36764, "epoch": 875} {"train_loss": -5.640435695648193, "global_step": 36765, "epoch": 875} {"train_loss": -5.630789279937744, "global_step": 36766, "epoch": 875} {"train_loss": -5.6883463859558105, "global_step": 36767, "epoch": 875} {"train_loss": -5.502686023712158, "global_step": 36768, "epoch": 875} {"train_loss": -5.701413154602051, "global_step": 36769, "epoch": 875} {"train_loss": -5.606695175170898, "global_step": 36770, "epoch": 875} {"train_loss": -5.635995388031006, "global_step": 36771, "epoch": 875} {"train_loss": -5.4881672859191895, "global_step": 36772, "epoch": 875} {"train_loss": -5.556650161743164, "global_step": 36773, "epoch": 875} {"train_loss": -5.59821891784668, "global_step": 36774, "epoch": 875} {"train_loss": -5.494378089904785, "global_step": 36775, "epoch": 875} {"train_loss": -5.65093469619751, "global_step": 36776, "epoch": 875} {"train_loss": -5.608227729797363, "global_step": 36777, "epoch": 875} {"train_loss": -5.565550804138184, "global_step": 36778, "epoch": 875} {"train_loss": -5.5483717918396, "global_step": 36779, "epoch": 875} {"train_loss": -5.505136966705322, "global_step": 36780, "epoch": 875} {"train_loss": -5.532279014587402, "global_step": 36781, "epoch": 875} {"train_loss": -5.537154674530029, "global_step": 36782, "epoch": 875} {"train_loss": -5.494873046875, "global_step": 36783, "epoch": 875} {"train_loss": -5.5177106857299805, "global_step": 36784, "epoch": 875} {"train_loss": -5.593950271606445, "global_step": 36785, "epoch": 875} {"train_loss": -5.6288065910339355, "global_step": 36786, "epoch": 875} {"train_loss": -5.569518089294434, "global_step": 36787, "epoch": 875} {"train_loss": -5.620769023895264, "global_step": 36788, "epoch": 875} {"train_loss": -5.648687362670898, "global_step": 36789, "epoch": 875} {"train_loss": -5.476100444793701, "global_step": 36790, "epoch": 875} {"train_loss": -5.595053241366432, "global_step": 36791, "epoch": 875, "val_loss": 62343.85546875} {"train_loss": -5.568327903747559, "global_step": 36792, "epoch": 876} {"train_loss": -5.560462951660156, "global_step": 36793, "epoch": 876} {"train_loss": -5.52488374710083, "global_step": 36794, "epoch": 876} {"train_loss": -5.657353401184082, "global_step": 36795, "epoch": 876} {"train_loss": -5.535003662109375, "global_step": 36796, "epoch": 876} {"train_loss": -5.494935035705566, "global_step": 36797, "epoch": 876} {"train_loss": -5.542919158935547, "global_step": 36798, "epoch": 876} {"train_loss": -5.683225631713867, "global_step": 36799, "epoch": 876} {"train_loss": -5.501292705535889, "global_step": 36800, "epoch": 876} {"train_loss": -5.520330905914307, "global_step": 36801, "epoch": 876} {"train_loss": -5.6058125495910645, "global_step": 36802, "epoch": 876} {"train_loss": -5.513228416442871, "global_step": 36803, "epoch": 876} {"train_loss": -5.592263221740723, "global_step": 36804, "epoch": 876} {"train_loss": -5.637783050537109, "global_step": 36805, "epoch": 876} {"train_loss": -5.511096000671387, "global_step": 36806, "epoch": 876} {"train_loss": -5.682390213012695, "global_step": 36807, "epoch": 876} {"train_loss": -5.609035491943359, "global_step": 36808, "epoch": 876} {"train_loss": -5.513617515563965, "global_step": 36809, "epoch": 876} {"train_loss": -5.644753932952881, "global_step": 36810, "epoch": 876} {"train_loss": -5.733641624450684, "global_step": 36811, "epoch": 876} {"train_loss": -5.455998420715332, "global_step": 36812, "epoch": 876} {"train_loss": -5.626550674438477, "global_step": 36813, "epoch": 876} {"train_loss": -5.643999099731445, "global_step": 36814, "epoch": 876} {"train_loss": -5.580448150634766, "global_step": 36815, "epoch": 876} {"train_loss": -5.528575897216797, "global_step": 36816, "epoch": 876} {"train_loss": -5.634151458740234, "global_step": 36817, "epoch": 876} {"train_loss": -5.649938583374023, "global_step": 36818, "epoch": 876} {"train_loss": -5.500401496887207, "global_step": 36819, "epoch": 876} {"train_loss": -5.508352279663086, "global_step": 36820, "epoch": 876} {"train_loss": -5.698785781860352, "global_step": 36821, "epoch": 876} {"train_loss": -5.72062873840332, "global_step": 36822, "epoch": 876} {"train_loss": -5.634401321411133, "global_step": 36823, "epoch": 876} {"train_loss": -5.629313945770264, "global_step": 36824, "epoch": 876} {"train_loss": -5.640262603759766, "global_step": 36825, "epoch": 876} {"train_loss": -5.585947036743164, "global_step": 36826, "epoch": 876} {"train_loss": -5.47165584564209, "global_step": 36827, "epoch": 876} {"train_loss": -5.702915191650391, "global_step": 36828, "epoch": 876} {"train_loss": -5.496831893920898, "global_step": 36829, "epoch": 876} {"train_loss": -5.664621353149414, "global_step": 36830, "epoch": 876} {"train_loss": -5.6224822998046875, "global_step": 36831, "epoch": 876} {"train_loss": -5.675543785095215, "global_step": 36832, "epoch": 876} {"train_loss": -5.592605306988671, "global_step": 36833, "epoch": 876, "val_loss": 62251.29296875} {"train_loss": -5.624122619628906, "global_step": 36834, "epoch": 877} {"train_loss": -5.606910705566406, "global_step": 36835, "epoch": 877} {"train_loss": -5.687154293060303, "global_step": 36836, "epoch": 877} {"train_loss": -5.54963493347168, "global_step": 36837, "epoch": 877} {"train_loss": -5.519830703735352, "global_step": 36838, "epoch": 877} {"train_loss": -5.655855178833008, "global_step": 36839, "epoch": 877} {"train_loss": -5.665212154388428, "global_step": 36840, "epoch": 877} {"train_loss": -5.502083778381348, "global_step": 36841, "epoch": 877} {"train_loss": -5.638280391693115, "global_step": 36842, "epoch": 877} {"train_loss": -5.686042785644531, "global_step": 36843, "epoch": 877} {"train_loss": -5.630988121032715, "global_step": 36844, "epoch": 877} {"train_loss": -5.556102752685547, "global_step": 36845, "epoch": 877} {"train_loss": -5.495064735412598, "global_step": 36846, "epoch": 877} {"train_loss": -5.587301254272461, "global_step": 36847, "epoch": 877} {"train_loss": -5.603248596191406, "global_step": 36848, "epoch": 877} {"train_loss": -5.253665447235107, "global_step": 36849, "epoch": 877} {"train_loss": -5.57961368560791, "global_step": 36850, "epoch": 877} {"train_loss": -5.553360939025879, "global_step": 36851, "epoch": 877} {"train_loss": -5.430895805358887, "global_step": 36852, "epoch": 877} {"train_loss": -5.638680458068848, "global_step": 36853, "epoch": 877} {"train_loss": -5.562806606292725, "global_step": 36854, "epoch": 877} {"train_loss": -5.3421735763549805, "global_step": 36855, "epoch": 877} {"train_loss": -5.5672197341918945, "global_step": 36856, "epoch": 877} {"train_loss": -5.487114906311035, "global_step": 36857, "epoch": 877} {"train_loss": -5.637067794799805, "global_step": 36858, "epoch": 877} {"train_loss": -5.560687065124512, "global_step": 36859, "epoch": 877} {"train_loss": -5.607053756713867, "global_step": 36860, "epoch": 877} {"train_loss": -5.573423385620117, "global_step": 36861, "epoch": 877} {"train_loss": -5.638698101043701, "global_step": 36862, "epoch": 877} {"train_loss": -5.67119026184082, "global_step": 36863, "epoch": 877} {"train_loss": -5.588870048522949, "global_step": 36864, "epoch": 877} {"train_loss": -5.6318864822387695, "global_step": 36865, "epoch": 877} {"train_loss": -5.575143337249756, "global_step": 36866, "epoch": 877} {"train_loss": -5.645226001739502, "global_step": 36867, "epoch": 877} {"train_loss": -5.562657356262207, "global_step": 36868, "epoch": 877} {"train_loss": -5.737668514251709, "global_step": 36869, "epoch": 877} {"train_loss": -5.670392036437988, "global_step": 36870, "epoch": 877} {"train_loss": -5.537537574768066, "global_step": 36871, "epoch": 877} {"train_loss": -5.62000036239624, "global_step": 36872, "epoch": 877} {"train_loss": -5.616385459899902, "global_step": 36873, "epoch": 877} {"train_loss": -5.599784851074219, "global_step": 36874, "epoch": 877} {"train_loss": -5.580989553814843, "global_step": 36875, "epoch": 877, "val_loss": 61999.06640625} {"train_loss": -5.6153459548950195, "global_step": 36876, "epoch": 878} {"train_loss": -5.583722114562988, "global_step": 36877, "epoch": 878} {"train_loss": -5.5662946701049805, "global_step": 36878, "epoch": 878} {"train_loss": -5.59375524520874, "global_step": 36879, "epoch": 878} {"train_loss": -5.642553806304932, "global_step": 36880, "epoch": 878} {"train_loss": -5.575033664703369, "global_step": 36881, "epoch": 878} {"train_loss": -5.653989791870117, "global_step": 36882, "epoch": 878} {"train_loss": -5.806265830993652, "global_step": 36883, "epoch": 878} {"train_loss": -5.558889389038086, "global_step": 36884, "epoch": 878} {"train_loss": -5.647397518157959, "global_step": 36885, "epoch": 878} {"train_loss": -5.553794860839844, "global_step": 36886, "epoch": 878} {"train_loss": -5.5405120849609375, "global_step": 36887, "epoch": 878} {"train_loss": -5.669105529785156, "global_step": 36888, "epoch": 878} {"train_loss": -5.675390720367432, "global_step": 36889, "epoch": 878} {"train_loss": -5.625633239746094, "global_step": 36890, "epoch": 878} {"train_loss": -5.502202033996582, "global_step": 36891, "epoch": 878} {"train_loss": -5.65263557434082, "global_step": 36892, "epoch": 878} {"train_loss": -5.55059289932251, "global_step": 36893, "epoch": 878} {"train_loss": -5.742424964904785, "global_step": 36894, "epoch": 878} {"train_loss": -5.574278831481934, "global_step": 36895, "epoch": 878} {"train_loss": -5.611684799194336, "global_step": 36896, "epoch": 878} {"train_loss": -5.499211311340332, "global_step": 36897, "epoch": 878} {"train_loss": -5.542723655700684, "global_step": 36898, "epoch": 878} {"train_loss": -5.517653465270996, "global_step": 36899, "epoch": 878} {"train_loss": -5.7056169509887695, "global_step": 36900, "epoch": 878} {"train_loss": -5.656806945800781, "global_step": 36901, "epoch": 878} {"train_loss": -5.54918098449707, "global_step": 36902, "epoch": 878} {"train_loss": -5.675411701202393, "global_step": 36903, "epoch": 878} {"train_loss": -5.567863464355469, "global_step": 36904, "epoch": 878} {"train_loss": -5.625035762786865, "global_step": 36905, "epoch": 878} {"train_loss": -5.489487648010254, "global_step": 36906, "epoch": 878} {"train_loss": -5.643665313720703, "global_step": 36907, "epoch": 878} {"train_loss": -5.738303184509277, "global_step": 36908, "epoch": 878} {"train_loss": -5.580693244934082, "global_step": 36909, "epoch": 878} {"train_loss": -5.604579448699951, "global_step": 36910, "epoch": 878} {"train_loss": -5.651701927185059, "global_step": 36911, "epoch": 878} {"train_loss": -5.541319370269775, "global_step": 36912, "epoch": 878} {"train_loss": -5.525363922119141, "global_step": 36913, "epoch": 878} {"train_loss": -5.578859806060791, "global_step": 36914, "epoch": 878} {"train_loss": -5.423130989074707, "global_step": 36915, "epoch": 878} {"train_loss": -5.442919731140137, "global_step": 36916, "epoch": 878} {"train_loss": -5.596239521389916, "global_step": 36917, "epoch": 878, "val_loss": 62664.35546875} {"train_loss": -5.637557029724121, "global_step": 36918, "epoch": 879} {"train_loss": -5.642789840698242, "global_step": 36919, "epoch": 879} {"train_loss": -5.5604658126831055, "global_step": 36920, "epoch": 879} {"train_loss": -5.538532733917236, "global_step": 36921, "epoch": 879} {"train_loss": -5.633594512939453, "global_step": 36922, "epoch": 879} {"train_loss": -5.562694072723389, "global_step": 36923, "epoch": 879} {"train_loss": -5.629646301269531, "global_step": 36924, "epoch": 879} {"train_loss": -5.661764144897461, "global_step": 36925, "epoch": 879} {"train_loss": -5.609525680541992, "global_step": 36926, "epoch": 879} {"train_loss": -5.671241760253906, "global_step": 36927, "epoch": 879} {"train_loss": -5.569522380828857, "global_step": 36928, "epoch": 879} {"train_loss": -5.449721813201904, "global_step": 36929, "epoch": 879} {"train_loss": -5.641315937042236, "global_step": 36930, "epoch": 879} {"train_loss": -5.6478166580200195, "global_step": 36931, "epoch": 879} {"train_loss": -5.639131546020508, "global_step": 36932, "epoch": 879} {"train_loss": -5.661594390869141, "global_step": 36933, "epoch": 879} {"train_loss": -5.621993064880371, "global_step": 36934, "epoch": 879} {"train_loss": -5.581231117248535, "global_step": 36935, "epoch": 879} {"train_loss": -5.572392463684082, "global_step": 36936, "epoch": 879} {"train_loss": -5.6940155029296875, "global_step": 36937, "epoch": 879} {"train_loss": -5.554833889007568, "global_step": 36938, "epoch": 879} {"train_loss": -5.65431547164917, "global_step": 36939, "epoch": 879} {"train_loss": -5.53678035736084, "global_step": 36940, "epoch": 879} {"train_loss": -5.561698913574219, "global_step": 36941, "epoch": 879} {"train_loss": -5.543107032775879, "global_step": 36942, "epoch": 879} {"train_loss": -5.661060810089111, "global_step": 36943, "epoch": 879} {"train_loss": -5.699045181274414, "global_step": 36944, "epoch": 879} {"train_loss": -5.651958465576172, "global_step": 36945, "epoch": 879} {"train_loss": -5.672572135925293, "global_step": 36946, "epoch": 879} {"train_loss": -5.678990840911865, "global_step": 36947, "epoch": 879} {"train_loss": -5.61046028137207, "global_step": 36948, "epoch": 879} {"train_loss": -5.611639022827148, "global_step": 36949, "epoch": 879} {"train_loss": -5.6095733642578125, "global_step": 36950, "epoch": 879} {"train_loss": -5.517330169677734, "global_step": 36951, "epoch": 879} {"train_loss": -5.504737854003906, "global_step": 36952, "epoch": 879} {"train_loss": -5.541589736938477, "global_step": 36953, "epoch": 879} {"train_loss": -5.635406494140625, "global_step": 36954, "epoch": 879} {"train_loss": -5.510457992553711, "global_step": 36955, "epoch": 879} {"train_loss": -5.375273704528809, "global_step": 36956, "epoch": 879} {"train_loss": -5.671498775482178, "global_step": 36957, "epoch": 879} {"train_loss": -5.404717922210693, "global_step": 36958, "epoch": 879} {"train_loss": -5.598522924241566, "global_step": 36959, "epoch": 879, "val_loss": 62304.79296875} {"train_loss": -5.582247734069824, "global_step": 36960, "epoch": 880} {"train_loss": -5.4982452392578125, "global_step": 36961, "epoch": 880} {"train_loss": -5.689555644989014, "global_step": 36962, "epoch": 880} {"train_loss": -5.537217140197754, "global_step": 36963, "epoch": 880} {"train_loss": -5.607182502746582, "global_step": 36964, "epoch": 880} {"train_loss": -5.631504058837891, "global_step": 36965, "epoch": 880} {"train_loss": -5.523184776306152, "global_step": 36966, "epoch": 880} {"train_loss": -5.563554763793945, "global_step": 36967, "epoch": 880} {"train_loss": -5.520862579345703, "global_step": 36968, "epoch": 880} {"train_loss": -5.4149651527404785, "global_step": 36969, "epoch": 880} {"train_loss": -5.609864234924316, "global_step": 36970, "epoch": 880} {"train_loss": -5.489768981933594, "global_step": 36971, "epoch": 880} {"train_loss": -5.476820945739746, "global_step": 36972, "epoch": 880} {"train_loss": -5.641545295715332, "global_step": 36973, "epoch": 880} {"train_loss": -5.506340026855469, "global_step": 36974, "epoch": 880} {"train_loss": -5.6143293380737305, "global_step": 36975, "epoch": 880} {"train_loss": -5.564030647277832, "global_step": 36976, "epoch": 880} {"train_loss": -5.489319801330566, "global_step": 36977, "epoch": 880} {"train_loss": -5.651790142059326, "global_step": 36978, "epoch": 880} {"train_loss": -5.4978437423706055, "global_step": 36979, "epoch": 880} {"train_loss": -5.603333473205566, "global_step": 36980, "epoch": 880} {"train_loss": -5.541202068328857, "global_step": 36981, "epoch": 880} {"train_loss": -5.545843124389648, "global_step": 36982, "epoch": 880} {"train_loss": -5.540163040161133, "global_step": 36983, "epoch": 880} {"train_loss": -5.604430198669434, "global_step": 36984, "epoch": 880} {"train_loss": -5.770505428314209, "global_step": 36985, "epoch": 880} {"train_loss": -5.713046073913574, "global_step": 36986, "epoch": 880} {"train_loss": -5.469472885131836, "global_step": 36987, "epoch": 880} {"train_loss": -5.593812942504883, "global_step": 36988, "epoch": 880} {"train_loss": -5.517624855041504, "global_step": 36989, "epoch": 880} {"train_loss": -5.59124755859375, "global_step": 36990, "epoch": 880} {"train_loss": -5.612553596496582, "global_step": 36991, "epoch": 880} {"train_loss": -5.360549449920654, "global_step": 36992, "epoch": 880} {"train_loss": -5.533408164978027, "global_step": 36993, "epoch": 880} {"train_loss": -5.564297676086426, "global_step": 36994, "epoch": 880} {"train_loss": -5.6899094581604, "global_step": 36995, "epoch": 880} {"train_loss": -5.6773271560668945, "global_step": 36996, "epoch": 880} {"train_loss": -5.5863847732543945, "global_step": 36997, "epoch": 880} {"train_loss": -5.58189582824707, "global_step": 36998, "epoch": 880} {"train_loss": -5.513958930969238, "global_step": 36999, "epoch": 880} {"train_loss": -5.509957790374756, "global_step": 37000, "epoch": 880} {"train_loss": -5.567151273999896, "global_step": 37001, "epoch": 880, "val_loss": 62451.203125} {"train_loss": -5.524646759033203, "global_step": 37002, "epoch": 881} {"train_loss": -5.6900715827941895, "global_step": 37003, "epoch": 881} {"train_loss": -5.696345329284668, "global_step": 37004, "epoch": 881} {"train_loss": -5.627402305603027, "global_step": 37005, "epoch": 881} {"train_loss": -5.653937339782715, "global_step": 37006, "epoch": 881} {"train_loss": -5.71990966796875, "global_step": 37007, "epoch": 881} {"train_loss": -5.568370342254639, "global_step": 37008, "epoch": 881} {"train_loss": -5.688437461853027, "global_step": 37009, "epoch": 881} {"train_loss": -5.759304523468018, "global_step": 37010, "epoch": 881} {"train_loss": -5.760929107666016, "global_step": 37011, "epoch": 881} {"train_loss": -5.612131595611572, "global_step": 37012, "epoch": 881} {"train_loss": -5.541781902313232, "global_step": 37013, "epoch": 881} {"train_loss": -5.596275329589844, "global_step": 37014, "epoch": 881} {"train_loss": -5.515761375427246, "global_step": 37015, "epoch": 881} {"train_loss": -5.5811767578125, "global_step": 37016, "epoch": 881} {"train_loss": -5.705207824707031, "global_step": 37017, "epoch": 881} {"train_loss": -5.526576042175293, "global_step": 37018, "epoch": 881} {"train_loss": -5.658685684204102, "global_step": 37019, "epoch": 881} {"train_loss": -5.597521781921387, "global_step": 37020, "epoch": 881} {"train_loss": -5.553049564361572, "global_step": 37021, "epoch": 881} {"train_loss": -5.58746337890625, "global_step": 37022, "epoch": 881} {"train_loss": -5.701643943786621, "global_step": 37023, "epoch": 881} {"train_loss": -5.580552101135254, "global_step": 37024, "epoch": 881} {"train_loss": -5.606521129608154, "global_step": 37025, "epoch": 881} {"train_loss": -5.700469970703125, "global_step": 37026, "epoch": 881} {"train_loss": -5.581929683685303, "global_step": 37027, "epoch": 881} {"train_loss": -5.600970268249512, "global_step": 37028, "epoch": 881} {"train_loss": -5.584031581878662, "global_step": 37029, "epoch": 881} {"train_loss": -5.525349140167236, "global_step": 37030, "epoch": 881} {"train_loss": -5.682432174682617, "global_step": 37031, "epoch": 881} {"train_loss": -5.5419206619262695, "global_step": 37032, "epoch": 881} {"train_loss": -5.683001518249512, "global_step": 37033, "epoch": 881} {"train_loss": -5.401671886444092, "global_step": 37034, "epoch": 881} {"train_loss": -5.575407028198242, "global_step": 37035, "epoch": 881} {"train_loss": -5.473986625671387, "global_step": 37036, "epoch": 881} {"train_loss": -5.632088661193848, "global_step": 37037, "epoch": 881} {"train_loss": -5.473899841308594, "global_step": 37038, "epoch": 881} {"train_loss": -5.466580390930176, "global_step": 37039, "epoch": 881} {"train_loss": -5.633149147033691, "global_step": 37040, "epoch": 881} {"train_loss": -5.436058044433594, "global_step": 37041, "epoch": 881} {"train_loss": -5.606497764587402, "global_step": 37042, "epoch": 881} {"train_loss": -5.600733473187401, "global_step": 37043, "epoch": 881, "val_loss": 62234.16015625} {"train_loss": -5.6634626388549805, "global_step": 37044, "epoch": 882} {"train_loss": -5.689223289489746, "global_step": 37045, "epoch": 882} {"train_loss": -5.684606552124023, "global_step": 37046, "epoch": 882} {"train_loss": -5.4946746826171875, "global_step": 37047, "epoch": 882} {"train_loss": -5.648359775543213, "global_step": 37048, "epoch": 882} {"train_loss": -5.531549453735352, "global_step": 37049, "epoch": 882} {"train_loss": -5.5468902587890625, "global_step": 37050, "epoch": 882} {"train_loss": -5.5898823738098145, "global_step": 37051, "epoch": 882} {"train_loss": -5.480808258056641, "global_step": 37052, "epoch": 882} {"train_loss": -5.656951427459717, "global_step": 37053, "epoch": 882} {"train_loss": -5.538519859313965, "global_step": 37054, "epoch": 882} {"train_loss": -5.6197052001953125, "global_step": 37055, "epoch": 882} {"train_loss": -5.513375759124756, "global_step": 37056, "epoch": 882} {"train_loss": -5.558101654052734, "global_step": 37057, "epoch": 882} {"train_loss": -5.69356632232666, "global_step": 37058, "epoch": 882} {"train_loss": -5.7305169105529785, "global_step": 37059, "epoch": 882} {"train_loss": -5.621253967285156, "global_step": 37060, "epoch": 882} {"train_loss": -5.635293006896973, "global_step": 37061, "epoch": 882} {"train_loss": -5.539247989654541, "global_step": 37062, "epoch": 882} {"train_loss": -5.515715599060059, "global_step": 37063, "epoch": 882} {"train_loss": -5.526681423187256, "global_step": 37064, "epoch": 882} {"train_loss": -5.502567291259766, "global_step": 37065, "epoch": 882} {"train_loss": -5.563300609588623, "global_step": 37066, "epoch": 882} {"train_loss": -5.643965721130371, "global_step": 37067, "epoch": 882} {"train_loss": -5.633256435394287, "global_step": 37068, "epoch": 882} {"train_loss": -5.666798114776611, "global_step": 37069, "epoch": 882} {"train_loss": -5.657331466674805, "global_step": 37070, "epoch": 882} {"train_loss": -5.487428188323975, "global_step": 37071, "epoch": 882} {"train_loss": -5.649361610412598, "global_step": 37072, "epoch": 882} {"train_loss": -5.539782524108887, "global_step": 37073, "epoch": 882} {"train_loss": -5.575087547302246, "global_step": 37074, "epoch": 882} {"train_loss": -5.4881205558776855, "global_step": 37075, "epoch": 882} {"train_loss": -5.642123222351074, "global_step": 37076, "epoch": 882} {"train_loss": -5.571029186248779, "global_step": 37077, "epoch": 882} {"train_loss": -5.621102333068848, "global_step": 37078, "epoch": 882} {"train_loss": -5.547457218170166, "global_step": 37079, "epoch": 882} {"train_loss": -5.522711277008057, "global_step": 37080, "epoch": 882} {"train_loss": -5.605362415313721, "global_step": 37081, "epoch": 882} {"train_loss": -5.525381088256836, "global_step": 37082, "epoch": 882} {"train_loss": -5.500757217407227, "global_step": 37083, "epoch": 882} {"train_loss": -5.47212028503418, "global_step": 37084, "epoch": 882} {"train_loss": -5.57961554754348, "global_step": 37085, "epoch": 882, "val_loss": 62359.85546875} {"train_loss": -5.556416034698486, "global_step": 37086, "epoch": 883} {"train_loss": -5.558265209197998, "global_step": 37087, "epoch": 883} {"train_loss": -5.473182201385498, "global_step": 37088, "epoch": 883} {"train_loss": -5.624809265136719, "global_step": 37089, "epoch": 883} {"train_loss": -5.436466217041016, "global_step": 37090, "epoch": 883} {"train_loss": -5.425412654876709, "global_step": 37091, "epoch": 883} {"train_loss": -5.561465263366699, "global_step": 37092, "epoch": 883} {"train_loss": -5.512104034423828, "global_step": 37093, "epoch": 883} {"train_loss": -5.566100597381592, "global_step": 37094, "epoch": 883} {"train_loss": -5.623702049255371, "global_step": 37095, "epoch": 883} {"train_loss": -5.652416706085205, "global_step": 37096, "epoch": 883} {"train_loss": -5.657994270324707, "global_step": 37097, "epoch": 883} {"train_loss": -5.511329650878906, "global_step": 37098, "epoch": 883} {"train_loss": -5.702422142028809, "global_step": 37099, "epoch": 883} {"train_loss": -5.523700714111328, "global_step": 37100, "epoch": 883} {"train_loss": -5.7042107582092285, "global_step": 37101, "epoch": 883} {"train_loss": -5.539137840270996, "global_step": 37102, "epoch": 883} {"train_loss": -5.6089630126953125, "global_step": 37103, "epoch": 883} {"train_loss": -5.5845537185668945, "global_step": 37104, "epoch": 883} {"train_loss": -5.564164161682129, "global_step": 37105, "epoch": 883} {"train_loss": -5.5708537101745605, "global_step": 37106, "epoch": 883} {"train_loss": -5.675973892211914, "global_step": 37107, "epoch": 883} {"train_loss": -5.429293632507324, "global_step": 37108, "epoch": 883} {"train_loss": -5.5650177001953125, "global_step": 37109, "epoch": 883} {"train_loss": -5.54676628112793, "global_step": 37110, "epoch": 883} {"train_loss": -5.630568504333496, "global_step": 37111, "epoch": 883} {"train_loss": -5.518771171569824, "global_step": 37112, "epoch": 883} {"train_loss": -5.556434154510498, "global_step": 37113, "epoch": 883} {"train_loss": -5.634621620178223, "global_step": 37114, "epoch": 883} {"train_loss": -5.505453586578369, "global_step": 37115, "epoch": 883} {"train_loss": -5.63455867767334, "global_step": 37116, "epoch": 883} {"train_loss": -5.511099815368652, "global_step": 37117, "epoch": 883} {"train_loss": -5.546761512756348, "global_step": 37118, "epoch": 883} {"train_loss": -5.549120903015137, "global_step": 37119, "epoch": 883} {"train_loss": -5.5339460372924805, "global_step": 37120, "epoch": 883} {"train_loss": -5.583335876464844, "global_step": 37121, "epoch": 883} {"train_loss": -5.530047416687012, "global_step": 37122, "epoch": 883} {"train_loss": -5.604511737823486, "global_step": 37123, "epoch": 883} {"train_loss": -5.643612861633301, "global_step": 37124, "epoch": 883} {"train_loss": -5.465564727783203, "global_step": 37125, "epoch": 883} {"train_loss": -5.478768825531006, "global_step": 37126, "epoch": 883} {"train_loss": -5.568760576702299, "global_step": 37127, "epoch": 883, "val_loss": 62501.1875} {"train_loss": -5.628334045410156, "global_step": 37128, "epoch": 884} {"train_loss": -5.63031005859375, "global_step": 37129, "epoch": 884} {"train_loss": -5.61890983581543, "global_step": 37130, "epoch": 884} {"train_loss": -5.622584342956543, "global_step": 37131, "epoch": 884} {"train_loss": -5.598513603210449, "global_step": 37132, "epoch": 884} {"train_loss": -5.59468412399292, "global_step": 37133, "epoch": 884} {"train_loss": -5.49688196182251, "global_step": 37134, "epoch": 884} {"train_loss": -5.60589599609375, "global_step": 37135, "epoch": 884} {"train_loss": -5.690597057342529, "global_step": 37136, "epoch": 884} {"train_loss": -5.655305862426758, "global_step": 37137, "epoch": 884} {"train_loss": -5.658531188964844, "global_step": 37138, "epoch": 884} {"train_loss": -5.564266204833984, "global_step": 37139, "epoch": 884} {"train_loss": -5.690934658050537, "global_step": 37140, "epoch": 884} {"train_loss": -5.681303977966309, "global_step": 37141, "epoch": 884} {"train_loss": -5.643654823303223, "global_step": 37142, "epoch": 884} {"train_loss": -5.537014961242676, "global_step": 37143, "epoch": 884} {"train_loss": -5.684029579162598, "global_step": 37144, "epoch": 884} {"train_loss": -5.654740333557129, "global_step": 37145, "epoch": 884} {"train_loss": -5.516479015350342, "global_step": 37146, "epoch": 884} {"train_loss": -5.584637641906738, "global_step": 37147, "epoch": 884} {"train_loss": -5.633796691894531, "global_step": 37148, "epoch": 884} {"train_loss": -5.748165130615234, "global_step": 37149, "epoch": 884} {"train_loss": -5.596950531005859, "global_step": 37150, "epoch": 884} {"train_loss": -5.657721996307373, "global_step": 37151, "epoch": 884} {"train_loss": -5.519094467163086, "global_step": 37152, "epoch": 884} {"train_loss": -5.619061470031738, "global_step": 37153, "epoch": 884} {"train_loss": -5.671317100524902, "global_step": 37154, "epoch": 884} {"train_loss": -5.518221855163574, "global_step": 37155, "epoch": 884} {"train_loss": -5.6037726402282715, "global_step": 37156, "epoch": 884} {"train_loss": -5.493943691253662, "global_step": 37157, "epoch": 884} {"train_loss": -5.574406623840332, "global_step": 37158, "epoch": 884} {"train_loss": -5.585163116455078, "global_step": 37159, "epoch": 884} {"train_loss": -5.6159467697143555, "global_step": 37160, "epoch": 884} {"train_loss": -5.666866302490234, "global_step": 37161, "epoch": 884} {"train_loss": -5.631702423095703, "global_step": 37162, "epoch": 884} {"train_loss": -5.610088348388672, "global_step": 37163, "epoch": 884} {"train_loss": -5.661969184875488, "global_step": 37164, "epoch": 884} {"train_loss": -5.617520809173584, "global_step": 37165, "epoch": 884} {"train_loss": -5.4735107421875, "global_step": 37166, "epoch": 884} {"train_loss": -5.532732009887695, "global_step": 37167, "epoch": 884} {"train_loss": -5.505490303039551, "global_step": 37168, "epoch": 884} {"train_loss": -5.6048564456758045, "global_step": 37169, "epoch": 884, "val_loss": 61998.44921875} {"train_loss": -5.588056564331055, "global_step": 37170, "epoch": 885} {"train_loss": -5.467564105987549, "global_step": 37171, "epoch": 885} {"train_loss": -5.559243202209473, "global_step": 37172, "epoch": 885} {"train_loss": -5.499814033508301, "global_step": 37173, "epoch": 885} {"train_loss": -5.466328144073486, "global_step": 37174, "epoch": 885} {"train_loss": -5.66961145401001, "global_step": 37175, "epoch": 885} {"train_loss": -5.5630903244018555, "global_step": 37176, "epoch": 885} {"train_loss": -5.591302394866943, "global_step": 37177, "epoch": 885} {"train_loss": -5.551779747009277, "global_step": 37178, "epoch": 885} {"train_loss": -5.614266395568848, "global_step": 37179, "epoch": 885} {"train_loss": -5.715478420257568, "global_step": 37180, "epoch": 885} {"train_loss": -5.584873676300049, "global_step": 37181, "epoch": 885} {"train_loss": -5.6432905197143555, "global_step": 37182, "epoch": 885} {"train_loss": -5.616341590881348, "global_step": 37183, "epoch": 885} {"train_loss": -5.63881778717041, "global_step": 37184, "epoch": 885} {"train_loss": -5.545116424560547, "global_step": 37185, "epoch": 885} {"train_loss": -5.7203264236450195, "global_step": 37186, "epoch": 885} {"train_loss": -5.620764255523682, "global_step": 37187, "epoch": 885} {"train_loss": -5.410297393798828, "global_step": 37188, "epoch": 885} {"train_loss": -5.652897357940674, "global_step": 37189, "epoch": 885} {"train_loss": -5.735306262969971, "global_step": 37190, "epoch": 885} {"train_loss": -5.62649393081665, "global_step": 37191, "epoch": 885} {"train_loss": -5.553627967834473, "global_step": 37192, "epoch": 885} {"train_loss": -5.557323455810547, "global_step": 37193, "epoch": 885} {"train_loss": -5.6476240158081055, "global_step": 37194, "epoch": 885} {"train_loss": -5.590327262878418, "global_step": 37195, "epoch": 885} {"train_loss": -5.539671421051025, "global_step": 37196, "epoch": 885} {"train_loss": -5.58866548538208, "global_step": 37197, "epoch": 885} {"train_loss": -5.607826232910156, "global_step": 37198, "epoch": 885} {"train_loss": -5.636468887329102, "global_step": 37199, "epoch": 885} {"train_loss": -5.625019550323486, "global_step": 37200, "epoch": 885} {"train_loss": -5.625370025634766, "global_step": 37201, "epoch": 885} {"train_loss": -5.616565704345703, "global_step": 37202, "epoch": 885} {"train_loss": -5.58344841003418, "global_step": 37203, "epoch": 885} {"train_loss": -5.584033966064453, "global_step": 37204, "epoch": 885} {"train_loss": -5.516063213348389, "global_step": 37205, "epoch": 885} {"train_loss": -5.594625473022461, "global_step": 37206, "epoch": 885} {"train_loss": -5.587609767913818, "global_step": 37207, "epoch": 885} {"train_loss": -5.580375671386719, "global_step": 37208, "epoch": 885} {"train_loss": -5.657470703125, "global_step": 37209, "epoch": 885} {"train_loss": -5.54049015045166, "global_step": 37210, "epoch": 885} {"train_loss": -5.59326620328994, "global_step": 37211, "epoch": 885, "val_loss": 62140.06640625} {"train_loss": -5.4643473625183105, "global_step": 37212, "epoch": 886} {"train_loss": -5.691420078277588, "global_step": 37213, "epoch": 886} {"train_loss": -5.558653831481934, "global_step": 37214, "epoch": 886} {"train_loss": -5.5787224769592285, "global_step": 37215, "epoch": 886} {"train_loss": -5.693305015563965, "global_step": 37216, "epoch": 886} {"train_loss": -5.558437347412109, "global_step": 37217, "epoch": 886} {"train_loss": -5.575135231018066, "global_step": 37218, "epoch": 886} {"train_loss": -5.5445098876953125, "global_step": 37219, "epoch": 886} {"train_loss": -5.497690200805664, "global_step": 37220, "epoch": 886} {"train_loss": -5.6510138511657715, "global_step": 37221, "epoch": 886} {"train_loss": -5.712673664093018, "global_step": 37222, "epoch": 886} {"train_loss": -5.597833633422852, "global_step": 37223, "epoch": 886} {"train_loss": -5.533016204833984, "global_step": 37224, "epoch": 886} {"train_loss": -5.68095588684082, "global_step": 37225, "epoch": 886} {"train_loss": -5.733997344970703, "global_step": 37226, "epoch": 886} {"train_loss": -5.670219421386719, "global_step": 37227, "epoch": 886} {"train_loss": -5.560446739196777, "global_step": 37228, "epoch": 886} {"train_loss": -5.462485313415527, "global_step": 37229, "epoch": 886} {"train_loss": -5.637458324432373, "global_step": 37230, "epoch": 886} {"train_loss": -5.593904972076416, "global_step": 37231, "epoch": 886} {"train_loss": -5.59432315826416, "global_step": 37232, "epoch": 886} {"train_loss": -5.606910228729248, "global_step": 37233, "epoch": 886} {"train_loss": -5.550968647003174, "global_step": 37234, "epoch": 886} {"train_loss": -5.644187927246094, "global_step": 37235, "epoch": 886} {"train_loss": -5.555877208709717, "global_step": 37236, "epoch": 886} {"train_loss": -5.714455604553223, "global_step": 37237, "epoch": 886} {"train_loss": -5.65284538269043, "global_step": 37238, "epoch": 886} {"train_loss": -5.741340637207031, "global_step": 37239, "epoch": 886} {"train_loss": -5.621549606323242, "global_step": 37240, "epoch": 886} {"train_loss": -5.596978187561035, "global_step": 37241, "epoch": 886} {"train_loss": -5.582292556762695, "global_step": 37242, "epoch": 886} {"train_loss": -5.747939109802246, "global_step": 37243, "epoch": 886} {"train_loss": -5.674829006195068, "global_step": 37244, "epoch": 886} {"train_loss": -5.834178447723389, "global_step": 37245, "epoch": 886} {"train_loss": -5.561559677124023, "global_step": 37246, "epoch": 886} {"train_loss": -5.582039833068848, "global_step": 37247, "epoch": 886} {"train_loss": -5.622091770172119, "global_step": 37248, "epoch": 886} {"train_loss": -5.458356857299805, "global_step": 37249, "epoch": 886} {"train_loss": -5.648320198059082, "global_step": 37250, "epoch": 886} {"train_loss": -5.6851983070373535, "global_step": 37251, "epoch": 886} {"train_loss": -5.498211860656738, "global_step": 37252, "epoch": 886} {"train_loss": -5.612884249005999, "global_step": 37253, "epoch": 886, "val_loss": 62249.87109375} {"train_loss": -5.531566143035889, "global_step": 37254, "epoch": 887} {"train_loss": -5.571384906768799, "global_step": 37255, "epoch": 887} {"train_loss": -5.726558685302734, "global_step": 37256, "epoch": 887} {"train_loss": -5.55754280090332, "global_step": 37257, "epoch": 887} {"train_loss": -5.529034614562988, "global_step": 37258, "epoch": 887} {"train_loss": -5.571317672729492, "global_step": 37259, "epoch": 887} {"train_loss": -5.687232971191406, "global_step": 37260, "epoch": 887} {"train_loss": -5.647952556610107, "global_step": 37261, "epoch": 887} {"train_loss": -5.604704856872559, "global_step": 37262, "epoch": 887} {"train_loss": -5.605296611785889, "global_step": 37263, "epoch": 887} {"train_loss": -5.644365310668945, "global_step": 37264, "epoch": 887} {"train_loss": -5.694156646728516, "global_step": 37265, "epoch": 887} {"train_loss": -5.6469902992248535, "global_step": 37266, "epoch": 887} {"train_loss": -5.508586883544922, "global_step": 37267, "epoch": 887} {"train_loss": -5.624527454376221, "global_step": 37268, "epoch": 887} {"train_loss": -5.671677589416504, "global_step": 37269, "epoch": 887} {"train_loss": -5.608587265014648, "global_step": 37270, "epoch": 887} {"train_loss": -5.499152183532715, "global_step": 37271, "epoch": 887} {"train_loss": -5.643500328063965, "global_step": 37272, "epoch": 887} {"train_loss": -5.622208118438721, "global_step": 37273, "epoch": 887} {"train_loss": -5.52189826965332, "global_step": 37274, "epoch": 887} {"train_loss": -5.655684947967529, "global_step": 37275, "epoch": 887} {"train_loss": -5.631833076477051, "global_step": 37276, "epoch": 887} {"train_loss": -5.663193702697754, "global_step": 37277, "epoch": 887} {"train_loss": -5.706912994384766, "global_step": 37278, "epoch": 887} {"train_loss": -5.5384016036987305, "global_step": 37279, "epoch": 887} {"train_loss": -5.550451278686523, "global_step": 37280, "epoch": 887} {"train_loss": -5.644768714904785, "global_step": 37281, "epoch": 887} {"train_loss": -5.642407417297363, "global_step": 37282, "epoch": 887} {"train_loss": -5.494119644165039, "global_step": 37283, "epoch": 887} {"train_loss": -5.501589775085449, "global_step": 37284, "epoch": 887} {"train_loss": -5.539237022399902, "global_step": 37285, "epoch": 887} {"train_loss": -5.481268882751465, "global_step": 37286, "epoch": 887} {"train_loss": -5.578396797180176, "global_step": 37287, "epoch": 887} {"train_loss": -5.552829742431641, "global_step": 37288, "epoch": 887} {"train_loss": -5.69886589050293, "global_step": 37289, "epoch": 887} {"train_loss": -5.6549906730651855, "global_step": 37290, "epoch": 887} {"train_loss": -5.621777534484863, "global_step": 37291, "epoch": 887} {"train_loss": -5.633889675140381, "global_step": 37292, "epoch": 887} {"train_loss": -5.470657825469971, "global_step": 37293, "epoch": 887} {"train_loss": -5.710607528686523, "global_step": 37294, "epoch": 887} {"train_loss": -5.602512836456299, "global_step": 37295, "epoch": 887, "val_loss": 61974.0390625} {"train_loss": -5.551662445068359, "global_step": 37296, "epoch": 888} {"train_loss": -5.517983436584473, "global_step": 37297, "epoch": 888} {"train_loss": -5.488167762756348, "global_step": 37298, "epoch": 888} {"train_loss": -5.678572177886963, "global_step": 37299, "epoch": 888} {"train_loss": -5.504385948181152, "global_step": 37300, "epoch": 888} {"train_loss": -5.443656921386719, "global_step": 37301, "epoch": 888} {"train_loss": -5.581813812255859, "global_step": 37302, "epoch": 888} {"train_loss": -5.565694808959961, "global_step": 37303, "epoch": 888} {"train_loss": -5.565682888031006, "global_step": 37304, "epoch": 888} {"train_loss": -5.585033416748047, "global_step": 37305, "epoch": 888} {"train_loss": -5.618685245513916, "global_step": 37306, "epoch": 888} {"train_loss": -5.576699256896973, "global_step": 37307, "epoch": 888} {"train_loss": -5.453683376312256, "global_step": 37308, "epoch": 888} {"train_loss": -5.591681957244873, "global_step": 37309, "epoch": 888} {"train_loss": -5.5272088050842285, "global_step": 37310, "epoch": 888} {"train_loss": -5.502139568328857, "global_step": 37311, "epoch": 888} {"train_loss": -5.606918811798096, "global_step": 37312, "epoch": 888} {"train_loss": -5.472555160522461, "global_step": 37313, "epoch": 888} {"train_loss": -5.541518688201904, "global_step": 37314, "epoch": 888} {"train_loss": -5.507409572601318, "global_step": 37315, "epoch": 888} {"train_loss": -5.535438060760498, "global_step": 37316, "epoch": 888} {"train_loss": -5.640776634216309, "global_step": 37317, "epoch": 888} {"train_loss": -5.53281307220459, "global_step": 37318, "epoch": 888} {"train_loss": -5.595078468322754, "global_step": 37319, "epoch": 888} {"train_loss": -5.645131587982178, "global_step": 37320, "epoch": 888} {"train_loss": -5.543156623840332, "global_step": 37321, "epoch": 888} {"train_loss": -5.641007423400879, "global_step": 37322, "epoch": 888} {"train_loss": -5.513495445251465, "global_step": 37323, "epoch": 888} {"train_loss": -5.591829776763916, "global_step": 37324, "epoch": 888} {"train_loss": -5.6664838790893555, "global_step": 37325, "epoch": 888} {"train_loss": -5.6203999519348145, "global_step": 37326, "epoch": 888} {"train_loss": -5.670053005218506, "global_step": 37327, "epoch": 888} {"train_loss": -5.63702392578125, "global_step": 37328, "epoch": 888} {"train_loss": -5.638614177703857, "global_step": 37329, "epoch": 888} {"train_loss": -5.704469680786133, "global_step": 37330, "epoch": 888} {"train_loss": -5.610383987426758, "global_step": 37331, "epoch": 888} {"train_loss": -5.597141265869141, "global_step": 37332, "epoch": 888} {"train_loss": -5.659902095794678, "global_step": 37333, "epoch": 888} {"train_loss": -5.570469379425049, "global_step": 37334, "epoch": 888} {"train_loss": -5.40938663482666, "global_step": 37335, "epoch": 888} {"train_loss": -5.564350128173828, "global_step": 37336, "epoch": 888} {"train_loss": -5.5726660660334995, "global_step": 37337, "epoch": 888, "val_loss": 62648.10546875} {"train_loss": -5.422680854797363, "global_step": 37338, "epoch": 889} {"train_loss": -5.5952301025390625, "global_step": 37339, "epoch": 889} {"train_loss": -5.719429969787598, "global_step": 37340, "epoch": 889} {"train_loss": -5.45269250869751, "global_step": 37341, "epoch": 889} {"train_loss": -5.655876159667969, "global_step": 37342, "epoch": 889} {"train_loss": -5.460495948791504, "global_step": 37343, "epoch": 889} {"train_loss": -5.638130187988281, "global_step": 37344, "epoch": 889} {"train_loss": -5.600643157958984, "global_step": 37345, "epoch": 889} {"train_loss": -5.706292152404785, "global_step": 37346, "epoch": 889} {"train_loss": -5.623015403747559, "global_step": 37347, "epoch": 889} {"train_loss": -5.732534408569336, "global_step": 37348, "epoch": 889} {"train_loss": -5.526553153991699, "global_step": 37349, "epoch": 889} {"train_loss": -5.659292221069336, "global_step": 37350, "epoch": 889} {"train_loss": -5.571223735809326, "global_step": 37351, "epoch": 889} {"train_loss": -5.727400302886963, "global_step": 37352, "epoch": 889} {"train_loss": -5.5654296875, "global_step": 37353, "epoch": 889} {"train_loss": -5.511874198913574, "global_step": 37354, "epoch": 889} {"train_loss": -5.501743316650391, "global_step": 37355, "epoch": 889} {"train_loss": -5.540031433105469, "global_step": 37356, "epoch": 889} {"train_loss": -5.641493320465088, "global_step": 37357, "epoch": 889} {"train_loss": -5.435094833374023, "global_step": 37358, "epoch": 889} {"train_loss": -5.548539161682129, "global_step": 37359, "epoch": 889} {"train_loss": -5.645761489868164, "global_step": 37360, "epoch": 889} {"train_loss": -5.705803871154785, "global_step": 37361, "epoch": 889} {"train_loss": -5.644054889678955, "global_step": 37362, "epoch": 889} {"train_loss": -5.600351333618164, "global_step": 37363, "epoch": 889} {"train_loss": -5.515052318572998, "global_step": 37364, "epoch": 889} {"train_loss": -5.5385589599609375, "global_step": 37365, "epoch": 889} {"train_loss": -5.58094596862793, "global_step": 37366, "epoch": 889} {"train_loss": -5.689975738525391, "global_step": 37367, "epoch": 889} {"train_loss": -5.7405900955200195, "global_step": 37368, "epoch": 889} {"train_loss": -5.576656341552734, "global_step": 37369, "epoch": 889} {"train_loss": -5.590902328491211, "global_step": 37370, "epoch": 889} {"train_loss": -5.728063106536865, "global_step": 37371, "epoch": 889} {"train_loss": -5.605542182922363, "global_step": 37372, "epoch": 889} {"train_loss": -5.670248985290527, "global_step": 37373, "epoch": 889} {"train_loss": -5.585748672485352, "global_step": 37374, "epoch": 889} {"train_loss": -5.538264751434326, "global_step": 37375, "epoch": 889} {"train_loss": -5.6007208824157715, "global_step": 37376, "epoch": 889} {"train_loss": -5.631838798522949, "global_step": 37377, "epoch": 889} {"train_loss": -5.642054557800293, "global_step": 37378, "epoch": 889} {"train_loss": -5.600589082354591, "global_step": 37379, "epoch": 889, "val_loss": 62268.70703125} {"train_loss": -5.604088306427002, "global_step": 37380, "epoch": 890} {"train_loss": -5.526749610900879, "global_step": 37381, "epoch": 890} {"train_loss": -5.53691291809082, "global_step": 37382, "epoch": 890} {"train_loss": -5.610475540161133, "global_step": 37383, "epoch": 890} {"train_loss": -5.491948127746582, "global_step": 37384, "epoch": 890} {"train_loss": -5.589940071105957, "global_step": 37385, "epoch": 890} {"train_loss": -5.7445831298828125, "global_step": 37386, "epoch": 890} {"train_loss": -5.515239715576172, "global_step": 37387, "epoch": 890} {"train_loss": -5.662006378173828, "global_step": 37388, "epoch": 890} {"train_loss": -5.678380012512207, "global_step": 37389, "epoch": 890} {"train_loss": -5.627917766571045, "global_step": 37390, "epoch": 890} {"train_loss": -5.618514537811279, "global_step": 37391, "epoch": 890} {"train_loss": -5.516315937042236, "global_step": 37392, "epoch": 890} {"train_loss": -5.696723937988281, "global_step": 37393, "epoch": 890} {"train_loss": -5.51289701461792, "global_step": 37394, "epoch": 890} {"train_loss": -5.5975847244262695, "global_step": 37395, "epoch": 890} {"train_loss": -5.584662914276123, "global_step": 37396, "epoch": 890} {"train_loss": -5.519754409790039, "global_step": 37397, "epoch": 890} {"train_loss": -5.776954650878906, "global_step": 37398, "epoch": 890} {"train_loss": -5.556515693664551, "global_step": 37399, "epoch": 890} {"train_loss": -5.77168083190918, "global_step": 37400, "epoch": 890} {"train_loss": -5.574953556060791, "global_step": 37401, "epoch": 890} {"train_loss": -5.64632511138916, "global_step": 37402, "epoch": 890} {"train_loss": -5.607820510864258, "global_step": 37403, "epoch": 890} {"train_loss": -5.59292459487915, "global_step": 37404, "epoch": 890} {"train_loss": -5.71185302734375, "global_step": 37405, "epoch": 890} {"train_loss": -5.4914445877075195, "global_step": 37406, "epoch": 890} {"train_loss": -5.574739456176758, "global_step": 37407, "epoch": 890} {"train_loss": -5.526198387145996, "global_step": 37408, "epoch": 890} {"train_loss": -5.657315254211426, "global_step": 37409, "epoch": 890} {"train_loss": -5.674205780029297, "global_step": 37410, "epoch": 890} {"train_loss": -5.474925994873047, "global_step": 37411, "epoch": 890} {"train_loss": -5.554431915283203, "global_step": 37412, "epoch": 890} {"train_loss": -5.503275394439697, "global_step": 37413, "epoch": 890} {"train_loss": -5.654378890991211, "global_step": 37414, "epoch": 890} {"train_loss": -5.683752536773682, "global_step": 37415, "epoch": 890} {"train_loss": -5.581292152404785, "global_step": 37416, "epoch": 890} {"train_loss": -5.738091468811035, "global_step": 37417, "epoch": 890} {"train_loss": -5.795830726623535, "global_step": 37418, "epoch": 890} {"train_loss": -5.5120086669921875, "global_step": 37419, "epoch": 890} {"train_loss": -5.592505931854248, "global_step": 37420, "epoch": 890} {"train_loss": -5.608971084867205, "global_step": 37421, "epoch": 890, "val_loss": 62186.89453125} {"train_loss": -5.565241813659668, "global_step": 37422, "epoch": 891} {"train_loss": -5.5775651931762695, "global_step": 37423, "epoch": 891} {"train_loss": -5.510087966918945, "global_step": 37424, "epoch": 891} {"train_loss": -5.516883850097656, "global_step": 37425, "epoch": 891} {"train_loss": -5.6885809898376465, "global_step": 37426, "epoch": 891} {"train_loss": -5.466848850250244, "global_step": 37427, "epoch": 891} {"train_loss": -5.453138828277588, "global_step": 37428, "epoch": 891} {"train_loss": -5.722429275512695, "global_step": 37429, "epoch": 891} {"train_loss": -5.622906684875488, "global_step": 37430, "epoch": 891} {"train_loss": -5.5535149574279785, "global_step": 37431, "epoch": 891} {"train_loss": -5.690149784088135, "global_step": 37432, "epoch": 891} {"train_loss": -5.564033508300781, "global_step": 37433, "epoch": 891} {"train_loss": -5.623570442199707, "global_step": 37434, "epoch": 891} {"train_loss": -5.5913496017456055, "global_step": 37435, "epoch": 891} {"train_loss": -5.619894027709961, "global_step": 37436, "epoch": 891} {"train_loss": -5.610768795013428, "global_step": 37437, "epoch": 891} {"train_loss": -5.537221431732178, "global_step": 37438, "epoch": 891} {"train_loss": -5.747443199157715, "global_step": 37439, "epoch": 891} {"train_loss": -5.651694297790527, "global_step": 37440, "epoch": 891} {"train_loss": -5.740001201629639, "global_step": 37441, "epoch": 891} {"train_loss": -5.597341537475586, "global_step": 37442, "epoch": 891} {"train_loss": -5.723407745361328, "global_step": 37443, "epoch": 891} {"train_loss": -5.527053356170654, "global_step": 37444, "epoch": 891} {"train_loss": -5.659377098083496, "global_step": 37445, "epoch": 891} {"train_loss": -5.6139397621154785, "global_step": 37446, "epoch": 891} {"train_loss": -5.660063743591309, "global_step": 37447, "epoch": 891} {"train_loss": -5.67714786529541, "global_step": 37448, "epoch": 891} {"train_loss": -5.667076110839844, "global_step": 37449, "epoch": 891} {"train_loss": -5.581609725952148, "global_step": 37450, "epoch": 891} {"train_loss": -5.614355564117432, "global_step": 37451, "epoch": 891} {"train_loss": -5.667491436004639, "global_step": 37452, "epoch": 891} {"train_loss": -5.550466060638428, "global_step": 37453, "epoch": 891} {"train_loss": -5.567257881164551, "global_step": 37454, "epoch": 891} {"train_loss": -5.526087760925293, "global_step": 37455, "epoch": 891} {"train_loss": -5.48322868347168, "global_step": 37456, "epoch": 891} {"train_loss": -5.691042423248291, "global_step": 37457, "epoch": 891} {"train_loss": -5.59251070022583, "global_step": 37458, "epoch": 891} {"train_loss": -5.579110145568848, "global_step": 37459, "epoch": 891} {"train_loss": -5.596521377563477, "global_step": 37460, "epoch": 891} {"train_loss": -5.60344934463501, "global_step": 37461, "epoch": 891} {"train_loss": -5.666958332061768, "global_step": 37462, "epoch": 891} {"train_loss": -5.607241585141137, "global_step": 37463, "epoch": 891, "val_loss": 61893.484375} {"train_loss": -5.644425868988037, "global_step": 37464, "epoch": 892} {"train_loss": -5.741832733154297, "global_step": 37465, "epoch": 892} {"train_loss": -5.652693748474121, "global_step": 37466, "epoch": 892} {"train_loss": -5.734397888183594, "global_step": 37467, "epoch": 892} {"train_loss": -5.555143356323242, "global_step": 37468, "epoch": 892} {"train_loss": -5.720024108886719, "global_step": 37469, "epoch": 892} {"train_loss": -5.711084365844727, "global_step": 37470, "epoch": 892} {"train_loss": -5.481784820556641, "global_step": 37471, "epoch": 892} {"train_loss": -5.58742618560791, "global_step": 37472, "epoch": 892} {"train_loss": -5.626613616943359, "global_step": 37473, "epoch": 892} {"train_loss": -5.729153633117676, "global_step": 37474, "epoch": 892} {"train_loss": -5.559114456176758, "global_step": 37475, "epoch": 892} {"train_loss": -5.571357250213623, "global_step": 37476, "epoch": 892} {"train_loss": -5.538387298583984, "global_step": 37477, "epoch": 892} {"train_loss": -5.683473110198975, "global_step": 37478, "epoch": 892} {"train_loss": -5.41928243637085, "global_step": 37479, "epoch": 892} {"train_loss": -5.5352277755737305, "global_step": 37480, "epoch": 892} {"train_loss": -5.648342132568359, "global_step": 37481, "epoch": 892} {"train_loss": -5.678005218505859, "global_step": 37482, "epoch": 892} {"train_loss": -5.678997039794922, "global_step": 37483, "epoch": 892} {"train_loss": -5.625313758850098, "global_step": 37484, "epoch": 892} {"train_loss": -5.64335823059082, "global_step": 37485, "epoch": 892} {"train_loss": -5.625561237335205, "global_step": 37486, "epoch": 892} {"train_loss": -5.504105091094971, "global_step": 37487, "epoch": 892} {"train_loss": -5.620933532714844, "global_step": 37488, "epoch": 892} {"train_loss": -5.577264785766602, "global_step": 37489, "epoch": 892} {"train_loss": -5.505685806274414, "global_step": 37490, "epoch": 892} {"train_loss": -5.801464080810547, "global_step": 37491, "epoch": 892} {"train_loss": -5.609781265258789, "global_step": 37492, "epoch": 892} {"train_loss": -5.503930568695068, "global_step": 37493, "epoch": 892} {"train_loss": -5.478531837463379, "global_step": 37494, "epoch": 892} {"train_loss": -5.633814334869385, "global_step": 37495, "epoch": 892} {"train_loss": -5.6451416015625, "global_step": 37496, "epoch": 892} {"train_loss": -5.598236560821533, "global_step": 37497, "epoch": 892} {"train_loss": -5.608786582946777, "global_step": 37498, "epoch": 892} {"train_loss": -5.605737209320068, "global_step": 37499, "epoch": 892} {"train_loss": -5.648434638977051, "global_step": 37500, "epoch": 892} {"train_loss": -5.603641033172607, "global_step": 37501, "epoch": 892} {"train_loss": -5.7137908935546875, "global_step": 37502, "epoch": 892} {"train_loss": -5.67989444732666, "global_step": 37503, "epoch": 892} {"train_loss": -5.547616004943848, "global_step": 37504, "epoch": 892} {"train_loss": -5.615720941906884, "global_step": 37505, "epoch": 892, "val_loss": 62100.46875} {"train_loss": -5.650330066680908, "global_step": 37506, "epoch": 893} {"train_loss": -5.6465253829956055, "global_step": 37507, "epoch": 893} {"train_loss": -5.619452476501465, "global_step": 37508, "epoch": 893} {"train_loss": -5.55698299407959, "global_step": 37509, "epoch": 893} {"train_loss": -5.6752028465271, "global_step": 37510, "epoch": 893} {"train_loss": -5.631988525390625, "global_step": 37511, "epoch": 893} {"train_loss": -5.643856048583984, "global_step": 37512, "epoch": 893} {"train_loss": -5.527790069580078, "global_step": 37513, "epoch": 893} {"train_loss": -5.593262672424316, "global_step": 37514, "epoch": 893} {"train_loss": -5.593425750732422, "global_step": 37515, "epoch": 893} {"train_loss": -5.693098545074463, "global_step": 37516, "epoch": 893} {"train_loss": -5.617011070251465, "global_step": 37517, "epoch": 893} {"train_loss": -5.442195892333984, "global_step": 37518, "epoch": 893} {"train_loss": -5.528193473815918, "global_step": 37519, "epoch": 893} {"train_loss": -5.640132904052734, "global_step": 37520, "epoch": 893} {"train_loss": -5.4358978271484375, "global_step": 37521, "epoch": 893} {"train_loss": -5.438922882080078, "global_step": 37522, "epoch": 893} {"train_loss": -5.629086494445801, "global_step": 37523, "epoch": 893} {"train_loss": -5.5160369873046875, "global_step": 37524, "epoch": 893} {"train_loss": -5.455410003662109, "global_step": 37525, "epoch": 893} {"train_loss": -5.52127742767334, "global_step": 37526, "epoch": 893} {"train_loss": -5.661049842834473, "global_step": 37527, "epoch": 893} {"train_loss": -5.690611839294434, "global_step": 37528, "epoch": 893} {"train_loss": -5.494795799255371, "global_step": 37529, "epoch": 893} {"train_loss": -5.554786205291748, "global_step": 37530, "epoch": 893} {"train_loss": -5.553356170654297, "global_step": 37531, "epoch": 893} {"train_loss": -5.557070255279541, "global_step": 37532, "epoch": 893} {"train_loss": -5.569034576416016, "global_step": 37533, "epoch": 893} {"train_loss": -5.530696868896484, "global_step": 37534, "epoch": 893} {"train_loss": -5.562911033630371, "global_step": 37535, "epoch": 893} {"train_loss": -5.643595218658447, "global_step": 37536, "epoch": 893} {"train_loss": -5.472348213195801, "global_step": 37537, "epoch": 893} {"train_loss": -5.554769515991211, "global_step": 37538, "epoch": 893} {"train_loss": -5.581296920776367, "global_step": 37539, "epoch": 893} {"train_loss": -5.470473766326904, "global_step": 37540, "epoch": 893} {"train_loss": -5.723464488983154, "global_step": 37541, "epoch": 893} {"train_loss": -5.37483549118042, "global_step": 37542, "epoch": 893} {"train_loss": -5.391903877258301, "global_step": 37543, "epoch": 893} {"train_loss": -5.559937477111816, "global_step": 37544, "epoch": 893} {"train_loss": -5.525787353515625, "global_step": 37545, "epoch": 893} {"train_loss": -5.642228603363037, "global_step": 37546, "epoch": 893} {"train_loss": -5.5616942927950905, "global_step": 37547, "epoch": 893, "val_loss": 62297.6953125} {"train_loss": -5.482773780822754, "global_step": 37548, "epoch": 894} {"train_loss": -5.527681350708008, "global_step": 37549, "epoch": 894} {"train_loss": -5.643391132354736, "global_step": 37550, "epoch": 894} {"train_loss": -5.33073091506958, "global_step": 37551, "epoch": 894} {"train_loss": -5.587058067321777, "global_step": 37552, "epoch": 894} {"train_loss": -5.509439945220947, "global_step": 37553, "epoch": 894} {"train_loss": -5.490979194641113, "global_step": 37554, "epoch": 894} {"train_loss": -5.606348037719727, "global_step": 37555, "epoch": 894} {"train_loss": -5.690131187438965, "global_step": 37556, "epoch": 894} {"train_loss": -5.676671028137207, "global_step": 37557, "epoch": 894} {"train_loss": -5.465787887573242, "global_step": 37558, "epoch": 894} {"train_loss": -5.513150215148926, "global_step": 37559, "epoch": 894} {"train_loss": -5.804909706115723, "global_step": 37560, "epoch": 894} {"train_loss": -5.625370979309082, "global_step": 37561, "epoch": 894} {"train_loss": -5.588685989379883, "global_step": 37562, "epoch": 894} {"train_loss": -5.589099884033203, "global_step": 37563, "epoch": 894} {"train_loss": -5.556070804595947, "global_step": 37564, "epoch": 894} {"train_loss": -5.706234931945801, "global_step": 37565, "epoch": 894} {"train_loss": -5.614665985107422, "global_step": 37566, "epoch": 894} {"train_loss": -5.422056198120117, "global_step": 37567, "epoch": 894} {"train_loss": -5.522112846374512, "global_step": 37568, "epoch": 894} {"train_loss": -5.576944828033447, "global_step": 37569, "epoch": 894} {"train_loss": -5.588895797729492, "global_step": 37570, "epoch": 894} {"train_loss": -5.712589263916016, "global_step": 37571, "epoch": 894} {"train_loss": -5.696022033691406, "global_step": 37572, "epoch": 894} {"train_loss": -5.582598686218262, "global_step": 37573, "epoch": 894} {"train_loss": -5.608410835266113, "global_step": 37574, "epoch": 894} {"train_loss": -5.491612434387207, "global_step": 37575, "epoch": 894} {"train_loss": -5.486140251159668, "global_step": 37576, "epoch": 894} {"train_loss": -5.477397918701172, "global_step": 37577, "epoch": 894} {"train_loss": -5.473787307739258, "global_step": 37578, "epoch": 894} {"train_loss": -5.437893390655518, "global_step": 37579, "epoch": 894} {"train_loss": -5.640661239624023, "global_step": 37580, "epoch": 894} {"train_loss": -5.48917293548584, "global_step": 37581, "epoch": 894} {"train_loss": -5.547115325927734, "global_step": 37582, "epoch": 894} {"train_loss": -5.655138969421387, "global_step": 37583, "epoch": 894} {"train_loss": -5.471441745758057, "global_step": 37584, "epoch": 894} {"train_loss": -5.675644397735596, "global_step": 37585, "epoch": 894} {"train_loss": -5.555940628051758, "global_step": 37586, "epoch": 894} {"train_loss": -5.514315605163574, "global_step": 37587, "epoch": 894} {"train_loss": -5.526309013366699, "global_step": 37588, "epoch": 894} {"train_loss": -5.5660909698123024, "global_step": 37589, "epoch": 894, "val_loss": 62075.37890625} {"train_loss": -5.61952018737793, "global_step": 37590, "epoch": 895} {"train_loss": -5.602114200592041, "global_step": 37591, "epoch": 895} {"train_loss": -5.572210311889648, "global_step": 37592, "epoch": 895} {"train_loss": -5.5453782081604, "global_step": 37593, "epoch": 895} {"train_loss": -5.590633392333984, "global_step": 37594, "epoch": 895} {"train_loss": -5.567111492156982, "global_step": 37595, "epoch": 895} {"train_loss": -5.604711532592773, "global_step": 37596, "epoch": 895} {"train_loss": -5.604098320007324, "global_step": 37597, "epoch": 895} {"train_loss": -5.57033109664917, "global_step": 37598, "epoch": 895} {"train_loss": -5.503920555114746, "global_step": 37599, "epoch": 895} {"train_loss": -5.758591651916504, "global_step": 37600, "epoch": 895} {"train_loss": -5.554324150085449, "global_step": 37601, "epoch": 895} {"train_loss": -5.643813133239746, "global_step": 37602, "epoch": 895} {"train_loss": -5.615710258483887, "global_step": 37603, "epoch": 895} {"train_loss": -5.586270809173584, "global_step": 37604, "epoch": 895} {"train_loss": -5.545638561248779, "global_step": 37605, "epoch": 895} {"train_loss": -5.61743688583374, "global_step": 37606, "epoch": 895} {"train_loss": -5.634446144104004, "global_step": 37607, "epoch": 895} {"train_loss": -5.658944129943848, "global_step": 37608, "epoch": 895} {"train_loss": -5.535751819610596, "global_step": 37609, "epoch": 895} {"train_loss": -5.547196865081787, "global_step": 37610, "epoch": 895} {"train_loss": -5.569214820861816, "global_step": 37611, "epoch": 895} {"train_loss": -5.475864887237549, "global_step": 37612, "epoch": 895} {"train_loss": -5.629922866821289, "global_step": 37613, "epoch": 895} {"train_loss": -5.661338806152344, "global_step": 37614, "epoch": 895} {"train_loss": -5.637460708618164, "global_step": 37615, "epoch": 895} {"train_loss": -5.650755882263184, "global_step": 37616, "epoch": 895} {"train_loss": -5.608696937561035, "global_step": 37617, "epoch": 895} {"train_loss": -5.60258674621582, "global_step": 37618, "epoch": 895} {"train_loss": -5.6934003829956055, "global_step": 37619, "epoch": 895} {"train_loss": -5.815268516540527, "global_step": 37620, "epoch": 895} {"train_loss": -5.647573471069336, "global_step": 37621, "epoch": 895} {"train_loss": -5.646519660949707, "global_step": 37622, "epoch": 895} {"train_loss": -5.59251594543457, "global_step": 37623, "epoch": 895} {"train_loss": -5.634005069732666, "global_step": 37624, "epoch": 895} {"train_loss": -5.59916353225708, "global_step": 37625, "epoch": 895} {"train_loss": -5.643561840057373, "global_step": 37626, "epoch": 895} {"train_loss": -5.601315498352051, "global_step": 37627, "epoch": 895} {"train_loss": -5.6870598793029785, "global_step": 37628, "epoch": 895} {"train_loss": -5.687409400939941, "global_step": 37629, "epoch": 895} {"train_loss": -5.626316070556641, "global_step": 37630, "epoch": 895} {"train_loss": -5.6109454064142135, "global_step": 37631, "epoch": 895, "val_loss": 62219.2265625} {"train_loss": -5.643687725067139, "global_step": 37632, "epoch": 896} {"train_loss": -5.635209083557129, "global_step": 37633, "epoch": 896} {"train_loss": -5.697506904602051, "global_step": 37634, "epoch": 896} {"train_loss": -5.664763450622559, "global_step": 37635, "epoch": 896} {"train_loss": -5.623178958892822, "global_step": 37636, "epoch": 896} {"train_loss": -5.501816749572754, "global_step": 37637, "epoch": 896} {"train_loss": -5.609814643859863, "global_step": 37638, "epoch": 896} {"train_loss": -5.4494476318359375, "global_step": 37639, "epoch": 896} {"train_loss": -5.564544677734375, "global_step": 37640, "epoch": 896} {"train_loss": -5.5684614181518555, "global_step": 37641, "epoch": 896} {"train_loss": -5.594302177429199, "global_step": 37642, "epoch": 896} {"train_loss": -5.482454299926758, "global_step": 37643, "epoch": 896} {"train_loss": -5.530778408050537, "global_step": 37644, "epoch": 896} {"train_loss": -5.541501045227051, "global_step": 37645, "epoch": 896} {"train_loss": -5.588617324829102, "global_step": 37646, "epoch": 896} {"train_loss": -5.52707052230835, "global_step": 37647, "epoch": 896} {"train_loss": -5.50521183013916, "global_step": 37648, "epoch": 896} {"train_loss": -5.608735084533691, "global_step": 37649, "epoch": 896} {"train_loss": -5.648313045501709, "global_step": 37650, "epoch": 896} {"train_loss": -5.625359535217285, "global_step": 37651, "epoch": 896} {"train_loss": -5.5225067138671875, "global_step": 37652, "epoch": 896} {"train_loss": -5.730010509490967, "global_step": 37653, "epoch": 896} {"train_loss": -5.551172256469727, "global_step": 37654, "epoch": 896} {"train_loss": -5.6190185546875, "global_step": 37655, "epoch": 896} {"train_loss": -5.572091102600098, "global_step": 37656, "epoch": 896} {"train_loss": -5.60053825378418, "global_step": 37657, "epoch": 896} {"train_loss": -5.573272705078125, "global_step": 37658, "epoch": 896} {"train_loss": -5.570544242858887, "global_step": 37659, "epoch": 896} {"train_loss": -5.600275993347168, "global_step": 37660, "epoch": 896} {"train_loss": -5.472558975219727, "global_step": 37661, "epoch": 896} {"train_loss": -5.700834274291992, "global_step": 37662, "epoch": 896} {"train_loss": -5.535645484924316, "global_step": 37663, "epoch": 896} {"train_loss": -5.564022064208984, "global_step": 37664, "epoch": 896} {"train_loss": -5.635461807250977, "global_step": 37665, "epoch": 896} {"train_loss": -5.519381523132324, "global_step": 37666, "epoch": 896} {"train_loss": -5.435563087463379, "global_step": 37667, "epoch": 896} {"train_loss": -5.56093692779541, "global_step": 37668, "epoch": 896} {"train_loss": -5.52960729598999, "global_step": 37669, "epoch": 896} {"train_loss": -5.5265727043151855, "global_step": 37670, "epoch": 896} {"train_loss": -5.540002346038818, "global_step": 37671, "epoch": 896} {"train_loss": -5.474123001098633, "global_step": 37672, "epoch": 896} {"train_loss": -5.571090346290951, "global_step": 37673, "epoch": 896, "val_loss": 62413.99609375} {"train_loss": -5.632105350494385, "global_step": 37674, "epoch": 897} {"train_loss": -5.562685489654541, "global_step": 37675, "epoch": 897} {"train_loss": -5.545684814453125, "global_step": 37676, "epoch": 897} {"train_loss": -5.589552879333496, "global_step": 37677, "epoch": 897} {"train_loss": -5.7615461349487305, "global_step": 37678, "epoch": 897} {"train_loss": -5.6811394691467285, "global_step": 37679, "epoch": 897} {"train_loss": -5.661542892456055, "global_step": 37680, "epoch": 897} {"train_loss": -5.459281921386719, "global_step": 37681, "epoch": 897} {"train_loss": -5.631850242614746, "global_step": 37682, "epoch": 897} {"train_loss": -5.623171806335449, "global_step": 37683, "epoch": 897} {"train_loss": -5.587255477905273, "global_step": 37684, "epoch": 897} {"train_loss": -5.673941135406494, "global_step": 37685, "epoch": 897} {"train_loss": -5.680119514465332, "global_step": 37686, "epoch": 897} {"train_loss": -5.502402305603027, "global_step": 37687, "epoch": 897} {"train_loss": -5.610989570617676, "global_step": 37688, "epoch": 897} {"train_loss": -5.529126167297363, "global_step": 37689, "epoch": 897} {"train_loss": -5.68293571472168, "global_step": 37690, "epoch": 897} {"train_loss": -5.552812099456787, "global_step": 37691, "epoch": 897} {"train_loss": -5.6444993019104, "global_step": 37692, "epoch": 897} {"train_loss": -5.600706100463867, "global_step": 37693, "epoch": 897} {"train_loss": -5.619846343994141, "global_step": 37694, "epoch": 897} {"train_loss": -5.636641502380371, "global_step": 37695, "epoch": 897} {"train_loss": -5.644922733306885, "global_step": 37696, "epoch": 897} {"train_loss": -5.644432067871094, "global_step": 37697, "epoch": 897} {"train_loss": -5.517443656921387, "global_step": 37698, "epoch": 897} {"train_loss": -5.592311859130859, "global_step": 37699, "epoch": 897} {"train_loss": -5.7342987060546875, "global_step": 37700, "epoch": 897} {"train_loss": -5.607388019561768, "global_step": 37701, "epoch": 897} {"train_loss": -5.614820957183838, "global_step": 37702, "epoch": 897} {"train_loss": -5.625265598297119, "global_step": 37703, "epoch": 897} {"train_loss": -5.728000164031982, "global_step": 37704, "epoch": 897} {"train_loss": -5.5603413581848145, "global_step": 37705, "epoch": 897} {"train_loss": -5.623953819274902, "global_step": 37706, "epoch": 897} {"train_loss": -5.546682357788086, "global_step": 37707, "epoch": 897} {"train_loss": -5.646040916442871, "global_step": 37708, "epoch": 897} {"train_loss": -5.573189735412598, "global_step": 37709, "epoch": 897} {"train_loss": -5.565054893493652, "global_step": 37710, "epoch": 897} {"train_loss": -5.62922477722168, "global_step": 37711, "epoch": 897} {"train_loss": -5.543929576873779, "global_step": 37712, "epoch": 897} {"train_loss": -5.629580020904541, "global_step": 37713, "epoch": 897} {"train_loss": -5.662413120269775, "global_step": 37714, "epoch": 897} {"train_loss": -5.613584370840163, "global_step": 37715, "epoch": 897, "val_loss": 61935.2421875} {"train_loss": -5.66007137298584, "global_step": 37716, "epoch": 898} {"train_loss": -5.759803771972656, "global_step": 37717, "epoch": 898} {"train_loss": -5.674659729003906, "global_step": 37718, "epoch": 898} {"train_loss": -5.5871686935424805, "global_step": 37719, "epoch": 898} {"train_loss": -5.583913803100586, "global_step": 37720, "epoch": 898} {"train_loss": -5.73422908782959, "global_step": 37721, "epoch": 898} {"train_loss": -5.696301460266113, "global_step": 37722, "epoch": 898} {"train_loss": -5.588945388793945, "global_step": 37723, "epoch": 898} {"train_loss": -5.683319091796875, "global_step": 37724, "epoch": 898} {"train_loss": -5.658048629760742, "global_step": 37725, "epoch": 898} {"train_loss": -5.8050336837768555, "global_step": 37726, "epoch": 898} {"train_loss": -5.666731834411621, "global_step": 37727, "epoch": 898} {"train_loss": -5.600282669067383, "global_step": 37728, "epoch": 898} {"train_loss": -5.605388164520264, "global_step": 37729, "epoch": 898} {"train_loss": -5.612729549407959, "global_step": 37730, "epoch": 898} {"train_loss": -5.6604461669921875, "global_step": 37731, "epoch": 898} {"train_loss": -5.629328727722168, "global_step": 37732, "epoch": 898} {"train_loss": -5.663110256195068, "global_step": 37733, "epoch": 898} {"train_loss": -5.488672256469727, "global_step": 37734, "epoch": 898} {"train_loss": -5.594428062438965, "global_step": 37735, "epoch": 898} {"train_loss": -5.606274604797363, "global_step": 37736, "epoch": 898} {"train_loss": -5.508654594421387, "global_step": 37737, "epoch": 898} {"train_loss": -5.716006278991699, "global_step": 37738, "epoch": 898} {"train_loss": -5.516679286956787, "global_step": 37739, "epoch": 898} {"train_loss": -5.568856716156006, "global_step": 37740, "epoch": 898} {"train_loss": -5.6721930503845215, "global_step": 37741, "epoch": 898} {"train_loss": -5.536733627319336, "global_step": 37742, "epoch": 898} {"train_loss": -5.67758846282959, "global_step": 37743, "epoch": 898} {"train_loss": -5.601454734802246, "global_step": 37744, "epoch": 898} {"train_loss": -5.450178623199463, "global_step": 37745, "epoch": 898} {"train_loss": -5.54793643951416, "global_step": 37746, "epoch": 898} {"train_loss": -5.626435279846191, "global_step": 37747, "epoch": 898} {"train_loss": -5.521862506866455, "global_step": 37748, "epoch": 898} {"train_loss": -5.52199649810791, "global_step": 37749, "epoch": 898} {"train_loss": -5.546634674072266, "global_step": 37750, "epoch": 898} {"train_loss": -5.456510543823242, "global_step": 37751, "epoch": 898} {"train_loss": -5.551625728607178, "global_step": 37752, "epoch": 898} {"train_loss": -5.558687210083008, "global_step": 37753, "epoch": 898} {"train_loss": -5.524176597595215, "global_step": 37754, "epoch": 898} {"train_loss": -5.524672508239746, "global_step": 37755, "epoch": 898} {"train_loss": -5.559566974639893, "global_step": 37756, "epoch": 898} {"train_loss": -5.602742547080631, "global_step": 37757, "epoch": 898, "val_loss": 62277.68359375} {"train_loss": -5.581560134887695, "global_step": 37758, "epoch": 899} {"train_loss": -5.473302841186523, "global_step": 37759, "epoch": 899} {"train_loss": -5.6875176429748535, "global_step": 37760, "epoch": 899} {"train_loss": -5.620929718017578, "global_step": 37761, "epoch": 899} {"train_loss": -5.659304618835449, "global_step": 37762, "epoch": 899} {"train_loss": -5.664158344268799, "global_step": 37763, "epoch": 899} {"train_loss": -5.649715900421143, "global_step": 37764, "epoch": 899} {"train_loss": -5.66987943649292, "global_step": 37765, "epoch": 899} {"train_loss": -5.643404960632324, "global_step": 37766, "epoch": 899} {"train_loss": -5.632290840148926, "global_step": 37767, "epoch": 899} {"train_loss": -5.510679244995117, "global_step": 37768, "epoch": 899} {"train_loss": -5.6146979331970215, "global_step": 37769, "epoch": 899} {"train_loss": -5.611387729644775, "global_step": 37770, "epoch": 899} {"train_loss": -5.528220176696777, "global_step": 37771, "epoch": 899} {"train_loss": -5.495668411254883, "global_step": 37772, "epoch": 899} {"train_loss": -5.63101863861084, "global_step": 37773, "epoch": 899} {"train_loss": -5.680154800415039, "global_step": 37774, "epoch": 899} {"train_loss": -5.412137031555176, "global_step": 37775, "epoch": 899} {"train_loss": -5.4982805252075195, "global_step": 37776, "epoch": 899} {"train_loss": -5.5346598625183105, "global_step": 37777, "epoch": 899} {"train_loss": -5.492271900177002, "global_step": 37778, "epoch": 899} {"train_loss": -5.589144229888916, "global_step": 37779, "epoch": 899} {"train_loss": -5.66124153137207, "global_step": 37780, "epoch": 899} {"train_loss": -5.604532241821289, "global_step": 37781, "epoch": 899} {"train_loss": -5.582671165466309, "global_step": 37782, "epoch": 899} {"train_loss": -5.698633193969727, "global_step": 37783, "epoch": 899} {"train_loss": -5.586634635925293, "global_step": 37784, "epoch": 899} {"train_loss": -5.462151527404785, "global_step": 37785, "epoch": 899} {"train_loss": -5.569361686706543, "global_step": 37786, "epoch": 899} {"train_loss": -5.609228134155273, "global_step": 37787, "epoch": 899} {"train_loss": -5.648802757263184, "global_step": 37788, "epoch": 899} {"train_loss": -5.754726886749268, "global_step": 37789, "epoch": 899} {"train_loss": -5.73236083984375, "global_step": 37790, "epoch": 899} {"train_loss": -5.616002082824707, "global_step": 37791, "epoch": 899} {"train_loss": -5.67299222946167, "global_step": 37792, "epoch": 899} {"train_loss": -5.6598639488220215, "global_step": 37793, "epoch": 899} {"train_loss": -5.6809468269348145, "global_step": 37794, "epoch": 899} {"train_loss": -5.450952529907227, "global_step": 37795, "epoch": 899} {"train_loss": -5.437996864318848, "global_step": 37796, "epoch": 899} {"train_loss": -5.478396892547607, "global_step": 37797, "epoch": 899} {"train_loss": -5.511636734008789, "global_step": 37798, "epoch": 899} {"train_loss": -5.589809474490938, "global_step": 37799, "epoch": 899, "val_loss": 62154.640625} {"train_loss": -5.599841117858887, "global_step": 37800, "epoch": 900} {"train_loss": -5.640261173248291, "global_step": 37801, "epoch": 900} {"train_loss": -5.588964939117432, "global_step": 37802, "epoch": 900} {"train_loss": -5.4934773445129395, "global_step": 37803, "epoch": 900} {"train_loss": -5.528574466705322, "global_step": 37804, "epoch": 900} {"train_loss": -5.636866569519043, "global_step": 37805, "epoch": 900} {"train_loss": -5.5702409744262695, "global_step": 37806, "epoch": 900} {"train_loss": -5.6532697677612305, "global_step": 37807, "epoch": 900} {"train_loss": -5.6288042068481445, "global_step": 37808, "epoch": 900} {"train_loss": -5.629955768585205, "global_step": 37809, "epoch": 900} {"train_loss": -5.522615909576416, "global_step": 37810, "epoch": 900} {"train_loss": -5.68951416015625, "global_step": 37811, "epoch": 900} {"train_loss": -5.662328243255615, "global_step": 37812, "epoch": 900} {"train_loss": -5.503857612609863, "global_step": 37813, "epoch": 900} {"train_loss": -5.668633460998535, "global_step": 37814, "epoch": 900} {"train_loss": -5.539819240570068, "global_step": 37815, "epoch": 900} {"train_loss": -5.581338882446289, "global_step": 37816, "epoch": 900} {"train_loss": -5.640647888183594, "global_step": 37817, "epoch": 900} {"train_loss": -5.594676971435547, "global_step": 37818, "epoch": 900} {"train_loss": -5.741193771362305, "global_step": 37819, "epoch": 900} {"train_loss": -5.477409362792969, "global_step": 37820, "epoch": 900} {"train_loss": -5.583401679992676, "global_step": 37821, "epoch": 900} {"train_loss": -5.6865949630737305, "global_step": 37822, "epoch": 900} {"train_loss": -5.5545334815979, "global_step": 37823, "epoch": 900} {"train_loss": -5.509697914123535, "global_step": 37824, "epoch": 900} {"train_loss": -5.494946479797363, "global_step": 37825, "epoch": 900} {"train_loss": -5.545622825622559, "global_step": 37826, "epoch": 900} {"train_loss": -5.549625396728516, "global_step": 37827, "epoch": 900} {"train_loss": -5.4200615882873535, "global_step": 37828, "epoch": 900} {"train_loss": -5.639369487762451, "global_step": 37829, "epoch": 900} {"train_loss": -5.647355079650879, "global_step": 37830, "epoch": 900} {"train_loss": -5.585448265075684, "global_step": 37831, "epoch": 900} {"train_loss": -5.590313911437988, "global_step": 37832, "epoch": 900} {"train_loss": -5.589336395263672, "global_step": 37833, "epoch": 900} {"train_loss": -5.576622486114502, "global_step": 37834, "epoch": 900} {"train_loss": -5.5548906326293945, "global_step": 37835, "epoch": 900} {"train_loss": -5.674910068511963, "global_step": 37836, "epoch": 900} {"train_loss": -5.644256114959717, "global_step": 37837, "epoch": 900} {"train_loss": -5.682990074157715, "global_step": 37838, "epoch": 900} {"train_loss": -5.6303486824035645, "global_step": 37839, "epoch": 900} {"train_loss": -5.529071807861328, "global_step": 37840, "epoch": 900} {"train_loss": -5.591136421476092, "global_step": 37841, "epoch": 900, "train/sim_max_reward_0": 0.2096868915045649, "train/sim_max_reward_1": 0.48775284607146296, "train/sim_max_reward_2": 0.413384127228691, "train/sim_max_reward_3": 0.1199321632219586, "train/sim_max_reward_4": 0.9028256464058915, "train/sim_max_reward_5": 0.5389024516412589, "test/sim_max_reward_4300000": 0.40706922922060795, "test/sim_max_reward_4300001": 0.013894408966596014, "test/sim_max_reward_4300002": 0.23440640913349442, "test/sim_max_reward_4300003": 0.723143852813766, "test/sim_max_reward_4300004": 0.04665640326282213, "test/sim_max_reward_4300005": 0.4132422027617797, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3522753788975498, "test/sim_max_reward_4300008": 0.0, "test/sim_max_reward_4300009": 0.7834034548409253, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.2621044173971572, "test/sim_max_reward_4300012": 0.38942472439987336, "test/sim_max_reward_4300013": 0.48991436081503387, "test/sim_max_reward_4300014": 0.505177045682367, "test/sim_max_reward_4300015": 0.4794677515206023, "test/sim_max_reward_4300016": 0.4429627624881825, "test/sim_max_reward_4300017": 0.46290888524774326, "test/sim_max_reward_4300018": 0.30154188984375585, "test/sim_max_reward_4300019": 0.1853344929043627, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9696062270704208, "test/sim_max_reward_4300022": 0.8063903667151228, "test/sim_max_reward_4300023": 0.3494869832474777, "test/sim_max_reward_4300024": 0.4058096137710447, "test/sim_max_reward_4300025": 0.4659909128266152, "test/sim_max_reward_4300026": 0.31254741934637414, "test/sim_max_reward_4300027": 0.8863001004374887, "test/sim_max_reward_4300028": 0.013711081655819723, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.5196804543172596, "test/sim_max_reward_4300031": 0.0, "test/sim_max_reward_4300032": 0.7380402590966313, "test/sim_max_reward_4300033": 0.4751030714108889, "test/sim_max_reward_4300034": 6.409102722171371e-05, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.6460627260139455, "test/sim_max_reward_4300038": 0.5534836626577471, "test/sim_max_reward_4300039": 0.4176631603284335, "test/sim_max_reward_4300040": 0.13507492348370267, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7215325207792834, "test/sim_max_reward_4300043": 0.01912165197990456, "test/sim_max_reward_4300044": 0.41109389783795297, "test/sim_max_reward_4300045": 0.16305059105012143, "test/sim_max_reward_4300046": 0.0700145957927769, "test/sim_max_reward_4300047": 0.6955237091848123, "test/sim_max_reward_4300048": 0.4127921963093015, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.4454140210123046, "test/mean_score": 0.3376053200420089, "val_loss": 62723.31640625} {"train_loss": -5.410160064697266, "global_step": 37842, "epoch": 901} {"train_loss": -5.595659255981445, "global_step": 37843, "epoch": 901} {"train_loss": -5.608059406280518, "global_step": 37844, "epoch": 901} {"train_loss": -5.688918590545654, "global_step": 37845, "epoch": 901} {"train_loss": -5.591091156005859, "global_step": 37846, "epoch": 901} {"train_loss": -5.6119279861450195, "global_step": 37847, "epoch": 901} {"train_loss": -5.613259792327881, "global_step": 37848, "epoch": 901} {"train_loss": -5.5092387199401855, "global_step": 37849, "epoch": 901} {"train_loss": -5.54421854019165, "global_step": 37850, "epoch": 901} {"train_loss": -5.438248634338379, "global_step": 37851, "epoch": 901} {"train_loss": -5.536953449249268, "global_step": 37852, "epoch": 901} {"train_loss": -5.679813385009766, "global_step": 37853, "epoch": 901} {"train_loss": -5.438119888305664, "global_step": 37854, "epoch": 901} {"train_loss": -5.635148525238037, "global_step": 37855, "epoch": 901} {"train_loss": -5.6510233879089355, "global_step": 37856, "epoch": 901} {"train_loss": -5.510794162750244, "global_step": 37857, "epoch": 901} {"train_loss": -5.555238723754883, "global_step": 37858, "epoch": 901} {"train_loss": -5.585043907165527, "global_step": 37859, "epoch": 901} {"train_loss": -5.450618743896484, "global_step": 37860, "epoch": 901} {"train_loss": -5.561527729034424, "global_step": 37861, "epoch": 901} {"train_loss": -5.617242336273193, "global_step": 37862, "epoch": 901} {"train_loss": -5.682280540466309, "global_step": 37863, "epoch": 901} {"train_loss": -5.6787824630737305, "global_step": 37864, "epoch": 901} {"train_loss": -5.641441822052002, "global_step": 37865, "epoch": 901} {"train_loss": -5.576383113861084, "global_step": 37866, "epoch": 901} {"train_loss": -5.588200092315674, "global_step": 37867, "epoch": 901} {"train_loss": -5.619926452636719, "global_step": 37868, "epoch": 901} {"train_loss": -5.546486854553223, "global_step": 37869, "epoch": 901} {"train_loss": -5.510032653808594, "global_step": 37870, "epoch": 901} {"train_loss": -5.63871955871582, "global_step": 37871, "epoch": 901} {"train_loss": -5.617539405822754, "global_step": 37872, "epoch": 901} {"train_loss": -5.662449359893799, "global_step": 37873, "epoch": 901} {"train_loss": -5.625576972961426, "global_step": 37874, "epoch": 901} {"train_loss": -5.552746772766113, "global_step": 37875, "epoch": 901} {"train_loss": -5.644331932067871, "global_step": 37876, "epoch": 901} {"train_loss": -5.65773868560791, "global_step": 37877, "epoch": 901} {"train_loss": -5.667499542236328, "global_step": 37878, "epoch": 901} {"train_loss": -5.665255069732666, "global_step": 37879, "epoch": 901} {"train_loss": -5.530740737915039, "global_step": 37880, "epoch": 901} {"train_loss": -5.766348838806152, "global_step": 37881, "epoch": 901} {"train_loss": -5.602224349975586, "global_step": 37882, "epoch": 901} {"train_loss": -5.59305679230463, "global_step": 37883, "epoch": 901, "val_loss": 62101.46875} {"train_loss": -5.637671947479248, "global_step": 37884, "epoch": 902} {"train_loss": -5.696418762207031, "global_step": 37885, "epoch": 902} {"train_loss": -5.665609359741211, "global_step": 37886, "epoch": 902} {"train_loss": -5.629020690917969, "global_step": 37887, "epoch": 902} {"train_loss": -5.6790947914123535, "global_step": 37888, "epoch": 902} {"train_loss": -5.559474945068359, "global_step": 37889, "epoch": 902} {"train_loss": -5.535950660705566, "global_step": 37890, "epoch": 902} {"train_loss": -5.696837425231934, "global_step": 37891, "epoch": 902} {"train_loss": -5.5421600341796875, "global_step": 37892, "epoch": 902} {"train_loss": -5.628502368927002, "global_step": 37893, "epoch": 902} {"train_loss": -5.575056076049805, "global_step": 37894, "epoch": 902} {"train_loss": -5.633029937744141, "global_step": 37895, "epoch": 902} {"train_loss": -5.659163475036621, "global_step": 37896, "epoch": 902} {"train_loss": -5.63947868347168, "global_step": 37897, "epoch": 902} {"train_loss": -5.650306701660156, "global_step": 37898, "epoch": 902} {"train_loss": -5.528225898742676, "global_step": 37899, "epoch": 902} {"train_loss": -5.664978504180908, "global_step": 37900, "epoch": 902} {"train_loss": -5.581007957458496, "global_step": 37901, "epoch": 902} {"train_loss": -5.527624130249023, "global_step": 37902, "epoch": 902} {"train_loss": -5.635786533355713, "global_step": 37903, "epoch": 902} {"train_loss": -5.6741943359375, "global_step": 37904, "epoch": 902} {"train_loss": -5.663865089416504, "global_step": 37905, "epoch": 902} {"train_loss": -5.629199981689453, "global_step": 37906, "epoch": 902} {"train_loss": -5.7784576416015625, "global_step": 37907, "epoch": 902} {"train_loss": -5.537199974060059, "global_step": 37908, "epoch": 902} {"train_loss": -5.499295711517334, "global_step": 37909, "epoch": 902} {"train_loss": -5.714799880981445, "global_step": 37910, "epoch": 902} {"train_loss": -5.763907432556152, "global_step": 37911, "epoch": 902} {"train_loss": -5.6024909019470215, "global_step": 37912, "epoch": 902} {"train_loss": -5.671565055847168, "global_step": 37913, "epoch": 902} {"train_loss": -5.585355758666992, "global_step": 37914, "epoch": 902} {"train_loss": -5.395913124084473, "global_step": 37915, "epoch": 902} {"train_loss": -5.673087120056152, "global_step": 37916, "epoch": 902} {"train_loss": -5.54021692276001, "global_step": 37917, "epoch": 902} {"train_loss": -5.688092231750488, "global_step": 37918, "epoch": 902} {"train_loss": -5.55881404876709, "global_step": 37919, "epoch": 902} {"train_loss": -5.60655403137207, "global_step": 37920, "epoch": 902} {"train_loss": -5.540553569793701, "global_step": 37921, "epoch": 902} {"train_loss": -5.528180122375488, "global_step": 37922, "epoch": 902} {"train_loss": -5.6724138259887695, "global_step": 37923, "epoch": 902} {"train_loss": -5.546420097351074, "global_step": 37924, "epoch": 902} {"train_loss": -5.616007577805292, "global_step": 37925, "epoch": 902, "val_loss": 62178.4375} {"train_loss": -5.521735191345215, "global_step": 37926, "epoch": 903} {"train_loss": -5.5808916091918945, "global_step": 37927, "epoch": 903} {"train_loss": -5.560335159301758, "global_step": 37928, "epoch": 903} {"train_loss": -5.613553524017334, "global_step": 37929, "epoch": 903} {"train_loss": -5.665670394897461, "global_step": 37930, "epoch": 903} {"train_loss": -5.730151176452637, "global_step": 37931, "epoch": 903} {"train_loss": -5.6922149658203125, "global_step": 37932, "epoch": 903} {"train_loss": -5.691984176635742, "global_step": 37933, "epoch": 903} {"train_loss": -5.691125869750977, "global_step": 37934, "epoch": 903} {"train_loss": -5.519134044647217, "global_step": 37935, "epoch": 903} {"train_loss": -5.577852725982666, "global_step": 37936, "epoch": 903} {"train_loss": -5.642967224121094, "global_step": 37937, "epoch": 903} {"train_loss": -5.590095520019531, "global_step": 37938, "epoch": 903} {"train_loss": -5.65975284576416, "global_step": 37939, "epoch": 903} {"train_loss": -5.543173789978027, "global_step": 37940, "epoch": 903} {"train_loss": -5.664176940917969, "global_step": 37941, "epoch": 903} {"train_loss": -5.650666236877441, "global_step": 37942, "epoch": 903} {"train_loss": -5.76017951965332, "global_step": 37943, "epoch": 903} {"train_loss": -5.621731758117676, "global_step": 37944, "epoch": 903} {"train_loss": -5.642470359802246, "global_step": 37945, "epoch": 903} {"train_loss": -5.684139728546143, "global_step": 37946, "epoch": 903} {"train_loss": -5.612373352050781, "global_step": 37947, "epoch": 903} {"train_loss": -5.479260444641113, "global_step": 37948, "epoch": 903} {"train_loss": -5.544802188873291, "global_step": 37949, "epoch": 903} {"train_loss": -5.621669769287109, "global_step": 37950, "epoch": 903} {"train_loss": -5.563958168029785, "global_step": 37951, "epoch": 903} {"train_loss": -5.598516464233398, "global_step": 37952, "epoch": 903} {"train_loss": -5.610207557678223, "global_step": 37953, "epoch": 903} {"train_loss": -5.561406135559082, "global_step": 37954, "epoch": 903} {"train_loss": -5.601691246032715, "global_step": 37955, "epoch": 903} {"train_loss": -5.601987838745117, "global_step": 37956, "epoch": 903} {"train_loss": -5.632250785827637, "global_step": 37957, "epoch": 903} {"train_loss": -5.541403770446777, "global_step": 37958, "epoch": 903} {"train_loss": -5.517078399658203, "global_step": 37959, "epoch": 903} {"train_loss": -5.5949859619140625, "global_step": 37960, "epoch": 903} {"train_loss": -5.672895908355713, "global_step": 37961, "epoch": 903} {"train_loss": -5.544956207275391, "global_step": 37962, "epoch": 903} {"train_loss": -5.606264591217041, "global_step": 37963, "epoch": 903} {"train_loss": -5.698887825012207, "global_step": 37964, "epoch": 903} {"train_loss": -5.55537223815918, "global_step": 37965, "epoch": 903} {"train_loss": -5.546077251434326, "global_step": 37966, "epoch": 903} {"train_loss": -5.609071481795538, "global_step": 37967, "epoch": 903, "val_loss": 62102.41796875} {"train_loss": -5.664278507232666, "global_step": 37968, "epoch": 904} {"train_loss": -5.6127214431762695, "global_step": 37969, "epoch": 904} {"train_loss": -5.5792341232299805, "global_step": 37970, "epoch": 904} {"train_loss": -5.688863754272461, "global_step": 37971, "epoch": 904} {"train_loss": -5.480123519897461, "global_step": 37972, "epoch": 904} {"train_loss": -5.533478736877441, "global_step": 37973, "epoch": 904} {"train_loss": -5.658647537231445, "global_step": 37974, "epoch": 904} {"train_loss": -5.633727073669434, "global_step": 37975, "epoch": 904} {"train_loss": -5.6414899826049805, "global_step": 37976, "epoch": 904} {"train_loss": -5.739649295806885, "global_step": 37977, "epoch": 904} {"train_loss": -5.666172027587891, "global_step": 37978, "epoch": 904} {"train_loss": -5.495247840881348, "global_step": 37979, "epoch": 904} {"train_loss": -5.555106163024902, "global_step": 37980, "epoch": 904} {"train_loss": -5.548736572265625, "global_step": 37981, "epoch": 904} {"train_loss": -5.618084907531738, "global_step": 37982, "epoch": 904} {"train_loss": -5.5874457359313965, "global_step": 37983, "epoch": 904} {"train_loss": -5.5807414054870605, "global_step": 37984, "epoch": 904} {"train_loss": -5.549314498901367, "global_step": 37985, "epoch": 904} {"train_loss": -5.5758867263793945, "global_step": 37986, "epoch": 904} {"train_loss": -5.682295799255371, "global_step": 37987, "epoch": 904} {"train_loss": -5.407309532165527, "global_step": 37988, "epoch": 904} {"train_loss": -5.678765296936035, "global_step": 37989, "epoch": 904} {"train_loss": -5.589601516723633, "global_step": 37990, "epoch": 904} {"train_loss": -5.523756980895996, "global_step": 37991, "epoch": 904} {"train_loss": -5.472655773162842, "global_step": 37992, "epoch": 904} {"train_loss": -5.552155494689941, "global_step": 37993, "epoch": 904} {"train_loss": -5.534235954284668, "global_step": 37994, "epoch": 904} {"train_loss": -5.638031959533691, "global_step": 37995, "epoch": 904} {"train_loss": -5.629997253417969, "global_step": 37996, "epoch": 904} {"train_loss": -5.604874610900879, "global_step": 37997, "epoch": 904} {"train_loss": -5.6406354904174805, "global_step": 37998, "epoch": 904} {"train_loss": -5.614335536956787, "global_step": 37999, "epoch": 904} {"train_loss": -5.577898979187012, "global_step": 38000, "epoch": 904} {"train_loss": -5.563631057739258, "global_step": 38001, "epoch": 904} {"train_loss": -5.61368465423584, "global_step": 38002, "epoch": 904} {"train_loss": -5.41983699798584, "global_step": 38003, "epoch": 904} {"train_loss": -5.516243934631348, "global_step": 38004, "epoch": 904} {"train_loss": -5.577425956726074, "global_step": 38005, "epoch": 904} {"train_loss": -5.488592147827148, "global_step": 38006, "epoch": 904} {"train_loss": -5.568551063537598, "global_step": 38007, "epoch": 904} {"train_loss": -5.508753299713135, "global_step": 38008, "epoch": 904} {"train_loss": -5.580313875561669, "global_step": 38009, "epoch": 904, "val_loss": 62068.64453125} {"train_loss": -5.612461090087891, "global_step": 38010, "epoch": 905} {"train_loss": -5.42735481262207, "global_step": 38011, "epoch": 905} {"train_loss": -5.608562469482422, "global_step": 38012, "epoch": 905} {"train_loss": -5.61604118347168, "global_step": 38013, "epoch": 905} {"train_loss": -5.613985061645508, "global_step": 38014, "epoch": 905} {"train_loss": -5.458470821380615, "global_step": 38015, "epoch": 905} {"train_loss": -5.625762939453125, "global_step": 38016, "epoch": 905} {"train_loss": -5.63447904586792, "global_step": 38017, "epoch": 905} {"train_loss": -5.623758792877197, "global_step": 38018, "epoch": 905} {"train_loss": -5.5732808113098145, "global_step": 38019, "epoch": 905} {"train_loss": -5.605230808258057, "global_step": 38020, "epoch": 905} {"train_loss": -5.730800628662109, "global_step": 38021, "epoch": 905} {"train_loss": -5.649657249450684, "global_step": 38022, "epoch": 905} {"train_loss": -5.676408290863037, "global_step": 38023, "epoch": 905} {"train_loss": -5.653852939605713, "global_step": 38024, "epoch": 905} {"train_loss": -5.742937088012695, "global_step": 38025, "epoch": 905} {"train_loss": -5.519604682922363, "global_step": 38026, "epoch": 905} {"train_loss": -5.649637222290039, "global_step": 38027, "epoch": 905} {"train_loss": -5.5876946449279785, "global_step": 38028, "epoch": 905} {"train_loss": -5.610312461853027, "global_step": 38029, "epoch": 905} {"train_loss": -5.512819290161133, "global_step": 38030, "epoch": 905} {"train_loss": -5.653267860412598, "global_step": 38031, "epoch": 905} {"train_loss": -5.597864627838135, "global_step": 38032, "epoch": 905} {"train_loss": -5.561384201049805, "global_step": 38033, "epoch": 905} {"train_loss": -5.538932800292969, "global_step": 38034, "epoch": 905} {"train_loss": -5.544873237609863, "global_step": 38035, "epoch": 905} {"train_loss": -5.652952671051025, "global_step": 38036, "epoch": 905} {"train_loss": -5.578062057495117, "global_step": 38037, "epoch": 905} {"train_loss": -5.506247520446777, "global_step": 38038, "epoch": 905} {"train_loss": -5.514203071594238, "global_step": 38039, "epoch": 905} {"train_loss": -5.5322771072387695, "global_step": 38040, "epoch": 905} {"train_loss": -5.525678634643555, "global_step": 38041, "epoch": 905} {"train_loss": -5.557570457458496, "global_step": 38042, "epoch": 905} {"train_loss": -5.574748992919922, "global_step": 38043, "epoch": 905} {"train_loss": -5.478960037231445, "global_step": 38044, "epoch": 905} {"train_loss": -5.572599411010742, "global_step": 38045, "epoch": 905} {"train_loss": -5.55440616607666, "global_step": 38046, "epoch": 905} {"train_loss": -5.579648494720459, "global_step": 38047, "epoch": 905} {"train_loss": -5.596514701843262, "global_step": 38048, "epoch": 905} {"train_loss": -5.546810626983643, "global_step": 38049, "epoch": 905} {"train_loss": -5.628497123718262, "global_step": 38050, "epoch": 905} {"train_loss": -5.5852846304575605, "global_step": 38051, "epoch": 905, "val_loss": 62135.68359375} {"train_loss": -5.509381294250488, "global_step": 38052, "epoch": 906} {"train_loss": -5.589545249938965, "global_step": 38053, "epoch": 906} {"train_loss": -5.624833106994629, "global_step": 38054, "epoch": 906} {"train_loss": -5.510605812072754, "global_step": 38055, "epoch": 906} {"train_loss": -5.569983005523682, "global_step": 38056, "epoch": 906} {"train_loss": -5.580400466918945, "global_step": 38057, "epoch": 906} {"train_loss": -5.580012321472168, "global_step": 38058, "epoch": 906} {"train_loss": -5.668130874633789, "global_step": 38059, "epoch": 906} {"train_loss": -5.637188911437988, "global_step": 38060, "epoch": 906} {"train_loss": -5.550717353820801, "global_step": 38061, "epoch": 906} {"train_loss": -5.609098434448242, "global_step": 38062, "epoch": 906} {"train_loss": -5.586623668670654, "global_step": 38063, "epoch": 906} {"train_loss": -5.564477920532227, "global_step": 38064, "epoch": 906} {"train_loss": -5.6656084060668945, "global_step": 38065, "epoch": 906} {"train_loss": -5.590453147888184, "global_step": 38066, "epoch": 906} {"train_loss": -5.524097442626953, "global_step": 38067, "epoch": 906} {"train_loss": -5.597668647766113, "global_step": 38068, "epoch": 906} {"train_loss": -5.702991485595703, "global_step": 38069, "epoch": 906} {"train_loss": -5.599431991577148, "global_step": 38070, "epoch": 906} {"train_loss": -5.500084400177002, "global_step": 38071, "epoch": 906} {"train_loss": -5.4888691902160645, "global_step": 38072, "epoch": 906} {"train_loss": -5.628824710845947, "global_step": 38073, "epoch": 906} {"train_loss": -5.652331829071045, "global_step": 38074, "epoch": 906} {"train_loss": -5.675541877746582, "global_step": 38075, "epoch": 906} {"train_loss": -5.703474044799805, "global_step": 38076, "epoch": 906} {"train_loss": -5.746792793273926, "global_step": 38077, "epoch": 906} {"train_loss": -5.463555335998535, "global_step": 38078, "epoch": 906} {"train_loss": -5.722408771514893, "global_step": 38079, "epoch": 906} {"train_loss": -5.582231044769287, "global_step": 38080, "epoch": 906} {"train_loss": -5.593487739562988, "global_step": 38081, "epoch": 906} {"train_loss": -5.5977373123168945, "global_step": 38082, "epoch": 906} {"train_loss": -5.691054821014404, "global_step": 38083, "epoch": 906} {"train_loss": -5.564688682556152, "global_step": 38084, "epoch": 906} {"train_loss": -5.541026592254639, "global_step": 38085, "epoch": 906} {"train_loss": -5.465507507324219, "global_step": 38086, "epoch": 906} {"train_loss": -5.554685592651367, "global_step": 38087, "epoch": 906} {"train_loss": -5.465267181396484, "global_step": 38088, "epoch": 906} {"train_loss": -5.6219329833984375, "global_step": 38089, "epoch": 906} {"train_loss": -5.613838195800781, "global_step": 38090, "epoch": 906} {"train_loss": -5.632723808288574, "global_step": 38091, "epoch": 906} {"train_loss": -5.669742584228516, "global_step": 38092, "epoch": 906} {"train_loss": -5.595454976672218, "global_step": 38093, "epoch": 906, "val_loss": 62353.984375} {"train_loss": -5.577080249786377, "global_step": 38094, "epoch": 907} {"train_loss": -5.654558181762695, "global_step": 38095, "epoch": 907} {"train_loss": -5.590022087097168, "global_step": 38096, "epoch": 907} {"train_loss": -5.622028827667236, "global_step": 38097, "epoch": 907} {"train_loss": -5.640457630157471, "global_step": 38098, "epoch": 907} {"train_loss": -5.586007595062256, "global_step": 38099, "epoch": 907} {"train_loss": -5.595831871032715, "global_step": 38100, "epoch": 907} {"train_loss": -5.452083587646484, "global_step": 38101, "epoch": 907} {"train_loss": -5.575823783874512, "global_step": 38102, "epoch": 907} {"train_loss": -5.79532527923584, "global_step": 38103, "epoch": 907} {"train_loss": -5.547281742095947, "global_step": 38104, "epoch": 907} {"train_loss": -5.555976867675781, "global_step": 38105, "epoch": 907} {"train_loss": -5.557981491088867, "global_step": 38106, "epoch": 907} {"train_loss": -5.6316633224487305, "global_step": 38107, "epoch": 907} {"train_loss": -5.653249263763428, "global_step": 38108, "epoch": 907} {"train_loss": -5.499002933502197, "global_step": 38109, "epoch": 907} {"train_loss": -5.626483917236328, "global_step": 38110, "epoch": 907} {"train_loss": -5.480923652648926, "global_step": 38111, "epoch": 907} {"train_loss": -5.553099632263184, "global_step": 38112, "epoch": 907} {"train_loss": -5.464311599731445, "global_step": 38113, "epoch": 907} {"train_loss": -5.45583438873291, "global_step": 38114, "epoch": 907} {"train_loss": -5.536638259887695, "global_step": 38115, "epoch": 907} {"train_loss": -5.631556987762451, "global_step": 38116, "epoch": 907} {"train_loss": -5.585371971130371, "global_step": 38117, "epoch": 907} {"train_loss": -5.631594181060791, "global_step": 38118, "epoch": 907} {"train_loss": -5.542205810546875, "global_step": 38119, "epoch": 907} {"train_loss": -5.646289348602295, "global_step": 38120, "epoch": 907} {"train_loss": -5.611663818359375, "global_step": 38121, "epoch": 907} {"train_loss": -5.5231781005859375, "global_step": 38122, "epoch": 907} {"train_loss": -5.567439079284668, "global_step": 38123, "epoch": 907} {"train_loss": -5.580746650695801, "global_step": 38124, "epoch": 907} {"train_loss": -5.553261756896973, "global_step": 38125, "epoch": 907} {"train_loss": -5.639454364776611, "global_step": 38126, "epoch": 907} {"train_loss": -5.6325531005859375, "global_step": 38127, "epoch": 907} {"train_loss": -5.663571357727051, "global_step": 38128, "epoch": 907} {"train_loss": -5.5794878005981445, "global_step": 38129, "epoch": 907} {"train_loss": -5.6054182052612305, "global_step": 38130, "epoch": 907} {"train_loss": -5.58767032623291, "global_step": 38131, "epoch": 907} {"train_loss": -5.6218156814575195, "global_step": 38132, "epoch": 907} {"train_loss": -5.610097885131836, "global_step": 38133, "epoch": 907} {"train_loss": -5.641270160675049, "global_step": 38134, "epoch": 907} {"train_loss": -5.588243439084008, "global_step": 38135, "epoch": 907, "val_loss": 61996.2734375} {"train_loss": -5.562816143035889, "global_step": 38136, "epoch": 908} {"train_loss": -5.666558265686035, "global_step": 38137, "epoch": 908} {"train_loss": -5.60777473449707, "global_step": 38138, "epoch": 908} {"train_loss": -5.626091957092285, "global_step": 38139, "epoch": 908} {"train_loss": -5.64955997467041, "global_step": 38140, "epoch": 908} {"train_loss": -5.587603569030762, "global_step": 38141, "epoch": 908} {"train_loss": -5.542072296142578, "global_step": 38142, "epoch": 908} {"train_loss": -5.564061164855957, "global_step": 38143, "epoch": 908} {"train_loss": -5.714848518371582, "global_step": 38144, "epoch": 908} {"train_loss": -5.788275241851807, "global_step": 38145, "epoch": 908} {"train_loss": -5.643365859985352, "global_step": 38146, "epoch": 908} {"train_loss": -5.534689903259277, "global_step": 38147, "epoch": 908} {"train_loss": -5.593206405639648, "global_step": 38148, "epoch": 908} {"train_loss": -5.5908026695251465, "global_step": 38149, "epoch": 908} {"train_loss": -5.619885444641113, "global_step": 38150, "epoch": 908} {"train_loss": -5.718723773956299, "global_step": 38151, "epoch": 908} {"train_loss": -5.491758346557617, "global_step": 38152, "epoch": 908} {"train_loss": -5.554461479187012, "global_step": 38153, "epoch": 908} {"train_loss": -5.667731285095215, "global_step": 38154, "epoch": 908} {"train_loss": -5.590130805969238, "global_step": 38155, "epoch": 908} {"train_loss": -5.736988544464111, "global_step": 38156, "epoch": 908} {"train_loss": -5.611756324768066, "global_step": 38157, "epoch": 908} {"train_loss": -5.661148548126221, "global_step": 38158, "epoch": 908} {"train_loss": -5.65767240524292, "global_step": 38159, "epoch": 908} {"train_loss": -5.666751861572266, "global_step": 38160, "epoch": 908} {"train_loss": -5.574076175689697, "global_step": 38161, "epoch": 908} {"train_loss": -5.5249433517456055, "global_step": 38162, "epoch": 908} {"train_loss": -5.545540809631348, "global_step": 38163, "epoch": 908} {"train_loss": -5.706389427185059, "global_step": 38164, "epoch": 908} {"train_loss": -5.665159225463867, "global_step": 38165, "epoch": 908} {"train_loss": -5.519412040710449, "global_step": 38166, "epoch": 908} {"train_loss": -5.699416160583496, "global_step": 38167, "epoch": 908} {"train_loss": -5.634598731994629, "global_step": 38168, "epoch": 908} {"train_loss": -5.491129398345947, "global_step": 38169, "epoch": 908} {"train_loss": -5.667712688446045, "global_step": 38170, "epoch": 908} {"train_loss": -5.601478576660156, "global_step": 38171, "epoch": 908} {"train_loss": -5.497230529785156, "global_step": 38172, "epoch": 908} {"train_loss": -5.674344539642334, "global_step": 38173, "epoch": 908} {"train_loss": -5.590505599975586, "global_step": 38174, "epoch": 908} {"train_loss": -5.519309997558594, "global_step": 38175, "epoch": 908} {"train_loss": -5.661022186279297, "global_step": 38176, "epoch": 908} {"train_loss": -5.610932145799909, "global_step": 38177, "epoch": 908, "val_loss": 62073.8046875} {"train_loss": -5.583107948303223, "global_step": 38178, "epoch": 909} {"train_loss": -5.515580177307129, "global_step": 38179, "epoch": 909} {"train_loss": -5.606576919555664, "global_step": 38180, "epoch": 909} {"train_loss": -5.482370376586914, "global_step": 38181, "epoch": 909} {"train_loss": -5.541825294494629, "global_step": 38182, "epoch": 909} {"train_loss": -5.54661750793457, "global_step": 38183, "epoch": 909} {"train_loss": -5.598698616027832, "global_step": 38184, "epoch": 909} {"train_loss": -5.532137870788574, "global_step": 38185, "epoch": 909} {"train_loss": -5.514902591705322, "global_step": 38186, "epoch": 909} {"train_loss": -5.7511210441589355, "global_step": 38187, "epoch": 909} {"train_loss": -5.5403289794921875, "global_step": 38188, "epoch": 909} {"train_loss": -5.6930623054504395, "global_step": 38189, "epoch": 909} {"train_loss": -5.604078769683838, "global_step": 38190, "epoch": 909} {"train_loss": -5.683298110961914, "global_step": 38191, "epoch": 909} {"train_loss": -5.536883354187012, "global_step": 38192, "epoch": 909} {"train_loss": -5.587596893310547, "global_step": 38193, "epoch": 909} {"train_loss": -5.57380485534668, "global_step": 38194, "epoch": 909} {"train_loss": -5.637788772583008, "global_step": 38195, "epoch": 909} {"train_loss": -5.638913631439209, "global_step": 38196, "epoch": 909} {"train_loss": -5.471644401550293, "global_step": 38197, "epoch": 909} {"train_loss": -5.611695289611816, "global_step": 38198, "epoch": 909} {"train_loss": -5.612980365753174, "global_step": 38199, "epoch": 909} {"train_loss": -5.436635494232178, "global_step": 38200, "epoch": 909} {"train_loss": -5.627063274383545, "global_step": 38201, "epoch": 909} {"train_loss": -5.434272766113281, "global_step": 38202, "epoch": 909} {"train_loss": -5.719272613525391, "global_step": 38203, "epoch": 909} {"train_loss": -5.650910377502441, "global_step": 38204, "epoch": 909} {"train_loss": -5.543427467346191, "global_step": 38205, "epoch": 909} {"train_loss": -5.645008563995361, "global_step": 38206, "epoch": 909} {"train_loss": -5.552067756652832, "global_step": 38207, "epoch": 909} {"train_loss": -5.614408016204834, "global_step": 38208, "epoch": 909} {"train_loss": -5.700403690338135, "global_step": 38209, "epoch": 909} {"train_loss": -5.636418342590332, "global_step": 38210, "epoch": 909} {"train_loss": -5.592414855957031, "global_step": 38211, "epoch": 909} {"train_loss": -5.651142120361328, "global_step": 38212, "epoch": 909} {"train_loss": -5.659887313842773, "global_step": 38213, "epoch": 909} {"train_loss": -5.608712196350098, "global_step": 38214, "epoch": 909} {"train_loss": -5.5845627784729, "global_step": 38215, "epoch": 909} {"train_loss": -5.64290189743042, "global_step": 38216, "epoch": 909} {"train_loss": -5.632413864135742, "global_step": 38217, "epoch": 909} {"train_loss": -5.646084785461426, "global_step": 38218, "epoch": 909} {"train_loss": -5.599399589356922, "global_step": 38219, "epoch": 909, "val_loss": 62025.84765625} {"train_loss": -5.577181816101074, "global_step": 38220, "epoch": 910} {"train_loss": -5.670065879821777, "global_step": 38221, "epoch": 910} {"train_loss": -5.554116725921631, "global_step": 38222, "epoch": 910} {"train_loss": -5.438529014587402, "global_step": 38223, "epoch": 910} {"train_loss": -5.613029479980469, "global_step": 38224, "epoch": 910} {"train_loss": -5.686470985412598, "global_step": 38225, "epoch": 910} {"train_loss": -5.616446495056152, "global_step": 38226, "epoch": 910} {"train_loss": -5.65081787109375, "global_step": 38227, "epoch": 910} {"train_loss": -5.518884658813477, "global_step": 38228, "epoch": 910} {"train_loss": -5.553452491760254, "global_step": 38229, "epoch": 910} {"train_loss": -5.708542823791504, "global_step": 38230, "epoch": 910} {"train_loss": -5.551725387573242, "global_step": 38231, "epoch": 910} {"train_loss": -5.413829326629639, "global_step": 38232, "epoch": 910} {"train_loss": -5.7227091789245605, "global_step": 38233, "epoch": 910} {"train_loss": -5.704710960388184, "global_step": 38234, "epoch": 910} {"train_loss": -5.598082065582275, "global_step": 38235, "epoch": 910} {"train_loss": -5.614020347595215, "global_step": 38236, "epoch": 910} {"train_loss": -5.576653480529785, "global_step": 38237, "epoch": 910} {"train_loss": -5.505407333374023, "global_step": 38238, "epoch": 910} {"train_loss": -5.628635883331299, "global_step": 38239, "epoch": 910} {"train_loss": -5.668430328369141, "global_step": 38240, "epoch": 910} {"train_loss": -5.744786739349365, "global_step": 38241, "epoch": 910} {"train_loss": -5.593338966369629, "global_step": 38242, "epoch": 910} {"train_loss": -5.645723342895508, "global_step": 38243, "epoch": 910} {"train_loss": -5.558102130889893, "global_step": 38244, "epoch": 910} {"train_loss": -5.667935371398926, "global_step": 38245, "epoch": 910} {"train_loss": -5.637950897216797, "global_step": 38246, "epoch": 910} {"train_loss": -5.538926601409912, "global_step": 38247, "epoch": 910} {"train_loss": -5.692566871643066, "global_step": 38248, "epoch": 910} {"train_loss": -5.667171478271484, "global_step": 38249, "epoch": 910} {"train_loss": -5.731345176696777, "global_step": 38250, "epoch": 910} {"train_loss": -5.629137992858887, "global_step": 38251, "epoch": 910} {"train_loss": -5.609230041503906, "global_step": 38252, "epoch": 910} {"train_loss": -5.593930244445801, "global_step": 38253, "epoch": 910} {"train_loss": -5.524846076965332, "global_step": 38254, "epoch": 910} {"train_loss": -5.578324317932129, "global_step": 38255, "epoch": 910} {"train_loss": -5.639167785644531, "global_step": 38256, "epoch": 910} {"train_loss": -5.659214019775391, "global_step": 38257, "epoch": 910} {"train_loss": -5.582550525665283, "global_step": 38258, "epoch": 910} {"train_loss": -5.580069065093994, "global_step": 38259, "epoch": 910} {"train_loss": -5.608502388000488, "global_step": 38260, "epoch": 910} {"train_loss": -5.611115898404803, "global_step": 38261, "epoch": 910, "val_loss": 61727.99609375} {"train_loss": -5.779938220977783, "global_step": 38262, "epoch": 911} {"train_loss": -5.6278228759765625, "global_step": 38263, "epoch": 911} {"train_loss": -5.714573860168457, "global_step": 38264, "epoch": 911} {"train_loss": -5.672223091125488, "global_step": 38265, "epoch": 911} {"train_loss": -5.601565837860107, "global_step": 38266, "epoch": 911} {"train_loss": -5.649471759796143, "global_step": 38267, "epoch": 911} {"train_loss": -5.608704566955566, "global_step": 38268, "epoch": 911} {"train_loss": -5.738614082336426, "global_step": 38269, "epoch": 911} {"train_loss": -5.568108081817627, "global_step": 38270, "epoch": 911} {"train_loss": -5.54439115524292, "global_step": 38271, "epoch": 911} {"train_loss": -5.673816680908203, "global_step": 38272, "epoch": 911} {"train_loss": -5.622713088989258, "global_step": 38273, "epoch": 911} {"train_loss": -5.691702365875244, "global_step": 38274, "epoch": 911} {"train_loss": -5.603259086608887, "global_step": 38275, "epoch": 911} {"train_loss": -5.690346717834473, "global_step": 38276, "epoch": 911} {"train_loss": -5.660222053527832, "global_step": 38277, "epoch": 911} {"train_loss": -5.647475242614746, "global_step": 38278, "epoch": 911} {"train_loss": -5.639925003051758, "global_step": 38279, "epoch": 911} {"train_loss": -5.604689121246338, "global_step": 38280, "epoch": 911} {"train_loss": -5.683293342590332, "global_step": 38281, "epoch": 911} {"train_loss": -5.5522308349609375, "global_step": 38282, "epoch": 911} {"train_loss": -5.61436653137207, "global_step": 38283, "epoch": 911} {"train_loss": -5.644101142883301, "global_step": 38284, "epoch": 911} {"train_loss": -5.628055572509766, "global_step": 38285, "epoch": 911} {"train_loss": -5.615346431732178, "global_step": 38286, "epoch": 911} {"train_loss": -5.500653266906738, "global_step": 38287, "epoch": 911} {"train_loss": -5.617025375366211, "global_step": 38288, "epoch": 911} {"train_loss": -5.619357109069824, "global_step": 38289, "epoch": 911} {"train_loss": -5.647356033325195, "global_step": 38290, "epoch": 911} {"train_loss": -5.646914005279541, "global_step": 38291, "epoch": 911} {"train_loss": -5.624266147613525, "global_step": 38292, "epoch": 911} {"train_loss": -5.610574722290039, "global_step": 38293, "epoch": 911} {"train_loss": -5.568297863006592, "global_step": 38294, "epoch": 911} {"train_loss": -5.730123519897461, "global_step": 38295, "epoch": 911} {"train_loss": -5.694116592407227, "global_step": 38296, "epoch": 911} {"train_loss": -5.730820655822754, "global_step": 38297, "epoch": 911} {"train_loss": -5.693234443664551, "global_step": 38298, "epoch": 911} {"train_loss": -5.678759574890137, "global_step": 38299, "epoch": 911} {"train_loss": -5.4560370445251465, "global_step": 38300, "epoch": 911} {"train_loss": -5.67784309387207, "global_step": 38301, "epoch": 911} {"train_loss": -5.710094451904297, "global_step": 38302, "epoch": 911} {"train_loss": -5.636123078210013, "global_step": 38303, "epoch": 911, "val_loss": 62011.17578125} {"train_loss": -5.647639274597168, "global_step": 38304, "epoch": 912} {"train_loss": -5.658742427825928, "global_step": 38305, "epoch": 912} {"train_loss": -5.713264465332031, "global_step": 38306, "epoch": 912} {"train_loss": -5.654340744018555, "global_step": 38307, "epoch": 912} {"train_loss": -5.4943928718566895, "global_step": 38308, "epoch": 912} {"train_loss": -5.543531894683838, "global_step": 38309, "epoch": 912} {"train_loss": -5.72357177734375, "global_step": 38310, "epoch": 912} {"train_loss": -5.640013694763184, "global_step": 38311, "epoch": 912} {"train_loss": -5.476865768432617, "global_step": 38312, "epoch": 912} {"train_loss": -5.587363243103027, "global_step": 38313, "epoch": 912} {"train_loss": -5.487198829650879, "global_step": 38314, "epoch": 912} {"train_loss": -5.538330554962158, "global_step": 38315, "epoch": 912} {"train_loss": -5.4766035079956055, "global_step": 38316, "epoch": 912} {"train_loss": -5.675998210906982, "global_step": 38317, "epoch": 912} {"train_loss": -5.511183738708496, "global_step": 38318, "epoch": 912} {"train_loss": -5.531486511230469, "global_step": 38319, "epoch": 912} {"train_loss": -5.565674781799316, "global_step": 38320, "epoch": 912} {"train_loss": -5.605227470397949, "global_step": 38321, "epoch": 912} {"train_loss": -5.546002388000488, "global_step": 38322, "epoch": 912} {"train_loss": -5.630487442016602, "global_step": 38323, "epoch": 912} {"train_loss": -5.554814338684082, "global_step": 38324, "epoch": 912} {"train_loss": -5.571724891662598, "global_step": 38325, "epoch": 912} {"train_loss": -5.719753742218018, "global_step": 38326, "epoch": 912} {"train_loss": -5.545853614807129, "global_step": 38327, "epoch": 912} {"train_loss": -5.599492073059082, "global_step": 38328, "epoch": 912} {"train_loss": -5.625529766082764, "global_step": 38329, "epoch": 912} {"train_loss": -5.5828375816345215, "global_step": 38330, "epoch": 912} {"train_loss": -5.697387218475342, "global_step": 38331, "epoch": 912} {"train_loss": -5.623905658721924, "global_step": 38332, "epoch": 912} {"train_loss": -5.551985263824463, "global_step": 38333, "epoch": 912} {"train_loss": -5.742218494415283, "global_step": 38334, "epoch": 912} {"train_loss": -5.500229358673096, "global_step": 38335, "epoch": 912} {"train_loss": -5.677414894104004, "global_step": 38336, "epoch": 912} {"train_loss": -5.786785125732422, "global_step": 38337, "epoch": 912} {"train_loss": -5.56934928894043, "global_step": 38338, "epoch": 912} {"train_loss": -5.6173200607299805, "global_step": 38339, "epoch": 912} {"train_loss": -5.619096755981445, "global_step": 38340, "epoch": 912} {"train_loss": -5.496464729309082, "global_step": 38341, "epoch": 912} {"train_loss": -5.542336463928223, "global_step": 38342, "epoch": 912} {"train_loss": -5.595786094665527, "global_step": 38343, "epoch": 912} {"train_loss": -5.567420959472656, "global_step": 38344, "epoch": 912} {"train_loss": -5.59630655107044, "global_step": 38345, "epoch": 912, "val_loss": 61861.72265625} {"train_loss": -5.7135009765625, "global_step": 38346, "epoch": 913} {"train_loss": -5.59152364730835, "global_step": 38347, "epoch": 913} {"train_loss": -5.676279544830322, "global_step": 38348, "epoch": 913} {"train_loss": -5.613081455230713, "global_step": 38349, "epoch": 913} {"train_loss": -5.700582504272461, "global_step": 38350, "epoch": 913} {"train_loss": -5.625064849853516, "global_step": 38351, "epoch": 913} {"train_loss": -5.539704322814941, "global_step": 38352, "epoch": 913} {"train_loss": -5.584615230560303, "global_step": 38353, "epoch": 913} {"train_loss": -5.534219741821289, "global_step": 38354, "epoch": 913} {"train_loss": -5.577256679534912, "global_step": 38355, "epoch": 913} {"train_loss": -5.546897888183594, "global_step": 38356, "epoch": 913} {"train_loss": -5.51371955871582, "global_step": 38357, "epoch": 913} {"train_loss": -5.642865180969238, "global_step": 38358, "epoch": 913} {"train_loss": -5.713922023773193, "global_step": 38359, "epoch": 913} {"train_loss": -5.47022819519043, "global_step": 38360, "epoch": 913} {"train_loss": -5.636714935302734, "global_step": 38361, "epoch": 913} {"train_loss": -5.582748889923096, "global_step": 38362, "epoch": 913} {"train_loss": -5.656788349151611, "global_step": 38363, "epoch": 913} {"train_loss": -5.593622207641602, "global_step": 38364, "epoch": 913} {"train_loss": -5.655010223388672, "global_step": 38365, "epoch": 913} {"train_loss": -5.502737998962402, "global_step": 38366, "epoch": 913} {"train_loss": -5.635152339935303, "global_step": 38367, "epoch": 913} {"train_loss": -5.6758623123168945, "global_step": 38368, "epoch": 913} {"train_loss": -5.720115661621094, "global_step": 38369, "epoch": 913} {"train_loss": -5.623440742492676, "global_step": 38370, "epoch": 913} {"train_loss": -5.515956401824951, "global_step": 38371, "epoch": 913} {"train_loss": -5.633963584899902, "global_step": 38372, "epoch": 913} {"train_loss": -5.598880290985107, "global_step": 38373, "epoch": 913} {"train_loss": -5.625005722045898, "global_step": 38374, "epoch": 913} {"train_loss": -5.646749973297119, "global_step": 38375, "epoch": 913} {"train_loss": -5.624406814575195, "global_step": 38376, "epoch": 913} {"train_loss": -5.572295665740967, "global_step": 38377, "epoch": 913} {"train_loss": -5.6982574462890625, "global_step": 38378, "epoch": 913} {"train_loss": -5.654229164123535, "global_step": 38379, "epoch": 913} {"train_loss": -5.492053031921387, "global_step": 38380, "epoch": 913} {"train_loss": -5.59345817565918, "global_step": 38381, "epoch": 913} {"train_loss": -5.566657543182373, "global_step": 38382, "epoch": 913} {"train_loss": -5.67564582824707, "global_step": 38383, "epoch": 913} {"train_loss": -5.6090240478515625, "global_step": 38384, "epoch": 913} {"train_loss": -5.6986284255981445, "global_step": 38385, "epoch": 913} {"train_loss": -5.665637969970703, "global_step": 38386, "epoch": 913} {"train_loss": -5.61471962928772, "global_step": 38387, "epoch": 913, "val_loss": 62327.83984375} {"train_loss": -5.696662902832031, "global_step": 38388, "epoch": 914} {"train_loss": -5.630033493041992, "global_step": 38389, "epoch": 914} {"train_loss": -5.542076110839844, "global_step": 38390, "epoch": 914} {"train_loss": -5.601589202880859, "global_step": 38391, "epoch": 914} {"train_loss": -5.67764949798584, "global_step": 38392, "epoch": 914} {"train_loss": -5.59574556350708, "global_step": 38393, "epoch": 914} {"train_loss": -5.614583969116211, "global_step": 38394, "epoch": 914} {"train_loss": -5.609168529510498, "global_step": 38395, "epoch": 914} {"train_loss": -5.488771438598633, "global_step": 38396, "epoch": 914} {"train_loss": -5.456294059753418, "global_step": 38397, "epoch": 914} {"train_loss": -5.527294635772705, "global_step": 38398, "epoch": 914} {"train_loss": -5.541565895080566, "global_step": 38399, "epoch": 914} {"train_loss": -5.635555267333984, "global_step": 38400, "epoch": 914} {"train_loss": -5.585535526275635, "global_step": 38401, "epoch": 914} {"train_loss": -5.67091178894043, "global_step": 38402, "epoch": 914} {"train_loss": -5.63824987411499, "global_step": 38403, "epoch": 914} {"train_loss": -5.525681495666504, "global_step": 38404, "epoch": 914} {"train_loss": -5.661356449127197, "global_step": 38405, "epoch": 914} {"train_loss": -5.5598039627075195, "global_step": 38406, "epoch": 914} {"train_loss": -5.545567512512207, "global_step": 38407, "epoch": 914} {"train_loss": -5.627542495727539, "global_step": 38408, "epoch": 914} {"train_loss": -5.622320175170898, "global_step": 38409, "epoch": 914} {"train_loss": -5.649533748626709, "global_step": 38410, "epoch": 914} {"train_loss": -5.4647650718688965, "global_step": 38411, "epoch": 914} {"train_loss": -5.604104995727539, "global_step": 38412, "epoch": 914} {"train_loss": -5.590426445007324, "global_step": 38413, "epoch": 914} {"train_loss": -5.525417327880859, "global_step": 38414, "epoch": 914} {"train_loss": -5.63320255279541, "global_step": 38415, "epoch": 914} {"train_loss": -5.668214797973633, "global_step": 38416, "epoch": 914} {"train_loss": -5.674860000610352, "global_step": 38417, "epoch": 914} {"train_loss": -5.470190525054932, "global_step": 38418, "epoch": 914} {"train_loss": -5.6549882888793945, "global_step": 38419, "epoch": 914} {"train_loss": -5.564863681793213, "global_step": 38420, "epoch": 914} {"train_loss": -5.546721458435059, "global_step": 38421, "epoch": 914} {"train_loss": -5.669039726257324, "global_step": 38422, "epoch": 914} {"train_loss": -5.649317741394043, "global_step": 38423, "epoch": 914} {"train_loss": -5.537738800048828, "global_step": 38424, "epoch": 914} {"train_loss": -5.483834743499756, "global_step": 38425, "epoch": 914} {"train_loss": -5.689375400543213, "global_step": 38426, "epoch": 914} {"train_loss": -5.541103363037109, "global_step": 38427, "epoch": 914} {"train_loss": -5.477100849151611, "global_step": 38428, "epoch": 914} {"train_loss": -5.58885459672837, "global_step": 38429, "epoch": 914, "val_loss": 62525.5} {"train_loss": -5.575723171234131, "global_step": 38430, "epoch": 915} {"train_loss": -5.5229082107543945, "global_step": 38431, "epoch": 915} {"train_loss": -5.508485794067383, "global_step": 38432, "epoch": 915} {"train_loss": -5.516603469848633, "global_step": 38433, "epoch": 915} {"train_loss": -5.702652454376221, "global_step": 38434, "epoch": 915} {"train_loss": -5.541038513183594, "global_step": 38435, "epoch": 915} {"train_loss": -5.574319839477539, "global_step": 38436, "epoch": 915} {"train_loss": -5.669311046600342, "global_step": 38437, "epoch": 915} {"train_loss": -5.444003105163574, "global_step": 38438, "epoch": 915} {"train_loss": -5.664675712585449, "global_step": 38439, "epoch": 915} {"train_loss": -5.746726036071777, "global_step": 38440, "epoch": 915} {"train_loss": -5.558171272277832, "global_step": 38441, "epoch": 915} {"train_loss": -5.717629909515381, "global_step": 38442, "epoch": 915} {"train_loss": -5.613337993621826, "global_step": 38443, "epoch": 915} {"train_loss": -5.589089393615723, "global_step": 38444, "epoch": 915} {"train_loss": -5.5969648361206055, "global_step": 38445, "epoch": 915} {"train_loss": -5.704286575317383, "global_step": 38446, "epoch": 915} {"train_loss": -5.558557510375977, "global_step": 38447, "epoch": 915} {"train_loss": -5.686979293823242, "global_step": 38448, "epoch": 915} {"train_loss": -5.619450569152832, "global_step": 38449, "epoch": 915} {"train_loss": -5.53662109375, "global_step": 38450, "epoch": 915} {"train_loss": -5.680238723754883, "global_step": 38451, "epoch": 915} {"train_loss": -5.538496971130371, "global_step": 38452, "epoch": 915} {"train_loss": -5.6013593673706055, "global_step": 38453, "epoch": 915} {"train_loss": -5.539680004119873, "global_step": 38454, "epoch": 915} {"train_loss": -5.5500078201293945, "global_step": 38455, "epoch": 915} {"train_loss": -5.580038547515869, "global_step": 38456, "epoch": 915} {"train_loss": -5.553752899169922, "global_step": 38457, "epoch": 915} {"train_loss": -5.475865840911865, "global_step": 38458, "epoch": 915} {"train_loss": -5.598424911499023, "global_step": 38459, "epoch": 915} {"train_loss": -5.558821678161621, "global_step": 38460, "epoch": 915} {"train_loss": -5.4731245040893555, "global_step": 38461, "epoch": 915} {"train_loss": -5.756800651550293, "global_step": 38462, "epoch": 915} {"train_loss": -5.658799171447754, "global_step": 38463, "epoch": 915} {"train_loss": -5.677243232727051, "global_step": 38464, "epoch": 915} {"train_loss": -5.587506294250488, "global_step": 38465, "epoch": 915} {"train_loss": -5.756286144256592, "global_step": 38466, "epoch": 915} {"train_loss": -5.585607528686523, "global_step": 38467, "epoch": 915} {"train_loss": -5.539968013763428, "global_step": 38468, "epoch": 915} {"train_loss": -5.56150484085083, "global_step": 38469, "epoch": 915} {"train_loss": -5.557867050170898, "global_step": 38470, "epoch": 915} {"train_loss": -5.599922350474766, "global_step": 38471, "epoch": 915, "val_loss": 62152.00390625} {"train_loss": -5.674781322479248, "global_step": 38472, "epoch": 916} {"train_loss": -5.573009014129639, "global_step": 38473, "epoch": 916} {"train_loss": -5.645214080810547, "global_step": 38474, "epoch": 916} {"train_loss": -5.494494915008545, "global_step": 38475, "epoch": 916} {"train_loss": -5.600600719451904, "global_step": 38476, "epoch": 916} {"train_loss": -5.6666483879089355, "global_step": 38477, "epoch": 916} {"train_loss": -5.660976409912109, "global_step": 38478, "epoch": 916} {"train_loss": -5.490466117858887, "global_step": 38479, "epoch": 916} {"train_loss": -5.586475372314453, "global_step": 38480, "epoch": 916} {"train_loss": -5.661629676818848, "global_step": 38481, "epoch": 916} {"train_loss": -5.555617332458496, "global_step": 38482, "epoch": 916} {"train_loss": -5.5882978439331055, "global_step": 38483, "epoch": 916} {"train_loss": -5.715822219848633, "global_step": 38484, "epoch": 916} {"train_loss": -5.725358486175537, "global_step": 38485, "epoch": 916} {"train_loss": -5.5372748374938965, "global_step": 38486, "epoch": 916} {"train_loss": -5.56578254699707, "global_step": 38487, "epoch": 916} {"train_loss": -5.570306301116943, "global_step": 38488, "epoch": 916} {"train_loss": -5.63395881652832, "global_step": 38489, "epoch": 916} {"train_loss": -5.65563440322876, "global_step": 38490, "epoch": 916} {"train_loss": -5.525969505310059, "global_step": 38491, "epoch": 916} {"train_loss": -5.622617244720459, "global_step": 38492, "epoch": 916} {"train_loss": -5.467031478881836, "global_step": 38493, "epoch": 916} {"train_loss": -5.533688068389893, "global_step": 38494, "epoch": 916} {"train_loss": -5.641461372375488, "global_step": 38495, "epoch": 916} {"train_loss": -5.559089660644531, "global_step": 38496, "epoch": 916} {"train_loss": -5.497505187988281, "global_step": 38497, "epoch": 916} {"train_loss": -5.601083755493164, "global_step": 38498, "epoch": 916} {"train_loss": -5.581786155700684, "global_step": 38499, "epoch": 916} {"train_loss": -5.499087333679199, "global_step": 38500, "epoch": 916} {"train_loss": -5.589169502258301, "global_step": 38501, "epoch": 916} {"train_loss": -5.607278347015381, "global_step": 38502, "epoch": 916} {"train_loss": -5.569962501525879, "global_step": 38503, "epoch": 916} {"train_loss": -5.633798599243164, "global_step": 38504, "epoch": 916} {"train_loss": -5.642351150512695, "global_step": 38505, "epoch": 916} {"train_loss": -5.636483192443848, "global_step": 38506, "epoch": 916} {"train_loss": -5.570730686187744, "global_step": 38507, "epoch": 916} {"train_loss": -5.646665573120117, "global_step": 38508, "epoch": 916} {"train_loss": -5.647493362426758, "global_step": 38509, "epoch": 916} {"train_loss": -5.6842546463012695, "global_step": 38510, "epoch": 916} {"train_loss": -5.703341484069824, "global_step": 38511, "epoch": 916} {"train_loss": -5.607085227966309, "global_step": 38512, "epoch": 916} {"train_loss": -5.6012167022341774, "global_step": 38513, "epoch": 916, "val_loss": 62180.88671875} {"train_loss": -5.66267728805542, "global_step": 38514, "epoch": 917} {"train_loss": -5.663515567779541, "global_step": 38515, "epoch": 917} {"train_loss": -5.585691928863525, "global_step": 38516, "epoch": 917} {"train_loss": -5.5056939125061035, "global_step": 38517, "epoch": 917} {"train_loss": -5.600024700164795, "global_step": 38518, "epoch": 917} {"train_loss": -5.570931434631348, "global_step": 38519, "epoch": 917} {"train_loss": -5.578136444091797, "global_step": 38520, "epoch": 917} {"train_loss": -5.50644588470459, "global_step": 38521, "epoch": 917} {"train_loss": -5.571170806884766, "global_step": 38522, "epoch": 917} {"train_loss": -5.801877975463867, "global_step": 38523, "epoch": 917} {"train_loss": -5.744032859802246, "global_step": 38524, "epoch": 917} {"train_loss": -5.565310478210449, "global_step": 38525, "epoch": 917} {"train_loss": -5.647218227386475, "global_step": 38526, "epoch": 917} {"train_loss": -5.710624694824219, "global_step": 38527, "epoch": 917} {"train_loss": -5.570182800292969, "global_step": 38528, "epoch": 917} {"train_loss": -5.608577728271484, "global_step": 38529, "epoch": 917} {"train_loss": -5.6738739013671875, "global_step": 38530, "epoch": 917} {"train_loss": -5.690885543823242, "global_step": 38531, "epoch": 917} {"train_loss": -5.718014240264893, "global_step": 38532, "epoch": 917} {"train_loss": -5.529955863952637, "global_step": 38533, "epoch": 917} {"train_loss": -5.563645839691162, "global_step": 38534, "epoch": 917} {"train_loss": -5.651585102081299, "global_step": 38535, "epoch": 917} {"train_loss": -5.6825642585754395, "global_step": 38536, "epoch": 917} {"train_loss": -5.629431247711182, "global_step": 38537, "epoch": 917} {"train_loss": -5.615002632141113, "global_step": 38538, "epoch": 917} {"train_loss": -5.591629981994629, "global_step": 38539, "epoch": 917} {"train_loss": -5.676163196563721, "global_step": 38540, "epoch": 917} {"train_loss": -5.701531410217285, "global_step": 38541, "epoch": 917} {"train_loss": -5.557770729064941, "global_step": 38542, "epoch": 917} {"train_loss": -5.719684600830078, "global_step": 38543, "epoch": 917} {"train_loss": -5.515315055847168, "global_step": 38544, "epoch": 917} {"train_loss": -5.459684371948242, "global_step": 38545, "epoch": 917} {"train_loss": -5.594460964202881, "global_step": 38546, "epoch": 917} {"train_loss": -5.623022079467773, "global_step": 38547, "epoch": 917} {"train_loss": -5.644062519073486, "global_step": 38548, "epoch": 917} {"train_loss": -5.608914852142334, "global_step": 38549, "epoch": 917} {"train_loss": -5.627371788024902, "global_step": 38550, "epoch": 917} {"train_loss": -5.6118035316467285, "global_step": 38551, "epoch": 917} {"train_loss": -5.538812637329102, "global_step": 38552, "epoch": 917} {"train_loss": -5.5174946784973145, "global_step": 38553, "epoch": 917} {"train_loss": -5.533864974975586, "global_step": 38554, "epoch": 917} {"train_loss": -5.612267664500645, "global_step": 38555, "epoch": 917, "val_loss": 62035.3359375} {"train_loss": -5.64127779006958, "global_step": 38556, "epoch": 918} {"train_loss": -5.668935775756836, "global_step": 38557, "epoch": 918} {"train_loss": -5.618203163146973, "global_step": 38558, "epoch": 918} {"train_loss": -5.630908966064453, "global_step": 38559, "epoch": 918} {"train_loss": -5.6322126388549805, "global_step": 38560, "epoch": 918} {"train_loss": -5.536761283874512, "global_step": 38561, "epoch": 918} {"train_loss": -5.519935607910156, "global_step": 38562, "epoch": 918} {"train_loss": -5.583983421325684, "global_step": 38563, "epoch": 918} {"train_loss": -5.588348388671875, "global_step": 38564, "epoch": 918} {"train_loss": -5.574789047241211, "global_step": 38565, "epoch": 918} {"train_loss": -5.540579795837402, "global_step": 38566, "epoch": 918} {"train_loss": -5.57133674621582, "global_step": 38567, "epoch": 918} {"train_loss": -5.7337541580200195, "global_step": 38568, "epoch": 918} {"train_loss": -5.6775360107421875, "global_step": 38569, "epoch": 918} {"train_loss": -5.611894130706787, "global_step": 38570, "epoch": 918} {"train_loss": -5.740691184997559, "global_step": 38571, "epoch": 918} {"train_loss": -5.612789154052734, "global_step": 38572, "epoch": 918} {"train_loss": -5.568056106567383, "global_step": 38573, "epoch": 918} {"train_loss": -5.644211769104004, "global_step": 38574, "epoch": 918} {"train_loss": -5.627367973327637, "global_step": 38575, "epoch": 918} {"train_loss": -5.4635329246521, "global_step": 38576, "epoch": 918} {"train_loss": -5.552528381347656, "global_step": 38577, "epoch": 918} {"train_loss": -5.627107620239258, "global_step": 38578, "epoch": 918} {"train_loss": -5.625051498413086, "global_step": 38579, "epoch": 918} {"train_loss": -5.607211589813232, "global_step": 38580, "epoch": 918} {"train_loss": -5.590774059295654, "global_step": 38581, "epoch": 918} {"train_loss": -5.5019025802612305, "global_step": 38582, "epoch": 918} {"train_loss": -5.733438491821289, "global_step": 38583, "epoch": 918} {"train_loss": -5.7823991775512695, "global_step": 38584, "epoch": 918} {"train_loss": -5.536200046539307, "global_step": 38585, "epoch": 918} {"train_loss": -5.603246688842773, "global_step": 38586, "epoch": 918} {"train_loss": -5.629831314086914, "global_step": 38587, "epoch": 918} {"train_loss": -5.606690406799316, "global_step": 38588, "epoch": 918} {"train_loss": -5.7144060134887695, "global_step": 38589, "epoch": 918} {"train_loss": -5.737973690032959, "global_step": 38590, "epoch": 918} {"train_loss": -5.587761878967285, "global_step": 38591, "epoch": 918} {"train_loss": -5.54897403717041, "global_step": 38592, "epoch": 918} {"train_loss": -5.68361234664917, "global_step": 38593, "epoch": 918} {"train_loss": -5.619240760803223, "global_step": 38594, "epoch": 918} {"train_loss": -5.550868034362793, "global_step": 38595, "epoch": 918} {"train_loss": -5.5782060623168945, "global_step": 38596, "epoch": 918} {"train_loss": -5.614423479352679, "global_step": 38597, "epoch": 918, "val_loss": 62101.234375} {"train_loss": -5.633474349975586, "global_step": 38598, "epoch": 919} {"train_loss": -5.59446382522583, "global_step": 38599, "epoch": 919} {"train_loss": -5.5879740715026855, "global_step": 38600, "epoch": 919} {"train_loss": -5.712617874145508, "global_step": 38601, "epoch": 919} {"train_loss": -5.751848220825195, "global_step": 38602, "epoch": 919} {"train_loss": -5.595988750457764, "global_step": 38603, "epoch": 919} {"train_loss": -5.578272342681885, "global_step": 38604, "epoch": 919} {"train_loss": -5.61855411529541, "global_step": 38605, "epoch": 919} {"train_loss": -5.688015460968018, "global_step": 38606, "epoch": 919} {"train_loss": -5.670769214630127, "global_step": 38607, "epoch": 919} {"train_loss": -5.620078086853027, "global_step": 38608, "epoch": 919} {"train_loss": -5.5995025634765625, "global_step": 38609, "epoch": 919} {"train_loss": -5.552142143249512, "global_step": 38610, "epoch": 919} {"train_loss": -5.594722747802734, "global_step": 38611, "epoch": 919} {"train_loss": -5.664929389953613, "global_step": 38612, "epoch": 919} {"train_loss": -5.681422710418701, "global_step": 38613, "epoch": 919} {"train_loss": -5.696434020996094, "global_step": 38614, "epoch": 919} {"train_loss": -5.708654403686523, "global_step": 38615, "epoch": 919} {"train_loss": -5.738779067993164, "global_step": 38616, "epoch": 919} {"train_loss": -5.607404708862305, "global_step": 38617, "epoch": 919} {"train_loss": -5.639921188354492, "global_step": 38618, "epoch": 919} {"train_loss": -5.68035888671875, "global_step": 38619, "epoch": 919} {"train_loss": -5.599725246429443, "global_step": 38620, "epoch": 919} {"train_loss": -5.626440525054932, "global_step": 38621, "epoch": 919} {"train_loss": -5.52260160446167, "global_step": 38622, "epoch": 919} {"train_loss": -5.469433784484863, "global_step": 38623, "epoch": 919} {"train_loss": -5.557984352111816, "global_step": 38624, "epoch": 919} {"train_loss": -5.504340171813965, "global_step": 38625, "epoch": 919} {"train_loss": -5.261110305786133, "global_step": 38626, "epoch": 919} {"train_loss": -5.6021728515625, "global_step": 38627, "epoch": 919} {"train_loss": -5.319265365600586, "global_step": 38628, "epoch": 919} {"train_loss": -5.568421363830566, "global_step": 38629, "epoch": 919} {"train_loss": -5.423615455627441, "global_step": 38630, "epoch": 919} {"train_loss": -5.555541515350342, "global_step": 38631, "epoch": 919} {"train_loss": -5.523003578186035, "global_step": 38632, "epoch": 919} {"train_loss": -5.434301853179932, "global_step": 38633, "epoch": 919} {"train_loss": -5.546219825744629, "global_step": 38634, "epoch": 919} {"train_loss": -5.38758659362793, "global_step": 38635, "epoch": 919} {"train_loss": -5.522064208984375, "global_step": 38636, "epoch": 919} {"train_loss": -5.466141223907471, "global_step": 38637, "epoch": 919} {"train_loss": -5.480057716369629, "global_step": 38638, "epoch": 919} {"train_loss": -5.5748572917211625, "global_step": 38639, "epoch": 919, "val_loss": 62563.8125} {"train_loss": -5.435599327087402, "global_step": 38640, "epoch": 920} {"train_loss": -5.496292591094971, "global_step": 38641, "epoch": 920} {"train_loss": -5.5269365310668945, "global_step": 38642, "epoch": 920} {"train_loss": -5.5037431716918945, "global_step": 38643, "epoch": 920} {"train_loss": -5.445019721984863, "global_step": 38644, "epoch": 920} {"train_loss": -5.609745025634766, "global_step": 38645, "epoch": 920} {"train_loss": -5.530447959899902, "global_step": 38646, "epoch": 920} {"train_loss": -5.6026716232299805, "global_step": 38647, "epoch": 920} {"train_loss": -5.453038215637207, "global_step": 38648, "epoch": 920} {"train_loss": -5.661815166473389, "global_step": 38649, "epoch": 920} {"train_loss": -5.683399677276611, "global_step": 38650, "epoch": 920} {"train_loss": -5.7596282958984375, "global_step": 38651, "epoch": 920} {"train_loss": -5.521400451660156, "global_step": 38652, "epoch": 920} {"train_loss": -5.693563938140869, "global_step": 38653, "epoch": 920} {"train_loss": -5.570393085479736, "global_step": 38654, "epoch": 920} {"train_loss": -5.546233177185059, "global_step": 38655, "epoch": 920} {"train_loss": -5.616271495819092, "global_step": 38656, "epoch": 920} {"train_loss": -5.517755508422852, "global_step": 38657, "epoch": 920} {"train_loss": -5.5767741203308105, "global_step": 38658, "epoch": 920} {"train_loss": -5.587639808654785, "global_step": 38659, "epoch": 920} {"train_loss": -5.524208068847656, "global_step": 38660, "epoch": 920} {"train_loss": -5.687894344329834, "global_step": 38661, "epoch": 920} {"train_loss": -5.6112446784973145, "global_step": 38662, "epoch": 920} {"train_loss": -5.7998809814453125, "global_step": 38663, "epoch": 920} {"train_loss": -5.622613906860352, "global_step": 38664, "epoch": 920} {"train_loss": -5.698862075805664, "global_step": 38665, "epoch": 920} {"train_loss": -5.644824981689453, "global_step": 38666, "epoch": 920} {"train_loss": -5.6096343994140625, "global_step": 38667, "epoch": 920} {"train_loss": -5.717965602874756, "global_step": 38668, "epoch": 920} {"train_loss": -5.522649765014648, "global_step": 38669, "epoch": 920} {"train_loss": -5.593699932098389, "global_step": 38670, "epoch": 920} {"train_loss": -5.629627227783203, "global_step": 38671, "epoch": 920} {"train_loss": -5.590343475341797, "global_step": 38672, "epoch": 920} {"train_loss": -5.604350566864014, "global_step": 38673, "epoch": 920} {"train_loss": -5.625870704650879, "global_step": 38674, "epoch": 920} {"train_loss": -5.71613883972168, "global_step": 38675, "epoch": 920} {"train_loss": -5.568065643310547, "global_step": 38676, "epoch": 920} {"train_loss": -5.448450088500977, "global_step": 38677, "epoch": 920} {"train_loss": -5.604314804077148, "global_step": 38678, "epoch": 920} {"train_loss": -5.627103805541992, "global_step": 38679, "epoch": 920} {"train_loss": -5.703319549560547, "global_step": 38680, "epoch": 920} {"train_loss": -5.60041542280288, "global_step": 38681, "epoch": 920, "val_loss": 61821.62890625} {"train_loss": -5.64075231552124, "global_step": 38682, "epoch": 921} {"train_loss": -5.65032958984375, "global_step": 38683, "epoch": 921} {"train_loss": -5.8232269287109375, "global_step": 38684, "epoch": 921} {"train_loss": -5.557146072387695, "global_step": 38685, "epoch": 921} {"train_loss": -5.615682601928711, "global_step": 38686, "epoch": 921} {"train_loss": -5.635223865509033, "global_step": 38687, "epoch": 921} {"train_loss": -5.506575584411621, "global_step": 38688, "epoch": 921} {"train_loss": -5.673142433166504, "global_step": 38689, "epoch": 921} {"train_loss": -5.629212379455566, "global_step": 38690, "epoch": 921} {"train_loss": -5.60745906829834, "global_step": 38691, "epoch": 921} {"train_loss": -5.779322624206543, "global_step": 38692, "epoch": 921} {"train_loss": -5.700984954833984, "global_step": 38693, "epoch": 921} {"train_loss": -5.565800666809082, "global_step": 38694, "epoch": 921} {"train_loss": -5.6565937995910645, "global_step": 38695, "epoch": 921} {"train_loss": -5.641707420349121, "global_step": 38696, "epoch": 921} {"train_loss": -5.641442775726318, "global_step": 38697, "epoch": 921} {"train_loss": -5.5727434158325195, "global_step": 38698, "epoch": 921} {"train_loss": -5.611706733703613, "global_step": 38699, "epoch": 921} {"train_loss": -5.687441349029541, "global_step": 38700, "epoch": 921} {"train_loss": -5.68487548828125, "global_step": 38701, "epoch": 921} {"train_loss": -5.547717094421387, "global_step": 38702, "epoch": 921} {"train_loss": -5.453488826751709, "global_step": 38703, "epoch": 921} {"train_loss": -5.643594741821289, "global_step": 38704, "epoch": 921} {"train_loss": -5.639609336853027, "global_step": 38705, "epoch": 921} {"train_loss": -5.620123386383057, "global_step": 38706, "epoch": 921} {"train_loss": -5.5934858322143555, "global_step": 38707, "epoch": 921} {"train_loss": -5.756683349609375, "global_step": 38708, "epoch": 921} {"train_loss": -5.649240493774414, "global_step": 38709, "epoch": 921} {"train_loss": -5.569948673248291, "global_step": 38710, "epoch": 921} {"train_loss": -5.609318733215332, "global_step": 38711, "epoch": 921} {"train_loss": -5.667210578918457, "global_step": 38712, "epoch": 921} {"train_loss": -5.631967544555664, "global_step": 38713, "epoch": 921} {"train_loss": -5.7812957763671875, "global_step": 38714, "epoch": 921} {"train_loss": -5.603085517883301, "global_step": 38715, "epoch": 921} {"train_loss": -5.763187885284424, "global_step": 38716, "epoch": 921} {"train_loss": -5.555061340332031, "global_step": 38717, "epoch": 921} {"train_loss": -5.577751159667969, "global_step": 38718, "epoch": 921} {"train_loss": -5.645360469818115, "global_step": 38719, "epoch": 921} {"train_loss": -5.677524089813232, "global_step": 38720, "epoch": 921} {"train_loss": -5.529111385345459, "global_step": 38721, "epoch": 921} {"train_loss": -5.508857727050781, "global_step": 38722, "epoch": 921} {"train_loss": -5.632530019396827, "global_step": 38723, "epoch": 921, "val_loss": 61997.953125} {"train_loss": -5.467947006225586, "global_step": 38724, "epoch": 922} {"train_loss": -5.600597858428955, "global_step": 38725, "epoch": 922} {"train_loss": -5.710274696350098, "global_step": 38726, "epoch": 922} {"train_loss": -5.633512496948242, "global_step": 38727, "epoch": 922} {"train_loss": -5.550060272216797, "global_step": 38728, "epoch": 922} {"train_loss": -5.782083988189697, "global_step": 38729, "epoch": 922} {"train_loss": -5.69743537902832, "global_step": 38730, "epoch": 922} {"train_loss": -5.674848556518555, "global_step": 38731, "epoch": 922} {"train_loss": -5.567590713500977, "global_step": 38732, "epoch": 922} {"train_loss": -5.776644706726074, "global_step": 38733, "epoch": 922} {"train_loss": -5.740714073181152, "global_step": 38734, "epoch": 922} {"train_loss": -5.6293182373046875, "global_step": 38735, "epoch": 922} {"train_loss": -5.731548309326172, "global_step": 38736, "epoch": 922} {"train_loss": -5.768615245819092, "global_step": 38737, "epoch": 922} {"train_loss": -5.586910724639893, "global_step": 38738, "epoch": 922} {"train_loss": -5.665700435638428, "global_step": 38739, "epoch": 922} {"train_loss": -5.504765033721924, "global_step": 38740, "epoch": 922} {"train_loss": -5.6159210205078125, "global_step": 38741, "epoch": 922} {"train_loss": -5.596635818481445, "global_step": 38742, "epoch": 922} {"train_loss": -5.46311092376709, "global_step": 38743, "epoch": 922} {"train_loss": -5.726579666137695, "global_step": 38744, "epoch": 922} {"train_loss": -5.524410247802734, "global_step": 38745, "epoch": 922} {"train_loss": -5.664536476135254, "global_step": 38746, "epoch": 922} {"train_loss": -5.646994113922119, "global_step": 38747, "epoch": 922} {"train_loss": -5.51807975769043, "global_step": 38748, "epoch": 922} {"train_loss": -5.561199188232422, "global_step": 38749, "epoch": 922} {"train_loss": -5.641129016876221, "global_step": 38750, "epoch": 922} {"train_loss": -5.590397834777832, "global_step": 38751, "epoch": 922} {"train_loss": -5.672717571258545, "global_step": 38752, "epoch": 922} {"train_loss": -5.510671138763428, "global_step": 38753, "epoch": 922} {"train_loss": -5.757658004760742, "global_step": 38754, "epoch": 922} {"train_loss": -5.65986442565918, "global_step": 38755, "epoch": 922} {"train_loss": -5.509946823120117, "global_step": 38756, "epoch": 922} {"train_loss": -5.567328929901123, "global_step": 38757, "epoch": 922} {"train_loss": -5.62221097946167, "global_step": 38758, "epoch": 922} {"train_loss": -5.719092845916748, "global_step": 38759, "epoch": 922} {"train_loss": -5.455083847045898, "global_step": 38760, "epoch": 922} {"train_loss": -5.6071319580078125, "global_step": 38761, "epoch": 922} {"train_loss": -5.528194427490234, "global_step": 38762, "epoch": 922} {"train_loss": -5.667357444763184, "global_step": 38763, "epoch": 922} {"train_loss": -5.693028926849365, "global_step": 38764, "epoch": 922} {"train_loss": -5.6231997694287985, "global_step": 38765, "epoch": 922, "val_loss": 62054.734375} {"train_loss": -5.585644721984863, "global_step": 38766, "epoch": 923} {"train_loss": -5.560376167297363, "global_step": 38767, "epoch": 923} {"train_loss": -5.641724586486816, "global_step": 38768, "epoch": 923} {"train_loss": -5.624505043029785, "global_step": 38769, "epoch": 923} {"train_loss": -5.665558815002441, "global_step": 38770, "epoch": 923} {"train_loss": -5.71190071105957, "global_step": 38771, "epoch": 923} {"train_loss": -5.6929240226745605, "global_step": 38772, "epoch": 923} {"train_loss": -5.771859645843506, "global_step": 38773, "epoch": 923} {"train_loss": -5.5556535720825195, "global_step": 38774, "epoch": 923} {"train_loss": -5.611566543579102, "global_step": 38775, "epoch": 923} {"train_loss": -5.65087366104126, "global_step": 38776, "epoch": 923} {"train_loss": -5.516265869140625, "global_step": 38777, "epoch": 923} {"train_loss": -5.594531059265137, "global_step": 38778, "epoch": 923} {"train_loss": -5.678273677825928, "global_step": 38779, "epoch": 923} {"train_loss": -5.680545330047607, "global_step": 38780, "epoch": 923} {"train_loss": -5.549729824066162, "global_step": 38781, "epoch": 923} {"train_loss": -5.4929704666137695, "global_step": 38782, "epoch": 923} {"train_loss": -5.599933624267578, "global_step": 38783, "epoch": 923} {"train_loss": -5.488106727600098, "global_step": 38784, "epoch": 923} {"train_loss": -5.724696159362793, "global_step": 38785, "epoch": 923} {"train_loss": -5.657712459564209, "global_step": 38786, "epoch": 923} {"train_loss": -5.692844867706299, "global_step": 38787, "epoch": 923} {"train_loss": -5.6537346839904785, "global_step": 38788, "epoch": 923} {"train_loss": -5.675666809082031, "global_step": 38789, "epoch": 923} {"train_loss": -5.768003463745117, "global_step": 38790, "epoch": 923} {"train_loss": -5.526623725891113, "global_step": 38791, "epoch": 923} {"train_loss": -5.597731590270996, "global_step": 38792, "epoch": 923} {"train_loss": -5.636210918426514, "global_step": 38793, "epoch": 923} {"train_loss": -5.84512186050415, "global_step": 38794, "epoch": 923} {"train_loss": -5.5321760177612305, "global_step": 38795, "epoch": 923} {"train_loss": -5.6557512283325195, "global_step": 38796, "epoch": 923} {"train_loss": -5.696786880493164, "global_step": 38797, "epoch": 923} {"train_loss": -5.777275085449219, "global_step": 38798, "epoch": 923} {"train_loss": -5.745631217956543, "global_step": 38799, "epoch": 923} {"train_loss": -5.663069725036621, "global_step": 38800, "epoch": 923} {"train_loss": -5.581585884094238, "global_step": 38801, "epoch": 923} {"train_loss": -5.494355201721191, "global_step": 38802, "epoch": 923} {"train_loss": -5.618575096130371, "global_step": 38803, "epoch": 923} {"train_loss": -5.596007347106934, "global_step": 38804, "epoch": 923} {"train_loss": -5.505026340484619, "global_step": 38805, "epoch": 923} {"train_loss": -5.608951568603516, "global_step": 38806, "epoch": 923} {"train_loss": -5.630954435893467, "global_step": 38807, "epoch": 923, "val_loss": 62055.20703125} {"train_loss": -5.59826135635376, "global_step": 38808, "epoch": 924} {"train_loss": -5.598207950592041, "global_step": 38809, "epoch": 924} {"train_loss": -5.653860092163086, "global_step": 38810, "epoch": 924} {"train_loss": -5.696328163146973, "global_step": 38811, "epoch": 924} {"train_loss": -5.58621883392334, "global_step": 38812, "epoch": 924} {"train_loss": -5.61529541015625, "global_step": 38813, "epoch": 924} {"train_loss": -5.585604190826416, "global_step": 38814, "epoch": 924} {"train_loss": -5.499157905578613, "global_step": 38815, "epoch": 924} {"train_loss": -5.613025665283203, "global_step": 38816, "epoch": 924} {"train_loss": -5.720920562744141, "global_step": 38817, "epoch": 924} {"train_loss": -5.59379768371582, "global_step": 38818, "epoch": 924} {"train_loss": -5.5422563552856445, "global_step": 38819, "epoch": 924} {"train_loss": -5.568331241607666, "global_step": 38820, "epoch": 924} {"train_loss": -5.537671089172363, "global_step": 38821, "epoch": 924} {"train_loss": -5.634632110595703, "global_step": 38822, "epoch": 924} {"train_loss": -5.56559419631958, "global_step": 38823, "epoch": 924} {"train_loss": -5.539671421051025, "global_step": 38824, "epoch": 924} {"train_loss": -5.483067512512207, "global_step": 38825, "epoch": 924} {"train_loss": -5.581212997436523, "global_step": 38826, "epoch": 924} {"train_loss": -5.512362957000732, "global_step": 38827, "epoch": 924} {"train_loss": -5.540251731872559, "global_step": 38828, "epoch": 924} {"train_loss": -5.649223327636719, "global_step": 38829, "epoch": 924} {"train_loss": -5.500714302062988, "global_step": 38830, "epoch": 924} {"train_loss": -5.472318172454834, "global_step": 38831, "epoch": 924} {"train_loss": -5.594921588897705, "global_step": 38832, "epoch": 924} {"train_loss": -5.620142459869385, "global_step": 38833, "epoch": 924} {"train_loss": -5.661813735961914, "global_step": 38834, "epoch": 924} {"train_loss": -5.508254051208496, "global_step": 38835, "epoch": 924} {"train_loss": -5.602896213531494, "global_step": 38836, "epoch": 924} {"train_loss": -5.676814556121826, "global_step": 38837, "epoch": 924} {"train_loss": -5.68223762512207, "global_step": 38838, "epoch": 924} {"train_loss": -5.6010332107543945, "global_step": 38839, "epoch": 924} {"train_loss": -5.614504337310791, "global_step": 38840, "epoch": 924} {"train_loss": -5.6861443519592285, "global_step": 38841, "epoch": 924} {"train_loss": -5.727930068969727, "global_step": 38842, "epoch": 924} {"train_loss": -5.645782947540283, "global_step": 38843, "epoch": 924} {"train_loss": -5.576966285705566, "global_step": 38844, "epoch": 924} {"train_loss": -5.589862823486328, "global_step": 38845, "epoch": 924} {"train_loss": -5.636345863342285, "global_step": 38846, "epoch": 924} {"train_loss": -5.628386497497559, "global_step": 38847, "epoch": 924} {"train_loss": -5.80280065536499, "global_step": 38848, "epoch": 924} {"train_loss": -5.602162974221366, "global_step": 38849, "epoch": 924, "val_loss": 62080.51953125} {"train_loss": -5.685279846191406, "global_step": 38850, "epoch": 925} {"train_loss": -5.7079758644104, "global_step": 38851, "epoch": 925} {"train_loss": -5.562622547149658, "global_step": 38852, "epoch": 925} {"train_loss": -5.557644844055176, "global_step": 38853, "epoch": 925} {"train_loss": -5.629766464233398, "global_step": 38854, "epoch": 925} {"train_loss": -5.739285469055176, "global_step": 38855, "epoch": 925} {"train_loss": -5.561991214752197, "global_step": 38856, "epoch": 925} {"train_loss": -5.567941665649414, "global_step": 38857, "epoch": 925} {"train_loss": -5.607950210571289, "global_step": 38858, "epoch": 925} {"train_loss": -5.508045196533203, "global_step": 38859, "epoch": 925} {"train_loss": -5.614459991455078, "global_step": 38860, "epoch": 925} {"train_loss": -5.645598411560059, "global_step": 38861, "epoch": 925} {"train_loss": -5.552108287811279, "global_step": 38862, "epoch": 925} {"train_loss": -5.736659049987793, "global_step": 38863, "epoch": 925} {"train_loss": -5.6501617431640625, "global_step": 38864, "epoch": 925} {"train_loss": -5.4548749923706055, "global_step": 38865, "epoch": 925} {"train_loss": -5.618864059448242, "global_step": 38866, "epoch": 925} {"train_loss": -5.638705253601074, "global_step": 38867, "epoch": 925} {"train_loss": -5.439920425415039, "global_step": 38868, "epoch": 925} {"train_loss": -5.52799654006958, "global_step": 38869, "epoch": 925} {"train_loss": -5.681800842285156, "global_step": 38870, "epoch": 925} {"train_loss": -5.487300872802734, "global_step": 38871, "epoch": 925} {"train_loss": -5.586495876312256, "global_step": 38872, "epoch": 925} {"train_loss": -5.5799241065979, "global_step": 38873, "epoch": 925} {"train_loss": -5.655318260192871, "global_step": 38874, "epoch": 925} {"train_loss": -5.551455020904541, "global_step": 38875, "epoch": 925} {"train_loss": -5.43339729309082, "global_step": 38876, "epoch": 925} {"train_loss": -5.6530890464782715, "global_step": 38877, "epoch": 925} {"train_loss": -5.617213249206543, "global_step": 38878, "epoch": 925} {"train_loss": -5.543285369873047, "global_step": 38879, "epoch": 925} {"train_loss": -5.565868377685547, "global_step": 38880, "epoch": 925} {"train_loss": -5.5342817306518555, "global_step": 38881, "epoch": 925} {"train_loss": -5.673288822174072, "global_step": 38882, "epoch": 925} {"train_loss": -5.599545478820801, "global_step": 38883, "epoch": 925} {"train_loss": -5.532975196838379, "global_step": 38884, "epoch": 925} {"train_loss": -5.6579909324646, "global_step": 38885, "epoch": 925} {"train_loss": -5.449586391448975, "global_step": 38886, "epoch": 925} {"train_loss": -5.541927814483643, "global_step": 38887, "epoch": 925} {"train_loss": -5.703655242919922, "global_step": 38888, "epoch": 925} {"train_loss": -5.532581806182861, "global_step": 38889, "epoch": 925} {"train_loss": -5.570831298828125, "global_step": 38890, "epoch": 925} {"train_loss": -5.590500445592971, "global_step": 38891, "epoch": 925, "val_loss": 62231.32421875} {"train_loss": -5.531021595001221, "global_step": 38892, "epoch": 926} {"train_loss": -5.4893798828125, "global_step": 38893, "epoch": 926} {"train_loss": -5.672707557678223, "global_step": 38894, "epoch": 926} {"train_loss": -5.6536102294921875, "global_step": 38895, "epoch": 926} {"train_loss": -5.639931678771973, "global_step": 38896, "epoch": 926} {"train_loss": -5.574256420135498, "global_step": 38897, "epoch": 926} {"train_loss": -5.538470268249512, "global_step": 38898, "epoch": 926} {"train_loss": -5.654908657073975, "global_step": 38899, "epoch": 926} {"train_loss": -5.645040512084961, "global_step": 38900, "epoch": 926} {"train_loss": -5.61538028717041, "global_step": 38901, "epoch": 926} {"train_loss": -5.618714809417725, "global_step": 38902, "epoch": 926} {"train_loss": -5.682254791259766, "global_step": 38903, "epoch": 926} {"train_loss": -5.6637959480285645, "global_step": 38904, "epoch": 926} {"train_loss": -5.611795902252197, "global_step": 38905, "epoch": 926} {"train_loss": -5.589770317077637, "global_step": 38906, "epoch": 926} {"train_loss": -5.8355584144592285, "global_step": 38907, "epoch": 926} {"train_loss": -5.559226989746094, "global_step": 38908, "epoch": 926} {"train_loss": -5.542575836181641, "global_step": 38909, "epoch": 926} {"train_loss": -5.65633487701416, "global_step": 38910, "epoch": 926} {"train_loss": -5.67933464050293, "global_step": 38911, "epoch": 926} {"train_loss": -5.586592674255371, "global_step": 38912, "epoch": 926} {"train_loss": -5.497403144836426, "global_step": 38913, "epoch": 926} {"train_loss": -5.614325523376465, "global_step": 38914, "epoch": 926} {"train_loss": -5.587723731994629, "global_step": 38915, "epoch": 926} {"train_loss": -5.678750038146973, "global_step": 38916, "epoch": 926} {"train_loss": -5.534306526184082, "global_step": 38917, "epoch": 926} {"train_loss": -5.598301887512207, "global_step": 38918, "epoch": 926} {"train_loss": -5.537712097167969, "global_step": 38919, "epoch": 926} {"train_loss": -5.651930332183838, "global_step": 38920, "epoch": 926} {"train_loss": -5.592693328857422, "global_step": 38921, "epoch": 926} {"train_loss": -5.709260940551758, "global_step": 38922, "epoch": 926} {"train_loss": -5.736811637878418, "global_step": 38923, "epoch": 926} {"train_loss": -5.554586410522461, "global_step": 38924, "epoch": 926} {"train_loss": -5.5759968757629395, "global_step": 38925, "epoch": 926} {"train_loss": -5.579977035522461, "global_step": 38926, "epoch": 926} {"train_loss": -5.669470310211182, "global_step": 38927, "epoch": 926} {"train_loss": -5.613777160644531, "global_step": 38928, "epoch": 926} {"train_loss": -5.640071868896484, "global_step": 38929, "epoch": 926} {"train_loss": -5.604167938232422, "global_step": 38930, "epoch": 926} {"train_loss": -5.644795894622803, "global_step": 38931, "epoch": 926} {"train_loss": -5.582080841064453, "global_step": 38932, "epoch": 926} {"train_loss": -5.61817250932966, "global_step": 38933, "epoch": 926, "val_loss": 62230.6875} {"train_loss": -5.609038352966309, "global_step": 38934, "epoch": 927} {"train_loss": -5.580112457275391, "global_step": 38935, "epoch": 927} {"train_loss": -5.593652725219727, "global_step": 38936, "epoch": 927} {"train_loss": -5.650582790374756, "global_step": 38937, "epoch": 927} {"train_loss": -5.6712751388549805, "global_step": 38938, "epoch": 927} {"train_loss": -5.608999252319336, "global_step": 38939, "epoch": 927} {"train_loss": -5.639886856079102, "global_step": 38940, "epoch": 927} {"train_loss": -5.53624153137207, "global_step": 38941, "epoch": 927} {"train_loss": -5.694948196411133, "global_step": 38942, "epoch": 927} {"train_loss": -5.584901809692383, "global_step": 38943, "epoch": 927} {"train_loss": -5.648782730102539, "global_step": 38944, "epoch": 927} {"train_loss": -5.663671493530273, "global_step": 38945, "epoch": 927} {"train_loss": -5.572479248046875, "global_step": 38946, "epoch": 927} {"train_loss": -5.527212142944336, "global_step": 38947, "epoch": 927} {"train_loss": -5.551319599151611, "global_step": 38948, "epoch": 927} {"train_loss": -5.644680023193359, "global_step": 38949, "epoch": 927} {"train_loss": -5.6177659034729, "global_step": 38950, "epoch": 927} {"train_loss": -5.72587776184082, "global_step": 38951, "epoch": 927} {"train_loss": -5.594888687133789, "global_step": 38952, "epoch": 927} {"train_loss": -5.672170639038086, "global_step": 38953, "epoch": 927} {"train_loss": -5.685797214508057, "global_step": 38954, "epoch": 927} {"train_loss": -5.385518550872803, "global_step": 38955, "epoch": 927} {"train_loss": -5.691272258758545, "global_step": 38956, "epoch": 927} {"train_loss": -5.7063446044921875, "global_step": 38957, "epoch": 927} {"train_loss": -5.525370121002197, "global_step": 38958, "epoch": 927} {"train_loss": -5.626094818115234, "global_step": 38959, "epoch": 927} {"train_loss": -5.544017314910889, "global_step": 38960, "epoch": 927} {"train_loss": -5.698189735412598, "global_step": 38961, "epoch": 927} {"train_loss": -5.662605285644531, "global_step": 38962, "epoch": 927} {"train_loss": -5.62116813659668, "global_step": 38963, "epoch": 927} {"train_loss": -5.626004219055176, "global_step": 38964, "epoch": 927} {"train_loss": -5.621192932128906, "global_step": 38965, "epoch": 927} {"train_loss": -5.560578346252441, "global_step": 38966, "epoch": 927} {"train_loss": -5.552206993103027, "global_step": 38967, "epoch": 927} {"train_loss": -5.492184638977051, "global_step": 38968, "epoch": 927} {"train_loss": -5.653748512268066, "global_step": 38969, "epoch": 927} {"train_loss": -5.564191818237305, "global_step": 38970, "epoch": 927} {"train_loss": -5.645702362060547, "global_step": 38971, "epoch": 927} {"train_loss": -5.491632461547852, "global_step": 38972, "epoch": 927} {"train_loss": -5.708703994750977, "global_step": 38973, "epoch": 927} {"train_loss": -5.623782157897949, "global_step": 38974, "epoch": 927} {"train_loss": -5.614497139340355, "global_step": 38975, "epoch": 927, "val_loss": 61813.47265625} {"train_loss": -5.579104423522949, "global_step": 38976, "epoch": 928} {"train_loss": -5.5716962814331055, "global_step": 38977, "epoch": 928} {"train_loss": -5.687301158905029, "global_step": 38978, "epoch": 928} {"train_loss": -5.683165550231934, "global_step": 38979, "epoch": 928} {"train_loss": -5.686704635620117, "global_step": 38980, "epoch": 928} {"train_loss": -5.539020538330078, "global_step": 38981, "epoch": 928} {"train_loss": -5.705386161804199, "global_step": 38982, "epoch": 928} {"train_loss": -5.5377726554870605, "global_step": 38983, "epoch": 928} {"train_loss": -5.682683944702148, "global_step": 38984, "epoch": 928} {"train_loss": -5.633268356323242, "global_step": 38985, "epoch": 928} {"train_loss": -5.578207969665527, "global_step": 38986, "epoch": 928} {"train_loss": -5.610561370849609, "global_step": 38987, "epoch": 928} {"train_loss": -5.590432643890381, "global_step": 38988, "epoch": 928} {"train_loss": -5.701594352722168, "global_step": 38989, "epoch": 928} {"train_loss": -5.7154388427734375, "global_step": 38990, "epoch": 928} {"train_loss": -5.582482814788818, "global_step": 38991, "epoch": 928} {"train_loss": -5.615854263305664, "global_step": 38992, "epoch": 928} {"train_loss": -5.566753387451172, "global_step": 38993, "epoch": 928} {"train_loss": -5.71388053894043, "global_step": 38994, "epoch": 928} {"train_loss": -5.593671798706055, "global_step": 38995, "epoch": 928} {"train_loss": -5.5875654220581055, "global_step": 38996, "epoch": 928} {"train_loss": -5.602895736694336, "global_step": 38997, "epoch": 928} {"train_loss": -5.613216400146484, "global_step": 38998, "epoch": 928} {"train_loss": -5.57036018371582, "global_step": 38999, "epoch": 928} {"train_loss": -5.5742292404174805, "global_step": 39000, "epoch": 928} {"train_loss": -5.605670928955078, "global_step": 39001, "epoch": 928} {"train_loss": -5.465741157531738, "global_step": 39002, "epoch": 928} {"train_loss": -5.619277000427246, "global_step": 39003, "epoch": 928} {"train_loss": -5.482639789581299, "global_step": 39004, "epoch": 928} {"train_loss": -5.524740695953369, "global_step": 39005, "epoch": 928} {"train_loss": -5.57242488861084, "global_step": 39006, "epoch": 928} {"train_loss": -5.610546112060547, "global_step": 39007, "epoch": 928} {"train_loss": -5.688511848449707, "global_step": 39008, "epoch": 928} {"train_loss": -5.7365617752075195, "global_step": 39009, "epoch": 928} {"train_loss": -5.557954788208008, "global_step": 39010, "epoch": 928} {"train_loss": -5.633760452270508, "global_step": 39011, "epoch": 928} {"train_loss": -5.629482746124268, "global_step": 39012, "epoch": 928} {"train_loss": -5.657785415649414, "global_step": 39013, "epoch": 928} {"train_loss": -5.599387168884277, "global_step": 39014, "epoch": 928} {"train_loss": -5.671919822692871, "global_step": 39015, "epoch": 928} {"train_loss": -5.528604984283447, "global_step": 39016, "epoch": 928} {"train_loss": -5.615501551401048, "global_step": 39017, "epoch": 928, "val_loss": 61939.43359375} {"train_loss": -5.600688934326172, "global_step": 39018, "epoch": 929} {"train_loss": -5.666286468505859, "global_step": 39019, "epoch": 929} {"train_loss": -5.5522990226745605, "global_step": 39020, "epoch": 929} {"train_loss": -5.533939361572266, "global_step": 39021, "epoch": 929} {"train_loss": -5.712466239929199, "global_step": 39022, "epoch": 929} {"train_loss": -5.739089488983154, "global_step": 39023, "epoch": 929} {"train_loss": -5.690401554107666, "global_step": 39024, "epoch": 929} {"train_loss": -5.6525115966796875, "global_step": 39025, "epoch": 929} {"train_loss": -5.583280086517334, "global_step": 39026, "epoch": 929} {"train_loss": -5.6538286209106445, "global_step": 39027, "epoch": 929} {"train_loss": -5.613442420959473, "global_step": 39028, "epoch": 929} {"train_loss": -5.731484413146973, "global_step": 39029, "epoch": 929} {"train_loss": -5.71980094909668, "global_step": 39030, "epoch": 929} {"train_loss": -5.684783935546875, "global_step": 39031, "epoch": 929} {"train_loss": -5.663510322570801, "global_step": 39032, "epoch": 929} {"train_loss": -5.544971466064453, "global_step": 39033, "epoch": 929} {"train_loss": -5.65167236328125, "global_step": 39034, "epoch": 929} {"train_loss": -5.545909881591797, "global_step": 39035, "epoch": 929} {"train_loss": -5.704466819763184, "global_step": 39036, "epoch": 929} {"train_loss": -5.553822040557861, "global_step": 39037, "epoch": 929} {"train_loss": -5.5648651123046875, "global_step": 39038, "epoch": 929} {"train_loss": -5.586315631866455, "global_step": 39039, "epoch": 929} {"train_loss": -5.633126258850098, "global_step": 39040, "epoch": 929} {"train_loss": -5.631557941436768, "global_step": 39041, "epoch": 929} {"train_loss": -5.538075923919678, "global_step": 39042, "epoch": 929} {"train_loss": -5.639619827270508, "global_step": 39043, "epoch": 929} {"train_loss": -5.640931129455566, "global_step": 39044, "epoch": 929} {"train_loss": -5.5294904708862305, "global_step": 39045, "epoch": 929} {"train_loss": -5.607158184051514, "global_step": 39046, "epoch": 929} {"train_loss": -5.665580749511719, "global_step": 39047, "epoch": 929} {"train_loss": -5.536993980407715, "global_step": 39048, "epoch": 929} {"train_loss": -5.5534257888793945, "global_step": 39049, "epoch": 929} {"train_loss": -5.603719711303711, "global_step": 39050, "epoch": 929} {"train_loss": -5.594179630279541, "global_step": 39051, "epoch": 929} {"train_loss": -5.67659854888916, "global_step": 39052, "epoch": 929} {"train_loss": -5.555265426635742, "global_step": 39053, "epoch": 929} {"train_loss": -5.625722885131836, "global_step": 39054, "epoch": 929} {"train_loss": -5.617626667022705, "global_step": 39055, "epoch": 929} {"train_loss": -5.5549116134643555, "global_step": 39056, "epoch": 929} {"train_loss": -5.6295623779296875, "global_step": 39057, "epoch": 929} {"train_loss": -5.588047981262207, "global_step": 39058, "epoch": 929} {"train_loss": -5.618162756874447, "global_step": 39059, "epoch": 929, "val_loss": 61777.2734375} {"train_loss": -5.661550521850586, "global_step": 39060, "epoch": 930} {"train_loss": -5.58638334274292, "global_step": 39061, "epoch": 930} {"train_loss": -5.502403259277344, "global_step": 39062, "epoch": 930} {"train_loss": -5.596077919006348, "global_step": 39063, "epoch": 930} {"train_loss": -5.639797687530518, "global_step": 39064, "epoch": 930} {"train_loss": -5.72119140625, "global_step": 39065, "epoch": 930} {"train_loss": -5.757030010223389, "global_step": 39066, "epoch": 930} {"train_loss": -5.500336647033691, "global_step": 39067, "epoch": 930} {"train_loss": -5.576865196228027, "global_step": 39068, "epoch": 930} {"train_loss": -5.618238925933838, "global_step": 39069, "epoch": 930} {"train_loss": -5.549359321594238, "global_step": 39070, "epoch": 930} {"train_loss": -5.510372638702393, "global_step": 39071, "epoch": 930} {"train_loss": -5.612035274505615, "global_step": 39072, "epoch": 930} {"train_loss": -5.5516157150268555, "global_step": 39073, "epoch": 930} {"train_loss": -5.571369171142578, "global_step": 39074, "epoch": 930} {"train_loss": -5.533550262451172, "global_step": 39075, "epoch": 930} {"train_loss": -5.671143531799316, "global_step": 39076, "epoch": 930} {"train_loss": -5.69074821472168, "global_step": 39077, "epoch": 930} {"train_loss": -5.480855941772461, "global_step": 39078, "epoch": 930} {"train_loss": -5.636709690093994, "global_step": 39079, "epoch": 930} {"train_loss": -5.695093631744385, "global_step": 39080, "epoch": 930} {"train_loss": -5.575844764709473, "global_step": 39081, "epoch": 930} {"train_loss": -5.557498931884766, "global_step": 39082, "epoch": 930} {"train_loss": -5.6645612716674805, "global_step": 39083, "epoch": 930} {"train_loss": -5.6451416015625, "global_step": 39084, "epoch": 930} {"train_loss": -5.583944797515869, "global_step": 39085, "epoch": 930} {"train_loss": -5.67161750793457, "global_step": 39086, "epoch": 930} {"train_loss": -5.47475528717041, "global_step": 39087, "epoch": 930} {"train_loss": -5.618641376495361, "global_step": 39088, "epoch": 930} {"train_loss": -5.464438438415527, "global_step": 39089, "epoch": 930} {"train_loss": -5.510575771331787, "global_step": 39090, "epoch": 930} {"train_loss": -5.613849639892578, "global_step": 39091, "epoch": 930} {"train_loss": -5.553815841674805, "global_step": 39092, "epoch": 930} {"train_loss": -5.559657096862793, "global_step": 39093, "epoch": 930} {"train_loss": -5.531354904174805, "global_step": 39094, "epoch": 930} {"train_loss": -5.613617897033691, "global_step": 39095, "epoch": 930} {"train_loss": -5.660068511962891, "global_step": 39096, "epoch": 930} {"train_loss": -5.5436882972717285, "global_step": 39097, "epoch": 930} {"train_loss": -5.687562942504883, "global_step": 39098, "epoch": 930} {"train_loss": -5.423163414001465, "global_step": 39099, "epoch": 930} {"train_loss": -5.562094688415527, "global_step": 39100, "epoch": 930} {"train_loss": -5.588092395237514, "global_step": 39101, "epoch": 930, "val_loss": 62462.47265625} {"train_loss": -5.6773295402526855, "global_step": 39102, "epoch": 931} {"train_loss": -5.541501045227051, "global_step": 39103, "epoch": 931} {"train_loss": -5.61064338684082, "global_step": 39104, "epoch": 931} {"train_loss": -5.628852844238281, "global_step": 39105, "epoch": 931} {"train_loss": -5.512566089630127, "global_step": 39106, "epoch": 931} {"train_loss": -5.534759044647217, "global_step": 39107, "epoch": 931} {"train_loss": -5.5859761238098145, "global_step": 39108, "epoch": 931} {"train_loss": -5.526871204376221, "global_step": 39109, "epoch": 931} {"train_loss": -5.619873046875, "global_step": 39110, "epoch": 931} {"train_loss": -5.584532260894775, "global_step": 39111, "epoch": 931} {"train_loss": -5.519677639007568, "global_step": 39112, "epoch": 931} {"train_loss": -5.560487747192383, "global_step": 39113, "epoch": 931} {"train_loss": -5.545680046081543, "global_step": 39114, "epoch": 931} {"train_loss": -5.558952331542969, "global_step": 39115, "epoch": 931} {"train_loss": -5.692066192626953, "global_step": 39116, "epoch": 931} {"train_loss": -5.577112197875977, "global_step": 39117, "epoch": 931} {"train_loss": -5.73185920715332, "global_step": 39118, "epoch": 931} {"train_loss": -5.562171936035156, "global_step": 39119, "epoch": 931} {"train_loss": -5.578853130340576, "global_step": 39120, "epoch": 931} {"train_loss": -5.611828327178955, "global_step": 39121, "epoch": 931} {"train_loss": -5.501120567321777, "global_step": 39122, "epoch": 931} {"train_loss": -5.728475570678711, "global_step": 39123, "epoch": 931} {"train_loss": -5.57357120513916, "global_step": 39124, "epoch": 931} {"train_loss": -5.628552436828613, "global_step": 39125, "epoch": 931} {"train_loss": -5.539160251617432, "global_step": 39126, "epoch": 931} {"train_loss": -5.754806041717529, "global_step": 39127, "epoch": 931} {"train_loss": -5.630345821380615, "global_step": 39128, "epoch": 931} {"train_loss": -5.555595397949219, "global_step": 39129, "epoch": 931} {"train_loss": -5.6829705238342285, "global_step": 39130, "epoch": 931} {"train_loss": -5.619795799255371, "global_step": 39131, "epoch": 931} {"train_loss": -5.614252090454102, "global_step": 39132, "epoch": 931} {"train_loss": -5.403141021728516, "global_step": 39133, "epoch": 931} {"train_loss": -5.529424667358398, "global_step": 39134, "epoch": 931} {"train_loss": -5.54850959777832, "global_step": 39135, "epoch": 931} {"train_loss": -5.699626445770264, "global_step": 39136, "epoch": 931} {"train_loss": -5.6577372550964355, "global_step": 39137, "epoch": 931} {"train_loss": -5.512925624847412, "global_step": 39138, "epoch": 931} {"train_loss": -5.658790111541748, "global_step": 39139, "epoch": 931} {"train_loss": -5.628841400146484, "global_step": 39140, "epoch": 931} {"train_loss": -5.722645282745361, "global_step": 39141, "epoch": 931} {"train_loss": -5.6889519691467285, "global_step": 39142, "epoch": 931} {"train_loss": -5.601514010202317, "global_step": 39143, "epoch": 931, "val_loss": 61936.046875} {"train_loss": -5.588168621063232, "global_step": 39144, "epoch": 932} {"train_loss": -5.626025199890137, "global_step": 39145, "epoch": 932} {"train_loss": -5.61873197555542, "global_step": 39146, "epoch": 932} {"train_loss": -5.641525745391846, "global_step": 39147, "epoch": 932} {"train_loss": -5.730569362640381, "global_step": 39148, "epoch": 932} {"train_loss": -5.624885082244873, "global_step": 39149, "epoch": 932} {"train_loss": -5.687524795532227, "global_step": 39150, "epoch": 932} {"train_loss": -5.606435298919678, "global_step": 39151, "epoch": 932} {"train_loss": -5.548617362976074, "global_step": 39152, "epoch": 932} {"train_loss": -5.562423229217529, "global_step": 39153, "epoch": 932} {"train_loss": -5.597303867340088, "global_step": 39154, "epoch": 932} {"train_loss": -5.638433456420898, "global_step": 39155, "epoch": 932} {"train_loss": -5.420056343078613, "global_step": 39156, "epoch": 932} {"train_loss": -5.710199356079102, "global_step": 39157, "epoch": 932} {"train_loss": -5.745034694671631, "global_step": 39158, "epoch": 932} {"train_loss": -5.552115440368652, "global_step": 39159, "epoch": 932} {"train_loss": -5.7259674072265625, "global_step": 39160, "epoch": 932} {"train_loss": -5.59317684173584, "global_step": 39161, "epoch": 932} {"train_loss": -5.621264457702637, "global_step": 39162, "epoch": 932} {"train_loss": -5.628676414489746, "global_step": 39163, "epoch": 932} {"train_loss": -5.616819381713867, "global_step": 39164, "epoch": 932} {"train_loss": -5.605299949645996, "global_step": 39165, "epoch": 932} {"train_loss": -5.5686259269714355, "global_step": 39166, "epoch": 932} {"train_loss": -5.563790321350098, "global_step": 39167, "epoch": 932} {"train_loss": -5.548720359802246, "global_step": 39168, "epoch": 932} {"train_loss": -5.682731628417969, "global_step": 39169, "epoch": 932} {"train_loss": -5.659901142120361, "global_step": 39170, "epoch": 932} {"train_loss": -5.688096523284912, "global_step": 39171, "epoch": 932} {"train_loss": -5.700621604919434, "global_step": 39172, "epoch": 932} {"train_loss": -5.632214546203613, "global_step": 39173, "epoch": 932} {"train_loss": -5.71770715713501, "global_step": 39174, "epoch": 932} {"train_loss": -5.741144180297852, "global_step": 39175, "epoch": 932} {"train_loss": -5.579833984375, "global_step": 39176, "epoch": 932} {"train_loss": -5.543104648590088, "global_step": 39177, "epoch": 932} {"train_loss": -5.65766716003418, "global_step": 39178, "epoch": 932} {"train_loss": -5.649842262268066, "global_step": 39179, "epoch": 932} {"train_loss": -5.745511054992676, "global_step": 39180, "epoch": 932} {"train_loss": -5.755475997924805, "global_step": 39181, "epoch": 932} {"train_loss": -5.6801910400390625, "global_step": 39182, "epoch": 932} {"train_loss": -5.572351932525635, "global_step": 39183, "epoch": 932} {"train_loss": -5.669952392578125, "global_step": 39184, "epoch": 932} {"train_loss": -5.636703457151141, "global_step": 39185, "epoch": 932, "val_loss": 61928.40625} {"train_loss": -5.620114803314209, "global_step": 39186, "epoch": 933} {"train_loss": -5.590555191040039, "global_step": 39187, "epoch": 933} {"train_loss": -5.587759494781494, "global_step": 39188, "epoch": 933} {"train_loss": -5.511351585388184, "global_step": 39189, "epoch": 933} {"train_loss": -5.693397045135498, "global_step": 39190, "epoch": 933} {"train_loss": -5.631546974182129, "global_step": 39191, "epoch": 933} {"train_loss": -5.651808738708496, "global_step": 39192, "epoch": 933} {"train_loss": -5.636256217956543, "global_step": 39193, "epoch": 933} {"train_loss": -5.652953147888184, "global_step": 39194, "epoch": 933} {"train_loss": -5.651097774505615, "global_step": 39195, "epoch": 933} {"train_loss": -5.5281081199646, "global_step": 39196, "epoch": 933} {"train_loss": -5.662314414978027, "global_step": 39197, "epoch": 933} {"train_loss": -5.492022514343262, "global_step": 39198, "epoch": 933} {"train_loss": -5.658795356750488, "global_step": 39199, "epoch": 933} {"train_loss": -5.537053108215332, "global_step": 39200, "epoch": 933} {"train_loss": -5.5128607749938965, "global_step": 39201, "epoch": 933} {"train_loss": -5.500186443328857, "global_step": 39202, "epoch": 933} {"train_loss": -5.505520820617676, "global_step": 39203, "epoch": 933} {"train_loss": -5.47750186920166, "global_step": 39204, "epoch": 933} {"train_loss": -5.520928859710693, "global_step": 39205, "epoch": 933} {"train_loss": -5.653225898742676, "global_step": 39206, "epoch": 933} {"train_loss": -5.578577518463135, "global_step": 39207, "epoch": 933} {"train_loss": -5.64979362487793, "global_step": 39208, "epoch": 933} {"train_loss": -5.611582279205322, "global_step": 39209, "epoch": 933} {"train_loss": -5.727204322814941, "global_step": 39210, "epoch": 933} {"train_loss": -5.684360504150391, "global_step": 39211, "epoch": 933} {"train_loss": -5.498780250549316, "global_step": 39212, "epoch": 933} {"train_loss": -5.602473258972168, "global_step": 39213, "epoch": 933} {"train_loss": -5.711823463439941, "global_step": 39214, "epoch": 933} {"train_loss": -5.6144561767578125, "global_step": 39215, "epoch": 933} {"train_loss": -5.644750595092773, "global_step": 39216, "epoch": 933} {"train_loss": -5.547449111938477, "global_step": 39217, "epoch": 933} {"train_loss": -5.604283332824707, "global_step": 39218, "epoch": 933} {"train_loss": -5.656107425689697, "global_step": 39219, "epoch": 933} {"train_loss": -5.47266960144043, "global_step": 39220, "epoch": 933} {"train_loss": -5.485527038574219, "global_step": 39221, "epoch": 933} {"train_loss": -5.601946830749512, "global_step": 39222, "epoch": 933} {"train_loss": -5.515286445617676, "global_step": 39223, "epoch": 933} {"train_loss": -5.572854995727539, "global_step": 39224, "epoch": 933} {"train_loss": -5.543120384216309, "global_step": 39225, "epoch": 933} {"train_loss": -5.450764179229736, "global_step": 39226, "epoch": 933} {"train_loss": -5.583754096712385, "global_step": 39227, "epoch": 933, "val_loss": 62916.01953125} {"train_loss": -5.487976551055908, "global_step": 39228, "epoch": 934} {"train_loss": -5.637922286987305, "global_step": 39229, "epoch": 934} {"train_loss": -5.548067569732666, "global_step": 39230, "epoch": 934} {"train_loss": -5.762454986572266, "global_step": 39231, "epoch": 934} {"train_loss": -5.590908527374268, "global_step": 39232, "epoch": 934} {"train_loss": -5.5387091636657715, "global_step": 39233, "epoch": 934} {"train_loss": -5.479322910308838, "global_step": 39234, "epoch": 934} {"train_loss": -5.6089372634887695, "global_step": 39235, "epoch": 934} {"train_loss": -5.548811912536621, "global_step": 39236, "epoch": 934} {"train_loss": -5.705092430114746, "global_step": 39237, "epoch": 934} {"train_loss": -5.515710353851318, "global_step": 39238, "epoch": 934} {"train_loss": -5.705416679382324, "global_step": 39239, "epoch": 934} {"train_loss": -5.618714809417725, "global_step": 39240, "epoch": 934} {"train_loss": -5.546727180480957, "global_step": 39241, "epoch": 934} {"train_loss": -5.616373538970947, "global_step": 39242, "epoch": 934} {"train_loss": -5.639242172241211, "global_step": 39243, "epoch": 934} {"train_loss": -5.751862525939941, "global_step": 39244, "epoch": 934} {"train_loss": -5.665528297424316, "global_step": 39245, "epoch": 934} {"train_loss": -5.518133640289307, "global_step": 39246, "epoch": 934} {"train_loss": -5.582867622375488, "global_step": 39247, "epoch": 934} {"train_loss": -5.48983097076416, "global_step": 39248, "epoch": 934} {"train_loss": -5.388482093811035, "global_step": 39249, "epoch": 934} {"train_loss": -5.726860046386719, "global_step": 39250, "epoch": 934} {"train_loss": -5.59340763092041, "global_step": 39251, "epoch": 934} {"train_loss": -5.685708999633789, "global_step": 39252, "epoch": 934} {"train_loss": -5.485808849334717, "global_step": 39253, "epoch": 934} {"train_loss": -5.726940155029297, "global_step": 39254, "epoch": 934} {"train_loss": -5.561492919921875, "global_step": 39255, "epoch": 934} {"train_loss": -5.660067081451416, "global_step": 39256, "epoch": 934} {"train_loss": -5.719427108764648, "global_step": 39257, "epoch": 934} {"train_loss": -5.530158996582031, "global_step": 39258, "epoch": 934} {"train_loss": -5.721643447875977, "global_step": 39259, "epoch": 934} {"train_loss": -5.585999965667725, "global_step": 39260, "epoch": 934} {"train_loss": -5.624760150909424, "global_step": 39261, "epoch": 934} {"train_loss": -5.560109615325928, "global_step": 39262, "epoch": 934} {"train_loss": -5.656143665313721, "global_step": 39263, "epoch": 934} {"train_loss": -5.508518218994141, "global_step": 39264, "epoch": 934} {"train_loss": -5.692234039306641, "global_step": 39265, "epoch": 934} {"train_loss": -5.542999267578125, "global_step": 39266, "epoch": 934} {"train_loss": -5.420534133911133, "global_step": 39267, "epoch": 934} {"train_loss": -5.587152481079102, "global_step": 39268, "epoch": 934} {"train_loss": -5.599859782627651, "global_step": 39269, "epoch": 934, "val_loss": 61871.4296875} {"train_loss": -5.6664533615112305, "global_step": 39270, "epoch": 935} {"train_loss": -5.546506881713867, "global_step": 39271, "epoch": 935} {"train_loss": -5.5606279373168945, "global_step": 39272, "epoch": 935} {"train_loss": -5.68977689743042, "global_step": 39273, "epoch": 935} {"train_loss": -5.477482795715332, "global_step": 39274, "epoch": 935} {"train_loss": -5.534021377563477, "global_step": 39275, "epoch": 935} {"train_loss": -5.686872482299805, "global_step": 39276, "epoch": 935} {"train_loss": -5.650914192199707, "global_step": 39277, "epoch": 935} {"train_loss": -5.732950687408447, "global_step": 39278, "epoch": 935} {"train_loss": -5.512441635131836, "global_step": 39279, "epoch": 935} {"train_loss": -5.60410213470459, "global_step": 39280, "epoch": 935} {"train_loss": -5.717079162597656, "global_step": 39281, "epoch": 935} {"train_loss": -5.636160850524902, "global_step": 39282, "epoch": 935} {"train_loss": -5.522721290588379, "global_step": 39283, "epoch": 935} {"train_loss": -5.665542125701904, "global_step": 39284, "epoch": 935} {"train_loss": -5.790668487548828, "global_step": 39285, "epoch": 935} {"train_loss": -5.678954601287842, "global_step": 39286, "epoch": 935} {"train_loss": -5.726110458374023, "global_step": 39287, "epoch": 935} {"train_loss": -5.735724449157715, "global_step": 39288, "epoch": 935} {"train_loss": -5.719171524047852, "global_step": 39289, "epoch": 935} {"train_loss": -5.601772308349609, "global_step": 39290, "epoch": 935} {"train_loss": -5.5864410400390625, "global_step": 39291, "epoch": 935} {"train_loss": -5.4874348640441895, "global_step": 39292, "epoch": 935} {"train_loss": -5.622880935668945, "global_step": 39293, "epoch": 935} {"train_loss": -5.519268989562988, "global_step": 39294, "epoch": 935} {"train_loss": -5.611013412475586, "global_step": 39295, "epoch": 935} {"train_loss": -5.630517959594727, "global_step": 39296, "epoch": 935} {"train_loss": -5.566797256469727, "global_step": 39297, "epoch": 935} {"train_loss": -5.505583763122559, "global_step": 39298, "epoch": 935} {"train_loss": -5.535770416259766, "global_step": 39299, "epoch": 935} {"train_loss": -5.5114850997924805, "global_step": 39300, "epoch": 935} {"train_loss": -5.706624984741211, "global_step": 39301, "epoch": 935} {"train_loss": -5.5570149421691895, "global_step": 39302, "epoch": 935} {"train_loss": -5.632656097412109, "global_step": 39303, "epoch": 935} {"train_loss": -5.636130332946777, "global_step": 39304, "epoch": 935} {"train_loss": -5.617467880249023, "global_step": 39305, "epoch": 935} {"train_loss": -5.523867607116699, "global_step": 39306, "epoch": 935} {"train_loss": -5.773518085479736, "global_step": 39307, "epoch": 935} {"train_loss": -5.6290435791015625, "global_step": 39308, "epoch": 935} {"train_loss": -5.574040412902832, "global_step": 39309, "epoch": 935} {"train_loss": -5.616040229797363, "global_step": 39310, "epoch": 935} {"train_loss": -5.615838289260864, "global_step": 39311, "epoch": 935, "val_loss": 61879.0546875} {"train_loss": -5.45179557800293, "global_step": 39312, "epoch": 936} {"train_loss": -5.6420369148254395, "global_step": 39313, "epoch": 936} {"train_loss": -5.688460826873779, "global_step": 39314, "epoch": 936} {"train_loss": -5.6067585945129395, "global_step": 39315, "epoch": 936} {"train_loss": -5.525585174560547, "global_step": 39316, "epoch": 936} {"train_loss": -5.699206829071045, "global_step": 39317, "epoch": 936} {"train_loss": -5.826197147369385, "global_step": 39318, "epoch": 936} {"train_loss": -5.627713680267334, "global_step": 39319, "epoch": 936} {"train_loss": -5.690430641174316, "global_step": 39320, "epoch": 936} {"train_loss": -5.580955505371094, "global_step": 39321, "epoch": 936} {"train_loss": -5.661957263946533, "global_step": 39322, "epoch": 936} {"train_loss": -5.564156532287598, "global_step": 39323, "epoch": 936} {"train_loss": -5.71062707901001, "global_step": 39324, "epoch": 936} {"train_loss": -5.704437732696533, "global_step": 39325, "epoch": 936} {"train_loss": -5.633710861206055, "global_step": 39326, "epoch": 936} {"train_loss": -5.69611930847168, "global_step": 39327, "epoch": 936} {"train_loss": -5.587108612060547, "global_step": 39328, "epoch": 936} {"train_loss": -5.603097915649414, "global_step": 39329, "epoch": 936} {"train_loss": -5.635440826416016, "global_step": 39330, "epoch": 936} {"train_loss": -5.606417655944824, "global_step": 39331, "epoch": 936} {"train_loss": -5.623248100280762, "global_step": 39332, "epoch": 936} {"train_loss": -5.683507919311523, "global_step": 39333, "epoch": 936} {"train_loss": -5.641043663024902, "global_step": 39334, "epoch": 936} {"train_loss": -5.6705121994018555, "global_step": 39335, "epoch": 936} {"train_loss": -5.64374303817749, "global_step": 39336, "epoch": 936} {"train_loss": -5.571466445922852, "global_step": 39337, "epoch": 936} {"train_loss": -5.678038597106934, "global_step": 39338, "epoch": 936} {"train_loss": -5.5982346534729, "global_step": 39339, "epoch": 936} {"train_loss": -5.554004669189453, "global_step": 39340, "epoch": 936} {"train_loss": -5.659027576446533, "global_step": 39341, "epoch": 936} {"train_loss": -5.519220352172852, "global_step": 39342, "epoch": 936} {"train_loss": -5.514313697814941, "global_step": 39343, "epoch": 936} {"train_loss": -5.661717414855957, "global_step": 39344, "epoch": 936} {"train_loss": -5.6048407554626465, "global_step": 39345, "epoch": 936} {"train_loss": -5.577928066253662, "global_step": 39346, "epoch": 936} {"train_loss": -5.542959213256836, "global_step": 39347, "epoch": 936} {"train_loss": -5.4639716148376465, "global_step": 39348, "epoch": 936} {"train_loss": -5.50656795501709, "global_step": 39349, "epoch": 936} {"train_loss": -5.5792341232299805, "global_step": 39350, "epoch": 936} {"train_loss": -5.7196526527404785, "global_step": 39351, "epoch": 936} {"train_loss": -5.658227920532227, "global_step": 39352, "epoch": 936} {"train_loss": -5.622247786748977, "global_step": 39353, "epoch": 936, "val_loss": 62070.15625} {"train_loss": -5.556295394897461, "global_step": 39354, "epoch": 937} {"train_loss": -5.56278657913208, "global_step": 39355, "epoch": 937} {"train_loss": -5.65895938873291, "global_step": 39356, "epoch": 937} {"train_loss": -5.467222213745117, "global_step": 39357, "epoch": 937} {"train_loss": -5.647943496704102, "global_step": 39358, "epoch": 937} {"train_loss": -5.7138776779174805, "global_step": 39359, "epoch": 937} {"train_loss": -5.658870220184326, "global_step": 39360, "epoch": 937} {"train_loss": -5.568722248077393, "global_step": 39361, "epoch": 937} {"train_loss": -5.746786117553711, "global_step": 39362, "epoch": 937} {"train_loss": -5.589395046234131, "global_step": 39363, "epoch": 937} {"train_loss": -5.593011379241943, "global_step": 39364, "epoch": 937} {"train_loss": -5.632399559020996, "global_step": 39365, "epoch": 937} {"train_loss": -5.583207607269287, "global_step": 39366, "epoch": 937} {"train_loss": -5.60444974899292, "global_step": 39367, "epoch": 937} {"train_loss": -5.702455997467041, "global_step": 39368, "epoch": 937} {"train_loss": -5.5503950119018555, "global_step": 39369, "epoch": 937} {"train_loss": -5.572939872741699, "global_step": 39370, "epoch": 937} {"train_loss": -5.58809757232666, "global_step": 39371, "epoch": 937} {"train_loss": -5.567643165588379, "global_step": 39372, "epoch": 937} {"train_loss": -5.74397087097168, "global_step": 39373, "epoch": 937} {"train_loss": -5.6717424392700195, "global_step": 39374, "epoch": 937} {"train_loss": -5.564095497131348, "global_step": 39375, "epoch": 937} {"train_loss": -5.693142890930176, "global_step": 39376, "epoch": 937} {"train_loss": -5.569415092468262, "global_step": 39377, "epoch": 937} {"train_loss": -5.780562400817871, "global_step": 39378, "epoch": 937} {"train_loss": -5.687202453613281, "global_step": 39379, "epoch": 937} {"train_loss": -5.6247358322143555, "global_step": 39380, "epoch": 937} {"train_loss": -5.688617706298828, "global_step": 39381, "epoch": 937} {"train_loss": -5.707324981689453, "global_step": 39382, "epoch": 937} {"train_loss": -5.620730400085449, "global_step": 39383, "epoch": 937} {"train_loss": -5.640221118927002, "global_step": 39384, "epoch": 937} {"train_loss": -5.699079513549805, "global_step": 39385, "epoch": 937} {"train_loss": -5.486429214477539, "global_step": 39386, "epoch": 937} {"train_loss": -5.652954578399658, "global_step": 39387, "epoch": 937} {"train_loss": -5.697884559631348, "global_step": 39388, "epoch": 937} {"train_loss": -5.755492210388184, "global_step": 39389, "epoch": 937} {"train_loss": -5.545666694641113, "global_step": 39390, "epoch": 937} {"train_loss": -5.564847946166992, "global_step": 39391, "epoch": 937} {"train_loss": -5.658014297485352, "global_step": 39392, "epoch": 937} {"train_loss": -5.580937385559082, "global_step": 39393, "epoch": 937} {"train_loss": -5.548154830932617, "global_step": 39394, "epoch": 937} {"train_loss": -5.6284274487268355, "global_step": 39395, "epoch": 937, "val_loss": 62028.24609375} {"train_loss": -5.551129341125488, "global_step": 39396, "epoch": 938} {"train_loss": -5.457083702087402, "global_step": 39397, "epoch": 938} {"train_loss": -5.562827110290527, "global_step": 39398, "epoch": 938} {"train_loss": -5.5388593673706055, "global_step": 39399, "epoch": 938} {"train_loss": -5.509182929992676, "global_step": 39400, "epoch": 938} {"train_loss": -5.61600399017334, "global_step": 39401, "epoch": 938} {"train_loss": -5.564349174499512, "global_step": 39402, "epoch": 938} {"train_loss": -5.653098106384277, "global_step": 39403, "epoch": 938} {"train_loss": -5.585545063018799, "global_step": 39404, "epoch": 938} {"train_loss": -5.488195419311523, "global_step": 39405, "epoch": 938} {"train_loss": -5.629256725311279, "global_step": 39406, "epoch": 938} {"train_loss": -5.557497024536133, "global_step": 39407, "epoch": 938} {"train_loss": -5.600050926208496, "global_step": 39408, "epoch": 938} {"train_loss": -5.584567546844482, "global_step": 39409, "epoch": 938} {"train_loss": -5.350649356842041, "global_step": 39410, "epoch": 938} {"train_loss": -5.52202033996582, "global_step": 39411, "epoch": 938} {"train_loss": -5.526934623718262, "global_step": 39412, "epoch": 938} {"train_loss": -5.478392124176025, "global_step": 39413, "epoch": 938} {"train_loss": -5.61479377746582, "global_step": 39414, "epoch": 938} {"train_loss": -5.5454254150390625, "global_step": 39415, "epoch": 938} {"train_loss": -5.584193229675293, "global_step": 39416, "epoch": 938} {"train_loss": -5.688950538635254, "global_step": 39417, "epoch": 938} {"train_loss": -5.58377742767334, "global_step": 39418, "epoch": 938} {"train_loss": -5.629427909851074, "global_step": 39419, "epoch": 938} {"train_loss": -5.602487564086914, "global_step": 39420, "epoch": 938} {"train_loss": -5.774407386779785, "global_step": 39421, "epoch": 938} {"train_loss": -5.572384357452393, "global_step": 39422, "epoch": 938} {"train_loss": -5.759545803070068, "global_step": 39423, "epoch": 938} {"train_loss": -5.547789573669434, "global_step": 39424, "epoch": 938} {"train_loss": -5.544868469238281, "global_step": 39425, "epoch": 938} {"train_loss": -5.559823513031006, "global_step": 39426, "epoch": 938} {"train_loss": -5.562614440917969, "global_step": 39427, "epoch": 938} {"train_loss": -5.683479309082031, "global_step": 39428, "epoch": 938} {"train_loss": -5.646779537200928, "global_step": 39429, "epoch": 938} {"train_loss": -5.655068397521973, "global_step": 39430, "epoch": 938} {"train_loss": -5.775732040405273, "global_step": 39431, "epoch": 938} {"train_loss": -5.499396324157715, "global_step": 39432, "epoch": 938} {"train_loss": -5.751002788543701, "global_step": 39433, "epoch": 938} {"train_loss": -5.801765441894531, "global_step": 39434, "epoch": 938} {"train_loss": -5.570201873779297, "global_step": 39435, "epoch": 938} {"train_loss": -5.704442024230957, "global_step": 39436, "epoch": 938} {"train_loss": -5.5990013054439, "global_step": 39437, "epoch": 938, "val_loss": 62249.9140625} {"train_loss": -5.611050605773926, "global_step": 39438, "epoch": 939} {"train_loss": -5.516512870788574, "global_step": 39439, "epoch": 939} {"train_loss": -5.755380153656006, "global_step": 39440, "epoch": 939} {"train_loss": -5.508623123168945, "global_step": 39441, "epoch": 939} {"train_loss": -5.499917030334473, "global_step": 39442, "epoch": 939} {"train_loss": -5.561891555786133, "global_step": 39443, "epoch": 939} {"train_loss": -5.491325378417969, "global_step": 39444, "epoch": 939} {"train_loss": -5.548045635223389, "global_step": 39445, "epoch": 939} {"train_loss": -5.686429023742676, "global_step": 39446, "epoch": 939} {"train_loss": -5.45353889465332, "global_step": 39447, "epoch": 939} {"train_loss": -5.605591773986816, "global_step": 39448, "epoch": 939} {"train_loss": -5.465368747711182, "global_step": 39449, "epoch": 939} {"train_loss": -5.5986785888671875, "global_step": 39450, "epoch": 939} {"train_loss": -5.558316230773926, "global_step": 39451, "epoch": 939} {"train_loss": -5.759964466094971, "global_step": 39452, "epoch": 939} {"train_loss": -5.621496677398682, "global_step": 39453, "epoch": 939} {"train_loss": -5.557352542877197, "global_step": 39454, "epoch": 939} {"train_loss": -5.646162509918213, "global_step": 39455, "epoch": 939} {"train_loss": -5.580542087554932, "global_step": 39456, "epoch": 939} {"train_loss": -5.659874439239502, "global_step": 39457, "epoch": 939} {"train_loss": -5.6564836502075195, "global_step": 39458, "epoch": 939} {"train_loss": -5.627629280090332, "global_step": 39459, "epoch": 939} {"train_loss": -5.678381443023682, "global_step": 39460, "epoch": 939} {"train_loss": -5.653362274169922, "global_step": 39461, "epoch": 939} {"train_loss": -5.696227073669434, "global_step": 39462, "epoch": 939} {"train_loss": -5.574708938598633, "global_step": 39463, "epoch": 939} {"train_loss": -5.514134407043457, "global_step": 39464, "epoch": 939} {"train_loss": -5.624166011810303, "global_step": 39465, "epoch": 939} {"train_loss": -5.647241115570068, "global_step": 39466, "epoch": 939} {"train_loss": -5.6074628829956055, "global_step": 39467, "epoch": 939} {"train_loss": -5.506649971008301, "global_step": 39468, "epoch": 939} {"train_loss": -5.644588470458984, "global_step": 39469, "epoch": 939} {"train_loss": -5.652044296264648, "global_step": 39470, "epoch": 939} {"train_loss": -5.631360054016113, "global_step": 39471, "epoch": 939} {"train_loss": -5.605435848236084, "global_step": 39472, "epoch": 939} {"train_loss": -5.631911277770996, "global_step": 39473, "epoch": 939} {"train_loss": -5.572732448577881, "global_step": 39474, "epoch": 939} {"train_loss": -5.666587829589844, "global_step": 39475, "epoch": 939} {"train_loss": -5.689048767089844, "global_step": 39476, "epoch": 939} {"train_loss": -5.663442134857178, "global_step": 39477, "epoch": 939} {"train_loss": -5.707967281341553, "global_step": 39478, "epoch": 939} {"train_loss": -5.607324395860944, "global_step": 39479, "epoch": 939, "val_loss": 61960.73046875} {"train_loss": -5.693937301635742, "global_step": 39480, "epoch": 940} {"train_loss": -5.549768447875977, "global_step": 39481, "epoch": 940} {"train_loss": -5.688980579376221, "global_step": 39482, "epoch": 940} {"train_loss": -5.669466018676758, "global_step": 39483, "epoch": 940} {"train_loss": -5.760073661804199, "global_step": 39484, "epoch": 940} {"train_loss": -5.732924938201904, "global_step": 39485, "epoch": 940} {"train_loss": -5.689131259918213, "global_step": 39486, "epoch": 940} {"train_loss": -5.689697265625, "global_step": 39487, "epoch": 940} {"train_loss": -5.595344543457031, "global_step": 39488, "epoch": 940} {"train_loss": -5.69735050201416, "global_step": 39489, "epoch": 940} {"train_loss": -5.587973594665527, "global_step": 39490, "epoch": 940} {"train_loss": -5.673666954040527, "global_step": 39491, "epoch": 940} {"train_loss": -5.6555094718933105, "global_step": 39492, "epoch": 940} {"train_loss": -5.592154502868652, "global_step": 39493, "epoch": 940} {"train_loss": -5.588686943054199, "global_step": 39494, "epoch": 940} {"train_loss": -5.65692138671875, "global_step": 39495, "epoch": 940} {"train_loss": -5.578507423400879, "global_step": 39496, "epoch": 940} {"train_loss": -5.635809898376465, "global_step": 39497, "epoch": 940} {"train_loss": -5.574592113494873, "global_step": 39498, "epoch": 940} {"train_loss": -5.663860321044922, "global_step": 39499, "epoch": 940} {"train_loss": -5.662038803100586, "global_step": 39500, "epoch": 940} {"train_loss": -5.692774772644043, "global_step": 39501, "epoch": 940} {"train_loss": -5.599091053009033, "global_step": 39502, "epoch": 940} {"train_loss": -5.572887420654297, "global_step": 39503, "epoch": 940} {"train_loss": -5.630014419555664, "global_step": 39504, "epoch": 940} {"train_loss": -5.691269874572754, "global_step": 39505, "epoch": 940} {"train_loss": -5.655040740966797, "global_step": 39506, "epoch": 940} {"train_loss": -5.613438606262207, "global_step": 39507, "epoch": 940} {"train_loss": -5.728271484375, "global_step": 39508, "epoch": 940} {"train_loss": -5.654387474060059, "global_step": 39509, "epoch": 940} {"train_loss": -5.515719413757324, "global_step": 39510, "epoch": 940} {"train_loss": -5.60898494720459, "global_step": 39511, "epoch": 940} {"train_loss": -5.63570499420166, "global_step": 39512, "epoch": 940} {"train_loss": -5.646055221557617, "global_step": 39513, "epoch": 940} {"train_loss": -5.7144365310668945, "global_step": 39514, "epoch": 940} {"train_loss": -5.697286605834961, "global_step": 39515, "epoch": 940} {"train_loss": -5.602910041809082, "global_step": 39516, "epoch": 940} {"train_loss": -5.568659782409668, "global_step": 39517, "epoch": 940} {"train_loss": -5.641199111938477, "global_step": 39518, "epoch": 940} {"train_loss": -5.699533462524414, "global_step": 39519, "epoch": 940} {"train_loss": -5.687232971191406, "global_step": 39520, "epoch": 940} {"train_loss": -5.6447420460837225, "global_step": 39521, "epoch": 940, "val_loss": 61922.51953125} {"train_loss": -5.653539657592773, "global_step": 39522, "epoch": 941} {"train_loss": -5.774545669555664, "global_step": 39523, "epoch": 941} {"train_loss": -5.724152565002441, "global_step": 39524, "epoch": 941} {"train_loss": -5.620267868041992, "global_step": 39525, "epoch": 941} {"train_loss": -5.604460716247559, "global_step": 39526, "epoch": 941} {"train_loss": -5.508986473083496, "global_step": 39527, "epoch": 941} {"train_loss": -5.55320405960083, "global_step": 39528, "epoch": 941} {"train_loss": -5.598752975463867, "global_step": 39529, "epoch": 941} {"train_loss": -5.537412166595459, "global_step": 39530, "epoch": 941} {"train_loss": -5.556727886199951, "global_step": 39531, "epoch": 941} {"train_loss": -5.56151819229126, "global_step": 39532, "epoch": 941} {"train_loss": -5.572810649871826, "global_step": 39533, "epoch": 941} {"train_loss": -5.534628391265869, "global_step": 39534, "epoch": 941} {"train_loss": -5.569009780883789, "global_step": 39535, "epoch": 941} {"train_loss": -5.582653045654297, "global_step": 39536, "epoch": 941} {"train_loss": -5.606140613555908, "global_step": 39537, "epoch": 941} {"train_loss": -5.75786828994751, "global_step": 39538, "epoch": 941} {"train_loss": -5.647428512573242, "global_step": 39539, "epoch": 941} {"train_loss": -5.617298126220703, "global_step": 39540, "epoch": 941} {"train_loss": -5.635105133056641, "global_step": 39541, "epoch": 941} {"train_loss": -5.770559310913086, "global_step": 39542, "epoch": 941} {"train_loss": -5.674264907836914, "global_step": 39543, "epoch": 941} {"train_loss": -5.657257080078125, "global_step": 39544, "epoch": 941} {"train_loss": -5.585158824920654, "global_step": 39545, "epoch": 941} {"train_loss": -5.663897514343262, "global_step": 39546, "epoch": 941} {"train_loss": -5.736039161682129, "global_step": 39547, "epoch": 941} {"train_loss": -5.5574235916137695, "global_step": 39548, "epoch": 941} {"train_loss": -5.718019485473633, "global_step": 39549, "epoch": 941} {"train_loss": -5.687079906463623, "global_step": 39550, "epoch": 941} {"train_loss": -5.65135383605957, "global_step": 39551, "epoch": 941} {"train_loss": -5.632624626159668, "global_step": 39552, "epoch": 941} {"train_loss": -5.532088279724121, "global_step": 39553, "epoch": 941} {"train_loss": -5.656773567199707, "global_step": 39554, "epoch": 941} {"train_loss": -5.700981140136719, "global_step": 39555, "epoch": 941} {"train_loss": -5.627650260925293, "global_step": 39556, "epoch": 941} {"train_loss": -5.618583679199219, "global_step": 39557, "epoch": 941} {"train_loss": -5.60993766784668, "global_step": 39558, "epoch": 941} {"train_loss": -5.666465759277344, "global_step": 39559, "epoch": 941} {"train_loss": -5.740674018859863, "global_step": 39560, "epoch": 941} {"train_loss": -5.659304618835449, "global_step": 39561, "epoch": 941} {"train_loss": -5.654478073120117, "global_step": 39562, "epoch": 941} {"train_loss": -5.635404870623634, "global_step": 39563, "epoch": 941, "val_loss": 61778.66796875} {"train_loss": -5.6028947830200195, "global_step": 39564, "epoch": 942} {"train_loss": -5.612900733947754, "global_step": 39565, "epoch": 942} {"train_loss": -5.481235027313232, "global_step": 39566, "epoch": 942} {"train_loss": -5.692534446716309, "global_step": 39567, "epoch": 942} {"train_loss": -5.716223239898682, "global_step": 39568, "epoch": 942} {"train_loss": -5.529762268066406, "global_step": 39569, "epoch": 942} {"train_loss": -5.624200820922852, "global_step": 39570, "epoch": 942} {"train_loss": -5.667977333068848, "global_step": 39571, "epoch": 942} {"train_loss": -5.71649169921875, "global_step": 39572, "epoch": 942} {"train_loss": -5.600603103637695, "global_step": 39573, "epoch": 942} {"train_loss": -5.572723388671875, "global_step": 39574, "epoch": 942} {"train_loss": -5.637948989868164, "global_step": 39575, "epoch": 942} {"train_loss": -5.665004730224609, "global_step": 39576, "epoch": 942} {"train_loss": -5.778146743774414, "global_step": 39577, "epoch": 942} {"train_loss": -5.67764139175415, "global_step": 39578, "epoch": 942} {"train_loss": -5.592215538024902, "global_step": 39579, "epoch": 942} {"train_loss": -5.6090569496154785, "global_step": 39580, "epoch": 942} {"train_loss": -5.793316841125488, "global_step": 39581, "epoch": 942} {"train_loss": -5.572951316833496, "global_step": 39582, "epoch": 942} {"train_loss": -5.610369682312012, "global_step": 39583, "epoch": 942} {"train_loss": -5.775186538696289, "global_step": 39584, "epoch": 942} {"train_loss": -5.666143417358398, "global_step": 39585, "epoch": 942} {"train_loss": -5.646518707275391, "global_step": 39586, "epoch": 942} {"train_loss": -5.740159034729004, "global_step": 39587, "epoch": 942} {"train_loss": -5.587130546569824, "global_step": 39588, "epoch": 942} {"train_loss": -5.671368598937988, "global_step": 39589, "epoch": 942} {"train_loss": -5.528547286987305, "global_step": 39590, "epoch": 942} {"train_loss": -5.579836845397949, "global_step": 39591, "epoch": 942} {"train_loss": -5.570858001708984, "global_step": 39592, "epoch": 942} {"train_loss": -5.6197829246521, "global_step": 39593, "epoch": 942} {"train_loss": -5.549878120422363, "global_step": 39594, "epoch": 942} {"train_loss": -5.623977184295654, "global_step": 39595, "epoch": 942} {"train_loss": -5.576685905456543, "global_step": 39596, "epoch": 942} {"train_loss": -5.5403876304626465, "global_step": 39597, "epoch": 942} {"train_loss": -5.5960588455200195, "global_step": 39598, "epoch": 942} {"train_loss": -5.5223822593688965, "global_step": 39599, "epoch": 942} {"train_loss": -5.679173469543457, "global_step": 39600, "epoch": 942} {"train_loss": -5.561430931091309, "global_step": 39601, "epoch": 942} {"train_loss": -5.611146450042725, "global_step": 39602, "epoch": 942} {"train_loss": -5.61686372756958, "global_step": 39603, "epoch": 942} {"train_loss": -5.516916275024414, "global_step": 39604, "epoch": 942} {"train_loss": -5.6208786850883845, "global_step": 39605, "epoch": 942, "val_loss": 61820.9921875} {"train_loss": -5.691641807556152, "global_step": 39606, "epoch": 943} {"train_loss": -5.6558380126953125, "global_step": 39607, "epoch": 943} {"train_loss": -5.581408500671387, "global_step": 39608, "epoch": 943} {"train_loss": -5.529207229614258, "global_step": 39609, "epoch": 943} {"train_loss": -5.620439052581787, "global_step": 39610, "epoch": 943} {"train_loss": -5.625844955444336, "global_step": 39611, "epoch": 943} {"train_loss": -5.616562843322754, "global_step": 39612, "epoch": 943} {"train_loss": -5.642594337463379, "global_step": 39613, "epoch": 943} {"train_loss": -5.622661113739014, "global_step": 39614, "epoch": 943} {"train_loss": -5.766436576843262, "global_step": 39615, "epoch": 943} {"train_loss": -5.645638465881348, "global_step": 39616, "epoch": 943} {"train_loss": -5.619626045227051, "global_step": 39617, "epoch": 943} {"train_loss": -5.6052680015563965, "global_step": 39618, "epoch": 943} {"train_loss": -5.562953948974609, "global_step": 39619, "epoch": 943} {"train_loss": -5.653115272521973, "global_step": 39620, "epoch": 943} {"train_loss": -5.575331687927246, "global_step": 39621, "epoch": 943} {"train_loss": -5.47224235534668, "global_step": 39622, "epoch": 943} {"train_loss": -5.671536445617676, "global_step": 39623, "epoch": 943} {"train_loss": -5.688141345977783, "global_step": 39624, "epoch": 943} {"train_loss": -5.500473976135254, "global_step": 39625, "epoch": 943} {"train_loss": -5.679965019226074, "global_step": 39626, "epoch": 943} {"train_loss": -5.664154052734375, "global_step": 39627, "epoch": 943} {"train_loss": -5.402626037597656, "global_step": 39628, "epoch": 943} {"train_loss": -5.545114517211914, "global_step": 39629, "epoch": 943} {"train_loss": -5.517871856689453, "global_step": 39630, "epoch": 943} {"train_loss": -5.5437140464782715, "global_step": 39631, "epoch": 943} {"train_loss": -5.56235408782959, "global_step": 39632, "epoch": 943} {"train_loss": -5.5818305015563965, "global_step": 39633, "epoch": 943} {"train_loss": -5.630599021911621, "global_step": 39634, "epoch": 943} {"train_loss": -5.554723739624023, "global_step": 39635, "epoch": 943} {"train_loss": -5.6679816246032715, "global_step": 39636, "epoch": 943} {"train_loss": -5.575678825378418, "global_step": 39637, "epoch": 943} {"train_loss": -5.529833793640137, "global_step": 39638, "epoch": 943} {"train_loss": -5.6753034591674805, "global_step": 39639, "epoch": 943} {"train_loss": -5.543123245239258, "global_step": 39640, "epoch": 943} {"train_loss": -5.537346363067627, "global_step": 39641, "epoch": 943} {"train_loss": -5.519160270690918, "global_step": 39642, "epoch": 943} {"train_loss": -5.639235973358154, "global_step": 39643, "epoch": 943} {"train_loss": -5.74350643157959, "global_step": 39644, "epoch": 943} {"train_loss": -5.652411460876465, "global_step": 39645, "epoch": 943} {"train_loss": -5.6634111404418945, "global_step": 39646, "epoch": 943} {"train_loss": -5.603279215948922, "global_step": 39647, "epoch": 943, "val_loss": 61924.89453125} {"train_loss": -5.687168598175049, "global_step": 39648, "epoch": 944} {"train_loss": -5.555426597595215, "global_step": 39649, "epoch": 944} {"train_loss": -5.629890441894531, "global_step": 39650, "epoch": 944} {"train_loss": -5.65017032623291, "global_step": 39651, "epoch": 944} {"train_loss": -5.570684909820557, "global_step": 39652, "epoch": 944} {"train_loss": -5.691349029541016, "global_step": 39653, "epoch": 944} {"train_loss": -5.565448760986328, "global_step": 39654, "epoch": 944} {"train_loss": -5.524096488952637, "global_step": 39655, "epoch": 944} {"train_loss": -5.7309699058532715, "global_step": 39656, "epoch": 944} {"train_loss": -5.492161750793457, "global_step": 39657, "epoch": 944} {"train_loss": -5.664251327514648, "global_step": 39658, "epoch": 944} {"train_loss": -5.640655994415283, "global_step": 39659, "epoch": 944} {"train_loss": -5.700411319732666, "global_step": 39660, "epoch": 944} {"train_loss": -5.579211711883545, "global_step": 39661, "epoch": 944} {"train_loss": -5.772217750549316, "global_step": 39662, "epoch": 944} {"train_loss": -5.608354091644287, "global_step": 39663, "epoch": 944} {"train_loss": -5.6732587814331055, "global_step": 39664, "epoch": 944} {"train_loss": -5.583957672119141, "global_step": 39665, "epoch": 944} {"train_loss": -5.600773811340332, "global_step": 39666, "epoch": 944} {"train_loss": -5.586658477783203, "global_step": 39667, "epoch": 944} {"train_loss": -5.588894844055176, "global_step": 39668, "epoch": 944} {"train_loss": -5.648332595825195, "global_step": 39669, "epoch": 944} {"train_loss": -5.712546348571777, "global_step": 39670, "epoch": 944} {"train_loss": -5.6618547439575195, "global_step": 39671, "epoch": 944} {"train_loss": -5.549118995666504, "global_step": 39672, "epoch": 944} {"train_loss": -5.5751237869262695, "global_step": 39673, "epoch": 944} {"train_loss": -5.540008544921875, "global_step": 39674, "epoch": 944} {"train_loss": -5.72406005859375, "global_step": 39675, "epoch": 944} {"train_loss": -5.482843399047852, "global_step": 39676, "epoch": 944} {"train_loss": -5.7146806716918945, "global_step": 39677, "epoch": 944} {"train_loss": -5.6771063804626465, "global_step": 39678, "epoch": 944} {"train_loss": -5.702098369598389, "global_step": 39679, "epoch": 944} {"train_loss": -5.609419822692871, "global_step": 39680, "epoch": 944} {"train_loss": -5.733280181884766, "global_step": 39681, "epoch": 944} {"train_loss": -5.589259147644043, "global_step": 39682, "epoch": 944} {"train_loss": -5.69160795211792, "global_step": 39683, "epoch": 944} {"train_loss": -5.636171817779541, "global_step": 39684, "epoch": 944} {"train_loss": -5.694252967834473, "global_step": 39685, "epoch": 944} {"train_loss": -5.577406406402588, "global_step": 39686, "epoch": 944} {"train_loss": -5.755056381225586, "global_step": 39687, "epoch": 944} {"train_loss": -5.493963241577148, "global_step": 39688, "epoch": 944} {"train_loss": -5.630647897720337, "global_step": 39689, "epoch": 944, "val_loss": 62102.00390625} {"train_loss": -5.654919624328613, "global_step": 39690, "epoch": 945} {"train_loss": -5.616898536682129, "global_step": 39691, "epoch": 945} {"train_loss": -5.742323398590088, "global_step": 39692, "epoch": 945} {"train_loss": -5.637755393981934, "global_step": 39693, "epoch": 945} {"train_loss": -5.6568603515625, "global_step": 39694, "epoch": 945} {"train_loss": -5.576422214508057, "global_step": 39695, "epoch": 945} {"train_loss": -5.537080764770508, "global_step": 39696, "epoch": 945} {"train_loss": -5.623208999633789, "global_step": 39697, "epoch": 945} {"train_loss": -5.710672378540039, "global_step": 39698, "epoch": 945} {"train_loss": -5.623740196228027, "global_step": 39699, "epoch": 945} {"train_loss": -5.62272834777832, "global_step": 39700, "epoch": 945} {"train_loss": -5.650206089019775, "global_step": 39701, "epoch": 945} {"train_loss": -5.64864444732666, "global_step": 39702, "epoch": 945} {"train_loss": -5.612847805023193, "global_step": 39703, "epoch": 945} {"train_loss": -5.581050395965576, "global_step": 39704, "epoch": 945} {"train_loss": -5.517535209655762, "global_step": 39705, "epoch": 945} {"train_loss": -5.669645309448242, "global_step": 39706, "epoch": 945} {"train_loss": -5.563266754150391, "global_step": 39707, "epoch": 945} {"train_loss": -5.548009872436523, "global_step": 39708, "epoch": 945} {"train_loss": -5.598323822021484, "global_step": 39709, "epoch": 945} {"train_loss": -5.518947124481201, "global_step": 39710, "epoch": 945} {"train_loss": -5.670297622680664, "global_step": 39711, "epoch": 945} {"train_loss": -5.635805130004883, "global_step": 39712, "epoch": 945} {"train_loss": -5.597850322723389, "global_step": 39713, "epoch": 945} {"train_loss": -5.5732102394104, "global_step": 39714, "epoch": 945} {"train_loss": -5.646416187286377, "global_step": 39715, "epoch": 945} {"train_loss": -5.561934471130371, "global_step": 39716, "epoch": 945} {"train_loss": -5.530337333679199, "global_step": 39717, "epoch": 945} {"train_loss": -5.711312770843506, "global_step": 39718, "epoch": 945} {"train_loss": -5.553275108337402, "global_step": 39719, "epoch": 945} {"train_loss": -5.5532145500183105, "global_step": 39720, "epoch": 945} {"train_loss": -5.789839267730713, "global_step": 39721, "epoch": 945} {"train_loss": -5.52077054977417, "global_step": 39722, "epoch": 945} {"train_loss": -5.554540157318115, "global_step": 39723, "epoch": 945} {"train_loss": -5.568760871887207, "global_step": 39724, "epoch": 945} {"train_loss": -5.667641639709473, "global_step": 39725, "epoch": 945} {"train_loss": -5.501102447509766, "global_step": 39726, "epoch": 945} {"train_loss": -5.685123920440674, "global_step": 39727, "epoch": 945} {"train_loss": -5.725326061248779, "global_step": 39728, "epoch": 945} {"train_loss": -5.5590620040893555, "global_step": 39729, "epoch": 945} {"train_loss": -5.57619571685791, "global_step": 39730, "epoch": 945} {"train_loss": -5.6096184480757945, "global_step": 39731, "epoch": 945, "val_loss": 61600.06640625} {"train_loss": -5.656355857849121, "global_step": 39732, "epoch": 946} {"train_loss": -5.642212867736816, "global_step": 39733, "epoch": 946} {"train_loss": -5.695549964904785, "global_step": 39734, "epoch": 946} {"train_loss": -5.708712100982666, "global_step": 39735, "epoch": 946} {"train_loss": -5.625401020050049, "global_step": 39736, "epoch": 946} {"train_loss": -5.592809200286865, "global_step": 39737, "epoch": 946} {"train_loss": -5.561378479003906, "global_step": 39738, "epoch": 946} {"train_loss": -5.614529609680176, "global_step": 39739, "epoch": 946} {"train_loss": -5.585790634155273, "global_step": 39740, "epoch": 946} {"train_loss": -5.588799476623535, "global_step": 39741, "epoch": 946} {"train_loss": -5.724000930786133, "global_step": 39742, "epoch": 946} {"train_loss": -5.695154190063477, "global_step": 39743, "epoch": 946} {"train_loss": -5.549343109130859, "global_step": 39744, "epoch": 946} {"train_loss": -5.589040279388428, "global_step": 39745, "epoch": 946} {"train_loss": -5.599666595458984, "global_step": 39746, "epoch": 946} {"train_loss": -5.73429012298584, "global_step": 39747, "epoch": 946} {"train_loss": -5.600643157958984, "global_step": 39748, "epoch": 946} {"train_loss": -5.6591997146606445, "global_step": 39749, "epoch": 946} {"train_loss": -5.720502853393555, "global_step": 39750, "epoch": 946} {"train_loss": -5.628926753997803, "global_step": 39751, "epoch": 946} {"train_loss": -5.669857025146484, "global_step": 39752, "epoch": 946} {"train_loss": -5.500862121582031, "global_step": 39753, "epoch": 946} {"train_loss": -5.5925750732421875, "global_step": 39754, "epoch": 946} {"train_loss": -5.580502510070801, "global_step": 39755, "epoch": 946} {"train_loss": -5.585210800170898, "global_step": 39756, "epoch": 946} {"train_loss": -5.624964237213135, "global_step": 39757, "epoch": 946} {"train_loss": -5.610932350158691, "global_step": 39758, "epoch": 946} {"train_loss": -5.580924034118652, "global_step": 39759, "epoch": 946} {"train_loss": -5.635130405426025, "global_step": 39760, "epoch": 946} {"train_loss": -5.7692413330078125, "global_step": 39761, "epoch": 946} {"train_loss": -5.4928436279296875, "global_step": 39762, "epoch": 946} {"train_loss": -5.484551429748535, "global_step": 39763, "epoch": 946} {"train_loss": -5.643268585205078, "global_step": 39764, "epoch": 946} {"train_loss": -5.582431793212891, "global_step": 39765, "epoch": 946} {"train_loss": -5.456346035003662, "global_step": 39766, "epoch": 946} {"train_loss": -5.535346031188965, "global_step": 39767, "epoch": 946} {"train_loss": -5.597162246704102, "global_step": 39768, "epoch": 946} {"train_loss": -5.638863563537598, "global_step": 39769, "epoch": 946} {"train_loss": -5.632493019104004, "global_step": 39770, "epoch": 946} {"train_loss": -5.611579895019531, "global_step": 39771, "epoch": 946} {"train_loss": -5.4640607833862305, "global_step": 39772, "epoch": 946} {"train_loss": -5.61188116527739, "global_step": 39773, "epoch": 946, "val_loss": 62318.87890625} {"train_loss": -5.5419135093688965, "global_step": 39774, "epoch": 947} {"train_loss": -5.537113189697266, "global_step": 39775, "epoch": 947} {"train_loss": -5.548861503601074, "global_step": 39776, "epoch": 947} {"train_loss": -5.44772481918335, "global_step": 39777, "epoch": 947} {"train_loss": -5.522526741027832, "global_step": 39778, "epoch": 947} {"train_loss": -5.630672454833984, "global_step": 39779, "epoch": 947} {"train_loss": -5.625653266906738, "global_step": 39780, "epoch": 947} {"train_loss": -5.621604919433594, "global_step": 39781, "epoch": 947} {"train_loss": -5.632632732391357, "global_step": 39782, "epoch": 947} {"train_loss": -5.599330902099609, "global_step": 39783, "epoch": 947} {"train_loss": -5.725769996643066, "global_step": 39784, "epoch": 947} {"train_loss": -5.595816612243652, "global_step": 39785, "epoch": 947} {"train_loss": -5.705912113189697, "global_step": 39786, "epoch": 947} {"train_loss": -5.6194748878479, "global_step": 39787, "epoch": 947} {"train_loss": -5.475125312805176, "global_step": 39788, "epoch": 947} {"train_loss": -5.6535797119140625, "global_step": 39789, "epoch": 947} {"train_loss": -5.466482162475586, "global_step": 39790, "epoch": 947} {"train_loss": -5.707479000091553, "global_step": 39791, "epoch": 947} {"train_loss": -5.6444807052612305, "global_step": 39792, "epoch": 947} {"train_loss": -5.560647010803223, "global_step": 39793, "epoch": 947} {"train_loss": -5.613925933837891, "global_step": 39794, "epoch": 947} {"train_loss": -5.546294212341309, "global_step": 39795, "epoch": 947} {"train_loss": -5.594574928283691, "global_step": 39796, "epoch": 947} {"train_loss": -5.661882400512695, "global_step": 39797, "epoch": 947} {"train_loss": -5.549335479736328, "global_step": 39798, "epoch": 947} {"train_loss": -5.6180596351623535, "global_step": 39799, "epoch": 947} {"train_loss": -5.484006881713867, "global_step": 39800, "epoch": 947} {"train_loss": -5.6859660148620605, "global_step": 39801, "epoch": 947} {"train_loss": -5.487766265869141, "global_step": 39802, "epoch": 947} {"train_loss": -5.668874263763428, "global_step": 39803, "epoch": 947} {"train_loss": -5.590280532836914, "global_step": 39804, "epoch": 947} {"train_loss": -5.732622146606445, "global_step": 39805, "epoch": 947} {"train_loss": -5.613621234893799, "global_step": 39806, "epoch": 947} {"train_loss": -5.577756404876709, "global_step": 39807, "epoch": 947} {"train_loss": -5.638206481933594, "global_step": 39808, "epoch": 947} {"train_loss": -5.481189727783203, "global_step": 39809, "epoch": 947} {"train_loss": -5.644427299499512, "global_step": 39810, "epoch": 947} {"train_loss": -5.6216630935668945, "global_step": 39811, "epoch": 947} {"train_loss": -5.662140846252441, "global_step": 39812, "epoch": 947} {"train_loss": -5.55096435546875, "global_step": 39813, "epoch": 947} {"train_loss": -5.615859031677246, "global_step": 39814, "epoch": 947} {"train_loss": -5.599331412996564, "global_step": 39815, "epoch": 947, "val_loss": 62053.06640625} {"train_loss": -5.712900161743164, "global_step": 39816, "epoch": 948} {"train_loss": -5.637260437011719, "global_step": 39817, "epoch": 948} {"train_loss": -5.669753551483154, "global_step": 39818, "epoch": 948} {"train_loss": -5.613684177398682, "global_step": 39819, "epoch": 948} {"train_loss": -5.702126979827881, "global_step": 39820, "epoch": 948} {"train_loss": -5.732400894165039, "global_step": 39821, "epoch": 948} {"train_loss": -5.583475589752197, "global_step": 39822, "epoch": 948} {"train_loss": -5.633367538452148, "global_step": 39823, "epoch": 948} {"train_loss": -5.643268585205078, "global_step": 39824, "epoch": 948} {"train_loss": -5.523063659667969, "global_step": 39825, "epoch": 948} {"train_loss": -5.685417175292969, "global_step": 39826, "epoch": 948} {"train_loss": -5.706923961639404, "global_step": 39827, "epoch": 948} {"train_loss": -5.632294654846191, "global_step": 39828, "epoch": 948} {"train_loss": -5.764472961425781, "global_step": 39829, "epoch": 948} {"train_loss": -5.701091289520264, "global_step": 39830, "epoch": 948} {"train_loss": -5.56511116027832, "global_step": 39831, "epoch": 948} {"train_loss": -5.636305332183838, "global_step": 39832, "epoch": 948} {"train_loss": -5.624855041503906, "global_step": 39833, "epoch": 948} {"train_loss": -5.615011215209961, "global_step": 39834, "epoch": 948} {"train_loss": -5.508810043334961, "global_step": 39835, "epoch": 948} {"train_loss": -5.6394805908203125, "global_step": 39836, "epoch": 948} {"train_loss": -5.555870056152344, "global_step": 39837, "epoch": 948} {"train_loss": -5.637729644775391, "global_step": 39838, "epoch": 948} {"train_loss": -5.621860504150391, "global_step": 39839, "epoch": 948} {"train_loss": -5.5212907791137695, "global_step": 39840, "epoch": 948} {"train_loss": -5.4383134841918945, "global_step": 39841, "epoch": 948} {"train_loss": -5.434969902038574, "global_step": 39842, "epoch": 948} {"train_loss": -5.480432033538818, "global_step": 39843, "epoch": 948} {"train_loss": -5.605932235717773, "global_step": 39844, "epoch": 948} {"train_loss": -5.514719486236572, "global_step": 39845, "epoch": 948} {"train_loss": -5.6219801902771, "global_step": 39846, "epoch": 948} {"train_loss": -5.560630798339844, "global_step": 39847, "epoch": 948} {"train_loss": -5.515910625457764, "global_step": 39848, "epoch": 948} {"train_loss": -5.473148345947266, "global_step": 39849, "epoch": 948} {"train_loss": -5.7088541984558105, "global_step": 39850, "epoch": 948} {"train_loss": -5.705719470977783, "global_step": 39851, "epoch": 948} {"train_loss": -5.632555961608887, "global_step": 39852, "epoch": 948} {"train_loss": -5.659361839294434, "global_step": 39853, "epoch": 948} {"train_loss": -5.53342866897583, "global_step": 39854, "epoch": 948} {"train_loss": -5.621092796325684, "global_step": 39855, "epoch": 948} {"train_loss": -5.720372200012207, "global_step": 39856, "epoch": 948} {"train_loss": -5.6128580797286265, "global_step": 39857, "epoch": 948, "val_loss": 61749.07421875} {"train_loss": -5.743552207946777, "global_step": 39858, "epoch": 949} {"train_loss": -5.465294361114502, "global_step": 39859, "epoch": 949} {"train_loss": -5.550480842590332, "global_step": 39860, "epoch": 949} {"train_loss": -5.590129852294922, "global_step": 39861, "epoch": 949} {"train_loss": -5.493037223815918, "global_step": 39862, "epoch": 949} {"train_loss": -5.598845958709717, "global_step": 39863, "epoch": 949} {"train_loss": -5.768619537353516, "global_step": 39864, "epoch": 949} {"train_loss": -5.660562515258789, "global_step": 39865, "epoch": 949} {"train_loss": -5.754368782043457, "global_step": 39866, "epoch": 949} {"train_loss": -5.730430603027344, "global_step": 39867, "epoch": 949} {"train_loss": -5.556288242340088, "global_step": 39868, "epoch": 949} {"train_loss": -5.652286052703857, "global_step": 39869, "epoch": 949} {"train_loss": -5.722713470458984, "global_step": 39870, "epoch": 949} {"train_loss": -5.67405891418457, "global_step": 39871, "epoch": 949} {"train_loss": -5.646529197692871, "global_step": 39872, "epoch": 949} {"train_loss": -5.759427547454834, "global_step": 39873, "epoch": 949} {"train_loss": -5.667289733886719, "global_step": 39874, "epoch": 949} {"train_loss": -5.6033101081848145, "global_step": 39875, "epoch": 949} {"train_loss": -5.608567237854004, "global_step": 39876, "epoch": 949} {"train_loss": -5.684065341949463, "global_step": 39877, "epoch": 949} {"train_loss": -5.553435325622559, "global_step": 39878, "epoch": 949} {"train_loss": -5.513174057006836, "global_step": 39879, "epoch": 949} {"train_loss": -5.753573417663574, "global_step": 39880, "epoch": 949} {"train_loss": -5.523445129394531, "global_step": 39881, "epoch": 949} {"train_loss": -5.692312717437744, "global_step": 39882, "epoch": 949} {"train_loss": -5.681661128997803, "global_step": 39883, "epoch": 949} {"train_loss": -5.656274318695068, "global_step": 39884, "epoch": 949} {"train_loss": -5.744543075561523, "global_step": 39885, "epoch": 949} {"train_loss": -5.627940654754639, "global_step": 39886, "epoch": 949} {"train_loss": -5.567411422729492, "global_step": 39887, "epoch": 949} {"train_loss": -5.516279220581055, "global_step": 39888, "epoch": 949} {"train_loss": -5.611018657684326, "global_step": 39889, "epoch": 949} {"train_loss": -5.553094863891602, "global_step": 39890, "epoch": 949} {"train_loss": -5.64209508895874, "global_step": 39891, "epoch": 949} {"train_loss": -5.725881099700928, "global_step": 39892, "epoch": 949} {"train_loss": -5.6989288330078125, "global_step": 39893, "epoch": 949} {"train_loss": -5.713174819946289, "global_step": 39894, "epoch": 949} {"train_loss": -5.7228803634643555, "global_step": 39895, "epoch": 949} {"train_loss": -5.641349792480469, "global_step": 39896, "epoch": 949} {"train_loss": -5.705165386199951, "global_step": 39897, "epoch": 949} {"train_loss": -5.774796962738037, "global_step": 39898, "epoch": 949} {"train_loss": -5.648099660873413, "global_step": 39899, "epoch": 949, "val_loss": 61764.2265625} {"train_loss": -5.67238712310791, "global_step": 39900, "epoch": 950} {"train_loss": -5.732943534851074, "global_step": 39901, "epoch": 950} {"train_loss": -5.742063522338867, "global_step": 39902, "epoch": 950} {"train_loss": -5.587372779846191, "global_step": 39903, "epoch": 950} {"train_loss": -5.69648551940918, "global_step": 39904, "epoch": 950} {"train_loss": -5.891092777252197, "global_step": 39905, "epoch": 950} {"train_loss": -5.719062328338623, "global_step": 39906, "epoch": 950} {"train_loss": -5.665131568908691, "global_step": 39907, "epoch": 950} {"train_loss": -5.6038408279418945, "global_step": 39908, "epoch": 950} {"train_loss": -5.7052106857299805, "global_step": 39909, "epoch": 950} {"train_loss": -5.638002395629883, "global_step": 39910, "epoch": 950} {"train_loss": -5.596071720123291, "global_step": 39911, "epoch": 950} {"train_loss": -5.535955905914307, "global_step": 39912, "epoch": 950} {"train_loss": -5.630618095397949, "global_step": 39913, "epoch": 950} {"train_loss": -5.603022575378418, "global_step": 39914, "epoch": 950} {"train_loss": -5.478525161743164, "global_step": 39915, "epoch": 950} {"train_loss": -5.514551162719727, "global_step": 39916, "epoch": 950} {"train_loss": -5.678060054779053, "global_step": 39917, "epoch": 950} {"train_loss": -5.668108940124512, "global_step": 39918, "epoch": 950} {"train_loss": -5.699742794036865, "global_step": 39919, "epoch": 950} {"train_loss": -5.7711334228515625, "global_step": 39920, "epoch": 950} {"train_loss": -5.489398956298828, "global_step": 39921, "epoch": 950} {"train_loss": -5.679579734802246, "global_step": 39922, "epoch": 950} {"train_loss": -5.547983646392822, "global_step": 39923, "epoch": 950} {"train_loss": -5.622437953948975, "global_step": 39924, "epoch": 950} {"train_loss": -5.494585990905762, "global_step": 39925, "epoch": 950} {"train_loss": -5.569640159606934, "global_step": 39926, "epoch": 950} {"train_loss": -5.671785354614258, "global_step": 39927, "epoch": 950} {"train_loss": -5.546905517578125, "global_step": 39928, "epoch": 950} {"train_loss": -5.543478012084961, "global_step": 39929, "epoch": 950} {"train_loss": -5.588825225830078, "global_step": 39930, "epoch": 950} {"train_loss": -5.650015830993652, "global_step": 39931, "epoch": 950} {"train_loss": -5.563032150268555, "global_step": 39932, "epoch": 950} {"train_loss": -5.696965217590332, "global_step": 39933, "epoch": 950} {"train_loss": -5.670179843902588, "global_step": 39934, "epoch": 950} {"train_loss": -5.584997653961182, "global_step": 39935, "epoch": 950} {"train_loss": -5.645871639251709, "global_step": 39936, "epoch": 950} {"train_loss": -5.752805709838867, "global_step": 39937, "epoch": 950} {"train_loss": -5.714306831359863, "global_step": 39938, "epoch": 950} {"train_loss": -5.691936016082764, "global_step": 39939, "epoch": 950} {"train_loss": -5.577769756317139, "global_step": 39940, "epoch": 950} {"train_loss": -5.633672623407273, "global_step": 39941, "epoch": 950, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.16651351430131406, "train/sim_max_reward_2": 0.8452919133463725, "train/sim_max_reward_3": 0.21068682014661086, "train/sim_max_reward_4": 0.5797536203772691, "train/sim_max_reward_5": 0.5507338331551073, "test/sim_max_reward_4300000": 0.6218619429167233, "test/sim_max_reward_4300001": 0.2495319139801018, "test/sim_max_reward_4300002": 0.8552478362170165, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.2427652456223326, "test/sim_max_reward_4300005": 0.39153821664222155, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.20671853372702273, "test/sim_max_reward_4300008": 0.954615829051439, "test/sim_max_reward_4300009": 0.47330976425940835, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.27330675650238095, "test/sim_max_reward_4300012": 0.7877421138578953, "test/sim_max_reward_4300013": 0.8738568827098949, "test/sim_max_reward_4300014": 0.663111881493092, "test/sim_max_reward_4300015": 0.25540362236707215, "test/sim_max_reward_4300016": 0.3983976236039545, "test/sim_max_reward_4300017": 0.4432536098357256, "test/sim_max_reward_4300018": 0.30279058305052686, "test/sim_max_reward_4300019": 0.18617050504899404, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.7570724365382412, "test/sim_max_reward_4300022": 0.2845476971723737, "test/sim_max_reward_4300023": 0.38531619079744844, "test/sim_max_reward_4300024": 0.15263770977708568, "test/sim_max_reward_4300025": 0.13559709926761185, "test/sim_max_reward_4300026": 0.2222073250278588, "test/sim_max_reward_4300027": 0.10467558674810244, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.04893629033383653, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.10338754080585408, "test/sim_max_reward_4300032": 0.9586522089321119, "test/sim_max_reward_4300033": 0.9006480224961969, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.705094156115643, "test/sim_max_reward_4300038": 0.8001636887917785, "test/sim_max_reward_4300039": 0.439893077865472, "test/sim_max_reward_4300040": 0.35209815016660323, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7112474790485632, "test/sim_max_reward_4300043": 0.498409986814464, "test/sim_max_reward_4300044": 0.5241183882131157, "test/sim_max_reward_4300045": 0.1766813709545808, "test/sim_max_reward_4300046": 0.4958611064291045, "test/sim_max_reward_4300047": 0.10457380298568186, "test/sim_max_reward_4300048": 0.638312384700166, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.42387953298878767, "test/mean_score": 0.3775789735286235, "val_loss": 62192.16796875} {"train_loss": -5.645336627960205, "global_step": 39942, "epoch": 951} {"train_loss": -5.622523307800293, "global_step": 39943, "epoch": 951} {"train_loss": -5.555861473083496, "global_step": 39944, "epoch": 951} {"train_loss": -5.653636932373047, "global_step": 39945, "epoch": 951} {"train_loss": -5.5623040199279785, "global_step": 39946, "epoch": 951} {"train_loss": -5.566610336303711, "global_step": 39947, "epoch": 951} {"train_loss": -5.629494667053223, "global_step": 39948, "epoch": 951} {"train_loss": -5.455682277679443, "global_step": 39949, "epoch": 951} {"train_loss": -5.650700569152832, "global_step": 39950, "epoch": 951} {"train_loss": -5.514339447021484, "global_step": 39951, "epoch": 951} {"train_loss": -5.586352825164795, "global_step": 39952, "epoch": 951} {"train_loss": -5.603962421417236, "global_step": 39953, "epoch": 951} {"train_loss": -5.5709662437438965, "global_step": 39954, "epoch": 951} {"train_loss": -5.649544715881348, "global_step": 39955, "epoch": 951} {"train_loss": -5.756364822387695, "global_step": 39956, "epoch": 951} {"train_loss": -5.574573993682861, "global_step": 39957, "epoch": 951} {"train_loss": -5.588125228881836, "global_step": 39958, "epoch": 951} {"train_loss": -5.597696304321289, "global_step": 39959, "epoch": 951} {"train_loss": -5.611882209777832, "global_step": 39960, "epoch": 951} {"train_loss": -5.605123519897461, "global_step": 39961, "epoch": 951} {"train_loss": -5.58382511138916, "global_step": 39962, "epoch": 951} {"train_loss": -5.60526180267334, "global_step": 39963, "epoch": 951} {"train_loss": -5.5617218017578125, "global_step": 39964, "epoch": 951} {"train_loss": -5.658012390136719, "global_step": 39965, "epoch": 951} {"train_loss": -5.623748779296875, "global_step": 39966, "epoch": 951} {"train_loss": -5.630009651184082, "global_step": 39967, "epoch": 951} {"train_loss": -5.638265132904053, "global_step": 39968, "epoch": 951} {"train_loss": -5.525885581970215, "global_step": 39969, "epoch": 951} {"train_loss": -5.711142539978027, "global_step": 39970, "epoch": 951} {"train_loss": -5.73004150390625, "global_step": 39971, "epoch": 951} {"train_loss": -5.782923698425293, "global_step": 39972, "epoch": 951} {"train_loss": -5.5712971687316895, "global_step": 39973, "epoch": 951} {"train_loss": -5.610550880432129, "global_step": 39974, "epoch": 951} {"train_loss": -5.663755893707275, "global_step": 39975, "epoch": 951} {"train_loss": -5.624283790588379, "global_step": 39976, "epoch": 951} {"train_loss": -5.629970073699951, "global_step": 39977, "epoch": 951} {"train_loss": -5.639167785644531, "global_step": 39978, "epoch": 951} {"train_loss": -5.715944290161133, "global_step": 39979, "epoch": 951} {"train_loss": -5.675209045410156, "global_step": 39980, "epoch": 951} {"train_loss": -5.629360675811768, "global_step": 39981, "epoch": 951} {"train_loss": -5.6117658615112305, "global_step": 39982, "epoch": 951} {"train_loss": -5.62085907799857, "global_step": 39983, "epoch": 951, "val_loss": 62041.77734375} {"train_loss": -5.648481369018555, "global_step": 39984, "epoch": 952} {"train_loss": -5.763780117034912, "global_step": 39985, "epoch": 952} {"train_loss": -5.639981269836426, "global_step": 39986, "epoch": 952} {"train_loss": -5.613852500915527, "global_step": 39987, "epoch": 952} {"train_loss": -5.74024772644043, "global_step": 39988, "epoch": 952} {"train_loss": -5.711094856262207, "global_step": 39989, "epoch": 952} {"train_loss": -5.638197422027588, "global_step": 39990, "epoch": 952} {"train_loss": -5.656985282897949, "global_step": 39991, "epoch": 952} {"train_loss": -5.673434734344482, "global_step": 39992, "epoch": 952} {"train_loss": -5.660648345947266, "global_step": 39993, "epoch": 952} {"train_loss": -5.620100975036621, "global_step": 39994, "epoch": 952} {"train_loss": -5.663456916809082, "global_step": 39995, "epoch": 952} {"train_loss": -5.583860397338867, "global_step": 39996, "epoch": 952} {"train_loss": -5.6544318199157715, "global_step": 39997, "epoch": 952} {"train_loss": -5.612488269805908, "global_step": 39998, "epoch": 952} {"train_loss": -5.638102054595947, "global_step": 39999, "epoch": 952} {"train_loss": -5.661871910095215, "global_step": 40000, "epoch": 952} {"train_loss": -5.703512668609619, "global_step": 40001, "epoch": 952} {"train_loss": -5.675107002258301, "global_step": 40002, "epoch": 952} {"train_loss": -5.664894104003906, "global_step": 40003, "epoch": 952} {"train_loss": -5.651878833770752, "global_step": 40004, "epoch": 952} {"train_loss": -5.626866817474365, "global_step": 40005, "epoch": 952} {"train_loss": -5.720511436462402, "global_step": 40006, "epoch": 952} {"train_loss": -5.623968124389648, "global_step": 40007, "epoch": 952} {"train_loss": -5.631251335144043, "global_step": 40008, "epoch": 952} {"train_loss": -5.658013343811035, "global_step": 40009, "epoch": 952} {"train_loss": -5.652582168579102, "global_step": 40010, "epoch": 952} {"train_loss": -5.730872631072998, "global_step": 40011, "epoch": 952} {"train_loss": -5.619774341583252, "global_step": 40012, "epoch": 952} {"train_loss": -5.672862529754639, "global_step": 40013, "epoch": 952} {"train_loss": -5.669499397277832, "global_step": 40014, "epoch": 952} {"train_loss": -5.683077812194824, "global_step": 40015, "epoch": 952} {"train_loss": -5.722559452056885, "global_step": 40016, "epoch": 952} {"train_loss": -5.613785743713379, "global_step": 40017, "epoch": 952} {"train_loss": -5.711766242980957, "global_step": 40018, "epoch": 952} {"train_loss": -5.653168201446533, "global_step": 40019, "epoch": 952} {"train_loss": -5.70246696472168, "global_step": 40020, "epoch": 952} {"train_loss": -5.72189998626709, "global_step": 40021, "epoch": 952} {"train_loss": -5.616263389587402, "global_step": 40022, "epoch": 952} {"train_loss": -5.576349258422852, "global_step": 40023, "epoch": 952} {"train_loss": -5.702081680297852, "global_step": 40024, "epoch": 952} {"train_loss": -5.662691831588745, "global_step": 40025, "epoch": 952, "val_loss": 61866.12890625} {"train_loss": -5.585419654846191, "global_step": 40026, "epoch": 953} {"train_loss": -5.680675029754639, "global_step": 40027, "epoch": 953} {"train_loss": -5.615994453430176, "global_step": 40028, "epoch": 953} {"train_loss": -5.475284576416016, "global_step": 40029, "epoch": 953} {"train_loss": -5.634779930114746, "global_step": 40030, "epoch": 953} {"train_loss": -5.574648380279541, "global_step": 40031, "epoch": 953} {"train_loss": -5.6084675788879395, "global_step": 40032, "epoch": 953} {"train_loss": -5.598121643066406, "global_step": 40033, "epoch": 953} {"train_loss": -5.588704586029053, "global_step": 40034, "epoch": 953} {"train_loss": -5.6059770584106445, "global_step": 40035, "epoch": 953} {"train_loss": -5.496112823486328, "global_step": 40036, "epoch": 953} {"train_loss": -5.541742324829102, "global_step": 40037, "epoch": 953} {"train_loss": -5.681832313537598, "global_step": 40038, "epoch": 953} {"train_loss": -5.765686988830566, "global_step": 40039, "epoch": 953} {"train_loss": -5.731021881103516, "global_step": 40040, "epoch": 953} {"train_loss": -5.600222587585449, "global_step": 40041, "epoch": 953} {"train_loss": -5.706653594970703, "global_step": 40042, "epoch": 953} {"train_loss": -5.520260334014893, "global_step": 40043, "epoch": 953} {"train_loss": -5.649624824523926, "global_step": 40044, "epoch": 953} {"train_loss": -5.66688871383667, "global_step": 40045, "epoch": 953} {"train_loss": -5.640322685241699, "global_step": 40046, "epoch": 953} {"train_loss": -5.665273666381836, "global_step": 40047, "epoch": 953} {"train_loss": -5.622186660766602, "global_step": 40048, "epoch": 953} {"train_loss": -5.662698745727539, "global_step": 40049, "epoch": 953} {"train_loss": -5.6690144538879395, "global_step": 40050, "epoch": 953} {"train_loss": -5.5346245765686035, "global_step": 40051, "epoch": 953} {"train_loss": -5.575999736785889, "global_step": 40052, "epoch": 953} {"train_loss": -5.683464527130127, "global_step": 40053, "epoch": 953} {"train_loss": -5.414937973022461, "global_step": 40054, "epoch": 953} {"train_loss": -5.58304500579834, "global_step": 40055, "epoch": 953} {"train_loss": -5.566730499267578, "global_step": 40056, "epoch": 953} {"train_loss": -5.629556655883789, "global_step": 40057, "epoch": 953} {"train_loss": -5.6389970779418945, "global_step": 40058, "epoch": 953} {"train_loss": -5.431648254394531, "global_step": 40059, "epoch": 953} {"train_loss": -5.614941596984863, "global_step": 40060, "epoch": 953} {"train_loss": -5.684898853302002, "global_step": 40061, "epoch": 953} {"train_loss": -5.640179634094238, "global_step": 40062, "epoch": 953} {"train_loss": -5.651060581207275, "global_step": 40063, "epoch": 953} {"train_loss": -5.659847259521484, "global_step": 40064, "epoch": 953} {"train_loss": -5.617884635925293, "global_step": 40065, "epoch": 953} {"train_loss": -5.721844673156738, "global_step": 40066, "epoch": 953} {"train_loss": -5.616216432480585, "global_step": 40067, "epoch": 953, "val_loss": 61739.5078125} {"train_loss": -5.646536827087402, "global_step": 40068, "epoch": 954} {"train_loss": -5.562601566314697, "global_step": 40069, "epoch": 954} {"train_loss": -5.704707145690918, "global_step": 40070, "epoch": 954} {"train_loss": -5.6275410652160645, "global_step": 40071, "epoch": 954} {"train_loss": -5.692572116851807, "global_step": 40072, "epoch": 954} {"train_loss": -5.619055271148682, "global_step": 40073, "epoch": 954} {"train_loss": -5.643192291259766, "global_step": 40074, "epoch": 954} {"train_loss": -5.646096229553223, "global_step": 40075, "epoch": 954} {"train_loss": -5.697892189025879, "global_step": 40076, "epoch": 954} {"train_loss": -5.652111053466797, "global_step": 40077, "epoch": 954} {"train_loss": -5.495758056640625, "global_step": 40078, "epoch": 954} {"train_loss": -5.522038459777832, "global_step": 40079, "epoch": 954} {"train_loss": -5.636518478393555, "global_step": 40080, "epoch": 954} {"train_loss": -5.6260600090026855, "global_step": 40081, "epoch": 954} {"train_loss": -5.7112884521484375, "global_step": 40082, "epoch": 954} {"train_loss": -5.635389804840088, "global_step": 40083, "epoch": 954} {"train_loss": -5.612949371337891, "global_step": 40084, "epoch": 954} {"train_loss": -5.536314010620117, "global_step": 40085, "epoch": 954} {"train_loss": -5.594330787658691, "global_step": 40086, "epoch": 954} {"train_loss": -5.714702129364014, "global_step": 40087, "epoch": 954} {"train_loss": -5.633771896362305, "global_step": 40088, "epoch": 954} {"train_loss": -5.6129560470581055, "global_step": 40089, "epoch": 954} {"train_loss": -5.512541770935059, "global_step": 40090, "epoch": 954} {"train_loss": -5.718751907348633, "global_step": 40091, "epoch": 954} {"train_loss": -5.680401802062988, "global_step": 40092, "epoch": 954} {"train_loss": -5.6916704177856445, "global_step": 40093, "epoch": 954} {"train_loss": -5.473825931549072, "global_step": 40094, "epoch": 954} {"train_loss": -5.41286563873291, "global_step": 40095, "epoch": 954} {"train_loss": -5.6020827293396, "global_step": 40096, "epoch": 954} {"train_loss": -5.6410813331604, "global_step": 40097, "epoch": 954} {"train_loss": -5.601563453674316, "global_step": 40098, "epoch": 954} {"train_loss": -5.708806037902832, "global_step": 40099, "epoch": 954} {"train_loss": -5.603568077087402, "global_step": 40100, "epoch": 954} {"train_loss": -5.6025824546813965, "global_step": 40101, "epoch": 954} {"train_loss": -5.733017921447754, "global_step": 40102, "epoch": 954} {"train_loss": -5.744882583618164, "global_step": 40103, "epoch": 954} {"train_loss": -5.603787422180176, "global_step": 40104, "epoch": 954} {"train_loss": -5.602795600891113, "global_step": 40105, "epoch": 954} {"train_loss": -5.637148380279541, "global_step": 40106, "epoch": 954} {"train_loss": -5.669569492340088, "global_step": 40107, "epoch": 954} {"train_loss": -5.713051795959473, "global_step": 40108, "epoch": 954} {"train_loss": -5.628109228043329, "global_step": 40109, "epoch": 954, "val_loss": 62173.4375} {"train_loss": -5.626996040344238, "global_step": 40110, "epoch": 955} {"train_loss": -5.586679458618164, "global_step": 40111, "epoch": 955} {"train_loss": -5.674495697021484, "global_step": 40112, "epoch": 955} {"train_loss": -5.663329601287842, "global_step": 40113, "epoch": 955} {"train_loss": -5.692349433898926, "global_step": 40114, "epoch": 955} {"train_loss": -5.564812183380127, "global_step": 40115, "epoch": 955} {"train_loss": -5.616710186004639, "global_step": 40116, "epoch": 955} {"train_loss": -5.707237243652344, "global_step": 40117, "epoch": 955} {"train_loss": -5.730949401855469, "global_step": 40118, "epoch": 955} {"train_loss": -5.546306133270264, "global_step": 40119, "epoch": 955} {"train_loss": -5.700403213500977, "global_step": 40120, "epoch": 955} {"train_loss": -5.61118221282959, "global_step": 40121, "epoch": 955} {"train_loss": -5.608888626098633, "global_step": 40122, "epoch": 955} {"train_loss": -5.6806817054748535, "global_step": 40123, "epoch": 955} {"train_loss": -5.606815338134766, "global_step": 40124, "epoch": 955} {"train_loss": -5.657914161682129, "global_step": 40125, "epoch": 955} {"train_loss": -5.629868507385254, "global_step": 40126, "epoch": 955} {"train_loss": -5.584381103515625, "global_step": 40127, "epoch": 955} {"train_loss": -5.516741752624512, "global_step": 40128, "epoch": 955} {"train_loss": -5.687991142272949, "global_step": 40129, "epoch": 955} {"train_loss": -5.501758575439453, "global_step": 40130, "epoch": 955} {"train_loss": -5.672821998596191, "global_step": 40131, "epoch": 955} {"train_loss": -5.47178840637207, "global_step": 40132, "epoch": 955} {"train_loss": -5.523139953613281, "global_step": 40133, "epoch": 955} {"train_loss": -5.655204772949219, "global_step": 40134, "epoch": 955} {"train_loss": -5.430945873260498, "global_step": 40135, "epoch": 955} {"train_loss": -5.6545515060424805, "global_step": 40136, "epoch": 955} {"train_loss": -5.43387508392334, "global_step": 40137, "epoch": 955} {"train_loss": -5.715653419494629, "global_step": 40138, "epoch": 955} {"train_loss": -5.428537845611572, "global_step": 40139, "epoch": 955} {"train_loss": -5.671382427215576, "global_step": 40140, "epoch": 955} {"train_loss": -5.573275089263916, "global_step": 40141, "epoch": 955} {"train_loss": -5.66134786605835, "global_step": 40142, "epoch": 955} {"train_loss": -5.535378932952881, "global_step": 40143, "epoch": 955} {"train_loss": -5.442407608032227, "global_step": 40144, "epoch": 955} {"train_loss": -5.527057647705078, "global_step": 40145, "epoch": 955} {"train_loss": -5.532746315002441, "global_step": 40146, "epoch": 955} {"train_loss": -5.598455429077148, "global_step": 40147, "epoch": 955} {"train_loss": -5.521553993225098, "global_step": 40148, "epoch": 955} {"train_loss": -5.489007949829102, "global_step": 40149, "epoch": 955} {"train_loss": -5.529419898986816, "global_step": 40150, "epoch": 955} {"train_loss": -5.591812474387033, "global_step": 40151, "epoch": 955, "val_loss": 61704.28125} {"train_loss": -5.537100315093994, "global_step": 40152, "epoch": 956} {"train_loss": -5.662795066833496, "global_step": 40153, "epoch": 956} {"train_loss": -5.707060813903809, "global_step": 40154, "epoch": 956} {"train_loss": -5.663181781768799, "global_step": 40155, "epoch": 956} {"train_loss": -5.635165691375732, "global_step": 40156, "epoch": 956} {"train_loss": -5.544834136962891, "global_step": 40157, "epoch": 956} {"train_loss": -5.640066623687744, "global_step": 40158, "epoch": 956} {"train_loss": -5.570134162902832, "global_step": 40159, "epoch": 956} {"train_loss": -5.583154678344727, "global_step": 40160, "epoch": 956} {"train_loss": -5.654605865478516, "global_step": 40161, "epoch": 956} {"train_loss": -5.5633344650268555, "global_step": 40162, "epoch": 956} {"train_loss": -5.615313529968262, "global_step": 40163, "epoch": 956} {"train_loss": -5.711141586303711, "global_step": 40164, "epoch": 956} {"train_loss": -5.416260719299316, "global_step": 40165, "epoch": 956} {"train_loss": -5.5740227699279785, "global_step": 40166, "epoch": 956} {"train_loss": -5.602283000946045, "global_step": 40167, "epoch": 956} {"train_loss": -5.699941635131836, "global_step": 40168, "epoch": 956} {"train_loss": -5.663456916809082, "global_step": 40169, "epoch": 956} {"train_loss": -5.6409220695495605, "global_step": 40170, "epoch": 956} {"train_loss": -5.693977355957031, "global_step": 40171, "epoch": 956} {"train_loss": -5.593693733215332, "global_step": 40172, "epoch": 956} {"train_loss": -5.676474571228027, "global_step": 40173, "epoch": 956} {"train_loss": -5.554978370666504, "global_step": 40174, "epoch": 956} {"train_loss": -5.632110595703125, "global_step": 40175, "epoch": 956} {"train_loss": -5.659016132354736, "global_step": 40176, "epoch": 956} {"train_loss": -5.61737060546875, "global_step": 40177, "epoch": 956} {"train_loss": -5.70908784866333, "global_step": 40178, "epoch": 956} {"train_loss": -5.618597030639648, "global_step": 40179, "epoch": 956} {"train_loss": -5.652072906494141, "global_step": 40180, "epoch": 956} {"train_loss": -5.624744415283203, "global_step": 40181, "epoch": 956} {"train_loss": -5.55623197555542, "global_step": 40182, "epoch": 956} {"train_loss": -5.774324417114258, "global_step": 40183, "epoch": 956} {"train_loss": -5.592279434204102, "global_step": 40184, "epoch": 956} {"train_loss": -5.598639011383057, "global_step": 40185, "epoch": 956} {"train_loss": -5.58646297454834, "global_step": 40186, "epoch": 956} {"train_loss": -5.815918922424316, "global_step": 40187, "epoch": 956} {"train_loss": -5.663262844085693, "global_step": 40188, "epoch": 956} {"train_loss": -5.643893718719482, "global_step": 40189, "epoch": 956} {"train_loss": -5.712564945220947, "global_step": 40190, "epoch": 956} {"train_loss": -5.60164737701416, "global_step": 40191, "epoch": 956} {"train_loss": -5.600343227386475, "global_step": 40192, "epoch": 956} {"train_loss": -5.633938971019926, "global_step": 40193, "epoch": 956, "val_loss": 61998.9453125} {"train_loss": -5.677132606506348, "global_step": 40194, "epoch": 957} {"train_loss": -5.7624006271362305, "global_step": 40195, "epoch": 957} {"train_loss": -5.704314708709717, "global_step": 40196, "epoch": 957} {"train_loss": -5.646383285522461, "global_step": 40197, "epoch": 957} {"train_loss": -5.548784255981445, "global_step": 40198, "epoch": 957} {"train_loss": -5.606782913208008, "global_step": 40199, "epoch": 957} {"train_loss": -5.534119606018066, "global_step": 40200, "epoch": 957} {"train_loss": -5.621063709259033, "global_step": 40201, "epoch": 957} {"train_loss": -5.643062591552734, "global_step": 40202, "epoch": 957} {"train_loss": -5.645062446594238, "global_step": 40203, "epoch": 957} {"train_loss": -5.59079122543335, "global_step": 40204, "epoch": 957} {"train_loss": -5.743128776550293, "global_step": 40205, "epoch": 957} {"train_loss": -5.5456390380859375, "global_step": 40206, "epoch": 957} {"train_loss": -5.475831031799316, "global_step": 40207, "epoch": 957} {"train_loss": -5.50007963180542, "global_step": 40208, "epoch": 957} {"train_loss": -5.521113395690918, "global_step": 40209, "epoch": 957} {"train_loss": -5.508243083953857, "global_step": 40210, "epoch": 957} {"train_loss": -5.75140380859375, "global_step": 40211, "epoch": 957} {"train_loss": -5.714282035827637, "global_step": 40212, "epoch": 957} {"train_loss": -5.641191482543945, "global_step": 40213, "epoch": 957} {"train_loss": -5.4984283447265625, "global_step": 40214, "epoch": 957} {"train_loss": -5.612527847290039, "global_step": 40215, "epoch": 957} {"train_loss": -5.5443525314331055, "global_step": 40216, "epoch": 957} {"train_loss": -5.514660835266113, "global_step": 40217, "epoch": 957} {"train_loss": -5.509881019592285, "global_step": 40218, "epoch": 957} {"train_loss": -5.477235794067383, "global_step": 40219, "epoch": 957} {"train_loss": -5.597374439239502, "global_step": 40220, "epoch": 957} {"train_loss": -5.542064666748047, "global_step": 40221, "epoch": 957} {"train_loss": -5.419969081878662, "global_step": 40222, "epoch": 957} {"train_loss": -5.618382453918457, "global_step": 40223, "epoch": 957} {"train_loss": -5.561610221862793, "global_step": 40224, "epoch": 957} {"train_loss": -5.522261619567871, "global_step": 40225, "epoch": 957} {"train_loss": -5.605103015899658, "global_step": 40226, "epoch": 957} {"train_loss": -5.612539291381836, "global_step": 40227, "epoch": 957} {"train_loss": -5.686609745025635, "global_step": 40228, "epoch": 957} {"train_loss": -5.496417045593262, "global_step": 40229, "epoch": 957} {"train_loss": -5.6800103187561035, "global_step": 40230, "epoch": 957} {"train_loss": -5.643037796020508, "global_step": 40231, "epoch": 957} {"train_loss": -5.690160274505615, "global_step": 40232, "epoch": 957} {"train_loss": -5.706435203552246, "global_step": 40233, "epoch": 957} {"train_loss": -5.601325035095215, "global_step": 40234, "epoch": 957} {"train_loss": -5.603163764590309, "global_step": 40235, "epoch": 957, "val_loss": 61789.4375} {"train_loss": -5.669957160949707, "global_step": 40236, "epoch": 958} {"train_loss": -5.6765546798706055, "global_step": 40237, "epoch": 958} {"train_loss": -5.588007926940918, "global_step": 40238, "epoch": 958} {"train_loss": -5.618304252624512, "global_step": 40239, "epoch": 958} {"train_loss": -5.63558292388916, "global_step": 40240, "epoch": 958} {"train_loss": -5.651295185089111, "global_step": 40241, "epoch": 958} {"train_loss": -5.714689254760742, "global_step": 40242, "epoch": 958} {"train_loss": -5.698034286499023, "global_step": 40243, "epoch": 958} {"train_loss": -5.619793891906738, "global_step": 40244, "epoch": 958} {"train_loss": -5.708991527557373, "global_step": 40245, "epoch": 958} {"train_loss": -5.745108604431152, "global_step": 40246, "epoch": 958} {"train_loss": -5.862448692321777, "global_step": 40247, "epoch": 958} {"train_loss": -5.659179210662842, "global_step": 40248, "epoch": 958} {"train_loss": -5.5828704833984375, "global_step": 40249, "epoch": 958} {"train_loss": -5.648745536804199, "global_step": 40250, "epoch": 958} {"train_loss": -5.575814247131348, "global_step": 40251, "epoch": 958} {"train_loss": -5.7521867752075195, "global_step": 40252, "epoch": 958} {"train_loss": -5.614525318145752, "global_step": 40253, "epoch": 958} {"train_loss": -5.570372581481934, "global_step": 40254, "epoch": 958} {"train_loss": -5.636921405792236, "global_step": 40255, "epoch": 958} {"train_loss": -5.731975555419922, "global_step": 40256, "epoch": 958} {"train_loss": -5.7285003662109375, "global_step": 40257, "epoch": 958} {"train_loss": -5.675126552581787, "global_step": 40258, "epoch": 958} {"train_loss": -5.616826057434082, "global_step": 40259, "epoch": 958} {"train_loss": -5.650326728820801, "global_step": 40260, "epoch": 958} {"train_loss": -5.612565040588379, "global_step": 40261, "epoch": 958} {"train_loss": -5.665766716003418, "global_step": 40262, "epoch": 958} {"train_loss": -5.734292030334473, "global_step": 40263, "epoch": 958} {"train_loss": -5.5497541427612305, "global_step": 40264, "epoch": 958} {"train_loss": -5.5329437255859375, "global_step": 40265, "epoch": 958} {"train_loss": -5.523299694061279, "global_step": 40266, "epoch": 958} {"train_loss": -5.62437629699707, "global_step": 40267, "epoch": 958} {"train_loss": -5.685346603393555, "global_step": 40268, "epoch": 958} {"train_loss": -5.548166275024414, "global_step": 40269, "epoch": 958} {"train_loss": -5.639720916748047, "global_step": 40270, "epoch": 958} {"train_loss": -5.639990329742432, "global_step": 40271, "epoch": 958} {"train_loss": -5.651103973388672, "global_step": 40272, "epoch": 958} {"train_loss": -5.735369682312012, "global_step": 40273, "epoch": 958} {"train_loss": -5.746601104736328, "global_step": 40274, "epoch": 958} {"train_loss": -5.641643524169922, "global_step": 40275, "epoch": 958} {"train_loss": -5.56965446472168, "global_step": 40276, "epoch": 958} {"train_loss": -5.652695519583566, "global_step": 40277, "epoch": 958, "val_loss": 61773.83984375} {"train_loss": -5.693126678466797, "global_step": 40278, "epoch": 959} {"train_loss": -5.797729015350342, "global_step": 40279, "epoch": 959} {"train_loss": -5.746546268463135, "global_step": 40280, "epoch": 959} {"train_loss": -5.611797332763672, "global_step": 40281, "epoch": 959} {"train_loss": -5.700290679931641, "global_step": 40282, "epoch": 959} {"train_loss": -5.735522270202637, "global_step": 40283, "epoch": 959} {"train_loss": -5.7510833740234375, "global_step": 40284, "epoch": 959} {"train_loss": -5.661790370941162, "global_step": 40285, "epoch": 959} {"train_loss": -5.677797317504883, "global_step": 40286, "epoch": 959} {"train_loss": -5.527946949005127, "global_step": 40287, "epoch": 959} {"train_loss": -5.54489278793335, "global_step": 40288, "epoch": 959} {"train_loss": -5.6705522537231445, "global_step": 40289, "epoch": 959} {"train_loss": -5.61505651473999, "global_step": 40290, "epoch": 959} {"train_loss": -5.631656646728516, "global_step": 40291, "epoch": 959} {"train_loss": -5.509313583374023, "global_step": 40292, "epoch": 959} {"train_loss": -5.669480323791504, "global_step": 40293, "epoch": 959} {"train_loss": -5.649529933929443, "global_step": 40294, "epoch": 959} {"train_loss": -5.633421897888184, "global_step": 40295, "epoch": 959} {"train_loss": -5.5847039222717285, "global_step": 40296, "epoch": 959} {"train_loss": -5.647588729858398, "global_step": 40297, "epoch": 959} {"train_loss": -5.664670467376709, "global_step": 40298, "epoch": 959} {"train_loss": -5.804013729095459, "global_step": 40299, "epoch": 959} {"train_loss": -5.666749000549316, "global_step": 40300, "epoch": 959} {"train_loss": -5.619894027709961, "global_step": 40301, "epoch": 959} {"train_loss": -5.704015254974365, "global_step": 40302, "epoch": 959} {"train_loss": -5.690939426422119, "global_step": 40303, "epoch": 959} {"train_loss": -5.627651691436768, "global_step": 40304, "epoch": 959} {"train_loss": -5.5892205238342285, "global_step": 40305, "epoch": 959} {"train_loss": -5.606165409088135, "global_step": 40306, "epoch": 959} {"train_loss": -5.742102146148682, "global_step": 40307, "epoch": 959} {"train_loss": -5.710943222045898, "global_step": 40308, "epoch": 959} {"train_loss": -5.589328765869141, "global_step": 40309, "epoch": 959} {"train_loss": -5.538974285125732, "global_step": 40310, "epoch": 959} {"train_loss": -5.751081466674805, "global_step": 40311, "epoch": 959} {"train_loss": -5.720993995666504, "global_step": 40312, "epoch": 959} {"train_loss": -5.669118404388428, "global_step": 40313, "epoch": 959} {"train_loss": -5.545213222503662, "global_step": 40314, "epoch": 959} {"train_loss": -5.615296363830566, "global_step": 40315, "epoch": 959} {"train_loss": -5.637303829193115, "global_step": 40316, "epoch": 959} {"train_loss": -5.680978775024414, "global_step": 40317, "epoch": 959} {"train_loss": -5.552027225494385, "global_step": 40318, "epoch": 959} {"train_loss": -5.654556615012033, "global_step": 40319, "epoch": 959, "val_loss": 61669.59375} {"train_loss": -5.703411102294922, "global_step": 40320, "epoch": 960} {"train_loss": -5.743997097015381, "global_step": 40321, "epoch": 960} {"train_loss": -5.566123008728027, "global_step": 40322, "epoch": 960} {"train_loss": -5.655318260192871, "global_step": 40323, "epoch": 960} {"train_loss": -5.66077995300293, "global_step": 40324, "epoch": 960} {"train_loss": -5.776655197143555, "global_step": 40325, "epoch": 960} {"train_loss": -5.639947414398193, "global_step": 40326, "epoch": 960} {"train_loss": -5.577475547790527, "global_step": 40327, "epoch": 960} {"train_loss": -5.645294666290283, "global_step": 40328, "epoch": 960} {"train_loss": -5.680591583251953, "global_step": 40329, "epoch": 960} {"train_loss": -5.559444427490234, "global_step": 40330, "epoch": 960} {"train_loss": -5.507068634033203, "global_step": 40331, "epoch": 960} {"train_loss": -5.606152057647705, "global_step": 40332, "epoch": 960} {"train_loss": -5.553954124450684, "global_step": 40333, "epoch": 960} {"train_loss": -5.606009483337402, "global_step": 40334, "epoch": 960} {"train_loss": -5.683505535125732, "global_step": 40335, "epoch": 960} {"train_loss": -5.5525312423706055, "global_step": 40336, "epoch": 960} {"train_loss": -5.553256988525391, "global_step": 40337, "epoch": 960} {"train_loss": -5.689838886260986, "global_step": 40338, "epoch": 960} {"train_loss": -5.606856346130371, "global_step": 40339, "epoch": 960} {"train_loss": -5.60697078704834, "global_step": 40340, "epoch": 960} {"train_loss": -5.531315803527832, "global_step": 40341, "epoch": 960} {"train_loss": -5.696340560913086, "global_step": 40342, "epoch": 960} {"train_loss": -5.6130571365356445, "global_step": 40343, "epoch": 960} {"train_loss": -5.5998215675354, "global_step": 40344, "epoch": 960} {"train_loss": -5.6251397132873535, "global_step": 40345, "epoch": 960} {"train_loss": -5.6095476150512695, "global_step": 40346, "epoch": 960} {"train_loss": -5.749607086181641, "global_step": 40347, "epoch": 960} {"train_loss": -5.699323654174805, "global_step": 40348, "epoch": 960} {"train_loss": -5.656831741333008, "global_step": 40349, "epoch": 960} {"train_loss": -5.512271881103516, "global_step": 40350, "epoch": 960} {"train_loss": -5.632425785064697, "global_step": 40351, "epoch": 960} {"train_loss": -5.545854091644287, "global_step": 40352, "epoch": 960} {"train_loss": -5.665658950805664, "global_step": 40353, "epoch": 960} {"train_loss": -5.556778907775879, "global_step": 40354, "epoch": 960} {"train_loss": -5.635222434997559, "global_step": 40355, "epoch": 960} {"train_loss": -5.70600700378418, "global_step": 40356, "epoch": 960} {"train_loss": -5.647465229034424, "global_step": 40357, "epoch": 960} {"train_loss": -5.468522071838379, "global_step": 40358, "epoch": 960} {"train_loss": -5.599870681762695, "global_step": 40359, "epoch": 960} {"train_loss": -5.541954040527344, "global_step": 40360, "epoch": 960} {"train_loss": -5.621517124630156, "global_step": 40361, "epoch": 960, "val_loss": 61856.44921875} {"train_loss": -5.610462188720703, "global_step": 40362, "epoch": 961} {"train_loss": -5.651470184326172, "global_step": 40363, "epoch": 961} {"train_loss": -5.720931053161621, "global_step": 40364, "epoch": 961} {"train_loss": -5.723546028137207, "global_step": 40365, "epoch": 961} {"train_loss": -5.443106651306152, "global_step": 40366, "epoch": 961} {"train_loss": -5.675315856933594, "global_step": 40367, "epoch": 961} {"train_loss": -5.567981719970703, "global_step": 40368, "epoch": 961} {"train_loss": -5.494930267333984, "global_step": 40369, "epoch": 961} {"train_loss": -5.663922309875488, "global_step": 40370, "epoch": 961} {"train_loss": -5.693148612976074, "global_step": 40371, "epoch": 961} {"train_loss": -5.673888206481934, "global_step": 40372, "epoch": 961} {"train_loss": -5.914114952087402, "global_step": 40373, "epoch": 961} {"train_loss": -5.684544563293457, "global_step": 40374, "epoch": 961} {"train_loss": -5.568984031677246, "global_step": 40375, "epoch": 961} {"train_loss": -5.756441116333008, "global_step": 40376, "epoch": 961} {"train_loss": -5.585090160369873, "global_step": 40377, "epoch": 961} {"train_loss": -5.680614471435547, "global_step": 40378, "epoch": 961} {"train_loss": -5.59939432144165, "global_step": 40379, "epoch": 961} {"train_loss": -5.62431526184082, "global_step": 40380, "epoch": 961} {"train_loss": -5.597861289978027, "global_step": 40381, "epoch": 961} {"train_loss": -5.584754943847656, "global_step": 40382, "epoch": 961} {"train_loss": -5.5988640785217285, "global_step": 40383, "epoch": 961} {"train_loss": -5.450431823730469, "global_step": 40384, "epoch": 961} {"train_loss": -5.559331893920898, "global_step": 40385, "epoch": 961} {"train_loss": -5.626439571380615, "global_step": 40386, "epoch": 961} {"train_loss": -5.533965587615967, "global_step": 40387, "epoch": 961} {"train_loss": -5.639605522155762, "global_step": 40388, "epoch": 961} {"train_loss": -5.555368900299072, "global_step": 40389, "epoch": 961} {"train_loss": -5.468740463256836, "global_step": 40390, "epoch": 961} {"train_loss": -5.615633487701416, "global_step": 40391, "epoch": 961} {"train_loss": -5.4919753074646, "global_step": 40392, "epoch": 961} {"train_loss": -5.496380805969238, "global_step": 40393, "epoch": 961} {"train_loss": -5.602064609527588, "global_step": 40394, "epoch": 961} {"train_loss": -5.527017593383789, "global_step": 40395, "epoch": 961} {"train_loss": -5.698518753051758, "global_step": 40396, "epoch": 961} {"train_loss": -5.640271186828613, "global_step": 40397, "epoch": 961} {"train_loss": -5.577822685241699, "global_step": 40398, "epoch": 961} {"train_loss": -5.555977821350098, "global_step": 40399, "epoch": 961} {"train_loss": -5.593331813812256, "global_step": 40400, "epoch": 961} {"train_loss": -5.613852500915527, "global_step": 40401, "epoch": 961} {"train_loss": -5.688141822814941, "global_step": 40402, "epoch": 961} {"train_loss": -5.612656899860927, "global_step": 40403, "epoch": 961, "val_loss": 61875.65625} {"train_loss": -5.482648849487305, "global_step": 40404, "epoch": 962} {"train_loss": -5.678864479064941, "global_step": 40405, "epoch": 962} {"train_loss": -5.536249160766602, "global_step": 40406, "epoch": 962} {"train_loss": -5.718835830688477, "global_step": 40407, "epoch": 962} {"train_loss": -5.748334884643555, "global_step": 40408, "epoch": 962} {"train_loss": -5.730799674987793, "global_step": 40409, "epoch": 962} {"train_loss": -5.650115966796875, "global_step": 40410, "epoch": 962} {"train_loss": -5.65593957901001, "global_step": 40411, "epoch": 962} {"train_loss": -5.701846122741699, "global_step": 40412, "epoch": 962} {"train_loss": -5.657949447631836, "global_step": 40413, "epoch": 962} {"train_loss": -5.612173557281494, "global_step": 40414, "epoch": 962} {"train_loss": -5.649486541748047, "global_step": 40415, "epoch": 962} {"train_loss": -5.7705278396606445, "global_step": 40416, "epoch": 962} {"train_loss": -5.658727169036865, "global_step": 40417, "epoch": 962} {"train_loss": -5.6639862060546875, "global_step": 40418, "epoch": 962} {"train_loss": -5.729922771453857, "global_step": 40419, "epoch": 962} {"train_loss": -5.602598667144775, "global_step": 40420, "epoch": 962} {"train_loss": -5.5271992683410645, "global_step": 40421, "epoch": 962} {"train_loss": -5.794659614562988, "global_step": 40422, "epoch": 962} {"train_loss": -5.695016384124756, "global_step": 40423, "epoch": 962} {"train_loss": -5.70661735534668, "global_step": 40424, "epoch": 962} {"train_loss": -5.685455799102783, "global_step": 40425, "epoch": 962} {"train_loss": -5.49470329284668, "global_step": 40426, "epoch": 962} {"train_loss": -5.63510274887085, "global_step": 40427, "epoch": 962} {"train_loss": -5.692483425140381, "global_step": 40428, "epoch": 962} {"train_loss": -5.521363735198975, "global_step": 40429, "epoch": 962} {"train_loss": -5.61654806137085, "global_step": 40430, "epoch": 962} {"train_loss": -5.609903812408447, "global_step": 40431, "epoch": 962} {"train_loss": -5.685850143432617, "global_step": 40432, "epoch": 962} {"train_loss": -5.771026611328125, "global_step": 40433, "epoch": 962} {"train_loss": -5.567686557769775, "global_step": 40434, "epoch": 962} {"train_loss": -5.546474456787109, "global_step": 40435, "epoch": 962} {"train_loss": -5.76609992980957, "global_step": 40436, "epoch": 962} {"train_loss": -5.636453628540039, "global_step": 40437, "epoch": 962} {"train_loss": -5.45485782623291, "global_step": 40438, "epoch": 962} {"train_loss": -5.652673721313477, "global_step": 40439, "epoch": 962} {"train_loss": -5.6011061668396, "global_step": 40440, "epoch": 962} {"train_loss": -5.5862274169921875, "global_step": 40441, "epoch": 962} {"train_loss": -5.68239688873291, "global_step": 40442, "epoch": 962} {"train_loss": -5.503689765930176, "global_step": 40443, "epoch": 962} {"train_loss": -5.5664963722229, "global_step": 40444, "epoch": 962} {"train_loss": -5.63761195682344, "global_step": 40445, "epoch": 962, "val_loss": 62291.36328125} {"train_loss": -5.682283401489258, "global_step": 40446, "epoch": 963} {"train_loss": -5.655862808227539, "global_step": 40447, "epoch": 963} {"train_loss": -5.658046722412109, "global_step": 40448, "epoch": 963} {"train_loss": -5.536059379577637, "global_step": 40449, "epoch": 963} {"train_loss": -5.638286113739014, "global_step": 40450, "epoch": 963} {"train_loss": -5.658241271972656, "global_step": 40451, "epoch": 963} {"train_loss": -5.691339492797852, "global_step": 40452, "epoch": 963} {"train_loss": -5.607612609863281, "global_step": 40453, "epoch": 963} {"train_loss": -5.650538921356201, "global_step": 40454, "epoch": 963} {"train_loss": -5.672649383544922, "global_step": 40455, "epoch": 963} {"train_loss": -5.570642471313477, "global_step": 40456, "epoch": 963} {"train_loss": -5.612400054931641, "global_step": 40457, "epoch": 963} {"train_loss": -5.632299423217773, "global_step": 40458, "epoch": 963} {"train_loss": -5.616812705993652, "global_step": 40459, "epoch": 963} {"train_loss": -5.643441677093506, "global_step": 40460, "epoch": 963} {"train_loss": -5.640233039855957, "global_step": 40461, "epoch": 963} {"train_loss": -5.654449462890625, "global_step": 40462, "epoch": 963} {"train_loss": -5.633834362030029, "global_step": 40463, "epoch": 963} {"train_loss": -5.6465349197387695, "global_step": 40464, "epoch": 963} {"train_loss": -5.626285076141357, "global_step": 40465, "epoch": 963} {"train_loss": -5.649617671966553, "global_step": 40466, "epoch": 963} {"train_loss": -5.706395626068115, "global_step": 40467, "epoch": 963} {"train_loss": -5.548695087432861, "global_step": 40468, "epoch": 963} {"train_loss": -5.639371395111084, "global_step": 40469, "epoch": 963} {"train_loss": -5.67255163192749, "global_step": 40470, "epoch": 963} {"train_loss": -5.662405014038086, "global_step": 40471, "epoch": 963} {"train_loss": -5.624963283538818, "global_step": 40472, "epoch": 963} {"train_loss": -5.606274127960205, "global_step": 40473, "epoch": 963} {"train_loss": -5.6947407722473145, "global_step": 40474, "epoch": 963} {"train_loss": -5.665644645690918, "global_step": 40475, "epoch": 963} {"train_loss": -5.6524810791015625, "global_step": 40476, "epoch": 963} {"train_loss": -5.63712215423584, "global_step": 40477, "epoch": 963} {"train_loss": -5.624239921569824, "global_step": 40478, "epoch": 963} {"train_loss": -5.552685737609863, "global_step": 40479, "epoch": 963} {"train_loss": -5.684852600097656, "global_step": 40480, "epoch": 963} {"train_loss": -5.5899553298950195, "global_step": 40481, "epoch": 963} {"train_loss": -5.675085067749023, "global_step": 40482, "epoch": 963} {"train_loss": -5.733423233032227, "global_step": 40483, "epoch": 963} {"train_loss": -5.522640228271484, "global_step": 40484, "epoch": 963} {"train_loss": -5.610470771789551, "global_step": 40485, "epoch": 963} {"train_loss": -5.555177688598633, "global_step": 40486, "epoch": 963} {"train_loss": -5.632327216012137, "global_step": 40487, "epoch": 963, "val_loss": 61914.015625} {"train_loss": -5.586391925811768, "global_step": 40488, "epoch": 964} {"train_loss": -5.519729137420654, "global_step": 40489, "epoch": 964} {"train_loss": -5.631585121154785, "global_step": 40490, "epoch": 964} {"train_loss": -5.756239414215088, "global_step": 40491, "epoch": 964} {"train_loss": -5.6456708908081055, "global_step": 40492, "epoch": 964} {"train_loss": -5.514897346496582, "global_step": 40493, "epoch": 964} {"train_loss": -5.588740825653076, "global_step": 40494, "epoch": 964} {"train_loss": -5.709588050842285, "global_step": 40495, "epoch": 964} {"train_loss": -5.646151542663574, "global_step": 40496, "epoch": 964} {"train_loss": -5.53630256652832, "global_step": 40497, "epoch": 964} {"train_loss": -5.739603519439697, "global_step": 40498, "epoch": 964} {"train_loss": -5.749111175537109, "global_step": 40499, "epoch": 964} {"train_loss": -5.577861785888672, "global_step": 40500, "epoch": 964} {"train_loss": -5.513562202453613, "global_step": 40501, "epoch": 964} {"train_loss": -5.671878814697266, "global_step": 40502, "epoch": 964} {"train_loss": -5.5754714012146, "global_step": 40503, "epoch": 964} {"train_loss": -5.7275285720825195, "global_step": 40504, "epoch": 964} {"train_loss": -5.680231094360352, "global_step": 40505, "epoch": 964} {"train_loss": -5.605518341064453, "global_step": 40506, "epoch": 964} {"train_loss": -5.6861572265625, "global_step": 40507, "epoch": 964} {"train_loss": -5.605762004852295, "global_step": 40508, "epoch": 964} {"train_loss": -5.610793590545654, "global_step": 40509, "epoch": 964} {"train_loss": -5.696234703063965, "global_step": 40510, "epoch": 964} {"train_loss": -5.5418500900268555, "global_step": 40511, "epoch": 964} {"train_loss": -5.699914932250977, "global_step": 40512, "epoch": 964} {"train_loss": -5.726794719696045, "global_step": 40513, "epoch": 964} {"train_loss": -5.672632217407227, "global_step": 40514, "epoch": 964} {"train_loss": -5.578555107116699, "global_step": 40515, "epoch": 964} {"train_loss": -5.716059684753418, "global_step": 40516, "epoch": 964} {"train_loss": -5.5646562576293945, "global_step": 40517, "epoch": 964} {"train_loss": -5.50549840927124, "global_step": 40518, "epoch": 964} {"train_loss": -5.541669845581055, "global_step": 40519, "epoch": 964} {"train_loss": -5.653473854064941, "global_step": 40520, "epoch": 964} {"train_loss": -5.595249652862549, "global_step": 40521, "epoch": 964} {"train_loss": -5.684549331665039, "global_step": 40522, "epoch": 964} {"train_loss": -5.6757965087890625, "global_step": 40523, "epoch": 964} {"train_loss": -5.629687309265137, "global_step": 40524, "epoch": 964} {"train_loss": -5.707245349884033, "global_step": 40525, "epoch": 964} {"train_loss": -5.5361833572387695, "global_step": 40526, "epoch": 964} {"train_loss": -5.58917236328125, "global_step": 40527, "epoch": 964} {"train_loss": -5.677650451660156, "global_step": 40528, "epoch": 964} {"train_loss": -5.633115030470348, "global_step": 40529, "epoch": 964, "val_loss": 62470.265625} {"train_loss": -5.646435737609863, "global_step": 40530, "epoch": 965} {"train_loss": -5.553398609161377, "global_step": 40531, "epoch": 965} {"train_loss": -5.65676212310791, "global_step": 40532, "epoch": 965} {"train_loss": -5.472334384918213, "global_step": 40533, "epoch": 965} {"train_loss": -5.724455833435059, "global_step": 40534, "epoch": 965} {"train_loss": -5.725397109985352, "global_step": 40535, "epoch": 965} {"train_loss": -5.692783355712891, "global_step": 40536, "epoch": 965} {"train_loss": -5.616386890411377, "global_step": 40537, "epoch": 965} {"train_loss": -5.676541805267334, "global_step": 40538, "epoch": 965} {"train_loss": -5.7744293212890625, "global_step": 40539, "epoch": 965} {"train_loss": -5.645097732543945, "global_step": 40540, "epoch": 965} {"train_loss": -5.710684299468994, "global_step": 40541, "epoch": 965} {"train_loss": -5.72239351272583, "global_step": 40542, "epoch": 965} {"train_loss": -5.743518352508545, "global_step": 40543, "epoch": 965} {"train_loss": -5.56986141204834, "global_step": 40544, "epoch": 965} {"train_loss": -5.652881622314453, "global_step": 40545, "epoch": 965} {"train_loss": -5.6887898445129395, "global_step": 40546, "epoch": 965} {"train_loss": -5.690399646759033, "global_step": 40547, "epoch": 965} {"train_loss": -5.722126007080078, "global_step": 40548, "epoch": 965} {"train_loss": -5.755348205566406, "global_step": 40549, "epoch": 965} {"train_loss": -5.543858528137207, "global_step": 40550, "epoch": 965} {"train_loss": -5.678277969360352, "global_step": 40551, "epoch": 965} {"train_loss": -5.597643852233887, "global_step": 40552, "epoch": 965} {"train_loss": -5.512256145477295, "global_step": 40553, "epoch": 965} {"train_loss": -5.674020767211914, "global_step": 40554, "epoch": 965} {"train_loss": -5.6629438400268555, "global_step": 40555, "epoch": 965} {"train_loss": -5.555964469909668, "global_step": 40556, "epoch": 965} {"train_loss": -5.66188907623291, "global_step": 40557, "epoch": 965} {"train_loss": -5.514585971832275, "global_step": 40558, "epoch": 965} {"train_loss": -5.518246173858643, "global_step": 40559, "epoch": 965} {"train_loss": -5.576445579528809, "global_step": 40560, "epoch": 965} {"train_loss": -5.691993713378906, "global_step": 40561, "epoch": 965} {"train_loss": -5.654529094696045, "global_step": 40562, "epoch": 965} {"train_loss": -5.521330833435059, "global_step": 40563, "epoch": 965} {"train_loss": -5.567235469818115, "global_step": 40564, "epoch": 965} {"train_loss": -5.599431037902832, "global_step": 40565, "epoch": 965} {"train_loss": -5.648626327514648, "global_step": 40566, "epoch": 965} {"train_loss": -5.787365436553955, "global_step": 40567, "epoch": 965} {"train_loss": -5.645091533660889, "global_step": 40568, "epoch": 965} {"train_loss": -5.663652420043945, "global_step": 40569, "epoch": 965} {"train_loss": -5.616083145141602, "global_step": 40570, "epoch": 965} {"train_loss": -5.643253803253174, "global_step": 40571, "epoch": 965, "val_loss": 62093.39453125} {"train_loss": -5.495179653167725, "global_step": 40572, "epoch": 966} {"train_loss": -5.683413982391357, "global_step": 40573, "epoch": 966} {"train_loss": -5.553098678588867, "global_step": 40574, "epoch": 966} {"train_loss": -5.539494514465332, "global_step": 40575, "epoch": 966} {"train_loss": -5.53462028503418, "global_step": 40576, "epoch": 966} {"train_loss": -5.652322769165039, "global_step": 40577, "epoch": 966} {"train_loss": -5.74070930480957, "global_step": 40578, "epoch": 966} {"train_loss": -5.7297468185424805, "global_step": 40579, "epoch": 966} {"train_loss": -5.684688568115234, "global_step": 40580, "epoch": 966} {"train_loss": -5.6661553382873535, "global_step": 40581, "epoch": 966} {"train_loss": -5.588706970214844, "global_step": 40582, "epoch": 966} {"train_loss": -5.525835037231445, "global_step": 40583, "epoch": 966} {"train_loss": -5.79360818862915, "global_step": 40584, "epoch": 966} {"train_loss": -5.693532466888428, "global_step": 40585, "epoch": 966} {"train_loss": -5.647860527038574, "global_step": 40586, "epoch": 966} {"train_loss": -5.681546688079834, "global_step": 40587, "epoch": 966} {"train_loss": -5.6973371505737305, "global_step": 40588, "epoch": 966} {"train_loss": -5.550989151000977, "global_step": 40589, "epoch": 966} {"train_loss": -5.492788314819336, "global_step": 40590, "epoch": 966} {"train_loss": -5.631914138793945, "global_step": 40591, "epoch": 966} {"train_loss": -5.640692710876465, "global_step": 40592, "epoch": 966} {"train_loss": -5.584779262542725, "global_step": 40593, "epoch": 966} {"train_loss": -5.629100799560547, "global_step": 40594, "epoch": 966} {"train_loss": -5.616052150726318, "global_step": 40595, "epoch": 966} {"train_loss": -5.640038967132568, "global_step": 40596, "epoch": 966} {"train_loss": -5.700413703918457, "global_step": 40597, "epoch": 966} {"train_loss": -5.612272262573242, "global_step": 40598, "epoch": 966} {"train_loss": -5.60346794128418, "global_step": 40599, "epoch": 966} {"train_loss": -5.62945556640625, "global_step": 40600, "epoch": 966} {"train_loss": -5.707030296325684, "global_step": 40601, "epoch": 966} {"train_loss": -5.6527252197265625, "global_step": 40602, "epoch": 966} {"train_loss": -5.630977630615234, "global_step": 40603, "epoch": 966} {"train_loss": -5.569716453552246, "global_step": 40604, "epoch": 966} {"train_loss": -5.545066833496094, "global_step": 40605, "epoch": 966} {"train_loss": -5.6051106452941895, "global_step": 40606, "epoch": 966} {"train_loss": -5.619535446166992, "global_step": 40607, "epoch": 966} {"train_loss": -5.61617374420166, "global_step": 40608, "epoch": 966} {"train_loss": -5.64491081237793, "global_step": 40609, "epoch": 966} {"train_loss": -5.715958118438721, "global_step": 40610, "epoch": 966} {"train_loss": -5.635078430175781, "global_step": 40611, "epoch": 966} {"train_loss": -5.5302534103393555, "global_step": 40612, "epoch": 966} {"train_loss": -5.62772444316319, "global_step": 40613, "epoch": 966, "val_loss": 61755.23046875} {"train_loss": -5.710773468017578, "global_step": 40614, "epoch": 967} {"train_loss": -5.50468111038208, "global_step": 40615, "epoch": 967} {"train_loss": -5.770768165588379, "global_step": 40616, "epoch": 967} {"train_loss": -5.6453704833984375, "global_step": 40617, "epoch": 967} {"train_loss": -5.480074882507324, "global_step": 40618, "epoch": 967} {"train_loss": -5.6062164306640625, "global_step": 40619, "epoch": 967} {"train_loss": -5.623950004577637, "global_step": 40620, "epoch": 967} {"train_loss": -5.600951194763184, "global_step": 40621, "epoch": 967} {"train_loss": -5.472378730773926, "global_step": 40622, "epoch": 967} {"train_loss": -5.476108074188232, "global_step": 40623, "epoch": 967} {"train_loss": -5.636624813079834, "global_step": 40624, "epoch": 967} {"train_loss": -5.605683326721191, "global_step": 40625, "epoch": 967} {"train_loss": -5.621525764465332, "global_step": 40626, "epoch": 967} {"train_loss": -5.663027763366699, "global_step": 40627, "epoch": 967} {"train_loss": -5.613492965698242, "global_step": 40628, "epoch": 967} {"train_loss": -5.571598529815674, "global_step": 40629, "epoch": 967} {"train_loss": -5.621248245239258, "global_step": 40630, "epoch": 967} {"train_loss": -5.67474365234375, "global_step": 40631, "epoch": 967} {"train_loss": -5.61958122253418, "global_step": 40632, "epoch": 967} {"train_loss": -5.563192367553711, "global_step": 40633, "epoch": 967} {"train_loss": -5.6192827224731445, "global_step": 40634, "epoch": 967} {"train_loss": -5.606645584106445, "global_step": 40635, "epoch": 967} {"train_loss": -5.73898983001709, "global_step": 40636, "epoch": 967} {"train_loss": -5.6556501388549805, "global_step": 40637, "epoch": 967} {"train_loss": -5.656447410583496, "global_step": 40638, "epoch": 967} {"train_loss": -5.746028900146484, "global_step": 40639, "epoch": 967} {"train_loss": -5.616224765777588, "global_step": 40640, "epoch": 967} {"train_loss": -5.65997314453125, "global_step": 40641, "epoch": 967} {"train_loss": -5.649567604064941, "global_step": 40642, "epoch": 967} {"train_loss": -5.679324150085449, "global_step": 40643, "epoch": 967} {"train_loss": -5.614407539367676, "global_step": 40644, "epoch": 967} {"train_loss": -5.45119047164917, "global_step": 40645, "epoch": 967} {"train_loss": -5.722133636474609, "global_step": 40646, "epoch": 967} {"train_loss": -5.401916027069092, "global_step": 40647, "epoch": 967} {"train_loss": -5.718006134033203, "global_step": 40648, "epoch": 967} {"train_loss": -5.7242231369018555, "global_step": 40649, "epoch": 967} {"train_loss": -5.710000991821289, "global_step": 40650, "epoch": 967} {"train_loss": -5.621621131896973, "global_step": 40651, "epoch": 967} {"train_loss": -5.6492133140563965, "global_step": 40652, "epoch": 967} {"train_loss": -5.658514499664307, "global_step": 40653, "epoch": 967} {"train_loss": -5.626672744750977, "global_step": 40654, "epoch": 967} {"train_loss": -5.623635768890381, "global_step": 40655, "epoch": 967, "val_loss": 61832.94921875} {"train_loss": -5.575740814208984, "global_step": 40656, "epoch": 968} {"train_loss": -5.595861911773682, "global_step": 40657, "epoch": 968} {"train_loss": -5.640727996826172, "global_step": 40658, "epoch": 968} {"train_loss": -5.726155757904053, "global_step": 40659, "epoch": 968} {"train_loss": -5.660566329956055, "global_step": 40660, "epoch": 968} {"train_loss": -5.572890758514404, "global_step": 40661, "epoch": 968} {"train_loss": -5.756032943725586, "global_step": 40662, "epoch": 968} {"train_loss": -5.667036056518555, "global_step": 40663, "epoch": 968} {"train_loss": -5.612850189208984, "global_step": 40664, "epoch": 968} {"train_loss": -5.70637321472168, "global_step": 40665, "epoch": 968} {"train_loss": -5.506383895874023, "global_step": 40666, "epoch": 968} {"train_loss": -5.720310211181641, "global_step": 40667, "epoch": 968} {"train_loss": -5.620156764984131, "global_step": 40668, "epoch": 968} {"train_loss": -5.685385704040527, "global_step": 40669, "epoch": 968} {"train_loss": -5.577800273895264, "global_step": 40670, "epoch": 968} {"train_loss": -5.687192916870117, "global_step": 40671, "epoch": 968} {"train_loss": -5.609424591064453, "global_step": 40672, "epoch": 968} {"train_loss": -5.626204490661621, "global_step": 40673, "epoch": 968} {"train_loss": -5.506826400756836, "global_step": 40674, "epoch": 968} {"train_loss": -5.646624565124512, "global_step": 40675, "epoch": 968} {"train_loss": -5.610607624053955, "global_step": 40676, "epoch": 968} {"train_loss": -5.699868202209473, "global_step": 40677, "epoch": 968} {"train_loss": -5.673752784729004, "global_step": 40678, "epoch": 968} {"train_loss": -5.647576332092285, "global_step": 40679, "epoch": 968} {"train_loss": -5.748873710632324, "global_step": 40680, "epoch": 968} {"train_loss": -5.588768005371094, "global_step": 40681, "epoch": 968} {"train_loss": -5.69873046875, "global_step": 40682, "epoch": 968} {"train_loss": -5.713801383972168, "global_step": 40683, "epoch": 968} {"train_loss": -5.617799758911133, "global_step": 40684, "epoch": 968} {"train_loss": -5.665366172790527, "global_step": 40685, "epoch": 968} {"train_loss": -5.551833152770996, "global_step": 40686, "epoch": 968} {"train_loss": -5.598689079284668, "global_step": 40687, "epoch": 968} {"train_loss": -5.569238662719727, "global_step": 40688, "epoch": 968} {"train_loss": -5.7101898193359375, "global_step": 40689, "epoch": 968} {"train_loss": -5.567612648010254, "global_step": 40690, "epoch": 968} {"train_loss": -5.57968807220459, "global_step": 40691, "epoch": 968} {"train_loss": -5.597100257873535, "global_step": 40692, "epoch": 968} {"train_loss": -5.354816913604736, "global_step": 40693, "epoch": 968} {"train_loss": -5.700885772705078, "global_step": 40694, "epoch": 968} {"train_loss": -5.731527328491211, "global_step": 40695, "epoch": 968} {"train_loss": -5.613320350646973, "global_step": 40696, "epoch": 968} {"train_loss": -5.633941377912249, "global_step": 40697, "epoch": 968, "val_loss": 62202.734375} {"train_loss": -5.622504234313965, "global_step": 40698, "epoch": 969} {"train_loss": -5.556410789489746, "global_step": 40699, "epoch": 969} {"train_loss": -5.685859203338623, "global_step": 40700, "epoch": 969} {"train_loss": -5.623371601104736, "global_step": 40701, "epoch": 969} {"train_loss": -5.539844512939453, "global_step": 40702, "epoch": 969} {"train_loss": -5.548882961273193, "global_step": 40703, "epoch": 969} {"train_loss": -5.622026443481445, "global_step": 40704, "epoch": 969} {"train_loss": -5.739040374755859, "global_step": 40705, "epoch": 969} {"train_loss": -5.606577396392822, "global_step": 40706, "epoch": 969} {"train_loss": -5.651285171508789, "global_step": 40707, "epoch": 969} {"train_loss": -5.6368207931518555, "global_step": 40708, "epoch": 969} {"train_loss": -5.679037094116211, "global_step": 40709, "epoch": 969} {"train_loss": -5.633683681488037, "global_step": 40710, "epoch": 969} {"train_loss": -5.758173942565918, "global_step": 40711, "epoch": 969} {"train_loss": -5.642885208129883, "global_step": 40712, "epoch": 969} {"train_loss": -5.7422285079956055, "global_step": 40713, "epoch": 969} {"train_loss": -5.730085849761963, "global_step": 40714, "epoch": 969} {"train_loss": -5.669477462768555, "global_step": 40715, "epoch": 969} {"train_loss": -5.6360039710998535, "global_step": 40716, "epoch": 969} {"train_loss": -5.651559352874756, "global_step": 40717, "epoch": 969} {"train_loss": -5.640982627868652, "global_step": 40718, "epoch": 969} {"train_loss": -5.8020920753479, "global_step": 40719, "epoch": 969} {"train_loss": -5.686198711395264, "global_step": 40720, "epoch": 969} {"train_loss": -5.668959140777588, "global_step": 40721, "epoch": 969} {"train_loss": -5.569108963012695, "global_step": 40722, "epoch": 969} {"train_loss": -5.624610900878906, "global_step": 40723, "epoch": 969} {"train_loss": -5.6594038009643555, "global_step": 40724, "epoch": 969} {"train_loss": -5.6213788986206055, "global_step": 40725, "epoch": 969} {"train_loss": -5.744197845458984, "global_step": 40726, "epoch": 969} {"train_loss": -5.619037628173828, "global_step": 40727, "epoch": 969} {"train_loss": -5.737135887145996, "global_step": 40728, "epoch": 969} {"train_loss": -5.751416206359863, "global_step": 40729, "epoch": 969} {"train_loss": -5.611838340759277, "global_step": 40730, "epoch": 969} {"train_loss": -5.67868709564209, "global_step": 40731, "epoch": 969} {"train_loss": -5.718240737915039, "global_step": 40732, "epoch": 969} {"train_loss": -5.577752113342285, "global_step": 40733, "epoch": 969} {"train_loss": -5.536306381225586, "global_step": 40734, "epoch": 969} {"train_loss": -5.626305103302002, "global_step": 40735, "epoch": 969} {"train_loss": -5.496427536010742, "global_step": 40736, "epoch": 969} {"train_loss": -5.58789587020874, "global_step": 40737, "epoch": 969} {"train_loss": -5.688335418701172, "global_step": 40738, "epoch": 969} {"train_loss": -5.646886836914789, "global_step": 40739, "epoch": 969, "val_loss": 62013.01953125} {"train_loss": -5.686407089233398, "global_step": 40740, "epoch": 970} {"train_loss": -5.713493824005127, "global_step": 40741, "epoch": 970} {"train_loss": -5.625544548034668, "global_step": 40742, "epoch": 970} {"train_loss": -5.5411224365234375, "global_step": 40743, "epoch": 970} {"train_loss": -5.622817039489746, "global_step": 40744, "epoch": 970} {"train_loss": -5.653079509735107, "global_step": 40745, "epoch": 970} {"train_loss": -5.662642002105713, "global_step": 40746, "epoch": 970} {"train_loss": -5.683266639709473, "global_step": 40747, "epoch": 970} {"train_loss": -5.610933780670166, "global_step": 40748, "epoch": 970} {"train_loss": -5.691490173339844, "global_step": 40749, "epoch": 970} {"train_loss": -5.728574752807617, "global_step": 40750, "epoch": 970} {"train_loss": -5.548379898071289, "global_step": 40751, "epoch": 970} {"train_loss": -5.637308120727539, "global_step": 40752, "epoch": 970} {"train_loss": -5.705198287963867, "global_step": 40753, "epoch": 970} {"train_loss": -5.660432815551758, "global_step": 40754, "epoch": 970} {"train_loss": -5.6773247718811035, "global_step": 40755, "epoch": 970} {"train_loss": -5.639072418212891, "global_step": 40756, "epoch": 970} {"train_loss": -5.716182708740234, "global_step": 40757, "epoch": 970} {"train_loss": -5.6422271728515625, "global_step": 40758, "epoch": 970} {"train_loss": -5.590858459472656, "global_step": 40759, "epoch": 970} {"train_loss": -5.572169303894043, "global_step": 40760, "epoch": 970} {"train_loss": -5.673357963562012, "global_step": 40761, "epoch": 970} {"train_loss": -5.697949409484863, "global_step": 40762, "epoch": 970} {"train_loss": -5.58400821685791, "global_step": 40763, "epoch": 970} {"train_loss": -5.555730819702148, "global_step": 40764, "epoch": 970} {"train_loss": -5.459789752960205, "global_step": 40765, "epoch": 970} {"train_loss": -5.608346939086914, "global_step": 40766, "epoch": 970} {"train_loss": -5.655261039733887, "global_step": 40767, "epoch": 970} {"train_loss": -5.41634464263916, "global_step": 40768, "epoch": 970} {"train_loss": -5.535562038421631, "global_step": 40769, "epoch": 970} {"train_loss": -5.650424957275391, "global_step": 40770, "epoch": 970} {"train_loss": -5.404832363128662, "global_step": 40771, "epoch": 970} {"train_loss": -5.633714199066162, "global_step": 40772, "epoch": 970} {"train_loss": -5.410299777984619, "global_step": 40773, "epoch": 970} {"train_loss": -5.456431865692139, "global_step": 40774, "epoch": 970} {"train_loss": -5.643102645874023, "global_step": 40775, "epoch": 970} {"train_loss": -5.662168979644775, "global_step": 40776, "epoch": 970} {"train_loss": -5.6181640625, "global_step": 40777, "epoch": 970} {"train_loss": -5.693704128265381, "global_step": 40778, "epoch": 970} {"train_loss": -5.557673454284668, "global_step": 40779, "epoch": 970} {"train_loss": -5.666337966918945, "global_step": 40780, "epoch": 970} {"train_loss": -5.615616151264736, "global_step": 40781, "epoch": 970, "val_loss": 61978.5078125} {"train_loss": -5.5892181396484375, "global_step": 40782, "epoch": 971} {"train_loss": -5.691485404968262, "global_step": 40783, "epoch": 971} {"train_loss": -5.692623138427734, "global_step": 40784, "epoch": 971} {"train_loss": -5.6940131187438965, "global_step": 40785, "epoch": 971} {"train_loss": -5.56557559967041, "global_step": 40786, "epoch": 971} {"train_loss": -5.635168075561523, "global_step": 40787, "epoch": 971} {"train_loss": -5.676700592041016, "global_step": 40788, "epoch": 971} {"train_loss": -5.610237121582031, "global_step": 40789, "epoch": 971} {"train_loss": -5.623082160949707, "global_step": 40790, "epoch": 971} {"train_loss": -5.69811487197876, "global_step": 40791, "epoch": 971} {"train_loss": -5.704070091247559, "global_step": 40792, "epoch": 971} {"train_loss": -5.555788516998291, "global_step": 40793, "epoch": 971} {"train_loss": -5.643446922302246, "global_step": 40794, "epoch": 971} {"train_loss": -5.671082019805908, "global_step": 40795, "epoch": 971} {"train_loss": -5.623548984527588, "global_step": 40796, "epoch": 971} {"train_loss": -5.692769527435303, "global_step": 40797, "epoch": 971} {"train_loss": -5.603612899780273, "global_step": 40798, "epoch": 971} {"train_loss": -5.737506866455078, "global_step": 40799, "epoch": 971} {"train_loss": -5.48472785949707, "global_step": 40800, "epoch": 971} {"train_loss": -5.545245170593262, "global_step": 40801, "epoch": 971} {"train_loss": -5.555202007293701, "global_step": 40802, "epoch": 971} {"train_loss": -5.833239555358887, "global_step": 40803, "epoch": 971} {"train_loss": -5.678160667419434, "global_step": 40804, "epoch": 971} {"train_loss": -5.728107452392578, "global_step": 40805, "epoch": 971} {"train_loss": -5.704993724822998, "global_step": 40806, "epoch": 971} {"train_loss": -5.75118350982666, "global_step": 40807, "epoch": 971} {"train_loss": -5.7571282386779785, "global_step": 40808, "epoch": 971} {"train_loss": -5.640530109405518, "global_step": 40809, "epoch": 971} {"train_loss": -5.671487331390381, "global_step": 40810, "epoch": 971} {"train_loss": -5.5437211990356445, "global_step": 40811, "epoch": 971} {"train_loss": -5.6206583976745605, "global_step": 40812, "epoch": 971} {"train_loss": -5.595466613769531, "global_step": 40813, "epoch": 971} {"train_loss": -5.61020565032959, "global_step": 40814, "epoch": 971} {"train_loss": -5.600197792053223, "global_step": 40815, "epoch": 971} {"train_loss": -5.559676647186279, "global_step": 40816, "epoch": 971} {"train_loss": -5.808628082275391, "global_step": 40817, "epoch": 971} {"train_loss": -5.598626136779785, "global_step": 40818, "epoch": 971} {"train_loss": -5.624354839324951, "global_step": 40819, "epoch": 971} {"train_loss": -5.652946472167969, "global_step": 40820, "epoch": 971} {"train_loss": -5.571224212646484, "global_step": 40821, "epoch": 971} {"train_loss": -5.603826999664307, "global_step": 40822, "epoch": 971} {"train_loss": -5.6477261157262895, "global_step": 40823, "epoch": 971, "val_loss": 61938.58203125} {"train_loss": -5.7016143798828125, "global_step": 40824, "epoch": 972} {"train_loss": -5.691691875457764, "global_step": 40825, "epoch": 972} {"train_loss": -5.596440315246582, "global_step": 40826, "epoch": 972} {"train_loss": -5.668712139129639, "global_step": 40827, "epoch": 972} {"train_loss": -5.586802005767822, "global_step": 40828, "epoch": 972} {"train_loss": -5.678563117980957, "global_step": 40829, "epoch": 972} {"train_loss": -5.662327289581299, "global_step": 40830, "epoch": 972} {"train_loss": -5.751757621765137, "global_step": 40831, "epoch": 972} {"train_loss": -5.582368850708008, "global_step": 40832, "epoch": 972} {"train_loss": -5.6099934577941895, "global_step": 40833, "epoch": 972} {"train_loss": -5.640324115753174, "global_step": 40834, "epoch": 972} {"train_loss": -5.806351661682129, "global_step": 40835, "epoch": 972} {"train_loss": -5.5933356285095215, "global_step": 40836, "epoch": 972} {"train_loss": -5.656577110290527, "global_step": 40837, "epoch": 972} {"train_loss": -5.555225849151611, "global_step": 40838, "epoch": 972} {"train_loss": -5.781686305999756, "global_step": 40839, "epoch": 972} {"train_loss": -5.687554836273193, "global_step": 40840, "epoch": 972} {"train_loss": -5.670345306396484, "global_step": 40841, "epoch": 972} {"train_loss": -5.768080711364746, "global_step": 40842, "epoch": 972} {"train_loss": -5.602494239807129, "global_step": 40843, "epoch": 972} {"train_loss": -5.594513893127441, "global_step": 40844, "epoch": 972} {"train_loss": -5.770685195922852, "global_step": 40845, "epoch": 972} {"train_loss": -5.603731155395508, "global_step": 40846, "epoch": 972} {"train_loss": -5.788067817687988, "global_step": 40847, "epoch": 972} {"train_loss": -5.763747215270996, "global_step": 40848, "epoch": 972} {"train_loss": -5.743655204772949, "global_step": 40849, "epoch": 972} {"train_loss": -5.612072467803955, "global_step": 40850, "epoch": 972} {"train_loss": -5.593254089355469, "global_step": 40851, "epoch": 972} {"train_loss": -5.628229141235352, "global_step": 40852, "epoch": 972} {"train_loss": -5.794736862182617, "global_step": 40853, "epoch": 972} {"train_loss": -5.6835479736328125, "global_step": 40854, "epoch": 972} {"train_loss": -5.7407379150390625, "global_step": 40855, "epoch": 972} {"train_loss": -5.749114513397217, "global_step": 40856, "epoch": 972} {"train_loss": -5.686920166015625, "global_step": 40857, "epoch": 972} {"train_loss": -5.725151062011719, "global_step": 40858, "epoch": 972} {"train_loss": -5.514930725097656, "global_step": 40859, "epoch": 972} {"train_loss": -5.618031978607178, "global_step": 40860, "epoch": 972} {"train_loss": -5.672495365142822, "global_step": 40861, "epoch": 972} {"train_loss": -5.519962310791016, "global_step": 40862, "epoch": 972} {"train_loss": -5.605076313018799, "global_step": 40863, "epoch": 972} {"train_loss": -5.619051933288574, "global_step": 40864, "epoch": 972} {"train_loss": -5.6651038101741245, "global_step": 40865, "epoch": 972, "val_loss": 61834.74609375} {"train_loss": -5.604851722717285, "global_step": 40866, "epoch": 973} {"train_loss": -5.669580936431885, "global_step": 40867, "epoch": 973} {"train_loss": -5.73128604888916, "global_step": 40868, "epoch": 973} {"train_loss": -5.7298784255981445, "global_step": 40869, "epoch": 973} {"train_loss": -5.666254997253418, "global_step": 40870, "epoch": 973} {"train_loss": -5.702949523925781, "global_step": 40871, "epoch": 973} {"train_loss": -5.658265113830566, "global_step": 40872, "epoch": 973} {"train_loss": -5.649473667144775, "global_step": 40873, "epoch": 973} {"train_loss": -5.681983947753906, "global_step": 40874, "epoch": 973} {"train_loss": -5.803827285766602, "global_step": 40875, "epoch": 973} {"train_loss": -5.639543056488037, "global_step": 40876, "epoch": 973} {"train_loss": -5.626978874206543, "global_step": 40877, "epoch": 973} {"train_loss": -5.684056758880615, "global_step": 40878, "epoch": 973} {"train_loss": -5.577529430389404, "global_step": 40879, "epoch": 973} {"train_loss": -5.619582176208496, "global_step": 40880, "epoch": 973} {"train_loss": -5.62028694152832, "global_step": 40881, "epoch": 973} {"train_loss": -5.629579544067383, "global_step": 40882, "epoch": 973} {"train_loss": -5.806281089782715, "global_step": 40883, "epoch": 973} {"train_loss": -5.640858173370361, "global_step": 40884, "epoch": 973} {"train_loss": -5.633520126342773, "global_step": 40885, "epoch": 973} {"train_loss": -5.568613052368164, "global_step": 40886, "epoch": 973} {"train_loss": -5.691543102264404, "global_step": 40887, "epoch": 973} {"train_loss": -5.684769630432129, "global_step": 40888, "epoch": 973} {"train_loss": -5.690802574157715, "global_step": 40889, "epoch": 973} {"train_loss": -5.6287736892700195, "global_step": 40890, "epoch": 973} {"train_loss": -5.712709426879883, "global_step": 40891, "epoch": 973} {"train_loss": -5.668930530548096, "global_step": 40892, "epoch": 973} {"train_loss": -5.666224479675293, "global_step": 40893, "epoch": 973} {"train_loss": -5.708364486694336, "global_step": 40894, "epoch": 973} {"train_loss": -5.843419551849365, "global_step": 40895, "epoch": 973} {"train_loss": -5.654743194580078, "global_step": 40896, "epoch": 973} {"train_loss": -5.72068977355957, "global_step": 40897, "epoch": 973} {"train_loss": -5.666701316833496, "global_step": 40898, "epoch": 973} {"train_loss": -5.685737133026123, "global_step": 40899, "epoch": 973} {"train_loss": -5.7091169357299805, "global_step": 40900, "epoch": 973} {"train_loss": -5.667548179626465, "global_step": 40901, "epoch": 973} {"train_loss": -5.516084671020508, "global_step": 40902, "epoch": 973} {"train_loss": -5.6242780685424805, "global_step": 40903, "epoch": 973} {"train_loss": -5.626934051513672, "global_step": 40904, "epoch": 973} {"train_loss": -5.370943069458008, "global_step": 40905, "epoch": 973} {"train_loss": -5.663627624511719, "global_step": 40906, "epoch": 973} {"train_loss": -5.660805111839657, "global_step": 40907, "epoch": 973, "val_loss": 62483.8046875} {"train_loss": -5.52575159072876, "global_step": 40908, "epoch": 974} {"train_loss": -5.594318866729736, "global_step": 40909, "epoch": 974} {"train_loss": -5.72843074798584, "global_step": 40910, "epoch": 974} {"train_loss": -5.465610980987549, "global_step": 40911, "epoch": 974} {"train_loss": -5.725113391876221, "global_step": 40912, "epoch": 974} {"train_loss": -5.449635982513428, "global_step": 40913, "epoch": 974} {"train_loss": -5.568947792053223, "global_step": 40914, "epoch": 974} {"train_loss": -5.515163421630859, "global_step": 40915, "epoch": 974} {"train_loss": -5.495697021484375, "global_step": 40916, "epoch": 974} {"train_loss": -5.673513889312744, "global_step": 40917, "epoch": 974} {"train_loss": -5.649156093597412, "global_step": 40918, "epoch": 974} {"train_loss": -5.613173007965088, "global_step": 40919, "epoch": 974} {"train_loss": -5.599104881286621, "global_step": 40920, "epoch": 974} {"train_loss": -5.561769485473633, "global_step": 40921, "epoch": 974} {"train_loss": -5.652255058288574, "global_step": 40922, "epoch": 974} {"train_loss": -5.6701226234436035, "global_step": 40923, "epoch": 974} {"train_loss": -5.667937755584717, "global_step": 40924, "epoch": 974} {"train_loss": -5.773395538330078, "global_step": 40925, "epoch": 974} {"train_loss": -5.801730632781982, "global_step": 40926, "epoch": 974} {"train_loss": -5.672761917114258, "global_step": 40927, "epoch": 974} {"train_loss": -5.670244216918945, "global_step": 40928, "epoch": 974} {"train_loss": -5.66714334487915, "global_step": 40929, "epoch": 974} {"train_loss": -5.621318340301514, "global_step": 40930, "epoch": 974} {"train_loss": -5.659367084503174, "global_step": 40931, "epoch": 974} {"train_loss": -5.643640518188477, "global_step": 40932, "epoch": 974} {"train_loss": -5.681914806365967, "global_step": 40933, "epoch": 974} {"train_loss": -5.69171142578125, "global_step": 40934, "epoch": 974} {"train_loss": -5.576253890991211, "global_step": 40935, "epoch": 974} {"train_loss": -5.57079553604126, "global_step": 40936, "epoch": 974} {"train_loss": -5.667978286743164, "global_step": 40937, "epoch": 974} {"train_loss": -5.720139026641846, "global_step": 40938, "epoch": 974} {"train_loss": -5.722442626953125, "global_step": 40939, "epoch": 974} {"train_loss": -5.705651760101318, "global_step": 40940, "epoch": 974} {"train_loss": -5.615750789642334, "global_step": 40941, "epoch": 974} {"train_loss": -5.6453022956848145, "global_step": 40942, "epoch": 974} {"train_loss": -5.597524642944336, "global_step": 40943, "epoch": 974} {"train_loss": -5.728179931640625, "global_step": 40944, "epoch": 974} {"train_loss": -5.629299163818359, "global_step": 40945, "epoch": 974} {"train_loss": -5.617033004760742, "global_step": 40946, "epoch": 974} {"train_loss": -5.7000603675842285, "global_step": 40947, "epoch": 974} {"train_loss": -5.661133766174316, "global_step": 40948, "epoch": 974} {"train_loss": -5.641756205331712, "global_step": 40949, "epoch": 974, "val_loss": 61851.62109375} {"train_loss": -5.712389945983887, "global_step": 40950, "epoch": 975} {"train_loss": -5.662881851196289, "global_step": 40951, "epoch": 975} {"train_loss": -5.742359638214111, "global_step": 40952, "epoch": 975} {"train_loss": -5.5719475746154785, "global_step": 40953, "epoch": 975} {"train_loss": -5.624765872955322, "global_step": 40954, "epoch": 975} {"train_loss": -5.781526565551758, "global_step": 40955, "epoch": 975} {"train_loss": -5.600320816040039, "global_step": 40956, "epoch": 975} {"train_loss": -5.718891620635986, "global_step": 40957, "epoch": 975} {"train_loss": -5.668015003204346, "global_step": 40958, "epoch": 975} {"train_loss": -5.701531410217285, "global_step": 40959, "epoch": 975} {"train_loss": -5.676977157592773, "global_step": 40960, "epoch": 975} {"train_loss": -5.625797271728516, "global_step": 40961, "epoch": 975} {"train_loss": -5.606166362762451, "global_step": 40962, "epoch": 975} {"train_loss": -5.690352439880371, "global_step": 40963, "epoch": 975} {"train_loss": -5.822418689727783, "global_step": 40964, "epoch": 975} {"train_loss": -5.725950241088867, "global_step": 40965, "epoch": 975} {"train_loss": -5.72816801071167, "global_step": 40966, "epoch": 975} {"train_loss": -5.624300003051758, "global_step": 40967, "epoch": 975} {"train_loss": -5.647122383117676, "global_step": 40968, "epoch": 975} {"train_loss": -5.602907657623291, "global_step": 40969, "epoch": 975} {"train_loss": -5.661957740783691, "global_step": 40970, "epoch": 975} {"train_loss": -5.663064002990723, "global_step": 40971, "epoch": 975} {"train_loss": -5.670437335968018, "global_step": 40972, "epoch": 975} {"train_loss": -5.651747226715088, "global_step": 40973, "epoch": 975} {"train_loss": -5.62520170211792, "global_step": 40974, "epoch": 975} {"train_loss": -5.606148719787598, "global_step": 40975, "epoch": 975} {"train_loss": -5.642720699310303, "global_step": 40976, "epoch": 975} {"train_loss": -5.747626781463623, "global_step": 40977, "epoch": 975} {"train_loss": -5.6928181648254395, "global_step": 40978, "epoch": 975} {"train_loss": -5.729554653167725, "global_step": 40979, "epoch": 975} {"train_loss": -5.751326560974121, "global_step": 40980, "epoch": 975} {"train_loss": -5.721892356872559, "global_step": 40981, "epoch": 975} {"train_loss": -5.605737209320068, "global_step": 40982, "epoch": 975} {"train_loss": -5.707849502563477, "global_step": 40983, "epoch": 975} {"train_loss": -5.787145137786865, "global_step": 40984, "epoch": 975} {"train_loss": -5.739559650421143, "global_step": 40985, "epoch": 975} {"train_loss": -5.550246238708496, "global_step": 40986, "epoch": 975} {"train_loss": -5.749794960021973, "global_step": 40987, "epoch": 975} {"train_loss": -5.557283878326416, "global_step": 40988, "epoch": 975} {"train_loss": -5.672979354858398, "global_step": 40989, "epoch": 975} {"train_loss": -5.645555019378662, "global_step": 40990, "epoch": 975} {"train_loss": -5.6742774077824185, "global_step": 40991, "epoch": 975, "val_loss": 62149.6953125} {"train_loss": -5.629603385925293, "global_step": 40992, "epoch": 976} {"train_loss": -5.700631141662598, "global_step": 40993, "epoch": 976} {"train_loss": -5.684295177459717, "global_step": 40994, "epoch": 976} {"train_loss": -5.639636993408203, "global_step": 40995, "epoch": 976} {"train_loss": -5.6460723876953125, "global_step": 40996, "epoch": 976} {"train_loss": -5.712899208068848, "global_step": 40997, "epoch": 976} {"train_loss": -5.569901466369629, "global_step": 40998, "epoch": 976} {"train_loss": -5.721803665161133, "global_step": 40999, "epoch": 976} {"train_loss": -5.610156059265137, "global_step": 41000, "epoch": 976} {"train_loss": -5.5516157150268555, "global_step": 41001, "epoch": 976} {"train_loss": -5.633433818817139, "global_step": 41002, "epoch": 976} {"train_loss": -5.665473937988281, "global_step": 41003, "epoch": 976} {"train_loss": -5.551163673400879, "global_step": 41004, "epoch": 976} {"train_loss": -5.651790618896484, "global_step": 41005, "epoch": 976} {"train_loss": -5.651690483093262, "global_step": 41006, "epoch": 976} {"train_loss": -5.575825214385986, "global_step": 41007, "epoch": 976} {"train_loss": -5.725683212280273, "global_step": 41008, "epoch": 976} {"train_loss": -5.595707416534424, "global_step": 41009, "epoch": 976} {"train_loss": -5.635673522949219, "global_step": 41010, "epoch": 976} {"train_loss": -5.6066694259643555, "global_step": 41011, "epoch": 976} {"train_loss": -5.555024147033691, "global_step": 41012, "epoch": 976} {"train_loss": -5.608842372894287, "global_step": 41013, "epoch": 976} {"train_loss": -5.619002342224121, "global_step": 41014, "epoch": 976} {"train_loss": -5.525458335876465, "global_step": 41015, "epoch": 976} {"train_loss": -5.623717308044434, "global_step": 41016, "epoch": 976} {"train_loss": -5.559713363647461, "global_step": 41017, "epoch": 976} {"train_loss": -5.690106391906738, "global_step": 41018, "epoch": 976} {"train_loss": -5.546423435211182, "global_step": 41019, "epoch": 976} {"train_loss": -5.638815879821777, "global_step": 41020, "epoch": 976} {"train_loss": -5.621967315673828, "global_step": 41021, "epoch": 976} {"train_loss": -5.536428451538086, "global_step": 41022, "epoch": 976} {"train_loss": -5.686102867126465, "global_step": 41023, "epoch": 976} {"train_loss": -5.661725997924805, "global_step": 41024, "epoch": 976} {"train_loss": -5.646327495574951, "global_step": 41025, "epoch": 976} {"train_loss": -5.688682556152344, "global_step": 41026, "epoch": 976} {"train_loss": -5.757653713226318, "global_step": 41027, "epoch": 976} {"train_loss": -5.767483711242676, "global_step": 41028, "epoch": 976} {"train_loss": -5.614851951599121, "global_step": 41029, "epoch": 976} {"train_loss": -5.70747184753418, "global_step": 41030, "epoch": 976} {"train_loss": -5.680121421813965, "global_step": 41031, "epoch": 976} {"train_loss": -5.5668134689331055, "global_step": 41032, "epoch": 976} {"train_loss": -5.637095735186622, "global_step": 41033, "epoch": 976, "val_loss": 61994.296875} {"train_loss": -5.703312873840332, "global_step": 41034, "epoch": 977} {"train_loss": -5.765505313873291, "global_step": 41035, "epoch": 977} {"train_loss": -5.65848445892334, "global_step": 41036, "epoch": 977} {"train_loss": -5.733539581298828, "global_step": 41037, "epoch": 977} {"train_loss": -5.735109806060791, "global_step": 41038, "epoch": 977} {"train_loss": -5.612647533416748, "global_step": 41039, "epoch": 977} {"train_loss": -5.555036544799805, "global_step": 41040, "epoch": 977} {"train_loss": -5.680997848510742, "global_step": 41041, "epoch": 977} {"train_loss": -5.878779888153076, "global_step": 41042, "epoch": 977} {"train_loss": -5.508370399475098, "global_step": 41043, "epoch": 977} {"train_loss": -5.462608337402344, "global_step": 41044, "epoch": 977} {"train_loss": -5.723938941955566, "global_step": 41045, "epoch": 977} {"train_loss": -5.509232997894287, "global_step": 41046, "epoch": 977} {"train_loss": -5.639944076538086, "global_step": 41047, "epoch": 977} {"train_loss": -5.735241889953613, "global_step": 41048, "epoch": 977} {"train_loss": -5.575616836547852, "global_step": 41049, "epoch": 977} {"train_loss": -5.631497383117676, "global_step": 41050, "epoch": 977} {"train_loss": -5.756837368011475, "global_step": 41051, "epoch": 977} {"train_loss": -5.657527923583984, "global_step": 41052, "epoch": 977} {"train_loss": -5.605350017547607, "global_step": 41053, "epoch": 977} {"train_loss": -5.682094097137451, "global_step": 41054, "epoch": 977} {"train_loss": -5.54310941696167, "global_step": 41055, "epoch": 977} {"train_loss": -5.620349884033203, "global_step": 41056, "epoch": 977} {"train_loss": -5.548826217651367, "global_step": 41057, "epoch": 977} {"train_loss": -5.643444061279297, "global_step": 41058, "epoch": 977} {"train_loss": -5.645989418029785, "global_step": 41059, "epoch": 977} {"train_loss": -5.731328010559082, "global_step": 41060, "epoch": 977} {"train_loss": -5.59737491607666, "global_step": 41061, "epoch": 977} {"train_loss": -5.695724010467529, "global_step": 41062, "epoch": 977} {"train_loss": -5.620632171630859, "global_step": 41063, "epoch": 977} {"train_loss": -5.599835395812988, "global_step": 41064, "epoch": 977} {"train_loss": -5.70031213760376, "global_step": 41065, "epoch": 977} {"train_loss": -5.651030540466309, "global_step": 41066, "epoch": 977} {"train_loss": -5.535225868225098, "global_step": 41067, "epoch": 977} {"train_loss": -5.638053894042969, "global_step": 41068, "epoch": 977} {"train_loss": -5.492307662963867, "global_step": 41069, "epoch": 977} {"train_loss": -5.584173679351807, "global_step": 41070, "epoch": 977} {"train_loss": -5.491847038269043, "global_step": 41071, "epoch": 977} {"train_loss": -5.465902328491211, "global_step": 41072, "epoch": 977} {"train_loss": -5.732481956481934, "global_step": 41073, "epoch": 977} {"train_loss": -5.67758846282959, "global_step": 41074, "epoch": 977} {"train_loss": -5.6341109957013815, "global_step": 41075, "epoch": 977, "val_loss": 61493.59765625} {"train_loss": -5.725766658782959, "global_step": 41076, "epoch": 978} {"train_loss": -5.658712863922119, "global_step": 41077, "epoch": 978} {"train_loss": -5.487551689147949, "global_step": 41078, "epoch": 978} {"train_loss": -5.73239278793335, "global_step": 41079, "epoch": 978} {"train_loss": -5.7891435623168945, "global_step": 41080, "epoch": 978} {"train_loss": -5.6462297439575195, "global_step": 41081, "epoch": 978} {"train_loss": -5.646308898925781, "global_step": 41082, "epoch": 978} {"train_loss": -5.706605911254883, "global_step": 41083, "epoch": 978} {"train_loss": -5.557281494140625, "global_step": 41084, "epoch": 978} {"train_loss": -5.661789894104004, "global_step": 41085, "epoch": 978} {"train_loss": -5.678544998168945, "global_step": 41086, "epoch": 978} {"train_loss": -5.66379451751709, "global_step": 41087, "epoch": 978} {"train_loss": -5.550933361053467, "global_step": 41088, "epoch": 978} {"train_loss": -5.549111366271973, "global_step": 41089, "epoch": 978} {"train_loss": -5.647130966186523, "global_step": 41090, "epoch": 978} {"train_loss": -5.589839458465576, "global_step": 41091, "epoch": 978} {"train_loss": -5.679095268249512, "global_step": 41092, "epoch": 978} {"train_loss": -5.685245037078857, "global_step": 41093, "epoch": 978} {"train_loss": -5.562334060668945, "global_step": 41094, "epoch": 978} {"train_loss": -5.585256576538086, "global_step": 41095, "epoch": 978} {"train_loss": -5.710964202880859, "global_step": 41096, "epoch": 978} {"train_loss": -5.528007507324219, "global_step": 41097, "epoch": 978} {"train_loss": -5.754932403564453, "global_step": 41098, "epoch": 978} {"train_loss": -5.573770046234131, "global_step": 41099, "epoch": 978} {"train_loss": -5.643807411193848, "global_step": 41100, "epoch": 978} {"train_loss": -5.608283042907715, "global_step": 41101, "epoch": 978} {"train_loss": -5.635937690734863, "global_step": 41102, "epoch": 978} {"train_loss": -5.745021820068359, "global_step": 41103, "epoch": 978} {"train_loss": -5.635963439941406, "global_step": 41104, "epoch": 978} {"train_loss": -5.676923751831055, "global_step": 41105, "epoch": 978} {"train_loss": -5.775111198425293, "global_step": 41106, "epoch": 978} {"train_loss": -5.658263206481934, "global_step": 41107, "epoch": 978} {"train_loss": -5.602518081665039, "global_step": 41108, "epoch": 978} {"train_loss": -5.73250675201416, "global_step": 41109, "epoch": 978} {"train_loss": -5.664827346801758, "global_step": 41110, "epoch": 978} {"train_loss": -5.626434803009033, "global_step": 41111, "epoch": 978} {"train_loss": -5.783186912536621, "global_step": 41112, "epoch": 978} {"train_loss": -5.692115306854248, "global_step": 41113, "epoch": 978} {"train_loss": -5.691643238067627, "global_step": 41114, "epoch": 978} {"train_loss": -5.59326171875, "global_step": 41115, "epoch": 978} {"train_loss": -5.61975622177124, "global_step": 41116, "epoch": 978} {"train_loss": -5.649321964808872, "global_step": 41117, "epoch": 978, "val_loss": 61693.06640625} {"train_loss": -5.592197895050049, "global_step": 41118, "epoch": 979} {"train_loss": -5.678295612335205, "global_step": 41119, "epoch": 979} {"train_loss": -5.512418746948242, "global_step": 41120, "epoch": 979} {"train_loss": -5.594001770019531, "global_step": 41121, "epoch": 979} {"train_loss": -5.521486282348633, "global_step": 41122, "epoch": 979} {"train_loss": -5.872101783752441, "global_step": 41123, "epoch": 979} {"train_loss": -5.693960189819336, "global_step": 41124, "epoch": 979} {"train_loss": -5.673131942749023, "global_step": 41125, "epoch": 979} {"train_loss": -5.698887825012207, "global_step": 41126, "epoch": 979} {"train_loss": -5.683049201965332, "global_step": 41127, "epoch": 979} {"train_loss": -5.604937553405762, "global_step": 41128, "epoch": 979} {"train_loss": -5.682784080505371, "global_step": 41129, "epoch": 979} {"train_loss": -5.784223556518555, "global_step": 41130, "epoch": 979} {"train_loss": -5.710568428039551, "global_step": 41131, "epoch": 979} {"train_loss": -5.618749141693115, "global_step": 41132, "epoch": 979} {"train_loss": -5.614571571350098, "global_step": 41133, "epoch": 979} {"train_loss": -5.676811218261719, "global_step": 41134, "epoch": 979} {"train_loss": -5.732333660125732, "global_step": 41135, "epoch": 979} {"train_loss": -5.659270763397217, "global_step": 41136, "epoch": 979} {"train_loss": -5.5961456298828125, "global_step": 41137, "epoch": 979} {"train_loss": -5.748782157897949, "global_step": 41138, "epoch": 979} {"train_loss": -5.7419352531433105, "global_step": 41139, "epoch": 979} {"train_loss": -5.677169322967529, "global_step": 41140, "epoch": 979} {"train_loss": -5.669861316680908, "global_step": 41141, "epoch": 979} {"train_loss": -5.698113441467285, "global_step": 41142, "epoch": 979} {"train_loss": -5.75284481048584, "global_step": 41143, "epoch": 979} {"train_loss": -5.697221755981445, "global_step": 41144, "epoch": 979} {"train_loss": -5.644496440887451, "global_step": 41145, "epoch": 979} {"train_loss": -5.604999542236328, "global_step": 41146, "epoch": 979} {"train_loss": -5.615007400512695, "global_step": 41147, "epoch": 979} {"train_loss": -5.703474521636963, "global_step": 41148, "epoch": 979} {"train_loss": -5.556269645690918, "global_step": 41149, "epoch": 979} {"train_loss": -5.7372145652771, "global_step": 41150, "epoch": 979} {"train_loss": -5.701401710510254, "global_step": 41151, "epoch": 979} {"train_loss": -5.573890209197998, "global_step": 41152, "epoch": 979} {"train_loss": -5.644749641418457, "global_step": 41153, "epoch": 979} {"train_loss": -5.636693477630615, "global_step": 41154, "epoch": 979} {"train_loss": -5.627692699432373, "global_step": 41155, "epoch": 979} {"train_loss": -5.659750938415527, "global_step": 41156, "epoch": 979} {"train_loss": -5.704197883605957, "global_step": 41157, "epoch": 979} {"train_loss": -5.754773139953613, "global_step": 41158, "epoch": 979} {"train_loss": -5.668512946083432, "global_step": 41159, "epoch": 979, "val_loss": 61758.95703125} {"train_loss": -5.678525924682617, "global_step": 41160, "epoch": 980} {"train_loss": -5.691588401794434, "global_step": 41161, "epoch": 980} {"train_loss": -5.769800186157227, "global_step": 41162, "epoch": 980} {"train_loss": -5.689231872558594, "global_step": 41163, "epoch": 980} {"train_loss": -5.600189208984375, "global_step": 41164, "epoch": 980} {"train_loss": -5.566465377807617, "global_step": 41165, "epoch": 980} {"train_loss": -5.642513275146484, "global_step": 41166, "epoch": 980} {"train_loss": -5.704006195068359, "global_step": 41167, "epoch": 980} {"train_loss": -5.657431602478027, "global_step": 41168, "epoch": 980} {"train_loss": -5.666548728942871, "global_step": 41169, "epoch": 980} {"train_loss": -5.615143775939941, "global_step": 41170, "epoch": 980} {"train_loss": -5.523867130279541, "global_step": 41171, "epoch": 980} {"train_loss": -5.5853424072265625, "global_step": 41172, "epoch": 980} {"train_loss": -5.78665828704834, "global_step": 41173, "epoch": 980} {"train_loss": -5.694984436035156, "global_step": 41174, "epoch": 980} {"train_loss": -5.726663112640381, "global_step": 41175, "epoch": 980} {"train_loss": -5.617550849914551, "global_step": 41176, "epoch": 980} {"train_loss": -5.666008949279785, "global_step": 41177, "epoch": 980} {"train_loss": -5.731050491333008, "global_step": 41178, "epoch": 980} {"train_loss": -5.736407279968262, "global_step": 41179, "epoch": 980} {"train_loss": -5.798051834106445, "global_step": 41180, "epoch": 980} {"train_loss": -5.7019829750061035, "global_step": 41181, "epoch": 980} {"train_loss": -5.759951591491699, "global_step": 41182, "epoch": 980} {"train_loss": -5.575023174285889, "global_step": 41183, "epoch": 980} {"train_loss": -5.5741472244262695, "global_step": 41184, "epoch": 980} {"train_loss": -5.649565696716309, "global_step": 41185, "epoch": 980} {"train_loss": -5.695758819580078, "global_step": 41186, "epoch": 980} {"train_loss": -5.622257232666016, "global_step": 41187, "epoch": 980} {"train_loss": -5.612563133239746, "global_step": 41188, "epoch": 980} {"train_loss": -5.60257625579834, "global_step": 41189, "epoch": 980} {"train_loss": -5.754411697387695, "global_step": 41190, "epoch": 980} {"train_loss": -5.692193984985352, "global_step": 41191, "epoch": 980} {"train_loss": -5.638184547424316, "global_step": 41192, "epoch": 980} {"train_loss": -5.6880269050598145, "global_step": 41193, "epoch": 980} {"train_loss": -5.779354095458984, "global_step": 41194, "epoch": 980} {"train_loss": -5.581342697143555, "global_step": 41195, "epoch": 980} {"train_loss": -5.563633918762207, "global_step": 41196, "epoch": 980} {"train_loss": -5.7124433517456055, "global_step": 41197, "epoch": 980} {"train_loss": -5.663736343383789, "global_step": 41198, "epoch": 980} {"train_loss": -5.67255973815918, "global_step": 41199, "epoch": 980} {"train_loss": -5.745634078979492, "global_step": 41200, "epoch": 980} {"train_loss": -5.670567921229771, "global_step": 41201, "epoch": 980, "val_loss": 61947.39453125} {"train_loss": -5.678617000579834, "global_step": 41202, "epoch": 981} {"train_loss": -5.838208198547363, "global_step": 41203, "epoch": 981} {"train_loss": -5.696674346923828, "global_step": 41204, "epoch": 981} {"train_loss": -5.506433010101318, "global_step": 41205, "epoch": 981} {"train_loss": -5.650751113891602, "global_step": 41206, "epoch": 981} {"train_loss": -5.633782863616943, "global_step": 41207, "epoch": 981} {"train_loss": -5.643505096435547, "global_step": 41208, "epoch": 981} {"train_loss": -5.762645721435547, "global_step": 41209, "epoch": 981} {"train_loss": -5.736625671386719, "global_step": 41210, "epoch": 981} {"train_loss": -5.644699573516846, "global_step": 41211, "epoch": 981} {"train_loss": -5.610630035400391, "global_step": 41212, "epoch": 981} {"train_loss": -5.652310848236084, "global_step": 41213, "epoch": 981} {"train_loss": -5.663275718688965, "global_step": 41214, "epoch": 981} {"train_loss": -5.666433334350586, "global_step": 41215, "epoch": 981} {"train_loss": -5.635295391082764, "global_step": 41216, "epoch": 981} {"train_loss": -5.587013244628906, "global_step": 41217, "epoch": 981} {"train_loss": -5.672218322753906, "global_step": 41218, "epoch": 981} {"train_loss": -5.671060085296631, "global_step": 41219, "epoch": 981} {"train_loss": -5.707864761352539, "global_step": 41220, "epoch": 981} {"train_loss": -5.597687721252441, "global_step": 41221, "epoch": 981} {"train_loss": -5.8274383544921875, "global_step": 41222, "epoch": 981} {"train_loss": -5.695799827575684, "global_step": 41223, "epoch": 981} {"train_loss": -5.777631759643555, "global_step": 41224, "epoch": 981} {"train_loss": -5.66180944442749, "global_step": 41225, "epoch": 981} {"train_loss": -5.703007698059082, "global_step": 41226, "epoch": 981} {"train_loss": -5.702993869781494, "global_step": 41227, "epoch": 981} {"train_loss": -5.527594566345215, "global_step": 41228, "epoch": 981} {"train_loss": -5.7442803382873535, "global_step": 41229, "epoch": 981} {"train_loss": -5.725571155548096, "global_step": 41230, "epoch": 981} {"train_loss": -5.6910200119018555, "global_step": 41231, "epoch": 981} {"train_loss": -5.654232025146484, "global_step": 41232, "epoch": 981} {"train_loss": -5.750919818878174, "global_step": 41233, "epoch": 981} {"train_loss": -5.659564018249512, "global_step": 41234, "epoch": 981} {"train_loss": -5.617913246154785, "global_step": 41235, "epoch": 981} {"train_loss": -5.698389053344727, "global_step": 41236, "epoch": 981} {"train_loss": -5.687930583953857, "global_step": 41237, "epoch": 981} {"train_loss": -5.686623573303223, "global_step": 41238, "epoch": 981} {"train_loss": -5.605587005615234, "global_step": 41239, "epoch": 981} {"train_loss": -5.651740074157715, "global_step": 41240, "epoch": 981} {"train_loss": -5.677101135253906, "global_step": 41241, "epoch": 981} {"train_loss": -5.598525047302246, "global_step": 41242, "epoch": 981} {"train_loss": -5.669248387927101, "global_step": 41243, "epoch": 981, "val_loss": 61557.16796875} {"train_loss": -5.646927833557129, "global_step": 41244, "epoch": 982} {"train_loss": -5.569291114807129, "global_step": 41245, "epoch": 982} {"train_loss": -5.534030914306641, "global_step": 41246, "epoch": 982} {"train_loss": -5.709079742431641, "global_step": 41247, "epoch": 982} {"train_loss": -5.730910778045654, "global_step": 41248, "epoch": 982} {"train_loss": -5.579051494598389, "global_step": 41249, "epoch": 982} {"train_loss": -5.648748397827148, "global_step": 41250, "epoch": 982} {"train_loss": -5.652143478393555, "global_step": 41251, "epoch": 982} {"train_loss": -5.652150630950928, "global_step": 41252, "epoch": 982} {"train_loss": -5.587920665740967, "global_step": 41253, "epoch": 982} {"train_loss": -5.671333312988281, "global_step": 41254, "epoch": 982} {"train_loss": -5.655998229980469, "global_step": 41255, "epoch": 982} {"train_loss": -5.618785381317139, "global_step": 41256, "epoch": 982} {"train_loss": -5.57426118850708, "global_step": 41257, "epoch": 982} {"train_loss": -5.780614376068115, "global_step": 41258, "epoch": 982} {"train_loss": -5.684771537780762, "global_step": 41259, "epoch": 982} {"train_loss": -5.604877471923828, "global_step": 41260, "epoch": 982} {"train_loss": -5.551076889038086, "global_step": 41261, "epoch": 982} {"train_loss": -5.626176834106445, "global_step": 41262, "epoch": 982} {"train_loss": -5.682694911956787, "global_step": 41263, "epoch": 982} {"train_loss": -5.601888179779053, "global_step": 41264, "epoch": 982} {"train_loss": -5.693316459655762, "global_step": 41265, "epoch": 982} {"train_loss": -5.669445991516113, "global_step": 41266, "epoch": 982} {"train_loss": -5.640833854675293, "global_step": 41267, "epoch": 982} {"train_loss": -5.827153205871582, "global_step": 41268, "epoch": 982} {"train_loss": -5.562713623046875, "global_step": 41269, "epoch": 982} {"train_loss": -5.705879211425781, "global_step": 41270, "epoch": 982} {"train_loss": -5.6447649002075195, "global_step": 41271, "epoch": 982} {"train_loss": -5.634913444519043, "global_step": 41272, "epoch": 982} {"train_loss": -5.747158050537109, "global_step": 41273, "epoch": 982} {"train_loss": -5.656590938568115, "global_step": 41274, "epoch": 982} {"train_loss": -5.586455345153809, "global_step": 41275, "epoch": 982} {"train_loss": -5.664565086364746, "global_step": 41276, "epoch": 982} {"train_loss": -5.758711814880371, "global_step": 41277, "epoch": 982} {"train_loss": -5.490712642669678, "global_step": 41278, "epoch": 982} {"train_loss": -5.564966678619385, "global_step": 41279, "epoch": 982} {"train_loss": -5.669565200805664, "global_step": 41280, "epoch": 982} {"train_loss": -5.616731643676758, "global_step": 41281, "epoch": 982} {"train_loss": -5.682235240936279, "global_step": 41282, "epoch": 982} {"train_loss": -5.740897178649902, "global_step": 41283, "epoch": 982} {"train_loss": -5.6596479415893555, "global_step": 41284, "epoch": 982} {"train_loss": -5.650642826443627, "global_step": 41285, "epoch": 982, "val_loss": 61871.5390625} {"train_loss": -5.720259666442871, "global_step": 41286, "epoch": 983} {"train_loss": -5.622040271759033, "global_step": 41287, "epoch": 983} {"train_loss": -5.561887741088867, "global_step": 41288, "epoch": 983} {"train_loss": -5.633543491363525, "global_step": 41289, "epoch": 983} {"train_loss": -5.624658584594727, "global_step": 41290, "epoch": 983} {"train_loss": -5.601442337036133, "global_step": 41291, "epoch": 983} {"train_loss": -5.661428451538086, "global_step": 41292, "epoch": 983} {"train_loss": -5.594166278839111, "global_step": 41293, "epoch": 983} {"train_loss": -5.627036094665527, "global_step": 41294, "epoch": 983} {"train_loss": -5.511948585510254, "global_step": 41295, "epoch": 983} {"train_loss": -5.601710319519043, "global_step": 41296, "epoch": 983} {"train_loss": -5.6478166580200195, "global_step": 41297, "epoch": 983} {"train_loss": -5.669469833374023, "global_step": 41298, "epoch": 983} {"train_loss": -5.741229057312012, "global_step": 41299, "epoch": 983} {"train_loss": -5.721775531768799, "global_step": 41300, "epoch": 983} {"train_loss": -5.596884727478027, "global_step": 41301, "epoch": 983} {"train_loss": -5.676469802856445, "global_step": 41302, "epoch": 983} {"train_loss": -5.701892852783203, "global_step": 41303, "epoch": 983} {"train_loss": -5.674474239349365, "global_step": 41304, "epoch": 983} {"train_loss": -5.691591262817383, "global_step": 41305, "epoch": 983} {"train_loss": -5.579165935516357, "global_step": 41306, "epoch": 983} {"train_loss": -5.636070251464844, "global_step": 41307, "epoch": 983} {"train_loss": -5.6210527420043945, "global_step": 41308, "epoch": 983} {"train_loss": -5.632061958312988, "global_step": 41309, "epoch": 983} {"train_loss": -5.639416694641113, "global_step": 41310, "epoch": 983} {"train_loss": -5.68112850189209, "global_step": 41311, "epoch": 983} {"train_loss": -5.750443935394287, "global_step": 41312, "epoch": 983} {"train_loss": -5.787771701812744, "global_step": 41313, "epoch": 983} {"train_loss": -5.612584114074707, "global_step": 41314, "epoch": 983} {"train_loss": -5.586096286773682, "global_step": 41315, "epoch": 983} {"train_loss": -5.775040626525879, "global_step": 41316, "epoch": 983} {"train_loss": -5.655671119689941, "global_step": 41317, "epoch": 983} {"train_loss": -5.674986839294434, "global_step": 41318, "epoch": 983} {"train_loss": -5.686150550842285, "global_step": 41319, "epoch": 983} {"train_loss": -5.565638542175293, "global_step": 41320, "epoch": 983} {"train_loss": -5.5489349365234375, "global_step": 41321, "epoch": 983} {"train_loss": -5.732242584228516, "global_step": 41322, "epoch": 983} {"train_loss": -5.5755767822265625, "global_step": 41323, "epoch": 983} {"train_loss": -5.667593002319336, "global_step": 41324, "epoch": 983} {"train_loss": -5.739180564880371, "global_step": 41325, "epoch": 983} {"train_loss": -5.66838264465332, "global_step": 41326, "epoch": 983} {"train_loss": -5.650507574989682, "global_step": 41327, "epoch": 983, "val_loss": 61870.34765625} {"train_loss": -5.65221643447876, "global_step": 41328, "epoch": 984} {"train_loss": -5.614050388336182, "global_step": 41329, "epoch": 984} {"train_loss": -5.627860069274902, "global_step": 41330, "epoch": 984} {"train_loss": -5.692999839782715, "global_step": 41331, "epoch": 984} {"train_loss": -5.722802639007568, "global_step": 41332, "epoch": 984} {"train_loss": -5.5101423263549805, "global_step": 41333, "epoch": 984} {"train_loss": -5.541067123413086, "global_step": 41334, "epoch": 984} {"train_loss": -5.72734260559082, "global_step": 41335, "epoch": 984} {"train_loss": -5.804950714111328, "global_step": 41336, "epoch": 984} {"train_loss": -5.645665645599365, "global_step": 41337, "epoch": 984} {"train_loss": -5.630502223968506, "global_step": 41338, "epoch": 984} {"train_loss": -5.559253692626953, "global_step": 41339, "epoch": 984} {"train_loss": -5.5285563468933105, "global_step": 41340, "epoch": 984} {"train_loss": -5.761540412902832, "global_step": 41341, "epoch": 984} {"train_loss": -5.624436378479004, "global_step": 41342, "epoch": 984} {"train_loss": -5.52921199798584, "global_step": 41343, "epoch": 984} {"train_loss": -5.706401824951172, "global_step": 41344, "epoch": 984} {"train_loss": -5.590726852416992, "global_step": 41345, "epoch": 984} {"train_loss": -5.4888505935668945, "global_step": 41346, "epoch": 984} {"train_loss": -5.74052619934082, "global_step": 41347, "epoch": 984} {"train_loss": -5.677516937255859, "global_step": 41348, "epoch": 984} {"train_loss": -5.572968482971191, "global_step": 41349, "epoch": 984} {"train_loss": -5.714921951293945, "global_step": 41350, "epoch": 984} {"train_loss": -5.5481038093566895, "global_step": 41351, "epoch": 984} {"train_loss": -5.400325775146484, "global_step": 41352, "epoch": 984} {"train_loss": -5.536470413208008, "global_step": 41353, "epoch": 984} {"train_loss": -5.730435371398926, "global_step": 41354, "epoch": 984} {"train_loss": -5.403090476989746, "global_step": 41355, "epoch": 984} {"train_loss": -5.565884590148926, "global_step": 41356, "epoch": 984} {"train_loss": -5.593873023986816, "global_step": 41357, "epoch": 984} {"train_loss": -5.587063312530518, "global_step": 41358, "epoch": 984} {"train_loss": -5.558741569519043, "global_step": 41359, "epoch": 984} {"train_loss": -5.694736480712891, "global_step": 41360, "epoch": 984} {"train_loss": -5.696364879608154, "global_step": 41361, "epoch": 984} {"train_loss": -5.550710678100586, "global_step": 41362, "epoch": 984} {"train_loss": -5.741261005401611, "global_step": 41363, "epoch": 984} {"train_loss": -5.731659889221191, "global_step": 41364, "epoch": 984} {"train_loss": -5.554450035095215, "global_step": 41365, "epoch": 984} {"train_loss": -5.641788482666016, "global_step": 41366, "epoch": 984} {"train_loss": -5.70128059387207, "global_step": 41367, "epoch": 984} {"train_loss": -5.6212921142578125, "global_step": 41368, "epoch": 984} {"train_loss": -5.625031039828346, "global_step": 41369, "epoch": 984, "val_loss": 61910.90625} {"train_loss": -5.668231010437012, "global_step": 41370, "epoch": 985} {"train_loss": -5.586101531982422, "global_step": 41371, "epoch": 985} {"train_loss": -5.692081928253174, "global_step": 41372, "epoch": 985} {"train_loss": -5.603490829467773, "global_step": 41373, "epoch": 985} {"train_loss": -5.511518478393555, "global_step": 41374, "epoch": 985} {"train_loss": -5.702659606933594, "global_step": 41375, "epoch": 985} {"train_loss": -5.478790283203125, "global_step": 41376, "epoch": 985} {"train_loss": -5.65407133102417, "global_step": 41377, "epoch": 985} {"train_loss": -5.75717830657959, "global_step": 41378, "epoch": 985} {"train_loss": -5.4930524826049805, "global_step": 41379, "epoch": 985} {"train_loss": -5.666762351989746, "global_step": 41380, "epoch": 985} {"train_loss": -5.638762474060059, "global_step": 41381, "epoch": 985} {"train_loss": -5.524578094482422, "global_step": 41382, "epoch": 985} {"train_loss": -5.722723960876465, "global_step": 41383, "epoch": 985} {"train_loss": -5.477668762207031, "global_step": 41384, "epoch": 985} {"train_loss": -5.709714889526367, "global_step": 41385, "epoch": 985} {"train_loss": -5.6746063232421875, "global_step": 41386, "epoch": 985} {"train_loss": -5.674194812774658, "global_step": 41387, "epoch": 985} {"train_loss": -5.643199443817139, "global_step": 41388, "epoch": 985} {"train_loss": -5.622376441955566, "global_step": 41389, "epoch": 985} {"train_loss": -5.678603172302246, "global_step": 41390, "epoch": 985} {"train_loss": -5.711540222167969, "global_step": 41391, "epoch": 985} {"train_loss": -5.561021327972412, "global_step": 41392, "epoch": 985} {"train_loss": -5.480806350708008, "global_step": 41393, "epoch": 985} {"train_loss": -5.62374210357666, "global_step": 41394, "epoch": 985} {"train_loss": -5.537253379821777, "global_step": 41395, "epoch": 985} {"train_loss": -5.50270938873291, "global_step": 41396, "epoch": 985} {"train_loss": -5.567920684814453, "global_step": 41397, "epoch": 985} {"train_loss": -5.668352127075195, "global_step": 41398, "epoch": 985} {"train_loss": -5.647852897644043, "global_step": 41399, "epoch": 985} {"train_loss": -5.688642501831055, "global_step": 41400, "epoch": 985} {"train_loss": -5.6559953689575195, "global_step": 41401, "epoch": 985} {"train_loss": -5.641040802001953, "global_step": 41402, "epoch": 985} {"train_loss": -5.753901481628418, "global_step": 41403, "epoch": 985} {"train_loss": -5.643106460571289, "global_step": 41404, "epoch": 985} {"train_loss": -5.665205001831055, "global_step": 41405, "epoch": 985} {"train_loss": -5.581368446350098, "global_step": 41406, "epoch": 985} {"train_loss": -5.734584808349609, "global_step": 41407, "epoch": 985} {"train_loss": -5.750203609466553, "global_step": 41408, "epoch": 985} {"train_loss": -5.504237174987793, "global_step": 41409, "epoch": 985} {"train_loss": -5.53680419921875, "global_step": 41410, "epoch": 985} {"train_loss": -5.626750650860014, "global_step": 41411, "epoch": 985, "val_loss": 62022.77734375} {"train_loss": -5.638367652893066, "global_step": 41412, "epoch": 986} {"train_loss": -5.780898571014404, "global_step": 41413, "epoch": 986} {"train_loss": -5.656299114227295, "global_step": 41414, "epoch": 986} {"train_loss": -5.71876335144043, "global_step": 41415, "epoch": 986} {"train_loss": -5.554684162139893, "global_step": 41416, "epoch": 986} {"train_loss": -5.65782356262207, "global_step": 41417, "epoch": 986} {"train_loss": -5.73911190032959, "global_step": 41418, "epoch": 986} {"train_loss": -5.7184858322143555, "global_step": 41419, "epoch": 986} {"train_loss": -5.651761531829834, "global_step": 41420, "epoch": 986} {"train_loss": -5.755410194396973, "global_step": 41421, "epoch": 986} {"train_loss": -5.578707695007324, "global_step": 41422, "epoch": 986} {"train_loss": -5.559567451477051, "global_step": 41423, "epoch": 986} {"train_loss": -5.785141944885254, "global_step": 41424, "epoch": 986} {"train_loss": -5.588868141174316, "global_step": 41425, "epoch": 986} {"train_loss": -5.608697414398193, "global_step": 41426, "epoch": 986} {"train_loss": -5.635248184204102, "global_step": 41427, "epoch": 986} {"train_loss": -5.735404014587402, "global_step": 41428, "epoch": 986} {"train_loss": -5.602200031280518, "global_step": 41429, "epoch": 986} {"train_loss": -5.703275203704834, "global_step": 41430, "epoch": 986} {"train_loss": -5.497758865356445, "global_step": 41431, "epoch": 986} {"train_loss": -5.52656364440918, "global_step": 41432, "epoch": 986} {"train_loss": -5.744215965270996, "global_step": 41433, "epoch": 986} {"train_loss": -5.639819145202637, "global_step": 41434, "epoch": 986} {"train_loss": -5.726517677307129, "global_step": 41435, "epoch": 986} {"train_loss": -5.577352046966553, "global_step": 41436, "epoch": 986} {"train_loss": -5.588854789733887, "global_step": 41437, "epoch": 986} {"train_loss": -5.641774654388428, "global_step": 41438, "epoch": 986} {"train_loss": -5.597799301147461, "global_step": 41439, "epoch": 986} {"train_loss": -5.721039772033691, "global_step": 41440, "epoch": 986} {"train_loss": -5.601571083068848, "global_step": 41441, "epoch": 986} {"train_loss": -5.6376729011535645, "global_step": 41442, "epoch": 986} {"train_loss": -5.6429009437561035, "global_step": 41443, "epoch": 986} {"train_loss": -5.674526214599609, "global_step": 41444, "epoch": 986} {"train_loss": -5.570193290710449, "global_step": 41445, "epoch": 986} {"train_loss": -5.653972625732422, "global_step": 41446, "epoch": 986} {"train_loss": -5.7076802253723145, "global_step": 41447, "epoch": 986} {"train_loss": -5.565261363983154, "global_step": 41448, "epoch": 986} {"train_loss": -5.741425514221191, "global_step": 41449, "epoch": 986} {"train_loss": -5.639176368713379, "global_step": 41450, "epoch": 986} {"train_loss": -5.579085826873779, "global_step": 41451, "epoch": 986} {"train_loss": -5.560281753540039, "global_step": 41452, "epoch": 986} {"train_loss": -5.642607234773182, "global_step": 41453, "epoch": 986, "val_loss": 61663.83203125} {"train_loss": -5.738304138183594, "global_step": 41454, "epoch": 987} {"train_loss": -5.534291744232178, "global_step": 41455, "epoch": 987} {"train_loss": -5.633571624755859, "global_step": 41456, "epoch": 987} {"train_loss": -5.706419944763184, "global_step": 41457, "epoch": 987} {"train_loss": -5.652554512023926, "global_step": 41458, "epoch": 987} {"train_loss": -5.566300392150879, "global_step": 41459, "epoch": 987} {"train_loss": -5.774416923522949, "global_step": 41460, "epoch": 987} {"train_loss": -5.776564598083496, "global_step": 41461, "epoch": 987} {"train_loss": -5.661504745483398, "global_step": 41462, "epoch": 987} {"train_loss": -5.597404479980469, "global_step": 41463, "epoch": 987} {"train_loss": -5.629687786102295, "global_step": 41464, "epoch": 987} {"train_loss": -5.626772880554199, "global_step": 41465, "epoch": 987} {"train_loss": -5.682183265686035, "global_step": 41466, "epoch": 987} {"train_loss": -5.680790901184082, "global_step": 41467, "epoch": 987} {"train_loss": -5.766284465789795, "global_step": 41468, "epoch": 987} {"train_loss": -5.636136054992676, "global_step": 41469, "epoch": 987} {"train_loss": -5.717473983764648, "global_step": 41470, "epoch": 987} {"train_loss": -5.8465776443481445, "global_step": 41471, "epoch": 987} {"train_loss": -5.590878486633301, "global_step": 41472, "epoch": 987} {"train_loss": -5.658629417419434, "global_step": 41473, "epoch": 987} {"train_loss": -5.6939544677734375, "global_step": 41474, "epoch": 987} {"train_loss": -5.57170295715332, "global_step": 41475, "epoch": 987} {"train_loss": -5.670984268188477, "global_step": 41476, "epoch": 987} {"train_loss": -5.723302841186523, "global_step": 41477, "epoch": 987} {"train_loss": -5.677953720092773, "global_step": 41478, "epoch": 987} {"train_loss": -5.486139297485352, "global_step": 41479, "epoch": 987} {"train_loss": -5.63065242767334, "global_step": 41480, "epoch": 987} {"train_loss": -5.623204708099365, "global_step": 41481, "epoch": 987} {"train_loss": -5.627010822296143, "global_step": 41482, "epoch": 987} {"train_loss": -5.786199569702148, "global_step": 41483, "epoch": 987} {"train_loss": -5.622549533843994, "global_step": 41484, "epoch": 987} {"train_loss": -5.676729202270508, "global_step": 41485, "epoch": 987} {"train_loss": -5.627176284790039, "global_step": 41486, "epoch": 987} {"train_loss": -5.718594551086426, "global_step": 41487, "epoch": 987} {"train_loss": -5.6536760330200195, "global_step": 41488, "epoch": 987} {"train_loss": -5.627040863037109, "global_step": 41489, "epoch": 987} {"train_loss": -5.649500846862793, "global_step": 41490, "epoch": 987} {"train_loss": -5.587035179138184, "global_step": 41491, "epoch": 987} {"train_loss": -5.7037434577941895, "global_step": 41492, "epoch": 987} {"train_loss": -5.627867698669434, "global_step": 41493, "epoch": 987} {"train_loss": -5.650800704956055, "global_step": 41494, "epoch": 987} {"train_loss": -5.663474480311076, "global_step": 41495, "epoch": 987, "val_loss": 62025.16015625} {"train_loss": -5.666343688964844, "global_step": 41496, "epoch": 988} {"train_loss": -5.6578569412231445, "global_step": 41497, "epoch": 988} {"train_loss": -5.712771415710449, "global_step": 41498, "epoch": 988} {"train_loss": -5.569416522979736, "global_step": 41499, "epoch": 988} {"train_loss": -5.675650596618652, "global_step": 41500, "epoch": 988} {"train_loss": -5.728580951690674, "global_step": 41501, "epoch": 988} {"train_loss": -5.694765090942383, "global_step": 41502, "epoch": 988} {"train_loss": -5.479745388031006, "global_step": 41503, "epoch": 988} {"train_loss": -5.680391788482666, "global_step": 41504, "epoch": 988} {"train_loss": -5.7225341796875, "global_step": 41505, "epoch": 988} {"train_loss": -5.619271278381348, "global_step": 41506, "epoch": 988} {"train_loss": -5.806866645812988, "global_step": 41507, "epoch": 988} {"train_loss": -5.6783246994018555, "global_step": 41508, "epoch": 988} {"train_loss": -5.687742233276367, "global_step": 41509, "epoch": 988} {"train_loss": -5.733274459838867, "global_step": 41510, "epoch": 988} {"train_loss": -5.709860801696777, "global_step": 41511, "epoch": 988} {"train_loss": -5.560200214385986, "global_step": 41512, "epoch": 988} {"train_loss": -5.6770524978637695, "global_step": 41513, "epoch": 988} {"train_loss": -5.63271951675415, "global_step": 41514, "epoch": 988} {"train_loss": -5.573173522949219, "global_step": 41515, "epoch": 988} {"train_loss": -5.5076704025268555, "global_step": 41516, "epoch": 988} {"train_loss": -5.618661880493164, "global_step": 41517, "epoch": 988} {"train_loss": -5.587979316711426, "global_step": 41518, "epoch": 988} {"train_loss": -5.710357666015625, "global_step": 41519, "epoch": 988} {"train_loss": -5.627429008483887, "global_step": 41520, "epoch": 988} {"train_loss": -5.567409992218018, "global_step": 41521, "epoch": 988} {"train_loss": -5.649361610412598, "global_step": 41522, "epoch": 988} {"train_loss": -5.556632995605469, "global_step": 41523, "epoch": 988} {"train_loss": -5.629383087158203, "global_step": 41524, "epoch": 988} {"train_loss": -5.5427327156066895, "global_step": 41525, "epoch": 988} {"train_loss": -5.573649883270264, "global_step": 41526, "epoch": 988} {"train_loss": -5.6865434646606445, "global_step": 41527, "epoch": 988} {"train_loss": -5.809488296508789, "global_step": 41528, "epoch": 988} {"train_loss": -5.537497520446777, "global_step": 41529, "epoch": 988} {"train_loss": -5.5276899337768555, "global_step": 41530, "epoch": 988} {"train_loss": -5.766024112701416, "global_step": 41531, "epoch": 988} {"train_loss": -5.630702972412109, "global_step": 41532, "epoch": 988} {"train_loss": -5.749636650085449, "global_step": 41533, "epoch": 988} {"train_loss": -5.736844062805176, "global_step": 41534, "epoch": 988} {"train_loss": -5.624502658843994, "global_step": 41535, "epoch": 988} {"train_loss": -5.519859313964844, "global_step": 41536, "epoch": 988} {"train_loss": -5.645143020720709, "global_step": 41537, "epoch": 988, "val_loss": 61570.34765625} {"train_loss": -5.6572651863098145, "global_step": 41538, "epoch": 989} {"train_loss": -5.572710037231445, "global_step": 41539, "epoch": 989} {"train_loss": -5.663138389587402, "global_step": 41540, "epoch": 989} {"train_loss": -5.698090076446533, "global_step": 41541, "epoch": 989} {"train_loss": -5.592693328857422, "global_step": 41542, "epoch": 989} {"train_loss": -5.576668739318848, "global_step": 41543, "epoch": 989} {"train_loss": -5.741511344909668, "global_step": 41544, "epoch": 989} {"train_loss": -5.581483840942383, "global_step": 41545, "epoch": 989} {"train_loss": -5.432530403137207, "global_step": 41546, "epoch": 989} {"train_loss": -5.690828323364258, "global_step": 41547, "epoch": 989} {"train_loss": -5.620612144470215, "global_step": 41548, "epoch": 989} {"train_loss": -5.601051330566406, "global_step": 41549, "epoch": 989} {"train_loss": -5.594307899475098, "global_step": 41550, "epoch": 989} {"train_loss": -5.577588081359863, "global_step": 41551, "epoch": 989} {"train_loss": -5.618415832519531, "global_step": 41552, "epoch": 989} {"train_loss": -5.726598739624023, "global_step": 41553, "epoch": 989} {"train_loss": -5.663301944732666, "global_step": 41554, "epoch": 989} {"train_loss": -5.628211975097656, "global_step": 41555, "epoch": 989} {"train_loss": -5.729487895965576, "global_step": 41556, "epoch": 989} {"train_loss": -5.617383003234863, "global_step": 41557, "epoch": 989} {"train_loss": -5.744227886199951, "global_step": 41558, "epoch": 989} {"train_loss": -5.513158798217773, "global_step": 41559, "epoch": 989} {"train_loss": -5.644203186035156, "global_step": 41560, "epoch": 989} {"train_loss": -5.655220031738281, "global_step": 41561, "epoch": 989} {"train_loss": -5.6648359298706055, "global_step": 41562, "epoch": 989} {"train_loss": -5.770061016082764, "global_step": 41563, "epoch": 989} {"train_loss": -5.742320537567139, "global_step": 41564, "epoch": 989} {"train_loss": -5.563262939453125, "global_step": 41565, "epoch": 989} {"train_loss": -5.651503562927246, "global_step": 41566, "epoch": 989} {"train_loss": -5.605474472045898, "global_step": 41567, "epoch": 989} {"train_loss": -5.547332763671875, "global_step": 41568, "epoch": 989} {"train_loss": -5.558653831481934, "global_step": 41569, "epoch": 989} {"train_loss": -5.7463579177856445, "global_step": 41570, "epoch": 989} {"train_loss": -5.5920209884643555, "global_step": 41571, "epoch": 989} {"train_loss": -5.585328578948975, "global_step": 41572, "epoch": 989} {"train_loss": -5.673466205596924, "global_step": 41573, "epoch": 989} {"train_loss": -5.583900451660156, "global_step": 41574, "epoch": 989} {"train_loss": -5.6378278732299805, "global_step": 41575, "epoch": 989} {"train_loss": -5.559571266174316, "global_step": 41576, "epoch": 989} {"train_loss": -5.626426696777344, "global_step": 41577, "epoch": 989} {"train_loss": -5.727336883544922, "global_step": 41578, "epoch": 989} {"train_loss": -5.63286060378665, "global_step": 41579, "epoch": 989, "val_loss": 61931.17578125} {"train_loss": -5.710227966308594, "global_step": 41580, "epoch": 990} {"train_loss": -5.726715564727783, "global_step": 41581, "epoch": 990} {"train_loss": -5.644598484039307, "global_step": 41582, "epoch": 990} {"train_loss": -5.687216281890869, "global_step": 41583, "epoch": 990} {"train_loss": -5.701581954956055, "global_step": 41584, "epoch": 990} {"train_loss": -5.57658576965332, "global_step": 41585, "epoch": 990} {"train_loss": -5.62176513671875, "global_step": 41586, "epoch": 990} {"train_loss": -5.579209804534912, "global_step": 41587, "epoch": 990} {"train_loss": -5.682629585266113, "global_step": 41588, "epoch": 990} {"train_loss": -5.668359756469727, "global_step": 41589, "epoch": 990} {"train_loss": -5.5143537521362305, "global_step": 41590, "epoch": 990} {"train_loss": -5.640071392059326, "global_step": 41591, "epoch": 990} {"train_loss": -5.708507537841797, "global_step": 41592, "epoch": 990} {"train_loss": -5.657347202301025, "global_step": 41593, "epoch": 990} {"train_loss": -5.665582656860352, "global_step": 41594, "epoch": 990} {"train_loss": -5.652068138122559, "global_step": 41595, "epoch": 990} {"train_loss": -5.829349040985107, "global_step": 41596, "epoch": 990} {"train_loss": -5.520939826965332, "global_step": 41597, "epoch": 990} {"train_loss": -5.586812973022461, "global_step": 41598, "epoch": 990} {"train_loss": -5.70709228515625, "global_step": 41599, "epoch": 990} {"train_loss": -5.61406946182251, "global_step": 41600, "epoch": 990} {"train_loss": -5.679804801940918, "global_step": 41601, "epoch": 990} {"train_loss": -5.636520862579346, "global_step": 41602, "epoch": 990} {"train_loss": -5.736689567565918, "global_step": 41603, "epoch": 990} {"train_loss": -5.613819599151611, "global_step": 41604, "epoch": 990} {"train_loss": -5.696164131164551, "global_step": 41605, "epoch": 990} {"train_loss": -5.677325248718262, "global_step": 41606, "epoch": 990} {"train_loss": -5.721104145050049, "global_step": 41607, "epoch": 990} {"train_loss": -5.665633678436279, "global_step": 41608, "epoch": 990} {"train_loss": -5.755904197692871, "global_step": 41609, "epoch": 990} {"train_loss": -5.447869300842285, "global_step": 41610, "epoch": 990} {"train_loss": -5.596953392028809, "global_step": 41611, "epoch": 990} {"train_loss": -5.61245059967041, "global_step": 41612, "epoch": 990} {"train_loss": -5.394836902618408, "global_step": 41613, "epoch": 990} {"train_loss": -5.537275314331055, "global_step": 41614, "epoch": 990} {"train_loss": -5.477377891540527, "global_step": 41615, "epoch": 990} {"train_loss": -5.5138702392578125, "global_step": 41616, "epoch": 990} {"train_loss": -5.521415710449219, "global_step": 41617, "epoch": 990} {"train_loss": -5.69682502746582, "global_step": 41618, "epoch": 990} {"train_loss": -5.57615852355957, "global_step": 41619, "epoch": 990} {"train_loss": -5.6147141456604, "global_step": 41620, "epoch": 990} {"train_loss": -5.627499330611456, "global_step": 41621, "epoch": 990, "val_loss": 62045.5703125} {"train_loss": -5.71820068359375, "global_step": 41622, "epoch": 991} {"train_loss": -5.629591941833496, "global_step": 41623, "epoch": 991} {"train_loss": -5.735762596130371, "global_step": 41624, "epoch": 991} {"train_loss": -5.639256477355957, "global_step": 41625, "epoch": 991} {"train_loss": -5.655179023742676, "global_step": 41626, "epoch": 991} {"train_loss": -5.657543659210205, "global_step": 41627, "epoch": 991} {"train_loss": -5.617898941040039, "global_step": 41628, "epoch": 991} {"train_loss": -5.6503167152404785, "global_step": 41629, "epoch": 991} {"train_loss": -5.662379264831543, "global_step": 41630, "epoch": 991} {"train_loss": -5.713160514831543, "global_step": 41631, "epoch": 991} {"train_loss": -5.634040832519531, "global_step": 41632, "epoch": 991} {"train_loss": -5.814156532287598, "global_step": 41633, "epoch": 991} {"train_loss": -5.604844093322754, "global_step": 41634, "epoch": 991} {"train_loss": -5.801965236663818, "global_step": 41635, "epoch": 991} {"train_loss": -5.729659557342529, "global_step": 41636, "epoch": 991} {"train_loss": -5.630474090576172, "global_step": 41637, "epoch": 991} {"train_loss": -5.7007904052734375, "global_step": 41638, "epoch": 991} {"train_loss": -5.5880842208862305, "global_step": 41639, "epoch": 991} {"train_loss": -5.836958408355713, "global_step": 41640, "epoch": 991} {"train_loss": -5.6290998458862305, "global_step": 41641, "epoch": 991} {"train_loss": -5.69931697845459, "global_step": 41642, "epoch": 991} {"train_loss": -5.7333550453186035, "global_step": 41643, "epoch": 991} {"train_loss": -5.737176895141602, "global_step": 41644, "epoch": 991} {"train_loss": -5.734897136688232, "global_step": 41645, "epoch": 991} {"train_loss": -5.686012268066406, "global_step": 41646, "epoch": 991} {"train_loss": -5.5230021476745605, "global_step": 41647, "epoch": 991} {"train_loss": -5.73941707611084, "global_step": 41648, "epoch": 991} {"train_loss": -5.6363115310668945, "global_step": 41649, "epoch": 991} {"train_loss": -5.744512557983398, "global_step": 41650, "epoch": 991} {"train_loss": -5.626087188720703, "global_step": 41651, "epoch": 991} {"train_loss": -5.612283706665039, "global_step": 41652, "epoch": 991} {"train_loss": -5.667918682098389, "global_step": 41653, "epoch": 991} {"train_loss": -5.493368148803711, "global_step": 41654, "epoch": 991} {"train_loss": -5.678802013397217, "global_step": 41655, "epoch": 991} {"train_loss": -5.676508903503418, "global_step": 41656, "epoch": 991} {"train_loss": -5.524465560913086, "global_step": 41657, "epoch": 991} {"train_loss": -5.649569511413574, "global_step": 41658, "epoch": 991} {"train_loss": -5.486412048339844, "global_step": 41659, "epoch": 991} {"train_loss": -5.6951799392700195, "global_step": 41660, "epoch": 991} {"train_loss": -5.587618827819824, "global_step": 41661, "epoch": 991} {"train_loss": -5.675921440124512, "global_step": 41662, "epoch": 991} {"train_loss": -5.6631548291160945, "global_step": 41663, "epoch": 991, "val_loss": 61901.48046875} {"train_loss": -5.601184368133545, "global_step": 41664, "epoch": 992} {"train_loss": -5.745359420776367, "global_step": 41665, "epoch": 992} {"train_loss": -5.504703998565674, "global_step": 41666, "epoch": 992} {"train_loss": -5.649966239929199, "global_step": 41667, "epoch": 992} {"train_loss": -5.617162704467773, "global_step": 41668, "epoch": 992} {"train_loss": -5.673182487487793, "global_step": 41669, "epoch": 992} {"train_loss": -5.714683532714844, "global_step": 41670, "epoch": 992} {"train_loss": -5.74669075012207, "global_step": 41671, "epoch": 992} {"train_loss": -5.65086555480957, "global_step": 41672, "epoch": 992} {"train_loss": -5.636444091796875, "global_step": 41673, "epoch": 992} {"train_loss": -5.804042339324951, "global_step": 41674, "epoch": 992} {"train_loss": -5.655882358551025, "global_step": 41675, "epoch": 992} {"train_loss": -5.686866283416748, "global_step": 41676, "epoch": 992} {"train_loss": -5.716813564300537, "global_step": 41677, "epoch": 992} {"train_loss": -5.640436172485352, "global_step": 41678, "epoch": 992} {"train_loss": -5.517969131469727, "global_step": 41679, "epoch": 992} {"train_loss": -5.5634589195251465, "global_step": 41680, "epoch": 992} {"train_loss": -5.561784267425537, "global_step": 41681, "epoch": 992} {"train_loss": -5.513226509094238, "global_step": 41682, "epoch": 992} {"train_loss": -5.770415306091309, "global_step": 41683, "epoch": 992} {"train_loss": -5.634754657745361, "global_step": 41684, "epoch": 992} {"train_loss": -5.580376625061035, "global_step": 41685, "epoch": 992} {"train_loss": -5.68872594833374, "global_step": 41686, "epoch": 992} {"train_loss": -5.6797075271606445, "global_step": 41687, "epoch": 992} {"train_loss": -5.619431495666504, "global_step": 41688, "epoch": 992} {"train_loss": -5.695159912109375, "global_step": 41689, "epoch": 992} {"train_loss": -5.613187313079834, "global_step": 41690, "epoch": 992} {"train_loss": -5.687567234039307, "global_step": 41691, "epoch": 992} {"train_loss": -5.65756368637085, "global_step": 41692, "epoch": 992} {"train_loss": -5.861375331878662, "global_step": 41693, "epoch": 992} {"train_loss": -5.64414119720459, "global_step": 41694, "epoch": 992} {"train_loss": -5.606265068054199, "global_step": 41695, "epoch": 992} {"train_loss": -5.560585975646973, "global_step": 41696, "epoch": 992} {"train_loss": -5.583383083343506, "global_step": 41697, "epoch": 992} {"train_loss": -5.660745143890381, "global_step": 41698, "epoch": 992} {"train_loss": -5.6376190185546875, "global_step": 41699, "epoch": 992} {"train_loss": -5.563973903656006, "global_step": 41700, "epoch": 992} {"train_loss": -5.741377353668213, "global_step": 41701, "epoch": 992} {"train_loss": -5.703197479248047, "global_step": 41702, "epoch": 992} {"train_loss": -5.710436820983887, "global_step": 41703, "epoch": 992} {"train_loss": -5.666250228881836, "global_step": 41704, "epoch": 992} {"train_loss": -5.651229585920062, "global_step": 41705, "epoch": 992, "val_loss": 61853.6328125} {"train_loss": -5.622861385345459, "global_step": 41706, "epoch": 993} {"train_loss": -5.678318977355957, "global_step": 41707, "epoch": 993} {"train_loss": -5.650443077087402, "global_step": 41708, "epoch": 993} {"train_loss": -5.571225166320801, "global_step": 41709, "epoch": 993} {"train_loss": -5.674541473388672, "global_step": 41710, "epoch": 993} {"train_loss": -5.606575012207031, "global_step": 41711, "epoch": 993} {"train_loss": -5.7171478271484375, "global_step": 41712, "epoch": 993} {"train_loss": -5.755862236022949, "global_step": 41713, "epoch": 993} {"train_loss": -5.603582382202148, "global_step": 41714, "epoch": 993} {"train_loss": -5.572819709777832, "global_step": 41715, "epoch": 993} {"train_loss": -5.575401306152344, "global_step": 41716, "epoch": 993} {"train_loss": -5.66969108581543, "global_step": 41717, "epoch": 993} {"train_loss": -5.713153839111328, "global_step": 41718, "epoch": 993} {"train_loss": -5.7347917556762695, "global_step": 41719, "epoch": 993} {"train_loss": -5.738630294799805, "global_step": 41720, "epoch": 993} {"train_loss": -5.711402416229248, "global_step": 41721, "epoch": 993} {"train_loss": -5.7218732833862305, "global_step": 41722, "epoch": 993} {"train_loss": -5.705778121948242, "global_step": 41723, "epoch": 993} {"train_loss": -5.73089599609375, "global_step": 41724, "epoch": 993} {"train_loss": -5.661692142486572, "global_step": 41725, "epoch": 993} {"train_loss": -5.54442834854126, "global_step": 41726, "epoch": 993} {"train_loss": -5.541877746582031, "global_step": 41727, "epoch": 993} {"train_loss": -5.731428146362305, "global_step": 41728, "epoch": 993} {"train_loss": -5.716568470001221, "global_step": 41729, "epoch": 993} {"train_loss": -5.677437782287598, "global_step": 41730, "epoch": 993} {"train_loss": -5.605833053588867, "global_step": 41731, "epoch": 993} {"train_loss": -5.575512886047363, "global_step": 41732, "epoch": 993} {"train_loss": -5.54786491394043, "global_step": 41733, "epoch": 993} {"train_loss": -5.769964218139648, "global_step": 41734, "epoch": 993} {"train_loss": -5.554527282714844, "global_step": 41735, "epoch": 993} {"train_loss": -5.711831569671631, "global_step": 41736, "epoch": 993} {"train_loss": -5.689444541931152, "global_step": 41737, "epoch": 993} {"train_loss": -5.643588542938232, "global_step": 41738, "epoch": 993} {"train_loss": -5.681850910186768, "global_step": 41739, "epoch": 993} {"train_loss": -5.682990074157715, "global_step": 41740, "epoch": 993} {"train_loss": -5.7296342849731445, "global_step": 41741, "epoch": 993} {"train_loss": -5.657304286956787, "global_step": 41742, "epoch": 993} {"train_loss": -5.85684871673584, "global_step": 41743, "epoch": 993} {"train_loss": -5.762547492980957, "global_step": 41744, "epoch": 993} {"train_loss": -5.685997009277344, "global_step": 41745, "epoch": 993} {"train_loss": -5.705816745758057, "global_step": 41746, "epoch": 993} {"train_loss": -5.6695950258345835, "global_step": 41747, "epoch": 993, "val_loss": 61611.84765625} {"train_loss": -5.528472900390625, "global_step": 41748, "epoch": 994} {"train_loss": -5.7968339920043945, "global_step": 41749, "epoch": 994} {"train_loss": -5.734712600708008, "global_step": 41750, "epoch": 994} {"train_loss": -5.692757606506348, "global_step": 41751, "epoch": 994} {"train_loss": -5.563669204711914, "global_step": 41752, "epoch": 994} {"train_loss": -5.581587791442871, "global_step": 41753, "epoch": 994} {"train_loss": -5.615175247192383, "global_step": 41754, "epoch": 994} {"train_loss": -5.676955699920654, "global_step": 41755, "epoch": 994} {"train_loss": -5.681891918182373, "global_step": 41756, "epoch": 994} {"train_loss": -5.627780437469482, "global_step": 41757, "epoch": 994} {"train_loss": -5.710925102233887, "global_step": 41758, "epoch": 994} {"train_loss": -5.749319553375244, "global_step": 41759, "epoch": 994} {"train_loss": -5.666217803955078, "global_step": 41760, "epoch": 994} {"train_loss": -5.73818826675415, "global_step": 41761, "epoch": 994} {"train_loss": -5.667454719543457, "global_step": 41762, "epoch": 994} {"train_loss": -5.557294845581055, "global_step": 41763, "epoch": 994} {"train_loss": -5.7602410316467285, "global_step": 41764, "epoch": 994} {"train_loss": -5.766861915588379, "global_step": 41765, "epoch": 994} {"train_loss": -5.6407976150512695, "global_step": 41766, "epoch": 994} {"train_loss": -5.633957862854004, "global_step": 41767, "epoch": 994} {"train_loss": -5.720568656921387, "global_step": 41768, "epoch": 994} {"train_loss": -5.607919692993164, "global_step": 41769, "epoch": 994} {"train_loss": -5.650454521179199, "global_step": 41770, "epoch": 994} {"train_loss": -5.72337007522583, "global_step": 41771, "epoch": 994} {"train_loss": -5.768618583679199, "global_step": 41772, "epoch": 994} {"train_loss": -5.647430896759033, "global_step": 41773, "epoch": 994} {"train_loss": -5.6973981857299805, "global_step": 41774, "epoch": 994} {"train_loss": -5.627199649810791, "global_step": 41775, "epoch": 994} {"train_loss": -5.554879188537598, "global_step": 41776, "epoch": 994} {"train_loss": -5.591885089874268, "global_step": 41777, "epoch": 994} {"train_loss": -5.749636650085449, "global_step": 41778, "epoch": 994} {"train_loss": -5.683964252471924, "global_step": 41779, "epoch": 994} {"train_loss": -5.53923225402832, "global_step": 41780, "epoch": 994} {"train_loss": -5.71877908706665, "global_step": 41781, "epoch": 994} {"train_loss": -5.694114685058594, "global_step": 41782, "epoch": 994} {"train_loss": -5.648525238037109, "global_step": 41783, "epoch": 994} {"train_loss": -5.736623764038086, "global_step": 41784, "epoch": 994} {"train_loss": -5.699380874633789, "global_step": 41785, "epoch": 994} {"train_loss": -5.698489189147949, "global_step": 41786, "epoch": 994} {"train_loss": -5.766608715057373, "global_step": 41787, "epoch": 994} {"train_loss": -5.63640022277832, "global_step": 41788, "epoch": 994} {"train_loss": -5.671235663550241, "global_step": 41789, "epoch": 994, "val_loss": 61827.22265625} {"train_loss": -5.725426197052002, "global_step": 41790, "epoch": 995} {"train_loss": -5.58099889755249, "global_step": 41791, "epoch": 995} {"train_loss": -5.759441375732422, "global_step": 41792, "epoch": 995} {"train_loss": -5.746408939361572, "global_step": 41793, "epoch": 995} {"train_loss": -5.729768753051758, "global_step": 41794, "epoch": 995} {"train_loss": -5.683200836181641, "global_step": 41795, "epoch": 995} {"train_loss": -5.580201625823975, "global_step": 41796, "epoch": 995} {"train_loss": -5.781087875366211, "global_step": 41797, "epoch": 995} {"train_loss": -5.65692663192749, "global_step": 41798, "epoch": 995} {"train_loss": -5.670773983001709, "global_step": 41799, "epoch": 995} {"train_loss": -5.741241931915283, "global_step": 41800, "epoch": 995} {"train_loss": -5.707460403442383, "global_step": 41801, "epoch": 995} {"train_loss": -5.814830780029297, "global_step": 41802, "epoch": 995} {"train_loss": -5.7130889892578125, "global_step": 41803, "epoch": 995} {"train_loss": -5.680559158325195, "global_step": 41804, "epoch": 995} {"train_loss": -5.661980152130127, "global_step": 41805, "epoch": 995} {"train_loss": -5.628202438354492, "global_step": 41806, "epoch": 995} {"train_loss": -5.745510101318359, "global_step": 41807, "epoch": 995} {"train_loss": -5.574921131134033, "global_step": 41808, "epoch": 995} {"train_loss": -5.685256004333496, "global_step": 41809, "epoch": 995} {"train_loss": -5.662268161773682, "global_step": 41810, "epoch": 995} {"train_loss": -5.6414079666137695, "global_step": 41811, "epoch": 995} {"train_loss": -5.573660850524902, "global_step": 41812, "epoch": 995} {"train_loss": -5.681094169616699, "global_step": 41813, "epoch": 995} {"train_loss": -5.633234024047852, "global_step": 41814, "epoch": 995} {"train_loss": -5.70157527923584, "global_step": 41815, "epoch": 995} {"train_loss": -5.627565383911133, "global_step": 41816, "epoch": 995} {"train_loss": -5.553974628448486, "global_step": 41817, "epoch": 995} {"train_loss": -5.678623199462891, "global_step": 41818, "epoch": 995} {"train_loss": -5.700118064880371, "global_step": 41819, "epoch": 995} {"train_loss": -5.7405171394348145, "global_step": 41820, "epoch": 995} {"train_loss": -5.701459884643555, "global_step": 41821, "epoch": 995} {"train_loss": -5.750949859619141, "global_step": 41822, "epoch": 995} {"train_loss": -5.593820095062256, "global_step": 41823, "epoch": 995} {"train_loss": -5.604001998901367, "global_step": 41824, "epoch": 995} {"train_loss": -5.708901405334473, "global_step": 41825, "epoch": 995} {"train_loss": -5.548799514770508, "global_step": 41826, "epoch": 995} {"train_loss": -5.61836051940918, "global_step": 41827, "epoch": 995} {"train_loss": -5.7479448318481445, "global_step": 41828, "epoch": 995} {"train_loss": -5.694430351257324, "global_step": 41829, "epoch": 995} {"train_loss": -5.718534469604492, "global_step": 41830, "epoch": 995} {"train_loss": -5.6747508843739825, "global_step": 41831, "epoch": 995, "val_loss": 62029.24609375} {"train_loss": -5.7251787185668945, "global_step": 41832, "epoch": 996} {"train_loss": -5.6596198081970215, "global_step": 41833, "epoch": 996} {"train_loss": -5.752649784088135, "global_step": 41834, "epoch": 996} {"train_loss": -5.6165900230407715, "global_step": 41835, "epoch": 996} {"train_loss": -5.678247451782227, "global_step": 41836, "epoch": 996} {"train_loss": -5.689201831817627, "global_step": 41837, "epoch": 996} {"train_loss": -5.653759002685547, "global_step": 41838, "epoch": 996} {"train_loss": -5.689425468444824, "global_step": 41839, "epoch": 996} {"train_loss": -5.663381576538086, "global_step": 41840, "epoch": 996} {"train_loss": -5.579276084899902, "global_step": 41841, "epoch": 996} {"train_loss": -5.774656295776367, "global_step": 41842, "epoch": 996} {"train_loss": -5.590871334075928, "global_step": 41843, "epoch": 996} {"train_loss": -5.590109825134277, "global_step": 41844, "epoch": 996} {"train_loss": -5.785243034362793, "global_step": 41845, "epoch": 996} {"train_loss": -5.627401351928711, "global_step": 41846, "epoch": 996} {"train_loss": -5.617423057556152, "global_step": 41847, "epoch": 996} {"train_loss": -5.5476155281066895, "global_step": 41848, "epoch": 996} {"train_loss": -5.500640392303467, "global_step": 41849, "epoch": 996} {"train_loss": -5.742701530456543, "global_step": 41850, "epoch": 996} {"train_loss": -5.679485321044922, "global_step": 41851, "epoch": 996} {"train_loss": -5.71646785736084, "global_step": 41852, "epoch": 996} {"train_loss": -5.642078399658203, "global_step": 41853, "epoch": 996} {"train_loss": -5.573641777038574, "global_step": 41854, "epoch": 996} {"train_loss": -5.547934532165527, "global_step": 41855, "epoch": 996} {"train_loss": -5.674453258514404, "global_step": 41856, "epoch": 996} {"train_loss": -5.7023468017578125, "global_step": 41857, "epoch": 996} {"train_loss": -5.675065517425537, "global_step": 41858, "epoch": 996} {"train_loss": -5.496608734130859, "global_step": 41859, "epoch": 996} {"train_loss": -5.62640380859375, "global_step": 41860, "epoch": 996} {"train_loss": -5.495413303375244, "global_step": 41861, "epoch": 996} {"train_loss": -5.693875312805176, "global_step": 41862, "epoch": 996} {"train_loss": -5.803718566894531, "global_step": 41863, "epoch": 996} {"train_loss": -5.5131144523620605, "global_step": 41864, "epoch": 996} {"train_loss": -5.746946334838867, "global_step": 41865, "epoch": 996} {"train_loss": -5.675065040588379, "global_step": 41866, "epoch": 996} {"train_loss": -5.653644561767578, "global_step": 41867, "epoch": 996} {"train_loss": -5.680405616760254, "global_step": 41868, "epoch": 996} {"train_loss": -5.6795806884765625, "global_step": 41869, "epoch": 996} {"train_loss": -5.65385103225708, "global_step": 41870, "epoch": 996} {"train_loss": -5.735189437866211, "global_step": 41871, "epoch": 996} {"train_loss": -5.633144378662109, "global_step": 41872, "epoch": 996} {"train_loss": -5.652854385830107, "global_step": 41873, "epoch": 996, "val_loss": 61871.7265625} {"train_loss": -5.596258163452148, "global_step": 41874, "epoch": 997} {"train_loss": -5.619544982910156, "global_step": 41875, "epoch": 997} {"train_loss": -5.9110517501831055, "global_step": 41876, "epoch": 997} {"train_loss": -5.782038688659668, "global_step": 41877, "epoch": 997} {"train_loss": -5.637576103210449, "global_step": 41878, "epoch": 997} {"train_loss": -5.512414455413818, "global_step": 41879, "epoch": 997} {"train_loss": -5.711123943328857, "global_step": 41880, "epoch": 997} {"train_loss": -5.566112995147705, "global_step": 41881, "epoch": 997} {"train_loss": -5.679430961608887, "global_step": 41882, "epoch": 997} {"train_loss": -5.7676167488098145, "global_step": 41883, "epoch": 997} {"train_loss": -5.715380668640137, "global_step": 41884, "epoch": 997} {"train_loss": -5.567068576812744, "global_step": 41885, "epoch": 997} {"train_loss": -5.725747108459473, "global_step": 41886, "epoch": 997} {"train_loss": -5.649616241455078, "global_step": 41887, "epoch": 997} {"train_loss": -5.637170791625977, "global_step": 41888, "epoch": 997} {"train_loss": -5.668581008911133, "global_step": 41889, "epoch": 997} {"train_loss": -5.675800323486328, "global_step": 41890, "epoch": 997} {"train_loss": -5.744349956512451, "global_step": 41891, "epoch": 997} {"train_loss": -5.727834701538086, "global_step": 41892, "epoch": 997} {"train_loss": -5.7504754066467285, "global_step": 41893, "epoch": 997} {"train_loss": -5.561062812805176, "global_step": 41894, "epoch": 997} {"train_loss": -5.7471418380737305, "global_step": 41895, "epoch": 997} {"train_loss": -5.641690254211426, "global_step": 41896, "epoch": 997} {"train_loss": -5.669089317321777, "global_step": 41897, "epoch": 997} {"train_loss": -5.720047950744629, "global_step": 41898, "epoch": 997} {"train_loss": -5.687957763671875, "global_step": 41899, "epoch": 997} {"train_loss": -5.762409210205078, "global_step": 41900, "epoch": 997} {"train_loss": -5.790506362915039, "global_step": 41901, "epoch": 997} {"train_loss": -5.753515243530273, "global_step": 41902, "epoch": 997} {"train_loss": -5.786406517028809, "global_step": 41903, "epoch": 997} {"train_loss": -5.607760429382324, "global_step": 41904, "epoch": 997} {"train_loss": -5.733713626861572, "global_step": 41905, "epoch": 997} {"train_loss": -5.684906959533691, "global_step": 41906, "epoch": 997} {"train_loss": -5.641849994659424, "global_step": 41907, "epoch": 997} {"train_loss": -5.589090347290039, "global_step": 41908, "epoch": 997} {"train_loss": -5.701204299926758, "global_step": 41909, "epoch": 997} {"train_loss": -5.696419715881348, "global_step": 41910, "epoch": 997} {"train_loss": -5.690929412841797, "global_step": 41911, "epoch": 997} {"train_loss": -5.701974391937256, "global_step": 41912, "epoch": 997} {"train_loss": -5.532040119171143, "global_step": 41913, "epoch": 997} {"train_loss": -5.730799198150635, "global_step": 41914, "epoch": 997} {"train_loss": -5.686051993142991, "global_step": 41915, "epoch": 997, "val_loss": 61723.6640625} {"train_loss": -5.664111137390137, "global_step": 41916, "epoch": 998} {"train_loss": -5.576872825622559, "global_step": 41917, "epoch": 998} {"train_loss": -5.678546905517578, "global_step": 41918, "epoch": 998} {"train_loss": -5.488597869873047, "global_step": 41919, "epoch": 998} {"train_loss": -5.562166213989258, "global_step": 41920, "epoch": 998} {"train_loss": -5.6214213371276855, "global_step": 41921, "epoch": 998} {"train_loss": -5.64039945602417, "global_step": 41922, "epoch": 998} {"train_loss": -5.572498321533203, "global_step": 41923, "epoch": 998} {"train_loss": -5.7511444091796875, "global_step": 41924, "epoch": 998} {"train_loss": -5.564484596252441, "global_step": 41925, "epoch": 998} {"train_loss": -5.617485523223877, "global_step": 41926, "epoch": 998} {"train_loss": -5.674032688140869, "global_step": 41927, "epoch": 998} {"train_loss": -5.6318745613098145, "global_step": 41928, "epoch": 998} {"train_loss": -5.813371181488037, "global_step": 41929, "epoch": 998} {"train_loss": -5.620340824127197, "global_step": 41930, "epoch": 998} {"train_loss": -5.670431613922119, "global_step": 41931, "epoch": 998} {"train_loss": -5.5931901931762695, "global_step": 41932, "epoch": 998} {"train_loss": -5.709235668182373, "global_step": 41933, "epoch": 998} {"train_loss": -5.8121161460876465, "global_step": 41934, "epoch": 998} {"train_loss": -5.636284351348877, "global_step": 41935, "epoch": 998} {"train_loss": -5.605288982391357, "global_step": 41936, "epoch": 998} {"train_loss": -5.6201276779174805, "global_step": 41937, "epoch": 998} {"train_loss": -5.632245063781738, "global_step": 41938, "epoch": 998} {"train_loss": -5.607666969299316, "global_step": 41939, "epoch": 998} {"train_loss": -5.7104291915893555, "global_step": 41940, "epoch": 998} {"train_loss": -5.721335411071777, "global_step": 41941, "epoch": 998} {"train_loss": -5.773052215576172, "global_step": 41942, "epoch": 998} {"train_loss": -5.581543445587158, "global_step": 41943, "epoch": 998} {"train_loss": -5.584812164306641, "global_step": 41944, "epoch": 998} {"train_loss": -5.790469169616699, "global_step": 41945, "epoch": 998} {"train_loss": -5.637679576873779, "global_step": 41946, "epoch": 998} {"train_loss": -5.788043022155762, "global_step": 41947, "epoch": 998} {"train_loss": -5.684366703033447, "global_step": 41948, "epoch": 998} {"train_loss": -5.692456245422363, "global_step": 41949, "epoch": 998} {"train_loss": -5.715792655944824, "global_step": 41950, "epoch": 998} {"train_loss": -5.68275785446167, "global_step": 41951, "epoch": 998} {"train_loss": -5.747950077056885, "global_step": 41952, "epoch": 998} {"train_loss": -5.646188735961914, "global_step": 41953, "epoch": 998} {"train_loss": -5.723529815673828, "global_step": 41954, "epoch": 998} {"train_loss": -5.678211212158203, "global_step": 41955, "epoch": 998} {"train_loss": -5.702035903930664, "global_step": 41956, "epoch": 998} {"train_loss": -5.6641035079956055, "global_step": 41957, "epoch": 998, "val_loss": 61778.06640625} {"train_loss": -5.600335121154785, "global_step": 41958, "epoch": 999} {"train_loss": -5.680278778076172, "global_step": 41959, "epoch": 999} {"train_loss": -5.574873924255371, "global_step": 41960, "epoch": 999} {"train_loss": -5.749177932739258, "global_step": 41961, "epoch": 999} {"train_loss": -5.688813209533691, "global_step": 41962, "epoch": 999} {"train_loss": -5.542009353637695, "global_step": 41963, "epoch": 999} {"train_loss": -5.698107719421387, "global_step": 41964, "epoch": 999} {"train_loss": -5.563353061676025, "global_step": 41965, "epoch": 999} {"train_loss": -5.7176513671875, "global_step": 41966, "epoch": 999} {"train_loss": -5.637744903564453, "global_step": 41967, "epoch": 999} {"train_loss": -5.654791831970215, "global_step": 41968, "epoch": 999} {"train_loss": -5.680490493774414, "global_step": 41969, "epoch": 999} {"train_loss": -5.704084396362305, "global_step": 41970, "epoch": 999} {"train_loss": -5.649932861328125, "global_step": 41971, "epoch": 999} {"train_loss": -5.727595329284668, "global_step": 41972, "epoch": 999} {"train_loss": -5.616921424865723, "global_step": 41973, "epoch": 999} {"train_loss": -5.548954010009766, "global_step": 41974, "epoch": 999} {"train_loss": -5.752877712249756, "global_step": 41975, "epoch": 999} {"train_loss": -5.542819023132324, "global_step": 41976, "epoch": 999} {"train_loss": -5.660923957824707, "global_step": 41977, "epoch": 999} {"train_loss": -5.76432466506958, "global_step": 41978, "epoch": 999} {"train_loss": -5.751638412475586, "global_step": 41979, "epoch": 999} {"train_loss": -5.658838748931885, "global_step": 41980, "epoch": 999} {"train_loss": -5.751696586608887, "global_step": 41981, "epoch": 999} {"train_loss": -5.6481146812438965, "global_step": 41982, "epoch": 999} {"train_loss": -5.603131294250488, "global_step": 41983, "epoch": 999} {"train_loss": -5.685977935791016, "global_step": 41984, "epoch": 999} {"train_loss": -5.678521633148193, "global_step": 41985, "epoch": 999} {"train_loss": -5.644529342651367, "global_step": 41986, "epoch": 999} {"train_loss": -5.570209980010986, "global_step": 41987, "epoch": 999} {"train_loss": -5.714315414428711, "global_step": 41988, "epoch": 999} {"train_loss": -5.610161304473877, "global_step": 41989, "epoch": 999} {"train_loss": -5.68358039855957, "global_step": 41990, "epoch": 999} {"train_loss": -5.630083084106445, "global_step": 41991, "epoch": 999} {"train_loss": -5.6842451095581055, "global_step": 41992, "epoch": 999} {"train_loss": -5.7516865730285645, "global_step": 41993, "epoch": 999} {"train_loss": -5.71512508392334, "global_step": 41994, "epoch": 999} {"train_loss": -5.614743232727051, "global_step": 41995, "epoch": 999} {"train_loss": -5.755797863006592, "global_step": 41996, "epoch": 999} {"train_loss": -5.597094535827637, "global_step": 41997, "epoch": 999} {"train_loss": -5.544490337371826, "global_step": 41998, "epoch": 999} {"train_loss": -5.660887638727824, "global_step": 41999, "epoch": 999, "val_loss": 61628.703125} {"train_loss": -5.7473225593566895, "global_step": 42000, "epoch": 1000} {"train_loss": -5.773562908172607, "global_step": 42001, "epoch": 1000} {"train_loss": -5.647774696350098, "global_step": 42002, "epoch": 1000} {"train_loss": -5.636500358581543, "global_step": 42003, "epoch": 1000} {"train_loss": -5.663128852844238, "global_step": 42004, "epoch": 1000} {"train_loss": -5.663921356201172, "global_step": 42005, "epoch": 1000} {"train_loss": -5.598902702331543, "global_step": 42006, "epoch": 1000} {"train_loss": -5.776147842407227, "global_step": 42007, "epoch": 1000} {"train_loss": -5.688105583190918, "global_step": 42008, "epoch": 1000} {"train_loss": -5.700303554534912, "global_step": 42009, "epoch": 1000} {"train_loss": -5.641436576843262, "global_step": 42010, "epoch": 1000} {"train_loss": -5.755786895751953, "global_step": 42011, "epoch": 1000} {"train_loss": -5.6623759269714355, "global_step": 42012, "epoch": 1000} {"train_loss": -5.612997055053711, "global_step": 42013, "epoch": 1000} {"train_loss": -5.6174774169921875, "global_step": 42014, "epoch": 1000} {"train_loss": -5.53089714050293, "global_step": 42015, "epoch": 1000} {"train_loss": -5.6246843338012695, "global_step": 42016, "epoch": 1000} {"train_loss": -5.745547294616699, "global_step": 42017, "epoch": 1000} {"train_loss": -5.604400634765625, "global_step": 42018, "epoch": 1000} {"train_loss": -5.509837627410889, "global_step": 42019, "epoch": 1000} {"train_loss": -5.803466320037842, "global_step": 42020, "epoch": 1000} {"train_loss": -5.65720272064209, "global_step": 42021, "epoch": 1000} {"train_loss": -5.594747543334961, "global_step": 42022, "epoch": 1000} {"train_loss": -5.689223289489746, "global_step": 42023, "epoch": 1000} {"train_loss": -5.625619888305664, "global_step": 42024, "epoch": 1000} {"train_loss": -5.753920555114746, "global_step": 42025, "epoch": 1000} {"train_loss": -5.685537338256836, "global_step": 42026, "epoch": 1000} {"train_loss": -5.691987037658691, "global_step": 42027, "epoch": 1000} {"train_loss": -5.637972831726074, "global_step": 42028, "epoch": 1000} {"train_loss": -5.596229553222656, "global_step": 42029, "epoch": 1000} {"train_loss": -5.6790924072265625, "global_step": 42030, "epoch": 1000} {"train_loss": -5.675107955932617, "global_step": 42031, "epoch": 1000} {"train_loss": -5.679891586303711, "global_step": 42032, "epoch": 1000} {"train_loss": -5.690776824951172, "global_step": 42033, "epoch": 1000} {"train_loss": -5.589423179626465, "global_step": 42034, "epoch": 1000} {"train_loss": -5.656865119934082, "global_step": 42035, "epoch": 1000} {"train_loss": -5.524603843688965, "global_step": 42036, "epoch": 1000} {"train_loss": -5.659247398376465, "global_step": 42037, "epoch": 1000} {"train_loss": -5.677170753479004, "global_step": 42038, "epoch": 1000} {"train_loss": -5.702086448669434, "global_step": 42039, "epoch": 1000} {"train_loss": -5.713253021240234, "global_step": 42040, "epoch": 1000} {"train_loss": -5.658922445206415, "global_step": 42041, "epoch": 1000, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.5461756684777644, "train/sim_max_reward_2": 0.42729761947028594, "train/sim_max_reward_3": 0.1130570594954234, "train/sim_max_reward_4": 0.8235718760913548, "train/sim_max_reward_5": 0.577991948822858, "test/sim_max_reward_4300000": 0.3425102869542606, "test/sim_max_reward_4300001": 0.2736732516519333, "test/sim_max_reward_4300002": 0.43560188833654223, "test/sim_max_reward_4300003": 0.602389491863466, "test/sim_max_reward_4300004": 0.6647353572008565, "test/sim_max_reward_4300005": 0.7114615813248923, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.7095904917879237, "test/sim_max_reward_4300008": 0.7125449184212929, "test/sim_max_reward_4300009": 0.7753873037667643, "test/sim_max_reward_4300010": 0.4786849103294403, "test/sim_max_reward_4300011": 0.8739140851379338, "test/sim_max_reward_4300012": 0.6288888488992013, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 0.5946883574537725, "test/sim_max_reward_4300015": 0.5626341033862224, "test/sim_max_reward_4300016": 0.1106945166254321, "test/sim_max_reward_4300017": 0.49485780366334603, "test/sim_max_reward_4300018": 0.427607554494827, "test/sim_max_reward_4300019": 0.1860511627939772, "test/sim_max_reward_4300020": 0.3127016594354455, "test/sim_max_reward_4300021": 0.8778592206929993, "test/sim_max_reward_4300022": 0.21427755799724796, "test/sim_max_reward_4300023": 0.3568023062703421, "test/sim_max_reward_4300024": 0.5297130832260497, "test/sim_max_reward_4300025": 0.3652258919867038, "test/sim_max_reward_4300026": 0.17033371017263207, "test/sim_max_reward_4300027": 0.025131817423684817, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.3285099994019225, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.08999541554690058, "test/sim_max_reward_4300032": 0.8270364608679808, "test/sim_max_reward_4300033": 0.43276064874357695, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9712512429731289, "test/sim_max_reward_4300038": 0.9454368637190865, "test/sim_max_reward_4300039": 0.688415590298442, "test/sim_max_reward_4300040": 0.26455205665311865, "test/sim_max_reward_4300041": 0.4553272296434258, "test/sim_max_reward_4300042": 0.6760103952149052, "test/sim_max_reward_4300043": 0.2054464229366993, "test/sim_max_reward_4300044": 0.7647670341704095, "test/sim_max_reward_4300045": 0.17081040659987726, "test/sim_max_reward_4300046": 0.9919095461352783, "test/sim_max_reward_4300047": 0.1519135175074061, "test/sim_max_reward_4300048": 0.7614002140083097, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.44639861149395643, "test/mean_score": 0.44725396642562265, "val_loss": 62023.78125} {"train_loss": -5.6259870529174805, "global_step": 42042, "epoch": 1001} {"train_loss": -5.653410911560059, "global_step": 42043, "epoch": 1001} {"train_loss": -5.667616844177246, "global_step": 42044, "epoch": 1001} {"train_loss": -5.648349761962891, "global_step": 42045, "epoch": 1001} {"train_loss": -5.722020149230957, "global_step": 42046, "epoch": 1001} {"train_loss": -5.650605201721191, "global_step": 42047, "epoch": 1001} {"train_loss": -5.794069766998291, "global_step": 42048, "epoch": 1001} {"train_loss": -5.7085652351379395, "global_step": 42049, "epoch": 1001} {"train_loss": -5.715993881225586, "global_step": 42050, "epoch": 1001} {"train_loss": -5.671934127807617, "global_step": 42051, "epoch": 1001} {"train_loss": -5.674318313598633, "global_step": 42052, "epoch": 1001} {"train_loss": -5.721192359924316, "global_step": 42053, "epoch": 1001} {"train_loss": -5.701722145080566, "global_step": 42054, "epoch": 1001} {"train_loss": -5.616263389587402, "global_step": 42055, "epoch": 1001} {"train_loss": -5.711700439453125, "global_step": 42056, "epoch": 1001} {"train_loss": -5.486910820007324, "global_step": 42057, "epoch": 1001} {"train_loss": -5.647687911987305, "global_step": 42058, "epoch": 1001} {"train_loss": -5.6449995040893555, "global_step": 42059, "epoch": 1001} {"train_loss": -5.611567497253418, "global_step": 42060, "epoch": 1001} {"train_loss": -5.612909317016602, "global_step": 42061, "epoch": 1001} {"train_loss": -5.507209777832031, "global_step": 42062, "epoch": 1001} {"train_loss": -5.6768293380737305, "global_step": 42063, "epoch": 1001} {"train_loss": -5.789275169372559, "global_step": 42064, "epoch": 1001} {"train_loss": -5.80325984954834, "global_step": 42065, "epoch": 1001} {"train_loss": -5.611017227172852, "global_step": 42066, "epoch": 1001} {"train_loss": -5.714511871337891, "global_step": 42067, "epoch": 1001} {"train_loss": -5.571250915527344, "global_step": 42068, "epoch": 1001} {"train_loss": -5.643673419952393, "global_step": 42069, "epoch": 1001} {"train_loss": -5.7527265548706055, "global_step": 42070, "epoch": 1001} {"train_loss": -5.636040687561035, "global_step": 42071, "epoch": 1001} {"train_loss": -5.719967842102051, "global_step": 42072, "epoch": 1001} {"train_loss": -5.549216270446777, "global_step": 42073, "epoch": 1001} {"train_loss": -5.665112018585205, "global_step": 42074, "epoch": 1001} {"train_loss": -5.621894359588623, "global_step": 42075, "epoch": 1001} {"train_loss": -5.736922264099121, "global_step": 42076, "epoch": 1001} {"train_loss": -5.640472888946533, "global_step": 42077, "epoch": 1001} {"train_loss": -5.641546249389648, "global_step": 42078, "epoch": 1001} {"train_loss": -5.5777692794799805, "global_step": 42079, "epoch": 1001} {"train_loss": -5.620264530181885, "global_step": 42080, "epoch": 1001} {"train_loss": -5.641777038574219, "global_step": 42081, "epoch": 1001} {"train_loss": -5.522339820861816, "global_step": 42082, "epoch": 1001} {"train_loss": -5.657492285683041, "global_step": 42083, "epoch": 1001, "val_loss": 62075.17578125} {"train_loss": -5.69462776184082, "global_step": 42084, "epoch": 1002} {"train_loss": -5.638211250305176, "global_step": 42085, "epoch": 1002} {"train_loss": -5.719404220581055, "global_step": 42086, "epoch": 1002} {"train_loss": -5.682323932647705, "global_step": 42087, "epoch": 1002} {"train_loss": -5.742644309997559, "global_step": 42088, "epoch": 1002} {"train_loss": -5.673001289367676, "global_step": 42089, "epoch": 1002} {"train_loss": -5.7350850105285645, "global_step": 42090, "epoch": 1002} {"train_loss": -5.656092643737793, "global_step": 42091, "epoch": 1002} {"train_loss": -5.76157283782959, "global_step": 42092, "epoch": 1002} {"train_loss": -5.739309310913086, "global_step": 42093, "epoch": 1002} {"train_loss": -5.679786682128906, "global_step": 42094, "epoch": 1002} {"train_loss": -5.712703704833984, "global_step": 42095, "epoch": 1002} {"train_loss": -5.662442207336426, "global_step": 42096, "epoch": 1002} {"train_loss": -5.612335205078125, "global_step": 42097, "epoch": 1002} {"train_loss": -5.655004501342773, "global_step": 42098, "epoch": 1002} {"train_loss": -5.635366439819336, "global_step": 42099, "epoch": 1002} {"train_loss": -5.547940731048584, "global_step": 42100, "epoch": 1002} {"train_loss": -5.6521735191345215, "global_step": 42101, "epoch": 1002} {"train_loss": -5.760262489318848, "global_step": 42102, "epoch": 1002} {"train_loss": -5.779994964599609, "global_step": 42103, "epoch": 1002} {"train_loss": -5.750618934631348, "global_step": 42104, "epoch": 1002} {"train_loss": -5.7890095710754395, "global_step": 42105, "epoch": 1002} {"train_loss": -5.785465240478516, "global_step": 42106, "epoch": 1002} {"train_loss": -5.692876815795898, "global_step": 42107, "epoch": 1002} {"train_loss": -5.770090579986572, "global_step": 42108, "epoch": 1002} {"train_loss": -5.750886917114258, "global_step": 42109, "epoch": 1002} {"train_loss": -5.5898542404174805, "global_step": 42110, "epoch": 1002} {"train_loss": -5.715145111083984, "global_step": 42111, "epoch": 1002} {"train_loss": -5.727503299713135, "global_step": 42112, "epoch": 1002} {"train_loss": -5.612222671508789, "global_step": 42113, "epoch": 1002} {"train_loss": -5.5439043045043945, "global_step": 42114, "epoch": 1002} {"train_loss": -5.613792896270752, "global_step": 42115, "epoch": 1002} {"train_loss": -5.585568428039551, "global_step": 42116, "epoch": 1002} {"train_loss": -5.551483631134033, "global_step": 42117, "epoch": 1002} {"train_loss": -5.486376762390137, "global_step": 42118, "epoch": 1002} {"train_loss": -5.611724853515625, "global_step": 42119, "epoch": 1002} {"train_loss": -5.4024248123168945, "global_step": 42120, "epoch": 1002} {"train_loss": -5.601980209350586, "global_step": 42121, "epoch": 1002} {"train_loss": -5.608635902404785, "global_step": 42122, "epoch": 1002} {"train_loss": -5.464247703552246, "global_step": 42123, "epoch": 1002} {"train_loss": -5.5779829025268555, "global_step": 42124, "epoch": 1002} {"train_loss": -5.654588120324271, "global_step": 42125, "epoch": 1002, "val_loss": 62093.38671875} {"train_loss": -5.569292068481445, "global_step": 42126, "epoch": 1003} {"train_loss": -5.70876407623291, "global_step": 42127, "epoch": 1003} {"train_loss": -5.628823280334473, "global_step": 42128, "epoch": 1003} {"train_loss": -5.570804119110107, "global_step": 42129, "epoch": 1003} {"train_loss": -5.685988903045654, "global_step": 42130, "epoch": 1003} {"train_loss": -5.600915908813477, "global_step": 42131, "epoch": 1003} {"train_loss": -5.589432716369629, "global_step": 42132, "epoch": 1003} {"train_loss": -5.710577011108398, "global_step": 42133, "epoch": 1003} {"train_loss": -5.57137393951416, "global_step": 42134, "epoch": 1003} {"train_loss": -5.625792503356934, "global_step": 42135, "epoch": 1003} {"train_loss": -5.617014408111572, "global_step": 42136, "epoch": 1003} {"train_loss": -5.725900650024414, "global_step": 42137, "epoch": 1003} {"train_loss": -5.6109538078308105, "global_step": 42138, "epoch": 1003} {"train_loss": -5.691670894622803, "global_step": 42139, "epoch": 1003} {"train_loss": -5.545750617980957, "global_step": 42140, "epoch": 1003} {"train_loss": -5.585212707519531, "global_step": 42141, "epoch": 1003} {"train_loss": -5.524285316467285, "global_step": 42142, "epoch": 1003} {"train_loss": -5.626652240753174, "global_step": 42143, "epoch": 1003} {"train_loss": -5.661634922027588, "global_step": 42144, "epoch": 1003} {"train_loss": -5.737968921661377, "global_step": 42145, "epoch": 1003} {"train_loss": -5.573108196258545, "global_step": 42146, "epoch": 1003} {"train_loss": -5.643388748168945, "global_step": 42147, "epoch": 1003} {"train_loss": -5.721209526062012, "global_step": 42148, "epoch": 1003} {"train_loss": -5.558337688446045, "global_step": 42149, "epoch": 1003} {"train_loss": -5.7756805419921875, "global_step": 42150, "epoch": 1003} {"train_loss": -5.69654655456543, "global_step": 42151, "epoch": 1003} {"train_loss": -5.790409088134766, "global_step": 42152, "epoch": 1003} {"train_loss": -5.680896759033203, "global_step": 42153, "epoch": 1003} {"train_loss": -5.63419246673584, "global_step": 42154, "epoch": 1003} {"train_loss": -5.602777481079102, "global_step": 42155, "epoch": 1003} {"train_loss": -5.745545387268066, "global_step": 42156, "epoch": 1003} {"train_loss": -5.6774444580078125, "global_step": 42157, "epoch": 1003} {"train_loss": -5.619743824005127, "global_step": 42158, "epoch": 1003} {"train_loss": -5.686321258544922, "global_step": 42159, "epoch": 1003} {"train_loss": -5.698737621307373, "global_step": 42160, "epoch": 1003} {"train_loss": -5.694428443908691, "global_step": 42161, "epoch": 1003} {"train_loss": -5.743142127990723, "global_step": 42162, "epoch": 1003} {"train_loss": -5.760820388793945, "global_step": 42163, "epoch": 1003} {"train_loss": -5.68680477142334, "global_step": 42164, "epoch": 1003} {"train_loss": -5.683942794799805, "global_step": 42165, "epoch": 1003} {"train_loss": -5.6841206550598145, "global_step": 42166, "epoch": 1003} {"train_loss": -5.657753161021641, "global_step": 42167, "epoch": 1003, "val_loss": 61805.1171875} {"train_loss": -5.722880840301514, "global_step": 42168, "epoch": 1004} {"train_loss": -5.6641950607299805, "global_step": 42169, "epoch": 1004} {"train_loss": -5.739952564239502, "global_step": 42170, "epoch": 1004} {"train_loss": -5.7034220695495605, "global_step": 42171, "epoch": 1004} {"train_loss": -5.664144515991211, "global_step": 42172, "epoch": 1004} {"train_loss": -5.643930435180664, "global_step": 42173, "epoch": 1004} {"train_loss": -5.728846549987793, "global_step": 42174, "epoch": 1004} {"train_loss": -5.668044567108154, "global_step": 42175, "epoch": 1004} {"train_loss": -5.628179550170898, "global_step": 42176, "epoch": 1004} {"train_loss": -5.622939109802246, "global_step": 42177, "epoch": 1004} {"train_loss": -5.676224708557129, "global_step": 42178, "epoch": 1004} {"train_loss": -5.665942668914795, "global_step": 42179, "epoch": 1004} {"train_loss": -5.746150970458984, "global_step": 42180, "epoch": 1004} {"train_loss": -5.6624345779418945, "global_step": 42181, "epoch": 1004} {"train_loss": -5.812129974365234, "global_step": 42182, "epoch": 1004} {"train_loss": -5.654984474182129, "global_step": 42183, "epoch": 1004} {"train_loss": -5.820157051086426, "global_step": 42184, "epoch": 1004} {"train_loss": -5.665631294250488, "global_step": 42185, "epoch": 1004} {"train_loss": -5.724443435668945, "global_step": 42186, "epoch": 1004} {"train_loss": -5.627972602844238, "global_step": 42187, "epoch": 1004} {"train_loss": -5.738168239593506, "global_step": 42188, "epoch": 1004} {"train_loss": -5.609200477600098, "global_step": 42189, "epoch": 1004} {"train_loss": -5.580784797668457, "global_step": 42190, "epoch": 1004} {"train_loss": -5.710601806640625, "global_step": 42191, "epoch": 1004} {"train_loss": -5.736342430114746, "global_step": 42192, "epoch": 1004} {"train_loss": -5.697145938873291, "global_step": 42193, "epoch": 1004} {"train_loss": -5.773109436035156, "global_step": 42194, "epoch": 1004} {"train_loss": -5.577906131744385, "global_step": 42195, "epoch": 1004} {"train_loss": -5.699256896972656, "global_step": 42196, "epoch": 1004} {"train_loss": -5.628288269042969, "global_step": 42197, "epoch": 1004} {"train_loss": -5.785530090332031, "global_step": 42198, "epoch": 1004} {"train_loss": -5.679522514343262, "global_step": 42199, "epoch": 1004} {"train_loss": -5.768304347991943, "global_step": 42200, "epoch": 1004} {"train_loss": -5.566571235656738, "global_step": 42201, "epoch": 1004} {"train_loss": -5.707568645477295, "global_step": 42202, "epoch": 1004} {"train_loss": -5.67153787612915, "global_step": 42203, "epoch": 1004} {"train_loss": -5.687549591064453, "global_step": 42204, "epoch": 1004} {"train_loss": -5.560720920562744, "global_step": 42205, "epoch": 1004} {"train_loss": -5.656858444213867, "global_step": 42206, "epoch": 1004} {"train_loss": -5.679359436035156, "global_step": 42207, "epoch": 1004} {"train_loss": -5.729631423950195, "global_step": 42208, "epoch": 1004} {"train_loss": -5.684876510075161, "global_step": 42209, "epoch": 1004, "val_loss": 61705.12109375} {"train_loss": -5.669923782348633, "global_step": 42210, "epoch": 1005} {"train_loss": -5.742494583129883, "global_step": 42211, "epoch": 1005} {"train_loss": -5.7202558517456055, "global_step": 42212, "epoch": 1005} {"train_loss": -5.7944464683532715, "global_step": 42213, "epoch": 1005} {"train_loss": -5.640515327453613, "global_step": 42214, "epoch": 1005} {"train_loss": -5.522172451019287, "global_step": 42215, "epoch": 1005} {"train_loss": -5.70658016204834, "global_step": 42216, "epoch": 1005} {"train_loss": -5.697727203369141, "global_step": 42217, "epoch": 1005} {"train_loss": -5.614138126373291, "global_step": 42218, "epoch": 1005} {"train_loss": -5.7242631912231445, "global_step": 42219, "epoch": 1005} {"train_loss": -5.5362467765808105, "global_step": 42220, "epoch": 1005} {"train_loss": -5.584603309631348, "global_step": 42221, "epoch": 1005} {"train_loss": -5.720796585083008, "global_step": 42222, "epoch": 1005} {"train_loss": -5.745114803314209, "global_step": 42223, "epoch": 1005} {"train_loss": -5.6578192710876465, "global_step": 42224, "epoch": 1005} {"train_loss": -5.641911029815674, "global_step": 42225, "epoch": 1005} {"train_loss": -5.6739983558654785, "global_step": 42226, "epoch": 1005} {"train_loss": -5.590380668640137, "global_step": 42227, "epoch": 1005} {"train_loss": -5.6054301261901855, "global_step": 42228, "epoch": 1005} {"train_loss": -5.671504497528076, "global_step": 42229, "epoch": 1005} {"train_loss": -5.6997551918029785, "global_step": 42230, "epoch": 1005} {"train_loss": -5.688022136688232, "global_step": 42231, "epoch": 1005} {"train_loss": -5.665689468383789, "global_step": 42232, "epoch": 1005} {"train_loss": -5.723321437835693, "global_step": 42233, "epoch": 1005} {"train_loss": -5.604883193969727, "global_step": 42234, "epoch": 1005} {"train_loss": -5.611577987670898, "global_step": 42235, "epoch": 1005} {"train_loss": -5.707094192504883, "global_step": 42236, "epoch": 1005} {"train_loss": -5.745203971862793, "global_step": 42237, "epoch": 1005} {"train_loss": -5.694355487823486, "global_step": 42238, "epoch": 1005} {"train_loss": -5.61359977722168, "global_step": 42239, "epoch": 1005} {"train_loss": -5.698450088500977, "global_step": 42240, "epoch": 1005} {"train_loss": -5.500607013702393, "global_step": 42241, "epoch": 1005} {"train_loss": -5.782248497009277, "global_step": 42242, "epoch": 1005} {"train_loss": -5.60456657409668, "global_step": 42243, "epoch": 1005} {"train_loss": -5.599752902984619, "global_step": 42244, "epoch": 1005} {"train_loss": -5.6434712409973145, "global_step": 42245, "epoch": 1005} {"train_loss": -5.4816813468933105, "global_step": 42246, "epoch": 1005} {"train_loss": -5.592687606811523, "global_step": 42247, "epoch": 1005} {"train_loss": -5.701288223266602, "global_step": 42248, "epoch": 1005} {"train_loss": -5.64766263961792, "global_step": 42249, "epoch": 1005} {"train_loss": -5.716977119445801, "global_step": 42250, "epoch": 1005} {"train_loss": -5.658470380873907, "global_step": 42251, "epoch": 1005, "val_loss": 61499.86328125} {"train_loss": -5.710130214691162, "global_step": 42252, "epoch": 1006} {"train_loss": -5.518179893493652, "global_step": 42253, "epoch": 1006} {"train_loss": -5.714972496032715, "global_step": 42254, "epoch": 1006} {"train_loss": -5.575909614562988, "global_step": 42255, "epoch": 1006} {"train_loss": -5.654080390930176, "global_step": 42256, "epoch": 1006} {"train_loss": -5.764240264892578, "global_step": 42257, "epoch": 1006} {"train_loss": -5.671627521514893, "global_step": 42258, "epoch": 1006} {"train_loss": -5.67576265335083, "global_step": 42259, "epoch": 1006} {"train_loss": -5.7806291580200195, "global_step": 42260, "epoch": 1006} {"train_loss": -5.706172466278076, "global_step": 42261, "epoch": 1006} {"train_loss": -5.672515392303467, "global_step": 42262, "epoch": 1006} {"train_loss": -5.7165069580078125, "global_step": 42263, "epoch": 1006} {"train_loss": -5.737292289733887, "global_step": 42264, "epoch": 1006} {"train_loss": -5.71891450881958, "global_step": 42265, "epoch": 1006} {"train_loss": -5.557729721069336, "global_step": 42266, "epoch": 1006} {"train_loss": -5.703392028808594, "global_step": 42267, "epoch": 1006} {"train_loss": -5.601126194000244, "global_step": 42268, "epoch": 1006} {"train_loss": -5.623928070068359, "global_step": 42269, "epoch": 1006} {"train_loss": -5.688089370727539, "global_step": 42270, "epoch": 1006} {"train_loss": -5.700600624084473, "global_step": 42271, "epoch": 1006} {"train_loss": -5.832786560058594, "global_step": 42272, "epoch": 1006} {"train_loss": -5.671031475067139, "global_step": 42273, "epoch": 1006} {"train_loss": -5.7476725578308105, "global_step": 42274, "epoch": 1006} {"train_loss": -5.7620038986206055, "global_step": 42275, "epoch": 1006} {"train_loss": -5.774196147918701, "global_step": 42276, "epoch": 1006} {"train_loss": -5.676827907562256, "global_step": 42277, "epoch": 1006} {"train_loss": -5.6480631828308105, "global_step": 42278, "epoch": 1006} {"train_loss": -5.579113006591797, "global_step": 42279, "epoch": 1006} {"train_loss": -5.576315879821777, "global_step": 42280, "epoch": 1006} {"train_loss": -5.632688522338867, "global_step": 42281, "epoch": 1006} {"train_loss": -5.70607852935791, "global_step": 42282, "epoch": 1006} {"train_loss": -5.694952011108398, "global_step": 42283, "epoch": 1006} {"train_loss": -5.776728630065918, "global_step": 42284, "epoch": 1006} {"train_loss": -5.635378837585449, "global_step": 42285, "epoch": 1006} {"train_loss": -5.731356620788574, "global_step": 42286, "epoch": 1006} {"train_loss": -5.782343864440918, "global_step": 42287, "epoch": 1006} {"train_loss": -5.672094345092773, "global_step": 42288, "epoch": 1006} {"train_loss": -5.669066429138184, "global_step": 42289, "epoch": 1006} {"train_loss": -5.661548614501953, "global_step": 42290, "epoch": 1006} {"train_loss": -5.652173042297363, "global_step": 42291, "epoch": 1006} {"train_loss": -5.704620361328125, "global_step": 42292, "epoch": 1006} {"train_loss": -5.686535347075689, "global_step": 42293, "epoch": 1006, "val_loss": 61717.90234375} {"train_loss": -5.822926998138428, "global_step": 42294, "epoch": 1007} {"train_loss": -5.8008880615234375, "global_step": 42295, "epoch": 1007} {"train_loss": -5.618988037109375, "global_step": 42296, "epoch": 1007} {"train_loss": -5.593321800231934, "global_step": 42297, "epoch": 1007} {"train_loss": -5.68171501159668, "global_step": 42298, "epoch": 1007} {"train_loss": -5.623810768127441, "global_step": 42299, "epoch": 1007} {"train_loss": -5.7647504806518555, "global_step": 42300, "epoch": 1007} {"train_loss": -5.712275505065918, "global_step": 42301, "epoch": 1007} {"train_loss": -5.6440229415893555, "global_step": 42302, "epoch": 1007} {"train_loss": -5.666919231414795, "global_step": 42303, "epoch": 1007} {"train_loss": -5.575130462646484, "global_step": 42304, "epoch": 1007} {"train_loss": -5.722276210784912, "global_step": 42305, "epoch": 1007} {"train_loss": -5.730125427246094, "global_step": 42306, "epoch": 1007} {"train_loss": -5.580692768096924, "global_step": 42307, "epoch": 1007} {"train_loss": -5.619763374328613, "global_step": 42308, "epoch": 1007} {"train_loss": -5.595656871795654, "global_step": 42309, "epoch": 1007} {"train_loss": -5.664026260375977, "global_step": 42310, "epoch": 1007} {"train_loss": -5.68196964263916, "global_step": 42311, "epoch": 1007} {"train_loss": -5.698280334472656, "global_step": 42312, "epoch": 1007} {"train_loss": -5.631246089935303, "global_step": 42313, "epoch": 1007} {"train_loss": -5.749433517456055, "global_step": 42314, "epoch": 1007} {"train_loss": -5.505334377288818, "global_step": 42315, "epoch": 1007} {"train_loss": -5.68149995803833, "global_step": 42316, "epoch": 1007} {"train_loss": -5.588997840881348, "global_step": 42317, "epoch": 1007} {"train_loss": -5.696456432342529, "global_step": 42318, "epoch": 1007} {"train_loss": -5.542993068695068, "global_step": 42319, "epoch": 1007} {"train_loss": -5.715095520019531, "global_step": 42320, "epoch": 1007} {"train_loss": -5.65598201751709, "global_step": 42321, "epoch": 1007} {"train_loss": -5.622121810913086, "global_step": 42322, "epoch": 1007} {"train_loss": -5.7035932540893555, "global_step": 42323, "epoch": 1007} {"train_loss": -5.652340888977051, "global_step": 42324, "epoch": 1007} {"train_loss": -5.554528713226318, "global_step": 42325, "epoch": 1007} {"train_loss": -5.635190486907959, "global_step": 42326, "epoch": 1007} {"train_loss": -5.5537190437316895, "global_step": 42327, "epoch": 1007} {"train_loss": -5.646951675415039, "global_step": 42328, "epoch": 1007} {"train_loss": -5.653475761413574, "global_step": 42329, "epoch": 1007} {"train_loss": -5.683305263519287, "global_step": 42330, "epoch": 1007} {"train_loss": -5.523642063140869, "global_step": 42331, "epoch": 1007} {"train_loss": -5.639786720275879, "global_step": 42332, "epoch": 1007} {"train_loss": -5.6234869956970215, "global_step": 42333, "epoch": 1007} {"train_loss": -5.677502155303955, "global_step": 42334, "epoch": 1007} {"train_loss": -5.651281163806007, "global_step": 42335, "epoch": 1007, "val_loss": 61960.0546875} {"train_loss": -5.695121765136719, "global_step": 42336, "epoch": 1008} {"train_loss": -5.661924362182617, "global_step": 42337, "epoch": 1008} {"train_loss": -5.734580993652344, "global_step": 42338, "epoch": 1008} {"train_loss": -5.507784366607666, "global_step": 42339, "epoch": 1008} {"train_loss": -5.677095413208008, "global_step": 42340, "epoch": 1008} {"train_loss": -5.690602779388428, "global_step": 42341, "epoch": 1008} {"train_loss": -5.512383937835693, "global_step": 42342, "epoch": 1008} {"train_loss": -5.62769079208374, "global_step": 42343, "epoch": 1008} {"train_loss": -5.523619651794434, "global_step": 42344, "epoch": 1008} {"train_loss": -5.70267391204834, "global_step": 42345, "epoch": 1008} {"train_loss": -5.503478050231934, "global_step": 42346, "epoch": 1008} {"train_loss": -5.699626922607422, "global_step": 42347, "epoch": 1008} {"train_loss": -5.65986442565918, "global_step": 42348, "epoch": 1008} {"train_loss": -5.642507553100586, "global_step": 42349, "epoch": 1008} {"train_loss": -5.703978538513184, "global_step": 42350, "epoch": 1008} {"train_loss": -5.57352352142334, "global_step": 42351, "epoch": 1008} {"train_loss": -5.661784648895264, "global_step": 42352, "epoch": 1008} {"train_loss": -5.640069961547852, "global_step": 42353, "epoch": 1008} {"train_loss": -5.564387798309326, "global_step": 42354, "epoch": 1008} {"train_loss": -5.642261981964111, "global_step": 42355, "epoch": 1008} {"train_loss": -5.546976089477539, "global_step": 42356, "epoch": 1008} {"train_loss": -5.560869216918945, "global_step": 42357, "epoch": 1008} {"train_loss": -5.654116630554199, "global_step": 42358, "epoch": 1008} {"train_loss": -5.579862594604492, "global_step": 42359, "epoch": 1008} {"train_loss": -5.6048455238342285, "global_step": 42360, "epoch": 1008} {"train_loss": -5.745784759521484, "global_step": 42361, "epoch": 1008} {"train_loss": -5.487479209899902, "global_step": 42362, "epoch": 1008} {"train_loss": -5.596980094909668, "global_step": 42363, "epoch": 1008} {"train_loss": -5.5738525390625, "global_step": 42364, "epoch": 1008} {"train_loss": -5.547403812408447, "global_step": 42365, "epoch": 1008} {"train_loss": -5.731327533721924, "global_step": 42366, "epoch": 1008} {"train_loss": -5.650028228759766, "global_step": 42367, "epoch": 1008} {"train_loss": -5.68405818939209, "global_step": 42368, "epoch": 1008} {"train_loss": -5.590807914733887, "global_step": 42369, "epoch": 1008} {"train_loss": -5.610158443450928, "global_step": 42370, "epoch": 1008} {"train_loss": -5.537261009216309, "global_step": 42371, "epoch": 1008} {"train_loss": -5.695387363433838, "global_step": 42372, "epoch": 1008} {"train_loss": -5.530688285827637, "global_step": 42373, "epoch": 1008} {"train_loss": -5.6996235847473145, "global_step": 42374, "epoch": 1008} {"train_loss": -5.649290084838867, "global_step": 42375, "epoch": 1008} {"train_loss": -5.596330642700195, "global_step": 42376, "epoch": 1008} {"train_loss": -5.6233186948867075, "global_step": 42377, "epoch": 1008, "val_loss": 61615.15234375} {"train_loss": -5.483001708984375, "global_step": 42378, "epoch": 1009} {"train_loss": -5.639255046844482, "global_step": 42379, "epoch": 1009} {"train_loss": -5.612027168273926, "global_step": 42380, "epoch": 1009} {"train_loss": -5.708954811096191, "global_step": 42381, "epoch": 1009} {"train_loss": -5.732054233551025, "global_step": 42382, "epoch": 1009} {"train_loss": -5.530918121337891, "global_step": 42383, "epoch": 1009} {"train_loss": -5.6935625076293945, "global_step": 42384, "epoch": 1009} {"train_loss": -5.728444576263428, "global_step": 42385, "epoch": 1009} {"train_loss": -5.7255353927612305, "global_step": 42386, "epoch": 1009} {"train_loss": -5.723674774169922, "global_step": 42387, "epoch": 1009} {"train_loss": -5.625837326049805, "global_step": 42388, "epoch": 1009} {"train_loss": -5.613790512084961, "global_step": 42389, "epoch": 1009} {"train_loss": -5.731250762939453, "global_step": 42390, "epoch": 1009} {"train_loss": -5.5710248947143555, "global_step": 42391, "epoch": 1009} {"train_loss": -5.741054058074951, "global_step": 42392, "epoch": 1009} {"train_loss": -5.816433906555176, "global_step": 42393, "epoch": 1009} {"train_loss": -5.723407745361328, "global_step": 42394, "epoch": 1009} {"train_loss": -5.663142204284668, "global_step": 42395, "epoch": 1009} {"train_loss": -5.608528137207031, "global_step": 42396, "epoch": 1009} {"train_loss": -5.6786627769470215, "global_step": 42397, "epoch": 1009} {"train_loss": -5.728833198547363, "global_step": 42398, "epoch": 1009} {"train_loss": -5.800882339477539, "global_step": 42399, "epoch": 1009} {"train_loss": -5.521538257598877, "global_step": 42400, "epoch": 1009} {"train_loss": -5.705788612365723, "global_step": 42401, "epoch": 1009} {"train_loss": -5.64949893951416, "global_step": 42402, "epoch": 1009} {"train_loss": -5.550899505615234, "global_step": 42403, "epoch": 1009} {"train_loss": -5.731567859649658, "global_step": 42404, "epoch": 1009} {"train_loss": -5.713582992553711, "global_step": 42405, "epoch": 1009} {"train_loss": -5.560932159423828, "global_step": 42406, "epoch": 1009} {"train_loss": -5.819260120391846, "global_step": 42407, "epoch": 1009} {"train_loss": -5.647470951080322, "global_step": 42408, "epoch": 1009} {"train_loss": -5.506689071655273, "global_step": 42409, "epoch": 1009} {"train_loss": -5.706910133361816, "global_step": 42410, "epoch": 1009} {"train_loss": -5.5904951095581055, "global_step": 42411, "epoch": 1009} {"train_loss": -5.6604204177856445, "global_step": 42412, "epoch": 1009} {"train_loss": -5.56217098236084, "global_step": 42413, "epoch": 1009} {"train_loss": -5.551968574523926, "global_step": 42414, "epoch": 1009} {"train_loss": -5.686286926269531, "global_step": 42415, "epoch": 1009} {"train_loss": -5.632504463195801, "global_step": 42416, "epoch": 1009} {"train_loss": -5.443342208862305, "global_step": 42417, "epoch": 1009} {"train_loss": -5.728755950927734, "global_step": 42418, "epoch": 1009} {"train_loss": -5.6517073313395185, "global_step": 42419, "epoch": 1009, "val_loss": 61664.5859375} {"train_loss": -5.675608158111572, "global_step": 42420, "epoch": 1010} {"train_loss": -5.635136604309082, "global_step": 42421, "epoch": 1010} {"train_loss": -5.673961639404297, "global_step": 42422, "epoch": 1010} {"train_loss": -5.666799545288086, "global_step": 42423, "epoch": 1010} {"train_loss": -5.65882682800293, "global_step": 42424, "epoch": 1010} {"train_loss": -5.763494968414307, "global_step": 42425, "epoch": 1010} {"train_loss": -5.815227031707764, "global_step": 42426, "epoch": 1010} {"train_loss": -5.643675804138184, "global_step": 42427, "epoch": 1010} {"train_loss": -5.724059581756592, "global_step": 42428, "epoch": 1010} {"train_loss": -5.713915824890137, "global_step": 42429, "epoch": 1010} {"train_loss": -5.5637311935424805, "global_step": 42430, "epoch": 1010} {"train_loss": -5.587963104248047, "global_step": 42431, "epoch": 1010} {"train_loss": -5.773435592651367, "global_step": 42432, "epoch": 1010} {"train_loss": -5.688961029052734, "global_step": 42433, "epoch": 1010} {"train_loss": -5.564708709716797, "global_step": 42434, "epoch": 1010} {"train_loss": -5.712421417236328, "global_step": 42435, "epoch": 1010} {"train_loss": -5.645988464355469, "global_step": 42436, "epoch": 1010} {"train_loss": -5.6717963218688965, "global_step": 42437, "epoch": 1010} {"train_loss": -5.645868301391602, "global_step": 42438, "epoch": 1010} {"train_loss": -5.662707328796387, "global_step": 42439, "epoch": 1010} {"train_loss": -5.617097854614258, "global_step": 42440, "epoch": 1010} {"train_loss": -5.748546123504639, "global_step": 42441, "epoch": 1010} {"train_loss": -5.575796604156494, "global_step": 42442, "epoch": 1010} {"train_loss": -5.635668754577637, "global_step": 42443, "epoch": 1010} {"train_loss": -5.64064884185791, "global_step": 42444, "epoch": 1010} {"train_loss": -5.702258110046387, "global_step": 42445, "epoch": 1010} {"train_loss": -5.711223125457764, "global_step": 42446, "epoch": 1010} {"train_loss": -5.606787204742432, "global_step": 42447, "epoch": 1010} {"train_loss": -5.7531328201293945, "global_step": 42448, "epoch": 1010} {"train_loss": -5.744672775268555, "global_step": 42449, "epoch": 1010} {"train_loss": -5.729982376098633, "global_step": 42450, "epoch": 1010} {"train_loss": -5.612519264221191, "global_step": 42451, "epoch": 1010} {"train_loss": -5.634410381317139, "global_step": 42452, "epoch": 1010} {"train_loss": -5.532442092895508, "global_step": 42453, "epoch": 1010} {"train_loss": -5.608956813812256, "global_step": 42454, "epoch": 1010} {"train_loss": -5.620757102966309, "global_step": 42455, "epoch": 1010} {"train_loss": -5.52207088470459, "global_step": 42456, "epoch": 1010} {"train_loss": -5.49477481842041, "global_step": 42457, "epoch": 1010} {"train_loss": -5.629152297973633, "global_step": 42458, "epoch": 1010} {"train_loss": -5.718692302703857, "global_step": 42459, "epoch": 1010} {"train_loss": -5.675446510314941, "global_step": 42460, "epoch": 1010} {"train_loss": -5.6561806201934814, "global_step": 42461, "epoch": 1010, "val_loss": 61798.2265625} {"train_loss": -5.446695327758789, "global_step": 42462, "epoch": 1011} {"train_loss": -5.604544639587402, "global_step": 42463, "epoch": 1011} {"train_loss": -5.593391418457031, "global_step": 42464, "epoch": 1011} {"train_loss": -5.64857816696167, "global_step": 42465, "epoch": 1011} {"train_loss": -5.598090171813965, "global_step": 42466, "epoch": 1011} {"train_loss": -5.579580307006836, "global_step": 42467, "epoch": 1011} {"train_loss": -5.642302513122559, "global_step": 42468, "epoch": 1011} {"train_loss": -5.66856050491333, "global_step": 42469, "epoch": 1011} {"train_loss": -5.788492202758789, "global_step": 42470, "epoch": 1011} {"train_loss": -5.66972017288208, "global_step": 42471, "epoch": 1011} {"train_loss": -5.63706111907959, "global_step": 42472, "epoch": 1011} {"train_loss": -5.722204208374023, "global_step": 42473, "epoch": 1011} {"train_loss": -5.723669528961182, "global_step": 42474, "epoch": 1011} {"train_loss": -5.649604797363281, "global_step": 42475, "epoch": 1011} {"train_loss": -5.764863967895508, "global_step": 42476, "epoch": 1011} {"train_loss": -5.813863277435303, "global_step": 42477, "epoch": 1011} {"train_loss": -5.607245445251465, "global_step": 42478, "epoch": 1011} {"train_loss": -5.625533580780029, "global_step": 42479, "epoch": 1011} {"train_loss": -5.613467216491699, "global_step": 42480, "epoch": 1011} {"train_loss": -5.792608261108398, "global_step": 42481, "epoch": 1011} {"train_loss": -5.708089828491211, "global_step": 42482, "epoch": 1011} {"train_loss": -5.760315895080566, "global_step": 42483, "epoch": 1011} {"train_loss": -5.830001354217529, "global_step": 42484, "epoch": 1011} {"train_loss": -5.686150550842285, "global_step": 42485, "epoch": 1011} {"train_loss": -5.684967994689941, "global_step": 42486, "epoch": 1011} {"train_loss": -5.739609718322754, "global_step": 42487, "epoch": 1011} {"train_loss": -5.648064613342285, "global_step": 42488, "epoch": 1011} {"train_loss": -5.699470043182373, "global_step": 42489, "epoch": 1011} {"train_loss": -5.643241882324219, "global_step": 42490, "epoch": 1011} {"train_loss": -5.675431728363037, "global_step": 42491, "epoch": 1011} {"train_loss": -5.726409912109375, "global_step": 42492, "epoch": 1011} {"train_loss": -5.676353454589844, "global_step": 42493, "epoch": 1011} {"train_loss": -5.768562316894531, "global_step": 42494, "epoch": 1011} {"train_loss": -5.664023399353027, "global_step": 42495, "epoch": 1011} {"train_loss": -5.548155307769775, "global_step": 42496, "epoch": 1011} {"train_loss": -5.682056903839111, "global_step": 42497, "epoch": 1011} {"train_loss": -5.573248386383057, "global_step": 42498, "epoch": 1011} {"train_loss": -5.68374490737915, "global_step": 42499, "epoch": 1011} {"train_loss": -5.746922492980957, "global_step": 42500, "epoch": 1011} {"train_loss": -5.787042617797852, "global_step": 42501, "epoch": 1011} {"train_loss": -5.661283493041992, "global_step": 42502, "epoch": 1011} {"train_loss": -5.678407850719633, "global_step": 42503, "epoch": 1011, "val_loss": 61430.27734375} {"train_loss": -5.771191596984863, "global_step": 42504, "epoch": 1012} {"train_loss": -5.667329788208008, "global_step": 42505, "epoch": 1012} {"train_loss": -5.751607894897461, "global_step": 42506, "epoch": 1012} {"train_loss": -5.667911052703857, "global_step": 42507, "epoch": 1012} {"train_loss": -5.666747093200684, "global_step": 42508, "epoch": 1012} {"train_loss": -5.713846206665039, "global_step": 42509, "epoch": 1012} {"train_loss": -5.776432514190674, "global_step": 42510, "epoch": 1012} {"train_loss": -5.662297248840332, "global_step": 42511, "epoch": 1012} {"train_loss": -5.742328643798828, "global_step": 42512, "epoch": 1012} {"train_loss": -5.567154884338379, "global_step": 42513, "epoch": 1012} {"train_loss": -5.615828037261963, "global_step": 42514, "epoch": 1012} {"train_loss": -5.764966011047363, "global_step": 42515, "epoch": 1012} {"train_loss": -5.680861473083496, "global_step": 42516, "epoch": 1012} {"train_loss": -5.605952262878418, "global_step": 42517, "epoch": 1012} {"train_loss": -5.783485412597656, "global_step": 42518, "epoch": 1012} {"train_loss": -5.672132968902588, "global_step": 42519, "epoch": 1012} {"train_loss": -5.630911827087402, "global_step": 42520, "epoch": 1012} {"train_loss": -5.551086902618408, "global_step": 42521, "epoch": 1012} {"train_loss": -5.759984493255615, "global_step": 42522, "epoch": 1012} {"train_loss": -5.677326202392578, "global_step": 42523, "epoch": 1012} {"train_loss": -5.46132230758667, "global_step": 42524, "epoch": 1012} {"train_loss": -5.7069783210754395, "global_step": 42525, "epoch": 1012} {"train_loss": -5.77099609375, "global_step": 42526, "epoch": 1012} {"train_loss": -5.5924577713012695, "global_step": 42527, "epoch": 1012} {"train_loss": -5.713370323181152, "global_step": 42528, "epoch": 1012} {"train_loss": -5.551333904266357, "global_step": 42529, "epoch": 1012} {"train_loss": -5.756678104400635, "global_step": 42530, "epoch": 1012} {"train_loss": -5.57963752746582, "global_step": 42531, "epoch": 1012} {"train_loss": -5.779558181762695, "global_step": 42532, "epoch": 1012} {"train_loss": -5.84848690032959, "global_step": 42533, "epoch": 1012} {"train_loss": -5.6430206298828125, "global_step": 42534, "epoch": 1012} {"train_loss": -5.6968183517456055, "global_step": 42535, "epoch": 1012} {"train_loss": -5.750166893005371, "global_step": 42536, "epoch": 1012} {"train_loss": -5.791513919830322, "global_step": 42537, "epoch": 1012} {"train_loss": -5.657052516937256, "global_step": 42538, "epoch": 1012} {"train_loss": -5.47797966003418, "global_step": 42539, "epoch": 1012} {"train_loss": -5.653355598449707, "global_step": 42540, "epoch": 1012} {"train_loss": -5.6857500076293945, "global_step": 42541, "epoch": 1012} {"train_loss": -5.649941921234131, "global_step": 42542, "epoch": 1012} {"train_loss": -5.612282752990723, "global_step": 42543, "epoch": 1012} {"train_loss": -5.559281349182129, "global_step": 42544, "epoch": 1012} {"train_loss": -5.672640164693196, "global_step": 42545, "epoch": 1012, "val_loss": 61641.54296875} {"train_loss": -5.5803141593933105, "global_step": 42546, "epoch": 1013} {"train_loss": -5.707660675048828, "global_step": 42547, "epoch": 1013} {"train_loss": -5.692228317260742, "global_step": 42548, "epoch": 1013} {"train_loss": -5.682759761810303, "global_step": 42549, "epoch": 1013} {"train_loss": -5.698936939239502, "global_step": 42550, "epoch": 1013} {"train_loss": -5.696865081787109, "global_step": 42551, "epoch": 1013} {"train_loss": -5.68605899810791, "global_step": 42552, "epoch": 1013} {"train_loss": -5.646183967590332, "global_step": 42553, "epoch": 1013} {"train_loss": -5.656256675720215, "global_step": 42554, "epoch": 1013} {"train_loss": -5.621443748474121, "global_step": 42555, "epoch": 1013} {"train_loss": -5.701013565063477, "global_step": 42556, "epoch": 1013} {"train_loss": -5.6721014976501465, "global_step": 42557, "epoch": 1013} {"train_loss": -5.671465873718262, "global_step": 42558, "epoch": 1013} {"train_loss": -5.647390365600586, "global_step": 42559, "epoch": 1013} {"train_loss": -5.580426216125488, "global_step": 42560, "epoch": 1013} {"train_loss": -5.620295524597168, "global_step": 42561, "epoch": 1013} {"train_loss": -5.686650276184082, "global_step": 42562, "epoch": 1013} {"train_loss": -5.701016426086426, "global_step": 42563, "epoch": 1013} {"train_loss": -5.726556777954102, "global_step": 42564, "epoch": 1013} {"train_loss": -5.492429733276367, "global_step": 42565, "epoch": 1013} {"train_loss": -5.568704605102539, "global_step": 42566, "epoch": 1013} {"train_loss": -5.667527198791504, "global_step": 42567, "epoch": 1013} {"train_loss": -5.639300346374512, "global_step": 42568, "epoch": 1013} {"train_loss": -5.648900508880615, "global_step": 42569, "epoch": 1013} {"train_loss": -5.639535903930664, "global_step": 42570, "epoch": 1013} {"train_loss": -5.67769718170166, "global_step": 42571, "epoch": 1013} {"train_loss": -5.687238693237305, "global_step": 42572, "epoch": 1013} {"train_loss": -5.650333881378174, "global_step": 42573, "epoch": 1013} {"train_loss": -5.646363258361816, "global_step": 42574, "epoch": 1013} {"train_loss": -5.677484512329102, "global_step": 42575, "epoch": 1013} {"train_loss": -5.488730430603027, "global_step": 42576, "epoch": 1013} {"train_loss": -5.622770309448242, "global_step": 42577, "epoch": 1013} {"train_loss": -5.558173179626465, "global_step": 42578, "epoch": 1013} {"train_loss": -5.586430549621582, "global_step": 42579, "epoch": 1013} {"train_loss": -5.726888656616211, "global_step": 42580, "epoch": 1013} {"train_loss": -5.456279754638672, "global_step": 42581, "epoch": 1013} {"train_loss": -5.635744094848633, "global_step": 42582, "epoch": 1013} {"train_loss": -5.644413948059082, "global_step": 42583, "epoch": 1013} {"train_loss": -5.751391410827637, "global_step": 42584, "epoch": 1013} {"train_loss": -5.678114891052246, "global_step": 42585, "epoch": 1013} {"train_loss": -5.6499247550964355, "global_step": 42586, "epoch": 1013} {"train_loss": -5.644464867455619, "global_step": 42587, "epoch": 1013, "val_loss": 61855.45703125} {"train_loss": -5.817187309265137, "global_step": 42588, "epoch": 1014} {"train_loss": -5.642134666442871, "global_step": 42589, "epoch": 1014} {"train_loss": -5.624307632446289, "global_step": 42590, "epoch": 1014} {"train_loss": -5.6858367919921875, "global_step": 42591, "epoch": 1014} {"train_loss": -5.665311813354492, "global_step": 42592, "epoch": 1014} {"train_loss": -5.65084171295166, "global_step": 42593, "epoch": 1014} {"train_loss": -5.695311546325684, "global_step": 42594, "epoch": 1014} {"train_loss": -5.651385307312012, "global_step": 42595, "epoch": 1014} {"train_loss": -5.688235282897949, "global_step": 42596, "epoch": 1014} {"train_loss": -5.60496187210083, "global_step": 42597, "epoch": 1014} {"train_loss": -5.648129463195801, "global_step": 42598, "epoch": 1014} {"train_loss": -5.702029228210449, "global_step": 42599, "epoch": 1014} {"train_loss": -5.6181535720825195, "global_step": 42600, "epoch": 1014} {"train_loss": -5.636954307556152, "global_step": 42601, "epoch": 1014} {"train_loss": -5.6584367752075195, "global_step": 42602, "epoch": 1014} {"train_loss": -5.51505708694458, "global_step": 42603, "epoch": 1014} {"train_loss": -5.66298246383667, "global_step": 42604, "epoch": 1014} {"train_loss": -5.654249668121338, "global_step": 42605, "epoch": 1014} {"train_loss": -5.749227046966553, "global_step": 42606, "epoch": 1014} {"train_loss": -5.657868385314941, "global_step": 42607, "epoch": 1014} {"train_loss": -5.6729559898376465, "global_step": 42608, "epoch": 1014} {"train_loss": -5.729267120361328, "global_step": 42609, "epoch": 1014} {"train_loss": -5.596263885498047, "global_step": 42610, "epoch": 1014} {"train_loss": -5.71462345123291, "global_step": 42611, "epoch": 1014} {"train_loss": -5.598476409912109, "global_step": 42612, "epoch": 1014} {"train_loss": -5.670960426330566, "global_step": 42613, "epoch": 1014} {"train_loss": -5.554708480834961, "global_step": 42614, "epoch": 1014} {"train_loss": -5.576752185821533, "global_step": 42615, "epoch": 1014} {"train_loss": -5.744612693786621, "global_step": 42616, "epoch": 1014} {"train_loss": -5.709759712219238, "global_step": 42617, "epoch": 1014} {"train_loss": -5.649198055267334, "global_step": 42618, "epoch": 1014} {"train_loss": -5.7022247314453125, "global_step": 42619, "epoch": 1014} {"train_loss": -5.739712715148926, "global_step": 42620, "epoch": 1014} {"train_loss": -5.625649929046631, "global_step": 42621, "epoch": 1014} {"train_loss": -5.594890594482422, "global_step": 42622, "epoch": 1014} {"train_loss": -5.641232490539551, "global_step": 42623, "epoch": 1014} {"train_loss": -5.753171920776367, "global_step": 42624, "epoch": 1014} {"train_loss": -5.612865924835205, "global_step": 42625, "epoch": 1014} {"train_loss": -5.758255958557129, "global_step": 42626, "epoch": 1014} {"train_loss": -5.7024078369140625, "global_step": 42627, "epoch": 1014} {"train_loss": -5.630608558654785, "global_step": 42628, "epoch": 1014} {"train_loss": -5.663690794081915, "global_step": 42629, "epoch": 1014, "val_loss": 61840.4765625} {"train_loss": -5.590300559997559, "global_step": 42630, "epoch": 1015} {"train_loss": -5.729412078857422, "global_step": 42631, "epoch": 1015} {"train_loss": -5.534508228302002, "global_step": 42632, "epoch": 1015} {"train_loss": -5.59943962097168, "global_step": 42633, "epoch": 1015} {"train_loss": -5.744729042053223, "global_step": 42634, "epoch": 1015} {"train_loss": -5.649977684020996, "global_step": 42635, "epoch": 1015} {"train_loss": -5.717031478881836, "global_step": 42636, "epoch": 1015} {"train_loss": -5.656965255737305, "global_step": 42637, "epoch": 1015} {"train_loss": -5.642301559448242, "global_step": 42638, "epoch": 1015} {"train_loss": -5.686509132385254, "global_step": 42639, "epoch": 1015} {"train_loss": -5.615642547607422, "global_step": 42640, "epoch": 1015} {"train_loss": -5.5565266609191895, "global_step": 42641, "epoch": 1015} {"train_loss": -5.685533046722412, "global_step": 42642, "epoch": 1015} {"train_loss": -5.658815383911133, "global_step": 42643, "epoch": 1015} {"train_loss": -5.739916801452637, "global_step": 42644, "epoch": 1015} {"train_loss": -5.707742691040039, "global_step": 42645, "epoch": 1015} {"train_loss": -5.716009140014648, "global_step": 42646, "epoch": 1015} {"train_loss": -5.664029121398926, "global_step": 42647, "epoch": 1015} {"train_loss": -5.615200519561768, "global_step": 42648, "epoch": 1015} {"train_loss": -5.649595260620117, "global_step": 42649, "epoch": 1015} {"train_loss": -5.813654899597168, "global_step": 42650, "epoch": 1015} {"train_loss": -5.6863203048706055, "global_step": 42651, "epoch": 1015} {"train_loss": -5.6697235107421875, "global_step": 42652, "epoch": 1015} {"train_loss": -5.7341108322143555, "global_step": 42653, "epoch": 1015} {"train_loss": -5.537901878356934, "global_step": 42654, "epoch": 1015} {"train_loss": -5.69857120513916, "global_step": 42655, "epoch": 1015} {"train_loss": -5.713381290435791, "global_step": 42656, "epoch": 1015} {"train_loss": -5.784754753112793, "global_step": 42657, "epoch": 1015} {"train_loss": -5.626792907714844, "global_step": 42658, "epoch": 1015} {"train_loss": -5.6933417320251465, "global_step": 42659, "epoch": 1015} {"train_loss": -5.67595911026001, "global_step": 42660, "epoch": 1015} {"train_loss": -5.623084545135498, "global_step": 42661, "epoch": 1015} {"train_loss": -5.803587436676025, "global_step": 42662, "epoch": 1015} {"train_loss": -5.7291717529296875, "global_step": 42663, "epoch": 1015} {"train_loss": -5.747073173522949, "global_step": 42664, "epoch": 1015} {"train_loss": -5.609323501586914, "global_step": 42665, "epoch": 1015} {"train_loss": -5.533293724060059, "global_step": 42666, "epoch": 1015} {"train_loss": -5.659221649169922, "global_step": 42667, "epoch": 1015} {"train_loss": -5.610236167907715, "global_step": 42668, "epoch": 1015} {"train_loss": -5.6703596115112305, "global_step": 42669, "epoch": 1015} {"train_loss": -5.666975975036621, "global_step": 42670, "epoch": 1015} {"train_loss": -5.671637296676636, "global_step": 42671, "epoch": 1015, "val_loss": 61824.1640625} {"train_loss": -5.5494842529296875, "global_step": 42672, "epoch": 1016} {"train_loss": -5.66401481628418, "global_step": 42673, "epoch": 1016} {"train_loss": -5.662306785583496, "global_step": 42674, "epoch": 1016} {"train_loss": -5.6547465324401855, "global_step": 42675, "epoch": 1016} {"train_loss": -5.797133445739746, "global_step": 42676, "epoch": 1016} {"train_loss": -5.653957366943359, "global_step": 42677, "epoch": 1016} {"train_loss": -5.4603681564331055, "global_step": 42678, "epoch": 1016} {"train_loss": -5.712342262268066, "global_step": 42679, "epoch": 1016} {"train_loss": -5.636105537414551, "global_step": 42680, "epoch": 1016} {"train_loss": -5.411890983581543, "global_step": 42681, "epoch": 1016} {"train_loss": -5.575769424438477, "global_step": 42682, "epoch": 1016} {"train_loss": -5.429132461547852, "global_step": 42683, "epoch": 1016} {"train_loss": -5.516009330749512, "global_step": 42684, "epoch": 1016} {"train_loss": -5.587803840637207, "global_step": 42685, "epoch": 1016} {"train_loss": -5.4522223472595215, "global_step": 42686, "epoch": 1016} {"train_loss": -5.637411594390869, "global_step": 42687, "epoch": 1016} {"train_loss": -5.443509101867676, "global_step": 42688, "epoch": 1016} {"train_loss": -5.623531818389893, "global_step": 42689, "epoch": 1016} {"train_loss": -5.465033531188965, "global_step": 42690, "epoch": 1016} {"train_loss": -5.759652137756348, "global_step": 42691, "epoch": 1016} {"train_loss": -5.523347854614258, "global_step": 42692, "epoch": 1016} {"train_loss": -5.686773300170898, "global_step": 42693, "epoch": 1016} {"train_loss": -5.485840320587158, "global_step": 42694, "epoch": 1016} {"train_loss": -5.5134148597717285, "global_step": 42695, "epoch": 1016} {"train_loss": -5.615931034088135, "global_step": 42696, "epoch": 1016} {"train_loss": -5.591762542724609, "global_step": 42697, "epoch": 1016} {"train_loss": -5.493683815002441, "global_step": 42698, "epoch": 1016} {"train_loss": -5.507118225097656, "global_step": 42699, "epoch": 1016} {"train_loss": -5.690670967102051, "global_step": 42700, "epoch": 1016} {"train_loss": -5.563302993774414, "global_step": 42701, "epoch": 1016} {"train_loss": -5.579397201538086, "global_step": 42702, "epoch": 1016} {"train_loss": -5.6130523681640625, "global_step": 42703, "epoch": 1016} {"train_loss": -5.612483024597168, "global_step": 42704, "epoch": 1016} {"train_loss": -5.633627414703369, "global_step": 42705, "epoch": 1016} {"train_loss": -5.735467433929443, "global_step": 42706, "epoch": 1016} {"train_loss": -5.6358418464660645, "global_step": 42707, "epoch": 1016} {"train_loss": -5.56645393371582, "global_step": 42708, "epoch": 1016} {"train_loss": -5.517711639404297, "global_step": 42709, "epoch": 1016} {"train_loss": -5.667288780212402, "global_step": 42710, "epoch": 1016} {"train_loss": -5.591982841491699, "global_step": 42711, "epoch": 1016} {"train_loss": -5.615774631500244, "global_step": 42712, "epoch": 1016} {"train_loss": -5.5884398846399215, "global_step": 42713, "epoch": 1016, "val_loss": 61970.140625} {"train_loss": -5.688693046569824, "global_step": 42714, "epoch": 1017} {"train_loss": -5.700256824493408, "global_step": 42715, "epoch": 1017} {"train_loss": -5.658679962158203, "global_step": 42716, "epoch": 1017} {"train_loss": -5.6699018478393555, "global_step": 42717, "epoch": 1017} {"train_loss": -5.725376129150391, "global_step": 42718, "epoch": 1017} {"train_loss": -5.773189067840576, "global_step": 42719, "epoch": 1017} {"train_loss": -5.631908893585205, "global_step": 42720, "epoch": 1017} {"train_loss": -5.50042200088501, "global_step": 42721, "epoch": 1017} {"train_loss": -5.715042591094971, "global_step": 42722, "epoch": 1017} {"train_loss": -5.59564208984375, "global_step": 42723, "epoch": 1017} {"train_loss": -5.759676933288574, "global_step": 42724, "epoch": 1017} {"train_loss": -5.584625244140625, "global_step": 42725, "epoch": 1017} {"train_loss": -5.568713188171387, "global_step": 42726, "epoch": 1017} {"train_loss": -5.624904155731201, "global_step": 42727, "epoch": 1017} {"train_loss": -5.7466278076171875, "global_step": 42728, "epoch": 1017} {"train_loss": -5.616803169250488, "global_step": 42729, "epoch": 1017} {"train_loss": -5.649798393249512, "global_step": 42730, "epoch": 1017} {"train_loss": -5.674415588378906, "global_step": 42731, "epoch": 1017} {"train_loss": -5.604470729827881, "global_step": 42732, "epoch": 1017} {"train_loss": -5.749469757080078, "global_step": 42733, "epoch": 1017} {"train_loss": -5.722944736480713, "global_step": 42734, "epoch": 1017} {"train_loss": -5.676466464996338, "global_step": 42735, "epoch": 1017} {"train_loss": -5.690629959106445, "global_step": 42736, "epoch": 1017} {"train_loss": -5.806704521179199, "global_step": 42737, "epoch": 1017} {"train_loss": -5.614535331726074, "global_step": 42738, "epoch": 1017} {"train_loss": -5.61000919342041, "global_step": 42739, "epoch": 1017} {"train_loss": -5.727607727050781, "global_step": 42740, "epoch": 1017} {"train_loss": -5.757751941680908, "global_step": 42741, "epoch": 1017} {"train_loss": -5.626354217529297, "global_step": 42742, "epoch": 1017} {"train_loss": -5.588937282562256, "global_step": 42743, "epoch": 1017} {"train_loss": -5.706419944763184, "global_step": 42744, "epoch": 1017} {"train_loss": -5.734386920928955, "global_step": 42745, "epoch": 1017} {"train_loss": -5.5382232666015625, "global_step": 42746, "epoch": 1017} {"train_loss": -5.835207939147949, "global_step": 42747, "epoch": 1017} {"train_loss": -5.646111011505127, "global_step": 42748, "epoch": 1017} {"train_loss": -5.624971389770508, "global_step": 42749, "epoch": 1017} {"train_loss": -5.721858501434326, "global_step": 42750, "epoch": 1017} {"train_loss": -5.678439617156982, "global_step": 42751, "epoch": 1017} {"train_loss": -5.666357040405273, "global_step": 42752, "epoch": 1017} {"train_loss": -5.715911865234375, "global_step": 42753, "epoch": 1017} {"train_loss": -5.694470405578613, "global_step": 42754, "epoch": 1017} {"train_loss": -5.674763497852144, "global_step": 42755, "epoch": 1017, "val_loss": 61576.4296875} {"train_loss": -5.681365489959717, "global_step": 42756, "epoch": 1018} {"train_loss": -5.655835151672363, "global_step": 42757, "epoch": 1018} {"train_loss": -5.620426177978516, "global_step": 42758, "epoch": 1018} {"train_loss": -5.688900947570801, "global_step": 42759, "epoch": 1018} {"train_loss": -5.680630207061768, "global_step": 42760, "epoch": 1018} {"train_loss": -5.750220775604248, "global_step": 42761, "epoch": 1018} {"train_loss": -5.678396701812744, "global_step": 42762, "epoch": 1018} {"train_loss": -5.530820846557617, "global_step": 42763, "epoch": 1018} {"train_loss": -5.733672618865967, "global_step": 42764, "epoch": 1018} {"train_loss": -5.623570919036865, "global_step": 42765, "epoch": 1018} {"train_loss": -5.633745193481445, "global_step": 42766, "epoch": 1018} {"train_loss": -5.711796760559082, "global_step": 42767, "epoch": 1018} {"train_loss": -5.589228630065918, "global_step": 42768, "epoch": 1018} {"train_loss": -5.67987585067749, "global_step": 42769, "epoch": 1018} {"train_loss": -5.779296875, "global_step": 42770, "epoch": 1018} {"train_loss": -5.754921913146973, "global_step": 42771, "epoch": 1018} {"train_loss": -5.687803268432617, "global_step": 42772, "epoch": 1018} {"train_loss": -5.6283159255981445, "global_step": 42773, "epoch": 1018} {"train_loss": -5.6682233810424805, "global_step": 42774, "epoch": 1018} {"train_loss": -5.711785316467285, "global_step": 42775, "epoch": 1018} {"train_loss": -5.624767303466797, "global_step": 42776, "epoch": 1018} {"train_loss": -5.717280864715576, "global_step": 42777, "epoch": 1018} {"train_loss": -5.666691780090332, "global_step": 42778, "epoch": 1018} {"train_loss": -5.677846908569336, "global_step": 42779, "epoch": 1018} {"train_loss": -5.64083194732666, "global_step": 42780, "epoch": 1018} {"train_loss": -5.559401035308838, "global_step": 42781, "epoch": 1018} {"train_loss": -5.63037109375, "global_step": 42782, "epoch": 1018} {"train_loss": -5.841958045959473, "global_step": 42783, "epoch": 1018} {"train_loss": -5.661190509796143, "global_step": 42784, "epoch": 1018} {"train_loss": -5.798313140869141, "global_step": 42785, "epoch": 1018} {"train_loss": -5.778069496154785, "global_step": 42786, "epoch": 1018} {"train_loss": -5.840709686279297, "global_step": 42787, "epoch": 1018} {"train_loss": -5.673799514770508, "global_step": 42788, "epoch": 1018} {"train_loss": -5.777624130249023, "global_step": 42789, "epoch": 1018} {"train_loss": -5.6829328536987305, "global_step": 42790, "epoch": 1018} {"train_loss": -5.731535911560059, "global_step": 42791, "epoch": 1018} {"train_loss": -5.7539238929748535, "global_step": 42792, "epoch": 1018} {"train_loss": -5.719405174255371, "global_step": 42793, "epoch": 1018} {"train_loss": -5.740920066833496, "global_step": 42794, "epoch": 1018} {"train_loss": -5.665445804595947, "global_step": 42795, "epoch": 1018} {"train_loss": -5.626558780670166, "global_step": 42796, "epoch": 1018} {"train_loss": -5.694102889015561, "global_step": 42797, "epoch": 1018, "val_loss": 61822.81640625} {"train_loss": -5.6437273025512695, "global_step": 42798, "epoch": 1019} {"train_loss": -5.64940071105957, "global_step": 42799, "epoch": 1019} {"train_loss": -5.716777324676514, "global_step": 42800, "epoch": 1019} {"train_loss": -5.622442722320557, "global_step": 42801, "epoch": 1019} {"train_loss": -5.5678935050964355, "global_step": 42802, "epoch": 1019} {"train_loss": -5.762111663818359, "global_step": 42803, "epoch": 1019} {"train_loss": -5.626133918762207, "global_step": 42804, "epoch": 1019} {"train_loss": -5.652735710144043, "global_step": 42805, "epoch": 1019} {"train_loss": -5.625505447387695, "global_step": 42806, "epoch": 1019} {"train_loss": -5.721258163452148, "global_step": 42807, "epoch": 1019} {"train_loss": -5.747076511383057, "global_step": 42808, "epoch": 1019} {"train_loss": -5.749743461608887, "global_step": 42809, "epoch": 1019} {"train_loss": -5.612051010131836, "global_step": 42810, "epoch": 1019} {"train_loss": -5.784302234649658, "global_step": 42811, "epoch": 1019} {"train_loss": -5.602535724639893, "global_step": 42812, "epoch": 1019} {"train_loss": -5.549551486968994, "global_step": 42813, "epoch": 1019} {"train_loss": -5.628532409667969, "global_step": 42814, "epoch": 1019} {"train_loss": -5.592583656311035, "global_step": 42815, "epoch": 1019} {"train_loss": -5.653859615325928, "global_step": 42816, "epoch": 1019} {"train_loss": -5.664233684539795, "global_step": 42817, "epoch": 1019} {"train_loss": -5.617241382598877, "global_step": 42818, "epoch": 1019} {"train_loss": -5.76656436920166, "global_step": 42819, "epoch": 1019} {"train_loss": -5.635066986083984, "global_step": 42820, "epoch": 1019} {"train_loss": -5.665959358215332, "global_step": 42821, "epoch": 1019} {"train_loss": -5.714361667633057, "global_step": 42822, "epoch": 1019} {"train_loss": -5.617805004119873, "global_step": 42823, "epoch": 1019} {"train_loss": -5.746628761291504, "global_step": 42824, "epoch": 1019} {"train_loss": -5.702264785766602, "global_step": 42825, "epoch": 1019} {"train_loss": -5.580779075622559, "global_step": 42826, "epoch": 1019} {"train_loss": -5.589626312255859, "global_step": 42827, "epoch": 1019} {"train_loss": -5.717245101928711, "global_step": 42828, "epoch": 1019} {"train_loss": -5.591647148132324, "global_step": 42829, "epoch": 1019} {"train_loss": -5.7544169425964355, "global_step": 42830, "epoch": 1019} {"train_loss": -5.6308512687683105, "global_step": 42831, "epoch": 1019} {"train_loss": -5.64786958694458, "global_step": 42832, "epoch": 1019} {"train_loss": -5.5643744468688965, "global_step": 42833, "epoch": 1019} {"train_loss": -5.630717754364014, "global_step": 42834, "epoch": 1019} {"train_loss": -5.59127140045166, "global_step": 42835, "epoch": 1019} {"train_loss": -5.763860702514648, "global_step": 42836, "epoch": 1019} {"train_loss": -5.6820878982543945, "global_step": 42837, "epoch": 1019} {"train_loss": -5.643309116363525, "global_step": 42838, "epoch": 1019} {"train_loss": -5.657738560721988, "global_step": 42839, "epoch": 1019, "val_loss": 62042.2109375} {"train_loss": -5.708017349243164, "global_step": 42840, "epoch": 1020} {"train_loss": -5.666947364807129, "global_step": 42841, "epoch": 1020} {"train_loss": -5.614602565765381, "global_step": 42842, "epoch": 1020} {"train_loss": -5.669167995452881, "global_step": 42843, "epoch": 1020} {"train_loss": -5.624545097351074, "global_step": 42844, "epoch": 1020} {"train_loss": -5.540693759918213, "global_step": 42845, "epoch": 1020} {"train_loss": -5.750518798828125, "global_step": 42846, "epoch": 1020} {"train_loss": -5.699313163757324, "global_step": 42847, "epoch": 1020} {"train_loss": -5.7710113525390625, "global_step": 42848, "epoch": 1020} {"train_loss": -5.658255577087402, "global_step": 42849, "epoch": 1020} {"train_loss": -5.577030181884766, "global_step": 42850, "epoch": 1020} {"train_loss": -5.690694808959961, "global_step": 42851, "epoch": 1020} {"train_loss": -5.4070024490356445, "global_step": 42852, "epoch": 1020} {"train_loss": -5.459778308868408, "global_step": 42853, "epoch": 1020} {"train_loss": -5.4628753662109375, "global_step": 42854, "epoch": 1020} {"train_loss": -5.334668159484863, "global_step": 42855, "epoch": 1020} {"train_loss": -5.661986351013184, "global_step": 42856, "epoch": 1020} {"train_loss": -5.628259658813477, "global_step": 42857, "epoch": 1020} {"train_loss": -5.609602451324463, "global_step": 42858, "epoch": 1020} {"train_loss": -5.452254295349121, "global_step": 42859, "epoch": 1020} {"train_loss": -5.594932556152344, "global_step": 42860, "epoch": 1020} {"train_loss": -5.499604225158691, "global_step": 42861, "epoch": 1020} {"train_loss": -5.624327182769775, "global_step": 42862, "epoch": 1020} {"train_loss": -5.653470039367676, "global_step": 42863, "epoch": 1020} {"train_loss": -5.687251567840576, "global_step": 42864, "epoch": 1020} {"train_loss": -5.629631042480469, "global_step": 42865, "epoch": 1020} {"train_loss": -5.653104305267334, "global_step": 42866, "epoch": 1020} {"train_loss": -5.657163619995117, "global_step": 42867, "epoch": 1020} {"train_loss": -5.747994422912598, "global_step": 42868, "epoch": 1020} {"train_loss": -5.570376396179199, "global_step": 42869, "epoch": 1020} {"train_loss": -5.623435020446777, "global_step": 42870, "epoch": 1020} {"train_loss": -5.684826374053955, "global_step": 42871, "epoch": 1020} {"train_loss": -5.683343887329102, "global_step": 42872, "epoch": 1020} {"train_loss": -5.626401901245117, "global_step": 42873, "epoch": 1020} {"train_loss": -5.603933811187744, "global_step": 42874, "epoch": 1020} {"train_loss": -5.636805057525635, "global_step": 42875, "epoch": 1020} {"train_loss": -5.6363019943237305, "global_step": 42876, "epoch": 1020} {"train_loss": -5.721009731292725, "global_step": 42877, "epoch": 1020} {"train_loss": -5.745593070983887, "global_step": 42878, "epoch": 1020} {"train_loss": -5.713903903961182, "global_step": 42879, "epoch": 1020} {"train_loss": -5.601917743682861, "global_step": 42880, "epoch": 1020} {"train_loss": -5.621969086783273, "global_step": 42881, "epoch": 1020, "val_loss": 61907.5} {"train_loss": -5.572317123413086, "global_step": 42882, "epoch": 1021} {"train_loss": -5.6986985206604, "global_step": 42883, "epoch": 1021} {"train_loss": -5.792771339416504, "global_step": 42884, "epoch": 1021} {"train_loss": -5.72189474105835, "global_step": 42885, "epoch": 1021} {"train_loss": -5.665717124938965, "global_step": 42886, "epoch": 1021} {"train_loss": -5.766997814178467, "global_step": 42887, "epoch": 1021} {"train_loss": -5.712812423706055, "global_step": 42888, "epoch": 1021} {"train_loss": -5.651023864746094, "global_step": 42889, "epoch": 1021} {"train_loss": -5.6037116050720215, "global_step": 42890, "epoch": 1021} {"train_loss": -5.715428352355957, "global_step": 42891, "epoch": 1021} {"train_loss": -5.644139289855957, "global_step": 42892, "epoch": 1021} {"train_loss": -5.7880167961120605, "global_step": 42893, "epoch": 1021} {"train_loss": -5.794881820678711, "global_step": 42894, "epoch": 1021} {"train_loss": -5.748960494995117, "global_step": 42895, "epoch": 1021} {"train_loss": -5.59532356262207, "global_step": 42896, "epoch": 1021} {"train_loss": -5.625897407531738, "global_step": 42897, "epoch": 1021} {"train_loss": -5.61009407043457, "global_step": 42898, "epoch": 1021} {"train_loss": -5.739996433258057, "global_step": 42899, "epoch": 1021} {"train_loss": -5.596182823181152, "global_step": 42900, "epoch": 1021} {"train_loss": -5.615285873413086, "global_step": 42901, "epoch": 1021} {"train_loss": -5.665942668914795, "global_step": 42902, "epoch": 1021} {"train_loss": -5.569577217102051, "global_step": 42903, "epoch": 1021} {"train_loss": -5.6508097648620605, "global_step": 42904, "epoch": 1021} {"train_loss": -5.502999305725098, "global_step": 42905, "epoch": 1021} {"train_loss": -5.629022598266602, "global_step": 42906, "epoch": 1021} {"train_loss": -5.562295913696289, "global_step": 42907, "epoch": 1021} {"train_loss": -5.545010089874268, "global_step": 42908, "epoch": 1021} {"train_loss": -5.686884880065918, "global_step": 42909, "epoch": 1021} {"train_loss": -5.606078147888184, "global_step": 42910, "epoch": 1021} {"train_loss": -5.709369659423828, "global_step": 42911, "epoch": 1021} {"train_loss": -5.728178977966309, "global_step": 42912, "epoch": 1021} {"train_loss": -5.618257522583008, "global_step": 42913, "epoch": 1021} {"train_loss": -5.651511192321777, "global_step": 42914, "epoch": 1021} {"train_loss": -5.611558437347412, "global_step": 42915, "epoch": 1021} {"train_loss": -5.568513870239258, "global_step": 42916, "epoch": 1021} {"train_loss": -5.661226749420166, "global_step": 42917, "epoch": 1021} {"train_loss": -5.54047966003418, "global_step": 42918, "epoch": 1021} {"train_loss": -5.686064720153809, "global_step": 42919, "epoch": 1021} {"train_loss": -5.633472919464111, "global_step": 42920, "epoch": 1021} {"train_loss": -5.6953125, "global_step": 42921, "epoch": 1021} {"train_loss": -5.7881388664245605, "global_step": 42922, "epoch": 1021} {"train_loss": -5.657017072041829, "global_step": 42923, "epoch": 1021, "val_loss": 61337.2734375} {"train_loss": -5.848340034484863, "global_step": 42924, "epoch": 1022} {"train_loss": -5.6442437171936035, "global_step": 42925, "epoch": 1022} {"train_loss": -5.676105976104736, "global_step": 42926, "epoch": 1022} {"train_loss": -5.628944396972656, "global_step": 42927, "epoch": 1022} {"train_loss": -5.618860721588135, "global_step": 42928, "epoch": 1022} {"train_loss": -5.703957557678223, "global_step": 42929, "epoch": 1022} {"train_loss": -5.685143947601318, "global_step": 42930, "epoch": 1022} {"train_loss": -5.747491836547852, "global_step": 42931, "epoch": 1022} {"train_loss": -5.6856689453125, "global_step": 42932, "epoch": 1022} {"train_loss": -5.622331142425537, "global_step": 42933, "epoch": 1022} {"train_loss": -5.670439720153809, "global_step": 42934, "epoch": 1022} {"train_loss": -5.512032985687256, "global_step": 42935, "epoch": 1022} {"train_loss": -5.677263259887695, "global_step": 42936, "epoch": 1022} {"train_loss": -5.644306659698486, "global_step": 42937, "epoch": 1022} {"train_loss": -5.533530235290527, "global_step": 42938, "epoch": 1022} {"train_loss": -5.685665130615234, "global_step": 42939, "epoch": 1022} {"train_loss": -5.665993690490723, "global_step": 42940, "epoch": 1022} {"train_loss": -5.765413761138916, "global_step": 42941, "epoch": 1022} {"train_loss": -5.609539031982422, "global_step": 42942, "epoch": 1022} {"train_loss": -5.574227333068848, "global_step": 42943, "epoch": 1022} {"train_loss": -5.7662177085876465, "global_step": 42944, "epoch": 1022} {"train_loss": -5.570844650268555, "global_step": 42945, "epoch": 1022} {"train_loss": -5.609103202819824, "global_step": 42946, "epoch": 1022} {"train_loss": -5.6533050537109375, "global_step": 42947, "epoch": 1022} {"train_loss": -5.546271324157715, "global_step": 42948, "epoch": 1022} {"train_loss": -5.697605609893799, "global_step": 42949, "epoch": 1022} {"train_loss": -5.616374969482422, "global_step": 42950, "epoch": 1022} {"train_loss": -5.631862640380859, "global_step": 42951, "epoch": 1022} {"train_loss": -5.5480804443359375, "global_step": 42952, "epoch": 1022} {"train_loss": -5.631394863128662, "global_step": 42953, "epoch": 1022} {"train_loss": -5.796389579772949, "global_step": 42954, "epoch": 1022} {"train_loss": -5.574729919433594, "global_step": 42955, "epoch": 1022} {"train_loss": -5.605170249938965, "global_step": 42956, "epoch": 1022} {"train_loss": -5.606847763061523, "global_step": 42957, "epoch": 1022} {"train_loss": -5.488943099975586, "global_step": 42958, "epoch": 1022} {"train_loss": -5.8078389167785645, "global_step": 42959, "epoch": 1022} {"train_loss": -5.723580360412598, "global_step": 42960, "epoch": 1022} {"train_loss": -5.746079444885254, "global_step": 42961, "epoch": 1022} {"train_loss": -5.718650817871094, "global_step": 42962, "epoch": 1022} {"train_loss": -5.649454593658447, "global_step": 42963, "epoch": 1022} {"train_loss": -5.673598766326904, "global_step": 42964, "epoch": 1022} {"train_loss": -5.6559774194444925, "global_step": 42965, "epoch": 1022, "val_loss": 61858.83203125} {"train_loss": -5.77984619140625, "global_step": 42966, "epoch": 1023} {"train_loss": -5.689264297485352, "global_step": 42967, "epoch": 1023} {"train_loss": -5.661301612854004, "global_step": 42968, "epoch": 1023} {"train_loss": -5.66878080368042, "global_step": 42969, "epoch": 1023} {"train_loss": -5.68627405166626, "global_step": 42970, "epoch": 1023} {"train_loss": -5.500038146972656, "global_step": 42971, "epoch": 1023} {"train_loss": -5.718932151794434, "global_step": 42972, "epoch": 1023} {"train_loss": -5.5000224113464355, "global_step": 42973, "epoch": 1023} {"train_loss": -5.68848180770874, "global_step": 42974, "epoch": 1023} {"train_loss": -5.569118499755859, "global_step": 42975, "epoch": 1023} {"train_loss": -5.744728088378906, "global_step": 42976, "epoch": 1023} {"train_loss": -5.772366523742676, "global_step": 42977, "epoch": 1023} {"train_loss": -5.743244171142578, "global_step": 42978, "epoch": 1023} {"train_loss": -5.714550971984863, "global_step": 42979, "epoch": 1023} {"train_loss": -5.6795454025268555, "global_step": 42980, "epoch": 1023} {"train_loss": -5.723529815673828, "global_step": 42981, "epoch": 1023} {"train_loss": -5.731464862823486, "global_step": 42982, "epoch": 1023} {"train_loss": -5.7875075340271, "global_step": 42983, "epoch": 1023} {"train_loss": -5.712134838104248, "global_step": 42984, "epoch": 1023} {"train_loss": -5.730353355407715, "global_step": 42985, "epoch": 1023} {"train_loss": -5.661810874938965, "global_step": 42986, "epoch": 1023} {"train_loss": -5.686709403991699, "global_step": 42987, "epoch": 1023} {"train_loss": -5.634914398193359, "global_step": 42988, "epoch": 1023} {"train_loss": -5.800487995147705, "global_step": 42989, "epoch": 1023} {"train_loss": -5.666611671447754, "global_step": 42990, "epoch": 1023} {"train_loss": -5.674136161804199, "global_step": 42991, "epoch": 1023} {"train_loss": -5.7337846755981445, "global_step": 42992, "epoch": 1023} {"train_loss": -5.713295936584473, "global_step": 42993, "epoch": 1023} {"train_loss": -5.653648376464844, "global_step": 42994, "epoch": 1023} {"train_loss": -5.636770248413086, "global_step": 42995, "epoch": 1023} {"train_loss": -5.682411193847656, "global_step": 42996, "epoch": 1023} {"train_loss": -5.811543941497803, "global_step": 42997, "epoch": 1023} {"train_loss": -5.579304218292236, "global_step": 42998, "epoch": 1023} {"train_loss": -5.531010627746582, "global_step": 42999, "epoch": 1023} {"train_loss": -5.6071624755859375, "global_step": 43000, "epoch": 1023} {"train_loss": -5.797964096069336, "global_step": 43001, "epoch": 1023} {"train_loss": -5.679569244384766, "global_step": 43002, "epoch": 1023} {"train_loss": -5.77341890335083, "global_step": 43003, "epoch": 1023} {"train_loss": -5.6529645919799805, "global_step": 43004, "epoch": 1023} {"train_loss": -5.697414398193359, "global_step": 43005, "epoch": 1023} {"train_loss": -5.592668056488037, "global_step": 43006, "epoch": 1023} {"train_loss": -5.682417018072946, "global_step": 43007, "epoch": 1023, "val_loss": 61484.0859375} {"train_loss": -5.682060718536377, "global_step": 43008, "epoch": 1024} {"train_loss": -5.70886754989624, "global_step": 43009, "epoch": 1024} {"train_loss": -5.5935187339782715, "global_step": 43010, "epoch": 1024} {"train_loss": -5.6741557121276855, "global_step": 43011, "epoch": 1024} {"train_loss": -5.558601379394531, "global_step": 43012, "epoch": 1024} {"train_loss": -5.603026390075684, "global_step": 43013, "epoch": 1024} {"train_loss": -5.730561256408691, "global_step": 43014, "epoch": 1024} {"train_loss": -5.603947639465332, "global_step": 43015, "epoch": 1024} {"train_loss": -5.696549415588379, "global_step": 43016, "epoch": 1024} {"train_loss": -5.610868453979492, "global_step": 43017, "epoch": 1024} {"train_loss": -5.674494743347168, "global_step": 43018, "epoch": 1024} {"train_loss": -5.7953386306762695, "global_step": 43019, "epoch": 1024} {"train_loss": -5.692471504211426, "global_step": 43020, "epoch": 1024} {"train_loss": -5.649208068847656, "global_step": 43021, "epoch": 1024} {"train_loss": -5.75892448425293, "global_step": 43022, "epoch": 1024} {"train_loss": -5.730676651000977, "global_step": 43023, "epoch": 1024} {"train_loss": -5.664926528930664, "global_step": 43024, "epoch": 1024} {"train_loss": -5.7112321853637695, "global_step": 43025, "epoch": 1024} {"train_loss": -5.677529335021973, "global_step": 43026, "epoch": 1024} {"train_loss": -5.70085334777832, "global_step": 43027, "epoch": 1024} {"train_loss": -5.61650276184082, "global_step": 43028, "epoch": 1024} {"train_loss": -5.727225303649902, "global_step": 43029, "epoch": 1024} {"train_loss": -5.619237422943115, "global_step": 43030, "epoch": 1024} {"train_loss": -5.623104095458984, "global_step": 43031, "epoch": 1024} {"train_loss": -5.793241500854492, "global_step": 43032, "epoch": 1024} {"train_loss": -5.6770782470703125, "global_step": 43033, "epoch": 1024} {"train_loss": -5.637225151062012, "global_step": 43034, "epoch": 1024} {"train_loss": -5.558326721191406, "global_step": 43035, "epoch": 1024} {"train_loss": -5.577881813049316, "global_step": 43036, "epoch": 1024} {"train_loss": -5.707736015319824, "global_step": 43037, "epoch": 1024} {"train_loss": -5.586994171142578, "global_step": 43038, "epoch": 1024} {"train_loss": -5.675057411193848, "global_step": 43039, "epoch": 1024} {"train_loss": -5.549057960510254, "global_step": 43040, "epoch": 1024} {"train_loss": -5.7778496742248535, "global_step": 43041, "epoch": 1024} {"train_loss": -5.795845031738281, "global_step": 43042, "epoch": 1024} {"train_loss": -5.6534624099731445, "global_step": 43043, "epoch": 1024} {"train_loss": -5.6205291748046875, "global_step": 43044, "epoch": 1024} {"train_loss": -5.676754474639893, "global_step": 43045, "epoch": 1024} {"train_loss": -5.705829620361328, "global_step": 43046, "epoch": 1024} {"train_loss": -5.582493782043457, "global_step": 43047, "epoch": 1024} {"train_loss": -5.610544204711914, "global_step": 43048, "epoch": 1024} {"train_loss": -5.666274206978934, "global_step": 43049, "epoch": 1024, "val_loss": 61930.36328125} {"train_loss": -5.6330952644348145, "global_step": 43050, "epoch": 1025} {"train_loss": -5.5782880783081055, "global_step": 43051, "epoch": 1025} {"train_loss": -5.797162055969238, "global_step": 43052, "epoch": 1025} {"train_loss": -5.586235046386719, "global_step": 43053, "epoch": 1025} {"train_loss": -5.6377692222595215, "global_step": 43054, "epoch": 1025} {"train_loss": -5.803055763244629, "global_step": 43055, "epoch": 1025} {"train_loss": -5.813519477844238, "global_step": 43056, "epoch": 1025} {"train_loss": -5.810664176940918, "global_step": 43057, "epoch": 1025} {"train_loss": -5.697063446044922, "global_step": 43058, "epoch": 1025} {"train_loss": -5.6863274574279785, "global_step": 43059, "epoch": 1025} {"train_loss": -5.617789268493652, "global_step": 43060, "epoch": 1025} {"train_loss": -5.803867340087891, "global_step": 43061, "epoch": 1025} {"train_loss": -5.830625057220459, "global_step": 43062, "epoch": 1025} {"train_loss": -5.770623207092285, "global_step": 43063, "epoch": 1025} {"train_loss": -5.748348236083984, "global_step": 43064, "epoch": 1025} {"train_loss": -5.766312599182129, "global_step": 43065, "epoch": 1025} {"train_loss": -5.744822978973389, "global_step": 43066, "epoch": 1025} {"train_loss": -5.623117446899414, "global_step": 43067, "epoch": 1025} {"train_loss": -5.707005500793457, "global_step": 43068, "epoch": 1025} {"train_loss": -5.733147621154785, "global_step": 43069, "epoch": 1025} {"train_loss": -5.723077297210693, "global_step": 43070, "epoch": 1025} {"train_loss": -5.680829048156738, "global_step": 43071, "epoch": 1025} {"train_loss": -5.741787433624268, "global_step": 43072, "epoch": 1025} {"train_loss": -5.654208183288574, "global_step": 43073, "epoch": 1025} {"train_loss": -5.682838439941406, "global_step": 43074, "epoch": 1025} {"train_loss": -5.65162467956543, "global_step": 43075, "epoch": 1025} {"train_loss": -5.626820087432861, "global_step": 43076, "epoch": 1025} {"train_loss": -5.666034698486328, "global_step": 43077, "epoch": 1025} {"train_loss": -5.794069766998291, "global_step": 43078, "epoch": 1025} {"train_loss": -5.713184833526611, "global_step": 43079, "epoch": 1025} {"train_loss": -5.685523509979248, "global_step": 43080, "epoch": 1025} {"train_loss": -5.554431915283203, "global_step": 43081, "epoch": 1025} {"train_loss": -5.635831832885742, "global_step": 43082, "epoch": 1025} {"train_loss": -5.717971324920654, "global_step": 43083, "epoch": 1025} {"train_loss": -5.668540000915527, "global_step": 43084, "epoch": 1025} {"train_loss": -5.726587295532227, "global_step": 43085, "epoch": 1025} {"train_loss": -5.744584083557129, "global_step": 43086, "epoch": 1025} {"train_loss": -5.648291110992432, "global_step": 43087, "epoch": 1025} {"train_loss": -5.725375652313232, "global_step": 43088, "epoch": 1025} {"train_loss": -5.781414031982422, "global_step": 43089, "epoch": 1025} {"train_loss": -5.578388214111328, "global_step": 43090, "epoch": 1025} {"train_loss": -5.700249944414411, "global_step": 43091, "epoch": 1025, "val_loss": 61461.1875} {"train_loss": -5.61298942565918, "global_step": 43092, "epoch": 1026} {"train_loss": -5.738841533660889, "global_step": 43093, "epoch": 1026} {"train_loss": -5.809787750244141, "global_step": 43094, "epoch": 1026} {"train_loss": -5.556157112121582, "global_step": 43095, "epoch": 1026} {"train_loss": -5.5804667472839355, "global_step": 43096, "epoch": 1026} {"train_loss": -5.599318504333496, "global_step": 43097, "epoch": 1026} {"train_loss": -5.675018310546875, "global_step": 43098, "epoch": 1026} {"train_loss": -5.558295249938965, "global_step": 43099, "epoch": 1026} {"train_loss": -5.534521102905273, "global_step": 43100, "epoch": 1026} {"train_loss": -5.550415992736816, "global_step": 43101, "epoch": 1026} {"train_loss": -5.6687846183776855, "global_step": 43102, "epoch": 1026} {"train_loss": -5.57440185546875, "global_step": 43103, "epoch": 1026} {"train_loss": -5.688690662384033, "global_step": 43104, "epoch": 1026} {"train_loss": -5.775047302246094, "global_step": 43105, "epoch": 1026} {"train_loss": -5.689388275146484, "global_step": 43106, "epoch": 1026} {"train_loss": -5.776267051696777, "global_step": 43107, "epoch": 1026} {"train_loss": -5.658363342285156, "global_step": 43108, "epoch": 1026} {"train_loss": -5.684337139129639, "global_step": 43109, "epoch": 1026} {"train_loss": -5.633775234222412, "global_step": 43110, "epoch": 1026} {"train_loss": -5.726850509643555, "global_step": 43111, "epoch": 1026} {"train_loss": -5.725712299346924, "global_step": 43112, "epoch": 1026} {"train_loss": -5.729203701019287, "global_step": 43113, "epoch": 1026} {"train_loss": -5.800832748413086, "global_step": 43114, "epoch": 1026} {"train_loss": -5.751407146453857, "global_step": 43115, "epoch": 1026} {"train_loss": -5.669408321380615, "global_step": 43116, "epoch": 1026} {"train_loss": -5.731276512145996, "global_step": 43117, "epoch": 1026} {"train_loss": -5.710195541381836, "global_step": 43118, "epoch": 1026} {"train_loss": -5.800324440002441, "global_step": 43119, "epoch": 1026} {"train_loss": -5.757516860961914, "global_step": 43120, "epoch": 1026} {"train_loss": -5.679120063781738, "global_step": 43121, "epoch": 1026} {"train_loss": -5.740099906921387, "global_step": 43122, "epoch": 1026} {"train_loss": -5.749700546264648, "global_step": 43123, "epoch": 1026} {"train_loss": -5.768105506896973, "global_step": 43124, "epoch": 1026} {"train_loss": -5.706099510192871, "global_step": 43125, "epoch": 1026} {"train_loss": -5.7779340744018555, "global_step": 43126, "epoch": 1026} {"train_loss": -5.684935569763184, "global_step": 43127, "epoch": 1026} {"train_loss": -5.753311634063721, "global_step": 43128, "epoch": 1026} {"train_loss": -5.725847244262695, "global_step": 43129, "epoch": 1026} {"train_loss": -5.614189147949219, "global_step": 43130, "epoch": 1026} {"train_loss": -5.624126434326172, "global_step": 43131, "epoch": 1026} {"train_loss": -5.521434783935547, "global_step": 43132, "epoch": 1026} {"train_loss": -5.683781623840332, "global_step": 43133, "epoch": 1026, "val_loss": 61554.19921875} {"train_loss": -5.616460800170898, "global_step": 43134, "epoch": 1027} {"train_loss": -5.667942047119141, "global_step": 43135, "epoch": 1027} {"train_loss": -5.705438613891602, "global_step": 43136, "epoch": 1027} {"train_loss": -5.621511459350586, "global_step": 43137, "epoch": 1027} {"train_loss": -5.701361656188965, "global_step": 43138, "epoch": 1027} {"train_loss": -5.640954971313477, "global_step": 43139, "epoch": 1027} {"train_loss": -5.675143718719482, "global_step": 43140, "epoch": 1027} {"train_loss": -5.731629371643066, "global_step": 43141, "epoch": 1027} {"train_loss": -5.647804260253906, "global_step": 43142, "epoch": 1027} {"train_loss": -5.790442943572998, "global_step": 43143, "epoch": 1027} {"train_loss": -5.665859222412109, "global_step": 43144, "epoch": 1027} {"train_loss": -5.702521324157715, "global_step": 43145, "epoch": 1027} {"train_loss": -5.629744529724121, "global_step": 43146, "epoch": 1027} {"train_loss": -5.6399946212768555, "global_step": 43147, "epoch": 1027} {"train_loss": -5.726723670959473, "global_step": 43148, "epoch": 1027} {"train_loss": -5.592918872833252, "global_step": 43149, "epoch": 1027} {"train_loss": -5.692314147949219, "global_step": 43150, "epoch": 1027} {"train_loss": -5.566376209259033, "global_step": 43151, "epoch": 1027} {"train_loss": -5.780461311340332, "global_step": 43152, "epoch": 1027} {"train_loss": -5.718784332275391, "global_step": 43153, "epoch": 1027} {"train_loss": -5.636244773864746, "global_step": 43154, "epoch": 1027} {"train_loss": -5.756270885467529, "global_step": 43155, "epoch": 1027} {"train_loss": -5.748443603515625, "global_step": 43156, "epoch": 1027} {"train_loss": -5.703577995300293, "global_step": 43157, "epoch": 1027} {"train_loss": -5.737698554992676, "global_step": 43158, "epoch": 1027} {"train_loss": -5.8770432472229, "global_step": 43159, "epoch": 1027} {"train_loss": -5.681050777435303, "global_step": 43160, "epoch": 1027} {"train_loss": -5.792413711547852, "global_step": 43161, "epoch": 1027} {"train_loss": -5.642350196838379, "global_step": 43162, "epoch": 1027} {"train_loss": -5.607296943664551, "global_step": 43163, "epoch": 1027} {"train_loss": -5.6794939041137695, "global_step": 43164, "epoch": 1027} {"train_loss": -5.713172912597656, "global_step": 43165, "epoch": 1027} {"train_loss": -5.637402057647705, "global_step": 43166, "epoch": 1027} {"train_loss": -5.699893474578857, "global_step": 43167, "epoch": 1027} {"train_loss": -5.614607810974121, "global_step": 43168, "epoch": 1027} {"train_loss": -5.620587348937988, "global_step": 43169, "epoch": 1027} {"train_loss": -5.649518966674805, "global_step": 43170, "epoch": 1027} {"train_loss": -5.672847747802734, "global_step": 43171, "epoch": 1027} {"train_loss": -5.599594593048096, "global_step": 43172, "epoch": 1027} {"train_loss": -5.81069803237915, "global_step": 43173, "epoch": 1027} {"train_loss": -5.7209577560424805, "global_step": 43174, "epoch": 1027} {"train_loss": -5.686197155997867, "global_step": 43175, "epoch": 1027, "val_loss": 61913.36328125} {"train_loss": -5.660031318664551, "global_step": 43176, "epoch": 1028} {"train_loss": -5.594454765319824, "global_step": 43177, "epoch": 1028} {"train_loss": -5.728472709655762, "global_step": 43178, "epoch": 1028} {"train_loss": -5.787972450256348, "global_step": 43179, "epoch": 1028} {"train_loss": -5.820742607116699, "global_step": 43180, "epoch": 1028} {"train_loss": -5.759529113769531, "global_step": 43181, "epoch": 1028} {"train_loss": -5.6637444496154785, "global_step": 43182, "epoch": 1028} {"train_loss": -5.741702079772949, "global_step": 43183, "epoch": 1028} {"train_loss": -5.541375637054443, "global_step": 43184, "epoch": 1028} {"train_loss": -5.785041332244873, "global_step": 43185, "epoch": 1028} {"train_loss": -5.693388938903809, "global_step": 43186, "epoch": 1028} {"train_loss": -5.646211624145508, "global_step": 43187, "epoch": 1028} {"train_loss": -5.751100540161133, "global_step": 43188, "epoch": 1028} {"train_loss": -5.758509635925293, "global_step": 43189, "epoch": 1028} {"train_loss": -5.791954517364502, "global_step": 43190, "epoch": 1028} {"train_loss": -5.605341911315918, "global_step": 43191, "epoch": 1028} {"train_loss": -5.659238338470459, "global_step": 43192, "epoch": 1028} {"train_loss": -5.753638744354248, "global_step": 43193, "epoch": 1028} {"train_loss": -5.6832170486450195, "global_step": 43194, "epoch": 1028} {"train_loss": -5.684030055999756, "global_step": 43195, "epoch": 1028} {"train_loss": -5.604119300842285, "global_step": 43196, "epoch": 1028} {"train_loss": -5.629200458526611, "global_step": 43197, "epoch": 1028} {"train_loss": -5.580915927886963, "global_step": 43198, "epoch": 1028} {"train_loss": -5.643319129943848, "global_step": 43199, "epoch": 1028} {"train_loss": -5.680843353271484, "global_step": 43200, "epoch": 1028} {"train_loss": -5.668766021728516, "global_step": 43201, "epoch": 1028} {"train_loss": -5.6900739669799805, "global_step": 43202, "epoch": 1028} {"train_loss": -5.599054336547852, "global_step": 43203, "epoch": 1028} {"train_loss": -5.500941276550293, "global_step": 43204, "epoch": 1028} {"train_loss": -5.61104154586792, "global_step": 43205, "epoch": 1028} {"train_loss": -5.764496803283691, "global_step": 43206, "epoch": 1028} {"train_loss": -5.625154495239258, "global_step": 43207, "epoch": 1028} {"train_loss": -5.737723350524902, "global_step": 43208, "epoch": 1028} {"train_loss": -5.650671005249023, "global_step": 43209, "epoch": 1028} {"train_loss": -5.723056316375732, "global_step": 43210, "epoch": 1028} {"train_loss": -5.700412750244141, "global_step": 43211, "epoch": 1028} {"train_loss": -5.7326884269714355, "global_step": 43212, "epoch": 1028} {"train_loss": -5.5687384605407715, "global_step": 43213, "epoch": 1028} {"train_loss": -5.758947372436523, "global_step": 43214, "epoch": 1028} {"train_loss": -5.670036315917969, "global_step": 43215, "epoch": 1028} {"train_loss": -5.687821388244629, "global_step": 43216, "epoch": 1028} {"train_loss": -5.682024524325416, "global_step": 43217, "epoch": 1028, "val_loss": 61902.00390625} {"train_loss": -5.627851963043213, "global_step": 43218, "epoch": 1029} {"train_loss": -5.613933563232422, "global_step": 43219, "epoch": 1029} {"train_loss": -5.674895763397217, "global_step": 43220, "epoch": 1029} {"train_loss": -5.757951736450195, "global_step": 43221, "epoch": 1029} {"train_loss": -5.650177001953125, "global_step": 43222, "epoch": 1029} {"train_loss": -5.706302642822266, "global_step": 43223, "epoch": 1029} {"train_loss": -5.675961494445801, "global_step": 43224, "epoch": 1029} {"train_loss": -5.721831321716309, "global_step": 43225, "epoch": 1029} {"train_loss": -5.744028091430664, "global_step": 43226, "epoch": 1029} {"train_loss": -5.693703651428223, "global_step": 43227, "epoch": 1029} {"train_loss": -5.666478157043457, "global_step": 43228, "epoch": 1029} {"train_loss": -5.719566345214844, "global_step": 43229, "epoch": 1029} {"train_loss": -5.720457553863525, "global_step": 43230, "epoch": 1029} {"train_loss": -5.586606979370117, "global_step": 43231, "epoch": 1029} {"train_loss": -5.568756103515625, "global_step": 43232, "epoch": 1029} {"train_loss": -5.604822635650635, "global_step": 43233, "epoch": 1029} {"train_loss": -5.6419596672058105, "global_step": 43234, "epoch": 1029} {"train_loss": -5.604711055755615, "global_step": 43235, "epoch": 1029} {"train_loss": -5.713706016540527, "global_step": 43236, "epoch": 1029} {"train_loss": -5.77301549911499, "global_step": 43237, "epoch": 1029} {"train_loss": -5.564229965209961, "global_step": 43238, "epoch": 1029} {"train_loss": -5.728754997253418, "global_step": 43239, "epoch": 1029} {"train_loss": -5.618758201599121, "global_step": 43240, "epoch": 1029} {"train_loss": -5.683716773986816, "global_step": 43241, "epoch": 1029} {"train_loss": -5.667320251464844, "global_step": 43242, "epoch": 1029} {"train_loss": -5.627688884735107, "global_step": 43243, "epoch": 1029} {"train_loss": -5.634542465209961, "global_step": 43244, "epoch": 1029} {"train_loss": -5.781254768371582, "global_step": 43245, "epoch": 1029} {"train_loss": -5.642198085784912, "global_step": 43246, "epoch": 1029} {"train_loss": -5.735786437988281, "global_step": 43247, "epoch": 1029} {"train_loss": -5.675439357757568, "global_step": 43248, "epoch": 1029} {"train_loss": -5.603161811828613, "global_step": 43249, "epoch": 1029} {"train_loss": -5.683656692504883, "global_step": 43250, "epoch": 1029} {"train_loss": -5.616272926330566, "global_step": 43251, "epoch": 1029} {"train_loss": -5.656975746154785, "global_step": 43252, "epoch": 1029} {"train_loss": -5.608895301818848, "global_step": 43253, "epoch": 1029} {"train_loss": -5.580748081207275, "global_step": 43254, "epoch": 1029} {"train_loss": -5.690670013427734, "global_step": 43255, "epoch": 1029} {"train_loss": -5.697473526000977, "global_step": 43256, "epoch": 1029} {"train_loss": -5.742014408111572, "global_step": 43257, "epoch": 1029} {"train_loss": -5.718778610229492, "global_step": 43258, "epoch": 1029} {"train_loss": -5.667202529453096, "global_step": 43259, "epoch": 1029, "val_loss": 61764.0} {"train_loss": -5.666568279266357, "global_step": 43260, "epoch": 1030} {"train_loss": -5.690018653869629, "global_step": 43261, "epoch": 1030} {"train_loss": -5.703176498413086, "global_step": 43262, "epoch": 1030} {"train_loss": -5.567457675933838, "global_step": 43263, "epoch": 1030} {"train_loss": -5.603748321533203, "global_step": 43264, "epoch": 1030} {"train_loss": -5.572227954864502, "global_step": 43265, "epoch": 1030} {"train_loss": -5.73596715927124, "global_step": 43266, "epoch": 1030} {"train_loss": -5.713920593261719, "global_step": 43267, "epoch": 1030} {"train_loss": -5.670607566833496, "global_step": 43268, "epoch": 1030} {"train_loss": -5.66156005859375, "global_step": 43269, "epoch": 1030} {"train_loss": -5.674683094024658, "global_step": 43270, "epoch": 1030} {"train_loss": -5.584443092346191, "global_step": 43271, "epoch": 1030} {"train_loss": -5.600231647491455, "global_step": 43272, "epoch": 1030} {"train_loss": -5.668241500854492, "global_step": 43273, "epoch": 1030} {"train_loss": -5.6693620681762695, "global_step": 43274, "epoch": 1030} {"train_loss": -5.786718368530273, "global_step": 43275, "epoch": 1030} {"train_loss": -5.777371406555176, "global_step": 43276, "epoch": 1030} {"train_loss": -5.720058917999268, "global_step": 43277, "epoch": 1030} {"train_loss": -5.640610694885254, "global_step": 43278, "epoch": 1030} {"train_loss": -5.676613807678223, "global_step": 43279, "epoch": 1030} {"train_loss": -5.6754374504089355, "global_step": 43280, "epoch": 1030} {"train_loss": -5.7528276443481445, "global_step": 43281, "epoch": 1030} {"train_loss": -5.522086143493652, "global_step": 43282, "epoch": 1030} {"train_loss": -5.630936622619629, "global_step": 43283, "epoch": 1030} {"train_loss": -5.677076816558838, "global_step": 43284, "epoch": 1030} {"train_loss": -5.658561706542969, "global_step": 43285, "epoch": 1030} {"train_loss": -5.716768264770508, "global_step": 43286, "epoch": 1030} {"train_loss": -5.666810035705566, "global_step": 43287, "epoch": 1030} {"train_loss": -5.760837554931641, "global_step": 43288, "epoch": 1030} {"train_loss": -5.768898010253906, "global_step": 43289, "epoch": 1030} {"train_loss": -5.721741676330566, "global_step": 43290, "epoch": 1030} {"train_loss": -5.7929182052612305, "global_step": 43291, "epoch": 1030} {"train_loss": -5.6016645431518555, "global_step": 43292, "epoch": 1030} {"train_loss": -5.681527614593506, "global_step": 43293, "epoch": 1030} {"train_loss": -5.81816291809082, "global_step": 43294, "epoch": 1030} {"train_loss": -5.712183952331543, "global_step": 43295, "epoch": 1030} {"train_loss": -5.7243757247924805, "global_step": 43296, "epoch": 1030} {"train_loss": -5.740104675292969, "global_step": 43297, "epoch": 1030} {"train_loss": -5.652732849121094, "global_step": 43298, "epoch": 1030} {"train_loss": -5.7387614250183105, "global_step": 43299, "epoch": 1030} {"train_loss": -5.619072914123535, "global_step": 43300, "epoch": 1030} {"train_loss": -5.685366675967262, "global_step": 43301, "epoch": 1030, "val_loss": 61538.9765625} {"train_loss": -5.737337112426758, "global_step": 43302, "epoch": 1031} {"train_loss": -5.847036838531494, "global_step": 43303, "epoch": 1031} {"train_loss": -5.749827861785889, "global_step": 43304, "epoch": 1031} {"train_loss": -5.718145847320557, "global_step": 43305, "epoch": 1031} {"train_loss": -5.651333808898926, "global_step": 43306, "epoch": 1031} {"train_loss": -5.703516960144043, "global_step": 43307, "epoch": 1031} {"train_loss": -5.7718305587768555, "global_step": 43308, "epoch": 1031} {"train_loss": -5.6675214767456055, "global_step": 43309, "epoch": 1031} {"train_loss": -5.629607677459717, "global_step": 43310, "epoch": 1031} {"train_loss": -5.660862922668457, "global_step": 43311, "epoch": 1031} {"train_loss": -5.746244430541992, "global_step": 43312, "epoch": 1031} {"train_loss": -5.6455302238464355, "global_step": 43313, "epoch": 1031} {"train_loss": -5.708008766174316, "global_step": 43314, "epoch": 1031} {"train_loss": -5.708710670471191, "global_step": 43315, "epoch": 1031} {"train_loss": -5.5749053955078125, "global_step": 43316, "epoch": 1031} {"train_loss": -5.750968933105469, "global_step": 43317, "epoch": 1031} {"train_loss": -5.754850387573242, "global_step": 43318, "epoch": 1031} {"train_loss": -5.657021522521973, "global_step": 43319, "epoch": 1031} {"train_loss": -5.739254951477051, "global_step": 43320, "epoch": 1031} {"train_loss": -5.738592147827148, "global_step": 43321, "epoch": 1031} {"train_loss": -5.599653244018555, "global_step": 43322, "epoch": 1031} {"train_loss": -5.508693695068359, "global_step": 43323, "epoch": 1031} {"train_loss": -5.6163506507873535, "global_step": 43324, "epoch": 1031} {"train_loss": -5.474603652954102, "global_step": 43325, "epoch": 1031} {"train_loss": -5.695699691772461, "global_step": 43326, "epoch": 1031} {"train_loss": -5.848659515380859, "global_step": 43327, "epoch": 1031} {"train_loss": -5.488467693328857, "global_step": 43328, "epoch": 1031} {"train_loss": -5.765690803527832, "global_step": 43329, "epoch": 1031} {"train_loss": -5.579771518707275, "global_step": 43330, "epoch": 1031} {"train_loss": -5.607481002807617, "global_step": 43331, "epoch": 1031} {"train_loss": -5.749631881713867, "global_step": 43332, "epoch": 1031} {"train_loss": -5.625444412231445, "global_step": 43333, "epoch": 1031} {"train_loss": -5.76461124420166, "global_step": 43334, "epoch": 1031} {"train_loss": -5.717830657958984, "global_step": 43335, "epoch": 1031} {"train_loss": -5.69893741607666, "global_step": 43336, "epoch": 1031} {"train_loss": -5.795434951782227, "global_step": 43337, "epoch": 1031} {"train_loss": -5.691967487335205, "global_step": 43338, "epoch": 1031} {"train_loss": -5.718645095825195, "global_step": 43339, "epoch": 1031} {"train_loss": -5.732904434204102, "global_step": 43340, "epoch": 1031} {"train_loss": -5.80040168762207, "global_step": 43341, "epoch": 1031} {"train_loss": -5.6355109214782715, "global_step": 43342, "epoch": 1031} {"train_loss": -5.686342625390916, "global_step": 43343, "epoch": 1031, "val_loss": 61596.33984375} {"train_loss": -5.686779022216797, "global_step": 43344, "epoch": 1032} {"train_loss": -5.5792365074157715, "global_step": 43345, "epoch": 1032} {"train_loss": -5.610074996948242, "global_step": 43346, "epoch": 1032} {"train_loss": -5.679771423339844, "global_step": 43347, "epoch": 1032} {"train_loss": -5.733864784240723, "global_step": 43348, "epoch": 1032} {"train_loss": -5.535281181335449, "global_step": 43349, "epoch": 1032} {"train_loss": -5.716611862182617, "global_step": 43350, "epoch": 1032} {"train_loss": -5.623777389526367, "global_step": 43351, "epoch": 1032} {"train_loss": -5.6631646156311035, "global_step": 43352, "epoch": 1032} {"train_loss": -5.6500091552734375, "global_step": 43353, "epoch": 1032} {"train_loss": -5.63371467590332, "global_step": 43354, "epoch": 1032} {"train_loss": -5.6302995681762695, "global_step": 43355, "epoch": 1032} {"train_loss": -5.686540603637695, "global_step": 43356, "epoch": 1032} {"train_loss": -5.5612874031066895, "global_step": 43357, "epoch": 1032} {"train_loss": -5.624671936035156, "global_step": 43358, "epoch": 1032} {"train_loss": -5.7301483154296875, "global_step": 43359, "epoch": 1032} {"train_loss": -5.6670403480529785, "global_step": 43360, "epoch": 1032} {"train_loss": -5.63435173034668, "global_step": 43361, "epoch": 1032} {"train_loss": -5.768620491027832, "global_step": 43362, "epoch": 1032} {"train_loss": -5.624388217926025, "global_step": 43363, "epoch": 1032} {"train_loss": -5.693673133850098, "global_step": 43364, "epoch": 1032} {"train_loss": -5.739760875701904, "global_step": 43365, "epoch": 1032} {"train_loss": -5.6188764572143555, "global_step": 43366, "epoch": 1032} {"train_loss": -5.699109077453613, "global_step": 43367, "epoch": 1032} {"train_loss": -5.741563320159912, "global_step": 43368, "epoch": 1032} {"train_loss": -5.552448749542236, "global_step": 43369, "epoch": 1032} {"train_loss": -5.626770973205566, "global_step": 43370, "epoch": 1032} {"train_loss": -5.627051830291748, "global_step": 43371, "epoch": 1032} {"train_loss": -5.5886640548706055, "global_step": 43372, "epoch": 1032} {"train_loss": -5.718911170959473, "global_step": 43373, "epoch": 1032} {"train_loss": -5.5447998046875, "global_step": 43374, "epoch": 1032} {"train_loss": -5.659088134765625, "global_step": 43375, "epoch": 1032} {"train_loss": -5.788609504699707, "global_step": 43376, "epoch": 1032} {"train_loss": -5.49375581741333, "global_step": 43377, "epoch": 1032} {"train_loss": -5.7830634117126465, "global_step": 43378, "epoch": 1032} {"train_loss": -5.655686378479004, "global_step": 43379, "epoch": 1032} {"train_loss": -5.728169918060303, "global_step": 43380, "epoch": 1032} {"train_loss": -5.608243942260742, "global_step": 43381, "epoch": 1032} {"train_loss": -5.662062644958496, "global_step": 43382, "epoch": 1032} {"train_loss": -5.559975624084473, "global_step": 43383, "epoch": 1032} {"train_loss": -5.584139823913574, "global_step": 43384, "epoch": 1032} {"train_loss": -5.651770080838885, "global_step": 43385, "epoch": 1032, "val_loss": 62046.59375} {"train_loss": -5.692615985870361, "global_step": 43386, "epoch": 1033} {"train_loss": -5.780606269836426, "global_step": 43387, "epoch": 1033} {"train_loss": -5.632108211517334, "global_step": 43388, "epoch": 1033} {"train_loss": -5.70238733291626, "global_step": 43389, "epoch": 1033} {"train_loss": -5.813815116882324, "global_step": 43390, "epoch": 1033} {"train_loss": -5.710714817047119, "global_step": 43391, "epoch": 1033} {"train_loss": -5.854021072387695, "global_step": 43392, "epoch": 1033} {"train_loss": -5.666072368621826, "global_step": 43393, "epoch": 1033} {"train_loss": -5.661735534667969, "global_step": 43394, "epoch": 1033} {"train_loss": -5.755502700805664, "global_step": 43395, "epoch": 1033} {"train_loss": -5.654052257537842, "global_step": 43396, "epoch": 1033} {"train_loss": -5.766955375671387, "global_step": 43397, "epoch": 1033} {"train_loss": -5.776094436645508, "global_step": 43398, "epoch": 1033} {"train_loss": -5.668844699859619, "global_step": 43399, "epoch": 1033} {"train_loss": -5.713678359985352, "global_step": 43400, "epoch": 1033} {"train_loss": -5.657017707824707, "global_step": 43401, "epoch": 1033} {"train_loss": -5.709395408630371, "global_step": 43402, "epoch": 1033} {"train_loss": -5.665492534637451, "global_step": 43403, "epoch": 1033} {"train_loss": -5.7528791427612305, "global_step": 43404, "epoch": 1033} {"train_loss": -5.638066291809082, "global_step": 43405, "epoch": 1033} {"train_loss": -5.633884906768799, "global_step": 43406, "epoch": 1033} {"train_loss": -5.742472171783447, "global_step": 43407, "epoch": 1033} {"train_loss": -5.607673168182373, "global_step": 43408, "epoch": 1033} {"train_loss": -5.526749610900879, "global_step": 43409, "epoch": 1033} {"train_loss": -5.669851303100586, "global_step": 43410, "epoch": 1033} {"train_loss": -5.599693298339844, "global_step": 43411, "epoch": 1033} {"train_loss": -5.689328670501709, "global_step": 43412, "epoch": 1033} {"train_loss": -5.6772966384887695, "global_step": 43413, "epoch": 1033} {"train_loss": -5.603194236755371, "global_step": 43414, "epoch": 1033} {"train_loss": -5.631446361541748, "global_step": 43415, "epoch": 1033} {"train_loss": -5.6848602294921875, "global_step": 43416, "epoch": 1033} {"train_loss": -5.684422016143799, "global_step": 43417, "epoch": 1033} {"train_loss": -5.756772518157959, "global_step": 43418, "epoch": 1033} {"train_loss": -5.571511268615723, "global_step": 43419, "epoch": 1033} {"train_loss": -5.513158798217773, "global_step": 43420, "epoch": 1033} {"train_loss": -5.610849380493164, "global_step": 43421, "epoch": 1033} {"train_loss": -5.658574104309082, "global_step": 43422, "epoch": 1033} {"train_loss": -5.578859329223633, "global_step": 43423, "epoch": 1033} {"train_loss": -5.536026477813721, "global_step": 43424, "epoch": 1033} {"train_loss": -5.674073219299316, "global_step": 43425, "epoch": 1033} {"train_loss": -5.77515172958374, "global_step": 43426, "epoch": 1033} {"train_loss": -5.671175491242182, "global_step": 43427, "epoch": 1033, "val_loss": 61591.4375} {"train_loss": -5.689582824707031, "global_step": 43428, "epoch": 1034} {"train_loss": -5.624292850494385, "global_step": 43429, "epoch": 1034} {"train_loss": -5.592589378356934, "global_step": 43430, "epoch": 1034} {"train_loss": -5.6879754066467285, "global_step": 43431, "epoch": 1034} {"train_loss": -5.5586700439453125, "global_step": 43432, "epoch": 1034} {"train_loss": -5.7239484786987305, "global_step": 43433, "epoch": 1034} {"train_loss": -5.59774112701416, "global_step": 43434, "epoch": 1034} {"train_loss": -5.662911891937256, "global_step": 43435, "epoch": 1034} {"train_loss": -5.5797529220581055, "global_step": 43436, "epoch": 1034} {"train_loss": -5.581796646118164, "global_step": 43437, "epoch": 1034} {"train_loss": -5.692387580871582, "global_step": 43438, "epoch": 1034} {"train_loss": -5.79008150100708, "global_step": 43439, "epoch": 1034} {"train_loss": -5.626769065856934, "global_step": 43440, "epoch": 1034} {"train_loss": -5.815107345581055, "global_step": 43441, "epoch": 1034} {"train_loss": -5.649482727050781, "global_step": 43442, "epoch": 1034} {"train_loss": -5.703772068023682, "global_step": 43443, "epoch": 1034} {"train_loss": -5.754033088684082, "global_step": 43444, "epoch": 1034} {"train_loss": -5.708938121795654, "global_step": 43445, "epoch": 1034} {"train_loss": -5.608887672424316, "global_step": 43446, "epoch": 1034} {"train_loss": -5.655465126037598, "global_step": 43447, "epoch": 1034} {"train_loss": -5.804563522338867, "global_step": 43448, "epoch": 1034} {"train_loss": -5.5614423751831055, "global_step": 43449, "epoch": 1034} {"train_loss": -5.765589714050293, "global_step": 43450, "epoch": 1034} {"train_loss": -5.75062894821167, "global_step": 43451, "epoch": 1034} {"train_loss": -5.633857250213623, "global_step": 43452, "epoch": 1034} {"train_loss": -5.695013999938965, "global_step": 43453, "epoch": 1034} {"train_loss": -5.7787957191467285, "global_step": 43454, "epoch": 1034} {"train_loss": -5.731323719024658, "global_step": 43455, "epoch": 1034} {"train_loss": -5.751041412353516, "global_step": 43456, "epoch": 1034} {"train_loss": -5.757269382476807, "global_step": 43457, "epoch": 1034} {"train_loss": -5.5942888259887695, "global_step": 43458, "epoch": 1034} {"train_loss": -5.827345371246338, "global_step": 43459, "epoch": 1034} {"train_loss": -5.513758659362793, "global_step": 43460, "epoch": 1034} {"train_loss": -5.583720684051514, "global_step": 43461, "epoch": 1034} {"train_loss": -5.80520486831665, "global_step": 43462, "epoch": 1034} {"train_loss": -5.705533027648926, "global_step": 43463, "epoch": 1034} {"train_loss": -5.605408191680908, "global_step": 43464, "epoch": 1034} {"train_loss": -5.817194938659668, "global_step": 43465, "epoch": 1034} {"train_loss": -5.561166763305664, "global_step": 43466, "epoch": 1034} {"train_loss": -5.7360334396362305, "global_step": 43467, "epoch": 1034} {"train_loss": -5.547438144683838, "global_step": 43468, "epoch": 1034} {"train_loss": -5.6832610084896995, "global_step": 43469, "epoch": 1034, "val_loss": 61799.1953125} {"train_loss": -5.663789749145508, "global_step": 43470, "epoch": 1035} {"train_loss": -5.706171989440918, "global_step": 43471, "epoch": 1035} {"train_loss": -5.5879716873168945, "global_step": 43472, "epoch": 1035} {"train_loss": -5.815604209899902, "global_step": 43473, "epoch": 1035} {"train_loss": -5.711237907409668, "global_step": 43474, "epoch": 1035} {"train_loss": -5.709753513336182, "global_step": 43475, "epoch": 1035} {"train_loss": -5.67513370513916, "global_step": 43476, "epoch": 1035} {"train_loss": -5.8079071044921875, "global_step": 43477, "epoch": 1035} {"train_loss": -5.624709129333496, "global_step": 43478, "epoch": 1035} {"train_loss": -5.7807230949401855, "global_step": 43479, "epoch": 1035} {"train_loss": -5.7128753662109375, "global_step": 43480, "epoch": 1035} {"train_loss": -5.692241668701172, "global_step": 43481, "epoch": 1035} {"train_loss": -5.690101146697998, "global_step": 43482, "epoch": 1035} {"train_loss": -5.683734893798828, "global_step": 43483, "epoch": 1035} {"train_loss": -5.6628313064575195, "global_step": 43484, "epoch": 1035} {"train_loss": -5.696916580200195, "global_step": 43485, "epoch": 1035} {"train_loss": -5.7502760887146, "global_step": 43486, "epoch": 1035} {"train_loss": -5.613565921783447, "global_step": 43487, "epoch": 1035} {"train_loss": -5.675606727600098, "global_step": 43488, "epoch": 1035} {"train_loss": -5.588793754577637, "global_step": 43489, "epoch": 1035} {"train_loss": -5.641106605529785, "global_step": 43490, "epoch": 1035} {"train_loss": -5.728667736053467, "global_step": 43491, "epoch": 1035} {"train_loss": -5.639762878417969, "global_step": 43492, "epoch": 1035} {"train_loss": -5.74483060836792, "global_step": 43493, "epoch": 1035} {"train_loss": -5.701031684875488, "global_step": 43494, "epoch": 1035} {"train_loss": -5.6459808349609375, "global_step": 43495, "epoch": 1035} {"train_loss": -5.66087532043457, "global_step": 43496, "epoch": 1035} {"train_loss": -5.674293518066406, "global_step": 43497, "epoch": 1035} {"train_loss": -5.724666595458984, "global_step": 43498, "epoch": 1035} {"train_loss": -5.654600143432617, "global_step": 43499, "epoch": 1035} {"train_loss": -5.692927837371826, "global_step": 43500, "epoch": 1035} {"train_loss": -5.698772430419922, "global_step": 43501, "epoch": 1035} {"train_loss": -5.713428497314453, "global_step": 43502, "epoch": 1035} {"train_loss": -5.562224388122559, "global_step": 43503, "epoch": 1035} {"train_loss": -5.708208084106445, "global_step": 43504, "epoch": 1035} {"train_loss": -5.713344573974609, "global_step": 43505, "epoch": 1035} {"train_loss": -5.8673906326293945, "global_step": 43506, "epoch": 1035} {"train_loss": -5.78304386138916, "global_step": 43507, "epoch": 1035} {"train_loss": -5.752017974853516, "global_step": 43508, "epoch": 1035} {"train_loss": -5.83024787902832, "global_step": 43509, "epoch": 1035} {"train_loss": -5.636691570281982, "global_step": 43510, "epoch": 1035} {"train_loss": -5.6960385753994895, "global_step": 43511, "epoch": 1035, "val_loss": 61656.890625} {"train_loss": -5.856967926025391, "global_step": 43512, "epoch": 1036} {"train_loss": -5.663423538208008, "global_step": 43513, "epoch": 1036} {"train_loss": -5.676668167114258, "global_step": 43514, "epoch": 1036} {"train_loss": -5.703832626342773, "global_step": 43515, "epoch": 1036} {"train_loss": -5.654261589050293, "global_step": 43516, "epoch": 1036} {"train_loss": -5.662909507751465, "global_step": 43517, "epoch": 1036} {"train_loss": -5.741762161254883, "global_step": 43518, "epoch": 1036} {"train_loss": -5.643194675445557, "global_step": 43519, "epoch": 1036} {"train_loss": -5.713873863220215, "global_step": 43520, "epoch": 1036} {"train_loss": -5.680356025695801, "global_step": 43521, "epoch": 1036} {"train_loss": -5.607979774475098, "global_step": 43522, "epoch": 1036} {"train_loss": -5.672786712646484, "global_step": 43523, "epoch": 1036} {"train_loss": -5.74346923828125, "global_step": 43524, "epoch": 1036} {"train_loss": -5.8093976974487305, "global_step": 43525, "epoch": 1036} {"train_loss": -5.596166610717773, "global_step": 43526, "epoch": 1036} {"train_loss": -5.72455358505249, "global_step": 43527, "epoch": 1036} {"train_loss": -5.722668647766113, "global_step": 43528, "epoch": 1036} {"train_loss": -5.626041412353516, "global_step": 43529, "epoch": 1036} {"train_loss": -5.840188026428223, "global_step": 43530, "epoch": 1036} {"train_loss": -5.8203558921813965, "global_step": 43531, "epoch": 1036} {"train_loss": -5.7415666580200195, "global_step": 43532, "epoch": 1036} {"train_loss": -5.676558494567871, "global_step": 43533, "epoch": 1036} {"train_loss": -5.647396564483643, "global_step": 43534, "epoch": 1036} {"train_loss": -5.686203956604004, "global_step": 43535, "epoch": 1036} {"train_loss": -5.6677565574646, "global_step": 43536, "epoch": 1036} {"train_loss": -5.758197784423828, "global_step": 43537, "epoch": 1036} {"train_loss": -5.676177501678467, "global_step": 43538, "epoch": 1036} {"train_loss": -5.808785915374756, "global_step": 43539, "epoch": 1036} {"train_loss": -5.626186847686768, "global_step": 43540, "epoch": 1036} {"train_loss": -5.697451114654541, "global_step": 43541, "epoch": 1036} {"train_loss": -5.512899398803711, "global_step": 43542, "epoch": 1036} {"train_loss": -5.681170463562012, "global_step": 43543, "epoch": 1036} {"train_loss": -5.651773452758789, "global_step": 43544, "epoch": 1036} {"train_loss": -5.67186164855957, "global_step": 43545, "epoch": 1036} {"train_loss": -5.556143760681152, "global_step": 43546, "epoch": 1036} {"train_loss": -5.6241230964660645, "global_step": 43547, "epoch": 1036} {"train_loss": -5.638613700866699, "global_step": 43548, "epoch": 1036} {"train_loss": -5.5886077880859375, "global_step": 43549, "epoch": 1036} {"train_loss": -5.813748359680176, "global_step": 43550, "epoch": 1036} {"train_loss": -5.735151767730713, "global_step": 43551, "epoch": 1036} {"train_loss": -5.692598342895508, "global_step": 43552, "epoch": 1036} {"train_loss": -5.690664563860212, "global_step": 43553, "epoch": 1036, "val_loss": 61628.83984375} {"train_loss": -5.744885444641113, "global_step": 43554, "epoch": 1037} {"train_loss": -5.646542549133301, "global_step": 43555, "epoch": 1037} {"train_loss": -5.800547122955322, "global_step": 43556, "epoch": 1037} {"train_loss": -5.680137634277344, "global_step": 43557, "epoch": 1037} {"train_loss": -5.721043586730957, "global_step": 43558, "epoch": 1037} {"train_loss": -5.688414573669434, "global_step": 43559, "epoch": 1037} {"train_loss": -5.709502696990967, "global_step": 43560, "epoch": 1037} {"train_loss": -5.795724868774414, "global_step": 43561, "epoch": 1037} {"train_loss": -5.677818298339844, "global_step": 43562, "epoch": 1037} {"train_loss": -5.720267295837402, "global_step": 43563, "epoch": 1037} {"train_loss": -5.583789348602295, "global_step": 43564, "epoch": 1037} {"train_loss": -5.740461349487305, "global_step": 43565, "epoch": 1037} {"train_loss": -5.736451148986816, "global_step": 43566, "epoch": 1037} {"train_loss": -5.605250358581543, "global_step": 43567, "epoch": 1037} {"train_loss": -5.587745666503906, "global_step": 43568, "epoch": 1037} {"train_loss": -5.718637466430664, "global_step": 43569, "epoch": 1037} {"train_loss": -5.71042537689209, "global_step": 43570, "epoch": 1037} {"train_loss": -5.695370674133301, "global_step": 43571, "epoch": 1037} {"train_loss": -5.655872344970703, "global_step": 43572, "epoch": 1037} {"train_loss": -5.769511699676514, "global_step": 43573, "epoch": 1037} {"train_loss": -5.623715400695801, "global_step": 43574, "epoch": 1037} {"train_loss": -5.6571149826049805, "global_step": 43575, "epoch": 1037} {"train_loss": -5.6510090827941895, "global_step": 43576, "epoch": 1037} {"train_loss": -5.685789108276367, "global_step": 43577, "epoch": 1037} {"train_loss": -5.663597106933594, "global_step": 43578, "epoch": 1037} {"train_loss": -5.57234525680542, "global_step": 43579, "epoch": 1037} {"train_loss": -5.587727069854736, "global_step": 43580, "epoch": 1037} {"train_loss": -5.827085494995117, "global_step": 43581, "epoch": 1037} {"train_loss": -5.606021881103516, "global_step": 43582, "epoch": 1037} {"train_loss": -5.6427001953125, "global_step": 43583, "epoch": 1037} {"train_loss": -5.756310939788818, "global_step": 43584, "epoch": 1037} {"train_loss": -5.725820541381836, "global_step": 43585, "epoch": 1037} {"train_loss": -5.587769985198975, "global_step": 43586, "epoch": 1037} {"train_loss": -5.661938667297363, "global_step": 43587, "epoch": 1037} {"train_loss": -5.739612579345703, "global_step": 43588, "epoch": 1037} {"train_loss": -5.720637321472168, "global_step": 43589, "epoch": 1037} {"train_loss": -5.722614288330078, "global_step": 43590, "epoch": 1037} {"train_loss": -5.669408798217773, "global_step": 43591, "epoch": 1037} {"train_loss": -5.712972164154053, "global_step": 43592, "epoch": 1037} {"train_loss": -5.732144355773926, "global_step": 43593, "epoch": 1037} {"train_loss": -5.598259925842285, "global_step": 43594, "epoch": 1037} {"train_loss": -5.688562438601539, "global_step": 43595, "epoch": 1037, "val_loss": 61812.140625} {"train_loss": -5.716289043426514, "global_step": 43596, "epoch": 1038} {"train_loss": -5.68803596496582, "global_step": 43597, "epoch": 1038} {"train_loss": -5.720906734466553, "global_step": 43598, "epoch": 1038} {"train_loss": -5.689746856689453, "global_step": 43599, "epoch": 1038} {"train_loss": -5.749577522277832, "global_step": 43600, "epoch": 1038} {"train_loss": -5.775491714477539, "global_step": 43601, "epoch": 1038} {"train_loss": -5.616164207458496, "global_step": 43602, "epoch": 1038} {"train_loss": -5.692866325378418, "global_step": 43603, "epoch": 1038} {"train_loss": -5.672369956970215, "global_step": 43604, "epoch": 1038} {"train_loss": -5.590209007263184, "global_step": 43605, "epoch": 1038} {"train_loss": -5.72585916519165, "global_step": 43606, "epoch": 1038} {"train_loss": -5.689988613128662, "global_step": 43607, "epoch": 1038} {"train_loss": -5.546911239624023, "global_step": 43608, "epoch": 1038} {"train_loss": -5.775261878967285, "global_step": 43609, "epoch": 1038} {"train_loss": -5.587922096252441, "global_step": 43610, "epoch": 1038} {"train_loss": -5.748967170715332, "global_step": 43611, "epoch": 1038} {"train_loss": -5.721234321594238, "global_step": 43612, "epoch": 1038} {"train_loss": -5.571208953857422, "global_step": 43613, "epoch": 1038} {"train_loss": -5.587161064147949, "global_step": 43614, "epoch": 1038} {"train_loss": -5.66396951675415, "global_step": 43615, "epoch": 1038} {"train_loss": -5.698267936706543, "global_step": 43616, "epoch": 1038} {"train_loss": -5.846630096435547, "global_step": 43617, "epoch": 1038} {"train_loss": -5.788375377655029, "global_step": 43618, "epoch": 1038} {"train_loss": -5.740901947021484, "global_step": 43619, "epoch": 1038} {"train_loss": -5.759517669677734, "global_step": 43620, "epoch": 1038} {"train_loss": -5.623702049255371, "global_step": 43621, "epoch": 1038} {"train_loss": -5.663226127624512, "global_step": 43622, "epoch": 1038} {"train_loss": -5.72227144241333, "global_step": 43623, "epoch": 1038} {"train_loss": -5.739955902099609, "global_step": 43624, "epoch": 1038} {"train_loss": -5.671006202697754, "global_step": 43625, "epoch": 1038} {"train_loss": -5.763280868530273, "global_step": 43626, "epoch": 1038} {"train_loss": -5.605589866638184, "global_step": 43627, "epoch": 1038} {"train_loss": -5.644233703613281, "global_step": 43628, "epoch": 1038} {"train_loss": -5.709380626678467, "global_step": 43629, "epoch": 1038} {"train_loss": -5.725696563720703, "global_step": 43630, "epoch": 1038} {"train_loss": -5.766666412353516, "global_step": 43631, "epoch": 1038} {"train_loss": -5.757716655731201, "global_step": 43632, "epoch": 1038} {"train_loss": -5.763944625854492, "global_step": 43633, "epoch": 1038} {"train_loss": -5.566661357879639, "global_step": 43634, "epoch": 1038} {"train_loss": -5.726164817810059, "global_step": 43635, "epoch": 1038} {"train_loss": -5.652750015258789, "global_step": 43636, "epoch": 1038} {"train_loss": -5.692947035744076, "global_step": 43637, "epoch": 1038, "val_loss": 61579.8359375} {"train_loss": -5.785057067871094, "global_step": 43638, "epoch": 1039} {"train_loss": -5.673067569732666, "global_step": 43639, "epoch": 1039} {"train_loss": -5.818133354187012, "global_step": 43640, "epoch": 1039} {"train_loss": -5.793566703796387, "global_step": 43641, "epoch": 1039} {"train_loss": -5.70395040512085, "global_step": 43642, "epoch": 1039} {"train_loss": -5.703505992889404, "global_step": 43643, "epoch": 1039} {"train_loss": -5.756814956665039, "global_step": 43644, "epoch": 1039} {"train_loss": -5.735180854797363, "global_step": 43645, "epoch": 1039} {"train_loss": -5.721837043762207, "global_step": 43646, "epoch": 1039} {"train_loss": -5.675259590148926, "global_step": 43647, "epoch": 1039} {"train_loss": -5.720736503601074, "global_step": 43648, "epoch": 1039} {"train_loss": -5.703377723693848, "global_step": 43649, "epoch": 1039} {"train_loss": -5.584630012512207, "global_step": 43650, "epoch": 1039} {"train_loss": -5.636616230010986, "global_step": 43651, "epoch": 1039} {"train_loss": -5.710700035095215, "global_step": 43652, "epoch": 1039} {"train_loss": -5.736207962036133, "global_step": 43653, "epoch": 1039} {"train_loss": -5.818778991699219, "global_step": 43654, "epoch": 1039} {"train_loss": -5.66585111618042, "global_step": 43655, "epoch": 1039} {"train_loss": -5.775724411010742, "global_step": 43656, "epoch": 1039} {"train_loss": -5.637073516845703, "global_step": 43657, "epoch": 1039} {"train_loss": -5.77244758605957, "global_step": 43658, "epoch": 1039} {"train_loss": -5.726971626281738, "global_step": 43659, "epoch": 1039} {"train_loss": -5.786487579345703, "global_step": 43660, "epoch": 1039} {"train_loss": -5.513457298278809, "global_step": 43661, "epoch": 1039} {"train_loss": -5.614590167999268, "global_step": 43662, "epoch": 1039} {"train_loss": -5.767152786254883, "global_step": 43663, "epoch": 1039} {"train_loss": -5.75377082824707, "global_step": 43664, "epoch": 1039} {"train_loss": -5.755241394042969, "global_step": 43665, "epoch": 1039} {"train_loss": -5.622518539428711, "global_step": 43666, "epoch": 1039} {"train_loss": -5.589108943939209, "global_step": 43667, "epoch": 1039} {"train_loss": -5.833582878112793, "global_step": 43668, "epoch": 1039} {"train_loss": -5.719820976257324, "global_step": 43669, "epoch": 1039} {"train_loss": -5.62013053894043, "global_step": 43670, "epoch": 1039} {"train_loss": -5.742762565612793, "global_step": 43671, "epoch": 1039} {"train_loss": -5.631826877593994, "global_step": 43672, "epoch": 1039} {"train_loss": -5.680379867553711, "global_step": 43673, "epoch": 1039} {"train_loss": -5.751108646392822, "global_step": 43674, "epoch": 1039} {"train_loss": -5.705018997192383, "global_step": 43675, "epoch": 1039} {"train_loss": -5.601957321166992, "global_step": 43676, "epoch": 1039} {"train_loss": -5.683870792388916, "global_step": 43677, "epoch": 1039} {"train_loss": -5.68449068069458, "global_step": 43678, "epoch": 1039} {"train_loss": -5.702359449295771, "global_step": 43679, "epoch": 1039, "val_loss": 61751.2265625} {"train_loss": -5.61881685256958, "global_step": 43680, "epoch": 1040} {"train_loss": -5.801424503326416, "global_step": 43681, "epoch": 1040} {"train_loss": -5.607476234436035, "global_step": 43682, "epoch": 1040} {"train_loss": -5.697652339935303, "global_step": 43683, "epoch": 1040} {"train_loss": -5.596172332763672, "global_step": 43684, "epoch": 1040} {"train_loss": -5.565861701965332, "global_step": 43685, "epoch": 1040} {"train_loss": -5.594358444213867, "global_step": 43686, "epoch": 1040} {"train_loss": -5.709846496582031, "global_step": 43687, "epoch": 1040} {"train_loss": -5.69194221496582, "global_step": 43688, "epoch": 1040} {"train_loss": -5.700018882751465, "global_step": 43689, "epoch": 1040} {"train_loss": -5.800146102905273, "global_step": 43690, "epoch": 1040} {"train_loss": -5.718371391296387, "global_step": 43691, "epoch": 1040} {"train_loss": -5.629509925842285, "global_step": 43692, "epoch": 1040} {"train_loss": -5.814266204833984, "global_step": 43693, "epoch": 1040} {"train_loss": -5.74683141708374, "global_step": 43694, "epoch": 1040} {"train_loss": -5.619672775268555, "global_step": 43695, "epoch": 1040} {"train_loss": -5.719411373138428, "global_step": 43696, "epoch": 1040} {"train_loss": -5.636186599731445, "global_step": 43697, "epoch": 1040} {"train_loss": -5.610176086425781, "global_step": 43698, "epoch": 1040} {"train_loss": -5.610625267028809, "global_step": 43699, "epoch": 1040} {"train_loss": -5.652655124664307, "global_step": 43700, "epoch": 1040} {"train_loss": -5.632233142852783, "global_step": 43701, "epoch": 1040} {"train_loss": -5.629995822906494, "global_step": 43702, "epoch": 1040} {"train_loss": -5.595856666564941, "global_step": 43703, "epoch": 1040} {"train_loss": -5.665820121765137, "global_step": 43704, "epoch": 1040} {"train_loss": -5.830279350280762, "global_step": 43705, "epoch": 1040} {"train_loss": -5.5657148361206055, "global_step": 43706, "epoch": 1040} {"train_loss": -5.607574462890625, "global_step": 43707, "epoch": 1040} {"train_loss": -5.706296920776367, "global_step": 43708, "epoch": 1040} {"train_loss": -5.734463691711426, "global_step": 43709, "epoch": 1040} {"train_loss": -5.64845609664917, "global_step": 43710, "epoch": 1040} {"train_loss": -5.746890068054199, "global_step": 43711, "epoch": 1040} {"train_loss": -5.638465404510498, "global_step": 43712, "epoch": 1040} {"train_loss": -5.692896842956543, "global_step": 43713, "epoch": 1040} {"train_loss": -5.692157745361328, "global_step": 43714, "epoch": 1040} {"train_loss": -5.7333831787109375, "global_step": 43715, "epoch": 1040} {"train_loss": -5.681729316711426, "global_step": 43716, "epoch": 1040} {"train_loss": -5.622164249420166, "global_step": 43717, "epoch": 1040} {"train_loss": -5.660882472991943, "global_step": 43718, "epoch": 1040} {"train_loss": -5.563518047332764, "global_step": 43719, "epoch": 1040} {"train_loss": -5.674709320068359, "global_step": 43720, "epoch": 1040} {"train_loss": -5.669643595105126, "global_step": 43721, "epoch": 1040, "val_loss": 61978.2265625} {"train_loss": -5.691716194152832, "global_step": 43722, "epoch": 1041} {"train_loss": -5.702389240264893, "global_step": 43723, "epoch": 1041} {"train_loss": -5.729235649108887, "global_step": 43724, "epoch": 1041} {"train_loss": -5.6012067794799805, "global_step": 43725, "epoch": 1041} {"train_loss": -5.667083263397217, "global_step": 43726, "epoch": 1041} {"train_loss": -5.648697853088379, "global_step": 43727, "epoch": 1041} {"train_loss": -5.674259185791016, "global_step": 43728, "epoch": 1041} {"train_loss": -5.624825477600098, "global_step": 43729, "epoch": 1041} {"train_loss": -5.678984642028809, "global_step": 43730, "epoch": 1041} {"train_loss": -5.781989097595215, "global_step": 43731, "epoch": 1041} {"train_loss": -5.609324932098389, "global_step": 43732, "epoch": 1041} {"train_loss": -5.694667816162109, "global_step": 43733, "epoch": 1041} {"train_loss": -5.700014114379883, "global_step": 43734, "epoch": 1041} {"train_loss": -5.604966163635254, "global_step": 43735, "epoch": 1041} {"train_loss": -5.738653659820557, "global_step": 43736, "epoch": 1041} {"train_loss": -5.7462873458862305, "global_step": 43737, "epoch": 1041} {"train_loss": -5.731003761291504, "global_step": 43738, "epoch": 1041} {"train_loss": -5.745633125305176, "global_step": 43739, "epoch": 1041} {"train_loss": -5.640558242797852, "global_step": 43740, "epoch": 1041} {"train_loss": -5.727489471435547, "global_step": 43741, "epoch": 1041} {"train_loss": -5.765719413757324, "global_step": 43742, "epoch": 1041} {"train_loss": -5.618916034698486, "global_step": 43743, "epoch": 1041} {"train_loss": -5.735564231872559, "global_step": 43744, "epoch": 1041} {"train_loss": -5.790838241577148, "global_step": 43745, "epoch": 1041} {"train_loss": -5.753846168518066, "global_step": 43746, "epoch": 1041} {"train_loss": -5.839193344116211, "global_step": 43747, "epoch": 1041} {"train_loss": -5.696719169616699, "global_step": 43748, "epoch": 1041} {"train_loss": -5.722455024719238, "global_step": 43749, "epoch": 1041} {"train_loss": -5.713109016418457, "global_step": 43750, "epoch": 1041} {"train_loss": -5.742852687835693, "global_step": 43751, "epoch": 1041} {"train_loss": -5.744555950164795, "global_step": 43752, "epoch": 1041} {"train_loss": -5.700639247894287, "global_step": 43753, "epoch": 1041} {"train_loss": -5.6640424728393555, "global_step": 43754, "epoch": 1041} {"train_loss": -5.7898054122924805, "global_step": 43755, "epoch": 1041} {"train_loss": -5.706441879272461, "global_step": 43756, "epoch": 1041} {"train_loss": -5.570070266723633, "global_step": 43757, "epoch": 1041} {"train_loss": -5.712241172790527, "global_step": 43758, "epoch": 1041} {"train_loss": -5.629678249359131, "global_step": 43759, "epoch": 1041} {"train_loss": -5.617861747741699, "global_step": 43760, "epoch": 1041} {"train_loss": -5.657017707824707, "global_step": 43761, "epoch": 1041} {"train_loss": -5.61937141418457, "global_step": 43762, "epoch": 1041} {"train_loss": -5.695330540339152, "global_step": 43763, "epoch": 1041, "val_loss": 61563.37890625} {"train_loss": -5.725871562957764, "global_step": 43764, "epoch": 1042} {"train_loss": -5.679656028747559, "global_step": 43765, "epoch": 1042} {"train_loss": -5.595588684082031, "global_step": 43766, "epoch": 1042} {"train_loss": -5.747228622436523, "global_step": 43767, "epoch": 1042} {"train_loss": -5.734766960144043, "global_step": 43768, "epoch": 1042} {"train_loss": -5.679071426391602, "global_step": 43769, "epoch": 1042} {"train_loss": -5.571175575256348, "global_step": 43770, "epoch": 1042} {"train_loss": -5.721717834472656, "global_step": 43771, "epoch": 1042} {"train_loss": -5.741156578063965, "global_step": 43772, "epoch": 1042} {"train_loss": -5.747868061065674, "global_step": 43773, "epoch": 1042} {"train_loss": -5.661628723144531, "global_step": 43774, "epoch": 1042} {"train_loss": -5.815094947814941, "global_step": 43775, "epoch": 1042} {"train_loss": -5.660406112670898, "global_step": 43776, "epoch": 1042} {"train_loss": -5.605393409729004, "global_step": 43777, "epoch": 1042} {"train_loss": -5.626032829284668, "global_step": 43778, "epoch": 1042} {"train_loss": -5.761858940124512, "global_step": 43779, "epoch": 1042} {"train_loss": -5.655719757080078, "global_step": 43780, "epoch": 1042} {"train_loss": -5.826037406921387, "global_step": 43781, "epoch": 1042} {"train_loss": -5.705387115478516, "global_step": 43782, "epoch": 1042} {"train_loss": -5.697381019592285, "global_step": 43783, "epoch": 1042} {"train_loss": -5.639677047729492, "global_step": 43784, "epoch": 1042} {"train_loss": -5.709441184997559, "global_step": 43785, "epoch": 1042} {"train_loss": -5.641763687133789, "global_step": 43786, "epoch": 1042} {"train_loss": -5.695792198181152, "global_step": 43787, "epoch": 1042} {"train_loss": -5.826791763305664, "global_step": 43788, "epoch": 1042} {"train_loss": -5.71909761428833, "global_step": 43789, "epoch": 1042} {"train_loss": -5.690783500671387, "global_step": 43790, "epoch": 1042} {"train_loss": -5.743539810180664, "global_step": 43791, "epoch": 1042} {"train_loss": -5.770387172698975, "global_step": 43792, "epoch": 1042} {"train_loss": -5.757780075073242, "global_step": 43793, "epoch": 1042} {"train_loss": -5.672776699066162, "global_step": 43794, "epoch": 1042} {"train_loss": -5.620269775390625, "global_step": 43795, "epoch": 1042} {"train_loss": -5.701990127563477, "global_step": 43796, "epoch": 1042} {"train_loss": -5.717160224914551, "global_step": 43797, "epoch": 1042} {"train_loss": -5.642073631286621, "global_step": 43798, "epoch": 1042} {"train_loss": -5.801962852478027, "global_step": 43799, "epoch": 1042} {"train_loss": -5.62385892868042, "global_step": 43800, "epoch": 1042} {"train_loss": -5.6532206535339355, "global_step": 43801, "epoch": 1042} {"train_loss": -5.713068008422852, "global_step": 43802, "epoch": 1042} {"train_loss": -5.626264572143555, "global_step": 43803, "epoch": 1042} {"train_loss": -5.680395126342773, "global_step": 43804, "epoch": 1042} {"train_loss": -5.698371274130685, "global_step": 43805, "epoch": 1042, "val_loss": 61563.98046875} {"train_loss": -5.79977560043335, "global_step": 43806, "epoch": 1043} {"train_loss": -5.677620887756348, "global_step": 43807, "epoch": 1043} {"train_loss": -5.656863212585449, "global_step": 43808, "epoch": 1043} {"train_loss": -5.670838832855225, "global_step": 43809, "epoch": 1043} {"train_loss": -5.662825584411621, "global_step": 43810, "epoch": 1043} {"train_loss": -5.543134689331055, "global_step": 43811, "epoch": 1043} {"train_loss": -5.65431547164917, "global_step": 43812, "epoch": 1043} {"train_loss": -5.727781295776367, "global_step": 43813, "epoch": 1043} {"train_loss": -5.743950843811035, "global_step": 43814, "epoch": 1043} {"train_loss": -5.734995365142822, "global_step": 43815, "epoch": 1043} {"train_loss": -5.646791458129883, "global_step": 43816, "epoch": 1043} {"train_loss": -5.777850151062012, "global_step": 43817, "epoch": 1043} {"train_loss": -5.714700698852539, "global_step": 43818, "epoch": 1043} {"train_loss": -5.767057418823242, "global_step": 43819, "epoch": 1043} {"train_loss": -5.752164840698242, "global_step": 43820, "epoch": 1043} {"train_loss": -5.592529296875, "global_step": 43821, "epoch": 1043} {"train_loss": -5.697658061981201, "global_step": 43822, "epoch": 1043} {"train_loss": -5.6775593757629395, "global_step": 43823, "epoch": 1043} {"train_loss": -5.709287643432617, "global_step": 43824, "epoch": 1043} {"train_loss": -5.550496578216553, "global_step": 43825, "epoch": 1043} {"train_loss": -5.544600486755371, "global_step": 43826, "epoch": 1043} {"train_loss": -5.702597618103027, "global_step": 43827, "epoch": 1043} {"train_loss": -5.692569732666016, "global_step": 43828, "epoch": 1043} {"train_loss": -5.723010063171387, "global_step": 43829, "epoch": 1043} {"train_loss": -5.790859699249268, "global_step": 43830, "epoch": 1043} {"train_loss": -5.629598617553711, "global_step": 43831, "epoch": 1043} {"train_loss": -5.529183387756348, "global_step": 43832, "epoch": 1043} {"train_loss": -5.71917200088501, "global_step": 43833, "epoch": 1043} {"train_loss": -5.641828536987305, "global_step": 43834, "epoch": 1043} {"train_loss": -5.708286285400391, "global_step": 43835, "epoch": 1043} {"train_loss": -5.522559642791748, "global_step": 43836, "epoch": 1043} {"train_loss": -5.675539016723633, "global_step": 43837, "epoch": 1043} {"train_loss": -5.490049839019775, "global_step": 43838, "epoch": 1043} {"train_loss": -5.542993545532227, "global_step": 43839, "epoch": 1043} {"train_loss": -5.743035316467285, "global_step": 43840, "epoch": 1043} {"train_loss": -5.707066535949707, "global_step": 43841, "epoch": 1043} {"train_loss": -5.7497382164001465, "global_step": 43842, "epoch": 1043} {"train_loss": -5.772202491760254, "global_step": 43843, "epoch": 1043} {"train_loss": -5.757854461669922, "global_step": 43844, "epoch": 1043} {"train_loss": -5.7015485763549805, "global_step": 43845, "epoch": 1043} {"train_loss": -5.759995460510254, "global_step": 43846, "epoch": 1043} {"train_loss": -5.680050861267817, "global_step": 43847, "epoch": 1043, "val_loss": 61732.09375} {"train_loss": -5.676700592041016, "global_step": 43848, "epoch": 1044} {"train_loss": -5.794527053833008, "global_step": 43849, "epoch": 1044} {"train_loss": -5.603206634521484, "global_step": 43850, "epoch": 1044} {"train_loss": -5.684836387634277, "global_step": 43851, "epoch": 1044} {"train_loss": -5.762851238250732, "global_step": 43852, "epoch": 1044} {"train_loss": -5.625313758850098, "global_step": 43853, "epoch": 1044} {"train_loss": -5.718254089355469, "global_step": 43854, "epoch": 1044} {"train_loss": -5.659060001373291, "global_step": 43855, "epoch": 1044} {"train_loss": -5.6994948387146, "global_step": 43856, "epoch": 1044} {"train_loss": -5.693346977233887, "global_step": 43857, "epoch": 1044} {"train_loss": -5.584922790527344, "global_step": 43858, "epoch": 1044} {"train_loss": -5.81669807434082, "global_step": 43859, "epoch": 1044} {"train_loss": -5.693856239318848, "global_step": 43860, "epoch": 1044} {"train_loss": -5.736965179443359, "global_step": 43861, "epoch": 1044} {"train_loss": -5.716962814331055, "global_step": 43862, "epoch": 1044} {"train_loss": -5.570400714874268, "global_step": 43863, "epoch": 1044} {"train_loss": -5.720213890075684, "global_step": 43864, "epoch": 1044} {"train_loss": -5.791189670562744, "global_step": 43865, "epoch": 1044} {"train_loss": -5.653656959533691, "global_step": 43866, "epoch": 1044} {"train_loss": -5.736751079559326, "global_step": 43867, "epoch": 1044} {"train_loss": -5.630666255950928, "global_step": 43868, "epoch": 1044} {"train_loss": -5.662171363830566, "global_step": 43869, "epoch": 1044} {"train_loss": -5.705635070800781, "global_step": 43870, "epoch": 1044} {"train_loss": -5.700194358825684, "global_step": 43871, "epoch": 1044} {"train_loss": -5.742659568786621, "global_step": 43872, "epoch": 1044} {"train_loss": -5.7226057052612305, "global_step": 43873, "epoch": 1044} {"train_loss": -5.611615180969238, "global_step": 43874, "epoch": 1044} {"train_loss": -5.631186008453369, "global_step": 43875, "epoch": 1044} {"train_loss": -5.671176910400391, "global_step": 43876, "epoch": 1044} {"train_loss": -5.661317825317383, "global_step": 43877, "epoch": 1044} {"train_loss": -5.7387285232543945, "global_step": 43878, "epoch": 1044} {"train_loss": -5.758625030517578, "global_step": 43879, "epoch": 1044} {"train_loss": -5.626651763916016, "global_step": 43880, "epoch": 1044} {"train_loss": -5.751125812530518, "global_step": 43881, "epoch": 1044} {"train_loss": -5.707213401794434, "global_step": 43882, "epoch": 1044} {"train_loss": -5.582513332366943, "global_step": 43883, "epoch": 1044} {"train_loss": -5.709104537963867, "global_step": 43884, "epoch": 1044} {"train_loss": -5.596814155578613, "global_step": 43885, "epoch": 1044} {"train_loss": -5.644484519958496, "global_step": 43886, "epoch": 1044} {"train_loss": -5.732997894287109, "global_step": 43887, "epoch": 1044} {"train_loss": -5.708911895751953, "global_step": 43888, "epoch": 1044} {"train_loss": -5.688718966075352, "global_step": 43889, "epoch": 1044, "val_loss": 61668.64453125} {"train_loss": -5.651663303375244, "global_step": 43890, "epoch": 1045} {"train_loss": -5.668441295623779, "global_step": 43891, "epoch": 1045} {"train_loss": -5.848141670227051, "global_step": 43892, "epoch": 1045} {"train_loss": -5.748119831085205, "global_step": 43893, "epoch": 1045} {"train_loss": -5.663222312927246, "global_step": 43894, "epoch": 1045} {"train_loss": -5.706369876861572, "global_step": 43895, "epoch": 1045} {"train_loss": -5.70274019241333, "global_step": 43896, "epoch": 1045} {"train_loss": -5.729714870452881, "global_step": 43897, "epoch": 1045} {"train_loss": -5.690482139587402, "global_step": 43898, "epoch": 1045} {"train_loss": -5.733720302581787, "global_step": 43899, "epoch": 1045} {"train_loss": -5.648965835571289, "global_step": 43900, "epoch": 1045} {"train_loss": -5.693192958831787, "global_step": 43901, "epoch": 1045} {"train_loss": -5.572157859802246, "global_step": 43902, "epoch": 1045} {"train_loss": -5.553912162780762, "global_step": 43903, "epoch": 1045} {"train_loss": -5.803043842315674, "global_step": 43904, "epoch": 1045} {"train_loss": -5.529759883880615, "global_step": 43905, "epoch": 1045} {"train_loss": -5.596261024475098, "global_step": 43906, "epoch": 1045} {"train_loss": -5.60709285736084, "global_step": 43907, "epoch": 1045} {"train_loss": -5.653500556945801, "global_step": 43908, "epoch": 1045} {"train_loss": -5.656436443328857, "global_step": 43909, "epoch": 1045} {"train_loss": -5.5488739013671875, "global_step": 43910, "epoch": 1045} {"train_loss": -5.680035591125488, "global_step": 43911, "epoch": 1045} {"train_loss": -5.588886260986328, "global_step": 43912, "epoch": 1045} {"train_loss": -5.610073566436768, "global_step": 43913, "epoch": 1045} {"train_loss": -5.528854846954346, "global_step": 43914, "epoch": 1045} {"train_loss": -5.671482086181641, "global_step": 43915, "epoch": 1045} {"train_loss": -5.675165176391602, "global_step": 43916, "epoch": 1045} {"train_loss": -5.718708038330078, "global_step": 43917, "epoch": 1045} {"train_loss": -5.484517574310303, "global_step": 43918, "epoch": 1045} {"train_loss": -5.678194046020508, "global_step": 43919, "epoch": 1045} {"train_loss": -5.610357761383057, "global_step": 43920, "epoch": 1045} {"train_loss": -5.608182907104492, "global_step": 43921, "epoch": 1045} {"train_loss": -5.671102523803711, "global_step": 43922, "epoch": 1045} {"train_loss": -5.655559539794922, "global_step": 43923, "epoch": 1045} {"train_loss": -5.673365592956543, "global_step": 43924, "epoch": 1045} {"train_loss": -5.652921199798584, "global_step": 43925, "epoch": 1045} {"train_loss": -5.597355842590332, "global_step": 43926, "epoch": 1045} {"train_loss": -5.742495059967041, "global_step": 43927, "epoch": 1045} {"train_loss": -5.653556823730469, "global_step": 43928, "epoch": 1045} {"train_loss": -5.76286506652832, "global_step": 43929, "epoch": 1045} {"train_loss": -5.582740783691406, "global_step": 43930, "epoch": 1045} {"train_loss": -5.658099390211559, "global_step": 43931, "epoch": 1045, "val_loss": 61511.1171875} {"train_loss": -5.739435195922852, "global_step": 43932, "epoch": 1046} {"train_loss": -5.704615592956543, "global_step": 43933, "epoch": 1046} {"train_loss": -5.596479415893555, "global_step": 43934, "epoch": 1046} {"train_loss": -5.7187299728393555, "global_step": 43935, "epoch": 1046} {"train_loss": -5.678014278411865, "global_step": 43936, "epoch": 1046} {"train_loss": -5.658013343811035, "global_step": 43937, "epoch": 1046} {"train_loss": -5.720346450805664, "global_step": 43938, "epoch": 1046} {"train_loss": -5.5328288078308105, "global_step": 43939, "epoch": 1046} {"train_loss": -5.697995185852051, "global_step": 43940, "epoch": 1046} {"train_loss": -5.624367713928223, "global_step": 43941, "epoch": 1046} {"train_loss": -5.610421180725098, "global_step": 43942, "epoch": 1046} {"train_loss": -5.525455474853516, "global_step": 43943, "epoch": 1046} {"train_loss": -5.6722636222839355, "global_step": 43944, "epoch": 1046} {"train_loss": -5.523868560791016, "global_step": 43945, "epoch": 1046} {"train_loss": -5.767453670501709, "global_step": 43946, "epoch": 1046} {"train_loss": -5.650590896606445, "global_step": 43947, "epoch": 1046} {"train_loss": -5.649954795837402, "global_step": 43948, "epoch": 1046} {"train_loss": -5.731905937194824, "global_step": 43949, "epoch": 1046} {"train_loss": -5.7063517570495605, "global_step": 43950, "epoch": 1046} {"train_loss": -5.779500961303711, "global_step": 43951, "epoch": 1046} {"train_loss": -5.694504737854004, "global_step": 43952, "epoch": 1046} {"train_loss": -5.6682305335998535, "global_step": 43953, "epoch": 1046} {"train_loss": -5.743912220001221, "global_step": 43954, "epoch": 1046} {"train_loss": -5.654123306274414, "global_step": 43955, "epoch": 1046} {"train_loss": -5.6744561195373535, "global_step": 43956, "epoch": 1046} {"train_loss": -5.7566633224487305, "global_step": 43957, "epoch": 1046} {"train_loss": -5.710563659667969, "global_step": 43958, "epoch": 1046} {"train_loss": -5.544667720794678, "global_step": 43959, "epoch": 1046} {"train_loss": -5.656683921813965, "global_step": 43960, "epoch": 1046} {"train_loss": -5.517942428588867, "global_step": 43961, "epoch": 1046} {"train_loss": -5.650369644165039, "global_step": 43962, "epoch": 1046} {"train_loss": -5.603085517883301, "global_step": 43963, "epoch": 1046} {"train_loss": -5.777179718017578, "global_step": 43964, "epoch": 1046} {"train_loss": -5.685516357421875, "global_step": 43965, "epoch": 1046} {"train_loss": -5.67193078994751, "global_step": 43966, "epoch": 1046} {"train_loss": -5.705377578735352, "global_step": 43967, "epoch": 1046} {"train_loss": -5.702995300292969, "global_step": 43968, "epoch": 1046} {"train_loss": -5.547503471374512, "global_step": 43969, "epoch": 1046} {"train_loss": -5.743636131286621, "global_step": 43970, "epoch": 1046} {"train_loss": -5.574054718017578, "global_step": 43971, "epoch": 1046} {"train_loss": -5.695585250854492, "global_step": 43972, "epoch": 1046} {"train_loss": -5.66696454229809, "global_step": 43973, "epoch": 1046, "val_loss": 61924.93359375} {"train_loss": -5.476967811584473, "global_step": 43974, "epoch": 1047} {"train_loss": -5.366910934448242, "global_step": 43975, "epoch": 1047} {"train_loss": -5.693829536437988, "global_step": 43976, "epoch": 1047} {"train_loss": -5.5670485496521, "global_step": 43977, "epoch": 1047} {"train_loss": -5.56329870223999, "global_step": 43978, "epoch": 1047} {"train_loss": -5.627145767211914, "global_step": 43979, "epoch": 1047} {"train_loss": -5.487252712249756, "global_step": 43980, "epoch": 1047} {"train_loss": -5.594619274139404, "global_step": 43981, "epoch": 1047} {"train_loss": -5.642256259918213, "global_step": 43982, "epoch": 1047} {"train_loss": -5.693545341491699, "global_step": 43983, "epoch": 1047} {"train_loss": -5.697689533233643, "global_step": 43984, "epoch": 1047} {"train_loss": -5.650074005126953, "global_step": 43985, "epoch": 1047} {"train_loss": -5.563038349151611, "global_step": 43986, "epoch": 1047} {"train_loss": -5.790748119354248, "global_step": 43987, "epoch": 1047} {"train_loss": -5.747671127319336, "global_step": 43988, "epoch": 1047} {"train_loss": -5.564606189727783, "global_step": 43989, "epoch": 1047} {"train_loss": -5.659942626953125, "global_step": 43990, "epoch": 1047} {"train_loss": -5.797847747802734, "global_step": 43991, "epoch": 1047} {"train_loss": -5.767707824707031, "global_step": 43992, "epoch": 1047} {"train_loss": -5.703347206115723, "global_step": 43993, "epoch": 1047} {"train_loss": -5.732608795166016, "global_step": 43994, "epoch": 1047} {"train_loss": -5.703787803649902, "global_step": 43995, "epoch": 1047} {"train_loss": -5.614462852478027, "global_step": 43996, "epoch": 1047} {"train_loss": -5.788968086242676, "global_step": 43997, "epoch": 1047} {"train_loss": -5.771300315856934, "global_step": 43998, "epoch": 1047} {"train_loss": -5.736289024353027, "global_step": 43999, "epoch": 1047} {"train_loss": -5.732064247131348, "global_step": 44000, "epoch": 1047} {"train_loss": -5.636519908905029, "global_step": 44001, "epoch": 1047} {"train_loss": -5.7131452560424805, "global_step": 44002, "epoch": 1047} {"train_loss": -5.597702980041504, "global_step": 44003, "epoch": 1047} {"train_loss": -5.635746002197266, "global_step": 44004, "epoch": 1047} {"train_loss": -5.8172736167907715, "global_step": 44005, "epoch": 1047} {"train_loss": -5.815282344818115, "global_step": 44006, "epoch": 1047} {"train_loss": -5.728766441345215, "global_step": 44007, "epoch": 1047} {"train_loss": -5.627010822296143, "global_step": 44008, "epoch": 1047} {"train_loss": -5.762545108795166, "global_step": 44009, "epoch": 1047} {"train_loss": -5.6890459060668945, "global_step": 44010, "epoch": 1047} {"train_loss": -5.712719440460205, "global_step": 44011, "epoch": 1047} {"train_loss": -5.794170379638672, "global_step": 44012, "epoch": 1047} {"train_loss": -5.693734169006348, "global_step": 44013, "epoch": 1047} {"train_loss": -5.7425360679626465, "global_step": 44014, "epoch": 1047} {"train_loss": -5.6774963310786655, "global_step": 44015, "epoch": 1047, "val_loss": 61545.25390625} {"train_loss": -5.83074426651001, "global_step": 44016, "epoch": 1048} {"train_loss": -5.712616920471191, "global_step": 44017, "epoch": 1048} {"train_loss": -5.693778991699219, "global_step": 44018, "epoch": 1048} {"train_loss": -5.685715675354004, "global_step": 44019, "epoch": 1048} {"train_loss": -5.672050952911377, "global_step": 44020, "epoch": 1048} {"train_loss": -5.736676216125488, "global_step": 44021, "epoch": 1048} {"train_loss": -5.750133514404297, "global_step": 44022, "epoch": 1048} {"train_loss": -5.733821868896484, "global_step": 44023, "epoch": 1048} {"train_loss": -5.659511566162109, "global_step": 44024, "epoch": 1048} {"train_loss": -5.738247394561768, "global_step": 44025, "epoch": 1048} {"train_loss": -5.753662109375, "global_step": 44026, "epoch": 1048} {"train_loss": -5.7591705322265625, "global_step": 44027, "epoch": 1048} {"train_loss": -5.660274028778076, "global_step": 44028, "epoch": 1048} {"train_loss": -5.79345178604126, "global_step": 44029, "epoch": 1048} {"train_loss": -5.574995040893555, "global_step": 44030, "epoch": 1048} {"train_loss": -5.641117095947266, "global_step": 44031, "epoch": 1048} {"train_loss": -5.6390838623046875, "global_step": 44032, "epoch": 1048} {"train_loss": -5.75208854675293, "global_step": 44033, "epoch": 1048} {"train_loss": -5.64234733581543, "global_step": 44034, "epoch": 1048} {"train_loss": -5.72728157043457, "global_step": 44035, "epoch": 1048} {"train_loss": -5.659873008728027, "global_step": 44036, "epoch": 1048} {"train_loss": -5.840945243835449, "global_step": 44037, "epoch": 1048} {"train_loss": -5.628551959991455, "global_step": 44038, "epoch": 1048} {"train_loss": -5.74688196182251, "global_step": 44039, "epoch": 1048} {"train_loss": -5.794147968292236, "global_step": 44040, "epoch": 1048} {"train_loss": -5.687912940979004, "global_step": 44041, "epoch": 1048} {"train_loss": -5.763344764709473, "global_step": 44042, "epoch": 1048} {"train_loss": -5.599209308624268, "global_step": 44043, "epoch": 1048} {"train_loss": -5.74413537979126, "global_step": 44044, "epoch": 1048} {"train_loss": -5.655495643615723, "global_step": 44045, "epoch": 1048} {"train_loss": -5.726421356201172, "global_step": 44046, "epoch": 1048} {"train_loss": -5.648594856262207, "global_step": 44047, "epoch": 1048} {"train_loss": -5.5258026123046875, "global_step": 44048, "epoch": 1048} {"train_loss": -5.701503753662109, "global_step": 44049, "epoch": 1048} {"train_loss": -5.792889595031738, "global_step": 44050, "epoch": 1048} {"train_loss": -5.743501663208008, "global_step": 44051, "epoch": 1048} {"train_loss": -5.806880950927734, "global_step": 44052, "epoch": 1048} {"train_loss": -5.650835037231445, "global_step": 44053, "epoch": 1048} {"train_loss": -5.603304386138916, "global_step": 44054, "epoch": 1048} {"train_loss": -5.7333879470825195, "global_step": 44055, "epoch": 1048} {"train_loss": -5.846624374389648, "global_step": 44056, "epoch": 1048} {"train_loss": -5.710904075985863, "global_step": 44057, "epoch": 1048, "val_loss": 61344.2265625} {"train_loss": -5.619847297668457, "global_step": 44058, "epoch": 1049} {"train_loss": -5.780911445617676, "global_step": 44059, "epoch": 1049} {"train_loss": -5.677166938781738, "global_step": 44060, "epoch": 1049} {"train_loss": -5.646998405456543, "global_step": 44061, "epoch": 1049} {"train_loss": -5.753849983215332, "global_step": 44062, "epoch": 1049} {"train_loss": -5.706812381744385, "global_step": 44063, "epoch": 1049} {"train_loss": -5.604936599731445, "global_step": 44064, "epoch": 1049} {"train_loss": -5.712187767028809, "global_step": 44065, "epoch": 1049} {"train_loss": -5.688304424285889, "global_step": 44066, "epoch": 1049} {"train_loss": -5.665541648864746, "global_step": 44067, "epoch": 1049} {"train_loss": -5.5949625968933105, "global_step": 44068, "epoch": 1049} {"train_loss": -5.646200656890869, "global_step": 44069, "epoch": 1049} {"train_loss": -5.673983573913574, "global_step": 44070, "epoch": 1049} {"train_loss": -5.6102094650268555, "global_step": 44071, "epoch": 1049} {"train_loss": -5.712550163269043, "global_step": 44072, "epoch": 1049} {"train_loss": -5.4838547706604, "global_step": 44073, "epoch": 1049} {"train_loss": -5.748695373535156, "global_step": 44074, "epoch": 1049} {"train_loss": -5.547769546508789, "global_step": 44075, "epoch": 1049} {"train_loss": -5.620776653289795, "global_step": 44076, "epoch": 1049} {"train_loss": -5.7677717208862305, "global_step": 44077, "epoch": 1049} {"train_loss": -5.643311500549316, "global_step": 44078, "epoch": 1049} {"train_loss": -5.718991279602051, "global_step": 44079, "epoch": 1049} {"train_loss": -5.793300628662109, "global_step": 44080, "epoch": 1049} {"train_loss": -5.642394065856934, "global_step": 44081, "epoch": 1049} {"train_loss": -5.683123588562012, "global_step": 44082, "epoch": 1049} {"train_loss": -5.636260986328125, "global_step": 44083, "epoch": 1049} {"train_loss": -5.755152702331543, "global_step": 44084, "epoch": 1049} {"train_loss": -5.692843437194824, "global_step": 44085, "epoch": 1049} {"train_loss": -5.747432231903076, "global_step": 44086, "epoch": 1049} {"train_loss": -5.701033592224121, "global_step": 44087, "epoch": 1049} {"train_loss": -5.729037761688232, "global_step": 44088, "epoch": 1049} {"train_loss": -5.646320343017578, "global_step": 44089, "epoch": 1049} {"train_loss": -5.634101867675781, "global_step": 44090, "epoch": 1049} {"train_loss": -5.733682632446289, "global_step": 44091, "epoch": 1049} {"train_loss": -5.6534528732299805, "global_step": 44092, "epoch": 1049} {"train_loss": -5.658224105834961, "global_step": 44093, "epoch": 1049} {"train_loss": -5.630419731140137, "global_step": 44094, "epoch": 1049} {"train_loss": -5.724582195281982, "global_step": 44095, "epoch": 1049} {"train_loss": -5.6839919090271, "global_step": 44096, "epoch": 1049} {"train_loss": -5.716540336608887, "global_step": 44097, "epoch": 1049} {"train_loss": -5.658097267150879, "global_step": 44098, "epoch": 1049} {"train_loss": -5.674571934200468, "global_step": 44099, "epoch": 1049, "val_loss": 61595.84375} {"train_loss": -5.738212585449219, "global_step": 44100, "epoch": 1050} {"train_loss": -5.829848766326904, "global_step": 44101, "epoch": 1050} {"train_loss": -5.709795951843262, "global_step": 44102, "epoch": 1050} {"train_loss": -5.578530788421631, "global_step": 44103, "epoch": 1050} {"train_loss": -5.642797470092773, "global_step": 44104, "epoch": 1050} {"train_loss": -5.744236946105957, "global_step": 44105, "epoch": 1050} {"train_loss": -5.665005683898926, "global_step": 44106, "epoch": 1050} {"train_loss": -5.645633220672607, "global_step": 44107, "epoch": 1050} {"train_loss": -5.65379524230957, "global_step": 44108, "epoch": 1050} {"train_loss": -5.721263885498047, "global_step": 44109, "epoch": 1050} {"train_loss": -5.695793151855469, "global_step": 44110, "epoch": 1050} {"train_loss": -5.60377311706543, "global_step": 44111, "epoch": 1050} {"train_loss": -5.830260276794434, "global_step": 44112, "epoch": 1050} {"train_loss": -5.731808185577393, "global_step": 44113, "epoch": 1050} {"train_loss": -5.697896957397461, "global_step": 44114, "epoch": 1050} {"train_loss": -5.66835880279541, "global_step": 44115, "epoch": 1050} {"train_loss": -5.6528120040893555, "global_step": 44116, "epoch": 1050} {"train_loss": -5.872899532318115, "global_step": 44117, "epoch": 1050} {"train_loss": -5.666998863220215, "global_step": 44118, "epoch": 1050} {"train_loss": -5.690879821777344, "global_step": 44119, "epoch": 1050} {"train_loss": -5.729947090148926, "global_step": 44120, "epoch": 1050} {"train_loss": -5.641139030456543, "global_step": 44121, "epoch": 1050} {"train_loss": -5.666749000549316, "global_step": 44122, "epoch": 1050} {"train_loss": -5.507714748382568, "global_step": 44123, "epoch": 1050} {"train_loss": -5.65113639831543, "global_step": 44124, "epoch": 1050} {"train_loss": -5.631171226501465, "global_step": 44125, "epoch": 1050} {"train_loss": -5.702888011932373, "global_step": 44126, "epoch": 1050} {"train_loss": -5.587115287780762, "global_step": 44127, "epoch": 1050} {"train_loss": -5.696368217468262, "global_step": 44128, "epoch": 1050} {"train_loss": -5.69536018371582, "global_step": 44129, "epoch": 1050} {"train_loss": -5.7444610595703125, "global_step": 44130, "epoch": 1050} {"train_loss": -5.7811126708984375, "global_step": 44131, "epoch": 1050} {"train_loss": -5.714548110961914, "global_step": 44132, "epoch": 1050} {"train_loss": -5.641804218292236, "global_step": 44133, "epoch": 1050} {"train_loss": -5.738468647003174, "global_step": 44134, "epoch": 1050} {"train_loss": -5.628490447998047, "global_step": 44135, "epoch": 1050} {"train_loss": -5.70947265625, "global_step": 44136, "epoch": 1050} {"train_loss": -5.702254295349121, "global_step": 44137, "epoch": 1050} {"train_loss": -5.716302394866943, "global_step": 44138, "epoch": 1050} {"train_loss": -5.736324310302734, "global_step": 44139, "epoch": 1050} {"train_loss": -5.6095075607299805, "global_step": 44140, "epoch": 1050} {"train_loss": -5.687122742335002, "global_step": 44141, "epoch": 1050, "train/sim_max_reward_0": 0.1904064994813591, "train/sim_max_reward_1": 0.631352698062567, "train/sim_max_reward_2": 0.9150773197158604, "train/sim_max_reward_3": 0.5283967930075023, "train/sim_max_reward_4": 0.4865655627795202, "train/sim_max_reward_5": 0.19377497836788746, "test/sim_max_reward_4300000": 0.6767629504965222, "test/sim_max_reward_4300001": 0.1392156003268838, "test/sim_max_reward_4300002": 0.17403636649123597, "test/sim_max_reward_4300003": 0.9235537972679481, "test/sim_max_reward_4300004": 0.8446870076208067, "test/sim_max_reward_4300005": 0.7264574814253039, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3682342431310898, "test/sim_max_reward_4300008": 0.3529054310648043, "test/sim_max_reward_4300009": 0.4237879664873801, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.5756050780568701, "test/sim_max_reward_4300012": 0.92654611199431, "test/sim_max_reward_4300013": 0.3087005263470075, "test/sim_max_reward_4300014": 0.8000685603758548, "test/sim_max_reward_4300015": 0.4434244614857055, "test/sim_max_reward_4300016": 0.8511412059122327, "test/sim_max_reward_4300017": 0.5282061519542097, "test/sim_max_reward_4300018": 0.4514520529795256, "test/sim_max_reward_4300019": 0.18604780150252817, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.277852775107679, "test/sim_max_reward_4300022": 0.23093573431536363, "test/sim_max_reward_4300023": 0.34289655777470185, "test/sim_max_reward_4300024": 0.13817250073330564, "test/sim_max_reward_4300025": 0.9735324498825121, "test/sim_max_reward_4300026": 0.1377390175862662, "test/sim_max_reward_4300027": 0.738819210138778, "test/sim_max_reward_4300028": 0.005199555853560879, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.19818305229730476, "test/sim_max_reward_4300032": 0.6500873155696837, "test/sim_max_reward_4300033": 0.5668339818943339, "test/sim_max_reward_4300034": 0.18690448603781157, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.21168443987319124, "test/sim_max_reward_4300037": 0.7461674915644321, "test/sim_max_reward_4300038": 0.4448770784732612, "test/sim_max_reward_4300039": 0.6769955921608907, "test/sim_max_reward_4300040": 0.7896053862049045, "test/sim_max_reward_4300041": 0.23847892381614288, "test/sim_max_reward_4300042": 0.8214484969075189, "test/sim_max_reward_4300043": 0.11081873082262934, "test/sim_max_reward_4300044": 0.753150360402435, "test/sim_max_reward_4300045": 0.1794431984630625, "test/sim_max_reward_4300046": 0.5224611075163853, "test/sim_max_reward_4300047": 0.10789957637054805, "test/sim_max_reward_4300048": 0.48163292551799936, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.49092897523578266, "test/mean_score": 0.4046530548040984, "val_loss": 61746.546875} {"train_loss": -5.644042015075684, "global_step": 44142, "epoch": 1051} {"train_loss": -5.661373138427734, "global_step": 44143, "epoch": 1051} {"train_loss": -5.608591556549072, "global_step": 44144, "epoch": 1051} {"train_loss": -5.717844486236572, "global_step": 44145, "epoch": 1051} {"train_loss": -5.529506683349609, "global_step": 44146, "epoch": 1051} {"train_loss": -5.673995494842529, "global_step": 44147, "epoch": 1051} {"train_loss": -5.632303237915039, "global_step": 44148, "epoch": 1051} {"train_loss": -5.555987358093262, "global_step": 44149, "epoch": 1051} {"train_loss": -5.541373252868652, "global_step": 44150, "epoch": 1051} {"train_loss": -5.673774719238281, "global_step": 44151, "epoch": 1051} {"train_loss": -5.645110607147217, "global_step": 44152, "epoch": 1051} {"train_loss": -5.633892059326172, "global_step": 44153, "epoch": 1051} {"train_loss": -5.672144889831543, "global_step": 44154, "epoch": 1051} {"train_loss": -5.604207515716553, "global_step": 44155, "epoch": 1051} {"train_loss": -5.727250099182129, "global_step": 44156, "epoch": 1051} {"train_loss": -5.5323262214660645, "global_step": 44157, "epoch": 1051} {"train_loss": -5.694207668304443, "global_step": 44158, "epoch": 1051} {"train_loss": -5.6103363037109375, "global_step": 44159, "epoch": 1051} {"train_loss": -5.7030534744262695, "global_step": 44160, "epoch": 1051} {"train_loss": -5.651565074920654, "global_step": 44161, "epoch": 1051} {"train_loss": -5.7110795974731445, "global_step": 44162, "epoch": 1051} {"train_loss": -5.716147422790527, "global_step": 44163, "epoch": 1051} {"train_loss": -5.643136501312256, "global_step": 44164, "epoch": 1051} {"train_loss": -5.597680568695068, "global_step": 44165, "epoch": 1051} {"train_loss": -5.603570461273193, "global_step": 44166, "epoch": 1051} {"train_loss": -5.577859878540039, "global_step": 44167, "epoch": 1051} {"train_loss": -5.654747009277344, "global_step": 44168, "epoch": 1051} {"train_loss": -5.732665061950684, "global_step": 44169, "epoch": 1051} {"train_loss": -5.660155773162842, "global_step": 44170, "epoch": 1051} {"train_loss": -5.631597518920898, "global_step": 44171, "epoch": 1051} {"train_loss": -5.661434650421143, "global_step": 44172, "epoch": 1051} {"train_loss": -5.758004665374756, "global_step": 44173, "epoch": 1051} {"train_loss": -5.752304553985596, "global_step": 44174, "epoch": 1051} {"train_loss": -5.743651390075684, "global_step": 44175, "epoch": 1051} {"train_loss": -5.711687088012695, "global_step": 44176, "epoch": 1051} {"train_loss": -5.7253265380859375, "global_step": 44177, "epoch": 1051} {"train_loss": -5.596916198730469, "global_step": 44178, "epoch": 1051} {"train_loss": -5.731706619262695, "global_step": 44179, "epoch": 1051} {"train_loss": -5.777684211730957, "global_step": 44180, "epoch": 1051} {"train_loss": -5.6114726066589355, "global_step": 44181, "epoch": 1051} {"train_loss": -5.734502792358398, "global_step": 44182, "epoch": 1051} {"train_loss": -5.659897702080863, "global_step": 44183, "epoch": 1051, "val_loss": 61464.2421875} {"train_loss": -5.698107719421387, "global_step": 44184, "epoch": 1052} {"train_loss": -5.7901082038879395, "global_step": 44185, "epoch": 1052} {"train_loss": -5.713682174682617, "global_step": 44186, "epoch": 1052} {"train_loss": -5.62888240814209, "global_step": 44187, "epoch": 1052} {"train_loss": -5.624032020568848, "global_step": 44188, "epoch": 1052} {"train_loss": -5.762596130371094, "global_step": 44189, "epoch": 1052} {"train_loss": -5.690522193908691, "global_step": 44190, "epoch": 1052} {"train_loss": -5.726958751678467, "global_step": 44191, "epoch": 1052} {"train_loss": -5.850028991699219, "global_step": 44192, "epoch": 1052} {"train_loss": -5.660852909088135, "global_step": 44193, "epoch": 1052} {"train_loss": -5.632444381713867, "global_step": 44194, "epoch": 1052} {"train_loss": -5.736910820007324, "global_step": 44195, "epoch": 1052} {"train_loss": -5.641504287719727, "global_step": 44196, "epoch": 1052} {"train_loss": -5.533876419067383, "global_step": 44197, "epoch": 1052} {"train_loss": -5.706227779388428, "global_step": 44198, "epoch": 1052} {"train_loss": -5.599366664886475, "global_step": 44199, "epoch": 1052} {"train_loss": -5.720081806182861, "global_step": 44200, "epoch": 1052} {"train_loss": -5.589908599853516, "global_step": 44201, "epoch": 1052} {"train_loss": -5.684831142425537, "global_step": 44202, "epoch": 1052} {"train_loss": -5.699075698852539, "global_step": 44203, "epoch": 1052} {"train_loss": -5.623247146606445, "global_step": 44204, "epoch": 1052} {"train_loss": -5.6116485595703125, "global_step": 44205, "epoch": 1052} {"train_loss": -5.69968318939209, "global_step": 44206, "epoch": 1052} {"train_loss": -5.694884300231934, "global_step": 44207, "epoch": 1052} {"train_loss": -5.682921409606934, "global_step": 44208, "epoch": 1052} {"train_loss": -5.736833572387695, "global_step": 44209, "epoch": 1052} {"train_loss": -5.711761951446533, "global_step": 44210, "epoch": 1052} {"train_loss": -5.677098274230957, "global_step": 44211, "epoch": 1052} {"train_loss": -5.826342582702637, "global_step": 44212, "epoch": 1052} {"train_loss": -5.624963760375977, "global_step": 44213, "epoch": 1052} {"train_loss": -5.633103370666504, "global_step": 44214, "epoch": 1052} {"train_loss": -5.598973751068115, "global_step": 44215, "epoch": 1052} {"train_loss": -5.6586809158325195, "global_step": 44216, "epoch": 1052} {"train_loss": -5.652192115783691, "global_step": 44217, "epoch": 1052} {"train_loss": -5.80492639541626, "global_step": 44218, "epoch": 1052} {"train_loss": -5.751523971557617, "global_step": 44219, "epoch": 1052} {"train_loss": -5.710587501525879, "global_step": 44220, "epoch": 1052} {"train_loss": -5.728263854980469, "global_step": 44221, "epoch": 1052} {"train_loss": -5.676805019378662, "global_step": 44222, "epoch": 1052} {"train_loss": -5.606215476989746, "global_step": 44223, "epoch": 1052} {"train_loss": -5.595834732055664, "global_step": 44224, "epoch": 1052} {"train_loss": -5.68267780258542, "global_step": 44225, "epoch": 1052, "val_loss": 61798.734375} {"train_loss": -5.817928791046143, "global_step": 44226, "epoch": 1053} {"train_loss": -5.596580505371094, "global_step": 44227, "epoch": 1053} {"train_loss": -5.593324661254883, "global_step": 44228, "epoch": 1053} {"train_loss": -5.73674201965332, "global_step": 44229, "epoch": 1053} {"train_loss": -5.736885070800781, "global_step": 44230, "epoch": 1053} {"train_loss": -5.535470008850098, "global_step": 44231, "epoch": 1053} {"train_loss": -5.74395751953125, "global_step": 44232, "epoch": 1053} {"train_loss": -5.531440734863281, "global_step": 44233, "epoch": 1053} {"train_loss": -5.660431385040283, "global_step": 44234, "epoch": 1053} {"train_loss": -5.690217018127441, "global_step": 44235, "epoch": 1053} {"train_loss": -5.634563446044922, "global_step": 44236, "epoch": 1053} {"train_loss": -5.662023067474365, "global_step": 44237, "epoch": 1053} {"train_loss": -5.700850009918213, "global_step": 44238, "epoch": 1053} {"train_loss": -5.581447601318359, "global_step": 44239, "epoch": 1053} {"train_loss": -5.655483245849609, "global_step": 44240, "epoch": 1053} {"train_loss": -5.718319416046143, "global_step": 44241, "epoch": 1053} {"train_loss": -5.587040901184082, "global_step": 44242, "epoch": 1053} {"train_loss": -5.7316155433654785, "global_step": 44243, "epoch": 1053} {"train_loss": -5.595983505249023, "global_step": 44244, "epoch": 1053} {"train_loss": -5.551034927368164, "global_step": 44245, "epoch": 1053} {"train_loss": -5.554267406463623, "global_step": 44246, "epoch": 1053} {"train_loss": -5.577107906341553, "global_step": 44247, "epoch": 1053} {"train_loss": -5.690510272979736, "global_step": 44248, "epoch": 1053} {"train_loss": -5.557178497314453, "global_step": 44249, "epoch": 1053} {"train_loss": -5.744379997253418, "global_step": 44250, "epoch": 1053} {"train_loss": -5.517827987670898, "global_step": 44251, "epoch": 1053} {"train_loss": -5.619195938110352, "global_step": 44252, "epoch": 1053} {"train_loss": -5.782619476318359, "global_step": 44253, "epoch": 1053} {"train_loss": -5.659411430358887, "global_step": 44254, "epoch": 1053} {"train_loss": -5.810604095458984, "global_step": 44255, "epoch": 1053} {"train_loss": -5.785247802734375, "global_step": 44256, "epoch": 1053} {"train_loss": -5.624666213989258, "global_step": 44257, "epoch": 1053} {"train_loss": -5.664027214050293, "global_step": 44258, "epoch": 1053} {"train_loss": -5.511940002441406, "global_step": 44259, "epoch": 1053} {"train_loss": -5.701689720153809, "global_step": 44260, "epoch": 1053} {"train_loss": -5.792078018188477, "global_step": 44261, "epoch": 1053} {"train_loss": -5.668280601501465, "global_step": 44262, "epoch": 1053} {"train_loss": -5.700557708740234, "global_step": 44263, "epoch": 1053} {"train_loss": -5.735178470611572, "global_step": 44264, "epoch": 1053} {"train_loss": -5.742262363433838, "global_step": 44265, "epoch": 1053} {"train_loss": -5.797271728515625, "global_step": 44266, "epoch": 1053} {"train_loss": -5.665404387882778, "global_step": 44267, "epoch": 1053, "val_loss": 61479.87890625} {"train_loss": -5.718724250793457, "global_step": 44268, "epoch": 1054} {"train_loss": -5.603023052215576, "global_step": 44269, "epoch": 1054} {"train_loss": -5.716245651245117, "global_step": 44270, "epoch": 1054} {"train_loss": -5.711299419403076, "global_step": 44271, "epoch": 1054} {"train_loss": -5.797451496124268, "global_step": 44272, "epoch": 1054} {"train_loss": -5.720502853393555, "global_step": 44273, "epoch": 1054} {"train_loss": -5.70775842666626, "global_step": 44274, "epoch": 1054} {"train_loss": -5.853402614593506, "global_step": 44275, "epoch": 1054} {"train_loss": -5.792832374572754, "global_step": 44276, "epoch": 1054} {"train_loss": -5.638411521911621, "global_step": 44277, "epoch": 1054} {"train_loss": -5.641397476196289, "global_step": 44278, "epoch": 1054} {"train_loss": -5.753383636474609, "global_step": 44279, "epoch": 1054} {"train_loss": -5.728864669799805, "global_step": 44280, "epoch": 1054} {"train_loss": -5.707991600036621, "global_step": 44281, "epoch": 1054} {"train_loss": -5.657042980194092, "global_step": 44282, "epoch": 1054} {"train_loss": -5.667757034301758, "global_step": 44283, "epoch": 1054} {"train_loss": -5.714725017547607, "global_step": 44284, "epoch": 1054} {"train_loss": -5.5560526847839355, "global_step": 44285, "epoch": 1054} {"train_loss": -5.682363986968994, "global_step": 44286, "epoch": 1054} {"train_loss": -5.60581111907959, "global_step": 44287, "epoch": 1054} {"train_loss": -5.559041500091553, "global_step": 44288, "epoch": 1054} {"train_loss": -5.671916961669922, "global_step": 44289, "epoch": 1054} {"train_loss": -5.754437446594238, "global_step": 44290, "epoch": 1054} {"train_loss": -5.715524673461914, "global_step": 44291, "epoch": 1054} {"train_loss": -5.69099235534668, "global_step": 44292, "epoch": 1054} {"train_loss": -5.551911354064941, "global_step": 44293, "epoch": 1054} {"train_loss": -5.903077602386475, "global_step": 44294, "epoch": 1054} {"train_loss": -5.58853816986084, "global_step": 44295, "epoch": 1054} {"train_loss": -5.628700256347656, "global_step": 44296, "epoch": 1054} {"train_loss": -5.596672058105469, "global_step": 44297, "epoch": 1054} {"train_loss": -5.669806480407715, "global_step": 44298, "epoch": 1054} {"train_loss": -5.697772979736328, "global_step": 44299, "epoch": 1054} {"train_loss": -5.735633850097656, "global_step": 44300, "epoch": 1054} {"train_loss": -5.61468505859375, "global_step": 44301, "epoch": 1054} {"train_loss": -5.654468536376953, "global_step": 44302, "epoch": 1054} {"train_loss": -5.669949531555176, "global_step": 44303, "epoch": 1054} {"train_loss": -5.724529266357422, "global_step": 44304, "epoch": 1054} {"train_loss": -5.607534408569336, "global_step": 44305, "epoch": 1054} {"train_loss": -5.88581657409668, "global_step": 44306, "epoch": 1054} {"train_loss": -5.803827285766602, "global_step": 44307, "epoch": 1054} {"train_loss": -5.672791481018066, "global_step": 44308, "epoch": 1054} {"train_loss": -5.693551676613944, "global_step": 44309, "epoch": 1054, "val_loss": 61382.79296875} {"train_loss": -5.735605239868164, "global_step": 44310, "epoch": 1055} {"train_loss": -5.727376461029053, "global_step": 44311, "epoch": 1055} {"train_loss": -5.788148880004883, "global_step": 44312, "epoch": 1055} {"train_loss": -5.67041015625, "global_step": 44313, "epoch": 1055} {"train_loss": -5.67631721496582, "global_step": 44314, "epoch": 1055} {"train_loss": -5.803853511810303, "global_step": 44315, "epoch": 1055} {"train_loss": -5.61348295211792, "global_step": 44316, "epoch": 1055} {"train_loss": -5.753443717956543, "global_step": 44317, "epoch": 1055} {"train_loss": -5.733636379241943, "global_step": 44318, "epoch": 1055} {"train_loss": -5.709430694580078, "global_step": 44319, "epoch": 1055} {"train_loss": -5.790097236633301, "global_step": 44320, "epoch": 1055} {"train_loss": -5.65631103515625, "global_step": 44321, "epoch": 1055} {"train_loss": -5.793188571929932, "global_step": 44322, "epoch": 1055} {"train_loss": -5.558526515960693, "global_step": 44323, "epoch": 1055} {"train_loss": -5.563919544219971, "global_step": 44324, "epoch": 1055} {"train_loss": -5.688546180725098, "global_step": 44325, "epoch": 1055} {"train_loss": -5.636098384857178, "global_step": 44326, "epoch": 1055} {"train_loss": -5.646467208862305, "global_step": 44327, "epoch": 1055} {"train_loss": -5.7993268966674805, "global_step": 44328, "epoch": 1055} {"train_loss": -5.600274562835693, "global_step": 44329, "epoch": 1055} {"train_loss": -5.667884826660156, "global_step": 44330, "epoch": 1055} {"train_loss": -5.63273811340332, "global_step": 44331, "epoch": 1055} {"train_loss": -5.810215473175049, "global_step": 44332, "epoch": 1055} {"train_loss": -5.673596382141113, "global_step": 44333, "epoch": 1055} {"train_loss": -5.566671848297119, "global_step": 44334, "epoch": 1055} {"train_loss": -5.7691755294799805, "global_step": 44335, "epoch": 1055} {"train_loss": -5.716982841491699, "global_step": 44336, "epoch": 1055} {"train_loss": -5.760733604431152, "global_step": 44337, "epoch": 1055} {"train_loss": -5.683829307556152, "global_step": 44338, "epoch": 1055} {"train_loss": -5.700709819793701, "global_step": 44339, "epoch": 1055} {"train_loss": -5.74076509475708, "global_step": 44340, "epoch": 1055} {"train_loss": -5.711129188537598, "global_step": 44341, "epoch": 1055} {"train_loss": -5.736934661865234, "global_step": 44342, "epoch": 1055} {"train_loss": -5.600564002990723, "global_step": 44343, "epoch": 1055} {"train_loss": -5.644100189208984, "global_step": 44344, "epoch": 1055} {"train_loss": -5.756532192230225, "global_step": 44345, "epoch": 1055} {"train_loss": -5.645458221435547, "global_step": 44346, "epoch": 1055} {"train_loss": -5.74383020401001, "global_step": 44347, "epoch": 1055} {"train_loss": -5.669830799102783, "global_step": 44348, "epoch": 1055} {"train_loss": -5.712367057800293, "global_step": 44349, "epoch": 1055} {"train_loss": -5.766793251037598, "global_step": 44350, "epoch": 1055} {"train_loss": -5.697156974247524, "global_step": 44351, "epoch": 1055, "val_loss": 61729.91015625} {"train_loss": -5.675485134124756, "global_step": 44352, "epoch": 1056} {"train_loss": -5.598400115966797, "global_step": 44353, "epoch": 1056} {"train_loss": -5.828364372253418, "global_step": 44354, "epoch": 1056} {"train_loss": -5.723814487457275, "global_step": 44355, "epoch": 1056} {"train_loss": -5.647823333740234, "global_step": 44356, "epoch": 1056} {"train_loss": -5.714506149291992, "global_step": 44357, "epoch": 1056} {"train_loss": -5.610697269439697, "global_step": 44358, "epoch": 1056} {"train_loss": -5.70546817779541, "global_step": 44359, "epoch": 1056} {"train_loss": -5.657464027404785, "global_step": 44360, "epoch": 1056} {"train_loss": -5.673191070556641, "global_step": 44361, "epoch": 1056} {"train_loss": -5.608632564544678, "global_step": 44362, "epoch": 1056} {"train_loss": -5.750522613525391, "global_step": 44363, "epoch": 1056} {"train_loss": -5.62013053894043, "global_step": 44364, "epoch": 1056} {"train_loss": -5.876959800720215, "global_step": 44365, "epoch": 1056} {"train_loss": -5.6663713455200195, "global_step": 44366, "epoch": 1056} {"train_loss": -5.750343322753906, "global_step": 44367, "epoch": 1056} {"train_loss": -5.708127021789551, "global_step": 44368, "epoch": 1056} {"train_loss": -5.680885314941406, "global_step": 44369, "epoch": 1056} {"train_loss": -5.753174781799316, "global_step": 44370, "epoch": 1056} {"train_loss": -5.616781234741211, "global_step": 44371, "epoch": 1056} {"train_loss": -5.711121559143066, "global_step": 44372, "epoch": 1056} {"train_loss": -5.7671732902526855, "global_step": 44373, "epoch": 1056} {"train_loss": -5.772436141967773, "global_step": 44374, "epoch": 1056} {"train_loss": -5.807285308837891, "global_step": 44375, "epoch": 1056} {"train_loss": -5.750161647796631, "global_step": 44376, "epoch": 1056} {"train_loss": -5.749307632446289, "global_step": 44377, "epoch": 1056} {"train_loss": -5.775264739990234, "global_step": 44378, "epoch": 1056} {"train_loss": -5.682603359222412, "global_step": 44379, "epoch": 1056} {"train_loss": -5.678854942321777, "global_step": 44380, "epoch": 1056} {"train_loss": -5.767301082611084, "global_step": 44381, "epoch": 1056} {"train_loss": -5.668347358703613, "global_step": 44382, "epoch": 1056} {"train_loss": -5.713169097900391, "global_step": 44383, "epoch": 1056} {"train_loss": -5.747889518737793, "global_step": 44384, "epoch": 1056} {"train_loss": -5.5136518478393555, "global_step": 44385, "epoch": 1056} {"train_loss": -5.641631126403809, "global_step": 44386, "epoch": 1056} {"train_loss": -5.606328964233398, "global_step": 44387, "epoch": 1056} {"train_loss": -5.488303184509277, "global_step": 44388, "epoch": 1056} {"train_loss": -5.70244026184082, "global_step": 44389, "epoch": 1056} {"train_loss": -5.729353904724121, "global_step": 44390, "epoch": 1056} {"train_loss": -5.620040416717529, "global_step": 44391, "epoch": 1056} {"train_loss": -5.510841369628906, "global_step": 44392, "epoch": 1056} {"train_loss": -5.6854856468382335, "global_step": 44393, "epoch": 1056, "val_loss": 61822.72265625} {"train_loss": -5.564708709716797, "global_step": 44394, "epoch": 1057} {"train_loss": -5.656774520874023, "global_step": 44395, "epoch": 1057} {"train_loss": -5.561251163482666, "global_step": 44396, "epoch": 1057} {"train_loss": -5.814548492431641, "global_step": 44397, "epoch": 1057} {"train_loss": -5.532782077789307, "global_step": 44398, "epoch": 1057} {"train_loss": -5.646757125854492, "global_step": 44399, "epoch": 1057} {"train_loss": -5.648743152618408, "global_step": 44400, "epoch": 1057} {"train_loss": -5.694344520568848, "global_step": 44401, "epoch": 1057} {"train_loss": -5.582111835479736, "global_step": 44402, "epoch": 1057} {"train_loss": -5.688358306884766, "global_step": 44403, "epoch": 1057} {"train_loss": -5.803649425506592, "global_step": 44404, "epoch": 1057} {"train_loss": -5.526137828826904, "global_step": 44405, "epoch": 1057} {"train_loss": -5.705646514892578, "global_step": 44406, "epoch": 1057} {"train_loss": -5.656991958618164, "global_step": 44407, "epoch": 1057} {"train_loss": -5.6944260597229, "global_step": 44408, "epoch": 1057} {"train_loss": -5.790726661682129, "global_step": 44409, "epoch": 1057} {"train_loss": -5.635385513305664, "global_step": 44410, "epoch": 1057} {"train_loss": -5.7394304275512695, "global_step": 44411, "epoch": 1057} {"train_loss": -5.69572114944458, "global_step": 44412, "epoch": 1057} {"train_loss": -5.646633148193359, "global_step": 44413, "epoch": 1057} {"train_loss": -5.6833038330078125, "global_step": 44414, "epoch": 1057} {"train_loss": -5.7411932945251465, "global_step": 44415, "epoch": 1057} {"train_loss": -5.670021057128906, "global_step": 44416, "epoch": 1057} {"train_loss": -5.7934699058532715, "global_step": 44417, "epoch": 1057} {"train_loss": -5.7888102531433105, "global_step": 44418, "epoch": 1057} {"train_loss": -5.713958263397217, "global_step": 44419, "epoch": 1057} {"train_loss": -5.708228588104248, "global_step": 44420, "epoch": 1057} {"train_loss": -5.595441818237305, "global_step": 44421, "epoch": 1057} {"train_loss": -5.546402454376221, "global_step": 44422, "epoch": 1057} {"train_loss": -5.581158638000488, "global_step": 44423, "epoch": 1057} {"train_loss": -5.6720781326293945, "global_step": 44424, "epoch": 1057} {"train_loss": -5.574203014373779, "global_step": 44425, "epoch": 1057} {"train_loss": -5.687372207641602, "global_step": 44426, "epoch": 1057} {"train_loss": -5.654412269592285, "global_step": 44427, "epoch": 1057} {"train_loss": -5.7257843017578125, "global_step": 44428, "epoch": 1057} {"train_loss": -5.7517595291137695, "global_step": 44429, "epoch": 1057} {"train_loss": -5.714211463928223, "global_step": 44430, "epoch": 1057} {"train_loss": -5.523800849914551, "global_step": 44431, "epoch": 1057} {"train_loss": -5.792868137359619, "global_step": 44432, "epoch": 1057} {"train_loss": -5.650174140930176, "global_step": 44433, "epoch": 1057} {"train_loss": -5.568452835083008, "global_step": 44434, "epoch": 1057} {"train_loss": -5.6727409022195, "global_step": 44435, "epoch": 1057, "val_loss": 61767.97265625} {"train_loss": -5.754367828369141, "global_step": 44436, "epoch": 1058} {"train_loss": -5.81382417678833, "global_step": 44437, "epoch": 1058} {"train_loss": -5.6969099044799805, "global_step": 44438, "epoch": 1058} {"train_loss": -5.68326473236084, "global_step": 44439, "epoch": 1058} {"train_loss": -5.655320167541504, "global_step": 44440, "epoch": 1058} {"train_loss": -5.67691707611084, "global_step": 44441, "epoch": 1058} {"train_loss": -5.740853309631348, "global_step": 44442, "epoch": 1058} {"train_loss": -5.664506435394287, "global_step": 44443, "epoch": 1058} {"train_loss": -5.762070178985596, "global_step": 44444, "epoch": 1058} {"train_loss": -5.7012763023376465, "global_step": 44445, "epoch": 1058} {"train_loss": -5.704421520233154, "global_step": 44446, "epoch": 1058} {"train_loss": -5.675232887268066, "global_step": 44447, "epoch": 1058} {"train_loss": -5.688531398773193, "global_step": 44448, "epoch": 1058} {"train_loss": -5.743099212646484, "global_step": 44449, "epoch": 1058} {"train_loss": -5.767818450927734, "global_step": 44450, "epoch": 1058} {"train_loss": -5.836067199707031, "global_step": 44451, "epoch": 1058} {"train_loss": -5.685764312744141, "global_step": 44452, "epoch": 1058} {"train_loss": -5.603862285614014, "global_step": 44453, "epoch": 1058} {"train_loss": -5.680331707000732, "global_step": 44454, "epoch": 1058} {"train_loss": -5.724700927734375, "global_step": 44455, "epoch": 1058} {"train_loss": -5.769892692565918, "global_step": 44456, "epoch": 1058} {"train_loss": -5.78809928894043, "global_step": 44457, "epoch": 1058} {"train_loss": -5.692151069641113, "global_step": 44458, "epoch": 1058} {"train_loss": -5.593406677246094, "global_step": 44459, "epoch": 1058} {"train_loss": -5.766475200653076, "global_step": 44460, "epoch": 1058} {"train_loss": -5.675118446350098, "global_step": 44461, "epoch": 1058} {"train_loss": -5.579279899597168, "global_step": 44462, "epoch": 1058} {"train_loss": -5.723925590515137, "global_step": 44463, "epoch": 1058} {"train_loss": -5.705070495605469, "global_step": 44464, "epoch": 1058} {"train_loss": -5.683602809906006, "global_step": 44465, "epoch": 1058} {"train_loss": -5.6506428718566895, "global_step": 44466, "epoch": 1058} {"train_loss": -5.685697078704834, "global_step": 44467, "epoch": 1058} {"train_loss": -5.7556657791137695, "global_step": 44468, "epoch": 1058} {"train_loss": -5.710409641265869, "global_step": 44469, "epoch": 1058} {"train_loss": -5.676811218261719, "global_step": 44470, "epoch": 1058} {"train_loss": -5.794666290283203, "global_step": 44471, "epoch": 1058} {"train_loss": -5.699397563934326, "global_step": 44472, "epoch": 1058} {"train_loss": -5.774529457092285, "global_step": 44473, "epoch": 1058} {"train_loss": -5.867703437805176, "global_step": 44474, "epoch": 1058} {"train_loss": -5.6549506187438965, "global_step": 44475, "epoch": 1058} {"train_loss": -5.640409469604492, "global_step": 44476, "epoch": 1058} {"train_loss": -5.710408517292568, "global_step": 44477, "epoch": 1058, "val_loss": 61766.08984375} {"train_loss": -5.7453532218933105, "global_step": 44478, "epoch": 1059} {"train_loss": -5.534890174865723, "global_step": 44479, "epoch": 1059} {"train_loss": -5.686633110046387, "global_step": 44480, "epoch": 1059} {"train_loss": -5.640552043914795, "global_step": 44481, "epoch": 1059} {"train_loss": -5.654365062713623, "global_step": 44482, "epoch": 1059} {"train_loss": -5.813127040863037, "global_step": 44483, "epoch": 1059} {"train_loss": -5.633050441741943, "global_step": 44484, "epoch": 1059} {"train_loss": -5.6925272941589355, "global_step": 44485, "epoch": 1059} {"train_loss": -5.700449466705322, "global_step": 44486, "epoch": 1059} {"train_loss": -5.651930809020996, "global_step": 44487, "epoch": 1059} {"train_loss": -5.6216559410095215, "global_step": 44488, "epoch": 1059} {"train_loss": -5.5711870193481445, "global_step": 44489, "epoch": 1059} {"train_loss": -5.696683883666992, "global_step": 44490, "epoch": 1059} {"train_loss": -5.7394914627075195, "global_step": 44491, "epoch": 1059} {"train_loss": -5.574528694152832, "global_step": 44492, "epoch": 1059} {"train_loss": -5.672235488891602, "global_step": 44493, "epoch": 1059} {"train_loss": -5.656745433807373, "global_step": 44494, "epoch": 1059} {"train_loss": -5.623951435089111, "global_step": 44495, "epoch": 1059} {"train_loss": -5.670248031616211, "global_step": 44496, "epoch": 1059} {"train_loss": -5.70513916015625, "global_step": 44497, "epoch": 1059} {"train_loss": -5.777992248535156, "global_step": 44498, "epoch": 1059} {"train_loss": -5.640408039093018, "global_step": 44499, "epoch": 1059} {"train_loss": -5.828007698059082, "global_step": 44500, "epoch": 1059} {"train_loss": -5.691561698913574, "global_step": 44501, "epoch": 1059} {"train_loss": -5.616350173950195, "global_step": 44502, "epoch": 1059} {"train_loss": -5.650032043457031, "global_step": 44503, "epoch": 1059} {"train_loss": -5.623479843139648, "global_step": 44504, "epoch": 1059} {"train_loss": -5.677099227905273, "global_step": 44505, "epoch": 1059} {"train_loss": -5.682956695556641, "global_step": 44506, "epoch": 1059} {"train_loss": -5.670036792755127, "global_step": 44507, "epoch": 1059} {"train_loss": -5.814374923706055, "global_step": 44508, "epoch": 1059} {"train_loss": -5.662372589111328, "global_step": 44509, "epoch": 1059} {"train_loss": -5.7271409034729, "global_step": 44510, "epoch": 1059} {"train_loss": -5.687023162841797, "global_step": 44511, "epoch": 1059} {"train_loss": -5.718659400939941, "global_step": 44512, "epoch": 1059} {"train_loss": -5.685463905334473, "global_step": 44513, "epoch": 1059} {"train_loss": -5.7647552490234375, "global_step": 44514, "epoch": 1059} {"train_loss": -5.802585601806641, "global_step": 44515, "epoch": 1059} {"train_loss": -5.837732315063477, "global_step": 44516, "epoch": 1059} {"train_loss": -5.703120231628418, "global_step": 44517, "epoch": 1059} {"train_loss": -5.745361804962158, "global_step": 44518, "epoch": 1059} {"train_loss": -5.690943082173665, "global_step": 44519, "epoch": 1059, "val_loss": 61430.34375} {"train_loss": -5.797602653503418, "global_step": 44520, "epoch": 1060} {"train_loss": -5.6627702713012695, "global_step": 44521, "epoch": 1060} {"train_loss": -5.7817583084106445, "global_step": 44522, "epoch": 1060} {"train_loss": -5.756293296813965, "global_step": 44523, "epoch": 1060} {"train_loss": -5.7050557136535645, "global_step": 44524, "epoch": 1060} {"train_loss": -5.7761616706848145, "global_step": 44525, "epoch": 1060} {"train_loss": -5.755834579467773, "global_step": 44526, "epoch": 1060} {"train_loss": -5.703525543212891, "global_step": 44527, "epoch": 1060} {"train_loss": -5.74601936340332, "global_step": 44528, "epoch": 1060} {"train_loss": -5.587526321411133, "global_step": 44529, "epoch": 1060} {"train_loss": -5.7000732421875, "global_step": 44530, "epoch": 1060} {"train_loss": -5.657413482666016, "global_step": 44531, "epoch": 1060} {"train_loss": -5.802544593811035, "global_step": 44532, "epoch": 1060} {"train_loss": -5.770415306091309, "global_step": 44533, "epoch": 1060} {"train_loss": -5.763629913330078, "global_step": 44534, "epoch": 1060} {"train_loss": -5.65667200088501, "global_step": 44535, "epoch": 1060} {"train_loss": -5.706295490264893, "global_step": 44536, "epoch": 1060} {"train_loss": -5.776494026184082, "global_step": 44537, "epoch": 1060} {"train_loss": -5.7499284744262695, "global_step": 44538, "epoch": 1060} {"train_loss": -5.700541973114014, "global_step": 44539, "epoch": 1060} {"train_loss": -5.844989776611328, "global_step": 44540, "epoch": 1060} {"train_loss": -5.785748481750488, "global_step": 44541, "epoch": 1060} {"train_loss": -5.801322937011719, "global_step": 44542, "epoch": 1060} {"train_loss": -5.563690662384033, "global_step": 44543, "epoch": 1060} {"train_loss": -5.613796234130859, "global_step": 44544, "epoch": 1060} {"train_loss": -5.732985496520996, "global_step": 44545, "epoch": 1060} {"train_loss": -5.7579169273376465, "global_step": 44546, "epoch": 1060} {"train_loss": -5.717895030975342, "global_step": 44547, "epoch": 1060} {"train_loss": -5.692056179046631, "global_step": 44548, "epoch": 1060} {"train_loss": -5.742790699005127, "global_step": 44549, "epoch": 1060} {"train_loss": -5.704990863800049, "global_step": 44550, "epoch": 1060} {"train_loss": -5.59395694732666, "global_step": 44551, "epoch": 1060} {"train_loss": -5.69325065612793, "global_step": 44552, "epoch": 1060} {"train_loss": -5.688953876495361, "global_step": 44553, "epoch": 1060} {"train_loss": -5.706357955932617, "global_step": 44554, "epoch": 1060} {"train_loss": -5.677412033081055, "global_step": 44555, "epoch": 1060} {"train_loss": -5.652550220489502, "global_step": 44556, "epoch": 1060} {"train_loss": -5.734514236450195, "global_step": 44557, "epoch": 1060} {"train_loss": -5.6670308113098145, "global_step": 44558, "epoch": 1060} {"train_loss": -5.705654144287109, "global_step": 44559, "epoch": 1060} {"train_loss": -5.633411884307861, "global_step": 44560, "epoch": 1060} {"train_loss": -5.715601080939884, "global_step": 44561, "epoch": 1060, "val_loss": 61646.0234375} {"train_loss": -5.719757080078125, "global_step": 44562, "epoch": 1061} {"train_loss": -5.599249362945557, "global_step": 44563, "epoch": 1061} {"train_loss": -5.634149551391602, "global_step": 44564, "epoch": 1061} {"train_loss": -5.753193378448486, "global_step": 44565, "epoch": 1061} {"train_loss": -5.629657745361328, "global_step": 44566, "epoch": 1061} {"train_loss": -5.536628723144531, "global_step": 44567, "epoch": 1061} {"train_loss": -5.6173224449157715, "global_step": 44568, "epoch": 1061} {"train_loss": -5.594020843505859, "global_step": 44569, "epoch": 1061} {"train_loss": -5.622485637664795, "global_step": 44570, "epoch": 1061} {"train_loss": -5.6043477058410645, "global_step": 44571, "epoch": 1061} {"train_loss": -5.792989730834961, "global_step": 44572, "epoch": 1061} {"train_loss": -5.614524841308594, "global_step": 44573, "epoch": 1061} {"train_loss": -5.660818576812744, "global_step": 44574, "epoch": 1061} {"train_loss": -5.568558692932129, "global_step": 44575, "epoch": 1061} {"train_loss": -5.720422744750977, "global_step": 44576, "epoch": 1061} {"train_loss": -5.744864463806152, "global_step": 44577, "epoch": 1061} {"train_loss": -5.5392680168151855, "global_step": 44578, "epoch": 1061} {"train_loss": -5.794466018676758, "global_step": 44579, "epoch": 1061} {"train_loss": -5.750151634216309, "global_step": 44580, "epoch": 1061} {"train_loss": -5.540116310119629, "global_step": 44581, "epoch": 1061} {"train_loss": -5.661986351013184, "global_step": 44582, "epoch": 1061} {"train_loss": -5.7200798988342285, "global_step": 44583, "epoch": 1061} {"train_loss": -5.662886619567871, "global_step": 44584, "epoch": 1061} {"train_loss": -5.678586959838867, "global_step": 44585, "epoch": 1061} {"train_loss": -5.734373092651367, "global_step": 44586, "epoch": 1061} {"train_loss": -5.658171653747559, "global_step": 44587, "epoch": 1061} {"train_loss": -5.596962928771973, "global_step": 44588, "epoch": 1061} {"train_loss": -5.673041343688965, "global_step": 44589, "epoch": 1061} {"train_loss": -5.512289047241211, "global_step": 44590, "epoch": 1061} {"train_loss": -5.726837158203125, "global_step": 44591, "epoch": 1061} {"train_loss": -5.593329429626465, "global_step": 44592, "epoch": 1061} {"train_loss": -5.818183422088623, "global_step": 44593, "epoch": 1061} {"train_loss": -5.65838623046875, "global_step": 44594, "epoch": 1061} {"train_loss": -5.680196762084961, "global_step": 44595, "epoch": 1061} {"train_loss": -5.7702131271362305, "global_step": 44596, "epoch": 1061} {"train_loss": -5.645462989807129, "global_step": 44597, "epoch": 1061} {"train_loss": -5.723092555999756, "global_step": 44598, "epoch": 1061} {"train_loss": -5.718775272369385, "global_step": 44599, "epoch": 1061} {"train_loss": -5.5733208656311035, "global_step": 44600, "epoch": 1061} {"train_loss": -5.7070136070251465, "global_step": 44601, "epoch": 1061} {"train_loss": -5.662607192993164, "global_step": 44602, "epoch": 1061} {"train_loss": -5.664505073002407, "global_step": 44603, "epoch": 1061, "val_loss": 61517.1171875} {"train_loss": -5.719971656799316, "global_step": 44604, "epoch": 1062} {"train_loss": -5.76700496673584, "global_step": 44605, "epoch": 1062} {"train_loss": -5.689694881439209, "global_step": 44606, "epoch": 1062} {"train_loss": -5.752078056335449, "global_step": 44607, "epoch": 1062} {"train_loss": -5.656053066253662, "global_step": 44608, "epoch": 1062} {"train_loss": -5.761642932891846, "global_step": 44609, "epoch": 1062} {"train_loss": -5.708312034606934, "global_step": 44610, "epoch": 1062} {"train_loss": -5.720139503479004, "global_step": 44611, "epoch": 1062} {"train_loss": -5.6483964920043945, "global_step": 44612, "epoch": 1062} {"train_loss": -5.78571081161499, "global_step": 44613, "epoch": 1062} {"train_loss": -5.716033935546875, "global_step": 44614, "epoch": 1062} {"train_loss": -5.597801685333252, "global_step": 44615, "epoch": 1062} {"train_loss": -5.761134147644043, "global_step": 44616, "epoch": 1062} {"train_loss": -5.733608245849609, "global_step": 44617, "epoch": 1062} {"train_loss": -5.831944465637207, "global_step": 44618, "epoch": 1062} {"train_loss": -5.603032112121582, "global_step": 44619, "epoch": 1062} {"train_loss": -5.752042770385742, "global_step": 44620, "epoch": 1062} {"train_loss": -5.765809059143066, "global_step": 44621, "epoch": 1062} {"train_loss": -5.6822662353515625, "global_step": 44622, "epoch": 1062} {"train_loss": -5.722679138183594, "global_step": 44623, "epoch": 1062} {"train_loss": -5.685309410095215, "global_step": 44624, "epoch": 1062} {"train_loss": -5.700469970703125, "global_step": 44625, "epoch": 1062} {"train_loss": -5.682533264160156, "global_step": 44626, "epoch": 1062} {"train_loss": -5.527725696563721, "global_step": 44627, "epoch": 1062} {"train_loss": -5.662843227386475, "global_step": 44628, "epoch": 1062} {"train_loss": -5.6151323318481445, "global_step": 44629, "epoch": 1062} {"train_loss": -5.726312160491943, "global_step": 44630, "epoch": 1062} {"train_loss": -5.624807834625244, "global_step": 44631, "epoch": 1062} {"train_loss": -5.752466201782227, "global_step": 44632, "epoch": 1062} {"train_loss": -5.828557968139648, "global_step": 44633, "epoch": 1062} {"train_loss": -5.690916538238525, "global_step": 44634, "epoch": 1062} {"train_loss": -5.770120620727539, "global_step": 44635, "epoch": 1062} {"train_loss": -5.74638557434082, "global_step": 44636, "epoch": 1062} {"train_loss": -5.771854400634766, "global_step": 44637, "epoch": 1062} {"train_loss": -5.772377967834473, "global_step": 44638, "epoch": 1062} {"train_loss": -5.710176467895508, "global_step": 44639, "epoch": 1062} {"train_loss": -5.710758686065674, "global_step": 44640, "epoch": 1062} {"train_loss": -5.665824890136719, "global_step": 44641, "epoch": 1062} {"train_loss": -5.564226150512695, "global_step": 44642, "epoch": 1062} {"train_loss": -5.716217041015625, "global_step": 44643, "epoch": 1062} {"train_loss": -5.638309478759766, "global_step": 44644, "epoch": 1062} {"train_loss": -5.708200874782744, "global_step": 44645, "epoch": 1062, "val_loss": 61631.6640625} {"train_loss": -5.7389349937438965, "global_step": 44646, "epoch": 1063} {"train_loss": -5.693122386932373, "global_step": 44647, "epoch": 1063} {"train_loss": -5.702698707580566, "global_step": 44648, "epoch": 1063} {"train_loss": -5.737949848175049, "global_step": 44649, "epoch": 1063} {"train_loss": -5.6319379806518555, "global_step": 44650, "epoch": 1063} {"train_loss": -5.702958106994629, "global_step": 44651, "epoch": 1063} {"train_loss": -5.766988754272461, "global_step": 44652, "epoch": 1063} {"train_loss": -5.725904941558838, "global_step": 44653, "epoch": 1063} {"train_loss": -5.758595943450928, "global_step": 44654, "epoch": 1063} {"train_loss": -5.899227142333984, "global_step": 44655, "epoch": 1063} {"train_loss": -5.742859363555908, "global_step": 44656, "epoch": 1063} {"train_loss": -5.733950614929199, "global_step": 44657, "epoch": 1063} {"train_loss": -5.693587779998779, "global_step": 44658, "epoch": 1063} {"train_loss": -5.674715042114258, "global_step": 44659, "epoch": 1063} {"train_loss": -5.671302318572998, "global_step": 44660, "epoch": 1063} {"train_loss": -5.626082897186279, "global_step": 44661, "epoch": 1063} {"train_loss": -5.559147357940674, "global_step": 44662, "epoch": 1063} {"train_loss": -5.839219093322754, "global_step": 44663, "epoch": 1063} {"train_loss": -5.722830295562744, "global_step": 44664, "epoch": 1063} {"train_loss": -5.567045211791992, "global_step": 44665, "epoch": 1063} {"train_loss": -5.856117248535156, "global_step": 44666, "epoch": 1063} {"train_loss": -5.762173652648926, "global_step": 44667, "epoch": 1063} {"train_loss": -5.748741149902344, "global_step": 44668, "epoch": 1063} {"train_loss": -5.706336975097656, "global_step": 44669, "epoch": 1063} {"train_loss": -5.750302314758301, "global_step": 44670, "epoch": 1063} {"train_loss": -5.672814846038818, "global_step": 44671, "epoch": 1063} {"train_loss": -5.640417098999023, "global_step": 44672, "epoch": 1063} {"train_loss": -5.6973066329956055, "global_step": 44673, "epoch": 1063} {"train_loss": -5.8630547523498535, "global_step": 44674, "epoch": 1063} {"train_loss": -5.714605331420898, "global_step": 44675, "epoch": 1063} {"train_loss": -5.641674995422363, "global_step": 44676, "epoch": 1063} {"train_loss": -5.709249496459961, "global_step": 44677, "epoch": 1063} {"train_loss": -5.8190412521362305, "global_step": 44678, "epoch": 1063} {"train_loss": -5.707408905029297, "global_step": 44679, "epoch": 1063} {"train_loss": -5.723413944244385, "global_step": 44680, "epoch": 1063} {"train_loss": -5.548966884613037, "global_step": 44681, "epoch": 1063} {"train_loss": -5.629622936248779, "global_step": 44682, "epoch": 1063} {"train_loss": -5.653429985046387, "global_step": 44683, "epoch": 1063} {"train_loss": -5.776970386505127, "global_step": 44684, "epoch": 1063} {"train_loss": -5.681992053985596, "global_step": 44685, "epoch": 1063} {"train_loss": -5.709708213806152, "global_step": 44686, "epoch": 1063} {"train_loss": -5.7120443639301115, "global_step": 44687, "epoch": 1063, "val_loss": 61727.41015625} {"train_loss": -5.77388334274292, "global_step": 44688, "epoch": 1064} {"train_loss": -5.641629219055176, "global_step": 44689, "epoch": 1064} {"train_loss": -5.595249176025391, "global_step": 44690, "epoch": 1064} {"train_loss": -5.749554634094238, "global_step": 44691, "epoch": 1064} {"train_loss": -5.686527252197266, "global_step": 44692, "epoch": 1064} {"train_loss": -5.694113731384277, "global_step": 44693, "epoch": 1064} {"train_loss": -5.786083221435547, "global_step": 44694, "epoch": 1064} {"train_loss": -5.762362480163574, "global_step": 44695, "epoch": 1064} {"train_loss": -5.691500663757324, "global_step": 44696, "epoch": 1064} {"train_loss": -5.879540920257568, "global_step": 44697, "epoch": 1064} {"train_loss": -5.707267761230469, "global_step": 44698, "epoch": 1064} {"train_loss": -5.65336275100708, "global_step": 44699, "epoch": 1064} {"train_loss": -5.714738845825195, "global_step": 44700, "epoch": 1064} {"train_loss": -5.710336685180664, "global_step": 44701, "epoch": 1064} {"train_loss": -5.7947492599487305, "global_step": 44702, "epoch": 1064} {"train_loss": -5.770560264587402, "global_step": 44703, "epoch": 1064} {"train_loss": -5.720697402954102, "global_step": 44704, "epoch": 1064} {"train_loss": -5.662641525268555, "global_step": 44705, "epoch": 1064} {"train_loss": -5.6854400634765625, "global_step": 44706, "epoch": 1064} {"train_loss": -5.824418544769287, "global_step": 44707, "epoch": 1064} {"train_loss": -5.674506187438965, "global_step": 44708, "epoch": 1064} {"train_loss": -5.719025611877441, "global_step": 44709, "epoch": 1064} {"train_loss": -5.744817733764648, "global_step": 44710, "epoch": 1064} {"train_loss": -5.673921585083008, "global_step": 44711, "epoch": 1064} {"train_loss": -5.735739231109619, "global_step": 44712, "epoch": 1064} {"train_loss": -5.7306060791015625, "global_step": 44713, "epoch": 1064} {"train_loss": -5.700185298919678, "global_step": 44714, "epoch": 1064} {"train_loss": -5.5341691970825195, "global_step": 44715, "epoch": 1064} {"train_loss": -5.726200103759766, "global_step": 44716, "epoch": 1064} {"train_loss": -5.515277862548828, "global_step": 44717, "epoch": 1064} {"train_loss": -5.647448539733887, "global_step": 44718, "epoch": 1064} {"train_loss": -5.780301570892334, "global_step": 44719, "epoch": 1064} {"train_loss": -5.5717058181762695, "global_step": 44720, "epoch": 1064} {"train_loss": -5.633608818054199, "global_step": 44721, "epoch": 1064} {"train_loss": -5.677007675170898, "global_step": 44722, "epoch": 1064} {"train_loss": -5.65432071685791, "global_step": 44723, "epoch": 1064} {"train_loss": -5.791740417480469, "global_step": 44724, "epoch": 1064} {"train_loss": -5.658717155456543, "global_step": 44725, "epoch": 1064} {"train_loss": -5.772365093231201, "global_step": 44726, "epoch": 1064} {"train_loss": -5.641162872314453, "global_step": 44727, "epoch": 1064} {"train_loss": -5.6892876625061035, "global_step": 44728, "epoch": 1064} {"train_loss": -5.703461499441238, "global_step": 44729, "epoch": 1064, "val_loss": 61701.37109375} {"train_loss": -5.654962539672852, "global_step": 44730, "epoch": 1065} {"train_loss": -5.627820014953613, "global_step": 44731, "epoch": 1065} {"train_loss": -5.7622246742248535, "global_step": 44732, "epoch": 1065} {"train_loss": -5.646615982055664, "global_step": 44733, "epoch": 1065} {"train_loss": -5.655414581298828, "global_step": 44734, "epoch": 1065} {"train_loss": -5.754307746887207, "global_step": 44735, "epoch": 1065} {"train_loss": -5.701180458068848, "global_step": 44736, "epoch": 1065} {"train_loss": -5.7995781898498535, "global_step": 44737, "epoch": 1065} {"train_loss": -5.561037540435791, "global_step": 44738, "epoch": 1065} {"train_loss": -5.671010494232178, "global_step": 44739, "epoch": 1065} {"train_loss": -5.793024063110352, "global_step": 44740, "epoch": 1065} {"train_loss": -5.583786964416504, "global_step": 44741, "epoch": 1065} {"train_loss": -5.742394924163818, "global_step": 44742, "epoch": 1065} {"train_loss": -5.554292678833008, "global_step": 44743, "epoch": 1065} {"train_loss": -5.654852867126465, "global_step": 44744, "epoch": 1065} {"train_loss": -5.730916976928711, "global_step": 44745, "epoch": 1065} {"train_loss": -5.681739330291748, "global_step": 44746, "epoch": 1065} {"train_loss": -5.6349968910217285, "global_step": 44747, "epoch": 1065} {"train_loss": -5.787760257720947, "global_step": 44748, "epoch": 1065} {"train_loss": -5.541463851928711, "global_step": 44749, "epoch": 1065} {"train_loss": -5.636120796203613, "global_step": 44750, "epoch": 1065} {"train_loss": -5.8508076667785645, "global_step": 44751, "epoch": 1065} {"train_loss": -5.536325931549072, "global_step": 44752, "epoch": 1065} {"train_loss": -5.803339958190918, "global_step": 44753, "epoch": 1065} {"train_loss": -5.568807601928711, "global_step": 44754, "epoch": 1065} {"train_loss": -5.606942176818848, "global_step": 44755, "epoch": 1065} {"train_loss": -5.536659240722656, "global_step": 44756, "epoch": 1065} {"train_loss": -5.636056900024414, "global_step": 44757, "epoch": 1065} {"train_loss": -5.649904251098633, "global_step": 44758, "epoch": 1065} {"train_loss": -5.537378311157227, "global_step": 44759, "epoch": 1065} {"train_loss": -5.781928062438965, "global_step": 44760, "epoch": 1065} {"train_loss": -5.606444358825684, "global_step": 44761, "epoch": 1065} {"train_loss": -5.910744667053223, "global_step": 44762, "epoch": 1065} {"train_loss": -5.567333221435547, "global_step": 44763, "epoch": 1065} {"train_loss": -5.736532211303711, "global_step": 44764, "epoch": 1065} {"train_loss": -5.725635528564453, "global_step": 44765, "epoch": 1065} {"train_loss": -5.635819435119629, "global_step": 44766, "epoch": 1065} {"train_loss": -5.590883255004883, "global_step": 44767, "epoch": 1065} {"train_loss": -5.660207271575928, "global_step": 44768, "epoch": 1065} {"train_loss": -5.658367156982422, "global_step": 44769, "epoch": 1065} {"train_loss": -5.787511825561523, "global_step": 44770, "epoch": 1065} {"train_loss": -5.675974391755604, "global_step": 44771, "epoch": 1065, "val_loss": 61557.92578125} {"train_loss": -5.7699151039123535, "global_step": 44772, "epoch": 1066} {"train_loss": -5.799720287322998, "global_step": 44773, "epoch": 1066} {"train_loss": -5.76097297668457, "global_step": 44774, "epoch": 1066} {"train_loss": -5.740149974822998, "global_step": 44775, "epoch": 1066} {"train_loss": -5.773775100708008, "global_step": 44776, "epoch": 1066} {"train_loss": -5.631398677825928, "global_step": 44777, "epoch": 1066} {"train_loss": -5.630279541015625, "global_step": 44778, "epoch": 1066} {"train_loss": -5.697376728057861, "global_step": 44779, "epoch": 1066} {"train_loss": -5.651991844177246, "global_step": 44780, "epoch": 1066} {"train_loss": -5.774040699005127, "global_step": 44781, "epoch": 1066} {"train_loss": -5.704357147216797, "global_step": 44782, "epoch": 1066} {"train_loss": -5.790916919708252, "global_step": 44783, "epoch": 1066} {"train_loss": -5.786162853240967, "global_step": 44784, "epoch": 1066} {"train_loss": -5.6457061767578125, "global_step": 44785, "epoch": 1066} {"train_loss": -5.796283721923828, "global_step": 44786, "epoch": 1066} {"train_loss": -5.734872817993164, "global_step": 44787, "epoch": 1066} {"train_loss": -5.813309669494629, "global_step": 44788, "epoch": 1066} {"train_loss": -5.732111930847168, "global_step": 44789, "epoch": 1066} {"train_loss": -5.642935752868652, "global_step": 44790, "epoch": 1066} {"train_loss": -5.58137321472168, "global_step": 44791, "epoch": 1066} {"train_loss": -5.661512851715088, "global_step": 44792, "epoch": 1066} {"train_loss": -5.699312210083008, "global_step": 44793, "epoch": 1066} {"train_loss": -5.742815017700195, "global_step": 44794, "epoch": 1066} {"train_loss": -5.819207668304443, "global_step": 44795, "epoch": 1066} {"train_loss": -5.674007415771484, "global_step": 44796, "epoch": 1066} {"train_loss": -5.684276580810547, "global_step": 44797, "epoch": 1066} {"train_loss": -5.705496788024902, "global_step": 44798, "epoch": 1066} {"train_loss": -5.5680389404296875, "global_step": 44799, "epoch": 1066} {"train_loss": -5.637484550476074, "global_step": 44800, "epoch": 1066} {"train_loss": -5.666477203369141, "global_step": 44801, "epoch": 1066} {"train_loss": -5.577620506286621, "global_step": 44802, "epoch": 1066} {"train_loss": -5.820863723754883, "global_step": 44803, "epoch": 1066} {"train_loss": -5.69489860534668, "global_step": 44804, "epoch": 1066} {"train_loss": -5.572437286376953, "global_step": 44805, "epoch": 1066} {"train_loss": -5.746190071105957, "global_step": 44806, "epoch": 1066} {"train_loss": -5.629016876220703, "global_step": 44807, "epoch": 1066} {"train_loss": -5.6435065269470215, "global_step": 44808, "epoch": 1066} {"train_loss": -5.649553298950195, "global_step": 44809, "epoch": 1066} {"train_loss": -5.693211555480957, "global_step": 44810, "epoch": 1066} {"train_loss": -5.588244915008545, "global_step": 44811, "epoch": 1066} {"train_loss": -5.536332130432129, "global_step": 44812, "epoch": 1066} {"train_loss": -5.693039474033174, "global_step": 44813, "epoch": 1066, "val_loss": 61598.2734375} {"train_loss": -5.760292053222656, "global_step": 44814, "epoch": 1067} {"train_loss": -5.757669925689697, "global_step": 44815, "epoch": 1067} {"train_loss": -5.549654006958008, "global_step": 44816, "epoch": 1067} {"train_loss": -5.7353315353393555, "global_step": 44817, "epoch": 1067} {"train_loss": -5.721711158752441, "global_step": 44818, "epoch": 1067} {"train_loss": -5.726402282714844, "global_step": 44819, "epoch": 1067} {"train_loss": -5.718672752380371, "global_step": 44820, "epoch": 1067} {"train_loss": -5.785838603973389, "global_step": 44821, "epoch": 1067} {"train_loss": -5.763364315032959, "global_step": 44822, "epoch": 1067} {"train_loss": -5.754054069519043, "global_step": 44823, "epoch": 1067} {"train_loss": -5.662002086639404, "global_step": 44824, "epoch": 1067} {"train_loss": -5.763383865356445, "global_step": 44825, "epoch": 1067} {"train_loss": -5.57550048828125, "global_step": 44826, "epoch": 1067} {"train_loss": -5.674502372741699, "global_step": 44827, "epoch": 1067} {"train_loss": -5.7440690994262695, "global_step": 44828, "epoch": 1067} {"train_loss": -5.549851417541504, "global_step": 44829, "epoch": 1067} {"train_loss": -5.712836265563965, "global_step": 44830, "epoch": 1067} {"train_loss": -5.726408004760742, "global_step": 44831, "epoch": 1067} {"train_loss": -5.612812042236328, "global_step": 44832, "epoch": 1067} {"train_loss": -5.598297119140625, "global_step": 44833, "epoch": 1067} {"train_loss": -5.545869827270508, "global_step": 44834, "epoch": 1067} {"train_loss": -5.547214031219482, "global_step": 44835, "epoch": 1067} {"train_loss": -5.602887153625488, "global_step": 44836, "epoch": 1067} {"train_loss": -5.727175235748291, "global_step": 44837, "epoch": 1067} {"train_loss": -5.453268527984619, "global_step": 44838, "epoch": 1067} {"train_loss": -5.6834845542907715, "global_step": 44839, "epoch": 1067} {"train_loss": -5.659663200378418, "global_step": 44840, "epoch": 1067} {"train_loss": -5.5037102699279785, "global_step": 44841, "epoch": 1067} {"train_loss": -5.658666610717773, "global_step": 44842, "epoch": 1067} {"train_loss": -5.56430721282959, "global_step": 44843, "epoch": 1067} {"train_loss": -5.573056221008301, "global_step": 44844, "epoch": 1067} {"train_loss": -5.509363651275635, "global_step": 44845, "epoch": 1067} {"train_loss": -5.66971492767334, "global_step": 44846, "epoch": 1067} {"train_loss": -5.698681831359863, "global_step": 44847, "epoch": 1067} {"train_loss": -5.545536041259766, "global_step": 44848, "epoch": 1067} {"train_loss": -5.831939220428467, "global_step": 44849, "epoch": 1067} {"train_loss": -5.588940620422363, "global_step": 44850, "epoch": 1067} {"train_loss": -5.611083030700684, "global_step": 44851, "epoch": 1067} {"train_loss": -5.472102165222168, "global_step": 44852, "epoch": 1067} {"train_loss": -5.748942852020264, "global_step": 44853, "epoch": 1067} {"train_loss": -5.655484199523926, "global_step": 44854, "epoch": 1067} {"train_loss": -5.653378804524739, "global_step": 44855, "epoch": 1067, "val_loss": 61719.1640625} {"train_loss": -5.686152458190918, "global_step": 44856, "epoch": 1068} {"train_loss": -5.708423614501953, "global_step": 44857, "epoch": 1068} {"train_loss": -5.845705032348633, "global_step": 44858, "epoch": 1068} {"train_loss": -5.72916841506958, "global_step": 44859, "epoch": 1068} {"train_loss": -5.715019226074219, "global_step": 44860, "epoch": 1068} {"train_loss": -5.685169696807861, "global_step": 44861, "epoch": 1068} {"train_loss": -5.643062591552734, "global_step": 44862, "epoch": 1068} {"train_loss": -5.765000343322754, "global_step": 44863, "epoch": 1068} {"train_loss": -5.591974258422852, "global_step": 44864, "epoch": 1068} {"train_loss": -5.727385997772217, "global_step": 44865, "epoch": 1068} {"train_loss": -5.704787254333496, "global_step": 44866, "epoch": 1068} {"train_loss": -5.555405616760254, "global_step": 44867, "epoch": 1068} {"train_loss": -5.6695990562438965, "global_step": 44868, "epoch": 1068} {"train_loss": -5.742516994476318, "global_step": 44869, "epoch": 1068} {"train_loss": -5.6296281814575195, "global_step": 44870, "epoch": 1068} {"train_loss": -5.573276519775391, "global_step": 44871, "epoch": 1068} {"train_loss": -5.775559902191162, "global_step": 44872, "epoch": 1068} {"train_loss": -5.531354904174805, "global_step": 44873, "epoch": 1068} {"train_loss": -5.678699970245361, "global_step": 44874, "epoch": 1068} {"train_loss": -5.731513977050781, "global_step": 44875, "epoch": 1068} {"train_loss": -5.4627838134765625, "global_step": 44876, "epoch": 1068} {"train_loss": -5.76705265045166, "global_step": 44877, "epoch": 1068} {"train_loss": -5.724812030792236, "global_step": 44878, "epoch": 1068} {"train_loss": -5.706604957580566, "global_step": 44879, "epoch": 1068} {"train_loss": -5.774660110473633, "global_step": 44880, "epoch": 1068} {"train_loss": -5.729434013366699, "global_step": 44881, "epoch": 1068} {"train_loss": -5.772642612457275, "global_step": 44882, "epoch": 1068} {"train_loss": -5.758950233459473, "global_step": 44883, "epoch": 1068} {"train_loss": -5.686228275299072, "global_step": 44884, "epoch": 1068} {"train_loss": -5.803114891052246, "global_step": 44885, "epoch": 1068} {"train_loss": -5.635857105255127, "global_step": 44886, "epoch": 1068} {"train_loss": -5.878933429718018, "global_step": 44887, "epoch": 1068} {"train_loss": -5.747779846191406, "global_step": 44888, "epoch": 1068} {"train_loss": -5.773073196411133, "global_step": 44889, "epoch": 1068} {"train_loss": -5.66928768157959, "global_step": 44890, "epoch": 1068} {"train_loss": -5.576287269592285, "global_step": 44891, "epoch": 1068} {"train_loss": -5.7622222900390625, "global_step": 44892, "epoch": 1068} {"train_loss": -5.73178768157959, "global_step": 44893, "epoch": 1068} {"train_loss": -5.816332817077637, "global_step": 44894, "epoch": 1068} {"train_loss": -5.652979850769043, "global_step": 44895, "epoch": 1068} {"train_loss": -5.760280609130859, "global_step": 44896, "epoch": 1068} {"train_loss": -5.7040868032546275, "global_step": 44897, "epoch": 1068, "val_loss": 61764.046875} {"train_loss": -5.761837959289551, "global_step": 44898, "epoch": 1069} {"train_loss": -5.730436325073242, "global_step": 44899, "epoch": 1069} {"train_loss": -5.814334392547607, "global_step": 44900, "epoch": 1069} {"train_loss": -5.58944034576416, "global_step": 44901, "epoch": 1069} {"train_loss": -5.533195495605469, "global_step": 44902, "epoch": 1069} {"train_loss": -5.700377941131592, "global_step": 44903, "epoch": 1069} {"train_loss": -5.682103633880615, "global_step": 44904, "epoch": 1069} {"train_loss": -5.742495536804199, "global_step": 44905, "epoch": 1069} {"train_loss": -5.677512168884277, "global_step": 44906, "epoch": 1069} {"train_loss": -5.713098526000977, "global_step": 44907, "epoch": 1069} {"train_loss": -5.67907190322876, "global_step": 44908, "epoch": 1069} {"train_loss": -5.693874835968018, "global_step": 44909, "epoch": 1069} {"train_loss": -5.692639350891113, "global_step": 44910, "epoch": 1069} {"train_loss": -5.703907489776611, "global_step": 44911, "epoch": 1069} {"train_loss": -5.727869510650635, "global_step": 44912, "epoch": 1069} {"train_loss": -5.678869724273682, "global_step": 44913, "epoch": 1069} {"train_loss": -5.713153839111328, "global_step": 44914, "epoch": 1069} {"train_loss": -5.765851020812988, "global_step": 44915, "epoch": 1069} {"train_loss": -5.612217903137207, "global_step": 44916, "epoch": 1069} {"train_loss": -5.76439905166626, "global_step": 44917, "epoch": 1069} {"train_loss": -5.818919658660889, "global_step": 44918, "epoch": 1069} {"train_loss": -5.671202182769775, "global_step": 44919, "epoch": 1069} {"train_loss": -5.699576377868652, "global_step": 44920, "epoch": 1069} {"train_loss": -5.693619728088379, "global_step": 44921, "epoch": 1069} {"train_loss": -5.8629255294799805, "global_step": 44922, "epoch": 1069} {"train_loss": -5.7364606857299805, "global_step": 44923, "epoch": 1069} {"train_loss": -5.750107765197754, "global_step": 44924, "epoch": 1069} {"train_loss": -5.722243785858154, "global_step": 44925, "epoch": 1069} {"train_loss": -5.698387145996094, "global_step": 44926, "epoch": 1069} {"train_loss": -5.755704402923584, "global_step": 44927, "epoch": 1069} {"train_loss": -5.606581687927246, "global_step": 44928, "epoch": 1069} {"train_loss": -5.76840353012085, "global_step": 44929, "epoch": 1069} {"train_loss": -5.779157638549805, "global_step": 44930, "epoch": 1069} {"train_loss": -5.797659397125244, "global_step": 44931, "epoch": 1069} {"train_loss": -5.724864959716797, "global_step": 44932, "epoch": 1069} {"train_loss": -5.734480381011963, "global_step": 44933, "epoch": 1069} {"train_loss": -5.649928092956543, "global_step": 44934, "epoch": 1069} {"train_loss": -5.791108131408691, "global_step": 44935, "epoch": 1069} {"train_loss": -5.82772970199585, "global_step": 44936, "epoch": 1069} {"train_loss": -5.699456691741943, "global_step": 44937, "epoch": 1069} {"train_loss": -5.716748237609863, "global_step": 44938, "epoch": 1069} {"train_loss": -5.716494696480887, "global_step": 44939, "epoch": 1069, "val_loss": 61459.74609375} {"train_loss": -5.772724628448486, "global_step": 44940, "epoch": 1070} {"train_loss": -5.628339767456055, "global_step": 44941, "epoch": 1070} {"train_loss": -5.622758865356445, "global_step": 44942, "epoch": 1070} {"train_loss": -5.735355377197266, "global_step": 44943, "epoch": 1070} {"train_loss": -5.7274370193481445, "global_step": 44944, "epoch": 1070} {"train_loss": -5.692498207092285, "global_step": 44945, "epoch": 1070} {"train_loss": -5.808780670166016, "global_step": 44946, "epoch": 1070} {"train_loss": -5.762143611907959, "global_step": 44947, "epoch": 1070} {"train_loss": -5.750826835632324, "global_step": 44948, "epoch": 1070} {"train_loss": -5.7026591300964355, "global_step": 44949, "epoch": 1070} {"train_loss": -5.708831310272217, "global_step": 44950, "epoch": 1070} {"train_loss": -5.698866367340088, "global_step": 44951, "epoch": 1070} {"train_loss": -5.589718341827393, "global_step": 44952, "epoch": 1070} {"train_loss": -5.583725929260254, "global_step": 44953, "epoch": 1070} {"train_loss": -5.57274866104126, "global_step": 44954, "epoch": 1070} {"train_loss": -5.7239298820495605, "global_step": 44955, "epoch": 1070} {"train_loss": -5.742280006408691, "global_step": 44956, "epoch": 1070} {"train_loss": -5.601814270019531, "global_step": 44957, "epoch": 1070} {"train_loss": -5.714282035827637, "global_step": 44958, "epoch": 1070} {"train_loss": -5.788986682891846, "global_step": 44959, "epoch": 1070} {"train_loss": -5.624451160430908, "global_step": 44960, "epoch": 1070} {"train_loss": -5.462935924530029, "global_step": 44961, "epoch": 1070} {"train_loss": -5.664641380310059, "global_step": 44962, "epoch": 1070} {"train_loss": -5.683729648590088, "global_step": 44963, "epoch": 1070} {"train_loss": -5.608643054962158, "global_step": 44964, "epoch": 1070} {"train_loss": -5.591648578643799, "global_step": 44965, "epoch": 1070} {"train_loss": -5.797992706298828, "global_step": 44966, "epoch": 1070} {"train_loss": -5.687148094177246, "global_step": 44967, "epoch": 1070} {"train_loss": -5.753990173339844, "global_step": 44968, "epoch": 1070} {"train_loss": -5.572903633117676, "global_step": 44969, "epoch": 1070} {"train_loss": -5.751641273498535, "global_step": 44970, "epoch": 1070} {"train_loss": -5.693699836730957, "global_step": 44971, "epoch": 1070} {"train_loss": -5.700394630432129, "global_step": 44972, "epoch": 1070} {"train_loss": -5.715409278869629, "global_step": 44973, "epoch": 1070} {"train_loss": -5.4928154945373535, "global_step": 44974, "epoch": 1070} {"train_loss": -5.616972923278809, "global_step": 44975, "epoch": 1070} {"train_loss": -5.636065483093262, "global_step": 44976, "epoch": 1070} {"train_loss": -5.603628158569336, "global_step": 44977, "epoch": 1070} {"train_loss": -5.770509719848633, "global_step": 44978, "epoch": 1070} {"train_loss": -5.528186321258545, "global_step": 44979, "epoch": 1070} {"train_loss": -5.762506484985352, "global_step": 44980, "epoch": 1070} {"train_loss": -5.6779854865301225, "global_step": 44981, "epoch": 1070, "val_loss": 61789.75390625} {"train_loss": -5.607227325439453, "global_step": 44982, "epoch": 1071} {"train_loss": -5.662099838256836, "global_step": 44983, "epoch": 1071} {"train_loss": -5.700526714324951, "global_step": 44984, "epoch": 1071} {"train_loss": -5.723732948303223, "global_step": 44985, "epoch": 1071} {"train_loss": -5.786539077758789, "global_step": 44986, "epoch": 1071} {"train_loss": -5.670327186584473, "global_step": 44987, "epoch": 1071} {"train_loss": -5.696700096130371, "global_step": 44988, "epoch": 1071} {"train_loss": -5.646883964538574, "global_step": 44989, "epoch": 1071} {"train_loss": -5.641140460968018, "global_step": 44990, "epoch": 1071} {"train_loss": -5.791085243225098, "global_step": 44991, "epoch": 1071} {"train_loss": -5.589589595794678, "global_step": 44992, "epoch": 1071} {"train_loss": -5.778932571411133, "global_step": 44993, "epoch": 1071} {"train_loss": -5.732429504394531, "global_step": 44994, "epoch": 1071} {"train_loss": -5.613923072814941, "global_step": 44995, "epoch": 1071} {"train_loss": -5.728739261627197, "global_step": 44996, "epoch": 1071} {"train_loss": -5.696359634399414, "global_step": 44997, "epoch": 1071} {"train_loss": -5.7272233963012695, "global_step": 44998, "epoch": 1071} {"train_loss": -5.717233180999756, "global_step": 44999, "epoch": 1071} {"train_loss": -5.680441856384277, "global_step": 45000, "epoch": 1071} {"train_loss": -5.655569553375244, "global_step": 45001, "epoch": 1071} {"train_loss": -5.776197910308838, "global_step": 45002, "epoch": 1071} {"train_loss": -5.841880798339844, "global_step": 45003, "epoch": 1071} {"train_loss": -5.658461570739746, "global_step": 45004, "epoch": 1071} {"train_loss": -5.749289512634277, "global_step": 45005, "epoch": 1071} {"train_loss": -5.7039899826049805, "global_step": 45006, "epoch": 1071} {"train_loss": -5.716610908508301, "global_step": 45007, "epoch": 1071} {"train_loss": -5.816262722015381, "global_step": 45008, "epoch": 1071} {"train_loss": -5.7711381912231445, "global_step": 45009, "epoch": 1071} {"train_loss": -5.7896623611450195, "global_step": 45010, "epoch": 1071} {"train_loss": -5.713874340057373, "global_step": 45011, "epoch": 1071} {"train_loss": -5.6634345054626465, "global_step": 45012, "epoch": 1071} {"train_loss": -5.671998977661133, "global_step": 45013, "epoch": 1071} {"train_loss": -5.659287452697754, "global_step": 45014, "epoch": 1071} {"train_loss": -5.685805797576904, "global_step": 45015, "epoch": 1071} {"train_loss": -5.682837009429932, "global_step": 45016, "epoch": 1071} {"train_loss": -5.73688268661499, "global_step": 45017, "epoch": 1071} {"train_loss": -5.640413284301758, "global_step": 45018, "epoch": 1071} {"train_loss": -5.715405464172363, "global_step": 45019, "epoch": 1071} {"train_loss": -5.555620193481445, "global_step": 45020, "epoch": 1071} {"train_loss": -5.7460174560546875, "global_step": 45021, "epoch": 1071} {"train_loss": -5.791938781738281, "global_step": 45022, "epoch": 1071} {"train_loss": -5.702713455472674, "global_step": 45023, "epoch": 1071, "val_loss": 61734.85546875} {"train_loss": -5.597474098205566, "global_step": 45024, "epoch": 1072} {"train_loss": -5.603910446166992, "global_step": 45025, "epoch": 1072} {"train_loss": -5.656644821166992, "global_step": 45026, "epoch": 1072} {"train_loss": -5.686923980712891, "global_step": 45027, "epoch": 1072} {"train_loss": -5.818055152893066, "global_step": 45028, "epoch": 1072} {"train_loss": -5.623734951019287, "global_step": 45029, "epoch": 1072} {"train_loss": -5.73074197769165, "global_step": 45030, "epoch": 1072} {"train_loss": -5.715928077697754, "global_step": 45031, "epoch": 1072} {"train_loss": -5.732782363891602, "global_step": 45032, "epoch": 1072} {"train_loss": -5.622739315032959, "global_step": 45033, "epoch": 1072} {"train_loss": -5.761298179626465, "global_step": 45034, "epoch": 1072} {"train_loss": -5.864926338195801, "global_step": 45035, "epoch": 1072} {"train_loss": -5.760251522064209, "global_step": 45036, "epoch": 1072} {"train_loss": -5.591569900512695, "global_step": 45037, "epoch": 1072} {"train_loss": -5.74293327331543, "global_step": 45038, "epoch": 1072} {"train_loss": -5.525388717651367, "global_step": 45039, "epoch": 1072} {"train_loss": -5.710415363311768, "global_step": 45040, "epoch": 1072} {"train_loss": -5.720170974731445, "global_step": 45041, "epoch": 1072} {"train_loss": -5.677138328552246, "global_step": 45042, "epoch": 1072} {"train_loss": -5.760015487670898, "global_step": 45043, "epoch": 1072} {"train_loss": -5.5463032722473145, "global_step": 45044, "epoch": 1072} {"train_loss": -5.586833477020264, "global_step": 45045, "epoch": 1072} {"train_loss": -5.921571254730225, "global_step": 45046, "epoch": 1072} {"train_loss": -5.4467878341674805, "global_step": 45047, "epoch": 1072} {"train_loss": -5.683887958526611, "global_step": 45048, "epoch": 1072} {"train_loss": -5.682313919067383, "global_step": 45049, "epoch": 1072} {"train_loss": -5.661579132080078, "global_step": 45050, "epoch": 1072} {"train_loss": -5.5641703605651855, "global_step": 45051, "epoch": 1072} {"train_loss": -5.746123313903809, "global_step": 45052, "epoch": 1072} {"train_loss": -5.627884864807129, "global_step": 45053, "epoch": 1072} {"train_loss": -5.444911956787109, "global_step": 45054, "epoch": 1072} {"train_loss": -5.624981880187988, "global_step": 45055, "epoch": 1072} {"train_loss": -5.608166694641113, "global_step": 45056, "epoch": 1072} {"train_loss": -5.621509552001953, "global_step": 45057, "epoch": 1072} {"train_loss": -5.589921474456787, "global_step": 45058, "epoch": 1072} {"train_loss": -5.742003440856934, "global_step": 45059, "epoch": 1072} {"train_loss": -5.616681098937988, "global_step": 45060, "epoch": 1072} {"train_loss": -5.750792503356934, "global_step": 45061, "epoch": 1072} {"train_loss": -5.60595703125, "global_step": 45062, "epoch": 1072} {"train_loss": -5.708096504211426, "global_step": 45063, "epoch": 1072} {"train_loss": -5.741030693054199, "global_step": 45064, "epoch": 1072} {"train_loss": -5.669328042439052, "global_step": 45065, "epoch": 1072, "val_loss": 61688.33984375} {"train_loss": -5.659018516540527, "global_step": 45066, "epoch": 1073} {"train_loss": -5.738557815551758, "global_step": 45067, "epoch": 1073} {"train_loss": -5.79634952545166, "global_step": 45068, "epoch": 1073} {"train_loss": -5.655995845794678, "global_step": 45069, "epoch": 1073} {"train_loss": -5.710050106048584, "global_step": 45070, "epoch": 1073} {"train_loss": -5.670361518859863, "global_step": 45071, "epoch": 1073} {"train_loss": -5.709802627563477, "global_step": 45072, "epoch": 1073} {"train_loss": -5.671367645263672, "global_step": 45073, "epoch": 1073} {"train_loss": -5.731969833374023, "global_step": 45074, "epoch": 1073} {"train_loss": -5.729358673095703, "global_step": 45075, "epoch": 1073} {"train_loss": -5.635964870452881, "global_step": 45076, "epoch": 1073} {"train_loss": -5.679009914398193, "global_step": 45077, "epoch": 1073} {"train_loss": -5.655800819396973, "global_step": 45078, "epoch": 1073} {"train_loss": -5.60392951965332, "global_step": 45079, "epoch": 1073} {"train_loss": -5.772518157958984, "global_step": 45080, "epoch": 1073} {"train_loss": -5.69174861907959, "global_step": 45081, "epoch": 1073} {"train_loss": -5.688139915466309, "global_step": 45082, "epoch": 1073} {"train_loss": -5.81329345703125, "global_step": 45083, "epoch": 1073} {"train_loss": -5.73475456237793, "global_step": 45084, "epoch": 1073} {"train_loss": -5.815428256988525, "global_step": 45085, "epoch": 1073} {"train_loss": -5.527822494506836, "global_step": 45086, "epoch": 1073} {"train_loss": -5.659350395202637, "global_step": 45087, "epoch": 1073} {"train_loss": -5.698263168334961, "global_step": 45088, "epoch": 1073} {"train_loss": -5.783639430999756, "global_step": 45089, "epoch": 1073} {"train_loss": -5.768822193145752, "global_step": 45090, "epoch": 1073} {"train_loss": -5.8147430419921875, "global_step": 45091, "epoch": 1073} {"train_loss": -5.726973533630371, "global_step": 45092, "epoch": 1073} {"train_loss": -5.735136985778809, "global_step": 45093, "epoch": 1073} {"train_loss": -5.737287521362305, "global_step": 45094, "epoch": 1073} {"train_loss": -5.651303291320801, "global_step": 45095, "epoch": 1073} {"train_loss": -5.600323677062988, "global_step": 45096, "epoch": 1073} {"train_loss": -5.745508670806885, "global_step": 45097, "epoch": 1073} {"train_loss": -5.796184062957764, "global_step": 45098, "epoch": 1073} {"train_loss": -5.682151794433594, "global_step": 45099, "epoch": 1073} {"train_loss": -5.67072057723999, "global_step": 45100, "epoch": 1073} {"train_loss": -5.554285049438477, "global_step": 45101, "epoch": 1073} {"train_loss": -5.590942859649658, "global_step": 45102, "epoch": 1073} {"train_loss": -5.614939212799072, "global_step": 45103, "epoch": 1073} {"train_loss": -5.679659366607666, "global_step": 45104, "epoch": 1073} {"train_loss": -5.805871963500977, "global_step": 45105, "epoch": 1073} {"train_loss": -5.794251441955566, "global_step": 45106, "epoch": 1073} {"train_loss": -5.700989575613113, "global_step": 45107, "epoch": 1073, "val_loss": 61677.1171875} {"train_loss": -5.7911176681518555, "global_step": 45108, "epoch": 1074} {"train_loss": -5.74764347076416, "global_step": 45109, "epoch": 1074} {"train_loss": -5.646317481994629, "global_step": 45110, "epoch": 1074} {"train_loss": -5.730452537536621, "global_step": 45111, "epoch": 1074} {"train_loss": -5.77553653717041, "global_step": 45112, "epoch": 1074} {"train_loss": -5.796233177185059, "global_step": 45113, "epoch": 1074} {"train_loss": -5.726894378662109, "global_step": 45114, "epoch": 1074} {"train_loss": -5.688994407653809, "global_step": 45115, "epoch": 1074} {"train_loss": -5.675323963165283, "global_step": 45116, "epoch": 1074} {"train_loss": -5.716512680053711, "global_step": 45117, "epoch": 1074} {"train_loss": -5.7018327713012695, "global_step": 45118, "epoch": 1074} {"train_loss": -5.683629989624023, "global_step": 45119, "epoch": 1074} {"train_loss": -5.800963401794434, "global_step": 45120, "epoch": 1074} {"train_loss": -5.578909873962402, "global_step": 45121, "epoch": 1074} {"train_loss": -5.7484235763549805, "global_step": 45122, "epoch": 1074} {"train_loss": -5.690648555755615, "global_step": 45123, "epoch": 1074} {"train_loss": -5.694441795349121, "global_step": 45124, "epoch": 1074} {"train_loss": -5.741113185882568, "global_step": 45125, "epoch": 1074} {"train_loss": -5.719675064086914, "global_step": 45126, "epoch": 1074} {"train_loss": -5.652359962463379, "global_step": 45127, "epoch": 1074} {"train_loss": -5.65455961227417, "global_step": 45128, "epoch": 1074} {"train_loss": -5.741130352020264, "global_step": 45129, "epoch": 1074} {"train_loss": -5.867941856384277, "global_step": 45130, "epoch": 1074} {"train_loss": -5.636391639709473, "global_step": 45131, "epoch": 1074} {"train_loss": -5.753470420837402, "global_step": 45132, "epoch": 1074} {"train_loss": -5.673739433288574, "global_step": 45133, "epoch": 1074} {"train_loss": -5.705039024353027, "global_step": 45134, "epoch": 1074} {"train_loss": -5.781811714172363, "global_step": 45135, "epoch": 1074} {"train_loss": -5.703429222106934, "global_step": 45136, "epoch": 1074} {"train_loss": -5.523152828216553, "global_step": 45137, "epoch": 1074} {"train_loss": -5.786990165710449, "global_step": 45138, "epoch": 1074} {"train_loss": -5.690239429473877, "global_step": 45139, "epoch": 1074} {"train_loss": -5.592544078826904, "global_step": 45140, "epoch": 1074} {"train_loss": -5.709774971008301, "global_step": 45141, "epoch": 1074} {"train_loss": -5.664331436157227, "global_step": 45142, "epoch": 1074} {"train_loss": -5.788039207458496, "global_step": 45143, "epoch": 1074} {"train_loss": -5.7050347328186035, "global_step": 45144, "epoch": 1074} {"train_loss": -5.69297981262207, "global_step": 45145, "epoch": 1074} {"train_loss": -5.682624816894531, "global_step": 45146, "epoch": 1074} {"train_loss": -5.5916242599487305, "global_step": 45147, "epoch": 1074} {"train_loss": -5.622012138366699, "global_step": 45148, "epoch": 1074} {"train_loss": -5.7011927763621015, "global_step": 45149, "epoch": 1074, "val_loss": 61713.59765625} {"train_loss": -5.59210205078125, "global_step": 45150, "epoch": 1075} {"train_loss": -5.561189651489258, "global_step": 45151, "epoch": 1075} {"train_loss": -5.665467739105225, "global_step": 45152, "epoch": 1075} {"train_loss": -5.657364845275879, "global_step": 45153, "epoch": 1075} {"train_loss": -5.682405471801758, "global_step": 45154, "epoch": 1075} {"train_loss": -5.574031829833984, "global_step": 45155, "epoch": 1075} {"train_loss": -5.692835330963135, "global_step": 45156, "epoch": 1075} {"train_loss": -5.716643333435059, "global_step": 45157, "epoch": 1075} {"train_loss": -5.808864593505859, "global_step": 45158, "epoch": 1075} {"train_loss": -5.737635612487793, "global_step": 45159, "epoch": 1075} {"train_loss": -5.622931480407715, "global_step": 45160, "epoch": 1075} {"train_loss": -5.644313812255859, "global_step": 45161, "epoch": 1075} {"train_loss": -5.782871246337891, "global_step": 45162, "epoch": 1075} {"train_loss": -5.699725151062012, "global_step": 45163, "epoch": 1075} {"train_loss": -5.752918243408203, "global_step": 45164, "epoch": 1075} {"train_loss": -5.766094207763672, "global_step": 45165, "epoch": 1075} {"train_loss": -5.742979049682617, "global_step": 45166, "epoch": 1075} {"train_loss": -5.679931163787842, "global_step": 45167, "epoch": 1075} {"train_loss": -5.742204666137695, "global_step": 45168, "epoch": 1075} {"train_loss": -5.655703544616699, "global_step": 45169, "epoch": 1075} {"train_loss": -5.621971130371094, "global_step": 45170, "epoch": 1075} {"train_loss": -5.760026931762695, "global_step": 45171, "epoch": 1075} {"train_loss": -5.836698532104492, "global_step": 45172, "epoch": 1075} {"train_loss": -5.750619411468506, "global_step": 45173, "epoch": 1075} {"train_loss": -5.652093887329102, "global_step": 45174, "epoch": 1075} {"train_loss": -5.818257808685303, "global_step": 45175, "epoch": 1075} {"train_loss": -5.620119094848633, "global_step": 45176, "epoch": 1075} {"train_loss": -5.649660110473633, "global_step": 45177, "epoch": 1075} {"train_loss": -5.740011692047119, "global_step": 45178, "epoch": 1075} {"train_loss": -5.657830238342285, "global_step": 45179, "epoch": 1075} {"train_loss": -5.605800628662109, "global_step": 45180, "epoch": 1075} {"train_loss": -5.740509986877441, "global_step": 45181, "epoch": 1075} {"train_loss": -5.5598554611206055, "global_step": 45182, "epoch": 1075} {"train_loss": -5.597491264343262, "global_step": 45183, "epoch": 1075} {"train_loss": -5.547779083251953, "global_step": 45184, "epoch": 1075} {"train_loss": -5.578009605407715, "global_step": 45185, "epoch": 1075} {"train_loss": -5.599191665649414, "global_step": 45186, "epoch": 1075} {"train_loss": -5.858005523681641, "global_step": 45187, "epoch": 1075} {"train_loss": -5.737776756286621, "global_step": 45188, "epoch": 1075} {"train_loss": -5.625885009765625, "global_step": 45189, "epoch": 1075} {"train_loss": -5.579370498657227, "global_step": 45190, "epoch": 1075} {"train_loss": -5.681606179191952, "global_step": 45191, "epoch": 1075, "val_loss": 61319.86328125} {"train_loss": -5.820305347442627, "global_step": 45192, "epoch": 1076} {"train_loss": -5.74461555480957, "global_step": 45193, "epoch": 1076} {"train_loss": -5.6937408447265625, "global_step": 45194, "epoch": 1076} {"train_loss": -5.784243583679199, "global_step": 45195, "epoch": 1076} {"train_loss": -5.747048377990723, "global_step": 45196, "epoch": 1076} {"train_loss": -5.829548358917236, "global_step": 45197, "epoch": 1076} {"train_loss": -5.773748874664307, "global_step": 45198, "epoch": 1076} {"train_loss": -5.570809364318848, "global_step": 45199, "epoch": 1076} {"train_loss": -5.759843826293945, "global_step": 45200, "epoch": 1076} {"train_loss": -5.825770378112793, "global_step": 45201, "epoch": 1076} {"train_loss": -5.769710540771484, "global_step": 45202, "epoch": 1076} {"train_loss": -5.797221660614014, "global_step": 45203, "epoch": 1076} {"train_loss": -5.789261817932129, "global_step": 45204, "epoch": 1076} {"train_loss": -5.655850410461426, "global_step": 45205, "epoch": 1076} {"train_loss": -5.800446033477783, "global_step": 45206, "epoch": 1076} {"train_loss": -5.7293596267700195, "global_step": 45207, "epoch": 1076} {"train_loss": -5.741535663604736, "global_step": 45208, "epoch": 1076} {"train_loss": -5.792506217956543, "global_step": 45209, "epoch": 1076} {"train_loss": -5.797155857086182, "global_step": 45210, "epoch": 1076} {"train_loss": -5.652518272399902, "global_step": 45211, "epoch": 1076} {"train_loss": -5.829214096069336, "global_step": 45212, "epoch": 1076} {"train_loss": -5.683871269226074, "global_step": 45213, "epoch": 1076} {"train_loss": -5.749250411987305, "global_step": 45214, "epoch": 1076} {"train_loss": -5.737736701965332, "global_step": 45215, "epoch": 1076} {"train_loss": -5.64195442199707, "global_step": 45216, "epoch": 1076} {"train_loss": -5.6312761306762695, "global_step": 45217, "epoch": 1076} {"train_loss": -5.6516876220703125, "global_step": 45218, "epoch": 1076} {"train_loss": -5.639028072357178, "global_step": 45219, "epoch": 1076} {"train_loss": -5.655945301055908, "global_step": 45220, "epoch": 1076} {"train_loss": -5.7624053955078125, "global_step": 45221, "epoch": 1076} {"train_loss": -5.714468955993652, "global_step": 45222, "epoch": 1076} {"train_loss": -5.623312473297119, "global_step": 45223, "epoch": 1076} {"train_loss": -5.710975646972656, "global_step": 45224, "epoch": 1076} {"train_loss": -5.544092178344727, "global_step": 45225, "epoch": 1076} {"train_loss": -5.8563923835754395, "global_step": 45226, "epoch": 1076} {"train_loss": -5.640783786773682, "global_step": 45227, "epoch": 1076} {"train_loss": -5.685647964477539, "global_step": 45228, "epoch": 1076} {"train_loss": -5.5641398429870605, "global_step": 45229, "epoch": 1076} {"train_loss": -5.664549827575684, "global_step": 45230, "epoch": 1076} {"train_loss": -5.736249923706055, "global_step": 45231, "epoch": 1076} {"train_loss": -5.675258159637451, "global_step": 45232, "epoch": 1076} {"train_loss": -5.716219141369774, "global_step": 45233, "epoch": 1076, "val_loss": 61741.40234375} {"train_loss": -5.7064619064331055, "global_step": 45234, "epoch": 1077} {"train_loss": -5.727268218994141, "global_step": 45235, "epoch": 1077} {"train_loss": -5.665058612823486, "global_step": 45236, "epoch": 1077} {"train_loss": -5.7600579261779785, "global_step": 45237, "epoch": 1077} {"train_loss": -5.585476875305176, "global_step": 45238, "epoch": 1077} {"train_loss": -5.741181373596191, "global_step": 45239, "epoch": 1077} {"train_loss": -5.779379844665527, "global_step": 45240, "epoch": 1077} {"train_loss": -5.669220924377441, "global_step": 45241, "epoch": 1077} {"train_loss": -5.707695007324219, "global_step": 45242, "epoch": 1077} {"train_loss": -5.662167549133301, "global_step": 45243, "epoch": 1077} {"train_loss": -5.753946304321289, "global_step": 45244, "epoch": 1077} {"train_loss": -5.805848121643066, "global_step": 45245, "epoch": 1077} {"train_loss": -5.78855037689209, "global_step": 45246, "epoch": 1077} {"train_loss": -5.654446125030518, "global_step": 45247, "epoch": 1077} {"train_loss": -5.681639671325684, "global_step": 45248, "epoch": 1077} {"train_loss": -5.642413139343262, "global_step": 45249, "epoch": 1077} {"train_loss": -5.696088790893555, "global_step": 45250, "epoch": 1077} {"train_loss": -5.633143424987793, "global_step": 45251, "epoch": 1077} {"train_loss": -5.6708807945251465, "global_step": 45252, "epoch": 1077} {"train_loss": -5.757291793823242, "global_step": 45253, "epoch": 1077} {"train_loss": -5.757773399353027, "global_step": 45254, "epoch": 1077} {"train_loss": -5.666959285736084, "global_step": 45255, "epoch": 1077} {"train_loss": -5.664670944213867, "global_step": 45256, "epoch": 1077} {"train_loss": -5.635702610015869, "global_step": 45257, "epoch": 1077} {"train_loss": -5.682250022888184, "global_step": 45258, "epoch": 1077} {"train_loss": -5.624028205871582, "global_step": 45259, "epoch": 1077} {"train_loss": -5.680139541625977, "global_step": 45260, "epoch": 1077} {"train_loss": -5.609045028686523, "global_step": 45261, "epoch": 1077} {"train_loss": -5.57111120223999, "global_step": 45262, "epoch": 1077} {"train_loss": -5.586044788360596, "global_step": 45263, "epoch": 1077} {"train_loss": -5.777918338775635, "global_step": 45264, "epoch": 1077} {"train_loss": -5.760440826416016, "global_step": 45265, "epoch": 1077} {"train_loss": -5.740634918212891, "global_step": 45266, "epoch": 1077} {"train_loss": -5.722644805908203, "global_step": 45267, "epoch": 1077} {"train_loss": -5.58333683013916, "global_step": 45268, "epoch": 1077} {"train_loss": -5.660722732543945, "global_step": 45269, "epoch": 1077} {"train_loss": -5.666904926300049, "global_step": 45270, "epoch": 1077} {"train_loss": -5.745328426361084, "global_step": 45271, "epoch": 1077} {"train_loss": -5.821087837219238, "global_step": 45272, "epoch": 1077} {"train_loss": -5.642908573150635, "global_step": 45273, "epoch": 1077} {"train_loss": -5.630341053009033, "global_step": 45274, "epoch": 1077} {"train_loss": -5.690011115301223, "global_step": 45275, "epoch": 1077, "val_loss": 61849.62890625} {"train_loss": -5.735167503356934, "global_step": 45276, "epoch": 1078} {"train_loss": -5.558036804199219, "global_step": 45277, "epoch": 1078} {"train_loss": -5.598670959472656, "global_step": 45278, "epoch": 1078} {"train_loss": -5.601149559020996, "global_step": 45279, "epoch": 1078} {"train_loss": -5.69388484954834, "global_step": 45280, "epoch": 1078} {"train_loss": -5.714840412139893, "global_step": 45281, "epoch": 1078} {"train_loss": -5.562788009643555, "global_step": 45282, "epoch": 1078} {"train_loss": -5.716059684753418, "global_step": 45283, "epoch": 1078} {"train_loss": -5.758650302886963, "global_step": 45284, "epoch": 1078} {"train_loss": -5.700436592102051, "global_step": 45285, "epoch": 1078} {"train_loss": -5.743804931640625, "global_step": 45286, "epoch": 1078} {"train_loss": -5.555233001708984, "global_step": 45287, "epoch": 1078} {"train_loss": -5.642335414886475, "global_step": 45288, "epoch": 1078} {"train_loss": -5.888274192810059, "global_step": 45289, "epoch": 1078} {"train_loss": -5.668689727783203, "global_step": 45290, "epoch": 1078} {"train_loss": -5.733791351318359, "global_step": 45291, "epoch": 1078} {"train_loss": -5.771925926208496, "global_step": 45292, "epoch": 1078} {"train_loss": -5.783050060272217, "global_step": 45293, "epoch": 1078} {"train_loss": -5.720647811889648, "global_step": 45294, "epoch": 1078} {"train_loss": -5.642765998840332, "global_step": 45295, "epoch": 1078} {"train_loss": -5.701528549194336, "global_step": 45296, "epoch": 1078} {"train_loss": -5.884762763977051, "global_step": 45297, "epoch": 1078} {"train_loss": -5.761031627655029, "global_step": 45298, "epoch": 1078} {"train_loss": -5.626407623291016, "global_step": 45299, "epoch": 1078} {"train_loss": -5.657578945159912, "global_step": 45300, "epoch": 1078} {"train_loss": -5.610530853271484, "global_step": 45301, "epoch": 1078} {"train_loss": -5.658051490783691, "global_step": 45302, "epoch": 1078} {"train_loss": -5.798036575317383, "global_step": 45303, "epoch": 1078} {"train_loss": -5.721151351928711, "global_step": 45304, "epoch": 1078} {"train_loss": -5.777657508850098, "global_step": 45305, "epoch": 1078} {"train_loss": -5.635866165161133, "global_step": 45306, "epoch": 1078} {"train_loss": -5.827948570251465, "global_step": 45307, "epoch": 1078} {"train_loss": -5.851709842681885, "global_step": 45308, "epoch": 1078} {"train_loss": -5.632097244262695, "global_step": 45309, "epoch": 1078} {"train_loss": -5.755877494812012, "global_step": 45310, "epoch": 1078} {"train_loss": -5.705348014831543, "global_step": 45311, "epoch": 1078} {"train_loss": -5.664565086364746, "global_step": 45312, "epoch": 1078} {"train_loss": -5.73537015914917, "global_step": 45313, "epoch": 1078} {"train_loss": -5.550360679626465, "global_step": 45314, "epoch": 1078} {"train_loss": -5.779017925262451, "global_step": 45315, "epoch": 1078} {"train_loss": -5.6949357986450195, "global_step": 45316, "epoch": 1078} {"train_loss": -5.701537313915434, "global_step": 45317, "epoch": 1078, "val_loss": 61484.8828125} {"train_loss": -5.708698272705078, "global_step": 45318, "epoch": 1079} {"train_loss": -5.652935981750488, "global_step": 45319, "epoch": 1079} {"train_loss": -5.7714643478393555, "global_step": 45320, "epoch": 1079} {"train_loss": -5.659666061401367, "global_step": 45321, "epoch": 1079} {"train_loss": -5.8294572830200195, "global_step": 45322, "epoch": 1079} {"train_loss": -5.714094638824463, "global_step": 45323, "epoch": 1079} {"train_loss": -5.656773567199707, "global_step": 45324, "epoch": 1079} {"train_loss": -5.685201644897461, "global_step": 45325, "epoch": 1079} {"train_loss": -5.6280317306518555, "global_step": 45326, "epoch": 1079} {"train_loss": -5.811108589172363, "global_step": 45327, "epoch": 1079} {"train_loss": -5.800311088562012, "global_step": 45328, "epoch": 1079} {"train_loss": -5.725215911865234, "global_step": 45329, "epoch": 1079} {"train_loss": -5.761323928833008, "global_step": 45330, "epoch": 1079} {"train_loss": -5.628228187561035, "global_step": 45331, "epoch": 1079} {"train_loss": -5.844679832458496, "global_step": 45332, "epoch": 1079} {"train_loss": -5.850518226623535, "global_step": 45333, "epoch": 1079} {"train_loss": -5.690565586090088, "global_step": 45334, "epoch": 1079} {"train_loss": -5.627198219299316, "global_step": 45335, "epoch": 1079} {"train_loss": -5.772412300109863, "global_step": 45336, "epoch": 1079} {"train_loss": -5.853886127471924, "global_step": 45337, "epoch": 1079} {"train_loss": -5.730830669403076, "global_step": 45338, "epoch": 1079} {"train_loss": -5.726690292358398, "global_step": 45339, "epoch": 1079} {"train_loss": -5.658639907836914, "global_step": 45340, "epoch": 1079} {"train_loss": -5.775692939758301, "global_step": 45341, "epoch": 1079} {"train_loss": -5.735515594482422, "global_step": 45342, "epoch": 1079} {"train_loss": -5.524153709411621, "global_step": 45343, "epoch": 1079} {"train_loss": -5.748519420623779, "global_step": 45344, "epoch": 1079} {"train_loss": -5.7527265548706055, "global_step": 45345, "epoch": 1079} {"train_loss": -5.874147891998291, "global_step": 45346, "epoch": 1079} {"train_loss": -5.59744119644165, "global_step": 45347, "epoch": 1079} {"train_loss": -5.542943954467773, "global_step": 45348, "epoch": 1079} {"train_loss": -5.6588568687438965, "global_step": 45349, "epoch": 1079} {"train_loss": -5.661316871643066, "global_step": 45350, "epoch": 1079} {"train_loss": -5.650108814239502, "global_step": 45351, "epoch": 1079} {"train_loss": -5.676014423370361, "global_step": 45352, "epoch": 1079} {"train_loss": -5.5384368896484375, "global_step": 45353, "epoch": 1079} {"train_loss": -5.658706188201904, "global_step": 45354, "epoch": 1079} {"train_loss": -5.585306167602539, "global_step": 45355, "epoch": 1079} {"train_loss": -5.529524326324463, "global_step": 45356, "epoch": 1079} {"train_loss": -5.823698997497559, "global_step": 45357, "epoch": 1079} {"train_loss": -5.645535469055176, "global_step": 45358, "epoch": 1079} {"train_loss": -5.703316926956177, "global_step": 45359, "epoch": 1079, "val_loss": 62044.6171875} {"train_loss": -5.693166732788086, "global_step": 45360, "epoch": 1080} {"train_loss": -5.711542129516602, "global_step": 45361, "epoch": 1080} {"train_loss": -5.515434265136719, "global_step": 45362, "epoch": 1080} {"train_loss": -5.796592712402344, "global_step": 45363, "epoch": 1080} {"train_loss": -5.761012077331543, "global_step": 45364, "epoch": 1080} {"train_loss": -5.67114782333374, "global_step": 45365, "epoch": 1080} {"train_loss": -5.759915828704834, "global_step": 45366, "epoch": 1080} {"train_loss": -5.73020076751709, "global_step": 45367, "epoch": 1080} {"train_loss": -5.754703521728516, "global_step": 45368, "epoch": 1080} {"train_loss": -5.66697883605957, "global_step": 45369, "epoch": 1080} {"train_loss": -5.83570671081543, "global_step": 45370, "epoch": 1080} {"train_loss": -5.703104019165039, "global_step": 45371, "epoch": 1080} {"train_loss": -5.681690216064453, "global_step": 45372, "epoch": 1080} {"train_loss": -5.730236053466797, "global_step": 45373, "epoch": 1080} {"train_loss": -5.897188186645508, "global_step": 45374, "epoch": 1080} {"train_loss": -5.735403537750244, "global_step": 45375, "epoch": 1080} {"train_loss": -5.696130752563477, "global_step": 45376, "epoch": 1080} {"train_loss": -5.609465599060059, "global_step": 45377, "epoch": 1080} {"train_loss": -5.7467756271362305, "global_step": 45378, "epoch": 1080} {"train_loss": -5.734348297119141, "global_step": 45379, "epoch": 1080} {"train_loss": -5.689858913421631, "global_step": 45380, "epoch": 1080} {"train_loss": -5.673503398895264, "global_step": 45381, "epoch": 1080} {"train_loss": -5.7508931159973145, "global_step": 45382, "epoch": 1080} {"train_loss": -5.793575286865234, "global_step": 45383, "epoch": 1080} {"train_loss": -5.616388320922852, "global_step": 45384, "epoch": 1080} {"train_loss": -5.759706497192383, "global_step": 45385, "epoch": 1080} {"train_loss": -5.666070461273193, "global_step": 45386, "epoch": 1080} {"train_loss": -5.66748046875, "global_step": 45387, "epoch": 1080} {"train_loss": -5.744006633758545, "global_step": 45388, "epoch": 1080} {"train_loss": -5.838254928588867, "global_step": 45389, "epoch": 1080} {"train_loss": -5.6729021072387695, "global_step": 45390, "epoch": 1080} {"train_loss": -5.8564252853393555, "global_step": 45391, "epoch": 1080} {"train_loss": -5.693271636962891, "global_step": 45392, "epoch": 1080} {"train_loss": -5.635957717895508, "global_step": 45393, "epoch": 1080} {"train_loss": -5.746171951293945, "global_step": 45394, "epoch": 1080} {"train_loss": -5.793418884277344, "global_step": 45395, "epoch": 1080} {"train_loss": -5.86062479019165, "global_step": 45396, "epoch": 1080} {"train_loss": -5.662971019744873, "global_step": 45397, "epoch": 1080} {"train_loss": -5.712420463562012, "global_step": 45398, "epoch": 1080} {"train_loss": -5.708314418792725, "global_step": 45399, "epoch": 1080} {"train_loss": -5.646665573120117, "global_step": 45400, "epoch": 1080} {"train_loss": -5.724567322503953, "global_step": 45401, "epoch": 1080, "val_loss": 61717.8046875} {"train_loss": -5.7157883644104, "global_step": 45402, "epoch": 1081} {"train_loss": -5.825680732727051, "global_step": 45403, "epoch": 1081} {"train_loss": -5.766941547393799, "global_step": 45404, "epoch": 1081} {"train_loss": -5.672710418701172, "global_step": 45405, "epoch": 1081} {"train_loss": -5.7938008308410645, "global_step": 45406, "epoch": 1081} {"train_loss": -5.787016868591309, "global_step": 45407, "epoch": 1081} {"train_loss": -5.715947151184082, "global_step": 45408, "epoch": 1081} {"train_loss": -5.729794502258301, "global_step": 45409, "epoch": 1081} {"train_loss": -5.653416633605957, "global_step": 45410, "epoch": 1081} {"train_loss": -5.728177070617676, "global_step": 45411, "epoch": 1081} {"train_loss": -5.737384796142578, "global_step": 45412, "epoch": 1081} {"train_loss": -5.694139003753662, "global_step": 45413, "epoch": 1081} {"train_loss": -5.660270690917969, "global_step": 45414, "epoch": 1081} {"train_loss": -5.768386363983154, "global_step": 45415, "epoch": 1081} {"train_loss": -5.529195785522461, "global_step": 45416, "epoch": 1081} {"train_loss": -5.667924880981445, "global_step": 45417, "epoch": 1081} {"train_loss": -5.637564659118652, "global_step": 45418, "epoch": 1081} {"train_loss": -5.542044639587402, "global_step": 45419, "epoch": 1081} {"train_loss": -5.704423904418945, "global_step": 45420, "epoch": 1081} {"train_loss": -5.573853492736816, "global_step": 45421, "epoch": 1081} {"train_loss": -5.765242099761963, "global_step": 45422, "epoch": 1081} {"train_loss": -5.627229690551758, "global_step": 45423, "epoch": 1081} {"train_loss": -5.608373641967773, "global_step": 45424, "epoch": 1081} {"train_loss": -5.752387046813965, "global_step": 45425, "epoch": 1081} {"train_loss": -5.62729024887085, "global_step": 45426, "epoch": 1081} {"train_loss": -5.728644371032715, "global_step": 45427, "epoch": 1081} {"train_loss": -5.769202709197998, "global_step": 45428, "epoch": 1081} {"train_loss": -5.727120399475098, "global_step": 45429, "epoch": 1081} {"train_loss": -5.647497177124023, "global_step": 45430, "epoch": 1081} {"train_loss": -5.594226837158203, "global_step": 45431, "epoch": 1081} {"train_loss": -5.662233829498291, "global_step": 45432, "epoch": 1081} {"train_loss": -5.607264518737793, "global_step": 45433, "epoch": 1081} {"train_loss": -5.733859539031982, "global_step": 45434, "epoch": 1081} {"train_loss": -5.689067840576172, "global_step": 45435, "epoch": 1081} {"train_loss": -5.67963981628418, "global_step": 45436, "epoch": 1081} {"train_loss": -5.710923671722412, "global_step": 45437, "epoch": 1081} {"train_loss": -5.814497947692871, "global_step": 45438, "epoch": 1081} {"train_loss": -5.584926128387451, "global_step": 45439, "epoch": 1081} {"train_loss": -5.717929840087891, "global_step": 45440, "epoch": 1081} {"train_loss": -5.796360492706299, "global_step": 45441, "epoch": 1081} {"train_loss": -5.7671637535095215, "global_step": 45442, "epoch": 1081} {"train_loss": -5.697678713571458, "global_step": 45443, "epoch": 1081, "val_loss": 62221.84375} {"train_loss": -5.703499794006348, "global_step": 45444, "epoch": 1082} {"train_loss": -5.675729751586914, "global_step": 45445, "epoch": 1082} {"train_loss": -5.764360427856445, "global_step": 45446, "epoch": 1082} {"train_loss": -5.698829174041748, "global_step": 45447, "epoch": 1082} {"train_loss": -5.761055946350098, "global_step": 45448, "epoch": 1082} {"train_loss": -5.71125602722168, "global_step": 45449, "epoch": 1082} {"train_loss": -5.6830596923828125, "global_step": 45450, "epoch": 1082} {"train_loss": -5.720320701599121, "global_step": 45451, "epoch": 1082} {"train_loss": -5.694901466369629, "global_step": 45452, "epoch": 1082} {"train_loss": -5.6312360763549805, "global_step": 45453, "epoch": 1082} {"train_loss": -5.709723472595215, "global_step": 45454, "epoch": 1082} {"train_loss": -5.786639213562012, "global_step": 45455, "epoch": 1082} {"train_loss": -5.696930885314941, "global_step": 45456, "epoch": 1082} {"train_loss": -5.661904335021973, "global_step": 45457, "epoch": 1082} {"train_loss": -5.804965019226074, "global_step": 45458, "epoch": 1082} {"train_loss": -5.761058807373047, "global_step": 45459, "epoch": 1082} {"train_loss": -5.697587490081787, "global_step": 45460, "epoch": 1082} {"train_loss": -5.770687103271484, "global_step": 45461, "epoch": 1082} {"train_loss": -5.6709394454956055, "global_step": 45462, "epoch": 1082} {"train_loss": -5.804441928863525, "global_step": 45463, "epoch": 1082} {"train_loss": -5.746408939361572, "global_step": 45464, "epoch": 1082} {"train_loss": -5.7986555099487305, "global_step": 45465, "epoch": 1082} {"train_loss": -5.733061790466309, "global_step": 45466, "epoch": 1082} {"train_loss": -5.624517440795898, "global_step": 45467, "epoch": 1082} {"train_loss": -5.66751766204834, "global_step": 45468, "epoch": 1082} {"train_loss": -5.718322277069092, "global_step": 45469, "epoch": 1082} {"train_loss": -5.72231388092041, "global_step": 45470, "epoch": 1082} {"train_loss": -5.775734901428223, "global_step": 45471, "epoch": 1082} {"train_loss": -5.700396537780762, "global_step": 45472, "epoch": 1082} {"train_loss": -5.784390449523926, "global_step": 45473, "epoch": 1082} {"train_loss": -5.757850646972656, "global_step": 45474, "epoch": 1082} {"train_loss": -5.755916595458984, "global_step": 45475, "epoch": 1082} {"train_loss": -5.66384744644165, "global_step": 45476, "epoch": 1082} {"train_loss": -5.688697814941406, "global_step": 45477, "epoch": 1082} {"train_loss": -5.765573978424072, "global_step": 45478, "epoch": 1082} {"train_loss": -5.819226264953613, "global_step": 45479, "epoch": 1082} {"train_loss": -5.810299873352051, "global_step": 45480, "epoch": 1082} {"train_loss": -5.717199325561523, "global_step": 45481, "epoch": 1082} {"train_loss": -5.792919635772705, "global_step": 45482, "epoch": 1082} {"train_loss": -5.750194549560547, "global_step": 45483, "epoch": 1082} {"train_loss": -5.802582740783691, "global_step": 45484, "epoch": 1082} {"train_loss": -5.732291471390497, "global_step": 45485, "epoch": 1082, "val_loss": 61893.0390625} {"train_loss": -5.6047797203063965, "global_step": 45486, "epoch": 1083} {"train_loss": -5.731210231781006, "global_step": 45487, "epoch": 1083} {"train_loss": -5.641221046447754, "global_step": 45488, "epoch": 1083} {"train_loss": -5.780689716339111, "global_step": 45489, "epoch": 1083} {"train_loss": -5.753547191619873, "global_step": 45490, "epoch": 1083} {"train_loss": -5.7523274421691895, "global_step": 45491, "epoch": 1083} {"train_loss": -5.6842193603515625, "global_step": 45492, "epoch": 1083} {"train_loss": -5.822200775146484, "global_step": 45493, "epoch": 1083} {"train_loss": -5.6914520263671875, "global_step": 45494, "epoch": 1083} {"train_loss": -5.7786760330200195, "global_step": 45495, "epoch": 1083} {"train_loss": -5.77790641784668, "global_step": 45496, "epoch": 1083} {"train_loss": -5.786921501159668, "global_step": 45497, "epoch": 1083} {"train_loss": -5.671213626861572, "global_step": 45498, "epoch": 1083} {"train_loss": -5.743671417236328, "global_step": 45499, "epoch": 1083} {"train_loss": -5.591355323791504, "global_step": 45500, "epoch": 1083} {"train_loss": -5.630773544311523, "global_step": 45501, "epoch": 1083} {"train_loss": -5.592164039611816, "global_step": 45502, "epoch": 1083} {"train_loss": -5.665731906890869, "global_step": 45503, "epoch": 1083} {"train_loss": -5.573999881744385, "global_step": 45504, "epoch": 1083} {"train_loss": -5.64288330078125, "global_step": 45505, "epoch": 1083} {"train_loss": -5.647438049316406, "global_step": 45506, "epoch": 1083} {"train_loss": -5.713896751403809, "global_step": 45507, "epoch": 1083} {"train_loss": -5.601103782653809, "global_step": 45508, "epoch": 1083} {"train_loss": -5.713095664978027, "global_step": 45509, "epoch": 1083} {"train_loss": -5.6720991134643555, "global_step": 45510, "epoch": 1083} {"train_loss": -5.769374370574951, "global_step": 45511, "epoch": 1083} {"train_loss": -5.551070213317871, "global_step": 45512, "epoch": 1083} {"train_loss": -5.54186487197876, "global_step": 45513, "epoch": 1083} {"train_loss": -5.710738658905029, "global_step": 45514, "epoch": 1083} {"train_loss": -5.558780670166016, "global_step": 45515, "epoch": 1083} {"train_loss": -5.513946533203125, "global_step": 45516, "epoch": 1083} {"train_loss": -5.831986904144287, "global_step": 45517, "epoch": 1083} {"train_loss": -5.721999168395996, "global_step": 45518, "epoch": 1083} {"train_loss": -5.718544960021973, "global_step": 45519, "epoch": 1083} {"train_loss": -5.767724514007568, "global_step": 45520, "epoch": 1083} {"train_loss": -5.712996959686279, "global_step": 45521, "epoch": 1083} {"train_loss": -5.735149383544922, "global_step": 45522, "epoch": 1083} {"train_loss": -5.656206130981445, "global_step": 45523, "epoch": 1083} {"train_loss": -5.620248794555664, "global_step": 45524, "epoch": 1083} {"train_loss": -5.830138683319092, "global_step": 45525, "epoch": 1083} {"train_loss": -5.6756486892700195, "global_step": 45526, "epoch": 1083} {"train_loss": -5.689507983979725, "global_step": 45527, "epoch": 1083, "val_loss": 61628.3125} {"train_loss": -5.694334506988525, "global_step": 45528, "epoch": 1084} {"train_loss": -5.735403060913086, "global_step": 45529, "epoch": 1084} {"train_loss": -5.744411468505859, "global_step": 45530, "epoch": 1084} {"train_loss": -5.789338111877441, "global_step": 45531, "epoch": 1084} {"train_loss": -5.72847318649292, "global_step": 45532, "epoch": 1084} {"train_loss": -5.734922409057617, "global_step": 45533, "epoch": 1084} {"train_loss": -5.731571674346924, "global_step": 45534, "epoch": 1084} {"train_loss": -5.716618537902832, "global_step": 45535, "epoch": 1084} {"train_loss": -5.614785671234131, "global_step": 45536, "epoch": 1084} {"train_loss": -5.797935485839844, "global_step": 45537, "epoch": 1084} {"train_loss": -5.71464729309082, "global_step": 45538, "epoch": 1084} {"train_loss": -5.767088890075684, "global_step": 45539, "epoch": 1084} {"train_loss": -5.6693644523620605, "global_step": 45540, "epoch": 1084} {"train_loss": -5.691784858703613, "global_step": 45541, "epoch": 1084} {"train_loss": -5.711619853973389, "global_step": 45542, "epoch": 1084} {"train_loss": -5.621362209320068, "global_step": 45543, "epoch": 1084} {"train_loss": -5.767378807067871, "global_step": 45544, "epoch": 1084} {"train_loss": -5.768674850463867, "global_step": 45545, "epoch": 1084} {"train_loss": -5.522697925567627, "global_step": 45546, "epoch": 1084} {"train_loss": -5.792598247528076, "global_step": 45547, "epoch": 1084} {"train_loss": -5.61051082611084, "global_step": 45548, "epoch": 1084} {"train_loss": -5.637530326843262, "global_step": 45549, "epoch": 1084} {"train_loss": -5.662553787231445, "global_step": 45550, "epoch": 1084} {"train_loss": -5.710536956787109, "global_step": 45551, "epoch": 1084} {"train_loss": -5.81880521774292, "global_step": 45552, "epoch": 1084} {"train_loss": -5.701763153076172, "global_step": 45553, "epoch": 1084} {"train_loss": -5.588322639465332, "global_step": 45554, "epoch": 1084} {"train_loss": -5.652535915374756, "global_step": 45555, "epoch": 1084} {"train_loss": -5.875115394592285, "global_step": 45556, "epoch": 1084} {"train_loss": -5.7737345695495605, "global_step": 45557, "epoch": 1084} {"train_loss": -5.78000545501709, "global_step": 45558, "epoch": 1084} {"train_loss": -5.679239273071289, "global_step": 45559, "epoch": 1084} {"train_loss": -5.76999568939209, "global_step": 45560, "epoch": 1084} {"train_loss": -5.8594465255737305, "global_step": 45561, "epoch": 1084} {"train_loss": -5.66007137298584, "global_step": 45562, "epoch": 1084} {"train_loss": -5.6581010818481445, "global_step": 45563, "epoch": 1084} {"train_loss": -5.52935791015625, "global_step": 45564, "epoch": 1084} {"train_loss": -5.70784854888916, "global_step": 45565, "epoch": 1084} {"train_loss": -5.748793601989746, "global_step": 45566, "epoch": 1084} {"train_loss": -5.673303127288818, "global_step": 45567, "epoch": 1084} {"train_loss": -5.730251312255859, "global_step": 45568, "epoch": 1084} {"train_loss": -5.714115131469, "global_step": 45569, "epoch": 1084, "val_loss": 61766.5} {"train_loss": -5.577802658081055, "global_step": 45570, "epoch": 1085} {"train_loss": -5.706459999084473, "global_step": 45571, "epoch": 1085} {"train_loss": -5.870710372924805, "global_step": 45572, "epoch": 1085} {"train_loss": -5.6722564697265625, "global_step": 45573, "epoch": 1085} {"train_loss": -5.73911190032959, "global_step": 45574, "epoch": 1085} {"train_loss": -5.644560813903809, "global_step": 45575, "epoch": 1085} {"train_loss": -5.71323299407959, "global_step": 45576, "epoch": 1085} {"train_loss": -5.733401298522949, "global_step": 45577, "epoch": 1085} {"train_loss": -5.704745292663574, "global_step": 45578, "epoch": 1085} {"train_loss": -5.803047180175781, "global_step": 45579, "epoch": 1085} {"train_loss": -5.738482475280762, "global_step": 45580, "epoch": 1085} {"train_loss": -5.748201847076416, "global_step": 45581, "epoch": 1085} {"train_loss": -5.71988582611084, "global_step": 45582, "epoch": 1085} {"train_loss": -5.69239616394043, "global_step": 45583, "epoch": 1085} {"train_loss": -5.722717761993408, "global_step": 45584, "epoch": 1085} {"train_loss": -5.604808807373047, "global_step": 45585, "epoch": 1085} {"train_loss": -5.714146614074707, "global_step": 45586, "epoch": 1085} {"train_loss": -5.682190895080566, "global_step": 45587, "epoch": 1085} {"train_loss": -5.797273635864258, "global_step": 45588, "epoch": 1085} {"train_loss": -5.925746440887451, "global_step": 45589, "epoch": 1085} {"train_loss": -5.661227703094482, "global_step": 45590, "epoch": 1085} {"train_loss": -5.739262580871582, "global_step": 45591, "epoch": 1085} {"train_loss": -5.849905014038086, "global_step": 45592, "epoch": 1085} {"train_loss": -5.6960601806640625, "global_step": 45593, "epoch": 1085} {"train_loss": -5.825826644897461, "global_step": 45594, "epoch": 1085} {"train_loss": -5.779956817626953, "global_step": 45595, "epoch": 1085} {"train_loss": -5.647682189941406, "global_step": 45596, "epoch": 1085} {"train_loss": -5.6001739501953125, "global_step": 45597, "epoch": 1085} {"train_loss": -5.747159957885742, "global_step": 45598, "epoch": 1085} {"train_loss": -5.71075439453125, "global_step": 45599, "epoch": 1085} {"train_loss": -5.751067161560059, "global_step": 45600, "epoch": 1085} {"train_loss": -5.562259197235107, "global_step": 45601, "epoch": 1085} {"train_loss": -5.612537384033203, "global_step": 45602, "epoch": 1085} {"train_loss": -5.565145015716553, "global_step": 45603, "epoch": 1085} {"train_loss": -5.616205215454102, "global_step": 45604, "epoch": 1085} {"train_loss": -5.558338165283203, "global_step": 45605, "epoch": 1085} {"train_loss": -5.722414970397949, "global_step": 45606, "epoch": 1085} {"train_loss": -5.722696304321289, "global_step": 45607, "epoch": 1085} {"train_loss": -5.840023040771484, "global_step": 45608, "epoch": 1085} {"train_loss": -5.703880310058594, "global_step": 45609, "epoch": 1085} {"train_loss": -5.58756685256958, "global_step": 45610, "epoch": 1085} {"train_loss": -5.709497769673665, "global_step": 45611, "epoch": 1085, "val_loss": 62012.57421875} {"train_loss": -5.611152648925781, "global_step": 45612, "epoch": 1086} {"train_loss": -5.819916725158691, "global_step": 45613, "epoch": 1086} {"train_loss": -5.874265670776367, "global_step": 45614, "epoch": 1086} {"train_loss": -5.615781307220459, "global_step": 45615, "epoch": 1086} {"train_loss": -5.611985206604004, "global_step": 45616, "epoch": 1086} {"train_loss": -5.741632461547852, "global_step": 45617, "epoch": 1086} {"train_loss": -5.626195907592773, "global_step": 45618, "epoch": 1086} {"train_loss": -5.8049726486206055, "global_step": 45619, "epoch": 1086} {"train_loss": -5.640398025512695, "global_step": 45620, "epoch": 1086} {"train_loss": -5.617635726928711, "global_step": 45621, "epoch": 1086} {"train_loss": -5.6565937995910645, "global_step": 45622, "epoch": 1086} {"train_loss": -5.631749153137207, "global_step": 45623, "epoch": 1086} {"train_loss": -5.740291118621826, "global_step": 45624, "epoch": 1086} {"train_loss": -5.627910614013672, "global_step": 45625, "epoch": 1086} {"train_loss": -5.760883331298828, "global_step": 45626, "epoch": 1086} {"train_loss": -5.805458068847656, "global_step": 45627, "epoch": 1086} {"train_loss": -5.634485721588135, "global_step": 45628, "epoch": 1086} {"train_loss": -5.770029544830322, "global_step": 45629, "epoch": 1086} {"train_loss": -5.611599922180176, "global_step": 45630, "epoch": 1086} {"train_loss": -5.756890296936035, "global_step": 45631, "epoch": 1086} {"train_loss": -5.578214168548584, "global_step": 45632, "epoch": 1086} {"train_loss": -5.614935398101807, "global_step": 45633, "epoch": 1086} {"train_loss": -5.6255645751953125, "global_step": 45634, "epoch": 1086} {"train_loss": -5.677145004272461, "global_step": 45635, "epoch": 1086} {"train_loss": -5.648101329803467, "global_step": 45636, "epoch": 1086} {"train_loss": -5.627396583557129, "global_step": 45637, "epoch": 1086} {"train_loss": -5.6797966957092285, "global_step": 45638, "epoch": 1086} {"train_loss": -5.703602313995361, "global_step": 45639, "epoch": 1086} {"train_loss": -5.661516189575195, "global_step": 45640, "epoch": 1086} {"train_loss": -5.629350185394287, "global_step": 45641, "epoch": 1086} {"train_loss": -5.529821872711182, "global_step": 45642, "epoch": 1086} {"train_loss": -5.757298469543457, "global_step": 45643, "epoch": 1086} {"train_loss": -5.685662746429443, "global_step": 45644, "epoch": 1086} {"train_loss": -5.813767433166504, "global_step": 45645, "epoch": 1086} {"train_loss": -5.716248512268066, "global_step": 45646, "epoch": 1086} {"train_loss": -5.719072341918945, "global_step": 45647, "epoch": 1086} {"train_loss": -5.659466743469238, "global_step": 45648, "epoch": 1086} {"train_loss": -5.79469108581543, "global_step": 45649, "epoch": 1086} {"train_loss": -5.739744186401367, "global_step": 45650, "epoch": 1086} {"train_loss": -5.691039085388184, "global_step": 45651, "epoch": 1086} {"train_loss": -5.63751220703125, "global_step": 45652, "epoch": 1086} {"train_loss": -5.683896416709537, "global_step": 45653, "epoch": 1086, "val_loss": 61685.73046875} {"train_loss": -5.65322208404541, "global_step": 45654, "epoch": 1087} {"train_loss": -5.710206508636475, "global_step": 45655, "epoch": 1087} {"train_loss": -5.7884931564331055, "global_step": 45656, "epoch": 1087} {"train_loss": -5.742339611053467, "global_step": 45657, "epoch": 1087} {"train_loss": -5.749692916870117, "global_step": 45658, "epoch": 1087} {"train_loss": -5.806030750274658, "global_step": 45659, "epoch": 1087} {"train_loss": -5.540162086486816, "global_step": 45660, "epoch": 1087} {"train_loss": -5.611018657684326, "global_step": 45661, "epoch": 1087} {"train_loss": -5.7217936515808105, "global_step": 45662, "epoch": 1087} {"train_loss": -5.561342239379883, "global_step": 45663, "epoch": 1087} {"train_loss": -5.707366466522217, "global_step": 45664, "epoch": 1087} {"train_loss": -5.666492938995361, "global_step": 45665, "epoch": 1087} {"train_loss": -5.653278350830078, "global_step": 45666, "epoch": 1087} {"train_loss": -5.73095703125, "global_step": 45667, "epoch": 1087} {"train_loss": -5.708042144775391, "global_step": 45668, "epoch": 1087} {"train_loss": -5.675773620605469, "global_step": 45669, "epoch": 1087} {"train_loss": -5.695816993713379, "global_step": 45670, "epoch": 1087} {"train_loss": -5.603448867797852, "global_step": 45671, "epoch": 1087} {"train_loss": -5.82231330871582, "global_step": 45672, "epoch": 1087} {"train_loss": -5.770522117614746, "global_step": 45673, "epoch": 1087} {"train_loss": -5.712621688842773, "global_step": 45674, "epoch": 1087} {"train_loss": -5.74822998046875, "global_step": 45675, "epoch": 1087} {"train_loss": -5.692530155181885, "global_step": 45676, "epoch": 1087} {"train_loss": -5.600247383117676, "global_step": 45677, "epoch": 1087} {"train_loss": -5.734828472137451, "global_step": 45678, "epoch": 1087} {"train_loss": -5.6295294761657715, "global_step": 45679, "epoch": 1087} {"train_loss": -5.683022499084473, "global_step": 45680, "epoch": 1087} {"train_loss": -5.733518123626709, "global_step": 45681, "epoch": 1087} {"train_loss": -5.7521281242370605, "global_step": 45682, "epoch": 1087} {"train_loss": -5.713520050048828, "global_step": 45683, "epoch": 1087} {"train_loss": -5.6780195236206055, "global_step": 45684, "epoch": 1087} {"train_loss": -5.732415676116943, "global_step": 45685, "epoch": 1087} {"train_loss": -5.701495170593262, "global_step": 45686, "epoch": 1087} {"train_loss": -5.657412528991699, "global_step": 45687, "epoch": 1087} {"train_loss": -5.770786762237549, "global_step": 45688, "epoch": 1087} {"train_loss": -5.708547592163086, "global_step": 45689, "epoch": 1087} {"train_loss": -5.721845626831055, "global_step": 45690, "epoch": 1087} {"train_loss": -5.643361568450928, "global_step": 45691, "epoch": 1087} {"train_loss": -5.703530311584473, "global_step": 45692, "epoch": 1087} {"train_loss": -5.570708274841309, "global_step": 45693, "epoch": 1087} {"train_loss": -5.747734069824219, "global_step": 45694, "epoch": 1087} {"train_loss": -5.698020639873686, "global_step": 45695, "epoch": 1087, "val_loss": 61540.0546875} {"train_loss": -5.71144962310791, "global_step": 45696, "epoch": 1088} {"train_loss": -5.677806854248047, "global_step": 45697, "epoch": 1088} {"train_loss": -5.731686592102051, "global_step": 45698, "epoch": 1088} {"train_loss": -5.803116798400879, "global_step": 45699, "epoch": 1088} {"train_loss": -5.76206111907959, "global_step": 45700, "epoch": 1088} {"train_loss": -5.662636756896973, "global_step": 45701, "epoch": 1088} {"train_loss": -5.833780288696289, "global_step": 45702, "epoch": 1088} {"train_loss": -5.601797103881836, "global_step": 45703, "epoch": 1088} {"train_loss": -5.708651542663574, "global_step": 45704, "epoch": 1088} {"train_loss": -5.8695573806762695, "global_step": 45705, "epoch": 1088} {"train_loss": -5.677803039550781, "global_step": 45706, "epoch": 1088} {"train_loss": -5.752063274383545, "global_step": 45707, "epoch": 1088} {"train_loss": -5.691486358642578, "global_step": 45708, "epoch": 1088} {"train_loss": -5.71567440032959, "global_step": 45709, "epoch": 1088} {"train_loss": -5.706294059753418, "global_step": 45710, "epoch": 1088} {"train_loss": -5.73226261138916, "global_step": 45711, "epoch": 1088} {"train_loss": -5.66510009765625, "global_step": 45712, "epoch": 1088} {"train_loss": -5.698708534240723, "global_step": 45713, "epoch": 1088} {"train_loss": -5.613967418670654, "global_step": 45714, "epoch": 1088} {"train_loss": -5.522077560424805, "global_step": 45715, "epoch": 1088} {"train_loss": -5.6812543869018555, "global_step": 45716, "epoch": 1088} {"train_loss": -5.6766276359558105, "global_step": 45717, "epoch": 1088} {"train_loss": -5.637876987457275, "global_step": 45718, "epoch": 1088} {"train_loss": -5.680428504943848, "global_step": 45719, "epoch": 1088} {"train_loss": -5.679411888122559, "global_step": 45720, "epoch": 1088} {"train_loss": -5.675042629241943, "global_step": 45721, "epoch": 1088} {"train_loss": -5.683780670166016, "global_step": 45722, "epoch": 1088} {"train_loss": -5.662356376647949, "global_step": 45723, "epoch": 1088} {"train_loss": -5.6059675216674805, "global_step": 45724, "epoch": 1088} {"train_loss": -5.681306838989258, "global_step": 45725, "epoch": 1088} {"train_loss": -5.719432830810547, "global_step": 45726, "epoch": 1088} {"train_loss": -5.711246490478516, "global_step": 45727, "epoch": 1088} {"train_loss": -5.6402153968811035, "global_step": 45728, "epoch": 1088} {"train_loss": -5.746744155883789, "global_step": 45729, "epoch": 1088} {"train_loss": -5.663825988769531, "global_step": 45730, "epoch": 1088} {"train_loss": -5.625677108764648, "global_step": 45731, "epoch": 1088} {"train_loss": -5.858124732971191, "global_step": 45732, "epoch": 1088} {"train_loss": -5.435077667236328, "global_step": 45733, "epoch": 1088} {"train_loss": -5.6131134033203125, "global_step": 45734, "epoch": 1088} {"train_loss": -5.636131286621094, "global_step": 45735, "epoch": 1088} {"train_loss": -5.715484142303467, "global_step": 45736, "epoch": 1088} {"train_loss": -5.686764944167364, "global_step": 45737, "epoch": 1088, "val_loss": 61853.66015625} {"train_loss": -5.622469902038574, "global_step": 45738, "epoch": 1089} {"train_loss": -5.665466785430908, "global_step": 45739, "epoch": 1089} {"train_loss": -5.8049139976501465, "global_step": 45740, "epoch": 1089} {"train_loss": -5.669003486633301, "global_step": 45741, "epoch": 1089} {"train_loss": -5.776688575744629, "global_step": 45742, "epoch": 1089} {"train_loss": -5.748525142669678, "global_step": 45743, "epoch": 1089} {"train_loss": -5.734039306640625, "global_step": 45744, "epoch": 1089} {"train_loss": -5.7232818603515625, "global_step": 45745, "epoch": 1089} {"train_loss": -5.744986057281494, "global_step": 45746, "epoch": 1089} {"train_loss": -5.74038028717041, "global_step": 45747, "epoch": 1089} {"train_loss": -5.650548458099365, "global_step": 45748, "epoch": 1089} {"train_loss": -5.794253349304199, "global_step": 45749, "epoch": 1089} {"train_loss": -5.7322587966918945, "global_step": 45750, "epoch": 1089} {"train_loss": -5.821853160858154, "global_step": 45751, "epoch": 1089} {"train_loss": -5.736303329467773, "global_step": 45752, "epoch": 1089} {"train_loss": -5.697915077209473, "global_step": 45753, "epoch": 1089} {"train_loss": -5.670345306396484, "global_step": 45754, "epoch": 1089} {"train_loss": -5.658624649047852, "global_step": 45755, "epoch": 1089} {"train_loss": -5.769534111022949, "global_step": 45756, "epoch": 1089} {"train_loss": -5.739809989929199, "global_step": 45757, "epoch": 1089} {"train_loss": -5.68642520904541, "global_step": 45758, "epoch": 1089} {"train_loss": -5.775937080383301, "global_step": 45759, "epoch": 1089} {"train_loss": -5.653395652770996, "global_step": 45760, "epoch": 1089} {"train_loss": -5.783127784729004, "global_step": 45761, "epoch": 1089} {"train_loss": -5.778386116027832, "global_step": 45762, "epoch": 1089} {"train_loss": -5.733950614929199, "global_step": 45763, "epoch": 1089} {"train_loss": -5.792336463928223, "global_step": 45764, "epoch": 1089} {"train_loss": -5.80281925201416, "global_step": 45765, "epoch": 1089} {"train_loss": -5.6899800300598145, "global_step": 45766, "epoch": 1089} {"train_loss": -5.685535430908203, "global_step": 45767, "epoch": 1089} {"train_loss": -5.729693412780762, "global_step": 45768, "epoch": 1089} {"train_loss": -5.660551071166992, "global_step": 45769, "epoch": 1089} {"train_loss": -5.661952972412109, "global_step": 45770, "epoch": 1089} {"train_loss": -5.681989669799805, "global_step": 45771, "epoch": 1089} {"train_loss": -5.658597469329834, "global_step": 45772, "epoch": 1089} {"train_loss": -5.625673294067383, "global_step": 45773, "epoch": 1089} {"train_loss": -5.755433559417725, "global_step": 45774, "epoch": 1089} {"train_loss": -5.849152565002441, "global_step": 45775, "epoch": 1089} {"train_loss": -5.728053092956543, "global_step": 45776, "epoch": 1089} {"train_loss": -5.713325500488281, "global_step": 45777, "epoch": 1089} {"train_loss": -5.787358283996582, "global_step": 45778, "epoch": 1089} {"train_loss": -5.723569949467977, "global_step": 45779, "epoch": 1089, "val_loss": 61408.46875} {"train_loss": -5.716938495635986, "global_step": 45780, "epoch": 1090} {"train_loss": -5.778070449829102, "global_step": 45781, "epoch": 1090} {"train_loss": -5.792065620422363, "global_step": 45782, "epoch": 1090} {"train_loss": -5.591658592224121, "global_step": 45783, "epoch": 1090} {"train_loss": -5.682191371917725, "global_step": 45784, "epoch": 1090} {"train_loss": -5.773080825805664, "global_step": 45785, "epoch": 1090} {"train_loss": -5.792685031890869, "global_step": 45786, "epoch": 1090} {"train_loss": -5.754847049713135, "global_step": 45787, "epoch": 1090} {"train_loss": -5.774064064025879, "global_step": 45788, "epoch": 1090} {"train_loss": -5.728341579437256, "global_step": 45789, "epoch": 1090} {"train_loss": -5.7517852783203125, "global_step": 45790, "epoch": 1090} {"train_loss": -5.6599955558776855, "global_step": 45791, "epoch": 1090} {"train_loss": -5.850918292999268, "global_step": 45792, "epoch": 1090} {"train_loss": -5.863846778869629, "global_step": 45793, "epoch": 1090} {"train_loss": -5.912840843200684, "global_step": 45794, "epoch": 1090} {"train_loss": -5.743948459625244, "global_step": 45795, "epoch": 1090} {"train_loss": -5.703128814697266, "global_step": 45796, "epoch": 1090} {"train_loss": -5.7709550857543945, "global_step": 45797, "epoch": 1090} {"train_loss": -5.742712497711182, "global_step": 45798, "epoch": 1090} {"train_loss": -5.7816925048828125, "global_step": 45799, "epoch": 1090} {"train_loss": -5.6252570152282715, "global_step": 45800, "epoch": 1090} {"train_loss": -5.716792106628418, "global_step": 45801, "epoch": 1090} {"train_loss": -5.724118232727051, "global_step": 45802, "epoch": 1090} {"train_loss": -5.6694512367248535, "global_step": 45803, "epoch": 1090} {"train_loss": -5.575159072875977, "global_step": 45804, "epoch": 1090} {"train_loss": -5.8558831214904785, "global_step": 45805, "epoch": 1090} {"train_loss": -5.755171775817871, "global_step": 45806, "epoch": 1090} {"train_loss": -5.6449432373046875, "global_step": 45807, "epoch": 1090} {"train_loss": -5.687222957611084, "global_step": 45808, "epoch": 1090} {"train_loss": -5.749891757965088, "global_step": 45809, "epoch": 1090} {"train_loss": -5.685690402984619, "global_step": 45810, "epoch": 1090} {"train_loss": -5.610416889190674, "global_step": 45811, "epoch": 1090} {"train_loss": -5.59404993057251, "global_step": 45812, "epoch": 1090} {"train_loss": -5.699133396148682, "global_step": 45813, "epoch": 1090} {"train_loss": -5.772052764892578, "global_step": 45814, "epoch": 1090} {"train_loss": -5.723891735076904, "global_step": 45815, "epoch": 1090} {"train_loss": -5.766107559204102, "global_step": 45816, "epoch": 1090} {"train_loss": -5.641794681549072, "global_step": 45817, "epoch": 1090} {"train_loss": -5.73411750793457, "global_step": 45818, "epoch": 1090} {"train_loss": -5.738073348999023, "global_step": 45819, "epoch": 1090} {"train_loss": -5.629727363586426, "global_step": 45820, "epoch": 1090} {"train_loss": -5.728450922738938, "global_step": 45821, "epoch": 1090, "val_loss": 61762.8125} {"train_loss": -5.820509910583496, "global_step": 45822, "epoch": 1091} {"train_loss": -5.676764488220215, "global_step": 45823, "epoch": 1091} {"train_loss": -5.7612457275390625, "global_step": 45824, "epoch": 1091} {"train_loss": -5.809884548187256, "global_step": 45825, "epoch": 1091} {"train_loss": -5.760778427124023, "global_step": 45826, "epoch": 1091} {"train_loss": -5.65401029586792, "global_step": 45827, "epoch": 1091} {"train_loss": -5.565494060516357, "global_step": 45828, "epoch": 1091} {"train_loss": -5.651917457580566, "global_step": 45829, "epoch": 1091} {"train_loss": -5.804450988769531, "global_step": 45830, "epoch": 1091} {"train_loss": -5.697853088378906, "global_step": 45831, "epoch": 1091} {"train_loss": -5.748040199279785, "global_step": 45832, "epoch": 1091} {"train_loss": -5.671080112457275, "global_step": 45833, "epoch": 1091} {"train_loss": -5.673199653625488, "global_step": 45834, "epoch": 1091} {"train_loss": -5.719185829162598, "global_step": 45835, "epoch": 1091} {"train_loss": -5.80301570892334, "global_step": 45836, "epoch": 1091} {"train_loss": -5.7390618324279785, "global_step": 45837, "epoch": 1091} {"train_loss": -5.818988800048828, "global_step": 45838, "epoch": 1091} {"train_loss": -5.698663234710693, "global_step": 45839, "epoch": 1091} {"train_loss": -5.68902063369751, "global_step": 45840, "epoch": 1091} {"train_loss": -5.711371421813965, "global_step": 45841, "epoch": 1091} {"train_loss": -5.6760053634643555, "global_step": 45842, "epoch": 1091} {"train_loss": -5.702278137207031, "global_step": 45843, "epoch": 1091} {"train_loss": -5.739871501922607, "global_step": 45844, "epoch": 1091} {"train_loss": -5.751399040222168, "global_step": 45845, "epoch": 1091} {"train_loss": -5.854770660400391, "global_step": 45846, "epoch": 1091} {"train_loss": -5.564568042755127, "global_step": 45847, "epoch": 1091} {"train_loss": -5.768438816070557, "global_step": 45848, "epoch": 1091} {"train_loss": -5.815502643585205, "global_step": 45849, "epoch": 1091} {"train_loss": -5.553308486938477, "global_step": 45850, "epoch": 1091} {"train_loss": -5.750696182250977, "global_step": 45851, "epoch": 1091} {"train_loss": -5.62528657913208, "global_step": 45852, "epoch": 1091} {"train_loss": -5.686027526855469, "global_step": 45853, "epoch": 1091} {"train_loss": -5.746725082397461, "global_step": 45854, "epoch": 1091} {"train_loss": -5.647217750549316, "global_step": 45855, "epoch": 1091} {"train_loss": -5.708197116851807, "global_step": 45856, "epoch": 1091} {"train_loss": -5.810197830200195, "global_step": 45857, "epoch": 1091} {"train_loss": -5.67237663269043, "global_step": 45858, "epoch": 1091} {"train_loss": -5.696274757385254, "global_step": 45859, "epoch": 1091} {"train_loss": -5.760181903839111, "global_step": 45860, "epoch": 1091} {"train_loss": -5.737791061401367, "global_step": 45861, "epoch": 1091} {"train_loss": -5.816538333892822, "global_step": 45862, "epoch": 1091} {"train_loss": -5.7236961750757125, "global_step": 45863, "epoch": 1091, "val_loss": 61727.1796875} {"train_loss": -5.70102596282959, "global_step": 45864, "epoch": 1092} {"train_loss": -5.693643093109131, "global_step": 45865, "epoch": 1092} {"train_loss": -5.751409530639648, "global_step": 45866, "epoch": 1092} {"train_loss": -5.663022041320801, "global_step": 45867, "epoch": 1092} {"train_loss": -5.6820454597473145, "global_step": 45868, "epoch": 1092} {"train_loss": -5.683911323547363, "global_step": 45869, "epoch": 1092} {"train_loss": -5.7461957931518555, "global_step": 45870, "epoch": 1092} {"train_loss": -5.721706390380859, "global_step": 45871, "epoch": 1092} {"train_loss": -5.787596225738525, "global_step": 45872, "epoch": 1092} {"train_loss": -5.735734939575195, "global_step": 45873, "epoch": 1092} {"train_loss": -5.835832595825195, "global_step": 45874, "epoch": 1092} {"train_loss": -5.828838348388672, "global_step": 45875, "epoch": 1092} {"train_loss": -5.726685047149658, "global_step": 45876, "epoch": 1092} {"train_loss": -5.728908538818359, "global_step": 45877, "epoch": 1092} {"train_loss": -5.735846996307373, "global_step": 45878, "epoch": 1092} {"train_loss": -5.699432849884033, "global_step": 45879, "epoch": 1092} {"train_loss": -5.704253196716309, "global_step": 45880, "epoch": 1092} {"train_loss": -5.744422912597656, "global_step": 45881, "epoch": 1092} {"train_loss": -5.657962799072266, "global_step": 45882, "epoch": 1092} {"train_loss": -5.714842319488525, "global_step": 45883, "epoch": 1092} {"train_loss": -5.719429016113281, "global_step": 45884, "epoch": 1092} {"train_loss": -5.76322078704834, "global_step": 45885, "epoch": 1092} {"train_loss": -5.791531085968018, "global_step": 45886, "epoch": 1092} {"train_loss": -5.633759021759033, "global_step": 45887, "epoch": 1092} {"train_loss": -5.756855010986328, "global_step": 45888, "epoch": 1092} {"train_loss": -5.788747787475586, "global_step": 45889, "epoch": 1092} {"train_loss": -5.69841194152832, "global_step": 45890, "epoch": 1092} {"train_loss": -5.753067493438721, "global_step": 45891, "epoch": 1092} {"train_loss": -5.809979438781738, "global_step": 45892, "epoch": 1092} {"train_loss": -5.790991306304932, "global_step": 45893, "epoch": 1092} {"train_loss": -5.71503210067749, "global_step": 45894, "epoch": 1092} {"train_loss": -5.787369251251221, "global_step": 45895, "epoch": 1092} {"train_loss": -5.712764739990234, "global_step": 45896, "epoch": 1092} {"train_loss": -5.707372188568115, "global_step": 45897, "epoch": 1092} {"train_loss": -5.620877265930176, "global_step": 45898, "epoch": 1092} {"train_loss": -5.727933883666992, "global_step": 45899, "epoch": 1092} {"train_loss": -5.800830841064453, "global_step": 45900, "epoch": 1092} {"train_loss": -5.743678092956543, "global_step": 45901, "epoch": 1092} {"train_loss": -5.7246294021606445, "global_step": 45902, "epoch": 1092} {"train_loss": -5.74294376373291, "global_step": 45903, "epoch": 1092} {"train_loss": -5.699628829956055, "global_step": 45904, "epoch": 1092} {"train_loss": -5.728253194264004, "global_step": 45905, "epoch": 1092, "val_loss": 61715.87109375} {"train_loss": -5.743847846984863, "global_step": 45906, "epoch": 1093} {"train_loss": -5.60517692565918, "global_step": 45907, "epoch": 1093} {"train_loss": -5.696202278137207, "global_step": 45908, "epoch": 1093} {"train_loss": -5.750186920166016, "global_step": 45909, "epoch": 1093} {"train_loss": -5.701750755310059, "global_step": 45910, "epoch": 1093} {"train_loss": -5.740437984466553, "global_step": 45911, "epoch": 1093} {"train_loss": -5.7401909828186035, "global_step": 45912, "epoch": 1093} {"train_loss": -5.5802202224731445, "global_step": 45913, "epoch": 1093} {"train_loss": -5.629356861114502, "global_step": 45914, "epoch": 1093} {"train_loss": -5.6169514656066895, "global_step": 45915, "epoch": 1093} {"train_loss": -5.603055953979492, "global_step": 45916, "epoch": 1093} {"train_loss": -5.726936340332031, "global_step": 45917, "epoch": 1093} {"train_loss": -5.639666557312012, "global_step": 45918, "epoch": 1093} {"train_loss": -5.84739875793457, "global_step": 45919, "epoch": 1093} {"train_loss": -5.712744235992432, "global_step": 45920, "epoch": 1093} {"train_loss": -5.651595115661621, "global_step": 45921, "epoch": 1093} {"train_loss": -5.680083274841309, "global_step": 45922, "epoch": 1093} {"train_loss": -5.681730270385742, "global_step": 45923, "epoch": 1093} {"train_loss": -5.659055709838867, "global_step": 45924, "epoch": 1093} {"train_loss": -5.651046276092529, "global_step": 45925, "epoch": 1093} {"train_loss": -5.653940200805664, "global_step": 45926, "epoch": 1093} {"train_loss": -5.5637006759643555, "global_step": 45927, "epoch": 1093} {"train_loss": -5.70521354675293, "global_step": 45928, "epoch": 1093} {"train_loss": -5.746575832366943, "global_step": 45929, "epoch": 1093} {"train_loss": -5.75974178314209, "global_step": 45930, "epoch": 1093} {"train_loss": -5.596945762634277, "global_step": 45931, "epoch": 1093} {"train_loss": -5.772219181060791, "global_step": 45932, "epoch": 1093} {"train_loss": -5.84907341003418, "global_step": 45933, "epoch": 1093} {"train_loss": -5.5170674324035645, "global_step": 45934, "epoch": 1093} {"train_loss": -5.658078193664551, "global_step": 45935, "epoch": 1093} {"train_loss": -5.657522201538086, "global_step": 45936, "epoch": 1093} {"train_loss": -5.697230339050293, "global_step": 45937, "epoch": 1093} {"train_loss": -5.784056186676025, "global_step": 45938, "epoch": 1093} {"train_loss": -5.674485206604004, "global_step": 45939, "epoch": 1093} {"train_loss": -5.703847885131836, "global_step": 45940, "epoch": 1093} {"train_loss": -5.69167423248291, "global_step": 45941, "epoch": 1093} {"train_loss": -5.65203857421875, "global_step": 45942, "epoch": 1093} {"train_loss": -5.584917068481445, "global_step": 45943, "epoch": 1093} {"train_loss": -5.799472332000732, "global_step": 45944, "epoch": 1093} {"train_loss": -5.598515033721924, "global_step": 45945, "epoch": 1093} {"train_loss": -5.658681392669678, "global_step": 45946, "epoch": 1093} {"train_loss": -5.6841239134470625, "global_step": 45947, "epoch": 1093, "val_loss": 61610.5} {"train_loss": -5.7593584060668945, "global_step": 45948, "epoch": 1094} {"train_loss": -5.755380630493164, "global_step": 45949, "epoch": 1094} {"train_loss": -5.7068328857421875, "global_step": 45950, "epoch": 1094} {"train_loss": -5.717267990112305, "global_step": 45951, "epoch": 1094} {"train_loss": -5.697988986968994, "global_step": 45952, "epoch": 1094} {"train_loss": -5.560524940490723, "global_step": 45953, "epoch": 1094} {"train_loss": -5.595145225524902, "global_step": 45954, "epoch": 1094} {"train_loss": -5.608627796173096, "global_step": 45955, "epoch": 1094} {"train_loss": -5.745752811431885, "global_step": 45956, "epoch": 1094} {"train_loss": -5.766488075256348, "global_step": 45957, "epoch": 1094} {"train_loss": -5.632855415344238, "global_step": 45958, "epoch": 1094} {"train_loss": -5.731484413146973, "global_step": 45959, "epoch": 1094} {"train_loss": -5.736996650695801, "global_step": 45960, "epoch": 1094} {"train_loss": -5.71799898147583, "global_step": 45961, "epoch": 1094} {"train_loss": -5.697425842285156, "global_step": 45962, "epoch": 1094} {"train_loss": -5.747258186340332, "global_step": 45963, "epoch": 1094} {"train_loss": -5.676269054412842, "global_step": 45964, "epoch": 1094} {"train_loss": -5.75933837890625, "global_step": 45965, "epoch": 1094} {"train_loss": -5.797492027282715, "global_step": 45966, "epoch": 1094} {"train_loss": -5.664526462554932, "global_step": 45967, "epoch": 1094} {"train_loss": -5.646547794342041, "global_step": 45968, "epoch": 1094} {"train_loss": -5.684287071228027, "global_step": 45969, "epoch": 1094} {"train_loss": -5.664290904998779, "global_step": 45970, "epoch": 1094} {"train_loss": -5.8145341873168945, "global_step": 45971, "epoch": 1094} {"train_loss": -5.671913146972656, "global_step": 45972, "epoch": 1094} {"train_loss": -5.8318095207214355, "global_step": 45973, "epoch": 1094} {"train_loss": -5.724437713623047, "global_step": 45974, "epoch": 1094} {"train_loss": -5.634227752685547, "global_step": 45975, "epoch": 1094} {"train_loss": -5.736322402954102, "global_step": 45976, "epoch": 1094} {"train_loss": -5.716019630432129, "global_step": 45977, "epoch": 1094} {"train_loss": -5.66853141784668, "global_step": 45978, "epoch": 1094} {"train_loss": -5.704529285430908, "global_step": 45979, "epoch": 1094} {"train_loss": -5.630617141723633, "global_step": 45980, "epoch": 1094} {"train_loss": -5.712135314941406, "global_step": 45981, "epoch": 1094} {"train_loss": -5.690684795379639, "global_step": 45982, "epoch": 1094} {"train_loss": -5.643523693084717, "global_step": 45983, "epoch": 1094} {"train_loss": -5.754931449890137, "global_step": 45984, "epoch": 1094} {"train_loss": -5.772226333618164, "global_step": 45985, "epoch": 1094} {"train_loss": -5.661055564880371, "global_step": 45986, "epoch": 1094} {"train_loss": -5.597710609436035, "global_step": 45987, "epoch": 1094} {"train_loss": -5.721249580383301, "global_step": 45988, "epoch": 1094} {"train_loss": -5.698878015790667, "global_step": 45989, "epoch": 1094, "val_loss": 61873.16015625} {"train_loss": -5.718275547027588, "global_step": 45990, "epoch": 1095} {"train_loss": -5.7696967124938965, "global_step": 45991, "epoch": 1095} {"train_loss": -5.655024528503418, "global_step": 45992, "epoch": 1095} {"train_loss": -5.645143508911133, "global_step": 45993, "epoch": 1095} {"train_loss": -5.813875198364258, "global_step": 45994, "epoch": 1095} {"train_loss": -5.796450138092041, "global_step": 45995, "epoch": 1095} {"train_loss": -5.7651753425598145, "global_step": 45996, "epoch": 1095} {"train_loss": -5.7111358642578125, "global_step": 45997, "epoch": 1095} {"train_loss": -5.719264984130859, "global_step": 45998, "epoch": 1095} {"train_loss": -5.8488359451293945, "global_step": 45999, "epoch": 1095} {"train_loss": -5.784919738769531, "global_step": 46000, "epoch": 1095} {"train_loss": -5.718672752380371, "global_step": 46001, "epoch": 1095} {"train_loss": -5.644911766052246, "global_step": 46002, "epoch": 1095} {"train_loss": -5.746551513671875, "global_step": 46003, "epoch": 1095} {"train_loss": -5.663529872894287, "global_step": 46004, "epoch": 1095} {"train_loss": -5.6203742027282715, "global_step": 46005, "epoch": 1095} {"train_loss": -5.737942695617676, "global_step": 46006, "epoch": 1095} {"train_loss": -5.7984619140625, "global_step": 46007, "epoch": 1095} {"train_loss": -5.757444381713867, "global_step": 46008, "epoch": 1095} {"train_loss": -5.677766799926758, "global_step": 46009, "epoch": 1095} {"train_loss": -5.7379045486450195, "global_step": 46010, "epoch": 1095} {"train_loss": -5.752349853515625, "global_step": 46011, "epoch": 1095} {"train_loss": -5.742193698883057, "global_step": 46012, "epoch": 1095} {"train_loss": -5.621097564697266, "global_step": 46013, "epoch": 1095} {"train_loss": -5.703841686248779, "global_step": 46014, "epoch": 1095} {"train_loss": -5.708357810974121, "global_step": 46015, "epoch": 1095} {"train_loss": -5.779423713684082, "global_step": 46016, "epoch": 1095} {"train_loss": -5.680071830749512, "global_step": 46017, "epoch": 1095} {"train_loss": -5.665076732635498, "global_step": 46018, "epoch": 1095} {"train_loss": -5.725660800933838, "global_step": 46019, "epoch": 1095} {"train_loss": -5.825063228607178, "global_step": 46020, "epoch": 1095} {"train_loss": -5.820594787597656, "global_step": 46021, "epoch": 1095} {"train_loss": -5.724116325378418, "global_step": 46022, "epoch": 1095} {"train_loss": -5.80441951751709, "global_step": 46023, "epoch": 1095} {"train_loss": -5.790380001068115, "global_step": 46024, "epoch": 1095} {"train_loss": -5.676321029663086, "global_step": 46025, "epoch": 1095} {"train_loss": -5.699282646179199, "global_step": 46026, "epoch": 1095} {"train_loss": -5.679901123046875, "global_step": 46027, "epoch": 1095} {"train_loss": -5.552696228027344, "global_step": 46028, "epoch": 1095} {"train_loss": -5.7671427726745605, "global_step": 46029, "epoch": 1095} {"train_loss": -5.637969493865967, "global_step": 46030, "epoch": 1095} {"train_loss": -5.72181274777367, "global_step": 46031, "epoch": 1095, "val_loss": 61380.56640625} {"train_loss": -5.875756740570068, "global_step": 46032, "epoch": 1096} {"train_loss": -5.580377578735352, "global_step": 46033, "epoch": 1096} {"train_loss": -5.666923522949219, "global_step": 46034, "epoch": 1096} {"train_loss": -5.747902870178223, "global_step": 46035, "epoch": 1096} {"train_loss": -5.671339988708496, "global_step": 46036, "epoch": 1096} {"train_loss": -5.605698108673096, "global_step": 46037, "epoch": 1096} {"train_loss": -5.745266914367676, "global_step": 46038, "epoch": 1096} {"train_loss": -5.658693313598633, "global_step": 46039, "epoch": 1096} {"train_loss": -5.846711158752441, "global_step": 46040, "epoch": 1096} {"train_loss": -5.818785667419434, "global_step": 46041, "epoch": 1096} {"train_loss": -5.65863037109375, "global_step": 46042, "epoch": 1096} {"train_loss": -5.687406539916992, "global_step": 46043, "epoch": 1096} {"train_loss": -5.712359428405762, "global_step": 46044, "epoch": 1096} {"train_loss": -5.755031585693359, "global_step": 46045, "epoch": 1096} {"train_loss": -5.805825710296631, "global_step": 46046, "epoch": 1096} {"train_loss": -5.728950500488281, "global_step": 46047, "epoch": 1096} {"train_loss": -5.711503028869629, "global_step": 46048, "epoch": 1096} {"train_loss": -5.734090805053711, "global_step": 46049, "epoch": 1096} {"train_loss": -5.703895568847656, "global_step": 46050, "epoch": 1096} {"train_loss": -5.691789150238037, "global_step": 46051, "epoch": 1096} {"train_loss": -5.551643371582031, "global_step": 46052, "epoch": 1096} {"train_loss": -5.695647239685059, "global_step": 46053, "epoch": 1096} {"train_loss": -5.695162773132324, "global_step": 46054, "epoch": 1096} {"train_loss": -5.602658271789551, "global_step": 46055, "epoch": 1096} {"train_loss": -5.717990875244141, "global_step": 46056, "epoch": 1096} {"train_loss": -5.719941139221191, "global_step": 46057, "epoch": 1096} {"train_loss": -5.6888837814331055, "global_step": 46058, "epoch": 1096} {"train_loss": -5.818482398986816, "global_step": 46059, "epoch": 1096} {"train_loss": -5.635679721832275, "global_step": 46060, "epoch": 1096} {"train_loss": -5.674050331115723, "global_step": 46061, "epoch": 1096} {"train_loss": -5.736233711242676, "global_step": 46062, "epoch": 1096} {"train_loss": -5.748002052307129, "global_step": 46063, "epoch": 1096} {"train_loss": -5.683048725128174, "global_step": 46064, "epoch": 1096} {"train_loss": -5.801506042480469, "global_step": 46065, "epoch": 1096} {"train_loss": -5.816897392272949, "global_step": 46066, "epoch": 1096} {"train_loss": -5.771131992340088, "global_step": 46067, "epoch": 1096} {"train_loss": -5.752657890319824, "global_step": 46068, "epoch": 1096} {"train_loss": -5.864472389221191, "global_step": 46069, "epoch": 1096} {"train_loss": -5.780004501342773, "global_step": 46070, "epoch": 1096} {"train_loss": -5.742051601409912, "global_step": 46071, "epoch": 1096} {"train_loss": -5.686556816101074, "global_step": 46072, "epoch": 1096} {"train_loss": -5.721768004553659, "global_step": 46073, "epoch": 1096, "val_loss": 61603.5390625} {"train_loss": -5.692685127258301, "global_step": 46074, "epoch": 1097} {"train_loss": -5.788015365600586, "global_step": 46075, "epoch": 1097} {"train_loss": -5.6207475662231445, "global_step": 46076, "epoch": 1097} {"train_loss": -5.728433609008789, "global_step": 46077, "epoch": 1097} {"train_loss": -5.583100318908691, "global_step": 46078, "epoch": 1097} {"train_loss": -5.770684242248535, "global_step": 46079, "epoch": 1097} {"train_loss": -5.638094902038574, "global_step": 46080, "epoch": 1097} {"train_loss": -5.675940990447998, "global_step": 46081, "epoch": 1097} {"train_loss": -5.735623359680176, "global_step": 46082, "epoch": 1097} {"train_loss": -5.70648193359375, "global_step": 46083, "epoch": 1097} {"train_loss": -5.859338760375977, "global_step": 46084, "epoch": 1097} {"train_loss": -5.6891279220581055, "global_step": 46085, "epoch": 1097} {"train_loss": -5.761857032775879, "global_step": 46086, "epoch": 1097} {"train_loss": -5.7649054527282715, "global_step": 46087, "epoch": 1097} {"train_loss": -5.752617835998535, "global_step": 46088, "epoch": 1097} {"train_loss": -5.701656818389893, "global_step": 46089, "epoch": 1097} {"train_loss": -5.862635612487793, "global_step": 46090, "epoch": 1097} {"train_loss": -5.623697757720947, "global_step": 46091, "epoch": 1097} {"train_loss": -5.814835071563721, "global_step": 46092, "epoch": 1097} {"train_loss": -5.649851322174072, "global_step": 46093, "epoch": 1097} {"train_loss": -5.688024520874023, "global_step": 46094, "epoch": 1097} {"train_loss": -5.838286399841309, "global_step": 46095, "epoch": 1097} {"train_loss": -5.808167457580566, "global_step": 46096, "epoch": 1097} {"train_loss": -5.772486686706543, "global_step": 46097, "epoch": 1097} {"train_loss": -5.681791305541992, "global_step": 46098, "epoch": 1097} {"train_loss": -5.617861747741699, "global_step": 46099, "epoch": 1097} {"train_loss": -5.720564842224121, "global_step": 46100, "epoch": 1097} {"train_loss": -5.63659143447876, "global_step": 46101, "epoch": 1097} {"train_loss": -5.710358142852783, "global_step": 46102, "epoch": 1097} {"train_loss": -5.731437683105469, "global_step": 46103, "epoch": 1097} {"train_loss": -5.6633710861206055, "global_step": 46104, "epoch": 1097} {"train_loss": -5.780309677124023, "global_step": 46105, "epoch": 1097} {"train_loss": -5.602853298187256, "global_step": 46106, "epoch": 1097} {"train_loss": -5.7207231521606445, "global_step": 46107, "epoch": 1097} {"train_loss": -5.7895121574401855, "global_step": 46108, "epoch": 1097} {"train_loss": -5.73051643371582, "global_step": 46109, "epoch": 1097} {"train_loss": -5.765964508056641, "global_step": 46110, "epoch": 1097} {"train_loss": -5.745409965515137, "global_step": 46111, "epoch": 1097} {"train_loss": -5.725870609283447, "global_step": 46112, "epoch": 1097} {"train_loss": -5.903824806213379, "global_step": 46113, "epoch": 1097} {"train_loss": -5.811434745788574, "global_step": 46114, "epoch": 1097} {"train_loss": -5.727674802144368, "global_step": 46115, "epoch": 1097, "val_loss": 61599.33984375} {"train_loss": -5.789196014404297, "global_step": 46116, "epoch": 1098} {"train_loss": -5.728043556213379, "global_step": 46117, "epoch": 1098} {"train_loss": -5.7734479904174805, "global_step": 46118, "epoch": 1098} {"train_loss": -5.757006645202637, "global_step": 46119, "epoch": 1098} {"train_loss": -5.747220039367676, "global_step": 46120, "epoch": 1098} {"train_loss": -5.7664666175842285, "global_step": 46121, "epoch": 1098} {"train_loss": -5.704764366149902, "global_step": 46122, "epoch": 1098} {"train_loss": -5.695241928100586, "global_step": 46123, "epoch": 1098} {"train_loss": -5.715228080749512, "global_step": 46124, "epoch": 1098} {"train_loss": -5.76262092590332, "global_step": 46125, "epoch": 1098} {"train_loss": -5.625905990600586, "global_step": 46126, "epoch": 1098} {"train_loss": -5.624507427215576, "global_step": 46127, "epoch": 1098} {"train_loss": -5.6935834884643555, "global_step": 46128, "epoch": 1098} {"train_loss": -5.606017589569092, "global_step": 46129, "epoch": 1098} {"train_loss": -5.731733322143555, "global_step": 46130, "epoch": 1098} {"train_loss": -5.702294826507568, "global_step": 46131, "epoch": 1098} {"train_loss": -5.663881301879883, "global_step": 46132, "epoch": 1098} {"train_loss": -5.67376184463501, "global_step": 46133, "epoch": 1098} {"train_loss": -5.799761772155762, "global_step": 46134, "epoch": 1098} {"train_loss": -5.668042182922363, "global_step": 46135, "epoch": 1098} {"train_loss": -5.786243438720703, "global_step": 46136, "epoch": 1098} {"train_loss": -5.83975887298584, "global_step": 46137, "epoch": 1098} {"train_loss": -5.603018283843994, "global_step": 46138, "epoch": 1098} {"train_loss": -5.783102989196777, "global_step": 46139, "epoch": 1098} {"train_loss": -5.630122184753418, "global_step": 46140, "epoch": 1098} {"train_loss": -5.740177631378174, "global_step": 46141, "epoch": 1098} {"train_loss": -5.705061912536621, "global_step": 46142, "epoch": 1098} {"train_loss": -5.642277240753174, "global_step": 46143, "epoch": 1098} {"train_loss": -5.736663818359375, "global_step": 46144, "epoch": 1098} {"train_loss": -5.700144290924072, "global_step": 46145, "epoch": 1098} {"train_loss": -5.817011833190918, "global_step": 46146, "epoch": 1098} {"train_loss": -5.803351402282715, "global_step": 46147, "epoch": 1098} {"train_loss": -5.664097785949707, "global_step": 46148, "epoch": 1098} {"train_loss": -5.779982566833496, "global_step": 46149, "epoch": 1098} {"train_loss": -5.800751209259033, "global_step": 46150, "epoch": 1098} {"train_loss": -5.776257038116455, "global_step": 46151, "epoch": 1098} {"train_loss": -5.754119873046875, "global_step": 46152, "epoch": 1098} {"train_loss": -5.882309913635254, "global_step": 46153, "epoch": 1098} {"train_loss": -5.650335311889648, "global_step": 46154, "epoch": 1098} {"train_loss": -5.75748872756958, "global_step": 46155, "epoch": 1098} {"train_loss": -5.661977767944336, "global_step": 46156, "epoch": 1098} {"train_loss": -5.726107835769653, "global_step": 46157, "epoch": 1098, "val_loss": 61373.0078125} {"train_loss": -5.817987442016602, "global_step": 46158, "epoch": 1099} {"train_loss": -5.705665588378906, "global_step": 46159, "epoch": 1099} {"train_loss": -5.7687530517578125, "global_step": 46160, "epoch": 1099} {"train_loss": -5.67094612121582, "global_step": 46161, "epoch": 1099} {"train_loss": -5.763021469116211, "global_step": 46162, "epoch": 1099} {"train_loss": -5.8297319412231445, "global_step": 46163, "epoch": 1099} {"train_loss": -5.588367938995361, "global_step": 46164, "epoch": 1099} {"train_loss": -5.804530143737793, "global_step": 46165, "epoch": 1099} {"train_loss": -5.660438060760498, "global_step": 46166, "epoch": 1099} {"train_loss": -5.670095443725586, "global_step": 46167, "epoch": 1099} {"train_loss": -5.859192371368408, "global_step": 46168, "epoch": 1099} {"train_loss": -5.630302429199219, "global_step": 46169, "epoch": 1099} {"train_loss": -5.8256378173828125, "global_step": 46170, "epoch": 1099} {"train_loss": -5.830483436584473, "global_step": 46171, "epoch": 1099} {"train_loss": -5.683873176574707, "global_step": 46172, "epoch": 1099} {"train_loss": -5.748621940612793, "global_step": 46173, "epoch": 1099} {"train_loss": -5.688202857971191, "global_step": 46174, "epoch": 1099} {"train_loss": -5.589980602264404, "global_step": 46175, "epoch": 1099} {"train_loss": -5.743884563446045, "global_step": 46176, "epoch": 1099} {"train_loss": -5.68570613861084, "global_step": 46177, "epoch": 1099} {"train_loss": -5.662618160247803, "global_step": 46178, "epoch": 1099} {"train_loss": -5.674647331237793, "global_step": 46179, "epoch": 1099} {"train_loss": -5.625491619110107, "global_step": 46180, "epoch": 1099} {"train_loss": -5.728699684143066, "global_step": 46181, "epoch": 1099} {"train_loss": -5.795222759246826, "global_step": 46182, "epoch": 1099} {"train_loss": -5.790683269500732, "global_step": 46183, "epoch": 1099} {"train_loss": -5.753754615783691, "global_step": 46184, "epoch": 1099} {"train_loss": -5.678692817687988, "global_step": 46185, "epoch": 1099} {"train_loss": -5.881193161010742, "global_step": 46186, "epoch": 1099} {"train_loss": -5.713265419006348, "global_step": 46187, "epoch": 1099} {"train_loss": -5.744691848754883, "global_step": 46188, "epoch": 1099} {"train_loss": -5.721582889556885, "global_step": 46189, "epoch": 1099} {"train_loss": -5.827254295349121, "global_step": 46190, "epoch": 1099} {"train_loss": -5.748678207397461, "global_step": 46191, "epoch": 1099} {"train_loss": -5.72972297668457, "global_step": 46192, "epoch": 1099} {"train_loss": -5.71678352355957, "global_step": 46193, "epoch": 1099} {"train_loss": -5.679884433746338, "global_step": 46194, "epoch": 1099} {"train_loss": -5.756092071533203, "global_step": 46195, "epoch": 1099} {"train_loss": -5.715184211730957, "global_step": 46196, "epoch": 1099} {"train_loss": -5.672981262207031, "global_step": 46197, "epoch": 1099} {"train_loss": -5.7938079833984375, "global_step": 46198, "epoch": 1099} {"train_loss": -5.72970716158549, "global_step": 46199, "epoch": 1099, "val_loss": 61453.6953125} {"train_loss": -5.665261268615723, "global_step": 46200, "epoch": 1100} {"train_loss": -5.638295650482178, "global_step": 46201, "epoch": 1100} {"train_loss": -5.77331018447876, "global_step": 46202, "epoch": 1100} {"train_loss": -5.675384998321533, "global_step": 46203, "epoch": 1100} {"train_loss": -5.671272277832031, "global_step": 46204, "epoch": 1100} {"train_loss": -5.861822128295898, "global_step": 46205, "epoch": 1100} {"train_loss": -5.725366592407227, "global_step": 46206, "epoch": 1100} {"train_loss": -5.635472774505615, "global_step": 46207, "epoch": 1100} {"train_loss": -5.808104515075684, "global_step": 46208, "epoch": 1100} {"train_loss": -5.8071417808532715, "global_step": 46209, "epoch": 1100} {"train_loss": -5.7032670974731445, "global_step": 46210, "epoch": 1100} {"train_loss": -5.75215482711792, "global_step": 46211, "epoch": 1100} {"train_loss": -5.7517313957214355, "global_step": 46212, "epoch": 1100} {"train_loss": -5.747251510620117, "global_step": 46213, "epoch": 1100} {"train_loss": -5.7601423263549805, "global_step": 46214, "epoch": 1100} {"train_loss": -5.925421714782715, "global_step": 46215, "epoch": 1100} {"train_loss": -5.763688087463379, "global_step": 46216, "epoch": 1100} {"train_loss": -5.714298248291016, "global_step": 46217, "epoch": 1100} {"train_loss": -5.7596435546875, "global_step": 46218, "epoch": 1100} {"train_loss": -5.824456214904785, "global_step": 46219, "epoch": 1100} {"train_loss": -5.737217903137207, "global_step": 46220, "epoch": 1100} {"train_loss": -5.777834892272949, "global_step": 46221, "epoch": 1100} {"train_loss": -5.783421516418457, "global_step": 46222, "epoch": 1100} {"train_loss": -5.799130439758301, "global_step": 46223, "epoch": 1100} {"train_loss": -5.700409889221191, "global_step": 46224, "epoch": 1100} {"train_loss": -5.698622226715088, "global_step": 46225, "epoch": 1100} {"train_loss": -5.7761945724487305, "global_step": 46226, "epoch": 1100} {"train_loss": -5.675780296325684, "global_step": 46227, "epoch": 1100} {"train_loss": -5.6965012550354, "global_step": 46228, "epoch": 1100} {"train_loss": -5.645365238189697, "global_step": 46229, "epoch": 1100} {"train_loss": -5.677356719970703, "global_step": 46230, "epoch": 1100} {"train_loss": -5.731820106506348, "global_step": 46231, "epoch": 1100} {"train_loss": -5.814538478851318, "global_step": 46232, "epoch": 1100} {"train_loss": -5.66383171081543, "global_step": 46233, "epoch": 1100} {"train_loss": -5.658108234405518, "global_step": 46234, "epoch": 1100} {"train_loss": -5.822559356689453, "global_step": 46235, "epoch": 1100} {"train_loss": -5.72081184387207, "global_step": 46236, "epoch": 1100} {"train_loss": -5.727831840515137, "global_step": 46237, "epoch": 1100} {"train_loss": -5.663652420043945, "global_step": 46238, "epoch": 1100} {"train_loss": -5.60706090927124, "global_step": 46239, "epoch": 1100} {"train_loss": -5.736302375793457, "global_step": 46240, "epoch": 1100} {"train_loss": -5.731536081859043, "global_step": 46241, "epoch": 1100, "train/sim_max_reward_0": 0.7916076407857718, "train/sim_max_reward_1": 0.5995225117813784, "train/sim_max_reward_2": 0.5064122643487172, "train/sim_max_reward_3": 0.5028295122399512, "train/sim_max_reward_4": 0.71292153038313, "train/sim_max_reward_5": 0.6217184543596751, "test/sim_max_reward_4300000": 0.7555780984353747, "test/sim_max_reward_4300001": 0.22277884581993168, "test/sim_max_reward_4300002": 0.6282248050257078, "test/sim_max_reward_4300003": 0.8938423641198402, "test/sim_max_reward_4300004": 0.0960768779544909, "test/sim_max_reward_4300005": 0.6501770791475289, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.37619222213165576, "test/sim_max_reward_4300008": 0.9015629594260433, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.2200116426423552, "test/sim_max_reward_4300011": 0.8546861262491207, "test/sim_max_reward_4300012": 0.44023411235147003, "test/sim_max_reward_4300013": 0.3700356456491952, "test/sim_max_reward_4300014": 0.8560425219949286, "test/sim_max_reward_4300015": 0.9284355923572055, "test/sim_max_reward_4300016": 0.3091920341308427, "test/sim_max_reward_4300017": 0.8038045730314771, "test/sim_max_reward_4300018": 0.4416958758796744, "test/sim_max_reward_4300019": 0.18617063127637912, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.4387147317671823, "test/sim_max_reward_4300022": 0.9553550667719601, "test/sim_max_reward_4300023": 0.3382449473907113, "test/sim_max_reward_4300024": 0.7177500042204092, "test/sim_max_reward_4300025": 0.9159012908606929, "test/sim_max_reward_4300026": 0.7258499932472702, "test/sim_max_reward_4300027": 0.9145783847103872, "test/sim_max_reward_4300028": 2.8629497851710087e-07, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.0, "test/sim_max_reward_4300032": 0.8182562419508859, "test/sim_max_reward_4300033": 0.65572701525455, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8888799734638565, "test/sim_max_reward_4300038": 0.3929490640213741, "test/sim_max_reward_4300039": 0.8069709881153928, "test/sim_max_reward_4300040": 0.8787072353692981, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.6738340022394153, "test/sim_max_reward_4300043": 0.17446424413015846, "test/sim_max_reward_4300044": 0.8728148581926808, "test/sim_max_reward_4300045": 0.4829214547193906, "test/sim_max_reward_4300046": 0.7546878347966263, "test/sim_max_reward_4300047": 0.6985691211543916, "test/sim_max_reward_4300048": 0.7933657831328038, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.6225019856497707, "test/mean_score": 0.5006495728998223, "val_loss": 61588.28125} {"train_loss": -5.816059112548828, "global_step": 46242, "epoch": 1101} {"train_loss": -5.684649467468262, "global_step": 46243, "epoch": 1101} {"train_loss": -5.649957180023193, "global_step": 46244, "epoch": 1101} {"train_loss": -5.74262809753418, "global_step": 46245, "epoch": 1101} {"train_loss": -5.56815242767334, "global_step": 46246, "epoch": 1101} {"train_loss": -5.637539863586426, "global_step": 46247, "epoch": 1101} {"train_loss": -5.781282424926758, "global_step": 46248, "epoch": 1101} {"train_loss": -5.748935222625732, "global_step": 46249, "epoch": 1101} {"train_loss": -5.721166133880615, "global_step": 46250, "epoch": 1101} {"train_loss": -5.680909156799316, "global_step": 46251, "epoch": 1101} {"train_loss": -5.733903408050537, "global_step": 46252, "epoch": 1101} {"train_loss": -5.700468063354492, "global_step": 46253, "epoch": 1101} {"train_loss": -5.785336017608643, "global_step": 46254, "epoch": 1101} {"train_loss": -5.610567092895508, "global_step": 46255, "epoch": 1101} {"train_loss": -5.7944016456604, "global_step": 46256, "epoch": 1101} {"train_loss": -5.763657569885254, "global_step": 46257, "epoch": 1101} {"train_loss": -5.732512474060059, "global_step": 46258, "epoch": 1101} {"train_loss": -5.6194000244140625, "global_step": 46259, "epoch": 1101} {"train_loss": -5.872160911560059, "global_step": 46260, "epoch": 1101} {"train_loss": -5.682662010192871, "global_step": 46261, "epoch": 1101} {"train_loss": -5.749159812927246, "global_step": 46262, "epoch": 1101} {"train_loss": -5.779684543609619, "global_step": 46263, "epoch": 1101} {"train_loss": -5.69523811340332, "global_step": 46264, "epoch": 1101} {"train_loss": -5.668330192565918, "global_step": 46265, "epoch": 1101} {"train_loss": -5.68300724029541, "global_step": 46266, "epoch": 1101} {"train_loss": -5.756709575653076, "global_step": 46267, "epoch": 1101} {"train_loss": -5.740960121154785, "global_step": 46268, "epoch": 1101} {"train_loss": -5.816644668579102, "global_step": 46269, "epoch": 1101} {"train_loss": -5.749656677246094, "global_step": 46270, "epoch": 1101} {"train_loss": -5.784576416015625, "global_step": 46271, "epoch": 1101} {"train_loss": -5.716509819030762, "global_step": 46272, "epoch": 1101} {"train_loss": -5.822800636291504, "global_step": 46273, "epoch": 1101} {"train_loss": -5.698421478271484, "global_step": 46274, "epoch": 1101} {"train_loss": -5.800305366516113, "global_step": 46275, "epoch": 1101} {"train_loss": -5.659677505493164, "global_step": 46276, "epoch": 1101} {"train_loss": -5.7727203369140625, "global_step": 46277, "epoch": 1101} {"train_loss": -5.6462788581848145, "global_step": 46278, "epoch": 1101} {"train_loss": -5.756696701049805, "global_step": 46279, "epoch": 1101} {"train_loss": -5.759769439697266, "global_step": 46280, "epoch": 1101} {"train_loss": -5.822978973388672, "global_step": 46281, "epoch": 1101} {"train_loss": -5.65080451965332, "global_step": 46282, "epoch": 1101} {"train_loss": -5.728999580655779, "global_step": 46283, "epoch": 1101, "val_loss": 61734.37109375} {"train_loss": -5.750469207763672, "global_step": 46284, "epoch": 1102} {"train_loss": -5.732036590576172, "global_step": 46285, "epoch": 1102} {"train_loss": -5.641788482666016, "global_step": 46286, "epoch": 1102} {"train_loss": -5.6881208419799805, "global_step": 46287, "epoch": 1102} {"train_loss": -5.682013988494873, "global_step": 46288, "epoch": 1102} {"train_loss": -5.6821794509887695, "global_step": 46289, "epoch": 1102} {"train_loss": -5.700345516204834, "global_step": 46290, "epoch": 1102} {"train_loss": -5.602690696716309, "global_step": 46291, "epoch": 1102} {"train_loss": -5.604471206665039, "global_step": 46292, "epoch": 1102} {"train_loss": -5.8371806144714355, "global_step": 46293, "epoch": 1102} {"train_loss": -5.813004493713379, "global_step": 46294, "epoch": 1102} {"train_loss": -5.521966934204102, "global_step": 46295, "epoch": 1102} {"train_loss": -5.807181358337402, "global_step": 46296, "epoch": 1102} {"train_loss": -5.633243560791016, "global_step": 46297, "epoch": 1102} {"train_loss": -5.5823869705200195, "global_step": 46298, "epoch": 1102} {"train_loss": -5.746024131774902, "global_step": 46299, "epoch": 1102} {"train_loss": -5.748239517211914, "global_step": 46300, "epoch": 1102} {"train_loss": -5.798532485961914, "global_step": 46301, "epoch": 1102} {"train_loss": -5.653615951538086, "global_step": 46302, "epoch": 1102} {"train_loss": -5.6839704513549805, "global_step": 46303, "epoch": 1102} {"train_loss": -5.738018035888672, "global_step": 46304, "epoch": 1102} {"train_loss": -5.713773250579834, "global_step": 46305, "epoch": 1102} {"train_loss": -5.772923469543457, "global_step": 46306, "epoch": 1102} {"train_loss": -5.752010822296143, "global_step": 46307, "epoch": 1102} {"train_loss": -5.6802568435668945, "global_step": 46308, "epoch": 1102} {"train_loss": -5.7733473777771, "global_step": 46309, "epoch": 1102} {"train_loss": -5.597192287445068, "global_step": 46310, "epoch": 1102} {"train_loss": -5.688579559326172, "global_step": 46311, "epoch": 1102} {"train_loss": -5.681666374206543, "global_step": 46312, "epoch": 1102} {"train_loss": -5.802222728729248, "global_step": 46313, "epoch": 1102} {"train_loss": -5.809207916259766, "global_step": 46314, "epoch": 1102} {"train_loss": -5.690540313720703, "global_step": 46315, "epoch": 1102} {"train_loss": -5.754999160766602, "global_step": 46316, "epoch": 1102} {"train_loss": -5.791184425354004, "global_step": 46317, "epoch": 1102} {"train_loss": -5.712982177734375, "global_step": 46318, "epoch": 1102} {"train_loss": -5.7809977531433105, "global_step": 46319, "epoch": 1102} {"train_loss": -5.6759033203125, "global_step": 46320, "epoch": 1102} {"train_loss": -5.764756202697754, "global_step": 46321, "epoch": 1102} {"train_loss": -5.819431304931641, "global_step": 46322, "epoch": 1102} {"train_loss": -5.773226737976074, "global_step": 46323, "epoch": 1102} {"train_loss": -5.74633264541626, "global_step": 46324, "epoch": 1102} {"train_loss": -5.716952142261324, "global_step": 46325, "epoch": 1102, "val_loss": 61449.23046875} {"train_loss": -5.731072902679443, "global_step": 46326, "epoch": 1103} {"train_loss": -5.714179515838623, "global_step": 46327, "epoch": 1103} {"train_loss": -5.704164505004883, "global_step": 46328, "epoch": 1103} {"train_loss": -5.656957626342773, "global_step": 46329, "epoch": 1103} {"train_loss": -5.814840316772461, "global_step": 46330, "epoch": 1103} {"train_loss": -5.693504333496094, "global_step": 46331, "epoch": 1103} {"train_loss": -5.769772052764893, "global_step": 46332, "epoch": 1103} {"train_loss": -5.784651756286621, "global_step": 46333, "epoch": 1103} {"train_loss": -5.772578716278076, "global_step": 46334, "epoch": 1103} {"train_loss": -5.706137180328369, "global_step": 46335, "epoch": 1103} {"train_loss": -5.709182262420654, "global_step": 46336, "epoch": 1103} {"train_loss": -5.836049556732178, "global_step": 46337, "epoch": 1103} {"train_loss": -5.612904071807861, "global_step": 46338, "epoch": 1103} {"train_loss": -5.838834762573242, "global_step": 46339, "epoch": 1103} {"train_loss": -5.820204734802246, "global_step": 46340, "epoch": 1103} {"train_loss": -5.628931999206543, "global_step": 46341, "epoch": 1103} {"train_loss": -5.77427339553833, "global_step": 46342, "epoch": 1103} {"train_loss": -5.722830295562744, "global_step": 46343, "epoch": 1103} {"train_loss": -5.685633659362793, "global_step": 46344, "epoch": 1103} {"train_loss": -5.630645275115967, "global_step": 46345, "epoch": 1103} {"train_loss": -5.694097518920898, "global_step": 46346, "epoch": 1103} {"train_loss": -5.73307466506958, "global_step": 46347, "epoch": 1103} {"train_loss": -5.603503227233887, "global_step": 46348, "epoch": 1103} {"train_loss": -5.645220756530762, "global_step": 46349, "epoch": 1103} {"train_loss": -5.825183868408203, "global_step": 46350, "epoch": 1103} {"train_loss": -5.673691749572754, "global_step": 46351, "epoch": 1103} {"train_loss": -5.800820350646973, "global_step": 46352, "epoch": 1103} {"train_loss": -5.761402130126953, "global_step": 46353, "epoch": 1103} {"train_loss": -5.70488166809082, "global_step": 46354, "epoch": 1103} {"train_loss": -5.798341751098633, "global_step": 46355, "epoch": 1103} {"train_loss": -5.648682594299316, "global_step": 46356, "epoch": 1103} {"train_loss": -5.703113555908203, "global_step": 46357, "epoch": 1103} {"train_loss": -5.698320388793945, "global_step": 46358, "epoch": 1103} {"train_loss": -5.6877946853637695, "global_step": 46359, "epoch": 1103} {"train_loss": -5.543682098388672, "global_step": 46360, "epoch": 1103} {"train_loss": -5.823100566864014, "global_step": 46361, "epoch": 1103} {"train_loss": -5.529784202575684, "global_step": 46362, "epoch": 1103} {"train_loss": -5.651435375213623, "global_step": 46363, "epoch": 1103} {"train_loss": -5.757711410522461, "global_step": 46364, "epoch": 1103} {"train_loss": -5.605683326721191, "global_step": 46365, "epoch": 1103} {"train_loss": -5.686634063720703, "global_step": 46366, "epoch": 1103} {"train_loss": -5.711282979874384, "global_step": 46367, "epoch": 1103, "val_loss": 62398.43359375} {"train_loss": -5.5581254959106445, "global_step": 46368, "epoch": 1104} {"train_loss": -5.542363166809082, "global_step": 46369, "epoch": 1104} {"train_loss": -5.689875602722168, "global_step": 46370, "epoch": 1104} {"train_loss": -5.665646076202393, "global_step": 46371, "epoch": 1104} {"train_loss": -5.701684951782227, "global_step": 46372, "epoch": 1104} {"train_loss": -5.650198459625244, "global_step": 46373, "epoch": 1104} {"train_loss": -5.8165178298950195, "global_step": 46374, "epoch": 1104} {"train_loss": -5.746586322784424, "global_step": 46375, "epoch": 1104} {"train_loss": -5.6334309577941895, "global_step": 46376, "epoch": 1104} {"train_loss": -5.707277297973633, "global_step": 46377, "epoch": 1104} {"train_loss": -5.667328834533691, "global_step": 46378, "epoch": 1104} {"train_loss": -5.6163129806518555, "global_step": 46379, "epoch": 1104} {"train_loss": -5.645819664001465, "global_step": 46380, "epoch": 1104} {"train_loss": -5.584072589874268, "global_step": 46381, "epoch": 1104} {"train_loss": -5.537590503692627, "global_step": 46382, "epoch": 1104} {"train_loss": -5.801265239715576, "global_step": 46383, "epoch": 1104} {"train_loss": -5.558100700378418, "global_step": 46384, "epoch": 1104} {"train_loss": -5.668824195861816, "global_step": 46385, "epoch": 1104} {"train_loss": -5.726795196533203, "global_step": 46386, "epoch": 1104} {"train_loss": -5.691192626953125, "global_step": 46387, "epoch": 1104} {"train_loss": -5.812126159667969, "global_step": 46388, "epoch": 1104} {"train_loss": -5.601605415344238, "global_step": 46389, "epoch": 1104} {"train_loss": -5.691883563995361, "global_step": 46390, "epoch": 1104} {"train_loss": -5.7648420333862305, "global_step": 46391, "epoch": 1104} {"train_loss": -5.598980903625488, "global_step": 46392, "epoch": 1104} {"train_loss": -5.68867826461792, "global_step": 46393, "epoch": 1104} {"train_loss": -5.632292747497559, "global_step": 46394, "epoch": 1104} {"train_loss": -5.78714656829834, "global_step": 46395, "epoch": 1104} {"train_loss": -5.435698509216309, "global_step": 46396, "epoch": 1104} {"train_loss": -5.614337921142578, "global_step": 46397, "epoch": 1104} {"train_loss": -5.608612060546875, "global_step": 46398, "epoch": 1104} {"train_loss": -5.637881278991699, "global_step": 46399, "epoch": 1104} {"train_loss": -5.785520553588867, "global_step": 46400, "epoch": 1104} {"train_loss": -5.632510185241699, "global_step": 46401, "epoch": 1104} {"train_loss": -5.83636474609375, "global_step": 46402, "epoch": 1104} {"train_loss": -5.6348466873168945, "global_step": 46403, "epoch": 1104} {"train_loss": -5.666602611541748, "global_step": 46404, "epoch": 1104} {"train_loss": -5.721466541290283, "global_step": 46405, "epoch": 1104} {"train_loss": -5.605440139770508, "global_step": 46406, "epoch": 1104} {"train_loss": -5.800542831420898, "global_step": 46407, "epoch": 1104} {"train_loss": -5.776828765869141, "global_step": 46408, "epoch": 1104} {"train_loss": -5.676284494854155, "global_step": 46409, "epoch": 1104, "val_loss": 61631.1171875} {"train_loss": -5.5529465675354, "global_step": 46410, "epoch": 1105} {"train_loss": -5.726751327514648, "global_step": 46411, "epoch": 1105} {"train_loss": -5.574663162231445, "global_step": 46412, "epoch": 1105} {"train_loss": -5.708528518676758, "global_step": 46413, "epoch": 1105} {"train_loss": -5.768126964569092, "global_step": 46414, "epoch": 1105} {"train_loss": -5.744534492492676, "global_step": 46415, "epoch": 1105} {"train_loss": -5.784307479858398, "global_step": 46416, "epoch": 1105} {"train_loss": -5.773573875427246, "global_step": 46417, "epoch": 1105} {"train_loss": -5.680159568786621, "global_step": 46418, "epoch": 1105} {"train_loss": -5.714348316192627, "global_step": 46419, "epoch": 1105} {"train_loss": -5.693596839904785, "global_step": 46420, "epoch": 1105} {"train_loss": -5.7602081298828125, "global_step": 46421, "epoch": 1105} {"train_loss": -5.702199459075928, "global_step": 46422, "epoch": 1105} {"train_loss": -5.7473368644714355, "global_step": 46423, "epoch": 1105} {"train_loss": -5.651035308837891, "global_step": 46424, "epoch": 1105} {"train_loss": -5.742702484130859, "global_step": 46425, "epoch": 1105} {"train_loss": -5.83008337020874, "global_step": 46426, "epoch": 1105} {"train_loss": -5.7194318771362305, "global_step": 46427, "epoch": 1105} {"train_loss": -5.78394079208374, "global_step": 46428, "epoch": 1105} {"train_loss": -5.839344024658203, "global_step": 46429, "epoch": 1105} {"train_loss": -5.917795658111572, "global_step": 46430, "epoch": 1105} {"train_loss": -5.715183258056641, "global_step": 46431, "epoch": 1105} {"train_loss": -5.735289096832275, "global_step": 46432, "epoch": 1105} {"train_loss": -5.687154293060303, "global_step": 46433, "epoch": 1105} {"train_loss": -5.77410888671875, "global_step": 46434, "epoch": 1105} {"train_loss": -5.838603973388672, "global_step": 46435, "epoch": 1105} {"train_loss": -5.719858646392822, "global_step": 46436, "epoch": 1105} {"train_loss": -5.707047939300537, "global_step": 46437, "epoch": 1105} {"train_loss": -5.660557746887207, "global_step": 46438, "epoch": 1105} {"train_loss": -5.809719085693359, "global_step": 46439, "epoch": 1105} {"train_loss": -5.820515155792236, "global_step": 46440, "epoch": 1105} {"train_loss": -5.6448140144348145, "global_step": 46441, "epoch": 1105} {"train_loss": -5.779053211212158, "global_step": 46442, "epoch": 1105} {"train_loss": -5.74238395690918, "global_step": 46443, "epoch": 1105} {"train_loss": -5.8081159591674805, "global_step": 46444, "epoch": 1105} {"train_loss": -5.789124011993408, "global_step": 46445, "epoch": 1105} {"train_loss": -5.770885467529297, "global_step": 46446, "epoch": 1105} {"train_loss": -5.854898929595947, "global_step": 46447, "epoch": 1105} {"train_loss": -5.8469438552856445, "global_step": 46448, "epoch": 1105} {"train_loss": -5.610512733459473, "global_step": 46449, "epoch": 1105} {"train_loss": -5.6403489112854, "global_step": 46450, "epoch": 1105} {"train_loss": -5.73897952125186, "global_step": 46451, "epoch": 1105, "val_loss": 61375.046875} {"train_loss": -5.716294288635254, "global_step": 46452, "epoch": 1106} {"train_loss": -5.626455307006836, "global_step": 46453, "epoch": 1106} {"train_loss": -5.84196662902832, "global_step": 46454, "epoch": 1106} {"train_loss": -5.770815372467041, "global_step": 46455, "epoch": 1106} {"train_loss": -5.713086128234863, "global_step": 46456, "epoch": 1106} {"train_loss": -5.820915222167969, "global_step": 46457, "epoch": 1106} {"train_loss": -5.7683868408203125, "global_step": 46458, "epoch": 1106} {"train_loss": -5.802943706512451, "global_step": 46459, "epoch": 1106} {"train_loss": -5.669276714324951, "global_step": 46460, "epoch": 1106} {"train_loss": -5.712367057800293, "global_step": 46461, "epoch": 1106} {"train_loss": -5.90822696685791, "global_step": 46462, "epoch": 1106} {"train_loss": -5.722775459289551, "global_step": 46463, "epoch": 1106} {"train_loss": -5.841746807098389, "global_step": 46464, "epoch": 1106} {"train_loss": -5.71153450012207, "global_step": 46465, "epoch": 1106} {"train_loss": -5.806888580322266, "global_step": 46466, "epoch": 1106} {"train_loss": -5.742620468139648, "global_step": 46467, "epoch": 1106} {"train_loss": -5.678803443908691, "global_step": 46468, "epoch": 1106} {"train_loss": -5.834023475646973, "global_step": 46469, "epoch": 1106} {"train_loss": -5.688523292541504, "global_step": 46470, "epoch": 1106} {"train_loss": -5.736916542053223, "global_step": 46471, "epoch": 1106} {"train_loss": -5.662240028381348, "global_step": 46472, "epoch": 1106} {"train_loss": -5.885344505310059, "global_step": 46473, "epoch": 1106} {"train_loss": -5.747941017150879, "global_step": 46474, "epoch": 1106} {"train_loss": -5.763190269470215, "global_step": 46475, "epoch": 1106} {"train_loss": -5.6431474685668945, "global_step": 46476, "epoch": 1106} {"train_loss": -5.721691131591797, "global_step": 46477, "epoch": 1106} {"train_loss": -5.902839660644531, "global_step": 46478, "epoch": 1106} {"train_loss": -5.804618835449219, "global_step": 46479, "epoch": 1106} {"train_loss": -5.53035306930542, "global_step": 46480, "epoch": 1106} {"train_loss": -5.674895763397217, "global_step": 46481, "epoch": 1106} {"train_loss": -5.605430603027344, "global_step": 46482, "epoch": 1106} {"train_loss": -5.704870223999023, "global_step": 46483, "epoch": 1106} {"train_loss": -5.76321268081665, "global_step": 46484, "epoch": 1106} {"train_loss": -5.666720390319824, "global_step": 46485, "epoch": 1106} {"train_loss": -5.754900932312012, "global_step": 46486, "epoch": 1106} {"train_loss": -5.632096767425537, "global_step": 46487, "epoch": 1106} {"train_loss": -5.78309440612793, "global_step": 46488, "epoch": 1106} {"train_loss": -5.700572490692139, "global_step": 46489, "epoch": 1106} {"train_loss": -5.678827285766602, "global_step": 46490, "epoch": 1106} {"train_loss": -5.6641716957092285, "global_step": 46491, "epoch": 1106} {"train_loss": -5.721133232116699, "global_step": 46492, "epoch": 1106} {"train_loss": -5.735098021371024, "global_step": 46493, "epoch": 1106, "val_loss": 61411.7578125} {"train_loss": -5.757558822631836, "global_step": 46494, "epoch": 1107} {"train_loss": -5.685246467590332, "global_step": 46495, "epoch": 1107} {"train_loss": -5.802361488342285, "global_step": 46496, "epoch": 1107} {"train_loss": -5.635632038116455, "global_step": 46497, "epoch": 1107} {"train_loss": -5.698722839355469, "global_step": 46498, "epoch": 1107} {"train_loss": -5.680583477020264, "global_step": 46499, "epoch": 1107} {"train_loss": -5.574757099151611, "global_step": 46500, "epoch": 1107} {"train_loss": -5.754691123962402, "global_step": 46501, "epoch": 1107} {"train_loss": -5.729196548461914, "global_step": 46502, "epoch": 1107} {"train_loss": -5.653418064117432, "global_step": 46503, "epoch": 1107} {"train_loss": -5.852197647094727, "global_step": 46504, "epoch": 1107} {"train_loss": -5.7192840576171875, "global_step": 46505, "epoch": 1107} {"train_loss": -5.768662452697754, "global_step": 46506, "epoch": 1107} {"train_loss": -5.752779960632324, "global_step": 46507, "epoch": 1107} {"train_loss": -5.731088638305664, "global_step": 46508, "epoch": 1107} {"train_loss": -5.719780921936035, "global_step": 46509, "epoch": 1107} {"train_loss": -5.665782451629639, "global_step": 46510, "epoch": 1107} {"train_loss": -5.594179630279541, "global_step": 46511, "epoch": 1107} {"train_loss": -5.774425506591797, "global_step": 46512, "epoch": 1107} {"train_loss": -5.678917407989502, "global_step": 46513, "epoch": 1107} {"train_loss": -5.791571140289307, "global_step": 46514, "epoch": 1107} {"train_loss": -5.696468353271484, "global_step": 46515, "epoch": 1107} {"train_loss": -5.658656597137451, "global_step": 46516, "epoch": 1107} {"train_loss": -5.6794281005859375, "global_step": 46517, "epoch": 1107} {"train_loss": -5.6322526931762695, "global_step": 46518, "epoch": 1107} {"train_loss": -5.6064300537109375, "global_step": 46519, "epoch": 1107} {"train_loss": -5.657484531402588, "global_step": 46520, "epoch": 1107} {"train_loss": -5.587991714477539, "global_step": 46521, "epoch": 1107} {"train_loss": -5.772422790527344, "global_step": 46522, "epoch": 1107} {"train_loss": -5.654317855834961, "global_step": 46523, "epoch": 1107} {"train_loss": -5.756317138671875, "global_step": 46524, "epoch": 1107} {"train_loss": -5.708131790161133, "global_step": 46525, "epoch": 1107} {"train_loss": -5.72934627532959, "global_step": 46526, "epoch": 1107} {"train_loss": -5.651592254638672, "global_step": 46527, "epoch": 1107} {"train_loss": -5.739973068237305, "global_step": 46528, "epoch": 1107} {"train_loss": -5.546598434448242, "global_step": 46529, "epoch": 1107} {"train_loss": -5.694883346557617, "global_step": 46530, "epoch": 1107} {"train_loss": -5.574426651000977, "global_step": 46531, "epoch": 1107} {"train_loss": -5.638633728027344, "global_step": 46532, "epoch": 1107} {"train_loss": -5.75849723815918, "global_step": 46533, "epoch": 1107} {"train_loss": -5.662953853607178, "global_step": 46534, "epoch": 1107} {"train_loss": -5.693140801929292, "global_step": 46535, "epoch": 1107, "val_loss": 61968.80078125} {"train_loss": -5.6884260177612305, "global_step": 46536, "epoch": 1108} {"train_loss": -5.690441131591797, "global_step": 46537, "epoch": 1108} {"train_loss": -5.729235649108887, "global_step": 46538, "epoch": 1108} {"train_loss": -5.668604850769043, "global_step": 46539, "epoch": 1108} {"train_loss": -5.665339469909668, "global_step": 46540, "epoch": 1108} {"train_loss": -5.527863025665283, "global_step": 46541, "epoch": 1108} {"train_loss": -5.668271064758301, "global_step": 46542, "epoch": 1108} {"train_loss": -5.586785316467285, "global_step": 46543, "epoch": 1108} {"train_loss": -5.684002876281738, "global_step": 46544, "epoch": 1108} {"train_loss": -5.788975715637207, "global_step": 46545, "epoch": 1108} {"train_loss": -5.585076332092285, "global_step": 46546, "epoch": 1108} {"train_loss": -5.686002731323242, "global_step": 46547, "epoch": 1108} {"train_loss": -5.536002159118652, "global_step": 46548, "epoch": 1108} {"train_loss": -5.721109867095947, "global_step": 46549, "epoch": 1108} {"train_loss": -5.733944892883301, "global_step": 46550, "epoch": 1108} {"train_loss": -5.631859302520752, "global_step": 46551, "epoch": 1108} {"train_loss": -5.595510482788086, "global_step": 46552, "epoch": 1108} {"train_loss": -5.700473785400391, "global_step": 46553, "epoch": 1108} {"train_loss": -5.681000709533691, "global_step": 46554, "epoch": 1108} {"train_loss": -5.4997477531433105, "global_step": 46555, "epoch": 1108} {"train_loss": -5.702932357788086, "global_step": 46556, "epoch": 1108} {"train_loss": -5.764043807983398, "global_step": 46557, "epoch": 1108} {"train_loss": -5.589269161224365, "global_step": 46558, "epoch": 1108} {"train_loss": -5.665278911590576, "global_step": 46559, "epoch": 1108} {"train_loss": -5.652514457702637, "global_step": 46560, "epoch": 1108} {"train_loss": -5.64049768447876, "global_step": 46561, "epoch": 1108} {"train_loss": -5.713107109069824, "global_step": 46562, "epoch": 1108} {"train_loss": -5.527366638183594, "global_step": 46563, "epoch": 1108} {"train_loss": -5.766304016113281, "global_step": 46564, "epoch": 1108} {"train_loss": -5.678089618682861, "global_step": 46565, "epoch": 1108} {"train_loss": -5.690958023071289, "global_step": 46566, "epoch": 1108} {"train_loss": -5.605975151062012, "global_step": 46567, "epoch": 1108} {"train_loss": -5.7538161277771, "global_step": 46568, "epoch": 1108} {"train_loss": -5.7526960372924805, "global_step": 46569, "epoch": 1108} {"train_loss": -5.65194034576416, "global_step": 46570, "epoch": 1108} {"train_loss": -5.730384826660156, "global_step": 46571, "epoch": 1108} {"train_loss": -5.731381416320801, "global_step": 46572, "epoch": 1108} {"train_loss": -5.679231643676758, "global_step": 46573, "epoch": 1108} {"train_loss": -5.72829008102417, "global_step": 46574, "epoch": 1108} {"train_loss": -5.724697113037109, "global_step": 46575, "epoch": 1108} {"train_loss": -5.649880409240723, "global_step": 46576, "epoch": 1108} {"train_loss": -5.672751040685744, "global_step": 46577, "epoch": 1108, "val_loss": 61606.14453125} {"train_loss": -5.682557106018066, "global_step": 46578, "epoch": 1109} {"train_loss": -5.686230659484863, "global_step": 46579, "epoch": 1109} {"train_loss": -5.719732284545898, "global_step": 46580, "epoch": 1109} {"train_loss": -5.691783905029297, "global_step": 46581, "epoch": 1109} {"train_loss": -5.775620460510254, "global_step": 46582, "epoch": 1109} {"train_loss": -5.6015777587890625, "global_step": 46583, "epoch": 1109} {"train_loss": -5.697056293487549, "global_step": 46584, "epoch": 1109} {"train_loss": -5.82240104675293, "global_step": 46585, "epoch": 1109} {"train_loss": -5.756544589996338, "global_step": 46586, "epoch": 1109} {"train_loss": -5.633733749389648, "global_step": 46587, "epoch": 1109} {"train_loss": -5.773433208465576, "global_step": 46588, "epoch": 1109} {"train_loss": -5.823474884033203, "global_step": 46589, "epoch": 1109} {"train_loss": -5.740822792053223, "global_step": 46590, "epoch": 1109} {"train_loss": -5.631897926330566, "global_step": 46591, "epoch": 1109} {"train_loss": -5.706719875335693, "global_step": 46592, "epoch": 1109} {"train_loss": -5.674378871917725, "global_step": 46593, "epoch": 1109} {"train_loss": -5.738285541534424, "global_step": 46594, "epoch": 1109} {"train_loss": -5.616114616394043, "global_step": 46595, "epoch": 1109} {"train_loss": -5.614321708679199, "global_step": 46596, "epoch": 1109} {"train_loss": -5.664817810058594, "global_step": 46597, "epoch": 1109} {"train_loss": -5.627926826477051, "global_step": 46598, "epoch": 1109} {"train_loss": -5.766651153564453, "global_step": 46599, "epoch": 1109} {"train_loss": -5.692154884338379, "global_step": 46600, "epoch": 1109} {"train_loss": -5.6778364181518555, "global_step": 46601, "epoch": 1109} {"train_loss": -5.673673152923584, "global_step": 46602, "epoch": 1109} {"train_loss": -5.598965644836426, "global_step": 46603, "epoch": 1109} {"train_loss": -5.797691345214844, "global_step": 46604, "epoch": 1109} {"train_loss": -5.728163242340088, "global_step": 46605, "epoch": 1109} {"train_loss": -5.804964065551758, "global_step": 46606, "epoch": 1109} {"train_loss": -5.78816032409668, "global_step": 46607, "epoch": 1109} {"train_loss": -5.81273078918457, "global_step": 46608, "epoch": 1109} {"train_loss": -5.771883010864258, "global_step": 46609, "epoch": 1109} {"train_loss": -5.708401203155518, "global_step": 46610, "epoch": 1109} {"train_loss": -5.675864219665527, "global_step": 46611, "epoch": 1109} {"train_loss": -5.760234355926514, "global_step": 46612, "epoch": 1109} {"train_loss": -5.786208629608154, "global_step": 46613, "epoch": 1109} {"train_loss": -5.639228343963623, "global_step": 46614, "epoch": 1109} {"train_loss": -5.6607747077941895, "global_step": 46615, "epoch": 1109} {"train_loss": -5.608595371246338, "global_step": 46616, "epoch": 1109} {"train_loss": -5.841561794281006, "global_step": 46617, "epoch": 1109} {"train_loss": -5.730710506439209, "global_step": 46618, "epoch": 1109} {"train_loss": -5.7124880609058195, "global_step": 46619, "epoch": 1109, "val_loss": 61625.16796875} {"train_loss": -5.739894390106201, "global_step": 46620, "epoch": 1110} {"train_loss": -5.670153617858887, "global_step": 46621, "epoch": 1110} {"train_loss": -5.678234100341797, "global_step": 46622, "epoch": 1110} {"train_loss": -5.754225730895996, "global_step": 46623, "epoch": 1110} {"train_loss": -5.641061782836914, "global_step": 46624, "epoch": 1110} {"train_loss": -5.755450248718262, "global_step": 46625, "epoch": 1110} {"train_loss": -5.607116222381592, "global_step": 46626, "epoch": 1110} {"train_loss": -5.755032539367676, "global_step": 46627, "epoch": 1110} {"train_loss": -5.687077522277832, "global_step": 46628, "epoch": 1110} {"train_loss": -5.7829084396362305, "global_step": 46629, "epoch": 1110} {"train_loss": -5.702445983886719, "global_step": 46630, "epoch": 1110} {"train_loss": -5.7321977615356445, "global_step": 46631, "epoch": 1110} {"train_loss": -5.7688188552856445, "global_step": 46632, "epoch": 1110} {"train_loss": -5.772387981414795, "global_step": 46633, "epoch": 1110} {"train_loss": -5.850841999053955, "global_step": 46634, "epoch": 1110} {"train_loss": -5.775725364685059, "global_step": 46635, "epoch": 1110} {"train_loss": -5.654439926147461, "global_step": 46636, "epoch": 1110} {"train_loss": -5.752066612243652, "global_step": 46637, "epoch": 1110} {"train_loss": -5.681056976318359, "global_step": 46638, "epoch": 1110} {"train_loss": -5.765775680541992, "global_step": 46639, "epoch": 1110} {"train_loss": -5.7773518562316895, "global_step": 46640, "epoch": 1110} {"train_loss": -5.793485641479492, "global_step": 46641, "epoch": 1110} {"train_loss": -5.644634246826172, "global_step": 46642, "epoch": 1110} {"train_loss": -5.872727870941162, "global_step": 46643, "epoch": 1110} {"train_loss": -5.72703742980957, "global_step": 46644, "epoch": 1110} {"train_loss": -5.742025375366211, "global_step": 46645, "epoch": 1110} {"train_loss": -5.731630325317383, "global_step": 46646, "epoch": 1110} {"train_loss": -5.7538909912109375, "global_step": 46647, "epoch": 1110} {"train_loss": -5.648222923278809, "global_step": 46648, "epoch": 1110} {"train_loss": -5.768778324127197, "global_step": 46649, "epoch": 1110} {"train_loss": -5.682017803192139, "global_step": 46650, "epoch": 1110} {"train_loss": -5.707181930541992, "global_step": 46651, "epoch": 1110} {"train_loss": -5.750690460205078, "global_step": 46652, "epoch": 1110} {"train_loss": -5.836407661437988, "global_step": 46653, "epoch": 1110} {"train_loss": -5.71329402923584, "global_step": 46654, "epoch": 1110} {"train_loss": -5.83859920501709, "global_step": 46655, "epoch": 1110} {"train_loss": -5.816363334655762, "global_step": 46656, "epoch": 1110} {"train_loss": -5.684784889221191, "global_step": 46657, "epoch": 1110} {"train_loss": -5.747706890106201, "global_step": 46658, "epoch": 1110} {"train_loss": -5.6916961669921875, "global_step": 46659, "epoch": 1110} {"train_loss": -5.777583122253418, "global_step": 46660, "epoch": 1110} {"train_loss": -5.738839365187145, "global_step": 46661, "epoch": 1110, "val_loss": 61524.8828125} {"train_loss": -5.701624870300293, "global_step": 46662, "epoch": 1111} {"train_loss": -5.678386688232422, "global_step": 46663, "epoch": 1111} {"train_loss": -5.802968502044678, "global_step": 46664, "epoch": 1111} {"train_loss": -5.695257663726807, "global_step": 46665, "epoch": 1111} {"train_loss": -5.8613152503967285, "global_step": 46666, "epoch": 1111} {"train_loss": -5.635415554046631, "global_step": 46667, "epoch": 1111} {"train_loss": -5.817439079284668, "global_step": 46668, "epoch": 1111} {"train_loss": -5.725581645965576, "global_step": 46669, "epoch": 1111} {"train_loss": -5.761851787567139, "global_step": 46670, "epoch": 1111} {"train_loss": -5.753961086273193, "global_step": 46671, "epoch": 1111} {"train_loss": -5.479640960693359, "global_step": 46672, "epoch": 1111} {"train_loss": -5.832474708557129, "global_step": 46673, "epoch": 1111} {"train_loss": -5.675174236297607, "global_step": 46674, "epoch": 1111} {"train_loss": -5.712276458740234, "global_step": 46675, "epoch": 1111} {"train_loss": -5.7159247398376465, "global_step": 46676, "epoch": 1111} {"train_loss": -5.607047080993652, "global_step": 46677, "epoch": 1111} {"train_loss": -5.706910133361816, "global_step": 46678, "epoch": 1111} {"train_loss": -5.640576362609863, "global_step": 46679, "epoch": 1111} {"train_loss": -5.842768669128418, "global_step": 46680, "epoch": 1111} {"train_loss": -5.749297142028809, "global_step": 46681, "epoch": 1111} {"train_loss": -5.624250411987305, "global_step": 46682, "epoch": 1111} {"train_loss": -5.629505157470703, "global_step": 46683, "epoch": 1111} {"train_loss": -5.674036979675293, "global_step": 46684, "epoch": 1111} {"train_loss": -5.602644443511963, "global_step": 46685, "epoch": 1111} {"train_loss": -5.594855308532715, "global_step": 46686, "epoch": 1111} {"train_loss": -5.70137882232666, "global_step": 46687, "epoch": 1111} {"train_loss": -5.745397567749023, "global_step": 46688, "epoch": 1111} {"train_loss": -5.759345054626465, "global_step": 46689, "epoch": 1111} {"train_loss": -5.654903888702393, "global_step": 46690, "epoch": 1111} {"train_loss": -5.671216011047363, "global_step": 46691, "epoch": 1111} {"train_loss": -5.769359111785889, "global_step": 46692, "epoch": 1111} {"train_loss": -5.692257881164551, "global_step": 46693, "epoch": 1111} {"train_loss": -5.6477179527282715, "global_step": 46694, "epoch": 1111} {"train_loss": -5.869842529296875, "global_step": 46695, "epoch": 1111} {"train_loss": -5.549925804138184, "global_step": 46696, "epoch": 1111} {"train_loss": -5.714727401733398, "global_step": 46697, "epoch": 1111} {"train_loss": -5.79184627532959, "global_step": 46698, "epoch": 1111} {"train_loss": -5.663142681121826, "global_step": 46699, "epoch": 1111} {"train_loss": -5.6421685218811035, "global_step": 46700, "epoch": 1111} {"train_loss": -5.752264976501465, "global_step": 46701, "epoch": 1111} {"train_loss": -5.8207879066467285, "global_step": 46702, "epoch": 1111} {"train_loss": -5.708515689486549, "global_step": 46703, "epoch": 1111, "val_loss": 61374.41015625} {"train_loss": -5.724363327026367, "global_step": 46704, "epoch": 1112} {"train_loss": -5.579807758331299, "global_step": 46705, "epoch": 1112} {"train_loss": -5.780181884765625, "global_step": 46706, "epoch": 1112} {"train_loss": -5.70388126373291, "global_step": 46707, "epoch": 1112} {"train_loss": -5.793116569519043, "global_step": 46708, "epoch": 1112} {"train_loss": -5.707402229309082, "global_step": 46709, "epoch": 1112} {"train_loss": -5.69714879989624, "global_step": 46710, "epoch": 1112} {"train_loss": -5.766776084899902, "global_step": 46711, "epoch": 1112} {"train_loss": -5.708616733551025, "global_step": 46712, "epoch": 1112} {"train_loss": -5.809582233428955, "global_step": 46713, "epoch": 1112} {"train_loss": -5.549036979675293, "global_step": 46714, "epoch": 1112} {"train_loss": -5.842517852783203, "global_step": 46715, "epoch": 1112} {"train_loss": -5.74412202835083, "global_step": 46716, "epoch": 1112} {"train_loss": -5.68166446685791, "global_step": 46717, "epoch": 1112} {"train_loss": -5.7295660972595215, "global_step": 46718, "epoch": 1112} {"train_loss": -5.781732082366943, "global_step": 46719, "epoch": 1112} {"train_loss": -5.831748962402344, "global_step": 46720, "epoch": 1112} {"train_loss": -5.776159286499023, "global_step": 46721, "epoch": 1112} {"train_loss": -5.869082450866699, "global_step": 46722, "epoch": 1112} {"train_loss": -5.83009147644043, "global_step": 46723, "epoch": 1112} {"train_loss": -5.7809953689575195, "global_step": 46724, "epoch": 1112} {"train_loss": -5.894347190856934, "global_step": 46725, "epoch": 1112} {"train_loss": -5.7953033447265625, "global_step": 46726, "epoch": 1112} {"train_loss": -5.779882431030273, "global_step": 46727, "epoch": 1112} {"train_loss": -5.6957106590271, "global_step": 46728, "epoch": 1112} {"train_loss": -5.716246128082275, "global_step": 46729, "epoch": 1112} {"train_loss": -5.737809658050537, "global_step": 46730, "epoch": 1112} {"train_loss": -5.81410026550293, "global_step": 46731, "epoch": 1112} {"train_loss": -5.7455291748046875, "global_step": 46732, "epoch": 1112} {"train_loss": -5.720633506774902, "global_step": 46733, "epoch": 1112} {"train_loss": -5.667193412780762, "global_step": 46734, "epoch": 1112} {"train_loss": -5.859347820281982, "global_step": 46735, "epoch": 1112} {"train_loss": -5.808446884155273, "global_step": 46736, "epoch": 1112} {"train_loss": -5.765693664550781, "global_step": 46737, "epoch": 1112} {"train_loss": -5.858913421630859, "global_step": 46738, "epoch": 1112} {"train_loss": -5.667916297912598, "global_step": 46739, "epoch": 1112} {"train_loss": -5.751967430114746, "global_step": 46740, "epoch": 1112} {"train_loss": -5.821831703186035, "global_step": 46741, "epoch": 1112} {"train_loss": -5.835677623748779, "global_step": 46742, "epoch": 1112} {"train_loss": -5.806212902069092, "global_step": 46743, "epoch": 1112} {"train_loss": -5.794084548950195, "global_step": 46744, "epoch": 1112} {"train_loss": -5.762064014162336, "global_step": 46745, "epoch": 1112, "val_loss": 61472.72265625} {"train_loss": -5.781003475189209, "global_step": 46746, "epoch": 1113} {"train_loss": -5.8165283203125, "global_step": 46747, "epoch": 1113} {"train_loss": -5.757078170776367, "global_step": 46748, "epoch": 1113} {"train_loss": -5.772494316101074, "global_step": 46749, "epoch": 1113} {"train_loss": -5.754476070404053, "global_step": 46750, "epoch": 1113} {"train_loss": -5.734007835388184, "global_step": 46751, "epoch": 1113} {"train_loss": -5.826818943023682, "global_step": 46752, "epoch": 1113} {"train_loss": -5.736602783203125, "global_step": 46753, "epoch": 1113} {"train_loss": -5.829876899719238, "global_step": 46754, "epoch": 1113} {"train_loss": -5.773223876953125, "global_step": 46755, "epoch": 1113} {"train_loss": -5.770875453948975, "global_step": 46756, "epoch": 1113} {"train_loss": -5.702469825744629, "global_step": 46757, "epoch": 1113} {"train_loss": -5.788734436035156, "global_step": 46758, "epoch": 1113} {"train_loss": -5.815336227416992, "global_step": 46759, "epoch": 1113} {"train_loss": -5.760693550109863, "global_step": 46760, "epoch": 1113} {"train_loss": -5.838945388793945, "global_step": 46761, "epoch": 1113} {"train_loss": -5.6710615158081055, "global_step": 46762, "epoch": 1113} {"train_loss": -5.6914286613464355, "global_step": 46763, "epoch": 1113} {"train_loss": -5.7357892990112305, "global_step": 46764, "epoch": 1113} {"train_loss": -5.7802734375, "global_step": 46765, "epoch": 1113} {"train_loss": -5.791492462158203, "global_step": 46766, "epoch": 1113} {"train_loss": -5.8175883293151855, "global_step": 46767, "epoch": 1113} {"train_loss": -5.732311725616455, "global_step": 46768, "epoch": 1113} {"train_loss": -5.703604698181152, "global_step": 46769, "epoch": 1113} {"train_loss": -5.797128677368164, "global_step": 46770, "epoch": 1113} {"train_loss": -5.873378276824951, "global_step": 46771, "epoch": 1113} {"train_loss": -5.727866172790527, "global_step": 46772, "epoch": 1113} {"train_loss": -5.7122650146484375, "global_step": 46773, "epoch": 1113} {"train_loss": -5.743871212005615, "global_step": 46774, "epoch": 1113} {"train_loss": -5.7356672286987305, "global_step": 46775, "epoch": 1113} {"train_loss": -5.672689914703369, "global_step": 46776, "epoch": 1113} {"train_loss": -5.717739105224609, "global_step": 46777, "epoch": 1113} {"train_loss": -5.785983085632324, "global_step": 46778, "epoch": 1113} {"train_loss": -5.747876167297363, "global_step": 46779, "epoch": 1113} {"train_loss": -5.737765789031982, "global_step": 46780, "epoch": 1113} {"train_loss": -5.727519989013672, "global_step": 46781, "epoch": 1113} {"train_loss": -5.713662147521973, "global_step": 46782, "epoch": 1113} {"train_loss": -5.732958793640137, "global_step": 46783, "epoch": 1113} {"train_loss": -5.776633262634277, "global_step": 46784, "epoch": 1113} {"train_loss": -5.647007465362549, "global_step": 46785, "epoch": 1113} {"train_loss": -5.654987812042236, "global_step": 46786, "epoch": 1113} {"train_loss": -5.7509459881555465, "global_step": 46787, "epoch": 1113, "val_loss": 61484.1796875} {"train_loss": -5.65332555770874, "global_step": 46788, "epoch": 1114} {"train_loss": -5.77885627746582, "global_step": 46789, "epoch": 1114} {"train_loss": -5.682507514953613, "global_step": 46790, "epoch": 1114} {"train_loss": -5.7935004234313965, "global_step": 46791, "epoch": 1114} {"train_loss": -5.786935329437256, "global_step": 46792, "epoch": 1114} {"train_loss": -5.744915008544922, "global_step": 46793, "epoch": 1114} {"train_loss": -5.775359153747559, "global_step": 46794, "epoch": 1114} {"train_loss": -5.790886878967285, "global_step": 46795, "epoch": 1114} {"train_loss": -5.786548614501953, "global_step": 46796, "epoch": 1114} {"train_loss": -5.773033142089844, "global_step": 46797, "epoch": 1114} {"train_loss": -5.666584014892578, "global_step": 46798, "epoch": 1114} {"train_loss": -5.651245594024658, "global_step": 46799, "epoch": 1114} {"train_loss": -5.677116870880127, "global_step": 46800, "epoch": 1114} {"train_loss": -5.644835948944092, "global_step": 46801, "epoch": 1114} {"train_loss": -5.620410919189453, "global_step": 46802, "epoch": 1114} {"train_loss": -5.77597713470459, "global_step": 46803, "epoch": 1114} {"train_loss": -5.783638954162598, "global_step": 46804, "epoch": 1114} {"train_loss": -5.782499313354492, "global_step": 46805, "epoch": 1114} {"train_loss": -5.693421840667725, "global_step": 46806, "epoch": 1114} {"train_loss": -5.65403938293457, "global_step": 46807, "epoch": 1114} {"train_loss": -5.799334526062012, "global_step": 46808, "epoch": 1114} {"train_loss": -5.700099945068359, "global_step": 46809, "epoch": 1114} {"train_loss": -5.772178649902344, "global_step": 46810, "epoch": 1114} {"train_loss": -5.733323097229004, "global_step": 46811, "epoch": 1114} {"train_loss": -5.724065780639648, "global_step": 46812, "epoch": 1114} {"train_loss": -5.6967453956604, "global_step": 46813, "epoch": 1114} {"train_loss": -5.737807273864746, "global_step": 46814, "epoch": 1114} {"train_loss": -5.691835403442383, "global_step": 46815, "epoch": 1114} {"train_loss": -5.6280717849731445, "global_step": 46816, "epoch": 1114} {"train_loss": -5.725088119506836, "global_step": 46817, "epoch": 1114} {"train_loss": -5.758594989776611, "global_step": 46818, "epoch": 1114} {"train_loss": -5.684231758117676, "global_step": 46819, "epoch": 1114} {"train_loss": -5.810702323913574, "global_step": 46820, "epoch": 1114} {"train_loss": -5.836282730102539, "global_step": 46821, "epoch": 1114} {"train_loss": -5.651724815368652, "global_step": 46822, "epoch": 1114} {"train_loss": -5.790104866027832, "global_step": 46823, "epoch": 1114} {"train_loss": -5.7297749519348145, "global_step": 46824, "epoch": 1114} {"train_loss": -5.765130996704102, "global_step": 46825, "epoch": 1114} {"train_loss": -5.780949592590332, "global_step": 46826, "epoch": 1114} {"train_loss": -5.840138912200928, "global_step": 46827, "epoch": 1114} {"train_loss": -5.691683769226074, "global_step": 46828, "epoch": 1114} {"train_loss": -5.7300067856198265, "global_step": 46829, "epoch": 1114, "val_loss": 61437.1171875} {"train_loss": -5.690299987792969, "global_step": 46830, "epoch": 1115} {"train_loss": -5.684399127960205, "global_step": 46831, "epoch": 1115} {"train_loss": -5.835745811462402, "global_step": 46832, "epoch": 1115} {"train_loss": -5.901149749755859, "global_step": 46833, "epoch": 1115} {"train_loss": -5.76058292388916, "global_step": 46834, "epoch": 1115} {"train_loss": -5.681644916534424, "global_step": 46835, "epoch": 1115} {"train_loss": -5.723833084106445, "global_step": 46836, "epoch": 1115} {"train_loss": -5.658501625061035, "global_step": 46837, "epoch": 1115} {"train_loss": -5.828045845031738, "global_step": 46838, "epoch": 1115} {"train_loss": -5.793801307678223, "global_step": 46839, "epoch": 1115} {"train_loss": -5.767868518829346, "global_step": 46840, "epoch": 1115} {"train_loss": -5.850768089294434, "global_step": 46841, "epoch": 1115} {"train_loss": -5.746713161468506, "global_step": 46842, "epoch": 1115} {"train_loss": -5.673482418060303, "global_step": 46843, "epoch": 1115} {"train_loss": -5.7916741371154785, "global_step": 46844, "epoch": 1115} {"train_loss": -5.80137825012207, "global_step": 46845, "epoch": 1115} {"train_loss": -5.638703346252441, "global_step": 46846, "epoch": 1115} {"train_loss": -5.654435634613037, "global_step": 46847, "epoch": 1115} {"train_loss": -5.669072151184082, "global_step": 46848, "epoch": 1115} {"train_loss": -5.665176868438721, "global_step": 46849, "epoch": 1115} {"train_loss": -5.736337661743164, "global_step": 46850, "epoch": 1115} {"train_loss": -5.608716011047363, "global_step": 46851, "epoch": 1115} {"train_loss": -5.679527759552002, "global_step": 46852, "epoch": 1115} {"train_loss": -5.735740661621094, "global_step": 46853, "epoch": 1115} {"train_loss": -5.771549224853516, "global_step": 46854, "epoch": 1115} {"train_loss": -5.6655988693237305, "global_step": 46855, "epoch": 1115} {"train_loss": -5.702661514282227, "global_step": 46856, "epoch": 1115} {"train_loss": -5.727324962615967, "global_step": 46857, "epoch": 1115} {"train_loss": -5.655013084411621, "global_step": 46858, "epoch": 1115} {"train_loss": -5.583812236785889, "global_step": 46859, "epoch": 1115} {"train_loss": -5.674478530883789, "global_step": 46860, "epoch": 1115} {"train_loss": -5.7270827293396, "global_step": 46861, "epoch": 1115} {"train_loss": -5.734606742858887, "global_step": 46862, "epoch": 1115} {"train_loss": -5.604637622833252, "global_step": 46863, "epoch": 1115} {"train_loss": -5.788125991821289, "global_step": 46864, "epoch": 1115} {"train_loss": -5.695245742797852, "global_step": 46865, "epoch": 1115} {"train_loss": -5.771269798278809, "global_step": 46866, "epoch": 1115} {"train_loss": -5.616949081420898, "global_step": 46867, "epoch": 1115} {"train_loss": -5.751651763916016, "global_step": 46868, "epoch": 1115} {"train_loss": -5.79017448425293, "global_step": 46869, "epoch": 1115} {"train_loss": -5.75880241394043, "global_step": 46870, "epoch": 1115} {"train_loss": -5.72169041633606, "global_step": 46871, "epoch": 1115, "val_loss": 62004.14453125} {"train_loss": -5.793952465057373, "global_step": 46872, "epoch": 1116} {"train_loss": -5.808549880981445, "global_step": 46873, "epoch": 1116} {"train_loss": -5.784065246582031, "global_step": 46874, "epoch": 1116} {"train_loss": -5.6214141845703125, "global_step": 46875, "epoch": 1116} {"train_loss": -5.764314651489258, "global_step": 46876, "epoch": 1116} {"train_loss": -5.611530303955078, "global_step": 46877, "epoch": 1116} {"train_loss": -5.697910308837891, "global_step": 46878, "epoch": 1116} {"train_loss": -5.746016025543213, "global_step": 46879, "epoch": 1116} {"train_loss": -5.746270179748535, "global_step": 46880, "epoch": 1116} {"train_loss": -5.801701068878174, "global_step": 46881, "epoch": 1116} {"train_loss": -5.622194290161133, "global_step": 46882, "epoch": 1116} {"train_loss": -5.632444381713867, "global_step": 46883, "epoch": 1116} {"train_loss": -5.790094375610352, "global_step": 46884, "epoch": 1116} {"train_loss": -5.725035190582275, "global_step": 46885, "epoch": 1116} {"train_loss": -5.7006378173828125, "global_step": 46886, "epoch": 1116} {"train_loss": -5.742043495178223, "global_step": 46887, "epoch": 1116} {"train_loss": -5.754016399383545, "global_step": 46888, "epoch": 1116} {"train_loss": -5.618154525756836, "global_step": 46889, "epoch": 1116} {"train_loss": -5.6729278564453125, "global_step": 46890, "epoch": 1116} {"train_loss": -5.884439468383789, "global_step": 46891, "epoch": 1116} {"train_loss": -5.6954474449157715, "global_step": 46892, "epoch": 1116} {"train_loss": -5.643938064575195, "global_step": 46893, "epoch": 1116} {"train_loss": -5.65954065322876, "global_step": 46894, "epoch": 1116} {"train_loss": -5.630763053894043, "global_step": 46895, "epoch": 1116} {"train_loss": -5.712388038635254, "global_step": 46896, "epoch": 1116} {"train_loss": -5.80185604095459, "global_step": 46897, "epoch": 1116} {"train_loss": -5.740323066711426, "global_step": 46898, "epoch": 1116} {"train_loss": -5.751132011413574, "global_step": 46899, "epoch": 1116} {"train_loss": -5.842040061950684, "global_step": 46900, "epoch": 1116} {"train_loss": -5.705266952514648, "global_step": 46901, "epoch": 1116} {"train_loss": -5.819068908691406, "global_step": 46902, "epoch": 1116} {"train_loss": -5.755993843078613, "global_step": 46903, "epoch": 1116} {"train_loss": -5.738762855529785, "global_step": 46904, "epoch": 1116} {"train_loss": -5.644177436828613, "global_step": 46905, "epoch": 1116} {"train_loss": -5.687283992767334, "global_step": 46906, "epoch": 1116} {"train_loss": -5.602200984954834, "global_step": 46907, "epoch": 1116} {"train_loss": -5.744182586669922, "global_step": 46908, "epoch": 1116} {"train_loss": -5.669929027557373, "global_step": 46909, "epoch": 1116} {"train_loss": -5.801031112670898, "global_step": 46910, "epoch": 1116} {"train_loss": -5.7398681640625, "global_step": 46911, "epoch": 1116} {"train_loss": -5.7068915367126465, "global_step": 46912, "epoch": 1116} {"train_loss": -5.72248531523205, "global_step": 46913, "epoch": 1116, "val_loss": 61680.6640625} {"train_loss": -5.706737041473389, "global_step": 46914, "epoch": 1117} {"train_loss": -5.804686546325684, "global_step": 46915, "epoch": 1117} {"train_loss": -5.645231246948242, "global_step": 46916, "epoch": 1117} {"train_loss": -5.73392391204834, "global_step": 46917, "epoch": 1117} {"train_loss": -5.767007827758789, "global_step": 46918, "epoch": 1117} {"train_loss": -5.685303688049316, "global_step": 46919, "epoch": 1117} {"train_loss": -5.751499652862549, "global_step": 46920, "epoch": 1117} {"train_loss": -5.79473876953125, "global_step": 46921, "epoch": 1117} {"train_loss": -5.6301374435424805, "global_step": 46922, "epoch": 1117} {"train_loss": -5.649328231811523, "global_step": 46923, "epoch": 1117} {"train_loss": -5.7477264404296875, "global_step": 46924, "epoch": 1117} {"train_loss": -5.782611846923828, "global_step": 46925, "epoch": 1117} {"train_loss": -5.538575172424316, "global_step": 46926, "epoch": 1117} {"train_loss": -5.623232364654541, "global_step": 46927, "epoch": 1117} {"train_loss": -5.642480373382568, "global_step": 46928, "epoch": 1117} {"train_loss": -5.743042469024658, "global_step": 46929, "epoch": 1117} {"train_loss": -5.633161544799805, "global_step": 46930, "epoch": 1117} {"train_loss": -5.731224060058594, "global_step": 46931, "epoch": 1117} {"train_loss": -5.5608367919921875, "global_step": 46932, "epoch": 1117} {"train_loss": -5.590087890625, "global_step": 46933, "epoch": 1117} {"train_loss": -5.57792854309082, "global_step": 46934, "epoch": 1117} {"train_loss": -5.6497602462768555, "global_step": 46935, "epoch": 1117} {"train_loss": -5.593637943267822, "global_step": 46936, "epoch": 1117} {"train_loss": -5.561549663543701, "global_step": 46937, "epoch": 1117} {"train_loss": -5.763665199279785, "global_step": 46938, "epoch": 1117} {"train_loss": -5.653858184814453, "global_step": 46939, "epoch": 1117} {"train_loss": -5.665802955627441, "global_step": 46940, "epoch": 1117} {"train_loss": -5.703702926635742, "global_step": 46941, "epoch": 1117} {"train_loss": -5.687714576721191, "global_step": 46942, "epoch": 1117} {"train_loss": -5.532187461853027, "global_step": 46943, "epoch": 1117} {"train_loss": -5.753477573394775, "global_step": 46944, "epoch": 1117} {"train_loss": -5.5704450607299805, "global_step": 46945, "epoch": 1117} {"train_loss": -5.684393882751465, "global_step": 46946, "epoch": 1117} {"train_loss": -5.7770185470581055, "global_step": 46947, "epoch": 1117} {"train_loss": -5.791133880615234, "global_step": 46948, "epoch": 1117} {"train_loss": -5.812579154968262, "global_step": 46949, "epoch": 1117} {"train_loss": -5.666626453399658, "global_step": 46950, "epoch": 1117} {"train_loss": -5.795263290405273, "global_step": 46951, "epoch": 1117} {"train_loss": -5.87322998046875, "global_step": 46952, "epoch": 1117} {"train_loss": -5.67872428894043, "global_step": 46953, "epoch": 1117} {"train_loss": -5.719154357910156, "global_step": 46954, "epoch": 1117} {"train_loss": -5.693269650141398, "global_step": 46955, "epoch": 1117, "val_loss": 61496.60546875} {"train_loss": -5.743465423583984, "global_step": 46956, "epoch": 1118} {"train_loss": -5.715225696563721, "global_step": 46957, "epoch": 1118} {"train_loss": -5.742938041687012, "global_step": 46958, "epoch": 1118} {"train_loss": -5.767861366271973, "global_step": 46959, "epoch": 1118} {"train_loss": -5.768043518066406, "global_step": 46960, "epoch": 1118} {"train_loss": -5.799372673034668, "global_step": 46961, "epoch": 1118} {"train_loss": -5.741683006286621, "global_step": 46962, "epoch": 1118} {"train_loss": -5.808367729187012, "global_step": 46963, "epoch": 1118} {"train_loss": -5.667342662811279, "global_step": 46964, "epoch": 1118} {"train_loss": -5.737975120544434, "global_step": 46965, "epoch": 1118} {"train_loss": -5.818388938903809, "global_step": 46966, "epoch": 1118} {"train_loss": -5.738167762756348, "global_step": 46967, "epoch": 1118} {"train_loss": -5.628383159637451, "global_step": 46968, "epoch": 1118} {"train_loss": -5.738229274749756, "global_step": 46969, "epoch": 1118} {"train_loss": -5.78715705871582, "global_step": 46970, "epoch": 1118} {"train_loss": -5.840610504150391, "global_step": 46971, "epoch": 1118} {"train_loss": -5.740820407867432, "global_step": 46972, "epoch": 1118} {"train_loss": -5.800620079040527, "global_step": 46973, "epoch": 1118} {"train_loss": -5.760568618774414, "global_step": 46974, "epoch": 1118} {"train_loss": -5.816241264343262, "global_step": 46975, "epoch": 1118} {"train_loss": -5.679396629333496, "global_step": 46976, "epoch": 1118} {"train_loss": -5.674494743347168, "global_step": 46977, "epoch": 1118} {"train_loss": -5.777766227722168, "global_step": 46978, "epoch": 1118} {"train_loss": -5.642772197723389, "global_step": 46979, "epoch": 1118} {"train_loss": -5.759723663330078, "global_step": 46980, "epoch": 1118} {"train_loss": -5.6981658935546875, "global_step": 46981, "epoch": 1118} {"train_loss": -5.9036784172058105, "global_step": 46982, "epoch": 1118} {"train_loss": -5.699077606201172, "global_step": 46983, "epoch": 1118} {"train_loss": -5.688127040863037, "global_step": 46984, "epoch": 1118} {"train_loss": -5.740596771240234, "global_step": 46985, "epoch": 1118} {"train_loss": -5.6879963874816895, "global_step": 46986, "epoch": 1118} {"train_loss": -5.83015251159668, "global_step": 46987, "epoch": 1118} {"train_loss": -5.760220527648926, "global_step": 46988, "epoch": 1118} {"train_loss": -5.630143165588379, "global_step": 46989, "epoch": 1118} {"train_loss": -5.769331455230713, "global_step": 46990, "epoch": 1118} {"train_loss": -5.675259590148926, "global_step": 46991, "epoch": 1118} {"train_loss": -5.723498821258545, "global_step": 46992, "epoch": 1118} {"train_loss": -5.6727752685546875, "global_step": 46993, "epoch": 1118} {"train_loss": -5.703542709350586, "global_step": 46994, "epoch": 1118} {"train_loss": -5.753803253173828, "global_step": 46995, "epoch": 1118} {"train_loss": -5.614681720733643, "global_step": 46996, "epoch": 1118} {"train_loss": -5.735365231831868, "global_step": 46997, "epoch": 1118, "val_loss": 61495.33203125} {"train_loss": -5.8359880447387695, "global_step": 46998, "epoch": 1119} {"train_loss": -5.5936479568481445, "global_step": 46999, "epoch": 1119} {"train_loss": -5.66077995300293, "global_step": 47000, "epoch": 1119} {"train_loss": -5.711311340332031, "global_step": 47001, "epoch": 1119} {"train_loss": -5.7398152351379395, "global_step": 47002, "epoch": 1119} {"train_loss": -5.7832183837890625, "global_step": 47003, "epoch": 1119} {"train_loss": -5.742931365966797, "global_step": 47004, "epoch": 1119} {"train_loss": -5.671785831451416, "global_step": 47005, "epoch": 1119} {"train_loss": -5.82518196105957, "global_step": 47006, "epoch": 1119} {"train_loss": -5.783941268920898, "global_step": 47007, "epoch": 1119} {"train_loss": -5.760497093200684, "global_step": 47008, "epoch": 1119} {"train_loss": -5.781675338745117, "global_step": 47009, "epoch": 1119} {"train_loss": -5.737277984619141, "global_step": 47010, "epoch": 1119} {"train_loss": -5.696609020233154, "global_step": 47011, "epoch": 1119} {"train_loss": -5.838812828063965, "global_step": 47012, "epoch": 1119} {"train_loss": -5.719539642333984, "global_step": 47013, "epoch": 1119} {"train_loss": -5.763324737548828, "global_step": 47014, "epoch": 1119} {"train_loss": -5.82084846496582, "global_step": 47015, "epoch": 1119} {"train_loss": -5.627035140991211, "global_step": 47016, "epoch": 1119} {"train_loss": -5.605367183685303, "global_step": 47017, "epoch": 1119} {"train_loss": -5.820446491241455, "global_step": 47018, "epoch": 1119} {"train_loss": -5.832592010498047, "global_step": 47019, "epoch": 1119} {"train_loss": -5.688824653625488, "global_step": 47020, "epoch": 1119} {"train_loss": -5.734282493591309, "global_step": 47021, "epoch": 1119} {"train_loss": -5.669011116027832, "global_step": 47022, "epoch": 1119} {"train_loss": -5.737101078033447, "global_step": 47023, "epoch": 1119} {"train_loss": -5.718353271484375, "global_step": 47024, "epoch": 1119} {"train_loss": -5.668615818023682, "global_step": 47025, "epoch": 1119} {"train_loss": -5.73208475112915, "global_step": 47026, "epoch": 1119} {"train_loss": -5.790792465209961, "global_step": 47027, "epoch": 1119} {"train_loss": -5.65786075592041, "global_step": 47028, "epoch": 1119} {"train_loss": -5.679405689239502, "global_step": 47029, "epoch": 1119} {"train_loss": -5.7564568519592285, "global_step": 47030, "epoch": 1119} {"train_loss": -5.685581684112549, "global_step": 47031, "epoch": 1119} {"train_loss": -5.889655113220215, "global_step": 47032, "epoch": 1119} {"train_loss": -5.8204450607299805, "global_step": 47033, "epoch": 1119} {"train_loss": -5.743414402008057, "global_step": 47034, "epoch": 1119} {"train_loss": -5.702305793762207, "global_step": 47035, "epoch": 1119} {"train_loss": -5.760416507720947, "global_step": 47036, "epoch": 1119} {"train_loss": -5.725589752197266, "global_step": 47037, "epoch": 1119} {"train_loss": -5.7449493408203125, "global_step": 47038, "epoch": 1119} {"train_loss": -5.73701456614903, "global_step": 47039, "epoch": 1119, "val_loss": 61676.73046875} {"train_loss": -5.734969139099121, "global_step": 47040, "epoch": 1120} {"train_loss": -5.702340602874756, "global_step": 47041, "epoch": 1120} {"train_loss": -5.658441543579102, "global_step": 47042, "epoch": 1120} {"train_loss": -5.486071586608887, "global_step": 47043, "epoch": 1120} {"train_loss": -5.812211036682129, "global_step": 47044, "epoch": 1120} {"train_loss": -5.750919342041016, "global_step": 47045, "epoch": 1120} {"train_loss": -5.653367042541504, "global_step": 47046, "epoch": 1120} {"train_loss": -5.781078338623047, "global_step": 47047, "epoch": 1120} {"train_loss": -5.71921443939209, "global_step": 47048, "epoch": 1120} {"train_loss": -5.670315265655518, "global_step": 47049, "epoch": 1120} {"train_loss": -5.615721702575684, "global_step": 47050, "epoch": 1120} {"train_loss": -5.61637544631958, "global_step": 47051, "epoch": 1120} {"train_loss": -5.738107681274414, "global_step": 47052, "epoch": 1120} {"train_loss": -5.628456115722656, "global_step": 47053, "epoch": 1120} {"train_loss": -5.730597019195557, "global_step": 47054, "epoch": 1120} {"train_loss": -5.662921905517578, "global_step": 47055, "epoch": 1120} {"train_loss": -5.721426010131836, "global_step": 47056, "epoch": 1120} {"train_loss": -5.536581516265869, "global_step": 47057, "epoch": 1120} {"train_loss": -5.513271331787109, "global_step": 47058, "epoch": 1120} {"train_loss": -5.737464427947998, "global_step": 47059, "epoch": 1120} {"train_loss": -5.76708984375, "global_step": 47060, "epoch": 1120} {"train_loss": -5.704424858093262, "global_step": 47061, "epoch": 1120} {"train_loss": -5.680051326751709, "global_step": 47062, "epoch": 1120} {"train_loss": -5.731741428375244, "global_step": 47063, "epoch": 1120} {"train_loss": -5.820372581481934, "global_step": 47064, "epoch": 1120} {"train_loss": -5.69234037399292, "global_step": 47065, "epoch": 1120} {"train_loss": -5.767339706420898, "global_step": 47066, "epoch": 1120} {"train_loss": -5.713903903961182, "global_step": 47067, "epoch": 1120} {"train_loss": -5.7514495849609375, "global_step": 47068, "epoch": 1120} {"train_loss": -5.775473117828369, "global_step": 47069, "epoch": 1120} {"train_loss": -5.7655792236328125, "global_step": 47070, "epoch": 1120} {"train_loss": -5.764807224273682, "global_step": 47071, "epoch": 1120} {"train_loss": -5.708424091339111, "global_step": 47072, "epoch": 1120} {"train_loss": -5.749436378479004, "global_step": 47073, "epoch": 1120} {"train_loss": -5.780364036560059, "global_step": 47074, "epoch": 1120} {"train_loss": -5.686792373657227, "global_step": 47075, "epoch": 1120} {"train_loss": -5.7147603034973145, "global_step": 47076, "epoch": 1120} {"train_loss": -5.866273403167725, "global_step": 47077, "epoch": 1120} {"train_loss": -5.735508918762207, "global_step": 47078, "epoch": 1120} {"train_loss": -5.632694244384766, "global_step": 47079, "epoch": 1120} {"train_loss": -5.857278823852539, "global_step": 47080, "epoch": 1120} {"train_loss": -5.710713431948707, "global_step": 47081, "epoch": 1120, "val_loss": 61738.546875} {"train_loss": -5.809756755828857, "global_step": 47082, "epoch": 1121} {"train_loss": -5.667359352111816, "global_step": 47083, "epoch": 1121} {"train_loss": -5.692397594451904, "global_step": 47084, "epoch": 1121} {"train_loss": -5.830538749694824, "global_step": 47085, "epoch": 1121} {"train_loss": -5.7810516357421875, "global_step": 47086, "epoch": 1121} {"train_loss": -5.645074844360352, "global_step": 47087, "epoch": 1121} {"train_loss": -5.6844892501831055, "global_step": 47088, "epoch": 1121} {"train_loss": -5.646414279937744, "global_step": 47089, "epoch": 1121} {"train_loss": -5.751228332519531, "global_step": 47090, "epoch": 1121} {"train_loss": -5.670952320098877, "global_step": 47091, "epoch": 1121} {"train_loss": -5.807675361633301, "global_step": 47092, "epoch": 1121} {"train_loss": -5.708762168884277, "global_step": 47093, "epoch": 1121} {"train_loss": -5.779417991638184, "global_step": 47094, "epoch": 1121} {"train_loss": -5.761384963989258, "global_step": 47095, "epoch": 1121} {"train_loss": -5.745053768157959, "global_step": 47096, "epoch": 1121} {"train_loss": -5.798906326293945, "global_step": 47097, "epoch": 1121} {"train_loss": -5.792832851409912, "global_step": 47098, "epoch": 1121} {"train_loss": -5.7552809715271, "global_step": 47099, "epoch": 1121} {"train_loss": -5.8273396492004395, "global_step": 47100, "epoch": 1121} {"train_loss": -5.755620956420898, "global_step": 47101, "epoch": 1121} {"train_loss": -5.728633880615234, "global_step": 47102, "epoch": 1121} {"train_loss": -5.760699272155762, "global_step": 47103, "epoch": 1121} {"train_loss": -5.6721110343933105, "global_step": 47104, "epoch": 1121} {"train_loss": -5.796265125274658, "global_step": 47105, "epoch": 1121} {"train_loss": -5.694802761077881, "global_step": 47106, "epoch": 1121} {"train_loss": -5.666792392730713, "global_step": 47107, "epoch": 1121} {"train_loss": -5.63875150680542, "global_step": 47108, "epoch": 1121} {"train_loss": -5.620509147644043, "global_step": 47109, "epoch": 1121} {"train_loss": -5.702367782592773, "global_step": 47110, "epoch": 1121} {"train_loss": -5.758504390716553, "global_step": 47111, "epoch": 1121} {"train_loss": -5.7510199546813965, "global_step": 47112, "epoch": 1121} {"train_loss": -5.698328971862793, "global_step": 47113, "epoch": 1121} {"train_loss": -5.834844589233398, "global_step": 47114, "epoch": 1121} {"train_loss": -5.75206184387207, "global_step": 47115, "epoch": 1121} {"train_loss": -5.665689945220947, "global_step": 47116, "epoch": 1121} {"train_loss": -5.83894157409668, "global_step": 47117, "epoch": 1121} {"train_loss": -5.742387294769287, "global_step": 47118, "epoch": 1121} {"train_loss": -5.728503227233887, "global_step": 47119, "epoch": 1121} {"train_loss": -5.784638404846191, "global_step": 47120, "epoch": 1121} {"train_loss": -5.796051979064941, "global_step": 47121, "epoch": 1121} {"train_loss": -5.776371955871582, "global_step": 47122, "epoch": 1121} {"train_loss": -5.740846157073975, "global_step": 47123, "epoch": 1121, "val_loss": 61544.71875} {"train_loss": -5.806097984313965, "global_step": 47124, "epoch": 1122} {"train_loss": -5.655758857727051, "global_step": 47125, "epoch": 1122} {"train_loss": -5.830715179443359, "global_step": 47126, "epoch": 1122} {"train_loss": -5.756394863128662, "global_step": 47127, "epoch": 1122} {"train_loss": -5.674953937530518, "global_step": 47128, "epoch": 1122} {"train_loss": -5.662716865539551, "global_step": 47129, "epoch": 1122} {"train_loss": -5.736630916595459, "global_step": 47130, "epoch": 1122} {"train_loss": -5.699141502380371, "global_step": 47131, "epoch": 1122} {"train_loss": -5.717854022979736, "global_step": 47132, "epoch": 1122} {"train_loss": -5.857454776763916, "global_step": 47133, "epoch": 1122} {"train_loss": -5.731170177459717, "global_step": 47134, "epoch": 1122} {"train_loss": -5.556650638580322, "global_step": 47135, "epoch": 1122} {"train_loss": -5.851424217224121, "global_step": 47136, "epoch": 1122} {"train_loss": -5.669114112854004, "global_step": 47137, "epoch": 1122} {"train_loss": -5.705132961273193, "global_step": 47138, "epoch": 1122} {"train_loss": -5.829674243927002, "global_step": 47139, "epoch": 1122} {"train_loss": -5.779083251953125, "global_step": 47140, "epoch": 1122} {"train_loss": -5.6767168045043945, "global_step": 47141, "epoch": 1122} {"train_loss": -5.787039756774902, "global_step": 47142, "epoch": 1122} {"train_loss": -5.60499382019043, "global_step": 47143, "epoch": 1122} {"train_loss": -5.812869071960449, "global_step": 47144, "epoch": 1122} {"train_loss": -5.802914619445801, "global_step": 47145, "epoch": 1122} {"train_loss": -5.670398235321045, "global_step": 47146, "epoch": 1122} {"train_loss": -5.618385314941406, "global_step": 47147, "epoch": 1122} {"train_loss": -5.691987037658691, "global_step": 47148, "epoch": 1122} {"train_loss": -5.690827369689941, "global_step": 47149, "epoch": 1122} {"train_loss": -5.712714672088623, "global_step": 47150, "epoch": 1122} {"train_loss": -5.687501907348633, "global_step": 47151, "epoch": 1122} {"train_loss": -5.754889965057373, "global_step": 47152, "epoch": 1122} {"train_loss": -5.726706504821777, "global_step": 47153, "epoch": 1122} {"train_loss": -5.873845100402832, "global_step": 47154, "epoch": 1122} {"train_loss": -5.730112552642822, "global_step": 47155, "epoch": 1122} {"train_loss": -5.670530319213867, "global_step": 47156, "epoch": 1122} {"train_loss": -5.783072471618652, "global_step": 47157, "epoch": 1122} {"train_loss": -5.670060157775879, "global_step": 47158, "epoch": 1122} {"train_loss": -5.788288116455078, "global_step": 47159, "epoch": 1122} {"train_loss": -5.701754570007324, "global_step": 47160, "epoch": 1122} {"train_loss": -5.644558429718018, "global_step": 47161, "epoch": 1122} {"train_loss": -5.674225330352783, "global_step": 47162, "epoch": 1122} {"train_loss": -5.618344783782959, "global_step": 47163, "epoch": 1122} {"train_loss": -5.746367454528809, "global_step": 47164, "epoch": 1122} {"train_loss": -5.72341445514134, "global_step": 47165, "epoch": 1122, "val_loss": 61658.5625} {"train_loss": -5.691926002502441, "global_step": 47166, "epoch": 1123} {"train_loss": -5.7848896980285645, "global_step": 47167, "epoch": 1123} {"train_loss": -5.73525333404541, "global_step": 47168, "epoch": 1123} {"train_loss": -5.646907329559326, "global_step": 47169, "epoch": 1123} {"train_loss": -5.761590480804443, "global_step": 47170, "epoch": 1123} {"train_loss": -5.747360706329346, "global_step": 47171, "epoch": 1123} {"train_loss": -5.7748918533325195, "global_step": 47172, "epoch": 1123} {"train_loss": -5.733608245849609, "global_step": 47173, "epoch": 1123} {"train_loss": -5.722739219665527, "global_step": 47174, "epoch": 1123} {"train_loss": -5.723712921142578, "global_step": 47175, "epoch": 1123} {"train_loss": -5.743900299072266, "global_step": 47176, "epoch": 1123} {"train_loss": -5.7676873207092285, "global_step": 47177, "epoch": 1123} {"train_loss": -5.766791820526123, "global_step": 47178, "epoch": 1123} {"train_loss": -5.758027076721191, "global_step": 47179, "epoch": 1123} {"train_loss": -5.786232948303223, "global_step": 47180, "epoch": 1123} {"train_loss": -5.804778099060059, "global_step": 47181, "epoch": 1123} {"train_loss": -5.7373762130737305, "global_step": 47182, "epoch": 1123} {"train_loss": -5.760077476501465, "global_step": 47183, "epoch": 1123} {"train_loss": -5.724098205566406, "global_step": 47184, "epoch": 1123} {"train_loss": -5.701165199279785, "global_step": 47185, "epoch": 1123} {"train_loss": -5.789374351501465, "global_step": 47186, "epoch": 1123} {"train_loss": -5.507361888885498, "global_step": 47187, "epoch": 1123} {"train_loss": -5.655280590057373, "global_step": 47188, "epoch": 1123} {"train_loss": -5.612565994262695, "global_step": 47189, "epoch": 1123} {"train_loss": -5.832714080810547, "global_step": 47190, "epoch": 1123} {"train_loss": -5.719906806945801, "global_step": 47191, "epoch": 1123} {"train_loss": -5.622178077697754, "global_step": 47192, "epoch": 1123} {"train_loss": -5.685275077819824, "global_step": 47193, "epoch": 1123} {"train_loss": -5.705755233764648, "global_step": 47194, "epoch": 1123} {"train_loss": -5.778082370758057, "global_step": 47195, "epoch": 1123} {"train_loss": -5.773212432861328, "global_step": 47196, "epoch": 1123} {"train_loss": -5.718727111816406, "global_step": 47197, "epoch": 1123} {"train_loss": -5.844468593597412, "global_step": 47198, "epoch": 1123} {"train_loss": -5.780551433563232, "global_step": 47199, "epoch": 1123} {"train_loss": -5.6361894607543945, "global_step": 47200, "epoch": 1123} {"train_loss": -5.6733903884887695, "global_step": 47201, "epoch": 1123} {"train_loss": -5.650529861450195, "global_step": 47202, "epoch": 1123} {"train_loss": -5.800952911376953, "global_step": 47203, "epoch": 1123} {"train_loss": -5.751677513122559, "global_step": 47204, "epoch": 1123} {"train_loss": -5.701385021209717, "global_step": 47205, "epoch": 1123} {"train_loss": -5.717519283294678, "global_step": 47206, "epoch": 1123} {"train_loss": -5.726954812095279, "global_step": 47207, "epoch": 1123, "val_loss": 62003.32421875} {"train_loss": -5.79143762588501, "global_step": 47208, "epoch": 1124} {"train_loss": -5.759289741516113, "global_step": 47209, "epoch": 1124} {"train_loss": -5.856252193450928, "global_step": 47210, "epoch": 1124} {"train_loss": -5.666016578674316, "global_step": 47211, "epoch": 1124} {"train_loss": -5.554900646209717, "global_step": 47212, "epoch": 1124} {"train_loss": -5.738447189331055, "global_step": 47213, "epoch": 1124} {"train_loss": -5.683796405792236, "global_step": 47214, "epoch": 1124} {"train_loss": -5.686412811279297, "global_step": 47215, "epoch": 1124} {"train_loss": -5.64071798324585, "global_step": 47216, "epoch": 1124} {"train_loss": -5.440223693847656, "global_step": 47217, "epoch": 1124} {"train_loss": -5.687302589416504, "global_step": 47218, "epoch": 1124} {"train_loss": -5.591246604919434, "global_step": 47219, "epoch": 1124} {"train_loss": -5.6134419441223145, "global_step": 47220, "epoch": 1124} {"train_loss": -5.6479010581970215, "global_step": 47221, "epoch": 1124} {"train_loss": -5.5512189865112305, "global_step": 47222, "epoch": 1124} {"train_loss": -5.640186309814453, "global_step": 47223, "epoch": 1124} {"train_loss": -5.508262634277344, "global_step": 47224, "epoch": 1124} {"train_loss": -5.668048858642578, "global_step": 47225, "epoch": 1124} {"train_loss": -5.646233558654785, "global_step": 47226, "epoch": 1124} {"train_loss": -5.711929798126221, "global_step": 47227, "epoch": 1124} {"train_loss": -5.765097618103027, "global_step": 47228, "epoch": 1124} {"train_loss": -5.632157802581787, "global_step": 47229, "epoch": 1124} {"train_loss": -5.71772575378418, "global_step": 47230, "epoch": 1124} {"train_loss": -5.523253917694092, "global_step": 47231, "epoch": 1124} {"train_loss": -5.6630778312683105, "global_step": 47232, "epoch": 1124} {"train_loss": -5.674686431884766, "global_step": 47233, "epoch": 1124} {"train_loss": -5.6260576248168945, "global_step": 47234, "epoch": 1124} {"train_loss": -5.643610954284668, "global_step": 47235, "epoch": 1124} {"train_loss": -5.670767784118652, "global_step": 47236, "epoch": 1124} {"train_loss": -5.656994342803955, "global_step": 47237, "epoch": 1124} {"train_loss": -5.781184196472168, "global_step": 47238, "epoch": 1124} {"train_loss": -5.679848670959473, "global_step": 47239, "epoch": 1124} {"train_loss": -5.786923408508301, "global_step": 47240, "epoch": 1124} {"train_loss": -5.69743013381958, "global_step": 47241, "epoch": 1124} {"train_loss": -5.7003493309021, "global_step": 47242, "epoch": 1124} {"train_loss": -5.618674278259277, "global_step": 47243, "epoch": 1124} {"train_loss": -5.862095832824707, "global_step": 47244, "epoch": 1124} {"train_loss": -5.672687530517578, "global_step": 47245, "epoch": 1124} {"train_loss": -5.6081037521362305, "global_step": 47246, "epoch": 1124} {"train_loss": -5.745859146118164, "global_step": 47247, "epoch": 1124} {"train_loss": -5.673675060272217, "global_step": 47248, "epoch": 1124} {"train_loss": -5.671898035776048, "global_step": 47249, "epoch": 1124, "val_loss": 61530.8125} {"train_loss": -5.694799423217773, "global_step": 47250, "epoch": 1125} {"train_loss": -5.704499244689941, "global_step": 47251, "epoch": 1125} {"train_loss": -5.711423397064209, "global_step": 47252, "epoch": 1125} {"train_loss": -5.744409561157227, "global_step": 47253, "epoch": 1125} {"train_loss": -5.719460487365723, "global_step": 47254, "epoch": 1125} {"train_loss": -5.8338623046875, "global_step": 47255, "epoch": 1125} {"train_loss": -5.756510257720947, "global_step": 47256, "epoch": 1125} {"train_loss": -5.682835578918457, "global_step": 47257, "epoch": 1125} {"train_loss": -5.766996383666992, "global_step": 47258, "epoch": 1125} {"train_loss": -5.657526016235352, "global_step": 47259, "epoch": 1125} {"train_loss": -5.6444501876831055, "global_step": 47260, "epoch": 1125} {"train_loss": -5.698118209838867, "global_step": 47261, "epoch": 1125} {"train_loss": -5.675182819366455, "global_step": 47262, "epoch": 1125} {"train_loss": -5.697880744934082, "global_step": 47263, "epoch": 1125} {"train_loss": -5.766483783721924, "global_step": 47264, "epoch": 1125} {"train_loss": -5.787845611572266, "global_step": 47265, "epoch": 1125} {"train_loss": -5.7751946449279785, "global_step": 47266, "epoch": 1125} {"train_loss": -5.830202102661133, "global_step": 47267, "epoch": 1125} {"train_loss": -5.758292198181152, "global_step": 47268, "epoch": 1125} {"train_loss": -5.869223117828369, "global_step": 47269, "epoch": 1125} {"train_loss": -5.7069172859191895, "global_step": 47270, "epoch": 1125} {"train_loss": -5.717333793640137, "global_step": 47271, "epoch": 1125} {"train_loss": -5.726536750793457, "global_step": 47272, "epoch": 1125} {"train_loss": -5.690013885498047, "global_step": 47273, "epoch": 1125} {"train_loss": -5.809969425201416, "global_step": 47274, "epoch": 1125} {"train_loss": -5.720456123352051, "global_step": 47275, "epoch": 1125} {"train_loss": -5.8043212890625, "global_step": 47276, "epoch": 1125} {"train_loss": -5.83763313293457, "global_step": 47277, "epoch": 1125} {"train_loss": -5.732582092285156, "global_step": 47278, "epoch": 1125} {"train_loss": -5.627439975738525, "global_step": 47279, "epoch": 1125} {"train_loss": -5.679270267486572, "global_step": 47280, "epoch": 1125} {"train_loss": -5.852375507354736, "global_step": 47281, "epoch": 1125} {"train_loss": -5.7359418869018555, "global_step": 47282, "epoch": 1125} {"train_loss": -5.764014720916748, "global_step": 47283, "epoch": 1125} {"train_loss": -5.681026458740234, "global_step": 47284, "epoch": 1125} {"train_loss": -5.6929192543029785, "global_step": 47285, "epoch": 1125} {"train_loss": -5.689053535461426, "global_step": 47286, "epoch": 1125} {"train_loss": -5.745334625244141, "global_step": 47287, "epoch": 1125} {"train_loss": -5.810191631317139, "global_step": 47288, "epoch": 1125} {"train_loss": -5.797746658325195, "global_step": 47289, "epoch": 1125} {"train_loss": -5.867119789123535, "global_step": 47290, "epoch": 1125} {"train_loss": -5.746721653711228, "global_step": 47291, "epoch": 1125, "val_loss": 61425.6328125} {"train_loss": -5.818198204040527, "global_step": 47292, "epoch": 1126} {"train_loss": -5.693036079406738, "global_step": 47293, "epoch": 1126} {"train_loss": -5.788344860076904, "global_step": 47294, "epoch": 1126} {"train_loss": -5.855381011962891, "global_step": 47295, "epoch": 1126} {"train_loss": -5.855654716491699, "global_step": 47296, "epoch": 1126} {"train_loss": -5.734954357147217, "global_step": 47297, "epoch": 1126} {"train_loss": -5.668303966522217, "global_step": 47298, "epoch": 1126} {"train_loss": -5.793729782104492, "global_step": 47299, "epoch": 1126} {"train_loss": -5.754345893859863, "global_step": 47300, "epoch": 1126} {"train_loss": -5.8181939125061035, "global_step": 47301, "epoch": 1126} {"train_loss": -5.747003555297852, "global_step": 47302, "epoch": 1126} {"train_loss": -5.734985828399658, "global_step": 47303, "epoch": 1126} {"train_loss": -5.715444564819336, "global_step": 47304, "epoch": 1126} {"train_loss": -5.683844089508057, "global_step": 47305, "epoch": 1126} {"train_loss": -5.773038864135742, "global_step": 47306, "epoch": 1126} {"train_loss": -5.768861770629883, "global_step": 47307, "epoch": 1126} {"train_loss": -5.739906311035156, "global_step": 47308, "epoch": 1126} {"train_loss": -5.686641693115234, "global_step": 47309, "epoch": 1126} {"train_loss": -5.769883155822754, "global_step": 47310, "epoch": 1126} {"train_loss": -5.738152980804443, "global_step": 47311, "epoch": 1126} {"train_loss": -5.7494001388549805, "global_step": 47312, "epoch": 1126} {"train_loss": -5.665172576904297, "global_step": 47313, "epoch": 1126} {"train_loss": -5.647001266479492, "global_step": 47314, "epoch": 1126} {"train_loss": -5.793852806091309, "global_step": 47315, "epoch": 1126} {"train_loss": -5.750367164611816, "global_step": 47316, "epoch": 1126} {"train_loss": -5.773409843444824, "global_step": 47317, "epoch": 1126} {"train_loss": -5.65028715133667, "global_step": 47318, "epoch": 1126} {"train_loss": -5.607403755187988, "global_step": 47319, "epoch": 1126} {"train_loss": -5.849244117736816, "global_step": 47320, "epoch": 1126} {"train_loss": -5.556121826171875, "global_step": 47321, "epoch": 1126} {"train_loss": -5.692254066467285, "global_step": 47322, "epoch": 1126} {"train_loss": -5.688124656677246, "global_step": 47323, "epoch": 1126} {"train_loss": -5.534524917602539, "global_step": 47324, "epoch": 1126} {"train_loss": -5.700373649597168, "global_step": 47325, "epoch": 1126} {"train_loss": -5.7604756355285645, "global_step": 47326, "epoch": 1126} {"train_loss": -5.714651584625244, "global_step": 47327, "epoch": 1126} {"train_loss": -5.602182388305664, "global_step": 47328, "epoch": 1126} {"train_loss": -5.761223316192627, "global_step": 47329, "epoch": 1126} {"train_loss": -5.6074323654174805, "global_step": 47330, "epoch": 1126} {"train_loss": -5.743686676025391, "global_step": 47331, "epoch": 1126} {"train_loss": -5.753805160522461, "global_step": 47332, "epoch": 1126} {"train_loss": -5.726693879990351, "global_step": 47333, "epoch": 1126, "val_loss": 61531.08984375} {"train_loss": -5.581133842468262, "global_step": 47334, "epoch": 1127} {"train_loss": -5.698291301727295, "global_step": 47335, "epoch": 1127} {"train_loss": -5.611235618591309, "global_step": 47336, "epoch": 1127} {"train_loss": -5.70290994644165, "global_step": 47337, "epoch": 1127} {"train_loss": -5.726728439331055, "global_step": 47338, "epoch": 1127} {"train_loss": -5.788958549499512, "global_step": 47339, "epoch": 1127} {"train_loss": -5.799131393432617, "global_step": 47340, "epoch": 1127} {"train_loss": -5.707014083862305, "global_step": 47341, "epoch": 1127} {"train_loss": -5.679950714111328, "global_step": 47342, "epoch": 1127} {"train_loss": -5.828368186950684, "global_step": 47343, "epoch": 1127} {"train_loss": -5.801091194152832, "global_step": 47344, "epoch": 1127} {"train_loss": -5.793318271636963, "global_step": 47345, "epoch": 1127} {"train_loss": -5.696805000305176, "global_step": 47346, "epoch": 1127} {"train_loss": -5.875802993774414, "global_step": 47347, "epoch": 1127} {"train_loss": -5.754272937774658, "global_step": 47348, "epoch": 1127} {"train_loss": -5.6742963790893555, "global_step": 47349, "epoch": 1127} {"train_loss": -5.760794639587402, "global_step": 47350, "epoch": 1127} {"train_loss": -5.859054088592529, "global_step": 47351, "epoch": 1127} {"train_loss": -5.738527774810791, "global_step": 47352, "epoch": 1127} {"train_loss": -5.94193696975708, "global_step": 47353, "epoch": 1127} {"train_loss": -5.631802082061768, "global_step": 47354, "epoch": 1127} {"train_loss": -5.848850727081299, "global_step": 47355, "epoch": 1127} {"train_loss": -5.753808498382568, "global_step": 47356, "epoch": 1127} {"train_loss": -5.736980438232422, "global_step": 47357, "epoch": 1127} {"train_loss": -5.690757751464844, "global_step": 47358, "epoch": 1127} {"train_loss": -5.744296073913574, "global_step": 47359, "epoch": 1127} {"train_loss": -5.743419170379639, "global_step": 47360, "epoch": 1127} {"train_loss": -5.708611488342285, "global_step": 47361, "epoch": 1127} {"train_loss": -5.8283562660217285, "global_step": 47362, "epoch": 1127} {"train_loss": -5.738544464111328, "global_step": 47363, "epoch": 1127} {"train_loss": -5.7804741859436035, "global_step": 47364, "epoch": 1127} {"train_loss": -5.745907783508301, "global_step": 47365, "epoch": 1127} {"train_loss": -5.867031097412109, "global_step": 47366, "epoch": 1127} {"train_loss": -5.740347385406494, "global_step": 47367, "epoch": 1127} {"train_loss": -5.807272911071777, "global_step": 47368, "epoch": 1127} {"train_loss": -5.777432441711426, "global_step": 47369, "epoch": 1127} {"train_loss": -5.801315784454346, "global_step": 47370, "epoch": 1127} {"train_loss": -5.776535987854004, "global_step": 47371, "epoch": 1127} {"train_loss": -5.808181285858154, "global_step": 47372, "epoch": 1127} {"train_loss": -5.82066535949707, "global_step": 47373, "epoch": 1127} {"train_loss": -5.817373275756836, "global_step": 47374, "epoch": 1127} {"train_loss": -5.760088863826933, "global_step": 47375, "epoch": 1127, "val_loss": 61644.48046875} {"train_loss": -5.6829915046691895, "global_step": 47376, "epoch": 1128} {"train_loss": -5.58944034576416, "global_step": 47377, "epoch": 1128} {"train_loss": -5.840394020080566, "global_step": 47378, "epoch": 1128} {"train_loss": -5.693418979644775, "global_step": 47379, "epoch": 1128} {"train_loss": -5.698250770568848, "global_step": 47380, "epoch": 1128} {"train_loss": -5.707526206970215, "global_step": 47381, "epoch": 1128} {"train_loss": -5.696977138519287, "global_step": 47382, "epoch": 1128} {"train_loss": -5.747283935546875, "global_step": 47383, "epoch": 1128} {"train_loss": -5.74873161315918, "global_step": 47384, "epoch": 1128} {"train_loss": -5.6887407302856445, "global_step": 47385, "epoch": 1128} {"train_loss": -5.629919052124023, "global_step": 47386, "epoch": 1128} {"train_loss": -5.741335868835449, "global_step": 47387, "epoch": 1128} {"train_loss": -5.7143964767456055, "global_step": 47388, "epoch": 1128} {"train_loss": -5.715167999267578, "global_step": 47389, "epoch": 1128} {"train_loss": -5.747976303100586, "global_step": 47390, "epoch": 1128} {"train_loss": -5.7466278076171875, "global_step": 47391, "epoch": 1128} {"train_loss": -5.8048248291015625, "global_step": 47392, "epoch": 1128} {"train_loss": -5.823850631713867, "global_step": 47393, "epoch": 1128} {"train_loss": -5.709216117858887, "global_step": 47394, "epoch": 1128} {"train_loss": -5.677417755126953, "global_step": 47395, "epoch": 1128} {"train_loss": -5.772257328033447, "global_step": 47396, "epoch": 1128} {"train_loss": -5.717437744140625, "global_step": 47397, "epoch": 1128} {"train_loss": -5.758874893188477, "global_step": 47398, "epoch": 1128} {"train_loss": -5.771420955657959, "global_step": 47399, "epoch": 1128} {"train_loss": -5.7495880126953125, "global_step": 47400, "epoch": 1128} {"train_loss": -5.611138343811035, "global_step": 47401, "epoch": 1128} {"train_loss": -5.7369279861450195, "global_step": 47402, "epoch": 1128} {"train_loss": -5.71589469909668, "global_step": 47403, "epoch": 1128} {"train_loss": -5.668381690979004, "global_step": 47404, "epoch": 1128} {"train_loss": -5.699548721313477, "global_step": 47405, "epoch": 1128} {"train_loss": -5.754547119140625, "global_step": 47406, "epoch": 1128} {"train_loss": -5.679535388946533, "global_step": 47407, "epoch": 1128} {"train_loss": -5.634195804595947, "global_step": 47408, "epoch": 1128} {"train_loss": -5.6297149658203125, "global_step": 47409, "epoch": 1128} {"train_loss": -5.688351154327393, "global_step": 47410, "epoch": 1128} {"train_loss": -5.7113447189331055, "global_step": 47411, "epoch": 1128} {"train_loss": -5.748801231384277, "global_step": 47412, "epoch": 1128} {"train_loss": -5.743692398071289, "global_step": 47413, "epoch": 1128} {"train_loss": -5.591513633728027, "global_step": 47414, "epoch": 1128} {"train_loss": -5.759469032287598, "global_step": 47415, "epoch": 1128} {"train_loss": -5.700945854187012, "global_step": 47416, "epoch": 1128} {"train_loss": -5.7187636920384, "global_step": 47417, "epoch": 1128, "val_loss": 61824.61328125} {"train_loss": -5.747358798980713, "global_step": 47418, "epoch": 1129} {"train_loss": -5.754159927368164, "global_step": 47419, "epoch": 1129} {"train_loss": -5.764684677124023, "global_step": 47420, "epoch": 1129} {"train_loss": -5.9076008796691895, "global_step": 47421, "epoch": 1129} {"train_loss": -5.815486907958984, "global_step": 47422, "epoch": 1129} {"train_loss": -5.739459991455078, "global_step": 47423, "epoch": 1129} {"train_loss": -5.7399210929870605, "global_step": 47424, "epoch": 1129} {"train_loss": -5.673635959625244, "global_step": 47425, "epoch": 1129} {"train_loss": -5.812318325042725, "global_step": 47426, "epoch": 1129} {"train_loss": -5.698389530181885, "global_step": 47427, "epoch": 1129} {"train_loss": -5.716899871826172, "global_step": 47428, "epoch": 1129} {"train_loss": -5.6980695724487305, "global_step": 47429, "epoch": 1129} {"train_loss": -5.850465774536133, "global_step": 47430, "epoch": 1129} {"train_loss": -5.76473331451416, "global_step": 47431, "epoch": 1129} {"train_loss": -5.754420280456543, "global_step": 47432, "epoch": 1129} {"train_loss": -5.811738014221191, "global_step": 47433, "epoch": 1129} {"train_loss": -5.686709880828857, "global_step": 47434, "epoch": 1129} {"train_loss": -5.708620548248291, "global_step": 47435, "epoch": 1129} {"train_loss": -5.7089338302612305, "global_step": 47436, "epoch": 1129} {"train_loss": -5.758641242980957, "global_step": 47437, "epoch": 1129} {"train_loss": -5.5784173011779785, "global_step": 47438, "epoch": 1129} {"train_loss": -5.7081217765808105, "global_step": 47439, "epoch": 1129} {"train_loss": -5.826400279998779, "global_step": 47440, "epoch": 1129} {"train_loss": -5.718007564544678, "global_step": 47441, "epoch": 1129} {"train_loss": -5.778027534484863, "global_step": 47442, "epoch": 1129} {"train_loss": -5.856008529663086, "global_step": 47443, "epoch": 1129} {"train_loss": -5.805667877197266, "global_step": 47444, "epoch": 1129} {"train_loss": -5.630264759063721, "global_step": 47445, "epoch": 1129} {"train_loss": -5.63385009765625, "global_step": 47446, "epoch": 1129} {"train_loss": -5.617733001708984, "global_step": 47447, "epoch": 1129} {"train_loss": -5.771651268005371, "global_step": 47448, "epoch": 1129} {"train_loss": -5.716424465179443, "global_step": 47449, "epoch": 1129} {"train_loss": -5.617631912231445, "global_step": 47450, "epoch": 1129} {"train_loss": -5.773093223571777, "global_step": 47451, "epoch": 1129} {"train_loss": -5.709965229034424, "global_step": 47452, "epoch": 1129} {"train_loss": -5.717315196990967, "global_step": 47453, "epoch": 1129} {"train_loss": -5.789756774902344, "global_step": 47454, "epoch": 1129} {"train_loss": -5.6567864418029785, "global_step": 47455, "epoch": 1129} {"train_loss": -5.652066230773926, "global_step": 47456, "epoch": 1129} {"train_loss": -5.709394454956055, "global_step": 47457, "epoch": 1129} {"train_loss": -5.673553466796875, "global_step": 47458, "epoch": 1129} {"train_loss": -5.734901223863874, "global_step": 47459, "epoch": 1129, "val_loss": 61455.67578125} {"train_loss": -5.756071090698242, "global_step": 47460, "epoch": 1130} {"train_loss": -5.772269248962402, "global_step": 47461, "epoch": 1130} {"train_loss": -5.824345588684082, "global_step": 47462, "epoch": 1130} {"train_loss": -5.761882781982422, "global_step": 47463, "epoch": 1130} {"train_loss": -5.793623924255371, "global_step": 47464, "epoch": 1130} {"train_loss": -5.672226905822754, "global_step": 47465, "epoch": 1130} {"train_loss": -5.867440223693848, "global_step": 47466, "epoch": 1130} {"train_loss": -5.724059104919434, "global_step": 47467, "epoch": 1130} {"train_loss": -5.765009880065918, "global_step": 47468, "epoch": 1130} {"train_loss": -5.754333972930908, "global_step": 47469, "epoch": 1130} {"train_loss": -5.711565017700195, "global_step": 47470, "epoch": 1130} {"train_loss": -5.737841606140137, "global_step": 47471, "epoch": 1130} {"train_loss": -5.809446811676025, "global_step": 47472, "epoch": 1130} {"train_loss": -5.7314772605896, "global_step": 47473, "epoch": 1130} {"train_loss": -5.769529819488525, "global_step": 47474, "epoch": 1130} {"train_loss": -5.744308948516846, "global_step": 47475, "epoch": 1130} {"train_loss": -5.768671989440918, "global_step": 47476, "epoch": 1130} {"train_loss": -5.6779704093933105, "global_step": 47477, "epoch": 1130} {"train_loss": -5.662972450256348, "global_step": 47478, "epoch": 1130} {"train_loss": -5.734460353851318, "global_step": 47479, "epoch": 1130} {"train_loss": -5.736533164978027, "global_step": 47480, "epoch": 1130} {"train_loss": -5.810656547546387, "global_step": 47481, "epoch": 1130} {"train_loss": -5.775754928588867, "global_step": 47482, "epoch": 1130} {"train_loss": -5.7845964431762695, "global_step": 47483, "epoch": 1130} {"train_loss": -5.739523887634277, "global_step": 47484, "epoch": 1130} {"train_loss": -5.732733249664307, "global_step": 47485, "epoch": 1130} {"train_loss": -5.753090858459473, "global_step": 47486, "epoch": 1130} {"train_loss": -5.7372894287109375, "global_step": 47487, "epoch": 1130} {"train_loss": -5.721396446228027, "global_step": 47488, "epoch": 1130} {"train_loss": -5.787657737731934, "global_step": 47489, "epoch": 1130} {"train_loss": -5.745691299438477, "global_step": 47490, "epoch": 1130} {"train_loss": -5.7434892654418945, "global_step": 47491, "epoch": 1130} {"train_loss": -5.761538982391357, "global_step": 47492, "epoch": 1130} {"train_loss": -5.815366744995117, "global_step": 47493, "epoch": 1130} {"train_loss": -5.697819709777832, "global_step": 47494, "epoch": 1130} {"train_loss": -5.648168563842773, "global_step": 47495, "epoch": 1130} {"train_loss": -5.736478805541992, "global_step": 47496, "epoch": 1130} {"train_loss": -5.612236022949219, "global_step": 47497, "epoch": 1130} {"train_loss": -5.766647815704346, "global_step": 47498, "epoch": 1130} {"train_loss": -5.847536087036133, "global_step": 47499, "epoch": 1130} {"train_loss": -5.8266143798828125, "global_step": 47500, "epoch": 1130} {"train_loss": -5.7504916077568415, "global_step": 47501, "epoch": 1130, "val_loss": 61591.6640625} {"train_loss": -5.79223108291626, "global_step": 47502, "epoch": 1131} {"train_loss": -5.751058101654053, "global_step": 47503, "epoch": 1131} {"train_loss": -5.622508525848389, "global_step": 47504, "epoch": 1131} {"train_loss": -5.769568920135498, "global_step": 47505, "epoch": 1131} {"train_loss": -5.754944801330566, "global_step": 47506, "epoch": 1131} {"train_loss": -5.7435622215271, "global_step": 47507, "epoch": 1131} {"train_loss": -5.792712688446045, "global_step": 47508, "epoch": 1131} {"train_loss": -5.704155921936035, "global_step": 47509, "epoch": 1131} {"train_loss": -5.6585164070129395, "global_step": 47510, "epoch": 1131} {"train_loss": -5.8473615646362305, "global_step": 47511, "epoch": 1131} {"train_loss": -5.725462913513184, "global_step": 47512, "epoch": 1131} {"train_loss": -5.755913734436035, "global_step": 47513, "epoch": 1131} {"train_loss": -5.69149112701416, "global_step": 47514, "epoch": 1131} {"train_loss": -5.663078308105469, "global_step": 47515, "epoch": 1131} {"train_loss": -5.79934024810791, "global_step": 47516, "epoch": 1131} {"train_loss": -5.734358787536621, "global_step": 47517, "epoch": 1131} {"train_loss": -5.801425933837891, "global_step": 47518, "epoch": 1131} {"train_loss": -5.778838157653809, "global_step": 47519, "epoch": 1131} {"train_loss": -5.735235691070557, "global_step": 47520, "epoch": 1131} {"train_loss": -5.7380266189575195, "global_step": 47521, "epoch": 1131} {"train_loss": -5.7182536125183105, "global_step": 47522, "epoch": 1131} {"train_loss": -5.655019283294678, "global_step": 47523, "epoch": 1131} {"train_loss": -5.696872711181641, "global_step": 47524, "epoch": 1131} {"train_loss": -5.648079872131348, "global_step": 47525, "epoch": 1131} {"train_loss": -5.579225063323975, "global_step": 47526, "epoch": 1131} {"train_loss": -5.738010406494141, "global_step": 47527, "epoch": 1131} {"train_loss": -5.762683868408203, "global_step": 47528, "epoch": 1131} {"train_loss": -5.603740692138672, "global_step": 47529, "epoch": 1131} {"train_loss": -5.664330005645752, "global_step": 47530, "epoch": 1131} {"train_loss": -5.530921936035156, "global_step": 47531, "epoch": 1131} {"train_loss": -5.606805801391602, "global_step": 47532, "epoch": 1131} {"train_loss": -5.629272937774658, "global_step": 47533, "epoch": 1131} {"train_loss": -5.560605049133301, "global_step": 47534, "epoch": 1131} {"train_loss": -5.640991687774658, "global_step": 47535, "epoch": 1131} {"train_loss": -5.80086088180542, "global_step": 47536, "epoch": 1131} {"train_loss": -5.7406768798828125, "global_step": 47537, "epoch": 1131} {"train_loss": -5.662428855895996, "global_step": 47538, "epoch": 1131} {"train_loss": -5.679741859436035, "global_step": 47539, "epoch": 1131} {"train_loss": -5.547231197357178, "global_step": 47540, "epoch": 1131} {"train_loss": -5.80772590637207, "global_step": 47541, "epoch": 1131} {"train_loss": -5.6792731285095215, "global_step": 47542, "epoch": 1131} {"train_loss": -5.702430963516235, "global_step": 47543, "epoch": 1131, "val_loss": 61835.546875} {"train_loss": -5.81827449798584, "global_step": 47544, "epoch": 1132} {"train_loss": -5.588413715362549, "global_step": 47545, "epoch": 1132} {"train_loss": -5.635023593902588, "global_step": 47546, "epoch": 1132} {"train_loss": -5.800920009613037, "global_step": 47547, "epoch": 1132} {"train_loss": -5.789982795715332, "global_step": 47548, "epoch": 1132} {"train_loss": -5.807616233825684, "global_step": 47549, "epoch": 1132} {"train_loss": -5.869619369506836, "global_step": 47550, "epoch": 1132} {"train_loss": -5.800307273864746, "global_step": 47551, "epoch": 1132} {"train_loss": -5.714821815490723, "global_step": 47552, "epoch": 1132} {"train_loss": -5.750967025756836, "global_step": 47553, "epoch": 1132} {"train_loss": -5.724123001098633, "global_step": 47554, "epoch": 1132} {"train_loss": -5.724126815795898, "global_step": 47555, "epoch": 1132} {"train_loss": -5.817189693450928, "global_step": 47556, "epoch": 1132} {"train_loss": -5.651926040649414, "global_step": 47557, "epoch": 1132} {"train_loss": -5.547582149505615, "global_step": 47558, "epoch": 1132} {"train_loss": -5.722543716430664, "global_step": 47559, "epoch": 1132} {"train_loss": -5.840538024902344, "global_step": 47560, "epoch": 1132} {"train_loss": -5.7567901611328125, "global_step": 47561, "epoch": 1132} {"train_loss": -5.788091659545898, "global_step": 47562, "epoch": 1132} {"train_loss": -5.788834095001221, "global_step": 47563, "epoch": 1132} {"train_loss": -5.727441787719727, "global_step": 47564, "epoch": 1132} {"train_loss": -5.826841354370117, "global_step": 47565, "epoch": 1132} {"train_loss": -5.935153484344482, "global_step": 47566, "epoch": 1132} {"train_loss": -5.7884111404418945, "global_step": 47567, "epoch": 1132} {"train_loss": -5.727548122406006, "global_step": 47568, "epoch": 1132} {"train_loss": -5.778987884521484, "global_step": 47569, "epoch": 1132} {"train_loss": -5.737494468688965, "global_step": 47570, "epoch": 1132} {"train_loss": -5.685894966125488, "global_step": 47571, "epoch": 1132} {"train_loss": -5.686783790588379, "global_step": 47572, "epoch": 1132} {"train_loss": -5.766439437866211, "global_step": 47573, "epoch": 1132} {"train_loss": -5.809616565704346, "global_step": 47574, "epoch": 1132} {"train_loss": -5.735509395599365, "global_step": 47575, "epoch": 1132} {"train_loss": -5.708244800567627, "global_step": 47576, "epoch": 1132} {"train_loss": -5.639181137084961, "global_step": 47577, "epoch": 1132} {"train_loss": -5.676222801208496, "global_step": 47578, "epoch": 1132} {"train_loss": -5.689305305480957, "global_step": 47579, "epoch": 1132} {"train_loss": -5.717894554138184, "global_step": 47580, "epoch": 1132} {"train_loss": -5.721380233764648, "global_step": 47581, "epoch": 1132} {"train_loss": -5.793697357177734, "global_step": 47582, "epoch": 1132} {"train_loss": -5.72671365737915, "global_step": 47583, "epoch": 1132} {"train_loss": -5.655112266540527, "global_step": 47584, "epoch": 1132} {"train_loss": -5.743773460388184, "global_step": 47585, "epoch": 1132, "val_loss": 61648.2578125} {"train_loss": -5.821813106536865, "global_step": 47586, "epoch": 1133} {"train_loss": -5.763468265533447, "global_step": 47587, "epoch": 1133} {"train_loss": -5.705408096313477, "global_step": 47588, "epoch": 1133} {"train_loss": -5.648758888244629, "global_step": 47589, "epoch": 1133} {"train_loss": -5.640666961669922, "global_step": 47590, "epoch": 1133} {"train_loss": -5.827177047729492, "global_step": 47591, "epoch": 1133} {"train_loss": -5.783871650695801, "global_step": 47592, "epoch": 1133} {"train_loss": -5.681000232696533, "global_step": 47593, "epoch": 1133} {"train_loss": -5.786798477172852, "global_step": 47594, "epoch": 1133} {"train_loss": -5.714192867279053, "global_step": 47595, "epoch": 1133} {"train_loss": -5.710278511047363, "global_step": 47596, "epoch": 1133} {"train_loss": -5.790437698364258, "global_step": 47597, "epoch": 1133} {"train_loss": -5.8379082679748535, "global_step": 47598, "epoch": 1133} {"train_loss": -5.641795635223389, "global_step": 47599, "epoch": 1133} {"train_loss": -5.691856384277344, "global_step": 47600, "epoch": 1133} {"train_loss": -5.8258957862854, "global_step": 47601, "epoch": 1133} {"train_loss": -5.718805313110352, "global_step": 47602, "epoch": 1133} {"train_loss": -5.7743940353393555, "global_step": 47603, "epoch": 1133} {"train_loss": -5.696379661560059, "global_step": 47604, "epoch": 1133} {"train_loss": -5.740160942077637, "global_step": 47605, "epoch": 1133} {"train_loss": -5.733948230743408, "global_step": 47606, "epoch": 1133} {"train_loss": -5.894731521606445, "global_step": 47607, "epoch": 1133} {"train_loss": -5.769669532775879, "global_step": 47608, "epoch": 1133} {"train_loss": -5.667372703552246, "global_step": 47609, "epoch": 1133} {"train_loss": -5.722143173217773, "global_step": 47610, "epoch": 1133} {"train_loss": -5.759247779846191, "global_step": 47611, "epoch": 1133} {"train_loss": -5.744302749633789, "global_step": 47612, "epoch": 1133} {"train_loss": -5.963737487792969, "global_step": 47613, "epoch": 1133} {"train_loss": -5.73713493347168, "global_step": 47614, "epoch": 1133} {"train_loss": -5.889142036437988, "global_step": 47615, "epoch": 1133} {"train_loss": -5.8170366287231445, "global_step": 47616, "epoch": 1133} {"train_loss": -5.654880523681641, "global_step": 47617, "epoch": 1133} {"train_loss": -5.774367809295654, "global_step": 47618, "epoch": 1133} {"train_loss": -5.697619438171387, "global_step": 47619, "epoch": 1133} {"train_loss": -5.737566947937012, "global_step": 47620, "epoch": 1133} {"train_loss": -5.8272809982299805, "global_step": 47621, "epoch": 1133} {"train_loss": -5.7769012451171875, "global_step": 47622, "epoch": 1133} {"train_loss": -5.77314567565918, "global_step": 47623, "epoch": 1133} {"train_loss": -5.743163108825684, "global_step": 47624, "epoch": 1133} {"train_loss": -5.638225555419922, "global_step": 47625, "epoch": 1133} {"train_loss": -5.846826076507568, "global_step": 47626, "epoch": 1133} {"train_loss": -5.755427371887934, "global_step": 47627, "epoch": 1133, "val_loss": 61343.3671875} {"train_loss": -5.71461296081543, "global_step": 47628, "epoch": 1134} {"train_loss": -5.633235931396484, "global_step": 47629, "epoch": 1134} {"train_loss": -5.9169535636901855, "global_step": 47630, "epoch": 1134} {"train_loss": -5.839849948883057, "global_step": 47631, "epoch": 1134} {"train_loss": -5.762088298797607, "global_step": 47632, "epoch": 1134} {"train_loss": -5.71382474899292, "global_step": 47633, "epoch": 1134} {"train_loss": -5.754632949829102, "global_step": 47634, "epoch": 1134} {"train_loss": -5.827326774597168, "global_step": 47635, "epoch": 1134} {"train_loss": -5.627309799194336, "global_step": 47636, "epoch": 1134} {"train_loss": -5.728423118591309, "global_step": 47637, "epoch": 1134} {"train_loss": -5.781165599822998, "global_step": 47638, "epoch": 1134} {"train_loss": -5.71336555480957, "global_step": 47639, "epoch": 1134} {"train_loss": -5.769074440002441, "global_step": 47640, "epoch": 1134} {"train_loss": -5.771814823150635, "global_step": 47641, "epoch": 1134} {"train_loss": -5.7408857345581055, "global_step": 47642, "epoch": 1134} {"train_loss": -5.717851638793945, "global_step": 47643, "epoch": 1134} {"train_loss": -5.799561977386475, "global_step": 47644, "epoch": 1134} {"train_loss": -5.662096977233887, "global_step": 47645, "epoch": 1134} {"train_loss": -5.774194717407227, "global_step": 47646, "epoch": 1134} {"train_loss": -5.722372055053711, "global_step": 47647, "epoch": 1134} {"train_loss": -5.695807456970215, "global_step": 47648, "epoch": 1134} {"train_loss": -5.757514953613281, "global_step": 47649, "epoch": 1134} {"train_loss": -5.7177324295043945, "global_step": 47650, "epoch": 1134} {"train_loss": -5.723184108734131, "global_step": 47651, "epoch": 1134} {"train_loss": -5.771624565124512, "global_step": 47652, "epoch": 1134} {"train_loss": -5.574471473693848, "global_step": 47653, "epoch": 1134} {"train_loss": -5.687170505523682, "global_step": 47654, "epoch": 1134} {"train_loss": -5.737881660461426, "global_step": 47655, "epoch": 1134} {"train_loss": -5.626957893371582, "global_step": 47656, "epoch": 1134} {"train_loss": -5.663936614990234, "global_step": 47657, "epoch": 1134} {"train_loss": -5.822035312652588, "global_step": 47658, "epoch": 1134} {"train_loss": -5.732481956481934, "global_step": 47659, "epoch": 1134} {"train_loss": -5.763490676879883, "global_step": 47660, "epoch": 1134} {"train_loss": -5.741969108581543, "global_step": 47661, "epoch": 1134} {"train_loss": -5.8319807052612305, "global_step": 47662, "epoch": 1134} {"train_loss": -5.632519721984863, "global_step": 47663, "epoch": 1134} {"train_loss": -5.625178337097168, "global_step": 47664, "epoch": 1134} {"train_loss": -5.63716983795166, "global_step": 47665, "epoch": 1134} {"train_loss": -5.766025543212891, "global_step": 47666, "epoch": 1134} {"train_loss": -5.668778896331787, "global_step": 47667, "epoch": 1134} {"train_loss": -5.821136951446533, "global_step": 47668, "epoch": 1134} {"train_loss": -5.732944409052531, "global_step": 47669, "epoch": 1134, "val_loss": 61519.609375} {"train_loss": -5.757562160491943, "global_step": 47670, "epoch": 1135} {"train_loss": -5.695010662078857, "global_step": 47671, "epoch": 1135} {"train_loss": -5.817960739135742, "global_step": 47672, "epoch": 1135} {"train_loss": -5.709109306335449, "global_step": 47673, "epoch": 1135} {"train_loss": -5.63009786605835, "global_step": 47674, "epoch": 1135} {"train_loss": -5.841048240661621, "global_step": 47675, "epoch": 1135} {"train_loss": -5.682136535644531, "global_step": 47676, "epoch": 1135} {"train_loss": -5.760929107666016, "global_step": 47677, "epoch": 1135} {"train_loss": -5.701110363006592, "global_step": 47678, "epoch": 1135} {"train_loss": -5.65848445892334, "global_step": 47679, "epoch": 1135} {"train_loss": -5.889612674713135, "global_step": 47680, "epoch": 1135} {"train_loss": -5.711341381072998, "global_step": 47681, "epoch": 1135} {"train_loss": -5.823524475097656, "global_step": 47682, "epoch": 1135} {"train_loss": -5.768552780151367, "global_step": 47683, "epoch": 1135} {"train_loss": -5.748285293579102, "global_step": 47684, "epoch": 1135} {"train_loss": -5.7380475997924805, "global_step": 47685, "epoch": 1135} {"train_loss": -5.749813556671143, "global_step": 47686, "epoch": 1135} {"train_loss": -5.896224021911621, "global_step": 47687, "epoch": 1135} {"train_loss": -5.732975006103516, "global_step": 47688, "epoch": 1135} {"train_loss": -5.6618971824646, "global_step": 47689, "epoch": 1135} {"train_loss": -5.66024112701416, "global_step": 47690, "epoch": 1135} {"train_loss": -5.733001232147217, "global_step": 47691, "epoch": 1135} {"train_loss": -5.721283912658691, "global_step": 47692, "epoch": 1135} {"train_loss": -5.5930328369140625, "global_step": 47693, "epoch": 1135} {"train_loss": -5.781245231628418, "global_step": 47694, "epoch": 1135} {"train_loss": -5.78782844543457, "global_step": 47695, "epoch": 1135} {"train_loss": -5.758834362030029, "global_step": 47696, "epoch": 1135} {"train_loss": -5.649557113647461, "global_step": 47697, "epoch": 1135} {"train_loss": -5.714529991149902, "global_step": 47698, "epoch": 1135} {"train_loss": -5.701815605163574, "global_step": 47699, "epoch": 1135} {"train_loss": -5.756470680236816, "global_step": 47700, "epoch": 1135} {"train_loss": -5.7025465965271, "global_step": 47701, "epoch": 1135} {"train_loss": -5.879573822021484, "global_step": 47702, "epoch": 1135} {"train_loss": -5.7336320877075195, "global_step": 47703, "epoch": 1135} {"train_loss": -5.673220634460449, "global_step": 47704, "epoch": 1135} {"train_loss": -5.716233730316162, "global_step": 47705, "epoch": 1135} {"train_loss": -5.716969966888428, "global_step": 47706, "epoch": 1135} {"train_loss": -5.7937517166137695, "global_step": 47707, "epoch": 1135} {"train_loss": -5.708186626434326, "global_step": 47708, "epoch": 1135} {"train_loss": -5.7839765548706055, "global_step": 47709, "epoch": 1135} {"train_loss": -5.738267421722412, "global_step": 47710, "epoch": 1135} {"train_loss": -5.741059371403286, "global_step": 47711, "epoch": 1135, "val_loss": 61626.74609375} {"train_loss": -5.736391067504883, "global_step": 47712, "epoch": 1136} {"train_loss": -5.615074157714844, "global_step": 47713, "epoch": 1136} {"train_loss": -5.7407965660095215, "global_step": 47714, "epoch": 1136} {"train_loss": -5.800214767456055, "global_step": 47715, "epoch": 1136} {"train_loss": -5.7808732986450195, "global_step": 47716, "epoch": 1136} {"train_loss": -5.794555187225342, "global_step": 47717, "epoch": 1136} {"train_loss": -5.835446357727051, "global_step": 47718, "epoch": 1136} {"train_loss": -5.627765655517578, "global_step": 47719, "epoch": 1136} {"train_loss": -5.699053764343262, "global_step": 47720, "epoch": 1136} {"train_loss": -5.860949516296387, "global_step": 47721, "epoch": 1136} {"train_loss": -5.755128383636475, "global_step": 47722, "epoch": 1136} {"train_loss": -5.756840705871582, "global_step": 47723, "epoch": 1136} {"train_loss": -5.776565074920654, "global_step": 47724, "epoch": 1136} {"train_loss": -5.6549859046936035, "global_step": 47725, "epoch": 1136} {"train_loss": -5.753242015838623, "global_step": 47726, "epoch": 1136} {"train_loss": -5.708215713500977, "global_step": 47727, "epoch": 1136} {"train_loss": -5.780221462249756, "global_step": 47728, "epoch": 1136} {"train_loss": -5.856871128082275, "global_step": 47729, "epoch": 1136} {"train_loss": -5.761299133300781, "global_step": 47730, "epoch": 1136} {"train_loss": -5.674124240875244, "global_step": 47731, "epoch": 1136} {"train_loss": -5.735299110412598, "global_step": 47732, "epoch": 1136} {"train_loss": -5.863518714904785, "global_step": 47733, "epoch": 1136} {"train_loss": -5.734279632568359, "global_step": 47734, "epoch": 1136} {"train_loss": -5.799704551696777, "global_step": 47735, "epoch": 1136} {"train_loss": -5.724465847015381, "global_step": 47736, "epoch": 1136} {"train_loss": -5.704268455505371, "global_step": 47737, "epoch": 1136} {"train_loss": -5.603743076324463, "global_step": 47738, "epoch": 1136} {"train_loss": -5.859387397766113, "global_step": 47739, "epoch": 1136} {"train_loss": -5.69007682800293, "global_step": 47740, "epoch": 1136} {"train_loss": -5.734488487243652, "global_step": 47741, "epoch": 1136} {"train_loss": -5.7837934494018555, "global_step": 47742, "epoch": 1136} {"train_loss": -5.619532585144043, "global_step": 47743, "epoch": 1136} {"train_loss": -5.7372283935546875, "global_step": 47744, "epoch": 1136} {"train_loss": -5.694307327270508, "global_step": 47745, "epoch": 1136} {"train_loss": -5.734322547912598, "global_step": 47746, "epoch": 1136} {"train_loss": -5.7251081466674805, "global_step": 47747, "epoch": 1136} {"train_loss": -5.855928421020508, "global_step": 47748, "epoch": 1136} {"train_loss": -5.788359642028809, "global_step": 47749, "epoch": 1136} {"train_loss": -5.732313632965088, "global_step": 47750, "epoch": 1136} {"train_loss": -5.790959358215332, "global_step": 47751, "epoch": 1136} {"train_loss": -5.746707439422607, "global_step": 47752, "epoch": 1136} {"train_loss": -5.746914239156814, "global_step": 47753, "epoch": 1136, "val_loss": 61554.48046875} {"train_loss": -5.776824951171875, "global_step": 47754, "epoch": 1137} {"train_loss": -5.855747222900391, "global_step": 47755, "epoch": 1137} {"train_loss": -5.708642959594727, "global_step": 47756, "epoch": 1137} {"train_loss": -5.7764177322387695, "global_step": 47757, "epoch": 1137} {"train_loss": -5.792057037353516, "global_step": 47758, "epoch": 1137} {"train_loss": -5.688029766082764, "global_step": 47759, "epoch": 1137} {"train_loss": -5.708582878112793, "global_step": 47760, "epoch": 1137} {"train_loss": -5.8289794921875, "global_step": 47761, "epoch": 1137} {"train_loss": -5.905996322631836, "global_step": 47762, "epoch": 1137} {"train_loss": -5.797046184539795, "global_step": 47763, "epoch": 1137} {"train_loss": -5.696895599365234, "global_step": 47764, "epoch": 1137} {"train_loss": -5.7745161056518555, "global_step": 47765, "epoch": 1137} {"train_loss": -5.823144435882568, "global_step": 47766, "epoch": 1137} {"train_loss": -5.773828983306885, "global_step": 47767, "epoch": 1137} {"train_loss": -5.6912713050842285, "global_step": 47768, "epoch": 1137} {"train_loss": -5.774754047393799, "global_step": 47769, "epoch": 1137} {"train_loss": -5.819157600402832, "global_step": 47770, "epoch": 1137} {"train_loss": -5.749397277832031, "global_step": 47771, "epoch": 1137} {"train_loss": -5.714728355407715, "global_step": 47772, "epoch": 1137} {"train_loss": -5.73686408996582, "global_step": 47773, "epoch": 1137} {"train_loss": -5.8209662437438965, "global_step": 47774, "epoch": 1137} {"train_loss": -5.752630233764648, "global_step": 47775, "epoch": 1137} {"train_loss": -5.660308837890625, "global_step": 47776, "epoch": 1137} {"train_loss": -5.753488540649414, "global_step": 47777, "epoch": 1137} {"train_loss": -5.752413749694824, "global_step": 47778, "epoch": 1137} {"train_loss": -5.857071876525879, "global_step": 47779, "epoch": 1137} {"train_loss": -5.743957996368408, "global_step": 47780, "epoch": 1137} {"train_loss": -5.734292507171631, "global_step": 47781, "epoch": 1137} {"train_loss": -5.794424057006836, "global_step": 47782, "epoch": 1137} {"train_loss": -5.658633708953857, "global_step": 47783, "epoch": 1137} {"train_loss": -5.808609962463379, "global_step": 47784, "epoch": 1137} {"train_loss": -5.850852012634277, "global_step": 47785, "epoch": 1137} {"train_loss": -5.783064365386963, "global_step": 47786, "epoch": 1137} {"train_loss": -5.776588439941406, "global_step": 47787, "epoch": 1137} {"train_loss": -5.743854999542236, "global_step": 47788, "epoch": 1137} {"train_loss": -5.695267200469971, "global_step": 47789, "epoch": 1137} {"train_loss": -5.7713141441345215, "global_step": 47790, "epoch": 1137} {"train_loss": -5.906128406524658, "global_step": 47791, "epoch": 1137} {"train_loss": -5.910089492797852, "global_step": 47792, "epoch": 1137} {"train_loss": -5.677303791046143, "global_step": 47793, "epoch": 1137} {"train_loss": -5.7948713302612305, "global_step": 47794, "epoch": 1137} {"train_loss": -5.770264080592564, "global_step": 47795, "epoch": 1137, "val_loss": 61449.1328125} {"train_loss": -5.78242301940918, "global_step": 47796, "epoch": 1138} {"train_loss": -5.7223052978515625, "global_step": 47797, "epoch": 1138} {"train_loss": -5.742387771606445, "global_step": 47798, "epoch": 1138} {"train_loss": -5.773977279663086, "global_step": 47799, "epoch": 1138} {"train_loss": -5.844874858856201, "global_step": 47800, "epoch": 1138} {"train_loss": -5.799870491027832, "global_step": 47801, "epoch": 1138} {"train_loss": -5.778324127197266, "global_step": 47802, "epoch": 1138} {"train_loss": -5.776641368865967, "global_step": 47803, "epoch": 1138} {"train_loss": -5.733649730682373, "global_step": 47804, "epoch": 1138} {"train_loss": -5.682449817657471, "global_step": 47805, "epoch": 1138} {"train_loss": -5.759570598602295, "global_step": 47806, "epoch": 1138} {"train_loss": -5.882785320281982, "global_step": 47807, "epoch": 1138} {"train_loss": -5.747178077697754, "global_step": 47808, "epoch": 1138} {"train_loss": -5.867439270019531, "global_step": 47809, "epoch": 1138} {"train_loss": -5.687788009643555, "global_step": 47810, "epoch": 1138} {"train_loss": -5.695002555847168, "global_step": 47811, "epoch": 1138} {"train_loss": -5.771356582641602, "global_step": 47812, "epoch": 1138} {"train_loss": -5.78763484954834, "global_step": 47813, "epoch": 1138} {"train_loss": -5.6908159255981445, "global_step": 47814, "epoch": 1138} {"train_loss": -5.685677528381348, "global_step": 47815, "epoch": 1138} {"train_loss": -5.774784564971924, "global_step": 47816, "epoch": 1138} {"train_loss": -5.7609100341796875, "global_step": 47817, "epoch": 1138} {"train_loss": -5.771607398986816, "global_step": 47818, "epoch": 1138} {"train_loss": -5.668855667114258, "global_step": 47819, "epoch": 1138} {"train_loss": -5.6197285652160645, "global_step": 47820, "epoch": 1138} {"train_loss": -5.7687788009643555, "global_step": 47821, "epoch": 1138} {"train_loss": -5.68775749206543, "global_step": 47822, "epoch": 1138} {"train_loss": -5.718363285064697, "global_step": 47823, "epoch": 1138} {"train_loss": -5.705129146575928, "global_step": 47824, "epoch": 1138} {"train_loss": -5.699606895446777, "global_step": 47825, "epoch": 1138} {"train_loss": -5.691711902618408, "global_step": 47826, "epoch": 1138} {"train_loss": -5.622220039367676, "global_step": 47827, "epoch": 1138} {"train_loss": -5.874814033508301, "global_step": 47828, "epoch": 1138} {"train_loss": -5.56885290145874, "global_step": 47829, "epoch": 1138} {"train_loss": -5.693451881408691, "global_step": 47830, "epoch": 1138} {"train_loss": -5.7395806312561035, "global_step": 47831, "epoch": 1138} {"train_loss": -5.740031719207764, "global_step": 47832, "epoch": 1138} {"train_loss": -5.615069389343262, "global_step": 47833, "epoch": 1138} {"train_loss": -5.703729629516602, "global_step": 47834, "epoch": 1138} {"train_loss": -5.771877765655518, "global_step": 47835, "epoch": 1138} {"train_loss": -5.745788097381592, "global_step": 47836, "epoch": 1138} {"train_loss": -5.733730883825393, "global_step": 47837, "epoch": 1138, "val_loss": 61199.11328125} {"train_loss": -5.719346046447754, "global_step": 47838, "epoch": 1139} {"train_loss": -5.678393363952637, "global_step": 47839, "epoch": 1139} {"train_loss": -5.869151592254639, "global_step": 47840, "epoch": 1139} {"train_loss": -5.781964302062988, "global_step": 47841, "epoch": 1139} {"train_loss": -5.6897873878479, "global_step": 47842, "epoch": 1139} {"train_loss": -5.753023147583008, "global_step": 47843, "epoch": 1139} {"train_loss": -5.848925590515137, "global_step": 47844, "epoch": 1139} {"train_loss": -5.8587493896484375, "global_step": 47845, "epoch": 1139} {"train_loss": -5.75458288192749, "global_step": 47846, "epoch": 1139} {"train_loss": -5.685112953186035, "global_step": 47847, "epoch": 1139} {"train_loss": -5.695621490478516, "global_step": 47848, "epoch": 1139} {"train_loss": -5.760643005371094, "global_step": 47849, "epoch": 1139} {"train_loss": -5.762326717376709, "global_step": 47850, "epoch": 1139} {"train_loss": -5.577718257904053, "global_step": 47851, "epoch": 1139} {"train_loss": -5.662294387817383, "global_step": 47852, "epoch": 1139} {"train_loss": -5.708606719970703, "global_step": 47853, "epoch": 1139} {"train_loss": -5.805461883544922, "global_step": 47854, "epoch": 1139} {"train_loss": -5.834105014801025, "global_step": 47855, "epoch": 1139} {"train_loss": -5.760627746582031, "global_step": 47856, "epoch": 1139} {"train_loss": -5.797274112701416, "global_step": 47857, "epoch": 1139} {"train_loss": -5.820077896118164, "global_step": 47858, "epoch": 1139} {"train_loss": -5.692235946655273, "global_step": 47859, "epoch": 1139} {"train_loss": -5.814040660858154, "global_step": 47860, "epoch": 1139} {"train_loss": -5.847475051879883, "global_step": 47861, "epoch": 1139} {"train_loss": -5.766571521759033, "global_step": 47862, "epoch": 1139} {"train_loss": -5.783836364746094, "global_step": 47863, "epoch": 1139} {"train_loss": -5.790744781494141, "global_step": 47864, "epoch": 1139} {"train_loss": -5.735435485839844, "global_step": 47865, "epoch": 1139} {"train_loss": -5.724225044250488, "global_step": 47866, "epoch": 1139} {"train_loss": -5.711300849914551, "global_step": 47867, "epoch": 1139} {"train_loss": -5.780021667480469, "global_step": 47868, "epoch": 1139} {"train_loss": -5.756568908691406, "global_step": 47869, "epoch": 1139} {"train_loss": -5.651062965393066, "global_step": 47870, "epoch": 1139} {"train_loss": -5.600468635559082, "global_step": 47871, "epoch": 1139} {"train_loss": -5.757266044616699, "global_step": 47872, "epoch": 1139} {"train_loss": -5.734476089477539, "global_step": 47873, "epoch": 1139} {"train_loss": -5.775591850280762, "global_step": 47874, "epoch": 1139} {"train_loss": -5.912075042724609, "global_step": 47875, "epoch": 1139} {"train_loss": -5.842240333557129, "global_step": 47876, "epoch": 1139} {"train_loss": -5.721949577331543, "global_step": 47877, "epoch": 1139} {"train_loss": -5.792738437652588, "global_step": 47878, "epoch": 1139} {"train_loss": -5.75970737139384, "global_step": 47879, "epoch": 1139, "val_loss": 61772.046875} {"train_loss": -5.781652450561523, "global_step": 47880, "epoch": 1140} {"train_loss": -5.640061378479004, "global_step": 47881, "epoch": 1140} {"train_loss": -5.672771453857422, "global_step": 47882, "epoch": 1140} {"train_loss": -5.848621845245361, "global_step": 47883, "epoch": 1140} {"train_loss": -5.7590131759643555, "global_step": 47884, "epoch": 1140} {"train_loss": -5.6647491455078125, "global_step": 47885, "epoch": 1140} {"train_loss": -5.752036094665527, "global_step": 47886, "epoch": 1140} {"train_loss": -5.862638473510742, "global_step": 47887, "epoch": 1140} {"train_loss": -5.79097843170166, "global_step": 47888, "epoch": 1140} {"train_loss": -5.664191246032715, "global_step": 47889, "epoch": 1140} {"train_loss": -5.67935848236084, "global_step": 47890, "epoch": 1140} {"train_loss": -5.803609848022461, "global_step": 47891, "epoch": 1140} {"train_loss": -5.709839820861816, "global_step": 47892, "epoch": 1140} {"train_loss": -5.893856048583984, "global_step": 47893, "epoch": 1140} {"train_loss": -5.85336971282959, "global_step": 47894, "epoch": 1140} {"train_loss": -5.789491653442383, "global_step": 47895, "epoch": 1140} {"train_loss": -5.673121452331543, "global_step": 47896, "epoch": 1140} {"train_loss": -5.775857925415039, "global_step": 47897, "epoch": 1140} {"train_loss": -5.626269340515137, "global_step": 47898, "epoch": 1140} {"train_loss": -5.74251651763916, "global_step": 47899, "epoch": 1140} {"train_loss": -5.667236804962158, "global_step": 47900, "epoch": 1140} {"train_loss": -5.749397277832031, "global_step": 47901, "epoch": 1140} {"train_loss": -5.907894134521484, "global_step": 47902, "epoch": 1140} {"train_loss": -5.733799934387207, "global_step": 47903, "epoch": 1140} {"train_loss": -5.76092529296875, "global_step": 47904, "epoch": 1140} {"train_loss": -5.646270751953125, "global_step": 47905, "epoch": 1140} {"train_loss": -5.777060508728027, "global_step": 47906, "epoch": 1140} {"train_loss": -5.73094367980957, "global_step": 47907, "epoch": 1140} {"train_loss": -5.721919536590576, "global_step": 47908, "epoch": 1140} {"train_loss": -5.7378339767456055, "global_step": 47909, "epoch": 1140} {"train_loss": -5.664716720581055, "global_step": 47910, "epoch": 1140} {"train_loss": -5.692584991455078, "global_step": 47911, "epoch": 1140} {"train_loss": -5.716402053833008, "global_step": 47912, "epoch": 1140} {"train_loss": -5.670294284820557, "global_step": 47913, "epoch": 1140} {"train_loss": -5.708115100860596, "global_step": 47914, "epoch": 1140} {"train_loss": -5.7447357177734375, "global_step": 47915, "epoch": 1140} {"train_loss": -5.747862815856934, "global_step": 47916, "epoch": 1140} {"train_loss": -5.604375839233398, "global_step": 47917, "epoch": 1140} {"train_loss": -5.800838470458984, "global_step": 47918, "epoch": 1140} {"train_loss": -5.625344276428223, "global_step": 47919, "epoch": 1140} {"train_loss": -5.815953254699707, "global_step": 47920, "epoch": 1140} {"train_loss": -5.734674714860462, "global_step": 47921, "epoch": 1140, "val_loss": 61957.23046875} {"train_loss": -5.587029457092285, "global_step": 47922, "epoch": 1141} {"train_loss": -5.698520183563232, "global_step": 47923, "epoch": 1141} {"train_loss": -5.738971710205078, "global_step": 47924, "epoch": 1141} {"train_loss": -5.707320213317871, "global_step": 47925, "epoch": 1141} {"train_loss": -5.585973739624023, "global_step": 47926, "epoch": 1141} {"train_loss": -5.639479637145996, "global_step": 47927, "epoch": 1141} {"train_loss": -5.704531669616699, "global_step": 47928, "epoch": 1141} {"train_loss": -5.623430252075195, "global_step": 47929, "epoch": 1141} {"train_loss": -5.7155375480651855, "global_step": 47930, "epoch": 1141} {"train_loss": -5.867914199829102, "global_step": 47931, "epoch": 1141} {"train_loss": -5.857839584350586, "global_step": 47932, "epoch": 1141} {"train_loss": -5.619489669799805, "global_step": 47933, "epoch": 1141} {"train_loss": -5.750001430511475, "global_step": 47934, "epoch": 1141} {"train_loss": -5.8188347816467285, "global_step": 47935, "epoch": 1141} {"train_loss": -5.830778121948242, "global_step": 47936, "epoch": 1141} {"train_loss": -5.618353366851807, "global_step": 47937, "epoch": 1141} {"train_loss": -5.580134868621826, "global_step": 47938, "epoch": 1141} {"train_loss": -5.669484615325928, "global_step": 47939, "epoch": 1141} {"train_loss": -5.938990116119385, "global_step": 47940, "epoch": 1141} {"train_loss": -5.844562530517578, "global_step": 47941, "epoch": 1141} {"train_loss": -5.684049129486084, "global_step": 47942, "epoch": 1141} {"train_loss": -5.754909515380859, "global_step": 47943, "epoch": 1141} {"train_loss": -5.758908271789551, "global_step": 47944, "epoch": 1141} {"train_loss": -5.65146017074585, "global_step": 47945, "epoch": 1141} {"train_loss": -5.751614093780518, "global_step": 47946, "epoch": 1141} {"train_loss": -5.898558616638184, "global_step": 47947, "epoch": 1141} {"train_loss": -5.818822383880615, "global_step": 47948, "epoch": 1141} {"train_loss": -5.759477138519287, "global_step": 47949, "epoch": 1141} {"train_loss": -5.737461566925049, "global_step": 47950, "epoch": 1141} {"train_loss": -5.698084831237793, "global_step": 47951, "epoch": 1141} {"train_loss": -5.631841659545898, "global_step": 47952, "epoch": 1141} {"train_loss": -5.749443531036377, "global_step": 47953, "epoch": 1141} {"train_loss": -5.72320032119751, "global_step": 47954, "epoch": 1141} {"train_loss": -5.741466045379639, "global_step": 47955, "epoch": 1141} {"train_loss": -5.786637306213379, "global_step": 47956, "epoch": 1141} {"train_loss": -5.803078651428223, "global_step": 47957, "epoch": 1141} {"train_loss": -5.684221267700195, "global_step": 47958, "epoch": 1141} {"train_loss": -5.821944713592529, "global_step": 47959, "epoch": 1141} {"train_loss": -5.831894874572754, "global_step": 47960, "epoch": 1141} {"train_loss": -5.837837219238281, "global_step": 47961, "epoch": 1141} {"train_loss": -5.696434020996094, "global_step": 47962, "epoch": 1141} {"train_loss": -5.739045983269101, "global_step": 47963, "epoch": 1141, "val_loss": 61444.17578125} {"train_loss": -5.747969627380371, "global_step": 47964, "epoch": 1142} {"train_loss": -5.768257141113281, "global_step": 47965, "epoch": 1142} {"train_loss": -5.723302841186523, "global_step": 47966, "epoch": 1142} {"train_loss": -5.796242713928223, "global_step": 47967, "epoch": 1142} {"train_loss": -5.841180801391602, "global_step": 47968, "epoch": 1142} {"train_loss": -5.769448757171631, "global_step": 47969, "epoch": 1142} {"train_loss": -5.790164470672607, "global_step": 47970, "epoch": 1142} {"train_loss": -5.699225425720215, "global_step": 47971, "epoch": 1142} {"train_loss": -5.737024784088135, "global_step": 47972, "epoch": 1142} {"train_loss": -5.598807334899902, "global_step": 47973, "epoch": 1142} {"train_loss": -5.798772811889648, "global_step": 47974, "epoch": 1142} {"train_loss": -5.758728504180908, "global_step": 47975, "epoch": 1142} {"train_loss": -5.740503311157227, "global_step": 47976, "epoch": 1142} {"train_loss": -5.732287883758545, "global_step": 47977, "epoch": 1142} {"train_loss": -5.683366775512695, "global_step": 47978, "epoch": 1142} {"train_loss": -5.80638313293457, "global_step": 47979, "epoch": 1142} {"train_loss": -5.848837375640869, "global_step": 47980, "epoch": 1142} {"train_loss": -5.722454071044922, "global_step": 47981, "epoch": 1142} {"train_loss": -5.782525062561035, "global_step": 47982, "epoch": 1142} {"train_loss": -5.73397159576416, "global_step": 47983, "epoch": 1142} {"train_loss": -5.652017593383789, "global_step": 47984, "epoch": 1142} {"train_loss": -5.685060977935791, "global_step": 47985, "epoch": 1142} {"train_loss": -5.702877044677734, "global_step": 47986, "epoch": 1142} {"train_loss": -5.7708353996276855, "global_step": 47987, "epoch": 1142} {"train_loss": -5.793487548828125, "global_step": 47988, "epoch": 1142} {"train_loss": -5.746157169342041, "global_step": 47989, "epoch": 1142} {"train_loss": -5.700465202331543, "global_step": 47990, "epoch": 1142} {"train_loss": -5.810094356536865, "global_step": 47991, "epoch": 1142} {"train_loss": -5.888876438140869, "global_step": 47992, "epoch": 1142} {"train_loss": -5.7866597175598145, "global_step": 47993, "epoch": 1142} {"train_loss": -5.742488861083984, "global_step": 47994, "epoch": 1142} {"train_loss": -5.7112650871276855, "global_step": 47995, "epoch": 1142} {"train_loss": -5.717878818511963, "global_step": 47996, "epoch": 1142} {"train_loss": -5.812079429626465, "global_step": 47997, "epoch": 1142} {"train_loss": -5.714606761932373, "global_step": 47998, "epoch": 1142} {"train_loss": -5.75804328918457, "global_step": 47999, "epoch": 1142} {"train_loss": -5.781102180480957, "global_step": 48000, "epoch": 1142} {"train_loss": -5.813449859619141, "global_step": 48001, "epoch": 1142} {"train_loss": -5.796895980834961, "global_step": 48002, "epoch": 1142} {"train_loss": -5.732249736785889, "global_step": 48003, "epoch": 1142} {"train_loss": -5.803997993469238, "global_step": 48004, "epoch": 1142} {"train_loss": -5.755983454840524, "global_step": 48005, "epoch": 1142, "val_loss": 61901.64453125} {"train_loss": -5.704432487487793, "global_step": 48006, "epoch": 1143} {"train_loss": -5.603925704956055, "global_step": 48007, "epoch": 1143} {"train_loss": -5.858212947845459, "global_step": 48008, "epoch": 1143} {"train_loss": -5.697123050689697, "global_step": 48009, "epoch": 1143} {"train_loss": -5.727956771850586, "global_step": 48010, "epoch": 1143} {"train_loss": -5.760744571685791, "global_step": 48011, "epoch": 1143} {"train_loss": -5.592246055603027, "global_step": 48012, "epoch": 1143} {"train_loss": -5.780706405639648, "global_step": 48013, "epoch": 1143} {"train_loss": -5.843563079833984, "global_step": 48014, "epoch": 1143} {"train_loss": -5.734672546386719, "global_step": 48015, "epoch": 1143} {"train_loss": -5.678619384765625, "global_step": 48016, "epoch": 1143} {"train_loss": -5.761415004730225, "global_step": 48017, "epoch": 1143} {"train_loss": -5.643182754516602, "global_step": 48018, "epoch": 1143} {"train_loss": -5.793751239776611, "global_step": 48019, "epoch": 1143} {"train_loss": -5.610989570617676, "global_step": 48020, "epoch": 1143} {"train_loss": -5.557322025299072, "global_step": 48021, "epoch": 1143} {"train_loss": -5.658847808837891, "global_step": 48022, "epoch": 1143} {"train_loss": -5.688608646392822, "global_step": 48023, "epoch": 1143} {"train_loss": -5.807007789611816, "global_step": 48024, "epoch": 1143} {"train_loss": -5.775784492492676, "global_step": 48025, "epoch": 1143} {"train_loss": -5.784496307373047, "global_step": 48026, "epoch": 1143} {"train_loss": -5.690818786621094, "global_step": 48027, "epoch": 1143} {"train_loss": -5.847130298614502, "global_step": 48028, "epoch": 1143} {"train_loss": -5.681730270385742, "global_step": 48029, "epoch": 1143} {"train_loss": -5.838995933532715, "global_step": 48030, "epoch": 1143} {"train_loss": -5.794885635375977, "global_step": 48031, "epoch": 1143} {"train_loss": -5.696047782897949, "global_step": 48032, "epoch": 1143} {"train_loss": -5.759123802185059, "global_step": 48033, "epoch": 1143} {"train_loss": -5.713414192199707, "global_step": 48034, "epoch": 1143} {"train_loss": -5.686406135559082, "global_step": 48035, "epoch": 1143} {"train_loss": -5.683587074279785, "global_step": 48036, "epoch": 1143} {"train_loss": -5.807450294494629, "global_step": 48037, "epoch": 1143} {"train_loss": -5.75589656829834, "global_step": 48038, "epoch": 1143} {"train_loss": -5.744117259979248, "global_step": 48039, "epoch": 1143} {"train_loss": -5.6537885665893555, "global_step": 48040, "epoch": 1143} {"train_loss": -5.883185863494873, "global_step": 48041, "epoch": 1143} {"train_loss": -5.87620210647583, "global_step": 48042, "epoch": 1143} {"train_loss": -5.818662166595459, "global_step": 48043, "epoch": 1143} {"train_loss": -5.820217132568359, "global_step": 48044, "epoch": 1143} {"train_loss": -5.673174858093262, "global_step": 48045, "epoch": 1143} {"train_loss": -5.713698387145996, "global_step": 48046, "epoch": 1143} {"train_loss": -5.73419021424793, "global_step": 48047, "epoch": 1143, "val_loss": 61433.06640625} {"train_loss": -5.7890191078186035, "global_step": 48048, "epoch": 1144} {"train_loss": -5.712375164031982, "global_step": 48049, "epoch": 1144} {"train_loss": -5.828351020812988, "global_step": 48050, "epoch": 1144} {"train_loss": -5.7103166580200195, "global_step": 48051, "epoch": 1144} {"train_loss": -5.7252655029296875, "global_step": 48052, "epoch": 1144} {"train_loss": -5.823866367340088, "global_step": 48053, "epoch": 1144} {"train_loss": -5.773499488830566, "global_step": 48054, "epoch": 1144} {"train_loss": -5.726278305053711, "global_step": 48055, "epoch": 1144} {"train_loss": -5.8023881912231445, "global_step": 48056, "epoch": 1144} {"train_loss": -5.7876482009887695, "global_step": 48057, "epoch": 1144} {"train_loss": -5.765855312347412, "global_step": 48058, "epoch": 1144} {"train_loss": -5.795013427734375, "global_step": 48059, "epoch": 1144} {"train_loss": -5.844881534576416, "global_step": 48060, "epoch": 1144} {"train_loss": -5.71279764175415, "global_step": 48061, "epoch": 1144} {"train_loss": -5.750710964202881, "global_step": 48062, "epoch": 1144} {"train_loss": -5.783746242523193, "global_step": 48063, "epoch": 1144} {"train_loss": -5.701042652130127, "global_step": 48064, "epoch": 1144} {"train_loss": -5.680692672729492, "global_step": 48065, "epoch": 1144} {"train_loss": -5.722248077392578, "global_step": 48066, "epoch": 1144} {"train_loss": -5.64013671875, "global_step": 48067, "epoch": 1144} {"train_loss": -5.767365455627441, "global_step": 48068, "epoch": 1144} {"train_loss": -5.718027591705322, "global_step": 48069, "epoch": 1144} {"train_loss": -5.785003662109375, "global_step": 48070, "epoch": 1144} {"train_loss": -5.7803850173950195, "global_step": 48071, "epoch": 1144} {"train_loss": -5.648325443267822, "global_step": 48072, "epoch": 1144} {"train_loss": -5.894489765167236, "global_step": 48073, "epoch": 1144} {"train_loss": -5.689708709716797, "global_step": 48074, "epoch": 1144} {"train_loss": -5.576752662658691, "global_step": 48075, "epoch": 1144} {"train_loss": -5.849194526672363, "global_step": 48076, "epoch": 1144} {"train_loss": -5.674408912658691, "global_step": 48077, "epoch": 1144} {"train_loss": -5.708390235900879, "global_step": 48078, "epoch": 1144} {"train_loss": -5.685161590576172, "global_step": 48079, "epoch": 1144} {"train_loss": -5.723268985748291, "global_step": 48080, "epoch": 1144} {"train_loss": -5.7620344161987305, "global_step": 48081, "epoch": 1144} {"train_loss": -5.759349822998047, "global_step": 48082, "epoch": 1144} {"train_loss": -5.800449371337891, "global_step": 48083, "epoch": 1144} {"train_loss": -5.723642349243164, "global_step": 48084, "epoch": 1144} {"train_loss": -5.783625602722168, "global_step": 48085, "epoch": 1144} {"train_loss": -5.645635604858398, "global_step": 48086, "epoch": 1144} {"train_loss": -5.653292655944824, "global_step": 48087, "epoch": 1144} {"train_loss": -5.776396751403809, "global_step": 48088, "epoch": 1144} {"train_loss": -5.747120914005098, "global_step": 48089, "epoch": 1144, "val_loss": 61849.4609375} {"train_loss": -5.636083602905273, "global_step": 48090, "epoch": 1145} {"train_loss": -5.716254234313965, "global_step": 48091, "epoch": 1145} {"train_loss": -5.808198928833008, "global_step": 48092, "epoch": 1145} {"train_loss": -5.601343154907227, "global_step": 48093, "epoch": 1145} {"train_loss": -5.841856956481934, "global_step": 48094, "epoch": 1145} {"train_loss": -5.609365463256836, "global_step": 48095, "epoch": 1145} {"train_loss": -5.711921691894531, "global_step": 48096, "epoch": 1145} {"train_loss": -5.815269947052002, "global_step": 48097, "epoch": 1145} {"train_loss": -5.671051025390625, "global_step": 48098, "epoch": 1145} {"train_loss": -5.638520240783691, "global_step": 48099, "epoch": 1145} {"train_loss": -5.698040962219238, "global_step": 48100, "epoch": 1145} {"train_loss": -5.733999252319336, "global_step": 48101, "epoch": 1145} {"train_loss": -5.608909606933594, "global_step": 48102, "epoch": 1145} {"train_loss": -5.754607677459717, "global_step": 48103, "epoch": 1145} {"train_loss": -5.702794075012207, "global_step": 48104, "epoch": 1145} {"train_loss": -5.690938949584961, "global_step": 48105, "epoch": 1145} {"train_loss": -5.736754894256592, "global_step": 48106, "epoch": 1145} {"train_loss": -5.623864650726318, "global_step": 48107, "epoch": 1145} {"train_loss": -5.692018508911133, "global_step": 48108, "epoch": 1145} {"train_loss": -5.714430332183838, "global_step": 48109, "epoch": 1145} {"train_loss": -5.675385475158691, "global_step": 48110, "epoch": 1145} {"train_loss": -5.609165191650391, "global_step": 48111, "epoch": 1145} {"train_loss": -5.7181806564331055, "global_step": 48112, "epoch": 1145} {"train_loss": -5.729357719421387, "global_step": 48113, "epoch": 1145} {"train_loss": -5.801845073699951, "global_step": 48114, "epoch": 1145} {"train_loss": -5.658683776855469, "global_step": 48115, "epoch": 1145} {"train_loss": -5.7565155029296875, "global_step": 48116, "epoch": 1145} {"train_loss": -5.739509582519531, "global_step": 48117, "epoch": 1145} {"train_loss": -5.696228981018066, "global_step": 48118, "epoch": 1145} {"train_loss": -5.742202281951904, "global_step": 48119, "epoch": 1145} {"train_loss": -5.846309661865234, "global_step": 48120, "epoch": 1145} {"train_loss": -5.702847480773926, "global_step": 48121, "epoch": 1145} {"train_loss": -5.690142631530762, "global_step": 48122, "epoch": 1145} {"train_loss": -5.75914192199707, "global_step": 48123, "epoch": 1145} {"train_loss": -5.743173599243164, "global_step": 48124, "epoch": 1145} {"train_loss": -5.869474411010742, "global_step": 48125, "epoch": 1145} {"train_loss": -5.858487129211426, "global_step": 48126, "epoch": 1145} {"train_loss": -5.694546222686768, "global_step": 48127, "epoch": 1145} {"train_loss": -5.769372940063477, "global_step": 48128, "epoch": 1145} {"train_loss": -5.5393524169921875, "global_step": 48129, "epoch": 1145} {"train_loss": -5.701936721801758, "global_step": 48130, "epoch": 1145} {"train_loss": -5.716051726114182, "global_step": 48131, "epoch": 1145, "val_loss": 61620.01953125} {"train_loss": -5.744132041931152, "global_step": 48132, "epoch": 1146} {"train_loss": -5.765812397003174, "global_step": 48133, "epoch": 1146} {"train_loss": -5.709506034851074, "global_step": 48134, "epoch": 1146} {"train_loss": -5.769759654998779, "global_step": 48135, "epoch": 1146} {"train_loss": -5.861361503601074, "global_step": 48136, "epoch": 1146} {"train_loss": -5.651560306549072, "global_step": 48137, "epoch": 1146} {"train_loss": -5.777600288391113, "global_step": 48138, "epoch": 1146} {"train_loss": -5.756282806396484, "global_step": 48139, "epoch": 1146} {"train_loss": -5.730451583862305, "global_step": 48140, "epoch": 1146} {"train_loss": -5.823030948638916, "global_step": 48141, "epoch": 1146} {"train_loss": -5.640909194946289, "global_step": 48142, "epoch": 1146} {"train_loss": -5.807660102844238, "global_step": 48143, "epoch": 1146} {"train_loss": -5.758945465087891, "global_step": 48144, "epoch": 1146} {"train_loss": -5.934676170349121, "global_step": 48145, "epoch": 1146} {"train_loss": -5.874757289886475, "global_step": 48146, "epoch": 1146} {"train_loss": -5.7531561851501465, "global_step": 48147, "epoch": 1146} {"train_loss": -5.659480094909668, "global_step": 48148, "epoch": 1146} {"train_loss": -5.829138278961182, "global_step": 48149, "epoch": 1146} {"train_loss": -5.785192489624023, "global_step": 48150, "epoch": 1146} {"train_loss": -5.730638027191162, "global_step": 48151, "epoch": 1146} {"train_loss": -5.868906021118164, "global_step": 48152, "epoch": 1146} {"train_loss": -5.634016513824463, "global_step": 48153, "epoch": 1146} {"train_loss": -5.892580032348633, "global_step": 48154, "epoch": 1146} {"train_loss": -5.721662998199463, "global_step": 48155, "epoch": 1146} {"train_loss": -5.702363967895508, "global_step": 48156, "epoch": 1146} {"train_loss": -5.694890975952148, "global_step": 48157, "epoch": 1146} {"train_loss": -5.744576930999756, "global_step": 48158, "epoch": 1146} {"train_loss": -5.659913063049316, "global_step": 48159, "epoch": 1146} {"train_loss": -5.752364635467529, "global_step": 48160, "epoch": 1146} {"train_loss": -5.617565155029297, "global_step": 48161, "epoch": 1146} {"train_loss": -5.718603610992432, "global_step": 48162, "epoch": 1146} {"train_loss": -5.667881011962891, "global_step": 48163, "epoch": 1146} {"train_loss": -5.70072078704834, "global_step": 48164, "epoch": 1146} {"train_loss": -5.6430253982543945, "global_step": 48165, "epoch": 1146} {"train_loss": -5.726777076721191, "global_step": 48166, "epoch": 1146} {"train_loss": -5.673829078674316, "global_step": 48167, "epoch": 1146} {"train_loss": -5.735205173492432, "global_step": 48168, "epoch": 1146} {"train_loss": -5.792103290557861, "global_step": 48169, "epoch": 1146} {"train_loss": -5.8062920570373535, "global_step": 48170, "epoch": 1146} {"train_loss": -5.774516582489014, "global_step": 48171, "epoch": 1146} {"train_loss": -5.848372936248779, "global_step": 48172, "epoch": 1146} {"train_loss": -5.749754531042917, "global_step": 48173, "epoch": 1146, "val_loss": 61142.28125} {"train_loss": -5.828826904296875, "global_step": 48174, "epoch": 1147} {"train_loss": -5.7137861251831055, "global_step": 48175, "epoch": 1147} {"train_loss": -5.666504859924316, "global_step": 48176, "epoch": 1147} {"train_loss": -5.7423858642578125, "global_step": 48177, "epoch": 1147} {"train_loss": -5.726283550262451, "global_step": 48178, "epoch": 1147} {"train_loss": -5.728946685791016, "global_step": 48179, "epoch": 1147} {"train_loss": -5.862802982330322, "global_step": 48180, "epoch": 1147} {"train_loss": -5.657580852508545, "global_step": 48181, "epoch": 1147} {"train_loss": -5.623128890991211, "global_step": 48182, "epoch": 1147} {"train_loss": -5.71398401260376, "global_step": 48183, "epoch": 1147} {"train_loss": -5.702974796295166, "global_step": 48184, "epoch": 1147} {"train_loss": -5.743278503417969, "global_step": 48185, "epoch": 1147} {"train_loss": -5.735119819641113, "global_step": 48186, "epoch": 1147} {"train_loss": -5.780910491943359, "global_step": 48187, "epoch": 1147} {"train_loss": -5.81110143661499, "global_step": 48188, "epoch": 1147} {"train_loss": -5.866558074951172, "global_step": 48189, "epoch": 1147} {"train_loss": -5.722550392150879, "global_step": 48190, "epoch": 1147} {"train_loss": -5.763659477233887, "global_step": 48191, "epoch": 1147} {"train_loss": -5.788852691650391, "global_step": 48192, "epoch": 1147} {"train_loss": -5.685667514801025, "global_step": 48193, "epoch": 1147} {"train_loss": -5.713152885437012, "global_step": 48194, "epoch": 1147} {"train_loss": -5.7718048095703125, "global_step": 48195, "epoch": 1147} {"train_loss": -5.7258782386779785, "global_step": 48196, "epoch": 1147} {"train_loss": -5.616031169891357, "global_step": 48197, "epoch": 1147} {"train_loss": -5.732184410095215, "global_step": 48198, "epoch": 1147} {"train_loss": -5.775500297546387, "global_step": 48199, "epoch": 1147} {"train_loss": -5.699037551879883, "global_step": 48200, "epoch": 1147} {"train_loss": -5.786094665527344, "global_step": 48201, "epoch": 1147} {"train_loss": -5.740804672241211, "global_step": 48202, "epoch": 1147} {"train_loss": -5.789361953735352, "global_step": 48203, "epoch": 1147} {"train_loss": -5.732311725616455, "global_step": 48204, "epoch": 1147} {"train_loss": -5.68571138381958, "global_step": 48205, "epoch": 1147} {"train_loss": -5.716642379760742, "global_step": 48206, "epoch": 1147} {"train_loss": -5.731585502624512, "global_step": 48207, "epoch": 1147} {"train_loss": -5.745794296264648, "global_step": 48208, "epoch": 1147} {"train_loss": -5.717660903930664, "global_step": 48209, "epoch": 1147} {"train_loss": -5.823270797729492, "global_step": 48210, "epoch": 1147} {"train_loss": -5.7684454917907715, "global_step": 48211, "epoch": 1147} {"train_loss": -5.700439453125, "global_step": 48212, "epoch": 1147} {"train_loss": -5.816100120544434, "global_step": 48213, "epoch": 1147} {"train_loss": -5.746009826660156, "global_step": 48214, "epoch": 1147} {"train_loss": -5.743868169330415, "global_step": 48215, "epoch": 1147, "val_loss": 61279.66796875} {"train_loss": -5.800807952880859, "global_step": 48216, "epoch": 1148} {"train_loss": -5.726675987243652, "global_step": 48217, "epoch": 1148} {"train_loss": -5.8360114097595215, "global_step": 48218, "epoch": 1148} {"train_loss": -5.804872512817383, "global_step": 48219, "epoch": 1148} {"train_loss": -5.685085296630859, "global_step": 48220, "epoch": 1148} {"train_loss": -5.798612117767334, "global_step": 48221, "epoch": 1148} {"train_loss": -5.706532001495361, "global_step": 48222, "epoch": 1148} {"train_loss": -5.753524303436279, "global_step": 48223, "epoch": 1148} {"train_loss": -5.822402000427246, "global_step": 48224, "epoch": 1148} {"train_loss": -5.804924964904785, "global_step": 48225, "epoch": 1148} {"train_loss": -5.652396202087402, "global_step": 48226, "epoch": 1148} {"train_loss": -5.952853679656982, "global_step": 48227, "epoch": 1148} {"train_loss": -5.72376823425293, "global_step": 48228, "epoch": 1148} {"train_loss": -5.794743061065674, "global_step": 48229, "epoch": 1148} {"train_loss": -5.831384658813477, "global_step": 48230, "epoch": 1148} {"train_loss": -5.88484525680542, "global_step": 48231, "epoch": 1148} {"train_loss": -5.81256103515625, "global_step": 48232, "epoch": 1148} {"train_loss": -5.733968257904053, "global_step": 48233, "epoch": 1148} {"train_loss": -5.863274574279785, "global_step": 48234, "epoch": 1148} {"train_loss": -5.781407356262207, "global_step": 48235, "epoch": 1148} {"train_loss": -5.800095558166504, "global_step": 48236, "epoch": 1148} {"train_loss": -5.7504167556762695, "global_step": 48237, "epoch": 1148} {"train_loss": -5.741864204406738, "global_step": 48238, "epoch": 1148} {"train_loss": -5.72186279296875, "global_step": 48239, "epoch": 1148} {"train_loss": -5.781594753265381, "global_step": 48240, "epoch": 1148} {"train_loss": -5.752874851226807, "global_step": 48241, "epoch": 1148} {"train_loss": -5.853206157684326, "global_step": 48242, "epoch": 1148} {"train_loss": -5.804308891296387, "global_step": 48243, "epoch": 1148} {"train_loss": -5.7737812995910645, "global_step": 48244, "epoch": 1148} {"train_loss": -5.717982292175293, "global_step": 48245, "epoch": 1148} {"train_loss": -5.786350727081299, "global_step": 48246, "epoch": 1148} {"train_loss": -5.794022083282471, "global_step": 48247, "epoch": 1148} {"train_loss": -5.766857147216797, "global_step": 48248, "epoch": 1148} {"train_loss": -5.718952178955078, "global_step": 48249, "epoch": 1148} {"train_loss": -5.469857215881348, "global_step": 48250, "epoch": 1148} {"train_loss": -5.730923175811768, "global_step": 48251, "epoch": 1148} {"train_loss": -5.772963523864746, "global_step": 48252, "epoch": 1148} {"train_loss": -5.733732223510742, "global_step": 48253, "epoch": 1148} {"train_loss": -5.818237781524658, "global_step": 48254, "epoch": 1148} {"train_loss": -5.7436723709106445, "global_step": 48255, "epoch": 1148} {"train_loss": -5.678987503051758, "global_step": 48256, "epoch": 1148} {"train_loss": -5.7651073932647705, "global_step": 48257, "epoch": 1148, "val_loss": 61561.5234375} {"train_loss": -5.657764911651611, "global_step": 48258, "epoch": 1149} {"train_loss": -5.717259407043457, "global_step": 48259, "epoch": 1149} {"train_loss": -5.828690052032471, "global_step": 48260, "epoch": 1149} {"train_loss": -5.70192813873291, "global_step": 48261, "epoch": 1149} {"train_loss": -5.710700988769531, "global_step": 48262, "epoch": 1149} {"train_loss": -5.723711013793945, "global_step": 48263, "epoch": 1149} {"train_loss": -5.7710065841674805, "global_step": 48264, "epoch": 1149} {"train_loss": -5.675490379333496, "global_step": 48265, "epoch": 1149} {"train_loss": -5.7937493324279785, "global_step": 48266, "epoch": 1149} {"train_loss": -5.7820281982421875, "global_step": 48267, "epoch": 1149} {"train_loss": -5.7907233238220215, "global_step": 48268, "epoch": 1149} {"train_loss": -5.801755905151367, "global_step": 48269, "epoch": 1149} {"train_loss": -5.8371734619140625, "global_step": 48270, "epoch": 1149} {"train_loss": -5.850955963134766, "global_step": 48271, "epoch": 1149} {"train_loss": -5.715273857116699, "global_step": 48272, "epoch": 1149} {"train_loss": -5.69843864440918, "global_step": 48273, "epoch": 1149} {"train_loss": -5.766718864440918, "global_step": 48274, "epoch": 1149} {"train_loss": -5.853696823120117, "global_step": 48275, "epoch": 1149} {"train_loss": -5.772027015686035, "global_step": 48276, "epoch": 1149} {"train_loss": -5.841403484344482, "global_step": 48277, "epoch": 1149} {"train_loss": -5.760128974914551, "global_step": 48278, "epoch": 1149} {"train_loss": -5.837893962860107, "global_step": 48279, "epoch": 1149} {"train_loss": -5.885724067687988, "global_step": 48280, "epoch": 1149} {"train_loss": -5.817933082580566, "global_step": 48281, "epoch": 1149} {"train_loss": -5.740464210510254, "global_step": 48282, "epoch": 1149} {"train_loss": -5.868556976318359, "global_step": 48283, "epoch": 1149} {"train_loss": -5.614416599273682, "global_step": 48284, "epoch": 1149} {"train_loss": -5.750588417053223, "global_step": 48285, "epoch": 1149} {"train_loss": -5.765039443969727, "global_step": 48286, "epoch": 1149} {"train_loss": -5.7549309730529785, "global_step": 48287, "epoch": 1149} {"train_loss": -5.788046360015869, "global_step": 48288, "epoch": 1149} {"train_loss": -5.806593894958496, "global_step": 48289, "epoch": 1149} {"train_loss": -5.716781139373779, "global_step": 48290, "epoch": 1149} {"train_loss": -5.75709342956543, "global_step": 48291, "epoch": 1149} {"train_loss": -5.728728771209717, "global_step": 48292, "epoch": 1149} {"train_loss": -5.891899585723877, "global_step": 48293, "epoch": 1149} {"train_loss": -5.617631912231445, "global_step": 48294, "epoch": 1149} {"train_loss": -5.603420257568359, "global_step": 48295, "epoch": 1149} {"train_loss": -5.76542854309082, "global_step": 48296, "epoch": 1149} {"train_loss": -5.593742847442627, "global_step": 48297, "epoch": 1149} {"train_loss": -5.732688903808594, "global_step": 48298, "epoch": 1149} {"train_loss": -5.754354590461368, "global_step": 48299, "epoch": 1149, "val_loss": 61903.640625} {"train_loss": -5.729094982147217, "global_step": 48300, "epoch": 1150} {"train_loss": -5.610344886779785, "global_step": 48301, "epoch": 1150} {"train_loss": -5.636381149291992, "global_step": 48302, "epoch": 1150} {"train_loss": -5.790061950683594, "global_step": 48303, "epoch": 1150} {"train_loss": -5.674900054931641, "global_step": 48304, "epoch": 1150} {"train_loss": -5.6989850997924805, "global_step": 48305, "epoch": 1150} {"train_loss": -5.753279685974121, "global_step": 48306, "epoch": 1150} {"train_loss": -5.705689907073975, "global_step": 48307, "epoch": 1150} {"train_loss": -5.784289360046387, "global_step": 48308, "epoch": 1150} {"train_loss": -5.671393394470215, "global_step": 48309, "epoch": 1150} {"train_loss": -5.747673988342285, "global_step": 48310, "epoch": 1150} {"train_loss": -5.707554817199707, "global_step": 48311, "epoch": 1150} {"train_loss": -5.772655487060547, "global_step": 48312, "epoch": 1150} {"train_loss": -5.717004776000977, "global_step": 48313, "epoch": 1150} {"train_loss": -5.789436340332031, "global_step": 48314, "epoch": 1150} {"train_loss": -5.740586280822754, "global_step": 48315, "epoch": 1150} {"train_loss": -5.74129581451416, "global_step": 48316, "epoch": 1150} {"train_loss": -5.7123541831970215, "global_step": 48317, "epoch": 1150} {"train_loss": -5.762400150299072, "global_step": 48318, "epoch": 1150} {"train_loss": -5.714996337890625, "global_step": 48319, "epoch": 1150} {"train_loss": -5.771221160888672, "global_step": 48320, "epoch": 1150} {"train_loss": -5.810842514038086, "global_step": 48321, "epoch": 1150} {"train_loss": -5.821275234222412, "global_step": 48322, "epoch": 1150} {"train_loss": -5.781294345855713, "global_step": 48323, "epoch": 1150} {"train_loss": -5.686688423156738, "global_step": 48324, "epoch": 1150} {"train_loss": -5.8110857009887695, "global_step": 48325, "epoch": 1150} {"train_loss": -5.818597793579102, "global_step": 48326, "epoch": 1150} {"train_loss": -5.781050205230713, "global_step": 48327, "epoch": 1150} {"train_loss": -5.745840072631836, "global_step": 48328, "epoch": 1150} {"train_loss": -5.783489227294922, "global_step": 48329, "epoch": 1150} {"train_loss": -5.702500343322754, "global_step": 48330, "epoch": 1150} {"train_loss": -5.76901388168335, "global_step": 48331, "epoch": 1150} {"train_loss": -5.6395769119262695, "global_step": 48332, "epoch": 1150} {"train_loss": -5.743839263916016, "global_step": 48333, "epoch": 1150} {"train_loss": -5.751202583312988, "global_step": 48334, "epoch": 1150} {"train_loss": -5.683849334716797, "global_step": 48335, "epoch": 1150} {"train_loss": -5.7553606033325195, "global_step": 48336, "epoch": 1150} {"train_loss": -5.667491436004639, "global_step": 48337, "epoch": 1150} {"train_loss": -5.837282657623291, "global_step": 48338, "epoch": 1150} {"train_loss": -5.773874282836914, "global_step": 48339, "epoch": 1150} {"train_loss": -5.776542663574219, "global_step": 48340, "epoch": 1150} {"train_loss": -5.739247798919678, "global_step": 48341, "epoch": 1150, "train/sim_max_reward_0": 0.39777940227368314, "train/sim_max_reward_1": 0.8384464015763343, "train/sim_max_reward_2": 0.6429517200318453, "train/sim_max_reward_3": 0.8471904366305592, "train/sim_max_reward_4": 0.8430940148440419, "train/sim_max_reward_5": 0.729681422774626, "test/sim_max_reward_4300000": 0.5155958806717997, "test/sim_max_reward_4300001": 0.18440261521427845, "test/sim_max_reward_4300002": 0.835576152792104, "test/sim_max_reward_4300003": 0.5862327903825116, "test/sim_max_reward_4300004": 0.7044712330713399, "test/sim_max_reward_4300005": 0.9128899809819526, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.6884858123235464, "test/sim_max_reward_4300008": 0.8718030411644522, "test/sim_max_reward_4300009": 0.859508063996567, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.4747738439813153, "test/sim_max_reward_4300012": 0.9083231566954633, "test/sim_max_reward_4300013": 0.7797210921905258, "test/sim_max_reward_4300014": 0.9690413891184786, "test/sim_max_reward_4300015": 0.22434380981056135, "test/sim_max_reward_4300016": 0.7467161728175719, "test/sim_max_reward_4300017": 0.4402438744465765, "test/sim_max_reward_4300018": 0.42320869472501366, "test/sim_max_reward_4300019": 0.18517105418684984, "test/sim_max_reward_4300020": 0.9288182733285788, "test/sim_max_reward_4300021": 0.6100867741016074, "test/sim_max_reward_4300022": 0.22561886020943703, "test/sim_max_reward_4300023": 0.35978767199832995, "test/sim_max_reward_4300024": 0.09780279186028724, "test/sim_max_reward_4300025": 0.7231266109930279, "test/sim_max_reward_4300026": 0.17343785153031085, "test/sim_max_reward_4300027": 0.8013209792664302, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.248113926306843, "test/sim_max_reward_4300032": 0.8525180943666218, "test/sim_max_reward_4300033": 0.4115492497347886, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.6978429614317452, "test/sim_max_reward_4300038": 0.7020151037951257, "test/sim_max_reward_4300039": 0.5001510362644899, "test/sim_max_reward_4300040": 0.25513225784139076, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.8777882283760262, "test/sim_max_reward_4300043": 0.14591637633667903, "test/sim_max_reward_4300044": 0.7484432617691775, "test/sim_max_reward_4300045": 0.19072675622367624, "test/sim_max_reward_4300046": 0.6462284105763262, "test/sim_max_reward_4300047": 0.18182502695689523, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.03883142324995514, "train/mean_score": 0.7165238996885149, "test/mean_score": 0.43853569401304276, "val_loss": 61183.53125} {"train_loss": -5.896759033203125, "global_step": 48342, "epoch": 1151} {"train_loss": -5.813789367675781, "global_step": 48343, "epoch": 1151} {"train_loss": -5.794840335845947, "global_step": 48344, "epoch": 1151} {"train_loss": -5.790351867675781, "global_step": 48345, "epoch": 1151} {"train_loss": -5.869341850280762, "global_step": 48346, "epoch": 1151} {"train_loss": -5.665835380554199, "global_step": 48347, "epoch": 1151} {"train_loss": -5.812565803527832, "global_step": 48348, "epoch": 1151} {"train_loss": -5.667605400085449, "global_step": 48349, "epoch": 1151} {"train_loss": -5.901791572570801, "global_step": 48350, "epoch": 1151} {"train_loss": -5.795989036560059, "global_step": 48351, "epoch": 1151} {"train_loss": -5.612007141113281, "global_step": 48352, "epoch": 1151} {"train_loss": -5.592031955718994, "global_step": 48353, "epoch": 1151} {"train_loss": -5.749013423919678, "global_step": 48354, "epoch": 1151} {"train_loss": -5.617942810058594, "global_step": 48355, "epoch": 1151} {"train_loss": -5.614261627197266, "global_step": 48356, "epoch": 1151} {"train_loss": -5.740762233734131, "global_step": 48357, "epoch": 1151} {"train_loss": -5.6065497398376465, "global_step": 48358, "epoch": 1151} {"train_loss": -5.722831726074219, "global_step": 48359, "epoch": 1151} {"train_loss": -5.733804225921631, "global_step": 48360, "epoch": 1151} {"train_loss": -5.728387832641602, "global_step": 48361, "epoch": 1151} {"train_loss": -5.830624580383301, "global_step": 48362, "epoch": 1151} {"train_loss": -5.593503952026367, "global_step": 48363, "epoch": 1151} {"train_loss": -5.811315536499023, "global_step": 48364, "epoch": 1151} {"train_loss": -5.638260364532471, "global_step": 48365, "epoch": 1151} {"train_loss": -5.651098251342773, "global_step": 48366, "epoch": 1151} {"train_loss": -5.721382141113281, "global_step": 48367, "epoch": 1151} {"train_loss": -5.596548080444336, "global_step": 48368, "epoch": 1151} {"train_loss": -5.674037456512451, "global_step": 48369, "epoch": 1151} {"train_loss": -5.688723564147949, "global_step": 48370, "epoch": 1151} {"train_loss": -5.741262912750244, "global_step": 48371, "epoch": 1151} {"train_loss": -5.76339054107666, "global_step": 48372, "epoch": 1151} {"train_loss": -5.678278923034668, "global_step": 48373, "epoch": 1151} {"train_loss": -5.733780860900879, "global_step": 48374, "epoch": 1151} {"train_loss": -5.739587306976318, "global_step": 48375, "epoch": 1151} {"train_loss": -5.785623073577881, "global_step": 48376, "epoch": 1151} {"train_loss": -5.7233757972717285, "global_step": 48377, "epoch": 1151} {"train_loss": -5.681663990020752, "global_step": 48378, "epoch": 1151} {"train_loss": -5.733912467956543, "global_step": 48379, "epoch": 1151} {"train_loss": -5.731143951416016, "global_step": 48380, "epoch": 1151} {"train_loss": -5.635370254516602, "global_step": 48381, "epoch": 1151} {"train_loss": -5.712021827697754, "global_step": 48382, "epoch": 1151} {"train_loss": -5.719167663937523, "global_step": 48383, "epoch": 1151, "val_loss": 61709.90625} {"train_loss": -5.616109371185303, "global_step": 48384, "epoch": 1152} {"train_loss": -5.676587104797363, "global_step": 48385, "epoch": 1152} {"train_loss": -5.604389190673828, "global_step": 48386, "epoch": 1152} {"train_loss": -5.720861911773682, "global_step": 48387, "epoch": 1152} {"train_loss": -5.584458351135254, "global_step": 48388, "epoch": 1152} {"train_loss": -5.759955883026123, "global_step": 48389, "epoch": 1152} {"train_loss": -5.716901779174805, "global_step": 48390, "epoch": 1152} {"train_loss": -5.7975873947143555, "global_step": 48391, "epoch": 1152} {"train_loss": -5.775779724121094, "global_step": 48392, "epoch": 1152} {"train_loss": -5.748180389404297, "global_step": 48393, "epoch": 1152} {"train_loss": -5.655096530914307, "global_step": 48394, "epoch": 1152} {"train_loss": -5.703798770904541, "global_step": 48395, "epoch": 1152} {"train_loss": -5.746260643005371, "global_step": 48396, "epoch": 1152} {"train_loss": -5.88646125793457, "global_step": 48397, "epoch": 1152} {"train_loss": -5.647004127502441, "global_step": 48398, "epoch": 1152} {"train_loss": -5.76797342300415, "global_step": 48399, "epoch": 1152} {"train_loss": -5.667822360992432, "global_step": 48400, "epoch": 1152} {"train_loss": -5.785735130310059, "global_step": 48401, "epoch": 1152} {"train_loss": -5.788609504699707, "global_step": 48402, "epoch": 1152} {"train_loss": -5.823625564575195, "global_step": 48403, "epoch": 1152} {"train_loss": -5.786830902099609, "global_step": 48404, "epoch": 1152} {"train_loss": -5.614103317260742, "global_step": 48405, "epoch": 1152} {"train_loss": -5.784049034118652, "global_step": 48406, "epoch": 1152} {"train_loss": -5.740761756896973, "global_step": 48407, "epoch": 1152} {"train_loss": -5.803676128387451, "global_step": 48408, "epoch": 1152} {"train_loss": -5.702528953552246, "global_step": 48409, "epoch": 1152} {"train_loss": -5.695167064666748, "global_step": 48410, "epoch": 1152} {"train_loss": -5.742786407470703, "global_step": 48411, "epoch": 1152} {"train_loss": -5.830748558044434, "global_step": 48412, "epoch": 1152} {"train_loss": -5.724700927734375, "global_step": 48413, "epoch": 1152} {"train_loss": -5.858281135559082, "global_step": 48414, "epoch": 1152} {"train_loss": -5.778717994689941, "global_step": 48415, "epoch": 1152} {"train_loss": -5.7772955894470215, "global_step": 48416, "epoch": 1152} {"train_loss": -5.752876281738281, "global_step": 48417, "epoch": 1152} {"train_loss": -5.766119003295898, "global_step": 48418, "epoch": 1152} {"train_loss": -5.722831726074219, "global_step": 48419, "epoch": 1152} {"train_loss": -5.753747940063477, "global_step": 48420, "epoch": 1152} {"train_loss": -5.834095001220703, "global_step": 48421, "epoch": 1152} {"train_loss": -5.709446907043457, "global_step": 48422, "epoch": 1152} {"train_loss": -5.798905372619629, "global_step": 48423, "epoch": 1152} {"train_loss": -5.832386016845703, "global_step": 48424, "epoch": 1152} {"train_loss": -5.745984656470163, "global_step": 48425, "epoch": 1152, "val_loss": 61492.91015625} {"train_loss": -5.711884498596191, "global_step": 48426, "epoch": 1153} {"train_loss": -5.757810115814209, "global_step": 48427, "epoch": 1153} {"train_loss": -5.847281455993652, "global_step": 48428, "epoch": 1153} {"train_loss": -5.7711286544799805, "global_step": 48429, "epoch": 1153} {"train_loss": -5.873861789703369, "global_step": 48430, "epoch": 1153} {"train_loss": -5.7006425857543945, "global_step": 48431, "epoch": 1153} {"train_loss": -5.797835826873779, "global_step": 48432, "epoch": 1153} {"train_loss": -5.679409027099609, "global_step": 48433, "epoch": 1153} {"train_loss": -5.846434116363525, "global_step": 48434, "epoch": 1153} {"train_loss": -5.688231468200684, "global_step": 48435, "epoch": 1153} {"train_loss": -5.7494354248046875, "global_step": 48436, "epoch": 1153} {"train_loss": -5.675209999084473, "global_step": 48437, "epoch": 1153} {"train_loss": -5.867519378662109, "global_step": 48438, "epoch": 1153} {"train_loss": -5.860515594482422, "global_step": 48439, "epoch": 1153} {"train_loss": -5.828685760498047, "global_step": 48440, "epoch": 1153} {"train_loss": -5.811797618865967, "global_step": 48441, "epoch": 1153} {"train_loss": -5.797125339508057, "global_step": 48442, "epoch": 1153} {"train_loss": -5.634479522705078, "global_step": 48443, "epoch": 1153} {"train_loss": -5.812363147735596, "global_step": 48444, "epoch": 1153} {"train_loss": -5.7589430809021, "global_step": 48445, "epoch": 1153} {"train_loss": -5.800022125244141, "global_step": 48446, "epoch": 1153} {"train_loss": -5.7054290771484375, "global_step": 48447, "epoch": 1153} {"train_loss": -5.737308502197266, "global_step": 48448, "epoch": 1153} {"train_loss": -5.652637004852295, "global_step": 48449, "epoch": 1153} {"train_loss": -5.871746063232422, "global_step": 48450, "epoch": 1153} {"train_loss": -5.673239707946777, "global_step": 48451, "epoch": 1153} {"train_loss": -5.67822265625, "global_step": 48452, "epoch": 1153} {"train_loss": -5.82090950012207, "global_step": 48453, "epoch": 1153} {"train_loss": -5.708428382873535, "global_step": 48454, "epoch": 1153} {"train_loss": -5.658857822418213, "global_step": 48455, "epoch": 1153} {"train_loss": -5.786611557006836, "global_step": 48456, "epoch": 1153} {"train_loss": -5.7329230308532715, "global_step": 48457, "epoch": 1153} {"train_loss": -5.7090559005737305, "global_step": 48458, "epoch": 1153} {"train_loss": -5.743108749389648, "global_step": 48459, "epoch": 1153} {"train_loss": -5.781207084655762, "global_step": 48460, "epoch": 1153} {"train_loss": -5.805991172790527, "global_step": 48461, "epoch": 1153} {"train_loss": -5.793368816375732, "global_step": 48462, "epoch": 1153} {"train_loss": -5.858945846557617, "global_step": 48463, "epoch": 1153} {"train_loss": -5.842658519744873, "global_step": 48464, "epoch": 1153} {"train_loss": -5.720207214355469, "global_step": 48465, "epoch": 1153} {"train_loss": -5.7689619064331055, "global_step": 48466, "epoch": 1153} {"train_loss": -5.763815811702183, "global_step": 48467, "epoch": 1153, "val_loss": 62034.00390625} {"train_loss": -5.653459072113037, "global_step": 48468, "epoch": 1154} {"train_loss": -5.801476001739502, "global_step": 48469, "epoch": 1154} {"train_loss": -5.741711616516113, "global_step": 48470, "epoch": 1154} {"train_loss": -5.6440229415893555, "global_step": 48471, "epoch": 1154} {"train_loss": -5.752674102783203, "global_step": 48472, "epoch": 1154} {"train_loss": -5.78740119934082, "global_step": 48473, "epoch": 1154} {"train_loss": -5.774317741394043, "global_step": 48474, "epoch": 1154} {"train_loss": -5.8746232986450195, "global_step": 48475, "epoch": 1154} {"train_loss": -5.768849849700928, "global_step": 48476, "epoch": 1154} {"train_loss": -5.7717695236206055, "global_step": 48477, "epoch": 1154} {"train_loss": -5.7907867431640625, "global_step": 48478, "epoch": 1154} {"train_loss": -5.803753852844238, "global_step": 48479, "epoch": 1154} {"train_loss": -5.637729644775391, "global_step": 48480, "epoch": 1154} {"train_loss": -5.62996244430542, "global_step": 48481, "epoch": 1154} {"train_loss": -5.75404167175293, "global_step": 48482, "epoch": 1154} {"train_loss": -5.653971195220947, "global_step": 48483, "epoch": 1154} {"train_loss": -5.657105445861816, "global_step": 48484, "epoch": 1154} {"train_loss": -5.734979629516602, "global_step": 48485, "epoch": 1154} {"train_loss": -5.672926902770996, "global_step": 48486, "epoch": 1154} {"train_loss": -5.757370471954346, "global_step": 48487, "epoch": 1154} {"train_loss": -5.771839141845703, "global_step": 48488, "epoch": 1154} {"train_loss": -5.644318580627441, "global_step": 48489, "epoch": 1154} {"train_loss": -5.784926891326904, "global_step": 48490, "epoch": 1154} {"train_loss": -5.596007347106934, "global_step": 48491, "epoch": 1154} {"train_loss": -5.756747245788574, "global_step": 48492, "epoch": 1154} {"train_loss": -5.631871223449707, "global_step": 48493, "epoch": 1154} {"train_loss": -5.7483625411987305, "global_step": 48494, "epoch": 1154} {"train_loss": -5.73114013671875, "global_step": 48495, "epoch": 1154} {"train_loss": -5.663760185241699, "global_step": 48496, "epoch": 1154} {"train_loss": -5.636724948883057, "global_step": 48497, "epoch": 1154} {"train_loss": -5.896153450012207, "global_step": 48498, "epoch": 1154} {"train_loss": -5.731732368469238, "global_step": 48499, "epoch": 1154} {"train_loss": -5.77085018157959, "global_step": 48500, "epoch": 1154} {"train_loss": -5.852169990539551, "global_step": 48501, "epoch": 1154} {"train_loss": -5.811337471008301, "global_step": 48502, "epoch": 1154} {"train_loss": -5.709142684936523, "global_step": 48503, "epoch": 1154} {"train_loss": -5.708905220031738, "global_step": 48504, "epoch": 1154} {"train_loss": -5.5735626220703125, "global_step": 48505, "epoch": 1154} {"train_loss": -5.744479179382324, "global_step": 48506, "epoch": 1154} {"train_loss": -5.696794033050537, "global_step": 48507, "epoch": 1154} {"train_loss": -5.785280704498291, "global_step": 48508, "epoch": 1154} {"train_loss": -5.73063782283238, "global_step": 48509, "epoch": 1154, "val_loss": 61623.37890625} {"train_loss": -5.666057109832764, "global_step": 48510, "epoch": 1155} {"train_loss": -5.736045837402344, "global_step": 48511, "epoch": 1155} {"train_loss": -5.846603870391846, "global_step": 48512, "epoch": 1155} {"train_loss": -5.909231662750244, "global_step": 48513, "epoch": 1155} {"train_loss": -5.615278244018555, "global_step": 48514, "epoch": 1155} {"train_loss": -5.831222057342529, "global_step": 48515, "epoch": 1155} {"train_loss": -5.755409240722656, "global_step": 48516, "epoch": 1155} {"train_loss": -5.720877647399902, "global_step": 48517, "epoch": 1155} {"train_loss": -5.734757900238037, "global_step": 48518, "epoch": 1155} {"train_loss": -5.713526248931885, "global_step": 48519, "epoch": 1155} {"train_loss": -5.802412033081055, "global_step": 48520, "epoch": 1155} {"train_loss": -5.653085231781006, "global_step": 48521, "epoch": 1155} {"train_loss": -5.619419097900391, "global_step": 48522, "epoch": 1155} {"train_loss": -5.780254364013672, "global_step": 48523, "epoch": 1155} {"train_loss": -5.852934837341309, "global_step": 48524, "epoch": 1155} {"train_loss": -5.713773250579834, "global_step": 48525, "epoch": 1155} {"train_loss": -5.876596927642822, "global_step": 48526, "epoch": 1155} {"train_loss": -5.784173011779785, "global_step": 48527, "epoch": 1155} {"train_loss": -5.830200672149658, "global_step": 48528, "epoch": 1155} {"train_loss": -5.8815813064575195, "global_step": 48529, "epoch": 1155} {"train_loss": -5.833589553833008, "global_step": 48530, "epoch": 1155} {"train_loss": -5.719797134399414, "global_step": 48531, "epoch": 1155} {"train_loss": -5.733635902404785, "global_step": 48532, "epoch": 1155} {"train_loss": -5.70814847946167, "global_step": 48533, "epoch": 1155} {"train_loss": -5.760857105255127, "global_step": 48534, "epoch": 1155} {"train_loss": -5.840167999267578, "global_step": 48535, "epoch": 1155} {"train_loss": -5.787505149841309, "global_step": 48536, "epoch": 1155} {"train_loss": -5.862790107727051, "global_step": 48537, "epoch": 1155} {"train_loss": -5.652000427246094, "global_step": 48538, "epoch": 1155} {"train_loss": -5.7014570236206055, "global_step": 48539, "epoch": 1155} {"train_loss": -5.739347457885742, "global_step": 48540, "epoch": 1155} {"train_loss": -5.685772895812988, "global_step": 48541, "epoch": 1155} {"train_loss": -5.732897758483887, "global_step": 48542, "epoch": 1155} {"train_loss": -5.839612007141113, "global_step": 48543, "epoch": 1155} {"train_loss": -5.828958511352539, "global_step": 48544, "epoch": 1155} {"train_loss": -5.779565811157227, "global_step": 48545, "epoch": 1155} {"train_loss": -5.745260715484619, "global_step": 48546, "epoch": 1155} {"train_loss": -5.758712291717529, "global_step": 48547, "epoch": 1155} {"train_loss": -5.738171100616455, "global_step": 48548, "epoch": 1155} {"train_loss": -5.720180511474609, "global_step": 48549, "epoch": 1155} {"train_loss": -5.753168106079102, "global_step": 48550, "epoch": 1155} {"train_loss": -5.763128848302932, "global_step": 48551, "epoch": 1155, "val_loss": 61555.93359375} {"train_loss": -5.680118560791016, "global_step": 48552, "epoch": 1156} {"train_loss": -5.814938545227051, "global_step": 48553, "epoch": 1156} {"train_loss": -5.722886562347412, "global_step": 48554, "epoch": 1156} {"train_loss": -5.816669940948486, "global_step": 48555, "epoch": 1156} {"train_loss": -5.854902267456055, "global_step": 48556, "epoch": 1156} {"train_loss": -5.765809535980225, "global_step": 48557, "epoch": 1156} {"train_loss": -5.7047882080078125, "global_step": 48558, "epoch": 1156} {"train_loss": -5.735102653503418, "global_step": 48559, "epoch": 1156} {"train_loss": -5.794917106628418, "global_step": 48560, "epoch": 1156} {"train_loss": -5.905389308929443, "global_step": 48561, "epoch": 1156} {"train_loss": -5.740243434906006, "global_step": 48562, "epoch": 1156} {"train_loss": -5.727025508880615, "global_step": 48563, "epoch": 1156} {"train_loss": -5.803894996643066, "global_step": 48564, "epoch": 1156} {"train_loss": -5.619907855987549, "global_step": 48565, "epoch": 1156} {"train_loss": -5.688560962677002, "global_step": 48566, "epoch": 1156} {"train_loss": -5.830672264099121, "global_step": 48567, "epoch": 1156} {"train_loss": -5.67704963684082, "global_step": 48568, "epoch": 1156} {"train_loss": -5.731884002685547, "global_step": 48569, "epoch": 1156} {"train_loss": -5.841211318969727, "global_step": 48570, "epoch": 1156} {"train_loss": -5.7390289306640625, "global_step": 48571, "epoch": 1156} {"train_loss": -5.70894718170166, "global_step": 48572, "epoch": 1156} {"train_loss": -5.7043232917785645, "global_step": 48573, "epoch": 1156} {"train_loss": -5.877142906188965, "global_step": 48574, "epoch": 1156} {"train_loss": -5.723258018493652, "global_step": 48575, "epoch": 1156} {"train_loss": -5.727809906005859, "global_step": 48576, "epoch": 1156} {"train_loss": -5.692300796508789, "global_step": 48577, "epoch": 1156} {"train_loss": -5.825590133666992, "global_step": 48578, "epoch": 1156} {"train_loss": -5.8907060623168945, "global_step": 48579, "epoch": 1156} {"train_loss": -5.798443794250488, "global_step": 48580, "epoch": 1156} {"train_loss": -5.751856803894043, "global_step": 48581, "epoch": 1156} {"train_loss": -5.678713321685791, "global_step": 48582, "epoch": 1156} {"train_loss": -5.854904651641846, "global_step": 48583, "epoch": 1156} {"train_loss": -5.704922676086426, "global_step": 48584, "epoch": 1156} {"train_loss": -5.899449348449707, "global_step": 48585, "epoch": 1156} {"train_loss": -5.7452898025512695, "global_step": 48586, "epoch": 1156} {"train_loss": -5.724399089813232, "global_step": 48587, "epoch": 1156} {"train_loss": -5.759392738342285, "global_step": 48588, "epoch": 1156} {"train_loss": -5.782319068908691, "global_step": 48589, "epoch": 1156} {"train_loss": -5.782090187072754, "global_step": 48590, "epoch": 1156} {"train_loss": -5.794734954833984, "global_step": 48591, "epoch": 1156} {"train_loss": -5.702574729919434, "global_step": 48592, "epoch": 1156} {"train_loss": -5.764206034796579, "global_step": 48593, "epoch": 1156, "val_loss": 61390.2265625} {"train_loss": -5.826535701751709, "global_step": 48594, "epoch": 1157} {"train_loss": -5.788602352142334, "global_step": 48595, "epoch": 1157} {"train_loss": -5.599321365356445, "global_step": 48596, "epoch": 1157} {"train_loss": -5.705434799194336, "global_step": 48597, "epoch": 1157} {"train_loss": -5.658615589141846, "global_step": 48598, "epoch": 1157} {"train_loss": -5.692507266998291, "global_step": 48599, "epoch": 1157} {"train_loss": -5.662954807281494, "global_step": 48600, "epoch": 1157} {"train_loss": -5.81450891494751, "global_step": 48601, "epoch": 1157} {"train_loss": -5.886345863342285, "global_step": 48602, "epoch": 1157} {"train_loss": -5.801203727722168, "global_step": 48603, "epoch": 1157} {"train_loss": -5.790214538574219, "global_step": 48604, "epoch": 1157} {"train_loss": -5.697758674621582, "global_step": 48605, "epoch": 1157} {"train_loss": -5.898690223693848, "global_step": 48606, "epoch": 1157} {"train_loss": -5.749985694885254, "global_step": 48607, "epoch": 1157} {"train_loss": -5.847253799438477, "global_step": 48608, "epoch": 1157} {"train_loss": -5.595852375030518, "global_step": 48609, "epoch": 1157} {"train_loss": -5.737414360046387, "global_step": 48610, "epoch": 1157} {"train_loss": -5.65674352645874, "global_step": 48611, "epoch": 1157} {"train_loss": -5.696966648101807, "global_step": 48612, "epoch": 1157} {"train_loss": -5.823233127593994, "global_step": 48613, "epoch": 1157} {"train_loss": -5.761141777038574, "global_step": 48614, "epoch": 1157} {"train_loss": -5.635623931884766, "global_step": 48615, "epoch": 1157} {"train_loss": -5.815158843994141, "global_step": 48616, "epoch": 1157} {"train_loss": -5.635140419006348, "global_step": 48617, "epoch": 1157} {"train_loss": -5.734055995941162, "global_step": 48618, "epoch": 1157} {"train_loss": -5.844548225402832, "global_step": 48619, "epoch": 1157} {"train_loss": -5.546665668487549, "global_step": 48620, "epoch": 1157} {"train_loss": -5.7078375816345215, "global_step": 48621, "epoch": 1157} {"train_loss": -5.802530288696289, "global_step": 48622, "epoch": 1157} {"train_loss": -5.586926460266113, "global_step": 48623, "epoch": 1157} {"train_loss": -5.8039870262146, "global_step": 48624, "epoch": 1157} {"train_loss": -5.630216598510742, "global_step": 48625, "epoch": 1157} {"train_loss": -5.681272506713867, "global_step": 48626, "epoch": 1157} {"train_loss": -5.711382865905762, "global_step": 48627, "epoch": 1157} {"train_loss": -5.766778469085693, "global_step": 48628, "epoch": 1157} {"train_loss": -5.750092029571533, "global_step": 48629, "epoch": 1157} {"train_loss": -5.6685380935668945, "global_step": 48630, "epoch": 1157} {"train_loss": -5.750430107116699, "global_step": 48631, "epoch": 1157} {"train_loss": -5.649701118469238, "global_step": 48632, "epoch": 1157} {"train_loss": -5.752921104431152, "global_step": 48633, "epoch": 1157} {"train_loss": -5.704436302185059, "global_step": 48634, "epoch": 1157} {"train_loss": -5.729197184244792, "global_step": 48635, "epoch": 1157, "val_loss": 61762.0625} {"train_loss": -5.807437896728516, "global_step": 48636, "epoch": 1158} {"train_loss": -5.874709606170654, "global_step": 48637, "epoch": 1158} {"train_loss": -5.715712547302246, "global_step": 48638, "epoch": 1158} {"train_loss": -5.637764930725098, "global_step": 48639, "epoch": 1158} {"train_loss": -5.866490364074707, "global_step": 48640, "epoch": 1158} {"train_loss": -5.743346691131592, "global_step": 48641, "epoch": 1158} {"train_loss": -5.704509258270264, "global_step": 48642, "epoch": 1158} {"train_loss": -5.7488627433776855, "global_step": 48643, "epoch": 1158} {"train_loss": -5.824897766113281, "global_step": 48644, "epoch": 1158} {"train_loss": -5.733790397644043, "global_step": 48645, "epoch": 1158} {"train_loss": -5.698191165924072, "global_step": 48646, "epoch": 1158} {"train_loss": -5.795379638671875, "global_step": 48647, "epoch": 1158} {"train_loss": -5.709670066833496, "global_step": 48648, "epoch": 1158} {"train_loss": -5.748900890350342, "global_step": 48649, "epoch": 1158} {"train_loss": -5.785355567932129, "global_step": 48650, "epoch": 1158} {"train_loss": -5.604016304016113, "global_step": 48651, "epoch": 1158} {"train_loss": -5.801694869995117, "global_step": 48652, "epoch": 1158} {"train_loss": -5.789937496185303, "global_step": 48653, "epoch": 1158} {"train_loss": -5.733486652374268, "global_step": 48654, "epoch": 1158} {"train_loss": -5.818811893463135, "global_step": 48655, "epoch": 1158} {"train_loss": -5.641829490661621, "global_step": 48656, "epoch": 1158} {"train_loss": -5.724191665649414, "global_step": 48657, "epoch": 1158} {"train_loss": -5.825921535491943, "global_step": 48658, "epoch": 1158} {"train_loss": -5.715230941772461, "global_step": 48659, "epoch": 1158} {"train_loss": -5.7824554443359375, "global_step": 48660, "epoch": 1158} {"train_loss": -5.654613971710205, "global_step": 48661, "epoch": 1158} {"train_loss": -5.7476606369018555, "global_step": 48662, "epoch": 1158} {"train_loss": -5.7530999183654785, "global_step": 48663, "epoch": 1158} {"train_loss": -5.780072212219238, "global_step": 48664, "epoch": 1158} {"train_loss": -5.7771501541137695, "global_step": 48665, "epoch": 1158} {"train_loss": -5.734097003936768, "global_step": 48666, "epoch": 1158} {"train_loss": -5.727402687072754, "global_step": 48667, "epoch": 1158} {"train_loss": -5.827653884887695, "global_step": 48668, "epoch": 1158} {"train_loss": -5.830345153808594, "global_step": 48669, "epoch": 1158} {"train_loss": -5.719444274902344, "global_step": 48670, "epoch": 1158} {"train_loss": -5.727898120880127, "global_step": 48671, "epoch": 1158} {"train_loss": -5.760710716247559, "global_step": 48672, "epoch": 1158} {"train_loss": -5.756025791168213, "global_step": 48673, "epoch": 1158} {"train_loss": -5.748995304107666, "global_step": 48674, "epoch": 1158} {"train_loss": -5.75708532333374, "global_step": 48675, "epoch": 1158} {"train_loss": -5.774582862854004, "global_step": 48676, "epoch": 1158} {"train_loss": -5.753069423493885, "global_step": 48677, "epoch": 1158, "val_loss": 61646.80078125} {"train_loss": -5.747171401977539, "global_step": 48678, "epoch": 1159} {"train_loss": -5.723114967346191, "global_step": 48679, "epoch": 1159} {"train_loss": -5.76882266998291, "global_step": 48680, "epoch": 1159} {"train_loss": -5.6690874099731445, "global_step": 48681, "epoch": 1159} {"train_loss": -5.651729583740234, "global_step": 48682, "epoch": 1159} {"train_loss": -5.654000282287598, "global_step": 48683, "epoch": 1159} {"train_loss": -5.793208122253418, "global_step": 48684, "epoch": 1159} {"train_loss": -5.734678268432617, "global_step": 48685, "epoch": 1159} {"train_loss": -5.798096656799316, "global_step": 48686, "epoch": 1159} {"train_loss": -5.790342330932617, "global_step": 48687, "epoch": 1159} {"train_loss": -5.804888725280762, "global_step": 48688, "epoch": 1159} {"train_loss": -5.772078514099121, "global_step": 48689, "epoch": 1159} {"train_loss": -5.859680652618408, "global_step": 48690, "epoch": 1159} {"train_loss": -5.873619079589844, "global_step": 48691, "epoch": 1159} {"train_loss": -5.825680732727051, "global_step": 48692, "epoch": 1159} {"train_loss": -5.746336460113525, "global_step": 48693, "epoch": 1159} {"train_loss": -5.7227559089660645, "global_step": 48694, "epoch": 1159} {"train_loss": -5.801980018615723, "global_step": 48695, "epoch": 1159} {"train_loss": -5.75526237487793, "global_step": 48696, "epoch": 1159} {"train_loss": -5.820321083068848, "global_step": 48697, "epoch": 1159} {"train_loss": -5.757324695587158, "global_step": 48698, "epoch": 1159} {"train_loss": -5.804010391235352, "global_step": 48699, "epoch": 1159} {"train_loss": -5.710879802703857, "global_step": 48700, "epoch": 1159} {"train_loss": -5.809979438781738, "global_step": 48701, "epoch": 1159} {"train_loss": -5.793520927429199, "global_step": 48702, "epoch": 1159} {"train_loss": -5.79460334777832, "global_step": 48703, "epoch": 1159} {"train_loss": -5.710039138793945, "global_step": 48704, "epoch": 1159} {"train_loss": -5.7685747146606445, "global_step": 48705, "epoch": 1159} {"train_loss": -5.677194595336914, "global_step": 48706, "epoch": 1159} {"train_loss": -5.582690238952637, "global_step": 48707, "epoch": 1159} {"train_loss": -5.728842735290527, "global_step": 48708, "epoch": 1159} {"train_loss": -5.715906143188477, "global_step": 48709, "epoch": 1159} {"train_loss": -5.694937705993652, "global_step": 48710, "epoch": 1159} {"train_loss": -5.803374767303467, "global_step": 48711, "epoch": 1159} {"train_loss": -5.734493255615234, "global_step": 48712, "epoch": 1159} {"train_loss": -5.7956342697143555, "global_step": 48713, "epoch": 1159} {"train_loss": -5.768516540527344, "global_step": 48714, "epoch": 1159} {"train_loss": -5.721735954284668, "global_step": 48715, "epoch": 1159} {"train_loss": -5.767512321472168, "global_step": 48716, "epoch": 1159} {"train_loss": -5.641351699829102, "global_step": 48717, "epoch": 1159} {"train_loss": -5.790046691894531, "global_step": 48718, "epoch": 1159} {"train_loss": -5.754083429064069, "global_step": 48719, "epoch": 1159, "val_loss": 61766.65234375} {"train_loss": -5.746630668640137, "global_step": 48720, "epoch": 1160} {"train_loss": -5.801701545715332, "global_step": 48721, "epoch": 1160} {"train_loss": -5.771402359008789, "global_step": 48722, "epoch": 1160} {"train_loss": -5.702582359313965, "global_step": 48723, "epoch": 1160} {"train_loss": -5.736352920532227, "global_step": 48724, "epoch": 1160} {"train_loss": -5.661501884460449, "global_step": 48725, "epoch": 1160} {"train_loss": -5.851512432098389, "global_step": 48726, "epoch": 1160} {"train_loss": -5.804289817810059, "global_step": 48727, "epoch": 1160} {"train_loss": -5.773805618286133, "global_step": 48728, "epoch": 1160} {"train_loss": -5.811868667602539, "global_step": 48729, "epoch": 1160} {"train_loss": -5.821193695068359, "global_step": 48730, "epoch": 1160} {"train_loss": -5.732416152954102, "global_step": 48731, "epoch": 1160} {"train_loss": -5.710014343261719, "global_step": 48732, "epoch": 1160} {"train_loss": -5.62882661819458, "global_step": 48733, "epoch": 1160} {"train_loss": -5.771976470947266, "global_step": 48734, "epoch": 1160} {"train_loss": -5.779880523681641, "global_step": 48735, "epoch": 1160} {"train_loss": -5.816357612609863, "global_step": 48736, "epoch": 1160} {"train_loss": -5.797719955444336, "global_step": 48737, "epoch": 1160} {"train_loss": -5.760289192199707, "global_step": 48738, "epoch": 1160} {"train_loss": -5.671014785766602, "global_step": 48739, "epoch": 1160} {"train_loss": -5.742063522338867, "global_step": 48740, "epoch": 1160} {"train_loss": -5.783577919006348, "global_step": 48741, "epoch": 1160} {"train_loss": -5.750511169433594, "global_step": 48742, "epoch": 1160} {"train_loss": -5.873909950256348, "global_step": 48743, "epoch": 1160} {"train_loss": -5.812723159790039, "global_step": 48744, "epoch": 1160} {"train_loss": -5.77359676361084, "global_step": 48745, "epoch": 1160} {"train_loss": -5.820481300354004, "global_step": 48746, "epoch": 1160} {"train_loss": -5.751026630401611, "global_step": 48747, "epoch": 1160} {"train_loss": -5.837217330932617, "global_step": 48748, "epoch": 1160} {"train_loss": -5.808807373046875, "global_step": 48749, "epoch": 1160} {"train_loss": -5.655766010284424, "global_step": 48750, "epoch": 1160} {"train_loss": -5.648643493652344, "global_step": 48751, "epoch": 1160} {"train_loss": -5.791262626647949, "global_step": 48752, "epoch": 1160} {"train_loss": -5.64806604385376, "global_step": 48753, "epoch": 1160} {"train_loss": -5.733299255371094, "global_step": 48754, "epoch": 1160} {"train_loss": -5.673331260681152, "global_step": 48755, "epoch": 1160} {"train_loss": -5.7468132972717285, "global_step": 48756, "epoch": 1160} {"train_loss": -5.890531539916992, "global_step": 48757, "epoch": 1160} {"train_loss": -5.607285976409912, "global_step": 48758, "epoch": 1160} {"train_loss": -5.7398786544799805, "global_step": 48759, "epoch": 1160} {"train_loss": -5.7160491943359375, "global_step": 48760, "epoch": 1160} {"train_loss": -5.754976749420166, "global_step": 48761, "epoch": 1160, "val_loss": 61390.88671875} {"train_loss": -5.676798343658447, "global_step": 48762, "epoch": 1161} {"train_loss": -5.67617654800415, "global_step": 48763, "epoch": 1161} {"train_loss": -5.759100914001465, "global_step": 48764, "epoch": 1161} {"train_loss": -5.82051420211792, "global_step": 48765, "epoch": 1161} {"train_loss": -5.8530497550964355, "global_step": 48766, "epoch": 1161} {"train_loss": -5.773852348327637, "global_step": 48767, "epoch": 1161} {"train_loss": -5.791114330291748, "global_step": 48768, "epoch": 1161} {"train_loss": -5.767980098724365, "global_step": 48769, "epoch": 1161} {"train_loss": -5.850526332855225, "global_step": 48770, "epoch": 1161} {"train_loss": -5.697604179382324, "global_step": 48771, "epoch": 1161} {"train_loss": -5.7850542068481445, "global_step": 48772, "epoch": 1161} {"train_loss": -5.744329452514648, "global_step": 48773, "epoch": 1161} {"train_loss": -5.756616592407227, "global_step": 48774, "epoch": 1161} {"train_loss": -5.750765800476074, "global_step": 48775, "epoch": 1161} {"train_loss": -5.778782367706299, "global_step": 48776, "epoch": 1161} {"train_loss": -5.720325469970703, "global_step": 48777, "epoch": 1161} {"train_loss": -5.741768836975098, "global_step": 48778, "epoch": 1161} {"train_loss": -5.793062210083008, "global_step": 48779, "epoch": 1161} {"train_loss": -5.743359565734863, "global_step": 48780, "epoch": 1161} {"train_loss": -5.702785491943359, "global_step": 48781, "epoch": 1161} {"train_loss": -5.80311393737793, "global_step": 48782, "epoch": 1161} {"train_loss": -5.726489543914795, "global_step": 48783, "epoch": 1161} {"train_loss": -5.750735759735107, "global_step": 48784, "epoch": 1161} {"train_loss": -5.85610294342041, "global_step": 48785, "epoch": 1161} {"train_loss": -5.742961883544922, "global_step": 48786, "epoch": 1161} {"train_loss": -5.835299491882324, "global_step": 48787, "epoch": 1161} {"train_loss": -5.737851619720459, "global_step": 48788, "epoch": 1161} {"train_loss": -5.797354698181152, "global_step": 48789, "epoch": 1161} {"train_loss": -5.687881946563721, "global_step": 48790, "epoch": 1161} {"train_loss": -5.685634613037109, "global_step": 48791, "epoch": 1161} {"train_loss": -5.760991096496582, "global_step": 48792, "epoch": 1161} {"train_loss": -5.832345485687256, "global_step": 48793, "epoch": 1161} {"train_loss": -5.779522895812988, "global_step": 48794, "epoch": 1161} {"train_loss": -5.694827556610107, "global_step": 48795, "epoch": 1161} {"train_loss": -5.762977123260498, "global_step": 48796, "epoch": 1161} {"train_loss": -5.919205665588379, "global_step": 48797, "epoch": 1161} {"train_loss": -5.707744598388672, "global_step": 48798, "epoch": 1161} {"train_loss": -5.805755138397217, "global_step": 48799, "epoch": 1161} {"train_loss": -5.819332122802734, "global_step": 48800, "epoch": 1161} {"train_loss": -5.747749328613281, "global_step": 48801, "epoch": 1161} {"train_loss": -5.792231559753418, "global_step": 48802, "epoch": 1161} {"train_loss": -5.769142763955252, "global_step": 48803, "epoch": 1161, "val_loss": 61543.35546875} {"train_loss": -5.884395599365234, "global_step": 48804, "epoch": 1162} {"train_loss": -5.763158798217773, "global_step": 48805, "epoch": 1162} {"train_loss": -5.684589862823486, "global_step": 48806, "epoch": 1162} {"train_loss": -5.804318428039551, "global_step": 48807, "epoch": 1162} {"train_loss": -5.705991744995117, "global_step": 48808, "epoch": 1162} {"train_loss": -5.889318466186523, "global_step": 48809, "epoch": 1162} {"train_loss": -5.753432750701904, "global_step": 48810, "epoch": 1162} {"train_loss": -5.681394100189209, "global_step": 48811, "epoch": 1162} {"train_loss": -5.75279426574707, "global_step": 48812, "epoch": 1162} {"train_loss": -5.769824981689453, "global_step": 48813, "epoch": 1162} {"train_loss": -5.80763053894043, "global_step": 48814, "epoch": 1162} {"train_loss": -5.868732452392578, "global_step": 48815, "epoch": 1162} {"train_loss": -5.812564849853516, "global_step": 48816, "epoch": 1162} {"train_loss": -5.839822292327881, "global_step": 48817, "epoch": 1162} {"train_loss": -5.780547618865967, "global_step": 48818, "epoch": 1162} {"train_loss": -5.751654624938965, "global_step": 48819, "epoch": 1162} {"train_loss": -5.70998477935791, "global_step": 48820, "epoch": 1162} {"train_loss": -5.813673973083496, "global_step": 48821, "epoch": 1162} {"train_loss": -5.816061973571777, "global_step": 48822, "epoch": 1162} {"train_loss": -5.74772834777832, "global_step": 48823, "epoch": 1162} {"train_loss": -5.759463310241699, "global_step": 48824, "epoch": 1162} {"train_loss": -5.785295486450195, "global_step": 48825, "epoch": 1162} {"train_loss": -5.761613845825195, "global_step": 48826, "epoch": 1162} {"train_loss": -5.7584333419799805, "global_step": 48827, "epoch": 1162} {"train_loss": -5.889031410217285, "global_step": 48828, "epoch": 1162} {"train_loss": -5.761559009552002, "global_step": 48829, "epoch": 1162} {"train_loss": -5.945138931274414, "global_step": 48830, "epoch": 1162} {"train_loss": -5.817216873168945, "global_step": 48831, "epoch": 1162} {"train_loss": -5.840960502624512, "global_step": 48832, "epoch": 1162} {"train_loss": -5.781500339508057, "global_step": 48833, "epoch": 1162} {"train_loss": -5.793792724609375, "global_step": 48834, "epoch": 1162} {"train_loss": -5.794118881225586, "global_step": 48835, "epoch": 1162} {"train_loss": -5.798360824584961, "global_step": 48836, "epoch": 1162} {"train_loss": -5.84487771987915, "global_step": 48837, "epoch": 1162} {"train_loss": -5.712596893310547, "global_step": 48838, "epoch": 1162} {"train_loss": -5.772879600524902, "global_step": 48839, "epoch": 1162} {"train_loss": -5.745756149291992, "global_step": 48840, "epoch": 1162} {"train_loss": -5.757159233093262, "global_step": 48841, "epoch": 1162} {"train_loss": -5.709701061248779, "global_step": 48842, "epoch": 1162} {"train_loss": -5.866741180419922, "global_step": 48843, "epoch": 1162} {"train_loss": -5.68498420715332, "global_step": 48844, "epoch": 1162} {"train_loss": -5.784278699329922, "global_step": 48845, "epoch": 1162, "val_loss": 61750.61328125} {"train_loss": -5.854068756103516, "global_step": 48846, "epoch": 1163} {"train_loss": -5.745756149291992, "global_step": 48847, "epoch": 1163} {"train_loss": -5.612102508544922, "global_step": 48848, "epoch": 1163} {"train_loss": -5.700937271118164, "global_step": 48849, "epoch": 1163} {"train_loss": -5.802906036376953, "global_step": 48850, "epoch": 1163} {"train_loss": -5.805717468261719, "global_step": 48851, "epoch": 1163} {"train_loss": -5.698512077331543, "global_step": 48852, "epoch": 1163} {"train_loss": -5.696643829345703, "global_step": 48853, "epoch": 1163} {"train_loss": -5.752571105957031, "global_step": 48854, "epoch": 1163} {"train_loss": -5.729578018188477, "global_step": 48855, "epoch": 1163} {"train_loss": -5.920258045196533, "global_step": 48856, "epoch": 1163} {"train_loss": -5.598394393920898, "global_step": 48857, "epoch": 1163} {"train_loss": -5.748984336853027, "global_step": 48858, "epoch": 1163} {"train_loss": -5.754056930541992, "global_step": 48859, "epoch": 1163} {"train_loss": -5.6281633377075195, "global_step": 48860, "epoch": 1163} {"train_loss": -5.792946815490723, "global_step": 48861, "epoch": 1163} {"train_loss": -5.658787250518799, "global_step": 48862, "epoch": 1163} {"train_loss": -5.739717483520508, "global_step": 48863, "epoch": 1163} {"train_loss": -5.791483402252197, "global_step": 48864, "epoch": 1163} {"train_loss": -5.6290435791015625, "global_step": 48865, "epoch": 1163} {"train_loss": -5.848566055297852, "global_step": 48866, "epoch": 1163} {"train_loss": -5.801258087158203, "global_step": 48867, "epoch": 1163} {"train_loss": -5.597769737243652, "global_step": 48868, "epoch": 1163} {"train_loss": -5.8292341232299805, "global_step": 48869, "epoch": 1163} {"train_loss": -5.676117897033691, "global_step": 48870, "epoch": 1163} {"train_loss": -5.641439437866211, "global_step": 48871, "epoch": 1163} {"train_loss": -5.785286903381348, "global_step": 48872, "epoch": 1163} {"train_loss": -5.60454797744751, "global_step": 48873, "epoch": 1163} {"train_loss": -5.832901477813721, "global_step": 48874, "epoch": 1163} {"train_loss": -5.749824523925781, "global_step": 48875, "epoch": 1163} {"train_loss": -5.738535404205322, "global_step": 48876, "epoch": 1163} {"train_loss": -5.810915946960449, "global_step": 48877, "epoch": 1163} {"train_loss": -5.7309794425964355, "global_step": 48878, "epoch": 1163} {"train_loss": -5.691554069519043, "global_step": 48879, "epoch": 1163} {"train_loss": -5.611408233642578, "global_step": 48880, "epoch": 1163} {"train_loss": -5.702599048614502, "global_step": 48881, "epoch": 1163} {"train_loss": -5.7141923904418945, "global_step": 48882, "epoch": 1163} {"train_loss": -5.712935447692871, "global_step": 48883, "epoch": 1163} {"train_loss": -5.702361583709717, "global_step": 48884, "epoch": 1163} {"train_loss": -5.7614850997924805, "global_step": 48885, "epoch": 1163} {"train_loss": -5.76959228515625, "global_step": 48886, "epoch": 1163} {"train_loss": -5.728539137613206, "global_step": 48887, "epoch": 1163, "val_loss": 61630.765625} {"train_loss": -5.818789482116699, "global_step": 48888, "epoch": 1164} {"train_loss": -5.699403762817383, "global_step": 48889, "epoch": 1164} {"train_loss": -5.7943339347839355, "global_step": 48890, "epoch": 1164} {"train_loss": -5.653276443481445, "global_step": 48891, "epoch": 1164} {"train_loss": -5.673306941986084, "global_step": 48892, "epoch": 1164} {"train_loss": -5.701401233673096, "global_step": 48893, "epoch": 1164} {"train_loss": -5.664397716522217, "global_step": 48894, "epoch": 1164} {"train_loss": -5.736045837402344, "global_step": 48895, "epoch": 1164} {"train_loss": -5.6978302001953125, "global_step": 48896, "epoch": 1164} {"train_loss": -5.58512020111084, "global_step": 48897, "epoch": 1164} {"train_loss": -5.84107780456543, "global_step": 48898, "epoch": 1164} {"train_loss": -5.729358673095703, "global_step": 48899, "epoch": 1164} {"train_loss": -5.746055603027344, "global_step": 48900, "epoch": 1164} {"train_loss": -5.829031944274902, "global_step": 48901, "epoch": 1164} {"train_loss": -5.798674583435059, "global_step": 48902, "epoch": 1164} {"train_loss": -5.73245906829834, "global_step": 48903, "epoch": 1164} {"train_loss": -5.665594100952148, "global_step": 48904, "epoch": 1164} {"train_loss": -5.867769718170166, "global_step": 48905, "epoch": 1164} {"train_loss": -5.774308204650879, "global_step": 48906, "epoch": 1164} {"train_loss": -5.6503071784973145, "global_step": 48907, "epoch": 1164} {"train_loss": -5.7619476318359375, "global_step": 48908, "epoch": 1164} {"train_loss": -5.7082133293151855, "global_step": 48909, "epoch": 1164} {"train_loss": -5.819592475891113, "global_step": 48910, "epoch": 1164} {"train_loss": -5.787162780761719, "global_step": 48911, "epoch": 1164} {"train_loss": -5.784700870513916, "global_step": 48912, "epoch": 1164} {"train_loss": -5.6827216148376465, "global_step": 48913, "epoch": 1164} {"train_loss": -5.6610260009765625, "global_step": 48914, "epoch": 1164} {"train_loss": -5.80966329574585, "global_step": 48915, "epoch": 1164} {"train_loss": -5.822004318237305, "global_step": 48916, "epoch": 1164} {"train_loss": -5.7642927169799805, "global_step": 48917, "epoch": 1164} {"train_loss": -5.806573390960693, "global_step": 48918, "epoch": 1164} {"train_loss": -5.8001556396484375, "global_step": 48919, "epoch": 1164} {"train_loss": -5.703469276428223, "global_step": 48920, "epoch": 1164} {"train_loss": -5.699613571166992, "global_step": 48921, "epoch": 1164} {"train_loss": -5.798236846923828, "global_step": 48922, "epoch": 1164} {"train_loss": -5.63672399520874, "global_step": 48923, "epoch": 1164} {"train_loss": -5.735784530639648, "global_step": 48924, "epoch": 1164} {"train_loss": -5.7429938316345215, "global_step": 48925, "epoch": 1164} {"train_loss": -5.77717924118042, "global_step": 48926, "epoch": 1164} {"train_loss": -5.775619983673096, "global_step": 48927, "epoch": 1164} {"train_loss": -5.688784599304199, "global_step": 48928, "epoch": 1164} {"train_loss": -5.743041697002592, "global_step": 48929, "epoch": 1164, "val_loss": 61601.73046875} {"train_loss": -5.6830525398254395, "global_step": 48930, "epoch": 1165} {"train_loss": -5.693599700927734, "global_step": 48931, "epoch": 1165} {"train_loss": -5.797102928161621, "global_step": 48932, "epoch": 1165} {"train_loss": -5.782535552978516, "global_step": 48933, "epoch": 1165} {"train_loss": -5.812593460083008, "global_step": 48934, "epoch": 1165} {"train_loss": -5.806848049163818, "global_step": 48935, "epoch": 1165} {"train_loss": -5.770606994628906, "global_step": 48936, "epoch": 1165} {"train_loss": -5.731624603271484, "global_step": 48937, "epoch": 1165} {"train_loss": -5.732717037200928, "global_step": 48938, "epoch": 1165} {"train_loss": -5.723590850830078, "global_step": 48939, "epoch": 1165} {"train_loss": -5.955284118652344, "global_step": 48940, "epoch": 1165} {"train_loss": -5.723398208618164, "global_step": 48941, "epoch": 1165} {"train_loss": -5.6784749031066895, "global_step": 48942, "epoch": 1165} {"train_loss": -5.850947856903076, "global_step": 48943, "epoch": 1165} {"train_loss": -5.78389835357666, "global_step": 48944, "epoch": 1165} {"train_loss": -5.850940704345703, "global_step": 48945, "epoch": 1165} {"train_loss": -5.7134270668029785, "global_step": 48946, "epoch": 1165} {"train_loss": -5.75141716003418, "global_step": 48947, "epoch": 1165} {"train_loss": -5.785737037658691, "global_step": 48948, "epoch": 1165} {"train_loss": -5.687504291534424, "global_step": 48949, "epoch": 1165} {"train_loss": -5.850250244140625, "global_step": 48950, "epoch": 1165} {"train_loss": -5.755670070648193, "global_step": 48951, "epoch": 1165} {"train_loss": -5.758182525634766, "global_step": 48952, "epoch": 1165} {"train_loss": -5.875683307647705, "global_step": 48953, "epoch": 1165} {"train_loss": -5.703029155731201, "global_step": 48954, "epoch": 1165} {"train_loss": -5.679525375366211, "global_step": 48955, "epoch": 1165} {"train_loss": -5.766343116760254, "global_step": 48956, "epoch": 1165} {"train_loss": -5.7424516677856445, "global_step": 48957, "epoch": 1165} {"train_loss": -5.726555347442627, "global_step": 48958, "epoch": 1165} {"train_loss": -5.752476692199707, "global_step": 48959, "epoch": 1165} {"train_loss": -5.810781478881836, "global_step": 48960, "epoch": 1165} {"train_loss": -5.786103248596191, "global_step": 48961, "epoch": 1165} {"train_loss": -5.786725997924805, "global_step": 48962, "epoch": 1165} {"train_loss": -5.694388389587402, "global_step": 48963, "epoch": 1165} {"train_loss": -5.848937034606934, "global_step": 48964, "epoch": 1165} {"train_loss": -5.834113121032715, "global_step": 48965, "epoch": 1165} {"train_loss": -5.677139759063721, "global_step": 48966, "epoch": 1165} {"train_loss": -5.894465446472168, "global_step": 48967, "epoch": 1165} {"train_loss": -5.805168151855469, "global_step": 48968, "epoch": 1165} {"train_loss": -5.809082984924316, "global_step": 48969, "epoch": 1165} {"train_loss": -5.664979457855225, "global_step": 48970, "epoch": 1165} {"train_loss": -5.768562067122686, "global_step": 48971, "epoch": 1165, "val_loss": 61597.35546875} {"train_loss": -5.714231491088867, "global_step": 48972, "epoch": 1166} {"train_loss": -5.891280174255371, "global_step": 48973, "epoch": 1166} {"train_loss": -5.77204704284668, "global_step": 48974, "epoch": 1166} {"train_loss": -5.884657859802246, "global_step": 48975, "epoch": 1166} {"train_loss": -5.829641342163086, "global_step": 48976, "epoch": 1166} {"train_loss": -5.86029052734375, "global_step": 48977, "epoch": 1166} {"train_loss": -5.7475810050964355, "global_step": 48978, "epoch": 1166} {"train_loss": -5.856411933898926, "global_step": 48979, "epoch": 1166} {"train_loss": -5.845442295074463, "global_step": 48980, "epoch": 1166} {"train_loss": -5.756716728210449, "global_step": 48981, "epoch": 1166} {"train_loss": -5.693634986877441, "global_step": 48982, "epoch": 1166} {"train_loss": -5.865656852722168, "global_step": 48983, "epoch": 1166} {"train_loss": -5.793933868408203, "global_step": 48984, "epoch": 1166} {"train_loss": -5.774503707885742, "global_step": 48985, "epoch": 1166} {"train_loss": -5.656520843505859, "global_step": 48986, "epoch": 1166} {"train_loss": -5.8492631912231445, "global_step": 48987, "epoch": 1166} {"train_loss": -5.790322303771973, "global_step": 48988, "epoch": 1166} {"train_loss": -5.734683990478516, "global_step": 48989, "epoch": 1166} {"train_loss": -5.569951057434082, "global_step": 48990, "epoch": 1166} {"train_loss": -5.773838996887207, "global_step": 48991, "epoch": 1166} {"train_loss": -5.5832695960998535, "global_step": 48992, "epoch": 1166} {"train_loss": -5.619278430938721, "global_step": 48993, "epoch": 1166} {"train_loss": -5.861439228057861, "global_step": 48994, "epoch": 1166} {"train_loss": -5.721773147583008, "global_step": 48995, "epoch": 1166} {"train_loss": -5.768590927124023, "global_step": 48996, "epoch": 1166} {"train_loss": -5.656737327575684, "global_step": 48997, "epoch": 1166} {"train_loss": -5.796847343444824, "global_step": 48998, "epoch": 1166} {"train_loss": -5.80418586730957, "global_step": 48999, "epoch": 1166} {"train_loss": -5.925893306732178, "global_step": 49000, "epoch": 1166} {"train_loss": -5.7566938400268555, "global_step": 49001, "epoch": 1166} {"train_loss": -5.738828182220459, "global_step": 49002, "epoch": 1166} {"train_loss": -5.801011562347412, "global_step": 49003, "epoch": 1166} {"train_loss": -5.7919921875, "global_step": 49004, "epoch": 1166} {"train_loss": -5.814887523651123, "global_step": 49005, "epoch": 1166} {"train_loss": -5.683051109313965, "global_step": 49006, "epoch": 1166} {"train_loss": -5.868966579437256, "global_step": 49007, "epoch": 1166} {"train_loss": -5.830545425415039, "global_step": 49008, "epoch": 1166} {"train_loss": -5.752788543701172, "global_step": 49009, "epoch": 1166} {"train_loss": -5.662550926208496, "global_step": 49010, "epoch": 1166} {"train_loss": -5.74386739730835, "global_step": 49011, "epoch": 1166} {"train_loss": -5.775233268737793, "global_step": 49012, "epoch": 1166} {"train_loss": -5.770573286783128, "global_step": 49013, "epoch": 1166, "val_loss": 61715.59375} {"train_loss": -5.702585697174072, "global_step": 49014, "epoch": 1167} {"train_loss": -5.715336799621582, "global_step": 49015, "epoch": 1167} {"train_loss": -5.899198532104492, "global_step": 49016, "epoch": 1167} {"train_loss": -5.750539779663086, "global_step": 49017, "epoch": 1167} {"train_loss": -5.671348571777344, "global_step": 49018, "epoch": 1167} {"train_loss": -5.818024635314941, "global_step": 49019, "epoch": 1167} {"train_loss": -5.788537502288818, "global_step": 49020, "epoch": 1167} {"train_loss": -5.66312837600708, "global_step": 49021, "epoch": 1167} {"train_loss": -5.723942756652832, "global_step": 49022, "epoch": 1167} {"train_loss": -5.687676906585693, "global_step": 49023, "epoch": 1167} {"train_loss": -5.802064895629883, "global_step": 49024, "epoch": 1167} {"train_loss": -5.648595809936523, "global_step": 49025, "epoch": 1167} {"train_loss": -5.734698295593262, "global_step": 49026, "epoch": 1167} {"train_loss": -5.463050365447998, "global_step": 49027, "epoch": 1167} {"train_loss": -5.695195198059082, "global_step": 49028, "epoch": 1167} {"train_loss": -5.676031112670898, "global_step": 49029, "epoch": 1167} {"train_loss": -5.559003829956055, "global_step": 49030, "epoch": 1167} {"train_loss": -5.613527297973633, "global_step": 49031, "epoch": 1167} {"train_loss": -5.732184410095215, "global_step": 49032, "epoch": 1167} {"train_loss": -5.566679000854492, "global_step": 49033, "epoch": 1167} {"train_loss": -5.635197639465332, "global_step": 49034, "epoch": 1167} {"train_loss": -5.683249473571777, "global_step": 49035, "epoch": 1167} {"train_loss": -5.69358491897583, "global_step": 49036, "epoch": 1167} {"train_loss": -5.687483787536621, "global_step": 49037, "epoch": 1167} {"train_loss": -5.713230133056641, "global_step": 49038, "epoch": 1167} {"train_loss": -5.614808082580566, "global_step": 49039, "epoch": 1167} {"train_loss": -5.730282306671143, "global_step": 49040, "epoch": 1167} {"train_loss": -5.704389572143555, "global_step": 49041, "epoch": 1167} {"train_loss": -5.789750099182129, "global_step": 49042, "epoch": 1167} {"train_loss": -5.707772254943848, "global_step": 49043, "epoch": 1167} {"train_loss": -5.682004928588867, "global_step": 49044, "epoch": 1167} {"train_loss": -5.806297302246094, "global_step": 49045, "epoch": 1167} {"train_loss": -5.629581451416016, "global_step": 49046, "epoch": 1167} {"train_loss": -5.791243553161621, "global_step": 49047, "epoch": 1167} {"train_loss": -5.735713005065918, "global_step": 49048, "epoch": 1167} {"train_loss": -5.831183910369873, "global_step": 49049, "epoch": 1167} {"train_loss": -5.809818744659424, "global_step": 49050, "epoch": 1167} {"train_loss": -5.745862007141113, "global_step": 49051, "epoch": 1167} {"train_loss": -5.889765739440918, "global_step": 49052, "epoch": 1167} {"train_loss": -5.7597503662109375, "global_step": 49053, "epoch": 1167} {"train_loss": -5.753792762756348, "global_step": 49054, "epoch": 1167} {"train_loss": -5.7137392702556795, "global_step": 49055, "epoch": 1167, "val_loss": 61686.80078125} {"train_loss": -5.76055908203125, "global_step": 49056, "epoch": 1168} {"train_loss": -5.715631484985352, "global_step": 49057, "epoch": 1168} {"train_loss": -5.73846960067749, "global_step": 49058, "epoch": 1168} {"train_loss": -5.841273307800293, "global_step": 49059, "epoch": 1168} {"train_loss": -5.834897041320801, "global_step": 49060, "epoch": 1168} {"train_loss": -5.855382442474365, "global_step": 49061, "epoch": 1168} {"train_loss": -5.719760894775391, "global_step": 49062, "epoch": 1168} {"train_loss": -5.642636299133301, "global_step": 49063, "epoch": 1168} {"train_loss": -5.656191825866699, "global_step": 49064, "epoch": 1168} {"train_loss": -5.781074523925781, "global_step": 49065, "epoch": 1168} {"train_loss": -5.688448905944824, "global_step": 49066, "epoch": 1168} {"train_loss": -5.758466720581055, "global_step": 49067, "epoch": 1168} {"train_loss": -5.7224297523498535, "global_step": 49068, "epoch": 1168} {"train_loss": -5.71036958694458, "global_step": 49069, "epoch": 1168} {"train_loss": -5.791321754455566, "global_step": 49070, "epoch": 1168} {"train_loss": -5.843820571899414, "global_step": 49071, "epoch": 1168} {"train_loss": -5.8989057540893555, "global_step": 49072, "epoch": 1168} {"train_loss": -5.818397045135498, "global_step": 49073, "epoch": 1168} {"train_loss": -5.868474006652832, "global_step": 49074, "epoch": 1168} {"train_loss": -5.76601505279541, "global_step": 49075, "epoch": 1168} {"train_loss": -5.738391876220703, "global_step": 49076, "epoch": 1168} {"train_loss": -5.893509864807129, "global_step": 49077, "epoch": 1168} {"train_loss": -5.730775356292725, "global_step": 49078, "epoch": 1168} {"train_loss": -5.680435657501221, "global_step": 49079, "epoch": 1168} {"train_loss": -5.779533386230469, "global_step": 49080, "epoch": 1168} {"train_loss": -5.654054164886475, "global_step": 49081, "epoch": 1168} {"train_loss": -5.698955059051514, "global_step": 49082, "epoch": 1168} {"train_loss": -5.766084671020508, "global_step": 49083, "epoch": 1168} {"train_loss": -5.6673078536987305, "global_step": 49084, "epoch": 1168} {"train_loss": -5.641653060913086, "global_step": 49085, "epoch": 1168} {"train_loss": -5.743185997009277, "global_step": 49086, "epoch": 1168} {"train_loss": -5.754880905151367, "global_step": 49087, "epoch": 1168} {"train_loss": -5.610599040985107, "global_step": 49088, "epoch": 1168} {"train_loss": -5.609238147735596, "global_step": 49089, "epoch": 1168} {"train_loss": -5.852106094360352, "global_step": 49090, "epoch": 1168} {"train_loss": -5.632277965545654, "global_step": 49091, "epoch": 1168} {"train_loss": -5.799949645996094, "global_step": 49092, "epoch": 1168} {"train_loss": -5.718982219696045, "global_step": 49093, "epoch": 1168} {"train_loss": -5.787823677062988, "global_step": 49094, "epoch": 1168} {"train_loss": -5.690707683563232, "global_step": 49095, "epoch": 1168} {"train_loss": -5.70110559463501, "global_step": 49096, "epoch": 1168} {"train_loss": -5.744408641542707, "global_step": 49097, "epoch": 1168, "val_loss": 62183.70703125} {"train_loss": -5.727493762969971, "global_step": 49098, "epoch": 1169} {"train_loss": -5.7209296226501465, "global_step": 49099, "epoch": 1169} {"train_loss": -5.640458106994629, "global_step": 49100, "epoch": 1169} {"train_loss": -5.78956413269043, "global_step": 49101, "epoch": 1169} {"train_loss": -5.727700233459473, "global_step": 49102, "epoch": 1169} {"train_loss": -5.674543380737305, "global_step": 49103, "epoch": 1169} {"train_loss": -5.817926406860352, "global_step": 49104, "epoch": 1169} {"train_loss": -5.726016044616699, "global_step": 49105, "epoch": 1169} {"train_loss": -5.8526716232299805, "global_step": 49106, "epoch": 1169} {"train_loss": -5.785315036773682, "global_step": 49107, "epoch": 1169} {"train_loss": -5.790937423706055, "global_step": 49108, "epoch": 1169} {"train_loss": -5.9307756423950195, "global_step": 49109, "epoch": 1169} {"train_loss": -5.74583625793457, "global_step": 49110, "epoch": 1169} {"train_loss": -5.672239303588867, "global_step": 49111, "epoch": 1169} {"train_loss": -5.880988121032715, "global_step": 49112, "epoch": 1169} {"train_loss": -5.783986568450928, "global_step": 49113, "epoch": 1169} {"train_loss": -5.726640701293945, "global_step": 49114, "epoch": 1169} {"train_loss": -5.786727428436279, "global_step": 49115, "epoch": 1169} {"train_loss": -5.745819091796875, "global_step": 49116, "epoch": 1169} {"train_loss": -5.701358318328857, "global_step": 49117, "epoch": 1169} {"train_loss": -5.772498607635498, "global_step": 49118, "epoch": 1169} {"train_loss": -5.729799747467041, "global_step": 49119, "epoch": 1169} {"train_loss": -5.795568943023682, "global_step": 49120, "epoch": 1169} {"train_loss": -5.823822021484375, "global_step": 49121, "epoch": 1169} {"train_loss": -5.756980895996094, "global_step": 49122, "epoch": 1169} {"train_loss": -5.654693603515625, "global_step": 49123, "epoch": 1169} {"train_loss": -5.7153000831604, "global_step": 49124, "epoch": 1169} {"train_loss": -5.813528060913086, "global_step": 49125, "epoch": 1169} {"train_loss": -5.684178352355957, "global_step": 49126, "epoch": 1169} {"train_loss": -5.741881370544434, "global_step": 49127, "epoch": 1169} {"train_loss": -5.758159637451172, "global_step": 49128, "epoch": 1169} {"train_loss": -5.707592964172363, "global_step": 49129, "epoch": 1169} {"train_loss": -5.789491653442383, "global_step": 49130, "epoch": 1169} {"train_loss": -5.777561187744141, "global_step": 49131, "epoch": 1169} {"train_loss": -5.8101806640625, "global_step": 49132, "epoch": 1169} {"train_loss": -5.732590675354004, "global_step": 49133, "epoch": 1169} {"train_loss": -5.7533111572265625, "global_step": 49134, "epoch": 1169} {"train_loss": -5.653876304626465, "global_step": 49135, "epoch": 1169} {"train_loss": -5.822107315063477, "global_step": 49136, "epoch": 1169} {"train_loss": -5.870141983032227, "global_step": 49137, "epoch": 1169} {"train_loss": -5.680203437805176, "global_step": 49138, "epoch": 1169} {"train_loss": -5.760259809948149, "global_step": 49139, "epoch": 1169, "val_loss": 61502.19921875} {"train_loss": -5.820380210876465, "global_step": 49140, "epoch": 1170} {"train_loss": -5.673340797424316, "global_step": 49141, "epoch": 1170} {"train_loss": -5.770212650299072, "global_step": 49142, "epoch": 1170} {"train_loss": -5.72637939453125, "global_step": 49143, "epoch": 1170} {"train_loss": -5.913392543792725, "global_step": 49144, "epoch": 1170} {"train_loss": -5.705349922180176, "global_step": 49145, "epoch": 1170} {"train_loss": -5.581662654876709, "global_step": 49146, "epoch": 1170} {"train_loss": -5.682718276977539, "global_step": 49147, "epoch": 1170} {"train_loss": -5.776142597198486, "global_step": 49148, "epoch": 1170} {"train_loss": -5.702732086181641, "global_step": 49149, "epoch": 1170} {"train_loss": -5.680791854858398, "global_step": 49150, "epoch": 1170} {"train_loss": -5.737915992736816, "global_step": 49151, "epoch": 1170} {"train_loss": -5.82167387008667, "global_step": 49152, "epoch": 1170} {"train_loss": -5.769570350646973, "global_step": 49153, "epoch": 1170} {"train_loss": -5.896510124206543, "global_step": 49154, "epoch": 1170} {"train_loss": -5.833510398864746, "global_step": 49155, "epoch": 1170} {"train_loss": -5.782027721405029, "global_step": 49156, "epoch": 1170} {"train_loss": -5.7770538330078125, "global_step": 49157, "epoch": 1170} {"train_loss": -5.631389617919922, "global_step": 49158, "epoch": 1170} {"train_loss": -5.715658664703369, "global_step": 49159, "epoch": 1170} {"train_loss": -5.772834777832031, "global_step": 49160, "epoch": 1170} {"train_loss": -5.786843299865723, "global_step": 49161, "epoch": 1170} {"train_loss": -5.82010555267334, "global_step": 49162, "epoch": 1170} {"train_loss": -5.610665321350098, "global_step": 49163, "epoch": 1170} {"train_loss": -5.773715972900391, "global_step": 49164, "epoch": 1170} {"train_loss": -5.684502601623535, "global_step": 49165, "epoch": 1170} {"train_loss": -5.859870433807373, "global_step": 49166, "epoch": 1170} {"train_loss": -5.746471405029297, "global_step": 49167, "epoch": 1170} {"train_loss": -5.727892875671387, "global_step": 49168, "epoch": 1170} {"train_loss": -5.7603349685668945, "global_step": 49169, "epoch": 1170} {"train_loss": -5.839138031005859, "global_step": 49170, "epoch": 1170} {"train_loss": -5.628425598144531, "global_step": 49171, "epoch": 1170} {"train_loss": -5.731164932250977, "global_step": 49172, "epoch": 1170} {"train_loss": -5.724081993103027, "global_step": 49173, "epoch": 1170} {"train_loss": -5.708619117736816, "global_step": 49174, "epoch": 1170} {"train_loss": -5.731363296508789, "global_step": 49175, "epoch": 1170} {"train_loss": -5.5661773681640625, "global_step": 49176, "epoch": 1170} {"train_loss": -5.694824695587158, "global_step": 49177, "epoch": 1170} {"train_loss": -5.64547872543335, "global_step": 49178, "epoch": 1170} {"train_loss": -5.682539939880371, "global_step": 49179, "epoch": 1170} {"train_loss": -5.706545829772949, "global_step": 49180, "epoch": 1170} {"train_loss": -5.734408560253325, "global_step": 49181, "epoch": 1170, "val_loss": 61626.6953125} {"train_loss": -5.773934364318848, "global_step": 49182, "epoch": 1171} {"train_loss": -5.616360664367676, "global_step": 49183, "epoch": 1171} {"train_loss": -5.809012413024902, "global_step": 49184, "epoch": 1171} {"train_loss": -5.63902473449707, "global_step": 49185, "epoch": 1171} {"train_loss": -5.808674335479736, "global_step": 49186, "epoch": 1171} {"train_loss": -5.772650718688965, "global_step": 49187, "epoch": 1171} {"train_loss": -5.621757507324219, "global_step": 49188, "epoch": 1171} {"train_loss": -5.704438209533691, "global_step": 49189, "epoch": 1171} {"train_loss": -5.718271255493164, "global_step": 49190, "epoch": 1171} {"train_loss": -5.807567596435547, "global_step": 49191, "epoch": 1171} {"train_loss": -5.706881999969482, "global_step": 49192, "epoch": 1171} {"train_loss": -5.752757549285889, "global_step": 49193, "epoch": 1171} {"train_loss": -5.64677619934082, "global_step": 49194, "epoch": 1171} {"train_loss": -5.689230442047119, "global_step": 49195, "epoch": 1171} {"train_loss": -5.660384654998779, "global_step": 49196, "epoch": 1171} {"train_loss": -5.6860551834106445, "global_step": 49197, "epoch": 1171} {"train_loss": -5.581918716430664, "global_step": 49198, "epoch": 1171} {"train_loss": -5.750927925109863, "global_step": 49199, "epoch": 1171} {"train_loss": -5.739857196807861, "global_step": 49200, "epoch": 1171} {"train_loss": -5.795292377471924, "global_step": 49201, "epoch": 1171} {"train_loss": -5.640818119049072, "global_step": 49202, "epoch": 1171} {"train_loss": -5.576563835144043, "global_step": 49203, "epoch": 1171} {"train_loss": -5.8037872314453125, "global_step": 49204, "epoch": 1171} {"train_loss": -5.568079948425293, "global_step": 49205, "epoch": 1171} {"train_loss": -5.617889881134033, "global_step": 49206, "epoch": 1171} {"train_loss": -5.740667819976807, "global_step": 49207, "epoch": 1171} {"train_loss": -5.703014373779297, "global_step": 49208, "epoch": 1171} {"train_loss": -5.656303405761719, "global_step": 49209, "epoch": 1171} {"train_loss": -5.7370381355285645, "global_step": 49210, "epoch": 1171} {"train_loss": -5.666922569274902, "global_step": 49211, "epoch": 1171} {"train_loss": -5.751012325286865, "global_step": 49212, "epoch": 1171} {"train_loss": -5.6168437004089355, "global_step": 49213, "epoch": 1171} {"train_loss": -5.730072498321533, "global_step": 49214, "epoch": 1171} {"train_loss": -5.601412773132324, "global_step": 49215, "epoch": 1171} {"train_loss": -5.535409450531006, "global_step": 49216, "epoch": 1171} {"train_loss": -5.707888603210449, "global_step": 49217, "epoch": 1171} {"train_loss": -5.5921831130981445, "global_step": 49218, "epoch": 1171} {"train_loss": -5.680779933929443, "global_step": 49219, "epoch": 1171} {"train_loss": -5.703495979309082, "global_step": 49220, "epoch": 1171} {"train_loss": -5.8415656089782715, "global_step": 49221, "epoch": 1171} {"train_loss": -5.596950531005859, "global_step": 49222, "epoch": 1171} {"train_loss": -5.690867151532855, "global_step": 49223, "epoch": 1171, "val_loss": 61968.734375} {"train_loss": -5.587608337402344, "global_step": 49224, "epoch": 1172} {"train_loss": -5.655587196350098, "global_step": 49225, "epoch": 1172} {"train_loss": -5.72261905670166, "global_step": 49226, "epoch": 1172} {"train_loss": -5.780254364013672, "global_step": 49227, "epoch": 1172} {"train_loss": -5.599006175994873, "global_step": 49228, "epoch": 1172} {"train_loss": -5.723738193511963, "global_step": 49229, "epoch": 1172} {"train_loss": -5.595302581787109, "global_step": 49230, "epoch": 1172} {"train_loss": -5.838379383087158, "global_step": 49231, "epoch": 1172} {"train_loss": -5.672092437744141, "global_step": 49232, "epoch": 1172} {"train_loss": -5.873387336730957, "global_step": 49233, "epoch": 1172} {"train_loss": -5.752614498138428, "global_step": 49234, "epoch": 1172} {"train_loss": -5.812495231628418, "global_step": 49235, "epoch": 1172} {"train_loss": -5.860682487487793, "global_step": 49236, "epoch": 1172} {"train_loss": -5.721467971801758, "global_step": 49237, "epoch": 1172} {"train_loss": -5.815554618835449, "global_step": 49238, "epoch": 1172} {"train_loss": -5.705650806427002, "global_step": 49239, "epoch": 1172} {"train_loss": -5.795755386352539, "global_step": 49240, "epoch": 1172} {"train_loss": -5.863836288452148, "global_step": 49241, "epoch": 1172} {"train_loss": -5.845861434936523, "global_step": 49242, "epoch": 1172} {"train_loss": -5.77874755859375, "global_step": 49243, "epoch": 1172} {"train_loss": -5.757736682891846, "global_step": 49244, "epoch": 1172} {"train_loss": -5.694911956787109, "global_step": 49245, "epoch": 1172} {"train_loss": -5.845247268676758, "global_step": 49246, "epoch": 1172} {"train_loss": -5.667476177215576, "global_step": 49247, "epoch": 1172} {"train_loss": -5.846442222595215, "global_step": 49248, "epoch": 1172} {"train_loss": -5.798792839050293, "global_step": 49249, "epoch": 1172} {"train_loss": -5.76347541809082, "global_step": 49250, "epoch": 1172} {"train_loss": -5.789226055145264, "global_step": 49251, "epoch": 1172} {"train_loss": -5.765332221984863, "global_step": 49252, "epoch": 1172} {"train_loss": -5.684345722198486, "global_step": 49253, "epoch": 1172} {"train_loss": -5.858467102050781, "global_step": 49254, "epoch": 1172} {"train_loss": -5.8206281661987305, "global_step": 49255, "epoch": 1172} {"train_loss": -5.763385772705078, "global_step": 49256, "epoch": 1172} {"train_loss": -5.754096984863281, "global_step": 49257, "epoch": 1172} {"train_loss": -5.806387901306152, "global_step": 49258, "epoch": 1172} {"train_loss": -5.693467617034912, "global_step": 49259, "epoch": 1172} {"train_loss": -5.647092342376709, "global_step": 49260, "epoch": 1172} {"train_loss": -5.811046600341797, "global_step": 49261, "epoch": 1172} {"train_loss": -5.715666770935059, "global_step": 49262, "epoch": 1172} {"train_loss": -5.791197776794434, "global_step": 49263, "epoch": 1172} {"train_loss": -5.758482933044434, "global_step": 49264, "epoch": 1172} {"train_loss": -5.756985369182768, "global_step": 49265, "epoch": 1172, "val_loss": 61770.92578125} {"train_loss": -5.708622455596924, "global_step": 49266, "epoch": 1173} {"train_loss": -5.789523124694824, "global_step": 49267, "epoch": 1173} {"train_loss": -5.674253940582275, "global_step": 49268, "epoch": 1173} {"train_loss": -5.60911750793457, "global_step": 49269, "epoch": 1173} {"train_loss": -5.573489189147949, "global_step": 49270, "epoch": 1173} {"train_loss": -5.623950958251953, "global_step": 49271, "epoch": 1173} {"train_loss": -5.736335754394531, "global_step": 49272, "epoch": 1173} {"train_loss": -5.699041843414307, "global_step": 49273, "epoch": 1173} {"train_loss": -5.651930809020996, "global_step": 49274, "epoch": 1173} {"train_loss": -5.707090377807617, "global_step": 49275, "epoch": 1173} {"train_loss": -5.796435356140137, "global_step": 49276, "epoch": 1173} {"train_loss": -5.717281341552734, "global_step": 49277, "epoch": 1173} {"train_loss": -5.821015357971191, "global_step": 49278, "epoch": 1173} {"train_loss": -5.88870906829834, "global_step": 49279, "epoch": 1173} {"train_loss": -5.781270980834961, "global_step": 49280, "epoch": 1173} {"train_loss": -5.770642280578613, "global_step": 49281, "epoch": 1173} {"train_loss": -5.77054500579834, "global_step": 49282, "epoch": 1173} {"train_loss": -5.8374128341674805, "global_step": 49283, "epoch": 1173} {"train_loss": -5.772902011871338, "global_step": 49284, "epoch": 1173} {"train_loss": -5.76961612701416, "global_step": 49285, "epoch": 1173} {"train_loss": -5.872408390045166, "global_step": 49286, "epoch": 1173} {"train_loss": -5.650315284729004, "global_step": 49287, "epoch": 1173} {"train_loss": -5.709851264953613, "global_step": 49288, "epoch": 1173} {"train_loss": -5.881662845611572, "global_step": 49289, "epoch": 1173} {"train_loss": -5.7706804275512695, "global_step": 49290, "epoch": 1173} {"train_loss": -5.631918430328369, "global_step": 49291, "epoch": 1173} {"train_loss": -5.870611667633057, "global_step": 49292, "epoch": 1173} {"train_loss": -5.871554374694824, "global_step": 49293, "epoch": 1173} {"train_loss": -5.932884216308594, "global_step": 49294, "epoch": 1173} {"train_loss": -5.702218055725098, "global_step": 49295, "epoch": 1173} {"train_loss": -5.75577974319458, "global_step": 49296, "epoch": 1173} {"train_loss": -5.8468828201293945, "global_step": 49297, "epoch": 1173} {"train_loss": -5.936822891235352, "global_step": 49298, "epoch": 1173} {"train_loss": -5.766085624694824, "global_step": 49299, "epoch": 1173} {"train_loss": -5.897002220153809, "global_step": 49300, "epoch": 1173} {"train_loss": -5.771298408508301, "global_step": 49301, "epoch": 1173} {"train_loss": -5.725741386413574, "global_step": 49302, "epoch": 1173} {"train_loss": -5.768589496612549, "global_step": 49303, "epoch": 1173} {"train_loss": -5.79947566986084, "global_step": 49304, "epoch": 1173} {"train_loss": -5.674520015716553, "global_step": 49305, "epoch": 1173} {"train_loss": -5.84970760345459, "global_step": 49306, "epoch": 1173} {"train_loss": -5.766720839909145, "global_step": 49307, "epoch": 1173, "val_loss": 61376.5078125} {"train_loss": -5.848161220550537, "global_step": 49308, "epoch": 1174} {"train_loss": -5.8704986572265625, "global_step": 49309, "epoch": 1174} {"train_loss": -5.703508377075195, "global_step": 49310, "epoch": 1174} {"train_loss": -5.686993598937988, "global_step": 49311, "epoch": 1174} {"train_loss": -5.710839748382568, "global_step": 49312, "epoch": 1174} {"train_loss": -5.7821044921875, "global_step": 49313, "epoch": 1174} {"train_loss": -5.784846305847168, "global_step": 49314, "epoch": 1174} {"train_loss": -5.812394618988037, "global_step": 49315, "epoch": 1174} {"train_loss": -5.768834114074707, "global_step": 49316, "epoch": 1174} {"train_loss": -5.812294960021973, "global_step": 49317, "epoch": 1174} {"train_loss": -5.828442573547363, "global_step": 49318, "epoch": 1174} {"train_loss": -5.720544815063477, "global_step": 49319, "epoch": 1174} {"train_loss": -5.677319049835205, "global_step": 49320, "epoch": 1174} {"train_loss": -5.70919132232666, "global_step": 49321, "epoch": 1174} {"train_loss": -5.648360729217529, "global_step": 49322, "epoch": 1174} {"train_loss": -5.980016708374023, "global_step": 49323, "epoch": 1174} {"train_loss": -5.725937843322754, "global_step": 49324, "epoch": 1174} {"train_loss": -5.791562080383301, "global_step": 49325, "epoch": 1174} {"train_loss": -5.826022624969482, "global_step": 49326, "epoch": 1174} {"train_loss": -5.807172775268555, "global_step": 49327, "epoch": 1174} {"train_loss": -5.819882869720459, "global_step": 49328, "epoch": 1174} {"train_loss": -5.723934173583984, "global_step": 49329, "epoch": 1174} {"train_loss": -5.7061872482299805, "global_step": 49330, "epoch": 1174} {"train_loss": -5.781973838806152, "global_step": 49331, "epoch": 1174} {"train_loss": -5.746346473693848, "global_step": 49332, "epoch": 1174} {"train_loss": -5.7836408615112305, "global_step": 49333, "epoch": 1174} {"train_loss": -5.618614196777344, "global_step": 49334, "epoch": 1174} {"train_loss": -5.637437343597412, "global_step": 49335, "epoch": 1174} {"train_loss": -5.577432632446289, "global_step": 49336, "epoch": 1174} {"train_loss": -5.837528228759766, "global_step": 49337, "epoch": 1174} {"train_loss": -5.567959308624268, "global_step": 49338, "epoch": 1174} {"train_loss": -5.6935133934021, "global_step": 49339, "epoch": 1174} {"train_loss": -5.640486240386963, "global_step": 49340, "epoch": 1174} {"train_loss": -5.699155807495117, "global_step": 49341, "epoch": 1174} {"train_loss": -5.877695083618164, "global_step": 49342, "epoch": 1174} {"train_loss": -5.827211380004883, "global_step": 49343, "epoch": 1174} {"train_loss": -5.736433029174805, "global_step": 49344, "epoch": 1174} {"train_loss": -5.7195587158203125, "global_step": 49345, "epoch": 1174} {"train_loss": -5.791115760803223, "global_step": 49346, "epoch": 1174} {"train_loss": -5.818784713745117, "global_step": 49347, "epoch": 1174} {"train_loss": -5.796043395996094, "global_step": 49348, "epoch": 1174} {"train_loss": -5.753686473483131, "global_step": 49349, "epoch": 1174, "val_loss": 61540.04296875} {"train_loss": -5.579949378967285, "global_step": 49350, "epoch": 1175} {"train_loss": -5.734861850738525, "global_step": 49351, "epoch": 1175} {"train_loss": -5.858478546142578, "global_step": 49352, "epoch": 1175} {"train_loss": -5.754004955291748, "global_step": 49353, "epoch": 1175} {"train_loss": -5.809669017791748, "global_step": 49354, "epoch": 1175} {"train_loss": -5.854700565338135, "global_step": 49355, "epoch": 1175} {"train_loss": -5.724307060241699, "global_step": 49356, "epoch": 1175} {"train_loss": -5.821089744567871, "global_step": 49357, "epoch": 1175} {"train_loss": -5.764451026916504, "global_step": 49358, "epoch": 1175} {"train_loss": -5.8065571784973145, "global_step": 49359, "epoch": 1175} {"train_loss": -5.782867431640625, "global_step": 49360, "epoch": 1175} {"train_loss": -5.793034076690674, "global_step": 49361, "epoch": 1175} {"train_loss": -5.702274322509766, "global_step": 49362, "epoch": 1175} {"train_loss": -5.817420959472656, "global_step": 49363, "epoch": 1175} {"train_loss": -5.883957862854004, "global_step": 49364, "epoch": 1175} {"train_loss": -5.870690822601318, "global_step": 49365, "epoch": 1175} {"train_loss": -5.902152061462402, "global_step": 49366, "epoch": 1175} {"train_loss": -5.7592267990112305, "global_step": 49367, "epoch": 1175} {"train_loss": -5.795139312744141, "global_step": 49368, "epoch": 1175} {"train_loss": -5.702953338623047, "global_step": 49369, "epoch": 1175} {"train_loss": -5.772670745849609, "global_step": 49370, "epoch": 1175} {"train_loss": -5.762832164764404, "global_step": 49371, "epoch": 1175} {"train_loss": -5.768873691558838, "global_step": 49372, "epoch": 1175} {"train_loss": -5.801814556121826, "global_step": 49373, "epoch": 1175} {"train_loss": -5.846934795379639, "global_step": 49374, "epoch": 1175} {"train_loss": -5.708678245544434, "global_step": 49375, "epoch": 1175} {"train_loss": -5.835147857666016, "global_step": 49376, "epoch": 1175} {"train_loss": -5.738673210144043, "global_step": 49377, "epoch": 1175} {"train_loss": -5.782437801361084, "global_step": 49378, "epoch": 1175} {"train_loss": -5.886500358581543, "global_step": 49379, "epoch": 1175} {"train_loss": -5.627016067504883, "global_step": 49380, "epoch": 1175} {"train_loss": -5.625831127166748, "global_step": 49381, "epoch": 1175} {"train_loss": -5.778093338012695, "global_step": 49382, "epoch": 1175} {"train_loss": -5.766453742980957, "global_step": 49383, "epoch": 1175} {"train_loss": -5.759849548339844, "global_step": 49384, "epoch": 1175} {"train_loss": -5.855618000030518, "global_step": 49385, "epoch": 1175} {"train_loss": -5.723702430725098, "global_step": 49386, "epoch": 1175} {"train_loss": -5.805218696594238, "global_step": 49387, "epoch": 1175} {"train_loss": -5.806321620941162, "global_step": 49388, "epoch": 1175} {"train_loss": -5.774616241455078, "global_step": 49389, "epoch": 1175} {"train_loss": -5.7998762130737305, "global_step": 49390, "epoch": 1175} {"train_loss": -5.779054743903024, "global_step": 49391, "epoch": 1175, "val_loss": 61492.453125} {"train_loss": -5.885203838348389, "global_step": 49392, "epoch": 1176} {"train_loss": -5.760523319244385, "global_step": 49393, "epoch": 1176} {"train_loss": -5.889996528625488, "global_step": 49394, "epoch": 1176} {"train_loss": -5.7396697998046875, "global_step": 49395, "epoch": 1176} {"train_loss": -5.830532550811768, "global_step": 49396, "epoch": 1176} {"train_loss": -5.703082084655762, "global_step": 49397, "epoch": 1176} {"train_loss": -5.851876258850098, "global_step": 49398, "epoch": 1176} {"train_loss": -5.840081214904785, "global_step": 49399, "epoch": 1176} {"train_loss": -5.724495887756348, "global_step": 49400, "epoch": 1176} {"train_loss": -5.737937927246094, "global_step": 49401, "epoch": 1176} {"train_loss": -5.701033592224121, "global_step": 49402, "epoch": 1176} {"train_loss": -5.684355735778809, "global_step": 49403, "epoch": 1176} {"train_loss": -5.735027313232422, "global_step": 49404, "epoch": 1176} {"train_loss": -5.946834564208984, "global_step": 49405, "epoch": 1176} {"train_loss": -5.8594512939453125, "global_step": 49406, "epoch": 1176} {"train_loss": -5.807995319366455, "global_step": 49407, "epoch": 1176} {"train_loss": -5.772909641265869, "global_step": 49408, "epoch": 1176} {"train_loss": -5.667557716369629, "global_step": 49409, "epoch": 1176} {"train_loss": -5.794720649719238, "global_step": 49410, "epoch": 1176} {"train_loss": -5.775954246520996, "global_step": 49411, "epoch": 1176} {"train_loss": -5.689614295959473, "global_step": 49412, "epoch": 1176} {"train_loss": -5.892297744750977, "global_step": 49413, "epoch": 1176} {"train_loss": -5.632925033569336, "global_step": 49414, "epoch": 1176} {"train_loss": -5.728697299957275, "global_step": 49415, "epoch": 1176} {"train_loss": -5.8495049476623535, "global_step": 49416, "epoch": 1176} {"train_loss": -5.752587795257568, "global_step": 49417, "epoch": 1176} {"train_loss": -5.757473945617676, "global_step": 49418, "epoch": 1176} {"train_loss": -5.699177265167236, "global_step": 49419, "epoch": 1176} {"train_loss": -5.667548656463623, "global_step": 49420, "epoch": 1176} {"train_loss": -5.752839088439941, "global_step": 49421, "epoch": 1176} {"train_loss": -5.714578628540039, "global_step": 49422, "epoch": 1176} {"train_loss": -5.72590446472168, "global_step": 49423, "epoch": 1176} {"train_loss": -5.773892402648926, "global_step": 49424, "epoch": 1176} {"train_loss": -5.711596488952637, "global_step": 49425, "epoch": 1176} {"train_loss": -5.555062294006348, "global_step": 49426, "epoch": 1176} {"train_loss": -5.71951150894165, "global_step": 49427, "epoch": 1176} {"train_loss": -5.762054443359375, "global_step": 49428, "epoch": 1176} {"train_loss": -5.823489189147949, "global_step": 49429, "epoch": 1176} {"train_loss": -5.688331127166748, "global_step": 49430, "epoch": 1176} {"train_loss": -5.813175201416016, "global_step": 49431, "epoch": 1176} {"train_loss": -5.899731636047363, "global_step": 49432, "epoch": 1176} {"train_loss": -5.766304163705735, "global_step": 49433, "epoch": 1176, "val_loss": 61276.81640625} {"train_loss": -5.812968730926514, "global_step": 49434, "epoch": 1177} {"train_loss": -5.760385513305664, "global_step": 49435, "epoch": 1177} {"train_loss": -5.83992338180542, "global_step": 49436, "epoch": 1177} {"train_loss": -5.8548431396484375, "global_step": 49437, "epoch": 1177} {"train_loss": -5.802784442901611, "global_step": 49438, "epoch": 1177} {"train_loss": -5.765608787536621, "global_step": 49439, "epoch": 1177} {"train_loss": -5.755761623382568, "global_step": 49440, "epoch": 1177} {"train_loss": -5.722609519958496, "global_step": 49441, "epoch": 1177} {"train_loss": -5.742800235748291, "global_step": 49442, "epoch": 1177} {"train_loss": -5.7049102783203125, "global_step": 49443, "epoch": 1177} {"train_loss": -5.700437545776367, "global_step": 49444, "epoch": 1177} {"train_loss": -5.7588701248168945, "global_step": 49445, "epoch": 1177} {"train_loss": -5.749686241149902, "global_step": 49446, "epoch": 1177} {"train_loss": -5.660385608673096, "global_step": 49447, "epoch": 1177} {"train_loss": -5.8283772468566895, "global_step": 49448, "epoch": 1177} {"train_loss": -5.801290512084961, "global_step": 49449, "epoch": 1177} {"train_loss": -5.877330780029297, "global_step": 49450, "epoch": 1177} {"train_loss": -5.836217880249023, "global_step": 49451, "epoch": 1177} {"train_loss": -5.876007556915283, "global_step": 49452, "epoch": 1177} {"train_loss": -5.687735557556152, "global_step": 49453, "epoch": 1177} {"train_loss": -5.868613243103027, "global_step": 49454, "epoch": 1177} {"train_loss": -5.69918155670166, "global_step": 49455, "epoch": 1177} {"train_loss": -5.740576267242432, "global_step": 49456, "epoch": 1177} {"train_loss": -5.80320405960083, "global_step": 49457, "epoch": 1177} {"train_loss": -5.70942497253418, "global_step": 49458, "epoch": 1177} {"train_loss": -5.7978129386901855, "global_step": 49459, "epoch": 1177} {"train_loss": -5.655949115753174, "global_step": 49460, "epoch": 1177} {"train_loss": -5.6711530685424805, "global_step": 49461, "epoch": 1177} {"train_loss": -5.799618721008301, "global_step": 49462, "epoch": 1177} {"train_loss": -5.744555473327637, "global_step": 49463, "epoch": 1177} {"train_loss": -5.83510684967041, "global_step": 49464, "epoch": 1177} {"train_loss": -5.707442283630371, "global_step": 49465, "epoch": 1177} {"train_loss": -5.8026885986328125, "global_step": 49466, "epoch": 1177} {"train_loss": -5.878053665161133, "global_step": 49467, "epoch": 1177} {"train_loss": -5.78068733215332, "global_step": 49468, "epoch": 1177} {"train_loss": -5.774261474609375, "global_step": 49469, "epoch": 1177} {"train_loss": -5.853085041046143, "global_step": 49470, "epoch": 1177} {"train_loss": -5.6835222244262695, "global_step": 49471, "epoch": 1177} {"train_loss": -5.798745632171631, "global_step": 49472, "epoch": 1177} {"train_loss": -5.8068060874938965, "global_step": 49473, "epoch": 1177} {"train_loss": -5.739710807800293, "global_step": 49474, "epoch": 1177} {"train_loss": -5.77252721786499, "global_step": 49475, "epoch": 1177, "val_loss": 61519.40625} {"train_loss": -5.881656646728516, "global_step": 49476, "epoch": 1178} {"train_loss": -5.715257167816162, "global_step": 49477, "epoch": 1178} {"train_loss": -5.797183036804199, "global_step": 49478, "epoch": 1178} {"train_loss": -5.768986701965332, "global_step": 49479, "epoch": 1178} {"train_loss": -5.891059875488281, "global_step": 49480, "epoch": 1178} {"train_loss": -5.815644264221191, "global_step": 49481, "epoch": 1178} {"train_loss": -5.598392009735107, "global_step": 49482, "epoch": 1178} {"train_loss": -5.813691139221191, "global_step": 49483, "epoch": 1178} {"train_loss": -5.806277275085449, "global_step": 49484, "epoch": 1178} {"train_loss": -5.842349052429199, "global_step": 49485, "epoch": 1178} {"train_loss": -5.83134651184082, "global_step": 49486, "epoch": 1178} {"train_loss": -5.692266941070557, "global_step": 49487, "epoch": 1178} {"train_loss": -5.7572197914123535, "global_step": 49488, "epoch": 1178} {"train_loss": -5.791998863220215, "global_step": 49489, "epoch": 1178} {"train_loss": -5.698495388031006, "global_step": 49490, "epoch": 1178} {"train_loss": -5.594020843505859, "global_step": 49491, "epoch": 1178} {"train_loss": -5.63267707824707, "global_step": 49492, "epoch": 1178} {"train_loss": -5.72331428527832, "global_step": 49493, "epoch": 1178} {"train_loss": -5.655301570892334, "global_step": 49494, "epoch": 1178} {"train_loss": -5.759376525878906, "global_step": 49495, "epoch": 1178} {"train_loss": -5.676136493682861, "global_step": 49496, "epoch": 1178} {"train_loss": -5.672588348388672, "global_step": 49497, "epoch": 1178} {"train_loss": -5.649353981018066, "global_step": 49498, "epoch": 1178} {"train_loss": -5.525649547576904, "global_step": 49499, "epoch": 1178} {"train_loss": -5.720458984375, "global_step": 49500, "epoch": 1178} {"train_loss": -5.591259956359863, "global_step": 49501, "epoch": 1178} {"train_loss": -5.794284820556641, "global_step": 49502, "epoch": 1178} {"train_loss": -5.624526500701904, "global_step": 49503, "epoch": 1178} {"train_loss": -5.762540817260742, "global_step": 49504, "epoch": 1178} {"train_loss": -5.694149971008301, "global_step": 49505, "epoch": 1178} {"train_loss": -5.692350387573242, "global_step": 49506, "epoch": 1178} {"train_loss": -5.703143119812012, "global_step": 49507, "epoch": 1178} {"train_loss": -5.625190734863281, "global_step": 49508, "epoch": 1178} {"train_loss": -5.910662651062012, "global_step": 49509, "epoch": 1178} {"train_loss": -5.642793655395508, "global_step": 49510, "epoch": 1178} {"train_loss": -5.819860458374023, "global_step": 49511, "epoch": 1178} {"train_loss": -5.567080497741699, "global_step": 49512, "epoch": 1178} {"train_loss": -5.753434181213379, "global_step": 49513, "epoch": 1178} {"train_loss": -5.664745330810547, "global_step": 49514, "epoch": 1178} {"train_loss": -5.680434226989746, "global_step": 49515, "epoch": 1178} {"train_loss": -5.661284446716309, "global_step": 49516, "epoch": 1178} {"train_loss": -5.7173672290075395, "global_step": 49517, "epoch": 1178, "val_loss": 61443.50390625} {"train_loss": -5.6219282150268555, "global_step": 49518, "epoch": 1179} {"train_loss": -5.715552806854248, "global_step": 49519, "epoch": 1179} {"train_loss": -5.774193286895752, "global_step": 49520, "epoch": 1179} {"train_loss": -5.668741703033447, "global_step": 49521, "epoch": 1179} {"train_loss": -5.6902008056640625, "global_step": 49522, "epoch": 1179} {"train_loss": -5.759369373321533, "global_step": 49523, "epoch": 1179} {"train_loss": -5.737794876098633, "global_step": 49524, "epoch": 1179} {"train_loss": -5.639142990112305, "global_step": 49525, "epoch": 1179} {"train_loss": -5.761157035827637, "global_step": 49526, "epoch": 1179} {"train_loss": -5.562417030334473, "global_step": 49527, "epoch": 1179} {"train_loss": -5.771808624267578, "global_step": 49528, "epoch": 1179} {"train_loss": -5.732577323913574, "global_step": 49529, "epoch": 1179} {"train_loss": -5.658247947692871, "global_step": 49530, "epoch": 1179} {"train_loss": -5.737175941467285, "global_step": 49531, "epoch": 1179} {"train_loss": -5.67301082611084, "global_step": 49532, "epoch": 1179} {"train_loss": -5.837754249572754, "global_step": 49533, "epoch": 1179} {"train_loss": -5.653877258300781, "global_step": 49534, "epoch": 1179} {"train_loss": -5.8059844970703125, "global_step": 49535, "epoch": 1179} {"train_loss": -5.788172245025635, "global_step": 49536, "epoch": 1179} {"train_loss": -5.574275016784668, "global_step": 49537, "epoch": 1179} {"train_loss": -5.76835823059082, "global_step": 49538, "epoch": 1179} {"train_loss": -5.748507499694824, "global_step": 49539, "epoch": 1179} {"train_loss": -5.798422813415527, "global_step": 49540, "epoch": 1179} {"train_loss": -5.649577617645264, "global_step": 49541, "epoch": 1179} {"train_loss": -5.734212875366211, "global_step": 49542, "epoch": 1179} {"train_loss": -5.721194744110107, "global_step": 49543, "epoch": 1179} {"train_loss": -5.7624969482421875, "global_step": 49544, "epoch": 1179} {"train_loss": -5.6853790283203125, "global_step": 49545, "epoch": 1179} {"train_loss": -5.610901832580566, "global_step": 49546, "epoch": 1179} {"train_loss": -5.682988166809082, "global_step": 49547, "epoch": 1179} {"train_loss": -5.760727882385254, "global_step": 49548, "epoch": 1179} {"train_loss": -5.734073638916016, "global_step": 49549, "epoch": 1179} {"train_loss": -5.828060626983643, "global_step": 49550, "epoch": 1179} {"train_loss": -5.684198379516602, "global_step": 49551, "epoch": 1179} {"train_loss": -5.8179931640625, "global_step": 49552, "epoch": 1179} {"train_loss": -5.737926006317139, "global_step": 49553, "epoch": 1179} {"train_loss": -5.805389881134033, "global_step": 49554, "epoch": 1179} {"train_loss": -5.714764595031738, "global_step": 49555, "epoch": 1179} {"train_loss": -5.9236321449279785, "global_step": 49556, "epoch": 1179} {"train_loss": -5.718018531799316, "global_step": 49557, "epoch": 1179} {"train_loss": -5.793097972869873, "global_step": 49558, "epoch": 1179} {"train_loss": -5.731125536419096, "global_step": 49559, "epoch": 1179, "val_loss": 61317.953125} {"train_loss": -5.703612804412842, "global_step": 49560, "epoch": 1180} {"train_loss": -5.8343963623046875, "global_step": 49561, "epoch": 1180} {"train_loss": -5.863884449005127, "global_step": 49562, "epoch": 1180} {"train_loss": -5.8284125328063965, "global_step": 49563, "epoch": 1180} {"train_loss": -5.712920188903809, "global_step": 49564, "epoch": 1180} {"train_loss": -5.704240798950195, "global_step": 49565, "epoch": 1180} {"train_loss": -5.796346187591553, "global_step": 49566, "epoch": 1180} {"train_loss": -5.627979278564453, "global_step": 49567, "epoch": 1180} {"train_loss": -5.768901348114014, "global_step": 49568, "epoch": 1180} {"train_loss": -5.8288774490356445, "global_step": 49569, "epoch": 1180} {"train_loss": -5.523837566375732, "global_step": 49570, "epoch": 1180} {"train_loss": -5.733040809631348, "global_step": 49571, "epoch": 1180} {"train_loss": -5.760503768920898, "global_step": 49572, "epoch": 1180} {"train_loss": -5.746147155761719, "global_step": 49573, "epoch": 1180} {"train_loss": -5.70459508895874, "global_step": 49574, "epoch": 1180} {"train_loss": -5.871295928955078, "global_step": 49575, "epoch": 1180} {"train_loss": -5.715686798095703, "global_step": 49576, "epoch": 1180} {"train_loss": -5.7810211181640625, "global_step": 49577, "epoch": 1180} {"train_loss": -5.718992233276367, "global_step": 49578, "epoch": 1180} {"train_loss": -5.792694568634033, "global_step": 49579, "epoch": 1180} {"train_loss": -5.848820209503174, "global_step": 49580, "epoch": 1180} {"train_loss": -5.866300582885742, "global_step": 49581, "epoch": 1180} {"train_loss": -5.836081504821777, "global_step": 49582, "epoch": 1180} {"train_loss": -5.6888813972473145, "global_step": 49583, "epoch": 1180} {"train_loss": -5.774914264678955, "global_step": 49584, "epoch": 1180} {"train_loss": -5.778438091278076, "global_step": 49585, "epoch": 1180} {"train_loss": -5.776082992553711, "global_step": 49586, "epoch": 1180} {"train_loss": -5.793456077575684, "global_step": 49587, "epoch": 1180} {"train_loss": -5.815973281860352, "global_step": 49588, "epoch": 1180} {"train_loss": -5.793966293334961, "global_step": 49589, "epoch": 1180} {"train_loss": -5.861965656280518, "global_step": 49590, "epoch": 1180} {"train_loss": -5.820899963378906, "global_step": 49591, "epoch": 1180} {"train_loss": -5.825511455535889, "global_step": 49592, "epoch": 1180} {"train_loss": -5.863299369812012, "global_step": 49593, "epoch": 1180} {"train_loss": -5.740896224975586, "global_step": 49594, "epoch": 1180} {"train_loss": -5.879560947418213, "global_step": 49595, "epoch": 1180} {"train_loss": -5.835826396942139, "global_step": 49596, "epoch": 1180} {"train_loss": -5.869407653808594, "global_step": 49597, "epoch": 1180} {"train_loss": -5.863582611083984, "global_step": 49598, "epoch": 1180} {"train_loss": -5.780162811279297, "global_step": 49599, "epoch": 1180} {"train_loss": -5.729925155639648, "global_step": 49600, "epoch": 1180} {"train_loss": -5.7809637160528276, "global_step": 49601, "epoch": 1180, "val_loss": 61388.75} {"train_loss": -5.8465423583984375, "global_step": 49602, "epoch": 1181} {"train_loss": -5.818643569946289, "global_step": 49603, "epoch": 1181} {"train_loss": -5.78050422668457, "global_step": 49604, "epoch": 1181} {"train_loss": -5.805186748504639, "global_step": 49605, "epoch": 1181} {"train_loss": -5.869448184967041, "global_step": 49606, "epoch": 1181} {"train_loss": -5.8470258712768555, "global_step": 49607, "epoch": 1181} {"train_loss": -5.870748043060303, "global_step": 49608, "epoch": 1181} {"train_loss": -5.849040985107422, "global_step": 49609, "epoch": 1181} {"train_loss": -5.791543960571289, "global_step": 49610, "epoch": 1181} {"train_loss": -5.759732246398926, "global_step": 49611, "epoch": 1181} {"train_loss": -5.77479362487793, "global_step": 49612, "epoch": 1181} {"train_loss": -5.5871429443359375, "global_step": 49613, "epoch": 1181} {"train_loss": -5.857413291931152, "global_step": 49614, "epoch": 1181} {"train_loss": -5.826766014099121, "global_step": 49615, "epoch": 1181} {"train_loss": -5.76113224029541, "global_step": 49616, "epoch": 1181} {"train_loss": -5.827481269836426, "global_step": 49617, "epoch": 1181} {"train_loss": -5.734209060668945, "global_step": 49618, "epoch": 1181} {"train_loss": -5.754306793212891, "global_step": 49619, "epoch": 1181} {"train_loss": -5.752313613891602, "global_step": 49620, "epoch": 1181} {"train_loss": -5.862880706787109, "global_step": 49621, "epoch": 1181} {"train_loss": -5.704953193664551, "global_step": 49622, "epoch": 1181} {"train_loss": -5.768942356109619, "global_step": 49623, "epoch": 1181} {"train_loss": -5.778606414794922, "global_step": 49624, "epoch": 1181} {"train_loss": -5.898690223693848, "global_step": 49625, "epoch": 1181} {"train_loss": -5.906124114990234, "global_step": 49626, "epoch": 1181} {"train_loss": -5.858592510223389, "global_step": 49627, "epoch": 1181} {"train_loss": -5.702683448791504, "global_step": 49628, "epoch": 1181} {"train_loss": -5.785013198852539, "global_step": 49629, "epoch": 1181} {"train_loss": -5.689851760864258, "global_step": 49630, "epoch": 1181} {"train_loss": -5.675781726837158, "global_step": 49631, "epoch": 1181} {"train_loss": -5.857565402984619, "global_step": 49632, "epoch": 1181} {"train_loss": -5.722659111022949, "global_step": 49633, "epoch": 1181} {"train_loss": -5.6832733154296875, "global_step": 49634, "epoch": 1181} {"train_loss": -5.734483242034912, "global_step": 49635, "epoch": 1181} {"train_loss": -5.670709609985352, "global_step": 49636, "epoch": 1181} {"train_loss": -5.612390041351318, "global_step": 49637, "epoch": 1181} {"train_loss": -5.851269721984863, "global_step": 49638, "epoch": 1181} {"train_loss": -5.657299041748047, "global_step": 49639, "epoch": 1181} {"train_loss": -5.678260803222656, "global_step": 49640, "epoch": 1181} {"train_loss": -5.86720085144043, "global_step": 49641, "epoch": 1181} {"train_loss": -5.718393325805664, "global_step": 49642, "epoch": 1181} {"train_loss": -5.77509567851112, "global_step": 49643, "epoch": 1181, "val_loss": 61425.1875} {"train_loss": -5.786904811859131, "global_step": 49644, "epoch": 1182} {"train_loss": -5.781879425048828, "global_step": 49645, "epoch": 1182} {"train_loss": -5.750394344329834, "global_step": 49646, "epoch": 1182} {"train_loss": -5.823005676269531, "global_step": 49647, "epoch": 1182} {"train_loss": -5.674783706665039, "global_step": 49648, "epoch": 1182} {"train_loss": -5.69737434387207, "global_step": 49649, "epoch": 1182} {"train_loss": -5.713906764984131, "global_step": 49650, "epoch": 1182} {"train_loss": -5.689635276794434, "global_step": 49651, "epoch": 1182} {"train_loss": -5.721930503845215, "global_step": 49652, "epoch": 1182} {"train_loss": -5.760904312133789, "global_step": 49653, "epoch": 1182} {"train_loss": -5.805495262145996, "global_step": 49654, "epoch": 1182} {"train_loss": -5.6829023361206055, "global_step": 49655, "epoch": 1182} {"train_loss": -5.750235080718994, "global_step": 49656, "epoch": 1182} {"train_loss": -5.8738694190979, "global_step": 49657, "epoch": 1182} {"train_loss": -5.8722147941589355, "global_step": 49658, "epoch": 1182} {"train_loss": -5.63694429397583, "global_step": 49659, "epoch": 1182} {"train_loss": -5.858695030212402, "global_step": 49660, "epoch": 1182} {"train_loss": -5.717597007751465, "global_step": 49661, "epoch": 1182} {"train_loss": -5.696022033691406, "global_step": 49662, "epoch": 1182} {"train_loss": -5.755297660827637, "global_step": 49663, "epoch": 1182} {"train_loss": -5.7669267654418945, "global_step": 49664, "epoch": 1182} {"train_loss": -5.8569440841674805, "global_step": 49665, "epoch": 1182} {"train_loss": -5.779946327209473, "global_step": 49666, "epoch": 1182} {"train_loss": -5.80138635635376, "global_step": 49667, "epoch": 1182} {"train_loss": -5.67169189453125, "global_step": 49668, "epoch": 1182} {"train_loss": -5.820217609405518, "global_step": 49669, "epoch": 1182} {"train_loss": -5.872529029846191, "global_step": 49670, "epoch": 1182} {"train_loss": -5.91026496887207, "global_step": 49671, "epoch": 1182} {"train_loss": -5.884430885314941, "global_step": 49672, "epoch": 1182} {"train_loss": -5.850411415100098, "global_step": 49673, "epoch": 1182} {"train_loss": -5.773922443389893, "global_step": 49674, "epoch": 1182} {"train_loss": -5.735854148864746, "global_step": 49675, "epoch": 1182} {"train_loss": -5.872076034545898, "global_step": 49676, "epoch": 1182} {"train_loss": -5.794265270233154, "global_step": 49677, "epoch": 1182} {"train_loss": -5.713123321533203, "global_step": 49678, "epoch": 1182} {"train_loss": -5.665992259979248, "global_step": 49679, "epoch": 1182} {"train_loss": -5.807965278625488, "global_step": 49680, "epoch": 1182} {"train_loss": -5.709845066070557, "global_step": 49681, "epoch": 1182} {"train_loss": -5.728397369384766, "global_step": 49682, "epoch": 1182} {"train_loss": -5.85416841506958, "global_step": 49683, "epoch": 1182} {"train_loss": -5.789973258972168, "global_step": 49684, "epoch": 1182} {"train_loss": -5.771678175245013, "global_step": 49685, "epoch": 1182, "val_loss": 61490.34765625} {"train_loss": -5.773196220397949, "global_step": 49686, "epoch": 1183} {"train_loss": -5.688564777374268, "global_step": 49687, "epoch": 1183} {"train_loss": -5.799610614776611, "global_step": 49688, "epoch": 1183} {"train_loss": -5.724849700927734, "global_step": 49689, "epoch": 1183} {"train_loss": -5.921062469482422, "global_step": 49690, "epoch": 1183} {"train_loss": -5.806406021118164, "global_step": 49691, "epoch": 1183} {"train_loss": -5.87130069732666, "global_step": 49692, "epoch": 1183} {"train_loss": -5.789697647094727, "global_step": 49693, "epoch": 1183} {"train_loss": -5.847150802612305, "global_step": 49694, "epoch": 1183} {"train_loss": -5.744121551513672, "global_step": 49695, "epoch": 1183} {"train_loss": -5.812619686126709, "global_step": 49696, "epoch": 1183} {"train_loss": -5.890589714050293, "global_step": 49697, "epoch": 1183} {"train_loss": -5.773202896118164, "global_step": 49698, "epoch": 1183} {"train_loss": -5.727225303649902, "global_step": 49699, "epoch": 1183} {"train_loss": -5.716181755065918, "global_step": 49700, "epoch": 1183} {"train_loss": -5.680057525634766, "global_step": 49701, "epoch": 1183} {"train_loss": -5.746328353881836, "global_step": 49702, "epoch": 1183} {"train_loss": -5.606864929199219, "global_step": 49703, "epoch": 1183} {"train_loss": -5.921748161315918, "global_step": 49704, "epoch": 1183} {"train_loss": -5.722258567810059, "global_step": 49705, "epoch": 1183} {"train_loss": -5.6185150146484375, "global_step": 49706, "epoch": 1183} {"train_loss": -5.82932186126709, "global_step": 49707, "epoch": 1183} {"train_loss": -5.637204647064209, "global_step": 49708, "epoch": 1183} {"train_loss": -5.766961097717285, "global_step": 49709, "epoch": 1183} {"train_loss": -5.792191505432129, "global_step": 49710, "epoch": 1183} {"train_loss": -5.813192367553711, "global_step": 49711, "epoch": 1183} {"train_loss": -5.72967004776001, "global_step": 49712, "epoch": 1183} {"train_loss": -5.815600395202637, "global_step": 49713, "epoch": 1183} {"train_loss": -5.868298530578613, "global_step": 49714, "epoch": 1183} {"train_loss": -5.835244655609131, "global_step": 49715, "epoch": 1183} {"train_loss": -5.789772033691406, "global_step": 49716, "epoch": 1183} {"train_loss": -5.8476152420043945, "global_step": 49717, "epoch": 1183} {"train_loss": -5.789536476135254, "global_step": 49718, "epoch": 1183} {"train_loss": -5.700726509094238, "global_step": 49719, "epoch": 1183} {"train_loss": -5.867569923400879, "global_step": 49720, "epoch": 1183} {"train_loss": -5.72489070892334, "global_step": 49721, "epoch": 1183} {"train_loss": -5.841335773468018, "global_step": 49722, "epoch": 1183} {"train_loss": -5.813258647918701, "global_step": 49723, "epoch": 1183} {"train_loss": -5.740079402923584, "global_step": 49724, "epoch": 1183} {"train_loss": -5.788787841796875, "global_step": 49725, "epoch": 1183} {"train_loss": -5.833786964416504, "global_step": 49726, "epoch": 1183} {"train_loss": -5.782026234127226, "global_step": 49727, "epoch": 1183, "val_loss": 61526.60546875} {"train_loss": -5.758942127227783, "global_step": 49728, "epoch": 1184} {"train_loss": -5.7919206619262695, "global_step": 49729, "epoch": 1184} {"train_loss": -5.699338912963867, "global_step": 49730, "epoch": 1184} {"train_loss": -5.691895008087158, "global_step": 49731, "epoch": 1184} {"train_loss": -5.952487945556641, "global_step": 49732, "epoch": 1184} {"train_loss": -5.711462020874023, "global_step": 49733, "epoch": 1184} {"train_loss": -5.739523410797119, "global_step": 49734, "epoch": 1184} {"train_loss": -5.793276786804199, "global_step": 49735, "epoch": 1184} {"train_loss": -5.891224384307861, "global_step": 49736, "epoch": 1184} {"train_loss": -5.732282638549805, "global_step": 49737, "epoch": 1184} {"train_loss": -5.782703399658203, "global_step": 49738, "epoch": 1184} {"train_loss": -5.848911762237549, "global_step": 49739, "epoch": 1184} {"train_loss": -5.7772698402404785, "global_step": 49740, "epoch": 1184} {"train_loss": -5.792898654937744, "global_step": 49741, "epoch": 1184} {"train_loss": -5.8041887283325195, "global_step": 49742, "epoch": 1184} {"train_loss": -5.783376216888428, "global_step": 49743, "epoch": 1184} {"train_loss": -5.791208267211914, "global_step": 49744, "epoch": 1184} {"train_loss": -5.806550025939941, "global_step": 49745, "epoch": 1184} {"train_loss": -5.818323135375977, "global_step": 49746, "epoch": 1184} {"train_loss": -5.6103715896606445, "global_step": 49747, "epoch": 1184} {"train_loss": -5.599961280822754, "global_step": 49748, "epoch": 1184} {"train_loss": -5.684368133544922, "global_step": 49749, "epoch": 1184} {"train_loss": -5.804684162139893, "global_step": 49750, "epoch": 1184} {"train_loss": -5.741815090179443, "global_step": 49751, "epoch": 1184} {"train_loss": -5.82248592376709, "global_step": 49752, "epoch": 1184} {"train_loss": -5.80180025100708, "global_step": 49753, "epoch": 1184} {"train_loss": -5.769040107727051, "global_step": 49754, "epoch": 1184} {"train_loss": -5.789226055145264, "global_step": 49755, "epoch": 1184} {"train_loss": -5.699443817138672, "global_step": 49756, "epoch": 1184} {"train_loss": -5.774111747741699, "global_step": 49757, "epoch": 1184} {"train_loss": -5.633754730224609, "global_step": 49758, "epoch": 1184} {"train_loss": -5.78410530090332, "global_step": 49759, "epoch": 1184} {"train_loss": -5.778670787811279, "global_step": 49760, "epoch": 1184} {"train_loss": -5.865169048309326, "global_step": 49761, "epoch": 1184} {"train_loss": -5.774279594421387, "global_step": 49762, "epoch": 1184} {"train_loss": -5.785910129547119, "global_step": 49763, "epoch": 1184} {"train_loss": -5.786060333251953, "global_step": 49764, "epoch": 1184} {"train_loss": -5.633984088897705, "global_step": 49765, "epoch": 1184} {"train_loss": -5.67045783996582, "global_step": 49766, "epoch": 1184} {"train_loss": -5.850344181060791, "global_step": 49767, "epoch": 1184} {"train_loss": -5.8144378662109375, "global_step": 49768, "epoch": 1184} {"train_loss": -5.76896874109904, "global_step": 49769, "epoch": 1184, "val_loss": 61573.0234375} {"train_loss": -5.844954490661621, "global_step": 49770, "epoch": 1185} {"train_loss": -5.732666492462158, "global_step": 49771, "epoch": 1185} {"train_loss": -5.787592887878418, "global_step": 49772, "epoch": 1185} {"train_loss": -5.862001419067383, "global_step": 49773, "epoch": 1185} {"train_loss": -5.86184549331665, "global_step": 49774, "epoch": 1185} {"train_loss": -5.800978660583496, "global_step": 49775, "epoch": 1185} {"train_loss": -5.747650146484375, "global_step": 49776, "epoch": 1185} {"train_loss": -5.719012260437012, "global_step": 49777, "epoch": 1185} {"train_loss": -5.873053550720215, "global_step": 49778, "epoch": 1185} {"train_loss": -5.700122833251953, "global_step": 49779, "epoch": 1185} {"train_loss": -5.759374141693115, "global_step": 49780, "epoch": 1185} {"train_loss": -5.8245649337768555, "global_step": 49781, "epoch": 1185} {"train_loss": -5.860259056091309, "global_step": 49782, "epoch": 1185} {"train_loss": -5.820752143859863, "global_step": 49783, "epoch": 1185} {"train_loss": -5.7089433670043945, "global_step": 49784, "epoch": 1185} {"train_loss": -5.762556552886963, "global_step": 49785, "epoch": 1185} {"train_loss": -5.656057834625244, "global_step": 49786, "epoch": 1185} {"train_loss": -5.8280463218688965, "global_step": 49787, "epoch": 1185} {"train_loss": -5.930953502655029, "global_step": 49788, "epoch": 1185} {"train_loss": -5.868464469909668, "global_step": 49789, "epoch": 1185} {"train_loss": -5.745440483093262, "global_step": 49790, "epoch": 1185} {"train_loss": -5.80600643157959, "global_step": 49791, "epoch": 1185} {"train_loss": -5.756077766418457, "global_step": 49792, "epoch": 1185} {"train_loss": -5.7421417236328125, "global_step": 49793, "epoch": 1185} {"train_loss": -5.735013961791992, "global_step": 49794, "epoch": 1185} {"train_loss": -5.771037578582764, "global_step": 49795, "epoch": 1185} {"train_loss": -5.777617454528809, "global_step": 49796, "epoch": 1185} {"train_loss": -5.73093843460083, "global_step": 49797, "epoch": 1185} {"train_loss": -5.768881797790527, "global_step": 49798, "epoch": 1185} {"train_loss": -5.837022304534912, "global_step": 49799, "epoch": 1185} {"train_loss": -5.685349941253662, "global_step": 49800, "epoch": 1185} {"train_loss": -5.78705358505249, "global_step": 49801, "epoch": 1185} {"train_loss": -5.70671272277832, "global_step": 49802, "epoch": 1185} {"train_loss": -5.737150192260742, "global_step": 49803, "epoch": 1185} {"train_loss": -5.854679107666016, "global_step": 49804, "epoch": 1185} {"train_loss": -5.767016410827637, "global_step": 49805, "epoch": 1185} {"train_loss": -5.792572975158691, "global_step": 49806, "epoch": 1185} {"train_loss": -5.77182149887085, "global_step": 49807, "epoch": 1185} {"train_loss": -5.711423397064209, "global_step": 49808, "epoch": 1185} {"train_loss": -5.793893814086914, "global_step": 49809, "epoch": 1185} {"train_loss": -5.840446472167969, "global_step": 49810, "epoch": 1185} {"train_loss": -5.780383155459449, "global_step": 49811, "epoch": 1185, "val_loss": 61795.88671875} {"train_loss": -5.574566841125488, "global_step": 49812, "epoch": 1186} {"train_loss": -5.797688007354736, "global_step": 49813, "epoch": 1186} {"train_loss": -5.810949802398682, "global_step": 49814, "epoch": 1186} {"train_loss": -5.709130764007568, "global_step": 49815, "epoch": 1186} {"train_loss": -5.778495788574219, "global_step": 49816, "epoch": 1186} {"train_loss": -5.834862232208252, "global_step": 49817, "epoch": 1186} {"train_loss": -5.726207733154297, "global_step": 49818, "epoch": 1186} {"train_loss": -5.7613911628723145, "global_step": 49819, "epoch": 1186} {"train_loss": -5.735368728637695, "global_step": 49820, "epoch": 1186} {"train_loss": -5.862751483917236, "global_step": 49821, "epoch": 1186} {"train_loss": -5.905721187591553, "global_step": 49822, "epoch": 1186} {"train_loss": -5.73232364654541, "global_step": 49823, "epoch": 1186} {"train_loss": -5.8804931640625, "global_step": 49824, "epoch": 1186} {"train_loss": -5.823282241821289, "global_step": 49825, "epoch": 1186} {"train_loss": -5.86580753326416, "global_step": 49826, "epoch": 1186} {"train_loss": -5.777304172515869, "global_step": 49827, "epoch": 1186} {"train_loss": -5.6452178955078125, "global_step": 49828, "epoch": 1186} {"train_loss": -5.836808681488037, "global_step": 49829, "epoch": 1186} {"train_loss": -5.831193447113037, "global_step": 49830, "epoch": 1186} {"train_loss": -5.743361949920654, "global_step": 49831, "epoch": 1186} {"train_loss": -5.815647125244141, "global_step": 49832, "epoch": 1186} {"train_loss": -5.811734676361084, "global_step": 49833, "epoch": 1186} {"train_loss": -5.858025074005127, "global_step": 49834, "epoch": 1186} {"train_loss": -5.755993843078613, "global_step": 49835, "epoch": 1186} {"train_loss": -5.76284122467041, "global_step": 49836, "epoch": 1186} {"train_loss": -5.919342041015625, "global_step": 49837, "epoch": 1186} {"train_loss": -5.659503936767578, "global_step": 49838, "epoch": 1186} {"train_loss": -5.682399272918701, "global_step": 49839, "epoch": 1186} {"train_loss": -5.895402431488037, "global_step": 49840, "epoch": 1186} {"train_loss": -5.620121002197266, "global_step": 49841, "epoch": 1186} {"train_loss": -5.582441329956055, "global_step": 49842, "epoch": 1186} {"train_loss": -5.617774486541748, "global_step": 49843, "epoch": 1186} {"train_loss": -5.7117390632629395, "global_step": 49844, "epoch": 1186} {"train_loss": -5.792590141296387, "global_step": 49845, "epoch": 1186} {"train_loss": -5.877267837524414, "global_step": 49846, "epoch": 1186} {"train_loss": -5.581031799316406, "global_step": 49847, "epoch": 1186} {"train_loss": -5.71595573425293, "global_step": 49848, "epoch": 1186} {"train_loss": -5.722654342651367, "global_step": 49849, "epoch": 1186} {"train_loss": -5.7754316329956055, "global_step": 49850, "epoch": 1186} {"train_loss": -5.803986549377441, "global_step": 49851, "epoch": 1186} {"train_loss": -5.819256782531738, "global_step": 49852, "epoch": 1186} {"train_loss": -5.770704485121227, "global_step": 49853, "epoch": 1186, "val_loss": 61474.01953125} {"train_loss": -5.74415397644043, "global_step": 49854, "epoch": 1187} {"train_loss": -5.746938705444336, "global_step": 49855, "epoch": 1187} {"train_loss": -5.72950553894043, "global_step": 49856, "epoch": 1187} {"train_loss": -5.633320331573486, "global_step": 49857, "epoch": 1187} {"train_loss": -5.613267421722412, "global_step": 49858, "epoch": 1187} {"train_loss": -5.7213287353515625, "global_step": 49859, "epoch": 1187} {"train_loss": -5.701474189758301, "global_step": 49860, "epoch": 1187} {"train_loss": -5.637154579162598, "global_step": 49861, "epoch": 1187} {"train_loss": -5.7512102127075195, "global_step": 49862, "epoch": 1187} {"train_loss": -5.572878360748291, "global_step": 49863, "epoch": 1187} {"train_loss": -5.699810028076172, "global_step": 49864, "epoch": 1187} {"train_loss": -5.633945465087891, "global_step": 49865, "epoch": 1187} {"train_loss": -5.6750383377075195, "global_step": 49866, "epoch": 1187} {"train_loss": -5.709892272949219, "global_step": 49867, "epoch": 1187} {"train_loss": -5.800122261047363, "global_step": 49868, "epoch": 1187} {"train_loss": -5.7262187004089355, "global_step": 49869, "epoch": 1187} {"train_loss": -5.804086685180664, "global_step": 49870, "epoch": 1187} {"train_loss": -5.613863945007324, "global_step": 49871, "epoch": 1187} {"train_loss": -5.933513641357422, "global_step": 49872, "epoch": 1187} {"train_loss": -5.440146446228027, "global_step": 49873, "epoch": 1187} {"train_loss": -5.61666202545166, "global_step": 49874, "epoch": 1187} {"train_loss": -5.555027008056641, "global_step": 49875, "epoch": 1187} {"train_loss": -5.813337326049805, "global_step": 49876, "epoch": 1187} {"train_loss": -5.588276386260986, "global_step": 49877, "epoch": 1187} {"train_loss": -5.624022483825684, "global_step": 49878, "epoch": 1187} {"train_loss": -5.794997215270996, "global_step": 49879, "epoch": 1187} {"train_loss": -5.555212497711182, "global_step": 49880, "epoch": 1187} {"train_loss": -5.829552173614502, "global_step": 49881, "epoch": 1187} {"train_loss": -5.463578701019287, "global_step": 49882, "epoch": 1187} {"train_loss": -5.686924934387207, "global_step": 49883, "epoch": 1187} {"train_loss": -5.725884437561035, "global_step": 49884, "epoch": 1187} {"train_loss": -5.865530967712402, "global_step": 49885, "epoch": 1187} {"train_loss": -5.627435684204102, "global_step": 49886, "epoch": 1187} {"train_loss": -5.695282936096191, "global_step": 49887, "epoch": 1187} {"train_loss": -5.682348251342773, "global_step": 49888, "epoch": 1187} {"train_loss": -5.749373435974121, "global_step": 49889, "epoch": 1187} {"train_loss": -5.727196216583252, "global_step": 49890, "epoch": 1187} {"train_loss": -5.692724704742432, "global_step": 49891, "epoch": 1187} {"train_loss": -5.8239545822143555, "global_step": 49892, "epoch": 1187} {"train_loss": -5.70162296295166, "global_step": 49893, "epoch": 1187} {"train_loss": -5.745139122009277, "global_step": 49894, "epoch": 1187} {"train_loss": -5.697459118706839, "global_step": 49895, "epoch": 1187, "val_loss": 61514.48046875} {"train_loss": -5.745577335357666, "global_step": 49896, "epoch": 1188} {"train_loss": -5.793846130371094, "global_step": 49897, "epoch": 1188} {"train_loss": -5.704416275024414, "global_step": 49898, "epoch": 1188} {"train_loss": -5.841556549072266, "global_step": 49899, "epoch": 1188} {"train_loss": -5.888883590698242, "global_step": 49900, "epoch": 1188} {"train_loss": -5.783175468444824, "global_step": 49901, "epoch": 1188} {"train_loss": -5.950535774230957, "global_step": 49902, "epoch": 1188} {"train_loss": -5.71641731262207, "global_step": 49903, "epoch": 1188} {"train_loss": -5.808368682861328, "global_step": 49904, "epoch": 1188} {"train_loss": -5.717257499694824, "global_step": 49905, "epoch": 1188} {"train_loss": -5.765041828155518, "global_step": 49906, "epoch": 1188} {"train_loss": -5.749849796295166, "global_step": 49907, "epoch": 1188} {"train_loss": -5.754128456115723, "global_step": 49908, "epoch": 1188} {"train_loss": -5.85569953918457, "global_step": 49909, "epoch": 1188} {"train_loss": -5.824424743652344, "global_step": 49910, "epoch": 1188} {"train_loss": -5.689797878265381, "global_step": 49911, "epoch": 1188} {"train_loss": -5.793263912200928, "global_step": 49912, "epoch": 1188} {"train_loss": -5.736481666564941, "global_step": 49913, "epoch": 1188} {"train_loss": -5.654405117034912, "global_step": 49914, "epoch": 1188} {"train_loss": -5.739694595336914, "global_step": 49915, "epoch": 1188} {"train_loss": -5.682281017303467, "global_step": 49916, "epoch": 1188} {"train_loss": -5.729007720947266, "global_step": 49917, "epoch": 1188} {"train_loss": -5.712564468383789, "global_step": 49918, "epoch": 1188} {"train_loss": -5.8027520179748535, "global_step": 49919, "epoch": 1188} {"train_loss": -5.8089141845703125, "global_step": 49920, "epoch": 1188} {"train_loss": -5.812962532043457, "global_step": 49921, "epoch": 1188} {"train_loss": -5.684562683105469, "global_step": 49922, "epoch": 1188} {"train_loss": -5.792996406555176, "global_step": 49923, "epoch": 1188} {"train_loss": -5.6623992919921875, "global_step": 49924, "epoch": 1188} {"train_loss": -5.865081787109375, "global_step": 49925, "epoch": 1188} {"train_loss": -5.78453254699707, "global_step": 49926, "epoch": 1188} {"train_loss": -5.694390296936035, "global_step": 49927, "epoch": 1188} {"train_loss": -5.782846450805664, "global_step": 49928, "epoch": 1188} {"train_loss": -5.9287309646606445, "global_step": 49929, "epoch": 1188} {"train_loss": -5.706974983215332, "global_step": 49930, "epoch": 1188} {"train_loss": -5.781979560852051, "global_step": 49931, "epoch": 1188} {"train_loss": -5.855314254760742, "global_step": 49932, "epoch": 1188} {"train_loss": -5.758576393127441, "global_step": 49933, "epoch": 1188} {"train_loss": -5.85310173034668, "global_step": 49934, "epoch": 1188} {"train_loss": -5.622363567352295, "global_step": 49935, "epoch": 1188} {"train_loss": -5.864083290100098, "global_step": 49936, "epoch": 1188} {"train_loss": -5.773563884553456, "global_step": 49937, "epoch": 1188, "val_loss": 61676.7421875} {"train_loss": -5.827339172363281, "global_step": 49938, "epoch": 1189} {"train_loss": -5.731723785400391, "global_step": 49939, "epoch": 1189} {"train_loss": -5.707437992095947, "global_step": 49940, "epoch": 1189} {"train_loss": -5.76573371887207, "global_step": 49941, "epoch": 1189} {"train_loss": -5.840290546417236, "global_step": 49942, "epoch": 1189} {"train_loss": -5.761107921600342, "global_step": 49943, "epoch": 1189} {"train_loss": -5.753733158111572, "global_step": 49944, "epoch": 1189} {"train_loss": -5.753386497497559, "global_step": 49945, "epoch": 1189} {"train_loss": -5.773736000061035, "global_step": 49946, "epoch": 1189} {"train_loss": -5.8743896484375, "global_step": 49947, "epoch": 1189} {"train_loss": -5.880376815795898, "global_step": 49948, "epoch": 1189} {"train_loss": -5.850045680999756, "global_step": 49949, "epoch": 1189} {"train_loss": -5.818637847900391, "global_step": 49950, "epoch": 1189} {"train_loss": -5.669848918914795, "global_step": 49951, "epoch": 1189} {"train_loss": -5.88944149017334, "global_step": 49952, "epoch": 1189} {"train_loss": -5.837995529174805, "global_step": 49953, "epoch": 1189} {"train_loss": -5.7725396156311035, "global_step": 49954, "epoch": 1189} {"train_loss": -5.865605354309082, "global_step": 49955, "epoch": 1189} {"train_loss": -5.893619537353516, "global_step": 49956, "epoch": 1189} {"train_loss": -5.762185096740723, "global_step": 49957, "epoch": 1189} {"train_loss": -5.8344807624816895, "global_step": 49958, "epoch": 1189} {"train_loss": -5.768985748291016, "global_step": 49959, "epoch": 1189} {"train_loss": -5.7347636222839355, "global_step": 49960, "epoch": 1189} {"train_loss": -5.57395076751709, "global_step": 49961, "epoch": 1189} {"train_loss": -5.853234767913818, "global_step": 49962, "epoch": 1189} {"train_loss": -5.676203727722168, "global_step": 49963, "epoch": 1189} {"train_loss": -5.813499450683594, "global_step": 49964, "epoch": 1189} {"train_loss": -5.7779622077941895, "global_step": 49965, "epoch": 1189} {"train_loss": -5.891039848327637, "global_step": 49966, "epoch": 1189} {"train_loss": -5.682151794433594, "global_step": 49967, "epoch": 1189} {"train_loss": -5.743415355682373, "global_step": 49968, "epoch": 1189} {"train_loss": -5.718606948852539, "global_step": 49969, "epoch": 1189} {"train_loss": -5.667212009429932, "global_step": 49970, "epoch": 1189} {"train_loss": -5.659592628479004, "global_step": 49971, "epoch": 1189} {"train_loss": -5.679708480834961, "global_step": 49972, "epoch": 1189} {"train_loss": -5.795841217041016, "global_step": 49973, "epoch": 1189} {"train_loss": -5.81684684753418, "global_step": 49974, "epoch": 1189} {"train_loss": -5.73012638092041, "global_step": 49975, "epoch": 1189} {"train_loss": -5.662728309631348, "global_step": 49976, "epoch": 1189} {"train_loss": -5.769779205322266, "global_step": 49977, "epoch": 1189} {"train_loss": -5.706822395324707, "global_step": 49978, "epoch": 1189} {"train_loss": -5.772842566172282, "global_step": 49979, "epoch": 1189, "val_loss": 61702.4140625} {"train_loss": -5.7494120597839355, "global_step": 49980, "epoch": 1190} {"train_loss": -5.775524139404297, "global_step": 49981, "epoch": 1190} {"train_loss": -5.8268609046936035, "global_step": 49982, "epoch": 1190} {"train_loss": -5.8047194480896, "global_step": 49983, "epoch": 1190} {"train_loss": -5.78787899017334, "global_step": 49984, "epoch": 1190} {"train_loss": -5.770346641540527, "global_step": 49985, "epoch": 1190} {"train_loss": -5.701216697692871, "global_step": 49986, "epoch": 1190} {"train_loss": -5.8587493896484375, "global_step": 49987, "epoch": 1190} {"train_loss": -5.764739990234375, "global_step": 49988, "epoch": 1190} {"train_loss": -5.780597686767578, "global_step": 49989, "epoch": 1190} {"train_loss": -5.724734306335449, "global_step": 49990, "epoch": 1190} {"train_loss": -5.740228176116943, "global_step": 49991, "epoch": 1190} {"train_loss": -5.766490936279297, "global_step": 49992, "epoch": 1190} {"train_loss": -5.755979537963867, "global_step": 49993, "epoch": 1190} {"train_loss": -5.828191757202148, "global_step": 49994, "epoch": 1190} {"train_loss": -5.797383785247803, "global_step": 49995, "epoch": 1190} {"train_loss": -5.856935024261475, "global_step": 49996, "epoch": 1190} {"train_loss": -5.6911163330078125, "global_step": 49997, "epoch": 1190} {"train_loss": -5.863948822021484, "global_step": 49998, "epoch": 1190} {"train_loss": -5.738515853881836, "global_step": 49999, "epoch": 1190} {"train_loss": -5.780041694641113, "global_step": 50000, "epoch": 1190} {"train_loss": -5.84576940536499, "global_step": 50001, "epoch": 1190} {"train_loss": -5.651615142822266, "global_step": 50002, "epoch": 1190} {"train_loss": -5.714695453643799, "global_step": 50003, "epoch": 1190} {"train_loss": -5.8306450843811035, "global_step": 50004, "epoch": 1190} {"train_loss": -5.787624359130859, "global_step": 50005, "epoch": 1190} {"train_loss": -5.820136070251465, "global_step": 50006, "epoch": 1190} {"train_loss": -5.837062835693359, "global_step": 50007, "epoch": 1190} {"train_loss": -5.761589527130127, "global_step": 50008, "epoch": 1190} {"train_loss": -5.934852600097656, "global_step": 50009, "epoch": 1190} {"train_loss": -5.721445083618164, "global_step": 50010, "epoch": 1190} {"train_loss": -5.817626953125, "global_step": 50011, "epoch": 1190} {"train_loss": -5.741859436035156, "global_step": 50012, "epoch": 1190} {"train_loss": -5.8279571533203125, "global_step": 50013, "epoch": 1190} {"train_loss": -5.848609924316406, "global_step": 50014, "epoch": 1190} {"train_loss": -5.66241455078125, "global_step": 50015, "epoch": 1190} {"train_loss": -5.787047386169434, "global_step": 50016, "epoch": 1190} {"train_loss": -5.793496131896973, "global_step": 50017, "epoch": 1190} {"train_loss": -5.777342796325684, "global_step": 50018, "epoch": 1190} {"train_loss": -5.882354259490967, "global_step": 50019, "epoch": 1190} {"train_loss": -5.696933746337891, "global_step": 50020, "epoch": 1190} {"train_loss": -5.782745225088937, "global_step": 50021, "epoch": 1190, "val_loss": 61637.26953125} {"train_loss": -5.693375587463379, "global_step": 50022, "epoch": 1191} {"train_loss": -5.725586414337158, "global_step": 50023, "epoch": 1191} {"train_loss": -5.718215465545654, "global_step": 50024, "epoch": 1191} {"train_loss": -5.795010089874268, "global_step": 50025, "epoch": 1191} {"train_loss": -5.651119709014893, "global_step": 50026, "epoch": 1191} {"train_loss": -5.82285213470459, "global_step": 50027, "epoch": 1191} {"train_loss": -5.776090621948242, "global_step": 50028, "epoch": 1191} {"train_loss": -5.781630039215088, "global_step": 50029, "epoch": 1191} {"train_loss": -5.81396484375, "global_step": 50030, "epoch": 1191} {"train_loss": -5.717340469360352, "global_step": 50031, "epoch": 1191} {"train_loss": -5.8072004318237305, "global_step": 50032, "epoch": 1191} {"train_loss": -5.721147537231445, "global_step": 50033, "epoch": 1191} {"train_loss": -5.738295555114746, "global_step": 50034, "epoch": 1191} {"train_loss": -5.8109283447265625, "global_step": 50035, "epoch": 1191} {"train_loss": -5.7286376953125, "global_step": 50036, "epoch": 1191} {"train_loss": -5.731833457946777, "global_step": 50037, "epoch": 1191} {"train_loss": -5.85960578918457, "global_step": 50038, "epoch": 1191} {"train_loss": -5.83821964263916, "global_step": 50039, "epoch": 1191} {"train_loss": -5.792691707611084, "global_step": 50040, "epoch": 1191} {"train_loss": -5.850240707397461, "global_step": 50041, "epoch": 1191} {"train_loss": -5.683369159698486, "global_step": 50042, "epoch": 1191} {"train_loss": -5.703621864318848, "global_step": 50043, "epoch": 1191} {"train_loss": -5.763757705688477, "global_step": 50044, "epoch": 1191} {"train_loss": -5.819342613220215, "global_step": 50045, "epoch": 1191} {"train_loss": -5.764013767242432, "global_step": 50046, "epoch": 1191} {"train_loss": -5.7478837966918945, "global_step": 50047, "epoch": 1191} {"train_loss": -5.756862640380859, "global_step": 50048, "epoch": 1191} {"train_loss": -5.750365257263184, "global_step": 50049, "epoch": 1191} {"train_loss": -5.853529930114746, "global_step": 50050, "epoch": 1191} {"train_loss": -5.885432243347168, "global_step": 50051, "epoch": 1191} {"train_loss": -5.758753776550293, "global_step": 50052, "epoch": 1191} {"train_loss": -5.790136337280273, "global_step": 50053, "epoch": 1191} {"train_loss": -5.787168502807617, "global_step": 50054, "epoch": 1191} {"train_loss": -5.595855712890625, "global_step": 50055, "epoch": 1191} {"train_loss": -5.794386863708496, "global_step": 50056, "epoch": 1191} {"train_loss": -5.8938889503479, "global_step": 50057, "epoch": 1191} {"train_loss": -5.811891555786133, "global_step": 50058, "epoch": 1191} {"train_loss": -5.677679061889648, "global_step": 50059, "epoch": 1191} {"train_loss": -5.9117350578308105, "global_step": 50060, "epoch": 1191} {"train_loss": -5.844204902648926, "global_step": 50061, "epoch": 1191} {"train_loss": -5.855388164520264, "global_step": 50062, "epoch": 1191} {"train_loss": -5.77458888008481, "global_step": 50063, "epoch": 1191, "val_loss": 61314.46875} {"train_loss": -5.86057710647583, "global_step": 50064, "epoch": 1192} {"train_loss": -5.762387275695801, "global_step": 50065, "epoch": 1192} {"train_loss": -5.801848411560059, "global_step": 50066, "epoch": 1192} {"train_loss": -5.7278733253479, "global_step": 50067, "epoch": 1192} {"train_loss": -5.755696773529053, "global_step": 50068, "epoch": 1192} {"train_loss": -5.847333908081055, "global_step": 50069, "epoch": 1192} {"train_loss": -5.783351898193359, "global_step": 50070, "epoch": 1192} {"train_loss": -5.891186714172363, "global_step": 50071, "epoch": 1192} {"train_loss": -5.654938220977783, "global_step": 50072, "epoch": 1192} {"train_loss": -5.664178371429443, "global_step": 50073, "epoch": 1192} {"train_loss": -5.8088908195495605, "global_step": 50074, "epoch": 1192} {"train_loss": -5.704348087310791, "global_step": 50075, "epoch": 1192} {"train_loss": -5.930281162261963, "global_step": 50076, "epoch": 1192} {"train_loss": -5.860962867736816, "global_step": 50077, "epoch": 1192} {"train_loss": -5.76732873916626, "global_step": 50078, "epoch": 1192} {"train_loss": -5.707340717315674, "global_step": 50079, "epoch": 1192} {"train_loss": -5.7701849937438965, "global_step": 50080, "epoch": 1192} {"train_loss": -5.725338935852051, "global_step": 50081, "epoch": 1192} {"train_loss": -5.66580867767334, "global_step": 50082, "epoch": 1192} {"train_loss": -5.737191200256348, "global_step": 50083, "epoch": 1192} {"train_loss": -5.760644435882568, "global_step": 50084, "epoch": 1192} {"train_loss": -5.824204921722412, "global_step": 50085, "epoch": 1192} {"train_loss": -5.823487281799316, "global_step": 50086, "epoch": 1192} {"train_loss": -5.694261074066162, "global_step": 50087, "epoch": 1192} {"train_loss": -5.7237653732299805, "global_step": 50088, "epoch": 1192} {"train_loss": -5.753257751464844, "global_step": 50089, "epoch": 1192} {"train_loss": -5.920583724975586, "global_step": 50090, "epoch": 1192} {"train_loss": -5.854719161987305, "global_step": 50091, "epoch": 1192} {"train_loss": -5.934530258178711, "global_step": 50092, "epoch": 1192} {"train_loss": -5.713001251220703, "global_step": 50093, "epoch": 1192} {"train_loss": -5.811208248138428, "global_step": 50094, "epoch": 1192} {"train_loss": -5.719758987426758, "global_step": 50095, "epoch": 1192} {"train_loss": -5.800436019897461, "global_step": 50096, "epoch": 1192} {"train_loss": -5.754934787750244, "global_step": 50097, "epoch": 1192} {"train_loss": -5.794136047363281, "global_step": 50098, "epoch": 1192} {"train_loss": -5.872771263122559, "global_step": 50099, "epoch": 1192} {"train_loss": -5.890307426452637, "global_step": 50100, "epoch": 1192} {"train_loss": -5.828677177429199, "global_step": 50101, "epoch": 1192} {"train_loss": -5.739969253540039, "global_step": 50102, "epoch": 1192} {"train_loss": -5.746255397796631, "global_step": 50103, "epoch": 1192} {"train_loss": -5.790021896362305, "global_step": 50104, "epoch": 1192} {"train_loss": -5.781396082469395, "global_step": 50105, "epoch": 1192, "val_loss": 61422.83984375} {"train_loss": -5.69296932220459, "global_step": 50106, "epoch": 1193} {"train_loss": -5.8420023918151855, "global_step": 50107, "epoch": 1193} {"train_loss": -5.7732133865356445, "global_step": 50108, "epoch": 1193} {"train_loss": -5.789252281188965, "global_step": 50109, "epoch": 1193} {"train_loss": -5.802553176879883, "global_step": 50110, "epoch": 1193} {"train_loss": -5.900970458984375, "global_step": 50111, "epoch": 1193} {"train_loss": -5.720731735229492, "global_step": 50112, "epoch": 1193} {"train_loss": -5.726941108703613, "global_step": 50113, "epoch": 1193} {"train_loss": -5.74815559387207, "global_step": 50114, "epoch": 1193} {"train_loss": -5.853655815124512, "global_step": 50115, "epoch": 1193} {"train_loss": -5.596192359924316, "global_step": 50116, "epoch": 1193} {"train_loss": -5.792988300323486, "global_step": 50117, "epoch": 1193} {"train_loss": -5.819599151611328, "global_step": 50118, "epoch": 1193} {"train_loss": -5.780457973480225, "global_step": 50119, "epoch": 1193} {"train_loss": -5.784714698791504, "global_step": 50120, "epoch": 1193} {"train_loss": -5.934689998626709, "global_step": 50121, "epoch": 1193} {"train_loss": -5.750537395477295, "global_step": 50122, "epoch": 1193} {"train_loss": -5.813581466674805, "global_step": 50123, "epoch": 1193} {"train_loss": -5.679258823394775, "global_step": 50124, "epoch": 1193} {"train_loss": -5.767004013061523, "global_step": 50125, "epoch": 1193} {"train_loss": -5.92328405380249, "global_step": 50126, "epoch": 1193} {"train_loss": -5.6105523109436035, "global_step": 50127, "epoch": 1193} {"train_loss": -5.805549144744873, "global_step": 50128, "epoch": 1193} {"train_loss": -5.731320381164551, "global_step": 50129, "epoch": 1193} {"train_loss": -5.583765029907227, "global_step": 50130, "epoch": 1193} {"train_loss": -5.8852152824401855, "global_step": 50131, "epoch": 1193} {"train_loss": -5.762270450592041, "global_step": 50132, "epoch": 1193} {"train_loss": -5.775932312011719, "global_step": 50133, "epoch": 1193} {"train_loss": -5.807924270629883, "global_step": 50134, "epoch": 1193} {"train_loss": -5.709515571594238, "global_step": 50135, "epoch": 1193} {"train_loss": -5.760766983032227, "global_step": 50136, "epoch": 1193} {"train_loss": -5.712554931640625, "global_step": 50137, "epoch": 1193} {"train_loss": -5.760702133178711, "global_step": 50138, "epoch": 1193} {"train_loss": -5.831188201904297, "global_step": 50139, "epoch": 1193} {"train_loss": -5.770224571228027, "global_step": 50140, "epoch": 1193} {"train_loss": -5.758390426635742, "global_step": 50141, "epoch": 1193} {"train_loss": -5.85668420791626, "global_step": 50142, "epoch": 1193} {"train_loss": -5.85103702545166, "global_step": 50143, "epoch": 1193} {"train_loss": -5.662979602813721, "global_step": 50144, "epoch": 1193} {"train_loss": -5.846512794494629, "global_step": 50145, "epoch": 1193} {"train_loss": -5.807596206665039, "global_step": 50146, "epoch": 1193} {"train_loss": -5.773514214016142, "global_step": 50147, "epoch": 1193, "val_loss": 61323.203125} {"train_loss": -5.869706153869629, "global_step": 50148, "epoch": 1194} {"train_loss": -5.779373645782471, "global_step": 50149, "epoch": 1194} {"train_loss": -5.778180122375488, "global_step": 50150, "epoch": 1194} {"train_loss": -5.891904830932617, "global_step": 50151, "epoch": 1194} {"train_loss": -5.864204406738281, "global_step": 50152, "epoch": 1194} {"train_loss": -5.7849531173706055, "global_step": 50153, "epoch": 1194} {"train_loss": -5.732776165008545, "global_step": 50154, "epoch": 1194} {"train_loss": -5.735750198364258, "global_step": 50155, "epoch": 1194} {"train_loss": -5.868803977966309, "global_step": 50156, "epoch": 1194} {"train_loss": -5.694183826446533, "global_step": 50157, "epoch": 1194} {"train_loss": -5.735866546630859, "global_step": 50158, "epoch": 1194} {"train_loss": -5.7162556648254395, "global_step": 50159, "epoch": 1194} {"train_loss": -5.778785705566406, "global_step": 50160, "epoch": 1194} {"train_loss": -5.744046211242676, "global_step": 50161, "epoch": 1194} {"train_loss": -5.79909610748291, "global_step": 50162, "epoch": 1194} {"train_loss": -5.853738307952881, "global_step": 50163, "epoch": 1194} {"train_loss": -5.73625373840332, "global_step": 50164, "epoch": 1194} {"train_loss": -5.777448654174805, "global_step": 50165, "epoch": 1194} {"train_loss": -5.717763900756836, "global_step": 50166, "epoch": 1194} {"train_loss": -5.707180976867676, "global_step": 50167, "epoch": 1194} {"train_loss": -5.801971912384033, "global_step": 50168, "epoch": 1194} {"train_loss": -5.813872337341309, "global_step": 50169, "epoch": 1194} {"train_loss": -5.760043144226074, "global_step": 50170, "epoch": 1194} {"train_loss": -5.739086151123047, "global_step": 50171, "epoch": 1194} {"train_loss": -5.796684265136719, "global_step": 50172, "epoch": 1194} {"train_loss": -5.809935092926025, "global_step": 50173, "epoch": 1194} {"train_loss": -5.790585994720459, "global_step": 50174, "epoch": 1194} {"train_loss": -5.675703525543213, "global_step": 50175, "epoch": 1194} {"train_loss": -5.783258438110352, "global_step": 50176, "epoch": 1194} {"train_loss": -5.787467002868652, "global_step": 50177, "epoch": 1194} {"train_loss": -5.776798248291016, "global_step": 50178, "epoch": 1194} {"train_loss": -5.932169437408447, "global_step": 50179, "epoch": 1194} {"train_loss": -5.821117401123047, "global_step": 50180, "epoch": 1194} {"train_loss": -5.731968879699707, "global_step": 50181, "epoch": 1194} {"train_loss": -5.799875259399414, "global_step": 50182, "epoch": 1194} {"train_loss": -5.799567222595215, "global_step": 50183, "epoch": 1194} {"train_loss": -5.875619888305664, "global_step": 50184, "epoch": 1194} {"train_loss": -5.636109352111816, "global_step": 50185, "epoch": 1194} {"train_loss": -5.783367156982422, "global_step": 50186, "epoch": 1194} {"train_loss": -5.68601131439209, "global_step": 50187, "epoch": 1194} {"train_loss": -5.72781229019165, "global_step": 50188, "epoch": 1194} {"train_loss": -5.777651900336856, "global_step": 50189, "epoch": 1194, "val_loss": 61640.45703125} {"train_loss": -5.716817855834961, "global_step": 50190, "epoch": 1195} {"train_loss": -5.893472671508789, "global_step": 50191, "epoch": 1195} {"train_loss": -5.895906925201416, "global_step": 50192, "epoch": 1195} {"train_loss": -5.782523155212402, "global_step": 50193, "epoch": 1195} {"train_loss": -5.78143310546875, "global_step": 50194, "epoch": 1195} {"train_loss": -5.795876979827881, "global_step": 50195, "epoch": 1195} {"train_loss": -5.677022933959961, "global_step": 50196, "epoch": 1195} {"train_loss": -5.660561561584473, "global_step": 50197, "epoch": 1195} {"train_loss": -5.800933837890625, "global_step": 50198, "epoch": 1195} {"train_loss": -5.8445000648498535, "global_step": 50199, "epoch": 1195} {"train_loss": -5.765654563903809, "global_step": 50200, "epoch": 1195} {"train_loss": -5.65341329574585, "global_step": 50201, "epoch": 1195} {"train_loss": -5.835267066955566, "global_step": 50202, "epoch": 1195} {"train_loss": -5.718222618103027, "global_step": 50203, "epoch": 1195} {"train_loss": -5.697850704193115, "global_step": 50204, "epoch": 1195} {"train_loss": -5.776538372039795, "global_step": 50205, "epoch": 1195} {"train_loss": -5.710904121398926, "global_step": 50206, "epoch": 1195} {"train_loss": -5.835569381713867, "global_step": 50207, "epoch": 1195} {"train_loss": -5.724040985107422, "global_step": 50208, "epoch": 1195} {"train_loss": -5.855190753936768, "global_step": 50209, "epoch": 1195} {"train_loss": -5.7754693031311035, "global_step": 50210, "epoch": 1195} {"train_loss": -5.720156669616699, "global_step": 50211, "epoch": 1195} {"train_loss": -5.659826278686523, "global_step": 50212, "epoch": 1195} {"train_loss": -5.7642951011657715, "global_step": 50213, "epoch": 1195} {"train_loss": -5.817331314086914, "global_step": 50214, "epoch": 1195} {"train_loss": -5.685885429382324, "global_step": 50215, "epoch": 1195} {"train_loss": -5.918953895568848, "global_step": 50216, "epoch": 1195} {"train_loss": -5.845552444458008, "global_step": 50217, "epoch": 1195} {"train_loss": -5.860273361206055, "global_step": 50218, "epoch": 1195} {"train_loss": -5.663939476013184, "global_step": 50219, "epoch": 1195} {"train_loss": -5.82997989654541, "global_step": 50220, "epoch": 1195} {"train_loss": -5.715752601623535, "global_step": 50221, "epoch": 1195} {"train_loss": -5.860657691955566, "global_step": 50222, "epoch": 1195} {"train_loss": -5.8719892501831055, "global_step": 50223, "epoch": 1195} {"train_loss": -5.762508869171143, "global_step": 50224, "epoch": 1195} {"train_loss": -5.810451984405518, "global_step": 50225, "epoch": 1195} {"train_loss": -5.7520318031311035, "global_step": 50226, "epoch": 1195} {"train_loss": -5.894558906555176, "global_step": 50227, "epoch": 1195} {"train_loss": -5.7084245681762695, "global_step": 50228, "epoch": 1195} {"train_loss": -5.81892204284668, "global_step": 50229, "epoch": 1195} {"train_loss": -5.865332126617432, "global_step": 50230, "epoch": 1195} {"train_loss": -5.780579067411876, "global_step": 50231, "epoch": 1195, "val_loss": 61492.7109375} {"train_loss": -5.883091926574707, "global_step": 50232, "epoch": 1196} {"train_loss": -5.760135650634766, "global_step": 50233, "epoch": 1196} {"train_loss": -5.793705940246582, "global_step": 50234, "epoch": 1196} {"train_loss": -5.7490644454956055, "global_step": 50235, "epoch": 1196} {"train_loss": -5.813580513000488, "global_step": 50236, "epoch": 1196} {"train_loss": -5.799882411956787, "global_step": 50237, "epoch": 1196} {"train_loss": -5.801367282867432, "global_step": 50238, "epoch": 1196} {"train_loss": -5.574965000152588, "global_step": 50239, "epoch": 1196} {"train_loss": -5.781216621398926, "global_step": 50240, "epoch": 1196} {"train_loss": -5.774089336395264, "global_step": 50241, "epoch": 1196} {"train_loss": -5.750398635864258, "global_step": 50242, "epoch": 1196} {"train_loss": -5.74011754989624, "global_step": 50243, "epoch": 1196} {"train_loss": -5.760688781738281, "global_step": 50244, "epoch": 1196} {"train_loss": -5.705825328826904, "global_step": 50245, "epoch": 1196} {"train_loss": -5.8810834884643555, "global_step": 50246, "epoch": 1196} {"train_loss": -5.740348815917969, "global_step": 50247, "epoch": 1196} {"train_loss": -5.749837875366211, "global_step": 50248, "epoch": 1196} {"train_loss": -5.837854385375977, "global_step": 50249, "epoch": 1196} {"train_loss": -5.6972246170043945, "global_step": 50250, "epoch": 1196} {"train_loss": -5.834508895874023, "global_step": 50251, "epoch": 1196} {"train_loss": -5.822262763977051, "global_step": 50252, "epoch": 1196} {"train_loss": -5.846076011657715, "global_step": 50253, "epoch": 1196} {"train_loss": -5.750934600830078, "global_step": 50254, "epoch": 1196} {"train_loss": -5.824712753295898, "global_step": 50255, "epoch": 1196} {"train_loss": -5.826573371887207, "global_step": 50256, "epoch": 1196} {"train_loss": -5.857501983642578, "global_step": 50257, "epoch": 1196} {"train_loss": -5.961877822875977, "global_step": 50258, "epoch": 1196} {"train_loss": -5.703685283660889, "global_step": 50259, "epoch": 1196} {"train_loss": -5.838179111480713, "global_step": 50260, "epoch": 1196} {"train_loss": -5.869359970092773, "global_step": 50261, "epoch": 1196} {"train_loss": -5.847205638885498, "global_step": 50262, "epoch": 1196} {"train_loss": -5.776910305023193, "global_step": 50263, "epoch": 1196} {"train_loss": -5.851578712463379, "global_step": 50264, "epoch": 1196} {"train_loss": -5.882178783416748, "global_step": 50265, "epoch": 1196} {"train_loss": -5.889143943786621, "global_step": 50266, "epoch": 1196} {"train_loss": -5.886054515838623, "global_step": 50267, "epoch": 1196} {"train_loss": -5.822608947753906, "global_step": 50268, "epoch": 1196} {"train_loss": -5.839908123016357, "global_step": 50269, "epoch": 1196} {"train_loss": -5.771452903747559, "global_step": 50270, "epoch": 1196} {"train_loss": -5.728724479675293, "global_step": 50271, "epoch": 1196} {"train_loss": -5.781760215759277, "global_step": 50272, "epoch": 1196} {"train_loss": -5.798601695469448, "global_step": 50273, "epoch": 1196, "val_loss": 61773.046875} {"train_loss": -5.873763084411621, "global_step": 50274, "epoch": 1197} {"train_loss": -5.812522888183594, "global_step": 50275, "epoch": 1197} {"train_loss": -5.805288314819336, "global_step": 50276, "epoch": 1197} {"train_loss": -5.855788230895996, "global_step": 50277, "epoch": 1197} {"train_loss": -5.707169532775879, "global_step": 50278, "epoch": 1197} {"train_loss": -5.790465354919434, "global_step": 50279, "epoch": 1197} {"train_loss": -5.803610801696777, "global_step": 50280, "epoch": 1197} {"train_loss": -5.793451309204102, "global_step": 50281, "epoch": 1197} {"train_loss": -5.781365394592285, "global_step": 50282, "epoch": 1197} {"train_loss": -5.604987144470215, "global_step": 50283, "epoch": 1197} {"train_loss": -5.813084602355957, "global_step": 50284, "epoch": 1197} {"train_loss": -5.866087913513184, "global_step": 50285, "epoch": 1197} {"train_loss": -5.7187652587890625, "global_step": 50286, "epoch": 1197} {"train_loss": -5.766956329345703, "global_step": 50287, "epoch": 1197} {"train_loss": -5.766110420227051, "global_step": 50288, "epoch": 1197} {"train_loss": -5.774481773376465, "global_step": 50289, "epoch": 1197} {"train_loss": -5.72304105758667, "global_step": 50290, "epoch": 1197} {"train_loss": -5.566339015960693, "global_step": 50291, "epoch": 1197} {"train_loss": -5.894143581390381, "global_step": 50292, "epoch": 1197} {"train_loss": -5.643398761749268, "global_step": 50293, "epoch": 1197} {"train_loss": -5.781904220581055, "global_step": 50294, "epoch": 1197} {"train_loss": -5.626496315002441, "global_step": 50295, "epoch": 1197} {"train_loss": -5.707976341247559, "global_step": 50296, "epoch": 1197} {"train_loss": -5.75827693939209, "global_step": 50297, "epoch": 1197} {"train_loss": -5.582244873046875, "global_step": 50298, "epoch": 1197} {"train_loss": -5.686871528625488, "global_step": 50299, "epoch": 1197} {"train_loss": -5.706599235534668, "global_step": 50300, "epoch": 1197} {"train_loss": -5.964509010314941, "global_step": 50301, "epoch": 1197} {"train_loss": -5.637455940246582, "global_step": 50302, "epoch": 1197} {"train_loss": -5.721767425537109, "global_step": 50303, "epoch": 1197} {"train_loss": -5.535699844360352, "global_step": 50304, "epoch": 1197} {"train_loss": -5.684823989868164, "global_step": 50305, "epoch": 1197} {"train_loss": -5.649642467498779, "global_step": 50306, "epoch": 1197} {"train_loss": -5.691704750061035, "global_step": 50307, "epoch": 1197} {"train_loss": -5.680595874786377, "global_step": 50308, "epoch": 1197} {"train_loss": -5.677653789520264, "global_step": 50309, "epoch": 1197} {"train_loss": -5.675739288330078, "global_step": 50310, "epoch": 1197} {"train_loss": -5.727954864501953, "global_step": 50311, "epoch": 1197} {"train_loss": -5.619351863861084, "global_step": 50312, "epoch": 1197} {"train_loss": -5.817127227783203, "global_step": 50313, "epoch": 1197} {"train_loss": -5.663774490356445, "global_step": 50314, "epoch": 1197} {"train_loss": -5.7305745624360585, "global_step": 50315, "epoch": 1197, "val_loss": 61779.3359375} {"train_loss": -5.782967567443848, "global_step": 50316, "epoch": 1198} {"train_loss": -5.760296821594238, "global_step": 50317, "epoch": 1198} {"train_loss": -5.773937225341797, "global_step": 50318, "epoch": 1198} {"train_loss": -5.621902942657471, "global_step": 50319, "epoch": 1198} {"train_loss": -5.822805404663086, "global_step": 50320, "epoch": 1198} {"train_loss": -5.717584609985352, "global_step": 50321, "epoch": 1198} {"train_loss": -5.693675994873047, "global_step": 50322, "epoch": 1198} {"train_loss": -5.757610321044922, "global_step": 50323, "epoch": 1198} {"train_loss": -5.768112659454346, "global_step": 50324, "epoch": 1198} {"train_loss": -5.8278913497924805, "global_step": 50325, "epoch": 1198} {"train_loss": -5.727394104003906, "global_step": 50326, "epoch": 1198} {"train_loss": -5.810819149017334, "global_step": 50327, "epoch": 1198} {"train_loss": -5.730740070343018, "global_step": 50328, "epoch": 1198} {"train_loss": -5.855257987976074, "global_step": 50329, "epoch": 1198} {"train_loss": -5.787563323974609, "global_step": 50330, "epoch": 1198} {"train_loss": -5.786266326904297, "global_step": 50331, "epoch": 1198} {"train_loss": -5.730768203735352, "global_step": 50332, "epoch": 1198} {"train_loss": -5.705873966217041, "global_step": 50333, "epoch": 1198} {"train_loss": -5.731637954711914, "global_step": 50334, "epoch": 1198} {"train_loss": -5.8268351554870605, "global_step": 50335, "epoch": 1198} {"train_loss": -5.8882527351379395, "global_step": 50336, "epoch": 1198} {"train_loss": -5.814490795135498, "global_step": 50337, "epoch": 1198} {"train_loss": -5.862654685974121, "global_step": 50338, "epoch": 1198} {"train_loss": -5.872754096984863, "global_step": 50339, "epoch": 1198} {"train_loss": -5.786625862121582, "global_step": 50340, "epoch": 1198} {"train_loss": -5.761877059936523, "global_step": 50341, "epoch": 1198} {"train_loss": -5.934204578399658, "global_step": 50342, "epoch": 1198} {"train_loss": -5.78548526763916, "global_step": 50343, "epoch": 1198} {"train_loss": -5.664173603057861, "global_step": 50344, "epoch": 1198} {"train_loss": -5.822108268737793, "global_step": 50345, "epoch": 1198} {"train_loss": -5.837770462036133, "global_step": 50346, "epoch": 1198} {"train_loss": -5.780243396759033, "global_step": 50347, "epoch": 1198} {"train_loss": -5.9716081619262695, "global_step": 50348, "epoch": 1198} {"train_loss": -5.8323469161987305, "global_step": 50349, "epoch": 1198} {"train_loss": -5.82216739654541, "global_step": 50350, "epoch": 1198} {"train_loss": -5.839463710784912, "global_step": 50351, "epoch": 1198} {"train_loss": -5.817962169647217, "global_step": 50352, "epoch": 1198} {"train_loss": -5.706250190734863, "global_step": 50353, "epoch": 1198} {"train_loss": -5.702349662780762, "global_step": 50354, "epoch": 1198} {"train_loss": -5.834451198577881, "global_step": 50355, "epoch": 1198} {"train_loss": -5.709195137023926, "global_step": 50356, "epoch": 1198} {"train_loss": -5.792066358384632, "global_step": 50357, "epoch": 1198, "val_loss": 61703.64453125} {"train_loss": -5.799976825714111, "global_step": 50358, "epoch": 1199} {"train_loss": -5.7646379470825195, "global_step": 50359, "epoch": 1199} {"train_loss": -5.887438774108887, "global_step": 50360, "epoch": 1199} {"train_loss": -5.666635990142822, "global_step": 50361, "epoch": 1199} {"train_loss": -5.73545503616333, "global_step": 50362, "epoch": 1199} {"train_loss": -5.803000450134277, "global_step": 50363, "epoch": 1199} {"train_loss": -5.712131023406982, "global_step": 50364, "epoch": 1199} {"train_loss": -5.644258975982666, "global_step": 50365, "epoch": 1199} {"train_loss": -5.7002973556518555, "global_step": 50366, "epoch": 1199} {"train_loss": -5.707469463348389, "global_step": 50367, "epoch": 1199} {"train_loss": -5.836704254150391, "global_step": 50368, "epoch": 1199} {"train_loss": -5.6879119873046875, "global_step": 50369, "epoch": 1199} {"train_loss": -5.69364070892334, "global_step": 50370, "epoch": 1199} {"train_loss": -5.635502815246582, "global_step": 50371, "epoch": 1199} {"train_loss": -5.767928123474121, "global_step": 50372, "epoch": 1199} {"train_loss": -5.811887741088867, "global_step": 50373, "epoch": 1199} {"train_loss": -5.709795951843262, "global_step": 50374, "epoch": 1199} {"train_loss": -5.854392051696777, "global_step": 50375, "epoch": 1199} {"train_loss": -5.6648712158203125, "global_step": 50376, "epoch": 1199} {"train_loss": -5.761943817138672, "global_step": 50377, "epoch": 1199} {"train_loss": -5.8087005615234375, "global_step": 50378, "epoch": 1199} {"train_loss": -5.72709846496582, "global_step": 50379, "epoch": 1199} {"train_loss": -5.797385215759277, "global_step": 50380, "epoch": 1199} {"train_loss": -5.835941314697266, "global_step": 50381, "epoch": 1199} {"train_loss": -5.650628566741943, "global_step": 50382, "epoch": 1199} {"train_loss": -5.782798767089844, "global_step": 50383, "epoch": 1199} {"train_loss": -5.715169906616211, "global_step": 50384, "epoch": 1199} {"train_loss": -5.826750755310059, "global_step": 50385, "epoch": 1199} {"train_loss": -5.809521675109863, "global_step": 50386, "epoch": 1199} {"train_loss": -5.7589898109436035, "global_step": 50387, "epoch": 1199} {"train_loss": -5.824843406677246, "global_step": 50388, "epoch": 1199} {"train_loss": -5.65300989151001, "global_step": 50389, "epoch": 1199} {"train_loss": -5.770418167114258, "global_step": 50390, "epoch": 1199} {"train_loss": -5.890124320983887, "global_step": 50391, "epoch": 1199} {"train_loss": -5.694226264953613, "global_step": 50392, "epoch": 1199} {"train_loss": -5.846931457519531, "global_step": 50393, "epoch": 1199} {"train_loss": -5.902163505554199, "global_step": 50394, "epoch": 1199} {"train_loss": -5.7921648025512695, "global_step": 50395, "epoch": 1199} {"train_loss": -5.744088172912598, "global_step": 50396, "epoch": 1199} {"train_loss": -5.816864967346191, "global_step": 50397, "epoch": 1199} {"train_loss": -5.787303924560547, "global_step": 50398, "epoch": 1199} {"train_loss": -5.765170256296794, "global_step": 50399, "epoch": 1199, "val_loss": 61346.4921875} {"train_loss": -5.774378776550293, "global_step": 50400, "epoch": 1200} {"train_loss": -5.9596710205078125, "global_step": 50401, "epoch": 1200} {"train_loss": -5.830723285675049, "global_step": 50402, "epoch": 1200} {"train_loss": -5.671257972717285, "global_step": 50403, "epoch": 1200} {"train_loss": -5.7873406410217285, "global_step": 50404, "epoch": 1200} {"train_loss": -5.760893821716309, "global_step": 50405, "epoch": 1200} {"train_loss": -5.792487144470215, "global_step": 50406, "epoch": 1200} {"train_loss": -5.7366461753845215, "global_step": 50407, "epoch": 1200} {"train_loss": -5.861774444580078, "global_step": 50408, "epoch": 1200} {"train_loss": -5.730792999267578, "global_step": 50409, "epoch": 1200} {"train_loss": -5.730422019958496, "global_step": 50410, "epoch": 1200} {"train_loss": -5.783297538757324, "global_step": 50411, "epoch": 1200} {"train_loss": -5.716254234313965, "global_step": 50412, "epoch": 1200} {"train_loss": -5.743687152862549, "global_step": 50413, "epoch": 1200} {"train_loss": -5.643149375915527, "global_step": 50414, "epoch": 1200} {"train_loss": -5.778502464294434, "global_step": 50415, "epoch": 1200} {"train_loss": -5.7034196853637695, "global_step": 50416, "epoch": 1200} {"train_loss": -5.7934417724609375, "global_step": 50417, "epoch": 1200} {"train_loss": -5.763260364532471, "global_step": 50418, "epoch": 1200} {"train_loss": -5.714045524597168, "global_step": 50419, "epoch": 1200} {"train_loss": -5.746490478515625, "global_step": 50420, "epoch": 1200} {"train_loss": -5.740184307098389, "global_step": 50421, "epoch": 1200} {"train_loss": -5.775242805480957, "global_step": 50422, "epoch": 1200} {"train_loss": -5.702742576599121, "global_step": 50423, "epoch": 1200} {"train_loss": -5.757773399353027, "global_step": 50424, "epoch": 1200} {"train_loss": -5.793259620666504, "global_step": 50425, "epoch": 1200} {"train_loss": -5.732524871826172, "global_step": 50426, "epoch": 1200} {"train_loss": -5.91065788269043, "global_step": 50427, "epoch": 1200} {"train_loss": -5.8484883308410645, "global_step": 50428, "epoch": 1200} {"train_loss": -5.663497447967529, "global_step": 50429, "epoch": 1200} {"train_loss": -5.852219581604004, "global_step": 50430, "epoch": 1200} {"train_loss": -5.833085060119629, "global_step": 50431, "epoch": 1200} {"train_loss": -5.848980903625488, "global_step": 50432, "epoch": 1200} {"train_loss": -5.793241500854492, "global_step": 50433, "epoch": 1200} {"train_loss": -5.785051345825195, "global_step": 50434, "epoch": 1200} {"train_loss": -5.76692008972168, "global_step": 50435, "epoch": 1200} {"train_loss": -5.928668022155762, "global_step": 50436, "epoch": 1200} {"train_loss": -5.762706279754639, "global_step": 50437, "epoch": 1200} {"train_loss": -5.893774509429932, "global_step": 50438, "epoch": 1200} {"train_loss": -5.898207664489746, "global_step": 50439, "epoch": 1200} {"train_loss": -5.829090118408203, "global_step": 50440, "epoch": 1200} {"train_loss": -5.782816092173259, "global_step": 50441, "epoch": 1200, "train/sim_max_reward_0": 0.33140725414086303, "train/sim_max_reward_1": 0.2260794211255808, "train/sim_max_reward_2": 0.6127327989868877, "train/sim_max_reward_3": 0.8215342955978419, "train/sim_max_reward_4": 0.8568385699847474, "train/sim_max_reward_5": 0.9365408421170682, "test/sim_max_reward_4300000": 0.7862143600867801, "test/sim_max_reward_4300001": 0.38069356492682893, "test/sim_max_reward_4300002": 0.7596307844940168, "test/sim_max_reward_4300003": 0.8208549060244008, "test/sim_max_reward_4300004": 0.8686048568267182, "test/sim_max_reward_4300005": 0.4357808508254789, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.36059411579828854, "test/sim_max_reward_4300008": 0.4494146610582245, "test/sim_max_reward_4300009": 0.7712368024477027, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9250275403610599, "test/sim_max_reward_4300012": 0.7397841478351629, "test/sim_max_reward_4300013": 0.740917459333516, "test/sim_max_reward_4300014": 0.8295197939910286, "test/sim_max_reward_4300015": 0.9198722805993667, "test/sim_max_reward_4300016": 0.9558283377744127, "test/sim_max_reward_4300017": 0.9060677618759717, "test/sim_max_reward_4300018": 0.9483813311910809, "test/sim_max_reward_4300019": 0.1863267178723507, "test/sim_max_reward_4300020": 0.3498476698453855, "test/sim_max_reward_4300021": 0.9353559922881424, "test/sim_max_reward_4300022": 0.2613454453718299, "test/sim_max_reward_4300023": 0.35104678543097523, "test/sim_max_reward_4300024": 0.05525926941138335, "test/sim_max_reward_4300025": 0.7706548171620429, "test/sim_max_reward_4300026": 0.31794268716321455, "test/sim_max_reward_4300027": 0.7543633310307192, "test/sim_max_reward_4300028": 0.9215766982664906, "test/sim_max_reward_4300029": 0.13334208473800294, "test/sim_max_reward_4300030": 0.6764814268234597, "test/sim_max_reward_4300031": 0.2210575449834234, "test/sim_max_reward_4300032": 0.8763360507809514, "test/sim_max_reward_4300033": 0.9036030704142207, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.5882079830284702, "test/sim_max_reward_4300038": 0.731111105480226, "test/sim_max_reward_4300039": 0.8683934328759195, "test/sim_max_reward_4300040": 0.29041113503827454, "test/sim_max_reward_4300041": 0.983945367573213, "test/sim_max_reward_4300042": 0.542042201445611, "test/sim_max_reward_4300043": 0.16283120274679064, "test/sim_max_reward_4300044": 0.829693872996062, "test/sim_max_reward_4300045": 0.1624699530825434, "test/sim_max_reward_4300046": 0.6762555047192073, "test/sim_max_reward_4300047": 0.8719164698867621, "test/sim_max_reward_4300048": 0.8764008868748325, "test/sim_max_reward_4300049": 0.0010398229175116742, "train/mean_score": 0.6308555303254982, "test/mean_score": 0.5619375240252308, "val_loss": 61271.1875} {"train_loss": -5.835379123687744, "global_step": 50442, "epoch": 1201} {"train_loss": -5.745862007141113, "global_step": 50443, "epoch": 1201} {"train_loss": -5.824939727783203, "global_step": 50444, "epoch": 1201} {"train_loss": -5.790609359741211, "global_step": 50445, "epoch": 1201} {"train_loss": -5.678378105163574, "global_step": 50446, "epoch": 1201} {"train_loss": -5.849620819091797, "global_step": 50447, "epoch": 1201} {"train_loss": -5.824982643127441, "global_step": 50448, "epoch": 1201} {"train_loss": -5.820511341094971, "global_step": 50449, "epoch": 1201} {"train_loss": -5.845890045166016, "global_step": 50450, "epoch": 1201} {"train_loss": -5.848752498626709, "global_step": 50451, "epoch": 1201} {"train_loss": -5.803528308868408, "global_step": 50452, "epoch": 1201} {"train_loss": -5.802858829498291, "global_step": 50453, "epoch": 1201} {"train_loss": -5.842382907867432, "global_step": 50454, "epoch": 1201} {"train_loss": -5.942310333251953, "global_step": 50455, "epoch": 1201} {"train_loss": -5.878684997558594, "global_step": 50456, "epoch": 1201} {"train_loss": -5.868156909942627, "global_step": 50457, "epoch": 1201} {"train_loss": -5.7707061767578125, "global_step": 50458, "epoch": 1201} {"train_loss": -5.927496910095215, "global_step": 50459, "epoch": 1201} {"train_loss": -5.716731548309326, "global_step": 50460, "epoch": 1201} {"train_loss": -5.8088483810424805, "global_step": 50461, "epoch": 1201} {"train_loss": -5.864617347717285, "global_step": 50462, "epoch": 1201} {"train_loss": -5.752191543579102, "global_step": 50463, "epoch": 1201} {"train_loss": -5.796044826507568, "global_step": 50464, "epoch": 1201} {"train_loss": -5.816493034362793, "global_step": 50465, "epoch": 1201} {"train_loss": -5.886333465576172, "global_step": 50466, "epoch": 1201} {"train_loss": -5.828183650970459, "global_step": 50467, "epoch": 1201} {"train_loss": -5.666754722595215, "global_step": 50468, "epoch": 1201} {"train_loss": -5.790062427520752, "global_step": 50469, "epoch": 1201} {"train_loss": -5.849347114562988, "global_step": 50470, "epoch": 1201} {"train_loss": -5.845808506011963, "global_step": 50471, "epoch": 1201} {"train_loss": -5.815609455108643, "global_step": 50472, "epoch": 1201} {"train_loss": -5.70298957824707, "global_step": 50473, "epoch": 1201} {"train_loss": -5.765965461730957, "global_step": 50474, "epoch": 1201} {"train_loss": -5.772078514099121, "global_step": 50475, "epoch": 1201} {"train_loss": -5.716519832611084, "global_step": 50476, "epoch": 1201} {"train_loss": -5.786698341369629, "global_step": 50477, "epoch": 1201} {"train_loss": -5.66767692565918, "global_step": 50478, "epoch": 1201} {"train_loss": -5.755511283874512, "global_step": 50479, "epoch": 1201} {"train_loss": -5.679662704467773, "global_step": 50480, "epoch": 1201} {"train_loss": -5.768680572509766, "global_step": 50481, "epoch": 1201} {"train_loss": -5.791106224060059, "global_step": 50482, "epoch": 1201} {"train_loss": -5.79955758367266, "global_step": 50483, "epoch": 1201, "val_loss": 61813.7109375} {"train_loss": -5.756569862365723, "global_step": 50484, "epoch": 1202} {"train_loss": -5.819126129150391, "global_step": 50485, "epoch": 1202} {"train_loss": -5.762192726135254, "global_step": 50486, "epoch": 1202} {"train_loss": -5.813462734222412, "global_step": 50487, "epoch": 1202} {"train_loss": -5.841057777404785, "global_step": 50488, "epoch": 1202} {"train_loss": -5.821227550506592, "global_step": 50489, "epoch": 1202} {"train_loss": -5.884554386138916, "global_step": 50490, "epoch": 1202} {"train_loss": -5.708082675933838, "global_step": 50491, "epoch": 1202} {"train_loss": -5.774511337280273, "global_step": 50492, "epoch": 1202} {"train_loss": -5.825803756713867, "global_step": 50493, "epoch": 1202} {"train_loss": -5.986169338226318, "global_step": 50494, "epoch": 1202} {"train_loss": -5.801565170288086, "global_step": 50495, "epoch": 1202} {"train_loss": -5.72723388671875, "global_step": 50496, "epoch": 1202} {"train_loss": -5.740190505981445, "global_step": 50497, "epoch": 1202} {"train_loss": -5.857963562011719, "global_step": 50498, "epoch": 1202} {"train_loss": -5.863726615905762, "global_step": 50499, "epoch": 1202} {"train_loss": -5.789379596710205, "global_step": 50500, "epoch": 1202} {"train_loss": -5.73606538772583, "global_step": 50501, "epoch": 1202} {"train_loss": -5.864317417144775, "global_step": 50502, "epoch": 1202} {"train_loss": -5.85102653503418, "global_step": 50503, "epoch": 1202} {"train_loss": -5.81351900100708, "global_step": 50504, "epoch": 1202} {"train_loss": -5.69944953918457, "global_step": 50505, "epoch": 1202} {"train_loss": -5.845553398132324, "global_step": 50506, "epoch": 1202} {"train_loss": -5.792529106140137, "global_step": 50507, "epoch": 1202} {"train_loss": -5.697280406951904, "global_step": 50508, "epoch": 1202} {"train_loss": -5.841038227081299, "global_step": 50509, "epoch": 1202} {"train_loss": -5.856034278869629, "global_step": 50510, "epoch": 1202} {"train_loss": -5.8001813888549805, "global_step": 50511, "epoch": 1202} {"train_loss": -5.9705400466918945, "global_step": 50512, "epoch": 1202} {"train_loss": -5.834100723266602, "global_step": 50513, "epoch": 1202} {"train_loss": -5.730470657348633, "global_step": 50514, "epoch": 1202} {"train_loss": -5.88383674621582, "global_step": 50515, "epoch": 1202} {"train_loss": -5.8636980056762695, "global_step": 50516, "epoch": 1202} {"train_loss": -5.939310073852539, "global_step": 50517, "epoch": 1202} {"train_loss": -5.635512351989746, "global_step": 50518, "epoch": 1202} {"train_loss": -5.817272186279297, "global_step": 50519, "epoch": 1202} {"train_loss": -5.719076156616211, "global_step": 50520, "epoch": 1202} {"train_loss": -5.761548042297363, "global_step": 50521, "epoch": 1202} {"train_loss": -5.6893463134765625, "global_step": 50522, "epoch": 1202} {"train_loss": -5.831320762634277, "global_step": 50523, "epoch": 1202} {"train_loss": -5.6883416175842285, "global_step": 50524, "epoch": 1202} {"train_loss": -5.802725542159307, "global_step": 50525, "epoch": 1202, "val_loss": 61516.04296875} {"train_loss": -5.729471206665039, "global_step": 50526, "epoch": 1203} {"train_loss": -5.715609550476074, "global_step": 50527, "epoch": 1203} {"train_loss": -5.74403190612793, "global_step": 50528, "epoch": 1203} {"train_loss": -5.801252365112305, "global_step": 50529, "epoch": 1203} {"train_loss": -5.669816017150879, "global_step": 50530, "epoch": 1203} {"train_loss": -5.698615074157715, "global_step": 50531, "epoch": 1203} {"train_loss": -5.783951759338379, "global_step": 50532, "epoch": 1203} {"train_loss": -5.687154769897461, "global_step": 50533, "epoch": 1203} {"train_loss": -5.765994071960449, "global_step": 50534, "epoch": 1203} {"train_loss": -5.819360733032227, "global_step": 50535, "epoch": 1203} {"train_loss": -5.671660900115967, "global_step": 50536, "epoch": 1203} {"train_loss": -5.736833572387695, "global_step": 50537, "epoch": 1203} {"train_loss": -5.742697715759277, "global_step": 50538, "epoch": 1203} {"train_loss": -5.678823471069336, "global_step": 50539, "epoch": 1203} {"train_loss": -5.693996906280518, "global_step": 50540, "epoch": 1203} {"train_loss": -5.726686477661133, "global_step": 50541, "epoch": 1203} {"train_loss": -5.705877304077148, "global_step": 50542, "epoch": 1203} {"train_loss": -5.668055057525635, "global_step": 50543, "epoch": 1203} {"train_loss": -5.83881950378418, "global_step": 50544, "epoch": 1203} {"train_loss": -5.846685409545898, "global_step": 50545, "epoch": 1203} {"train_loss": -5.674938201904297, "global_step": 50546, "epoch": 1203} {"train_loss": -5.868051528930664, "global_step": 50547, "epoch": 1203} {"train_loss": -5.743005752563477, "global_step": 50548, "epoch": 1203} {"train_loss": -5.747418403625488, "global_step": 50549, "epoch": 1203} {"train_loss": -5.827378273010254, "global_step": 50550, "epoch": 1203} {"train_loss": -5.761317253112793, "global_step": 50551, "epoch": 1203} {"train_loss": -5.765210151672363, "global_step": 50552, "epoch": 1203} {"train_loss": -5.660526275634766, "global_step": 50553, "epoch": 1203} {"train_loss": -5.728909969329834, "global_step": 50554, "epoch": 1203} {"train_loss": -5.9139790534973145, "global_step": 50555, "epoch": 1203} {"train_loss": -5.770511627197266, "global_step": 50556, "epoch": 1203} {"train_loss": -5.547504901885986, "global_step": 50557, "epoch": 1203} {"train_loss": -5.7370710372924805, "global_step": 50558, "epoch": 1203} {"train_loss": -5.749177932739258, "global_step": 50559, "epoch": 1203} {"train_loss": -5.70792293548584, "global_step": 50560, "epoch": 1203} {"train_loss": -5.725775241851807, "global_step": 50561, "epoch": 1203} {"train_loss": -5.760288238525391, "global_step": 50562, "epoch": 1203} {"train_loss": -5.686578273773193, "global_step": 50563, "epoch": 1203} {"train_loss": -5.643134117126465, "global_step": 50564, "epoch": 1203} {"train_loss": -5.675292015075684, "global_step": 50565, "epoch": 1203} {"train_loss": -5.7041015625, "global_step": 50566, "epoch": 1203} {"train_loss": -5.734588089443388, "global_step": 50567, "epoch": 1203, "val_loss": 61518.62109375} {"train_loss": -5.632662296295166, "global_step": 50568, "epoch": 1204} {"train_loss": -5.647135257720947, "global_step": 50569, "epoch": 1204} {"train_loss": -5.75214147567749, "global_step": 50570, "epoch": 1204} {"train_loss": -5.655142784118652, "global_step": 50571, "epoch": 1204} {"train_loss": -5.853121757507324, "global_step": 50572, "epoch": 1204} {"train_loss": -5.815988540649414, "global_step": 50573, "epoch": 1204} {"train_loss": -5.7639617919921875, "global_step": 50574, "epoch": 1204} {"train_loss": -5.827506065368652, "global_step": 50575, "epoch": 1204} {"train_loss": -5.825857162475586, "global_step": 50576, "epoch": 1204} {"train_loss": -5.762113571166992, "global_step": 50577, "epoch": 1204} {"train_loss": -5.703240394592285, "global_step": 50578, "epoch": 1204} {"train_loss": -5.697409152984619, "global_step": 50579, "epoch": 1204} {"train_loss": -5.817634105682373, "global_step": 50580, "epoch": 1204} {"train_loss": -5.755013942718506, "global_step": 50581, "epoch": 1204} {"train_loss": -5.766486167907715, "global_step": 50582, "epoch": 1204} {"train_loss": -5.761204242706299, "global_step": 50583, "epoch": 1204} {"train_loss": -5.621088027954102, "global_step": 50584, "epoch": 1204} {"train_loss": -5.861507415771484, "global_step": 50585, "epoch": 1204} {"train_loss": -5.679487705230713, "global_step": 50586, "epoch": 1204} {"train_loss": -5.8789777755737305, "global_step": 50587, "epoch": 1204} {"train_loss": -5.889642238616943, "global_step": 50588, "epoch": 1204} {"train_loss": -5.69215202331543, "global_step": 50589, "epoch": 1204} {"train_loss": -5.768494606018066, "global_step": 50590, "epoch": 1204} {"train_loss": -5.742580413818359, "global_step": 50591, "epoch": 1204} {"train_loss": -5.770520210266113, "global_step": 50592, "epoch": 1204} {"train_loss": -5.815226078033447, "global_step": 50593, "epoch": 1204} {"train_loss": -5.923707008361816, "global_step": 50594, "epoch": 1204} {"train_loss": -5.786826133728027, "global_step": 50595, "epoch": 1204} {"train_loss": -5.827284812927246, "global_step": 50596, "epoch": 1204} {"train_loss": -5.701055526733398, "global_step": 50597, "epoch": 1204} {"train_loss": -5.707672119140625, "global_step": 50598, "epoch": 1204} {"train_loss": -5.817806243896484, "global_step": 50599, "epoch": 1204} {"train_loss": -5.753488540649414, "global_step": 50600, "epoch": 1204} {"train_loss": -5.685276031494141, "global_step": 50601, "epoch": 1204} {"train_loss": -5.963248252868652, "global_step": 50602, "epoch": 1204} {"train_loss": -5.81870174407959, "global_step": 50603, "epoch": 1204} {"train_loss": -5.84852933883667, "global_step": 50604, "epoch": 1204} {"train_loss": -5.84412956237793, "global_step": 50605, "epoch": 1204} {"train_loss": -5.774230003356934, "global_step": 50606, "epoch": 1204} {"train_loss": -5.909509181976318, "global_step": 50607, "epoch": 1204} {"train_loss": -5.763195037841797, "global_step": 50608, "epoch": 1204} {"train_loss": -5.779404731023879, "global_step": 50609, "epoch": 1204, "val_loss": 61832.734375} {"train_loss": -5.855782985687256, "global_step": 50610, "epoch": 1205} {"train_loss": -5.693655967712402, "global_step": 50611, "epoch": 1205} {"train_loss": -5.7989373207092285, "global_step": 50612, "epoch": 1205} {"train_loss": -5.869163513183594, "global_step": 50613, "epoch": 1205} {"train_loss": -5.888082027435303, "global_step": 50614, "epoch": 1205} {"train_loss": -5.8028998374938965, "global_step": 50615, "epoch": 1205} {"train_loss": -5.8696184158325195, "global_step": 50616, "epoch": 1205} {"train_loss": -5.856890678405762, "global_step": 50617, "epoch": 1205} {"train_loss": -5.791786193847656, "global_step": 50618, "epoch": 1205} {"train_loss": -5.848274230957031, "global_step": 50619, "epoch": 1205} {"train_loss": -5.854129791259766, "global_step": 50620, "epoch": 1205} {"train_loss": -5.755722999572754, "global_step": 50621, "epoch": 1205} {"train_loss": -5.76080322265625, "global_step": 50622, "epoch": 1205} {"train_loss": -5.862539291381836, "global_step": 50623, "epoch": 1205} {"train_loss": -5.715658664703369, "global_step": 50624, "epoch": 1205} {"train_loss": -5.775986671447754, "global_step": 50625, "epoch": 1205} {"train_loss": -5.790388107299805, "global_step": 50626, "epoch": 1205} {"train_loss": -5.766300201416016, "global_step": 50627, "epoch": 1205} {"train_loss": -5.868245601654053, "global_step": 50628, "epoch": 1205} {"train_loss": -5.736849784851074, "global_step": 50629, "epoch": 1205} {"train_loss": -5.8658294677734375, "global_step": 50630, "epoch": 1205} {"train_loss": -5.7851152420043945, "global_step": 50631, "epoch": 1205} {"train_loss": -5.795726299285889, "global_step": 50632, "epoch": 1205} {"train_loss": -5.748420715332031, "global_step": 50633, "epoch": 1205} {"train_loss": -5.877361297607422, "global_step": 50634, "epoch": 1205} {"train_loss": -5.783066272735596, "global_step": 50635, "epoch": 1205} {"train_loss": -5.847846031188965, "global_step": 50636, "epoch": 1205} {"train_loss": -5.790325164794922, "global_step": 50637, "epoch": 1205} {"train_loss": -5.788496017456055, "global_step": 50638, "epoch": 1205} {"train_loss": -5.848023414611816, "global_step": 50639, "epoch": 1205} {"train_loss": -5.679272651672363, "global_step": 50640, "epoch": 1205} {"train_loss": -5.834229469299316, "global_step": 50641, "epoch": 1205} {"train_loss": -5.768718242645264, "global_step": 50642, "epoch": 1205} {"train_loss": -5.769659996032715, "global_step": 50643, "epoch": 1205} {"train_loss": -5.79880428314209, "global_step": 50644, "epoch": 1205} {"train_loss": -5.877802848815918, "global_step": 50645, "epoch": 1205} {"train_loss": -5.76443338394165, "global_step": 50646, "epoch": 1205} {"train_loss": -5.712655544281006, "global_step": 50647, "epoch": 1205} {"train_loss": -5.867863178253174, "global_step": 50648, "epoch": 1205} {"train_loss": -5.729267120361328, "global_step": 50649, "epoch": 1205} {"train_loss": -5.68161153793335, "global_step": 50650, "epoch": 1205} {"train_loss": -5.796719494320097, "global_step": 50651, "epoch": 1205, "val_loss": 61709.0390625} {"train_loss": -5.790719032287598, "global_step": 50652, "epoch": 1206} {"train_loss": -5.764573097229004, "global_step": 50653, "epoch": 1206} {"train_loss": -5.769268035888672, "global_step": 50654, "epoch": 1206} {"train_loss": -5.888320446014404, "global_step": 50655, "epoch": 1206} {"train_loss": -5.655430793762207, "global_step": 50656, "epoch": 1206} {"train_loss": -5.629375457763672, "global_step": 50657, "epoch": 1206} {"train_loss": -5.851593017578125, "global_step": 50658, "epoch": 1206} {"train_loss": -5.77720308303833, "global_step": 50659, "epoch": 1206} {"train_loss": -5.776826858520508, "global_step": 50660, "epoch": 1206} {"train_loss": -5.729665756225586, "global_step": 50661, "epoch": 1206} {"train_loss": -5.724249362945557, "global_step": 50662, "epoch": 1206} {"train_loss": -5.778739929199219, "global_step": 50663, "epoch": 1206} {"train_loss": -5.724183082580566, "global_step": 50664, "epoch": 1206} {"train_loss": -5.817948341369629, "global_step": 50665, "epoch": 1206} {"train_loss": -5.834558963775635, "global_step": 50666, "epoch": 1206} {"train_loss": -5.849194526672363, "global_step": 50667, "epoch": 1206} {"train_loss": -5.682339668273926, "global_step": 50668, "epoch": 1206} {"train_loss": -5.862189292907715, "global_step": 50669, "epoch": 1206} {"train_loss": -5.844536781311035, "global_step": 50670, "epoch": 1206} {"train_loss": -5.751781463623047, "global_step": 50671, "epoch": 1206} {"train_loss": -5.754827499389648, "global_step": 50672, "epoch": 1206} {"train_loss": -5.89631462097168, "global_step": 50673, "epoch": 1206} {"train_loss": -5.683600425720215, "global_step": 50674, "epoch": 1206} {"train_loss": -5.808219909667969, "global_step": 50675, "epoch": 1206} {"train_loss": -5.847845077514648, "global_step": 50676, "epoch": 1206} {"train_loss": -5.77267599105835, "global_step": 50677, "epoch": 1206} {"train_loss": -5.682241439819336, "global_step": 50678, "epoch": 1206} {"train_loss": -5.929460525512695, "global_step": 50679, "epoch": 1206} {"train_loss": -5.811502456665039, "global_step": 50680, "epoch": 1206} {"train_loss": -5.658539295196533, "global_step": 50681, "epoch": 1206} {"train_loss": -5.958933353424072, "global_step": 50682, "epoch": 1206} {"train_loss": -5.667232513427734, "global_step": 50683, "epoch": 1206} {"train_loss": -5.766707420349121, "global_step": 50684, "epoch": 1206} {"train_loss": -5.608569145202637, "global_step": 50685, "epoch": 1206} {"train_loss": -5.720301628112793, "global_step": 50686, "epoch": 1206} {"train_loss": -5.7882280349731445, "global_step": 50687, "epoch": 1206} {"train_loss": -5.822710037231445, "global_step": 50688, "epoch": 1206} {"train_loss": -5.8433756828308105, "global_step": 50689, "epoch": 1206} {"train_loss": -5.828578948974609, "global_step": 50690, "epoch": 1206} {"train_loss": -5.732639789581299, "global_step": 50691, "epoch": 1206} {"train_loss": -5.784910202026367, "global_step": 50692, "epoch": 1206} {"train_loss": -5.773309877940586, "global_step": 50693, "epoch": 1206, "val_loss": 61588.7265625} {"train_loss": -5.853046894073486, "global_step": 50694, "epoch": 1207} {"train_loss": -5.828203201293945, "global_step": 50695, "epoch": 1207} {"train_loss": -5.910240173339844, "global_step": 50696, "epoch": 1207} {"train_loss": -5.746969223022461, "global_step": 50697, "epoch": 1207} {"train_loss": -5.742292881011963, "global_step": 50698, "epoch": 1207} {"train_loss": -5.828485488891602, "global_step": 50699, "epoch": 1207} {"train_loss": -5.797763824462891, "global_step": 50700, "epoch": 1207} {"train_loss": -5.835432052612305, "global_step": 50701, "epoch": 1207} {"train_loss": -5.793469429016113, "global_step": 50702, "epoch": 1207} {"train_loss": -5.816638469696045, "global_step": 50703, "epoch": 1207} {"train_loss": -5.76647424697876, "global_step": 50704, "epoch": 1207} {"train_loss": -5.807896614074707, "global_step": 50705, "epoch": 1207} {"train_loss": -5.865683555603027, "global_step": 50706, "epoch": 1207} {"train_loss": -5.7233452796936035, "global_step": 50707, "epoch": 1207} {"train_loss": -5.70885705947876, "global_step": 50708, "epoch": 1207} {"train_loss": -5.788445472717285, "global_step": 50709, "epoch": 1207} {"train_loss": -5.698160171508789, "global_step": 50710, "epoch": 1207} {"train_loss": -5.828255653381348, "global_step": 50711, "epoch": 1207} {"train_loss": -5.816560745239258, "global_step": 50712, "epoch": 1207} {"train_loss": -5.703065872192383, "global_step": 50713, "epoch": 1207} {"train_loss": -5.805831432342529, "global_step": 50714, "epoch": 1207} {"train_loss": -5.787471294403076, "global_step": 50715, "epoch": 1207} {"train_loss": -5.764015197753906, "global_step": 50716, "epoch": 1207} {"train_loss": -5.7358832359313965, "global_step": 50717, "epoch": 1207} {"train_loss": -5.692686080932617, "global_step": 50718, "epoch": 1207} {"train_loss": -5.987424850463867, "global_step": 50719, "epoch": 1207} {"train_loss": -5.75782585144043, "global_step": 50720, "epoch": 1207} {"train_loss": -5.815654754638672, "global_step": 50721, "epoch": 1207} {"train_loss": -5.788287162780762, "global_step": 50722, "epoch": 1207} {"train_loss": -5.874161243438721, "global_step": 50723, "epoch": 1207} {"train_loss": -5.792514801025391, "global_step": 50724, "epoch": 1207} {"train_loss": -5.835487365722656, "global_step": 50725, "epoch": 1207} {"train_loss": -5.864565849304199, "global_step": 50726, "epoch": 1207} {"train_loss": -5.808934211730957, "global_step": 50727, "epoch": 1207} {"train_loss": -5.80631160736084, "global_step": 50728, "epoch": 1207} {"train_loss": -5.702409744262695, "global_step": 50729, "epoch": 1207} {"train_loss": -5.827818870544434, "global_step": 50730, "epoch": 1207} {"train_loss": -5.828900337219238, "global_step": 50731, "epoch": 1207} {"train_loss": -5.784873962402344, "global_step": 50732, "epoch": 1207} {"train_loss": -5.747043609619141, "global_step": 50733, "epoch": 1207} {"train_loss": -5.8213582038879395, "global_step": 50734, "epoch": 1207} {"train_loss": -5.797025112878709, "global_step": 50735, "epoch": 1207, "val_loss": 61615.87109375} {"train_loss": -5.848182678222656, "global_step": 50736, "epoch": 1208} {"train_loss": -5.765148162841797, "global_step": 50737, "epoch": 1208} {"train_loss": -5.796877861022949, "global_step": 50738, "epoch": 1208} {"train_loss": -5.790436267852783, "global_step": 50739, "epoch": 1208} {"train_loss": -5.8235673904418945, "global_step": 50740, "epoch": 1208} {"train_loss": -5.736346244812012, "global_step": 50741, "epoch": 1208} {"train_loss": -5.942625999450684, "global_step": 50742, "epoch": 1208} {"train_loss": -5.759279727935791, "global_step": 50743, "epoch": 1208} {"train_loss": -5.741645336151123, "global_step": 50744, "epoch": 1208} {"train_loss": -5.801253318786621, "global_step": 50745, "epoch": 1208} {"train_loss": -5.822150230407715, "global_step": 50746, "epoch": 1208} {"train_loss": -5.852411270141602, "global_step": 50747, "epoch": 1208} {"train_loss": -5.866559982299805, "global_step": 50748, "epoch": 1208} {"train_loss": -5.7391486167907715, "global_step": 50749, "epoch": 1208} {"train_loss": -5.826689720153809, "global_step": 50750, "epoch": 1208} {"train_loss": -5.806737899780273, "global_step": 50751, "epoch": 1208} {"train_loss": -5.792880058288574, "global_step": 50752, "epoch": 1208} {"train_loss": -5.7360639572143555, "global_step": 50753, "epoch": 1208} {"train_loss": -5.807023525238037, "global_step": 50754, "epoch": 1208} {"train_loss": -5.7915825843811035, "global_step": 50755, "epoch": 1208} {"train_loss": -5.733837127685547, "global_step": 50756, "epoch": 1208} {"train_loss": -5.768084526062012, "global_step": 50757, "epoch": 1208} {"train_loss": -5.701852798461914, "global_step": 50758, "epoch": 1208} {"train_loss": -5.86952018737793, "global_step": 50759, "epoch": 1208} {"train_loss": -5.829297065734863, "global_step": 50760, "epoch": 1208} {"train_loss": -5.832012176513672, "global_step": 50761, "epoch": 1208} {"train_loss": -5.785190105438232, "global_step": 50762, "epoch": 1208} {"train_loss": -5.747444152832031, "global_step": 50763, "epoch": 1208} {"train_loss": -5.723025321960449, "global_step": 50764, "epoch": 1208} {"train_loss": -5.685665130615234, "global_step": 50765, "epoch": 1208} {"train_loss": -5.781778335571289, "global_step": 50766, "epoch": 1208} {"train_loss": -5.821728229522705, "global_step": 50767, "epoch": 1208} {"train_loss": -5.804532051086426, "global_step": 50768, "epoch": 1208} {"train_loss": -5.757619380950928, "global_step": 50769, "epoch": 1208} {"train_loss": -5.797008514404297, "global_step": 50770, "epoch": 1208} {"train_loss": -5.745721340179443, "global_step": 50771, "epoch": 1208} {"train_loss": -5.791821479797363, "global_step": 50772, "epoch": 1208} {"train_loss": -5.735363483428955, "global_step": 50773, "epoch": 1208} {"train_loss": -5.881747722625732, "global_step": 50774, "epoch": 1208} {"train_loss": -5.817325592041016, "global_step": 50775, "epoch": 1208} {"train_loss": -5.740225791931152, "global_step": 50776, "epoch": 1208} {"train_loss": -5.788861626670474, "global_step": 50777, "epoch": 1208, "val_loss": 61311.7734375} {"train_loss": -5.754638671875, "global_step": 50778, "epoch": 1209} {"train_loss": -5.840770721435547, "global_step": 50779, "epoch": 1209} {"train_loss": -5.774333953857422, "global_step": 50780, "epoch": 1209} {"train_loss": -5.695401191711426, "global_step": 50781, "epoch": 1209} {"train_loss": -5.8190598487854, "global_step": 50782, "epoch": 1209} {"train_loss": -5.729386329650879, "global_step": 50783, "epoch": 1209} {"train_loss": -5.834028720855713, "global_step": 50784, "epoch": 1209} {"train_loss": -5.775290012359619, "global_step": 50785, "epoch": 1209} {"train_loss": -5.721619606018066, "global_step": 50786, "epoch": 1209} {"train_loss": -5.674866676330566, "global_step": 50787, "epoch": 1209} {"train_loss": -5.750273704528809, "global_step": 50788, "epoch": 1209} {"train_loss": -5.823047637939453, "global_step": 50789, "epoch": 1209} {"train_loss": -5.766307353973389, "global_step": 50790, "epoch": 1209} {"train_loss": -5.771157264709473, "global_step": 50791, "epoch": 1209} {"train_loss": -5.792547702789307, "global_step": 50792, "epoch": 1209} {"train_loss": -5.772740364074707, "global_step": 50793, "epoch": 1209} {"train_loss": -5.806739807128906, "global_step": 50794, "epoch": 1209} {"train_loss": -5.80861759185791, "global_step": 50795, "epoch": 1209} {"train_loss": -5.806956768035889, "global_step": 50796, "epoch": 1209} {"train_loss": -5.697517395019531, "global_step": 50797, "epoch": 1209} {"train_loss": -5.832243919372559, "global_step": 50798, "epoch": 1209} {"train_loss": -5.651976585388184, "global_step": 50799, "epoch": 1209} {"train_loss": -5.781595706939697, "global_step": 50800, "epoch": 1209} {"train_loss": -5.840712547302246, "global_step": 50801, "epoch": 1209} {"train_loss": -5.8408660888671875, "global_step": 50802, "epoch": 1209} {"train_loss": -5.925677299499512, "global_step": 50803, "epoch": 1209} {"train_loss": -5.848700046539307, "global_step": 50804, "epoch": 1209} {"train_loss": -5.862163066864014, "global_step": 50805, "epoch": 1209} {"train_loss": -5.680379390716553, "global_step": 50806, "epoch": 1209} {"train_loss": -5.822758674621582, "global_step": 50807, "epoch": 1209} {"train_loss": -5.64096212387085, "global_step": 50808, "epoch": 1209} {"train_loss": -5.834721088409424, "global_step": 50809, "epoch": 1209} {"train_loss": -5.75258207321167, "global_step": 50810, "epoch": 1209} {"train_loss": -5.727577209472656, "global_step": 50811, "epoch": 1209} {"train_loss": -5.810993194580078, "global_step": 50812, "epoch": 1209} {"train_loss": -5.801747798919678, "global_step": 50813, "epoch": 1209} {"train_loss": -5.92294979095459, "global_step": 50814, "epoch": 1209} {"train_loss": -5.901022911071777, "global_step": 50815, "epoch": 1209} {"train_loss": -5.777026176452637, "global_step": 50816, "epoch": 1209} {"train_loss": -5.728594779968262, "global_step": 50817, "epoch": 1209} {"train_loss": -5.862898826599121, "global_step": 50818, "epoch": 1209} {"train_loss": -5.785830020904541, "global_step": 50819, "epoch": 1209, "val_loss": 61834.390625} {"train_loss": -5.938080787658691, "global_step": 50820, "epoch": 1210} {"train_loss": -5.758504867553711, "global_step": 50821, "epoch": 1210} {"train_loss": -5.669905662536621, "global_step": 50822, "epoch": 1210} {"train_loss": -5.880679130554199, "global_step": 50823, "epoch": 1210} {"train_loss": -5.730739593505859, "global_step": 50824, "epoch": 1210} {"train_loss": -5.7259016036987305, "global_step": 50825, "epoch": 1210} {"train_loss": -5.834273338317871, "global_step": 50826, "epoch": 1210} {"train_loss": -5.6971635818481445, "global_step": 50827, "epoch": 1210} {"train_loss": -5.825270175933838, "global_step": 50828, "epoch": 1210} {"train_loss": -5.895467758178711, "global_step": 50829, "epoch": 1210} {"train_loss": -5.7909746170043945, "global_step": 50830, "epoch": 1210} {"train_loss": -5.689255237579346, "global_step": 50831, "epoch": 1210} {"train_loss": -5.788812637329102, "global_step": 50832, "epoch": 1210} {"train_loss": -5.785538673400879, "global_step": 50833, "epoch": 1210} {"train_loss": -5.7161688804626465, "global_step": 50834, "epoch": 1210} {"train_loss": -5.8102874755859375, "global_step": 50835, "epoch": 1210} {"train_loss": -5.79770565032959, "global_step": 50836, "epoch": 1210} {"train_loss": -5.868131637573242, "global_step": 50837, "epoch": 1210} {"train_loss": -5.65561580657959, "global_step": 50838, "epoch": 1210} {"train_loss": -5.6433329582214355, "global_step": 50839, "epoch": 1210} {"train_loss": -5.923884868621826, "global_step": 50840, "epoch": 1210} {"train_loss": -5.660270690917969, "global_step": 50841, "epoch": 1210} {"train_loss": -5.801281452178955, "global_step": 50842, "epoch": 1210} {"train_loss": -5.857635974884033, "global_step": 50843, "epoch": 1210} {"train_loss": -5.759914398193359, "global_step": 50844, "epoch": 1210} {"train_loss": -5.8310322761535645, "global_step": 50845, "epoch": 1210} {"train_loss": -5.807561874389648, "global_step": 50846, "epoch": 1210} {"train_loss": -5.824286460876465, "global_step": 50847, "epoch": 1210} {"train_loss": -5.8602094650268555, "global_step": 50848, "epoch": 1210} {"train_loss": -5.870649337768555, "global_step": 50849, "epoch": 1210} {"train_loss": -5.8173370361328125, "global_step": 50850, "epoch": 1210} {"train_loss": -5.806507110595703, "global_step": 50851, "epoch": 1210} {"train_loss": -5.590018272399902, "global_step": 50852, "epoch": 1210} {"train_loss": -5.887738227844238, "global_step": 50853, "epoch": 1210} {"train_loss": -5.83212423324585, "global_step": 50854, "epoch": 1210} {"train_loss": -5.794236183166504, "global_step": 50855, "epoch": 1210} {"train_loss": -5.854550361633301, "global_step": 50856, "epoch": 1210} {"train_loss": -5.746527671813965, "global_step": 50857, "epoch": 1210} {"train_loss": -5.703484058380127, "global_step": 50858, "epoch": 1210} {"train_loss": -5.7470502853393555, "global_step": 50859, "epoch": 1210} {"train_loss": -5.805874347686768, "global_step": 50860, "epoch": 1210} {"train_loss": -5.7866425060090565, "global_step": 50861, "epoch": 1210, "val_loss": 61345.5234375} {"train_loss": -5.713448524475098, "global_step": 50862, "epoch": 1211} {"train_loss": -5.759026527404785, "global_step": 50863, "epoch": 1211} {"train_loss": -5.8703508377075195, "global_step": 50864, "epoch": 1211} {"train_loss": -5.789674758911133, "global_step": 50865, "epoch": 1211} {"train_loss": -5.796831130981445, "global_step": 50866, "epoch": 1211} {"train_loss": -5.751338005065918, "global_step": 50867, "epoch": 1211} {"train_loss": -5.865941047668457, "global_step": 50868, "epoch": 1211} {"train_loss": -5.764948844909668, "global_step": 50869, "epoch": 1211} {"train_loss": -5.802274703979492, "global_step": 50870, "epoch": 1211} {"train_loss": -5.846762180328369, "global_step": 50871, "epoch": 1211} {"train_loss": -5.853610992431641, "global_step": 50872, "epoch": 1211} {"train_loss": -5.833151817321777, "global_step": 50873, "epoch": 1211} {"train_loss": -5.740115165710449, "global_step": 50874, "epoch": 1211} {"train_loss": -5.850786209106445, "global_step": 50875, "epoch": 1211} {"train_loss": -5.809258460998535, "global_step": 50876, "epoch": 1211} {"train_loss": -5.821508884429932, "global_step": 50877, "epoch": 1211} {"train_loss": -5.8487653732299805, "global_step": 50878, "epoch": 1211} {"train_loss": -5.883028030395508, "global_step": 50879, "epoch": 1211} {"train_loss": -5.683914661407471, "global_step": 50880, "epoch": 1211} {"train_loss": -5.654898643493652, "global_step": 50881, "epoch": 1211} {"train_loss": -5.702475547790527, "global_step": 50882, "epoch": 1211} {"train_loss": -5.797235488891602, "global_step": 50883, "epoch": 1211} {"train_loss": -5.862515449523926, "global_step": 50884, "epoch": 1211} {"train_loss": -5.82253360748291, "global_step": 50885, "epoch": 1211} {"train_loss": -5.751765251159668, "global_step": 50886, "epoch": 1211} {"train_loss": -5.7823028564453125, "global_step": 50887, "epoch": 1211} {"train_loss": -5.735886573791504, "global_step": 50888, "epoch": 1211} {"train_loss": -5.880247116088867, "global_step": 50889, "epoch": 1211} {"train_loss": -5.712507724761963, "global_step": 50890, "epoch": 1211} {"train_loss": -5.745364665985107, "global_step": 50891, "epoch": 1211} {"train_loss": -5.783492088317871, "global_step": 50892, "epoch": 1211} {"train_loss": -5.692495346069336, "global_step": 50893, "epoch": 1211} {"train_loss": -5.738965034484863, "global_step": 50894, "epoch": 1211} {"train_loss": -5.8666486740112305, "global_step": 50895, "epoch": 1211} {"train_loss": -5.832269668579102, "global_step": 50896, "epoch": 1211} {"train_loss": -5.696013450622559, "global_step": 50897, "epoch": 1211} {"train_loss": -5.776776313781738, "global_step": 50898, "epoch": 1211} {"train_loss": -5.829232215881348, "global_step": 50899, "epoch": 1211} {"train_loss": -5.808934211730957, "global_step": 50900, "epoch": 1211} {"train_loss": -5.762075424194336, "global_step": 50901, "epoch": 1211} {"train_loss": -5.808263301849365, "global_step": 50902, "epoch": 1211} {"train_loss": -5.787782407942272, "global_step": 50903, "epoch": 1211, "val_loss": 61767.38671875} {"train_loss": -5.765209197998047, "global_step": 50904, "epoch": 1212} {"train_loss": -5.711957931518555, "global_step": 50905, "epoch": 1212} {"train_loss": -5.814471244812012, "global_step": 50906, "epoch": 1212} {"train_loss": -5.739398956298828, "global_step": 50907, "epoch": 1212} {"train_loss": -5.858937740325928, "global_step": 50908, "epoch": 1212} {"train_loss": -5.884476661682129, "global_step": 50909, "epoch": 1212} {"train_loss": -5.9543304443359375, "global_step": 50910, "epoch": 1212} {"train_loss": -5.802742004394531, "global_step": 50911, "epoch": 1212} {"train_loss": -5.703868389129639, "global_step": 50912, "epoch": 1212} {"train_loss": -5.750185489654541, "global_step": 50913, "epoch": 1212} {"train_loss": -5.765963554382324, "global_step": 50914, "epoch": 1212} {"train_loss": -5.712357521057129, "global_step": 50915, "epoch": 1212} {"train_loss": -5.8082475662231445, "global_step": 50916, "epoch": 1212} {"train_loss": -5.744370937347412, "global_step": 50917, "epoch": 1212} {"train_loss": -5.877143859863281, "global_step": 50918, "epoch": 1212} {"train_loss": -5.770181655883789, "global_step": 50919, "epoch": 1212} {"train_loss": -5.6696038246154785, "global_step": 50920, "epoch": 1212} {"train_loss": -5.748525619506836, "global_step": 50921, "epoch": 1212} {"train_loss": -5.625437259674072, "global_step": 50922, "epoch": 1212} {"train_loss": -5.7507476806640625, "global_step": 50923, "epoch": 1212} {"train_loss": -5.836353302001953, "global_step": 50924, "epoch": 1212} {"train_loss": -5.705480098724365, "global_step": 50925, "epoch": 1212} {"train_loss": -5.684882164001465, "global_step": 50926, "epoch": 1212} {"train_loss": -5.729605674743652, "global_step": 50927, "epoch": 1212} {"train_loss": -5.8332200050354, "global_step": 50928, "epoch": 1212} {"train_loss": -5.7359161376953125, "global_step": 50929, "epoch": 1212} {"train_loss": -5.780208587646484, "global_step": 50930, "epoch": 1212} {"train_loss": -5.654115676879883, "global_step": 50931, "epoch": 1212} {"train_loss": -5.804930686950684, "global_step": 50932, "epoch": 1212} {"train_loss": -5.854704856872559, "global_step": 50933, "epoch": 1212} {"train_loss": -5.794406890869141, "global_step": 50934, "epoch": 1212} {"train_loss": -5.865292072296143, "global_step": 50935, "epoch": 1212} {"train_loss": -5.770321369171143, "global_step": 50936, "epoch": 1212} {"train_loss": -5.764188289642334, "global_step": 50937, "epoch": 1212} {"train_loss": -5.787622928619385, "global_step": 50938, "epoch": 1212} {"train_loss": -5.765960693359375, "global_step": 50939, "epoch": 1212} {"train_loss": -5.731914043426514, "global_step": 50940, "epoch": 1212} {"train_loss": -5.809428691864014, "global_step": 50941, "epoch": 1212} {"train_loss": -5.7111334800720215, "global_step": 50942, "epoch": 1212} {"train_loss": -5.867987632751465, "global_step": 50943, "epoch": 1212} {"train_loss": -5.832895278930664, "global_step": 50944, "epoch": 1212} {"train_loss": -5.773301487877255, "global_step": 50945, "epoch": 1212, "val_loss": 61366.06640625} {"train_loss": -5.745551109313965, "global_step": 50946, "epoch": 1213} {"train_loss": -5.804013252258301, "global_step": 50947, "epoch": 1213} {"train_loss": -5.807936668395996, "global_step": 50948, "epoch": 1213} {"train_loss": -5.847775936126709, "global_step": 50949, "epoch": 1213} {"train_loss": -5.853305816650391, "global_step": 50950, "epoch": 1213} {"train_loss": -5.8654069900512695, "global_step": 50951, "epoch": 1213} {"train_loss": -5.770329475402832, "global_step": 50952, "epoch": 1213} {"train_loss": -5.7660017013549805, "global_step": 50953, "epoch": 1213} {"train_loss": -5.7018609046936035, "global_step": 50954, "epoch": 1213} {"train_loss": -5.86384391784668, "global_step": 50955, "epoch": 1213} {"train_loss": -5.789795875549316, "global_step": 50956, "epoch": 1213} {"train_loss": -5.614916801452637, "global_step": 50957, "epoch": 1213} {"train_loss": -5.893764495849609, "global_step": 50958, "epoch": 1213} {"train_loss": -5.809199333190918, "global_step": 50959, "epoch": 1213} {"train_loss": -5.7454681396484375, "global_step": 50960, "epoch": 1213} {"train_loss": -5.881384372711182, "global_step": 50961, "epoch": 1213} {"train_loss": -5.726696014404297, "global_step": 50962, "epoch": 1213} {"train_loss": -5.6624755859375, "global_step": 50963, "epoch": 1213} {"train_loss": -5.685968399047852, "global_step": 50964, "epoch": 1213} {"train_loss": -5.786102771759033, "global_step": 50965, "epoch": 1213} {"train_loss": -5.683399200439453, "global_step": 50966, "epoch": 1213} {"train_loss": -5.685781478881836, "global_step": 50967, "epoch": 1213} {"train_loss": -5.866924285888672, "global_step": 50968, "epoch": 1213} {"train_loss": -5.771377086639404, "global_step": 50969, "epoch": 1213} {"train_loss": -5.63295841217041, "global_step": 50970, "epoch": 1213} {"train_loss": -5.734302997589111, "global_step": 50971, "epoch": 1213} {"train_loss": -5.71341609954834, "global_step": 50972, "epoch": 1213} {"train_loss": -5.755247116088867, "global_step": 50973, "epoch": 1213} {"train_loss": -5.7367634773254395, "global_step": 50974, "epoch": 1213} {"train_loss": -5.725333213806152, "global_step": 50975, "epoch": 1213} {"train_loss": -5.690001487731934, "global_step": 50976, "epoch": 1213} {"train_loss": -5.617802619934082, "global_step": 50977, "epoch": 1213} {"train_loss": -5.745187759399414, "global_step": 50978, "epoch": 1213} {"train_loss": -5.7776899337768555, "global_step": 50979, "epoch": 1213} {"train_loss": -5.737218856811523, "global_step": 50980, "epoch": 1213} {"train_loss": -5.669075012207031, "global_step": 50981, "epoch": 1213} {"train_loss": -5.604299545288086, "global_step": 50982, "epoch": 1213} {"train_loss": -5.8351731300354, "global_step": 50983, "epoch": 1213} {"train_loss": -5.911056995391846, "global_step": 50984, "epoch": 1213} {"train_loss": -5.7547125816345215, "global_step": 50985, "epoch": 1213} {"train_loss": -5.735103607177734, "global_step": 50986, "epoch": 1213} {"train_loss": -5.7580290748959495, "global_step": 50987, "epoch": 1213, "val_loss": 62099.58203125} {"train_loss": -5.6862640380859375, "global_step": 50988, "epoch": 1214} {"train_loss": -5.704838752746582, "global_step": 50989, "epoch": 1214} {"train_loss": -5.738537788391113, "global_step": 50990, "epoch": 1214} {"train_loss": -5.757943153381348, "global_step": 50991, "epoch": 1214} {"train_loss": -5.657032012939453, "global_step": 50992, "epoch": 1214} {"train_loss": -5.69296932220459, "global_step": 50993, "epoch": 1214} {"train_loss": -5.719724655151367, "global_step": 50994, "epoch": 1214} {"train_loss": -5.825197219848633, "global_step": 50995, "epoch": 1214} {"train_loss": -5.750903129577637, "global_step": 50996, "epoch": 1214} {"train_loss": -5.704156398773193, "global_step": 50997, "epoch": 1214} {"train_loss": -5.812873840332031, "global_step": 50998, "epoch": 1214} {"train_loss": -5.696018218994141, "global_step": 50999, "epoch": 1214} {"train_loss": -5.727025032043457, "global_step": 51000, "epoch": 1214} {"train_loss": -5.735499382019043, "global_step": 51001, "epoch": 1214} {"train_loss": -5.74669075012207, "global_step": 51002, "epoch": 1214} {"train_loss": -5.691164970397949, "global_step": 51003, "epoch": 1214} {"train_loss": -5.705697059631348, "global_step": 51004, "epoch": 1214} {"train_loss": -5.769199848175049, "global_step": 51005, "epoch": 1214} {"train_loss": -5.893752098083496, "global_step": 51006, "epoch": 1214} {"train_loss": -5.80382776260376, "global_step": 51007, "epoch": 1214} {"train_loss": -5.764693260192871, "global_step": 51008, "epoch": 1214} {"train_loss": -5.712465286254883, "global_step": 51009, "epoch": 1214} {"train_loss": -5.834066390991211, "global_step": 51010, "epoch": 1214} {"train_loss": -5.860623836517334, "global_step": 51011, "epoch": 1214} {"train_loss": -5.560848236083984, "global_step": 51012, "epoch": 1214} {"train_loss": -5.759667873382568, "global_step": 51013, "epoch": 1214} {"train_loss": -5.724764823913574, "global_step": 51014, "epoch": 1214} {"train_loss": -5.719561576843262, "global_step": 51015, "epoch": 1214} {"train_loss": -5.680505752563477, "global_step": 51016, "epoch": 1214} {"train_loss": -5.573941230773926, "global_step": 51017, "epoch": 1214} {"train_loss": -5.678789138793945, "global_step": 51018, "epoch": 1214} {"train_loss": -5.684820175170898, "global_step": 51019, "epoch": 1214} {"train_loss": -5.73382568359375, "global_step": 51020, "epoch": 1214} {"train_loss": -5.759031295776367, "global_step": 51021, "epoch": 1214} {"train_loss": -5.540581703186035, "global_step": 51022, "epoch": 1214} {"train_loss": -5.761258125305176, "global_step": 51023, "epoch": 1214} {"train_loss": -5.621005535125732, "global_step": 51024, "epoch": 1214} {"train_loss": -5.736571311950684, "global_step": 51025, "epoch": 1214} {"train_loss": -5.645483016967773, "global_step": 51026, "epoch": 1214} {"train_loss": -5.769974708557129, "global_step": 51027, "epoch": 1214} {"train_loss": -5.8373284339904785, "global_step": 51028, "epoch": 1214} {"train_loss": -5.723473083405268, "global_step": 51029, "epoch": 1214, "val_loss": 61650.50390625} {"train_loss": -5.808907985687256, "global_step": 51030, "epoch": 1215} {"train_loss": -5.740013599395752, "global_step": 51031, "epoch": 1215} {"train_loss": -5.7183074951171875, "global_step": 51032, "epoch": 1215} {"train_loss": -5.790610313415527, "global_step": 51033, "epoch": 1215} {"train_loss": -5.7016801834106445, "global_step": 51034, "epoch": 1215} {"train_loss": -5.774309158325195, "global_step": 51035, "epoch": 1215} {"train_loss": -5.697206020355225, "global_step": 51036, "epoch": 1215} {"train_loss": -5.6239824295043945, "global_step": 51037, "epoch": 1215} {"train_loss": -5.7353925704956055, "global_step": 51038, "epoch": 1215} {"train_loss": -5.802523612976074, "global_step": 51039, "epoch": 1215} {"train_loss": -5.846116065979004, "global_step": 51040, "epoch": 1215} {"train_loss": -5.861611366271973, "global_step": 51041, "epoch": 1215} {"train_loss": -5.845301151275635, "global_step": 51042, "epoch": 1215} {"train_loss": -5.74206018447876, "global_step": 51043, "epoch": 1215} {"train_loss": -5.779209136962891, "global_step": 51044, "epoch": 1215} {"train_loss": -5.940252780914307, "global_step": 51045, "epoch": 1215} {"train_loss": -5.769191741943359, "global_step": 51046, "epoch": 1215} {"train_loss": -5.790014266967773, "global_step": 51047, "epoch": 1215} {"train_loss": -5.915202617645264, "global_step": 51048, "epoch": 1215} {"train_loss": -5.753698348999023, "global_step": 51049, "epoch": 1215} {"train_loss": -5.834230422973633, "global_step": 51050, "epoch": 1215} {"train_loss": -5.828313827514648, "global_step": 51051, "epoch": 1215} {"train_loss": -5.630960464477539, "global_step": 51052, "epoch": 1215} {"train_loss": -5.681099891662598, "global_step": 51053, "epoch": 1215} {"train_loss": -5.772581577301025, "global_step": 51054, "epoch": 1215} {"train_loss": -5.618862152099609, "global_step": 51055, "epoch": 1215} {"train_loss": -5.761933326721191, "global_step": 51056, "epoch": 1215} {"train_loss": -5.733449459075928, "global_step": 51057, "epoch": 1215} {"train_loss": -5.812341213226318, "global_step": 51058, "epoch": 1215} {"train_loss": -5.738665580749512, "global_step": 51059, "epoch": 1215} {"train_loss": -5.812639236450195, "global_step": 51060, "epoch": 1215} {"train_loss": -5.7760138511657715, "global_step": 51061, "epoch": 1215} {"train_loss": -5.738970756530762, "global_step": 51062, "epoch": 1215} {"train_loss": -5.805809020996094, "global_step": 51063, "epoch": 1215} {"train_loss": -5.802356719970703, "global_step": 51064, "epoch": 1215} {"train_loss": -5.738739013671875, "global_step": 51065, "epoch": 1215} {"train_loss": -5.715646743774414, "global_step": 51066, "epoch": 1215} {"train_loss": -5.7431464195251465, "global_step": 51067, "epoch": 1215} {"train_loss": -5.929171085357666, "global_step": 51068, "epoch": 1215} {"train_loss": -5.708279132843018, "global_step": 51069, "epoch": 1215} {"train_loss": -5.773373603820801, "global_step": 51070, "epoch": 1215} {"train_loss": -5.7729233560108, "global_step": 51071, "epoch": 1215, "val_loss": 61902.6171875} {"train_loss": -5.732431411743164, "global_step": 51072, "epoch": 1216} {"train_loss": -5.881768226623535, "global_step": 51073, "epoch": 1216} {"train_loss": -5.804475784301758, "global_step": 51074, "epoch": 1216} {"train_loss": -5.788394927978516, "global_step": 51075, "epoch": 1216} {"train_loss": -5.810193061828613, "global_step": 51076, "epoch": 1216} {"train_loss": -5.918301105499268, "global_step": 51077, "epoch": 1216} {"train_loss": -5.789948463439941, "global_step": 51078, "epoch": 1216} {"train_loss": -5.830283164978027, "global_step": 51079, "epoch": 1216} {"train_loss": -5.7176313400268555, "global_step": 51080, "epoch": 1216} {"train_loss": -5.813718795776367, "global_step": 51081, "epoch": 1216} {"train_loss": -5.687013149261475, "global_step": 51082, "epoch": 1216} {"train_loss": -5.762784481048584, "global_step": 51083, "epoch": 1216} {"train_loss": -5.82528018951416, "global_step": 51084, "epoch": 1216} {"train_loss": -5.848923683166504, "global_step": 51085, "epoch": 1216} {"train_loss": -5.834151268005371, "global_step": 51086, "epoch": 1216} {"train_loss": -5.779053688049316, "global_step": 51087, "epoch": 1216} {"train_loss": -5.645764350891113, "global_step": 51088, "epoch": 1216} {"train_loss": -5.726048469543457, "global_step": 51089, "epoch": 1216} {"train_loss": -5.783069610595703, "global_step": 51090, "epoch": 1216} {"train_loss": -5.702063083648682, "global_step": 51091, "epoch": 1216} {"train_loss": -5.775313377380371, "global_step": 51092, "epoch": 1216} {"train_loss": -5.881816387176514, "global_step": 51093, "epoch": 1216} {"train_loss": -5.86081600189209, "global_step": 51094, "epoch": 1216} {"train_loss": -5.769679069519043, "global_step": 51095, "epoch": 1216} {"train_loss": -5.754837512969971, "global_step": 51096, "epoch": 1216} {"train_loss": -5.850860595703125, "global_step": 51097, "epoch": 1216} {"train_loss": -5.750560283660889, "global_step": 51098, "epoch": 1216} {"train_loss": -5.907004356384277, "global_step": 51099, "epoch": 1216} {"train_loss": -5.890109062194824, "global_step": 51100, "epoch": 1216} {"train_loss": -5.689831733703613, "global_step": 51101, "epoch": 1216} {"train_loss": -5.904308319091797, "global_step": 51102, "epoch": 1216} {"train_loss": -5.6347455978393555, "global_step": 51103, "epoch": 1216} {"train_loss": -5.787508010864258, "global_step": 51104, "epoch": 1216} {"train_loss": -5.80549430847168, "global_step": 51105, "epoch": 1216} {"train_loss": -5.789213180541992, "global_step": 51106, "epoch": 1216} {"train_loss": -5.880641937255859, "global_step": 51107, "epoch": 1216} {"train_loss": -5.8804426193237305, "global_step": 51108, "epoch": 1216} {"train_loss": -5.681936264038086, "global_step": 51109, "epoch": 1216} {"train_loss": -5.809832572937012, "global_step": 51110, "epoch": 1216} {"train_loss": -5.703461170196533, "global_step": 51111, "epoch": 1216} {"train_loss": -5.873844623565674, "global_step": 51112, "epoch": 1216} {"train_loss": -5.795971018927438, "global_step": 51113, "epoch": 1216, "val_loss": 61916.3125} {"train_loss": -5.737783908843994, "global_step": 51114, "epoch": 1217} {"train_loss": -5.89788818359375, "global_step": 51115, "epoch": 1217} {"train_loss": -5.759973526000977, "global_step": 51116, "epoch": 1217} {"train_loss": -5.8214802742004395, "global_step": 51117, "epoch": 1217} {"train_loss": -5.713599681854248, "global_step": 51118, "epoch": 1217} {"train_loss": -5.7658233642578125, "global_step": 51119, "epoch": 1217} {"train_loss": -5.741546630859375, "global_step": 51120, "epoch": 1217} {"train_loss": -5.826792240142822, "global_step": 51121, "epoch": 1217} {"train_loss": -5.873712539672852, "global_step": 51122, "epoch": 1217} {"train_loss": -5.701633453369141, "global_step": 51123, "epoch": 1217} {"train_loss": -5.902464389801025, "global_step": 51124, "epoch": 1217} {"train_loss": -5.832156181335449, "global_step": 51125, "epoch": 1217} {"train_loss": -5.608188629150391, "global_step": 51126, "epoch": 1217} {"train_loss": -5.952841281890869, "global_step": 51127, "epoch": 1217} {"train_loss": -5.817259788513184, "global_step": 51128, "epoch": 1217} {"train_loss": -5.851974010467529, "global_step": 51129, "epoch": 1217} {"train_loss": -5.860409736633301, "global_step": 51130, "epoch": 1217} {"train_loss": -5.792398452758789, "global_step": 51131, "epoch": 1217} {"train_loss": -5.756917953491211, "global_step": 51132, "epoch": 1217} {"train_loss": -5.8657331466674805, "global_step": 51133, "epoch": 1217} {"train_loss": -5.8357625007629395, "global_step": 51134, "epoch": 1217} {"train_loss": -5.83708381652832, "global_step": 51135, "epoch": 1217} {"train_loss": -5.829370498657227, "global_step": 51136, "epoch": 1217} {"train_loss": -5.754219055175781, "global_step": 51137, "epoch": 1217} {"train_loss": -5.851947784423828, "global_step": 51138, "epoch": 1217} {"train_loss": -5.833923816680908, "global_step": 51139, "epoch": 1217} {"train_loss": -5.859607696533203, "global_step": 51140, "epoch": 1217} {"train_loss": -5.7868523597717285, "global_step": 51141, "epoch": 1217} {"train_loss": -5.808051586151123, "global_step": 51142, "epoch": 1217} {"train_loss": -5.7053022384643555, "global_step": 51143, "epoch": 1217} {"train_loss": -5.737296104431152, "global_step": 51144, "epoch": 1217} {"train_loss": -5.743223190307617, "global_step": 51145, "epoch": 1217} {"train_loss": -5.76066780090332, "global_step": 51146, "epoch": 1217} {"train_loss": -5.749369144439697, "global_step": 51147, "epoch": 1217} {"train_loss": -5.77227783203125, "global_step": 51148, "epoch": 1217} {"train_loss": -5.765996932983398, "global_step": 51149, "epoch": 1217} {"train_loss": -5.899680137634277, "global_step": 51150, "epoch": 1217} {"train_loss": -5.834131717681885, "global_step": 51151, "epoch": 1217} {"train_loss": -5.849889755249023, "global_step": 51152, "epoch": 1217} {"train_loss": -5.684421539306641, "global_step": 51153, "epoch": 1217} {"train_loss": -5.7323198318481445, "global_step": 51154, "epoch": 1217} {"train_loss": -5.798579216003418, "global_step": 51155, "epoch": 1217, "val_loss": 61393.5625} {"train_loss": -5.850436210632324, "global_step": 51156, "epoch": 1218} {"train_loss": -5.838698387145996, "global_step": 51157, "epoch": 1218} {"train_loss": -5.8335280418396, "global_step": 51158, "epoch": 1218} {"train_loss": -5.882379531860352, "global_step": 51159, "epoch": 1218} {"train_loss": -5.928382396697998, "global_step": 51160, "epoch": 1218} {"train_loss": -5.7102484703063965, "global_step": 51161, "epoch": 1218} {"train_loss": -5.77642822265625, "global_step": 51162, "epoch": 1218} {"train_loss": -5.794051170349121, "global_step": 51163, "epoch": 1218} {"train_loss": -5.849575042724609, "global_step": 51164, "epoch": 1218} {"train_loss": -5.723475456237793, "global_step": 51165, "epoch": 1218} {"train_loss": -5.7470197677612305, "global_step": 51166, "epoch": 1218} {"train_loss": -5.807425498962402, "global_step": 51167, "epoch": 1218} {"train_loss": -5.774774551391602, "global_step": 51168, "epoch": 1218} {"train_loss": -5.784021377563477, "global_step": 51169, "epoch": 1218} {"train_loss": -5.77043342590332, "global_step": 51170, "epoch": 1218} {"train_loss": -5.649500846862793, "global_step": 51171, "epoch": 1218} {"train_loss": -5.7764081954956055, "global_step": 51172, "epoch": 1218} {"train_loss": -5.806614875793457, "global_step": 51173, "epoch": 1218} {"train_loss": -5.7859206199646, "global_step": 51174, "epoch": 1218} {"train_loss": -5.8243794441223145, "global_step": 51175, "epoch": 1218} {"train_loss": -5.743680953979492, "global_step": 51176, "epoch": 1218} {"train_loss": -5.774077415466309, "global_step": 51177, "epoch": 1218} {"train_loss": -5.896350383758545, "global_step": 51178, "epoch": 1218} {"train_loss": -5.700165748596191, "global_step": 51179, "epoch": 1218} {"train_loss": -5.841026306152344, "global_step": 51180, "epoch": 1218} {"train_loss": -5.880830764770508, "global_step": 51181, "epoch": 1218} {"train_loss": -5.763210296630859, "global_step": 51182, "epoch": 1218} {"train_loss": -5.697861194610596, "global_step": 51183, "epoch": 1218} {"train_loss": -5.809674263000488, "global_step": 51184, "epoch": 1218} {"train_loss": -5.83392333984375, "global_step": 51185, "epoch": 1218} {"train_loss": -5.584386348724365, "global_step": 51186, "epoch": 1218} {"train_loss": -5.863336086273193, "global_step": 51187, "epoch": 1218} {"train_loss": -5.720740795135498, "global_step": 51188, "epoch": 1218} {"train_loss": -5.739433765411377, "global_step": 51189, "epoch": 1218} {"train_loss": -5.809403419494629, "global_step": 51190, "epoch": 1218} {"train_loss": -5.727776050567627, "global_step": 51191, "epoch": 1218} {"train_loss": -5.809780120849609, "global_step": 51192, "epoch": 1218} {"train_loss": -5.663891792297363, "global_step": 51193, "epoch": 1218} {"train_loss": -5.863957405090332, "global_step": 51194, "epoch": 1218} {"train_loss": -5.880680561065674, "global_step": 51195, "epoch": 1218} {"train_loss": -5.729341506958008, "global_step": 51196, "epoch": 1218} {"train_loss": -5.785810186749413, "global_step": 51197, "epoch": 1218, "val_loss": 61377.62890625} {"train_loss": -5.637246608734131, "global_step": 51198, "epoch": 1219} {"train_loss": -5.675195217132568, "global_step": 51199, "epoch": 1219} {"train_loss": -5.77454137802124, "global_step": 51200, "epoch": 1219} {"train_loss": -5.963902473449707, "global_step": 51201, "epoch": 1219} {"train_loss": -5.681000709533691, "global_step": 51202, "epoch": 1219} {"train_loss": -5.820420265197754, "global_step": 51203, "epoch": 1219} {"train_loss": -5.741344451904297, "global_step": 51204, "epoch": 1219} {"train_loss": -5.7686448097229, "global_step": 51205, "epoch": 1219} {"train_loss": -5.801148414611816, "global_step": 51206, "epoch": 1219} {"train_loss": -5.754439353942871, "global_step": 51207, "epoch": 1219} {"train_loss": -5.818447589874268, "global_step": 51208, "epoch": 1219} {"train_loss": -5.804302215576172, "global_step": 51209, "epoch": 1219} {"train_loss": -5.801288604736328, "global_step": 51210, "epoch": 1219} {"train_loss": -5.775017738342285, "global_step": 51211, "epoch": 1219} {"train_loss": -5.829934120178223, "global_step": 51212, "epoch": 1219} {"train_loss": -5.8763957023620605, "global_step": 51213, "epoch": 1219} {"train_loss": -5.775573253631592, "global_step": 51214, "epoch": 1219} {"train_loss": -5.806760311126709, "global_step": 51215, "epoch": 1219} {"train_loss": -5.828682899475098, "global_step": 51216, "epoch": 1219} {"train_loss": -5.655714988708496, "global_step": 51217, "epoch": 1219} {"train_loss": -5.7914838790893555, "global_step": 51218, "epoch": 1219} {"train_loss": -5.6670451164245605, "global_step": 51219, "epoch": 1219} {"train_loss": -5.812045574188232, "global_step": 51220, "epoch": 1219} {"train_loss": -5.750557899475098, "global_step": 51221, "epoch": 1219} {"train_loss": -5.764557838439941, "global_step": 51222, "epoch": 1219} {"train_loss": -5.773715019226074, "global_step": 51223, "epoch": 1219} {"train_loss": -5.898205757141113, "global_step": 51224, "epoch": 1219} {"train_loss": -5.8475470542907715, "global_step": 51225, "epoch": 1219} {"train_loss": -5.745743751525879, "global_step": 51226, "epoch": 1219} {"train_loss": -5.7696027755737305, "global_step": 51227, "epoch": 1219} {"train_loss": -5.804855823516846, "global_step": 51228, "epoch": 1219} {"train_loss": -5.761377811431885, "global_step": 51229, "epoch": 1219} {"train_loss": -5.807892322540283, "global_step": 51230, "epoch": 1219} {"train_loss": -5.7284135818481445, "global_step": 51231, "epoch": 1219} {"train_loss": -5.902405738830566, "global_step": 51232, "epoch": 1219} {"train_loss": -5.881324768066406, "global_step": 51233, "epoch": 1219} {"train_loss": -5.692291259765625, "global_step": 51234, "epoch": 1219} {"train_loss": -5.713617324829102, "global_step": 51235, "epoch": 1219} {"train_loss": -5.930872917175293, "global_step": 51236, "epoch": 1219} {"train_loss": -5.7188520431518555, "global_step": 51237, "epoch": 1219} {"train_loss": -5.626829147338867, "global_step": 51238, "epoch": 1219} {"train_loss": -5.781058493114653, "global_step": 51239, "epoch": 1219, "val_loss": 61574.07421875} {"train_loss": -5.820557594299316, "global_step": 51240, "epoch": 1220} {"train_loss": -5.739030838012695, "global_step": 51241, "epoch": 1220} {"train_loss": -5.843992233276367, "global_step": 51242, "epoch": 1220} {"train_loss": -5.687239646911621, "global_step": 51243, "epoch": 1220} {"train_loss": -5.817196846008301, "global_step": 51244, "epoch": 1220} {"train_loss": -5.827360153198242, "global_step": 51245, "epoch": 1220} {"train_loss": -5.801207065582275, "global_step": 51246, "epoch": 1220} {"train_loss": -5.771395683288574, "global_step": 51247, "epoch": 1220} {"train_loss": -5.828038215637207, "global_step": 51248, "epoch": 1220} {"train_loss": -5.865971565246582, "global_step": 51249, "epoch": 1220} {"train_loss": -5.822825908660889, "global_step": 51250, "epoch": 1220} {"train_loss": -5.813394546508789, "global_step": 51251, "epoch": 1220} {"train_loss": -5.753746032714844, "global_step": 51252, "epoch": 1220} {"train_loss": -5.793779373168945, "global_step": 51253, "epoch": 1220} {"train_loss": -5.8133955001831055, "global_step": 51254, "epoch": 1220} {"train_loss": -5.81374454498291, "global_step": 51255, "epoch": 1220} {"train_loss": -5.870372772216797, "global_step": 51256, "epoch": 1220} {"train_loss": -5.712785243988037, "global_step": 51257, "epoch": 1220} {"train_loss": -5.849605083465576, "global_step": 51258, "epoch": 1220} {"train_loss": -5.757607936859131, "global_step": 51259, "epoch": 1220} {"train_loss": -5.864253997802734, "global_step": 51260, "epoch": 1220} {"train_loss": -5.787017822265625, "global_step": 51261, "epoch": 1220} {"train_loss": -5.9154462814331055, "global_step": 51262, "epoch": 1220} {"train_loss": -5.774286270141602, "global_step": 51263, "epoch": 1220} {"train_loss": -5.817945957183838, "global_step": 51264, "epoch": 1220} {"train_loss": -5.970357894897461, "global_step": 51265, "epoch": 1220} {"train_loss": -5.900840759277344, "global_step": 51266, "epoch": 1220} {"train_loss": -5.715573310852051, "global_step": 51267, "epoch": 1220} {"train_loss": -5.720211982727051, "global_step": 51268, "epoch": 1220} {"train_loss": -5.860901832580566, "global_step": 51269, "epoch": 1220} {"train_loss": -5.751044273376465, "global_step": 51270, "epoch": 1220} {"train_loss": -5.719113349914551, "global_step": 51271, "epoch": 1220} {"train_loss": -5.725449562072754, "global_step": 51272, "epoch": 1220} {"train_loss": -5.757399559020996, "global_step": 51273, "epoch": 1220} {"train_loss": -5.756468772888184, "global_step": 51274, "epoch": 1220} {"train_loss": -5.847471237182617, "global_step": 51275, "epoch": 1220} {"train_loss": -5.741738319396973, "global_step": 51276, "epoch": 1220} {"train_loss": -5.791402816772461, "global_step": 51277, "epoch": 1220} {"train_loss": -5.773444175720215, "global_step": 51278, "epoch": 1220} {"train_loss": -5.663404941558838, "global_step": 51279, "epoch": 1220} {"train_loss": -5.863080024719238, "global_step": 51280, "epoch": 1220} {"train_loss": -5.795779080617995, "global_step": 51281, "epoch": 1220, "val_loss": 61392.87109375} {"train_loss": -5.818016052246094, "global_step": 51282, "epoch": 1221} {"train_loss": -5.816605567932129, "global_step": 51283, "epoch": 1221} {"train_loss": -5.737822532653809, "global_step": 51284, "epoch": 1221} {"train_loss": -5.914860725402832, "global_step": 51285, "epoch": 1221} {"train_loss": -5.774786472320557, "global_step": 51286, "epoch": 1221} {"train_loss": -5.780409336090088, "global_step": 51287, "epoch": 1221} {"train_loss": -5.924130439758301, "global_step": 51288, "epoch": 1221} {"train_loss": -5.723529815673828, "global_step": 51289, "epoch": 1221} {"train_loss": -5.8054351806640625, "global_step": 51290, "epoch": 1221} {"train_loss": -5.810037612915039, "global_step": 51291, "epoch": 1221} {"train_loss": -5.816649913787842, "global_step": 51292, "epoch": 1221} {"train_loss": -5.6251702308654785, "global_step": 51293, "epoch": 1221} {"train_loss": -5.77353572845459, "global_step": 51294, "epoch": 1221} {"train_loss": -5.696708679199219, "global_step": 51295, "epoch": 1221} {"train_loss": -5.857264518737793, "global_step": 51296, "epoch": 1221} {"train_loss": -5.746269226074219, "global_step": 51297, "epoch": 1221} {"train_loss": -5.863828659057617, "global_step": 51298, "epoch": 1221} {"train_loss": -5.93813419342041, "global_step": 51299, "epoch": 1221} {"train_loss": -5.787785053253174, "global_step": 51300, "epoch": 1221} {"train_loss": -5.833200454711914, "global_step": 51301, "epoch": 1221} {"train_loss": -5.8128132820129395, "global_step": 51302, "epoch": 1221} {"train_loss": -5.851701736450195, "global_step": 51303, "epoch": 1221} {"train_loss": -5.490367889404297, "global_step": 51304, "epoch": 1221} {"train_loss": -5.846414566040039, "global_step": 51305, "epoch": 1221} {"train_loss": -5.763467788696289, "global_step": 51306, "epoch": 1221} {"train_loss": -5.68671989440918, "global_step": 51307, "epoch": 1221} {"train_loss": -5.791852951049805, "global_step": 51308, "epoch": 1221} {"train_loss": -5.843328475952148, "global_step": 51309, "epoch": 1221} {"train_loss": -5.654749393463135, "global_step": 51310, "epoch": 1221} {"train_loss": -5.827940464019775, "global_step": 51311, "epoch": 1221} {"train_loss": -5.83133602142334, "global_step": 51312, "epoch": 1221} {"train_loss": -5.770181655883789, "global_step": 51313, "epoch": 1221} {"train_loss": -5.836087226867676, "global_step": 51314, "epoch": 1221} {"train_loss": -5.760392189025879, "global_step": 51315, "epoch": 1221} {"train_loss": -5.8748345375061035, "global_step": 51316, "epoch": 1221} {"train_loss": -5.853930473327637, "global_step": 51317, "epoch": 1221} {"train_loss": -5.83148193359375, "global_step": 51318, "epoch": 1221} {"train_loss": -5.798598289489746, "global_step": 51319, "epoch": 1221} {"train_loss": -5.783679008483887, "global_step": 51320, "epoch": 1221} {"train_loss": -5.822362422943115, "global_step": 51321, "epoch": 1221} {"train_loss": -5.769864559173584, "global_step": 51322, "epoch": 1221} {"train_loss": -5.7934628781818205, "global_step": 51323, "epoch": 1221, "val_loss": 61587.984375} {"train_loss": -5.806821346282959, "global_step": 51324, "epoch": 1222} {"train_loss": -5.7327423095703125, "global_step": 51325, "epoch": 1222} {"train_loss": -5.6818952560424805, "global_step": 51326, "epoch": 1222} {"train_loss": -5.769293308258057, "global_step": 51327, "epoch": 1222} {"train_loss": -5.809408664703369, "global_step": 51328, "epoch": 1222} {"train_loss": -5.6706414222717285, "global_step": 51329, "epoch": 1222} {"train_loss": -5.865550518035889, "global_step": 51330, "epoch": 1222} {"train_loss": -5.762187957763672, "global_step": 51331, "epoch": 1222} {"train_loss": -5.7894511222839355, "global_step": 51332, "epoch": 1222} {"train_loss": -5.845186233520508, "global_step": 51333, "epoch": 1222} {"train_loss": -5.862362861633301, "global_step": 51334, "epoch": 1222} {"train_loss": -5.771337509155273, "global_step": 51335, "epoch": 1222} {"train_loss": -5.680685997009277, "global_step": 51336, "epoch": 1222} {"train_loss": -5.760467529296875, "global_step": 51337, "epoch": 1222} {"train_loss": -5.845985412597656, "global_step": 51338, "epoch": 1222} {"train_loss": -5.808371067047119, "global_step": 51339, "epoch": 1222} {"train_loss": -5.867368221282959, "global_step": 51340, "epoch": 1222} {"train_loss": -5.85134744644165, "global_step": 51341, "epoch": 1222} {"train_loss": -5.679203987121582, "global_step": 51342, "epoch": 1222} {"train_loss": -5.756541728973389, "global_step": 51343, "epoch": 1222} {"train_loss": -5.696175575256348, "global_step": 51344, "epoch": 1222} {"train_loss": -5.948330879211426, "global_step": 51345, "epoch": 1222} {"train_loss": -5.810277938842773, "global_step": 51346, "epoch": 1222} {"train_loss": -5.815203666687012, "global_step": 51347, "epoch": 1222} {"train_loss": -5.869485855102539, "global_step": 51348, "epoch": 1222} {"train_loss": -5.825024604797363, "global_step": 51349, "epoch": 1222} {"train_loss": -5.76816463470459, "global_step": 51350, "epoch": 1222} {"train_loss": -5.750917911529541, "global_step": 51351, "epoch": 1222} {"train_loss": -5.821866035461426, "global_step": 51352, "epoch": 1222} {"train_loss": -5.866528511047363, "global_step": 51353, "epoch": 1222} {"train_loss": -5.747793197631836, "global_step": 51354, "epoch": 1222} {"train_loss": -5.816518783569336, "global_step": 51355, "epoch": 1222} {"train_loss": -5.803958892822266, "global_step": 51356, "epoch": 1222} {"train_loss": -5.725994110107422, "global_step": 51357, "epoch": 1222} {"train_loss": -5.850068092346191, "global_step": 51358, "epoch": 1222} {"train_loss": -5.798369407653809, "global_step": 51359, "epoch": 1222} {"train_loss": -5.792902946472168, "global_step": 51360, "epoch": 1222} {"train_loss": -5.812330722808838, "global_step": 51361, "epoch": 1222} {"train_loss": -5.743422985076904, "global_step": 51362, "epoch": 1222} {"train_loss": -5.7803449630737305, "global_step": 51363, "epoch": 1222} {"train_loss": -5.759407997131348, "global_step": 51364, "epoch": 1222} {"train_loss": -5.791566224325271, "global_step": 51365, "epoch": 1222, "val_loss": 61419.9453125} {"train_loss": -5.715435028076172, "global_step": 51366, "epoch": 1223} {"train_loss": -5.86393928527832, "global_step": 51367, "epoch": 1223} {"train_loss": -5.73574161529541, "global_step": 51368, "epoch": 1223} {"train_loss": -5.781243324279785, "global_step": 51369, "epoch": 1223} {"train_loss": -5.845067024230957, "global_step": 51370, "epoch": 1223} {"train_loss": -5.851598739624023, "global_step": 51371, "epoch": 1223} {"train_loss": -5.720311641693115, "global_step": 51372, "epoch": 1223} {"train_loss": -5.850869178771973, "global_step": 51373, "epoch": 1223} {"train_loss": -5.835169792175293, "global_step": 51374, "epoch": 1223} {"train_loss": -5.710959434509277, "global_step": 51375, "epoch": 1223} {"train_loss": -5.898151397705078, "global_step": 51376, "epoch": 1223} {"train_loss": -5.766690731048584, "global_step": 51377, "epoch": 1223} {"train_loss": -5.916499614715576, "global_step": 51378, "epoch": 1223} {"train_loss": -5.783326625823975, "global_step": 51379, "epoch": 1223} {"train_loss": -5.781216621398926, "global_step": 51380, "epoch": 1223} {"train_loss": -5.69633674621582, "global_step": 51381, "epoch": 1223} {"train_loss": -5.661439895629883, "global_step": 51382, "epoch": 1223} {"train_loss": -5.847221374511719, "global_step": 51383, "epoch": 1223} {"train_loss": -5.822444915771484, "global_step": 51384, "epoch": 1223} {"train_loss": -5.775972843170166, "global_step": 51385, "epoch": 1223} {"train_loss": -5.7599334716796875, "global_step": 51386, "epoch": 1223} {"train_loss": -5.718951225280762, "global_step": 51387, "epoch": 1223} {"train_loss": -5.841763496398926, "global_step": 51388, "epoch": 1223} {"train_loss": -5.890078544616699, "global_step": 51389, "epoch": 1223} {"train_loss": -5.715329170227051, "global_step": 51390, "epoch": 1223} {"train_loss": -5.8184003829956055, "global_step": 51391, "epoch": 1223} {"train_loss": -5.741395950317383, "global_step": 51392, "epoch": 1223} {"train_loss": -5.816873550415039, "global_step": 51393, "epoch": 1223} {"train_loss": -5.812798500061035, "global_step": 51394, "epoch": 1223} {"train_loss": -5.77946662902832, "global_step": 51395, "epoch": 1223} {"train_loss": -5.79262113571167, "global_step": 51396, "epoch": 1223} {"train_loss": -5.788125514984131, "global_step": 51397, "epoch": 1223} {"train_loss": -5.894208908081055, "global_step": 51398, "epoch": 1223} {"train_loss": -5.711081504821777, "global_step": 51399, "epoch": 1223} {"train_loss": -5.76783561706543, "global_step": 51400, "epoch": 1223} {"train_loss": -5.615778923034668, "global_step": 51401, "epoch": 1223} {"train_loss": -5.788519859313965, "global_step": 51402, "epoch": 1223} {"train_loss": -5.735093116760254, "global_step": 51403, "epoch": 1223} {"train_loss": -5.657876968383789, "global_step": 51404, "epoch": 1223} {"train_loss": -5.9604387283325195, "global_step": 51405, "epoch": 1223} {"train_loss": -5.724358558654785, "global_step": 51406, "epoch": 1223} {"train_loss": -5.78456821895781, "global_step": 51407, "epoch": 1223, "val_loss": 61454.32421875} {"train_loss": -5.850471496582031, "global_step": 51408, "epoch": 1224} {"train_loss": -5.819589614868164, "global_step": 51409, "epoch": 1224} {"train_loss": -5.874546527862549, "global_step": 51410, "epoch": 1224} {"train_loss": -5.8671555519104, "global_step": 51411, "epoch": 1224} {"train_loss": -5.656890392303467, "global_step": 51412, "epoch": 1224} {"train_loss": -5.811664581298828, "global_step": 51413, "epoch": 1224} {"train_loss": -5.77308464050293, "global_step": 51414, "epoch": 1224} {"train_loss": -5.7464799880981445, "global_step": 51415, "epoch": 1224} {"train_loss": -5.852267265319824, "global_step": 51416, "epoch": 1224} {"train_loss": -5.8154497146606445, "global_step": 51417, "epoch": 1224} {"train_loss": -5.890002250671387, "global_step": 51418, "epoch": 1224} {"train_loss": -5.753924369812012, "global_step": 51419, "epoch": 1224} {"train_loss": -5.770416259765625, "global_step": 51420, "epoch": 1224} {"train_loss": -5.777936935424805, "global_step": 51421, "epoch": 1224} {"train_loss": -5.800386428833008, "global_step": 51422, "epoch": 1224} {"train_loss": -5.831814289093018, "global_step": 51423, "epoch": 1224} {"train_loss": -5.884888648986816, "global_step": 51424, "epoch": 1224} {"train_loss": -5.837747573852539, "global_step": 51425, "epoch": 1224} {"train_loss": -5.834934234619141, "global_step": 51426, "epoch": 1224} {"train_loss": -5.750123977661133, "global_step": 51427, "epoch": 1224} {"train_loss": -5.870951175689697, "global_step": 51428, "epoch": 1224} {"train_loss": -5.820279121398926, "global_step": 51429, "epoch": 1224} {"train_loss": -5.785644054412842, "global_step": 51430, "epoch": 1224} {"train_loss": -5.825973033905029, "global_step": 51431, "epoch": 1224} {"train_loss": -5.8987579345703125, "global_step": 51432, "epoch": 1224} {"train_loss": -5.8606343269348145, "global_step": 51433, "epoch": 1224} {"train_loss": -5.646563529968262, "global_step": 51434, "epoch": 1224} {"train_loss": -5.780813694000244, "global_step": 51435, "epoch": 1224} {"train_loss": -5.846566200256348, "global_step": 51436, "epoch": 1224} {"train_loss": -5.754522800445557, "global_step": 51437, "epoch": 1224} {"train_loss": -5.807369232177734, "global_step": 51438, "epoch": 1224} {"train_loss": -5.802267074584961, "global_step": 51439, "epoch": 1224} {"train_loss": -5.684466361999512, "global_step": 51440, "epoch": 1224} {"train_loss": -5.713606357574463, "global_step": 51441, "epoch": 1224} {"train_loss": -5.736488342285156, "global_step": 51442, "epoch": 1224} {"train_loss": -5.799007892608643, "global_step": 51443, "epoch": 1224} {"train_loss": -5.865340232849121, "global_step": 51444, "epoch": 1224} {"train_loss": -5.81682014465332, "global_step": 51445, "epoch": 1224} {"train_loss": -5.804233074188232, "global_step": 51446, "epoch": 1224} {"train_loss": -5.77394437789917, "global_step": 51447, "epoch": 1224} {"train_loss": -5.740747451782227, "global_step": 51448, "epoch": 1224} {"train_loss": -5.801728657313755, "global_step": 51449, "epoch": 1224, "val_loss": 61337.43359375} {"train_loss": -5.896976470947266, "global_step": 51450, "epoch": 1225} {"train_loss": -5.855746269226074, "global_step": 51451, "epoch": 1225} {"train_loss": -5.717334747314453, "global_step": 51452, "epoch": 1225} {"train_loss": -5.81110954284668, "global_step": 51453, "epoch": 1225} {"train_loss": -5.826919078826904, "global_step": 51454, "epoch": 1225} {"train_loss": -5.874927520751953, "global_step": 51455, "epoch": 1225} {"train_loss": -5.791350364685059, "global_step": 51456, "epoch": 1225} {"train_loss": -5.776690483093262, "global_step": 51457, "epoch": 1225} {"train_loss": -5.8628668785095215, "global_step": 51458, "epoch": 1225} {"train_loss": -5.689394474029541, "global_step": 51459, "epoch": 1225} {"train_loss": -5.806715965270996, "global_step": 51460, "epoch": 1225} {"train_loss": -5.826709747314453, "global_step": 51461, "epoch": 1225} {"train_loss": -5.725196838378906, "global_step": 51462, "epoch": 1225} {"train_loss": -5.859399795532227, "global_step": 51463, "epoch": 1225} {"train_loss": -5.850112438201904, "global_step": 51464, "epoch": 1225} {"train_loss": -5.735413551330566, "global_step": 51465, "epoch": 1225} {"train_loss": -5.7141923904418945, "global_step": 51466, "epoch": 1225} {"train_loss": -5.925666809082031, "global_step": 51467, "epoch": 1225} {"train_loss": -5.745911121368408, "global_step": 51468, "epoch": 1225} {"train_loss": -5.826113224029541, "global_step": 51469, "epoch": 1225} {"train_loss": -5.66262674331665, "global_step": 51470, "epoch": 1225} {"train_loss": -5.821211338043213, "global_step": 51471, "epoch": 1225} {"train_loss": -5.855649948120117, "global_step": 51472, "epoch": 1225} {"train_loss": -5.730619430541992, "global_step": 51473, "epoch": 1225} {"train_loss": -5.744797706604004, "global_step": 51474, "epoch": 1225} {"train_loss": -5.655719757080078, "global_step": 51475, "epoch": 1225} {"train_loss": -5.797881126403809, "global_step": 51476, "epoch": 1225} {"train_loss": -5.534390926361084, "global_step": 51477, "epoch": 1225} {"train_loss": -5.80128288269043, "global_step": 51478, "epoch": 1225} {"train_loss": -5.661163330078125, "global_step": 51479, "epoch": 1225} {"train_loss": -5.669417381286621, "global_step": 51480, "epoch": 1225} {"train_loss": -5.7787885665893555, "global_step": 51481, "epoch": 1225} {"train_loss": -5.716296195983887, "global_step": 51482, "epoch": 1225} {"train_loss": -5.778963088989258, "global_step": 51483, "epoch": 1225} {"train_loss": -5.772712707519531, "global_step": 51484, "epoch": 1225} {"train_loss": -5.776554107666016, "global_step": 51485, "epoch": 1225} {"train_loss": -5.78818416595459, "global_step": 51486, "epoch": 1225} {"train_loss": -5.677838325500488, "global_step": 51487, "epoch": 1225} {"train_loss": -5.735931396484375, "global_step": 51488, "epoch": 1225} {"train_loss": -5.646120071411133, "global_step": 51489, "epoch": 1225} {"train_loss": -5.783206939697266, "global_step": 51490, "epoch": 1225} {"train_loss": -5.766302108764648, "global_step": 51491, "epoch": 1225, "val_loss": 61349.80078125} {"train_loss": -5.795160293579102, "global_step": 51492, "epoch": 1226} {"train_loss": -5.675225257873535, "global_step": 51493, "epoch": 1226} {"train_loss": -5.76666784286499, "global_step": 51494, "epoch": 1226} {"train_loss": -5.784204006195068, "global_step": 51495, "epoch": 1226} {"train_loss": -5.803303241729736, "global_step": 51496, "epoch": 1226} {"train_loss": -5.725121021270752, "global_step": 51497, "epoch": 1226} {"train_loss": -5.683785915374756, "global_step": 51498, "epoch": 1226} {"train_loss": -5.682050704956055, "global_step": 51499, "epoch": 1226} {"train_loss": -5.742952346801758, "global_step": 51500, "epoch": 1226} {"train_loss": -5.7222747802734375, "global_step": 51501, "epoch": 1226} {"train_loss": -5.762945175170898, "global_step": 51502, "epoch": 1226} {"train_loss": -5.675555229187012, "global_step": 51503, "epoch": 1226} {"train_loss": -5.747054100036621, "global_step": 51504, "epoch": 1226} {"train_loss": -5.728452205657959, "global_step": 51505, "epoch": 1226} {"train_loss": -5.818257808685303, "global_step": 51506, "epoch": 1226} {"train_loss": -5.714210033416748, "global_step": 51507, "epoch": 1226} {"train_loss": -5.8234477043151855, "global_step": 51508, "epoch": 1226} {"train_loss": -5.729752063751221, "global_step": 51509, "epoch": 1226} {"train_loss": -5.7147440910339355, "global_step": 51510, "epoch": 1226} {"train_loss": -5.7556610107421875, "global_step": 51511, "epoch": 1226} {"train_loss": -5.797603607177734, "global_step": 51512, "epoch": 1226} {"train_loss": -5.830698013305664, "global_step": 51513, "epoch": 1226} {"train_loss": -5.758227348327637, "global_step": 51514, "epoch": 1226} {"train_loss": -5.7822265625, "global_step": 51515, "epoch": 1226} {"train_loss": -5.848563194274902, "global_step": 51516, "epoch": 1226} {"train_loss": -5.779890537261963, "global_step": 51517, "epoch": 1226} {"train_loss": -5.785092353820801, "global_step": 51518, "epoch": 1226} {"train_loss": -5.842053413391113, "global_step": 51519, "epoch": 1226} {"train_loss": -5.769190311431885, "global_step": 51520, "epoch": 1226} {"train_loss": -5.7795257568359375, "global_step": 51521, "epoch": 1226} {"train_loss": -5.778251647949219, "global_step": 51522, "epoch": 1226} {"train_loss": -5.80794095993042, "global_step": 51523, "epoch": 1226} {"train_loss": -5.823793411254883, "global_step": 51524, "epoch": 1226} {"train_loss": -5.896463394165039, "global_step": 51525, "epoch": 1226} {"train_loss": -5.7485246658325195, "global_step": 51526, "epoch": 1226} {"train_loss": -5.869945526123047, "global_step": 51527, "epoch": 1226} {"train_loss": -5.640765190124512, "global_step": 51528, "epoch": 1226} {"train_loss": -5.809233665466309, "global_step": 51529, "epoch": 1226} {"train_loss": -5.724140167236328, "global_step": 51530, "epoch": 1226} {"train_loss": -5.77973747253418, "global_step": 51531, "epoch": 1226} {"train_loss": -5.64939546585083, "global_step": 51532, "epoch": 1226} {"train_loss": -5.7643459524427145, "global_step": 51533, "epoch": 1226, "val_loss": 61725.546875} {"train_loss": -5.678875923156738, "global_step": 51534, "epoch": 1227} {"train_loss": -5.818790912628174, "global_step": 51535, "epoch": 1227} {"train_loss": -5.755099296569824, "global_step": 51536, "epoch": 1227} {"train_loss": -5.876694679260254, "global_step": 51537, "epoch": 1227} {"train_loss": -5.764325141906738, "global_step": 51538, "epoch": 1227} {"train_loss": -5.714241981506348, "global_step": 51539, "epoch": 1227} {"train_loss": -5.612748622894287, "global_step": 51540, "epoch": 1227} {"train_loss": -5.875129699707031, "global_step": 51541, "epoch": 1227} {"train_loss": -5.744892120361328, "global_step": 51542, "epoch": 1227} {"train_loss": -5.683073043823242, "global_step": 51543, "epoch": 1227} {"train_loss": -5.770328521728516, "global_step": 51544, "epoch": 1227} {"train_loss": -5.698869228363037, "global_step": 51545, "epoch": 1227} {"train_loss": -5.829905986785889, "global_step": 51546, "epoch": 1227} {"train_loss": -5.860565185546875, "global_step": 51547, "epoch": 1227} {"train_loss": -5.8181915283203125, "global_step": 51548, "epoch": 1227} {"train_loss": -5.711249351501465, "global_step": 51549, "epoch": 1227} {"train_loss": -5.781284332275391, "global_step": 51550, "epoch": 1227} {"train_loss": -5.835360527038574, "global_step": 51551, "epoch": 1227} {"train_loss": -5.729774475097656, "global_step": 51552, "epoch": 1227} {"train_loss": -5.811886787414551, "global_step": 51553, "epoch": 1227} {"train_loss": -5.725429534912109, "global_step": 51554, "epoch": 1227} {"train_loss": -5.672933578491211, "global_step": 51555, "epoch": 1227} {"train_loss": -5.957988739013672, "global_step": 51556, "epoch": 1227} {"train_loss": -5.71081018447876, "global_step": 51557, "epoch": 1227} {"train_loss": -5.7456464767456055, "global_step": 51558, "epoch": 1227} {"train_loss": -5.7306742668151855, "global_step": 51559, "epoch": 1227} {"train_loss": -5.712223052978516, "global_step": 51560, "epoch": 1227} {"train_loss": -5.702796936035156, "global_step": 51561, "epoch": 1227} {"train_loss": -5.771520137786865, "global_step": 51562, "epoch": 1227} {"train_loss": -5.814329147338867, "global_step": 51563, "epoch": 1227} {"train_loss": -5.94253396987915, "global_step": 51564, "epoch": 1227} {"train_loss": -5.786327838897705, "global_step": 51565, "epoch": 1227} {"train_loss": -5.803804397583008, "global_step": 51566, "epoch": 1227} {"train_loss": -5.918950080871582, "global_step": 51567, "epoch": 1227} {"train_loss": -5.900745868682861, "global_step": 51568, "epoch": 1227} {"train_loss": -5.735233306884766, "global_step": 51569, "epoch": 1227} {"train_loss": -5.7933573722839355, "global_step": 51570, "epoch": 1227} {"train_loss": -5.856032371520996, "global_step": 51571, "epoch": 1227} {"train_loss": -5.859309196472168, "global_step": 51572, "epoch": 1227} {"train_loss": -5.7761993408203125, "global_step": 51573, "epoch": 1227} {"train_loss": -5.83745002746582, "global_step": 51574, "epoch": 1227} {"train_loss": -5.7818933100927445, "global_step": 51575, "epoch": 1227, "val_loss": 61968.65234375} {"train_loss": -5.711263179779053, "global_step": 51576, "epoch": 1228} {"train_loss": -5.800103664398193, "global_step": 51577, "epoch": 1228} {"train_loss": -5.866184234619141, "global_step": 51578, "epoch": 1228} {"train_loss": -5.7869133949279785, "global_step": 51579, "epoch": 1228} {"train_loss": -5.802723407745361, "global_step": 51580, "epoch": 1228} {"train_loss": -5.779903411865234, "global_step": 51581, "epoch": 1228} {"train_loss": -5.8549346923828125, "global_step": 51582, "epoch": 1228} {"train_loss": -5.801589012145996, "global_step": 51583, "epoch": 1228} {"train_loss": -5.914767265319824, "global_step": 51584, "epoch": 1228} {"train_loss": -5.724608421325684, "global_step": 51585, "epoch": 1228} {"train_loss": -5.805320739746094, "global_step": 51586, "epoch": 1228} {"train_loss": -5.821331977844238, "global_step": 51587, "epoch": 1228} {"train_loss": -5.874955177307129, "global_step": 51588, "epoch": 1228} {"train_loss": -5.788017272949219, "global_step": 51589, "epoch": 1228} {"train_loss": -5.747768402099609, "global_step": 51590, "epoch": 1228} {"train_loss": -5.823846340179443, "global_step": 51591, "epoch": 1228} {"train_loss": -5.9012451171875, "global_step": 51592, "epoch": 1228} {"train_loss": -5.858797073364258, "global_step": 51593, "epoch": 1228} {"train_loss": -5.791437149047852, "global_step": 51594, "epoch": 1228} {"train_loss": -5.808911323547363, "global_step": 51595, "epoch": 1228} {"train_loss": -5.929468154907227, "global_step": 51596, "epoch": 1228} {"train_loss": -5.811267852783203, "global_step": 51597, "epoch": 1228} {"train_loss": -5.829481601715088, "global_step": 51598, "epoch": 1228} {"train_loss": -5.647505760192871, "global_step": 51599, "epoch": 1228} {"train_loss": -5.852354049682617, "global_step": 51600, "epoch": 1228} {"train_loss": -5.778630256652832, "global_step": 51601, "epoch": 1228} {"train_loss": -5.749963760375977, "global_step": 51602, "epoch": 1228} {"train_loss": -5.7485032081604, "global_step": 51603, "epoch": 1228} {"train_loss": -5.701231479644775, "global_step": 51604, "epoch": 1228} {"train_loss": -5.869110584259033, "global_step": 51605, "epoch": 1228} {"train_loss": -5.823134422302246, "global_step": 51606, "epoch": 1228} {"train_loss": -5.76633358001709, "global_step": 51607, "epoch": 1228} {"train_loss": -5.715359687805176, "global_step": 51608, "epoch": 1228} {"train_loss": -5.817150115966797, "global_step": 51609, "epoch": 1228} {"train_loss": -5.695179462432861, "global_step": 51610, "epoch": 1228} {"train_loss": -5.752814292907715, "global_step": 51611, "epoch": 1228} {"train_loss": -5.787576675415039, "global_step": 51612, "epoch": 1228} {"train_loss": -5.796594142913818, "global_step": 51613, "epoch": 1228} {"train_loss": -5.891371726989746, "global_step": 51614, "epoch": 1228} {"train_loss": -5.704809188842773, "global_step": 51615, "epoch": 1228} {"train_loss": -5.74857234954834, "global_step": 51616, "epoch": 1228} {"train_loss": -5.798120566776821, "global_step": 51617, "epoch": 1228, "val_loss": 61446.7734375} {"train_loss": -5.9481964111328125, "global_step": 51618, "epoch": 1229} {"train_loss": -5.803657054901123, "global_step": 51619, "epoch": 1229} {"train_loss": -5.852719306945801, "global_step": 51620, "epoch": 1229} {"train_loss": -5.784092426300049, "global_step": 51621, "epoch": 1229} {"train_loss": -5.818552017211914, "global_step": 51622, "epoch": 1229} {"train_loss": -5.75228214263916, "global_step": 51623, "epoch": 1229} {"train_loss": -5.791438102722168, "global_step": 51624, "epoch": 1229} {"train_loss": -5.851886749267578, "global_step": 51625, "epoch": 1229} {"train_loss": -5.802804946899414, "global_step": 51626, "epoch": 1229} {"train_loss": -5.8104705810546875, "global_step": 51627, "epoch": 1229} {"train_loss": -5.805934906005859, "global_step": 51628, "epoch": 1229} {"train_loss": -5.952301979064941, "global_step": 51629, "epoch": 1229} {"train_loss": -5.943727493286133, "global_step": 51630, "epoch": 1229} {"train_loss": -5.820262432098389, "global_step": 51631, "epoch": 1229} {"train_loss": -5.759407043457031, "global_step": 51632, "epoch": 1229} {"train_loss": -5.639667987823486, "global_step": 51633, "epoch": 1229} {"train_loss": -5.835282802581787, "global_step": 51634, "epoch": 1229} {"train_loss": -5.724414825439453, "global_step": 51635, "epoch": 1229} {"train_loss": -5.759763717651367, "global_step": 51636, "epoch": 1229} {"train_loss": -5.81558895111084, "global_step": 51637, "epoch": 1229} {"train_loss": -5.718006134033203, "global_step": 51638, "epoch": 1229} {"train_loss": -5.851999282836914, "global_step": 51639, "epoch": 1229} {"train_loss": -5.663890838623047, "global_step": 51640, "epoch": 1229} {"train_loss": -5.809535026550293, "global_step": 51641, "epoch": 1229} {"train_loss": -5.73091983795166, "global_step": 51642, "epoch": 1229} {"train_loss": -5.648036003112793, "global_step": 51643, "epoch": 1229} {"train_loss": -5.795711517333984, "global_step": 51644, "epoch": 1229} {"train_loss": -5.435291290283203, "global_step": 51645, "epoch": 1229} {"train_loss": -5.6729607582092285, "global_step": 51646, "epoch": 1229} {"train_loss": -5.713346481323242, "global_step": 51647, "epoch": 1229} {"train_loss": -5.652166366577148, "global_step": 51648, "epoch": 1229} {"train_loss": -5.619032382965088, "global_step": 51649, "epoch": 1229} {"train_loss": -5.683977127075195, "global_step": 51650, "epoch": 1229} {"train_loss": -5.787548065185547, "global_step": 51651, "epoch": 1229} {"train_loss": -5.634057998657227, "global_step": 51652, "epoch": 1229} {"train_loss": -5.660919189453125, "global_step": 51653, "epoch": 1229} {"train_loss": -5.615126609802246, "global_step": 51654, "epoch": 1229} {"train_loss": -5.721169948577881, "global_step": 51655, "epoch": 1229} {"train_loss": -5.828023910522461, "global_step": 51656, "epoch": 1229} {"train_loss": -5.690187454223633, "global_step": 51657, "epoch": 1229} {"train_loss": -5.745209693908691, "global_step": 51658, "epoch": 1229} {"train_loss": -5.756022555487497, "global_step": 51659, "epoch": 1229, "val_loss": 62021.9140625} {"train_loss": -5.849048137664795, "global_step": 51660, "epoch": 1230} {"train_loss": -5.771653175354004, "global_step": 51661, "epoch": 1230} {"train_loss": -5.741481304168701, "global_step": 51662, "epoch": 1230} {"train_loss": -5.635399341583252, "global_step": 51663, "epoch": 1230} {"train_loss": -5.707619667053223, "global_step": 51664, "epoch": 1230} {"train_loss": -5.629622936248779, "global_step": 51665, "epoch": 1230} {"train_loss": -5.768423080444336, "global_step": 51666, "epoch": 1230} {"train_loss": -5.7302470207214355, "global_step": 51667, "epoch": 1230} {"train_loss": -5.732314586639404, "global_step": 51668, "epoch": 1230} {"train_loss": -5.84188175201416, "global_step": 51669, "epoch": 1230} {"train_loss": -5.731156349182129, "global_step": 51670, "epoch": 1230} {"train_loss": -5.75374698638916, "global_step": 51671, "epoch": 1230} {"train_loss": -5.763542175292969, "global_step": 51672, "epoch": 1230} {"train_loss": -5.7221221923828125, "global_step": 51673, "epoch": 1230} {"train_loss": -5.887364387512207, "global_step": 51674, "epoch": 1230} {"train_loss": -5.8704915046691895, "global_step": 51675, "epoch": 1230} {"train_loss": -5.833211898803711, "global_step": 51676, "epoch": 1230} {"train_loss": -5.7873148918151855, "global_step": 51677, "epoch": 1230} {"train_loss": -5.746265411376953, "global_step": 51678, "epoch": 1230} {"train_loss": -5.77852201461792, "global_step": 51679, "epoch": 1230} {"train_loss": -5.737414360046387, "global_step": 51680, "epoch": 1230} {"train_loss": -5.836431503295898, "global_step": 51681, "epoch": 1230} {"train_loss": -5.788653373718262, "global_step": 51682, "epoch": 1230} {"train_loss": -5.866337776184082, "global_step": 51683, "epoch": 1230} {"train_loss": -5.820347785949707, "global_step": 51684, "epoch": 1230} {"train_loss": -5.794488906860352, "global_step": 51685, "epoch": 1230} {"train_loss": -5.8204474449157715, "global_step": 51686, "epoch": 1230} {"train_loss": -5.867504119873047, "global_step": 51687, "epoch": 1230} {"train_loss": -5.732329368591309, "global_step": 51688, "epoch": 1230} {"train_loss": -5.782247543334961, "global_step": 51689, "epoch": 1230} {"train_loss": -5.842871189117432, "global_step": 51690, "epoch": 1230} {"train_loss": -5.880583763122559, "global_step": 51691, "epoch": 1230} {"train_loss": -5.7300615310668945, "global_step": 51692, "epoch": 1230} {"train_loss": -5.800745010375977, "global_step": 51693, "epoch": 1230} {"train_loss": -5.8331756591796875, "global_step": 51694, "epoch": 1230} {"train_loss": -5.7761125564575195, "global_step": 51695, "epoch": 1230} {"train_loss": -5.803191184997559, "global_step": 51696, "epoch": 1230} {"train_loss": -5.768555164337158, "global_step": 51697, "epoch": 1230} {"train_loss": -5.818578720092773, "global_step": 51698, "epoch": 1230} {"train_loss": -5.699660301208496, "global_step": 51699, "epoch": 1230} {"train_loss": -5.781924724578857, "global_step": 51700, "epoch": 1230} {"train_loss": -5.7829219954354425, "global_step": 51701, "epoch": 1230, "val_loss": 61643.2734375} {"train_loss": -5.615505218505859, "global_step": 51702, "epoch": 1231} {"train_loss": -5.711117267608643, "global_step": 51703, "epoch": 1231} {"train_loss": -5.7150774002075195, "global_step": 51704, "epoch": 1231} {"train_loss": -5.7903313636779785, "global_step": 51705, "epoch": 1231} {"train_loss": -5.853704452514648, "global_step": 51706, "epoch": 1231} {"train_loss": -5.842870235443115, "global_step": 51707, "epoch": 1231} {"train_loss": -5.868586540222168, "global_step": 51708, "epoch": 1231} {"train_loss": -5.782938480377197, "global_step": 51709, "epoch": 1231} {"train_loss": -5.707513809204102, "global_step": 51710, "epoch": 1231} {"train_loss": -5.881169319152832, "global_step": 51711, "epoch": 1231} {"train_loss": -5.87336540222168, "global_step": 51712, "epoch": 1231} {"train_loss": -5.803642272949219, "global_step": 51713, "epoch": 1231} {"train_loss": -5.92465877532959, "global_step": 51714, "epoch": 1231} {"train_loss": -5.825997829437256, "global_step": 51715, "epoch": 1231} {"train_loss": -5.790387153625488, "global_step": 51716, "epoch": 1231} {"train_loss": -5.939124584197998, "global_step": 51717, "epoch": 1231} {"train_loss": -5.901907920837402, "global_step": 51718, "epoch": 1231} {"train_loss": -5.828009605407715, "global_step": 51719, "epoch": 1231} {"train_loss": -5.748944282531738, "global_step": 51720, "epoch": 1231} {"train_loss": -5.866558074951172, "global_step": 51721, "epoch": 1231} {"train_loss": -5.859526634216309, "global_step": 51722, "epoch": 1231} {"train_loss": -5.7774338722229, "global_step": 51723, "epoch": 1231} {"train_loss": -5.802238464355469, "global_step": 51724, "epoch": 1231} {"train_loss": -5.789578437805176, "global_step": 51725, "epoch": 1231} {"train_loss": -5.74314022064209, "global_step": 51726, "epoch": 1231} {"train_loss": -5.77071475982666, "global_step": 51727, "epoch": 1231} {"train_loss": -5.8752007484436035, "global_step": 51728, "epoch": 1231} {"train_loss": -5.85032844543457, "global_step": 51729, "epoch": 1231} {"train_loss": -5.71461820602417, "global_step": 51730, "epoch": 1231} {"train_loss": -5.819498538970947, "global_step": 51731, "epoch": 1231} {"train_loss": -5.837869167327881, "global_step": 51732, "epoch": 1231} {"train_loss": -5.8372111320495605, "global_step": 51733, "epoch": 1231} {"train_loss": -5.8318586349487305, "global_step": 51734, "epoch": 1231} {"train_loss": -5.8451008796691895, "global_step": 51735, "epoch": 1231} {"train_loss": -5.783864974975586, "global_step": 51736, "epoch": 1231} {"train_loss": -5.960399150848389, "global_step": 51737, "epoch": 1231} {"train_loss": -5.759769439697266, "global_step": 51738, "epoch": 1231} {"train_loss": -5.833526611328125, "global_step": 51739, "epoch": 1231} {"train_loss": -5.783675670623779, "global_step": 51740, "epoch": 1231} {"train_loss": -5.791596412658691, "global_step": 51741, "epoch": 1231} {"train_loss": -5.847480297088623, "global_step": 51742, "epoch": 1231} {"train_loss": -5.816277821858724, "global_step": 51743, "epoch": 1231, "val_loss": 61530.19921875} {"train_loss": -5.779451370239258, "global_step": 51744, "epoch": 1232} {"train_loss": -5.847641944885254, "global_step": 51745, "epoch": 1232} {"train_loss": -5.798916816711426, "global_step": 51746, "epoch": 1232} {"train_loss": -5.7843918800354, "global_step": 51747, "epoch": 1232} {"train_loss": -5.826292037963867, "global_step": 51748, "epoch": 1232} {"train_loss": -5.833653926849365, "global_step": 51749, "epoch": 1232} {"train_loss": -5.883227348327637, "global_step": 51750, "epoch": 1232} {"train_loss": -5.841888427734375, "global_step": 51751, "epoch": 1232} {"train_loss": -5.853973388671875, "global_step": 51752, "epoch": 1232} {"train_loss": -5.834775924682617, "global_step": 51753, "epoch": 1232} {"train_loss": -5.89340877532959, "global_step": 51754, "epoch": 1232} {"train_loss": -5.803936958312988, "global_step": 51755, "epoch": 1232} {"train_loss": -5.693368434906006, "global_step": 51756, "epoch": 1232} {"train_loss": -5.741063117980957, "global_step": 51757, "epoch": 1232} {"train_loss": -5.627435207366943, "global_step": 51758, "epoch": 1232} {"train_loss": -5.720666408538818, "global_step": 51759, "epoch": 1232} {"train_loss": -5.970735549926758, "global_step": 51760, "epoch": 1232} {"train_loss": -5.847040176391602, "global_step": 51761, "epoch": 1232} {"train_loss": -5.854247570037842, "global_step": 51762, "epoch": 1232} {"train_loss": -5.895660400390625, "global_step": 51763, "epoch": 1232} {"train_loss": -5.82607364654541, "global_step": 51764, "epoch": 1232} {"train_loss": -5.8474602699279785, "global_step": 51765, "epoch": 1232} {"train_loss": -5.75876522064209, "global_step": 51766, "epoch": 1232} {"train_loss": -5.750082015991211, "global_step": 51767, "epoch": 1232} {"train_loss": -5.818294048309326, "global_step": 51768, "epoch": 1232} {"train_loss": -5.770734786987305, "global_step": 51769, "epoch": 1232} {"train_loss": -5.906580924987793, "global_step": 51770, "epoch": 1232} {"train_loss": -5.795503616333008, "global_step": 51771, "epoch": 1232} {"train_loss": -5.891539573669434, "global_step": 51772, "epoch": 1232} {"train_loss": -5.792433261871338, "global_step": 51773, "epoch": 1232} {"train_loss": -5.723377227783203, "global_step": 51774, "epoch": 1232} {"train_loss": -5.884678840637207, "global_step": 51775, "epoch": 1232} {"train_loss": -5.814449310302734, "global_step": 51776, "epoch": 1232} {"train_loss": -5.824099063873291, "global_step": 51777, "epoch": 1232} {"train_loss": -5.81284236907959, "global_step": 51778, "epoch": 1232} {"train_loss": -5.869093894958496, "global_step": 51779, "epoch": 1232} {"train_loss": -5.80002498626709, "global_step": 51780, "epoch": 1232} {"train_loss": -5.884236812591553, "global_step": 51781, "epoch": 1232} {"train_loss": -5.838145732879639, "global_step": 51782, "epoch": 1232} {"train_loss": -5.8482208251953125, "global_step": 51783, "epoch": 1232} {"train_loss": -5.840778350830078, "global_step": 51784, "epoch": 1232} {"train_loss": -5.819357168106806, "global_step": 51785, "epoch": 1232, "val_loss": 61266.78125} {"train_loss": -5.841650009155273, "global_step": 51786, "epoch": 1233} {"train_loss": -5.8296003341674805, "global_step": 51787, "epoch": 1233} {"train_loss": -5.851963996887207, "global_step": 51788, "epoch": 1233} {"train_loss": -5.796428680419922, "global_step": 51789, "epoch": 1233} {"train_loss": -5.83236837387085, "global_step": 51790, "epoch": 1233} {"train_loss": -5.802881717681885, "global_step": 51791, "epoch": 1233} {"train_loss": -5.792468070983887, "global_step": 51792, "epoch": 1233} {"train_loss": -5.679377555847168, "global_step": 51793, "epoch": 1233} {"train_loss": -5.803908824920654, "global_step": 51794, "epoch": 1233} {"train_loss": -5.783647060394287, "global_step": 51795, "epoch": 1233} {"train_loss": -5.693887710571289, "global_step": 51796, "epoch": 1233} {"train_loss": -5.860440254211426, "global_step": 51797, "epoch": 1233} {"train_loss": -5.742491245269775, "global_step": 51798, "epoch": 1233} {"train_loss": -5.780623435974121, "global_step": 51799, "epoch": 1233} {"train_loss": -5.7547736167907715, "global_step": 51800, "epoch": 1233} {"train_loss": -5.928391933441162, "global_step": 51801, "epoch": 1233} {"train_loss": -5.831263542175293, "global_step": 51802, "epoch": 1233} {"train_loss": -5.847763538360596, "global_step": 51803, "epoch": 1233} {"train_loss": -5.662787437438965, "global_step": 51804, "epoch": 1233} {"train_loss": -5.7582902908325195, "global_step": 51805, "epoch": 1233} {"train_loss": -5.689825534820557, "global_step": 51806, "epoch": 1233} {"train_loss": -5.634394645690918, "global_step": 51807, "epoch": 1233} {"train_loss": -5.776467323303223, "global_step": 51808, "epoch": 1233} {"train_loss": -5.725127220153809, "global_step": 51809, "epoch": 1233} {"train_loss": -5.71440315246582, "global_step": 51810, "epoch": 1233} {"train_loss": -5.733619689941406, "global_step": 51811, "epoch": 1233} {"train_loss": -5.763996124267578, "global_step": 51812, "epoch": 1233} {"train_loss": -5.632721424102783, "global_step": 51813, "epoch": 1233} {"train_loss": -5.792430877685547, "global_step": 51814, "epoch": 1233} {"train_loss": -5.70379638671875, "global_step": 51815, "epoch": 1233} {"train_loss": -5.842889785766602, "global_step": 51816, "epoch": 1233} {"train_loss": -5.756421089172363, "global_step": 51817, "epoch": 1233} {"train_loss": -5.813591003417969, "global_step": 51818, "epoch": 1233} {"train_loss": -5.766952991485596, "global_step": 51819, "epoch": 1233} {"train_loss": -5.757946491241455, "global_step": 51820, "epoch": 1233} {"train_loss": -5.805479049682617, "global_step": 51821, "epoch": 1233} {"train_loss": -5.806699275970459, "global_step": 51822, "epoch": 1233} {"train_loss": -5.877199172973633, "global_step": 51823, "epoch": 1233} {"train_loss": -5.795947074890137, "global_step": 51824, "epoch": 1233} {"train_loss": -5.660777568817139, "global_step": 51825, "epoch": 1233} {"train_loss": -5.854557037353516, "global_step": 51826, "epoch": 1233} {"train_loss": -5.775081589108422, "global_step": 51827, "epoch": 1233, "val_loss": 61935.19921875} {"train_loss": -5.826619625091553, "global_step": 51828, "epoch": 1234} {"train_loss": -5.835298538208008, "global_step": 51829, "epoch": 1234} {"train_loss": -5.788747787475586, "global_step": 51830, "epoch": 1234} {"train_loss": -5.770810127258301, "global_step": 51831, "epoch": 1234} {"train_loss": -5.720675468444824, "global_step": 51832, "epoch": 1234} {"train_loss": -5.708954334259033, "global_step": 51833, "epoch": 1234} {"train_loss": -5.768046855926514, "global_step": 51834, "epoch": 1234} {"train_loss": -5.846945285797119, "global_step": 51835, "epoch": 1234} {"train_loss": -5.78225040435791, "global_step": 51836, "epoch": 1234} {"train_loss": -5.756473541259766, "global_step": 51837, "epoch": 1234} {"train_loss": -5.740414619445801, "global_step": 51838, "epoch": 1234} {"train_loss": -5.900219917297363, "global_step": 51839, "epoch": 1234} {"train_loss": -5.836303234100342, "global_step": 51840, "epoch": 1234} {"train_loss": -5.740563869476318, "global_step": 51841, "epoch": 1234} {"train_loss": -5.786469459533691, "global_step": 51842, "epoch": 1234} {"train_loss": -5.6757493019104, "global_step": 51843, "epoch": 1234} {"train_loss": -5.740741729736328, "global_step": 51844, "epoch": 1234} {"train_loss": -5.680204391479492, "global_step": 51845, "epoch": 1234} {"train_loss": -5.767795562744141, "global_step": 51846, "epoch": 1234} {"train_loss": -5.866162300109863, "global_step": 51847, "epoch": 1234} {"train_loss": -5.871870040893555, "global_step": 51848, "epoch": 1234} {"train_loss": -5.7858476638793945, "global_step": 51849, "epoch": 1234} {"train_loss": -5.8191680908203125, "global_step": 51850, "epoch": 1234} {"train_loss": -5.784516334533691, "global_step": 51851, "epoch": 1234} {"train_loss": -5.539758682250977, "global_step": 51852, "epoch": 1234} {"train_loss": -5.798866271972656, "global_step": 51853, "epoch": 1234} {"train_loss": -5.731579780578613, "global_step": 51854, "epoch": 1234} {"train_loss": -5.681757926940918, "global_step": 51855, "epoch": 1234} {"train_loss": -5.781668663024902, "global_step": 51856, "epoch": 1234} {"train_loss": -5.762701988220215, "global_step": 51857, "epoch": 1234} {"train_loss": -5.637425422668457, "global_step": 51858, "epoch": 1234} {"train_loss": -5.798892021179199, "global_step": 51859, "epoch": 1234} {"train_loss": -5.712279319763184, "global_step": 51860, "epoch": 1234} {"train_loss": -5.75050687789917, "global_step": 51861, "epoch": 1234} {"train_loss": -5.714190483093262, "global_step": 51862, "epoch": 1234} {"train_loss": -5.62842321395874, "global_step": 51863, "epoch": 1234} {"train_loss": -5.798159599304199, "global_step": 51864, "epoch": 1234} {"train_loss": -5.713352680206299, "global_step": 51865, "epoch": 1234} {"train_loss": -5.677562713623047, "global_step": 51866, "epoch": 1234} {"train_loss": -5.699497222900391, "global_step": 51867, "epoch": 1234} {"train_loss": -5.6977386474609375, "global_step": 51868, "epoch": 1234} {"train_loss": -5.7547037942068915, "global_step": 51869, "epoch": 1234, "val_loss": 61937.97265625} {"train_loss": -5.789916515350342, "global_step": 51870, "epoch": 1235} {"train_loss": -5.832696914672852, "global_step": 51871, "epoch": 1235} {"train_loss": -5.86597204208374, "global_step": 51872, "epoch": 1235} {"train_loss": -5.671799659729004, "global_step": 51873, "epoch": 1235} {"train_loss": -5.885443687438965, "global_step": 51874, "epoch": 1235} {"train_loss": -5.67018985748291, "global_step": 51875, "epoch": 1235} {"train_loss": -5.773212432861328, "global_step": 51876, "epoch": 1235} {"train_loss": -5.849304676055908, "global_step": 51877, "epoch": 1235} {"train_loss": -5.578803539276123, "global_step": 51878, "epoch": 1235} {"train_loss": -5.820312023162842, "global_step": 51879, "epoch": 1235} {"train_loss": -5.654329776763916, "global_step": 51880, "epoch": 1235} {"train_loss": -5.838050842285156, "global_step": 51881, "epoch": 1235} {"train_loss": -5.71514892578125, "global_step": 51882, "epoch": 1235} {"train_loss": -5.831173896789551, "global_step": 51883, "epoch": 1235} {"train_loss": -5.85352897644043, "global_step": 51884, "epoch": 1235} {"train_loss": -5.760700225830078, "global_step": 51885, "epoch": 1235} {"train_loss": -5.841441631317139, "global_step": 51886, "epoch": 1235} {"train_loss": -5.767275810241699, "global_step": 51887, "epoch": 1235} {"train_loss": -5.853288173675537, "global_step": 51888, "epoch": 1235} {"train_loss": -5.717402458190918, "global_step": 51889, "epoch": 1235} {"train_loss": -5.817042350769043, "global_step": 51890, "epoch": 1235} {"train_loss": -5.68233060836792, "global_step": 51891, "epoch": 1235} {"train_loss": -5.760901927947998, "global_step": 51892, "epoch": 1235} {"train_loss": -5.774672985076904, "global_step": 51893, "epoch": 1235} {"train_loss": -5.833919525146484, "global_step": 51894, "epoch": 1235} {"train_loss": -5.739755630493164, "global_step": 51895, "epoch": 1235} {"train_loss": -5.855929374694824, "global_step": 51896, "epoch": 1235} {"train_loss": -5.889167785644531, "global_step": 51897, "epoch": 1235} {"train_loss": -5.912578582763672, "global_step": 51898, "epoch": 1235} {"train_loss": -5.8736395835876465, "global_step": 51899, "epoch": 1235} {"train_loss": -5.764881610870361, "global_step": 51900, "epoch": 1235} {"train_loss": -5.772397041320801, "global_step": 51901, "epoch": 1235} {"train_loss": -5.881464958190918, "global_step": 51902, "epoch": 1235} {"train_loss": -5.799525260925293, "global_step": 51903, "epoch": 1235} {"train_loss": -5.8926496505737305, "global_step": 51904, "epoch": 1235} {"train_loss": -5.687811851501465, "global_step": 51905, "epoch": 1235} {"train_loss": -5.905290126800537, "global_step": 51906, "epoch": 1235} {"train_loss": -5.819222450256348, "global_step": 51907, "epoch": 1235} {"train_loss": -5.856085300445557, "global_step": 51908, "epoch": 1235} {"train_loss": -5.760843276977539, "global_step": 51909, "epoch": 1235} {"train_loss": -5.715826988220215, "global_step": 51910, "epoch": 1235} {"train_loss": -5.795013586680095, "global_step": 51911, "epoch": 1235, "val_loss": 61357.25} {"train_loss": -5.936793327331543, "global_step": 51912, "epoch": 1236} {"train_loss": -5.844037055969238, "global_step": 51913, "epoch": 1236} {"train_loss": -5.872618198394775, "global_step": 51914, "epoch": 1236} {"train_loss": -5.8782148361206055, "global_step": 51915, "epoch": 1236} {"train_loss": -5.802839756011963, "global_step": 51916, "epoch": 1236} {"train_loss": -5.9532318115234375, "global_step": 51917, "epoch": 1236} {"train_loss": -5.847098350524902, "global_step": 51918, "epoch": 1236} {"train_loss": -5.8357439041137695, "global_step": 51919, "epoch": 1236} {"train_loss": -5.778049468994141, "global_step": 51920, "epoch": 1236} {"train_loss": -5.851448059082031, "global_step": 51921, "epoch": 1236} {"train_loss": -5.893488883972168, "global_step": 51922, "epoch": 1236} {"train_loss": -5.624011993408203, "global_step": 51923, "epoch": 1236} {"train_loss": -5.779241561889648, "global_step": 51924, "epoch": 1236} {"train_loss": -5.719132423400879, "global_step": 51925, "epoch": 1236} {"train_loss": -5.656144142150879, "global_step": 51926, "epoch": 1236} {"train_loss": -5.764410972595215, "global_step": 51927, "epoch": 1236} {"train_loss": -5.819328308105469, "global_step": 51928, "epoch": 1236} {"train_loss": -5.767684459686279, "global_step": 51929, "epoch": 1236} {"train_loss": -5.669591426849365, "global_step": 51930, "epoch": 1236} {"train_loss": -5.78730583190918, "global_step": 51931, "epoch": 1236} {"train_loss": -5.771365165710449, "global_step": 51932, "epoch": 1236} {"train_loss": -5.916045188903809, "global_step": 51933, "epoch": 1236} {"train_loss": -5.823634147644043, "global_step": 51934, "epoch": 1236} {"train_loss": -5.9609785079956055, "global_step": 51935, "epoch": 1236} {"train_loss": -5.796073913574219, "global_step": 51936, "epoch": 1236} {"train_loss": -5.832668304443359, "global_step": 51937, "epoch": 1236} {"train_loss": -5.929135322570801, "global_step": 51938, "epoch": 1236} {"train_loss": -5.8242082595825195, "global_step": 51939, "epoch": 1236} {"train_loss": -5.779389381408691, "global_step": 51940, "epoch": 1236} {"train_loss": -5.890137195587158, "global_step": 51941, "epoch": 1236} {"train_loss": -5.795628547668457, "global_step": 51942, "epoch": 1236} {"train_loss": -5.852982521057129, "global_step": 51943, "epoch": 1236} {"train_loss": -5.830077648162842, "global_step": 51944, "epoch": 1236} {"train_loss": -5.746310234069824, "global_step": 51945, "epoch": 1236} {"train_loss": -5.781647682189941, "global_step": 51946, "epoch": 1236} {"train_loss": -5.837214469909668, "global_step": 51947, "epoch": 1236} {"train_loss": -5.892299652099609, "global_step": 51948, "epoch": 1236} {"train_loss": -5.730860233306885, "global_step": 51949, "epoch": 1236} {"train_loss": -5.840645790100098, "global_step": 51950, "epoch": 1236} {"train_loss": -5.851737976074219, "global_step": 51951, "epoch": 1236} {"train_loss": -5.697765827178955, "global_step": 51952, "epoch": 1236} {"train_loss": -5.814688444137573, "global_step": 51953, "epoch": 1236, "val_loss": 61688.7734375} {"train_loss": -5.807397842407227, "global_step": 51954, "epoch": 1237} {"train_loss": -5.645947456359863, "global_step": 51955, "epoch": 1237} {"train_loss": -5.7622785568237305, "global_step": 51956, "epoch": 1237} {"train_loss": -5.653159141540527, "global_step": 51957, "epoch": 1237} {"train_loss": -5.856649398803711, "global_step": 51958, "epoch": 1237} {"train_loss": -5.6935014724731445, "global_step": 51959, "epoch": 1237} {"train_loss": -5.684250354766846, "global_step": 51960, "epoch": 1237} {"train_loss": -5.8229875564575195, "global_step": 51961, "epoch": 1237} {"train_loss": -5.815149307250977, "global_step": 51962, "epoch": 1237} {"train_loss": -5.845205783843994, "global_step": 51963, "epoch": 1237} {"train_loss": -5.7552876472473145, "global_step": 51964, "epoch": 1237} {"train_loss": -5.809789657592773, "global_step": 51965, "epoch": 1237} {"train_loss": -5.77972412109375, "global_step": 51966, "epoch": 1237} {"train_loss": -5.748866081237793, "global_step": 51967, "epoch": 1237} {"train_loss": -5.761041641235352, "global_step": 51968, "epoch": 1237} {"train_loss": -5.863744735717773, "global_step": 51969, "epoch": 1237} {"train_loss": -5.738705635070801, "global_step": 51970, "epoch": 1237} {"train_loss": -5.7388458251953125, "global_step": 51971, "epoch": 1237} {"train_loss": -5.742389678955078, "global_step": 51972, "epoch": 1237} {"train_loss": -5.761979103088379, "global_step": 51973, "epoch": 1237} {"train_loss": -5.71497106552124, "global_step": 51974, "epoch": 1237} {"train_loss": -5.798238754272461, "global_step": 51975, "epoch": 1237} {"train_loss": -5.874012470245361, "global_step": 51976, "epoch": 1237} {"train_loss": -5.867199897766113, "global_step": 51977, "epoch": 1237} {"train_loss": -5.74417781829834, "global_step": 51978, "epoch": 1237} {"train_loss": -5.898185729980469, "global_step": 51979, "epoch": 1237} {"train_loss": -5.865442276000977, "global_step": 51980, "epoch": 1237} {"train_loss": -5.914831161499023, "global_step": 51981, "epoch": 1237} {"train_loss": -5.652040004730225, "global_step": 51982, "epoch": 1237} {"train_loss": -5.860223770141602, "global_step": 51983, "epoch": 1237} {"train_loss": -5.765556335449219, "global_step": 51984, "epoch": 1237} {"train_loss": -5.822131156921387, "global_step": 51985, "epoch": 1237} {"train_loss": -5.946019172668457, "global_step": 51986, "epoch": 1237} {"train_loss": -5.760763168334961, "global_step": 51987, "epoch": 1237} {"train_loss": -5.855868339538574, "global_step": 51988, "epoch": 1237} {"train_loss": -5.87600040435791, "global_step": 51989, "epoch": 1237} {"train_loss": -5.794744968414307, "global_step": 51990, "epoch": 1237} {"train_loss": -5.834976673126221, "global_step": 51991, "epoch": 1237} {"train_loss": -5.739171504974365, "global_step": 51992, "epoch": 1237} {"train_loss": -5.83753776550293, "global_step": 51993, "epoch": 1237} {"train_loss": -5.756255149841309, "global_step": 51994, "epoch": 1237} {"train_loss": -5.790567227772304, "global_step": 51995, "epoch": 1237, "val_loss": 61543.41796875} {"train_loss": -5.811119079589844, "global_step": 51996, "epoch": 1238} {"train_loss": -5.831716537475586, "global_step": 51997, "epoch": 1238} {"train_loss": -5.744240760803223, "global_step": 51998, "epoch": 1238} {"train_loss": -5.875061988830566, "global_step": 51999, "epoch": 1238} {"train_loss": -5.773728370666504, "global_step": 52000, "epoch": 1238} {"train_loss": -5.836662292480469, "global_step": 52001, "epoch": 1238} {"train_loss": -5.7624125480651855, "global_step": 52002, "epoch": 1238} {"train_loss": -5.769869804382324, "global_step": 52003, "epoch": 1238} {"train_loss": -5.751871109008789, "global_step": 52004, "epoch": 1238} {"train_loss": -5.778959274291992, "global_step": 52005, "epoch": 1238} {"train_loss": -5.783208847045898, "global_step": 52006, "epoch": 1238} {"train_loss": -5.851495742797852, "global_step": 52007, "epoch": 1238} {"train_loss": -5.827653408050537, "global_step": 52008, "epoch": 1238} {"train_loss": -5.648674964904785, "global_step": 52009, "epoch": 1238} {"train_loss": -5.811837673187256, "global_step": 52010, "epoch": 1238} {"train_loss": -5.788613796234131, "global_step": 52011, "epoch": 1238} {"train_loss": -5.852085590362549, "global_step": 52012, "epoch": 1238} {"train_loss": -5.723440647125244, "global_step": 52013, "epoch": 1238} {"train_loss": -5.693597793579102, "global_step": 52014, "epoch": 1238} {"train_loss": -5.925459384918213, "global_step": 52015, "epoch": 1238} {"train_loss": -5.776240348815918, "global_step": 52016, "epoch": 1238} {"train_loss": -5.703597068786621, "global_step": 52017, "epoch": 1238} {"train_loss": -5.819126129150391, "global_step": 52018, "epoch": 1238} {"train_loss": -5.804590702056885, "global_step": 52019, "epoch": 1238} {"train_loss": -5.7568864822387695, "global_step": 52020, "epoch": 1238} {"train_loss": -5.832205295562744, "global_step": 52021, "epoch": 1238} {"train_loss": -5.7434773445129395, "global_step": 52022, "epoch": 1238} {"train_loss": -5.739324569702148, "global_step": 52023, "epoch": 1238} {"train_loss": -5.810822486877441, "global_step": 52024, "epoch": 1238} {"train_loss": -5.843909740447998, "global_step": 52025, "epoch": 1238} {"train_loss": -5.947478771209717, "global_step": 52026, "epoch": 1238} {"train_loss": -5.6645660400390625, "global_step": 52027, "epoch": 1238} {"train_loss": -5.823323726654053, "global_step": 52028, "epoch": 1238} {"train_loss": -5.9166579246521, "global_step": 52029, "epoch": 1238} {"train_loss": -5.659553050994873, "global_step": 52030, "epoch": 1238} {"train_loss": -5.763093948364258, "global_step": 52031, "epoch": 1238} {"train_loss": -5.762203216552734, "global_step": 52032, "epoch": 1238} {"train_loss": -5.766562461853027, "global_step": 52033, "epoch": 1238} {"train_loss": -5.853057861328125, "global_step": 52034, "epoch": 1238} {"train_loss": -5.843836784362793, "global_step": 52035, "epoch": 1238} {"train_loss": -5.796182632446289, "global_step": 52036, "epoch": 1238} {"train_loss": -5.792090495427449, "global_step": 52037, "epoch": 1238, "val_loss": 61265.9375} {"train_loss": -5.803048133850098, "global_step": 52038, "epoch": 1239} {"train_loss": -5.7323527336120605, "global_step": 52039, "epoch": 1239} {"train_loss": -5.726113319396973, "global_step": 52040, "epoch": 1239} {"train_loss": -5.806066513061523, "global_step": 52041, "epoch": 1239} {"train_loss": -5.826947212219238, "global_step": 52042, "epoch": 1239} {"train_loss": -5.780886173248291, "global_step": 52043, "epoch": 1239} {"train_loss": -5.721425533294678, "global_step": 52044, "epoch": 1239} {"train_loss": -5.734715938568115, "global_step": 52045, "epoch": 1239} {"train_loss": -5.867972373962402, "global_step": 52046, "epoch": 1239} {"train_loss": -5.750689506530762, "global_step": 52047, "epoch": 1239} {"train_loss": -5.685922145843506, "global_step": 52048, "epoch": 1239} {"train_loss": -5.736701965332031, "global_step": 52049, "epoch": 1239} {"train_loss": -5.885972023010254, "global_step": 52050, "epoch": 1239} {"train_loss": -5.896056652069092, "global_step": 52051, "epoch": 1239} {"train_loss": -5.78788948059082, "global_step": 52052, "epoch": 1239} {"train_loss": -5.769474029541016, "global_step": 52053, "epoch": 1239} {"train_loss": -5.782703876495361, "global_step": 52054, "epoch": 1239} {"train_loss": -5.857503414154053, "global_step": 52055, "epoch": 1239} {"train_loss": -5.74614953994751, "global_step": 52056, "epoch": 1239} {"train_loss": -5.759612560272217, "global_step": 52057, "epoch": 1239} {"train_loss": -5.901636123657227, "global_step": 52058, "epoch": 1239} {"train_loss": -5.708377838134766, "global_step": 52059, "epoch": 1239} {"train_loss": -5.801591396331787, "global_step": 52060, "epoch": 1239} {"train_loss": -5.795317649841309, "global_step": 52061, "epoch": 1239} {"train_loss": -5.715090751647949, "global_step": 52062, "epoch": 1239} {"train_loss": -5.673730850219727, "global_step": 52063, "epoch": 1239} {"train_loss": -5.8140411376953125, "global_step": 52064, "epoch": 1239} {"train_loss": -5.834867477416992, "global_step": 52065, "epoch": 1239} {"train_loss": -5.746876239776611, "global_step": 52066, "epoch": 1239} {"train_loss": -5.7746663093566895, "global_step": 52067, "epoch": 1239} {"train_loss": -5.812895774841309, "global_step": 52068, "epoch": 1239} {"train_loss": -5.71675968170166, "global_step": 52069, "epoch": 1239} {"train_loss": -5.770564079284668, "global_step": 52070, "epoch": 1239} {"train_loss": -5.7843098640441895, "global_step": 52071, "epoch": 1239} {"train_loss": -5.834300994873047, "global_step": 52072, "epoch": 1239} {"train_loss": -5.726747989654541, "global_step": 52073, "epoch": 1239} {"train_loss": -5.727774620056152, "global_step": 52074, "epoch": 1239} {"train_loss": -5.864801406860352, "global_step": 52075, "epoch": 1239} {"train_loss": -5.9488749504089355, "global_step": 52076, "epoch": 1239} {"train_loss": -5.880834579467773, "global_step": 52077, "epoch": 1239} {"train_loss": -5.780549049377441, "global_step": 52078, "epoch": 1239} {"train_loss": -5.788486730484736, "global_step": 52079, "epoch": 1239, "val_loss": 60962.8046875} {"train_loss": -5.807182788848877, "global_step": 52080, "epoch": 1240} {"train_loss": -5.967945575714111, "global_step": 52081, "epoch": 1240} {"train_loss": -5.824363708496094, "global_step": 52082, "epoch": 1240} {"train_loss": -5.777683734893799, "global_step": 52083, "epoch": 1240} {"train_loss": -5.830217361450195, "global_step": 52084, "epoch": 1240} {"train_loss": -5.813899040222168, "global_step": 52085, "epoch": 1240} {"train_loss": -5.8283843994140625, "global_step": 52086, "epoch": 1240} {"train_loss": -5.835007667541504, "global_step": 52087, "epoch": 1240} {"train_loss": -5.723006725311279, "global_step": 52088, "epoch": 1240} {"train_loss": -5.845573425292969, "global_step": 52089, "epoch": 1240} {"train_loss": -5.90681266784668, "global_step": 52090, "epoch": 1240} {"train_loss": -5.789919853210449, "global_step": 52091, "epoch": 1240} {"train_loss": -5.8160223960876465, "global_step": 52092, "epoch": 1240} {"train_loss": -5.757026195526123, "global_step": 52093, "epoch": 1240} {"train_loss": -5.896327018737793, "global_step": 52094, "epoch": 1240} {"train_loss": -5.873154640197754, "global_step": 52095, "epoch": 1240} {"train_loss": -5.794120788574219, "global_step": 52096, "epoch": 1240} {"train_loss": -5.740670204162598, "global_step": 52097, "epoch": 1240} {"train_loss": -5.763510704040527, "global_step": 52098, "epoch": 1240} {"train_loss": -5.919417381286621, "global_step": 52099, "epoch": 1240} {"train_loss": -5.861815452575684, "global_step": 52100, "epoch": 1240} {"train_loss": -5.796087265014648, "global_step": 52101, "epoch": 1240} {"train_loss": -5.823510646820068, "global_step": 52102, "epoch": 1240} {"train_loss": -5.847560405731201, "global_step": 52103, "epoch": 1240} {"train_loss": -5.776449680328369, "global_step": 52104, "epoch": 1240} {"train_loss": -5.938425540924072, "global_step": 52105, "epoch": 1240} {"train_loss": -5.780484199523926, "global_step": 52106, "epoch": 1240} {"train_loss": -5.889369010925293, "global_step": 52107, "epoch": 1240} {"train_loss": -5.74493408203125, "global_step": 52108, "epoch": 1240} {"train_loss": -5.740073204040527, "global_step": 52109, "epoch": 1240} {"train_loss": -5.739457130432129, "global_step": 52110, "epoch": 1240} {"train_loss": -5.88491153717041, "global_step": 52111, "epoch": 1240} {"train_loss": -5.771320343017578, "global_step": 52112, "epoch": 1240} {"train_loss": -5.824707984924316, "global_step": 52113, "epoch": 1240} {"train_loss": -5.91093111038208, "global_step": 52114, "epoch": 1240} {"train_loss": -5.873876094818115, "global_step": 52115, "epoch": 1240} {"train_loss": -5.781367301940918, "global_step": 52116, "epoch": 1240} {"train_loss": -5.8019866943359375, "global_step": 52117, "epoch": 1240} {"train_loss": -5.863498687744141, "global_step": 52118, "epoch": 1240} {"train_loss": -5.834419250488281, "global_step": 52119, "epoch": 1240} {"train_loss": -5.756987571716309, "global_step": 52120, "epoch": 1240} {"train_loss": -5.820838542211623, "global_step": 52121, "epoch": 1240, "val_loss": 61410.21875} {"train_loss": -5.778798580169678, "global_step": 52122, "epoch": 1241} {"train_loss": -5.900634765625, "global_step": 52123, "epoch": 1241} {"train_loss": -5.7864885330200195, "global_step": 52124, "epoch": 1241} {"train_loss": -5.829951763153076, "global_step": 52125, "epoch": 1241} {"train_loss": -5.798823356628418, "global_step": 52126, "epoch": 1241} {"train_loss": -5.799999237060547, "global_step": 52127, "epoch": 1241} {"train_loss": -5.764470100402832, "global_step": 52128, "epoch": 1241} {"train_loss": -5.918384552001953, "global_step": 52129, "epoch": 1241} {"train_loss": -5.906210422515869, "global_step": 52130, "epoch": 1241} {"train_loss": -5.747971534729004, "global_step": 52131, "epoch": 1241} {"train_loss": -5.772237777709961, "global_step": 52132, "epoch": 1241} {"train_loss": -5.778155326843262, "global_step": 52133, "epoch": 1241} {"train_loss": -5.860514163970947, "global_step": 52134, "epoch": 1241} {"train_loss": -5.783360958099365, "global_step": 52135, "epoch": 1241} {"train_loss": -5.819818019866943, "global_step": 52136, "epoch": 1241} {"train_loss": -5.868605613708496, "global_step": 52137, "epoch": 1241} {"train_loss": -5.764458179473877, "global_step": 52138, "epoch": 1241} {"train_loss": -5.989276885986328, "global_step": 52139, "epoch": 1241} {"train_loss": -5.861264228820801, "global_step": 52140, "epoch": 1241} {"train_loss": -5.844228744506836, "global_step": 52141, "epoch": 1241} {"train_loss": -5.774805068969727, "global_step": 52142, "epoch": 1241} {"train_loss": -5.87995719909668, "global_step": 52143, "epoch": 1241} {"train_loss": -5.702465534210205, "global_step": 52144, "epoch": 1241} {"train_loss": -5.621537685394287, "global_step": 52145, "epoch": 1241} {"train_loss": -5.735971450805664, "global_step": 52146, "epoch": 1241} {"train_loss": -5.722326755523682, "global_step": 52147, "epoch": 1241} {"train_loss": -5.6580657958984375, "global_step": 52148, "epoch": 1241} {"train_loss": -5.793937683105469, "global_step": 52149, "epoch": 1241} {"train_loss": -5.671188831329346, "global_step": 52150, "epoch": 1241} {"train_loss": -5.734268665313721, "global_step": 52151, "epoch": 1241} {"train_loss": -5.825794219970703, "global_step": 52152, "epoch": 1241} {"train_loss": -5.667508602142334, "global_step": 52153, "epoch": 1241} {"train_loss": -5.765770435333252, "global_step": 52154, "epoch": 1241} {"train_loss": -5.795536994934082, "global_step": 52155, "epoch": 1241} {"train_loss": -5.759515762329102, "global_step": 52156, "epoch": 1241} {"train_loss": -5.768146514892578, "global_step": 52157, "epoch": 1241} {"train_loss": -5.7407989501953125, "global_step": 52158, "epoch": 1241} {"train_loss": -5.762238502502441, "global_step": 52159, "epoch": 1241} {"train_loss": -5.755256175994873, "global_step": 52160, "epoch": 1241} {"train_loss": -5.822718620300293, "global_step": 52161, "epoch": 1241} {"train_loss": -5.827362537384033, "global_step": 52162, "epoch": 1241} {"train_loss": -5.788251842771258, "global_step": 52163, "epoch": 1241, "val_loss": 61777.78125} {"train_loss": -5.794713497161865, "global_step": 52164, "epoch": 1242} {"train_loss": -5.8867387771606445, "global_step": 52165, "epoch": 1242} {"train_loss": -5.724668025970459, "global_step": 52166, "epoch": 1242} {"train_loss": -5.885842323303223, "global_step": 52167, "epoch": 1242} {"train_loss": -5.899521827697754, "global_step": 52168, "epoch": 1242} {"train_loss": -5.654628276824951, "global_step": 52169, "epoch": 1242} {"train_loss": -5.748933792114258, "global_step": 52170, "epoch": 1242} {"train_loss": -5.762716293334961, "global_step": 52171, "epoch": 1242} {"train_loss": -5.603237152099609, "global_step": 52172, "epoch": 1242} {"train_loss": -5.907129287719727, "global_step": 52173, "epoch": 1242} {"train_loss": -5.7469964027404785, "global_step": 52174, "epoch": 1242} {"train_loss": -5.945681571960449, "global_step": 52175, "epoch": 1242} {"train_loss": -5.819924354553223, "global_step": 52176, "epoch": 1242} {"train_loss": -5.849213123321533, "global_step": 52177, "epoch": 1242} {"train_loss": -5.912827968597412, "global_step": 52178, "epoch": 1242} {"train_loss": -5.73919677734375, "global_step": 52179, "epoch": 1242} {"train_loss": -5.819876670837402, "global_step": 52180, "epoch": 1242} {"train_loss": -5.789975643157959, "global_step": 52181, "epoch": 1242} {"train_loss": -5.595150947570801, "global_step": 52182, "epoch": 1242} {"train_loss": -5.827859401702881, "global_step": 52183, "epoch": 1242} {"train_loss": -5.841239929199219, "global_step": 52184, "epoch": 1242} {"train_loss": -5.774497985839844, "global_step": 52185, "epoch": 1242} {"train_loss": -5.835315227508545, "global_step": 52186, "epoch": 1242} {"train_loss": -5.83964729309082, "global_step": 52187, "epoch": 1242} {"train_loss": -5.642901420593262, "global_step": 52188, "epoch": 1242} {"train_loss": -5.786982536315918, "global_step": 52189, "epoch": 1242} {"train_loss": -5.778704643249512, "global_step": 52190, "epoch": 1242} {"train_loss": -5.605376243591309, "global_step": 52191, "epoch": 1242} {"train_loss": -5.915645599365234, "global_step": 52192, "epoch": 1242} {"train_loss": -5.812443733215332, "global_step": 52193, "epoch": 1242} {"train_loss": -5.762713432312012, "global_step": 52194, "epoch": 1242} {"train_loss": -5.790624618530273, "global_step": 52195, "epoch": 1242} {"train_loss": -5.8535475730896, "global_step": 52196, "epoch": 1242} {"train_loss": -5.763234615325928, "global_step": 52197, "epoch": 1242} {"train_loss": -5.600442886352539, "global_step": 52198, "epoch": 1242} {"train_loss": -5.810765743255615, "global_step": 52199, "epoch": 1242} {"train_loss": -5.625978469848633, "global_step": 52200, "epoch": 1242} {"train_loss": -5.649385929107666, "global_step": 52201, "epoch": 1242} {"train_loss": -5.728899955749512, "global_step": 52202, "epoch": 1242} {"train_loss": -5.7271294593811035, "global_step": 52203, "epoch": 1242} {"train_loss": -5.807840347290039, "global_step": 52204, "epoch": 1242} {"train_loss": -5.7766908918108255, "global_step": 52205, "epoch": 1242, "val_loss": 61759.4140625} {"train_loss": -5.740708351135254, "global_step": 52206, "epoch": 1243} {"train_loss": -5.762095928192139, "global_step": 52207, "epoch": 1243} {"train_loss": -5.6702985763549805, "global_step": 52208, "epoch": 1243} {"train_loss": -5.652324676513672, "global_step": 52209, "epoch": 1243} {"train_loss": -5.666918754577637, "global_step": 52210, "epoch": 1243} {"train_loss": -5.744738578796387, "global_step": 52211, "epoch": 1243} {"train_loss": -5.5888543128967285, "global_step": 52212, "epoch": 1243} {"train_loss": -5.799208641052246, "global_step": 52213, "epoch": 1243} {"train_loss": -5.748721599578857, "global_step": 52214, "epoch": 1243} {"train_loss": -5.72895622253418, "global_step": 52215, "epoch": 1243} {"train_loss": -5.696828842163086, "global_step": 52216, "epoch": 1243} {"train_loss": -5.715975761413574, "global_step": 52217, "epoch": 1243} {"train_loss": -5.955690860748291, "global_step": 52218, "epoch": 1243} {"train_loss": -5.626996040344238, "global_step": 52219, "epoch": 1243} {"train_loss": -5.877570152282715, "global_step": 52220, "epoch": 1243} {"train_loss": -5.748233795166016, "global_step": 52221, "epoch": 1243} {"train_loss": -5.786375999450684, "global_step": 52222, "epoch": 1243} {"train_loss": -5.669791221618652, "global_step": 52223, "epoch": 1243} {"train_loss": -5.768145561218262, "global_step": 52224, "epoch": 1243} {"train_loss": -5.829112529754639, "global_step": 52225, "epoch": 1243} {"train_loss": -5.741098403930664, "global_step": 52226, "epoch": 1243} {"train_loss": -5.773564338684082, "global_step": 52227, "epoch": 1243} {"train_loss": -5.739926338195801, "global_step": 52228, "epoch": 1243} {"train_loss": -5.859835147857666, "global_step": 52229, "epoch": 1243} {"train_loss": -5.826991081237793, "global_step": 52230, "epoch": 1243} {"train_loss": -5.843745231628418, "global_step": 52231, "epoch": 1243} {"train_loss": -5.657135963439941, "global_step": 52232, "epoch": 1243} {"train_loss": -5.836319923400879, "global_step": 52233, "epoch": 1243} {"train_loss": -5.719855308532715, "global_step": 52234, "epoch": 1243} {"train_loss": -5.692415237426758, "global_step": 52235, "epoch": 1243} {"train_loss": -5.715668678283691, "global_step": 52236, "epoch": 1243} {"train_loss": -5.7058820724487305, "global_step": 52237, "epoch": 1243} {"train_loss": -5.795531272888184, "global_step": 52238, "epoch": 1243} {"train_loss": -5.818804740905762, "global_step": 52239, "epoch": 1243} {"train_loss": -5.776642799377441, "global_step": 52240, "epoch": 1243} {"train_loss": -5.683882713317871, "global_step": 52241, "epoch": 1243} {"train_loss": -5.767669677734375, "global_step": 52242, "epoch": 1243} {"train_loss": -5.678027153015137, "global_step": 52243, "epoch": 1243} {"train_loss": -5.719696998596191, "global_step": 52244, "epoch": 1243} {"train_loss": -5.7216477394104, "global_step": 52245, "epoch": 1243} {"train_loss": -5.819795608520508, "global_step": 52246, "epoch": 1243} {"train_loss": -5.75117217926752, "global_step": 52247, "epoch": 1243, "val_loss": 61449.390625} {"train_loss": -5.86043119430542, "global_step": 52248, "epoch": 1244} {"train_loss": -5.89415168762207, "global_step": 52249, "epoch": 1244} {"train_loss": -5.73512077331543, "global_step": 52250, "epoch": 1244} {"train_loss": -5.894039154052734, "global_step": 52251, "epoch": 1244} {"train_loss": -5.8115105628967285, "global_step": 52252, "epoch": 1244} {"train_loss": -5.9963459968566895, "global_step": 52253, "epoch": 1244} {"train_loss": -5.82391357421875, "global_step": 52254, "epoch": 1244} {"train_loss": -5.866683006286621, "global_step": 52255, "epoch": 1244} {"train_loss": -5.785982608795166, "global_step": 52256, "epoch": 1244} {"train_loss": -5.822261810302734, "global_step": 52257, "epoch": 1244} {"train_loss": -5.867627143859863, "global_step": 52258, "epoch": 1244} {"train_loss": -5.846421241760254, "global_step": 52259, "epoch": 1244} {"train_loss": -5.790872097015381, "global_step": 52260, "epoch": 1244} {"train_loss": -5.798221111297607, "global_step": 52261, "epoch": 1244} {"train_loss": -5.803699493408203, "global_step": 52262, "epoch": 1244} {"train_loss": -5.802865982055664, "global_step": 52263, "epoch": 1244} {"train_loss": -5.8194451332092285, "global_step": 52264, "epoch": 1244} {"train_loss": -5.7694172859191895, "global_step": 52265, "epoch": 1244} {"train_loss": -5.788331031799316, "global_step": 52266, "epoch": 1244} {"train_loss": -5.901767730712891, "global_step": 52267, "epoch": 1244} {"train_loss": -5.887511253356934, "global_step": 52268, "epoch": 1244} {"train_loss": -5.75960636138916, "global_step": 52269, "epoch": 1244} {"train_loss": -5.81016731262207, "global_step": 52270, "epoch": 1244} {"train_loss": -5.831033706665039, "global_step": 52271, "epoch": 1244} {"train_loss": -5.650957107543945, "global_step": 52272, "epoch": 1244} {"train_loss": -5.722617149353027, "global_step": 52273, "epoch": 1244} {"train_loss": -5.8502912521362305, "global_step": 52274, "epoch": 1244} {"train_loss": -5.862185478210449, "global_step": 52275, "epoch": 1244} {"train_loss": -5.6322174072265625, "global_step": 52276, "epoch": 1244} {"train_loss": -5.86530065536499, "global_step": 52277, "epoch": 1244} {"train_loss": -5.801900386810303, "global_step": 52278, "epoch": 1244} {"train_loss": -5.798924446105957, "global_step": 52279, "epoch": 1244} {"train_loss": -5.944121360778809, "global_step": 52280, "epoch": 1244} {"train_loss": -5.913009166717529, "global_step": 52281, "epoch": 1244} {"train_loss": -5.761519432067871, "global_step": 52282, "epoch": 1244} {"train_loss": -5.770140647888184, "global_step": 52283, "epoch": 1244} {"train_loss": -5.824140548706055, "global_step": 52284, "epoch": 1244} {"train_loss": -5.696730613708496, "global_step": 52285, "epoch": 1244} {"train_loss": -5.789170742034912, "global_step": 52286, "epoch": 1244} {"train_loss": -5.840703010559082, "global_step": 52287, "epoch": 1244} {"train_loss": -5.786324501037598, "global_step": 52288, "epoch": 1244} {"train_loss": -5.816982348759969, "global_step": 52289, "epoch": 1244, "val_loss": 61296.4296875} {"train_loss": -5.85268497467041, "global_step": 52290, "epoch": 1245} {"train_loss": -5.819047927856445, "global_step": 52291, "epoch": 1245} {"train_loss": -5.845264434814453, "global_step": 52292, "epoch": 1245} {"train_loss": -5.818639755249023, "global_step": 52293, "epoch": 1245} {"train_loss": -5.785090446472168, "global_step": 52294, "epoch": 1245} {"train_loss": -5.684216499328613, "global_step": 52295, "epoch": 1245} {"train_loss": -5.854549407958984, "global_step": 52296, "epoch": 1245} {"train_loss": -5.847184181213379, "global_step": 52297, "epoch": 1245} {"train_loss": -5.7658610343933105, "global_step": 52298, "epoch": 1245} {"train_loss": -5.789093494415283, "global_step": 52299, "epoch": 1245} {"train_loss": -5.777584075927734, "global_step": 52300, "epoch": 1245} {"train_loss": -5.935125350952148, "global_step": 52301, "epoch": 1245} {"train_loss": -5.806092262268066, "global_step": 52302, "epoch": 1245} {"train_loss": -5.785326957702637, "global_step": 52303, "epoch": 1245} {"train_loss": -5.807001113891602, "global_step": 52304, "epoch": 1245} {"train_loss": -5.71323299407959, "global_step": 52305, "epoch": 1245} {"train_loss": -5.9015302658081055, "global_step": 52306, "epoch": 1245} {"train_loss": -5.960061073303223, "global_step": 52307, "epoch": 1245} {"train_loss": -5.84581184387207, "global_step": 52308, "epoch": 1245} {"train_loss": -5.878838539123535, "global_step": 52309, "epoch": 1245} {"train_loss": -5.925825119018555, "global_step": 52310, "epoch": 1245} {"train_loss": -5.697253227233887, "global_step": 52311, "epoch": 1245} {"train_loss": -5.753576278686523, "global_step": 52312, "epoch": 1245} {"train_loss": -5.799123764038086, "global_step": 52313, "epoch": 1245} {"train_loss": -5.7105913162231445, "global_step": 52314, "epoch": 1245} {"train_loss": -5.889843940734863, "global_step": 52315, "epoch": 1245} {"train_loss": -5.802722930908203, "global_step": 52316, "epoch": 1245} {"train_loss": -5.854038238525391, "global_step": 52317, "epoch": 1245} {"train_loss": -5.645888328552246, "global_step": 52318, "epoch": 1245} {"train_loss": -5.705708980560303, "global_step": 52319, "epoch": 1245} {"train_loss": -5.9091010093688965, "global_step": 52320, "epoch": 1245} {"train_loss": -5.8107590675354, "global_step": 52321, "epoch": 1245} {"train_loss": -5.730619430541992, "global_step": 52322, "epoch": 1245} {"train_loss": -5.831804275512695, "global_step": 52323, "epoch": 1245} {"train_loss": -5.729766368865967, "global_step": 52324, "epoch": 1245} {"train_loss": -5.929853439331055, "global_step": 52325, "epoch": 1245} {"train_loss": -5.829588890075684, "global_step": 52326, "epoch": 1245} {"train_loss": -5.798834800720215, "global_step": 52327, "epoch": 1245} {"train_loss": -5.746899604797363, "global_step": 52328, "epoch": 1245} {"train_loss": -5.827398300170898, "global_step": 52329, "epoch": 1245} {"train_loss": -5.898550033569336, "global_step": 52330, "epoch": 1245} {"train_loss": -5.8126805282774425, "global_step": 52331, "epoch": 1245, "val_loss": 61457.74609375} {"train_loss": -5.863890647888184, "global_step": 52332, "epoch": 1246} {"train_loss": -5.791281223297119, "global_step": 52333, "epoch": 1246} {"train_loss": -5.892487049102783, "global_step": 52334, "epoch": 1246} {"train_loss": -5.7737650871276855, "global_step": 52335, "epoch": 1246} {"train_loss": -5.795774459838867, "global_step": 52336, "epoch": 1246} {"train_loss": -5.832846641540527, "global_step": 52337, "epoch": 1246} {"train_loss": -5.828705787658691, "global_step": 52338, "epoch": 1246} {"train_loss": -5.814801216125488, "global_step": 52339, "epoch": 1246} {"train_loss": -5.91953182220459, "global_step": 52340, "epoch": 1246} {"train_loss": -5.795114040374756, "global_step": 52341, "epoch": 1246} {"train_loss": -5.693390846252441, "global_step": 52342, "epoch": 1246} {"train_loss": -5.75052547454834, "global_step": 52343, "epoch": 1246} {"train_loss": -5.890872001647949, "global_step": 52344, "epoch": 1246} {"train_loss": -5.744959354400635, "global_step": 52345, "epoch": 1246} {"train_loss": -5.84423303604126, "global_step": 52346, "epoch": 1246} {"train_loss": -5.781680583953857, "global_step": 52347, "epoch": 1246} {"train_loss": -5.797944068908691, "global_step": 52348, "epoch": 1246} {"train_loss": -5.799861907958984, "global_step": 52349, "epoch": 1246} {"train_loss": -5.6930437088012695, "global_step": 52350, "epoch": 1246} {"train_loss": -5.864498138427734, "global_step": 52351, "epoch": 1246} {"train_loss": -5.749177932739258, "global_step": 52352, "epoch": 1246} {"train_loss": -5.734458923339844, "global_step": 52353, "epoch": 1246} {"train_loss": -5.765226364135742, "global_step": 52354, "epoch": 1246} {"train_loss": -5.857194900512695, "global_step": 52355, "epoch": 1246} {"train_loss": -5.7916669845581055, "global_step": 52356, "epoch": 1246} {"train_loss": -5.740475654602051, "global_step": 52357, "epoch": 1246} {"train_loss": -5.873753547668457, "global_step": 52358, "epoch": 1246} {"train_loss": -5.856570243835449, "global_step": 52359, "epoch": 1246} {"train_loss": -5.732417106628418, "global_step": 52360, "epoch": 1246} {"train_loss": -5.794059753417969, "global_step": 52361, "epoch": 1246} {"train_loss": -5.831617832183838, "global_step": 52362, "epoch": 1246} {"train_loss": -5.762411117553711, "global_step": 52363, "epoch": 1246} {"train_loss": -5.8017120361328125, "global_step": 52364, "epoch": 1246} {"train_loss": -5.937695503234863, "global_step": 52365, "epoch": 1246} {"train_loss": -5.842401504516602, "global_step": 52366, "epoch": 1246} {"train_loss": -5.728237152099609, "global_step": 52367, "epoch": 1246} {"train_loss": -5.768360614776611, "global_step": 52368, "epoch": 1246} {"train_loss": -5.871520042419434, "global_step": 52369, "epoch": 1246} {"train_loss": -5.797605514526367, "global_step": 52370, "epoch": 1246} {"train_loss": -5.801883697509766, "global_step": 52371, "epoch": 1246} {"train_loss": -5.823959827423096, "global_step": 52372, "epoch": 1246} {"train_loss": -5.804428395770845, "global_step": 52373, "epoch": 1246, "val_loss": 61167.5390625} {"train_loss": -5.797253131866455, "global_step": 52374, "epoch": 1247} {"train_loss": -5.831748008728027, "global_step": 52375, "epoch": 1247} {"train_loss": -5.786994934082031, "global_step": 52376, "epoch": 1247} {"train_loss": -5.916591644287109, "global_step": 52377, "epoch": 1247} {"train_loss": -5.893034934997559, "global_step": 52378, "epoch": 1247} {"train_loss": -5.744699478149414, "global_step": 52379, "epoch": 1247} {"train_loss": -5.819387435913086, "global_step": 52380, "epoch": 1247} {"train_loss": -5.816683769226074, "global_step": 52381, "epoch": 1247} {"train_loss": -5.920910835266113, "global_step": 52382, "epoch": 1247} {"train_loss": -5.786190986633301, "global_step": 52383, "epoch": 1247} {"train_loss": -5.743935585021973, "global_step": 52384, "epoch": 1247} {"train_loss": -5.984107971191406, "global_step": 52385, "epoch": 1247} {"train_loss": -5.870711803436279, "global_step": 52386, "epoch": 1247} {"train_loss": -5.80766487121582, "global_step": 52387, "epoch": 1247} {"train_loss": -5.750506401062012, "global_step": 52388, "epoch": 1247} {"train_loss": -5.769011497497559, "global_step": 52389, "epoch": 1247} {"train_loss": -5.758569717407227, "global_step": 52390, "epoch": 1247} {"train_loss": -5.743361473083496, "global_step": 52391, "epoch": 1247} {"train_loss": -5.767992973327637, "global_step": 52392, "epoch": 1247} {"train_loss": -5.814525127410889, "global_step": 52393, "epoch": 1247} {"train_loss": -5.754719257354736, "global_step": 52394, "epoch": 1247} {"train_loss": -5.743854999542236, "global_step": 52395, "epoch": 1247} {"train_loss": -5.877136707305908, "global_step": 52396, "epoch": 1247} {"train_loss": -5.840436935424805, "global_step": 52397, "epoch": 1247} {"train_loss": -5.781529426574707, "global_step": 52398, "epoch": 1247} {"train_loss": -5.788051605224609, "global_step": 52399, "epoch": 1247} {"train_loss": -5.7563276290893555, "global_step": 52400, "epoch": 1247} {"train_loss": -5.927611351013184, "global_step": 52401, "epoch": 1247} {"train_loss": -5.837599277496338, "global_step": 52402, "epoch": 1247} {"train_loss": -5.7477617263793945, "global_step": 52403, "epoch": 1247} {"train_loss": -5.792543411254883, "global_step": 52404, "epoch": 1247} {"train_loss": -5.889848709106445, "global_step": 52405, "epoch": 1247} {"train_loss": -5.78362512588501, "global_step": 52406, "epoch": 1247} {"train_loss": -5.80080509185791, "global_step": 52407, "epoch": 1247} {"train_loss": -5.895917892456055, "global_step": 52408, "epoch": 1247} {"train_loss": -5.716879844665527, "global_step": 52409, "epoch": 1247} {"train_loss": -5.729541778564453, "global_step": 52410, "epoch": 1247} {"train_loss": -5.644771575927734, "global_step": 52411, "epoch": 1247} {"train_loss": -5.656080722808838, "global_step": 52412, "epoch": 1247} {"train_loss": -5.6772050857543945, "global_step": 52413, "epoch": 1247} {"train_loss": -5.830477714538574, "global_step": 52414, "epoch": 1247} {"train_loss": -5.799027283986409, "global_step": 52415, "epoch": 1247, "val_loss": 61681.79296875} {"train_loss": -5.922013282775879, "global_step": 52416, "epoch": 1248} {"train_loss": -5.826171875, "global_step": 52417, "epoch": 1248} {"train_loss": -5.776507377624512, "global_step": 52418, "epoch": 1248} {"train_loss": -5.818480491638184, "global_step": 52419, "epoch": 1248} {"train_loss": -5.779030799865723, "global_step": 52420, "epoch": 1248} {"train_loss": -5.755681991577148, "global_step": 52421, "epoch": 1248} {"train_loss": -5.779997825622559, "global_step": 52422, "epoch": 1248} {"train_loss": -5.690349578857422, "global_step": 52423, "epoch": 1248} {"train_loss": -5.77744197845459, "global_step": 52424, "epoch": 1248} {"train_loss": -5.784512519836426, "global_step": 52425, "epoch": 1248} {"train_loss": -5.805452346801758, "global_step": 52426, "epoch": 1248} {"train_loss": -5.688177585601807, "global_step": 52427, "epoch": 1248} {"train_loss": -5.706325531005859, "global_step": 52428, "epoch": 1248} {"train_loss": -5.859516620635986, "global_step": 52429, "epoch": 1248} {"train_loss": -5.843787670135498, "global_step": 52430, "epoch": 1248} {"train_loss": -5.906542778015137, "global_step": 52431, "epoch": 1248} {"train_loss": -5.925397872924805, "global_step": 52432, "epoch": 1248} {"train_loss": -5.77426290512085, "global_step": 52433, "epoch": 1248} {"train_loss": -5.893881797790527, "global_step": 52434, "epoch": 1248} {"train_loss": -5.751141548156738, "global_step": 52435, "epoch": 1248} {"train_loss": -5.7234697341918945, "global_step": 52436, "epoch": 1248} {"train_loss": -5.787842750549316, "global_step": 52437, "epoch": 1248} {"train_loss": -5.498443603515625, "global_step": 52438, "epoch": 1248} {"train_loss": -5.74406623840332, "global_step": 52439, "epoch": 1248} {"train_loss": -5.859301567077637, "global_step": 52440, "epoch": 1248} {"train_loss": -5.81011962890625, "global_step": 52441, "epoch": 1248} {"train_loss": -5.809069633483887, "global_step": 52442, "epoch": 1248} {"train_loss": -5.698078632354736, "global_step": 52443, "epoch": 1248} {"train_loss": -5.862022876739502, "global_step": 52444, "epoch": 1248} {"train_loss": -5.904010772705078, "global_step": 52445, "epoch": 1248} {"train_loss": -5.746331214904785, "global_step": 52446, "epoch": 1248} {"train_loss": -5.953206539154053, "global_step": 52447, "epoch": 1248} {"train_loss": -5.893631935119629, "global_step": 52448, "epoch": 1248} {"train_loss": -5.806857109069824, "global_step": 52449, "epoch": 1248} {"train_loss": -5.803062438964844, "global_step": 52450, "epoch": 1248} {"train_loss": -5.752179145812988, "global_step": 52451, "epoch": 1248} {"train_loss": -5.7259063720703125, "global_step": 52452, "epoch": 1248} {"train_loss": -5.890516757965088, "global_step": 52453, "epoch": 1248} {"train_loss": -5.742460250854492, "global_step": 52454, "epoch": 1248} {"train_loss": -5.796536445617676, "global_step": 52455, "epoch": 1248} {"train_loss": -5.831690788269043, "global_step": 52456, "epoch": 1248} {"train_loss": -5.796056679316929, "global_step": 52457, "epoch": 1248, "val_loss": 61276.06640625} {"train_loss": -5.919422149658203, "global_step": 52458, "epoch": 1249} {"train_loss": -5.719342231750488, "global_step": 52459, "epoch": 1249} {"train_loss": -5.872535705566406, "global_step": 52460, "epoch": 1249} {"train_loss": -5.881846904754639, "global_step": 52461, "epoch": 1249} {"train_loss": -5.8867902755737305, "global_step": 52462, "epoch": 1249} {"train_loss": -5.732302188873291, "global_step": 52463, "epoch": 1249} {"train_loss": -5.857880115509033, "global_step": 52464, "epoch": 1249} {"train_loss": -5.991851329803467, "global_step": 52465, "epoch": 1249} {"train_loss": -5.83562707901001, "global_step": 52466, "epoch": 1249} {"train_loss": -5.840832710266113, "global_step": 52467, "epoch": 1249} {"train_loss": -5.810461044311523, "global_step": 52468, "epoch": 1249} {"train_loss": -5.69075870513916, "global_step": 52469, "epoch": 1249} {"train_loss": -5.88434362411499, "global_step": 52470, "epoch": 1249} {"train_loss": -5.853147506713867, "global_step": 52471, "epoch": 1249} {"train_loss": -5.861772537231445, "global_step": 52472, "epoch": 1249} {"train_loss": -5.702308654785156, "global_step": 52473, "epoch": 1249} {"train_loss": -5.7886810302734375, "global_step": 52474, "epoch": 1249} {"train_loss": -5.763742446899414, "global_step": 52475, "epoch": 1249} {"train_loss": -5.754347324371338, "global_step": 52476, "epoch": 1249} {"train_loss": -5.7806196212768555, "global_step": 52477, "epoch": 1249} {"train_loss": -5.835954666137695, "global_step": 52478, "epoch": 1249} {"train_loss": -5.7610979080200195, "global_step": 52479, "epoch": 1249} {"train_loss": -5.708909034729004, "global_step": 52480, "epoch": 1249} {"train_loss": -5.703268051147461, "global_step": 52481, "epoch": 1249} {"train_loss": -5.755102157592773, "global_step": 52482, "epoch": 1249} {"train_loss": -5.67417049407959, "global_step": 52483, "epoch": 1249} {"train_loss": -5.856966018676758, "global_step": 52484, "epoch": 1249} {"train_loss": -5.938163757324219, "global_step": 52485, "epoch": 1249} {"train_loss": -5.649428844451904, "global_step": 52486, "epoch": 1249} {"train_loss": -5.852956771850586, "global_step": 52487, "epoch": 1249} {"train_loss": -5.876594543457031, "global_step": 52488, "epoch": 1249} {"train_loss": -5.876410007476807, "global_step": 52489, "epoch": 1249} {"train_loss": -5.662593841552734, "global_step": 52490, "epoch": 1249} {"train_loss": -5.937361717224121, "global_step": 52491, "epoch": 1249} {"train_loss": -5.841037750244141, "global_step": 52492, "epoch": 1249} {"train_loss": -5.906335830688477, "global_step": 52493, "epoch": 1249} {"train_loss": -5.853250980377197, "global_step": 52494, "epoch": 1249} {"train_loss": -5.999240398406982, "global_step": 52495, "epoch": 1249} {"train_loss": -5.740503787994385, "global_step": 52496, "epoch": 1249} {"train_loss": -5.783997535705566, "global_step": 52497, "epoch": 1249} {"train_loss": -5.87104606628418, "global_step": 52498, "epoch": 1249} {"train_loss": -5.818955046789987, "global_step": 52499, "epoch": 1249, "val_loss": 61344.20703125} {"train_loss": -5.801756858825684, "global_step": 52500, "epoch": 1250} {"train_loss": -5.8043012619018555, "global_step": 52501, "epoch": 1250} {"train_loss": -5.87025260925293, "global_step": 52502, "epoch": 1250} {"train_loss": -5.788679122924805, "global_step": 52503, "epoch": 1250} {"train_loss": -5.807492256164551, "global_step": 52504, "epoch": 1250} {"train_loss": -5.896936416625977, "global_step": 52505, "epoch": 1250} {"train_loss": -5.913697242736816, "global_step": 52506, "epoch": 1250} {"train_loss": -5.92144250869751, "global_step": 52507, "epoch": 1250} {"train_loss": -5.859785079956055, "global_step": 52508, "epoch": 1250} {"train_loss": -5.877175331115723, "global_step": 52509, "epoch": 1250} {"train_loss": -5.770878314971924, "global_step": 52510, "epoch": 1250} {"train_loss": -5.756726264953613, "global_step": 52511, "epoch": 1250} {"train_loss": -5.861681938171387, "global_step": 52512, "epoch": 1250} {"train_loss": -5.645174503326416, "global_step": 52513, "epoch": 1250} {"train_loss": -5.735767364501953, "global_step": 52514, "epoch": 1250} {"train_loss": -5.869017601013184, "global_step": 52515, "epoch": 1250} {"train_loss": -5.802060127258301, "global_step": 52516, "epoch": 1250} {"train_loss": -5.7496795654296875, "global_step": 52517, "epoch": 1250} {"train_loss": -5.759833335876465, "global_step": 52518, "epoch": 1250} {"train_loss": -5.817148208618164, "global_step": 52519, "epoch": 1250} {"train_loss": -5.837638854980469, "global_step": 52520, "epoch": 1250} {"train_loss": -5.836483955383301, "global_step": 52521, "epoch": 1250} {"train_loss": -5.757201194763184, "global_step": 52522, "epoch": 1250} {"train_loss": -5.804612159729004, "global_step": 52523, "epoch": 1250} {"train_loss": -5.910465240478516, "global_step": 52524, "epoch": 1250} {"train_loss": -5.84979248046875, "global_step": 52525, "epoch": 1250} {"train_loss": -5.74395227432251, "global_step": 52526, "epoch": 1250} {"train_loss": -5.87873649597168, "global_step": 52527, "epoch": 1250} {"train_loss": -5.84535026550293, "global_step": 52528, "epoch": 1250} {"train_loss": -5.859818458557129, "global_step": 52529, "epoch": 1250} {"train_loss": -5.805032730102539, "global_step": 52530, "epoch": 1250} {"train_loss": -5.825718402862549, "global_step": 52531, "epoch": 1250} {"train_loss": -5.691272735595703, "global_step": 52532, "epoch": 1250} {"train_loss": -5.765724182128906, "global_step": 52533, "epoch": 1250} {"train_loss": -5.748187065124512, "global_step": 52534, "epoch": 1250} {"train_loss": -5.790595054626465, "global_step": 52535, "epoch": 1250} {"train_loss": -5.842979431152344, "global_step": 52536, "epoch": 1250} {"train_loss": -5.754894733428955, "global_step": 52537, "epoch": 1250} {"train_loss": -5.767706394195557, "global_step": 52538, "epoch": 1250} {"train_loss": -5.802270412445068, "global_step": 52539, "epoch": 1250} {"train_loss": -5.731839179992676, "global_step": 52540, "epoch": 1250} {"train_loss": -5.809550251279559, "global_step": 52541, "epoch": 1250, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.19073647570364108, "train/sim_max_reward_2": 0.56283836121676, "train/sim_max_reward_3": 0.575101548215439, "train/sim_max_reward_4": 0.9092932546997263, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8295691805494438, "test/sim_max_reward_4300001": 0.5343002133972073, "test/sim_max_reward_4300002": 0.8438105899564807, "test/sim_max_reward_4300003": 0.8193843886198163, "test/sim_max_reward_4300004": 0.9747539530024808, "test/sim_max_reward_4300005": 0.6604560672436901, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.748872849012436, "test/sim_max_reward_4300008": 0.41834334482182395, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.18029039448780657, "test/sim_max_reward_4300011": 0.28683287997830076, "test/sim_max_reward_4300012": 0.8377435612992133, "test/sim_max_reward_4300013": 0.6874054529133931, "test/sim_max_reward_4300014": 0.8714443739135055, "test/sim_max_reward_4300015": 0.9710228688560083, "test/sim_max_reward_4300016": 0.8116284465191712, "test/sim_max_reward_4300017": 0.7563359992725288, "test/sim_max_reward_4300018": 0.35821407159831525, "test/sim_max_reward_4300019": 0.1861916862030942, "test/sim_max_reward_4300020": 0.15408078560928787, "test/sim_max_reward_4300021": 0.9232946973421469, "test/sim_max_reward_4300022": 0.20374946322451198, "test/sim_max_reward_4300023": 0.3421795312226261, "test/sim_max_reward_4300024": 0.018270160890165484, "test/sim_max_reward_4300025": 0.8382091345418785, "test/sim_max_reward_4300026": 0.17570020450519008, "test/sim_max_reward_4300027": 0.9803899503674727, "test/sim_max_reward_4300028": 0.9115161360040612, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.0959962975507887, "test/sim_max_reward_4300032": 0.795411679310647, "test/sim_max_reward_4300033": 0.5546059407691428, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.7977627235895768, "test/sim_max_reward_4300038": 0.9197806438434388, "test/sim_max_reward_4300039": 0.8997366697818152, "test/sim_max_reward_4300040": 0.7577594939585692, "test/sim_max_reward_4300041": 0.7672694765529385, "test/sim_max_reward_4300042": 0.7251473048841506, "test/sim_max_reward_4300043": 0.174215873910162, "test/sim_max_reward_4300044": 0.8300539433034133, "test/sim_max_reward_4300045": 0.5976125005834219, "test/sim_max_reward_4300046": 0.8425424473270344, "test/sim_max_reward_4300047": 0.1445240603896605, "test/sim_max_reward_4300048": 0.8583932124350324, "test/sim_max_reward_4300049": 0.6946375717089948, "train/mean_score": 0.43687531596730106, "test/mean_score": 0.5595726868162864, "val_loss": 61481.4375} {"train_loss": -5.7148942947387695, "global_step": 52542, "epoch": 1251} {"train_loss": -5.779950141906738, "global_step": 52543, "epoch": 1251} {"train_loss": -5.94651460647583, "global_step": 52544, "epoch": 1251} {"train_loss": -5.808681488037109, "global_step": 52545, "epoch": 1251} {"train_loss": -5.734245777130127, "global_step": 52546, "epoch": 1251} {"train_loss": -5.800738334655762, "global_step": 52547, "epoch": 1251} {"train_loss": -5.769744873046875, "global_step": 52548, "epoch": 1251} {"train_loss": -5.878543853759766, "global_step": 52549, "epoch": 1251} {"train_loss": -5.917048454284668, "global_step": 52550, "epoch": 1251} {"train_loss": -5.871331214904785, "global_step": 52551, "epoch": 1251} {"train_loss": -5.834015846252441, "global_step": 52552, "epoch": 1251} {"train_loss": -5.72703742980957, "global_step": 52553, "epoch": 1251} {"train_loss": -5.7712626457214355, "global_step": 52554, "epoch": 1251} {"train_loss": -5.724879264831543, "global_step": 52555, "epoch": 1251} {"train_loss": -5.845399856567383, "global_step": 52556, "epoch": 1251} {"train_loss": -5.872483253479004, "global_step": 52557, "epoch": 1251} {"train_loss": -5.869734287261963, "global_step": 52558, "epoch": 1251} {"train_loss": -5.797890663146973, "global_step": 52559, "epoch": 1251} {"train_loss": -5.893041610717773, "global_step": 52560, "epoch": 1251} {"train_loss": -5.86911678314209, "global_step": 52561, "epoch": 1251} {"train_loss": -5.796101093292236, "global_step": 52562, "epoch": 1251} {"train_loss": -5.902966499328613, "global_step": 52563, "epoch": 1251} {"train_loss": -5.761594772338867, "global_step": 52564, "epoch": 1251} {"train_loss": -5.919714450836182, "global_step": 52565, "epoch": 1251} {"train_loss": -5.834952354431152, "global_step": 52566, "epoch": 1251} {"train_loss": -5.7276291847229, "global_step": 52567, "epoch": 1251} {"train_loss": -5.885791301727295, "global_step": 52568, "epoch": 1251} {"train_loss": -5.842931747436523, "global_step": 52569, "epoch": 1251} {"train_loss": -5.811187744140625, "global_step": 52570, "epoch": 1251} {"train_loss": -5.830150127410889, "global_step": 52571, "epoch": 1251} {"train_loss": -5.692874908447266, "global_step": 52572, "epoch": 1251} {"train_loss": -5.778431415557861, "global_step": 52573, "epoch": 1251} {"train_loss": -5.941689968109131, "global_step": 52574, "epoch": 1251} {"train_loss": -5.823512554168701, "global_step": 52575, "epoch": 1251} {"train_loss": -5.753986835479736, "global_step": 52576, "epoch": 1251} {"train_loss": -5.89133358001709, "global_step": 52577, "epoch": 1251} {"train_loss": -5.527078628540039, "global_step": 52578, "epoch": 1251} {"train_loss": -5.847410678863525, "global_step": 52579, "epoch": 1251} {"train_loss": -5.657076835632324, "global_step": 52580, "epoch": 1251} {"train_loss": -5.736375331878662, "global_step": 52581, "epoch": 1251} {"train_loss": -5.752847671508789, "global_step": 52582, "epoch": 1251} {"train_loss": -5.80524628502982, "global_step": 52583, "epoch": 1251, "val_loss": 61504.20703125} {"train_loss": -5.865262985229492, "global_step": 52584, "epoch": 1252} {"train_loss": -5.742977142333984, "global_step": 52585, "epoch": 1252} {"train_loss": -5.8357391357421875, "global_step": 52586, "epoch": 1252} {"train_loss": -5.799484729766846, "global_step": 52587, "epoch": 1252} {"train_loss": -5.956141471862793, "global_step": 52588, "epoch": 1252} {"train_loss": -5.648149490356445, "global_step": 52589, "epoch": 1252} {"train_loss": -5.787835597991943, "global_step": 52590, "epoch": 1252} {"train_loss": -5.709598541259766, "global_step": 52591, "epoch": 1252} {"train_loss": -5.754809856414795, "global_step": 52592, "epoch": 1252} {"train_loss": -5.684600830078125, "global_step": 52593, "epoch": 1252} {"train_loss": -5.75216007232666, "global_step": 52594, "epoch": 1252} {"train_loss": -5.766258239746094, "global_step": 52595, "epoch": 1252} {"train_loss": -5.692447662353516, "global_step": 52596, "epoch": 1252} {"train_loss": -5.769587516784668, "global_step": 52597, "epoch": 1252} {"train_loss": -5.7418413162231445, "global_step": 52598, "epoch": 1252} {"train_loss": -5.774632453918457, "global_step": 52599, "epoch": 1252} {"train_loss": -5.635137557983398, "global_step": 52600, "epoch": 1252} {"train_loss": -5.736080169677734, "global_step": 52601, "epoch": 1252} {"train_loss": -5.741248607635498, "global_step": 52602, "epoch": 1252} {"train_loss": -5.917629241943359, "global_step": 52603, "epoch": 1252} {"train_loss": -5.7851152420043945, "global_step": 52604, "epoch": 1252} {"train_loss": -5.769508361816406, "global_step": 52605, "epoch": 1252} {"train_loss": -5.850705623626709, "global_step": 52606, "epoch": 1252} {"train_loss": -5.856329917907715, "global_step": 52607, "epoch": 1252} {"train_loss": -5.7968621253967285, "global_step": 52608, "epoch": 1252} {"train_loss": -5.873629570007324, "global_step": 52609, "epoch": 1252} {"train_loss": -5.733319282531738, "global_step": 52610, "epoch": 1252} {"train_loss": -5.850212097167969, "global_step": 52611, "epoch": 1252} {"train_loss": -5.780588150024414, "global_step": 52612, "epoch": 1252} {"train_loss": -5.7586894035339355, "global_step": 52613, "epoch": 1252} {"train_loss": -5.868264198303223, "global_step": 52614, "epoch": 1252} {"train_loss": -5.7910919189453125, "global_step": 52615, "epoch": 1252} {"train_loss": -5.820539474487305, "global_step": 52616, "epoch": 1252} {"train_loss": -5.846010208129883, "global_step": 52617, "epoch": 1252} {"train_loss": -5.749706745147705, "global_step": 52618, "epoch": 1252} {"train_loss": -5.866899013519287, "global_step": 52619, "epoch": 1252} {"train_loss": -5.617905616760254, "global_step": 52620, "epoch": 1252} {"train_loss": -5.985204696655273, "global_step": 52621, "epoch": 1252} {"train_loss": -5.7877068519592285, "global_step": 52622, "epoch": 1252} {"train_loss": -5.8596906661987305, "global_step": 52623, "epoch": 1252} {"train_loss": -5.778796195983887, "global_step": 52624, "epoch": 1252} {"train_loss": -5.788962182544527, "global_step": 52625, "epoch": 1252, "val_loss": 61365.9609375} {"train_loss": -5.831579208374023, "global_step": 52626, "epoch": 1253} {"train_loss": -5.833748817443848, "global_step": 52627, "epoch": 1253} {"train_loss": -5.722949028015137, "global_step": 52628, "epoch": 1253} {"train_loss": -5.816216468811035, "global_step": 52629, "epoch": 1253} {"train_loss": -5.786062240600586, "global_step": 52630, "epoch": 1253} {"train_loss": -5.730685234069824, "global_step": 52631, "epoch": 1253} {"train_loss": -5.736329078674316, "global_step": 52632, "epoch": 1253} {"train_loss": -5.73551607131958, "global_step": 52633, "epoch": 1253} {"train_loss": -5.834874629974365, "global_step": 52634, "epoch": 1253} {"train_loss": -5.7505621910095215, "global_step": 52635, "epoch": 1253} {"train_loss": -5.827729225158691, "global_step": 52636, "epoch": 1253} {"train_loss": -5.7238569259643555, "global_step": 52637, "epoch": 1253} {"train_loss": -5.845028877258301, "global_step": 52638, "epoch": 1253} {"train_loss": -5.844265937805176, "global_step": 52639, "epoch": 1253} {"train_loss": -5.740621566772461, "global_step": 52640, "epoch": 1253} {"train_loss": -5.948822498321533, "global_step": 52641, "epoch": 1253} {"train_loss": -5.932232856750488, "global_step": 52642, "epoch": 1253} {"train_loss": -5.8795247077941895, "global_step": 52643, "epoch": 1253} {"train_loss": -5.660111904144287, "global_step": 52644, "epoch": 1253} {"train_loss": -5.839210033416748, "global_step": 52645, "epoch": 1253} {"train_loss": -5.822290420532227, "global_step": 52646, "epoch": 1253} {"train_loss": -5.797198295593262, "global_step": 52647, "epoch": 1253} {"train_loss": -5.806541442871094, "global_step": 52648, "epoch": 1253} {"train_loss": -5.766201019287109, "global_step": 52649, "epoch": 1253} {"train_loss": -5.930777549743652, "global_step": 52650, "epoch": 1253} {"train_loss": -5.844540119171143, "global_step": 52651, "epoch": 1253} {"train_loss": -5.834570407867432, "global_step": 52652, "epoch": 1253} {"train_loss": -5.780566215515137, "global_step": 52653, "epoch": 1253} {"train_loss": -5.890477180480957, "global_step": 52654, "epoch": 1253} {"train_loss": -5.784718036651611, "global_step": 52655, "epoch": 1253} {"train_loss": -5.90081262588501, "global_step": 52656, "epoch": 1253} {"train_loss": -5.70705509185791, "global_step": 52657, "epoch": 1253} {"train_loss": -5.7976579666137695, "global_step": 52658, "epoch": 1253} {"train_loss": -5.777745246887207, "global_step": 52659, "epoch": 1253} {"train_loss": -5.740014553070068, "global_step": 52660, "epoch": 1253} {"train_loss": -5.835923671722412, "global_step": 52661, "epoch": 1253} {"train_loss": -5.7464094161987305, "global_step": 52662, "epoch": 1253} {"train_loss": -5.83902645111084, "global_step": 52663, "epoch": 1253} {"train_loss": -5.897936820983887, "global_step": 52664, "epoch": 1253} {"train_loss": -5.838760852813721, "global_step": 52665, "epoch": 1253} {"train_loss": -5.765206336975098, "global_step": 52666, "epoch": 1253} {"train_loss": -5.811197314943586, "global_step": 52667, "epoch": 1253, "val_loss": 61216.2109375} {"train_loss": -5.903231143951416, "global_step": 52668, "epoch": 1254} {"train_loss": -5.724970817565918, "global_step": 52669, "epoch": 1254} {"train_loss": -5.912217617034912, "global_step": 52670, "epoch": 1254} {"train_loss": -5.887624740600586, "global_step": 52671, "epoch": 1254} {"train_loss": -5.958837509155273, "global_step": 52672, "epoch": 1254} {"train_loss": -5.879341125488281, "global_step": 52673, "epoch": 1254} {"train_loss": -5.711934566497803, "global_step": 52674, "epoch": 1254} {"train_loss": -5.837123870849609, "global_step": 52675, "epoch": 1254} {"train_loss": -6.000148773193359, "global_step": 52676, "epoch": 1254} {"train_loss": -5.716548919677734, "global_step": 52677, "epoch": 1254} {"train_loss": -5.777250289916992, "global_step": 52678, "epoch": 1254} {"train_loss": -5.982805252075195, "global_step": 52679, "epoch": 1254} {"train_loss": -5.806913375854492, "global_step": 52680, "epoch": 1254} {"train_loss": -5.744266986846924, "global_step": 52681, "epoch": 1254} {"train_loss": -5.9184250831604, "global_step": 52682, "epoch": 1254} {"train_loss": -5.791141510009766, "global_step": 52683, "epoch": 1254} {"train_loss": -5.811278343200684, "global_step": 52684, "epoch": 1254} {"train_loss": -5.787946701049805, "global_step": 52685, "epoch": 1254} {"train_loss": -5.704296112060547, "global_step": 52686, "epoch": 1254} {"train_loss": -5.832388877868652, "global_step": 52687, "epoch": 1254} {"train_loss": -5.9385223388671875, "global_step": 52688, "epoch": 1254} {"train_loss": -5.796986103057861, "global_step": 52689, "epoch": 1254} {"train_loss": -5.842601299285889, "global_step": 52690, "epoch": 1254} {"train_loss": -5.862598896026611, "global_step": 52691, "epoch": 1254} {"train_loss": -5.699589729309082, "global_step": 52692, "epoch": 1254} {"train_loss": -5.921282768249512, "global_step": 52693, "epoch": 1254} {"train_loss": -5.787324905395508, "global_step": 52694, "epoch": 1254} {"train_loss": -5.726199626922607, "global_step": 52695, "epoch": 1254} {"train_loss": -5.888118743896484, "global_step": 52696, "epoch": 1254} {"train_loss": -5.764653205871582, "global_step": 52697, "epoch": 1254} {"train_loss": -5.735818862915039, "global_step": 52698, "epoch": 1254} {"train_loss": -5.935254096984863, "global_step": 52699, "epoch": 1254} {"train_loss": -5.861154556274414, "global_step": 52700, "epoch": 1254} {"train_loss": -5.869580268859863, "global_step": 52701, "epoch": 1254} {"train_loss": -5.856338977813721, "global_step": 52702, "epoch": 1254} {"train_loss": -5.9005045890808105, "global_step": 52703, "epoch": 1254} {"train_loss": -5.878313064575195, "global_step": 52704, "epoch": 1254} {"train_loss": -5.790361404418945, "global_step": 52705, "epoch": 1254} {"train_loss": -5.859179496765137, "global_step": 52706, "epoch": 1254} {"train_loss": -5.807905197143555, "global_step": 52707, "epoch": 1254} {"train_loss": -5.809625625610352, "global_step": 52708, "epoch": 1254} {"train_loss": -5.832778953370594, "global_step": 52709, "epoch": 1254, "val_loss": 61439.4140625} {"train_loss": -5.884583473205566, "global_step": 52710, "epoch": 1255} {"train_loss": -5.746240615844727, "global_step": 52711, "epoch": 1255} {"train_loss": -5.781277656555176, "global_step": 52712, "epoch": 1255} {"train_loss": -5.9721574783325195, "global_step": 52713, "epoch": 1255} {"train_loss": -5.7152299880981445, "global_step": 52714, "epoch": 1255} {"train_loss": -5.948820114135742, "global_step": 52715, "epoch": 1255} {"train_loss": -5.820557594299316, "global_step": 52716, "epoch": 1255} {"train_loss": -5.72860050201416, "global_step": 52717, "epoch": 1255} {"train_loss": -5.900796890258789, "global_step": 52718, "epoch": 1255} {"train_loss": -5.872898101806641, "global_step": 52719, "epoch": 1255} {"train_loss": -5.826407432556152, "global_step": 52720, "epoch": 1255} {"train_loss": -5.819889068603516, "global_step": 52721, "epoch": 1255} {"train_loss": -5.922805309295654, "global_step": 52722, "epoch": 1255} {"train_loss": -5.795602798461914, "global_step": 52723, "epoch": 1255} {"train_loss": -5.716736793518066, "global_step": 52724, "epoch": 1255} {"train_loss": -5.7974653244018555, "global_step": 52725, "epoch": 1255} {"train_loss": -5.876755714416504, "global_step": 52726, "epoch": 1255} {"train_loss": -5.728084087371826, "global_step": 52727, "epoch": 1255} {"train_loss": -5.740152359008789, "global_step": 52728, "epoch": 1255} {"train_loss": -5.75225305557251, "global_step": 52729, "epoch": 1255} {"train_loss": -5.6921257972717285, "global_step": 52730, "epoch": 1255} {"train_loss": -5.794436931610107, "global_step": 52731, "epoch": 1255} {"train_loss": -5.759914398193359, "global_step": 52732, "epoch": 1255} {"train_loss": -5.820487976074219, "global_step": 52733, "epoch": 1255} {"train_loss": -5.744719982147217, "global_step": 52734, "epoch": 1255} {"train_loss": -5.924454689025879, "global_step": 52735, "epoch": 1255} {"train_loss": -5.776640892028809, "global_step": 52736, "epoch": 1255} {"train_loss": -5.869588851928711, "global_step": 52737, "epoch": 1255} {"train_loss": -5.714174747467041, "global_step": 52738, "epoch": 1255} {"train_loss": -5.762470245361328, "global_step": 52739, "epoch": 1255} {"train_loss": -5.765979766845703, "global_step": 52740, "epoch": 1255} {"train_loss": -5.781123161315918, "global_step": 52741, "epoch": 1255} {"train_loss": -5.827958106994629, "global_step": 52742, "epoch": 1255} {"train_loss": -5.843119144439697, "global_step": 52743, "epoch": 1255} {"train_loss": -5.675659656524658, "global_step": 52744, "epoch": 1255} {"train_loss": -5.7350239753723145, "global_step": 52745, "epoch": 1255} {"train_loss": -5.851966857910156, "global_step": 52746, "epoch": 1255} {"train_loss": -5.823843002319336, "global_step": 52747, "epoch": 1255} {"train_loss": -5.914072513580322, "global_step": 52748, "epoch": 1255} {"train_loss": -5.8705244064331055, "global_step": 52749, "epoch": 1255} {"train_loss": -5.886877059936523, "global_step": 52750, "epoch": 1255} {"train_loss": -5.81062202226548, "global_step": 52751, "epoch": 1255, "val_loss": 61651.19921875} {"train_loss": -5.904834270477295, "global_step": 52752, "epoch": 1256} {"train_loss": -5.757932186126709, "global_step": 52753, "epoch": 1256} {"train_loss": -5.765561103820801, "global_step": 52754, "epoch": 1256} {"train_loss": -5.784275054931641, "global_step": 52755, "epoch": 1256} {"train_loss": -5.861941814422607, "global_step": 52756, "epoch": 1256} {"train_loss": -5.828922271728516, "global_step": 52757, "epoch": 1256} {"train_loss": -5.827474594116211, "global_step": 52758, "epoch": 1256} {"train_loss": -5.890975475311279, "global_step": 52759, "epoch": 1256} {"train_loss": -5.688340663909912, "global_step": 52760, "epoch": 1256} {"train_loss": -5.682111740112305, "global_step": 52761, "epoch": 1256} {"train_loss": -5.835400104522705, "global_step": 52762, "epoch": 1256} {"train_loss": -5.909210205078125, "global_step": 52763, "epoch": 1256} {"train_loss": -5.891964912414551, "global_step": 52764, "epoch": 1256} {"train_loss": -5.891152381896973, "global_step": 52765, "epoch": 1256} {"train_loss": -5.887175559997559, "global_step": 52766, "epoch": 1256} {"train_loss": -5.852826118469238, "global_step": 52767, "epoch": 1256} {"train_loss": -5.867961406707764, "global_step": 52768, "epoch": 1256} {"train_loss": -5.723865509033203, "global_step": 52769, "epoch": 1256} {"train_loss": -5.932785987854004, "global_step": 52770, "epoch": 1256} {"train_loss": -5.793778419494629, "global_step": 52771, "epoch": 1256} {"train_loss": -5.807192802429199, "global_step": 52772, "epoch": 1256} {"train_loss": -5.887359619140625, "global_step": 52773, "epoch": 1256} {"train_loss": -5.773972511291504, "global_step": 52774, "epoch": 1256} {"train_loss": -5.8454813957214355, "global_step": 52775, "epoch": 1256} {"train_loss": -5.861927032470703, "global_step": 52776, "epoch": 1256} {"train_loss": -5.786207675933838, "global_step": 52777, "epoch": 1256} {"train_loss": -5.845282554626465, "global_step": 52778, "epoch": 1256} {"train_loss": -5.744126319885254, "global_step": 52779, "epoch": 1256} {"train_loss": -5.803516387939453, "global_step": 52780, "epoch": 1256} {"train_loss": -5.8259429931640625, "global_step": 52781, "epoch": 1256} {"train_loss": -5.906770706176758, "global_step": 52782, "epoch": 1256} {"train_loss": -5.740650653839111, "global_step": 52783, "epoch": 1256} {"train_loss": -5.831311225891113, "global_step": 52784, "epoch": 1256} {"train_loss": -5.889668941497803, "global_step": 52785, "epoch": 1256} {"train_loss": -5.8964128494262695, "global_step": 52786, "epoch": 1256} {"train_loss": -5.896053314208984, "global_step": 52787, "epoch": 1256} {"train_loss": -5.859405517578125, "global_step": 52788, "epoch": 1256} {"train_loss": -5.777216911315918, "global_step": 52789, "epoch": 1256} {"train_loss": -5.839518070220947, "global_step": 52790, "epoch": 1256} {"train_loss": -5.754106521606445, "global_step": 52791, "epoch": 1256} {"train_loss": -5.878328323364258, "global_step": 52792, "epoch": 1256} {"train_loss": -5.829197463535127, "global_step": 52793, "epoch": 1256, "val_loss": 61642.515625} {"train_loss": -5.798184394836426, "global_step": 52794, "epoch": 1257} {"train_loss": -5.771577835083008, "global_step": 52795, "epoch": 1257} {"train_loss": -5.838682174682617, "global_step": 52796, "epoch": 1257} {"train_loss": -5.790414810180664, "global_step": 52797, "epoch": 1257} {"train_loss": -5.978147029876709, "global_step": 52798, "epoch": 1257} {"train_loss": -5.886880874633789, "global_step": 52799, "epoch": 1257} {"train_loss": -5.806495666503906, "global_step": 52800, "epoch": 1257} {"train_loss": -5.743063926696777, "global_step": 52801, "epoch": 1257} {"train_loss": -5.848077774047852, "global_step": 52802, "epoch": 1257} {"train_loss": -5.692965984344482, "global_step": 52803, "epoch": 1257} {"train_loss": -5.768712997436523, "global_step": 52804, "epoch": 1257} {"train_loss": -5.8359527587890625, "global_step": 52805, "epoch": 1257} {"train_loss": -5.582632064819336, "global_step": 52806, "epoch": 1257} {"train_loss": -5.825499534606934, "global_step": 52807, "epoch": 1257} {"train_loss": -5.672212600708008, "global_step": 52808, "epoch": 1257} {"train_loss": -5.710518836975098, "global_step": 52809, "epoch": 1257} {"train_loss": -5.802111625671387, "global_step": 52810, "epoch": 1257} {"train_loss": -5.694764614105225, "global_step": 52811, "epoch": 1257} {"train_loss": -5.878548622131348, "global_step": 52812, "epoch": 1257} {"train_loss": -5.7956624031066895, "global_step": 52813, "epoch": 1257} {"train_loss": -5.728423595428467, "global_step": 52814, "epoch": 1257} {"train_loss": -5.82315731048584, "global_step": 52815, "epoch": 1257} {"train_loss": -5.650017261505127, "global_step": 52816, "epoch": 1257} {"train_loss": -5.864693641662598, "global_step": 52817, "epoch": 1257} {"train_loss": -5.646712303161621, "global_step": 52818, "epoch": 1257} {"train_loss": -5.77397346496582, "global_step": 52819, "epoch": 1257} {"train_loss": -5.833106517791748, "global_step": 52820, "epoch": 1257} {"train_loss": -5.864112377166748, "global_step": 52821, "epoch": 1257} {"train_loss": -5.80337381362915, "global_step": 52822, "epoch": 1257} {"train_loss": -5.695038318634033, "global_step": 52823, "epoch": 1257} {"train_loss": -5.748455047607422, "global_step": 52824, "epoch": 1257} {"train_loss": -5.78438663482666, "global_step": 52825, "epoch": 1257} {"train_loss": -5.753610610961914, "global_step": 52826, "epoch": 1257} {"train_loss": -5.775346755981445, "global_step": 52827, "epoch": 1257} {"train_loss": -5.7163004875183105, "global_step": 52828, "epoch": 1257} {"train_loss": -5.820609092712402, "global_step": 52829, "epoch": 1257} {"train_loss": -5.709042072296143, "global_step": 52830, "epoch": 1257} {"train_loss": -5.6979827880859375, "global_step": 52831, "epoch": 1257} {"train_loss": -5.697367191314697, "global_step": 52832, "epoch": 1257} {"train_loss": -5.768622398376465, "global_step": 52833, "epoch": 1257} {"train_loss": -5.820440292358398, "global_step": 52834, "epoch": 1257} {"train_loss": -5.775910400208973, "global_step": 52835, "epoch": 1257, "val_loss": 62266.46875} {"train_loss": -5.796241760253906, "global_step": 52836, "epoch": 1258} {"train_loss": -5.598299026489258, "global_step": 52837, "epoch": 1258} {"train_loss": -5.726967811584473, "global_step": 52838, "epoch": 1258} {"train_loss": -5.663759708404541, "global_step": 52839, "epoch": 1258} {"train_loss": -5.760019302368164, "global_step": 52840, "epoch": 1258} {"train_loss": -5.680014610290527, "global_step": 52841, "epoch": 1258} {"train_loss": -5.793130874633789, "global_step": 52842, "epoch": 1258} {"train_loss": -5.719205379486084, "global_step": 52843, "epoch": 1258} {"train_loss": -5.6692070960998535, "global_step": 52844, "epoch": 1258} {"train_loss": -5.7509870529174805, "global_step": 52845, "epoch": 1258} {"train_loss": -5.650787353515625, "global_step": 52846, "epoch": 1258} {"train_loss": -5.690288543701172, "global_step": 52847, "epoch": 1258} {"train_loss": -5.624290943145752, "global_step": 52848, "epoch": 1258} {"train_loss": -5.927824974060059, "global_step": 52849, "epoch": 1258} {"train_loss": -5.722168922424316, "global_step": 52850, "epoch": 1258} {"train_loss": -5.627486228942871, "global_step": 52851, "epoch": 1258} {"train_loss": -5.810244560241699, "global_step": 52852, "epoch": 1258} {"train_loss": -5.783696174621582, "global_step": 52853, "epoch": 1258} {"train_loss": -5.829556465148926, "global_step": 52854, "epoch": 1258} {"train_loss": -5.73015022277832, "global_step": 52855, "epoch": 1258} {"train_loss": -5.660467147827148, "global_step": 52856, "epoch": 1258} {"train_loss": -5.776415824890137, "global_step": 52857, "epoch": 1258} {"train_loss": -5.644696235656738, "global_step": 52858, "epoch": 1258} {"train_loss": -5.749121189117432, "global_step": 52859, "epoch": 1258} {"train_loss": -5.788727283477783, "global_step": 52860, "epoch": 1258} {"train_loss": -5.76422119140625, "global_step": 52861, "epoch": 1258} {"train_loss": -5.729452610015869, "global_step": 52862, "epoch": 1258} {"train_loss": -5.817354679107666, "global_step": 52863, "epoch": 1258} {"train_loss": -5.862244129180908, "global_step": 52864, "epoch": 1258} {"train_loss": -5.718630313873291, "global_step": 52865, "epoch": 1258} {"train_loss": -5.9659743309021, "global_step": 52866, "epoch": 1258} {"train_loss": -5.747049808502197, "global_step": 52867, "epoch": 1258} {"train_loss": -5.907181262969971, "global_step": 52868, "epoch": 1258} {"train_loss": -5.815732002258301, "global_step": 52869, "epoch": 1258} {"train_loss": -5.758522987365723, "global_step": 52870, "epoch": 1258} {"train_loss": -5.829859256744385, "global_step": 52871, "epoch": 1258} {"train_loss": -5.64191198348999, "global_step": 52872, "epoch": 1258} {"train_loss": -5.8382415771484375, "global_step": 52873, "epoch": 1258} {"train_loss": -5.653075695037842, "global_step": 52874, "epoch": 1258} {"train_loss": -5.800899505615234, "global_step": 52875, "epoch": 1258} {"train_loss": -5.5875654220581055, "global_step": 52876, "epoch": 1258} {"train_loss": -5.74762267158145, "global_step": 52877, "epoch": 1258, "val_loss": 62027.98046875} {"train_loss": -5.7208709716796875, "global_step": 52878, "epoch": 1259} {"train_loss": -5.792897701263428, "global_step": 52879, "epoch": 1259} {"train_loss": -5.6567816734313965, "global_step": 52880, "epoch": 1259} {"train_loss": -5.805470943450928, "global_step": 52881, "epoch": 1259} {"train_loss": -5.747382640838623, "global_step": 52882, "epoch": 1259} {"train_loss": -5.737417697906494, "global_step": 52883, "epoch": 1259} {"train_loss": -5.782364845275879, "global_step": 52884, "epoch": 1259} {"train_loss": -5.7743682861328125, "global_step": 52885, "epoch": 1259} {"train_loss": -5.812976837158203, "global_step": 52886, "epoch": 1259} {"train_loss": -5.686025142669678, "global_step": 52887, "epoch": 1259} {"train_loss": -5.82355260848999, "global_step": 52888, "epoch": 1259} {"train_loss": -5.9177775382995605, "global_step": 52889, "epoch": 1259} {"train_loss": -5.8215413093566895, "global_step": 52890, "epoch": 1259} {"train_loss": -5.939896583557129, "global_step": 52891, "epoch": 1259} {"train_loss": -5.799921989440918, "global_step": 52892, "epoch": 1259} {"train_loss": -5.793509006500244, "global_step": 52893, "epoch": 1259} {"train_loss": -5.7711381912231445, "global_step": 52894, "epoch": 1259} {"train_loss": -5.880533218383789, "global_step": 52895, "epoch": 1259} {"train_loss": -5.88629150390625, "global_step": 52896, "epoch": 1259} {"train_loss": -5.81563663482666, "global_step": 52897, "epoch": 1259} {"train_loss": -5.858758926391602, "global_step": 52898, "epoch": 1259} {"train_loss": -5.646906852722168, "global_step": 52899, "epoch": 1259} {"train_loss": -5.752610683441162, "global_step": 52900, "epoch": 1259} {"train_loss": -5.606734275817871, "global_step": 52901, "epoch": 1259} {"train_loss": -5.857413291931152, "global_step": 52902, "epoch": 1259} {"train_loss": -5.743114471435547, "global_step": 52903, "epoch": 1259} {"train_loss": -5.748452186584473, "global_step": 52904, "epoch": 1259} {"train_loss": -5.854168891906738, "global_step": 52905, "epoch": 1259} {"train_loss": -5.840304851531982, "global_step": 52906, "epoch": 1259} {"train_loss": -5.777298450469971, "global_step": 52907, "epoch": 1259} {"train_loss": -5.755138397216797, "global_step": 52908, "epoch": 1259} {"train_loss": -5.925982475280762, "global_step": 52909, "epoch": 1259} {"train_loss": -5.713315010070801, "global_step": 52910, "epoch": 1259} {"train_loss": -5.866375923156738, "global_step": 52911, "epoch": 1259} {"train_loss": -5.736512184143066, "global_step": 52912, "epoch": 1259} {"train_loss": -5.805856704711914, "global_step": 52913, "epoch": 1259} {"train_loss": -5.75145149230957, "global_step": 52914, "epoch": 1259} {"train_loss": -5.813839912414551, "global_step": 52915, "epoch": 1259} {"train_loss": -5.928116798400879, "global_step": 52916, "epoch": 1259} {"train_loss": -5.944063186645508, "global_step": 52917, "epoch": 1259} {"train_loss": -5.877798080444336, "global_step": 52918, "epoch": 1259} {"train_loss": -5.794992310660226, "global_step": 52919, "epoch": 1259, "val_loss": 61561.109375} {"train_loss": -5.797880172729492, "global_step": 52920, "epoch": 1260} {"train_loss": -5.8163299560546875, "global_step": 52921, "epoch": 1260} {"train_loss": -5.910154342651367, "global_step": 52922, "epoch": 1260} {"train_loss": -5.907619476318359, "global_step": 52923, "epoch": 1260} {"train_loss": -5.80735969543457, "global_step": 52924, "epoch": 1260} {"train_loss": -5.775889873504639, "global_step": 52925, "epoch": 1260} {"train_loss": -5.848074913024902, "global_step": 52926, "epoch": 1260} {"train_loss": -5.818792343139648, "global_step": 52927, "epoch": 1260} {"train_loss": -5.829267501831055, "global_step": 52928, "epoch": 1260} {"train_loss": -5.78338623046875, "global_step": 52929, "epoch": 1260} {"train_loss": -5.735324859619141, "global_step": 52930, "epoch": 1260} {"train_loss": -5.746072769165039, "global_step": 52931, "epoch": 1260} {"train_loss": -5.843237400054932, "global_step": 52932, "epoch": 1260} {"train_loss": -5.735982894897461, "global_step": 52933, "epoch": 1260} {"train_loss": -5.723518371582031, "global_step": 52934, "epoch": 1260} {"train_loss": -5.963133811950684, "global_step": 52935, "epoch": 1260} {"train_loss": -5.667254447937012, "global_step": 52936, "epoch": 1260} {"train_loss": -5.93758487701416, "global_step": 52937, "epoch": 1260} {"train_loss": -5.834955215454102, "global_step": 52938, "epoch": 1260} {"train_loss": -5.707830429077148, "global_step": 52939, "epoch": 1260} {"train_loss": -5.929494857788086, "global_step": 52940, "epoch": 1260} {"train_loss": -5.858170986175537, "global_step": 52941, "epoch": 1260} {"train_loss": -5.808866024017334, "global_step": 52942, "epoch": 1260} {"train_loss": -5.8644328117370605, "global_step": 52943, "epoch": 1260} {"train_loss": -5.789325714111328, "global_step": 52944, "epoch": 1260} {"train_loss": -5.817217826843262, "global_step": 52945, "epoch": 1260} {"train_loss": -5.777288913726807, "global_step": 52946, "epoch": 1260} {"train_loss": -5.761378288269043, "global_step": 52947, "epoch": 1260} {"train_loss": -5.9100341796875, "global_step": 52948, "epoch": 1260} {"train_loss": -5.755118370056152, "global_step": 52949, "epoch": 1260} {"train_loss": -5.723095893859863, "global_step": 52950, "epoch": 1260} {"train_loss": -5.710711479187012, "global_step": 52951, "epoch": 1260} {"train_loss": -5.770748138427734, "global_step": 52952, "epoch": 1260} {"train_loss": -5.805209159851074, "global_step": 52953, "epoch": 1260} {"train_loss": -5.8654398918151855, "global_step": 52954, "epoch": 1260} {"train_loss": -5.865891933441162, "global_step": 52955, "epoch": 1260} {"train_loss": -5.921058654785156, "global_step": 52956, "epoch": 1260} {"train_loss": -5.943842887878418, "global_step": 52957, "epoch": 1260} {"train_loss": -5.884611129760742, "global_step": 52958, "epoch": 1260} {"train_loss": -5.703581809997559, "global_step": 52959, "epoch": 1260} {"train_loss": -5.845279693603516, "global_step": 52960, "epoch": 1260} {"train_loss": -5.814942745935349, "global_step": 52961, "epoch": 1260, "val_loss": 61442.0703125} {"train_loss": -5.774371147155762, "global_step": 52962, "epoch": 1261} {"train_loss": -5.848491668701172, "global_step": 52963, "epoch": 1261} {"train_loss": -5.792407989501953, "global_step": 52964, "epoch": 1261} {"train_loss": -5.817584991455078, "global_step": 52965, "epoch": 1261} {"train_loss": -5.716655731201172, "global_step": 52966, "epoch": 1261} {"train_loss": -5.766853332519531, "global_step": 52967, "epoch": 1261} {"train_loss": -5.861704349517822, "global_step": 52968, "epoch": 1261} {"train_loss": -5.793095588684082, "global_step": 52969, "epoch": 1261} {"train_loss": -5.787914276123047, "global_step": 52970, "epoch": 1261} {"train_loss": -5.736536026000977, "global_step": 52971, "epoch": 1261} {"train_loss": -5.858124732971191, "global_step": 52972, "epoch": 1261} {"train_loss": -5.790212631225586, "global_step": 52973, "epoch": 1261} {"train_loss": -5.789215087890625, "global_step": 52974, "epoch": 1261} {"train_loss": -5.768006324768066, "global_step": 52975, "epoch": 1261} {"train_loss": -6.008596420288086, "global_step": 52976, "epoch": 1261} {"train_loss": -5.7799072265625, "global_step": 52977, "epoch": 1261} {"train_loss": -5.830319404602051, "global_step": 52978, "epoch": 1261} {"train_loss": -5.746993064880371, "global_step": 52979, "epoch": 1261} {"train_loss": -5.884394645690918, "global_step": 52980, "epoch": 1261} {"train_loss": -5.862277507781982, "global_step": 52981, "epoch": 1261} {"train_loss": -5.791845321655273, "global_step": 52982, "epoch": 1261} {"train_loss": -5.7638840675354, "global_step": 52983, "epoch": 1261} {"train_loss": -5.808749198913574, "global_step": 52984, "epoch": 1261} {"train_loss": -5.809284210205078, "global_step": 52985, "epoch": 1261} {"train_loss": -5.78909969329834, "global_step": 52986, "epoch": 1261} {"train_loss": -5.875764846801758, "global_step": 52987, "epoch": 1261} {"train_loss": -5.934144973754883, "global_step": 52988, "epoch": 1261} {"train_loss": -5.801839351654053, "global_step": 52989, "epoch": 1261} {"train_loss": -5.827468395233154, "global_step": 52990, "epoch": 1261} {"train_loss": -5.836702346801758, "global_step": 52991, "epoch": 1261} {"train_loss": -5.86845588684082, "global_step": 52992, "epoch": 1261} {"train_loss": -5.809292316436768, "global_step": 52993, "epoch": 1261} {"train_loss": -5.936835289001465, "global_step": 52994, "epoch": 1261} {"train_loss": -5.8824005126953125, "global_step": 52995, "epoch": 1261} {"train_loss": -5.920220375061035, "global_step": 52996, "epoch": 1261} {"train_loss": -5.8253583908081055, "global_step": 52997, "epoch": 1261} {"train_loss": -5.846829891204834, "global_step": 52998, "epoch": 1261} {"train_loss": -5.961507797241211, "global_step": 52999, "epoch": 1261} {"train_loss": -5.819325923919678, "global_step": 53000, "epoch": 1261} {"train_loss": -5.916841983795166, "global_step": 53001, "epoch": 1261} {"train_loss": -5.761237144470215, "global_step": 53002, "epoch": 1261} {"train_loss": -5.827944131124587, "global_step": 53003, "epoch": 1261, "val_loss": 61339.68359375} {"train_loss": -5.9181437492370605, "global_step": 53004, "epoch": 1262} {"train_loss": -5.833798408508301, "global_step": 53005, "epoch": 1262} {"train_loss": -5.875222206115723, "global_step": 53006, "epoch": 1262} {"train_loss": -5.87851619720459, "global_step": 53007, "epoch": 1262} {"train_loss": -5.814840793609619, "global_step": 53008, "epoch": 1262} {"train_loss": -5.813745975494385, "global_step": 53009, "epoch": 1262} {"train_loss": -5.845372200012207, "global_step": 53010, "epoch": 1262} {"train_loss": -5.794895172119141, "global_step": 53011, "epoch": 1262} {"train_loss": -5.900487899780273, "global_step": 53012, "epoch": 1262} {"train_loss": -5.85045051574707, "global_step": 53013, "epoch": 1262} {"train_loss": -5.765247344970703, "global_step": 53014, "epoch": 1262} {"train_loss": -5.924980163574219, "global_step": 53015, "epoch": 1262} {"train_loss": -5.736845016479492, "global_step": 53016, "epoch": 1262} {"train_loss": -5.783891201019287, "global_step": 53017, "epoch": 1262} {"train_loss": -5.8313727378845215, "global_step": 53018, "epoch": 1262} {"train_loss": -5.818389415740967, "global_step": 53019, "epoch": 1262} {"train_loss": -5.817416191101074, "global_step": 53020, "epoch": 1262} {"train_loss": -5.653100967407227, "global_step": 53021, "epoch": 1262} {"train_loss": -5.858150482177734, "global_step": 53022, "epoch": 1262} {"train_loss": -5.7016401290893555, "global_step": 53023, "epoch": 1262} {"train_loss": -5.708169937133789, "global_step": 53024, "epoch": 1262} {"train_loss": -5.807703018188477, "global_step": 53025, "epoch": 1262} {"train_loss": -5.727480888366699, "global_step": 53026, "epoch": 1262} {"train_loss": -5.831154823303223, "global_step": 53027, "epoch": 1262} {"train_loss": -5.65770149230957, "global_step": 53028, "epoch": 1262} {"train_loss": -5.795088291168213, "global_step": 53029, "epoch": 1262} {"train_loss": -5.835055351257324, "global_step": 53030, "epoch": 1262} {"train_loss": -5.6886091232299805, "global_step": 53031, "epoch": 1262} {"train_loss": -5.797816276550293, "global_step": 53032, "epoch": 1262} {"train_loss": -5.732952117919922, "global_step": 53033, "epoch": 1262} {"train_loss": -5.761373996734619, "global_step": 53034, "epoch": 1262} {"train_loss": -5.742044448852539, "global_step": 53035, "epoch": 1262} {"train_loss": -5.744553089141846, "global_step": 53036, "epoch": 1262} {"train_loss": -5.908424377441406, "global_step": 53037, "epoch": 1262} {"train_loss": -5.788396835327148, "global_step": 53038, "epoch": 1262} {"train_loss": -5.818643569946289, "global_step": 53039, "epoch": 1262} {"train_loss": -5.818453311920166, "global_step": 53040, "epoch": 1262} {"train_loss": -5.868490219116211, "global_step": 53041, "epoch": 1262} {"train_loss": -5.764034271240234, "global_step": 53042, "epoch": 1262} {"train_loss": -5.754118919372559, "global_step": 53043, "epoch": 1262} {"train_loss": -5.8520588874816895, "global_step": 53044, "epoch": 1262} {"train_loss": -5.802583024615333, "global_step": 53045, "epoch": 1262, "val_loss": 61869.6171875} {"train_loss": -5.7484002113342285, "global_step": 53046, "epoch": 1263} {"train_loss": -5.697091102600098, "global_step": 53047, "epoch": 1263} {"train_loss": -5.8405866622924805, "global_step": 53048, "epoch": 1263} {"train_loss": -5.714012145996094, "global_step": 53049, "epoch": 1263} {"train_loss": -5.824277877807617, "global_step": 53050, "epoch": 1263} {"train_loss": -5.765317440032959, "global_step": 53051, "epoch": 1263} {"train_loss": -5.8836212158203125, "global_step": 53052, "epoch": 1263} {"train_loss": -5.711397171020508, "global_step": 53053, "epoch": 1263} {"train_loss": -5.843235969543457, "global_step": 53054, "epoch": 1263} {"train_loss": -5.754926681518555, "global_step": 53055, "epoch": 1263} {"train_loss": -5.886973857879639, "global_step": 53056, "epoch": 1263} {"train_loss": -5.853346347808838, "global_step": 53057, "epoch": 1263} {"train_loss": -5.800370216369629, "global_step": 53058, "epoch": 1263} {"train_loss": -5.818632125854492, "global_step": 53059, "epoch": 1263} {"train_loss": -5.743133544921875, "global_step": 53060, "epoch": 1263} {"train_loss": -5.756470203399658, "global_step": 53061, "epoch": 1263} {"train_loss": -5.6443376541137695, "global_step": 53062, "epoch": 1263} {"train_loss": -5.714459419250488, "global_step": 53063, "epoch": 1263} {"train_loss": -5.7118821144104, "global_step": 53064, "epoch": 1263} {"train_loss": -5.8246846199035645, "global_step": 53065, "epoch": 1263} {"train_loss": -5.750960350036621, "global_step": 53066, "epoch": 1263} {"train_loss": -5.735291481018066, "global_step": 53067, "epoch": 1263} {"train_loss": -5.750151634216309, "global_step": 53068, "epoch": 1263} {"train_loss": -5.819927215576172, "global_step": 53069, "epoch": 1263} {"train_loss": -5.60799503326416, "global_step": 53070, "epoch": 1263} {"train_loss": -5.6655168533325195, "global_step": 53071, "epoch": 1263} {"train_loss": -5.859770774841309, "global_step": 53072, "epoch": 1263} {"train_loss": -5.892518043518066, "global_step": 53073, "epoch": 1263} {"train_loss": -5.8127641677856445, "global_step": 53074, "epoch": 1263} {"train_loss": -5.8303422927856445, "global_step": 53075, "epoch": 1263} {"train_loss": -5.870342254638672, "global_step": 53076, "epoch": 1263} {"train_loss": -5.87860107421875, "global_step": 53077, "epoch": 1263} {"train_loss": -5.862776279449463, "global_step": 53078, "epoch": 1263} {"train_loss": -5.753626346588135, "global_step": 53079, "epoch": 1263} {"train_loss": -5.877617835998535, "global_step": 53080, "epoch": 1263} {"train_loss": -5.779759883880615, "global_step": 53081, "epoch": 1263} {"train_loss": -5.791378974914551, "global_step": 53082, "epoch": 1263} {"train_loss": -5.817782402038574, "global_step": 53083, "epoch": 1263} {"train_loss": -5.796112537384033, "global_step": 53084, "epoch": 1263} {"train_loss": -5.850502014160156, "global_step": 53085, "epoch": 1263} {"train_loss": -5.974678993225098, "global_step": 53086, "epoch": 1263} {"train_loss": -5.789346524647304, "global_step": 53087, "epoch": 1263, "val_loss": 61369.15234375} {"train_loss": -5.860231876373291, "global_step": 53088, "epoch": 1264} {"train_loss": -5.735978126525879, "global_step": 53089, "epoch": 1264} {"train_loss": -5.896623611450195, "global_step": 53090, "epoch": 1264} {"train_loss": -5.777998924255371, "global_step": 53091, "epoch": 1264} {"train_loss": -5.692142486572266, "global_step": 53092, "epoch": 1264} {"train_loss": -5.847307205200195, "global_step": 53093, "epoch": 1264} {"train_loss": -5.866718292236328, "global_step": 53094, "epoch": 1264} {"train_loss": -5.789989471435547, "global_step": 53095, "epoch": 1264} {"train_loss": -5.759317398071289, "global_step": 53096, "epoch": 1264} {"train_loss": -5.863459587097168, "global_step": 53097, "epoch": 1264} {"train_loss": -5.848066329956055, "global_step": 53098, "epoch": 1264} {"train_loss": -5.950433731079102, "global_step": 53099, "epoch": 1264} {"train_loss": -5.853107929229736, "global_step": 53100, "epoch": 1264} {"train_loss": -5.763334274291992, "global_step": 53101, "epoch": 1264} {"train_loss": -5.854025363922119, "global_step": 53102, "epoch": 1264} {"train_loss": -5.856817245483398, "global_step": 53103, "epoch": 1264} {"train_loss": -5.8997063636779785, "global_step": 53104, "epoch": 1264} {"train_loss": -5.798676013946533, "global_step": 53105, "epoch": 1264} {"train_loss": -5.7286810874938965, "global_step": 53106, "epoch": 1264} {"train_loss": -5.75580358505249, "global_step": 53107, "epoch": 1264} {"train_loss": -5.808474063873291, "global_step": 53108, "epoch": 1264} {"train_loss": -5.842037200927734, "global_step": 53109, "epoch": 1264} {"train_loss": -5.8505706787109375, "global_step": 53110, "epoch": 1264} {"train_loss": -5.644920825958252, "global_step": 53111, "epoch": 1264} {"train_loss": -5.737794399261475, "global_step": 53112, "epoch": 1264} {"train_loss": -5.62851619720459, "global_step": 53113, "epoch": 1264} {"train_loss": -5.824261665344238, "global_step": 53114, "epoch": 1264} {"train_loss": -5.762063026428223, "global_step": 53115, "epoch": 1264} {"train_loss": -5.893963813781738, "global_step": 53116, "epoch": 1264} {"train_loss": -5.803175926208496, "global_step": 53117, "epoch": 1264} {"train_loss": -5.821077346801758, "global_step": 53118, "epoch": 1264} {"train_loss": -5.790952205657959, "global_step": 53119, "epoch": 1264} {"train_loss": -5.900591850280762, "global_step": 53120, "epoch": 1264} {"train_loss": -5.76082706451416, "global_step": 53121, "epoch": 1264} {"train_loss": -5.866298675537109, "global_step": 53122, "epoch": 1264} {"train_loss": -5.7640581130981445, "global_step": 53123, "epoch": 1264} {"train_loss": -5.852792263031006, "global_step": 53124, "epoch": 1264} {"train_loss": -5.801097869873047, "global_step": 53125, "epoch": 1264} {"train_loss": -5.734197616577148, "global_step": 53126, "epoch": 1264} {"train_loss": -5.7388596534729, "global_step": 53127, "epoch": 1264} {"train_loss": -5.720452308654785, "global_step": 53128, "epoch": 1264} {"train_loss": -5.803729431969779, "global_step": 53129, "epoch": 1264, "val_loss": 61404.0} {"train_loss": -5.804828643798828, "global_step": 53130, "epoch": 1265} {"train_loss": -5.8202643394470215, "global_step": 53131, "epoch": 1265} {"train_loss": -5.807598114013672, "global_step": 53132, "epoch": 1265} {"train_loss": -5.8597869873046875, "global_step": 53133, "epoch": 1265} {"train_loss": -5.72700309753418, "global_step": 53134, "epoch": 1265} {"train_loss": -5.803071022033691, "global_step": 53135, "epoch": 1265} {"train_loss": -5.812093734741211, "global_step": 53136, "epoch": 1265} {"train_loss": -5.761634826660156, "global_step": 53137, "epoch": 1265} {"train_loss": -5.7427520751953125, "global_step": 53138, "epoch": 1265} {"train_loss": -5.776825904846191, "global_step": 53139, "epoch": 1265} {"train_loss": -5.8575334548950195, "global_step": 53140, "epoch": 1265} {"train_loss": -5.814643859863281, "global_step": 53141, "epoch": 1265} {"train_loss": -5.866631507873535, "global_step": 53142, "epoch": 1265} {"train_loss": -5.878063678741455, "global_step": 53143, "epoch": 1265} {"train_loss": -5.672770023345947, "global_step": 53144, "epoch": 1265} {"train_loss": -5.811479091644287, "global_step": 53145, "epoch": 1265} {"train_loss": -5.726493835449219, "global_step": 53146, "epoch": 1265} {"train_loss": -5.815862655639648, "global_step": 53147, "epoch": 1265} {"train_loss": -5.917579650878906, "global_step": 53148, "epoch": 1265} {"train_loss": -5.889216423034668, "global_step": 53149, "epoch": 1265} {"train_loss": -5.804510593414307, "global_step": 53150, "epoch": 1265} {"train_loss": -5.854614734649658, "global_step": 53151, "epoch": 1265} {"train_loss": -5.77799129486084, "global_step": 53152, "epoch": 1265} {"train_loss": -5.868976593017578, "global_step": 53153, "epoch": 1265} {"train_loss": -5.864684104919434, "global_step": 53154, "epoch": 1265} {"train_loss": -5.879812240600586, "global_step": 53155, "epoch": 1265} {"train_loss": -6.004751682281494, "global_step": 53156, "epoch": 1265} {"train_loss": -5.810859680175781, "global_step": 53157, "epoch": 1265} {"train_loss": -5.909372329711914, "global_step": 53158, "epoch": 1265} {"train_loss": -5.819120407104492, "global_step": 53159, "epoch": 1265} {"train_loss": -5.8528947830200195, "global_step": 53160, "epoch": 1265} {"train_loss": -5.781700134277344, "global_step": 53161, "epoch": 1265} {"train_loss": -5.815891265869141, "global_step": 53162, "epoch": 1265} {"train_loss": -5.921069622039795, "global_step": 53163, "epoch": 1265} {"train_loss": -5.834217548370361, "global_step": 53164, "epoch": 1265} {"train_loss": -5.6811628341674805, "global_step": 53165, "epoch": 1265} {"train_loss": -5.762907981872559, "global_step": 53166, "epoch": 1265} {"train_loss": -5.795605182647705, "global_step": 53167, "epoch": 1265} {"train_loss": -5.782175064086914, "global_step": 53168, "epoch": 1265} {"train_loss": -5.620373725891113, "global_step": 53169, "epoch": 1265} {"train_loss": -5.798921585083008, "global_step": 53170, "epoch": 1265} {"train_loss": -5.817039875757127, "global_step": 53171, "epoch": 1265, "val_loss": 61422.5859375} {"train_loss": -5.876737117767334, "global_step": 53172, "epoch": 1266} {"train_loss": -5.817081451416016, "global_step": 53173, "epoch": 1266} {"train_loss": -5.824540615081787, "global_step": 53174, "epoch": 1266} {"train_loss": -5.746120929718018, "global_step": 53175, "epoch": 1266} {"train_loss": -5.76359748840332, "global_step": 53176, "epoch": 1266} {"train_loss": -5.863616943359375, "global_step": 53177, "epoch": 1266} {"train_loss": -5.864325523376465, "global_step": 53178, "epoch": 1266} {"train_loss": -5.740533351898193, "global_step": 53179, "epoch": 1266} {"train_loss": -5.888988494873047, "global_step": 53180, "epoch": 1266} {"train_loss": -5.839740753173828, "global_step": 53181, "epoch": 1266} {"train_loss": -5.844243049621582, "global_step": 53182, "epoch": 1266} {"train_loss": -5.785665512084961, "global_step": 53183, "epoch": 1266} {"train_loss": -5.826811790466309, "global_step": 53184, "epoch": 1266} {"train_loss": -5.821126937866211, "global_step": 53185, "epoch": 1266} {"train_loss": -5.766292572021484, "global_step": 53186, "epoch": 1266} {"train_loss": -5.691394805908203, "global_step": 53187, "epoch": 1266} {"train_loss": -5.803668022155762, "global_step": 53188, "epoch": 1266} {"train_loss": -5.7326741218566895, "global_step": 53189, "epoch": 1266} {"train_loss": -5.8390092849731445, "global_step": 53190, "epoch": 1266} {"train_loss": -5.940893173217773, "global_step": 53191, "epoch": 1266} {"train_loss": -5.838146209716797, "global_step": 53192, "epoch": 1266} {"train_loss": -5.8828887939453125, "global_step": 53193, "epoch": 1266} {"train_loss": -5.891993522644043, "global_step": 53194, "epoch": 1266} {"train_loss": -5.7736663818359375, "global_step": 53195, "epoch": 1266} {"train_loss": -5.853315830230713, "global_step": 53196, "epoch": 1266} {"train_loss": -5.725582122802734, "global_step": 53197, "epoch": 1266} {"train_loss": -5.953828811645508, "global_step": 53198, "epoch": 1266} {"train_loss": -5.797865867614746, "global_step": 53199, "epoch": 1266} {"train_loss": -5.764146327972412, "global_step": 53200, "epoch": 1266} {"train_loss": -5.741344928741455, "global_step": 53201, "epoch": 1266} {"train_loss": -5.696966648101807, "global_step": 53202, "epoch": 1266} {"train_loss": -5.63621187210083, "global_step": 53203, "epoch": 1266} {"train_loss": -5.917665481567383, "global_step": 53204, "epoch": 1266} {"train_loss": -5.65721321105957, "global_step": 53205, "epoch": 1266} {"train_loss": -5.663150787353516, "global_step": 53206, "epoch": 1266} {"train_loss": -5.894153594970703, "global_step": 53207, "epoch": 1266} {"train_loss": -5.518411636352539, "global_step": 53208, "epoch": 1266} {"train_loss": -5.795583248138428, "global_step": 53209, "epoch": 1266} {"train_loss": -5.765300750732422, "global_step": 53210, "epoch": 1266} {"train_loss": -5.639235496520996, "global_step": 53211, "epoch": 1266} {"train_loss": -5.91253662109375, "global_step": 53212, "epoch": 1266} {"train_loss": -5.788403760819208, "global_step": 53213, "epoch": 1266, "val_loss": 61446.5390625} {"train_loss": -5.874072551727295, "global_step": 53214, "epoch": 1267} {"train_loss": -5.620207786560059, "global_step": 53215, "epoch": 1267} {"train_loss": -5.83074951171875, "global_step": 53216, "epoch": 1267} {"train_loss": -5.742483615875244, "global_step": 53217, "epoch": 1267} {"train_loss": -5.7198405265808105, "global_step": 53218, "epoch": 1267} {"train_loss": -5.76314640045166, "global_step": 53219, "epoch": 1267} {"train_loss": -5.763932228088379, "global_step": 53220, "epoch": 1267} {"train_loss": -5.729416847229004, "global_step": 53221, "epoch": 1267} {"train_loss": -5.761456489562988, "global_step": 53222, "epoch": 1267} {"train_loss": -5.867731094360352, "global_step": 53223, "epoch": 1267} {"train_loss": -5.700686931610107, "global_step": 53224, "epoch": 1267} {"train_loss": -5.787947654724121, "global_step": 53225, "epoch": 1267} {"train_loss": -5.842213153839111, "global_step": 53226, "epoch": 1267} {"train_loss": -5.833108901977539, "global_step": 53227, "epoch": 1267} {"train_loss": -5.830964088439941, "global_step": 53228, "epoch": 1267} {"train_loss": -5.7805633544921875, "global_step": 53229, "epoch": 1267} {"train_loss": -5.6947340965271, "global_step": 53230, "epoch": 1267} {"train_loss": -5.777003765106201, "global_step": 53231, "epoch": 1267} {"train_loss": -5.909363746643066, "global_step": 53232, "epoch": 1267} {"train_loss": -5.656238555908203, "global_step": 53233, "epoch": 1267} {"train_loss": -5.86651611328125, "global_step": 53234, "epoch": 1267} {"train_loss": -5.743826866149902, "global_step": 53235, "epoch": 1267} {"train_loss": -5.763762474060059, "global_step": 53236, "epoch": 1267} {"train_loss": -5.846138954162598, "global_step": 53237, "epoch": 1267} {"train_loss": -5.744887351989746, "global_step": 53238, "epoch": 1267} {"train_loss": -5.70150089263916, "global_step": 53239, "epoch": 1267} {"train_loss": -5.848512649536133, "global_step": 53240, "epoch": 1267} {"train_loss": -5.683133125305176, "global_step": 53241, "epoch": 1267} {"train_loss": -5.850964546203613, "global_step": 53242, "epoch": 1267} {"train_loss": -5.7026567459106445, "global_step": 53243, "epoch": 1267} {"train_loss": -5.751870155334473, "global_step": 53244, "epoch": 1267} {"train_loss": -5.792807579040527, "global_step": 53245, "epoch": 1267} {"train_loss": -5.68718147277832, "global_step": 53246, "epoch": 1267} {"train_loss": -5.7756218910217285, "global_step": 53247, "epoch": 1267} {"train_loss": -5.8045172691345215, "global_step": 53248, "epoch": 1267} {"train_loss": -5.805871486663818, "global_step": 53249, "epoch": 1267} {"train_loss": -5.814640045166016, "global_step": 53250, "epoch": 1267} {"train_loss": -5.819433212280273, "global_step": 53251, "epoch": 1267} {"train_loss": -5.750169277191162, "global_step": 53252, "epoch": 1267} {"train_loss": -5.772982120513916, "global_step": 53253, "epoch": 1267} {"train_loss": -5.767031192779541, "global_step": 53254, "epoch": 1267} {"train_loss": -5.774935892650059, "global_step": 53255, "epoch": 1267, "val_loss": 61824.9453125} {"train_loss": -5.823237419128418, "global_step": 53256, "epoch": 1268} {"train_loss": -5.730443000793457, "global_step": 53257, "epoch": 1268} {"train_loss": -5.6914777755737305, "global_step": 53258, "epoch": 1268} {"train_loss": -5.836467742919922, "global_step": 53259, "epoch": 1268} {"train_loss": -5.802131652832031, "global_step": 53260, "epoch": 1268} {"train_loss": -5.714290618896484, "global_step": 53261, "epoch": 1268} {"train_loss": -5.885981559753418, "global_step": 53262, "epoch": 1268} {"train_loss": -5.838924884796143, "global_step": 53263, "epoch": 1268} {"train_loss": -5.765810012817383, "global_step": 53264, "epoch": 1268} {"train_loss": -5.921181678771973, "global_step": 53265, "epoch": 1268} {"train_loss": -5.800696849822998, "global_step": 53266, "epoch": 1268} {"train_loss": -5.712573051452637, "global_step": 53267, "epoch": 1268} {"train_loss": -5.7014617919921875, "global_step": 53268, "epoch": 1268} {"train_loss": -5.738928318023682, "global_step": 53269, "epoch": 1268} {"train_loss": -5.966337203979492, "global_step": 53270, "epoch": 1268} {"train_loss": -5.743875503540039, "global_step": 53271, "epoch": 1268} {"train_loss": -5.8234100341796875, "global_step": 53272, "epoch": 1268} {"train_loss": -5.703166484832764, "global_step": 53273, "epoch": 1268} {"train_loss": -5.844425201416016, "global_step": 53274, "epoch": 1268} {"train_loss": -5.758273601531982, "global_step": 53275, "epoch": 1268} {"train_loss": -5.798328399658203, "global_step": 53276, "epoch": 1268} {"train_loss": -5.780867576599121, "global_step": 53277, "epoch": 1268} {"train_loss": -5.7976484298706055, "global_step": 53278, "epoch": 1268} {"train_loss": -5.8694539070129395, "global_step": 53279, "epoch": 1268} {"train_loss": -5.871324062347412, "global_step": 53280, "epoch": 1268} {"train_loss": -5.921849727630615, "global_step": 53281, "epoch": 1268} {"train_loss": -5.741177082061768, "global_step": 53282, "epoch": 1268} {"train_loss": -5.772916793823242, "global_step": 53283, "epoch": 1268} {"train_loss": -5.9402971267700195, "global_step": 53284, "epoch": 1268} {"train_loss": -5.806532859802246, "global_step": 53285, "epoch": 1268} {"train_loss": -5.68106746673584, "global_step": 53286, "epoch": 1268} {"train_loss": -5.8126349449157715, "global_step": 53287, "epoch": 1268} {"train_loss": -5.812944412231445, "global_step": 53288, "epoch": 1268} {"train_loss": -5.730926513671875, "global_step": 53289, "epoch": 1268} {"train_loss": -5.85253381729126, "global_step": 53290, "epoch": 1268} {"train_loss": -5.651219367980957, "global_step": 53291, "epoch": 1268} {"train_loss": -5.843137264251709, "global_step": 53292, "epoch": 1268} {"train_loss": -5.851840972900391, "global_step": 53293, "epoch": 1268} {"train_loss": -5.728019714355469, "global_step": 53294, "epoch": 1268} {"train_loss": -5.852565765380859, "global_step": 53295, "epoch": 1268} {"train_loss": -5.737850189208984, "global_step": 53296, "epoch": 1268} {"train_loss": -5.796298969359625, "global_step": 53297, "epoch": 1268, "val_loss": 61615.89453125} {"train_loss": -5.829845905303955, "global_step": 53298, "epoch": 1269} {"train_loss": -5.711775779724121, "global_step": 53299, "epoch": 1269} {"train_loss": -5.9408159255981445, "global_step": 53300, "epoch": 1269} {"train_loss": -5.794089317321777, "global_step": 53301, "epoch": 1269} {"train_loss": -5.8608503341674805, "global_step": 53302, "epoch": 1269} {"train_loss": -5.844876289367676, "global_step": 53303, "epoch": 1269} {"train_loss": -5.860253810882568, "global_step": 53304, "epoch": 1269} {"train_loss": -5.825709342956543, "global_step": 53305, "epoch": 1269} {"train_loss": -5.863112449645996, "global_step": 53306, "epoch": 1269} {"train_loss": -5.773950099945068, "global_step": 53307, "epoch": 1269} {"train_loss": -5.77069616317749, "global_step": 53308, "epoch": 1269} {"train_loss": -5.7771806716918945, "global_step": 53309, "epoch": 1269} {"train_loss": -5.736936569213867, "global_step": 53310, "epoch": 1269} {"train_loss": -5.745261192321777, "global_step": 53311, "epoch": 1269} {"train_loss": -5.876473426818848, "global_step": 53312, "epoch": 1269} {"train_loss": -5.890111446380615, "global_step": 53313, "epoch": 1269} {"train_loss": -5.847984313964844, "global_step": 53314, "epoch": 1269} {"train_loss": -5.90359354019165, "global_step": 53315, "epoch": 1269} {"train_loss": -5.868523597717285, "global_step": 53316, "epoch": 1269} {"train_loss": -5.907672882080078, "global_step": 53317, "epoch": 1269} {"train_loss": -5.879329681396484, "global_step": 53318, "epoch": 1269} {"train_loss": -5.77377462387085, "global_step": 53319, "epoch": 1269} {"train_loss": -5.752501487731934, "global_step": 53320, "epoch": 1269} {"train_loss": -5.8811445236206055, "global_step": 53321, "epoch": 1269} {"train_loss": -5.947141170501709, "global_step": 53322, "epoch": 1269} {"train_loss": -5.903326511383057, "global_step": 53323, "epoch": 1269} {"train_loss": -5.842445373535156, "global_step": 53324, "epoch": 1269} {"train_loss": -5.871866703033447, "global_step": 53325, "epoch": 1269} {"train_loss": -5.855971336364746, "global_step": 53326, "epoch": 1269} {"train_loss": -5.845362663269043, "global_step": 53327, "epoch": 1269} {"train_loss": -5.931499004364014, "global_step": 53328, "epoch": 1269} {"train_loss": -5.806021213531494, "global_step": 53329, "epoch": 1269} {"train_loss": -5.946801662445068, "global_step": 53330, "epoch": 1269} {"train_loss": -5.942654609680176, "global_step": 53331, "epoch": 1269} {"train_loss": -5.751178741455078, "global_step": 53332, "epoch": 1269} {"train_loss": -5.779126167297363, "global_step": 53333, "epoch": 1269} {"train_loss": -5.767815589904785, "global_step": 53334, "epoch": 1269} {"train_loss": -5.756374359130859, "global_step": 53335, "epoch": 1269} {"train_loss": -5.88163948059082, "global_step": 53336, "epoch": 1269} {"train_loss": -5.83176326751709, "global_step": 53337, "epoch": 1269} {"train_loss": -5.958354949951172, "global_step": 53338, "epoch": 1269} {"train_loss": -5.841501122429257, "global_step": 53339, "epoch": 1269, "val_loss": 61167.59375} {"train_loss": -5.846343994140625, "global_step": 53340, "epoch": 1270} {"train_loss": -5.922208786010742, "global_step": 53341, "epoch": 1270} {"train_loss": -5.909704685211182, "global_step": 53342, "epoch": 1270} {"train_loss": -5.80070686340332, "global_step": 53343, "epoch": 1270} {"train_loss": -5.7804999351501465, "global_step": 53344, "epoch": 1270} {"train_loss": -5.839794635772705, "global_step": 53345, "epoch": 1270} {"train_loss": -5.751224040985107, "global_step": 53346, "epoch": 1270} {"train_loss": -5.723182678222656, "global_step": 53347, "epoch": 1270} {"train_loss": -5.875682830810547, "global_step": 53348, "epoch": 1270} {"train_loss": -5.7384490966796875, "global_step": 53349, "epoch": 1270} {"train_loss": -5.881566047668457, "global_step": 53350, "epoch": 1270} {"train_loss": -5.736716270446777, "global_step": 53351, "epoch": 1270} {"train_loss": -5.826752662658691, "global_step": 53352, "epoch": 1270} {"train_loss": -5.901773452758789, "global_step": 53353, "epoch": 1270} {"train_loss": -5.902456760406494, "global_step": 53354, "epoch": 1270} {"train_loss": -5.924242973327637, "global_step": 53355, "epoch": 1270} {"train_loss": -5.823967933654785, "global_step": 53356, "epoch": 1270} {"train_loss": -5.822399139404297, "global_step": 53357, "epoch": 1270} {"train_loss": -5.826116561889648, "global_step": 53358, "epoch": 1270} {"train_loss": -5.855227470397949, "global_step": 53359, "epoch": 1270} {"train_loss": -5.845495223999023, "global_step": 53360, "epoch": 1270} {"train_loss": -5.9334869384765625, "global_step": 53361, "epoch": 1270} {"train_loss": -5.933758735656738, "global_step": 53362, "epoch": 1270} {"train_loss": -5.802980899810791, "global_step": 53363, "epoch": 1270} {"train_loss": -5.859988689422607, "global_step": 53364, "epoch": 1270} {"train_loss": -5.885360240936279, "global_step": 53365, "epoch": 1270} {"train_loss": -5.728673934936523, "global_step": 53366, "epoch": 1270} {"train_loss": -5.994377613067627, "global_step": 53367, "epoch": 1270} {"train_loss": -5.911403179168701, "global_step": 53368, "epoch": 1270} {"train_loss": -5.771660327911377, "global_step": 53369, "epoch": 1270} {"train_loss": -5.862039089202881, "global_step": 53370, "epoch": 1270} {"train_loss": -5.78797721862793, "global_step": 53371, "epoch": 1270} {"train_loss": -5.933125019073486, "global_step": 53372, "epoch": 1270} {"train_loss": -5.709452152252197, "global_step": 53373, "epoch": 1270} {"train_loss": -5.826967716217041, "global_step": 53374, "epoch": 1270} {"train_loss": -5.693374156951904, "global_step": 53375, "epoch": 1270} {"train_loss": -5.917446136474609, "global_step": 53376, "epoch": 1270} {"train_loss": -5.811401844024658, "global_step": 53377, "epoch": 1270} {"train_loss": -5.829644203186035, "global_step": 53378, "epoch": 1270} {"train_loss": -5.868044376373291, "global_step": 53379, "epoch": 1270} {"train_loss": -5.674714088439941, "global_step": 53380, "epoch": 1270} {"train_loss": -5.836540687651861, "global_step": 53381, "epoch": 1270, "val_loss": 61957.90625} {"train_loss": -5.79609489440918, "global_step": 53382, "epoch": 1271} {"train_loss": -5.721504211425781, "global_step": 53383, "epoch": 1271} {"train_loss": -5.876355171203613, "global_step": 53384, "epoch": 1271} {"train_loss": -5.784343719482422, "global_step": 53385, "epoch": 1271} {"train_loss": -5.751743793487549, "global_step": 53386, "epoch": 1271} {"train_loss": -5.844542503356934, "global_step": 53387, "epoch": 1271} {"train_loss": -5.839439392089844, "global_step": 53388, "epoch": 1271} {"train_loss": -5.880974292755127, "global_step": 53389, "epoch": 1271} {"train_loss": -5.797284126281738, "global_step": 53390, "epoch": 1271} {"train_loss": -5.734004497528076, "global_step": 53391, "epoch": 1271} {"train_loss": -5.8384552001953125, "global_step": 53392, "epoch": 1271} {"train_loss": -5.879621982574463, "global_step": 53393, "epoch": 1271} {"train_loss": -5.829145908355713, "global_step": 53394, "epoch": 1271} {"train_loss": -5.892432689666748, "global_step": 53395, "epoch": 1271} {"train_loss": -5.825333118438721, "global_step": 53396, "epoch": 1271} {"train_loss": -5.854954719543457, "global_step": 53397, "epoch": 1271} {"train_loss": -5.811090469360352, "global_step": 53398, "epoch": 1271} {"train_loss": -5.8395233154296875, "global_step": 53399, "epoch": 1271} {"train_loss": -5.874214172363281, "global_step": 53400, "epoch": 1271} {"train_loss": -5.93058967590332, "global_step": 53401, "epoch": 1271} {"train_loss": -5.8167619705200195, "global_step": 53402, "epoch": 1271} {"train_loss": -5.846324920654297, "global_step": 53403, "epoch": 1271} {"train_loss": -5.932011127471924, "global_step": 53404, "epoch": 1271} {"train_loss": -5.906211853027344, "global_step": 53405, "epoch": 1271} {"train_loss": -5.768462181091309, "global_step": 53406, "epoch": 1271} {"train_loss": -5.8285980224609375, "global_step": 53407, "epoch": 1271} {"train_loss": -5.845052719116211, "global_step": 53408, "epoch": 1271} {"train_loss": -5.782291412353516, "global_step": 53409, "epoch": 1271} {"train_loss": -5.768596649169922, "global_step": 53410, "epoch": 1271} {"train_loss": -5.809072494506836, "global_step": 53411, "epoch": 1271} {"train_loss": -5.785869598388672, "global_step": 53412, "epoch": 1271} {"train_loss": -5.816633224487305, "global_step": 53413, "epoch": 1271} {"train_loss": -5.797771453857422, "global_step": 53414, "epoch": 1271} {"train_loss": -5.872357368469238, "global_step": 53415, "epoch": 1271} {"train_loss": -5.9626078605651855, "global_step": 53416, "epoch": 1271} {"train_loss": -5.902822494506836, "global_step": 53417, "epoch": 1271} {"train_loss": -5.802611827850342, "global_step": 53418, "epoch": 1271} {"train_loss": -5.769050598144531, "global_step": 53419, "epoch": 1271} {"train_loss": -5.645822525024414, "global_step": 53420, "epoch": 1271} {"train_loss": -5.710467338562012, "global_step": 53421, "epoch": 1271} {"train_loss": -5.766204833984375, "global_step": 53422, "epoch": 1271} {"train_loss": -5.821292434419904, "global_step": 53423, "epoch": 1271, "val_loss": 61584.21875} {"train_loss": -5.782040119171143, "global_step": 53424, "epoch": 1272} {"train_loss": -5.769052505493164, "global_step": 53425, "epoch": 1272} {"train_loss": -5.797080993652344, "global_step": 53426, "epoch": 1272} {"train_loss": -5.780157089233398, "global_step": 53427, "epoch": 1272} {"train_loss": -5.843780517578125, "global_step": 53428, "epoch": 1272} {"train_loss": -5.763393402099609, "global_step": 53429, "epoch": 1272} {"train_loss": -5.877681255340576, "global_step": 53430, "epoch": 1272} {"train_loss": -5.841244220733643, "global_step": 53431, "epoch": 1272} {"train_loss": -5.836909294128418, "global_step": 53432, "epoch": 1272} {"train_loss": -5.914046287536621, "global_step": 53433, "epoch": 1272} {"train_loss": -5.79878568649292, "global_step": 53434, "epoch": 1272} {"train_loss": -5.810014247894287, "global_step": 53435, "epoch": 1272} {"train_loss": -5.7435784339904785, "global_step": 53436, "epoch": 1272} {"train_loss": -5.750112056732178, "global_step": 53437, "epoch": 1272} {"train_loss": -5.77902364730835, "global_step": 53438, "epoch": 1272} {"train_loss": -5.939933776855469, "global_step": 53439, "epoch": 1272} {"train_loss": -5.923989295959473, "global_step": 53440, "epoch": 1272} {"train_loss": -5.8233160972595215, "global_step": 53441, "epoch": 1272} {"train_loss": -5.886868953704834, "global_step": 53442, "epoch": 1272} {"train_loss": -5.775087356567383, "global_step": 53443, "epoch": 1272} {"train_loss": -5.836892604827881, "global_step": 53444, "epoch": 1272} {"train_loss": -5.9250288009643555, "global_step": 53445, "epoch": 1272} {"train_loss": -5.860123634338379, "global_step": 53446, "epoch": 1272} {"train_loss": -5.884283065795898, "global_step": 53447, "epoch": 1272} {"train_loss": -5.783788681030273, "global_step": 53448, "epoch": 1272} {"train_loss": -5.826119422912598, "global_step": 53449, "epoch": 1272} {"train_loss": -5.803925037384033, "global_step": 53450, "epoch": 1272} {"train_loss": -5.83247184753418, "global_step": 53451, "epoch": 1272} {"train_loss": -5.743047714233398, "global_step": 53452, "epoch": 1272} {"train_loss": -5.835424423217773, "global_step": 53453, "epoch": 1272} {"train_loss": -5.876792907714844, "global_step": 53454, "epoch": 1272} {"train_loss": -5.791775703430176, "global_step": 53455, "epoch": 1272} {"train_loss": -5.809012413024902, "global_step": 53456, "epoch": 1272} {"train_loss": -5.83681583404541, "global_step": 53457, "epoch": 1272} {"train_loss": -6.016056060791016, "global_step": 53458, "epoch": 1272} {"train_loss": -5.780107498168945, "global_step": 53459, "epoch": 1272} {"train_loss": -5.912623405456543, "global_step": 53460, "epoch": 1272} {"train_loss": -5.804014682769775, "global_step": 53461, "epoch": 1272} {"train_loss": -5.7563581466674805, "global_step": 53462, "epoch": 1272} {"train_loss": -5.765761375427246, "global_step": 53463, "epoch": 1272} {"train_loss": -5.813816547393799, "global_step": 53464, "epoch": 1272} {"train_loss": -5.828257628849575, "global_step": 53465, "epoch": 1272, "val_loss": 61386.23046875} {"train_loss": -5.9187421798706055, "global_step": 53466, "epoch": 1273} {"train_loss": -5.724459648132324, "global_step": 53467, "epoch": 1273} {"train_loss": -5.779763698577881, "global_step": 53468, "epoch": 1273} {"train_loss": -5.759952068328857, "global_step": 53469, "epoch": 1273} {"train_loss": -5.763202667236328, "global_step": 53470, "epoch": 1273} {"train_loss": -5.793321132659912, "global_step": 53471, "epoch": 1273} {"train_loss": -5.796641826629639, "global_step": 53472, "epoch": 1273} {"train_loss": -5.900224208831787, "global_step": 53473, "epoch": 1273} {"train_loss": -5.913685321807861, "global_step": 53474, "epoch": 1273} {"train_loss": -5.838565826416016, "global_step": 53475, "epoch": 1273} {"train_loss": -5.85366153717041, "global_step": 53476, "epoch": 1273} {"train_loss": -5.950657844543457, "global_step": 53477, "epoch": 1273} {"train_loss": -5.839361190795898, "global_step": 53478, "epoch": 1273} {"train_loss": -5.877035617828369, "global_step": 53479, "epoch": 1273} {"train_loss": -5.905822277069092, "global_step": 53480, "epoch": 1273} {"train_loss": -5.801288604736328, "global_step": 53481, "epoch": 1273} {"train_loss": -5.919175148010254, "global_step": 53482, "epoch": 1273} {"train_loss": -5.81573486328125, "global_step": 53483, "epoch": 1273} {"train_loss": -5.839508056640625, "global_step": 53484, "epoch": 1273} {"train_loss": -5.749086380004883, "global_step": 53485, "epoch": 1273} {"train_loss": -5.768233776092529, "global_step": 53486, "epoch": 1273} {"train_loss": -5.952749729156494, "global_step": 53487, "epoch": 1273} {"train_loss": -5.989226341247559, "global_step": 53488, "epoch": 1273} {"train_loss": -5.900688171386719, "global_step": 53489, "epoch": 1273} {"train_loss": -5.862390041351318, "global_step": 53490, "epoch": 1273} {"train_loss": -5.8438639640808105, "global_step": 53491, "epoch": 1273} {"train_loss": -5.785916328430176, "global_step": 53492, "epoch": 1273} {"train_loss": -5.792880058288574, "global_step": 53493, "epoch": 1273} {"train_loss": -5.766067028045654, "global_step": 53494, "epoch": 1273} {"train_loss": -5.755786895751953, "global_step": 53495, "epoch": 1273} {"train_loss": -5.867806434631348, "global_step": 53496, "epoch": 1273} {"train_loss": -5.830913543701172, "global_step": 53497, "epoch": 1273} {"train_loss": -5.758080005645752, "global_step": 53498, "epoch": 1273} {"train_loss": -5.827777862548828, "global_step": 53499, "epoch": 1273} {"train_loss": -5.983310699462891, "global_step": 53500, "epoch": 1273} {"train_loss": -5.66700553894043, "global_step": 53501, "epoch": 1273} {"train_loss": -5.750480651855469, "global_step": 53502, "epoch": 1273} {"train_loss": -5.880633354187012, "global_step": 53503, "epoch": 1273} {"train_loss": -5.664150238037109, "global_step": 53504, "epoch": 1273} {"train_loss": -5.827635288238525, "global_step": 53505, "epoch": 1273} {"train_loss": -5.9170308113098145, "global_step": 53506, "epoch": 1273} {"train_loss": -5.832944347744896, "global_step": 53507, "epoch": 1273, "val_loss": 61545.296875} {"train_loss": -5.862817764282227, "global_step": 53508, "epoch": 1274} {"train_loss": -5.753719806671143, "global_step": 53509, "epoch": 1274} {"train_loss": -5.864684104919434, "global_step": 53510, "epoch": 1274} {"train_loss": -5.724313735961914, "global_step": 53511, "epoch": 1274} {"train_loss": -5.788168907165527, "global_step": 53512, "epoch": 1274} {"train_loss": -5.693958282470703, "global_step": 53513, "epoch": 1274} {"train_loss": -5.785550117492676, "global_step": 53514, "epoch": 1274} {"train_loss": -5.824300765991211, "global_step": 53515, "epoch": 1274} {"train_loss": -5.8412861824035645, "global_step": 53516, "epoch": 1274} {"train_loss": -5.900727272033691, "global_step": 53517, "epoch": 1274} {"train_loss": -5.800292015075684, "global_step": 53518, "epoch": 1274} {"train_loss": -5.6895599365234375, "global_step": 53519, "epoch": 1274} {"train_loss": -5.812384605407715, "global_step": 53520, "epoch": 1274} {"train_loss": -5.8220930099487305, "global_step": 53521, "epoch": 1274} {"train_loss": -5.823969841003418, "global_step": 53522, "epoch": 1274} {"train_loss": -5.786503791809082, "global_step": 53523, "epoch": 1274} {"train_loss": -5.931491851806641, "global_step": 53524, "epoch": 1274} {"train_loss": -5.739785194396973, "global_step": 53525, "epoch": 1274} {"train_loss": -5.766939163208008, "global_step": 53526, "epoch": 1274} {"train_loss": -5.918157577514648, "global_step": 53527, "epoch": 1274} {"train_loss": -5.75148868560791, "global_step": 53528, "epoch": 1274} {"train_loss": -5.8393144607543945, "global_step": 53529, "epoch": 1274} {"train_loss": -5.78239631652832, "global_step": 53530, "epoch": 1274} {"train_loss": -5.9411940574646, "global_step": 53531, "epoch": 1274} {"train_loss": -6.001480579376221, "global_step": 53532, "epoch": 1274} {"train_loss": -5.791795253753662, "global_step": 53533, "epoch": 1274} {"train_loss": -5.775729179382324, "global_step": 53534, "epoch": 1274} {"train_loss": -5.760934352874756, "global_step": 53535, "epoch": 1274} {"train_loss": -5.861556053161621, "global_step": 53536, "epoch": 1274} {"train_loss": -5.902708530426025, "global_step": 53537, "epoch": 1274} {"train_loss": -5.841214656829834, "global_step": 53538, "epoch": 1274} {"train_loss": -5.9770684242248535, "global_step": 53539, "epoch": 1274} {"train_loss": -5.780388355255127, "global_step": 53540, "epoch": 1274} {"train_loss": -5.879211902618408, "global_step": 53541, "epoch": 1274} {"train_loss": -5.9018683433532715, "global_step": 53542, "epoch": 1274} {"train_loss": -5.715945243835449, "global_step": 53543, "epoch": 1274} {"train_loss": -5.825899600982666, "global_step": 53544, "epoch": 1274} {"train_loss": -5.882907390594482, "global_step": 53545, "epoch": 1274} {"train_loss": -5.873392581939697, "global_step": 53546, "epoch": 1274} {"train_loss": -5.884761810302734, "global_step": 53547, "epoch": 1274} {"train_loss": -5.78319787979126, "global_step": 53548, "epoch": 1274} {"train_loss": -5.827571164994013, "global_step": 53549, "epoch": 1274, "val_loss": 61413.96875} {"train_loss": -5.908737659454346, "global_step": 53550, "epoch": 1275} {"train_loss": -5.787590026855469, "global_step": 53551, "epoch": 1275} {"train_loss": -5.9972734451293945, "global_step": 53552, "epoch": 1275} {"train_loss": -5.7942914962768555, "global_step": 53553, "epoch": 1275} {"train_loss": -5.684520244598389, "global_step": 53554, "epoch": 1275} {"train_loss": -5.91571044921875, "global_step": 53555, "epoch": 1275} {"train_loss": -5.747578144073486, "global_step": 53556, "epoch": 1275} {"train_loss": -5.610952377319336, "global_step": 53557, "epoch": 1275} {"train_loss": -5.912792205810547, "global_step": 53558, "epoch": 1275} {"train_loss": -5.6919846534729, "global_step": 53559, "epoch": 1275} {"train_loss": -5.887016296386719, "global_step": 53560, "epoch": 1275} {"train_loss": -5.746380805969238, "global_step": 53561, "epoch": 1275} {"train_loss": -5.69979190826416, "global_step": 53562, "epoch": 1275} {"train_loss": -5.885502815246582, "global_step": 53563, "epoch": 1275} {"train_loss": -5.670505523681641, "global_step": 53564, "epoch": 1275} {"train_loss": -5.714795112609863, "global_step": 53565, "epoch": 1275} {"train_loss": -5.843472480773926, "global_step": 53566, "epoch": 1275} {"train_loss": -5.6904683113098145, "global_step": 53567, "epoch": 1275} {"train_loss": -5.8718366622924805, "global_step": 53568, "epoch": 1275} {"train_loss": -5.8419318199157715, "global_step": 53569, "epoch": 1275} {"train_loss": -5.811420440673828, "global_step": 53570, "epoch": 1275} {"train_loss": -5.822645664215088, "global_step": 53571, "epoch": 1275} {"train_loss": -5.801068305969238, "global_step": 53572, "epoch": 1275} {"train_loss": -5.900773525238037, "global_step": 53573, "epoch": 1275} {"train_loss": -5.735147476196289, "global_step": 53574, "epoch": 1275} {"train_loss": -5.788145065307617, "global_step": 53575, "epoch": 1275} {"train_loss": -5.709179878234863, "global_step": 53576, "epoch": 1275} {"train_loss": -5.852193832397461, "global_step": 53577, "epoch": 1275} {"train_loss": -5.830771446228027, "global_step": 53578, "epoch": 1275} {"train_loss": -5.8142290115356445, "global_step": 53579, "epoch": 1275} {"train_loss": -5.746087551116943, "global_step": 53580, "epoch": 1275} {"train_loss": -5.821797847747803, "global_step": 53581, "epoch": 1275} {"train_loss": -5.763543128967285, "global_step": 53582, "epoch": 1275} {"train_loss": -5.7554826736450195, "global_step": 53583, "epoch": 1275} {"train_loss": -5.824010848999023, "global_step": 53584, "epoch": 1275} {"train_loss": -5.930898189544678, "global_step": 53585, "epoch": 1275} {"train_loss": -5.779854774475098, "global_step": 53586, "epoch": 1275} {"train_loss": -5.764642238616943, "global_step": 53587, "epoch": 1275} {"train_loss": -5.840362548828125, "global_step": 53588, "epoch": 1275} {"train_loss": -5.636023998260498, "global_step": 53589, "epoch": 1275} {"train_loss": -5.837997913360596, "global_step": 53590, "epoch": 1275} {"train_loss": -5.797754730497088, "global_step": 53591, "epoch": 1275, "val_loss": 61680.25390625} {"train_loss": -5.737978935241699, "global_step": 53592, "epoch": 1276} {"train_loss": -5.755616188049316, "global_step": 53593, "epoch": 1276} {"train_loss": -5.889873027801514, "global_step": 53594, "epoch": 1276} {"train_loss": -5.8005194664001465, "global_step": 53595, "epoch": 1276} {"train_loss": -5.84331750869751, "global_step": 53596, "epoch": 1276} {"train_loss": -5.850231647491455, "global_step": 53597, "epoch": 1276} {"train_loss": -5.780220985412598, "global_step": 53598, "epoch": 1276} {"train_loss": -5.727416515350342, "global_step": 53599, "epoch": 1276} {"train_loss": -5.802874565124512, "global_step": 53600, "epoch": 1276} {"train_loss": -5.782331943511963, "global_step": 53601, "epoch": 1276} {"train_loss": -5.909264087677002, "global_step": 53602, "epoch": 1276} {"train_loss": -5.985236167907715, "global_step": 53603, "epoch": 1276} {"train_loss": -5.821243762969971, "global_step": 53604, "epoch": 1276} {"train_loss": -5.816095352172852, "global_step": 53605, "epoch": 1276} {"train_loss": -5.7798542976379395, "global_step": 53606, "epoch": 1276} {"train_loss": -5.81392240524292, "global_step": 53607, "epoch": 1276} {"train_loss": -5.81695556640625, "global_step": 53608, "epoch": 1276} {"train_loss": -5.722049713134766, "global_step": 53609, "epoch": 1276} {"train_loss": -5.834211349487305, "global_step": 53610, "epoch": 1276} {"train_loss": -5.859657287597656, "global_step": 53611, "epoch": 1276} {"train_loss": -5.813690185546875, "global_step": 53612, "epoch": 1276} {"train_loss": -5.866166114807129, "global_step": 53613, "epoch": 1276} {"train_loss": -5.702384948730469, "global_step": 53614, "epoch": 1276} {"train_loss": -5.75010871887207, "global_step": 53615, "epoch": 1276} {"train_loss": -5.757822036743164, "global_step": 53616, "epoch": 1276} {"train_loss": -5.843076705932617, "global_step": 53617, "epoch": 1276} {"train_loss": -5.79221248626709, "global_step": 53618, "epoch": 1276} {"train_loss": -5.902583122253418, "global_step": 53619, "epoch": 1276} {"train_loss": -5.738977432250977, "global_step": 53620, "epoch": 1276} {"train_loss": -5.830438613891602, "global_step": 53621, "epoch": 1276} {"train_loss": -5.769634246826172, "global_step": 53622, "epoch": 1276} {"train_loss": -5.725193977355957, "global_step": 53623, "epoch": 1276} {"train_loss": -5.822983264923096, "global_step": 53624, "epoch": 1276} {"train_loss": -5.873164176940918, "global_step": 53625, "epoch": 1276} {"train_loss": -5.813014030456543, "global_step": 53626, "epoch": 1276} {"train_loss": -5.896997451782227, "global_step": 53627, "epoch": 1276} {"train_loss": -5.947783470153809, "global_step": 53628, "epoch": 1276} {"train_loss": -5.881640434265137, "global_step": 53629, "epoch": 1276} {"train_loss": -5.752120018005371, "global_step": 53630, "epoch": 1276} {"train_loss": -5.838079452514648, "global_step": 53631, "epoch": 1276} {"train_loss": -5.763038635253906, "global_step": 53632, "epoch": 1276} {"train_loss": -5.814680633090791, "global_step": 53633, "epoch": 1276, "val_loss": 61467.74609375} {"train_loss": -5.890042781829834, "global_step": 53634, "epoch": 1277} {"train_loss": -5.857081413269043, "global_step": 53635, "epoch": 1277} {"train_loss": -5.730759143829346, "global_step": 53636, "epoch": 1277} {"train_loss": -5.8281569480896, "global_step": 53637, "epoch": 1277} {"train_loss": -5.7815775871276855, "global_step": 53638, "epoch": 1277} {"train_loss": -5.855690002441406, "global_step": 53639, "epoch": 1277} {"train_loss": -5.742157936096191, "global_step": 53640, "epoch": 1277} {"train_loss": -5.778105735778809, "global_step": 53641, "epoch": 1277} {"train_loss": -5.7375640869140625, "global_step": 53642, "epoch": 1277} {"train_loss": -5.8579630851745605, "global_step": 53643, "epoch": 1277} {"train_loss": -5.860786437988281, "global_step": 53644, "epoch": 1277} {"train_loss": -5.773566722869873, "global_step": 53645, "epoch": 1277} {"train_loss": -5.736342430114746, "global_step": 53646, "epoch": 1277} {"train_loss": -5.863628387451172, "global_step": 53647, "epoch": 1277} {"train_loss": -5.886927604675293, "global_step": 53648, "epoch": 1277} {"train_loss": -5.850615978240967, "global_step": 53649, "epoch": 1277} {"train_loss": -5.798594951629639, "global_step": 53650, "epoch": 1277} {"train_loss": -5.867854118347168, "global_step": 53651, "epoch": 1277} {"train_loss": -5.944028377532959, "global_step": 53652, "epoch": 1277} {"train_loss": -5.939693450927734, "global_step": 53653, "epoch": 1277} {"train_loss": -5.904695987701416, "global_step": 53654, "epoch": 1277} {"train_loss": -5.914333820343018, "global_step": 53655, "epoch": 1277} {"train_loss": -5.840909004211426, "global_step": 53656, "epoch": 1277} {"train_loss": -5.8859405517578125, "global_step": 53657, "epoch": 1277} {"train_loss": -5.865106582641602, "global_step": 53658, "epoch": 1277} {"train_loss": -5.962201118469238, "global_step": 53659, "epoch": 1277} {"train_loss": -5.793437480926514, "global_step": 53660, "epoch": 1277} {"train_loss": -5.746130466461182, "global_step": 53661, "epoch": 1277} {"train_loss": -5.770627021789551, "global_step": 53662, "epoch": 1277} {"train_loss": -5.755847930908203, "global_step": 53663, "epoch": 1277} {"train_loss": -5.88002872467041, "global_step": 53664, "epoch": 1277} {"train_loss": -5.871705532073975, "global_step": 53665, "epoch": 1277} {"train_loss": -5.851858615875244, "global_step": 53666, "epoch": 1277} {"train_loss": -5.737234592437744, "global_step": 53667, "epoch": 1277} {"train_loss": -5.92152214050293, "global_step": 53668, "epoch": 1277} {"train_loss": -5.785098075866699, "global_step": 53669, "epoch": 1277} {"train_loss": -5.827042579650879, "global_step": 53670, "epoch": 1277} {"train_loss": -5.817713737487793, "global_step": 53671, "epoch": 1277} {"train_loss": -5.798655033111572, "global_step": 53672, "epoch": 1277} {"train_loss": -5.677639961242676, "global_step": 53673, "epoch": 1277} {"train_loss": -5.659897804260254, "global_step": 53674, "epoch": 1277} {"train_loss": -5.824344566890171, "global_step": 53675, "epoch": 1277, "val_loss": 61692.51953125} {"train_loss": -5.711391448974609, "global_step": 53676, "epoch": 1278} {"train_loss": -5.855829238891602, "global_step": 53677, "epoch": 1278} {"train_loss": -5.850205898284912, "global_step": 53678, "epoch": 1278} {"train_loss": -5.781366348266602, "global_step": 53679, "epoch": 1278} {"train_loss": -5.983638286590576, "global_step": 53680, "epoch": 1278} {"train_loss": -5.852193832397461, "global_step": 53681, "epoch": 1278} {"train_loss": -5.806036949157715, "global_step": 53682, "epoch": 1278} {"train_loss": -5.884591102600098, "global_step": 53683, "epoch": 1278} {"train_loss": -5.834236145019531, "global_step": 53684, "epoch": 1278} {"train_loss": -5.942377090454102, "global_step": 53685, "epoch": 1278} {"train_loss": -5.940382957458496, "global_step": 53686, "epoch": 1278} {"train_loss": -5.908005714416504, "global_step": 53687, "epoch": 1278} {"train_loss": -5.7595977783203125, "global_step": 53688, "epoch": 1278} {"train_loss": -5.776357650756836, "global_step": 53689, "epoch": 1278} {"train_loss": -5.670957565307617, "global_step": 53690, "epoch": 1278} {"train_loss": -5.930131912231445, "global_step": 53691, "epoch": 1278} {"train_loss": -5.738805770874023, "global_step": 53692, "epoch": 1278} {"train_loss": -5.7611165046691895, "global_step": 53693, "epoch": 1278} {"train_loss": -5.627752304077148, "global_step": 53694, "epoch": 1278} {"train_loss": -5.648833274841309, "global_step": 53695, "epoch": 1278} {"train_loss": -5.6943511962890625, "global_step": 53696, "epoch": 1278} {"train_loss": -5.771217346191406, "global_step": 53697, "epoch": 1278} {"train_loss": -5.5416646003723145, "global_step": 53698, "epoch": 1278} {"train_loss": -5.854228496551514, "global_step": 53699, "epoch": 1278} {"train_loss": -5.680246353149414, "global_step": 53700, "epoch": 1278} {"train_loss": -5.754300594329834, "global_step": 53701, "epoch": 1278} {"train_loss": -5.715191841125488, "global_step": 53702, "epoch": 1278} {"train_loss": -5.705456256866455, "global_step": 53703, "epoch": 1278} {"train_loss": -5.942841053009033, "global_step": 53704, "epoch": 1278} {"train_loss": -5.7785186767578125, "global_step": 53705, "epoch": 1278} {"train_loss": -5.803406715393066, "global_step": 53706, "epoch": 1278} {"train_loss": -5.775077819824219, "global_step": 53707, "epoch": 1278} {"train_loss": -5.866525173187256, "global_step": 53708, "epoch": 1278} {"train_loss": -5.76530647277832, "global_step": 53709, "epoch": 1278} {"train_loss": -5.771929740905762, "global_step": 53710, "epoch": 1278} {"train_loss": -5.7792768478393555, "global_step": 53711, "epoch": 1278} {"train_loss": -5.772037506103516, "global_step": 53712, "epoch": 1278} {"train_loss": -5.869537353515625, "global_step": 53713, "epoch": 1278} {"train_loss": -5.8417816162109375, "global_step": 53714, "epoch": 1278} {"train_loss": -5.683659553527832, "global_step": 53715, "epoch": 1278} {"train_loss": -5.696228504180908, "global_step": 53716, "epoch": 1278} {"train_loss": -5.792693660372779, "global_step": 53717, "epoch": 1278, "val_loss": 61411.5859375} {"train_loss": -5.821810722351074, "global_step": 53718, "epoch": 1279} {"train_loss": -5.802342891693115, "global_step": 53719, "epoch": 1279} {"train_loss": -5.892643451690674, "global_step": 53720, "epoch": 1279} {"train_loss": -5.827323913574219, "global_step": 53721, "epoch": 1279} {"train_loss": -5.808389186859131, "global_step": 53722, "epoch": 1279} {"train_loss": -5.934796333312988, "global_step": 53723, "epoch": 1279} {"train_loss": -5.728944778442383, "global_step": 53724, "epoch": 1279} {"train_loss": -5.8184075355529785, "global_step": 53725, "epoch": 1279} {"train_loss": -5.874361038208008, "global_step": 53726, "epoch": 1279} {"train_loss": -5.8883514404296875, "global_step": 53727, "epoch": 1279} {"train_loss": -5.818701267242432, "global_step": 53728, "epoch": 1279} {"train_loss": -5.801626205444336, "global_step": 53729, "epoch": 1279} {"train_loss": -5.865839958190918, "global_step": 53730, "epoch": 1279} {"train_loss": -5.800574779510498, "global_step": 53731, "epoch": 1279} {"train_loss": -5.6636881828308105, "global_step": 53732, "epoch": 1279} {"train_loss": -5.783472537994385, "global_step": 53733, "epoch": 1279} {"train_loss": -5.856847763061523, "global_step": 53734, "epoch": 1279} {"train_loss": -5.795831680297852, "global_step": 53735, "epoch": 1279} {"train_loss": -5.867131233215332, "global_step": 53736, "epoch": 1279} {"train_loss": -5.861503601074219, "global_step": 53737, "epoch": 1279} {"train_loss": -5.829640865325928, "global_step": 53738, "epoch": 1279} {"train_loss": -5.925937652587891, "global_step": 53739, "epoch": 1279} {"train_loss": -5.802949905395508, "global_step": 53740, "epoch": 1279} {"train_loss": -5.836993217468262, "global_step": 53741, "epoch": 1279} {"train_loss": -5.876289367675781, "global_step": 53742, "epoch": 1279} {"train_loss": -5.830540180206299, "global_step": 53743, "epoch": 1279} {"train_loss": -5.856113433837891, "global_step": 53744, "epoch": 1279} {"train_loss": -5.940293312072754, "global_step": 53745, "epoch": 1279} {"train_loss": -5.731614112854004, "global_step": 53746, "epoch": 1279} {"train_loss": -5.869755268096924, "global_step": 53747, "epoch": 1279} {"train_loss": -5.714509963989258, "global_step": 53748, "epoch": 1279} {"train_loss": -5.743447780609131, "global_step": 53749, "epoch": 1279} {"train_loss": -5.831252574920654, "global_step": 53750, "epoch": 1279} {"train_loss": -5.628360748291016, "global_step": 53751, "epoch": 1279} {"train_loss": -5.891848087310791, "global_step": 53752, "epoch": 1279} {"train_loss": -5.782049179077148, "global_step": 53753, "epoch": 1279} {"train_loss": -5.854940414428711, "global_step": 53754, "epoch": 1279} {"train_loss": -5.794506072998047, "global_step": 53755, "epoch": 1279} {"train_loss": -5.8035688400268555, "global_step": 53756, "epoch": 1279} {"train_loss": -5.877995014190674, "global_step": 53757, "epoch": 1279} {"train_loss": -5.821292877197266, "global_step": 53758, "epoch": 1279} {"train_loss": -5.8247224035717196, "global_step": 53759, "epoch": 1279, "val_loss": 61715.9140625} {"train_loss": -5.874344825744629, "global_step": 53760, "epoch": 1280} {"train_loss": -5.826544761657715, "global_step": 53761, "epoch": 1280} {"train_loss": -5.854057788848877, "global_step": 53762, "epoch": 1280} {"train_loss": -5.925754547119141, "global_step": 53763, "epoch": 1280} {"train_loss": -5.870429039001465, "global_step": 53764, "epoch": 1280} {"train_loss": -5.873627662658691, "global_step": 53765, "epoch": 1280} {"train_loss": -5.817634105682373, "global_step": 53766, "epoch": 1280} {"train_loss": -5.815814018249512, "global_step": 53767, "epoch": 1280} {"train_loss": -5.852278709411621, "global_step": 53768, "epoch": 1280} {"train_loss": -5.8274245262146, "global_step": 53769, "epoch": 1280} {"train_loss": -5.75558614730835, "global_step": 53770, "epoch": 1280} {"train_loss": -5.848300457000732, "global_step": 53771, "epoch": 1280} {"train_loss": -5.756965637207031, "global_step": 53772, "epoch": 1280} {"train_loss": -5.836147308349609, "global_step": 53773, "epoch": 1280} {"train_loss": -5.973663806915283, "global_step": 53774, "epoch": 1280} {"train_loss": -5.8731303215026855, "global_step": 53775, "epoch": 1280} {"train_loss": -5.816351890563965, "global_step": 53776, "epoch": 1280} {"train_loss": -5.931898593902588, "global_step": 53777, "epoch": 1280} {"train_loss": -5.8409271240234375, "global_step": 53778, "epoch": 1280} {"train_loss": -5.820505142211914, "global_step": 53779, "epoch": 1280} {"train_loss": -5.860992431640625, "global_step": 53780, "epoch": 1280} {"train_loss": -5.730413913726807, "global_step": 53781, "epoch": 1280} {"train_loss": -5.687068939208984, "global_step": 53782, "epoch": 1280} {"train_loss": -5.870038986206055, "global_step": 53783, "epoch": 1280} {"train_loss": -5.857460975646973, "global_step": 53784, "epoch": 1280} {"train_loss": -5.848654747009277, "global_step": 53785, "epoch": 1280} {"train_loss": -5.789163589477539, "global_step": 53786, "epoch": 1280} {"train_loss": -5.858245849609375, "global_step": 53787, "epoch": 1280} {"train_loss": -5.9039788246154785, "global_step": 53788, "epoch": 1280} {"train_loss": -5.87271785736084, "global_step": 53789, "epoch": 1280} {"train_loss": -5.823085308074951, "global_step": 53790, "epoch": 1280} {"train_loss": -5.901873588562012, "global_step": 53791, "epoch": 1280} {"train_loss": -5.752253532409668, "global_step": 53792, "epoch": 1280} {"train_loss": -5.967689514160156, "global_step": 53793, "epoch": 1280} {"train_loss": -5.82042932510376, "global_step": 53794, "epoch": 1280} {"train_loss": -5.843916893005371, "global_step": 53795, "epoch": 1280} {"train_loss": -5.715845108032227, "global_step": 53796, "epoch": 1280} {"train_loss": -5.763978481292725, "global_step": 53797, "epoch": 1280} {"train_loss": -5.883423805236816, "global_step": 53798, "epoch": 1280} {"train_loss": -5.898221015930176, "global_step": 53799, "epoch": 1280} {"train_loss": -5.963920593261719, "global_step": 53800, "epoch": 1280} {"train_loss": -5.84352920168922, "global_step": 53801, "epoch": 1280, "val_loss": 61282.4609375} {"train_loss": -5.920405387878418, "global_step": 53802, "epoch": 1281} {"train_loss": -5.928994655609131, "global_step": 53803, "epoch": 1281} {"train_loss": -5.784852981567383, "global_step": 53804, "epoch": 1281} {"train_loss": -5.860404968261719, "global_step": 53805, "epoch": 1281} {"train_loss": -5.789599418640137, "global_step": 53806, "epoch": 1281} {"train_loss": -5.832970142364502, "global_step": 53807, "epoch": 1281} {"train_loss": -5.814187049865723, "global_step": 53808, "epoch": 1281} {"train_loss": -5.834835529327393, "global_step": 53809, "epoch": 1281} {"train_loss": -5.775751113891602, "global_step": 53810, "epoch": 1281} {"train_loss": -5.820510387420654, "global_step": 53811, "epoch": 1281} {"train_loss": -5.788045406341553, "global_step": 53812, "epoch": 1281} {"train_loss": -5.885700225830078, "global_step": 53813, "epoch": 1281} {"train_loss": -5.771956920623779, "global_step": 53814, "epoch": 1281} {"train_loss": -5.872531890869141, "global_step": 53815, "epoch": 1281} {"train_loss": -5.957496166229248, "global_step": 53816, "epoch": 1281} {"train_loss": -5.892671585083008, "global_step": 53817, "epoch": 1281} {"train_loss": -5.892417907714844, "global_step": 53818, "epoch": 1281} {"train_loss": -5.7939958572387695, "global_step": 53819, "epoch": 1281} {"train_loss": -5.812507629394531, "global_step": 53820, "epoch": 1281} {"train_loss": -5.733821868896484, "global_step": 53821, "epoch": 1281} {"train_loss": -5.8729400634765625, "global_step": 53822, "epoch": 1281} {"train_loss": -5.798069477081299, "global_step": 53823, "epoch": 1281} {"train_loss": -5.757482051849365, "global_step": 53824, "epoch": 1281} {"train_loss": -5.883584022521973, "global_step": 53825, "epoch": 1281} {"train_loss": -5.888439178466797, "global_step": 53826, "epoch": 1281} {"train_loss": -5.802797317504883, "global_step": 53827, "epoch": 1281} {"train_loss": -5.945021629333496, "global_step": 53828, "epoch": 1281} {"train_loss": -5.891778469085693, "global_step": 53829, "epoch": 1281} {"train_loss": -5.7867279052734375, "global_step": 53830, "epoch": 1281} {"train_loss": -5.909092426300049, "global_step": 53831, "epoch": 1281} {"train_loss": -5.928418159484863, "global_step": 53832, "epoch": 1281} {"train_loss": -5.835184097290039, "global_step": 53833, "epoch": 1281} {"train_loss": -5.879268646240234, "global_step": 53834, "epoch": 1281} {"train_loss": -5.69155216217041, "global_step": 53835, "epoch": 1281} {"train_loss": -5.750694274902344, "global_step": 53836, "epoch": 1281} {"train_loss": -5.965624809265137, "global_step": 53837, "epoch": 1281} {"train_loss": -5.840570449829102, "global_step": 53838, "epoch": 1281} {"train_loss": -5.81219482421875, "global_step": 53839, "epoch": 1281} {"train_loss": -5.90906286239624, "global_step": 53840, "epoch": 1281} {"train_loss": -5.908624172210693, "global_step": 53841, "epoch": 1281} {"train_loss": -5.85926628112793, "global_step": 53842, "epoch": 1281} {"train_loss": -5.842469011034284, "global_step": 53843, "epoch": 1281, "val_loss": 61483.96875} {"train_loss": -5.754643440246582, "global_step": 53844, "epoch": 1282} {"train_loss": -5.739959716796875, "global_step": 53845, "epoch": 1282} {"train_loss": -5.655177593231201, "global_step": 53846, "epoch": 1282} {"train_loss": -5.755258083343506, "global_step": 53847, "epoch": 1282} {"train_loss": -5.958955764770508, "global_step": 53848, "epoch": 1282} {"train_loss": -5.750750541687012, "global_step": 53849, "epoch": 1282} {"train_loss": -5.798651218414307, "global_step": 53850, "epoch": 1282} {"train_loss": -5.774118900299072, "global_step": 53851, "epoch": 1282} {"train_loss": -5.811794281005859, "global_step": 53852, "epoch": 1282} {"train_loss": -5.958492279052734, "global_step": 53853, "epoch": 1282} {"train_loss": -5.846223831176758, "global_step": 53854, "epoch": 1282} {"train_loss": -5.922108173370361, "global_step": 53855, "epoch": 1282} {"train_loss": -5.963812351226807, "global_step": 53856, "epoch": 1282} {"train_loss": -5.90403413772583, "global_step": 53857, "epoch": 1282} {"train_loss": -5.84299898147583, "global_step": 53858, "epoch": 1282} {"train_loss": -5.873061180114746, "global_step": 53859, "epoch": 1282} {"train_loss": -5.708827018737793, "global_step": 53860, "epoch": 1282} {"train_loss": -5.848243713378906, "global_step": 53861, "epoch": 1282} {"train_loss": -5.763082504272461, "global_step": 53862, "epoch": 1282} {"train_loss": -5.7075910568237305, "global_step": 53863, "epoch": 1282} {"train_loss": -5.795921325683594, "global_step": 53864, "epoch": 1282} {"train_loss": -5.821490287780762, "global_step": 53865, "epoch": 1282} {"train_loss": -5.813939094543457, "global_step": 53866, "epoch": 1282} {"train_loss": -5.852321147918701, "global_step": 53867, "epoch": 1282} {"train_loss": -5.782622337341309, "global_step": 53868, "epoch": 1282} {"train_loss": -5.832610130310059, "global_step": 53869, "epoch": 1282} {"train_loss": -5.818233489990234, "global_step": 53870, "epoch": 1282} {"train_loss": -5.855878829956055, "global_step": 53871, "epoch": 1282} {"train_loss": -5.813946723937988, "global_step": 53872, "epoch": 1282} {"train_loss": -5.8155670166015625, "global_step": 53873, "epoch": 1282} {"train_loss": -5.715848922729492, "global_step": 53874, "epoch": 1282} {"train_loss": -5.801914691925049, "global_step": 53875, "epoch": 1282} {"train_loss": -5.863690376281738, "global_step": 53876, "epoch": 1282} {"train_loss": -5.893310070037842, "global_step": 53877, "epoch": 1282} {"train_loss": -5.927908897399902, "global_step": 53878, "epoch": 1282} {"train_loss": -5.798418045043945, "global_step": 53879, "epoch": 1282} {"train_loss": -5.894732475280762, "global_step": 53880, "epoch": 1282} {"train_loss": -5.777585983276367, "global_step": 53881, "epoch": 1282} {"train_loss": -5.867617607116699, "global_step": 53882, "epoch": 1282} {"train_loss": -5.754279613494873, "global_step": 53883, "epoch": 1282} {"train_loss": -5.957792282104492, "global_step": 53884, "epoch": 1282} {"train_loss": -5.8256516343071345, "global_step": 53885, "epoch": 1282, "val_loss": 61640.20703125} {"train_loss": -5.75340461730957, "global_step": 53886, "epoch": 1283} {"train_loss": -5.828940391540527, "global_step": 53887, "epoch": 1283} {"train_loss": -5.886882305145264, "global_step": 53888, "epoch": 1283} {"train_loss": -5.826507568359375, "global_step": 53889, "epoch": 1283} {"train_loss": -5.8295369148254395, "global_step": 53890, "epoch": 1283} {"train_loss": -5.830175399780273, "global_step": 53891, "epoch": 1283} {"train_loss": -5.713053226470947, "global_step": 53892, "epoch": 1283} {"train_loss": -5.800846099853516, "global_step": 53893, "epoch": 1283} {"train_loss": -5.8125834465026855, "global_step": 53894, "epoch": 1283} {"train_loss": -5.803833961486816, "global_step": 53895, "epoch": 1283} {"train_loss": -5.843329429626465, "global_step": 53896, "epoch": 1283} {"train_loss": -5.806247711181641, "global_step": 53897, "epoch": 1283} {"train_loss": -5.821772575378418, "global_step": 53898, "epoch": 1283} {"train_loss": -5.733694076538086, "global_step": 53899, "epoch": 1283} {"train_loss": -5.805218696594238, "global_step": 53900, "epoch": 1283} {"train_loss": -5.855752468109131, "global_step": 53901, "epoch": 1283} {"train_loss": -5.828747272491455, "global_step": 53902, "epoch": 1283} {"train_loss": -5.859064102172852, "global_step": 53903, "epoch": 1283} {"train_loss": -5.8708577156066895, "global_step": 53904, "epoch": 1283} {"train_loss": -5.847329616546631, "global_step": 53905, "epoch": 1283} {"train_loss": -5.806536674499512, "global_step": 53906, "epoch": 1283} {"train_loss": -5.852931022644043, "global_step": 53907, "epoch": 1283} {"train_loss": -5.7597856521606445, "global_step": 53908, "epoch": 1283} {"train_loss": -5.983893871307373, "global_step": 53909, "epoch": 1283} {"train_loss": -5.824500560760498, "global_step": 53910, "epoch": 1283} {"train_loss": -5.895316123962402, "global_step": 53911, "epoch": 1283} {"train_loss": -5.82863712310791, "global_step": 53912, "epoch": 1283} {"train_loss": -5.9176130294799805, "global_step": 53913, "epoch": 1283} {"train_loss": -5.8360490798950195, "global_step": 53914, "epoch": 1283} {"train_loss": -5.974621772766113, "global_step": 53915, "epoch": 1283} {"train_loss": -5.825549125671387, "global_step": 53916, "epoch": 1283} {"train_loss": -5.908163070678711, "global_step": 53917, "epoch": 1283} {"train_loss": -5.871212959289551, "global_step": 53918, "epoch": 1283} {"train_loss": -5.768840789794922, "global_step": 53919, "epoch": 1283} {"train_loss": -5.832582473754883, "global_step": 53920, "epoch": 1283} {"train_loss": -5.915339469909668, "global_step": 53921, "epoch": 1283} {"train_loss": -5.936156272888184, "global_step": 53922, "epoch": 1283} {"train_loss": -5.911314964294434, "global_step": 53923, "epoch": 1283} {"train_loss": -5.960738182067871, "global_step": 53924, "epoch": 1283} {"train_loss": -5.732647895812988, "global_step": 53925, "epoch": 1283} {"train_loss": -5.805501937866211, "global_step": 53926, "epoch": 1283} {"train_loss": -5.841805208297003, "global_step": 53927, "epoch": 1283, "val_loss": 61665.09375} {"train_loss": -5.732879638671875, "global_step": 53928, "epoch": 1284} {"train_loss": -5.975225448608398, "global_step": 53929, "epoch": 1284} {"train_loss": -5.737907886505127, "global_step": 53930, "epoch": 1284} {"train_loss": -5.715777397155762, "global_step": 53931, "epoch": 1284} {"train_loss": -5.807263374328613, "global_step": 53932, "epoch": 1284} {"train_loss": -5.829538345336914, "global_step": 53933, "epoch": 1284} {"train_loss": -5.751279830932617, "global_step": 53934, "epoch": 1284} {"train_loss": -5.823434829711914, "global_step": 53935, "epoch": 1284} {"train_loss": -5.968896389007568, "global_step": 53936, "epoch": 1284} {"train_loss": -5.734864234924316, "global_step": 53937, "epoch": 1284} {"train_loss": -5.769872665405273, "global_step": 53938, "epoch": 1284} {"train_loss": -5.863483428955078, "global_step": 53939, "epoch": 1284} {"train_loss": -5.803562164306641, "global_step": 53940, "epoch": 1284} {"train_loss": -5.880744934082031, "global_step": 53941, "epoch": 1284} {"train_loss": -5.9275946617126465, "global_step": 53942, "epoch": 1284} {"train_loss": -5.8383660316467285, "global_step": 53943, "epoch": 1284} {"train_loss": -5.766587257385254, "global_step": 53944, "epoch": 1284} {"train_loss": -5.928741455078125, "global_step": 53945, "epoch": 1284} {"train_loss": -5.772119045257568, "global_step": 53946, "epoch": 1284} {"train_loss": -5.9147443771362305, "global_step": 53947, "epoch": 1284} {"train_loss": -5.864226341247559, "global_step": 53948, "epoch": 1284} {"train_loss": -5.776507377624512, "global_step": 53949, "epoch": 1284} {"train_loss": -5.867775917053223, "global_step": 53950, "epoch": 1284} {"train_loss": -5.880788326263428, "global_step": 53951, "epoch": 1284} {"train_loss": -5.800881385803223, "global_step": 53952, "epoch": 1284} {"train_loss": -5.870122909545898, "global_step": 53953, "epoch": 1284} {"train_loss": -5.782721996307373, "global_step": 53954, "epoch": 1284} {"train_loss": -5.707253932952881, "global_step": 53955, "epoch": 1284} {"train_loss": -5.971675872802734, "global_step": 53956, "epoch": 1284} {"train_loss": -5.904236793518066, "global_step": 53957, "epoch": 1284} {"train_loss": -5.850238800048828, "global_step": 53958, "epoch": 1284} {"train_loss": -5.777256011962891, "global_step": 53959, "epoch": 1284} {"train_loss": -5.758434295654297, "global_step": 53960, "epoch": 1284} {"train_loss": -5.774910926818848, "global_step": 53961, "epoch": 1284} {"train_loss": -5.9051127433776855, "global_step": 53962, "epoch": 1284} {"train_loss": -5.805030345916748, "global_step": 53963, "epoch": 1284} {"train_loss": -5.670007705688477, "global_step": 53964, "epoch": 1284} {"train_loss": -5.873289108276367, "global_step": 53965, "epoch": 1284} {"train_loss": -5.943869590759277, "global_step": 53966, "epoch": 1284} {"train_loss": -5.937978744506836, "global_step": 53967, "epoch": 1284} {"train_loss": -5.830061912536621, "global_step": 53968, "epoch": 1284} {"train_loss": -5.83213920820327, "global_step": 53969, "epoch": 1284, "val_loss": 61332.0234375} {"train_loss": -5.917828559875488, "global_step": 53970, "epoch": 1285} {"train_loss": -5.8245038986206055, "global_step": 53971, "epoch": 1285} {"train_loss": -5.824583053588867, "global_step": 53972, "epoch": 1285} {"train_loss": -5.729098320007324, "global_step": 53973, "epoch": 1285} {"train_loss": -5.725836753845215, "global_step": 53974, "epoch": 1285} {"train_loss": -5.788317680358887, "global_step": 53975, "epoch": 1285} {"train_loss": -5.875125885009766, "global_step": 53976, "epoch": 1285} {"train_loss": -5.812748432159424, "global_step": 53977, "epoch": 1285} {"train_loss": -5.861339569091797, "global_step": 53978, "epoch": 1285} {"train_loss": -5.786679267883301, "global_step": 53979, "epoch": 1285} {"train_loss": -5.8528733253479, "global_step": 53980, "epoch": 1285} {"train_loss": -5.904641151428223, "global_step": 53981, "epoch": 1285} {"train_loss": -5.779825210571289, "global_step": 53982, "epoch": 1285} {"train_loss": -5.861144542694092, "global_step": 53983, "epoch": 1285} {"train_loss": -6.033403396606445, "global_step": 53984, "epoch": 1285} {"train_loss": -5.88673734664917, "global_step": 53985, "epoch": 1285} {"train_loss": -5.907229900360107, "global_step": 53986, "epoch": 1285} {"train_loss": -5.874091148376465, "global_step": 53987, "epoch": 1285} {"train_loss": -5.857127666473389, "global_step": 53988, "epoch": 1285} {"train_loss": -5.934013366699219, "global_step": 53989, "epoch": 1285} {"train_loss": -5.780243873596191, "global_step": 53990, "epoch": 1285} {"train_loss": -5.885927677154541, "global_step": 53991, "epoch": 1285} {"train_loss": -5.915164470672607, "global_step": 53992, "epoch": 1285} {"train_loss": -5.912191390991211, "global_step": 53993, "epoch": 1285} {"train_loss": -5.830599784851074, "global_step": 53994, "epoch": 1285} {"train_loss": -5.928869247436523, "global_step": 53995, "epoch": 1285} {"train_loss": -5.79850959777832, "global_step": 53996, "epoch": 1285} {"train_loss": -5.916067123413086, "global_step": 53997, "epoch": 1285} {"train_loss": -5.725672245025635, "global_step": 53998, "epoch": 1285} {"train_loss": -5.716893672943115, "global_step": 53999, "epoch": 1285} {"train_loss": -5.937128067016602, "global_step": 54000, "epoch": 1285} {"train_loss": -5.815612316131592, "global_step": 54001, "epoch": 1285} {"train_loss": -5.742281436920166, "global_step": 54002, "epoch": 1285} {"train_loss": -5.860690116882324, "global_step": 54003, "epoch": 1285} {"train_loss": -5.855408668518066, "global_step": 54004, "epoch": 1285} {"train_loss": -5.697854518890381, "global_step": 54005, "epoch": 1285} {"train_loss": -5.873011589050293, "global_step": 54006, "epoch": 1285} {"train_loss": -5.841097831726074, "global_step": 54007, "epoch": 1285} {"train_loss": -5.810361385345459, "global_step": 54008, "epoch": 1285} {"train_loss": -5.766702651977539, "global_step": 54009, "epoch": 1285} {"train_loss": -5.8711395263671875, "global_step": 54010, "epoch": 1285} {"train_loss": -5.840458495276315, "global_step": 54011, "epoch": 1285, "val_loss": 61257.69921875} {"train_loss": -5.744675159454346, "global_step": 54012, "epoch": 1286} {"train_loss": -5.9028472900390625, "global_step": 54013, "epoch": 1286} {"train_loss": -5.830957889556885, "global_step": 54014, "epoch": 1286} {"train_loss": -5.912078857421875, "global_step": 54015, "epoch": 1286} {"train_loss": -5.819817543029785, "global_step": 54016, "epoch": 1286} {"train_loss": -5.886299133300781, "global_step": 54017, "epoch": 1286} {"train_loss": -5.906634330749512, "global_step": 54018, "epoch": 1286} {"train_loss": -5.784632682800293, "global_step": 54019, "epoch": 1286} {"train_loss": -5.790767669677734, "global_step": 54020, "epoch": 1286} {"train_loss": -5.877246856689453, "global_step": 54021, "epoch": 1286} {"train_loss": -5.797248363494873, "global_step": 54022, "epoch": 1286} {"train_loss": -5.639591217041016, "global_step": 54023, "epoch": 1286} {"train_loss": -5.838720321655273, "global_step": 54024, "epoch": 1286} {"train_loss": -5.863358497619629, "global_step": 54025, "epoch": 1286} {"train_loss": -5.919105529785156, "global_step": 54026, "epoch": 1286} {"train_loss": -5.823356628417969, "global_step": 54027, "epoch": 1286} {"train_loss": -5.747253894805908, "global_step": 54028, "epoch": 1286} {"train_loss": -5.892012119293213, "global_step": 54029, "epoch": 1286} {"train_loss": -5.732810974121094, "global_step": 54030, "epoch": 1286} {"train_loss": -5.851004600524902, "global_step": 54031, "epoch": 1286} {"train_loss": -5.829217910766602, "global_step": 54032, "epoch": 1286} {"train_loss": -5.936538219451904, "global_step": 54033, "epoch": 1286} {"train_loss": -5.77984094619751, "global_step": 54034, "epoch": 1286} {"train_loss": -5.896064758300781, "global_step": 54035, "epoch": 1286} {"train_loss": -5.906007766723633, "global_step": 54036, "epoch": 1286} {"train_loss": -5.7584028244018555, "global_step": 54037, "epoch": 1286} {"train_loss": -5.900048732757568, "global_step": 54038, "epoch": 1286} {"train_loss": -5.793962001800537, "global_step": 54039, "epoch": 1286} {"train_loss": -5.837958335876465, "global_step": 54040, "epoch": 1286} {"train_loss": -5.868777751922607, "global_step": 54041, "epoch": 1286} {"train_loss": -5.833619117736816, "global_step": 54042, "epoch": 1286} {"train_loss": -5.815457344055176, "global_step": 54043, "epoch": 1286} {"train_loss": -5.843152046203613, "global_step": 54044, "epoch": 1286} {"train_loss": -5.836777687072754, "global_step": 54045, "epoch": 1286} {"train_loss": -5.837318420410156, "global_step": 54046, "epoch": 1286} {"train_loss": -5.827858924865723, "global_step": 54047, "epoch": 1286} {"train_loss": -5.860844612121582, "global_step": 54048, "epoch": 1286} {"train_loss": -5.910998344421387, "global_step": 54049, "epoch": 1286} {"train_loss": -5.862668991088867, "global_step": 54050, "epoch": 1286} {"train_loss": -5.941166877746582, "global_step": 54051, "epoch": 1286} {"train_loss": -5.754682540893555, "global_step": 54052, "epoch": 1286} {"train_loss": -5.837908131735666, "global_step": 54053, "epoch": 1286, "val_loss": 61432.51953125} {"train_loss": -5.840090751647949, "global_step": 54054, "epoch": 1287} {"train_loss": -5.846035480499268, "global_step": 54055, "epoch": 1287} {"train_loss": -5.732327938079834, "global_step": 54056, "epoch": 1287} {"train_loss": -5.790292263031006, "global_step": 54057, "epoch": 1287} {"train_loss": -5.729039192199707, "global_step": 54058, "epoch": 1287} {"train_loss": -5.877467155456543, "global_step": 54059, "epoch": 1287} {"train_loss": -5.883081436157227, "global_step": 54060, "epoch": 1287} {"train_loss": -5.764253616333008, "global_step": 54061, "epoch": 1287} {"train_loss": -5.772976398468018, "global_step": 54062, "epoch": 1287} {"train_loss": -5.7327656745910645, "global_step": 54063, "epoch": 1287} {"train_loss": -5.7321367263793945, "global_step": 54064, "epoch": 1287} {"train_loss": -5.849823951721191, "global_step": 54065, "epoch": 1287} {"train_loss": -5.8411946296691895, "global_step": 54066, "epoch": 1287} {"train_loss": -5.753692150115967, "global_step": 54067, "epoch": 1287} {"train_loss": -5.780843257904053, "global_step": 54068, "epoch": 1287} {"train_loss": -5.797171115875244, "global_step": 54069, "epoch": 1287} {"train_loss": -5.634036064147949, "global_step": 54070, "epoch": 1287} {"train_loss": -5.983997344970703, "global_step": 54071, "epoch": 1287} {"train_loss": -5.743300437927246, "global_step": 54072, "epoch": 1287} {"train_loss": -5.797201156616211, "global_step": 54073, "epoch": 1287} {"train_loss": -5.751566410064697, "global_step": 54074, "epoch": 1287} {"train_loss": -5.901118278503418, "global_step": 54075, "epoch": 1287} {"train_loss": -5.8975677490234375, "global_step": 54076, "epoch": 1287} {"train_loss": -5.737924575805664, "global_step": 54077, "epoch": 1287} {"train_loss": -5.6342926025390625, "global_step": 54078, "epoch": 1287} {"train_loss": -5.6912841796875, "global_step": 54079, "epoch": 1287} {"train_loss": -5.842185020446777, "global_step": 54080, "epoch": 1287} {"train_loss": -5.795618534088135, "global_step": 54081, "epoch": 1287} {"train_loss": -5.921572685241699, "global_step": 54082, "epoch": 1287} {"train_loss": -5.945230484008789, "global_step": 54083, "epoch": 1287} {"train_loss": -5.700367450714111, "global_step": 54084, "epoch": 1287} {"train_loss": -5.805117607116699, "global_step": 54085, "epoch": 1287} {"train_loss": -5.864529609680176, "global_step": 54086, "epoch": 1287} {"train_loss": -5.694365501403809, "global_step": 54087, "epoch": 1287} {"train_loss": -5.962213516235352, "global_step": 54088, "epoch": 1287} {"train_loss": -5.756190776824951, "global_step": 54089, "epoch": 1287} {"train_loss": -5.87624454498291, "global_step": 54090, "epoch": 1287} {"train_loss": -5.8066229820251465, "global_step": 54091, "epoch": 1287} {"train_loss": -5.672460556030273, "global_step": 54092, "epoch": 1287} {"train_loss": -5.756641387939453, "global_step": 54093, "epoch": 1287} {"train_loss": -5.738651275634766, "global_step": 54094, "epoch": 1287} {"train_loss": -5.795688924335298, "global_step": 54095, "epoch": 1287, "val_loss": 61766.9453125} {"train_loss": -5.953424453735352, "global_step": 54096, "epoch": 1288} {"train_loss": -5.71054744720459, "global_step": 54097, "epoch": 1288} {"train_loss": -5.889950752258301, "global_step": 54098, "epoch": 1288} {"train_loss": -5.841001510620117, "global_step": 54099, "epoch": 1288} {"train_loss": -5.796326637268066, "global_step": 54100, "epoch": 1288} {"train_loss": -5.903925895690918, "global_step": 54101, "epoch": 1288} {"train_loss": -5.788603782653809, "global_step": 54102, "epoch": 1288} {"train_loss": -5.91724967956543, "global_step": 54103, "epoch": 1288} {"train_loss": -5.733531951904297, "global_step": 54104, "epoch": 1288} {"train_loss": -5.696905136108398, "global_step": 54105, "epoch": 1288} {"train_loss": -5.721632957458496, "global_step": 54106, "epoch": 1288} {"train_loss": -5.7472310066223145, "global_step": 54107, "epoch": 1288} {"train_loss": -5.805641174316406, "global_step": 54108, "epoch": 1288} {"train_loss": -5.793552398681641, "global_step": 54109, "epoch": 1288} {"train_loss": -5.8562541007995605, "global_step": 54110, "epoch": 1288} {"train_loss": -5.877514839172363, "global_step": 54111, "epoch": 1288} {"train_loss": -5.7937774658203125, "global_step": 54112, "epoch": 1288} {"train_loss": -5.836094856262207, "global_step": 54113, "epoch": 1288} {"train_loss": -5.74713659286499, "global_step": 54114, "epoch": 1288} {"train_loss": -5.841605186462402, "global_step": 54115, "epoch": 1288} {"train_loss": -5.727067470550537, "global_step": 54116, "epoch": 1288} {"train_loss": -5.961264133453369, "global_step": 54117, "epoch": 1288} {"train_loss": -5.863737106323242, "global_step": 54118, "epoch": 1288} {"train_loss": -5.800546169281006, "global_step": 54119, "epoch": 1288} {"train_loss": -5.870649337768555, "global_step": 54120, "epoch": 1288} {"train_loss": -5.878369331359863, "global_step": 54121, "epoch": 1288} {"train_loss": -5.9103522300720215, "global_step": 54122, "epoch": 1288} {"train_loss": -5.779799461364746, "global_step": 54123, "epoch": 1288} {"train_loss": -5.9034743309021, "global_step": 54124, "epoch": 1288} {"train_loss": -5.886000633239746, "global_step": 54125, "epoch": 1288} {"train_loss": -5.828461647033691, "global_step": 54126, "epoch": 1288} {"train_loss": -5.754944801330566, "global_step": 54127, "epoch": 1288} {"train_loss": -5.871399879455566, "global_step": 54128, "epoch": 1288} {"train_loss": -5.9452009201049805, "global_step": 54129, "epoch": 1288} {"train_loss": -5.837114334106445, "global_step": 54130, "epoch": 1288} {"train_loss": -5.875985145568848, "global_step": 54131, "epoch": 1288} {"train_loss": -5.926826477050781, "global_step": 54132, "epoch": 1288} {"train_loss": -5.757266044616699, "global_step": 54133, "epoch": 1288} {"train_loss": -5.936639785766602, "global_step": 54134, "epoch": 1288} {"train_loss": -5.85739278793335, "global_step": 54135, "epoch": 1288} {"train_loss": -5.692477703094482, "global_step": 54136, "epoch": 1288} {"train_loss": -5.829612834112985, "global_step": 54137, "epoch": 1288, "val_loss": 61659.55078125} {"train_loss": -5.923473358154297, "global_step": 54138, "epoch": 1289} {"train_loss": -5.872588634490967, "global_step": 54139, "epoch": 1289} {"train_loss": -5.720389366149902, "global_step": 54140, "epoch": 1289} {"train_loss": -5.75386381149292, "global_step": 54141, "epoch": 1289} {"train_loss": -5.862516403198242, "global_step": 54142, "epoch": 1289} {"train_loss": -5.679329872131348, "global_step": 54143, "epoch": 1289} {"train_loss": -5.75173807144165, "global_step": 54144, "epoch": 1289} {"train_loss": -5.829486846923828, "global_step": 54145, "epoch": 1289} {"train_loss": -5.904396057128906, "global_step": 54146, "epoch": 1289} {"train_loss": -5.854287624359131, "global_step": 54147, "epoch": 1289} {"train_loss": -5.702964782714844, "global_step": 54148, "epoch": 1289} {"train_loss": -5.819559574127197, "global_step": 54149, "epoch": 1289} {"train_loss": -5.816211700439453, "global_step": 54150, "epoch": 1289} {"train_loss": -5.756658554077148, "global_step": 54151, "epoch": 1289} {"train_loss": -5.89802885055542, "global_step": 54152, "epoch": 1289} {"train_loss": -5.766450881958008, "global_step": 54153, "epoch": 1289} {"train_loss": -5.816320419311523, "global_step": 54154, "epoch": 1289} {"train_loss": -5.938701629638672, "global_step": 54155, "epoch": 1289} {"train_loss": -5.9317498207092285, "global_step": 54156, "epoch": 1289} {"train_loss": -5.822422027587891, "global_step": 54157, "epoch": 1289} {"train_loss": -5.800482749938965, "global_step": 54158, "epoch": 1289} {"train_loss": -5.902052879333496, "global_step": 54159, "epoch": 1289} {"train_loss": -5.660524368286133, "global_step": 54160, "epoch": 1289} {"train_loss": -5.741232872009277, "global_step": 54161, "epoch": 1289} {"train_loss": -5.814073085784912, "global_step": 54162, "epoch": 1289} {"train_loss": -5.834169387817383, "global_step": 54163, "epoch": 1289} {"train_loss": -5.782037734985352, "global_step": 54164, "epoch": 1289} {"train_loss": -5.812023162841797, "global_step": 54165, "epoch": 1289} {"train_loss": -5.647065162658691, "global_step": 54166, "epoch": 1289} {"train_loss": -5.822777271270752, "global_step": 54167, "epoch": 1289} {"train_loss": -5.793065071105957, "global_step": 54168, "epoch": 1289} {"train_loss": -5.828704357147217, "global_step": 54169, "epoch": 1289} {"train_loss": -5.857202529907227, "global_step": 54170, "epoch": 1289} {"train_loss": -5.686515808105469, "global_step": 54171, "epoch": 1289} {"train_loss": -5.753457069396973, "global_step": 54172, "epoch": 1289} {"train_loss": -5.753559112548828, "global_step": 54173, "epoch": 1289} {"train_loss": -5.7069091796875, "global_step": 54174, "epoch": 1289} {"train_loss": -5.924160003662109, "global_step": 54175, "epoch": 1289} {"train_loss": -5.639609336853027, "global_step": 54176, "epoch": 1289} {"train_loss": -5.759298324584961, "global_step": 54177, "epoch": 1289} {"train_loss": -5.801198959350586, "global_step": 54178, "epoch": 1289} {"train_loss": -5.800659929003034, "global_step": 54179, "epoch": 1289, "val_loss": 61411.25390625} {"train_loss": -5.742894649505615, "global_step": 54180, "epoch": 1290} {"train_loss": -5.910907745361328, "global_step": 54181, "epoch": 1290} {"train_loss": -5.8661041259765625, "global_step": 54182, "epoch": 1290} {"train_loss": -5.817707061767578, "global_step": 54183, "epoch": 1290} {"train_loss": -5.837508201599121, "global_step": 54184, "epoch": 1290} {"train_loss": -5.735541820526123, "global_step": 54185, "epoch": 1290} {"train_loss": -5.847438812255859, "global_step": 54186, "epoch": 1290} {"train_loss": -5.840389251708984, "global_step": 54187, "epoch": 1290} {"train_loss": -5.877498626708984, "global_step": 54188, "epoch": 1290} {"train_loss": -5.807280540466309, "global_step": 54189, "epoch": 1290} {"train_loss": -5.89124059677124, "global_step": 54190, "epoch": 1290} {"train_loss": -5.717220306396484, "global_step": 54191, "epoch": 1290} {"train_loss": -5.809726715087891, "global_step": 54192, "epoch": 1290} {"train_loss": -5.804768085479736, "global_step": 54193, "epoch": 1290} {"train_loss": -5.744400978088379, "global_step": 54194, "epoch": 1290} {"train_loss": -5.754117012023926, "global_step": 54195, "epoch": 1290} {"train_loss": -5.794450759887695, "global_step": 54196, "epoch": 1290} {"train_loss": -5.7423014640808105, "global_step": 54197, "epoch": 1290} {"train_loss": -5.8236541748046875, "global_step": 54198, "epoch": 1290} {"train_loss": -5.68038272857666, "global_step": 54199, "epoch": 1290} {"train_loss": -5.734623908996582, "global_step": 54200, "epoch": 1290} {"train_loss": -5.848274230957031, "global_step": 54201, "epoch": 1290} {"train_loss": -5.767467498779297, "global_step": 54202, "epoch": 1290} {"train_loss": -5.872429847717285, "global_step": 54203, "epoch": 1290} {"train_loss": -5.789453506469727, "global_step": 54204, "epoch": 1290} {"train_loss": -5.898682594299316, "global_step": 54205, "epoch": 1290} {"train_loss": -5.753963470458984, "global_step": 54206, "epoch": 1290} {"train_loss": -5.821913719177246, "global_step": 54207, "epoch": 1290} {"train_loss": -5.923342227935791, "global_step": 54208, "epoch": 1290} {"train_loss": -5.799808502197266, "global_step": 54209, "epoch": 1290} {"train_loss": -5.886433124542236, "global_step": 54210, "epoch": 1290} {"train_loss": -5.854893207550049, "global_step": 54211, "epoch": 1290} {"train_loss": -5.785688877105713, "global_step": 54212, "epoch": 1290} {"train_loss": -5.715756416320801, "global_step": 54213, "epoch": 1290} {"train_loss": -5.866778373718262, "global_step": 54214, "epoch": 1290} {"train_loss": -5.682950973510742, "global_step": 54215, "epoch": 1290} {"train_loss": -5.847944259643555, "global_step": 54216, "epoch": 1290} {"train_loss": -5.708732604980469, "global_step": 54217, "epoch": 1290} {"train_loss": -5.782817840576172, "global_step": 54218, "epoch": 1290} {"train_loss": -5.865116119384766, "global_step": 54219, "epoch": 1290} {"train_loss": -5.838438034057617, "global_step": 54220, "epoch": 1290} {"train_loss": -5.805653129305158, "global_step": 54221, "epoch": 1290, "val_loss": 61693.796875} {"train_loss": -5.7768235206604, "global_step": 54222, "epoch": 1291} {"train_loss": -5.921886444091797, "global_step": 54223, "epoch": 1291} {"train_loss": -5.886754512786865, "global_step": 54224, "epoch": 1291} {"train_loss": -5.742918014526367, "global_step": 54225, "epoch": 1291} {"train_loss": -5.797579765319824, "global_step": 54226, "epoch": 1291} {"train_loss": -5.856509208679199, "global_step": 54227, "epoch": 1291} {"train_loss": -5.7615861892700195, "global_step": 54228, "epoch": 1291} {"train_loss": -5.770042419433594, "global_step": 54229, "epoch": 1291} {"train_loss": -5.88470458984375, "global_step": 54230, "epoch": 1291} {"train_loss": -5.904152870178223, "global_step": 54231, "epoch": 1291} {"train_loss": -5.802180290222168, "global_step": 54232, "epoch": 1291} {"train_loss": -5.884413242340088, "global_step": 54233, "epoch": 1291} {"train_loss": -5.726499080657959, "global_step": 54234, "epoch": 1291} {"train_loss": -5.964311122894287, "global_step": 54235, "epoch": 1291} {"train_loss": -5.754063606262207, "global_step": 54236, "epoch": 1291} {"train_loss": -5.785950660705566, "global_step": 54237, "epoch": 1291} {"train_loss": -5.77015495300293, "global_step": 54238, "epoch": 1291} {"train_loss": -5.817873001098633, "global_step": 54239, "epoch": 1291} {"train_loss": -6.008622169494629, "global_step": 54240, "epoch": 1291} {"train_loss": -5.888164520263672, "global_step": 54241, "epoch": 1291} {"train_loss": -5.781271934509277, "global_step": 54242, "epoch": 1291} {"train_loss": -5.84492301940918, "global_step": 54243, "epoch": 1291} {"train_loss": -5.911009311676025, "global_step": 54244, "epoch": 1291} {"train_loss": -5.941882133483887, "global_step": 54245, "epoch": 1291} {"train_loss": -5.910057067871094, "global_step": 54246, "epoch": 1291} {"train_loss": -5.762155532836914, "global_step": 54247, "epoch": 1291} {"train_loss": -5.869518280029297, "global_step": 54248, "epoch": 1291} {"train_loss": -5.856204986572266, "global_step": 54249, "epoch": 1291} {"train_loss": -5.723215103149414, "global_step": 54250, "epoch": 1291} {"train_loss": -5.771932125091553, "global_step": 54251, "epoch": 1291} {"train_loss": -5.822797775268555, "global_step": 54252, "epoch": 1291} {"train_loss": -5.8580474853515625, "global_step": 54253, "epoch": 1291} {"train_loss": -5.797060966491699, "global_step": 54254, "epoch": 1291} {"train_loss": -5.625962734222412, "global_step": 54255, "epoch": 1291} {"train_loss": -5.842883110046387, "global_step": 54256, "epoch": 1291} {"train_loss": -5.742560386657715, "global_step": 54257, "epoch": 1291} {"train_loss": -5.854512691497803, "global_step": 54258, "epoch": 1291} {"train_loss": -5.740015029907227, "global_step": 54259, "epoch": 1291} {"train_loss": -5.654696464538574, "global_step": 54260, "epoch": 1291} {"train_loss": -5.756041526794434, "global_step": 54261, "epoch": 1291} {"train_loss": -5.687160491943359, "global_step": 54262, "epoch": 1291} {"train_loss": -5.813626153128488, "global_step": 54263, "epoch": 1291, "val_loss": 61406.39453125} {"train_loss": -5.791165351867676, "global_step": 54264, "epoch": 1292} {"train_loss": -5.77455472946167, "global_step": 54265, "epoch": 1292} {"train_loss": -5.734983444213867, "global_step": 54266, "epoch": 1292} {"train_loss": -5.863052845001221, "global_step": 54267, "epoch": 1292} {"train_loss": -5.7629852294921875, "global_step": 54268, "epoch": 1292} {"train_loss": -5.727859020233154, "global_step": 54269, "epoch": 1292} {"train_loss": -5.83019495010376, "global_step": 54270, "epoch": 1292} {"train_loss": -5.800548076629639, "global_step": 54271, "epoch": 1292} {"train_loss": -5.866070747375488, "global_step": 54272, "epoch": 1292} {"train_loss": -5.7358903884887695, "global_step": 54273, "epoch": 1292} {"train_loss": -5.838250160217285, "global_step": 54274, "epoch": 1292} {"train_loss": -5.84881591796875, "global_step": 54275, "epoch": 1292} {"train_loss": -5.921611785888672, "global_step": 54276, "epoch": 1292} {"train_loss": -5.856132507324219, "global_step": 54277, "epoch": 1292} {"train_loss": -5.840166091918945, "global_step": 54278, "epoch": 1292} {"train_loss": -5.6769328117370605, "global_step": 54279, "epoch": 1292} {"train_loss": -5.747655868530273, "global_step": 54280, "epoch": 1292} {"train_loss": -5.783933639526367, "global_step": 54281, "epoch": 1292} {"train_loss": -5.851446151733398, "global_step": 54282, "epoch": 1292} {"train_loss": -5.822410583496094, "global_step": 54283, "epoch": 1292} {"train_loss": -5.817385673522949, "global_step": 54284, "epoch": 1292} {"train_loss": -5.823151588439941, "global_step": 54285, "epoch": 1292} {"train_loss": -5.9260663986206055, "global_step": 54286, "epoch": 1292} {"train_loss": -5.875938892364502, "global_step": 54287, "epoch": 1292} {"train_loss": -5.841489791870117, "global_step": 54288, "epoch": 1292} {"train_loss": -5.7331132888793945, "global_step": 54289, "epoch": 1292} {"train_loss": -5.923487186431885, "global_step": 54290, "epoch": 1292} {"train_loss": -5.859782695770264, "global_step": 54291, "epoch": 1292} {"train_loss": -5.855158805847168, "global_step": 54292, "epoch": 1292} {"train_loss": -5.702911853790283, "global_step": 54293, "epoch": 1292} {"train_loss": -5.815421104431152, "global_step": 54294, "epoch": 1292} {"train_loss": -5.847171306610107, "global_step": 54295, "epoch": 1292} {"train_loss": -5.918758869171143, "global_step": 54296, "epoch": 1292} {"train_loss": -5.934141635894775, "global_step": 54297, "epoch": 1292} {"train_loss": -5.887141227722168, "global_step": 54298, "epoch": 1292} {"train_loss": -5.808482646942139, "global_step": 54299, "epoch": 1292} {"train_loss": -5.892711639404297, "global_step": 54300, "epoch": 1292} {"train_loss": -5.832008361816406, "global_step": 54301, "epoch": 1292} {"train_loss": -5.87493896484375, "global_step": 54302, "epoch": 1292} {"train_loss": -5.840792179107666, "global_step": 54303, "epoch": 1292} {"train_loss": -5.663361549377441, "global_step": 54304, "epoch": 1292} {"train_loss": -5.825021017165411, "global_step": 54305, "epoch": 1292, "val_loss": 61582.71875} {"train_loss": -5.7975873947143555, "global_step": 54306, "epoch": 1293} {"train_loss": -5.566014289855957, "global_step": 54307, "epoch": 1293} {"train_loss": -5.856879711151123, "global_step": 54308, "epoch": 1293} {"train_loss": -5.790070533752441, "global_step": 54309, "epoch": 1293} {"train_loss": -5.89117956161499, "global_step": 54310, "epoch": 1293} {"train_loss": -5.942939758300781, "global_step": 54311, "epoch": 1293} {"train_loss": -5.67849063873291, "global_step": 54312, "epoch": 1293} {"train_loss": -5.764113426208496, "global_step": 54313, "epoch": 1293} {"train_loss": -5.612167835235596, "global_step": 54314, "epoch": 1293} {"train_loss": -5.872117042541504, "global_step": 54315, "epoch": 1293} {"train_loss": -5.963129043579102, "global_step": 54316, "epoch": 1293} {"train_loss": -5.836489200592041, "global_step": 54317, "epoch": 1293} {"train_loss": -5.855840682983398, "global_step": 54318, "epoch": 1293} {"train_loss": -5.694514274597168, "global_step": 54319, "epoch": 1293} {"train_loss": -5.775984287261963, "global_step": 54320, "epoch": 1293} {"train_loss": -5.829213619232178, "global_step": 54321, "epoch": 1293} {"train_loss": -5.804471969604492, "global_step": 54322, "epoch": 1293} {"train_loss": -5.803336143493652, "global_step": 54323, "epoch": 1293} {"train_loss": -5.731610298156738, "global_step": 54324, "epoch": 1293} {"train_loss": -5.8802809715271, "global_step": 54325, "epoch": 1293} {"train_loss": -5.683266639709473, "global_step": 54326, "epoch": 1293} {"train_loss": -5.8856987953186035, "global_step": 54327, "epoch": 1293} {"train_loss": -5.866644859313965, "global_step": 54328, "epoch": 1293} {"train_loss": -5.977617263793945, "global_step": 54329, "epoch": 1293} {"train_loss": -5.889721870422363, "global_step": 54330, "epoch": 1293} {"train_loss": -5.931349754333496, "global_step": 54331, "epoch": 1293} {"train_loss": -5.775546073913574, "global_step": 54332, "epoch": 1293} {"train_loss": -5.778993606567383, "global_step": 54333, "epoch": 1293} {"train_loss": -5.933545112609863, "global_step": 54334, "epoch": 1293} {"train_loss": -5.78511905670166, "global_step": 54335, "epoch": 1293} {"train_loss": -5.906991004943848, "global_step": 54336, "epoch": 1293} {"train_loss": -5.877158164978027, "global_step": 54337, "epoch": 1293} {"train_loss": -5.769495487213135, "global_step": 54338, "epoch": 1293} {"train_loss": -5.81599235534668, "global_step": 54339, "epoch": 1293} {"train_loss": -5.664292812347412, "global_step": 54340, "epoch": 1293} {"train_loss": -5.73439884185791, "global_step": 54341, "epoch": 1293} {"train_loss": -5.673642158508301, "global_step": 54342, "epoch": 1293} {"train_loss": -5.716588020324707, "global_step": 54343, "epoch": 1293} {"train_loss": -5.773715019226074, "global_step": 54344, "epoch": 1293} {"train_loss": -5.586187839508057, "global_step": 54345, "epoch": 1293} {"train_loss": -5.737767219543457, "global_step": 54346, "epoch": 1293} {"train_loss": -5.795735540844145, "global_step": 54347, "epoch": 1293, "val_loss": 61685.37109375} {"train_loss": -5.814079284667969, "global_step": 54348, "epoch": 1294} {"train_loss": -5.80050802230835, "global_step": 54349, "epoch": 1294} {"train_loss": -5.82381534576416, "global_step": 54350, "epoch": 1294} {"train_loss": -5.831751823425293, "global_step": 54351, "epoch": 1294} {"train_loss": -5.968808650970459, "global_step": 54352, "epoch": 1294} {"train_loss": -5.788336753845215, "global_step": 54353, "epoch": 1294} {"train_loss": -5.885852813720703, "global_step": 54354, "epoch": 1294} {"train_loss": -5.777832984924316, "global_step": 54355, "epoch": 1294} {"train_loss": -5.921796798706055, "global_step": 54356, "epoch": 1294} {"train_loss": -5.825712203979492, "global_step": 54357, "epoch": 1294} {"train_loss": -5.708911418914795, "global_step": 54358, "epoch": 1294} {"train_loss": -5.921772480010986, "global_step": 54359, "epoch": 1294} {"train_loss": -5.918015003204346, "global_step": 54360, "epoch": 1294} {"train_loss": -5.734314918518066, "global_step": 54361, "epoch": 1294} {"train_loss": -5.886749744415283, "global_step": 54362, "epoch": 1294} {"train_loss": -5.691886901855469, "global_step": 54363, "epoch": 1294} {"train_loss": -5.823844909667969, "global_step": 54364, "epoch": 1294} {"train_loss": -5.834728240966797, "global_step": 54365, "epoch": 1294} {"train_loss": -5.8509931564331055, "global_step": 54366, "epoch": 1294} {"train_loss": -5.753368377685547, "global_step": 54367, "epoch": 1294} {"train_loss": -5.853730201721191, "global_step": 54368, "epoch": 1294} {"train_loss": -5.852999687194824, "global_step": 54369, "epoch": 1294} {"train_loss": -5.844095706939697, "global_step": 54370, "epoch": 1294} {"train_loss": -5.846297264099121, "global_step": 54371, "epoch": 1294} {"train_loss": -5.842940330505371, "global_step": 54372, "epoch": 1294} {"train_loss": -5.833483695983887, "global_step": 54373, "epoch": 1294} {"train_loss": -5.823158264160156, "global_step": 54374, "epoch": 1294} {"train_loss": -5.884169101715088, "global_step": 54375, "epoch": 1294} {"train_loss": -5.750627517700195, "global_step": 54376, "epoch": 1294} {"train_loss": -5.834202766418457, "global_step": 54377, "epoch": 1294} {"train_loss": -5.843042373657227, "global_step": 54378, "epoch": 1294} {"train_loss": -5.796069145202637, "global_step": 54379, "epoch": 1294} {"train_loss": -5.731472969055176, "global_step": 54380, "epoch": 1294} {"train_loss": -5.78202486038208, "global_step": 54381, "epoch": 1294} {"train_loss": -5.878098487854004, "global_step": 54382, "epoch": 1294} {"train_loss": -5.650536060333252, "global_step": 54383, "epoch": 1294} {"train_loss": -5.888151168823242, "global_step": 54384, "epoch": 1294} {"train_loss": -5.7617692947387695, "global_step": 54385, "epoch": 1294} {"train_loss": -5.830487251281738, "global_step": 54386, "epoch": 1294} {"train_loss": -5.80849552154541, "global_step": 54387, "epoch": 1294} {"train_loss": -5.871740341186523, "global_step": 54388, "epoch": 1294} {"train_loss": -5.823598350797381, "global_step": 54389, "epoch": 1294, "val_loss": 61607.10546875} {"train_loss": -5.766510963439941, "global_step": 54390, "epoch": 1295} {"train_loss": -5.820278167724609, "global_step": 54391, "epoch": 1295} {"train_loss": -5.9234619140625, "global_step": 54392, "epoch": 1295} {"train_loss": -5.804405689239502, "global_step": 54393, "epoch": 1295} {"train_loss": -5.879479885101318, "global_step": 54394, "epoch": 1295} {"train_loss": -5.939217567443848, "global_step": 54395, "epoch": 1295} {"train_loss": -5.935937881469727, "global_step": 54396, "epoch": 1295} {"train_loss": -5.955726623535156, "global_step": 54397, "epoch": 1295} {"train_loss": -5.786919116973877, "global_step": 54398, "epoch": 1295} {"train_loss": -5.765825271606445, "global_step": 54399, "epoch": 1295} {"train_loss": -5.816018104553223, "global_step": 54400, "epoch": 1295} {"train_loss": -5.862548828125, "global_step": 54401, "epoch": 1295} {"train_loss": -5.795691013336182, "global_step": 54402, "epoch": 1295} {"train_loss": -5.850172519683838, "global_step": 54403, "epoch": 1295} {"train_loss": -5.856077194213867, "global_step": 54404, "epoch": 1295} {"train_loss": -5.885516166687012, "global_step": 54405, "epoch": 1295} {"train_loss": -5.7799482345581055, "global_step": 54406, "epoch": 1295} {"train_loss": -5.751324653625488, "global_step": 54407, "epoch": 1295} {"train_loss": -5.953760147094727, "global_step": 54408, "epoch": 1295} {"train_loss": -5.888408184051514, "global_step": 54409, "epoch": 1295} {"train_loss": -5.865092754364014, "global_step": 54410, "epoch": 1295} {"train_loss": -5.824923515319824, "global_step": 54411, "epoch": 1295} {"train_loss": -5.871889591217041, "global_step": 54412, "epoch": 1295} {"train_loss": -5.809057235717773, "global_step": 54413, "epoch": 1295} {"train_loss": -5.888320446014404, "global_step": 54414, "epoch": 1295} {"train_loss": -5.849933624267578, "global_step": 54415, "epoch": 1295} {"train_loss": -5.80036735534668, "global_step": 54416, "epoch": 1295} {"train_loss": -5.954388618469238, "global_step": 54417, "epoch": 1295} {"train_loss": -5.958542346954346, "global_step": 54418, "epoch": 1295} {"train_loss": -5.806933879852295, "global_step": 54419, "epoch": 1295} {"train_loss": -5.890311241149902, "global_step": 54420, "epoch": 1295} {"train_loss": -5.903812408447266, "global_step": 54421, "epoch": 1295} {"train_loss": -5.758676528930664, "global_step": 54422, "epoch": 1295} {"train_loss": -5.789511680603027, "global_step": 54423, "epoch": 1295} {"train_loss": -5.902791500091553, "global_step": 54424, "epoch": 1295} {"train_loss": -6.008909225463867, "global_step": 54425, "epoch": 1295} {"train_loss": -5.834395885467529, "global_step": 54426, "epoch": 1295} {"train_loss": -5.881943702697754, "global_step": 54427, "epoch": 1295} {"train_loss": -5.809335708618164, "global_step": 54428, "epoch": 1295} {"train_loss": -5.7842864990234375, "global_step": 54429, "epoch": 1295} {"train_loss": -5.799274444580078, "global_step": 54430, "epoch": 1295} {"train_loss": -5.852532307306926, "global_step": 54431, "epoch": 1295, "val_loss": 61586.296875} {"train_loss": -5.817473888397217, "global_step": 54432, "epoch": 1296} {"train_loss": -5.853900909423828, "global_step": 54433, "epoch": 1296} {"train_loss": -5.82438325881958, "global_step": 54434, "epoch": 1296} {"train_loss": -5.883995056152344, "global_step": 54435, "epoch": 1296} {"train_loss": -5.8112030029296875, "global_step": 54436, "epoch": 1296} {"train_loss": -5.8752241134643555, "global_step": 54437, "epoch": 1296} {"train_loss": -5.791171073913574, "global_step": 54438, "epoch": 1296} {"train_loss": -5.95139217376709, "global_step": 54439, "epoch": 1296} {"train_loss": -5.9010009765625, "global_step": 54440, "epoch": 1296} {"train_loss": -5.872413158416748, "global_step": 54441, "epoch": 1296} {"train_loss": -5.811049461364746, "global_step": 54442, "epoch": 1296} {"train_loss": -5.818069934844971, "global_step": 54443, "epoch": 1296} {"train_loss": -5.704049587249756, "global_step": 54444, "epoch": 1296} {"train_loss": -5.868435859680176, "global_step": 54445, "epoch": 1296} {"train_loss": -5.990096569061279, "global_step": 54446, "epoch": 1296} {"train_loss": -5.741240978240967, "global_step": 54447, "epoch": 1296} {"train_loss": -5.784811496734619, "global_step": 54448, "epoch": 1296} {"train_loss": -5.76629638671875, "global_step": 54449, "epoch": 1296} {"train_loss": -5.730834484100342, "global_step": 54450, "epoch": 1296} {"train_loss": -5.835903644561768, "global_step": 54451, "epoch": 1296} {"train_loss": -5.800843715667725, "global_step": 54452, "epoch": 1296} {"train_loss": -5.734504699707031, "global_step": 54453, "epoch": 1296} {"train_loss": -5.845944404602051, "global_step": 54454, "epoch": 1296} {"train_loss": -5.750515937805176, "global_step": 54455, "epoch": 1296} {"train_loss": -5.846271991729736, "global_step": 54456, "epoch": 1296} {"train_loss": -5.832002639770508, "global_step": 54457, "epoch": 1296} {"train_loss": -5.820573329925537, "global_step": 54458, "epoch": 1296} {"train_loss": -5.831144332885742, "global_step": 54459, "epoch": 1296} {"train_loss": -5.783193111419678, "global_step": 54460, "epoch": 1296} {"train_loss": -5.726174354553223, "global_step": 54461, "epoch": 1296} {"train_loss": -5.901470184326172, "global_step": 54462, "epoch": 1296} {"train_loss": -5.761478424072266, "global_step": 54463, "epoch": 1296} {"train_loss": -5.9253129959106445, "global_step": 54464, "epoch": 1296} {"train_loss": -5.7980852127075195, "global_step": 54465, "epoch": 1296} {"train_loss": -5.771714210510254, "global_step": 54466, "epoch": 1296} {"train_loss": -5.7897796630859375, "global_step": 54467, "epoch": 1296} {"train_loss": -5.773136138916016, "global_step": 54468, "epoch": 1296} {"train_loss": -5.779926776885986, "global_step": 54469, "epoch": 1296} {"train_loss": -5.896581649780273, "global_step": 54470, "epoch": 1296} {"train_loss": -5.970394134521484, "global_step": 54471, "epoch": 1296} {"train_loss": -5.929808616638184, "global_step": 54472, "epoch": 1296} {"train_loss": -5.828961077190581, "global_step": 54473, "epoch": 1296, "val_loss": 61252.10546875} {"train_loss": -5.926983833312988, "global_step": 54474, "epoch": 1297} {"train_loss": -5.947885513305664, "global_step": 54475, "epoch": 1297} {"train_loss": -5.715615749359131, "global_step": 54476, "epoch": 1297} {"train_loss": -5.837642669677734, "global_step": 54477, "epoch": 1297} {"train_loss": -5.8782806396484375, "global_step": 54478, "epoch": 1297} {"train_loss": -5.614127159118652, "global_step": 54479, "epoch": 1297} {"train_loss": -5.878071308135986, "global_step": 54480, "epoch": 1297} {"train_loss": -5.973358154296875, "global_step": 54481, "epoch": 1297} {"train_loss": -5.852607250213623, "global_step": 54482, "epoch": 1297} {"train_loss": -5.7909746170043945, "global_step": 54483, "epoch": 1297} {"train_loss": -5.866682052612305, "global_step": 54484, "epoch": 1297} {"train_loss": -5.880776405334473, "global_step": 54485, "epoch": 1297} {"train_loss": -5.8037614822387695, "global_step": 54486, "epoch": 1297} {"train_loss": -5.9111328125, "global_step": 54487, "epoch": 1297} {"train_loss": -5.970728397369385, "global_step": 54488, "epoch": 1297} {"train_loss": -5.666377067565918, "global_step": 54489, "epoch": 1297} {"train_loss": -5.7845306396484375, "global_step": 54490, "epoch": 1297} {"train_loss": -5.720710277557373, "global_step": 54491, "epoch": 1297} {"train_loss": -5.767112731933594, "global_step": 54492, "epoch": 1297} {"train_loss": -5.779738426208496, "global_step": 54493, "epoch": 1297} {"train_loss": -5.919541358947754, "global_step": 54494, "epoch": 1297} {"train_loss": -5.883472442626953, "global_step": 54495, "epoch": 1297} {"train_loss": -5.781947135925293, "global_step": 54496, "epoch": 1297} {"train_loss": -5.830043792724609, "global_step": 54497, "epoch": 1297} {"train_loss": -5.908442497253418, "global_step": 54498, "epoch": 1297} {"train_loss": -5.889745712280273, "global_step": 54499, "epoch": 1297} {"train_loss": -5.975454807281494, "global_step": 54500, "epoch": 1297} {"train_loss": -5.830228805541992, "global_step": 54501, "epoch": 1297} {"train_loss": -5.831782341003418, "global_step": 54502, "epoch": 1297} {"train_loss": -5.807966232299805, "global_step": 54503, "epoch": 1297} {"train_loss": -5.722979545593262, "global_step": 54504, "epoch": 1297} {"train_loss": -5.881102561950684, "global_step": 54505, "epoch": 1297} {"train_loss": -5.883087158203125, "global_step": 54506, "epoch": 1297} {"train_loss": -5.856475353240967, "global_step": 54507, "epoch": 1297} {"train_loss": -5.860531806945801, "global_step": 54508, "epoch": 1297} {"train_loss": -5.851128578186035, "global_step": 54509, "epoch": 1297} {"train_loss": -6.005035400390625, "global_step": 54510, "epoch": 1297} {"train_loss": -5.760859966278076, "global_step": 54511, "epoch": 1297} {"train_loss": -5.889046669006348, "global_step": 54512, "epoch": 1297} {"train_loss": -5.871006965637207, "global_step": 54513, "epoch": 1297} {"train_loss": -5.785337448120117, "global_step": 54514, "epoch": 1297} {"train_loss": -5.843440192086356, "global_step": 54515, "epoch": 1297, "val_loss": 61371.68359375} {"train_loss": -5.829720497131348, "global_step": 54516, "epoch": 1298} {"train_loss": -5.724947929382324, "global_step": 54517, "epoch": 1298} {"train_loss": -5.803653717041016, "global_step": 54518, "epoch": 1298} {"train_loss": -5.964241027832031, "global_step": 54519, "epoch": 1298} {"train_loss": -5.836021423339844, "global_step": 54520, "epoch": 1298} {"train_loss": -5.826207160949707, "global_step": 54521, "epoch": 1298} {"train_loss": -5.969942092895508, "global_step": 54522, "epoch": 1298} {"train_loss": -5.9853620529174805, "global_step": 54523, "epoch": 1298} {"train_loss": -5.865385055541992, "global_step": 54524, "epoch": 1298} {"train_loss": -5.840928077697754, "global_step": 54525, "epoch": 1298} {"train_loss": -5.81813383102417, "global_step": 54526, "epoch": 1298} {"train_loss": -5.821592807769775, "global_step": 54527, "epoch": 1298} {"train_loss": -5.730518341064453, "global_step": 54528, "epoch": 1298} {"train_loss": -5.916975498199463, "global_step": 54529, "epoch": 1298} {"train_loss": -5.98170280456543, "global_step": 54530, "epoch": 1298} {"train_loss": -5.756266117095947, "global_step": 54531, "epoch": 1298} {"train_loss": -5.828199863433838, "global_step": 54532, "epoch": 1298} {"train_loss": -5.867889404296875, "global_step": 54533, "epoch": 1298} {"train_loss": -5.861837387084961, "global_step": 54534, "epoch": 1298} {"train_loss": -5.806777000427246, "global_step": 54535, "epoch": 1298} {"train_loss": -5.950847625732422, "global_step": 54536, "epoch": 1298} {"train_loss": -5.767054557800293, "global_step": 54537, "epoch": 1298} {"train_loss": -5.765082836151123, "global_step": 54538, "epoch": 1298} {"train_loss": -5.860030174255371, "global_step": 54539, "epoch": 1298} {"train_loss": -5.776187419891357, "global_step": 54540, "epoch": 1298} {"train_loss": -5.763951301574707, "global_step": 54541, "epoch": 1298} {"train_loss": -5.7061567306518555, "global_step": 54542, "epoch": 1298} {"train_loss": -5.726803302764893, "global_step": 54543, "epoch": 1298} {"train_loss": -5.752934455871582, "global_step": 54544, "epoch": 1298} {"train_loss": -5.821777820587158, "global_step": 54545, "epoch": 1298} {"train_loss": -5.827137470245361, "global_step": 54546, "epoch": 1298} {"train_loss": -5.74337100982666, "global_step": 54547, "epoch": 1298} {"train_loss": -5.800641059875488, "global_step": 54548, "epoch": 1298} {"train_loss": -5.801307678222656, "global_step": 54549, "epoch": 1298} {"train_loss": -5.940898418426514, "global_step": 54550, "epoch": 1298} {"train_loss": -5.650350570678711, "global_step": 54551, "epoch": 1298} {"train_loss": -5.827452659606934, "global_step": 54552, "epoch": 1298} {"train_loss": -5.923746109008789, "global_step": 54553, "epoch": 1298} {"train_loss": -5.749118804931641, "global_step": 54554, "epoch": 1298} {"train_loss": -5.8214240074157715, "global_step": 54555, "epoch": 1298} {"train_loss": -5.6981401443481445, "global_step": 54556, "epoch": 1298} {"train_loss": -5.8230933121272495, "global_step": 54557, "epoch": 1298, "val_loss": 61420.65234375} {"train_loss": -5.85037899017334, "global_step": 54558, "epoch": 1299} {"train_loss": -5.832510948181152, "global_step": 54559, "epoch": 1299} {"train_loss": -5.851513862609863, "global_step": 54560, "epoch": 1299} {"train_loss": -5.811220645904541, "global_step": 54561, "epoch": 1299} {"train_loss": -5.8069000244140625, "global_step": 54562, "epoch": 1299} {"train_loss": -5.897488594055176, "global_step": 54563, "epoch": 1299} {"train_loss": -5.826706886291504, "global_step": 54564, "epoch": 1299} {"train_loss": -5.876719951629639, "global_step": 54565, "epoch": 1299} {"train_loss": -5.871103286743164, "global_step": 54566, "epoch": 1299} {"train_loss": -5.78171968460083, "global_step": 54567, "epoch": 1299} {"train_loss": -5.873086452484131, "global_step": 54568, "epoch": 1299} {"train_loss": -5.8092570304870605, "global_step": 54569, "epoch": 1299} {"train_loss": -5.774635314941406, "global_step": 54570, "epoch": 1299} {"train_loss": -5.800683498382568, "global_step": 54571, "epoch": 1299} {"train_loss": -5.772676944732666, "global_step": 54572, "epoch": 1299} {"train_loss": -5.8931565284729, "global_step": 54573, "epoch": 1299} {"train_loss": -5.855647563934326, "global_step": 54574, "epoch": 1299} {"train_loss": -5.793649196624756, "global_step": 54575, "epoch": 1299} {"train_loss": -5.775002956390381, "global_step": 54576, "epoch": 1299} {"train_loss": -5.844522953033447, "global_step": 54577, "epoch": 1299} {"train_loss": -5.732625484466553, "global_step": 54578, "epoch": 1299} {"train_loss": -5.769227981567383, "global_step": 54579, "epoch": 1299} {"train_loss": -5.716347694396973, "global_step": 54580, "epoch": 1299} {"train_loss": -5.791871070861816, "global_step": 54581, "epoch": 1299} {"train_loss": -5.864175796508789, "global_step": 54582, "epoch": 1299} {"train_loss": -5.871519088745117, "global_step": 54583, "epoch": 1299} {"train_loss": -5.7466020584106445, "global_step": 54584, "epoch": 1299} {"train_loss": -5.853340148925781, "global_step": 54585, "epoch": 1299} {"train_loss": -5.870922088623047, "global_step": 54586, "epoch": 1299} {"train_loss": -5.828134536743164, "global_step": 54587, "epoch": 1299} {"train_loss": -5.89466667175293, "global_step": 54588, "epoch": 1299} {"train_loss": -5.925439357757568, "global_step": 54589, "epoch": 1299} {"train_loss": -5.78460693359375, "global_step": 54590, "epoch": 1299} {"train_loss": -5.765807151794434, "global_step": 54591, "epoch": 1299} {"train_loss": -5.735604763031006, "global_step": 54592, "epoch": 1299} {"train_loss": -5.801574230194092, "global_step": 54593, "epoch": 1299} {"train_loss": -5.672662258148193, "global_step": 54594, "epoch": 1299} {"train_loss": -5.670888900756836, "global_step": 54595, "epoch": 1299} {"train_loss": -5.814583778381348, "global_step": 54596, "epoch": 1299} {"train_loss": -5.828635215759277, "global_step": 54597, "epoch": 1299} {"train_loss": -5.779346466064453, "global_step": 54598, "epoch": 1299} {"train_loss": -5.812599431900751, "global_step": 54599, "epoch": 1299, "val_loss": 61316.0078125} {"train_loss": -5.842283248901367, "global_step": 54600, "epoch": 1300} {"train_loss": -5.907469749450684, "global_step": 54601, "epoch": 1300} {"train_loss": -5.880368232727051, "global_step": 54602, "epoch": 1300} {"train_loss": -5.780365943908691, "global_step": 54603, "epoch": 1300} {"train_loss": -5.808825492858887, "global_step": 54604, "epoch": 1300} {"train_loss": -5.711971282958984, "global_step": 54605, "epoch": 1300} {"train_loss": -5.954110145568848, "global_step": 54606, "epoch": 1300} {"train_loss": -5.9192304611206055, "global_step": 54607, "epoch": 1300} {"train_loss": -5.8530683517456055, "global_step": 54608, "epoch": 1300} {"train_loss": -5.730442523956299, "global_step": 54609, "epoch": 1300} {"train_loss": -5.916889190673828, "global_step": 54610, "epoch": 1300} {"train_loss": -5.795568466186523, "global_step": 54611, "epoch": 1300} {"train_loss": -5.875682830810547, "global_step": 54612, "epoch": 1300} {"train_loss": -5.803897380828857, "global_step": 54613, "epoch": 1300} {"train_loss": -5.68691349029541, "global_step": 54614, "epoch": 1300} {"train_loss": -5.862092971801758, "global_step": 54615, "epoch": 1300} {"train_loss": -5.786354064941406, "global_step": 54616, "epoch": 1300} {"train_loss": -5.8418684005737305, "global_step": 54617, "epoch": 1300} {"train_loss": -5.964902877807617, "global_step": 54618, "epoch": 1300} {"train_loss": -5.773162841796875, "global_step": 54619, "epoch": 1300} {"train_loss": -5.844062328338623, "global_step": 54620, "epoch": 1300} {"train_loss": -5.86624813079834, "global_step": 54621, "epoch": 1300} {"train_loss": -5.85463809967041, "global_step": 54622, "epoch": 1300} {"train_loss": -5.834842681884766, "global_step": 54623, "epoch": 1300} {"train_loss": -5.835768222808838, "global_step": 54624, "epoch": 1300} {"train_loss": -5.6507110595703125, "global_step": 54625, "epoch": 1300} {"train_loss": -5.878508567810059, "global_step": 54626, "epoch": 1300} {"train_loss": -5.913793563842773, "global_step": 54627, "epoch": 1300} {"train_loss": -5.6700592041015625, "global_step": 54628, "epoch": 1300} {"train_loss": -6.011677265167236, "global_step": 54629, "epoch": 1300} {"train_loss": -5.941715717315674, "global_step": 54630, "epoch": 1300} {"train_loss": -5.624333381652832, "global_step": 54631, "epoch": 1300} {"train_loss": -5.861640930175781, "global_step": 54632, "epoch": 1300} {"train_loss": -5.68939208984375, "global_step": 54633, "epoch": 1300} {"train_loss": -5.939517498016357, "global_step": 54634, "epoch": 1300} {"train_loss": -5.717288017272949, "global_step": 54635, "epoch": 1300} {"train_loss": -5.763689994812012, "global_step": 54636, "epoch": 1300} {"train_loss": -5.878324508666992, "global_step": 54637, "epoch": 1300} {"train_loss": -5.7900848388671875, "global_step": 54638, "epoch": 1300} {"train_loss": -5.884376525878906, "global_step": 54639, "epoch": 1300} {"train_loss": -5.787472724914551, "global_step": 54640, "epoch": 1300} {"train_loss": -5.8284366357894175, "global_step": 54641, "epoch": 1300, "train/sim_max_reward_0": 0.9681655378223045, "train/sim_max_reward_1": 0.25075410707338747, "train/sim_max_reward_2": 0.8238790974432457, "train/sim_max_reward_3": 0.9226403467706344, "train/sim_max_reward_4": 0.9431215802957721, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8819106357828911, "test/sim_max_reward_4300001": 0.49126678582368083, "test/sim_max_reward_4300002": 0.766439499817173, "test/sim_max_reward_4300003": 0.8028727434816896, "test/sim_max_reward_4300004": 0.12338513656677721, "test/sim_max_reward_4300005": 0.7659865933660065, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.37352069108723135, "test/sim_max_reward_4300008": 0.8099788833598737, "test/sim_max_reward_4300009": 0.8880310080084064, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.33059595114740004, "test/sim_max_reward_4300012": 0.90780365467365, "test/sim_max_reward_4300013": 0.31824489874725537, "test/sim_max_reward_4300014": 0.8433530947272784, "test/sim_max_reward_4300015": 0.9737633524070786, "test/sim_max_reward_4300016": 0.5566326209629106, "test/sim_max_reward_4300017": 0.7425634367570889, "test/sim_max_reward_4300018": 0.8986675668723794, "test/sim_max_reward_4300019": 0.18635168122877757, "test/sim_max_reward_4300020": 0.7253916352217761, "test/sim_max_reward_4300021": 0.7987218298386342, "test/sim_max_reward_4300022": 0.3238171519404918, "test/sim_max_reward_4300023": 0.3567727814362661, "test/sim_max_reward_4300024": 0.038739983583372294, "test/sim_max_reward_4300025": 0.9842044030690823, "test/sim_max_reward_4300026": 0.1657255046838938, "test/sim_max_reward_4300027": 0.7177175228073858, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.27477694787464474, "test/sim_max_reward_4300031": 0.2888353210678564, "test/sim_max_reward_4300032": 0.6325507031549528, "test/sim_max_reward_4300033": 0.45774919561831867, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9831518990814406, "test/sim_max_reward_4300038": 0.35903546227252014, "test/sim_max_reward_4300039": 0.8674003461840404, "test/sim_max_reward_4300040": 0.2479693551069725, "test/sim_max_reward_4300041": 0.9418883296771247, "test/sim_max_reward_4300042": 0.6586048679847462, "test/sim_max_reward_4300043": 0.17240863155534186, "test/sim_max_reward_4300044": 0.8358638773344881, "test/sim_max_reward_4300045": 0.16610941576343138, "test/sim_max_reward_4300046": 0.2516955105823629, "test/sim_max_reward_4300047": 0.15205138174937105, "test/sim_max_reward_4300048": 0.32052585734973915, "test/sim_max_reward_4300049": 0.19409640992669716, "train/mean_score": 0.6835909047945886, "test/mean_score": 0.4755273335049196, "val_loss": 61286.37890625} {"train_loss": -5.873922824859619, "global_step": 54642, "epoch": 1301} {"train_loss": -5.903820037841797, "global_step": 54643, "epoch": 1301} {"train_loss": -5.836627960205078, "global_step": 54644, "epoch": 1301} {"train_loss": -5.768250465393066, "global_step": 54645, "epoch": 1301} {"train_loss": -5.726776123046875, "global_step": 54646, "epoch": 1301} {"train_loss": -5.691264629364014, "global_step": 54647, "epoch": 1301} {"train_loss": -5.932455062866211, "global_step": 54648, "epoch": 1301} {"train_loss": -5.775815963745117, "global_step": 54649, "epoch": 1301} {"train_loss": -5.84157657623291, "global_step": 54650, "epoch": 1301} {"train_loss": -5.863746643066406, "global_step": 54651, "epoch": 1301} {"train_loss": -5.845429420471191, "global_step": 54652, "epoch": 1301} {"train_loss": -5.891056060791016, "global_step": 54653, "epoch": 1301} {"train_loss": -5.8698835372924805, "global_step": 54654, "epoch": 1301} {"train_loss": -5.8189167976379395, "global_step": 54655, "epoch": 1301} {"train_loss": -5.8658833503723145, "global_step": 54656, "epoch": 1301} {"train_loss": -5.904992580413818, "global_step": 54657, "epoch": 1301} {"train_loss": -5.657049655914307, "global_step": 54658, "epoch": 1301} {"train_loss": -5.976323127746582, "global_step": 54659, "epoch": 1301} {"train_loss": -5.782113552093506, "global_step": 54660, "epoch": 1301} {"train_loss": -5.727774143218994, "global_step": 54661, "epoch": 1301} {"train_loss": -5.719679832458496, "global_step": 54662, "epoch": 1301} {"train_loss": -5.806210517883301, "global_step": 54663, "epoch": 1301} {"train_loss": -5.833034515380859, "global_step": 54664, "epoch": 1301} {"train_loss": -5.744463920593262, "global_step": 54665, "epoch": 1301} {"train_loss": -5.901533126831055, "global_step": 54666, "epoch": 1301} {"train_loss": -5.7912278175354, "global_step": 54667, "epoch": 1301} {"train_loss": -5.803375244140625, "global_step": 54668, "epoch": 1301} {"train_loss": -5.855785369873047, "global_step": 54669, "epoch": 1301} {"train_loss": -5.8572845458984375, "global_step": 54670, "epoch": 1301} {"train_loss": -5.832446098327637, "global_step": 54671, "epoch": 1301} {"train_loss": -5.844935417175293, "global_step": 54672, "epoch": 1301} {"train_loss": -5.826276779174805, "global_step": 54673, "epoch": 1301} {"train_loss": -5.894100666046143, "global_step": 54674, "epoch": 1301} {"train_loss": -5.971260070800781, "global_step": 54675, "epoch": 1301} {"train_loss": -5.8371405601501465, "global_step": 54676, "epoch": 1301} {"train_loss": -5.79233455657959, "global_step": 54677, "epoch": 1301} {"train_loss": -5.919281959533691, "global_step": 54678, "epoch": 1301} {"train_loss": -5.717219829559326, "global_step": 54679, "epoch": 1301} {"train_loss": -5.7964582443237305, "global_step": 54680, "epoch": 1301} {"train_loss": -5.8676862716674805, "global_step": 54681, "epoch": 1301} {"train_loss": -5.74800968170166, "global_step": 54682, "epoch": 1301} {"train_loss": -5.827434800920033, "global_step": 54683, "epoch": 1301, "val_loss": 61579.7265625} {"train_loss": -5.9005584716796875, "global_step": 54684, "epoch": 1302} {"train_loss": -5.896781921386719, "global_step": 54685, "epoch": 1302} {"train_loss": -5.773609161376953, "global_step": 54686, "epoch": 1302} {"train_loss": -5.950133800506592, "global_step": 54687, "epoch": 1302} {"train_loss": -5.7410383224487305, "global_step": 54688, "epoch": 1302} {"train_loss": -5.8667402267456055, "global_step": 54689, "epoch": 1302} {"train_loss": -5.894034385681152, "global_step": 54690, "epoch": 1302} {"train_loss": -5.771401405334473, "global_step": 54691, "epoch": 1302} {"train_loss": -5.889374732971191, "global_step": 54692, "epoch": 1302} {"train_loss": -5.876575946807861, "global_step": 54693, "epoch": 1302} {"train_loss": -5.792738914489746, "global_step": 54694, "epoch": 1302} {"train_loss": -5.908168315887451, "global_step": 54695, "epoch": 1302} {"train_loss": -5.738039016723633, "global_step": 54696, "epoch": 1302} {"train_loss": -5.769125938415527, "global_step": 54697, "epoch": 1302} {"train_loss": -5.620297431945801, "global_step": 54698, "epoch": 1302} {"train_loss": -5.807245254516602, "global_step": 54699, "epoch": 1302} {"train_loss": -5.759746551513672, "global_step": 54700, "epoch": 1302} {"train_loss": -5.791748046875, "global_step": 54701, "epoch": 1302} {"train_loss": -5.752127647399902, "global_step": 54702, "epoch": 1302} {"train_loss": -5.787158966064453, "global_step": 54703, "epoch": 1302} {"train_loss": -5.907663345336914, "global_step": 54704, "epoch": 1302} {"train_loss": -5.800910949707031, "global_step": 54705, "epoch": 1302} {"train_loss": -5.862138748168945, "global_step": 54706, "epoch": 1302} {"train_loss": -5.843544960021973, "global_step": 54707, "epoch": 1302} {"train_loss": -5.763726234436035, "global_step": 54708, "epoch": 1302} {"train_loss": -5.752535820007324, "global_step": 54709, "epoch": 1302} {"train_loss": -5.765429496765137, "global_step": 54710, "epoch": 1302} {"train_loss": -5.845814228057861, "global_step": 54711, "epoch": 1302} {"train_loss": -5.769585132598877, "global_step": 54712, "epoch": 1302} {"train_loss": -5.718296051025391, "global_step": 54713, "epoch": 1302} {"train_loss": -5.805284023284912, "global_step": 54714, "epoch": 1302} {"train_loss": -5.805927276611328, "global_step": 54715, "epoch": 1302} {"train_loss": -5.893246650695801, "global_step": 54716, "epoch": 1302} {"train_loss": -5.908988952636719, "global_step": 54717, "epoch": 1302} {"train_loss": -5.854520797729492, "global_step": 54718, "epoch": 1302} {"train_loss": -5.741387844085693, "global_step": 54719, "epoch": 1302} {"train_loss": -5.916420936584473, "global_step": 54720, "epoch": 1302} {"train_loss": -5.846182823181152, "global_step": 54721, "epoch": 1302} {"train_loss": -5.812440395355225, "global_step": 54722, "epoch": 1302} {"train_loss": -5.896292686462402, "global_step": 54723, "epoch": 1302} {"train_loss": -5.827857971191406, "global_step": 54724, "epoch": 1302} {"train_loss": -5.820837951841808, "global_step": 54725, "epoch": 1302, "val_loss": 61421.28125} {"train_loss": -5.774251937866211, "global_step": 54726, "epoch": 1303} {"train_loss": -6.019899845123291, "global_step": 54727, "epoch": 1303} {"train_loss": -5.825011253356934, "global_step": 54728, "epoch": 1303} {"train_loss": -5.885766983032227, "global_step": 54729, "epoch": 1303} {"train_loss": -5.87557315826416, "global_step": 54730, "epoch": 1303} {"train_loss": -5.796687126159668, "global_step": 54731, "epoch": 1303} {"train_loss": -5.923515796661377, "global_step": 54732, "epoch": 1303} {"train_loss": -5.885257720947266, "global_step": 54733, "epoch": 1303} {"train_loss": -5.815855026245117, "global_step": 54734, "epoch": 1303} {"train_loss": -5.731858253479004, "global_step": 54735, "epoch": 1303} {"train_loss": -5.863135814666748, "global_step": 54736, "epoch": 1303} {"train_loss": -6.046121120452881, "global_step": 54737, "epoch": 1303} {"train_loss": -5.951529502868652, "global_step": 54738, "epoch": 1303} {"train_loss": -5.912692070007324, "global_step": 54739, "epoch": 1303} {"train_loss": -5.906180381774902, "global_step": 54740, "epoch": 1303} {"train_loss": -5.871546268463135, "global_step": 54741, "epoch": 1303} {"train_loss": -5.8384575843811035, "global_step": 54742, "epoch": 1303} {"train_loss": -5.75753927230835, "global_step": 54743, "epoch": 1303} {"train_loss": -5.980663776397705, "global_step": 54744, "epoch": 1303} {"train_loss": -5.955063819885254, "global_step": 54745, "epoch": 1303} {"train_loss": -5.733614444732666, "global_step": 54746, "epoch": 1303} {"train_loss": -5.789037704467773, "global_step": 54747, "epoch": 1303} {"train_loss": -5.84295654296875, "global_step": 54748, "epoch": 1303} {"train_loss": -5.736486434936523, "global_step": 54749, "epoch": 1303} {"train_loss": -5.8371477127075195, "global_step": 54750, "epoch": 1303} {"train_loss": -5.721624374389648, "global_step": 54751, "epoch": 1303} {"train_loss": -5.711663246154785, "global_step": 54752, "epoch": 1303} {"train_loss": -5.891602516174316, "global_step": 54753, "epoch": 1303} {"train_loss": -5.86063289642334, "global_step": 54754, "epoch": 1303} {"train_loss": -5.781949043273926, "global_step": 54755, "epoch": 1303} {"train_loss": -5.705145835876465, "global_step": 54756, "epoch": 1303} {"train_loss": -5.867290496826172, "global_step": 54757, "epoch": 1303} {"train_loss": -5.9471025466918945, "global_step": 54758, "epoch": 1303} {"train_loss": -5.928216934204102, "global_step": 54759, "epoch": 1303} {"train_loss": -5.877416133880615, "global_step": 54760, "epoch": 1303} {"train_loss": -5.931849956512451, "global_step": 54761, "epoch": 1303} {"train_loss": -5.857597351074219, "global_step": 54762, "epoch": 1303} {"train_loss": -5.911210060119629, "global_step": 54763, "epoch": 1303} {"train_loss": -5.879528045654297, "global_step": 54764, "epoch": 1303} {"train_loss": -5.631142616271973, "global_step": 54765, "epoch": 1303} {"train_loss": -5.906938076019287, "global_step": 54766, "epoch": 1303} {"train_loss": -5.851312762215024, "global_step": 54767, "epoch": 1303, "val_loss": 61148.87890625} {"train_loss": -5.833559036254883, "global_step": 54768, "epoch": 1304} {"train_loss": -5.855870246887207, "global_step": 54769, "epoch": 1304} {"train_loss": -5.866274833679199, "global_step": 54770, "epoch": 1304} {"train_loss": -5.857828140258789, "global_step": 54771, "epoch": 1304} {"train_loss": -5.7881317138671875, "global_step": 54772, "epoch": 1304} {"train_loss": -5.908473491668701, "global_step": 54773, "epoch": 1304} {"train_loss": -5.922309875488281, "global_step": 54774, "epoch": 1304} {"train_loss": -5.918771743774414, "global_step": 54775, "epoch": 1304} {"train_loss": -5.701731204986572, "global_step": 54776, "epoch": 1304} {"train_loss": -5.835988998413086, "global_step": 54777, "epoch": 1304} {"train_loss": -5.799232006072998, "global_step": 54778, "epoch": 1304} {"train_loss": -5.929953098297119, "global_step": 54779, "epoch": 1304} {"train_loss": -5.88446569442749, "global_step": 54780, "epoch": 1304} {"train_loss": -5.798253059387207, "global_step": 54781, "epoch": 1304} {"train_loss": -5.835977554321289, "global_step": 54782, "epoch": 1304} {"train_loss": -5.816291809082031, "global_step": 54783, "epoch": 1304} {"train_loss": -5.843010902404785, "global_step": 54784, "epoch": 1304} {"train_loss": -5.758765697479248, "global_step": 54785, "epoch": 1304} {"train_loss": -5.808739185333252, "global_step": 54786, "epoch": 1304} {"train_loss": -5.829702377319336, "global_step": 54787, "epoch": 1304} {"train_loss": -5.81879997253418, "global_step": 54788, "epoch": 1304} {"train_loss": -5.7915802001953125, "global_step": 54789, "epoch": 1304} {"train_loss": -5.827523231506348, "global_step": 54790, "epoch": 1304} {"train_loss": -5.842573642730713, "global_step": 54791, "epoch": 1304} {"train_loss": -5.795227527618408, "global_step": 54792, "epoch": 1304} {"train_loss": -5.824615478515625, "global_step": 54793, "epoch": 1304} {"train_loss": -5.938107013702393, "global_step": 54794, "epoch": 1304} {"train_loss": -5.883272171020508, "global_step": 54795, "epoch": 1304} {"train_loss": -5.770700931549072, "global_step": 54796, "epoch": 1304} {"train_loss": -5.920483112335205, "global_step": 54797, "epoch": 1304} {"train_loss": -5.8027849197387695, "global_step": 54798, "epoch": 1304} {"train_loss": -5.911575794219971, "global_step": 54799, "epoch": 1304} {"train_loss": -5.849937915802002, "global_step": 54800, "epoch": 1304} {"train_loss": -5.783037185668945, "global_step": 54801, "epoch": 1304} {"train_loss": -5.848102569580078, "global_step": 54802, "epoch": 1304} {"train_loss": -5.918471336364746, "global_step": 54803, "epoch": 1304} {"train_loss": -5.8041911125183105, "global_step": 54804, "epoch": 1304} {"train_loss": -5.751568794250488, "global_step": 54805, "epoch": 1304} {"train_loss": -5.945927619934082, "global_step": 54806, "epoch": 1304} {"train_loss": -5.81072998046875, "global_step": 54807, "epoch": 1304} {"train_loss": -5.85051155090332, "global_step": 54808, "epoch": 1304} {"train_loss": -5.84134460630871, "global_step": 54809, "epoch": 1304, "val_loss": 61443.5703125} {"train_loss": -5.853232383728027, "global_step": 54810, "epoch": 1305} {"train_loss": -5.867887020111084, "global_step": 54811, "epoch": 1305} {"train_loss": -5.893959999084473, "global_step": 54812, "epoch": 1305} {"train_loss": -5.860104560852051, "global_step": 54813, "epoch": 1305} {"train_loss": -5.781101226806641, "global_step": 54814, "epoch": 1305} {"train_loss": -5.779582977294922, "global_step": 54815, "epoch": 1305} {"train_loss": -5.739432334899902, "global_step": 54816, "epoch": 1305} {"train_loss": -5.858632564544678, "global_step": 54817, "epoch": 1305} {"train_loss": -5.736789703369141, "global_step": 54818, "epoch": 1305} {"train_loss": -5.855718612670898, "global_step": 54819, "epoch": 1305} {"train_loss": -5.664390563964844, "global_step": 54820, "epoch": 1305} {"train_loss": -5.8399658203125, "global_step": 54821, "epoch": 1305} {"train_loss": -5.79554557800293, "global_step": 54822, "epoch": 1305} {"train_loss": -5.895786285400391, "global_step": 54823, "epoch": 1305} {"train_loss": -5.948622703552246, "global_step": 54824, "epoch": 1305} {"train_loss": -5.807498931884766, "global_step": 54825, "epoch": 1305} {"train_loss": -5.847226619720459, "global_step": 54826, "epoch": 1305} {"train_loss": -5.861115455627441, "global_step": 54827, "epoch": 1305} {"train_loss": -5.85360050201416, "global_step": 54828, "epoch": 1305} {"train_loss": -5.793582916259766, "global_step": 54829, "epoch": 1305} {"train_loss": -5.792713165283203, "global_step": 54830, "epoch": 1305} {"train_loss": -5.923449516296387, "global_step": 54831, "epoch": 1305} {"train_loss": -5.891584396362305, "global_step": 54832, "epoch": 1305} {"train_loss": -5.8742475509643555, "global_step": 54833, "epoch": 1305} {"train_loss": -5.920092582702637, "global_step": 54834, "epoch": 1305} {"train_loss": -5.914532661437988, "global_step": 54835, "epoch": 1305} {"train_loss": -5.878327369689941, "global_step": 54836, "epoch": 1305} {"train_loss": -5.845523357391357, "global_step": 54837, "epoch": 1305} {"train_loss": -5.819724082946777, "global_step": 54838, "epoch": 1305} {"train_loss": -6.026843547821045, "global_step": 54839, "epoch": 1305} {"train_loss": -5.708471298217773, "global_step": 54840, "epoch": 1305} {"train_loss": -5.792017936706543, "global_step": 54841, "epoch": 1305} {"train_loss": -5.842710018157959, "global_step": 54842, "epoch": 1305} {"train_loss": -5.849818229675293, "global_step": 54843, "epoch": 1305} {"train_loss": -5.880579471588135, "global_step": 54844, "epoch": 1305} {"train_loss": -5.778064250946045, "global_step": 54845, "epoch": 1305} {"train_loss": -5.858591079711914, "global_step": 54846, "epoch": 1305} {"train_loss": -5.953207969665527, "global_step": 54847, "epoch": 1305} {"train_loss": -5.904877185821533, "global_step": 54848, "epoch": 1305} {"train_loss": -5.828753471374512, "global_step": 54849, "epoch": 1305} {"train_loss": -5.889281272888184, "global_step": 54850, "epoch": 1305} {"train_loss": -5.846813939866566, "global_step": 54851, "epoch": 1305, "val_loss": 61234.66796875} {"train_loss": -5.874314785003662, "global_step": 54852, "epoch": 1306} {"train_loss": -5.823491096496582, "global_step": 54853, "epoch": 1306} {"train_loss": -5.767556190490723, "global_step": 54854, "epoch": 1306} {"train_loss": -5.909022808074951, "global_step": 54855, "epoch": 1306} {"train_loss": -5.921907424926758, "global_step": 54856, "epoch": 1306} {"train_loss": -5.83738374710083, "global_step": 54857, "epoch": 1306} {"train_loss": -5.7285871505737305, "global_step": 54858, "epoch": 1306} {"train_loss": -5.948550224304199, "global_step": 54859, "epoch": 1306} {"train_loss": -5.884620666503906, "global_step": 54860, "epoch": 1306} {"train_loss": -5.8771233558654785, "global_step": 54861, "epoch": 1306} {"train_loss": -5.872077941894531, "global_step": 54862, "epoch": 1306} {"train_loss": -5.823779106140137, "global_step": 54863, "epoch": 1306} {"train_loss": -5.931793212890625, "global_step": 54864, "epoch": 1306} {"train_loss": -5.83841609954834, "global_step": 54865, "epoch": 1306} {"train_loss": -5.788259506225586, "global_step": 54866, "epoch": 1306} {"train_loss": -5.957308292388916, "global_step": 54867, "epoch": 1306} {"train_loss": -5.926631927490234, "global_step": 54868, "epoch": 1306} {"train_loss": -5.85443115234375, "global_step": 54869, "epoch": 1306} {"train_loss": -5.890082836151123, "global_step": 54870, "epoch": 1306} {"train_loss": -5.837424278259277, "global_step": 54871, "epoch": 1306} {"train_loss": -5.825498104095459, "global_step": 54872, "epoch": 1306} {"train_loss": -5.965578079223633, "global_step": 54873, "epoch": 1306} {"train_loss": -5.961524486541748, "global_step": 54874, "epoch": 1306} {"train_loss": -5.849521636962891, "global_step": 54875, "epoch": 1306} {"train_loss": -5.762513637542725, "global_step": 54876, "epoch": 1306} {"train_loss": -5.7846832275390625, "global_step": 54877, "epoch": 1306} {"train_loss": -5.776524066925049, "global_step": 54878, "epoch": 1306} {"train_loss": -5.892442226409912, "global_step": 54879, "epoch": 1306} {"train_loss": -5.823859214782715, "global_step": 54880, "epoch": 1306} {"train_loss": -5.839906215667725, "global_step": 54881, "epoch": 1306} {"train_loss": -5.811258316040039, "global_step": 54882, "epoch": 1306} {"train_loss": -5.904140472412109, "global_step": 54883, "epoch": 1306} {"train_loss": -5.7478179931640625, "global_step": 54884, "epoch": 1306} {"train_loss": -5.779685974121094, "global_step": 54885, "epoch": 1306} {"train_loss": -5.800936222076416, "global_step": 54886, "epoch": 1306} {"train_loss": -5.825204849243164, "global_step": 54887, "epoch": 1306} {"train_loss": -5.799073219299316, "global_step": 54888, "epoch": 1306} {"train_loss": -5.766141891479492, "global_step": 54889, "epoch": 1306} {"train_loss": -5.889181613922119, "global_step": 54890, "epoch": 1306} {"train_loss": -5.851615905761719, "global_step": 54891, "epoch": 1306} {"train_loss": -5.843581199645996, "global_step": 54892, "epoch": 1306} {"train_loss": -5.848082474299839, "global_step": 54893, "epoch": 1306, "val_loss": 61612.65625} {"train_loss": -5.8154215812683105, "global_step": 54894, "epoch": 1307} {"train_loss": -5.93888521194458, "global_step": 54895, "epoch": 1307} {"train_loss": -5.844683647155762, "global_step": 54896, "epoch": 1307} {"train_loss": -5.926617622375488, "global_step": 54897, "epoch": 1307} {"train_loss": -5.900467872619629, "global_step": 54898, "epoch": 1307} {"train_loss": -5.874513626098633, "global_step": 54899, "epoch": 1307} {"train_loss": -5.832087993621826, "global_step": 54900, "epoch": 1307} {"train_loss": -5.879899978637695, "global_step": 54901, "epoch": 1307} {"train_loss": -5.96406888961792, "global_step": 54902, "epoch": 1307} {"train_loss": -5.809054374694824, "global_step": 54903, "epoch": 1307} {"train_loss": -5.83586311340332, "global_step": 54904, "epoch": 1307} {"train_loss": -5.941020965576172, "global_step": 54905, "epoch": 1307} {"train_loss": -5.835283279418945, "global_step": 54906, "epoch": 1307} {"train_loss": -5.840170860290527, "global_step": 54907, "epoch": 1307} {"train_loss": -5.883249759674072, "global_step": 54908, "epoch": 1307} {"train_loss": -5.831555366516113, "global_step": 54909, "epoch": 1307} {"train_loss": -5.938749313354492, "global_step": 54910, "epoch": 1307} {"train_loss": -5.7400617599487305, "global_step": 54911, "epoch": 1307} {"train_loss": -5.866047382354736, "global_step": 54912, "epoch": 1307} {"train_loss": -5.859962463378906, "global_step": 54913, "epoch": 1307} {"train_loss": -5.9088335037231445, "global_step": 54914, "epoch": 1307} {"train_loss": -5.677098274230957, "global_step": 54915, "epoch": 1307} {"train_loss": -5.702218055725098, "global_step": 54916, "epoch": 1307} {"train_loss": -5.819868564605713, "global_step": 54917, "epoch": 1307} {"train_loss": -5.925487995147705, "global_step": 54918, "epoch": 1307} {"train_loss": -5.803036689758301, "global_step": 54919, "epoch": 1307} {"train_loss": -5.631056308746338, "global_step": 54920, "epoch": 1307} {"train_loss": -5.862985610961914, "global_step": 54921, "epoch": 1307} {"train_loss": -5.858730316162109, "global_step": 54922, "epoch": 1307} {"train_loss": -5.689001083374023, "global_step": 54923, "epoch": 1307} {"train_loss": -5.886623382568359, "global_step": 54924, "epoch": 1307} {"train_loss": -5.661961078643799, "global_step": 54925, "epoch": 1307} {"train_loss": -5.680818557739258, "global_step": 54926, "epoch": 1307} {"train_loss": -5.634122848510742, "global_step": 54927, "epoch": 1307} {"train_loss": -5.672975540161133, "global_step": 54928, "epoch": 1307} {"train_loss": -5.686800956726074, "global_step": 54929, "epoch": 1307} {"train_loss": -5.703622817993164, "global_step": 54930, "epoch": 1307} {"train_loss": -5.7998809814453125, "global_step": 54931, "epoch": 1307} {"train_loss": -5.792673110961914, "global_step": 54932, "epoch": 1307} {"train_loss": -5.803765296936035, "global_step": 54933, "epoch": 1307} {"train_loss": -5.79411506652832, "global_step": 54934, "epoch": 1307} {"train_loss": -5.813402005604336, "global_step": 54935, "epoch": 1307, "val_loss": 61824.734375} {"train_loss": -5.719282150268555, "global_step": 54936, "epoch": 1308} {"train_loss": -5.874159812927246, "global_step": 54937, "epoch": 1308} {"train_loss": -5.73983097076416, "global_step": 54938, "epoch": 1308} {"train_loss": -5.826840877532959, "global_step": 54939, "epoch": 1308} {"train_loss": -5.898873805999756, "global_step": 54940, "epoch": 1308} {"train_loss": -5.72280740737915, "global_step": 54941, "epoch": 1308} {"train_loss": -5.831205368041992, "global_step": 54942, "epoch": 1308} {"train_loss": -5.824073314666748, "global_step": 54943, "epoch": 1308} {"train_loss": -5.85449743270874, "global_step": 54944, "epoch": 1308} {"train_loss": -5.77278995513916, "global_step": 54945, "epoch": 1308} {"train_loss": -5.831912040710449, "global_step": 54946, "epoch": 1308} {"train_loss": -5.886570930480957, "global_step": 54947, "epoch": 1308} {"train_loss": -5.732692718505859, "global_step": 54948, "epoch": 1308} {"train_loss": -5.87114953994751, "global_step": 54949, "epoch": 1308} {"train_loss": -5.936858654022217, "global_step": 54950, "epoch": 1308} {"train_loss": -5.865419864654541, "global_step": 54951, "epoch": 1308} {"train_loss": -5.871393203735352, "global_step": 54952, "epoch": 1308} {"train_loss": -5.911346435546875, "global_step": 54953, "epoch": 1308} {"train_loss": -5.863641738891602, "global_step": 54954, "epoch": 1308} {"train_loss": -5.977688789367676, "global_step": 54955, "epoch": 1308} {"train_loss": -5.93202543258667, "global_step": 54956, "epoch": 1308} {"train_loss": -5.877224922180176, "global_step": 54957, "epoch": 1308} {"train_loss": -5.7740349769592285, "global_step": 54958, "epoch": 1308} {"train_loss": -5.93977165222168, "global_step": 54959, "epoch": 1308} {"train_loss": -5.809154510498047, "global_step": 54960, "epoch": 1308} {"train_loss": -5.9297895431518555, "global_step": 54961, "epoch": 1308} {"train_loss": -5.858836650848389, "global_step": 54962, "epoch": 1308} {"train_loss": -5.7589430809021, "global_step": 54963, "epoch": 1308} {"train_loss": -5.908365249633789, "global_step": 54964, "epoch": 1308} {"train_loss": -5.792213439941406, "global_step": 54965, "epoch": 1308} {"train_loss": -5.8598175048828125, "global_step": 54966, "epoch": 1308} {"train_loss": -5.879508018493652, "global_step": 54967, "epoch": 1308} {"train_loss": -5.759700775146484, "global_step": 54968, "epoch": 1308} {"train_loss": -5.825569152832031, "global_step": 54969, "epoch": 1308} {"train_loss": -5.777709484100342, "global_step": 54970, "epoch": 1308} {"train_loss": -5.691706657409668, "global_step": 54971, "epoch": 1308} {"train_loss": -5.779399871826172, "global_step": 54972, "epoch": 1308} {"train_loss": -5.724063396453857, "global_step": 54973, "epoch": 1308} {"train_loss": -5.754265308380127, "global_step": 54974, "epoch": 1308} {"train_loss": -5.789391994476318, "global_step": 54975, "epoch": 1308} {"train_loss": -5.876152992248535, "global_step": 54976, "epoch": 1308} {"train_loss": -5.830217452276321, "global_step": 54977, "epoch": 1308, "val_loss": 61865.6328125} {"train_loss": -5.707953929901123, "global_step": 54978, "epoch": 1309} {"train_loss": -5.688343048095703, "global_step": 54979, "epoch": 1309} {"train_loss": -5.770689010620117, "global_step": 54980, "epoch": 1309} {"train_loss": -5.794356346130371, "global_step": 54981, "epoch": 1309} {"train_loss": -5.729592323303223, "global_step": 54982, "epoch": 1309} {"train_loss": -5.800591945648193, "global_step": 54983, "epoch": 1309} {"train_loss": -5.6935224533081055, "global_step": 54984, "epoch": 1309} {"train_loss": -5.8449554443359375, "global_step": 54985, "epoch": 1309} {"train_loss": -5.795102119445801, "global_step": 54986, "epoch": 1309} {"train_loss": -5.778641223907471, "global_step": 54987, "epoch": 1309} {"train_loss": -5.806246757507324, "global_step": 54988, "epoch": 1309} {"train_loss": -5.8650736808776855, "global_step": 54989, "epoch": 1309} {"train_loss": -5.761346340179443, "global_step": 54990, "epoch": 1309} {"train_loss": -5.77939510345459, "global_step": 54991, "epoch": 1309} {"train_loss": -5.859951019287109, "global_step": 54992, "epoch": 1309} {"train_loss": -5.711286544799805, "global_step": 54993, "epoch": 1309} {"train_loss": -5.797740459442139, "global_step": 54994, "epoch": 1309} {"train_loss": -5.696386814117432, "global_step": 54995, "epoch": 1309} {"train_loss": -5.8753156661987305, "global_step": 54996, "epoch": 1309} {"train_loss": -5.774318695068359, "global_step": 54997, "epoch": 1309} {"train_loss": -5.818174362182617, "global_step": 54998, "epoch": 1309} {"train_loss": -5.818608283996582, "global_step": 54999, "epoch": 1309} {"train_loss": -5.853143215179443, "global_step": 55000, "epoch": 1309} {"train_loss": -5.768816947937012, "global_step": 55001, "epoch": 1309} {"train_loss": -5.964510440826416, "global_step": 55002, "epoch": 1309} {"train_loss": -5.883620262145996, "global_step": 55003, "epoch": 1309} {"train_loss": -5.882588863372803, "global_step": 55004, "epoch": 1309} {"train_loss": -5.923648834228516, "global_step": 55005, "epoch": 1309} {"train_loss": -5.766517639160156, "global_step": 55006, "epoch": 1309} {"train_loss": -5.818332672119141, "global_step": 55007, "epoch": 1309} {"train_loss": -5.886781215667725, "global_step": 55008, "epoch": 1309} {"train_loss": -5.721950531005859, "global_step": 55009, "epoch": 1309} {"train_loss": -5.753121376037598, "global_step": 55010, "epoch": 1309} {"train_loss": -5.84773063659668, "global_step": 55011, "epoch": 1309} {"train_loss": -5.788928031921387, "global_step": 55012, "epoch": 1309} {"train_loss": -5.809042930603027, "global_step": 55013, "epoch": 1309} {"train_loss": -5.7326273918151855, "global_step": 55014, "epoch": 1309} {"train_loss": -5.798454761505127, "global_step": 55015, "epoch": 1309} {"train_loss": -5.87473201751709, "global_step": 55016, "epoch": 1309} {"train_loss": -5.769159317016602, "global_step": 55017, "epoch": 1309} {"train_loss": -5.818459510803223, "global_step": 55018, "epoch": 1309} {"train_loss": -5.802879435675485, "global_step": 55019, "epoch": 1309, "val_loss": 61374.5} {"train_loss": -5.854908466339111, "global_step": 55020, "epoch": 1310} {"train_loss": -5.948314666748047, "global_step": 55021, "epoch": 1310} {"train_loss": -5.909008502960205, "global_step": 55022, "epoch": 1310} {"train_loss": -5.7313666343688965, "global_step": 55023, "epoch": 1310} {"train_loss": -5.884039878845215, "global_step": 55024, "epoch": 1310} {"train_loss": -5.87208366394043, "global_step": 55025, "epoch": 1310} {"train_loss": -5.853826999664307, "global_step": 55026, "epoch": 1310} {"train_loss": -5.837335586547852, "global_step": 55027, "epoch": 1310} {"train_loss": -5.7773847579956055, "global_step": 55028, "epoch": 1310} {"train_loss": -5.744421005249023, "global_step": 55029, "epoch": 1310} {"train_loss": -5.793406009674072, "global_step": 55030, "epoch": 1310} {"train_loss": -5.854177474975586, "global_step": 55031, "epoch": 1310} {"train_loss": -5.821149826049805, "global_step": 55032, "epoch": 1310} {"train_loss": -5.914736747741699, "global_step": 55033, "epoch": 1310} {"train_loss": -5.829928398132324, "global_step": 55034, "epoch": 1310} {"train_loss": -5.944161415100098, "global_step": 55035, "epoch": 1310} {"train_loss": -5.741530418395996, "global_step": 55036, "epoch": 1310} {"train_loss": -5.871560573577881, "global_step": 55037, "epoch": 1310} {"train_loss": -5.946323394775391, "global_step": 55038, "epoch": 1310} {"train_loss": -5.781805038452148, "global_step": 55039, "epoch": 1310} {"train_loss": -5.885034561157227, "global_step": 55040, "epoch": 1310} {"train_loss": -5.796082973480225, "global_step": 55041, "epoch": 1310} {"train_loss": -5.737383842468262, "global_step": 55042, "epoch": 1310} {"train_loss": -5.752341270446777, "global_step": 55043, "epoch": 1310} {"train_loss": -5.952707290649414, "global_step": 55044, "epoch": 1310} {"train_loss": -5.6779327392578125, "global_step": 55045, "epoch": 1310} {"train_loss": -5.9549560546875, "global_step": 55046, "epoch": 1310} {"train_loss": -5.709052085876465, "global_step": 55047, "epoch": 1310} {"train_loss": -5.785555362701416, "global_step": 55048, "epoch": 1310} {"train_loss": -5.656976699829102, "global_step": 55049, "epoch": 1310} {"train_loss": -5.937112808227539, "global_step": 55050, "epoch": 1310} {"train_loss": -5.697076797485352, "global_step": 55051, "epoch": 1310} {"train_loss": -5.844207286834717, "global_step": 55052, "epoch": 1310} {"train_loss": -5.76405143737793, "global_step": 55053, "epoch": 1310} {"train_loss": -5.887395858764648, "global_step": 55054, "epoch": 1310} {"train_loss": -5.812248229980469, "global_step": 55055, "epoch": 1310} {"train_loss": -5.901397228240967, "global_step": 55056, "epoch": 1310} {"train_loss": -5.773049354553223, "global_step": 55057, "epoch": 1310} {"train_loss": -5.733206272125244, "global_step": 55058, "epoch": 1310} {"train_loss": -5.745805740356445, "global_step": 55059, "epoch": 1310} {"train_loss": -5.748323440551758, "global_step": 55060, "epoch": 1310} {"train_loss": -5.822051547822499, "global_step": 55061, "epoch": 1310, "val_loss": 61514.71875} {"train_loss": -5.89118766784668, "global_step": 55062, "epoch": 1311} {"train_loss": -5.813954830169678, "global_step": 55063, "epoch": 1311} {"train_loss": -5.89898157119751, "global_step": 55064, "epoch": 1311} {"train_loss": -5.790428161621094, "global_step": 55065, "epoch": 1311} {"train_loss": -5.874990463256836, "global_step": 55066, "epoch": 1311} {"train_loss": -5.773710250854492, "global_step": 55067, "epoch": 1311} {"train_loss": -5.800415515899658, "global_step": 55068, "epoch": 1311} {"train_loss": -5.815391540527344, "global_step": 55069, "epoch": 1311} {"train_loss": -5.763797760009766, "global_step": 55070, "epoch": 1311} {"train_loss": -5.793081283569336, "global_step": 55071, "epoch": 1311} {"train_loss": -5.7730207443237305, "global_step": 55072, "epoch": 1311} {"train_loss": -5.960495948791504, "global_step": 55073, "epoch": 1311} {"train_loss": -5.670093536376953, "global_step": 55074, "epoch": 1311} {"train_loss": -5.7525634765625, "global_step": 55075, "epoch": 1311} {"train_loss": -5.887835502624512, "global_step": 55076, "epoch": 1311} {"train_loss": -5.621927738189697, "global_step": 55077, "epoch": 1311} {"train_loss": -5.921231269836426, "global_step": 55078, "epoch": 1311} {"train_loss": -5.815521717071533, "global_step": 55079, "epoch": 1311} {"train_loss": -5.731098651885986, "global_step": 55080, "epoch": 1311} {"train_loss": -5.840404510498047, "global_step": 55081, "epoch": 1311} {"train_loss": -5.716416358947754, "global_step": 55082, "epoch": 1311} {"train_loss": -5.824102878570557, "global_step": 55083, "epoch": 1311} {"train_loss": -5.858527183532715, "global_step": 55084, "epoch": 1311} {"train_loss": -5.723054885864258, "global_step": 55085, "epoch": 1311} {"train_loss": -5.849804878234863, "global_step": 55086, "epoch": 1311} {"train_loss": -5.8504533767700195, "global_step": 55087, "epoch": 1311} {"train_loss": -5.842432022094727, "global_step": 55088, "epoch": 1311} {"train_loss": -5.837066650390625, "global_step": 55089, "epoch": 1311} {"train_loss": -5.853388786315918, "global_step": 55090, "epoch": 1311} {"train_loss": -5.884054660797119, "global_step": 55091, "epoch": 1311} {"train_loss": -5.776546478271484, "global_step": 55092, "epoch": 1311} {"train_loss": -5.852187633514404, "global_step": 55093, "epoch": 1311} {"train_loss": -5.985719680786133, "global_step": 55094, "epoch": 1311} {"train_loss": -5.818811416625977, "global_step": 55095, "epoch": 1311} {"train_loss": -5.951144218444824, "global_step": 55096, "epoch": 1311} {"train_loss": -5.892186164855957, "global_step": 55097, "epoch": 1311} {"train_loss": -5.842575550079346, "global_step": 55098, "epoch": 1311} {"train_loss": -5.8414764404296875, "global_step": 55099, "epoch": 1311} {"train_loss": -5.904472351074219, "global_step": 55100, "epoch": 1311} {"train_loss": -5.89078426361084, "global_step": 55101, "epoch": 1311} {"train_loss": -5.796432018280029, "global_step": 55102, "epoch": 1311} {"train_loss": -5.832232895351591, "global_step": 55103, "epoch": 1311, "val_loss": 61277.9375} {"train_loss": -5.905214786529541, "global_step": 55104, "epoch": 1312} {"train_loss": -5.843210697174072, "global_step": 55105, "epoch": 1312} {"train_loss": -5.806358814239502, "global_step": 55106, "epoch": 1312} {"train_loss": -5.820770263671875, "global_step": 55107, "epoch": 1312} {"train_loss": -5.857686996459961, "global_step": 55108, "epoch": 1312} {"train_loss": -5.842913627624512, "global_step": 55109, "epoch": 1312} {"train_loss": -5.869245529174805, "global_step": 55110, "epoch": 1312} {"train_loss": -6.000240802764893, "global_step": 55111, "epoch": 1312} {"train_loss": -5.848871231079102, "global_step": 55112, "epoch": 1312} {"train_loss": -5.667067527770996, "global_step": 55113, "epoch": 1312} {"train_loss": -5.886209964752197, "global_step": 55114, "epoch": 1312} {"train_loss": -5.871975898742676, "global_step": 55115, "epoch": 1312} {"train_loss": -5.807643890380859, "global_step": 55116, "epoch": 1312} {"train_loss": -5.933823585510254, "global_step": 55117, "epoch": 1312} {"train_loss": -5.769177436828613, "global_step": 55118, "epoch": 1312} {"train_loss": -5.759985446929932, "global_step": 55119, "epoch": 1312} {"train_loss": -5.814884662628174, "global_step": 55120, "epoch": 1312} {"train_loss": -5.846536159515381, "global_step": 55121, "epoch": 1312} {"train_loss": -5.8447771072387695, "global_step": 55122, "epoch": 1312} {"train_loss": -5.827456474304199, "global_step": 55123, "epoch": 1312} {"train_loss": -5.910866737365723, "global_step": 55124, "epoch": 1312} {"train_loss": -5.824594497680664, "global_step": 55125, "epoch": 1312} {"train_loss": -5.819520473480225, "global_step": 55126, "epoch": 1312} {"train_loss": -5.83780574798584, "global_step": 55127, "epoch": 1312} {"train_loss": -5.874072551727295, "global_step": 55128, "epoch": 1312} {"train_loss": -5.805111408233643, "global_step": 55129, "epoch": 1312} {"train_loss": -5.9157185554504395, "global_step": 55130, "epoch": 1312} {"train_loss": -5.81838321685791, "global_step": 55131, "epoch": 1312} {"train_loss": -6.0175981521606445, "global_step": 55132, "epoch": 1312} {"train_loss": -5.9300642013549805, "global_step": 55133, "epoch": 1312} {"train_loss": -5.80415153503418, "global_step": 55134, "epoch": 1312} {"train_loss": -5.823864936828613, "global_step": 55135, "epoch": 1312} {"train_loss": -5.843745231628418, "global_step": 55136, "epoch": 1312} {"train_loss": -5.874463081359863, "global_step": 55137, "epoch": 1312} {"train_loss": -5.817777633666992, "global_step": 55138, "epoch": 1312} {"train_loss": -5.910332679748535, "global_step": 55139, "epoch": 1312} {"train_loss": -5.814988136291504, "global_step": 55140, "epoch": 1312} {"train_loss": -5.971968173980713, "global_step": 55141, "epoch": 1312} {"train_loss": -5.778352737426758, "global_step": 55142, "epoch": 1312} {"train_loss": -5.865279197692871, "global_step": 55143, "epoch": 1312} {"train_loss": -5.9002251625061035, "global_step": 55144, "epoch": 1312} {"train_loss": -5.854145810717628, "global_step": 55145, "epoch": 1312, "val_loss": 61650.32421875} {"train_loss": -5.886378765106201, "global_step": 55146, "epoch": 1313} {"train_loss": -5.743764877319336, "global_step": 55147, "epoch": 1313} {"train_loss": -5.776239395141602, "global_step": 55148, "epoch": 1313} {"train_loss": -5.9436750411987305, "global_step": 55149, "epoch": 1313} {"train_loss": -5.907127380371094, "global_step": 55150, "epoch": 1313} {"train_loss": -5.686734199523926, "global_step": 55151, "epoch": 1313} {"train_loss": -5.889885425567627, "global_step": 55152, "epoch": 1313} {"train_loss": -5.785477638244629, "global_step": 55153, "epoch": 1313} {"train_loss": -5.8202714920043945, "global_step": 55154, "epoch": 1313} {"train_loss": -5.815443992614746, "global_step": 55155, "epoch": 1313} {"train_loss": -5.948485851287842, "global_step": 55156, "epoch": 1313} {"train_loss": -5.934908866882324, "global_step": 55157, "epoch": 1313} {"train_loss": -5.855507850646973, "global_step": 55158, "epoch": 1313} {"train_loss": -5.757743835449219, "global_step": 55159, "epoch": 1313} {"train_loss": -5.7557854652404785, "global_step": 55160, "epoch": 1313} {"train_loss": -5.888023376464844, "global_step": 55161, "epoch": 1313} {"train_loss": -5.796650409698486, "global_step": 55162, "epoch": 1313} {"train_loss": -5.773720741271973, "global_step": 55163, "epoch": 1313} {"train_loss": -5.915955543518066, "global_step": 55164, "epoch": 1313} {"train_loss": -5.8592424392700195, "global_step": 55165, "epoch": 1313} {"train_loss": -5.809337615966797, "global_step": 55166, "epoch": 1313} {"train_loss": -5.842107772827148, "global_step": 55167, "epoch": 1313} {"train_loss": -5.8568572998046875, "global_step": 55168, "epoch": 1313} {"train_loss": -5.82903528213501, "global_step": 55169, "epoch": 1313} {"train_loss": -5.784026145935059, "global_step": 55170, "epoch": 1313} {"train_loss": -5.861139297485352, "global_step": 55171, "epoch": 1313} {"train_loss": -5.6762285232543945, "global_step": 55172, "epoch": 1313} {"train_loss": -6.001032829284668, "global_step": 55173, "epoch": 1313} {"train_loss": -5.928003787994385, "global_step": 55174, "epoch": 1313} {"train_loss": -5.933854103088379, "global_step": 55175, "epoch": 1313} {"train_loss": -5.820207595825195, "global_step": 55176, "epoch": 1313} {"train_loss": -5.920557022094727, "global_step": 55177, "epoch": 1313} {"train_loss": -5.736593246459961, "global_step": 55178, "epoch": 1313} {"train_loss": -5.833367347717285, "global_step": 55179, "epoch": 1313} {"train_loss": -5.8721923828125, "global_step": 55180, "epoch": 1313} {"train_loss": -5.853475570678711, "global_step": 55181, "epoch": 1313} {"train_loss": -5.864030838012695, "global_step": 55182, "epoch": 1313} {"train_loss": -5.743847370147705, "global_step": 55183, "epoch": 1313} {"train_loss": -5.854584217071533, "global_step": 55184, "epoch": 1313} {"train_loss": -5.861298084259033, "global_step": 55185, "epoch": 1313} {"train_loss": -5.844477653503418, "global_step": 55186, "epoch": 1313} {"train_loss": -5.841249658947899, "global_step": 55187, "epoch": 1313, "val_loss": 61287.46875} {"train_loss": -5.953825950622559, "global_step": 55188, "epoch": 1314} {"train_loss": -5.87308406829834, "global_step": 55189, "epoch": 1314} {"train_loss": -5.993047714233398, "global_step": 55190, "epoch": 1314} {"train_loss": -5.8858642578125, "global_step": 55191, "epoch": 1314} {"train_loss": -5.763403415679932, "global_step": 55192, "epoch": 1314} {"train_loss": -5.795293807983398, "global_step": 55193, "epoch": 1314} {"train_loss": -5.865213394165039, "global_step": 55194, "epoch": 1314} {"train_loss": -5.830309867858887, "global_step": 55195, "epoch": 1314} {"train_loss": -5.776730060577393, "global_step": 55196, "epoch": 1314} {"train_loss": -5.706114768981934, "global_step": 55197, "epoch": 1314} {"train_loss": -5.808874607086182, "global_step": 55198, "epoch": 1314} {"train_loss": -5.959307670593262, "global_step": 55199, "epoch": 1314} {"train_loss": -5.887428283691406, "global_step": 55200, "epoch": 1314} {"train_loss": -5.914549350738525, "global_step": 55201, "epoch": 1314} {"train_loss": -5.874276161193848, "global_step": 55202, "epoch": 1314} {"train_loss": -5.83248233795166, "global_step": 55203, "epoch": 1314} {"train_loss": -5.846042633056641, "global_step": 55204, "epoch": 1314} {"train_loss": -5.902978420257568, "global_step": 55205, "epoch": 1314} {"train_loss": -5.8188629150390625, "global_step": 55206, "epoch": 1314} {"train_loss": -5.75314998626709, "global_step": 55207, "epoch": 1314} {"train_loss": -5.857067584991455, "global_step": 55208, "epoch": 1314} {"train_loss": -5.93324613571167, "global_step": 55209, "epoch": 1314} {"train_loss": -5.805733680725098, "global_step": 55210, "epoch": 1314} {"train_loss": -5.795199394226074, "global_step": 55211, "epoch": 1314} {"train_loss": -5.861441612243652, "global_step": 55212, "epoch": 1314} {"train_loss": -5.8375396728515625, "global_step": 55213, "epoch": 1314} {"train_loss": -5.756051063537598, "global_step": 55214, "epoch": 1314} {"train_loss": -5.771466255187988, "global_step": 55215, "epoch": 1314} {"train_loss": -5.69310998916626, "global_step": 55216, "epoch": 1314} {"train_loss": -5.745601177215576, "global_step": 55217, "epoch": 1314} {"train_loss": -5.788041114807129, "global_step": 55218, "epoch": 1314} {"train_loss": -5.854654312133789, "global_step": 55219, "epoch": 1314} {"train_loss": -5.815642356872559, "global_step": 55220, "epoch": 1314} {"train_loss": -5.880675315856934, "global_step": 55221, "epoch": 1314} {"train_loss": -5.906625270843506, "global_step": 55222, "epoch": 1314} {"train_loss": -5.729784965515137, "global_step": 55223, "epoch": 1314} {"train_loss": -6.002008438110352, "global_step": 55224, "epoch": 1314} {"train_loss": -5.859610080718994, "global_step": 55225, "epoch": 1314} {"train_loss": -5.8585100173950195, "global_step": 55226, "epoch": 1314} {"train_loss": -5.875441551208496, "global_step": 55227, "epoch": 1314} {"train_loss": -5.724487781524658, "global_step": 55228, "epoch": 1314} {"train_loss": -5.840855553036644, "global_step": 55229, "epoch": 1314, "val_loss": 61634.9609375} {"train_loss": -5.889762878417969, "global_step": 55230, "epoch": 1315} {"train_loss": -5.764193058013916, "global_step": 55231, "epoch": 1315} {"train_loss": -5.720046043395996, "global_step": 55232, "epoch": 1315} {"train_loss": -5.72346830368042, "global_step": 55233, "epoch": 1315} {"train_loss": -5.7708234786987305, "global_step": 55234, "epoch": 1315} {"train_loss": -5.863243103027344, "global_step": 55235, "epoch": 1315} {"train_loss": -5.8439226150512695, "global_step": 55236, "epoch": 1315} {"train_loss": -5.814837455749512, "global_step": 55237, "epoch": 1315} {"train_loss": -5.875545501708984, "global_step": 55238, "epoch": 1315} {"train_loss": -5.842840194702148, "global_step": 55239, "epoch": 1315} {"train_loss": -5.768069744110107, "global_step": 55240, "epoch": 1315} {"train_loss": -5.886710166931152, "global_step": 55241, "epoch": 1315} {"train_loss": -5.805365562438965, "global_step": 55242, "epoch": 1315} {"train_loss": -5.91339635848999, "global_step": 55243, "epoch": 1315} {"train_loss": -5.806107997894287, "global_step": 55244, "epoch": 1315} {"train_loss": -5.861257553100586, "global_step": 55245, "epoch": 1315} {"train_loss": -5.884417533874512, "global_step": 55246, "epoch": 1315} {"train_loss": -5.87864875793457, "global_step": 55247, "epoch": 1315} {"train_loss": -5.958655834197998, "global_step": 55248, "epoch": 1315} {"train_loss": -5.9303741455078125, "global_step": 55249, "epoch": 1315} {"train_loss": -5.828327178955078, "global_step": 55250, "epoch": 1315} {"train_loss": -5.930266380310059, "global_step": 55251, "epoch": 1315} {"train_loss": -5.756251335144043, "global_step": 55252, "epoch": 1315} {"train_loss": -5.834637641906738, "global_step": 55253, "epoch": 1315} {"train_loss": -5.773578643798828, "global_step": 55254, "epoch": 1315} {"train_loss": -5.801081657409668, "global_step": 55255, "epoch": 1315} {"train_loss": -5.888246536254883, "global_step": 55256, "epoch": 1315} {"train_loss": -5.81265926361084, "global_step": 55257, "epoch": 1315} {"train_loss": -5.853733062744141, "global_step": 55258, "epoch": 1315} {"train_loss": -5.797236442565918, "global_step": 55259, "epoch": 1315} {"train_loss": -5.781121253967285, "global_step": 55260, "epoch": 1315} {"train_loss": -5.93408203125, "global_step": 55261, "epoch": 1315} {"train_loss": -5.859511375427246, "global_step": 55262, "epoch": 1315} {"train_loss": -5.887042045593262, "global_step": 55263, "epoch": 1315} {"train_loss": -5.837787628173828, "global_step": 55264, "epoch": 1315} {"train_loss": -5.826407432556152, "global_step": 55265, "epoch": 1315} {"train_loss": -5.9169816970825195, "global_step": 55266, "epoch": 1315} {"train_loss": -5.897035121917725, "global_step": 55267, "epoch": 1315} {"train_loss": -5.8016676902771, "global_step": 55268, "epoch": 1315} {"train_loss": -5.8383893966674805, "global_step": 55269, "epoch": 1315} {"train_loss": -5.787088394165039, "global_step": 55270, "epoch": 1315} {"train_loss": -5.839293093908401, "global_step": 55271, "epoch": 1315, "val_loss": 61468.359375} {"train_loss": -5.894872665405273, "global_step": 55272, "epoch": 1316} {"train_loss": -5.7862548828125, "global_step": 55273, "epoch": 1316} {"train_loss": -5.784605503082275, "global_step": 55274, "epoch": 1316} {"train_loss": -5.991666793823242, "global_step": 55275, "epoch": 1316} {"train_loss": -5.9386067390441895, "global_step": 55276, "epoch": 1316} {"train_loss": -5.8411078453063965, "global_step": 55277, "epoch": 1316} {"train_loss": -5.964086532592773, "global_step": 55278, "epoch": 1316} {"train_loss": -5.774509906768799, "global_step": 55279, "epoch": 1316} {"train_loss": -5.869063377380371, "global_step": 55280, "epoch": 1316} {"train_loss": -5.858650207519531, "global_step": 55281, "epoch": 1316} {"train_loss": -5.795627593994141, "global_step": 55282, "epoch": 1316} {"train_loss": -5.749952793121338, "global_step": 55283, "epoch": 1316} {"train_loss": -5.795806884765625, "global_step": 55284, "epoch": 1316} {"train_loss": -5.796961784362793, "global_step": 55285, "epoch": 1316} {"train_loss": -5.728951454162598, "global_step": 55286, "epoch": 1316} {"train_loss": -5.715400695800781, "global_step": 55287, "epoch": 1316} {"train_loss": -5.710594654083252, "global_step": 55288, "epoch": 1316} {"train_loss": -5.724936485290527, "global_step": 55289, "epoch": 1316} {"train_loss": -5.8595757484436035, "global_step": 55290, "epoch": 1316} {"train_loss": -5.711344242095947, "global_step": 55291, "epoch": 1316} {"train_loss": -5.828390121459961, "global_step": 55292, "epoch": 1316} {"train_loss": -5.706757068634033, "global_step": 55293, "epoch": 1316} {"train_loss": -5.787013053894043, "global_step": 55294, "epoch": 1316} {"train_loss": -5.8377885818481445, "global_step": 55295, "epoch": 1316} {"train_loss": -5.8672776222229, "global_step": 55296, "epoch": 1316} {"train_loss": -5.791290760040283, "global_step": 55297, "epoch": 1316} {"train_loss": -5.782886981964111, "global_step": 55298, "epoch": 1316} {"train_loss": -5.909598350524902, "global_step": 55299, "epoch": 1316} {"train_loss": -5.835615158081055, "global_step": 55300, "epoch": 1316} {"train_loss": -5.808773994445801, "global_step": 55301, "epoch": 1316} {"train_loss": -5.852156639099121, "global_step": 55302, "epoch": 1316} {"train_loss": -5.799483299255371, "global_step": 55303, "epoch": 1316} {"train_loss": -5.866369247436523, "global_step": 55304, "epoch": 1316} {"train_loss": -5.806880474090576, "global_step": 55305, "epoch": 1316} {"train_loss": -5.804619789123535, "global_step": 55306, "epoch": 1316} {"train_loss": -5.803864479064941, "global_step": 55307, "epoch": 1316} {"train_loss": -5.773438930511475, "global_step": 55308, "epoch": 1316} {"train_loss": -5.813279151916504, "global_step": 55309, "epoch": 1316} {"train_loss": -5.805417060852051, "global_step": 55310, "epoch": 1316} {"train_loss": -5.792839050292969, "global_step": 55311, "epoch": 1316} {"train_loss": -5.849403381347656, "global_step": 55312, "epoch": 1316} {"train_loss": -5.817027069273449, "global_step": 55313, "epoch": 1316, "val_loss": 61494.1953125} {"train_loss": -5.970398902893066, "global_step": 55314, "epoch": 1317} {"train_loss": -5.800415992736816, "global_step": 55315, "epoch": 1317} {"train_loss": -5.734179973602295, "global_step": 55316, "epoch": 1317} {"train_loss": -5.920483112335205, "global_step": 55317, "epoch": 1317} {"train_loss": -5.89085578918457, "global_step": 55318, "epoch": 1317} {"train_loss": -5.7971343994140625, "global_step": 55319, "epoch": 1317} {"train_loss": -5.9243364334106445, "global_step": 55320, "epoch": 1317} {"train_loss": -5.824767589569092, "global_step": 55321, "epoch": 1317} {"train_loss": -5.821826457977295, "global_step": 55322, "epoch": 1317} {"train_loss": -5.8233323097229, "global_step": 55323, "epoch": 1317} {"train_loss": -5.799286842346191, "global_step": 55324, "epoch": 1317} {"train_loss": -5.898015022277832, "global_step": 55325, "epoch": 1317} {"train_loss": -5.831040382385254, "global_step": 55326, "epoch": 1317} {"train_loss": -5.743710517883301, "global_step": 55327, "epoch": 1317} {"train_loss": -5.860727787017822, "global_step": 55328, "epoch": 1317} {"train_loss": -5.760692596435547, "global_step": 55329, "epoch": 1317} {"train_loss": -5.704070091247559, "global_step": 55330, "epoch": 1317} {"train_loss": -5.8096923828125, "global_step": 55331, "epoch": 1317} {"train_loss": -5.808056831359863, "global_step": 55332, "epoch": 1317} {"train_loss": -5.730489253997803, "global_step": 55333, "epoch": 1317} {"train_loss": -5.773309707641602, "global_step": 55334, "epoch": 1317} {"train_loss": -5.767496109008789, "global_step": 55335, "epoch": 1317} {"train_loss": -5.8875579833984375, "global_step": 55336, "epoch": 1317} {"train_loss": -5.816614151000977, "global_step": 55337, "epoch": 1317} {"train_loss": -5.725526332855225, "global_step": 55338, "epoch": 1317} {"train_loss": -5.791568756103516, "global_step": 55339, "epoch": 1317} {"train_loss": -5.708775997161865, "global_step": 55340, "epoch": 1317} {"train_loss": -5.843788146972656, "global_step": 55341, "epoch": 1317} {"train_loss": -5.700331687927246, "global_step": 55342, "epoch": 1317} {"train_loss": -5.807821273803711, "global_step": 55343, "epoch": 1317} {"train_loss": -5.816805362701416, "global_step": 55344, "epoch": 1317} {"train_loss": -5.7598419189453125, "global_step": 55345, "epoch": 1317} {"train_loss": -5.8465728759765625, "global_step": 55346, "epoch": 1317} {"train_loss": -5.848447799682617, "global_step": 55347, "epoch": 1317} {"train_loss": -5.816262722015381, "global_step": 55348, "epoch": 1317} {"train_loss": -5.823261737823486, "global_step": 55349, "epoch": 1317} {"train_loss": -5.827004432678223, "global_step": 55350, "epoch": 1317} {"train_loss": -5.674272537231445, "global_step": 55351, "epoch": 1317} {"train_loss": -5.750763893127441, "global_step": 55352, "epoch": 1317} {"train_loss": -5.708270072937012, "global_step": 55353, "epoch": 1317} {"train_loss": -5.9034223556518555, "global_step": 55354, "epoch": 1317} {"train_loss": -5.807828551247006, "global_step": 55355, "epoch": 1317, "val_loss": 61678.390625} {"train_loss": -5.736674785614014, "global_step": 55356, "epoch": 1318} {"train_loss": -5.785243511199951, "global_step": 55357, "epoch": 1318} {"train_loss": -5.77862548828125, "global_step": 55358, "epoch": 1318} {"train_loss": -5.8372979164123535, "global_step": 55359, "epoch": 1318} {"train_loss": -5.697866916656494, "global_step": 55360, "epoch": 1318} {"train_loss": -5.7968292236328125, "global_step": 55361, "epoch": 1318} {"train_loss": -5.769559383392334, "global_step": 55362, "epoch": 1318} {"train_loss": -5.859302520751953, "global_step": 55363, "epoch": 1318} {"train_loss": -5.845523834228516, "global_step": 55364, "epoch": 1318} {"train_loss": -5.788619041442871, "global_step": 55365, "epoch": 1318} {"train_loss": -5.8600006103515625, "global_step": 55366, "epoch": 1318} {"train_loss": -5.771061897277832, "global_step": 55367, "epoch": 1318} {"train_loss": -5.778685569763184, "global_step": 55368, "epoch": 1318} {"train_loss": -5.935719013214111, "global_step": 55369, "epoch": 1318} {"train_loss": -5.654097080230713, "global_step": 55370, "epoch": 1318} {"train_loss": -5.848277568817139, "global_step": 55371, "epoch": 1318} {"train_loss": -5.807393550872803, "global_step": 55372, "epoch": 1318} {"train_loss": -5.870595932006836, "global_step": 55373, "epoch": 1318} {"train_loss": -5.815754413604736, "global_step": 55374, "epoch": 1318} {"train_loss": -5.8139801025390625, "global_step": 55375, "epoch": 1318} {"train_loss": -5.864496231079102, "global_step": 55376, "epoch": 1318} {"train_loss": -5.812573432922363, "global_step": 55377, "epoch": 1318} {"train_loss": -5.910369873046875, "global_step": 55378, "epoch": 1318} {"train_loss": -5.827885627746582, "global_step": 55379, "epoch": 1318} {"train_loss": -5.749877452850342, "global_step": 55380, "epoch": 1318} {"train_loss": -5.778160572052002, "global_step": 55381, "epoch": 1318} {"train_loss": -5.912057876586914, "global_step": 55382, "epoch": 1318} {"train_loss": -5.859452247619629, "global_step": 55383, "epoch": 1318} {"train_loss": -5.86807918548584, "global_step": 55384, "epoch": 1318} {"train_loss": -5.89780330657959, "global_step": 55385, "epoch": 1318} {"train_loss": -5.804391384124756, "global_step": 55386, "epoch": 1318} {"train_loss": -5.937219142913818, "global_step": 55387, "epoch": 1318} {"train_loss": -5.866072654724121, "global_step": 55388, "epoch": 1318} {"train_loss": -5.918892860412598, "global_step": 55389, "epoch": 1318} {"train_loss": -5.857173442840576, "global_step": 55390, "epoch": 1318} {"train_loss": -5.912071228027344, "global_step": 55391, "epoch": 1318} {"train_loss": -5.79465389251709, "global_step": 55392, "epoch": 1318} {"train_loss": -5.681008815765381, "global_step": 55393, "epoch": 1318} {"train_loss": -5.98590087890625, "global_step": 55394, "epoch": 1318} {"train_loss": -6.012127876281738, "global_step": 55395, "epoch": 1318} {"train_loss": -5.796383857727051, "global_step": 55396, "epoch": 1318} {"train_loss": -5.832055909293039, "global_step": 55397, "epoch": 1318, "val_loss": 61306.73046875} {"train_loss": -5.8498687744140625, "global_step": 55398, "epoch": 1319} {"train_loss": -5.962309837341309, "global_step": 55399, "epoch": 1319} {"train_loss": -5.820441246032715, "global_step": 55400, "epoch": 1319} {"train_loss": -5.834986686706543, "global_step": 55401, "epoch": 1319} {"train_loss": -5.8483076095581055, "global_step": 55402, "epoch": 1319} {"train_loss": -5.689250946044922, "global_step": 55403, "epoch": 1319} {"train_loss": -5.785168647766113, "global_step": 55404, "epoch": 1319} {"train_loss": -5.808954238891602, "global_step": 55405, "epoch": 1319} {"train_loss": -5.810092926025391, "global_step": 55406, "epoch": 1319} {"train_loss": -5.893816947937012, "global_step": 55407, "epoch": 1319} {"train_loss": -5.849459171295166, "global_step": 55408, "epoch": 1319} {"train_loss": -5.9135894775390625, "global_step": 55409, "epoch": 1319} {"train_loss": -5.947262763977051, "global_step": 55410, "epoch": 1319} {"train_loss": -5.871821880340576, "global_step": 55411, "epoch": 1319} {"train_loss": -5.794254779815674, "global_step": 55412, "epoch": 1319} {"train_loss": -5.808145999908447, "global_step": 55413, "epoch": 1319} {"train_loss": -5.8967485427856445, "global_step": 55414, "epoch": 1319} {"train_loss": -5.9055633544921875, "global_step": 55415, "epoch": 1319} {"train_loss": -5.921968460083008, "global_step": 55416, "epoch": 1319} {"train_loss": -5.794780731201172, "global_step": 55417, "epoch": 1319} {"train_loss": -5.797455787658691, "global_step": 55418, "epoch": 1319} {"train_loss": -5.838119029998779, "global_step": 55419, "epoch": 1319} {"train_loss": -5.8313069343566895, "global_step": 55420, "epoch": 1319} {"train_loss": -5.913784027099609, "global_step": 55421, "epoch": 1319} {"train_loss": -5.913015365600586, "global_step": 55422, "epoch": 1319} {"train_loss": -5.69191312789917, "global_step": 55423, "epoch": 1319} {"train_loss": -5.791428089141846, "global_step": 55424, "epoch": 1319} {"train_loss": -5.786216735839844, "global_step": 55425, "epoch": 1319} {"train_loss": -5.9394731521606445, "global_step": 55426, "epoch": 1319} {"train_loss": -5.830875396728516, "global_step": 55427, "epoch": 1319} {"train_loss": -5.873867511749268, "global_step": 55428, "epoch": 1319} {"train_loss": -5.750065326690674, "global_step": 55429, "epoch": 1319} {"train_loss": -5.809535503387451, "global_step": 55430, "epoch": 1319} {"train_loss": -5.714107513427734, "global_step": 55431, "epoch": 1319} {"train_loss": -5.857904434204102, "global_step": 55432, "epoch": 1319} {"train_loss": -5.792089939117432, "global_step": 55433, "epoch": 1319} {"train_loss": -5.788884162902832, "global_step": 55434, "epoch": 1319} {"train_loss": -5.78652811050415, "global_step": 55435, "epoch": 1319} {"train_loss": -5.947227478027344, "global_step": 55436, "epoch": 1319} {"train_loss": -5.804272651672363, "global_step": 55437, "epoch": 1319} {"train_loss": -5.832517147064209, "global_step": 55438, "epoch": 1319} {"train_loss": -5.837654726845877, "global_step": 55439, "epoch": 1319, "val_loss": 61273.36328125} {"train_loss": -5.8354010581970215, "global_step": 55440, "epoch": 1320} {"train_loss": -5.832536697387695, "global_step": 55441, "epoch": 1320} {"train_loss": -5.73698091506958, "global_step": 55442, "epoch": 1320} {"train_loss": -5.846972465515137, "global_step": 55443, "epoch": 1320} {"train_loss": -5.861324310302734, "global_step": 55444, "epoch": 1320} {"train_loss": -5.736944198608398, "global_step": 55445, "epoch": 1320} {"train_loss": -5.884474277496338, "global_step": 55446, "epoch": 1320} {"train_loss": -5.769031524658203, "global_step": 55447, "epoch": 1320} {"train_loss": -5.8495025634765625, "global_step": 55448, "epoch": 1320} {"train_loss": -5.952053070068359, "global_step": 55449, "epoch": 1320} {"train_loss": -5.879554748535156, "global_step": 55450, "epoch": 1320} {"train_loss": -5.790036201477051, "global_step": 55451, "epoch": 1320} {"train_loss": -5.80642557144165, "global_step": 55452, "epoch": 1320} {"train_loss": -5.926936626434326, "global_step": 55453, "epoch": 1320} {"train_loss": -5.7903289794921875, "global_step": 55454, "epoch": 1320} {"train_loss": -5.798634052276611, "global_step": 55455, "epoch": 1320} {"train_loss": -5.855384349822998, "global_step": 55456, "epoch": 1320} {"train_loss": -5.753492832183838, "global_step": 55457, "epoch": 1320} {"train_loss": -5.762397289276123, "global_step": 55458, "epoch": 1320} {"train_loss": -5.79923677444458, "global_step": 55459, "epoch": 1320} {"train_loss": -5.843764781951904, "global_step": 55460, "epoch": 1320} {"train_loss": -5.796263694763184, "global_step": 55461, "epoch": 1320} {"train_loss": -5.783729553222656, "global_step": 55462, "epoch": 1320} {"train_loss": -5.867196083068848, "global_step": 55463, "epoch": 1320} {"train_loss": -5.766908645629883, "global_step": 55464, "epoch": 1320} {"train_loss": -5.84024715423584, "global_step": 55465, "epoch": 1320} {"train_loss": -5.814952850341797, "global_step": 55466, "epoch": 1320} {"train_loss": -5.788689613342285, "global_step": 55467, "epoch": 1320} {"train_loss": -5.868555545806885, "global_step": 55468, "epoch": 1320} {"train_loss": -5.971063613891602, "global_step": 55469, "epoch": 1320} {"train_loss": -5.958274841308594, "global_step": 55470, "epoch": 1320} {"train_loss": -5.919978141784668, "global_step": 55471, "epoch": 1320} {"train_loss": -5.776631832122803, "global_step": 55472, "epoch": 1320} {"train_loss": -5.877566337585449, "global_step": 55473, "epoch": 1320} {"train_loss": -5.820443153381348, "global_step": 55474, "epoch": 1320} {"train_loss": -5.796854019165039, "global_step": 55475, "epoch": 1320} {"train_loss": -5.754945755004883, "global_step": 55476, "epoch": 1320} {"train_loss": -5.847352027893066, "global_step": 55477, "epoch": 1320} {"train_loss": -5.842171669006348, "global_step": 55478, "epoch": 1320} {"train_loss": -5.665066242218018, "global_step": 55479, "epoch": 1320} {"train_loss": -5.700908184051514, "global_step": 55480, "epoch": 1320} {"train_loss": -5.822127557936168, "global_step": 55481, "epoch": 1320, "val_loss": 61044.2421875} {"train_loss": -5.882284164428711, "global_step": 55482, "epoch": 1321} {"train_loss": -5.90694522857666, "global_step": 55483, "epoch": 1321} {"train_loss": -5.898103713989258, "global_step": 55484, "epoch": 1321} {"train_loss": -5.839086532592773, "global_step": 55485, "epoch": 1321} {"train_loss": -5.898995399475098, "global_step": 55486, "epoch": 1321} {"train_loss": -5.92168664932251, "global_step": 55487, "epoch": 1321} {"train_loss": -5.674834728240967, "global_step": 55488, "epoch": 1321} {"train_loss": -5.863195896148682, "global_step": 55489, "epoch": 1321} {"train_loss": -5.723638534545898, "global_step": 55490, "epoch": 1321} {"train_loss": -5.772444725036621, "global_step": 55491, "epoch": 1321} {"train_loss": -5.802817344665527, "global_step": 55492, "epoch": 1321} {"train_loss": -5.839690685272217, "global_step": 55493, "epoch": 1321} {"train_loss": -5.826971054077148, "global_step": 55494, "epoch": 1321} {"train_loss": -5.7290449142456055, "global_step": 55495, "epoch": 1321} {"train_loss": -5.844831943511963, "global_step": 55496, "epoch": 1321} {"train_loss": -5.902548789978027, "global_step": 55497, "epoch": 1321} {"train_loss": -5.798811912536621, "global_step": 55498, "epoch": 1321} {"train_loss": -5.841499328613281, "global_step": 55499, "epoch": 1321} {"train_loss": -5.843520164489746, "global_step": 55500, "epoch": 1321} {"train_loss": -5.799315929412842, "global_step": 55501, "epoch": 1321} {"train_loss": -5.895583152770996, "global_step": 55502, "epoch": 1321} {"train_loss": -5.8632659912109375, "global_step": 55503, "epoch": 1321} {"train_loss": -5.823521614074707, "global_step": 55504, "epoch": 1321} {"train_loss": -5.862185001373291, "global_step": 55505, "epoch": 1321} {"train_loss": -5.891963958740234, "global_step": 55506, "epoch": 1321} {"train_loss": -5.875956058502197, "global_step": 55507, "epoch": 1321} {"train_loss": -5.852718353271484, "global_step": 55508, "epoch": 1321} {"train_loss": -5.875024318695068, "global_step": 55509, "epoch": 1321} {"train_loss": -5.878940105438232, "global_step": 55510, "epoch": 1321} {"train_loss": -5.925180435180664, "global_step": 55511, "epoch": 1321} {"train_loss": -5.8695878982543945, "global_step": 55512, "epoch": 1321} {"train_loss": -5.751330852508545, "global_step": 55513, "epoch": 1321} {"train_loss": -5.933950424194336, "global_step": 55514, "epoch": 1321} {"train_loss": -5.764156818389893, "global_step": 55515, "epoch": 1321} {"train_loss": -5.860569953918457, "global_step": 55516, "epoch": 1321} {"train_loss": -5.906400680541992, "global_step": 55517, "epoch": 1321} {"train_loss": -5.760251522064209, "global_step": 55518, "epoch": 1321} {"train_loss": -5.920385360717773, "global_step": 55519, "epoch": 1321} {"train_loss": -5.848672866821289, "global_step": 55520, "epoch": 1321} {"train_loss": -5.996476173400879, "global_step": 55521, "epoch": 1321} {"train_loss": -5.809174537658691, "global_step": 55522, "epoch": 1321} {"train_loss": -5.846713270459857, "global_step": 55523, "epoch": 1321, "val_loss": 61248.015625} {"train_loss": -5.914155960083008, "global_step": 55524, "epoch": 1322} {"train_loss": -5.835572242736816, "global_step": 55525, "epoch": 1322} {"train_loss": -5.981742858886719, "global_step": 55526, "epoch": 1322} {"train_loss": -5.788514614105225, "global_step": 55527, "epoch": 1322} {"train_loss": -5.883641719818115, "global_step": 55528, "epoch": 1322} {"train_loss": -5.804464340209961, "global_step": 55529, "epoch": 1322} {"train_loss": -5.8882598876953125, "global_step": 55530, "epoch": 1322} {"train_loss": -6.036959171295166, "global_step": 55531, "epoch": 1322} {"train_loss": -5.8416829109191895, "global_step": 55532, "epoch": 1322} {"train_loss": -5.740903377532959, "global_step": 55533, "epoch": 1322} {"train_loss": -5.851882457733154, "global_step": 55534, "epoch": 1322} {"train_loss": -5.7473039627075195, "global_step": 55535, "epoch": 1322} {"train_loss": -5.808745384216309, "global_step": 55536, "epoch": 1322} {"train_loss": -5.752319812774658, "global_step": 55537, "epoch": 1322} {"train_loss": -5.8398637771606445, "global_step": 55538, "epoch": 1322} {"train_loss": -5.919661045074463, "global_step": 55539, "epoch": 1322} {"train_loss": -5.838663101196289, "global_step": 55540, "epoch": 1322} {"train_loss": -5.846656799316406, "global_step": 55541, "epoch": 1322} {"train_loss": -5.790520191192627, "global_step": 55542, "epoch": 1322} {"train_loss": -5.936800479888916, "global_step": 55543, "epoch": 1322} {"train_loss": -5.922422409057617, "global_step": 55544, "epoch": 1322} {"train_loss": -5.803433418273926, "global_step": 55545, "epoch": 1322} {"train_loss": -5.926042556762695, "global_step": 55546, "epoch": 1322} {"train_loss": -5.783243179321289, "global_step": 55547, "epoch": 1322} {"train_loss": -5.864164352416992, "global_step": 55548, "epoch": 1322} {"train_loss": -6.059311866760254, "global_step": 55549, "epoch": 1322} {"train_loss": -5.920976638793945, "global_step": 55550, "epoch": 1322} {"train_loss": -5.8268537521362305, "global_step": 55551, "epoch": 1322} {"train_loss": -5.714345455169678, "global_step": 55552, "epoch": 1322} {"train_loss": -5.843914985656738, "global_step": 55553, "epoch": 1322} {"train_loss": -5.887538433074951, "global_step": 55554, "epoch": 1322} {"train_loss": -5.816925048828125, "global_step": 55555, "epoch": 1322} {"train_loss": -5.891148567199707, "global_step": 55556, "epoch": 1322} {"train_loss": -5.894819259643555, "global_step": 55557, "epoch": 1322} {"train_loss": -5.910062789916992, "global_step": 55558, "epoch": 1322} {"train_loss": -5.8960442543029785, "global_step": 55559, "epoch": 1322} {"train_loss": -5.635295391082764, "global_step": 55560, "epoch": 1322} {"train_loss": -5.851600646972656, "global_step": 55561, "epoch": 1322} {"train_loss": -5.7193684577941895, "global_step": 55562, "epoch": 1322} {"train_loss": -5.904315948486328, "global_step": 55563, "epoch": 1322} {"train_loss": -5.722397327423096, "global_step": 55564, "epoch": 1322} {"train_loss": -5.848537751606533, "global_step": 55565, "epoch": 1322, "val_loss": 61455.71875} {"train_loss": -5.804225921630859, "global_step": 55566, "epoch": 1323} {"train_loss": -5.783306121826172, "global_step": 55567, "epoch": 1323} {"train_loss": -5.813819885253906, "global_step": 55568, "epoch": 1323} {"train_loss": -5.813365936279297, "global_step": 55569, "epoch": 1323} {"train_loss": -5.777871131896973, "global_step": 55570, "epoch": 1323} {"train_loss": -5.860739231109619, "global_step": 55571, "epoch": 1323} {"train_loss": -5.80814266204834, "global_step": 55572, "epoch": 1323} {"train_loss": -5.729823112487793, "global_step": 55573, "epoch": 1323} {"train_loss": -5.828310489654541, "global_step": 55574, "epoch": 1323} {"train_loss": -5.805087089538574, "global_step": 55575, "epoch": 1323} {"train_loss": -5.701221466064453, "global_step": 55576, "epoch": 1323} {"train_loss": -5.8103179931640625, "global_step": 55577, "epoch": 1323} {"train_loss": -5.838665962219238, "global_step": 55578, "epoch": 1323} {"train_loss": -5.943109512329102, "global_step": 55579, "epoch": 1323} {"train_loss": -5.696896076202393, "global_step": 55580, "epoch": 1323} {"train_loss": -5.848459243774414, "global_step": 55581, "epoch": 1323} {"train_loss": -5.70920991897583, "global_step": 55582, "epoch": 1323} {"train_loss": -5.680273056030273, "global_step": 55583, "epoch": 1323} {"train_loss": -5.818179130554199, "global_step": 55584, "epoch": 1323} {"train_loss": -5.641289710998535, "global_step": 55585, "epoch": 1323} {"train_loss": -5.782769680023193, "global_step": 55586, "epoch": 1323} {"train_loss": -5.740952014923096, "global_step": 55587, "epoch": 1323} {"train_loss": -5.684906959533691, "global_step": 55588, "epoch": 1323} {"train_loss": -5.806476593017578, "global_step": 55589, "epoch": 1323} {"train_loss": -5.815460205078125, "global_step": 55590, "epoch": 1323} {"train_loss": -5.7820539474487305, "global_step": 55591, "epoch": 1323} {"train_loss": -5.881739616394043, "global_step": 55592, "epoch": 1323} {"train_loss": -5.795989513397217, "global_step": 55593, "epoch": 1323} {"train_loss": -5.744978904724121, "global_step": 55594, "epoch": 1323} {"train_loss": -5.838356971740723, "global_step": 55595, "epoch": 1323} {"train_loss": -5.832815170288086, "global_step": 55596, "epoch": 1323} {"train_loss": -6.01979398727417, "global_step": 55597, "epoch": 1323} {"train_loss": -5.897292137145996, "global_step": 55598, "epoch": 1323} {"train_loss": -5.771202087402344, "global_step": 55599, "epoch": 1323} {"train_loss": -5.928609848022461, "global_step": 55600, "epoch": 1323} {"train_loss": -5.847757339477539, "global_step": 55601, "epoch": 1323} {"train_loss": -5.968637466430664, "global_step": 55602, "epoch": 1323} {"train_loss": -5.924398422241211, "global_step": 55603, "epoch": 1323} {"train_loss": -5.837558269500732, "global_step": 55604, "epoch": 1323} {"train_loss": -5.965161323547363, "global_step": 55605, "epoch": 1323} {"train_loss": -5.8329057693481445, "global_step": 55606, "epoch": 1323} {"train_loss": -5.815322353726342, "global_step": 55607, "epoch": 1323, "val_loss": 61535.64453125} {"train_loss": -5.816231727600098, "global_step": 55608, "epoch": 1324} {"train_loss": -5.772311210632324, "global_step": 55609, "epoch": 1324} {"train_loss": -5.862823963165283, "global_step": 55610, "epoch": 1324} {"train_loss": -5.932898998260498, "global_step": 55611, "epoch": 1324} {"train_loss": -6.005301475524902, "global_step": 55612, "epoch": 1324} {"train_loss": -5.928572654724121, "global_step": 55613, "epoch": 1324} {"train_loss": -5.80891752243042, "global_step": 55614, "epoch": 1324} {"train_loss": -5.686061382293701, "global_step": 55615, "epoch": 1324} {"train_loss": -5.874018669128418, "global_step": 55616, "epoch": 1324} {"train_loss": -5.8230061531066895, "global_step": 55617, "epoch": 1324} {"train_loss": -5.947971343994141, "global_step": 55618, "epoch": 1324} {"train_loss": -5.834198474884033, "global_step": 55619, "epoch": 1324} {"train_loss": -5.862406253814697, "global_step": 55620, "epoch": 1324} {"train_loss": -5.8979620933532715, "global_step": 55621, "epoch": 1324} {"train_loss": -5.8549394607543945, "global_step": 55622, "epoch": 1324} {"train_loss": -5.880525588989258, "global_step": 55623, "epoch": 1324} {"train_loss": -5.946194648742676, "global_step": 55624, "epoch": 1324} {"train_loss": -5.901711463928223, "global_step": 55625, "epoch": 1324} {"train_loss": -5.92366886138916, "global_step": 55626, "epoch": 1324} {"train_loss": -5.835694313049316, "global_step": 55627, "epoch": 1324} {"train_loss": -5.870534420013428, "global_step": 55628, "epoch": 1324} {"train_loss": -5.825955390930176, "global_step": 55629, "epoch": 1324} {"train_loss": -5.82188606262207, "global_step": 55630, "epoch": 1324} {"train_loss": -5.910785675048828, "global_step": 55631, "epoch": 1324} {"train_loss": -5.807676792144775, "global_step": 55632, "epoch": 1324} {"train_loss": -5.689871788024902, "global_step": 55633, "epoch": 1324} {"train_loss": -5.904284477233887, "global_step": 55634, "epoch": 1324} {"train_loss": -5.855927467346191, "global_step": 55635, "epoch": 1324} {"train_loss": -5.82480525970459, "global_step": 55636, "epoch": 1324} {"train_loss": -5.851499080657959, "global_step": 55637, "epoch": 1324} {"train_loss": -5.826729774475098, "global_step": 55638, "epoch": 1324} {"train_loss": -5.794078826904297, "global_step": 55639, "epoch": 1324} {"train_loss": -5.877894401550293, "global_step": 55640, "epoch": 1324} {"train_loss": -5.745515823364258, "global_step": 55641, "epoch": 1324} {"train_loss": -5.722090244293213, "global_step": 55642, "epoch": 1324} {"train_loss": -5.905186176300049, "global_step": 55643, "epoch": 1324} {"train_loss": -5.778108596801758, "global_step": 55644, "epoch": 1324} {"train_loss": -5.789923191070557, "global_step": 55645, "epoch": 1324} {"train_loss": -5.8148274421691895, "global_step": 55646, "epoch": 1324} {"train_loss": -5.909048080444336, "global_step": 55647, "epoch": 1324} {"train_loss": -5.649781227111816, "global_step": 55648, "epoch": 1324} {"train_loss": -5.844050498235793, "global_step": 55649, "epoch": 1324, "val_loss": 61327.65234375} {"train_loss": -5.783356666564941, "global_step": 55650, "epoch": 1325} {"train_loss": -5.715557098388672, "global_step": 55651, "epoch": 1325} {"train_loss": -5.720196723937988, "global_step": 55652, "epoch": 1325} {"train_loss": -5.709362030029297, "global_step": 55653, "epoch": 1325} {"train_loss": -5.835559844970703, "global_step": 55654, "epoch": 1325} {"train_loss": -5.917494773864746, "global_step": 55655, "epoch": 1325} {"train_loss": -5.892297744750977, "global_step": 55656, "epoch": 1325} {"train_loss": -5.803120136260986, "global_step": 55657, "epoch": 1325} {"train_loss": -5.80165958404541, "global_step": 55658, "epoch": 1325} {"train_loss": -5.857579231262207, "global_step": 55659, "epoch": 1325} {"train_loss": -5.770798683166504, "global_step": 55660, "epoch": 1325} {"train_loss": -5.8744096755981445, "global_step": 55661, "epoch": 1325} {"train_loss": -5.901434421539307, "global_step": 55662, "epoch": 1325} {"train_loss": -5.76619815826416, "global_step": 55663, "epoch": 1325} {"train_loss": -5.906983375549316, "global_step": 55664, "epoch": 1325} {"train_loss": -5.831301689147949, "global_step": 55665, "epoch": 1325} {"train_loss": -5.85666036605835, "global_step": 55666, "epoch": 1325} {"train_loss": -5.857295036315918, "global_step": 55667, "epoch": 1325} {"train_loss": -5.842007637023926, "global_step": 55668, "epoch": 1325} {"train_loss": -5.92808723449707, "global_step": 55669, "epoch": 1325} {"train_loss": -5.866239070892334, "global_step": 55670, "epoch": 1325} {"train_loss": -5.74981689453125, "global_step": 55671, "epoch": 1325} {"train_loss": -5.85139274597168, "global_step": 55672, "epoch": 1325} {"train_loss": -5.762642860412598, "global_step": 55673, "epoch": 1325} {"train_loss": -5.8174896240234375, "global_step": 55674, "epoch": 1325} {"train_loss": -5.936487197875977, "global_step": 55675, "epoch": 1325} {"train_loss": -5.865653991699219, "global_step": 55676, "epoch": 1325} {"train_loss": -5.938819885253906, "global_step": 55677, "epoch": 1325} {"train_loss": -5.935622692108154, "global_step": 55678, "epoch": 1325} {"train_loss": -5.853987693786621, "global_step": 55679, "epoch": 1325} {"train_loss": -5.945860862731934, "global_step": 55680, "epoch": 1325} {"train_loss": -5.928342819213867, "global_step": 55681, "epoch": 1325} {"train_loss": -5.788963794708252, "global_step": 55682, "epoch": 1325} {"train_loss": -5.793147563934326, "global_step": 55683, "epoch": 1325} {"train_loss": -5.888534069061279, "global_step": 55684, "epoch": 1325} {"train_loss": -5.735416889190674, "global_step": 55685, "epoch": 1325} {"train_loss": -5.795281887054443, "global_step": 55686, "epoch": 1325} {"train_loss": -5.781219482421875, "global_step": 55687, "epoch": 1325} {"train_loss": -5.782958507537842, "global_step": 55688, "epoch": 1325} {"train_loss": -5.830896377563477, "global_step": 55689, "epoch": 1325} {"train_loss": -5.936493873596191, "global_step": 55690, "epoch": 1325} {"train_loss": -5.8392600899650935, "global_step": 55691, "epoch": 1325, "val_loss": 61361.6875} {"train_loss": -5.956376552581787, "global_step": 55692, "epoch": 1326} {"train_loss": -5.800074100494385, "global_step": 55693, "epoch": 1326} {"train_loss": -6.0375823974609375, "global_step": 55694, "epoch": 1326} {"train_loss": -5.896726608276367, "global_step": 55695, "epoch": 1326} {"train_loss": -5.828758239746094, "global_step": 55696, "epoch": 1326} {"train_loss": -5.865306854248047, "global_step": 55697, "epoch": 1326} {"train_loss": -5.924161911010742, "global_step": 55698, "epoch": 1326} {"train_loss": -5.835423469543457, "global_step": 55699, "epoch": 1326} {"train_loss": -5.844631195068359, "global_step": 55700, "epoch": 1326} {"train_loss": -5.799825668334961, "global_step": 55701, "epoch": 1326} {"train_loss": -5.714443206787109, "global_step": 55702, "epoch": 1326} {"train_loss": -5.92973518371582, "global_step": 55703, "epoch": 1326} {"train_loss": -5.888918876647949, "global_step": 55704, "epoch": 1326} {"train_loss": -5.802309989929199, "global_step": 55705, "epoch": 1326} {"train_loss": -5.879034519195557, "global_step": 55706, "epoch": 1326} {"train_loss": -5.765851020812988, "global_step": 55707, "epoch": 1326} {"train_loss": -5.976723670959473, "global_step": 55708, "epoch": 1326} {"train_loss": -5.893311500549316, "global_step": 55709, "epoch": 1326} {"train_loss": -5.805486679077148, "global_step": 55710, "epoch": 1326} {"train_loss": -5.821759223937988, "global_step": 55711, "epoch": 1326} {"train_loss": -5.7852888107299805, "global_step": 55712, "epoch": 1326} {"train_loss": -5.967167854309082, "global_step": 55713, "epoch": 1326} {"train_loss": -5.865285873413086, "global_step": 55714, "epoch": 1326} {"train_loss": -5.91853666305542, "global_step": 55715, "epoch": 1326} {"train_loss": -5.907502174377441, "global_step": 55716, "epoch": 1326} {"train_loss": -5.853163719177246, "global_step": 55717, "epoch": 1326} {"train_loss": -5.903242111206055, "global_step": 55718, "epoch": 1326} {"train_loss": -5.799226760864258, "global_step": 55719, "epoch": 1326} {"train_loss": -5.82668924331665, "global_step": 55720, "epoch": 1326} {"train_loss": -5.916567325592041, "global_step": 55721, "epoch": 1326} {"train_loss": -5.860025405883789, "global_step": 55722, "epoch": 1326} {"train_loss": -5.867349624633789, "global_step": 55723, "epoch": 1326} {"train_loss": -5.669468402862549, "global_step": 55724, "epoch": 1326} {"train_loss": -5.790556907653809, "global_step": 55725, "epoch": 1326} {"train_loss": -5.751767158508301, "global_step": 55726, "epoch": 1326} {"train_loss": -5.727509498596191, "global_step": 55727, "epoch": 1326} {"train_loss": -5.872762680053711, "global_step": 55728, "epoch": 1326} {"train_loss": -5.7451863288879395, "global_step": 55729, "epoch": 1326} {"train_loss": -5.779468536376953, "global_step": 55730, "epoch": 1326} {"train_loss": -5.854171276092529, "global_step": 55731, "epoch": 1326} {"train_loss": -5.952815055847168, "global_step": 55732, "epoch": 1326} {"train_loss": -5.8501536164964945, "global_step": 55733, "epoch": 1326, "val_loss": 61545.88671875} {"train_loss": -5.865206241607666, "global_step": 55734, "epoch": 1327} {"train_loss": -5.77788782119751, "global_step": 55735, "epoch": 1327} {"train_loss": -5.883779048919678, "global_step": 55736, "epoch": 1327} {"train_loss": -5.846750736236572, "global_step": 55737, "epoch": 1327} {"train_loss": -5.951313018798828, "global_step": 55738, "epoch": 1327} {"train_loss": -5.900012493133545, "global_step": 55739, "epoch": 1327} {"train_loss": -5.855313777923584, "global_step": 55740, "epoch": 1327} {"train_loss": -5.706698894500732, "global_step": 55741, "epoch": 1327} {"train_loss": -5.92568826675415, "global_step": 55742, "epoch": 1327} {"train_loss": -5.860138893127441, "global_step": 55743, "epoch": 1327} {"train_loss": -5.861142158508301, "global_step": 55744, "epoch": 1327} {"train_loss": -5.837018013000488, "global_step": 55745, "epoch": 1327} {"train_loss": -5.938477516174316, "global_step": 55746, "epoch": 1327} {"train_loss": -5.9123334884643555, "global_step": 55747, "epoch": 1327} {"train_loss": -5.89192533493042, "global_step": 55748, "epoch": 1327} {"train_loss": -5.7567033767700195, "global_step": 55749, "epoch": 1327} {"train_loss": -5.87396240234375, "global_step": 55750, "epoch": 1327} {"train_loss": -5.81456184387207, "global_step": 55751, "epoch": 1327} {"train_loss": -5.873786926269531, "global_step": 55752, "epoch": 1327} {"train_loss": -5.757762908935547, "global_step": 55753, "epoch": 1327} {"train_loss": -5.886479377746582, "global_step": 55754, "epoch": 1327} {"train_loss": -5.829021453857422, "global_step": 55755, "epoch": 1327} {"train_loss": -5.884082317352295, "global_step": 55756, "epoch": 1327} {"train_loss": -5.736680030822754, "global_step": 55757, "epoch": 1327} {"train_loss": -5.825985908508301, "global_step": 55758, "epoch": 1327} {"train_loss": -5.754900932312012, "global_step": 55759, "epoch": 1327} {"train_loss": -5.796572685241699, "global_step": 55760, "epoch": 1327} {"train_loss": -5.832582950592041, "global_step": 55761, "epoch": 1327} {"train_loss": -5.826908111572266, "global_step": 55762, "epoch": 1327} {"train_loss": -5.888964653015137, "global_step": 55763, "epoch": 1327} {"train_loss": -5.800930500030518, "global_step": 55764, "epoch": 1327} {"train_loss": -5.936250686645508, "global_step": 55765, "epoch": 1327} {"train_loss": -5.870306968688965, "global_step": 55766, "epoch": 1327} {"train_loss": -5.894077777862549, "global_step": 55767, "epoch": 1327} {"train_loss": -5.922493934631348, "global_step": 55768, "epoch": 1327} {"train_loss": -5.823770523071289, "global_step": 55769, "epoch": 1327} {"train_loss": -5.866879463195801, "global_step": 55770, "epoch": 1327} {"train_loss": -5.7622528076171875, "global_step": 55771, "epoch": 1327} {"train_loss": -5.865659236907959, "global_step": 55772, "epoch": 1327} {"train_loss": -5.747455596923828, "global_step": 55773, "epoch": 1327} {"train_loss": -5.86353874206543, "global_step": 55774, "epoch": 1327} {"train_loss": -5.84554402033488, "global_step": 55775, "epoch": 1327, "val_loss": 61411.0} {"train_loss": -5.935547828674316, "global_step": 55776, "epoch": 1328} {"train_loss": -5.811822891235352, "global_step": 55777, "epoch": 1328} {"train_loss": -5.8753886222839355, "global_step": 55778, "epoch": 1328} {"train_loss": -5.860978126525879, "global_step": 55779, "epoch": 1328} {"train_loss": -5.998090744018555, "global_step": 55780, "epoch": 1328} {"train_loss": -5.98187780380249, "global_step": 55781, "epoch": 1328} {"train_loss": -5.791262149810791, "global_step": 55782, "epoch": 1328} {"train_loss": -5.777128219604492, "global_step": 55783, "epoch": 1328} {"train_loss": -5.947584629058838, "global_step": 55784, "epoch": 1328} {"train_loss": -5.845785140991211, "global_step": 55785, "epoch": 1328} {"train_loss": -5.787748336791992, "global_step": 55786, "epoch": 1328} {"train_loss": -5.842013835906982, "global_step": 55787, "epoch": 1328} {"train_loss": -5.785983085632324, "global_step": 55788, "epoch": 1328} {"train_loss": -5.805964469909668, "global_step": 55789, "epoch": 1328} {"train_loss": -5.918964385986328, "global_step": 55790, "epoch": 1328} {"train_loss": -5.828670024871826, "global_step": 55791, "epoch": 1328} {"train_loss": -5.968846797943115, "global_step": 55792, "epoch": 1328} {"train_loss": -5.742532730102539, "global_step": 55793, "epoch": 1328} {"train_loss": -5.869445323944092, "global_step": 55794, "epoch": 1328} {"train_loss": -5.900811195373535, "global_step": 55795, "epoch": 1328} {"train_loss": -5.892787933349609, "global_step": 55796, "epoch": 1328} {"train_loss": -5.880462646484375, "global_step": 55797, "epoch": 1328} {"train_loss": -5.882798194885254, "global_step": 55798, "epoch": 1328} {"train_loss": -5.939553737640381, "global_step": 55799, "epoch": 1328} {"train_loss": -5.809586524963379, "global_step": 55800, "epoch": 1328} {"train_loss": -5.845057964324951, "global_step": 55801, "epoch": 1328} {"train_loss": -5.673042297363281, "global_step": 55802, "epoch": 1328} {"train_loss": -5.834224700927734, "global_step": 55803, "epoch": 1328} {"train_loss": -5.767641067504883, "global_step": 55804, "epoch": 1328} {"train_loss": -5.951882839202881, "global_step": 55805, "epoch": 1328} {"train_loss": -5.702661514282227, "global_step": 55806, "epoch": 1328} {"train_loss": -5.662613391876221, "global_step": 55807, "epoch": 1328} {"train_loss": -5.844980239868164, "global_step": 55808, "epoch": 1328} {"train_loss": -5.909087657928467, "global_step": 55809, "epoch": 1328} {"train_loss": -5.898890018463135, "global_step": 55810, "epoch": 1328} {"train_loss": -5.820505142211914, "global_step": 55811, "epoch": 1328} {"train_loss": -5.836024284362793, "global_step": 55812, "epoch": 1328} {"train_loss": -5.8706207275390625, "global_step": 55813, "epoch": 1328} {"train_loss": -5.876072883605957, "global_step": 55814, "epoch": 1328} {"train_loss": -5.920683860778809, "global_step": 55815, "epoch": 1328} {"train_loss": -5.730621814727783, "global_step": 55816, "epoch": 1328} {"train_loss": -5.848913964771089, "global_step": 55817, "epoch": 1328, "val_loss": 61684.8671875} {"train_loss": -5.737373352050781, "global_step": 55818, "epoch": 1329} {"train_loss": -5.744265556335449, "global_step": 55819, "epoch": 1329} {"train_loss": -5.912600040435791, "global_step": 55820, "epoch": 1329} {"train_loss": -5.796913146972656, "global_step": 55821, "epoch": 1329} {"train_loss": -5.831201553344727, "global_step": 55822, "epoch": 1329} {"train_loss": -5.85467529296875, "global_step": 55823, "epoch": 1329} {"train_loss": -5.838852882385254, "global_step": 55824, "epoch": 1329} {"train_loss": -5.913309097290039, "global_step": 55825, "epoch": 1329} {"train_loss": -5.794977188110352, "global_step": 55826, "epoch": 1329} {"train_loss": -5.885562896728516, "global_step": 55827, "epoch": 1329} {"train_loss": -5.940189361572266, "global_step": 55828, "epoch": 1329} {"train_loss": -5.888611316680908, "global_step": 55829, "epoch": 1329} {"train_loss": -5.902310371398926, "global_step": 55830, "epoch": 1329} {"train_loss": -5.856117248535156, "global_step": 55831, "epoch": 1329} {"train_loss": -5.848348617553711, "global_step": 55832, "epoch": 1329} {"train_loss": -5.832381248474121, "global_step": 55833, "epoch": 1329} {"train_loss": -5.889163494110107, "global_step": 55834, "epoch": 1329} {"train_loss": -5.79376220703125, "global_step": 55835, "epoch": 1329} {"train_loss": -5.911095142364502, "global_step": 55836, "epoch": 1329} {"train_loss": -5.829087257385254, "global_step": 55837, "epoch": 1329} {"train_loss": -5.793848514556885, "global_step": 55838, "epoch": 1329} {"train_loss": -5.920443534851074, "global_step": 55839, "epoch": 1329} {"train_loss": -5.907167434692383, "global_step": 55840, "epoch": 1329} {"train_loss": -5.7636237144470215, "global_step": 55841, "epoch": 1329} {"train_loss": -5.809040546417236, "global_step": 55842, "epoch": 1329} {"train_loss": -5.996855735778809, "global_step": 55843, "epoch": 1329} {"train_loss": -5.790724277496338, "global_step": 55844, "epoch": 1329} {"train_loss": -5.8954758644104, "global_step": 55845, "epoch": 1329} {"train_loss": -5.91076135635376, "global_step": 55846, "epoch": 1329} {"train_loss": -5.811154365539551, "global_step": 55847, "epoch": 1329} {"train_loss": -5.8151421546936035, "global_step": 55848, "epoch": 1329} {"train_loss": -5.969366073608398, "global_step": 55849, "epoch": 1329} {"train_loss": -5.919486999511719, "global_step": 55850, "epoch": 1329} {"train_loss": -5.9716715812683105, "global_step": 55851, "epoch": 1329} {"train_loss": -5.87717342376709, "global_step": 55852, "epoch": 1329} {"train_loss": -5.872784614562988, "global_step": 55853, "epoch": 1329} {"train_loss": -5.890876770019531, "global_step": 55854, "epoch": 1329} {"train_loss": -5.86221170425415, "global_step": 55855, "epoch": 1329} {"train_loss": -5.945979118347168, "global_step": 55856, "epoch": 1329} {"train_loss": -5.7630791664123535, "global_step": 55857, "epoch": 1329} {"train_loss": -5.93241024017334, "global_step": 55858, "epoch": 1329} {"train_loss": -5.8649970690409345, "global_step": 55859, "epoch": 1329, "val_loss": 61337.80078125} {"train_loss": -5.847212791442871, "global_step": 55860, "epoch": 1330} {"train_loss": -5.8774189949035645, "global_step": 55861, "epoch": 1330} {"train_loss": -6.017611026763916, "global_step": 55862, "epoch": 1330} {"train_loss": -5.916861057281494, "global_step": 55863, "epoch": 1330} {"train_loss": -5.916196823120117, "global_step": 55864, "epoch": 1330} {"train_loss": -5.920846939086914, "global_step": 55865, "epoch": 1330} {"train_loss": -5.712881088256836, "global_step": 55866, "epoch": 1330} {"train_loss": -5.81156063079834, "global_step": 55867, "epoch": 1330} {"train_loss": -5.825317859649658, "global_step": 55868, "epoch": 1330} {"train_loss": -5.755217552185059, "global_step": 55869, "epoch": 1330} {"train_loss": -5.85906982421875, "global_step": 55870, "epoch": 1330} {"train_loss": -5.940432548522949, "global_step": 55871, "epoch": 1330} {"train_loss": -5.9276933670043945, "global_step": 55872, "epoch": 1330} {"train_loss": -5.8700408935546875, "global_step": 55873, "epoch": 1330} {"train_loss": -5.900998115539551, "global_step": 55874, "epoch": 1330} {"train_loss": -5.938443183898926, "global_step": 55875, "epoch": 1330} {"train_loss": -5.883642673492432, "global_step": 55876, "epoch": 1330} {"train_loss": -5.915494918823242, "global_step": 55877, "epoch": 1330} {"train_loss": -6.021451473236084, "global_step": 55878, "epoch": 1330} {"train_loss": -5.866208076477051, "global_step": 55879, "epoch": 1330} {"train_loss": -5.8770432472229, "global_step": 55880, "epoch": 1330} {"train_loss": -5.84214973449707, "global_step": 55881, "epoch": 1330} {"train_loss": -5.759742736816406, "global_step": 55882, "epoch": 1330} {"train_loss": -5.832581520080566, "global_step": 55883, "epoch": 1330} {"train_loss": -5.754603385925293, "global_step": 55884, "epoch": 1330} {"train_loss": -5.790797233581543, "global_step": 55885, "epoch": 1330} {"train_loss": -5.790859699249268, "global_step": 55886, "epoch": 1330} {"train_loss": -5.810039520263672, "global_step": 55887, "epoch": 1330} {"train_loss": -5.8935747146606445, "global_step": 55888, "epoch": 1330} {"train_loss": -5.955833435058594, "global_step": 55889, "epoch": 1330} {"train_loss": -5.797239303588867, "global_step": 55890, "epoch": 1330} {"train_loss": -5.835744857788086, "global_step": 55891, "epoch": 1330} {"train_loss": -5.7664337158203125, "global_step": 55892, "epoch": 1330} {"train_loss": -5.820992469787598, "global_step": 55893, "epoch": 1330} {"train_loss": -5.8036885261535645, "global_step": 55894, "epoch": 1330} {"train_loss": -5.830068111419678, "global_step": 55895, "epoch": 1330} {"train_loss": -5.651191711425781, "global_step": 55896, "epoch": 1330} {"train_loss": -5.859673976898193, "global_step": 55897, "epoch": 1330} {"train_loss": -5.850768089294434, "global_step": 55898, "epoch": 1330} {"train_loss": -5.904570579528809, "global_step": 55899, "epoch": 1330} {"train_loss": -5.932893753051758, "global_step": 55900, "epoch": 1330} {"train_loss": -5.858079036076863, "global_step": 55901, "epoch": 1330, "val_loss": 61612.1171875} {"train_loss": -5.855007171630859, "global_step": 55902, "epoch": 1331} {"train_loss": -5.843863487243652, "global_step": 55903, "epoch": 1331} {"train_loss": -5.863999366760254, "global_step": 55904, "epoch": 1331} {"train_loss": -5.840367794036865, "global_step": 55905, "epoch": 1331} {"train_loss": -5.8607177734375, "global_step": 55906, "epoch": 1331} {"train_loss": -5.978283882141113, "global_step": 55907, "epoch": 1331} {"train_loss": -5.859784126281738, "global_step": 55908, "epoch": 1331} {"train_loss": -5.817115783691406, "global_step": 55909, "epoch": 1331} {"train_loss": -5.864904880523682, "global_step": 55910, "epoch": 1331} {"train_loss": -5.767150402069092, "global_step": 55911, "epoch": 1331} {"train_loss": -5.795053005218506, "global_step": 55912, "epoch": 1331} {"train_loss": -5.809405326843262, "global_step": 55913, "epoch": 1331} {"train_loss": -5.931784629821777, "global_step": 55914, "epoch": 1331} {"train_loss": -5.852502822875977, "global_step": 55915, "epoch": 1331} {"train_loss": -5.949410438537598, "global_step": 55916, "epoch": 1331} {"train_loss": -5.733244895935059, "global_step": 55917, "epoch": 1331} {"train_loss": -5.847052574157715, "global_step": 55918, "epoch": 1331} {"train_loss": -5.780938625335693, "global_step": 55919, "epoch": 1331} {"train_loss": -5.7071967124938965, "global_step": 55920, "epoch": 1331} {"train_loss": -5.745068550109863, "global_step": 55921, "epoch": 1331} {"train_loss": -5.783645153045654, "global_step": 55922, "epoch": 1331} {"train_loss": -5.6573896408081055, "global_step": 55923, "epoch": 1331} {"train_loss": -5.837223052978516, "global_step": 55924, "epoch": 1331} {"train_loss": -5.878751277923584, "global_step": 55925, "epoch": 1331} {"train_loss": -5.868639945983887, "global_step": 55926, "epoch": 1331} {"train_loss": -5.822272777557373, "global_step": 55927, "epoch": 1331} {"train_loss": -5.797749042510986, "global_step": 55928, "epoch": 1331} {"train_loss": -5.905594825744629, "global_step": 55929, "epoch": 1331} {"train_loss": -5.718188285827637, "global_step": 55930, "epoch": 1331} {"train_loss": -5.682441234588623, "global_step": 55931, "epoch": 1331} {"train_loss": -5.876597881317139, "global_step": 55932, "epoch": 1331} {"train_loss": -5.808123588562012, "global_step": 55933, "epoch": 1331} {"train_loss": -5.7834320068359375, "global_step": 55934, "epoch": 1331} {"train_loss": -5.835620880126953, "global_step": 55935, "epoch": 1331} {"train_loss": -5.797741889953613, "global_step": 55936, "epoch": 1331} {"train_loss": -5.876575469970703, "global_step": 55937, "epoch": 1331} {"train_loss": -5.881462574005127, "global_step": 55938, "epoch": 1331} {"train_loss": -5.738034725189209, "global_step": 55939, "epoch": 1331} {"train_loss": -5.818503379821777, "global_step": 55940, "epoch": 1331} {"train_loss": -5.612005233764648, "global_step": 55941, "epoch": 1331} {"train_loss": -5.803244590759277, "global_step": 55942, "epoch": 1331} {"train_loss": -5.814757085981823, "global_step": 55943, "epoch": 1331, "val_loss": 61843.5546875} {"train_loss": -5.807038307189941, "global_step": 55944, "epoch": 1332} {"train_loss": -5.920285224914551, "global_step": 55945, "epoch": 1332} {"train_loss": -5.7376508712768555, "global_step": 55946, "epoch": 1332} {"train_loss": -5.821754455566406, "global_step": 55947, "epoch": 1332} {"train_loss": -5.8626837730407715, "global_step": 55948, "epoch": 1332} {"train_loss": -5.7504658699035645, "global_step": 55949, "epoch": 1332} {"train_loss": -5.825926780700684, "global_step": 55950, "epoch": 1332} {"train_loss": -5.78931999206543, "global_step": 55951, "epoch": 1332} {"train_loss": -5.947350025177002, "global_step": 55952, "epoch": 1332} {"train_loss": -5.764200210571289, "global_step": 55953, "epoch": 1332} {"train_loss": -5.852214336395264, "global_step": 55954, "epoch": 1332} {"train_loss": -5.976276397705078, "global_step": 55955, "epoch": 1332} {"train_loss": -5.85807466506958, "global_step": 55956, "epoch": 1332} {"train_loss": -5.804081916809082, "global_step": 55957, "epoch": 1332} {"train_loss": -5.933284759521484, "global_step": 55958, "epoch": 1332} {"train_loss": -5.857465744018555, "global_step": 55959, "epoch": 1332} {"train_loss": -5.758599758148193, "global_step": 55960, "epoch": 1332} {"train_loss": -5.862799167633057, "global_step": 55961, "epoch": 1332} {"train_loss": -5.864613056182861, "global_step": 55962, "epoch": 1332} {"train_loss": -5.735779285430908, "global_step": 55963, "epoch": 1332} {"train_loss": -5.864370346069336, "global_step": 55964, "epoch": 1332} {"train_loss": -5.761780738830566, "global_step": 55965, "epoch": 1332} {"train_loss": -5.80001974105835, "global_step": 55966, "epoch": 1332} {"train_loss": -5.8992438316345215, "global_step": 55967, "epoch": 1332} {"train_loss": -5.818096160888672, "global_step": 55968, "epoch": 1332} {"train_loss": -5.8313798904418945, "global_step": 55969, "epoch": 1332} {"train_loss": -5.915589332580566, "global_step": 55970, "epoch": 1332} {"train_loss": -5.6873321533203125, "global_step": 55971, "epoch": 1332} {"train_loss": -5.851582050323486, "global_step": 55972, "epoch": 1332} {"train_loss": -5.761115550994873, "global_step": 55973, "epoch": 1332} {"train_loss": -5.968650817871094, "global_step": 55974, "epoch": 1332} {"train_loss": -5.770559310913086, "global_step": 55975, "epoch": 1332} {"train_loss": -5.783498764038086, "global_step": 55976, "epoch": 1332} {"train_loss": -5.841209411621094, "global_step": 55977, "epoch": 1332} {"train_loss": -5.836268424987793, "global_step": 55978, "epoch": 1332} {"train_loss": -5.843542098999023, "global_step": 55979, "epoch": 1332} {"train_loss": -5.865382671356201, "global_step": 55980, "epoch": 1332} {"train_loss": -5.885614395141602, "global_step": 55981, "epoch": 1332} {"train_loss": -5.930622577667236, "global_step": 55982, "epoch": 1332} {"train_loss": -5.866980075836182, "global_step": 55983, "epoch": 1332} {"train_loss": -5.721515655517578, "global_step": 55984, "epoch": 1332} {"train_loss": -5.83395588965643, "global_step": 55985, "epoch": 1332, "val_loss": 61481.09765625} {"train_loss": -5.949171543121338, "global_step": 55986, "epoch": 1333} {"train_loss": -5.805046081542969, "global_step": 55987, "epoch": 1333} {"train_loss": -5.72501277923584, "global_step": 55988, "epoch": 1333} {"train_loss": -5.847657203674316, "global_step": 55989, "epoch": 1333} {"train_loss": -5.80049991607666, "global_step": 55990, "epoch": 1333} {"train_loss": -5.875735759735107, "global_step": 55991, "epoch": 1333} {"train_loss": -5.9718217849731445, "global_step": 55992, "epoch": 1333} {"train_loss": -5.950868606567383, "global_step": 55993, "epoch": 1333} {"train_loss": -5.826860427856445, "global_step": 55994, "epoch": 1333} {"train_loss": -5.856180667877197, "global_step": 55995, "epoch": 1333} {"train_loss": -5.984129905700684, "global_step": 55996, "epoch": 1333} {"train_loss": -5.784145355224609, "global_step": 55997, "epoch": 1333} {"train_loss": -5.929449081420898, "global_step": 55998, "epoch": 1333} {"train_loss": -5.794323921203613, "global_step": 55999, "epoch": 1333} {"train_loss": -5.86977481842041, "global_step": 56000, "epoch": 1333} {"train_loss": -5.7947282791137695, "global_step": 56001, "epoch": 1333} {"train_loss": -5.823755264282227, "global_step": 56002, "epoch": 1333} {"train_loss": -5.854659080505371, "global_step": 56003, "epoch": 1333} {"train_loss": -5.999177932739258, "global_step": 56004, "epoch": 1333} {"train_loss": -5.8231987953186035, "global_step": 56005, "epoch": 1333} {"train_loss": -6.02529764175415, "global_step": 56006, "epoch": 1333} {"train_loss": -5.8661956787109375, "global_step": 56007, "epoch": 1333} {"train_loss": -6.033766746520996, "global_step": 56008, "epoch": 1333} {"train_loss": -5.802160263061523, "global_step": 56009, "epoch": 1333} {"train_loss": -5.833351135253906, "global_step": 56010, "epoch": 1333} {"train_loss": -5.784215927124023, "global_step": 56011, "epoch": 1333} {"train_loss": -5.897721767425537, "global_step": 56012, "epoch": 1333} {"train_loss": -5.848909378051758, "global_step": 56013, "epoch": 1333} {"train_loss": -5.750537872314453, "global_step": 56014, "epoch": 1333} {"train_loss": -5.770381450653076, "global_step": 56015, "epoch": 1333} {"train_loss": -5.842555999755859, "global_step": 56016, "epoch": 1333} {"train_loss": -5.729466438293457, "global_step": 56017, "epoch": 1333} {"train_loss": -5.871712684631348, "global_step": 56018, "epoch": 1333} {"train_loss": -5.655304908752441, "global_step": 56019, "epoch": 1333} {"train_loss": -5.728161811828613, "global_step": 56020, "epoch": 1333} {"train_loss": -5.764044761657715, "global_step": 56021, "epoch": 1333} {"train_loss": -5.841966152191162, "global_step": 56022, "epoch": 1333} {"train_loss": -5.818337440490723, "global_step": 56023, "epoch": 1333} {"train_loss": -5.959719657897949, "global_step": 56024, "epoch": 1333} {"train_loss": -5.77054500579834, "global_step": 56025, "epoch": 1333} {"train_loss": -5.872010231018066, "global_step": 56026, "epoch": 1333} {"train_loss": -5.848010937372844, "global_step": 56027, "epoch": 1333, "val_loss": 61664.93359375} {"train_loss": -5.799376964569092, "global_step": 56028, "epoch": 1334} {"train_loss": -5.801302909851074, "global_step": 56029, "epoch": 1334} {"train_loss": -5.784051895141602, "global_step": 56030, "epoch": 1334} {"train_loss": -5.780372142791748, "global_step": 56031, "epoch": 1334} {"train_loss": -5.784884452819824, "global_step": 56032, "epoch": 1334} {"train_loss": -5.894588947296143, "global_step": 56033, "epoch": 1334} {"train_loss": -6.006072044372559, "global_step": 56034, "epoch": 1334} {"train_loss": -5.790317535400391, "global_step": 56035, "epoch": 1334} {"train_loss": -5.905705451965332, "global_step": 56036, "epoch": 1334} {"train_loss": -5.858661651611328, "global_step": 56037, "epoch": 1334} {"train_loss": -5.914681434631348, "global_step": 56038, "epoch": 1334} {"train_loss": -5.917421340942383, "global_step": 56039, "epoch": 1334} {"train_loss": -5.876471996307373, "global_step": 56040, "epoch": 1334} {"train_loss": -6.073575973510742, "global_step": 56041, "epoch": 1334} {"train_loss": -5.881848335266113, "global_step": 56042, "epoch": 1334} {"train_loss": -5.92968225479126, "global_step": 56043, "epoch": 1334} {"train_loss": -5.817656517028809, "global_step": 56044, "epoch": 1334} {"train_loss": -5.947799205780029, "global_step": 56045, "epoch": 1334} {"train_loss": -5.847702980041504, "global_step": 56046, "epoch": 1334} {"train_loss": -5.870748043060303, "global_step": 56047, "epoch": 1334} {"train_loss": -5.738778114318848, "global_step": 56048, "epoch": 1334} {"train_loss": -5.714044570922852, "global_step": 56049, "epoch": 1334} {"train_loss": -5.848458290100098, "global_step": 56050, "epoch": 1334} {"train_loss": -5.791663646697998, "global_step": 56051, "epoch": 1334} {"train_loss": -5.881677627563477, "global_step": 56052, "epoch": 1334} {"train_loss": -6.009177207946777, "global_step": 56053, "epoch": 1334} {"train_loss": -5.834072113037109, "global_step": 56054, "epoch": 1334} {"train_loss": -5.752066612243652, "global_step": 56055, "epoch": 1334} {"train_loss": -5.909656524658203, "global_step": 56056, "epoch": 1334} {"train_loss": -5.903984069824219, "global_step": 56057, "epoch": 1334} {"train_loss": -5.920768737792969, "global_step": 56058, "epoch": 1334} {"train_loss": -5.96237325668335, "global_step": 56059, "epoch": 1334} {"train_loss": -5.827410697937012, "global_step": 56060, "epoch": 1334} {"train_loss": -5.914566993713379, "global_step": 56061, "epoch": 1334} {"train_loss": -5.891548156738281, "global_step": 56062, "epoch": 1334} {"train_loss": -5.858607769012451, "global_step": 56063, "epoch": 1334} {"train_loss": -5.768190383911133, "global_step": 56064, "epoch": 1334} {"train_loss": -5.7866010665893555, "global_step": 56065, "epoch": 1334} {"train_loss": -5.815534591674805, "global_step": 56066, "epoch": 1334} {"train_loss": -5.7955121994018555, "global_step": 56067, "epoch": 1334} {"train_loss": -5.879266738891602, "global_step": 56068, "epoch": 1334} {"train_loss": -5.861357859202793, "global_step": 56069, "epoch": 1334, "val_loss": 61444.87109375} {"train_loss": -6.0118513107299805, "global_step": 56070, "epoch": 1335} {"train_loss": -5.796841621398926, "global_step": 56071, "epoch": 1335} {"train_loss": -5.775493621826172, "global_step": 56072, "epoch": 1335} {"train_loss": -5.847246170043945, "global_step": 56073, "epoch": 1335} {"train_loss": -6.042214393615723, "global_step": 56074, "epoch": 1335} {"train_loss": -5.886689186096191, "global_step": 56075, "epoch": 1335} {"train_loss": -5.968935966491699, "global_step": 56076, "epoch": 1335} {"train_loss": -5.867531776428223, "global_step": 56077, "epoch": 1335} {"train_loss": -5.807895183563232, "global_step": 56078, "epoch": 1335} {"train_loss": -5.874460220336914, "global_step": 56079, "epoch": 1335} {"train_loss": -5.853486061096191, "global_step": 56080, "epoch": 1335} {"train_loss": -6.071269512176514, "global_step": 56081, "epoch": 1335} {"train_loss": -5.938396453857422, "global_step": 56082, "epoch": 1335} {"train_loss": -5.820828437805176, "global_step": 56083, "epoch": 1335} {"train_loss": -5.907314300537109, "global_step": 56084, "epoch": 1335} {"train_loss": -5.871997833251953, "global_step": 56085, "epoch": 1335} {"train_loss": -5.746636390686035, "global_step": 56086, "epoch": 1335} {"train_loss": -5.839903831481934, "global_step": 56087, "epoch": 1335} {"train_loss": -5.923912048339844, "global_step": 56088, "epoch": 1335} {"train_loss": -5.901613235473633, "global_step": 56089, "epoch": 1335} {"train_loss": -5.764784336090088, "global_step": 56090, "epoch": 1335} {"train_loss": -5.742271423339844, "global_step": 56091, "epoch": 1335} {"train_loss": -5.846922397613525, "global_step": 56092, "epoch": 1335} {"train_loss": -5.86804723739624, "global_step": 56093, "epoch": 1335} {"train_loss": -5.96057653427124, "global_step": 56094, "epoch": 1335} {"train_loss": -5.960345268249512, "global_step": 56095, "epoch": 1335} {"train_loss": -5.709287166595459, "global_step": 56096, "epoch": 1335} {"train_loss": -5.860955715179443, "global_step": 56097, "epoch": 1335} {"train_loss": -5.82578182220459, "global_step": 56098, "epoch": 1335} {"train_loss": -5.707856178283691, "global_step": 56099, "epoch": 1335} {"train_loss": -5.972066879272461, "global_step": 56100, "epoch": 1335} {"train_loss": -5.917814254760742, "global_step": 56101, "epoch": 1335} {"train_loss": -5.701145172119141, "global_step": 56102, "epoch": 1335} {"train_loss": -5.802733421325684, "global_step": 56103, "epoch": 1335} {"train_loss": -5.661919593811035, "global_step": 56104, "epoch": 1335} {"train_loss": -5.842721939086914, "global_step": 56105, "epoch": 1335} {"train_loss": -5.649998664855957, "global_step": 56106, "epoch": 1335} {"train_loss": -5.922657012939453, "global_step": 56107, "epoch": 1335} {"train_loss": -5.792688369750977, "global_step": 56108, "epoch": 1335} {"train_loss": -5.881657123565674, "global_step": 56109, "epoch": 1335} {"train_loss": -5.702069282531738, "global_step": 56110, "epoch": 1335} {"train_loss": -5.847985358465285, "global_step": 56111, "epoch": 1335, "val_loss": 61886.3359375} {"train_loss": -5.794117450714111, "global_step": 56112, "epoch": 1336} {"train_loss": -5.767621040344238, "global_step": 56113, "epoch": 1336} {"train_loss": -5.841670989990234, "global_step": 56114, "epoch": 1336} {"train_loss": -5.773396968841553, "global_step": 56115, "epoch": 1336} {"train_loss": -5.842112064361572, "global_step": 56116, "epoch": 1336} {"train_loss": -5.820591926574707, "global_step": 56117, "epoch": 1336} {"train_loss": -5.803676605224609, "global_step": 56118, "epoch": 1336} {"train_loss": -5.9194746017456055, "global_step": 56119, "epoch": 1336} {"train_loss": -5.8459248542785645, "global_step": 56120, "epoch": 1336} {"train_loss": -5.8734917640686035, "global_step": 56121, "epoch": 1336} {"train_loss": -5.9091997146606445, "global_step": 56122, "epoch": 1336} {"train_loss": -5.7930450439453125, "global_step": 56123, "epoch": 1336} {"train_loss": -5.8326497077941895, "global_step": 56124, "epoch": 1336} {"train_loss": -5.879680633544922, "global_step": 56125, "epoch": 1336} {"train_loss": -5.809814453125, "global_step": 56126, "epoch": 1336} {"train_loss": -5.738570690155029, "global_step": 56127, "epoch": 1336} {"train_loss": -5.83967399597168, "global_step": 56128, "epoch": 1336} {"train_loss": -5.922688961029053, "global_step": 56129, "epoch": 1336} {"train_loss": -5.838395595550537, "global_step": 56130, "epoch": 1336} {"train_loss": -5.850960731506348, "global_step": 56131, "epoch": 1336} {"train_loss": -5.82664680480957, "global_step": 56132, "epoch": 1336} {"train_loss": -5.79936408996582, "global_step": 56133, "epoch": 1336} {"train_loss": -5.823647499084473, "global_step": 56134, "epoch": 1336} {"train_loss": -5.746282577514648, "global_step": 56135, "epoch": 1336} {"train_loss": -5.647858619689941, "global_step": 56136, "epoch": 1336} {"train_loss": -5.919294357299805, "global_step": 56137, "epoch": 1336} {"train_loss": -5.799830913543701, "global_step": 56138, "epoch": 1336} {"train_loss": -5.872135162353516, "global_step": 56139, "epoch": 1336} {"train_loss": -5.9798784255981445, "global_step": 56140, "epoch": 1336} {"train_loss": -5.925185203552246, "global_step": 56141, "epoch": 1336} {"train_loss": -5.765347003936768, "global_step": 56142, "epoch": 1336} {"train_loss": -5.930666923522949, "global_step": 56143, "epoch": 1336} {"train_loss": -5.809646129608154, "global_step": 56144, "epoch": 1336} {"train_loss": -5.998418807983398, "global_step": 56145, "epoch": 1336} {"train_loss": -5.878139495849609, "global_step": 56146, "epoch": 1336} {"train_loss": -5.917620658874512, "global_step": 56147, "epoch": 1336} {"train_loss": -5.861743450164795, "global_step": 56148, "epoch": 1336} {"train_loss": -5.886962890625, "global_step": 56149, "epoch": 1336} {"train_loss": -5.902877330780029, "global_step": 56150, "epoch": 1336} {"train_loss": -5.8906049728393555, "global_step": 56151, "epoch": 1336} {"train_loss": -5.960227012634277, "global_step": 56152, "epoch": 1336} {"train_loss": -5.852785848435902, "global_step": 56153, "epoch": 1336, "val_loss": 61535.8828125} {"train_loss": -5.789268493652344, "global_step": 56154, "epoch": 1337} {"train_loss": -5.805588722229004, "global_step": 56155, "epoch": 1337} {"train_loss": -5.859467029571533, "global_step": 56156, "epoch": 1337} {"train_loss": -5.853715896606445, "global_step": 56157, "epoch": 1337} {"train_loss": -5.85438346862793, "global_step": 56158, "epoch": 1337} {"train_loss": -5.786581039428711, "global_step": 56159, "epoch": 1337} {"train_loss": -5.867871284484863, "global_step": 56160, "epoch": 1337} {"train_loss": -5.83998966217041, "global_step": 56161, "epoch": 1337} {"train_loss": -5.887765884399414, "global_step": 56162, "epoch": 1337} {"train_loss": -5.891740798950195, "global_step": 56163, "epoch": 1337} {"train_loss": -5.97640323638916, "global_step": 56164, "epoch": 1337} {"train_loss": -5.928654193878174, "global_step": 56165, "epoch": 1337} {"train_loss": -5.842881202697754, "global_step": 56166, "epoch": 1337} {"train_loss": -5.777413845062256, "global_step": 56167, "epoch": 1337} {"train_loss": -5.798645973205566, "global_step": 56168, "epoch": 1337} {"train_loss": -5.904123306274414, "global_step": 56169, "epoch": 1337} {"train_loss": -5.853771686553955, "global_step": 56170, "epoch": 1337} {"train_loss": -5.804187774658203, "global_step": 56171, "epoch": 1337} {"train_loss": -5.854726314544678, "global_step": 56172, "epoch": 1337} {"train_loss": -5.872987747192383, "global_step": 56173, "epoch": 1337} {"train_loss": -5.848193645477295, "global_step": 56174, "epoch": 1337} {"train_loss": -5.947877883911133, "global_step": 56175, "epoch": 1337} {"train_loss": -6.012622833251953, "global_step": 56176, "epoch": 1337} {"train_loss": -5.818427562713623, "global_step": 56177, "epoch": 1337} {"train_loss": -5.904795169830322, "global_step": 56178, "epoch": 1337} {"train_loss": -5.875910758972168, "global_step": 56179, "epoch": 1337} {"train_loss": -5.817545413970947, "global_step": 56180, "epoch": 1337} {"train_loss": -5.894825458526611, "global_step": 56181, "epoch": 1337} {"train_loss": -5.835790157318115, "global_step": 56182, "epoch": 1337} {"train_loss": -5.771578788757324, "global_step": 56183, "epoch": 1337} {"train_loss": -5.885534763336182, "global_step": 56184, "epoch": 1337} {"train_loss": -5.872888565063477, "global_step": 56185, "epoch": 1337} {"train_loss": -5.863099098205566, "global_step": 56186, "epoch": 1337} {"train_loss": -6.037558555603027, "global_step": 56187, "epoch": 1337} {"train_loss": -5.950394153594971, "global_step": 56188, "epoch": 1337} {"train_loss": -5.820579528808594, "global_step": 56189, "epoch": 1337} {"train_loss": -5.929281711578369, "global_step": 56190, "epoch": 1337} {"train_loss": -5.984683036804199, "global_step": 56191, "epoch": 1337} {"train_loss": -5.882481575012207, "global_step": 56192, "epoch": 1337} {"train_loss": -5.828616619110107, "global_step": 56193, "epoch": 1337} {"train_loss": -5.914715766906738, "global_step": 56194, "epoch": 1337} {"train_loss": -5.873650369190035, "global_step": 56195, "epoch": 1337, "val_loss": 61233.203125} {"train_loss": -5.843914031982422, "global_step": 56196, "epoch": 1338} {"train_loss": -5.844511985778809, "global_step": 56197, "epoch": 1338} {"train_loss": -5.8293023109436035, "global_step": 56198, "epoch": 1338} {"train_loss": -5.920640468597412, "global_step": 56199, "epoch": 1338} {"train_loss": -5.97119140625, "global_step": 56200, "epoch": 1338} {"train_loss": -5.858803749084473, "global_step": 56201, "epoch": 1338} {"train_loss": -5.83853006362915, "global_step": 56202, "epoch": 1338} {"train_loss": -5.984376907348633, "global_step": 56203, "epoch": 1338} {"train_loss": -5.955267429351807, "global_step": 56204, "epoch": 1338} {"train_loss": -5.909191131591797, "global_step": 56205, "epoch": 1338} {"train_loss": -5.953888893127441, "global_step": 56206, "epoch": 1338} {"train_loss": -5.933873653411865, "global_step": 56207, "epoch": 1338} {"train_loss": -5.838576316833496, "global_step": 56208, "epoch": 1338} {"train_loss": -5.925055503845215, "global_step": 56209, "epoch": 1338} {"train_loss": -5.913726329803467, "global_step": 56210, "epoch": 1338} {"train_loss": -5.825353622436523, "global_step": 56211, "epoch": 1338} {"train_loss": -5.920170783996582, "global_step": 56212, "epoch": 1338} {"train_loss": -5.885114669799805, "global_step": 56213, "epoch": 1338} {"train_loss": -5.956304550170898, "global_step": 56214, "epoch": 1338} {"train_loss": -5.8425140380859375, "global_step": 56215, "epoch": 1338} {"train_loss": -5.856212139129639, "global_step": 56216, "epoch": 1338} {"train_loss": -5.883900165557861, "global_step": 56217, "epoch": 1338} {"train_loss": -6.001495361328125, "global_step": 56218, "epoch": 1338} {"train_loss": -5.89585018157959, "global_step": 56219, "epoch": 1338} {"train_loss": -5.907073974609375, "global_step": 56220, "epoch": 1338} {"train_loss": -5.8835248947143555, "global_step": 56221, "epoch": 1338} {"train_loss": -5.886836051940918, "global_step": 56222, "epoch": 1338} {"train_loss": -5.917961597442627, "global_step": 56223, "epoch": 1338} {"train_loss": -5.731866836547852, "global_step": 56224, "epoch": 1338} {"train_loss": -5.73092794418335, "global_step": 56225, "epoch": 1338} {"train_loss": -5.961113929748535, "global_step": 56226, "epoch": 1338} {"train_loss": -5.772744655609131, "global_step": 56227, "epoch": 1338} {"train_loss": -5.9193854331970215, "global_step": 56228, "epoch": 1338} {"train_loss": -5.7276716232299805, "global_step": 56229, "epoch": 1338} {"train_loss": -5.777604103088379, "global_step": 56230, "epoch": 1338} {"train_loss": -5.840701580047607, "global_step": 56231, "epoch": 1338} {"train_loss": -5.713564395904541, "global_step": 56232, "epoch": 1338} {"train_loss": -5.885201930999756, "global_step": 56233, "epoch": 1338} {"train_loss": -5.749287128448486, "global_step": 56234, "epoch": 1338} {"train_loss": -5.934953689575195, "global_step": 56235, "epoch": 1338} {"train_loss": -5.833836555480957, "global_step": 56236, "epoch": 1338} {"train_loss": -5.869304475330171, "global_step": 56237, "epoch": 1338, "val_loss": 61345.2734375} {"train_loss": -5.730266571044922, "global_step": 56238, "epoch": 1339} {"train_loss": -5.785147666931152, "global_step": 56239, "epoch": 1339} {"train_loss": -5.832276344299316, "global_step": 56240, "epoch": 1339} {"train_loss": -5.838468551635742, "global_step": 56241, "epoch": 1339} {"train_loss": -5.874950408935547, "global_step": 56242, "epoch": 1339} {"train_loss": -5.850907325744629, "global_step": 56243, "epoch": 1339} {"train_loss": -5.842680931091309, "global_step": 56244, "epoch": 1339} {"train_loss": -5.902976989746094, "global_step": 56245, "epoch": 1339} {"train_loss": -5.802620887756348, "global_step": 56246, "epoch": 1339} {"train_loss": -5.844590663909912, "global_step": 56247, "epoch": 1339} {"train_loss": -5.882169723510742, "global_step": 56248, "epoch": 1339} {"train_loss": -5.760748863220215, "global_step": 56249, "epoch": 1339} {"train_loss": -5.8803839683532715, "global_step": 56250, "epoch": 1339} {"train_loss": -5.788710117340088, "global_step": 56251, "epoch": 1339} {"train_loss": -5.898129463195801, "global_step": 56252, "epoch": 1339} {"train_loss": -5.835986137390137, "global_step": 56253, "epoch": 1339} {"train_loss": -5.680586814880371, "global_step": 56254, "epoch": 1339} {"train_loss": -5.874602317810059, "global_step": 56255, "epoch": 1339} {"train_loss": -5.779789447784424, "global_step": 56256, "epoch": 1339} {"train_loss": -5.832251071929932, "global_step": 56257, "epoch": 1339} {"train_loss": -5.838167667388916, "global_step": 56258, "epoch": 1339} {"train_loss": -5.832282543182373, "global_step": 56259, "epoch": 1339} {"train_loss": -5.736523151397705, "global_step": 56260, "epoch": 1339} {"train_loss": -5.93865966796875, "global_step": 56261, "epoch": 1339} {"train_loss": -5.831844329833984, "global_step": 56262, "epoch": 1339} {"train_loss": -5.899140357971191, "global_step": 56263, "epoch": 1339} {"train_loss": -5.997951507568359, "global_step": 56264, "epoch": 1339} {"train_loss": -5.824553489685059, "global_step": 56265, "epoch": 1339} {"train_loss": -5.830486297607422, "global_step": 56266, "epoch": 1339} {"train_loss": -5.967526912689209, "global_step": 56267, "epoch": 1339} {"train_loss": -5.821629524230957, "global_step": 56268, "epoch": 1339} {"train_loss": -5.787176132202148, "global_step": 56269, "epoch": 1339} {"train_loss": -5.742406845092773, "global_step": 56270, "epoch": 1339} {"train_loss": -5.918038368225098, "global_step": 56271, "epoch": 1339} {"train_loss": -5.756937026977539, "global_step": 56272, "epoch": 1339} {"train_loss": -6.0008392333984375, "global_step": 56273, "epoch": 1339} {"train_loss": -5.721527099609375, "global_step": 56274, "epoch": 1339} {"train_loss": -5.8132405281066895, "global_step": 56275, "epoch": 1339} {"train_loss": -5.906894683837891, "global_step": 56276, "epoch": 1339} {"train_loss": -5.898128509521484, "global_step": 56277, "epoch": 1339} {"train_loss": -5.856545925140381, "global_step": 56278, "epoch": 1339} {"train_loss": -5.840700070063273, "global_step": 56279, "epoch": 1339, "val_loss": 61532.39453125} {"train_loss": -5.888617515563965, "global_step": 56280, "epoch": 1340} {"train_loss": -5.829641819000244, "global_step": 56281, "epoch": 1340} {"train_loss": -5.846261978149414, "global_step": 56282, "epoch": 1340} {"train_loss": -5.793976306915283, "global_step": 56283, "epoch": 1340} {"train_loss": -5.74031925201416, "global_step": 56284, "epoch": 1340} {"train_loss": -5.952637672424316, "global_step": 56285, "epoch": 1340} {"train_loss": -5.766246318817139, "global_step": 56286, "epoch": 1340} {"train_loss": -5.896745204925537, "global_step": 56287, "epoch": 1340} {"train_loss": -5.9141845703125, "global_step": 56288, "epoch": 1340} {"train_loss": -5.796862602233887, "global_step": 56289, "epoch": 1340} {"train_loss": -5.784709930419922, "global_step": 56290, "epoch": 1340} {"train_loss": -5.743320465087891, "global_step": 56291, "epoch": 1340} {"train_loss": -5.876740455627441, "global_step": 56292, "epoch": 1340} {"train_loss": -6.044904708862305, "global_step": 56293, "epoch": 1340} {"train_loss": -5.811107635498047, "global_step": 56294, "epoch": 1340} {"train_loss": -5.952779769897461, "global_step": 56295, "epoch": 1340} {"train_loss": -5.963338375091553, "global_step": 56296, "epoch": 1340} {"train_loss": -5.786715507507324, "global_step": 56297, "epoch": 1340} {"train_loss": -5.988179683685303, "global_step": 56298, "epoch": 1340} {"train_loss": -5.840869903564453, "global_step": 56299, "epoch": 1340} {"train_loss": -5.943708419799805, "global_step": 56300, "epoch": 1340} {"train_loss": -5.852504730224609, "global_step": 56301, "epoch": 1340} {"train_loss": -5.943781852722168, "global_step": 56302, "epoch": 1340} {"train_loss": -5.872279167175293, "global_step": 56303, "epoch": 1340} {"train_loss": -5.781951904296875, "global_step": 56304, "epoch": 1340} {"train_loss": -5.899298667907715, "global_step": 56305, "epoch": 1340} {"train_loss": -5.868027687072754, "global_step": 56306, "epoch": 1340} {"train_loss": -5.82619571685791, "global_step": 56307, "epoch": 1340} {"train_loss": -5.8444976806640625, "global_step": 56308, "epoch": 1340} {"train_loss": -5.861632347106934, "global_step": 56309, "epoch": 1340} {"train_loss": -5.9280829429626465, "global_step": 56310, "epoch": 1340} {"train_loss": -5.821742057800293, "global_step": 56311, "epoch": 1340} {"train_loss": -5.898058891296387, "global_step": 56312, "epoch": 1340} {"train_loss": -5.882447242736816, "global_step": 56313, "epoch": 1340} {"train_loss": -5.875722885131836, "global_step": 56314, "epoch": 1340} {"train_loss": -5.825862884521484, "global_step": 56315, "epoch": 1340} {"train_loss": -5.802386283874512, "global_step": 56316, "epoch": 1340} {"train_loss": -5.81114387512207, "global_step": 56317, "epoch": 1340} {"train_loss": -5.808114051818848, "global_step": 56318, "epoch": 1340} {"train_loss": -5.90493631362915, "global_step": 56319, "epoch": 1340} {"train_loss": -5.844441890716553, "global_step": 56320, "epoch": 1340} {"train_loss": -5.863226334253947, "global_step": 56321, "epoch": 1340, "val_loss": 61175.61328125} {"train_loss": -5.748699188232422, "global_step": 56322, "epoch": 1341} {"train_loss": -5.884115695953369, "global_step": 56323, "epoch": 1341} {"train_loss": -5.878414154052734, "global_step": 56324, "epoch": 1341} {"train_loss": -5.871790885925293, "global_step": 56325, "epoch": 1341} {"train_loss": -6.025636672973633, "global_step": 56326, "epoch": 1341} {"train_loss": -5.87712287902832, "global_step": 56327, "epoch": 1341} {"train_loss": -5.80924129486084, "global_step": 56328, "epoch": 1341} {"train_loss": -5.867866039276123, "global_step": 56329, "epoch": 1341} {"train_loss": -5.783935546875, "global_step": 56330, "epoch": 1341} {"train_loss": -5.7930097579956055, "global_step": 56331, "epoch": 1341} {"train_loss": -5.878339767456055, "global_step": 56332, "epoch": 1341} {"train_loss": -5.840127944946289, "global_step": 56333, "epoch": 1341} {"train_loss": -5.829889297485352, "global_step": 56334, "epoch": 1341} {"train_loss": -5.9120683670043945, "global_step": 56335, "epoch": 1341} {"train_loss": -5.907003879547119, "global_step": 56336, "epoch": 1341} {"train_loss": -5.866534233093262, "global_step": 56337, "epoch": 1341} {"train_loss": -5.830747127532959, "global_step": 56338, "epoch": 1341} {"train_loss": -5.724506378173828, "global_step": 56339, "epoch": 1341} {"train_loss": -5.9066996574401855, "global_step": 56340, "epoch": 1341} {"train_loss": -5.846578598022461, "global_step": 56341, "epoch": 1341} {"train_loss": -5.875799179077148, "global_step": 56342, "epoch": 1341} {"train_loss": -5.915380477905273, "global_step": 56343, "epoch": 1341} {"train_loss": -5.812626838684082, "global_step": 56344, "epoch": 1341} {"train_loss": -5.810040473937988, "global_step": 56345, "epoch": 1341} {"train_loss": -5.960905075073242, "global_step": 56346, "epoch": 1341} {"train_loss": -5.818285942077637, "global_step": 56347, "epoch": 1341} {"train_loss": -5.972806930541992, "global_step": 56348, "epoch": 1341} {"train_loss": -5.873405456542969, "global_step": 56349, "epoch": 1341} {"train_loss": -5.9748148918151855, "global_step": 56350, "epoch": 1341} {"train_loss": -5.786894798278809, "global_step": 56351, "epoch": 1341} {"train_loss": -5.766048431396484, "global_step": 56352, "epoch": 1341} {"train_loss": -5.854702949523926, "global_step": 56353, "epoch": 1341} {"train_loss": -5.748414039611816, "global_step": 56354, "epoch": 1341} {"train_loss": -5.827225685119629, "global_step": 56355, "epoch": 1341} {"train_loss": -5.862138748168945, "global_step": 56356, "epoch": 1341} {"train_loss": -5.8402814865112305, "global_step": 56357, "epoch": 1341} {"train_loss": -5.811738967895508, "global_step": 56358, "epoch": 1341} {"train_loss": -5.728869438171387, "global_step": 56359, "epoch": 1341} {"train_loss": -5.7896728515625, "global_step": 56360, "epoch": 1341} {"train_loss": -5.740584850311279, "global_step": 56361, "epoch": 1341} {"train_loss": -5.8537726402282715, "global_step": 56362, "epoch": 1341} {"train_loss": -5.848306633177257, "global_step": 56363, "epoch": 1341, "val_loss": 61502.51953125} {"train_loss": -5.840627670288086, "global_step": 56364, "epoch": 1342} {"train_loss": -5.840639114379883, "global_step": 56365, "epoch": 1342} {"train_loss": -5.8071699142456055, "global_step": 56366, "epoch": 1342} {"train_loss": -5.955965042114258, "global_step": 56367, "epoch": 1342} {"train_loss": -6.019962310791016, "global_step": 56368, "epoch": 1342} {"train_loss": -5.86651086807251, "global_step": 56369, "epoch": 1342} {"train_loss": -5.91978645324707, "global_step": 56370, "epoch": 1342} {"train_loss": -5.89350700378418, "global_step": 56371, "epoch": 1342} {"train_loss": -5.898709297180176, "global_step": 56372, "epoch": 1342} {"train_loss": -5.791391372680664, "global_step": 56373, "epoch": 1342} {"train_loss": -5.782410621643066, "global_step": 56374, "epoch": 1342} {"train_loss": -5.892886161804199, "global_step": 56375, "epoch": 1342} {"train_loss": -5.922846794128418, "global_step": 56376, "epoch": 1342} {"train_loss": -5.8438334465026855, "global_step": 56377, "epoch": 1342} {"train_loss": -5.798646926879883, "global_step": 56378, "epoch": 1342} {"train_loss": -5.762335777282715, "global_step": 56379, "epoch": 1342} {"train_loss": -5.790049076080322, "global_step": 56380, "epoch": 1342} {"train_loss": -5.877051830291748, "global_step": 56381, "epoch": 1342} {"train_loss": -5.917043685913086, "global_step": 56382, "epoch": 1342} {"train_loss": -5.765625476837158, "global_step": 56383, "epoch": 1342} {"train_loss": -5.963422775268555, "global_step": 56384, "epoch": 1342} {"train_loss": -5.763871192932129, "global_step": 56385, "epoch": 1342} {"train_loss": -5.86004114151001, "global_step": 56386, "epoch": 1342} {"train_loss": -5.826610565185547, "global_step": 56387, "epoch": 1342} {"train_loss": -5.939154148101807, "global_step": 56388, "epoch": 1342} {"train_loss": -5.872187614440918, "global_step": 56389, "epoch": 1342} {"train_loss": -5.887275218963623, "global_step": 56390, "epoch": 1342} {"train_loss": -5.8524322509765625, "global_step": 56391, "epoch": 1342} {"train_loss": -5.848968029022217, "global_step": 56392, "epoch": 1342} {"train_loss": -5.887576103210449, "global_step": 56393, "epoch": 1342} {"train_loss": -5.852371692657471, "global_step": 56394, "epoch": 1342} {"train_loss": -5.921597480773926, "global_step": 56395, "epoch": 1342} {"train_loss": -5.840473175048828, "global_step": 56396, "epoch": 1342} {"train_loss": -5.998856544494629, "global_step": 56397, "epoch": 1342} {"train_loss": -5.96317195892334, "global_step": 56398, "epoch": 1342} {"train_loss": -5.864136695861816, "global_step": 56399, "epoch": 1342} {"train_loss": -5.886359214782715, "global_step": 56400, "epoch": 1342} {"train_loss": -5.900516986846924, "global_step": 56401, "epoch": 1342} {"train_loss": -5.754352569580078, "global_step": 56402, "epoch": 1342} {"train_loss": -5.933363437652588, "global_step": 56403, "epoch": 1342} {"train_loss": -5.906249523162842, "global_step": 56404, "epoch": 1342} {"train_loss": -5.869742904390607, "global_step": 56405, "epoch": 1342, "val_loss": 61259.9140625} {"train_loss": -5.772268295288086, "global_step": 56406, "epoch": 1343} {"train_loss": -5.771038055419922, "global_step": 56407, "epoch": 1343} {"train_loss": -5.8405303955078125, "global_step": 56408, "epoch": 1343} {"train_loss": -5.681116104125977, "global_step": 56409, "epoch": 1343} {"train_loss": -5.8791069984436035, "global_step": 56410, "epoch": 1343} {"train_loss": -5.827914237976074, "global_step": 56411, "epoch": 1343} {"train_loss": -5.635958194732666, "global_step": 56412, "epoch": 1343} {"train_loss": -5.800397872924805, "global_step": 56413, "epoch": 1343} {"train_loss": -5.69563102722168, "global_step": 56414, "epoch": 1343} {"train_loss": -5.712491989135742, "global_step": 56415, "epoch": 1343} {"train_loss": -5.780277252197266, "global_step": 56416, "epoch": 1343} {"train_loss": -5.545496940612793, "global_step": 56417, "epoch": 1343} {"train_loss": -5.825773239135742, "global_step": 56418, "epoch": 1343} {"train_loss": -5.623232364654541, "global_step": 56419, "epoch": 1343} {"train_loss": -5.992528915405273, "global_step": 56420, "epoch": 1343} {"train_loss": -5.666092872619629, "global_step": 56421, "epoch": 1343} {"train_loss": -5.814090728759766, "global_step": 56422, "epoch": 1343} {"train_loss": -5.648614883422852, "global_step": 56423, "epoch": 1343} {"train_loss": -5.874024391174316, "global_step": 56424, "epoch": 1343} {"train_loss": -5.662353515625, "global_step": 56425, "epoch": 1343} {"train_loss": -5.808749198913574, "global_step": 56426, "epoch": 1343} {"train_loss": -5.736565113067627, "global_step": 56427, "epoch": 1343} {"train_loss": -5.918270111083984, "global_step": 56428, "epoch": 1343} {"train_loss": -5.845047950744629, "global_step": 56429, "epoch": 1343} {"train_loss": -5.825665473937988, "global_step": 56430, "epoch": 1343} {"train_loss": -5.819806098937988, "global_step": 56431, "epoch": 1343} {"train_loss": -5.894979476928711, "global_step": 56432, "epoch": 1343} {"train_loss": -5.800495624542236, "global_step": 56433, "epoch": 1343} {"train_loss": -5.79129695892334, "global_step": 56434, "epoch": 1343} {"train_loss": -5.851014137268066, "global_step": 56435, "epoch": 1343} {"train_loss": -5.859185218811035, "global_step": 56436, "epoch": 1343} {"train_loss": -5.7739763259887695, "global_step": 56437, "epoch": 1343} {"train_loss": -5.830158233642578, "global_step": 56438, "epoch": 1343} {"train_loss": -5.819204330444336, "global_step": 56439, "epoch": 1343} {"train_loss": -5.860258102416992, "global_step": 56440, "epoch": 1343} {"train_loss": -5.907046318054199, "global_step": 56441, "epoch": 1343} {"train_loss": -5.823390960693359, "global_step": 56442, "epoch": 1343} {"train_loss": -5.843654632568359, "global_step": 56443, "epoch": 1343} {"train_loss": -5.742040634155273, "global_step": 56444, "epoch": 1343} {"train_loss": -5.706507205963135, "global_step": 56445, "epoch": 1343} {"train_loss": -5.78879451751709, "global_step": 56446, "epoch": 1343} {"train_loss": -5.784147228513445, "global_step": 56447, "epoch": 1343, "val_loss": 61708.453125} {"train_loss": -5.735839366912842, "global_step": 56448, "epoch": 1344} {"train_loss": -5.706903457641602, "global_step": 56449, "epoch": 1344} {"train_loss": -5.7366743087768555, "global_step": 56450, "epoch": 1344} {"train_loss": -5.802084922790527, "global_step": 56451, "epoch": 1344} {"train_loss": -5.815786361694336, "global_step": 56452, "epoch": 1344} {"train_loss": -5.778135299682617, "global_step": 56453, "epoch": 1344} {"train_loss": -5.877011299133301, "global_step": 56454, "epoch": 1344} {"train_loss": -5.745200157165527, "global_step": 56455, "epoch": 1344} {"train_loss": -5.812682151794434, "global_step": 56456, "epoch": 1344} {"train_loss": -5.685061454772949, "global_step": 56457, "epoch": 1344} {"train_loss": -5.884400367736816, "global_step": 56458, "epoch": 1344} {"train_loss": -5.753541469573975, "global_step": 56459, "epoch": 1344} {"train_loss": -5.883199214935303, "global_step": 56460, "epoch": 1344} {"train_loss": -5.8954596519470215, "global_step": 56461, "epoch": 1344} {"train_loss": -5.908039093017578, "global_step": 56462, "epoch": 1344} {"train_loss": -5.828202247619629, "global_step": 56463, "epoch": 1344} {"train_loss": -5.901294708251953, "global_step": 56464, "epoch": 1344} {"train_loss": -5.825397491455078, "global_step": 56465, "epoch": 1344} {"train_loss": -5.803929805755615, "global_step": 56466, "epoch": 1344} {"train_loss": -5.800561428070068, "global_step": 56467, "epoch": 1344} {"train_loss": -5.863979816436768, "global_step": 56468, "epoch": 1344} {"train_loss": -5.817019939422607, "global_step": 56469, "epoch": 1344} {"train_loss": -5.8442864418029785, "global_step": 56470, "epoch": 1344} {"train_loss": -5.860969543457031, "global_step": 56471, "epoch": 1344} {"train_loss": -5.793269157409668, "global_step": 56472, "epoch": 1344} {"train_loss": -5.856800079345703, "global_step": 56473, "epoch": 1344} {"train_loss": -5.964047431945801, "global_step": 56474, "epoch": 1344} {"train_loss": -5.725778102874756, "global_step": 56475, "epoch": 1344} {"train_loss": -5.847756862640381, "global_step": 56476, "epoch": 1344} {"train_loss": -5.875954627990723, "global_step": 56477, "epoch": 1344} {"train_loss": -5.85344123840332, "global_step": 56478, "epoch": 1344} {"train_loss": -5.903072357177734, "global_step": 56479, "epoch": 1344} {"train_loss": -5.842754364013672, "global_step": 56480, "epoch": 1344} {"train_loss": -5.85577917098999, "global_step": 56481, "epoch": 1344} {"train_loss": -5.823941230773926, "global_step": 56482, "epoch": 1344} {"train_loss": -5.7935285568237305, "global_step": 56483, "epoch": 1344} {"train_loss": -5.974867820739746, "global_step": 56484, "epoch": 1344} {"train_loss": -6.026537895202637, "global_step": 56485, "epoch": 1344} {"train_loss": -5.963238716125488, "global_step": 56486, "epoch": 1344} {"train_loss": -5.729419708251953, "global_step": 56487, "epoch": 1344} {"train_loss": -5.941239356994629, "global_step": 56488, "epoch": 1344} {"train_loss": -5.836750530061268, "global_step": 56489, "epoch": 1344, "val_loss": 61486.453125} {"train_loss": -5.8223876953125, "global_step": 56490, "epoch": 1345} {"train_loss": -5.850394248962402, "global_step": 56491, "epoch": 1345} {"train_loss": -5.847537994384766, "global_step": 56492, "epoch": 1345} {"train_loss": -5.856907844543457, "global_step": 56493, "epoch": 1345} {"train_loss": -5.808453559875488, "global_step": 56494, "epoch": 1345} {"train_loss": -5.8383283615112305, "global_step": 56495, "epoch": 1345} {"train_loss": -5.843267917633057, "global_step": 56496, "epoch": 1345} {"train_loss": -5.771323204040527, "global_step": 56497, "epoch": 1345} {"train_loss": -5.685929298400879, "global_step": 56498, "epoch": 1345} {"train_loss": -5.846147537231445, "global_step": 56499, "epoch": 1345} {"train_loss": -5.753477096557617, "global_step": 56500, "epoch": 1345} {"train_loss": -5.789420127868652, "global_step": 56501, "epoch": 1345} {"train_loss": -5.721824645996094, "global_step": 56502, "epoch": 1345} {"train_loss": -5.934874057769775, "global_step": 56503, "epoch": 1345} {"train_loss": -5.878571510314941, "global_step": 56504, "epoch": 1345} {"train_loss": -5.916769981384277, "global_step": 56505, "epoch": 1345} {"train_loss": -5.850027084350586, "global_step": 56506, "epoch": 1345} {"train_loss": -5.816658973693848, "global_step": 56507, "epoch": 1345} {"train_loss": -5.725005149841309, "global_step": 56508, "epoch": 1345} {"train_loss": -5.876728057861328, "global_step": 56509, "epoch": 1345} {"train_loss": -5.956881523132324, "global_step": 56510, "epoch": 1345} {"train_loss": -5.852400779724121, "global_step": 56511, "epoch": 1345} {"train_loss": -5.887180328369141, "global_step": 56512, "epoch": 1345} {"train_loss": -5.905642509460449, "global_step": 56513, "epoch": 1345} {"train_loss": -5.8761677742004395, "global_step": 56514, "epoch": 1345} {"train_loss": -5.795553684234619, "global_step": 56515, "epoch": 1345} {"train_loss": -5.843719482421875, "global_step": 56516, "epoch": 1345} {"train_loss": -5.920351982116699, "global_step": 56517, "epoch": 1345} {"train_loss": -5.812560558319092, "global_step": 56518, "epoch": 1345} {"train_loss": -5.875280380249023, "global_step": 56519, "epoch": 1345} {"train_loss": -5.936331748962402, "global_step": 56520, "epoch": 1345} {"train_loss": -5.914236068725586, "global_step": 56521, "epoch": 1345} {"train_loss": -5.8240742683410645, "global_step": 56522, "epoch": 1345} {"train_loss": -5.829816818237305, "global_step": 56523, "epoch": 1345} {"train_loss": -5.925813674926758, "global_step": 56524, "epoch": 1345} {"train_loss": -5.8021697998046875, "global_step": 56525, "epoch": 1345} {"train_loss": -5.7859673500061035, "global_step": 56526, "epoch": 1345} {"train_loss": -5.856358528137207, "global_step": 56527, "epoch": 1345} {"train_loss": -5.890137195587158, "global_step": 56528, "epoch": 1345} {"train_loss": -5.887655735015869, "global_step": 56529, "epoch": 1345} {"train_loss": -5.865691184997559, "global_step": 56530, "epoch": 1345} {"train_loss": -5.846821398962112, "global_step": 56531, "epoch": 1345, "val_loss": 61769.63671875} {"train_loss": -5.943404197692871, "global_step": 56532, "epoch": 1346} {"train_loss": -5.8230438232421875, "global_step": 56533, "epoch": 1346} {"train_loss": -5.825672626495361, "global_step": 56534, "epoch": 1346} {"train_loss": -5.862626075744629, "global_step": 56535, "epoch": 1346} {"train_loss": -5.916925430297852, "global_step": 56536, "epoch": 1346} {"train_loss": -5.928642749786377, "global_step": 56537, "epoch": 1346} {"train_loss": -5.844965934753418, "global_step": 56538, "epoch": 1346} {"train_loss": -5.889222145080566, "global_step": 56539, "epoch": 1346} {"train_loss": -5.794000625610352, "global_step": 56540, "epoch": 1346} {"train_loss": -5.85532283782959, "global_step": 56541, "epoch": 1346} {"train_loss": -5.858154296875, "global_step": 56542, "epoch": 1346} {"train_loss": -5.954068183898926, "global_step": 56543, "epoch": 1346} {"train_loss": -5.947341442108154, "global_step": 56544, "epoch": 1346} {"train_loss": -5.915104866027832, "global_step": 56545, "epoch": 1346} {"train_loss": -5.936464309692383, "global_step": 56546, "epoch": 1346} {"train_loss": -5.973007678985596, "global_step": 56547, "epoch": 1346} {"train_loss": -5.914858818054199, "global_step": 56548, "epoch": 1346} {"train_loss": -5.897324562072754, "global_step": 56549, "epoch": 1346} {"train_loss": -5.80178165435791, "global_step": 56550, "epoch": 1346} {"train_loss": -5.936324596405029, "global_step": 56551, "epoch": 1346} {"train_loss": -5.9206037521362305, "global_step": 56552, "epoch": 1346} {"train_loss": -5.728650093078613, "global_step": 56553, "epoch": 1346} {"train_loss": -5.895560264587402, "global_step": 56554, "epoch": 1346} {"train_loss": -5.8972272872924805, "global_step": 56555, "epoch": 1346} {"train_loss": -5.814638614654541, "global_step": 56556, "epoch": 1346} {"train_loss": -5.8182477951049805, "global_step": 56557, "epoch": 1346} {"train_loss": -5.896121025085449, "global_step": 56558, "epoch": 1346} {"train_loss": -5.832048416137695, "global_step": 56559, "epoch": 1346} {"train_loss": -5.898522853851318, "global_step": 56560, "epoch": 1346} {"train_loss": -5.826582908630371, "global_step": 56561, "epoch": 1346} {"train_loss": -5.859691619873047, "global_step": 56562, "epoch": 1346} {"train_loss": -5.923637390136719, "global_step": 56563, "epoch": 1346} {"train_loss": -5.825237274169922, "global_step": 56564, "epoch": 1346} {"train_loss": -5.871668815612793, "global_step": 56565, "epoch": 1346} {"train_loss": -5.852914810180664, "global_step": 56566, "epoch": 1346} {"train_loss": -6.001029968261719, "global_step": 56567, "epoch": 1346} {"train_loss": -5.817140579223633, "global_step": 56568, "epoch": 1346} {"train_loss": -5.804952621459961, "global_step": 56569, "epoch": 1346} {"train_loss": -5.835179328918457, "global_step": 56570, "epoch": 1346} {"train_loss": -5.856965065002441, "global_step": 56571, "epoch": 1346} {"train_loss": -5.888233184814453, "global_step": 56572, "epoch": 1346} {"train_loss": -5.87632155418396, "global_step": 56573, "epoch": 1346, "val_loss": 61493.4609375} {"train_loss": -5.890794277191162, "global_step": 56574, "epoch": 1347} {"train_loss": -5.7942914962768555, "global_step": 56575, "epoch": 1347} {"train_loss": -5.868886947631836, "global_step": 56576, "epoch": 1347} {"train_loss": -5.848732948303223, "global_step": 56577, "epoch": 1347} {"train_loss": -5.744119644165039, "global_step": 56578, "epoch": 1347} {"train_loss": -5.7734150886535645, "global_step": 56579, "epoch": 1347} {"train_loss": -5.807291030883789, "global_step": 56580, "epoch": 1347} {"train_loss": -5.833039283752441, "global_step": 56581, "epoch": 1347} {"train_loss": -5.707347869873047, "global_step": 56582, "epoch": 1347} {"train_loss": -5.889026641845703, "global_step": 56583, "epoch": 1347} {"train_loss": -5.893281936645508, "global_step": 56584, "epoch": 1347} {"train_loss": -5.825991630554199, "global_step": 56585, "epoch": 1347} {"train_loss": -5.834897041320801, "global_step": 56586, "epoch": 1347} {"train_loss": -5.899486541748047, "global_step": 56587, "epoch": 1347} {"train_loss": -5.795205116271973, "global_step": 56588, "epoch": 1347} {"train_loss": -5.8270583152771, "global_step": 56589, "epoch": 1347} {"train_loss": -5.804706573486328, "global_step": 56590, "epoch": 1347} {"train_loss": -5.883419036865234, "global_step": 56591, "epoch": 1347} {"train_loss": -5.827103614807129, "global_step": 56592, "epoch": 1347} {"train_loss": -5.930267810821533, "global_step": 56593, "epoch": 1347} {"train_loss": -5.918717384338379, "global_step": 56594, "epoch": 1347} {"train_loss": -5.825865268707275, "global_step": 56595, "epoch": 1347} {"train_loss": -5.875028610229492, "global_step": 56596, "epoch": 1347} {"train_loss": -5.893610954284668, "global_step": 56597, "epoch": 1347} {"train_loss": -5.714725971221924, "global_step": 56598, "epoch": 1347} {"train_loss": -5.919437408447266, "global_step": 56599, "epoch": 1347} {"train_loss": -5.793028831481934, "global_step": 56600, "epoch": 1347} {"train_loss": -5.85002326965332, "global_step": 56601, "epoch": 1347} {"train_loss": -5.992791175842285, "global_step": 56602, "epoch": 1347} {"train_loss": -5.932356834411621, "global_step": 56603, "epoch": 1347} {"train_loss": -5.90885066986084, "global_step": 56604, "epoch": 1347} {"train_loss": -5.835172176361084, "global_step": 56605, "epoch": 1347} {"train_loss": -5.8249921798706055, "global_step": 56606, "epoch": 1347} {"train_loss": -5.888670921325684, "global_step": 56607, "epoch": 1347} {"train_loss": -5.814945220947266, "global_step": 56608, "epoch": 1347} {"train_loss": -5.886664390563965, "global_step": 56609, "epoch": 1347} {"train_loss": -5.931530952453613, "global_step": 56610, "epoch": 1347} {"train_loss": -5.87026309967041, "global_step": 56611, "epoch": 1347} {"train_loss": -5.857872009277344, "global_step": 56612, "epoch": 1347} {"train_loss": -5.94861364364624, "global_step": 56613, "epoch": 1347} {"train_loss": -5.791310787200928, "global_step": 56614, "epoch": 1347} {"train_loss": -5.8508192130497525, "global_step": 56615, "epoch": 1347, "val_loss": 61360.6796875} {"train_loss": -5.918631076812744, "global_step": 56616, "epoch": 1348} {"train_loss": -5.910707473754883, "global_step": 56617, "epoch": 1348} {"train_loss": -5.853156089782715, "global_step": 56618, "epoch": 1348} {"train_loss": -5.773957252502441, "global_step": 56619, "epoch": 1348} {"train_loss": -5.924099445343018, "global_step": 56620, "epoch": 1348} {"train_loss": -5.863127708435059, "global_step": 56621, "epoch": 1348} {"train_loss": -5.821066856384277, "global_step": 56622, "epoch": 1348} {"train_loss": -5.932831764221191, "global_step": 56623, "epoch": 1348} {"train_loss": -5.928582191467285, "global_step": 56624, "epoch": 1348} {"train_loss": -5.804727554321289, "global_step": 56625, "epoch": 1348} {"train_loss": -5.917414665222168, "global_step": 56626, "epoch": 1348} {"train_loss": -5.806121826171875, "global_step": 56627, "epoch": 1348} {"train_loss": -5.921064853668213, "global_step": 56628, "epoch": 1348} {"train_loss": -5.760507583618164, "global_step": 56629, "epoch": 1348} {"train_loss": -5.8170084953308105, "global_step": 56630, "epoch": 1348} {"train_loss": -5.828261375427246, "global_step": 56631, "epoch": 1348} {"train_loss": -5.924233913421631, "global_step": 56632, "epoch": 1348} {"train_loss": -5.944766521453857, "global_step": 56633, "epoch": 1348} {"train_loss": -5.965399742126465, "global_step": 56634, "epoch": 1348} {"train_loss": -5.939384460449219, "global_step": 56635, "epoch": 1348} {"train_loss": -5.771884918212891, "global_step": 56636, "epoch": 1348} {"train_loss": -5.792241096496582, "global_step": 56637, "epoch": 1348} {"train_loss": -5.879851341247559, "global_step": 56638, "epoch": 1348} {"train_loss": -5.860952854156494, "global_step": 56639, "epoch": 1348} {"train_loss": -5.840726852416992, "global_step": 56640, "epoch": 1348} {"train_loss": -5.940804481506348, "global_step": 56641, "epoch": 1348} {"train_loss": -5.829273700714111, "global_step": 56642, "epoch": 1348} {"train_loss": -5.9374284744262695, "global_step": 56643, "epoch": 1348} {"train_loss": -5.88585901260376, "global_step": 56644, "epoch": 1348} {"train_loss": -5.812838554382324, "global_step": 56645, "epoch": 1348} {"train_loss": -5.95570707321167, "global_step": 56646, "epoch": 1348} {"train_loss": -5.866745948791504, "global_step": 56647, "epoch": 1348} {"train_loss": -5.891181945800781, "global_step": 56648, "epoch": 1348} {"train_loss": -5.879072189331055, "global_step": 56649, "epoch": 1348} {"train_loss": -5.931929111480713, "global_step": 56650, "epoch": 1348} {"train_loss": -5.948920726776123, "global_step": 56651, "epoch": 1348} {"train_loss": -5.784897804260254, "global_step": 56652, "epoch": 1348} {"train_loss": -6.026059150695801, "global_step": 56653, "epoch": 1348} {"train_loss": -5.829973220825195, "global_step": 56654, "epoch": 1348} {"train_loss": -5.811370849609375, "global_step": 56655, "epoch": 1348} {"train_loss": -5.779007911682129, "global_step": 56656, "epoch": 1348} {"train_loss": -5.874586582183838, "global_step": 56657, "epoch": 1348, "val_loss": 61525.42578125} {"train_loss": -5.707396030426025, "global_step": 56658, "epoch": 1349} {"train_loss": -5.801059246063232, "global_step": 56659, "epoch": 1349} {"train_loss": -5.826727390289307, "global_step": 56660, "epoch": 1349} {"train_loss": -5.785313606262207, "global_step": 56661, "epoch": 1349} {"train_loss": -5.943571090698242, "global_step": 56662, "epoch": 1349} {"train_loss": -5.881195068359375, "global_step": 56663, "epoch": 1349} {"train_loss": -5.784963607788086, "global_step": 56664, "epoch": 1349} {"train_loss": -5.8131279945373535, "global_step": 56665, "epoch": 1349} {"train_loss": -5.888637542724609, "global_step": 56666, "epoch": 1349} {"train_loss": -5.820137023925781, "global_step": 56667, "epoch": 1349} {"train_loss": -5.757867813110352, "global_step": 56668, "epoch": 1349} {"train_loss": -5.751553535461426, "global_step": 56669, "epoch": 1349} {"train_loss": -5.887377738952637, "global_step": 56670, "epoch": 1349} {"train_loss": -5.950551986694336, "global_step": 56671, "epoch": 1349} {"train_loss": -5.978412628173828, "global_step": 56672, "epoch": 1349} {"train_loss": -5.942680358886719, "global_step": 56673, "epoch": 1349} {"train_loss": -5.898468017578125, "global_step": 56674, "epoch": 1349} {"train_loss": -5.954561233520508, "global_step": 56675, "epoch": 1349} {"train_loss": -5.882866859436035, "global_step": 56676, "epoch": 1349} {"train_loss": -5.949347496032715, "global_step": 56677, "epoch": 1349} {"train_loss": -5.789093017578125, "global_step": 56678, "epoch": 1349} {"train_loss": -5.923710823059082, "global_step": 56679, "epoch": 1349} {"train_loss": -5.841564655303955, "global_step": 56680, "epoch": 1349} {"train_loss": -5.988992691040039, "global_step": 56681, "epoch": 1349} {"train_loss": -5.849418640136719, "global_step": 56682, "epoch": 1349} {"train_loss": -5.817479610443115, "global_step": 56683, "epoch": 1349} {"train_loss": -5.847473621368408, "global_step": 56684, "epoch": 1349} {"train_loss": -5.891460418701172, "global_step": 56685, "epoch": 1349} {"train_loss": -5.873324394226074, "global_step": 56686, "epoch": 1349} {"train_loss": -5.918910026550293, "global_step": 56687, "epoch": 1349} {"train_loss": -5.72876501083374, "global_step": 56688, "epoch": 1349} {"train_loss": -5.849634170532227, "global_step": 56689, "epoch": 1349} {"train_loss": -5.89697265625, "global_step": 56690, "epoch": 1349} {"train_loss": -5.853851318359375, "global_step": 56691, "epoch": 1349} {"train_loss": -5.962098121643066, "global_step": 56692, "epoch": 1349} {"train_loss": -5.76982307434082, "global_step": 56693, "epoch": 1349} {"train_loss": -5.798691749572754, "global_step": 56694, "epoch": 1349} {"train_loss": -5.821378231048584, "global_step": 56695, "epoch": 1349} {"train_loss": -5.853610992431641, "global_step": 56696, "epoch": 1349} {"train_loss": -5.7802276611328125, "global_step": 56697, "epoch": 1349} {"train_loss": -5.920635223388672, "global_step": 56698, "epoch": 1349} {"train_loss": -5.85610674676441, "global_step": 56699, "epoch": 1349, "val_loss": 61423.59375} {"train_loss": -5.730215072631836, "global_step": 56700, "epoch": 1350} {"train_loss": -5.842918395996094, "global_step": 56701, "epoch": 1350} {"train_loss": -5.8098649978637695, "global_step": 56702, "epoch": 1350} {"train_loss": -5.741636276245117, "global_step": 56703, "epoch": 1350} {"train_loss": -5.747584342956543, "global_step": 56704, "epoch": 1350} {"train_loss": -5.882691860198975, "global_step": 56705, "epoch": 1350} {"train_loss": -5.784515380859375, "global_step": 56706, "epoch": 1350} {"train_loss": -5.849503517150879, "global_step": 56707, "epoch": 1350} {"train_loss": -5.8943915367126465, "global_step": 56708, "epoch": 1350} {"train_loss": -5.729945182800293, "global_step": 56709, "epoch": 1350} {"train_loss": -5.916909694671631, "global_step": 56710, "epoch": 1350} {"train_loss": -5.689757823944092, "global_step": 56711, "epoch": 1350} {"train_loss": -5.826390266418457, "global_step": 56712, "epoch": 1350} {"train_loss": -5.666753768920898, "global_step": 56713, "epoch": 1350} {"train_loss": -5.813584327697754, "global_step": 56714, "epoch": 1350} {"train_loss": -5.911445617675781, "global_step": 56715, "epoch": 1350} {"train_loss": -5.713285446166992, "global_step": 56716, "epoch": 1350} {"train_loss": -5.897164344787598, "global_step": 56717, "epoch": 1350} {"train_loss": -5.760045528411865, "global_step": 56718, "epoch": 1350} {"train_loss": -5.876874923706055, "global_step": 56719, "epoch": 1350} {"train_loss": -5.9236626625061035, "global_step": 56720, "epoch": 1350} {"train_loss": -5.784940719604492, "global_step": 56721, "epoch": 1350} {"train_loss": -5.968926429748535, "global_step": 56722, "epoch": 1350} {"train_loss": -5.93365478515625, "global_step": 56723, "epoch": 1350} {"train_loss": -5.970062732696533, "global_step": 56724, "epoch": 1350} {"train_loss": -5.925377368927002, "global_step": 56725, "epoch": 1350} {"train_loss": -5.903291702270508, "global_step": 56726, "epoch": 1350} {"train_loss": -5.828693389892578, "global_step": 56727, "epoch": 1350} {"train_loss": -5.8611040115356445, "global_step": 56728, "epoch": 1350} {"train_loss": -5.953721523284912, "global_step": 56729, "epoch": 1350} {"train_loss": -5.777019023895264, "global_step": 56730, "epoch": 1350} {"train_loss": -5.782979965209961, "global_step": 56731, "epoch": 1350} {"train_loss": -5.84608268737793, "global_step": 56732, "epoch": 1350} {"train_loss": -5.804369926452637, "global_step": 56733, "epoch": 1350} {"train_loss": -5.839847564697266, "global_step": 56734, "epoch": 1350} {"train_loss": -5.8352508544921875, "global_step": 56735, "epoch": 1350} {"train_loss": -5.8763427734375, "global_step": 56736, "epoch": 1350} {"train_loss": -5.865555763244629, "global_step": 56737, "epoch": 1350} {"train_loss": -5.764363765716553, "global_step": 56738, "epoch": 1350} {"train_loss": -5.827709197998047, "global_step": 56739, "epoch": 1350} {"train_loss": -5.938238143920898, "global_step": 56740, "epoch": 1350} {"train_loss": -5.836243198031471, "global_step": 56741, "epoch": 1350, "train/sim_max_reward_0": 0.8874279077983072, "train/sim_max_reward_1": 0.28669132500729255, "train/sim_max_reward_2": 0.9474486824080085, "train/sim_max_reward_3": 0.3811695348555378, "train/sim_max_reward_4": 0.9440267506896475, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.12097936507752381, "test/sim_max_reward_4300001": 0.21452909033932474, "test/sim_max_reward_4300002": 0.5261179367472234, "test/sim_max_reward_4300003": 0.8561989378108441, "test/sim_max_reward_4300004": 0.2690615785059859, "test/sim_max_reward_4300005": 0.8348696351647833, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.33463346083579576, "test/sim_max_reward_4300008": 0.8229961029958173, "test/sim_max_reward_4300009": 0.8788800944657604, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.3289409759738505, "test/sim_max_reward_4300012": 0.8289012154528108, "test/sim_max_reward_4300013": 0.9097010542094761, "test/sim_max_reward_4300014": 0.8855510496459011, "test/sim_max_reward_4300015": 0.9131475951099305, "test/sim_max_reward_4300016": 0.77087842387374, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.44551173170030656, "test/sim_max_reward_4300019": 0.1863158451594081, "test/sim_max_reward_4300020": 0.4230504371058723, "test/sim_max_reward_4300021": 0.9518474793763133, "test/sim_max_reward_4300022": 0.20932812423783353, "test/sim_max_reward_4300023": 0.3832959398180492, "test/sim_max_reward_4300024": 0.44777919103942093, "test/sim_max_reward_4300025": 0.3901008619220918, "test/sim_max_reward_4300026": 0.7965099762068483, "test/sim_max_reward_4300027": 0.7782986007402636, "test/sim_max_reward_4300028": 0.0003899244815575443, "test/sim_max_reward_4300029": 0.024089253863053158, "test/sim_max_reward_4300030": 0.22373126432930465, "test/sim_max_reward_4300031": 0.8015203439310356, "test/sim_max_reward_4300032": 0.6951809402811463, "test/sim_max_reward_4300033": 0.47155301034403435, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.4732073996203933, "test/sim_max_reward_4300037": 0.731557481966026, "test/sim_max_reward_4300038": 0.9526882987499942, "test/sim_max_reward_4300039": 0.9145624194820989, "test/sim_max_reward_4300040": 0.8689512836414058, "test/sim_max_reward_4300041": 0.6063221920234504, "test/sim_max_reward_4300042": 0.7131554110706391, "test/sim_max_reward_4300043": 0.1587039331120286, "test/sim_max_reward_4300044": 0.8711588618246325, "test/sim_max_reward_4300045": 0.9774253209784598, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.5351672144333558, "test/sim_max_reward_4300048": 0.9558838932737888, "test/sim_max_reward_4300049": 0.9643192067456036, "train/mean_score": 0.6066248266868302, "test/mean_score": 0.5689398471533437, "val_loss": 61461.22265625} {"train_loss": -5.809462547302246, "global_step": 56742, "epoch": 1351} {"train_loss": -5.917489051818848, "global_step": 56743, "epoch": 1351} {"train_loss": -5.924987316131592, "global_step": 56744, "epoch": 1351} {"train_loss": -5.796091556549072, "global_step": 56745, "epoch": 1351} {"train_loss": -5.926496505737305, "global_step": 56746, "epoch": 1351} {"train_loss": -6.0344767570495605, "global_step": 56747, "epoch": 1351} {"train_loss": -5.943449020385742, "global_step": 56748, "epoch": 1351} {"train_loss": -5.801258563995361, "global_step": 56749, "epoch": 1351} {"train_loss": -5.854277610778809, "global_step": 56750, "epoch": 1351} {"train_loss": -5.835433006286621, "global_step": 56751, "epoch": 1351} {"train_loss": -5.936784267425537, "global_step": 56752, "epoch": 1351} {"train_loss": -5.967684268951416, "global_step": 56753, "epoch": 1351} {"train_loss": -5.78608512878418, "global_step": 56754, "epoch": 1351} {"train_loss": -5.83149528503418, "global_step": 56755, "epoch": 1351} {"train_loss": -5.726687431335449, "global_step": 56756, "epoch": 1351} {"train_loss": -5.87169885635376, "global_step": 56757, "epoch": 1351} {"train_loss": -5.867255687713623, "global_step": 56758, "epoch": 1351} {"train_loss": -5.807861328125, "global_step": 56759, "epoch": 1351} {"train_loss": -5.775357246398926, "global_step": 56760, "epoch": 1351} {"train_loss": -5.827031135559082, "global_step": 56761, "epoch": 1351} {"train_loss": -5.962217330932617, "global_step": 56762, "epoch": 1351} {"train_loss": -5.8134379386901855, "global_step": 56763, "epoch": 1351} {"train_loss": -5.786097526550293, "global_step": 56764, "epoch": 1351} {"train_loss": -5.811717987060547, "global_step": 56765, "epoch": 1351} {"train_loss": -5.839285850524902, "global_step": 56766, "epoch": 1351} {"train_loss": -5.898562908172607, "global_step": 56767, "epoch": 1351} {"train_loss": -5.772875785827637, "global_step": 56768, "epoch": 1351} {"train_loss": -5.782619476318359, "global_step": 56769, "epoch": 1351} {"train_loss": -5.882031440734863, "global_step": 56770, "epoch": 1351} {"train_loss": -5.790431976318359, "global_step": 56771, "epoch": 1351} {"train_loss": -5.812928199768066, "global_step": 56772, "epoch": 1351} {"train_loss": -5.877322673797607, "global_step": 56773, "epoch": 1351} {"train_loss": -5.801568031311035, "global_step": 56774, "epoch": 1351} {"train_loss": -5.903571128845215, "global_step": 56775, "epoch": 1351} {"train_loss": -5.8297014236450195, "global_step": 56776, "epoch": 1351} {"train_loss": -5.818096160888672, "global_step": 56777, "epoch": 1351} {"train_loss": -5.779379844665527, "global_step": 56778, "epoch": 1351} {"train_loss": -5.663861274719238, "global_step": 56779, "epoch": 1351} {"train_loss": -5.910717487335205, "global_step": 56780, "epoch": 1351} {"train_loss": -5.961599349975586, "global_step": 56781, "epoch": 1351} {"train_loss": -5.681972980499268, "global_step": 56782, "epoch": 1351} {"train_loss": -5.845378830319359, "global_step": 56783, "epoch": 1351, "val_loss": 61465.41796875} {"train_loss": -5.868372917175293, "global_step": 56784, "epoch": 1352} {"train_loss": -5.9005327224731445, "global_step": 56785, "epoch": 1352} {"train_loss": -5.84581184387207, "global_step": 56786, "epoch": 1352} {"train_loss": -5.8416972160339355, "global_step": 56787, "epoch": 1352} {"train_loss": -5.845612049102783, "global_step": 56788, "epoch": 1352} {"train_loss": -5.827328681945801, "global_step": 56789, "epoch": 1352} {"train_loss": -5.822185516357422, "global_step": 56790, "epoch": 1352} {"train_loss": -5.754817962646484, "global_step": 56791, "epoch": 1352} {"train_loss": -5.903312683105469, "global_step": 56792, "epoch": 1352} {"train_loss": -5.749203681945801, "global_step": 56793, "epoch": 1352} {"train_loss": -5.873903274536133, "global_step": 56794, "epoch": 1352} {"train_loss": -5.804939270019531, "global_step": 56795, "epoch": 1352} {"train_loss": -5.7689528465271, "global_step": 56796, "epoch": 1352} {"train_loss": -5.95858097076416, "global_step": 56797, "epoch": 1352} {"train_loss": -5.865683078765869, "global_step": 56798, "epoch": 1352} {"train_loss": -5.825720310211182, "global_step": 56799, "epoch": 1352} {"train_loss": -5.809171676635742, "global_step": 56800, "epoch": 1352} {"train_loss": -5.981729507446289, "global_step": 56801, "epoch": 1352} {"train_loss": -5.949407577514648, "global_step": 56802, "epoch": 1352} {"train_loss": -5.661846160888672, "global_step": 56803, "epoch": 1352} {"train_loss": -5.928444862365723, "global_step": 56804, "epoch": 1352} {"train_loss": -5.825192451477051, "global_step": 56805, "epoch": 1352} {"train_loss": -5.8974409103393555, "global_step": 56806, "epoch": 1352} {"train_loss": -5.931866645812988, "global_step": 56807, "epoch": 1352} {"train_loss": -5.8814697265625, "global_step": 56808, "epoch": 1352} {"train_loss": -5.851713180541992, "global_step": 56809, "epoch": 1352} {"train_loss": -5.827722549438477, "global_step": 56810, "epoch": 1352} {"train_loss": -5.780434608459473, "global_step": 56811, "epoch": 1352} {"train_loss": -5.957369804382324, "global_step": 56812, "epoch": 1352} {"train_loss": -5.8072509765625, "global_step": 56813, "epoch": 1352} {"train_loss": -5.71295166015625, "global_step": 56814, "epoch": 1352} {"train_loss": -5.87296724319458, "global_step": 56815, "epoch": 1352} {"train_loss": -5.724595069885254, "global_step": 56816, "epoch": 1352} {"train_loss": -5.722725868225098, "global_step": 56817, "epoch": 1352} {"train_loss": -5.885613441467285, "global_step": 56818, "epoch": 1352} {"train_loss": -5.763340473175049, "global_step": 56819, "epoch": 1352} {"train_loss": -5.864648818969727, "global_step": 56820, "epoch": 1352} {"train_loss": -5.6793131828308105, "global_step": 56821, "epoch": 1352} {"train_loss": -5.788882255554199, "global_step": 56822, "epoch": 1352} {"train_loss": -5.9117655754089355, "global_step": 56823, "epoch": 1352} {"train_loss": -5.864078044891357, "global_step": 56824, "epoch": 1352} {"train_loss": -5.838105031422207, "global_step": 56825, "epoch": 1352, "val_loss": 61386.7421875} {"train_loss": -5.9340925216674805, "global_step": 56826, "epoch": 1353} {"train_loss": -5.873912811279297, "global_step": 56827, "epoch": 1353} {"train_loss": -5.795544147491455, "global_step": 56828, "epoch": 1353} {"train_loss": -5.7805938720703125, "global_step": 56829, "epoch": 1353} {"train_loss": -5.788832664489746, "global_step": 56830, "epoch": 1353} {"train_loss": -5.778911590576172, "global_step": 56831, "epoch": 1353} {"train_loss": -5.808973789215088, "global_step": 56832, "epoch": 1353} {"train_loss": -5.757491588592529, "global_step": 56833, "epoch": 1353} {"train_loss": -5.864391326904297, "global_step": 56834, "epoch": 1353} {"train_loss": -5.902031898498535, "global_step": 56835, "epoch": 1353} {"train_loss": -5.8645524978637695, "global_step": 56836, "epoch": 1353} {"train_loss": -5.854901313781738, "global_step": 56837, "epoch": 1353} {"train_loss": -5.757078170776367, "global_step": 56838, "epoch": 1353} {"train_loss": -5.911012649536133, "global_step": 56839, "epoch": 1353} {"train_loss": -5.635315895080566, "global_step": 56840, "epoch": 1353} {"train_loss": -5.792387008666992, "global_step": 56841, "epoch": 1353} {"train_loss": -5.939598083496094, "global_step": 56842, "epoch": 1353} {"train_loss": -5.728484153747559, "global_step": 56843, "epoch": 1353} {"train_loss": -5.929750442504883, "global_step": 56844, "epoch": 1353} {"train_loss": -5.639375686645508, "global_step": 56845, "epoch": 1353} {"train_loss": -5.790361404418945, "global_step": 56846, "epoch": 1353} {"train_loss": -5.709573745727539, "global_step": 56847, "epoch": 1353} {"train_loss": -5.808787822723389, "global_step": 56848, "epoch": 1353} {"train_loss": -5.783995151519775, "global_step": 56849, "epoch": 1353} {"train_loss": -5.764789581298828, "global_step": 56850, "epoch": 1353} {"train_loss": -5.797961235046387, "global_step": 56851, "epoch": 1353} {"train_loss": -5.750643253326416, "global_step": 56852, "epoch": 1353} {"train_loss": -5.877830982208252, "global_step": 56853, "epoch": 1353} {"train_loss": -5.790165901184082, "global_step": 56854, "epoch": 1353} {"train_loss": -5.82236909866333, "global_step": 56855, "epoch": 1353} {"train_loss": -5.862669944763184, "global_step": 56856, "epoch": 1353} {"train_loss": -5.834523677825928, "global_step": 56857, "epoch": 1353} {"train_loss": -5.852066516876221, "global_step": 56858, "epoch": 1353} {"train_loss": -5.973179340362549, "global_step": 56859, "epoch": 1353} {"train_loss": -5.935919761657715, "global_step": 56860, "epoch": 1353} {"train_loss": -5.762345314025879, "global_step": 56861, "epoch": 1353} {"train_loss": -5.888226509094238, "global_step": 56862, "epoch": 1353} {"train_loss": -5.881181716918945, "global_step": 56863, "epoch": 1353} {"train_loss": -5.879324913024902, "global_step": 56864, "epoch": 1353} {"train_loss": -5.767374515533447, "global_step": 56865, "epoch": 1353} {"train_loss": -5.946331977844238, "global_step": 56866, "epoch": 1353} {"train_loss": -5.825857900437855, "global_step": 56867, "epoch": 1353, "val_loss": 61298.3671875} {"train_loss": -5.911202907562256, "global_step": 56868, "epoch": 1354} {"train_loss": -5.990933418273926, "global_step": 56869, "epoch": 1354} {"train_loss": -5.947229385375977, "global_step": 56870, "epoch": 1354} {"train_loss": -5.894250392913818, "global_step": 56871, "epoch": 1354} {"train_loss": -6.004340648651123, "global_step": 56872, "epoch": 1354} {"train_loss": -5.854030609130859, "global_step": 56873, "epoch": 1354} {"train_loss": -5.775173187255859, "global_step": 56874, "epoch": 1354} {"train_loss": -5.986904144287109, "global_step": 56875, "epoch": 1354} {"train_loss": -5.8675336837768555, "global_step": 56876, "epoch": 1354} {"train_loss": -5.874322891235352, "global_step": 56877, "epoch": 1354} {"train_loss": -5.864936828613281, "global_step": 56878, "epoch": 1354} {"train_loss": -5.796262264251709, "global_step": 56879, "epoch": 1354} {"train_loss": -5.902749061584473, "global_step": 56880, "epoch": 1354} {"train_loss": -5.847248554229736, "global_step": 56881, "epoch": 1354} {"train_loss": -5.903826713562012, "global_step": 56882, "epoch": 1354} {"train_loss": -5.878870487213135, "global_step": 56883, "epoch": 1354} {"train_loss": -5.846654891967773, "global_step": 56884, "epoch": 1354} {"train_loss": -5.972925186157227, "global_step": 56885, "epoch": 1354} {"train_loss": -5.89934778213501, "global_step": 56886, "epoch": 1354} {"train_loss": -5.887828826904297, "global_step": 56887, "epoch": 1354} {"train_loss": -5.838920593261719, "global_step": 56888, "epoch": 1354} {"train_loss": -5.844076633453369, "global_step": 56889, "epoch": 1354} {"train_loss": -5.932041168212891, "global_step": 56890, "epoch": 1354} {"train_loss": -5.825076103210449, "global_step": 56891, "epoch": 1354} {"train_loss": -5.854770183563232, "global_step": 56892, "epoch": 1354} {"train_loss": -5.773660659790039, "global_step": 56893, "epoch": 1354} {"train_loss": -5.806797027587891, "global_step": 56894, "epoch": 1354} {"train_loss": -5.82088565826416, "global_step": 56895, "epoch": 1354} {"train_loss": -5.785632133483887, "global_step": 56896, "epoch": 1354} {"train_loss": -5.8358845710754395, "global_step": 56897, "epoch": 1354} {"train_loss": -5.874799728393555, "global_step": 56898, "epoch": 1354} {"train_loss": -5.8474555015563965, "global_step": 56899, "epoch": 1354} {"train_loss": -5.76834774017334, "global_step": 56900, "epoch": 1354} {"train_loss": -5.7944865226745605, "global_step": 56901, "epoch": 1354} {"train_loss": -5.645471572875977, "global_step": 56902, "epoch": 1354} {"train_loss": -5.851354598999023, "global_step": 56903, "epoch": 1354} {"train_loss": -5.783991813659668, "global_step": 56904, "epoch": 1354} {"train_loss": -5.965122699737549, "global_step": 56905, "epoch": 1354} {"train_loss": -5.826931476593018, "global_step": 56906, "epoch": 1354} {"train_loss": -5.772665977478027, "global_step": 56907, "epoch": 1354} {"train_loss": -5.9319658279418945, "global_step": 56908, "epoch": 1354} {"train_loss": -5.860620498657227, "global_step": 56909, "epoch": 1354, "val_loss": 61531.359375} {"train_loss": -5.889230728149414, "global_step": 56910, "epoch": 1355} {"train_loss": -5.902576923370361, "global_step": 56911, "epoch": 1355} {"train_loss": -5.896930694580078, "global_step": 56912, "epoch": 1355} {"train_loss": -5.849394798278809, "global_step": 56913, "epoch": 1355} {"train_loss": -5.9350714683532715, "global_step": 56914, "epoch": 1355} {"train_loss": -5.901043891906738, "global_step": 56915, "epoch": 1355} {"train_loss": -5.9027886390686035, "global_step": 56916, "epoch": 1355} {"train_loss": -5.958444118499756, "global_step": 56917, "epoch": 1355} {"train_loss": -5.807524681091309, "global_step": 56918, "epoch": 1355} {"train_loss": -5.78780460357666, "global_step": 56919, "epoch": 1355} {"train_loss": -5.912919998168945, "global_step": 56920, "epoch": 1355} {"train_loss": -5.918300151824951, "global_step": 56921, "epoch": 1355} {"train_loss": -5.890705108642578, "global_step": 56922, "epoch": 1355} {"train_loss": -5.808535575866699, "global_step": 56923, "epoch": 1355} {"train_loss": -5.874319553375244, "global_step": 56924, "epoch": 1355} {"train_loss": -5.946733474731445, "global_step": 56925, "epoch": 1355} {"train_loss": -5.922101020812988, "global_step": 56926, "epoch": 1355} {"train_loss": -5.889812469482422, "global_step": 56927, "epoch": 1355} {"train_loss": -5.825056076049805, "global_step": 56928, "epoch": 1355} {"train_loss": -5.867991924285889, "global_step": 56929, "epoch": 1355} {"train_loss": -5.898964881896973, "global_step": 56930, "epoch": 1355} {"train_loss": -5.77718448638916, "global_step": 56931, "epoch": 1355} {"train_loss": -5.8330559730529785, "global_step": 56932, "epoch": 1355} {"train_loss": -5.970527172088623, "global_step": 56933, "epoch": 1355} {"train_loss": -5.788588047027588, "global_step": 56934, "epoch": 1355} {"train_loss": -5.730083465576172, "global_step": 56935, "epoch": 1355} {"train_loss": -5.875908851623535, "global_step": 56936, "epoch": 1355} {"train_loss": -5.893712043762207, "global_step": 56937, "epoch": 1355} {"train_loss": -5.8383331298828125, "global_step": 56938, "epoch": 1355} {"train_loss": -5.844165802001953, "global_step": 56939, "epoch": 1355} {"train_loss": -5.874504089355469, "global_step": 56940, "epoch": 1355} {"train_loss": -5.801368713378906, "global_step": 56941, "epoch": 1355} {"train_loss": -5.808107376098633, "global_step": 56942, "epoch": 1355} {"train_loss": -5.655191421508789, "global_step": 56943, "epoch": 1355} {"train_loss": -5.911342620849609, "global_step": 56944, "epoch": 1355} {"train_loss": -5.814981460571289, "global_step": 56945, "epoch": 1355} {"train_loss": -5.746605396270752, "global_step": 56946, "epoch": 1355} {"train_loss": -5.710373401641846, "global_step": 56947, "epoch": 1355} {"train_loss": -5.836698055267334, "global_step": 56948, "epoch": 1355} {"train_loss": -5.764375686645508, "global_step": 56949, "epoch": 1355} {"train_loss": -5.824323654174805, "global_step": 56950, "epoch": 1355} {"train_loss": -5.848651988165719, "global_step": 56951, "epoch": 1355, "val_loss": 61385.50390625} {"train_loss": -5.778628349304199, "global_step": 56952, "epoch": 1356} {"train_loss": -5.795317649841309, "global_step": 56953, "epoch": 1356} {"train_loss": -5.771463394165039, "global_step": 56954, "epoch": 1356} {"train_loss": -5.82568359375, "global_step": 56955, "epoch": 1356} {"train_loss": -5.916903495788574, "global_step": 56956, "epoch": 1356} {"train_loss": -5.866197109222412, "global_step": 56957, "epoch": 1356} {"train_loss": -5.888602256774902, "global_step": 56958, "epoch": 1356} {"train_loss": -5.802455902099609, "global_step": 56959, "epoch": 1356} {"train_loss": -5.779331207275391, "global_step": 56960, "epoch": 1356} {"train_loss": -6.002170562744141, "global_step": 56961, "epoch": 1356} {"train_loss": -5.830399513244629, "global_step": 56962, "epoch": 1356} {"train_loss": -5.971131324768066, "global_step": 56963, "epoch": 1356} {"train_loss": -5.788887977600098, "global_step": 56964, "epoch": 1356} {"train_loss": -5.812236309051514, "global_step": 56965, "epoch": 1356} {"train_loss": -5.909767150878906, "global_step": 56966, "epoch": 1356} {"train_loss": -5.945489406585693, "global_step": 56967, "epoch": 1356} {"train_loss": -5.790814399719238, "global_step": 56968, "epoch": 1356} {"train_loss": -5.813908576965332, "global_step": 56969, "epoch": 1356} {"train_loss": -5.872601509094238, "global_step": 56970, "epoch": 1356} {"train_loss": -5.846069812774658, "global_step": 56971, "epoch": 1356} {"train_loss": -5.829341888427734, "global_step": 56972, "epoch": 1356} {"train_loss": -5.921668529510498, "global_step": 56973, "epoch": 1356} {"train_loss": -5.84050989151001, "global_step": 56974, "epoch": 1356} {"train_loss": -5.89167594909668, "global_step": 56975, "epoch": 1356} {"train_loss": -5.896162986755371, "global_step": 56976, "epoch": 1356} {"train_loss": -6.030673027038574, "global_step": 56977, "epoch": 1356} {"train_loss": -5.8208327293396, "global_step": 56978, "epoch": 1356} {"train_loss": -5.929791450500488, "global_step": 56979, "epoch": 1356} {"train_loss": -5.929408550262451, "global_step": 56980, "epoch": 1356} {"train_loss": -5.90707540512085, "global_step": 56981, "epoch": 1356} {"train_loss": -5.873477458953857, "global_step": 56982, "epoch": 1356} {"train_loss": -5.927731037139893, "global_step": 56983, "epoch": 1356} {"train_loss": -5.799201011657715, "global_step": 56984, "epoch": 1356} {"train_loss": -5.93839693069458, "global_step": 56985, "epoch": 1356} {"train_loss": -5.825146198272705, "global_step": 56986, "epoch": 1356} {"train_loss": -5.838199615478516, "global_step": 56987, "epoch": 1356} {"train_loss": -5.987737655639648, "global_step": 56988, "epoch": 1356} {"train_loss": -5.929109573364258, "global_step": 56989, "epoch": 1356} {"train_loss": -5.744182586669922, "global_step": 56990, "epoch": 1356} {"train_loss": -5.858330726623535, "global_step": 56991, "epoch": 1356} {"train_loss": -5.764165878295898, "global_step": 56992, "epoch": 1356} {"train_loss": -5.864357074101766, "global_step": 56993, "epoch": 1356, "val_loss": 61643.3828125} {"train_loss": -5.9473114013671875, "global_step": 56994, "epoch": 1357} {"train_loss": -5.868893146514893, "global_step": 56995, "epoch": 1357} {"train_loss": -5.689822196960449, "global_step": 56996, "epoch": 1357} {"train_loss": -5.898904800415039, "global_step": 56997, "epoch": 1357} {"train_loss": -6.015103340148926, "global_step": 56998, "epoch": 1357} {"train_loss": -5.72226095199585, "global_step": 56999, "epoch": 1357} {"train_loss": -5.882991790771484, "global_step": 57000, "epoch": 1357} {"train_loss": -5.801353931427002, "global_step": 57001, "epoch": 1357} {"train_loss": -5.931665420532227, "global_step": 57002, "epoch": 1357} {"train_loss": -5.803749084472656, "global_step": 57003, "epoch": 1357} {"train_loss": -5.786285877227783, "global_step": 57004, "epoch": 1357} {"train_loss": -5.827169895172119, "global_step": 57005, "epoch": 1357} {"train_loss": -5.920952796936035, "global_step": 57006, "epoch": 1357} {"train_loss": -5.822771072387695, "global_step": 57007, "epoch": 1357} {"train_loss": -5.9104766845703125, "global_step": 57008, "epoch": 1357} {"train_loss": -5.874918460845947, "global_step": 57009, "epoch": 1357} {"train_loss": -5.864726543426514, "global_step": 57010, "epoch": 1357} {"train_loss": -5.883646488189697, "global_step": 57011, "epoch": 1357} {"train_loss": -5.847587585449219, "global_step": 57012, "epoch": 1357} {"train_loss": -5.81840705871582, "global_step": 57013, "epoch": 1357} {"train_loss": -5.827095985412598, "global_step": 57014, "epoch": 1357} {"train_loss": -5.981277942657471, "global_step": 57015, "epoch": 1357} {"train_loss": -5.932710647583008, "global_step": 57016, "epoch": 1357} {"train_loss": -5.873922348022461, "global_step": 57017, "epoch": 1357} {"train_loss": -5.889828681945801, "global_step": 57018, "epoch": 1357} {"train_loss": -5.927925109863281, "global_step": 57019, "epoch": 1357} {"train_loss": -5.786919116973877, "global_step": 57020, "epoch": 1357} {"train_loss": -5.916244029998779, "global_step": 57021, "epoch": 1357} {"train_loss": -5.877804279327393, "global_step": 57022, "epoch": 1357} {"train_loss": -5.835054397583008, "global_step": 57023, "epoch": 1357} {"train_loss": -5.832102298736572, "global_step": 57024, "epoch": 1357} {"train_loss": -5.872284412384033, "global_step": 57025, "epoch": 1357} {"train_loss": -5.901871681213379, "global_step": 57026, "epoch": 1357} {"train_loss": -5.945443630218506, "global_step": 57027, "epoch": 1357} {"train_loss": -5.92745304107666, "global_step": 57028, "epoch": 1357} {"train_loss": -5.847381591796875, "global_step": 57029, "epoch": 1357} {"train_loss": -5.916292667388916, "global_step": 57030, "epoch": 1357} {"train_loss": -5.869719982147217, "global_step": 57031, "epoch": 1357} {"train_loss": -5.885481834411621, "global_step": 57032, "epoch": 1357} {"train_loss": -5.966424942016602, "global_step": 57033, "epoch": 1357} {"train_loss": -5.830161094665527, "global_step": 57034, "epoch": 1357} {"train_loss": -5.871811764580863, "global_step": 57035, "epoch": 1357, "val_loss": 61465.15625} {"train_loss": -5.984792709350586, "global_step": 57036, "epoch": 1358} {"train_loss": -5.865256309509277, "global_step": 57037, "epoch": 1358} {"train_loss": -5.889458656311035, "global_step": 57038, "epoch": 1358} {"train_loss": -5.815649032592773, "global_step": 57039, "epoch": 1358} {"train_loss": -5.981678485870361, "global_step": 57040, "epoch": 1358} {"train_loss": -5.890742301940918, "global_step": 57041, "epoch": 1358} {"train_loss": -5.8961591720581055, "global_step": 57042, "epoch": 1358} {"train_loss": -5.834033966064453, "global_step": 57043, "epoch": 1358} {"train_loss": -5.944319248199463, "global_step": 57044, "epoch": 1358} {"train_loss": -5.880344390869141, "global_step": 57045, "epoch": 1358} {"train_loss": -5.879939556121826, "global_step": 57046, "epoch": 1358} {"train_loss": -5.89243221282959, "global_step": 57047, "epoch": 1358} {"train_loss": -5.976393699645996, "global_step": 57048, "epoch": 1358} {"train_loss": -5.888024806976318, "global_step": 57049, "epoch": 1358} {"train_loss": -5.81418514251709, "global_step": 57050, "epoch": 1358} {"train_loss": -5.866575241088867, "global_step": 57051, "epoch": 1358} {"train_loss": -5.942596435546875, "global_step": 57052, "epoch": 1358} {"train_loss": -5.926939964294434, "global_step": 57053, "epoch": 1358} {"train_loss": -5.7974853515625, "global_step": 57054, "epoch": 1358} {"train_loss": -5.900940418243408, "global_step": 57055, "epoch": 1358} {"train_loss": -5.840271949768066, "global_step": 57056, "epoch": 1358} {"train_loss": -5.9073944091796875, "global_step": 57057, "epoch": 1358} {"train_loss": -5.914337158203125, "global_step": 57058, "epoch": 1358} {"train_loss": -5.942210674285889, "global_step": 57059, "epoch": 1358} {"train_loss": -5.868194580078125, "global_step": 57060, "epoch": 1358} {"train_loss": -5.984532356262207, "global_step": 57061, "epoch": 1358} {"train_loss": -5.893828868865967, "global_step": 57062, "epoch": 1358} {"train_loss": -5.925947666168213, "global_step": 57063, "epoch": 1358} {"train_loss": -5.897168159484863, "global_step": 57064, "epoch": 1358} {"train_loss": -5.932135581970215, "global_step": 57065, "epoch": 1358} {"train_loss": -5.940658092498779, "global_step": 57066, "epoch": 1358} {"train_loss": -5.774568557739258, "global_step": 57067, "epoch": 1358} {"train_loss": -5.852157115936279, "global_step": 57068, "epoch": 1358} {"train_loss": -5.890942573547363, "global_step": 57069, "epoch": 1358} {"train_loss": -5.98175573348999, "global_step": 57070, "epoch": 1358} {"train_loss": -5.884052753448486, "global_step": 57071, "epoch": 1358} {"train_loss": -5.793455123901367, "global_step": 57072, "epoch": 1358} {"train_loss": -5.88330078125, "global_step": 57073, "epoch": 1358} {"train_loss": -5.848818778991699, "global_step": 57074, "epoch": 1358} {"train_loss": -5.881954669952393, "global_step": 57075, "epoch": 1358} {"train_loss": -5.7703633308410645, "global_step": 57076, "epoch": 1358} {"train_loss": -5.888588337671189, "global_step": 57077, "epoch": 1358, "val_loss": 61264.38671875} {"train_loss": -5.857233047485352, "global_step": 57078, "epoch": 1359} {"train_loss": -5.904114246368408, "global_step": 57079, "epoch": 1359} {"train_loss": -5.938137054443359, "global_step": 57080, "epoch": 1359} {"train_loss": -5.865658760070801, "global_step": 57081, "epoch": 1359} {"train_loss": -5.785633087158203, "global_step": 57082, "epoch": 1359} {"train_loss": -5.869537353515625, "global_step": 57083, "epoch": 1359} {"train_loss": -5.872010707855225, "global_step": 57084, "epoch": 1359} {"train_loss": -5.9134745597839355, "global_step": 57085, "epoch": 1359} {"train_loss": -5.867006301879883, "global_step": 57086, "epoch": 1359} {"train_loss": -5.976224899291992, "global_step": 57087, "epoch": 1359} {"train_loss": -5.925588607788086, "global_step": 57088, "epoch": 1359} {"train_loss": -6.027783393859863, "global_step": 57089, "epoch": 1359} {"train_loss": -5.952942848205566, "global_step": 57090, "epoch": 1359} {"train_loss": -5.9342451095581055, "global_step": 57091, "epoch": 1359} {"train_loss": -5.928077697753906, "global_step": 57092, "epoch": 1359} {"train_loss": -5.918951034545898, "global_step": 57093, "epoch": 1359} {"train_loss": -5.782723903656006, "global_step": 57094, "epoch": 1359} {"train_loss": -5.753092288970947, "global_step": 57095, "epoch": 1359} {"train_loss": -5.883408069610596, "global_step": 57096, "epoch": 1359} {"train_loss": -5.975129127502441, "global_step": 57097, "epoch": 1359} {"train_loss": -5.982706069946289, "global_step": 57098, "epoch": 1359} {"train_loss": -5.99553918838501, "global_step": 57099, "epoch": 1359} {"train_loss": -5.900434494018555, "global_step": 57100, "epoch": 1359} {"train_loss": -5.886747360229492, "global_step": 57101, "epoch": 1359} {"train_loss": -5.894259452819824, "global_step": 57102, "epoch": 1359} {"train_loss": -5.955801963806152, "global_step": 57103, "epoch": 1359} {"train_loss": -5.786297798156738, "global_step": 57104, "epoch": 1359} {"train_loss": -5.821723937988281, "global_step": 57105, "epoch": 1359} {"train_loss": -5.920157432556152, "global_step": 57106, "epoch": 1359} {"train_loss": -5.928273677825928, "global_step": 57107, "epoch": 1359} {"train_loss": -5.873014450073242, "global_step": 57108, "epoch": 1359} {"train_loss": -5.8815155029296875, "global_step": 57109, "epoch": 1359} {"train_loss": -5.885246753692627, "global_step": 57110, "epoch": 1359} {"train_loss": -5.892583847045898, "global_step": 57111, "epoch": 1359} {"train_loss": -5.725715637207031, "global_step": 57112, "epoch": 1359} {"train_loss": -5.830609321594238, "global_step": 57113, "epoch": 1359} {"train_loss": -5.859086990356445, "global_step": 57114, "epoch": 1359} {"train_loss": -5.969486236572266, "global_step": 57115, "epoch": 1359} {"train_loss": -5.916223049163818, "global_step": 57116, "epoch": 1359} {"train_loss": -5.908894062042236, "global_step": 57117, "epoch": 1359} {"train_loss": -5.88853645324707, "global_step": 57118, "epoch": 1359} {"train_loss": -5.893964506330944, "global_step": 57119, "epoch": 1359, "val_loss": 61200.10546875} {"train_loss": -5.952849388122559, "global_step": 57120, "epoch": 1360} {"train_loss": -5.794050216674805, "global_step": 57121, "epoch": 1360} {"train_loss": -5.879649639129639, "global_step": 57122, "epoch": 1360} {"train_loss": -5.831901550292969, "global_step": 57123, "epoch": 1360} {"train_loss": -5.912708282470703, "global_step": 57124, "epoch": 1360} {"train_loss": -5.8051605224609375, "global_step": 57125, "epoch": 1360} {"train_loss": -5.853634834289551, "global_step": 57126, "epoch": 1360} {"train_loss": -5.9081573486328125, "global_step": 57127, "epoch": 1360} {"train_loss": -5.821770668029785, "global_step": 57128, "epoch": 1360} {"train_loss": -5.777196884155273, "global_step": 57129, "epoch": 1360} {"train_loss": -5.804069995880127, "global_step": 57130, "epoch": 1360} {"train_loss": -5.894511699676514, "global_step": 57131, "epoch": 1360} {"train_loss": -5.796063423156738, "global_step": 57132, "epoch": 1360} {"train_loss": -5.791969299316406, "global_step": 57133, "epoch": 1360} {"train_loss": -5.816714286804199, "global_step": 57134, "epoch": 1360} {"train_loss": -5.891928195953369, "global_step": 57135, "epoch": 1360} {"train_loss": -5.88718843460083, "global_step": 57136, "epoch": 1360} {"train_loss": -5.883481979370117, "global_step": 57137, "epoch": 1360} {"train_loss": -5.819921016693115, "global_step": 57138, "epoch": 1360} {"train_loss": -5.854519844055176, "global_step": 57139, "epoch": 1360} {"train_loss": -5.899423122406006, "global_step": 57140, "epoch": 1360} {"train_loss": -5.878868103027344, "global_step": 57141, "epoch": 1360} {"train_loss": -5.967304706573486, "global_step": 57142, "epoch": 1360} {"train_loss": -5.8165483474731445, "global_step": 57143, "epoch": 1360} {"train_loss": -5.891744613647461, "global_step": 57144, "epoch": 1360} {"train_loss": -5.869257926940918, "global_step": 57145, "epoch": 1360} {"train_loss": -5.834685802459717, "global_step": 57146, "epoch": 1360} {"train_loss": -5.819762229919434, "global_step": 57147, "epoch": 1360} {"train_loss": -5.783128261566162, "global_step": 57148, "epoch": 1360} {"train_loss": -5.864554405212402, "global_step": 57149, "epoch": 1360} {"train_loss": -5.955845832824707, "global_step": 57150, "epoch": 1360} {"train_loss": -5.876758575439453, "global_step": 57151, "epoch": 1360} {"train_loss": -5.937694072723389, "global_step": 57152, "epoch": 1360} {"train_loss": -5.825458526611328, "global_step": 57153, "epoch": 1360} {"train_loss": -5.9708757400512695, "global_step": 57154, "epoch": 1360} {"train_loss": -5.929378986358643, "global_step": 57155, "epoch": 1360} {"train_loss": -5.917710304260254, "global_step": 57156, "epoch": 1360} {"train_loss": -5.874438285827637, "global_step": 57157, "epoch": 1360} {"train_loss": -5.912744045257568, "global_step": 57158, "epoch": 1360} {"train_loss": -5.888039588928223, "global_step": 57159, "epoch": 1360} {"train_loss": -5.819271087646484, "global_step": 57160, "epoch": 1360} {"train_loss": -5.8671775091262095, "global_step": 57161, "epoch": 1360, "val_loss": 61606.57421875} {"train_loss": -5.7463154792785645, "global_step": 57162, "epoch": 1361} {"train_loss": -5.970609664916992, "global_step": 57163, "epoch": 1361} {"train_loss": -5.943717956542969, "global_step": 57164, "epoch": 1361} {"train_loss": -5.8342437744140625, "global_step": 57165, "epoch": 1361} {"train_loss": -5.8899970054626465, "global_step": 57166, "epoch": 1361} {"train_loss": -5.796738147735596, "global_step": 57167, "epoch": 1361} {"train_loss": -5.863023281097412, "global_step": 57168, "epoch": 1361} {"train_loss": -5.7770891189575195, "global_step": 57169, "epoch": 1361} {"train_loss": -5.879782199859619, "global_step": 57170, "epoch": 1361} {"train_loss": -5.750860691070557, "global_step": 57171, "epoch": 1361} {"train_loss": -5.82459020614624, "global_step": 57172, "epoch": 1361} {"train_loss": -5.784635543823242, "global_step": 57173, "epoch": 1361} {"train_loss": -5.822908878326416, "global_step": 57174, "epoch": 1361} {"train_loss": -5.822776794433594, "global_step": 57175, "epoch": 1361} {"train_loss": -5.799623489379883, "global_step": 57176, "epoch": 1361} {"train_loss": -5.7873430252075195, "global_step": 57177, "epoch": 1361} {"train_loss": -5.812273025512695, "global_step": 57178, "epoch": 1361} {"train_loss": -5.8633809089660645, "global_step": 57179, "epoch": 1361} {"train_loss": -5.813134670257568, "global_step": 57180, "epoch": 1361} {"train_loss": -5.9042181968688965, "global_step": 57181, "epoch": 1361} {"train_loss": -5.987405300140381, "global_step": 57182, "epoch": 1361} {"train_loss": -5.726244926452637, "global_step": 57183, "epoch": 1361} {"train_loss": -5.856661796569824, "global_step": 57184, "epoch": 1361} {"train_loss": -6.010406494140625, "global_step": 57185, "epoch": 1361} {"train_loss": -5.834739685058594, "global_step": 57186, "epoch": 1361} {"train_loss": -5.840823173522949, "global_step": 57187, "epoch": 1361} {"train_loss": -5.82479190826416, "global_step": 57188, "epoch": 1361} {"train_loss": -5.794439792633057, "global_step": 57189, "epoch": 1361} {"train_loss": -5.877915859222412, "global_step": 57190, "epoch": 1361} {"train_loss": -5.962810039520264, "global_step": 57191, "epoch": 1361} {"train_loss": -6.0212602615356445, "global_step": 57192, "epoch": 1361} {"train_loss": -5.921079635620117, "global_step": 57193, "epoch": 1361} {"train_loss": -5.938685894012451, "global_step": 57194, "epoch": 1361} {"train_loss": -5.955788612365723, "global_step": 57195, "epoch": 1361} {"train_loss": -6.000840187072754, "global_step": 57196, "epoch": 1361} {"train_loss": -5.823500156402588, "global_step": 57197, "epoch": 1361} {"train_loss": -5.86239767074585, "global_step": 57198, "epoch": 1361} {"train_loss": -5.841737747192383, "global_step": 57199, "epoch": 1361} {"train_loss": -5.964921474456787, "global_step": 57200, "epoch": 1361} {"train_loss": -5.741186141967773, "global_step": 57201, "epoch": 1361} {"train_loss": -5.823963165283203, "global_step": 57202, "epoch": 1361} {"train_loss": -5.859358515058245, "global_step": 57203, "epoch": 1361, "val_loss": 61755.83203125} {"train_loss": -5.844862937927246, "global_step": 57204, "epoch": 1362} {"train_loss": -5.910688400268555, "global_step": 57205, "epoch": 1362} {"train_loss": -5.9648027420043945, "global_step": 57206, "epoch": 1362} {"train_loss": -5.851800918579102, "global_step": 57207, "epoch": 1362} {"train_loss": -5.803078651428223, "global_step": 57208, "epoch": 1362} {"train_loss": -5.844343185424805, "global_step": 57209, "epoch": 1362} {"train_loss": -5.862343788146973, "global_step": 57210, "epoch": 1362} {"train_loss": -5.755227088928223, "global_step": 57211, "epoch": 1362} {"train_loss": -5.812337875366211, "global_step": 57212, "epoch": 1362} {"train_loss": -5.879823684692383, "global_step": 57213, "epoch": 1362} {"train_loss": -5.758824825286865, "global_step": 57214, "epoch": 1362} {"train_loss": -5.750038146972656, "global_step": 57215, "epoch": 1362} {"train_loss": -5.957554817199707, "global_step": 57216, "epoch": 1362} {"train_loss": -5.6384687423706055, "global_step": 57217, "epoch": 1362} {"train_loss": -5.836453437805176, "global_step": 57218, "epoch": 1362} {"train_loss": -5.764915943145752, "global_step": 57219, "epoch": 1362} {"train_loss": -5.775958061218262, "global_step": 57220, "epoch": 1362} {"train_loss": -5.906567573547363, "global_step": 57221, "epoch": 1362} {"train_loss": -5.800009727478027, "global_step": 57222, "epoch": 1362} {"train_loss": -5.907686233520508, "global_step": 57223, "epoch": 1362} {"train_loss": -5.749560356140137, "global_step": 57224, "epoch": 1362} {"train_loss": -5.891600131988525, "global_step": 57225, "epoch": 1362} {"train_loss": -5.852088928222656, "global_step": 57226, "epoch": 1362} {"train_loss": -5.8355712890625, "global_step": 57227, "epoch": 1362} {"train_loss": -5.925481796264648, "global_step": 57228, "epoch": 1362} {"train_loss": -5.760584831237793, "global_step": 57229, "epoch": 1362} {"train_loss": -5.839212417602539, "global_step": 57230, "epoch": 1362} {"train_loss": -5.819074630737305, "global_step": 57231, "epoch": 1362} {"train_loss": -5.753560543060303, "global_step": 57232, "epoch": 1362} {"train_loss": -5.705502986907959, "global_step": 57233, "epoch": 1362} {"train_loss": -5.791888236999512, "global_step": 57234, "epoch": 1362} {"train_loss": -5.843949317932129, "global_step": 57235, "epoch": 1362} {"train_loss": -5.850434303283691, "global_step": 57236, "epoch": 1362} {"train_loss": -5.849137306213379, "global_step": 57237, "epoch": 1362} {"train_loss": -5.819520473480225, "global_step": 57238, "epoch": 1362} {"train_loss": -5.930685520172119, "global_step": 57239, "epoch": 1362} {"train_loss": -5.828423500061035, "global_step": 57240, "epoch": 1362} {"train_loss": -5.714855194091797, "global_step": 57241, "epoch": 1362} {"train_loss": -5.8618550300598145, "global_step": 57242, "epoch": 1362} {"train_loss": -5.945697784423828, "global_step": 57243, "epoch": 1362} {"train_loss": -5.788651466369629, "global_step": 57244, "epoch": 1362} {"train_loss": -5.829957065128145, "global_step": 57245, "epoch": 1362, "val_loss": 61817.46875} {"train_loss": -5.833691120147705, "global_step": 57246, "epoch": 1363} {"train_loss": -5.832583904266357, "global_step": 57247, "epoch": 1363} {"train_loss": -5.829440593719482, "global_step": 57248, "epoch": 1363} {"train_loss": -5.686698913574219, "global_step": 57249, "epoch": 1363} {"train_loss": -5.873701095581055, "global_step": 57250, "epoch": 1363} {"train_loss": -5.786745071411133, "global_step": 57251, "epoch": 1363} {"train_loss": -5.91892671585083, "global_step": 57252, "epoch": 1363} {"train_loss": -5.886438369750977, "global_step": 57253, "epoch": 1363} {"train_loss": -5.945181846618652, "global_step": 57254, "epoch": 1363} {"train_loss": -5.777011394500732, "global_step": 57255, "epoch": 1363} {"train_loss": -5.80919885635376, "global_step": 57256, "epoch": 1363} {"train_loss": -5.918059349060059, "global_step": 57257, "epoch": 1363} {"train_loss": -5.7345428466796875, "global_step": 57258, "epoch": 1363} {"train_loss": -5.720136642456055, "global_step": 57259, "epoch": 1363} {"train_loss": -5.881631851196289, "global_step": 57260, "epoch": 1363} {"train_loss": -5.847397804260254, "global_step": 57261, "epoch": 1363} {"train_loss": -5.87344217300415, "global_step": 57262, "epoch": 1363} {"train_loss": -5.7366766929626465, "global_step": 57263, "epoch": 1363} {"train_loss": -5.845597267150879, "global_step": 57264, "epoch": 1363} {"train_loss": -5.964528560638428, "global_step": 57265, "epoch": 1363} {"train_loss": -5.912500381469727, "global_step": 57266, "epoch": 1363} {"train_loss": -5.842123031616211, "global_step": 57267, "epoch": 1363} {"train_loss": -5.9162092208862305, "global_step": 57268, "epoch": 1363} {"train_loss": -5.875881671905518, "global_step": 57269, "epoch": 1363} {"train_loss": -5.925931930541992, "global_step": 57270, "epoch": 1363} {"train_loss": -5.729123115539551, "global_step": 57271, "epoch": 1363} {"train_loss": -5.779977321624756, "global_step": 57272, "epoch": 1363} {"train_loss": -5.8740057945251465, "global_step": 57273, "epoch": 1363} {"train_loss": -5.810343265533447, "global_step": 57274, "epoch": 1363} {"train_loss": -5.874438285827637, "global_step": 57275, "epoch": 1363} {"train_loss": -5.89288330078125, "global_step": 57276, "epoch": 1363} {"train_loss": -5.788452625274658, "global_step": 57277, "epoch": 1363} {"train_loss": -5.890656471252441, "global_step": 57278, "epoch": 1363} {"train_loss": -5.880780220031738, "global_step": 57279, "epoch": 1363} {"train_loss": -5.782679080963135, "global_step": 57280, "epoch": 1363} {"train_loss": -5.851234436035156, "global_step": 57281, "epoch": 1363} {"train_loss": -5.957691192626953, "global_step": 57282, "epoch": 1363} {"train_loss": -5.766724586486816, "global_step": 57283, "epoch": 1363} {"train_loss": -5.951128959655762, "global_step": 57284, "epoch": 1363} {"train_loss": -5.942302703857422, "global_step": 57285, "epoch": 1363} {"train_loss": -5.851891040802002, "global_step": 57286, "epoch": 1363} {"train_loss": -5.849405674707322, "global_step": 57287, "epoch": 1363, "val_loss": 61703.83984375} {"train_loss": -5.889894962310791, "global_step": 57288, "epoch": 1364} {"train_loss": -5.824441909790039, "global_step": 57289, "epoch": 1364} {"train_loss": -5.95216703414917, "global_step": 57290, "epoch": 1364} {"train_loss": -5.879469394683838, "global_step": 57291, "epoch": 1364} {"train_loss": -5.785894393920898, "global_step": 57292, "epoch": 1364} {"train_loss": -5.888293743133545, "global_step": 57293, "epoch": 1364} {"train_loss": -5.870430946350098, "global_step": 57294, "epoch": 1364} {"train_loss": -5.741912841796875, "global_step": 57295, "epoch": 1364} {"train_loss": -5.829501152038574, "global_step": 57296, "epoch": 1364} {"train_loss": -5.87591552734375, "global_step": 57297, "epoch": 1364} {"train_loss": -5.8983917236328125, "global_step": 57298, "epoch": 1364} {"train_loss": -5.966259002685547, "global_step": 57299, "epoch": 1364} {"train_loss": -5.762628078460693, "global_step": 57300, "epoch": 1364} {"train_loss": -5.9026384353637695, "global_step": 57301, "epoch": 1364} {"train_loss": -5.857618808746338, "global_step": 57302, "epoch": 1364} {"train_loss": -5.741721153259277, "global_step": 57303, "epoch": 1364} {"train_loss": -5.919460296630859, "global_step": 57304, "epoch": 1364} {"train_loss": -5.8838701248168945, "global_step": 57305, "epoch": 1364} {"train_loss": -5.790658950805664, "global_step": 57306, "epoch": 1364} {"train_loss": -5.832084655761719, "global_step": 57307, "epoch": 1364} {"train_loss": -5.8227081298828125, "global_step": 57308, "epoch": 1364} {"train_loss": -5.924749374389648, "global_step": 57309, "epoch": 1364} {"train_loss": -5.773534297943115, "global_step": 57310, "epoch": 1364} {"train_loss": -5.825740814208984, "global_step": 57311, "epoch": 1364} {"train_loss": -5.9219818115234375, "global_step": 57312, "epoch": 1364} {"train_loss": -5.831510066986084, "global_step": 57313, "epoch": 1364} {"train_loss": -5.870735168457031, "global_step": 57314, "epoch": 1364} {"train_loss": -5.934223175048828, "global_step": 57315, "epoch": 1364} {"train_loss": -5.884829521179199, "global_step": 57316, "epoch": 1364} {"train_loss": -5.805319786071777, "global_step": 57317, "epoch": 1364} {"train_loss": -5.8242082595825195, "global_step": 57318, "epoch": 1364} {"train_loss": -5.922454833984375, "global_step": 57319, "epoch": 1364} {"train_loss": -5.823189735412598, "global_step": 57320, "epoch": 1364} {"train_loss": -5.933094024658203, "global_step": 57321, "epoch": 1364} {"train_loss": -5.860793113708496, "global_step": 57322, "epoch": 1364} {"train_loss": -5.95993185043335, "global_step": 57323, "epoch": 1364} {"train_loss": -5.804074287414551, "global_step": 57324, "epoch": 1364} {"train_loss": -5.914292335510254, "global_step": 57325, "epoch": 1364} {"train_loss": -5.8709611892700195, "global_step": 57326, "epoch": 1364} {"train_loss": -5.830195426940918, "global_step": 57327, "epoch": 1364} {"train_loss": -5.955379486083984, "global_step": 57328, "epoch": 1364} {"train_loss": -5.860601232165382, "global_step": 57329, "epoch": 1364, "val_loss": 61308.57421875} {"train_loss": -5.830303192138672, "global_step": 57330, "epoch": 1365} {"train_loss": -5.953513145446777, "global_step": 57331, "epoch": 1365} {"train_loss": -5.871180057525635, "global_step": 57332, "epoch": 1365} {"train_loss": -5.792680263519287, "global_step": 57333, "epoch": 1365} {"train_loss": -5.891474723815918, "global_step": 57334, "epoch": 1365} {"train_loss": -5.830289363861084, "global_step": 57335, "epoch": 1365} {"train_loss": -5.897097110748291, "global_step": 57336, "epoch": 1365} {"train_loss": -5.899331569671631, "global_step": 57337, "epoch": 1365} {"train_loss": -5.834238529205322, "global_step": 57338, "epoch": 1365} {"train_loss": -5.947871208190918, "global_step": 57339, "epoch": 1365} {"train_loss": -5.86155891418457, "global_step": 57340, "epoch": 1365} {"train_loss": -5.936490535736084, "global_step": 57341, "epoch": 1365} {"train_loss": -5.938218116760254, "global_step": 57342, "epoch": 1365} {"train_loss": -6.009961128234863, "global_step": 57343, "epoch": 1365} {"train_loss": -5.8031392097473145, "global_step": 57344, "epoch": 1365} {"train_loss": -5.977656841278076, "global_step": 57345, "epoch": 1365} {"train_loss": -5.830887794494629, "global_step": 57346, "epoch": 1365} {"train_loss": -5.861950874328613, "global_step": 57347, "epoch": 1365} {"train_loss": -5.911462783813477, "global_step": 57348, "epoch": 1365} {"train_loss": -5.938419818878174, "global_step": 57349, "epoch": 1365} {"train_loss": -5.854889392852783, "global_step": 57350, "epoch": 1365} {"train_loss": -5.91388463973999, "global_step": 57351, "epoch": 1365} {"train_loss": -5.83286190032959, "global_step": 57352, "epoch": 1365} {"train_loss": -5.962275981903076, "global_step": 57353, "epoch": 1365} {"train_loss": -5.879947662353516, "global_step": 57354, "epoch": 1365} {"train_loss": -5.900794982910156, "global_step": 57355, "epoch": 1365} {"train_loss": -5.9391188621521, "global_step": 57356, "epoch": 1365} {"train_loss": -5.877310752868652, "global_step": 57357, "epoch": 1365} {"train_loss": -5.9103922843933105, "global_step": 57358, "epoch": 1365} {"train_loss": -5.774648189544678, "global_step": 57359, "epoch": 1365} {"train_loss": -5.880980014801025, "global_step": 57360, "epoch": 1365} {"train_loss": -5.8538031578063965, "global_step": 57361, "epoch": 1365} {"train_loss": -5.862253189086914, "global_step": 57362, "epoch": 1365} {"train_loss": -5.797462463378906, "global_step": 57363, "epoch": 1365} {"train_loss": -5.899085998535156, "global_step": 57364, "epoch": 1365} {"train_loss": -5.798171043395996, "global_step": 57365, "epoch": 1365} {"train_loss": -5.885563850402832, "global_step": 57366, "epoch": 1365} {"train_loss": -5.757798671722412, "global_step": 57367, "epoch": 1365} {"train_loss": -5.868077278137207, "global_step": 57368, "epoch": 1365} {"train_loss": -5.803084850311279, "global_step": 57369, "epoch": 1365} {"train_loss": -5.8126678466796875, "global_step": 57370, "epoch": 1365} {"train_loss": -5.87097920690264, "global_step": 57371, "epoch": 1365, "val_loss": 61710.82421875} {"train_loss": -5.891556739807129, "global_step": 57372, "epoch": 1366} {"train_loss": -5.796313285827637, "global_step": 57373, "epoch": 1366} {"train_loss": -5.79585075378418, "global_step": 57374, "epoch": 1366} {"train_loss": -5.761959075927734, "global_step": 57375, "epoch": 1366} {"train_loss": -5.709956169128418, "global_step": 57376, "epoch": 1366} {"train_loss": -5.862634181976318, "global_step": 57377, "epoch": 1366} {"train_loss": -5.859532356262207, "global_step": 57378, "epoch": 1366} {"train_loss": -5.910290718078613, "global_step": 57379, "epoch": 1366} {"train_loss": -5.830352306365967, "global_step": 57380, "epoch": 1366} {"train_loss": -5.856734275817871, "global_step": 57381, "epoch": 1366} {"train_loss": -5.9398345947265625, "global_step": 57382, "epoch": 1366} {"train_loss": -5.805273056030273, "global_step": 57383, "epoch": 1366} {"train_loss": -5.947606086730957, "global_step": 57384, "epoch": 1366} {"train_loss": -5.740389823913574, "global_step": 57385, "epoch": 1366} {"train_loss": -5.990645408630371, "global_step": 57386, "epoch": 1366} {"train_loss": -5.852409362792969, "global_step": 57387, "epoch": 1366} {"train_loss": -5.866978645324707, "global_step": 57388, "epoch": 1366} {"train_loss": -5.8075432777404785, "global_step": 57389, "epoch": 1366} {"train_loss": -5.884832382202148, "global_step": 57390, "epoch": 1366} {"train_loss": -5.777317523956299, "global_step": 57391, "epoch": 1366} {"train_loss": -5.924629211425781, "global_step": 57392, "epoch": 1366} {"train_loss": -5.83733606338501, "global_step": 57393, "epoch": 1366} {"train_loss": -5.8025970458984375, "global_step": 57394, "epoch": 1366} {"train_loss": -5.981232643127441, "global_step": 57395, "epoch": 1366} {"train_loss": -5.852180004119873, "global_step": 57396, "epoch": 1366} {"train_loss": -5.888077259063721, "global_step": 57397, "epoch": 1366} {"train_loss": -5.940807342529297, "global_step": 57398, "epoch": 1366} {"train_loss": -5.832913398742676, "global_step": 57399, "epoch": 1366} {"train_loss": -5.832364082336426, "global_step": 57400, "epoch": 1366} {"train_loss": -5.927083969116211, "global_step": 57401, "epoch": 1366} {"train_loss": -6.053387641906738, "global_step": 57402, "epoch": 1366} {"train_loss": -5.824448585510254, "global_step": 57403, "epoch": 1366} {"train_loss": -5.883664131164551, "global_step": 57404, "epoch": 1366} {"train_loss": -5.863535404205322, "global_step": 57405, "epoch": 1366} {"train_loss": -5.861649513244629, "global_step": 57406, "epoch": 1366} {"train_loss": -5.834667205810547, "global_step": 57407, "epoch": 1366} {"train_loss": -5.850543975830078, "global_step": 57408, "epoch": 1366} {"train_loss": -5.921049118041992, "global_step": 57409, "epoch": 1366} {"train_loss": -5.99025821685791, "global_step": 57410, "epoch": 1366} {"train_loss": -5.926034450531006, "global_step": 57411, "epoch": 1366} {"train_loss": -5.662037372589111, "global_step": 57412, "epoch": 1366} {"train_loss": -5.860176733561924, "global_step": 57413, "epoch": 1366, "val_loss": 61406.5703125} {"train_loss": -5.942999839782715, "global_step": 57414, "epoch": 1367} {"train_loss": -5.814775466918945, "global_step": 57415, "epoch": 1367} {"train_loss": -5.830337047576904, "global_step": 57416, "epoch": 1367} {"train_loss": -5.934920310974121, "global_step": 57417, "epoch": 1367} {"train_loss": -5.807223796844482, "global_step": 57418, "epoch": 1367} {"train_loss": -5.777237892150879, "global_step": 57419, "epoch": 1367} {"train_loss": -5.8332037925720215, "global_step": 57420, "epoch": 1367} {"train_loss": -5.862288475036621, "global_step": 57421, "epoch": 1367} {"train_loss": -5.968973159790039, "global_step": 57422, "epoch": 1367} {"train_loss": -5.82523250579834, "global_step": 57423, "epoch": 1367} {"train_loss": -5.803789138793945, "global_step": 57424, "epoch": 1367} {"train_loss": -5.84425687789917, "global_step": 57425, "epoch": 1367} {"train_loss": -5.780438423156738, "global_step": 57426, "epoch": 1367} {"train_loss": -5.829422950744629, "global_step": 57427, "epoch": 1367} {"train_loss": -5.901480674743652, "global_step": 57428, "epoch": 1367} {"train_loss": -5.8107805252075195, "global_step": 57429, "epoch": 1367} {"train_loss": -5.819198131561279, "global_step": 57430, "epoch": 1367} {"train_loss": -5.905961990356445, "global_step": 57431, "epoch": 1367} {"train_loss": -5.809169769287109, "global_step": 57432, "epoch": 1367} {"train_loss": -5.79931116104126, "global_step": 57433, "epoch": 1367} {"train_loss": -5.966765880584717, "global_step": 57434, "epoch": 1367} {"train_loss": -5.980628967285156, "global_step": 57435, "epoch": 1367} {"train_loss": -5.913895130157471, "global_step": 57436, "epoch": 1367} {"train_loss": -5.7930707931518555, "global_step": 57437, "epoch": 1367} {"train_loss": -5.833021640777588, "global_step": 57438, "epoch": 1367} {"train_loss": -5.821407318115234, "global_step": 57439, "epoch": 1367} {"train_loss": -5.846959590911865, "global_step": 57440, "epoch": 1367} {"train_loss": -5.867588043212891, "global_step": 57441, "epoch": 1367} {"train_loss": -5.978786945343018, "global_step": 57442, "epoch": 1367} {"train_loss": -5.799970626831055, "global_step": 57443, "epoch": 1367} {"train_loss": -6.029480934143066, "global_step": 57444, "epoch": 1367} {"train_loss": -5.836460113525391, "global_step": 57445, "epoch": 1367} {"train_loss": -5.988289833068848, "global_step": 57446, "epoch": 1367} {"train_loss": -5.833776473999023, "global_step": 57447, "epoch": 1367} {"train_loss": -5.933772087097168, "global_step": 57448, "epoch": 1367} {"train_loss": -5.8148932456970215, "global_step": 57449, "epoch": 1367} {"train_loss": -5.875245094299316, "global_step": 57450, "epoch": 1367} {"train_loss": -5.900236129760742, "global_step": 57451, "epoch": 1367} {"train_loss": -5.831450462341309, "global_step": 57452, "epoch": 1367} {"train_loss": -5.987244129180908, "global_step": 57453, "epoch": 1367} {"train_loss": -5.780152797698975, "global_step": 57454, "epoch": 1367} {"train_loss": -5.865738198870704, "global_step": 57455, "epoch": 1367, "val_loss": 61405.5546875} {"train_loss": -5.974599838256836, "global_step": 57456, "epoch": 1368} {"train_loss": -5.916195392608643, "global_step": 57457, "epoch": 1368} {"train_loss": -5.729260444641113, "global_step": 57458, "epoch": 1368} {"train_loss": -5.783857345581055, "global_step": 57459, "epoch": 1368} {"train_loss": -5.81074857711792, "global_step": 57460, "epoch": 1368} {"train_loss": -5.761427402496338, "global_step": 57461, "epoch": 1368} {"train_loss": -5.971325874328613, "global_step": 57462, "epoch": 1368} {"train_loss": -5.927606582641602, "global_step": 57463, "epoch": 1368} {"train_loss": -5.802562713623047, "global_step": 57464, "epoch": 1368} {"train_loss": -5.900518894195557, "global_step": 57465, "epoch": 1368} {"train_loss": -5.924958229064941, "global_step": 57466, "epoch": 1368} {"train_loss": -5.94341516494751, "global_step": 57467, "epoch": 1368} {"train_loss": -5.828215599060059, "global_step": 57468, "epoch": 1368} {"train_loss": -5.865994453430176, "global_step": 57469, "epoch": 1368} {"train_loss": -5.87374210357666, "global_step": 57470, "epoch": 1368} {"train_loss": -5.784568786621094, "global_step": 57471, "epoch": 1368} {"train_loss": -5.8494439125061035, "global_step": 57472, "epoch": 1368} {"train_loss": -5.8281731605529785, "global_step": 57473, "epoch": 1368} {"train_loss": -5.848634719848633, "global_step": 57474, "epoch": 1368} {"train_loss": -5.727323532104492, "global_step": 57475, "epoch": 1368} {"train_loss": -5.940020561218262, "global_step": 57476, "epoch": 1368} {"train_loss": -5.8547821044921875, "global_step": 57477, "epoch": 1368} {"train_loss": -5.673797607421875, "global_step": 57478, "epoch": 1368} {"train_loss": -5.875299453735352, "global_step": 57479, "epoch": 1368} {"train_loss": -5.9502763748168945, "global_step": 57480, "epoch": 1368} {"train_loss": -5.869166374206543, "global_step": 57481, "epoch": 1368} {"train_loss": -5.89188289642334, "global_step": 57482, "epoch": 1368} {"train_loss": -5.883376121520996, "global_step": 57483, "epoch": 1368} {"train_loss": -5.857043266296387, "global_step": 57484, "epoch": 1368} {"train_loss": -5.900954246520996, "global_step": 57485, "epoch": 1368} {"train_loss": -5.994869709014893, "global_step": 57486, "epoch": 1368} {"train_loss": -5.914941787719727, "global_step": 57487, "epoch": 1368} {"train_loss": -5.839451789855957, "global_step": 57488, "epoch": 1368} {"train_loss": -6.04347562789917, "global_step": 57489, "epoch": 1368} {"train_loss": -5.824130058288574, "global_step": 57490, "epoch": 1368} {"train_loss": -5.910838603973389, "global_step": 57491, "epoch": 1368} {"train_loss": -5.966497898101807, "global_step": 57492, "epoch": 1368} {"train_loss": -5.876941204071045, "global_step": 57493, "epoch": 1368} {"train_loss": -5.979432582855225, "global_step": 57494, "epoch": 1368} {"train_loss": -6.009739875793457, "global_step": 57495, "epoch": 1368} {"train_loss": -5.874340057373047, "global_step": 57496, "epoch": 1368} {"train_loss": -5.880211886905489, "global_step": 57497, "epoch": 1368, "val_loss": 61349.9453125} {"train_loss": -5.994596481323242, "global_step": 57498, "epoch": 1369} {"train_loss": -5.844233989715576, "global_step": 57499, "epoch": 1369} {"train_loss": -5.96977424621582, "global_step": 57500, "epoch": 1369} {"train_loss": -5.867330074310303, "global_step": 57501, "epoch": 1369} {"train_loss": -5.827709674835205, "global_step": 57502, "epoch": 1369} {"train_loss": -5.935165882110596, "global_step": 57503, "epoch": 1369} {"train_loss": -5.877028465270996, "global_step": 57504, "epoch": 1369} {"train_loss": -5.7684478759765625, "global_step": 57505, "epoch": 1369} {"train_loss": -5.968635559082031, "global_step": 57506, "epoch": 1369} {"train_loss": -5.93067741394043, "global_step": 57507, "epoch": 1369} {"train_loss": -5.738039970397949, "global_step": 57508, "epoch": 1369} {"train_loss": -5.854623794555664, "global_step": 57509, "epoch": 1369} {"train_loss": -5.800302028656006, "global_step": 57510, "epoch": 1369} {"train_loss": -5.967896461486816, "global_step": 57511, "epoch": 1369} {"train_loss": -5.901412010192871, "global_step": 57512, "epoch": 1369} {"train_loss": -5.885846138000488, "global_step": 57513, "epoch": 1369} {"train_loss": -6.0055832862854, "global_step": 57514, "epoch": 1369} {"train_loss": -5.991868495941162, "global_step": 57515, "epoch": 1369} {"train_loss": -5.909762382507324, "global_step": 57516, "epoch": 1369} {"train_loss": -5.992624282836914, "global_step": 57517, "epoch": 1369} {"train_loss": -5.850613594055176, "global_step": 57518, "epoch": 1369} {"train_loss": -5.9201860427856445, "global_step": 57519, "epoch": 1369} {"train_loss": -5.89500617980957, "global_step": 57520, "epoch": 1369} {"train_loss": -5.895565032958984, "global_step": 57521, "epoch": 1369} {"train_loss": -5.908791542053223, "global_step": 57522, "epoch": 1369} {"train_loss": -5.833385467529297, "global_step": 57523, "epoch": 1369} {"train_loss": -5.79080057144165, "global_step": 57524, "epoch": 1369} {"train_loss": -5.975399971008301, "global_step": 57525, "epoch": 1369} {"train_loss": -5.870203971862793, "global_step": 57526, "epoch": 1369} {"train_loss": -5.951497554779053, "global_step": 57527, "epoch": 1369} {"train_loss": -5.8500471115112305, "global_step": 57528, "epoch": 1369} {"train_loss": -5.833798408508301, "global_step": 57529, "epoch": 1369} {"train_loss": -5.95328426361084, "global_step": 57530, "epoch": 1369} {"train_loss": -5.907322406768799, "global_step": 57531, "epoch": 1369} {"train_loss": -5.855266094207764, "global_step": 57532, "epoch": 1369} {"train_loss": -5.785869598388672, "global_step": 57533, "epoch": 1369} {"train_loss": -5.865054130554199, "global_step": 57534, "epoch": 1369} {"train_loss": -5.8383026123046875, "global_step": 57535, "epoch": 1369} {"train_loss": -5.6789398193359375, "global_step": 57536, "epoch": 1369} {"train_loss": -5.822587966918945, "global_step": 57537, "epoch": 1369} {"train_loss": -5.719698905944824, "global_step": 57538, "epoch": 1369} {"train_loss": -5.874998172124227, "global_step": 57539, "epoch": 1369, "val_loss": 61338.65234375} {"train_loss": -5.86152458190918, "global_step": 57540, "epoch": 1370} {"train_loss": -5.842294692993164, "global_step": 57541, "epoch": 1370} {"train_loss": -5.882752418518066, "global_step": 57542, "epoch": 1370} {"train_loss": -5.71711540222168, "global_step": 57543, "epoch": 1370} {"train_loss": -5.8093671798706055, "global_step": 57544, "epoch": 1370} {"train_loss": -5.893202781677246, "global_step": 57545, "epoch": 1370} {"train_loss": -5.835672855377197, "global_step": 57546, "epoch": 1370} {"train_loss": -5.903053283691406, "global_step": 57547, "epoch": 1370} {"train_loss": -5.883100509643555, "global_step": 57548, "epoch": 1370} {"train_loss": -5.853520393371582, "global_step": 57549, "epoch": 1370} {"train_loss": -5.916049957275391, "global_step": 57550, "epoch": 1370} {"train_loss": -5.838020324707031, "global_step": 57551, "epoch": 1370} {"train_loss": -5.860276222229004, "global_step": 57552, "epoch": 1370} {"train_loss": -5.8196868896484375, "global_step": 57553, "epoch": 1370} {"train_loss": -5.890668869018555, "global_step": 57554, "epoch": 1370} {"train_loss": -5.8434600830078125, "global_step": 57555, "epoch": 1370} {"train_loss": -5.988818168640137, "global_step": 57556, "epoch": 1370} {"train_loss": -5.9806742668151855, "global_step": 57557, "epoch": 1370} {"train_loss": -5.919905185699463, "global_step": 57558, "epoch": 1370} {"train_loss": -5.934883117675781, "global_step": 57559, "epoch": 1370} {"train_loss": -5.799981594085693, "global_step": 57560, "epoch": 1370} {"train_loss": -5.81451416015625, "global_step": 57561, "epoch": 1370} {"train_loss": -5.873689651489258, "global_step": 57562, "epoch": 1370} {"train_loss": -5.8230743408203125, "global_step": 57563, "epoch": 1370} {"train_loss": -5.772473335266113, "global_step": 57564, "epoch": 1370} {"train_loss": -5.680396556854248, "global_step": 57565, "epoch": 1370} {"train_loss": -5.90253210067749, "global_step": 57566, "epoch": 1370} {"train_loss": -5.805538177490234, "global_step": 57567, "epoch": 1370} {"train_loss": -5.901710510253906, "global_step": 57568, "epoch": 1370} {"train_loss": -5.918900966644287, "global_step": 57569, "epoch": 1370} {"train_loss": -5.770103931427002, "global_step": 57570, "epoch": 1370} {"train_loss": -6.018950462341309, "global_step": 57571, "epoch": 1370} {"train_loss": -5.842817783355713, "global_step": 57572, "epoch": 1370} {"train_loss": -5.9447150230407715, "global_step": 57573, "epoch": 1370} {"train_loss": -5.7676615715026855, "global_step": 57574, "epoch": 1370} {"train_loss": -5.804652214050293, "global_step": 57575, "epoch": 1370} {"train_loss": -5.8643693923950195, "global_step": 57576, "epoch": 1370} {"train_loss": -5.983822822570801, "global_step": 57577, "epoch": 1370} {"train_loss": -6.016221046447754, "global_step": 57578, "epoch": 1370} {"train_loss": -5.966313362121582, "global_step": 57579, "epoch": 1370} {"train_loss": -5.953176021575928, "global_step": 57580, "epoch": 1370} {"train_loss": -5.868458918162754, "global_step": 57581, "epoch": 1370, "val_loss": 61471.62109375} {"train_loss": -5.7932024002075195, "global_step": 57582, "epoch": 1371} {"train_loss": -5.863304138183594, "global_step": 57583, "epoch": 1371} {"train_loss": -5.865060806274414, "global_step": 57584, "epoch": 1371} {"train_loss": -5.7296319007873535, "global_step": 57585, "epoch": 1371} {"train_loss": -5.799986362457275, "global_step": 57586, "epoch": 1371} {"train_loss": -5.925469398498535, "global_step": 57587, "epoch": 1371} {"train_loss": -5.896856784820557, "global_step": 57588, "epoch": 1371} {"train_loss": -5.880307674407959, "global_step": 57589, "epoch": 1371} {"train_loss": -5.770388126373291, "global_step": 57590, "epoch": 1371} {"train_loss": -5.777365207672119, "global_step": 57591, "epoch": 1371} {"train_loss": -5.813793182373047, "global_step": 57592, "epoch": 1371} {"train_loss": -5.860650062561035, "global_step": 57593, "epoch": 1371} {"train_loss": -5.773061752319336, "global_step": 57594, "epoch": 1371} {"train_loss": -5.89901876449585, "global_step": 57595, "epoch": 1371} {"train_loss": -5.929424285888672, "global_step": 57596, "epoch": 1371} {"train_loss": -5.813228607177734, "global_step": 57597, "epoch": 1371} {"train_loss": -5.922715187072754, "global_step": 57598, "epoch": 1371} {"train_loss": -5.887808799743652, "global_step": 57599, "epoch": 1371} {"train_loss": -5.84071159362793, "global_step": 57600, "epoch": 1371} {"train_loss": -5.9147725105285645, "global_step": 57601, "epoch": 1371} {"train_loss": -5.881138324737549, "global_step": 57602, "epoch": 1371} {"train_loss": -5.862758159637451, "global_step": 57603, "epoch": 1371} {"train_loss": -5.800063610076904, "global_step": 57604, "epoch": 1371} {"train_loss": -5.897893905639648, "global_step": 57605, "epoch": 1371} {"train_loss": -5.926205635070801, "global_step": 57606, "epoch": 1371} {"train_loss": -5.839190483093262, "global_step": 57607, "epoch": 1371} {"train_loss": -5.983728408813477, "global_step": 57608, "epoch": 1371} {"train_loss": -5.910634994506836, "global_step": 57609, "epoch": 1371} {"train_loss": -5.849148273468018, "global_step": 57610, "epoch": 1371} {"train_loss": -5.827981948852539, "global_step": 57611, "epoch": 1371} {"train_loss": -5.910645008087158, "global_step": 57612, "epoch": 1371} {"train_loss": -5.818795204162598, "global_step": 57613, "epoch": 1371} {"train_loss": -5.870466709136963, "global_step": 57614, "epoch": 1371} {"train_loss": -5.960536003112793, "global_step": 57615, "epoch": 1371} {"train_loss": -6.0030975341796875, "global_step": 57616, "epoch": 1371} {"train_loss": -5.869803428649902, "global_step": 57617, "epoch": 1371} {"train_loss": -5.862664699554443, "global_step": 57618, "epoch": 1371} {"train_loss": -5.867790222167969, "global_step": 57619, "epoch": 1371} {"train_loss": -5.804108142852783, "global_step": 57620, "epoch": 1371} {"train_loss": -5.987855911254883, "global_step": 57621, "epoch": 1371} {"train_loss": -5.887998580932617, "global_step": 57622, "epoch": 1371} {"train_loss": -5.866935298556373, "global_step": 57623, "epoch": 1371, "val_loss": 61493.40234375} {"train_loss": -5.853496074676514, "global_step": 57624, "epoch": 1372} {"train_loss": -5.87661075592041, "global_step": 57625, "epoch": 1372} {"train_loss": -5.916355133056641, "global_step": 57626, "epoch": 1372} {"train_loss": -5.82564115524292, "global_step": 57627, "epoch": 1372} {"train_loss": -5.774219989776611, "global_step": 57628, "epoch": 1372} {"train_loss": -5.7988762855529785, "global_step": 57629, "epoch": 1372} {"train_loss": -5.933836936950684, "global_step": 57630, "epoch": 1372} {"train_loss": -5.883534908294678, "global_step": 57631, "epoch": 1372} {"train_loss": -5.900106430053711, "global_step": 57632, "epoch": 1372} {"train_loss": -5.9393720626831055, "global_step": 57633, "epoch": 1372} {"train_loss": -5.789386749267578, "global_step": 57634, "epoch": 1372} {"train_loss": -5.90015983581543, "global_step": 57635, "epoch": 1372} {"train_loss": -5.859846591949463, "global_step": 57636, "epoch": 1372} {"train_loss": -5.940734386444092, "global_step": 57637, "epoch": 1372} {"train_loss": -5.842146873474121, "global_step": 57638, "epoch": 1372} {"train_loss": -5.775470733642578, "global_step": 57639, "epoch": 1372} {"train_loss": -5.793302059173584, "global_step": 57640, "epoch": 1372} {"train_loss": -5.718443393707275, "global_step": 57641, "epoch": 1372} {"train_loss": -5.931368827819824, "global_step": 57642, "epoch": 1372} {"train_loss": -5.734455108642578, "global_step": 57643, "epoch": 1372} {"train_loss": -5.8934326171875, "global_step": 57644, "epoch": 1372} {"train_loss": -5.951421737670898, "global_step": 57645, "epoch": 1372} {"train_loss": -5.9607391357421875, "global_step": 57646, "epoch": 1372} {"train_loss": -5.858114719390869, "global_step": 57647, "epoch": 1372} {"train_loss": -5.866753578186035, "global_step": 57648, "epoch": 1372} {"train_loss": -5.869866371154785, "global_step": 57649, "epoch": 1372} {"train_loss": -5.799002647399902, "global_step": 57650, "epoch": 1372} {"train_loss": -5.887948513031006, "global_step": 57651, "epoch": 1372} {"train_loss": -5.833563327789307, "global_step": 57652, "epoch": 1372} {"train_loss": -5.911305904388428, "global_step": 57653, "epoch": 1372} {"train_loss": -5.943665027618408, "global_step": 57654, "epoch": 1372} {"train_loss": -5.847513675689697, "global_step": 57655, "epoch": 1372} {"train_loss": -5.8175249099731445, "global_step": 57656, "epoch": 1372} {"train_loss": -5.852195739746094, "global_step": 57657, "epoch": 1372} {"train_loss": -5.878587245941162, "global_step": 57658, "epoch": 1372} {"train_loss": -5.769723892211914, "global_step": 57659, "epoch": 1372} {"train_loss": -5.977698802947998, "global_step": 57660, "epoch": 1372} {"train_loss": -5.8963165283203125, "global_step": 57661, "epoch": 1372} {"train_loss": -5.896677017211914, "global_step": 57662, "epoch": 1372} {"train_loss": -5.949667930603027, "global_step": 57663, "epoch": 1372} {"train_loss": -5.905411720275879, "global_step": 57664, "epoch": 1372} {"train_loss": -5.866616237731207, "global_step": 57665, "epoch": 1372, "val_loss": 61492.0859375} {"train_loss": -5.967546463012695, "global_step": 57666, "epoch": 1373} {"train_loss": -5.90186071395874, "global_step": 57667, "epoch": 1373} {"train_loss": -5.909951210021973, "global_step": 57668, "epoch": 1373} {"train_loss": -5.881108283996582, "global_step": 57669, "epoch": 1373} {"train_loss": -5.797248840332031, "global_step": 57670, "epoch": 1373} {"train_loss": -5.921991348266602, "global_step": 57671, "epoch": 1373} {"train_loss": -5.992110252380371, "global_step": 57672, "epoch": 1373} {"train_loss": -5.822458267211914, "global_step": 57673, "epoch": 1373} {"train_loss": -5.841120719909668, "global_step": 57674, "epoch": 1373} {"train_loss": -5.8026442527771, "global_step": 57675, "epoch": 1373} {"train_loss": -5.819129943847656, "global_step": 57676, "epoch": 1373} {"train_loss": -5.945244789123535, "global_step": 57677, "epoch": 1373} {"train_loss": -5.844768524169922, "global_step": 57678, "epoch": 1373} {"train_loss": -5.94581413269043, "global_step": 57679, "epoch": 1373} {"train_loss": -5.858192443847656, "global_step": 57680, "epoch": 1373} {"train_loss": -5.814633369445801, "global_step": 57681, "epoch": 1373} {"train_loss": -5.856457710266113, "global_step": 57682, "epoch": 1373} {"train_loss": -5.985179424285889, "global_step": 57683, "epoch": 1373} {"train_loss": -5.89725923538208, "global_step": 57684, "epoch": 1373} {"train_loss": -5.8801751136779785, "global_step": 57685, "epoch": 1373} {"train_loss": -5.894222259521484, "global_step": 57686, "epoch": 1373} {"train_loss": -5.803569793701172, "global_step": 57687, "epoch": 1373} {"train_loss": -5.861556529998779, "global_step": 57688, "epoch": 1373} {"train_loss": -5.740602493286133, "global_step": 57689, "epoch": 1373} {"train_loss": -5.817731857299805, "global_step": 57690, "epoch": 1373} {"train_loss": -5.868533134460449, "global_step": 57691, "epoch": 1373} {"train_loss": -6.001225471496582, "global_step": 57692, "epoch": 1373} {"train_loss": -6.019527435302734, "global_step": 57693, "epoch": 1373} {"train_loss": -5.823598861694336, "global_step": 57694, "epoch": 1373} {"train_loss": -5.970471382141113, "global_step": 57695, "epoch": 1373} {"train_loss": -5.839349746704102, "global_step": 57696, "epoch": 1373} {"train_loss": -5.961589813232422, "global_step": 57697, "epoch": 1373} {"train_loss": -5.923382759094238, "global_step": 57698, "epoch": 1373} {"train_loss": -5.842807769775391, "global_step": 57699, "epoch": 1373} {"train_loss": -5.84493350982666, "global_step": 57700, "epoch": 1373} {"train_loss": -5.8157057762146, "global_step": 57701, "epoch": 1373} {"train_loss": -5.893392562866211, "global_step": 57702, "epoch": 1373} {"train_loss": -5.972438812255859, "global_step": 57703, "epoch": 1373} {"train_loss": -5.917400360107422, "global_step": 57704, "epoch": 1373} {"train_loss": -5.863553047180176, "global_step": 57705, "epoch": 1373} {"train_loss": -6.010705471038818, "global_step": 57706, "epoch": 1373} {"train_loss": -5.886603480293637, "global_step": 57707, "epoch": 1373, "val_loss": 61432.4609375} {"train_loss": -5.902971267700195, "global_step": 57708, "epoch": 1374} {"train_loss": -5.922807693481445, "global_step": 57709, "epoch": 1374} {"train_loss": -6.007936954498291, "global_step": 57710, "epoch": 1374} {"train_loss": -5.915041446685791, "global_step": 57711, "epoch": 1374} {"train_loss": -5.902613162994385, "global_step": 57712, "epoch": 1374} {"train_loss": -5.875971794128418, "global_step": 57713, "epoch": 1374} {"train_loss": -5.987415313720703, "global_step": 57714, "epoch": 1374} {"train_loss": -5.85690450668335, "global_step": 57715, "epoch": 1374} {"train_loss": -5.842423439025879, "global_step": 57716, "epoch": 1374} {"train_loss": -5.763978958129883, "global_step": 57717, "epoch": 1374} {"train_loss": -5.863829612731934, "global_step": 57718, "epoch": 1374} {"train_loss": -5.909431457519531, "global_step": 57719, "epoch": 1374} {"train_loss": -5.858964920043945, "global_step": 57720, "epoch": 1374} {"train_loss": -5.945265769958496, "global_step": 57721, "epoch": 1374} {"train_loss": -5.737102508544922, "global_step": 57722, "epoch": 1374} {"train_loss": -5.840640068054199, "global_step": 57723, "epoch": 1374} {"train_loss": -5.794790267944336, "global_step": 57724, "epoch": 1374} {"train_loss": -5.868267059326172, "global_step": 57725, "epoch": 1374} {"train_loss": -5.7017364501953125, "global_step": 57726, "epoch": 1374} {"train_loss": -5.898687839508057, "global_step": 57727, "epoch": 1374} {"train_loss": -5.82341194152832, "global_step": 57728, "epoch": 1374} {"train_loss": -5.936253070831299, "global_step": 57729, "epoch": 1374} {"train_loss": -6.030172348022461, "global_step": 57730, "epoch": 1374} {"train_loss": -5.781083106994629, "global_step": 57731, "epoch": 1374} {"train_loss": -5.843442440032959, "global_step": 57732, "epoch": 1374} {"train_loss": -5.985654354095459, "global_step": 57733, "epoch": 1374} {"train_loss": -5.941875457763672, "global_step": 57734, "epoch": 1374} {"train_loss": -5.785966396331787, "global_step": 57735, "epoch": 1374} {"train_loss": -5.832989692687988, "global_step": 57736, "epoch": 1374} {"train_loss": -5.901224613189697, "global_step": 57737, "epoch": 1374} {"train_loss": -5.955944538116455, "global_step": 57738, "epoch": 1374} {"train_loss": -5.881189346313477, "global_step": 57739, "epoch": 1374} {"train_loss": -5.899007797241211, "global_step": 57740, "epoch": 1374} {"train_loss": -5.863640785217285, "global_step": 57741, "epoch": 1374} {"train_loss": -5.823041915893555, "global_step": 57742, "epoch": 1374} {"train_loss": -5.878000736236572, "global_step": 57743, "epoch": 1374} {"train_loss": -5.823659420013428, "global_step": 57744, "epoch": 1374} {"train_loss": -5.899829864501953, "global_step": 57745, "epoch": 1374} {"train_loss": -5.774062156677246, "global_step": 57746, "epoch": 1374} {"train_loss": -5.83181619644165, "global_step": 57747, "epoch": 1374} {"train_loss": -5.845335960388184, "global_step": 57748, "epoch": 1374} {"train_loss": -5.870552607945034, "global_step": 57749, "epoch": 1374, "val_loss": 61721.62109375} {"train_loss": -5.863501071929932, "global_step": 57750, "epoch": 1375} {"train_loss": -5.795804023742676, "global_step": 57751, "epoch": 1375} {"train_loss": -5.885082721710205, "global_step": 57752, "epoch": 1375} {"train_loss": -5.749785900115967, "global_step": 57753, "epoch": 1375} {"train_loss": -5.8848042488098145, "global_step": 57754, "epoch": 1375} {"train_loss": -5.784548282623291, "global_step": 57755, "epoch": 1375} {"train_loss": -5.953455448150635, "global_step": 57756, "epoch": 1375} {"train_loss": -5.9223432540893555, "global_step": 57757, "epoch": 1375} {"train_loss": -5.954505920410156, "global_step": 57758, "epoch": 1375} {"train_loss": -5.796972274780273, "global_step": 57759, "epoch": 1375} {"train_loss": -5.981914520263672, "global_step": 57760, "epoch": 1375} {"train_loss": -5.886080741882324, "global_step": 57761, "epoch": 1375} {"train_loss": -5.822105407714844, "global_step": 57762, "epoch": 1375} {"train_loss": -5.7387895584106445, "global_step": 57763, "epoch": 1375} {"train_loss": -5.783699989318848, "global_step": 57764, "epoch": 1375} {"train_loss": -5.909127235412598, "global_step": 57765, "epoch": 1375} {"train_loss": -5.855368614196777, "global_step": 57766, "epoch": 1375} {"train_loss": -5.879162311553955, "global_step": 57767, "epoch": 1375} {"train_loss": -5.845131874084473, "global_step": 57768, "epoch": 1375} {"train_loss": -5.795069694519043, "global_step": 57769, "epoch": 1375} {"train_loss": -5.966144561767578, "global_step": 57770, "epoch": 1375} {"train_loss": -5.826171398162842, "global_step": 57771, "epoch": 1375} {"train_loss": -5.725485324859619, "global_step": 57772, "epoch": 1375} {"train_loss": -5.806379795074463, "global_step": 57773, "epoch": 1375} {"train_loss": -5.745086669921875, "global_step": 57774, "epoch": 1375} {"train_loss": -5.866708755493164, "global_step": 57775, "epoch": 1375} {"train_loss": -5.875746726989746, "global_step": 57776, "epoch": 1375} {"train_loss": -5.71418571472168, "global_step": 57777, "epoch": 1375} {"train_loss": -5.767033100128174, "global_step": 57778, "epoch": 1375} {"train_loss": -5.840099334716797, "global_step": 57779, "epoch": 1375} {"train_loss": -5.833429336547852, "global_step": 57780, "epoch": 1375} {"train_loss": -5.8104472160339355, "global_step": 57781, "epoch": 1375} {"train_loss": -5.964011192321777, "global_step": 57782, "epoch": 1375} {"train_loss": -5.936407089233398, "global_step": 57783, "epoch": 1375} {"train_loss": -5.922196865081787, "global_step": 57784, "epoch": 1375} {"train_loss": -5.830116271972656, "global_step": 57785, "epoch": 1375} {"train_loss": -5.8818511962890625, "global_step": 57786, "epoch": 1375} {"train_loss": -5.921028137207031, "global_step": 57787, "epoch": 1375} {"train_loss": -6.01673698425293, "global_step": 57788, "epoch": 1375} {"train_loss": -5.772377967834473, "global_step": 57789, "epoch": 1375} {"train_loss": -5.939159393310547, "global_step": 57790, "epoch": 1375} {"train_loss": -5.855361484345936, "global_step": 57791, "epoch": 1375, "val_loss": 61301.22265625} {"train_loss": -5.94008207321167, "global_step": 57792, "epoch": 1376} {"train_loss": -6.065147876739502, "global_step": 57793, "epoch": 1376} {"train_loss": -5.8999128341674805, "global_step": 57794, "epoch": 1376} {"train_loss": -6.020835876464844, "global_step": 57795, "epoch": 1376} {"train_loss": -5.979801177978516, "global_step": 57796, "epoch": 1376} {"train_loss": -5.8288774490356445, "global_step": 57797, "epoch": 1376} {"train_loss": -5.889472484588623, "global_step": 57798, "epoch": 1376} {"train_loss": -5.78090763092041, "global_step": 57799, "epoch": 1376} {"train_loss": -5.89227294921875, "global_step": 57800, "epoch": 1376} {"train_loss": -6.000056266784668, "global_step": 57801, "epoch": 1376} {"train_loss": -5.825592994689941, "global_step": 57802, "epoch": 1376} {"train_loss": -5.854988098144531, "global_step": 57803, "epoch": 1376} {"train_loss": -5.7674560546875, "global_step": 57804, "epoch": 1376} {"train_loss": -5.824326515197754, "global_step": 57805, "epoch": 1376} {"train_loss": -5.882731914520264, "global_step": 57806, "epoch": 1376} {"train_loss": -5.86132287979126, "global_step": 57807, "epoch": 1376} {"train_loss": -5.881119728088379, "global_step": 57808, "epoch": 1376} {"train_loss": -5.916718482971191, "global_step": 57809, "epoch": 1376} {"train_loss": -5.923947334289551, "global_step": 57810, "epoch": 1376} {"train_loss": -5.888413429260254, "global_step": 57811, "epoch": 1376} {"train_loss": -5.88324499130249, "global_step": 57812, "epoch": 1376} {"train_loss": -5.844932556152344, "global_step": 57813, "epoch": 1376} {"train_loss": -5.856267929077148, "global_step": 57814, "epoch": 1376} {"train_loss": -5.797317028045654, "global_step": 57815, "epoch": 1376} {"train_loss": -5.885416030883789, "global_step": 57816, "epoch": 1376} {"train_loss": -6.08836555480957, "global_step": 57817, "epoch": 1376} {"train_loss": -5.8847455978393555, "global_step": 57818, "epoch": 1376} {"train_loss": -5.900318622589111, "global_step": 57819, "epoch": 1376} {"train_loss": -5.895989894866943, "global_step": 57820, "epoch": 1376} {"train_loss": -5.887925148010254, "global_step": 57821, "epoch": 1376} {"train_loss": -6.050127029418945, "global_step": 57822, "epoch": 1376} {"train_loss": -5.875133514404297, "global_step": 57823, "epoch": 1376} {"train_loss": -5.8014302253723145, "global_step": 57824, "epoch": 1376} {"train_loss": -5.935619354248047, "global_step": 57825, "epoch": 1376} {"train_loss": -5.883978843688965, "global_step": 57826, "epoch": 1376} {"train_loss": -5.824521064758301, "global_step": 57827, "epoch": 1376} {"train_loss": -5.905182361602783, "global_step": 57828, "epoch": 1376} {"train_loss": -5.67530632019043, "global_step": 57829, "epoch": 1376} {"train_loss": -5.761961936950684, "global_step": 57830, "epoch": 1376} {"train_loss": -5.956074237823486, "global_step": 57831, "epoch": 1376} {"train_loss": -5.852278709411621, "global_step": 57832, "epoch": 1376} {"train_loss": -5.881540275755382, "global_step": 57833, "epoch": 1376, "val_loss": 61493.51953125} {"train_loss": -5.958553314208984, "global_step": 57834, "epoch": 1377} {"train_loss": -5.902125358581543, "global_step": 57835, "epoch": 1377} {"train_loss": -5.9766130447387695, "global_step": 57836, "epoch": 1377} {"train_loss": -5.871122360229492, "global_step": 57837, "epoch": 1377} {"train_loss": -5.889751434326172, "global_step": 57838, "epoch": 1377} {"train_loss": -5.9265055656433105, "global_step": 57839, "epoch": 1377} {"train_loss": -5.849864482879639, "global_step": 57840, "epoch": 1377} {"train_loss": -5.894972801208496, "global_step": 57841, "epoch": 1377} {"train_loss": -5.8993024826049805, "global_step": 57842, "epoch": 1377} {"train_loss": -5.769509792327881, "global_step": 57843, "epoch": 1377} {"train_loss": -5.938767433166504, "global_step": 57844, "epoch": 1377} {"train_loss": -5.852677345275879, "global_step": 57845, "epoch": 1377} {"train_loss": -5.831728458404541, "global_step": 57846, "epoch": 1377} {"train_loss": -5.905765533447266, "global_step": 57847, "epoch": 1377} {"train_loss": -5.827238082885742, "global_step": 57848, "epoch": 1377} {"train_loss": -5.924004554748535, "global_step": 57849, "epoch": 1377} {"train_loss": -6.03383731842041, "global_step": 57850, "epoch": 1377} {"train_loss": -5.892484664916992, "global_step": 57851, "epoch": 1377} {"train_loss": -5.846187114715576, "global_step": 57852, "epoch": 1377} {"train_loss": -5.863157272338867, "global_step": 57853, "epoch": 1377} {"train_loss": -5.979764938354492, "global_step": 57854, "epoch": 1377} {"train_loss": -5.79316520690918, "global_step": 57855, "epoch": 1377} {"train_loss": -5.825101375579834, "global_step": 57856, "epoch": 1377} {"train_loss": -5.7990827560424805, "global_step": 57857, "epoch": 1377} {"train_loss": -5.857942581176758, "global_step": 57858, "epoch": 1377} {"train_loss": -5.874210834503174, "global_step": 57859, "epoch": 1377} {"train_loss": -5.835630416870117, "global_step": 57860, "epoch": 1377} {"train_loss": -5.8711347579956055, "global_step": 57861, "epoch": 1377} {"train_loss": -5.880467414855957, "global_step": 57862, "epoch": 1377} {"train_loss": -5.885429382324219, "global_step": 57863, "epoch": 1377} {"train_loss": -5.776914119720459, "global_step": 57864, "epoch": 1377} {"train_loss": -5.850441932678223, "global_step": 57865, "epoch": 1377} {"train_loss": -5.812419891357422, "global_step": 57866, "epoch": 1377} {"train_loss": -5.922177791595459, "global_step": 57867, "epoch": 1377} {"train_loss": -5.890712738037109, "global_step": 57868, "epoch": 1377} {"train_loss": -5.724462509155273, "global_step": 57869, "epoch": 1377} {"train_loss": -5.984391212463379, "global_step": 57870, "epoch": 1377} {"train_loss": -5.726337909698486, "global_step": 57871, "epoch": 1377} {"train_loss": -5.831897735595703, "global_step": 57872, "epoch": 1377} {"train_loss": -5.94740104675293, "global_step": 57873, "epoch": 1377} {"train_loss": -5.8755574226379395, "global_step": 57874, "epoch": 1377} {"train_loss": -5.869143304370699, "global_step": 57875, "epoch": 1377, "val_loss": 61793.80078125} {"train_loss": -5.789017200469971, "global_step": 57876, "epoch": 1378} {"train_loss": -5.831092357635498, "global_step": 57877, "epoch": 1378} {"train_loss": -5.92998743057251, "global_step": 57878, "epoch": 1378} {"train_loss": -5.898636341094971, "global_step": 57879, "epoch": 1378} {"train_loss": -5.922259330749512, "global_step": 57880, "epoch": 1378} {"train_loss": -5.910771369934082, "global_step": 57881, "epoch": 1378} {"train_loss": -5.915902137756348, "global_step": 57882, "epoch": 1378} {"train_loss": -5.941461563110352, "global_step": 57883, "epoch": 1378} {"train_loss": -5.83759069442749, "global_step": 57884, "epoch": 1378} {"train_loss": -5.883648872375488, "global_step": 57885, "epoch": 1378} {"train_loss": -5.970076560974121, "global_step": 57886, "epoch": 1378} {"train_loss": -5.958549499511719, "global_step": 57887, "epoch": 1378} {"train_loss": -5.969465255737305, "global_step": 57888, "epoch": 1378} {"train_loss": -5.897887229919434, "global_step": 57889, "epoch": 1378} {"train_loss": -5.895533561706543, "global_step": 57890, "epoch": 1378} {"train_loss": -5.841136932373047, "global_step": 57891, "epoch": 1378} {"train_loss": -5.926585674285889, "global_step": 57892, "epoch": 1378} {"train_loss": -5.901350021362305, "global_step": 57893, "epoch": 1378} {"train_loss": -5.875020980834961, "global_step": 57894, "epoch": 1378} {"train_loss": -5.858883857727051, "global_step": 57895, "epoch": 1378} {"train_loss": -5.948598861694336, "global_step": 57896, "epoch": 1378} {"train_loss": -5.814803123474121, "global_step": 57897, "epoch": 1378} {"train_loss": -5.844578742980957, "global_step": 57898, "epoch": 1378} {"train_loss": -5.838889122009277, "global_step": 57899, "epoch": 1378} {"train_loss": -5.718816757202148, "global_step": 57900, "epoch": 1378} {"train_loss": -5.770882606506348, "global_step": 57901, "epoch": 1378} {"train_loss": -5.915448188781738, "global_step": 57902, "epoch": 1378} {"train_loss": -5.838318824768066, "global_step": 57903, "epoch": 1378} {"train_loss": -5.856943130493164, "global_step": 57904, "epoch": 1378} {"train_loss": -5.825253963470459, "global_step": 57905, "epoch": 1378} {"train_loss": -5.800572872161865, "global_step": 57906, "epoch": 1378} {"train_loss": -5.885991096496582, "global_step": 57907, "epoch": 1378} {"train_loss": -5.888063430786133, "global_step": 57908, "epoch": 1378} {"train_loss": -5.821999549865723, "global_step": 57909, "epoch": 1378} {"train_loss": -5.801685333251953, "global_step": 57910, "epoch": 1378} {"train_loss": -5.817969799041748, "global_step": 57911, "epoch": 1378} {"train_loss": -5.811210632324219, "global_step": 57912, "epoch": 1378} {"train_loss": -5.997365474700928, "global_step": 57913, "epoch": 1378} {"train_loss": -5.908539772033691, "global_step": 57914, "epoch": 1378} {"train_loss": -5.81915283203125, "global_step": 57915, "epoch": 1378} {"train_loss": -5.8246355056762695, "global_step": 57916, "epoch": 1378} {"train_loss": -5.867479335694086, "global_step": 57917, "epoch": 1378, "val_loss": 61719.34765625} {"train_loss": -5.86616325378418, "global_step": 57918, "epoch": 1379} {"train_loss": -5.986690998077393, "global_step": 57919, "epoch": 1379} {"train_loss": -5.848222732543945, "global_step": 57920, "epoch": 1379} {"train_loss": -5.808019638061523, "global_step": 57921, "epoch": 1379} {"train_loss": -5.898257255554199, "global_step": 57922, "epoch": 1379} {"train_loss": -5.972132205963135, "global_step": 57923, "epoch": 1379} {"train_loss": -5.927664756774902, "global_step": 57924, "epoch": 1379} {"train_loss": -5.905167579650879, "global_step": 57925, "epoch": 1379} {"train_loss": -5.793676376342773, "global_step": 57926, "epoch": 1379} {"train_loss": -5.986185073852539, "global_step": 57927, "epoch": 1379} {"train_loss": -5.80869197845459, "global_step": 57928, "epoch": 1379} {"train_loss": -5.969740867614746, "global_step": 57929, "epoch": 1379} {"train_loss": -5.885414123535156, "global_step": 57930, "epoch": 1379} {"train_loss": -5.819561958312988, "global_step": 57931, "epoch": 1379} {"train_loss": -6.021862983703613, "global_step": 57932, "epoch": 1379} {"train_loss": -5.829057693481445, "global_step": 57933, "epoch": 1379} {"train_loss": -5.9102630615234375, "global_step": 57934, "epoch": 1379} {"train_loss": -5.804457187652588, "global_step": 57935, "epoch": 1379} {"train_loss": -5.882363796234131, "global_step": 57936, "epoch": 1379} {"train_loss": -5.942270278930664, "global_step": 57937, "epoch": 1379} {"train_loss": -5.952803611755371, "global_step": 57938, "epoch": 1379} {"train_loss": -5.912333965301514, "global_step": 57939, "epoch": 1379} {"train_loss": -5.8466901779174805, "global_step": 57940, "epoch": 1379} {"train_loss": -5.8836517333984375, "global_step": 57941, "epoch": 1379} {"train_loss": -5.938250541687012, "global_step": 57942, "epoch": 1379} {"train_loss": -5.817958354949951, "global_step": 57943, "epoch": 1379} {"train_loss": -5.921997547149658, "global_step": 57944, "epoch": 1379} {"train_loss": -5.920757293701172, "global_step": 57945, "epoch": 1379} {"train_loss": -5.885802268981934, "global_step": 57946, "epoch": 1379} {"train_loss": -5.834112167358398, "global_step": 57947, "epoch": 1379} {"train_loss": -5.903350353240967, "global_step": 57948, "epoch": 1379} {"train_loss": -5.935495376586914, "global_step": 57949, "epoch": 1379} {"train_loss": -5.8332319259643555, "global_step": 57950, "epoch": 1379} {"train_loss": -5.889820575714111, "global_step": 57951, "epoch": 1379} {"train_loss": -5.848702430725098, "global_step": 57952, "epoch": 1379} {"train_loss": -5.960282325744629, "global_step": 57953, "epoch": 1379} {"train_loss": -5.972376823425293, "global_step": 57954, "epoch": 1379} {"train_loss": -5.913213729858398, "global_step": 57955, "epoch": 1379} {"train_loss": -6.01713228225708, "global_step": 57956, "epoch": 1379} {"train_loss": -5.970949172973633, "global_step": 57957, "epoch": 1379} {"train_loss": -5.849299430847168, "global_step": 57958, "epoch": 1379} {"train_loss": -5.9001648880186535, "global_step": 57959, "epoch": 1379, "val_loss": 61446.80078125} {"train_loss": -5.983774185180664, "global_step": 57960, "epoch": 1380} {"train_loss": -5.772902965545654, "global_step": 57961, "epoch": 1380} {"train_loss": -5.913534164428711, "global_step": 57962, "epoch": 1380} {"train_loss": -6.0276947021484375, "global_step": 57963, "epoch": 1380} {"train_loss": -5.830060005187988, "global_step": 57964, "epoch": 1380} {"train_loss": -5.752790451049805, "global_step": 57965, "epoch": 1380} {"train_loss": -5.921128273010254, "global_step": 57966, "epoch": 1380} {"train_loss": -5.9406890869140625, "global_step": 57967, "epoch": 1380} {"train_loss": -5.805733680725098, "global_step": 57968, "epoch": 1380} {"train_loss": -5.80817985534668, "global_step": 57969, "epoch": 1380} {"train_loss": -5.946221351623535, "global_step": 57970, "epoch": 1380} {"train_loss": -5.864015579223633, "global_step": 57971, "epoch": 1380} {"train_loss": -5.8558573722839355, "global_step": 57972, "epoch": 1380} {"train_loss": -5.915740489959717, "global_step": 57973, "epoch": 1380} {"train_loss": -5.896174430847168, "global_step": 57974, "epoch": 1380} {"train_loss": -5.887986183166504, "global_step": 57975, "epoch": 1380} {"train_loss": -5.964997291564941, "global_step": 57976, "epoch": 1380} {"train_loss": -5.839839935302734, "global_step": 57977, "epoch": 1380} {"train_loss": -6.00046443939209, "global_step": 57978, "epoch": 1380} {"train_loss": -5.878369331359863, "global_step": 57979, "epoch": 1380} {"train_loss": -5.775504112243652, "global_step": 57980, "epoch": 1380} {"train_loss": -5.846571445465088, "global_step": 57981, "epoch": 1380} {"train_loss": -5.8587541580200195, "global_step": 57982, "epoch": 1380} {"train_loss": -5.810850143432617, "global_step": 57983, "epoch": 1380} {"train_loss": -5.911618232727051, "global_step": 57984, "epoch": 1380} {"train_loss": -5.840939044952393, "global_step": 57985, "epoch": 1380} {"train_loss": -5.760031223297119, "global_step": 57986, "epoch": 1380} {"train_loss": -5.808846473693848, "global_step": 57987, "epoch": 1380} {"train_loss": -5.8115715980529785, "global_step": 57988, "epoch": 1380} {"train_loss": -5.832678318023682, "global_step": 57989, "epoch": 1380} {"train_loss": -5.916158199310303, "global_step": 57990, "epoch": 1380} {"train_loss": -5.9086809158325195, "global_step": 57991, "epoch": 1380} {"train_loss": -5.974013328552246, "global_step": 57992, "epoch": 1380} {"train_loss": -5.906439781188965, "global_step": 57993, "epoch": 1380} {"train_loss": -5.779791831970215, "global_step": 57994, "epoch": 1380} {"train_loss": -5.896901607513428, "global_step": 57995, "epoch": 1380} {"train_loss": -5.958672046661377, "global_step": 57996, "epoch": 1380} {"train_loss": -5.751253128051758, "global_step": 57997, "epoch": 1380} {"train_loss": -5.826844215393066, "global_step": 57998, "epoch": 1380} {"train_loss": -5.748095512390137, "global_step": 57999, "epoch": 1380} {"train_loss": -5.953359603881836, "global_step": 58000, "epoch": 1380} {"train_loss": -5.87065441267831, "global_step": 58001, "epoch": 1380, "val_loss": 61707.609375} {"train_loss": -5.910922527313232, "global_step": 58002, "epoch": 1381} {"train_loss": -5.835745811462402, "global_step": 58003, "epoch": 1381} {"train_loss": -5.848865985870361, "global_step": 58004, "epoch": 1381} {"train_loss": -5.827938079833984, "global_step": 58005, "epoch": 1381} {"train_loss": -5.906573295593262, "global_step": 58006, "epoch": 1381} {"train_loss": -5.867898464202881, "global_step": 58007, "epoch": 1381} {"train_loss": -5.859223365783691, "global_step": 58008, "epoch": 1381} {"train_loss": -5.861349105834961, "global_step": 58009, "epoch": 1381} {"train_loss": -5.896541595458984, "global_step": 58010, "epoch": 1381} {"train_loss": -5.801002502441406, "global_step": 58011, "epoch": 1381} {"train_loss": -5.853507041931152, "global_step": 58012, "epoch": 1381} {"train_loss": -5.8862481117248535, "global_step": 58013, "epoch": 1381} {"train_loss": -5.759504318237305, "global_step": 58014, "epoch": 1381} {"train_loss": -5.941327095031738, "global_step": 58015, "epoch": 1381} {"train_loss": -5.834249496459961, "global_step": 58016, "epoch": 1381} {"train_loss": -5.828311920166016, "global_step": 58017, "epoch": 1381} {"train_loss": -5.9206647872924805, "global_step": 58018, "epoch": 1381} {"train_loss": -5.876241683959961, "global_step": 58019, "epoch": 1381} {"train_loss": -5.842071533203125, "global_step": 58020, "epoch": 1381} {"train_loss": -5.871819496154785, "global_step": 58021, "epoch": 1381} {"train_loss": -5.853201866149902, "global_step": 58022, "epoch": 1381} {"train_loss": -5.862898826599121, "global_step": 58023, "epoch": 1381} {"train_loss": -5.752191066741943, "global_step": 58024, "epoch": 1381} {"train_loss": -5.851283073425293, "global_step": 58025, "epoch": 1381} {"train_loss": -5.8138203620910645, "global_step": 58026, "epoch": 1381} {"train_loss": -5.8397932052612305, "global_step": 58027, "epoch": 1381} {"train_loss": -5.936617851257324, "global_step": 58028, "epoch": 1381} {"train_loss": -5.907742023468018, "global_step": 58029, "epoch": 1381} {"train_loss": -5.784635543823242, "global_step": 58030, "epoch": 1381} {"train_loss": -5.929485321044922, "global_step": 58031, "epoch": 1381} {"train_loss": -5.858010292053223, "global_step": 58032, "epoch": 1381} {"train_loss": -5.86843729019165, "global_step": 58033, "epoch": 1381} {"train_loss": -5.73817253112793, "global_step": 58034, "epoch": 1381} {"train_loss": -5.82794713973999, "global_step": 58035, "epoch": 1381} {"train_loss": -5.877201080322266, "global_step": 58036, "epoch": 1381} {"train_loss": -5.915397644042969, "global_step": 58037, "epoch": 1381} {"train_loss": -6.03950309753418, "global_step": 58038, "epoch": 1381} {"train_loss": -5.756335735321045, "global_step": 58039, "epoch": 1381} {"train_loss": -5.897359848022461, "global_step": 58040, "epoch": 1381} {"train_loss": -5.958681106567383, "global_step": 58041, "epoch": 1381} {"train_loss": -5.872734069824219, "global_step": 58042, "epoch": 1381} {"train_loss": -5.865211248397827, "global_step": 58043, "epoch": 1381, "val_loss": 61289.70703125} {"train_loss": -5.816577911376953, "global_step": 58044, "epoch": 1382} {"train_loss": -5.826460361480713, "global_step": 58045, "epoch": 1382} {"train_loss": -5.9340105056762695, "global_step": 58046, "epoch": 1382} {"train_loss": -5.944230556488037, "global_step": 58047, "epoch": 1382} {"train_loss": -5.975961685180664, "global_step": 58048, "epoch": 1382} {"train_loss": -5.849976539611816, "global_step": 58049, "epoch": 1382} {"train_loss": -5.916748046875, "global_step": 58050, "epoch": 1382} {"train_loss": -5.95150899887085, "global_step": 58051, "epoch": 1382} {"train_loss": -5.890332221984863, "global_step": 58052, "epoch": 1382} {"train_loss": -5.9518585205078125, "global_step": 58053, "epoch": 1382} {"train_loss": -5.918041706085205, "global_step": 58054, "epoch": 1382} {"train_loss": -5.982269287109375, "global_step": 58055, "epoch": 1382} {"train_loss": -5.87833833694458, "global_step": 58056, "epoch": 1382} {"train_loss": -5.967959403991699, "global_step": 58057, "epoch": 1382} {"train_loss": -5.936454772949219, "global_step": 58058, "epoch": 1382} {"train_loss": -5.919726848602295, "global_step": 58059, "epoch": 1382} {"train_loss": -5.975702285766602, "global_step": 58060, "epoch": 1382} {"train_loss": -5.96038818359375, "global_step": 58061, "epoch": 1382} {"train_loss": -5.930745601654053, "global_step": 58062, "epoch": 1382} {"train_loss": -5.902475357055664, "global_step": 58063, "epoch": 1382} {"train_loss": -5.850593566894531, "global_step": 58064, "epoch": 1382} {"train_loss": -5.881133079528809, "global_step": 58065, "epoch": 1382} {"train_loss": -5.811531066894531, "global_step": 58066, "epoch": 1382} {"train_loss": -5.789120674133301, "global_step": 58067, "epoch": 1382} {"train_loss": -5.910282135009766, "global_step": 58068, "epoch": 1382} {"train_loss": -5.836521625518799, "global_step": 58069, "epoch": 1382} {"train_loss": -5.873250961303711, "global_step": 58070, "epoch": 1382} {"train_loss": -5.703951835632324, "global_step": 58071, "epoch": 1382} {"train_loss": -5.9477972984313965, "global_step": 58072, "epoch": 1382} {"train_loss": -5.749768257141113, "global_step": 58073, "epoch": 1382} {"train_loss": -5.802739143371582, "global_step": 58074, "epoch": 1382} {"train_loss": -5.91046142578125, "global_step": 58075, "epoch": 1382} {"train_loss": -6.035355091094971, "global_step": 58076, "epoch": 1382} {"train_loss": -5.725221157073975, "global_step": 58077, "epoch": 1382} {"train_loss": -5.813750267028809, "global_step": 58078, "epoch": 1382} {"train_loss": -5.867862224578857, "global_step": 58079, "epoch": 1382} {"train_loss": -5.845160961151123, "global_step": 58080, "epoch": 1382} {"train_loss": -5.847104072570801, "global_step": 58081, "epoch": 1382} {"train_loss": -5.986060619354248, "global_step": 58082, "epoch": 1382} {"train_loss": -5.873507499694824, "global_step": 58083, "epoch": 1382} {"train_loss": -5.869123935699463, "global_step": 58084, "epoch": 1382} {"train_loss": -5.8833198093232655, "global_step": 58085, "epoch": 1382, "val_loss": 61741.25390625} {"train_loss": -5.805288314819336, "global_step": 58086, "epoch": 1383} {"train_loss": -5.798661708831787, "global_step": 58087, "epoch": 1383} {"train_loss": -5.877743721008301, "global_step": 58088, "epoch": 1383} {"train_loss": -5.738944053649902, "global_step": 58089, "epoch": 1383} {"train_loss": -5.752840042114258, "global_step": 58090, "epoch": 1383} {"train_loss": -5.832962989807129, "global_step": 58091, "epoch": 1383} {"train_loss": -5.794744491577148, "global_step": 58092, "epoch": 1383} {"train_loss": -5.8222150802612305, "global_step": 58093, "epoch": 1383} {"train_loss": -5.911434650421143, "global_step": 58094, "epoch": 1383} {"train_loss": -5.832404136657715, "global_step": 58095, "epoch": 1383} {"train_loss": -5.954352378845215, "global_step": 58096, "epoch": 1383} {"train_loss": -5.777228832244873, "global_step": 58097, "epoch": 1383} {"train_loss": -5.855754375457764, "global_step": 58098, "epoch": 1383} {"train_loss": -5.930136680603027, "global_step": 58099, "epoch": 1383} {"train_loss": -5.9107160568237305, "global_step": 58100, "epoch": 1383} {"train_loss": -5.900032997131348, "global_step": 58101, "epoch": 1383} {"train_loss": -5.8897175788879395, "global_step": 58102, "epoch": 1383} {"train_loss": -5.952465057373047, "global_step": 58103, "epoch": 1383} {"train_loss": -5.820478439331055, "global_step": 58104, "epoch": 1383} {"train_loss": -5.828636646270752, "global_step": 58105, "epoch": 1383} {"train_loss": -5.917820930480957, "global_step": 58106, "epoch": 1383} {"train_loss": -5.823043346405029, "global_step": 58107, "epoch": 1383} {"train_loss": -5.899240493774414, "global_step": 58108, "epoch": 1383} {"train_loss": -5.967624664306641, "global_step": 58109, "epoch": 1383} {"train_loss": -5.841666221618652, "global_step": 58110, "epoch": 1383} {"train_loss": -5.938840389251709, "global_step": 58111, "epoch": 1383} {"train_loss": -5.936033248901367, "global_step": 58112, "epoch": 1383} {"train_loss": -5.899713516235352, "global_step": 58113, "epoch": 1383} {"train_loss": -5.88062858581543, "global_step": 58114, "epoch": 1383} {"train_loss": -5.893283843994141, "global_step": 58115, "epoch": 1383} {"train_loss": -5.93958854675293, "global_step": 58116, "epoch": 1383} {"train_loss": -5.8540849685668945, "global_step": 58117, "epoch": 1383} {"train_loss": -5.778933525085449, "global_step": 58118, "epoch": 1383} {"train_loss": -5.833776473999023, "global_step": 58119, "epoch": 1383} {"train_loss": -5.864394187927246, "global_step": 58120, "epoch": 1383} {"train_loss": -5.922530174255371, "global_step": 58121, "epoch": 1383} {"train_loss": -5.825625419616699, "global_step": 58122, "epoch": 1383} {"train_loss": -5.789387226104736, "global_step": 58123, "epoch": 1383} {"train_loss": -5.750110626220703, "global_step": 58124, "epoch": 1383} {"train_loss": -5.929335594177246, "global_step": 58125, "epoch": 1383} {"train_loss": -6.037967681884766, "global_step": 58126, "epoch": 1383} {"train_loss": -5.863456510362171, "global_step": 58127, "epoch": 1383, "val_loss": 61634.87890625} {"train_loss": -5.845588684082031, "global_step": 58128, "epoch": 1384} {"train_loss": -5.891945838928223, "global_step": 58129, "epoch": 1384} {"train_loss": -5.910922050476074, "global_step": 58130, "epoch": 1384} {"train_loss": -5.93044376373291, "global_step": 58131, "epoch": 1384} {"train_loss": -5.785430431365967, "global_step": 58132, "epoch": 1384} {"train_loss": -5.8876237869262695, "global_step": 58133, "epoch": 1384} {"train_loss": -5.822983264923096, "global_step": 58134, "epoch": 1384} {"train_loss": -5.924965858459473, "global_step": 58135, "epoch": 1384} {"train_loss": -5.908600330352783, "global_step": 58136, "epoch": 1384} {"train_loss": -5.838006973266602, "global_step": 58137, "epoch": 1384} {"train_loss": -5.867065906524658, "global_step": 58138, "epoch": 1384} {"train_loss": -6.060583114624023, "global_step": 58139, "epoch": 1384} {"train_loss": -5.812835693359375, "global_step": 58140, "epoch": 1384} {"train_loss": -5.891897678375244, "global_step": 58141, "epoch": 1384} {"train_loss": -5.85790491104126, "global_step": 58142, "epoch": 1384} {"train_loss": -5.926058769226074, "global_step": 58143, "epoch": 1384} {"train_loss": -5.848158359527588, "global_step": 58144, "epoch": 1384} {"train_loss": -5.854005813598633, "global_step": 58145, "epoch": 1384} {"train_loss": -5.650570869445801, "global_step": 58146, "epoch": 1384} {"train_loss": -5.90397834777832, "global_step": 58147, "epoch": 1384} {"train_loss": -5.866625785827637, "global_step": 58148, "epoch": 1384} {"train_loss": -5.860128402709961, "global_step": 58149, "epoch": 1384} {"train_loss": -5.812857151031494, "global_step": 58150, "epoch": 1384} {"train_loss": -5.837157249450684, "global_step": 58151, "epoch": 1384} {"train_loss": -5.805134296417236, "global_step": 58152, "epoch": 1384} {"train_loss": -5.992046356201172, "global_step": 58153, "epoch": 1384} {"train_loss": -5.883504867553711, "global_step": 58154, "epoch": 1384} {"train_loss": -5.982810974121094, "global_step": 58155, "epoch": 1384} {"train_loss": -5.837603569030762, "global_step": 58156, "epoch": 1384} {"train_loss": -5.837973594665527, "global_step": 58157, "epoch": 1384} {"train_loss": -5.850088596343994, "global_step": 58158, "epoch": 1384} {"train_loss": -5.770010948181152, "global_step": 58159, "epoch": 1384} {"train_loss": -5.932889461517334, "global_step": 58160, "epoch": 1384} {"train_loss": -5.972403049468994, "global_step": 58161, "epoch": 1384} {"train_loss": -5.935086250305176, "global_step": 58162, "epoch": 1384} {"train_loss": -5.889019966125488, "global_step": 58163, "epoch": 1384} {"train_loss": -5.978983402252197, "global_step": 58164, "epoch": 1384} {"train_loss": -5.887539863586426, "global_step": 58165, "epoch": 1384} {"train_loss": -5.833103179931641, "global_step": 58166, "epoch": 1384} {"train_loss": -5.782595634460449, "global_step": 58167, "epoch": 1384} {"train_loss": -5.985775947570801, "global_step": 58168, "epoch": 1384} {"train_loss": -5.876021918796358, "global_step": 58169, "epoch": 1384, "val_loss": 61453.3671875} {"train_loss": -5.84372615814209, "global_step": 58170, "epoch": 1385} {"train_loss": -6.062532424926758, "global_step": 58171, "epoch": 1385} {"train_loss": -5.763523101806641, "global_step": 58172, "epoch": 1385} {"train_loss": -6.067203044891357, "global_step": 58173, "epoch": 1385} {"train_loss": -5.764725208282471, "global_step": 58174, "epoch": 1385} {"train_loss": -5.738805770874023, "global_step": 58175, "epoch": 1385} {"train_loss": -5.811893463134766, "global_step": 58176, "epoch": 1385} {"train_loss": -5.6644392013549805, "global_step": 58177, "epoch": 1385} {"train_loss": -5.95094633102417, "global_step": 58178, "epoch": 1385} {"train_loss": -5.643467903137207, "global_step": 58179, "epoch": 1385} {"train_loss": -5.781355857849121, "global_step": 58180, "epoch": 1385} {"train_loss": -5.829267501831055, "global_step": 58181, "epoch": 1385} {"train_loss": -5.7211198806762695, "global_step": 58182, "epoch": 1385} {"train_loss": -5.896124839782715, "global_step": 58183, "epoch": 1385} {"train_loss": -5.7385358810424805, "global_step": 58184, "epoch": 1385} {"train_loss": -5.964815139770508, "global_step": 58185, "epoch": 1385} {"train_loss": -5.635920524597168, "global_step": 58186, "epoch": 1385} {"train_loss": -5.832278728485107, "global_step": 58187, "epoch": 1385} {"train_loss": -5.775489330291748, "global_step": 58188, "epoch": 1385} {"train_loss": -5.952371120452881, "global_step": 58189, "epoch": 1385} {"train_loss": -5.815485000610352, "global_step": 58190, "epoch": 1385} {"train_loss": -5.833951950073242, "global_step": 58191, "epoch": 1385} {"train_loss": -5.866222381591797, "global_step": 58192, "epoch": 1385} {"train_loss": -5.848776340484619, "global_step": 58193, "epoch": 1385} {"train_loss": -5.780751705169678, "global_step": 58194, "epoch": 1385} {"train_loss": -5.777989387512207, "global_step": 58195, "epoch": 1385} {"train_loss": -5.761545181274414, "global_step": 58196, "epoch": 1385} {"train_loss": -5.825323104858398, "global_step": 58197, "epoch": 1385} {"train_loss": -5.849021911621094, "global_step": 58198, "epoch": 1385} {"train_loss": -5.709416389465332, "global_step": 58199, "epoch": 1385} {"train_loss": -5.823280334472656, "global_step": 58200, "epoch": 1385} {"train_loss": -5.854080677032471, "global_step": 58201, "epoch": 1385} {"train_loss": -5.925982475280762, "global_step": 58202, "epoch": 1385} {"train_loss": -5.771996021270752, "global_step": 58203, "epoch": 1385} {"train_loss": -5.866509437561035, "global_step": 58204, "epoch": 1385} {"train_loss": -5.812824726104736, "global_step": 58205, "epoch": 1385} {"train_loss": -5.787254333496094, "global_step": 58206, "epoch": 1385} {"train_loss": -5.885615348815918, "global_step": 58207, "epoch": 1385} {"train_loss": -5.902835845947266, "global_step": 58208, "epoch": 1385} {"train_loss": -5.853212356567383, "global_step": 58209, "epoch": 1385} {"train_loss": -5.898922920227051, "global_step": 58210, "epoch": 1385} {"train_loss": -5.827184881482806, "global_step": 58211, "epoch": 1385, "val_loss": 61470.25390625} {"train_loss": -5.887178897857666, "global_step": 58212, "epoch": 1386} {"train_loss": -5.934336185455322, "global_step": 58213, "epoch": 1386} {"train_loss": -5.9380950927734375, "global_step": 58214, "epoch": 1386} {"train_loss": -5.847403526306152, "global_step": 58215, "epoch": 1386} {"train_loss": -5.925819396972656, "global_step": 58216, "epoch": 1386} {"train_loss": -5.883121490478516, "global_step": 58217, "epoch": 1386} {"train_loss": -5.863067626953125, "global_step": 58218, "epoch": 1386} {"train_loss": -6.041286468505859, "global_step": 58219, "epoch": 1386} {"train_loss": -5.9372758865356445, "global_step": 58220, "epoch": 1386} {"train_loss": -5.865840435028076, "global_step": 58221, "epoch": 1386} {"train_loss": -5.860888957977295, "global_step": 58222, "epoch": 1386} {"train_loss": -5.859353065490723, "global_step": 58223, "epoch": 1386} {"train_loss": -5.842826843261719, "global_step": 58224, "epoch": 1386} {"train_loss": -5.97994327545166, "global_step": 58225, "epoch": 1386} {"train_loss": -5.923882484436035, "global_step": 58226, "epoch": 1386} {"train_loss": -5.841504096984863, "global_step": 58227, "epoch": 1386} {"train_loss": -5.976212024688721, "global_step": 58228, "epoch": 1386} {"train_loss": -5.929620265960693, "global_step": 58229, "epoch": 1386} {"train_loss": -5.80189323425293, "global_step": 58230, "epoch": 1386} {"train_loss": -5.848508834838867, "global_step": 58231, "epoch": 1386} {"train_loss": -5.965029716491699, "global_step": 58232, "epoch": 1386} {"train_loss": -5.900566101074219, "global_step": 58233, "epoch": 1386} {"train_loss": -5.9901556968688965, "global_step": 58234, "epoch": 1386} {"train_loss": -5.840989112854004, "global_step": 58235, "epoch": 1386} {"train_loss": -5.915436267852783, "global_step": 58236, "epoch": 1386} {"train_loss": -5.9068803787231445, "global_step": 58237, "epoch": 1386} {"train_loss": -5.915830612182617, "global_step": 58238, "epoch": 1386} {"train_loss": -5.928315162658691, "global_step": 58239, "epoch": 1386} {"train_loss": -5.898994445800781, "global_step": 58240, "epoch": 1386} {"train_loss": -5.938765525817871, "global_step": 58241, "epoch": 1386} {"train_loss": -5.917726516723633, "global_step": 58242, "epoch": 1386} {"train_loss": -5.963991165161133, "global_step": 58243, "epoch": 1386} {"train_loss": -5.852874279022217, "global_step": 58244, "epoch": 1386} {"train_loss": -5.943057060241699, "global_step": 58245, "epoch": 1386} {"train_loss": -5.871919631958008, "global_step": 58246, "epoch": 1386} {"train_loss": -5.836640357971191, "global_step": 58247, "epoch": 1386} {"train_loss": -5.886059761047363, "global_step": 58248, "epoch": 1386} {"train_loss": -5.713364124298096, "global_step": 58249, "epoch": 1386} {"train_loss": -5.892852306365967, "global_step": 58250, "epoch": 1386} {"train_loss": -5.847673416137695, "global_step": 58251, "epoch": 1386} {"train_loss": -5.88401985168457, "global_step": 58252, "epoch": 1386} {"train_loss": -5.897358190445673, "global_step": 58253, "epoch": 1386, "val_loss": 61592.68359375} {"train_loss": -5.939569473266602, "global_step": 58254, "epoch": 1387} {"train_loss": -5.7654829025268555, "global_step": 58255, "epoch": 1387} {"train_loss": -5.884753227233887, "global_step": 58256, "epoch": 1387} {"train_loss": -5.762228012084961, "global_step": 58257, "epoch": 1387} {"train_loss": -5.841729164123535, "global_step": 58258, "epoch": 1387} {"train_loss": -5.9276885986328125, "global_step": 58259, "epoch": 1387} {"train_loss": -5.833791732788086, "global_step": 58260, "epoch": 1387} {"train_loss": -5.876943111419678, "global_step": 58261, "epoch": 1387} {"train_loss": -6.021901607513428, "global_step": 58262, "epoch": 1387} {"train_loss": -5.97043514251709, "global_step": 58263, "epoch": 1387} {"train_loss": -5.9857177734375, "global_step": 58264, "epoch": 1387} {"train_loss": -5.933272361755371, "global_step": 58265, "epoch": 1387} {"train_loss": -5.727112770080566, "global_step": 58266, "epoch": 1387} {"train_loss": -5.96242618560791, "global_step": 58267, "epoch": 1387} {"train_loss": -5.928885459899902, "global_step": 58268, "epoch": 1387} {"train_loss": -5.756882667541504, "global_step": 58269, "epoch": 1387} {"train_loss": -5.763066291809082, "global_step": 58270, "epoch": 1387} {"train_loss": -5.7646965980529785, "global_step": 58271, "epoch": 1387} {"train_loss": -5.839962959289551, "global_step": 58272, "epoch": 1387} {"train_loss": -5.896785736083984, "global_step": 58273, "epoch": 1387} {"train_loss": -5.976293563842773, "global_step": 58274, "epoch": 1387} {"train_loss": -5.799370288848877, "global_step": 58275, "epoch": 1387} {"train_loss": -5.84822940826416, "global_step": 58276, "epoch": 1387} {"train_loss": -5.863483428955078, "global_step": 58277, "epoch": 1387} {"train_loss": -5.8997297286987305, "global_step": 58278, "epoch": 1387} {"train_loss": -5.823404312133789, "global_step": 58279, "epoch": 1387} {"train_loss": -5.872323989868164, "global_step": 58280, "epoch": 1387} {"train_loss": -5.960546970367432, "global_step": 58281, "epoch": 1387} {"train_loss": -5.9683837890625, "global_step": 58282, "epoch": 1387} {"train_loss": -5.908195495605469, "global_step": 58283, "epoch": 1387} {"train_loss": -5.855531692504883, "global_step": 58284, "epoch": 1387} {"train_loss": -5.839934349060059, "global_step": 58285, "epoch": 1387} {"train_loss": -5.842832565307617, "global_step": 58286, "epoch": 1387} {"train_loss": -5.749724388122559, "global_step": 58287, "epoch": 1387} {"train_loss": -5.831258773803711, "global_step": 58288, "epoch": 1387} {"train_loss": -5.786250114440918, "global_step": 58289, "epoch": 1387} {"train_loss": -5.963837623596191, "global_step": 58290, "epoch": 1387} {"train_loss": -5.9262800216674805, "global_step": 58291, "epoch": 1387} {"train_loss": -5.84691047668457, "global_step": 58292, "epoch": 1387} {"train_loss": -5.783421039581299, "global_step": 58293, "epoch": 1387} {"train_loss": -5.813011646270752, "global_step": 58294, "epoch": 1387} {"train_loss": -5.866064650671823, "global_step": 58295, "epoch": 1387, "val_loss": 61527.734375} {"train_loss": -5.866907596588135, "global_step": 58296, "epoch": 1388} {"train_loss": -5.7720537185668945, "global_step": 58297, "epoch": 1388} {"train_loss": -6.044347763061523, "global_step": 58298, "epoch": 1388} {"train_loss": -6.028108596801758, "global_step": 58299, "epoch": 1388} {"train_loss": -5.8268303871154785, "global_step": 58300, "epoch": 1388} {"train_loss": -5.937590599060059, "global_step": 58301, "epoch": 1388} {"train_loss": -5.852529525756836, "global_step": 58302, "epoch": 1388} {"train_loss": -5.669289588928223, "global_step": 58303, "epoch": 1388} {"train_loss": -5.904682636260986, "global_step": 58304, "epoch": 1388} {"train_loss": -5.938215255737305, "global_step": 58305, "epoch": 1388} {"train_loss": -5.887044906616211, "global_step": 58306, "epoch": 1388} {"train_loss": -5.882830619812012, "global_step": 58307, "epoch": 1388} {"train_loss": -5.7724151611328125, "global_step": 58308, "epoch": 1388} {"train_loss": -5.925646781921387, "global_step": 58309, "epoch": 1388} {"train_loss": -5.958490371704102, "global_step": 58310, "epoch": 1388} {"train_loss": -5.807215690612793, "global_step": 58311, "epoch": 1388} {"train_loss": -5.9307169914245605, "global_step": 58312, "epoch": 1388} {"train_loss": -5.864179611206055, "global_step": 58313, "epoch": 1388} {"train_loss": -5.964303016662598, "global_step": 58314, "epoch": 1388} {"train_loss": -5.834212303161621, "global_step": 58315, "epoch": 1388} {"train_loss": -5.8959574699401855, "global_step": 58316, "epoch": 1388} {"train_loss": -5.879809379577637, "global_step": 58317, "epoch": 1388} {"train_loss": -5.956058025360107, "global_step": 58318, "epoch": 1388} {"train_loss": -5.810875415802002, "global_step": 58319, "epoch": 1388} {"train_loss": -6.003514289855957, "global_step": 58320, "epoch": 1388} {"train_loss": -5.960206985473633, "global_step": 58321, "epoch": 1388} {"train_loss": -5.884781837463379, "global_step": 58322, "epoch": 1388} {"train_loss": -5.780722618103027, "global_step": 58323, "epoch": 1388} {"train_loss": -5.899322509765625, "global_step": 58324, "epoch": 1388} {"train_loss": -5.8294854164123535, "global_step": 58325, "epoch": 1388} {"train_loss": -5.807413101196289, "global_step": 58326, "epoch": 1388} {"train_loss": -5.894010066986084, "global_step": 58327, "epoch": 1388} {"train_loss": -5.89241886138916, "global_step": 58328, "epoch": 1388} {"train_loss": -5.9782819747924805, "global_step": 58329, "epoch": 1388} {"train_loss": -5.958250999450684, "global_step": 58330, "epoch": 1388} {"train_loss": -5.84846830368042, "global_step": 58331, "epoch": 1388} {"train_loss": -5.880585670471191, "global_step": 58332, "epoch": 1388} {"train_loss": -5.82457160949707, "global_step": 58333, "epoch": 1388} {"train_loss": -5.961005687713623, "global_step": 58334, "epoch": 1388} {"train_loss": -5.926299095153809, "global_step": 58335, "epoch": 1388} {"train_loss": -5.901058673858643, "global_step": 58336, "epoch": 1388} {"train_loss": -5.888910986128307, "global_step": 58337, "epoch": 1388, "val_loss": 61217.60546875} {"train_loss": -5.950207710266113, "global_step": 58338, "epoch": 1389} {"train_loss": -5.953880786895752, "global_step": 58339, "epoch": 1389} {"train_loss": -5.882564067840576, "global_step": 58340, "epoch": 1389} {"train_loss": -5.817111015319824, "global_step": 58341, "epoch": 1389} {"train_loss": -5.916406631469727, "global_step": 58342, "epoch": 1389} {"train_loss": -5.981625556945801, "global_step": 58343, "epoch": 1389} {"train_loss": -5.946296691894531, "global_step": 58344, "epoch": 1389} {"train_loss": -5.88796329498291, "global_step": 58345, "epoch": 1389} {"train_loss": -5.806150436401367, "global_step": 58346, "epoch": 1389} {"train_loss": -5.879405975341797, "global_step": 58347, "epoch": 1389} {"train_loss": -5.867859363555908, "global_step": 58348, "epoch": 1389} {"train_loss": -5.8575029373168945, "global_step": 58349, "epoch": 1389} {"train_loss": -5.910076141357422, "global_step": 58350, "epoch": 1389} {"train_loss": -5.922720909118652, "global_step": 58351, "epoch": 1389} {"train_loss": -5.805269241333008, "global_step": 58352, "epoch": 1389} {"train_loss": -5.889433860778809, "global_step": 58353, "epoch": 1389} {"train_loss": -5.840852737426758, "global_step": 58354, "epoch": 1389} {"train_loss": -5.867753982543945, "global_step": 58355, "epoch": 1389} {"train_loss": -5.804537773132324, "global_step": 58356, "epoch": 1389} {"train_loss": -5.93897008895874, "global_step": 58357, "epoch": 1389} {"train_loss": -5.927842140197754, "global_step": 58358, "epoch": 1389} {"train_loss": -5.939624786376953, "global_step": 58359, "epoch": 1389} {"train_loss": -5.888106822967529, "global_step": 58360, "epoch": 1389} {"train_loss": -5.860523223876953, "global_step": 58361, "epoch": 1389} {"train_loss": -5.944891929626465, "global_step": 58362, "epoch": 1389} {"train_loss": -6.040126800537109, "global_step": 58363, "epoch": 1389} {"train_loss": -5.925188064575195, "global_step": 58364, "epoch": 1389} {"train_loss": -5.96787691116333, "global_step": 58365, "epoch": 1389} {"train_loss": -5.859738349914551, "global_step": 58366, "epoch": 1389} {"train_loss": -5.887005805969238, "global_step": 58367, "epoch": 1389} {"train_loss": -5.838139533996582, "global_step": 58368, "epoch": 1389} {"train_loss": -5.912067413330078, "global_step": 58369, "epoch": 1389} {"train_loss": -5.976053237915039, "global_step": 58370, "epoch": 1389} {"train_loss": -5.845170497894287, "global_step": 58371, "epoch": 1389} {"train_loss": -5.9342780113220215, "global_step": 58372, "epoch": 1389} {"train_loss": -5.926958084106445, "global_step": 58373, "epoch": 1389} {"train_loss": -5.760107517242432, "global_step": 58374, "epoch": 1389} {"train_loss": -5.895888805389404, "global_step": 58375, "epoch": 1389} {"train_loss": -5.8780317306518555, "global_step": 58376, "epoch": 1389} {"train_loss": -5.8336005210876465, "global_step": 58377, "epoch": 1389} {"train_loss": -5.960637092590332, "global_step": 58378, "epoch": 1389} {"train_loss": -5.8922373567308695, "global_step": 58379, "epoch": 1389, "val_loss": 61711.08984375} {"train_loss": -5.906630992889404, "global_step": 58380, "epoch": 1390} {"train_loss": -5.90339469909668, "global_step": 58381, "epoch": 1390} {"train_loss": -5.808918476104736, "global_step": 58382, "epoch": 1390} {"train_loss": -5.925236701965332, "global_step": 58383, "epoch": 1390} {"train_loss": -5.905609130859375, "global_step": 58384, "epoch": 1390} {"train_loss": -5.791949272155762, "global_step": 58385, "epoch": 1390} {"train_loss": -5.981355667114258, "global_step": 58386, "epoch": 1390} {"train_loss": -5.7441020011901855, "global_step": 58387, "epoch": 1390} {"train_loss": -5.848123073577881, "global_step": 58388, "epoch": 1390} {"train_loss": -5.922360897064209, "global_step": 58389, "epoch": 1390} {"train_loss": -5.872208118438721, "global_step": 58390, "epoch": 1390} {"train_loss": -5.853002548217773, "global_step": 58391, "epoch": 1390} {"train_loss": -5.889590263366699, "global_step": 58392, "epoch": 1390} {"train_loss": -5.850083351135254, "global_step": 58393, "epoch": 1390} {"train_loss": -5.9680633544921875, "global_step": 58394, "epoch": 1390} {"train_loss": -5.836924076080322, "global_step": 58395, "epoch": 1390} {"train_loss": -5.836312294006348, "global_step": 58396, "epoch": 1390} {"train_loss": -5.92764949798584, "global_step": 58397, "epoch": 1390} {"train_loss": -5.828888893127441, "global_step": 58398, "epoch": 1390} {"train_loss": -5.891772270202637, "global_step": 58399, "epoch": 1390} {"train_loss": -5.940085411071777, "global_step": 58400, "epoch": 1390} {"train_loss": -5.849725723266602, "global_step": 58401, "epoch": 1390} {"train_loss": -5.823162078857422, "global_step": 58402, "epoch": 1390} {"train_loss": -5.837328910827637, "global_step": 58403, "epoch": 1390} {"train_loss": -5.973892688751221, "global_step": 58404, "epoch": 1390} {"train_loss": -5.91436243057251, "global_step": 58405, "epoch": 1390} {"train_loss": -5.942904949188232, "global_step": 58406, "epoch": 1390} {"train_loss": -6.024144172668457, "global_step": 58407, "epoch": 1390} {"train_loss": -5.84951114654541, "global_step": 58408, "epoch": 1390} {"train_loss": -5.932782173156738, "global_step": 58409, "epoch": 1390} {"train_loss": -5.892374038696289, "global_step": 58410, "epoch": 1390} {"train_loss": -5.938277244567871, "global_step": 58411, "epoch": 1390} {"train_loss": -5.99233341217041, "global_step": 58412, "epoch": 1390} {"train_loss": -5.9229631423950195, "global_step": 58413, "epoch": 1390} {"train_loss": -5.797948837280273, "global_step": 58414, "epoch": 1390} {"train_loss": -5.829442024230957, "global_step": 58415, "epoch": 1390} {"train_loss": -5.8126959800720215, "global_step": 58416, "epoch": 1390} {"train_loss": -5.873188018798828, "global_step": 58417, "epoch": 1390} {"train_loss": -5.8451128005981445, "global_step": 58418, "epoch": 1390} {"train_loss": -5.90926456451416, "global_step": 58419, "epoch": 1390} {"train_loss": -5.930797100067139, "global_step": 58420, "epoch": 1390} {"train_loss": -5.884047973723638, "global_step": 58421, "epoch": 1390, "val_loss": 61798.40625} {"train_loss": -5.926133632659912, "global_step": 58422, "epoch": 1391} {"train_loss": -5.904755115509033, "global_step": 58423, "epoch": 1391} {"train_loss": -5.816183090209961, "global_step": 58424, "epoch": 1391} {"train_loss": -5.895325183868408, "global_step": 58425, "epoch": 1391} {"train_loss": -5.9727463722229, "global_step": 58426, "epoch": 1391} {"train_loss": -5.804311752319336, "global_step": 58427, "epoch": 1391} {"train_loss": -5.856864929199219, "global_step": 58428, "epoch": 1391} {"train_loss": -5.849231719970703, "global_step": 58429, "epoch": 1391} {"train_loss": -5.768746376037598, "global_step": 58430, "epoch": 1391} {"train_loss": -5.780503273010254, "global_step": 58431, "epoch": 1391} {"train_loss": -5.820012092590332, "global_step": 58432, "epoch": 1391} {"train_loss": -5.869974136352539, "global_step": 58433, "epoch": 1391} {"train_loss": -5.876036643981934, "global_step": 58434, "epoch": 1391} {"train_loss": -5.742567539215088, "global_step": 58435, "epoch": 1391} {"train_loss": -5.7532267570495605, "global_step": 58436, "epoch": 1391} {"train_loss": -5.7130279541015625, "global_step": 58437, "epoch": 1391} {"train_loss": -5.884387969970703, "global_step": 58438, "epoch": 1391} {"train_loss": -5.967232704162598, "global_step": 58439, "epoch": 1391} {"train_loss": -5.887264728546143, "global_step": 58440, "epoch": 1391} {"train_loss": -5.919852256774902, "global_step": 58441, "epoch": 1391} {"train_loss": -5.864341735839844, "global_step": 58442, "epoch": 1391} {"train_loss": -5.931920051574707, "global_step": 58443, "epoch": 1391} {"train_loss": -5.844301700592041, "global_step": 58444, "epoch": 1391} {"train_loss": -5.805736541748047, "global_step": 58445, "epoch": 1391} {"train_loss": -5.8490729331970215, "global_step": 58446, "epoch": 1391} {"train_loss": -5.837456226348877, "global_step": 58447, "epoch": 1391} {"train_loss": -5.771961688995361, "global_step": 58448, "epoch": 1391} {"train_loss": -5.833367347717285, "global_step": 58449, "epoch": 1391} {"train_loss": -5.820686340332031, "global_step": 58450, "epoch": 1391} {"train_loss": -5.935692310333252, "global_step": 58451, "epoch": 1391} {"train_loss": -5.7347564697265625, "global_step": 58452, "epoch": 1391} {"train_loss": -5.935269832611084, "global_step": 58453, "epoch": 1391} {"train_loss": -5.802777290344238, "global_step": 58454, "epoch": 1391} {"train_loss": -5.923561096191406, "global_step": 58455, "epoch": 1391} {"train_loss": -5.795285224914551, "global_step": 58456, "epoch": 1391} {"train_loss": -5.822988033294678, "global_step": 58457, "epoch": 1391} {"train_loss": -6.034386157989502, "global_step": 58458, "epoch": 1391} {"train_loss": -5.849472522735596, "global_step": 58459, "epoch": 1391} {"train_loss": -5.9579057693481445, "global_step": 58460, "epoch": 1391} {"train_loss": -5.870783805847168, "global_step": 58461, "epoch": 1391} {"train_loss": -5.937346458435059, "global_step": 58462, "epoch": 1391} {"train_loss": -5.860662131082444, "global_step": 58463, "epoch": 1391, "val_loss": 61284.265625} {"train_loss": -5.921082019805908, "global_step": 58464, "epoch": 1392} {"train_loss": -5.988099098205566, "global_step": 58465, "epoch": 1392} {"train_loss": -5.993591785430908, "global_step": 58466, "epoch": 1392} {"train_loss": -5.93589973449707, "global_step": 58467, "epoch": 1392} {"train_loss": -6.016493320465088, "global_step": 58468, "epoch": 1392} {"train_loss": -6.051878452301025, "global_step": 58469, "epoch": 1392} {"train_loss": -5.791665077209473, "global_step": 58470, "epoch": 1392} {"train_loss": -5.869721412658691, "global_step": 58471, "epoch": 1392} {"train_loss": -5.900572776794434, "global_step": 58472, "epoch": 1392} {"train_loss": -5.9856672286987305, "global_step": 58473, "epoch": 1392} {"train_loss": -5.83327579498291, "global_step": 58474, "epoch": 1392} {"train_loss": -5.858722686767578, "global_step": 58475, "epoch": 1392} {"train_loss": -5.8364458084106445, "global_step": 58476, "epoch": 1392} {"train_loss": -5.847607612609863, "global_step": 58477, "epoch": 1392} {"train_loss": -5.804359436035156, "global_step": 58478, "epoch": 1392} {"train_loss": -5.895144462585449, "global_step": 58479, "epoch": 1392} {"train_loss": -5.798760414123535, "global_step": 58480, "epoch": 1392} {"train_loss": -5.946703910827637, "global_step": 58481, "epoch": 1392} {"train_loss": -5.725673675537109, "global_step": 58482, "epoch": 1392} {"train_loss": -5.852718353271484, "global_step": 58483, "epoch": 1392} {"train_loss": -5.789910316467285, "global_step": 58484, "epoch": 1392} {"train_loss": -5.791176795959473, "global_step": 58485, "epoch": 1392} {"train_loss": -5.934054374694824, "global_step": 58486, "epoch": 1392} {"train_loss": -5.758065700531006, "global_step": 58487, "epoch": 1392} {"train_loss": -5.8447089195251465, "global_step": 58488, "epoch": 1392} {"train_loss": -5.847434043884277, "global_step": 58489, "epoch": 1392} {"train_loss": -5.611549377441406, "global_step": 58490, "epoch": 1392} {"train_loss": -5.741596221923828, "global_step": 58491, "epoch": 1392} {"train_loss": -5.828706741333008, "global_step": 58492, "epoch": 1392} {"train_loss": -5.795620918273926, "global_step": 58493, "epoch": 1392} {"train_loss": -5.800139427185059, "global_step": 58494, "epoch": 1392} {"train_loss": -5.729848384857178, "global_step": 58495, "epoch": 1392} {"train_loss": -5.820366859436035, "global_step": 58496, "epoch": 1392} {"train_loss": -5.893987655639648, "global_step": 58497, "epoch": 1392} {"train_loss": -5.796328544616699, "global_step": 58498, "epoch": 1392} {"train_loss": -5.958270072937012, "global_step": 58499, "epoch": 1392} {"train_loss": -5.851344108581543, "global_step": 58500, "epoch": 1392} {"train_loss": -5.9235920906066895, "global_step": 58501, "epoch": 1392} {"train_loss": -5.876234531402588, "global_step": 58502, "epoch": 1392} {"train_loss": -5.841740608215332, "global_step": 58503, "epoch": 1392} {"train_loss": -5.749977111816406, "global_step": 58504, "epoch": 1392} {"train_loss": -5.853939374287923, "global_step": 58505, "epoch": 1392, "val_loss": 61529.52734375} {"train_loss": -5.8853044509887695, "global_step": 58506, "epoch": 1393} {"train_loss": -5.886650085449219, "global_step": 58507, "epoch": 1393} {"train_loss": -5.881602764129639, "global_step": 58508, "epoch": 1393} {"train_loss": -5.940857410430908, "global_step": 58509, "epoch": 1393} {"train_loss": -5.870882987976074, "global_step": 58510, "epoch": 1393} {"train_loss": -5.854847431182861, "global_step": 58511, "epoch": 1393} {"train_loss": -5.972682476043701, "global_step": 58512, "epoch": 1393} {"train_loss": -5.82196044921875, "global_step": 58513, "epoch": 1393} {"train_loss": -5.796797752380371, "global_step": 58514, "epoch": 1393} {"train_loss": -5.750489711761475, "global_step": 58515, "epoch": 1393} {"train_loss": -5.858908653259277, "global_step": 58516, "epoch": 1393} {"train_loss": -5.91869592666626, "global_step": 58517, "epoch": 1393} {"train_loss": -5.962220668792725, "global_step": 58518, "epoch": 1393} {"train_loss": -5.80073881149292, "global_step": 58519, "epoch": 1393} {"train_loss": -5.882145881652832, "global_step": 58520, "epoch": 1393} {"train_loss": -5.982375621795654, "global_step": 58521, "epoch": 1393} {"train_loss": -5.893415927886963, "global_step": 58522, "epoch": 1393} {"train_loss": -5.889811992645264, "global_step": 58523, "epoch": 1393} {"train_loss": -5.838616371154785, "global_step": 58524, "epoch": 1393} {"train_loss": -5.828906059265137, "global_step": 58525, "epoch": 1393} {"train_loss": -5.838529586791992, "global_step": 58526, "epoch": 1393} {"train_loss": -5.861152648925781, "global_step": 58527, "epoch": 1393} {"train_loss": -5.916288375854492, "global_step": 58528, "epoch": 1393} {"train_loss": -5.849484920501709, "global_step": 58529, "epoch": 1393} {"train_loss": -5.853694438934326, "global_step": 58530, "epoch": 1393} {"train_loss": -5.812755584716797, "global_step": 58531, "epoch": 1393} {"train_loss": -5.902823448181152, "global_step": 58532, "epoch": 1393} {"train_loss": -5.818713188171387, "global_step": 58533, "epoch": 1393} {"train_loss": -5.931503772735596, "global_step": 58534, "epoch": 1393} {"train_loss": -5.76173210144043, "global_step": 58535, "epoch": 1393} {"train_loss": -5.8183794021606445, "global_step": 58536, "epoch": 1393} {"train_loss": -5.745692253112793, "global_step": 58537, "epoch": 1393} {"train_loss": -5.99019718170166, "global_step": 58538, "epoch": 1393} {"train_loss": -5.9348063468933105, "global_step": 58539, "epoch": 1393} {"train_loss": -5.842588424682617, "global_step": 58540, "epoch": 1393} {"train_loss": -5.857311725616455, "global_step": 58541, "epoch": 1393} {"train_loss": -5.8474531173706055, "global_step": 58542, "epoch": 1393} {"train_loss": -5.856932640075684, "global_step": 58543, "epoch": 1393} {"train_loss": -5.827854156494141, "global_step": 58544, "epoch": 1393} {"train_loss": -5.815791130065918, "global_step": 58545, "epoch": 1393} {"train_loss": -5.89176607131958, "global_step": 58546, "epoch": 1393} {"train_loss": -5.866608699162801, "global_step": 58547, "epoch": 1393, "val_loss": 61766.5546875} {"train_loss": -5.692596912384033, "global_step": 58548, "epoch": 1394} {"train_loss": -5.834033489227295, "global_step": 58549, "epoch": 1394} {"train_loss": -5.69997501373291, "global_step": 58550, "epoch": 1394} {"train_loss": -5.928316116333008, "global_step": 58551, "epoch": 1394} {"train_loss": -5.813157081604004, "global_step": 58552, "epoch": 1394} {"train_loss": -5.802716255187988, "global_step": 58553, "epoch": 1394} {"train_loss": -5.932888507843018, "global_step": 58554, "epoch": 1394} {"train_loss": -5.833032608032227, "global_step": 58555, "epoch": 1394} {"train_loss": -5.796930313110352, "global_step": 58556, "epoch": 1394} {"train_loss": -5.856010913848877, "global_step": 58557, "epoch": 1394} {"train_loss": -5.830461502075195, "global_step": 58558, "epoch": 1394} {"train_loss": -5.912210464477539, "global_step": 58559, "epoch": 1394} {"train_loss": -5.767319679260254, "global_step": 58560, "epoch": 1394} {"train_loss": -5.871662616729736, "global_step": 58561, "epoch": 1394} {"train_loss": -5.772440433502197, "global_step": 58562, "epoch": 1394} {"train_loss": -5.919864177703857, "global_step": 58563, "epoch": 1394} {"train_loss": -5.919610023498535, "global_step": 58564, "epoch": 1394} {"train_loss": -5.7991414070129395, "global_step": 58565, "epoch": 1394} {"train_loss": -5.820957183837891, "global_step": 58566, "epoch": 1394} {"train_loss": -5.974481582641602, "global_step": 58567, "epoch": 1394} {"train_loss": -5.9298095703125, "global_step": 58568, "epoch": 1394} {"train_loss": -5.915291786193848, "global_step": 58569, "epoch": 1394} {"train_loss": -5.907732009887695, "global_step": 58570, "epoch": 1394} {"train_loss": -5.967400550842285, "global_step": 58571, "epoch": 1394} {"train_loss": -5.794532775878906, "global_step": 58572, "epoch": 1394} {"train_loss": -5.787224769592285, "global_step": 58573, "epoch": 1394} {"train_loss": -5.945866584777832, "global_step": 58574, "epoch": 1394} {"train_loss": -5.807917594909668, "global_step": 58575, "epoch": 1394} {"train_loss": -5.981396198272705, "global_step": 58576, "epoch": 1394} {"train_loss": -5.995466232299805, "global_step": 58577, "epoch": 1394} {"train_loss": -5.998421669006348, "global_step": 58578, "epoch": 1394} {"train_loss": -5.869935989379883, "global_step": 58579, "epoch": 1394} {"train_loss": -5.978303909301758, "global_step": 58580, "epoch": 1394} {"train_loss": -6.0110015869140625, "global_step": 58581, "epoch": 1394} {"train_loss": -5.896651268005371, "global_step": 58582, "epoch": 1394} {"train_loss": -5.891332149505615, "global_step": 58583, "epoch": 1394} {"train_loss": -5.920002460479736, "global_step": 58584, "epoch": 1394} {"train_loss": -5.883857727050781, "global_step": 58585, "epoch": 1394} {"train_loss": -5.923333644866943, "global_step": 58586, "epoch": 1394} {"train_loss": -5.773624420166016, "global_step": 58587, "epoch": 1394} {"train_loss": -5.846224784851074, "global_step": 58588, "epoch": 1394} {"train_loss": -5.874820743288312, "global_step": 58589, "epoch": 1394, "val_loss": 61437.31640625} {"train_loss": -5.80430793762207, "global_step": 58590, "epoch": 1395} {"train_loss": -5.804445743560791, "global_step": 58591, "epoch": 1395} {"train_loss": -5.893259048461914, "global_step": 58592, "epoch": 1395} {"train_loss": -5.832167148590088, "global_step": 58593, "epoch": 1395} {"train_loss": -5.826837062835693, "global_step": 58594, "epoch": 1395} {"train_loss": -5.93441104888916, "global_step": 58595, "epoch": 1395} {"train_loss": -5.8032684326171875, "global_step": 58596, "epoch": 1395} {"train_loss": -5.789621353149414, "global_step": 58597, "epoch": 1395} {"train_loss": -5.746528625488281, "global_step": 58598, "epoch": 1395} {"train_loss": -5.931507110595703, "global_step": 58599, "epoch": 1395} {"train_loss": -5.945408821105957, "global_step": 58600, "epoch": 1395} {"train_loss": -5.929574966430664, "global_step": 58601, "epoch": 1395} {"train_loss": -5.863794326782227, "global_step": 58602, "epoch": 1395} {"train_loss": -5.921348571777344, "global_step": 58603, "epoch": 1395} {"train_loss": -5.856560230255127, "global_step": 58604, "epoch": 1395} {"train_loss": -5.747159481048584, "global_step": 58605, "epoch": 1395} {"train_loss": -5.946264266967773, "global_step": 58606, "epoch": 1395} {"train_loss": -5.808029651641846, "global_step": 58607, "epoch": 1395} {"train_loss": -5.943541526794434, "global_step": 58608, "epoch": 1395} {"train_loss": -5.889406681060791, "global_step": 58609, "epoch": 1395} {"train_loss": -5.932180404663086, "global_step": 58610, "epoch": 1395} {"train_loss": -5.863582611083984, "global_step": 58611, "epoch": 1395} {"train_loss": -5.929974555969238, "global_step": 58612, "epoch": 1395} {"train_loss": -5.829820156097412, "global_step": 58613, "epoch": 1395} {"train_loss": -5.8220930099487305, "global_step": 58614, "epoch": 1395} {"train_loss": -5.658756256103516, "global_step": 58615, "epoch": 1395} {"train_loss": -5.828230857849121, "global_step": 58616, "epoch": 1395} {"train_loss": -5.909359931945801, "global_step": 58617, "epoch": 1395} {"train_loss": -5.777926921844482, "global_step": 58618, "epoch": 1395} {"train_loss": -5.9199066162109375, "global_step": 58619, "epoch": 1395} {"train_loss": -5.907876968383789, "global_step": 58620, "epoch": 1395} {"train_loss": -5.8359575271606445, "global_step": 58621, "epoch": 1395} {"train_loss": -5.812463760375977, "global_step": 58622, "epoch": 1395} {"train_loss": -5.890445709228516, "global_step": 58623, "epoch": 1395} {"train_loss": -5.864799499511719, "global_step": 58624, "epoch": 1395} {"train_loss": -5.8701701164245605, "global_step": 58625, "epoch": 1395} {"train_loss": -5.690569877624512, "global_step": 58626, "epoch": 1395} {"train_loss": -5.873195648193359, "global_step": 58627, "epoch": 1395} {"train_loss": -5.882109642028809, "global_step": 58628, "epoch": 1395} {"train_loss": -5.8335723876953125, "global_step": 58629, "epoch": 1395} {"train_loss": -5.902266979217529, "global_step": 58630, "epoch": 1395} {"train_loss": -5.85485517411005, "global_step": 58631, "epoch": 1395, "val_loss": 61387.4453125} {"train_loss": -5.8348002433776855, "global_step": 58632, "epoch": 1396} {"train_loss": -5.820400238037109, "global_step": 58633, "epoch": 1396} {"train_loss": -5.976729393005371, "global_step": 58634, "epoch": 1396} {"train_loss": -5.855069160461426, "global_step": 58635, "epoch": 1396} {"train_loss": -5.802117824554443, "global_step": 58636, "epoch": 1396} {"train_loss": -5.7732086181640625, "global_step": 58637, "epoch": 1396} {"train_loss": -5.767607688903809, "global_step": 58638, "epoch": 1396} {"train_loss": -5.981008052825928, "global_step": 58639, "epoch": 1396} {"train_loss": -5.763308525085449, "global_step": 58640, "epoch": 1396} {"train_loss": -5.881009101867676, "global_step": 58641, "epoch": 1396} {"train_loss": -5.942498683929443, "global_step": 58642, "epoch": 1396} {"train_loss": -5.854653358459473, "global_step": 58643, "epoch": 1396} {"train_loss": -5.97630500793457, "global_step": 58644, "epoch": 1396} {"train_loss": -5.858753204345703, "global_step": 58645, "epoch": 1396} {"train_loss": -5.808723449707031, "global_step": 58646, "epoch": 1396} {"train_loss": -5.84573221206665, "global_step": 58647, "epoch": 1396} {"train_loss": -5.76202392578125, "global_step": 58648, "epoch": 1396} {"train_loss": -5.984119415283203, "global_step": 58649, "epoch": 1396} {"train_loss": -5.826041221618652, "global_step": 58650, "epoch": 1396} {"train_loss": -5.9238600730896, "global_step": 58651, "epoch": 1396} {"train_loss": -5.979117393493652, "global_step": 58652, "epoch": 1396} {"train_loss": -5.935272216796875, "global_step": 58653, "epoch": 1396} {"train_loss": -5.936175346374512, "global_step": 58654, "epoch": 1396} {"train_loss": -5.870433807373047, "global_step": 58655, "epoch": 1396} {"train_loss": -5.7139387130737305, "global_step": 58656, "epoch": 1396} {"train_loss": -5.889314651489258, "global_step": 58657, "epoch": 1396} {"train_loss": -5.90096378326416, "global_step": 58658, "epoch": 1396} {"train_loss": -5.824316024780273, "global_step": 58659, "epoch": 1396} {"train_loss": -5.7997894287109375, "global_step": 58660, "epoch": 1396} {"train_loss": -5.74558162689209, "global_step": 58661, "epoch": 1396} {"train_loss": -5.856605529785156, "global_step": 58662, "epoch": 1396} {"train_loss": -5.807281494140625, "global_step": 58663, "epoch": 1396} {"train_loss": -5.8787431716918945, "global_step": 58664, "epoch": 1396} {"train_loss": -5.844709396362305, "global_step": 58665, "epoch": 1396} {"train_loss": -5.879207611083984, "global_step": 58666, "epoch": 1396} {"train_loss": -5.980059623718262, "global_step": 58667, "epoch": 1396} {"train_loss": -5.7799787521362305, "global_step": 58668, "epoch": 1396} {"train_loss": -5.846639633178711, "global_step": 58669, "epoch": 1396} {"train_loss": -5.914990425109863, "global_step": 58670, "epoch": 1396} {"train_loss": -5.7902936935424805, "global_step": 58671, "epoch": 1396} {"train_loss": -5.833460807800293, "global_step": 58672, "epoch": 1396} {"train_loss": -5.857790742601667, "global_step": 58673, "epoch": 1396, "val_loss": 61547.859375} {"train_loss": -5.901758670806885, "global_step": 58674, "epoch": 1397} {"train_loss": -5.886650085449219, "global_step": 58675, "epoch": 1397} {"train_loss": -5.9858503341674805, "global_step": 58676, "epoch": 1397} {"train_loss": -5.881122589111328, "global_step": 58677, "epoch": 1397} {"train_loss": -5.9067158699035645, "global_step": 58678, "epoch": 1397} {"train_loss": -5.934045791625977, "global_step": 58679, "epoch": 1397} {"train_loss": -5.784942150115967, "global_step": 58680, "epoch": 1397} {"train_loss": -5.9721832275390625, "global_step": 58681, "epoch": 1397} {"train_loss": -5.814209938049316, "global_step": 58682, "epoch": 1397} {"train_loss": -5.819490432739258, "global_step": 58683, "epoch": 1397} {"train_loss": -6.019710540771484, "global_step": 58684, "epoch": 1397} {"train_loss": -5.834140777587891, "global_step": 58685, "epoch": 1397} {"train_loss": -6.02235221862793, "global_step": 58686, "epoch": 1397} {"train_loss": -5.884088516235352, "global_step": 58687, "epoch": 1397} {"train_loss": -5.881386756896973, "global_step": 58688, "epoch": 1397} {"train_loss": -5.909648895263672, "global_step": 58689, "epoch": 1397} {"train_loss": -5.865946292877197, "global_step": 58690, "epoch": 1397} {"train_loss": -5.758224964141846, "global_step": 58691, "epoch": 1397} {"train_loss": -5.945239067077637, "global_step": 58692, "epoch": 1397} {"train_loss": -5.807088851928711, "global_step": 58693, "epoch": 1397} {"train_loss": -5.833146095275879, "global_step": 58694, "epoch": 1397} {"train_loss": -5.86713171005249, "global_step": 58695, "epoch": 1397} {"train_loss": -5.741610527038574, "global_step": 58696, "epoch": 1397} {"train_loss": -5.853985786437988, "global_step": 58697, "epoch": 1397} {"train_loss": -5.9174652099609375, "global_step": 58698, "epoch": 1397} {"train_loss": -5.864073276519775, "global_step": 58699, "epoch": 1397} {"train_loss": -5.775420188903809, "global_step": 58700, "epoch": 1397} {"train_loss": -5.859760284423828, "global_step": 58701, "epoch": 1397} {"train_loss": -5.921401500701904, "global_step": 58702, "epoch": 1397} {"train_loss": -5.841039180755615, "global_step": 58703, "epoch": 1397} {"train_loss": -5.955035209655762, "global_step": 58704, "epoch": 1397} {"train_loss": -5.6490888595581055, "global_step": 58705, "epoch": 1397} {"train_loss": -5.879931449890137, "global_step": 58706, "epoch": 1397} {"train_loss": -5.7680206298828125, "global_step": 58707, "epoch": 1397} {"train_loss": -5.853450298309326, "global_step": 58708, "epoch": 1397} {"train_loss": -5.840825080871582, "global_step": 58709, "epoch": 1397} {"train_loss": -5.920444011688232, "global_step": 58710, "epoch": 1397} {"train_loss": -5.879222869873047, "global_step": 58711, "epoch": 1397} {"train_loss": -5.855720520019531, "global_step": 58712, "epoch": 1397} {"train_loss": -5.826226234436035, "global_step": 58713, "epoch": 1397} {"train_loss": -5.807991027832031, "global_step": 58714, "epoch": 1397} {"train_loss": -5.865257683254423, "global_step": 58715, "epoch": 1397, "val_loss": 61386.50390625} {"train_loss": -5.770148277282715, "global_step": 58716, "epoch": 1398} {"train_loss": -5.886183738708496, "global_step": 58717, "epoch": 1398} {"train_loss": -5.870946407318115, "global_step": 58718, "epoch": 1398} {"train_loss": -5.915624618530273, "global_step": 58719, "epoch": 1398} {"train_loss": -5.951366424560547, "global_step": 58720, "epoch": 1398} {"train_loss": -5.953340530395508, "global_step": 58721, "epoch": 1398} {"train_loss": -5.917601108551025, "global_step": 58722, "epoch": 1398} {"train_loss": -5.9509172439575195, "global_step": 58723, "epoch": 1398} {"train_loss": -5.805848121643066, "global_step": 58724, "epoch": 1398} {"train_loss": -5.863171100616455, "global_step": 58725, "epoch": 1398} {"train_loss": -5.949633598327637, "global_step": 58726, "epoch": 1398} {"train_loss": -5.892473220825195, "global_step": 58727, "epoch": 1398} {"train_loss": -5.816272735595703, "global_step": 58728, "epoch": 1398} {"train_loss": -5.958501815795898, "global_step": 58729, "epoch": 1398} {"train_loss": -5.92794942855835, "global_step": 58730, "epoch": 1398} {"train_loss": -5.8055524826049805, "global_step": 58731, "epoch": 1398} {"train_loss": -5.9398088455200195, "global_step": 58732, "epoch": 1398} {"train_loss": -5.963503837585449, "global_step": 58733, "epoch": 1398} {"train_loss": -5.829297065734863, "global_step": 58734, "epoch": 1398} {"train_loss": -5.930402755737305, "global_step": 58735, "epoch": 1398} {"train_loss": -5.985199928283691, "global_step": 58736, "epoch": 1398} {"train_loss": -5.841347694396973, "global_step": 58737, "epoch": 1398} {"train_loss": -5.912629127502441, "global_step": 58738, "epoch": 1398} {"train_loss": -5.851531028747559, "global_step": 58739, "epoch": 1398} {"train_loss": -5.961714744567871, "global_step": 58740, "epoch": 1398} {"train_loss": -6.028810977935791, "global_step": 58741, "epoch": 1398} {"train_loss": -5.814595699310303, "global_step": 58742, "epoch": 1398} {"train_loss": -5.80190372467041, "global_step": 58743, "epoch": 1398} {"train_loss": -5.835029125213623, "global_step": 58744, "epoch": 1398} {"train_loss": -5.850951671600342, "global_step": 58745, "epoch": 1398} {"train_loss": -5.929990291595459, "global_step": 58746, "epoch": 1398} {"train_loss": -5.833515644073486, "global_step": 58747, "epoch": 1398} {"train_loss": -5.993567943572998, "global_step": 58748, "epoch": 1398} {"train_loss": -6.008711814880371, "global_step": 58749, "epoch": 1398} {"train_loss": -5.8500895500183105, "global_step": 58750, "epoch": 1398} {"train_loss": -5.915232181549072, "global_step": 58751, "epoch": 1398} {"train_loss": -5.838453769683838, "global_step": 58752, "epoch": 1398} {"train_loss": -6.009988784790039, "global_step": 58753, "epoch": 1398} {"train_loss": -5.820896148681641, "global_step": 58754, "epoch": 1398} {"train_loss": -5.806972980499268, "global_step": 58755, "epoch": 1398} {"train_loss": -5.838120460510254, "global_step": 58756, "epoch": 1398} {"train_loss": -5.89319170088995, "global_step": 58757, "epoch": 1398, "val_loss": 61403.95703125} {"train_loss": -5.868295669555664, "global_step": 58758, "epoch": 1399} {"train_loss": -5.778826713562012, "global_step": 58759, "epoch": 1399} {"train_loss": -5.736409664154053, "global_step": 58760, "epoch": 1399} {"train_loss": -5.975111961364746, "global_step": 58761, "epoch": 1399} {"train_loss": -5.842661380767822, "global_step": 58762, "epoch": 1399} {"train_loss": -5.879934787750244, "global_step": 58763, "epoch": 1399} {"train_loss": -5.918890476226807, "global_step": 58764, "epoch": 1399} {"train_loss": -5.792247295379639, "global_step": 58765, "epoch": 1399} {"train_loss": -5.883464813232422, "global_step": 58766, "epoch": 1399} {"train_loss": -5.892752647399902, "global_step": 58767, "epoch": 1399} {"train_loss": -5.8849945068359375, "global_step": 58768, "epoch": 1399} {"train_loss": -5.840027809143066, "global_step": 58769, "epoch": 1399} {"train_loss": -5.886760234832764, "global_step": 58770, "epoch": 1399} {"train_loss": -5.956366539001465, "global_step": 58771, "epoch": 1399} {"train_loss": -5.902016639709473, "global_step": 58772, "epoch": 1399} {"train_loss": -5.981594085693359, "global_step": 58773, "epoch": 1399} {"train_loss": -5.8636651039123535, "global_step": 58774, "epoch": 1399} {"train_loss": -5.9269280433654785, "global_step": 58775, "epoch": 1399} {"train_loss": -5.887100696563721, "global_step": 58776, "epoch": 1399} {"train_loss": -5.892973899841309, "global_step": 58777, "epoch": 1399} {"train_loss": -5.901068210601807, "global_step": 58778, "epoch": 1399} {"train_loss": -5.828123569488525, "global_step": 58779, "epoch": 1399} {"train_loss": -5.835163116455078, "global_step": 58780, "epoch": 1399} {"train_loss": -5.795346260070801, "global_step": 58781, "epoch": 1399} {"train_loss": -5.857729434967041, "global_step": 58782, "epoch": 1399} {"train_loss": -5.818190574645996, "global_step": 58783, "epoch": 1399} {"train_loss": -5.890195369720459, "global_step": 58784, "epoch": 1399} {"train_loss": -5.9264044761657715, "global_step": 58785, "epoch": 1399} {"train_loss": -5.924230575561523, "global_step": 58786, "epoch": 1399} {"train_loss": -6.022663593292236, "global_step": 58787, "epoch": 1399} {"train_loss": -5.914572715759277, "global_step": 58788, "epoch": 1399} {"train_loss": -6.004776954650879, "global_step": 58789, "epoch": 1399} {"train_loss": -5.949215888977051, "global_step": 58790, "epoch": 1399} {"train_loss": -5.901033878326416, "global_step": 58791, "epoch": 1399} {"train_loss": -5.925594806671143, "global_step": 58792, "epoch": 1399} {"train_loss": -6.012262344360352, "global_step": 58793, "epoch": 1399} {"train_loss": -5.893518447875977, "global_step": 58794, "epoch": 1399} {"train_loss": -5.87616491317749, "global_step": 58795, "epoch": 1399} {"train_loss": -5.934304237365723, "global_step": 58796, "epoch": 1399} {"train_loss": -5.9825029373168945, "global_step": 58797, "epoch": 1399} {"train_loss": -5.901474952697754, "global_step": 58798, "epoch": 1399} {"train_loss": -5.897160677682786, "global_step": 58799, "epoch": 1399, "val_loss": 61609.90234375} {"train_loss": -5.792925834655762, "global_step": 58800, "epoch": 1400} {"train_loss": -5.942131996154785, "global_step": 58801, "epoch": 1400} {"train_loss": -6.001245498657227, "global_step": 58802, "epoch": 1400} {"train_loss": -5.822573661804199, "global_step": 58803, "epoch": 1400} {"train_loss": -5.932645797729492, "global_step": 58804, "epoch": 1400} {"train_loss": -5.865788459777832, "global_step": 58805, "epoch": 1400} {"train_loss": -5.8397064208984375, "global_step": 58806, "epoch": 1400} {"train_loss": -5.963100433349609, "global_step": 58807, "epoch": 1400} {"train_loss": -5.889605522155762, "global_step": 58808, "epoch": 1400} {"train_loss": -5.847801208496094, "global_step": 58809, "epoch": 1400} {"train_loss": -5.845648288726807, "global_step": 58810, "epoch": 1400} {"train_loss": -5.950019359588623, "global_step": 58811, "epoch": 1400} {"train_loss": -5.944982528686523, "global_step": 58812, "epoch": 1400} {"train_loss": -5.939199447631836, "global_step": 58813, "epoch": 1400} {"train_loss": -5.903618812561035, "global_step": 58814, "epoch": 1400} {"train_loss": -5.933754920959473, "global_step": 58815, "epoch": 1400} {"train_loss": -5.925723075866699, "global_step": 58816, "epoch": 1400} {"train_loss": -5.820508003234863, "global_step": 58817, "epoch": 1400} {"train_loss": -5.933097839355469, "global_step": 58818, "epoch": 1400} {"train_loss": -5.834569931030273, "global_step": 58819, "epoch": 1400} {"train_loss": -5.88162899017334, "global_step": 58820, "epoch": 1400} {"train_loss": -5.853350639343262, "global_step": 58821, "epoch": 1400} {"train_loss": -5.754509925842285, "global_step": 58822, "epoch": 1400} {"train_loss": -5.7831926345825195, "global_step": 58823, "epoch": 1400} {"train_loss": -5.920437812805176, "global_step": 58824, "epoch": 1400} {"train_loss": -5.723637580871582, "global_step": 58825, "epoch": 1400} {"train_loss": -5.687041282653809, "global_step": 58826, "epoch": 1400} {"train_loss": -5.904706954956055, "global_step": 58827, "epoch": 1400} {"train_loss": -5.729047775268555, "global_step": 58828, "epoch": 1400} {"train_loss": -5.819523811340332, "global_step": 58829, "epoch": 1400} {"train_loss": -5.937836170196533, "global_step": 58830, "epoch": 1400} {"train_loss": -5.73331356048584, "global_step": 58831, "epoch": 1400} {"train_loss": -5.910192489624023, "global_step": 58832, "epoch": 1400} {"train_loss": -5.87030553817749, "global_step": 58833, "epoch": 1400} {"train_loss": -5.830376148223877, "global_step": 58834, "epoch": 1400} {"train_loss": -5.7199201583862305, "global_step": 58835, "epoch": 1400} {"train_loss": -5.9285054206848145, "global_step": 58836, "epoch": 1400} {"train_loss": -5.722464084625244, "global_step": 58837, "epoch": 1400} {"train_loss": -5.902221202850342, "global_step": 58838, "epoch": 1400} {"train_loss": -5.843381404876709, "global_step": 58839, "epoch": 1400} {"train_loss": -5.895168304443359, "global_step": 58840, "epoch": 1400} {"train_loss": -5.862159638177781, "global_step": 58841, "epoch": 1400, "train/sim_max_reward_0": 0.2878775350126073, "train/sim_max_reward_1": 0.40061466980936616, "train/sim_max_reward_2": 0.5424553709977855, "train/sim_max_reward_3": 0.15317493401740367, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8422812953690226, "test/sim_max_reward_4300001": 0.3156846910398643, "test/sim_max_reward_4300002": 0.9551975910444128, "test/sim_max_reward_4300003": 0.7611050692027116, "test/sim_max_reward_4300004": 0.42300908736691883, "test/sim_max_reward_4300005": 0.7764105159497835, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3085064087414552, "test/sim_max_reward_4300008": 0.5059233628120775, "test/sim_max_reward_4300009": 0.8059987292308588, "test/sim_max_reward_4300010": 0.11718242782390002, "test/sim_max_reward_4300011": 0.9298896835727692, "test/sim_max_reward_4300012": 0.3836204036448256, "test/sim_max_reward_4300013": 0.7149706828288523, "test/sim_max_reward_4300014": 0.903632046544763, "test/sim_max_reward_4300015": 0.7964443454510945, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.5462443294140081, "test/sim_max_reward_4300018": 0.41727924901271063, "test/sim_max_reward_4300019": 0.18594230954471033, "test/sim_max_reward_4300020": 0.7475426868505924, "test/sim_max_reward_4300021": 0.7677484923785737, "test/sim_max_reward_4300022": 0.7208030061043715, "test/sim_max_reward_4300023": 0.335752473859592, "test/sim_max_reward_4300024": 0.45381504142828416, "test/sim_max_reward_4300025": 0.75833660238354, "test/sim_max_reward_4300026": 0.16706253914802022, "test/sim_max_reward_4300027": 0.717030905100918, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.2134284275322783, "test/sim_max_reward_4300030": 0.8877548514888042, "test/sim_max_reward_4300031": 0.25399702968519255, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.543096657355992, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.6786991656508743, "test/sim_max_reward_4300038": 0.8638209940386941, "test/sim_max_reward_4300039": 0.8542134991472091, "test/sim_max_reward_4300040": 0.30910808578340754, "test/sim_max_reward_4300041": 0.919823375427111, "test/sim_max_reward_4300042": 0.5992657076037546, "test/sim_max_reward_4300043": 0.06090880000144952, "test/sim_max_reward_4300044": 0.7815307444629137, "test/sim_max_reward_4300045": 0.1702223066572756, "test/sim_max_reward_4300046": 0.16858270501962377, "test/sim_max_reward_4300047": 0.12282322296416812, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.27224204557095266, "train/mean_score": 0.4295178781998917, "test/mean_score": 0.48512251419603625, "val_loss": 61432.7734375} {"train_loss": -5.745936393737793, "global_step": 58842, "epoch": 1401} {"train_loss": -5.969052791595459, "global_step": 58843, "epoch": 1401} {"train_loss": -5.921952247619629, "global_step": 58844, "epoch": 1401} {"train_loss": -6.0235185623168945, "global_step": 58845, "epoch": 1401} {"train_loss": -5.793102741241455, "global_step": 58846, "epoch": 1401} {"train_loss": -6.00821590423584, "global_step": 58847, "epoch": 1401} {"train_loss": -5.95038366317749, "global_step": 58848, "epoch": 1401} {"train_loss": -5.827834129333496, "global_step": 58849, "epoch": 1401} {"train_loss": -5.8933796882629395, "global_step": 58850, "epoch": 1401} {"train_loss": -5.8451032638549805, "global_step": 58851, "epoch": 1401} {"train_loss": -5.910882949829102, "global_step": 58852, "epoch": 1401} {"train_loss": -5.930559158325195, "global_step": 58853, "epoch": 1401} {"train_loss": -5.895726203918457, "global_step": 58854, "epoch": 1401} {"train_loss": -5.989105224609375, "global_step": 58855, "epoch": 1401} {"train_loss": -5.844058036804199, "global_step": 58856, "epoch": 1401} {"train_loss": -5.932060718536377, "global_step": 58857, "epoch": 1401} {"train_loss": -5.8183979988098145, "global_step": 58858, "epoch": 1401} {"train_loss": -5.959488868713379, "global_step": 58859, "epoch": 1401} {"train_loss": -5.961254119873047, "global_step": 58860, "epoch": 1401} {"train_loss": -5.9145684242248535, "global_step": 58861, "epoch": 1401} {"train_loss": -5.914707183837891, "global_step": 58862, "epoch": 1401} {"train_loss": -5.890560150146484, "global_step": 58863, "epoch": 1401} {"train_loss": -5.883891582489014, "global_step": 58864, "epoch": 1401} {"train_loss": -6.014880180358887, "global_step": 58865, "epoch": 1401} {"train_loss": -5.970880031585693, "global_step": 58866, "epoch": 1401} {"train_loss": -5.942013740539551, "global_step": 58867, "epoch": 1401} {"train_loss": -5.903992652893066, "global_step": 58868, "epoch": 1401} {"train_loss": -5.837209224700928, "global_step": 58869, "epoch": 1401} {"train_loss": -5.880771636962891, "global_step": 58870, "epoch": 1401} {"train_loss": -5.775482177734375, "global_step": 58871, "epoch": 1401} {"train_loss": -5.756021022796631, "global_step": 58872, "epoch": 1401} {"train_loss": -5.9439167976379395, "global_step": 58873, "epoch": 1401} {"train_loss": -5.944465637207031, "global_step": 58874, "epoch": 1401} {"train_loss": -5.813478469848633, "global_step": 58875, "epoch": 1401} {"train_loss": -5.893787860870361, "global_step": 58876, "epoch": 1401} {"train_loss": -5.887998104095459, "global_step": 58877, "epoch": 1401} {"train_loss": -5.93422794342041, "global_step": 58878, "epoch": 1401} {"train_loss": -5.818099498748779, "global_step": 58879, "epoch": 1401} {"train_loss": -5.876775741577148, "global_step": 58880, "epoch": 1401} {"train_loss": -5.987335205078125, "global_step": 58881, "epoch": 1401} {"train_loss": -5.915982723236084, "global_step": 58882, "epoch": 1401} {"train_loss": -5.898425715310233, "global_step": 58883, "epoch": 1401, "val_loss": 61336.359375} {"train_loss": -5.909648895263672, "global_step": 58884, "epoch": 1402} {"train_loss": -5.86984395980835, "global_step": 58885, "epoch": 1402} {"train_loss": -5.882626533508301, "global_step": 58886, "epoch": 1402} {"train_loss": -5.901803493499756, "global_step": 58887, "epoch": 1402} {"train_loss": -5.845951080322266, "global_step": 58888, "epoch": 1402} {"train_loss": -5.901198863983154, "global_step": 58889, "epoch": 1402} {"train_loss": -5.860562324523926, "global_step": 58890, "epoch": 1402} {"train_loss": -5.934383392333984, "global_step": 58891, "epoch": 1402} {"train_loss": -5.942708492279053, "global_step": 58892, "epoch": 1402} {"train_loss": -5.9569807052612305, "global_step": 58893, "epoch": 1402} {"train_loss": -5.807361602783203, "global_step": 58894, "epoch": 1402} {"train_loss": -5.853353977203369, "global_step": 58895, "epoch": 1402} {"train_loss": -5.73210334777832, "global_step": 58896, "epoch": 1402} {"train_loss": -5.924745559692383, "global_step": 58897, "epoch": 1402} {"train_loss": -5.902351379394531, "global_step": 58898, "epoch": 1402} {"train_loss": -5.790511131286621, "global_step": 58899, "epoch": 1402} {"train_loss": -5.864781379699707, "global_step": 58900, "epoch": 1402} {"train_loss": -5.735352516174316, "global_step": 58901, "epoch": 1402} {"train_loss": -5.8862199783325195, "global_step": 58902, "epoch": 1402} {"train_loss": -5.859365940093994, "global_step": 58903, "epoch": 1402} {"train_loss": -5.793705940246582, "global_step": 58904, "epoch": 1402} {"train_loss": -6.042279243469238, "global_step": 58905, "epoch": 1402} {"train_loss": -5.869332313537598, "global_step": 58906, "epoch": 1402} {"train_loss": -5.86573600769043, "global_step": 58907, "epoch": 1402} {"train_loss": -5.867025852203369, "global_step": 58908, "epoch": 1402} {"train_loss": -5.8552751541137695, "global_step": 58909, "epoch": 1402} {"train_loss": -5.887950897216797, "global_step": 58910, "epoch": 1402} {"train_loss": -5.849346160888672, "global_step": 58911, "epoch": 1402} {"train_loss": -6.02194356918335, "global_step": 58912, "epoch": 1402} {"train_loss": -5.880318641662598, "global_step": 58913, "epoch": 1402} {"train_loss": -5.980269432067871, "global_step": 58914, "epoch": 1402} {"train_loss": -5.8560075759887695, "global_step": 58915, "epoch": 1402} {"train_loss": -5.865203857421875, "global_step": 58916, "epoch": 1402} {"train_loss": -5.861577033996582, "global_step": 58917, "epoch": 1402} {"train_loss": -5.921881675720215, "global_step": 58918, "epoch": 1402} {"train_loss": -5.844160556793213, "global_step": 58919, "epoch": 1402} {"train_loss": -5.78564453125, "global_step": 58920, "epoch": 1402} {"train_loss": -5.963380336761475, "global_step": 58921, "epoch": 1402} {"train_loss": -5.829461574554443, "global_step": 58922, "epoch": 1402} {"train_loss": -6.004946708679199, "global_step": 58923, "epoch": 1402} {"train_loss": -5.78945255279541, "global_step": 58924, "epoch": 1402} {"train_loss": -5.878275144667852, "global_step": 58925, "epoch": 1402, "val_loss": 61228.953125} {"train_loss": -6.030924320220947, "global_step": 58926, "epoch": 1403} {"train_loss": -5.900485038757324, "global_step": 58927, "epoch": 1403} {"train_loss": -5.957533836364746, "global_step": 58928, "epoch": 1403} {"train_loss": -5.872878551483154, "global_step": 58929, "epoch": 1403} {"train_loss": -5.885683536529541, "global_step": 58930, "epoch": 1403} {"train_loss": -5.884835243225098, "global_step": 58931, "epoch": 1403} {"train_loss": -5.771387100219727, "global_step": 58932, "epoch": 1403} {"train_loss": -5.821767807006836, "global_step": 58933, "epoch": 1403} {"train_loss": -5.860771179199219, "global_step": 58934, "epoch": 1403} {"train_loss": -5.681401252746582, "global_step": 58935, "epoch": 1403} {"train_loss": -5.948741912841797, "global_step": 58936, "epoch": 1403} {"train_loss": -5.785484313964844, "global_step": 58937, "epoch": 1403} {"train_loss": -5.9204630851745605, "global_step": 58938, "epoch": 1403} {"train_loss": -5.869872093200684, "global_step": 58939, "epoch": 1403} {"train_loss": -5.970635414123535, "global_step": 58940, "epoch": 1403} {"train_loss": -5.891989707946777, "global_step": 58941, "epoch": 1403} {"train_loss": -5.927459716796875, "global_step": 58942, "epoch": 1403} {"train_loss": -5.788218975067139, "global_step": 58943, "epoch": 1403} {"train_loss": -5.964752674102783, "global_step": 58944, "epoch": 1403} {"train_loss": -5.92018985748291, "global_step": 58945, "epoch": 1403} {"train_loss": -5.835248947143555, "global_step": 58946, "epoch": 1403} {"train_loss": -6.092469215393066, "global_step": 58947, "epoch": 1403} {"train_loss": -6.045316696166992, "global_step": 58948, "epoch": 1403} {"train_loss": -5.9228901863098145, "global_step": 58949, "epoch": 1403} {"train_loss": -5.849662780761719, "global_step": 58950, "epoch": 1403} {"train_loss": -5.908404350280762, "global_step": 58951, "epoch": 1403} {"train_loss": -5.889651775360107, "global_step": 58952, "epoch": 1403} {"train_loss": -5.920792579650879, "global_step": 58953, "epoch": 1403} {"train_loss": -5.871549606323242, "global_step": 58954, "epoch": 1403} {"train_loss": -5.8197126388549805, "global_step": 58955, "epoch": 1403} {"train_loss": -5.943544387817383, "global_step": 58956, "epoch": 1403} {"train_loss": -5.8737006187438965, "global_step": 58957, "epoch": 1403} {"train_loss": -5.809212684631348, "global_step": 58958, "epoch": 1403} {"train_loss": -5.908196449279785, "global_step": 58959, "epoch": 1403} {"train_loss": -5.8636674880981445, "global_step": 58960, "epoch": 1403} {"train_loss": -5.960203170776367, "global_step": 58961, "epoch": 1403} {"train_loss": -5.966156959533691, "global_step": 58962, "epoch": 1403} {"train_loss": -5.826580047607422, "global_step": 58963, "epoch": 1403} {"train_loss": -5.929793357849121, "global_step": 58964, "epoch": 1403} {"train_loss": -5.828066825866699, "global_step": 58965, "epoch": 1403} {"train_loss": -5.979037284851074, "global_step": 58966, "epoch": 1403} {"train_loss": -5.8965430827367875, "global_step": 58967, "epoch": 1403, "val_loss": 61671.5078125} {"train_loss": -5.764786720275879, "global_step": 58968, "epoch": 1404} {"train_loss": -5.841656684875488, "global_step": 58969, "epoch": 1404} {"train_loss": -5.929323196411133, "global_step": 58970, "epoch": 1404} {"train_loss": -5.876049995422363, "global_step": 58971, "epoch": 1404} {"train_loss": -5.894151210784912, "global_step": 58972, "epoch": 1404} {"train_loss": -5.799160480499268, "global_step": 58973, "epoch": 1404} {"train_loss": -5.892961502075195, "global_step": 58974, "epoch": 1404} {"train_loss": -5.9177141189575195, "global_step": 58975, "epoch": 1404} {"train_loss": -5.850308418273926, "global_step": 58976, "epoch": 1404} {"train_loss": -5.868552207946777, "global_step": 58977, "epoch": 1404} {"train_loss": -5.630370140075684, "global_step": 58978, "epoch": 1404} {"train_loss": -5.789307117462158, "global_step": 58979, "epoch": 1404} {"train_loss": -5.825313568115234, "global_step": 58980, "epoch": 1404} {"train_loss": -5.941261291503906, "global_step": 58981, "epoch": 1404} {"train_loss": -5.91475772857666, "global_step": 58982, "epoch": 1404} {"train_loss": -5.779500484466553, "global_step": 58983, "epoch": 1404} {"train_loss": -5.934991836547852, "global_step": 58984, "epoch": 1404} {"train_loss": -5.818894863128662, "global_step": 58985, "epoch": 1404} {"train_loss": -5.8007893562316895, "global_step": 58986, "epoch": 1404} {"train_loss": -5.837306022644043, "global_step": 58987, "epoch": 1404} {"train_loss": -5.786522388458252, "global_step": 58988, "epoch": 1404} {"train_loss": -5.899641036987305, "global_step": 58989, "epoch": 1404} {"train_loss": -5.95449161529541, "global_step": 58990, "epoch": 1404} {"train_loss": -5.917231559753418, "global_step": 58991, "epoch": 1404} {"train_loss": -5.91555118560791, "global_step": 58992, "epoch": 1404} {"train_loss": -5.8764567375183105, "global_step": 58993, "epoch": 1404} {"train_loss": -5.8177490234375, "global_step": 58994, "epoch": 1404} {"train_loss": -5.99271297454834, "global_step": 58995, "epoch": 1404} {"train_loss": -5.910729885101318, "global_step": 58996, "epoch": 1404} {"train_loss": -5.826148986816406, "global_step": 58997, "epoch": 1404} {"train_loss": -5.866503715515137, "global_step": 58998, "epoch": 1404} {"train_loss": -5.980587005615234, "global_step": 58999, "epoch": 1404} {"train_loss": -5.807572364807129, "global_step": 59000, "epoch": 1404} {"train_loss": -5.983902454376221, "global_step": 59001, "epoch": 1404} {"train_loss": -5.876974582672119, "global_step": 59002, "epoch": 1404} {"train_loss": -6.0034098625183105, "global_step": 59003, "epoch": 1404} {"train_loss": -5.87980842590332, "global_step": 59004, "epoch": 1404} {"train_loss": -5.850873947143555, "global_step": 59005, "epoch": 1404} {"train_loss": -6.011013031005859, "global_step": 59006, "epoch": 1404} {"train_loss": -5.939201354980469, "global_step": 59007, "epoch": 1404} {"train_loss": -5.912988185882568, "global_step": 59008, "epoch": 1404} {"train_loss": -5.875891095116025, "global_step": 59009, "epoch": 1404, "val_loss": 61313.6875} {"train_loss": -6.026602745056152, "global_step": 59010, "epoch": 1405} {"train_loss": -5.840305805206299, "global_step": 59011, "epoch": 1405} {"train_loss": -6.013389587402344, "global_step": 59012, "epoch": 1405} {"train_loss": -5.878776550292969, "global_step": 59013, "epoch": 1405} {"train_loss": -5.8225417137146, "global_step": 59014, "epoch": 1405} {"train_loss": -5.896341323852539, "global_step": 59015, "epoch": 1405} {"train_loss": -5.91478157043457, "global_step": 59016, "epoch": 1405} {"train_loss": -5.780274391174316, "global_step": 59017, "epoch": 1405} {"train_loss": -5.868454456329346, "global_step": 59018, "epoch": 1405} {"train_loss": -5.813448905944824, "global_step": 59019, "epoch": 1405} {"train_loss": -5.747952461242676, "global_step": 59020, "epoch": 1405} {"train_loss": -5.942566871643066, "global_step": 59021, "epoch": 1405} {"train_loss": -5.672888278961182, "global_step": 59022, "epoch": 1405} {"train_loss": -5.8382978439331055, "global_step": 59023, "epoch": 1405} {"train_loss": -5.976983070373535, "global_step": 59024, "epoch": 1405} {"train_loss": -5.821211814880371, "global_step": 59025, "epoch": 1405} {"train_loss": -5.752983093261719, "global_step": 59026, "epoch": 1405} {"train_loss": -5.925013542175293, "global_step": 59027, "epoch": 1405} {"train_loss": -5.791962146759033, "global_step": 59028, "epoch": 1405} {"train_loss": -5.901150703430176, "global_step": 59029, "epoch": 1405} {"train_loss": -5.812322616577148, "global_step": 59030, "epoch": 1405} {"train_loss": -5.890088081359863, "global_step": 59031, "epoch": 1405} {"train_loss": -5.94896125793457, "global_step": 59032, "epoch": 1405} {"train_loss": -5.844305038452148, "global_step": 59033, "epoch": 1405} {"train_loss": -5.859905242919922, "global_step": 59034, "epoch": 1405} {"train_loss": -5.986075401306152, "global_step": 59035, "epoch": 1405} {"train_loss": -5.893571853637695, "global_step": 59036, "epoch": 1405} {"train_loss": -5.935179710388184, "global_step": 59037, "epoch": 1405} {"train_loss": -5.902988433837891, "global_step": 59038, "epoch": 1405} {"train_loss": -5.875847816467285, "global_step": 59039, "epoch": 1405} {"train_loss": -5.859665393829346, "global_step": 59040, "epoch": 1405} {"train_loss": -5.991583347320557, "global_step": 59041, "epoch": 1405} {"train_loss": -5.916199207305908, "global_step": 59042, "epoch": 1405} {"train_loss": -5.913300514221191, "global_step": 59043, "epoch": 1405} {"train_loss": -5.8903913497924805, "global_step": 59044, "epoch": 1405} {"train_loss": -5.929925918579102, "global_step": 59045, "epoch": 1405} {"train_loss": -5.928788185119629, "global_step": 59046, "epoch": 1405} {"train_loss": -5.891537189483643, "global_step": 59047, "epoch": 1405} {"train_loss": -5.907040596008301, "global_step": 59048, "epoch": 1405} {"train_loss": -5.883260250091553, "global_step": 59049, "epoch": 1405} {"train_loss": -5.852710723876953, "global_step": 59050, "epoch": 1405} {"train_loss": -5.881311779930478, "global_step": 59051, "epoch": 1405, "val_loss": 61323.25390625} {"train_loss": -5.959225654602051, "global_step": 59052, "epoch": 1406} {"train_loss": -5.880561828613281, "global_step": 59053, "epoch": 1406} {"train_loss": -5.9196624755859375, "global_step": 59054, "epoch": 1406} {"train_loss": -5.829527378082275, "global_step": 59055, "epoch": 1406} {"train_loss": -5.91663932800293, "global_step": 59056, "epoch": 1406} {"train_loss": -5.934608459472656, "global_step": 59057, "epoch": 1406} {"train_loss": -5.871958255767822, "global_step": 59058, "epoch": 1406} {"train_loss": -5.907198429107666, "global_step": 59059, "epoch": 1406} {"train_loss": -5.930639743804932, "global_step": 59060, "epoch": 1406} {"train_loss": -5.9576802253723145, "global_step": 59061, "epoch": 1406} {"train_loss": -6.060929298400879, "global_step": 59062, "epoch": 1406} {"train_loss": -5.920473575592041, "global_step": 59063, "epoch": 1406} {"train_loss": -5.774162292480469, "global_step": 59064, "epoch": 1406} {"train_loss": -5.859859466552734, "global_step": 59065, "epoch": 1406} {"train_loss": -5.8125200271606445, "global_step": 59066, "epoch": 1406} {"train_loss": -5.970692157745361, "global_step": 59067, "epoch": 1406} {"train_loss": -5.810941696166992, "global_step": 59068, "epoch": 1406} {"train_loss": -5.793888568878174, "global_step": 59069, "epoch": 1406} {"train_loss": -5.92545747756958, "global_step": 59070, "epoch": 1406} {"train_loss": -5.916433334350586, "global_step": 59071, "epoch": 1406} {"train_loss": -5.913695335388184, "global_step": 59072, "epoch": 1406} {"train_loss": -5.904480934143066, "global_step": 59073, "epoch": 1406} {"train_loss": -5.931910514831543, "global_step": 59074, "epoch": 1406} {"train_loss": -5.6714606285095215, "global_step": 59075, "epoch": 1406} {"train_loss": -5.968860626220703, "global_step": 59076, "epoch": 1406} {"train_loss": -5.740804672241211, "global_step": 59077, "epoch": 1406} {"train_loss": -5.8659844398498535, "global_step": 59078, "epoch": 1406} {"train_loss": -5.919421195983887, "global_step": 59079, "epoch": 1406} {"train_loss": -5.857126712799072, "global_step": 59080, "epoch": 1406} {"train_loss": -5.901707649230957, "global_step": 59081, "epoch": 1406} {"train_loss": -5.81928825378418, "global_step": 59082, "epoch": 1406} {"train_loss": -5.811613082885742, "global_step": 59083, "epoch": 1406} {"train_loss": -5.901622772216797, "global_step": 59084, "epoch": 1406} {"train_loss": -6.002729415893555, "global_step": 59085, "epoch": 1406} {"train_loss": -5.880061626434326, "global_step": 59086, "epoch": 1406} {"train_loss": -5.910368919372559, "global_step": 59087, "epoch": 1406} {"train_loss": -5.9525604248046875, "global_step": 59088, "epoch": 1406} {"train_loss": -5.974420547485352, "global_step": 59089, "epoch": 1406} {"train_loss": -5.821550369262695, "global_step": 59090, "epoch": 1406} {"train_loss": -5.890913963317871, "global_step": 59091, "epoch": 1406} {"train_loss": -5.925729751586914, "global_step": 59092, "epoch": 1406} {"train_loss": -5.893134979974656, "global_step": 59093, "epoch": 1406, "val_loss": 61504.1796875} {"train_loss": -5.926927089691162, "global_step": 59094, "epoch": 1407} {"train_loss": -5.897474765777588, "global_step": 59095, "epoch": 1407} {"train_loss": -5.93464469909668, "global_step": 59096, "epoch": 1407} {"train_loss": -5.95634651184082, "global_step": 59097, "epoch": 1407} {"train_loss": -5.928286552429199, "global_step": 59098, "epoch": 1407} {"train_loss": -5.9630303382873535, "global_step": 59099, "epoch": 1407} {"train_loss": -5.862018585205078, "global_step": 59100, "epoch": 1407} {"train_loss": -5.958614826202393, "global_step": 59101, "epoch": 1407} {"train_loss": -5.875869274139404, "global_step": 59102, "epoch": 1407} {"train_loss": -5.903573989868164, "global_step": 59103, "epoch": 1407} {"train_loss": -5.866717338562012, "global_step": 59104, "epoch": 1407} {"train_loss": -6.079716205596924, "global_step": 59105, "epoch": 1407} {"train_loss": -6.0067243576049805, "global_step": 59106, "epoch": 1407} {"train_loss": -5.979138374328613, "global_step": 59107, "epoch": 1407} {"train_loss": -5.9193010330200195, "global_step": 59108, "epoch": 1407} {"train_loss": -5.896099090576172, "global_step": 59109, "epoch": 1407} {"train_loss": -6.0475873947143555, "global_step": 59110, "epoch": 1407} {"train_loss": -5.825307369232178, "global_step": 59111, "epoch": 1407} {"train_loss": -6.015728950500488, "global_step": 59112, "epoch": 1407} {"train_loss": -5.906689167022705, "global_step": 59113, "epoch": 1407} {"train_loss": -5.86359977722168, "global_step": 59114, "epoch": 1407} {"train_loss": -6.056123733520508, "global_step": 59115, "epoch": 1407} {"train_loss": -5.83989953994751, "global_step": 59116, "epoch": 1407} {"train_loss": -5.867626190185547, "global_step": 59117, "epoch": 1407} {"train_loss": -5.872982025146484, "global_step": 59118, "epoch": 1407} {"train_loss": -5.95131778717041, "global_step": 59119, "epoch": 1407} {"train_loss": -5.88493537902832, "global_step": 59120, "epoch": 1407} {"train_loss": -5.789124965667725, "global_step": 59121, "epoch": 1407} {"train_loss": -5.812509059906006, "global_step": 59122, "epoch": 1407} {"train_loss": -5.925109386444092, "global_step": 59123, "epoch": 1407} {"train_loss": -5.9327263832092285, "global_step": 59124, "epoch": 1407} {"train_loss": -5.888426780700684, "global_step": 59125, "epoch": 1407} {"train_loss": -5.900373458862305, "global_step": 59126, "epoch": 1407} {"train_loss": -5.801130771636963, "global_step": 59127, "epoch": 1407} {"train_loss": -5.97369384765625, "global_step": 59128, "epoch": 1407} {"train_loss": -5.847064018249512, "global_step": 59129, "epoch": 1407} {"train_loss": -5.811163425445557, "global_step": 59130, "epoch": 1407} {"train_loss": -5.808648109436035, "global_step": 59131, "epoch": 1407} {"train_loss": -5.978266716003418, "global_step": 59132, "epoch": 1407} {"train_loss": -5.839419841766357, "global_step": 59133, "epoch": 1407} {"train_loss": -5.850587844848633, "global_step": 59134, "epoch": 1407} {"train_loss": -5.90508678981236, "global_step": 59135, "epoch": 1407, "val_loss": 61319.1640625} {"train_loss": -5.909087657928467, "global_step": 59136, "epoch": 1408} {"train_loss": -5.882564544677734, "global_step": 59137, "epoch": 1408} {"train_loss": -5.992186069488525, "global_step": 59138, "epoch": 1408} {"train_loss": -5.803494453430176, "global_step": 59139, "epoch": 1408} {"train_loss": -5.949112892150879, "global_step": 59140, "epoch": 1408} {"train_loss": -5.935270309448242, "global_step": 59141, "epoch": 1408} {"train_loss": -5.924112319946289, "global_step": 59142, "epoch": 1408} {"train_loss": -5.878241062164307, "global_step": 59143, "epoch": 1408} {"train_loss": -5.871649742126465, "global_step": 59144, "epoch": 1408} {"train_loss": -5.8716559410095215, "global_step": 59145, "epoch": 1408} {"train_loss": -5.849240303039551, "global_step": 59146, "epoch": 1408} {"train_loss": -5.7723798751831055, "global_step": 59147, "epoch": 1408} {"train_loss": -5.841847896575928, "global_step": 59148, "epoch": 1408} {"train_loss": -5.896627902984619, "global_step": 59149, "epoch": 1408} {"train_loss": -5.937899589538574, "global_step": 59150, "epoch": 1408} {"train_loss": -5.843404769897461, "global_step": 59151, "epoch": 1408} {"train_loss": -5.846503257751465, "global_step": 59152, "epoch": 1408} {"train_loss": -5.894106864929199, "global_step": 59153, "epoch": 1408} {"train_loss": -5.940916061401367, "global_step": 59154, "epoch": 1408} {"train_loss": -5.833615303039551, "global_step": 59155, "epoch": 1408} {"train_loss": -5.854714393615723, "global_step": 59156, "epoch": 1408} {"train_loss": -5.941514492034912, "global_step": 59157, "epoch": 1408} {"train_loss": -5.850088119506836, "global_step": 59158, "epoch": 1408} {"train_loss": -5.800830841064453, "global_step": 59159, "epoch": 1408} {"train_loss": -5.8944573402404785, "global_step": 59160, "epoch": 1408} {"train_loss": -5.98067045211792, "global_step": 59161, "epoch": 1408} {"train_loss": -5.865213871002197, "global_step": 59162, "epoch": 1408} {"train_loss": -5.8933424949646, "global_step": 59163, "epoch": 1408} {"train_loss": -5.8834333419799805, "global_step": 59164, "epoch": 1408} {"train_loss": -5.7701873779296875, "global_step": 59165, "epoch": 1408} {"train_loss": -5.9141693115234375, "global_step": 59166, "epoch": 1408} {"train_loss": -5.810638904571533, "global_step": 59167, "epoch": 1408} {"train_loss": -5.811858177185059, "global_step": 59168, "epoch": 1408} {"train_loss": -5.94606876373291, "global_step": 59169, "epoch": 1408} {"train_loss": -5.887640476226807, "global_step": 59170, "epoch": 1408} {"train_loss": -5.780478477478027, "global_step": 59171, "epoch": 1408} {"train_loss": -5.8400397300720215, "global_step": 59172, "epoch": 1408} {"train_loss": -5.95974063873291, "global_step": 59173, "epoch": 1408} {"train_loss": -5.918704032897949, "global_step": 59174, "epoch": 1408} {"train_loss": -6.048168182373047, "global_step": 59175, "epoch": 1408} {"train_loss": -5.899211406707764, "global_step": 59176, "epoch": 1408} {"train_loss": -5.884234541938419, "global_step": 59177, "epoch": 1408, "val_loss": 61375.66796875} {"train_loss": -5.943580627441406, "global_step": 59178, "epoch": 1409} {"train_loss": -6.016507148742676, "global_step": 59179, "epoch": 1409} {"train_loss": -5.902334213256836, "global_step": 59180, "epoch": 1409} {"train_loss": -6.02278995513916, "global_step": 59181, "epoch": 1409} {"train_loss": -5.852165699005127, "global_step": 59182, "epoch": 1409} {"train_loss": -5.828893661499023, "global_step": 59183, "epoch": 1409} {"train_loss": -5.863301753997803, "global_step": 59184, "epoch": 1409} {"train_loss": -5.878377914428711, "global_step": 59185, "epoch": 1409} {"train_loss": -5.811339378356934, "global_step": 59186, "epoch": 1409} {"train_loss": -5.8686113357543945, "global_step": 59187, "epoch": 1409} {"train_loss": -5.915102005004883, "global_step": 59188, "epoch": 1409} {"train_loss": -6.004502773284912, "global_step": 59189, "epoch": 1409} {"train_loss": -5.891933441162109, "global_step": 59190, "epoch": 1409} {"train_loss": -5.825645923614502, "global_step": 59191, "epoch": 1409} {"train_loss": -5.838311195373535, "global_step": 59192, "epoch": 1409} {"train_loss": -5.942706108093262, "global_step": 59193, "epoch": 1409} {"train_loss": -5.843689918518066, "global_step": 59194, "epoch": 1409} {"train_loss": -5.880735397338867, "global_step": 59195, "epoch": 1409} {"train_loss": -5.907162666320801, "global_step": 59196, "epoch": 1409} {"train_loss": -5.921131610870361, "global_step": 59197, "epoch": 1409} {"train_loss": -6.070628643035889, "global_step": 59198, "epoch": 1409} {"train_loss": -5.901165962219238, "global_step": 59199, "epoch": 1409} {"train_loss": -5.876730918884277, "global_step": 59200, "epoch": 1409} {"train_loss": -5.779839515686035, "global_step": 59201, "epoch": 1409} {"train_loss": -5.979947090148926, "global_step": 59202, "epoch": 1409} {"train_loss": -5.892226696014404, "global_step": 59203, "epoch": 1409} {"train_loss": -5.843169212341309, "global_step": 59204, "epoch": 1409} {"train_loss": -5.797203063964844, "global_step": 59205, "epoch": 1409} {"train_loss": -5.912298202514648, "global_step": 59206, "epoch": 1409} {"train_loss": -5.765041351318359, "global_step": 59207, "epoch": 1409} {"train_loss": -5.857357025146484, "global_step": 59208, "epoch": 1409} {"train_loss": -5.952381610870361, "global_step": 59209, "epoch": 1409} {"train_loss": -5.833227157592773, "global_step": 59210, "epoch": 1409} {"train_loss": -5.846099853515625, "global_step": 59211, "epoch": 1409} {"train_loss": -5.797459125518799, "global_step": 59212, "epoch": 1409} {"train_loss": -5.922957420349121, "global_step": 59213, "epoch": 1409} {"train_loss": -5.890931129455566, "global_step": 59214, "epoch": 1409} {"train_loss": -5.898978233337402, "global_step": 59215, "epoch": 1409} {"train_loss": -5.930241107940674, "global_step": 59216, "epoch": 1409} {"train_loss": -5.764510154724121, "global_step": 59217, "epoch": 1409} {"train_loss": -5.97556209564209, "global_step": 59218, "epoch": 1409} {"train_loss": -5.890251579738798, "global_step": 59219, "epoch": 1409, "val_loss": 61278.94921875} {"train_loss": -5.910311698913574, "global_step": 59220, "epoch": 1410} {"train_loss": -5.879238128662109, "global_step": 59221, "epoch": 1410} {"train_loss": -5.985034942626953, "global_step": 59222, "epoch": 1410} {"train_loss": -5.904914379119873, "global_step": 59223, "epoch": 1410} {"train_loss": -5.8614983558654785, "global_step": 59224, "epoch": 1410} {"train_loss": -5.9766340255737305, "global_step": 59225, "epoch": 1410} {"train_loss": -5.893363952636719, "global_step": 59226, "epoch": 1410} {"train_loss": -5.93428897857666, "global_step": 59227, "epoch": 1410} {"train_loss": -5.800761699676514, "global_step": 59228, "epoch": 1410} {"train_loss": -5.916660308837891, "global_step": 59229, "epoch": 1410} {"train_loss": -5.955439567565918, "global_step": 59230, "epoch": 1410} {"train_loss": -5.8983869552612305, "global_step": 59231, "epoch": 1410} {"train_loss": -5.9385480880737305, "global_step": 59232, "epoch": 1410} {"train_loss": -5.821781635284424, "global_step": 59233, "epoch": 1410} {"train_loss": -5.852938652038574, "global_step": 59234, "epoch": 1410} {"train_loss": -5.913375377655029, "global_step": 59235, "epoch": 1410} {"train_loss": -5.932206153869629, "global_step": 59236, "epoch": 1410} {"train_loss": -6.097591400146484, "global_step": 59237, "epoch": 1410} {"train_loss": -5.893579006195068, "global_step": 59238, "epoch": 1410} {"train_loss": -5.981414794921875, "global_step": 59239, "epoch": 1410} {"train_loss": -5.900396347045898, "global_step": 59240, "epoch": 1410} {"train_loss": -5.752474308013916, "global_step": 59241, "epoch": 1410} {"train_loss": -5.907203674316406, "global_step": 59242, "epoch": 1410} {"train_loss": -5.802927494049072, "global_step": 59243, "epoch": 1410} {"train_loss": -5.774515628814697, "global_step": 59244, "epoch": 1410} {"train_loss": -5.897512912750244, "global_step": 59245, "epoch": 1410} {"train_loss": -5.8933916091918945, "global_step": 59246, "epoch": 1410} {"train_loss": -5.925380706787109, "global_step": 59247, "epoch": 1410} {"train_loss": -5.828051567077637, "global_step": 59248, "epoch": 1410} {"train_loss": -5.985629558563232, "global_step": 59249, "epoch": 1410} {"train_loss": -5.9617228507995605, "global_step": 59250, "epoch": 1410} {"train_loss": -5.972502708435059, "global_step": 59251, "epoch": 1410} {"train_loss": -5.724956512451172, "global_step": 59252, "epoch": 1410} {"train_loss": -5.942919731140137, "global_step": 59253, "epoch": 1410} {"train_loss": -5.9500732421875, "global_step": 59254, "epoch": 1410} {"train_loss": -5.9765849113464355, "global_step": 59255, "epoch": 1410} {"train_loss": -5.858476638793945, "global_step": 59256, "epoch": 1410} {"train_loss": -5.7475905418396, "global_step": 59257, "epoch": 1410} {"train_loss": -5.970731735229492, "global_step": 59258, "epoch": 1410} {"train_loss": -5.888921737670898, "global_step": 59259, "epoch": 1410} {"train_loss": -5.914366722106934, "global_step": 59260, "epoch": 1410} {"train_loss": -5.900234858194987, "global_step": 59261, "epoch": 1410, "val_loss": 61803.26953125} {"train_loss": -5.808222770690918, "global_step": 59262, "epoch": 1411} {"train_loss": -5.944454669952393, "global_step": 59263, "epoch": 1411} {"train_loss": -5.8816680908203125, "global_step": 59264, "epoch": 1411} {"train_loss": -5.903107643127441, "global_step": 59265, "epoch": 1411} {"train_loss": -5.954740047454834, "global_step": 59266, "epoch": 1411} {"train_loss": -5.974518775939941, "global_step": 59267, "epoch": 1411} {"train_loss": -5.852872371673584, "global_step": 59268, "epoch": 1411} {"train_loss": -6.0657525062561035, "global_step": 59269, "epoch": 1411} {"train_loss": -5.7027788162231445, "global_step": 59270, "epoch": 1411} {"train_loss": -5.935385704040527, "global_step": 59271, "epoch": 1411} {"train_loss": -5.879354476928711, "global_step": 59272, "epoch": 1411} {"train_loss": -5.910445213317871, "global_step": 59273, "epoch": 1411} {"train_loss": -5.956435203552246, "global_step": 59274, "epoch": 1411} {"train_loss": -5.865780830383301, "global_step": 59275, "epoch": 1411} {"train_loss": -5.839271545410156, "global_step": 59276, "epoch": 1411} {"train_loss": -5.907631874084473, "global_step": 59277, "epoch": 1411} {"train_loss": -6.03029727935791, "global_step": 59278, "epoch": 1411} {"train_loss": -5.851741790771484, "global_step": 59279, "epoch": 1411} {"train_loss": -5.941621780395508, "global_step": 59280, "epoch": 1411} {"train_loss": -5.873384475708008, "global_step": 59281, "epoch": 1411} {"train_loss": -5.84763765335083, "global_step": 59282, "epoch": 1411} {"train_loss": -5.860283374786377, "global_step": 59283, "epoch": 1411} {"train_loss": -5.861319541931152, "global_step": 59284, "epoch": 1411} {"train_loss": -5.812918186187744, "global_step": 59285, "epoch": 1411} {"train_loss": -5.881213665008545, "global_step": 59286, "epoch": 1411} {"train_loss": -5.920001983642578, "global_step": 59287, "epoch": 1411} {"train_loss": -6.03781795501709, "global_step": 59288, "epoch": 1411} {"train_loss": -5.958775043487549, "global_step": 59289, "epoch": 1411} {"train_loss": -5.850947380065918, "global_step": 59290, "epoch": 1411} {"train_loss": -5.950955867767334, "global_step": 59291, "epoch": 1411} {"train_loss": -5.924112796783447, "global_step": 59292, "epoch": 1411} {"train_loss": -5.945945739746094, "global_step": 59293, "epoch": 1411} {"train_loss": -5.957937240600586, "global_step": 59294, "epoch": 1411} {"train_loss": -5.8260064125061035, "global_step": 59295, "epoch": 1411} {"train_loss": -5.886129379272461, "global_step": 59296, "epoch": 1411} {"train_loss": -5.798227310180664, "global_step": 59297, "epoch": 1411} {"train_loss": -6.016086578369141, "global_step": 59298, "epoch": 1411} {"train_loss": -5.987740516662598, "global_step": 59299, "epoch": 1411} {"train_loss": -5.880826950073242, "global_step": 59300, "epoch": 1411} {"train_loss": -5.866245269775391, "global_step": 59301, "epoch": 1411} {"train_loss": -5.9742631912231445, "global_step": 59302, "epoch": 1411} {"train_loss": -5.903545493171329, "global_step": 59303, "epoch": 1411, "val_loss": 61410.9921875} {"train_loss": -6.0250749588012695, "global_step": 59304, "epoch": 1412} {"train_loss": -5.934204578399658, "global_step": 59305, "epoch": 1412} {"train_loss": -5.879377365112305, "global_step": 59306, "epoch": 1412} {"train_loss": -5.983290195465088, "global_step": 59307, "epoch": 1412} {"train_loss": -5.80892276763916, "global_step": 59308, "epoch": 1412} {"train_loss": -5.904168128967285, "global_step": 59309, "epoch": 1412} {"train_loss": -5.865493297576904, "global_step": 59310, "epoch": 1412} {"train_loss": -5.840132236480713, "global_step": 59311, "epoch": 1412} {"train_loss": -5.97416353225708, "global_step": 59312, "epoch": 1412} {"train_loss": -5.809439659118652, "global_step": 59313, "epoch": 1412} {"train_loss": -5.807190895080566, "global_step": 59314, "epoch": 1412} {"train_loss": -5.91841983795166, "global_step": 59315, "epoch": 1412} {"train_loss": -5.764432907104492, "global_step": 59316, "epoch": 1412} {"train_loss": -5.805140495300293, "global_step": 59317, "epoch": 1412} {"train_loss": -5.925971031188965, "global_step": 59318, "epoch": 1412} {"train_loss": -5.701173782348633, "global_step": 59319, "epoch": 1412} {"train_loss": -5.829350471496582, "global_step": 59320, "epoch": 1412} {"train_loss": -5.8665056228637695, "global_step": 59321, "epoch": 1412} {"train_loss": -5.873845100402832, "global_step": 59322, "epoch": 1412} {"train_loss": -5.899618148803711, "global_step": 59323, "epoch": 1412} {"train_loss": -5.827165126800537, "global_step": 59324, "epoch": 1412} {"train_loss": -5.86336612701416, "global_step": 59325, "epoch": 1412} {"train_loss": -5.971642971038818, "global_step": 59326, "epoch": 1412} {"train_loss": -5.686915397644043, "global_step": 59327, "epoch": 1412} {"train_loss": -5.79718017578125, "global_step": 59328, "epoch": 1412} {"train_loss": -5.811985969543457, "global_step": 59329, "epoch": 1412} {"train_loss": -5.760802268981934, "global_step": 59330, "epoch": 1412} {"train_loss": -5.8625359535217285, "global_step": 59331, "epoch": 1412} {"train_loss": -5.9342522621154785, "global_step": 59332, "epoch": 1412} {"train_loss": -5.9373931884765625, "global_step": 59333, "epoch": 1412} {"train_loss": -5.864154815673828, "global_step": 59334, "epoch": 1412} {"train_loss": -5.933943748474121, "global_step": 59335, "epoch": 1412} {"train_loss": -5.843026638031006, "global_step": 59336, "epoch": 1412} {"train_loss": -5.860042572021484, "global_step": 59337, "epoch": 1412} {"train_loss": -5.885926246643066, "global_step": 59338, "epoch": 1412} {"train_loss": -5.768271446228027, "global_step": 59339, "epoch": 1412} {"train_loss": -5.912225723266602, "global_step": 59340, "epoch": 1412} {"train_loss": -5.942228317260742, "global_step": 59341, "epoch": 1412} {"train_loss": -5.9783220291137695, "global_step": 59342, "epoch": 1412} {"train_loss": -5.91703987121582, "global_step": 59343, "epoch": 1412} {"train_loss": -5.855226039886475, "global_step": 59344, "epoch": 1412} {"train_loss": -5.87091520854405, "global_step": 59345, "epoch": 1412, "val_loss": 61487.91015625} {"train_loss": -5.944085597991943, "global_step": 59346, "epoch": 1413} {"train_loss": -5.88347053527832, "global_step": 59347, "epoch": 1413} {"train_loss": -5.865556716918945, "global_step": 59348, "epoch": 1413} {"train_loss": -5.8554534912109375, "global_step": 59349, "epoch": 1413} {"train_loss": -5.904526710510254, "global_step": 59350, "epoch": 1413} {"train_loss": -5.8775224685668945, "global_step": 59351, "epoch": 1413} {"train_loss": -5.756397724151611, "global_step": 59352, "epoch": 1413} {"train_loss": -5.858227729797363, "global_step": 59353, "epoch": 1413} {"train_loss": -5.8971967697143555, "global_step": 59354, "epoch": 1413} {"train_loss": -5.898176193237305, "global_step": 59355, "epoch": 1413} {"train_loss": -6.033773422241211, "global_step": 59356, "epoch": 1413} {"train_loss": -5.882474899291992, "global_step": 59357, "epoch": 1413} {"train_loss": -5.850582122802734, "global_step": 59358, "epoch": 1413} {"train_loss": -5.92275333404541, "global_step": 59359, "epoch": 1413} {"train_loss": -5.893586158752441, "global_step": 59360, "epoch": 1413} {"train_loss": -5.880838394165039, "global_step": 59361, "epoch": 1413} {"train_loss": -5.78054666519165, "global_step": 59362, "epoch": 1413} {"train_loss": -5.927807807922363, "global_step": 59363, "epoch": 1413} {"train_loss": -5.929849147796631, "global_step": 59364, "epoch": 1413} {"train_loss": -5.878403663635254, "global_step": 59365, "epoch": 1413} {"train_loss": -5.774759769439697, "global_step": 59366, "epoch": 1413} {"train_loss": -5.773240089416504, "global_step": 59367, "epoch": 1413} {"train_loss": -5.937365531921387, "global_step": 59368, "epoch": 1413} {"train_loss": -5.875935077667236, "global_step": 59369, "epoch": 1413} {"train_loss": -5.979544162750244, "global_step": 59370, "epoch": 1413} {"train_loss": -5.977398872375488, "global_step": 59371, "epoch": 1413} {"train_loss": -5.980937480926514, "global_step": 59372, "epoch": 1413} {"train_loss": -5.835134506225586, "global_step": 59373, "epoch": 1413} {"train_loss": -6.002373695373535, "global_step": 59374, "epoch": 1413} {"train_loss": -5.965448379516602, "global_step": 59375, "epoch": 1413} {"train_loss": -5.946347236633301, "global_step": 59376, "epoch": 1413} {"train_loss": -5.982975959777832, "global_step": 59377, "epoch": 1413} {"train_loss": -5.899950981140137, "global_step": 59378, "epoch": 1413} {"train_loss": -5.88489294052124, "global_step": 59379, "epoch": 1413} {"train_loss": -5.897387981414795, "global_step": 59380, "epoch": 1413} {"train_loss": -5.9061431884765625, "global_step": 59381, "epoch": 1413} {"train_loss": -5.853631019592285, "global_step": 59382, "epoch": 1413} {"train_loss": -5.900691509246826, "global_step": 59383, "epoch": 1413} {"train_loss": -5.930817604064941, "global_step": 59384, "epoch": 1413} {"train_loss": -5.964890003204346, "global_step": 59385, "epoch": 1413} {"train_loss": -5.906364440917969, "global_step": 59386, "epoch": 1413} {"train_loss": -5.899614277340117, "global_step": 59387, "epoch": 1413, "val_loss": 61348.7109375} {"train_loss": -5.912469863891602, "global_step": 59388, "epoch": 1414} {"train_loss": -5.848696708679199, "global_step": 59389, "epoch": 1414} {"train_loss": -5.75123405456543, "global_step": 59390, "epoch": 1414} {"train_loss": -5.962418079376221, "global_step": 59391, "epoch": 1414} {"train_loss": -5.84719181060791, "global_step": 59392, "epoch": 1414} {"train_loss": -5.770840167999268, "global_step": 59393, "epoch": 1414} {"train_loss": -5.876781940460205, "global_step": 59394, "epoch": 1414} {"train_loss": -5.83678674697876, "global_step": 59395, "epoch": 1414} {"train_loss": -5.841763496398926, "global_step": 59396, "epoch": 1414} {"train_loss": -5.781515121459961, "global_step": 59397, "epoch": 1414} {"train_loss": -5.9974589347839355, "global_step": 59398, "epoch": 1414} {"train_loss": -5.917742729187012, "global_step": 59399, "epoch": 1414} {"train_loss": -5.9568586349487305, "global_step": 59400, "epoch": 1414} {"train_loss": -5.939705848693848, "global_step": 59401, "epoch": 1414} {"train_loss": -5.844449520111084, "global_step": 59402, "epoch": 1414} {"train_loss": -5.921408653259277, "global_step": 59403, "epoch": 1414} {"train_loss": -5.973040580749512, "global_step": 59404, "epoch": 1414} {"train_loss": -5.861661911010742, "global_step": 59405, "epoch": 1414} {"train_loss": -5.86484432220459, "global_step": 59406, "epoch": 1414} {"train_loss": -5.839089393615723, "global_step": 59407, "epoch": 1414} {"train_loss": -5.902209281921387, "global_step": 59408, "epoch": 1414} {"train_loss": -5.740044593811035, "global_step": 59409, "epoch": 1414} {"train_loss": -5.882083892822266, "global_step": 59410, "epoch": 1414} {"train_loss": -5.749211311340332, "global_step": 59411, "epoch": 1414} {"train_loss": -5.785774230957031, "global_step": 59412, "epoch": 1414} {"train_loss": -5.875347137451172, "global_step": 59413, "epoch": 1414} {"train_loss": -5.905925750732422, "global_step": 59414, "epoch": 1414} {"train_loss": -5.712508678436279, "global_step": 59415, "epoch": 1414} {"train_loss": -5.985175132751465, "global_step": 59416, "epoch": 1414} {"train_loss": -5.733755111694336, "global_step": 59417, "epoch": 1414} {"train_loss": -5.724165916442871, "global_step": 59418, "epoch": 1414} {"train_loss": -5.8848419189453125, "global_step": 59419, "epoch": 1414} {"train_loss": -5.827768802642822, "global_step": 59420, "epoch": 1414} {"train_loss": -5.806802749633789, "global_step": 59421, "epoch": 1414} {"train_loss": -5.732714653015137, "global_step": 59422, "epoch": 1414} {"train_loss": -5.871763229370117, "global_step": 59423, "epoch": 1414} {"train_loss": -5.793652057647705, "global_step": 59424, "epoch": 1414} {"train_loss": -5.876957893371582, "global_step": 59425, "epoch": 1414} {"train_loss": -5.75809907913208, "global_step": 59426, "epoch": 1414} {"train_loss": -5.832699775695801, "global_step": 59427, "epoch": 1414} {"train_loss": -5.903364181518555, "global_step": 59428, "epoch": 1414} {"train_loss": -5.849882035028367, "global_step": 59429, "epoch": 1414, "val_loss": 61162.234375} {"train_loss": -5.762465953826904, "global_step": 59430, "epoch": 1415} {"train_loss": -5.949679374694824, "global_step": 59431, "epoch": 1415} {"train_loss": -5.811723709106445, "global_step": 59432, "epoch": 1415} {"train_loss": -6.007962703704834, "global_step": 59433, "epoch": 1415} {"train_loss": -5.8391828536987305, "global_step": 59434, "epoch": 1415} {"train_loss": -5.911698341369629, "global_step": 59435, "epoch": 1415} {"train_loss": -5.831269264221191, "global_step": 59436, "epoch": 1415} {"train_loss": -5.909623146057129, "global_step": 59437, "epoch": 1415} {"train_loss": -6.020712852478027, "global_step": 59438, "epoch": 1415} {"train_loss": -5.936550140380859, "global_step": 59439, "epoch": 1415} {"train_loss": -5.883960723876953, "global_step": 59440, "epoch": 1415} {"train_loss": -5.94674015045166, "global_step": 59441, "epoch": 1415} {"train_loss": -5.701843738555908, "global_step": 59442, "epoch": 1415} {"train_loss": -5.902570724487305, "global_step": 59443, "epoch": 1415} {"train_loss": -5.869149208068848, "global_step": 59444, "epoch": 1415} {"train_loss": -5.83781623840332, "global_step": 59445, "epoch": 1415} {"train_loss": -5.886111736297607, "global_step": 59446, "epoch": 1415} {"train_loss": -5.833944797515869, "global_step": 59447, "epoch": 1415} {"train_loss": -5.9761199951171875, "global_step": 59448, "epoch": 1415} {"train_loss": -5.928362846374512, "global_step": 59449, "epoch": 1415} {"train_loss": -5.922693729400635, "global_step": 59450, "epoch": 1415} {"train_loss": -5.939870357513428, "global_step": 59451, "epoch": 1415} {"train_loss": -5.89141845703125, "global_step": 59452, "epoch": 1415} {"train_loss": -5.95306396484375, "global_step": 59453, "epoch": 1415} {"train_loss": -5.87939453125, "global_step": 59454, "epoch": 1415} {"train_loss": -5.8911027908325195, "global_step": 59455, "epoch": 1415} {"train_loss": -5.7216081619262695, "global_step": 59456, "epoch": 1415} {"train_loss": -5.758655071258545, "global_step": 59457, "epoch": 1415} {"train_loss": -5.928030014038086, "global_step": 59458, "epoch": 1415} {"train_loss": -5.798530101776123, "global_step": 59459, "epoch": 1415} {"train_loss": -5.9928460121154785, "global_step": 59460, "epoch": 1415} {"train_loss": -5.680340766906738, "global_step": 59461, "epoch": 1415} {"train_loss": -5.830594062805176, "global_step": 59462, "epoch": 1415} {"train_loss": -5.840081214904785, "global_step": 59463, "epoch": 1415} {"train_loss": -5.827133655548096, "global_step": 59464, "epoch": 1415} {"train_loss": -5.993721961975098, "global_step": 59465, "epoch": 1415} {"train_loss": -5.814050197601318, "global_step": 59466, "epoch": 1415} {"train_loss": -5.973036766052246, "global_step": 59467, "epoch": 1415} {"train_loss": -5.84440803527832, "global_step": 59468, "epoch": 1415} {"train_loss": -5.881708145141602, "global_step": 59469, "epoch": 1415} {"train_loss": -5.906388282775879, "global_step": 59470, "epoch": 1415} {"train_loss": -5.879840135574341, "global_step": 59471, "epoch": 1415, "val_loss": 61226.70703125} {"train_loss": -6.07765531539917, "global_step": 59472, "epoch": 1416} {"train_loss": -5.862648010253906, "global_step": 59473, "epoch": 1416} {"train_loss": -5.956220626831055, "global_step": 59474, "epoch": 1416} {"train_loss": -5.919679641723633, "global_step": 59475, "epoch": 1416} {"train_loss": -5.965824127197266, "global_step": 59476, "epoch": 1416} {"train_loss": -5.955883026123047, "global_step": 59477, "epoch": 1416} {"train_loss": -5.926649570465088, "global_step": 59478, "epoch": 1416} {"train_loss": -6.005906105041504, "global_step": 59479, "epoch": 1416} {"train_loss": -5.865492820739746, "global_step": 59480, "epoch": 1416} {"train_loss": -5.979127407073975, "global_step": 59481, "epoch": 1416} {"train_loss": -5.885504245758057, "global_step": 59482, "epoch": 1416} {"train_loss": -5.870720386505127, "global_step": 59483, "epoch": 1416} {"train_loss": -5.77486515045166, "global_step": 59484, "epoch": 1416} {"train_loss": -5.851507186889648, "global_step": 59485, "epoch": 1416} {"train_loss": -5.970726013183594, "global_step": 59486, "epoch": 1416} {"train_loss": -5.763993263244629, "global_step": 59487, "epoch": 1416} {"train_loss": -5.846012115478516, "global_step": 59488, "epoch": 1416} {"train_loss": -5.7737579345703125, "global_step": 59489, "epoch": 1416} {"train_loss": -5.8653564453125, "global_step": 59490, "epoch": 1416} {"train_loss": -5.820722579956055, "global_step": 59491, "epoch": 1416} {"train_loss": -5.88321590423584, "global_step": 59492, "epoch": 1416} {"train_loss": -5.815923690795898, "global_step": 59493, "epoch": 1416} {"train_loss": -5.663186550140381, "global_step": 59494, "epoch": 1416} {"train_loss": -5.890252113342285, "global_step": 59495, "epoch": 1416} {"train_loss": -5.809605598449707, "global_step": 59496, "epoch": 1416} {"train_loss": -5.755857467651367, "global_step": 59497, "epoch": 1416} {"train_loss": -5.958587646484375, "global_step": 59498, "epoch": 1416} {"train_loss": -5.776440620422363, "global_step": 59499, "epoch": 1416} {"train_loss": -5.895307540893555, "global_step": 59500, "epoch": 1416} {"train_loss": -5.800151348114014, "global_step": 59501, "epoch": 1416} {"train_loss": -5.842395782470703, "global_step": 59502, "epoch": 1416} {"train_loss": -5.899346351623535, "global_step": 59503, "epoch": 1416} {"train_loss": -5.877966403961182, "global_step": 59504, "epoch": 1416} {"train_loss": -5.830931663513184, "global_step": 59505, "epoch": 1416} {"train_loss": -5.905524730682373, "global_step": 59506, "epoch": 1416} {"train_loss": -5.962558269500732, "global_step": 59507, "epoch": 1416} {"train_loss": -5.885348320007324, "global_step": 59508, "epoch": 1416} {"train_loss": -5.900273323059082, "global_step": 59509, "epoch": 1416} {"train_loss": -5.891905307769775, "global_step": 59510, "epoch": 1416} {"train_loss": -5.678733825683594, "global_step": 59511, "epoch": 1416} {"train_loss": -5.816642761230469, "global_step": 59512, "epoch": 1416} {"train_loss": -5.869846264521281, "global_step": 59513, "epoch": 1416, "val_loss": 61317.5859375} {"train_loss": -5.9928436279296875, "global_step": 59514, "epoch": 1417} {"train_loss": -5.785915374755859, "global_step": 59515, "epoch": 1417} {"train_loss": -5.889200687408447, "global_step": 59516, "epoch": 1417} {"train_loss": -5.97553825378418, "global_step": 59517, "epoch": 1417} {"train_loss": -5.867483139038086, "global_step": 59518, "epoch": 1417} {"train_loss": -5.935481071472168, "global_step": 59519, "epoch": 1417} {"train_loss": -5.752601623535156, "global_step": 59520, "epoch": 1417} {"train_loss": -5.925919532775879, "global_step": 59521, "epoch": 1417} {"train_loss": -5.936057090759277, "global_step": 59522, "epoch": 1417} {"train_loss": -5.901188850402832, "global_step": 59523, "epoch": 1417} {"train_loss": -5.869790077209473, "global_step": 59524, "epoch": 1417} {"train_loss": -5.919752597808838, "global_step": 59525, "epoch": 1417} {"train_loss": -5.827926158905029, "global_step": 59526, "epoch": 1417} {"train_loss": -5.889959335327148, "global_step": 59527, "epoch": 1417} {"train_loss": -5.822750091552734, "global_step": 59528, "epoch": 1417} {"train_loss": -5.822904109954834, "global_step": 59529, "epoch": 1417} {"train_loss": -5.89039945602417, "global_step": 59530, "epoch": 1417} {"train_loss": -5.967557907104492, "global_step": 59531, "epoch": 1417} {"train_loss": -5.961633682250977, "global_step": 59532, "epoch": 1417} {"train_loss": -5.9059529304504395, "global_step": 59533, "epoch": 1417} {"train_loss": -5.895073890686035, "global_step": 59534, "epoch": 1417} {"train_loss": -5.970998764038086, "global_step": 59535, "epoch": 1417} {"train_loss": -5.936505317687988, "global_step": 59536, "epoch": 1417} {"train_loss": -5.921023368835449, "global_step": 59537, "epoch": 1417} {"train_loss": -5.943874835968018, "global_step": 59538, "epoch": 1417} {"train_loss": -5.876723766326904, "global_step": 59539, "epoch": 1417} {"train_loss": -5.934398651123047, "global_step": 59540, "epoch": 1417} {"train_loss": -5.905553817749023, "global_step": 59541, "epoch": 1417} {"train_loss": -6.017508506774902, "global_step": 59542, "epoch": 1417} {"train_loss": -5.869810104370117, "global_step": 59543, "epoch": 1417} {"train_loss": -5.913822174072266, "global_step": 59544, "epoch": 1417} {"train_loss": -5.925256729125977, "global_step": 59545, "epoch": 1417} {"train_loss": -5.825321197509766, "global_step": 59546, "epoch": 1417} {"train_loss": -5.803475379943848, "global_step": 59547, "epoch": 1417} {"train_loss": -5.829960823059082, "global_step": 59548, "epoch": 1417} {"train_loss": -5.942788124084473, "global_step": 59549, "epoch": 1417} {"train_loss": -5.865218162536621, "global_step": 59550, "epoch": 1417} {"train_loss": -5.868603706359863, "global_step": 59551, "epoch": 1417} {"train_loss": -5.922513008117676, "global_step": 59552, "epoch": 1417} {"train_loss": -5.942049026489258, "global_step": 59553, "epoch": 1417} {"train_loss": -6.026823997497559, "global_step": 59554, "epoch": 1417} {"train_loss": -5.901468299684071, "global_step": 59555, "epoch": 1417, "val_loss": 61249.98046875} {"train_loss": -5.948080062866211, "global_step": 59556, "epoch": 1418} {"train_loss": -5.938435077667236, "global_step": 59557, "epoch": 1418} {"train_loss": -5.904646873474121, "global_step": 59558, "epoch": 1418} {"train_loss": -5.868151664733887, "global_step": 59559, "epoch": 1418} {"train_loss": -6.017339706420898, "global_step": 59560, "epoch": 1418} {"train_loss": -5.908724784851074, "global_step": 59561, "epoch": 1418} {"train_loss": -5.935837745666504, "global_step": 59562, "epoch": 1418} {"train_loss": -5.956454277038574, "global_step": 59563, "epoch": 1418} {"train_loss": -5.848118305206299, "global_step": 59564, "epoch": 1418} {"train_loss": -5.887373924255371, "global_step": 59565, "epoch": 1418} {"train_loss": -6.025525093078613, "global_step": 59566, "epoch": 1418} {"train_loss": -5.897417068481445, "global_step": 59567, "epoch": 1418} {"train_loss": -6.005708694458008, "global_step": 59568, "epoch": 1418} {"train_loss": -5.8632612228393555, "global_step": 59569, "epoch": 1418} {"train_loss": -5.933218002319336, "global_step": 59570, "epoch": 1418} {"train_loss": -5.822789192199707, "global_step": 59571, "epoch": 1418} {"train_loss": -5.9396233558654785, "global_step": 59572, "epoch": 1418} {"train_loss": -5.981823921203613, "global_step": 59573, "epoch": 1418} {"train_loss": -5.933326721191406, "global_step": 59574, "epoch": 1418} {"train_loss": -5.860325813293457, "global_step": 59575, "epoch": 1418} {"train_loss": -5.9333624839782715, "global_step": 59576, "epoch": 1418} {"train_loss": -5.8931732177734375, "global_step": 59577, "epoch": 1418} {"train_loss": -5.983966827392578, "global_step": 59578, "epoch": 1418} {"train_loss": -5.886601448059082, "global_step": 59579, "epoch": 1418} {"train_loss": -5.831961631774902, "global_step": 59580, "epoch": 1418} {"train_loss": -5.892303466796875, "global_step": 59581, "epoch": 1418} {"train_loss": -5.860129356384277, "global_step": 59582, "epoch": 1418} {"train_loss": -5.823058605194092, "global_step": 59583, "epoch": 1418} {"train_loss": -5.955739974975586, "global_step": 59584, "epoch": 1418} {"train_loss": -5.897690773010254, "global_step": 59585, "epoch": 1418} {"train_loss": -5.881460189819336, "global_step": 59586, "epoch": 1418} {"train_loss": -5.961360931396484, "global_step": 59587, "epoch": 1418} {"train_loss": -6.004953384399414, "global_step": 59588, "epoch": 1418} {"train_loss": -5.834018707275391, "global_step": 59589, "epoch": 1418} {"train_loss": -5.8432393074035645, "global_step": 59590, "epoch": 1418} {"train_loss": -5.911894798278809, "global_step": 59591, "epoch": 1418} {"train_loss": -5.985224723815918, "global_step": 59592, "epoch": 1418} {"train_loss": -5.787741661071777, "global_step": 59593, "epoch": 1418} {"train_loss": -5.949290752410889, "global_step": 59594, "epoch": 1418} {"train_loss": -5.879627704620361, "global_step": 59595, "epoch": 1418} {"train_loss": -5.912280082702637, "global_step": 59596, "epoch": 1418} {"train_loss": -5.912245580128261, "global_step": 59597, "epoch": 1418, "val_loss": 61473.0546875} {"train_loss": -5.940001964569092, "global_step": 59598, "epoch": 1419} {"train_loss": -5.8984246253967285, "global_step": 59599, "epoch": 1419} {"train_loss": -5.896754741668701, "global_step": 59600, "epoch": 1419} {"train_loss": -5.9491167068481445, "global_step": 59601, "epoch": 1419} {"train_loss": -5.998784065246582, "global_step": 59602, "epoch": 1419} {"train_loss": -5.938709259033203, "global_step": 59603, "epoch": 1419} {"train_loss": -5.806889533996582, "global_step": 59604, "epoch": 1419} {"train_loss": -5.961153030395508, "global_step": 59605, "epoch": 1419} {"train_loss": -5.815486907958984, "global_step": 59606, "epoch": 1419} {"train_loss": -5.972635746002197, "global_step": 59607, "epoch": 1419} {"train_loss": -5.976700782775879, "global_step": 59608, "epoch": 1419} {"train_loss": -5.960933208465576, "global_step": 59609, "epoch": 1419} {"train_loss": -6.041170597076416, "global_step": 59610, "epoch": 1419} {"train_loss": -6.063053131103516, "global_step": 59611, "epoch": 1419} {"train_loss": -5.918404579162598, "global_step": 59612, "epoch": 1419} {"train_loss": -5.8663177490234375, "global_step": 59613, "epoch": 1419} {"train_loss": -5.8649067878723145, "global_step": 59614, "epoch": 1419} {"train_loss": -5.844954967498779, "global_step": 59615, "epoch": 1419} {"train_loss": -5.879375457763672, "global_step": 59616, "epoch": 1419} {"train_loss": -5.926053047180176, "global_step": 59617, "epoch": 1419} {"train_loss": -5.989294528961182, "global_step": 59618, "epoch": 1419} {"train_loss": -5.8257575035095215, "global_step": 59619, "epoch": 1419} {"train_loss": -5.758933067321777, "global_step": 59620, "epoch": 1419} {"train_loss": -5.991583824157715, "global_step": 59621, "epoch": 1419} {"train_loss": -5.822403907775879, "global_step": 59622, "epoch": 1419} {"train_loss": -5.876303672790527, "global_step": 59623, "epoch": 1419} {"train_loss": -5.881651878356934, "global_step": 59624, "epoch": 1419} {"train_loss": -5.887086868286133, "global_step": 59625, "epoch": 1419} {"train_loss": -5.799493789672852, "global_step": 59626, "epoch": 1419} {"train_loss": -5.9255900382995605, "global_step": 59627, "epoch": 1419} {"train_loss": -5.800817489624023, "global_step": 59628, "epoch": 1419} {"train_loss": -5.980178356170654, "global_step": 59629, "epoch": 1419} {"train_loss": -5.993809700012207, "global_step": 59630, "epoch": 1419} {"train_loss": -5.945717811584473, "global_step": 59631, "epoch": 1419} {"train_loss": -5.932000637054443, "global_step": 59632, "epoch": 1419} {"train_loss": -5.837380409240723, "global_step": 59633, "epoch": 1419} {"train_loss": -6.081634521484375, "global_step": 59634, "epoch": 1419} {"train_loss": -5.980401515960693, "global_step": 59635, "epoch": 1419} {"train_loss": -5.852622985839844, "global_step": 59636, "epoch": 1419} {"train_loss": -5.962773323059082, "global_step": 59637, "epoch": 1419} {"train_loss": -5.828934192657471, "global_step": 59638, "epoch": 1419} {"train_loss": -5.9121476127987815, "global_step": 59639, "epoch": 1419, "val_loss": 61280.9921875} {"train_loss": -5.914749622344971, "global_step": 59640, "epoch": 1420} {"train_loss": -5.835687637329102, "global_step": 59641, "epoch": 1420} {"train_loss": -5.979716777801514, "global_step": 59642, "epoch": 1420} {"train_loss": -5.895263671875, "global_step": 59643, "epoch": 1420} {"train_loss": -6.001683235168457, "global_step": 59644, "epoch": 1420} {"train_loss": -5.903005599975586, "global_step": 59645, "epoch": 1420} {"train_loss": -5.871173858642578, "global_step": 59646, "epoch": 1420} {"train_loss": -5.866085052490234, "global_step": 59647, "epoch": 1420} {"train_loss": -5.947000503540039, "global_step": 59648, "epoch": 1420} {"train_loss": -5.983713150024414, "global_step": 59649, "epoch": 1420} {"train_loss": -6.003771781921387, "global_step": 59650, "epoch": 1420} {"train_loss": -6.024301528930664, "global_step": 59651, "epoch": 1420} {"train_loss": -5.943968772888184, "global_step": 59652, "epoch": 1420} {"train_loss": -5.86726713180542, "global_step": 59653, "epoch": 1420} {"train_loss": -5.932331085205078, "global_step": 59654, "epoch": 1420} {"train_loss": -5.809379577636719, "global_step": 59655, "epoch": 1420} {"train_loss": -5.85984992980957, "global_step": 59656, "epoch": 1420} {"train_loss": -5.9584550857543945, "global_step": 59657, "epoch": 1420} {"train_loss": -5.831080913543701, "global_step": 59658, "epoch": 1420} {"train_loss": -5.873267650604248, "global_step": 59659, "epoch": 1420} {"train_loss": -5.812530040740967, "global_step": 59660, "epoch": 1420} {"train_loss": -5.86857271194458, "global_step": 59661, "epoch": 1420} {"train_loss": -5.786720275878906, "global_step": 59662, "epoch": 1420} {"train_loss": -5.85477352142334, "global_step": 59663, "epoch": 1420} {"train_loss": -5.878161430358887, "global_step": 59664, "epoch": 1420} {"train_loss": -5.773711204528809, "global_step": 59665, "epoch": 1420} {"train_loss": -5.9362945556640625, "global_step": 59666, "epoch": 1420} {"train_loss": -5.98268985748291, "global_step": 59667, "epoch": 1420} {"train_loss": -5.816100120544434, "global_step": 59668, "epoch": 1420} {"train_loss": -5.892693996429443, "global_step": 59669, "epoch": 1420} {"train_loss": -5.867968559265137, "global_step": 59670, "epoch": 1420} {"train_loss": -5.844234466552734, "global_step": 59671, "epoch": 1420} {"train_loss": -5.873181343078613, "global_step": 59672, "epoch": 1420} {"train_loss": -5.7610578536987305, "global_step": 59673, "epoch": 1420} {"train_loss": -5.968569278717041, "global_step": 59674, "epoch": 1420} {"train_loss": -5.943713188171387, "global_step": 59675, "epoch": 1420} {"train_loss": -5.84257698059082, "global_step": 59676, "epoch": 1420} {"train_loss": -6.019441604614258, "global_step": 59677, "epoch": 1420} {"train_loss": -5.97135591506958, "global_step": 59678, "epoch": 1420} {"train_loss": -5.892986297607422, "global_step": 59679, "epoch": 1420} {"train_loss": -5.995238304138184, "global_step": 59680, "epoch": 1420} {"train_loss": -5.899872813905988, "global_step": 59681, "epoch": 1420, "val_loss": 61507.453125} {"train_loss": -5.941511154174805, "global_step": 59682, "epoch": 1421} {"train_loss": -6.037333965301514, "global_step": 59683, "epoch": 1421} {"train_loss": -5.999998092651367, "global_step": 59684, "epoch": 1421} {"train_loss": -5.821910858154297, "global_step": 59685, "epoch": 1421} {"train_loss": -5.882663726806641, "global_step": 59686, "epoch": 1421} {"train_loss": -5.742393493652344, "global_step": 59687, "epoch": 1421} {"train_loss": -5.989500999450684, "global_step": 59688, "epoch": 1421} {"train_loss": -5.833992004394531, "global_step": 59689, "epoch": 1421} {"train_loss": -5.975701332092285, "global_step": 59690, "epoch": 1421} {"train_loss": -5.7301530838012695, "global_step": 59691, "epoch": 1421} {"train_loss": -5.77202033996582, "global_step": 59692, "epoch": 1421} {"train_loss": -5.8413004875183105, "global_step": 59693, "epoch": 1421} {"train_loss": -5.911330699920654, "global_step": 59694, "epoch": 1421} {"train_loss": -5.736188888549805, "global_step": 59695, "epoch": 1421} {"train_loss": -5.838644981384277, "global_step": 59696, "epoch": 1421} {"train_loss": -5.950265407562256, "global_step": 59697, "epoch": 1421} {"train_loss": -5.8486528396606445, "global_step": 59698, "epoch": 1421} {"train_loss": -5.777358055114746, "global_step": 59699, "epoch": 1421} {"train_loss": -5.74727725982666, "global_step": 59700, "epoch": 1421} {"train_loss": -5.910167694091797, "global_step": 59701, "epoch": 1421} {"train_loss": -5.875261306762695, "global_step": 59702, "epoch": 1421} {"train_loss": -5.86076021194458, "global_step": 59703, "epoch": 1421} {"train_loss": -5.79625129699707, "global_step": 59704, "epoch": 1421} {"train_loss": -5.826414108276367, "global_step": 59705, "epoch": 1421} {"train_loss": -5.814767837524414, "global_step": 59706, "epoch": 1421} {"train_loss": -5.9643073081970215, "global_step": 59707, "epoch": 1421} {"train_loss": -5.892455101013184, "global_step": 59708, "epoch": 1421} {"train_loss": -5.948166847229004, "global_step": 59709, "epoch": 1421} {"train_loss": -5.877893447875977, "global_step": 59710, "epoch": 1421} {"train_loss": -5.841104984283447, "global_step": 59711, "epoch": 1421} {"train_loss": -5.963752746582031, "global_step": 59712, "epoch": 1421} {"train_loss": -5.913031578063965, "global_step": 59713, "epoch": 1421} {"train_loss": -5.788537979125977, "global_step": 59714, "epoch": 1421} {"train_loss": -5.838859558105469, "global_step": 59715, "epoch": 1421} {"train_loss": -5.927660942077637, "global_step": 59716, "epoch": 1421} {"train_loss": -5.852845191955566, "global_step": 59717, "epoch": 1421} {"train_loss": -5.931102752685547, "global_step": 59718, "epoch": 1421} {"train_loss": -6.085296630859375, "global_step": 59719, "epoch": 1421} {"train_loss": -5.94538688659668, "global_step": 59720, "epoch": 1421} {"train_loss": -5.937751293182373, "global_step": 59721, "epoch": 1421} {"train_loss": -5.92358922958374, "global_step": 59722, "epoch": 1421} {"train_loss": -5.882834548041934, "global_step": 59723, "epoch": 1421, "val_loss": 61215.0} {"train_loss": -5.968544960021973, "global_step": 59724, "epoch": 1422} {"train_loss": -5.982905387878418, "global_step": 59725, "epoch": 1422} {"train_loss": -5.910152435302734, "global_step": 59726, "epoch": 1422} {"train_loss": -5.878781795501709, "global_step": 59727, "epoch": 1422} {"train_loss": -5.847742080688477, "global_step": 59728, "epoch": 1422} {"train_loss": -5.909793853759766, "global_step": 59729, "epoch": 1422} {"train_loss": -5.923040390014648, "global_step": 59730, "epoch": 1422} {"train_loss": -5.863410949707031, "global_step": 59731, "epoch": 1422} {"train_loss": -5.7676496505737305, "global_step": 59732, "epoch": 1422} {"train_loss": -5.778374195098877, "global_step": 59733, "epoch": 1422} {"train_loss": -5.873384475708008, "global_step": 59734, "epoch": 1422} {"train_loss": -5.720084190368652, "global_step": 59735, "epoch": 1422} {"train_loss": -5.764488697052002, "global_step": 59736, "epoch": 1422} {"train_loss": -5.7213287353515625, "global_step": 59737, "epoch": 1422} {"train_loss": -5.999645233154297, "global_step": 59738, "epoch": 1422} {"train_loss": -5.681824684143066, "global_step": 59739, "epoch": 1422} {"train_loss": -5.87264347076416, "global_step": 59740, "epoch": 1422} {"train_loss": -5.825522422790527, "global_step": 59741, "epoch": 1422} {"train_loss": -5.861855506896973, "global_step": 59742, "epoch": 1422} {"train_loss": -5.755141258239746, "global_step": 59743, "epoch": 1422} {"train_loss": -5.806880950927734, "global_step": 59744, "epoch": 1422} {"train_loss": -5.959338188171387, "global_step": 59745, "epoch": 1422} {"train_loss": -5.818723678588867, "global_step": 59746, "epoch": 1422} {"train_loss": -5.834458351135254, "global_step": 59747, "epoch": 1422} {"train_loss": -5.776866436004639, "global_step": 59748, "epoch": 1422} {"train_loss": -5.946523189544678, "global_step": 59749, "epoch": 1422} {"train_loss": -5.813590049743652, "global_step": 59750, "epoch": 1422} {"train_loss": -5.877457141876221, "global_step": 59751, "epoch": 1422} {"train_loss": -5.884231090545654, "global_step": 59752, "epoch": 1422} {"train_loss": -5.825735569000244, "global_step": 59753, "epoch": 1422} {"train_loss": -5.8642497062683105, "global_step": 59754, "epoch": 1422} {"train_loss": -5.904892921447754, "global_step": 59755, "epoch": 1422} {"train_loss": -5.875950813293457, "global_step": 59756, "epoch": 1422} {"train_loss": -5.829135894775391, "global_step": 59757, "epoch": 1422} {"train_loss": -6.092244625091553, "global_step": 59758, "epoch": 1422} {"train_loss": -5.905482292175293, "global_step": 59759, "epoch": 1422} {"train_loss": -5.921815872192383, "global_step": 59760, "epoch": 1422} {"train_loss": -5.91251802444458, "global_step": 59761, "epoch": 1422} {"train_loss": -5.903757095336914, "global_step": 59762, "epoch": 1422} {"train_loss": -5.979121208190918, "global_step": 59763, "epoch": 1422} {"train_loss": -5.931998252868652, "global_step": 59764, "epoch": 1422} {"train_loss": -5.868668567566645, "global_step": 59765, "epoch": 1422, "val_loss": 61248.7421875} {"train_loss": -5.785901069641113, "global_step": 59766, "epoch": 1423} {"train_loss": -5.942409515380859, "global_step": 59767, "epoch": 1423} {"train_loss": -5.9089555740356445, "global_step": 59768, "epoch": 1423} {"train_loss": -5.822512626647949, "global_step": 59769, "epoch": 1423} {"train_loss": -5.970462322235107, "global_step": 59770, "epoch": 1423} {"train_loss": -5.963876724243164, "global_step": 59771, "epoch": 1423} {"train_loss": -5.8968825340271, "global_step": 59772, "epoch": 1423} {"train_loss": -6.015402793884277, "global_step": 59773, "epoch": 1423} {"train_loss": -5.903684616088867, "global_step": 59774, "epoch": 1423} {"train_loss": -5.909551620483398, "global_step": 59775, "epoch": 1423} {"train_loss": -6.039442539215088, "global_step": 59776, "epoch": 1423} {"train_loss": -6.030965805053711, "global_step": 59777, "epoch": 1423} {"train_loss": -5.851175785064697, "global_step": 59778, "epoch": 1423} {"train_loss": -6.0474853515625, "global_step": 59779, "epoch": 1423} {"train_loss": -5.919006824493408, "global_step": 59780, "epoch": 1423} {"train_loss": -5.8348069190979, "global_step": 59781, "epoch": 1423} {"train_loss": -5.940786361694336, "global_step": 59782, "epoch": 1423} {"train_loss": -5.81120491027832, "global_step": 59783, "epoch": 1423} {"train_loss": -5.818857192993164, "global_step": 59784, "epoch": 1423} {"train_loss": -5.8102312088012695, "global_step": 59785, "epoch": 1423} {"train_loss": -5.861362457275391, "global_step": 59786, "epoch": 1423} {"train_loss": -5.807741165161133, "global_step": 59787, "epoch": 1423} {"train_loss": -6.057940483093262, "global_step": 59788, "epoch": 1423} {"train_loss": -5.863299369812012, "global_step": 59789, "epoch": 1423} {"train_loss": -5.989252090454102, "global_step": 59790, "epoch": 1423} {"train_loss": -5.81447696685791, "global_step": 59791, "epoch": 1423} {"train_loss": -6.015109062194824, "global_step": 59792, "epoch": 1423} {"train_loss": -5.7979631423950195, "global_step": 59793, "epoch": 1423} {"train_loss": -5.991405487060547, "global_step": 59794, "epoch": 1423} {"train_loss": -5.930878639221191, "global_step": 59795, "epoch": 1423} {"train_loss": -5.866701126098633, "global_step": 59796, "epoch": 1423} {"train_loss": -6.034300804138184, "global_step": 59797, "epoch": 1423} {"train_loss": -5.8477783203125, "global_step": 59798, "epoch": 1423} {"train_loss": -5.756608009338379, "global_step": 59799, "epoch": 1423} {"train_loss": -5.9493279457092285, "global_step": 59800, "epoch": 1423} {"train_loss": -5.816798210144043, "global_step": 59801, "epoch": 1423} {"train_loss": -5.916957378387451, "global_step": 59802, "epoch": 1423} {"train_loss": -5.892111301422119, "global_step": 59803, "epoch": 1423} {"train_loss": -5.807649612426758, "global_step": 59804, "epoch": 1423} {"train_loss": -5.992225170135498, "global_step": 59805, "epoch": 1423} {"train_loss": -5.938227653503418, "global_step": 59806, "epoch": 1423} {"train_loss": -5.904223146892729, "global_step": 59807, "epoch": 1423, "val_loss": 61510.46875} {"train_loss": -5.999009609222412, "global_step": 59808, "epoch": 1424} {"train_loss": -5.827323913574219, "global_step": 59809, "epoch": 1424} {"train_loss": -5.923094749450684, "global_step": 59810, "epoch": 1424} {"train_loss": -5.941641330718994, "global_step": 59811, "epoch": 1424} {"train_loss": -5.829250335693359, "global_step": 59812, "epoch": 1424} {"train_loss": -5.902945518493652, "global_step": 59813, "epoch": 1424} {"train_loss": -5.848364353179932, "global_step": 59814, "epoch": 1424} {"train_loss": -5.7953596115112305, "global_step": 59815, "epoch": 1424} {"train_loss": -5.8486504554748535, "global_step": 59816, "epoch": 1424} {"train_loss": -5.865823745727539, "global_step": 59817, "epoch": 1424} {"train_loss": -5.734577178955078, "global_step": 59818, "epoch": 1424} {"train_loss": -5.991005897521973, "global_step": 59819, "epoch": 1424} {"train_loss": -5.608219146728516, "global_step": 59820, "epoch": 1424} {"train_loss": -5.7671966552734375, "global_step": 59821, "epoch": 1424} {"train_loss": -5.780170440673828, "global_step": 59822, "epoch": 1424} {"train_loss": -5.80466365814209, "global_step": 59823, "epoch": 1424} {"train_loss": -5.771137237548828, "global_step": 59824, "epoch": 1424} {"train_loss": -5.740170478820801, "global_step": 59825, "epoch": 1424} {"train_loss": -5.906921863555908, "global_step": 59826, "epoch": 1424} {"train_loss": -5.841463088989258, "global_step": 59827, "epoch": 1424} {"train_loss": -5.949571132659912, "global_step": 59828, "epoch": 1424} {"train_loss": -5.766876220703125, "global_step": 59829, "epoch": 1424} {"train_loss": -5.883583068847656, "global_step": 59830, "epoch": 1424} {"train_loss": -5.7858452796936035, "global_step": 59831, "epoch": 1424} {"train_loss": -5.851001739501953, "global_step": 59832, "epoch": 1424} {"train_loss": -5.853202819824219, "global_step": 59833, "epoch": 1424} {"train_loss": -5.8999528884887695, "global_step": 59834, "epoch": 1424} {"train_loss": -5.9022297859191895, "global_step": 59835, "epoch": 1424} {"train_loss": -5.9612627029418945, "global_step": 59836, "epoch": 1424} {"train_loss": -5.8015289306640625, "global_step": 59837, "epoch": 1424} {"train_loss": -5.881331443786621, "global_step": 59838, "epoch": 1424} {"train_loss": -5.7103986740112305, "global_step": 59839, "epoch": 1424} {"train_loss": -5.771821975708008, "global_step": 59840, "epoch": 1424} {"train_loss": -5.862433433532715, "global_step": 59841, "epoch": 1424} {"train_loss": -5.706060409545898, "global_step": 59842, "epoch": 1424} {"train_loss": -5.86572265625, "global_step": 59843, "epoch": 1424} {"train_loss": -5.837721824645996, "global_step": 59844, "epoch": 1424} {"train_loss": -5.877012252807617, "global_step": 59845, "epoch": 1424} {"train_loss": -5.887673377990723, "global_step": 59846, "epoch": 1424} {"train_loss": -5.808889389038086, "global_step": 59847, "epoch": 1424} {"train_loss": -5.811565399169922, "global_step": 59848, "epoch": 1424} {"train_loss": -5.838772909981864, "global_step": 59849, "epoch": 1424, "val_loss": 61271.0} {"train_loss": -5.934375762939453, "global_step": 59850, "epoch": 1425} {"train_loss": -5.92116641998291, "global_step": 59851, "epoch": 1425} {"train_loss": -5.812737464904785, "global_step": 59852, "epoch": 1425} {"train_loss": -5.898425102233887, "global_step": 59853, "epoch": 1425} {"train_loss": -5.815511226654053, "global_step": 59854, "epoch": 1425} {"train_loss": -5.954227924346924, "global_step": 59855, "epoch": 1425} {"train_loss": -5.982455730438232, "global_step": 59856, "epoch": 1425} {"train_loss": -5.807252883911133, "global_step": 59857, "epoch": 1425} {"train_loss": -5.926120758056641, "global_step": 59858, "epoch": 1425} {"train_loss": -5.817896842956543, "global_step": 59859, "epoch": 1425} {"train_loss": -5.915619850158691, "global_step": 59860, "epoch": 1425} {"train_loss": -5.946592330932617, "global_step": 59861, "epoch": 1425} {"train_loss": -5.942598342895508, "global_step": 59862, "epoch": 1425} {"train_loss": -5.929018974304199, "global_step": 59863, "epoch": 1425} {"train_loss": -5.98177433013916, "global_step": 59864, "epoch": 1425} {"train_loss": -5.9281110763549805, "global_step": 59865, "epoch": 1425} {"train_loss": -6.013613224029541, "global_step": 59866, "epoch": 1425} {"train_loss": -5.843531608581543, "global_step": 59867, "epoch": 1425} {"train_loss": -5.867969989776611, "global_step": 59868, "epoch": 1425} {"train_loss": -5.864506721496582, "global_step": 59869, "epoch": 1425} {"train_loss": -5.9936299324035645, "global_step": 59870, "epoch": 1425} {"train_loss": -5.894994258880615, "global_step": 59871, "epoch": 1425} {"train_loss": -5.9389190673828125, "global_step": 59872, "epoch": 1425} {"train_loss": -5.892242431640625, "global_step": 59873, "epoch": 1425} {"train_loss": -5.927492618560791, "global_step": 59874, "epoch": 1425} {"train_loss": -5.75880241394043, "global_step": 59875, "epoch": 1425} {"train_loss": -5.903026580810547, "global_step": 59876, "epoch": 1425} {"train_loss": -5.862651824951172, "global_step": 59877, "epoch": 1425} {"train_loss": -5.877347946166992, "global_step": 59878, "epoch": 1425} {"train_loss": -5.967568874359131, "global_step": 59879, "epoch": 1425} {"train_loss": -5.873039245605469, "global_step": 59880, "epoch": 1425} {"train_loss": -5.971555709838867, "global_step": 59881, "epoch": 1425} {"train_loss": -5.94041633605957, "global_step": 59882, "epoch": 1425} {"train_loss": -5.819565296173096, "global_step": 59883, "epoch": 1425} {"train_loss": -5.904557228088379, "global_step": 59884, "epoch": 1425} {"train_loss": -5.741908550262451, "global_step": 59885, "epoch": 1425} {"train_loss": -5.895369529724121, "global_step": 59886, "epoch": 1425} {"train_loss": -5.744731903076172, "global_step": 59887, "epoch": 1425} {"train_loss": -5.960358142852783, "global_step": 59888, "epoch": 1425} {"train_loss": -5.900964736938477, "global_step": 59889, "epoch": 1425} {"train_loss": -5.817610740661621, "global_step": 59890, "epoch": 1425} {"train_loss": -5.894107443945749, "global_step": 59891, "epoch": 1425, "val_loss": 61458.59375} {"train_loss": -5.81880521774292, "global_step": 59892, "epoch": 1426} {"train_loss": -6.001872539520264, "global_step": 59893, "epoch": 1426} {"train_loss": -6.04520320892334, "global_step": 59894, "epoch": 1426} {"train_loss": -5.934327602386475, "global_step": 59895, "epoch": 1426} {"train_loss": -5.96718168258667, "global_step": 59896, "epoch": 1426} {"train_loss": -5.942824363708496, "global_step": 59897, "epoch": 1426} {"train_loss": -5.845571517944336, "global_step": 59898, "epoch": 1426} {"train_loss": -5.913656711578369, "global_step": 59899, "epoch": 1426} {"train_loss": -5.829959392547607, "global_step": 59900, "epoch": 1426} {"train_loss": -5.942361831665039, "global_step": 59901, "epoch": 1426} {"train_loss": -5.821342945098877, "global_step": 59902, "epoch": 1426} {"train_loss": -6.021418571472168, "global_step": 59903, "epoch": 1426} {"train_loss": -5.903837203979492, "global_step": 59904, "epoch": 1426} {"train_loss": -5.7766947746276855, "global_step": 59905, "epoch": 1426} {"train_loss": -5.908803939819336, "global_step": 59906, "epoch": 1426} {"train_loss": -5.915582180023193, "global_step": 59907, "epoch": 1426} {"train_loss": -5.877570152282715, "global_step": 59908, "epoch": 1426} {"train_loss": -5.8972320556640625, "global_step": 59909, "epoch": 1426} {"train_loss": -5.919437408447266, "global_step": 59910, "epoch": 1426} {"train_loss": -5.865506649017334, "global_step": 59911, "epoch": 1426} {"train_loss": -5.887829780578613, "global_step": 59912, "epoch": 1426} {"train_loss": -5.878763675689697, "global_step": 59913, "epoch": 1426} {"train_loss": -5.85595703125, "global_step": 59914, "epoch": 1426} {"train_loss": -5.853151321411133, "global_step": 59915, "epoch": 1426} {"train_loss": -5.842994689941406, "global_step": 59916, "epoch": 1426} {"train_loss": -5.9368696212768555, "global_step": 59917, "epoch": 1426} {"train_loss": -6.026552200317383, "global_step": 59918, "epoch": 1426} {"train_loss": -5.925044536590576, "global_step": 59919, "epoch": 1426} {"train_loss": -5.762938499450684, "global_step": 59920, "epoch": 1426} {"train_loss": -5.895935535430908, "global_step": 59921, "epoch": 1426} {"train_loss": -5.960104942321777, "global_step": 59922, "epoch": 1426} {"train_loss": -5.8973870277404785, "global_step": 59923, "epoch": 1426} {"train_loss": -5.943284034729004, "global_step": 59924, "epoch": 1426} {"train_loss": -6.000837326049805, "global_step": 59925, "epoch": 1426} {"train_loss": -5.876863479614258, "global_step": 59926, "epoch": 1426} {"train_loss": -5.878400802612305, "global_step": 59927, "epoch": 1426} {"train_loss": -5.992160797119141, "global_step": 59928, "epoch": 1426} {"train_loss": -6.013236045837402, "global_step": 59929, "epoch": 1426} {"train_loss": -5.854750633239746, "global_step": 59930, "epoch": 1426} {"train_loss": -5.707643985748291, "global_step": 59931, "epoch": 1426} {"train_loss": -6.013213157653809, "global_step": 59932, "epoch": 1426} {"train_loss": -5.90837067649478, "global_step": 59933, "epoch": 1426, "val_loss": 61251.80078125} {"train_loss": -6.001344680786133, "global_step": 59934, "epoch": 1427} {"train_loss": -5.937075614929199, "global_step": 59935, "epoch": 1427} {"train_loss": -5.952391147613525, "global_step": 59936, "epoch": 1427} {"train_loss": -6.039177894592285, "global_step": 59937, "epoch": 1427} {"train_loss": -5.90860652923584, "global_step": 59938, "epoch": 1427} {"train_loss": -6.061054229736328, "global_step": 59939, "epoch": 1427} {"train_loss": -5.969626426696777, "global_step": 59940, "epoch": 1427} {"train_loss": -5.8964924812316895, "global_step": 59941, "epoch": 1427} {"train_loss": -5.961066246032715, "global_step": 59942, "epoch": 1427} {"train_loss": -5.90891170501709, "global_step": 59943, "epoch": 1427} {"train_loss": -5.962984085083008, "global_step": 59944, "epoch": 1427} {"train_loss": -6.057527542114258, "global_step": 59945, "epoch": 1427} {"train_loss": -5.89113712310791, "global_step": 59946, "epoch": 1427} {"train_loss": -5.8416595458984375, "global_step": 59947, "epoch": 1427} {"train_loss": -6.029850006103516, "global_step": 59948, "epoch": 1427} {"train_loss": -5.837852478027344, "global_step": 59949, "epoch": 1427} {"train_loss": -5.811679840087891, "global_step": 59950, "epoch": 1427} {"train_loss": -5.929007530212402, "global_step": 59951, "epoch": 1427} {"train_loss": -5.938210487365723, "global_step": 59952, "epoch": 1427} {"train_loss": -5.838507652282715, "global_step": 59953, "epoch": 1427} {"train_loss": -5.898300647735596, "global_step": 59954, "epoch": 1427} {"train_loss": -5.927249908447266, "global_step": 59955, "epoch": 1427} {"train_loss": -5.93855619430542, "global_step": 59956, "epoch": 1427} {"train_loss": -6.028345584869385, "global_step": 59957, "epoch": 1427} {"train_loss": -5.898402214050293, "global_step": 59958, "epoch": 1427} {"train_loss": -5.825568199157715, "global_step": 59959, "epoch": 1427} {"train_loss": -5.941082954406738, "global_step": 59960, "epoch": 1427} {"train_loss": -5.864935874938965, "global_step": 59961, "epoch": 1427} {"train_loss": -5.99210262298584, "global_step": 59962, "epoch": 1427} {"train_loss": -5.935698509216309, "global_step": 59963, "epoch": 1427} {"train_loss": -5.977939605712891, "global_step": 59964, "epoch": 1427} {"train_loss": -5.9856414794921875, "global_step": 59965, "epoch": 1427} {"train_loss": -5.924708366394043, "global_step": 59966, "epoch": 1427} {"train_loss": -6.047361373901367, "global_step": 59967, "epoch": 1427} {"train_loss": -5.943343162536621, "global_step": 59968, "epoch": 1427} {"train_loss": -5.940425872802734, "global_step": 59969, "epoch": 1427} {"train_loss": -5.824330806732178, "global_step": 59970, "epoch": 1427} {"train_loss": -5.776273727416992, "global_step": 59971, "epoch": 1427} {"train_loss": -5.746461868286133, "global_step": 59972, "epoch": 1427} {"train_loss": -5.945740222930908, "global_step": 59973, "epoch": 1427} {"train_loss": -5.942487716674805, "global_step": 59974, "epoch": 1427} {"train_loss": -5.927801699865432, "global_step": 59975, "epoch": 1427, "val_loss": 61296.4375} {"train_loss": -5.952363014221191, "global_step": 59976, "epoch": 1428} {"train_loss": -5.81475830078125, "global_step": 59977, "epoch": 1428} {"train_loss": -5.996374130249023, "global_step": 59978, "epoch": 1428} {"train_loss": -5.869633674621582, "global_step": 59979, "epoch": 1428} {"train_loss": -5.868959903717041, "global_step": 59980, "epoch": 1428} {"train_loss": -5.879948616027832, "global_step": 59981, "epoch": 1428} {"train_loss": -5.939636707305908, "global_step": 59982, "epoch": 1428} {"train_loss": -5.971956253051758, "global_step": 59983, "epoch": 1428} {"train_loss": -5.929656505584717, "global_step": 59984, "epoch": 1428} {"train_loss": -5.9106059074401855, "global_step": 59985, "epoch": 1428} {"train_loss": -5.834679126739502, "global_step": 59986, "epoch": 1428} {"train_loss": -5.772517204284668, "global_step": 59987, "epoch": 1428} {"train_loss": -5.939821720123291, "global_step": 59988, "epoch": 1428} {"train_loss": -5.826781272888184, "global_step": 59989, "epoch": 1428} {"train_loss": -5.897487163543701, "global_step": 59990, "epoch": 1428} {"train_loss": -5.803215026855469, "global_step": 59991, "epoch": 1428} {"train_loss": -5.85037899017334, "global_step": 59992, "epoch": 1428} {"train_loss": -5.944817543029785, "global_step": 59993, "epoch": 1428} {"train_loss": -5.852419376373291, "global_step": 59994, "epoch": 1428} {"train_loss": -5.895562648773193, "global_step": 59995, "epoch": 1428} {"train_loss": -5.827811241149902, "global_step": 59996, "epoch": 1428} {"train_loss": -5.9365034103393555, "global_step": 59997, "epoch": 1428} {"train_loss": -5.9194536209106445, "global_step": 59998, "epoch": 1428} {"train_loss": -5.930129051208496, "global_step": 59999, "epoch": 1428} {"train_loss": -5.980881214141846, "global_step": 60000, "epoch": 1428} {"train_loss": -5.91904354095459, "global_step": 60001, "epoch": 1428} {"train_loss": -5.94297981262207, "global_step": 60002, "epoch": 1428} {"train_loss": -5.834955215454102, "global_step": 60003, "epoch": 1428} {"train_loss": -5.92490291595459, "global_step": 60004, "epoch": 1428} {"train_loss": -5.921739101409912, "global_step": 60005, "epoch": 1428} {"train_loss": -5.902108192443848, "global_step": 60006, "epoch": 1428} {"train_loss": -5.9323859214782715, "global_step": 60007, "epoch": 1428} {"train_loss": -5.938096523284912, "global_step": 60008, "epoch": 1428} {"train_loss": -6.027121067047119, "global_step": 60009, "epoch": 1428} {"train_loss": -6.019004821777344, "global_step": 60010, "epoch": 1428} {"train_loss": -5.962331771850586, "global_step": 60011, "epoch": 1428} {"train_loss": -5.967232704162598, "global_step": 60012, "epoch": 1428} {"train_loss": -5.934662818908691, "global_step": 60013, "epoch": 1428} {"train_loss": -5.9168901443481445, "global_step": 60014, "epoch": 1428} {"train_loss": -5.830039024353027, "global_step": 60015, "epoch": 1428} {"train_loss": -5.967525005340576, "global_step": 60016, "epoch": 1428} {"train_loss": -5.910132555734544, "global_step": 60017, "epoch": 1428, "val_loss": 61291.68359375} {"train_loss": -5.981400012969971, "global_step": 60018, "epoch": 1429} {"train_loss": -5.9383039474487305, "global_step": 60019, "epoch": 1429} {"train_loss": -5.9487996101379395, "global_step": 60020, "epoch": 1429} {"train_loss": -5.951355934143066, "global_step": 60021, "epoch": 1429} {"train_loss": -6.008378505706787, "global_step": 60022, "epoch": 1429} {"train_loss": -5.988153457641602, "global_step": 60023, "epoch": 1429} {"train_loss": -5.884320259094238, "global_step": 60024, "epoch": 1429} {"train_loss": -5.949073314666748, "global_step": 60025, "epoch": 1429} {"train_loss": -5.886330604553223, "global_step": 60026, "epoch": 1429} {"train_loss": -5.9520721435546875, "global_step": 60027, "epoch": 1429} {"train_loss": -5.875096321105957, "global_step": 60028, "epoch": 1429} {"train_loss": -6.0320281982421875, "global_step": 60029, "epoch": 1429} {"train_loss": -5.972442150115967, "global_step": 60030, "epoch": 1429} {"train_loss": -5.812395095825195, "global_step": 60031, "epoch": 1429} {"train_loss": -6.0019659996032715, "global_step": 60032, "epoch": 1429} {"train_loss": -5.915513038635254, "global_step": 60033, "epoch": 1429} {"train_loss": -5.782960891723633, "global_step": 60034, "epoch": 1429} {"train_loss": -5.785020351409912, "global_step": 60035, "epoch": 1429} {"train_loss": -5.894068717956543, "global_step": 60036, "epoch": 1429} {"train_loss": -5.956852912902832, "global_step": 60037, "epoch": 1429} {"train_loss": -5.953839302062988, "global_step": 60038, "epoch": 1429} {"train_loss": -5.865119457244873, "global_step": 60039, "epoch": 1429} {"train_loss": -5.892822265625, "global_step": 60040, "epoch": 1429} {"train_loss": -5.95828104019165, "global_step": 60041, "epoch": 1429} {"train_loss": -5.920319557189941, "global_step": 60042, "epoch": 1429} {"train_loss": -5.944252014160156, "global_step": 60043, "epoch": 1429} {"train_loss": -5.893636703491211, "global_step": 60044, "epoch": 1429} {"train_loss": -5.870415210723877, "global_step": 60045, "epoch": 1429} {"train_loss": -5.8336286544799805, "global_step": 60046, "epoch": 1429} {"train_loss": -5.882259845733643, "global_step": 60047, "epoch": 1429} {"train_loss": -5.872200012207031, "global_step": 60048, "epoch": 1429} {"train_loss": -5.969094276428223, "global_step": 60049, "epoch": 1429} {"train_loss": -5.798773765563965, "global_step": 60050, "epoch": 1429} {"train_loss": -5.835192680358887, "global_step": 60051, "epoch": 1429} {"train_loss": -6.012778282165527, "global_step": 60052, "epoch": 1429} {"train_loss": -5.965947151184082, "global_step": 60053, "epoch": 1429} {"train_loss": -5.815482139587402, "global_step": 60054, "epoch": 1429} {"train_loss": -5.85161018371582, "global_step": 60055, "epoch": 1429} {"train_loss": -5.829407691955566, "global_step": 60056, "epoch": 1429} {"train_loss": -5.840251922607422, "global_step": 60057, "epoch": 1429} {"train_loss": -5.914587497711182, "global_step": 60058, "epoch": 1429} {"train_loss": -5.908103284381685, "global_step": 60059, "epoch": 1429, "val_loss": 61237.67578125} {"train_loss": -5.805043697357178, "global_step": 60060, "epoch": 1430} {"train_loss": -5.846522331237793, "global_step": 60061, "epoch": 1430} {"train_loss": -5.807476043701172, "global_step": 60062, "epoch": 1430} {"train_loss": -5.925185680389404, "global_step": 60063, "epoch": 1430} {"train_loss": -5.828841209411621, "global_step": 60064, "epoch": 1430} {"train_loss": -6.01876163482666, "global_step": 60065, "epoch": 1430} {"train_loss": -5.76180362701416, "global_step": 60066, "epoch": 1430} {"train_loss": -5.801032066345215, "global_step": 60067, "epoch": 1430} {"train_loss": -5.858124732971191, "global_step": 60068, "epoch": 1430} {"train_loss": -5.847879409790039, "global_step": 60069, "epoch": 1430} {"train_loss": -5.908689498901367, "global_step": 60070, "epoch": 1430} {"train_loss": -5.756040573120117, "global_step": 60071, "epoch": 1430} {"train_loss": -5.940864562988281, "global_step": 60072, "epoch": 1430} {"train_loss": -5.900237083435059, "global_step": 60073, "epoch": 1430} {"train_loss": -5.952435493469238, "global_step": 60074, "epoch": 1430} {"train_loss": -6.017585754394531, "global_step": 60075, "epoch": 1430} {"train_loss": -5.944933891296387, "global_step": 60076, "epoch": 1430} {"train_loss": -5.933724880218506, "global_step": 60077, "epoch": 1430} {"train_loss": -5.92282772064209, "global_step": 60078, "epoch": 1430} {"train_loss": -5.843562602996826, "global_step": 60079, "epoch": 1430} {"train_loss": -5.9730987548828125, "global_step": 60080, "epoch": 1430} {"train_loss": -5.84047794342041, "global_step": 60081, "epoch": 1430} {"train_loss": -5.915399074554443, "global_step": 60082, "epoch": 1430} {"train_loss": -6.008233547210693, "global_step": 60083, "epoch": 1430} {"train_loss": -5.892430782318115, "global_step": 60084, "epoch": 1430} {"train_loss": -6.0341644287109375, "global_step": 60085, "epoch": 1430} {"train_loss": -5.903242111206055, "global_step": 60086, "epoch": 1430} {"train_loss": -5.952114582061768, "global_step": 60087, "epoch": 1430} {"train_loss": -5.919355869293213, "global_step": 60088, "epoch": 1430} {"train_loss": -5.9966840744018555, "global_step": 60089, "epoch": 1430} {"train_loss": -5.9918060302734375, "global_step": 60090, "epoch": 1430} {"train_loss": -5.861733913421631, "global_step": 60091, "epoch": 1430} {"train_loss": -5.911627769470215, "global_step": 60092, "epoch": 1430} {"train_loss": -5.926419258117676, "global_step": 60093, "epoch": 1430} {"train_loss": -5.8956732749938965, "global_step": 60094, "epoch": 1430} {"train_loss": -5.951315879821777, "global_step": 60095, "epoch": 1430} {"train_loss": -5.819170951843262, "global_step": 60096, "epoch": 1430} {"train_loss": -5.916218280792236, "global_step": 60097, "epoch": 1430} {"train_loss": -5.888158798217773, "global_step": 60098, "epoch": 1430} {"train_loss": -5.921849250793457, "global_step": 60099, "epoch": 1430} {"train_loss": -5.972726821899414, "global_step": 60100, "epoch": 1430} {"train_loss": -5.905389115923927, "global_step": 60101, "epoch": 1430, "val_loss": 61687.9453125} {"train_loss": -5.865265369415283, "global_step": 60102, "epoch": 1431} {"train_loss": -5.820334434509277, "global_step": 60103, "epoch": 1431} {"train_loss": -5.881377220153809, "global_step": 60104, "epoch": 1431} {"train_loss": -5.816662788391113, "global_step": 60105, "epoch": 1431} {"train_loss": -6.017589569091797, "global_step": 60106, "epoch": 1431} {"train_loss": -5.88667631149292, "global_step": 60107, "epoch": 1431} {"train_loss": -5.810467720031738, "global_step": 60108, "epoch": 1431} {"train_loss": -6.032977104187012, "global_step": 60109, "epoch": 1431} {"train_loss": -5.9232072830200195, "global_step": 60110, "epoch": 1431} {"train_loss": -5.940436363220215, "global_step": 60111, "epoch": 1431} {"train_loss": -5.826933860778809, "global_step": 60112, "epoch": 1431} {"train_loss": -5.9402360916137695, "global_step": 60113, "epoch": 1431} {"train_loss": -5.829376220703125, "global_step": 60114, "epoch": 1431} {"train_loss": -5.813399791717529, "global_step": 60115, "epoch": 1431} {"train_loss": -5.955446243286133, "global_step": 60116, "epoch": 1431} {"train_loss": -5.7000837326049805, "global_step": 60117, "epoch": 1431} {"train_loss": -5.924837112426758, "global_step": 60118, "epoch": 1431} {"train_loss": -5.875326156616211, "global_step": 60119, "epoch": 1431} {"train_loss": -5.721613883972168, "global_step": 60120, "epoch": 1431} {"train_loss": -5.80991268157959, "global_step": 60121, "epoch": 1431} {"train_loss": -5.8919830322265625, "global_step": 60122, "epoch": 1431} {"train_loss": -5.851079940795898, "global_step": 60123, "epoch": 1431} {"train_loss": -5.915740966796875, "global_step": 60124, "epoch": 1431} {"train_loss": -5.786478042602539, "global_step": 60125, "epoch": 1431} {"train_loss": -5.868043422698975, "global_step": 60126, "epoch": 1431} {"train_loss": -5.840500831604004, "global_step": 60127, "epoch": 1431} {"train_loss": -6.034816265106201, "global_step": 60128, "epoch": 1431} {"train_loss": -5.845964431762695, "global_step": 60129, "epoch": 1431} {"train_loss": -5.954383850097656, "global_step": 60130, "epoch": 1431} {"train_loss": -5.85403299331665, "global_step": 60131, "epoch": 1431} {"train_loss": -5.934638977050781, "global_step": 60132, "epoch": 1431} {"train_loss": -5.874688625335693, "global_step": 60133, "epoch": 1431} {"train_loss": -5.946515083312988, "global_step": 60134, "epoch": 1431} {"train_loss": -5.9844465255737305, "global_step": 60135, "epoch": 1431} {"train_loss": -5.995386123657227, "global_step": 60136, "epoch": 1431} {"train_loss": -5.923884391784668, "global_step": 60137, "epoch": 1431} {"train_loss": -6.003477096557617, "global_step": 60138, "epoch": 1431} {"train_loss": -5.9612555503845215, "global_step": 60139, "epoch": 1431} {"train_loss": -5.9227423667907715, "global_step": 60140, "epoch": 1431} {"train_loss": -5.828921794891357, "global_step": 60141, "epoch": 1431} {"train_loss": -5.930371284484863, "global_step": 60142, "epoch": 1431} {"train_loss": -5.891649041857038, "global_step": 60143, "epoch": 1431, "val_loss": 61357.19921875} {"train_loss": -5.9026336669921875, "global_step": 60144, "epoch": 1432} {"train_loss": -5.9616804122924805, "global_step": 60145, "epoch": 1432} {"train_loss": -5.926084041595459, "global_step": 60146, "epoch": 1432} {"train_loss": -6.006584167480469, "global_step": 60147, "epoch": 1432} {"train_loss": -5.83165979385376, "global_step": 60148, "epoch": 1432} {"train_loss": -5.964627265930176, "global_step": 60149, "epoch": 1432} {"train_loss": -5.944199085235596, "global_step": 60150, "epoch": 1432} {"train_loss": -5.964949131011963, "global_step": 60151, "epoch": 1432} {"train_loss": -5.899860382080078, "global_step": 60152, "epoch": 1432} {"train_loss": -5.89363956451416, "global_step": 60153, "epoch": 1432} {"train_loss": -5.900845527648926, "global_step": 60154, "epoch": 1432} {"train_loss": -5.922876358032227, "global_step": 60155, "epoch": 1432} {"train_loss": -5.914747714996338, "global_step": 60156, "epoch": 1432} {"train_loss": -5.800904750823975, "global_step": 60157, "epoch": 1432} {"train_loss": -5.876860618591309, "global_step": 60158, "epoch": 1432} {"train_loss": -5.95228385925293, "global_step": 60159, "epoch": 1432} {"train_loss": -6.021459579467773, "global_step": 60160, "epoch": 1432} {"train_loss": -5.817320823669434, "global_step": 60161, "epoch": 1432} {"train_loss": -5.897751331329346, "global_step": 60162, "epoch": 1432} {"train_loss": -5.883955001831055, "global_step": 60163, "epoch": 1432} {"train_loss": -5.812997341156006, "global_step": 60164, "epoch": 1432} {"train_loss": -5.944809913635254, "global_step": 60165, "epoch": 1432} {"train_loss": -5.905259132385254, "global_step": 60166, "epoch": 1432} {"train_loss": -5.849714279174805, "global_step": 60167, "epoch": 1432} {"train_loss": -5.940803527832031, "global_step": 60168, "epoch": 1432} {"train_loss": -5.970226764678955, "global_step": 60169, "epoch": 1432} {"train_loss": -5.987436294555664, "global_step": 60170, "epoch": 1432} {"train_loss": -5.852649688720703, "global_step": 60171, "epoch": 1432} {"train_loss": -5.85455322265625, "global_step": 60172, "epoch": 1432} {"train_loss": -5.857165336608887, "global_step": 60173, "epoch": 1432} {"train_loss": -5.871870040893555, "global_step": 60174, "epoch": 1432} {"train_loss": -5.980507850646973, "global_step": 60175, "epoch": 1432} {"train_loss": -5.925638198852539, "global_step": 60176, "epoch": 1432} {"train_loss": -5.822549819946289, "global_step": 60177, "epoch": 1432} {"train_loss": -5.939111709594727, "global_step": 60178, "epoch": 1432} {"train_loss": -5.89642333984375, "global_step": 60179, "epoch": 1432} {"train_loss": -5.890802383422852, "global_step": 60180, "epoch": 1432} {"train_loss": -5.898679733276367, "global_step": 60181, "epoch": 1432} {"train_loss": -5.8608503341674805, "global_step": 60182, "epoch": 1432} {"train_loss": -5.8455586433410645, "global_step": 60183, "epoch": 1432} {"train_loss": -5.969523906707764, "global_step": 60184, "epoch": 1432} {"train_loss": -5.905090104965937, "global_step": 60185, "epoch": 1432, "val_loss": 61713.9921875} {"train_loss": -5.898622512817383, "global_step": 60186, "epoch": 1433} {"train_loss": -5.900284290313721, "global_step": 60187, "epoch": 1433} {"train_loss": -5.854640960693359, "global_step": 60188, "epoch": 1433} {"train_loss": -5.93856954574585, "global_step": 60189, "epoch": 1433} {"train_loss": -5.990145683288574, "global_step": 60190, "epoch": 1433} {"train_loss": -5.932247638702393, "global_step": 60191, "epoch": 1433} {"train_loss": -5.8468170166015625, "global_step": 60192, "epoch": 1433} {"train_loss": -5.9759111404418945, "global_step": 60193, "epoch": 1433} {"train_loss": -5.921289920806885, "global_step": 60194, "epoch": 1433} {"train_loss": -5.771535873413086, "global_step": 60195, "epoch": 1433} {"train_loss": -5.752488136291504, "global_step": 60196, "epoch": 1433} {"train_loss": -5.919574737548828, "global_step": 60197, "epoch": 1433} {"train_loss": -5.986236572265625, "global_step": 60198, "epoch": 1433} {"train_loss": -5.737588405609131, "global_step": 60199, "epoch": 1433} {"train_loss": -5.883254528045654, "global_step": 60200, "epoch": 1433} {"train_loss": -5.97361946105957, "global_step": 60201, "epoch": 1433} {"train_loss": -5.90318489074707, "global_step": 60202, "epoch": 1433} {"train_loss": -5.925955772399902, "global_step": 60203, "epoch": 1433} {"train_loss": -5.8592329025268555, "global_step": 60204, "epoch": 1433} {"train_loss": -5.756702423095703, "global_step": 60205, "epoch": 1433} {"train_loss": -5.912219047546387, "global_step": 60206, "epoch": 1433} {"train_loss": -5.8418474197387695, "global_step": 60207, "epoch": 1433} {"train_loss": -5.849987983703613, "global_step": 60208, "epoch": 1433} {"train_loss": -5.780456066131592, "global_step": 60209, "epoch": 1433} {"train_loss": -5.887941837310791, "global_step": 60210, "epoch": 1433} {"train_loss": -5.76603889465332, "global_step": 60211, "epoch": 1433} {"train_loss": -5.904965877532959, "global_step": 60212, "epoch": 1433} {"train_loss": -5.8224897384643555, "global_step": 60213, "epoch": 1433} {"train_loss": -6.034605979919434, "global_step": 60214, "epoch": 1433} {"train_loss": -5.998493671417236, "global_step": 60215, "epoch": 1433} {"train_loss": -6.004454612731934, "global_step": 60216, "epoch": 1433} {"train_loss": -5.829596519470215, "global_step": 60217, "epoch": 1433} {"train_loss": -5.853601932525635, "global_step": 60218, "epoch": 1433} {"train_loss": -5.758506774902344, "global_step": 60219, "epoch": 1433} {"train_loss": -5.922873497009277, "global_step": 60220, "epoch": 1433} {"train_loss": -5.894376277923584, "global_step": 60221, "epoch": 1433} {"train_loss": -5.802581310272217, "global_step": 60222, "epoch": 1433} {"train_loss": -5.9802165031433105, "global_step": 60223, "epoch": 1433} {"train_loss": -5.904401779174805, "global_step": 60224, "epoch": 1433} {"train_loss": -5.855381488800049, "global_step": 60225, "epoch": 1433} {"train_loss": -6.029872417449951, "global_step": 60226, "epoch": 1433} {"train_loss": -5.884310449872698, "global_step": 60227, "epoch": 1433, "val_loss": 61419.3125} {"train_loss": -5.939040184020996, "global_step": 60228, "epoch": 1434} {"train_loss": -5.86536169052124, "global_step": 60229, "epoch": 1434} {"train_loss": -5.826208114624023, "global_step": 60230, "epoch": 1434} {"train_loss": -6.006476879119873, "global_step": 60231, "epoch": 1434} {"train_loss": -5.849207878112793, "global_step": 60232, "epoch": 1434} {"train_loss": -5.852582931518555, "global_step": 60233, "epoch": 1434} {"train_loss": -5.939032554626465, "global_step": 60234, "epoch": 1434} {"train_loss": -5.819283485412598, "global_step": 60235, "epoch": 1434} {"train_loss": -5.947421073913574, "global_step": 60236, "epoch": 1434} {"train_loss": -5.866977691650391, "global_step": 60237, "epoch": 1434} {"train_loss": -5.959436416625977, "global_step": 60238, "epoch": 1434} {"train_loss": -5.827965259552002, "global_step": 60239, "epoch": 1434} {"train_loss": -5.894384384155273, "global_step": 60240, "epoch": 1434} {"train_loss": -5.891219615936279, "global_step": 60241, "epoch": 1434} {"train_loss": -5.977785110473633, "global_step": 60242, "epoch": 1434} {"train_loss": -5.871983528137207, "global_step": 60243, "epoch": 1434} {"train_loss": -5.93657922744751, "global_step": 60244, "epoch": 1434} {"train_loss": -6.009705066680908, "global_step": 60245, "epoch": 1434} {"train_loss": -5.864141941070557, "global_step": 60246, "epoch": 1434} {"train_loss": -5.940003395080566, "global_step": 60247, "epoch": 1434} {"train_loss": -5.900724411010742, "global_step": 60248, "epoch": 1434} {"train_loss": -5.944733142852783, "global_step": 60249, "epoch": 1434} {"train_loss": -6.014534950256348, "global_step": 60250, "epoch": 1434} {"train_loss": -5.84107780456543, "global_step": 60251, "epoch": 1434} {"train_loss": -5.974308967590332, "global_step": 60252, "epoch": 1434} {"train_loss": -6.000856399536133, "global_step": 60253, "epoch": 1434} {"train_loss": -5.914132118225098, "global_step": 60254, "epoch": 1434} {"train_loss": -5.949213027954102, "global_step": 60255, "epoch": 1434} {"train_loss": -5.882774353027344, "global_step": 60256, "epoch": 1434} {"train_loss": -5.938602924346924, "global_step": 60257, "epoch": 1434} {"train_loss": -5.994270324707031, "global_step": 60258, "epoch": 1434} {"train_loss": -6.040021896362305, "global_step": 60259, "epoch": 1434} {"train_loss": -5.793052673339844, "global_step": 60260, "epoch": 1434} {"train_loss": -5.933344841003418, "global_step": 60261, "epoch": 1434} {"train_loss": -5.884347438812256, "global_step": 60262, "epoch": 1434} {"train_loss": -5.867702484130859, "global_step": 60263, "epoch": 1434} {"train_loss": -6.012085437774658, "global_step": 60264, "epoch": 1434} {"train_loss": -5.9769792556762695, "global_step": 60265, "epoch": 1434} {"train_loss": -6.014337539672852, "global_step": 60266, "epoch": 1434} {"train_loss": -5.8111371994018555, "global_step": 60267, "epoch": 1434} {"train_loss": -5.970174789428711, "global_step": 60268, "epoch": 1434} {"train_loss": -5.923430431456793, "global_step": 60269, "epoch": 1434, "val_loss": 61294.19921875} {"train_loss": -5.939039707183838, "global_step": 60270, "epoch": 1435} {"train_loss": -6.078639030456543, "global_step": 60271, "epoch": 1435} {"train_loss": -5.935872554779053, "global_step": 60272, "epoch": 1435} {"train_loss": -6.007662296295166, "global_step": 60273, "epoch": 1435} {"train_loss": -5.8650712966918945, "global_step": 60274, "epoch": 1435} {"train_loss": -5.935643196105957, "global_step": 60275, "epoch": 1435} {"train_loss": -5.884356498718262, "global_step": 60276, "epoch": 1435} {"train_loss": -5.859664440155029, "global_step": 60277, "epoch": 1435} {"train_loss": -5.947301864624023, "global_step": 60278, "epoch": 1435} {"train_loss": -5.997535705566406, "global_step": 60279, "epoch": 1435} {"train_loss": -5.824895858764648, "global_step": 60280, "epoch": 1435} {"train_loss": -5.921195030212402, "global_step": 60281, "epoch": 1435} {"train_loss": -6.004021644592285, "global_step": 60282, "epoch": 1435} {"train_loss": -5.927133560180664, "global_step": 60283, "epoch": 1435} {"train_loss": -5.908920764923096, "global_step": 60284, "epoch": 1435} {"train_loss": -5.8983540534973145, "global_step": 60285, "epoch": 1435} {"train_loss": -5.96322774887085, "global_step": 60286, "epoch": 1435} {"train_loss": -5.876600742340088, "global_step": 60287, "epoch": 1435} {"train_loss": -5.866198539733887, "global_step": 60288, "epoch": 1435} {"train_loss": -5.910333156585693, "global_step": 60289, "epoch": 1435} {"train_loss": -5.85348653793335, "global_step": 60290, "epoch": 1435} {"train_loss": -5.980380058288574, "global_step": 60291, "epoch": 1435} {"train_loss": -5.903125762939453, "global_step": 60292, "epoch": 1435} {"train_loss": -5.93803596496582, "global_step": 60293, "epoch": 1435} {"train_loss": -5.942383766174316, "global_step": 60294, "epoch": 1435} {"train_loss": -5.880885124206543, "global_step": 60295, "epoch": 1435} {"train_loss": -5.874634742736816, "global_step": 60296, "epoch": 1435} {"train_loss": -5.892404556274414, "global_step": 60297, "epoch": 1435} {"train_loss": -6.042238712310791, "global_step": 60298, "epoch": 1435} {"train_loss": -5.80856466293335, "global_step": 60299, "epoch": 1435} {"train_loss": -5.868098735809326, "global_step": 60300, "epoch": 1435} {"train_loss": -5.876105308532715, "global_step": 60301, "epoch": 1435} {"train_loss": -5.892884254455566, "global_step": 60302, "epoch": 1435} {"train_loss": -5.8941545486450195, "global_step": 60303, "epoch": 1435} {"train_loss": -5.818010330200195, "global_step": 60304, "epoch": 1435} {"train_loss": -5.821709632873535, "global_step": 60305, "epoch": 1435} {"train_loss": -5.872357368469238, "global_step": 60306, "epoch": 1435} {"train_loss": -5.759258270263672, "global_step": 60307, "epoch": 1435} {"train_loss": -5.860004901885986, "global_step": 60308, "epoch": 1435} {"train_loss": -5.908906936645508, "global_step": 60309, "epoch": 1435} {"train_loss": -5.9475178718566895, "global_step": 60310, "epoch": 1435} {"train_loss": -5.903754688444591, "global_step": 60311, "epoch": 1435, "val_loss": 61316.65234375} {"train_loss": -5.941103935241699, "global_step": 60312, "epoch": 1436} {"train_loss": -5.967364311218262, "global_step": 60313, "epoch": 1436} {"train_loss": -5.825411319732666, "global_step": 60314, "epoch": 1436} {"train_loss": -5.947258949279785, "global_step": 60315, "epoch": 1436} {"train_loss": -5.754737377166748, "global_step": 60316, "epoch": 1436} {"train_loss": -5.94002628326416, "global_step": 60317, "epoch": 1436} {"train_loss": -5.990776538848877, "global_step": 60318, "epoch": 1436} {"train_loss": -5.894904136657715, "global_step": 60319, "epoch": 1436} {"train_loss": -5.880587100982666, "global_step": 60320, "epoch": 1436} {"train_loss": -6.053927421569824, "global_step": 60321, "epoch": 1436} {"train_loss": -5.855620384216309, "global_step": 60322, "epoch": 1436} {"train_loss": -5.973995685577393, "global_step": 60323, "epoch": 1436} {"train_loss": -5.981975078582764, "global_step": 60324, "epoch": 1436} {"train_loss": -5.9221415519714355, "global_step": 60325, "epoch": 1436} {"train_loss": -5.854990005493164, "global_step": 60326, "epoch": 1436} {"train_loss": -6.033236026763916, "global_step": 60327, "epoch": 1436} {"train_loss": -6.002375602722168, "global_step": 60328, "epoch": 1436} {"train_loss": -6.018362045288086, "global_step": 60329, "epoch": 1436} {"train_loss": -5.859724044799805, "global_step": 60330, "epoch": 1436} {"train_loss": -5.884120941162109, "global_step": 60331, "epoch": 1436} {"train_loss": -6.007380485534668, "global_step": 60332, "epoch": 1436} {"train_loss": -5.891744136810303, "global_step": 60333, "epoch": 1436} {"train_loss": -5.913544654846191, "global_step": 60334, "epoch": 1436} {"train_loss": -5.880832672119141, "global_step": 60335, "epoch": 1436} {"train_loss": -5.809370994567871, "global_step": 60336, "epoch": 1436} {"train_loss": -5.942670822143555, "global_step": 60337, "epoch": 1436} {"train_loss": -5.943262100219727, "global_step": 60338, "epoch": 1436} {"train_loss": -5.848745822906494, "global_step": 60339, "epoch": 1436} {"train_loss": -5.893887519836426, "global_step": 60340, "epoch": 1436} {"train_loss": -5.790887355804443, "global_step": 60341, "epoch": 1436} {"train_loss": -5.886621475219727, "global_step": 60342, "epoch": 1436} {"train_loss": -5.960535049438477, "global_step": 60343, "epoch": 1436} {"train_loss": -5.799648284912109, "global_step": 60344, "epoch": 1436} {"train_loss": -5.949626922607422, "global_step": 60345, "epoch": 1436} {"train_loss": -5.828101634979248, "global_step": 60346, "epoch": 1436} {"train_loss": -5.82696533203125, "global_step": 60347, "epoch": 1436} {"train_loss": -5.901270866394043, "global_step": 60348, "epoch": 1436} {"train_loss": -5.908091068267822, "global_step": 60349, "epoch": 1436} {"train_loss": -5.726370334625244, "global_step": 60350, "epoch": 1436} {"train_loss": -6.023828506469727, "global_step": 60351, "epoch": 1436} {"train_loss": -5.81959867477417, "global_step": 60352, "epoch": 1436} {"train_loss": -5.904886586325509, "global_step": 60353, "epoch": 1436, "val_loss": 61415.75390625} {"train_loss": -5.905270099639893, "global_step": 60354, "epoch": 1437} {"train_loss": -5.910262584686279, "global_step": 60355, "epoch": 1437} {"train_loss": -5.899003028869629, "global_step": 60356, "epoch": 1437} {"train_loss": -5.935371398925781, "global_step": 60357, "epoch": 1437} {"train_loss": -5.960573673248291, "global_step": 60358, "epoch": 1437} {"train_loss": -5.856507301330566, "global_step": 60359, "epoch": 1437} {"train_loss": -5.8144073486328125, "global_step": 60360, "epoch": 1437} {"train_loss": -5.954089164733887, "global_step": 60361, "epoch": 1437} {"train_loss": -5.793552398681641, "global_step": 60362, "epoch": 1437} {"train_loss": -5.984959125518799, "global_step": 60363, "epoch": 1437} {"train_loss": -5.95058012008667, "global_step": 60364, "epoch": 1437} {"train_loss": -5.90836238861084, "global_step": 60365, "epoch": 1437} {"train_loss": -5.919118404388428, "global_step": 60366, "epoch": 1437} {"train_loss": -5.961273193359375, "global_step": 60367, "epoch": 1437} {"train_loss": -5.9603471755981445, "global_step": 60368, "epoch": 1437} {"train_loss": -5.879555702209473, "global_step": 60369, "epoch": 1437} {"train_loss": -5.949897766113281, "global_step": 60370, "epoch": 1437} {"train_loss": -6.009127616882324, "global_step": 60371, "epoch": 1437} {"train_loss": -5.787873268127441, "global_step": 60372, "epoch": 1437} {"train_loss": -5.994163990020752, "global_step": 60373, "epoch": 1437} {"train_loss": -5.952896595001221, "global_step": 60374, "epoch": 1437} {"train_loss": -5.937348365783691, "global_step": 60375, "epoch": 1437} {"train_loss": -6.006957054138184, "global_step": 60376, "epoch": 1437} {"train_loss": -5.970921516418457, "global_step": 60377, "epoch": 1437} {"train_loss": -5.970787048339844, "global_step": 60378, "epoch": 1437} {"train_loss": -5.876996040344238, "global_step": 60379, "epoch": 1437} {"train_loss": -5.9035420417785645, "global_step": 60380, "epoch": 1437} {"train_loss": -5.885370254516602, "global_step": 60381, "epoch": 1437} {"train_loss": -5.872331619262695, "global_step": 60382, "epoch": 1437} {"train_loss": -5.9747700691223145, "global_step": 60383, "epoch": 1437} {"train_loss": -6.025115489959717, "global_step": 60384, "epoch": 1437} {"train_loss": -6.030322551727295, "global_step": 60385, "epoch": 1437} {"train_loss": -5.846109390258789, "global_step": 60386, "epoch": 1437} {"train_loss": -5.98759651184082, "global_step": 60387, "epoch": 1437} {"train_loss": -5.896861553192139, "global_step": 60388, "epoch": 1437} {"train_loss": -5.837061882019043, "global_step": 60389, "epoch": 1437} {"train_loss": -5.908455848693848, "global_step": 60390, "epoch": 1437} {"train_loss": -5.813211441040039, "global_step": 60391, "epoch": 1437} {"train_loss": -5.774529457092285, "global_step": 60392, "epoch": 1437} {"train_loss": -6.008114814758301, "global_step": 60393, "epoch": 1437} {"train_loss": -5.953854560852051, "global_step": 60394, "epoch": 1437} {"train_loss": -5.919607378187633, "global_step": 60395, "epoch": 1437, "val_loss": 61498.69921875} {"train_loss": -5.910606861114502, "global_step": 60396, "epoch": 1438} {"train_loss": -5.904505729675293, "global_step": 60397, "epoch": 1438} {"train_loss": -6.012703895568848, "global_step": 60398, "epoch": 1438} {"train_loss": -5.943011283874512, "global_step": 60399, "epoch": 1438} {"train_loss": -5.8374738693237305, "global_step": 60400, "epoch": 1438} {"train_loss": -5.978786468505859, "global_step": 60401, "epoch": 1438} {"train_loss": -5.855294227600098, "global_step": 60402, "epoch": 1438} {"train_loss": -5.893276691436768, "global_step": 60403, "epoch": 1438} {"train_loss": -5.867558002471924, "global_step": 60404, "epoch": 1438} {"train_loss": -5.787590980529785, "global_step": 60405, "epoch": 1438} {"train_loss": -5.892822265625, "global_step": 60406, "epoch": 1438} {"train_loss": -5.935872554779053, "global_step": 60407, "epoch": 1438} {"train_loss": -5.961537837982178, "global_step": 60408, "epoch": 1438} {"train_loss": -5.958396911621094, "global_step": 60409, "epoch": 1438} {"train_loss": -5.96551513671875, "global_step": 60410, "epoch": 1438} {"train_loss": -5.80885648727417, "global_step": 60411, "epoch": 1438} {"train_loss": -5.825126647949219, "global_step": 60412, "epoch": 1438} {"train_loss": -5.986080169677734, "global_step": 60413, "epoch": 1438} {"train_loss": -6.0545148849487305, "global_step": 60414, "epoch": 1438} {"train_loss": -5.950405120849609, "global_step": 60415, "epoch": 1438} {"train_loss": -5.988882064819336, "global_step": 60416, "epoch": 1438} {"train_loss": -5.994470596313477, "global_step": 60417, "epoch": 1438} {"train_loss": -5.971100330352783, "global_step": 60418, "epoch": 1438} {"train_loss": -5.911960601806641, "global_step": 60419, "epoch": 1438} {"train_loss": -5.907153129577637, "global_step": 60420, "epoch": 1438} {"train_loss": -5.889920711517334, "global_step": 60421, "epoch": 1438} {"train_loss": -5.975940227508545, "global_step": 60422, "epoch": 1438} {"train_loss": -5.909152030944824, "global_step": 60423, "epoch": 1438} {"train_loss": -5.870288372039795, "global_step": 60424, "epoch": 1438} {"train_loss": -5.931914329528809, "global_step": 60425, "epoch": 1438} {"train_loss": -5.926459789276123, "global_step": 60426, "epoch": 1438} {"train_loss": -5.976758003234863, "global_step": 60427, "epoch": 1438} {"train_loss": -5.997145175933838, "global_step": 60428, "epoch": 1438} {"train_loss": -5.966372489929199, "global_step": 60429, "epoch": 1438} {"train_loss": -5.934203624725342, "global_step": 60430, "epoch": 1438} {"train_loss": -5.799536228179932, "global_step": 60431, "epoch": 1438} {"train_loss": -5.97451114654541, "global_step": 60432, "epoch": 1438} {"train_loss": -5.905338764190674, "global_step": 60433, "epoch": 1438} {"train_loss": -5.835405349731445, "global_step": 60434, "epoch": 1438} {"train_loss": -5.872856140136719, "global_step": 60435, "epoch": 1438} {"train_loss": -5.9311442375183105, "global_step": 60436, "epoch": 1438} {"train_loss": -5.919649351210821, "global_step": 60437, "epoch": 1438, "val_loss": 61498.7421875} {"train_loss": -5.978399276733398, "global_step": 60438, "epoch": 1439} {"train_loss": -5.906090259552002, "global_step": 60439, "epoch": 1439} {"train_loss": -5.9809112548828125, "global_step": 60440, "epoch": 1439} {"train_loss": -5.9168291091918945, "global_step": 60441, "epoch": 1439} {"train_loss": -5.8154802322387695, "global_step": 60442, "epoch": 1439} {"train_loss": -5.77568244934082, "global_step": 60443, "epoch": 1439} {"train_loss": -5.942494869232178, "global_step": 60444, "epoch": 1439} {"train_loss": -5.957297325134277, "global_step": 60445, "epoch": 1439} {"train_loss": -5.794296741485596, "global_step": 60446, "epoch": 1439} {"train_loss": -5.896332740783691, "global_step": 60447, "epoch": 1439} {"train_loss": -5.943424701690674, "global_step": 60448, "epoch": 1439} {"train_loss": -5.932768821716309, "global_step": 60449, "epoch": 1439} {"train_loss": -5.916902542114258, "global_step": 60450, "epoch": 1439} {"train_loss": -5.770280838012695, "global_step": 60451, "epoch": 1439} {"train_loss": -5.893115043640137, "global_step": 60452, "epoch": 1439} {"train_loss": -6.0042266845703125, "global_step": 60453, "epoch": 1439} {"train_loss": -6.040497779846191, "global_step": 60454, "epoch": 1439} {"train_loss": -5.951847076416016, "global_step": 60455, "epoch": 1439} {"train_loss": -5.789210796356201, "global_step": 60456, "epoch": 1439} {"train_loss": -5.787524223327637, "global_step": 60457, "epoch": 1439} {"train_loss": -5.929007530212402, "global_step": 60458, "epoch": 1439} {"train_loss": -5.98797082901001, "global_step": 60459, "epoch": 1439} {"train_loss": -5.834361553192139, "global_step": 60460, "epoch": 1439} {"train_loss": -5.8990159034729, "global_step": 60461, "epoch": 1439} {"train_loss": -6.039044380187988, "global_step": 60462, "epoch": 1439} {"train_loss": -6.029497146606445, "global_step": 60463, "epoch": 1439} {"train_loss": -5.9267168045043945, "global_step": 60464, "epoch": 1439} {"train_loss": -6.039798259735107, "global_step": 60465, "epoch": 1439} {"train_loss": -5.877845764160156, "global_step": 60466, "epoch": 1439} {"train_loss": -5.927923679351807, "global_step": 60467, "epoch": 1439} {"train_loss": -6.025738716125488, "global_step": 60468, "epoch": 1439} {"train_loss": -5.855517387390137, "global_step": 60469, "epoch": 1439} {"train_loss": -5.927730560302734, "global_step": 60470, "epoch": 1439} {"train_loss": -5.910829544067383, "global_step": 60471, "epoch": 1439} {"train_loss": -5.922513484954834, "global_step": 60472, "epoch": 1439} {"train_loss": -5.9626874923706055, "global_step": 60473, "epoch": 1439} {"train_loss": -6.017692565917969, "global_step": 60474, "epoch": 1439} {"train_loss": -5.889658451080322, "global_step": 60475, "epoch": 1439} {"train_loss": -5.910734176635742, "global_step": 60476, "epoch": 1439} {"train_loss": -5.867449760437012, "global_step": 60477, "epoch": 1439} {"train_loss": -5.7630157470703125, "global_step": 60478, "epoch": 1439} {"train_loss": -5.916733367102487, "global_step": 60479, "epoch": 1439, "val_loss": 61338.1875} {"train_loss": -6.03170108795166, "global_step": 60480, "epoch": 1440} {"train_loss": -6.005917549133301, "global_step": 60481, "epoch": 1440} {"train_loss": -5.9681525230407715, "global_step": 60482, "epoch": 1440} {"train_loss": -6.023430824279785, "global_step": 60483, "epoch": 1440} {"train_loss": -5.867201805114746, "global_step": 60484, "epoch": 1440} {"train_loss": -5.951025009155273, "global_step": 60485, "epoch": 1440} {"train_loss": -5.951972484588623, "global_step": 60486, "epoch": 1440} {"train_loss": -5.777570724487305, "global_step": 60487, "epoch": 1440} {"train_loss": -5.92225456237793, "global_step": 60488, "epoch": 1440} {"train_loss": -5.941954135894775, "global_step": 60489, "epoch": 1440} {"train_loss": -5.835261344909668, "global_step": 60490, "epoch": 1440} {"train_loss": -5.93450927734375, "global_step": 60491, "epoch": 1440} {"train_loss": -5.936318874359131, "global_step": 60492, "epoch": 1440} {"train_loss": -5.846972942352295, "global_step": 60493, "epoch": 1440} {"train_loss": -5.9116058349609375, "global_step": 60494, "epoch": 1440} {"train_loss": -5.931188583374023, "global_step": 60495, "epoch": 1440} {"train_loss": -5.851225852966309, "global_step": 60496, "epoch": 1440} {"train_loss": -5.807750701904297, "global_step": 60497, "epoch": 1440} {"train_loss": -5.824159145355225, "global_step": 60498, "epoch": 1440} {"train_loss": -5.877720832824707, "global_step": 60499, "epoch": 1440} {"train_loss": -5.885894775390625, "global_step": 60500, "epoch": 1440} {"train_loss": -5.923462867736816, "global_step": 60501, "epoch": 1440} {"train_loss": -5.908123970031738, "global_step": 60502, "epoch": 1440} {"train_loss": -5.8408966064453125, "global_step": 60503, "epoch": 1440} {"train_loss": -5.94287109375, "global_step": 60504, "epoch": 1440} {"train_loss": -6.02247428894043, "global_step": 60505, "epoch": 1440} {"train_loss": -5.925144195556641, "global_step": 60506, "epoch": 1440} {"train_loss": -5.946524620056152, "global_step": 60507, "epoch": 1440} {"train_loss": -6.03167724609375, "global_step": 60508, "epoch": 1440} {"train_loss": -5.774318695068359, "global_step": 60509, "epoch": 1440} {"train_loss": -5.919018745422363, "global_step": 60510, "epoch": 1440} {"train_loss": -5.970747947692871, "global_step": 60511, "epoch": 1440} {"train_loss": -5.915223121643066, "global_step": 60512, "epoch": 1440} {"train_loss": -5.995923042297363, "global_step": 60513, "epoch": 1440} {"train_loss": -5.857112407684326, "global_step": 60514, "epoch": 1440} {"train_loss": -5.874863147735596, "global_step": 60515, "epoch": 1440} {"train_loss": -5.893882751464844, "global_step": 60516, "epoch": 1440} {"train_loss": -5.950272560119629, "global_step": 60517, "epoch": 1440} {"train_loss": -5.895524978637695, "global_step": 60518, "epoch": 1440} {"train_loss": -5.806509017944336, "global_step": 60519, "epoch": 1440} {"train_loss": -5.8877153396606445, "global_step": 60520, "epoch": 1440} {"train_loss": -5.912760291780744, "global_step": 60521, "epoch": 1440, "val_loss": 61264.9453125} {"train_loss": -5.854427814483643, "global_step": 60522, "epoch": 1441} {"train_loss": -5.993680000305176, "global_step": 60523, "epoch": 1441} {"train_loss": -5.893135070800781, "global_step": 60524, "epoch": 1441} {"train_loss": -5.925406455993652, "global_step": 60525, "epoch": 1441} {"train_loss": -5.85884952545166, "global_step": 60526, "epoch": 1441} {"train_loss": -5.788585662841797, "global_step": 60527, "epoch": 1441} {"train_loss": -6.081993103027344, "global_step": 60528, "epoch": 1441} {"train_loss": -5.890289306640625, "global_step": 60529, "epoch": 1441} {"train_loss": -5.946476936340332, "global_step": 60530, "epoch": 1441} {"train_loss": -5.939267158508301, "global_step": 60531, "epoch": 1441} {"train_loss": -5.924374103546143, "global_step": 60532, "epoch": 1441} {"train_loss": -6.048074722290039, "global_step": 60533, "epoch": 1441} {"train_loss": -5.831437110900879, "global_step": 60534, "epoch": 1441} {"train_loss": -5.879783630371094, "global_step": 60535, "epoch": 1441} {"train_loss": -5.881146430969238, "global_step": 60536, "epoch": 1441} {"train_loss": -5.885274410247803, "global_step": 60537, "epoch": 1441} {"train_loss": -5.825981140136719, "global_step": 60538, "epoch": 1441} {"train_loss": -5.8600311279296875, "global_step": 60539, "epoch": 1441} {"train_loss": -5.903808116912842, "global_step": 60540, "epoch": 1441} {"train_loss": -6.031988143920898, "global_step": 60541, "epoch": 1441} {"train_loss": -6.000601768493652, "global_step": 60542, "epoch": 1441} {"train_loss": -5.7517619132995605, "global_step": 60543, "epoch": 1441} {"train_loss": -5.87288761138916, "global_step": 60544, "epoch": 1441} {"train_loss": -5.996469497680664, "global_step": 60545, "epoch": 1441} {"train_loss": -5.948312759399414, "global_step": 60546, "epoch": 1441} {"train_loss": -5.9156999588012695, "global_step": 60547, "epoch": 1441} {"train_loss": -5.93408203125, "global_step": 60548, "epoch": 1441} {"train_loss": -5.896607398986816, "global_step": 60549, "epoch": 1441} {"train_loss": -6.019640922546387, "global_step": 60550, "epoch": 1441} {"train_loss": -5.964343070983887, "global_step": 60551, "epoch": 1441} {"train_loss": -6.051362991333008, "global_step": 60552, "epoch": 1441} {"train_loss": -6.0749592781066895, "global_step": 60553, "epoch": 1441} {"train_loss": -5.975240707397461, "global_step": 60554, "epoch": 1441} {"train_loss": -5.958652496337891, "global_step": 60555, "epoch": 1441} {"train_loss": -5.901559829711914, "global_step": 60556, "epoch": 1441} {"train_loss": -5.85468864440918, "global_step": 60557, "epoch": 1441} {"train_loss": -5.940159320831299, "global_step": 60558, "epoch": 1441} {"train_loss": -5.91574764251709, "global_step": 60559, "epoch": 1441} {"train_loss": -5.995449066162109, "global_step": 60560, "epoch": 1441} {"train_loss": -5.902583122253418, "global_step": 60561, "epoch": 1441} {"train_loss": -5.787482261657715, "global_step": 60562, "epoch": 1441} {"train_loss": -5.9253755296979636, "global_step": 60563, "epoch": 1441, "val_loss": 61212.97265625} {"train_loss": -5.962203502655029, "global_step": 60564, "epoch": 1442} {"train_loss": -5.905092239379883, "global_step": 60565, "epoch": 1442} {"train_loss": -5.98235559463501, "global_step": 60566, "epoch": 1442} {"train_loss": -5.8699631690979, "global_step": 60567, "epoch": 1442} {"train_loss": -5.9187822341918945, "global_step": 60568, "epoch": 1442} {"train_loss": -5.902362823486328, "global_step": 60569, "epoch": 1442} {"train_loss": -5.959717750549316, "global_step": 60570, "epoch": 1442} {"train_loss": -5.8612236976623535, "global_step": 60571, "epoch": 1442} {"train_loss": -6.040204048156738, "global_step": 60572, "epoch": 1442} {"train_loss": -5.998260498046875, "global_step": 60573, "epoch": 1442} {"train_loss": -5.8935627937316895, "global_step": 60574, "epoch": 1442} {"train_loss": -5.863528251647949, "global_step": 60575, "epoch": 1442} {"train_loss": -5.975573539733887, "global_step": 60576, "epoch": 1442} {"train_loss": -5.936223983764648, "global_step": 60577, "epoch": 1442} {"train_loss": -5.782952308654785, "global_step": 60578, "epoch": 1442} {"train_loss": -5.95651912689209, "global_step": 60579, "epoch": 1442} {"train_loss": -5.835713863372803, "global_step": 60580, "epoch": 1442} {"train_loss": -5.846368312835693, "global_step": 60581, "epoch": 1442} {"train_loss": -6.038627624511719, "global_step": 60582, "epoch": 1442} {"train_loss": -5.869407653808594, "global_step": 60583, "epoch": 1442} {"train_loss": -5.820183753967285, "global_step": 60584, "epoch": 1442} {"train_loss": -5.682163238525391, "global_step": 60585, "epoch": 1442} {"train_loss": -5.922698020935059, "global_step": 60586, "epoch": 1442} {"train_loss": -5.83743953704834, "global_step": 60587, "epoch": 1442} {"train_loss": -5.8216118812561035, "global_step": 60588, "epoch": 1442} {"train_loss": -6.041460037231445, "global_step": 60589, "epoch": 1442} {"train_loss": -5.768115043640137, "global_step": 60590, "epoch": 1442} {"train_loss": -5.771404266357422, "global_step": 60591, "epoch": 1442} {"train_loss": -5.869812965393066, "global_step": 60592, "epoch": 1442} {"train_loss": -5.793726444244385, "global_step": 60593, "epoch": 1442} {"train_loss": -5.8035478591918945, "global_step": 60594, "epoch": 1442} {"train_loss": -5.868213653564453, "global_step": 60595, "epoch": 1442} {"train_loss": -5.884888172149658, "global_step": 60596, "epoch": 1442} {"train_loss": -5.8690900802612305, "global_step": 60597, "epoch": 1442} {"train_loss": -5.906279563903809, "global_step": 60598, "epoch": 1442} {"train_loss": -5.85398006439209, "global_step": 60599, "epoch": 1442} {"train_loss": -5.83311128616333, "global_step": 60600, "epoch": 1442} {"train_loss": -5.8669328689575195, "global_step": 60601, "epoch": 1442} {"train_loss": -5.903625011444092, "global_step": 60602, "epoch": 1442} {"train_loss": -5.884666442871094, "global_step": 60603, "epoch": 1442} {"train_loss": -5.871800899505615, "global_step": 60604, "epoch": 1442} {"train_loss": -5.887294405982608, "global_step": 60605, "epoch": 1442, "val_loss": 61674.2109375} {"train_loss": -5.915174961090088, "global_step": 60606, "epoch": 1443} {"train_loss": -5.985655307769775, "global_step": 60607, "epoch": 1443} {"train_loss": -5.912729263305664, "global_step": 60608, "epoch": 1443} {"train_loss": -5.851543426513672, "global_step": 60609, "epoch": 1443} {"train_loss": -5.8738179206848145, "global_step": 60610, "epoch": 1443} {"train_loss": -5.824668884277344, "global_step": 60611, "epoch": 1443} {"train_loss": -6.116122245788574, "global_step": 60612, "epoch": 1443} {"train_loss": -5.964496612548828, "global_step": 60613, "epoch": 1443} {"train_loss": -5.833762168884277, "global_step": 60614, "epoch": 1443} {"train_loss": -5.807704448699951, "global_step": 60615, "epoch": 1443} {"train_loss": -5.976916313171387, "global_step": 60616, "epoch": 1443} {"train_loss": -5.808279037475586, "global_step": 60617, "epoch": 1443} {"train_loss": -5.869383335113525, "global_step": 60618, "epoch": 1443} {"train_loss": -5.951181411743164, "global_step": 60619, "epoch": 1443} {"train_loss": -5.853713035583496, "global_step": 60620, "epoch": 1443} {"train_loss": -6.059570789337158, "global_step": 60621, "epoch": 1443} {"train_loss": -6.003956317901611, "global_step": 60622, "epoch": 1443} {"train_loss": -5.955679893493652, "global_step": 60623, "epoch": 1443} {"train_loss": -5.888883590698242, "global_step": 60624, "epoch": 1443} {"train_loss": -5.907489776611328, "global_step": 60625, "epoch": 1443} {"train_loss": -5.88784122467041, "global_step": 60626, "epoch": 1443} {"train_loss": -5.848857879638672, "global_step": 60627, "epoch": 1443} {"train_loss": -5.8099045753479, "global_step": 60628, "epoch": 1443} {"train_loss": -5.875344753265381, "global_step": 60629, "epoch": 1443} {"train_loss": -5.893623352050781, "global_step": 60630, "epoch": 1443} {"train_loss": -5.924685955047607, "global_step": 60631, "epoch": 1443} {"train_loss": -5.966226577758789, "global_step": 60632, "epoch": 1443} {"train_loss": -5.89068603515625, "global_step": 60633, "epoch": 1443} {"train_loss": -6.028749942779541, "global_step": 60634, "epoch": 1443} {"train_loss": -5.974555015563965, "global_step": 60635, "epoch": 1443} {"train_loss": -5.883289813995361, "global_step": 60636, "epoch": 1443} {"train_loss": -5.956204891204834, "global_step": 60637, "epoch": 1443} {"train_loss": -5.928116798400879, "global_step": 60638, "epoch": 1443} {"train_loss": -5.968056678771973, "global_step": 60639, "epoch": 1443} {"train_loss": -5.890149116516113, "global_step": 60640, "epoch": 1443} {"train_loss": -5.9436235427856445, "global_step": 60641, "epoch": 1443} {"train_loss": -5.877315521240234, "global_step": 60642, "epoch": 1443} {"train_loss": -6.07216739654541, "global_step": 60643, "epoch": 1443} {"train_loss": -6.0009284019470215, "global_step": 60644, "epoch": 1443} {"train_loss": -5.882125377655029, "global_step": 60645, "epoch": 1443} {"train_loss": -5.924505233764648, "global_step": 60646, "epoch": 1443} {"train_loss": -5.920390776225498, "global_step": 60647, "epoch": 1443, "val_loss": 61314.0} {"train_loss": -5.961048126220703, "global_step": 60648, "epoch": 1444} {"train_loss": -5.922063827514648, "global_step": 60649, "epoch": 1444} {"train_loss": -5.891984939575195, "global_step": 60650, "epoch": 1444} {"train_loss": -5.966447353363037, "global_step": 60651, "epoch": 1444} {"train_loss": -5.887914657592773, "global_step": 60652, "epoch": 1444} {"train_loss": -5.940191268920898, "global_step": 60653, "epoch": 1444} {"train_loss": -5.911267280578613, "global_step": 60654, "epoch": 1444} {"train_loss": -5.970820426940918, "global_step": 60655, "epoch": 1444} {"train_loss": -5.858120918273926, "global_step": 60656, "epoch": 1444} {"train_loss": -5.961181163787842, "global_step": 60657, "epoch": 1444} {"train_loss": -5.843920707702637, "global_step": 60658, "epoch": 1444} {"train_loss": -5.77579402923584, "global_step": 60659, "epoch": 1444} {"train_loss": -5.905400276184082, "global_step": 60660, "epoch": 1444} {"train_loss": -5.969952583312988, "global_step": 60661, "epoch": 1444} {"train_loss": -5.778450012207031, "global_step": 60662, "epoch": 1444} {"train_loss": -5.926119804382324, "global_step": 60663, "epoch": 1444} {"train_loss": -5.985023498535156, "global_step": 60664, "epoch": 1444} {"train_loss": -5.922361850738525, "global_step": 60665, "epoch": 1444} {"train_loss": -5.9248456954956055, "global_step": 60666, "epoch": 1444} {"train_loss": -5.913451194763184, "global_step": 60667, "epoch": 1444} {"train_loss": -5.894670486450195, "global_step": 60668, "epoch": 1444} {"train_loss": -5.892731666564941, "global_step": 60669, "epoch": 1444} {"train_loss": -5.946799278259277, "global_step": 60670, "epoch": 1444} {"train_loss": -5.986992359161377, "global_step": 60671, "epoch": 1444} {"train_loss": -5.891229629516602, "global_step": 60672, "epoch": 1444} {"train_loss": -5.937680244445801, "global_step": 60673, "epoch": 1444} {"train_loss": -5.9430389404296875, "global_step": 60674, "epoch": 1444} {"train_loss": -5.917423248291016, "global_step": 60675, "epoch": 1444} {"train_loss": -5.806012153625488, "global_step": 60676, "epoch": 1444} {"train_loss": -5.876524925231934, "global_step": 60677, "epoch": 1444} {"train_loss": -5.937150001525879, "global_step": 60678, "epoch": 1444} {"train_loss": -5.760322570800781, "global_step": 60679, "epoch": 1444} {"train_loss": -5.86749792098999, "global_step": 60680, "epoch": 1444} {"train_loss": -5.944481372833252, "global_step": 60681, "epoch": 1444} {"train_loss": -5.879215240478516, "global_step": 60682, "epoch": 1444} {"train_loss": -5.853477478027344, "global_step": 60683, "epoch": 1444} {"train_loss": -5.886651992797852, "global_step": 60684, "epoch": 1444} {"train_loss": -5.913445472717285, "global_step": 60685, "epoch": 1444} {"train_loss": -6.009320259094238, "global_step": 60686, "epoch": 1444} {"train_loss": -5.885400295257568, "global_step": 60687, "epoch": 1444} {"train_loss": -5.828768730163574, "global_step": 60688, "epoch": 1444} {"train_loss": -5.907687334787278, "global_step": 60689, "epoch": 1444, "val_loss": 61364.83203125} {"train_loss": -5.923415184020996, "global_step": 60690, "epoch": 1445} {"train_loss": -5.814279556274414, "global_step": 60691, "epoch": 1445} {"train_loss": -5.993992328643799, "global_step": 60692, "epoch": 1445} {"train_loss": -5.826584815979004, "global_step": 60693, "epoch": 1445} {"train_loss": -5.973447322845459, "global_step": 60694, "epoch": 1445} {"train_loss": -5.8787336349487305, "global_step": 60695, "epoch": 1445} {"train_loss": -6.035769462585449, "global_step": 60696, "epoch": 1445} {"train_loss": -5.90779972076416, "global_step": 60697, "epoch": 1445} {"train_loss": -5.9209747314453125, "global_step": 60698, "epoch": 1445} {"train_loss": -5.86881685256958, "global_step": 60699, "epoch": 1445} {"train_loss": -5.854511737823486, "global_step": 60700, "epoch": 1445} {"train_loss": -5.932065010070801, "global_step": 60701, "epoch": 1445} {"train_loss": -5.951433181762695, "global_step": 60702, "epoch": 1445} {"train_loss": -5.862227916717529, "global_step": 60703, "epoch": 1445} {"train_loss": -5.999048233032227, "global_step": 60704, "epoch": 1445} {"train_loss": -5.83479642868042, "global_step": 60705, "epoch": 1445} {"train_loss": -6.010617256164551, "global_step": 60706, "epoch": 1445} {"train_loss": -5.875769138336182, "global_step": 60707, "epoch": 1445} {"train_loss": -5.8047990798950195, "global_step": 60708, "epoch": 1445} {"train_loss": -5.85703182220459, "global_step": 60709, "epoch": 1445} {"train_loss": -5.913403511047363, "global_step": 60710, "epoch": 1445} {"train_loss": -5.780733585357666, "global_step": 60711, "epoch": 1445} {"train_loss": -5.932483673095703, "global_step": 60712, "epoch": 1445} {"train_loss": -5.835983753204346, "global_step": 60713, "epoch": 1445} {"train_loss": -5.956705093383789, "global_step": 60714, "epoch": 1445} {"train_loss": -5.833132743835449, "global_step": 60715, "epoch": 1445} {"train_loss": -5.975716590881348, "global_step": 60716, "epoch": 1445} {"train_loss": -5.80068302154541, "global_step": 60717, "epoch": 1445} {"train_loss": -5.930960655212402, "global_step": 60718, "epoch": 1445} {"train_loss": -5.891435623168945, "global_step": 60719, "epoch": 1445} {"train_loss": -5.819663047790527, "global_step": 60720, "epoch": 1445} {"train_loss": -5.831494331359863, "global_step": 60721, "epoch": 1445} {"train_loss": -5.917599201202393, "global_step": 60722, "epoch": 1445} {"train_loss": -5.90211296081543, "global_step": 60723, "epoch": 1445} {"train_loss": -5.895745277404785, "global_step": 60724, "epoch": 1445} {"train_loss": -5.944220542907715, "global_step": 60725, "epoch": 1445} {"train_loss": -5.941404819488525, "global_step": 60726, "epoch": 1445} {"train_loss": -5.917770862579346, "global_step": 60727, "epoch": 1445} {"train_loss": -5.818018913269043, "global_step": 60728, "epoch": 1445} {"train_loss": -5.903923034667969, "global_step": 60729, "epoch": 1445} {"train_loss": -5.861271858215332, "global_step": 60730, "epoch": 1445} {"train_loss": -5.895865463075184, "global_step": 60731, "epoch": 1445, "val_loss": 61356.66015625} {"train_loss": -5.936313629150391, "global_step": 60732, "epoch": 1446} {"train_loss": -5.917957305908203, "global_step": 60733, "epoch": 1446} {"train_loss": -5.912874221801758, "global_step": 60734, "epoch": 1446} {"train_loss": -5.879636764526367, "global_step": 60735, "epoch": 1446} {"train_loss": -5.915331840515137, "global_step": 60736, "epoch": 1446} {"train_loss": -5.838803291320801, "global_step": 60737, "epoch": 1446} {"train_loss": -6.017911434173584, "global_step": 60738, "epoch": 1446} {"train_loss": -6.0527167320251465, "global_step": 60739, "epoch": 1446} {"train_loss": -5.932194709777832, "global_step": 60740, "epoch": 1446} {"train_loss": -5.914823055267334, "global_step": 60741, "epoch": 1446} {"train_loss": -5.943658828735352, "global_step": 60742, "epoch": 1446} {"train_loss": -5.983426094055176, "global_step": 60743, "epoch": 1446} {"train_loss": -5.978862285614014, "global_step": 60744, "epoch": 1446} {"train_loss": -6.063291549682617, "global_step": 60745, "epoch": 1446} {"train_loss": -5.854731559753418, "global_step": 60746, "epoch": 1446} {"train_loss": -5.8794379234313965, "global_step": 60747, "epoch": 1446} {"train_loss": -5.9414167404174805, "global_step": 60748, "epoch": 1446} {"train_loss": -5.998410224914551, "global_step": 60749, "epoch": 1446} {"train_loss": -5.861452579498291, "global_step": 60750, "epoch": 1446} {"train_loss": -5.966153144836426, "global_step": 60751, "epoch": 1446} {"train_loss": -5.853713035583496, "global_step": 60752, "epoch": 1446} {"train_loss": -5.968722343444824, "global_step": 60753, "epoch": 1446} {"train_loss": -5.935391902923584, "global_step": 60754, "epoch": 1446} {"train_loss": -5.998469352722168, "global_step": 60755, "epoch": 1446} {"train_loss": -5.917539596557617, "global_step": 60756, "epoch": 1446} {"train_loss": -5.818844795227051, "global_step": 60757, "epoch": 1446} {"train_loss": -5.913688659667969, "global_step": 60758, "epoch": 1446} {"train_loss": -5.834434509277344, "global_step": 60759, "epoch": 1446} {"train_loss": -5.836061000823975, "global_step": 60760, "epoch": 1446} {"train_loss": -5.950318813323975, "global_step": 60761, "epoch": 1446} {"train_loss": -5.886813163757324, "global_step": 60762, "epoch": 1446} {"train_loss": -6.02180290222168, "global_step": 60763, "epoch": 1446} {"train_loss": -5.970337867736816, "global_step": 60764, "epoch": 1446} {"train_loss": -5.869449615478516, "global_step": 60765, "epoch": 1446} {"train_loss": -5.981956958770752, "global_step": 60766, "epoch": 1446} {"train_loss": -5.9088897705078125, "global_step": 60767, "epoch": 1446} {"train_loss": -5.861761093139648, "global_step": 60768, "epoch": 1446} {"train_loss": -5.922828674316406, "global_step": 60769, "epoch": 1446} {"train_loss": -5.926235198974609, "global_step": 60770, "epoch": 1446} {"train_loss": -5.906398773193359, "global_step": 60771, "epoch": 1446} {"train_loss": -5.940274715423584, "global_step": 60772, "epoch": 1446} {"train_loss": -5.927138748623076, "global_step": 60773, "epoch": 1446, "val_loss": 61450.1328125} {"train_loss": -5.875638961791992, "global_step": 60774, "epoch": 1447} {"train_loss": -5.906837463378906, "global_step": 60775, "epoch": 1447} {"train_loss": -6.023427963256836, "global_step": 60776, "epoch": 1447} {"train_loss": -5.906821250915527, "global_step": 60777, "epoch": 1447} {"train_loss": -6.030300140380859, "global_step": 60778, "epoch": 1447} {"train_loss": -6.030608654022217, "global_step": 60779, "epoch": 1447} {"train_loss": -5.877671241760254, "global_step": 60780, "epoch": 1447} {"train_loss": -5.87957763671875, "global_step": 60781, "epoch": 1447} {"train_loss": -5.979903221130371, "global_step": 60782, "epoch": 1447} {"train_loss": -5.980413436889648, "global_step": 60783, "epoch": 1447} {"train_loss": -5.772671699523926, "global_step": 60784, "epoch": 1447} {"train_loss": -5.966796398162842, "global_step": 60785, "epoch": 1447} {"train_loss": -6.025358200073242, "global_step": 60786, "epoch": 1447} {"train_loss": -6.086887359619141, "global_step": 60787, "epoch": 1447} {"train_loss": -6.00297737121582, "global_step": 60788, "epoch": 1447} {"train_loss": -5.9463605880737305, "global_step": 60789, "epoch": 1447} {"train_loss": -5.916275501251221, "global_step": 60790, "epoch": 1447} {"train_loss": -5.8016767501831055, "global_step": 60791, "epoch": 1447} {"train_loss": -5.958208084106445, "global_step": 60792, "epoch": 1447} {"train_loss": -5.959294319152832, "global_step": 60793, "epoch": 1447} {"train_loss": -5.920287132263184, "global_step": 60794, "epoch": 1447} {"train_loss": -5.908773422241211, "global_step": 60795, "epoch": 1447} {"train_loss": -6.00767183303833, "global_step": 60796, "epoch": 1447} {"train_loss": -5.832472324371338, "global_step": 60797, "epoch": 1447} {"train_loss": -5.977322578430176, "global_step": 60798, "epoch": 1447} {"train_loss": -5.897877216339111, "global_step": 60799, "epoch": 1447} {"train_loss": -5.878438949584961, "global_step": 60800, "epoch": 1447} {"train_loss": -5.872370719909668, "global_step": 60801, "epoch": 1447} {"train_loss": -5.982388496398926, "global_step": 60802, "epoch": 1447} {"train_loss": -5.907334327697754, "global_step": 60803, "epoch": 1447} {"train_loss": -5.9652605056762695, "global_step": 60804, "epoch": 1447} {"train_loss": -5.815831184387207, "global_step": 60805, "epoch": 1447} {"train_loss": -5.802826881408691, "global_step": 60806, "epoch": 1447} {"train_loss": -5.756629467010498, "global_step": 60807, "epoch": 1447} {"train_loss": -5.967494010925293, "global_step": 60808, "epoch": 1447} {"train_loss": -5.825438976287842, "global_step": 60809, "epoch": 1447} {"train_loss": -5.833380699157715, "global_step": 60810, "epoch": 1447} {"train_loss": -5.9090423583984375, "global_step": 60811, "epoch": 1447} {"train_loss": -5.822466850280762, "global_step": 60812, "epoch": 1447} {"train_loss": -5.895749092102051, "global_step": 60813, "epoch": 1447} {"train_loss": -5.856559753417969, "global_step": 60814, "epoch": 1447} {"train_loss": -5.916284651983352, "global_step": 60815, "epoch": 1447, "val_loss": 61436.84375} {"train_loss": -5.874457836151123, "global_step": 60816, "epoch": 1448} {"train_loss": -5.89872932434082, "global_step": 60817, "epoch": 1448} {"train_loss": -5.9237260818481445, "global_step": 60818, "epoch": 1448} {"train_loss": -6.099940299987793, "global_step": 60819, "epoch": 1448} {"train_loss": -5.893901348114014, "global_step": 60820, "epoch": 1448} {"train_loss": -5.971866130828857, "global_step": 60821, "epoch": 1448} {"train_loss": -5.882143020629883, "global_step": 60822, "epoch": 1448} {"train_loss": -5.996726036071777, "global_step": 60823, "epoch": 1448} {"train_loss": -5.959286212921143, "global_step": 60824, "epoch": 1448} {"train_loss": -5.997288703918457, "global_step": 60825, "epoch": 1448} {"train_loss": -5.949620246887207, "global_step": 60826, "epoch": 1448} {"train_loss": -5.880078315734863, "global_step": 60827, "epoch": 1448} {"train_loss": -5.885668754577637, "global_step": 60828, "epoch": 1448} {"train_loss": -5.889618873596191, "global_step": 60829, "epoch": 1448} {"train_loss": -5.938850402832031, "global_step": 60830, "epoch": 1448} {"train_loss": -5.763681411743164, "global_step": 60831, "epoch": 1448} {"train_loss": -5.891432762145996, "global_step": 60832, "epoch": 1448} {"train_loss": -5.761906623840332, "global_step": 60833, "epoch": 1448} {"train_loss": -5.936822414398193, "global_step": 60834, "epoch": 1448} {"train_loss": -5.925773620605469, "global_step": 60835, "epoch": 1448} {"train_loss": -5.965220928192139, "global_step": 60836, "epoch": 1448} {"train_loss": -5.917428016662598, "global_step": 60837, "epoch": 1448} {"train_loss": -5.867735385894775, "global_step": 60838, "epoch": 1448} {"train_loss": -5.754725933074951, "global_step": 60839, "epoch": 1448} {"train_loss": -5.8625969886779785, "global_step": 60840, "epoch": 1448} {"train_loss": -5.770496368408203, "global_step": 60841, "epoch": 1448} {"train_loss": -5.953503608703613, "global_step": 60842, "epoch": 1448} {"train_loss": -5.810525894165039, "global_step": 60843, "epoch": 1448} {"train_loss": -5.837457180023193, "global_step": 60844, "epoch": 1448} {"train_loss": -6.036314010620117, "global_step": 60845, "epoch": 1448} {"train_loss": -5.9344611167907715, "global_step": 60846, "epoch": 1448} {"train_loss": -5.9063310623168945, "global_step": 60847, "epoch": 1448} {"train_loss": -5.964178085327148, "global_step": 60848, "epoch": 1448} {"train_loss": -5.870464324951172, "global_step": 60849, "epoch": 1448} {"train_loss": -5.898638725280762, "global_step": 60850, "epoch": 1448} {"train_loss": -5.755710601806641, "global_step": 60851, "epoch": 1448} {"train_loss": -5.902685165405273, "global_step": 60852, "epoch": 1448} {"train_loss": -5.978610038757324, "global_step": 60853, "epoch": 1448} {"train_loss": -6.013769626617432, "global_step": 60854, "epoch": 1448} {"train_loss": -6.0154876708984375, "global_step": 60855, "epoch": 1448} {"train_loss": -5.861093521118164, "global_step": 60856, "epoch": 1448} {"train_loss": -5.909875313440959, "global_step": 60857, "epoch": 1448, "val_loss": 61577.1953125} {"train_loss": -6.008120059967041, "global_step": 60858, "epoch": 1449} {"train_loss": -5.881608009338379, "global_step": 60859, "epoch": 1449} {"train_loss": -5.876705646514893, "global_step": 60860, "epoch": 1449} {"train_loss": -5.942981719970703, "global_step": 60861, "epoch": 1449} {"train_loss": -5.840877532958984, "global_step": 60862, "epoch": 1449} {"train_loss": -5.9724440574646, "global_step": 60863, "epoch": 1449} {"train_loss": -5.917102813720703, "global_step": 60864, "epoch": 1449} {"train_loss": -5.786249160766602, "global_step": 60865, "epoch": 1449} {"train_loss": -5.989393711090088, "global_step": 60866, "epoch": 1449} {"train_loss": -5.902619361877441, "global_step": 60867, "epoch": 1449} {"train_loss": -5.708136558532715, "global_step": 60868, "epoch": 1449} {"train_loss": -5.827980995178223, "global_step": 60869, "epoch": 1449} {"train_loss": -5.840306282043457, "global_step": 60870, "epoch": 1449} {"train_loss": -5.948690414428711, "global_step": 60871, "epoch": 1449} {"train_loss": -5.864664077758789, "global_step": 60872, "epoch": 1449} {"train_loss": -5.887734413146973, "global_step": 60873, "epoch": 1449} {"train_loss": -6.004904747009277, "global_step": 60874, "epoch": 1449} {"train_loss": -5.877168655395508, "global_step": 60875, "epoch": 1449} {"train_loss": -5.842777729034424, "global_step": 60876, "epoch": 1449} {"train_loss": -5.853187084197998, "global_step": 60877, "epoch": 1449} {"train_loss": -5.863162517547607, "global_step": 60878, "epoch": 1449} {"train_loss": -5.900362968444824, "global_step": 60879, "epoch": 1449} {"train_loss": -5.922096252441406, "global_step": 60880, "epoch": 1449} {"train_loss": -5.936099529266357, "global_step": 60881, "epoch": 1449} {"train_loss": -5.889502048492432, "global_step": 60882, "epoch": 1449} {"train_loss": -5.884305000305176, "global_step": 60883, "epoch": 1449} {"train_loss": -5.847311973571777, "global_step": 60884, "epoch": 1449} {"train_loss": -5.777926445007324, "global_step": 60885, "epoch": 1449} {"train_loss": -5.980807781219482, "global_step": 60886, "epoch": 1449} {"train_loss": -5.896893501281738, "global_step": 60887, "epoch": 1449} {"train_loss": -5.802163124084473, "global_step": 60888, "epoch": 1449} {"train_loss": -5.995969772338867, "global_step": 60889, "epoch": 1449} {"train_loss": -5.869585037231445, "global_step": 60890, "epoch": 1449} {"train_loss": -5.8078179359436035, "global_step": 60891, "epoch": 1449} {"train_loss": -5.9071502685546875, "global_step": 60892, "epoch": 1449} {"train_loss": -5.783946990966797, "global_step": 60893, "epoch": 1449} {"train_loss": -5.869345664978027, "global_step": 60894, "epoch": 1449} {"train_loss": -5.710239410400391, "global_step": 60895, "epoch": 1449} {"train_loss": -5.852567672729492, "global_step": 60896, "epoch": 1449} {"train_loss": -5.808078765869141, "global_step": 60897, "epoch": 1449} {"train_loss": -5.853985786437988, "global_step": 60898, "epoch": 1449} {"train_loss": -5.8746657485053655, "global_step": 60899, "epoch": 1449, "val_loss": 61722.9375} {"train_loss": -5.809728622436523, "global_step": 60900, "epoch": 1450} {"train_loss": -5.895193099975586, "global_step": 60901, "epoch": 1450} {"train_loss": -5.781469345092773, "global_step": 60902, "epoch": 1450} {"train_loss": -5.950530052185059, "global_step": 60903, "epoch": 1450} {"train_loss": -5.7763824462890625, "global_step": 60904, "epoch": 1450} {"train_loss": -5.754183769226074, "global_step": 60905, "epoch": 1450} {"train_loss": -5.865908622741699, "global_step": 60906, "epoch": 1450} {"train_loss": -5.696837902069092, "global_step": 60907, "epoch": 1450} {"train_loss": -5.996042251586914, "global_step": 60908, "epoch": 1450} {"train_loss": -5.765401840209961, "global_step": 60909, "epoch": 1450} {"train_loss": -5.864592552185059, "global_step": 60910, "epoch": 1450} {"train_loss": -5.797866344451904, "global_step": 60911, "epoch": 1450} {"train_loss": -5.9677534103393555, "global_step": 60912, "epoch": 1450} {"train_loss": -5.757367134094238, "global_step": 60913, "epoch": 1450} {"train_loss": -5.85715389251709, "global_step": 60914, "epoch": 1450} {"train_loss": -5.894532203674316, "global_step": 60915, "epoch": 1450} {"train_loss": -5.9781904220581055, "global_step": 60916, "epoch": 1450} {"train_loss": -5.852207183837891, "global_step": 60917, "epoch": 1450} {"train_loss": -5.963565826416016, "global_step": 60918, "epoch": 1450} {"train_loss": -5.805441856384277, "global_step": 60919, "epoch": 1450} {"train_loss": -5.873561859130859, "global_step": 60920, "epoch": 1450} {"train_loss": -5.914703845977783, "global_step": 60921, "epoch": 1450} {"train_loss": -5.90536642074585, "global_step": 60922, "epoch": 1450} {"train_loss": -5.899404525756836, "global_step": 60923, "epoch": 1450} {"train_loss": -5.915109157562256, "global_step": 60924, "epoch": 1450} {"train_loss": -5.958303928375244, "global_step": 60925, "epoch": 1450} {"train_loss": -5.917669296264648, "global_step": 60926, "epoch": 1450} {"train_loss": -6.029171943664551, "global_step": 60927, "epoch": 1450} {"train_loss": -5.916902542114258, "global_step": 60928, "epoch": 1450} {"train_loss": -5.989438056945801, "global_step": 60929, "epoch": 1450} {"train_loss": -5.836399078369141, "global_step": 60930, "epoch": 1450} {"train_loss": -5.962047576904297, "global_step": 60931, "epoch": 1450} {"train_loss": -5.894319534301758, "global_step": 60932, "epoch": 1450} {"train_loss": -6.062004089355469, "global_step": 60933, "epoch": 1450} {"train_loss": -5.920607566833496, "global_step": 60934, "epoch": 1450} {"train_loss": -5.886846542358398, "global_step": 60935, "epoch": 1450} {"train_loss": -5.937239646911621, "global_step": 60936, "epoch": 1450} {"train_loss": -5.847618103027344, "global_step": 60937, "epoch": 1450} {"train_loss": -5.867088317871094, "global_step": 60938, "epoch": 1450} {"train_loss": -5.889747142791748, "global_step": 60939, "epoch": 1450} {"train_loss": -5.871859550476074, "global_step": 60940, "epoch": 1450} {"train_loss": -5.882832084383283, "global_step": 60941, "epoch": 1450, "train/sim_max_reward_0": 0.49675246109166027, "train/sim_max_reward_1": 0.22770006609450605, "train/sim_max_reward_2": 0.7111352856687005, "train/sim_max_reward_3": 0.7975790880488349, "train/sim_max_reward_4": 0.9042538718251458, "train/sim_max_reward_5": 0.528130744926713, "test/sim_max_reward_4300000": 0.1754702741552541, "test/sim_max_reward_4300001": 0.1425531122876279, "test/sim_max_reward_4300002": 0.9497835490339481, "test/sim_max_reward_4300003": 0.5587658288064615, "test/sim_max_reward_4300004": 0.13300266711210623, "test/sim_max_reward_4300005": 0.41894525683256395, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.29351241285610896, "test/sim_max_reward_4300008": 0.7999340391714457, "test/sim_max_reward_4300009": 0.688425242996978, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.3149772114036844, "test/sim_max_reward_4300012": 0.8226197773844881, "test/sim_max_reward_4300013": 0.41669621112976934, "test/sim_max_reward_4300014": 0.8658586388933247, "test/sim_max_reward_4300015": 0.6032231210445252, "test/sim_max_reward_4300016": 0.9232528146633445, "test/sim_max_reward_4300017": 0.86056878260232, "test/sim_max_reward_4300018": 0.9449530983115555, "test/sim_max_reward_4300019": 0.18569329626700637, "test/sim_max_reward_4300020": 0.5905686861576485, "test/sim_max_reward_4300021": 1.0, "test/sim_max_reward_4300022": 0.9546672083218418, "test/sim_max_reward_4300023": 0.3349970460153556, "test/sim_max_reward_4300024": 0.7763725656383631, "test/sim_max_reward_4300025": 0.7522657285340844, "test/sim_max_reward_4300026": 0.5913005207172116, "test/sim_max_reward_4300027": 0.9536224405620539, "test/sim_max_reward_4300028": 0.9603730353282496, "test/sim_max_reward_4300029": 0.0031962100542726273, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.8763612817695384, "test/sim_max_reward_4300032": 0.7132823514379998, "test/sim_max_reward_4300033": 0.5188725127747612, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.7574349904055361, "test/sim_max_reward_4300036": 0.28736929957585783, "test/sim_max_reward_4300037": 0.7246474523490506, "test/sim_max_reward_4300038": 0.8217434798804403, "test/sim_max_reward_4300039": 0.9471465441040556, "test/sim_max_reward_4300040": 0.662932336850726, "test/sim_max_reward_4300041": 0.9600118693583909, "test/sim_max_reward_4300042": 0.6668761361167075, "test/sim_max_reward_4300043": 0.1567996897717082, "test/sim_max_reward_4300044": 0.808733769072553, "test/sim_max_reward_4300045": 0.4664845587570158, "test/sim_max_reward_4300046": 0.9092782949041043, "test/sim_max_reward_4300047": 0.15258971143049524, "test/sim_max_reward_4300048": 0.9769339203693461, "test/sim_max_reward_4300049": 0.5425662762138671, "train/mean_score": 0.6109252529425935, "test/mean_score": 0.579313265028475, "val_loss": 61318.12109375} {"train_loss": -5.919951438903809, "global_step": 60942, "epoch": 1451} {"train_loss": -6.0843353271484375, "global_step": 60943, "epoch": 1451} {"train_loss": -5.863924980163574, "global_step": 60944, "epoch": 1451} {"train_loss": -5.9213714599609375, "global_step": 60945, "epoch": 1451} {"train_loss": -5.961846351623535, "global_step": 60946, "epoch": 1451} {"train_loss": -5.700174808502197, "global_step": 60947, "epoch": 1451} {"train_loss": -5.922767639160156, "global_step": 60948, "epoch": 1451} {"train_loss": -5.9795684814453125, "global_step": 60949, "epoch": 1451} {"train_loss": -5.986392021179199, "global_step": 60950, "epoch": 1451} {"train_loss": -5.991976737976074, "global_step": 60951, "epoch": 1451} {"train_loss": -5.951101779937744, "global_step": 60952, "epoch": 1451} {"train_loss": -6.0771894454956055, "global_step": 60953, "epoch": 1451} {"train_loss": -5.908160209655762, "global_step": 60954, "epoch": 1451} {"train_loss": -5.898514747619629, "global_step": 60955, "epoch": 1451} {"train_loss": -6.01414155960083, "global_step": 60956, "epoch": 1451} {"train_loss": -5.932504177093506, "global_step": 60957, "epoch": 1451} {"train_loss": -5.886305809020996, "global_step": 60958, "epoch": 1451} {"train_loss": -5.921798229217529, "global_step": 60959, "epoch": 1451} {"train_loss": -5.898991107940674, "global_step": 60960, "epoch": 1451} {"train_loss": -5.852692604064941, "global_step": 60961, "epoch": 1451} {"train_loss": -5.797786712646484, "global_step": 60962, "epoch": 1451} {"train_loss": -5.797679901123047, "global_step": 60963, "epoch": 1451} {"train_loss": -5.944854259490967, "global_step": 60964, "epoch": 1451} {"train_loss": -5.875070571899414, "global_step": 60965, "epoch": 1451} {"train_loss": -5.844827651977539, "global_step": 60966, "epoch": 1451} {"train_loss": -5.821242332458496, "global_step": 60967, "epoch": 1451} {"train_loss": -5.823993682861328, "global_step": 60968, "epoch": 1451} {"train_loss": -5.914887428283691, "global_step": 60969, "epoch": 1451} {"train_loss": -5.92535400390625, "global_step": 60970, "epoch": 1451} {"train_loss": -5.760920524597168, "global_step": 60971, "epoch": 1451} {"train_loss": -5.812283992767334, "global_step": 60972, "epoch": 1451} {"train_loss": -5.941352844238281, "global_step": 60973, "epoch": 1451} {"train_loss": -6.042417526245117, "global_step": 60974, "epoch": 1451} {"train_loss": -5.7298994064331055, "global_step": 60975, "epoch": 1451} {"train_loss": -5.854106903076172, "global_step": 60976, "epoch": 1451} {"train_loss": -5.81015682220459, "global_step": 60977, "epoch": 1451} {"train_loss": -5.789921760559082, "global_step": 60978, "epoch": 1451} {"train_loss": -5.833831787109375, "global_step": 60979, "epoch": 1451} {"train_loss": -5.825852394104004, "global_step": 60980, "epoch": 1451} {"train_loss": -5.897629737854004, "global_step": 60981, "epoch": 1451} {"train_loss": -5.893533229827881, "global_step": 60982, "epoch": 1451} {"train_loss": -5.892447641917637, "global_step": 60983, "epoch": 1451, "val_loss": 61649.359375} {"train_loss": -5.717158317565918, "global_step": 60984, "epoch": 1452} {"train_loss": -5.852468013763428, "global_step": 60985, "epoch": 1452} {"train_loss": -5.844491004943848, "global_step": 60986, "epoch": 1452} {"train_loss": -5.86328125, "global_step": 60987, "epoch": 1452} {"train_loss": -5.973474502563477, "global_step": 60988, "epoch": 1452} {"train_loss": -5.809315204620361, "global_step": 60989, "epoch": 1452} {"train_loss": -5.8743438720703125, "global_step": 60990, "epoch": 1452} {"train_loss": -5.814643859863281, "global_step": 60991, "epoch": 1452} {"train_loss": -5.837325096130371, "global_step": 60992, "epoch": 1452} {"train_loss": -5.841179847717285, "global_step": 60993, "epoch": 1452} {"train_loss": -5.828802108764648, "global_step": 60994, "epoch": 1452} {"train_loss": -5.8724470138549805, "global_step": 60995, "epoch": 1452} {"train_loss": -5.8586626052856445, "global_step": 60996, "epoch": 1452} {"train_loss": -5.972914695739746, "global_step": 60997, "epoch": 1452} {"train_loss": -5.868882179260254, "global_step": 60998, "epoch": 1452} {"train_loss": -5.775996208190918, "global_step": 60999, "epoch": 1452} {"train_loss": -5.874037742614746, "global_step": 61000, "epoch": 1452} {"train_loss": -5.920351028442383, "global_step": 61001, "epoch": 1452} {"train_loss": -5.849620342254639, "global_step": 61002, "epoch": 1452} {"train_loss": -5.892382621765137, "global_step": 61003, "epoch": 1452} {"train_loss": -5.926982879638672, "global_step": 61004, "epoch": 1452} {"train_loss": -5.727365016937256, "global_step": 61005, "epoch": 1452} {"train_loss": -5.949475288391113, "global_step": 61006, "epoch": 1452} {"train_loss": -5.848145961761475, "global_step": 61007, "epoch": 1452} {"train_loss": -5.966981887817383, "global_step": 61008, "epoch": 1452} {"train_loss": -5.988829612731934, "global_step": 61009, "epoch": 1452} {"train_loss": -6.000646591186523, "global_step": 61010, "epoch": 1452} {"train_loss": -5.952493667602539, "global_step": 61011, "epoch": 1452} {"train_loss": -5.925805568695068, "global_step": 61012, "epoch": 1452} {"train_loss": -5.847239971160889, "global_step": 61013, "epoch": 1452} {"train_loss": -5.921699523925781, "global_step": 61014, "epoch": 1452} {"train_loss": -5.83734130859375, "global_step": 61015, "epoch": 1452} {"train_loss": -5.957449913024902, "global_step": 61016, "epoch": 1452} {"train_loss": -5.804845333099365, "global_step": 61017, "epoch": 1452} {"train_loss": -5.941509246826172, "global_step": 61018, "epoch": 1452} {"train_loss": -5.867892742156982, "global_step": 61019, "epoch": 1452} {"train_loss": -5.878127574920654, "global_step": 61020, "epoch": 1452} {"train_loss": -5.974062919616699, "global_step": 61021, "epoch": 1452} {"train_loss": -5.8323493003845215, "global_step": 61022, "epoch": 1452} {"train_loss": -6.015551567077637, "global_step": 61023, "epoch": 1452} {"train_loss": -5.938726425170898, "global_step": 61024, "epoch": 1452} {"train_loss": -5.884846641903832, "global_step": 61025, "epoch": 1452, "val_loss": 61415.08984375} {"train_loss": -5.925431251525879, "global_step": 61026, "epoch": 1453} {"train_loss": -5.891970634460449, "global_step": 61027, "epoch": 1453} {"train_loss": -5.9771881103515625, "global_step": 61028, "epoch": 1453} {"train_loss": -5.656276226043701, "global_step": 61029, "epoch": 1453} {"train_loss": -6.037505626678467, "global_step": 61030, "epoch": 1453} {"train_loss": -5.905290603637695, "global_step": 61031, "epoch": 1453} {"train_loss": -5.914748191833496, "global_step": 61032, "epoch": 1453} {"train_loss": -6.0741472244262695, "global_step": 61033, "epoch": 1453} {"train_loss": -5.98665714263916, "global_step": 61034, "epoch": 1453} {"train_loss": -5.788061141967773, "global_step": 61035, "epoch": 1453} {"train_loss": -5.8983306884765625, "global_step": 61036, "epoch": 1453} {"train_loss": -5.92418909072876, "global_step": 61037, "epoch": 1453} {"train_loss": -5.855652332305908, "global_step": 61038, "epoch": 1453} {"train_loss": -5.864715099334717, "global_step": 61039, "epoch": 1453} {"train_loss": -5.82979679107666, "global_step": 61040, "epoch": 1453} {"train_loss": -5.85438346862793, "global_step": 61041, "epoch": 1453} {"train_loss": -5.85855770111084, "global_step": 61042, "epoch": 1453} {"train_loss": -5.928771018981934, "global_step": 61043, "epoch": 1453} {"train_loss": -5.896725177764893, "global_step": 61044, "epoch": 1453} {"train_loss": -5.8635382652282715, "global_step": 61045, "epoch": 1453} {"train_loss": -5.834135055541992, "global_step": 61046, "epoch": 1453} {"train_loss": -5.90858793258667, "global_step": 61047, "epoch": 1453} {"train_loss": -5.830389022827148, "global_step": 61048, "epoch": 1453} {"train_loss": -5.81418514251709, "global_step": 61049, "epoch": 1453} {"train_loss": -5.835779666900635, "global_step": 61050, "epoch": 1453} {"train_loss": -5.805611610412598, "global_step": 61051, "epoch": 1453} {"train_loss": -5.90423583984375, "global_step": 61052, "epoch": 1453} {"train_loss": -5.917178630828857, "global_step": 61053, "epoch": 1453} {"train_loss": -5.785530090332031, "global_step": 61054, "epoch": 1453} {"train_loss": -5.773334980010986, "global_step": 61055, "epoch": 1453} {"train_loss": -5.881155014038086, "global_step": 61056, "epoch": 1453} {"train_loss": -5.883058547973633, "global_step": 61057, "epoch": 1453} {"train_loss": -5.874001502990723, "global_step": 61058, "epoch": 1453} {"train_loss": -5.815411567687988, "global_step": 61059, "epoch": 1453} {"train_loss": -5.882542610168457, "global_step": 61060, "epoch": 1453} {"train_loss": -5.9253411293029785, "global_step": 61061, "epoch": 1453} {"train_loss": -5.870715618133545, "global_step": 61062, "epoch": 1453} {"train_loss": -5.855574131011963, "global_step": 61063, "epoch": 1453} {"train_loss": -5.774787902832031, "global_step": 61064, "epoch": 1453} {"train_loss": -5.964761734008789, "global_step": 61065, "epoch": 1453} {"train_loss": -5.836406707763672, "global_step": 61066, "epoch": 1453} {"train_loss": -5.877566382998512, "global_step": 61067, "epoch": 1453, "val_loss": 61155.3828125} {"train_loss": -5.824459552764893, "global_step": 61068, "epoch": 1454} {"train_loss": -5.791847229003906, "global_step": 61069, "epoch": 1454} {"train_loss": -5.830148696899414, "global_step": 61070, "epoch": 1454} {"train_loss": -5.736651420593262, "global_step": 61071, "epoch": 1454} {"train_loss": -5.940339088439941, "global_step": 61072, "epoch": 1454} {"train_loss": -5.780644416809082, "global_step": 61073, "epoch": 1454} {"train_loss": -5.730094909667969, "global_step": 61074, "epoch": 1454} {"train_loss": -5.741684913635254, "global_step": 61075, "epoch": 1454} {"train_loss": -5.795984268188477, "global_step": 61076, "epoch": 1454} {"train_loss": -5.882769584655762, "global_step": 61077, "epoch": 1454} {"train_loss": -5.928852558135986, "global_step": 61078, "epoch": 1454} {"train_loss": -5.831625461578369, "global_step": 61079, "epoch": 1454} {"train_loss": -5.854137420654297, "global_step": 61080, "epoch": 1454} {"train_loss": -5.929479598999023, "global_step": 61081, "epoch": 1454} {"train_loss": -5.824860572814941, "global_step": 61082, "epoch": 1454} {"train_loss": -5.982134819030762, "global_step": 61083, "epoch": 1454} {"train_loss": -5.821944713592529, "global_step": 61084, "epoch": 1454} {"train_loss": -5.822824478149414, "global_step": 61085, "epoch": 1454} {"train_loss": -5.781830787658691, "global_step": 61086, "epoch": 1454} {"train_loss": -5.956873893737793, "global_step": 61087, "epoch": 1454} {"train_loss": -5.83367919921875, "global_step": 61088, "epoch": 1454} {"train_loss": -5.988753318786621, "global_step": 61089, "epoch": 1454} {"train_loss": -5.876635551452637, "global_step": 61090, "epoch": 1454} {"train_loss": -5.95479679107666, "global_step": 61091, "epoch": 1454} {"train_loss": -5.949802398681641, "global_step": 61092, "epoch": 1454} {"train_loss": -5.934443950653076, "global_step": 61093, "epoch": 1454} {"train_loss": -6.018749713897705, "global_step": 61094, "epoch": 1454} {"train_loss": -5.8464202880859375, "global_step": 61095, "epoch": 1454} {"train_loss": -5.947699546813965, "global_step": 61096, "epoch": 1454} {"train_loss": -5.813108444213867, "global_step": 61097, "epoch": 1454} {"train_loss": -5.987675666809082, "global_step": 61098, "epoch": 1454} {"train_loss": -5.983511924743652, "global_step": 61099, "epoch": 1454} {"train_loss": -5.877211570739746, "global_step": 61100, "epoch": 1454} {"train_loss": -6.034761428833008, "global_step": 61101, "epoch": 1454} {"train_loss": -5.962926864624023, "global_step": 61102, "epoch": 1454} {"train_loss": -5.944479942321777, "global_step": 61103, "epoch": 1454} {"train_loss": -5.969448566436768, "global_step": 61104, "epoch": 1454} {"train_loss": -5.945725440979004, "global_step": 61105, "epoch": 1454} {"train_loss": -5.977595806121826, "global_step": 61106, "epoch": 1454} {"train_loss": -6.109965801239014, "global_step": 61107, "epoch": 1454} {"train_loss": -5.845222473144531, "global_step": 61108, "epoch": 1454} {"train_loss": -5.892577194032215, "global_step": 61109, "epoch": 1454, "val_loss": 61137.90234375} {"train_loss": -5.969784259796143, "global_step": 61110, "epoch": 1455} {"train_loss": -6.047750473022461, "global_step": 61111, "epoch": 1455} {"train_loss": -5.839937686920166, "global_step": 61112, "epoch": 1455} {"train_loss": -5.934171199798584, "global_step": 61113, "epoch": 1455} {"train_loss": -5.92159366607666, "global_step": 61114, "epoch": 1455} {"train_loss": -5.928790092468262, "global_step": 61115, "epoch": 1455} {"train_loss": -6.0167341232299805, "global_step": 61116, "epoch": 1455} {"train_loss": -5.953272819519043, "global_step": 61117, "epoch": 1455} {"train_loss": -6.029532432556152, "global_step": 61118, "epoch": 1455} {"train_loss": -5.993192195892334, "global_step": 61119, "epoch": 1455} {"train_loss": -5.98129415512085, "global_step": 61120, "epoch": 1455} {"train_loss": -5.9331207275390625, "global_step": 61121, "epoch": 1455} {"train_loss": -5.855221748352051, "global_step": 61122, "epoch": 1455} {"train_loss": -5.710411548614502, "global_step": 61123, "epoch": 1455} {"train_loss": -5.945784091949463, "global_step": 61124, "epoch": 1455} {"train_loss": -5.968567371368408, "global_step": 61125, "epoch": 1455} {"train_loss": -5.856292724609375, "global_step": 61126, "epoch": 1455} {"train_loss": -5.9872846603393555, "global_step": 61127, "epoch": 1455} {"train_loss": -5.960666656494141, "global_step": 61128, "epoch": 1455} {"train_loss": -5.858809947967529, "global_step": 61129, "epoch": 1455} {"train_loss": -5.877921104431152, "global_step": 61130, "epoch": 1455} {"train_loss": -6.015976905822754, "global_step": 61131, "epoch": 1455} {"train_loss": -5.988034248352051, "global_step": 61132, "epoch": 1455} {"train_loss": -5.890766620635986, "global_step": 61133, "epoch": 1455} {"train_loss": -5.91168212890625, "global_step": 61134, "epoch": 1455} {"train_loss": -5.804454803466797, "global_step": 61135, "epoch": 1455} {"train_loss": -6.03669548034668, "global_step": 61136, "epoch": 1455} {"train_loss": -5.890827178955078, "global_step": 61137, "epoch": 1455} {"train_loss": -5.823725700378418, "global_step": 61138, "epoch": 1455} {"train_loss": -5.820481300354004, "global_step": 61139, "epoch": 1455} {"train_loss": -5.957251071929932, "global_step": 61140, "epoch": 1455} {"train_loss": -5.8873748779296875, "global_step": 61141, "epoch": 1455} {"train_loss": -5.950163841247559, "global_step": 61142, "epoch": 1455} {"train_loss": -5.913752555847168, "global_step": 61143, "epoch": 1455} {"train_loss": -6.063063621520996, "global_step": 61144, "epoch": 1455} {"train_loss": -5.8787078857421875, "global_step": 61145, "epoch": 1455} {"train_loss": -5.773995876312256, "global_step": 61146, "epoch": 1455} {"train_loss": -5.958621501922607, "global_step": 61147, "epoch": 1455} {"train_loss": -5.9833574295043945, "global_step": 61148, "epoch": 1455} {"train_loss": -5.9781975746154785, "global_step": 61149, "epoch": 1455} {"train_loss": -5.988077163696289, "global_step": 61150, "epoch": 1455} {"train_loss": -5.927994977860224, "global_step": 61151, "epoch": 1455, "val_loss": 61498.5078125} {"train_loss": -5.967901229858398, "global_step": 61152, "epoch": 1456} {"train_loss": -5.85002326965332, "global_step": 61153, "epoch": 1456} {"train_loss": -5.919140815734863, "global_step": 61154, "epoch": 1456} {"train_loss": -5.922292709350586, "global_step": 61155, "epoch": 1456} {"train_loss": -5.866304397583008, "global_step": 61156, "epoch": 1456} {"train_loss": -6.076445579528809, "global_step": 61157, "epoch": 1456} {"train_loss": -5.816634178161621, "global_step": 61158, "epoch": 1456} {"train_loss": -5.988315582275391, "global_step": 61159, "epoch": 1456} {"train_loss": -6.05835485458374, "global_step": 61160, "epoch": 1456} {"train_loss": -5.9417524337768555, "global_step": 61161, "epoch": 1456} {"train_loss": -5.910724639892578, "global_step": 61162, "epoch": 1456} {"train_loss": -5.953401565551758, "global_step": 61163, "epoch": 1456} {"train_loss": -6.03564977645874, "global_step": 61164, "epoch": 1456} {"train_loss": -5.96218204498291, "global_step": 61165, "epoch": 1456} {"train_loss": -5.986407279968262, "global_step": 61166, "epoch": 1456} {"train_loss": -6.084880352020264, "global_step": 61167, "epoch": 1456} {"train_loss": -5.955874443054199, "global_step": 61168, "epoch": 1456} {"train_loss": -5.868111610412598, "global_step": 61169, "epoch": 1456} {"train_loss": -5.932703018188477, "global_step": 61170, "epoch": 1456} {"train_loss": -5.932286262512207, "global_step": 61171, "epoch": 1456} {"train_loss": -5.961427688598633, "global_step": 61172, "epoch": 1456} {"train_loss": -5.942773818969727, "global_step": 61173, "epoch": 1456} {"train_loss": -5.9264936447143555, "global_step": 61174, "epoch": 1456} {"train_loss": -5.884326457977295, "global_step": 61175, "epoch": 1456} {"train_loss": -5.938139915466309, "global_step": 61176, "epoch": 1456} {"train_loss": -5.916116714477539, "global_step": 61177, "epoch": 1456} {"train_loss": -5.9995317459106445, "global_step": 61178, "epoch": 1456} {"train_loss": -5.908614635467529, "global_step": 61179, "epoch": 1456} {"train_loss": -5.988781929016113, "global_step": 61180, "epoch": 1456} {"train_loss": -5.83937931060791, "global_step": 61181, "epoch": 1456} {"train_loss": -5.869545936584473, "global_step": 61182, "epoch": 1456} {"train_loss": -5.948173522949219, "global_step": 61183, "epoch": 1456} {"train_loss": -5.934864044189453, "global_step": 61184, "epoch": 1456} {"train_loss": -5.870302200317383, "global_step": 61185, "epoch": 1456} {"train_loss": -5.902547836303711, "global_step": 61186, "epoch": 1456} {"train_loss": -5.804292678833008, "global_step": 61187, "epoch": 1456} {"train_loss": -5.887941360473633, "global_step": 61188, "epoch": 1456} {"train_loss": -5.870795249938965, "global_step": 61189, "epoch": 1456} {"train_loss": -5.948251724243164, "global_step": 61190, "epoch": 1456} {"train_loss": -5.990222454071045, "global_step": 61191, "epoch": 1456} {"train_loss": -5.867653846740723, "global_step": 61192, "epoch": 1456} {"train_loss": -5.931608710970197, "global_step": 61193, "epoch": 1456, "val_loss": 61264.48046875} {"train_loss": -5.933599472045898, "global_step": 61194, "epoch": 1457} {"train_loss": -5.928297519683838, "global_step": 61195, "epoch": 1457} {"train_loss": -5.865809440612793, "global_step": 61196, "epoch": 1457} {"train_loss": -6.045149326324463, "global_step": 61197, "epoch": 1457} {"train_loss": -5.932562351226807, "global_step": 61198, "epoch": 1457} {"train_loss": -5.913180351257324, "global_step": 61199, "epoch": 1457} {"train_loss": -6.026026725769043, "global_step": 61200, "epoch": 1457} {"train_loss": -5.833437442779541, "global_step": 61201, "epoch": 1457} {"train_loss": -5.962292671203613, "global_step": 61202, "epoch": 1457} {"train_loss": -6.044283390045166, "global_step": 61203, "epoch": 1457} {"train_loss": -5.921090126037598, "global_step": 61204, "epoch": 1457} {"train_loss": -5.924224853515625, "global_step": 61205, "epoch": 1457} {"train_loss": -5.922708988189697, "global_step": 61206, "epoch": 1457} {"train_loss": -5.838712692260742, "global_step": 61207, "epoch": 1457} {"train_loss": -5.870465278625488, "global_step": 61208, "epoch": 1457} {"train_loss": -5.844139099121094, "global_step": 61209, "epoch": 1457} {"train_loss": -5.861175537109375, "global_step": 61210, "epoch": 1457} {"train_loss": -6.048406600952148, "global_step": 61211, "epoch": 1457} {"train_loss": -5.896650314331055, "global_step": 61212, "epoch": 1457} {"train_loss": -5.859241962432861, "global_step": 61213, "epoch": 1457} {"train_loss": -5.828909873962402, "global_step": 61214, "epoch": 1457} {"train_loss": -5.947541236877441, "global_step": 61215, "epoch": 1457} {"train_loss": -5.854121208190918, "global_step": 61216, "epoch": 1457} {"train_loss": -5.810039043426514, "global_step": 61217, "epoch": 1457} {"train_loss": -6.023238658905029, "global_step": 61218, "epoch": 1457} {"train_loss": -5.969967842102051, "global_step": 61219, "epoch": 1457} {"train_loss": -5.895774841308594, "global_step": 61220, "epoch": 1457} {"train_loss": -5.896688461303711, "global_step": 61221, "epoch": 1457} {"train_loss": -5.938036918640137, "global_step": 61222, "epoch": 1457} {"train_loss": -5.898382186889648, "global_step": 61223, "epoch": 1457} {"train_loss": -5.815507888793945, "global_step": 61224, "epoch": 1457} {"train_loss": -6.030806541442871, "global_step": 61225, "epoch": 1457} {"train_loss": -5.971867561340332, "global_step": 61226, "epoch": 1457} {"train_loss": -5.920479774475098, "global_step": 61227, "epoch": 1457} {"train_loss": -5.851504802703857, "global_step": 61228, "epoch": 1457} {"train_loss": -5.9467339515686035, "global_step": 61229, "epoch": 1457} {"train_loss": -5.918140888214111, "global_step": 61230, "epoch": 1457} {"train_loss": -5.911842346191406, "global_step": 61231, "epoch": 1457} {"train_loss": -5.9463300704956055, "global_step": 61232, "epoch": 1457} {"train_loss": -5.852391242980957, "global_step": 61233, "epoch": 1457} {"train_loss": -6.022704124450684, "global_step": 61234, "epoch": 1457} {"train_loss": -5.919743719555083, "global_step": 61235, "epoch": 1457, "val_loss": 61525.10546875} {"train_loss": -5.926836013793945, "global_step": 61236, "epoch": 1458} {"train_loss": -5.902151584625244, "global_step": 61237, "epoch": 1458} {"train_loss": -5.973607063293457, "global_step": 61238, "epoch": 1458} {"train_loss": -5.995171546936035, "global_step": 61239, "epoch": 1458} {"train_loss": -5.844024658203125, "global_step": 61240, "epoch": 1458} {"train_loss": -5.986656665802002, "global_step": 61241, "epoch": 1458} {"train_loss": -6.033797264099121, "global_step": 61242, "epoch": 1458} {"train_loss": -5.889481067657471, "global_step": 61243, "epoch": 1458} {"train_loss": -6.043827056884766, "global_step": 61244, "epoch": 1458} {"train_loss": -5.924686908721924, "global_step": 61245, "epoch": 1458} {"train_loss": -5.96504020690918, "global_step": 61246, "epoch": 1458} {"train_loss": -5.991368770599365, "global_step": 61247, "epoch": 1458} {"train_loss": -5.890247344970703, "global_step": 61248, "epoch": 1458} {"train_loss": -5.807961463928223, "global_step": 61249, "epoch": 1458} {"train_loss": -5.915306091308594, "global_step": 61250, "epoch": 1458} {"train_loss": -5.906403541564941, "global_step": 61251, "epoch": 1458} {"train_loss": -5.910112380981445, "global_step": 61252, "epoch": 1458} {"train_loss": -5.999845504760742, "global_step": 61253, "epoch": 1458} {"train_loss": -5.894453048706055, "global_step": 61254, "epoch": 1458} {"train_loss": -5.959819316864014, "global_step": 61255, "epoch": 1458} {"train_loss": -5.929841995239258, "global_step": 61256, "epoch": 1458} {"train_loss": -5.858019828796387, "global_step": 61257, "epoch": 1458} {"train_loss": -5.923050880432129, "global_step": 61258, "epoch": 1458} {"train_loss": -5.833295822143555, "global_step": 61259, "epoch": 1458} {"train_loss": -5.932328224182129, "global_step": 61260, "epoch": 1458} {"train_loss": -5.981950759887695, "global_step": 61261, "epoch": 1458} {"train_loss": -5.859759330749512, "global_step": 61262, "epoch": 1458} {"train_loss": -5.964112281799316, "global_step": 61263, "epoch": 1458} {"train_loss": -5.932300567626953, "global_step": 61264, "epoch": 1458} {"train_loss": -5.7655158042907715, "global_step": 61265, "epoch": 1458} {"train_loss": -5.8284149169921875, "global_step": 61266, "epoch": 1458} {"train_loss": -5.917840957641602, "global_step": 61267, "epoch": 1458} {"train_loss": -5.881192207336426, "global_step": 61268, "epoch": 1458} {"train_loss": -5.907595634460449, "global_step": 61269, "epoch": 1458} {"train_loss": -5.8769731521606445, "global_step": 61270, "epoch": 1458} {"train_loss": -5.9543232917785645, "global_step": 61271, "epoch": 1458} {"train_loss": -6.012698173522949, "global_step": 61272, "epoch": 1458} {"train_loss": -5.868228912353516, "global_step": 61273, "epoch": 1458} {"train_loss": -5.948910713195801, "global_step": 61274, "epoch": 1458} {"train_loss": -5.986835479736328, "global_step": 61275, "epoch": 1458} {"train_loss": -5.980035305023193, "global_step": 61276, "epoch": 1458} {"train_loss": -5.924866630917504, "global_step": 61277, "epoch": 1458, "val_loss": 61482.69921875} {"train_loss": -5.8795928955078125, "global_step": 61278, "epoch": 1459} {"train_loss": -5.774046897888184, "global_step": 61279, "epoch": 1459} {"train_loss": -5.967744827270508, "global_step": 61280, "epoch": 1459} {"train_loss": -5.939878463745117, "global_step": 61281, "epoch": 1459} {"train_loss": -5.9442949295043945, "global_step": 61282, "epoch": 1459} {"train_loss": -5.959575176239014, "global_step": 61283, "epoch": 1459} {"train_loss": -5.959492206573486, "global_step": 61284, "epoch": 1459} {"train_loss": -5.932551383972168, "global_step": 61285, "epoch": 1459} {"train_loss": -5.856227874755859, "global_step": 61286, "epoch": 1459} {"train_loss": -5.926265239715576, "global_step": 61287, "epoch": 1459} {"train_loss": -5.833441734313965, "global_step": 61288, "epoch": 1459} {"train_loss": -5.998381614685059, "global_step": 61289, "epoch": 1459} {"train_loss": -5.885451316833496, "global_step": 61290, "epoch": 1459} {"train_loss": -5.910213470458984, "global_step": 61291, "epoch": 1459} {"train_loss": -5.974777698516846, "global_step": 61292, "epoch": 1459} {"train_loss": -5.9013519287109375, "global_step": 61293, "epoch": 1459} {"train_loss": -5.941944599151611, "global_step": 61294, "epoch": 1459} {"train_loss": -5.825769424438477, "global_step": 61295, "epoch": 1459} {"train_loss": -5.963168144226074, "global_step": 61296, "epoch": 1459} {"train_loss": -6.056129455566406, "global_step": 61297, "epoch": 1459} {"train_loss": -5.862415313720703, "global_step": 61298, "epoch": 1459} {"train_loss": -5.970902442932129, "global_step": 61299, "epoch": 1459} {"train_loss": -5.998244285583496, "global_step": 61300, "epoch": 1459} {"train_loss": -5.982072353363037, "global_step": 61301, "epoch": 1459} {"train_loss": -5.924137115478516, "global_step": 61302, "epoch": 1459} {"train_loss": -5.919875144958496, "global_step": 61303, "epoch": 1459} {"train_loss": -5.867974281311035, "global_step": 61304, "epoch": 1459} {"train_loss": -5.923952579498291, "global_step": 61305, "epoch": 1459} {"train_loss": -5.9278788566589355, "global_step": 61306, "epoch": 1459} {"train_loss": -5.905119895935059, "global_step": 61307, "epoch": 1459} {"train_loss": -5.926084518432617, "global_step": 61308, "epoch": 1459} {"train_loss": -5.919647216796875, "global_step": 61309, "epoch": 1459} {"train_loss": -5.8770952224731445, "global_step": 61310, "epoch": 1459} {"train_loss": -5.896583557128906, "global_step": 61311, "epoch": 1459} {"train_loss": -5.920670509338379, "global_step": 61312, "epoch": 1459} {"train_loss": -5.94217586517334, "global_step": 61313, "epoch": 1459} {"train_loss": -5.814687252044678, "global_step": 61314, "epoch": 1459} {"train_loss": -5.87445068359375, "global_step": 61315, "epoch": 1459} {"train_loss": -6.019767761230469, "global_step": 61316, "epoch": 1459} {"train_loss": -6.001903057098389, "global_step": 61317, "epoch": 1459} {"train_loss": -5.956442832946777, "global_step": 61318, "epoch": 1459} {"train_loss": -5.92213461512611, "global_step": 61319, "epoch": 1459, "val_loss": 61325.07421875} {"train_loss": -5.877532958984375, "global_step": 61320, "epoch": 1460} {"train_loss": -6.003846645355225, "global_step": 61321, "epoch": 1460} {"train_loss": -5.947934150695801, "global_step": 61322, "epoch": 1460} {"train_loss": -5.810483932495117, "global_step": 61323, "epoch": 1460} {"train_loss": -5.888023376464844, "global_step": 61324, "epoch": 1460} {"train_loss": -5.908979415893555, "global_step": 61325, "epoch": 1460} {"train_loss": -5.994387626647949, "global_step": 61326, "epoch": 1460} {"train_loss": -5.890242099761963, "global_step": 61327, "epoch": 1460} {"train_loss": -5.861831188201904, "global_step": 61328, "epoch": 1460} {"train_loss": -5.930754661560059, "global_step": 61329, "epoch": 1460} {"train_loss": -5.956421375274658, "global_step": 61330, "epoch": 1460} {"train_loss": -5.928855895996094, "global_step": 61331, "epoch": 1460} {"train_loss": -5.954644680023193, "global_step": 61332, "epoch": 1460} {"train_loss": -5.983719825744629, "global_step": 61333, "epoch": 1460} {"train_loss": -5.936989784240723, "global_step": 61334, "epoch": 1460} {"train_loss": -5.943323135375977, "global_step": 61335, "epoch": 1460} {"train_loss": -5.964829444885254, "global_step": 61336, "epoch": 1460} {"train_loss": -5.835902214050293, "global_step": 61337, "epoch": 1460} {"train_loss": -5.874207496643066, "global_step": 61338, "epoch": 1460} {"train_loss": -6.064173698425293, "global_step": 61339, "epoch": 1460} {"train_loss": -6.006143569946289, "global_step": 61340, "epoch": 1460} {"train_loss": -5.961026668548584, "global_step": 61341, "epoch": 1460} {"train_loss": -5.974266052246094, "global_step": 61342, "epoch": 1460} {"train_loss": -5.932345390319824, "global_step": 61343, "epoch": 1460} {"train_loss": -5.910565376281738, "global_step": 61344, "epoch": 1460} {"train_loss": -6.078754425048828, "global_step": 61345, "epoch": 1460} {"train_loss": -5.891022682189941, "global_step": 61346, "epoch": 1460} {"train_loss": -5.9262166023254395, "global_step": 61347, "epoch": 1460} {"train_loss": -6.023928642272949, "global_step": 61348, "epoch": 1460} {"train_loss": -5.922708511352539, "global_step": 61349, "epoch": 1460} {"train_loss": -6.046809196472168, "global_step": 61350, "epoch": 1460} {"train_loss": -6.01716423034668, "global_step": 61351, "epoch": 1460} {"train_loss": -5.936395645141602, "global_step": 61352, "epoch": 1460} {"train_loss": -5.8484086990356445, "global_step": 61353, "epoch": 1460} {"train_loss": -5.840533256530762, "global_step": 61354, "epoch": 1460} {"train_loss": -5.882190704345703, "global_step": 61355, "epoch": 1460} {"train_loss": -5.956775665283203, "global_step": 61356, "epoch": 1460} {"train_loss": -5.93598747253418, "global_step": 61357, "epoch": 1460} {"train_loss": -5.835280895233154, "global_step": 61358, "epoch": 1460} {"train_loss": -5.920795440673828, "global_step": 61359, "epoch": 1460} {"train_loss": -5.959585666656494, "global_step": 61360, "epoch": 1460} {"train_loss": -5.931932846705119, "global_step": 61361, "epoch": 1460, "val_loss": 61543.20703125} {"train_loss": -5.826533317565918, "global_step": 61362, "epoch": 1461} {"train_loss": -5.931487083435059, "global_step": 61363, "epoch": 1461} {"train_loss": -5.944520950317383, "global_step": 61364, "epoch": 1461} {"train_loss": -5.935396194458008, "global_step": 61365, "epoch": 1461} {"train_loss": -5.992633819580078, "global_step": 61366, "epoch": 1461} {"train_loss": -5.8600640296936035, "global_step": 61367, "epoch": 1461} {"train_loss": -5.958967685699463, "global_step": 61368, "epoch": 1461} {"train_loss": -5.8420209884643555, "global_step": 61369, "epoch": 1461} {"train_loss": -5.944278717041016, "global_step": 61370, "epoch": 1461} {"train_loss": -5.999603748321533, "global_step": 61371, "epoch": 1461} {"train_loss": -6.015676021575928, "global_step": 61372, "epoch": 1461} {"train_loss": -5.92390251159668, "global_step": 61373, "epoch": 1461} {"train_loss": -5.9304938316345215, "global_step": 61374, "epoch": 1461} {"train_loss": -5.939535140991211, "global_step": 61375, "epoch": 1461} {"train_loss": -5.840734958648682, "global_step": 61376, "epoch": 1461} {"train_loss": -5.977242946624756, "global_step": 61377, "epoch": 1461} {"train_loss": -5.891747951507568, "global_step": 61378, "epoch": 1461} {"train_loss": -5.768998146057129, "global_step": 61379, "epoch": 1461} {"train_loss": -5.9450602531433105, "global_step": 61380, "epoch": 1461} {"train_loss": -5.917421340942383, "global_step": 61381, "epoch": 1461} {"train_loss": -5.901572227478027, "global_step": 61382, "epoch": 1461} {"train_loss": -5.8040924072265625, "global_step": 61383, "epoch": 1461} {"train_loss": -5.9602155685424805, "global_step": 61384, "epoch": 1461} {"train_loss": -5.854820728302002, "global_step": 61385, "epoch": 1461} {"train_loss": -5.833736419677734, "global_step": 61386, "epoch": 1461} {"train_loss": -5.8382768630981445, "global_step": 61387, "epoch": 1461} {"train_loss": -5.95820426940918, "global_step": 61388, "epoch": 1461} {"train_loss": -5.954314231872559, "global_step": 61389, "epoch": 1461} {"train_loss": -5.873165607452393, "global_step": 61390, "epoch": 1461} {"train_loss": -5.7949347496032715, "global_step": 61391, "epoch": 1461} {"train_loss": -5.8722639083862305, "global_step": 61392, "epoch": 1461} {"train_loss": -5.8925557136535645, "global_step": 61393, "epoch": 1461} {"train_loss": -5.912763595581055, "global_step": 61394, "epoch": 1461} {"train_loss": -5.944760322570801, "global_step": 61395, "epoch": 1461} {"train_loss": -5.803104400634766, "global_step": 61396, "epoch": 1461} {"train_loss": -5.951100826263428, "global_step": 61397, "epoch": 1461} {"train_loss": -5.851193428039551, "global_step": 61398, "epoch": 1461} {"train_loss": -5.895444869995117, "global_step": 61399, "epoch": 1461} {"train_loss": -5.858741283416748, "global_step": 61400, "epoch": 1461} {"train_loss": -6.039233207702637, "global_step": 61401, "epoch": 1461} {"train_loss": -5.918017387390137, "global_step": 61402, "epoch": 1461} {"train_loss": -5.904852061044602, "global_step": 61403, "epoch": 1461, "val_loss": 61214.6171875} {"train_loss": -5.821966171264648, "global_step": 61404, "epoch": 1462} {"train_loss": -5.904313564300537, "global_step": 61405, "epoch": 1462} {"train_loss": -5.853119850158691, "global_step": 61406, "epoch": 1462} {"train_loss": -5.8836350440979, "global_step": 61407, "epoch": 1462} {"train_loss": -5.857326984405518, "global_step": 61408, "epoch": 1462} {"train_loss": -5.9265456199646, "global_step": 61409, "epoch": 1462} {"train_loss": -5.870805740356445, "global_step": 61410, "epoch": 1462} {"train_loss": -5.943459510803223, "global_step": 61411, "epoch": 1462} {"train_loss": -5.8686909675598145, "global_step": 61412, "epoch": 1462} {"train_loss": -5.804385662078857, "global_step": 61413, "epoch": 1462} {"train_loss": -5.971853256225586, "global_step": 61414, "epoch": 1462} {"train_loss": -5.881023406982422, "global_step": 61415, "epoch": 1462} {"train_loss": -5.861137390136719, "global_step": 61416, "epoch": 1462} {"train_loss": -5.7505879402160645, "global_step": 61417, "epoch": 1462} {"train_loss": -5.96323299407959, "global_step": 61418, "epoch": 1462} {"train_loss": -5.958044052124023, "global_step": 61419, "epoch": 1462} {"train_loss": -5.822996139526367, "global_step": 61420, "epoch": 1462} {"train_loss": -5.973170280456543, "global_step": 61421, "epoch": 1462} {"train_loss": -5.799033164978027, "global_step": 61422, "epoch": 1462} {"train_loss": -6.0361104011535645, "global_step": 61423, "epoch": 1462} {"train_loss": -5.811274528503418, "global_step": 61424, "epoch": 1462} {"train_loss": -5.897641181945801, "global_step": 61425, "epoch": 1462} {"train_loss": -5.9503607749938965, "global_step": 61426, "epoch": 1462} {"train_loss": -5.803089618682861, "global_step": 61427, "epoch": 1462} {"train_loss": -5.979806900024414, "global_step": 61428, "epoch": 1462} {"train_loss": -5.987051010131836, "global_step": 61429, "epoch": 1462} {"train_loss": -5.747646331787109, "global_step": 61430, "epoch": 1462} {"train_loss": -5.923315525054932, "global_step": 61431, "epoch": 1462} {"train_loss": -6.017139911651611, "global_step": 61432, "epoch": 1462} {"train_loss": -5.853370666503906, "global_step": 61433, "epoch": 1462} {"train_loss": -5.968079566955566, "global_step": 61434, "epoch": 1462} {"train_loss": -5.945879936218262, "global_step": 61435, "epoch": 1462} {"train_loss": -5.915701866149902, "global_step": 61436, "epoch": 1462} {"train_loss": -6.003664016723633, "global_step": 61437, "epoch": 1462} {"train_loss": -5.9772443771362305, "global_step": 61438, "epoch": 1462} {"train_loss": -6.023911476135254, "global_step": 61439, "epoch": 1462} {"train_loss": -6.099952220916748, "global_step": 61440, "epoch": 1462} {"train_loss": -5.972385406494141, "global_step": 61441, "epoch": 1462} {"train_loss": -6.057435035705566, "global_step": 61442, "epoch": 1462} {"train_loss": -6.0607523918151855, "global_step": 61443, "epoch": 1462} {"train_loss": -5.959575176239014, "global_step": 61444, "epoch": 1462} {"train_loss": -5.920362438474383, "global_step": 61445, "epoch": 1462, "val_loss": 61464.49609375} {"train_loss": -5.888844013214111, "global_step": 61446, "epoch": 1463} {"train_loss": -5.884503364562988, "global_step": 61447, "epoch": 1463} {"train_loss": -6.033263206481934, "global_step": 61448, "epoch": 1463} {"train_loss": -6.022344589233398, "global_step": 61449, "epoch": 1463} {"train_loss": -5.933722972869873, "global_step": 61450, "epoch": 1463} {"train_loss": -5.9315996170043945, "global_step": 61451, "epoch": 1463} {"train_loss": -5.990734100341797, "global_step": 61452, "epoch": 1463} {"train_loss": -6.103194236755371, "global_step": 61453, "epoch": 1463} {"train_loss": -5.7791242599487305, "global_step": 61454, "epoch": 1463} {"train_loss": -5.966740608215332, "global_step": 61455, "epoch": 1463} {"train_loss": -5.979075908660889, "global_step": 61456, "epoch": 1463} {"train_loss": -6.026076316833496, "global_step": 61457, "epoch": 1463} {"train_loss": -5.8787736892700195, "global_step": 61458, "epoch": 1463} {"train_loss": -5.930466651916504, "global_step": 61459, "epoch": 1463} {"train_loss": -5.9088335037231445, "global_step": 61460, "epoch": 1463} {"train_loss": -5.979269981384277, "global_step": 61461, "epoch": 1463} {"train_loss": -6.040963172912598, "global_step": 61462, "epoch": 1463} {"train_loss": -5.824093818664551, "global_step": 61463, "epoch": 1463} {"train_loss": -6.090136528015137, "global_step": 61464, "epoch": 1463} {"train_loss": -5.943709850311279, "global_step": 61465, "epoch": 1463} {"train_loss": -6.007949352264404, "global_step": 61466, "epoch": 1463} {"train_loss": -5.992081642150879, "global_step": 61467, "epoch": 1463} {"train_loss": -5.922292232513428, "global_step": 61468, "epoch": 1463} {"train_loss": -5.831986427307129, "global_step": 61469, "epoch": 1463} {"train_loss": -5.957816123962402, "global_step": 61470, "epoch": 1463} {"train_loss": -5.846343040466309, "global_step": 61471, "epoch": 1463} {"train_loss": -5.965846061706543, "global_step": 61472, "epoch": 1463} {"train_loss": -5.949481010437012, "global_step": 61473, "epoch": 1463} {"train_loss": -5.7558183670043945, "global_step": 61474, "epoch": 1463} {"train_loss": -5.854557037353516, "global_step": 61475, "epoch": 1463} {"train_loss": -5.9677324295043945, "global_step": 61476, "epoch": 1463} {"train_loss": -5.973817825317383, "global_step": 61477, "epoch": 1463} {"train_loss": -5.87805700302124, "global_step": 61478, "epoch": 1463} {"train_loss": -5.951862335205078, "global_step": 61479, "epoch": 1463} {"train_loss": -5.910853862762451, "global_step": 61480, "epoch": 1463} {"train_loss": -5.991327285766602, "global_step": 61481, "epoch": 1463} {"train_loss": -5.799295902252197, "global_step": 61482, "epoch": 1463} {"train_loss": -6.04714822769165, "global_step": 61483, "epoch": 1463} {"train_loss": -5.825424671173096, "global_step": 61484, "epoch": 1463} {"train_loss": -5.890355110168457, "global_step": 61485, "epoch": 1463} {"train_loss": -5.864335060119629, "global_step": 61486, "epoch": 1463} {"train_loss": -5.933795974368141, "global_step": 61487, "epoch": 1463, "val_loss": 61361.890625} {"train_loss": -5.916216850280762, "global_step": 61488, "epoch": 1464} {"train_loss": -5.919898509979248, "global_step": 61489, "epoch": 1464} {"train_loss": -5.998160362243652, "global_step": 61490, "epoch": 1464} {"train_loss": -5.863894462585449, "global_step": 61491, "epoch": 1464} {"train_loss": -5.817270278930664, "global_step": 61492, "epoch": 1464} {"train_loss": -5.732302665710449, "global_step": 61493, "epoch": 1464} {"train_loss": -6.039701461791992, "global_step": 61494, "epoch": 1464} {"train_loss": -5.951066970825195, "global_step": 61495, "epoch": 1464} {"train_loss": -5.986959457397461, "global_step": 61496, "epoch": 1464} {"train_loss": -5.854743957519531, "global_step": 61497, "epoch": 1464} {"train_loss": -6.0091552734375, "global_step": 61498, "epoch": 1464} {"train_loss": -5.855207443237305, "global_step": 61499, "epoch": 1464} {"train_loss": -5.8816986083984375, "global_step": 61500, "epoch": 1464} {"train_loss": -5.88338565826416, "global_step": 61501, "epoch": 1464} {"train_loss": -5.990571975708008, "global_step": 61502, "epoch": 1464} {"train_loss": -5.97663688659668, "global_step": 61503, "epoch": 1464} {"train_loss": -5.896537780761719, "global_step": 61504, "epoch": 1464} {"train_loss": -5.946538925170898, "global_step": 61505, "epoch": 1464} {"train_loss": -5.900544166564941, "global_step": 61506, "epoch": 1464} {"train_loss": -5.987142562866211, "global_step": 61507, "epoch": 1464} {"train_loss": -6.051582336425781, "global_step": 61508, "epoch": 1464} {"train_loss": -5.874380111694336, "global_step": 61509, "epoch": 1464} {"train_loss": -5.948256015777588, "global_step": 61510, "epoch": 1464} {"train_loss": -5.869929313659668, "global_step": 61511, "epoch": 1464} {"train_loss": -5.940121650695801, "global_step": 61512, "epoch": 1464} {"train_loss": -5.89550256729126, "global_step": 61513, "epoch": 1464} {"train_loss": -5.835048198699951, "global_step": 61514, "epoch": 1464} {"train_loss": -5.96826696395874, "global_step": 61515, "epoch": 1464} {"train_loss": -5.8135833740234375, "global_step": 61516, "epoch": 1464} {"train_loss": -5.966795921325684, "global_step": 61517, "epoch": 1464} {"train_loss": -5.958357810974121, "global_step": 61518, "epoch": 1464} {"train_loss": -5.926131248474121, "global_step": 61519, "epoch": 1464} {"train_loss": -5.965631484985352, "global_step": 61520, "epoch": 1464} {"train_loss": -5.960449695587158, "global_step": 61521, "epoch": 1464} {"train_loss": -5.938410758972168, "global_step": 61522, "epoch": 1464} {"train_loss": -5.916844844818115, "global_step": 61523, "epoch": 1464} {"train_loss": -5.959884166717529, "global_step": 61524, "epoch": 1464} {"train_loss": -5.8586955070495605, "global_step": 61525, "epoch": 1464} {"train_loss": -6.011144638061523, "global_step": 61526, "epoch": 1464} {"train_loss": -5.922890663146973, "global_step": 61527, "epoch": 1464} {"train_loss": -5.941559791564941, "global_step": 61528, "epoch": 1464} {"train_loss": -5.925327232905796, "global_step": 61529, "epoch": 1464, "val_loss": 61405.98046875} {"train_loss": -5.897974967956543, "global_step": 61530, "epoch": 1465} {"train_loss": -6.016998291015625, "global_step": 61531, "epoch": 1465} {"train_loss": -5.987651824951172, "global_step": 61532, "epoch": 1465} {"train_loss": -5.960505485534668, "global_step": 61533, "epoch": 1465} {"train_loss": -6.004723072052002, "global_step": 61534, "epoch": 1465} {"train_loss": -5.862761497497559, "global_step": 61535, "epoch": 1465} {"train_loss": -5.862959384918213, "global_step": 61536, "epoch": 1465} {"train_loss": -5.886602401733398, "global_step": 61537, "epoch": 1465} {"train_loss": -5.955196857452393, "global_step": 61538, "epoch": 1465} {"train_loss": -5.986299991607666, "global_step": 61539, "epoch": 1465} {"train_loss": -5.890010833740234, "global_step": 61540, "epoch": 1465} {"train_loss": -5.912486553192139, "global_step": 61541, "epoch": 1465} {"train_loss": -5.869394302368164, "global_step": 61542, "epoch": 1465} {"train_loss": -5.798336982727051, "global_step": 61543, "epoch": 1465} {"train_loss": -5.995129585266113, "global_step": 61544, "epoch": 1465} {"train_loss": -6.052059173583984, "global_step": 61545, "epoch": 1465} {"train_loss": -5.96665620803833, "global_step": 61546, "epoch": 1465} {"train_loss": -5.835041046142578, "global_step": 61547, "epoch": 1465} {"train_loss": -5.933819770812988, "global_step": 61548, "epoch": 1465} {"train_loss": -5.881608963012695, "global_step": 61549, "epoch": 1465} {"train_loss": -5.967942237854004, "global_step": 61550, "epoch": 1465} {"train_loss": -5.911524772644043, "global_step": 61551, "epoch": 1465} {"train_loss": -6.009430408477783, "global_step": 61552, "epoch": 1465} {"train_loss": -5.966358184814453, "global_step": 61553, "epoch": 1465} {"train_loss": -5.917576789855957, "global_step": 61554, "epoch": 1465} {"train_loss": -5.845193862915039, "global_step": 61555, "epoch": 1465} {"train_loss": -5.888584613800049, "global_step": 61556, "epoch": 1465} {"train_loss": -5.896722316741943, "global_step": 61557, "epoch": 1465} {"train_loss": -5.998675346374512, "global_step": 61558, "epoch": 1465} {"train_loss": -5.8869404792785645, "global_step": 61559, "epoch": 1465} {"train_loss": -6.0111165046691895, "global_step": 61560, "epoch": 1465} {"train_loss": -5.906822204589844, "global_step": 61561, "epoch": 1465} {"train_loss": -6.071928977966309, "global_step": 61562, "epoch": 1465} {"train_loss": -5.931790351867676, "global_step": 61563, "epoch": 1465} {"train_loss": -6.016558647155762, "global_step": 61564, "epoch": 1465} {"train_loss": -5.96716833114624, "global_step": 61565, "epoch": 1465} {"train_loss": -5.997703552246094, "global_step": 61566, "epoch": 1465} {"train_loss": -5.981727123260498, "global_step": 61567, "epoch": 1465} {"train_loss": -5.91378116607666, "global_step": 61568, "epoch": 1465} {"train_loss": -5.84713888168335, "global_step": 61569, "epoch": 1465} {"train_loss": -5.879363059997559, "global_step": 61570, "epoch": 1465} {"train_loss": -5.9367352440243675, "global_step": 61571, "epoch": 1465, "val_loss": 61274.296875} {"train_loss": -5.816236972808838, "global_step": 61572, "epoch": 1466} {"train_loss": -5.895686626434326, "global_step": 61573, "epoch": 1466} {"train_loss": -5.882468223571777, "global_step": 61574, "epoch": 1466} {"train_loss": -6.032233238220215, "global_step": 61575, "epoch": 1466} {"train_loss": -5.868917942047119, "global_step": 61576, "epoch": 1466} {"train_loss": -6.031375885009766, "global_step": 61577, "epoch": 1466} {"train_loss": -5.89501953125, "global_step": 61578, "epoch": 1466} {"train_loss": -5.836226940155029, "global_step": 61579, "epoch": 1466} {"train_loss": -5.79024600982666, "global_step": 61580, "epoch": 1466} {"train_loss": -5.875682830810547, "global_step": 61581, "epoch": 1466} {"train_loss": -5.9051008224487305, "global_step": 61582, "epoch": 1466} {"train_loss": -5.974849700927734, "global_step": 61583, "epoch": 1466} {"train_loss": -5.828941822052002, "global_step": 61584, "epoch": 1466} {"train_loss": -5.851390361785889, "global_step": 61585, "epoch": 1466} {"train_loss": -5.805440902709961, "global_step": 61586, "epoch": 1466} {"train_loss": -5.926609992980957, "global_step": 61587, "epoch": 1466} {"train_loss": -5.798249244689941, "global_step": 61588, "epoch": 1466} {"train_loss": -5.831284046173096, "global_step": 61589, "epoch": 1466} {"train_loss": -5.741628170013428, "global_step": 61590, "epoch": 1466} {"train_loss": -5.627597808837891, "global_step": 61591, "epoch": 1466} {"train_loss": -5.853632926940918, "global_step": 61592, "epoch": 1466} {"train_loss": -5.810308933258057, "global_step": 61593, "epoch": 1466} {"train_loss": -5.952408313751221, "global_step": 61594, "epoch": 1466} {"train_loss": -5.8557634353637695, "global_step": 61595, "epoch": 1466} {"train_loss": -5.854820251464844, "global_step": 61596, "epoch": 1466} {"train_loss": -5.94313383102417, "global_step": 61597, "epoch": 1466} {"train_loss": -5.83508825302124, "global_step": 61598, "epoch": 1466} {"train_loss": -5.836555480957031, "global_step": 61599, "epoch": 1466} {"train_loss": -5.814939498901367, "global_step": 61600, "epoch": 1466} {"train_loss": -5.944493770599365, "global_step": 61601, "epoch": 1466} {"train_loss": -5.892772197723389, "global_step": 61602, "epoch": 1466} {"train_loss": -5.977412700653076, "global_step": 61603, "epoch": 1466} {"train_loss": -5.7836151123046875, "global_step": 61604, "epoch": 1466} {"train_loss": -5.955997943878174, "global_step": 61605, "epoch": 1466} {"train_loss": -5.884463787078857, "global_step": 61606, "epoch": 1466} {"train_loss": -5.857170104980469, "global_step": 61607, "epoch": 1466} {"train_loss": -5.809116363525391, "global_step": 61608, "epoch": 1466} {"train_loss": -5.929965496063232, "global_step": 61609, "epoch": 1466} {"train_loss": -5.907674789428711, "global_step": 61610, "epoch": 1466} {"train_loss": -5.900019645690918, "global_step": 61611, "epoch": 1466} {"train_loss": -5.900979995727539, "global_step": 61612, "epoch": 1466} {"train_loss": -5.871394191469465, "global_step": 61613, "epoch": 1466, "val_loss": 61408.87890625} {"train_loss": -6.003742218017578, "global_step": 61614, "epoch": 1467} {"train_loss": -5.801129341125488, "global_step": 61615, "epoch": 1467} {"train_loss": -5.965735912322998, "global_step": 61616, "epoch": 1467} {"train_loss": -5.879664421081543, "global_step": 61617, "epoch": 1467} {"train_loss": -5.929052352905273, "global_step": 61618, "epoch": 1467} {"train_loss": -5.869220733642578, "global_step": 61619, "epoch": 1467} {"train_loss": -6.016681671142578, "global_step": 61620, "epoch": 1467} {"train_loss": -5.979423522949219, "global_step": 61621, "epoch": 1467} {"train_loss": -5.939672470092773, "global_step": 61622, "epoch": 1467} {"train_loss": -5.997152328491211, "global_step": 61623, "epoch": 1467} {"train_loss": -5.843720436096191, "global_step": 61624, "epoch": 1467} {"train_loss": -5.914431095123291, "global_step": 61625, "epoch": 1467} {"train_loss": -5.994361877441406, "global_step": 61626, "epoch": 1467} {"train_loss": -5.876302719116211, "global_step": 61627, "epoch": 1467} {"train_loss": -5.9353718757629395, "global_step": 61628, "epoch": 1467} {"train_loss": -5.945771217346191, "global_step": 61629, "epoch": 1467} {"train_loss": -5.959444999694824, "global_step": 61630, "epoch": 1467} {"train_loss": -5.839461803436279, "global_step": 61631, "epoch": 1467} {"train_loss": -5.958518028259277, "global_step": 61632, "epoch": 1467} {"train_loss": -5.928624153137207, "global_step": 61633, "epoch": 1467} {"train_loss": -5.9194488525390625, "global_step": 61634, "epoch": 1467} {"train_loss": -5.876707077026367, "global_step": 61635, "epoch": 1467} {"train_loss": -5.932380199432373, "global_step": 61636, "epoch": 1467} {"train_loss": -5.819986343383789, "global_step": 61637, "epoch": 1467} {"train_loss": -5.971765995025635, "global_step": 61638, "epoch": 1467} {"train_loss": -5.861713409423828, "global_step": 61639, "epoch": 1467} {"train_loss": -5.875030040740967, "global_step": 61640, "epoch": 1467} {"train_loss": -5.968581199645996, "global_step": 61641, "epoch": 1467} {"train_loss": -5.786055564880371, "global_step": 61642, "epoch": 1467} {"train_loss": -5.916595458984375, "global_step": 61643, "epoch": 1467} {"train_loss": -5.993255615234375, "global_step": 61644, "epoch": 1467} {"train_loss": -5.894425868988037, "global_step": 61645, "epoch": 1467} {"train_loss": -6.02585506439209, "global_step": 61646, "epoch": 1467} {"train_loss": -5.9844069480896, "global_step": 61647, "epoch": 1467} {"train_loss": -5.825477600097656, "global_step": 61648, "epoch": 1467} {"train_loss": -5.922746181488037, "global_step": 61649, "epoch": 1467} {"train_loss": -5.856112003326416, "global_step": 61650, "epoch": 1467} {"train_loss": -5.891002655029297, "global_step": 61651, "epoch": 1467} {"train_loss": -6.042209625244141, "global_step": 61652, "epoch": 1467} {"train_loss": -5.863222122192383, "global_step": 61653, "epoch": 1467} {"train_loss": -5.957503318786621, "global_step": 61654, "epoch": 1467} {"train_loss": -5.920214596248808, "global_step": 61655, "epoch": 1467, "val_loss": 61233.5703125} {"train_loss": -5.985989093780518, "global_step": 61656, "epoch": 1468} {"train_loss": -5.9516282081604, "global_step": 61657, "epoch": 1468} {"train_loss": -6.009127616882324, "global_step": 61658, "epoch": 1468} {"train_loss": -6.036185264587402, "global_step": 61659, "epoch": 1468} {"train_loss": -5.886605739593506, "global_step": 61660, "epoch": 1468} {"train_loss": -5.894073009490967, "global_step": 61661, "epoch": 1468} {"train_loss": -6.028141975402832, "global_step": 61662, "epoch": 1468} {"train_loss": -6.087045192718506, "global_step": 61663, "epoch": 1468} {"train_loss": -5.942710876464844, "global_step": 61664, "epoch": 1468} {"train_loss": -5.874401092529297, "global_step": 61665, "epoch": 1468} {"train_loss": -5.931955814361572, "global_step": 61666, "epoch": 1468} {"train_loss": -5.923489093780518, "global_step": 61667, "epoch": 1468} {"train_loss": -5.88746452331543, "global_step": 61668, "epoch": 1468} {"train_loss": -5.8476152420043945, "global_step": 61669, "epoch": 1468} {"train_loss": -5.83928108215332, "global_step": 61670, "epoch": 1468} {"train_loss": -5.99708890914917, "global_step": 61671, "epoch": 1468} {"train_loss": -5.913029670715332, "global_step": 61672, "epoch": 1468} {"train_loss": -5.988198757171631, "global_step": 61673, "epoch": 1468} {"train_loss": -5.977267265319824, "global_step": 61674, "epoch": 1468} {"train_loss": -6.057224750518799, "global_step": 61675, "epoch": 1468} {"train_loss": -5.864610195159912, "global_step": 61676, "epoch": 1468} {"train_loss": -5.84694766998291, "global_step": 61677, "epoch": 1468} {"train_loss": -5.943330764770508, "global_step": 61678, "epoch": 1468} {"train_loss": -6.053668975830078, "global_step": 61679, "epoch": 1468} {"train_loss": -5.926260948181152, "global_step": 61680, "epoch": 1468} {"train_loss": -5.85294246673584, "global_step": 61681, "epoch": 1468} {"train_loss": -5.912897109985352, "global_step": 61682, "epoch": 1468} {"train_loss": -5.983846664428711, "global_step": 61683, "epoch": 1468} {"train_loss": -5.8486647605896, "global_step": 61684, "epoch": 1468} {"train_loss": -5.952454566955566, "global_step": 61685, "epoch": 1468} {"train_loss": -5.8937225341796875, "global_step": 61686, "epoch": 1468} {"train_loss": -5.828423976898193, "global_step": 61687, "epoch": 1468} {"train_loss": -5.83554744720459, "global_step": 61688, "epoch": 1468} {"train_loss": -5.748671054840088, "global_step": 61689, "epoch": 1468} {"train_loss": -6.0543670654296875, "global_step": 61690, "epoch": 1468} {"train_loss": -5.871999740600586, "global_step": 61691, "epoch": 1468} {"train_loss": -5.971954345703125, "global_step": 61692, "epoch": 1468} {"train_loss": -5.958927631378174, "global_step": 61693, "epoch": 1468} {"train_loss": -5.872984886169434, "global_step": 61694, "epoch": 1468} {"train_loss": -5.810225963592529, "global_step": 61695, "epoch": 1468} {"train_loss": -5.892847061157227, "global_step": 61696, "epoch": 1468} {"train_loss": -5.92765846706572, "global_step": 61697, "epoch": 1468, "val_loss": 61314.41796875} {"train_loss": -5.932345867156982, "global_step": 61698, "epoch": 1469} {"train_loss": -5.976294994354248, "global_step": 61699, "epoch": 1469} {"train_loss": -5.901971817016602, "global_step": 61700, "epoch": 1469} {"train_loss": -5.876717567443848, "global_step": 61701, "epoch": 1469} {"train_loss": -5.946150779724121, "global_step": 61702, "epoch": 1469} {"train_loss": -5.9135637283325195, "global_step": 61703, "epoch": 1469} {"train_loss": -5.936829566955566, "global_step": 61704, "epoch": 1469} {"train_loss": -5.890081405639648, "global_step": 61705, "epoch": 1469} {"train_loss": -5.861418724060059, "global_step": 61706, "epoch": 1469} {"train_loss": -5.907694339752197, "global_step": 61707, "epoch": 1469} {"train_loss": -5.987306594848633, "global_step": 61708, "epoch": 1469} {"train_loss": -5.83272647857666, "global_step": 61709, "epoch": 1469} {"train_loss": -5.948354721069336, "global_step": 61710, "epoch": 1469} {"train_loss": -5.934850692749023, "global_step": 61711, "epoch": 1469} {"train_loss": -5.871781349182129, "global_step": 61712, "epoch": 1469} {"train_loss": -5.958291053771973, "global_step": 61713, "epoch": 1469} {"train_loss": -5.854424476623535, "global_step": 61714, "epoch": 1469} {"train_loss": -5.7746052742004395, "global_step": 61715, "epoch": 1469} {"train_loss": -5.94285774230957, "global_step": 61716, "epoch": 1469} {"train_loss": -5.900364398956299, "global_step": 61717, "epoch": 1469} {"train_loss": -5.804966449737549, "global_step": 61718, "epoch": 1469} {"train_loss": -6.002303123474121, "global_step": 61719, "epoch": 1469} {"train_loss": -5.936840057373047, "global_step": 61720, "epoch": 1469} {"train_loss": -5.864401340484619, "global_step": 61721, "epoch": 1469} {"train_loss": -5.853328704833984, "global_step": 61722, "epoch": 1469} {"train_loss": -5.802294731140137, "global_step": 61723, "epoch": 1469} {"train_loss": -5.880268096923828, "global_step": 61724, "epoch": 1469} {"train_loss": -5.953875541687012, "global_step": 61725, "epoch": 1469} {"train_loss": -5.894262790679932, "global_step": 61726, "epoch": 1469} {"train_loss": -6.058541774749756, "global_step": 61727, "epoch": 1469} {"train_loss": -5.866361618041992, "global_step": 61728, "epoch": 1469} {"train_loss": -5.88134765625, "global_step": 61729, "epoch": 1469} {"train_loss": -5.978513717651367, "global_step": 61730, "epoch": 1469} {"train_loss": -5.807723522186279, "global_step": 61731, "epoch": 1469} {"train_loss": -6.009965419769287, "global_step": 61732, "epoch": 1469} {"train_loss": -5.752427101135254, "global_step": 61733, "epoch": 1469} {"train_loss": -5.991076469421387, "global_step": 61734, "epoch": 1469} {"train_loss": -5.96201229095459, "global_step": 61735, "epoch": 1469} {"train_loss": -5.898882865905762, "global_step": 61736, "epoch": 1469} {"train_loss": -5.936221122741699, "global_step": 61737, "epoch": 1469} {"train_loss": -5.842993259429932, "global_step": 61738, "epoch": 1469} {"train_loss": -5.907332091104417, "global_step": 61739, "epoch": 1469, "val_loss": 61573.39453125} {"train_loss": -5.920360565185547, "global_step": 61740, "epoch": 1470} {"train_loss": -5.874658584594727, "global_step": 61741, "epoch": 1470} {"train_loss": -5.935342788696289, "global_step": 61742, "epoch": 1470} {"train_loss": -5.95271110534668, "global_step": 61743, "epoch": 1470} {"train_loss": -5.921945571899414, "global_step": 61744, "epoch": 1470} {"train_loss": -5.988221168518066, "global_step": 61745, "epoch": 1470} {"train_loss": -6.019505023956299, "global_step": 61746, "epoch": 1470} {"train_loss": -5.996551513671875, "global_step": 61747, "epoch": 1470} {"train_loss": -5.864008903503418, "global_step": 61748, "epoch": 1470} {"train_loss": -5.907110691070557, "global_step": 61749, "epoch": 1470} {"train_loss": -5.95997428894043, "global_step": 61750, "epoch": 1470} {"train_loss": -5.9397172927856445, "global_step": 61751, "epoch": 1470} {"train_loss": -5.939567565917969, "global_step": 61752, "epoch": 1470} {"train_loss": -5.927362442016602, "global_step": 61753, "epoch": 1470} {"train_loss": -5.836302757263184, "global_step": 61754, "epoch": 1470} {"train_loss": -5.909767150878906, "global_step": 61755, "epoch": 1470} {"train_loss": -5.910512924194336, "global_step": 61756, "epoch": 1470} {"train_loss": -5.927456855773926, "global_step": 61757, "epoch": 1470} {"train_loss": -5.892474174499512, "global_step": 61758, "epoch": 1470} {"train_loss": -5.886903762817383, "global_step": 61759, "epoch": 1470} {"train_loss": -5.969964981079102, "global_step": 61760, "epoch": 1470} {"train_loss": -5.898094654083252, "global_step": 61761, "epoch": 1470} {"train_loss": -5.900615692138672, "global_step": 61762, "epoch": 1470} {"train_loss": -5.9462995529174805, "global_step": 61763, "epoch": 1470} {"train_loss": -5.956974029541016, "global_step": 61764, "epoch": 1470} {"train_loss": -5.853804588317871, "global_step": 61765, "epoch": 1470} {"train_loss": -5.895721435546875, "global_step": 61766, "epoch": 1470} {"train_loss": -6.006917476654053, "global_step": 61767, "epoch": 1470} {"train_loss": -5.778466701507568, "global_step": 61768, "epoch": 1470} {"train_loss": -6.0123291015625, "global_step": 61769, "epoch": 1470} {"train_loss": -5.940027236938477, "global_step": 61770, "epoch": 1470} {"train_loss": -5.9500226974487305, "global_step": 61771, "epoch": 1470} {"train_loss": -5.927945137023926, "global_step": 61772, "epoch": 1470} {"train_loss": -6.016147613525391, "global_step": 61773, "epoch": 1470} {"train_loss": -6.0232462882995605, "global_step": 61774, "epoch": 1470} {"train_loss": -5.886862754821777, "global_step": 61775, "epoch": 1470} {"train_loss": -6.022722244262695, "global_step": 61776, "epoch": 1470} {"train_loss": -5.84007453918457, "global_step": 61777, "epoch": 1470} {"train_loss": -5.879935264587402, "global_step": 61778, "epoch": 1470} {"train_loss": -5.974071979522705, "global_step": 61779, "epoch": 1470} {"train_loss": -5.942755222320557, "global_step": 61780, "epoch": 1470} {"train_loss": -5.927520206996372, "global_step": 61781, "epoch": 1470, "val_loss": 61439.70703125} {"train_loss": -5.918241500854492, "global_step": 61782, "epoch": 1471} {"train_loss": -5.962066650390625, "global_step": 61783, "epoch": 1471} {"train_loss": -6.004281044006348, "global_step": 61784, "epoch": 1471} {"train_loss": -5.944817543029785, "global_step": 61785, "epoch": 1471} {"train_loss": -5.943613529205322, "global_step": 61786, "epoch": 1471} {"train_loss": -5.989882469177246, "global_step": 61787, "epoch": 1471} {"train_loss": -5.799145221710205, "global_step": 61788, "epoch": 1471} {"train_loss": -5.964859962463379, "global_step": 61789, "epoch": 1471} {"train_loss": -5.887764930725098, "global_step": 61790, "epoch": 1471} {"train_loss": -6.040871620178223, "global_step": 61791, "epoch": 1471} {"train_loss": -5.905328750610352, "global_step": 61792, "epoch": 1471} {"train_loss": -5.975406169891357, "global_step": 61793, "epoch": 1471} {"train_loss": -6.108184814453125, "global_step": 61794, "epoch": 1471} {"train_loss": -5.909124851226807, "global_step": 61795, "epoch": 1471} {"train_loss": -6.008212566375732, "global_step": 61796, "epoch": 1471} {"train_loss": -5.945833683013916, "global_step": 61797, "epoch": 1471} {"train_loss": -5.836411952972412, "global_step": 61798, "epoch": 1471} {"train_loss": -5.834005832672119, "global_step": 61799, "epoch": 1471} {"train_loss": -6.0568437576293945, "global_step": 61800, "epoch": 1471} {"train_loss": -5.868203639984131, "global_step": 61801, "epoch": 1471} {"train_loss": -5.961407661437988, "global_step": 61802, "epoch": 1471} {"train_loss": -5.892584800720215, "global_step": 61803, "epoch": 1471} {"train_loss": -5.86033821105957, "global_step": 61804, "epoch": 1471} {"train_loss": -5.967219352722168, "global_step": 61805, "epoch": 1471} {"train_loss": -5.9343976974487305, "global_step": 61806, "epoch": 1471} {"train_loss": -5.784144401550293, "global_step": 61807, "epoch": 1471} {"train_loss": -5.934279918670654, "global_step": 61808, "epoch": 1471} {"train_loss": -5.956937313079834, "global_step": 61809, "epoch": 1471} {"train_loss": -5.938318729400635, "global_step": 61810, "epoch": 1471} {"train_loss": -5.913242816925049, "global_step": 61811, "epoch": 1471} {"train_loss": -6.130347728729248, "global_step": 61812, "epoch": 1471} {"train_loss": -6.025873184204102, "global_step": 61813, "epoch": 1471} {"train_loss": -5.920044898986816, "global_step": 61814, "epoch": 1471} {"train_loss": -5.952034950256348, "global_step": 61815, "epoch": 1471} {"train_loss": -5.850822925567627, "global_step": 61816, "epoch": 1471} {"train_loss": -6.028738498687744, "global_step": 61817, "epoch": 1471} {"train_loss": -5.960247039794922, "global_step": 61818, "epoch": 1471} {"train_loss": -5.820809364318848, "global_step": 61819, "epoch": 1471} {"train_loss": -5.888980865478516, "global_step": 61820, "epoch": 1471} {"train_loss": -5.847906112670898, "global_step": 61821, "epoch": 1471} {"train_loss": -5.800721168518066, "global_step": 61822, "epoch": 1471} {"train_loss": -5.927893536431449, "global_step": 61823, "epoch": 1471, "val_loss": 61898.7421875} {"train_loss": -5.7714972496032715, "global_step": 61824, "epoch": 1472} {"train_loss": -5.864974498748779, "global_step": 61825, "epoch": 1472} {"train_loss": -5.88559627532959, "global_step": 61826, "epoch": 1472} {"train_loss": -5.826195240020752, "global_step": 61827, "epoch": 1472} {"train_loss": -5.993457794189453, "global_step": 61828, "epoch": 1472} {"train_loss": -5.910981178283691, "global_step": 61829, "epoch": 1472} {"train_loss": -5.90651273727417, "global_step": 61830, "epoch": 1472} {"train_loss": -5.980786323547363, "global_step": 61831, "epoch": 1472} {"train_loss": -6.004132270812988, "global_step": 61832, "epoch": 1472} {"train_loss": -5.974244117736816, "global_step": 61833, "epoch": 1472} {"train_loss": -5.905411720275879, "global_step": 61834, "epoch": 1472} {"train_loss": -5.881051063537598, "global_step": 61835, "epoch": 1472} {"train_loss": -5.861695766448975, "global_step": 61836, "epoch": 1472} {"train_loss": -5.804445266723633, "global_step": 61837, "epoch": 1472} {"train_loss": -5.997724533081055, "global_step": 61838, "epoch": 1472} {"train_loss": -5.799832344055176, "global_step": 61839, "epoch": 1472} {"train_loss": -5.919624328613281, "global_step": 61840, "epoch": 1472} {"train_loss": -6.052650451660156, "global_step": 61841, "epoch": 1472} {"train_loss": -5.8608222007751465, "global_step": 61842, "epoch": 1472} {"train_loss": -5.856341361999512, "global_step": 61843, "epoch": 1472} {"train_loss": -6.0472283363342285, "global_step": 61844, "epoch": 1472} {"train_loss": -5.855701446533203, "global_step": 61845, "epoch": 1472} {"train_loss": -5.954198360443115, "global_step": 61846, "epoch": 1472} {"train_loss": -5.938040733337402, "global_step": 61847, "epoch": 1472} {"train_loss": -6.041613578796387, "global_step": 61848, "epoch": 1472} {"train_loss": -5.938839912414551, "global_step": 61849, "epoch": 1472} {"train_loss": -5.780422687530518, "global_step": 61850, "epoch": 1472} {"train_loss": -5.931554794311523, "global_step": 61851, "epoch": 1472} {"train_loss": -5.899659633636475, "global_step": 61852, "epoch": 1472} {"train_loss": -5.8873138427734375, "global_step": 61853, "epoch": 1472} {"train_loss": -5.871125221252441, "global_step": 61854, "epoch": 1472} {"train_loss": -6.0092291831970215, "global_step": 61855, "epoch": 1472} {"train_loss": -5.964520454406738, "global_step": 61856, "epoch": 1472} {"train_loss": -5.829771041870117, "global_step": 61857, "epoch": 1472} {"train_loss": -5.822803020477295, "global_step": 61858, "epoch": 1472} {"train_loss": -5.881191730499268, "global_step": 61859, "epoch": 1472} {"train_loss": -5.886803150177002, "global_step": 61860, "epoch": 1472} {"train_loss": -5.981426239013672, "global_step": 61861, "epoch": 1472} {"train_loss": -5.879877090454102, "global_step": 61862, "epoch": 1472} {"train_loss": -5.782375335693359, "global_step": 61863, "epoch": 1472} {"train_loss": -5.915760040283203, "global_step": 61864, "epoch": 1472} {"train_loss": -5.908632641746884, "global_step": 61865, "epoch": 1472, "val_loss": 61525.45703125} {"train_loss": -5.864012718200684, "global_step": 61866, "epoch": 1473} {"train_loss": -5.951087951660156, "global_step": 61867, "epoch": 1473} {"train_loss": -5.865549087524414, "global_step": 61868, "epoch": 1473} {"train_loss": -5.844325542449951, "global_step": 61869, "epoch": 1473} {"train_loss": -5.907532215118408, "global_step": 61870, "epoch": 1473} {"train_loss": -5.920388698577881, "global_step": 61871, "epoch": 1473} {"train_loss": -5.956263542175293, "global_step": 61872, "epoch": 1473} {"train_loss": -5.945060729980469, "global_step": 61873, "epoch": 1473} {"train_loss": -5.885326385498047, "global_step": 61874, "epoch": 1473} {"train_loss": -5.920350074768066, "global_step": 61875, "epoch": 1473} {"train_loss": -5.852836608886719, "global_step": 61876, "epoch": 1473} {"train_loss": -6.067858695983887, "global_step": 61877, "epoch": 1473} {"train_loss": -5.9835734367370605, "global_step": 61878, "epoch": 1473} {"train_loss": -6.030313491821289, "global_step": 61879, "epoch": 1473} {"train_loss": -5.884913921356201, "global_step": 61880, "epoch": 1473} {"train_loss": -5.782122611999512, "global_step": 61881, "epoch": 1473} {"train_loss": -5.918100357055664, "global_step": 61882, "epoch": 1473} {"train_loss": -5.882117748260498, "global_step": 61883, "epoch": 1473} {"train_loss": -5.983687877655029, "global_step": 61884, "epoch": 1473} {"train_loss": -5.904748916625977, "global_step": 61885, "epoch": 1473} {"train_loss": -5.958859443664551, "global_step": 61886, "epoch": 1473} {"train_loss": -5.950568199157715, "global_step": 61887, "epoch": 1473} {"train_loss": -5.948808193206787, "global_step": 61888, "epoch": 1473} {"train_loss": -5.883365154266357, "global_step": 61889, "epoch": 1473} {"train_loss": -5.821300983428955, "global_step": 61890, "epoch": 1473} {"train_loss": -5.934744834899902, "global_step": 61891, "epoch": 1473} {"train_loss": -5.981193542480469, "global_step": 61892, "epoch": 1473} {"train_loss": -5.929765224456787, "global_step": 61893, "epoch": 1473} {"train_loss": -5.974366188049316, "global_step": 61894, "epoch": 1473} {"train_loss": -6.062743186950684, "global_step": 61895, "epoch": 1473} {"train_loss": -5.915472984313965, "global_step": 61896, "epoch": 1473} {"train_loss": -6.096120834350586, "global_step": 61897, "epoch": 1473} {"train_loss": -5.974150657653809, "global_step": 61898, "epoch": 1473} {"train_loss": -5.892359733581543, "global_step": 61899, "epoch": 1473} {"train_loss": -6.014080047607422, "global_step": 61900, "epoch": 1473} {"train_loss": -5.832124710083008, "global_step": 61901, "epoch": 1473} {"train_loss": -5.987077713012695, "global_step": 61902, "epoch": 1473} {"train_loss": -5.840146064758301, "global_step": 61903, "epoch": 1473} {"train_loss": -5.856964111328125, "global_step": 61904, "epoch": 1473} {"train_loss": -6.073185443878174, "global_step": 61905, "epoch": 1473} {"train_loss": -5.900979995727539, "global_step": 61906, "epoch": 1473} {"train_loss": -5.927316779182071, "global_step": 61907, "epoch": 1473, "val_loss": 61176.8359375} {"train_loss": -5.986570358276367, "global_step": 61908, "epoch": 1474} {"train_loss": -5.863102912902832, "global_step": 61909, "epoch": 1474} {"train_loss": -6.022441387176514, "global_step": 61910, "epoch": 1474} {"train_loss": -5.948114395141602, "global_step": 61911, "epoch": 1474} {"train_loss": -5.883177757263184, "global_step": 61912, "epoch": 1474} {"train_loss": -5.978274822235107, "global_step": 61913, "epoch": 1474} {"train_loss": -5.841224670410156, "global_step": 61914, "epoch": 1474} {"train_loss": -5.896349906921387, "global_step": 61915, "epoch": 1474} {"train_loss": -5.983996391296387, "global_step": 61916, "epoch": 1474} {"train_loss": -6.047828197479248, "global_step": 61917, "epoch": 1474} {"train_loss": -5.921149253845215, "global_step": 61918, "epoch": 1474} {"train_loss": -5.920015335083008, "global_step": 61919, "epoch": 1474} {"train_loss": -6.0370283126831055, "global_step": 61920, "epoch": 1474} {"train_loss": -5.837623596191406, "global_step": 61921, "epoch": 1474} {"train_loss": -5.969783306121826, "global_step": 61922, "epoch": 1474} {"train_loss": -5.954288482666016, "global_step": 61923, "epoch": 1474} {"train_loss": -5.982470512390137, "global_step": 61924, "epoch": 1474} {"train_loss": -5.968988418579102, "global_step": 61925, "epoch": 1474} {"train_loss": -5.882548809051514, "global_step": 61926, "epoch": 1474} {"train_loss": -5.853362083435059, "global_step": 61927, "epoch": 1474} {"train_loss": -5.914340972900391, "global_step": 61928, "epoch": 1474} {"train_loss": -5.859780311584473, "global_step": 61929, "epoch": 1474} {"train_loss": -5.909344673156738, "global_step": 61930, "epoch": 1474} {"train_loss": -5.893218994140625, "global_step": 61931, "epoch": 1474} {"train_loss": -5.933650016784668, "global_step": 61932, "epoch": 1474} {"train_loss": -5.885025978088379, "global_step": 61933, "epoch": 1474} {"train_loss": -6.075026512145996, "global_step": 61934, "epoch": 1474} {"train_loss": -5.953557968139648, "global_step": 61935, "epoch": 1474} {"train_loss": -5.905771255493164, "global_step": 61936, "epoch": 1474} {"train_loss": -6.105403423309326, "global_step": 61937, "epoch": 1474} {"train_loss": -5.882245063781738, "global_step": 61938, "epoch": 1474} {"train_loss": -5.832008361816406, "global_step": 61939, "epoch": 1474} {"train_loss": -5.897767066955566, "global_step": 61940, "epoch": 1474} {"train_loss": -6.05290412902832, "global_step": 61941, "epoch": 1474} {"train_loss": -6.039654731750488, "global_step": 61942, "epoch": 1474} {"train_loss": -6.011877059936523, "global_step": 61943, "epoch": 1474} {"train_loss": -5.865231037139893, "global_step": 61944, "epoch": 1474} {"train_loss": -6.008837699890137, "global_step": 61945, "epoch": 1474} {"train_loss": -5.890445709228516, "global_step": 61946, "epoch": 1474} {"train_loss": -5.955153942108154, "global_step": 61947, "epoch": 1474} {"train_loss": -6.023836612701416, "global_step": 61948, "epoch": 1474} {"train_loss": -5.940656718753633, "global_step": 61949, "epoch": 1474, "val_loss": 61666.55078125} {"train_loss": -5.865594863891602, "global_step": 61950, "epoch": 1475} {"train_loss": -5.978263854980469, "global_step": 61951, "epoch": 1475} {"train_loss": -5.868093967437744, "global_step": 61952, "epoch": 1475} {"train_loss": -5.933341026306152, "global_step": 61953, "epoch": 1475} {"train_loss": -5.884030342102051, "global_step": 61954, "epoch": 1475} {"train_loss": -5.806396484375, "global_step": 61955, "epoch": 1475} {"train_loss": -5.8730034828186035, "global_step": 61956, "epoch": 1475} {"train_loss": -5.6825761795043945, "global_step": 61957, "epoch": 1475} {"train_loss": -5.814240455627441, "global_step": 61958, "epoch": 1475} {"train_loss": -5.694361209869385, "global_step": 61959, "epoch": 1475} {"train_loss": -5.71297550201416, "global_step": 61960, "epoch": 1475} {"train_loss": -5.855550765991211, "global_step": 61961, "epoch": 1475} {"train_loss": -5.735823631286621, "global_step": 61962, "epoch": 1475} {"train_loss": -5.879732131958008, "global_step": 61963, "epoch": 1475} {"train_loss": -5.790085792541504, "global_step": 61964, "epoch": 1475} {"train_loss": -5.9349565505981445, "global_step": 61965, "epoch": 1475} {"train_loss": -5.868873596191406, "global_step": 61966, "epoch": 1475} {"train_loss": -5.788911819458008, "global_step": 61967, "epoch": 1475} {"train_loss": -5.958982467651367, "global_step": 61968, "epoch": 1475} {"train_loss": -5.865447044372559, "global_step": 61969, "epoch": 1475} {"train_loss": -5.900188446044922, "global_step": 61970, "epoch": 1475} {"train_loss": -5.9213056564331055, "global_step": 61971, "epoch": 1475} {"train_loss": -5.903933525085449, "global_step": 61972, "epoch": 1475} {"train_loss": -5.953542232513428, "global_step": 61973, "epoch": 1475} {"train_loss": -5.968436241149902, "global_step": 61974, "epoch": 1475} {"train_loss": -5.887940406799316, "global_step": 61975, "epoch": 1475} {"train_loss": -6.000624656677246, "global_step": 61976, "epoch": 1475} {"train_loss": -5.983988285064697, "global_step": 61977, "epoch": 1475} {"train_loss": -5.736904144287109, "global_step": 61978, "epoch": 1475} {"train_loss": -5.8664398193359375, "global_step": 61979, "epoch": 1475} {"train_loss": -6.016517162322998, "global_step": 61980, "epoch": 1475} {"train_loss": -6.07698917388916, "global_step": 61981, "epoch": 1475} {"train_loss": -6.087215423583984, "global_step": 61982, "epoch": 1475} {"train_loss": -6.006579399108887, "global_step": 61983, "epoch": 1475} {"train_loss": -5.890896797180176, "global_step": 61984, "epoch": 1475} {"train_loss": -5.9685869216918945, "global_step": 61985, "epoch": 1475} {"train_loss": -6.038167953491211, "global_step": 61986, "epoch": 1475} {"train_loss": -6.04335880279541, "global_step": 61987, "epoch": 1475} {"train_loss": -5.96546745300293, "global_step": 61988, "epoch": 1475} {"train_loss": -5.9211883544921875, "global_step": 61989, "epoch": 1475} {"train_loss": -5.945416450500488, "global_step": 61990, "epoch": 1475} {"train_loss": -5.899979920614333, "global_step": 61991, "epoch": 1475, "val_loss": 61051.06640625} {"train_loss": -5.924099445343018, "global_step": 61992, "epoch": 1476} {"train_loss": -6.095468044281006, "global_step": 61993, "epoch": 1476} {"train_loss": -5.894426345825195, "global_step": 61994, "epoch": 1476} {"train_loss": -5.94273042678833, "global_step": 61995, "epoch": 1476} {"train_loss": -5.876264572143555, "global_step": 61996, "epoch": 1476} {"train_loss": -5.9190168380737305, "global_step": 61997, "epoch": 1476} {"train_loss": -6.039248466491699, "global_step": 61998, "epoch": 1476} {"train_loss": -5.929828643798828, "global_step": 61999, "epoch": 1476} {"train_loss": -5.975866317749023, "global_step": 62000, "epoch": 1476} {"train_loss": -6.012712478637695, "global_step": 62001, "epoch": 1476} {"train_loss": -5.942141532897949, "global_step": 62002, "epoch": 1476} {"train_loss": -5.92545747756958, "global_step": 62003, "epoch": 1476} {"train_loss": -6.028382778167725, "global_step": 62004, "epoch": 1476} {"train_loss": -5.916031360626221, "global_step": 62005, "epoch": 1476} {"train_loss": -5.922915458679199, "global_step": 62006, "epoch": 1476} {"train_loss": -6.01439905166626, "global_step": 62007, "epoch": 1476} {"train_loss": -6.041988372802734, "global_step": 62008, "epoch": 1476} {"train_loss": -5.720671653747559, "global_step": 62009, "epoch": 1476} {"train_loss": -6.058647632598877, "global_step": 62010, "epoch": 1476} {"train_loss": -6.0096001625061035, "global_step": 62011, "epoch": 1476} {"train_loss": -5.94443416595459, "global_step": 62012, "epoch": 1476} {"train_loss": -5.863831520080566, "global_step": 62013, "epoch": 1476} {"train_loss": -5.812680721282959, "global_step": 62014, "epoch": 1476} {"train_loss": -5.955224990844727, "global_step": 62015, "epoch": 1476} {"train_loss": -5.850282192230225, "global_step": 62016, "epoch": 1476} {"train_loss": -5.990187168121338, "global_step": 62017, "epoch": 1476} {"train_loss": -6.082629203796387, "global_step": 62018, "epoch": 1476} {"train_loss": -5.973747253417969, "global_step": 62019, "epoch": 1476} {"train_loss": -5.9837751388549805, "global_step": 62020, "epoch": 1476} {"train_loss": -5.897823810577393, "global_step": 62021, "epoch": 1476} {"train_loss": -5.931541442871094, "global_step": 62022, "epoch": 1476} {"train_loss": -5.958058834075928, "global_step": 62023, "epoch": 1476} {"train_loss": -5.980085372924805, "global_step": 62024, "epoch": 1476} {"train_loss": -5.972211837768555, "global_step": 62025, "epoch": 1476} {"train_loss": -5.987411022186279, "global_step": 62026, "epoch": 1476} {"train_loss": -5.9172163009643555, "global_step": 62027, "epoch": 1476} {"train_loss": -5.904266357421875, "global_step": 62028, "epoch": 1476} {"train_loss": -5.875707626342773, "global_step": 62029, "epoch": 1476} {"train_loss": -6.0111470222473145, "global_step": 62030, "epoch": 1476} {"train_loss": -5.926490783691406, "global_step": 62031, "epoch": 1476} {"train_loss": -5.850732803344727, "global_step": 62032, "epoch": 1476} {"train_loss": -5.947616667974563, "global_step": 62033, "epoch": 1476, "val_loss": 61505.91015625} {"train_loss": -5.895735740661621, "global_step": 62034, "epoch": 1477} {"train_loss": -6.097051620483398, "global_step": 62035, "epoch": 1477} {"train_loss": -5.959012508392334, "global_step": 62036, "epoch": 1477} {"train_loss": -5.872137546539307, "global_step": 62037, "epoch": 1477} {"train_loss": -5.951545715332031, "global_step": 62038, "epoch": 1477} {"train_loss": -5.9581217765808105, "global_step": 62039, "epoch": 1477} {"train_loss": -5.86187219619751, "global_step": 62040, "epoch": 1477} {"train_loss": -5.840426921844482, "global_step": 62041, "epoch": 1477} {"train_loss": -5.862137794494629, "global_step": 62042, "epoch": 1477} {"train_loss": -5.890203475952148, "global_step": 62043, "epoch": 1477} {"train_loss": -5.864893913269043, "global_step": 62044, "epoch": 1477} {"train_loss": -5.883857727050781, "global_step": 62045, "epoch": 1477} {"train_loss": -5.962959289550781, "global_step": 62046, "epoch": 1477} {"train_loss": -6.033827781677246, "global_step": 62047, "epoch": 1477} {"train_loss": -5.980947494506836, "global_step": 62048, "epoch": 1477} {"train_loss": -5.994663238525391, "global_step": 62049, "epoch": 1477} {"train_loss": -5.932665824890137, "global_step": 62050, "epoch": 1477} {"train_loss": -5.968939781188965, "global_step": 62051, "epoch": 1477} {"train_loss": -5.8374104499816895, "global_step": 62052, "epoch": 1477} {"train_loss": -5.925004959106445, "global_step": 62053, "epoch": 1477} {"train_loss": -5.952175140380859, "global_step": 62054, "epoch": 1477} {"train_loss": -5.842312335968018, "global_step": 62055, "epoch": 1477} {"train_loss": -6.02420711517334, "global_step": 62056, "epoch": 1477} {"train_loss": -5.910815715789795, "global_step": 62057, "epoch": 1477} {"train_loss": -5.8926801681518555, "global_step": 62058, "epoch": 1477} {"train_loss": -5.894185543060303, "global_step": 62059, "epoch": 1477} {"train_loss": -5.912546157836914, "global_step": 62060, "epoch": 1477} {"train_loss": -5.978847980499268, "global_step": 62061, "epoch": 1477} {"train_loss": -5.946953773498535, "global_step": 62062, "epoch": 1477} {"train_loss": -5.921445846557617, "global_step": 62063, "epoch": 1477} {"train_loss": -5.9061994552612305, "global_step": 62064, "epoch": 1477} {"train_loss": -6.02260160446167, "global_step": 62065, "epoch": 1477} {"train_loss": -5.87243127822876, "global_step": 62066, "epoch": 1477} {"train_loss": -5.848893165588379, "global_step": 62067, "epoch": 1477} {"train_loss": -5.877168655395508, "global_step": 62068, "epoch": 1477} {"train_loss": -5.933850288391113, "global_step": 62069, "epoch": 1477} {"train_loss": -5.876959800720215, "global_step": 62070, "epoch": 1477} {"train_loss": -6.014993667602539, "global_step": 62071, "epoch": 1477} {"train_loss": -5.844051361083984, "global_step": 62072, "epoch": 1477} {"train_loss": -5.876616477966309, "global_step": 62073, "epoch": 1477} {"train_loss": -5.8723530769348145, "global_step": 62074, "epoch": 1477} {"train_loss": -5.92366978100368, "global_step": 62075, "epoch": 1477, "val_loss": 61023.65234375} {"train_loss": -5.999101638793945, "global_step": 62076, "epoch": 1478} {"train_loss": -5.9446587562561035, "global_step": 62077, "epoch": 1478} {"train_loss": -5.856800079345703, "global_step": 62078, "epoch": 1478} {"train_loss": -5.9635515213012695, "global_step": 62079, "epoch": 1478} {"train_loss": -5.9578962326049805, "global_step": 62080, "epoch": 1478} {"train_loss": -5.911381244659424, "global_step": 62081, "epoch": 1478} {"train_loss": -5.885865211486816, "global_step": 62082, "epoch": 1478} {"train_loss": -5.896829605102539, "global_step": 62083, "epoch": 1478} {"train_loss": -5.918985366821289, "global_step": 62084, "epoch": 1478} {"train_loss": -6.045202732086182, "global_step": 62085, "epoch": 1478} {"train_loss": -5.968735694885254, "global_step": 62086, "epoch": 1478} {"train_loss": -5.939187049865723, "global_step": 62087, "epoch": 1478} {"train_loss": -5.977058410644531, "global_step": 62088, "epoch": 1478} {"train_loss": -5.977429389953613, "global_step": 62089, "epoch": 1478} {"train_loss": -5.9403581619262695, "global_step": 62090, "epoch": 1478} {"train_loss": -5.91964054107666, "global_step": 62091, "epoch": 1478} {"train_loss": -5.836308002471924, "global_step": 62092, "epoch": 1478} {"train_loss": -5.867611408233643, "global_step": 62093, "epoch": 1478} {"train_loss": -5.889370918273926, "global_step": 62094, "epoch": 1478} {"train_loss": -6.066751003265381, "global_step": 62095, "epoch": 1478} {"train_loss": -5.936851978302002, "global_step": 62096, "epoch": 1478} {"train_loss": -5.9005327224731445, "global_step": 62097, "epoch": 1478} {"train_loss": -5.85020637512207, "global_step": 62098, "epoch": 1478} {"train_loss": -5.860438346862793, "global_step": 62099, "epoch": 1478} {"train_loss": -5.892812252044678, "global_step": 62100, "epoch": 1478} {"train_loss": -5.982246398925781, "global_step": 62101, "epoch": 1478} {"train_loss": -5.959183692932129, "global_step": 62102, "epoch": 1478} {"train_loss": -5.895764350891113, "global_step": 62103, "epoch": 1478} {"train_loss": -5.946980953216553, "global_step": 62104, "epoch": 1478} {"train_loss": -5.800019264221191, "global_step": 62105, "epoch": 1478} {"train_loss": -5.930544853210449, "global_step": 62106, "epoch": 1478} {"train_loss": -5.984196186065674, "global_step": 62107, "epoch": 1478} {"train_loss": -5.854203224182129, "global_step": 62108, "epoch": 1478} {"train_loss": -6.022357940673828, "global_step": 62109, "epoch": 1478} {"train_loss": -5.927910327911377, "global_step": 62110, "epoch": 1478} {"train_loss": -5.940371513366699, "global_step": 62111, "epoch": 1478} {"train_loss": -5.955687522888184, "global_step": 62112, "epoch": 1478} {"train_loss": -5.974593639373779, "global_step": 62113, "epoch": 1478} {"train_loss": -5.952700614929199, "global_step": 62114, "epoch": 1478} {"train_loss": -5.883618354797363, "global_step": 62115, "epoch": 1478} {"train_loss": -5.9569902420043945, "global_step": 62116, "epoch": 1478} {"train_loss": -5.932686204002017, "global_step": 62117, "epoch": 1478, "val_loss": 61321.3046875} {"train_loss": -5.970820903778076, "global_step": 62118, "epoch": 1479} {"train_loss": -5.968908309936523, "global_step": 62119, "epoch": 1479} {"train_loss": -5.88861608505249, "global_step": 62120, "epoch": 1479} {"train_loss": -5.954797267913818, "global_step": 62121, "epoch": 1479} {"train_loss": -5.92232608795166, "global_step": 62122, "epoch": 1479} {"train_loss": -6.122891426086426, "global_step": 62123, "epoch": 1479} {"train_loss": -6.06173038482666, "global_step": 62124, "epoch": 1479} {"train_loss": -5.923296928405762, "global_step": 62125, "epoch": 1479} {"train_loss": -5.993490219116211, "global_step": 62126, "epoch": 1479} {"train_loss": -5.838907241821289, "global_step": 62127, "epoch": 1479} {"train_loss": -5.963846683502197, "global_step": 62128, "epoch": 1479} {"train_loss": -6.049417018890381, "global_step": 62129, "epoch": 1479} {"train_loss": -5.908074378967285, "global_step": 62130, "epoch": 1479} {"train_loss": -5.966353893280029, "global_step": 62131, "epoch": 1479} {"train_loss": -5.956411838531494, "global_step": 62132, "epoch": 1479} {"train_loss": -5.984638690948486, "global_step": 62133, "epoch": 1479} {"train_loss": -5.8919267654418945, "global_step": 62134, "epoch": 1479} {"train_loss": -5.8472113609313965, "global_step": 62135, "epoch": 1479} {"train_loss": -6.052307605743408, "global_step": 62136, "epoch": 1479} {"train_loss": -5.936864376068115, "global_step": 62137, "epoch": 1479} {"train_loss": -5.9874114990234375, "global_step": 62138, "epoch": 1479} {"train_loss": -5.844637393951416, "global_step": 62139, "epoch": 1479} {"train_loss": -5.98239278793335, "global_step": 62140, "epoch": 1479} {"train_loss": -5.899685382843018, "global_step": 62141, "epoch": 1479} {"train_loss": -5.973644733428955, "global_step": 62142, "epoch": 1479} {"train_loss": -5.938329696655273, "global_step": 62143, "epoch": 1479} {"train_loss": -6.007672309875488, "global_step": 62144, "epoch": 1479} {"train_loss": -5.874629020690918, "global_step": 62145, "epoch": 1479} {"train_loss": -6.066150188446045, "global_step": 62146, "epoch": 1479} {"train_loss": -5.954319477081299, "global_step": 62147, "epoch": 1479} {"train_loss": -5.999000549316406, "global_step": 62148, "epoch": 1479} {"train_loss": -6.021236419677734, "global_step": 62149, "epoch": 1479} {"train_loss": -5.983143329620361, "global_step": 62150, "epoch": 1479} {"train_loss": -5.897976875305176, "global_step": 62151, "epoch": 1479} {"train_loss": -5.891914367675781, "global_step": 62152, "epoch": 1479} {"train_loss": -5.92757511138916, "global_step": 62153, "epoch": 1479} {"train_loss": -5.950334548950195, "global_step": 62154, "epoch": 1479} {"train_loss": -6.0182342529296875, "global_step": 62155, "epoch": 1479} {"train_loss": -5.944225788116455, "global_step": 62156, "epoch": 1479} {"train_loss": -5.890258312225342, "global_step": 62157, "epoch": 1479} {"train_loss": -5.869776725769043, "global_step": 62158, "epoch": 1479} {"train_loss": -5.954271350588117, "global_step": 62159, "epoch": 1479, "val_loss": 61666.0} {"train_loss": -5.992324352264404, "global_step": 62160, "epoch": 1480} {"train_loss": -5.971024513244629, "global_step": 62161, "epoch": 1480} {"train_loss": -5.927559852600098, "global_step": 62162, "epoch": 1480} {"train_loss": -5.956173896789551, "global_step": 62163, "epoch": 1480} {"train_loss": -5.947519302368164, "global_step": 62164, "epoch": 1480} {"train_loss": -5.868311882019043, "global_step": 62165, "epoch": 1480} {"train_loss": -5.864469051361084, "global_step": 62166, "epoch": 1480} {"train_loss": -6.020631790161133, "global_step": 62167, "epoch": 1480} {"train_loss": -5.935474395751953, "global_step": 62168, "epoch": 1480} {"train_loss": -5.972596168518066, "global_step": 62169, "epoch": 1480} {"train_loss": -5.979473114013672, "global_step": 62170, "epoch": 1480} {"train_loss": -6.097116470336914, "global_step": 62171, "epoch": 1480} {"train_loss": -5.994843482971191, "global_step": 62172, "epoch": 1480} {"train_loss": -5.954742431640625, "global_step": 62173, "epoch": 1480} {"train_loss": -5.970724105834961, "global_step": 62174, "epoch": 1480} {"train_loss": -6.0637335777282715, "global_step": 62175, "epoch": 1480} {"train_loss": -5.91868782043457, "global_step": 62176, "epoch": 1480} {"train_loss": -5.9041948318481445, "global_step": 62177, "epoch": 1480} {"train_loss": -5.932242393493652, "global_step": 62178, "epoch": 1480} {"train_loss": -5.8989667892456055, "global_step": 62179, "epoch": 1480} {"train_loss": -5.796389579772949, "global_step": 62180, "epoch": 1480} {"train_loss": -5.863411903381348, "global_step": 62181, "epoch": 1480} {"train_loss": -5.769759178161621, "global_step": 62182, "epoch": 1480} {"train_loss": -5.966437816619873, "global_step": 62183, "epoch": 1480} {"train_loss": -5.77994966506958, "global_step": 62184, "epoch": 1480} {"train_loss": -5.8229522705078125, "global_step": 62185, "epoch": 1480} {"train_loss": -5.880098819732666, "global_step": 62186, "epoch": 1480} {"train_loss": -5.819207191467285, "global_step": 62187, "epoch": 1480} {"train_loss": -5.907493591308594, "global_step": 62188, "epoch": 1480} {"train_loss": -5.857133865356445, "global_step": 62189, "epoch": 1480} {"train_loss": -5.841361999511719, "global_step": 62190, "epoch": 1480} {"train_loss": -5.892529487609863, "global_step": 62191, "epoch": 1480} {"train_loss": -5.90686559677124, "global_step": 62192, "epoch": 1480} {"train_loss": -5.928110122680664, "global_step": 62193, "epoch": 1480} {"train_loss": -5.887604713439941, "global_step": 62194, "epoch": 1480} {"train_loss": -5.915689468383789, "global_step": 62195, "epoch": 1480} {"train_loss": -5.912742614746094, "global_step": 62196, "epoch": 1480} {"train_loss": -5.922112941741943, "global_step": 62197, "epoch": 1480} {"train_loss": -5.858003616333008, "global_step": 62198, "epoch": 1480} {"train_loss": -5.880465030670166, "global_step": 62199, "epoch": 1480} {"train_loss": -5.955742359161377, "global_step": 62200, "epoch": 1480} {"train_loss": -5.915697665441604, "global_step": 62201, "epoch": 1480, "val_loss": 61385.06640625} {"train_loss": -5.942075729370117, "global_step": 62202, "epoch": 1481} {"train_loss": -5.812900543212891, "global_step": 62203, "epoch": 1481} {"train_loss": -5.973374366760254, "global_step": 62204, "epoch": 1481} {"train_loss": -5.95009708404541, "global_step": 62205, "epoch": 1481} {"train_loss": -5.863237380981445, "global_step": 62206, "epoch": 1481} {"train_loss": -5.979681968688965, "global_step": 62207, "epoch": 1481} {"train_loss": -5.866112232208252, "global_step": 62208, "epoch": 1481} {"train_loss": -5.921215057373047, "global_step": 62209, "epoch": 1481} {"train_loss": -5.981575012207031, "global_step": 62210, "epoch": 1481} {"train_loss": -5.940743923187256, "global_step": 62211, "epoch": 1481} {"train_loss": -5.89712381362915, "global_step": 62212, "epoch": 1481} {"train_loss": -5.972334861755371, "global_step": 62213, "epoch": 1481} {"train_loss": -5.857080936431885, "global_step": 62214, "epoch": 1481} {"train_loss": -6.014227867126465, "global_step": 62215, "epoch": 1481} {"train_loss": -5.9386372566223145, "global_step": 62216, "epoch": 1481} {"train_loss": -5.8864593505859375, "global_step": 62217, "epoch": 1481} {"train_loss": -5.978573799133301, "global_step": 62218, "epoch": 1481} {"train_loss": -5.891339302062988, "global_step": 62219, "epoch": 1481} {"train_loss": -5.899803638458252, "global_step": 62220, "epoch": 1481} {"train_loss": -6.053853988647461, "global_step": 62221, "epoch": 1481} {"train_loss": -5.8802642822265625, "global_step": 62222, "epoch": 1481} {"train_loss": -5.944382667541504, "global_step": 62223, "epoch": 1481} {"train_loss": -5.88573694229126, "global_step": 62224, "epoch": 1481} {"train_loss": -5.957314491271973, "global_step": 62225, "epoch": 1481} {"train_loss": -5.990947246551514, "global_step": 62226, "epoch": 1481} {"train_loss": -6.0838623046875, "global_step": 62227, "epoch": 1481} {"train_loss": -5.872590065002441, "global_step": 62228, "epoch": 1481} {"train_loss": -6.010465145111084, "global_step": 62229, "epoch": 1481} {"train_loss": -6.004922389984131, "global_step": 62230, "epoch": 1481} {"train_loss": -6.018802165985107, "global_step": 62231, "epoch": 1481} {"train_loss": -5.919699668884277, "global_step": 62232, "epoch": 1481} {"train_loss": -5.957460403442383, "global_step": 62233, "epoch": 1481} {"train_loss": -6.054741859436035, "global_step": 62234, "epoch": 1481} {"train_loss": -5.875096797943115, "global_step": 62235, "epoch": 1481} {"train_loss": -5.932271957397461, "global_step": 62236, "epoch": 1481} {"train_loss": -5.920318126678467, "global_step": 62237, "epoch": 1481} {"train_loss": -6.006688117980957, "global_step": 62238, "epoch": 1481} {"train_loss": -5.956612586975098, "global_step": 62239, "epoch": 1481} {"train_loss": -5.875242233276367, "global_step": 62240, "epoch": 1481} {"train_loss": -5.813042640686035, "global_step": 62241, "epoch": 1481} {"train_loss": -5.856535911560059, "global_step": 62242, "epoch": 1481} {"train_loss": -5.936457270667667, "global_step": 62243, "epoch": 1481, "val_loss": 61489.2265625} {"train_loss": -5.889641761779785, "global_step": 62244, "epoch": 1482} {"train_loss": -5.80649471282959, "global_step": 62245, "epoch": 1482} {"train_loss": -6.045909881591797, "global_step": 62246, "epoch": 1482} {"train_loss": -5.814183235168457, "global_step": 62247, "epoch": 1482} {"train_loss": -5.887115955352783, "global_step": 62248, "epoch": 1482} {"train_loss": -5.941953659057617, "global_step": 62249, "epoch": 1482} {"train_loss": -6.005497455596924, "global_step": 62250, "epoch": 1482} {"train_loss": -5.856049537658691, "global_step": 62251, "epoch": 1482} {"train_loss": -5.848232269287109, "global_step": 62252, "epoch": 1482} {"train_loss": -5.876066207885742, "global_step": 62253, "epoch": 1482} {"train_loss": -5.926684379577637, "global_step": 62254, "epoch": 1482} {"train_loss": -5.9152092933654785, "global_step": 62255, "epoch": 1482} {"train_loss": -5.9068684577941895, "global_step": 62256, "epoch": 1482} {"train_loss": -5.859254837036133, "global_step": 62257, "epoch": 1482} {"train_loss": -5.943769931793213, "global_step": 62258, "epoch": 1482} {"train_loss": -5.922146797180176, "global_step": 62259, "epoch": 1482} {"train_loss": -5.925431251525879, "global_step": 62260, "epoch": 1482} {"train_loss": -5.928216934204102, "global_step": 62261, "epoch": 1482} {"train_loss": -5.878189563751221, "global_step": 62262, "epoch": 1482} {"train_loss": -6.04781436920166, "global_step": 62263, "epoch": 1482} {"train_loss": -6.065014839172363, "global_step": 62264, "epoch": 1482} {"train_loss": -5.915212631225586, "global_step": 62265, "epoch": 1482} {"train_loss": -5.883181571960449, "global_step": 62266, "epoch": 1482} {"train_loss": -5.93418025970459, "global_step": 62267, "epoch": 1482} {"train_loss": -5.890398979187012, "global_step": 62268, "epoch": 1482} {"train_loss": -5.979554653167725, "global_step": 62269, "epoch": 1482} {"train_loss": -5.9535231590271, "global_step": 62270, "epoch": 1482} {"train_loss": -5.862561225891113, "global_step": 62271, "epoch": 1482} {"train_loss": -5.906191349029541, "global_step": 62272, "epoch": 1482} {"train_loss": -5.940729141235352, "global_step": 62273, "epoch": 1482} {"train_loss": -5.961184501647949, "global_step": 62274, "epoch": 1482} {"train_loss": -5.905333518981934, "global_step": 62275, "epoch": 1482} {"train_loss": -5.746308326721191, "global_step": 62276, "epoch": 1482} {"train_loss": -5.840036392211914, "global_step": 62277, "epoch": 1482} {"train_loss": -5.772830963134766, "global_step": 62278, "epoch": 1482} {"train_loss": -5.869470119476318, "global_step": 62279, "epoch": 1482} {"train_loss": -5.921955585479736, "global_step": 62280, "epoch": 1482} {"train_loss": -5.939088344573975, "global_step": 62281, "epoch": 1482} {"train_loss": -5.980342864990234, "global_step": 62282, "epoch": 1482} {"train_loss": -6.054715156555176, "global_step": 62283, "epoch": 1482} {"train_loss": -5.8626179695129395, "global_step": 62284, "epoch": 1482} {"train_loss": -5.911018905185518, "global_step": 62285, "epoch": 1482, "val_loss": 61340.62890625} {"train_loss": -5.918844699859619, "global_step": 62286, "epoch": 1483} {"train_loss": -5.911288261413574, "global_step": 62287, "epoch": 1483} {"train_loss": -5.861453533172607, "global_step": 62288, "epoch": 1483} {"train_loss": -5.848942756652832, "global_step": 62289, "epoch": 1483} {"train_loss": -5.828869819641113, "global_step": 62290, "epoch": 1483} {"train_loss": -5.944536209106445, "global_step": 62291, "epoch": 1483} {"train_loss": -5.892643928527832, "global_step": 62292, "epoch": 1483} {"train_loss": -5.797050476074219, "global_step": 62293, "epoch": 1483} {"train_loss": -5.951412200927734, "global_step": 62294, "epoch": 1483} {"train_loss": -5.943978786468506, "global_step": 62295, "epoch": 1483} {"train_loss": -5.9072065353393555, "global_step": 62296, "epoch": 1483} {"train_loss": -5.967652320861816, "global_step": 62297, "epoch": 1483} {"train_loss": -5.87586784362793, "global_step": 62298, "epoch": 1483} {"train_loss": -5.955538749694824, "global_step": 62299, "epoch": 1483} {"train_loss": -5.9056782722473145, "global_step": 62300, "epoch": 1483} {"train_loss": -5.897701263427734, "global_step": 62301, "epoch": 1483} {"train_loss": -5.80459451675415, "global_step": 62302, "epoch": 1483} {"train_loss": -5.783478736877441, "global_step": 62303, "epoch": 1483} {"train_loss": -6.004046440124512, "global_step": 62304, "epoch": 1483} {"train_loss": -5.892998695373535, "global_step": 62305, "epoch": 1483} {"train_loss": -5.886000633239746, "global_step": 62306, "epoch": 1483} {"train_loss": -5.905166149139404, "global_step": 62307, "epoch": 1483} {"train_loss": -5.88861083984375, "global_step": 62308, "epoch": 1483} {"train_loss": -5.985042095184326, "global_step": 62309, "epoch": 1483} {"train_loss": -5.92686653137207, "global_step": 62310, "epoch": 1483} {"train_loss": -6.061639785766602, "global_step": 62311, "epoch": 1483} {"train_loss": -5.977278709411621, "global_step": 62312, "epoch": 1483} {"train_loss": -5.819615364074707, "global_step": 62313, "epoch": 1483} {"train_loss": -6.027621269226074, "global_step": 62314, "epoch": 1483} {"train_loss": -5.968798637390137, "global_step": 62315, "epoch": 1483} {"train_loss": -5.959888458251953, "global_step": 62316, "epoch": 1483} {"train_loss": -5.9271159172058105, "global_step": 62317, "epoch": 1483} {"train_loss": -5.878488063812256, "global_step": 62318, "epoch": 1483} {"train_loss": -5.915475845336914, "global_step": 62319, "epoch": 1483} {"train_loss": -6.011058807373047, "global_step": 62320, "epoch": 1483} {"train_loss": -5.984152317047119, "global_step": 62321, "epoch": 1483} {"train_loss": -5.9523606300354, "global_step": 62322, "epoch": 1483} {"train_loss": -5.985563278198242, "global_step": 62323, "epoch": 1483} {"train_loss": -5.858897686004639, "global_step": 62324, "epoch": 1483} {"train_loss": -5.920027732849121, "global_step": 62325, "epoch": 1483} {"train_loss": -5.955618381500244, "global_step": 62326, "epoch": 1483} {"train_loss": -5.919074319657826, "global_step": 62327, "epoch": 1483, "val_loss": 61242.01953125} {"train_loss": -5.9886603355407715, "global_step": 62328, "epoch": 1484} {"train_loss": -6.007512092590332, "global_step": 62329, "epoch": 1484} {"train_loss": -5.864579677581787, "global_step": 62330, "epoch": 1484} {"train_loss": -5.908649921417236, "global_step": 62331, "epoch": 1484} {"train_loss": -5.847434997558594, "global_step": 62332, "epoch": 1484} {"train_loss": -5.946114540100098, "global_step": 62333, "epoch": 1484} {"train_loss": -5.951385021209717, "global_step": 62334, "epoch": 1484} {"train_loss": -6.115218162536621, "global_step": 62335, "epoch": 1484} {"train_loss": -5.75697135925293, "global_step": 62336, "epoch": 1484} {"train_loss": -5.842523574829102, "global_step": 62337, "epoch": 1484} {"train_loss": -5.982604503631592, "global_step": 62338, "epoch": 1484} {"train_loss": -5.896857738494873, "global_step": 62339, "epoch": 1484} {"train_loss": -5.948209762573242, "global_step": 62340, "epoch": 1484} {"train_loss": -5.845916748046875, "global_step": 62341, "epoch": 1484} {"train_loss": -5.9095072746276855, "global_step": 62342, "epoch": 1484} {"train_loss": -5.888344764709473, "global_step": 62343, "epoch": 1484} {"train_loss": -6.000517845153809, "global_step": 62344, "epoch": 1484} {"train_loss": -5.882776260375977, "global_step": 62345, "epoch": 1484} {"train_loss": -5.941418170928955, "global_step": 62346, "epoch": 1484} {"train_loss": -5.828470706939697, "global_step": 62347, "epoch": 1484} {"train_loss": -5.832476615905762, "global_step": 62348, "epoch": 1484} {"train_loss": -5.951428413391113, "global_step": 62349, "epoch": 1484} {"train_loss": -5.977266311645508, "global_step": 62350, "epoch": 1484} {"train_loss": -5.9517621994018555, "global_step": 62351, "epoch": 1484} {"train_loss": -5.8499603271484375, "global_step": 62352, "epoch": 1484} {"train_loss": -6.005454063415527, "global_step": 62353, "epoch": 1484} {"train_loss": -5.843321800231934, "global_step": 62354, "epoch": 1484} {"train_loss": -5.8603925704956055, "global_step": 62355, "epoch": 1484} {"train_loss": -5.83159065246582, "global_step": 62356, "epoch": 1484} {"train_loss": -5.930529594421387, "global_step": 62357, "epoch": 1484} {"train_loss": -5.951467037200928, "global_step": 62358, "epoch": 1484} {"train_loss": -5.950411796569824, "global_step": 62359, "epoch": 1484} {"train_loss": -5.994386196136475, "global_step": 62360, "epoch": 1484} {"train_loss": -6.071954250335693, "global_step": 62361, "epoch": 1484} {"train_loss": -5.873764991760254, "global_step": 62362, "epoch": 1484} {"train_loss": -5.96898078918457, "global_step": 62363, "epoch": 1484} {"train_loss": -5.910701751708984, "global_step": 62364, "epoch": 1484} {"train_loss": -5.977982521057129, "global_step": 62365, "epoch": 1484} {"train_loss": -5.894522666931152, "global_step": 62366, "epoch": 1484} {"train_loss": -5.925937652587891, "global_step": 62367, "epoch": 1484} {"train_loss": -6.023442268371582, "global_step": 62368, "epoch": 1484} {"train_loss": -5.929394517626081, "global_step": 62369, "epoch": 1484, "val_loss": 61564.40234375} {"train_loss": -5.926218032836914, "global_step": 62370, "epoch": 1485} {"train_loss": -5.976302623748779, "global_step": 62371, "epoch": 1485} {"train_loss": -6.027187824249268, "global_step": 62372, "epoch": 1485} {"train_loss": -6.0026445388793945, "global_step": 62373, "epoch": 1485} {"train_loss": -5.964483737945557, "global_step": 62374, "epoch": 1485} {"train_loss": -5.758939266204834, "global_step": 62375, "epoch": 1485} {"train_loss": -5.957393646240234, "global_step": 62376, "epoch": 1485} {"train_loss": -5.902009963989258, "global_step": 62377, "epoch": 1485} {"train_loss": -6.001650333404541, "global_step": 62378, "epoch": 1485} {"train_loss": -5.948545455932617, "global_step": 62379, "epoch": 1485} {"train_loss": -5.999202728271484, "global_step": 62380, "epoch": 1485} {"train_loss": -5.984877586364746, "global_step": 62381, "epoch": 1485} {"train_loss": -5.93472957611084, "global_step": 62382, "epoch": 1485} {"train_loss": -5.9943623542785645, "global_step": 62383, "epoch": 1485} {"train_loss": -5.902763843536377, "global_step": 62384, "epoch": 1485} {"train_loss": -5.9661359786987305, "global_step": 62385, "epoch": 1485} {"train_loss": -6.086613655090332, "global_step": 62386, "epoch": 1485} {"train_loss": -5.922015190124512, "global_step": 62387, "epoch": 1485} {"train_loss": -5.939022064208984, "global_step": 62388, "epoch": 1485} {"train_loss": -5.955931663513184, "global_step": 62389, "epoch": 1485} {"train_loss": -6.031965255737305, "global_step": 62390, "epoch": 1485} {"train_loss": -6.02128267288208, "global_step": 62391, "epoch": 1485} {"train_loss": -5.817883014678955, "global_step": 62392, "epoch": 1485} {"train_loss": -5.910989761352539, "global_step": 62393, "epoch": 1485} {"train_loss": -5.953618049621582, "global_step": 62394, "epoch": 1485} {"train_loss": -5.997912406921387, "global_step": 62395, "epoch": 1485} {"train_loss": -5.8734869956970215, "global_step": 62396, "epoch": 1485} {"train_loss": -5.8863348960876465, "global_step": 62397, "epoch": 1485} {"train_loss": -5.963955879211426, "global_step": 62398, "epoch": 1485} {"train_loss": -5.986480712890625, "global_step": 62399, "epoch": 1485} {"train_loss": -5.948307514190674, "global_step": 62400, "epoch": 1485} {"train_loss": -5.850884914398193, "global_step": 62401, "epoch": 1485} {"train_loss": -5.872441291809082, "global_step": 62402, "epoch": 1485} {"train_loss": -5.963161468505859, "global_step": 62403, "epoch": 1485} {"train_loss": -5.947229862213135, "global_step": 62404, "epoch": 1485} {"train_loss": -5.963979244232178, "global_step": 62405, "epoch": 1485} {"train_loss": -6.08647346496582, "global_step": 62406, "epoch": 1485} {"train_loss": -5.834861755371094, "global_step": 62407, "epoch": 1485} {"train_loss": -5.90757942199707, "global_step": 62408, "epoch": 1485} {"train_loss": -5.998086929321289, "global_step": 62409, "epoch": 1485} {"train_loss": -5.876363754272461, "global_step": 62410, "epoch": 1485} {"train_loss": -5.949109156926473, "global_step": 62411, "epoch": 1485, "val_loss": 61232.49609375} {"train_loss": -5.979212760925293, "global_step": 62412, "epoch": 1486} {"train_loss": -5.988508224487305, "global_step": 62413, "epoch": 1486} {"train_loss": -5.905420303344727, "global_step": 62414, "epoch": 1486} {"train_loss": -5.857746124267578, "global_step": 62415, "epoch": 1486} {"train_loss": -5.9694318771362305, "global_step": 62416, "epoch": 1486} {"train_loss": -5.882770538330078, "global_step": 62417, "epoch": 1486} {"train_loss": -5.921314239501953, "global_step": 62418, "epoch": 1486} {"train_loss": -6.066939353942871, "global_step": 62419, "epoch": 1486} {"train_loss": -5.999017238616943, "global_step": 62420, "epoch": 1486} {"train_loss": -5.968118667602539, "global_step": 62421, "epoch": 1486} {"train_loss": -5.9738054275512695, "global_step": 62422, "epoch": 1486} {"train_loss": -5.9807209968566895, "global_step": 62423, "epoch": 1486} {"train_loss": -5.919247627258301, "global_step": 62424, "epoch": 1486} {"train_loss": -5.942582130432129, "global_step": 62425, "epoch": 1486} {"train_loss": -5.868974685668945, "global_step": 62426, "epoch": 1486} {"train_loss": -5.94036865234375, "global_step": 62427, "epoch": 1486} {"train_loss": -5.943379878997803, "global_step": 62428, "epoch": 1486} {"train_loss": -5.962873458862305, "global_step": 62429, "epoch": 1486} {"train_loss": -5.851668357849121, "global_step": 62430, "epoch": 1486} {"train_loss": -5.9520263671875, "global_step": 62431, "epoch": 1486} {"train_loss": -5.936687469482422, "global_step": 62432, "epoch": 1486} {"train_loss": -5.8305253982543945, "global_step": 62433, "epoch": 1486} {"train_loss": -5.955225944519043, "global_step": 62434, "epoch": 1486} {"train_loss": -5.882419109344482, "global_step": 62435, "epoch": 1486} {"train_loss": -5.685932159423828, "global_step": 62436, "epoch": 1486} {"train_loss": -6.003490447998047, "global_step": 62437, "epoch": 1486} {"train_loss": -5.921540260314941, "global_step": 62438, "epoch": 1486} {"train_loss": -5.782455921173096, "global_step": 62439, "epoch": 1486} {"train_loss": -5.945258140563965, "global_step": 62440, "epoch": 1486} {"train_loss": -5.870121479034424, "global_step": 62441, "epoch": 1486} {"train_loss": -6.033716201782227, "global_step": 62442, "epoch": 1486} {"train_loss": -5.997254371643066, "global_step": 62443, "epoch": 1486} {"train_loss": -5.808575630187988, "global_step": 62444, "epoch": 1486} {"train_loss": -5.861084938049316, "global_step": 62445, "epoch": 1486} {"train_loss": -5.908698558807373, "global_step": 62446, "epoch": 1486} {"train_loss": -5.942815780639648, "global_step": 62447, "epoch": 1486} {"train_loss": -6.005414009094238, "global_step": 62448, "epoch": 1486} {"train_loss": -5.861493110656738, "global_step": 62449, "epoch": 1486} {"train_loss": -5.892245292663574, "global_step": 62450, "epoch": 1486} {"train_loss": -5.932010650634766, "global_step": 62451, "epoch": 1486} {"train_loss": -5.962471961975098, "global_step": 62452, "epoch": 1486} {"train_loss": -5.9229387782868885, "global_step": 62453, "epoch": 1486, "val_loss": 61261.96875} {"train_loss": -6.053426742553711, "global_step": 62454, "epoch": 1487} {"train_loss": -5.979068279266357, "global_step": 62455, "epoch": 1487} {"train_loss": -5.939977645874023, "global_step": 62456, "epoch": 1487} {"train_loss": -5.963576316833496, "global_step": 62457, "epoch": 1487} {"train_loss": -5.9129204750061035, "global_step": 62458, "epoch": 1487} {"train_loss": -6.146587371826172, "global_step": 62459, "epoch": 1487} {"train_loss": -5.93950080871582, "global_step": 62460, "epoch": 1487} {"train_loss": -5.981037616729736, "global_step": 62461, "epoch": 1487} {"train_loss": -5.876757621765137, "global_step": 62462, "epoch": 1487} {"train_loss": -5.885091781616211, "global_step": 62463, "epoch": 1487} {"train_loss": -6.013228416442871, "global_step": 62464, "epoch": 1487} {"train_loss": -5.917143821716309, "global_step": 62465, "epoch": 1487} {"train_loss": -5.965863227844238, "global_step": 62466, "epoch": 1487} {"train_loss": -5.965042591094971, "global_step": 62467, "epoch": 1487} {"train_loss": -5.852906703948975, "global_step": 62468, "epoch": 1487} {"train_loss": -6.018387317657471, "global_step": 62469, "epoch": 1487} {"train_loss": -5.870406150817871, "global_step": 62470, "epoch": 1487} {"train_loss": -5.799342155456543, "global_step": 62471, "epoch": 1487} {"train_loss": -5.896964073181152, "global_step": 62472, "epoch": 1487} {"train_loss": -5.985589504241943, "global_step": 62473, "epoch": 1487} {"train_loss": -5.989144325256348, "global_step": 62474, "epoch": 1487} {"train_loss": -6.062291145324707, "global_step": 62475, "epoch": 1487} {"train_loss": -5.962906360626221, "global_step": 62476, "epoch": 1487} {"train_loss": -6.000567436218262, "global_step": 62477, "epoch": 1487} {"train_loss": -5.856109619140625, "global_step": 62478, "epoch": 1487} {"train_loss": -6.013755798339844, "global_step": 62479, "epoch": 1487} {"train_loss": -5.904753684997559, "global_step": 62480, "epoch": 1487} {"train_loss": -5.855210781097412, "global_step": 62481, "epoch": 1487} {"train_loss": -5.840832710266113, "global_step": 62482, "epoch": 1487} {"train_loss": -5.874736785888672, "global_step": 62483, "epoch": 1487} {"train_loss": -5.95231819152832, "global_step": 62484, "epoch": 1487} {"train_loss": -5.988481521606445, "global_step": 62485, "epoch": 1487} {"train_loss": -5.898230075836182, "global_step": 62486, "epoch": 1487} {"train_loss": -5.958623886108398, "global_step": 62487, "epoch": 1487} {"train_loss": -5.995640754699707, "global_step": 62488, "epoch": 1487} {"train_loss": -5.994657516479492, "global_step": 62489, "epoch": 1487} {"train_loss": -5.967642307281494, "global_step": 62490, "epoch": 1487} {"train_loss": -6.007803916931152, "global_step": 62491, "epoch": 1487} {"train_loss": -5.865903854370117, "global_step": 62492, "epoch": 1487} {"train_loss": -6.038141250610352, "global_step": 62493, "epoch": 1487} {"train_loss": -5.970174789428711, "global_step": 62494, "epoch": 1487} {"train_loss": -5.95169126419794, "global_step": 62495, "epoch": 1487, "val_loss": 61368.00390625} {"train_loss": -6.049470901489258, "global_step": 62496, "epoch": 1488} {"train_loss": -5.906264781951904, "global_step": 62497, "epoch": 1488} {"train_loss": -5.915614128112793, "global_step": 62498, "epoch": 1488} {"train_loss": -5.8654632568359375, "global_step": 62499, "epoch": 1488} {"train_loss": -6.005365371704102, "global_step": 62500, "epoch": 1488} {"train_loss": -6.017214298248291, "global_step": 62501, "epoch": 1488} {"train_loss": -5.869482040405273, "global_step": 62502, "epoch": 1488} {"train_loss": -5.954856872558594, "global_step": 62503, "epoch": 1488} {"train_loss": -6.0374650955200195, "global_step": 62504, "epoch": 1488} {"train_loss": -6.01845645904541, "global_step": 62505, "epoch": 1488} {"train_loss": -5.9613847732543945, "global_step": 62506, "epoch": 1488} {"train_loss": -6.022591590881348, "global_step": 62507, "epoch": 1488} {"train_loss": -5.990478992462158, "global_step": 62508, "epoch": 1488} {"train_loss": -5.9811248779296875, "global_step": 62509, "epoch": 1488} {"train_loss": -6.088773727416992, "global_step": 62510, "epoch": 1488} {"train_loss": -6.033810615539551, "global_step": 62511, "epoch": 1488} {"train_loss": -5.986438274383545, "global_step": 62512, "epoch": 1488} {"train_loss": -5.910081386566162, "global_step": 62513, "epoch": 1488} {"train_loss": -5.98649263381958, "global_step": 62514, "epoch": 1488} {"train_loss": -5.924407482147217, "global_step": 62515, "epoch": 1488} {"train_loss": -6.137080192565918, "global_step": 62516, "epoch": 1488} {"train_loss": -5.980060577392578, "global_step": 62517, "epoch": 1488} {"train_loss": -5.963164329528809, "global_step": 62518, "epoch": 1488} {"train_loss": -5.945425510406494, "global_step": 62519, "epoch": 1488} {"train_loss": -5.922214508056641, "global_step": 62520, "epoch": 1488} {"train_loss": -5.858999252319336, "global_step": 62521, "epoch": 1488} {"train_loss": -5.987486839294434, "global_step": 62522, "epoch": 1488} {"train_loss": -5.843405246734619, "global_step": 62523, "epoch": 1488} {"train_loss": -5.966433525085449, "global_step": 62524, "epoch": 1488} {"train_loss": -5.879748344421387, "global_step": 62525, "epoch": 1488} {"train_loss": -5.909318923950195, "global_step": 62526, "epoch": 1488} {"train_loss": -5.957371711730957, "global_step": 62527, "epoch": 1488} {"train_loss": -5.8843817710876465, "global_step": 62528, "epoch": 1488} {"train_loss": -6.025862216949463, "global_step": 62529, "epoch": 1488} {"train_loss": -6.029746055603027, "global_step": 62530, "epoch": 1488} {"train_loss": -5.982272148132324, "global_step": 62531, "epoch": 1488} {"train_loss": -5.923055648803711, "global_step": 62532, "epoch": 1488} {"train_loss": -6.002506256103516, "global_step": 62533, "epoch": 1488} {"train_loss": -5.947257041931152, "global_step": 62534, "epoch": 1488} {"train_loss": -5.879905700683594, "global_step": 62535, "epoch": 1488} {"train_loss": -5.959258556365967, "global_step": 62536, "epoch": 1488} {"train_loss": -5.963494266782488, "global_step": 62537, "epoch": 1488, "val_loss": 61371.765625} {"train_loss": -6.03391170501709, "global_step": 62538, "epoch": 1489} {"train_loss": -5.940862655639648, "global_step": 62539, "epoch": 1489} {"train_loss": -5.935483932495117, "global_step": 62540, "epoch": 1489} {"train_loss": -5.89670467376709, "global_step": 62541, "epoch": 1489} {"train_loss": -5.940828800201416, "global_step": 62542, "epoch": 1489} {"train_loss": -5.933098316192627, "global_step": 62543, "epoch": 1489} {"train_loss": -5.906451225280762, "global_step": 62544, "epoch": 1489} {"train_loss": -5.911489963531494, "global_step": 62545, "epoch": 1489} {"train_loss": -5.999298572540283, "global_step": 62546, "epoch": 1489} {"train_loss": -5.945773601531982, "global_step": 62547, "epoch": 1489} {"train_loss": -5.892264366149902, "global_step": 62548, "epoch": 1489} {"train_loss": -5.900932788848877, "global_step": 62549, "epoch": 1489} {"train_loss": -5.872111797332764, "global_step": 62550, "epoch": 1489} {"train_loss": -6.034499168395996, "global_step": 62551, "epoch": 1489} {"train_loss": -5.837741851806641, "global_step": 62552, "epoch": 1489} {"train_loss": -5.7864861488342285, "global_step": 62553, "epoch": 1489} {"train_loss": -5.873291015625, "global_step": 62554, "epoch": 1489} {"train_loss": -5.948580741882324, "global_step": 62555, "epoch": 1489} {"train_loss": -5.943219184875488, "global_step": 62556, "epoch": 1489} {"train_loss": -5.908501148223877, "global_step": 62557, "epoch": 1489} {"train_loss": -5.909893035888672, "global_step": 62558, "epoch": 1489} {"train_loss": -5.8947038650512695, "global_step": 62559, "epoch": 1489} {"train_loss": -6.030532360076904, "global_step": 62560, "epoch": 1489} {"train_loss": -6.0283308029174805, "global_step": 62561, "epoch": 1489} {"train_loss": -5.842832565307617, "global_step": 62562, "epoch": 1489} {"train_loss": -5.9277801513671875, "global_step": 62563, "epoch": 1489} {"train_loss": -5.888472557067871, "global_step": 62564, "epoch": 1489} {"train_loss": -5.983063220977783, "global_step": 62565, "epoch": 1489} {"train_loss": -6.00563383102417, "global_step": 62566, "epoch": 1489} {"train_loss": -5.982837200164795, "global_step": 62567, "epoch": 1489} {"train_loss": -5.831676483154297, "global_step": 62568, "epoch": 1489} {"train_loss": -5.994365692138672, "global_step": 62569, "epoch": 1489} {"train_loss": -5.9530029296875, "global_step": 62570, "epoch": 1489} {"train_loss": -6.05804443359375, "global_step": 62571, "epoch": 1489} {"train_loss": -5.847100257873535, "global_step": 62572, "epoch": 1489} {"train_loss": -5.84088134765625, "global_step": 62573, "epoch": 1489} {"train_loss": -5.90567684173584, "global_step": 62574, "epoch": 1489} {"train_loss": -5.766870498657227, "global_step": 62575, "epoch": 1489} {"train_loss": -5.783804893493652, "global_step": 62576, "epoch": 1489} {"train_loss": -5.980121612548828, "global_step": 62577, "epoch": 1489} {"train_loss": -5.793369293212891, "global_step": 62578, "epoch": 1489} {"train_loss": -5.92032664162772, "global_step": 62579, "epoch": 1489, "val_loss": 61401.62109375} {"train_loss": -5.80272912979126, "global_step": 62580, "epoch": 1490} {"train_loss": -5.893899917602539, "global_step": 62581, "epoch": 1490} {"train_loss": -5.901910781860352, "global_step": 62582, "epoch": 1490} {"train_loss": -5.902348518371582, "global_step": 62583, "epoch": 1490} {"train_loss": -5.911919593811035, "global_step": 62584, "epoch": 1490} {"train_loss": -6.036589622497559, "global_step": 62585, "epoch": 1490} {"train_loss": -5.947699069976807, "global_step": 62586, "epoch": 1490} {"train_loss": -5.957564830780029, "global_step": 62587, "epoch": 1490} {"train_loss": -5.885403633117676, "global_step": 62588, "epoch": 1490} {"train_loss": -5.890534400939941, "global_step": 62589, "epoch": 1490} {"train_loss": -5.937891006469727, "global_step": 62590, "epoch": 1490} {"train_loss": -5.879014015197754, "global_step": 62591, "epoch": 1490} {"train_loss": -6.00327730178833, "global_step": 62592, "epoch": 1490} {"train_loss": -6.032408714294434, "global_step": 62593, "epoch": 1490} {"train_loss": -5.897899150848389, "global_step": 62594, "epoch": 1490} {"train_loss": -6.153106689453125, "global_step": 62595, "epoch": 1490} {"train_loss": -5.893497467041016, "global_step": 62596, "epoch": 1490} {"train_loss": -5.884028911590576, "global_step": 62597, "epoch": 1490} {"train_loss": -5.953019618988037, "global_step": 62598, "epoch": 1490} {"train_loss": -5.893369674682617, "global_step": 62599, "epoch": 1490} {"train_loss": -5.815129280090332, "global_step": 62600, "epoch": 1490} {"train_loss": -5.898952007293701, "global_step": 62601, "epoch": 1490} {"train_loss": -5.976294994354248, "global_step": 62602, "epoch": 1490} {"train_loss": -5.801844120025635, "global_step": 62603, "epoch": 1490} {"train_loss": -5.947909355163574, "global_step": 62604, "epoch": 1490} {"train_loss": -6.026410102844238, "global_step": 62605, "epoch": 1490} {"train_loss": -5.931024551391602, "global_step": 62606, "epoch": 1490} {"train_loss": -5.950267791748047, "global_step": 62607, "epoch": 1490} {"train_loss": -5.937299728393555, "global_step": 62608, "epoch": 1490} {"train_loss": -5.851131439208984, "global_step": 62609, "epoch": 1490} {"train_loss": -5.901473045349121, "global_step": 62610, "epoch": 1490} {"train_loss": -5.905536651611328, "global_step": 62611, "epoch": 1490} {"train_loss": -5.9617204666137695, "global_step": 62612, "epoch": 1490} {"train_loss": -5.965075492858887, "global_step": 62613, "epoch": 1490} {"train_loss": -5.970142364501953, "global_step": 62614, "epoch": 1490} {"train_loss": -6.069182395935059, "global_step": 62615, "epoch": 1490} {"train_loss": -5.8249664306640625, "global_step": 62616, "epoch": 1490} {"train_loss": -5.871998310089111, "global_step": 62617, "epoch": 1490} {"train_loss": -5.882160186767578, "global_step": 62618, "epoch": 1490} {"train_loss": -5.815990447998047, "global_step": 62619, "epoch": 1490} {"train_loss": -5.87861442565918, "global_step": 62620, "epoch": 1490} {"train_loss": -5.920954329626901, "global_step": 62621, "epoch": 1490, "val_loss": 61448.14453125} {"train_loss": -5.872549057006836, "global_step": 62622, "epoch": 1491} {"train_loss": -5.823177337646484, "global_step": 62623, "epoch": 1491} {"train_loss": -6.059569835662842, "global_step": 62624, "epoch": 1491} {"train_loss": -5.882359504699707, "global_step": 62625, "epoch": 1491} {"train_loss": -5.886456489562988, "global_step": 62626, "epoch": 1491} {"train_loss": -5.960227012634277, "global_step": 62627, "epoch": 1491} {"train_loss": -5.960335731506348, "global_step": 62628, "epoch": 1491} {"train_loss": -5.95034646987915, "global_step": 62629, "epoch": 1491} {"train_loss": -5.765178203582764, "global_step": 62630, "epoch": 1491} {"train_loss": -6.050168991088867, "global_step": 62631, "epoch": 1491} {"train_loss": -5.935009956359863, "global_step": 62632, "epoch": 1491} {"train_loss": -5.8415961265563965, "global_step": 62633, "epoch": 1491} {"train_loss": -6.016709327697754, "global_step": 62634, "epoch": 1491} {"train_loss": -5.804619789123535, "global_step": 62635, "epoch": 1491} {"train_loss": -5.859682083129883, "global_step": 62636, "epoch": 1491} {"train_loss": -5.754961967468262, "global_step": 62637, "epoch": 1491} {"train_loss": -5.907534599304199, "global_step": 62638, "epoch": 1491} {"train_loss": -6.042781829833984, "global_step": 62639, "epoch": 1491} {"train_loss": -5.9320902824401855, "global_step": 62640, "epoch": 1491} {"train_loss": -5.908977031707764, "global_step": 62641, "epoch": 1491} {"train_loss": -5.757357597351074, "global_step": 62642, "epoch": 1491} {"train_loss": -5.829574108123779, "global_step": 62643, "epoch": 1491} {"train_loss": -5.821843147277832, "global_step": 62644, "epoch": 1491} {"train_loss": -5.919915199279785, "global_step": 62645, "epoch": 1491} {"train_loss": -5.908533096313477, "global_step": 62646, "epoch": 1491} {"train_loss": -5.850519180297852, "global_step": 62647, "epoch": 1491} {"train_loss": -6.045106887817383, "global_step": 62648, "epoch": 1491} {"train_loss": -5.931528568267822, "global_step": 62649, "epoch": 1491} {"train_loss": -5.91895866394043, "global_step": 62650, "epoch": 1491} {"train_loss": -5.98615837097168, "global_step": 62651, "epoch": 1491} {"train_loss": -5.898716449737549, "global_step": 62652, "epoch": 1491} {"train_loss": -6.000051498413086, "global_step": 62653, "epoch": 1491} {"train_loss": -5.890903949737549, "global_step": 62654, "epoch": 1491} {"train_loss": -5.910336494445801, "global_step": 62655, "epoch": 1491} {"train_loss": -6.027411460876465, "global_step": 62656, "epoch": 1491} {"train_loss": -5.951325416564941, "global_step": 62657, "epoch": 1491} {"train_loss": -5.9107232093811035, "global_step": 62658, "epoch": 1491} {"train_loss": -5.983096599578857, "global_step": 62659, "epoch": 1491} {"train_loss": -5.922109127044678, "global_step": 62660, "epoch": 1491} {"train_loss": -5.902851104736328, "global_step": 62661, "epoch": 1491} {"train_loss": -5.798890113830566, "global_step": 62662, "epoch": 1491} {"train_loss": -5.906647988728115, "global_step": 62663, "epoch": 1491, "val_loss": 61551.1640625} {"train_loss": -5.789545059204102, "global_step": 62664, "epoch": 1492} {"train_loss": -5.783328056335449, "global_step": 62665, "epoch": 1492} {"train_loss": -5.8166069984436035, "global_step": 62666, "epoch": 1492} {"train_loss": -5.855226993560791, "global_step": 62667, "epoch": 1492} {"train_loss": -5.902841567993164, "global_step": 62668, "epoch": 1492} {"train_loss": -5.912322998046875, "global_step": 62669, "epoch": 1492} {"train_loss": -5.916461944580078, "global_step": 62670, "epoch": 1492} {"train_loss": -5.792922496795654, "global_step": 62671, "epoch": 1492} {"train_loss": -5.9649271965026855, "global_step": 62672, "epoch": 1492} {"train_loss": -5.925474166870117, "global_step": 62673, "epoch": 1492} {"train_loss": -5.851205825805664, "global_step": 62674, "epoch": 1492} {"train_loss": -6.028446674346924, "global_step": 62675, "epoch": 1492} {"train_loss": -5.880624771118164, "global_step": 62676, "epoch": 1492} {"train_loss": -5.791875839233398, "global_step": 62677, "epoch": 1492} {"train_loss": -5.8262786865234375, "global_step": 62678, "epoch": 1492} {"train_loss": -5.956298351287842, "global_step": 62679, "epoch": 1492} {"train_loss": -6.142590045928955, "global_step": 62680, "epoch": 1492} {"train_loss": -5.945615291595459, "global_step": 62681, "epoch": 1492} {"train_loss": -5.96329402923584, "global_step": 62682, "epoch": 1492} {"train_loss": -5.87236213684082, "global_step": 62683, "epoch": 1492} {"train_loss": -5.932819366455078, "global_step": 62684, "epoch": 1492} {"train_loss": -5.960247993469238, "global_step": 62685, "epoch": 1492} {"train_loss": -5.998544216156006, "global_step": 62686, "epoch": 1492} {"train_loss": -5.7986860275268555, "global_step": 62687, "epoch": 1492} {"train_loss": -5.995008945465088, "global_step": 62688, "epoch": 1492} {"train_loss": -6.029780387878418, "global_step": 62689, "epoch": 1492} {"train_loss": -5.987669944763184, "global_step": 62690, "epoch": 1492} {"train_loss": -6.049159526824951, "global_step": 62691, "epoch": 1492} {"train_loss": -5.840863227844238, "global_step": 62692, "epoch": 1492} {"train_loss": -5.843907356262207, "global_step": 62693, "epoch": 1492} {"train_loss": -6.019051551818848, "global_step": 62694, "epoch": 1492} {"train_loss": -6.065335750579834, "global_step": 62695, "epoch": 1492} {"train_loss": -5.96435022354126, "global_step": 62696, "epoch": 1492} {"train_loss": -5.864534378051758, "global_step": 62697, "epoch": 1492} {"train_loss": -5.905792713165283, "global_step": 62698, "epoch": 1492} {"train_loss": -5.909757614135742, "global_step": 62699, "epoch": 1492} {"train_loss": -6.132159233093262, "global_step": 62700, "epoch": 1492} {"train_loss": -5.890758991241455, "global_step": 62701, "epoch": 1492} {"train_loss": -5.983217239379883, "global_step": 62702, "epoch": 1492} {"train_loss": -5.9698076248168945, "global_step": 62703, "epoch": 1492} {"train_loss": -5.937257766723633, "global_step": 62704, "epoch": 1492} {"train_loss": -5.928664990833828, "global_step": 62705, "epoch": 1492, "val_loss": 61338.65234375} {"train_loss": -5.872483253479004, "global_step": 62706, "epoch": 1493} {"train_loss": -5.923108100891113, "global_step": 62707, "epoch": 1493} {"train_loss": -6.056540489196777, "global_step": 62708, "epoch": 1493} {"train_loss": -5.895796775817871, "global_step": 62709, "epoch": 1493} {"train_loss": -6.029149532318115, "global_step": 62710, "epoch": 1493} {"train_loss": -5.852483749389648, "global_step": 62711, "epoch": 1493} {"train_loss": -6.036437034606934, "global_step": 62712, "epoch": 1493} {"train_loss": -6.001053810119629, "global_step": 62713, "epoch": 1493} {"train_loss": -5.850106239318848, "global_step": 62714, "epoch": 1493} {"train_loss": -5.969081401824951, "global_step": 62715, "epoch": 1493} {"train_loss": -6.000093460083008, "global_step": 62716, "epoch": 1493} {"train_loss": -5.939741134643555, "global_step": 62717, "epoch": 1493} {"train_loss": -6.020796298980713, "global_step": 62718, "epoch": 1493} {"train_loss": -5.902866363525391, "global_step": 62719, "epoch": 1493} {"train_loss": -5.973716735839844, "global_step": 62720, "epoch": 1493} {"train_loss": -5.8654327392578125, "global_step": 62721, "epoch": 1493} {"train_loss": -5.951943397521973, "global_step": 62722, "epoch": 1493} {"train_loss": -5.923142433166504, "global_step": 62723, "epoch": 1493} {"train_loss": -6.051261901855469, "global_step": 62724, "epoch": 1493} {"train_loss": -5.871369361877441, "global_step": 62725, "epoch": 1493} {"train_loss": -5.972087860107422, "global_step": 62726, "epoch": 1493} {"train_loss": -6.021216869354248, "global_step": 62727, "epoch": 1493} {"train_loss": -5.942317962646484, "global_step": 62728, "epoch": 1493} {"train_loss": -5.9818925857543945, "global_step": 62729, "epoch": 1493} {"train_loss": -6.146527290344238, "global_step": 62730, "epoch": 1493} {"train_loss": -5.818455219268799, "global_step": 62731, "epoch": 1493} {"train_loss": -5.897339820861816, "global_step": 62732, "epoch": 1493} {"train_loss": -5.940370559692383, "global_step": 62733, "epoch": 1493} {"train_loss": -5.704895496368408, "global_step": 62734, "epoch": 1493} {"train_loss": -5.965193748474121, "global_step": 62735, "epoch": 1493} {"train_loss": -5.867118835449219, "global_step": 62736, "epoch": 1493} {"train_loss": -5.940827369689941, "global_step": 62737, "epoch": 1493} {"train_loss": -5.994182586669922, "global_step": 62738, "epoch": 1493} {"train_loss": -6.086730003356934, "global_step": 62739, "epoch": 1493} {"train_loss": -5.916165828704834, "global_step": 62740, "epoch": 1493} {"train_loss": -5.91429328918457, "global_step": 62741, "epoch": 1493} {"train_loss": -5.850529670715332, "global_step": 62742, "epoch": 1493} {"train_loss": -5.923031330108643, "global_step": 62743, "epoch": 1493} {"train_loss": -5.96875, "global_step": 62744, "epoch": 1493} {"train_loss": -5.899796962738037, "global_step": 62745, "epoch": 1493} {"train_loss": -5.920843124389648, "global_step": 62746, "epoch": 1493} {"train_loss": -5.940250260489328, "global_step": 62747, "epoch": 1493, "val_loss": 61384.63671875} {"train_loss": -6.034907341003418, "global_step": 62748, "epoch": 1494} {"train_loss": -6.004018783569336, "global_step": 62749, "epoch": 1494} {"train_loss": -5.873235702514648, "global_step": 62750, "epoch": 1494} {"train_loss": -5.913875579833984, "global_step": 62751, "epoch": 1494} {"train_loss": -5.932267189025879, "global_step": 62752, "epoch": 1494} {"train_loss": -5.827682971954346, "global_step": 62753, "epoch": 1494} {"train_loss": -6.10344934463501, "global_step": 62754, "epoch": 1494} {"train_loss": -5.7882490158081055, "global_step": 62755, "epoch": 1494} {"train_loss": -5.866167068481445, "global_step": 62756, "epoch": 1494} {"train_loss": -5.895381927490234, "global_step": 62757, "epoch": 1494} {"train_loss": -5.8531575202941895, "global_step": 62758, "epoch": 1494} {"train_loss": -6.002920150756836, "global_step": 62759, "epoch": 1494} {"train_loss": -5.8914899826049805, "global_step": 62760, "epoch": 1494} {"train_loss": -5.949797630310059, "global_step": 62761, "epoch": 1494} {"train_loss": -5.933113098144531, "global_step": 62762, "epoch": 1494} {"train_loss": -5.897092342376709, "global_step": 62763, "epoch": 1494} {"train_loss": -5.939538955688477, "global_step": 62764, "epoch": 1494} {"train_loss": -5.919588565826416, "global_step": 62765, "epoch": 1494} {"train_loss": -5.936025142669678, "global_step": 62766, "epoch": 1494} {"train_loss": -6.060833930969238, "global_step": 62767, "epoch": 1494} {"train_loss": -5.873543739318848, "global_step": 62768, "epoch": 1494} {"train_loss": -5.9524617195129395, "global_step": 62769, "epoch": 1494} {"train_loss": -5.782566070556641, "global_step": 62770, "epoch": 1494} {"train_loss": -5.929741859436035, "global_step": 62771, "epoch": 1494} {"train_loss": -5.866198539733887, "global_step": 62772, "epoch": 1494} {"train_loss": -5.958412170410156, "global_step": 62773, "epoch": 1494} {"train_loss": -5.952712059020996, "global_step": 62774, "epoch": 1494} {"train_loss": -5.916298866271973, "global_step": 62775, "epoch": 1494} {"train_loss": -5.942109107971191, "global_step": 62776, "epoch": 1494} {"train_loss": -5.987725257873535, "global_step": 62777, "epoch": 1494} {"train_loss": -5.925773620605469, "global_step": 62778, "epoch": 1494} {"train_loss": -5.90507698059082, "global_step": 62779, "epoch": 1494} {"train_loss": -5.93878698348999, "global_step": 62780, "epoch": 1494} {"train_loss": -5.932337284088135, "global_step": 62781, "epoch": 1494} {"train_loss": -6.112694263458252, "global_step": 62782, "epoch": 1494} {"train_loss": -6.0141072273254395, "global_step": 62783, "epoch": 1494} {"train_loss": -5.8482794761657715, "global_step": 62784, "epoch": 1494} {"train_loss": -5.912406921386719, "global_step": 62785, "epoch": 1494} {"train_loss": -5.906089782714844, "global_step": 62786, "epoch": 1494} {"train_loss": -5.86966609954834, "global_step": 62787, "epoch": 1494} {"train_loss": -5.855990409851074, "global_step": 62788, "epoch": 1494} {"train_loss": -5.925379832585652, "global_step": 62789, "epoch": 1494, "val_loss": 61221.69921875} {"train_loss": -5.997401237487793, "global_step": 62790, "epoch": 1495} {"train_loss": -5.939599514007568, "global_step": 62791, "epoch": 1495} {"train_loss": -6.043013572692871, "global_step": 62792, "epoch": 1495} {"train_loss": -5.881411552429199, "global_step": 62793, "epoch": 1495} {"train_loss": -5.958476543426514, "global_step": 62794, "epoch": 1495} {"train_loss": -6.000585556030273, "global_step": 62795, "epoch": 1495} {"train_loss": -5.900845527648926, "global_step": 62796, "epoch": 1495} {"train_loss": -5.896524429321289, "global_step": 62797, "epoch": 1495} {"train_loss": -5.834808349609375, "global_step": 62798, "epoch": 1495} {"train_loss": -5.866252899169922, "global_step": 62799, "epoch": 1495} {"train_loss": -5.899198532104492, "global_step": 62800, "epoch": 1495} {"train_loss": -6.035436153411865, "global_step": 62801, "epoch": 1495} {"train_loss": -5.895796298980713, "global_step": 62802, "epoch": 1495} {"train_loss": -5.765120506286621, "global_step": 62803, "epoch": 1495} {"train_loss": -5.94011116027832, "global_step": 62804, "epoch": 1495} {"train_loss": -5.90767765045166, "global_step": 62805, "epoch": 1495} {"train_loss": -5.830268859863281, "global_step": 62806, "epoch": 1495} {"train_loss": -5.890229225158691, "global_step": 62807, "epoch": 1495} {"train_loss": -5.995089054107666, "global_step": 62808, "epoch": 1495} {"train_loss": -5.965478420257568, "global_step": 62809, "epoch": 1495} {"train_loss": -5.877913475036621, "global_step": 62810, "epoch": 1495} {"train_loss": -5.988120079040527, "global_step": 62811, "epoch": 1495} {"train_loss": -5.942093372344971, "global_step": 62812, "epoch": 1495} {"train_loss": -5.952156066894531, "global_step": 62813, "epoch": 1495} {"train_loss": -5.934370040893555, "global_step": 62814, "epoch": 1495} {"train_loss": -5.877753257751465, "global_step": 62815, "epoch": 1495} {"train_loss": -5.957701206207275, "global_step": 62816, "epoch": 1495} {"train_loss": -6.02168607711792, "global_step": 62817, "epoch": 1495} {"train_loss": -6.026430130004883, "global_step": 62818, "epoch": 1495} {"train_loss": -5.940464973449707, "global_step": 62819, "epoch": 1495} {"train_loss": -5.86660099029541, "global_step": 62820, "epoch": 1495} {"train_loss": -5.977780818939209, "global_step": 62821, "epoch": 1495} {"train_loss": -5.967761993408203, "global_step": 62822, "epoch": 1495} {"train_loss": -6.0145649909973145, "global_step": 62823, "epoch": 1495} {"train_loss": -5.925932884216309, "global_step": 62824, "epoch": 1495} {"train_loss": -6.003782272338867, "global_step": 62825, "epoch": 1495} {"train_loss": -5.9682745933532715, "global_step": 62826, "epoch": 1495} {"train_loss": -5.9986677169799805, "global_step": 62827, "epoch": 1495} {"train_loss": -6.014931678771973, "global_step": 62828, "epoch": 1495} {"train_loss": -5.9614362716674805, "global_step": 62829, "epoch": 1495} {"train_loss": -5.830345153808594, "global_step": 62830, "epoch": 1495} {"train_loss": -5.941425459725516, "global_step": 62831, "epoch": 1495, "val_loss": 61280.0546875} {"train_loss": -5.879018783569336, "global_step": 62832, "epoch": 1496} {"train_loss": -5.842327117919922, "global_step": 62833, "epoch": 1496} {"train_loss": -5.934744834899902, "global_step": 62834, "epoch": 1496} {"train_loss": -5.860940933227539, "global_step": 62835, "epoch": 1496} {"train_loss": -5.8845086097717285, "global_step": 62836, "epoch": 1496} {"train_loss": -5.975325107574463, "global_step": 62837, "epoch": 1496} {"train_loss": -5.864137649536133, "global_step": 62838, "epoch": 1496} {"train_loss": -5.892275333404541, "global_step": 62839, "epoch": 1496} {"train_loss": -5.9225754737854, "global_step": 62840, "epoch": 1496} {"train_loss": -5.761207103729248, "global_step": 62841, "epoch": 1496} {"train_loss": -5.952789783477783, "global_step": 62842, "epoch": 1496} {"train_loss": -5.9307427406311035, "global_step": 62843, "epoch": 1496} {"train_loss": -5.938386917114258, "global_step": 62844, "epoch": 1496} {"train_loss": -5.9582624435424805, "global_step": 62845, "epoch": 1496} {"train_loss": -5.883034706115723, "global_step": 62846, "epoch": 1496} {"train_loss": -6.025855541229248, "global_step": 62847, "epoch": 1496} {"train_loss": -5.986762046813965, "global_step": 62848, "epoch": 1496} {"train_loss": -5.991347312927246, "global_step": 62849, "epoch": 1496} {"train_loss": -5.974355697631836, "global_step": 62850, "epoch": 1496} {"train_loss": -5.7806596755981445, "global_step": 62851, "epoch": 1496} {"train_loss": -5.901497840881348, "global_step": 62852, "epoch": 1496} {"train_loss": -5.820326805114746, "global_step": 62853, "epoch": 1496} {"train_loss": -5.839198112487793, "global_step": 62854, "epoch": 1496} {"train_loss": -5.9551520347595215, "global_step": 62855, "epoch": 1496} {"train_loss": -5.806492805480957, "global_step": 62856, "epoch": 1496} {"train_loss": -5.941221237182617, "global_step": 62857, "epoch": 1496} {"train_loss": -5.973793983459473, "global_step": 62858, "epoch": 1496} {"train_loss": -5.814519882202148, "global_step": 62859, "epoch": 1496} {"train_loss": -6.031201362609863, "global_step": 62860, "epoch": 1496} {"train_loss": -5.921371936798096, "global_step": 62861, "epoch": 1496} {"train_loss": -5.965524673461914, "global_step": 62862, "epoch": 1496} {"train_loss": -5.90809965133667, "global_step": 62863, "epoch": 1496} {"train_loss": -5.876810550689697, "global_step": 62864, "epoch": 1496} {"train_loss": -5.912664890289307, "global_step": 62865, "epoch": 1496} {"train_loss": -5.920471668243408, "global_step": 62866, "epoch": 1496} {"train_loss": -6.013617992401123, "global_step": 62867, "epoch": 1496} {"train_loss": -5.887233734130859, "global_step": 62868, "epoch": 1496} {"train_loss": -5.980338096618652, "global_step": 62869, "epoch": 1496} {"train_loss": -5.914427280426025, "global_step": 62870, "epoch": 1496} {"train_loss": -5.899496078491211, "global_step": 62871, "epoch": 1496} {"train_loss": -5.881068229675293, "global_step": 62872, "epoch": 1496} {"train_loss": -5.911916142418271, "global_step": 62873, "epoch": 1496, "val_loss": 61522.9453125} {"train_loss": -5.939642906188965, "global_step": 62874, "epoch": 1497} {"train_loss": -5.975412368774414, "global_step": 62875, "epoch": 1497} {"train_loss": -5.982393264770508, "global_step": 62876, "epoch": 1497} {"train_loss": -5.926122665405273, "global_step": 62877, "epoch": 1497} {"train_loss": -6.049147605895996, "global_step": 62878, "epoch": 1497} {"train_loss": -5.833688259124756, "global_step": 62879, "epoch": 1497} {"train_loss": -5.805381774902344, "global_step": 62880, "epoch": 1497} {"train_loss": -5.927711009979248, "global_step": 62881, "epoch": 1497} {"train_loss": -5.802586555480957, "global_step": 62882, "epoch": 1497} {"train_loss": -5.8755340576171875, "global_step": 62883, "epoch": 1497} {"train_loss": -5.920212745666504, "global_step": 62884, "epoch": 1497} {"train_loss": -5.862557888031006, "global_step": 62885, "epoch": 1497} {"train_loss": -6.031929969787598, "global_step": 62886, "epoch": 1497} {"train_loss": -5.764274597167969, "global_step": 62887, "epoch": 1497} {"train_loss": -5.96596622467041, "global_step": 62888, "epoch": 1497} {"train_loss": -5.705927848815918, "global_step": 62889, "epoch": 1497} {"train_loss": -5.826089382171631, "global_step": 62890, "epoch": 1497} {"train_loss": -5.871119499206543, "global_step": 62891, "epoch": 1497} {"train_loss": -5.872229099273682, "global_step": 62892, "epoch": 1497} {"train_loss": -5.778615474700928, "global_step": 62893, "epoch": 1497} {"train_loss": -5.8040032386779785, "global_step": 62894, "epoch": 1497} {"train_loss": -5.891225814819336, "global_step": 62895, "epoch": 1497} {"train_loss": -5.836806297302246, "global_step": 62896, "epoch": 1497} {"train_loss": -5.8245391845703125, "global_step": 62897, "epoch": 1497} {"train_loss": -5.810029983520508, "global_step": 62898, "epoch": 1497} {"train_loss": -5.984734535217285, "global_step": 62899, "epoch": 1497} {"train_loss": -5.9871344566345215, "global_step": 62900, "epoch": 1497} {"train_loss": -6.068490505218506, "global_step": 62901, "epoch": 1497} {"train_loss": -5.908144474029541, "global_step": 62902, "epoch": 1497} {"train_loss": -5.8883514404296875, "global_step": 62903, "epoch": 1497} {"train_loss": -5.852479934692383, "global_step": 62904, "epoch": 1497} {"train_loss": -5.915184497833252, "global_step": 62905, "epoch": 1497} {"train_loss": -5.9414472579956055, "global_step": 62906, "epoch": 1497} {"train_loss": -5.914177894592285, "global_step": 62907, "epoch": 1497} {"train_loss": -5.88035249710083, "global_step": 62908, "epoch": 1497} {"train_loss": -5.906492710113525, "global_step": 62909, "epoch": 1497} {"train_loss": -5.910017013549805, "global_step": 62910, "epoch": 1497} {"train_loss": -5.824338436126709, "global_step": 62911, "epoch": 1497} {"train_loss": -5.84374475479126, "global_step": 62912, "epoch": 1497} {"train_loss": -5.978638648986816, "global_step": 62913, "epoch": 1497} {"train_loss": -5.8712053298950195, "global_step": 62914, "epoch": 1497} {"train_loss": -5.894384463628133, "global_step": 62915, "epoch": 1497, "val_loss": 61470.0546875} {"train_loss": -5.882994651794434, "global_step": 62916, "epoch": 1498} {"train_loss": -5.85335636138916, "global_step": 62917, "epoch": 1498} {"train_loss": -5.95438289642334, "global_step": 62918, "epoch": 1498} {"train_loss": -5.937495708465576, "global_step": 62919, "epoch": 1498} {"train_loss": -5.936774730682373, "global_step": 62920, "epoch": 1498} {"train_loss": -5.9704461097717285, "global_step": 62921, "epoch": 1498} {"train_loss": -5.911420822143555, "global_step": 62922, "epoch": 1498} {"train_loss": -5.940507888793945, "global_step": 62923, "epoch": 1498} {"train_loss": -5.893501281738281, "global_step": 62924, "epoch": 1498} {"train_loss": -5.792462348937988, "global_step": 62925, "epoch": 1498} {"train_loss": -5.921689987182617, "global_step": 62926, "epoch": 1498} {"train_loss": -5.950395584106445, "global_step": 62927, "epoch": 1498} {"train_loss": -5.873085975646973, "global_step": 62928, "epoch": 1498} {"train_loss": -5.973272323608398, "global_step": 62929, "epoch": 1498} {"train_loss": -5.85896110534668, "global_step": 62930, "epoch": 1498} {"train_loss": -6.0099334716796875, "global_step": 62931, "epoch": 1498} {"train_loss": -5.991581916809082, "global_step": 62932, "epoch": 1498} {"train_loss": -5.873706340789795, "global_step": 62933, "epoch": 1498} {"train_loss": -5.911712646484375, "global_step": 62934, "epoch": 1498} {"train_loss": -5.9429779052734375, "global_step": 62935, "epoch": 1498} {"train_loss": -5.849625587463379, "global_step": 62936, "epoch": 1498} {"train_loss": -6.00081205368042, "global_step": 62937, "epoch": 1498} {"train_loss": -5.944070339202881, "global_step": 62938, "epoch": 1498} {"train_loss": -5.804141521453857, "global_step": 62939, "epoch": 1498} {"train_loss": -6.052949905395508, "global_step": 62940, "epoch": 1498} {"train_loss": -6.064006328582764, "global_step": 62941, "epoch": 1498} {"train_loss": -5.938343524932861, "global_step": 62942, "epoch": 1498} {"train_loss": -5.910517692565918, "global_step": 62943, "epoch": 1498} {"train_loss": -6.022141933441162, "global_step": 62944, "epoch": 1498} {"train_loss": -5.788209438323975, "global_step": 62945, "epoch": 1498} {"train_loss": -5.932763576507568, "global_step": 62946, "epoch": 1498} {"train_loss": -5.9506425857543945, "global_step": 62947, "epoch": 1498} {"train_loss": -6.001629829406738, "global_step": 62948, "epoch": 1498} {"train_loss": -5.942055702209473, "global_step": 62949, "epoch": 1498} {"train_loss": -6.044539928436279, "global_step": 62950, "epoch": 1498} {"train_loss": -5.8857831954956055, "global_step": 62951, "epoch": 1498} {"train_loss": -6.0086469650268555, "global_step": 62952, "epoch": 1498} {"train_loss": -5.933349609375, "global_step": 62953, "epoch": 1498} {"train_loss": -5.8679656982421875, "global_step": 62954, "epoch": 1498} {"train_loss": -5.900572299957275, "global_step": 62955, "epoch": 1498} {"train_loss": -5.765477180480957, "global_step": 62956, "epoch": 1498} {"train_loss": -5.929573831104097, "global_step": 62957, "epoch": 1498, "val_loss": 61605.8828125} {"train_loss": -5.839993476867676, "global_step": 62958, "epoch": 1499} {"train_loss": -5.827040195465088, "global_step": 62959, "epoch": 1499} {"train_loss": -6.0188093185424805, "global_step": 62960, "epoch": 1499} {"train_loss": -5.907641410827637, "global_step": 62961, "epoch": 1499} {"train_loss": -5.785211563110352, "global_step": 62962, "epoch": 1499} {"train_loss": -5.9065728187561035, "global_step": 62963, "epoch": 1499} {"train_loss": -5.90821647644043, "global_step": 62964, "epoch": 1499} {"train_loss": -5.833336353302002, "global_step": 62965, "epoch": 1499} {"train_loss": -6.039492130279541, "global_step": 62966, "epoch": 1499} {"train_loss": -5.808813571929932, "global_step": 62967, "epoch": 1499} {"train_loss": -6.01163387298584, "global_step": 62968, "epoch": 1499} {"train_loss": -5.850977897644043, "global_step": 62969, "epoch": 1499} {"train_loss": -5.92537784576416, "global_step": 62970, "epoch": 1499} {"train_loss": -6.003853797912598, "global_step": 62971, "epoch": 1499} {"train_loss": -5.912230968475342, "global_step": 62972, "epoch": 1499} {"train_loss": -5.963437080383301, "global_step": 62973, "epoch": 1499} {"train_loss": -5.902389049530029, "global_step": 62974, "epoch": 1499} {"train_loss": -6.00287389755249, "global_step": 62975, "epoch": 1499} {"train_loss": -6.056848526000977, "global_step": 62976, "epoch": 1499} {"train_loss": -5.827533721923828, "global_step": 62977, "epoch": 1499} {"train_loss": -6.011445999145508, "global_step": 62978, "epoch": 1499} {"train_loss": -6.082027435302734, "global_step": 62979, "epoch": 1499} {"train_loss": -5.987349987030029, "global_step": 62980, "epoch": 1499} {"train_loss": -5.87395715713501, "global_step": 62981, "epoch": 1499} {"train_loss": -5.8992438316345215, "global_step": 62982, "epoch": 1499} {"train_loss": -5.9891252517700195, "global_step": 62983, "epoch": 1499} {"train_loss": -6.0322184562683105, "global_step": 62984, "epoch": 1499} {"train_loss": -5.950528144836426, "global_step": 62985, "epoch": 1499} {"train_loss": -5.931458473205566, "global_step": 62986, "epoch": 1499} {"train_loss": -5.986199378967285, "global_step": 62987, "epoch": 1499} {"train_loss": -5.9296956062316895, "global_step": 62988, "epoch": 1499} {"train_loss": -6.072397232055664, "global_step": 62989, "epoch": 1499} {"train_loss": -5.936636924743652, "global_step": 62990, "epoch": 1499} {"train_loss": -5.950446128845215, "global_step": 62991, "epoch": 1499} {"train_loss": -5.940367221832275, "global_step": 62992, "epoch": 1499} {"train_loss": -5.903212547302246, "global_step": 62993, "epoch": 1499} {"train_loss": -5.9987945556640625, "global_step": 62994, "epoch": 1499} {"train_loss": -5.95124626159668, "global_step": 62995, "epoch": 1499} {"train_loss": -5.906989574432373, "global_step": 62996, "epoch": 1499} {"train_loss": -5.931301116943359, "global_step": 62997, "epoch": 1499} {"train_loss": -5.869417667388916, "global_step": 62998, "epoch": 1499} {"train_loss": -5.936582860492525, "global_step": 62999, "epoch": 1499, "val_loss": 61156.89453125} {"train_loss": -5.97930908203125, "global_step": 63000, "epoch": 1500} {"train_loss": -5.9549713134765625, "global_step": 63001, "epoch": 1500} {"train_loss": -5.947248458862305, "global_step": 63002, "epoch": 1500} {"train_loss": -5.915293216705322, "global_step": 63003, "epoch": 1500} {"train_loss": -6.010967254638672, "global_step": 63004, "epoch": 1500} {"train_loss": -6.006635665893555, "global_step": 63005, "epoch": 1500} {"train_loss": -6.028814315795898, "global_step": 63006, "epoch": 1500} {"train_loss": -5.932553291320801, "global_step": 63007, "epoch": 1500} {"train_loss": -5.984603404998779, "global_step": 63008, "epoch": 1500} {"train_loss": -5.995365142822266, "global_step": 63009, "epoch": 1500} {"train_loss": -5.9130473136901855, "global_step": 63010, "epoch": 1500} {"train_loss": -5.984107971191406, "global_step": 63011, "epoch": 1500} {"train_loss": -5.979248046875, "global_step": 63012, "epoch": 1500} {"train_loss": -5.9100446701049805, "global_step": 63013, "epoch": 1500} {"train_loss": -6.026237964630127, "global_step": 63014, "epoch": 1500} {"train_loss": -5.974257469177246, "global_step": 63015, "epoch": 1500} {"train_loss": -5.846386909484863, "global_step": 63016, "epoch": 1500} {"train_loss": -5.873376846313477, "global_step": 63017, "epoch": 1500} {"train_loss": -5.9125590324401855, "global_step": 63018, "epoch": 1500} {"train_loss": -5.902798652648926, "global_step": 63019, "epoch": 1500} {"train_loss": -6.011138916015625, "global_step": 63020, "epoch": 1500} {"train_loss": -5.785182476043701, "global_step": 63021, "epoch": 1500} {"train_loss": -5.753662109375, "global_step": 63022, "epoch": 1500} {"train_loss": -5.935731887817383, "global_step": 63023, "epoch": 1500} {"train_loss": -5.677234172821045, "global_step": 63024, "epoch": 1500} {"train_loss": -6.071985244750977, "global_step": 63025, "epoch": 1500} {"train_loss": -5.867275238037109, "global_step": 63026, "epoch": 1500} {"train_loss": -5.842531204223633, "global_step": 63027, "epoch": 1500} {"train_loss": -5.759425163269043, "global_step": 63028, "epoch": 1500} {"train_loss": -5.9377241134643555, "global_step": 63029, "epoch": 1500} {"train_loss": -5.893402099609375, "global_step": 63030, "epoch": 1500} {"train_loss": -5.863420009613037, "global_step": 63031, "epoch": 1500} {"train_loss": -5.912343978881836, "global_step": 63032, "epoch": 1500} {"train_loss": -5.798237323760986, "global_step": 63033, "epoch": 1500} {"train_loss": -5.924202919006348, "global_step": 63034, "epoch": 1500} {"train_loss": -5.775230407714844, "global_step": 63035, "epoch": 1500} {"train_loss": -5.996670722961426, "global_step": 63036, "epoch": 1500} {"train_loss": -5.879302024841309, "global_step": 63037, "epoch": 1500} {"train_loss": -5.970128536224365, "global_step": 63038, "epoch": 1500} {"train_loss": -5.927023887634277, "global_step": 63039, "epoch": 1500} {"train_loss": -5.913374900817871, "global_step": 63040, "epoch": 1500} {"train_loss": -5.917730047589257, "global_step": 63041, "epoch": 1500, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.8403583804714637, "train/sim_max_reward_2": 0.6219527060962026, "train/sim_max_reward_3": 0.16684469869483728, "train/sim_max_reward_4": 0.8855846425326326, "train/sim_max_reward_5": 0.76775388142541, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.3276492273123253, "test/sim_max_reward_4300002": 0.8111648045662437, "test/sim_max_reward_4300003": 0.9084542311396567, "test/sim_max_reward_4300004": 0.8997526040573366, "test/sim_max_reward_4300005": 0.987603917533656, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.38555054548321344, "test/sim_max_reward_4300008": 0.6160220186838256, "test/sim_max_reward_4300009": 0.6932467673080303, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.8879512241860534, "test/sim_max_reward_4300012": 0.9851238524301069, "test/sim_max_reward_4300013": 0.9652189578487703, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.6111676577321435, "test/sim_max_reward_4300016": 0.8897247899673358, "test/sim_max_reward_4300017": 0.5383403959560327, "test/sim_max_reward_4300018": 0.8152738968286783, "test/sim_max_reward_4300019": 0.18475194275210866, "test/sim_max_reward_4300020": 0.7865821118696339, "test/sim_max_reward_4300021": 0.8281217647121859, "test/sim_max_reward_4300022": 0.3273809695295093, "test/sim_max_reward_4300023": 0.33947737434586117, "test/sim_max_reward_4300024": 0.4816429834684127, "test/sim_max_reward_4300025": 0.19587430684071308, "test/sim_max_reward_4300026": 0.05928407227931195, "test/sim_max_reward_4300027": 0.7310308613601508, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.5941934123408972, "test/sim_max_reward_4300030": 0.9267549133440002, "test/sim_max_reward_4300031": 0.24032251248473618, "test/sim_max_reward_4300032": 0.8709413276091504, "test/sim_max_reward_4300033": 0.6629635522843268, "test/sim_max_reward_4300034": 0.11743089681843037, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9782656385575964, "test/sim_max_reward_4300038": 0.5777125786795962, "test/sim_max_reward_4300039": 0.9676404212937261, "test/sim_max_reward_4300040": 0.933807824849897, "test/sim_max_reward_4300041": 0.16553897178327925, "test/sim_max_reward_4300042": 0.5838357670578982, "test/sim_max_reward_4300043": 0.15661230851473482, "test/sim_max_reward_4300044": 0.6881859481133403, "test/sim_max_reward_4300045": 0.19009530119634063, "test/sim_max_reward_4300046": 0.9148945334666122, "test/sim_max_reward_4300047": 0.9560365346085085, "test/sim_max_reward_4300048": 0.8779137440080502, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.578798634304433, "test/mean_score": 0.5571746316153179, "val_loss": 61679.70703125} {"train_loss": -5.862807273864746, "global_step": 63042, "epoch": 1501} {"train_loss": -5.916234493255615, "global_step": 63043, "epoch": 1501} {"train_loss": -5.913468360900879, "global_step": 63044, "epoch": 1501} {"train_loss": -5.953945159912109, "global_step": 63045, "epoch": 1501} {"train_loss": -5.845648288726807, "global_step": 63046, "epoch": 1501} {"train_loss": -6.0772199630737305, "global_step": 63047, "epoch": 1501} {"train_loss": -5.9282379150390625, "global_step": 63048, "epoch": 1501} {"train_loss": -5.973423957824707, "global_step": 63049, "epoch": 1501} {"train_loss": -5.923796653747559, "global_step": 63050, "epoch": 1501} {"train_loss": -5.998641014099121, "global_step": 63051, "epoch": 1501} {"train_loss": -5.879283905029297, "global_step": 63052, "epoch": 1501} {"train_loss": -5.972412109375, "global_step": 63053, "epoch": 1501} {"train_loss": -5.973361015319824, "global_step": 63054, "epoch": 1501} {"train_loss": -5.926957130432129, "global_step": 63055, "epoch": 1501} {"train_loss": -5.972616195678711, "global_step": 63056, "epoch": 1501} {"train_loss": -5.902903079986572, "global_step": 63057, "epoch": 1501} {"train_loss": -5.841827392578125, "global_step": 63058, "epoch": 1501} {"train_loss": -6.05677604675293, "global_step": 63059, "epoch": 1501} {"train_loss": -5.981782913208008, "global_step": 63060, "epoch": 1501} {"train_loss": -5.76334285736084, "global_step": 63061, "epoch": 1501} {"train_loss": -5.997173309326172, "global_step": 63062, "epoch": 1501} {"train_loss": -6.018514633178711, "global_step": 63063, "epoch": 1501} {"train_loss": -5.774779319763184, "global_step": 63064, "epoch": 1501} {"train_loss": -5.962803840637207, "global_step": 63065, "epoch": 1501} {"train_loss": -5.782744407653809, "global_step": 63066, "epoch": 1501} {"train_loss": -5.858392238616943, "global_step": 63067, "epoch": 1501} {"train_loss": -5.880092620849609, "global_step": 63068, "epoch": 1501} {"train_loss": -5.847155570983887, "global_step": 63069, "epoch": 1501} {"train_loss": -5.802347183227539, "global_step": 63070, "epoch": 1501} {"train_loss": -5.894391059875488, "global_step": 63071, "epoch": 1501} {"train_loss": -5.925661087036133, "global_step": 63072, "epoch": 1501} {"train_loss": -5.900864124298096, "global_step": 63073, "epoch": 1501} {"train_loss": -5.944586753845215, "global_step": 63074, "epoch": 1501} {"train_loss": -5.905728340148926, "global_step": 63075, "epoch": 1501} {"train_loss": -5.790106773376465, "global_step": 63076, "epoch": 1501} {"train_loss": -5.88929557800293, "global_step": 63077, "epoch": 1501} {"train_loss": -5.906350135803223, "global_step": 63078, "epoch": 1501} {"train_loss": -5.9185686111450195, "global_step": 63079, "epoch": 1501} {"train_loss": -5.920175552368164, "global_step": 63080, "epoch": 1501} {"train_loss": -5.964081287384033, "global_step": 63081, "epoch": 1501} {"train_loss": -5.931595802307129, "global_step": 63082, "epoch": 1501} {"train_loss": -5.914692106701079, "global_step": 63083, "epoch": 1501, "val_loss": 61703.9453125} {"train_loss": -5.947934150695801, "global_step": 63084, "epoch": 1502} {"train_loss": -5.926121234893799, "global_step": 63085, "epoch": 1502} {"train_loss": -5.870604991912842, "global_step": 63086, "epoch": 1502} {"train_loss": -6.028141021728516, "global_step": 63087, "epoch": 1502} {"train_loss": -5.929949760437012, "global_step": 63088, "epoch": 1502} {"train_loss": -5.890842437744141, "global_step": 63089, "epoch": 1502} {"train_loss": -5.943922996520996, "global_step": 63090, "epoch": 1502} {"train_loss": -5.986230850219727, "global_step": 63091, "epoch": 1502} {"train_loss": -5.917507171630859, "global_step": 63092, "epoch": 1502} {"train_loss": -5.930661201477051, "global_step": 63093, "epoch": 1502} {"train_loss": -5.8778839111328125, "global_step": 63094, "epoch": 1502} {"train_loss": -5.913617134094238, "global_step": 63095, "epoch": 1502} {"train_loss": -6.0731048583984375, "global_step": 63096, "epoch": 1502} {"train_loss": -5.971543312072754, "global_step": 63097, "epoch": 1502} {"train_loss": -5.9268622398376465, "global_step": 63098, "epoch": 1502} {"train_loss": -6.109929084777832, "global_step": 63099, "epoch": 1502} {"train_loss": -5.903957366943359, "global_step": 63100, "epoch": 1502} {"train_loss": -5.948585033416748, "global_step": 63101, "epoch": 1502} {"train_loss": -6.01889705657959, "global_step": 63102, "epoch": 1502} {"train_loss": -5.9030632972717285, "global_step": 63103, "epoch": 1502} {"train_loss": -5.953020095825195, "global_step": 63104, "epoch": 1502} {"train_loss": -5.8562211990356445, "global_step": 63105, "epoch": 1502} {"train_loss": -5.873883247375488, "global_step": 63106, "epoch": 1502} {"train_loss": -5.872666358947754, "global_step": 63107, "epoch": 1502} {"train_loss": -5.820978164672852, "global_step": 63108, "epoch": 1502} {"train_loss": -5.873329162597656, "global_step": 63109, "epoch": 1502} {"train_loss": -5.918630123138428, "global_step": 63110, "epoch": 1502} {"train_loss": -5.801774978637695, "global_step": 63111, "epoch": 1502} {"train_loss": -5.916481018066406, "global_step": 63112, "epoch": 1502} {"train_loss": -5.833867073059082, "global_step": 63113, "epoch": 1502} {"train_loss": -5.873987197875977, "global_step": 63114, "epoch": 1502} {"train_loss": -5.842126846313477, "global_step": 63115, "epoch": 1502} {"train_loss": -5.9953413009643555, "global_step": 63116, "epoch": 1502} {"train_loss": -5.89954948425293, "global_step": 63117, "epoch": 1502} {"train_loss": -5.885369300842285, "global_step": 63118, "epoch": 1502} {"train_loss": -5.942525863647461, "global_step": 63119, "epoch": 1502} {"train_loss": -5.929129600524902, "global_step": 63120, "epoch": 1502} {"train_loss": -5.851747035980225, "global_step": 63121, "epoch": 1502} {"train_loss": -5.96539306640625, "global_step": 63122, "epoch": 1502} {"train_loss": -5.890949249267578, "global_step": 63123, "epoch": 1502} {"train_loss": -5.9534010887146, "global_step": 63124, "epoch": 1502} {"train_loss": -5.923613866170247, "global_step": 63125, "epoch": 1502, "val_loss": 61752.58984375} {"train_loss": -5.837801456451416, "global_step": 63126, "epoch": 1503} {"train_loss": -5.889305114746094, "global_step": 63127, "epoch": 1503} {"train_loss": -5.763521671295166, "global_step": 63128, "epoch": 1503} {"train_loss": -6.001089572906494, "global_step": 63129, "epoch": 1503} {"train_loss": -5.948318958282471, "global_step": 63130, "epoch": 1503} {"train_loss": -5.947894096374512, "global_step": 63131, "epoch": 1503} {"train_loss": -5.975729942321777, "global_step": 63132, "epoch": 1503} {"train_loss": -5.983633995056152, "global_step": 63133, "epoch": 1503} {"train_loss": -5.948310852050781, "global_step": 63134, "epoch": 1503} {"train_loss": -5.910871982574463, "global_step": 63135, "epoch": 1503} {"train_loss": -5.935606002807617, "global_step": 63136, "epoch": 1503} {"train_loss": -5.893020153045654, "global_step": 63137, "epoch": 1503} {"train_loss": -5.930371284484863, "global_step": 63138, "epoch": 1503} {"train_loss": -5.956501483917236, "global_step": 63139, "epoch": 1503} {"train_loss": -5.980622291564941, "global_step": 63140, "epoch": 1503} {"train_loss": -5.91396427154541, "global_step": 63141, "epoch": 1503} {"train_loss": -5.909335136413574, "global_step": 63142, "epoch": 1503} {"train_loss": -5.9698638916015625, "global_step": 63143, "epoch": 1503} {"train_loss": -5.8877716064453125, "global_step": 63144, "epoch": 1503} {"train_loss": -5.948454856872559, "global_step": 63145, "epoch": 1503} {"train_loss": -5.872103214263916, "global_step": 63146, "epoch": 1503} {"train_loss": -5.9295454025268555, "global_step": 63147, "epoch": 1503} {"train_loss": -6.090365409851074, "global_step": 63148, "epoch": 1503} {"train_loss": -5.9576568603515625, "global_step": 63149, "epoch": 1503} {"train_loss": -5.952086448669434, "global_step": 63150, "epoch": 1503} {"train_loss": -5.976805210113525, "global_step": 63151, "epoch": 1503} {"train_loss": -5.866950988769531, "global_step": 63152, "epoch": 1503} {"train_loss": -5.940209865570068, "global_step": 63153, "epoch": 1503} {"train_loss": -5.909483909606934, "global_step": 63154, "epoch": 1503} {"train_loss": -5.9948225021362305, "global_step": 63155, "epoch": 1503} {"train_loss": -5.956332683563232, "global_step": 63156, "epoch": 1503} {"train_loss": -5.961296081542969, "global_step": 63157, "epoch": 1503} {"train_loss": -5.921091079711914, "global_step": 63158, "epoch": 1503} {"train_loss": -5.836805820465088, "global_step": 63159, "epoch": 1503} {"train_loss": -5.963855743408203, "global_step": 63160, "epoch": 1503} {"train_loss": -5.965299606323242, "global_step": 63161, "epoch": 1503} {"train_loss": -5.960247993469238, "global_step": 63162, "epoch": 1503} {"train_loss": -5.954390525817871, "global_step": 63163, "epoch": 1503} {"train_loss": -5.9706711769104, "global_step": 63164, "epoch": 1503} {"train_loss": -5.981237411499023, "global_step": 63165, "epoch": 1503} {"train_loss": -6.0807929039001465, "global_step": 63166, "epoch": 1503} {"train_loss": -5.943817626862299, "global_step": 63167, "epoch": 1503, "val_loss": 61433.39453125} {"train_loss": -5.93931770324707, "global_step": 63168, "epoch": 1504} {"train_loss": -5.86515998840332, "global_step": 63169, "epoch": 1504} {"train_loss": -5.860416412353516, "global_step": 63170, "epoch": 1504} {"train_loss": -5.923041343688965, "global_step": 63171, "epoch": 1504} {"train_loss": -6.08966064453125, "global_step": 63172, "epoch": 1504} {"train_loss": -5.892210006713867, "global_step": 63173, "epoch": 1504} {"train_loss": -5.862593173980713, "global_step": 63174, "epoch": 1504} {"train_loss": -6.101808547973633, "global_step": 63175, "epoch": 1504} {"train_loss": -5.985874176025391, "global_step": 63176, "epoch": 1504} {"train_loss": -5.885548114776611, "global_step": 63177, "epoch": 1504} {"train_loss": -6.018582344055176, "global_step": 63178, "epoch": 1504} {"train_loss": -5.960657119750977, "global_step": 63179, "epoch": 1504} {"train_loss": -5.977139472961426, "global_step": 63180, "epoch": 1504} {"train_loss": -5.978079319000244, "global_step": 63181, "epoch": 1504} {"train_loss": -5.916183948516846, "global_step": 63182, "epoch": 1504} {"train_loss": -6.026332855224609, "global_step": 63183, "epoch": 1504} {"train_loss": -5.928293704986572, "global_step": 63184, "epoch": 1504} {"train_loss": -5.8864641189575195, "global_step": 63185, "epoch": 1504} {"train_loss": -6.092754364013672, "global_step": 63186, "epoch": 1504} {"train_loss": -5.9308390617370605, "global_step": 63187, "epoch": 1504} {"train_loss": -6.009975433349609, "global_step": 63188, "epoch": 1504} {"train_loss": -5.896066188812256, "global_step": 63189, "epoch": 1504} {"train_loss": -5.876260757446289, "global_step": 63190, "epoch": 1504} {"train_loss": -5.903310775756836, "global_step": 63191, "epoch": 1504} {"train_loss": -5.85919189453125, "global_step": 63192, "epoch": 1504} {"train_loss": -5.9335527420043945, "global_step": 63193, "epoch": 1504} {"train_loss": -5.720392227172852, "global_step": 63194, "epoch": 1504} {"train_loss": -5.992305755615234, "global_step": 63195, "epoch": 1504} {"train_loss": -5.946771621704102, "global_step": 63196, "epoch": 1504} {"train_loss": -5.899869918823242, "global_step": 63197, "epoch": 1504} {"train_loss": -5.904573440551758, "global_step": 63198, "epoch": 1504} {"train_loss": -5.954078197479248, "global_step": 63199, "epoch": 1504} {"train_loss": -5.895779132843018, "global_step": 63200, "epoch": 1504} {"train_loss": -6.04630184173584, "global_step": 63201, "epoch": 1504} {"train_loss": -5.915407180786133, "global_step": 63202, "epoch": 1504} {"train_loss": -5.963386058807373, "global_step": 63203, "epoch": 1504} {"train_loss": -5.9429473876953125, "global_step": 63204, "epoch": 1504} {"train_loss": -5.890110969543457, "global_step": 63205, "epoch": 1504} {"train_loss": -5.963417053222656, "global_step": 63206, "epoch": 1504} {"train_loss": -6.076257228851318, "global_step": 63207, "epoch": 1504} {"train_loss": -5.8697052001953125, "global_step": 63208, "epoch": 1504} {"train_loss": -5.939476705732799, "global_step": 63209, "epoch": 1504, "val_loss": 61204.20703125} {"train_loss": -5.9258222579956055, "global_step": 63210, "epoch": 1505} {"train_loss": -5.906495094299316, "global_step": 63211, "epoch": 1505} {"train_loss": -5.9708662033081055, "global_step": 63212, "epoch": 1505} {"train_loss": -5.981558799743652, "global_step": 63213, "epoch": 1505} {"train_loss": -5.919824600219727, "global_step": 63214, "epoch": 1505} {"train_loss": -5.90825080871582, "global_step": 63215, "epoch": 1505} {"train_loss": -6.040013313293457, "global_step": 63216, "epoch": 1505} {"train_loss": -5.776740074157715, "global_step": 63217, "epoch": 1505} {"train_loss": -5.946690559387207, "global_step": 63218, "epoch": 1505} {"train_loss": -5.938072681427002, "global_step": 63219, "epoch": 1505} {"train_loss": -5.8240065574646, "global_step": 63220, "epoch": 1505} {"train_loss": -5.83226203918457, "global_step": 63221, "epoch": 1505} {"train_loss": -5.8966779708862305, "global_step": 63222, "epoch": 1505} {"train_loss": -5.902709007263184, "global_step": 63223, "epoch": 1505} {"train_loss": -5.91121768951416, "global_step": 63224, "epoch": 1505} {"train_loss": -5.900416851043701, "global_step": 63225, "epoch": 1505} {"train_loss": -5.907037258148193, "global_step": 63226, "epoch": 1505} {"train_loss": -6.025721549987793, "global_step": 63227, "epoch": 1505} {"train_loss": -5.934072494506836, "global_step": 63228, "epoch": 1505} {"train_loss": -5.894813537597656, "global_step": 63229, "epoch": 1505} {"train_loss": -6.002472400665283, "global_step": 63230, "epoch": 1505} {"train_loss": -5.922330379486084, "global_step": 63231, "epoch": 1505} {"train_loss": -5.983466625213623, "global_step": 63232, "epoch": 1505} {"train_loss": -5.918281078338623, "global_step": 63233, "epoch": 1505} {"train_loss": -6.009476661682129, "global_step": 63234, "epoch": 1505} {"train_loss": -5.903825759887695, "global_step": 63235, "epoch": 1505} {"train_loss": -5.971761703491211, "global_step": 63236, "epoch": 1505} {"train_loss": -5.953121185302734, "global_step": 63237, "epoch": 1505} {"train_loss": -5.942643165588379, "global_step": 63238, "epoch": 1505} {"train_loss": -6.066708564758301, "global_step": 63239, "epoch": 1505} {"train_loss": -5.965268135070801, "global_step": 63240, "epoch": 1505} {"train_loss": -6.020155906677246, "global_step": 63241, "epoch": 1505} {"train_loss": -6.035600662231445, "global_step": 63242, "epoch": 1505} {"train_loss": -5.974377632141113, "global_step": 63243, "epoch": 1505} {"train_loss": -5.9935808181762695, "global_step": 63244, "epoch": 1505} {"train_loss": -5.970863342285156, "global_step": 63245, "epoch": 1505} {"train_loss": -5.926847457885742, "global_step": 63246, "epoch": 1505} {"train_loss": -5.996204853057861, "global_step": 63247, "epoch": 1505} {"train_loss": -5.8843994140625, "global_step": 63248, "epoch": 1505} {"train_loss": -5.850245475769043, "global_step": 63249, "epoch": 1505} {"train_loss": -5.963080406188965, "global_step": 63250, "epoch": 1505} {"train_loss": -5.938919135502407, "global_step": 63251, "epoch": 1505, "val_loss": 61418.859375} {"train_loss": -6.109203815460205, "global_step": 63252, "epoch": 1506} {"train_loss": -5.869675636291504, "global_step": 63253, "epoch": 1506} {"train_loss": -5.876602649688721, "global_step": 63254, "epoch": 1506} {"train_loss": -5.97530460357666, "global_step": 63255, "epoch": 1506} {"train_loss": -5.968496799468994, "global_step": 63256, "epoch": 1506} {"train_loss": -5.967599391937256, "global_step": 63257, "epoch": 1506} {"train_loss": -5.89151668548584, "global_step": 63258, "epoch": 1506} {"train_loss": -5.9639573097229, "global_step": 63259, "epoch": 1506} {"train_loss": -5.966224670410156, "global_step": 63260, "epoch": 1506} {"train_loss": -5.995760917663574, "global_step": 63261, "epoch": 1506} {"train_loss": -6.052095413208008, "global_step": 63262, "epoch": 1506} {"train_loss": -5.935883522033691, "global_step": 63263, "epoch": 1506} {"train_loss": -5.964023590087891, "global_step": 63264, "epoch": 1506} {"train_loss": -5.952115058898926, "global_step": 63265, "epoch": 1506} {"train_loss": -5.933789253234863, "global_step": 63266, "epoch": 1506} {"train_loss": -5.9721479415893555, "global_step": 63267, "epoch": 1506} {"train_loss": -5.878650665283203, "global_step": 63268, "epoch": 1506} {"train_loss": -6.011362075805664, "global_step": 63269, "epoch": 1506} {"train_loss": -5.935791969299316, "global_step": 63270, "epoch": 1506} {"train_loss": -5.933147430419922, "global_step": 63271, "epoch": 1506} {"train_loss": -5.905370235443115, "global_step": 63272, "epoch": 1506} {"train_loss": -5.8638081550598145, "global_step": 63273, "epoch": 1506} {"train_loss": -5.922641754150391, "global_step": 63274, "epoch": 1506} {"train_loss": -5.933439254760742, "global_step": 63275, "epoch": 1506} {"train_loss": -6.008591175079346, "global_step": 63276, "epoch": 1506} {"train_loss": -5.927956581115723, "global_step": 63277, "epoch": 1506} {"train_loss": -5.985260009765625, "global_step": 63278, "epoch": 1506} {"train_loss": -6.000046730041504, "global_step": 63279, "epoch": 1506} {"train_loss": -5.9081902503967285, "global_step": 63280, "epoch": 1506} {"train_loss": -5.961569309234619, "global_step": 63281, "epoch": 1506} {"train_loss": -5.95201301574707, "global_step": 63282, "epoch": 1506} {"train_loss": -5.971933364868164, "global_step": 63283, "epoch": 1506} {"train_loss": -5.962977409362793, "global_step": 63284, "epoch": 1506} {"train_loss": -5.8723344802856445, "global_step": 63285, "epoch": 1506} {"train_loss": -5.9144368171691895, "global_step": 63286, "epoch": 1506} {"train_loss": -5.952768325805664, "global_step": 63287, "epoch": 1506} {"train_loss": -5.922991752624512, "global_step": 63288, "epoch": 1506} {"train_loss": -5.961141586303711, "global_step": 63289, "epoch": 1506} {"train_loss": -5.913758277893066, "global_step": 63290, "epoch": 1506} {"train_loss": -5.977514266967773, "global_step": 63291, "epoch": 1506} {"train_loss": -5.915855407714844, "global_step": 63292, "epoch": 1506} {"train_loss": -5.948164587929135, "global_step": 63293, "epoch": 1506, "val_loss": 61328.4296875} {"train_loss": -5.869546413421631, "global_step": 63294, "epoch": 1507} {"train_loss": -5.980349063873291, "global_step": 63295, "epoch": 1507} {"train_loss": -5.925677299499512, "global_step": 63296, "epoch": 1507} {"train_loss": -6.013557434082031, "global_step": 63297, "epoch": 1507} {"train_loss": -6.037911415100098, "global_step": 63298, "epoch": 1507} {"train_loss": -5.962685585021973, "global_step": 63299, "epoch": 1507} {"train_loss": -5.915387153625488, "global_step": 63300, "epoch": 1507} {"train_loss": -6.0189313888549805, "global_step": 63301, "epoch": 1507} {"train_loss": -5.98411750793457, "global_step": 63302, "epoch": 1507} {"train_loss": -5.885587215423584, "global_step": 63303, "epoch": 1507} {"train_loss": -5.909628391265869, "global_step": 63304, "epoch": 1507} {"train_loss": -6.084196090698242, "global_step": 63305, "epoch": 1507} {"train_loss": -5.9428324699401855, "global_step": 63306, "epoch": 1507} {"train_loss": -5.881779193878174, "global_step": 63307, "epoch": 1507} {"train_loss": -6.126364231109619, "global_step": 63308, "epoch": 1507} {"train_loss": -5.808813571929932, "global_step": 63309, "epoch": 1507} {"train_loss": -5.942449569702148, "global_step": 63310, "epoch": 1507} {"train_loss": -5.997594356536865, "global_step": 63311, "epoch": 1507} {"train_loss": -6.000880241394043, "global_step": 63312, "epoch": 1507} {"train_loss": -5.932497024536133, "global_step": 63313, "epoch": 1507} {"train_loss": -5.9723358154296875, "global_step": 63314, "epoch": 1507} {"train_loss": -6.024125099182129, "global_step": 63315, "epoch": 1507} {"train_loss": -5.863405227661133, "global_step": 63316, "epoch": 1507} {"train_loss": -6.029543876647949, "global_step": 63317, "epoch": 1507} {"train_loss": -5.8810505867004395, "global_step": 63318, "epoch": 1507} {"train_loss": -5.867318630218506, "global_step": 63319, "epoch": 1507} {"train_loss": -5.969346523284912, "global_step": 63320, "epoch": 1507} {"train_loss": -5.942912578582764, "global_step": 63321, "epoch": 1507} {"train_loss": -6.001016616821289, "global_step": 63322, "epoch": 1507} {"train_loss": -5.996028423309326, "global_step": 63323, "epoch": 1507} {"train_loss": -5.799045562744141, "global_step": 63324, "epoch": 1507} {"train_loss": -6.03909158706665, "global_step": 63325, "epoch": 1507} {"train_loss": -5.792757034301758, "global_step": 63326, "epoch": 1507} {"train_loss": -5.9262542724609375, "global_step": 63327, "epoch": 1507} {"train_loss": -5.975692272186279, "global_step": 63328, "epoch": 1507} {"train_loss": -5.886625289916992, "global_step": 63329, "epoch": 1507} {"train_loss": -5.910947322845459, "global_step": 63330, "epoch": 1507} {"train_loss": -5.890705108642578, "global_step": 63331, "epoch": 1507} {"train_loss": -5.858431816101074, "global_step": 63332, "epoch": 1507} {"train_loss": -5.928053855895996, "global_step": 63333, "epoch": 1507} {"train_loss": -5.888874053955078, "global_step": 63334, "epoch": 1507} {"train_loss": -5.940676087424869, "global_step": 63335, "epoch": 1507, "val_loss": 61432.40625} {"train_loss": -6.049151420593262, "global_step": 63336, "epoch": 1508} {"train_loss": -5.861544609069824, "global_step": 63337, "epoch": 1508} {"train_loss": -5.961431503295898, "global_step": 63338, "epoch": 1508} {"train_loss": -5.967670440673828, "global_step": 63339, "epoch": 1508} {"train_loss": -5.928385257720947, "global_step": 63340, "epoch": 1508} {"train_loss": -5.945005416870117, "global_step": 63341, "epoch": 1508} {"train_loss": -6.031981468200684, "global_step": 63342, "epoch": 1508} {"train_loss": -5.858793258666992, "global_step": 63343, "epoch": 1508} {"train_loss": -5.978209018707275, "global_step": 63344, "epoch": 1508} {"train_loss": -5.9671220779418945, "global_step": 63345, "epoch": 1508} {"train_loss": -5.811199188232422, "global_step": 63346, "epoch": 1508} {"train_loss": -5.915193557739258, "global_step": 63347, "epoch": 1508} {"train_loss": -5.910159111022949, "global_step": 63348, "epoch": 1508} {"train_loss": -5.994340896606445, "global_step": 63349, "epoch": 1508} {"train_loss": -6.036242485046387, "global_step": 63350, "epoch": 1508} {"train_loss": -5.8852996826171875, "global_step": 63351, "epoch": 1508} {"train_loss": -5.951078414916992, "global_step": 63352, "epoch": 1508} {"train_loss": -5.895407676696777, "global_step": 63353, "epoch": 1508} {"train_loss": -5.899402141571045, "global_step": 63354, "epoch": 1508} {"train_loss": -5.8937201499938965, "global_step": 63355, "epoch": 1508} {"train_loss": -5.972991466522217, "global_step": 63356, "epoch": 1508} {"train_loss": -5.871642112731934, "global_step": 63357, "epoch": 1508} {"train_loss": -6.034543037414551, "global_step": 63358, "epoch": 1508} {"train_loss": -5.871428489685059, "global_step": 63359, "epoch": 1508} {"train_loss": -5.865883827209473, "global_step": 63360, "epoch": 1508} {"train_loss": -5.8673295974731445, "global_step": 63361, "epoch": 1508} {"train_loss": -5.907173156738281, "global_step": 63362, "epoch": 1508} {"train_loss": -5.9186553955078125, "global_step": 63363, "epoch": 1508} {"train_loss": -5.977028846740723, "global_step": 63364, "epoch": 1508} {"train_loss": -5.929239273071289, "global_step": 63365, "epoch": 1508} {"train_loss": -5.945524215698242, "global_step": 63366, "epoch": 1508} {"train_loss": -6.00431489944458, "global_step": 63367, "epoch": 1508} {"train_loss": -5.950719833374023, "global_step": 63368, "epoch": 1508} {"train_loss": -5.890160083770752, "global_step": 63369, "epoch": 1508} {"train_loss": -5.792156219482422, "global_step": 63370, "epoch": 1508} {"train_loss": -5.826575756072998, "global_step": 63371, "epoch": 1508} {"train_loss": -6.014400959014893, "global_step": 63372, "epoch": 1508} {"train_loss": -5.902703762054443, "global_step": 63373, "epoch": 1508} {"train_loss": -5.920374870300293, "global_step": 63374, "epoch": 1508} {"train_loss": -5.9307379722595215, "global_step": 63375, "epoch": 1508} {"train_loss": -5.834853172302246, "global_step": 63376, "epoch": 1508} {"train_loss": -5.927248091924758, "global_step": 63377, "epoch": 1508, "val_loss": 61356.15625} {"train_loss": -5.985161781311035, "global_step": 63378, "epoch": 1509} {"train_loss": -6.007988929748535, "global_step": 63379, "epoch": 1509} {"train_loss": -5.969729423522949, "global_step": 63380, "epoch": 1509} {"train_loss": -6.012371063232422, "global_step": 63381, "epoch": 1509} {"train_loss": -5.876237869262695, "global_step": 63382, "epoch": 1509} {"train_loss": -5.8855390548706055, "global_step": 63383, "epoch": 1509} {"train_loss": -5.939231872558594, "global_step": 63384, "epoch": 1509} {"train_loss": -5.946611404418945, "global_step": 63385, "epoch": 1509} {"train_loss": -5.802677631378174, "global_step": 63386, "epoch": 1509} {"train_loss": -5.831530570983887, "global_step": 63387, "epoch": 1509} {"train_loss": -5.857992172241211, "global_step": 63388, "epoch": 1509} {"train_loss": -5.914360046386719, "global_step": 63389, "epoch": 1509} {"train_loss": -5.921802520751953, "global_step": 63390, "epoch": 1509} {"train_loss": -5.879828453063965, "global_step": 63391, "epoch": 1509} {"train_loss": -5.89271354675293, "global_step": 63392, "epoch": 1509} {"train_loss": -5.861161708831787, "global_step": 63393, "epoch": 1509} {"train_loss": -6.131537914276123, "global_step": 63394, "epoch": 1509} {"train_loss": -5.858091354370117, "global_step": 63395, "epoch": 1509} {"train_loss": -6.072755813598633, "global_step": 63396, "epoch": 1509} {"train_loss": -5.981469631195068, "global_step": 63397, "epoch": 1509} {"train_loss": -5.984383583068848, "global_step": 63398, "epoch": 1509} {"train_loss": -5.969621181488037, "global_step": 63399, "epoch": 1509} {"train_loss": -5.924103260040283, "global_step": 63400, "epoch": 1509} {"train_loss": -6.095113277435303, "global_step": 63401, "epoch": 1509} {"train_loss": -5.979489326477051, "global_step": 63402, "epoch": 1509} {"train_loss": -6.027291297912598, "global_step": 63403, "epoch": 1509} {"train_loss": -5.814751625061035, "global_step": 63404, "epoch": 1509} {"train_loss": -5.95524263381958, "global_step": 63405, "epoch": 1509} {"train_loss": -6.0045013427734375, "global_step": 63406, "epoch": 1509} {"train_loss": -5.77143669128418, "global_step": 63407, "epoch": 1509} {"train_loss": -5.966737747192383, "global_step": 63408, "epoch": 1509} {"train_loss": -5.958827495574951, "global_step": 63409, "epoch": 1509} {"train_loss": -5.825446128845215, "global_step": 63410, "epoch": 1509} {"train_loss": -6.0451459884643555, "global_step": 63411, "epoch": 1509} {"train_loss": -6.011519432067871, "global_step": 63412, "epoch": 1509} {"train_loss": -6.0619306564331055, "global_step": 63413, "epoch": 1509} {"train_loss": -5.955386161804199, "global_step": 63414, "epoch": 1509} {"train_loss": -6.121218681335449, "global_step": 63415, "epoch": 1509} {"train_loss": -5.981777191162109, "global_step": 63416, "epoch": 1509} {"train_loss": -6.037469863891602, "global_step": 63417, "epoch": 1509} {"train_loss": -6.015528678894043, "global_step": 63418, "epoch": 1509} {"train_loss": -5.954982042312622, "global_step": 63419, "epoch": 1509, "val_loss": 61398.734375} {"train_loss": -6.067130088806152, "global_step": 63420, "epoch": 1510} {"train_loss": -5.897017478942871, "global_step": 63421, "epoch": 1510} {"train_loss": -6.010872840881348, "global_step": 63422, "epoch": 1510} {"train_loss": -5.980905532836914, "global_step": 63423, "epoch": 1510} {"train_loss": -6.090022563934326, "global_step": 63424, "epoch": 1510} {"train_loss": -5.972210884094238, "global_step": 63425, "epoch": 1510} {"train_loss": -6.0450849533081055, "global_step": 63426, "epoch": 1510} {"train_loss": -5.938671112060547, "global_step": 63427, "epoch": 1510} {"train_loss": -6.015531063079834, "global_step": 63428, "epoch": 1510} {"train_loss": -5.997368812561035, "global_step": 63429, "epoch": 1510} {"train_loss": -6.026487827301025, "global_step": 63430, "epoch": 1510} {"train_loss": -6.024614334106445, "global_step": 63431, "epoch": 1510} {"train_loss": -6.051753044128418, "global_step": 63432, "epoch": 1510} {"train_loss": -5.906041145324707, "global_step": 63433, "epoch": 1510} {"train_loss": -6.006461143493652, "global_step": 63434, "epoch": 1510} {"train_loss": -6.177692413330078, "global_step": 63435, "epoch": 1510} {"train_loss": -5.991352558135986, "global_step": 63436, "epoch": 1510} {"train_loss": -6.066383361816406, "global_step": 63437, "epoch": 1510} {"train_loss": -5.987383842468262, "global_step": 63438, "epoch": 1510} {"train_loss": -5.771846771240234, "global_step": 63439, "epoch": 1510} {"train_loss": -5.981350421905518, "global_step": 63440, "epoch": 1510} {"train_loss": -5.934340476989746, "global_step": 63441, "epoch": 1510} {"train_loss": -5.911154747009277, "global_step": 63442, "epoch": 1510} {"train_loss": -5.958827972412109, "global_step": 63443, "epoch": 1510} {"train_loss": -5.884993553161621, "global_step": 63444, "epoch": 1510} {"train_loss": -5.999539375305176, "global_step": 63445, "epoch": 1510} {"train_loss": -5.915674209594727, "global_step": 63446, "epoch": 1510} {"train_loss": -5.919070243835449, "global_step": 63447, "epoch": 1510} {"train_loss": -5.874322891235352, "global_step": 63448, "epoch": 1510} {"train_loss": -5.969972610473633, "global_step": 63449, "epoch": 1510} {"train_loss": -5.94988489151001, "global_step": 63450, "epoch": 1510} {"train_loss": -5.977251052856445, "global_step": 63451, "epoch": 1510} {"train_loss": -5.923617362976074, "global_step": 63452, "epoch": 1510} {"train_loss": -5.8129167556762695, "global_step": 63453, "epoch": 1510} {"train_loss": -5.888247489929199, "global_step": 63454, "epoch": 1510} {"train_loss": -6.080410957336426, "global_step": 63455, "epoch": 1510} {"train_loss": -5.828454971313477, "global_step": 63456, "epoch": 1510} {"train_loss": -5.974928379058838, "global_step": 63457, "epoch": 1510} {"train_loss": -5.90872859954834, "global_step": 63458, "epoch": 1510} {"train_loss": -6.021758079528809, "global_step": 63459, "epoch": 1510} {"train_loss": -5.910465240478516, "global_step": 63460, "epoch": 1510} {"train_loss": -5.967151403427124, "global_step": 63461, "epoch": 1510, "val_loss": 61475.89453125} {"train_loss": -6.038022994995117, "global_step": 63462, "epoch": 1511} {"train_loss": -5.998936653137207, "global_step": 63463, "epoch": 1511} {"train_loss": -6.070338726043701, "global_step": 63464, "epoch": 1511} {"train_loss": -5.95728874206543, "global_step": 63465, "epoch": 1511} {"train_loss": -5.951593399047852, "global_step": 63466, "epoch": 1511} {"train_loss": -6.004768371582031, "global_step": 63467, "epoch": 1511} {"train_loss": -6.00117301940918, "global_step": 63468, "epoch": 1511} {"train_loss": -5.750970840454102, "global_step": 63469, "epoch": 1511} {"train_loss": -5.936055660247803, "global_step": 63470, "epoch": 1511} {"train_loss": -5.942594528198242, "global_step": 63471, "epoch": 1511} {"train_loss": -5.850964546203613, "global_step": 63472, "epoch": 1511} {"train_loss": -6.047204494476318, "global_step": 63473, "epoch": 1511} {"train_loss": -5.895984649658203, "global_step": 63474, "epoch": 1511} {"train_loss": -5.954825401306152, "global_step": 63475, "epoch": 1511} {"train_loss": -5.9179182052612305, "global_step": 63476, "epoch": 1511} {"train_loss": -5.969023704528809, "global_step": 63477, "epoch": 1511} {"train_loss": -5.90757417678833, "global_step": 63478, "epoch": 1511} {"train_loss": -5.998404502868652, "global_step": 63479, "epoch": 1511} {"train_loss": -5.914178848266602, "global_step": 63480, "epoch": 1511} {"train_loss": -6.069650173187256, "global_step": 63481, "epoch": 1511} {"train_loss": -5.875761032104492, "global_step": 63482, "epoch": 1511} {"train_loss": -5.896537780761719, "global_step": 63483, "epoch": 1511} {"train_loss": -5.92466402053833, "global_step": 63484, "epoch": 1511} {"train_loss": -5.815858840942383, "global_step": 63485, "epoch": 1511} {"train_loss": -6.031933307647705, "global_step": 63486, "epoch": 1511} {"train_loss": -5.892216682434082, "global_step": 63487, "epoch": 1511} {"train_loss": -5.8487548828125, "global_step": 63488, "epoch": 1511} {"train_loss": -6.019248008728027, "global_step": 63489, "epoch": 1511} {"train_loss": -5.842094421386719, "global_step": 63490, "epoch": 1511} {"train_loss": -5.919858932495117, "global_step": 63491, "epoch": 1511} {"train_loss": -5.922240257263184, "global_step": 63492, "epoch": 1511} {"train_loss": -5.923922061920166, "global_step": 63493, "epoch": 1511} {"train_loss": -5.984061241149902, "global_step": 63494, "epoch": 1511} {"train_loss": -5.9633870124816895, "global_step": 63495, "epoch": 1511} {"train_loss": -5.995488166809082, "global_step": 63496, "epoch": 1511} {"train_loss": -5.9379096031188965, "global_step": 63497, "epoch": 1511} {"train_loss": -6.066988945007324, "global_step": 63498, "epoch": 1511} {"train_loss": -5.904807090759277, "global_step": 63499, "epoch": 1511} {"train_loss": -5.981330394744873, "global_step": 63500, "epoch": 1511} {"train_loss": -5.9593281745910645, "global_step": 63501, "epoch": 1511} {"train_loss": -5.868282318115234, "global_step": 63502, "epoch": 1511} {"train_loss": -5.942846468516758, "global_step": 63503, "epoch": 1511, "val_loss": 61356.890625} {"train_loss": -6.017521858215332, "global_step": 63504, "epoch": 1512} {"train_loss": -6.070350646972656, "global_step": 63505, "epoch": 1512} {"train_loss": -5.950565338134766, "global_step": 63506, "epoch": 1512} {"train_loss": -5.830253601074219, "global_step": 63507, "epoch": 1512} {"train_loss": -5.878082275390625, "global_step": 63508, "epoch": 1512} {"train_loss": -5.997296333312988, "global_step": 63509, "epoch": 1512} {"train_loss": -5.880017280578613, "global_step": 63510, "epoch": 1512} {"train_loss": -5.996294021606445, "global_step": 63511, "epoch": 1512} {"train_loss": -6.079894065856934, "global_step": 63512, "epoch": 1512} {"train_loss": -5.946928977966309, "global_step": 63513, "epoch": 1512} {"train_loss": -5.932826995849609, "global_step": 63514, "epoch": 1512} {"train_loss": -5.90650749206543, "global_step": 63515, "epoch": 1512} {"train_loss": -5.937046051025391, "global_step": 63516, "epoch": 1512} {"train_loss": -5.890610218048096, "global_step": 63517, "epoch": 1512} {"train_loss": -5.9611616134643555, "global_step": 63518, "epoch": 1512} {"train_loss": -5.924201011657715, "global_step": 63519, "epoch": 1512} {"train_loss": -6.006744861602783, "global_step": 63520, "epoch": 1512} {"train_loss": -5.91351318359375, "global_step": 63521, "epoch": 1512} {"train_loss": -6.032707214355469, "global_step": 63522, "epoch": 1512} {"train_loss": -5.966456413269043, "global_step": 63523, "epoch": 1512} {"train_loss": -5.849907875061035, "global_step": 63524, "epoch": 1512} {"train_loss": -5.9871602058410645, "global_step": 63525, "epoch": 1512} {"train_loss": -6.0435051918029785, "global_step": 63526, "epoch": 1512} {"train_loss": -5.861149311065674, "global_step": 63527, "epoch": 1512} {"train_loss": -6.039700508117676, "global_step": 63528, "epoch": 1512} {"train_loss": -5.941160202026367, "global_step": 63529, "epoch": 1512} {"train_loss": -6.0066118240356445, "global_step": 63530, "epoch": 1512} {"train_loss": -5.9642839431762695, "global_step": 63531, "epoch": 1512} {"train_loss": -5.829407691955566, "global_step": 63532, "epoch": 1512} {"train_loss": -5.905731201171875, "global_step": 63533, "epoch": 1512} {"train_loss": -5.869852066040039, "global_step": 63534, "epoch": 1512} {"train_loss": -5.905744552612305, "global_step": 63535, "epoch": 1512} {"train_loss": -5.870229721069336, "global_step": 63536, "epoch": 1512} {"train_loss": -5.915323257446289, "global_step": 63537, "epoch": 1512} {"train_loss": -5.877898216247559, "global_step": 63538, "epoch": 1512} {"train_loss": -5.98277473449707, "global_step": 63539, "epoch": 1512} {"train_loss": -5.964547634124756, "global_step": 63540, "epoch": 1512} {"train_loss": -5.924774169921875, "global_step": 63541, "epoch": 1512} {"train_loss": -6.0176615715026855, "global_step": 63542, "epoch": 1512} {"train_loss": -5.972365379333496, "global_step": 63543, "epoch": 1512} {"train_loss": -5.876326084136963, "global_step": 63544, "epoch": 1512} {"train_loss": -5.945549136116391, "global_step": 63545, "epoch": 1512, "val_loss": 61435.1875} {"train_loss": -5.840134620666504, "global_step": 63546, "epoch": 1513} {"train_loss": -5.994170188903809, "global_step": 63547, "epoch": 1513} {"train_loss": -6.1121392250061035, "global_step": 63548, "epoch": 1513} {"train_loss": -5.944406509399414, "global_step": 63549, "epoch": 1513} {"train_loss": -5.945338726043701, "global_step": 63550, "epoch": 1513} {"train_loss": -5.973076820373535, "global_step": 63551, "epoch": 1513} {"train_loss": -5.911388397216797, "global_step": 63552, "epoch": 1513} {"train_loss": -5.814297676086426, "global_step": 63553, "epoch": 1513} {"train_loss": -6.005661487579346, "global_step": 63554, "epoch": 1513} {"train_loss": -5.9434309005737305, "global_step": 63555, "epoch": 1513} {"train_loss": -5.9865288734436035, "global_step": 63556, "epoch": 1513} {"train_loss": -5.997241020202637, "global_step": 63557, "epoch": 1513} {"train_loss": -5.8235673904418945, "global_step": 63558, "epoch": 1513} {"train_loss": -5.9189534187316895, "global_step": 63559, "epoch": 1513} {"train_loss": -5.987054347991943, "global_step": 63560, "epoch": 1513} {"train_loss": -5.925365447998047, "global_step": 63561, "epoch": 1513} {"train_loss": -5.885003089904785, "global_step": 63562, "epoch": 1513} {"train_loss": -6.035438060760498, "global_step": 63563, "epoch": 1513} {"train_loss": -6.048633575439453, "global_step": 63564, "epoch": 1513} {"train_loss": -5.92718505859375, "global_step": 63565, "epoch": 1513} {"train_loss": -5.964104175567627, "global_step": 63566, "epoch": 1513} {"train_loss": -5.847834587097168, "global_step": 63567, "epoch": 1513} {"train_loss": -5.957523345947266, "global_step": 63568, "epoch": 1513} {"train_loss": -5.829998970031738, "global_step": 63569, "epoch": 1513} {"train_loss": -6.017763137817383, "global_step": 63570, "epoch": 1513} {"train_loss": -5.839573383331299, "global_step": 63571, "epoch": 1513} {"train_loss": -5.94809103012085, "global_step": 63572, "epoch": 1513} {"train_loss": -5.998627662658691, "global_step": 63573, "epoch": 1513} {"train_loss": -5.950203895568848, "global_step": 63574, "epoch": 1513} {"train_loss": -5.9818572998046875, "global_step": 63575, "epoch": 1513} {"train_loss": -5.92819356918335, "global_step": 63576, "epoch": 1513} {"train_loss": -5.85238790512085, "global_step": 63577, "epoch": 1513} {"train_loss": -5.918201446533203, "global_step": 63578, "epoch": 1513} {"train_loss": -5.856427192687988, "global_step": 63579, "epoch": 1513} {"train_loss": -5.926492214202881, "global_step": 63580, "epoch": 1513} {"train_loss": -5.861264228820801, "global_step": 63581, "epoch": 1513} {"train_loss": -5.892936706542969, "global_step": 63582, "epoch": 1513} {"train_loss": -5.924829006195068, "global_step": 63583, "epoch": 1513} {"train_loss": -5.93147611618042, "global_step": 63584, "epoch": 1513} {"train_loss": -5.957770347595215, "global_step": 63585, "epoch": 1513} {"train_loss": -5.738957405090332, "global_step": 63586, "epoch": 1513} {"train_loss": -5.929861409323556, "global_step": 63587, "epoch": 1513, "val_loss": 61652.13671875} {"train_loss": -5.90557861328125, "global_step": 63588, "epoch": 1514} {"train_loss": -5.774820804595947, "global_step": 63589, "epoch": 1514} {"train_loss": -5.9303669929504395, "global_step": 63590, "epoch": 1514} {"train_loss": -5.713545799255371, "global_step": 63591, "epoch": 1514} {"train_loss": -6.004731178283691, "global_step": 63592, "epoch": 1514} {"train_loss": -5.800494194030762, "global_step": 63593, "epoch": 1514} {"train_loss": -5.9286699295043945, "global_step": 63594, "epoch": 1514} {"train_loss": -5.866039752960205, "global_step": 63595, "epoch": 1514} {"train_loss": -5.784625053405762, "global_step": 63596, "epoch": 1514} {"train_loss": -5.974979400634766, "global_step": 63597, "epoch": 1514} {"train_loss": -5.865388870239258, "global_step": 63598, "epoch": 1514} {"train_loss": -5.968682289123535, "global_step": 63599, "epoch": 1514} {"train_loss": -5.91502046585083, "global_step": 63600, "epoch": 1514} {"train_loss": -6.055582046508789, "global_step": 63601, "epoch": 1514} {"train_loss": -5.895354270935059, "global_step": 63602, "epoch": 1514} {"train_loss": -5.981952667236328, "global_step": 63603, "epoch": 1514} {"train_loss": -5.919045448303223, "global_step": 63604, "epoch": 1514} {"train_loss": -5.98123836517334, "global_step": 63605, "epoch": 1514} {"train_loss": -5.979389667510986, "global_step": 63606, "epoch": 1514} {"train_loss": -5.8614182472229, "global_step": 63607, "epoch": 1514} {"train_loss": -6.096865653991699, "global_step": 63608, "epoch": 1514} {"train_loss": -6.093422889709473, "global_step": 63609, "epoch": 1514} {"train_loss": -5.898768424987793, "global_step": 63610, "epoch": 1514} {"train_loss": -5.987163543701172, "global_step": 63611, "epoch": 1514} {"train_loss": -5.955745697021484, "global_step": 63612, "epoch": 1514} {"train_loss": -5.931319713592529, "global_step": 63613, "epoch": 1514} {"train_loss": -6.094672679901123, "global_step": 63614, "epoch": 1514} {"train_loss": -6.029337406158447, "global_step": 63615, "epoch": 1514} {"train_loss": -5.942936420440674, "global_step": 63616, "epoch": 1514} {"train_loss": -5.980165004730225, "global_step": 63617, "epoch": 1514} {"train_loss": -5.862637042999268, "global_step": 63618, "epoch": 1514} {"train_loss": -5.913114547729492, "global_step": 63619, "epoch": 1514} {"train_loss": -5.776444435119629, "global_step": 63620, "epoch": 1514} {"train_loss": -6.0326690673828125, "global_step": 63621, "epoch": 1514} {"train_loss": -5.914360523223877, "global_step": 63622, "epoch": 1514} {"train_loss": -5.948125839233398, "global_step": 63623, "epoch": 1514} {"train_loss": -5.884092330932617, "global_step": 63624, "epoch": 1514} {"train_loss": -5.938981056213379, "global_step": 63625, "epoch": 1514} {"train_loss": -5.961212158203125, "global_step": 63626, "epoch": 1514} {"train_loss": -5.953365325927734, "global_step": 63627, "epoch": 1514} {"train_loss": -5.913344383239746, "global_step": 63628, "epoch": 1514} {"train_loss": -5.932152850287301, "global_step": 63629, "epoch": 1514, "val_loss": 61441.65234375} {"train_loss": -5.887438774108887, "global_step": 63630, "epoch": 1515} {"train_loss": -5.94211483001709, "global_step": 63631, "epoch": 1515} {"train_loss": -6.058102607727051, "global_step": 63632, "epoch": 1515} {"train_loss": -5.923369407653809, "global_step": 63633, "epoch": 1515} {"train_loss": -5.954305171966553, "global_step": 63634, "epoch": 1515} {"train_loss": -5.975550651550293, "global_step": 63635, "epoch": 1515} {"train_loss": -5.989536762237549, "global_step": 63636, "epoch": 1515} {"train_loss": -5.967794895172119, "global_step": 63637, "epoch": 1515} {"train_loss": -6.0179057121276855, "global_step": 63638, "epoch": 1515} {"train_loss": -6.090017795562744, "global_step": 63639, "epoch": 1515} {"train_loss": -5.817534923553467, "global_step": 63640, "epoch": 1515} {"train_loss": -5.913246154785156, "global_step": 63641, "epoch": 1515} {"train_loss": -6.026202201843262, "global_step": 63642, "epoch": 1515} {"train_loss": -5.93752384185791, "global_step": 63643, "epoch": 1515} {"train_loss": -5.905879974365234, "global_step": 63644, "epoch": 1515} {"train_loss": -5.9266276359558105, "global_step": 63645, "epoch": 1515} {"train_loss": -5.954165458679199, "global_step": 63646, "epoch": 1515} {"train_loss": -5.9633283615112305, "global_step": 63647, "epoch": 1515} {"train_loss": -5.90677547454834, "global_step": 63648, "epoch": 1515} {"train_loss": -5.921236515045166, "global_step": 63649, "epoch": 1515} {"train_loss": -6.003999710083008, "global_step": 63650, "epoch": 1515} {"train_loss": -5.8928728103637695, "global_step": 63651, "epoch": 1515} {"train_loss": -5.928396701812744, "global_step": 63652, "epoch": 1515} {"train_loss": -5.999858856201172, "global_step": 63653, "epoch": 1515} {"train_loss": -6.018083572387695, "global_step": 63654, "epoch": 1515} {"train_loss": -6.0604095458984375, "global_step": 63655, "epoch": 1515} {"train_loss": -5.95646333694458, "global_step": 63656, "epoch": 1515} {"train_loss": -5.945648193359375, "global_step": 63657, "epoch": 1515} {"train_loss": -5.920205593109131, "global_step": 63658, "epoch": 1515} {"train_loss": -5.916755676269531, "global_step": 63659, "epoch": 1515} {"train_loss": -5.951292037963867, "global_step": 63660, "epoch": 1515} {"train_loss": -5.878475189208984, "global_step": 63661, "epoch": 1515} {"train_loss": -5.913991928100586, "global_step": 63662, "epoch": 1515} {"train_loss": -6.062519550323486, "global_step": 63663, "epoch": 1515} {"train_loss": -5.996781349182129, "global_step": 63664, "epoch": 1515} {"train_loss": -6.06231689453125, "global_step": 63665, "epoch": 1515} {"train_loss": -5.96208381652832, "global_step": 63666, "epoch": 1515} {"train_loss": -5.827922344207764, "global_step": 63667, "epoch": 1515} {"train_loss": -5.891443252563477, "global_step": 63668, "epoch": 1515} {"train_loss": -5.846055030822754, "global_step": 63669, "epoch": 1515} {"train_loss": -5.917688846588135, "global_step": 63670, "epoch": 1515} {"train_loss": -5.950980583826701, "global_step": 63671, "epoch": 1515, "val_loss": 61393.60546875} {"train_loss": -5.970152378082275, "global_step": 63672, "epoch": 1516} {"train_loss": -5.960726737976074, "global_step": 63673, "epoch": 1516} {"train_loss": -5.991741180419922, "global_step": 63674, "epoch": 1516} {"train_loss": -5.898641586303711, "global_step": 63675, "epoch": 1516} {"train_loss": -5.987752437591553, "global_step": 63676, "epoch": 1516} {"train_loss": -5.959131717681885, "global_step": 63677, "epoch": 1516} {"train_loss": -6.031433582305908, "global_step": 63678, "epoch": 1516} {"train_loss": -6.065021514892578, "global_step": 63679, "epoch": 1516} {"train_loss": -5.9215898513793945, "global_step": 63680, "epoch": 1516} {"train_loss": -5.870546340942383, "global_step": 63681, "epoch": 1516} {"train_loss": -5.926432132720947, "global_step": 63682, "epoch": 1516} {"train_loss": -5.915622711181641, "global_step": 63683, "epoch": 1516} {"train_loss": -5.972336769104004, "global_step": 63684, "epoch": 1516} {"train_loss": -5.823410511016846, "global_step": 63685, "epoch": 1516} {"train_loss": -6.040792465209961, "global_step": 63686, "epoch": 1516} {"train_loss": -5.995034217834473, "global_step": 63687, "epoch": 1516} {"train_loss": -5.784812927246094, "global_step": 63688, "epoch": 1516} {"train_loss": -5.998372554779053, "global_step": 63689, "epoch": 1516} {"train_loss": -5.834102630615234, "global_step": 63690, "epoch": 1516} {"train_loss": -5.9037652015686035, "global_step": 63691, "epoch": 1516} {"train_loss": -5.942852020263672, "global_step": 63692, "epoch": 1516} {"train_loss": -5.690609931945801, "global_step": 63693, "epoch": 1516} {"train_loss": -5.841155052185059, "global_step": 63694, "epoch": 1516} {"train_loss": -5.888810634613037, "global_step": 63695, "epoch": 1516} {"train_loss": -5.829582214355469, "global_step": 63696, "epoch": 1516} {"train_loss": -5.978862762451172, "global_step": 63697, "epoch": 1516} {"train_loss": -5.942164421081543, "global_step": 63698, "epoch": 1516} {"train_loss": -6.036116600036621, "global_step": 63699, "epoch": 1516} {"train_loss": -5.890345573425293, "global_step": 63700, "epoch": 1516} {"train_loss": -5.86454963684082, "global_step": 63701, "epoch": 1516} {"train_loss": -6.024119853973389, "global_step": 63702, "epoch": 1516} {"train_loss": -5.872712135314941, "global_step": 63703, "epoch": 1516} {"train_loss": -6.054660797119141, "global_step": 63704, "epoch": 1516} {"train_loss": -5.907670497894287, "global_step": 63705, "epoch": 1516} {"train_loss": -5.804262161254883, "global_step": 63706, "epoch": 1516} {"train_loss": -5.85107421875, "global_step": 63707, "epoch": 1516} {"train_loss": -5.881136417388916, "global_step": 63708, "epoch": 1516} {"train_loss": -6.008059024810791, "global_step": 63709, "epoch": 1516} {"train_loss": -5.871240615844727, "global_step": 63710, "epoch": 1516} {"train_loss": -5.943855285644531, "global_step": 63711, "epoch": 1516} {"train_loss": -5.833498001098633, "global_step": 63712, "epoch": 1516} {"train_loss": -5.924577327001662, "global_step": 63713, "epoch": 1516, "val_loss": 61387.84375} {"train_loss": -5.908904075622559, "global_step": 63714, "epoch": 1517} {"train_loss": -5.958855628967285, "global_step": 63715, "epoch": 1517} {"train_loss": -6.1125407218933105, "global_step": 63716, "epoch": 1517} {"train_loss": -5.817562103271484, "global_step": 63717, "epoch": 1517} {"train_loss": -5.958983421325684, "global_step": 63718, "epoch": 1517} {"train_loss": -6.032744884490967, "global_step": 63719, "epoch": 1517} {"train_loss": -5.911787986755371, "global_step": 63720, "epoch": 1517} {"train_loss": -5.925951957702637, "global_step": 63721, "epoch": 1517} {"train_loss": -5.936522483825684, "global_step": 63722, "epoch": 1517} {"train_loss": -6.057009696960449, "global_step": 63723, "epoch": 1517} {"train_loss": -5.933125019073486, "global_step": 63724, "epoch": 1517} {"train_loss": -5.8830718994140625, "global_step": 63725, "epoch": 1517} {"train_loss": -6.026863098144531, "global_step": 63726, "epoch": 1517} {"train_loss": -5.930394172668457, "global_step": 63727, "epoch": 1517} {"train_loss": -6.007056713104248, "global_step": 63728, "epoch": 1517} {"train_loss": -6.053897857666016, "global_step": 63729, "epoch": 1517} {"train_loss": -5.807703971862793, "global_step": 63730, "epoch": 1517} {"train_loss": -6.015201568603516, "global_step": 63731, "epoch": 1517} {"train_loss": -5.848997592926025, "global_step": 63732, "epoch": 1517} {"train_loss": -5.925927639007568, "global_step": 63733, "epoch": 1517} {"train_loss": -5.876863479614258, "global_step": 63734, "epoch": 1517} {"train_loss": -5.963029384613037, "global_step": 63735, "epoch": 1517} {"train_loss": -5.892051696777344, "global_step": 63736, "epoch": 1517} {"train_loss": -5.838919639587402, "global_step": 63737, "epoch": 1517} {"train_loss": -5.986257553100586, "global_step": 63738, "epoch": 1517} {"train_loss": -5.87816858291626, "global_step": 63739, "epoch": 1517} {"train_loss": -5.952088356018066, "global_step": 63740, "epoch": 1517} {"train_loss": -5.9192795753479, "global_step": 63741, "epoch": 1517} {"train_loss": -6.000150680541992, "global_step": 63742, "epoch": 1517} {"train_loss": -5.985491752624512, "global_step": 63743, "epoch": 1517} {"train_loss": -5.802211284637451, "global_step": 63744, "epoch": 1517} {"train_loss": -5.940910339355469, "global_step": 63745, "epoch": 1517} {"train_loss": -5.903758525848389, "global_step": 63746, "epoch": 1517} {"train_loss": -5.951343059539795, "global_step": 63747, "epoch": 1517} {"train_loss": -5.9563398361206055, "global_step": 63748, "epoch": 1517} {"train_loss": -5.971541881561279, "global_step": 63749, "epoch": 1517} {"train_loss": -6.002416133880615, "global_step": 63750, "epoch": 1517} {"train_loss": -5.9814605712890625, "global_step": 63751, "epoch": 1517} {"train_loss": -5.927925109863281, "global_step": 63752, "epoch": 1517} {"train_loss": -5.934754371643066, "global_step": 63753, "epoch": 1517} {"train_loss": -5.911827564239502, "global_step": 63754, "epoch": 1517} {"train_loss": -5.939974694024949, "global_step": 63755, "epoch": 1517, "val_loss": 61198.6796875} {"train_loss": -6.028433799743652, "global_step": 63756, "epoch": 1518} {"train_loss": -5.94273567199707, "global_step": 63757, "epoch": 1518} {"train_loss": -5.870857238769531, "global_step": 63758, "epoch": 1518} {"train_loss": -6.100786209106445, "global_step": 63759, "epoch": 1518} {"train_loss": -5.892721176147461, "global_step": 63760, "epoch": 1518} {"train_loss": -5.978499412536621, "global_step": 63761, "epoch": 1518} {"train_loss": -6.093705177307129, "global_step": 63762, "epoch": 1518} {"train_loss": -5.930042266845703, "global_step": 63763, "epoch": 1518} {"train_loss": -5.91021728515625, "global_step": 63764, "epoch": 1518} {"train_loss": -5.967294216156006, "global_step": 63765, "epoch": 1518} {"train_loss": -5.950328826904297, "global_step": 63766, "epoch": 1518} {"train_loss": -5.933226585388184, "global_step": 63767, "epoch": 1518} {"train_loss": -5.965348243713379, "global_step": 63768, "epoch": 1518} {"train_loss": -5.948326587677002, "global_step": 63769, "epoch": 1518} {"train_loss": -5.819364547729492, "global_step": 63770, "epoch": 1518} {"train_loss": -5.935773849487305, "global_step": 63771, "epoch": 1518} {"train_loss": -5.907380104064941, "global_step": 63772, "epoch": 1518} {"train_loss": -5.951128959655762, "global_step": 63773, "epoch": 1518} {"train_loss": -6.061794281005859, "global_step": 63774, "epoch": 1518} {"train_loss": -5.843245506286621, "global_step": 63775, "epoch": 1518} {"train_loss": -5.8262786865234375, "global_step": 63776, "epoch": 1518} {"train_loss": -5.7395148277282715, "global_step": 63777, "epoch": 1518} {"train_loss": -5.915738105773926, "global_step": 63778, "epoch": 1518} {"train_loss": -5.928153991699219, "global_step": 63779, "epoch": 1518} {"train_loss": -5.840008735656738, "global_step": 63780, "epoch": 1518} {"train_loss": -5.84760856628418, "global_step": 63781, "epoch": 1518} {"train_loss": -5.930290699005127, "global_step": 63782, "epoch": 1518} {"train_loss": -5.883143901824951, "global_step": 63783, "epoch": 1518} {"train_loss": -5.902728080749512, "global_step": 63784, "epoch": 1518} {"train_loss": -5.8941755294799805, "global_step": 63785, "epoch": 1518} {"train_loss": -5.943393707275391, "global_step": 63786, "epoch": 1518} {"train_loss": -6.076396942138672, "global_step": 63787, "epoch": 1518} {"train_loss": -5.9282331466674805, "global_step": 63788, "epoch": 1518} {"train_loss": -6.082821846008301, "global_step": 63789, "epoch": 1518} {"train_loss": -5.873183727264404, "global_step": 63790, "epoch": 1518} {"train_loss": -5.997840881347656, "global_step": 63791, "epoch": 1518} {"train_loss": -5.904682159423828, "global_step": 63792, "epoch": 1518} {"train_loss": -5.939145088195801, "global_step": 63793, "epoch": 1518} {"train_loss": -5.946772575378418, "global_step": 63794, "epoch": 1518} {"train_loss": -5.935878753662109, "global_step": 63795, "epoch": 1518} {"train_loss": -5.966037273406982, "global_step": 63796, "epoch": 1518} {"train_loss": -5.937421389988491, "global_step": 63797, "epoch": 1518, "val_loss": 61485.69921875} {"train_loss": -5.989023685455322, "global_step": 63798, "epoch": 1519} {"train_loss": -5.913878917694092, "global_step": 63799, "epoch": 1519} {"train_loss": -5.9311113357543945, "global_step": 63800, "epoch": 1519} {"train_loss": -5.948448181152344, "global_step": 63801, "epoch": 1519} {"train_loss": -5.990996837615967, "global_step": 63802, "epoch": 1519} {"train_loss": -5.860302925109863, "global_step": 63803, "epoch": 1519} {"train_loss": -6.078899383544922, "global_step": 63804, "epoch": 1519} {"train_loss": -5.78305196762085, "global_step": 63805, "epoch": 1519} {"train_loss": -5.959785461425781, "global_step": 63806, "epoch": 1519} {"train_loss": -5.9500932693481445, "global_step": 63807, "epoch": 1519} {"train_loss": -6.046013832092285, "global_step": 63808, "epoch": 1519} {"train_loss": -5.905076503753662, "global_step": 63809, "epoch": 1519} {"train_loss": -6.0135297775268555, "global_step": 63810, "epoch": 1519} {"train_loss": -5.910208225250244, "global_step": 63811, "epoch": 1519} {"train_loss": -5.950869560241699, "global_step": 63812, "epoch": 1519} {"train_loss": -5.93964147567749, "global_step": 63813, "epoch": 1519} {"train_loss": -6.06011962890625, "global_step": 63814, "epoch": 1519} {"train_loss": -5.926339149475098, "global_step": 63815, "epoch": 1519} {"train_loss": -5.887167453765869, "global_step": 63816, "epoch": 1519} {"train_loss": -5.843451499938965, "global_step": 63817, "epoch": 1519} {"train_loss": -5.804893493652344, "global_step": 63818, "epoch": 1519} {"train_loss": -5.880744934082031, "global_step": 63819, "epoch": 1519} {"train_loss": -5.8199639320373535, "global_step": 63820, "epoch": 1519} {"train_loss": -5.995665073394775, "global_step": 63821, "epoch": 1519} {"train_loss": -5.8628387451171875, "global_step": 63822, "epoch": 1519} {"train_loss": -5.972902297973633, "global_step": 63823, "epoch": 1519} {"train_loss": -5.834628105163574, "global_step": 63824, "epoch": 1519} {"train_loss": -5.989894390106201, "global_step": 63825, "epoch": 1519} {"train_loss": -5.982295513153076, "global_step": 63826, "epoch": 1519} {"train_loss": -5.939896583557129, "global_step": 63827, "epoch": 1519} {"train_loss": -6.094143867492676, "global_step": 63828, "epoch": 1519} {"train_loss": -5.9660491943359375, "global_step": 63829, "epoch": 1519} {"train_loss": -5.98331356048584, "global_step": 63830, "epoch": 1519} {"train_loss": -5.938839912414551, "global_step": 63831, "epoch": 1519} {"train_loss": -5.937438011169434, "global_step": 63832, "epoch": 1519} {"train_loss": -5.991171836853027, "global_step": 63833, "epoch": 1519} {"train_loss": -5.954020977020264, "global_step": 63834, "epoch": 1519} {"train_loss": -6.032090187072754, "global_step": 63835, "epoch": 1519} {"train_loss": -5.932171821594238, "global_step": 63836, "epoch": 1519} {"train_loss": -5.9093427658081055, "global_step": 63837, "epoch": 1519} {"train_loss": -5.956732749938965, "global_step": 63838, "epoch": 1519} {"train_loss": -5.948275429861886, "global_step": 63839, "epoch": 1519, "val_loss": 61263.1328125} {"train_loss": -6.113807678222656, "global_step": 63840, "epoch": 1520} {"train_loss": -5.771378040313721, "global_step": 63841, "epoch": 1520} {"train_loss": -5.984461307525635, "global_step": 63842, "epoch": 1520} {"train_loss": -5.980321407318115, "global_step": 63843, "epoch": 1520} {"train_loss": -5.905592918395996, "global_step": 63844, "epoch": 1520} {"train_loss": -5.98829460144043, "global_step": 63845, "epoch": 1520} {"train_loss": -5.945952415466309, "global_step": 63846, "epoch": 1520} {"train_loss": -5.928433418273926, "global_step": 63847, "epoch": 1520} {"train_loss": -6.010440826416016, "global_step": 63848, "epoch": 1520} {"train_loss": -6.027176856994629, "global_step": 63849, "epoch": 1520} {"train_loss": -5.995639324188232, "global_step": 63850, "epoch": 1520} {"train_loss": -5.935733795166016, "global_step": 63851, "epoch": 1520} {"train_loss": -5.909310340881348, "global_step": 63852, "epoch": 1520} {"train_loss": -5.931229114532471, "global_step": 63853, "epoch": 1520} {"train_loss": -6.017923831939697, "global_step": 63854, "epoch": 1520} {"train_loss": -5.9174346923828125, "global_step": 63855, "epoch": 1520} {"train_loss": -6.033870697021484, "global_step": 63856, "epoch": 1520} {"train_loss": -5.924041748046875, "global_step": 63857, "epoch": 1520} {"train_loss": -5.931936740875244, "global_step": 63858, "epoch": 1520} {"train_loss": -6.005518913269043, "global_step": 63859, "epoch": 1520} {"train_loss": -5.891385078430176, "global_step": 63860, "epoch": 1520} {"train_loss": -5.944429397583008, "global_step": 63861, "epoch": 1520} {"train_loss": -5.92205810546875, "global_step": 63862, "epoch": 1520} {"train_loss": -5.951652526855469, "global_step": 63863, "epoch": 1520} {"train_loss": -5.913361072540283, "global_step": 63864, "epoch": 1520} {"train_loss": -5.9000654220581055, "global_step": 63865, "epoch": 1520} {"train_loss": -5.953117370605469, "global_step": 63866, "epoch": 1520} {"train_loss": -5.860188961029053, "global_step": 63867, "epoch": 1520} {"train_loss": -5.873579502105713, "global_step": 63868, "epoch": 1520} {"train_loss": -5.863627910614014, "global_step": 63869, "epoch": 1520} {"train_loss": -5.804614067077637, "global_step": 63870, "epoch": 1520} {"train_loss": -5.9957685470581055, "global_step": 63871, "epoch": 1520} {"train_loss": -5.940133571624756, "global_step": 63872, "epoch": 1520} {"train_loss": -5.908783912658691, "global_step": 63873, "epoch": 1520} {"train_loss": -6.0203094482421875, "global_step": 63874, "epoch": 1520} {"train_loss": -5.921576976776123, "global_step": 63875, "epoch": 1520} {"train_loss": -5.91376256942749, "global_step": 63876, "epoch": 1520} {"train_loss": -5.878284454345703, "global_step": 63877, "epoch": 1520} {"train_loss": -5.975180625915527, "global_step": 63878, "epoch": 1520} {"train_loss": -5.922132968902588, "global_step": 63879, "epoch": 1520} {"train_loss": -5.841152667999268, "global_step": 63880, "epoch": 1520} {"train_loss": -5.938395693188622, "global_step": 63881, "epoch": 1520, "val_loss": 61591.70703125} {"train_loss": -5.94086217880249, "global_step": 63882, "epoch": 1521} {"train_loss": -5.8605475425720215, "global_step": 63883, "epoch": 1521} {"train_loss": -6.022393226623535, "global_step": 63884, "epoch": 1521} {"train_loss": -5.92852783203125, "global_step": 63885, "epoch": 1521} {"train_loss": -5.93932580947876, "global_step": 63886, "epoch": 1521} {"train_loss": -5.988596439361572, "global_step": 63887, "epoch": 1521} {"train_loss": -5.932997703552246, "global_step": 63888, "epoch": 1521} {"train_loss": -5.975428104400635, "global_step": 63889, "epoch": 1521} {"train_loss": -6.017988681793213, "global_step": 63890, "epoch": 1521} {"train_loss": -5.969471454620361, "global_step": 63891, "epoch": 1521} {"train_loss": -6.017978668212891, "global_step": 63892, "epoch": 1521} {"train_loss": -6.051985740661621, "global_step": 63893, "epoch": 1521} {"train_loss": -6.016317367553711, "global_step": 63894, "epoch": 1521} {"train_loss": -6.126518249511719, "global_step": 63895, "epoch": 1521} {"train_loss": -6.004892826080322, "global_step": 63896, "epoch": 1521} {"train_loss": -6.007970809936523, "global_step": 63897, "epoch": 1521} {"train_loss": -5.88804817199707, "global_step": 63898, "epoch": 1521} {"train_loss": -5.9409589767456055, "global_step": 63899, "epoch": 1521} {"train_loss": -5.969701290130615, "global_step": 63900, "epoch": 1521} {"train_loss": -5.94501256942749, "global_step": 63901, "epoch": 1521} {"train_loss": -5.956768989562988, "global_step": 63902, "epoch": 1521} {"train_loss": -5.935966968536377, "global_step": 63903, "epoch": 1521} {"train_loss": -5.947014808654785, "global_step": 63904, "epoch": 1521} {"train_loss": -5.875645160675049, "global_step": 63905, "epoch": 1521} {"train_loss": -5.993974208831787, "global_step": 63906, "epoch": 1521} {"train_loss": -5.902522563934326, "global_step": 63907, "epoch": 1521} {"train_loss": -6.064712047576904, "global_step": 63908, "epoch": 1521} {"train_loss": -5.871981620788574, "global_step": 63909, "epoch": 1521} {"train_loss": -5.905133247375488, "global_step": 63910, "epoch": 1521} {"train_loss": -6.081874847412109, "global_step": 63911, "epoch": 1521} {"train_loss": -5.808760643005371, "global_step": 63912, "epoch": 1521} {"train_loss": -5.739229679107666, "global_step": 63913, "epoch": 1521} {"train_loss": -6.041204929351807, "global_step": 63914, "epoch": 1521} {"train_loss": -5.879630088806152, "global_step": 63915, "epoch": 1521} {"train_loss": -5.859330177307129, "global_step": 63916, "epoch": 1521} {"train_loss": -5.867501258850098, "global_step": 63917, "epoch": 1521} {"train_loss": -5.903148651123047, "global_step": 63918, "epoch": 1521} {"train_loss": -5.883454322814941, "global_step": 63919, "epoch": 1521} {"train_loss": -5.8866987228393555, "global_step": 63920, "epoch": 1521} {"train_loss": -5.8733720779418945, "global_step": 63921, "epoch": 1521} {"train_loss": -5.879088401794434, "global_step": 63922, "epoch": 1521} {"train_loss": -5.9428515547797796, "global_step": 63923, "epoch": 1521, "val_loss": 61419.1171875} {"train_loss": -5.9334821701049805, "global_step": 63924, "epoch": 1522} {"train_loss": -6.010000228881836, "global_step": 63925, "epoch": 1522} {"train_loss": -6.0268096923828125, "global_step": 63926, "epoch": 1522} {"train_loss": -5.996079444885254, "global_step": 63927, "epoch": 1522} {"train_loss": -5.9621357917785645, "global_step": 63928, "epoch": 1522} {"train_loss": -5.945593357086182, "global_step": 63929, "epoch": 1522} {"train_loss": -6.052112579345703, "global_step": 63930, "epoch": 1522} {"train_loss": -5.958507061004639, "global_step": 63931, "epoch": 1522} {"train_loss": -6.031257152557373, "global_step": 63932, "epoch": 1522} {"train_loss": -5.911988258361816, "global_step": 63933, "epoch": 1522} {"train_loss": -5.987287521362305, "global_step": 63934, "epoch": 1522} {"train_loss": -5.990788459777832, "global_step": 63935, "epoch": 1522} {"train_loss": -5.955897808074951, "global_step": 63936, "epoch": 1522} {"train_loss": -5.81477165222168, "global_step": 63937, "epoch": 1522} {"train_loss": -5.9489240646362305, "global_step": 63938, "epoch": 1522} {"train_loss": -5.900613784790039, "global_step": 63939, "epoch": 1522} {"train_loss": -5.9302778244018555, "global_step": 63940, "epoch": 1522} {"train_loss": -5.936146259307861, "global_step": 63941, "epoch": 1522} {"train_loss": -5.879355430603027, "global_step": 63942, "epoch": 1522} {"train_loss": -5.9632768630981445, "global_step": 63943, "epoch": 1522} {"train_loss": -5.983686923980713, "global_step": 63944, "epoch": 1522} {"train_loss": -5.914722919464111, "global_step": 63945, "epoch": 1522} {"train_loss": -5.901015281677246, "global_step": 63946, "epoch": 1522} {"train_loss": -5.783127784729004, "global_step": 63947, "epoch": 1522} {"train_loss": -5.802701950073242, "global_step": 63948, "epoch": 1522} {"train_loss": -6.007261276245117, "global_step": 63949, "epoch": 1522} {"train_loss": -5.9691362380981445, "global_step": 63950, "epoch": 1522} {"train_loss": -5.849356174468994, "global_step": 63951, "epoch": 1522} {"train_loss": -5.818243026733398, "global_step": 63952, "epoch": 1522} {"train_loss": -5.935002326965332, "global_step": 63953, "epoch": 1522} {"train_loss": -5.930886745452881, "global_step": 63954, "epoch": 1522} {"train_loss": -6.030888557434082, "global_step": 63955, "epoch": 1522} {"train_loss": -5.914308547973633, "global_step": 63956, "epoch": 1522} {"train_loss": -5.9212541580200195, "global_step": 63957, "epoch": 1522} {"train_loss": -5.900605201721191, "global_step": 63958, "epoch": 1522} {"train_loss": -5.866658687591553, "global_step": 63959, "epoch": 1522} {"train_loss": -5.867374420166016, "global_step": 63960, "epoch": 1522} {"train_loss": -5.878486633300781, "global_step": 63961, "epoch": 1522} {"train_loss": -6.00681209564209, "global_step": 63962, "epoch": 1522} {"train_loss": -6.031520843505859, "global_step": 63963, "epoch": 1522} {"train_loss": -5.884678840637207, "global_step": 63964, "epoch": 1522} {"train_loss": -5.936299142383394, "global_step": 63965, "epoch": 1522, "val_loss": 61478.27734375} {"train_loss": -5.868653774261475, "global_step": 63966, "epoch": 1523} {"train_loss": -5.912029266357422, "global_step": 63967, "epoch": 1523} {"train_loss": -5.946926116943359, "global_step": 63968, "epoch": 1523} {"train_loss": -5.914814472198486, "global_step": 63969, "epoch": 1523} {"train_loss": -5.902602672576904, "global_step": 63970, "epoch": 1523} {"train_loss": -5.8933610916137695, "global_step": 63971, "epoch": 1523} {"train_loss": -5.980108261108398, "global_step": 63972, "epoch": 1523} {"train_loss": -5.833143711090088, "global_step": 63973, "epoch": 1523} {"train_loss": -5.930894374847412, "global_step": 63974, "epoch": 1523} {"train_loss": -5.915464401245117, "global_step": 63975, "epoch": 1523} {"train_loss": -5.906757831573486, "global_step": 63976, "epoch": 1523} {"train_loss": -5.889749050140381, "global_step": 63977, "epoch": 1523} {"train_loss": -5.914664268493652, "global_step": 63978, "epoch": 1523} {"train_loss": -5.951104164123535, "global_step": 63979, "epoch": 1523} {"train_loss": -5.973498344421387, "global_step": 63980, "epoch": 1523} {"train_loss": -5.995322227478027, "global_step": 63981, "epoch": 1523} {"train_loss": -5.917226791381836, "global_step": 63982, "epoch": 1523} {"train_loss": -5.992452621459961, "global_step": 63983, "epoch": 1523} {"train_loss": -5.822225570678711, "global_step": 63984, "epoch": 1523} {"train_loss": -5.937127113342285, "global_step": 63985, "epoch": 1523} {"train_loss": -6.09937858581543, "global_step": 63986, "epoch": 1523} {"train_loss": -5.958540916442871, "global_step": 63987, "epoch": 1523} {"train_loss": -5.895028591156006, "global_step": 63988, "epoch": 1523} {"train_loss": -5.867579936981201, "global_step": 63989, "epoch": 1523} {"train_loss": -6.009366989135742, "global_step": 63990, "epoch": 1523} {"train_loss": -6.034106254577637, "global_step": 63991, "epoch": 1523} {"train_loss": -5.929112911224365, "global_step": 63992, "epoch": 1523} {"train_loss": -6.001949310302734, "global_step": 63993, "epoch": 1523} {"train_loss": -5.934879302978516, "global_step": 63994, "epoch": 1523} {"train_loss": -6.003751277923584, "global_step": 63995, "epoch": 1523} {"train_loss": -5.943982124328613, "global_step": 63996, "epoch": 1523} {"train_loss": -5.968339443206787, "global_step": 63997, "epoch": 1523} {"train_loss": -5.953880786895752, "global_step": 63998, "epoch": 1523} {"train_loss": -5.794582843780518, "global_step": 63999, "epoch": 1523} {"train_loss": -5.887911796569824, "global_step": 64000, "epoch": 1523} {"train_loss": -5.928771018981934, "global_step": 64001, "epoch": 1523} {"train_loss": -5.9603271484375, "global_step": 64002, "epoch": 1523} {"train_loss": -5.963041305541992, "global_step": 64003, "epoch": 1523} {"train_loss": -5.9254984855651855, "global_step": 64004, "epoch": 1523} {"train_loss": -5.98890495300293, "global_step": 64005, "epoch": 1523} {"train_loss": -5.970108985900879, "global_step": 64006, "epoch": 1523} {"train_loss": -5.9360147430783226, "global_step": 64007, "epoch": 1523, "val_loss": 61355.48046875} {"train_loss": -5.925484657287598, "global_step": 64008, "epoch": 1524} {"train_loss": -5.8464674949646, "global_step": 64009, "epoch": 1524} {"train_loss": -5.96054744720459, "global_step": 64010, "epoch": 1524} {"train_loss": -5.843154430389404, "global_step": 64011, "epoch": 1524} {"train_loss": -5.950919151306152, "global_step": 64012, "epoch": 1524} {"train_loss": -5.9587554931640625, "global_step": 64013, "epoch": 1524} {"train_loss": -5.993391990661621, "global_step": 64014, "epoch": 1524} {"train_loss": -5.961690902709961, "global_step": 64015, "epoch": 1524} {"train_loss": -5.952825546264648, "global_step": 64016, "epoch": 1524} {"train_loss": -5.984976768493652, "global_step": 64017, "epoch": 1524} {"train_loss": -6.052840709686279, "global_step": 64018, "epoch": 1524} {"train_loss": -5.896788597106934, "global_step": 64019, "epoch": 1524} {"train_loss": -5.889277458190918, "global_step": 64020, "epoch": 1524} {"train_loss": -6.0135393142700195, "global_step": 64021, "epoch": 1524} {"train_loss": -6.079127311706543, "global_step": 64022, "epoch": 1524} {"train_loss": -6.004322052001953, "global_step": 64023, "epoch": 1524} {"train_loss": -6.040340423583984, "global_step": 64024, "epoch": 1524} {"train_loss": -5.922398567199707, "global_step": 64025, "epoch": 1524} {"train_loss": -5.9715046882629395, "global_step": 64026, "epoch": 1524} {"train_loss": -6.053834915161133, "global_step": 64027, "epoch": 1524} {"train_loss": -6.037631988525391, "global_step": 64028, "epoch": 1524} {"train_loss": -5.997175216674805, "global_step": 64029, "epoch": 1524} {"train_loss": -5.986138343811035, "global_step": 64030, "epoch": 1524} {"train_loss": -5.896642208099365, "global_step": 64031, "epoch": 1524} {"train_loss": -5.980043888092041, "global_step": 64032, "epoch": 1524} {"train_loss": -5.995486259460449, "global_step": 64033, "epoch": 1524} {"train_loss": -6.043841361999512, "global_step": 64034, "epoch": 1524} {"train_loss": -6.0551042556762695, "global_step": 64035, "epoch": 1524} {"train_loss": -5.832562446594238, "global_step": 64036, "epoch": 1524} {"train_loss": -6.011279106140137, "global_step": 64037, "epoch": 1524} {"train_loss": -5.93601655960083, "global_step": 64038, "epoch": 1524} {"train_loss": -5.878411293029785, "global_step": 64039, "epoch": 1524} {"train_loss": -5.941169261932373, "global_step": 64040, "epoch": 1524} {"train_loss": -5.8286566734313965, "global_step": 64041, "epoch": 1524} {"train_loss": -5.941162109375, "global_step": 64042, "epoch": 1524} {"train_loss": -5.757671356201172, "global_step": 64043, "epoch": 1524} {"train_loss": -5.894522666931152, "global_step": 64044, "epoch": 1524} {"train_loss": -5.964728832244873, "global_step": 64045, "epoch": 1524} {"train_loss": -5.864150047302246, "global_step": 64046, "epoch": 1524} {"train_loss": -5.916603088378906, "global_step": 64047, "epoch": 1524} {"train_loss": -5.950075149536133, "global_step": 64048, "epoch": 1524} {"train_loss": -5.952629134768531, "global_step": 64049, "epoch": 1524, "val_loss": 61529.10546875} {"train_loss": -5.987999439239502, "global_step": 64050, "epoch": 1525} {"train_loss": -5.912524223327637, "global_step": 64051, "epoch": 1525} {"train_loss": -5.979854583740234, "global_step": 64052, "epoch": 1525} {"train_loss": -6.063385009765625, "global_step": 64053, "epoch": 1525} {"train_loss": -5.9668498039245605, "global_step": 64054, "epoch": 1525} {"train_loss": -6.000374794006348, "global_step": 64055, "epoch": 1525} {"train_loss": -5.97598934173584, "global_step": 64056, "epoch": 1525} {"train_loss": -6.040460109710693, "global_step": 64057, "epoch": 1525} {"train_loss": -5.902803897857666, "global_step": 64058, "epoch": 1525} {"train_loss": -6.07736873626709, "global_step": 64059, "epoch": 1525} {"train_loss": -5.9699296951293945, "global_step": 64060, "epoch": 1525} {"train_loss": -5.9575300216674805, "global_step": 64061, "epoch": 1525} {"train_loss": -5.939460754394531, "global_step": 64062, "epoch": 1525} {"train_loss": -6.032012462615967, "global_step": 64063, "epoch": 1525} {"train_loss": -6.008208751678467, "global_step": 64064, "epoch": 1525} {"train_loss": -6.020870208740234, "global_step": 64065, "epoch": 1525} {"train_loss": -5.882620811462402, "global_step": 64066, "epoch": 1525} {"train_loss": -5.919822692871094, "global_step": 64067, "epoch": 1525} {"train_loss": -5.830257415771484, "global_step": 64068, "epoch": 1525} {"train_loss": -5.95119571685791, "global_step": 64069, "epoch": 1525} {"train_loss": -6.067169189453125, "global_step": 64070, "epoch": 1525} {"train_loss": -5.808046340942383, "global_step": 64071, "epoch": 1525} {"train_loss": -6.051468849182129, "global_step": 64072, "epoch": 1525} {"train_loss": -6.009457588195801, "global_step": 64073, "epoch": 1525} {"train_loss": -6.063209533691406, "global_step": 64074, "epoch": 1525} {"train_loss": -5.896024703979492, "global_step": 64075, "epoch": 1525} {"train_loss": -6.04600191116333, "global_step": 64076, "epoch": 1525} {"train_loss": -6.000336170196533, "global_step": 64077, "epoch": 1525} {"train_loss": -5.997199535369873, "global_step": 64078, "epoch": 1525} {"train_loss": -6.027921199798584, "global_step": 64079, "epoch": 1525} {"train_loss": -6.054418563842773, "global_step": 64080, "epoch": 1525} {"train_loss": -5.983121871948242, "global_step": 64081, "epoch": 1525} {"train_loss": -5.9426798820495605, "global_step": 64082, "epoch": 1525} {"train_loss": -5.905416488647461, "global_step": 64083, "epoch": 1525} {"train_loss": -6.0133819580078125, "global_step": 64084, "epoch": 1525} {"train_loss": -5.901238441467285, "global_step": 64085, "epoch": 1525} {"train_loss": -5.896172046661377, "global_step": 64086, "epoch": 1525} {"train_loss": -5.864956378936768, "global_step": 64087, "epoch": 1525} {"train_loss": -5.971384048461914, "global_step": 64088, "epoch": 1525} {"train_loss": -5.989198684692383, "global_step": 64089, "epoch": 1525} {"train_loss": -5.997928619384766, "global_step": 64090, "epoch": 1525} {"train_loss": -5.972201381410871, "global_step": 64091, "epoch": 1525, "val_loss": 61511.859375} {"train_loss": -5.871338844299316, "global_step": 64092, "epoch": 1526} {"train_loss": -5.995777606964111, "global_step": 64093, "epoch": 1526} {"train_loss": -6.005394458770752, "global_step": 64094, "epoch": 1526} {"train_loss": -5.807632923126221, "global_step": 64095, "epoch": 1526} {"train_loss": -6.085205078125, "global_step": 64096, "epoch": 1526} {"train_loss": -6.013937473297119, "global_step": 64097, "epoch": 1526} {"train_loss": -5.971384525299072, "global_step": 64098, "epoch": 1526} {"train_loss": -6.056830406188965, "global_step": 64099, "epoch": 1526} {"train_loss": -6.027440071105957, "global_step": 64100, "epoch": 1526} {"train_loss": -5.982527256011963, "global_step": 64101, "epoch": 1526} {"train_loss": -5.8952555656433105, "global_step": 64102, "epoch": 1526} {"train_loss": -5.961852550506592, "global_step": 64103, "epoch": 1526} {"train_loss": -6.0344109535217285, "global_step": 64104, "epoch": 1526} {"train_loss": -5.949088096618652, "global_step": 64105, "epoch": 1526} {"train_loss": -6.018532752990723, "global_step": 64106, "epoch": 1526} {"train_loss": -5.9608659744262695, "global_step": 64107, "epoch": 1526} {"train_loss": -6.0051093101501465, "global_step": 64108, "epoch": 1526} {"train_loss": -5.987922668457031, "global_step": 64109, "epoch": 1526} {"train_loss": -5.927206039428711, "global_step": 64110, "epoch": 1526} {"train_loss": -6.010566234588623, "global_step": 64111, "epoch": 1526} {"train_loss": -5.973421096801758, "global_step": 64112, "epoch": 1526} {"train_loss": -6.065496444702148, "global_step": 64113, "epoch": 1526} {"train_loss": -5.934814929962158, "global_step": 64114, "epoch": 1526} {"train_loss": -5.951086521148682, "global_step": 64115, "epoch": 1526} {"train_loss": -6.0333757400512695, "global_step": 64116, "epoch": 1526} {"train_loss": -6.092255592346191, "global_step": 64117, "epoch": 1526} {"train_loss": -6.031200885772705, "global_step": 64118, "epoch": 1526} {"train_loss": -6.000925064086914, "global_step": 64119, "epoch": 1526} {"train_loss": -5.937821388244629, "global_step": 64120, "epoch": 1526} {"train_loss": -6.046363830566406, "global_step": 64121, "epoch": 1526} {"train_loss": -5.910598278045654, "global_step": 64122, "epoch": 1526} {"train_loss": -6.03168249130249, "global_step": 64123, "epoch": 1526} {"train_loss": -6.009187698364258, "global_step": 64124, "epoch": 1526} {"train_loss": -6.008091926574707, "global_step": 64125, "epoch": 1526} {"train_loss": -5.965538024902344, "global_step": 64126, "epoch": 1526} {"train_loss": -6.007536888122559, "global_step": 64127, "epoch": 1526} {"train_loss": -5.97092342376709, "global_step": 64128, "epoch": 1526} {"train_loss": -5.887044906616211, "global_step": 64129, "epoch": 1526} {"train_loss": -5.962212085723877, "global_step": 64130, "epoch": 1526} {"train_loss": -5.951758861541748, "global_step": 64131, "epoch": 1526} {"train_loss": -5.931158065795898, "global_step": 64132, "epoch": 1526} {"train_loss": -5.983551672526768, "global_step": 64133, "epoch": 1526, "val_loss": 61276.140625} {"train_loss": -5.976158142089844, "global_step": 64134, "epoch": 1527} {"train_loss": -5.9381232261657715, "global_step": 64135, "epoch": 1527} {"train_loss": -6.0136189460754395, "global_step": 64136, "epoch": 1527} {"train_loss": -5.931427955627441, "global_step": 64137, "epoch": 1527} {"train_loss": -5.981966972351074, "global_step": 64138, "epoch": 1527} {"train_loss": -5.860700607299805, "global_step": 64139, "epoch": 1527} {"train_loss": -6.044875144958496, "global_step": 64140, "epoch": 1527} {"train_loss": -5.851766586303711, "global_step": 64141, "epoch": 1527} {"train_loss": -6.066195487976074, "global_step": 64142, "epoch": 1527} {"train_loss": -6.00328254699707, "global_step": 64143, "epoch": 1527} {"train_loss": -5.91402530670166, "global_step": 64144, "epoch": 1527} {"train_loss": -5.878267288208008, "global_step": 64145, "epoch": 1527} {"train_loss": -5.808494567871094, "global_step": 64146, "epoch": 1527} {"train_loss": -6.065844535827637, "global_step": 64147, "epoch": 1527} {"train_loss": -5.957005500793457, "global_step": 64148, "epoch": 1527} {"train_loss": -5.807077407836914, "global_step": 64149, "epoch": 1527} {"train_loss": -5.899975776672363, "global_step": 64150, "epoch": 1527} {"train_loss": -5.866289138793945, "global_step": 64151, "epoch": 1527} {"train_loss": -5.937570095062256, "global_step": 64152, "epoch": 1527} {"train_loss": -5.878108024597168, "global_step": 64153, "epoch": 1527} {"train_loss": -5.766786575317383, "global_step": 64154, "epoch": 1527} {"train_loss": -5.905501365661621, "global_step": 64155, "epoch": 1527} {"train_loss": -5.99287223815918, "global_step": 64156, "epoch": 1527} {"train_loss": -5.9467973709106445, "global_step": 64157, "epoch": 1527} {"train_loss": -5.97109317779541, "global_step": 64158, "epoch": 1527} {"train_loss": -5.920742034912109, "global_step": 64159, "epoch": 1527} {"train_loss": -5.758526802062988, "global_step": 64160, "epoch": 1527} {"train_loss": -5.843774795532227, "global_step": 64161, "epoch": 1527} {"train_loss": -5.918581008911133, "global_step": 64162, "epoch": 1527} {"train_loss": -6.01031494140625, "global_step": 64163, "epoch": 1527} {"train_loss": -5.855232238769531, "global_step": 64164, "epoch": 1527} {"train_loss": -5.923211097717285, "global_step": 64165, "epoch": 1527} {"train_loss": -5.860782146453857, "global_step": 64166, "epoch": 1527} {"train_loss": -5.882306098937988, "global_step": 64167, "epoch": 1527} {"train_loss": -5.917536735534668, "global_step": 64168, "epoch": 1527} {"train_loss": -6.080230712890625, "global_step": 64169, "epoch": 1527} {"train_loss": -5.878536224365234, "global_step": 64170, "epoch": 1527} {"train_loss": -5.996744155883789, "global_step": 64171, "epoch": 1527} {"train_loss": -5.967540264129639, "global_step": 64172, "epoch": 1527} {"train_loss": -5.931942462921143, "global_step": 64173, "epoch": 1527} {"train_loss": -5.933725833892822, "global_step": 64174, "epoch": 1527} {"train_loss": -5.927043653669811, "global_step": 64175, "epoch": 1527, "val_loss": 61543.88671875} {"train_loss": -5.8674139976501465, "global_step": 64176, "epoch": 1528} {"train_loss": -5.940487861633301, "global_step": 64177, "epoch": 1528} {"train_loss": -5.906772136688232, "global_step": 64178, "epoch": 1528} {"train_loss": -5.94667387008667, "global_step": 64179, "epoch": 1528} {"train_loss": -5.909193992614746, "global_step": 64180, "epoch": 1528} {"train_loss": -5.916723251342773, "global_step": 64181, "epoch": 1528} {"train_loss": -5.982741832733154, "global_step": 64182, "epoch": 1528} {"train_loss": -5.843639850616455, "global_step": 64183, "epoch": 1528} {"train_loss": -5.9489288330078125, "global_step": 64184, "epoch": 1528} {"train_loss": -6.006765365600586, "global_step": 64185, "epoch": 1528} {"train_loss": -5.9133405685424805, "global_step": 64186, "epoch": 1528} {"train_loss": -5.922144412994385, "global_step": 64187, "epoch": 1528} {"train_loss": -5.9484100341796875, "global_step": 64188, "epoch": 1528} {"train_loss": -5.903652191162109, "global_step": 64189, "epoch": 1528} {"train_loss": -5.960280895233154, "global_step": 64190, "epoch": 1528} {"train_loss": -5.85288143157959, "global_step": 64191, "epoch": 1528} {"train_loss": -5.873482704162598, "global_step": 64192, "epoch": 1528} {"train_loss": -5.876335620880127, "global_step": 64193, "epoch": 1528} {"train_loss": -5.869537353515625, "global_step": 64194, "epoch": 1528} {"train_loss": -5.950380325317383, "global_step": 64195, "epoch": 1528} {"train_loss": -5.919888496398926, "global_step": 64196, "epoch": 1528} {"train_loss": -5.960817337036133, "global_step": 64197, "epoch": 1528} {"train_loss": -5.858915328979492, "global_step": 64198, "epoch": 1528} {"train_loss": -5.9874444007873535, "global_step": 64199, "epoch": 1528} {"train_loss": -5.819316864013672, "global_step": 64200, "epoch": 1528} {"train_loss": -5.8658223152160645, "global_step": 64201, "epoch": 1528} {"train_loss": -5.990054607391357, "global_step": 64202, "epoch": 1528} {"train_loss": -5.9333696365356445, "global_step": 64203, "epoch": 1528} {"train_loss": -5.975552558898926, "global_step": 64204, "epoch": 1528} {"train_loss": -5.864193916320801, "global_step": 64205, "epoch": 1528} {"train_loss": -5.964544773101807, "global_step": 64206, "epoch": 1528} {"train_loss": -5.971435546875, "global_step": 64207, "epoch": 1528} {"train_loss": -5.893606185913086, "global_step": 64208, "epoch": 1528} {"train_loss": -5.908541679382324, "global_step": 64209, "epoch": 1528} {"train_loss": -5.99237060546875, "global_step": 64210, "epoch": 1528} {"train_loss": -5.896367073059082, "global_step": 64211, "epoch": 1528} {"train_loss": -5.955704689025879, "global_step": 64212, "epoch": 1528} {"train_loss": -5.942758083343506, "global_step": 64213, "epoch": 1528} {"train_loss": -5.922159671783447, "global_step": 64214, "epoch": 1528} {"train_loss": -6.02641487121582, "global_step": 64215, "epoch": 1528} {"train_loss": -5.9181084632873535, "global_step": 64216, "epoch": 1528} {"train_loss": -5.924395901816232, "global_step": 64217, "epoch": 1528, "val_loss": 61317.703125} {"train_loss": -6.022189140319824, "global_step": 64218, "epoch": 1529} {"train_loss": -5.95578670501709, "global_step": 64219, "epoch": 1529} {"train_loss": -5.950802326202393, "global_step": 64220, "epoch": 1529} {"train_loss": -5.859709739685059, "global_step": 64221, "epoch": 1529} {"train_loss": -6.068356513977051, "global_step": 64222, "epoch": 1529} {"train_loss": -5.99714469909668, "global_step": 64223, "epoch": 1529} {"train_loss": -5.882878303527832, "global_step": 64224, "epoch": 1529} {"train_loss": -5.927985668182373, "global_step": 64225, "epoch": 1529} {"train_loss": -5.972203731536865, "global_step": 64226, "epoch": 1529} {"train_loss": -6.019835472106934, "global_step": 64227, "epoch": 1529} {"train_loss": -6.233536243438721, "global_step": 64228, "epoch": 1529} {"train_loss": -5.975437164306641, "global_step": 64229, "epoch": 1529} {"train_loss": -5.986183166503906, "global_step": 64230, "epoch": 1529} {"train_loss": -5.892762184143066, "global_step": 64231, "epoch": 1529} {"train_loss": -5.918981552124023, "global_step": 64232, "epoch": 1529} {"train_loss": -5.953330993652344, "global_step": 64233, "epoch": 1529} {"train_loss": -5.881265640258789, "global_step": 64234, "epoch": 1529} {"train_loss": -6.067038059234619, "global_step": 64235, "epoch": 1529} {"train_loss": -6.073521614074707, "global_step": 64236, "epoch": 1529} {"train_loss": -6.048617839813232, "global_step": 64237, "epoch": 1529} {"train_loss": -5.880992889404297, "global_step": 64238, "epoch": 1529} {"train_loss": -5.9234418869018555, "global_step": 64239, "epoch": 1529} {"train_loss": -5.869854927062988, "global_step": 64240, "epoch": 1529} {"train_loss": -5.888206481933594, "global_step": 64241, "epoch": 1529} {"train_loss": -6.042752742767334, "global_step": 64242, "epoch": 1529} {"train_loss": -5.970646858215332, "global_step": 64243, "epoch": 1529} {"train_loss": -6.049204349517822, "global_step": 64244, "epoch": 1529} {"train_loss": -6.003462791442871, "global_step": 64245, "epoch": 1529} {"train_loss": -5.961495399475098, "global_step": 64246, "epoch": 1529} {"train_loss": -5.962823867797852, "global_step": 64247, "epoch": 1529} {"train_loss": -5.994960784912109, "global_step": 64248, "epoch": 1529} {"train_loss": -5.995264530181885, "global_step": 64249, "epoch": 1529} {"train_loss": -6.000883102416992, "global_step": 64250, "epoch": 1529} {"train_loss": -5.963295936584473, "global_step": 64251, "epoch": 1529} {"train_loss": -5.869741439819336, "global_step": 64252, "epoch": 1529} {"train_loss": -5.887552261352539, "global_step": 64253, "epoch": 1529} {"train_loss": -5.939411640167236, "global_step": 64254, "epoch": 1529} {"train_loss": -5.874663352966309, "global_step": 64255, "epoch": 1529} {"train_loss": -5.911641597747803, "global_step": 64256, "epoch": 1529} {"train_loss": -5.929681777954102, "global_step": 64257, "epoch": 1529} {"train_loss": -5.975855350494385, "global_step": 64258, "epoch": 1529} {"train_loss": -5.963701793125698, "global_step": 64259, "epoch": 1529, "val_loss": 61378.91015625} {"train_loss": -5.942713737487793, "global_step": 64260, "epoch": 1530} {"train_loss": -5.994879722595215, "global_step": 64261, "epoch": 1530} {"train_loss": -6.012390613555908, "global_step": 64262, "epoch": 1530} {"train_loss": -5.988089561462402, "global_step": 64263, "epoch": 1530} {"train_loss": -6.039885520935059, "global_step": 64264, "epoch": 1530} {"train_loss": -5.967828750610352, "global_step": 64265, "epoch": 1530} {"train_loss": -6.016041278839111, "global_step": 64266, "epoch": 1530} {"train_loss": -6.057709217071533, "global_step": 64267, "epoch": 1530} {"train_loss": -5.989859580993652, "global_step": 64268, "epoch": 1530} {"train_loss": -5.968100547790527, "global_step": 64269, "epoch": 1530} {"train_loss": -6.020694255828857, "global_step": 64270, "epoch": 1530} {"train_loss": -6.058134078979492, "global_step": 64271, "epoch": 1530} {"train_loss": -5.99974250793457, "global_step": 64272, "epoch": 1530} {"train_loss": -5.860782623291016, "global_step": 64273, "epoch": 1530} {"train_loss": -6.0572309494018555, "global_step": 64274, "epoch": 1530} {"train_loss": -6.009422302246094, "global_step": 64275, "epoch": 1530} {"train_loss": -5.9778947830200195, "global_step": 64276, "epoch": 1530} {"train_loss": -5.873865127563477, "global_step": 64277, "epoch": 1530} {"train_loss": -5.911446571350098, "global_step": 64278, "epoch": 1530} {"train_loss": -6.0384745597839355, "global_step": 64279, "epoch": 1530} {"train_loss": -5.913762092590332, "global_step": 64280, "epoch": 1530} {"train_loss": -5.907553672790527, "global_step": 64281, "epoch": 1530} {"train_loss": -5.950611114501953, "global_step": 64282, "epoch": 1530} {"train_loss": -6.013993263244629, "global_step": 64283, "epoch": 1530} {"train_loss": -5.948931694030762, "global_step": 64284, "epoch": 1530} {"train_loss": -5.887880325317383, "global_step": 64285, "epoch": 1530} {"train_loss": -5.962028503417969, "global_step": 64286, "epoch": 1530} {"train_loss": -5.9742841720581055, "global_step": 64287, "epoch": 1530} {"train_loss": -5.8226213455200195, "global_step": 64288, "epoch": 1530} {"train_loss": -6.023613929748535, "global_step": 64289, "epoch": 1530} {"train_loss": -5.976027488708496, "global_step": 64290, "epoch": 1530} {"train_loss": -6.010441780090332, "global_step": 64291, "epoch": 1530} {"train_loss": -5.871355056762695, "global_step": 64292, "epoch": 1530} {"train_loss": -6.007765769958496, "global_step": 64293, "epoch": 1530} {"train_loss": -6.056733131408691, "global_step": 64294, "epoch": 1530} {"train_loss": -5.885048866271973, "global_step": 64295, "epoch": 1530} {"train_loss": -6.044764041900635, "global_step": 64296, "epoch": 1530} {"train_loss": -5.833648681640625, "global_step": 64297, "epoch": 1530} {"train_loss": -5.992501258850098, "global_step": 64298, "epoch": 1530} {"train_loss": -5.937823295593262, "global_step": 64299, "epoch": 1530} {"train_loss": -6.053393363952637, "global_step": 64300, "epoch": 1530} {"train_loss": -5.9711349578130815, "global_step": 64301, "epoch": 1530, "val_loss": 61538.04296875} {"train_loss": -5.847509860992432, "global_step": 64302, "epoch": 1531} {"train_loss": -5.943961143493652, "global_step": 64303, "epoch": 1531} {"train_loss": -6.021308422088623, "global_step": 64304, "epoch": 1531} {"train_loss": -5.960415840148926, "global_step": 64305, "epoch": 1531} {"train_loss": -6.002867698669434, "global_step": 64306, "epoch": 1531} {"train_loss": -5.947538375854492, "global_step": 64307, "epoch": 1531} {"train_loss": -6.084328651428223, "global_step": 64308, "epoch": 1531} {"train_loss": -5.99813175201416, "global_step": 64309, "epoch": 1531} {"train_loss": -6.030790328979492, "global_step": 64310, "epoch": 1531} {"train_loss": -6.027470588684082, "global_step": 64311, "epoch": 1531} {"train_loss": -5.888175964355469, "global_step": 64312, "epoch": 1531} {"train_loss": -6.029550075531006, "global_step": 64313, "epoch": 1531} {"train_loss": -5.840327262878418, "global_step": 64314, "epoch": 1531} {"train_loss": -5.928008556365967, "global_step": 64315, "epoch": 1531} {"train_loss": -5.939795970916748, "global_step": 64316, "epoch": 1531} {"train_loss": -5.934088706970215, "global_step": 64317, "epoch": 1531} {"train_loss": -5.993601322174072, "global_step": 64318, "epoch": 1531} {"train_loss": -6.041075706481934, "global_step": 64319, "epoch": 1531} {"train_loss": -6.115036487579346, "global_step": 64320, "epoch": 1531} {"train_loss": -6.003028869628906, "global_step": 64321, "epoch": 1531} {"train_loss": -5.8832902908325195, "global_step": 64322, "epoch": 1531} {"train_loss": -5.821328163146973, "global_step": 64323, "epoch": 1531} {"train_loss": -6.030427932739258, "global_step": 64324, "epoch": 1531} {"train_loss": -6.053813934326172, "global_step": 64325, "epoch": 1531} {"train_loss": -5.9451446533203125, "global_step": 64326, "epoch": 1531} {"train_loss": -5.904458522796631, "global_step": 64327, "epoch": 1531} {"train_loss": -6.000432014465332, "global_step": 64328, "epoch": 1531} {"train_loss": -5.846784591674805, "global_step": 64329, "epoch": 1531} {"train_loss": -6.0481672286987305, "global_step": 64330, "epoch": 1531} {"train_loss": -5.962363243103027, "global_step": 64331, "epoch": 1531} {"train_loss": -5.9554643630981445, "global_step": 64332, "epoch": 1531} {"train_loss": -5.924602508544922, "global_step": 64333, "epoch": 1531} {"train_loss": -5.934930801391602, "global_step": 64334, "epoch": 1531} {"train_loss": -5.943490028381348, "global_step": 64335, "epoch": 1531} {"train_loss": -5.914193153381348, "global_step": 64336, "epoch": 1531} {"train_loss": -5.964416980743408, "global_step": 64337, "epoch": 1531} {"train_loss": -5.928136825561523, "global_step": 64338, "epoch": 1531} {"train_loss": -5.873790264129639, "global_step": 64339, "epoch": 1531} {"train_loss": -5.977207183837891, "global_step": 64340, "epoch": 1531} {"train_loss": -5.901752948760986, "global_step": 64341, "epoch": 1531} {"train_loss": -5.959892272949219, "global_step": 64342, "epoch": 1531} {"train_loss": -5.9576278527577715, "global_step": 64343, "epoch": 1531, "val_loss": 61555.39453125} {"train_loss": -5.886100769042969, "global_step": 64344, "epoch": 1532} {"train_loss": -5.930281639099121, "global_step": 64345, "epoch": 1532} {"train_loss": -5.970938682556152, "global_step": 64346, "epoch": 1532} {"train_loss": -5.9579315185546875, "global_step": 64347, "epoch": 1532} {"train_loss": -5.893919944763184, "global_step": 64348, "epoch": 1532} {"train_loss": -6.044521331787109, "global_step": 64349, "epoch": 1532} {"train_loss": -5.822616100311279, "global_step": 64350, "epoch": 1532} {"train_loss": -5.890444755554199, "global_step": 64351, "epoch": 1532} {"train_loss": -5.978987693786621, "global_step": 64352, "epoch": 1532} {"train_loss": -5.863763809204102, "global_step": 64353, "epoch": 1532} {"train_loss": -6.024698734283447, "global_step": 64354, "epoch": 1532} {"train_loss": -5.875217437744141, "global_step": 64355, "epoch": 1532} {"train_loss": -6.0304059982299805, "global_step": 64356, "epoch": 1532} {"train_loss": -5.979287147521973, "global_step": 64357, "epoch": 1532} {"train_loss": -5.979483604431152, "global_step": 64358, "epoch": 1532} {"train_loss": -6.084682464599609, "global_step": 64359, "epoch": 1532} {"train_loss": -6.002407550811768, "global_step": 64360, "epoch": 1532} {"train_loss": -5.8469390869140625, "global_step": 64361, "epoch": 1532} {"train_loss": -5.876601219177246, "global_step": 64362, "epoch": 1532} {"train_loss": -6.061965465545654, "global_step": 64363, "epoch": 1532} {"train_loss": -5.9701247215271, "global_step": 64364, "epoch": 1532} {"train_loss": -5.820874214172363, "global_step": 64365, "epoch": 1532} {"train_loss": -5.807041168212891, "global_step": 64366, "epoch": 1532} {"train_loss": -6.012939453125, "global_step": 64367, "epoch": 1532} {"train_loss": -5.911616325378418, "global_step": 64368, "epoch": 1532} {"train_loss": -6.033149719238281, "global_step": 64369, "epoch": 1532} {"train_loss": -5.993608474731445, "global_step": 64370, "epoch": 1532} {"train_loss": -5.838302135467529, "global_step": 64371, "epoch": 1532} {"train_loss": -6.038542747497559, "global_step": 64372, "epoch": 1532} {"train_loss": -6.011960029602051, "global_step": 64373, "epoch": 1532} {"train_loss": -5.846674919128418, "global_step": 64374, "epoch": 1532} {"train_loss": -5.914159297943115, "global_step": 64375, "epoch": 1532} {"train_loss": -5.844147682189941, "global_step": 64376, "epoch": 1532} {"train_loss": -5.913266181945801, "global_step": 64377, "epoch": 1532} {"train_loss": -6.110322952270508, "global_step": 64378, "epoch": 1532} {"train_loss": -5.975746154785156, "global_step": 64379, "epoch": 1532} {"train_loss": -6.033385276794434, "global_step": 64380, "epoch": 1532} {"train_loss": -6.1037187576293945, "global_step": 64381, "epoch": 1532} {"train_loss": -6.082297325134277, "global_step": 64382, "epoch": 1532} {"train_loss": -5.831774711608887, "global_step": 64383, "epoch": 1532} {"train_loss": -5.846409797668457, "global_step": 64384, "epoch": 1532} {"train_loss": -5.949490342821393, "global_step": 64385, "epoch": 1532, "val_loss": 61444.8125} {"train_loss": -6.012815475463867, "global_step": 64386, "epoch": 1533} {"train_loss": -5.99700403213501, "global_step": 64387, "epoch": 1533} {"train_loss": -5.967377662658691, "global_step": 64388, "epoch": 1533} {"train_loss": -5.87447452545166, "global_step": 64389, "epoch": 1533} {"train_loss": -5.989959239959717, "global_step": 64390, "epoch": 1533} {"train_loss": -6.009629249572754, "global_step": 64391, "epoch": 1533} {"train_loss": -5.980654239654541, "global_step": 64392, "epoch": 1533} {"train_loss": -6.071361064910889, "global_step": 64393, "epoch": 1533} {"train_loss": -5.998157024383545, "global_step": 64394, "epoch": 1533} {"train_loss": -5.922856330871582, "global_step": 64395, "epoch": 1533} {"train_loss": -5.9466352462768555, "global_step": 64396, "epoch": 1533} {"train_loss": -6.1063618659973145, "global_step": 64397, "epoch": 1533} {"train_loss": -5.888221740722656, "global_step": 64398, "epoch": 1533} {"train_loss": -6.031955718994141, "global_step": 64399, "epoch": 1533} {"train_loss": -5.931829452514648, "global_step": 64400, "epoch": 1533} {"train_loss": -6.052818775177002, "global_step": 64401, "epoch": 1533} {"train_loss": -5.922848701477051, "global_step": 64402, "epoch": 1533} {"train_loss": -5.9621381759643555, "global_step": 64403, "epoch": 1533} {"train_loss": -5.844459533691406, "global_step": 64404, "epoch": 1533} {"train_loss": -6.026619911193848, "global_step": 64405, "epoch": 1533} {"train_loss": -5.996703147888184, "global_step": 64406, "epoch": 1533} {"train_loss": -5.979687690734863, "global_step": 64407, "epoch": 1533} {"train_loss": -5.961325645446777, "global_step": 64408, "epoch": 1533} {"train_loss": -5.961826801300049, "global_step": 64409, "epoch": 1533} {"train_loss": -5.9890217781066895, "global_step": 64410, "epoch": 1533} {"train_loss": -6.019576072692871, "global_step": 64411, "epoch": 1533} {"train_loss": -5.9064040184021, "global_step": 64412, "epoch": 1533} {"train_loss": -6.040960311889648, "global_step": 64413, "epoch": 1533} {"train_loss": -5.955309867858887, "global_step": 64414, "epoch": 1533} {"train_loss": -5.91210412979126, "global_step": 64415, "epoch": 1533} {"train_loss": -5.997169494628906, "global_step": 64416, "epoch": 1533} {"train_loss": -6.008662700653076, "global_step": 64417, "epoch": 1533} {"train_loss": -5.8700270652771, "global_step": 64418, "epoch": 1533} {"train_loss": -5.986302375793457, "global_step": 64419, "epoch": 1533} {"train_loss": -5.870292663574219, "global_step": 64420, "epoch": 1533} {"train_loss": -5.959418773651123, "global_step": 64421, "epoch": 1533} {"train_loss": -6.097554683685303, "global_step": 64422, "epoch": 1533} {"train_loss": -5.985102653503418, "global_step": 64423, "epoch": 1533} {"train_loss": -5.97591495513916, "global_step": 64424, "epoch": 1533} {"train_loss": -6.104734420776367, "global_step": 64425, "epoch": 1533} {"train_loss": -5.880152702331543, "global_step": 64426, "epoch": 1533} {"train_loss": -5.9760495367504305, "global_step": 64427, "epoch": 1533, "val_loss": 61751.02734375} {"train_loss": -5.977513313293457, "global_step": 64428, "epoch": 1534} {"train_loss": -5.973991394042969, "global_step": 64429, "epoch": 1534} {"train_loss": -5.882040023803711, "global_step": 64430, "epoch": 1534} {"train_loss": -5.899721145629883, "global_step": 64431, "epoch": 1534} {"train_loss": -5.950582504272461, "global_step": 64432, "epoch": 1534} {"train_loss": -5.9452972412109375, "global_step": 64433, "epoch": 1534} {"train_loss": -5.875296115875244, "global_step": 64434, "epoch": 1534} {"train_loss": -5.944535255432129, "global_step": 64435, "epoch": 1534} {"train_loss": -5.837703227996826, "global_step": 64436, "epoch": 1534} {"train_loss": -5.864277362823486, "global_step": 64437, "epoch": 1534} {"train_loss": -5.991175651550293, "global_step": 64438, "epoch": 1534} {"train_loss": -5.968748092651367, "global_step": 64439, "epoch": 1534} {"train_loss": -5.849183559417725, "global_step": 64440, "epoch": 1534} {"train_loss": -6.045741081237793, "global_step": 64441, "epoch": 1534} {"train_loss": -6.112153053283691, "global_step": 64442, "epoch": 1534} {"train_loss": -5.974534034729004, "global_step": 64443, "epoch": 1534} {"train_loss": -5.9680986404418945, "global_step": 64444, "epoch": 1534} {"train_loss": -5.864282131195068, "global_step": 64445, "epoch": 1534} {"train_loss": -5.918023586273193, "global_step": 64446, "epoch": 1534} {"train_loss": -5.893218040466309, "global_step": 64447, "epoch": 1534} {"train_loss": -6.027257919311523, "global_step": 64448, "epoch": 1534} {"train_loss": -5.9539666175842285, "global_step": 64449, "epoch": 1534} {"train_loss": -5.9832563400268555, "global_step": 64450, "epoch": 1534} {"train_loss": -6.005560398101807, "global_step": 64451, "epoch": 1534} {"train_loss": -5.936569690704346, "global_step": 64452, "epoch": 1534} {"train_loss": -5.883388519287109, "global_step": 64453, "epoch": 1534} {"train_loss": -6.029123783111572, "global_step": 64454, "epoch": 1534} {"train_loss": -6.0652923583984375, "global_step": 64455, "epoch": 1534} {"train_loss": -5.869229316711426, "global_step": 64456, "epoch": 1534} {"train_loss": -5.9814229011535645, "global_step": 64457, "epoch": 1534} {"train_loss": -6.011396408081055, "global_step": 64458, "epoch": 1534} {"train_loss": -5.913520812988281, "global_step": 64459, "epoch": 1534} {"train_loss": -5.982496738433838, "global_step": 64460, "epoch": 1534} {"train_loss": -5.929251670837402, "global_step": 64461, "epoch": 1534} {"train_loss": -5.958847999572754, "global_step": 64462, "epoch": 1534} {"train_loss": -5.991548538208008, "global_step": 64463, "epoch": 1534} {"train_loss": -5.9275312423706055, "global_step": 64464, "epoch": 1534} {"train_loss": -5.94462776184082, "global_step": 64465, "epoch": 1534} {"train_loss": -6.028754234313965, "global_step": 64466, "epoch": 1534} {"train_loss": -5.944258689880371, "global_step": 64467, "epoch": 1534} {"train_loss": -5.85331916809082, "global_step": 64468, "epoch": 1534} {"train_loss": -5.949231919788179, "global_step": 64469, "epoch": 1534, "val_loss": 61406.484375} {"train_loss": -6.05610990524292, "global_step": 64470, "epoch": 1535} {"train_loss": -6.020515441894531, "global_step": 64471, "epoch": 1535} {"train_loss": -5.963852882385254, "global_step": 64472, "epoch": 1535} {"train_loss": -5.941258907318115, "global_step": 64473, "epoch": 1535} {"train_loss": -5.704619884490967, "global_step": 64474, "epoch": 1535} {"train_loss": -5.7765326499938965, "global_step": 64475, "epoch": 1535} {"train_loss": -5.983526706695557, "global_step": 64476, "epoch": 1535} {"train_loss": -5.954601764678955, "global_step": 64477, "epoch": 1535} {"train_loss": -5.940317153930664, "global_step": 64478, "epoch": 1535} {"train_loss": -5.928613662719727, "global_step": 64479, "epoch": 1535} {"train_loss": -6.015707969665527, "global_step": 64480, "epoch": 1535} {"train_loss": -5.976461887359619, "global_step": 64481, "epoch": 1535} {"train_loss": -5.905716419219971, "global_step": 64482, "epoch": 1535} {"train_loss": -5.838290214538574, "global_step": 64483, "epoch": 1535} {"train_loss": -5.98410177230835, "global_step": 64484, "epoch": 1535} {"train_loss": -6.0510101318359375, "global_step": 64485, "epoch": 1535} {"train_loss": -6.011480331420898, "global_step": 64486, "epoch": 1535} {"train_loss": -5.996380805969238, "global_step": 64487, "epoch": 1535} {"train_loss": -5.960945129394531, "global_step": 64488, "epoch": 1535} {"train_loss": -5.863591194152832, "global_step": 64489, "epoch": 1535} {"train_loss": -5.968401908874512, "global_step": 64490, "epoch": 1535} {"train_loss": -5.9569501876831055, "global_step": 64491, "epoch": 1535} {"train_loss": -5.939757347106934, "global_step": 64492, "epoch": 1535} {"train_loss": -6.0364251136779785, "global_step": 64493, "epoch": 1535} {"train_loss": -5.87844181060791, "global_step": 64494, "epoch": 1535} {"train_loss": -5.965713024139404, "global_step": 64495, "epoch": 1535} {"train_loss": -5.9708251953125, "global_step": 64496, "epoch": 1535} {"train_loss": -5.949203014373779, "global_step": 64497, "epoch": 1535} {"train_loss": -5.949648380279541, "global_step": 64498, "epoch": 1535} {"train_loss": -6.01578950881958, "global_step": 64499, "epoch": 1535} {"train_loss": -5.8574018478393555, "global_step": 64500, "epoch": 1535} {"train_loss": -5.840747833251953, "global_step": 64501, "epoch": 1535} {"train_loss": -5.921391010284424, "global_step": 64502, "epoch": 1535} {"train_loss": -5.998716831207275, "global_step": 64503, "epoch": 1535} {"train_loss": -5.879622459411621, "global_step": 64504, "epoch": 1535} {"train_loss": -6.028371810913086, "global_step": 64505, "epoch": 1535} {"train_loss": -6.119511604309082, "global_step": 64506, "epoch": 1535} {"train_loss": -5.867486953735352, "global_step": 64507, "epoch": 1535} {"train_loss": -6.032210350036621, "global_step": 64508, "epoch": 1535} {"train_loss": -6.020565986633301, "global_step": 64509, "epoch": 1535} {"train_loss": -6.022817611694336, "global_step": 64510, "epoch": 1535} {"train_loss": -5.952960854484921, "global_step": 64511, "epoch": 1535, "val_loss": 61138.38671875} {"train_loss": -6.055477142333984, "global_step": 64512, "epoch": 1536} {"train_loss": -6.01451301574707, "global_step": 64513, "epoch": 1536} {"train_loss": -5.984097957611084, "global_step": 64514, "epoch": 1536} {"train_loss": -5.950821876525879, "global_step": 64515, "epoch": 1536} {"train_loss": -6.021501541137695, "global_step": 64516, "epoch": 1536} {"train_loss": -5.9355316162109375, "global_step": 64517, "epoch": 1536} {"train_loss": -6.0519700050354, "global_step": 64518, "epoch": 1536} {"train_loss": -5.910215377807617, "global_step": 64519, "epoch": 1536} {"train_loss": -6.097856044769287, "global_step": 64520, "epoch": 1536} {"train_loss": -5.929879188537598, "global_step": 64521, "epoch": 1536} {"train_loss": -6.0270562171936035, "global_step": 64522, "epoch": 1536} {"train_loss": -5.812421798706055, "global_step": 64523, "epoch": 1536} {"train_loss": -5.954588413238525, "global_step": 64524, "epoch": 1536} {"train_loss": -6.013222694396973, "global_step": 64525, "epoch": 1536} {"train_loss": -5.894179344177246, "global_step": 64526, "epoch": 1536} {"train_loss": -5.78574275970459, "global_step": 64527, "epoch": 1536} {"train_loss": -6.0734782218933105, "global_step": 64528, "epoch": 1536} {"train_loss": -6.062646865844727, "global_step": 64529, "epoch": 1536} {"train_loss": -6.048025608062744, "global_step": 64530, "epoch": 1536} {"train_loss": -6.0610246658325195, "global_step": 64531, "epoch": 1536} {"train_loss": -6.054831504821777, "global_step": 64532, "epoch": 1536} {"train_loss": -6.003138542175293, "global_step": 64533, "epoch": 1536} {"train_loss": -6.051120758056641, "global_step": 64534, "epoch": 1536} {"train_loss": -6.0515546798706055, "global_step": 64535, "epoch": 1536} {"train_loss": -5.92221736907959, "global_step": 64536, "epoch": 1536} {"train_loss": -6.008728981018066, "global_step": 64537, "epoch": 1536} {"train_loss": -6.062629222869873, "global_step": 64538, "epoch": 1536} {"train_loss": -5.983382225036621, "global_step": 64539, "epoch": 1536} {"train_loss": -5.878721237182617, "global_step": 64540, "epoch": 1536} {"train_loss": -6.096641540527344, "global_step": 64541, "epoch": 1536} {"train_loss": -6.052785873413086, "global_step": 64542, "epoch": 1536} {"train_loss": -5.904240608215332, "global_step": 64543, "epoch": 1536} {"train_loss": -5.955957412719727, "global_step": 64544, "epoch": 1536} {"train_loss": -5.920244216918945, "global_step": 64545, "epoch": 1536} {"train_loss": -5.948880195617676, "global_step": 64546, "epoch": 1536} {"train_loss": -6.0202317237854, "global_step": 64547, "epoch": 1536} {"train_loss": -5.939903259277344, "global_step": 64548, "epoch": 1536} {"train_loss": -5.957068920135498, "global_step": 64549, "epoch": 1536} {"train_loss": -6.002352714538574, "global_step": 64550, "epoch": 1536} {"train_loss": -5.7897515296936035, "global_step": 64551, "epoch": 1536} {"train_loss": -5.951702117919922, "global_step": 64552, "epoch": 1536} {"train_loss": -5.98183840797061, "global_step": 64553, "epoch": 1536, "val_loss": 61678.109375} {"train_loss": -5.9245171546936035, "global_step": 64554, "epoch": 1537} {"train_loss": -5.893368721008301, "global_step": 64555, "epoch": 1537} {"train_loss": -5.883414268493652, "global_step": 64556, "epoch": 1537} {"train_loss": -5.9368510246276855, "global_step": 64557, "epoch": 1537} {"train_loss": -6.0597076416015625, "global_step": 64558, "epoch": 1537} {"train_loss": -5.829641819000244, "global_step": 64559, "epoch": 1537} {"train_loss": -5.807521820068359, "global_step": 64560, "epoch": 1537} {"train_loss": -5.926626205444336, "global_step": 64561, "epoch": 1537} {"train_loss": -5.973454475402832, "global_step": 64562, "epoch": 1537} {"train_loss": -6.019560813903809, "global_step": 64563, "epoch": 1537} {"train_loss": -5.95332145690918, "global_step": 64564, "epoch": 1537} {"train_loss": -5.870963096618652, "global_step": 64565, "epoch": 1537} {"train_loss": -5.924731254577637, "global_step": 64566, "epoch": 1537} {"train_loss": -6.045816898345947, "global_step": 64567, "epoch": 1537} {"train_loss": -5.912106513977051, "global_step": 64568, "epoch": 1537} {"train_loss": -5.965714454650879, "global_step": 64569, "epoch": 1537} {"train_loss": -5.970872402191162, "global_step": 64570, "epoch": 1537} {"train_loss": -5.909483432769775, "global_step": 64571, "epoch": 1537} {"train_loss": -5.858398914337158, "global_step": 64572, "epoch": 1537} {"train_loss": -5.876649379730225, "global_step": 64573, "epoch": 1537} {"train_loss": -5.963839054107666, "global_step": 64574, "epoch": 1537} {"train_loss": -5.966355323791504, "global_step": 64575, "epoch": 1537} {"train_loss": -5.824193954467773, "global_step": 64576, "epoch": 1537} {"train_loss": -6.059080123901367, "global_step": 64577, "epoch": 1537} {"train_loss": -6.065695762634277, "global_step": 64578, "epoch": 1537} {"train_loss": -5.96263313293457, "global_step": 64579, "epoch": 1537} {"train_loss": -5.832064151763916, "global_step": 64580, "epoch": 1537} {"train_loss": -5.970094680786133, "global_step": 64581, "epoch": 1537} {"train_loss": -5.922423839569092, "global_step": 64582, "epoch": 1537} {"train_loss": -6.046469688415527, "global_step": 64583, "epoch": 1537} {"train_loss": -5.959873199462891, "global_step": 64584, "epoch": 1537} {"train_loss": -5.910366535186768, "global_step": 64585, "epoch": 1537} {"train_loss": -6.040733814239502, "global_step": 64586, "epoch": 1537} {"train_loss": -6.011960506439209, "global_step": 64587, "epoch": 1537} {"train_loss": -5.992084503173828, "global_step": 64588, "epoch": 1537} {"train_loss": -5.986612319946289, "global_step": 64589, "epoch": 1537} {"train_loss": -5.8737921714782715, "global_step": 64590, "epoch": 1537} {"train_loss": -6.007157325744629, "global_step": 64591, "epoch": 1537} {"train_loss": -5.980994701385498, "global_step": 64592, "epoch": 1537} {"train_loss": -6.128363609313965, "global_step": 64593, "epoch": 1537} {"train_loss": -6.09913444519043, "global_step": 64594, "epoch": 1537} {"train_loss": -5.9555732522691995, "global_step": 64595, "epoch": 1537, "val_loss": 61261.203125} {"train_loss": -5.891208648681641, "global_step": 64596, "epoch": 1538} {"train_loss": -6.025714874267578, "global_step": 64597, "epoch": 1538} {"train_loss": -5.926861763000488, "global_step": 64598, "epoch": 1538} {"train_loss": -6.043935775756836, "global_step": 64599, "epoch": 1538} {"train_loss": -6.054391860961914, "global_step": 64600, "epoch": 1538} {"train_loss": -5.972265720367432, "global_step": 64601, "epoch": 1538} {"train_loss": -5.993390083312988, "global_step": 64602, "epoch": 1538} {"train_loss": -6.074832439422607, "global_step": 64603, "epoch": 1538} {"train_loss": -5.950554847717285, "global_step": 64604, "epoch": 1538} {"train_loss": -5.956187725067139, "global_step": 64605, "epoch": 1538} {"train_loss": -6.0194573402404785, "global_step": 64606, "epoch": 1538} {"train_loss": -5.9567670822143555, "global_step": 64607, "epoch": 1538} {"train_loss": -5.941464424133301, "global_step": 64608, "epoch": 1538} {"train_loss": -5.920635223388672, "global_step": 64609, "epoch": 1538} {"train_loss": -5.991175651550293, "global_step": 64610, "epoch": 1538} {"train_loss": -5.957213401794434, "global_step": 64611, "epoch": 1538} {"train_loss": -5.9809722900390625, "global_step": 64612, "epoch": 1538} {"train_loss": -5.949810981750488, "global_step": 64613, "epoch": 1538} {"train_loss": -5.964986801147461, "global_step": 64614, "epoch": 1538} {"train_loss": -5.895358085632324, "global_step": 64615, "epoch": 1538} {"train_loss": -5.906313896179199, "global_step": 64616, "epoch": 1538} {"train_loss": -5.976316928863525, "global_step": 64617, "epoch": 1538} {"train_loss": -5.864048480987549, "global_step": 64618, "epoch": 1538} {"train_loss": -5.858720779418945, "global_step": 64619, "epoch": 1538} {"train_loss": -5.985994338989258, "global_step": 64620, "epoch": 1538} {"train_loss": -6.063450336456299, "global_step": 64621, "epoch": 1538} {"train_loss": -5.858546257019043, "global_step": 64622, "epoch": 1538} {"train_loss": -5.937099456787109, "global_step": 64623, "epoch": 1538} {"train_loss": -5.898416519165039, "global_step": 64624, "epoch": 1538} {"train_loss": -6.016911029815674, "global_step": 64625, "epoch": 1538} {"train_loss": -5.898491382598877, "global_step": 64626, "epoch": 1538} {"train_loss": -5.888908386230469, "global_step": 64627, "epoch": 1538} {"train_loss": -5.958932876586914, "global_step": 64628, "epoch": 1538} {"train_loss": -6.035506248474121, "global_step": 64629, "epoch": 1538} {"train_loss": -5.968585968017578, "global_step": 64630, "epoch": 1538} {"train_loss": -5.8591108322143555, "global_step": 64631, "epoch": 1538} {"train_loss": -5.801025867462158, "global_step": 64632, "epoch": 1538} {"train_loss": -5.9298095703125, "global_step": 64633, "epoch": 1538} {"train_loss": -5.900918960571289, "global_step": 64634, "epoch": 1538} {"train_loss": -5.989092826843262, "global_step": 64635, "epoch": 1538} {"train_loss": -5.931766510009766, "global_step": 64636, "epoch": 1538} {"train_loss": -5.948815584182739, "global_step": 64637, "epoch": 1538, "val_loss": 61653.7421875} {"train_loss": -6.1756086349487305, "global_step": 64638, "epoch": 1539} {"train_loss": -5.8472371101379395, "global_step": 64639, "epoch": 1539} {"train_loss": -5.997292995452881, "global_step": 64640, "epoch": 1539} {"train_loss": -5.876243591308594, "global_step": 64641, "epoch": 1539} {"train_loss": -5.916684150695801, "global_step": 64642, "epoch": 1539} {"train_loss": -5.925362586975098, "global_step": 64643, "epoch": 1539} {"train_loss": -5.9145097732543945, "global_step": 64644, "epoch": 1539} {"train_loss": -5.914644241333008, "global_step": 64645, "epoch": 1539} {"train_loss": -6.022866249084473, "global_step": 64646, "epoch": 1539} {"train_loss": -5.93458890914917, "global_step": 64647, "epoch": 1539} {"train_loss": -5.947397232055664, "global_step": 64648, "epoch": 1539} {"train_loss": -5.934916019439697, "global_step": 64649, "epoch": 1539} {"train_loss": -5.871595859527588, "global_step": 64650, "epoch": 1539} {"train_loss": -5.832516193389893, "global_step": 64651, "epoch": 1539} {"train_loss": -5.938253879547119, "global_step": 64652, "epoch": 1539} {"train_loss": -5.795966625213623, "global_step": 64653, "epoch": 1539} {"train_loss": -5.973158836364746, "global_step": 64654, "epoch": 1539} {"train_loss": -6.007540702819824, "global_step": 64655, "epoch": 1539} {"train_loss": -5.903075218200684, "global_step": 64656, "epoch": 1539} {"train_loss": -5.878000259399414, "global_step": 64657, "epoch": 1539} {"train_loss": -5.844191074371338, "global_step": 64658, "epoch": 1539} {"train_loss": -5.99756383895874, "global_step": 64659, "epoch": 1539} {"train_loss": -5.942910194396973, "global_step": 64660, "epoch": 1539} {"train_loss": -5.897692680358887, "global_step": 64661, "epoch": 1539} {"train_loss": -5.963415145874023, "global_step": 64662, "epoch": 1539} {"train_loss": -6.009198188781738, "global_step": 64663, "epoch": 1539} {"train_loss": -6.002585411071777, "global_step": 64664, "epoch": 1539} {"train_loss": -5.972965240478516, "global_step": 64665, "epoch": 1539} {"train_loss": -6.019397258758545, "global_step": 64666, "epoch": 1539} {"train_loss": -6.053039073944092, "global_step": 64667, "epoch": 1539} {"train_loss": -5.935166358947754, "global_step": 64668, "epoch": 1539} {"train_loss": -6.042298316955566, "global_step": 64669, "epoch": 1539} {"train_loss": -5.900903701782227, "global_step": 64670, "epoch": 1539} {"train_loss": -5.929928302764893, "global_step": 64671, "epoch": 1539} {"train_loss": -5.941500663757324, "global_step": 64672, "epoch": 1539} {"train_loss": -5.970296859741211, "global_step": 64673, "epoch": 1539} {"train_loss": -5.975615978240967, "global_step": 64674, "epoch": 1539} {"train_loss": -5.933830261230469, "global_step": 64675, "epoch": 1539} {"train_loss": -6.006254196166992, "global_step": 64676, "epoch": 1539} {"train_loss": -5.924424171447754, "global_step": 64677, "epoch": 1539} {"train_loss": -5.895906448364258, "global_step": 64678, "epoch": 1539} {"train_loss": -5.944896346046811, "global_step": 64679, "epoch": 1539, "val_loss": 61336.203125} {"train_loss": -6.004265785217285, "global_step": 64680, "epoch": 1540} {"train_loss": -5.966378211975098, "global_step": 64681, "epoch": 1540} {"train_loss": -5.800056457519531, "global_step": 64682, "epoch": 1540} {"train_loss": -5.812002182006836, "global_step": 64683, "epoch": 1540} {"train_loss": -5.968414306640625, "global_step": 64684, "epoch": 1540} {"train_loss": -5.984000205993652, "global_step": 64685, "epoch": 1540} {"train_loss": -5.951873779296875, "global_step": 64686, "epoch": 1540} {"train_loss": -5.972546577453613, "global_step": 64687, "epoch": 1540} {"train_loss": -5.884047985076904, "global_step": 64688, "epoch": 1540} {"train_loss": -5.94024658203125, "global_step": 64689, "epoch": 1540} {"train_loss": -5.837575435638428, "global_step": 64690, "epoch": 1540} {"train_loss": -5.818550109863281, "global_step": 64691, "epoch": 1540} {"train_loss": -5.917661666870117, "global_step": 64692, "epoch": 1540} {"train_loss": -5.9622039794921875, "global_step": 64693, "epoch": 1540} {"train_loss": -5.977733135223389, "global_step": 64694, "epoch": 1540} {"train_loss": -5.987806797027588, "global_step": 64695, "epoch": 1540} {"train_loss": -5.917016983032227, "global_step": 64696, "epoch": 1540} {"train_loss": -5.854190826416016, "global_step": 64697, "epoch": 1540} {"train_loss": -5.932730674743652, "global_step": 64698, "epoch": 1540} {"train_loss": -5.988398551940918, "global_step": 64699, "epoch": 1540} {"train_loss": -5.998137474060059, "global_step": 64700, "epoch": 1540} {"train_loss": -5.926910400390625, "global_step": 64701, "epoch": 1540} {"train_loss": -5.952092170715332, "global_step": 64702, "epoch": 1540} {"train_loss": -5.99040412902832, "global_step": 64703, "epoch": 1540} {"train_loss": -5.99738073348999, "global_step": 64704, "epoch": 1540} {"train_loss": -5.90975284576416, "global_step": 64705, "epoch": 1540} {"train_loss": -5.899618148803711, "global_step": 64706, "epoch": 1540} {"train_loss": -5.924530982971191, "global_step": 64707, "epoch": 1540} {"train_loss": -5.99715518951416, "global_step": 64708, "epoch": 1540} {"train_loss": -6.039379596710205, "global_step": 64709, "epoch": 1540} {"train_loss": -5.9078240394592285, "global_step": 64710, "epoch": 1540} {"train_loss": -6.079348564147949, "global_step": 64711, "epoch": 1540} {"train_loss": -5.97315788269043, "global_step": 64712, "epoch": 1540} {"train_loss": -5.9919281005859375, "global_step": 64713, "epoch": 1540} {"train_loss": -5.96619987487793, "global_step": 64714, "epoch": 1540} {"train_loss": -6.02163028717041, "global_step": 64715, "epoch": 1540} {"train_loss": -6.005834102630615, "global_step": 64716, "epoch": 1540} {"train_loss": -6.011756896972656, "global_step": 64717, "epoch": 1540} {"train_loss": -5.795245170593262, "global_step": 64718, "epoch": 1540} {"train_loss": -5.957243919372559, "global_step": 64719, "epoch": 1540} {"train_loss": -5.932346343994141, "global_step": 64720, "epoch": 1540} {"train_loss": -5.943713778541202, "global_step": 64721, "epoch": 1540, "val_loss": 61261.12890625} {"train_loss": -5.92953634262085, "global_step": 64722, "epoch": 1541} {"train_loss": -5.980302810668945, "global_step": 64723, "epoch": 1541} {"train_loss": -5.940509796142578, "global_step": 64724, "epoch": 1541} {"train_loss": -5.9796271324157715, "global_step": 64725, "epoch": 1541} {"train_loss": -5.981390953063965, "global_step": 64726, "epoch": 1541} {"train_loss": -5.901810646057129, "global_step": 64727, "epoch": 1541} {"train_loss": -5.92080020904541, "global_step": 64728, "epoch": 1541} {"train_loss": -5.914936065673828, "global_step": 64729, "epoch": 1541} {"train_loss": -5.98836088180542, "global_step": 64730, "epoch": 1541} {"train_loss": -5.789850234985352, "global_step": 64731, "epoch": 1541} {"train_loss": -5.8888702392578125, "global_step": 64732, "epoch": 1541} {"train_loss": -5.896838188171387, "global_step": 64733, "epoch": 1541} {"train_loss": -5.908380508422852, "global_step": 64734, "epoch": 1541} {"train_loss": -5.982780456542969, "global_step": 64735, "epoch": 1541} {"train_loss": -5.9321770668029785, "global_step": 64736, "epoch": 1541} {"train_loss": -6.099339008331299, "global_step": 64737, "epoch": 1541} {"train_loss": -6.048044204711914, "global_step": 64738, "epoch": 1541} {"train_loss": -5.9706292152404785, "global_step": 64739, "epoch": 1541} {"train_loss": -5.9422383308410645, "global_step": 64740, "epoch": 1541} {"train_loss": -5.980137825012207, "global_step": 64741, "epoch": 1541} {"train_loss": -5.991554260253906, "global_step": 64742, "epoch": 1541} {"train_loss": -5.915740013122559, "global_step": 64743, "epoch": 1541} {"train_loss": -5.977271556854248, "global_step": 64744, "epoch": 1541} {"train_loss": -5.926243782043457, "global_step": 64745, "epoch": 1541} {"train_loss": -6.0130720138549805, "global_step": 64746, "epoch": 1541} {"train_loss": -6.036299705505371, "global_step": 64747, "epoch": 1541} {"train_loss": -5.974976062774658, "global_step": 64748, "epoch": 1541} {"train_loss": -5.970626354217529, "global_step": 64749, "epoch": 1541} {"train_loss": -5.981136322021484, "global_step": 64750, "epoch": 1541} {"train_loss": -5.926928997039795, "global_step": 64751, "epoch": 1541} {"train_loss": -5.881142616271973, "global_step": 64752, "epoch": 1541} {"train_loss": -5.768014907836914, "global_step": 64753, "epoch": 1541} {"train_loss": -5.93742561340332, "global_step": 64754, "epoch": 1541} {"train_loss": -5.938988208770752, "global_step": 64755, "epoch": 1541} {"train_loss": -5.8884429931640625, "global_step": 64756, "epoch": 1541} {"train_loss": -6.027133941650391, "global_step": 64757, "epoch": 1541} {"train_loss": -5.930631637573242, "global_step": 64758, "epoch": 1541} {"train_loss": -5.9871673583984375, "global_step": 64759, "epoch": 1541} {"train_loss": -5.863408088684082, "global_step": 64760, "epoch": 1541} {"train_loss": -5.953957557678223, "global_step": 64761, "epoch": 1541} {"train_loss": -5.961544990539551, "global_step": 64762, "epoch": 1541} {"train_loss": -5.9445944513593405, "global_step": 64763, "epoch": 1541, "val_loss": 61527.3671875} {"train_loss": -6.011629104614258, "global_step": 64764, "epoch": 1542} {"train_loss": -6.007807731628418, "global_step": 64765, "epoch": 1542} {"train_loss": -5.898772239685059, "global_step": 64766, "epoch": 1542} {"train_loss": -6.0631232261657715, "global_step": 64767, "epoch": 1542} {"train_loss": -6.009551525115967, "global_step": 64768, "epoch": 1542} {"train_loss": -5.966317176818848, "global_step": 64769, "epoch": 1542} {"train_loss": -5.931831359863281, "global_step": 64770, "epoch": 1542} {"train_loss": -6.068285942077637, "global_step": 64771, "epoch": 1542} {"train_loss": -5.883823394775391, "global_step": 64772, "epoch": 1542} {"train_loss": -5.971266746520996, "global_step": 64773, "epoch": 1542} {"train_loss": -6.009731292724609, "global_step": 64774, "epoch": 1542} {"train_loss": -6.15958309173584, "global_step": 64775, "epoch": 1542} {"train_loss": -6.0431389808654785, "global_step": 64776, "epoch": 1542} {"train_loss": -6.0356926918029785, "global_step": 64777, "epoch": 1542} {"train_loss": -5.961716175079346, "global_step": 64778, "epoch": 1542} {"train_loss": -6.003483772277832, "global_step": 64779, "epoch": 1542} {"train_loss": -5.906857013702393, "global_step": 64780, "epoch": 1542} {"train_loss": -5.931279182434082, "global_step": 64781, "epoch": 1542} {"train_loss": -5.970054626464844, "global_step": 64782, "epoch": 1542} {"train_loss": -5.905780792236328, "global_step": 64783, "epoch": 1542} {"train_loss": -5.96354341506958, "global_step": 64784, "epoch": 1542} {"train_loss": -6.122052192687988, "global_step": 64785, "epoch": 1542} {"train_loss": -5.864510536193848, "global_step": 64786, "epoch": 1542} {"train_loss": -6.015764236450195, "global_step": 64787, "epoch": 1542} {"train_loss": -6.00962495803833, "global_step": 64788, "epoch": 1542} {"train_loss": -5.772735595703125, "global_step": 64789, "epoch": 1542} {"train_loss": -5.981346130371094, "global_step": 64790, "epoch": 1542} {"train_loss": -5.734387397766113, "global_step": 64791, "epoch": 1542} {"train_loss": -5.890688896179199, "global_step": 64792, "epoch": 1542} {"train_loss": -5.833841323852539, "global_step": 64793, "epoch": 1542} {"train_loss": -5.894238471984863, "global_step": 64794, "epoch": 1542} {"train_loss": -5.905214786529541, "global_step": 64795, "epoch": 1542} {"train_loss": -5.960941314697266, "global_step": 64796, "epoch": 1542} {"train_loss": -5.828597068786621, "global_step": 64797, "epoch": 1542} {"train_loss": -5.933794021606445, "global_step": 64798, "epoch": 1542} {"train_loss": -5.951248645782471, "global_step": 64799, "epoch": 1542} {"train_loss": -5.70554256439209, "global_step": 64800, "epoch": 1542} {"train_loss": -5.84526252746582, "global_step": 64801, "epoch": 1542} {"train_loss": -5.949981212615967, "global_step": 64802, "epoch": 1542} {"train_loss": -5.757855415344238, "global_step": 64803, "epoch": 1542} {"train_loss": -5.926552772521973, "global_step": 64804, "epoch": 1542} {"train_loss": -5.939544053304763, "global_step": 64805, "epoch": 1542, "val_loss": 61744.1875} {"train_loss": -5.90503454208374, "global_step": 64806, "epoch": 1543} {"train_loss": -5.929663181304932, "global_step": 64807, "epoch": 1543} {"train_loss": -5.791869640350342, "global_step": 64808, "epoch": 1543} {"train_loss": -5.87601375579834, "global_step": 64809, "epoch": 1543} {"train_loss": -5.822289943695068, "global_step": 64810, "epoch": 1543} {"train_loss": -6.019868850708008, "global_step": 64811, "epoch": 1543} {"train_loss": -5.946012496948242, "global_step": 64812, "epoch": 1543} {"train_loss": -5.913069725036621, "global_step": 64813, "epoch": 1543} {"train_loss": -5.946976184844971, "global_step": 64814, "epoch": 1543} {"train_loss": -5.924663543701172, "global_step": 64815, "epoch": 1543} {"train_loss": -5.939554214477539, "global_step": 64816, "epoch": 1543} {"train_loss": -6.018918991088867, "global_step": 64817, "epoch": 1543} {"train_loss": -5.920047760009766, "global_step": 64818, "epoch": 1543} {"train_loss": -5.961712837219238, "global_step": 64819, "epoch": 1543} {"train_loss": -5.867233753204346, "global_step": 64820, "epoch": 1543} {"train_loss": -5.992950439453125, "global_step": 64821, "epoch": 1543} {"train_loss": -5.989300727844238, "global_step": 64822, "epoch": 1543} {"train_loss": -5.855421543121338, "global_step": 64823, "epoch": 1543} {"train_loss": -5.936203956604004, "global_step": 64824, "epoch": 1543} {"train_loss": -5.990274429321289, "global_step": 64825, "epoch": 1543} {"train_loss": -6.0077409744262695, "global_step": 64826, "epoch": 1543} {"train_loss": -5.905390739440918, "global_step": 64827, "epoch": 1543} {"train_loss": -6.07432746887207, "global_step": 64828, "epoch": 1543} {"train_loss": -5.954751968383789, "global_step": 64829, "epoch": 1543} {"train_loss": -5.999124526977539, "global_step": 64830, "epoch": 1543} {"train_loss": -6.011954307556152, "global_step": 64831, "epoch": 1543} {"train_loss": -5.947388648986816, "global_step": 64832, "epoch": 1543} {"train_loss": -6.048384666442871, "global_step": 64833, "epoch": 1543} {"train_loss": -5.935174942016602, "global_step": 64834, "epoch": 1543} {"train_loss": -5.926329612731934, "global_step": 64835, "epoch": 1543} {"train_loss": -6.067649841308594, "global_step": 64836, "epoch": 1543} {"train_loss": -5.969890117645264, "global_step": 64837, "epoch": 1543} {"train_loss": -5.955752372741699, "global_step": 64838, "epoch": 1543} {"train_loss": -5.960115909576416, "global_step": 64839, "epoch": 1543} {"train_loss": -6.057619094848633, "global_step": 64840, "epoch": 1543} {"train_loss": -5.8857927322387695, "global_step": 64841, "epoch": 1543} {"train_loss": -6.006539344787598, "global_step": 64842, "epoch": 1543} {"train_loss": -5.91160774230957, "global_step": 64843, "epoch": 1543} {"train_loss": -5.835633277893066, "global_step": 64844, "epoch": 1543} {"train_loss": -5.985893249511719, "global_step": 64845, "epoch": 1543} {"train_loss": -5.963073253631592, "global_step": 64846, "epoch": 1543} {"train_loss": -5.950286626815796, "global_step": 64847, "epoch": 1543, "val_loss": 61407.93359375} {"train_loss": -5.890618324279785, "global_step": 64848, "epoch": 1544} {"train_loss": -5.963163375854492, "global_step": 64849, "epoch": 1544} {"train_loss": -5.948278427124023, "global_step": 64850, "epoch": 1544} {"train_loss": -5.945683002471924, "global_step": 64851, "epoch": 1544} {"train_loss": -5.835247993469238, "global_step": 64852, "epoch": 1544} {"train_loss": -5.925737380981445, "global_step": 64853, "epoch": 1544} {"train_loss": -6.158431053161621, "global_step": 64854, "epoch": 1544} {"train_loss": -5.95236873626709, "global_step": 64855, "epoch": 1544} {"train_loss": -5.969979286193848, "global_step": 64856, "epoch": 1544} {"train_loss": -6.101785659790039, "global_step": 64857, "epoch": 1544} {"train_loss": -6.0005784034729, "global_step": 64858, "epoch": 1544} {"train_loss": -5.977159023284912, "global_step": 64859, "epoch": 1544} {"train_loss": -5.9849772453308105, "global_step": 64860, "epoch": 1544} {"train_loss": -6.055409908294678, "global_step": 64861, "epoch": 1544} {"train_loss": -5.92710018157959, "global_step": 64862, "epoch": 1544} {"train_loss": -6.011668682098389, "global_step": 64863, "epoch": 1544} {"train_loss": -5.93570613861084, "global_step": 64864, "epoch": 1544} {"train_loss": -5.987675666809082, "global_step": 64865, "epoch": 1544} {"train_loss": -5.975135803222656, "global_step": 64866, "epoch": 1544} {"train_loss": -6.013623237609863, "global_step": 64867, "epoch": 1544} {"train_loss": -5.998104572296143, "global_step": 64868, "epoch": 1544} {"train_loss": -5.939100742340088, "global_step": 64869, "epoch": 1544} {"train_loss": -5.9465107917785645, "global_step": 64870, "epoch": 1544} {"train_loss": -5.925765514373779, "global_step": 64871, "epoch": 1544} {"train_loss": -5.969549655914307, "global_step": 64872, "epoch": 1544} {"train_loss": -5.9891533851623535, "global_step": 64873, "epoch": 1544} {"train_loss": -5.886187553405762, "global_step": 64874, "epoch": 1544} {"train_loss": -6.113138198852539, "global_step": 64875, "epoch": 1544} {"train_loss": -5.937665939331055, "global_step": 64876, "epoch": 1544} {"train_loss": -5.85079288482666, "global_step": 64877, "epoch": 1544} {"train_loss": -6.05704927444458, "global_step": 64878, "epoch": 1544} {"train_loss": -5.9674072265625, "global_step": 64879, "epoch": 1544} {"train_loss": -5.954100131988525, "global_step": 64880, "epoch": 1544} {"train_loss": -5.958667755126953, "global_step": 64881, "epoch": 1544} {"train_loss": -5.923737525939941, "global_step": 64882, "epoch": 1544} {"train_loss": -5.9698286056518555, "global_step": 64883, "epoch": 1544} {"train_loss": -6.089136123657227, "global_step": 64884, "epoch": 1544} {"train_loss": -6.104740619659424, "global_step": 64885, "epoch": 1544} {"train_loss": -5.964612007141113, "global_step": 64886, "epoch": 1544} {"train_loss": -5.993083953857422, "global_step": 64887, "epoch": 1544} {"train_loss": -5.978266716003418, "global_step": 64888, "epoch": 1544} {"train_loss": -5.976461512701852, "global_step": 64889, "epoch": 1544, "val_loss": 61433.09375} {"train_loss": -6.033817291259766, "global_step": 64890, "epoch": 1545} {"train_loss": -5.946658611297607, "global_step": 64891, "epoch": 1545} {"train_loss": -6.026971817016602, "global_step": 64892, "epoch": 1545} {"train_loss": -5.943341255187988, "global_step": 64893, "epoch": 1545} {"train_loss": -6.000543594360352, "global_step": 64894, "epoch": 1545} {"train_loss": -5.981524467468262, "global_step": 64895, "epoch": 1545} {"train_loss": -6.060999870300293, "global_step": 64896, "epoch": 1545} {"train_loss": -5.935184955596924, "global_step": 64897, "epoch": 1545} {"train_loss": -5.881695747375488, "global_step": 64898, "epoch": 1545} {"train_loss": -5.970586776733398, "global_step": 64899, "epoch": 1545} {"train_loss": -5.938940048217773, "global_step": 64900, "epoch": 1545} {"train_loss": -5.907824993133545, "global_step": 64901, "epoch": 1545} {"train_loss": -5.9895734786987305, "global_step": 64902, "epoch": 1545} {"train_loss": -5.9731550216674805, "global_step": 64903, "epoch": 1545} {"train_loss": -6.079346656799316, "global_step": 64904, "epoch": 1545} {"train_loss": -5.980478286743164, "global_step": 64905, "epoch": 1545} {"train_loss": -5.928286075592041, "global_step": 64906, "epoch": 1545} {"train_loss": -5.965545654296875, "global_step": 64907, "epoch": 1545} {"train_loss": -6.029275894165039, "global_step": 64908, "epoch": 1545} {"train_loss": -5.972521781921387, "global_step": 64909, "epoch": 1545} {"train_loss": -5.936352729797363, "global_step": 64910, "epoch": 1545} {"train_loss": -6.039320468902588, "global_step": 64911, "epoch": 1545} {"train_loss": -6.005411148071289, "global_step": 64912, "epoch": 1545} {"train_loss": -5.969791889190674, "global_step": 64913, "epoch": 1545} {"train_loss": -5.917270183563232, "global_step": 64914, "epoch": 1545} {"train_loss": -5.953190803527832, "global_step": 64915, "epoch": 1545} {"train_loss": -5.985256195068359, "global_step": 64916, "epoch": 1545} {"train_loss": -5.902977466583252, "global_step": 64917, "epoch": 1545} {"train_loss": -5.92137336730957, "global_step": 64918, "epoch": 1545} {"train_loss": -5.971770763397217, "global_step": 64919, "epoch": 1545} {"train_loss": -5.834146499633789, "global_step": 64920, "epoch": 1545} {"train_loss": -6.038629531860352, "global_step": 64921, "epoch": 1545} {"train_loss": -5.993566513061523, "global_step": 64922, "epoch": 1545} {"train_loss": -5.956263065338135, "global_step": 64923, "epoch": 1545} {"train_loss": -5.934134483337402, "global_step": 64924, "epoch": 1545} {"train_loss": -5.901116371154785, "global_step": 64925, "epoch": 1545} {"train_loss": -5.915365219116211, "global_step": 64926, "epoch": 1545} {"train_loss": -6.076591491699219, "global_step": 64927, "epoch": 1545} {"train_loss": -5.955969333648682, "global_step": 64928, "epoch": 1545} {"train_loss": -5.975747108459473, "global_step": 64929, "epoch": 1545} {"train_loss": -5.79944372177124, "global_step": 64930, "epoch": 1545} {"train_loss": -5.966937803086781, "global_step": 64931, "epoch": 1545, "val_loss": 61462.21875} {"train_loss": -5.966498374938965, "global_step": 64932, "epoch": 1546} {"train_loss": -5.862246036529541, "global_step": 64933, "epoch": 1546} {"train_loss": -6.075974464416504, "global_step": 64934, "epoch": 1546} {"train_loss": -5.887690544128418, "global_step": 64935, "epoch": 1546} {"train_loss": -6.022146224975586, "global_step": 64936, "epoch": 1546} {"train_loss": -6.024302959442139, "global_step": 64937, "epoch": 1546} {"train_loss": -5.943938255310059, "global_step": 64938, "epoch": 1546} {"train_loss": -5.990328311920166, "global_step": 64939, "epoch": 1546} {"train_loss": -5.976283073425293, "global_step": 64940, "epoch": 1546} {"train_loss": -6.027037620544434, "global_step": 64941, "epoch": 1546} {"train_loss": -5.943999290466309, "global_step": 64942, "epoch": 1546} {"train_loss": -6.038114547729492, "global_step": 64943, "epoch": 1546} {"train_loss": -5.888351917266846, "global_step": 64944, "epoch": 1546} {"train_loss": -6.016171455383301, "global_step": 64945, "epoch": 1546} {"train_loss": -5.867018222808838, "global_step": 64946, "epoch": 1546} {"train_loss": -6.116029739379883, "global_step": 64947, "epoch": 1546} {"train_loss": -5.926620006561279, "global_step": 64948, "epoch": 1546} {"train_loss": -5.951569557189941, "global_step": 64949, "epoch": 1546} {"train_loss": -6.05781888961792, "global_step": 64950, "epoch": 1546} {"train_loss": -5.908646106719971, "global_step": 64951, "epoch": 1546} {"train_loss": -6.0668182373046875, "global_step": 64952, "epoch": 1546} {"train_loss": -5.958920478820801, "global_step": 64953, "epoch": 1546} {"train_loss": -5.9334564208984375, "global_step": 64954, "epoch": 1546} {"train_loss": -6.057981967926025, "global_step": 64955, "epoch": 1546} {"train_loss": -6.089143753051758, "global_step": 64956, "epoch": 1546} {"train_loss": -6.071115016937256, "global_step": 64957, "epoch": 1546} {"train_loss": -6.100387096405029, "global_step": 64958, "epoch": 1546} {"train_loss": -6.086623191833496, "global_step": 64959, "epoch": 1546} {"train_loss": -6.115006446838379, "global_step": 64960, "epoch": 1546} {"train_loss": -6.025201797485352, "global_step": 64961, "epoch": 1546} {"train_loss": -6.0973405838012695, "global_step": 64962, "epoch": 1546} {"train_loss": -5.895390510559082, "global_step": 64963, "epoch": 1546} {"train_loss": -5.839533805847168, "global_step": 64964, "epoch": 1546} {"train_loss": -6.057596683502197, "global_step": 64965, "epoch": 1546} {"train_loss": -5.902887344360352, "global_step": 64966, "epoch": 1546} {"train_loss": -5.865079879760742, "global_step": 64967, "epoch": 1546} {"train_loss": -5.972999572753906, "global_step": 64968, "epoch": 1546} {"train_loss": -5.906305313110352, "global_step": 64969, "epoch": 1546} {"train_loss": -5.960011005401611, "global_step": 64970, "epoch": 1546} {"train_loss": -5.930408000946045, "global_step": 64971, "epoch": 1546} {"train_loss": -5.927076816558838, "global_step": 64972, "epoch": 1546} {"train_loss": -5.9847179253896075, "global_step": 64973, "epoch": 1546, "val_loss": 61406.75390625} {"train_loss": -6.019643306732178, "global_step": 64974, "epoch": 1547} {"train_loss": -5.888664245605469, "global_step": 64975, "epoch": 1547} {"train_loss": -6.036243438720703, "global_step": 64976, "epoch": 1547} {"train_loss": -5.944029331207275, "global_step": 64977, "epoch": 1547} {"train_loss": -5.936347007751465, "global_step": 64978, "epoch": 1547} {"train_loss": -6.015903472900391, "global_step": 64979, "epoch": 1547} {"train_loss": -5.971570014953613, "global_step": 64980, "epoch": 1547} {"train_loss": -5.951925754547119, "global_step": 64981, "epoch": 1547} {"train_loss": -5.8665571212768555, "global_step": 64982, "epoch": 1547} {"train_loss": -5.989508628845215, "global_step": 64983, "epoch": 1547} {"train_loss": -6.091883182525635, "global_step": 64984, "epoch": 1547} {"train_loss": -5.9524455070495605, "global_step": 64985, "epoch": 1547} {"train_loss": -6.066253185272217, "global_step": 64986, "epoch": 1547} {"train_loss": -5.9696478843688965, "global_step": 64987, "epoch": 1547} {"train_loss": -6.009909152984619, "global_step": 64988, "epoch": 1547} {"train_loss": -5.925996780395508, "global_step": 64989, "epoch": 1547} {"train_loss": -5.865523815155029, "global_step": 64990, "epoch": 1547} {"train_loss": -5.941590309143066, "global_step": 64991, "epoch": 1547} {"train_loss": -5.90819787979126, "global_step": 64992, "epoch": 1547} {"train_loss": -5.864166736602783, "global_step": 64993, "epoch": 1547} {"train_loss": -6.029869556427002, "global_step": 64994, "epoch": 1547} {"train_loss": -5.832917213439941, "global_step": 64995, "epoch": 1547} {"train_loss": -6.028679370880127, "global_step": 64996, "epoch": 1547} {"train_loss": -6.057339668273926, "global_step": 64997, "epoch": 1547} {"train_loss": -5.969473838806152, "global_step": 64998, "epoch": 1547} {"train_loss": -5.945168495178223, "global_step": 64999, "epoch": 1547} {"train_loss": -5.910370826721191, "global_step": 65000, "epoch": 1547} {"train_loss": -5.899897575378418, "global_step": 65001, "epoch": 1547} {"train_loss": -6.025331497192383, "global_step": 65002, "epoch": 1547} {"train_loss": -6.025802135467529, "global_step": 65003, "epoch": 1547} {"train_loss": -5.822595119476318, "global_step": 65004, "epoch": 1547} {"train_loss": -6.094250202178955, "global_step": 65005, "epoch": 1547} {"train_loss": -5.873429775238037, "global_step": 65006, "epoch": 1547} {"train_loss": -5.8941650390625, "global_step": 65007, "epoch": 1547} {"train_loss": -5.987084865570068, "global_step": 65008, "epoch": 1547} {"train_loss": -6.015250205993652, "global_step": 65009, "epoch": 1547} {"train_loss": -5.955822944641113, "global_step": 65010, "epoch": 1547} {"train_loss": -5.88066291809082, "global_step": 65011, "epoch": 1547} {"train_loss": -5.985245704650879, "global_step": 65012, "epoch": 1547} {"train_loss": -5.84620475769043, "global_step": 65013, "epoch": 1547} {"train_loss": -5.890413284301758, "global_step": 65014, "epoch": 1547} {"train_loss": -5.957461743127732, "global_step": 65015, "epoch": 1547, "val_loss": 61397.54296875} {"train_loss": -5.886689186096191, "global_step": 65016, "epoch": 1548} {"train_loss": -6.010244846343994, "global_step": 65017, "epoch": 1548} {"train_loss": -5.949772357940674, "global_step": 65018, "epoch": 1548} {"train_loss": -5.910399436950684, "global_step": 65019, "epoch": 1548} {"train_loss": -5.998093605041504, "global_step": 65020, "epoch": 1548} {"train_loss": -5.956272125244141, "global_step": 65021, "epoch": 1548} {"train_loss": -5.918290615081787, "global_step": 65022, "epoch": 1548} {"train_loss": -5.873903751373291, "global_step": 65023, "epoch": 1548} {"train_loss": -5.946590423583984, "global_step": 65024, "epoch": 1548} {"train_loss": -6.036666393280029, "global_step": 65025, "epoch": 1548} {"train_loss": -5.98684024810791, "global_step": 65026, "epoch": 1548} {"train_loss": -5.965946197509766, "global_step": 65027, "epoch": 1548} {"train_loss": -6.09182596206665, "global_step": 65028, "epoch": 1548} {"train_loss": -5.8792595863342285, "global_step": 65029, "epoch": 1548} {"train_loss": -5.922818660736084, "global_step": 65030, "epoch": 1548} {"train_loss": -6.047097206115723, "global_step": 65031, "epoch": 1548} {"train_loss": -5.920129776000977, "global_step": 65032, "epoch": 1548} {"train_loss": -6.034583568572998, "global_step": 65033, "epoch": 1548} {"train_loss": -5.886369705200195, "global_step": 65034, "epoch": 1548} {"train_loss": -5.824462890625, "global_step": 65035, "epoch": 1548} {"train_loss": -5.891419887542725, "global_step": 65036, "epoch": 1548} {"train_loss": -5.906075954437256, "global_step": 65037, "epoch": 1548} {"train_loss": -5.897782325744629, "global_step": 65038, "epoch": 1548} {"train_loss": -5.940040588378906, "global_step": 65039, "epoch": 1548} {"train_loss": -5.946160316467285, "global_step": 65040, "epoch": 1548} {"train_loss": -5.994924545288086, "global_step": 65041, "epoch": 1548} {"train_loss": -6.004118919372559, "global_step": 65042, "epoch": 1548} {"train_loss": -5.99119758605957, "global_step": 65043, "epoch": 1548} {"train_loss": -5.976537227630615, "global_step": 65044, "epoch": 1548} {"train_loss": -5.87085485458374, "global_step": 65045, "epoch": 1548} {"train_loss": -5.986996650695801, "global_step": 65046, "epoch": 1548} {"train_loss": -5.911697864532471, "global_step": 65047, "epoch": 1548} {"train_loss": -6.130687236785889, "global_step": 65048, "epoch": 1548} {"train_loss": -5.837131977081299, "global_step": 65049, "epoch": 1548} {"train_loss": -5.87106990814209, "global_step": 65050, "epoch": 1548} {"train_loss": -6.015357971191406, "global_step": 65051, "epoch": 1548} {"train_loss": -5.936216354370117, "global_step": 65052, "epoch": 1548} {"train_loss": -5.918496131896973, "global_step": 65053, "epoch": 1548} {"train_loss": -6.0826416015625, "global_step": 65054, "epoch": 1548} {"train_loss": -6.024918079376221, "global_step": 65055, "epoch": 1548} {"train_loss": -5.995204925537109, "global_step": 65056, "epoch": 1548} {"train_loss": -5.956704060236613, "global_step": 65057, "epoch": 1548, "val_loss": 61222.13671875} {"train_loss": -5.933559417724609, "global_step": 65058, "epoch": 1549} {"train_loss": -5.917128086090088, "global_step": 65059, "epoch": 1549} {"train_loss": -6.088798999786377, "global_step": 65060, "epoch": 1549} {"train_loss": -5.880507469177246, "global_step": 65061, "epoch": 1549} {"train_loss": -6.004121780395508, "global_step": 65062, "epoch": 1549} {"train_loss": -6.005688667297363, "global_step": 65063, "epoch": 1549} {"train_loss": -6.000189781188965, "global_step": 65064, "epoch": 1549} {"train_loss": -6.030316352844238, "global_step": 65065, "epoch": 1549} {"train_loss": -6.005518913269043, "global_step": 65066, "epoch": 1549} {"train_loss": -5.944515228271484, "global_step": 65067, "epoch": 1549} {"train_loss": -6.105195045471191, "global_step": 65068, "epoch": 1549} {"train_loss": -5.970103740692139, "global_step": 65069, "epoch": 1549} {"train_loss": -5.980924606323242, "global_step": 65070, "epoch": 1549} {"train_loss": -5.965381622314453, "global_step": 65071, "epoch": 1549} {"train_loss": -6.053650379180908, "global_step": 65072, "epoch": 1549} {"train_loss": -5.971173286437988, "global_step": 65073, "epoch": 1549} {"train_loss": -5.97213077545166, "global_step": 65074, "epoch": 1549} {"train_loss": -5.952121257781982, "global_step": 65075, "epoch": 1549} {"train_loss": -6.0031585693359375, "global_step": 65076, "epoch": 1549} {"train_loss": -6.063167572021484, "global_step": 65077, "epoch": 1549} {"train_loss": -6.030880928039551, "global_step": 65078, "epoch": 1549} {"train_loss": -5.962436676025391, "global_step": 65079, "epoch": 1549} {"train_loss": -6.039148330688477, "global_step": 65080, "epoch": 1549} {"train_loss": -5.985790252685547, "global_step": 65081, "epoch": 1549} {"train_loss": -5.747037887573242, "global_step": 65082, "epoch": 1549} {"train_loss": -5.993600368499756, "global_step": 65083, "epoch": 1549} {"train_loss": -6.071920394897461, "global_step": 65084, "epoch": 1549} {"train_loss": -5.863412380218506, "global_step": 65085, "epoch": 1549} {"train_loss": -5.99263858795166, "global_step": 65086, "epoch": 1549} {"train_loss": -6.023492813110352, "global_step": 65087, "epoch": 1549} {"train_loss": -6.015779972076416, "global_step": 65088, "epoch": 1549} {"train_loss": -6.038243293762207, "global_step": 65089, "epoch": 1549} {"train_loss": -6.018462657928467, "global_step": 65090, "epoch": 1549} {"train_loss": -5.96370792388916, "global_step": 65091, "epoch": 1549} {"train_loss": -6.048788547515869, "global_step": 65092, "epoch": 1549} {"train_loss": -5.913211345672607, "global_step": 65093, "epoch": 1549} {"train_loss": -5.902807712554932, "global_step": 65094, "epoch": 1549} {"train_loss": -6.033401012420654, "global_step": 65095, "epoch": 1549} {"train_loss": -6.00160551071167, "global_step": 65096, "epoch": 1549} {"train_loss": -5.949322700500488, "global_step": 65097, "epoch": 1549} {"train_loss": -5.9654541015625, "global_step": 65098, "epoch": 1549} {"train_loss": -5.986408971604847, "global_step": 65099, "epoch": 1549, "val_loss": 61515.9140625} {"train_loss": -5.919787406921387, "global_step": 65100, "epoch": 1550} {"train_loss": -6.098349571228027, "global_step": 65101, "epoch": 1550} {"train_loss": -6.039645671844482, "global_step": 65102, "epoch": 1550} {"train_loss": -6.093601226806641, "global_step": 65103, "epoch": 1550} {"train_loss": -5.929635047912598, "global_step": 65104, "epoch": 1550} {"train_loss": -6.099789142608643, "global_step": 65105, "epoch": 1550} {"train_loss": -6.088423728942871, "global_step": 65106, "epoch": 1550} {"train_loss": -5.985424995422363, "global_step": 65107, "epoch": 1550} {"train_loss": -6.033775329589844, "global_step": 65108, "epoch": 1550} {"train_loss": -5.869616508483887, "global_step": 65109, "epoch": 1550} {"train_loss": -5.87330436706543, "global_step": 65110, "epoch": 1550} {"train_loss": -6.0714111328125, "global_step": 65111, "epoch": 1550} {"train_loss": -5.924623966217041, "global_step": 65112, "epoch": 1550} {"train_loss": -5.852715969085693, "global_step": 65113, "epoch": 1550} {"train_loss": -6.106175422668457, "global_step": 65114, "epoch": 1550} {"train_loss": -5.89060640335083, "global_step": 65115, "epoch": 1550} {"train_loss": -5.83720064163208, "global_step": 65116, "epoch": 1550} {"train_loss": -5.939380645751953, "global_step": 65117, "epoch": 1550} {"train_loss": -5.833404064178467, "global_step": 65118, "epoch": 1550} {"train_loss": -5.916196346282959, "global_step": 65119, "epoch": 1550} {"train_loss": -6.045502662658691, "global_step": 65120, "epoch": 1550} {"train_loss": -5.89553689956665, "global_step": 65121, "epoch": 1550} {"train_loss": -6.020432472229004, "global_step": 65122, "epoch": 1550} {"train_loss": -5.898922920227051, "global_step": 65123, "epoch": 1550} {"train_loss": -6.018573760986328, "global_step": 65124, "epoch": 1550} {"train_loss": -5.985945224761963, "global_step": 65125, "epoch": 1550} {"train_loss": -5.937762260437012, "global_step": 65126, "epoch": 1550} {"train_loss": -6.020479202270508, "global_step": 65127, "epoch": 1550} {"train_loss": -5.958881855010986, "global_step": 65128, "epoch": 1550} {"train_loss": -5.850410461425781, "global_step": 65129, "epoch": 1550} {"train_loss": -5.896224498748779, "global_step": 65130, "epoch": 1550} {"train_loss": -5.96522855758667, "global_step": 65131, "epoch": 1550} {"train_loss": -5.839691162109375, "global_step": 65132, "epoch": 1550} {"train_loss": -5.947856903076172, "global_step": 65133, "epoch": 1550} {"train_loss": -5.863954544067383, "global_step": 65134, "epoch": 1550} {"train_loss": -5.927701950073242, "global_step": 65135, "epoch": 1550} {"train_loss": -5.924712181091309, "global_step": 65136, "epoch": 1550} {"train_loss": -5.881304740905762, "global_step": 65137, "epoch": 1550} {"train_loss": -5.872451305389404, "global_step": 65138, "epoch": 1550} {"train_loss": -5.999849319458008, "global_step": 65139, "epoch": 1550} {"train_loss": -5.967209815979004, "global_step": 65140, "epoch": 1550} {"train_loss": -5.952568190438407, "global_step": 65141, "epoch": 1550, "train/sim_max_reward_0": 0.9129038525243296, "train/sim_max_reward_1": 0.207758746665346, "train/sim_max_reward_2": 0.6637943580269555, "train/sim_max_reward_3": 0.42435364777856127, "train/sim_max_reward_4": 0.8038640306497006, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.03460449895889544, "test/sim_max_reward_4300001": 0.41996954540594306, "test/sim_max_reward_4300002": 0.9791948575217602, "test/sim_max_reward_4300003": 0.7431013347739713, "test/sim_max_reward_4300004": 0.11746710685292379, "test/sim_max_reward_4300005": 0.8093416742455313, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.32756136446210116, "test/sim_max_reward_4300008": 0.9543797849401416, "test/sim_max_reward_4300009": 0.6492543953468387, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.2783026702252576, "test/sim_max_reward_4300012": 0.42396930465892624, "test/sim_max_reward_4300013": 0.4070645615595594, "test/sim_max_reward_4300014": 0.9268032675853629, "test/sim_max_reward_4300015": 0.2628014928820001, "test/sim_max_reward_4300016": 0.6112867696112736, "test/sim_max_reward_4300017": 0.7226675226374398, "test/sim_max_reward_4300018": 0.32947354858708716, "test/sim_max_reward_4300019": 0.18495192641089753, "test/sim_max_reward_4300020": 0.9450370912900478, "test/sim_max_reward_4300021": 0.9312323013091649, "test/sim_max_reward_4300022": 0.7264875239461163, "test/sim_max_reward_4300023": 0.335927447950123, "test/sim_max_reward_4300024": 0.42878012569874285, "test/sim_max_reward_4300025": 0.7446411882448629, "test/sim_max_reward_4300026": 0.8910279713323168, "test/sim_max_reward_4300027": 0.8614850705069806, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.05708011330199215, "test/sim_max_reward_4300030": 0.2158513658689002, "test/sim_max_reward_4300031": 0.08718068661420339, "test/sim_max_reward_4300032": 0.8536939455979102, "test/sim_max_reward_4300033": 0.9384000457271496, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.19957623108273573, "test/sim_max_reward_4300037": 0.5821384204588322, "test/sim_max_reward_4300038": 0.5459243599977411, "test/sim_max_reward_4300039": 0.6462161028218322, "test/sim_max_reward_4300040": 0.7153750380860532, "test/sim_max_reward_4300041": 0.8080993339205065, "test/sim_max_reward_4300042": 0.5298689619816487, "test/sim_max_reward_4300043": 0.11698135616871097, "test/sim_max_reward_4300044": 0.8276204189329938, "test/sim_max_reward_4300045": 0.9308734070623572, "test/sim_max_reward_4300046": 0.9472773561785457, "test/sim_max_reward_4300047": 0.17085263002626358, "test/sim_max_reward_4300048": 0.9813708807389132, "test/sim_max_reward_4300049": 0.6247750150783262, "train/mean_score": 0.5342765658345133, "test/mean_score": 0.5165194003317977, "val_loss": 61662.9375} {"train_loss": -5.970224857330322, "global_step": 65142, "epoch": 1551} {"train_loss": -5.9096784591674805, "global_step": 65143, "epoch": 1551} {"train_loss": -5.996465682983398, "global_step": 65144, "epoch": 1551} {"train_loss": -5.9271135330200195, "global_step": 65145, "epoch": 1551} {"train_loss": -5.909374237060547, "global_step": 65146, "epoch": 1551} {"train_loss": -5.933340549468994, "global_step": 65147, "epoch": 1551} {"train_loss": -6.053851127624512, "global_step": 65148, "epoch": 1551} {"train_loss": -5.890566825866699, "global_step": 65149, "epoch": 1551} {"train_loss": -6.098348617553711, "global_step": 65150, "epoch": 1551} {"train_loss": -5.930181503295898, "global_step": 65151, "epoch": 1551} {"train_loss": -5.951143264770508, "global_step": 65152, "epoch": 1551} {"train_loss": -6.14607048034668, "global_step": 65153, "epoch": 1551} {"train_loss": -6.140945911407471, "global_step": 65154, "epoch": 1551} {"train_loss": -5.888213157653809, "global_step": 65155, "epoch": 1551} {"train_loss": -6.013189315795898, "global_step": 65156, "epoch": 1551} {"train_loss": -5.960398197174072, "global_step": 65157, "epoch": 1551} {"train_loss": -6.069228172302246, "global_step": 65158, "epoch": 1551} {"train_loss": -6.022463798522949, "global_step": 65159, "epoch": 1551} {"train_loss": -6.126705169677734, "global_step": 65160, "epoch": 1551} {"train_loss": -6.005720615386963, "global_step": 65161, "epoch": 1551} {"train_loss": -5.960095405578613, "global_step": 65162, "epoch": 1551} {"train_loss": -5.979508399963379, "global_step": 65163, "epoch": 1551} {"train_loss": -6.0547895431518555, "global_step": 65164, "epoch": 1551} {"train_loss": -5.96474027633667, "global_step": 65165, "epoch": 1551} {"train_loss": -5.960012912750244, "global_step": 65166, "epoch": 1551} {"train_loss": -5.94686222076416, "global_step": 65167, "epoch": 1551} {"train_loss": -6.026346206665039, "global_step": 65168, "epoch": 1551} {"train_loss": -6.057260036468506, "global_step": 65169, "epoch": 1551} {"train_loss": -5.947321891784668, "global_step": 65170, "epoch": 1551} {"train_loss": -5.900987148284912, "global_step": 65171, "epoch": 1551} {"train_loss": -5.978490829467773, "global_step": 65172, "epoch": 1551} {"train_loss": -5.954615116119385, "global_step": 65173, "epoch": 1551} {"train_loss": -6.0259904861450195, "global_step": 65174, "epoch": 1551} {"train_loss": -6.001001834869385, "global_step": 65175, "epoch": 1551} {"train_loss": -5.90792989730835, "global_step": 65176, "epoch": 1551} {"train_loss": -5.9772467613220215, "global_step": 65177, "epoch": 1551} {"train_loss": -5.949617862701416, "global_step": 65178, "epoch": 1551} {"train_loss": -5.885339736938477, "global_step": 65179, "epoch": 1551} {"train_loss": -5.994050025939941, "global_step": 65180, "epoch": 1551} {"train_loss": -5.900077819824219, "global_step": 65181, "epoch": 1551} {"train_loss": -5.907767295837402, "global_step": 65182, "epoch": 1551} {"train_loss": -5.981724035172236, "global_step": 65183, "epoch": 1551, "val_loss": 61410.453125} {"train_loss": -6.017889022827148, "global_step": 65184, "epoch": 1552} {"train_loss": -6.018428325653076, "global_step": 65185, "epoch": 1552} {"train_loss": -5.922307014465332, "global_step": 65186, "epoch": 1552} {"train_loss": -5.943091869354248, "global_step": 65187, "epoch": 1552} {"train_loss": -6.081303119659424, "global_step": 65188, "epoch": 1552} {"train_loss": -5.956891059875488, "global_step": 65189, "epoch": 1552} {"train_loss": -5.867737293243408, "global_step": 65190, "epoch": 1552} {"train_loss": -5.918277740478516, "global_step": 65191, "epoch": 1552} {"train_loss": -6.006821632385254, "global_step": 65192, "epoch": 1552} {"train_loss": -5.984466075897217, "global_step": 65193, "epoch": 1552} {"train_loss": -5.964200019836426, "global_step": 65194, "epoch": 1552} {"train_loss": -5.9549455642700195, "global_step": 65195, "epoch": 1552} {"train_loss": -6.105854511260986, "global_step": 65196, "epoch": 1552} {"train_loss": -6.017746925354004, "global_step": 65197, "epoch": 1552} {"train_loss": -6.03999662399292, "global_step": 65198, "epoch": 1552} {"train_loss": -6.029892921447754, "global_step": 65199, "epoch": 1552} {"train_loss": -5.888915538787842, "global_step": 65200, "epoch": 1552} {"train_loss": -5.908492088317871, "global_step": 65201, "epoch": 1552} {"train_loss": -5.972344398498535, "global_step": 65202, "epoch": 1552} {"train_loss": -6.045420169830322, "global_step": 65203, "epoch": 1552} {"train_loss": -5.883549690246582, "global_step": 65204, "epoch": 1552} {"train_loss": -5.939892768859863, "global_step": 65205, "epoch": 1552} {"train_loss": -5.927355766296387, "global_step": 65206, "epoch": 1552} {"train_loss": -5.930669784545898, "global_step": 65207, "epoch": 1552} {"train_loss": -5.97585391998291, "global_step": 65208, "epoch": 1552} {"train_loss": -5.944219589233398, "global_step": 65209, "epoch": 1552} {"train_loss": -6.124863147735596, "global_step": 65210, "epoch": 1552} {"train_loss": -5.85244083404541, "global_step": 65211, "epoch": 1552} {"train_loss": -5.978554725646973, "global_step": 65212, "epoch": 1552} {"train_loss": -5.981784820556641, "global_step": 65213, "epoch": 1552} {"train_loss": -6.058734893798828, "global_step": 65214, "epoch": 1552} {"train_loss": -5.990540027618408, "global_step": 65215, "epoch": 1552} {"train_loss": -6.000369071960449, "global_step": 65216, "epoch": 1552} {"train_loss": -5.982755661010742, "global_step": 65217, "epoch": 1552} {"train_loss": -5.860661506652832, "global_step": 65218, "epoch": 1552} {"train_loss": -5.863788604736328, "global_step": 65219, "epoch": 1552} {"train_loss": -6.0143632888793945, "global_step": 65220, "epoch": 1552} {"train_loss": -5.972570419311523, "global_step": 65221, "epoch": 1552} {"train_loss": -5.940335750579834, "global_step": 65222, "epoch": 1552} {"train_loss": -6.050113677978516, "global_step": 65223, "epoch": 1552} {"train_loss": -5.712087631225586, "global_step": 65224, "epoch": 1552} {"train_loss": -5.968436184383574, "global_step": 65225, "epoch": 1552, "val_loss": 61798.39453125} {"train_loss": -5.841317176818848, "global_step": 65226, "epoch": 1553} {"train_loss": -5.87980318069458, "global_step": 65227, "epoch": 1553} {"train_loss": -5.982645034790039, "global_step": 65228, "epoch": 1553} {"train_loss": -5.867829322814941, "global_step": 65229, "epoch": 1553} {"train_loss": -5.968257904052734, "global_step": 65230, "epoch": 1553} {"train_loss": -5.910930633544922, "global_step": 65231, "epoch": 1553} {"train_loss": -5.828208923339844, "global_step": 65232, "epoch": 1553} {"train_loss": -5.961956024169922, "global_step": 65233, "epoch": 1553} {"train_loss": -5.881059169769287, "global_step": 65234, "epoch": 1553} {"train_loss": -5.945671081542969, "global_step": 65235, "epoch": 1553} {"train_loss": -6.010025501251221, "global_step": 65236, "epoch": 1553} {"train_loss": -5.971729278564453, "global_step": 65237, "epoch": 1553} {"train_loss": -5.882943153381348, "global_step": 65238, "epoch": 1553} {"train_loss": -6.051886081695557, "global_step": 65239, "epoch": 1553} {"train_loss": -5.855341911315918, "global_step": 65240, "epoch": 1553} {"train_loss": -5.979506492614746, "global_step": 65241, "epoch": 1553} {"train_loss": -5.88608980178833, "global_step": 65242, "epoch": 1553} {"train_loss": -5.898433208465576, "global_step": 65243, "epoch": 1553} {"train_loss": -5.9784440994262695, "global_step": 65244, "epoch": 1553} {"train_loss": -5.964266777038574, "global_step": 65245, "epoch": 1553} {"train_loss": -5.857029914855957, "global_step": 65246, "epoch": 1553} {"train_loss": -5.974968433380127, "global_step": 65247, "epoch": 1553} {"train_loss": -5.973348617553711, "global_step": 65248, "epoch": 1553} {"train_loss": -5.9958648681640625, "global_step": 65249, "epoch": 1553} {"train_loss": -6.036316871643066, "global_step": 65250, "epoch": 1553} {"train_loss": -5.861999988555908, "global_step": 65251, "epoch": 1553} {"train_loss": -6.027254104614258, "global_step": 65252, "epoch": 1553} {"train_loss": -5.878108978271484, "global_step": 65253, "epoch": 1553} {"train_loss": -5.9595136642456055, "global_step": 65254, "epoch": 1553} {"train_loss": -5.9616546630859375, "global_step": 65255, "epoch": 1553} {"train_loss": -5.960784912109375, "global_step": 65256, "epoch": 1553} {"train_loss": -5.911533355712891, "global_step": 65257, "epoch": 1553} {"train_loss": -5.984082221984863, "global_step": 65258, "epoch": 1553} {"train_loss": -5.954258918762207, "global_step": 65259, "epoch": 1553} {"train_loss": -6.06585693359375, "global_step": 65260, "epoch": 1553} {"train_loss": -5.937967777252197, "global_step": 65261, "epoch": 1553} {"train_loss": -5.942617416381836, "global_step": 65262, "epoch": 1553} {"train_loss": -6.019495964050293, "global_step": 65263, "epoch": 1553} {"train_loss": -5.894914150238037, "global_step": 65264, "epoch": 1553} {"train_loss": -5.896932601928711, "global_step": 65265, "epoch": 1553} {"train_loss": -6.093341827392578, "global_step": 65266, "epoch": 1553} {"train_loss": -5.944646755854289, "global_step": 65267, "epoch": 1553, "val_loss": 61578.13671875} {"train_loss": -6.023362159729004, "global_step": 65268, "epoch": 1554} {"train_loss": -5.926316738128662, "global_step": 65269, "epoch": 1554} {"train_loss": -5.999752044677734, "global_step": 65270, "epoch": 1554} {"train_loss": -6.079477310180664, "global_step": 65271, "epoch": 1554} {"train_loss": -5.9264044761657715, "global_step": 65272, "epoch": 1554} {"train_loss": -6.168197154998779, "global_step": 65273, "epoch": 1554} {"train_loss": -6.074949264526367, "global_step": 65274, "epoch": 1554} {"train_loss": -6.035884380340576, "global_step": 65275, "epoch": 1554} {"train_loss": -5.990082740783691, "global_step": 65276, "epoch": 1554} {"train_loss": -5.982079029083252, "global_step": 65277, "epoch": 1554} {"train_loss": -5.909296035766602, "global_step": 65278, "epoch": 1554} {"train_loss": -5.995677947998047, "global_step": 65279, "epoch": 1554} {"train_loss": -6.011614799499512, "global_step": 65280, "epoch": 1554} {"train_loss": -6.063708305358887, "global_step": 65281, "epoch": 1554} {"train_loss": -5.922146797180176, "global_step": 65282, "epoch": 1554} {"train_loss": -6.001677989959717, "global_step": 65283, "epoch": 1554} {"train_loss": -5.913740634918213, "global_step": 65284, "epoch": 1554} {"train_loss": -5.8522186279296875, "global_step": 65285, "epoch": 1554} {"train_loss": -5.931170463562012, "global_step": 65286, "epoch": 1554} {"train_loss": -5.929744720458984, "global_step": 65287, "epoch": 1554} {"train_loss": -5.919097423553467, "global_step": 65288, "epoch": 1554} {"train_loss": -5.917675971984863, "global_step": 65289, "epoch": 1554} {"train_loss": -5.92661190032959, "global_step": 65290, "epoch": 1554} {"train_loss": -5.967437744140625, "global_step": 65291, "epoch": 1554} {"train_loss": -5.880061626434326, "global_step": 65292, "epoch": 1554} {"train_loss": -5.8590989112854, "global_step": 65293, "epoch": 1554} {"train_loss": -5.904552459716797, "global_step": 65294, "epoch": 1554} {"train_loss": -5.877825736999512, "global_step": 65295, "epoch": 1554} {"train_loss": -5.992319107055664, "global_step": 65296, "epoch": 1554} {"train_loss": -5.824026584625244, "global_step": 65297, "epoch": 1554} {"train_loss": -5.964598178863525, "global_step": 65298, "epoch": 1554} {"train_loss": -6.133654594421387, "global_step": 65299, "epoch": 1554} {"train_loss": -5.9082841873168945, "global_step": 65300, "epoch": 1554} {"train_loss": -5.999420166015625, "global_step": 65301, "epoch": 1554} {"train_loss": -5.952646732330322, "global_step": 65302, "epoch": 1554} {"train_loss": -5.927857875823975, "global_step": 65303, "epoch": 1554} {"train_loss": -5.932111740112305, "global_step": 65304, "epoch": 1554} {"train_loss": -5.7646708488464355, "global_step": 65305, "epoch": 1554} {"train_loss": -5.995044231414795, "global_step": 65306, "epoch": 1554} {"train_loss": -5.963689804077148, "global_step": 65307, "epoch": 1554} {"train_loss": -5.931927680969238, "global_step": 65308, "epoch": 1554} {"train_loss": -5.95473431405567, "global_step": 65309, "epoch": 1554, "val_loss": 61679.10546875} {"train_loss": -5.884992599487305, "global_step": 65310, "epoch": 1555} {"train_loss": -6.0720977783203125, "global_step": 65311, "epoch": 1555} {"train_loss": -5.8298516273498535, "global_step": 65312, "epoch": 1555} {"train_loss": -6.022545337677002, "global_step": 65313, "epoch": 1555} {"train_loss": -5.877776145935059, "global_step": 65314, "epoch": 1555} {"train_loss": -5.972245216369629, "global_step": 65315, "epoch": 1555} {"train_loss": -5.853360176086426, "global_step": 65316, "epoch": 1555} {"train_loss": -5.954870700836182, "global_step": 65317, "epoch": 1555} {"train_loss": -6.031213283538818, "global_step": 65318, "epoch": 1555} {"train_loss": -5.936933994293213, "global_step": 65319, "epoch": 1555} {"train_loss": -5.969449043273926, "global_step": 65320, "epoch": 1555} {"train_loss": -6.0263776779174805, "global_step": 65321, "epoch": 1555} {"train_loss": -5.994009971618652, "global_step": 65322, "epoch": 1555} {"train_loss": -5.889180660247803, "global_step": 65323, "epoch": 1555} {"train_loss": -6.039003372192383, "global_step": 65324, "epoch": 1555} {"train_loss": -5.976651191711426, "global_step": 65325, "epoch": 1555} {"train_loss": -6.035170555114746, "global_step": 65326, "epoch": 1555} {"train_loss": -5.9424943923950195, "global_step": 65327, "epoch": 1555} {"train_loss": -5.960458755493164, "global_step": 65328, "epoch": 1555} {"train_loss": -5.97844123840332, "global_step": 65329, "epoch": 1555} {"train_loss": -5.970726013183594, "global_step": 65330, "epoch": 1555} {"train_loss": -5.970917224884033, "global_step": 65331, "epoch": 1555} {"train_loss": -5.977312088012695, "global_step": 65332, "epoch": 1555} {"train_loss": -6.024407386779785, "global_step": 65333, "epoch": 1555} {"train_loss": -6.018024921417236, "global_step": 65334, "epoch": 1555} {"train_loss": -6.005133628845215, "global_step": 65335, "epoch": 1555} {"train_loss": -6.072938919067383, "global_step": 65336, "epoch": 1555} {"train_loss": -5.965312957763672, "global_step": 65337, "epoch": 1555} {"train_loss": -5.958159923553467, "global_step": 65338, "epoch": 1555} {"train_loss": -5.978323459625244, "global_step": 65339, "epoch": 1555} {"train_loss": -6.041274070739746, "global_step": 65340, "epoch": 1555} {"train_loss": -5.923084735870361, "global_step": 65341, "epoch": 1555} {"train_loss": -5.858482837677002, "global_step": 65342, "epoch": 1555} {"train_loss": -6.0509185791015625, "global_step": 65343, "epoch": 1555} {"train_loss": -5.944216728210449, "global_step": 65344, "epoch": 1555} {"train_loss": -5.999520301818848, "global_step": 65345, "epoch": 1555} {"train_loss": -5.946603298187256, "global_step": 65346, "epoch": 1555} {"train_loss": -6.051266670227051, "global_step": 65347, "epoch": 1555} {"train_loss": -5.910357475280762, "global_step": 65348, "epoch": 1555} {"train_loss": -5.975939750671387, "global_step": 65349, "epoch": 1555} {"train_loss": -5.979405403137207, "global_step": 65350, "epoch": 1555} {"train_loss": -5.970369168690273, "global_step": 65351, "epoch": 1555, "val_loss": 61317.23046875} {"train_loss": -5.963869094848633, "global_step": 65352, "epoch": 1556} {"train_loss": -5.80620002746582, "global_step": 65353, "epoch": 1556} {"train_loss": -6.053818225860596, "global_step": 65354, "epoch": 1556} {"train_loss": -5.8883819580078125, "global_step": 65355, "epoch": 1556} {"train_loss": -5.987712383270264, "global_step": 65356, "epoch": 1556} {"train_loss": -5.983235836029053, "global_step": 65357, "epoch": 1556} {"train_loss": -5.943593978881836, "global_step": 65358, "epoch": 1556} {"train_loss": -6.006617546081543, "global_step": 65359, "epoch": 1556} {"train_loss": -6.022819519042969, "global_step": 65360, "epoch": 1556} {"train_loss": -5.993803977966309, "global_step": 65361, "epoch": 1556} {"train_loss": -5.9542236328125, "global_step": 65362, "epoch": 1556} {"train_loss": -6.001278877258301, "global_step": 65363, "epoch": 1556} {"train_loss": -5.914270877838135, "global_step": 65364, "epoch": 1556} {"train_loss": -6.0430755615234375, "global_step": 65365, "epoch": 1556} {"train_loss": -5.995917320251465, "global_step": 65366, "epoch": 1556} {"train_loss": -6.00185489654541, "global_step": 65367, "epoch": 1556} {"train_loss": -5.95875358581543, "global_step": 65368, "epoch": 1556} {"train_loss": -5.93609619140625, "global_step": 65369, "epoch": 1556} {"train_loss": -5.978628158569336, "global_step": 65370, "epoch": 1556} {"train_loss": -5.935850620269775, "global_step": 65371, "epoch": 1556} {"train_loss": -5.983224868774414, "global_step": 65372, "epoch": 1556} {"train_loss": -5.870961666107178, "global_step": 65373, "epoch": 1556} {"train_loss": -5.9895172119140625, "global_step": 65374, "epoch": 1556} {"train_loss": -6.060236930847168, "global_step": 65375, "epoch": 1556} {"train_loss": -5.932058811187744, "global_step": 65376, "epoch": 1556} {"train_loss": -5.959657669067383, "global_step": 65377, "epoch": 1556} {"train_loss": -5.962488174438477, "global_step": 65378, "epoch": 1556} {"train_loss": -5.91836404800415, "global_step": 65379, "epoch": 1556} {"train_loss": -5.982958793640137, "global_step": 65380, "epoch": 1556} {"train_loss": -5.910407543182373, "global_step": 65381, "epoch": 1556} {"train_loss": -6.041421890258789, "global_step": 65382, "epoch": 1556} {"train_loss": -5.980615615844727, "global_step": 65383, "epoch": 1556} {"train_loss": -5.916525363922119, "global_step": 65384, "epoch": 1556} {"train_loss": -6.0880632400512695, "global_step": 65385, "epoch": 1556} {"train_loss": -5.859220504760742, "global_step": 65386, "epoch": 1556} {"train_loss": -6.002253532409668, "global_step": 65387, "epoch": 1556} {"train_loss": -6.048447132110596, "global_step": 65388, "epoch": 1556} {"train_loss": -5.833544731140137, "global_step": 65389, "epoch": 1556} {"train_loss": -5.954390525817871, "global_step": 65390, "epoch": 1556} {"train_loss": -6.044158458709717, "global_step": 65391, "epoch": 1556} {"train_loss": -6.0106282234191895, "global_step": 65392, "epoch": 1556} {"train_loss": -5.969966650009155, "global_step": 65393, "epoch": 1556, "val_loss": 61718.80078125} {"train_loss": -6.026158809661865, "global_step": 65394, "epoch": 1557} {"train_loss": -6.064495086669922, "global_step": 65395, "epoch": 1557} {"train_loss": -5.977278709411621, "global_step": 65396, "epoch": 1557} {"train_loss": -5.895468711853027, "global_step": 65397, "epoch": 1557} {"train_loss": -6.038034439086914, "global_step": 65398, "epoch": 1557} {"train_loss": -5.836306571960449, "global_step": 65399, "epoch": 1557} {"train_loss": -5.956371307373047, "global_step": 65400, "epoch": 1557} {"train_loss": -6.010024070739746, "global_step": 65401, "epoch": 1557} {"train_loss": -6.0275397300720215, "global_step": 65402, "epoch": 1557} {"train_loss": -5.9920148849487305, "global_step": 65403, "epoch": 1557} {"train_loss": -5.974421501159668, "global_step": 65404, "epoch": 1557} {"train_loss": -6.008573055267334, "global_step": 65405, "epoch": 1557} {"train_loss": -5.979820251464844, "global_step": 65406, "epoch": 1557} {"train_loss": -6.006405830383301, "global_step": 65407, "epoch": 1557} {"train_loss": -5.905943870544434, "global_step": 65408, "epoch": 1557} {"train_loss": -6.165637016296387, "global_step": 65409, "epoch": 1557} {"train_loss": -6.002249717712402, "global_step": 65410, "epoch": 1557} {"train_loss": -5.895287036895752, "global_step": 65411, "epoch": 1557} {"train_loss": -5.973549842834473, "global_step": 65412, "epoch": 1557} {"train_loss": -5.963177680969238, "global_step": 65413, "epoch": 1557} {"train_loss": -5.83860969543457, "global_step": 65414, "epoch": 1557} {"train_loss": -5.984316825866699, "global_step": 65415, "epoch": 1557} {"train_loss": -5.9889020919799805, "global_step": 65416, "epoch": 1557} {"train_loss": -6.038380146026611, "global_step": 65417, "epoch": 1557} {"train_loss": -5.9402642250061035, "global_step": 65418, "epoch": 1557} {"train_loss": -5.942487716674805, "global_step": 65419, "epoch": 1557} {"train_loss": -6.009561538696289, "global_step": 65420, "epoch": 1557} {"train_loss": -5.954572677612305, "global_step": 65421, "epoch": 1557} {"train_loss": -6.061886787414551, "global_step": 65422, "epoch": 1557} {"train_loss": -6.053255558013916, "global_step": 65423, "epoch": 1557} {"train_loss": -5.987397193908691, "global_step": 65424, "epoch": 1557} {"train_loss": -5.992623805999756, "global_step": 65425, "epoch": 1557} {"train_loss": -6.007857322692871, "global_step": 65426, "epoch": 1557} {"train_loss": -6.0889692306518555, "global_step": 65427, "epoch": 1557} {"train_loss": -5.986918926239014, "global_step": 65428, "epoch": 1557} {"train_loss": -5.991992473602295, "global_step": 65429, "epoch": 1557} {"train_loss": -5.9816131591796875, "global_step": 65430, "epoch": 1557} {"train_loss": -6.0116496086120605, "global_step": 65431, "epoch": 1557} {"train_loss": -6.031164169311523, "global_step": 65432, "epoch": 1557} {"train_loss": -5.976612567901611, "global_step": 65433, "epoch": 1557} {"train_loss": -5.958140850067139, "global_step": 65434, "epoch": 1557} {"train_loss": -5.988871971766154, "global_step": 65435, "epoch": 1557, "val_loss": 61357.4375} {"train_loss": -5.9705047607421875, "global_step": 65436, "epoch": 1558} {"train_loss": -5.936432838439941, "global_step": 65437, "epoch": 1558} {"train_loss": -6.008636474609375, "global_step": 65438, "epoch": 1558} {"train_loss": -5.952610492706299, "global_step": 65439, "epoch": 1558} {"train_loss": -5.885641098022461, "global_step": 65440, "epoch": 1558} {"train_loss": -6.085880279541016, "global_step": 65441, "epoch": 1558} {"train_loss": -5.946714401245117, "global_step": 65442, "epoch": 1558} {"train_loss": -6.035641670227051, "global_step": 65443, "epoch": 1558} {"train_loss": -5.9061689376831055, "global_step": 65444, "epoch": 1558} {"train_loss": -6.007192611694336, "global_step": 65445, "epoch": 1558} {"train_loss": -5.986027717590332, "global_step": 65446, "epoch": 1558} {"train_loss": -5.928235054016113, "global_step": 65447, "epoch": 1558} {"train_loss": -5.986527442932129, "global_step": 65448, "epoch": 1558} {"train_loss": -5.896078109741211, "global_step": 65449, "epoch": 1558} {"train_loss": -5.961776256561279, "global_step": 65450, "epoch": 1558} {"train_loss": -5.905587196350098, "global_step": 65451, "epoch": 1558} {"train_loss": -5.86943244934082, "global_step": 65452, "epoch": 1558} {"train_loss": -5.698309421539307, "global_step": 65453, "epoch": 1558} {"train_loss": -6.109245300292969, "global_step": 65454, "epoch": 1558} {"train_loss": -5.983828067779541, "global_step": 65455, "epoch": 1558} {"train_loss": -5.817144393920898, "global_step": 65456, "epoch": 1558} {"train_loss": -5.744958400726318, "global_step": 65457, "epoch": 1558} {"train_loss": -5.938928604125977, "global_step": 65458, "epoch": 1558} {"train_loss": -5.733127593994141, "global_step": 65459, "epoch": 1558} {"train_loss": -5.935627460479736, "global_step": 65460, "epoch": 1558} {"train_loss": -5.9450273513793945, "global_step": 65461, "epoch": 1558} {"train_loss": -5.983428001403809, "global_step": 65462, "epoch": 1558} {"train_loss": -5.856974124908447, "global_step": 65463, "epoch": 1558} {"train_loss": -6.019397735595703, "global_step": 65464, "epoch": 1558} {"train_loss": -5.915092945098877, "global_step": 65465, "epoch": 1558} {"train_loss": -5.968438148498535, "global_step": 65466, "epoch": 1558} {"train_loss": -5.972031593322754, "global_step": 65467, "epoch": 1558} {"train_loss": -5.928304672241211, "global_step": 65468, "epoch": 1558} {"train_loss": -5.972756385803223, "global_step": 65469, "epoch": 1558} {"train_loss": -6.036806106567383, "global_step": 65470, "epoch": 1558} {"train_loss": -5.799757957458496, "global_step": 65471, "epoch": 1558} {"train_loss": -6.047916412353516, "global_step": 65472, "epoch": 1558} {"train_loss": -5.833853721618652, "global_step": 65473, "epoch": 1558} {"train_loss": -5.8333940505981445, "global_step": 65474, "epoch": 1558} {"train_loss": -5.797306060791016, "global_step": 65475, "epoch": 1558} {"train_loss": -6.006796836853027, "global_step": 65476, "epoch": 1558} {"train_loss": -5.931780383700416, "global_step": 65477, "epoch": 1558, "val_loss": 61544.31640625} {"train_loss": -5.898869514465332, "global_step": 65478, "epoch": 1559} {"train_loss": -5.982937812805176, "global_step": 65479, "epoch": 1559} {"train_loss": -5.928597927093506, "global_step": 65480, "epoch": 1559} {"train_loss": -5.929370403289795, "global_step": 65481, "epoch": 1559} {"train_loss": -5.878767967224121, "global_step": 65482, "epoch": 1559} {"train_loss": -5.887763977050781, "global_step": 65483, "epoch": 1559} {"train_loss": -6.010014533996582, "global_step": 65484, "epoch": 1559} {"train_loss": -5.8230133056640625, "global_step": 65485, "epoch": 1559} {"train_loss": -5.787558078765869, "global_step": 65486, "epoch": 1559} {"train_loss": -5.944674968719482, "global_step": 65487, "epoch": 1559} {"train_loss": -5.9952874183654785, "global_step": 65488, "epoch": 1559} {"train_loss": -6.013218402862549, "global_step": 65489, "epoch": 1559} {"train_loss": -5.999347686767578, "global_step": 65490, "epoch": 1559} {"train_loss": -5.781811714172363, "global_step": 65491, "epoch": 1559} {"train_loss": -5.970254421234131, "global_step": 65492, "epoch": 1559} {"train_loss": -5.837760925292969, "global_step": 65493, "epoch": 1559} {"train_loss": -5.905163764953613, "global_step": 65494, "epoch": 1559} {"train_loss": -6.019920349121094, "global_step": 65495, "epoch": 1559} {"train_loss": -5.9839677810668945, "global_step": 65496, "epoch": 1559} {"train_loss": -5.91216516494751, "global_step": 65497, "epoch": 1559} {"train_loss": -5.95750617980957, "global_step": 65498, "epoch": 1559} {"train_loss": -6.14199161529541, "global_step": 65499, "epoch": 1559} {"train_loss": -5.97981071472168, "global_step": 65500, "epoch": 1559} {"train_loss": -5.828001976013184, "global_step": 65501, "epoch": 1559} {"train_loss": -6.1050615310668945, "global_step": 65502, "epoch": 1559} {"train_loss": -5.916903495788574, "global_step": 65503, "epoch": 1559} {"train_loss": -5.950054168701172, "global_step": 65504, "epoch": 1559} {"train_loss": -5.967677116394043, "global_step": 65505, "epoch": 1559} {"train_loss": -5.894833564758301, "global_step": 65506, "epoch": 1559} {"train_loss": -5.969918727874756, "global_step": 65507, "epoch": 1559} {"train_loss": -6.047746658325195, "global_step": 65508, "epoch": 1559} {"train_loss": -5.971460819244385, "global_step": 65509, "epoch": 1559} {"train_loss": -6.039613723754883, "global_step": 65510, "epoch": 1559} {"train_loss": -6.0486555099487305, "global_step": 65511, "epoch": 1559} {"train_loss": -6.020587921142578, "global_step": 65512, "epoch": 1559} {"train_loss": -5.897904396057129, "global_step": 65513, "epoch": 1559} {"train_loss": -6.020807266235352, "global_step": 65514, "epoch": 1559} {"train_loss": -6.002625465393066, "global_step": 65515, "epoch": 1559} {"train_loss": -5.867137908935547, "global_step": 65516, "epoch": 1559} {"train_loss": -6.0001912117004395, "global_step": 65517, "epoch": 1559} {"train_loss": -5.886600494384766, "global_step": 65518, "epoch": 1559} {"train_loss": -5.952504998161679, "global_step": 65519, "epoch": 1559, "val_loss": 61518.25390625} {"train_loss": -5.931745529174805, "global_step": 65520, "epoch": 1560} {"train_loss": -5.922495365142822, "global_step": 65521, "epoch": 1560} {"train_loss": -5.991950988769531, "global_step": 65522, "epoch": 1560} {"train_loss": -6.063338279724121, "global_step": 65523, "epoch": 1560} {"train_loss": -5.883184432983398, "global_step": 65524, "epoch": 1560} {"train_loss": -5.991810321807861, "global_step": 65525, "epoch": 1560} {"train_loss": -5.876006126403809, "global_step": 65526, "epoch": 1560} {"train_loss": -6.1444501876831055, "global_step": 65527, "epoch": 1560} {"train_loss": -6.1319169998168945, "global_step": 65528, "epoch": 1560} {"train_loss": -6.018298149108887, "global_step": 65529, "epoch": 1560} {"train_loss": -6.016674995422363, "global_step": 65530, "epoch": 1560} {"train_loss": -6.048053741455078, "global_step": 65531, "epoch": 1560} {"train_loss": -5.991144180297852, "global_step": 65532, "epoch": 1560} {"train_loss": -5.921060562133789, "global_step": 65533, "epoch": 1560} {"train_loss": -6.015631198883057, "global_step": 65534, "epoch": 1560} {"train_loss": -6.031449317932129, "global_step": 65535, "epoch": 1560} {"train_loss": -6.058244705200195, "global_step": 65536, "epoch": 1560} {"train_loss": -5.887723445892334, "global_step": 65537, "epoch": 1560} {"train_loss": -5.9570770263671875, "global_step": 65538, "epoch": 1560} {"train_loss": -5.9557952880859375, "global_step": 65539, "epoch": 1560} {"train_loss": -6.024643898010254, "global_step": 65540, "epoch": 1560} {"train_loss": -5.88442850112915, "global_step": 65541, "epoch": 1560} {"train_loss": -5.945363998413086, "global_step": 65542, "epoch": 1560} {"train_loss": -5.88175106048584, "global_step": 65543, "epoch": 1560} {"train_loss": -6.041184425354004, "global_step": 65544, "epoch": 1560} {"train_loss": -5.812129974365234, "global_step": 65545, "epoch": 1560} {"train_loss": -5.963593006134033, "global_step": 65546, "epoch": 1560} {"train_loss": -5.889082431793213, "global_step": 65547, "epoch": 1560} {"train_loss": -5.824994087219238, "global_step": 65548, "epoch": 1560} {"train_loss": -5.912671089172363, "global_step": 65549, "epoch": 1560} {"train_loss": -5.942201614379883, "global_step": 65550, "epoch": 1560} {"train_loss": -5.935675621032715, "global_step": 65551, "epoch": 1560} {"train_loss": -5.970013618469238, "global_step": 65552, "epoch": 1560} {"train_loss": -6.027279853820801, "global_step": 65553, "epoch": 1560} {"train_loss": -5.987369537353516, "global_step": 65554, "epoch": 1560} {"train_loss": -5.932381629943848, "global_step": 65555, "epoch": 1560} {"train_loss": -6.031717300415039, "global_step": 65556, "epoch": 1560} {"train_loss": -5.963441848754883, "global_step": 65557, "epoch": 1560} {"train_loss": -5.991323947906494, "global_step": 65558, "epoch": 1560} {"train_loss": -5.946056365966797, "global_step": 65559, "epoch": 1560} {"train_loss": -5.89764404296875, "global_step": 65560, "epoch": 1560} {"train_loss": -5.967494340169997, "global_step": 65561, "epoch": 1560, "val_loss": 61319.4609375} {"train_loss": -6.099864959716797, "global_step": 65562, "epoch": 1561} {"train_loss": -5.999630451202393, "global_step": 65563, "epoch": 1561} {"train_loss": -5.904275894165039, "global_step": 65564, "epoch": 1561} {"train_loss": -5.961315155029297, "global_step": 65565, "epoch": 1561} {"train_loss": -6.072169303894043, "global_step": 65566, "epoch": 1561} {"train_loss": -5.946022033691406, "global_step": 65567, "epoch": 1561} {"train_loss": -5.861776351928711, "global_step": 65568, "epoch": 1561} {"train_loss": -6.007454872131348, "global_step": 65569, "epoch": 1561} {"train_loss": -6.026251316070557, "global_step": 65570, "epoch": 1561} {"train_loss": -5.973640441894531, "global_step": 65571, "epoch": 1561} {"train_loss": -5.8575568199157715, "global_step": 65572, "epoch": 1561} {"train_loss": -5.958237648010254, "global_step": 65573, "epoch": 1561} {"train_loss": -6.050551891326904, "global_step": 65574, "epoch": 1561} {"train_loss": -5.840721130371094, "global_step": 65575, "epoch": 1561} {"train_loss": -6.035750389099121, "global_step": 65576, "epoch": 1561} {"train_loss": -6.131314277648926, "global_step": 65577, "epoch": 1561} {"train_loss": -6.003946304321289, "global_step": 65578, "epoch": 1561} {"train_loss": -5.976596832275391, "global_step": 65579, "epoch": 1561} {"train_loss": -5.9714579582214355, "global_step": 65580, "epoch": 1561} {"train_loss": -6.034924507141113, "global_step": 65581, "epoch": 1561} {"train_loss": -5.997200012207031, "global_step": 65582, "epoch": 1561} {"train_loss": -5.952449798583984, "global_step": 65583, "epoch": 1561} {"train_loss": -5.953010082244873, "global_step": 65584, "epoch": 1561} {"train_loss": -5.959439277648926, "global_step": 65585, "epoch": 1561} {"train_loss": -5.928492546081543, "global_step": 65586, "epoch": 1561} {"train_loss": -6.119812965393066, "global_step": 65587, "epoch": 1561} {"train_loss": -5.993462085723877, "global_step": 65588, "epoch": 1561} {"train_loss": -6.024749755859375, "global_step": 65589, "epoch": 1561} {"train_loss": -5.997336387634277, "global_step": 65590, "epoch": 1561} {"train_loss": -5.969514846801758, "global_step": 65591, "epoch": 1561} {"train_loss": -6.023413181304932, "global_step": 65592, "epoch": 1561} {"train_loss": -5.895313262939453, "global_step": 65593, "epoch": 1561} {"train_loss": -5.917112350463867, "global_step": 65594, "epoch": 1561} {"train_loss": -6.038088321685791, "global_step": 65595, "epoch": 1561} {"train_loss": -5.926440238952637, "global_step": 65596, "epoch": 1561} {"train_loss": -5.909930229187012, "global_step": 65597, "epoch": 1561} {"train_loss": -5.956652641296387, "global_step": 65598, "epoch": 1561} {"train_loss": -5.87026834487915, "global_step": 65599, "epoch": 1561} {"train_loss": -5.98194694519043, "global_step": 65600, "epoch": 1561} {"train_loss": -5.794491767883301, "global_step": 65601, "epoch": 1561} {"train_loss": -5.839970588684082, "global_step": 65602, "epoch": 1561} {"train_loss": -5.968470335006714, "global_step": 65603, "epoch": 1561, "val_loss": 61447.26953125} {"train_loss": -5.93939208984375, "global_step": 65604, "epoch": 1562} {"train_loss": -5.920660018920898, "global_step": 65605, "epoch": 1562} {"train_loss": -5.9275970458984375, "global_step": 65606, "epoch": 1562} {"train_loss": -6.00573205947876, "global_step": 65607, "epoch": 1562} {"train_loss": -5.921751976013184, "global_step": 65608, "epoch": 1562} {"train_loss": -5.954302787780762, "global_step": 65609, "epoch": 1562} {"train_loss": -5.999786853790283, "global_step": 65610, "epoch": 1562} {"train_loss": -5.964408874511719, "global_step": 65611, "epoch": 1562} {"train_loss": -5.925693511962891, "global_step": 65612, "epoch": 1562} {"train_loss": -6.0454559326171875, "global_step": 65613, "epoch": 1562} {"train_loss": -5.882444381713867, "global_step": 65614, "epoch": 1562} {"train_loss": -6.053959369659424, "global_step": 65615, "epoch": 1562} {"train_loss": -6.026350975036621, "global_step": 65616, "epoch": 1562} {"train_loss": -6.00050163269043, "global_step": 65617, "epoch": 1562} {"train_loss": -6.054807662963867, "global_step": 65618, "epoch": 1562} {"train_loss": -6.1102294921875, "global_step": 65619, "epoch": 1562} {"train_loss": -5.958260536193848, "global_step": 65620, "epoch": 1562} {"train_loss": -6.0071916580200195, "global_step": 65621, "epoch": 1562} {"train_loss": -6.005003929138184, "global_step": 65622, "epoch": 1562} {"train_loss": -6.107563495635986, "global_step": 65623, "epoch": 1562} {"train_loss": -6.1157073974609375, "global_step": 65624, "epoch": 1562} {"train_loss": -6.005507469177246, "global_step": 65625, "epoch": 1562} {"train_loss": -6.034935474395752, "global_step": 65626, "epoch": 1562} {"train_loss": -6.064044952392578, "global_step": 65627, "epoch": 1562} {"train_loss": -5.995080947875977, "global_step": 65628, "epoch": 1562} {"train_loss": -6.00883674621582, "global_step": 65629, "epoch": 1562} {"train_loss": -5.9350738525390625, "global_step": 65630, "epoch": 1562} {"train_loss": -6.052145004272461, "global_step": 65631, "epoch": 1562} {"train_loss": -5.990344524383545, "global_step": 65632, "epoch": 1562} {"train_loss": -5.908071994781494, "global_step": 65633, "epoch": 1562} {"train_loss": -5.999974250793457, "global_step": 65634, "epoch": 1562} {"train_loss": -6.07373046875, "global_step": 65635, "epoch": 1562} {"train_loss": -5.930901527404785, "global_step": 65636, "epoch": 1562} {"train_loss": -5.98213529586792, "global_step": 65637, "epoch": 1562} {"train_loss": -5.921795845031738, "global_step": 65638, "epoch": 1562} {"train_loss": -5.914881706237793, "global_step": 65639, "epoch": 1562} {"train_loss": -5.937511444091797, "global_step": 65640, "epoch": 1562} {"train_loss": -5.94488000869751, "global_step": 65641, "epoch": 1562} {"train_loss": -5.924932956695557, "global_step": 65642, "epoch": 1562} {"train_loss": -5.954981803894043, "global_step": 65643, "epoch": 1562} {"train_loss": -6.007388114929199, "global_step": 65644, "epoch": 1562} {"train_loss": -5.987514473143078, "global_step": 65645, "epoch": 1562, "val_loss": 61524.4921875} {"train_loss": -5.98125696182251, "global_step": 65646, "epoch": 1563} {"train_loss": -5.958532810211182, "global_step": 65647, "epoch": 1563} {"train_loss": -6.097768306732178, "global_step": 65648, "epoch": 1563} {"train_loss": -5.926896095275879, "global_step": 65649, "epoch": 1563} {"train_loss": -5.888283729553223, "global_step": 65650, "epoch": 1563} {"train_loss": -6.102418899536133, "global_step": 65651, "epoch": 1563} {"train_loss": -5.94300651550293, "global_step": 65652, "epoch": 1563} {"train_loss": -6.06138277053833, "global_step": 65653, "epoch": 1563} {"train_loss": -5.951871871948242, "global_step": 65654, "epoch": 1563} {"train_loss": -5.832554340362549, "global_step": 65655, "epoch": 1563} {"train_loss": -5.917044162750244, "global_step": 65656, "epoch": 1563} {"train_loss": -5.931922912597656, "global_step": 65657, "epoch": 1563} {"train_loss": -5.758868217468262, "global_step": 65658, "epoch": 1563} {"train_loss": -5.909786701202393, "global_step": 65659, "epoch": 1563} {"train_loss": -5.8430280685424805, "global_step": 65660, "epoch": 1563} {"train_loss": -5.8374152183532715, "global_step": 65661, "epoch": 1563} {"train_loss": -5.872621536254883, "global_step": 65662, "epoch": 1563} {"train_loss": -5.879389762878418, "global_step": 65663, "epoch": 1563} {"train_loss": -5.977527141571045, "global_step": 65664, "epoch": 1563} {"train_loss": -6.001678466796875, "global_step": 65665, "epoch": 1563} {"train_loss": -5.876132011413574, "global_step": 65666, "epoch": 1563} {"train_loss": -5.91784143447876, "global_step": 65667, "epoch": 1563} {"train_loss": -5.937593460083008, "global_step": 65668, "epoch": 1563} {"train_loss": -5.912915229797363, "global_step": 65669, "epoch": 1563} {"train_loss": -5.910512924194336, "global_step": 65670, "epoch": 1563} {"train_loss": -5.943553924560547, "global_step": 65671, "epoch": 1563} {"train_loss": -6.004578590393066, "global_step": 65672, "epoch": 1563} {"train_loss": -5.9602532386779785, "global_step": 65673, "epoch": 1563} {"train_loss": -5.932537078857422, "global_step": 65674, "epoch": 1563} {"train_loss": -6.0961127281188965, "global_step": 65675, "epoch": 1563} {"train_loss": -5.977404594421387, "global_step": 65676, "epoch": 1563} {"train_loss": -5.87723445892334, "global_step": 65677, "epoch": 1563} {"train_loss": -5.971569538116455, "global_step": 65678, "epoch": 1563} {"train_loss": -5.889092445373535, "global_step": 65679, "epoch": 1563} {"train_loss": -6.008490562438965, "global_step": 65680, "epoch": 1563} {"train_loss": -5.968483924865723, "global_step": 65681, "epoch": 1563} {"train_loss": -5.878689765930176, "global_step": 65682, "epoch": 1563} {"train_loss": -5.973971843719482, "global_step": 65683, "epoch": 1563} {"train_loss": -5.959734916687012, "global_step": 65684, "epoch": 1563} {"train_loss": -5.892356872558594, "global_step": 65685, "epoch": 1563} {"train_loss": -5.901145935058594, "global_step": 65686, "epoch": 1563} {"train_loss": -5.941610540662493, "global_step": 65687, "epoch": 1563, "val_loss": 61486.90625} {"train_loss": -5.9797563552856445, "global_step": 65688, "epoch": 1564} {"train_loss": -5.9118571281433105, "global_step": 65689, "epoch": 1564} {"train_loss": -6.019596099853516, "global_step": 65690, "epoch": 1564} {"train_loss": -6.0387797355651855, "global_step": 65691, "epoch": 1564} {"train_loss": -5.870289325714111, "global_step": 65692, "epoch": 1564} {"train_loss": -6.0409698486328125, "global_step": 65693, "epoch": 1564} {"train_loss": -5.923349380493164, "global_step": 65694, "epoch": 1564} {"train_loss": -5.90771484375, "global_step": 65695, "epoch": 1564} {"train_loss": -5.983246803283691, "global_step": 65696, "epoch": 1564} {"train_loss": -6.0258331298828125, "global_step": 65697, "epoch": 1564} {"train_loss": -6.05819034576416, "global_step": 65698, "epoch": 1564} {"train_loss": -6.085757255554199, "global_step": 65699, "epoch": 1564} {"train_loss": -5.930646896362305, "global_step": 65700, "epoch": 1564} {"train_loss": -6.030479431152344, "global_step": 65701, "epoch": 1564} {"train_loss": -5.92597770690918, "global_step": 65702, "epoch": 1564} {"train_loss": -5.998345851898193, "global_step": 65703, "epoch": 1564} {"train_loss": -5.911973476409912, "global_step": 65704, "epoch": 1564} {"train_loss": -5.998048305511475, "global_step": 65705, "epoch": 1564} {"train_loss": -5.998136520385742, "global_step": 65706, "epoch": 1564} {"train_loss": -5.9797234535217285, "global_step": 65707, "epoch": 1564} {"train_loss": -5.885920524597168, "global_step": 65708, "epoch": 1564} {"train_loss": -5.886069297790527, "global_step": 65709, "epoch": 1564} {"train_loss": -5.897234916687012, "global_step": 65710, "epoch": 1564} {"train_loss": -6.1110639572143555, "global_step": 65711, "epoch": 1564} {"train_loss": -6.033813953399658, "global_step": 65712, "epoch": 1564} {"train_loss": -5.914268970489502, "global_step": 65713, "epoch": 1564} {"train_loss": -6.059404373168945, "global_step": 65714, "epoch": 1564} {"train_loss": -5.946600914001465, "global_step": 65715, "epoch": 1564} {"train_loss": -5.888016223907471, "global_step": 65716, "epoch": 1564} {"train_loss": -5.855564117431641, "global_step": 65717, "epoch": 1564} {"train_loss": -5.97406530380249, "global_step": 65718, "epoch": 1564} {"train_loss": -5.914685249328613, "global_step": 65719, "epoch": 1564} {"train_loss": -5.981223106384277, "global_step": 65720, "epoch": 1564} {"train_loss": -5.976423263549805, "global_step": 65721, "epoch": 1564} {"train_loss": -5.887389183044434, "global_step": 65722, "epoch": 1564} {"train_loss": -6.043307304382324, "global_step": 65723, "epoch": 1564} {"train_loss": -5.939264297485352, "global_step": 65724, "epoch": 1564} {"train_loss": -6.036363124847412, "global_step": 65725, "epoch": 1564} {"train_loss": -5.912878036499023, "global_step": 65726, "epoch": 1564} {"train_loss": -5.914211273193359, "global_step": 65727, "epoch": 1564} {"train_loss": -6.025835037231445, "global_step": 65728, "epoch": 1564} {"train_loss": -5.971542437871297, "global_step": 65729, "epoch": 1564, "val_loss": 61484.6640625} {"train_loss": -5.932499408721924, "global_step": 65730, "epoch": 1565} {"train_loss": -6.047395706176758, "global_step": 65731, "epoch": 1565} {"train_loss": -5.873921871185303, "global_step": 65732, "epoch": 1565} {"train_loss": -5.936182498931885, "global_step": 65733, "epoch": 1565} {"train_loss": -5.988807678222656, "global_step": 65734, "epoch": 1565} {"train_loss": -6.0195817947387695, "global_step": 65735, "epoch": 1565} {"train_loss": -6.070159912109375, "global_step": 65736, "epoch": 1565} {"train_loss": -5.9547119140625, "global_step": 65737, "epoch": 1565} {"train_loss": -5.9096221923828125, "global_step": 65738, "epoch": 1565} {"train_loss": -5.9458160400390625, "global_step": 65739, "epoch": 1565} {"train_loss": -5.903080463409424, "global_step": 65740, "epoch": 1565} {"train_loss": -5.823596954345703, "global_step": 65741, "epoch": 1565} {"train_loss": -6.003802299499512, "global_step": 65742, "epoch": 1565} {"train_loss": -6.081300735473633, "global_step": 65743, "epoch": 1565} {"train_loss": -5.921845436096191, "global_step": 65744, "epoch": 1565} {"train_loss": -5.951615333557129, "global_step": 65745, "epoch": 1565} {"train_loss": -6.020766258239746, "global_step": 65746, "epoch": 1565} {"train_loss": -5.9666242599487305, "global_step": 65747, "epoch": 1565} {"train_loss": -5.9178571701049805, "global_step": 65748, "epoch": 1565} {"train_loss": -5.991919994354248, "global_step": 65749, "epoch": 1565} {"train_loss": -5.942798614501953, "global_step": 65750, "epoch": 1565} {"train_loss": -5.867717742919922, "global_step": 65751, "epoch": 1565} {"train_loss": -6.0160932540893555, "global_step": 65752, "epoch": 1565} {"train_loss": -6.088377475738525, "global_step": 65753, "epoch": 1565} {"train_loss": -6.037115097045898, "global_step": 65754, "epoch": 1565} {"train_loss": -5.974620342254639, "global_step": 65755, "epoch": 1565} {"train_loss": -5.8696465492248535, "global_step": 65756, "epoch": 1565} {"train_loss": -6.067933082580566, "global_step": 65757, "epoch": 1565} {"train_loss": -6.01885986328125, "global_step": 65758, "epoch": 1565} {"train_loss": -6.094973087310791, "global_step": 65759, "epoch": 1565} {"train_loss": -6.029386043548584, "global_step": 65760, "epoch": 1565} {"train_loss": -6.087847709655762, "global_step": 65761, "epoch": 1565} {"train_loss": -5.876020431518555, "global_step": 65762, "epoch": 1565} {"train_loss": -6.102835655212402, "global_step": 65763, "epoch": 1565} {"train_loss": -5.930583477020264, "global_step": 65764, "epoch": 1565} {"train_loss": -6.052095413208008, "global_step": 65765, "epoch": 1565} {"train_loss": -5.850894927978516, "global_step": 65766, "epoch": 1565} {"train_loss": -6.008037567138672, "global_step": 65767, "epoch": 1565} {"train_loss": -6.046933650970459, "global_step": 65768, "epoch": 1565} {"train_loss": -5.833266735076904, "global_step": 65769, "epoch": 1565} {"train_loss": -5.993806838989258, "global_step": 65770, "epoch": 1565} {"train_loss": -5.97510560353597, "global_step": 65771, "epoch": 1565, "val_loss": 61576.2890625} {"train_loss": -5.993621349334717, "global_step": 65772, "epoch": 1566} {"train_loss": -5.959959030151367, "global_step": 65773, "epoch": 1566} {"train_loss": -6.008096694946289, "global_step": 65774, "epoch": 1566} {"train_loss": -6.007935523986816, "global_step": 65775, "epoch": 1566} {"train_loss": -5.975014686584473, "global_step": 65776, "epoch": 1566} {"train_loss": -6.021421909332275, "global_step": 65777, "epoch": 1566} {"train_loss": -6.024977684020996, "global_step": 65778, "epoch": 1566} {"train_loss": -5.931907653808594, "global_step": 65779, "epoch": 1566} {"train_loss": -5.9544758796691895, "global_step": 65780, "epoch": 1566} {"train_loss": -5.902834415435791, "global_step": 65781, "epoch": 1566} {"train_loss": -6.0431060791015625, "global_step": 65782, "epoch": 1566} {"train_loss": -5.918457984924316, "global_step": 65783, "epoch": 1566} {"train_loss": -5.930384635925293, "global_step": 65784, "epoch": 1566} {"train_loss": -6.025938987731934, "global_step": 65785, "epoch": 1566} {"train_loss": -5.982665061950684, "global_step": 65786, "epoch": 1566} {"train_loss": -5.936854362487793, "global_step": 65787, "epoch": 1566} {"train_loss": -6.135968208312988, "global_step": 65788, "epoch": 1566} {"train_loss": -5.87648868560791, "global_step": 65789, "epoch": 1566} {"train_loss": -5.975722312927246, "global_step": 65790, "epoch": 1566} {"train_loss": -5.966456413269043, "global_step": 65791, "epoch": 1566} {"train_loss": -5.935509204864502, "global_step": 65792, "epoch": 1566} {"train_loss": -6.0017499923706055, "global_step": 65793, "epoch": 1566} {"train_loss": -5.984410762786865, "global_step": 65794, "epoch": 1566} {"train_loss": -5.983014106750488, "global_step": 65795, "epoch": 1566} {"train_loss": -5.97727108001709, "global_step": 65796, "epoch": 1566} {"train_loss": -5.898870468139648, "global_step": 65797, "epoch": 1566} {"train_loss": -6.033642292022705, "global_step": 65798, "epoch": 1566} {"train_loss": -5.948558807373047, "global_step": 65799, "epoch": 1566} {"train_loss": -5.971138000488281, "global_step": 65800, "epoch": 1566} {"train_loss": -6.040008544921875, "global_step": 65801, "epoch": 1566} {"train_loss": -5.976546764373779, "global_step": 65802, "epoch": 1566} {"train_loss": -5.986905097961426, "global_step": 65803, "epoch": 1566} {"train_loss": -5.957993507385254, "global_step": 65804, "epoch": 1566} {"train_loss": -6.054661750793457, "global_step": 65805, "epoch": 1566} {"train_loss": -6.104616165161133, "global_step": 65806, "epoch": 1566} {"train_loss": -6.084020614624023, "global_step": 65807, "epoch": 1566} {"train_loss": -5.86917781829834, "global_step": 65808, "epoch": 1566} {"train_loss": -6.051301002502441, "global_step": 65809, "epoch": 1566} {"train_loss": -5.877382278442383, "global_step": 65810, "epoch": 1566} {"train_loss": -6.046348571777344, "global_step": 65811, "epoch": 1566} {"train_loss": -6.025556564331055, "global_step": 65812, "epoch": 1566} {"train_loss": -5.9843327431451705, "global_step": 65813, "epoch": 1566, "val_loss": 61440.07421875} {"train_loss": -6.083549499511719, "global_step": 65814, "epoch": 1567} {"train_loss": -6.010008335113525, "global_step": 65815, "epoch": 1567} {"train_loss": -5.9917449951171875, "global_step": 65816, "epoch": 1567} {"train_loss": -6.072818756103516, "global_step": 65817, "epoch": 1567} {"train_loss": -5.963856220245361, "global_step": 65818, "epoch": 1567} {"train_loss": -5.875345230102539, "global_step": 65819, "epoch": 1567} {"train_loss": -5.9633870124816895, "global_step": 65820, "epoch": 1567} {"train_loss": -5.982977867126465, "global_step": 65821, "epoch": 1567} {"train_loss": -5.903191566467285, "global_step": 65822, "epoch": 1567} {"train_loss": -5.938806056976318, "global_step": 65823, "epoch": 1567} {"train_loss": -5.9044928550720215, "global_step": 65824, "epoch": 1567} {"train_loss": -5.947946548461914, "global_step": 65825, "epoch": 1567} {"train_loss": -6.01371955871582, "global_step": 65826, "epoch": 1567} {"train_loss": -5.959594249725342, "global_step": 65827, "epoch": 1567} {"train_loss": -6.031005859375, "global_step": 65828, "epoch": 1567} {"train_loss": -5.985944747924805, "global_step": 65829, "epoch": 1567} {"train_loss": -6.001709938049316, "global_step": 65830, "epoch": 1567} {"train_loss": -6.018648147583008, "global_step": 65831, "epoch": 1567} {"train_loss": -5.970668792724609, "global_step": 65832, "epoch": 1567} {"train_loss": -6.026096820831299, "global_step": 65833, "epoch": 1567} {"train_loss": -6.070171356201172, "global_step": 65834, "epoch": 1567} {"train_loss": -6.06041145324707, "global_step": 65835, "epoch": 1567} {"train_loss": -6.0016069412231445, "global_step": 65836, "epoch": 1567} {"train_loss": -5.978521347045898, "global_step": 65837, "epoch": 1567} {"train_loss": -5.958399772644043, "global_step": 65838, "epoch": 1567} {"train_loss": -5.882406711578369, "global_step": 65839, "epoch": 1567} {"train_loss": -6.055488109588623, "global_step": 65840, "epoch": 1567} {"train_loss": -5.897579193115234, "global_step": 65841, "epoch": 1567} {"train_loss": -5.964304447174072, "global_step": 65842, "epoch": 1567} {"train_loss": -5.839791297912598, "global_step": 65843, "epoch": 1567} {"train_loss": -5.9006242752075195, "global_step": 65844, "epoch": 1567} {"train_loss": -5.993766784667969, "global_step": 65845, "epoch": 1567} {"train_loss": -5.934603214263916, "global_step": 65846, "epoch": 1567} {"train_loss": -6.0024518966674805, "global_step": 65847, "epoch": 1567} {"train_loss": -5.999736785888672, "global_step": 65848, "epoch": 1567} {"train_loss": -6.05158805847168, "global_step": 65849, "epoch": 1567} {"train_loss": -5.984954833984375, "global_step": 65850, "epoch": 1567} {"train_loss": -6.032792568206787, "global_step": 65851, "epoch": 1567} {"train_loss": -6.075531959533691, "global_step": 65852, "epoch": 1567} {"train_loss": -5.9033074378967285, "global_step": 65853, "epoch": 1567} {"train_loss": -6.01844596862793, "global_step": 65854, "epoch": 1567} {"train_loss": -5.982028030213856, "global_step": 65855, "epoch": 1567, "val_loss": 61566.08203125} {"train_loss": -5.940268039703369, "global_step": 65856, "epoch": 1568} {"train_loss": -6.089876651763916, "global_step": 65857, "epoch": 1568} {"train_loss": -6.010186195373535, "global_step": 65858, "epoch": 1568} {"train_loss": -5.928651332855225, "global_step": 65859, "epoch": 1568} {"train_loss": -5.9637556076049805, "global_step": 65860, "epoch": 1568} {"train_loss": -6.038064479827881, "global_step": 65861, "epoch": 1568} {"train_loss": -6.025468826293945, "global_step": 65862, "epoch": 1568} {"train_loss": -5.981112480163574, "global_step": 65863, "epoch": 1568} {"train_loss": -6.009150505065918, "global_step": 65864, "epoch": 1568} {"train_loss": -6.081897258758545, "global_step": 65865, "epoch": 1568} {"train_loss": -5.83096981048584, "global_step": 65866, "epoch": 1568} {"train_loss": -5.94121789932251, "global_step": 65867, "epoch": 1568} {"train_loss": -5.997929573059082, "global_step": 65868, "epoch": 1568} {"train_loss": -6.032670974731445, "global_step": 65869, "epoch": 1568} {"train_loss": -6.036355972290039, "global_step": 65870, "epoch": 1568} {"train_loss": -5.904794692993164, "global_step": 65871, "epoch": 1568} {"train_loss": -5.9785051345825195, "global_step": 65872, "epoch": 1568} {"train_loss": -6.022902488708496, "global_step": 65873, "epoch": 1568} {"train_loss": -5.981265544891357, "global_step": 65874, "epoch": 1568} {"train_loss": -5.941764831542969, "global_step": 65875, "epoch": 1568} {"train_loss": -5.956835746765137, "global_step": 65876, "epoch": 1568} {"train_loss": -6.044949054718018, "global_step": 65877, "epoch": 1568} {"train_loss": -5.930633544921875, "global_step": 65878, "epoch": 1568} {"train_loss": -5.887653350830078, "global_step": 65879, "epoch": 1568} {"train_loss": -5.97900390625, "global_step": 65880, "epoch": 1568} {"train_loss": -5.987037181854248, "global_step": 65881, "epoch": 1568} {"train_loss": -6.073616981506348, "global_step": 65882, "epoch": 1568} {"train_loss": -6.042644500732422, "global_step": 65883, "epoch": 1568} {"train_loss": -5.941555976867676, "global_step": 65884, "epoch": 1568} {"train_loss": -6.001743316650391, "global_step": 65885, "epoch": 1568} {"train_loss": -5.975469589233398, "global_step": 65886, "epoch": 1568} {"train_loss": -5.932245254516602, "global_step": 65887, "epoch": 1568} {"train_loss": -6.051023483276367, "global_step": 65888, "epoch": 1568} {"train_loss": -5.9101786613464355, "global_step": 65889, "epoch": 1568} {"train_loss": -5.863797664642334, "global_step": 65890, "epoch": 1568} {"train_loss": -5.857636451721191, "global_step": 65891, "epoch": 1568} {"train_loss": -5.907649993896484, "global_step": 65892, "epoch": 1568} {"train_loss": -5.910667419433594, "global_step": 65893, "epoch": 1568} {"train_loss": -6.110461235046387, "global_step": 65894, "epoch": 1568} {"train_loss": -5.9001970291137695, "global_step": 65895, "epoch": 1568} {"train_loss": -5.9273247718811035, "global_step": 65896, "epoch": 1568} {"train_loss": -5.972260611397879, "global_step": 65897, "epoch": 1568, "val_loss": 61661.6328125} {"train_loss": -5.950199127197266, "global_step": 65898, "epoch": 1569} {"train_loss": -5.882036209106445, "global_step": 65899, "epoch": 1569} {"train_loss": -5.930364608764648, "global_step": 65900, "epoch": 1569} {"train_loss": -6.018656253814697, "global_step": 65901, "epoch": 1569} {"train_loss": -5.924224376678467, "global_step": 65902, "epoch": 1569} {"train_loss": -6.018388271331787, "global_step": 65903, "epoch": 1569} {"train_loss": -5.969592094421387, "global_step": 65904, "epoch": 1569} {"train_loss": -5.844974517822266, "global_step": 65905, "epoch": 1569} {"train_loss": -5.977631568908691, "global_step": 65906, "epoch": 1569} {"train_loss": -5.906914234161377, "global_step": 65907, "epoch": 1569} {"train_loss": -6.0413498878479, "global_step": 65908, "epoch": 1569} {"train_loss": -5.958470344543457, "global_step": 65909, "epoch": 1569} {"train_loss": -5.968313217163086, "global_step": 65910, "epoch": 1569} {"train_loss": -6.143246650695801, "global_step": 65911, "epoch": 1569} {"train_loss": -6.015158653259277, "global_step": 65912, "epoch": 1569} {"train_loss": -6.049498558044434, "global_step": 65913, "epoch": 1569} {"train_loss": -5.8840837478637695, "global_step": 65914, "epoch": 1569} {"train_loss": -5.960838317871094, "global_step": 65915, "epoch": 1569} {"train_loss": -5.977036476135254, "global_step": 65916, "epoch": 1569} {"train_loss": -5.9034528732299805, "global_step": 65917, "epoch": 1569} {"train_loss": -5.998838424682617, "global_step": 65918, "epoch": 1569} {"train_loss": -5.894800662994385, "global_step": 65919, "epoch": 1569} {"train_loss": -5.935333728790283, "global_step": 65920, "epoch": 1569} {"train_loss": -6.022319316864014, "global_step": 65921, "epoch": 1569} {"train_loss": -5.977721214294434, "global_step": 65922, "epoch": 1569} {"train_loss": -5.901918411254883, "global_step": 65923, "epoch": 1569} {"train_loss": -6.00541353225708, "global_step": 65924, "epoch": 1569} {"train_loss": -5.86767053604126, "global_step": 65925, "epoch": 1569} {"train_loss": -6.046369552612305, "global_step": 65926, "epoch": 1569} {"train_loss": -5.987472057342529, "global_step": 65927, "epoch": 1569} {"train_loss": -6.0749406814575195, "global_step": 65928, "epoch": 1569} {"train_loss": -5.937443256378174, "global_step": 65929, "epoch": 1569} {"train_loss": -5.961036682128906, "global_step": 65930, "epoch": 1569} {"train_loss": -5.995956897735596, "global_step": 65931, "epoch": 1569} {"train_loss": -6.016543388366699, "global_step": 65932, "epoch": 1569} {"train_loss": -6.037654399871826, "global_step": 65933, "epoch": 1569} {"train_loss": -5.877703666687012, "global_step": 65934, "epoch": 1569} {"train_loss": -5.886782646179199, "global_step": 65935, "epoch": 1569} {"train_loss": -5.990789890289307, "global_step": 65936, "epoch": 1569} {"train_loss": -5.954657554626465, "global_step": 65937, "epoch": 1569} {"train_loss": -6.022450923919678, "global_step": 65938, "epoch": 1569} {"train_loss": -5.971421446119036, "global_step": 65939, "epoch": 1569, "val_loss": 61689.45703125} {"train_loss": -5.867189884185791, "global_step": 65940, "epoch": 1570} {"train_loss": -5.863956451416016, "global_step": 65941, "epoch": 1570} {"train_loss": -5.992339134216309, "global_step": 65942, "epoch": 1570} {"train_loss": -6.064238548278809, "global_step": 65943, "epoch": 1570} {"train_loss": -5.681648254394531, "global_step": 65944, "epoch": 1570} {"train_loss": -5.8752055168151855, "global_step": 65945, "epoch": 1570} {"train_loss": -5.944249153137207, "global_step": 65946, "epoch": 1570} {"train_loss": -5.8498148918151855, "global_step": 65947, "epoch": 1570} {"train_loss": -5.914557456970215, "global_step": 65948, "epoch": 1570} {"train_loss": -5.977787971496582, "global_step": 65949, "epoch": 1570} {"train_loss": -5.843425750732422, "global_step": 65950, "epoch": 1570} {"train_loss": -5.964008331298828, "global_step": 65951, "epoch": 1570} {"train_loss": -5.9209489822387695, "global_step": 65952, "epoch": 1570} {"train_loss": -5.850590705871582, "global_step": 65953, "epoch": 1570} {"train_loss": -5.980384826660156, "global_step": 65954, "epoch": 1570} {"train_loss": -5.807108402252197, "global_step": 65955, "epoch": 1570} {"train_loss": -5.957324028015137, "global_step": 65956, "epoch": 1570} {"train_loss": -5.830723762512207, "global_step": 65957, "epoch": 1570} {"train_loss": -5.9774651527404785, "global_step": 65958, "epoch": 1570} {"train_loss": -5.952523231506348, "global_step": 65959, "epoch": 1570} {"train_loss": -5.911380767822266, "global_step": 65960, "epoch": 1570} {"train_loss": -5.9076128005981445, "global_step": 65961, "epoch": 1570} {"train_loss": -5.919522285461426, "global_step": 65962, "epoch": 1570} {"train_loss": -5.846510887145996, "global_step": 65963, "epoch": 1570} {"train_loss": -6.000655174255371, "global_step": 65964, "epoch": 1570} {"train_loss": -6.100978851318359, "global_step": 65965, "epoch": 1570} {"train_loss": -6.009971618652344, "global_step": 65966, "epoch": 1570} {"train_loss": -5.918143272399902, "global_step": 65967, "epoch": 1570} {"train_loss": -5.973643779754639, "global_step": 65968, "epoch": 1570} {"train_loss": -5.957085132598877, "global_step": 65969, "epoch": 1570} {"train_loss": -5.966412544250488, "global_step": 65970, "epoch": 1570} {"train_loss": -5.990426063537598, "global_step": 65971, "epoch": 1570} {"train_loss": -5.999401092529297, "global_step": 65972, "epoch": 1570} {"train_loss": -5.916658401489258, "global_step": 65973, "epoch": 1570} {"train_loss": -6.0568437576293945, "global_step": 65974, "epoch": 1570} {"train_loss": -6.057899475097656, "global_step": 65975, "epoch": 1570} {"train_loss": -6.087545394897461, "global_step": 65976, "epoch": 1570} {"train_loss": -5.970755100250244, "global_step": 65977, "epoch": 1570} {"train_loss": -6.00081729888916, "global_step": 65978, "epoch": 1570} {"train_loss": -5.952264308929443, "global_step": 65979, "epoch": 1570} {"train_loss": -5.995409965515137, "global_step": 65980, "epoch": 1570} {"train_loss": -5.945143336341495, "global_step": 65981, "epoch": 1570, "val_loss": 61363.265625} {"train_loss": -5.944291114807129, "global_step": 65982, "epoch": 1571} {"train_loss": -6.00899600982666, "global_step": 65983, "epoch": 1571} {"train_loss": -5.915185928344727, "global_step": 65984, "epoch": 1571} {"train_loss": -6.0349555015563965, "global_step": 65985, "epoch": 1571} {"train_loss": -6.110857963562012, "global_step": 65986, "epoch": 1571} {"train_loss": -6.070005416870117, "global_step": 65987, "epoch": 1571} {"train_loss": -6.016485691070557, "global_step": 65988, "epoch": 1571} {"train_loss": -5.979860305786133, "global_step": 65989, "epoch": 1571} {"train_loss": -6.062283515930176, "global_step": 65990, "epoch": 1571} {"train_loss": -6.01832914352417, "global_step": 65991, "epoch": 1571} {"train_loss": -5.831058025360107, "global_step": 65992, "epoch": 1571} {"train_loss": -6.066481590270996, "global_step": 65993, "epoch": 1571} {"train_loss": -6.062397003173828, "global_step": 65994, "epoch": 1571} {"train_loss": -6.030484676361084, "global_step": 65995, "epoch": 1571} {"train_loss": -5.988846302032471, "global_step": 65996, "epoch": 1571} {"train_loss": -5.956319808959961, "global_step": 65997, "epoch": 1571} {"train_loss": -6.066061973571777, "global_step": 65998, "epoch": 1571} {"train_loss": -5.990011215209961, "global_step": 65999, "epoch": 1571} {"train_loss": -6.033461570739746, "global_step": 66000, "epoch": 1571} {"train_loss": -5.9471940994262695, "global_step": 66001, "epoch": 1571} {"train_loss": -5.92501163482666, "global_step": 66002, "epoch": 1571} {"train_loss": -6.122008323669434, "global_step": 66003, "epoch": 1571} {"train_loss": -5.83322811126709, "global_step": 66004, "epoch": 1571} {"train_loss": -5.991970062255859, "global_step": 66005, "epoch": 1571} {"train_loss": -5.994277000427246, "global_step": 66006, "epoch": 1571} {"train_loss": -6.057161808013916, "global_step": 66007, "epoch": 1571} {"train_loss": -5.946206092834473, "global_step": 66008, "epoch": 1571} {"train_loss": -6.055113792419434, "global_step": 66009, "epoch": 1571} {"train_loss": -5.895493507385254, "global_step": 66010, "epoch": 1571} {"train_loss": -6.090015411376953, "global_step": 66011, "epoch": 1571} {"train_loss": -5.956426620483398, "global_step": 66012, "epoch": 1571} {"train_loss": -5.9407243728637695, "global_step": 66013, "epoch": 1571} {"train_loss": -5.981348037719727, "global_step": 66014, "epoch": 1571} {"train_loss": -5.946699142456055, "global_step": 66015, "epoch": 1571} {"train_loss": -6.027980804443359, "global_step": 66016, "epoch": 1571} {"train_loss": -5.869452476501465, "global_step": 66017, "epoch": 1571} {"train_loss": -5.857476234436035, "global_step": 66018, "epoch": 1571} {"train_loss": -5.993265151977539, "global_step": 66019, "epoch": 1571} {"train_loss": -5.88493013381958, "global_step": 66020, "epoch": 1571} {"train_loss": -6.008082866668701, "global_step": 66021, "epoch": 1571} {"train_loss": -6.049142360687256, "global_step": 66022, "epoch": 1571} {"train_loss": -5.987749360856556, "global_step": 66023, "epoch": 1571, "val_loss": 61546.203125} {"train_loss": -5.994503021240234, "global_step": 66024, "epoch": 1572} {"train_loss": -5.917453765869141, "global_step": 66025, "epoch": 1572} {"train_loss": -6.030904769897461, "global_step": 66026, "epoch": 1572} {"train_loss": -6.038789749145508, "global_step": 66027, "epoch": 1572} {"train_loss": -5.930733680725098, "global_step": 66028, "epoch": 1572} {"train_loss": -6.038355827331543, "global_step": 66029, "epoch": 1572} {"train_loss": -6.057443141937256, "global_step": 66030, "epoch": 1572} {"train_loss": -6.047260284423828, "global_step": 66031, "epoch": 1572} {"train_loss": -5.906383514404297, "global_step": 66032, "epoch": 1572} {"train_loss": -5.94140625, "global_step": 66033, "epoch": 1572} {"train_loss": -5.958295822143555, "global_step": 66034, "epoch": 1572} {"train_loss": -5.885224342346191, "global_step": 66035, "epoch": 1572} {"train_loss": -5.94895076751709, "global_step": 66036, "epoch": 1572} {"train_loss": -5.928827285766602, "global_step": 66037, "epoch": 1572} {"train_loss": -6.020231246948242, "global_step": 66038, "epoch": 1572} {"train_loss": -5.991203308105469, "global_step": 66039, "epoch": 1572} {"train_loss": -6.042934417724609, "global_step": 66040, "epoch": 1572} {"train_loss": -5.9506144523620605, "global_step": 66041, "epoch": 1572} {"train_loss": -5.960455417633057, "global_step": 66042, "epoch": 1572} {"train_loss": -5.98581075668335, "global_step": 66043, "epoch": 1572} {"train_loss": -5.897064208984375, "global_step": 66044, "epoch": 1572} {"train_loss": -6.033930778503418, "global_step": 66045, "epoch": 1572} {"train_loss": -5.856308937072754, "global_step": 66046, "epoch": 1572} {"train_loss": -6.036063194274902, "global_step": 66047, "epoch": 1572} {"train_loss": -5.996800422668457, "global_step": 66048, "epoch": 1572} {"train_loss": -6.004047870635986, "global_step": 66049, "epoch": 1572} {"train_loss": -5.99116325378418, "global_step": 66050, "epoch": 1572} {"train_loss": -5.9843950271606445, "global_step": 66051, "epoch": 1572} {"train_loss": -5.923000812530518, "global_step": 66052, "epoch": 1572} {"train_loss": -6.009757995605469, "global_step": 66053, "epoch": 1572} {"train_loss": -6.0122270584106445, "global_step": 66054, "epoch": 1572} {"train_loss": -5.86434268951416, "global_step": 66055, "epoch": 1572} {"train_loss": -5.8869218826293945, "global_step": 66056, "epoch": 1572} {"train_loss": -5.867212295532227, "global_step": 66057, "epoch": 1572} {"train_loss": -5.907840251922607, "global_step": 66058, "epoch": 1572} {"train_loss": -5.985433578491211, "global_step": 66059, "epoch": 1572} {"train_loss": -5.932958126068115, "global_step": 66060, "epoch": 1572} {"train_loss": -5.9800872802734375, "global_step": 66061, "epoch": 1572} {"train_loss": -5.977138519287109, "global_step": 66062, "epoch": 1572} {"train_loss": -5.862802982330322, "global_step": 66063, "epoch": 1572} {"train_loss": -5.965825080871582, "global_step": 66064, "epoch": 1572} {"train_loss": -5.966031846545992, "global_step": 66065, "epoch": 1572, "val_loss": 61671.17578125} {"train_loss": -5.891745567321777, "global_step": 66066, "epoch": 1573} {"train_loss": -6.070739269256592, "global_step": 66067, "epoch": 1573} {"train_loss": -5.961353302001953, "global_step": 66068, "epoch": 1573} {"train_loss": -5.975234508514404, "global_step": 66069, "epoch": 1573} {"train_loss": -5.928234100341797, "global_step": 66070, "epoch": 1573} {"train_loss": -5.858066558837891, "global_step": 66071, "epoch": 1573} {"train_loss": -6.017162322998047, "global_step": 66072, "epoch": 1573} {"train_loss": -5.922239303588867, "global_step": 66073, "epoch": 1573} {"train_loss": -5.966990947723389, "global_step": 66074, "epoch": 1573} {"train_loss": -6.093020915985107, "global_step": 66075, "epoch": 1573} {"train_loss": -5.884525775909424, "global_step": 66076, "epoch": 1573} {"train_loss": -5.990317344665527, "global_step": 66077, "epoch": 1573} {"train_loss": -5.990449905395508, "global_step": 66078, "epoch": 1573} {"train_loss": -5.850546836853027, "global_step": 66079, "epoch": 1573} {"train_loss": -6.054018020629883, "global_step": 66080, "epoch": 1573} {"train_loss": -6.030240535736084, "global_step": 66081, "epoch": 1573} {"train_loss": -6.035198211669922, "global_step": 66082, "epoch": 1573} {"train_loss": -6.020389080047607, "global_step": 66083, "epoch": 1573} {"train_loss": -5.921738624572754, "global_step": 66084, "epoch": 1573} {"train_loss": -5.903672218322754, "global_step": 66085, "epoch": 1573} {"train_loss": -6.012742042541504, "global_step": 66086, "epoch": 1573} {"train_loss": -6.042026042938232, "global_step": 66087, "epoch": 1573} {"train_loss": -5.951505184173584, "global_step": 66088, "epoch": 1573} {"train_loss": -5.908902645111084, "global_step": 66089, "epoch": 1573} {"train_loss": -5.978071689605713, "global_step": 66090, "epoch": 1573} {"train_loss": -5.9265241622924805, "global_step": 66091, "epoch": 1573} {"train_loss": -6.004809379577637, "global_step": 66092, "epoch": 1573} {"train_loss": -6.037081718444824, "global_step": 66093, "epoch": 1573} {"train_loss": -6.051966667175293, "global_step": 66094, "epoch": 1573} {"train_loss": -6.094338417053223, "global_step": 66095, "epoch": 1573} {"train_loss": -6.051897048950195, "global_step": 66096, "epoch": 1573} {"train_loss": -6.100081443786621, "global_step": 66097, "epoch": 1573} {"train_loss": -6.00913143157959, "global_step": 66098, "epoch": 1573} {"train_loss": -6.033840656280518, "global_step": 66099, "epoch": 1573} {"train_loss": -6.080689430236816, "global_step": 66100, "epoch": 1573} {"train_loss": -6.084624767303467, "global_step": 66101, "epoch": 1573} {"train_loss": -6.038439750671387, "global_step": 66102, "epoch": 1573} {"train_loss": -6.00908899307251, "global_step": 66103, "epoch": 1573} {"train_loss": -5.969235897064209, "global_step": 66104, "epoch": 1573} {"train_loss": -5.960382461547852, "global_step": 66105, "epoch": 1573} {"train_loss": -6.041015625, "global_step": 66106, "epoch": 1573} {"train_loss": -5.996871017274403, "global_step": 66107, "epoch": 1573, "val_loss": 61553.9453125} {"train_loss": -6.04655647277832, "global_step": 66108, "epoch": 1574} {"train_loss": -6.155400276184082, "global_step": 66109, "epoch": 1574} {"train_loss": -6.0338640213012695, "global_step": 66110, "epoch": 1574} {"train_loss": -6.124985694885254, "global_step": 66111, "epoch": 1574} {"train_loss": -6.100793838500977, "global_step": 66112, "epoch": 1574} {"train_loss": -6.016887664794922, "global_step": 66113, "epoch": 1574} {"train_loss": -6.006124496459961, "global_step": 66114, "epoch": 1574} {"train_loss": -6.029600143432617, "global_step": 66115, "epoch": 1574} {"train_loss": -6.066499710083008, "global_step": 66116, "epoch": 1574} {"train_loss": -6.008258819580078, "global_step": 66117, "epoch": 1574} {"train_loss": -5.939872741699219, "global_step": 66118, "epoch": 1574} {"train_loss": -5.985910415649414, "global_step": 66119, "epoch": 1574} {"train_loss": -5.972984313964844, "global_step": 66120, "epoch": 1574} {"train_loss": -5.924948692321777, "global_step": 66121, "epoch": 1574} {"train_loss": -6.005018711090088, "global_step": 66122, "epoch": 1574} {"train_loss": -6.129575729370117, "global_step": 66123, "epoch": 1574} {"train_loss": -6.125576972961426, "global_step": 66124, "epoch": 1574} {"train_loss": -6.064743995666504, "global_step": 66125, "epoch": 1574} {"train_loss": -6.098589897155762, "global_step": 66126, "epoch": 1574} {"train_loss": -6.036462783813477, "global_step": 66127, "epoch": 1574} {"train_loss": -5.939312934875488, "global_step": 66128, "epoch": 1574} {"train_loss": -5.976770877838135, "global_step": 66129, "epoch": 1574} {"train_loss": -5.905369758605957, "global_step": 66130, "epoch": 1574} {"train_loss": -6.001833915710449, "global_step": 66131, "epoch": 1574} {"train_loss": -6.036270618438721, "global_step": 66132, "epoch": 1574} {"train_loss": -5.98563289642334, "global_step": 66133, "epoch": 1574} {"train_loss": -5.881505966186523, "global_step": 66134, "epoch": 1574} {"train_loss": -5.979260444641113, "global_step": 66135, "epoch": 1574} {"train_loss": -6.019406795501709, "global_step": 66136, "epoch": 1574} {"train_loss": -5.92266845703125, "global_step": 66137, "epoch": 1574} {"train_loss": -5.991114616394043, "global_step": 66138, "epoch": 1574} {"train_loss": -6.048168182373047, "global_step": 66139, "epoch": 1574} {"train_loss": -5.925470352172852, "global_step": 66140, "epoch": 1574} {"train_loss": -6.024694442749023, "global_step": 66141, "epoch": 1574} {"train_loss": -5.955415725708008, "global_step": 66142, "epoch": 1574} {"train_loss": -5.935805797576904, "global_step": 66143, "epoch": 1574} {"train_loss": -6.036714553833008, "global_step": 66144, "epoch": 1574} {"train_loss": -6.049635887145996, "global_step": 66145, "epoch": 1574} {"train_loss": -5.864018440246582, "global_step": 66146, "epoch": 1574} {"train_loss": -5.912652015686035, "global_step": 66147, "epoch": 1574} {"train_loss": -5.925731658935547, "global_step": 66148, "epoch": 1574} {"train_loss": -6.005500452859061, "global_step": 66149, "epoch": 1574, "val_loss": 61391.41015625} {"train_loss": -6.007180213928223, "global_step": 66150, "epoch": 1575} {"train_loss": -6.012862205505371, "global_step": 66151, "epoch": 1575} {"train_loss": -5.887913703918457, "global_step": 66152, "epoch": 1575} {"train_loss": -6.051592826843262, "global_step": 66153, "epoch": 1575} {"train_loss": -5.884169578552246, "global_step": 66154, "epoch": 1575} {"train_loss": -5.958494186401367, "global_step": 66155, "epoch": 1575} {"train_loss": -5.902945518493652, "global_step": 66156, "epoch": 1575} {"train_loss": -5.911192417144775, "global_step": 66157, "epoch": 1575} {"train_loss": -5.96848201751709, "global_step": 66158, "epoch": 1575} {"train_loss": -5.963695526123047, "global_step": 66159, "epoch": 1575} {"train_loss": -5.923167705535889, "global_step": 66160, "epoch": 1575} {"train_loss": -5.898937225341797, "global_step": 66161, "epoch": 1575} {"train_loss": -6.027495384216309, "global_step": 66162, "epoch": 1575} {"train_loss": -5.9347381591796875, "global_step": 66163, "epoch": 1575} {"train_loss": -6.049760341644287, "global_step": 66164, "epoch": 1575} {"train_loss": -5.862891674041748, "global_step": 66165, "epoch": 1575} {"train_loss": -6.02885103225708, "global_step": 66166, "epoch": 1575} {"train_loss": -5.927013397216797, "global_step": 66167, "epoch": 1575} {"train_loss": -6.002542495727539, "global_step": 66168, "epoch": 1575} {"train_loss": -5.866083145141602, "global_step": 66169, "epoch": 1575} {"train_loss": -5.986599922180176, "global_step": 66170, "epoch": 1575} {"train_loss": -5.950562000274658, "global_step": 66171, "epoch": 1575} {"train_loss": -5.8607258796691895, "global_step": 66172, "epoch": 1575} {"train_loss": -5.983425617218018, "global_step": 66173, "epoch": 1575} {"train_loss": -5.9530839920043945, "global_step": 66174, "epoch": 1575} {"train_loss": -5.904560089111328, "global_step": 66175, "epoch": 1575} {"train_loss": -6.025027275085449, "global_step": 66176, "epoch": 1575} {"train_loss": -5.823619842529297, "global_step": 66177, "epoch": 1575} {"train_loss": -5.9158244132995605, "global_step": 66178, "epoch": 1575} {"train_loss": -6.119542121887207, "global_step": 66179, "epoch": 1575} {"train_loss": -5.850224018096924, "global_step": 66180, "epoch": 1575} {"train_loss": -6.06917667388916, "global_step": 66181, "epoch": 1575} {"train_loss": -5.962059020996094, "global_step": 66182, "epoch": 1575} {"train_loss": -5.993775844573975, "global_step": 66183, "epoch": 1575} {"train_loss": -5.913122177124023, "global_step": 66184, "epoch": 1575} {"train_loss": -5.983466625213623, "global_step": 66185, "epoch": 1575} {"train_loss": -5.996881484985352, "global_step": 66186, "epoch": 1575} {"train_loss": -5.931053161621094, "global_step": 66187, "epoch": 1575} {"train_loss": -6.059037208557129, "global_step": 66188, "epoch": 1575} {"train_loss": -5.88347053527832, "global_step": 66189, "epoch": 1575} {"train_loss": -6.009986400604248, "global_step": 66190, "epoch": 1575} {"train_loss": -5.956757238933018, "global_step": 66191, "epoch": 1575, "val_loss": 61450.0} {"train_loss": -5.979160308837891, "global_step": 66192, "epoch": 1576} {"train_loss": -6.150565147399902, "global_step": 66193, "epoch": 1576} {"train_loss": -6.0086283683776855, "global_step": 66194, "epoch": 1576} {"train_loss": -5.978246688842773, "global_step": 66195, "epoch": 1576} {"train_loss": -6.02223014831543, "global_step": 66196, "epoch": 1576} {"train_loss": -5.909178733825684, "global_step": 66197, "epoch": 1576} {"train_loss": -5.880866050720215, "global_step": 66198, "epoch": 1576} {"train_loss": -5.82070779800415, "global_step": 66199, "epoch": 1576} {"train_loss": -6.077197074890137, "global_step": 66200, "epoch": 1576} {"train_loss": -6.085243225097656, "global_step": 66201, "epoch": 1576} {"train_loss": -6.102212905883789, "global_step": 66202, "epoch": 1576} {"train_loss": -5.98063850402832, "global_step": 66203, "epoch": 1576} {"train_loss": -6.029402732849121, "global_step": 66204, "epoch": 1576} {"train_loss": -5.997553825378418, "global_step": 66205, "epoch": 1576} {"train_loss": -6.0048956871032715, "global_step": 66206, "epoch": 1576} {"train_loss": -6.023184776306152, "global_step": 66207, "epoch": 1576} {"train_loss": -6.030074596405029, "global_step": 66208, "epoch": 1576} {"train_loss": -6.151385307312012, "global_step": 66209, "epoch": 1576} {"train_loss": -5.9757537841796875, "global_step": 66210, "epoch": 1576} {"train_loss": -6.005953311920166, "global_step": 66211, "epoch": 1576} {"train_loss": -6.035086631774902, "global_step": 66212, "epoch": 1576} {"train_loss": -5.932977676391602, "global_step": 66213, "epoch": 1576} {"train_loss": -5.942720413208008, "global_step": 66214, "epoch": 1576} {"train_loss": -5.976654052734375, "global_step": 66215, "epoch": 1576} {"train_loss": -6.077930927276611, "global_step": 66216, "epoch": 1576} {"train_loss": -6.043928623199463, "global_step": 66217, "epoch": 1576} {"train_loss": -6.084073066711426, "global_step": 66218, "epoch": 1576} {"train_loss": -5.958050727844238, "global_step": 66219, "epoch": 1576} {"train_loss": -6.043091773986816, "global_step": 66220, "epoch": 1576} {"train_loss": -5.967067241668701, "global_step": 66221, "epoch": 1576} {"train_loss": -6.061624526977539, "global_step": 66222, "epoch": 1576} {"train_loss": -6.075011730194092, "global_step": 66223, "epoch": 1576} {"train_loss": -5.985653877258301, "global_step": 66224, "epoch": 1576} {"train_loss": -6.041662216186523, "global_step": 66225, "epoch": 1576} {"train_loss": -5.891035079956055, "global_step": 66226, "epoch": 1576} {"train_loss": -6.016676902770996, "global_step": 66227, "epoch": 1576} {"train_loss": -5.940384864807129, "global_step": 66228, "epoch": 1576} {"train_loss": -5.892187118530273, "global_step": 66229, "epoch": 1576} {"train_loss": -5.913463115692139, "global_step": 66230, "epoch": 1576} {"train_loss": -5.96565055847168, "global_step": 66231, "epoch": 1576} {"train_loss": -5.879471778869629, "global_step": 66232, "epoch": 1576} {"train_loss": -5.9962918644859675, "global_step": 66233, "epoch": 1576, "val_loss": 61344.9140625} {"train_loss": -6.084962844848633, "global_step": 66234, "epoch": 1577} {"train_loss": -5.928076267242432, "global_step": 66235, "epoch": 1577} {"train_loss": -5.971678733825684, "global_step": 66236, "epoch": 1577} {"train_loss": -6.011102676391602, "global_step": 66237, "epoch": 1577} {"train_loss": -6.087555885314941, "global_step": 66238, "epoch": 1577} {"train_loss": -5.949069976806641, "global_step": 66239, "epoch": 1577} {"train_loss": -6.006663799285889, "global_step": 66240, "epoch": 1577} {"train_loss": -5.943039417266846, "global_step": 66241, "epoch": 1577} {"train_loss": -5.931766033172607, "global_step": 66242, "epoch": 1577} {"train_loss": -5.936043739318848, "global_step": 66243, "epoch": 1577} {"train_loss": -5.908977031707764, "global_step": 66244, "epoch": 1577} {"train_loss": -5.932683944702148, "global_step": 66245, "epoch": 1577} {"train_loss": -5.887664794921875, "global_step": 66246, "epoch": 1577} {"train_loss": -5.951320171356201, "global_step": 66247, "epoch": 1577} {"train_loss": -5.921625137329102, "global_step": 66248, "epoch": 1577} {"train_loss": -5.805434226989746, "global_step": 66249, "epoch": 1577} {"train_loss": -5.985339641571045, "global_step": 66250, "epoch": 1577} {"train_loss": -5.912182331085205, "global_step": 66251, "epoch": 1577} {"train_loss": -5.96705436706543, "global_step": 66252, "epoch": 1577} {"train_loss": -5.982637405395508, "global_step": 66253, "epoch": 1577} {"train_loss": -6.011517524719238, "global_step": 66254, "epoch": 1577} {"train_loss": -5.920448303222656, "global_step": 66255, "epoch": 1577} {"train_loss": -5.890487194061279, "global_step": 66256, "epoch": 1577} {"train_loss": -5.988534927368164, "global_step": 66257, "epoch": 1577} {"train_loss": -5.9428606033325195, "global_step": 66258, "epoch": 1577} {"train_loss": -6.005692958831787, "global_step": 66259, "epoch": 1577} {"train_loss": -5.897436141967773, "global_step": 66260, "epoch": 1577} {"train_loss": -5.93173360824585, "global_step": 66261, "epoch": 1577} {"train_loss": -5.936596393585205, "global_step": 66262, "epoch": 1577} {"train_loss": -6.035008430480957, "global_step": 66263, "epoch": 1577} {"train_loss": -5.868906497955322, "global_step": 66264, "epoch": 1577} {"train_loss": -5.929977893829346, "global_step": 66265, "epoch": 1577} {"train_loss": -5.982911109924316, "global_step": 66266, "epoch": 1577} {"train_loss": -5.926314830780029, "global_step": 66267, "epoch": 1577} {"train_loss": -5.9980316162109375, "global_step": 66268, "epoch": 1577} {"train_loss": -5.967336177825928, "global_step": 66269, "epoch": 1577} {"train_loss": -6.064004898071289, "global_step": 66270, "epoch": 1577} {"train_loss": -6.09665584564209, "global_step": 66271, "epoch": 1577} {"train_loss": -6.065786838531494, "global_step": 66272, "epoch": 1577} {"train_loss": -6.015583038330078, "global_step": 66273, "epoch": 1577} {"train_loss": -5.889065742492676, "global_step": 66274, "epoch": 1577} {"train_loss": -5.962478035972232, "global_step": 66275, "epoch": 1577, "val_loss": 61673.34375} {"train_loss": -6.023792266845703, "global_step": 66276, "epoch": 1578} {"train_loss": -6.060194969177246, "global_step": 66277, "epoch": 1578} {"train_loss": -5.953329086303711, "global_step": 66278, "epoch": 1578} {"train_loss": -5.988844394683838, "global_step": 66279, "epoch": 1578} {"train_loss": -6.0527119636535645, "global_step": 66280, "epoch": 1578} {"train_loss": -6.013489723205566, "global_step": 66281, "epoch": 1578} {"train_loss": -5.9490814208984375, "global_step": 66282, "epoch": 1578} {"train_loss": -5.9627580642700195, "global_step": 66283, "epoch": 1578} {"train_loss": -5.951719284057617, "global_step": 66284, "epoch": 1578} {"train_loss": -6.033272743225098, "global_step": 66285, "epoch": 1578} {"train_loss": -5.985910892486572, "global_step": 66286, "epoch": 1578} {"train_loss": -5.909918785095215, "global_step": 66287, "epoch": 1578} {"train_loss": -6.038966178894043, "global_step": 66288, "epoch": 1578} {"train_loss": -5.9366455078125, "global_step": 66289, "epoch": 1578} {"train_loss": -6.02137565612793, "global_step": 66290, "epoch": 1578} {"train_loss": -5.885693550109863, "global_step": 66291, "epoch": 1578} {"train_loss": -6.01644229888916, "global_step": 66292, "epoch": 1578} {"train_loss": -5.886383533477783, "global_step": 66293, "epoch": 1578} {"train_loss": -5.937100410461426, "global_step": 66294, "epoch": 1578} {"train_loss": -6.048091888427734, "global_step": 66295, "epoch": 1578} {"train_loss": -6.000340461730957, "global_step": 66296, "epoch": 1578} {"train_loss": -5.954360485076904, "global_step": 66297, "epoch": 1578} {"train_loss": -5.963822841644287, "global_step": 66298, "epoch": 1578} {"train_loss": -5.959442615509033, "global_step": 66299, "epoch": 1578} {"train_loss": -5.960292339324951, "global_step": 66300, "epoch": 1578} {"train_loss": -5.9013471603393555, "global_step": 66301, "epoch": 1578} {"train_loss": -5.988926887512207, "global_step": 66302, "epoch": 1578} {"train_loss": -5.732108116149902, "global_step": 66303, "epoch": 1578} {"train_loss": -5.819644451141357, "global_step": 66304, "epoch": 1578} {"train_loss": -5.859832763671875, "global_step": 66305, "epoch": 1578} {"train_loss": -5.879317760467529, "global_step": 66306, "epoch": 1578} {"train_loss": -5.843378067016602, "global_step": 66307, "epoch": 1578} {"train_loss": -5.849837303161621, "global_step": 66308, "epoch": 1578} {"train_loss": -5.930083274841309, "global_step": 66309, "epoch": 1578} {"train_loss": -5.990726470947266, "global_step": 66310, "epoch": 1578} {"train_loss": -5.928265571594238, "global_step": 66311, "epoch": 1578} {"train_loss": -5.959009170532227, "global_step": 66312, "epoch": 1578} {"train_loss": -5.936582088470459, "global_step": 66313, "epoch": 1578} {"train_loss": -5.9742584228515625, "global_step": 66314, "epoch": 1578} {"train_loss": -5.967895984649658, "global_step": 66315, "epoch": 1578} {"train_loss": -5.834202289581299, "global_step": 66316, "epoch": 1578} {"train_loss": -5.947283994583857, "global_step": 66317, "epoch": 1578, "val_loss": 61737.87109375} {"train_loss": -5.890535354614258, "global_step": 66318, "epoch": 1579} {"train_loss": -5.871790885925293, "global_step": 66319, "epoch": 1579} {"train_loss": -5.909924030303955, "global_step": 66320, "epoch": 1579} {"train_loss": -6.096182346343994, "global_step": 66321, "epoch": 1579} {"train_loss": -5.914035797119141, "global_step": 66322, "epoch": 1579} {"train_loss": -6.04874849319458, "global_step": 66323, "epoch": 1579} {"train_loss": -6.0483717918396, "global_step": 66324, "epoch": 1579} {"train_loss": -5.706168174743652, "global_step": 66325, "epoch": 1579} {"train_loss": -5.9925055503845215, "global_step": 66326, "epoch": 1579} {"train_loss": -5.918704986572266, "global_step": 66327, "epoch": 1579} {"train_loss": -5.91526460647583, "global_step": 66328, "epoch": 1579} {"train_loss": -6.010275363922119, "global_step": 66329, "epoch": 1579} {"train_loss": -5.965126991271973, "global_step": 66330, "epoch": 1579} {"train_loss": -5.984169960021973, "global_step": 66331, "epoch": 1579} {"train_loss": -6.102354526519775, "global_step": 66332, "epoch": 1579} {"train_loss": -5.997551918029785, "global_step": 66333, "epoch": 1579} {"train_loss": -6.052669525146484, "global_step": 66334, "epoch": 1579} {"train_loss": -5.9231977462768555, "global_step": 66335, "epoch": 1579} {"train_loss": -5.940465450286865, "global_step": 66336, "epoch": 1579} {"train_loss": -6.03082275390625, "global_step": 66337, "epoch": 1579} {"train_loss": -5.955722808837891, "global_step": 66338, "epoch": 1579} {"train_loss": -5.932140350341797, "global_step": 66339, "epoch": 1579} {"train_loss": -5.929969310760498, "global_step": 66340, "epoch": 1579} {"train_loss": -5.978024482727051, "global_step": 66341, "epoch": 1579} {"train_loss": -5.974248886108398, "global_step": 66342, "epoch": 1579} {"train_loss": -5.838301658630371, "global_step": 66343, "epoch": 1579} {"train_loss": -6.023252487182617, "global_step": 66344, "epoch": 1579} {"train_loss": -6.0401434898376465, "global_step": 66345, "epoch": 1579} {"train_loss": -5.9133100509643555, "global_step": 66346, "epoch": 1579} {"train_loss": -6.031914710998535, "global_step": 66347, "epoch": 1579} {"train_loss": -5.987469673156738, "global_step": 66348, "epoch": 1579} {"train_loss": -6.09418249130249, "global_step": 66349, "epoch": 1579} {"train_loss": -6.047621726989746, "global_step": 66350, "epoch": 1579} {"train_loss": -6.037343978881836, "global_step": 66351, "epoch": 1579} {"train_loss": -6.060798645019531, "global_step": 66352, "epoch": 1579} {"train_loss": -6.007104396820068, "global_step": 66353, "epoch": 1579} {"train_loss": -6.04893159866333, "global_step": 66354, "epoch": 1579} {"train_loss": -5.896554946899414, "global_step": 66355, "epoch": 1579} {"train_loss": -6.043367862701416, "global_step": 66356, "epoch": 1579} {"train_loss": -6.039515495300293, "global_step": 66357, "epoch": 1579} {"train_loss": -6.0638227462768555, "global_step": 66358, "epoch": 1579} {"train_loss": -5.9803927058265325, "global_step": 66359, "epoch": 1579, "val_loss": 61350.7265625} {"train_loss": -6.001246452331543, "global_step": 66360, "epoch": 1580} {"train_loss": -6.052466869354248, "global_step": 66361, "epoch": 1580} {"train_loss": -5.975759029388428, "global_step": 66362, "epoch": 1580} {"train_loss": -5.997159481048584, "global_step": 66363, "epoch": 1580} {"train_loss": -5.997910022735596, "global_step": 66364, "epoch": 1580} {"train_loss": -5.972311973571777, "global_step": 66365, "epoch": 1580} {"train_loss": -6.052192211151123, "global_step": 66366, "epoch": 1580} {"train_loss": -6.017575263977051, "global_step": 66367, "epoch": 1580} {"train_loss": -5.857036113739014, "global_step": 66368, "epoch": 1580} {"train_loss": -5.96446418762207, "global_step": 66369, "epoch": 1580} {"train_loss": -6.020456790924072, "global_step": 66370, "epoch": 1580} {"train_loss": -5.867504119873047, "global_step": 66371, "epoch": 1580} {"train_loss": -5.939553260803223, "global_step": 66372, "epoch": 1580} {"train_loss": -6.022439002990723, "global_step": 66373, "epoch": 1580} {"train_loss": -5.948939800262451, "global_step": 66374, "epoch": 1580} {"train_loss": -5.958488941192627, "global_step": 66375, "epoch": 1580} {"train_loss": -6.00453519821167, "global_step": 66376, "epoch": 1580} {"train_loss": -5.941318035125732, "global_step": 66377, "epoch": 1580} {"train_loss": -5.9829511642456055, "global_step": 66378, "epoch": 1580} {"train_loss": -5.94088077545166, "global_step": 66379, "epoch": 1580} {"train_loss": -6.002622604370117, "global_step": 66380, "epoch": 1580} {"train_loss": -5.918209075927734, "global_step": 66381, "epoch": 1580} {"train_loss": -5.9568400382995605, "global_step": 66382, "epoch": 1580} {"train_loss": -6.027710914611816, "global_step": 66383, "epoch": 1580} {"train_loss": -5.975170612335205, "global_step": 66384, "epoch": 1580} {"train_loss": -6.082701683044434, "global_step": 66385, "epoch": 1580} {"train_loss": -5.903133392333984, "global_step": 66386, "epoch": 1580} {"train_loss": -5.884929656982422, "global_step": 66387, "epoch": 1580} {"train_loss": -5.990021705627441, "global_step": 66388, "epoch": 1580} {"train_loss": -5.982338905334473, "global_step": 66389, "epoch": 1580} {"train_loss": -6.089578151702881, "global_step": 66390, "epoch": 1580} {"train_loss": -5.983624458312988, "global_step": 66391, "epoch": 1580} {"train_loss": -5.960562705993652, "global_step": 66392, "epoch": 1580} {"train_loss": -6.054301738739014, "global_step": 66393, "epoch": 1580} {"train_loss": -5.9186248779296875, "global_step": 66394, "epoch": 1580} {"train_loss": -5.9441070556640625, "global_step": 66395, "epoch": 1580} {"train_loss": -6.0377912521362305, "global_step": 66396, "epoch": 1580} {"train_loss": -6.0426764488220215, "global_step": 66397, "epoch": 1580} {"train_loss": -6.051197052001953, "global_step": 66398, "epoch": 1580} {"train_loss": -5.9465484619140625, "global_step": 66399, "epoch": 1580} {"train_loss": -5.943336486816406, "global_step": 66400, "epoch": 1580} {"train_loss": -5.982859645571027, "global_step": 66401, "epoch": 1580, "val_loss": 61503.24609375} {"train_loss": -5.983380317687988, "global_step": 66402, "epoch": 1581} {"train_loss": -5.923133850097656, "global_step": 66403, "epoch": 1581} {"train_loss": -6.056254863739014, "global_step": 66404, "epoch": 1581} {"train_loss": -5.910398483276367, "global_step": 66405, "epoch": 1581} {"train_loss": -5.924650192260742, "global_step": 66406, "epoch": 1581} {"train_loss": -5.9927263259887695, "global_step": 66407, "epoch": 1581} {"train_loss": -5.97496223449707, "global_step": 66408, "epoch": 1581} {"train_loss": -6.0995330810546875, "global_step": 66409, "epoch": 1581} {"train_loss": -5.957618236541748, "global_step": 66410, "epoch": 1581} {"train_loss": -5.932676315307617, "global_step": 66411, "epoch": 1581} {"train_loss": -6.0738677978515625, "global_step": 66412, "epoch": 1581} {"train_loss": -6.034735679626465, "global_step": 66413, "epoch": 1581} {"train_loss": -6.008800029754639, "global_step": 66414, "epoch": 1581} {"train_loss": -6.053140163421631, "global_step": 66415, "epoch": 1581} {"train_loss": -6.012314796447754, "global_step": 66416, "epoch": 1581} {"train_loss": -5.950217247009277, "global_step": 66417, "epoch": 1581} {"train_loss": -6.0036773681640625, "global_step": 66418, "epoch": 1581} {"train_loss": -6.1235198974609375, "global_step": 66419, "epoch": 1581} {"train_loss": -6.0615763664245605, "global_step": 66420, "epoch": 1581} {"train_loss": -6.059140682220459, "global_step": 66421, "epoch": 1581} {"train_loss": -6.1837873458862305, "global_step": 66422, "epoch": 1581} {"train_loss": -5.928576469421387, "global_step": 66423, "epoch": 1581} {"train_loss": -6.043354511260986, "global_step": 66424, "epoch": 1581} {"train_loss": -6.016005516052246, "global_step": 66425, "epoch": 1581} {"train_loss": -5.84464168548584, "global_step": 66426, "epoch": 1581} {"train_loss": -5.886728286743164, "global_step": 66427, "epoch": 1581} {"train_loss": -5.953584671020508, "global_step": 66428, "epoch": 1581} {"train_loss": -6.0907673835754395, "global_step": 66429, "epoch": 1581} {"train_loss": -6.007266044616699, "global_step": 66430, "epoch": 1581} {"train_loss": -6.033144950866699, "global_step": 66431, "epoch": 1581} {"train_loss": -6.097458839416504, "global_step": 66432, "epoch": 1581} {"train_loss": -5.840085983276367, "global_step": 66433, "epoch": 1581} {"train_loss": -5.920204162597656, "global_step": 66434, "epoch": 1581} {"train_loss": -5.966639518737793, "global_step": 66435, "epoch": 1581} {"train_loss": -6.079244613647461, "global_step": 66436, "epoch": 1581} {"train_loss": -5.8976945877075195, "global_step": 66437, "epoch": 1581} {"train_loss": -5.97900390625, "global_step": 66438, "epoch": 1581} {"train_loss": -5.999914169311523, "global_step": 66439, "epoch": 1581} {"train_loss": -6.1614484786987305, "global_step": 66440, "epoch": 1581} {"train_loss": -6.0147247314453125, "global_step": 66441, "epoch": 1581} {"train_loss": -5.983567237854004, "global_step": 66442, "epoch": 1581} {"train_loss": -6.001252730687459, "global_step": 66443, "epoch": 1581, "val_loss": 61441.265625} {"train_loss": -6.124153137207031, "global_step": 66444, "epoch": 1582} {"train_loss": -6.060635566711426, "global_step": 66445, "epoch": 1582} {"train_loss": -5.946801662445068, "global_step": 66446, "epoch": 1582} {"train_loss": -6.055115222930908, "global_step": 66447, "epoch": 1582} {"train_loss": -6.003452777862549, "global_step": 66448, "epoch": 1582} {"train_loss": -5.943017959594727, "global_step": 66449, "epoch": 1582} {"train_loss": -5.8802289962768555, "global_step": 66450, "epoch": 1582} {"train_loss": -5.936278820037842, "global_step": 66451, "epoch": 1582} {"train_loss": -5.871102809906006, "global_step": 66452, "epoch": 1582} {"train_loss": -5.911248207092285, "global_step": 66453, "epoch": 1582} {"train_loss": -5.987746238708496, "global_step": 66454, "epoch": 1582} {"train_loss": -5.85291862487793, "global_step": 66455, "epoch": 1582} {"train_loss": -5.884530067443848, "global_step": 66456, "epoch": 1582} {"train_loss": -5.941384315490723, "global_step": 66457, "epoch": 1582} {"train_loss": -5.9450459480285645, "global_step": 66458, "epoch": 1582} {"train_loss": -5.9000396728515625, "global_step": 66459, "epoch": 1582} {"train_loss": -5.9942121505737305, "global_step": 66460, "epoch": 1582} {"train_loss": -5.994801044464111, "global_step": 66461, "epoch": 1582} {"train_loss": -6.0175323486328125, "global_step": 66462, "epoch": 1582} {"train_loss": -5.935009956359863, "global_step": 66463, "epoch": 1582} {"train_loss": -5.935245990753174, "global_step": 66464, "epoch": 1582} {"train_loss": -5.880373001098633, "global_step": 66465, "epoch": 1582} {"train_loss": -5.963132381439209, "global_step": 66466, "epoch": 1582} {"train_loss": -5.908175945281982, "global_step": 66467, "epoch": 1582} {"train_loss": -5.94870662689209, "global_step": 66468, "epoch": 1582} {"train_loss": -5.90349817276001, "global_step": 66469, "epoch": 1582} {"train_loss": -6.0805768966674805, "global_step": 66470, "epoch": 1582} {"train_loss": -6.032912254333496, "global_step": 66471, "epoch": 1582} {"train_loss": -5.937032699584961, "global_step": 66472, "epoch": 1582} {"train_loss": -6.0368828773498535, "global_step": 66473, "epoch": 1582} {"train_loss": -5.951750755310059, "global_step": 66474, "epoch": 1582} {"train_loss": -5.96511173248291, "global_step": 66475, "epoch": 1582} {"train_loss": -5.888355731964111, "global_step": 66476, "epoch": 1582} {"train_loss": -5.800065994262695, "global_step": 66477, "epoch": 1582} {"train_loss": -6.007623672485352, "global_step": 66478, "epoch": 1582} {"train_loss": -5.967860221862793, "global_step": 66479, "epoch": 1582} {"train_loss": -5.807000160217285, "global_step": 66480, "epoch": 1582} {"train_loss": -6.010251998901367, "global_step": 66481, "epoch": 1582} {"train_loss": -5.954404830932617, "global_step": 66482, "epoch": 1582} {"train_loss": -5.9178972244262695, "global_step": 66483, "epoch": 1582} {"train_loss": -5.907100677490234, "global_step": 66484, "epoch": 1582} {"train_loss": -5.948695795876639, "global_step": 66485, "epoch": 1582, "val_loss": 62009.24609375} {"train_loss": -5.945345878601074, "global_step": 66486, "epoch": 1583} {"train_loss": -6.1349921226501465, "global_step": 66487, "epoch": 1583} {"train_loss": -5.832912445068359, "global_step": 66488, "epoch": 1583} {"train_loss": -6.0045166015625, "global_step": 66489, "epoch": 1583} {"train_loss": -6.049034118652344, "global_step": 66490, "epoch": 1583} {"train_loss": -6.0417022705078125, "global_step": 66491, "epoch": 1583} {"train_loss": -5.934591770172119, "global_step": 66492, "epoch": 1583} {"train_loss": -5.957367420196533, "global_step": 66493, "epoch": 1583} {"train_loss": -5.980091571807861, "global_step": 66494, "epoch": 1583} {"train_loss": -6.060901641845703, "global_step": 66495, "epoch": 1583} {"train_loss": -5.954580307006836, "global_step": 66496, "epoch": 1583} {"train_loss": -6.000162124633789, "global_step": 66497, "epoch": 1583} {"train_loss": -5.947817802429199, "global_step": 66498, "epoch": 1583} {"train_loss": -5.984821319580078, "global_step": 66499, "epoch": 1583} {"train_loss": -5.9549736976623535, "global_step": 66500, "epoch": 1583} {"train_loss": -6.059169292449951, "global_step": 66501, "epoch": 1583} {"train_loss": -5.973496913909912, "global_step": 66502, "epoch": 1583} {"train_loss": -5.955585479736328, "global_step": 66503, "epoch": 1583} {"train_loss": -5.967853546142578, "global_step": 66504, "epoch": 1583} {"train_loss": -5.917880058288574, "global_step": 66505, "epoch": 1583} {"train_loss": -6.015024662017822, "global_step": 66506, "epoch": 1583} {"train_loss": -5.875749588012695, "global_step": 66507, "epoch": 1583} {"train_loss": -5.975812911987305, "global_step": 66508, "epoch": 1583} {"train_loss": -5.981253623962402, "global_step": 66509, "epoch": 1583} {"train_loss": -6.003439903259277, "global_step": 66510, "epoch": 1583} {"train_loss": -5.928406238555908, "global_step": 66511, "epoch": 1583} {"train_loss": -6.041497230529785, "global_step": 66512, "epoch": 1583} {"train_loss": -5.921317100524902, "global_step": 66513, "epoch": 1583} {"train_loss": -5.947533130645752, "global_step": 66514, "epoch": 1583} {"train_loss": -6.01063346862793, "global_step": 66515, "epoch": 1583} {"train_loss": -6.022686958312988, "global_step": 66516, "epoch": 1583} {"train_loss": -5.901827812194824, "global_step": 66517, "epoch": 1583} {"train_loss": -5.993678092956543, "global_step": 66518, "epoch": 1583} {"train_loss": -6.030130386352539, "global_step": 66519, "epoch": 1583} {"train_loss": -5.8271942138671875, "global_step": 66520, "epoch": 1583} {"train_loss": -6.003822326660156, "global_step": 66521, "epoch": 1583} {"train_loss": -6.06721305847168, "global_step": 66522, "epoch": 1583} {"train_loss": -5.903544902801514, "global_step": 66523, "epoch": 1583} {"train_loss": -5.973710060119629, "global_step": 66524, "epoch": 1583} {"train_loss": -5.878993034362793, "global_step": 66525, "epoch": 1583} {"train_loss": -6.082662582397461, "global_step": 66526, "epoch": 1583} {"train_loss": -5.972949550265358, "global_step": 66527, "epoch": 1583, "val_loss": 61547.5546875} {"train_loss": -5.985439300537109, "global_step": 66528, "epoch": 1584} {"train_loss": -5.933627128601074, "global_step": 66529, "epoch": 1584} {"train_loss": -5.966553688049316, "global_step": 66530, "epoch": 1584} {"train_loss": -6.023806571960449, "global_step": 66531, "epoch": 1584} {"train_loss": -6.066987991333008, "global_step": 66532, "epoch": 1584} {"train_loss": -6.04311990737915, "global_step": 66533, "epoch": 1584} {"train_loss": -6.142082214355469, "global_step": 66534, "epoch": 1584} {"train_loss": -6.045994758605957, "global_step": 66535, "epoch": 1584} {"train_loss": -6.1904802322387695, "global_step": 66536, "epoch": 1584} {"train_loss": -5.944734573364258, "global_step": 66537, "epoch": 1584} {"train_loss": -5.948150634765625, "global_step": 66538, "epoch": 1584} {"train_loss": -6.074557781219482, "global_step": 66539, "epoch": 1584} {"train_loss": -5.987571716308594, "global_step": 66540, "epoch": 1584} {"train_loss": -5.995497226715088, "global_step": 66541, "epoch": 1584} {"train_loss": -5.999283790588379, "global_step": 66542, "epoch": 1584} {"train_loss": -6.075319290161133, "global_step": 66543, "epoch": 1584} {"train_loss": -5.978303909301758, "global_step": 66544, "epoch": 1584} {"train_loss": -6.003517150878906, "global_step": 66545, "epoch": 1584} {"train_loss": -5.947712421417236, "global_step": 66546, "epoch": 1584} {"train_loss": -5.931976318359375, "global_step": 66547, "epoch": 1584} {"train_loss": -5.9399614334106445, "global_step": 66548, "epoch": 1584} {"train_loss": -5.964009761810303, "global_step": 66549, "epoch": 1584} {"train_loss": -6.146175384521484, "global_step": 66550, "epoch": 1584} {"train_loss": -6.0832905769348145, "global_step": 66551, "epoch": 1584} {"train_loss": -5.897294521331787, "global_step": 66552, "epoch": 1584} {"train_loss": -6.028940200805664, "global_step": 66553, "epoch": 1584} {"train_loss": -6.003223419189453, "global_step": 66554, "epoch": 1584} {"train_loss": -5.749443054199219, "global_step": 66555, "epoch": 1584} {"train_loss": -5.864625930786133, "global_step": 66556, "epoch": 1584} {"train_loss": -6.021625518798828, "global_step": 66557, "epoch": 1584} {"train_loss": -5.900359153747559, "global_step": 66558, "epoch": 1584} {"train_loss": -5.943966865539551, "global_step": 66559, "epoch": 1584} {"train_loss": -5.937098503112793, "global_step": 66560, "epoch": 1584} {"train_loss": -5.996926784515381, "global_step": 66561, "epoch": 1584} {"train_loss": -6.010400295257568, "global_step": 66562, "epoch": 1584} {"train_loss": -6.002080917358398, "global_step": 66563, "epoch": 1584} {"train_loss": -5.933298110961914, "global_step": 66564, "epoch": 1584} {"train_loss": -5.962876796722412, "global_step": 66565, "epoch": 1584} {"train_loss": -6.000595569610596, "global_step": 66566, "epoch": 1584} {"train_loss": -6.0269317626953125, "global_step": 66567, "epoch": 1584} {"train_loss": -5.97902774810791, "global_step": 66568, "epoch": 1584} {"train_loss": -5.992762145541963, "global_step": 66569, "epoch": 1584, "val_loss": 61682.5390625} {"train_loss": -5.928577423095703, "global_step": 66570, "epoch": 1585} {"train_loss": -6.022534370422363, "global_step": 66571, "epoch": 1585} {"train_loss": -5.973109245300293, "global_step": 66572, "epoch": 1585} {"train_loss": -6.0896100997924805, "global_step": 66573, "epoch": 1585} {"train_loss": -6.007629871368408, "global_step": 66574, "epoch": 1585} {"train_loss": -5.995701313018799, "global_step": 66575, "epoch": 1585} {"train_loss": -6.030623435974121, "global_step": 66576, "epoch": 1585} {"train_loss": -6.046971321105957, "global_step": 66577, "epoch": 1585} {"train_loss": -5.920592784881592, "global_step": 66578, "epoch": 1585} {"train_loss": -5.878087043762207, "global_step": 66579, "epoch": 1585} {"train_loss": -5.9472479820251465, "global_step": 66580, "epoch": 1585} {"train_loss": -5.974252700805664, "global_step": 66581, "epoch": 1585} {"train_loss": -6.087996006011963, "global_step": 66582, "epoch": 1585} {"train_loss": -6.054417610168457, "global_step": 66583, "epoch": 1585} {"train_loss": -5.959868431091309, "global_step": 66584, "epoch": 1585} {"train_loss": -5.92346715927124, "global_step": 66585, "epoch": 1585} {"train_loss": -6.046424865722656, "global_step": 66586, "epoch": 1585} {"train_loss": -5.884953022003174, "global_step": 66587, "epoch": 1585} {"train_loss": -6.013347625732422, "global_step": 66588, "epoch": 1585} {"train_loss": -6.008827209472656, "global_step": 66589, "epoch": 1585} {"train_loss": -5.993011951446533, "global_step": 66590, "epoch": 1585} {"train_loss": -6.065439701080322, "global_step": 66591, "epoch": 1585} {"train_loss": -5.810495853424072, "global_step": 66592, "epoch": 1585} {"train_loss": -5.981877326965332, "global_step": 66593, "epoch": 1585} {"train_loss": -5.936389923095703, "global_step": 66594, "epoch": 1585} {"train_loss": -6.171787261962891, "global_step": 66595, "epoch": 1585} {"train_loss": -5.9897308349609375, "global_step": 66596, "epoch": 1585} {"train_loss": -5.942841529846191, "global_step": 66597, "epoch": 1585} {"train_loss": -5.9828410148620605, "global_step": 66598, "epoch": 1585} {"train_loss": -6.056118965148926, "global_step": 66599, "epoch": 1585} {"train_loss": -6.044528961181641, "global_step": 66600, "epoch": 1585} {"train_loss": -6.019898414611816, "global_step": 66601, "epoch": 1585} {"train_loss": -5.96823787689209, "global_step": 66602, "epoch": 1585} {"train_loss": -5.924306869506836, "global_step": 66603, "epoch": 1585} {"train_loss": -6.012434005737305, "global_step": 66604, "epoch": 1585} {"train_loss": -5.787179946899414, "global_step": 66605, "epoch": 1585} {"train_loss": -5.955996990203857, "global_step": 66606, "epoch": 1585} {"train_loss": -5.928614139556885, "global_step": 66607, "epoch": 1585} {"train_loss": -5.896206378936768, "global_step": 66608, "epoch": 1585} {"train_loss": -5.890843391418457, "global_step": 66609, "epoch": 1585} {"train_loss": -5.984684944152832, "global_step": 66610, "epoch": 1585} {"train_loss": -5.979519458044143, "global_step": 66611, "epoch": 1585, "val_loss": 61677.65234375} {"train_loss": -5.908825874328613, "global_step": 66612, "epoch": 1586} {"train_loss": -5.986001014709473, "global_step": 66613, "epoch": 1586} {"train_loss": -5.949386119842529, "global_step": 66614, "epoch": 1586} {"train_loss": -5.951091766357422, "global_step": 66615, "epoch": 1586} {"train_loss": -6.11800479888916, "global_step": 66616, "epoch": 1586} {"train_loss": -5.947551727294922, "global_step": 66617, "epoch": 1586} {"train_loss": -5.901124000549316, "global_step": 66618, "epoch": 1586} {"train_loss": -5.978665828704834, "global_step": 66619, "epoch": 1586} {"train_loss": -6.040966987609863, "global_step": 66620, "epoch": 1586} {"train_loss": -6.108444690704346, "global_step": 66621, "epoch": 1586} {"train_loss": -5.9092607498168945, "global_step": 66622, "epoch": 1586} {"train_loss": -6.004188537597656, "global_step": 66623, "epoch": 1586} {"train_loss": -6.035221099853516, "global_step": 66624, "epoch": 1586} {"train_loss": -6.048379421234131, "global_step": 66625, "epoch": 1586} {"train_loss": -6.039213180541992, "global_step": 66626, "epoch": 1586} {"train_loss": -6.028414726257324, "global_step": 66627, "epoch": 1586} {"train_loss": -6.093282699584961, "global_step": 66628, "epoch": 1586} {"train_loss": -5.925087928771973, "global_step": 66629, "epoch": 1586} {"train_loss": -5.953887462615967, "global_step": 66630, "epoch": 1586} {"train_loss": -5.981814384460449, "global_step": 66631, "epoch": 1586} {"train_loss": -5.942881107330322, "global_step": 66632, "epoch": 1586} {"train_loss": -5.909942150115967, "global_step": 66633, "epoch": 1586} {"train_loss": -6.0265326499938965, "global_step": 66634, "epoch": 1586} {"train_loss": -5.981656074523926, "global_step": 66635, "epoch": 1586} {"train_loss": -5.882289409637451, "global_step": 66636, "epoch": 1586} {"train_loss": -5.89767599105835, "global_step": 66637, "epoch": 1586} {"train_loss": -5.956321716308594, "global_step": 66638, "epoch": 1586} {"train_loss": -5.997196197509766, "global_step": 66639, "epoch": 1586} {"train_loss": -6.000993251800537, "global_step": 66640, "epoch": 1586} {"train_loss": -5.984764099121094, "global_step": 66641, "epoch": 1586} {"train_loss": -5.980447292327881, "global_step": 66642, "epoch": 1586} {"train_loss": -5.970301628112793, "global_step": 66643, "epoch": 1586} {"train_loss": -6.011116981506348, "global_step": 66644, "epoch": 1586} {"train_loss": -5.973664283752441, "global_step": 66645, "epoch": 1586} {"train_loss": -5.973905086517334, "global_step": 66646, "epoch": 1586} {"train_loss": -5.946250915527344, "global_step": 66647, "epoch": 1586} {"train_loss": -5.910399436950684, "global_step": 66648, "epoch": 1586} {"train_loss": -6.0300397872924805, "global_step": 66649, "epoch": 1586} {"train_loss": -6.004480838775635, "global_step": 66650, "epoch": 1586} {"train_loss": -6.065518379211426, "global_step": 66651, "epoch": 1586} {"train_loss": -5.867511749267578, "global_step": 66652, "epoch": 1586} {"train_loss": -5.9812422934032625, "global_step": 66653, "epoch": 1586, "val_loss": 61305.25390625} {"train_loss": -5.819991111755371, "global_step": 66654, "epoch": 1587} {"train_loss": -5.950088024139404, "global_step": 66655, "epoch": 1587} {"train_loss": -6.0015716552734375, "global_step": 66656, "epoch": 1587} {"train_loss": -5.793736457824707, "global_step": 66657, "epoch": 1587} {"train_loss": -6.009923934936523, "global_step": 66658, "epoch": 1587} {"train_loss": -5.949649810791016, "global_step": 66659, "epoch": 1587} {"train_loss": -5.959968566894531, "global_step": 66660, "epoch": 1587} {"train_loss": -6.041562557220459, "global_step": 66661, "epoch": 1587} {"train_loss": -5.816750526428223, "global_step": 66662, "epoch": 1587} {"train_loss": -6.000021934509277, "global_step": 66663, "epoch": 1587} {"train_loss": -5.853653907775879, "global_step": 66664, "epoch": 1587} {"train_loss": -5.950150489807129, "global_step": 66665, "epoch": 1587} {"train_loss": -5.947888374328613, "global_step": 66666, "epoch": 1587} {"train_loss": -5.906890869140625, "global_step": 66667, "epoch": 1587} {"train_loss": -6.000663757324219, "global_step": 66668, "epoch": 1587} {"train_loss": -5.924854278564453, "global_step": 66669, "epoch": 1587} {"train_loss": -6.00480842590332, "global_step": 66670, "epoch": 1587} {"train_loss": -5.985709190368652, "global_step": 66671, "epoch": 1587} {"train_loss": -6.096020698547363, "global_step": 66672, "epoch": 1587} {"train_loss": -5.99553918838501, "global_step": 66673, "epoch": 1587} {"train_loss": -6.020760536193848, "global_step": 66674, "epoch": 1587} {"train_loss": -6.06123685836792, "global_step": 66675, "epoch": 1587} {"train_loss": -6.103750705718994, "global_step": 66676, "epoch": 1587} {"train_loss": -6.037039756774902, "global_step": 66677, "epoch": 1587} {"train_loss": -5.995404243469238, "global_step": 66678, "epoch": 1587} {"train_loss": -6.084697246551514, "global_step": 66679, "epoch": 1587} {"train_loss": -6.038814544677734, "global_step": 66680, "epoch": 1587} {"train_loss": -5.954309463500977, "global_step": 66681, "epoch": 1587} {"train_loss": -6.035542011260986, "global_step": 66682, "epoch": 1587} {"train_loss": -5.918379783630371, "global_step": 66683, "epoch": 1587} {"train_loss": -5.967723846435547, "global_step": 66684, "epoch": 1587} {"train_loss": -6.009944438934326, "global_step": 66685, "epoch": 1587} {"train_loss": -6.030564308166504, "global_step": 66686, "epoch": 1587} {"train_loss": -6.08841609954834, "global_step": 66687, "epoch": 1587} {"train_loss": -6.066697120666504, "global_step": 66688, "epoch": 1587} {"train_loss": -5.9658637046813965, "global_step": 66689, "epoch": 1587} {"train_loss": -6.052573204040527, "global_step": 66690, "epoch": 1587} {"train_loss": -6.013278007507324, "global_step": 66691, "epoch": 1587} {"train_loss": -5.869192123413086, "global_step": 66692, "epoch": 1587} {"train_loss": -6.019867897033691, "global_step": 66693, "epoch": 1587} {"train_loss": -5.741952419281006, "global_step": 66694, "epoch": 1587} {"train_loss": -5.979309978939238, "global_step": 66695, "epoch": 1587, "val_loss": 61467.234375} {"train_loss": -5.9893035888671875, "global_step": 66696, "epoch": 1588} {"train_loss": -5.8904523849487305, "global_step": 66697, "epoch": 1588} {"train_loss": -5.958561420440674, "global_step": 66698, "epoch": 1588} {"train_loss": -6.130248546600342, "global_step": 66699, "epoch": 1588} {"train_loss": -5.908999443054199, "global_step": 66700, "epoch": 1588} {"train_loss": -6.114188194274902, "global_step": 66701, "epoch": 1588} {"train_loss": -6.05313777923584, "global_step": 66702, "epoch": 1588} {"train_loss": -5.941775321960449, "global_step": 66703, "epoch": 1588} {"train_loss": -5.967384338378906, "global_step": 66704, "epoch": 1588} {"train_loss": -5.936229228973389, "global_step": 66705, "epoch": 1588} {"train_loss": -5.90931510925293, "global_step": 66706, "epoch": 1588} {"train_loss": -5.924560546875, "global_step": 66707, "epoch": 1588} {"train_loss": -5.852819919586182, "global_step": 66708, "epoch": 1588} {"train_loss": -6.064684867858887, "global_step": 66709, "epoch": 1588} {"train_loss": -5.961386680603027, "global_step": 66710, "epoch": 1588} {"train_loss": -5.859886169433594, "global_step": 66711, "epoch": 1588} {"train_loss": -5.99566650390625, "global_step": 66712, "epoch": 1588} {"train_loss": -5.859434127807617, "global_step": 66713, "epoch": 1588} {"train_loss": -5.99913215637207, "global_step": 66714, "epoch": 1588} {"train_loss": -5.999131202697754, "global_step": 66715, "epoch": 1588} {"train_loss": -5.972066879272461, "global_step": 66716, "epoch": 1588} {"train_loss": -5.978704929351807, "global_step": 66717, "epoch": 1588} {"train_loss": -5.895776271820068, "global_step": 66718, "epoch": 1588} {"train_loss": -5.983543872833252, "global_step": 66719, "epoch": 1588} {"train_loss": -5.997257232666016, "global_step": 66720, "epoch": 1588} {"train_loss": -5.999256610870361, "global_step": 66721, "epoch": 1588} {"train_loss": -5.916897773742676, "global_step": 66722, "epoch": 1588} {"train_loss": -5.963222503662109, "global_step": 66723, "epoch": 1588} {"train_loss": -6.0159101486206055, "global_step": 66724, "epoch": 1588} {"train_loss": -5.948602676391602, "global_step": 66725, "epoch": 1588} {"train_loss": -5.989360332489014, "global_step": 66726, "epoch": 1588} {"train_loss": -5.931445121765137, "global_step": 66727, "epoch": 1588} {"train_loss": -5.909946441650391, "global_step": 66728, "epoch": 1588} {"train_loss": -5.928745269775391, "global_step": 66729, "epoch": 1588} {"train_loss": -6.054175853729248, "global_step": 66730, "epoch": 1588} {"train_loss": -5.993894577026367, "global_step": 66731, "epoch": 1588} {"train_loss": -5.888481616973877, "global_step": 66732, "epoch": 1588} {"train_loss": -5.98340368270874, "global_step": 66733, "epoch": 1588} {"train_loss": -5.868679523468018, "global_step": 66734, "epoch": 1588} {"train_loss": -6.061356544494629, "global_step": 66735, "epoch": 1588} {"train_loss": -5.987544536590576, "global_step": 66736, "epoch": 1588} {"train_loss": -5.9622316019875665, "global_step": 66737, "epoch": 1588, "val_loss": 61675.15234375} {"train_loss": -5.840203285217285, "global_step": 66738, "epoch": 1589} {"train_loss": -6.022487640380859, "global_step": 66739, "epoch": 1589} {"train_loss": -5.949808120727539, "global_step": 66740, "epoch": 1589} {"train_loss": -6.157033920288086, "global_step": 66741, "epoch": 1589} {"train_loss": -5.99996280670166, "global_step": 66742, "epoch": 1589} {"train_loss": -5.990084171295166, "global_step": 66743, "epoch": 1589} {"train_loss": -5.993016719818115, "global_step": 66744, "epoch": 1589} {"train_loss": -6.080810546875, "global_step": 66745, "epoch": 1589} {"train_loss": -5.96138858795166, "global_step": 66746, "epoch": 1589} {"train_loss": -6.077304840087891, "global_step": 66747, "epoch": 1589} {"train_loss": -5.940340995788574, "global_step": 66748, "epoch": 1589} {"train_loss": -6.127283096313477, "global_step": 66749, "epoch": 1589} {"train_loss": -5.956509113311768, "global_step": 66750, "epoch": 1589} {"train_loss": -6.046817779541016, "global_step": 66751, "epoch": 1589} {"train_loss": -6.011446952819824, "global_step": 66752, "epoch": 1589} {"train_loss": -5.878965377807617, "global_step": 66753, "epoch": 1589} {"train_loss": -5.970195770263672, "global_step": 66754, "epoch": 1589} {"train_loss": -5.90987491607666, "global_step": 66755, "epoch": 1589} {"train_loss": -5.981125831604004, "global_step": 66756, "epoch": 1589} {"train_loss": -6.011768341064453, "global_step": 66757, "epoch": 1589} {"train_loss": -6.083403587341309, "global_step": 66758, "epoch": 1589} {"train_loss": -6.077304840087891, "global_step": 66759, "epoch": 1589} {"train_loss": -6.015583038330078, "global_step": 66760, "epoch": 1589} {"train_loss": -6.041740894317627, "global_step": 66761, "epoch": 1589} {"train_loss": -5.851008892059326, "global_step": 66762, "epoch": 1589} {"train_loss": -5.981791019439697, "global_step": 66763, "epoch": 1589} {"train_loss": -6.00900411605835, "global_step": 66764, "epoch": 1589} {"train_loss": -6.1280975341796875, "global_step": 66765, "epoch": 1589} {"train_loss": -5.905343055725098, "global_step": 66766, "epoch": 1589} {"train_loss": -5.939486503601074, "global_step": 66767, "epoch": 1589} {"train_loss": -5.986759662628174, "global_step": 66768, "epoch": 1589} {"train_loss": -5.970471382141113, "global_step": 66769, "epoch": 1589} {"train_loss": -5.92729377746582, "global_step": 66770, "epoch": 1589} {"train_loss": -5.976393699645996, "global_step": 66771, "epoch": 1589} {"train_loss": -6.056159019470215, "global_step": 66772, "epoch": 1589} {"train_loss": -6.00830078125, "global_step": 66773, "epoch": 1589} {"train_loss": -5.963126182556152, "global_step": 66774, "epoch": 1589} {"train_loss": -5.985507011413574, "global_step": 66775, "epoch": 1589} {"train_loss": -5.991199493408203, "global_step": 66776, "epoch": 1589} {"train_loss": -6.0190277099609375, "global_step": 66777, "epoch": 1589} {"train_loss": -5.93712043762207, "global_step": 66778, "epoch": 1589} {"train_loss": -5.991622107369559, "global_step": 66779, "epoch": 1589, "val_loss": 61859.19921875} {"train_loss": -6.038740634918213, "global_step": 66780, "epoch": 1590} {"train_loss": -5.910943031311035, "global_step": 66781, "epoch": 1590} {"train_loss": -5.9822797775268555, "global_step": 66782, "epoch": 1590} {"train_loss": -5.976183891296387, "global_step": 66783, "epoch": 1590} {"train_loss": -5.903707027435303, "global_step": 66784, "epoch": 1590} {"train_loss": -5.959530830383301, "global_step": 66785, "epoch": 1590} {"train_loss": -6.041242599487305, "global_step": 66786, "epoch": 1590} {"train_loss": -6.041481971740723, "global_step": 66787, "epoch": 1590} {"train_loss": -5.841449737548828, "global_step": 66788, "epoch": 1590} {"train_loss": -5.901833534240723, "global_step": 66789, "epoch": 1590} {"train_loss": -5.9267730712890625, "global_step": 66790, "epoch": 1590} {"train_loss": -5.819839954376221, "global_step": 66791, "epoch": 1590} {"train_loss": -5.846444129943848, "global_step": 66792, "epoch": 1590} {"train_loss": -5.819884777069092, "global_step": 66793, "epoch": 1590} {"train_loss": -5.8058857917785645, "global_step": 66794, "epoch": 1590} {"train_loss": -5.951633453369141, "global_step": 66795, "epoch": 1590} {"train_loss": -5.900737762451172, "global_step": 66796, "epoch": 1590} {"train_loss": -5.951668739318848, "global_step": 66797, "epoch": 1590} {"train_loss": -5.988452911376953, "global_step": 66798, "epoch": 1590} {"train_loss": -5.938795566558838, "global_step": 66799, "epoch": 1590} {"train_loss": -5.950838565826416, "global_step": 66800, "epoch": 1590} {"train_loss": -5.89940071105957, "global_step": 66801, "epoch": 1590} {"train_loss": -5.873047828674316, "global_step": 66802, "epoch": 1590} {"train_loss": -5.989221572875977, "global_step": 66803, "epoch": 1590} {"train_loss": -5.942804336547852, "global_step": 66804, "epoch": 1590} {"train_loss": -6.056892395019531, "global_step": 66805, "epoch": 1590} {"train_loss": -5.976727485656738, "global_step": 66806, "epoch": 1590} {"train_loss": -6.020590782165527, "global_step": 66807, "epoch": 1590} {"train_loss": -6.0279717445373535, "global_step": 66808, "epoch": 1590} {"train_loss": -6.016391754150391, "global_step": 66809, "epoch": 1590} {"train_loss": -5.971470355987549, "global_step": 66810, "epoch": 1590} {"train_loss": -6.011954307556152, "global_step": 66811, "epoch": 1590} {"train_loss": -5.962486267089844, "global_step": 66812, "epoch": 1590} {"train_loss": -6.074012279510498, "global_step": 66813, "epoch": 1590} {"train_loss": -5.948967933654785, "global_step": 66814, "epoch": 1590} {"train_loss": -5.9615983963012695, "global_step": 66815, "epoch": 1590} {"train_loss": -5.964840412139893, "global_step": 66816, "epoch": 1590} {"train_loss": -5.987480640411377, "global_step": 66817, "epoch": 1590} {"train_loss": -6.129551887512207, "global_step": 66818, "epoch": 1590} {"train_loss": -6.125785827636719, "global_step": 66819, "epoch": 1590} {"train_loss": -6.03507661819458, "global_step": 66820, "epoch": 1590} {"train_loss": -5.963572729201544, "global_step": 66821, "epoch": 1590, "val_loss": 61678.296875} {"train_loss": -5.963694095611572, "global_step": 66822, "epoch": 1591} {"train_loss": -5.872088432312012, "global_step": 66823, "epoch": 1591} {"train_loss": -6.031352996826172, "global_step": 66824, "epoch": 1591} {"train_loss": -6.0135602951049805, "global_step": 66825, "epoch": 1591} {"train_loss": -5.996760368347168, "global_step": 66826, "epoch": 1591} {"train_loss": -5.980249404907227, "global_step": 66827, "epoch": 1591} {"train_loss": -6.019814491271973, "global_step": 66828, "epoch": 1591} {"train_loss": -5.995739936828613, "global_step": 66829, "epoch": 1591} {"train_loss": -5.922003269195557, "global_step": 66830, "epoch": 1591} {"train_loss": -6.01474666595459, "global_step": 66831, "epoch": 1591} {"train_loss": -5.968204498291016, "global_step": 66832, "epoch": 1591} {"train_loss": -6.044461250305176, "global_step": 66833, "epoch": 1591} {"train_loss": -5.970828056335449, "global_step": 66834, "epoch": 1591} {"train_loss": -6.159242630004883, "global_step": 66835, "epoch": 1591} {"train_loss": -6.087715148925781, "global_step": 66836, "epoch": 1591} {"train_loss": -5.930171966552734, "global_step": 66837, "epoch": 1591} {"train_loss": -6.076242446899414, "global_step": 66838, "epoch": 1591} {"train_loss": -6.0559892654418945, "global_step": 66839, "epoch": 1591} {"train_loss": -5.9406890869140625, "global_step": 66840, "epoch": 1591} {"train_loss": -6.175466060638428, "global_step": 66841, "epoch": 1591} {"train_loss": -5.975530624389648, "global_step": 66842, "epoch": 1591} {"train_loss": -6.009488582611084, "global_step": 66843, "epoch": 1591} {"train_loss": -6.036521911621094, "global_step": 66844, "epoch": 1591} {"train_loss": -5.956334590911865, "global_step": 66845, "epoch": 1591} {"train_loss": -6.086716651916504, "global_step": 66846, "epoch": 1591} {"train_loss": -6.043413162231445, "global_step": 66847, "epoch": 1591} {"train_loss": -5.971125602722168, "global_step": 66848, "epoch": 1591} {"train_loss": -6.119690895080566, "global_step": 66849, "epoch": 1591} {"train_loss": -6.044813632965088, "global_step": 66850, "epoch": 1591} {"train_loss": -6.104377269744873, "global_step": 66851, "epoch": 1591} {"train_loss": -6.019824504852295, "global_step": 66852, "epoch": 1591} {"train_loss": -6.077709197998047, "global_step": 66853, "epoch": 1591} {"train_loss": -6.001997947692871, "global_step": 66854, "epoch": 1591} {"train_loss": -6.130433082580566, "global_step": 66855, "epoch": 1591} {"train_loss": -6.075985908508301, "global_step": 66856, "epoch": 1591} {"train_loss": -6.009175777435303, "global_step": 66857, "epoch": 1591} {"train_loss": -6.039361953735352, "global_step": 66858, "epoch": 1591} {"train_loss": -5.989624977111816, "global_step": 66859, "epoch": 1591} {"train_loss": -6.002063274383545, "global_step": 66860, "epoch": 1591} {"train_loss": -6.059730529785156, "global_step": 66861, "epoch": 1591} {"train_loss": -5.943652629852295, "global_step": 66862, "epoch": 1591} {"train_loss": -6.018982660202753, "global_step": 66863, "epoch": 1591, "val_loss": 61513.359375} {"train_loss": -5.861615180969238, "global_step": 66864, "epoch": 1592} {"train_loss": -6.01474666595459, "global_step": 66865, "epoch": 1592} {"train_loss": -6.0180583000183105, "global_step": 66866, "epoch": 1592} {"train_loss": -5.962395668029785, "global_step": 66867, "epoch": 1592} {"train_loss": -5.933945655822754, "global_step": 66868, "epoch": 1592} {"train_loss": -5.868220329284668, "global_step": 66869, "epoch": 1592} {"train_loss": -6.001619338989258, "global_step": 66870, "epoch": 1592} {"train_loss": -5.912842750549316, "global_step": 66871, "epoch": 1592} {"train_loss": -5.856917381286621, "global_step": 66872, "epoch": 1592} {"train_loss": -6.025546550750732, "global_step": 66873, "epoch": 1592} {"train_loss": -5.971656322479248, "global_step": 66874, "epoch": 1592} {"train_loss": -5.986131191253662, "global_step": 66875, "epoch": 1592} {"train_loss": -6.04410982131958, "global_step": 66876, "epoch": 1592} {"train_loss": -5.927060127258301, "global_step": 66877, "epoch": 1592} {"train_loss": -6.138096809387207, "global_step": 66878, "epoch": 1592} {"train_loss": -5.935610771179199, "global_step": 66879, "epoch": 1592} {"train_loss": -6.105727195739746, "global_step": 66880, "epoch": 1592} {"train_loss": -5.9493842124938965, "global_step": 66881, "epoch": 1592} {"train_loss": -5.994318962097168, "global_step": 66882, "epoch": 1592} {"train_loss": -5.941661357879639, "global_step": 66883, "epoch": 1592} {"train_loss": -5.994030952453613, "global_step": 66884, "epoch": 1592} {"train_loss": -5.948307991027832, "global_step": 66885, "epoch": 1592} {"train_loss": -6.06206750869751, "global_step": 66886, "epoch": 1592} {"train_loss": -5.997384071350098, "global_step": 66887, "epoch": 1592} {"train_loss": -5.956754684448242, "global_step": 66888, "epoch": 1592} {"train_loss": -5.909884929656982, "global_step": 66889, "epoch": 1592} {"train_loss": -6.0469970703125, "global_step": 66890, "epoch": 1592} {"train_loss": -6.0233964920043945, "global_step": 66891, "epoch": 1592} {"train_loss": -6.1043195724487305, "global_step": 66892, "epoch": 1592} {"train_loss": -6.0476579666137695, "global_step": 66893, "epoch": 1592} {"train_loss": -5.991018295288086, "global_step": 66894, "epoch": 1592} {"train_loss": -6.005976676940918, "global_step": 66895, "epoch": 1592} {"train_loss": -5.936457633972168, "global_step": 66896, "epoch": 1592} {"train_loss": -5.925886154174805, "global_step": 66897, "epoch": 1592} {"train_loss": -6.098455905914307, "global_step": 66898, "epoch": 1592} {"train_loss": -6.045055866241455, "global_step": 66899, "epoch": 1592} {"train_loss": -5.984109401702881, "global_step": 66900, "epoch": 1592} {"train_loss": -6.088163375854492, "global_step": 66901, "epoch": 1592} {"train_loss": -5.967824459075928, "global_step": 66902, "epoch": 1592} {"train_loss": -5.976352691650391, "global_step": 66903, "epoch": 1592} {"train_loss": -5.990094184875488, "global_step": 66904, "epoch": 1592} {"train_loss": -5.989164363770258, "global_step": 66905, "epoch": 1592, "val_loss": 61368.44921875} {"train_loss": -5.885374546051025, "global_step": 66906, "epoch": 1593} {"train_loss": -5.982426166534424, "global_step": 66907, "epoch": 1593} {"train_loss": -6.09836483001709, "global_step": 66908, "epoch": 1593} {"train_loss": -6.001033782958984, "global_step": 66909, "epoch": 1593} {"train_loss": -5.97233247756958, "global_step": 66910, "epoch": 1593} {"train_loss": -5.860400199890137, "global_step": 66911, "epoch": 1593} {"train_loss": -5.856470108032227, "global_step": 66912, "epoch": 1593} {"train_loss": -5.977093696594238, "global_step": 66913, "epoch": 1593} {"train_loss": -5.931099891662598, "global_step": 66914, "epoch": 1593} {"train_loss": -5.792941093444824, "global_step": 66915, "epoch": 1593} {"train_loss": -5.953251361846924, "global_step": 66916, "epoch": 1593} {"train_loss": -5.888504981994629, "global_step": 66917, "epoch": 1593} {"train_loss": -5.834939956665039, "global_step": 66918, "epoch": 1593} {"train_loss": -5.958691596984863, "global_step": 66919, "epoch": 1593} {"train_loss": -5.789302825927734, "global_step": 66920, "epoch": 1593} {"train_loss": -5.940864562988281, "global_step": 66921, "epoch": 1593} {"train_loss": -5.8035383224487305, "global_step": 66922, "epoch": 1593} {"train_loss": -5.9043474197387695, "global_step": 66923, "epoch": 1593} {"train_loss": -6.012925148010254, "global_step": 66924, "epoch": 1593} {"train_loss": -5.934943199157715, "global_step": 66925, "epoch": 1593} {"train_loss": -5.938395023345947, "global_step": 66926, "epoch": 1593} {"train_loss": -5.920343399047852, "global_step": 66927, "epoch": 1593} {"train_loss": -6.044220924377441, "global_step": 66928, "epoch": 1593} {"train_loss": -5.76904296875, "global_step": 66929, "epoch": 1593} {"train_loss": -6.0986833572387695, "global_step": 66930, "epoch": 1593} {"train_loss": -5.946903228759766, "global_step": 66931, "epoch": 1593} {"train_loss": -6.023437023162842, "global_step": 66932, "epoch": 1593} {"train_loss": -5.963300704956055, "global_step": 66933, "epoch": 1593} {"train_loss": -5.951066017150879, "global_step": 66934, "epoch": 1593} {"train_loss": -6.001691818237305, "global_step": 66935, "epoch": 1593} {"train_loss": -5.946854591369629, "global_step": 66936, "epoch": 1593} {"train_loss": -5.999415397644043, "global_step": 66937, "epoch": 1593} {"train_loss": -5.997601509094238, "global_step": 66938, "epoch": 1593} {"train_loss": -5.944087982177734, "global_step": 66939, "epoch": 1593} {"train_loss": -5.957475662231445, "global_step": 66940, "epoch": 1593} {"train_loss": -5.98423957824707, "global_step": 66941, "epoch": 1593} {"train_loss": -5.874210834503174, "global_step": 66942, "epoch": 1593} {"train_loss": -6.033371925354004, "global_step": 66943, "epoch": 1593} {"train_loss": -5.901644706726074, "global_step": 66944, "epoch": 1593} {"train_loss": -6.070196151733398, "global_step": 66945, "epoch": 1593} {"train_loss": -5.867993354797363, "global_step": 66946, "epoch": 1593} {"train_loss": -5.943377301806495, "global_step": 66947, "epoch": 1593, "val_loss": 61782.62109375} {"train_loss": -5.896553993225098, "global_step": 66948, "epoch": 1594} {"train_loss": -5.919637680053711, "global_step": 66949, "epoch": 1594} {"train_loss": -6.043743133544922, "global_step": 66950, "epoch": 1594} {"train_loss": -6.062843322753906, "global_step": 66951, "epoch": 1594} {"train_loss": -5.992627143859863, "global_step": 66952, "epoch": 1594} {"train_loss": -6.017325401306152, "global_step": 66953, "epoch": 1594} {"train_loss": -5.938326835632324, "global_step": 66954, "epoch": 1594} {"train_loss": -5.894571304321289, "global_step": 66955, "epoch": 1594} {"train_loss": -6.103581428527832, "global_step": 66956, "epoch": 1594} {"train_loss": -5.9797844886779785, "global_step": 66957, "epoch": 1594} {"train_loss": -6.143125534057617, "global_step": 66958, "epoch": 1594} {"train_loss": -5.998915195465088, "global_step": 66959, "epoch": 1594} {"train_loss": -5.912017345428467, "global_step": 66960, "epoch": 1594} {"train_loss": -5.944962978363037, "global_step": 66961, "epoch": 1594} {"train_loss": -5.9822587966918945, "global_step": 66962, "epoch": 1594} {"train_loss": -5.992598533630371, "global_step": 66963, "epoch": 1594} {"train_loss": -6.049193382263184, "global_step": 66964, "epoch": 1594} {"train_loss": -5.998573303222656, "global_step": 66965, "epoch": 1594} {"train_loss": -6.000295162200928, "global_step": 66966, "epoch": 1594} {"train_loss": -5.930469036102295, "global_step": 66967, "epoch": 1594} {"train_loss": -5.998226165771484, "global_step": 66968, "epoch": 1594} {"train_loss": -5.931459426879883, "global_step": 66969, "epoch": 1594} {"train_loss": -6.021203517913818, "global_step": 66970, "epoch": 1594} {"train_loss": -6.0430450439453125, "global_step": 66971, "epoch": 1594} {"train_loss": -5.9658966064453125, "global_step": 66972, "epoch": 1594} {"train_loss": -5.895900726318359, "global_step": 66973, "epoch": 1594} {"train_loss": -6.106184005737305, "global_step": 66974, "epoch": 1594} {"train_loss": -5.955312252044678, "global_step": 66975, "epoch": 1594} {"train_loss": -6.060344696044922, "global_step": 66976, "epoch": 1594} {"train_loss": -6.107570171356201, "global_step": 66977, "epoch": 1594} {"train_loss": -5.910220623016357, "global_step": 66978, "epoch": 1594} {"train_loss": -5.970371246337891, "global_step": 66979, "epoch": 1594} {"train_loss": -5.995436668395996, "global_step": 66980, "epoch": 1594} {"train_loss": -6.090709686279297, "global_step": 66981, "epoch": 1594} {"train_loss": -6.081249237060547, "global_step": 66982, "epoch": 1594} {"train_loss": -5.950814247131348, "global_step": 66983, "epoch": 1594} {"train_loss": -5.811616897583008, "global_step": 66984, "epoch": 1594} {"train_loss": -6.019548416137695, "global_step": 66985, "epoch": 1594} {"train_loss": -6.055870056152344, "global_step": 66986, "epoch": 1594} {"train_loss": -5.931543350219727, "global_step": 66987, "epoch": 1594} {"train_loss": -6.104573726654053, "global_step": 66988, "epoch": 1594} {"train_loss": -5.992742004848662, "global_step": 66989, "epoch": 1594, "val_loss": 61676.75} {"train_loss": -5.97495174407959, "global_step": 66990, "epoch": 1595} {"train_loss": -5.979719638824463, "global_step": 66991, "epoch": 1595} {"train_loss": -6.037363052368164, "global_step": 66992, "epoch": 1595} {"train_loss": -5.871377944946289, "global_step": 66993, "epoch": 1595} {"train_loss": -5.981019973754883, "global_step": 66994, "epoch": 1595} {"train_loss": -6.076704502105713, "global_step": 66995, "epoch": 1595} {"train_loss": -5.8742265701293945, "global_step": 66996, "epoch": 1595} {"train_loss": -6.0018630027771, "global_step": 66997, "epoch": 1595} {"train_loss": -5.909839630126953, "global_step": 66998, "epoch": 1595} {"train_loss": -5.986607551574707, "global_step": 66999, "epoch": 1595} {"train_loss": -5.989610195159912, "global_step": 67000, "epoch": 1595} {"train_loss": -5.942752838134766, "global_step": 67001, "epoch": 1595} {"train_loss": -5.941595077514648, "global_step": 67002, "epoch": 1595} {"train_loss": -6.0443115234375, "global_step": 67003, "epoch": 1595} {"train_loss": -5.857304573059082, "global_step": 67004, "epoch": 1595} {"train_loss": -6.01862096786499, "global_step": 67005, "epoch": 1595} {"train_loss": -5.908052444458008, "global_step": 67006, "epoch": 1595} {"train_loss": -5.90797758102417, "global_step": 67007, "epoch": 1595} {"train_loss": -5.837357521057129, "global_step": 67008, "epoch": 1595} {"train_loss": -5.9655046463012695, "global_step": 67009, "epoch": 1595} {"train_loss": -5.987641334533691, "global_step": 67010, "epoch": 1595} {"train_loss": -5.861485958099365, "global_step": 67011, "epoch": 1595} {"train_loss": -6.056215286254883, "global_step": 67012, "epoch": 1595} {"train_loss": -5.920689582824707, "global_step": 67013, "epoch": 1595} {"train_loss": -5.9462785720825195, "global_step": 67014, "epoch": 1595} {"train_loss": -5.967428207397461, "global_step": 67015, "epoch": 1595} {"train_loss": -5.980663299560547, "global_step": 67016, "epoch": 1595} {"train_loss": -6.016025543212891, "global_step": 67017, "epoch": 1595} {"train_loss": -6.006857872009277, "global_step": 67018, "epoch": 1595} {"train_loss": -6.054529666900635, "global_step": 67019, "epoch": 1595} {"train_loss": -6.007879734039307, "global_step": 67020, "epoch": 1595} {"train_loss": -6.066140174865723, "global_step": 67021, "epoch": 1595} {"train_loss": -6.024604797363281, "global_step": 67022, "epoch": 1595} {"train_loss": -5.978095531463623, "global_step": 67023, "epoch": 1595} {"train_loss": -5.93273401260376, "global_step": 67024, "epoch": 1595} {"train_loss": -6.072725296020508, "global_step": 67025, "epoch": 1595} {"train_loss": -6.030061721801758, "global_step": 67026, "epoch": 1595} {"train_loss": -6.116888046264648, "global_step": 67027, "epoch": 1595} {"train_loss": -5.98911190032959, "global_step": 67028, "epoch": 1595} {"train_loss": -5.999711990356445, "global_step": 67029, "epoch": 1595} {"train_loss": -6.183625221252441, "global_step": 67030, "epoch": 1595} {"train_loss": -5.985989457085019, "global_step": 67031, "epoch": 1595, "val_loss": 61698.66015625} {"train_loss": -6.024903297424316, "global_step": 67032, "epoch": 1596} {"train_loss": -6.003560543060303, "global_step": 67033, "epoch": 1596} {"train_loss": -5.979195594787598, "global_step": 67034, "epoch": 1596} {"train_loss": -6.113160133361816, "global_step": 67035, "epoch": 1596} {"train_loss": -6.004876136779785, "global_step": 67036, "epoch": 1596} {"train_loss": -5.895742416381836, "global_step": 67037, "epoch": 1596} {"train_loss": -6.044322967529297, "global_step": 67038, "epoch": 1596} {"train_loss": -6.011713027954102, "global_step": 67039, "epoch": 1596} {"train_loss": -5.987163066864014, "global_step": 67040, "epoch": 1596} {"train_loss": -5.994080543518066, "global_step": 67041, "epoch": 1596} {"train_loss": -5.833001136779785, "global_step": 67042, "epoch": 1596} {"train_loss": -5.902566432952881, "global_step": 67043, "epoch": 1596} {"train_loss": -5.921257972717285, "global_step": 67044, "epoch": 1596} {"train_loss": -6.087406158447266, "global_step": 67045, "epoch": 1596} {"train_loss": -5.9882097244262695, "global_step": 67046, "epoch": 1596} {"train_loss": -6.06671142578125, "global_step": 67047, "epoch": 1596} {"train_loss": -5.956728458404541, "global_step": 67048, "epoch": 1596} {"train_loss": -5.943966865539551, "global_step": 67049, "epoch": 1596} {"train_loss": -6.045964241027832, "global_step": 67050, "epoch": 1596} {"train_loss": -5.967576503753662, "global_step": 67051, "epoch": 1596} {"train_loss": -5.921667098999023, "global_step": 67052, "epoch": 1596} {"train_loss": -6.081533432006836, "global_step": 67053, "epoch": 1596} {"train_loss": -5.994816780090332, "global_step": 67054, "epoch": 1596} {"train_loss": -6.070274829864502, "global_step": 67055, "epoch": 1596} {"train_loss": -6.007513046264648, "global_step": 67056, "epoch": 1596} {"train_loss": -6.000765323638916, "global_step": 67057, "epoch": 1596} {"train_loss": -6.181990623474121, "global_step": 67058, "epoch": 1596} {"train_loss": -6.023470878601074, "global_step": 67059, "epoch": 1596} {"train_loss": -5.986124038696289, "global_step": 67060, "epoch": 1596} {"train_loss": -5.9840407371521, "global_step": 67061, "epoch": 1596} {"train_loss": -5.871726989746094, "global_step": 67062, "epoch": 1596} {"train_loss": -6.010589599609375, "global_step": 67063, "epoch": 1596} {"train_loss": -6.059682846069336, "global_step": 67064, "epoch": 1596} {"train_loss": -5.924630165100098, "global_step": 67065, "epoch": 1596} {"train_loss": -5.918050765991211, "global_step": 67066, "epoch": 1596} {"train_loss": -5.921063423156738, "global_step": 67067, "epoch": 1596} {"train_loss": -5.907492637634277, "global_step": 67068, "epoch": 1596} {"train_loss": -5.912680625915527, "global_step": 67069, "epoch": 1596} {"train_loss": -5.9348249435424805, "global_step": 67070, "epoch": 1596} {"train_loss": -6.059083461761475, "global_step": 67071, "epoch": 1596} {"train_loss": -6.034888744354248, "global_step": 67072, "epoch": 1596} {"train_loss": -5.990922360193162, "global_step": 67073, "epoch": 1596, "val_loss": 61554.3046875} {"train_loss": -5.9443535804748535, "global_step": 67074, "epoch": 1597} {"train_loss": -6.0481767654418945, "global_step": 67075, "epoch": 1597} {"train_loss": -6.033482074737549, "global_step": 67076, "epoch": 1597} {"train_loss": -6.095281600952148, "global_step": 67077, "epoch": 1597} {"train_loss": -6.07145881652832, "global_step": 67078, "epoch": 1597} {"train_loss": -6.063030242919922, "global_step": 67079, "epoch": 1597} {"train_loss": -5.97590446472168, "global_step": 67080, "epoch": 1597} {"train_loss": -6.093667030334473, "global_step": 67081, "epoch": 1597} {"train_loss": -6.058335781097412, "global_step": 67082, "epoch": 1597} {"train_loss": -6.049766540527344, "global_step": 67083, "epoch": 1597} {"train_loss": -5.956975936889648, "global_step": 67084, "epoch": 1597} {"train_loss": -6.05156135559082, "global_step": 67085, "epoch": 1597} {"train_loss": -5.984368801116943, "global_step": 67086, "epoch": 1597} {"train_loss": -5.992368698120117, "global_step": 67087, "epoch": 1597} {"train_loss": -6.031841278076172, "global_step": 67088, "epoch": 1597} {"train_loss": -6.048511028289795, "global_step": 67089, "epoch": 1597} {"train_loss": -6.110265731811523, "global_step": 67090, "epoch": 1597} {"train_loss": -5.919731140136719, "global_step": 67091, "epoch": 1597} {"train_loss": -6.011248588562012, "global_step": 67092, "epoch": 1597} {"train_loss": -5.962827682495117, "global_step": 67093, "epoch": 1597} {"train_loss": -5.9818620681762695, "global_step": 67094, "epoch": 1597} {"train_loss": -5.977682113647461, "global_step": 67095, "epoch": 1597} {"train_loss": -6.0627312660217285, "global_step": 67096, "epoch": 1597} {"train_loss": -5.96465539932251, "global_step": 67097, "epoch": 1597} {"train_loss": -6.112066268920898, "global_step": 67098, "epoch": 1597} {"train_loss": -6.049931526184082, "global_step": 67099, "epoch": 1597} {"train_loss": -6.0283002853393555, "global_step": 67100, "epoch": 1597} {"train_loss": -5.916596412658691, "global_step": 67101, "epoch": 1597} {"train_loss": -5.991135597229004, "global_step": 67102, "epoch": 1597} {"train_loss": -5.936171531677246, "global_step": 67103, "epoch": 1597} {"train_loss": -5.961665153503418, "global_step": 67104, "epoch": 1597} {"train_loss": -6.071829795837402, "global_step": 67105, "epoch": 1597} {"train_loss": -5.993168354034424, "global_step": 67106, "epoch": 1597} {"train_loss": -6.074728012084961, "global_step": 67107, "epoch": 1597} {"train_loss": -5.971874237060547, "global_step": 67108, "epoch": 1597} {"train_loss": -6.01599645614624, "global_step": 67109, "epoch": 1597} {"train_loss": -5.916886806488037, "global_step": 67110, "epoch": 1597} {"train_loss": -5.892634391784668, "global_step": 67111, "epoch": 1597} {"train_loss": -5.9751081466674805, "global_step": 67112, "epoch": 1597} {"train_loss": -5.992827415466309, "global_step": 67113, "epoch": 1597} {"train_loss": -5.900970458984375, "global_step": 67114, "epoch": 1597} {"train_loss": -6.007913544064476, "global_step": 67115, "epoch": 1597, "val_loss": 62093.13671875} {"train_loss": -5.841741561889648, "global_step": 67116, "epoch": 1598} {"train_loss": -5.907895088195801, "global_step": 67117, "epoch": 1598} {"train_loss": -5.975107669830322, "global_step": 67118, "epoch": 1598} {"train_loss": -6.0051374435424805, "global_step": 67119, "epoch": 1598} {"train_loss": -6.012784957885742, "global_step": 67120, "epoch": 1598} {"train_loss": -5.705426216125488, "global_step": 67121, "epoch": 1598} {"train_loss": -5.93757438659668, "global_step": 67122, "epoch": 1598} {"train_loss": -5.848564147949219, "global_step": 67123, "epoch": 1598} {"train_loss": -6.019837856292725, "global_step": 67124, "epoch": 1598} {"train_loss": -5.995723724365234, "global_step": 67125, "epoch": 1598} {"train_loss": -5.9594597816467285, "global_step": 67126, "epoch": 1598} {"train_loss": -5.95677375793457, "global_step": 67127, "epoch": 1598} {"train_loss": -5.9535040855407715, "global_step": 67128, "epoch": 1598} {"train_loss": -5.847404479980469, "global_step": 67129, "epoch": 1598} {"train_loss": -5.873206615447998, "global_step": 67130, "epoch": 1598} {"train_loss": -5.927256107330322, "global_step": 67131, "epoch": 1598} {"train_loss": -6.049009799957275, "global_step": 67132, "epoch": 1598} {"train_loss": -6.019669532775879, "global_step": 67133, "epoch": 1598} {"train_loss": -5.9220380783081055, "global_step": 67134, "epoch": 1598} {"train_loss": -5.999847888946533, "global_step": 67135, "epoch": 1598} {"train_loss": -5.9637041091918945, "global_step": 67136, "epoch": 1598} {"train_loss": -5.873374938964844, "global_step": 67137, "epoch": 1598} {"train_loss": -5.958707332611084, "global_step": 67138, "epoch": 1598} {"train_loss": -5.902362823486328, "global_step": 67139, "epoch": 1598} {"train_loss": -5.840339660644531, "global_step": 67140, "epoch": 1598} {"train_loss": -5.990510940551758, "global_step": 67141, "epoch": 1598} {"train_loss": -5.945044994354248, "global_step": 67142, "epoch": 1598} {"train_loss": -6.055045127868652, "global_step": 67143, "epoch": 1598} {"train_loss": -6.009336471557617, "global_step": 67144, "epoch": 1598} {"train_loss": -5.868144512176514, "global_step": 67145, "epoch": 1598} {"train_loss": -5.9961137771606445, "global_step": 67146, "epoch": 1598} {"train_loss": -5.967381477355957, "global_step": 67147, "epoch": 1598} {"train_loss": -5.926602363586426, "global_step": 67148, "epoch": 1598} {"train_loss": -6.015618324279785, "global_step": 67149, "epoch": 1598} {"train_loss": -5.903903007507324, "global_step": 67150, "epoch": 1598} {"train_loss": -5.952851295471191, "global_step": 67151, "epoch": 1598} {"train_loss": -5.979189872741699, "global_step": 67152, "epoch": 1598} {"train_loss": -5.984624862670898, "global_step": 67153, "epoch": 1598} {"train_loss": -6.157405853271484, "global_step": 67154, "epoch": 1598} {"train_loss": -6.041771411895752, "global_step": 67155, "epoch": 1598} {"train_loss": -6.040910720825195, "global_step": 67156, "epoch": 1598} {"train_loss": -5.957169680368333, "global_step": 67157, "epoch": 1598, "val_loss": 61747.56640625} {"train_loss": -5.965117454528809, "global_step": 67158, "epoch": 1599} {"train_loss": -5.905427932739258, "global_step": 67159, "epoch": 1599} {"train_loss": -6.01133394241333, "global_step": 67160, "epoch": 1599} {"train_loss": -5.993697643280029, "global_step": 67161, "epoch": 1599} {"train_loss": -5.965548515319824, "global_step": 67162, "epoch": 1599} {"train_loss": -6.066474914550781, "global_step": 67163, "epoch": 1599} {"train_loss": -5.8745927810668945, "global_step": 67164, "epoch": 1599} {"train_loss": -6.017233848571777, "global_step": 67165, "epoch": 1599} {"train_loss": -5.892947196960449, "global_step": 67166, "epoch": 1599} {"train_loss": -5.9737982749938965, "global_step": 67167, "epoch": 1599} {"train_loss": -6.122518539428711, "global_step": 67168, "epoch": 1599} {"train_loss": -6.113699436187744, "global_step": 67169, "epoch": 1599} {"train_loss": -5.83249044418335, "global_step": 67170, "epoch": 1599} {"train_loss": -5.933995723724365, "global_step": 67171, "epoch": 1599} {"train_loss": -6.0749359130859375, "global_step": 67172, "epoch": 1599} {"train_loss": -6.048432350158691, "global_step": 67173, "epoch": 1599} {"train_loss": -6.0785064697265625, "global_step": 67174, "epoch": 1599} {"train_loss": -6.048239231109619, "global_step": 67175, "epoch": 1599} {"train_loss": -6.025120735168457, "global_step": 67176, "epoch": 1599} {"train_loss": -5.924736499786377, "global_step": 67177, "epoch": 1599} {"train_loss": -6.0381975173950195, "global_step": 67178, "epoch": 1599} {"train_loss": -5.994643688201904, "global_step": 67179, "epoch": 1599} {"train_loss": -5.94818115234375, "global_step": 67180, "epoch": 1599} {"train_loss": -6.129533290863037, "global_step": 67181, "epoch": 1599} {"train_loss": -6.000758171081543, "global_step": 67182, "epoch": 1599} {"train_loss": -6.006056308746338, "global_step": 67183, "epoch": 1599} {"train_loss": -5.923863410949707, "global_step": 67184, "epoch": 1599} {"train_loss": -6.126771450042725, "global_step": 67185, "epoch": 1599} {"train_loss": -5.978927135467529, "global_step": 67186, "epoch": 1599} {"train_loss": -6.0867156982421875, "global_step": 67187, "epoch": 1599} {"train_loss": -6.074226379394531, "global_step": 67188, "epoch": 1599} {"train_loss": -5.963919639587402, "global_step": 67189, "epoch": 1599} {"train_loss": -6.049295902252197, "global_step": 67190, "epoch": 1599} {"train_loss": -5.84861946105957, "global_step": 67191, "epoch": 1599} {"train_loss": -5.995361328125, "global_step": 67192, "epoch": 1599} {"train_loss": -5.932137966156006, "global_step": 67193, "epoch": 1599} {"train_loss": -6.072311878204346, "global_step": 67194, "epoch": 1599} {"train_loss": -5.996644020080566, "global_step": 67195, "epoch": 1599} {"train_loss": -6.081747531890869, "global_step": 67196, "epoch": 1599} {"train_loss": -6.0447235107421875, "global_step": 67197, "epoch": 1599} {"train_loss": -5.921608924865723, "global_step": 67198, "epoch": 1599} {"train_loss": -6.001944382985433, "global_step": 67199, "epoch": 1599, "val_loss": 61471.234375} {"train_loss": -6.067708969116211, "global_step": 67200, "epoch": 1600} {"train_loss": -5.936941146850586, "global_step": 67201, "epoch": 1600} {"train_loss": -6.016735076904297, "global_step": 67202, "epoch": 1600} {"train_loss": -5.945666313171387, "global_step": 67203, "epoch": 1600} {"train_loss": -5.977640628814697, "global_step": 67204, "epoch": 1600} {"train_loss": -6.017528533935547, "global_step": 67205, "epoch": 1600} {"train_loss": -5.986004829406738, "global_step": 67206, "epoch": 1600} {"train_loss": -6.041234970092773, "global_step": 67207, "epoch": 1600} {"train_loss": -6.045344352722168, "global_step": 67208, "epoch": 1600} {"train_loss": -5.876680374145508, "global_step": 67209, "epoch": 1600} {"train_loss": -6.041818618774414, "global_step": 67210, "epoch": 1600} {"train_loss": -5.918247222900391, "global_step": 67211, "epoch": 1600} {"train_loss": -6.061966896057129, "global_step": 67212, "epoch": 1600} {"train_loss": -6.173055648803711, "global_step": 67213, "epoch": 1600} {"train_loss": -5.953865051269531, "global_step": 67214, "epoch": 1600} {"train_loss": -6.088898658752441, "global_step": 67215, "epoch": 1600} {"train_loss": -5.970347881317139, "global_step": 67216, "epoch": 1600} {"train_loss": -6.063106536865234, "global_step": 67217, "epoch": 1600} {"train_loss": -6.043046951293945, "global_step": 67218, "epoch": 1600} {"train_loss": -6.110535621643066, "global_step": 67219, "epoch": 1600} {"train_loss": -6.0473833084106445, "global_step": 67220, "epoch": 1600} {"train_loss": -5.996122360229492, "global_step": 67221, "epoch": 1600} {"train_loss": -6.1039628982543945, "global_step": 67222, "epoch": 1600} {"train_loss": -5.962733745574951, "global_step": 67223, "epoch": 1600} {"train_loss": -5.982866287231445, "global_step": 67224, "epoch": 1600} {"train_loss": -6.000619888305664, "global_step": 67225, "epoch": 1600} {"train_loss": -5.934982776641846, "global_step": 67226, "epoch": 1600} {"train_loss": -5.932449817657471, "global_step": 67227, "epoch": 1600} {"train_loss": -5.824847221374512, "global_step": 67228, "epoch": 1600} {"train_loss": -5.879764556884766, "global_step": 67229, "epoch": 1600} {"train_loss": -5.952884674072266, "global_step": 67230, "epoch": 1600} {"train_loss": -5.932628631591797, "global_step": 67231, "epoch": 1600} {"train_loss": -6.052170753479004, "global_step": 67232, "epoch": 1600} {"train_loss": -5.79035758972168, "global_step": 67233, "epoch": 1600} {"train_loss": -5.927755355834961, "global_step": 67234, "epoch": 1600} {"train_loss": -5.856281280517578, "global_step": 67235, "epoch": 1600} {"train_loss": -5.936558246612549, "global_step": 67236, "epoch": 1600} {"train_loss": -6.006182670593262, "global_step": 67237, "epoch": 1600} {"train_loss": -5.840609073638916, "global_step": 67238, "epoch": 1600} {"train_loss": -5.937664031982422, "global_step": 67239, "epoch": 1600} {"train_loss": -5.9326887130737305, "global_step": 67240, "epoch": 1600} {"train_loss": -5.977363802137829, "global_step": 67241, "epoch": 1600, "train/sim_max_reward_0": 0.6173576990778897, "train/sim_max_reward_1": 0.785153922326557, "train/sim_max_reward_2": 0.20905399938612115, "train/sim_max_reward_3": 0.7804386946901624, "train/sim_max_reward_4": 0.6927319649955765, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.24880933101527106, "test/sim_max_reward_4300002": 0.8034028927213913, "test/sim_max_reward_4300003": 0.7639959524842438, "test/sim_max_reward_4300004": 0.3639997495203848, "test/sim_max_reward_4300005": 0.9661427266469761, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.39370400454351284, "test/sim_max_reward_4300008": 0.40731790993164657, "test/sim_max_reward_4300009": 0.682491081887059, "test/sim_max_reward_4300010": 0.7821925897697892, "test/sim_max_reward_4300011": 0.4572169768527283, "test/sim_max_reward_4300012": 0.41106908268618814, "test/sim_max_reward_4300013": 0.7887894209377406, "test/sim_max_reward_4300014": 0.854711517381583, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.7945606422234671, "test/sim_max_reward_4300017": 0.8773308826531757, "test/sim_max_reward_4300018": 0.43753204749218777, "test/sim_max_reward_4300019": 0.18528738570654546, "test/sim_max_reward_4300020": 0.8359367860057471, "test/sim_max_reward_4300021": 0.7540947166699677, "test/sim_max_reward_4300022": 0.7769120639755994, "test/sim_max_reward_4300023": 0.5260086604115315, "test/sim_max_reward_4300024": 0.0048455840505580924, "test/sim_max_reward_4300025": 0.6856042662207088, "test/sim_max_reward_4300026": 0.83851616581042, "test/sim_max_reward_4300027": 0.8700682542219429, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.5201093946873784, "test/sim_max_reward_4300031": 0.9027096248559009, "test/sim_max_reward_4300032": 0.978638352282054, "test/sim_max_reward_4300033": 0.4553585337976279, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.20298208196430542, "test/sim_max_reward_4300037": 0.78737858921447, "test/sim_max_reward_4300038": 0.6263129135139253, "test/sim_max_reward_4300039": 0.07285228424301238, "test/sim_max_reward_4300040": 0.2524843473114078, "test/sim_max_reward_4300041": 0.7455691978088348, "test/sim_max_reward_4300042": 0.5035504723209313, "test/sim_max_reward_4300043": 0.8502806194600623, "test/sim_max_reward_4300044": 0.7223836649764149, "test/sim_max_reward_4300045": 0.2553985905744243, "test/sim_max_reward_4300046": 0.018690146633336343, "test/sim_max_reward_4300047": 0.7604907996357231, "test/sim_max_reward_4300048": 0.8974749174302001, "test/sim_max_reward_4300049": 0.2770465801087138, "train/mean_score": 0.5462868399730824, "test/mean_score": 0.5268050360527818, "val_loss": 61899.10546875} {"train_loss": -5.8544487953186035, "global_step": 67242, "epoch": 1601} {"train_loss": -6.016953945159912, "global_step": 67243, "epoch": 1601} {"train_loss": -5.87514066696167, "global_step": 67244, "epoch": 1601} {"train_loss": -5.9543657302856445, "global_step": 67245, "epoch": 1601} {"train_loss": -5.814295291900635, "global_step": 67246, "epoch": 1601} {"train_loss": -5.88436222076416, "global_step": 67247, "epoch": 1601} {"train_loss": -5.994915962219238, "global_step": 67248, "epoch": 1601} {"train_loss": -5.933540344238281, "global_step": 67249, "epoch": 1601} {"train_loss": -5.863239288330078, "global_step": 67250, "epoch": 1601} {"train_loss": -5.92872428894043, "global_step": 67251, "epoch": 1601} {"train_loss": -5.894650936126709, "global_step": 67252, "epoch": 1601} {"train_loss": -5.952922821044922, "global_step": 67253, "epoch": 1601} {"train_loss": -5.829230308532715, "global_step": 67254, "epoch": 1601} {"train_loss": -5.861583709716797, "global_step": 67255, "epoch": 1601} {"train_loss": -5.949637413024902, "global_step": 67256, "epoch": 1601} {"train_loss": -6.049555778503418, "global_step": 67257, "epoch": 1601} {"train_loss": -5.9162750244140625, "global_step": 67258, "epoch": 1601} {"train_loss": -5.998946189880371, "global_step": 67259, "epoch": 1601} {"train_loss": -6.060348033905029, "global_step": 67260, "epoch": 1601} {"train_loss": -6.012867450714111, "global_step": 67261, "epoch": 1601} {"train_loss": -6.111449241638184, "global_step": 67262, "epoch": 1601} {"train_loss": -5.984447479248047, "global_step": 67263, "epoch": 1601} {"train_loss": -5.968534469604492, "global_step": 67264, "epoch": 1601} {"train_loss": -5.888132095336914, "global_step": 67265, "epoch": 1601} {"train_loss": -6.048830986022949, "global_step": 67266, "epoch": 1601} {"train_loss": -6.029068470001221, "global_step": 67267, "epoch": 1601} {"train_loss": -6.1166534423828125, "global_step": 67268, "epoch": 1601} {"train_loss": -6.013789176940918, "global_step": 67269, "epoch": 1601} {"train_loss": -6.06253719329834, "global_step": 67270, "epoch": 1601} {"train_loss": -6.054739952087402, "global_step": 67271, "epoch": 1601} {"train_loss": -5.941319942474365, "global_step": 67272, "epoch": 1601} {"train_loss": -6.042646884918213, "global_step": 67273, "epoch": 1601} {"train_loss": -6.051753997802734, "global_step": 67274, "epoch": 1601} {"train_loss": -5.9784393310546875, "global_step": 67275, "epoch": 1601} {"train_loss": -5.902187824249268, "global_step": 67276, "epoch": 1601} {"train_loss": -5.989022254943848, "global_step": 67277, "epoch": 1601} {"train_loss": -5.994467735290527, "global_step": 67278, "epoch": 1601} {"train_loss": -5.885351657867432, "global_step": 67279, "epoch": 1601} {"train_loss": -5.904727458953857, "global_step": 67280, "epoch": 1601} {"train_loss": -5.999825477600098, "global_step": 67281, "epoch": 1601} {"train_loss": -6.088284969329834, "global_step": 67282, "epoch": 1601} {"train_loss": -5.9705031031654, "global_step": 67283, "epoch": 1601, "val_loss": 61371.69921875} {"train_loss": -6.006230354309082, "global_step": 67284, "epoch": 1602} {"train_loss": -6.050229072570801, "global_step": 67285, "epoch": 1602} {"train_loss": -6.052219390869141, "global_step": 67286, "epoch": 1602} {"train_loss": -6.102992057800293, "global_step": 67287, "epoch": 1602} {"train_loss": -6.0879597663879395, "global_step": 67288, "epoch": 1602} {"train_loss": -6.059359550476074, "global_step": 67289, "epoch": 1602} {"train_loss": -5.9497785568237305, "global_step": 67290, "epoch": 1602} {"train_loss": -6.048961162567139, "global_step": 67291, "epoch": 1602} {"train_loss": -5.975164413452148, "global_step": 67292, "epoch": 1602} {"train_loss": -5.88908576965332, "global_step": 67293, "epoch": 1602} {"train_loss": -6.075140476226807, "global_step": 67294, "epoch": 1602} {"train_loss": -6.002938270568848, "global_step": 67295, "epoch": 1602} {"train_loss": -5.990814208984375, "global_step": 67296, "epoch": 1602} {"train_loss": -6.015264511108398, "global_step": 67297, "epoch": 1602} {"train_loss": -6.085057258605957, "global_step": 67298, "epoch": 1602} {"train_loss": -6.000790596008301, "global_step": 67299, "epoch": 1602} {"train_loss": -6.022988319396973, "global_step": 67300, "epoch": 1602} {"train_loss": -6.139261722564697, "global_step": 67301, "epoch": 1602} {"train_loss": -6.031291961669922, "global_step": 67302, "epoch": 1602} {"train_loss": -6.083219528198242, "global_step": 67303, "epoch": 1602} {"train_loss": -6.088415145874023, "global_step": 67304, "epoch": 1602} {"train_loss": -6.069375038146973, "global_step": 67305, "epoch": 1602} {"train_loss": -5.962687969207764, "global_step": 67306, "epoch": 1602} {"train_loss": -5.973989486694336, "global_step": 67307, "epoch": 1602} {"train_loss": -5.940011501312256, "global_step": 67308, "epoch": 1602} {"train_loss": -5.889917850494385, "global_step": 67309, "epoch": 1602} {"train_loss": -5.973148345947266, "global_step": 67310, "epoch": 1602} {"train_loss": -5.954607009887695, "global_step": 67311, "epoch": 1602} {"train_loss": -5.991498947143555, "global_step": 67312, "epoch": 1602} {"train_loss": -5.853351593017578, "global_step": 67313, "epoch": 1602} {"train_loss": -5.952816486358643, "global_step": 67314, "epoch": 1602} {"train_loss": -5.912270545959473, "global_step": 67315, "epoch": 1602} {"train_loss": -5.962862491607666, "global_step": 67316, "epoch": 1602} {"train_loss": -5.852203845977783, "global_step": 67317, "epoch": 1602} {"train_loss": -5.967658519744873, "global_step": 67318, "epoch": 1602} {"train_loss": -5.914778709411621, "global_step": 67319, "epoch": 1602} {"train_loss": -6.060704231262207, "global_step": 67320, "epoch": 1602} {"train_loss": -5.788128852844238, "global_step": 67321, "epoch": 1602} {"train_loss": -5.9716997146606445, "global_step": 67322, "epoch": 1602} {"train_loss": -6.018346309661865, "global_step": 67323, "epoch": 1602} {"train_loss": -6.020574569702148, "global_step": 67324, "epoch": 1602} {"train_loss": -5.994367134003412, "global_step": 67325, "epoch": 1602, "val_loss": 61696.5390625} {"train_loss": -6.045541763305664, "global_step": 67326, "epoch": 1603} {"train_loss": -5.984520435333252, "global_step": 67327, "epoch": 1603} {"train_loss": -6.038692951202393, "global_step": 67328, "epoch": 1603} {"train_loss": -6.03719425201416, "global_step": 67329, "epoch": 1603} {"train_loss": -6.1325578689575195, "global_step": 67330, "epoch": 1603} {"train_loss": -5.929129123687744, "global_step": 67331, "epoch": 1603} {"train_loss": -6.052255153656006, "global_step": 67332, "epoch": 1603} {"train_loss": -5.994057655334473, "global_step": 67333, "epoch": 1603} {"train_loss": -5.998186111450195, "global_step": 67334, "epoch": 1603} {"train_loss": -6.0929155349731445, "global_step": 67335, "epoch": 1603} {"train_loss": -5.9762773513793945, "global_step": 67336, "epoch": 1603} {"train_loss": -6.058418273925781, "global_step": 67337, "epoch": 1603} {"train_loss": -6.094725608825684, "global_step": 67338, "epoch": 1603} {"train_loss": -5.953315258026123, "global_step": 67339, "epoch": 1603} {"train_loss": -5.97144079208374, "global_step": 67340, "epoch": 1603} {"train_loss": -6.113353729248047, "global_step": 67341, "epoch": 1603} {"train_loss": -5.992123126983643, "global_step": 67342, "epoch": 1603} {"train_loss": -5.9778900146484375, "global_step": 67343, "epoch": 1603} {"train_loss": -6.073694705963135, "global_step": 67344, "epoch": 1603} {"train_loss": -6.022668361663818, "global_step": 67345, "epoch": 1603} {"train_loss": -6.11787223815918, "global_step": 67346, "epoch": 1603} {"train_loss": -6.025050163269043, "global_step": 67347, "epoch": 1603} {"train_loss": -6.060751438140869, "global_step": 67348, "epoch": 1603} {"train_loss": -5.852107048034668, "global_step": 67349, "epoch": 1603} {"train_loss": -6.132172584533691, "global_step": 67350, "epoch": 1603} {"train_loss": -6.103803634643555, "global_step": 67351, "epoch": 1603} {"train_loss": -6.076808929443359, "global_step": 67352, "epoch": 1603} {"train_loss": -6.114462852478027, "global_step": 67353, "epoch": 1603} {"train_loss": -6.075575828552246, "global_step": 67354, "epoch": 1603} {"train_loss": -6.041135787963867, "global_step": 67355, "epoch": 1603} {"train_loss": -6.0037078857421875, "global_step": 67356, "epoch": 1603} {"train_loss": -6.0927605628967285, "global_step": 67357, "epoch": 1603} {"train_loss": -6.060481071472168, "global_step": 67358, "epoch": 1603} {"train_loss": -5.953704833984375, "global_step": 67359, "epoch": 1603} {"train_loss": -6.018008232116699, "global_step": 67360, "epoch": 1603} {"train_loss": -6.0920729637146, "global_step": 67361, "epoch": 1603} {"train_loss": -5.974478244781494, "global_step": 67362, "epoch": 1603} {"train_loss": -5.939460754394531, "global_step": 67363, "epoch": 1603} {"train_loss": -5.911595344543457, "global_step": 67364, "epoch": 1603} {"train_loss": -6.039890766143799, "global_step": 67365, "epoch": 1603} {"train_loss": -5.9176554679870605, "global_step": 67366, "epoch": 1603} {"train_loss": -6.025611945561001, "global_step": 67367, "epoch": 1603, "val_loss": 61533.0078125} {"train_loss": -6.0608625411987305, "global_step": 67368, "epoch": 1604} {"train_loss": -5.991803169250488, "global_step": 67369, "epoch": 1604} {"train_loss": -6.0584211349487305, "global_step": 67370, "epoch": 1604} {"train_loss": -6.032118797302246, "global_step": 67371, "epoch": 1604} {"train_loss": -6.163302898406982, "global_step": 67372, "epoch": 1604} {"train_loss": -5.921621799468994, "global_step": 67373, "epoch": 1604} {"train_loss": -5.97857666015625, "global_step": 67374, "epoch": 1604} {"train_loss": -5.927840232849121, "global_step": 67375, "epoch": 1604} {"train_loss": -6.058480262756348, "global_step": 67376, "epoch": 1604} {"train_loss": -6.107786178588867, "global_step": 67377, "epoch": 1604} {"train_loss": -5.960927963256836, "global_step": 67378, "epoch": 1604} {"train_loss": -5.833578586578369, "global_step": 67379, "epoch": 1604} {"train_loss": -6.01212215423584, "global_step": 67380, "epoch": 1604} {"train_loss": -6.109519958496094, "global_step": 67381, "epoch": 1604} {"train_loss": -5.850458145141602, "global_step": 67382, "epoch": 1604} {"train_loss": -5.866644859313965, "global_step": 67383, "epoch": 1604} {"train_loss": -6.069758892059326, "global_step": 67384, "epoch": 1604} {"train_loss": -5.828941345214844, "global_step": 67385, "epoch": 1604} {"train_loss": -5.941545486450195, "global_step": 67386, "epoch": 1604} {"train_loss": -5.929110527038574, "global_step": 67387, "epoch": 1604} {"train_loss": -5.830615520477295, "global_step": 67388, "epoch": 1604} {"train_loss": -5.9267425537109375, "global_step": 67389, "epoch": 1604} {"train_loss": -5.952818870544434, "global_step": 67390, "epoch": 1604} {"train_loss": -5.842153072357178, "global_step": 67391, "epoch": 1604} {"train_loss": -5.935844421386719, "global_step": 67392, "epoch": 1604} {"train_loss": -5.885356903076172, "global_step": 67393, "epoch": 1604} {"train_loss": -6.083195686340332, "global_step": 67394, "epoch": 1604} {"train_loss": -5.871748924255371, "global_step": 67395, "epoch": 1604} {"train_loss": -5.94740104675293, "global_step": 67396, "epoch": 1604} {"train_loss": -5.903800964355469, "global_step": 67397, "epoch": 1604} {"train_loss": -5.936609268188477, "global_step": 67398, "epoch": 1604} {"train_loss": -5.986159324645996, "global_step": 67399, "epoch": 1604} {"train_loss": -5.838456153869629, "global_step": 67400, "epoch": 1604} {"train_loss": -5.812675952911377, "global_step": 67401, "epoch": 1604} {"train_loss": -5.837189197540283, "global_step": 67402, "epoch": 1604} {"train_loss": -5.844574451446533, "global_step": 67403, "epoch": 1604} {"train_loss": -5.901283264160156, "global_step": 67404, "epoch": 1604} {"train_loss": -6.039317607879639, "global_step": 67405, "epoch": 1604} {"train_loss": -5.939774036407471, "global_step": 67406, "epoch": 1604} {"train_loss": -5.918992042541504, "global_step": 67407, "epoch": 1604} {"train_loss": -5.971701622009277, "global_step": 67408, "epoch": 1604} {"train_loss": -5.948696885790143, "global_step": 67409, "epoch": 1604, "val_loss": 62071.04296875} {"train_loss": -6.005467891693115, "global_step": 67410, "epoch": 1605} {"train_loss": -5.916616439819336, "global_step": 67411, "epoch": 1605} {"train_loss": -5.9714460372924805, "global_step": 67412, "epoch": 1605} {"train_loss": -5.975666046142578, "global_step": 67413, "epoch": 1605} {"train_loss": -6.009617805480957, "global_step": 67414, "epoch": 1605} {"train_loss": -6.0233635902404785, "global_step": 67415, "epoch": 1605} {"train_loss": -5.946091651916504, "global_step": 67416, "epoch": 1605} {"train_loss": -6.027456760406494, "global_step": 67417, "epoch": 1605} {"train_loss": -5.859683513641357, "global_step": 67418, "epoch": 1605} {"train_loss": -6.160722732543945, "global_step": 67419, "epoch": 1605} {"train_loss": -6.028295040130615, "global_step": 67420, "epoch": 1605} {"train_loss": -5.921980381011963, "global_step": 67421, "epoch": 1605} {"train_loss": -6.000497817993164, "global_step": 67422, "epoch": 1605} {"train_loss": -6.0548505783081055, "global_step": 67423, "epoch": 1605} {"train_loss": -6.0860137939453125, "global_step": 67424, "epoch": 1605} {"train_loss": -5.966496467590332, "global_step": 67425, "epoch": 1605} {"train_loss": -5.966724395751953, "global_step": 67426, "epoch": 1605} {"train_loss": -6.001502513885498, "global_step": 67427, "epoch": 1605} {"train_loss": -5.9138875007629395, "global_step": 67428, "epoch": 1605} {"train_loss": -6.127849578857422, "global_step": 67429, "epoch": 1605} {"train_loss": -6.119556427001953, "global_step": 67430, "epoch": 1605} {"train_loss": -6.057517051696777, "global_step": 67431, "epoch": 1605} {"train_loss": -5.9841156005859375, "global_step": 67432, "epoch": 1605} {"train_loss": -6.097097396850586, "global_step": 67433, "epoch": 1605} {"train_loss": -5.8666791915893555, "global_step": 67434, "epoch": 1605} {"train_loss": -5.978854179382324, "global_step": 67435, "epoch": 1605} {"train_loss": -5.949880599975586, "global_step": 67436, "epoch": 1605} {"train_loss": -6.01854133605957, "global_step": 67437, "epoch": 1605} {"train_loss": -6.029341220855713, "global_step": 67438, "epoch": 1605} {"train_loss": -6.040117263793945, "global_step": 67439, "epoch": 1605} {"train_loss": -5.9624528884887695, "global_step": 67440, "epoch": 1605} {"train_loss": -5.9641571044921875, "global_step": 67441, "epoch": 1605} {"train_loss": -5.93666410446167, "global_step": 67442, "epoch": 1605} {"train_loss": -5.855682373046875, "global_step": 67443, "epoch": 1605} {"train_loss": -6.003108024597168, "global_step": 67444, "epoch": 1605} {"train_loss": -6.032953262329102, "global_step": 67445, "epoch": 1605} {"train_loss": -5.997407913208008, "global_step": 67446, "epoch": 1605} {"train_loss": -5.935258865356445, "global_step": 67447, "epoch": 1605} {"train_loss": -6.038551330566406, "global_step": 67448, "epoch": 1605} {"train_loss": -5.910558700561523, "global_step": 67449, "epoch": 1605} {"train_loss": -5.988624572753906, "global_step": 67450, "epoch": 1605} {"train_loss": -5.991939317612421, "global_step": 67451, "epoch": 1605, "val_loss": 61757.8359375} {"train_loss": -6.01622200012207, "global_step": 67452, "epoch": 1606} {"train_loss": -5.954431533813477, "global_step": 67453, "epoch": 1606} {"train_loss": -6.044157981872559, "global_step": 67454, "epoch": 1606} {"train_loss": -5.992459297180176, "global_step": 67455, "epoch": 1606} {"train_loss": -6.011662006378174, "global_step": 67456, "epoch": 1606} {"train_loss": -5.855110168457031, "global_step": 67457, "epoch": 1606} {"train_loss": -6.033515930175781, "global_step": 67458, "epoch": 1606} {"train_loss": -5.9765214920043945, "global_step": 67459, "epoch": 1606} {"train_loss": -5.8131585121154785, "global_step": 67460, "epoch": 1606} {"train_loss": -6.035656452178955, "global_step": 67461, "epoch": 1606} {"train_loss": -5.9487624168396, "global_step": 67462, "epoch": 1606} {"train_loss": -6.084933280944824, "global_step": 67463, "epoch": 1606} {"train_loss": -6.074026584625244, "global_step": 67464, "epoch": 1606} {"train_loss": -5.937742233276367, "global_step": 67465, "epoch": 1606} {"train_loss": -5.985536575317383, "global_step": 67466, "epoch": 1606} {"train_loss": -6.06926155090332, "global_step": 67467, "epoch": 1606} {"train_loss": -6.108039379119873, "global_step": 67468, "epoch": 1606} {"train_loss": -6.067842483520508, "global_step": 67469, "epoch": 1606} {"train_loss": -6.006990432739258, "global_step": 67470, "epoch": 1606} {"train_loss": -6.106576919555664, "global_step": 67471, "epoch": 1606} {"train_loss": -6.045823574066162, "global_step": 67472, "epoch": 1606} {"train_loss": -6.120719909667969, "global_step": 67473, "epoch": 1606} {"train_loss": -6.018560409545898, "global_step": 67474, "epoch": 1606} {"train_loss": -6.084403038024902, "global_step": 67475, "epoch": 1606} {"train_loss": -6.013286590576172, "global_step": 67476, "epoch": 1606} {"train_loss": -6.0160980224609375, "global_step": 67477, "epoch": 1606} {"train_loss": -6.037311553955078, "global_step": 67478, "epoch": 1606} {"train_loss": -5.939253807067871, "global_step": 67479, "epoch": 1606} {"train_loss": -6.084919452667236, "global_step": 67480, "epoch": 1606} {"train_loss": -6.075008392333984, "global_step": 67481, "epoch": 1606} {"train_loss": -5.923198699951172, "global_step": 67482, "epoch": 1606} {"train_loss": -5.978431701660156, "global_step": 67483, "epoch": 1606} {"train_loss": -6.049854755401611, "global_step": 67484, "epoch": 1606} {"train_loss": -6.041933059692383, "global_step": 67485, "epoch": 1606} {"train_loss": -6.136969566345215, "global_step": 67486, "epoch": 1606} {"train_loss": -5.985360622406006, "global_step": 67487, "epoch": 1606} {"train_loss": -5.978340148925781, "global_step": 67488, "epoch": 1606} {"train_loss": -6.088143348693848, "global_step": 67489, "epoch": 1606} {"train_loss": -5.978849411010742, "global_step": 67490, "epoch": 1606} {"train_loss": -5.913212776184082, "global_step": 67491, "epoch": 1606} {"train_loss": -5.927034378051758, "global_step": 67492, "epoch": 1606} {"train_loss": -6.014609359559559, "global_step": 67493, "epoch": 1606, "val_loss": 61800.5703125} {"train_loss": -5.906953811645508, "global_step": 67494, "epoch": 1607} {"train_loss": -5.966843128204346, "global_step": 67495, "epoch": 1607} {"train_loss": -6.05910587310791, "global_step": 67496, "epoch": 1607} {"train_loss": -5.868887901306152, "global_step": 67497, "epoch": 1607} {"train_loss": -5.929803371429443, "global_step": 67498, "epoch": 1607} {"train_loss": -5.885008811950684, "global_step": 67499, "epoch": 1607} {"train_loss": -5.862517833709717, "global_step": 67500, "epoch": 1607} {"train_loss": -5.991987228393555, "global_step": 67501, "epoch": 1607} {"train_loss": -5.856411933898926, "global_step": 67502, "epoch": 1607} {"train_loss": -5.902654647827148, "global_step": 67503, "epoch": 1607} {"train_loss": -6.021641731262207, "global_step": 67504, "epoch": 1607} {"train_loss": -5.944542407989502, "global_step": 67505, "epoch": 1607} {"train_loss": -6.0009379386901855, "global_step": 67506, "epoch": 1607} {"train_loss": -5.986522674560547, "global_step": 67507, "epoch": 1607} {"train_loss": -5.9419145584106445, "global_step": 67508, "epoch": 1607} {"train_loss": -5.879021167755127, "global_step": 67509, "epoch": 1607} {"train_loss": -5.984753608703613, "global_step": 67510, "epoch": 1607} {"train_loss": -5.885109901428223, "global_step": 67511, "epoch": 1607} {"train_loss": -6.116547584533691, "global_step": 67512, "epoch": 1607} {"train_loss": -5.807032108306885, "global_step": 67513, "epoch": 1607} {"train_loss": -5.845854759216309, "global_step": 67514, "epoch": 1607} {"train_loss": -6.0648298263549805, "global_step": 67515, "epoch": 1607} {"train_loss": -5.934567928314209, "global_step": 67516, "epoch": 1607} {"train_loss": -5.928539276123047, "global_step": 67517, "epoch": 1607} {"train_loss": -5.967927932739258, "global_step": 67518, "epoch": 1607} {"train_loss": -6.009128570556641, "global_step": 67519, "epoch": 1607} {"train_loss": -5.882470607757568, "global_step": 67520, "epoch": 1607} {"train_loss": -5.8124098777771, "global_step": 67521, "epoch": 1607} {"train_loss": -5.863329887390137, "global_step": 67522, "epoch": 1607} {"train_loss": -5.870388507843018, "global_step": 67523, "epoch": 1607} {"train_loss": -6.045915603637695, "global_step": 67524, "epoch": 1607} {"train_loss": -6.042855262756348, "global_step": 67525, "epoch": 1607} {"train_loss": -5.753974914550781, "global_step": 67526, "epoch": 1607} {"train_loss": -6.085380554199219, "global_step": 67527, "epoch": 1607} {"train_loss": -5.951545715332031, "global_step": 67528, "epoch": 1607} {"train_loss": -5.987062454223633, "global_step": 67529, "epoch": 1607} {"train_loss": -5.911513328552246, "global_step": 67530, "epoch": 1607} {"train_loss": -6.024742603302002, "global_step": 67531, "epoch": 1607} {"train_loss": -5.994181156158447, "global_step": 67532, "epoch": 1607} {"train_loss": -5.888551712036133, "global_step": 67533, "epoch": 1607} {"train_loss": -5.8616943359375, "global_step": 67534, "epoch": 1607} {"train_loss": -5.940497625441778, "global_step": 67535, "epoch": 1607, "val_loss": 61642.61328125} {"train_loss": -6.105714797973633, "global_step": 67536, "epoch": 1608} {"train_loss": -6.082221508026123, "global_step": 67537, "epoch": 1608} {"train_loss": -5.923992156982422, "global_step": 67538, "epoch": 1608} {"train_loss": -5.992524147033691, "global_step": 67539, "epoch": 1608} {"train_loss": -5.979578495025635, "global_step": 67540, "epoch": 1608} {"train_loss": -5.927094459533691, "global_step": 67541, "epoch": 1608} {"train_loss": -6.046616077423096, "global_step": 67542, "epoch": 1608} {"train_loss": -6.087301254272461, "global_step": 67543, "epoch": 1608} {"train_loss": -5.984638214111328, "global_step": 67544, "epoch": 1608} {"train_loss": -5.970092296600342, "global_step": 67545, "epoch": 1608} {"train_loss": -5.899521350860596, "global_step": 67546, "epoch": 1608} {"train_loss": -6.156208515167236, "global_step": 67547, "epoch": 1608} {"train_loss": -5.9785847663879395, "global_step": 67548, "epoch": 1608} {"train_loss": -5.975950717926025, "global_step": 67549, "epoch": 1608} {"train_loss": -6.001159191131592, "global_step": 67550, "epoch": 1608} {"train_loss": -5.902149200439453, "global_step": 67551, "epoch": 1608} {"train_loss": -5.919486999511719, "global_step": 67552, "epoch": 1608} {"train_loss": -5.954107284545898, "global_step": 67553, "epoch": 1608} {"train_loss": -5.8939714431762695, "global_step": 67554, "epoch": 1608} {"train_loss": -5.8985395431518555, "global_step": 67555, "epoch": 1608} {"train_loss": -5.946589469909668, "global_step": 67556, "epoch": 1608} {"train_loss": -6.020563125610352, "global_step": 67557, "epoch": 1608} {"train_loss": -6.0449395179748535, "global_step": 67558, "epoch": 1608} {"train_loss": -5.944460391998291, "global_step": 67559, "epoch": 1608} {"train_loss": -6.129093170166016, "global_step": 67560, "epoch": 1608} {"train_loss": -5.994272708892822, "global_step": 67561, "epoch": 1608} {"train_loss": -5.991336345672607, "global_step": 67562, "epoch": 1608} {"train_loss": -5.918947696685791, "global_step": 67563, "epoch": 1608} {"train_loss": -6.014739036560059, "global_step": 67564, "epoch": 1608} {"train_loss": -5.880478858947754, "global_step": 67565, "epoch": 1608} {"train_loss": -5.972432613372803, "global_step": 67566, "epoch": 1608} {"train_loss": -6.018460750579834, "global_step": 67567, "epoch": 1608} {"train_loss": -5.9774885177612305, "global_step": 67568, "epoch": 1608} {"train_loss": -6.013469696044922, "global_step": 67569, "epoch": 1608} {"train_loss": -6.07493782043457, "global_step": 67570, "epoch": 1608} {"train_loss": -6.064211845397949, "global_step": 67571, "epoch": 1608} {"train_loss": -5.9665303230285645, "global_step": 67572, "epoch": 1608} {"train_loss": -5.993222713470459, "global_step": 67573, "epoch": 1608} {"train_loss": -6.036401748657227, "global_step": 67574, "epoch": 1608} {"train_loss": -5.96242618560791, "global_step": 67575, "epoch": 1608} {"train_loss": -6.045482158660889, "global_step": 67576, "epoch": 1608} {"train_loss": -5.994221153713408, "global_step": 67577, "epoch": 1608, "val_loss": 61733.77734375} {"train_loss": -5.929932594299316, "global_step": 67578, "epoch": 1609} {"train_loss": -5.901040554046631, "global_step": 67579, "epoch": 1609} {"train_loss": -5.949824810028076, "global_step": 67580, "epoch": 1609} {"train_loss": -5.882630348205566, "global_step": 67581, "epoch": 1609} {"train_loss": -5.9812774658203125, "global_step": 67582, "epoch": 1609} {"train_loss": -5.970270156860352, "global_step": 67583, "epoch": 1609} {"train_loss": -6.115339279174805, "global_step": 67584, "epoch": 1609} {"train_loss": -6.075313568115234, "global_step": 67585, "epoch": 1609} {"train_loss": -5.920554161071777, "global_step": 67586, "epoch": 1609} {"train_loss": -5.942498207092285, "global_step": 67587, "epoch": 1609} {"train_loss": -6.007680416107178, "global_step": 67588, "epoch": 1609} {"train_loss": -5.99818229675293, "global_step": 67589, "epoch": 1609} {"train_loss": -6.098273754119873, "global_step": 67590, "epoch": 1609} {"train_loss": -5.925540924072266, "global_step": 67591, "epoch": 1609} {"train_loss": -6.013542175292969, "global_step": 67592, "epoch": 1609} {"train_loss": -6.028353214263916, "global_step": 67593, "epoch": 1609} {"train_loss": -5.896914005279541, "global_step": 67594, "epoch": 1609} {"train_loss": -6.0148115158081055, "global_step": 67595, "epoch": 1609} {"train_loss": -6.017051696777344, "global_step": 67596, "epoch": 1609} {"train_loss": -6.050337791442871, "global_step": 67597, "epoch": 1609} {"train_loss": -5.962807655334473, "global_step": 67598, "epoch": 1609} {"train_loss": -5.954647064208984, "global_step": 67599, "epoch": 1609} {"train_loss": -6.005846977233887, "global_step": 67600, "epoch": 1609} {"train_loss": -6.0688252449035645, "global_step": 67601, "epoch": 1609} {"train_loss": -5.946337699890137, "global_step": 67602, "epoch": 1609} {"train_loss": -6.0257110595703125, "global_step": 67603, "epoch": 1609} {"train_loss": -5.945942401885986, "global_step": 67604, "epoch": 1609} {"train_loss": -6.074720859527588, "global_step": 67605, "epoch": 1609} {"train_loss": -5.9643964767456055, "global_step": 67606, "epoch": 1609} {"train_loss": -5.796832084655762, "global_step": 67607, "epoch": 1609} {"train_loss": -6.116213798522949, "global_step": 67608, "epoch": 1609} {"train_loss": -5.988015174865723, "global_step": 67609, "epoch": 1609} {"train_loss": -5.895132541656494, "global_step": 67610, "epoch": 1609} {"train_loss": -6.019240379333496, "global_step": 67611, "epoch": 1609} {"train_loss": -5.894660472869873, "global_step": 67612, "epoch": 1609} {"train_loss": -5.965853691101074, "global_step": 67613, "epoch": 1609} {"train_loss": -5.955440521240234, "global_step": 67614, "epoch": 1609} {"train_loss": -6.077908515930176, "global_step": 67615, "epoch": 1609} {"train_loss": -6.017481803894043, "global_step": 67616, "epoch": 1609} {"train_loss": -5.928417205810547, "global_step": 67617, "epoch": 1609} {"train_loss": -5.98477840423584, "global_step": 67618, "epoch": 1609} {"train_loss": -5.9802070912860685, "global_step": 67619, "epoch": 1609, "val_loss": 61505.25390625} {"train_loss": -5.896974086761475, "global_step": 67620, "epoch": 1610} {"train_loss": -5.834926605224609, "global_step": 67621, "epoch": 1610} {"train_loss": -6.022425651550293, "global_step": 67622, "epoch": 1610} {"train_loss": -5.944016456604004, "global_step": 67623, "epoch": 1610} {"train_loss": -5.864457130432129, "global_step": 67624, "epoch": 1610} {"train_loss": -6.067951679229736, "global_step": 67625, "epoch": 1610} {"train_loss": -5.994218349456787, "global_step": 67626, "epoch": 1610} {"train_loss": -5.961953163146973, "global_step": 67627, "epoch": 1610} {"train_loss": -6.023252487182617, "global_step": 67628, "epoch": 1610} {"train_loss": -5.92437744140625, "global_step": 67629, "epoch": 1610} {"train_loss": -6.084660053253174, "global_step": 67630, "epoch": 1610} {"train_loss": -6.02387809753418, "global_step": 67631, "epoch": 1610} {"train_loss": -5.964540958404541, "global_step": 67632, "epoch": 1610} {"train_loss": -6.069553375244141, "global_step": 67633, "epoch": 1610} {"train_loss": -5.942713737487793, "global_step": 67634, "epoch": 1610} {"train_loss": -6.0178070068359375, "global_step": 67635, "epoch": 1610} {"train_loss": -6.0069780349731445, "global_step": 67636, "epoch": 1610} {"train_loss": -6.017394065856934, "global_step": 67637, "epoch": 1610} {"train_loss": -5.988651752471924, "global_step": 67638, "epoch": 1610} {"train_loss": -6.1304521560668945, "global_step": 67639, "epoch": 1610} {"train_loss": -5.997260570526123, "global_step": 67640, "epoch": 1610} {"train_loss": -5.92169189453125, "global_step": 67641, "epoch": 1610} {"train_loss": -5.957301139831543, "global_step": 67642, "epoch": 1610} {"train_loss": -6.039074897766113, "global_step": 67643, "epoch": 1610} {"train_loss": -5.916568279266357, "global_step": 67644, "epoch": 1610} {"train_loss": -6.003144264221191, "global_step": 67645, "epoch": 1610} {"train_loss": -6.01113748550415, "global_step": 67646, "epoch": 1610} {"train_loss": -6.063205718994141, "global_step": 67647, "epoch": 1610} {"train_loss": -6.099003791809082, "global_step": 67648, "epoch": 1610} {"train_loss": -6.072412967681885, "global_step": 67649, "epoch": 1610} {"train_loss": -6.023690223693848, "global_step": 67650, "epoch": 1610} {"train_loss": -6.032000541687012, "global_step": 67651, "epoch": 1610} {"train_loss": -5.945776462554932, "global_step": 67652, "epoch": 1610} {"train_loss": -6.048895835876465, "global_step": 67653, "epoch": 1610} {"train_loss": -6.018072605133057, "global_step": 67654, "epoch": 1610} {"train_loss": -6.033135414123535, "global_step": 67655, "epoch": 1610} {"train_loss": -6.039868354797363, "global_step": 67656, "epoch": 1610} {"train_loss": -6.020804405212402, "global_step": 67657, "epoch": 1610} {"train_loss": -5.970736980438232, "global_step": 67658, "epoch": 1610} {"train_loss": -5.971994400024414, "global_step": 67659, "epoch": 1610} {"train_loss": -6.013936996459961, "global_step": 67660, "epoch": 1610} {"train_loss": -5.998225427809215, "global_step": 67661, "epoch": 1610, "val_loss": 61653.61328125} {"train_loss": -5.9956135749816895, "global_step": 67662, "epoch": 1611} {"train_loss": -5.78511905670166, "global_step": 67663, "epoch": 1611} {"train_loss": -6.042584419250488, "global_step": 67664, "epoch": 1611} {"train_loss": -5.976746082305908, "global_step": 67665, "epoch": 1611} {"train_loss": -5.915414333343506, "global_step": 67666, "epoch": 1611} {"train_loss": -6.02505350112915, "global_step": 67667, "epoch": 1611} {"train_loss": -6.17838716506958, "global_step": 67668, "epoch": 1611} {"train_loss": -6.036791801452637, "global_step": 67669, "epoch": 1611} {"train_loss": -6.041939735412598, "global_step": 67670, "epoch": 1611} {"train_loss": -5.982348442077637, "global_step": 67671, "epoch": 1611} {"train_loss": -5.981842041015625, "global_step": 67672, "epoch": 1611} {"train_loss": -5.935210227966309, "global_step": 67673, "epoch": 1611} {"train_loss": -6.029538154602051, "global_step": 67674, "epoch": 1611} {"train_loss": -6.0531744956970215, "global_step": 67675, "epoch": 1611} {"train_loss": -5.8364105224609375, "global_step": 67676, "epoch": 1611} {"train_loss": -6.103099346160889, "global_step": 67677, "epoch": 1611} {"train_loss": -5.942012786865234, "global_step": 67678, "epoch": 1611} {"train_loss": -5.98127555847168, "global_step": 67679, "epoch": 1611} {"train_loss": -6.077319145202637, "global_step": 67680, "epoch": 1611} {"train_loss": -6.074965000152588, "global_step": 67681, "epoch": 1611} {"train_loss": -6.0367889404296875, "global_step": 67682, "epoch": 1611} {"train_loss": -6.0318403244018555, "global_step": 67683, "epoch": 1611} {"train_loss": -5.970557689666748, "global_step": 67684, "epoch": 1611} {"train_loss": -6.1656694412231445, "global_step": 67685, "epoch": 1611} {"train_loss": -6.094797134399414, "global_step": 67686, "epoch": 1611} {"train_loss": -5.997349739074707, "global_step": 67687, "epoch": 1611} {"train_loss": -5.863492012023926, "global_step": 67688, "epoch": 1611} {"train_loss": -6.198430061340332, "global_step": 67689, "epoch": 1611} {"train_loss": -5.806070804595947, "global_step": 67690, "epoch": 1611} {"train_loss": -6.005203723907471, "global_step": 67691, "epoch": 1611} {"train_loss": -5.930442810058594, "global_step": 67692, "epoch": 1611} {"train_loss": -5.773983955383301, "global_step": 67693, "epoch": 1611} {"train_loss": -5.8922953605651855, "global_step": 67694, "epoch": 1611} {"train_loss": -5.849827766418457, "global_step": 67695, "epoch": 1611} {"train_loss": -5.926825523376465, "global_step": 67696, "epoch": 1611} {"train_loss": -5.763733863830566, "global_step": 67697, "epoch": 1611} {"train_loss": -5.8568501472473145, "global_step": 67698, "epoch": 1611} {"train_loss": -5.962128639221191, "global_step": 67699, "epoch": 1611} {"train_loss": -5.92960786819458, "global_step": 67700, "epoch": 1611} {"train_loss": -5.836585521697998, "global_step": 67701, "epoch": 1611} {"train_loss": -5.885586738586426, "global_step": 67702, "epoch": 1611} {"train_loss": -5.97146479288737, "global_step": 67703, "epoch": 1611, "val_loss": 61699.640625} {"train_loss": -5.9441022872924805, "global_step": 67704, "epoch": 1612} {"train_loss": -6.019034385681152, "global_step": 67705, "epoch": 1612} {"train_loss": -5.940124034881592, "global_step": 67706, "epoch": 1612} {"train_loss": -6.034395694732666, "global_step": 67707, "epoch": 1612} {"train_loss": -5.943733215332031, "global_step": 67708, "epoch": 1612} {"train_loss": -5.999533176422119, "global_step": 67709, "epoch": 1612} {"train_loss": -5.9923858642578125, "global_step": 67710, "epoch": 1612} {"train_loss": -6.020476341247559, "global_step": 67711, "epoch": 1612} {"train_loss": -6.024478435516357, "global_step": 67712, "epoch": 1612} {"train_loss": -6.020003318786621, "global_step": 67713, "epoch": 1612} {"train_loss": -6.0395588874816895, "global_step": 67714, "epoch": 1612} {"train_loss": -5.949993133544922, "global_step": 67715, "epoch": 1612} {"train_loss": -5.894628047943115, "global_step": 67716, "epoch": 1612} {"train_loss": -6.109168529510498, "global_step": 67717, "epoch": 1612} {"train_loss": -6.128293037414551, "global_step": 67718, "epoch": 1612} {"train_loss": -6.077786922454834, "global_step": 67719, "epoch": 1612} {"train_loss": -5.960157871246338, "global_step": 67720, "epoch": 1612} {"train_loss": -6.058585166931152, "global_step": 67721, "epoch": 1612} {"train_loss": -6.009993553161621, "global_step": 67722, "epoch": 1612} {"train_loss": -6.052218914031982, "global_step": 67723, "epoch": 1612} {"train_loss": -5.867686748504639, "global_step": 67724, "epoch": 1612} {"train_loss": -5.943665504455566, "global_step": 67725, "epoch": 1612} {"train_loss": -6.0318827629089355, "global_step": 67726, "epoch": 1612} {"train_loss": -5.925274848937988, "global_step": 67727, "epoch": 1612} {"train_loss": -6.078256130218506, "global_step": 67728, "epoch": 1612} {"train_loss": -5.98723030090332, "global_step": 67729, "epoch": 1612} {"train_loss": -5.995674133300781, "global_step": 67730, "epoch": 1612} {"train_loss": -5.960309028625488, "global_step": 67731, "epoch": 1612} {"train_loss": -5.925142765045166, "global_step": 67732, "epoch": 1612} {"train_loss": -5.96220064163208, "global_step": 67733, "epoch": 1612} {"train_loss": -5.892168045043945, "global_step": 67734, "epoch": 1612} {"train_loss": -6.028200149536133, "global_step": 67735, "epoch": 1612} {"train_loss": -6.034152984619141, "global_step": 67736, "epoch": 1612} {"train_loss": -5.992252349853516, "global_step": 67737, "epoch": 1612} {"train_loss": -5.9380364418029785, "global_step": 67738, "epoch": 1612} {"train_loss": -6.0940046310424805, "global_step": 67739, "epoch": 1612} {"train_loss": -6.0384907722473145, "global_step": 67740, "epoch": 1612} {"train_loss": -6.016291618347168, "global_step": 67741, "epoch": 1612} {"train_loss": -6.077532768249512, "global_step": 67742, "epoch": 1612} {"train_loss": -5.908313751220703, "global_step": 67743, "epoch": 1612} {"train_loss": -6.109812259674072, "global_step": 67744, "epoch": 1612} {"train_loss": -6.000575519743419, "global_step": 67745, "epoch": 1612, "val_loss": 61604.39453125} {"train_loss": -5.86321496963501, "global_step": 67746, "epoch": 1613} {"train_loss": -5.972496032714844, "global_step": 67747, "epoch": 1613} {"train_loss": -5.973614692687988, "global_step": 67748, "epoch": 1613} {"train_loss": -6.064311981201172, "global_step": 67749, "epoch": 1613} {"train_loss": -6.013443946838379, "global_step": 67750, "epoch": 1613} {"train_loss": -5.998865127563477, "global_step": 67751, "epoch": 1613} {"train_loss": -6.018581390380859, "global_step": 67752, "epoch": 1613} {"train_loss": -5.929047584533691, "global_step": 67753, "epoch": 1613} {"train_loss": -6.062223434448242, "global_step": 67754, "epoch": 1613} {"train_loss": -6.032444000244141, "global_step": 67755, "epoch": 1613} {"train_loss": -6.046013355255127, "global_step": 67756, "epoch": 1613} {"train_loss": -5.969099044799805, "global_step": 67757, "epoch": 1613} {"train_loss": -5.996061325073242, "global_step": 67758, "epoch": 1613} {"train_loss": -6.023196220397949, "global_step": 67759, "epoch": 1613} {"train_loss": -6.164162635803223, "global_step": 67760, "epoch": 1613} {"train_loss": -6.017706871032715, "global_step": 67761, "epoch": 1613} {"train_loss": -6.058706283569336, "global_step": 67762, "epoch": 1613} {"train_loss": -5.988005638122559, "global_step": 67763, "epoch": 1613} {"train_loss": -6.048545837402344, "global_step": 67764, "epoch": 1613} {"train_loss": -6.035330295562744, "global_step": 67765, "epoch": 1613} {"train_loss": -5.982338905334473, "global_step": 67766, "epoch": 1613} {"train_loss": -5.953412055969238, "global_step": 67767, "epoch": 1613} {"train_loss": -6.053520679473877, "global_step": 67768, "epoch": 1613} {"train_loss": -6.067744731903076, "global_step": 67769, "epoch": 1613} {"train_loss": -6.109283447265625, "global_step": 67770, "epoch": 1613} {"train_loss": -5.954161167144775, "global_step": 67771, "epoch": 1613} {"train_loss": -6.027701377868652, "global_step": 67772, "epoch": 1613} {"train_loss": -6.053204536437988, "global_step": 67773, "epoch": 1613} {"train_loss": -5.961297988891602, "global_step": 67774, "epoch": 1613} {"train_loss": -5.999973297119141, "global_step": 67775, "epoch": 1613} {"train_loss": -5.928313732147217, "global_step": 67776, "epoch": 1613} {"train_loss": -5.992054462432861, "global_step": 67777, "epoch": 1613} {"train_loss": -6.0915422439575195, "global_step": 67778, "epoch": 1613} {"train_loss": -6.077559471130371, "global_step": 67779, "epoch": 1613} {"train_loss": -5.977433204650879, "global_step": 67780, "epoch": 1613} {"train_loss": -6.079063415527344, "global_step": 67781, "epoch": 1613} {"train_loss": -6.0108442306518555, "global_step": 67782, "epoch": 1613} {"train_loss": -6.014454364776611, "global_step": 67783, "epoch": 1613} {"train_loss": -6.050281047821045, "global_step": 67784, "epoch": 1613} {"train_loss": -6.056680679321289, "global_step": 67785, "epoch": 1613} {"train_loss": -6.066573143005371, "global_step": 67786, "epoch": 1613} {"train_loss": -6.0199731304532005, "global_step": 67787, "epoch": 1613, "val_loss": 61402.87890625} {"train_loss": -6.034341812133789, "global_step": 67788, "epoch": 1614} {"train_loss": -5.952054023742676, "global_step": 67789, "epoch": 1614} {"train_loss": -6.096417427062988, "global_step": 67790, "epoch": 1614} {"train_loss": -5.923639297485352, "global_step": 67791, "epoch": 1614} {"train_loss": -6.0022382736206055, "global_step": 67792, "epoch": 1614} {"train_loss": -5.9802398681640625, "global_step": 67793, "epoch": 1614} {"train_loss": -6.016849994659424, "global_step": 67794, "epoch": 1614} {"train_loss": -6.05478048324585, "global_step": 67795, "epoch": 1614} {"train_loss": -6.066292762756348, "global_step": 67796, "epoch": 1614} {"train_loss": -6.129087448120117, "global_step": 67797, "epoch": 1614} {"train_loss": -6.07388162612915, "global_step": 67798, "epoch": 1614} {"train_loss": -6.003077030181885, "global_step": 67799, "epoch": 1614} {"train_loss": -6.047598838806152, "global_step": 67800, "epoch": 1614} {"train_loss": -6.06324577331543, "global_step": 67801, "epoch": 1614} {"train_loss": -6.027744293212891, "global_step": 67802, "epoch": 1614} {"train_loss": -6.079184532165527, "global_step": 67803, "epoch": 1614} {"train_loss": -5.9594926834106445, "global_step": 67804, "epoch": 1614} {"train_loss": -6.070137023925781, "global_step": 67805, "epoch": 1614} {"train_loss": -6.038393020629883, "global_step": 67806, "epoch": 1614} {"train_loss": -6.047065734863281, "global_step": 67807, "epoch": 1614} {"train_loss": -6.0025200843811035, "global_step": 67808, "epoch": 1614} {"train_loss": -5.9883623123168945, "global_step": 67809, "epoch": 1614} {"train_loss": -6.067053318023682, "global_step": 67810, "epoch": 1614} {"train_loss": -5.885666847229004, "global_step": 67811, "epoch": 1614} {"train_loss": -6.032148361206055, "global_step": 67812, "epoch": 1614} {"train_loss": -6.035961151123047, "global_step": 67813, "epoch": 1614} {"train_loss": -6.071241855621338, "global_step": 67814, "epoch": 1614} {"train_loss": -5.9094462394714355, "global_step": 67815, "epoch": 1614} {"train_loss": -6.058449745178223, "global_step": 67816, "epoch": 1614} {"train_loss": -6.0849609375, "global_step": 67817, "epoch": 1614} {"train_loss": -6.2026824951171875, "global_step": 67818, "epoch": 1614} {"train_loss": -6.16232967376709, "global_step": 67819, "epoch": 1614} {"train_loss": -6.080901145935059, "global_step": 67820, "epoch": 1614} {"train_loss": -5.969867706298828, "global_step": 67821, "epoch": 1614} {"train_loss": -5.961757659912109, "global_step": 67822, "epoch": 1614} {"train_loss": -6.053314208984375, "global_step": 67823, "epoch": 1614} {"train_loss": -6.1318359375, "global_step": 67824, "epoch": 1614} {"train_loss": -5.983262062072754, "global_step": 67825, "epoch": 1614} {"train_loss": -6.149404048919678, "global_step": 67826, "epoch": 1614} {"train_loss": -5.79595422744751, "global_step": 67827, "epoch": 1614} {"train_loss": -6.001217365264893, "global_step": 67828, "epoch": 1614} {"train_loss": -6.031920115152995, "global_step": 67829, "epoch": 1614, "val_loss": 61420.0078125} {"train_loss": -6.133490562438965, "global_step": 67830, "epoch": 1615} {"train_loss": -6.063443183898926, "global_step": 67831, "epoch": 1615} {"train_loss": -6.064280986785889, "global_step": 67832, "epoch": 1615} {"train_loss": -6.042862892150879, "global_step": 67833, "epoch": 1615} {"train_loss": -6.136901378631592, "global_step": 67834, "epoch": 1615} {"train_loss": -6.067975997924805, "global_step": 67835, "epoch": 1615} {"train_loss": -6.105688095092773, "global_step": 67836, "epoch": 1615} {"train_loss": -6.064256191253662, "global_step": 67837, "epoch": 1615} {"train_loss": -5.94713020324707, "global_step": 67838, "epoch": 1615} {"train_loss": -6.0127668380737305, "global_step": 67839, "epoch": 1615} {"train_loss": -5.948421478271484, "global_step": 67840, "epoch": 1615} {"train_loss": -6.132837772369385, "global_step": 67841, "epoch": 1615} {"train_loss": -5.961400985717773, "global_step": 67842, "epoch": 1615} {"train_loss": -5.8929338455200195, "global_step": 67843, "epoch": 1615} {"train_loss": -5.848006248474121, "global_step": 67844, "epoch": 1615} {"train_loss": -5.989886283874512, "global_step": 67845, "epoch": 1615} {"train_loss": -5.975130558013916, "global_step": 67846, "epoch": 1615} {"train_loss": -6.02849006652832, "global_step": 67847, "epoch": 1615} {"train_loss": -6.040492534637451, "global_step": 67848, "epoch": 1615} {"train_loss": -5.844078063964844, "global_step": 67849, "epoch": 1615} {"train_loss": -6.046178817749023, "global_step": 67850, "epoch": 1615} {"train_loss": -6.027932167053223, "global_step": 67851, "epoch": 1615} {"train_loss": -5.925742149353027, "global_step": 67852, "epoch": 1615} {"train_loss": -5.87489128112793, "global_step": 67853, "epoch": 1615} {"train_loss": -6.0404744148254395, "global_step": 67854, "epoch": 1615} {"train_loss": -6.00471830368042, "global_step": 67855, "epoch": 1615} {"train_loss": -5.952658176422119, "global_step": 67856, "epoch": 1615} {"train_loss": -5.98640251159668, "global_step": 67857, "epoch": 1615} {"train_loss": -6.021888732910156, "global_step": 67858, "epoch": 1615} {"train_loss": -5.8700056076049805, "global_step": 67859, "epoch": 1615} {"train_loss": -6.0229716300964355, "global_step": 67860, "epoch": 1615} {"train_loss": -6.046281814575195, "global_step": 67861, "epoch": 1615} {"train_loss": -5.94172477722168, "global_step": 67862, "epoch": 1615} {"train_loss": -6.087763786315918, "global_step": 67863, "epoch": 1615} {"train_loss": -6.053777694702148, "global_step": 67864, "epoch": 1615} {"train_loss": -5.9995903968811035, "global_step": 67865, "epoch": 1615} {"train_loss": -5.9750776290893555, "global_step": 67866, "epoch": 1615} {"train_loss": -6.012126445770264, "global_step": 67867, "epoch": 1615} {"train_loss": -5.750480651855469, "global_step": 67868, "epoch": 1615} {"train_loss": -5.978057861328125, "global_step": 67869, "epoch": 1615} {"train_loss": -5.943872928619385, "global_step": 67870, "epoch": 1615} {"train_loss": -5.997154133660453, "global_step": 67871, "epoch": 1615, "val_loss": 61536.7734375} {"train_loss": -5.994668960571289, "global_step": 67872, "epoch": 1616} {"train_loss": -5.8911614418029785, "global_step": 67873, "epoch": 1616} {"train_loss": -5.952178001403809, "global_step": 67874, "epoch": 1616} {"train_loss": -6.0291242599487305, "global_step": 67875, "epoch": 1616} {"train_loss": -5.766022682189941, "global_step": 67876, "epoch": 1616} {"train_loss": -5.964495658874512, "global_step": 67877, "epoch": 1616} {"train_loss": -5.933890342712402, "global_step": 67878, "epoch": 1616} {"train_loss": -5.910675525665283, "global_step": 67879, "epoch": 1616} {"train_loss": -6.067737102508545, "global_step": 67880, "epoch": 1616} {"train_loss": -5.8593878746032715, "global_step": 67881, "epoch": 1616} {"train_loss": -6.01153564453125, "global_step": 67882, "epoch": 1616} {"train_loss": -6.066329002380371, "global_step": 67883, "epoch": 1616} {"train_loss": -6.1031084060668945, "global_step": 67884, "epoch": 1616} {"train_loss": -5.960899353027344, "global_step": 67885, "epoch": 1616} {"train_loss": -5.958433151245117, "global_step": 67886, "epoch": 1616} {"train_loss": -5.9961442947387695, "global_step": 67887, "epoch": 1616} {"train_loss": -5.9372239112854, "global_step": 67888, "epoch": 1616} {"train_loss": -5.9181904792785645, "global_step": 67889, "epoch": 1616} {"train_loss": -6.0345916748046875, "global_step": 67890, "epoch": 1616} {"train_loss": -6.0486297607421875, "global_step": 67891, "epoch": 1616} {"train_loss": -5.9863786697387695, "global_step": 67892, "epoch": 1616} {"train_loss": -5.9762067794799805, "global_step": 67893, "epoch": 1616} {"train_loss": -5.99202823638916, "global_step": 67894, "epoch": 1616} {"train_loss": -6.081465721130371, "global_step": 67895, "epoch": 1616} {"train_loss": -5.996598243713379, "global_step": 67896, "epoch": 1616} {"train_loss": -6.001964569091797, "global_step": 67897, "epoch": 1616} {"train_loss": -6.048542022705078, "global_step": 67898, "epoch": 1616} {"train_loss": -6.024604797363281, "global_step": 67899, "epoch": 1616} {"train_loss": -6.0102386474609375, "global_step": 67900, "epoch": 1616} {"train_loss": -5.986136436462402, "global_step": 67901, "epoch": 1616} {"train_loss": -6.001331329345703, "global_step": 67902, "epoch": 1616} {"train_loss": -6.132749557495117, "global_step": 67903, "epoch": 1616} {"train_loss": -5.997235298156738, "global_step": 67904, "epoch": 1616} {"train_loss": -5.983587265014648, "global_step": 67905, "epoch": 1616} {"train_loss": -6.093378067016602, "global_step": 67906, "epoch": 1616} {"train_loss": -5.987668514251709, "global_step": 67907, "epoch": 1616} {"train_loss": -5.961554527282715, "global_step": 67908, "epoch": 1616} {"train_loss": -5.981083869934082, "global_step": 67909, "epoch": 1616} {"train_loss": -5.95266056060791, "global_step": 67910, "epoch": 1616} {"train_loss": -5.917560577392578, "global_step": 67911, "epoch": 1616} {"train_loss": -6.001567363739014, "global_step": 67912, "epoch": 1616} {"train_loss": -5.987750348590669, "global_step": 67913, "epoch": 1616, "val_loss": 61626.25} {"train_loss": -5.9146728515625, "global_step": 67914, "epoch": 1617} {"train_loss": -5.96837043762207, "global_step": 67915, "epoch": 1617} {"train_loss": -5.9881415367126465, "global_step": 67916, "epoch": 1617} {"train_loss": -5.834219455718994, "global_step": 67917, "epoch": 1617} {"train_loss": -6.074521064758301, "global_step": 67918, "epoch": 1617} {"train_loss": -6.105731964111328, "global_step": 67919, "epoch": 1617} {"train_loss": -6.015419006347656, "global_step": 67920, "epoch": 1617} {"train_loss": -5.959470748901367, "global_step": 67921, "epoch": 1617} {"train_loss": -5.994864463806152, "global_step": 67922, "epoch": 1617} {"train_loss": -5.97978401184082, "global_step": 67923, "epoch": 1617} {"train_loss": -5.954467296600342, "global_step": 67924, "epoch": 1617} {"train_loss": -6.109434127807617, "global_step": 67925, "epoch": 1617} {"train_loss": -6.018190383911133, "global_step": 67926, "epoch": 1617} {"train_loss": -6.017061233520508, "global_step": 67927, "epoch": 1617} {"train_loss": -5.844844818115234, "global_step": 67928, "epoch": 1617} {"train_loss": -5.981876373291016, "global_step": 67929, "epoch": 1617} {"train_loss": -5.952420234680176, "global_step": 67930, "epoch": 1617} {"train_loss": -6.0433502197265625, "global_step": 67931, "epoch": 1617} {"train_loss": -6.008697032928467, "global_step": 67932, "epoch": 1617} {"train_loss": -6.00745964050293, "global_step": 67933, "epoch": 1617} {"train_loss": -5.963840961456299, "global_step": 67934, "epoch": 1617} {"train_loss": -5.891059875488281, "global_step": 67935, "epoch": 1617} {"train_loss": -5.987221717834473, "global_step": 67936, "epoch": 1617} {"train_loss": -5.979382514953613, "global_step": 67937, "epoch": 1617} {"train_loss": -5.946869850158691, "global_step": 67938, "epoch": 1617} {"train_loss": -6.017197132110596, "global_step": 67939, "epoch": 1617} {"train_loss": -5.901555061340332, "global_step": 67940, "epoch": 1617} {"train_loss": -6.032919883728027, "global_step": 67941, "epoch": 1617} {"train_loss": -5.990538597106934, "global_step": 67942, "epoch": 1617} {"train_loss": -6.151235580444336, "global_step": 67943, "epoch": 1617} {"train_loss": -5.975724220275879, "global_step": 67944, "epoch": 1617} {"train_loss": -6.0658860206604, "global_step": 67945, "epoch": 1617} {"train_loss": -5.990082740783691, "global_step": 67946, "epoch": 1617} {"train_loss": -6.084118843078613, "global_step": 67947, "epoch": 1617} {"train_loss": -5.962094783782959, "global_step": 67948, "epoch": 1617} {"train_loss": -6.148168563842773, "global_step": 67949, "epoch": 1617} {"train_loss": -6.068024635314941, "global_step": 67950, "epoch": 1617} {"train_loss": -5.994590759277344, "global_step": 67951, "epoch": 1617} {"train_loss": -6.004705429077148, "global_step": 67952, "epoch": 1617} {"train_loss": -6.058103084564209, "global_step": 67953, "epoch": 1617} {"train_loss": -5.950136184692383, "global_step": 67954, "epoch": 1617} {"train_loss": -5.998562131609235, "global_step": 67955, "epoch": 1617, "val_loss": 61791.41796875} {"train_loss": -6.014545440673828, "global_step": 67956, "epoch": 1618} {"train_loss": -5.997636795043945, "global_step": 67957, "epoch": 1618} {"train_loss": -6.145724296569824, "global_step": 67958, "epoch": 1618} {"train_loss": -5.97228479385376, "global_step": 67959, "epoch": 1618} {"train_loss": -5.967315673828125, "global_step": 67960, "epoch": 1618} {"train_loss": -5.98915433883667, "global_step": 67961, "epoch": 1618} {"train_loss": -6.004874229431152, "global_step": 67962, "epoch": 1618} {"train_loss": -5.940758228302002, "global_step": 67963, "epoch": 1618} {"train_loss": -5.97078800201416, "global_step": 67964, "epoch": 1618} {"train_loss": -6.037785530090332, "global_step": 67965, "epoch": 1618} {"train_loss": -5.960949897766113, "global_step": 67966, "epoch": 1618} {"train_loss": -5.982365608215332, "global_step": 67967, "epoch": 1618} {"train_loss": -5.993043899536133, "global_step": 67968, "epoch": 1618} {"train_loss": -5.9722418785095215, "global_step": 67969, "epoch": 1618} {"train_loss": -6.017509460449219, "global_step": 67970, "epoch": 1618} {"train_loss": -6.0344719886779785, "global_step": 67971, "epoch": 1618} {"train_loss": -5.934802055358887, "global_step": 67972, "epoch": 1618} {"train_loss": -6.120936393737793, "global_step": 67973, "epoch": 1618} {"train_loss": -6.023687839508057, "global_step": 67974, "epoch": 1618} {"train_loss": -5.995932579040527, "global_step": 67975, "epoch": 1618} {"train_loss": -6.052280902862549, "global_step": 67976, "epoch": 1618} {"train_loss": -5.927871227264404, "global_step": 67977, "epoch": 1618} {"train_loss": -5.829599380493164, "global_step": 67978, "epoch": 1618} {"train_loss": -5.9174041748046875, "global_step": 67979, "epoch": 1618} {"train_loss": -5.968686580657959, "global_step": 67980, "epoch": 1618} {"train_loss": -5.90730094909668, "global_step": 67981, "epoch": 1618} {"train_loss": -5.936171531677246, "global_step": 67982, "epoch": 1618} {"train_loss": -5.991937160491943, "global_step": 67983, "epoch": 1618} {"train_loss": -5.954822540283203, "global_step": 67984, "epoch": 1618} {"train_loss": -5.959852695465088, "global_step": 67985, "epoch": 1618} {"train_loss": -5.935884475708008, "global_step": 67986, "epoch": 1618} {"train_loss": -6.050177574157715, "global_step": 67987, "epoch": 1618} {"train_loss": -5.995652675628662, "global_step": 67988, "epoch": 1618} {"train_loss": -5.987195014953613, "global_step": 67989, "epoch": 1618} {"train_loss": -5.980354309082031, "global_step": 67990, "epoch": 1618} {"train_loss": -5.968380928039551, "global_step": 67991, "epoch": 1618} {"train_loss": -5.965771675109863, "global_step": 67992, "epoch": 1618} {"train_loss": -6.010146141052246, "global_step": 67993, "epoch": 1618} {"train_loss": -5.978504180908203, "global_step": 67994, "epoch": 1618} {"train_loss": -5.97419548034668, "global_step": 67995, "epoch": 1618} {"train_loss": -6.11078405380249, "global_step": 67996, "epoch": 1618} {"train_loss": -5.988652899151757, "global_step": 67997, "epoch": 1618, "val_loss": 61450.7890625} {"train_loss": -6.124670505523682, "global_step": 67998, "epoch": 1619} {"train_loss": -5.975368976593018, "global_step": 67999, "epoch": 1619} {"train_loss": -6.002968788146973, "global_step": 68000, "epoch": 1619} {"train_loss": -5.979517936706543, "global_step": 68001, "epoch": 1619} {"train_loss": -5.96511173248291, "global_step": 68002, "epoch": 1619} {"train_loss": -6.151444911956787, "global_step": 68003, "epoch": 1619} {"train_loss": -6.099733829498291, "global_step": 68004, "epoch": 1619} {"train_loss": -6.020249843597412, "global_step": 68005, "epoch": 1619} {"train_loss": -5.872920036315918, "global_step": 68006, "epoch": 1619} {"train_loss": -6.0879364013671875, "global_step": 68007, "epoch": 1619} {"train_loss": -5.986569404602051, "global_step": 68008, "epoch": 1619} {"train_loss": -6.122670650482178, "global_step": 68009, "epoch": 1619} {"train_loss": -5.974277973175049, "global_step": 68010, "epoch": 1619} {"train_loss": -5.957388877868652, "global_step": 68011, "epoch": 1619} {"train_loss": -6.029331207275391, "global_step": 68012, "epoch": 1619} {"train_loss": -5.938750267028809, "global_step": 68013, "epoch": 1619} {"train_loss": -5.99423885345459, "global_step": 68014, "epoch": 1619} {"train_loss": -5.997097015380859, "global_step": 68015, "epoch": 1619} {"train_loss": -6.036763668060303, "global_step": 68016, "epoch": 1619} {"train_loss": -6.06387996673584, "global_step": 68017, "epoch": 1619} {"train_loss": -6.0011396408081055, "global_step": 68018, "epoch": 1619} {"train_loss": -5.9414963722229, "global_step": 68019, "epoch": 1619} {"train_loss": -5.966479301452637, "global_step": 68020, "epoch": 1619} {"train_loss": -6.112927436828613, "global_step": 68021, "epoch": 1619} {"train_loss": -5.96494722366333, "global_step": 68022, "epoch": 1619} {"train_loss": -5.900965690612793, "global_step": 68023, "epoch": 1619} {"train_loss": -6.010627269744873, "global_step": 68024, "epoch": 1619} {"train_loss": -5.907108306884766, "global_step": 68025, "epoch": 1619} {"train_loss": -6.067935466766357, "global_step": 68026, "epoch": 1619} {"train_loss": -5.907836437225342, "global_step": 68027, "epoch": 1619} {"train_loss": -5.968499183654785, "global_step": 68028, "epoch": 1619} {"train_loss": -6.058108329772949, "global_step": 68029, "epoch": 1619} {"train_loss": -6.007551193237305, "global_step": 68030, "epoch": 1619} {"train_loss": -6.083408832550049, "global_step": 68031, "epoch": 1619} {"train_loss": -5.914802551269531, "global_step": 68032, "epoch": 1619} {"train_loss": -5.978159427642822, "global_step": 68033, "epoch": 1619} {"train_loss": -6.022225379943848, "global_step": 68034, "epoch": 1619} {"train_loss": -6.086379051208496, "global_step": 68035, "epoch": 1619} {"train_loss": -6.00115966796875, "global_step": 68036, "epoch": 1619} {"train_loss": -5.850368022918701, "global_step": 68037, "epoch": 1619} {"train_loss": -6.135110855102539, "global_step": 68038, "epoch": 1619} {"train_loss": -6.006379388627552, "global_step": 68039, "epoch": 1619, "val_loss": 61553.953125} {"train_loss": -5.985880374908447, "global_step": 68040, "epoch": 1620} {"train_loss": -6.1211090087890625, "global_step": 68041, "epoch": 1620} {"train_loss": -6.076059341430664, "global_step": 68042, "epoch": 1620} {"train_loss": -5.918825149536133, "global_step": 68043, "epoch": 1620} {"train_loss": -5.986124038696289, "global_step": 68044, "epoch": 1620} {"train_loss": -6.034082412719727, "global_step": 68045, "epoch": 1620} {"train_loss": -5.969865798950195, "global_step": 68046, "epoch": 1620} {"train_loss": -5.962343692779541, "global_step": 68047, "epoch": 1620} {"train_loss": -6.03917121887207, "global_step": 68048, "epoch": 1620} {"train_loss": -6.0605974197387695, "global_step": 68049, "epoch": 1620} {"train_loss": -5.904623031616211, "global_step": 68050, "epoch": 1620} {"train_loss": -6.042198181152344, "global_step": 68051, "epoch": 1620} {"train_loss": -5.990827560424805, "global_step": 68052, "epoch": 1620} {"train_loss": -6.088812351226807, "global_step": 68053, "epoch": 1620} {"train_loss": -6.050295829772949, "global_step": 68054, "epoch": 1620} {"train_loss": -5.934996128082275, "global_step": 68055, "epoch": 1620} {"train_loss": -5.9197282791137695, "global_step": 68056, "epoch": 1620} {"train_loss": -5.959576606750488, "global_step": 68057, "epoch": 1620} {"train_loss": -5.983761310577393, "global_step": 68058, "epoch": 1620} {"train_loss": -5.953304290771484, "global_step": 68059, "epoch": 1620} {"train_loss": -6.079643726348877, "global_step": 68060, "epoch": 1620} {"train_loss": -6.004386901855469, "global_step": 68061, "epoch": 1620} {"train_loss": -6.102260589599609, "global_step": 68062, "epoch": 1620} {"train_loss": -6.065883636474609, "global_step": 68063, "epoch": 1620} {"train_loss": -5.9926042556762695, "global_step": 68064, "epoch": 1620} {"train_loss": -5.946099281311035, "global_step": 68065, "epoch": 1620} {"train_loss": -5.99628210067749, "global_step": 68066, "epoch": 1620} {"train_loss": -5.986623764038086, "global_step": 68067, "epoch": 1620} {"train_loss": -5.973242282867432, "global_step": 68068, "epoch": 1620} {"train_loss": -5.963315963745117, "global_step": 68069, "epoch": 1620} {"train_loss": -6.133933067321777, "global_step": 68070, "epoch": 1620} {"train_loss": -6.154447078704834, "global_step": 68071, "epoch": 1620} {"train_loss": -5.9695539474487305, "global_step": 68072, "epoch": 1620} {"train_loss": -6.03187370300293, "global_step": 68073, "epoch": 1620} {"train_loss": -5.9922075271606445, "global_step": 68074, "epoch": 1620} {"train_loss": -5.9514594078063965, "global_step": 68075, "epoch": 1620} {"train_loss": -6.023161888122559, "global_step": 68076, "epoch": 1620} {"train_loss": -6.031062126159668, "global_step": 68077, "epoch": 1620} {"train_loss": -6.086385726928711, "global_step": 68078, "epoch": 1620} {"train_loss": -6.045033931732178, "global_step": 68079, "epoch": 1620} {"train_loss": -5.918966293334961, "global_step": 68080, "epoch": 1620} {"train_loss": -6.010855288732619, "global_step": 68081, "epoch": 1620, "val_loss": 61768.984375} {"train_loss": -5.916971206665039, "global_step": 68082, "epoch": 1621} {"train_loss": -5.793801307678223, "global_step": 68083, "epoch": 1621} {"train_loss": -6.105466365814209, "global_step": 68084, "epoch": 1621} {"train_loss": -5.8825364112854, "global_step": 68085, "epoch": 1621} {"train_loss": -5.942075729370117, "global_step": 68086, "epoch": 1621} {"train_loss": -5.9745378494262695, "global_step": 68087, "epoch": 1621} {"train_loss": -5.9667134284973145, "global_step": 68088, "epoch": 1621} {"train_loss": -5.9371747970581055, "global_step": 68089, "epoch": 1621} {"train_loss": -5.967885971069336, "global_step": 68090, "epoch": 1621} {"train_loss": -5.924793243408203, "global_step": 68091, "epoch": 1621} {"train_loss": -5.908127784729004, "global_step": 68092, "epoch": 1621} {"train_loss": -6.000092506408691, "global_step": 68093, "epoch": 1621} {"train_loss": -6.13100528717041, "global_step": 68094, "epoch": 1621} {"train_loss": -5.897216796875, "global_step": 68095, "epoch": 1621} {"train_loss": -6.0716166496276855, "global_step": 68096, "epoch": 1621} {"train_loss": -5.941967964172363, "global_step": 68097, "epoch": 1621} {"train_loss": -6.068830966949463, "global_step": 68098, "epoch": 1621} {"train_loss": -5.953891754150391, "global_step": 68099, "epoch": 1621} {"train_loss": -6.073668479919434, "global_step": 68100, "epoch": 1621} {"train_loss": -6.074831962585449, "global_step": 68101, "epoch": 1621} {"train_loss": -5.971364498138428, "global_step": 68102, "epoch": 1621} {"train_loss": -5.932343482971191, "global_step": 68103, "epoch": 1621} {"train_loss": -6.0671067237854, "global_step": 68104, "epoch": 1621} {"train_loss": -5.909149169921875, "global_step": 68105, "epoch": 1621} {"train_loss": -5.909306049346924, "global_step": 68106, "epoch": 1621} {"train_loss": -6.012681484222412, "global_step": 68107, "epoch": 1621} {"train_loss": -5.962381839752197, "global_step": 68108, "epoch": 1621} {"train_loss": -6.05154275894165, "global_step": 68109, "epoch": 1621} {"train_loss": -6.065954208374023, "global_step": 68110, "epoch": 1621} {"train_loss": -5.967803001403809, "global_step": 68111, "epoch": 1621} {"train_loss": -5.918426036834717, "global_step": 68112, "epoch": 1621} {"train_loss": -5.928676605224609, "global_step": 68113, "epoch": 1621} {"train_loss": -5.931535720825195, "global_step": 68114, "epoch": 1621} {"train_loss": -6.049552917480469, "global_step": 68115, "epoch": 1621} {"train_loss": -5.8991851806640625, "global_step": 68116, "epoch": 1621} {"train_loss": -5.999051094055176, "global_step": 68117, "epoch": 1621} {"train_loss": -5.913159370422363, "global_step": 68118, "epoch": 1621} {"train_loss": -5.897668838500977, "global_step": 68119, "epoch": 1621} {"train_loss": -5.89555025100708, "global_step": 68120, "epoch": 1621} {"train_loss": -5.908437728881836, "global_step": 68121, "epoch": 1621} {"train_loss": -5.906642436981201, "global_step": 68122, "epoch": 1621} {"train_loss": -5.968590520677113, "global_step": 68123, "epoch": 1621, "val_loss": 61807.4453125} {"train_loss": -5.99536657333374, "global_step": 68124, "epoch": 1622} {"train_loss": -6.002438545227051, "global_step": 68125, "epoch": 1622} {"train_loss": -5.971983909606934, "global_step": 68126, "epoch": 1622} {"train_loss": -5.862596035003662, "global_step": 68127, "epoch": 1622} {"train_loss": -5.964176177978516, "global_step": 68128, "epoch": 1622} {"train_loss": -5.947780132293701, "global_step": 68129, "epoch": 1622} {"train_loss": -6.033722877502441, "global_step": 68130, "epoch": 1622} {"train_loss": -5.978662967681885, "global_step": 68131, "epoch": 1622} {"train_loss": -6.000908374786377, "global_step": 68132, "epoch": 1622} {"train_loss": -6.002850532531738, "global_step": 68133, "epoch": 1622} {"train_loss": -5.871514320373535, "global_step": 68134, "epoch": 1622} {"train_loss": -5.9008941650390625, "global_step": 68135, "epoch": 1622} {"train_loss": -6.020242691040039, "global_step": 68136, "epoch": 1622} {"train_loss": -6.010049819946289, "global_step": 68137, "epoch": 1622} {"train_loss": -6.009274959564209, "global_step": 68138, "epoch": 1622} {"train_loss": -6.014962196350098, "global_step": 68139, "epoch": 1622} {"train_loss": -6.027205467224121, "global_step": 68140, "epoch": 1622} {"train_loss": -5.894896507263184, "global_step": 68141, "epoch": 1622} {"train_loss": -5.914777755737305, "global_step": 68142, "epoch": 1622} {"train_loss": -5.992895603179932, "global_step": 68143, "epoch": 1622} {"train_loss": -5.9655866622924805, "global_step": 68144, "epoch": 1622} {"train_loss": -5.929553985595703, "global_step": 68145, "epoch": 1622} {"train_loss": -5.991026878356934, "global_step": 68146, "epoch": 1622} {"train_loss": -5.98615026473999, "global_step": 68147, "epoch": 1622} {"train_loss": -5.934733867645264, "global_step": 68148, "epoch": 1622} {"train_loss": -6.071170330047607, "global_step": 68149, "epoch": 1622} {"train_loss": -6.018516540527344, "global_step": 68150, "epoch": 1622} {"train_loss": -6.028847694396973, "global_step": 68151, "epoch": 1622} {"train_loss": -5.989902496337891, "global_step": 68152, "epoch": 1622} {"train_loss": -5.961877346038818, "global_step": 68153, "epoch": 1622} {"train_loss": -6.0222578048706055, "global_step": 68154, "epoch": 1622} {"train_loss": -5.974294662475586, "global_step": 68155, "epoch": 1622} {"train_loss": -6.003467559814453, "global_step": 68156, "epoch": 1622} {"train_loss": -5.977402687072754, "global_step": 68157, "epoch": 1622} {"train_loss": -5.92482852935791, "global_step": 68158, "epoch": 1622} {"train_loss": -5.970458507537842, "global_step": 68159, "epoch": 1622} {"train_loss": -5.877594947814941, "global_step": 68160, "epoch": 1622} {"train_loss": -5.87084436416626, "global_step": 68161, "epoch": 1622} {"train_loss": -5.976980686187744, "global_step": 68162, "epoch": 1622} {"train_loss": -5.854763031005859, "global_step": 68163, "epoch": 1622} {"train_loss": -5.852766513824463, "global_step": 68164, "epoch": 1622} {"train_loss": -5.964382750647409, "global_step": 68165, "epoch": 1622, "val_loss": 61520.890625} {"train_loss": -5.9629974365234375, "global_step": 68166, "epoch": 1623} {"train_loss": -6.103384017944336, "global_step": 68167, "epoch": 1623} {"train_loss": -6.019514560699463, "global_step": 68168, "epoch": 1623} {"train_loss": -6.021287441253662, "global_step": 68169, "epoch": 1623} {"train_loss": -6.05143928527832, "global_step": 68170, "epoch": 1623} {"train_loss": -5.958227634429932, "global_step": 68171, "epoch": 1623} {"train_loss": -5.992954254150391, "global_step": 68172, "epoch": 1623} {"train_loss": -6.002890586853027, "global_step": 68173, "epoch": 1623} {"train_loss": -6.007890701293945, "global_step": 68174, "epoch": 1623} {"train_loss": -5.969701766967773, "global_step": 68175, "epoch": 1623} {"train_loss": -6.104952812194824, "global_step": 68176, "epoch": 1623} {"train_loss": -5.971677780151367, "global_step": 68177, "epoch": 1623} {"train_loss": -6.033332824707031, "global_step": 68178, "epoch": 1623} {"train_loss": -5.980123043060303, "global_step": 68179, "epoch": 1623} {"train_loss": -5.901607513427734, "global_step": 68180, "epoch": 1623} {"train_loss": -6.019628524780273, "global_step": 68181, "epoch": 1623} {"train_loss": -6.041403770446777, "global_step": 68182, "epoch": 1623} {"train_loss": -6.039409637451172, "global_step": 68183, "epoch": 1623} {"train_loss": -6.0904645919799805, "global_step": 68184, "epoch": 1623} {"train_loss": -5.827131271362305, "global_step": 68185, "epoch": 1623} {"train_loss": -5.930815696716309, "global_step": 68186, "epoch": 1623} {"train_loss": -6.018095970153809, "global_step": 68187, "epoch": 1623} {"train_loss": -5.911770820617676, "global_step": 68188, "epoch": 1623} {"train_loss": -5.896464824676514, "global_step": 68189, "epoch": 1623} {"train_loss": -5.971088409423828, "global_step": 68190, "epoch": 1623} {"train_loss": -5.91391658782959, "global_step": 68191, "epoch": 1623} {"train_loss": -5.996356964111328, "global_step": 68192, "epoch": 1623} {"train_loss": -5.981734752655029, "global_step": 68193, "epoch": 1623} {"train_loss": -6.025590419769287, "global_step": 68194, "epoch": 1623} {"train_loss": -6.0589599609375, "global_step": 68195, "epoch": 1623} {"train_loss": -6.0461883544921875, "global_step": 68196, "epoch": 1623} {"train_loss": -6.104493141174316, "global_step": 68197, "epoch": 1623} {"train_loss": -6.067975997924805, "global_step": 68198, "epoch": 1623} {"train_loss": -5.856738090515137, "global_step": 68199, "epoch": 1623} {"train_loss": -5.887081623077393, "global_step": 68200, "epoch": 1623} {"train_loss": -6.035801887512207, "global_step": 68201, "epoch": 1623} {"train_loss": -5.977750301361084, "global_step": 68202, "epoch": 1623} {"train_loss": -5.935377597808838, "global_step": 68203, "epoch": 1623} {"train_loss": -6.034782409667969, "global_step": 68204, "epoch": 1623} {"train_loss": -6.005889415740967, "global_step": 68205, "epoch": 1623} {"train_loss": -5.937284469604492, "global_step": 68206, "epoch": 1623} {"train_loss": -5.99355445589338, "global_step": 68207, "epoch": 1623, "val_loss": 61758.2421875} {"train_loss": -6.018430709838867, "global_step": 68208, "epoch": 1624} {"train_loss": -5.9145097732543945, "global_step": 68209, "epoch": 1624} {"train_loss": -6.0219855308532715, "global_step": 68210, "epoch": 1624} {"train_loss": -5.988659858703613, "global_step": 68211, "epoch": 1624} {"train_loss": -6.0207929611206055, "global_step": 68212, "epoch": 1624} {"train_loss": -6.005129814147949, "global_step": 68213, "epoch": 1624} {"train_loss": -6.029671669006348, "global_step": 68214, "epoch": 1624} {"train_loss": -5.968827247619629, "global_step": 68215, "epoch": 1624} {"train_loss": -6.10520601272583, "global_step": 68216, "epoch": 1624} {"train_loss": -6.106832027435303, "global_step": 68217, "epoch": 1624} {"train_loss": -6.003583908081055, "global_step": 68218, "epoch": 1624} {"train_loss": -6.022658348083496, "global_step": 68219, "epoch": 1624} {"train_loss": -5.965962886810303, "global_step": 68220, "epoch": 1624} {"train_loss": -5.919354438781738, "global_step": 68221, "epoch": 1624} {"train_loss": -6.026384353637695, "global_step": 68222, "epoch": 1624} {"train_loss": -5.976415634155273, "global_step": 68223, "epoch": 1624} {"train_loss": -6.054376602172852, "global_step": 68224, "epoch": 1624} {"train_loss": -5.968588829040527, "global_step": 68225, "epoch": 1624} {"train_loss": -6.039096355438232, "global_step": 68226, "epoch": 1624} {"train_loss": -6.081235885620117, "global_step": 68227, "epoch": 1624} {"train_loss": -5.834927558898926, "global_step": 68228, "epoch": 1624} {"train_loss": -6.060994625091553, "global_step": 68229, "epoch": 1624} {"train_loss": -5.8400068283081055, "global_step": 68230, "epoch": 1624} {"train_loss": -5.946335315704346, "global_step": 68231, "epoch": 1624} {"train_loss": -5.97840690612793, "global_step": 68232, "epoch": 1624} {"train_loss": -6.002788543701172, "global_step": 68233, "epoch": 1624} {"train_loss": -5.976259231567383, "global_step": 68234, "epoch": 1624} {"train_loss": -6.101255416870117, "global_step": 68235, "epoch": 1624} {"train_loss": -5.903378963470459, "global_step": 68236, "epoch": 1624} {"train_loss": -5.979859352111816, "global_step": 68237, "epoch": 1624} {"train_loss": -5.891790390014648, "global_step": 68238, "epoch": 1624} {"train_loss": -5.996560096740723, "global_step": 68239, "epoch": 1624} {"train_loss": -5.826516628265381, "global_step": 68240, "epoch": 1624} {"train_loss": -5.964350700378418, "global_step": 68241, "epoch": 1624} {"train_loss": -5.931546688079834, "global_step": 68242, "epoch": 1624} {"train_loss": -5.930745601654053, "global_step": 68243, "epoch": 1624} {"train_loss": -6.010308265686035, "global_step": 68244, "epoch": 1624} {"train_loss": -5.877220630645752, "global_step": 68245, "epoch": 1624} {"train_loss": -6.002715587615967, "global_step": 68246, "epoch": 1624} {"train_loss": -6.052127838134766, "global_step": 68247, "epoch": 1624} {"train_loss": -6.080196857452393, "global_step": 68248, "epoch": 1624} {"train_loss": -5.985597349348522, "global_step": 68249, "epoch": 1624, "val_loss": 61634.17578125} {"train_loss": -6.022459983825684, "global_step": 68250, "epoch": 1625} {"train_loss": -5.8557329177856445, "global_step": 68251, "epoch": 1625} {"train_loss": -6.063022136688232, "global_step": 68252, "epoch": 1625} {"train_loss": -6.101146697998047, "global_step": 68253, "epoch": 1625} {"train_loss": -6.159561634063721, "global_step": 68254, "epoch": 1625} {"train_loss": -6.100590229034424, "global_step": 68255, "epoch": 1625} {"train_loss": -5.965340614318848, "global_step": 68256, "epoch": 1625} {"train_loss": -6.127190113067627, "global_step": 68257, "epoch": 1625} {"train_loss": -6.074647903442383, "global_step": 68258, "epoch": 1625} {"train_loss": -5.954912185668945, "global_step": 68259, "epoch": 1625} {"train_loss": -6.036890983581543, "global_step": 68260, "epoch": 1625} {"train_loss": -6.06364631652832, "global_step": 68261, "epoch": 1625} {"train_loss": -5.822319984436035, "global_step": 68262, "epoch": 1625} {"train_loss": -6.1239333152771, "global_step": 68263, "epoch": 1625} {"train_loss": -6.193686485290527, "global_step": 68264, "epoch": 1625} {"train_loss": -5.945286273956299, "global_step": 68265, "epoch": 1625} {"train_loss": -6.030551910400391, "global_step": 68266, "epoch": 1625} {"train_loss": -5.992430686950684, "global_step": 68267, "epoch": 1625} {"train_loss": -6.082693099975586, "global_step": 68268, "epoch": 1625} {"train_loss": -6.170256614685059, "global_step": 68269, "epoch": 1625} {"train_loss": -6.01460075378418, "global_step": 68270, "epoch": 1625} {"train_loss": -6.0804219245910645, "global_step": 68271, "epoch": 1625} {"train_loss": -5.854579448699951, "global_step": 68272, "epoch": 1625} {"train_loss": -6.012821197509766, "global_step": 68273, "epoch": 1625} {"train_loss": -6.021093368530273, "global_step": 68274, "epoch": 1625} {"train_loss": -6.127260684967041, "global_step": 68275, "epoch": 1625} {"train_loss": -5.968681812286377, "global_step": 68276, "epoch": 1625} {"train_loss": -5.963138103485107, "global_step": 68277, "epoch": 1625} {"train_loss": -5.868464469909668, "global_step": 68278, "epoch": 1625} {"train_loss": -5.923455238342285, "global_step": 68279, "epoch": 1625} {"train_loss": -6.082210540771484, "global_step": 68280, "epoch": 1625} {"train_loss": -6.100394248962402, "global_step": 68281, "epoch": 1625} {"train_loss": -6.069515228271484, "global_step": 68282, "epoch": 1625} {"train_loss": -5.975759983062744, "global_step": 68283, "epoch": 1625} {"train_loss": -5.949717998504639, "global_step": 68284, "epoch": 1625} {"train_loss": -5.981008529663086, "global_step": 68285, "epoch": 1625} {"train_loss": -6.09112548828125, "global_step": 68286, "epoch": 1625} {"train_loss": -6.032831192016602, "global_step": 68287, "epoch": 1625} {"train_loss": -6.050478458404541, "global_step": 68288, "epoch": 1625} {"train_loss": -5.947630882263184, "global_step": 68289, "epoch": 1625} {"train_loss": -5.924410820007324, "global_step": 68290, "epoch": 1625} {"train_loss": -6.020084403810047, "global_step": 68291, "epoch": 1625, "val_loss": 61644.88671875} {"train_loss": -6.030871868133545, "global_step": 68292, "epoch": 1626} {"train_loss": -6.125574111938477, "global_step": 68293, "epoch": 1626} {"train_loss": -6.100610733032227, "global_step": 68294, "epoch": 1626} {"train_loss": -6.128727912902832, "global_step": 68295, "epoch": 1626} {"train_loss": -5.945950508117676, "global_step": 68296, "epoch": 1626} {"train_loss": -5.936516761779785, "global_step": 68297, "epoch": 1626} {"train_loss": -6.0789594650268555, "global_step": 68298, "epoch": 1626} {"train_loss": -5.9445343017578125, "global_step": 68299, "epoch": 1626} {"train_loss": -5.974764347076416, "global_step": 68300, "epoch": 1626} {"train_loss": -5.9547953605651855, "global_step": 68301, "epoch": 1626} {"train_loss": -5.961770057678223, "global_step": 68302, "epoch": 1626} {"train_loss": -6.085969924926758, "global_step": 68303, "epoch": 1626} {"train_loss": -5.956594467163086, "global_step": 68304, "epoch": 1626} {"train_loss": -5.9280829429626465, "global_step": 68305, "epoch": 1626} {"train_loss": -6.085876941680908, "global_step": 68306, "epoch": 1626} {"train_loss": -5.909470081329346, "global_step": 68307, "epoch": 1626} {"train_loss": -5.918628692626953, "global_step": 68308, "epoch": 1626} {"train_loss": -5.905892372131348, "global_step": 68309, "epoch": 1626} {"train_loss": -5.806325912475586, "global_step": 68310, "epoch": 1626} {"train_loss": -5.970852375030518, "global_step": 68311, "epoch": 1626} {"train_loss": -5.902400016784668, "global_step": 68312, "epoch": 1626} {"train_loss": -5.951127052307129, "global_step": 68313, "epoch": 1626} {"train_loss": -5.8717756271362305, "global_step": 68314, "epoch": 1626} {"train_loss": -5.902390003204346, "global_step": 68315, "epoch": 1626} {"train_loss": -5.848213195800781, "global_step": 68316, "epoch": 1626} {"train_loss": -5.77677059173584, "global_step": 68317, "epoch": 1626} {"train_loss": -5.9533610343933105, "global_step": 68318, "epoch": 1626} {"train_loss": -5.754622459411621, "global_step": 68319, "epoch": 1626} {"train_loss": -5.85353946685791, "global_step": 68320, "epoch": 1626} {"train_loss": -5.966168403625488, "global_step": 68321, "epoch": 1626} {"train_loss": -5.968111991882324, "global_step": 68322, "epoch": 1626} {"train_loss": -5.779616355895996, "global_step": 68323, "epoch": 1626} {"train_loss": -5.953813552856445, "global_step": 68324, "epoch": 1626} {"train_loss": -5.918225288391113, "global_step": 68325, "epoch": 1626} {"train_loss": -5.919165134429932, "global_step": 68326, "epoch": 1626} {"train_loss": -6.016042709350586, "global_step": 68327, "epoch": 1626} {"train_loss": -5.8614959716796875, "global_step": 68328, "epoch": 1626} {"train_loss": -5.908514499664307, "global_step": 68329, "epoch": 1626} {"train_loss": -5.954063415527344, "global_step": 68330, "epoch": 1626} {"train_loss": -5.854090690612793, "global_step": 68331, "epoch": 1626} {"train_loss": -5.9468793869018555, "global_step": 68332, "epoch": 1626} {"train_loss": -5.941937230882191, "global_step": 68333, "epoch": 1626, "val_loss": 61614.76953125} {"train_loss": -6.0064287185668945, "global_step": 68334, "epoch": 1627} {"train_loss": -6.019357204437256, "global_step": 68335, "epoch": 1627} {"train_loss": -5.8945183753967285, "global_step": 68336, "epoch": 1627} {"train_loss": -6.006251335144043, "global_step": 68337, "epoch": 1627} {"train_loss": -5.854206562042236, "global_step": 68338, "epoch": 1627} {"train_loss": -5.863101959228516, "global_step": 68339, "epoch": 1627} {"train_loss": -5.968606472015381, "global_step": 68340, "epoch": 1627} {"train_loss": -5.95175838470459, "global_step": 68341, "epoch": 1627} {"train_loss": -6.004214286804199, "global_step": 68342, "epoch": 1627} {"train_loss": -5.935713768005371, "global_step": 68343, "epoch": 1627} {"train_loss": -6.021176815032959, "global_step": 68344, "epoch": 1627} {"train_loss": -5.931299209594727, "global_step": 68345, "epoch": 1627} {"train_loss": -6.055891036987305, "global_step": 68346, "epoch": 1627} {"train_loss": -5.96214485168457, "global_step": 68347, "epoch": 1627} {"train_loss": -6.02506685256958, "global_step": 68348, "epoch": 1627} {"train_loss": -6.09000825881958, "global_step": 68349, "epoch": 1627} {"train_loss": -6.002116680145264, "global_step": 68350, "epoch": 1627} {"train_loss": -5.906866073608398, "global_step": 68351, "epoch": 1627} {"train_loss": -5.997931003570557, "global_step": 68352, "epoch": 1627} {"train_loss": -6.037539005279541, "global_step": 68353, "epoch": 1627} {"train_loss": -6.100508689880371, "global_step": 68354, "epoch": 1627} {"train_loss": -5.9824981689453125, "global_step": 68355, "epoch": 1627} {"train_loss": -6.023741245269775, "global_step": 68356, "epoch": 1627} {"train_loss": -6.003020286560059, "global_step": 68357, "epoch": 1627} {"train_loss": -5.975126266479492, "global_step": 68358, "epoch": 1627} {"train_loss": -6.0684027671813965, "global_step": 68359, "epoch": 1627} {"train_loss": -5.99057149887085, "global_step": 68360, "epoch": 1627} {"train_loss": -5.988437652587891, "global_step": 68361, "epoch": 1627} {"train_loss": -5.982979774475098, "global_step": 68362, "epoch": 1627} {"train_loss": -6.013049125671387, "global_step": 68363, "epoch": 1627} {"train_loss": -6.013005256652832, "global_step": 68364, "epoch": 1627} {"train_loss": -5.98133659362793, "global_step": 68365, "epoch": 1627} {"train_loss": -6.009305953979492, "global_step": 68366, "epoch": 1627} {"train_loss": -6.060401916503906, "global_step": 68367, "epoch": 1627} {"train_loss": -6.1222734451293945, "global_step": 68368, "epoch": 1627} {"train_loss": -5.996466159820557, "global_step": 68369, "epoch": 1627} {"train_loss": -6.1147918701171875, "global_step": 68370, "epoch": 1627} {"train_loss": -6.067831516265869, "global_step": 68371, "epoch": 1627} {"train_loss": -5.909936904907227, "global_step": 68372, "epoch": 1627} {"train_loss": -5.99812126159668, "global_step": 68373, "epoch": 1627} {"train_loss": -6.027276992797852, "global_step": 68374, "epoch": 1627} {"train_loss": -6.000243084771292, "global_step": 68375, "epoch": 1627, "val_loss": 61521.99609375} {"train_loss": -6.044416427612305, "global_step": 68376, "epoch": 1628} {"train_loss": -6.045045852661133, "global_step": 68377, "epoch": 1628} {"train_loss": -5.970274448394775, "global_step": 68378, "epoch": 1628} {"train_loss": -5.932981014251709, "global_step": 68379, "epoch": 1628} {"train_loss": -5.993535041809082, "global_step": 68380, "epoch": 1628} {"train_loss": -6.050804615020752, "global_step": 68381, "epoch": 1628} {"train_loss": -5.925109386444092, "global_step": 68382, "epoch": 1628} {"train_loss": -6.100855827331543, "global_step": 68383, "epoch": 1628} {"train_loss": -5.995793342590332, "global_step": 68384, "epoch": 1628} {"train_loss": -6.019808769226074, "global_step": 68385, "epoch": 1628} {"train_loss": -6.026811599731445, "global_step": 68386, "epoch": 1628} {"train_loss": -5.988194465637207, "global_step": 68387, "epoch": 1628} {"train_loss": -5.951320648193359, "global_step": 68388, "epoch": 1628} {"train_loss": -5.968016147613525, "global_step": 68389, "epoch": 1628} {"train_loss": -5.902678489685059, "global_step": 68390, "epoch": 1628} {"train_loss": -5.967984199523926, "global_step": 68391, "epoch": 1628} {"train_loss": -5.986306667327881, "global_step": 68392, "epoch": 1628} {"train_loss": -5.9241766929626465, "global_step": 68393, "epoch": 1628} {"train_loss": -5.88641357421875, "global_step": 68394, "epoch": 1628} {"train_loss": -6.013402462005615, "global_step": 68395, "epoch": 1628} {"train_loss": -5.999448776245117, "global_step": 68396, "epoch": 1628} {"train_loss": -6.0148420333862305, "global_step": 68397, "epoch": 1628} {"train_loss": -5.998116493225098, "global_step": 68398, "epoch": 1628} {"train_loss": -5.976571559906006, "global_step": 68399, "epoch": 1628} {"train_loss": -5.840384483337402, "global_step": 68400, "epoch": 1628} {"train_loss": -5.9286088943481445, "global_step": 68401, "epoch": 1628} {"train_loss": -6.002975940704346, "global_step": 68402, "epoch": 1628} {"train_loss": -5.982054710388184, "global_step": 68403, "epoch": 1628} {"train_loss": -6.020550727844238, "global_step": 68404, "epoch": 1628} {"train_loss": -6.062910556793213, "global_step": 68405, "epoch": 1628} {"train_loss": -6.067758560180664, "global_step": 68406, "epoch": 1628} {"train_loss": -5.998529434204102, "global_step": 68407, "epoch": 1628} {"train_loss": -6.087406158447266, "global_step": 68408, "epoch": 1628} {"train_loss": -6.031831741333008, "global_step": 68409, "epoch": 1628} {"train_loss": -5.976224422454834, "global_step": 68410, "epoch": 1628} {"train_loss": -5.950600624084473, "global_step": 68411, "epoch": 1628} {"train_loss": -6.073605537414551, "global_step": 68412, "epoch": 1628} {"train_loss": -6.018525123596191, "global_step": 68413, "epoch": 1628} {"train_loss": -6.0038533210754395, "global_step": 68414, "epoch": 1628} {"train_loss": -6.029557704925537, "global_step": 68415, "epoch": 1628} {"train_loss": -5.984023094177246, "global_step": 68416, "epoch": 1628} {"train_loss": -5.996017649060204, "global_step": 68417, "epoch": 1628, "val_loss": 61458.9375} {"train_loss": -5.981266975402832, "global_step": 68418, "epoch": 1629} {"train_loss": -6.062465667724609, "global_step": 68419, "epoch": 1629} {"train_loss": -5.96925163269043, "global_step": 68420, "epoch": 1629} {"train_loss": -6.00856876373291, "global_step": 68421, "epoch": 1629} {"train_loss": -6.017226219177246, "global_step": 68422, "epoch": 1629} {"train_loss": -6.125784873962402, "global_step": 68423, "epoch": 1629} {"train_loss": -6.047393321990967, "global_step": 68424, "epoch": 1629} {"train_loss": -5.972810745239258, "global_step": 68425, "epoch": 1629} {"train_loss": -6.047456741333008, "global_step": 68426, "epoch": 1629} {"train_loss": -6.054726600646973, "global_step": 68427, "epoch": 1629} {"train_loss": -6.0350847244262695, "global_step": 68428, "epoch": 1629} {"train_loss": -6.122776985168457, "global_step": 68429, "epoch": 1629} {"train_loss": -6.0213141441345215, "global_step": 68430, "epoch": 1629} {"train_loss": -5.915925025939941, "global_step": 68431, "epoch": 1629} {"train_loss": -6.075198173522949, "global_step": 68432, "epoch": 1629} {"train_loss": -5.975389003753662, "global_step": 68433, "epoch": 1629} {"train_loss": -5.97788143157959, "global_step": 68434, "epoch": 1629} {"train_loss": -5.872808933258057, "global_step": 68435, "epoch": 1629} {"train_loss": -6.038153648376465, "global_step": 68436, "epoch": 1629} {"train_loss": -6.071024417877197, "global_step": 68437, "epoch": 1629} {"train_loss": -6.048232078552246, "global_step": 68438, "epoch": 1629} {"train_loss": -6.0126495361328125, "global_step": 68439, "epoch": 1629} {"train_loss": -6.054255485534668, "global_step": 68440, "epoch": 1629} {"train_loss": -5.839786529541016, "global_step": 68441, "epoch": 1629} {"train_loss": -5.896327972412109, "global_step": 68442, "epoch": 1629} {"train_loss": -5.9047698974609375, "global_step": 68443, "epoch": 1629} {"train_loss": -6.031260013580322, "global_step": 68444, "epoch": 1629} {"train_loss": -5.997550964355469, "global_step": 68445, "epoch": 1629} {"train_loss": -6.010339260101318, "global_step": 68446, "epoch": 1629} {"train_loss": -6.061709403991699, "global_step": 68447, "epoch": 1629} {"train_loss": -6.046176910400391, "global_step": 68448, "epoch": 1629} {"train_loss": -5.945241928100586, "global_step": 68449, "epoch": 1629} {"train_loss": -6.029135227203369, "global_step": 68450, "epoch": 1629} {"train_loss": -5.903953552246094, "global_step": 68451, "epoch": 1629} {"train_loss": -5.810220718383789, "global_step": 68452, "epoch": 1629} {"train_loss": -6.042734622955322, "global_step": 68453, "epoch": 1629} {"train_loss": -6.002618789672852, "global_step": 68454, "epoch": 1629} {"train_loss": -6.044916152954102, "global_step": 68455, "epoch": 1629} {"train_loss": -6.034524917602539, "global_step": 68456, "epoch": 1629} {"train_loss": -6.0953755378723145, "global_step": 68457, "epoch": 1629} {"train_loss": -5.971818923950195, "global_step": 68458, "epoch": 1629} {"train_loss": -6.0028661886851, "global_step": 68459, "epoch": 1629, "val_loss": 61494.16015625} {"train_loss": -6.019229412078857, "global_step": 68460, "epoch": 1630} {"train_loss": -5.9829206466674805, "global_step": 68461, "epoch": 1630} {"train_loss": -6.142565727233887, "global_step": 68462, "epoch": 1630} {"train_loss": -6.152683734893799, "global_step": 68463, "epoch": 1630} {"train_loss": -6.054316520690918, "global_step": 68464, "epoch": 1630} {"train_loss": -6.082197189331055, "global_step": 68465, "epoch": 1630} {"train_loss": -6.096721649169922, "global_step": 68466, "epoch": 1630} {"train_loss": -6.067663192749023, "global_step": 68467, "epoch": 1630} {"train_loss": -6.085051536560059, "global_step": 68468, "epoch": 1630} {"train_loss": -6.065485954284668, "global_step": 68469, "epoch": 1630} {"train_loss": -6.082574367523193, "global_step": 68470, "epoch": 1630} {"train_loss": -6.016282558441162, "global_step": 68471, "epoch": 1630} {"train_loss": -6.014137268066406, "global_step": 68472, "epoch": 1630} {"train_loss": -6.104231834411621, "global_step": 68473, "epoch": 1630} {"train_loss": -5.896696090698242, "global_step": 68474, "epoch": 1630} {"train_loss": -5.997467994689941, "global_step": 68475, "epoch": 1630} {"train_loss": -5.904067039489746, "global_step": 68476, "epoch": 1630} {"train_loss": -5.992624282836914, "global_step": 68477, "epoch": 1630} {"train_loss": -6.040143013000488, "global_step": 68478, "epoch": 1630} {"train_loss": -5.9255523681640625, "global_step": 68479, "epoch": 1630} {"train_loss": -6.079765319824219, "global_step": 68480, "epoch": 1630} {"train_loss": -5.931302070617676, "global_step": 68481, "epoch": 1630} {"train_loss": -5.974822044372559, "global_step": 68482, "epoch": 1630} {"train_loss": -6.052188873291016, "global_step": 68483, "epoch": 1630} {"train_loss": -5.927657127380371, "global_step": 68484, "epoch": 1630} {"train_loss": -6.0258588790893555, "global_step": 68485, "epoch": 1630} {"train_loss": -5.984847068786621, "global_step": 68486, "epoch": 1630} {"train_loss": -6.088879585266113, "global_step": 68487, "epoch": 1630} {"train_loss": -6.09675407409668, "global_step": 68488, "epoch": 1630} {"train_loss": -6.000700950622559, "global_step": 68489, "epoch": 1630} {"train_loss": -5.981765270233154, "global_step": 68490, "epoch": 1630} {"train_loss": -6.030455589294434, "global_step": 68491, "epoch": 1630} {"train_loss": -6.053033828735352, "global_step": 68492, "epoch": 1630} {"train_loss": -6.0265350341796875, "global_step": 68493, "epoch": 1630} {"train_loss": -5.971527099609375, "global_step": 68494, "epoch": 1630} {"train_loss": -5.997980117797852, "global_step": 68495, "epoch": 1630} {"train_loss": -6.027642250061035, "global_step": 68496, "epoch": 1630} {"train_loss": -6.114352226257324, "global_step": 68497, "epoch": 1630} {"train_loss": -6.021197319030762, "global_step": 68498, "epoch": 1630} {"train_loss": -5.884946823120117, "global_step": 68499, "epoch": 1630} {"train_loss": -6.0156145095825195, "global_step": 68500, "epoch": 1630} {"train_loss": -6.026407082875569, "global_step": 68501, "epoch": 1630, "val_loss": 61526.75} {"train_loss": -6.010390281677246, "global_step": 68502, "epoch": 1631} {"train_loss": -6.046051502227783, "global_step": 68503, "epoch": 1631} {"train_loss": -6.056992530822754, "global_step": 68504, "epoch": 1631} {"train_loss": -5.937814712524414, "global_step": 68505, "epoch": 1631} {"train_loss": -5.884273529052734, "global_step": 68506, "epoch": 1631} {"train_loss": -5.995593070983887, "global_step": 68507, "epoch": 1631} {"train_loss": -6.114730358123779, "global_step": 68508, "epoch": 1631} {"train_loss": -6.085738182067871, "global_step": 68509, "epoch": 1631} {"train_loss": -6.043667316436768, "global_step": 68510, "epoch": 1631} {"train_loss": -5.989563941955566, "global_step": 68511, "epoch": 1631} {"train_loss": -5.977268218994141, "global_step": 68512, "epoch": 1631} {"train_loss": -6.024543762207031, "global_step": 68513, "epoch": 1631} {"train_loss": -6.181698799133301, "global_step": 68514, "epoch": 1631} {"train_loss": -5.987961769104004, "global_step": 68515, "epoch": 1631} {"train_loss": -5.930617809295654, "global_step": 68516, "epoch": 1631} {"train_loss": -6.025022983551025, "global_step": 68517, "epoch": 1631} {"train_loss": -6.085980415344238, "global_step": 68518, "epoch": 1631} {"train_loss": -6.057868957519531, "global_step": 68519, "epoch": 1631} {"train_loss": -6.098238468170166, "global_step": 68520, "epoch": 1631} {"train_loss": -5.9993205070495605, "global_step": 68521, "epoch": 1631} {"train_loss": -6.011813640594482, "global_step": 68522, "epoch": 1631} {"train_loss": -6.012035846710205, "global_step": 68523, "epoch": 1631} {"train_loss": -5.956662178039551, "global_step": 68524, "epoch": 1631} {"train_loss": -6.073273658752441, "global_step": 68525, "epoch": 1631} {"train_loss": -6.0656890869140625, "global_step": 68526, "epoch": 1631} {"train_loss": -6.121762752532959, "global_step": 68527, "epoch": 1631} {"train_loss": -6.094191551208496, "global_step": 68528, "epoch": 1631} {"train_loss": -6.100132942199707, "global_step": 68529, "epoch": 1631} {"train_loss": -6.04142951965332, "global_step": 68530, "epoch": 1631} {"train_loss": -6.078826904296875, "global_step": 68531, "epoch": 1631} {"train_loss": -6.094913005828857, "global_step": 68532, "epoch": 1631} {"train_loss": -6.0955705642700195, "global_step": 68533, "epoch": 1631} {"train_loss": -6.093769550323486, "global_step": 68534, "epoch": 1631} {"train_loss": -6.071516513824463, "global_step": 68535, "epoch": 1631} {"train_loss": -5.996112823486328, "global_step": 68536, "epoch": 1631} {"train_loss": -6.040275573730469, "global_step": 68537, "epoch": 1631} {"train_loss": -6.049033164978027, "global_step": 68538, "epoch": 1631} {"train_loss": -6.04300594329834, "global_step": 68539, "epoch": 1631} {"train_loss": -6.086302280426025, "global_step": 68540, "epoch": 1631} {"train_loss": -6.058248519897461, "global_step": 68541, "epoch": 1631} {"train_loss": -6.066728115081787, "global_step": 68542, "epoch": 1631} {"train_loss": -6.044105802263532, "global_step": 68543, "epoch": 1631, "val_loss": 61689.33203125} {"train_loss": -6.045675277709961, "global_step": 68544, "epoch": 1632} {"train_loss": -5.970225811004639, "global_step": 68545, "epoch": 1632} {"train_loss": -6.085935592651367, "global_step": 68546, "epoch": 1632} {"train_loss": -6.176979064941406, "global_step": 68547, "epoch": 1632} {"train_loss": -5.998265266418457, "global_step": 68548, "epoch": 1632} {"train_loss": -6.004663467407227, "global_step": 68549, "epoch": 1632} {"train_loss": -6.068781852722168, "global_step": 68550, "epoch": 1632} {"train_loss": -5.857174873352051, "global_step": 68551, "epoch": 1632} {"train_loss": -5.983005523681641, "global_step": 68552, "epoch": 1632} {"train_loss": -6.063333988189697, "global_step": 68553, "epoch": 1632} {"train_loss": -6.065389156341553, "global_step": 68554, "epoch": 1632} {"train_loss": -6.0240888595581055, "global_step": 68555, "epoch": 1632} {"train_loss": -5.970672130584717, "global_step": 68556, "epoch": 1632} {"train_loss": -6.008429527282715, "global_step": 68557, "epoch": 1632} {"train_loss": -5.931247234344482, "global_step": 68558, "epoch": 1632} {"train_loss": -5.828085422515869, "global_step": 68559, "epoch": 1632} {"train_loss": -5.998823165893555, "global_step": 68560, "epoch": 1632} {"train_loss": -5.979471206665039, "global_step": 68561, "epoch": 1632} {"train_loss": -5.850348472595215, "global_step": 68562, "epoch": 1632} {"train_loss": -5.947113037109375, "global_step": 68563, "epoch": 1632} {"train_loss": -5.956907749176025, "global_step": 68564, "epoch": 1632} {"train_loss": -5.84797477722168, "global_step": 68565, "epoch": 1632} {"train_loss": -5.977293014526367, "global_step": 68566, "epoch": 1632} {"train_loss": -5.779505729675293, "global_step": 68567, "epoch": 1632} {"train_loss": -5.974947929382324, "global_step": 68568, "epoch": 1632} {"train_loss": -5.679902076721191, "global_step": 68569, "epoch": 1632} {"train_loss": -5.938365936279297, "global_step": 68570, "epoch": 1632} {"train_loss": -5.807075500488281, "global_step": 68571, "epoch": 1632} {"train_loss": -6.085346221923828, "global_step": 68572, "epoch": 1632} {"train_loss": -5.830600738525391, "global_step": 68573, "epoch": 1632} {"train_loss": -5.868564605712891, "global_step": 68574, "epoch": 1632} {"train_loss": -6.025961875915527, "global_step": 68575, "epoch": 1632} {"train_loss": -5.935417175292969, "global_step": 68576, "epoch": 1632} {"train_loss": -5.965956687927246, "global_step": 68577, "epoch": 1632} {"train_loss": -5.868229389190674, "global_step": 68578, "epoch": 1632} {"train_loss": -5.98213005065918, "global_step": 68579, "epoch": 1632} {"train_loss": -5.887201309204102, "global_step": 68580, "epoch": 1632} {"train_loss": -5.842732906341553, "global_step": 68581, "epoch": 1632} {"train_loss": -5.702624320983887, "global_step": 68582, "epoch": 1632} {"train_loss": -5.875199317932129, "global_step": 68583, "epoch": 1632} {"train_loss": -5.931820869445801, "global_step": 68584, "epoch": 1632} {"train_loss": -5.939728112447829, "global_step": 68585, "epoch": 1632, "val_loss": 62030.4140625} {"train_loss": -5.964366436004639, "global_step": 68586, "epoch": 1633} {"train_loss": -5.959680557250977, "global_step": 68587, "epoch": 1633} {"train_loss": -5.929354190826416, "global_step": 68588, "epoch": 1633} {"train_loss": -5.816803932189941, "global_step": 68589, "epoch": 1633} {"train_loss": -5.930434226989746, "global_step": 68590, "epoch": 1633} {"train_loss": -5.941218852996826, "global_step": 68591, "epoch": 1633} {"train_loss": -5.939990520477295, "global_step": 68592, "epoch": 1633} {"train_loss": -5.879471778869629, "global_step": 68593, "epoch": 1633} {"train_loss": -5.881745338439941, "global_step": 68594, "epoch": 1633} {"train_loss": -5.899230003356934, "global_step": 68595, "epoch": 1633} {"train_loss": -6.063114643096924, "global_step": 68596, "epoch": 1633} {"train_loss": -5.936237335205078, "global_step": 68597, "epoch": 1633} {"train_loss": -5.9702467918396, "global_step": 68598, "epoch": 1633} {"train_loss": -6.05485200881958, "global_step": 68599, "epoch": 1633} {"train_loss": -5.928506851196289, "global_step": 68600, "epoch": 1633} {"train_loss": -5.9701642990112305, "global_step": 68601, "epoch": 1633} {"train_loss": -5.996825218200684, "global_step": 68602, "epoch": 1633} {"train_loss": -5.99727725982666, "global_step": 68603, "epoch": 1633} {"train_loss": -6.0282392501831055, "global_step": 68604, "epoch": 1633} {"train_loss": -6.038873195648193, "global_step": 68605, "epoch": 1633} {"train_loss": -6.039852142333984, "global_step": 68606, "epoch": 1633} {"train_loss": -5.974262237548828, "global_step": 68607, "epoch": 1633} {"train_loss": -5.968423366546631, "global_step": 68608, "epoch": 1633} {"train_loss": -5.914585113525391, "global_step": 68609, "epoch": 1633} {"train_loss": -6.037604331970215, "global_step": 68610, "epoch": 1633} {"train_loss": -5.885749816894531, "global_step": 68611, "epoch": 1633} {"train_loss": -6.167823791503906, "global_step": 68612, "epoch": 1633} {"train_loss": -5.956082820892334, "global_step": 68613, "epoch": 1633} {"train_loss": -5.9766130447387695, "global_step": 68614, "epoch": 1633} {"train_loss": -5.986001491546631, "global_step": 68615, "epoch": 1633} {"train_loss": -6.027692794799805, "global_step": 68616, "epoch": 1633} {"train_loss": -5.8865532875061035, "global_step": 68617, "epoch": 1633} {"train_loss": -6.0883660316467285, "global_step": 68618, "epoch": 1633} {"train_loss": -5.997523307800293, "global_step": 68619, "epoch": 1633} {"train_loss": -5.91042423248291, "global_step": 68620, "epoch": 1633} {"train_loss": -6.013718605041504, "global_step": 68621, "epoch": 1633} {"train_loss": -6.013201713562012, "global_step": 68622, "epoch": 1633} {"train_loss": -5.977090835571289, "global_step": 68623, "epoch": 1633} {"train_loss": -6.004955291748047, "global_step": 68624, "epoch": 1633} {"train_loss": -5.905272006988525, "global_step": 68625, "epoch": 1633} {"train_loss": -5.921276092529297, "global_step": 68626, "epoch": 1633} {"train_loss": -5.96931334904262, "global_step": 68627, "epoch": 1633, "val_loss": 61822.8359375} {"train_loss": -5.918938159942627, "global_step": 68628, "epoch": 1634} {"train_loss": -5.99375581741333, "global_step": 68629, "epoch": 1634} {"train_loss": -5.854192733764648, "global_step": 68630, "epoch": 1634} {"train_loss": -5.964545249938965, "global_step": 68631, "epoch": 1634} {"train_loss": -6.02469539642334, "global_step": 68632, "epoch": 1634} {"train_loss": -5.920763969421387, "global_step": 68633, "epoch": 1634} {"train_loss": -6.021195411682129, "global_step": 68634, "epoch": 1634} {"train_loss": -5.845707893371582, "global_step": 68635, "epoch": 1634} {"train_loss": -6.016752243041992, "global_step": 68636, "epoch": 1634} {"train_loss": -5.909226894378662, "global_step": 68637, "epoch": 1634} {"train_loss": -5.91066837310791, "global_step": 68638, "epoch": 1634} {"train_loss": -6.082995414733887, "global_step": 68639, "epoch": 1634} {"train_loss": -6.060708522796631, "global_step": 68640, "epoch": 1634} {"train_loss": -5.899630069732666, "global_step": 68641, "epoch": 1634} {"train_loss": -5.9004011154174805, "global_step": 68642, "epoch": 1634} {"train_loss": -5.89979362487793, "global_step": 68643, "epoch": 1634} {"train_loss": -6.0103936195373535, "global_step": 68644, "epoch": 1634} {"train_loss": -6.011620998382568, "global_step": 68645, "epoch": 1634} {"train_loss": -5.959829330444336, "global_step": 68646, "epoch": 1634} {"train_loss": -6.049943923950195, "global_step": 68647, "epoch": 1634} {"train_loss": -5.972750663757324, "global_step": 68648, "epoch": 1634} {"train_loss": -5.92172908782959, "global_step": 68649, "epoch": 1634} {"train_loss": -5.991872787475586, "global_step": 68650, "epoch": 1634} {"train_loss": -5.983550548553467, "global_step": 68651, "epoch": 1634} {"train_loss": -6.094582557678223, "global_step": 68652, "epoch": 1634} {"train_loss": -5.965723991394043, "global_step": 68653, "epoch": 1634} {"train_loss": -6.036519527435303, "global_step": 68654, "epoch": 1634} {"train_loss": -6.002878189086914, "global_step": 68655, "epoch": 1634} {"train_loss": -5.902758598327637, "global_step": 68656, "epoch": 1634} {"train_loss": -5.9733076095581055, "global_step": 68657, "epoch": 1634} {"train_loss": -5.847211837768555, "global_step": 68658, "epoch": 1634} {"train_loss": -6.034780979156494, "global_step": 68659, "epoch": 1634} {"train_loss": -6.051268100738525, "global_step": 68660, "epoch": 1634} {"train_loss": -5.867203712463379, "global_step": 68661, "epoch": 1634} {"train_loss": -5.979090213775635, "global_step": 68662, "epoch": 1634} {"train_loss": -5.853314399719238, "global_step": 68663, "epoch": 1634} {"train_loss": -6.009435653686523, "global_step": 68664, "epoch": 1634} {"train_loss": -5.945813179016113, "global_step": 68665, "epoch": 1634} {"train_loss": -6.061436653137207, "global_step": 68666, "epoch": 1634} {"train_loss": -6.1313090324401855, "global_step": 68667, "epoch": 1634} {"train_loss": -5.864630699157715, "global_step": 68668, "epoch": 1634} {"train_loss": -5.968883730116344, "global_step": 68669, "epoch": 1634, "val_loss": 61736.46875} {"train_loss": -6.0810651779174805, "global_step": 68670, "epoch": 1635} {"train_loss": -6.014695167541504, "global_step": 68671, "epoch": 1635} {"train_loss": -5.997518539428711, "global_step": 68672, "epoch": 1635} {"train_loss": -6.031115531921387, "global_step": 68673, "epoch": 1635} {"train_loss": -6.083140850067139, "global_step": 68674, "epoch": 1635} {"train_loss": -6.05396842956543, "global_step": 68675, "epoch": 1635} {"train_loss": -6.005452632904053, "global_step": 68676, "epoch": 1635} {"train_loss": -6.039695739746094, "global_step": 68677, "epoch": 1635} {"train_loss": -6.061898231506348, "global_step": 68678, "epoch": 1635} {"train_loss": -5.968624114990234, "global_step": 68679, "epoch": 1635} {"train_loss": -5.96791934967041, "global_step": 68680, "epoch": 1635} {"train_loss": -6.105386734008789, "global_step": 68681, "epoch": 1635} {"train_loss": -6.030801773071289, "global_step": 68682, "epoch": 1635} {"train_loss": -5.982221603393555, "global_step": 68683, "epoch": 1635} {"train_loss": -5.995326519012451, "global_step": 68684, "epoch": 1635} {"train_loss": -6.1349639892578125, "global_step": 68685, "epoch": 1635} {"train_loss": -5.989852428436279, "global_step": 68686, "epoch": 1635} {"train_loss": -6.119757652282715, "global_step": 68687, "epoch": 1635} {"train_loss": -5.905672073364258, "global_step": 68688, "epoch": 1635} {"train_loss": -5.9057841300964355, "global_step": 68689, "epoch": 1635} {"train_loss": -5.899425506591797, "global_step": 68690, "epoch": 1635} {"train_loss": -5.973694801330566, "global_step": 68691, "epoch": 1635} {"train_loss": -5.930019855499268, "global_step": 68692, "epoch": 1635} {"train_loss": -6.008636951446533, "global_step": 68693, "epoch": 1635} {"train_loss": -5.953900337219238, "global_step": 68694, "epoch": 1635} {"train_loss": -5.998705863952637, "global_step": 68695, "epoch": 1635} {"train_loss": -6.032501220703125, "global_step": 68696, "epoch": 1635} {"train_loss": -6.0176100730896, "global_step": 68697, "epoch": 1635} {"train_loss": -6.066679954528809, "global_step": 68698, "epoch": 1635} {"train_loss": -6.083294868469238, "global_step": 68699, "epoch": 1635} {"train_loss": -5.994339942932129, "global_step": 68700, "epoch": 1635} {"train_loss": -6.0760040283203125, "global_step": 68701, "epoch": 1635} {"train_loss": -5.926064491271973, "global_step": 68702, "epoch": 1635} {"train_loss": -6.084043502807617, "global_step": 68703, "epoch": 1635} {"train_loss": -5.934286117553711, "global_step": 68704, "epoch": 1635} {"train_loss": -5.947967052459717, "global_step": 68705, "epoch": 1635} {"train_loss": -6.042786598205566, "global_step": 68706, "epoch": 1635} {"train_loss": -5.9807281494140625, "global_step": 68707, "epoch": 1635} {"train_loss": -5.95677375793457, "global_step": 68708, "epoch": 1635} {"train_loss": -5.965242862701416, "global_step": 68709, "epoch": 1635} {"train_loss": -5.9561004638671875, "global_step": 68710, "epoch": 1635} {"train_loss": -6.007875703629994, "global_step": 68711, "epoch": 1635, "val_loss": 61795.71875} {"train_loss": -6.026865005493164, "global_step": 68712, "epoch": 1636} {"train_loss": -6.210139274597168, "global_step": 68713, "epoch": 1636} {"train_loss": -5.949868202209473, "global_step": 68714, "epoch": 1636} {"train_loss": -6.062298774719238, "global_step": 68715, "epoch": 1636} {"train_loss": -5.983475685119629, "global_step": 68716, "epoch": 1636} {"train_loss": -6.006926536560059, "global_step": 68717, "epoch": 1636} {"train_loss": -6.109931945800781, "global_step": 68718, "epoch": 1636} {"train_loss": -5.885601997375488, "global_step": 68719, "epoch": 1636} {"train_loss": -6.095444679260254, "global_step": 68720, "epoch": 1636} {"train_loss": -5.956719398498535, "global_step": 68721, "epoch": 1636} {"train_loss": -5.946642875671387, "global_step": 68722, "epoch": 1636} {"train_loss": -5.964098930358887, "global_step": 68723, "epoch": 1636} {"train_loss": -5.906032085418701, "global_step": 68724, "epoch": 1636} {"train_loss": -6.123232364654541, "global_step": 68725, "epoch": 1636} {"train_loss": -5.939064025878906, "global_step": 68726, "epoch": 1636} {"train_loss": -5.970355033874512, "global_step": 68727, "epoch": 1636} {"train_loss": -5.982861518859863, "global_step": 68728, "epoch": 1636} {"train_loss": -6.07279109954834, "global_step": 68729, "epoch": 1636} {"train_loss": -6.0021772384643555, "global_step": 68730, "epoch": 1636} {"train_loss": -5.942780494689941, "global_step": 68731, "epoch": 1636} {"train_loss": -6.035433769226074, "global_step": 68732, "epoch": 1636} {"train_loss": -6.038919448852539, "global_step": 68733, "epoch": 1636} {"train_loss": -6.0018720626831055, "global_step": 68734, "epoch": 1636} {"train_loss": -5.940155982971191, "global_step": 68735, "epoch": 1636} {"train_loss": -6.046816349029541, "global_step": 68736, "epoch": 1636} {"train_loss": -6.018279075622559, "global_step": 68737, "epoch": 1636} {"train_loss": -5.957968235015869, "global_step": 68738, "epoch": 1636} {"train_loss": -5.909024238586426, "global_step": 68739, "epoch": 1636} {"train_loss": -6.104034423828125, "global_step": 68740, "epoch": 1636} {"train_loss": -6.048644065856934, "global_step": 68741, "epoch": 1636} {"train_loss": -6.0306220054626465, "global_step": 68742, "epoch": 1636} {"train_loss": -6.015334129333496, "global_step": 68743, "epoch": 1636} {"train_loss": -5.952935218811035, "global_step": 68744, "epoch": 1636} {"train_loss": -6.095643043518066, "global_step": 68745, "epoch": 1636} {"train_loss": -5.991477966308594, "global_step": 68746, "epoch": 1636} {"train_loss": -6.062831878662109, "global_step": 68747, "epoch": 1636} {"train_loss": -6.0446062088012695, "global_step": 68748, "epoch": 1636} {"train_loss": -6.109835147857666, "global_step": 68749, "epoch": 1636} {"train_loss": -5.96873140335083, "global_step": 68750, "epoch": 1636} {"train_loss": -6.006204605102539, "global_step": 68751, "epoch": 1636} {"train_loss": -5.989091396331787, "global_step": 68752, "epoch": 1636} {"train_loss": -6.013892525718326, "global_step": 68753, "epoch": 1636, "val_loss": 61431.92578125} {"train_loss": -6.121020317077637, "global_step": 68754, "epoch": 1637} {"train_loss": -5.93462610244751, "global_step": 68755, "epoch": 1637} {"train_loss": -5.843108177185059, "global_step": 68756, "epoch": 1637} {"train_loss": -6.079885005950928, "global_step": 68757, "epoch": 1637} {"train_loss": -5.985263347625732, "global_step": 68758, "epoch": 1637} {"train_loss": -5.969283103942871, "global_step": 68759, "epoch": 1637} {"train_loss": -6.091261863708496, "global_step": 68760, "epoch": 1637} {"train_loss": -6.026026248931885, "global_step": 68761, "epoch": 1637} {"train_loss": -6.074891090393066, "global_step": 68762, "epoch": 1637} {"train_loss": -6.060741424560547, "global_step": 68763, "epoch": 1637} {"train_loss": -5.974269390106201, "global_step": 68764, "epoch": 1637} {"train_loss": -6.097556114196777, "global_step": 68765, "epoch": 1637} {"train_loss": -5.925629138946533, "global_step": 68766, "epoch": 1637} {"train_loss": -6.06102180480957, "global_step": 68767, "epoch": 1637} {"train_loss": -5.9353227615356445, "global_step": 68768, "epoch": 1637} {"train_loss": -6.101489067077637, "global_step": 68769, "epoch": 1637} {"train_loss": -6.029821872711182, "global_step": 68770, "epoch": 1637} {"train_loss": -6.04050350189209, "global_step": 68771, "epoch": 1637} {"train_loss": -5.943453788757324, "global_step": 68772, "epoch": 1637} {"train_loss": -5.982015609741211, "global_step": 68773, "epoch": 1637} {"train_loss": -6.108321189880371, "global_step": 68774, "epoch": 1637} {"train_loss": -6.063167095184326, "global_step": 68775, "epoch": 1637} {"train_loss": -6.105426788330078, "global_step": 68776, "epoch": 1637} {"train_loss": -5.974124908447266, "global_step": 68777, "epoch": 1637} {"train_loss": -6.11067533493042, "global_step": 68778, "epoch": 1637} {"train_loss": -6.109500885009766, "global_step": 68779, "epoch": 1637} {"train_loss": -6.02553653717041, "global_step": 68780, "epoch": 1637} {"train_loss": -6.038451194763184, "global_step": 68781, "epoch": 1637} {"train_loss": -6.117036819458008, "global_step": 68782, "epoch": 1637} {"train_loss": -6.024245262145996, "global_step": 68783, "epoch": 1637} {"train_loss": -6.050371170043945, "global_step": 68784, "epoch": 1637} {"train_loss": -5.9405198097229, "global_step": 68785, "epoch": 1637} {"train_loss": -6.0171709060668945, "global_step": 68786, "epoch": 1637} {"train_loss": -6.103010654449463, "global_step": 68787, "epoch": 1637} {"train_loss": -5.911943435668945, "global_step": 68788, "epoch": 1637} {"train_loss": -6.114494800567627, "global_step": 68789, "epoch": 1637} {"train_loss": -6.0398783683776855, "global_step": 68790, "epoch": 1637} {"train_loss": -6.041344165802002, "global_step": 68791, "epoch": 1637} {"train_loss": -6.045001029968262, "global_step": 68792, "epoch": 1637} {"train_loss": -6.070350646972656, "global_step": 68793, "epoch": 1637} {"train_loss": -6.036430358886719, "global_step": 68794, "epoch": 1637} {"train_loss": -6.032122986657279, "global_step": 68795, "epoch": 1637, "val_loss": 61642.0390625} {"train_loss": -6.147801399230957, "global_step": 68796, "epoch": 1638} {"train_loss": -6.146262168884277, "global_step": 68797, "epoch": 1638} {"train_loss": -6.03516960144043, "global_step": 68798, "epoch": 1638} {"train_loss": -6.023846626281738, "global_step": 68799, "epoch": 1638} {"train_loss": -6.075817108154297, "global_step": 68800, "epoch": 1638} {"train_loss": -5.97617244720459, "global_step": 68801, "epoch": 1638} {"train_loss": -5.9694929122924805, "global_step": 68802, "epoch": 1638} {"train_loss": -6.026617050170898, "global_step": 68803, "epoch": 1638} {"train_loss": -5.988241672515869, "global_step": 68804, "epoch": 1638} {"train_loss": -5.998687267303467, "global_step": 68805, "epoch": 1638} {"train_loss": -6.12558650970459, "global_step": 68806, "epoch": 1638} {"train_loss": -6.065561294555664, "global_step": 68807, "epoch": 1638} {"train_loss": -6.037055969238281, "global_step": 68808, "epoch": 1638} {"train_loss": -6.106660842895508, "global_step": 68809, "epoch": 1638} {"train_loss": -5.988872528076172, "global_step": 68810, "epoch": 1638} {"train_loss": -6.028292655944824, "global_step": 68811, "epoch": 1638} {"train_loss": -5.975937843322754, "global_step": 68812, "epoch": 1638} {"train_loss": -6.013213157653809, "global_step": 68813, "epoch": 1638} {"train_loss": -5.994022846221924, "global_step": 68814, "epoch": 1638} {"train_loss": -6.011763572692871, "global_step": 68815, "epoch": 1638} {"train_loss": -6.073183059692383, "global_step": 68816, "epoch": 1638} {"train_loss": -6.011878967285156, "global_step": 68817, "epoch": 1638} {"train_loss": -6.077303886413574, "global_step": 68818, "epoch": 1638} {"train_loss": -6.072328090667725, "global_step": 68819, "epoch": 1638} {"train_loss": -6.045947074890137, "global_step": 68820, "epoch": 1638} {"train_loss": -6.086493492126465, "global_step": 68821, "epoch": 1638} {"train_loss": -6.08199405670166, "global_step": 68822, "epoch": 1638} {"train_loss": -6.078768253326416, "global_step": 68823, "epoch": 1638} {"train_loss": -6.026815414428711, "global_step": 68824, "epoch": 1638} {"train_loss": -5.992142200469971, "global_step": 68825, "epoch": 1638} {"train_loss": -6.119275093078613, "global_step": 68826, "epoch": 1638} {"train_loss": -5.932424545288086, "global_step": 68827, "epoch": 1638} {"train_loss": -6.075784683227539, "global_step": 68828, "epoch": 1638} {"train_loss": -6.083580493927002, "global_step": 68829, "epoch": 1638} {"train_loss": -5.992585182189941, "global_step": 68830, "epoch": 1638} {"train_loss": -5.958733558654785, "global_step": 68831, "epoch": 1638} {"train_loss": -6.056588172912598, "global_step": 68832, "epoch": 1638} {"train_loss": -6.093067169189453, "global_step": 68833, "epoch": 1638} {"train_loss": -6.056846618652344, "global_step": 68834, "epoch": 1638} {"train_loss": -6.081591606140137, "global_step": 68835, "epoch": 1638} {"train_loss": -5.956453323364258, "global_step": 68836, "epoch": 1638} {"train_loss": -6.03893796602885, "global_step": 68837, "epoch": 1638, "val_loss": 61549.95703125} {"train_loss": -6.103545188903809, "global_step": 68838, "epoch": 1639} {"train_loss": -6.020345687866211, "global_step": 68839, "epoch": 1639} {"train_loss": -6.071584701538086, "global_step": 68840, "epoch": 1639} {"train_loss": -6.093384265899658, "global_step": 68841, "epoch": 1639} {"train_loss": -6.155537128448486, "global_step": 68842, "epoch": 1639} {"train_loss": -6.052419185638428, "global_step": 68843, "epoch": 1639} {"train_loss": -6.017714500427246, "global_step": 68844, "epoch": 1639} {"train_loss": -6.07185173034668, "global_step": 68845, "epoch": 1639} {"train_loss": -5.869751930236816, "global_step": 68846, "epoch": 1639} {"train_loss": -6.001100063323975, "global_step": 68847, "epoch": 1639} {"train_loss": -6.029792785644531, "global_step": 68848, "epoch": 1639} {"train_loss": -5.955012321472168, "global_step": 68849, "epoch": 1639} {"train_loss": -5.940146446228027, "global_step": 68850, "epoch": 1639} {"train_loss": -6.059499740600586, "global_step": 68851, "epoch": 1639} {"train_loss": -6.037349700927734, "global_step": 68852, "epoch": 1639} {"train_loss": -6.157307147979736, "global_step": 68853, "epoch": 1639} {"train_loss": -5.921380519866943, "global_step": 68854, "epoch": 1639} {"train_loss": -5.995888710021973, "global_step": 68855, "epoch": 1639} {"train_loss": -6.035296440124512, "global_step": 68856, "epoch": 1639} {"train_loss": -5.999773025512695, "global_step": 68857, "epoch": 1639} {"train_loss": -6.047646522521973, "global_step": 68858, "epoch": 1639} {"train_loss": -6.076202869415283, "global_step": 68859, "epoch": 1639} {"train_loss": -6.009226322174072, "global_step": 68860, "epoch": 1639} {"train_loss": -6.115730285644531, "global_step": 68861, "epoch": 1639} {"train_loss": -6.073813438415527, "global_step": 68862, "epoch": 1639} {"train_loss": -6.081037998199463, "global_step": 68863, "epoch": 1639} {"train_loss": -5.989192008972168, "global_step": 68864, "epoch": 1639} {"train_loss": -6.02683687210083, "global_step": 68865, "epoch": 1639} {"train_loss": -6.070496559143066, "global_step": 68866, "epoch": 1639} {"train_loss": -6.080160140991211, "global_step": 68867, "epoch": 1639} {"train_loss": -6.043143272399902, "global_step": 68868, "epoch": 1639} {"train_loss": -6.0893449783325195, "global_step": 68869, "epoch": 1639} {"train_loss": -5.99623441696167, "global_step": 68870, "epoch": 1639} {"train_loss": -6.027743816375732, "global_step": 68871, "epoch": 1639} {"train_loss": -6.004864692687988, "global_step": 68872, "epoch": 1639} {"train_loss": -6.150925636291504, "global_step": 68873, "epoch": 1639} {"train_loss": -5.9355597496032715, "global_step": 68874, "epoch": 1639} {"train_loss": -6.046525478363037, "global_step": 68875, "epoch": 1639} {"train_loss": -5.976187705993652, "global_step": 68876, "epoch": 1639} {"train_loss": -5.966352939605713, "global_step": 68877, "epoch": 1639} {"train_loss": -6.0053253173828125, "global_step": 68878, "epoch": 1639} {"train_loss": -6.035740193866548, "global_step": 68879, "epoch": 1639, "val_loss": 61779.66015625} {"train_loss": -5.898525238037109, "global_step": 68880, "epoch": 1640} {"train_loss": -5.9568586349487305, "global_step": 68881, "epoch": 1640} {"train_loss": -5.976586818695068, "global_step": 68882, "epoch": 1640} {"train_loss": -6.058645725250244, "global_step": 68883, "epoch": 1640} {"train_loss": -6.037919044494629, "global_step": 68884, "epoch": 1640} {"train_loss": -6.1098785400390625, "global_step": 68885, "epoch": 1640} {"train_loss": -6.111321449279785, "global_step": 68886, "epoch": 1640} {"train_loss": -6.17271614074707, "global_step": 68887, "epoch": 1640} {"train_loss": -6.008916854858398, "global_step": 68888, "epoch": 1640} {"train_loss": -5.935117721557617, "global_step": 68889, "epoch": 1640} {"train_loss": -6.033156394958496, "global_step": 68890, "epoch": 1640} {"train_loss": -5.930829048156738, "global_step": 68891, "epoch": 1640} {"train_loss": -6.064618110656738, "global_step": 68892, "epoch": 1640} {"train_loss": -5.834391117095947, "global_step": 68893, "epoch": 1640} {"train_loss": -5.8845930099487305, "global_step": 68894, "epoch": 1640} {"train_loss": -5.9938859939575195, "global_step": 68895, "epoch": 1640} {"train_loss": -6.048782825469971, "global_step": 68896, "epoch": 1640} {"train_loss": -5.9993462562561035, "global_step": 68897, "epoch": 1640} {"train_loss": -5.945276260375977, "global_step": 68898, "epoch": 1640} {"train_loss": -5.940307140350342, "global_step": 68899, "epoch": 1640} {"train_loss": -5.947831630706787, "global_step": 68900, "epoch": 1640} {"train_loss": -5.976569652557373, "global_step": 68901, "epoch": 1640} {"train_loss": -6.082024097442627, "global_step": 68902, "epoch": 1640} {"train_loss": -5.935369491577148, "global_step": 68903, "epoch": 1640} {"train_loss": -5.918698310852051, "global_step": 68904, "epoch": 1640} {"train_loss": -5.949754238128662, "global_step": 68905, "epoch": 1640} {"train_loss": -5.945706844329834, "global_step": 68906, "epoch": 1640} {"train_loss": -6.038540840148926, "global_step": 68907, "epoch": 1640} {"train_loss": -5.93393611907959, "global_step": 68908, "epoch": 1640} {"train_loss": -5.978338241577148, "global_step": 68909, "epoch": 1640} {"train_loss": -6.066411972045898, "global_step": 68910, "epoch": 1640} {"train_loss": -6.072701454162598, "global_step": 68911, "epoch": 1640} {"train_loss": -5.938039302825928, "global_step": 68912, "epoch": 1640} {"train_loss": -6.098171234130859, "global_step": 68913, "epoch": 1640} {"train_loss": -6.128170013427734, "global_step": 68914, "epoch": 1640} {"train_loss": -6.05018424987793, "global_step": 68915, "epoch": 1640} {"train_loss": -5.902758598327637, "global_step": 68916, "epoch": 1640} {"train_loss": -6.020498275756836, "global_step": 68917, "epoch": 1640} {"train_loss": -5.938002109527588, "global_step": 68918, "epoch": 1640} {"train_loss": -6.0145463943481445, "global_step": 68919, "epoch": 1640} {"train_loss": -6.02013635635376, "global_step": 68920, "epoch": 1640} {"train_loss": -5.995939220700945, "global_step": 68921, "epoch": 1640, "val_loss": 61578.43359375} {"train_loss": -6.008889675140381, "global_step": 68922, "epoch": 1641} {"train_loss": -5.9883551597595215, "global_step": 68923, "epoch": 1641} {"train_loss": -6.0568647384643555, "global_step": 68924, "epoch": 1641} {"train_loss": -6.114346027374268, "global_step": 68925, "epoch": 1641} {"train_loss": -6.02362060546875, "global_step": 68926, "epoch": 1641} {"train_loss": -6.059975624084473, "global_step": 68927, "epoch": 1641} {"train_loss": -5.986358165740967, "global_step": 68928, "epoch": 1641} {"train_loss": -6.01200008392334, "global_step": 68929, "epoch": 1641} {"train_loss": -6.077927589416504, "global_step": 68930, "epoch": 1641} {"train_loss": -6.080405235290527, "global_step": 68931, "epoch": 1641} {"train_loss": -6.035614967346191, "global_step": 68932, "epoch": 1641} {"train_loss": -6.066131591796875, "global_step": 68933, "epoch": 1641} {"train_loss": -6.074455261230469, "global_step": 68934, "epoch": 1641} {"train_loss": -6.082009315490723, "global_step": 68935, "epoch": 1641} {"train_loss": -6.078386306762695, "global_step": 68936, "epoch": 1641} {"train_loss": -6.036197662353516, "global_step": 68937, "epoch": 1641} {"train_loss": -6.004347801208496, "global_step": 68938, "epoch": 1641} {"train_loss": -5.941783428192139, "global_step": 68939, "epoch": 1641} {"train_loss": -6.033979892730713, "global_step": 68940, "epoch": 1641} {"train_loss": -6.0384416580200195, "global_step": 68941, "epoch": 1641} {"train_loss": -6.100801944732666, "global_step": 68942, "epoch": 1641} {"train_loss": -5.913802146911621, "global_step": 68943, "epoch": 1641} {"train_loss": -6.010138511657715, "global_step": 68944, "epoch": 1641} {"train_loss": -5.974025726318359, "global_step": 68945, "epoch": 1641} {"train_loss": -5.961102485656738, "global_step": 68946, "epoch": 1641} {"train_loss": -6.033419132232666, "global_step": 68947, "epoch": 1641} {"train_loss": -5.946381092071533, "global_step": 68948, "epoch": 1641} {"train_loss": -5.904972076416016, "global_step": 68949, "epoch": 1641} {"train_loss": -5.929659843444824, "global_step": 68950, "epoch": 1641} {"train_loss": -6.0407867431640625, "global_step": 68951, "epoch": 1641} {"train_loss": -5.858405590057373, "global_step": 68952, "epoch": 1641} {"train_loss": -6.024942874908447, "global_step": 68953, "epoch": 1641} {"train_loss": -5.929833889007568, "global_step": 68954, "epoch": 1641} {"train_loss": -5.993861675262451, "global_step": 68955, "epoch": 1641} {"train_loss": -5.995645999908447, "global_step": 68956, "epoch": 1641} {"train_loss": -6.023186206817627, "global_step": 68957, "epoch": 1641} {"train_loss": -5.984139442443848, "global_step": 68958, "epoch": 1641} {"train_loss": -5.933585166931152, "global_step": 68959, "epoch": 1641} {"train_loss": -6.0540924072265625, "global_step": 68960, "epoch": 1641} {"train_loss": -5.8253326416015625, "global_step": 68961, "epoch": 1641} {"train_loss": -5.941777229309082, "global_step": 68962, "epoch": 1641} {"train_loss": -6.003437450953892, "global_step": 68963, "epoch": 1641, "val_loss": 61543.29296875} {"train_loss": -5.981873989105225, "global_step": 68964, "epoch": 1642} {"train_loss": -5.856067180633545, "global_step": 68965, "epoch": 1642} {"train_loss": -6.058831691741943, "global_step": 68966, "epoch": 1642} {"train_loss": -6.026485919952393, "global_step": 68967, "epoch": 1642} {"train_loss": -5.960928916931152, "global_step": 68968, "epoch": 1642} {"train_loss": -5.978522777557373, "global_step": 68969, "epoch": 1642} {"train_loss": -5.964170455932617, "global_step": 68970, "epoch": 1642} {"train_loss": -5.987932205200195, "global_step": 68971, "epoch": 1642} {"train_loss": -5.946150302886963, "global_step": 68972, "epoch": 1642} {"train_loss": -5.994858264923096, "global_step": 68973, "epoch": 1642} {"train_loss": -5.953126907348633, "global_step": 68974, "epoch": 1642} {"train_loss": -6.004197597503662, "global_step": 68975, "epoch": 1642} {"train_loss": -5.999543190002441, "global_step": 68976, "epoch": 1642} {"train_loss": -6.047477722167969, "global_step": 68977, "epoch": 1642} {"train_loss": -6.060468673706055, "global_step": 68978, "epoch": 1642} {"train_loss": -6.009376049041748, "global_step": 68979, "epoch": 1642} {"train_loss": -6.027714729309082, "global_step": 68980, "epoch": 1642} {"train_loss": -6.020810127258301, "global_step": 68981, "epoch": 1642} {"train_loss": -5.978734493255615, "global_step": 68982, "epoch": 1642} {"train_loss": -6.009664058685303, "global_step": 68983, "epoch": 1642} {"train_loss": -5.940984725952148, "global_step": 68984, "epoch": 1642} {"train_loss": -5.975487232208252, "global_step": 68985, "epoch": 1642} {"train_loss": -6.100492000579834, "global_step": 68986, "epoch": 1642} {"train_loss": -5.986715316772461, "global_step": 68987, "epoch": 1642} {"train_loss": -5.977018356323242, "global_step": 68988, "epoch": 1642} {"train_loss": -6.083827018737793, "global_step": 68989, "epoch": 1642} {"train_loss": -6.058352470397949, "global_step": 68990, "epoch": 1642} {"train_loss": -6.034789562225342, "global_step": 68991, "epoch": 1642} {"train_loss": -6.062638759613037, "global_step": 68992, "epoch": 1642} {"train_loss": -5.999269962310791, "global_step": 68993, "epoch": 1642} {"train_loss": -6.076671123504639, "global_step": 68994, "epoch": 1642} {"train_loss": -5.988293647766113, "global_step": 68995, "epoch": 1642} {"train_loss": -5.867079734802246, "global_step": 68996, "epoch": 1642} {"train_loss": -5.978921890258789, "global_step": 68997, "epoch": 1642} {"train_loss": -6.056475639343262, "global_step": 68998, "epoch": 1642} {"train_loss": -6.000263214111328, "global_step": 68999, "epoch": 1642} {"train_loss": -6.049516201019287, "global_step": 69000, "epoch": 1642} {"train_loss": -5.922281265258789, "global_step": 69001, "epoch": 1642} {"train_loss": -5.987184524536133, "global_step": 69002, "epoch": 1642} {"train_loss": -6.025629997253418, "global_step": 69003, "epoch": 1642} {"train_loss": -5.944486618041992, "global_step": 69004, "epoch": 1642} {"train_loss": -5.998857327869961, "global_step": 69005, "epoch": 1642, "val_loss": 61671.77734375} {"train_loss": -5.986577033996582, "global_step": 69006, "epoch": 1643} {"train_loss": -6.030466079711914, "global_step": 69007, "epoch": 1643} {"train_loss": -5.993615627288818, "global_step": 69008, "epoch": 1643} {"train_loss": -6.10815954208374, "global_step": 69009, "epoch": 1643} {"train_loss": -6.114803314208984, "global_step": 69010, "epoch": 1643} {"train_loss": -6.079510688781738, "global_step": 69011, "epoch": 1643} {"train_loss": -6.013554096221924, "global_step": 69012, "epoch": 1643} {"train_loss": -6.028491973876953, "global_step": 69013, "epoch": 1643} {"train_loss": -6.1082658767700195, "global_step": 69014, "epoch": 1643} {"train_loss": -6.066237926483154, "global_step": 69015, "epoch": 1643} {"train_loss": -6.012680530548096, "global_step": 69016, "epoch": 1643} {"train_loss": -5.991507053375244, "global_step": 69017, "epoch": 1643} {"train_loss": -5.989198684692383, "global_step": 69018, "epoch": 1643} {"train_loss": -6.037162780761719, "global_step": 69019, "epoch": 1643} {"train_loss": -6.076092720031738, "global_step": 69020, "epoch": 1643} {"train_loss": -6.082940101623535, "global_step": 69021, "epoch": 1643} {"train_loss": -6.004400730133057, "global_step": 69022, "epoch": 1643} {"train_loss": -6.09528923034668, "global_step": 69023, "epoch": 1643} {"train_loss": -5.913207054138184, "global_step": 69024, "epoch": 1643} {"train_loss": -6.105493545532227, "global_step": 69025, "epoch": 1643} {"train_loss": -5.922466278076172, "global_step": 69026, "epoch": 1643} {"train_loss": -6.120016574859619, "global_step": 69027, "epoch": 1643} {"train_loss": -5.962677001953125, "global_step": 69028, "epoch": 1643} {"train_loss": -5.929147720336914, "global_step": 69029, "epoch": 1643} {"train_loss": -6.002320289611816, "global_step": 69030, "epoch": 1643} {"train_loss": -5.999974250793457, "global_step": 69031, "epoch": 1643} {"train_loss": -6.121062278747559, "global_step": 69032, "epoch": 1643} {"train_loss": -6.046098709106445, "global_step": 69033, "epoch": 1643} {"train_loss": -6.110147476196289, "global_step": 69034, "epoch": 1643} {"train_loss": -6.069034576416016, "global_step": 69035, "epoch": 1643} {"train_loss": -6.036450386047363, "global_step": 69036, "epoch": 1643} {"train_loss": -6.020725250244141, "global_step": 69037, "epoch": 1643} {"train_loss": -6.052619934082031, "global_step": 69038, "epoch": 1643} {"train_loss": -6.008890151977539, "global_step": 69039, "epoch": 1643} {"train_loss": -6.045679569244385, "global_step": 69040, "epoch": 1643} {"train_loss": -5.995997428894043, "global_step": 69041, "epoch": 1643} {"train_loss": -5.994503021240234, "global_step": 69042, "epoch": 1643} {"train_loss": -6.187025547027588, "global_step": 69043, "epoch": 1643} {"train_loss": -5.843725204467773, "global_step": 69044, "epoch": 1643} {"train_loss": -6.076606750488281, "global_step": 69045, "epoch": 1643} {"train_loss": -5.98044490814209, "global_step": 69046, "epoch": 1643} {"train_loss": -6.032795769827707, "global_step": 69047, "epoch": 1643, "val_loss": 61582.95703125} {"train_loss": -6.004838466644287, "global_step": 69048, "epoch": 1644} {"train_loss": -6.124368667602539, "global_step": 69049, "epoch": 1644} {"train_loss": -5.995248317718506, "global_step": 69050, "epoch": 1644} {"train_loss": -6.0232439041137695, "global_step": 69051, "epoch": 1644} {"train_loss": -6.148449897766113, "global_step": 69052, "epoch": 1644} {"train_loss": -6.07326602935791, "global_step": 69053, "epoch": 1644} {"train_loss": -6.021252155303955, "global_step": 69054, "epoch": 1644} {"train_loss": -6.022629261016846, "global_step": 69055, "epoch": 1644} {"train_loss": -5.978628158569336, "global_step": 69056, "epoch": 1644} {"train_loss": -6.072195529937744, "global_step": 69057, "epoch": 1644} {"train_loss": -6.084601402282715, "global_step": 69058, "epoch": 1644} {"train_loss": -6.04726505279541, "global_step": 69059, "epoch": 1644} {"train_loss": -6.011288642883301, "global_step": 69060, "epoch": 1644} {"train_loss": -5.95101261138916, "global_step": 69061, "epoch": 1644} {"train_loss": -5.999335289001465, "global_step": 69062, "epoch": 1644} {"train_loss": -6.1516008377075195, "global_step": 69063, "epoch": 1644} {"train_loss": -6.047079563140869, "global_step": 69064, "epoch": 1644} {"train_loss": -5.998003005981445, "global_step": 69065, "epoch": 1644} {"train_loss": -6.014012336730957, "global_step": 69066, "epoch": 1644} {"train_loss": -6.103114604949951, "global_step": 69067, "epoch": 1644} {"train_loss": -6.022288799285889, "global_step": 69068, "epoch": 1644} {"train_loss": -5.980883598327637, "global_step": 69069, "epoch": 1644} {"train_loss": -5.925748825073242, "global_step": 69070, "epoch": 1644} {"train_loss": -5.997854232788086, "global_step": 69071, "epoch": 1644} {"train_loss": -5.998558521270752, "global_step": 69072, "epoch": 1644} {"train_loss": -5.862373352050781, "global_step": 69073, "epoch": 1644} {"train_loss": -5.905179023742676, "global_step": 69074, "epoch": 1644} {"train_loss": -5.932350158691406, "global_step": 69075, "epoch": 1644} {"train_loss": -5.911085605621338, "global_step": 69076, "epoch": 1644} {"train_loss": -5.8506011962890625, "global_step": 69077, "epoch": 1644} {"train_loss": -6.013171195983887, "global_step": 69078, "epoch": 1644} {"train_loss": -5.988097667694092, "global_step": 69079, "epoch": 1644} {"train_loss": -5.857444763183594, "global_step": 69080, "epoch": 1644} {"train_loss": -5.980010032653809, "global_step": 69081, "epoch": 1644} {"train_loss": -5.914010047912598, "global_step": 69082, "epoch": 1644} {"train_loss": -5.971320152282715, "global_step": 69083, "epoch": 1644} {"train_loss": -5.864446640014648, "global_step": 69084, "epoch": 1644} {"train_loss": -5.807387828826904, "global_step": 69085, "epoch": 1644} {"train_loss": -5.921326637268066, "global_step": 69086, "epoch": 1644} {"train_loss": -5.945024490356445, "global_step": 69087, "epoch": 1644} {"train_loss": -5.845804214477539, "global_step": 69088, "epoch": 1644} {"train_loss": -5.982514267876034, "global_step": 69089, "epoch": 1644, "val_loss": 61811.81640625} {"train_loss": -5.944758415222168, "global_step": 69090, "epoch": 1645} {"train_loss": -6.005154609680176, "global_step": 69091, "epoch": 1645} {"train_loss": -5.988179683685303, "global_step": 69092, "epoch": 1645} {"train_loss": -5.950414657592773, "global_step": 69093, "epoch": 1645} {"train_loss": -6.014473915100098, "global_step": 69094, "epoch": 1645} {"train_loss": -6.039508819580078, "global_step": 69095, "epoch": 1645} {"train_loss": -5.991232872009277, "global_step": 69096, "epoch": 1645} {"train_loss": -5.8726325035095215, "global_step": 69097, "epoch": 1645} {"train_loss": -5.965204238891602, "global_step": 69098, "epoch": 1645} {"train_loss": -5.952411651611328, "global_step": 69099, "epoch": 1645} {"train_loss": -5.992800712585449, "global_step": 69100, "epoch": 1645} {"train_loss": -6.005947113037109, "global_step": 69101, "epoch": 1645} {"train_loss": -5.984112739562988, "global_step": 69102, "epoch": 1645} {"train_loss": -5.8597846031188965, "global_step": 69103, "epoch": 1645} {"train_loss": -6.01045036315918, "global_step": 69104, "epoch": 1645} {"train_loss": -6.13819694519043, "global_step": 69105, "epoch": 1645} {"train_loss": -5.973094940185547, "global_step": 69106, "epoch": 1645} {"train_loss": -5.984993934631348, "global_step": 69107, "epoch": 1645} {"train_loss": -6.012754440307617, "global_step": 69108, "epoch": 1645} {"train_loss": -6.109068393707275, "global_step": 69109, "epoch": 1645} {"train_loss": -6.007360935211182, "global_step": 69110, "epoch": 1645} {"train_loss": -5.9637579917907715, "global_step": 69111, "epoch": 1645} {"train_loss": -6.035030364990234, "global_step": 69112, "epoch": 1645} {"train_loss": -6.062983512878418, "global_step": 69113, "epoch": 1645} {"train_loss": -6.030322074890137, "global_step": 69114, "epoch": 1645} {"train_loss": -6.051680564880371, "global_step": 69115, "epoch": 1645} {"train_loss": -5.91750431060791, "global_step": 69116, "epoch": 1645} {"train_loss": -6.059230804443359, "global_step": 69117, "epoch": 1645} {"train_loss": -6.018104553222656, "global_step": 69118, "epoch": 1645} {"train_loss": -5.916017532348633, "global_step": 69119, "epoch": 1645} {"train_loss": -5.857015609741211, "global_step": 69120, "epoch": 1645} {"train_loss": -5.87237548828125, "global_step": 69121, "epoch": 1645} {"train_loss": -5.84790563583374, "global_step": 69122, "epoch": 1645} {"train_loss": -5.950138568878174, "global_step": 69123, "epoch": 1645} {"train_loss": -5.8329854011535645, "global_step": 69124, "epoch": 1645} {"train_loss": -5.9758453369140625, "global_step": 69125, "epoch": 1645} {"train_loss": -5.977043151855469, "global_step": 69126, "epoch": 1645} {"train_loss": -5.954195499420166, "global_step": 69127, "epoch": 1645} {"train_loss": -6.018404006958008, "global_step": 69128, "epoch": 1645} {"train_loss": -6.023940086364746, "global_step": 69129, "epoch": 1645} {"train_loss": -6.016404151916504, "global_step": 69130, "epoch": 1645} {"train_loss": -5.976831810814994, "global_step": 69131, "epoch": 1645, "val_loss": 61459.234375} {"train_loss": -6.053963661193848, "global_step": 69132, "epoch": 1646} {"train_loss": -5.951725006103516, "global_step": 69133, "epoch": 1646} {"train_loss": -5.986294746398926, "global_step": 69134, "epoch": 1646} {"train_loss": -5.979534149169922, "global_step": 69135, "epoch": 1646} {"train_loss": -5.914237022399902, "global_step": 69136, "epoch": 1646} {"train_loss": -5.987039566040039, "global_step": 69137, "epoch": 1646} {"train_loss": -6.033559799194336, "global_step": 69138, "epoch": 1646} {"train_loss": -5.966182708740234, "global_step": 69139, "epoch": 1646} {"train_loss": -6.035950660705566, "global_step": 69140, "epoch": 1646} {"train_loss": -6.01461935043335, "global_step": 69141, "epoch": 1646} {"train_loss": -6.031040191650391, "global_step": 69142, "epoch": 1646} {"train_loss": -5.975203514099121, "global_step": 69143, "epoch": 1646} {"train_loss": -5.916975498199463, "global_step": 69144, "epoch": 1646} {"train_loss": -6.039470195770264, "global_step": 69145, "epoch": 1646} {"train_loss": -6.024639129638672, "global_step": 69146, "epoch": 1646} {"train_loss": -5.855414867401123, "global_step": 69147, "epoch": 1646} {"train_loss": -6.054653644561768, "global_step": 69148, "epoch": 1646} {"train_loss": -5.950071334838867, "global_step": 69149, "epoch": 1646} {"train_loss": -5.98204231262207, "global_step": 69150, "epoch": 1646} {"train_loss": -5.972110271453857, "global_step": 69151, "epoch": 1646} {"train_loss": -5.9251813888549805, "global_step": 69152, "epoch": 1646} {"train_loss": -5.891995906829834, "global_step": 69153, "epoch": 1646} {"train_loss": -6.010842323303223, "global_step": 69154, "epoch": 1646} {"train_loss": -5.913771152496338, "global_step": 69155, "epoch": 1646} {"train_loss": -6.062790870666504, "global_step": 69156, "epoch": 1646} {"train_loss": -6.059942245483398, "global_step": 69157, "epoch": 1646} {"train_loss": -5.959670543670654, "global_step": 69158, "epoch": 1646} {"train_loss": -5.9578752517700195, "global_step": 69159, "epoch": 1646} {"train_loss": -5.859528541564941, "global_step": 69160, "epoch": 1646} {"train_loss": -5.9683427810668945, "global_step": 69161, "epoch": 1646} {"train_loss": -6.102532386779785, "global_step": 69162, "epoch": 1646} {"train_loss": -5.914083957672119, "global_step": 69163, "epoch": 1646} {"train_loss": -6.018138885498047, "global_step": 69164, "epoch": 1646} {"train_loss": -5.9787092208862305, "global_step": 69165, "epoch": 1646} {"train_loss": -5.9820451736450195, "global_step": 69166, "epoch": 1646} {"train_loss": -6.039851188659668, "global_step": 69167, "epoch": 1646} {"train_loss": -5.913132667541504, "global_step": 69168, "epoch": 1646} {"train_loss": -6.102602958679199, "global_step": 69169, "epoch": 1646} {"train_loss": -5.933370590209961, "global_step": 69170, "epoch": 1646} {"train_loss": -5.936576843261719, "global_step": 69171, "epoch": 1646} {"train_loss": -5.878918647766113, "global_step": 69172, "epoch": 1646} {"train_loss": -5.981798183350336, "global_step": 69173, "epoch": 1646, "val_loss": 61486.34765625} {"train_loss": -5.977438449859619, "global_step": 69174, "epoch": 1647} {"train_loss": -6.039002418518066, "global_step": 69175, "epoch": 1647} {"train_loss": -6.101045608520508, "global_step": 69176, "epoch": 1647} {"train_loss": -6.135003089904785, "global_step": 69177, "epoch": 1647} {"train_loss": -6.085502624511719, "global_step": 69178, "epoch": 1647} {"train_loss": -6.0616912841796875, "global_step": 69179, "epoch": 1647} {"train_loss": -6.078598976135254, "global_step": 69180, "epoch": 1647} {"train_loss": -6.061703681945801, "global_step": 69181, "epoch": 1647} {"train_loss": -6.084421634674072, "global_step": 69182, "epoch": 1647} {"train_loss": -5.924013614654541, "global_step": 69183, "epoch": 1647} {"train_loss": -5.982332229614258, "global_step": 69184, "epoch": 1647} {"train_loss": -6.043298244476318, "global_step": 69185, "epoch": 1647} {"train_loss": -6.086792945861816, "global_step": 69186, "epoch": 1647} {"train_loss": -6.037235260009766, "global_step": 69187, "epoch": 1647} {"train_loss": -5.998612403869629, "global_step": 69188, "epoch": 1647} {"train_loss": -6.061069488525391, "global_step": 69189, "epoch": 1647} {"train_loss": -6.122576713562012, "global_step": 69190, "epoch": 1647} {"train_loss": -6.052997589111328, "global_step": 69191, "epoch": 1647} {"train_loss": -6.038023471832275, "global_step": 69192, "epoch": 1647} {"train_loss": -5.974884033203125, "global_step": 69193, "epoch": 1647} {"train_loss": -6.019625663757324, "global_step": 69194, "epoch": 1647} {"train_loss": -5.968096733093262, "global_step": 69195, "epoch": 1647} {"train_loss": -6.040919780731201, "global_step": 69196, "epoch": 1647} {"train_loss": -5.978071689605713, "global_step": 69197, "epoch": 1647} {"train_loss": -6.152843475341797, "global_step": 69198, "epoch": 1647} {"train_loss": -6.052118301391602, "global_step": 69199, "epoch": 1647} {"train_loss": -6.073936462402344, "global_step": 69200, "epoch": 1647} {"train_loss": -6.04542350769043, "global_step": 69201, "epoch": 1647} {"train_loss": -5.9462738037109375, "global_step": 69202, "epoch": 1647} {"train_loss": -6.017918586730957, "global_step": 69203, "epoch": 1647} {"train_loss": -5.9857378005981445, "global_step": 69204, "epoch": 1647} {"train_loss": -5.972591400146484, "global_step": 69205, "epoch": 1647} {"train_loss": -5.934695243835449, "global_step": 69206, "epoch": 1647} {"train_loss": -5.9423675537109375, "global_step": 69207, "epoch": 1647} {"train_loss": -6.094209671020508, "global_step": 69208, "epoch": 1647} {"train_loss": -6.057988166809082, "global_step": 69209, "epoch": 1647} {"train_loss": -6.062875270843506, "global_step": 69210, "epoch": 1647} {"train_loss": -6.09287166595459, "global_step": 69211, "epoch": 1647} {"train_loss": -6.088619232177734, "global_step": 69212, "epoch": 1647} {"train_loss": -6.009400367736816, "global_step": 69213, "epoch": 1647} {"train_loss": -6.086252212524414, "global_step": 69214, "epoch": 1647} {"train_loss": -6.040750548953102, "global_step": 69215, "epoch": 1647, "val_loss": 61546.0703125} {"train_loss": -6.181430816650391, "global_step": 69216, "epoch": 1648} {"train_loss": -6.007411479949951, "global_step": 69217, "epoch": 1648} {"train_loss": -6.010836601257324, "global_step": 69218, "epoch": 1648} {"train_loss": -6.011193752288818, "global_step": 69219, "epoch": 1648} {"train_loss": -6.006638526916504, "global_step": 69220, "epoch": 1648} {"train_loss": -6.143878936767578, "global_step": 69221, "epoch": 1648} {"train_loss": -6.004010200500488, "global_step": 69222, "epoch": 1648} {"train_loss": -6.077113151550293, "global_step": 69223, "epoch": 1648} {"train_loss": -5.943551063537598, "global_step": 69224, "epoch": 1648} {"train_loss": -5.993300914764404, "global_step": 69225, "epoch": 1648} {"train_loss": -6.029890060424805, "global_step": 69226, "epoch": 1648} {"train_loss": -6.177682876586914, "global_step": 69227, "epoch": 1648} {"train_loss": -6.057649612426758, "global_step": 69228, "epoch": 1648} {"train_loss": -6.10366153717041, "global_step": 69229, "epoch": 1648} {"train_loss": -5.98506498336792, "global_step": 69230, "epoch": 1648} {"train_loss": -5.943140029907227, "global_step": 69231, "epoch": 1648} {"train_loss": -6.132894515991211, "global_step": 69232, "epoch": 1648} {"train_loss": -5.973318099975586, "global_step": 69233, "epoch": 1648} {"train_loss": -6.061026096343994, "global_step": 69234, "epoch": 1648} {"train_loss": -6.00037956237793, "global_step": 69235, "epoch": 1648} {"train_loss": -5.930235385894775, "global_step": 69236, "epoch": 1648} {"train_loss": -6.039165496826172, "global_step": 69237, "epoch": 1648} {"train_loss": -6.154284477233887, "global_step": 69238, "epoch": 1648} {"train_loss": -6.047687530517578, "global_step": 69239, "epoch": 1648} {"train_loss": -5.958062171936035, "global_step": 69240, "epoch": 1648} {"train_loss": -6.100131034851074, "global_step": 69241, "epoch": 1648} {"train_loss": -6.048124313354492, "global_step": 69242, "epoch": 1648} {"train_loss": -6.05064582824707, "global_step": 69243, "epoch": 1648} {"train_loss": -6.028626441955566, "global_step": 69244, "epoch": 1648} {"train_loss": -6.134340286254883, "global_step": 69245, "epoch": 1648} {"train_loss": -6.042627334594727, "global_step": 69246, "epoch": 1648} {"train_loss": -5.957490921020508, "global_step": 69247, "epoch": 1648} {"train_loss": -5.989880561828613, "global_step": 69248, "epoch": 1648} {"train_loss": -5.915383815765381, "global_step": 69249, "epoch": 1648} {"train_loss": -6.012396812438965, "global_step": 69250, "epoch": 1648} {"train_loss": -5.984114646911621, "global_step": 69251, "epoch": 1648} {"train_loss": -6.075082778930664, "global_step": 69252, "epoch": 1648} {"train_loss": -6.055865287780762, "global_step": 69253, "epoch": 1648} {"train_loss": -5.960944652557373, "global_step": 69254, "epoch": 1648} {"train_loss": -6.150999069213867, "global_step": 69255, "epoch": 1648} {"train_loss": -6.074711322784424, "global_step": 69256, "epoch": 1648} {"train_loss": -6.041827417555309, "global_step": 69257, "epoch": 1648, "val_loss": 61437.1328125} {"train_loss": -6.009673118591309, "global_step": 69258, "epoch": 1649} {"train_loss": -6.084530353546143, "global_step": 69259, "epoch": 1649} {"train_loss": -6.112028121948242, "global_step": 69260, "epoch": 1649} {"train_loss": -5.8799848556518555, "global_step": 69261, "epoch": 1649} {"train_loss": -6.005875587463379, "global_step": 69262, "epoch": 1649} {"train_loss": -6.009142875671387, "global_step": 69263, "epoch": 1649} {"train_loss": -6.044229984283447, "global_step": 69264, "epoch": 1649} {"train_loss": -6.061254501342773, "global_step": 69265, "epoch": 1649} {"train_loss": -6.044013500213623, "global_step": 69266, "epoch": 1649} {"train_loss": -6.099065780639648, "global_step": 69267, "epoch": 1649} {"train_loss": -5.9534149169921875, "global_step": 69268, "epoch": 1649} {"train_loss": -5.995934963226318, "global_step": 69269, "epoch": 1649} {"train_loss": -6.099306106567383, "global_step": 69270, "epoch": 1649} {"train_loss": -6.026201248168945, "global_step": 69271, "epoch": 1649} {"train_loss": -6.037991523742676, "global_step": 69272, "epoch": 1649} {"train_loss": -6.1177473068237305, "global_step": 69273, "epoch": 1649} {"train_loss": -6.004025459289551, "global_step": 69274, "epoch": 1649} {"train_loss": -5.893308162689209, "global_step": 69275, "epoch": 1649} {"train_loss": -5.8953375816345215, "global_step": 69276, "epoch": 1649} {"train_loss": -6.072521686553955, "global_step": 69277, "epoch": 1649} {"train_loss": -6.042346954345703, "global_step": 69278, "epoch": 1649} {"train_loss": -5.985039710998535, "global_step": 69279, "epoch": 1649} {"train_loss": -5.983109474182129, "global_step": 69280, "epoch": 1649} {"train_loss": -6.038391590118408, "global_step": 69281, "epoch": 1649} {"train_loss": -5.950351715087891, "global_step": 69282, "epoch": 1649} {"train_loss": -5.916674613952637, "global_step": 69283, "epoch": 1649} {"train_loss": -5.989670753479004, "global_step": 69284, "epoch": 1649} {"train_loss": -5.817924499511719, "global_step": 69285, "epoch": 1649} {"train_loss": -6.124598503112793, "global_step": 69286, "epoch": 1649} {"train_loss": -5.851154327392578, "global_step": 69287, "epoch": 1649} {"train_loss": -6.055300712585449, "global_step": 69288, "epoch": 1649} {"train_loss": -5.787533760070801, "global_step": 69289, "epoch": 1649} {"train_loss": -6.041794300079346, "global_step": 69290, "epoch": 1649} {"train_loss": -5.955294609069824, "global_step": 69291, "epoch": 1649} {"train_loss": -6.075280666351318, "global_step": 69292, "epoch": 1649} {"train_loss": -6.057583808898926, "global_step": 69293, "epoch": 1649} {"train_loss": -5.931728839874268, "global_step": 69294, "epoch": 1649} {"train_loss": -6.0160698890686035, "global_step": 69295, "epoch": 1649} {"train_loss": -5.956241130828857, "global_step": 69296, "epoch": 1649} {"train_loss": -6.028111457824707, "global_step": 69297, "epoch": 1649} {"train_loss": -6.0223493576049805, "global_step": 69298, "epoch": 1649} {"train_loss": -6.000503517332531, "global_step": 69299, "epoch": 1649, "val_loss": 61814.140625} {"train_loss": -5.895112991333008, "global_step": 69300, "epoch": 1650} {"train_loss": -5.900357246398926, "global_step": 69301, "epoch": 1650} {"train_loss": -6.119143486022949, "global_step": 69302, "epoch": 1650} {"train_loss": -5.957062721252441, "global_step": 69303, "epoch": 1650} {"train_loss": -5.941150188446045, "global_step": 69304, "epoch": 1650} {"train_loss": -6.047091960906982, "global_step": 69305, "epoch": 1650} {"train_loss": -6.020846366882324, "global_step": 69306, "epoch": 1650} {"train_loss": -5.984899044036865, "global_step": 69307, "epoch": 1650} {"train_loss": -6.035464286804199, "global_step": 69308, "epoch": 1650} {"train_loss": -5.965330600738525, "global_step": 69309, "epoch": 1650} {"train_loss": -6.123789310455322, "global_step": 69310, "epoch": 1650} {"train_loss": -6.101168632507324, "global_step": 69311, "epoch": 1650} {"train_loss": -6.088652610778809, "global_step": 69312, "epoch": 1650} {"train_loss": -6.019067287445068, "global_step": 69313, "epoch": 1650} {"train_loss": -6.071054935455322, "global_step": 69314, "epoch": 1650} {"train_loss": -6.056522369384766, "global_step": 69315, "epoch": 1650} {"train_loss": -6.029598236083984, "global_step": 69316, "epoch": 1650} {"train_loss": -5.978334426879883, "global_step": 69317, "epoch": 1650} {"train_loss": -6.008153438568115, "global_step": 69318, "epoch": 1650} {"train_loss": -6.048961639404297, "global_step": 69319, "epoch": 1650} {"train_loss": -6.012272834777832, "global_step": 69320, "epoch": 1650} {"train_loss": -6.061291694641113, "global_step": 69321, "epoch": 1650} {"train_loss": -6.118070125579834, "global_step": 69322, "epoch": 1650} {"train_loss": -6.0500640869140625, "global_step": 69323, "epoch": 1650} {"train_loss": -6.111747741699219, "global_step": 69324, "epoch": 1650} {"train_loss": -6.0708818435668945, "global_step": 69325, "epoch": 1650} {"train_loss": -5.9452595710754395, "global_step": 69326, "epoch": 1650} {"train_loss": -6.132368087768555, "global_step": 69327, "epoch": 1650} {"train_loss": -6.141096115112305, "global_step": 69328, "epoch": 1650} {"train_loss": -6.034465789794922, "global_step": 69329, "epoch": 1650} {"train_loss": -6.079967975616455, "global_step": 69330, "epoch": 1650} {"train_loss": -5.931110858917236, "global_step": 69331, "epoch": 1650} {"train_loss": -5.933906555175781, "global_step": 69332, "epoch": 1650} {"train_loss": -6.08926248550415, "global_step": 69333, "epoch": 1650} {"train_loss": -6.020275592803955, "global_step": 69334, "epoch": 1650} {"train_loss": -6.074213027954102, "global_step": 69335, "epoch": 1650} {"train_loss": -6.030426979064941, "global_step": 69336, "epoch": 1650} {"train_loss": -6.060357093811035, "global_step": 69337, "epoch": 1650} {"train_loss": -6.022000312805176, "global_step": 69338, "epoch": 1650} {"train_loss": -6.052304744720459, "global_step": 69339, "epoch": 1650} {"train_loss": -5.986403465270996, "global_step": 69340, "epoch": 1650} {"train_loss": -6.032323894046602, "global_step": 69341, "epoch": 1650, "train/sim_max_reward_0": 0.19781692364289477, "train/sim_max_reward_1": 0.3243110317325805, "train/sim_max_reward_2": 0.4151520899646983, "train/sim_max_reward_3": 0.677830518414633, "train/sim_max_reward_4": 0.8942630617209745, "train/sim_max_reward_5": 0.4120855852863711, "test/sim_max_reward_4300000": 0.26462345608131094, "test/sim_max_reward_4300001": 0.18444591464695254, "test/sim_max_reward_4300002": 0.9076732128687132, "test/sim_max_reward_4300003": 0.8114436285165955, "test/sim_max_reward_4300004": 1.0, "test/sim_max_reward_4300005": 0.5346510672103505, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.44708082145313366, "test/sim_max_reward_4300008": 0.9929057716431416, "test/sim_max_reward_4300009": 0.8367920499127212, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.32471888400130633, "test/sim_max_reward_4300012": 0.9019590492005419, "test/sim_max_reward_4300013": 0.4092588597698907, "test/sim_max_reward_4300014": 0.9595071047457551, "test/sim_max_reward_4300015": 0.9820331889003892, "test/sim_max_reward_4300016": 0.9454581465982346, "test/sim_max_reward_4300017": 0.8303844327750104, "test/sim_max_reward_4300018": 0.4453387328082652, "test/sim_max_reward_4300019": 0.18629165769983974, "test/sim_max_reward_4300020": 0.6675695459373986, "test/sim_max_reward_4300021": 0.9388408373326564, "test/sim_max_reward_4300022": 0.8780302987800512, "test/sim_max_reward_4300023": 0.35245096459922254, "test/sim_max_reward_4300024": 0.8033186950051496, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.1837141871522907, "test/sim_max_reward_4300027": 0.857447054708084, "test/sim_max_reward_4300028": 0.8707799677927985, "test/sim_max_reward_4300029": 0.7774395028543876, "test/sim_max_reward_4300030": 0.9085830444636415, "test/sim_max_reward_4300031": 0.21500839242452252, "test/sim_max_reward_4300032": 0.924615613613757, "test/sim_max_reward_4300033": 0.6886614216937362, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.1997943364817132, "test/sim_max_reward_4300037": 0.895425687479687, "test/sim_max_reward_4300038": 0.44678971666141937, "test/sim_max_reward_4300039": 0.9300973635583607, "test/sim_max_reward_4300040": 0.2453013521679916, "test/sim_max_reward_4300041": 0.6358620169889755, "test/sim_max_reward_4300042": 0.6286068852737628, "test/sim_max_reward_4300043": 0.1454899609033448, "test/sim_max_reward_4300044": 0.8261592454799259, "test/sim_max_reward_4300045": 0.933842011384306, "test/sim_max_reward_4300046": 0.8437961216219487, "test/sim_max_reward_4300047": 0.23716597375246218, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.07167618543708743, "train/mean_score": 0.4869098684603587, "test/mean_score": 0.5814206472476167, "val_loss": 61871.94921875} {"train_loss": -6.049007415771484, "global_step": 69342, "epoch": 1651} {"train_loss": -6.048344612121582, "global_step": 69343, "epoch": 1651} {"train_loss": -6.055590629577637, "global_step": 69344, "epoch": 1651} {"train_loss": -5.981647968292236, "global_step": 69345, "epoch": 1651} {"train_loss": -6.018838882446289, "global_step": 69346, "epoch": 1651} {"train_loss": -6.078944683074951, "global_step": 69347, "epoch": 1651} {"train_loss": -6.009036064147949, "global_step": 69348, "epoch": 1651} {"train_loss": -6.009479522705078, "global_step": 69349, "epoch": 1651} {"train_loss": -6.041983127593994, "global_step": 69350, "epoch": 1651} {"train_loss": -6.011051177978516, "global_step": 69351, "epoch": 1651} {"train_loss": -6.102123260498047, "global_step": 69352, "epoch": 1651} {"train_loss": -6.005395889282227, "global_step": 69353, "epoch": 1651} {"train_loss": -6.167015075683594, "global_step": 69354, "epoch": 1651} {"train_loss": -6.062591552734375, "global_step": 69355, "epoch": 1651} {"train_loss": -6.085771560668945, "global_step": 69356, "epoch": 1651} {"train_loss": -6.0969743728637695, "global_step": 69357, "epoch": 1651} {"train_loss": -6.050571441650391, "global_step": 69358, "epoch": 1651} {"train_loss": -6.052647590637207, "global_step": 69359, "epoch": 1651} {"train_loss": -6.069690704345703, "global_step": 69360, "epoch": 1651} {"train_loss": -6.026832580566406, "global_step": 69361, "epoch": 1651} {"train_loss": -6.066557884216309, "global_step": 69362, "epoch": 1651} {"train_loss": -6.12201452255249, "global_step": 69363, "epoch": 1651} {"train_loss": -5.962348937988281, "global_step": 69364, "epoch": 1651} {"train_loss": -6.000547885894775, "global_step": 69365, "epoch": 1651} {"train_loss": -6.046253204345703, "global_step": 69366, "epoch": 1651} {"train_loss": -6.075651168823242, "global_step": 69367, "epoch": 1651} {"train_loss": -6.0511674880981445, "global_step": 69368, "epoch": 1651} {"train_loss": -6.030665397644043, "global_step": 69369, "epoch": 1651} {"train_loss": -6.125832557678223, "global_step": 69370, "epoch": 1651} {"train_loss": -6.072498798370361, "global_step": 69371, "epoch": 1651} {"train_loss": -6.034054756164551, "global_step": 69372, "epoch": 1651} {"train_loss": -6.138043403625488, "global_step": 69373, "epoch": 1651} {"train_loss": -5.990602493286133, "global_step": 69374, "epoch": 1651} {"train_loss": -6.007699966430664, "global_step": 69375, "epoch": 1651} {"train_loss": -6.101075649261475, "global_step": 69376, "epoch": 1651} {"train_loss": -5.94991397857666, "global_step": 69377, "epoch": 1651} {"train_loss": -6.1066179275512695, "global_step": 69378, "epoch": 1651} {"train_loss": -5.985724449157715, "global_step": 69379, "epoch": 1651} {"train_loss": -6.040269374847412, "global_step": 69380, "epoch": 1651} {"train_loss": -6.059223175048828, "global_step": 69381, "epoch": 1651} {"train_loss": -6.038054466247559, "global_step": 69382, "epoch": 1651} {"train_loss": -6.050553106126332, "global_step": 69383, "epoch": 1651, "val_loss": 61960.21875} {"train_loss": -6.055882453918457, "global_step": 69384, "epoch": 1652} {"train_loss": -6.013822555541992, "global_step": 69385, "epoch": 1652} {"train_loss": -6.065065383911133, "global_step": 69386, "epoch": 1652} {"train_loss": -5.983698844909668, "global_step": 69387, "epoch": 1652} {"train_loss": -5.910260200500488, "global_step": 69388, "epoch": 1652} {"train_loss": -6.036770343780518, "global_step": 69389, "epoch": 1652} {"train_loss": -6.099548816680908, "global_step": 69390, "epoch": 1652} {"train_loss": -6.025116443634033, "global_step": 69391, "epoch": 1652} {"train_loss": -5.969636917114258, "global_step": 69392, "epoch": 1652} {"train_loss": -5.886267185211182, "global_step": 69393, "epoch": 1652} {"train_loss": -6.055793762207031, "global_step": 69394, "epoch": 1652} {"train_loss": -6.0724897384643555, "global_step": 69395, "epoch": 1652} {"train_loss": -6.025601387023926, "global_step": 69396, "epoch": 1652} {"train_loss": -6.058154582977295, "global_step": 69397, "epoch": 1652} {"train_loss": -5.959046363830566, "global_step": 69398, "epoch": 1652} {"train_loss": -6.104556083679199, "global_step": 69399, "epoch": 1652} {"train_loss": -6.103283405303955, "global_step": 69400, "epoch": 1652} {"train_loss": -5.989338397979736, "global_step": 69401, "epoch": 1652} {"train_loss": -5.983123302459717, "global_step": 69402, "epoch": 1652} {"train_loss": -6.011559009552002, "global_step": 69403, "epoch": 1652} {"train_loss": -5.994314193725586, "global_step": 69404, "epoch": 1652} {"train_loss": -6.149689674377441, "global_step": 69405, "epoch": 1652} {"train_loss": -5.970891952514648, "global_step": 69406, "epoch": 1652} {"train_loss": -6.101578235626221, "global_step": 69407, "epoch": 1652} {"train_loss": -6.0694403648376465, "global_step": 69408, "epoch": 1652} {"train_loss": -5.929024696350098, "global_step": 69409, "epoch": 1652} {"train_loss": -5.990236282348633, "global_step": 69410, "epoch": 1652} {"train_loss": -6.017546653747559, "global_step": 69411, "epoch": 1652} {"train_loss": -5.946931838989258, "global_step": 69412, "epoch": 1652} {"train_loss": -5.818043231964111, "global_step": 69413, "epoch": 1652} {"train_loss": -5.937440872192383, "global_step": 69414, "epoch": 1652} {"train_loss": -5.989940643310547, "global_step": 69415, "epoch": 1652} {"train_loss": -6.021229267120361, "global_step": 69416, "epoch": 1652} {"train_loss": -5.943795204162598, "global_step": 69417, "epoch": 1652} {"train_loss": -6.001593112945557, "global_step": 69418, "epoch": 1652} {"train_loss": -5.995865821838379, "global_step": 69419, "epoch": 1652} {"train_loss": -6.059940338134766, "global_step": 69420, "epoch": 1652} {"train_loss": -6.106965065002441, "global_step": 69421, "epoch": 1652} {"train_loss": -5.947896957397461, "global_step": 69422, "epoch": 1652} {"train_loss": -5.957098007202148, "global_step": 69423, "epoch": 1652} {"train_loss": -6.05171012878418, "global_step": 69424, "epoch": 1652} {"train_loss": -6.0103550638471335, "global_step": 69425, "epoch": 1652, "val_loss": 61716.6796875} {"train_loss": -6.096771240234375, "global_step": 69426, "epoch": 1653} {"train_loss": -6.016265869140625, "global_step": 69427, "epoch": 1653} {"train_loss": -5.995291709899902, "global_step": 69428, "epoch": 1653} {"train_loss": -6.0568461418151855, "global_step": 69429, "epoch": 1653} {"train_loss": -6.010527610778809, "global_step": 69430, "epoch": 1653} {"train_loss": -5.981532096862793, "global_step": 69431, "epoch": 1653} {"train_loss": -6.197422981262207, "global_step": 69432, "epoch": 1653} {"train_loss": -5.9970703125, "global_step": 69433, "epoch": 1653} {"train_loss": -6.084990501403809, "global_step": 69434, "epoch": 1653} {"train_loss": -5.944085121154785, "global_step": 69435, "epoch": 1653} {"train_loss": -6.00874662399292, "global_step": 69436, "epoch": 1653} {"train_loss": -6.1077165603637695, "global_step": 69437, "epoch": 1653} {"train_loss": -6.012068748474121, "global_step": 69438, "epoch": 1653} {"train_loss": -6.0121684074401855, "global_step": 69439, "epoch": 1653} {"train_loss": -6.040416717529297, "global_step": 69440, "epoch": 1653} {"train_loss": -5.987428665161133, "global_step": 69441, "epoch": 1653} {"train_loss": -5.999899387359619, "global_step": 69442, "epoch": 1653} {"train_loss": -6.018847465515137, "global_step": 69443, "epoch": 1653} {"train_loss": -5.941780090332031, "global_step": 69444, "epoch": 1653} {"train_loss": -5.952497482299805, "global_step": 69445, "epoch": 1653} {"train_loss": -6.025112152099609, "global_step": 69446, "epoch": 1653} {"train_loss": -5.995693206787109, "global_step": 69447, "epoch": 1653} {"train_loss": -6.036396503448486, "global_step": 69448, "epoch": 1653} {"train_loss": -6.07060432434082, "global_step": 69449, "epoch": 1653} {"train_loss": -6.016518592834473, "global_step": 69450, "epoch": 1653} {"train_loss": -5.871517181396484, "global_step": 69451, "epoch": 1653} {"train_loss": -5.994494438171387, "global_step": 69452, "epoch": 1653} {"train_loss": -6.033050537109375, "global_step": 69453, "epoch": 1653} {"train_loss": -5.959432601928711, "global_step": 69454, "epoch": 1653} {"train_loss": -6.024677276611328, "global_step": 69455, "epoch": 1653} {"train_loss": -6.000223159790039, "global_step": 69456, "epoch": 1653} {"train_loss": -6.090902328491211, "global_step": 69457, "epoch": 1653} {"train_loss": -6.087249755859375, "global_step": 69458, "epoch": 1653} {"train_loss": -6.041366100311279, "global_step": 69459, "epoch": 1653} {"train_loss": -6.076344013214111, "global_step": 69460, "epoch": 1653} {"train_loss": -6.03322696685791, "global_step": 69461, "epoch": 1653} {"train_loss": -5.971229553222656, "global_step": 69462, "epoch": 1653} {"train_loss": -6.032590389251709, "global_step": 69463, "epoch": 1653} {"train_loss": -6.008888244628906, "global_step": 69464, "epoch": 1653} {"train_loss": -6.012453079223633, "global_step": 69465, "epoch": 1653} {"train_loss": -5.990330696105957, "global_step": 69466, "epoch": 1653} {"train_loss": -6.022272654942104, "global_step": 69467, "epoch": 1653, "val_loss": 61633.85546875} {"train_loss": -6.0188188552856445, "global_step": 69468, "epoch": 1654} {"train_loss": -6.067068576812744, "global_step": 69469, "epoch": 1654} {"train_loss": -6.060626029968262, "global_step": 69470, "epoch": 1654} {"train_loss": -6.018344879150391, "global_step": 69471, "epoch": 1654} {"train_loss": -5.9448347091674805, "global_step": 69472, "epoch": 1654} {"train_loss": -6.018294334411621, "global_step": 69473, "epoch": 1654} {"train_loss": -6.100424766540527, "global_step": 69474, "epoch": 1654} {"train_loss": -6.05993127822876, "global_step": 69475, "epoch": 1654} {"train_loss": -5.970122337341309, "global_step": 69476, "epoch": 1654} {"train_loss": -5.996769905090332, "global_step": 69477, "epoch": 1654} {"train_loss": -6.09222936630249, "global_step": 69478, "epoch": 1654} {"train_loss": -5.949108600616455, "global_step": 69479, "epoch": 1654} {"train_loss": -6.023078918457031, "global_step": 69480, "epoch": 1654} {"train_loss": -6.0553083419799805, "global_step": 69481, "epoch": 1654} {"train_loss": -5.979003429412842, "global_step": 69482, "epoch": 1654} {"train_loss": -6.054129123687744, "global_step": 69483, "epoch": 1654} {"train_loss": -5.895482540130615, "global_step": 69484, "epoch": 1654} {"train_loss": -6.042683124542236, "global_step": 69485, "epoch": 1654} {"train_loss": -5.904962539672852, "global_step": 69486, "epoch": 1654} {"train_loss": -6.037372589111328, "global_step": 69487, "epoch": 1654} {"train_loss": -5.910436153411865, "global_step": 69488, "epoch": 1654} {"train_loss": -6.001580238342285, "global_step": 69489, "epoch": 1654} {"train_loss": -5.9165544509887695, "global_step": 69490, "epoch": 1654} {"train_loss": -5.944523811340332, "global_step": 69491, "epoch": 1654} {"train_loss": -6.0422797203063965, "global_step": 69492, "epoch": 1654} {"train_loss": -6.080420970916748, "global_step": 69493, "epoch": 1654} {"train_loss": -5.950749397277832, "global_step": 69494, "epoch": 1654} {"train_loss": -6.00900936126709, "global_step": 69495, "epoch": 1654} {"train_loss": -6.045144081115723, "global_step": 69496, "epoch": 1654} {"train_loss": -5.943532943725586, "global_step": 69497, "epoch": 1654} {"train_loss": -5.899387359619141, "global_step": 69498, "epoch": 1654} {"train_loss": -6.080010414123535, "global_step": 69499, "epoch": 1654} {"train_loss": -6.017788887023926, "global_step": 69500, "epoch": 1654} {"train_loss": -5.97939395904541, "global_step": 69501, "epoch": 1654} {"train_loss": -6.03609561920166, "global_step": 69502, "epoch": 1654} {"train_loss": -6.071907043457031, "global_step": 69503, "epoch": 1654} {"train_loss": -6.074119567871094, "global_step": 69504, "epoch": 1654} {"train_loss": -6.076864242553711, "global_step": 69505, "epoch": 1654} {"train_loss": -6.09539794921875, "global_step": 69506, "epoch": 1654} {"train_loss": -5.990133285522461, "global_step": 69507, "epoch": 1654} {"train_loss": -6.124578475952148, "global_step": 69508, "epoch": 1654} {"train_loss": -6.016591446740287, "global_step": 69509, "epoch": 1654, "val_loss": 61634.4453125} {"train_loss": -5.989415168762207, "global_step": 69510, "epoch": 1655} {"train_loss": -6.006743907928467, "global_step": 69511, "epoch": 1655} {"train_loss": -5.893593788146973, "global_step": 69512, "epoch": 1655} {"train_loss": -6.094733715057373, "global_step": 69513, "epoch": 1655} {"train_loss": -6.000147819519043, "global_step": 69514, "epoch": 1655} {"train_loss": -5.962205410003662, "global_step": 69515, "epoch": 1655} {"train_loss": -6.040722846984863, "global_step": 69516, "epoch": 1655} {"train_loss": -5.98032283782959, "global_step": 69517, "epoch": 1655} {"train_loss": -6.100588798522949, "global_step": 69518, "epoch": 1655} {"train_loss": -6.044371128082275, "global_step": 69519, "epoch": 1655} {"train_loss": -6.032221794128418, "global_step": 69520, "epoch": 1655} {"train_loss": -6.092464447021484, "global_step": 69521, "epoch": 1655} {"train_loss": -6.0650634765625, "global_step": 69522, "epoch": 1655} {"train_loss": -6.009836673736572, "global_step": 69523, "epoch": 1655} {"train_loss": -5.955928802490234, "global_step": 69524, "epoch": 1655} {"train_loss": -5.950955390930176, "global_step": 69525, "epoch": 1655} {"train_loss": -5.979511260986328, "global_step": 69526, "epoch": 1655} {"train_loss": -6.161216735839844, "global_step": 69527, "epoch": 1655} {"train_loss": -6.0725603103637695, "global_step": 69528, "epoch": 1655} {"train_loss": -6.067352294921875, "global_step": 69529, "epoch": 1655} {"train_loss": -6.076061248779297, "global_step": 69530, "epoch": 1655} {"train_loss": -5.888083457946777, "global_step": 69531, "epoch": 1655} {"train_loss": -6.03033447265625, "global_step": 69532, "epoch": 1655} {"train_loss": -6.088159561157227, "global_step": 69533, "epoch": 1655} {"train_loss": -6.0289154052734375, "global_step": 69534, "epoch": 1655} {"train_loss": -5.991928577423096, "global_step": 69535, "epoch": 1655} {"train_loss": -6.01746940612793, "global_step": 69536, "epoch": 1655} {"train_loss": -6.067588806152344, "global_step": 69537, "epoch": 1655} {"train_loss": -5.954781532287598, "global_step": 69538, "epoch": 1655} {"train_loss": -6.1239166259765625, "global_step": 69539, "epoch": 1655} {"train_loss": -6.074984550476074, "global_step": 69540, "epoch": 1655} {"train_loss": -6.046589374542236, "global_step": 69541, "epoch": 1655} {"train_loss": -6.021353244781494, "global_step": 69542, "epoch": 1655} {"train_loss": -5.963907241821289, "global_step": 69543, "epoch": 1655} {"train_loss": -5.892829895019531, "global_step": 69544, "epoch": 1655} {"train_loss": -5.921424865722656, "global_step": 69545, "epoch": 1655} {"train_loss": -6.035739898681641, "global_step": 69546, "epoch": 1655} {"train_loss": -6.025075912475586, "global_step": 69547, "epoch": 1655} {"train_loss": -5.966945648193359, "global_step": 69548, "epoch": 1655} {"train_loss": -6.009297847747803, "global_step": 69549, "epoch": 1655} {"train_loss": -6.086930274963379, "global_step": 69550, "epoch": 1655} {"train_loss": -6.017394429161435, "global_step": 69551, "epoch": 1655, "val_loss": 61501.0703125} {"train_loss": -5.9523468017578125, "global_step": 69552, "epoch": 1656} {"train_loss": -6.070243835449219, "global_step": 69553, "epoch": 1656} {"train_loss": -5.925504684448242, "global_step": 69554, "epoch": 1656} {"train_loss": -6.059273719787598, "global_step": 69555, "epoch": 1656} {"train_loss": -5.854349136352539, "global_step": 69556, "epoch": 1656} {"train_loss": -5.98049783706665, "global_step": 69557, "epoch": 1656} {"train_loss": -5.950550556182861, "global_step": 69558, "epoch": 1656} {"train_loss": -5.904973030090332, "global_step": 69559, "epoch": 1656} {"train_loss": -5.914244651794434, "global_step": 69560, "epoch": 1656} {"train_loss": -6.049129486083984, "global_step": 69561, "epoch": 1656} {"train_loss": -5.9419708251953125, "global_step": 69562, "epoch": 1656} {"train_loss": -6.003283500671387, "global_step": 69563, "epoch": 1656} {"train_loss": -6.012702465057373, "global_step": 69564, "epoch": 1656} {"train_loss": -5.935635566711426, "global_step": 69565, "epoch": 1656} {"train_loss": -5.999196529388428, "global_step": 69566, "epoch": 1656} {"train_loss": -5.989560127258301, "global_step": 69567, "epoch": 1656} {"train_loss": -5.933159828186035, "global_step": 69568, "epoch": 1656} {"train_loss": -5.905250549316406, "global_step": 69569, "epoch": 1656} {"train_loss": -6.064558982849121, "global_step": 69570, "epoch": 1656} {"train_loss": -6.014832496643066, "global_step": 69571, "epoch": 1656} {"train_loss": -6.036495685577393, "global_step": 69572, "epoch": 1656} {"train_loss": -6.110016822814941, "global_step": 69573, "epoch": 1656} {"train_loss": -5.994297027587891, "global_step": 69574, "epoch": 1656} {"train_loss": -6.027100563049316, "global_step": 69575, "epoch": 1656} {"train_loss": -6.015730857849121, "global_step": 69576, "epoch": 1656} {"train_loss": -6.009247303009033, "global_step": 69577, "epoch": 1656} {"train_loss": -6.083583831787109, "global_step": 69578, "epoch": 1656} {"train_loss": -6.082071304321289, "global_step": 69579, "epoch": 1656} {"train_loss": -6.024208068847656, "global_step": 69580, "epoch": 1656} {"train_loss": -6.035170078277588, "global_step": 69581, "epoch": 1656} {"train_loss": -5.951630592346191, "global_step": 69582, "epoch": 1656} {"train_loss": -6.102555274963379, "global_step": 69583, "epoch": 1656} {"train_loss": -5.965271472930908, "global_step": 69584, "epoch": 1656} {"train_loss": -6.040482521057129, "global_step": 69585, "epoch": 1656} {"train_loss": -6.00217866897583, "global_step": 69586, "epoch": 1656} {"train_loss": -6.037631034851074, "global_step": 69587, "epoch": 1656} {"train_loss": -6.013633728027344, "global_step": 69588, "epoch": 1656} {"train_loss": -5.99096155166626, "global_step": 69589, "epoch": 1656} {"train_loss": -5.942244052886963, "global_step": 69590, "epoch": 1656} {"train_loss": -5.899859428405762, "global_step": 69591, "epoch": 1656} {"train_loss": -6.064708232879639, "global_step": 69592, "epoch": 1656} {"train_loss": -5.997146254494076, "global_step": 69593, "epoch": 1656, "val_loss": 61805.11328125} {"train_loss": -6.008173942565918, "global_step": 69594, "epoch": 1657} {"train_loss": -5.945902347564697, "global_step": 69595, "epoch": 1657} {"train_loss": -6.002808094024658, "global_step": 69596, "epoch": 1657} {"train_loss": -6.021193504333496, "global_step": 69597, "epoch": 1657} {"train_loss": -6.105014801025391, "global_step": 69598, "epoch": 1657} {"train_loss": -6.012589454650879, "global_step": 69599, "epoch": 1657} {"train_loss": -5.986486434936523, "global_step": 69600, "epoch": 1657} {"train_loss": -6.0580573081970215, "global_step": 69601, "epoch": 1657} {"train_loss": -6.03183650970459, "global_step": 69602, "epoch": 1657} {"train_loss": -6.040982723236084, "global_step": 69603, "epoch": 1657} {"train_loss": -6.133424758911133, "global_step": 69604, "epoch": 1657} {"train_loss": -5.970389366149902, "global_step": 69605, "epoch": 1657} {"train_loss": -5.990911483764648, "global_step": 69606, "epoch": 1657} {"train_loss": -5.972859859466553, "global_step": 69607, "epoch": 1657} {"train_loss": -6.028741836547852, "global_step": 69608, "epoch": 1657} {"train_loss": -6.0853800773620605, "global_step": 69609, "epoch": 1657} {"train_loss": -6.003190040588379, "global_step": 69610, "epoch": 1657} {"train_loss": -5.999370098114014, "global_step": 69611, "epoch": 1657} {"train_loss": -6.01915168762207, "global_step": 69612, "epoch": 1657} {"train_loss": -6.109243869781494, "global_step": 69613, "epoch": 1657} {"train_loss": -6.076290130615234, "global_step": 69614, "epoch": 1657} {"train_loss": -6.033116340637207, "global_step": 69615, "epoch": 1657} {"train_loss": -6.059505462646484, "global_step": 69616, "epoch": 1657} {"train_loss": -6.025821685791016, "global_step": 69617, "epoch": 1657} {"train_loss": -6.073481559753418, "global_step": 69618, "epoch": 1657} {"train_loss": -6.034919738769531, "global_step": 69619, "epoch": 1657} {"train_loss": -6.030584812164307, "global_step": 69620, "epoch": 1657} {"train_loss": -6.214675426483154, "global_step": 69621, "epoch": 1657} {"train_loss": -6.040440559387207, "global_step": 69622, "epoch": 1657} {"train_loss": -5.972172737121582, "global_step": 69623, "epoch": 1657} {"train_loss": -6.080286026000977, "global_step": 69624, "epoch": 1657} {"train_loss": -5.91392183303833, "global_step": 69625, "epoch": 1657} {"train_loss": -6.0340471267700195, "global_step": 69626, "epoch": 1657} {"train_loss": -6.107295036315918, "global_step": 69627, "epoch": 1657} {"train_loss": -5.933481216430664, "global_step": 69628, "epoch": 1657} {"train_loss": -6.069943428039551, "global_step": 69629, "epoch": 1657} {"train_loss": -5.97996711730957, "global_step": 69630, "epoch": 1657} {"train_loss": -6.128517150878906, "global_step": 69631, "epoch": 1657} {"train_loss": -6.099174499511719, "global_step": 69632, "epoch": 1657} {"train_loss": -5.962140083312988, "global_step": 69633, "epoch": 1657} {"train_loss": -6.018786907196045, "global_step": 69634, "epoch": 1657} {"train_loss": -6.0345734641665505, "global_step": 69635, "epoch": 1657, "val_loss": 61736.60546875} {"train_loss": -6.069142818450928, "global_step": 69636, "epoch": 1658} {"train_loss": -6.084445476531982, "global_step": 69637, "epoch": 1658} {"train_loss": -5.904712677001953, "global_step": 69638, "epoch": 1658} {"train_loss": -6.080471038818359, "global_step": 69639, "epoch": 1658} {"train_loss": -6.114699363708496, "global_step": 69640, "epoch": 1658} {"train_loss": -5.991270065307617, "global_step": 69641, "epoch": 1658} {"train_loss": -6.018035888671875, "global_step": 69642, "epoch": 1658} {"train_loss": -6.118471145629883, "global_step": 69643, "epoch": 1658} {"train_loss": -5.906257629394531, "global_step": 69644, "epoch": 1658} {"train_loss": -6.134038925170898, "global_step": 69645, "epoch": 1658} {"train_loss": -6.0583062171936035, "global_step": 69646, "epoch": 1658} {"train_loss": -6.022414207458496, "global_step": 69647, "epoch": 1658} {"train_loss": -6.069062232971191, "global_step": 69648, "epoch": 1658} {"train_loss": -6.044282913208008, "global_step": 69649, "epoch": 1658} {"train_loss": -5.974154949188232, "global_step": 69650, "epoch": 1658} {"train_loss": -6.041135787963867, "global_step": 69651, "epoch": 1658} {"train_loss": -6.125907897949219, "global_step": 69652, "epoch": 1658} {"train_loss": -6.032081604003906, "global_step": 69653, "epoch": 1658} {"train_loss": -5.9813103675842285, "global_step": 69654, "epoch": 1658} {"train_loss": -6.087249279022217, "global_step": 69655, "epoch": 1658} {"train_loss": -5.946128845214844, "global_step": 69656, "epoch": 1658} {"train_loss": -6.00924825668335, "global_step": 69657, "epoch": 1658} {"train_loss": -6.03985071182251, "global_step": 69658, "epoch": 1658} {"train_loss": -6.069921493530273, "global_step": 69659, "epoch": 1658} {"train_loss": -6.048672676086426, "global_step": 69660, "epoch": 1658} {"train_loss": -6.107819557189941, "global_step": 69661, "epoch": 1658} {"train_loss": -6.167129039764404, "global_step": 69662, "epoch": 1658} {"train_loss": -6.13752555847168, "global_step": 69663, "epoch": 1658} {"train_loss": -6.033353805541992, "global_step": 69664, "epoch": 1658} {"train_loss": -6.0521440505981445, "global_step": 69665, "epoch": 1658} {"train_loss": -6.157665729522705, "global_step": 69666, "epoch": 1658} {"train_loss": -6.00547981262207, "global_step": 69667, "epoch": 1658} {"train_loss": -6.004765510559082, "global_step": 69668, "epoch": 1658} {"train_loss": -6.154684066772461, "global_step": 69669, "epoch": 1658} {"train_loss": -6.026301860809326, "global_step": 69670, "epoch": 1658} {"train_loss": -5.933990001678467, "global_step": 69671, "epoch": 1658} {"train_loss": -6.051474571228027, "global_step": 69672, "epoch": 1658} {"train_loss": -6.10917854309082, "global_step": 69673, "epoch": 1658} {"train_loss": -5.916025161743164, "global_step": 69674, "epoch": 1658} {"train_loss": -6.112530708312988, "global_step": 69675, "epoch": 1658} {"train_loss": -6.03240966796875, "global_step": 69676, "epoch": 1658} {"train_loss": -6.047877220880418, "global_step": 69677, "epoch": 1658, "val_loss": 61508.546875} {"train_loss": -6.085648536682129, "global_step": 69678, "epoch": 1659} {"train_loss": -5.957005500793457, "global_step": 69679, "epoch": 1659} {"train_loss": -5.947465419769287, "global_step": 69680, "epoch": 1659} {"train_loss": -6.0807976722717285, "global_step": 69681, "epoch": 1659} {"train_loss": -6.085733890533447, "global_step": 69682, "epoch": 1659} {"train_loss": -6.021036148071289, "global_step": 69683, "epoch": 1659} {"train_loss": -5.992836952209473, "global_step": 69684, "epoch": 1659} {"train_loss": -6.209395885467529, "global_step": 69685, "epoch": 1659} {"train_loss": -6.091864585876465, "global_step": 69686, "epoch": 1659} {"train_loss": -5.925764560699463, "global_step": 69687, "epoch": 1659} {"train_loss": -6.0571699142456055, "global_step": 69688, "epoch": 1659} {"train_loss": -6.039888381958008, "global_step": 69689, "epoch": 1659} {"train_loss": -5.978479385375977, "global_step": 69690, "epoch": 1659} {"train_loss": -6.132572650909424, "global_step": 69691, "epoch": 1659} {"train_loss": -6.002784729003906, "global_step": 69692, "epoch": 1659} {"train_loss": -6.06548547744751, "global_step": 69693, "epoch": 1659} {"train_loss": -6.090988636016846, "global_step": 69694, "epoch": 1659} {"train_loss": -5.930891036987305, "global_step": 69695, "epoch": 1659} {"train_loss": -5.9648919105529785, "global_step": 69696, "epoch": 1659} {"train_loss": -6.0805463790893555, "global_step": 69697, "epoch": 1659} {"train_loss": -5.946394920349121, "global_step": 69698, "epoch": 1659} {"train_loss": -6.051712989807129, "global_step": 69699, "epoch": 1659} {"train_loss": -6.120576858520508, "global_step": 69700, "epoch": 1659} {"train_loss": -6.022038459777832, "global_step": 69701, "epoch": 1659} {"train_loss": -6.033877372741699, "global_step": 69702, "epoch": 1659} {"train_loss": -5.965928077697754, "global_step": 69703, "epoch": 1659} {"train_loss": -6.0137834548950195, "global_step": 69704, "epoch": 1659} {"train_loss": -6.028717041015625, "global_step": 69705, "epoch": 1659} {"train_loss": -6.127411365509033, "global_step": 69706, "epoch": 1659} {"train_loss": -6.068711280822754, "global_step": 69707, "epoch": 1659} {"train_loss": -6.013996124267578, "global_step": 69708, "epoch": 1659} {"train_loss": -6.033652305603027, "global_step": 69709, "epoch": 1659} {"train_loss": -6.001590251922607, "global_step": 69710, "epoch": 1659} {"train_loss": -6.116693496704102, "global_step": 69711, "epoch": 1659} {"train_loss": -6.061995983123779, "global_step": 69712, "epoch": 1659} {"train_loss": -6.011853218078613, "global_step": 69713, "epoch": 1659} {"train_loss": -5.844329833984375, "global_step": 69714, "epoch": 1659} {"train_loss": -5.995291709899902, "global_step": 69715, "epoch": 1659} {"train_loss": -6.037683486938477, "global_step": 69716, "epoch": 1659} {"train_loss": -6.002344131469727, "global_step": 69717, "epoch": 1659} {"train_loss": -5.962098598480225, "global_step": 69718, "epoch": 1659} {"train_loss": -6.027063642229352, "global_step": 69719, "epoch": 1659, "val_loss": 61814.65234375} {"train_loss": -6.086665153503418, "global_step": 69720, "epoch": 1660} {"train_loss": -6.083959579467773, "global_step": 69721, "epoch": 1660} {"train_loss": -6.095036506652832, "global_step": 69722, "epoch": 1660} {"train_loss": -6.0316643714904785, "global_step": 69723, "epoch": 1660} {"train_loss": -6.076575756072998, "global_step": 69724, "epoch": 1660} {"train_loss": -6.028697967529297, "global_step": 69725, "epoch": 1660} {"train_loss": -6.0704851150512695, "global_step": 69726, "epoch": 1660} {"train_loss": -6.088678359985352, "global_step": 69727, "epoch": 1660} {"train_loss": -6.164325714111328, "global_step": 69728, "epoch": 1660} {"train_loss": -5.961243629455566, "global_step": 69729, "epoch": 1660} {"train_loss": -5.987894058227539, "global_step": 69730, "epoch": 1660} {"train_loss": -6.0532917976379395, "global_step": 69731, "epoch": 1660} {"train_loss": -6.035663604736328, "global_step": 69732, "epoch": 1660} {"train_loss": -5.8482818603515625, "global_step": 69733, "epoch": 1660} {"train_loss": -5.93613338470459, "global_step": 69734, "epoch": 1660} {"train_loss": -6.010676383972168, "global_step": 69735, "epoch": 1660} {"train_loss": -5.851816177368164, "global_step": 69736, "epoch": 1660} {"train_loss": -6.071014881134033, "global_step": 69737, "epoch": 1660} {"train_loss": -5.974928855895996, "global_step": 69738, "epoch": 1660} {"train_loss": -5.997045516967773, "global_step": 69739, "epoch": 1660} {"train_loss": -6.116970062255859, "global_step": 69740, "epoch": 1660} {"train_loss": -6.07769775390625, "global_step": 69741, "epoch": 1660} {"train_loss": -5.929938316345215, "global_step": 69742, "epoch": 1660} {"train_loss": -6.030622959136963, "global_step": 69743, "epoch": 1660} {"train_loss": -6.086615085601807, "global_step": 69744, "epoch": 1660} {"train_loss": -5.976742744445801, "global_step": 69745, "epoch": 1660} {"train_loss": -5.957676887512207, "global_step": 69746, "epoch": 1660} {"train_loss": -6.0987868309021, "global_step": 69747, "epoch": 1660} {"train_loss": -5.931173801422119, "global_step": 69748, "epoch": 1660} {"train_loss": -6.07701301574707, "global_step": 69749, "epoch": 1660} {"train_loss": -6.085885524749756, "global_step": 69750, "epoch": 1660} {"train_loss": -5.92437744140625, "global_step": 69751, "epoch": 1660} {"train_loss": -5.897849082946777, "global_step": 69752, "epoch": 1660} {"train_loss": -5.766228675842285, "global_step": 69753, "epoch": 1660} {"train_loss": -5.928192615509033, "global_step": 69754, "epoch": 1660} {"train_loss": -6.079437255859375, "global_step": 69755, "epoch": 1660} {"train_loss": -5.795536994934082, "global_step": 69756, "epoch": 1660} {"train_loss": -6.004429817199707, "global_step": 69757, "epoch": 1660} {"train_loss": -5.917844295501709, "global_step": 69758, "epoch": 1660} {"train_loss": -5.835052490234375, "global_step": 69759, "epoch": 1660} {"train_loss": -6.054851531982422, "global_step": 69760, "epoch": 1660} {"train_loss": -6.000105233419509, "global_step": 69761, "epoch": 1660, "val_loss": 61766.1328125} {"train_loss": -5.995580196380615, "global_step": 69762, "epoch": 1661} {"train_loss": -5.9514312744140625, "global_step": 69763, "epoch": 1661} {"train_loss": -5.984443664550781, "global_step": 69764, "epoch": 1661} {"train_loss": -6.09885311126709, "global_step": 69765, "epoch": 1661} {"train_loss": -5.938108921051025, "global_step": 69766, "epoch": 1661} {"train_loss": -6.056695938110352, "global_step": 69767, "epoch": 1661} {"train_loss": -5.865994453430176, "global_step": 69768, "epoch": 1661} {"train_loss": -6.037407875061035, "global_step": 69769, "epoch": 1661} {"train_loss": -6.001609802246094, "global_step": 69770, "epoch": 1661} {"train_loss": -5.955644130706787, "global_step": 69771, "epoch": 1661} {"train_loss": -5.99920654296875, "global_step": 69772, "epoch": 1661} {"train_loss": -6.037411212921143, "global_step": 69773, "epoch": 1661} {"train_loss": -6.123680114746094, "global_step": 69774, "epoch": 1661} {"train_loss": -6.051741600036621, "global_step": 69775, "epoch": 1661} {"train_loss": -6.046477317810059, "global_step": 69776, "epoch": 1661} {"train_loss": -6.053789138793945, "global_step": 69777, "epoch": 1661} {"train_loss": -6.073215484619141, "global_step": 69778, "epoch": 1661} {"train_loss": -6.174822807312012, "global_step": 69779, "epoch": 1661} {"train_loss": -6.018071174621582, "global_step": 69780, "epoch": 1661} {"train_loss": -6.132445335388184, "global_step": 69781, "epoch": 1661} {"train_loss": -6.042846202850342, "global_step": 69782, "epoch": 1661} {"train_loss": -5.955494403839111, "global_step": 69783, "epoch": 1661} {"train_loss": -5.962344169616699, "global_step": 69784, "epoch": 1661} {"train_loss": -6.055844783782959, "global_step": 69785, "epoch": 1661} {"train_loss": -6.011974811553955, "global_step": 69786, "epoch": 1661} {"train_loss": -6.070376396179199, "global_step": 69787, "epoch": 1661} {"train_loss": -6.007966041564941, "global_step": 69788, "epoch": 1661} {"train_loss": -6.097894668579102, "global_step": 69789, "epoch": 1661} {"train_loss": -6.03150749206543, "global_step": 69790, "epoch": 1661} {"train_loss": -5.997932434082031, "global_step": 69791, "epoch": 1661} {"train_loss": -5.982146263122559, "global_step": 69792, "epoch": 1661} {"train_loss": -5.95588493347168, "global_step": 69793, "epoch": 1661} {"train_loss": -5.964018821716309, "global_step": 69794, "epoch": 1661} {"train_loss": -5.870105743408203, "global_step": 69795, "epoch": 1661} {"train_loss": -6.041806221008301, "global_step": 69796, "epoch": 1661} {"train_loss": -6.054228782653809, "global_step": 69797, "epoch": 1661} {"train_loss": -6.096899509429932, "global_step": 69798, "epoch": 1661} {"train_loss": -6.124677658081055, "global_step": 69799, "epoch": 1661} {"train_loss": -5.91899299621582, "global_step": 69800, "epoch": 1661} {"train_loss": -6.123019218444824, "global_step": 69801, "epoch": 1661} {"train_loss": -6.02644157409668, "global_step": 69802, "epoch": 1661} {"train_loss": -6.025105465026129, "global_step": 69803, "epoch": 1661, "val_loss": 61674.8359375} {"train_loss": -6.014804840087891, "global_step": 69804, "epoch": 1662} {"train_loss": -5.980928897857666, "global_step": 69805, "epoch": 1662} {"train_loss": -6.081176280975342, "global_step": 69806, "epoch": 1662} {"train_loss": -5.919391632080078, "global_step": 69807, "epoch": 1662} {"train_loss": -5.992095947265625, "global_step": 69808, "epoch": 1662} {"train_loss": -6.0455474853515625, "global_step": 69809, "epoch": 1662} {"train_loss": -6.007637023925781, "global_step": 69810, "epoch": 1662} {"train_loss": -6.147244930267334, "global_step": 69811, "epoch": 1662} {"train_loss": -5.985387802124023, "global_step": 69812, "epoch": 1662} {"train_loss": -6.025139808654785, "global_step": 69813, "epoch": 1662} {"train_loss": -6.103375434875488, "global_step": 69814, "epoch": 1662} {"train_loss": -6.069298267364502, "global_step": 69815, "epoch": 1662} {"train_loss": -5.931089401245117, "global_step": 69816, "epoch": 1662} {"train_loss": -6.038003444671631, "global_step": 69817, "epoch": 1662} {"train_loss": -6.049262046813965, "global_step": 69818, "epoch": 1662} {"train_loss": -6.152172088623047, "global_step": 69819, "epoch": 1662} {"train_loss": -6.020885467529297, "global_step": 69820, "epoch": 1662} {"train_loss": -6.143667221069336, "global_step": 69821, "epoch": 1662} {"train_loss": -6.02250862121582, "global_step": 69822, "epoch": 1662} {"train_loss": -6.132590293884277, "global_step": 69823, "epoch": 1662} {"train_loss": -5.983660697937012, "global_step": 69824, "epoch": 1662} {"train_loss": -6.050937652587891, "global_step": 69825, "epoch": 1662} {"train_loss": -5.954708099365234, "global_step": 69826, "epoch": 1662} {"train_loss": -6.126321792602539, "global_step": 69827, "epoch": 1662} {"train_loss": -5.971247673034668, "global_step": 69828, "epoch": 1662} {"train_loss": -6.1281280517578125, "global_step": 69829, "epoch": 1662} {"train_loss": -5.999938011169434, "global_step": 69830, "epoch": 1662} {"train_loss": -5.88582706451416, "global_step": 69831, "epoch": 1662} {"train_loss": -6.025819301605225, "global_step": 69832, "epoch": 1662} {"train_loss": -6.014878749847412, "global_step": 69833, "epoch": 1662} {"train_loss": -5.997532367706299, "global_step": 69834, "epoch": 1662} {"train_loss": -6.044129848480225, "global_step": 69835, "epoch": 1662} {"train_loss": -6.064520359039307, "global_step": 69836, "epoch": 1662} {"train_loss": -5.981093406677246, "global_step": 69837, "epoch": 1662} {"train_loss": -6.019181251525879, "global_step": 69838, "epoch": 1662} {"train_loss": -6.053075790405273, "global_step": 69839, "epoch": 1662} {"train_loss": -6.047677516937256, "global_step": 69840, "epoch": 1662} {"train_loss": -6.014872074127197, "global_step": 69841, "epoch": 1662} {"train_loss": -6.010586738586426, "global_step": 69842, "epoch": 1662} {"train_loss": -6.042585372924805, "global_step": 69843, "epoch": 1662} {"train_loss": -5.953309535980225, "global_step": 69844, "epoch": 1662} {"train_loss": -6.030425253368559, "global_step": 69845, "epoch": 1662, "val_loss": 61662.984375} {"train_loss": -6.017861843109131, "global_step": 69846, "epoch": 1663} {"train_loss": -6.10344123840332, "global_step": 69847, "epoch": 1663} {"train_loss": -6.0408406257629395, "global_step": 69848, "epoch": 1663} {"train_loss": -6.024089336395264, "global_step": 69849, "epoch": 1663} {"train_loss": -6.146869659423828, "global_step": 69850, "epoch": 1663} {"train_loss": -6.009449481964111, "global_step": 69851, "epoch": 1663} {"train_loss": -5.983316898345947, "global_step": 69852, "epoch": 1663} {"train_loss": -5.984167575836182, "global_step": 69853, "epoch": 1663} {"train_loss": -6.000869274139404, "global_step": 69854, "epoch": 1663} {"train_loss": -6.113679885864258, "global_step": 69855, "epoch": 1663} {"train_loss": -6.086933135986328, "global_step": 69856, "epoch": 1663} {"train_loss": -6.02192497253418, "global_step": 69857, "epoch": 1663} {"train_loss": -6.005670547485352, "global_step": 69858, "epoch": 1663} {"train_loss": -6.051840782165527, "global_step": 69859, "epoch": 1663} {"train_loss": -5.99130916595459, "global_step": 69860, "epoch": 1663} {"train_loss": -5.943497657775879, "global_step": 69861, "epoch": 1663} {"train_loss": -6.042877197265625, "global_step": 69862, "epoch": 1663} {"train_loss": -6.072281837463379, "global_step": 69863, "epoch": 1663} {"train_loss": -6.069754123687744, "global_step": 69864, "epoch": 1663} {"train_loss": -6.072902679443359, "global_step": 69865, "epoch": 1663} {"train_loss": -6.073617935180664, "global_step": 69866, "epoch": 1663} {"train_loss": -5.988912582397461, "global_step": 69867, "epoch": 1663} {"train_loss": -6.126624584197998, "global_step": 69868, "epoch": 1663} {"train_loss": -5.97214412689209, "global_step": 69869, "epoch": 1663} {"train_loss": -6.080954074859619, "global_step": 69870, "epoch": 1663} {"train_loss": -5.949885368347168, "global_step": 69871, "epoch": 1663} {"train_loss": -6.0565290451049805, "global_step": 69872, "epoch": 1663} {"train_loss": -5.986240386962891, "global_step": 69873, "epoch": 1663} {"train_loss": -6.058854103088379, "global_step": 69874, "epoch": 1663} {"train_loss": -6.124549388885498, "global_step": 69875, "epoch": 1663} {"train_loss": -5.971076488494873, "global_step": 69876, "epoch": 1663} {"train_loss": -5.86905574798584, "global_step": 69877, "epoch": 1663} {"train_loss": -6.100707054138184, "global_step": 69878, "epoch": 1663} {"train_loss": -6.03334379196167, "global_step": 69879, "epoch": 1663} {"train_loss": -6.013509750366211, "global_step": 69880, "epoch": 1663} {"train_loss": -6.016439437866211, "global_step": 69881, "epoch": 1663} {"train_loss": -5.965881824493408, "global_step": 69882, "epoch": 1663} {"train_loss": -5.954618453979492, "global_step": 69883, "epoch": 1663} {"train_loss": -5.975315570831299, "global_step": 69884, "epoch": 1663} {"train_loss": -6.063991546630859, "global_step": 69885, "epoch": 1663} {"train_loss": -5.946925163269043, "global_step": 69886, "epoch": 1663} {"train_loss": -6.026297796340216, "global_step": 69887, "epoch": 1663, "val_loss": 61608.09375} {"train_loss": -6.021426200866699, "global_step": 69888, "epoch": 1664} {"train_loss": -5.974273681640625, "global_step": 69889, "epoch": 1664} {"train_loss": -6.048482894897461, "global_step": 69890, "epoch": 1664} {"train_loss": -5.977680683135986, "global_step": 69891, "epoch": 1664} {"train_loss": -5.871866226196289, "global_step": 69892, "epoch": 1664} {"train_loss": -6.067625999450684, "global_step": 69893, "epoch": 1664} {"train_loss": -5.906116008758545, "global_step": 69894, "epoch": 1664} {"train_loss": -6.02080774307251, "global_step": 69895, "epoch": 1664} {"train_loss": -5.891241073608398, "global_step": 69896, "epoch": 1664} {"train_loss": -5.988390922546387, "global_step": 69897, "epoch": 1664} {"train_loss": -6.083586692810059, "global_step": 69898, "epoch": 1664} {"train_loss": -6.173982620239258, "global_step": 69899, "epoch": 1664} {"train_loss": -6.0883870124816895, "global_step": 69900, "epoch": 1664} {"train_loss": -6.1768035888671875, "global_step": 69901, "epoch": 1664} {"train_loss": -6.0959978103637695, "global_step": 69902, "epoch": 1664} {"train_loss": -6.101351737976074, "global_step": 69903, "epoch": 1664} {"train_loss": -6.000978946685791, "global_step": 69904, "epoch": 1664} {"train_loss": -6.047643184661865, "global_step": 69905, "epoch": 1664} {"train_loss": -6.097870826721191, "global_step": 69906, "epoch": 1664} {"train_loss": -5.9525041580200195, "global_step": 69907, "epoch": 1664} {"train_loss": -6.0030012130737305, "global_step": 69908, "epoch": 1664} {"train_loss": -6.017532825469971, "global_step": 69909, "epoch": 1664} {"train_loss": -5.947111129760742, "global_step": 69910, "epoch": 1664} {"train_loss": -5.925534248352051, "global_step": 69911, "epoch": 1664} {"train_loss": -6.14102840423584, "global_step": 69912, "epoch": 1664} {"train_loss": -6.0129241943359375, "global_step": 69913, "epoch": 1664} {"train_loss": -6.0238142013549805, "global_step": 69914, "epoch": 1664} {"train_loss": -6.026713848114014, "global_step": 69915, "epoch": 1664} {"train_loss": -5.961045265197754, "global_step": 69916, "epoch": 1664} {"train_loss": -5.904662132263184, "global_step": 69917, "epoch": 1664} {"train_loss": -6.024811744689941, "global_step": 69918, "epoch": 1664} {"train_loss": -5.980327606201172, "global_step": 69919, "epoch": 1664} {"train_loss": -5.87677001953125, "global_step": 69920, "epoch": 1664} {"train_loss": -6.126859664916992, "global_step": 69921, "epoch": 1664} {"train_loss": -6.046522617340088, "global_step": 69922, "epoch": 1664} {"train_loss": -5.8360185623168945, "global_step": 69923, "epoch": 1664} {"train_loss": -5.994932174682617, "global_step": 69924, "epoch": 1664} {"train_loss": -5.750357627868652, "global_step": 69925, "epoch": 1664} {"train_loss": -6.038291931152344, "global_step": 69926, "epoch": 1664} {"train_loss": -5.9361066818237305, "global_step": 69927, "epoch": 1664} {"train_loss": -5.946496963500977, "global_step": 69928, "epoch": 1664} {"train_loss": -6.006387619745164, "global_step": 69929, "epoch": 1664, "val_loss": 61789.22265625} {"train_loss": -5.951848030090332, "global_step": 69930, "epoch": 1665} {"train_loss": -6.0159010887146, "global_step": 69931, "epoch": 1665} {"train_loss": -6.03580379486084, "global_step": 69932, "epoch": 1665} {"train_loss": -6.050082206726074, "global_step": 69933, "epoch": 1665} {"train_loss": -5.9757232666015625, "global_step": 69934, "epoch": 1665} {"train_loss": -5.968640327453613, "global_step": 69935, "epoch": 1665} {"train_loss": -5.991194725036621, "global_step": 69936, "epoch": 1665} {"train_loss": -5.977719783782959, "global_step": 69937, "epoch": 1665} {"train_loss": -5.970766067504883, "global_step": 69938, "epoch": 1665} {"train_loss": -5.964420318603516, "global_step": 69939, "epoch": 1665} {"train_loss": -6.002192497253418, "global_step": 69940, "epoch": 1665} {"train_loss": -5.885833740234375, "global_step": 69941, "epoch": 1665} {"train_loss": -6.010228157043457, "global_step": 69942, "epoch": 1665} {"train_loss": -5.7822160720825195, "global_step": 69943, "epoch": 1665} {"train_loss": -5.962640285491943, "global_step": 69944, "epoch": 1665} {"train_loss": -5.910996437072754, "global_step": 69945, "epoch": 1665} {"train_loss": -5.829111099243164, "global_step": 69946, "epoch": 1665} {"train_loss": -5.980030059814453, "global_step": 69947, "epoch": 1665} {"train_loss": -5.949762344360352, "global_step": 69948, "epoch": 1665} {"train_loss": -6.082879066467285, "global_step": 69949, "epoch": 1665} {"train_loss": -5.858035087585449, "global_step": 69950, "epoch": 1665} {"train_loss": -5.903702735900879, "global_step": 69951, "epoch": 1665} {"train_loss": -6.037825107574463, "global_step": 69952, "epoch": 1665} {"train_loss": -6.008281230926514, "global_step": 69953, "epoch": 1665} {"train_loss": -6.042824745178223, "global_step": 69954, "epoch": 1665} {"train_loss": -5.984165191650391, "global_step": 69955, "epoch": 1665} {"train_loss": -6.058584690093994, "global_step": 69956, "epoch": 1665} {"train_loss": -6.061453342437744, "global_step": 69957, "epoch": 1665} {"train_loss": -6.08333683013916, "global_step": 69958, "epoch": 1665} {"train_loss": -6.119555473327637, "global_step": 69959, "epoch": 1665} {"train_loss": -6.085883140563965, "global_step": 69960, "epoch": 1665} {"train_loss": -5.999876976013184, "global_step": 69961, "epoch": 1665} {"train_loss": -6.026310920715332, "global_step": 69962, "epoch": 1665} {"train_loss": -6.013200283050537, "global_step": 69963, "epoch": 1665} {"train_loss": -6.078116416931152, "global_step": 69964, "epoch": 1665} {"train_loss": -5.963896751403809, "global_step": 69965, "epoch": 1665} {"train_loss": -6.060884952545166, "global_step": 69966, "epoch": 1665} {"train_loss": -5.977145671844482, "global_step": 69967, "epoch": 1665} {"train_loss": -5.879487037658691, "global_step": 69968, "epoch": 1665} {"train_loss": -6.017535209655762, "global_step": 69969, "epoch": 1665} {"train_loss": -5.958609104156494, "global_step": 69970, "epoch": 1665} {"train_loss": -5.988550356456211, "global_step": 69971, "epoch": 1665, "val_loss": 61480.9453125} {"train_loss": -6.055872917175293, "global_step": 69972, "epoch": 1666} {"train_loss": -6.002750396728516, "global_step": 69973, "epoch": 1666} {"train_loss": -6.104516506195068, "global_step": 69974, "epoch": 1666} {"train_loss": -6.096080780029297, "global_step": 69975, "epoch": 1666} {"train_loss": -6.075223445892334, "global_step": 69976, "epoch": 1666} {"train_loss": -6.095377445220947, "global_step": 69977, "epoch": 1666} {"train_loss": -5.988887310028076, "global_step": 69978, "epoch": 1666} {"train_loss": -6.058101177215576, "global_step": 69979, "epoch": 1666} {"train_loss": -6.128008842468262, "global_step": 69980, "epoch": 1666} {"train_loss": -6.026968479156494, "global_step": 69981, "epoch": 1666} {"train_loss": -6.112803936004639, "global_step": 69982, "epoch": 1666} {"train_loss": -5.970409393310547, "global_step": 69983, "epoch": 1666} {"train_loss": -5.941259860992432, "global_step": 69984, "epoch": 1666} {"train_loss": -5.935492515563965, "global_step": 69985, "epoch": 1666} {"train_loss": -5.92186975479126, "global_step": 69986, "epoch": 1666} {"train_loss": -5.915421485900879, "global_step": 69987, "epoch": 1666} {"train_loss": -6.105100631713867, "global_step": 69988, "epoch": 1666} {"train_loss": -6.039188385009766, "global_step": 69989, "epoch": 1666} {"train_loss": -6.001777648925781, "global_step": 69990, "epoch": 1666} {"train_loss": -5.9933857917785645, "global_step": 69991, "epoch": 1666} {"train_loss": -5.905138969421387, "global_step": 69992, "epoch": 1666} {"train_loss": -6.03997278213501, "global_step": 69993, "epoch": 1666} {"train_loss": -6.0320892333984375, "global_step": 69994, "epoch": 1666} {"train_loss": -5.955249786376953, "global_step": 69995, "epoch": 1666} {"train_loss": -6.047835350036621, "global_step": 69996, "epoch": 1666} {"train_loss": -6.014046669006348, "global_step": 69997, "epoch": 1666} {"train_loss": -6.111607074737549, "global_step": 69998, "epoch": 1666} {"train_loss": -6.0221405029296875, "global_step": 69999, "epoch": 1666} {"train_loss": -6.097075939178467, "global_step": 70000, "epoch": 1666} {"train_loss": -5.940988540649414, "global_step": 70001, "epoch": 1666} {"train_loss": -6.027401447296143, "global_step": 70002, "epoch": 1666} {"train_loss": -6.125728607177734, "global_step": 70003, "epoch": 1666} {"train_loss": -6.105630397796631, "global_step": 70004, "epoch": 1666} {"train_loss": -6.021823883056641, "global_step": 70005, "epoch": 1666} {"train_loss": -6.103254318237305, "global_step": 70006, "epoch": 1666} {"train_loss": -5.859346389770508, "global_step": 70007, "epoch": 1666} {"train_loss": -5.9430718421936035, "global_step": 70008, "epoch": 1666} {"train_loss": -5.950947284698486, "global_step": 70009, "epoch": 1666} {"train_loss": -5.965180397033691, "global_step": 70010, "epoch": 1666} {"train_loss": -6.004255294799805, "global_step": 70011, "epoch": 1666} {"train_loss": -6.084561824798584, "global_step": 70012, "epoch": 1666} {"train_loss": -6.02319842293149, "global_step": 70013, "epoch": 1666, "val_loss": 61864.3203125} {"train_loss": -5.987043857574463, "global_step": 70014, "epoch": 1667} {"train_loss": -6.070228576660156, "global_step": 70015, "epoch": 1667} {"train_loss": -6.020219802856445, "global_step": 70016, "epoch": 1667} {"train_loss": -6.0213470458984375, "global_step": 70017, "epoch": 1667} {"train_loss": -5.928751468658447, "global_step": 70018, "epoch": 1667} {"train_loss": -5.943702697753906, "global_step": 70019, "epoch": 1667} {"train_loss": -5.986142635345459, "global_step": 70020, "epoch": 1667} {"train_loss": -6.0082831382751465, "global_step": 70021, "epoch": 1667} {"train_loss": -5.991156578063965, "global_step": 70022, "epoch": 1667} {"train_loss": -6.0345845222473145, "global_step": 70023, "epoch": 1667} {"train_loss": -5.993022918701172, "global_step": 70024, "epoch": 1667} {"train_loss": -5.983160018920898, "global_step": 70025, "epoch": 1667} {"train_loss": -5.916266918182373, "global_step": 70026, "epoch": 1667} {"train_loss": -5.970208168029785, "global_step": 70027, "epoch": 1667} {"train_loss": -6.113225936889648, "global_step": 70028, "epoch": 1667} {"train_loss": -5.890690326690674, "global_step": 70029, "epoch": 1667} {"train_loss": -6.013420581817627, "global_step": 70030, "epoch": 1667} {"train_loss": -6.039941787719727, "global_step": 70031, "epoch": 1667} {"train_loss": -6.065715312957764, "global_step": 70032, "epoch": 1667} {"train_loss": -5.9305572509765625, "global_step": 70033, "epoch": 1667} {"train_loss": -6.054163455963135, "global_step": 70034, "epoch": 1667} {"train_loss": -5.899274826049805, "global_step": 70035, "epoch": 1667} {"train_loss": -6.082322120666504, "global_step": 70036, "epoch": 1667} {"train_loss": -6.146862030029297, "global_step": 70037, "epoch": 1667} {"train_loss": -5.997862339019775, "global_step": 70038, "epoch": 1667} {"train_loss": -6.071033000946045, "global_step": 70039, "epoch": 1667} {"train_loss": -6.005528450012207, "global_step": 70040, "epoch": 1667} {"train_loss": -6.130461692810059, "global_step": 70041, "epoch": 1667} {"train_loss": -6.072486400604248, "global_step": 70042, "epoch": 1667} {"train_loss": -6.009921073913574, "global_step": 70043, "epoch": 1667} {"train_loss": -6.026821136474609, "global_step": 70044, "epoch": 1667} {"train_loss": -6.0023674964904785, "global_step": 70045, "epoch": 1667} {"train_loss": -6.042961120605469, "global_step": 70046, "epoch": 1667} {"train_loss": -5.9981231689453125, "global_step": 70047, "epoch": 1667} {"train_loss": -6.089766502380371, "global_step": 70048, "epoch": 1667} {"train_loss": -6.032700538635254, "global_step": 70049, "epoch": 1667} {"train_loss": -6.15559196472168, "global_step": 70050, "epoch": 1667} {"train_loss": -6.0479817390441895, "global_step": 70051, "epoch": 1667} {"train_loss": -6.12004280090332, "global_step": 70052, "epoch": 1667} {"train_loss": -6.015439987182617, "global_step": 70053, "epoch": 1667} {"train_loss": -6.132613658905029, "global_step": 70054, "epoch": 1667} {"train_loss": -6.024231570107596, "global_step": 70055, "epoch": 1667, "val_loss": 61388.765625} {"train_loss": -6.0047712326049805, "global_step": 70056, "epoch": 1668} {"train_loss": -6.098658561706543, "global_step": 70057, "epoch": 1668} {"train_loss": -6.077461242675781, "global_step": 70058, "epoch": 1668} {"train_loss": -5.978322982788086, "global_step": 70059, "epoch": 1668} {"train_loss": -6.049945831298828, "global_step": 70060, "epoch": 1668} {"train_loss": -6.04164457321167, "global_step": 70061, "epoch": 1668} {"train_loss": -6.042004585266113, "global_step": 70062, "epoch": 1668} {"train_loss": -5.936008453369141, "global_step": 70063, "epoch": 1668} {"train_loss": -5.964109897613525, "global_step": 70064, "epoch": 1668} {"train_loss": -5.947684288024902, "global_step": 70065, "epoch": 1668} {"train_loss": -5.959445953369141, "global_step": 70066, "epoch": 1668} {"train_loss": -5.967044830322266, "global_step": 70067, "epoch": 1668} {"train_loss": -5.905198097229004, "global_step": 70068, "epoch": 1668} {"train_loss": -5.98936653137207, "global_step": 70069, "epoch": 1668} {"train_loss": -6.0724897384643555, "global_step": 70070, "epoch": 1668} {"train_loss": -5.884879112243652, "global_step": 70071, "epoch": 1668} {"train_loss": -5.942922592163086, "global_step": 70072, "epoch": 1668} {"train_loss": -6.011345863342285, "global_step": 70073, "epoch": 1668} {"train_loss": -6.068298816680908, "global_step": 70074, "epoch": 1668} {"train_loss": -5.977366924285889, "global_step": 70075, "epoch": 1668} {"train_loss": -6.133457183837891, "global_step": 70076, "epoch": 1668} {"train_loss": -6.031201362609863, "global_step": 70077, "epoch": 1668} {"train_loss": -6.078023910522461, "global_step": 70078, "epoch": 1668} {"train_loss": -5.956447124481201, "global_step": 70079, "epoch": 1668} {"train_loss": -6.043203353881836, "global_step": 70080, "epoch": 1668} {"train_loss": -6.161698818206787, "global_step": 70081, "epoch": 1668} {"train_loss": -5.944293975830078, "global_step": 70082, "epoch": 1668} {"train_loss": -6.01972770690918, "global_step": 70083, "epoch": 1668} {"train_loss": -6.021307945251465, "global_step": 70084, "epoch": 1668} {"train_loss": -5.997725963592529, "global_step": 70085, "epoch": 1668} {"train_loss": -6.059284210205078, "global_step": 70086, "epoch": 1668} {"train_loss": -6.095308303833008, "global_step": 70087, "epoch": 1668} {"train_loss": -6.084546089172363, "global_step": 70088, "epoch": 1668} {"train_loss": -6.0849809646606445, "global_step": 70089, "epoch": 1668} {"train_loss": -5.734956741333008, "global_step": 70090, "epoch": 1668} {"train_loss": -5.900754451751709, "global_step": 70091, "epoch": 1668} {"train_loss": -5.88977575302124, "global_step": 70092, "epoch": 1668} {"train_loss": -5.782014846801758, "global_step": 70093, "epoch": 1668} {"train_loss": -6.011319637298584, "global_step": 70094, "epoch": 1668} {"train_loss": -5.911323547363281, "global_step": 70095, "epoch": 1668} {"train_loss": -5.954679489135742, "global_step": 70096, "epoch": 1668} {"train_loss": -5.994029737654186, "global_step": 70097, "epoch": 1668, "val_loss": 61867.296875} {"train_loss": -6.063265800476074, "global_step": 70098, "epoch": 1669} {"train_loss": -5.962512969970703, "global_step": 70099, "epoch": 1669} {"train_loss": -5.877976894378662, "global_step": 70100, "epoch": 1669} {"train_loss": -6.005941867828369, "global_step": 70101, "epoch": 1669} {"train_loss": -5.936304092407227, "global_step": 70102, "epoch": 1669} {"train_loss": -6.046572685241699, "global_step": 70103, "epoch": 1669} {"train_loss": -5.959168434143066, "global_step": 70104, "epoch": 1669} {"train_loss": -6.069438934326172, "global_step": 70105, "epoch": 1669} {"train_loss": -5.972662925720215, "global_step": 70106, "epoch": 1669} {"train_loss": -6.008833885192871, "global_step": 70107, "epoch": 1669} {"train_loss": -5.824077606201172, "global_step": 70108, "epoch": 1669} {"train_loss": -5.964156627655029, "global_step": 70109, "epoch": 1669} {"train_loss": -5.951480865478516, "global_step": 70110, "epoch": 1669} {"train_loss": -6.129827499389648, "global_step": 70111, "epoch": 1669} {"train_loss": -6.056064605712891, "global_step": 70112, "epoch": 1669} {"train_loss": -5.980755805969238, "global_step": 70113, "epoch": 1669} {"train_loss": -5.99034309387207, "global_step": 70114, "epoch": 1669} {"train_loss": -6.139740943908691, "global_step": 70115, "epoch": 1669} {"train_loss": -6.0246734619140625, "global_step": 70116, "epoch": 1669} {"train_loss": -5.985395431518555, "global_step": 70117, "epoch": 1669} {"train_loss": -6.081738471984863, "global_step": 70118, "epoch": 1669} {"train_loss": -6.112457275390625, "global_step": 70119, "epoch": 1669} {"train_loss": -5.930651664733887, "global_step": 70120, "epoch": 1669} {"train_loss": -6.104727268218994, "global_step": 70121, "epoch": 1669} {"train_loss": -6.117330551147461, "global_step": 70122, "epoch": 1669} {"train_loss": -6.029153823852539, "global_step": 70123, "epoch": 1669} {"train_loss": -6.039005279541016, "global_step": 70124, "epoch": 1669} {"train_loss": -6.017003059387207, "global_step": 70125, "epoch": 1669} {"train_loss": -6.169363021850586, "global_step": 70126, "epoch": 1669} {"train_loss": -6.118931770324707, "global_step": 70127, "epoch": 1669} {"train_loss": -6.041985988616943, "global_step": 70128, "epoch": 1669} {"train_loss": -6.154567718505859, "global_step": 70129, "epoch": 1669} {"train_loss": -5.990217208862305, "global_step": 70130, "epoch": 1669} {"train_loss": -5.943309783935547, "global_step": 70131, "epoch": 1669} {"train_loss": -5.993275165557861, "global_step": 70132, "epoch": 1669} {"train_loss": -6.115394592285156, "global_step": 70133, "epoch": 1669} {"train_loss": -5.846297264099121, "global_step": 70134, "epoch": 1669} {"train_loss": -5.925683975219727, "global_step": 70135, "epoch": 1669} {"train_loss": -6.020383834838867, "global_step": 70136, "epoch": 1669} {"train_loss": -5.930275917053223, "global_step": 70137, "epoch": 1669} {"train_loss": -5.948850631713867, "global_step": 70138, "epoch": 1669} {"train_loss": -6.014911810557048, "global_step": 70139, "epoch": 1669, "val_loss": 61589.5546875} {"train_loss": -6.10273551940918, "global_step": 70140, "epoch": 1670} {"train_loss": -6.024745941162109, "global_step": 70141, "epoch": 1670} {"train_loss": -6.034107208251953, "global_step": 70142, "epoch": 1670} {"train_loss": -5.999460220336914, "global_step": 70143, "epoch": 1670} {"train_loss": -5.987610816955566, "global_step": 70144, "epoch": 1670} {"train_loss": -6.108539581298828, "global_step": 70145, "epoch": 1670} {"train_loss": -6.120238304138184, "global_step": 70146, "epoch": 1670} {"train_loss": -6.031352996826172, "global_step": 70147, "epoch": 1670} {"train_loss": -6.030126094818115, "global_step": 70148, "epoch": 1670} {"train_loss": -6.041625022888184, "global_step": 70149, "epoch": 1670} {"train_loss": -6.007537841796875, "global_step": 70150, "epoch": 1670} {"train_loss": -6.0446624755859375, "global_step": 70151, "epoch": 1670} {"train_loss": -6.118832111358643, "global_step": 70152, "epoch": 1670} {"train_loss": -6.1394853591918945, "global_step": 70153, "epoch": 1670} {"train_loss": -6.127664566040039, "global_step": 70154, "epoch": 1670} {"train_loss": -6.167342185974121, "global_step": 70155, "epoch": 1670} {"train_loss": -5.962882041931152, "global_step": 70156, "epoch": 1670} {"train_loss": -6.169119358062744, "global_step": 70157, "epoch": 1670} {"train_loss": -6.113828659057617, "global_step": 70158, "epoch": 1670} {"train_loss": -5.969654083251953, "global_step": 70159, "epoch": 1670} {"train_loss": -5.998655319213867, "global_step": 70160, "epoch": 1670} {"train_loss": -6.172877311706543, "global_step": 70161, "epoch": 1670} {"train_loss": -6.014014720916748, "global_step": 70162, "epoch": 1670} {"train_loss": -5.9188385009765625, "global_step": 70163, "epoch": 1670} {"train_loss": -6.030375957489014, "global_step": 70164, "epoch": 1670} {"train_loss": -6.132423400878906, "global_step": 70165, "epoch": 1670} {"train_loss": -6.102777004241943, "global_step": 70166, "epoch": 1670} {"train_loss": -6.170243263244629, "global_step": 70167, "epoch": 1670} {"train_loss": -6.1284332275390625, "global_step": 70168, "epoch": 1670} {"train_loss": -6.096675872802734, "global_step": 70169, "epoch": 1670} {"train_loss": -6.01618766784668, "global_step": 70170, "epoch": 1670} {"train_loss": -6.055354118347168, "global_step": 70171, "epoch": 1670} {"train_loss": -5.968180179595947, "global_step": 70172, "epoch": 1670} {"train_loss": -6.047478199005127, "global_step": 70173, "epoch": 1670} {"train_loss": -6.067090034484863, "global_step": 70174, "epoch": 1670} {"train_loss": -5.9536566734313965, "global_step": 70175, "epoch": 1670} {"train_loss": -6.043436050415039, "global_step": 70176, "epoch": 1670} {"train_loss": -6.038183689117432, "global_step": 70177, "epoch": 1670} {"train_loss": -6.051961421966553, "global_step": 70178, "epoch": 1670} {"train_loss": -5.932244777679443, "global_step": 70179, "epoch": 1670} {"train_loss": -6.073066234588623, "global_step": 70180, "epoch": 1670} {"train_loss": -6.0583081131889704, "global_step": 70181, "epoch": 1670, "val_loss": 61687.61328125} {"train_loss": -6.056148529052734, "global_step": 70182, "epoch": 1671} {"train_loss": -5.968227386474609, "global_step": 70183, "epoch": 1671} {"train_loss": -6.161659240722656, "global_step": 70184, "epoch": 1671} {"train_loss": -5.961979866027832, "global_step": 70185, "epoch": 1671} {"train_loss": -6.1492919921875, "global_step": 70186, "epoch": 1671} {"train_loss": -6.094071865081787, "global_step": 70187, "epoch": 1671} {"train_loss": -6.021767616271973, "global_step": 70188, "epoch": 1671} {"train_loss": -6.096017837524414, "global_step": 70189, "epoch": 1671} {"train_loss": -5.992066860198975, "global_step": 70190, "epoch": 1671} {"train_loss": -6.07745361328125, "global_step": 70191, "epoch": 1671} {"train_loss": -5.918520450592041, "global_step": 70192, "epoch": 1671} {"train_loss": -6.063084125518799, "global_step": 70193, "epoch": 1671} {"train_loss": -6.066089630126953, "global_step": 70194, "epoch": 1671} {"train_loss": -6.031031131744385, "global_step": 70195, "epoch": 1671} {"train_loss": -6.036760330200195, "global_step": 70196, "epoch": 1671} {"train_loss": -5.926301002502441, "global_step": 70197, "epoch": 1671} {"train_loss": -5.989130020141602, "global_step": 70198, "epoch": 1671} {"train_loss": -5.965656280517578, "global_step": 70199, "epoch": 1671} {"train_loss": -6.042747497558594, "global_step": 70200, "epoch": 1671} {"train_loss": -5.928188323974609, "global_step": 70201, "epoch": 1671} {"train_loss": -6.067178726196289, "global_step": 70202, "epoch": 1671} {"train_loss": -5.9357805252075195, "global_step": 70203, "epoch": 1671} {"train_loss": -5.92783784866333, "global_step": 70204, "epoch": 1671} {"train_loss": -5.9345316886901855, "global_step": 70205, "epoch": 1671} {"train_loss": -5.964766502380371, "global_step": 70206, "epoch": 1671} {"train_loss": -5.935832977294922, "global_step": 70207, "epoch": 1671} {"train_loss": -5.978516578674316, "global_step": 70208, "epoch": 1671} {"train_loss": -6.0401835441589355, "global_step": 70209, "epoch": 1671} {"train_loss": -5.986319065093994, "global_step": 70210, "epoch": 1671} {"train_loss": -6.008646488189697, "global_step": 70211, "epoch": 1671} {"train_loss": -5.979547500610352, "global_step": 70212, "epoch": 1671} {"train_loss": -5.986332893371582, "global_step": 70213, "epoch": 1671} {"train_loss": -6.0657196044921875, "global_step": 70214, "epoch": 1671} {"train_loss": -5.958041191101074, "global_step": 70215, "epoch": 1671} {"train_loss": -6.01246452331543, "global_step": 70216, "epoch": 1671} {"train_loss": -5.941305160522461, "global_step": 70217, "epoch": 1671} {"train_loss": -6.0010294914245605, "global_step": 70218, "epoch": 1671} {"train_loss": -6.026098728179932, "global_step": 70219, "epoch": 1671} {"train_loss": -5.975777626037598, "global_step": 70220, "epoch": 1671} {"train_loss": -6.009156227111816, "global_step": 70221, "epoch": 1671} {"train_loss": -6.0539045333862305, "global_step": 70222, "epoch": 1671} {"train_loss": -6.00665637425014, "global_step": 70223, "epoch": 1671, "val_loss": 61249.4453125} {"train_loss": -6.078352928161621, "global_step": 70224, "epoch": 1672} {"train_loss": -5.954070091247559, "global_step": 70225, "epoch": 1672} {"train_loss": -6.012747287750244, "global_step": 70226, "epoch": 1672} {"train_loss": -6.045722484588623, "global_step": 70227, "epoch": 1672} {"train_loss": -5.9703850746154785, "global_step": 70228, "epoch": 1672} {"train_loss": -6.036604881286621, "global_step": 70229, "epoch": 1672} {"train_loss": -5.977273941040039, "global_step": 70230, "epoch": 1672} {"train_loss": -6.009209632873535, "global_step": 70231, "epoch": 1672} {"train_loss": -6.143069267272949, "global_step": 70232, "epoch": 1672} {"train_loss": -6.003605842590332, "global_step": 70233, "epoch": 1672} {"train_loss": -5.985676288604736, "global_step": 70234, "epoch": 1672} {"train_loss": -5.976672649383545, "global_step": 70235, "epoch": 1672} {"train_loss": -6.011778831481934, "global_step": 70236, "epoch": 1672} {"train_loss": -5.939526081085205, "global_step": 70237, "epoch": 1672} {"train_loss": -6.094413757324219, "global_step": 70238, "epoch": 1672} {"train_loss": -5.9457550048828125, "global_step": 70239, "epoch": 1672} {"train_loss": -6.07753324508667, "global_step": 70240, "epoch": 1672} {"train_loss": -6.014050483703613, "global_step": 70241, "epoch": 1672} {"train_loss": -6.035355567932129, "global_step": 70242, "epoch": 1672} {"train_loss": -6.126351833343506, "global_step": 70243, "epoch": 1672} {"train_loss": -6.027285099029541, "global_step": 70244, "epoch": 1672} {"train_loss": -6.08983850479126, "global_step": 70245, "epoch": 1672} {"train_loss": -6.06742525100708, "global_step": 70246, "epoch": 1672} {"train_loss": -6.10498571395874, "global_step": 70247, "epoch": 1672} {"train_loss": -6.004439830780029, "global_step": 70248, "epoch": 1672} {"train_loss": -6.046454429626465, "global_step": 70249, "epoch": 1672} {"train_loss": -6.003195762634277, "global_step": 70250, "epoch": 1672} {"train_loss": -5.945571422576904, "global_step": 70251, "epoch": 1672} {"train_loss": -6.021602153778076, "global_step": 70252, "epoch": 1672} {"train_loss": -6.075697898864746, "global_step": 70253, "epoch": 1672} {"train_loss": -5.990172386169434, "global_step": 70254, "epoch": 1672} {"train_loss": -6.042732238769531, "global_step": 70255, "epoch": 1672} {"train_loss": -6.1353559494018555, "global_step": 70256, "epoch": 1672} {"train_loss": -5.9678192138671875, "global_step": 70257, "epoch": 1672} {"train_loss": -6.040672302246094, "global_step": 70258, "epoch": 1672} {"train_loss": -6.108935832977295, "global_step": 70259, "epoch": 1672} {"train_loss": -6.054375648498535, "global_step": 70260, "epoch": 1672} {"train_loss": -6.101536273956299, "global_step": 70261, "epoch": 1672} {"train_loss": -6.045132637023926, "global_step": 70262, "epoch": 1672} {"train_loss": -6.113011837005615, "global_step": 70263, "epoch": 1672} {"train_loss": -5.95198392868042, "global_step": 70264, "epoch": 1672} {"train_loss": -6.031564587638492, "global_step": 70265, "epoch": 1672, "val_loss": 61394.45703125} {"train_loss": -6.034727573394775, "global_step": 70266, "epoch": 1673} {"train_loss": -6.060172080993652, "global_step": 70267, "epoch": 1673} {"train_loss": -6.037813186645508, "global_step": 70268, "epoch": 1673} {"train_loss": -6.089094638824463, "global_step": 70269, "epoch": 1673} {"train_loss": -6.123908519744873, "global_step": 70270, "epoch": 1673} {"train_loss": -5.952460289001465, "global_step": 70271, "epoch": 1673} {"train_loss": -6.099092960357666, "global_step": 70272, "epoch": 1673} {"train_loss": -6.028470993041992, "global_step": 70273, "epoch": 1673} {"train_loss": -6.000733852386475, "global_step": 70274, "epoch": 1673} {"train_loss": -5.998939514160156, "global_step": 70275, "epoch": 1673} {"train_loss": -5.9821600914001465, "global_step": 70276, "epoch": 1673} {"train_loss": -5.935853958129883, "global_step": 70277, "epoch": 1673} {"train_loss": -6.205282211303711, "global_step": 70278, "epoch": 1673} {"train_loss": -6.0712785720825195, "global_step": 70279, "epoch": 1673} {"train_loss": -6.069331169128418, "global_step": 70280, "epoch": 1673} {"train_loss": -6.084184169769287, "global_step": 70281, "epoch": 1673} {"train_loss": -5.9466166496276855, "global_step": 70282, "epoch": 1673} {"train_loss": -6.035358428955078, "global_step": 70283, "epoch": 1673} {"train_loss": -6.055091857910156, "global_step": 70284, "epoch": 1673} {"train_loss": -6.067714214324951, "global_step": 70285, "epoch": 1673} {"train_loss": -6.045929908752441, "global_step": 70286, "epoch": 1673} {"train_loss": -5.9871087074279785, "global_step": 70287, "epoch": 1673} {"train_loss": -5.992948532104492, "global_step": 70288, "epoch": 1673} {"train_loss": -6.041175365447998, "global_step": 70289, "epoch": 1673} {"train_loss": -5.97797966003418, "global_step": 70290, "epoch": 1673} {"train_loss": -6.119389057159424, "global_step": 70291, "epoch": 1673} {"train_loss": -5.995109558105469, "global_step": 70292, "epoch": 1673} {"train_loss": -6.017369270324707, "global_step": 70293, "epoch": 1673} {"train_loss": -6.095072269439697, "global_step": 70294, "epoch": 1673} {"train_loss": -6.066303730010986, "global_step": 70295, "epoch": 1673} {"train_loss": -6.058505058288574, "global_step": 70296, "epoch": 1673} {"train_loss": -6.134002685546875, "global_step": 70297, "epoch": 1673} {"train_loss": -6.070283889770508, "global_step": 70298, "epoch": 1673} {"train_loss": -5.976900100708008, "global_step": 70299, "epoch": 1673} {"train_loss": -6.096233367919922, "global_step": 70300, "epoch": 1673} {"train_loss": -5.979565620422363, "global_step": 70301, "epoch": 1673} {"train_loss": -6.087096214294434, "global_step": 70302, "epoch": 1673} {"train_loss": -6.1238603591918945, "global_step": 70303, "epoch": 1673} {"train_loss": -5.885419845581055, "global_step": 70304, "epoch": 1673} {"train_loss": -6.065316677093506, "global_step": 70305, "epoch": 1673} {"train_loss": -6.1261491775512695, "global_step": 70306, "epoch": 1673} {"train_loss": -6.04610934711638, "global_step": 70307, "epoch": 1673, "val_loss": 61794.12109375} {"train_loss": -6.11604118347168, "global_step": 70308, "epoch": 1674} {"train_loss": -6.10386323928833, "global_step": 70309, "epoch": 1674} {"train_loss": -5.967995643615723, "global_step": 70310, "epoch": 1674} {"train_loss": -6.051165580749512, "global_step": 70311, "epoch": 1674} {"train_loss": -6.132777214050293, "global_step": 70312, "epoch": 1674} {"train_loss": -5.992649078369141, "global_step": 70313, "epoch": 1674} {"train_loss": -5.9827165603637695, "global_step": 70314, "epoch": 1674} {"train_loss": -5.990575313568115, "global_step": 70315, "epoch": 1674} {"train_loss": -6.124234199523926, "global_step": 70316, "epoch": 1674} {"train_loss": -5.989867210388184, "global_step": 70317, "epoch": 1674} {"train_loss": -6.137904644012451, "global_step": 70318, "epoch": 1674} {"train_loss": -6.115813255310059, "global_step": 70319, "epoch": 1674} {"train_loss": -6.13999080657959, "global_step": 70320, "epoch": 1674} {"train_loss": -6.0772552490234375, "global_step": 70321, "epoch": 1674} {"train_loss": -6.100124359130859, "global_step": 70322, "epoch": 1674} {"train_loss": -6.224429130554199, "global_step": 70323, "epoch": 1674} {"train_loss": -6.126408576965332, "global_step": 70324, "epoch": 1674} {"train_loss": -6.001439094543457, "global_step": 70325, "epoch": 1674} {"train_loss": -6.071727752685547, "global_step": 70326, "epoch": 1674} {"train_loss": -6.061173439025879, "global_step": 70327, "epoch": 1674} {"train_loss": -6.012311935424805, "global_step": 70328, "epoch": 1674} {"train_loss": -6.134327411651611, "global_step": 70329, "epoch": 1674} {"train_loss": -5.981855869293213, "global_step": 70330, "epoch": 1674} {"train_loss": -6.06983757019043, "global_step": 70331, "epoch": 1674} {"train_loss": -6.193624973297119, "global_step": 70332, "epoch": 1674} {"train_loss": -6.058046817779541, "global_step": 70333, "epoch": 1674} {"train_loss": -6.026796817779541, "global_step": 70334, "epoch": 1674} {"train_loss": -5.914562225341797, "global_step": 70335, "epoch": 1674} {"train_loss": -5.945305824279785, "global_step": 70336, "epoch": 1674} {"train_loss": -6.031830787658691, "global_step": 70337, "epoch": 1674} {"train_loss": -6.05538272857666, "global_step": 70338, "epoch": 1674} {"train_loss": -6.031143665313721, "global_step": 70339, "epoch": 1674} {"train_loss": -6.047450065612793, "global_step": 70340, "epoch": 1674} {"train_loss": -6.02055549621582, "global_step": 70341, "epoch": 1674} {"train_loss": -6.072196960449219, "global_step": 70342, "epoch": 1674} {"train_loss": -5.9840006828308105, "global_step": 70343, "epoch": 1674} {"train_loss": -5.95854377746582, "global_step": 70344, "epoch": 1674} {"train_loss": -6.116851806640625, "global_step": 70345, "epoch": 1674} {"train_loss": -5.974767684936523, "global_step": 70346, "epoch": 1674} {"train_loss": -6.118045330047607, "global_step": 70347, "epoch": 1674} {"train_loss": -6.025935649871826, "global_step": 70348, "epoch": 1674} {"train_loss": -6.054497219267345, "global_step": 70349, "epoch": 1674, "val_loss": 61577.9921875} {"train_loss": -6.0254621505737305, "global_step": 70350, "epoch": 1675} {"train_loss": -6.082968711853027, "global_step": 70351, "epoch": 1675} {"train_loss": -5.921982288360596, "global_step": 70352, "epoch": 1675} {"train_loss": -6.026149749755859, "global_step": 70353, "epoch": 1675} {"train_loss": -6.0438995361328125, "global_step": 70354, "epoch": 1675} {"train_loss": -5.816989421844482, "global_step": 70355, "epoch": 1675} {"train_loss": -6.151022911071777, "global_step": 70356, "epoch": 1675} {"train_loss": -5.8949294090271, "global_step": 70357, "epoch": 1675} {"train_loss": -5.912524223327637, "global_step": 70358, "epoch": 1675} {"train_loss": -6.129430770874023, "global_step": 70359, "epoch": 1675} {"train_loss": -5.916898727416992, "global_step": 70360, "epoch": 1675} {"train_loss": -5.958171844482422, "global_step": 70361, "epoch": 1675} {"train_loss": -5.98474645614624, "global_step": 70362, "epoch": 1675} {"train_loss": -6.004846572875977, "global_step": 70363, "epoch": 1675} {"train_loss": -6.049867153167725, "global_step": 70364, "epoch": 1675} {"train_loss": -6.042261123657227, "global_step": 70365, "epoch": 1675} {"train_loss": -5.995056629180908, "global_step": 70366, "epoch": 1675} {"train_loss": -6.001474380493164, "global_step": 70367, "epoch": 1675} {"train_loss": -5.974241256713867, "global_step": 70368, "epoch": 1675} {"train_loss": -6.096518516540527, "global_step": 70369, "epoch": 1675} {"train_loss": -6.048760890960693, "global_step": 70370, "epoch": 1675} {"train_loss": -6.002468109130859, "global_step": 70371, "epoch": 1675} {"train_loss": -6.091806411743164, "global_step": 70372, "epoch": 1675} {"train_loss": -6.193216323852539, "global_step": 70373, "epoch": 1675} {"train_loss": -5.920248985290527, "global_step": 70374, "epoch": 1675} {"train_loss": -6.09759521484375, "global_step": 70375, "epoch": 1675} {"train_loss": -5.973000526428223, "global_step": 70376, "epoch": 1675} {"train_loss": -5.900312900543213, "global_step": 70377, "epoch": 1675} {"train_loss": -5.9747209548950195, "global_step": 70378, "epoch": 1675} {"train_loss": -5.999410629272461, "global_step": 70379, "epoch": 1675} {"train_loss": -6.040285587310791, "global_step": 70380, "epoch": 1675} {"train_loss": -5.956537246704102, "global_step": 70381, "epoch": 1675} {"train_loss": -5.931950569152832, "global_step": 70382, "epoch": 1675} {"train_loss": -5.969515323638916, "global_step": 70383, "epoch": 1675} {"train_loss": -5.981209754943848, "global_step": 70384, "epoch": 1675} {"train_loss": -6.1426825523376465, "global_step": 70385, "epoch": 1675} {"train_loss": -5.990845203399658, "global_step": 70386, "epoch": 1675} {"train_loss": -5.9316792488098145, "global_step": 70387, "epoch": 1675} {"train_loss": -6.075437545776367, "global_step": 70388, "epoch": 1675} {"train_loss": -5.9708685874938965, "global_step": 70389, "epoch": 1675} {"train_loss": -6.042193412780762, "global_step": 70390, "epoch": 1675} {"train_loss": -6.006653354281471, "global_step": 70391, "epoch": 1675, "val_loss": 61673.2890625} {"train_loss": -6.019953727722168, "global_step": 70392, "epoch": 1676} {"train_loss": -6.0731201171875, "global_step": 70393, "epoch": 1676} {"train_loss": -5.964327812194824, "global_step": 70394, "epoch": 1676} {"train_loss": -5.899414539337158, "global_step": 70395, "epoch": 1676} {"train_loss": -5.9626288414001465, "global_step": 70396, "epoch": 1676} {"train_loss": -6.004509925842285, "global_step": 70397, "epoch": 1676} {"train_loss": -6.057854652404785, "global_step": 70398, "epoch": 1676} {"train_loss": -6.074034690856934, "global_step": 70399, "epoch": 1676} {"train_loss": -6.02992582321167, "global_step": 70400, "epoch": 1676} {"train_loss": -6.010931968688965, "global_step": 70401, "epoch": 1676} {"train_loss": -6.0377912521362305, "global_step": 70402, "epoch": 1676} {"train_loss": -6.120230674743652, "global_step": 70403, "epoch": 1676} {"train_loss": -6.109537601470947, "global_step": 70404, "epoch": 1676} {"train_loss": -5.926673889160156, "global_step": 70405, "epoch": 1676} {"train_loss": -6.03550910949707, "global_step": 70406, "epoch": 1676} {"train_loss": -6.009477138519287, "global_step": 70407, "epoch": 1676} {"train_loss": -6.037791728973389, "global_step": 70408, "epoch": 1676} {"train_loss": -5.999289512634277, "global_step": 70409, "epoch": 1676} {"train_loss": -5.9142303466796875, "global_step": 70410, "epoch": 1676} {"train_loss": -6.103580474853516, "global_step": 70411, "epoch": 1676} {"train_loss": -5.9758148193359375, "global_step": 70412, "epoch": 1676} {"train_loss": -6.067420959472656, "global_step": 70413, "epoch": 1676} {"train_loss": -5.958288192749023, "global_step": 70414, "epoch": 1676} {"train_loss": -5.989223957061768, "global_step": 70415, "epoch": 1676} {"train_loss": -6.042508125305176, "global_step": 70416, "epoch": 1676} {"train_loss": -5.96467399597168, "global_step": 70417, "epoch": 1676} {"train_loss": -6.020273685455322, "global_step": 70418, "epoch": 1676} {"train_loss": -5.986324310302734, "global_step": 70419, "epoch": 1676} {"train_loss": -6.008167266845703, "global_step": 70420, "epoch": 1676} {"train_loss": -6.065064430236816, "global_step": 70421, "epoch": 1676} {"train_loss": -6.0456109046936035, "global_step": 70422, "epoch": 1676} {"train_loss": -6.10566520690918, "global_step": 70423, "epoch": 1676} {"train_loss": -6.029579162597656, "global_step": 70424, "epoch": 1676} {"train_loss": -6.086350440979004, "global_step": 70425, "epoch": 1676} {"train_loss": -6.18265962600708, "global_step": 70426, "epoch": 1676} {"train_loss": -5.991441249847412, "global_step": 70427, "epoch": 1676} {"train_loss": -6.1088409423828125, "global_step": 70428, "epoch": 1676} {"train_loss": -6.008790969848633, "global_step": 70429, "epoch": 1676} {"train_loss": -6.002904891967773, "global_step": 70430, "epoch": 1676} {"train_loss": -6.0629658699035645, "global_step": 70431, "epoch": 1676} {"train_loss": -6.09589147567749, "global_step": 70432, "epoch": 1676} {"train_loss": -6.0308925197238015, "global_step": 70433, "epoch": 1676, "val_loss": 61589.19921875} {"train_loss": -6.040261268615723, "global_step": 70434, "epoch": 1677} {"train_loss": -6.123671531677246, "global_step": 70435, "epoch": 1677} {"train_loss": -6.05248498916626, "global_step": 70436, "epoch": 1677} {"train_loss": -6.055941581726074, "global_step": 70437, "epoch": 1677} {"train_loss": -5.956937789916992, "global_step": 70438, "epoch": 1677} {"train_loss": -6.120490074157715, "global_step": 70439, "epoch": 1677} {"train_loss": -6.154359817504883, "global_step": 70440, "epoch": 1677} {"train_loss": -6.062997817993164, "global_step": 70441, "epoch": 1677} {"train_loss": -6.010349273681641, "global_step": 70442, "epoch": 1677} {"train_loss": -6.159101486206055, "global_step": 70443, "epoch": 1677} {"train_loss": -6.011127471923828, "global_step": 70444, "epoch": 1677} {"train_loss": -6.065722465515137, "global_step": 70445, "epoch": 1677} {"train_loss": -6.047817230224609, "global_step": 70446, "epoch": 1677} {"train_loss": -5.825486183166504, "global_step": 70447, "epoch": 1677} {"train_loss": -6.035004138946533, "global_step": 70448, "epoch": 1677} {"train_loss": -6.0555877685546875, "global_step": 70449, "epoch": 1677} {"train_loss": -6.105228900909424, "global_step": 70450, "epoch": 1677} {"train_loss": -6.117847442626953, "global_step": 70451, "epoch": 1677} {"train_loss": -6.000317573547363, "global_step": 70452, "epoch": 1677} {"train_loss": -6.094657897949219, "global_step": 70453, "epoch": 1677} {"train_loss": -6.107609748840332, "global_step": 70454, "epoch": 1677} {"train_loss": -6.100032806396484, "global_step": 70455, "epoch": 1677} {"train_loss": -6.01136589050293, "global_step": 70456, "epoch": 1677} {"train_loss": -5.929464817047119, "global_step": 70457, "epoch": 1677} {"train_loss": -5.902706146240234, "global_step": 70458, "epoch": 1677} {"train_loss": -6.004589080810547, "global_step": 70459, "epoch": 1677} {"train_loss": -6.034430503845215, "global_step": 70460, "epoch": 1677} {"train_loss": -6.098169326782227, "global_step": 70461, "epoch": 1677} {"train_loss": -5.923832893371582, "global_step": 70462, "epoch": 1677} {"train_loss": -6.1279754638671875, "global_step": 70463, "epoch": 1677} {"train_loss": -6.004961013793945, "global_step": 70464, "epoch": 1677} {"train_loss": -5.940667629241943, "global_step": 70465, "epoch": 1677} {"train_loss": -6.01144552230835, "global_step": 70466, "epoch": 1677} {"train_loss": -5.917200565338135, "global_step": 70467, "epoch": 1677} {"train_loss": -5.950122833251953, "global_step": 70468, "epoch": 1677} {"train_loss": -5.924106121063232, "global_step": 70469, "epoch": 1677} {"train_loss": -5.97736930847168, "global_step": 70470, "epoch": 1677} {"train_loss": -5.8846282958984375, "global_step": 70471, "epoch": 1677} {"train_loss": -6.104236602783203, "global_step": 70472, "epoch": 1677} {"train_loss": -5.987734317779541, "global_step": 70473, "epoch": 1677} {"train_loss": -5.923422336578369, "global_step": 70474, "epoch": 1677} {"train_loss": -6.02499152365185, "global_step": 70475, "epoch": 1677, "val_loss": 61766.6640625} {"train_loss": -6.001682281494141, "global_step": 70476, "epoch": 1678} {"train_loss": -5.889513969421387, "global_step": 70477, "epoch": 1678} {"train_loss": -5.965221405029297, "global_step": 70478, "epoch": 1678} {"train_loss": -5.9072585105896, "global_step": 70479, "epoch": 1678} {"train_loss": -6.006169319152832, "global_step": 70480, "epoch": 1678} {"train_loss": -6.063908576965332, "global_step": 70481, "epoch": 1678} {"train_loss": -5.959492206573486, "global_step": 70482, "epoch": 1678} {"train_loss": -6.00158166885376, "global_step": 70483, "epoch": 1678} {"train_loss": -5.916272163391113, "global_step": 70484, "epoch": 1678} {"train_loss": -5.903510570526123, "global_step": 70485, "epoch": 1678} {"train_loss": -6.0226216316223145, "global_step": 70486, "epoch": 1678} {"train_loss": -6.020890712738037, "global_step": 70487, "epoch": 1678} {"train_loss": -6.007594108581543, "global_step": 70488, "epoch": 1678} {"train_loss": -6.0748138427734375, "global_step": 70489, "epoch": 1678} {"train_loss": -6.024727821350098, "global_step": 70490, "epoch": 1678} {"train_loss": -5.955388069152832, "global_step": 70491, "epoch": 1678} {"train_loss": -6.120114326477051, "global_step": 70492, "epoch": 1678} {"train_loss": -6.100700855255127, "global_step": 70493, "epoch": 1678} {"train_loss": -6.135797500610352, "global_step": 70494, "epoch": 1678} {"train_loss": -6.090709686279297, "global_step": 70495, "epoch": 1678} {"train_loss": -5.983617782592773, "global_step": 70496, "epoch": 1678} {"train_loss": -6.082557678222656, "global_step": 70497, "epoch": 1678} {"train_loss": -5.946023464202881, "global_step": 70498, "epoch": 1678} {"train_loss": -6.168772220611572, "global_step": 70499, "epoch": 1678} {"train_loss": -6.108057975769043, "global_step": 70500, "epoch": 1678} {"train_loss": -5.911536693572998, "global_step": 70501, "epoch": 1678} {"train_loss": -5.970162868499756, "global_step": 70502, "epoch": 1678} {"train_loss": -5.9655866622924805, "global_step": 70503, "epoch": 1678} {"train_loss": -5.944736480712891, "global_step": 70504, "epoch": 1678} {"train_loss": -5.984492778778076, "global_step": 70505, "epoch": 1678} {"train_loss": -6.061208724975586, "global_step": 70506, "epoch": 1678} {"train_loss": -6.047517776489258, "global_step": 70507, "epoch": 1678} {"train_loss": -6.129998207092285, "global_step": 70508, "epoch": 1678} {"train_loss": -6.129319190979004, "global_step": 70509, "epoch": 1678} {"train_loss": -6.033603668212891, "global_step": 70510, "epoch": 1678} {"train_loss": -6.098780155181885, "global_step": 70511, "epoch": 1678} {"train_loss": -5.8302812576293945, "global_step": 70512, "epoch": 1678} {"train_loss": -5.999253273010254, "global_step": 70513, "epoch": 1678} {"train_loss": -6.101169586181641, "global_step": 70514, "epoch": 1678} {"train_loss": -5.981853008270264, "global_step": 70515, "epoch": 1678} {"train_loss": -6.150577545166016, "global_step": 70516, "epoch": 1678} {"train_loss": -6.019893430528187, "global_step": 70517, "epoch": 1678, "val_loss": 61582.66796875} {"train_loss": -6.060347080230713, "global_step": 70518, "epoch": 1679} {"train_loss": -5.979196548461914, "global_step": 70519, "epoch": 1679} {"train_loss": -5.952558517456055, "global_step": 70520, "epoch": 1679} {"train_loss": -6.094697952270508, "global_step": 70521, "epoch": 1679} {"train_loss": -6.062111854553223, "global_step": 70522, "epoch": 1679} {"train_loss": -6.087956428527832, "global_step": 70523, "epoch": 1679} {"train_loss": -6.068271160125732, "global_step": 70524, "epoch": 1679} {"train_loss": -6.120755672454834, "global_step": 70525, "epoch": 1679} {"train_loss": -6.050647735595703, "global_step": 70526, "epoch": 1679} {"train_loss": -6.017077445983887, "global_step": 70527, "epoch": 1679} {"train_loss": -6.035698413848877, "global_step": 70528, "epoch": 1679} {"train_loss": -6.105435371398926, "global_step": 70529, "epoch": 1679} {"train_loss": -6.114301681518555, "global_step": 70530, "epoch": 1679} {"train_loss": -6.009172439575195, "global_step": 70531, "epoch": 1679} {"train_loss": -6.0266523361206055, "global_step": 70532, "epoch": 1679} {"train_loss": -6.054764270782471, "global_step": 70533, "epoch": 1679} {"train_loss": -6.054964065551758, "global_step": 70534, "epoch": 1679} {"train_loss": -6.037537574768066, "global_step": 70535, "epoch": 1679} {"train_loss": -6.120199203491211, "global_step": 70536, "epoch": 1679} {"train_loss": -6.028733730316162, "global_step": 70537, "epoch": 1679} {"train_loss": -6.02740478515625, "global_step": 70538, "epoch": 1679} {"train_loss": -5.905694961547852, "global_step": 70539, "epoch": 1679} {"train_loss": -5.981938362121582, "global_step": 70540, "epoch": 1679} {"train_loss": -6.120494842529297, "global_step": 70541, "epoch": 1679} {"train_loss": -5.998987197875977, "global_step": 70542, "epoch": 1679} {"train_loss": -5.946704864501953, "global_step": 70543, "epoch": 1679} {"train_loss": -6.043280124664307, "global_step": 70544, "epoch": 1679} {"train_loss": -5.879979133605957, "global_step": 70545, "epoch": 1679} {"train_loss": -6.008754730224609, "global_step": 70546, "epoch": 1679} {"train_loss": -6.023164749145508, "global_step": 70547, "epoch": 1679} {"train_loss": -5.922001838684082, "global_step": 70548, "epoch": 1679} {"train_loss": -5.980068206787109, "global_step": 70549, "epoch": 1679} {"train_loss": -6.00107479095459, "global_step": 70550, "epoch": 1679} {"train_loss": -5.889403343200684, "global_step": 70551, "epoch": 1679} {"train_loss": -6.021015167236328, "global_step": 70552, "epoch": 1679} {"train_loss": -6.155486106872559, "global_step": 70553, "epoch": 1679} {"train_loss": -5.999476432800293, "global_step": 70554, "epoch": 1679} {"train_loss": -6.037039756774902, "global_step": 70555, "epoch": 1679} {"train_loss": -5.976391792297363, "global_step": 70556, "epoch": 1679} {"train_loss": -5.940174579620361, "global_step": 70557, "epoch": 1679} {"train_loss": -6.018389701843262, "global_step": 70558, "epoch": 1679} {"train_loss": -6.0266134057726175, "global_step": 70559, "epoch": 1679, "val_loss": 61968.7265625} {"train_loss": -5.903201580047607, "global_step": 70560, "epoch": 1680} {"train_loss": -5.972555160522461, "global_step": 70561, "epoch": 1680} {"train_loss": -6.067379951477051, "global_step": 70562, "epoch": 1680} {"train_loss": -6.044251441955566, "global_step": 70563, "epoch": 1680} {"train_loss": -6.001993179321289, "global_step": 70564, "epoch": 1680} {"train_loss": -6.047965049743652, "global_step": 70565, "epoch": 1680} {"train_loss": -5.900145053863525, "global_step": 70566, "epoch": 1680} {"train_loss": -5.954599380493164, "global_step": 70567, "epoch": 1680} {"train_loss": -6.08519172668457, "global_step": 70568, "epoch": 1680} {"train_loss": -5.970947742462158, "global_step": 70569, "epoch": 1680} {"train_loss": -6.0730180740356445, "global_step": 70570, "epoch": 1680} {"train_loss": -6.057287216186523, "global_step": 70571, "epoch": 1680} {"train_loss": -6.002154350280762, "global_step": 70572, "epoch": 1680} {"train_loss": -6.0599565505981445, "global_step": 70573, "epoch": 1680} {"train_loss": -6.005556106567383, "global_step": 70574, "epoch": 1680} {"train_loss": -5.940191745758057, "global_step": 70575, "epoch": 1680} {"train_loss": -6.044165134429932, "global_step": 70576, "epoch": 1680} {"train_loss": -6.033378601074219, "global_step": 70577, "epoch": 1680} {"train_loss": -5.934964656829834, "global_step": 70578, "epoch": 1680} {"train_loss": -5.967868804931641, "global_step": 70579, "epoch": 1680} {"train_loss": -6.0357255935668945, "global_step": 70580, "epoch": 1680} {"train_loss": -5.8335161209106445, "global_step": 70581, "epoch": 1680} {"train_loss": -5.925504207611084, "global_step": 70582, "epoch": 1680} {"train_loss": -5.991570472717285, "global_step": 70583, "epoch": 1680} {"train_loss": -5.981019973754883, "global_step": 70584, "epoch": 1680} {"train_loss": -6.013877868652344, "global_step": 70585, "epoch": 1680} {"train_loss": -5.895678520202637, "global_step": 70586, "epoch": 1680} {"train_loss": -5.958566665649414, "global_step": 70587, "epoch": 1680} {"train_loss": -5.803582191467285, "global_step": 70588, "epoch": 1680} {"train_loss": -5.86483097076416, "global_step": 70589, "epoch": 1680} {"train_loss": -5.891037940979004, "global_step": 70590, "epoch": 1680} {"train_loss": -5.892237186431885, "global_step": 70591, "epoch": 1680} {"train_loss": -6.180076599121094, "global_step": 70592, "epoch": 1680} {"train_loss": -5.806523323059082, "global_step": 70593, "epoch": 1680} {"train_loss": -6.02202033996582, "global_step": 70594, "epoch": 1680} {"train_loss": -6.024355411529541, "global_step": 70595, "epoch": 1680} {"train_loss": -5.869441032409668, "global_step": 70596, "epoch": 1680} {"train_loss": -6.009927749633789, "global_step": 70597, "epoch": 1680} {"train_loss": -5.910614967346191, "global_step": 70598, "epoch": 1680} {"train_loss": -6.053264617919922, "global_step": 70599, "epoch": 1680} {"train_loss": -5.906346321105957, "global_step": 70600, "epoch": 1680} {"train_loss": -5.974840629668463, "global_step": 70601, "epoch": 1680, "val_loss": 61882.28125} {"train_loss": -5.930109024047852, "global_step": 70602, "epoch": 1681} {"train_loss": -5.90278434753418, "global_step": 70603, "epoch": 1681} {"train_loss": -6.124356746673584, "global_step": 70604, "epoch": 1681} {"train_loss": -6.02174186706543, "global_step": 70605, "epoch": 1681} {"train_loss": -5.987392902374268, "global_step": 70606, "epoch": 1681} {"train_loss": -6.222718715667725, "global_step": 70607, "epoch": 1681} {"train_loss": -5.939816474914551, "global_step": 70608, "epoch": 1681} {"train_loss": -6.040440559387207, "global_step": 70609, "epoch": 1681} {"train_loss": -6.006688117980957, "global_step": 70610, "epoch": 1681} {"train_loss": -5.934037208557129, "global_step": 70611, "epoch": 1681} {"train_loss": -5.956907749176025, "global_step": 70612, "epoch": 1681} {"train_loss": -5.9770965576171875, "global_step": 70613, "epoch": 1681} {"train_loss": -5.974472999572754, "global_step": 70614, "epoch": 1681} {"train_loss": -6.101226806640625, "global_step": 70615, "epoch": 1681} {"train_loss": -6.060492038726807, "global_step": 70616, "epoch": 1681} {"train_loss": -6.0375165939331055, "global_step": 70617, "epoch": 1681} {"train_loss": -6.0633134841918945, "global_step": 70618, "epoch": 1681} {"train_loss": -5.950898170471191, "global_step": 70619, "epoch": 1681} {"train_loss": -6.0093889236450195, "global_step": 70620, "epoch": 1681} {"train_loss": -6.205880165100098, "global_step": 70621, "epoch": 1681} {"train_loss": -6.059708118438721, "global_step": 70622, "epoch": 1681} {"train_loss": -6.07437801361084, "global_step": 70623, "epoch": 1681} {"train_loss": -6.0520548820495605, "global_step": 70624, "epoch": 1681} {"train_loss": -6.081614971160889, "global_step": 70625, "epoch": 1681} {"train_loss": -6.1233625411987305, "global_step": 70626, "epoch": 1681} {"train_loss": -5.935556411743164, "global_step": 70627, "epoch": 1681} {"train_loss": -6.166633129119873, "global_step": 70628, "epoch": 1681} {"train_loss": -5.997082233428955, "global_step": 70629, "epoch": 1681} {"train_loss": -6.006592750549316, "global_step": 70630, "epoch": 1681} {"train_loss": -6.095940589904785, "global_step": 70631, "epoch": 1681} {"train_loss": -6.034046649932861, "global_step": 70632, "epoch": 1681} {"train_loss": -5.874322891235352, "global_step": 70633, "epoch": 1681} {"train_loss": -6.005731582641602, "global_step": 70634, "epoch": 1681} {"train_loss": -5.967929840087891, "global_step": 70635, "epoch": 1681} {"train_loss": -6.019542694091797, "global_step": 70636, "epoch": 1681} {"train_loss": -5.951194763183594, "global_step": 70637, "epoch": 1681} {"train_loss": -5.918259620666504, "global_step": 70638, "epoch": 1681} {"train_loss": -5.963549613952637, "global_step": 70639, "epoch": 1681} {"train_loss": -5.906936168670654, "global_step": 70640, "epoch": 1681} {"train_loss": -5.923059463500977, "global_step": 70641, "epoch": 1681} {"train_loss": -5.938352584838867, "global_step": 70642, "epoch": 1681} {"train_loss": -6.009280692963373, "global_step": 70643, "epoch": 1681, "val_loss": 61987.32421875} {"train_loss": -6.027460098266602, "global_step": 70644, "epoch": 1682} {"train_loss": -6.093837738037109, "global_step": 70645, "epoch": 1682} {"train_loss": -6.030119895935059, "global_step": 70646, "epoch": 1682} {"train_loss": -5.96065616607666, "global_step": 70647, "epoch": 1682} {"train_loss": -6.011699676513672, "global_step": 70648, "epoch": 1682} {"train_loss": -5.998290061950684, "global_step": 70649, "epoch": 1682} {"train_loss": -6.088988304138184, "global_step": 70650, "epoch": 1682} {"train_loss": -6.048346996307373, "global_step": 70651, "epoch": 1682} {"train_loss": -5.925212860107422, "global_step": 70652, "epoch": 1682} {"train_loss": -6.092833042144775, "global_step": 70653, "epoch": 1682} {"train_loss": -6.032165050506592, "global_step": 70654, "epoch": 1682} {"train_loss": -6.033204078674316, "global_step": 70655, "epoch": 1682} {"train_loss": -6.0473127365112305, "global_step": 70656, "epoch": 1682} {"train_loss": -5.975492477416992, "global_step": 70657, "epoch": 1682} {"train_loss": -5.980921268463135, "global_step": 70658, "epoch": 1682} {"train_loss": -5.992053031921387, "global_step": 70659, "epoch": 1682} {"train_loss": -6.010055065155029, "global_step": 70660, "epoch": 1682} {"train_loss": -5.979339599609375, "global_step": 70661, "epoch": 1682} {"train_loss": -5.970623970031738, "global_step": 70662, "epoch": 1682} {"train_loss": -5.930852890014648, "global_step": 70663, "epoch": 1682} {"train_loss": -6.001981735229492, "global_step": 70664, "epoch": 1682} {"train_loss": -5.954282760620117, "global_step": 70665, "epoch": 1682} {"train_loss": -6.016539573669434, "global_step": 70666, "epoch": 1682} {"train_loss": -5.996276378631592, "global_step": 70667, "epoch": 1682} {"train_loss": -5.916558265686035, "global_step": 70668, "epoch": 1682} {"train_loss": -6.0500664710998535, "global_step": 70669, "epoch": 1682} {"train_loss": -5.918692588806152, "global_step": 70670, "epoch": 1682} {"train_loss": -5.959225654602051, "global_step": 70671, "epoch": 1682} {"train_loss": -5.915685653686523, "global_step": 70672, "epoch": 1682} {"train_loss": -5.9540510177612305, "global_step": 70673, "epoch": 1682} {"train_loss": -5.855375289916992, "global_step": 70674, "epoch": 1682} {"train_loss": -6.04503870010376, "global_step": 70675, "epoch": 1682} {"train_loss": -6.041752815246582, "global_step": 70676, "epoch": 1682} {"train_loss": -6.059892654418945, "global_step": 70677, "epoch": 1682} {"train_loss": -6.109288215637207, "global_step": 70678, "epoch": 1682} {"train_loss": -5.916416645050049, "global_step": 70679, "epoch": 1682} {"train_loss": -6.060108184814453, "global_step": 70680, "epoch": 1682} {"train_loss": -6.016687393188477, "global_step": 70681, "epoch": 1682} {"train_loss": -6.113719463348389, "global_step": 70682, "epoch": 1682} {"train_loss": -6.017724514007568, "global_step": 70683, "epoch": 1682} {"train_loss": -5.998142242431641, "global_step": 70684, "epoch": 1682} {"train_loss": -6.0033553668430875, "global_step": 70685, "epoch": 1682, "val_loss": 61668.19921875} {"train_loss": -6.1198577880859375, "global_step": 70686, "epoch": 1683} {"train_loss": -5.9635467529296875, "global_step": 70687, "epoch": 1683} {"train_loss": -5.990299224853516, "global_step": 70688, "epoch": 1683} {"train_loss": -6.093149662017822, "global_step": 70689, "epoch": 1683} {"train_loss": -6.017091751098633, "global_step": 70690, "epoch": 1683} {"train_loss": -5.953834056854248, "global_step": 70691, "epoch": 1683} {"train_loss": -5.902326583862305, "global_step": 70692, "epoch": 1683} {"train_loss": -6.086877346038818, "global_step": 70693, "epoch": 1683} {"train_loss": -6.0294084548950195, "global_step": 70694, "epoch": 1683} {"train_loss": -5.944953918457031, "global_step": 70695, "epoch": 1683} {"train_loss": -6.080364227294922, "global_step": 70696, "epoch": 1683} {"train_loss": -6.10103178024292, "global_step": 70697, "epoch": 1683} {"train_loss": -6.0197858810424805, "global_step": 70698, "epoch": 1683} {"train_loss": -5.9185943603515625, "global_step": 70699, "epoch": 1683} {"train_loss": -5.922730445861816, "global_step": 70700, "epoch": 1683} {"train_loss": -5.949086666107178, "global_step": 70701, "epoch": 1683} {"train_loss": -6.106931686401367, "global_step": 70702, "epoch": 1683} {"train_loss": -6.090883255004883, "global_step": 70703, "epoch": 1683} {"train_loss": -6.052986145019531, "global_step": 70704, "epoch": 1683} {"train_loss": -6.013449668884277, "global_step": 70705, "epoch": 1683} {"train_loss": -6.054738521575928, "global_step": 70706, "epoch": 1683} {"train_loss": -6.144783020019531, "global_step": 70707, "epoch": 1683} {"train_loss": -6.062627792358398, "global_step": 70708, "epoch": 1683} {"train_loss": -6.039216995239258, "global_step": 70709, "epoch": 1683} {"train_loss": -5.980708122253418, "global_step": 70710, "epoch": 1683} {"train_loss": -6.019438743591309, "global_step": 70711, "epoch": 1683} {"train_loss": -6.003562927246094, "global_step": 70712, "epoch": 1683} {"train_loss": -6.020754814147949, "global_step": 70713, "epoch": 1683} {"train_loss": -6.109688758850098, "global_step": 70714, "epoch": 1683} {"train_loss": -6.061806678771973, "global_step": 70715, "epoch": 1683} {"train_loss": -6.0985107421875, "global_step": 70716, "epoch": 1683} {"train_loss": -6.16219425201416, "global_step": 70717, "epoch": 1683} {"train_loss": -5.990090370178223, "global_step": 70718, "epoch": 1683} {"train_loss": -5.956007480621338, "global_step": 70719, "epoch": 1683} {"train_loss": -6.032041549682617, "global_step": 70720, "epoch": 1683} {"train_loss": -6.134970188140869, "global_step": 70721, "epoch": 1683} {"train_loss": -6.163209915161133, "global_step": 70722, "epoch": 1683} {"train_loss": -6.163425445556641, "global_step": 70723, "epoch": 1683} {"train_loss": -6.047049522399902, "global_step": 70724, "epoch": 1683} {"train_loss": -6.132211685180664, "global_step": 70725, "epoch": 1683} {"train_loss": -6.245237350463867, "global_step": 70726, "epoch": 1683} {"train_loss": -6.050407648086548, "global_step": 70727, "epoch": 1683, "val_loss": 61643.5625} {"train_loss": -6.152918815612793, "global_step": 70728, "epoch": 1684} {"train_loss": -6.059432506561279, "global_step": 70729, "epoch": 1684} {"train_loss": -6.095170021057129, "global_step": 70730, "epoch": 1684} {"train_loss": -6.193202972412109, "global_step": 70731, "epoch": 1684} {"train_loss": -6.034465789794922, "global_step": 70732, "epoch": 1684} {"train_loss": -6.09417200088501, "global_step": 70733, "epoch": 1684} {"train_loss": -6.058277130126953, "global_step": 70734, "epoch": 1684} {"train_loss": -6.0776848793029785, "global_step": 70735, "epoch": 1684} {"train_loss": -6.116975784301758, "global_step": 70736, "epoch": 1684} {"train_loss": -5.971225738525391, "global_step": 70737, "epoch": 1684} {"train_loss": -6.010903358459473, "global_step": 70738, "epoch": 1684} {"train_loss": -6.050167083740234, "global_step": 70739, "epoch": 1684} {"train_loss": -6.0141425132751465, "global_step": 70740, "epoch": 1684} {"train_loss": -5.971433162689209, "global_step": 70741, "epoch": 1684} {"train_loss": -6.142131328582764, "global_step": 70742, "epoch": 1684} {"train_loss": -6.125394821166992, "global_step": 70743, "epoch": 1684} {"train_loss": -6.073154449462891, "global_step": 70744, "epoch": 1684} {"train_loss": -5.914244651794434, "global_step": 70745, "epoch": 1684} {"train_loss": -6.072463035583496, "global_step": 70746, "epoch": 1684} {"train_loss": -6.180580139160156, "global_step": 70747, "epoch": 1684} {"train_loss": -6.012265682220459, "global_step": 70748, "epoch": 1684} {"train_loss": -5.9317474365234375, "global_step": 70749, "epoch": 1684} {"train_loss": -6.0161356925964355, "global_step": 70750, "epoch": 1684} {"train_loss": -5.977783203125, "global_step": 70751, "epoch": 1684} {"train_loss": -6.059048652648926, "global_step": 70752, "epoch": 1684} {"train_loss": -6.139752388000488, "global_step": 70753, "epoch": 1684} {"train_loss": -5.907504081726074, "global_step": 70754, "epoch": 1684} {"train_loss": -6.095208644866943, "global_step": 70755, "epoch": 1684} {"train_loss": -6.062849998474121, "global_step": 70756, "epoch": 1684} {"train_loss": -5.982224941253662, "global_step": 70757, "epoch": 1684} {"train_loss": -6.0301513671875, "global_step": 70758, "epoch": 1684} {"train_loss": -5.9510817527771, "global_step": 70759, "epoch": 1684} {"train_loss": -5.991358757019043, "global_step": 70760, "epoch": 1684} {"train_loss": -5.878681182861328, "global_step": 70761, "epoch": 1684} {"train_loss": -6.069764614105225, "global_step": 70762, "epoch": 1684} {"train_loss": -6.093392372131348, "global_step": 70763, "epoch": 1684} {"train_loss": -6.067737102508545, "global_step": 70764, "epoch": 1684} {"train_loss": -6.080466270446777, "global_step": 70765, "epoch": 1684} {"train_loss": -6.233956813812256, "global_step": 70766, "epoch": 1684} {"train_loss": -6.024105072021484, "global_step": 70767, "epoch": 1684} {"train_loss": -6.016937255859375, "global_step": 70768, "epoch": 1684} {"train_loss": -6.049567109062558, "global_step": 70769, "epoch": 1684, "val_loss": 61673.609375} {"train_loss": -6.034750938415527, "global_step": 70770, "epoch": 1685} {"train_loss": -6.039943218231201, "global_step": 70771, "epoch": 1685} {"train_loss": -6.117048263549805, "global_step": 70772, "epoch": 1685} {"train_loss": -6.159683704376221, "global_step": 70773, "epoch": 1685} {"train_loss": -6.078464508056641, "global_step": 70774, "epoch": 1685} {"train_loss": -6.1218390464782715, "global_step": 70775, "epoch": 1685} {"train_loss": -6.097002983093262, "global_step": 70776, "epoch": 1685} {"train_loss": -6.087251663208008, "global_step": 70777, "epoch": 1685} {"train_loss": -6.00596809387207, "global_step": 70778, "epoch": 1685} {"train_loss": -6.071268081665039, "global_step": 70779, "epoch": 1685} {"train_loss": -6.032833099365234, "global_step": 70780, "epoch": 1685} {"train_loss": -6.002378940582275, "global_step": 70781, "epoch": 1685} {"train_loss": -6.013294219970703, "global_step": 70782, "epoch": 1685} {"train_loss": -6.146195411682129, "global_step": 70783, "epoch": 1685} {"train_loss": -6.068532943725586, "global_step": 70784, "epoch": 1685} {"train_loss": -6.119205474853516, "global_step": 70785, "epoch": 1685} {"train_loss": -6.063887596130371, "global_step": 70786, "epoch": 1685} {"train_loss": -5.955654144287109, "global_step": 70787, "epoch": 1685} {"train_loss": -6.017420768737793, "global_step": 70788, "epoch": 1685} {"train_loss": -6.076681137084961, "global_step": 70789, "epoch": 1685} {"train_loss": -6.034838676452637, "global_step": 70790, "epoch": 1685} {"train_loss": -5.933082580566406, "global_step": 70791, "epoch": 1685} {"train_loss": -5.984941482543945, "global_step": 70792, "epoch": 1685} {"train_loss": -6.094676971435547, "global_step": 70793, "epoch": 1685} {"train_loss": -6.076145648956299, "global_step": 70794, "epoch": 1685} {"train_loss": -6.001971244812012, "global_step": 70795, "epoch": 1685} {"train_loss": -6.053503036499023, "global_step": 70796, "epoch": 1685} {"train_loss": -6.057602882385254, "global_step": 70797, "epoch": 1685} {"train_loss": -5.991240501403809, "global_step": 70798, "epoch": 1685} {"train_loss": -6.039828300476074, "global_step": 70799, "epoch": 1685} {"train_loss": -6.003230094909668, "global_step": 70800, "epoch": 1685} {"train_loss": -6.014810085296631, "global_step": 70801, "epoch": 1685} {"train_loss": -6.089807987213135, "global_step": 70802, "epoch": 1685} {"train_loss": -6.083984375, "global_step": 70803, "epoch": 1685} {"train_loss": -6.080654144287109, "global_step": 70804, "epoch": 1685} {"train_loss": -6.095822811126709, "global_step": 70805, "epoch": 1685} {"train_loss": -6.056591987609863, "global_step": 70806, "epoch": 1685} {"train_loss": -6.140522003173828, "global_step": 70807, "epoch": 1685} {"train_loss": -6.094729900360107, "global_step": 70808, "epoch": 1685} {"train_loss": -6.060528755187988, "global_step": 70809, "epoch": 1685} {"train_loss": -6.03007698059082, "global_step": 70810, "epoch": 1685} {"train_loss": -6.058663118453253, "global_step": 70811, "epoch": 1685, "val_loss": 62010.01953125} {"train_loss": -6.058786392211914, "global_step": 70812, "epoch": 1686} {"train_loss": -6.056936740875244, "global_step": 70813, "epoch": 1686} {"train_loss": -6.072999000549316, "global_step": 70814, "epoch": 1686} {"train_loss": -5.982892990112305, "global_step": 70815, "epoch": 1686} {"train_loss": -5.977825164794922, "global_step": 70816, "epoch": 1686} {"train_loss": -5.975470542907715, "global_step": 70817, "epoch": 1686} {"train_loss": -5.986739158630371, "global_step": 70818, "epoch": 1686} {"train_loss": -5.962874412536621, "global_step": 70819, "epoch": 1686} {"train_loss": -6.026722431182861, "global_step": 70820, "epoch": 1686} {"train_loss": -6.144040107727051, "global_step": 70821, "epoch": 1686} {"train_loss": -6.002470970153809, "global_step": 70822, "epoch": 1686} {"train_loss": -6.0434160232543945, "global_step": 70823, "epoch": 1686} {"train_loss": -5.978732109069824, "global_step": 70824, "epoch": 1686} {"train_loss": -5.961370468139648, "global_step": 70825, "epoch": 1686} {"train_loss": -6.070573806762695, "global_step": 70826, "epoch": 1686} {"train_loss": -6.067121505737305, "global_step": 70827, "epoch": 1686} {"train_loss": -6.028002738952637, "global_step": 70828, "epoch": 1686} {"train_loss": -6.046168327331543, "global_step": 70829, "epoch": 1686} {"train_loss": -5.987316131591797, "global_step": 70830, "epoch": 1686} {"train_loss": -6.082887649536133, "global_step": 70831, "epoch": 1686} {"train_loss": -6.175940036773682, "global_step": 70832, "epoch": 1686} {"train_loss": -6.021709442138672, "global_step": 70833, "epoch": 1686} {"train_loss": -6.093029975891113, "global_step": 70834, "epoch": 1686} {"train_loss": -6.117190361022949, "global_step": 70835, "epoch": 1686} {"train_loss": -6.054709434509277, "global_step": 70836, "epoch": 1686} {"train_loss": -6.055004119873047, "global_step": 70837, "epoch": 1686} {"train_loss": -6.026160717010498, "global_step": 70838, "epoch": 1686} {"train_loss": -6.046753406524658, "global_step": 70839, "epoch": 1686} {"train_loss": -5.965007781982422, "global_step": 70840, "epoch": 1686} {"train_loss": -6.137129783630371, "global_step": 70841, "epoch": 1686} {"train_loss": -6.040202617645264, "global_step": 70842, "epoch": 1686} {"train_loss": -5.9846038818359375, "global_step": 70843, "epoch": 1686} {"train_loss": -6.055332660675049, "global_step": 70844, "epoch": 1686} {"train_loss": -6.087925910949707, "global_step": 70845, "epoch": 1686} {"train_loss": -6.065263271331787, "global_step": 70846, "epoch": 1686} {"train_loss": -6.123194694519043, "global_step": 70847, "epoch": 1686} {"train_loss": -5.9143385887146, "global_step": 70848, "epoch": 1686} {"train_loss": -6.058932304382324, "global_step": 70849, "epoch": 1686} {"train_loss": -6.081948280334473, "global_step": 70850, "epoch": 1686} {"train_loss": -5.952655792236328, "global_step": 70851, "epoch": 1686} {"train_loss": -5.91494083404541, "global_step": 70852, "epoch": 1686} {"train_loss": -6.038033019928705, "global_step": 70853, "epoch": 1686, "val_loss": 61810.7265625} {"train_loss": -6.151751518249512, "global_step": 70854, "epoch": 1687} {"train_loss": -6.066877841949463, "global_step": 70855, "epoch": 1687} {"train_loss": -6.034372329711914, "global_step": 70856, "epoch": 1687} {"train_loss": -6.031671524047852, "global_step": 70857, "epoch": 1687} {"train_loss": -5.885124206542969, "global_step": 70858, "epoch": 1687} {"train_loss": -6.151176452636719, "global_step": 70859, "epoch": 1687} {"train_loss": -5.949855804443359, "global_step": 70860, "epoch": 1687} {"train_loss": -6.051427841186523, "global_step": 70861, "epoch": 1687} {"train_loss": -6.040589809417725, "global_step": 70862, "epoch": 1687} {"train_loss": -6.120453834533691, "global_step": 70863, "epoch": 1687} {"train_loss": -5.972561836242676, "global_step": 70864, "epoch": 1687} {"train_loss": -6.1455535888671875, "global_step": 70865, "epoch": 1687} {"train_loss": -6.086672782897949, "global_step": 70866, "epoch": 1687} {"train_loss": -5.998444557189941, "global_step": 70867, "epoch": 1687} {"train_loss": -5.882407188415527, "global_step": 70868, "epoch": 1687} {"train_loss": -5.994186878204346, "global_step": 70869, "epoch": 1687} {"train_loss": -6.046371936798096, "global_step": 70870, "epoch": 1687} {"train_loss": -6.007070541381836, "global_step": 70871, "epoch": 1687} {"train_loss": -6.030817031860352, "global_step": 70872, "epoch": 1687} {"train_loss": -5.952367782592773, "global_step": 70873, "epoch": 1687} {"train_loss": -6.057036399841309, "global_step": 70874, "epoch": 1687} {"train_loss": -5.9130401611328125, "global_step": 70875, "epoch": 1687} {"train_loss": -5.977187156677246, "global_step": 70876, "epoch": 1687} {"train_loss": -5.97230339050293, "global_step": 70877, "epoch": 1687} {"train_loss": -5.906074523925781, "global_step": 70878, "epoch": 1687} {"train_loss": -6.024892807006836, "global_step": 70879, "epoch": 1687} {"train_loss": -5.9046630859375, "global_step": 70880, "epoch": 1687} {"train_loss": -6.083410739898682, "global_step": 70881, "epoch": 1687} {"train_loss": -5.919926643371582, "global_step": 70882, "epoch": 1687} {"train_loss": -5.982816696166992, "global_step": 70883, "epoch": 1687} {"train_loss": -6.021081924438477, "global_step": 70884, "epoch": 1687} {"train_loss": -5.903953552246094, "global_step": 70885, "epoch": 1687} {"train_loss": -5.936726093292236, "global_step": 70886, "epoch": 1687} {"train_loss": -5.969476222991943, "global_step": 70887, "epoch": 1687} {"train_loss": -6.0669050216674805, "global_step": 70888, "epoch": 1687} {"train_loss": -6.074504852294922, "global_step": 70889, "epoch": 1687} {"train_loss": -5.891975402832031, "global_step": 70890, "epoch": 1687} {"train_loss": -5.979184627532959, "global_step": 70891, "epoch": 1687} {"train_loss": -6.024079322814941, "global_step": 70892, "epoch": 1687} {"train_loss": -6.00782585144043, "global_step": 70893, "epoch": 1687} {"train_loss": -5.96965217590332, "global_step": 70894, "epoch": 1687} {"train_loss": -6.0063328970046275, "global_step": 70895, "epoch": 1687, "val_loss": 62026.5} {"train_loss": -5.997188091278076, "global_step": 70896, "epoch": 1688} {"train_loss": -6.070601940155029, "global_step": 70897, "epoch": 1688} {"train_loss": -5.969779968261719, "global_step": 70898, "epoch": 1688} {"train_loss": -5.9188761711120605, "global_step": 70899, "epoch": 1688} {"train_loss": -6.059793472290039, "global_step": 70900, "epoch": 1688} {"train_loss": -6.056643486022949, "global_step": 70901, "epoch": 1688} {"train_loss": -5.996762275695801, "global_step": 70902, "epoch": 1688} {"train_loss": -6.01751708984375, "global_step": 70903, "epoch": 1688} {"train_loss": -5.995392799377441, "global_step": 70904, "epoch": 1688} {"train_loss": -5.91822624206543, "global_step": 70905, "epoch": 1688} {"train_loss": -6.016956806182861, "global_step": 70906, "epoch": 1688} {"train_loss": -5.9424028396606445, "global_step": 70907, "epoch": 1688} {"train_loss": -5.94354248046875, "global_step": 70908, "epoch": 1688} {"train_loss": -5.987573623657227, "global_step": 70909, "epoch": 1688} {"train_loss": -6.106031894683838, "global_step": 70910, "epoch": 1688} {"train_loss": -6.075593948364258, "global_step": 70911, "epoch": 1688} {"train_loss": -6.087518692016602, "global_step": 70912, "epoch": 1688} {"train_loss": -6.074345588684082, "global_step": 70913, "epoch": 1688} {"train_loss": -6.0818071365356445, "global_step": 70914, "epoch": 1688} {"train_loss": -6.081023693084717, "global_step": 70915, "epoch": 1688} {"train_loss": -6.144094467163086, "global_step": 70916, "epoch": 1688} {"train_loss": -5.985550880432129, "global_step": 70917, "epoch": 1688} {"train_loss": -6.110541343688965, "global_step": 70918, "epoch": 1688} {"train_loss": -6.036534309387207, "global_step": 70919, "epoch": 1688} {"train_loss": -6.115636348724365, "global_step": 70920, "epoch": 1688} {"train_loss": -5.930332183837891, "global_step": 70921, "epoch": 1688} {"train_loss": -6.0552544593811035, "global_step": 70922, "epoch": 1688} {"train_loss": -6.006114959716797, "global_step": 70923, "epoch": 1688} {"train_loss": -6.074470520019531, "global_step": 70924, "epoch": 1688} {"train_loss": -5.968443870544434, "global_step": 70925, "epoch": 1688} {"train_loss": -6.061917304992676, "global_step": 70926, "epoch": 1688} {"train_loss": -6.013385772705078, "global_step": 70927, "epoch": 1688} {"train_loss": -5.998711585998535, "global_step": 70928, "epoch": 1688} {"train_loss": -6.037642955780029, "global_step": 70929, "epoch": 1688} {"train_loss": -6.156676292419434, "global_step": 70930, "epoch": 1688} {"train_loss": -5.870345115661621, "global_step": 70931, "epoch": 1688} {"train_loss": -5.980368614196777, "global_step": 70932, "epoch": 1688} {"train_loss": -6.046430587768555, "global_step": 70933, "epoch": 1688} {"train_loss": -5.994443893432617, "global_step": 70934, "epoch": 1688} {"train_loss": -6.10141658782959, "global_step": 70935, "epoch": 1688} {"train_loss": -6.029016494750977, "global_step": 70936, "epoch": 1688} {"train_loss": -6.026469628016154, "global_step": 70937, "epoch": 1688, "val_loss": 61643.3125} {"train_loss": -5.916723728179932, "global_step": 70938, "epoch": 1689} {"train_loss": -6.089843273162842, "global_step": 70939, "epoch": 1689} {"train_loss": -5.9214043617248535, "global_step": 70940, "epoch": 1689} {"train_loss": -6.059000015258789, "global_step": 70941, "epoch": 1689} {"train_loss": -6.073281288146973, "global_step": 70942, "epoch": 1689} {"train_loss": -6.007608413696289, "global_step": 70943, "epoch": 1689} {"train_loss": -6.077716827392578, "global_step": 70944, "epoch": 1689} {"train_loss": -6.139249801635742, "global_step": 70945, "epoch": 1689} {"train_loss": -6.000162601470947, "global_step": 70946, "epoch": 1689} {"train_loss": -6.019657135009766, "global_step": 70947, "epoch": 1689} {"train_loss": -6.108859539031982, "global_step": 70948, "epoch": 1689} {"train_loss": -6.051111221313477, "global_step": 70949, "epoch": 1689} {"train_loss": -6.017685890197754, "global_step": 70950, "epoch": 1689} {"train_loss": -5.986546516418457, "global_step": 70951, "epoch": 1689} {"train_loss": -6.0421295166015625, "global_step": 70952, "epoch": 1689} {"train_loss": -5.926262378692627, "global_step": 70953, "epoch": 1689} {"train_loss": -5.943748474121094, "global_step": 70954, "epoch": 1689} {"train_loss": -6.027414321899414, "global_step": 70955, "epoch": 1689} {"train_loss": -6.003693580627441, "global_step": 70956, "epoch": 1689} {"train_loss": -5.983557224273682, "global_step": 70957, "epoch": 1689} {"train_loss": -5.974673271179199, "global_step": 70958, "epoch": 1689} {"train_loss": -5.894010543823242, "global_step": 70959, "epoch": 1689} {"train_loss": -5.9467997550964355, "global_step": 70960, "epoch": 1689} {"train_loss": -5.802533149719238, "global_step": 70961, "epoch": 1689} {"train_loss": -5.97161865234375, "global_step": 70962, "epoch": 1689} {"train_loss": -5.955090045928955, "global_step": 70963, "epoch": 1689} {"train_loss": -5.953070640563965, "global_step": 70964, "epoch": 1689} {"train_loss": -5.981870651245117, "global_step": 70965, "epoch": 1689} {"train_loss": -5.957088470458984, "global_step": 70966, "epoch": 1689} {"train_loss": -5.985883712768555, "global_step": 70967, "epoch": 1689} {"train_loss": -6.001070499420166, "global_step": 70968, "epoch": 1689} {"train_loss": -6.064574241638184, "global_step": 70969, "epoch": 1689} {"train_loss": -6.015422821044922, "global_step": 70970, "epoch": 1689} {"train_loss": -6.079061031341553, "global_step": 70971, "epoch": 1689} {"train_loss": -5.917757034301758, "global_step": 70972, "epoch": 1689} {"train_loss": -6.139247894287109, "global_step": 70973, "epoch": 1689} {"train_loss": -5.9743852615356445, "global_step": 70974, "epoch": 1689} {"train_loss": -5.959683418273926, "global_step": 70975, "epoch": 1689} {"train_loss": -5.903875827789307, "global_step": 70976, "epoch": 1689} {"train_loss": -6.061985015869141, "global_step": 70977, "epoch": 1689} {"train_loss": -5.796271324157715, "global_step": 70978, "epoch": 1689} {"train_loss": -5.994478452773321, "global_step": 70979, "epoch": 1689, "val_loss": 62124.8125} {"train_loss": -5.959125518798828, "global_step": 70980, "epoch": 1690} {"train_loss": -5.936978340148926, "global_step": 70981, "epoch": 1690} {"train_loss": -5.903590202331543, "global_step": 70982, "epoch": 1690} {"train_loss": -6.008188247680664, "global_step": 70983, "epoch": 1690} {"train_loss": -5.958662986755371, "global_step": 70984, "epoch": 1690} {"train_loss": -5.947386264801025, "global_step": 70985, "epoch": 1690} {"train_loss": -5.977413654327393, "global_step": 70986, "epoch": 1690} {"train_loss": -6.067821979522705, "global_step": 70987, "epoch": 1690} {"train_loss": -5.980141639709473, "global_step": 70988, "epoch": 1690} {"train_loss": -5.978060245513916, "global_step": 70989, "epoch": 1690} {"train_loss": -5.955368995666504, "global_step": 70990, "epoch": 1690} {"train_loss": -6.060070037841797, "global_step": 70991, "epoch": 1690} {"train_loss": -5.96129035949707, "global_step": 70992, "epoch": 1690} {"train_loss": -6.0500359535217285, "global_step": 70993, "epoch": 1690} {"train_loss": -5.925637245178223, "global_step": 70994, "epoch": 1690} {"train_loss": -6.1116108894348145, "global_step": 70995, "epoch": 1690} {"train_loss": -5.984688758850098, "global_step": 70996, "epoch": 1690} {"train_loss": -6.034940719604492, "global_step": 70997, "epoch": 1690} {"train_loss": -6.043554306030273, "global_step": 70998, "epoch": 1690} {"train_loss": -5.944042682647705, "global_step": 70999, "epoch": 1690} {"train_loss": -6.156493186950684, "global_step": 71000, "epoch": 1690} {"train_loss": -6.142759323120117, "global_step": 71001, "epoch": 1690} {"train_loss": -6.061284065246582, "global_step": 71002, "epoch": 1690} {"train_loss": -6.0111799240112305, "global_step": 71003, "epoch": 1690} {"train_loss": -5.911777496337891, "global_step": 71004, "epoch": 1690} {"train_loss": -6.0003767013549805, "global_step": 71005, "epoch": 1690} {"train_loss": -6.035859107971191, "global_step": 71006, "epoch": 1690} {"train_loss": -6.115570068359375, "global_step": 71007, "epoch": 1690} {"train_loss": -6.093527793884277, "global_step": 71008, "epoch": 1690} {"train_loss": -6.114402770996094, "global_step": 71009, "epoch": 1690} {"train_loss": -5.956567287445068, "global_step": 71010, "epoch": 1690} {"train_loss": -6.0430908203125, "global_step": 71011, "epoch": 1690} {"train_loss": -6.042316436767578, "global_step": 71012, "epoch": 1690} {"train_loss": -6.085953712463379, "global_step": 71013, "epoch": 1690} {"train_loss": -6.159297943115234, "global_step": 71014, "epoch": 1690} {"train_loss": -6.1766767501831055, "global_step": 71015, "epoch": 1690} {"train_loss": -6.187079429626465, "global_step": 71016, "epoch": 1690} {"train_loss": -6.1037139892578125, "global_step": 71017, "epoch": 1690} {"train_loss": -6.133918285369873, "global_step": 71018, "epoch": 1690} {"train_loss": -6.137962341308594, "global_step": 71019, "epoch": 1690} {"train_loss": -6.087174415588379, "global_step": 71020, "epoch": 1690} {"train_loss": -6.039352246693203, "global_step": 71021, "epoch": 1690, "val_loss": 61686.41796875} {"train_loss": -6.047970294952393, "global_step": 71022, "epoch": 1691} {"train_loss": -6.083390235900879, "global_step": 71023, "epoch": 1691} {"train_loss": -6.104152679443359, "global_step": 71024, "epoch": 1691} {"train_loss": -6.047896385192871, "global_step": 71025, "epoch": 1691} {"train_loss": -6.012813568115234, "global_step": 71026, "epoch": 1691} {"train_loss": -6.119634628295898, "global_step": 71027, "epoch": 1691} {"train_loss": -6.134141445159912, "global_step": 71028, "epoch": 1691} {"train_loss": -6.190115928649902, "global_step": 71029, "epoch": 1691} {"train_loss": -6.144890785217285, "global_step": 71030, "epoch": 1691} {"train_loss": -6.117957592010498, "global_step": 71031, "epoch": 1691} {"train_loss": -6.0673112869262695, "global_step": 71032, "epoch": 1691} {"train_loss": -6.043171405792236, "global_step": 71033, "epoch": 1691} {"train_loss": -6.124289035797119, "global_step": 71034, "epoch": 1691} {"train_loss": -6.086862087249756, "global_step": 71035, "epoch": 1691} {"train_loss": -6.0534796714782715, "global_step": 71036, "epoch": 1691} {"train_loss": -6.008148193359375, "global_step": 71037, "epoch": 1691} {"train_loss": -6.027995586395264, "global_step": 71038, "epoch": 1691} {"train_loss": -6.049745559692383, "global_step": 71039, "epoch": 1691} {"train_loss": -5.950655460357666, "global_step": 71040, "epoch": 1691} {"train_loss": -6.137234687805176, "global_step": 71041, "epoch": 1691} {"train_loss": -6.135974407196045, "global_step": 71042, "epoch": 1691} {"train_loss": -6.135630130767822, "global_step": 71043, "epoch": 1691} {"train_loss": -6.016523361206055, "global_step": 71044, "epoch": 1691} {"train_loss": -6.041201591491699, "global_step": 71045, "epoch": 1691} {"train_loss": -6.058910846710205, "global_step": 71046, "epoch": 1691} {"train_loss": -6.0886616706848145, "global_step": 71047, "epoch": 1691} {"train_loss": -6.076536655426025, "global_step": 71048, "epoch": 1691} {"train_loss": -6.047816276550293, "global_step": 71049, "epoch": 1691} {"train_loss": -6.105576992034912, "global_step": 71050, "epoch": 1691} {"train_loss": -6.005955219268799, "global_step": 71051, "epoch": 1691} {"train_loss": -5.835122108459473, "global_step": 71052, "epoch": 1691} {"train_loss": -6.068463325500488, "global_step": 71053, "epoch": 1691} {"train_loss": -6.0454792976379395, "global_step": 71054, "epoch": 1691} {"train_loss": -5.9350690841674805, "global_step": 71055, "epoch": 1691} {"train_loss": -6.053528308868408, "global_step": 71056, "epoch": 1691} {"train_loss": -5.932689189910889, "global_step": 71057, "epoch": 1691} {"train_loss": -5.932553768157959, "global_step": 71058, "epoch": 1691} {"train_loss": -6.040600776672363, "global_step": 71059, "epoch": 1691} {"train_loss": -5.860647201538086, "global_step": 71060, "epoch": 1691} {"train_loss": -6.0432515144348145, "global_step": 71061, "epoch": 1691} {"train_loss": -5.99333381652832, "global_step": 71062, "epoch": 1691} {"train_loss": -6.04785402615865, "global_step": 71063, "epoch": 1691, "val_loss": 61833.86328125} {"train_loss": -5.962213516235352, "global_step": 71064, "epoch": 1692} {"train_loss": -6.118603706359863, "global_step": 71065, "epoch": 1692} {"train_loss": -6.083017349243164, "global_step": 71066, "epoch": 1692} {"train_loss": -6.011755466461182, "global_step": 71067, "epoch": 1692} {"train_loss": -6.106078147888184, "global_step": 71068, "epoch": 1692} {"train_loss": -6.0676398277282715, "global_step": 71069, "epoch": 1692} {"train_loss": -6.040393829345703, "global_step": 71070, "epoch": 1692} {"train_loss": -6.0143585205078125, "global_step": 71071, "epoch": 1692} {"train_loss": -5.895144462585449, "global_step": 71072, "epoch": 1692} {"train_loss": -6.092519760131836, "global_step": 71073, "epoch": 1692} {"train_loss": -6.1020827293396, "global_step": 71074, "epoch": 1692} {"train_loss": -5.976749420166016, "global_step": 71075, "epoch": 1692} {"train_loss": -6.099846839904785, "global_step": 71076, "epoch": 1692} {"train_loss": -6.052156925201416, "global_step": 71077, "epoch": 1692} {"train_loss": -6.089427471160889, "global_step": 71078, "epoch": 1692} {"train_loss": -6.053518295288086, "global_step": 71079, "epoch": 1692} {"train_loss": -6.008597373962402, "global_step": 71080, "epoch": 1692} {"train_loss": -5.9886016845703125, "global_step": 71081, "epoch": 1692} {"train_loss": -6.045200824737549, "global_step": 71082, "epoch": 1692} {"train_loss": -6.049853324890137, "global_step": 71083, "epoch": 1692} {"train_loss": -6.096388816833496, "global_step": 71084, "epoch": 1692} {"train_loss": -5.9670023918151855, "global_step": 71085, "epoch": 1692} {"train_loss": -5.913479804992676, "global_step": 71086, "epoch": 1692} {"train_loss": -6.029973030090332, "global_step": 71087, "epoch": 1692} {"train_loss": -6.068653106689453, "global_step": 71088, "epoch": 1692} {"train_loss": -6.064518928527832, "global_step": 71089, "epoch": 1692} {"train_loss": -6.115386962890625, "global_step": 71090, "epoch": 1692} {"train_loss": -5.884173393249512, "global_step": 71091, "epoch": 1692} {"train_loss": -5.911565780639648, "global_step": 71092, "epoch": 1692} {"train_loss": -6.007599830627441, "global_step": 71093, "epoch": 1692} {"train_loss": -6.0390424728393555, "global_step": 71094, "epoch": 1692} {"train_loss": -6.1331987380981445, "global_step": 71095, "epoch": 1692} {"train_loss": -6.030479907989502, "global_step": 71096, "epoch": 1692} {"train_loss": -6.076028823852539, "global_step": 71097, "epoch": 1692} {"train_loss": -6.026118278503418, "global_step": 71098, "epoch": 1692} {"train_loss": -6.070368766784668, "global_step": 71099, "epoch": 1692} {"train_loss": -6.021457672119141, "global_step": 71100, "epoch": 1692} {"train_loss": -5.982601165771484, "global_step": 71101, "epoch": 1692} {"train_loss": -6.079115867614746, "global_step": 71102, "epoch": 1692} {"train_loss": -6.039264678955078, "global_step": 71103, "epoch": 1692} {"train_loss": -5.841826438903809, "global_step": 71104, "epoch": 1692} {"train_loss": -6.033085448401315, "global_step": 71105, "epoch": 1692, "val_loss": 61607.453125} {"train_loss": -6.037900924682617, "global_step": 71106, "epoch": 1693} {"train_loss": -6.039003372192383, "global_step": 71107, "epoch": 1693} {"train_loss": -6.06321907043457, "global_step": 71108, "epoch": 1693} {"train_loss": -5.959536552429199, "global_step": 71109, "epoch": 1693} {"train_loss": -6.041193962097168, "global_step": 71110, "epoch": 1693} {"train_loss": -6.084038734436035, "global_step": 71111, "epoch": 1693} {"train_loss": -5.994968414306641, "global_step": 71112, "epoch": 1693} {"train_loss": -6.079206466674805, "global_step": 71113, "epoch": 1693} {"train_loss": -5.903876304626465, "global_step": 71114, "epoch": 1693} {"train_loss": -5.965664386749268, "global_step": 71115, "epoch": 1693} {"train_loss": -6.052228927612305, "global_step": 71116, "epoch": 1693} {"train_loss": -5.858692169189453, "global_step": 71117, "epoch": 1693} {"train_loss": -5.932275772094727, "global_step": 71118, "epoch": 1693} {"train_loss": -5.8040666580200195, "global_step": 71119, "epoch": 1693} {"train_loss": -6.01291561126709, "global_step": 71120, "epoch": 1693} {"train_loss": -6.090663909912109, "global_step": 71121, "epoch": 1693} {"train_loss": -5.883342742919922, "global_step": 71122, "epoch": 1693} {"train_loss": -5.986542224884033, "global_step": 71123, "epoch": 1693} {"train_loss": -5.9466142654418945, "global_step": 71124, "epoch": 1693} {"train_loss": -6.024844169616699, "global_step": 71125, "epoch": 1693} {"train_loss": -5.961324214935303, "global_step": 71126, "epoch": 1693} {"train_loss": -5.972923755645752, "global_step": 71127, "epoch": 1693} {"train_loss": -6.1019792556762695, "global_step": 71128, "epoch": 1693} {"train_loss": -5.98321533203125, "global_step": 71129, "epoch": 1693} {"train_loss": -5.991655349731445, "global_step": 71130, "epoch": 1693} {"train_loss": -6.045248985290527, "global_step": 71131, "epoch": 1693} {"train_loss": -6.07001256942749, "global_step": 71132, "epoch": 1693} {"train_loss": -6.005794525146484, "global_step": 71133, "epoch": 1693} {"train_loss": -6.009726524353027, "global_step": 71134, "epoch": 1693} {"train_loss": -5.97752571105957, "global_step": 71135, "epoch": 1693} {"train_loss": -5.970493316650391, "global_step": 71136, "epoch": 1693} {"train_loss": -6.072524547576904, "global_step": 71137, "epoch": 1693} {"train_loss": -6.033175468444824, "global_step": 71138, "epoch": 1693} {"train_loss": -6.081072807312012, "global_step": 71139, "epoch": 1693} {"train_loss": -6.037327766418457, "global_step": 71140, "epoch": 1693} {"train_loss": -6.018158435821533, "global_step": 71141, "epoch": 1693} {"train_loss": -6.06689453125, "global_step": 71142, "epoch": 1693} {"train_loss": -6.073894500732422, "global_step": 71143, "epoch": 1693} {"train_loss": -6.114579200744629, "global_step": 71144, "epoch": 1693} {"train_loss": -6.175442695617676, "global_step": 71145, "epoch": 1693} {"train_loss": -6.009337425231934, "global_step": 71146, "epoch": 1693} {"train_loss": -6.013127088546753, "global_step": 71147, "epoch": 1693, "val_loss": 61562.140625} {"train_loss": -6.038818359375, "global_step": 71148, "epoch": 1694} {"train_loss": -5.966773509979248, "global_step": 71149, "epoch": 1694} {"train_loss": -6.187221050262451, "global_step": 71150, "epoch": 1694} {"train_loss": -5.988145351409912, "global_step": 71151, "epoch": 1694} {"train_loss": -5.933218002319336, "global_step": 71152, "epoch": 1694} {"train_loss": -6.1023101806640625, "global_step": 71153, "epoch": 1694} {"train_loss": -5.928040504455566, "global_step": 71154, "epoch": 1694} {"train_loss": -5.974632263183594, "global_step": 71155, "epoch": 1694} {"train_loss": -6.067406177520752, "global_step": 71156, "epoch": 1694} {"train_loss": -5.868863105773926, "global_step": 71157, "epoch": 1694} {"train_loss": -6.066566467285156, "global_step": 71158, "epoch": 1694} {"train_loss": -6.010178565979004, "global_step": 71159, "epoch": 1694} {"train_loss": -5.965266227722168, "global_step": 71160, "epoch": 1694} {"train_loss": -5.997058868408203, "global_step": 71161, "epoch": 1694} {"train_loss": -6.104890823364258, "global_step": 71162, "epoch": 1694} {"train_loss": -6.097379684448242, "global_step": 71163, "epoch": 1694} {"train_loss": -6.005405426025391, "global_step": 71164, "epoch": 1694} {"train_loss": -6.031220436096191, "global_step": 71165, "epoch": 1694} {"train_loss": -6.152912139892578, "global_step": 71166, "epoch": 1694} {"train_loss": -6.023266315460205, "global_step": 71167, "epoch": 1694} {"train_loss": -5.8343658447265625, "global_step": 71168, "epoch": 1694} {"train_loss": -5.983119487762451, "global_step": 71169, "epoch": 1694} {"train_loss": -5.968051910400391, "global_step": 71170, "epoch": 1694} {"train_loss": -6.090216636657715, "global_step": 71171, "epoch": 1694} {"train_loss": -6.065580368041992, "global_step": 71172, "epoch": 1694} {"train_loss": -6.050442695617676, "global_step": 71173, "epoch": 1694} {"train_loss": -6.147744178771973, "global_step": 71174, "epoch": 1694} {"train_loss": -5.933071136474609, "global_step": 71175, "epoch": 1694} {"train_loss": -6.1235151290893555, "global_step": 71176, "epoch": 1694} {"train_loss": -6.015039443969727, "global_step": 71177, "epoch": 1694} {"train_loss": -5.998684883117676, "global_step": 71178, "epoch": 1694} {"train_loss": -6.1025776863098145, "global_step": 71179, "epoch": 1694} {"train_loss": -6.1124773025512695, "global_step": 71180, "epoch": 1694} {"train_loss": -6.006374359130859, "global_step": 71181, "epoch": 1694} {"train_loss": -6.027316570281982, "global_step": 71182, "epoch": 1694} {"train_loss": -6.125978469848633, "global_step": 71183, "epoch": 1694} {"train_loss": -6.072590351104736, "global_step": 71184, "epoch": 1694} {"train_loss": -5.952472686767578, "global_step": 71185, "epoch": 1694} {"train_loss": -6.041270732879639, "global_step": 71186, "epoch": 1694} {"train_loss": -6.04832649230957, "global_step": 71187, "epoch": 1694} {"train_loss": -5.995675563812256, "global_step": 71188, "epoch": 1694} {"train_loss": -6.0316235565003895, "global_step": 71189, "epoch": 1694, "val_loss": 61928.87109375} {"train_loss": -6.186910152435303, "global_step": 71190, "epoch": 1695} {"train_loss": -6.0125813484191895, "global_step": 71191, "epoch": 1695} {"train_loss": -6.09661340713501, "global_step": 71192, "epoch": 1695} {"train_loss": -6.101551532745361, "global_step": 71193, "epoch": 1695} {"train_loss": -5.977274417877197, "global_step": 71194, "epoch": 1695} {"train_loss": -6.001858711242676, "global_step": 71195, "epoch": 1695} {"train_loss": -6.105912208557129, "global_step": 71196, "epoch": 1695} {"train_loss": -5.941605091094971, "global_step": 71197, "epoch": 1695} {"train_loss": -6.210454940795898, "global_step": 71198, "epoch": 1695} {"train_loss": -6.108983993530273, "global_step": 71199, "epoch": 1695} {"train_loss": -6.103035926818848, "global_step": 71200, "epoch": 1695} {"train_loss": -6.071539878845215, "global_step": 71201, "epoch": 1695} {"train_loss": -5.927576065063477, "global_step": 71202, "epoch": 1695} {"train_loss": -6.066658973693848, "global_step": 71203, "epoch": 1695} {"train_loss": -6.080072402954102, "global_step": 71204, "epoch": 1695} {"train_loss": -6.073987007141113, "global_step": 71205, "epoch": 1695} {"train_loss": -6.019092559814453, "global_step": 71206, "epoch": 1695} {"train_loss": -6.057096004486084, "global_step": 71207, "epoch": 1695} {"train_loss": -6.030343055725098, "global_step": 71208, "epoch": 1695} {"train_loss": -6.116628170013428, "global_step": 71209, "epoch": 1695} {"train_loss": -6.062034606933594, "global_step": 71210, "epoch": 1695} {"train_loss": -6.0991716384887695, "global_step": 71211, "epoch": 1695} {"train_loss": -5.977621078491211, "global_step": 71212, "epoch": 1695} {"train_loss": -6.020284652709961, "global_step": 71213, "epoch": 1695} {"train_loss": -6.108278274536133, "global_step": 71214, "epoch": 1695} {"train_loss": -6.049914360046387, "global_step": 71215, "epoch": 1695} {"train_loss": -5.991527557373047, "global_step": 71216, "epoch": 1695} {"train_loss": -6.1313347816467285, "global_step": 71217, "epoch": 1695} {"train_loss": -6.078879356384277, "global_step": 71218, "epoch": 1695} {"train_loss": -6.202791213989258, "global_step": 71219, "epoch": 1695} {"train_loss": -6.129724025726318, "global_step": 71220, "epoch": 1695} {"train_loss": -6.131914138793945, "global_step": 71221, "epoch": 1695} {"train_loss": -6.1146368980407715, "global_step": 71222, "epoch": 1695} {"train_loss": -5.869349002838135, "global_step": 71223, "epoch": 1695} {"train_loss": -5.978643417358398, "global_step": 71224, "epoch": 1695} {"train_loss": -5.985507011413574, "global_step": 71225, "epoch": 1695} {"train_loss": -5.95194673538208, "global_step": 71226, "epoch": 1695} {"train_loss": -6.083649635314941, "global_step": 71227, "epoch": 1695} {"train_loss": -6.018889427185059, "global_step": 71228, "epoch": 1695} {"train_loss": -6.026871681213379, "global_step": 71229, "epoch": 1695} {"train_loss": -6.082700729370117, "global_step": 71230, "epoch": 1695} {"train_loss": -6.055575438908169, "global_step": 71231, "epoch": 1695, "val_loss": 61821.53125} {"train_loss": -6.096902847290039, "global_step": 71232, "epoch": 1696} {"train_loss": -6.081865310668945, "global_step": 71233, "epoch": 1696} {"train_loss": -5.989333152770996, "global_step": 71234, "epoch": 1696} {"train_loss": -6.0400590896606445, "global_step": 71235, "epoch": 1696} {"train_loss": -5.839926719665527, "global_step": 71236, "epoch": 1696} {"train_loss": -5.916290760040283, "global_step": 71237, "epoch": 1696} {"train_loss": -6.070047378540039, "global_step": 71238, "epoch": 1696} {"train_loss": -5.937717437744141, "global_step": 71239, "epoch": 1696} {"train_loss": -6.052474498748779, "global_step": 71240, "epoch": 1696} {"train_loss": -6.082067489624023, "global_step": 71241, "epoch": 1696} {"train_loss": -6.088951110839844, "global_step": 71242, "epoch": 1696} {"train_loss": -6.188786506652832, "global_step": 71243, "epoch": 1696} {"train_loss": -6.081384658813477, "global_step": 71244, "epoch": 1696} {"train_loss": -6.048634052276611, "global_step": 71245, "epoch": 1696} {"train_loss": -6.049098968505859, "global_step": 71246, "epoch": 1696} {"train_loss": -6.166399002075195, "global_step": 71247, "epoch": 1696} {"train_loss": -6.128361701965332, "global_step": 71248, "epoch": 1696} {"train_loss": -6.02389669418335, "global_step": 71249, "epoch": 1696} {"train_loss": -5.975503921508789, "global_step": 71250, "epoch": 1696} {"train_loss": -6.0056962966918945, "global_step": 71251, "epoch": 1696} {"train_loss": -6.105397701263428, "global_step": 71252, "epoch": 1696} {"train_loss": -5.9181718826293945, "global_step": 71253, "epoch": 1696} {"train_loss": -5.9594621658325195, "global_step": 71254, "epoch": 1696} {"train_loss": -6.051592826843262, "global_step": 71255, "epoch": 1696} {"train_loss": -6.0818562507629395, "global_step": 71256, "epoch": 1696} {"train_loss": -5.966386795043945, "global_step": 71257, "epoch": 1696} {"train_loss": -5.987677574157715, "global_step": 71258, "epoch": 1696} {"train_loss": -6.005205154418945, "global_step": 71259, "epoch": 1696} {"train_loss": -6.155786514282227, "global_step": 71260, "epoch": 1696} {"train_loss": -6.037703514099121, "global_step": 71261, "epoch": 1696} {"train_loss": -6.052882671356201, "global_step": 71262, "epoch": 1696} {"train_loss": -6.052297115325928, "global_step": 71263, "epoch": 1696} {"train_loss": -5.932511329650879, "global_step": 71264, "epoch": 1696} {"train_loss": -5.9614691734313965, "global_step": 71265, "epoch": 1696} {"train_loss": -6.126666069030762, "global_step": 71266, "epoch": 1696} {"train_loss": -6.089652061462402, "global_step": 71267, "epoch": 1696} {"train_loss": -6.010729789733887, "global_step": 71268, "epoch": 1696} {"train_loss": -6.15760612487793, "global_step": 71269, "epoch": 1696} {"train_loss": -6.18706750869751, "global_step": 71270, "epoch": 1696} {"train_loss": -6.040923118591309, "global_step": 71271, "epoch": 1696} {"train_loss": -6.016891002655029, "global_step": 71272, "epoch": 1696} {"train_loss": -6.046418723605928, "global_step": 71273, "epoch": 1696, "val_loss": 61559.26953125} {"train_loss": -6.125344276428223, "global_step": 71274, "epoch": 1697} {"train_loss": -6.10683536529541, "global_step": 71275, "epoch": 1697} {"train_loss": -6.105564117431641, "global_step": 71276, "epoch": 1697} {"train_loss": -6.091400623321533, "global_step": 71277, "epoch": 1697} {"train_loss": -6.064787864685059, "global_step": 71278, "epoch": 1697} {"train_loss": -5.966811180114746, "global_step": 71279, "epoch": 1697} {"train_loss": -6.198167324066162, "global_step": 71280, "epoch": 1697} {"train_loss": -5.964377403259277, "global_step": 71281, "epoch": 1697} {"train_loss": -5.98109245300293, "global_step": 71282, "epoch": 1697} {"train_loss": -5.9493021965026855, "global_step": 71283, "epoch": 1697} {"train_loss": -5.913562774658203, "global_step": 71284, "epoch": 1697} {"train_loss": -5.919846534729004, "global_step": 71285, "epoch": 1697} {"train_loss": -5.997745513916016, "global_step": 71286, "epoch": 1697} {"train_loss": -6.105991840362549, "global_step": 71287, "epoch": 1697} {"train_loss": -5.944974422454834, "global_step": 71288, "epoch": 1697} {"train_loss": -6.009243965148926, "global_step": 71289, "epoch": 1697} {"train_loss": -6.123763084411621, "global_step": 71290, "epoch": 1697} {"train_loss": -6.097352027893066, "global_step": 71291, "epoch": 1697} {"train_loss": -6.04079008102417, "global_step": 71292, "epoch": 1697} {"train_loss": -5.926845073699951, "global_step": 71293, "epoch": 1697} {"train_loss": -5.990875244140625, "global_step": 71294, "epoch": 1697} {"train_loss": -5.981104373931885, "global_step": 71295, "epoch": 1697} {"train_loss": -6.070737838745117, "global_step": 71296, "epoch": 1697} {"train_loss": -6.011909484863281, "global_step": 71297, "epoch": 1697} {"train_loss": -6.054760932922363, "global_step": 71298, "epoch": 1697} {"train_loss": -5.981149196624756, "global_step": 71299, "epoch": 1697} {"train_loss": -5.949158191680908, "global_step": 71300, "epoch": 1697} {"train_loss": -5.991443157196045, "global_step": 71301, "epoch": 1697} {"train_loss": -6.01230525970459, "global_step": 71302, "epoch": 1697} {"train_loss": -6.045469760894775, "global_step": 71303, "epoch": 1697} {"train_loss": -5.955803394317627, "global_step": 71304, "epoch": 1697} {"train_loss": -5.971529960632324, "global_step": 71305, "epoch": 1697} {"train_loss": -6.111248016357422, "global_step": 71306, "epoch": 1697} {"train_loss": -6.081961631774902, "global_step": 71307, "epoch": 1697} {"train_loss": -6.0608415603637695, "global_step": 71308, "epoch": 1697} {"train_loss": -6.029751777648926, "global_step": 71309, "epoch": 1697} {"train_loss": -5.971802711486816, "global_step": 71310, "epoch": 1697} {"train_loss": -6.11057710647583, "global_step": 71311, "epoch": 1697} {"train_loss": -6.091774940490723, "global_step": 71312, "epoch": 1697} {"train_loss": -6.073724746704102, "global_step": 71313, "epoch": 1697} {"train_loss": -5.991892337799072, "global_step": 71314, "epoch": 1697} {"train_loss": -6.0293333530426025, "global_step": 71315, "epoch": 1697, "val_loss": 61659.859375} {"train_loss": -6.031702995300293, "global_step": 71316, "epoch": 1698} {"train_loss": -6.164050102233887, "global_step": 71317, "epoch": 1698} {"train_loss": -6.138834476470947, "global_step": 71318, "epoch": 1698} {"train_loss": -6.00568962097168, "global_step": 71319, "epoch": 1698} {"train_loss": -6.052215576171875, "global_step": 71320, "epoch": 1698} {"train_loss": -6.001197338104248, "global_step": 71321, "epoch": 1698} {"train_loss": -5.995786666870117, "global_step": 71322, "epoch": 1698} {"train_loss": -6.13840389251709, "global_step": 71323, "epoch": 1698} {"train_loss": -6.067487716674805, "global_step": 71324, "epoch": 1698} {"train_loss": -6.13752555847168, "global_step": 71325, "epoch": 1698} {"train_loss": -5.929123878479004, "global_step": 71326, "epoch": 1698} {"train_loss": -5.988831520080566, "global_step": 71327, "epoch": 1698} {"train_loss": -6.173986434936523, "global_step": 71328, "epoch": 1698} {"train_loss": -6.1617889404296875, "global_step": 71329, "epoch": 1698} {"train_loss": -6.085694313049316, "global_step": 71330, "epoch": 1698} {"train_loss": -6.098920822143555, "global_step": 71331, "epoch": 1698} {"train_loss": -6.092441558837891, "global_step": 71332, "epoch": 1698} {"train_loss": -6.012012481689453, "global_step": 71333, "epoch": 1698} {"train_loss": -6.126441955566406, "global_step": 71334, "epoch": 1698} {"train_loss": -6.014210224151611, "global_step": 71335, "epoch": 1698} {"train_loss": -6.056819915771484, "global_step": 71336, "epoch": 1698} {"train_loss": -6.158679008483887, "global_step": 71337, "epoch": 1698} {"train_loss": -6.018592834472656, "global_step": 71338, "epoch": 1698} {"train_loss": -6.035259246826172, "global_step": 71339, "epoch": 1698} {"train_loss": -6.200255393981934, "global_step": 71340, "epoch": 1698} {"train_loss": -6.000100135803223, "global_step": 71341, "epoch": 1698} {"train_loss": -6.1504669189453125, "global_step": 71342, "epoch": 1698} {"train_loss": -5.99776554107666, "global_step": 71343, "epoch": 1698} {"train_loss": -6.0658369064331055, "global_step": 71344, "epoch": 1698} {"train_loss": -5.94936466217041, "global_step": 71345, "epoch": 1698} {"train_loss": -6.020485877990723, "global_step": 71346, "epoch": 1698} {"train_loss": -6.006833553314209, "global_step": 71347, "epoch": 1698} {"train_loss": -5.969350814819336, "global_step": 71348, "epoch": 1698} {"train_loss": -6.019712924957275, "global_step": 71349, "epoch": 1698} {"train_loss": -6.090672016143799, "global_step": 71350, "epoch": 1698} {"train_loss": -6.084527015686035, "global_step": 71351, "epoch": 1698} {"train_loss": -6.020199775695801, "global_step": 71352, "epoch": 1698} {"train_loss": -6.085760116577148, "global_step": 71353, "epoch": 1698} {"train_loss": -6.058843612670898, "global_step": 71354, "epoch": 1698} {"train_loss": -6.118292331695557, "global_step": 71355, "epoch": 1698} {"train_loss": -6.047850608825684, "global_step": 71356, "epoch": 1698} {"train_loss": -6.063047170639038, "global_step": 71357, "epoch": 1698, "val_loss": 62103.33984375} {"train_loss": -6.116863250732422, "global_step": 71358, "epoch": 1699} {"train_loss": -6.020933628082275, "global_step": 71359, "epoch": 1699} {"train_loss": -6.062169075012207, "global_step": 71360, "epoch": 1699} {"train_loss": -6.096279144287109, "global_step": 71361, "epoch": 1699} {"train_loss": -6.161961555480957, "global_step": 71362, "epoch": 1699} {"train_loss": -5.991227626800537, "global_step": 71363, "epoch": 1699} {"train_loss": -6.015037536621094, "global_step": 71364, "epoch": 1699} {"train_loss": -5.983609676361084, "global_step": 71365, "epoch": 1699} {"train_loss": -6.060644626617432, "global_step": 71366, "epoch": 1699} {"train_loss": -6.060932159423828, "global_step": 71367, "epoch": 1699} {"train_loss": -5.991573810577393, "global_step": 71368, "epoch": 1699} {"train_loss": -6.201637268066406, "global_step": 71369, "epoch": 1699} {"train_loss": -6.08836555480957, "global_step": 71370, "epoch": 1699} {"train_loss": -6.168596267700195, "global_step": 71371, "epoch": 1699} {"train_loss": -5.986453056335449, "global_step": 71372, "epoch": 1699} {"train_loss": -6.014801025390625, "global_step": 71373, "epoch": 1699} {"train_loss": -6.017508029937744, "global_step": 71374, "epoch": 1699} {"train_loss": -6.032155513763428, "global_step": 71375, "epoch": 1699} {"train_loss": -6.072487831115723, "global_step": 71376, "epoch": 1699} {"train_loss": -6.097922325134277, "global_step": 71377, "epoch": 1699} {"train_loss": -6.0097270011901855, "global_step": 71378, "epoch": 1699} {"train_loss": -5.962871551513672, "global_step": 71379, "epoch": 1699} {"train_loss": -5.925911903381348, "global_step": 71380, "epoch": 1699} {"train_loss": -5.954336166381836, "global_step": 71381, "epoch": 1699} {"train_loss": -6.02840518951416, "global_step": 71382, "epoch": 1699} {"train_loss": -6.029355049133301, "global_step": 71383, "epoch": 1699} {"train_loss": -6.013408184051514, "global_step": 71384, "epoch": 1699} {"train_loss": -5.9587812423706055, "global_step": 71385, "epoch": 1699} {"train_loss": -6.154522895812988, "global_step": 71386, "epoch": 1699} {"train_loss": -6.058539390563965, "global_step": 71387, "epoch": 1699} {"train_loss": -5.8977508544921875, "global_step": 71388, "epoch": 1699} {"train_loss": -6.136794567108154, "global_step": 71389, "epoch": 1699} {"train_loss": -6.099233150482178, "global_step": 71390, "epoch": 1699} {"train_loss": -5.940436840057373, "global_step": 71391, "epoch": 1699} {"train_loss": -6.042031764984131, "global_step": 71392, "epoch": 1699} {"train_loss": -5.895044803619385, "global_step": 71393, "epoch": 1699} {"train_loss": -5.8346452713012695, "global_step": 71394, "epoch": 1699} {"train_loss": -5.919368743896484, "global_step": 71395, "epoch": 1699} {"train_loss": -6.01060676574707, "global_step": 71396, "epoch": 1699} {"train_loss": -6.006800651550293, "global_step": 71397, "epoch": 1699} {"train_loss": -6.058687686920166, "global_step": 71398, "epoch": 1699} {"train_loss": -6.028630881082444, "global_step": 71399, "epoch": 1699, "val_loss": 61550.23046875} {"train_loss": -5.993356704711914, "global_step": 71400, "epoch": 1700} {"train_loss": -6.1179304122924805, "global_step": 71401, "epoch": 1700} {"train_loss": -6.0758514404296875, "global_step": 71402, "epoch": 1700} {"train_loss": -6.019330978393555, "global_step": 71403, "epoch": 1700} {"train_loss": -6.061565399169922, "global_step": 71404, "epoch": 1700} {"train_loss": -6.04135274887085, "global_step": 71405, "epoch": 1700} {"train_loss": -5.971672058105469, "global_step": 71406, "epoch": 1700} {"train_loss": -6.1208906173706055, "global_step": 71407, "epoch": 1700} {"train_loss": -6.072352409362793, "global_step": 71408, "epoch": 1700} {"train_loss": -5.929570198059082, "global_step": 71409, "epoch": 1700} {"train_loss": -6.119637966156006, "global_step": 71410, "epoch": 1700} {"train_loss": -5.9385762214660645, "global_step": 71411, "epoch": 1700} {"train_loss": -5.967188835144043, "global_step": 71412, "epoch": 1700} {"train_loss": -6.028678894042969, "global_step": 71413, "epoch": 1700} {"train_loss": -5.943222999572754, "global_step": 71414, "epoch": 1700} {"train_loss": -5.826179504394531, "global_step": 71415, "epoch": 1700} {"train_loss": -6.038201332092285, "global_step": 71416, "epoch": 1700} {"train_loss": -6.025968551635742, "global_step": 71417, "epoch": 1700} {"train_loss": -5.873171806335449, "global_step": 71418, "epoch": 1700} {"train_loss": -5.969385147094727, "global_step": 71419, "epoch": 1700} {"train_loss": -6.074956893920898, "global_step": 71420, "epoch": 1700} {"train_loss": -5.973793029785156, "global_step": 71421, "epoch": 1700} {"train_loss": -5.985530853271484, "global_step": 71422, "epoch": 1700} {"train_loss": -6.013762950897217, "global_step": 71423, "epoch": 1700} {"train_loss": -6.012345314025879, "global_step": 71424, "epoch": 1700} {"train_loss": -6.007795810699463, "global_step": 71425, "epoch": 1700} {"train_loss": -5.977415084838867, "global_step": 71426, "epoch": 1700} {"train_loss": -5.860977649688721, "global_step": 71427, "epoch": 1700} {"train_loss": -5.995077133178711, "global_step": 71428, "epoch": 1700} {"train_loss": -6.160848617553711, "global_step": 71429, "epoch": 1700} {"train_loss": -6.040699005126953, "global_step": 71430, "epoch": 1700} {"train_loss": -5.953974723815918, "global_step": 71431, "epoch": 1700} {"train_loss": -5.886294364929199, "global_step": 71432, "epoch": 1700} {"train_loss": -5.962340354919434, "global_step": 71433, "epoch": 1700} {"train_loss": -5.968747138977051, "global_step": 71434, "epoch": 1700} {"train_loss": -5.911929130554199, "global_step": 71435, "epoch": 1700} {"train_loss": -5.973309516906738, "global_step": 71436, "epoch": 1700} {"train_loss": -6.0831427574157715, "global_step": 71437, "epoch": 1700} {"train_loss": -6.001034736633301, "global_step": 71438, "epoch": 1700} {"train_loss": -6.1579179763793945, "global_step": 71439, "epoch": 1700} {"train_loss": -5.955977439880371, "global_step": 71440, "epoch": 1700} {"train_loss": -6.00310620807466, "global_step": 71441, "epoch": 1700, "train/sim_max_reward_0": 0.8928191334282826, "train/sim_max_reward_1": 0.28581274181377175, "train/sim_max_reward_2": 0.6980854959156748, "train/sim_max_reward_3": 0.15629031309131702, "train/sim_max_reward_4": 0.8551122969911574, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.38374157923640373, "test/sim_max_reward_4300001": 0.5080561245257008, "test/sim_max_reward_4300002": 0.9832900671062991, "test/sim_max_reward_4300003": 0.9106880164400291, "test/sim_max_reward_4300004": 0.9845048891378401, "test/sim_max_reward_4300005": 0.42056091079659474, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3678899621251318, "test/sim_max_reward_4300008": 0.5112609123086571, "test/sim_max_reward_4300009": 0.8393442675933528, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.8902651928898131, "test/sim_max_reward_4300012": 0.8694805006149388, "test/sim_max_reward_4300013": 0.41282772043923205, "test/sim_max_reward_4300014": 0.9362008553989221, "test/sim_max_reward_4300015": 0.8814215727686097, "test/sim_max_reward_4300016": 0.9085449276087515, "test/sim_max_reward_4300017": 0.8573890005531812, "test/sim_max_reward_4300018": 0.38574334275576155, "test/sim_max_reward_4300019": 0.1867959234411197, "test/sim_max_reward_4300020": 0.8583320949310127, "test/sim_max_reward_4300021": 1.0, "test/sim_max_reward_4300022": 0.797952768816592, "test/sim_max_reward_4300023": 0.33046796018872504, "test/sim_max_reward_4300024": 0.024389292646722557, "test/sim_max_reward_4300025": 0.565782775751901, "test/sim_max_reward_4300026": 0.847101619492622, "test/sim_max_reward_4300027": 0.8384197077799888, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.924844804856734, "test/sim_max_reward_4300030": 0.00611325477482507, "test/sim_max_reward_4300031": 0.20858050620919683, "test/sim_max_reward_4300032": 0.8137877469178876, "test/sim_max_reward_4300033": 0.530533940465193, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.24389915231729437, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 1.0, "test/sim_max_reward_4300038": 0.5670159474865769, "test/sim_max_reward_4300039": 0.9320737964701054, "test/sim_max_reward_4300040": 0.855301180767051, "test/sim_max_reward_4300041": 0.9830649013960812, "test/sim_max_reward_4300042": 0.8499852653733867, "test/sim_max_reward_4300043": 0.17245814207504243, "test/sim_max_reward_4300044": 0.6989744091254846, "test/sim_max_reward_4300045": 0.18197828021695922, "test/sim_max_reward_4300046": 0.5919047476278176, "test/sim_max_reward_4300047": 0.9075424380687892, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.23267160109284665, "train/mean_score": 0.5135174567670652, "test/mean_score": 0.568007524323053, "val_loss": 61870.6875} {"train_loss": -6.062406539916992, "global_step": 71442, "epoch": 1701} {"train_loss": -6.031797409057617, "global_step": 71443, "epoch": 1701} {"train_loss": -6.044942378997803, "global_step": 71444, "epoch": 1701} {"train_loss": -5.997465133666992, "global_step": 71445, "epoch": 1701} {"train_loss": -5.959323883056641, "global_step": 71446, "epoch": 1701} {"train_loss": -6.129568099975586, "global_step": 71447, "epoch": 1701} {"train_loss": -5.933870315551758, "global_step": 71448, "epoch": 1701} {"train_loss": -6.059512138366699, "global_step": 71449, "epoch": 1701} {"train_loss": -6.052543640136719, "global_step": 71450, "epoch": 1701} {"train_loss": -6.126360893249512, "global_step": 71451, "epoch": 1701} {"train_loss": -6.123323917388916, "global_step": 71452, "epoch": 1701} {"train_loss": -6.064828872680664, "global_step": 71453, "epoch": 1701} {"train_loss": -5.995630264282227, "global_step": 71454, "epoch": 1701} {"train_loss": -6.066395282745361, "global_step": 71455, "epoch": 1701} {"train_loss": -6.1202392578125, "global_step": 71456, "epoch": 1701} {"train_loss": -6.06634521484375, "global_step": 71457, "epoch": 1701} {"train_loss": -6.146568775177002, "global_step": 71458, "epoch": 1701} {"train_loss": -5.953167915344238, "global_step": 71459, "epoch": 1701} {"train_loss": -6.006951332092285, "global_step": 71460, "epoch": 1701} {"train_loss": -6.0840301513671875, "global_step": 71461, "epoch": 1701} {"train_loss": -5.983058452606201, "global_step": 71462, "epoch": 1701} {"train_loss": -6.204153060913086, "global_step": 71463, "epoch": 1701} {"train_loss": -5.9252119064331055, "global_step": 71464, "epoch": 1701} {"train_loss": -5.9148969650268555, "global_step": 71465, "epoch": 1701} {"train_loss": -6.0651702880859375, "global_step": 71466, "epoch": 1701} {"train_loss": -6.061183452606201, "global_step": 71467, "epoch": 1701} {"train_loss": -6.062127113342285, "global_step": 71468, "epoch": 1701} {"train_loss": -6.059479713439941, "global_step": 71469, "epoch": 1701} {"train_loss": -6.034158706665039, "global_step": 71470, "epoch": 1701} {"train_loss": -6.063692092895508, "global_step": 71471, "epoch": 1701} {"train_loss": -5.996537208557129, "global_step": 71472, "epoch": 1701} {"train_loss": -6.03037166595459, "global_step": 71473, "epoch": 1701} {"train_loss": -5.974593639373779, "global_step": 71474, "epoch": 1701} {"train_loss": -6.062258243560791, "global_step": 71475, "epoch": 1701} {"train_loss": -5.939977645874023, "global_step": 71476, "epoch": 1701} {"train_loss": -6.014371871948242, "global_step": 71477, "epoch": 1701} {"train_loss": -6.088202953338623, "global_step": 71478, "epoch": 1701} {"train_loss": -5.992397308349609, "global_step": 71479, "epoch": 1701} {"train_loss": -6.039979934692383, "global_step": 71480, "epoch": 1701} {"train_loss": -6.092533111572266, "global_step": 71481, "epoch": 1701} {"train_loss": -5.94630241394043, "global_step": 71482, "epoch": 1701} {"train_loss": -6.0380932830628895, "global_step": 71483, "epoch": 1701, "val_loss": 61680.59375} {"train_loss": -6.0559492111206055, "global_step": 71484, "epoch": 1702} {"train_loss": -6.109970569610596, "global_step": 71485, "epoch": 1702} {"train_loss": -6.091712951660156, "global_step": 71486, "epoch": 1702} {"train_loss": -6.085504055023193, "global_step": 71487, "epoch": 1702} {"train_loss": -6.08330774307251, "global_step": 71488, "epoch": 1702} {"train_loss": -6.064278602600098, "global_step": 71489, "epoch": 1702} {"train_loss": -6.0744309425354, "global_step": 71490, "epoch": 1702} {"train_loss": -6.130527496337891, "global_step": 71491, "epoch": 1702} {"train_loss": -6.091156959533691, "global_step": 71492, "epoch": 1702} {"train_loss": -6.117652893066406, "global_step": 71493, "epoch": 1702} {"train_loss": -6.082428932189941, "global_step": 71494, "epoch": 1702} {"train_loss": -6.119946479797363, "global_step": 71495, "epoch": 1702} {"train_loss": -6.0903778076171875, "global_step": 71496, "epoch": 1702} {"train_loss": -6.159449100494385, "global_step": 71497, "epoch": 1702} {"train_loss": -6.075265884399414, "global_step": 71498, "epoch": 1702} {"train_loss": -6.130077362060547, "global_step": 71499, "epoch": 1702} {"train_loss": -6.1985673904418945, "global_step": 71500, "epoch": 1702} {"train_loss": -6.000358581542969, "global_step": 71501, "epoch": 1702} {"train_loss": -5.98423957824707, "global_step": 71502, "epoch": 1702} {"train_loss": -6.087908744812012, "global_step": 71503, "epoch": 1702} {"train_loss": -6.03167200088501, "global_step": 71504, "epoch": 1702} {"train_loss": -6.053407669067383, "global_step": 71505, "epoch": 1702} {"train_loss": -6.004655838012695, "global_step": 71506, "epoch": 1702} {"train_loss": -6.101133346557617, "global_step": 71507, "epoch": 1702} {"train_loss": -6.163324356079102, "global_step": 71508, "epoch": 1702} {"train_loss": -6.081118583679199, "global_step": 71509, "epoch": 1702} {"train_loss": -6.096053123474121, "global_step": 71510, "epoch": 1702} {"train_loss": -6.0970306396484375, "global_step": 71511, "epoch": 1702} {"train_loss": -5.988584518432617, "global_step": 71512, "epoch": 1702} {"train_loss": -6.108964443206787, "global_step": 71513, "epoch": 1702} {"train_loss": -6.070681095123291, "global_step": 71514, "epoch": 1702} {"train_loss": -5.947562217712402, "global_step": 71515, "epoch": 1702} {"train_loss": -5.990120887756348, "global_step": 71516, "epoch": 1702} {"train_loss": -5.924283504486084, "global_step": 71517, "epoch": 1702} {"train_loss": -5.95772647857666, "global_step": 71518, "epoch": 1702} {"train_loss": -6.042131423950195, "global_step": 71519, "epoch": 1702} {"train_loss": -6.004820823669434, "global_step": 71520, "epoch": 1702} {"train_loss": -5.9362921714782715, "global_step": 71521, "epoch": 1702} {"train_loss": -6.019747734069824, "global_step": 71522, "epoch": 1702} {"train_loss": -6.018588066101074, "global_step": 71523, "epoch": 1702} {"train_loss": -6.050902366638184, "global_step": 71524, "epoch": 1702} {"train_loss": -6.061382668358939, "global_step": 71525, "epoch": 1702, "val_loss": 61787.37890625} {"train_loss": -5.958310604095459, "global_step": 71526, "epoch": 1703} {"train_loss": -5.935301780700684, "global_step": 71527, "epoch": 1703} {"train_loss": -6.060021877288818, "global_step": 71528, "epoch": 1703} {"train_loss": -6.123340606689453, "global_step": 71529, "epoch": 1703} {"train_loss": -6.011325836181641, "global_step": 71530, "epoch": 1703} {"train_loss": -6.088896751403809, "global_step": 71531, "epoch": 1703} {"train_loss": -6.0703935623168945, "global_step": 71532, "epoch": 1703} {"train_loss": -6.01419734954834, "global_step": 71533, "epoch": 1703} {"train_loss": -5.971733570098877, "global_step": 71534, "epoch": 1703} {"train_loss": -5.954809665679932, "global_step": 71535, "epoch": 1703} {"train_loss": -6.012186527252197, "global_step": 71536, "epoch": 1703} {"train_loss": -5.967822551727295, "global_step": 71537, "epoch": 1703} {"train_loss": -6.152081489562988, "global_step": 71538, "epoch": 1703} {"train_loss": -6.010752201080322, "global_step": 71539, "epoch": 1703} {"train_loss": -5.9241132736206055, "global_step": 71540, "epoch": 1703} {"train_loss": -6.07045841217041, "global_step": 71541, "epoch": 1703} {"train_loss": -6.086215972900391, "global_step": 71542, "epoch": 1703} {"train_loss": -5.935750961303711, "global_step": 71543, "epoch": 1703} {"train_loss": -5.969851493835449, "global_step": 71544, "epoch": 1703} {"train_loss": -6.05704402923584, "global_step": 71545, "epoch": 1703} {"train_loss": -6.07033109664917, "global_step": 71546, "epoch": 1703} {"train_loss": -5.874489784240723, "global_step": 71547, "epoch": 1703} {"train_loss": -6.051085948944092, "global_step": 71548, "epoch": 1703} {"train_loss": -6.022279739379883, "global_step": 71549, "epoch": 1703} {"train_loss": -6.022927284240723, "global_step": 71550, "epoch": 1703} {"train_loss": -6.006795883178711, "global_step": 71551, "epoch": 1703} {"train_loss": -5.907697677612305, "global_step": 71552, "epoch": 1703} {"train_loss": -6.096343517303467, "global_step": 71553, "epoch": 1703} {"train_loss": -6.042580604553223, "global_step": 71554, "epoch": 1703} {"train_loss": -6.118394374847412, "global_step": 71555, "epoch": 1703} {"train_loss": -6.069940567016602, "global_step": 71556, "epoch": 1703} {"train_loss": -6.072505474090576, "global_step": 71557, "epoch": 1703} {"train_loss": -6.006401062011719, "global_step": 71558, "epoch": 1703} {"train_loss": -6.015721321105957, "global_step": 71559, "epoch": 1703} {"train_loss": -6.089875221252441, "global_step": 71560, "epoch": 1703} {"train_loss": -6.053040504455566, "global_step": 71561, "epoch": 1703} {"train_loss": -6.083131790161133, "global_step": 71562, "epoch": 1703} {"train_loss": -6.010798454284668, "global_step": 71563, "epoch": 1703} {"train_loss": -6.089067459106445, "global_step": 71564, "epoch": 1703} {"train_loss": -6.086810111999512, "global_step": 71565, "epoch": 1703} {"train_loss": -6.146627426147461, "global_step": 71566, "epoch": 1703} {"train_loss": -6.033014865148635, "global_step": 71567, "epoch": 1703, "val_loss": 61687.04296875} {"train_loss": -6.081179618835449, "global_step": 71568, "epoch": 1704} {"train_loss": -6.089885711669922, "global_step": 71569, "epoch": 1704} {"train_loss": -6.020743370056152, "global_step": 71570, "epoch": 1704} {"train_loss": -6.197273254394531, "global_step": 71571, "epoch": 1704} {"train_loss": -6.162158012390137, "global_step": 71572, "epoch": 1704} {"train_loss": -6.008787155151367, "global_step": 71573, "epoch": 1704} {"train_loss": -5.997159004211426, "global_step": 71574, "epoch": 1704} {"train_loss": -6.0675129890441895, "global_step": 71575, "epoch": 1704} {"train_loss": -6.093031406402588, "global_step": 71576, "epoch": 1704} {"train_loss": -5.905195236206055, "global_step": 71577, "epoch": 1704} {"train_loss": -6.12138032913208, "global_step": 71578, "epoch": 1704} {"train_loss": -6.124354839324951, "global_step": 71579, "epoch": 1704} {"train_loss": -5.986808776855469, "global_step": 71580, "epoch": 1704} {"train_loss": -6.109660625457764, "global_step": 71581, "epoch": 1704} {"train_loss": -6.093044281005859, "global_step": 71582, "epoch": 1704} {"train_loss": -6.126148700714111, "global_step": 71583, "epoch": 1704} {"train_loss": -6.110072612762451, "global_step": 71584, "epoch": 1704} {"train_loss": -6.103320598602295, "global_step": 71585, "epoch": 1704} {"train_loss": -6.1101202964782715, "global_step": 71586, "epoch": 1704} {"train_loss": -6.046452522277832, "global_step": 71587, "epoch": 1704} {"train_loss": -5.966272830963135, "global_step": 71588, "epoch": 1704} {"train_loss": -6.040289878845215, "global_step": 71589, "epoch": 1704} {"train_loss": -6.083691596984863, "global_step": 71590, "epoch": 1704} {"train_loss": -6.065034866333008, "global_step": 71591, "epoch": 1704} {"train_loss": -6.1531572341918945, "global_step": 71592, "epoch": 1704} {"train_loss": -6.098779201507568, "global_step": 71593, "epoch": 1704} {"train_loss": -5.997429847717285, "global_step": 71594, "epoch": 1704} {"train_loss": -6.094756126403809, "global_step": 71595, "epoch": 1704} {"train_loss": -6.0376410484313965, "global_step": 71596, "epoch": 1704} {"train_loss": -5.930917739868164, "global_step": 71597, "epoch": 1704} {"train_loss": -6.051321983337402, "global_step": 71598, "epoch": 1704} {"train_loss": -5.9536895751953125, "global_step": 71599, "epoch": 1704} {"train_loss": -6.052574157714844, "global_step": 71600, "epoch": 1704} {"train_loss": -6.137106895446777, "global_step": 71601, "epoch": 1704} {"train_loss": -5.985664367675781, "global_step": 71602, "epoch": 1704} {"train_loss": -6.068782329559326, "global_step": 71603, "epoch": 1704} {"train_loss": -5.959173679351807, "global_step": 71604, "epoch": 1704} {"train_loss": -5.920557975769043, "global_step": 71605, "epoch": 1704} {"train_loss": -6.057535171508789, "global_step": 71606, "epoch": 1704} {"train_loss": -6.1482768058776855, "global_step": 71607, "epoch": 1704} {"train_loss": -6.099998474121094, "global_step": 71608, "epoch": 1704} {"train_loss": -6.0611357007707864, "global_step": 71609, "epoch": 1704, "val_loss": 61833.84765625} {"train_loss": -6.023197650909424, "global_step": 71610, "epoch": 1705} {"train_loss": -5.954418659210205, "global_step": 71611, "epoch": 1705} {"train_loss": -5.914916038513184, "global_step": 71612, "epoch": 1705} {"train_loss": -6.083434581756592, "global_step": 71613, "epoch": 1705} {"train_loss": -6.112791061401367, "global_step": 71614, "epoch": 1705} {"train_loss": -6.011822700500488, "global_step": 71615, "epoch": 1705} {"train_loss": -6.120987415313721, "global_step": 71616, "epoch": 1705} {"train_loss": -5.999717712402344, "global_step": 71617, "epoch": 1705} {"train_loss": -6.056155204772949, "global_step": 71618, "epoch": 1705} {"train_loss": -6.0003204345703125, "global_step": 71619, "epoch": 1705} {"train_loss": -6.100546360015869, "global_step": 71620, "epoch": 1705} {"train_loss": -5.995079040527344, "global_step": 71621, "epoch": 1705} {"train_loss": -6.089039325714111, "global_step": 71622, "epoch": 1705} {"train_loss": -6.050601959228516, "global_step": 71623, "epoch": 1705} {"train_loss": -6.060274124145508, "global_step": 71624, "epoch": 1705} {"train_loss": -5.957908630371094, "global_step": 71625, "epoch": 1705} {"train_loss": -6.007116317749023, "global_step": 71626, "epoch": 1705} {"train_loss": -5.954834938049316, "global_step": 71627, "epoch": 1705} {"train_loss": -6.08461856842041, "global_step": 71628, "epoch": 1705} {"train_loss": -5.985543251037598, "global_step": 71629, "epoch": 1705} {"train_loss": -5.97772741317749, "global_step": 71630, "epoch": 1705} {"train_loss": -6.079453468322754, "global_step": 71631, "epoch": 1705} {"train_loss": -5.8166961669921875, "global_step": 71632, "epoch": 1705} {"train_loss": -5.9358978271484375, "global_step": 71633, "epoch": 1705} {"train_loss": -5.9603376388549805, "global_step": 71634, "epoch": 1705} {"train_loss": -5.985877990722656, "global_step": 71635, "epoch": 1705} {"train_loss": -5.977879524230957, "global_step": 71636, "epoch": 1705} {"train_loss": -5.979422569274902, "global_step": 71637, "epoch": 1705} {"train_loss": -6.078027725219727, "global_step": 71638, "epoch": 1705} {"train_loss": -6.062257766723633, "global_step": 71639, "epoch": 1705} {"train_loss": -5.946155548095703, "global_step": 71640, "epoch": 1705} {"train_loss": -5.9350128173828125, "global_step": 71641, "epoch": 1705} {"train_loss": -6.110827922821045, "global_step": 71642, "epoch": 1705} {"train_loss": -5.985069274902344, "global_step": 71643, "epoch": 1705} {"train_loss": -6.090728282928467, "global_step": 71644, "epoch": 1705} {"train_loss": -6.053229331970215, "global_step": 71645, "epoch": 1705} {"train_loss": -5.9752397537231445, "global_step": 71646, "epoch": 1705} {"train_loss": -5.96810245513916, "global_step": 71647, "epoch": 1705} {"train_loss": -6.066137313842773, "global_step": 71648, "epoch": 1705} {"train_loss": -6.07588529586792, "global_step": 71649, "epoch": 1705} {"train_loss": -6.107215881347656, "global_step": 71650, "epoch": 1705} {"train_loss": -6.016391981215704, "global_step": 71651, "epoch": 1705, "val_loss": 61627.28125} {"train_loss": -6.037038803100586, "global_step": 71652, "epoch": 1706} {"train_loss": -6.030601501464844, "global_step": 71653, "epoch": 1706} {"train_loss": -6.017538070678711, "global_step": 71654, "epoch": 1706} {"train_loss": -6.072057723999023, "global_step": 71655, "epoch": 1706} {"train_loss": -6.1810832023620605, "global_step": 71656, "epoch": 1706} {"train_loss": -6.073383331298828, "global_step": 71657, "epoch": 1706} {"train_loss": -6.071881294250488, "global_step": 71658, "epoch": 1706} {"train_loss": -6.0193867683410645, "global_step": 71659, "epoch": 1706} {"train_loss": -6.052783966064453, "global_step": 71660, "epoch": 1706} {"train_loss": -6.096269130706787, "global_step": 71661, "epoch": 1706} {"train_loss": -6.024049758911133, "global_step": 71662, "epoch": 1706} {"train_loss": -6.030548095703125, "global_step": 71663, "epoch": 1706} {"train_loss": -6.039758205413818, "global_step": 71664, "epoch": 1706} {"train_loss": -6.066463470458984, "global_step": 71665, "epoch": 1706} {"train_loss": -6.042716979980469, "global_step": 71666, "epoch": 1706} {"train_loss": -6.091443061828613, "global_step": 71667, "epoch": 1706} {"train_loss": -6.056037425994873, "global_step": 71668, "epoch": 1706} {"train_loss": -6.022030353546143, "global_step": 71669, "epoch": 1706} {"train_loss": -5.94072151184082, "global_step": 71670, "epoch": 1706} {"train_loss": -5.981902599334717, "global_step": 71671, "epoch": 1706} {"train_loss": -5.877938270568848, "global_step": 71672, "epoch": 1706} {"train_loss": -6.018424987792969, "global_step": 71673, "epoch": 1706} {"train_loss": -6.1485137939453125, "global_step": 71674, "epoch": 1706} {"train_loss": -6.049927711486816, "global_step": 71675, "epoch": 1706} {"train_loss": -6.138266563415527, "global_step": 71676, "epoch": 1706} {"train_loss": -6.011116027832031, "global_step": 71677, "epoch": 1706} {"train_loss": -6.150843620300293, "global_step": 71678, "epoch": 1706} {"train_loss": -6.006892204284668, "global_step": 71679, "epoch": 1706} {"train_loss": -6.054549217224121, "global_step": 71680, "epoch": 1706} {"train_loss": -6.055194854736328, "global_step": 71681, "epoch": 1706} {"train_loss": -6.032539367675781, "global_step": 71682, "epoch": 1706} {"train_loss": -6.005128860473633, "global_step": 71683, "epoch": 1706} {"train_loss": -6.065423011779785, "global_step": 71684, "epoch": 1706} {"train_loss": -6.0413360595703125, "global_step": 71685, "epoch": 1706} {"train_loss": -6.036960601806641, "global_step": 71686, "epoch": 1706} {"train_loss": -6.030889987945557, "global_step": 71687, "epoch": 1706} {"train_loss": -6.074463844299316, "global_step": 71688, "epoch": 1706} {"train_loss": -6.083134651184082, "global_step": 71689, "epoch": 1706} {"train_loss": -6.029386043548584, "global_step": 71690, "epoch": 1706} {"train_loss": -6.009541034698486, "global_step": 71691, "epoch": 1706} {"train_loss": -6.106729507446289, "global_step": 71692, "epoch": 1706} {"train_loss": -6.0466290428524925, "global_step": 71693, "epoch": 1706, "val_loss": 61812.56640625} {"train_loss": -6.098027229309082, "global_step": 71694, "epoch": 1707} {"train_loss": -6.121781349182129, "global_step": 71695, "epoch": 1707} {"train_loss": -6.056366920471191, "global_step": 71696, "epoch": 1707} {"train_loss": -6.008904457092285, "global_step": 71697, "epoch": 1707} {"train_loss": -6.074967384338379, "global_step": 71698, "epoch": 1707} {"train_loss": -6.100452423095703, "global_step": 71699, "epoch": 1707} {"train_loss": -6.046808242797852, "global_step": 71700, "epoch": 1707} {"train_loss": -6.07258939743042, "global_step": 71701, "epoch": 1707} {"train_loss": -6.020956516265869, "global_step": 71702, "epoch": 1707} {"train_loss": -6.045436859130859, "global_step": 71703, "epoch": 1707} {"train_loss": -6.10560417175293, "global_step": 71704, "epoch": 1707} {"train_loss": -6.159675121307373, "global_step": 71705, "epoch": 1707} {"train_loss": -6.040764808654785, "global_step": 71706, "epoch": 1707} {"train_loss": -6.061585426330566, "global_step": 71707, "epoch": 1707} {"train_loss": -6.056333065032959, "global_step": 71708, "epoch": 1707} {"train_loss": -6.094660758972168, "global_step": 71709, "epoch": 1707} {"train_loss": -6.054802894592285, "global_step": 71710, "epoch": 1707} {"train_loss": -6.080202579498291, "global_step": 71711, "epoch": 1707} {"train_loss": -6.159552574157715, "global_step": 71712, "epoch": 1707} {"train_loss": -6.05338191986084, "global_step": 71713, "epoch": 1707} {"train_loss": -5.975675582885742, "global_step": 71714, "epoch": 1707} {"train_loss": -6.041787624359131, "global_step": 71715, "epoch": 1707} {"train_loss": -6.107278823852539, "global_step": 71716, "epoch": 1707} {"train_loss": -6.009809494018555, "global_step": 71717, "epoch": 1707} {"train_loss": -6.104971885681152, "global_step": 71718, "epoch": 1707} {"train_loss": -6.153570652008057, "global_step": 71719, "epoch": 1707} {"train_loss": -6.068056106567383, "global_step": 71720, "epoch": 1707} {"train_loss": -6.020555019378662, "global_step": 71721, "epoch": 1707} {"train_loss": -5.937755584716797, "global_step": 71722, "epoch": 1707} {"train_loss": -6.012905120849609, "global_step": 71723, "epoch": 1707} {"train_loss": -6.067559242248535, "global_step": 71724, "epoch": 1707} {"train_loss": -6.008007049560547, "global_step": 71725, "epoch": 1707} {"train_loss": -6.12991189956665, "global_step": 71726, "epoch": 1707} {"train_loss": -6.126110076904297, "global_step": 71727, "epoch": 1707} {"train_loss": -6.125225067138672, "global_step": 71728, "epoch": 1707} {"train_loss": -6.091939926147461, "global_step": 71729, "epoch": 1707} {"train_loss": -5.9887261390686035, "global_step": 71730, "epoch": 1707} {"train_loss": -5.964475631713867, "global_step": 71731, "epoch": 1707} {"train_loss": -6.070037841796875, "global_step": 71732, "epoch": 1707} {"train_loss": -6.025941371917725, "global_step": 71733, "epoch": 1707} {"train_loss": -6.070544719696045, "global_step": 71734, "epoch": 1707} {"train_loss": -6.061836458387829, "global_step": 71735, "epoch": 1707, "val_loss": 61666.2734375} {"train_loss": -6.055141925811768, "global_step": 71736, "epoch": 1708} {"train_loss": -6.128862380981445, "global_step": 71737, "epoch": 1708} {"train_loss": -5.991400718688965, "global_step": 71738, "epoch": 1708} {"train_loss": -6.067138671875, "global_step": 71739, "epoch": 1708} {"train_loss": -6.129490852355957, "global_step": 71740, "epoch": 1708} {"train_loss": -6.0545148849487305, "global_step": 71741, "epoch": 1708} {"train_loss": -6.1818647384643555, "global_step": 71742, "epoch": 1708} {"train_loss": -6.047567844390869, "global_step": 71743, "epoch": 1708} {"train_loss": -6.100124359130859, "global_step": 71744, "epoch": 1708} {"train_loss": -6.0927324295043945, "global_step": 71745, "epoch": 1708} {"train_loss": -6.130621910095215, "global_step": 71746, "epoch": 1708} {"train_loss": -6.132994651794434, "global_step": 71747, "epoch": 1708} {"train_loss": -6.089921474456787, "global_step": 71748, "epoch": 1708} {"train_loss": -6.172459602355957, "global_step": 71749, "epoch": 1708} {"train_loss": -6.097586154937744, "global_step": 71750, "epoch": 1708} {"train_loss": -6.0080437660217285, "global_step": 71751, "epoch": 1708} {"train_loss": -6.059528827667236, "global_step": 71752, "epoch": 1708} {"train_loss": -6.069173812866211, "global_step": 71753, "epoch": 1708} {"train_loss": -6.270326614379883, "global_step": 71754, "epoch": 1708} {"train_loss": -6.071247100830078, "global_step": 71755, "epoch": 1708} {"train_loss": -6.102968215942383, "global_step": 71756, "epoch": 1708} {"train_loss": -6.092255592346191, "global_step": 71757, "epoch": 1708} {"train_loss": -6.043444633483887, "global_step": 71758, "epoch": 1708} {"train_loss": -6.148171424865723, "global_step": 71759, "epoch": 1708} {"train_loss": -5.987580299377441, "global_step": 71760, "epoch": 1708} {"train_loss": -5.986442565917969, "global_step": 71761, "epoch": 1708} {"train_loss": -6.032675266265869, "global_step": 71762, "epoch": 1708} {"train_loss": -5.989775657653809, "global_step": 71763, "epoch": 1708} {"train_loss": -6.097202301025391, "global_step": 71764, "epoch": 1708} {"train_loss": -6.113058090209961, "global_step": 71765, "epoch": 1708} {"train_loss": -6.0163893699646, "global_step": 71766, "epoch": 1708} {"train_loss": -6.021551132202148, "global_step": 71767, "epoch": 1708} {"train_loss": -6.111827850341797, "global_step": 71768, "epoch": 1708} {"train_loss": -6.081546783447266, "global_step": 71769, "epoch": 1708} {"train_loss": -6.1155805587768555, "global_step": 71770, "epoch": 1708} {"train_loss": -5.966961860656738, "global_step": 71771, "epoch": 1708} {"train_loss": -5.816066265106201, "global_step": 71772, "epoch": 1708} {"train_loss": -5.969451904296875, "global_step": 71773, "epoch": 1708} {"train_loss": -6.091015815734863, "global_step": 71774, "epoch": 1708} {"train_loss": -6.0596089363098145, "global_step": 71775, "epoch": 1708} {"train_loss": -6.082649230957031, "global_step": 71776, "epoch": 1708} {"train_loss": -6.0720777738662, "global_step": 71777, "epoch": 1708, "val_loss": 61781.83203125} {"train_loss": -6.003714084625244, "global_step": 71778, "epoch": 1709} {"train_loss": -5.946225166320801, "global_step": 71779, "epoch": 1709} {"train_loss": -6.066646575927734, "global_step": 71780, "epoch": 1709} {"train_loss": -5.990011692047119, "global_step": 71781, "epoch": 1709} {"train_loss": -6.0086774826049805, "global_step": 71782, "epoch": 1709} {"train_loss": -5.974322319030762, "global_step": 71783, "epoch": 1709} {"train_loss": -6.038551330566406, "global_step": 71784, "epoch": 1709} {"train_loss": -5.932781219482422, "global_step": 71785, "epoch": 1709} {"train_loss": -5.967911243438721, "global_step": 71786, "epoch": 1709} {"train_loss": -6.048303604125977, "global_step": 71787, "epoch": 1709} {"train_loss": -6.092423439025879, "global_step": 71788, "epoch": 1709} {"train_loss": -5.963911056518555, "global_step": 71789, "epoch": 1709} {"train_loss": -6.026244163513184, "global_step": 71790, "epoch": 1709} {"train_loss": -6.0024614334106445, "global_step": 71791, "epoch": 1709} {"train_loss": -6.099676609039307, "global_step": 71792, "epoch": 1709} {"train_loss": -6.073660850524902, "global_step": 71793, "epoch": 1709} {"train_loss": -6.052244186401367, "global_step": 71794, "epoch": 1709} {"train_loss": -6.1177167892456055, "global_step": 71795, "epoch": 1709} {"train_loss": -5.961608409881592, "global_step": 71796, "epoch": 1709} {"train_loss": -6.0701398849487305, "global_step": 71797, "epoch": 1709} {"train_loss": -6.192424774169922, "global_step": 71798, "epoch": 1709} {"train_loss": -6.092504501342773, "global_step": 71799, "epoch": 1709} {"train_loss": -6.105749130249023, "global_step": 71800, "epoch": 1709} {"train_loss": -6.123469829559326, "global_step": 71801, "epoch": 1709} {"train_loss": -6.0490922927856445, "global_step": 71802, "epoch": 1709} {"train_loss": -6.103522777557373, "global_step": 71803, "epoch": 1709} {"train_loss": -6.075737953186035, "global_step": 71804, "epoch": 1709} {"train_loss": -6.056191921234131, "global_step": 71805, "epoch": 1709} {"train_loss": -6.101959228515625, "global_step": 71806, "epoch": 1709} {"train_loss": -6.047473907470703, "global_step": 71807, "epoch": 1709} {"train_loss": -6.174256324768066, "global_step": 71808, "epoch": 1709} {"train_loss": -5.969832420349121, "global_step": 71809, "epoch": 1709} {"train_loss": -6.2260260581970215, "global_step": 71810, "epoch": 1709} {"train_loss": -5.9720001220703125, "global_step": 71811, "epoch": 1709} {"train_loss": -6.00381326675415, "global_step": 71812, "epoch": 1709} {"train_loss": -6.108555316925049, "global_step": 71813, "epoch": 1709} {"train_loss": -6.1087236404418945, "global_step": 71814, "epoch": 1709} {"train_loss": -6.09531307220459, "global_step": 71815, "epoch": 1709} {"train_loss": -5.992981910705566, "global_step": 71816, "epoch": 1709} {"train_loss": -6.012739181518555, "global_step": 71817, "epoch": 1709} {"train_loss": -6.133688926696777, "global_step": 71818, "epoch": 1709} {"train_loss": -6.053006285712833, "global_step": 71819, "epoch": 1709, "val_loss": 61829.14453125} {"train_loss": -5.979303359985352, "global_step": 71820, "epoch": 1710} {"train_loss": -5.920982360839844, "global_step": 71821, "epoch": 1710} {"train_loss": -6.047436714172363, "global_step": 71822, "epoch": 1710} {"train_loss": -6.033987045288086, "global_step": 71823, "epoch": 1710} {"train_loss": -6.07220983505249, "global_step": 71824, "epoch": 1710} {"train_loss": -6.161412239074707, "global_step": 71825, "epoch": 1710} {"train_loss": -6.16243314743042, "global_step": 71826, "epoch": 1710} {"train_loss": -6.141574859619141, "global_step": 71827, "epoch": 1710} {"train_loss": -6.041057109832764, "global_step": 71828, "epoch": 1710} {"train_loss": -5.95413875579834, "global_step": 71829, "epoch": 1710} {"train_loss": -6.050956726074219, "global_step": 71830, "epoch": 1710} {"train_loss": -5.994599342346191, "global_step": 71831, "epoch": 1710} {"train_loss": -5.93678092956543, "global_step": 71832, "epoch": 1710} {"train_loss": -6.099087715148926, "global_step": 71833, "epoch": 1710} {"train_loss": -5.974391460418701, "global_step": 71834, "epoch": 1710} {"train_loss": -5.920363903045654, "global_step": 71835, "epoch": 1710} {"train_loss": -6.010812759399414, "global_step": 71836, "epoch": 1710} {"train_loss": -6.067196369171143, "global_step": 71837, "epoch": 1710} {"train_loss": -6.209056854248047, "global_step": 71838, "epoch": 1710} {"train_loss": -6.028582572937012, "global_step": 71839, "epoch": 1710} {"train_loss": -6.06500244140625, "global_step": 71840, "epoch": 1710} {"train_loss": -6.0393171310424805, "global_step": 71841, "epoch": 1710} {"train_loss": -6.165777206420898, "global_step": 71842, "epoch": 1710} {"train_loss": -6.012889862060547, "global_step": 71843, "epoch": 1710} {"train_loss": -6.112395286560059, "global_step": 71844, "epoch": 1710} {"train_loss": -5.934570789337158, "global_step": 71845, "epoch": 1710} {"train_loss": -6.043651580810547, "global_step": 71846, "epoch": 1710} {"train_loss": -6.15538215637207, "global_step": 71847, "epoch": 1710} {"train_loss": -6.007953643798828, "global_step": 71848, "epoch": 1710} {"train_loss": -6.163362503051758, "global_step": 71849, "epoch": 1710} {"train_loss": -6.043625831604004, "global_step": 71850, "epoch": 1710} {"train_loss": -6.138974189758301, "global_step": 71851, "epoch": 1710} {"train_loss": -6.242033004760742, "global_step": 71852, "epoch": 1710} {"train_loss": -6.043384552001953, "global_step": 71853, "epoch": 1710} {"train_loss": -5.939149856567383, "global_step": 71854, "epoch": 1710} {"train_loss": -6.071262359619141, "global_step": 71855, "epoch": 1710} {"train_loss": -6.057842254638672, "global_step": 71856, "epoch": 1710} {"train_loss": -6.035614013671875, "global_step": 71857, "epoch": 1710} {"train_loss": -6.106527328491211, "global_step": 71858, "epoch": 1710} {"train_loss": -6.131531238555908, "global_step": 71859, "epoch": 1710} {"train_loss": -6.098751068115234, "global_step": 71860, "epoch": 1710} {"train_loss": -6.05843094417027, "global_step": 71861, "epoch": 1710, "val_loss": 61645.66015625} {"train_loss": -6.039055824279785, "global_step": 71862, "epoch": 1711} {"train_loss": -6.087833404541016, "global_step": 71863, "epoch": 1711} {"train_loss": -6.078095436096191, "global_step": 71864, "epoch": 1711} {"train_loss": -6.134465217590332, "global_step": 71865, "epoch": 1711} {"train_loss": -6.15446662902832, "global_step": 71866, "epoch": 1711} {"train_loss": -6.049655914306641, "global_step": 71867, "epoch": 1711} {"train_loss": -6.150842666625977, "global_step": 71868, "epoch": 1711} {"train_loss": -6.090714454650879, "global_step": 71869, "epoch": 1711} {"train_loss": -6.143733978271484, "global_step": 71870, "epoch": 1711} {"train_loss": -6.045714378356934, "global_step": 71871, "epoch": 1711} {"train_loss": -6.001213550567627, "global_step": 71872, "epoch": 1711} {"train_loss": -6.0827131271362305, "global_step": 71873, "epoch": 1711} {"train_loss": -6.131504058837891, "global_step": 71874, "epoch": 1711} {"train_loss": -5.9958176612854, "global_step": 71875, "epoch": 1711} {"train_loss": -6.161295413970947, "global_step": 71876, "epoch": 1711} {"train_loss": -6.062931060791016, "global_step": 71877, "epoch": 1711} {"train_loss": -6.12617301940918, "global_step": 71878, "epoch": 1711} {"train_loss": -6.096647262573242, "global_step": 71879, "epoch": 1711} {"train_loss": -5.991649150848389, "global_step": 71880, "epoch": 1711} {"train_loss": -6.12656307220459, "global_step": 71881, "epoch": 1711} {"train_loss": -5.9852294921875, "global_step": 71882, "epoch": 1711} {"train_loss": -6.175034046173096, "global_step": 71883, "epoch": 1711} {"train_loss": -6.101117134094238, "global_step": 71884, "epoch": 1711} {"train_loss": -5.960690498352051, "global_step": 71885, "epoch": 1711} {"train_loss": -5.999234199523926, "global_step": 71886, "epoch": 1711} {"train_loss": -6.123420715332031, "global_step": 71887, "epoch": 1711} {"train_loss": -6.099102020263672, "global_step": 71888, "epoch": 1711} {"train_loss": -6.003596305847168, "global_step": 71889, "epoch": 1711} {"train_loss": -6.0351152420043945, "global_step": 71890, "epoch": 1711} {"train_loss": -5.940755844116211, "global_step": 71891, "epoch": 1711} {"train_loss": -6.086862564086914, "global_step": 71892, "epoch": 1711} {"train_loss": -5.958647727966309, "global_step": 71893, "epoch": 1711} {"train_loss": -5.890134811401367, "global_step": 71894, "epoch": 1711} {"train_loss": -6.086288928985596, "global_step": 71895, "epoch": 1711} {"train_loss": -6.065345764160156, "global_step": 71896, "epoch": 1711} {"train_loss": -6.024255275726318, "global_step": 71897, "epoch": 1711} {"train_loss": -6.147924423217773, "global_step": 71898, "epoch": 1711} {"train_loss": -5.9634809494018555, "global_step": 71899, "epoch": 1711} {"train_loss": -6.060507774353027, "global_step": 71900, "epoch": 1711} {"train_loss": -6.039186477661133, "global_step": 71901, "epoch": 1711} {"train_loss": -6.018622398376465, "global_step": 71902, "epoch": 1711} {"train_loss": -6.058736199424381, "global_step": 71903, "epoch": 1711, "val_loss": 61854.36328125} {"train_loss": -6.097132682800293, "global_step": 71904, "epoch": 1712} {"train_loss": -6.127033233642578, "global_step": 71905, "epoch": 1712} {"train_loss": -6.101802825927734, "global_step": 71906, "epoch": 1712} {"train_loss": -6.105496406555176, "global_step": 71907, "epoch": 1712} {"train_loss": -6.105679512023926, "global_step": 71908, "epoch": 1712} {"train_loss": -6.083464622497559, "global_step": 71909, "epoch": 1712} {"train_loss": -6.109804153442383, "global_step": 71910, "epoch": 1712} {"train_loss": -6.015974998474121, "global_step": 71911, "epoch": 1712} {"train_loss": -5.978158473968506, "global_step": 71912, "epoch": 1712} {"train_loss": -6.110528469085693, "global_step": 71913, "epoch": 1712} {"train_loss": -6.124146461486816, "global_step": 71914, "epoch": 1712} {"train_loss": -6.093012809753418, "global_step": 71915, "epoch": 1712} {"train_loss": -6.16374397277832, "global_step": 71916, "epoch": 1712} {"train_loss": -6.151330947875977, "global_step": 71917, "epoch": 1712} {"train_loss": -6.092533111572266, "global_step": 71918, "epoch": 1712} {"train_loss": -6.054503440856934, "global_step": 71919, "epoch": 1712} {"train_loss": -6.020784854888916, "global_step": 71920, "epoch": 1712} {"train_loss": -6.124622344970703, "global_step": 71921, "epoch": 1712} {"train_loss": -6.1276960372924805, "global_step": 71922, "epoch": 1712} {"train_loss": -6.005739688873291, "global_step": 71923, "epoch": 1712} {"train_loss": -6.107534885406494, "global_step": 71924, "epoch": 1712} {"train_loss": -6.0468292236328125, "global_step": 71925, "epoch": 1712} {"train_loss": -6.138832092285156, "global_step": 71926, "epoch": 1712} {"train_loss": -6.022464752197266, "global_step": 71927, "epoch": 1712} {"train_loss": -5.99244499206543, "global_step": 71928, "epoch": 1712} {"train_loss": -6.065310001373291, "global_step": 71929, "epoch": 1712} {"train_loss": -5.9792890548706055, "global_step": 71930, "epoch": 1712} {"train_loss": -6.076663970947266, "global_step": 71931, "epoch": 1712} {"train_loss": -6.0709357261657715, "global_step": 71932, "epoch": 1712} {"train_loss": -6.09989070892334, "global_step": 71933, "epoch": 1712} {"train_loss": -6.128923416137695, "global_step": 71934, "epoch": 1712} {"train_loss": -6.078022003173828, "global_step": 71935, "epoch": 1712} {"train_loss": -5.996748924255371, "global_step": 71936, "epoch": 1712} {"train_loss": -6.0272536277771, "global_step": 71937, "epoch": 1712} {"train_loss": -6.0010199546813965, "global_step": 71938, "epoch": 1712} {"train_loss": -6.203908920288086, "global_step": 71939, "epoch": 1712} {"train_loss": -5.933218479156494, "global_step": 71940, "epoch": 1712} {"train_loss": -6.01124382019043, "global_step": 71941, "epoch": 1712} {"train_loss": -6.105379581451416, "global_step": 71942, "epoch": 1712} {"train_loss": -6.040251731872559, "global_step": 71943, "epoch": 1712} {"train_loss": -6.095257759094238, "global_step": 71944, "epoch": 1712} {"train_loss": -6.0725736277444025, "global_step": 71945, "epoch": 1712, "val_loss": 61895.05078125} {"train_loss": -6.04290771484375, "global_step": 71946, "epoch": 1713} {"train_loss": -6.000864028930664, "global_step": 71947, "epoch": 1713} {"train_loss": -6.175131797790527, "global_step": 71948, "epoch": 1713} {"train_loss": -6.042075157165527, "global_step": 71949, "epoch": 1713} {"train_loss": -5.993519306182861, "global_step": 71950, "epoch": 1713} {"train_loss": -6.132513046264648, "global_step": 71951, "epoch": 1713} {"train_loss": -6.086297512054443, "global_step": 71952, "epoch": 1713} {"train_loss": -6.09538459777832, "global_step": 71953, "epoch": 1713} {"train_loss": -6.137207508087158, "global_step": 71954, "epoch": 1713} {"train_loss": -6.161722660064697, "global_step": 71955, "epoch": 1713} {"train_loss": -6.018021583557129, "global_step": 71956, "epoch": 1713} {"train_loss": -6.1138129234313965, "global_step": 71957, "epoch": 1713} {"train_loss": -5.9778571128845215, "global_step": 71958, "epoch": 1713} {"train_loss": -6.126483917236328, "global_step": 71959, "epoch": 1713} {"train_loss": -6.043046474456787, "global_step": 71960, "epoch": 1713} {"train_loss": -6.028794765472412, "global_step": 71961, "epoch": 1713} {"train_loss": -5.977603912353516, "global_step": 71962, "epoch": 1713} {"train_loss": -6.036395072937012, "global_step": 71963, "epoch": 1713} {"train_loss": -5.987822532653809, "global_step": 71964, "epoch": 1713} {"train_loss": -6.063450813293457, "global_step": 71965, "epoch": 1713} {"train_loss": -5.94835901260376, "global_step": 71966, "epoch": 1713} {"train_loss": -5.993111610412598, "global_step": 71967, "epoch": 1713} {"train_loss": -6.1126837730407715, "global_step": 71968, "epoch": 1713} {"train_loss": -5.941473007202148, "global_step": 71969, "epoch": 1713} {"train_loss": -6.1437225341796875, "global_step": 71970, "epoch": 1713} {"train_loss": -6.121377468109131, "global_step": 71971, "epoch": 1713} {"train_loss": -6.055105209350586, "global_step": 71972, "epoch": 1713} {"train_loss": -6.1517109870910645, "global_step": 71973, "epoch": 1713} {"train_loss": -6.102016925811768, "global_step": 71974, "epoch": 1713} {"train_loss": -6.128008842468262, "global_step": 71975, "epoch": 1713} {"train_loss": -6.1712541580200195, "global_step": 71976, "epoch": 1713} {"train_loss": -6.174780368804932, "global_step": 71977, "epoch": 1713} {"train_loss": -5.955776214599609, "global_step": 71978, "epoch": 1713} {"train_loss": -6.052857398986816, "global_step": 71979, "epoch": 1713} {"train_loss": -6.1512298583984375, "global_step": 71980, "epoch": 1713} {"train_loss": -6.050656318664551, "global_step": 71981, "epoch": 1713} {"train_loss": -6.099503517150879, "global_step": 71982, "epoch": 1713} {"train_loss": -6.035828590393066, "global_step": 71983, "epoch": 1713} {"train_loss": -5.9508442878723145, "global_step": 71984, "epoch": 1713} {"train_loss": -5.996177673339844, "global_step": 71985, "epoch": 1713} {"train_loss": -6.001715183258057, "global_step": 71986, "epoch": 1713} {"train_loss": -6.061524050576346, "global_step": 71987, "epoch": 1713, "val_loss": 61899.02734375} {"train_loss": -6.079521179199219, "global_step": 71988, "epoch": 1714} {"train_loss": -5.976467609405518, "global_step": 71989, "epoch": 1714} {"train_loss": -6.0519914627075195, "global_step": 71990, "epoch": 1714} {"train_loss": -5.945618629455566, "global_step": 71991, "epoch": 1714} {"train_loss": -6.009686470031738, "global_step": 71992, "epoch": 1714} {"train_loss": -5.9647932052612305, "global_step": 71993, "epoch": 1714} {"train_loss": -6.105416297912598, "global_step": 71994, "epoch": 1714} {"train_loss": -6.03898811340332, "global_step": 71995, "epoch": 1714} {"train_loss": -5.954879283905029, "global_step": 71996, "epoch": 1714} {"train_loss": -6.078378200531006, "global_step": 71997, "epoch": 1714} {"train_loss": -6.128756046295166, "global_step": 71998, "epoch": 1714} {"train_loss": -5.9327874183654785, "global_step": 71999, "epoch": 1714} {"train_loss": -6.088176250457764, "global_step": 72000, "epoch": 1714} {"train_loss": -6.049751281738281, "global_step": 72001, "epoch": 1714} {"train_loss": -6.010964393615723, "global_step": 72002, "epoch": 1714} {"train_loss": -6.053375244140625, "global_step": 72003, "epoch": 1714} {"train_loss": -5.985225677490234, "global_step": 72004, "epoch": 1714} {"train_loss": -5.9913129806518555, "global_step": 72005, "epoch": 1714} {"train_loss": -5.9912919998168945, "global_step": 72006, "epoch": 1714} {"train_loss": -6.1209588050842285, "global_step": 72007, "epoch": 1714} {"train_loss": -6.073355674743652, "global_step": 72008, "epoch": 1714} {"train_loss": -6.149997711181641, "global_step": 72009, "epoch": 1714} {"train_loss": -6.103641033172607, "global_step": 72010, "epoch": 1714} {"train_loss": -6.139261245727539, "global_step": 72011, "epoch": 1714} {"train_loss": -6.093410968780518, "global_step": 72012, "epoch": 1714} {"train_loss": -6.029771327972412, "global_step": 72013, "epoch": 1714} {"train_loss": -6.042479991912842, "global_step": 72014, "epoch": 1714} {"train_loss": -6.117425441741943, "global_step": 72015, "epoch": 1714} {"train_loss": -5.962589740753174, "global_step": 72016, "epoch": 1714} {"train_loss": -6.058043479919434, "global_step": 72017, "epoch": 1714} {"train_loss": -6.199434280395508, "global_step": 72018, "epoch": 1714} {"train_loss": -6.032751083374023, "global_step": 72019, "epoch": 1714} {"train_loss": -5.990070343017578, "global_step": 72020, "epoch": 1714} {"train_loss": -6.101784706115723, "global_step": 72021, "epoch": 1714} {"train_loss": -6.097596168518066, "global_step": 72022, "epoch": 1714} {"train_loss": -6.067333698272705, "global_step": 72023, "epoch": 1714} {"train_loss": -5.935569763183594, "global_step": 72024, "epoch": 1714} {"train_loss": -5.9984002113342285, "global_step": 72025, "epoch": 1714} {"train_loss": -6.007292747497559, "global_step": 72026, "epoch": 1714} {"train_loss": -5.989656448364258, "global_step": 72027, "epoch": 1714} {"train_loss": -6.128736972808838, "global_step": 72028, "epoch": 1714} {"train_loss": -6.043103728975568, "global_step": 72029, "epoch": 1714, "val_loss": 61800.80078125} {"train_loss": -6.091109752655029, "global_step": 72030, "epoch": 1715} {"train_loss": -6.056064128875732, "global_step": 72031, "epoch": 1715} {"train_loss": -6.094059944152832, "global_step": 72032, "epoch": 1715} {"train_loss": -6.092108249664307, "global_step": 72033, "epoch": 1715} {"train_loss": -6.149889945983887, "global_step": 72034, "epoch": 1715} {"train_loss": -6.0342559814453125, "global_step": 72035, "epoch": 1715} {"train_loss": -5.978005886077881, "global_step": 72036, "epoch": 1715} {"train_loss": -6.065673828125, "global_step": 72037, "epoch": 1715} {"train_loss": -6.078472137451172, "global_step": 72038, "epoch": 1715} {"train_loss": -6.0452561378479, "global_step": 72039, "epoch": 1715} {"train_loss": -5.954514503479004, "global_step": 72040, "epoch": 1715} {"train_loss": -6.063353061676025, "global_step": 72041, "epoch": 1715} {"train_loss": -5.999476432800293, "global_step": 72042, "epoch": 1715} {"train_loss": -5.9981865882873535, "global_step": 72043, "epoch": 1715} {"train_loss": -6.16302490234375, "global_step": 72044, "epoch": 1715} {"train_loss": -6.1577606201171875, "global_step": 72045, "epoch": 1715} {"train_loss": -6.079830169677734, "global_step": 72046, "epoch": 1715} {"train_loss": -5.993070125579834, "global_step": 72047, "epoch": 1715} {"train_loss": -6.022578239440918, "global_step": 72048, "epoch": 1715} {"train_loss": -6.001133918762207, "global_step": 72049, "epoch": 1715} {"train_loss": -6.091126918792725, "global_step": 72050, "epoch": 1715} {"train_loss": -5.996779441833496, "global_step": 72051, "epoch": 1715} {"train_loss": -6.096731662750244, "global_step": 72052, "epoch": 1715} {"train_loss": -6.203050136566162, "global_step": 72053, "epoch": 1715} {"train_loss": -6.113924503326416, "global_step": 72054, "epoch": 1715} {"train_loss": -5.992495536804199, "global_step": 72055, "epoch": 1715} {"train_loss": -6.121703147888184, "global_step": 72056, "epoch": 1715} {"train_loss": -6.04012393951416, "global_step": 72057, "epoch": 1715} {"train_loss": -5.970738410949707, "global_step": 72058, "epoch": 1715} {"train_loss": -5.929738998413086, "global_step": 72059, "epoch": 1715} {"train_loss": -6.103841781616211, "global_step": 72060, "epoch": 1715} {"train_loss": -6.092123031616211, "global_step": 72061, "epoch": 1715} {"train_loss": -6.037074089050293, "global_step": 72062, "epoch": 1715} {"train_loss": -6.040576934814453, "global_step": 72063, "epoch": 1715} {"train_loss": -5.907984733581543, "global_step": 72064, "epoch": 1715} {"train_loss": -6.028615951538086, "global_step": 72065, "epoch": 1715} {"train_loss": -5.917792320251465, "global_step": 72066, "epoch": 1715} {"train_loss": -6.082749843597412, "global_step": 72067, "epoch": 1715} {"train_loss": -6.050189971923828, "global_step": 72068, "epoch": 1715} {"train_loss": -5.9678192138671875, "global_step": 72069, "epoch": 1715} {"train_loss": -6.130380630493164, "global_step": 72070, "epoch": 1715} {"train_loss": -6.046780779248192, "global_step": 72071, "epoch": 1715, "val_loss": 61852.36328125} {"train_loss": -5.914727687835693, "global_step": 72072, "epoch": 1716} {"train_loss": -6.006439685821533, "global_step": 72073, "epoch": 1716} {"train_loss": -6.017161846160889, "global_step": 72074, "epoch": 1716} {"train_loss": -5.9835205078125, "global_step": 72075, "epoch": 1716} {"train_loss": -5.985812187194824, "global_step": 72076, "epoch": 1716} {"train_loss": -6.013596534729004, "global_step": 72077, "epoch": 1716} {"train_loss": -6.0097503662109375, "global_step": 72078, "epoch": 1716} {"train_loss": -6.062103271484375, "global_step": 72079, "epoch": 1716} {"train_loss": -5.910937309265137, "global_step": 72080, "epoch": 1716} {"train_loss": -6.039243698120117, "global_step": 72081, "epoch": 1716} {"train_loss": -6.066091060638428, "global_step": 72082, "epoch": 1716} {"train_loss": -5.912117958068848, "global_step": 72083, "epoch": 1716} {"train_loss": -5.938977241516113, "global_step": 72084, "epoch": 1716} {"train_loss": -6.048251152038574, "global_step": 72085, "epoch": 1716} {"train_loss": -6.167824745178223, "global_step": 72086, "epoch": 1716} {"train_loss": -6.0151214599609375, "global_step": 72087, "epoch": 1716} {"train_loss": -5.945795059204102, "global_step": 72088, "epoch": 1716} {"train_loss": -5.990958213806152, "global_step": 72089, "epoch": 1716} {"train_loss": -5.963464260101318, "global_step": 72090, "epoch": 1716} {"train_loss": -6.109370708465576, "global_step": 72091, "epoch": 1716} {"train_loss": -5.960165500640869, "global_step": 72092, "epoch": 1716} {"train_loss": -5.956966400146484, "global_step": 72093, "epoch": 1716} {"train_loss": -6.039703369140625, "global_step": 72094, "epoch": 1716} {"train_loss": -6.092901706695557, "global_step": 72095, "epoch": 1716} {"train_loss": -5.950668811798096, "global_step": 72096, "epoch": 1716} {"train_loss": -6.04940128326416, "global_step": 72097, "epoch": 1716} {"train_loss": -6.066359519958496, "global_step": 72098, "epoch": 1716} {"train_loss": -5.980037212371826, "global_step": 72099, "epoch": 1716} {"train_loss": -6.022825241088867, "global_step": 72100, "epoch": 1716} {"train_loss": -6.0835185050964355, "global_step": 72101, "epoch": 1716} {"train_loss": -6.013921737670898, "global_step": 72102, "epoch": 1716} {"train_loss": -6.137402534484863, "global_step": 72103, "epoch": 1716} {"train_loss": -5.9444098472595215, "global_step": 72104, "epoch": 1716} {"train_loss": -6.028091907501221, "global_step": 72105, "epoch": 1716} {"train_loss": -6.011085033416748, "global_step": 72106, "epoch": 1716} {"train_loss": -5.9177350997924805, "global_step": 72107, "epoch": 1716} {"train_loss": -6.0407514572143555, "global_step": 72108, "epoch": 1716} {"train_loss": -5.932374954223633, "global_step": 72109, "epoch": 1716} {"train_loss": -5.981279373168945, "global_step": 72110, "epoch": 1716} {"train_loss": -5.9614033699035645, "global_step": 72111, "epoch": 1716} {"train_loss": -6.002191066741943, "global_step": 72112, "epoch": 1716} {"train_loss": -6.005120845068069, "global_step": 72113, "epoch": 1716, "val_loss": 62067.9609375} {"train_loss": -6.009164810180664, "global_step": 72114, "epoch": 1717} {"train_loss": -5.890678405761719, "global_step": 72115, "epoch": 1717} {"train_loss": -6.019806861877441, "global_step": 72116, "epoch": 1717} {"train_loss": -5.951545238494873, "global_step": 72117, "epoch": 1717} {"train_loss": -5.991931915283203, "global_step": 72118, "epoch": 1717} {"train_loss": -6.066595077514648, "global_step": 72119, "epoch": 1717} {"train_loss": -6.095284461975098, "global_step": 72120, "epoch": 1717} {"train_loss": -6.053123474121094, "global_step": 72121, "epoch": 1717} {"train_loss": -6.006401062011719, "global_step": 72122, "epoch": 1717} {"train_loss": -6.055856227874756, "global_step": 72123, "epoch": 1717} {"train_loss": -6.002397537231445, "global_step": 72124, "epoch": 1717} {"train_loss": -6.091990947723389, "global_step": 72125, "epoch": 1717} {"train_loss": -5.948404312133789, "global_step": 72126, "epoch": 1717} {"train_loss": -6.024068832397461, "global_step": 72127, "epoch": 1717} {"train_loss": -6.009529113769531, "global_step": 72128, "epoch": 1717} {"train_loss": -6.119019508361816, "global_step": 72129, "epoch": 1717} {"train_loss": -6.034046649932861, "global_step": 72130, "epoch": 1717} {"train_loss": -6.082242965698242, "global_step": 72131, "epoch": 1717} {"train_loss": -6.197096824645996, "global_step": 72132, "epoch": 1717} {"train_loss": -6.136241912841797, "global_step": 72133, "epoch": 1717} {"train_loss": -6.0056328773498535, "global_step": 72134, "epoch": 1717} {"train_loss": -6.10759973526001, "global_step": 72135, "epoch": 1717} {"train_loss": -6.023144245147705, "global_step": 72136, "epoch": 1717} {"train_loss": -6.233122825622559, "global_step": 72137, "epoch": 1717} {"train_loss": -6.074738502502441, "global_step": 72138, "epoch": 1717} {"train_loss": -5.929860591888428, "global_step": 72139, "epoch": 1717} {"train_loss": -6.107270240783691, "global_step": 72140, "epoch": 1717} {"train_loss": -5.9436726570129395, "global_step": 72141, "epoch": 1717} {"train_loss": -5.943639278411865, "global_step": 72142, "epoch": 1717} {"train_loss": -5.9625139236450195, "global_step": 72143, "epoch": 1717} {"train_loss": -5.9705963134765625, "global_step": 72144, "epoch": 1717} {"train_loss": -6.111418724060059, "global_step": 72145, "epoch": 1717} {"train_loss": -5.962034225463867, "global_step": 72146, "epoch": 1717} {"train_loss": -6.073738098144531, "global_step": 72147, "epoch": 1717} {"train_loss": -5.967962265014648, "global_step": 72148, "epoch": 1717} {"train_loss": -6.027207374572754, "global_step": 72149, "epoch": 1717} {"train_loss": -5.957812786102295, "global_step": 72150, "epoch": 1717} {"train_loss": -6.0811920166015625, "global_step": 72151, "epoch": 1717} {"train_loss": -6.050742149353027, "global_step": 72152, "epoch": 1717} {"train_loss": -6.046456336975098, "global_step": 72153, "epoch": 1717} {"train_loss": -6.086630821228027, "global_step": 72154, "epoch": 1717} {"train_loss": -6.038147097542172, "global_step": 72155, "epoch": 1717, "val_loss": 61754.83203125} {"train_loss": -6.02548885345459, "global_step": 72156, "epoch": 1718} {"train_loss": -6.150435447692871, "global_step": 72157, "epoch": 1718} {"train_loss": -6.036304950714111, "global_step": 72158, "epoch": 1718} {"train_loss": -6.112083435058594, "global_step": 72159, "epoch": 1718} {"train_loss": -6.008858680725098, "global_step": 72160, "epoch": 1718} {"train_loss": -6.086243152618408, "global_step": 72161, "epoch": 1718} {"train_loss": -5.976136207580566, "global_step": 72162, "epoch": 1718} {"train_loss": -6.00386381149292, "global_step": 72163, "epoch": 1718} {"train_loss": -6.061842918395996, "global_step": 72164, "epoch": 1718} {"train_loss": -6.064873218536377, "global_step": 72165, "epoch": 1718} {"train_loss": -5.962658882141113, "global_step": 72166, "epoch": 1718} {"train_loss": -6.038448333740234, "global_step": 72167, "epoch": 1718} {"train_loss": -6.121397018432617, "global_step": 72168, "epoch": 1718} {"train_loss": -6.0959672927856445, "global_step": 72169, "epoch": 1718} {"train_loss": -6.069665908813477, "global_step": 72170, "epoch": 1718} {"train_loss": -6.100223541259766, "global_step": 72171, "epoch": 1718} {"train_loss": -6.168394088745117, "global_step": 72172, "epoch": 1718} {"train_loss": -6.09669303894043, "global_step": 72173, "epoch": 1718} {"train_loss": -6.085583209991455, "global_step": 72174, "epoch": 1718} {"train_loss": -6.165989875793457, "global_step": 72175, "epoch": 1718} {"train_loss": -5.961044788360596, "global_step": 72176, "epoch": 1718} {"train_loss": -6.091433525085449, "global_step": 72177, "epoch": 1718} {"train_loss": -6.145580291748047, "global_step": 72178, "epoch": 1718} {"train_loss": -6.077971458435059, "global_step": 72179, "epoch": 1718} {"train_loss": -6.076946258544922, "global_step": 72180, "epoch": 1718} {"train_loss": -5.960744857788086, "global_step": 72181, "epoch": 1718} {"train_loss": -6.003561973571777, "global_step": 72182, "epoch": 1718} {"train_loss": -6.124943256378174, "global_step": 72183, "epoch": 1718} {"train_loss": -6.044469833374023, "global_step": 72184, "epoch": 1718} {"train_loss": -6.0971574783325195, "global_step": 72185, "epoch": 1718} {"train_loss": -6.103508472442627, "global_step": 72186, "epoch": 1718} {"train_loss": -5.9684882164001465, "global_step": 72187, "epoch": 1718} {"train_loss": -6.096986770629883, "global_step": 72188, "epoch": 1718} {"train_loss": -6.053284645080566, "global_step": 72189, "epoch": 1718} {"train_loss": -6.10694694519043, "global_step": 72190, "epoch": 1718} {"train_loss": -5.953085899353027, "global_step": 72191, "epoch": 1718} {"train_loss": -6.142973899841309, "global_step": 72192, "epoch": 1718} {"train_loss": -5.9495463371276855, "global_step": 72193, "epoch": 1718} {"train_loss": -5.999790668487549, "global_step": 72194, "epoch": 1718} {"train_loss": -6.099696159362793, "global_step": 72195, "epoch": 1718} {"train_loss": -5.978485107421875, "global_step": 72196, "epoch": 1718} {"train_loss": -6.060476575578962, "global_step": 72197, "epoch": 1718, "val_loss": 61728.02734375} {"train_loss": -6.139947891235352, "global_step": 72198, "epoch": 1719} {"train_loss": -5.923052787780762, "global_step": 72199, "epoch": 1719} {"train_loss": -6.197151184082031, "global_step": 72200, "epoch": 1719} {"train_loss": -6.1081085205078125, "global_step": 72201, "epoch": 1719} {"train_loss": -6.001943588256836, "global_step": 72202, "epoch": 1719} {"train_loss": -6.023393154144287, "global_step": 72203, "epoch": 1719} {"train_loss": -6.044182777404785, "global_step": 72204, "epoch": 1719} {"train_loss": -6.083544731140137, "global_step": 72205, "epoch": 1719} {"train_loss": -6.071465015411377, "global_step": 72206, "epoch": 1719} {"train_loss": -5.944843769073486, "global_step": 72207, "epoch": 1719} {"train_loss": -5.994919776916504, "global_step": 72208, "epoch": 1719} {"train_loss": -5.987775802612305, "global_step": 72209, "epoch": 1719} {"train_loss": -6.085591793060303, "global_step": 72210, "epoch": 1719} {"train_loss": -5.9616780281066895, "global_step": 72211, "epoch": 1719} {"train_loss": -6.130929470062256, "global_step": 72212, "epoch": 1719} {"train_loss": -6.029629707336426, "global_step": 72213, "epoch": 1719} {"train_loss": -6.04147481918335, "global_step": 72214, "epoch": 1719} {"train_loss": -5.931559085845947, "global_step": 72215, "epoch": 1719} {"train_loss": -5.983519554138184, "global_step": 72216, "epoch": 1719} {"train_loss": -5.962445259094238, "global_step": 72217, "epoch": 1719} {"train_loss": -6.032399654388428, "global_step": 72218, "epoch": 1719} {"train_loss": -5.989786148071289, "global_step": 72219, "epoch": 1719} {"train_loss": -5.977715492248535, "global_step": 72220, "epoch": 1719} {"train_loss": -6.105433464050293, "global_step": 72221, "epoch": 1719} {"train_loss": -6.012495994567871, "global_step": 72222, "epoch": 1719} {"train_loss": -6.019086837768555, "global_step": 72223, "epoch": 1719} {"train_loss": -5.9589948654174805, "global_step": 72224, "epoch": 1719} {"train_loss": -5.872034549713135, "global_step": 72225, "epoch": 1719} {"train_loss": -6.100714683532715, "global_step": 72226, "epoch": 1719} {"train_loss": -6.040097236633301, "global_step": 72227, "epoch": 1719} {"train_loss": -5.950229644775391, "global_step": 72228, "epoch": 1719} {"train_loss": -6.053173542022705, "global_step": 72229, "epoch": 1719} {"train_loss": -6.096771240234375, "global_step": 72230, "epoch": 1719} {"train_loss": -5.963834762573242, "global_step": 72231, "epoch": 1719} {"train_loss": -5.968817234039307, "global_step": 72232, "epoch": 1719} {"train_loss": -6.035372734069824, "global_step": 72233, "epoch": 1719} {"train_loss": -6.107522010803223, "global_step": 72234, "epoch": 1719} {"train_loss": -5.997884750366211, "global_step": 72235, "epoch": 1719} {"train_loss": -6.046755790710449, "global_step": 72236, "epoch": 1719} {"train_loss": -6.103279113769531, "global_step": 72237, "epoch": 1719} {"train_loss": -6.067773818969727, "global_step": 72238, "epoch": 1719} {"train_loss": -6.026358683904012, "global_step": 72239, "epoch": 1719, "val_loss": 61647.16796875} {"train_loss": -6.162368297576904, "global_step": 72240, "epoch": 1720} {"train_loss": -5.982388496398926, "global_step": 72241, "epoch": 1720} {"train_loss": -6.066197395324707, "global_step": 72242, "epoch": 1720} {"train_loss": -6.1312127113342285, "global_step": 72243, "epoch": 1720} {"train_loss": -6.062714576721191, "global_step": 72244, "epoch": 1720} {"train_loss": -6.002087593078613, "global_step": 72245, "epoch": 1720} {"train_loss": -6.040923595428467, "global_step": 72246, "epoch": 1720} {"train_loss": -6.069241046905518, "global_step": 72247, "epoch": 1720} {"train_loss": -5.971895217895508, "global_step": 72248, "epoch": 1720} {"train_loss": -6.0442914962768555, "global_step": 72249, "epoch": 1720} {"train_loss": -5.986355781555176, "global_step": 72250, "epoch": 1720} {"train_loss": -6.004311561584473, "global_step": 72251, "epoch": 1720} {"train_loss": -6.03972864151001, "global_step": 72252, "epoch": 1720} {"train_loss": -6.009811878204346, "global_step": 72253, "epoch": 1720} {"train_loss": -5.954596519470215, "global_step": 72254, "epoch": 1720} {"train_loss": -6.132185935974121, "global_step": 72255, "epoch": 1720} {"train_loss": -6.020543575286865, "global_step": 72256, "epoch": 1720} {"train_loss": -6.103338718414307, "global_step": 72257, "epoch": 1720} {"train_loss": -5.990957736968994, "global_step": 72258, "epoch": 1720} {"train_loss": -6.094304084777832, "global_step": 72259, "epoch": 1720} {"train_loss": -6.0589799880981445, "global_step": 72260, "epoch": 1720} {"train_loss": -6.060515403747559, "global_step": 72261, "epoch": 1720} {"train_loss": -6.07863712310791, "global_step": 72262, "epoch": 1720} {"train_loss": -6.0025129318237305, "global_step": 72263, "epoch": 1720} {"train_loss": -6.035212516784668, "global_step": 72264, "epoch": 1720} {"train_loss": -6.177675247192383, "global_step": 72265, "epoch": 1720} {"train_loss": -5.933080196380615, "global_step": 72266, "epoch": 1720} {"train_loss": -6.138226509094238, "global_step": 72267, "epoch": 1720} {"train_loss": -6.104933738708496, "global_step": 72268, "epoch": 1720} {"train_loss": -6.110821723937988, "global_step": 72269, "epoch": 1720} {"train_loss": -5.978839874267578, "global_step": 72270, "epoch": 1720} {"train_loss": -6.02938985824585, "global_step": 72271, "epoch": 1720} {"train_loss": -6.116909980773926, "global_step": 72272, "epoch": 1720} {"train_loss": -6.099551200866699, "global_step": 72273, "epoch": 1720} {"train_loss": -6.037014961242676, "global_step": 72274, "epoch": 1720} {"train_loss": -6.132345199584961, "global_step": 72275, "epoch": 1720} {"train_loss": -6.021052360534668, "global_step": 72276, "epoch": 1720} {"train_loss": -6.049394607543945, "global_step": 72277, "epoch": 1720} {"train_loss": -6.00731086730957, "global_step": 72278, "epoch": 1720} {"train_loss": -6.097403049468994, "global_step": 72279, "epoch": 1720} {"train_loss": -6.093010902404785, "global_step": 72280, "epoch": 1720} {"train_loss": -6.052065985543387, "global_step": 72281, "epoch": 1720, "val_loss": 61847.49609375} {"train_loss": -6.054219722747803, "global_step": 72282, "epoch": 1721} {"train_loss": -6.07124137878418, "global_step": 72283, "epoch": 1721} {"train_loss": -5.9951629638671875, "global_step": 72284, "epoch": 1721} {"train_loss": -6.110577583312988, "global_step": 72285, "epoch": 1721} {"train_loss": -6.045926094055176, "global_step": 72286, "epoch": 1721} {"train_loss": -6.053654670715332, "global_step": 72287, "epoch": 1721} {"train_loss": -6.0112504959106445, "global_step": 72288, "epoch": 1721} {"train_loss": -6.078812122344971, "global_step": 72289, "epoch": 1721} {"train_loss": -6.063043117523193, "global_step": 72290, "epoch": 1721} {"train_loss": -6.086865425109863, "global_step": 72291, "epoch": 1721} {"train_loss": -5.991183280944824, "global_step": 72292, "epoch": 1721} {"train_loss": -6.122763633728027, "global_step": 72293, "epoch": 1721} {"train_loss": -6.144024848937988, "global_step": 72294, "epoch": 1721} {"train_loss": -6.0655999183654785, "global_step": 72295, "epoch": 1721} {"train_loss": -6.119564056396484, "global_step": 72296, "epoch": 1721} {"train_loss": -6.178591728210449, "global_step": 72297, "epoch": 1721} {"train_loss": -6.162097454071045, "global_step": 72298, "epoch": 1721} {"train_loss": -5.9895782470703125, "global_step": 72299, "epoch": 1721} {"train_loss": -6.061417579650879, "global_step": 72300, "epoch": 1721} {"train_loss": -6.089462757110596, "global_step": 72301, "epoch": 1721} {"train_loss": -5.9231696128845215, "global_step": 72302, "epoch": 1721} {"train_loss": -6.066855430603027, "global_step": 72303, "epoch": 1721} {"train_loss": -6.111102104187012, "global_step": 72304, "epoch": 1721} {"train_loss": -6.010207653045654, "global_step": 72305, "epoch": 1721} {"train_loss": -6.121746063232422, "global_step": 72306, "epoch": 1721} {"train_loss": -6.004319190979004, "global_step": 72307, "epoch": 1721} {"train_loss": -6.124942779541016, "global_step": 72308, "epoch": 1721} {"train_loss": -6.028553009033203, "global_step": 72309, "epoch": 1721} {"train_loss": -5.888565540313721, "global_step": 72310, "epoch": 1721} {"train_loss": -6.018451690673828, "global_step": 72311, "epoch": 1721} {"train_loss": -6.1152849197387695, "global_step": 72312, "epoch": 1721} {"train_loss": -6.104219436645508, "global_step": 72313, "epoch": 1721} {"train_loss": -6.042917728424072, "global_step": 72314, "epoch": 1721} {"train_loss": -6.062205791473389, "global_step": 72315, "epoch": 1721} {"train_loss": -6.02783203125, "global_step": 72316, "epoch": 1721} {"train_loss": -5.985507488250732, "global_step": 72317, "epoch": 1721} {"train_loss": -5.982553482055664, "global_step": 72318, "epoch": 1721} {"train_loss": -6.015862464904785, "global_step": 72319, "epoch": 1721} {"train_loss": -5.977766513824463, "global_step": 72320, "epoch": 1721} {"train_loss": -5.96275520324707, "global_step": 72321, "epoch": 1721} {"train_loss": -5.987250328063965, "global_step": 72322, "epoch": 1721} {"train_loss": -6.050680433000837, "global_step": 72323, "epoch": 1721, "val_loss": 61784.73046875} {"train_loss": -6.0428786277771, "global_step": 72324, "epoch": 1722} {"train_loss": -6.020667552947998, "global_step": 72325, "epoch": 1722} {"train_loss": -6.001804351806641, "global_step": 72326, "epoch": 1722} {"train_loss": -6.166707992553711, "global_step": 72327, "epoch": 1722} {"train_loss": -6.073259353637695, "global_step": 72328, "epoch": 1722} {"train_loss": -6.038271903991699, "global_step": 72329, "epoch": 1722} {"train_loss": -5.995035171508789, "global_step": 72330, "epoch": 1722} {"train_loss": -6.0142621994018555, "global_step": 72331, "epoch": 1722} {"train_loss": -6.086302757263184, "global_step": 72332, "epoch": 1722} {"train_loss": -6.169572830200195, "global_step": 72333, "epoch": 1722} {"train_loss": -6.01039457321167, "global_step": 72334, "epoch": 1722} {"train_loss": -6.1530351638793945, "global_step": 72335, "epoch": 1722} {"train_loss": -6.185401916503906, "global_step": 72336, "epoch": 1722} {"train_loss": -6.066832542419434, "global_step": 72337, "epoch": 1722} {"train_loss": -6.180640697479248, "global_step": 72338, "epoch": 1722} {"train_loss": -6.067965030670166, "global_step": 72339, "epoch": 1722} {"train_loss": -6.117697715759277, "global_step": 72340, "epoch": 1722} {"train_loss": -6.069084167480469, "global_step": 72341, "epoch": 1722} {"train_loss": -6.068329811096191, "global_step": 72342, "epoch": 1722} {"train_loss": -6.144636154174805, "global_step": 72343, "epoch": 1722} {"train_loss": -6.098789215087891, "global_step": 72344, "epoch": 1722} {"train_loss": -6.093411445617676, "global_step": 72345, "epoch": 1722} {"train_loss": -6.224632263183594, "global_step": 72346, "epoch": 1722} {"train_loss": -6.172436714172363, "global_step": 72347, "epoch": 1722} {"train_loss": -6.177187919616699, "global_step": 72348, "epoch": 1722} {"train_loss": -6.255212783813477, "global_step": 72349, "epoch": 1722} {"train_loss": -6.011053085327148, "global_step": 72350, "epoch": 1722} {"train_loss": -6.031984806060791, "global_step": 72351, "epoch": 1722} {"train_loss": -6.059992790222168, "global_step": 72352, "epoch": 1722} {"train_loss": -6.093838691711426, "global_step": 72353, "epoch": 1722} {"train_loss": -5.977656364440918, "global_step": 72354, "epoch": 1722} {"train_loss": -6.043901443481445, "global_step": 72355, "epoch": 1722} {"train_loss": -6.078958511352539, "global_step": 72356, "epoch": 1722} {"train_loss": -6.065150737762451, "global_step": 72357, "epoch": 1722} {"train_loss": -6.032403945922852, "global_step": 72358, "epoch": 1722} {"train_loss": -5.966507911682129, "global_step": 72359, "epoch": 1722} {"train_loss": -6.040276050567627, "global_step": 72360, "epoch": 1722} {"train_loss": -5.994880676269531, "global_step": 72361, "epoch": 1722} {"train_loss": -6.107287406921387, "global_step": 72362, "epoch": 1722} {"train_loss": -6.0806379318237305, "global_step": 72363, "epoch": 1722} {"train_loss": -5.989931106567383, "global_step": 72364, "epoch": 1722} {"train_loss": -6.08113305909293, "global_step": 72365, "epoch": 1722, "val_loss": 61705.88671875} {"train_loss": -6.088253974914551, "global_step": 72366, "epoch": 1723} {"train_loss": -6.068698406219482, "global_step": 72367, "epoch": 1723} {"train_loss": -6.072193145751953, "global_step": 72368, "epoch": 1723} {"train_loss": -6.015969753265381, "global_step": 72369, "epoch": 1723} {"train_loss": -6.137031555175781, "global_step": 72370, "epoch": 1723} {"train_loss": -6.058181285858154, "global_step": 72371, "epoch": 1723} {"train_loss": -6.038905620574951, "global_step": 72372, "epoch": 1723} {"train_loss": -6.133294582366943, "global_step": 72373, "epoch": 1723} {"train_loss": -6.016776084899902, "global_step": 72374, "epoch": 1723} {"train_loss": -6.027029037475586, "global_step": 72375, "epoch": 1723} {"train_loss": -6.137516975402832, "global_step": 72376, "epoch": 1723} {"train_loss": -5.975159645080566, "global_step": 72377, "epoch": 1723} {"train_loss": -6.128274917602539, "global_step": 72378, "epoch": 1723} {"train_loss": -6.07775354385376, "global_step": 72379, "epoch": 1723} {"train_loss": -6.027314186096191, "global_step": 72380, "epoch": 1723} {"train_loss": -6.019357204437256, "global_step": 72381, "epoch": 1723} {"train_loss": -6.014726161956787, "global_step": 72382, "epoch": 1723} {"train_loss": -6.077855110168457, "global_step": 72383, "epoch": 1723} {"train_loss": -5.957413673400879, "global_step": 72384, "epoch": 1723} {"train_loss": -6.067386627197266, "global_step": 72385, "epoch": 1723} {"train_loss": -5.996298313140869, "global_step": 72386, "epoch": 1723} {"train_loss": -6.03713321685791, "global_step": 72387, "epoch": 1723} {"train_loss": -6.178863525390625, "global_step": 72388, "epoch": 1723} {"train_loss": -6.131304740905762, "global_step": 72389, "epoch": 1723} {"train_loss": -6.005610942840576, "global_step": 72390, "epoch": 1723} {"train_loss": -6.063481330871582, "global_step": 72391, "epoch": 1723} {"train_loss": -6.160238265991211, "global_step": 72392, "epoch": 1723} {"train_loss": -5.960321426391602, "global_step": 72393, "epoch": 1723} {"train_loss": -6.085819244384766, "global_step": 72394, "epoch": 1723} {"train_loss": -6.023948669433594, "global_step": 72395, "epoch": 1723} {"train_loss": -5.984406471252441, "global_step": 72396, "epoch": 1723} {"train_loss": -6.055980682373047, "global_step": 72397, "epoch": 1723} {"train_loss": -6.055258750915527, "global_step": 72398, "epoch": 1723} {"train_loss": -6.008283615112305, "global_step": 72399, "epoch": 1723} {"train_loss": -6.001852989196777, "global_step": 72400, "epoch": 1723} {"train_loss": -6.020549774169922, "global_step": 72401, "epoch": 1723} {"train_loss": -6.052435874938965, "global_step": 72402, "epoch": 1723} {"train_loss": -6.034215927124023, "global_step": 72403, "epoch": 1723} {"train_loss": -6.104053497314453, "global_step": 72404, "epoch": 1723} {"train_loss": -6.111814498901367, "global_step": 72405, "epoch": 1723} {"train_loss": -5.983488082885742, "global_step": 72406, "epoch": 1723} {"train_loss": -6.053612561452956, "global_step": 72407, "epoch": 1723, "val_loss": 61944.66796875} {"train_loss": -6.07421875, "global_step": 72408, "epoch": 1724} {"train_loss": -6.167787551879883, "global_step": 72409, "epoch": 1724} {"train_loss": -5.997361183166504, "global_step": 72410, "epoch": 1724} {"train_loss": -6.065781593322754, "global_step": 72411, "epoch": 1724} {"train_loss": -6.1959757804870605, "global_step": 72412, "epoch": 1724} {"train_loss": -6.0859904289245605, "global_step": 72413, "epoch": 1724} {"train_loss": -5.88116979598999, "global_step": 72414, "epoch": 1724} {"train_loss": -5.990720748901367, "global_step": 72415, "epoch": 1724} {"train_loss": -6.02985143661499, "global_step": 72416, "epoch": 1724} {"train_loss": -6.162051200866699, "global_step": 72417, "epoch": 1724} {"train_loss": -6.067501068115234, "global_step": 72418, "epoch": 1724} {"train_loss": -6.038177490234375, "global_step": 72419, "epoch": 1724} {"train_loss": -5.987032890319824, "global_step": 72420, "epoch": 1724} {"train_loss": -5.98320198059082, "global_step": 72421, "epoch": 1724} {"train_loss": -6.095699310302734, "global_step": 72422, "epoch": 1724} {"train_loss": -6.111978530883789, "global_step": 72423, "epoch": 1724} {"train_loss": -6.119239807128906, "global_step": 72424, "epoch": 1724} {"train_loss": -5.986849784851074, "global_step": 72425, "epoch": 1724} {"train_loss": -5.972838878631592, "global_step": 72426, "epoch": 1724} {"train_loss": -6.0585198402404785, "global_step": 72427, "epoch": 1724} {"train_loss": -6.067595958709717, "global_step": 72428, "epoch": 1724} {"train_loss": -5.95619010925293, "global_step": 72429, "epoch": 1724} {"train_loss": -6.180271148681641, "global_step": 72430, "epoch": 1724} {"train_loss": -6.067508697509766, "global_step": 72431, "epoch": 1724} {"train_loss": -6.104160308837891, "global_step": 72432, "epoch": 1724} {"train_loss": -6.077136039733887, "global_step": 72433, "epoch": 1724} {"train_loss": -6.127928733825684, "global_step": 72434, "epoch": 1724} {"train_loss": -6.158936500549316, "global_step": 72435, "epoch": 1724} {"train_loss": -6.126020908355713, "global_step": 72436, "epoch": 1724} {"train_loss": -6.082271099090576, "global_step": 72437, "epoch": 1724} {"train_loss": -6.113661766052246, "global_step": 72438, "epoch": 1724} {"train_loss": -6.123375415802002, "global_step": 72439, "epoch": 1724} {"train_loss": -6.1200408935546875, "global_step": 72440, "epoch": 1724} {"train_loss": -6.058586120605469, "global_step": 72441, "epoch": 1724} {"train_loss": -6.0519866943359375, "global_step": 72442, "epoch": 1724} {"train_loss": -5.933471202850342, "global_step": 72443, "epoch": 1724} {"train_loss": -6.035790920257568, "global_step": 72444, "epoch": 1724} {"train_loss": -6.006955146789551, "global_step": 72445, "epoch": 1724} {"train_loss": -6.068373680114746, "global_step": 72446, "epoch": 1724} {"train_loss": -6.063444137573242, "global_step": 72447, "epoch": 1724} {"train_loss": -6.076709747314453, "global_step": 72448, "epoch": 1724} {"train_loss": -6.067881652287075, "global_step": 72449, "epoch": 1724, "val_loss": 61854.234375} {"train_loss": -6.18387508392334, "global_step": 72450, "epoch": 1725} {"train_loss": -6.134487152099609, "global_step": 72451, "epoch": 1725} {"train_loss": -6.09926700592041, "global_step": 72452, "epoch": 1725} {"train_loss": -6.108524799346924, "global_step": 72453, "epoch": 1725} {"train_loss": -6.107260227203369, "global_step": 72454, "epoch": 1725} {"train_loss": -6.041478157043457, "global_step": 72455, "epoch": 1725} {"train_loss": -6.0281267166137695, "global_step": 72456, "epoch": 1725} {"train_loss": -6.048846244812012, "global_step": 72457, "epoch": 1725} {"train_loss": -5.981804370880127, "global_step": 72458, "epoch": 1725} {"train_loss": -5.93214225769043, "global_step": 72459, "epoch": 1725} {"train_loss": -6.092033386230469, "global_step": 72460, "epoch": 1725} {"train_loss": -6.066852569580078, "global_step": 72461, "epoch": 1725} {"train_loss": -5.994570255279541, "global_step": 72462, "epoch": 1725} {"train_loss": -5.961439609527588, "global_step": 72463, "epoch": 1725} {"train_loss": -6.082971572875977, "global_step": 72464, "epoch": 1725} {"train_loss": -6.064482688903809, "global_step": 72465, "epoch": 1725} {"train_loss": -6.018692970275879, "global_step": 72466, "epoch": 1725} {"train_loss": -6.0481486320495605, "global_step": 72467, "epoch": 1725} {"train_loss": -5.916299819946289, "global_step": 72468, "epoch": 1725} {"train_loss": -6.135345458984375, "global_step": 72469, "epoch": 1725} {"train_loss": -5.935216903686523, "global_step": 72470, "epoch": 1725} {"train_loss": -6.0242767333984375, "global_step": 72471, "epoch": 1725} {"train_loss": -6.034147262573242, "global_step": 72472, "epoch": 1725} {"train_loss": -5.898030757904053, "global_step": 72473, "epoch": 1725} {"train_loss": -5.982662677764893, "global_step": 72474, "epoch": 1725} {"train_loss": -5.970359802246094, "global_step": 72475, "epoch": 1725} {"train_loss": -6.074406623840332, "global_step": 72476, "epoch": 1725} {"train_loss": -6.060907363891602, "global_step": 72477, "epoch": 1725} {"train_loss": -5.993116855621338, "global_step": 72478, "epoch": 1725} {"train_loss": -6.054241180419922, "global_step": 72479, "epoch": 1725} {"train_loss": -5.87571907043457, "global_step": 72480, "epoch": 1725} {"train_loss": -6.0105462074279785, "global_step": 72481, "epoch": 1725} {"train_loss": -5.9673566818237305, "global_step": 72482, "epoch": 1725} {"train_loss": -5.955211639404297, "global_step": 72483, "epoch": 1725} {"train_loss": -5.922410488128662, "global_step": 72484, "epoch": 1725} {"train_loss": -5.979641437530518, "global_step": 72485, "epoch": 1725} {"train_loss": -6.0433030128479, "global_step": 72486, "epoch": 1725} {"train_loss": -6.0418219566345215, "global_step": 72487, "epoch": 1725} {"train_loss": -6.076092720031738, "global_step": 72488, "epoch": 1725} {"train_loss": -6.0448713302612305, "global_step": 72489, "epoch": 1725} {"train_loss": -5.991006374359131, "global_step": 72490, "epoch": 1725} {"train_loss": -6.022982756296794, "global_step": 72491, "epoch": 1725, "val_loss": 61847.140625} {"train_loss": -5.915973663330078, "global_step": 72492, "epoch": 1726} {"train_loss": -6.045164108276367, "global_step": 72493, "epoch": 1726} {"train_loss": -5.929714202880859, "global_step": 72494, "epoch": 1726} {"train_loss": -6.1286301612854, "global_step": 72495, "epoch": 1726} {"train_loss": -6.078167915344238, "global_step": 72496, "epoch": 1726} {"train_loss": -6.0986647605896, "global_step": 72497, "epoch": 1726} {"train_loss": -6.015524864196777, "global_step": 72498, "epoch": 1726} {"train_loss": -6.056914329528809, "global_step": 72499, "epoch": 1726} {"train_loss": -6.100522041320801, "global_step": 72500, "epoch": 1726} {"train_loss": -6.143036842346191, "global_step": 72501, "epoch": 1726} {"train_loss": -6.086796760559082, "global_step": 72502, "epoch": 1726} {"train_loss": -6.0834503173828125, "global_step": 72503, "epoch": 1726} {"train_loss": -5.9984822273254395, "global_step": 72504, "epoch": 1726} {"train_loss": -5.979301452636719, "global_step": 72505, "epoch": 1726} {"train_loss": -5.893464088439941, "global_step": 72506, "epoch": 1726} {"train_loss": -6.196165084838867, "global_step": 72507, "epoch": 1726} {"train_loss": -6.111433982849121, "global_step": 72508, "epoch": 1726} {"train_loss": -5.976252555847168, "global_step": 72509, "epoch": 1726} {"train_loss": -6.056188106536865, "global_step": 72510, "epoch": 1726} {"train_loss": -6.1237287521362305, "global_step": 72511, "epoch": 1726} {"train_loss": -5.967062950134277, "global_step": 72512, "epoch": 1726} {"train_loss": -6.114229202270508, "global_step": 72513, "epoch": 1726} {"train_loss": -6.139954566955566, "global_step": 72514, "epoch": 1726} {"train_loss": -6.145511627197266, "global_step": 72515, "epoch": 1726} {"train_loss": -5.997134208679199, "global_step": 72516, "epoch": 1726} {"train_loss": -6.0150604248046875, "global_step": 72517, "epoch": 1726} {"train_loss": -5.913887977600098, "global_step": 72518, "epoch": 1726} {"train_loss": -5.945117950439453, "global_step": 72519, "epoch": 1726} {"train_loss": -5.970300197601318, "global_step": 72520, "epoch": 1726} {"train_loss": -6.030425071716309, "global_step": 72521, "epoch": 1726} {"train_loss": -5.8747100830078125, "global_step": 72522, "epoch": 1726} {"train_loss": -6.0555620193481445, "global_step": 72523, "epoch": 1726} {"train_loss": -5.934934616088867, "global_step": 72524, "epoch": 1726} {"train_loss": -5.965036392211914, "global_step": 72525, "epoch": 1726} {"train_loss": -6.003469944000244, "global_step": 72526, "epoch": 1726} {"train_loss": -6.022830963134766, "global_step": 72527, "epoch": 1726} {"train_loss": -5.962209224700928, "global_step": 72528, "epoch": 1726} {"train_loss": -6.032655715942383, "global_step": 72529, "epoch": 1726} {"train_loss": -6.047344207763672, "global_step": 72530, "epoch": 1726} {"train_loss": -5.97401237487793, "global_step": 72531, "epoch": 1726} {"train_loss": -6.001550674438477, "global_step": 72532, "epoch": 1726} {"train_loss": -6.027418306895664, "global_step": 72533, "epoch": 1726, "val_loss": 61908.98046875} {"train_loss": -6.053443908691406, "global_step": 72534, "epoch": 1727} {"train_loss": -6.062109470367432, "global_step": 72535, "epoch": 1727} {"train_loss": -6.068683624267578, "global_step": 72536, "epoch": 1727} {"train_loss": -6.1191816329956055, "global_step": 72537, "epoch": 1727} {"train_loss": -5.96166467666626, "global_step": 72538, "epoch": 1727} {"train_loss": -6.065999984741211, "global_step": 72539, "epoch": 1727} {"train_loss": -5.885976791381836, "global_step": 72540, "epoch": 1727} {"train_loss": -5.977374076843262, "global_step": 72541, "epoch": 1727} {"train_loss": -6.043949604034424, "global_step": 72542, "epoch": 1727} {"train_loss": -6.070799350738525, "global_step": 72543, "epoch": 1727} {"train_loss": -5.965134620666504, "global_step": 72544, "epoch": 1727} {"train_loss": -5.987605094909668, "global_step": 72545, "epoch": 1727} {"train_loss": -6.088234901428223, "global_step": 72546, "epoch": 1727} {"train_loss": -5.996984958648682, "global_step": 72547, "epoch": 1727} {"train_loss": -5.958507537841797, "global_step": 72548, "epoch": 1727} {"train_loss": -5.961267471313477, "global_step": 72549, "epoch": 1727} {"train_loss": -6.030981063842773, "global_step": 72550, "epoch": 1727} {"train_loss": -6.067972183227539, "global_step": 72551, "epoch": 1727} {"train_loss": -5.930500030517578, "global_step": 72552, "epoch": 1727} {"train_loss": -6.128294467926025, "global_step": 72553, "epoch": 1727} {"train_loss": -6.078515529632568, "global_step": 72554, "epoch": 1727} {"train_loss": -6.099363803863525, "global_step": 72555, "epoch": 1727} {"train_loss": -6.072021961212158, "global_step": 72556, "epoch": 1727} {"train_loss": -6.073660850524902, "global_step": 72557, "epoch": 1727} {"train_loss": -6.013631820678711, "global_step": 72558, "epoch": 1727} {"train_loss": -6.088817596435547, "global_step": 72559, "epoch": 1727} {"train_loss": -6.155330657958984, "global_step": 72560, "epoch": 1727} {"train_loss": -6.000155925750732, "global_step": 72561, "epoch": 1727} {"train_loss": -6.039103984832764, "global_step": 72562, "epoch": 1727} {"train_loss": -6.013916969299316, "global_step": 72563, "epoch": 1727} {"train_loss": -6.115873336791992, "global_step": 72564, "epoch": 1727} {"train_loss": -6.028743743896484, "global_step": 72565, "epoch": 1727} {"train_loss": -6.095709800720215, "global_step": 72566, "epoch": 1727} {"train_loss": -6.11779260635376, "global_step": 72567, "epoch": 1727} {"train_loss": -6.073321342468262, "global_step": 72568, "epoch": 1727} {"train_loss": -6.03832483291626, "global_step": 72569, "epoch": 1727} {"train_loss": -6.181807041168213, "global_step": 72570, "epoch": 1727} {"train_loss": -6.163286209106445, "global_step": 72571, "epoch": 1727} {"train_loss": -6.050180435180664, "global_step": 72572, "epoch": 1727} {"train_loss": -6.116695404052734, "global_step": 72573, "epoch": 1727} {"train_loss": -6.063503265380859, "global_step": 72574, "epoch": 1727} {"train_loss": -6.050437314169748, "global_step": 72575, "epoch": 1727, "val_loss": 61663.2109375} {"train_loss": -6.122744083404541, "global_step": 72576, "epoch": 1728} {"train_loss": -5.951942443847656, "global_step": 72577, "epoch": 1728} {"train_loss": -6.159884452819824, "global_step": 72578, "epoch": 1728} {"train_loss": -6.0521345138549805, "global_step": 72579, "epoch": 1728} {"train_loss": -6.070233345031738, "global_step": 72580, "epoch": 1728} {"train_loss": -6.112266540527344, "global_step": 72581, "epoch": 1728} {"train_loss": -6.040409564971924, "global_step": 72582, "epoch": 1728} {"train_loss": -6.1172099113464355, "global_step": 72583, "epoch": 1728} {"train_loss": -5.9474897384643555, "global_step": 72584, "epoch": 1728} {"train_loss": -6.100497722625732, "global_step": 72585, "epoch": 1728} {"train_loss": -6.133341312408447, "global_step": 72586, "epoch": 1728} {"train_loss": -6.061700820922852, "global_step": 72587, "epoch": 1728} {"train_loss": -6.086870193481445, "global_step": 72588, "epoch": 1728} {"train_loss": -6.168428421020508, "global_step": 72589, "epoch": 1728} {"train_loss": -6.025286674499512, "global_step": 72590, "epoch": 1728} {"train_loss": -6.093987464904785, "global_step": 72591, "epoch": 1728} {"train_loss": -6.084436416625977, "global_step": 72592, "epoch": 1728} {"train_loss": -5.929681777954102, "global_step": 72593, "epoch": 1728} {"train_loss": -6.067119598388672, "global_step": 72594, "epoch": 1728} {"train_loss": -6.175731182098389, "global_step": 72595, "epoch": 1728} {"train_loss": -6.054708480834961, "global_step": 72596, "epoch": 1728} {"train_loss": -6.042911529541016, "global_step": 72597, "epoch": 1728} {"train_loss": -6.098840713500977, "global_step": 72598, "epoch": 1728} {"train_loss": -6.159316539764404, "global_step": 72599, "epoch": 1728} {"train_loss": -6.076216697692871, "global_step": 72600, "epoch": 1728} {"train_loss": -6.152663707733154, "global_step": 72601, "epoch": 1728} {"train_loss": -5.964232444763184, "global_step": 72602, "epoch": 1728} {"train_loss": -5.974915981292725, "global_step": 72603, "epoch": 1728} {"train_loss": -5.988058090209961, "global_step": 72604, "epoch": 1728} {"train_loss": -6.066601276397705, "global_step": 72605, "epoch": 1728} {"train_loss": -6.11407995223999, "global_step": 72606, "epoch": 1728} {"train_loss": -5.977001190185547, "global_step": 72607, "epoch": 1728} {"train_loss": -6.060044288635254, "global_step": 72608, "epoch": 1728} {"train_loss": -6.139508247375488, "global_step": 72609, "epoch": 1728} {"train_loss": -6.036052703857422, "global_step": 72610, "epoch": 1728} {"train_loss": -6.042098045349121, "global_step": 72611, "epoch": 1728} {"train_loss": -6.113534927368164, "global_step": 72612, "epoch": 1728} {"train_loss": -5.988560676574707, "global_step": 72613, "epoch": 1728} {"train_loss": -6.0414628982543945, "global_step": 72614, "epoch": 1728} {"train_loss": -6.089385509490967, "global_step": 72615, "epoch": 1728} {"train_loss": -6.041178226470947, "global_step": 72616, "epoch": 1728} {"train_loss": -6.065611078625634, "global_step": 72617, "epoch": 1728, "val_loss": 61664.16015625} {"train_loss": -5.997166633605957, "global_step": 72618, "epoch": 1729} {"train_loss": -6.069764137268066, "global_step": 72619, "epoch": 1729} {"train_loss": -6.090320110321045, "global_step": 72620, "epoch": 1729} {"train_loss": -6.167246341705322, "global_step": 72621, "epoch": 1729} {"train_loss": -6.145947456359863, "global_step": 72622, "epoch": 1729} {"train_loss": -6.177732467651367, "global_step": 72623, "epoch": 1729} {"train_loss": -6.095977783203125, "global_step": 72624, "epoch": 1729} {"train_loss": -5.952764987945557, "global_step": 72625, "epoch": 1729} {"train_loss": -6.015864372253418, "global_step": 72626, "epoch": 1729} {"train_loss": -5.99668025970459, "global_step": 72627, "epoch": 1729} {"train_loss": -6.1118879318237305, "global_step": 72628, "epoch": 1729} {"train_loss": -6.072768211364746, "global_step": 72629, "epoch": 1729} {"train_loss": -6.04090690612793, "global_step": 72630, "epoch": 1729} {"train_loss": -6.070580005645752, "global_step": 72631, "epoch": 1729} {"train_loss": -6.121255874633789, "global_step": 72632, "epoch": 1729} {"train_loss": -6.228408336639404, "global_step": 72633, "epoch": 1729} {"train_loss": -6.169112205505371, "global_step": 72634, "epoch": 1729} {"train_loss": -6.0332465171813965, "global_step": 72635, "epoch": 1729} {"train_loss": -6.041203498840332, "global_step": 72636, "epoch": 1729} {"train_loss": -6.01878023147583, "global_step": 72637, "epoch": 1729} {"train_loss": -6.1502156257629395, "global_step": 72638, "epoch": 1729} {"train_loss": -6.039374828338623, "global_step": 72639, "epoch": 1729} {"train_loss": -5.988979339599609, "global_step": 72640, "epoch": 1729} {"train_loss": -6.076845169067383, "global_step": 72641, "epoch": 1729} {"train_loss": -6.029152870178223, "global_step": 72642, "epoch": 1729} {"train_loss": -6.080357551574707, "global_step": 72643, "epoch": 1729} {"train_loss": -6.01978063583374, "global_step": 72644, "epoch": 1729} {"train_loss": -6.03184700012207, "global_step": 72645, "epoch": 1729} {"train_loss": -5.984480381011963, "global_step": 72646, "epoch": 1729} {"train_loss": -6.0250115394592285, "global_step": 72647, "epoch": 1729} {"train_loss": -5.988886833190918, "global_step": 72648, "epoch": 1729} {"train_loss": -5.956348896026611, "global_step": 72649, "epoch": 1729} {"train_loss": -5.93521785736084, "global_step": 72650, "epoch": 1729} {"train_loss": -6.076117992401123, "global_step": 72651, "epoch": 1729} {"train_loss": -5.885335922241211, "global_step": 72652, "epoch": 1729} {"train_loss": -5.966879844665527, "global_step": 72653, "epoch": 1729} {"train_loss": -6.000816822052002, "global_step": 72654, "epoch": 1729} {"train_loss": -5.970117568969727, "global_step": 72655, "epoch": 1729} {"train_loss": -6.0676140785217285, "global_step": 72656, "epoch": 1729} {"train_loss": -5.9704108238220215, "global_step": 72657, "epoch": 1729} {"train_loss": -5.947864532470703, "global_step": 72658, "epoch": 1729} {"train_loss": -6.046015659968059, "global_step": 72659, "epoch": 1729, "val_loss": 62119.609375} {"train_loss": -6.020191192626953, "global_step": 72660, "epoch": 1730} {"train_loss": -6.058521270751953, "global_step": 72661, "epoch": 1730} {"train_loss": -6.063359260559082, "global_step": 72662, "epoch": 1730} {"train_loss": -5.9141340255737305, "global_step": 72663, "epoch": 1730} {"train_loss": -6.006516456604004, "global_step": 72664, "epoch": 1730} {"train_loss": -5.976630210876465, "global_step": 72665, "epoch": 1730} {"train_loss": -6.0807342529296875, "global_step": 72666, "epoch": 1730} {"train_loss": -6.073012351989746, "global_step": 72667, "epoch": 1730} {"train_loss": -6.0158514976501465, "global_step": 72668, "epoch": 1730} {"train_loss": -6.02110481262207, "global_step": 72669, "epoch": 1730} {"train_loss": -5.938684463500977, "global_step": 72670, "epoch": 1730} {"train_loss": -6.106618404388428, "global_step": 72671, "epoch": 1730} {"train_loss": -5.957300662994385, "global_step": 72672, "epoch": 1730} {"train_loss": -6.098254203796387, "global_step": 72673, "epoch": 1730} {"train_loss": -6.037236213684082, "global_step": 72674, "epoch": 1730} {"train_loss": -6.074554443359375, "global_step": 72675, "epoch": 1730} {"train_loss": -6.101645469665527, "global_step": 72676, "epoch": 1730} {"train_loss": -6.088875770568848, "global_step": 72677, "epoch": 1730} {"train_loss": -5.935240745544434, "global_step": 72678, "epoch": 1730} {"train_loss": -6.0595703125, "global_step": 72679, "epoch": 1730} {"train_loss": -6.062536239624023, "global_step": 72680, "epoch": 1730} {"train_loss": -6.050804138183594, "global_step": 72681, "epoch": 1730} {"train_loss": -6.036984443664551, "global_step": 72682, "epoch": 1730} {"train_loss": -5.982099533081055, "global_step": 72683, "epoch": 1730} {"train_loss": -6.087216377258301, "global_step": 72684, "epoch": 1730} {"train_loss": -6.094212055206299, "global_step": 72685, "epoch": 1730} {"train_loss": -6.075746536254883, "global_step": 72686, "epoch": 1730} {"train_loss": -6.055819511413574, "global_step": 72687, "epoch": 1730} {"train_loss": -6.036230087280273, "global_step": 72688, "epoch": 1730} {"train_loss": -6.038332939147949, "global_step": 72689, "epoch": 1730} {"train_loss": -5.993372440338135, "global_step": 72690, "epoch": 1730} {"train_loss": -6.1401495933532715, "global_step": 72691, "epoch": 1730} {"train_loss": -6.060918807983398, "global_step": 72692, "epoch": 1730} {"train_loss": -6.175734519958496, "global_step": 72693, "epoch": 1730} {"train_loss": -5.953203201293945, "global_step": 72694, "epoch": 1730} {"train_loss": -6.065025806427002, "global_step": 72695, "epoch": 1730} {"train_loss": -5.973155975341797, "global_step": 72696, "epoch": 1730} {"train_loss": -5.931456565856934, "global_step": 72697, "epoch": 1730} {"train_loss": -5.980445861816406, "global_step": 72698, "epoch": 1730} {"train_loss": -6.00440788269043, "global_step": 72699, "epoch": 1730} {"train_loss": -6.146188259124756, "global_step": 72700, "epoch": 1730} {"train_loss": -6.037525744665237, "global_step": 72701, "epoch": 1730, "val_loss": 61915.58203125} {"train_loss": -6.094448089599609, "global_step": 72702, "epoch": 1731} {"train_loss": -6.025084972381592, "global_step": 72703, "epoch": 1731} {"train_loss": -6.05460262298584, "global_step": 72704, "epoch": 1731} {"train_loss": -6.037773132324219, "global_step": 72705, "epoch": 1731} {"train_loss": -6.122142791748047, "global_step": 72706, "epoch": 1731} {"train_loss": -5.887372970581055, "global_step": 72707, "epoch": 1731} {"train_loss": -5.945354461669922, "global_step": 72708, "epoch": 1731} {"train_loss": -6.032765865325928, "global_step": 72709, "epoch": 1731} {"train_loss": -6.158982276916504, "global_step": 72710, "epoch": 1731} {"train_loss": -6.12977409362793, "global_step": 72711, "epoch": 1731} {"train_loss": -6.13665771484375, "global_step": 72712, "epoch": 1731} {"train_loss": -6.053924560546875, "global_step": 72713, "epoch": 1731} {"train_loss": -6.072820663452148, "global_step": 72714, "epoch": 1731} {"train_loss": -6.149164199829102, "global_step": 72715, "epoch": 1731} {"train_loss": -6.128914833068848, "global_step": 72716, "epoch": 1731} {"train_loss": -6.062554836273193, "global_step": 72717, "epoch": 1731} {"train_loss": -6.011590003967285, "global_step": 72718, "epoch": 1731} {"train_loss": -6.002768516540527, "global_step": 72719, "epoch": 1731} {"train_loss": -6.116745948791504, "global_step": 72720, "epoch": 1731} {"train_loss": -6.05281925201416, "global_step": 72721, "epoch": 1731} {"train_loss": -5.9808349609375, "global_step": 72722, "epoch": 1731} {"train_loss": -6.148992538452148, "global_step": 72723, "epoch": 1731} {"train_loss": -6.051357269287109, "global_step": 72724, "epoch": 1731} {"train_loss": -6.0732808113098145, "global_step": 72725, "epoch": 1731} {"train_loss": -6.130463600158691, "global_step": 72726, "epoch": 1731} {"train_loss": -6.037801742553711, "global_step": 72727, "epoch": 1731} {"train_loss": -5.942276477813721, "global_step": 72728, "epoch": 1731} {"train_loss": -6.062910079956055, "global_step": 72729, "epoch": 1731} {"train_loss": -6.0564093589782715, "global_step": 72730, "epoch": 1731} {"train_loss": -6.103524208068848, "global_step": 72731, "epoch": 1731} {"train_loss": -6.0489583015441895, "global_step": 72732, "epoch": 1731} {"train_loss": -6.169094562530518, "global_step": 72733, "epoch": 1731} {"train_loss": -5.947727203369141, "global_step": 72734, "epoch": 1731} {"train_loss": -6.1128950119018555, "global_step": 72735, "epoch": 1731} {"train_loss": -6.101881980895996, "global_step": 72736, "epoch": 1731} {"train_loss": -6.0090155601501465, "global_step": 72737, "epoch": 1731} {"train_loss": -6.0341949462890625, "global_step": 72738, "epoch": 1731} {"train_loss": -6.034360885620117, "global_step": 72739, "epoch": 1731} {"train_loss": -5.934002876281738, "global_step": 72740, "epoch": 1731} {"train_loss": -6.117656230926514, "global_step": 72741, "epoch": 1731} {"train_loss": -6.078282356262207, "global_step": 72742, "epoch": 1731} {"train_loss": -6.058058034806025, "global_step": 72743, "epoch": 1731, "val_loss": 61740.90234375} {"train_loss": -6.072229385375977, "global_step": 72744, "epoch": 1732} {"train_loss": -6.0839643478393555, "global_step": 72745, "epoch": 1732} {"train_loss": -6.138125419616699, "global_step": 72746, "epoch": 1732} {"train_loss": -6.094128608703613, "global_step": 72747, "epoch": 1732} {"train_loss": -6.032756805419922, "global_step": 72748, "epoch": 1732} {"train_loss": -6.006936073303223, "global_step": 72749, "epoch": 1732} {"train_loss": -6.050941467285156, "global_step": 72750, "epoch": 1732} {"train_loss": -6.192388534545898, "global_step": 72751, "epoch": 1732} {"train_loss": -6.0783891677856445, "global_step": 72752, "epoch": 1732} {"train_loss": -5.965815544128418, "global_step": 72753, "epoch": 1732} {"train_loss": -5.923430919647217, "global_step": 72754, "epoch": 1732} {"train_loss": -6.0436906814575195, "global_step": 72755, "epoch": 1732} {"train_loss": -6.072893142700195, "global_step": 72756, "epoch": 1732} {"train_loss": -6.111282825469971, "global_step": 72757, "epoch": 1732} {"train_loss": -6.065832614898682, "global_step": 72758, "epoch": 1732} {"train_loss": -6.053402423858643, "global_step": 72759, "epoch": 1732} {"train_loss": -6.031868934631348, "global_step": 72760, "epoch": 1732} {"train_loss": -6.003950119018555, "global_step": 72761, "epoch": 1732} {"train_loss": -6.15000057220459, "global_step": 72762, "epoch": 1732} {"train_loss": -6.062027454376221, "global_step": 72763, "epoch": 1732} {"train_loss": -6.087863922119141, "global_step": 72764, "epoch": 1732} {"train_loss": -5.875509262084961, "global_step": 72765, "epoch": 1732} {"train_loss": -5.987861633300781, "global_step": 72766, "epoch": 1732} {"train_loss": -6.107827663421631, "global_step": 72767, "epoch": 1732} {"train_loss": -6.064410209655762, "global_step": 72768, "epoch": 1732} {"train_loss": -6.070237636566162, "global_step": 72769, "epoch": 1732} {"train_loss": -6.088224411010742, "global_step": 72770, "epoch": 1732} {"train_loss": -6.1481523513793945, "global_step": 72771, "epoch": 1732} {"train_loss": -6.229222297668457, "global_step": 72772, "epoch": 1732} {"train_loss": -6.1496429443359375, "global_step": 72773, "epoch": 1732} {"train_loss": -6.099730014801025, "global_step": 72774, "epoch": 1732} {"train_loss": -6.185211181640625, "global_step": 72775, "epoch": 1732} {"train_loss": -6.063595294952393, "global_step": 72776, "epoch": 1732} {"train_loss": -6.051643371582031, "global_step": 72777, "epoch": 1732} {"train_loss": -6.165532112121582, "global_step": 72778, "epoch": 1732} {"train_loss": -6.131038665771484, "global_step": 72779, "epoch": 1732} {"train_loss": -6.170295715332031, "global_step": 72780, "epoch": 1732} {"train_loss": -6.121685981750488, "global_step": 72781, "epoch": 1732} {"train_loss": -6.073553085327148, "global_step": 72782, "epoch": 1732} {"train_loss": -6.083531379699707, "global_step": 72783, "epoch": 1732} {"train_loss": -6.173225402832031, "global_step": 72784, "epoch": 1732} {"train_loss": -6.08357606615339, "global_step": 72785, "epoch": 1732, "val_loss": 61910.29296875} {"train_loss": -5.97382926940918, "global_step": 72786, "epoch": 1733} {"train_loss": -5.966358184814453, "global_step": 72787, "epoch": 1733} {"train_loss": -6.073473930358887, "global_step": 72788, "epoch": 1733} {"train_loss": -6.113160133361816, "global_step": 72789, "epoch": 1733} {"train_loss": -6.193097114562988, "global_step": 72790, "epoch": 1733} {"train_loss": -6.1056952476501465, "global_step": 72791, "epoch": 1733} {"train_loss": -6.007232666015625, "global_step": 72792, "epoch": 1733} {"train_loss": -6.139187335968018, "global_step": 72793, "epoch": 1733} {"train_loss": -6.131921291351318, "global_step": 72794, "epoch": 1733} {"train_loss": -6.064218521118164, "global_step": 72795, "epoch": 1733} {"train_loss": -5.987208366394043, "global_step": 72796, "epoch": 1733} {"train_loss": -6.035685062408447, "global_step": 72797, "epoch": 1733} {"train_loss": -6.073177337646484, "global_step": 72798, "epoch": 1733} {"train_loss": -6.057255744934082, "global_step": 72799, "epoch": 1733} {"train_loss": -6.199245929718018, "global_step": 72800, "epoch": 1733} {"train_loss": -6.0980730056762695, "global_step": 72801, "epoch": 1733} {"train_loss": -6.070068359375, "global_step": 72802, "epoch": 1733} {"train_loss": -6.046058654785156, "global_step": 72803, "epoch": 1733} {"train_loss": -6.006039619445801, "global_step": 72804, "epoch": 1733} {"train_loss": -6.000940799713135, "global_step": 72805, "epoch": 1733} {"train_loss": -6.003971099853516, "global_step": 72806, "epoch": 1733} {"train_loss": -5.927765369415283, "global_step": 72807, "epoch": 1733} {"train_loss": -5.966799736022949, "global_step": 72808, "epoch": 1733} {"train_loss": -6.151844024658203, "global_step": 72809, "epoch": 1733} {"train_loss": -5.936471462249756, "global_step": 72810, "epoch": 1733} {"train_loss": -6.034012794494629, "global_step": 72811, "epoch": 1733} {"train_loss": -6.095439910888672, "global_step": 72812, "epoch": 1733} {"train_loss": -5.992807388305664, "global_step": 72813, "epoch": 1733} {"train_loss": -6.024981498718262, "global_step": 72814, "epoch": 1733} {"train_loss": -6.100832939147949, "global_step": 72815, "epoch": 1733} {"train_loss": -6.01983642578125, "global_step": 72816, "epoch": 1733} {"train_loss": -5.93388032913208, "global_step": 72817, "epoch": 1733} {"train_loss": -6.086416244506836, "global_step": 72818, "epoch": 1733} {"train_loss": -6.062493324279785, "global_step": 72819, "epoch": 1733} {"train_loss": -5.997461795806885, "global_step": 72820, "epoch": 1733} {"train_loss": -6.076160907745361, "global_step": 72821, "epoch": 1733} {"train_loss": -5.983542442321777, "global_step": 72822, "epoch": 1733} {"train_loss": -6.120162487030029, "global_step": 72823, "epoch": 1733} {"train_loss": -6.194944381713867, "global_step": 72824, "epoch": 1733} {"train_loss": -6.191404342651367, "global_step": 72825, "epoch": 1733} {"train_loss": -6.098226070404053, "global_step": 72826, "epoch": 1733} {"train_loss": -6.057541222799392, "global_step": 72827, "epoch": 1733, "val_loss": 61872.5703125} {"train_loss": -6.080207824707031, "global_step": 72828, "epoch": 1734} {"train_loss": -5.966433525085449, "global_step": 72829, "epoch": 1734} {"train_loss": -6.051007270812988, "global_step": 72830, "epoch": 1734} {"train_loss": -6.149616241455078, "global_step": 72831, "epoch": 1734} {"train_loss": -6.149316787719727, "global_step": 72832, "epoch": 1734} {"train_loss": -6.14054536819458, "global_step": 72833, "epoch": 1734} {"train_loss": -6.036959648132324, "global_step": 72834, "epoch": 1734} {"train_loss": -5.936638832092285, "global_step": 72835, "epoch": 1734} {"train_loss": -6.108840465545654, "global_step": 72836, "epoch": 1734} {"train_loss": -6.003798007965088, "global_step": 72837, "epoch": 1734} {"train_loss": -6.105674743652344, "global_step": 72838, "epoch": 1734} {"train_loss": -5.916280269622803, "global_step": 72839, "epoch": 1734} {"train_loss": -5.913610935211182, "global_step": 72840, "epoch": 1734} {"train_loss": -6.118657112121582, "global_step": 72841, "epoch": 1734} {"train_loss": -5.964863300323486, "global_step": 72842, "epoch": 1734} {"train_loss": -5.997457504272461, "global_step": 72843, "epoch": 1734} {"train_loss": -6.070556163787842, "global_step": 72844, "epoch": 1734} {"train_loss": -5.946967124938965, "global_step": 72845, "epoch": 1734} {"train_loss": -6.16826057434082, "global_step": 72846, "epoch": 1734} {"train_loss": -5.965687274932861, "global_step": 72847, "epoch": 1734} {"train_loss": -6.052975654602051, "global_step": 72848, "epoch": 1734} {"train_loss": -6.153512001037598, "global_step": 72849, "epoch": 1734} {"train_loss": -6.108993053436279, "global_step": 72850, "epoch": 1734} {"train_loss": -6.128006935119629, "global_step": 72851, "epoch": 1734} {"train_loss": -5.904636383056641, "global_step": 72852, "epoch": 1734} {"train_loss": -6.024040222167969, "global_step": 72853, "epoch": 1734} {"train_loss": -6.204215049743652, "global_step": 72854, "epoch": 1734} {"train_loss": -6.0202741622924805, "global_step": 72855, "epoch": 1734} {"train_loss": -6.1079559326171875, "global_step": 72856, "epoch": 1734} {"train_loss": -6.0885419845581055, "global_step": 72857, "epoch": 1734} {"train_loss": -6.0998687744140625, "global_step": 72858, "epoch": 1734} {"train_loss": -6.0811614990234375, "global_step": 72859, "epoch": 1734} {"train_loss": -6.087154865264893, "global_step": 72860, "epoch": 1734} {"train_loss": -6.024287223815918, "global_step": 72861, "epoch": 1734} {"train_loss": -6.154516220092773, "global_step": 72862, "epoch": 1734} {"train_loss": -6.1131110191345215, "global_step": 72863, "epoch": 1734} {"train_loss": -6.072558879852295, "global_step": 72864, "epoch": 1734} {"train_loss": -6.130488395690918, "global_step": 72865, "epoch": 1734} {"train_loss": -5.844359397888184, "global_step": 72866, "epoch": 1734} {"train_loss": -6.126445770263672, "global_step": 72867, "epoch": 1734} {"train_loss": -6.015069484710693, "global_step": 72868, "epoch": 1734} {"train_loss": -6.059086879094441, "global_step": 72869, "epoch": 1734, "val_loss": 61634.93359375} {"train_loss": -6.211795806884766, "global_step": 72870, "epoch": 1735} {"train_loss": -6.061686992645264, "global_step": 72871, "epoch": 1735} {"train_loss": -6.018344402313232, "global_step": 72872, "epoch": 1735} {"train_loss": -6.0235114097595215, "global_step": 72873, "epoch": 1735} {"train_loss": -5.998656272888184, "global_step": 72874, "epoch": 1735} {"train_loss": -6.018367767333984, "global_step": 72875, "epoch": 1735} {"train_loss": -6.086051940917969, "global_step": 72876, "epoch": 1735} {"train_loss": -6.016408920288086, "global_step": 72877, "epoch": 1735} {"train_loss": -6.104216575622559, "global_step": 72878, "epoch": 1735} {"train_loss": -6.177060604095459, "global_step": 72879, "epoch": 1735} {"train_loss": -6.15401554107666, "global_step": 72880, "epoch": 1735} {"train_loss": -6.052149295806885, "global_step": 72881, "epoch": 1735} {"train_loss": -6.060301780700684, "global_step": 72882, "epoch": 1735} {"train_loss": -6.041665077209473, "global_step": 72883, "epoch": 1735} {"train_loss": -6.003876686096191, "global_step": 72884, "epoch": 1735} {"train_loss": -6.066586971282959, "global_step": 72885, "epoch": 1735} {"train_loss": -6.0928955078125, "global_step": 72886, "epoch": 1735} {"train_loss": -6.006050109863281, "global_step": 72887, "epoch": 1735} {"train_loss": -6.02614688873291, "global_step": 72888, "epoch": 1735} {"train_loss": -6.107529640197754, "global_step": 72889, "epoch": 1735} {"train_loss": -6.011932373046875, "global_step": 72890, "epoch": 1735} {"train_loss": -6.079965591430664, "global_step": 72891, "epoch": 1735} {"train_loss": -6.055440425872803, "global_step": 72892, "epoch": 1735} {"train_loss": -6.072079658508301, "global_step": 72893, "epoch": 1735} {"train_loss": -6.181222915649414, "global_step": 72894, "epoch": 1735} {"train_loss": -5.9332709312438965, "global_step": 72895, "epoch": 1735} {"train_loss": -6.0147600173950195, "global_step": 72896, "epoch": 1735} {"train_loss": -6.018701553344727, "global_step": 72897, "epoch": 1735} {"train_loss": -5.956596374511719, "global_step": 72898, "epoch": 1735} {"train_loss": -6.1890034675598145, "global_step": 72899, "epoch": 1735} {"train_loss": -6.030633926391602, "global_step": 72900, "epoch": 1735} {"train_loss": -5.9898834228515625, "global_step": 72901, "epoch": 1735} {"train_loss": -6.126468658447266, "global_step": 72902, "epoch": 1735} {"train_loss": -6.022953510284424, "global_step": 72903, "epoch": 1735} {"train_loss": -6.063304901123047, "global_step": 72904, "epoch": 1735} {"train_loss": -5.985020637512207, "global_step": 72905, "epoch": 1735} {"train_loss": -5.939194679260254, "global_step": 72906, "epoch": 1735} {"train_loss": -5.940479278564453, "global_step": 72907, "epoch": 1735} {"train_loss": -6.060924530029297, "global_step": 72908, "epoch": 1735} {"train_loss": -6.06319522857666, "global_step": 72909, "epoch": 1735} {"train_loss": -6.062355041503906, "global_step": 72910, "epoch": 1735} {"train_loss": -6.049876088187808, "global_step": 72911, "epoch": 1735, "val_loss": 61822.84375} {"train_loss": -6.002018928527832, "global_step": 72912, "epoch": 1736} {"train_loss": -6.163036346435547, "global_step": 72913, "epoch": 1736} {"train_loss": -6.039051055908203, "global_step": 72914, "epoch": 1736} {"train_loss": -5.974179744720459, "global_step": 72915, "epoch": 1736} {"train_loss": -5.957828998565674, "global_step": 72916, "epoch": 1736} {"train_loss": -6.232128143310547, "global_step": 72917, "epoch": 1736} {"train_loss": -5.941446304321289, "global_step": 72918, "epoch": 1736} {"train_loss": -6.077589988708496, "global_step": 72919, "epoch": 1736} {"train_loss": -5.924221515655518, "global_step": 72920, "epoch": 1736} {"train_loss": -5.927598476409912, "global_step": 72921, "epoch": 1736} {"train_loss": -5.982056617736816, "global_step": 72922, "epoch": 1736} {"train_loss": -5.978626728057861, "global_step": 72923, "epoch": 1736} {"train_loss": -5.97252082824707, "global_step": 72924, "epoch": 1736} {"train_loss": -6.00091028213501, "global_step": 72925, "epoch": 1736} {"train_loss": -5.959219932556152, "global_step": 72926, "epoch": 1736} {"train_loss": -6.069345474243164, "global_step": 72927, "epoch": 1736} {"train_loss": -5.991042613983154, "global_step": 72928, "epoch": 1736} {"train_loss": -6.0317840576171875, "global_step": 72929, "epoch": 1736} {"train_loss": -6.039820671081543, "global_step": 72930, "epoch": 1736} {"train_loss": -5.984748840332031, "global_step": 72931, "epoch": 1736} {"train_loss": -6.146405220031738, "global_step": 72932, "epoch": 1736} {"train_loss": -6.086861610412598, "global_step": 72933, "epoch": 1736} {"train_loss": -6.021289348602295, "global_step": 72934, "epoch": 1736} {"train_loss": -6.097359657287598, "global_step": 72935, "epoch": 1736} {"train_loss": -5.844661712646484, "global_step": 72936, "epoch": 1736} {"train_loss": -6.087604522705078, "global_step": 72937, "epoch": 1736} {"train_loss": -6.106735706329346, "global_step": 72938, "epoch": 1736} {"train_loss": -5.910250663757324, "global_step": 72939, "epoch": 1736} {"train_loss": -6.147966384887695, "global_step": 72940, "epoch": 1736} {"train_loss": -6.020511627197266, "global_step": 72941, "epoch": 1736} {"train_loss": -6.019114017486572, "global_step": 72942, "epoch": 1736} {"train_loss": -5.9801411628723145, "global_step": 72943, "epoch": 1736} {"train_loss": -6.022387504577637, "global_step": 72944, "epoch": 1736} {"train_loss": -6.132047653198242, "global_step": 72945, "epoch": 1736} {"train_loss": -5.95343017578125, "global_step": 72946, "epoch": 1736} {"train_loss": -5.969451427459717, "global_step": 72947, "epoch": 1736} {"train_loss": -6.091978073120117, "global_step": 72948, "epoch": 1736} {"train_loss": -5.989691734313965, "global_step": 72949, "epoch": 1736} {"train_loss": -5.93129825592041, "global_step": 72950, "epoch": 1736} {"train_loss": -6.0240678787231445, "global_step": 72951, "epoch": 1736} {"train_loss": -6.078196048736572, "global_step": 72952, "epoch": 1736} {"train_loss": -6.022720779691424, "global_step": 72953, "epoch": 1736, "val_loss": 61856.484375} {"train_loss": -6.075745105743408, "global_step": 72954, "epoch": 1737} {"train_loss": -5.9377288818359375, "global_step": 72955, "epoch": 1737} {"train_loss": -6.061837196350098, "global_step": 72956, "epoch": 1737} {"train_loss": -6.011180400848389, "global_step": 72957, "epoch": 1737} {"train_loss": -6.067157745361328, "global_step": 72958, "epoch": 1737} {"train_loss": -6.001850128173828, "global_step": 72959, "epoch": 1737} {"train_loss": -6.06488561630249, "global_step": 72960, "epoch": 1737} {"train_loss": -6.132768154144287, "global_step": 72961, "epoch": 1737} {"train_loss": -6.0871052742004395, "global_step": 72962, "epoch": 1737} {"train_loss": -6.053024768829346, "global_step": 72963, "epoch": 1737} {"train_loss": -6.022007465362549, "global_step": 72964, "epoch": 1737} {"train_loss": -6.068387985229492, "global_step": 72965, "epoch": 1737} {"train_loss": -6.053638935089111, "global_step": 72966, "epoch": 1737} {"train_loss": -6.067386150360107, "global_step": 72967, "epoch": 1737} {"train_loss": -6.06488561630249, "global_step": 72968, "epoch": 1737} {"train_loss": -5.971584320068359, "global_step": 72969, "epoch": 1737} {"train_loss": -6.137049674987793, "global_step": 72970, "epoch": 1737} {"train_loss": -6.0469865798950195, "global_step": 72971, "epoch": 1737} {"train_loss": -6.169241905212402, "global_step": 72972, "epoch": 1737} {"train_loss": -6.138909339904785, "global_step": 72973, "epoch": 1737} {"train_loss": -5.929123878479004, "global_step": 72974, "epoch": 1737} {"train_loss": -6.031017303466797, "global_step": 72975, "epoch": 1737} {"train_loss": -6.009304046630859, "global_step": 72976, "epoch": 1737} {"train_loss": -5.943696975708008, "global_step": 72977, "epoch": 1737} {"train_loss": -6.126248836517334, "global_step": 72978, "epoch": 1737} {"train_loss": -5.988268852233887, "global_step": 72979, "epoch": 1737} {"train_loss": -5.9749555587768555, "global_step": 72980, "epoch": 1737} {"train_loss": -6.091826438903809, "global_step": 72981, "epoch": 1737} {"train_loss": -5.9754486083984375, "global_step": 72982, "epoch": 1737} {"train_loss": -5.930790901184082, "global_step": 72983, "epoch": 1737} {"train_loss": -5.966416358947754, "global_step": 72984, "epoch": 1737} {"train_loss": -6.078058242797852, "global_step": 72985, "epoch": 1737} {"train_loss": -5.928759574890137, "global_step": 72986, "epoch": 1737} {"train_loss": -5.999126434326172, "global_step": 72987, "epoch": 1737} {"train_loss": -6.016953945159912, "global_step": 72988, "epoch": 1737} {"train_loss": -6.0216827392578125, "global_step": 72989, "epoch": 1737} {"train_loss": -6.131695747375488, "global_step": 72990, "epoch": 1737} {"train_loss": -6.017336845397949, "global_step": 72991, "epoch": 1737} {"train_loss": -6.108484268188477, "global_step": 72992, "epoch": 1737} {"train_loss": -6.020903587341309, "global_step": 72993, "epoch": 1737} {"train_loss": -6.050248146057129, "global_step": 72994, "epoch": 1737} {"train_loss": -6.03592418489002, "global_step": 72995, "epoch": 1737, "val_loss": 61810.47265625} {"train_loss": -6.03075647354126, "global_step": 72996, "epoch": 1738} {"train_loss": -6.121945381164551, "global_step": 72997, "epoch": 1738} {"train_loss": -6.067371368408203, "global_step": 72998, "epoch": 1738} {"train_loss": -6.067495346069336, "global_step": 72999, "epoch": 1738} {"train_loss": -6.130009651184082, "global_step": 73000, "epoch": 1738} {"train_loss": -6.057577133178711, "global_step": 73001, "epoch": 1738} {"train_loss": -6.008391857147217, "global_step": 73002, "epoch": 1738} {"train_loss": -6.0502238273620605, "global_step": 73003, "epoch": 1738} {"train_loss": -6.048209190368652, "global_step": 73004, "epoch": 1738} {"train_loss": -5.975405693054199, "global_step": 73005, "epoch": 1738} {"train_loss": -6.02626895904541, "global_step": 73006, "epoch": 1738} {"train_loss": -6.0543107986450195, "global_step": 73007, "epoch": 1738} {"train_loss": -6.0663228034973145, "global_step": 73008, "epoch": 1738} {"train_loss": -6.083611488342285, "global_step": 73009, "epoch": 1738} {"train_loss": -6.114246368408203, "global_step": 73010, "epoch": 1738} {"train_loss": -6.036357879638672, "global_step": 73011, "epoch": 1738} {"train_loss": -5.965083599090576, "global_step": 73012, "epoch": 1738} {"train_loss": -6.014841079711914, "global_step": 73013, "epoch": 1738} {"train_loss": -6.005131721496582, "global_step": 73014, "epoch": 1738} {"train_loss": -6.085594177246094, "global_step": 73015, "epoch": 1738} {"train_loss": -6.182519912719727, "global_step": 73016, "epoch": 1738} {"train_loss": -6.17468786239624, "global_step": 73017, "epoch": 1738} {"train_loss": -6.019439697265625, "global_step": 73018, "epoch": 1738} {"train_loss": -6.035224914550781, "global_step": 73019, "epoch": 1738} {"train_loss": -6.103575706481934, "global_step": 73020, "epoch": 1738} {"train_loss": -5.989254951477051, "global_step": 73021, "epoch": 1738} {"train_loss": -5.928381443023682, "global_step": 73022, "epoch": 1738} {"train_loss": -6.064549446105957, "global_step": 73023, "epoch": 1738} {"train_loss": -5.987793922424316, "global_step": 73024, "epoch": 1738} {"train_loss": -6.122350692749023, "global_step": 73025, "epoch": 1738} {"train_loss": -6.04917049407959, "global_step": 73026, "epoch": 1738} {"train_loss": -5.963930130004883, "global_step": 73027, "epoch": 1738} {"train_loss": -6.035473823547363, "global_step": 73028, "epoch": 1738} {"train_loss": -5.980321884155273, "global_step": 73029, "epoch": 1738} {"train_loss": -6.153319835662842, "global_step": 73030, "epoch": 1738} {"train_loss": -5.937410354614258, "global_step": 73031, "epoch": 1738} {"train_loss": -6.075992107391357, "global_step": 73032, "epoch": 1738} {"train_loss": -6.058921813964844, "global_step": 73033, "epoch": 1738} {"train_loss": -5.971560001373291, "global_step": 73034, "epoch": 1738} {"train_loss": -6.113516807556152, "global_step": 73035, "epoch": 1738} {"train_loss": -6.061409950256348, "global_step": 73036, "epoch": 1738} {"train_loss": -6.0481029238019675, "global_step": 73037, "epoch": 1738, "val_loss": 62106.93359375} {"train_loss": -6.058571815490723, "global_step": 73038, "epoch": 1739} {"train_loss": -5.977104663848877, "global_step": 73039, "epoch": 1739} {"train_loss": -6.176248073577881, "global_step": 73040, "epoch": 1739} {"train_loss": -5.925030708312988, "global_step": 73041, "epoch": 1739} {"train_loss": -6.093170166015625, "global_step": 73042, "epoch": 1739} {"train_loss": -5.997406959533691, "global_step": 73043, "epoch": 1739} {"train_loss": -5.977569580078125, "global_step": 73044, "epoch": 1739} {"train_loss": -6.208089828491211, "global_step": 73045, "epoch": 1739} {"train_loss": -6.064990997314453, "global_step": 73046, "epoch": 1739} {"train_loss": -6.100103378295898, "global_step": 73047, "epoch": 1739} {"train_loss": -6.099664688110352, "global_step": 73048, "epoch": 1739} {"train_loss": -6.015957832336426, "global_step": 73049, "epoch": 1739} {"train_loss": -6.027231216430664, "global_step": 73050, "epoch": 1739} {"train_loss": -5.984757423400879, "global_step": 73051, "epoch": 1739} {"train_loss": -6.0069780349731445, "global_step": 73052, "epoch": 1739} {"train_loss": -6.001532554626465, "global_step": 73053, "epoch": 1739} {"train_loss": -6.134672164916992, "global_step": 73054, "epoch": 1739} {"train_loss": -6.029314041137695, "global_step": 73055, "epoch": 1739} {"train_loss": -6.047009468078613, "global_step": 73056, "epoch": 1739} {"train_loss": -6.020663261413574, "global_step": 73057, "epoch": 1739} {"train_loss": -6.084290504455566, "global_step": 73058, "epoch": 1739} {"train_loss": -6.038424491882324, "global_step": 73059, "epoch": 1739} {"train_loss": -6.144845962524414, "global_step": 73060, "epoch": 1739} {"train_loss": -6.100793838500977, "global_step": 73061, "epoch": 1739} {"train_loss": -6.064209461212158, "global_step": 73062, "epoch": 1739} {"train_loss": -6.107381820678711, "global_step": 73063, "epoch": 1739} {"train_loss": -6.006991863250732, "global_step": 73064, "epoch": 1739} {"train_loss": -6.08629035949707, "global_step": 73065, "epoch": 1739} {"train_loss": -6.055210113525391, "global_step": 73066, "epoch": 1739} {"train_loss": -6.140283584594727, "global_step": 73067, "epoch": 1739} {"train_loss": -6.1864519119262695, "global_step": 73068, "epoch": 1739} {"train_loss": -6.058425426483154, "global_step": 73069, "epoch": 1739} {"train_loss": -6.032461643218994, "global_step": 73070, "epoch": 1739} {"train_loss": -6.050228118896484, "global_step": 73071, "epoch": 1739} {"train_loss": -6.003944396972656, "global_step": 73072, "epoch": 1739} {"train_loss": -6.092453479766846, "global_step": 73073, "epoch": 1739} {"train_loss": -6.023036479949951, "global_step": 73074, "epoch": 1739} {"train_loss": -6.095097541809082, "global_step": 73075, "epoch": 1739} {"train_loss": -6.15731143951416, "global_step": 73076, "epoch": 1739} {"train_loss": -6.05648946762085, "global_step": 73077, "epoch": 1739} {"train_loss": -6.135848045349121, "global_step": 73078, "epoch": 1739} {"train_loss": -6.067343530200777, "global_step": 73079, "epoch": 1739, "val_loss": 61930.453125} {"train_loss": -6.100894927978516, "global_step": 73080, "epoch": 1740} {"train_loss": -6.007037162780762, "global_step": 73081, "epoch": 1740} {"train_loss": -6.186673164367676, "global_step": 73082, "epoch": 1740} {"train_loss": -5.970461845397949, "global_step": 73083, "epoch": 1740} {"train_loss": -6.090609550476074, "global_step": 73084, "epoch": 1740} {"train_loss": -6.105597496032715, "global_step": 73085, "epoch": 1740} {"train_loss": -6.070468902587891, "global_step": 73086, "epoch": 1740} {"train_loss": -6.1220502853393555, "global_step": 73087, "epoch": 1740} {"train_loss": -6.177974224090576, "global_step": 73088, "epoch": 1740} {"train_loss": -6.142370223999023, "global_step": 73089, "epoch": 1740} {"train_loss": -6.147063255310059, "global_step": 73090, "epoch": 1740} {"train_loss": -6.114630699157715, "global_step": 73091, "epoch": 1740} {"train_loss": -6.168926239013672, "global_step": 73092, "epoch": 1740} {"train_loss": -5.994582653045654, "global_step": 73093, "epoch": 1740} {"train_loss": -6.097596168518066, "global_step": 73094, "epoch": 1740} {"train_loss": -6.151045799255371, "global_step": 73095, "epoch": 1740} {"train_loss": -6.149319648742676, "global_step": 73096, "epoch": 1740} {"train_loss": -5.976785659790039, "global_step": 73097, "epoch": 1740} {"train_loss": -6.054418563842773, "global_step": 73098, "epoch": 1740} {"train_loss": -5.964883804321289, "global_step": 73099, "epoch": 1740} {"train_loss": -5.871164321899414, "global_step": 73100, "epoch": 1740} {"train_loss": -6.1492204666137695, "global_step": 73101, "epoch": 1740} {"train_loss": -6.012537956237793, "global_step": 73102, "epoch": 1740} {"train_loss": -6.038698196411133, "global_step": 73103, "epoch": 1740} {"train_loss": -6.257988929748535, "global_step": 73104, "epoch": 1740} {"train_loss": -5.935791015625, "global_step": 73105, "epoch": 1740} {"train_loss": -6.037830352783203, "global_step": 73106, "epoch": 1740} {"train_loss": -6.05855655670166, "global_step": 73107, "epoch": 1740} {"train_loss": -6.062619209289551, "global_step": 73108, "epoch": 1740} {"train_loss": -6.032029151916504, "global_step": 73109, "epoch": 1740} {"train_loss": -6.014677047729492, "global_step": 73110, "epoch": 1740} {"train_loss": -6.130680561065674, "global_step": 73111, "epoch": 1740} {"train_loss": -6.097630500793457, "global_step": 73112, "epoch": 1740} {"train_loss": -6.112730979919434, "global_step": 73113, "epoch": 1740} {"train_loss": -6.012306213378906, "global_step": 73114, "epoch": 1740} {"train_loss": -6.076181888580322, "global_step": 73115, "epoch": 1740} {"train_loss": -6.0786662101745605, "global_step": 73116, "epoch": 1740} {"train_loss": -6.065511703491211, "global_step": 73117, "epoch": 1740} {"train_loss": -6.055264472961426, "global_step": 73118, "epoch": 1740} {"train_loss": -6.016849517822266, "global_step": 73119, "epoch": 1740} {"train_loss": -6.127956390380859, "global_step": 73120, "epoch": 1740} {"train_loss": -6.071311031069074, "global_step": 73121, "epoch": 1740, "val_loss": 61867.33203125} {"train_loss": -6.175622940063477, "global_step": 73122, "epoch": 1741} {"train_loss": -6.096771240234375, "global_step": 73123, "epoch": 1741} {"train_loss": -6.145602703094482, "global_step": 73124, "epoch": 1741} {"train_loss": -6.171669006347656, "global_step": 73125, "epoch": 1741} {"train_loss": -6.014030933380127, "global_step": 73126, "epoch": 1741} {"train_loss": -6.118409156799316, "global_step": 73127, "epoch": 1741} {"train_loss": -5.988746643066406, "global_step": 73128, "epoch": 1741} {"train_loss": -5.988748550415039, "global_step": 73129, "epoch": 1741} {"train_loss": -6.0240254402160645, "global_step": 73130, "epoch": 1741} {"train_loss": -6.135558605194092, "global_step": 73131, "epoch": 1741} {"train_loss": -6.15836238861084, "global_step": 73132, "epoch": 1741} {"train_loss": -6.049623966217041, "global_step": 73133, "epoch": 1741} {"train_loss": -6.0934014320373535, "global_step": 73134, "epoch": 1741} {"train_loss": -6.044802188873291, "global_step": 73135, "epoch": 1741} {"train_loss": -6.133330345153809, "global_step": 73136, "epoch": 1741} {"train_loss": -6.1399736404418945, "global_step": 73137, "epoch": 1741} {"train_loss": -6.001654148101807, "global_step": 73138, "epoch": 1741} {"train_loss": -6.182189464569092, "global_step": 73139, "epoch": 1741} {"train_loss": -6.1598801612854, "global_step": 73140, "epoch": 1741} {"train_loss": -5.9944915771484375, "global_step": 73141, "epoch": 1741} {"train_loss": -5.986797332763672, "global_step": 73142, "epoch": 1741} {"train_loss": -6.039732933044434, "global_step": 73143, "epoch": 1741} {"train_loss": -6.041782379150391, "global_step": 73144, "epoch": 1741} {"train_loss": -5.997537612915039, "global_step": 73145, "epoch": 1741} {"train_loss": -6.076403617858887, "global_step": 73146, "epoch": 1741} {"train_loss": -6.014408111572266, "global_step": 73147, "epoch": 1741} {"train_loss": -6.094577789306641, "global_step": 73148, "epoch": 1741} {"train_loss": -6.078658580780029, "global_step": 73149, "epoch": 1741} {"train_loss": -6.065422534942627, "global_step": 73150, "epoch": 1741} {"train_loss": -6.053391456604004, "global_step": 73151, "epoch": 1741} {"train_loss": -5.96662712097168, "global_step": 73152, "epoch": 1741} {"train_loss": -6.02194881439209, "global_step": 73153, "epoch": 1741} {"train_loss": -6.069059371948242, "global_step": 73154, "epoch": 1741} {"train_loss": -6.114615440368652, "global_step": 73155, "epoch": 1741} {"train_loss": -6.028990745544434, "global_step": 73156, "epoch": 1741} {"train_loss": -6.077643394470215, "global_step": 73157, "epoch": 1741} {"train_loss": -6.065134048461914, "global_step": 73158, "epoch": 1741} {"train_loss": -5.889681816101074, "global_step": 73159, "epoch": 1741} {"train_loss": -6.061540603637695, "global_step": 73160, "epoch": 1741} {"train_loss": -6.014514923095703, "global_step": 73161, "epoch": 1741} {"train_loss": -5.997133255004883, "global_step": 73162, "epoch": 1741} {"train_loss": -6.062474682217553, "global_step": 73163, "epoch": 1741, "val_loss": 61807.359375} {"train_loss": -6.0279436111450195, "global_step": 73164, "epoch": 1742} {"train_loss": -6.04673433303833, "global_step": 73165, "epoch": 1742} {"train_loss": -6.085447311401367, "global_step": 73166, "epoch": 1742} {"train_loss": -6.159912109375, "global_step": 73167, "epoch": 1742} {"train_loss": -6.0229291915893555, "global_step": 73168, "epoch": 1742} {"train_loss": -6.033060550689697, "global_step": 73169, "epoch": 1742} {"train_loss": -6.042003631591797, "global_step": 73170, "epoch": 1742} {"train_loss": -6.020610809326172, "global_step": 73171, "epoch": 1742} {"train_loss": -6.029501914978027, "global_step": 73172, "epoch": 1742} {"train_loss": -5.995019435882568, "global_step": 73173, "epoch": 1742} {"train_loss": -6.034011363983154, "global_step": 73174, "epoch": 1742} {"train_loss": -6.132227897644043, "global_step": 73175, "epoch": 1742} {"train_loss": -5.959242820739746, "global_step": 73176, "epoch": 1742} {"train_loss": -6.08621883392334, "global_step": 73177, "epoch": 1742} {"train_loss": -6.0358171463012695, "global_step": 73178, "epoch": 1742} {"train_loss": -6.001781463623047, "global_step": 73179, "epoch": 1742} {"train_loss": -6.038365364074707, "global_step": 73180, "epoch": 1742} {"train_loss": -6.144965171813965, "global_step": 73181, "epoch": 1742} {"train_loss": -5.9700469970703125, "global_step": 73182, "epoch": 1742} {"train_loss": -6.090877532958984, "global_step": 73183, "epoch": 1742} {"train_loss": -6.023027420043945, "global_step": 73184, "epoch": 1742} {"train_loss": -5.993988990783691, "global_step": 73185, "epoch": 1742} {"train_loss": -6.053351402282715, "global_step": 73186, "epoch": 1742} {"train_loss": -6.0880913734436035, "global_step": 73187, "epoch": 1742} {"train_loss": -6.076115131378174, "global_step": 73188, "epoch": 1742} {"train_loss": -6.039454460144043, "global_step": 73189, "epoch": 1742} {"train_loss": -5.989762306213379, "global_step": 73190, "epoch": 1742} {"train_loss": -6.001708507537842, "global_step": 73191, "epoch": 1742} {"train_loss": -6.051325798034668, "global_step": 73192, "epoch": 1742} {"train_loss": -6.107151985168457, "global_step": 73193, "epoch": 1742} {"train_loss": -5.859569549560547, "global_step": 73194, "epoch": 1742} {"train_loss": -6.135079383850098, "global_step": 73195, "epoch": 1742} {"train_loss": -5.997426986694336, "global_step": 73196, "epoch": 1742} {"train_loss": -6.068387031555176, "global_step": 73197, "epoch": 1742} {"train_loss": -6.160569190979004, "global_step": 73198, "epoch": 1742} {"train_loss": -6.078805923461914, "global_step": 73199, "epoch": 1742} {"train_loss": -6.07380485534668, "global_step": 73200, "epoch": 1742} {"train_loss": -6.058974266052246, "global_step": 73201, "epoch": 1742} {"train_loss": -5.9870405197143555, "global_step": 73202, "epoch": 1742} {"train_loss": -6.104794502258301, "global_step": 73203, "epoch": 1742} {"train_loss": -6.013629913330078, "global_step": 73204, "epoch": 1742} {"train_loss": -6.044717062087286, "global_step": 73205, "epoch": 1742, "val_loss": 61810.14453125} {"train_loss": -6.016409397125244, "global_step": 73206, "epoch": 1743} {"train_loss": -6.215723037719727, "global_step": 73207, "epoch": 1743} {"train_loss": -6.064046859741211, "global_step": 73208, "epoch": 1743} {"train_loss": -6.040194034576416, "global_step": 73209, "epoch": 1743} {"train_loss": -6.152433395385742, "global_step": 73210, "epoch": 1743} {"train_loss": -6.1144819259643555, "global_step": 73211, "epoch": 1743} {"train_loss": -6.112095832824707, "global_step": 73212, "epoch": 1743} {"train_loss": -6.184342861175537, "global_step": 73213, "epoch": 1743} {"train_loss": -6.248845100402832, "global_step": 73214, "epoch": 1743} {"train_loss": -6.099479675292969, "global_step": 73215, "epoch": 1743} {"train_loss": -6.095619201660156, "global_step": 73216, "epoch": 1743} {"train_loss": -5.964626789093018, "global_step": 73217, "epoch": 1743} {"train_loss": -6.085445404052734, "global_step": 73218, "epoch": 1743} {"train_loss": -6.047222137451172, "global_step": 73219, "epoch": 1743} {"train_loss": -5.973028182983398, "global_step": 73220, "epoch": 1743} {"train_loss": -6.061530113220215, "global_step": 73221, "epoch": 1743} {"train_loss": -6.108369827270508, "global_step": 73222, "epoch": 1743} {"train_loss": -5.956721305847168, "global_step": 73223, "epoch": 1743} {"train_loss": -5.929844856262207, "global_step": 73224, "epoch": 1743} {"train_loss": -5.9066362380981445, "global_step": 73225, "epoch": 1743} {"train_loss": -5.887200832366943, "global_step": 73226, "epoch": 1743} {"train_loss": -6.056882858276367, "global_step": 73227, "epoch": 1743} {"train_loss": -5.960984230041504, "global_step": 73228, "epoch": 1743} {"train_loss": -5.8895978927612305, "global_step": 73229, "epoch": 1743} {"train_loss": -5.93380069732666, "global_step": 73230, "epoch": 1743} {"train_loss": -5.838492393493652, "global_step": 73231, "epoch": 1743} {"train_loss": -5.980198383331299, "global_step": 73232, "epoch": 1743} {"train_loss": -6.020388603210449, "global_step": 73233, "epoch": 1743} {"train_loss": -5.986759185791016, "global_step": 73234, "epoch": 1743} {"train_loss": -5.986739635467529, "global_step": 73235, "epoch": 1743} {"train_loss": -6.000546455383301, "global_step": 73236, "epoch": 1743} {"train_loss": -6.050045013427734, "global_step": 73237, "epoch": 1743} {"train_loss": -5.911413669586182, "global_step": 73238, "epoch": 1743} {"train_loss": -6.014986991882324, "global_step": 73239, "epoch": 1743} {"train_loss": -5.8980631828308105, "global_step": 73240, "epoch": 1743} {"train_loss": -6.132205963134766, "global_step": 73241, "epoch": 1743} {"train_loss": -5.9136881828308105, "global_step": 73242, "epoch": 1743} {"train_loss": -6.001879692077637, "global_step": 73243, "epoch": 1743} {"train_loss": -6.071083068847656, "global_step": 73244, "epoch": 1743} {"train_loss": -5.942309379577637, "global_step": 73245, "epoch": 1743} {"train_loss": -6.009111404418945, "global_step": 73246, "epoch": 1743} {"train_loss": -6.021360465458462, "global_step": 73247, "epoch": 1743, "val_loss": 61692.41796875} {"train_loss": -5.926701545715332, "global_step": 73248, "epoch": 1744} {"train_loss": -6.046825408935547, "global_step": 73249, "epoch": 1744} {"train_loss": -5.918884754180908, "global_step": 73250, "epoch": 1744} {"train_loss": -6.124729156494141, "global_step": 73251, "epoch": 1744} {"train_loss": -6.175022125244141, "global_step": 73252, "epoch": 1744} {"train_loss": -5.954854965209961, "global_step": 73253, "epoch": 1744} {"train_loss": -6.045194625854492, "global_step": 73254, "epoch": 1744} {"train_loss": -5.762537956237793, "global_step": 73255, "epoch": 1744} {"train_loss": -6.086670875549316, "global_step": 73256, "epoch": 1744} {"train_loss": -5.980902671813965, "global_step": 73257, "epoch": 1744} {"train_loss": -6.125735282897949, "global_step": 73258, "epoch": 1744} {"train_loss": -6.185267448425293, "global_step": 73259, "epoch": 1744} {"train_loss": -6.018214702606201, "global_step": 73260, "epoch": 1744} {"train_loss": -6.177302360534668, "global_step": 73261, "epoch": 1744} {"train_loss": -6.266611576080322, "global_step": 73262, "epoch": 1744} {"train_loss": -6.000245571136475, "global_step": 73263, "epoch": 1744} {"train_loss": -6.079154968261719, "global_step": 73264, "epoch": 1744} {"train_loss": -6.0132927894592285, "global_step": 73265, "epoch": 1744} {"train_loss": -6.118076324462891, "global_step": 73266, "epoch": 1744} {"train_loss": -6.057146072387695, "global_step": 73267, "epoch": 1744} {"train_loss": -5.97313928604126, "global_step": 73268, "epoch": 1744} {"train_loss": -6.076204299926758, "global_step": 73269, "epoch": 1744} {"train_loss": -6.0183563232421875, "global_step": 73270, "epoch": 1744} {"train_loss": -6.080071449279785, "global_step": 73271, "epoch": 1744} {"train_loss": -6.093544006347656, "global_step": 73272, "epoch": 1744} {"train_loss": -6.105673789978027, "global_step": 73273, "epoch": 1744} {"train_loss": -6.050136089324951, "global_step": 73274, "epoch": 1744} {"train_loss": -6.015271186828613, "global_step": 73275, "epoch": 1744} {"train_loss": -6.003961563110352, "global_step": 73276, "epoch": 1744} {"train_loss": -6.202250957489014, "global_step": 73277, "epoch": 1744} {"train_loss": -6.089703559875488, "global_step": 73278, "epoch": 1744} {"train_loss": -6.007411956787109, "global_step": 73279, "epoch": 1744} {"train_loss": -6.155292987823486, "global_step": 73280, "epoch": 1744} {"train_loss": -5.9737043380737305, "global_step": 73281, "epoch": 1744} {"train_loss": -6.083870887756348, "global_step": 73282, "epoch": 1744} {"train_loss": -5.992743968963623, "global_step": 73283, "epoch": 1744} {"train_loss": -5.926214218139648, "global_step": 73284, "epoch": 1744} {"train_loss": -6.077520847320557, "global_step": 73285, "epoch": 1744} {"train_loss": -5.900328636169434, "global_step": 73286, "epoch": 1744} {"train_loss": -5.975492477416992, "global_step": 73287, "epoch": 1744} {"train_loss": -6.027786731719971, "global_step": 73288, "epoch": 1744} {"train_loss": -6.043300310770671, "global_step": 73289, "epoch": 1744, "val_loss": 62016.8203125} {"train_loss": -5.978271007537842, "global_step": 73290, "epoch": 1745} {"train_loss": -5.951855659484863, "global_step": 73291, "epoch": 1745} {"train_loss": -6.0921735763549805, "global_step": 73292, "epoch": 1745} {"train_loss": -6.073864459991455, "global_step": 73293, "epoch": 1745} {"train_loss": -6.126626014709473, "global_step": 73294, "epoch": 1745} {"train_loss": -5.987624168395996, "global_step": 73295, "epoch": 1745} {"train_loss": -6.103835582733154, "global_step": 73296, "epoch": 1745} {"train_loss": -5.882406234741211, "global_step": 73297, "epoch": 1745} {"train_loss": -5.971347808837891, "global_step": 73298, "epoch": 1745} {"train_loss": -6.091922760009766, "global_step": 73299, "epoch": 1745} {"train_loss": -6.056366443634033, "global_step": 73300, "epoch": 1745} {"train_loss": -6.057585716247559, "global_step": 73301, "epoch": 1745} {"train_loss": -6.028609752655029, "global_step": 73302, "epoch": 1745} {"train_loss": -6.058001518249512, "global_step": 73303, "epoch": 1745} {"train_loss": -5.918489456176758, "global_step": 73304, "epoch": 1745} {"train_loss": -6.170631408691406, "global_step": 73305, "epoch": 1745} {"train_loss": -6.0312418937683105, "global_step": 73306, "epoch": 1745} {"train_loss": -6.134922981262207, "global_step": 73307, "epoch": 1745} {"train_loss": -6.064993858337402, "global_step": 73308, "epoch": 1745} {"train_loss": -6.100130081176758, "global_step": 73309, "epoch": 1745} {"train_loss": -6.10301399230957, "global_step": 73310, "epoch": 1745} {"train_loss": -6.002239227294922, "global_step": 73311, "epoch": 1745} {"train_loss": -6.10223388671875, "global_step": 73312, "epoch": 1745} {"train_loss": -6.039427280426025, "global_step": 73313, "epoch": 1745} {"train_loss": -6.032867908477783, "global_step": 73314, "epoch": 1745} {"train_loss": -6.053203582763672, "global_step": 73315, "epoch": 1745} {"train_loss": -5.943029880523682, "global_step": 73316, "epoch": 1745} {"train_loss": -5.9342498779296875, "global_step": 73317, "epoch": 1745} {"train_loss": -6.091108798980713, "global_step": 73318, "epoch": 1745} {"train_loss": -6.078342437744141, "global_step": 73319, "epoch": 1745} {"train_loss": -6.073775291442871, "global_step": 73320, "epoch": 1745} {"train_loss": -6.002727508544922, "global_step": 73321, "epoch": 1745} {"train_loss": -6.012890338897705, "global_step": 73322, "epoch": 1745} {"train_loss": -6.017215728759766, "global_step": 73323, "epoch": 1745} {"train_loss": -6.013798236846924, "global_step": 73324, "epoch": 1745} {"train_loss": -6.034991264343262, "global_step": 73325, "epoch": 1745} {"train_loss": -6.120151519775391, "global_step": 73326, "epoch": 1745} {"train_loss": -6.102385520935059, "global_step": 73327, "epoch": 1745} {"train_loss": -5.908048629760742, "global_step": 73328, "epoch": 1745} {"train_loss": -6.087663650512695, "global_step": 73329, "epoch": 1745} {"train_loss": -6.033453941345215, "global_step": 73330, "epoch": 1745} {"train_loss": -6.041040477298555, "global_step": 73331, "epoch": 1745, "val_loss": 61833.5546875} {"train_loss": -6.111904621124268, "global_step": 73332, "epoch": 1746} {"train_loss": -6.124026298522949, "global_step": 73333, "epoch": 1746} {"train_loss": -6.085822105407715, "global_step": 73334, "epoch": 1746} {"train_loss": -6.06986141204834, "global_step": 73335, "epoch": 1746} {"train_loss": -6.033524513244629, "global_step": 73336, "epoch": 1746} {"train_loss": -6.038386344909668, "global_step": 73337, "epoch": 1746} {"train_loss": -6.042809963226318, "global_step": 73338, "epoch": 1746} {"train_loss": -6.201445579528809, "global_step": 73339, "epoch": 1746} {"train_loss": -5.981461524963379, "global_step": 73340, "epoch": 1746} {"train_loss": -6.146955966949463, "global_step": 73341, "epoch": 1746} {"train_loss": -6.1455888748168945, "global_step": 73342, "epoch": 1746} {"train_loss": -5.9919891357421875, "global_step": 73343, "epoch": 1746} {"train_loss": -6.193724632263184, "global_step": 73344, "epoch": 1746} {"train_loss": -5.950161457061768, "global_step": 73345, "epoch": 1746} {"train_loss": -6.0057783126831055, "global_step": 73346, "epoch": 1746} {"train_loss": -6.126230239868164, "global_step": 73347, "epoch": 1746} {"train_loss": -5.934657096862793, "global_step": 73348, "epoch": 1746} {"train_loss": -6.072486877441406, "global_step": 73349, "epoch": 1746} {"train_loss": -6.016561508178711, "global_step": 73350, "epoch": 1746} {"train_loss": -6.038807392120361, "global_step": 73351, "epoch": 1746} {"train_loss": -5.952740669250488, "global_step": 73352, "epoch": 1746} {"train_loss": -5.918066501617432, "global_step": 73353, "epoch": 1746} {"train_loss": -6.022416114807129, "global_step": 73354, "epoch": 1746} {"train_loss": -5.895469665527344, "global_step": 73355, "epoch": 1746} {"train_loss": -6.189314842224121, "global_step": 73356, "epoch": 1746} {"train_loss": -6.0801591873168945, "global_step": 73357, "epoch": 1746} {"train_loss": -6.001446723937988, "global_step": 73358, "epoch": 1746} {"train_loss": -6.208369255065918, "global_step": 73359, "epoch": 1746} {"train_loss": -6.004948616027832, "global_step": 73360, "epoch": 1746} {"train_loss": -6.005767822265625, "global_step": 73361, "epoch": 1746} {"train_loss": -6.09074592590332, "global_step": 73362, "epoch": 1746} {"train_loss": -6.1145548820495605, "global_step": 73363, "epoch": 1746} {"train_loss": -5.941462516784668, "global_step": 73364, "epoch": 1746} {"train_loss": -6.062407970428467, "global_step": 73365, "epoch": 1746} {"train_loss": -6.089566230773926, "global_step": 73366, "epoch": 1746} {"train_loss": -6.142281532287598, "global_step": 73367, "epoch": 1746} {"train_loss": -5.996010780334473, "global_step": 73368, "epoch": 1746} {"train_loss": -6.0503950119018555, "global_step": 73369, "epoch": 1746} {"train_loss": -6.01824951171875, "global_step": 73370, "epoch": 1746} {"train_loss": -5.965415000915527, "global_step": 73371, "epoch": 1746} {"train_loss": -6.146260738372803, "global_step": 73372, "epoch": 1746} {"train_loss": -6.05377889814831, "global_step": 73373, "epoch": 1746, "val_loss": 61739.75} {"train_loss": -6.048205375671387, "global_step": 73374, "epoch": 1747} {"train_loss": -6.02780818939209, "global_step": 73375, "epoch": 1747} {"train_loss": -6.043173789978027, "global_step": 73376, "epoch": 1747} {"train_loss": -6.1172776222229, "global_step": 73377, "epoch": 1747} {"train_loss": -5.97242546081543, "global_step": 73378, "epoch": 1747} {"train_loss": -6.070900917053223, "global_step": 73379, "epoch": 1747} {"train_loss": -5.962041854858398, "global_step": 73380, "epoch": 1747} {"train_loss": -6.100811958312988, "global_step": 73381, "epoch": 1747} {"train_loss": -6.072416305541992, "global_step": 73382, "epoch": 1747} {"train_loss": -5.952220916748047, "global_step": 73383, "epoch": 1747} {"train_loss": -6.064434051513672, "global_step": 73384, "epoch": 1747} {"train_loss": -6.12218713760376, "global_step": 73385, "epoch": 1747} {"train_loss": -6.046040058135986, "global_step": 73386, "epoch": 1747} {"train_loss": -6.034514427185059, "global_step": 73387, "epoch": 1747} {"train_loss": -5.989120006561279, "global_step": 73388, "epoch": 1747} {"train_loss": -6.092746257781982, "global_step": 73389, "epoch": 1747} {"train_loss": -6.087970733642578, "global_step": 73390, "epoch": 1747} {"train_loss": -5.978171348571777, "global_step": 73391, "epoch": 1747} {"train_loss": -6.1322808265686035, "global_step": 73392, "epoch": 1747} {"train_loss": -6.119814872741699, "global_step": 73393, "epoch": 1747} {"train_loss": -6.189918518066406, "global_step": 73394, "epoch": 1747} {"train_loss": -6.094690322875977, "global_step": 73395, "epoch": 1747} {"train_loss": -6.0549774169921875, "global_step": 73396, "epoch": 1747} {"train_loss": -6.074421405792236, "global_step": 73397, "epoch": 1747} {"train_loss": -6.084847450256348, "global_step": 73398, "epoch": 1747} {"train_loss": -6.081151008605957, "global_step": 73399, "epoch": 1747} {"train_loss": -6.068015098571777, "global_step": 73400, "epoch": 1747} {"train_loss": -6.057962417602539, "global_step": 73401, "epoch": 1747} {"train_loss": -6.0609893798828125, "global_step": 73402, "epoch": 1747} {"train_loss": -6.046776294708252, "global_step": 73403, "epoch": 1747} {"train_loss": -6.048576831817627, "global_step": 73404, "epoch": 1747} {"train_loss": -6.159486293792725, "global_step": 73405, "epoch": 1747} {"train_loss": -6.211115837097168, "global_step": 73406, "epoch": 1747} {"train_loss": -6.034902572631836, "global_step": 73407, "epoch": 1747} {"train_loss": -6.1261887550354, "global_step": 73408, "epoch": 1747} {"train_loss": -6.223020553588867, "global_step": 73409, "epoch": 1747} {"train_loss": -6.023877143859863, "global_step": 73410, "epoch": 1747} {"train_loss": -6.130360126495361, "global_step": 73411, "epoch": 1747} {"train_loss": -5.978303909301758, "global_step": 73412, "epoch": 1747} {"train_loss": -6.085814476013184, "global_step": 73413, "epoch": 1747} {"train_loss": -6.116072177886963, "global_step": 73414, "epoch": 1747} {"train_loss": -6.073888835452852, "global_step": 73415, "epoch": 1747, "val_loss": 61893.4453125} {"train_loss": -5.987591743469238, "global_step": 73416, "epoch": 1748} {"train_loss": -6.03154182434082, "global_step": 73417, "epoch": 1748} {"train_loss": -5.995842456817627, "global_step": 73418, "epoch": 1748} {"train_loss": -6.0413665771484375, "global_step": 73419, "epoch": 1748} {"train_loss": -6.096747875213623, "global_step": 73420, "epoch": 1748} {"train_loss": -5.994972229003906, "global_step": 73421, "epoch": 1748} {"train_loss": -6.188173770904541, "global_step": 73422, "epoch": 1748} {"train_loss": -5.999870300292969, "global_step": 73423, "epoch": 1748} {"train_loss": -6.055485725402832, "global_step": 73424, "epoch": 1748} {"train_loss": -6.0985565185546875, "global_step": 73425, "epoch": 1748} {"train_loss": -6.062559127807617, "global_step": 73426, "epoch": 1748} {"train_loss": -6.041540145874023, "global_step": 73427, "epoch": 1748} {"train_loss": -6.0876312255859375, "global_step": 73428, "epoch": 1748} {"train_loss": -6.160894393920898, "global_step": 73429, "epoch": 1748} {"train_loss": -6.245810031890869, "global_step": 73430, "epoch": 1748} {"train_loss": -6.263186454772949, "global_step": 73431, "epoch": 1748} {"train_loss": -6.015530586242676, "global_step": 73432, "epoch": 1748} {"train_loss": -6.203004360198975, "global_step": 73433, "epoch": 1748} {"train_loss": -6.2421746253967285, "global_step": 73434, "epoch": 1748} {"train_loss": -6.1315765380859375, "global_step": 73435, "epoch": 1748} {"train_loss": -6.009746551513672, "global_step": 73436, "epoch": 1748} {"train_loss": -6.092580795288086, "global_step": 73437, "epoch": 1748} {"train_loss": -5.997737884521484, "global_step": 73438, "epoch": 1748} {"train_loss": -6.109068870544434, "global_step": 73439, "epoch": 1748} {"train_loss": -6.022342205047607, "global_step": 73440, "epoch": 1748} {"train_loss": -6.156191825866699, "global_step": 73441, "epoch": 1748} {"train_loss": -6.1339826583862305, "global_step": 73442, "epoch": 1748} {"train_loss": -5.941307067871094, "global_step": 73443, "epoch": 1748} {"train_loss": -6.053955078125, "global_step": 73444, "epoch": 1748} {"train_loss": -6.113249778747559, "global_step": 73445, "epoch": 1748} {"train_loss": -5.988883018493652, "global_step": 73446, "epoch": 1748} {"train_loss": -6.026961326599121, "global_step": 73447, "epoch": 1748} {"train_loss": -5.998007774353027, "global_step": 73448, "epoch": 1748} {"train_loss": -6.04215145111084, "global_step": 73449, "epoch": 1748} {"train_loss": -6.069767951965332, "global_step": 73450, "epoch": 1748} {"train_loss": -6.074641227722168, "global_step": 73451, "epoch": 1748} {"train_loss": -6.117891311645508, "global_step": 73452, "epoch": 1748} {"train_loss": -6.142451763153076, "global_step": 73453, "epoch": 1748} {"train_loss": -5.960172653198242, "global_step": 73454, "epoch": 1748} {"train_loss": -6.072881698608398, "global_step": 73455, "epoch": 1748} {"train_loss": -5.969647407531738, "global_step": 73456, "epoch": 1748} {"train_loss": -6.072667224066598, "global_step": 73457, "epoch": 1748, "val_loss": 61878.484375} {"train_loss": -6.022790908813477, "global_step": 73458, "epoch": 1749} {"train_loss": -6.078003883361816, "global_step": 73459, "epoch": 1749} {"train_loss": -6.028334140777588, "global_step": 73460, "epoch": 1749} {"train_loss": -6.059043884277344, "global_step": 73461, "epoch": 1749} {"train_loss": -6.03408670425415, "global_step": 73462, "epoch": 1749} {"train_loss": -5.93105936050415, "global_step": 73463, "epoch": 1749} {"train_loss": -6.063210487365723, "global_step": 73464, "epoch": 1749} {"train_loss": -5.999514102935791, "global_step": 73465, "epoch": 1749} {"train_loss": -5.893893718719482, "global_step": 73466, "epoch": 1749} {"train_loss": -6.084435939788818, "global_step": 73467, "epoch": 1749} {"train_loss": -6.080687522888184, "global_step": 73468, "epoch": 1749} {"train_loss": -6.0919108390808105, "global_step": 73469, "epoch": 1749} {"train_loss": -6.136680603027344, "global_step": 73470, "epoch": 1749} {"train_loss": -5.993492126464844, "global_step": 73471, "epoch": 1749} {"train_loss": -6.065149307250977, "global_step": 73472, "epoch": 1749} {"train_loss": -5.946590423583984, "global_step": 73473, "epoch": 1749} {"train_loss": -5.940094947814941, "global_step": 73474, "epoch": 1749} {"train_loss": -6.082915782928467, "global_step": 73475, "epoch": 1749} {"train_loss": -6.037317276000977, "global_step": 73476, "epoch": 1749} {"train_loss": -6.030109882354736, "global_step": 73477, "epoch": 1749} {"train_loss": -6.113799095153809, "global_step": 73478, "epoch": 1749} {"train_loss": -6.0982666015625, "global_step": 73479, "epoch": 1749} {"train_loss": -6.0469536781311035, "global_step": 73480, "epoch": 1749} {"train_loss": -6.118054389953613, "global_step": 73481, "epoch": 1749} {"train_loss": -6.146032333374023, "global_step": 73482, "epoch": 1749} {"train_loss": -6.072186470031738, "global_step": 73483, "epoch": 1749} {"train_loss": -6.038125991821289, "global_step": 73484, "epoch": 1749} {"train_loss": -6.1811418533325195, "global_step": 73485, "epoch": 1749} {"train_loss": -6.112004280090332, "global_step": 73486, "epoch": 1749} {"train_loss": -5.974650859832764, "global_step": 73487, "epoch": 1749} {"train_loss": -6.025885581970215, "global_step": 73488, "epoch": 1749} {"train_loss": -5.976500988006592, "global_step": 73489, "epoch": 1749} {"train_loss": -6.087447166442871, "global_step": 73490, "epoch": 1749} {"train_loss": -6.185172080993652, "global_step": 73491, "epoch": 1749} {"train_loss": -6.121038436889648, "global_step": 73492, "epoch": 1749} {"train_loss": -5.97602653503418, "global_step": 73493, "epoch": 1749} {"train_loss": -6.140377521514893, "global_step": 73494, "epoch": 1749} {"train_loss": -6.045818328857422, "global_step": 73495, "epoch": 1749} {"train_loss": -6.031089782714844, "global_step": 73496, "epoch": 1749} {"train_loss": -6.08527946472168, "global_step": 73497, "epoch": 1749} {"train_loss": -6.131058692932129, "global_step": 73498, "epoch": 1749} {"train_loss": -6.056753260748727, "global_step": 73499, "epoch": 1749, "val_loss": 61667.5703125} {"train_loss": -6.0912861824035645, "global_step": 73500, "epoch": 1750} {"train_loss": -6.156295299530029, "global_step": 73501, "epoch": 1750} {"train_loss": -6.1130523681640625, "global_step": 73502, "epoch": 1750} {"train_loss": -6.16336727142334, "global_step": 73503, "epoch": 1750} {"train_loss": -6.053041934967041, "global_step": 73504, "epoch": 1750} {"train_loss": -6.127203464508057, "global_step": 73505, "epoch": 1750} {"train_loss": -6.144994735717773, "global_step": 73506, "epoch": 1750} {"train_loss": -6.010163307189941, "global_step": 73507, "epoch": 1750} {"train_loss": -6.068479537963867, "global_step": 73508, "epoch": 1750} {"train_loss": -6.117267608642578, "global_step": 73509, "epoch": 1750} {"train_loss": -6.065027236938477, "global_step": 73510, "epoch": 1750} {"train_loss": -6.032785415649414, "global_step": 73511, "epoch": 1750} {"train_loss": -6.135309219360352, "global_step": 73512, "epoch": 1750} {"train_loss": -6.038626670837402, "global_step": 73513, "epoch": 1750} {"train_loss": -6.101910591125488, "global_step": 73514, "epoch": 1750} {"train_loss": -6.125282287597656, "global_step": 73515, "epoch": 1750} {"train_loss": -6.0734171867370605, "global_step": 73516, "epoch": 1750} {"train_loss": -6.128551483154297, "global_step": 73517, "epoch": 1750} {"train_loss": -6.01451301574707, "global_step": 73518, "epoch": 1750} {"train_loss": -6.011239051818848, "global_step": 73519, "epoch": 1750} {"train_loss": -6.044018745422363, "global_step": 73520, "epoch": 1750} {"train_loss": -6.136916637420654, "global_step": 73521, "epoch": 1750} {"train_loss": -6.020001411437988, "global_step": 73522, "epoch": 1750} {"train_loss": -6.004671096801758, "global_step": 73523, "epoch": 1750} {"train_loss": -6.01304817199707, "global_step": 73524, "epoch": 1750} {"train_loss": -5.934649467468262, "global_step": 73525, "epoch": 1750} {"train_loss": -6.130893707275391, "global_step": 73526, "epoch": 1750} {"train_loss": -6.092642784118652, "global_step": 73527, "epoch": 1750} {"train_loss": -6.038435459136963, "global_step": 73528, "epoch": 1750} {"train_loss": -6.104358196258545, "global_step": 73529, "epoch": 1750} {"train_loss": -6.007988452911377, "global_step": 73530, "epoch": 1750} {"train_loss": -6.072190284729004, "global_step": 73531, "epoch": 1750} {"train_loss": -6.044188022613525, "global_step": 73532, "epoch": 1750} {"train_loss": -6.024694442749023, "global_step": 73533, "epoch": 1750} {"train_loss": -6.078915596008301, "global_step": 73534, "epoch": 1750} {"train_loss": -6.102992057800293, "global_step": 73535, "epoch": 1750} {"train_loss": -6.119035720825195, "global_step": 73536, "epoch": 1750} {"train_loss": -6.07089900970459, "global_step": 73537, "epoch": 1750} {"train_loss": -6.095790386199951, "global_step": 73538, "epoch": 1750} {"train_loss": -6.043646812438965, "global_step": 73539, "epoch": 1750} {"train_loss": -5.9806904792785645, "global_step": 73540, "epoch": 1750} {"train_loss": -6.07167607262021, "global_step": 73541, "epoch": 1750, "train/sim_max_reward_0": 0.1952122243388001, "train/sim_max_reward_1": 0.8633267677802321, "train/sim_max_reward_2": 0.5046985151988833, "train/sim_max_reward_3": 0.12141549799647196, "train/sim_max_reward_4": 0.9462853893031301, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.45168446993741074, "test/sim_max_reward_4300002": 0.6655875148396293, "test/sim_max_reward_4300003": 0.9346728777367791, "test/sim_max_reward_4300004": 0.4857984104800907, "test/sim_max_reward_4300005": 0.3896930487669645, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9612245072358562, "test/sim_max_reward_4300008": 0.8107711284149317, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.939523122196671, "test/sim_max_reward_4300012": 0.7778695804744677, "test/sim_max_reward_4300013": 0.4174252928703917, "test/sim_max_reward_4300014": 0.9949350317186583, "test/sim_max_reward_4300015": 0.9508065169272707, "test/sim_max_reward_4300016": 0.8958794550051448, "test/sim_max_reward_4300017": 0.9640792555431088, "test/sim_max_reward_4300018": 0.3689822723271591, "test/sim_max_reward_4300019": 0.18646429395344277, "test/sim_max_reward_4300020": 1.0, "test/sim_max_reward_4300021": 1.0, "test/sim_max_reward_4300022": 0.6432492627680134, "test/sim_max_reward_4300023": 0.8276390578729677, "test/sim_max_reward_4300024": 0.40405136371858835, "test/sim_max_reward_4300025": 0.7974286754253193, "test/sim_max_reward_4300026": 1.0, "test/sim_max_reward_4300027": 0.9303405344807678, "test/sim_max_reward_4300028": 0.6892884327682225, "test/sim_max_reward_4300029": 0.00733854556095997, "test/sim_max_reward_4300030": 0.7527630595336754, "test/sim_max_reward_4300031": 0.6731669703609975, "test/sim_max_reward_4300032": 0.8633205914724502, "test/sim_max_reward_4300033": 0.8810897529891433, "test/sim_max_reward_4300034": 0.8646921228356906, "test/sim_max_reward_4300035": 0.5226901110412133, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8808874735912771, "test/sim_max_reward_4300038": 1.0, "test/sim_max_reward_4300039": 0.9270961267590565, "test/sim_max_reward_4300040": 0.15607465617693586, "test/sim_max_reward_4300041": 0.9109473041558049, "test/sim_max_reward_4300042": 0.6505894670753163, "test/sim_max_reward_4300043": 0.9695437612264466, "test/sim_max_reward_4300044": 0.8670543198537392, "test/sim_max_reward_4300045": 0.2013100011186513, "test/sim_max_reward_4300046": 0.8154254435817349, "test/sim_max_reward_4300047": 0.16205855729327684, "test/sim_max_reward_4300048": 0.9694709804713569, "test/sim_max_reward_4300049": 0.25379428115974106, "train/mean_score": 0.47065385899661755, "test/mean_score": 0.6603180349456562, "val_loss": 62152.9765625} {"train_loss": -5.998557090759277, "global_step": 73542, "epoch": 1751} {"train_loss": -6.194125175476074, "global_step": 73543, "epoch": 1751} {"train_loss": -6.239620208740234, "global_step": 73544, "epoch": 1751} {"train_loss": -6.106036186218262, "global_step": 73545, "epoch": 1751} {"train_loss": -6.035211086273193, "global_step": 73546, "epoch": 1751} {"train_loss": -6.124532222747803, "global_step": 73547, "epoch": 1751} {"train_loss": -6.063776969909668, "global_step": 73548, "epoch": 1751} {"train_loss": -5.951543807983398, "global_step": 73549, "epoch": 1751} {"train_loss": -6.061470031738281, "global_step": 73550, "epoch": 1751} {"train_loss": -6.010231018066406, "global_step": 73551, "epoch": 1751} {"train_loss": -6.151083946228027, "global_step": 73552, "epoch": 1751} {"train_loss": -6.036014556884766, "global_step": 73553, "epoch": 1751} {"train_loss": -6.101632595062256, "global_step": 73554, "epoch": 1751} {"train_loss": -6.081747531890869, "global_step": 73555, "epoch": 1751} {"train_loss": -6.01575231552124, "global_step": 73556, "epoch": 1751} {"train_loss": -6.140059947967529, "global_step": 73557, "epoch": 1751} {"train_loss": -6.1193037033081055, "global_step": 73558, "epoch": 1751} {"train_loss": -6.044229507446289, "global_step": 73559, "epoch": 1751} {"train_loss": -6.145795822143555, "global_step": 73560, "epoch": 1751} {"train_loss": -6.079143524169922, "global_step": 73561, "epoch": 1751} {"train_loss": -6.112117767333984, "global_step": 73562, "epoch": 1751} {"train_loss": -6.04084587097168, "global_step": 73563, "epoch": 1751} {"train_loss": -6.181343078613281, "global_step": 73564, "epoch": 1751} {"train_loss": -6.039393424987793, "global_step": 73565, "epoch": 1751} {"train_loss": -5.97567892074585, "global_step": 73566, "epoch": 1751} {"train_loss": -6.078341484069824, "global_step": 73567, "epoch": 1751} {"train_loss": -6.125260829925537, "global_step": 73568, "epoch": 1751} {"train_loss": -6.1922926902771, "global_step": 73569, "epoch": 1751} {"train_loss": -6.1425299644470215, "global_step": 73570, "epoch": 1751} {"train_loss": -6.0935258865356445, "global_step": 73571, "epoch": 1751} {"train_loss": -6.155963897705078, "global_step": 73572, "epoch": 1751} {"train_loss": -6.076666831970215, "global_step": 73573, "epoch": 1751} {"train_loss": -6.070798873901367, "global_step": 73574, "epoch": 1751} {"train_loss": -5.952892780303955, "global_step": 73575, "epoch": 1751} {"train_loss": -6.004011631011963, "global_step": 73576, "epoch": 1751} {"train_loss": -5.962486267089844, "global_step": 73577, "epoch": 1751} {"train_loss": -6.118102073669434, "global_step": 73578, "epoch": 1751} {"train_loss": -6.034773826599121, "global_step": 73579, "epoch": 1751} {"train_loss": -6.0346221923828125, "global_step": 73580, "epoch": 1751} {"train_loss": -6.109314441680908, "global_step": 73581, "epoch": 1751} {"train_loss": -6.011575698852539, "global_step": 73582, "epoch": 1751} {"train_loss": -6.078778107961019, "global_step": 73583, "epoch": 1751, "val_loss": 61793.21875} {"train_loss": -6.123447418212891, "global_step": 73584, "epoch": 1752} {"train_loss": -6.005599498748779, "global_step": 73585, "epoch": 1752} {"train_loss": -5.996307849884033, "global_step": 73586, "epoch": 1752} {"train_loss": -6.081260681152344, "global_step": 73587, "epoch": 1752} {"train_loss": -6.064859390258789, "global_step": 73588, "epoch": 1752} {"train_loss": -6.018341541290283, "global_step": 73589, "epoch": 1752} {"train_loss": -6.013144493103027, "global_step": 73590, "epoch": 1752} {"train_loss": -6.060341835021973, "global_step": 73591, "epoch": 1752} {"train_loss": -6.0145463943481445, "global_step": 73592, "epoch": 1752} {"train_loss": -6.096111297607422, "global_step": 73593, "epoch": 1752} {"train_loss": -6.083277702331543, "global_step": 73594, "epoch": 1752} {"train_loss": -6.085153579711914, "global_step": 73595, "epoch": 1752} {"train_loss": -6.057262420654297, "global_step": 73596, "epoch": 1752} {"train_loss": -6.071401596069336, "global_step": 73597, "epoch": 1752} {"train_loss": -6.208641052246094, "global_step": 73598, "epoch": 1752} {"train_loss": -6.291181564331055, "global_step": 73599, "epoch": 1752} {"train_loss": -6.104173183441162, "global_step": 73600, "epoch": 1752} {"train_loss": -6.043429851531982, "global_step": 73601, "epoch": 1752} {"train_loss": -6.138038635253906, "global_step": 73602, "epoch": 1752} {"train_loss": -6.189940452575684, "global_step": 73603, "epoch": 1752} {"train_loss": -6.074253559112549, "global_step": 73604, "epoch": 1752} {"train_loss": -6.091535568237305, "global_step": 73605, "epoch": 1752} {"train_loss": -6.201666355133057, "global_step": 73606, "epoch": 1752} {"train_loss": -6.054141044616699, "global_step": 73607, "epoch": 1752} {"train_loss": -6.154422760009766, "global_step": 73608, "epoch": 1752} {"train_loss": -6.005348205566406, "global_step": 73609, "epoch": 1752} {"train_loss": -6.0683112144470215, "global_step": 73610, "epoch": 1752} {"train_loss": -5.9974751472473145, "global_step": 73611, "epoch": 1752} {"train_loss": -6.071587562561035, "global_step": 73612, "epoch": 1752} {"train_loss": -6.223609447479248, "global_step": 73613, "epoch": 1752} {"train_loss": -6.12233829498291, "global_step": 73614, "epoch": 1752} {"train_loss": -6.102875709533691, "global_step": 73615, "epoch": 1752} {"train_loss": -5.966922760009766, "global_step": 73616, "epoch": 1752} {"train_loss": -6.032087326049805, "global_step": 73617, "epoch": 1752} {"train_loss": -6.03554105758667, "global_step": 73618, "epoch": 1752} {"train_loss": -6.0932207107543945, "global_step": 73619, "epoch": 1752} {"train_loss": -6.015097141265869, "global_step": 73620, "epoch": 1752} {"train_loss": -6.1039910316467285, "global_step": 73621, "epoch": 1752} {"train_loss": -5.8833136558532715, "global_step": 73622, "epoch": 1752} {"train_loss": -6.009200096130371, "global_step": 73623, "epoch": 1752} {"train_loss": -6.093806266784668, "global_step": 73624, "epoch": 1752} {"train_loss": -6.0742019925798685, "global_step": 73625, "epoch": 1752, "val_loss": 61850.36328125} {"train_loss": -6.176225662231445, "global_step": 73626, "epoch": 1753} {"train_loss": -6.056492805480957, "global_step": 73627, "epoch": 1753} {"train_loss": -6.042590141296387, "global_step": 73628, "epoch": 1753} {"train_loss": -6.154517650604248, "global_step": 73629, "epoch": 1753} {"train_loss": -5.987865924835205, "global_step": 73630, "epoch": 1753} {"train_loss": -6.107449531555176, "global_step": 73631, "epoch": 1753} {"train_loss": -6.019070148468018, "global_step": 73632, "epoch": 1753} {"train_loss": -6.118481636047363, "global_step": 73633, "epoch": 1753} {"train_loss": -6.044039726257324, "global_step": 73634, "epoch": 1753} {"train_loss": -6.07600212097168, "global_step": 73635, "epoch": 1753} {"train_loss": -6.086103439331055, "global_step": 73636, "epoch": 1753} {"train_loss": -6.0146589279174805, "global_step": 73637, "epoch": 1753} {"train_loss": -6.043094635009766, "global_step": 73638, "epoch": 1753} {"train_loss": -6.111956596374512, "global_step": 73639, "epoch": 1753} {"train_loss": -5.982266902923584, "global_step": 73640, "epoch": 1753} {"train_loss": -6.053990840911865, "global_step": 73641, "epoch": 1753} {"train_loss": -6.013463020324707, "global_step": 73642, "epoch": 1753} {"train_loss": -6.013003349304199, "global_step": 73643, "epoch": 1753} {"train_loss": -5.997105598449707, "global_step": 73644, "epoch": 1753} {"train_loss": -6.162466526031494, "global_step": 73645, "epoch": 1753} {"train_loss": -5.875677108764648, "global_step": 73646, "epoch": 1753} {"train_loss": -6.067238807678223, "global_step": 73647, "epoch": 1753} {"train_loss": -5.96730899810791, "global_step": 73648, "epoch": 1753} {"train_loss": -6.152587890625, "global_step": 73649, "epoch": 1753} {"train_loss": -6.214776992797852, "global_step": 73650, "epoch": 1753} {"train_loss": -6.199678421020508, "global_step": 73651, "epoch": 1753} {"train_loss": -6.133913040161133, "global_step": 73652, "epoch": 1753} {"train_loss": -6.1453447341918945, "global_step": 73653, "epoch": 1753} {"train_loss": -6.170648574829102, "global_step": 73654, "epoch": 1753} {"train_loss": -6.126997947692871, "global_step": 73655, "epoch": 1753} {"train_loss": -6.108423233032227, "global_step": 73656, "epoch": 1753} {"train_loss": -6.152278423309326, "global_step": 73657, "epoch": 1753} {"train_loss": -6.133227825164795, "global_step": 73658, "epoch": 1753} {"train_loss": -6.063982009887695, "global_step": 73659, "epoch": 1753} {"train_loss": -5.993684768676758, "global_step": 73660, "epoch": 1753} {"train_loss": -6.226535797119141, "global_step": 73661, "epoch": 1753} {"train_loss": -6.097287178039551, "global_step": 73662, "epoch": 1753} {"train_loss": -6.158517360687256, "global_step": 73663, "epoch": 1753} {"train_loss": -6.03829288482666, "global_step": 73664, "epoch": 1753} {"train_loss": -6.117168426513672, "global_step": 73665, "epoch": 1753} {"train_loss": -6.141291618347168, "global_step": 73666, "epoch": 1753} {"train_loss": -6.085589533760434, "global_step": 73667, "epoch": 1753, "val_loss": 62194.6171875} {"train_loss": -5.954812049865723, "global_step": 73668, "epoch": 1754} {"train_loss": -6.108183860778809, "global_step": 73669, "epoch": 1754} {"train_loss": -6.0048723220825195, "global_step": 73670, "epoch": 1754} {"train_loss": -6.015680313110352, "global_step": 73671, "epoch": 1754} {"train_loss": -6.056234359741211, "global_step": 73672, "epoch": 1754} {"train_loss": -5.954039573669434, "global_step": 73673, "epoch": 1754} {"train_loss": -6.184553146362305, "global_step": 73674, "epoch": 1754} {"train_loss": -6.116715908050537, "global_step": 73675, "epoch": 1754} {"train_loss": -6.05235481262207, "global_step": 73676, "epoch": 1754} {"train_loss": -6.064971446990967, "global_step": 73677, "epoch": 1754} {"train_loss": -6.1639299392700195, "global_step": 73678, "epoch": 1754} {"train_loss": -6.112696647644043, "global_step": 73679, "epoch": 1754} {"train_loss": -6.089948654174805, "global_step": 73680, "epoch": 1754} {"train_loss": -6.055487632751465, "global_step": 73681, "epoch": 1754} {"train_loss": -6.155462741851807, "global_step": 73682, "epoch": 1754} {"train_loss": -6.023553848266602, "global_step": 73683, "epoch": 1754} {"train_loss": -6.127225875854492, "global_step": 73684, "epoch": 1754} {"train_loss": -6.142357349395752, "global_step": 73685, "epoch": 1754} {"train_loss": -6.067345142364502, "global_step": 73686, "epoch": 1754} {"train_loss": -6.074235916137695, "global_step": 73687, "epoch": 1754} {"train_loss": -6.120984077453613, "global_step": 73688, "epoch": 1754} {"train_loss": -6.0597991943359375, "global_step": 73689, "epoch": 1754} {"train_loss": -6.068817138671875, "global_step": 73690, "epoch": 1754} {"train_loss": -6.1487274169921875, "global_step": 73691, "epoch": 1754} {"train_loss": -5.997302532196045, "global_step": 73692, "epoch": 1754} {"train_loss": -6.09965181350708, "global_step": 73693, "epoch": 1754} {"train_loss": -6.099978446960449, "global_step": 73694, "epoch": 1754} {"train_loss": -6.024502754211426, "global_step": 73695, "epoch": 1754} {"train_loss": -5.929737091064453, "global_step": 73696, "epoch": 1754} {"train_loss": -6.157153129577637, "global_step": 73697, "epoch": 1754} {"train_loss": -5.991916656494141, "global_step": 73698, "epoch": 1754} {"train_loss": -6.212436676025391, "global_step": 73699, "epoch": 1754} {"train_loss": -5.9232306480407715, "global_step": 73700, "epoch": 1754} {"train_loss": -5.954741477966309, "global_step": 73701, "epoch": 1754} {"train_loss": -6.205367088317871, "global_step": 73702, "epoch": 1754} {"train_loss": -6.075066566467285, "global_step": 73703, "epoch": 1754} {"train_loss": -6.102653980255127, "global_step": 73704, "epoch": 1754} {"train_loss": -5.974987983703613, "global_step": 73705, "epoch": 1754} {"train_loss": -6.042176246643066, "global_step": 73706, "epoch": 1754} {"train_loss": -5.901787757873535, "global_step": 73707, "epoch": 1754} {"train_loss": -6.069149017333984, "global_step": 73708, "epoch": 1754} {"train_loss": -6.062470118204753, "global_step": 73709, "epoch": 1754, "val_loss": 62164.72265625} {"train_loss": -5.983739852905273, "global_step": 73710, "epoch": 1755} {"train_loss": -6.141275405883789, "global_step": 73711, "epoch": 1755} {"train_loss": -6.040274143218994, "global_step": 73712, "epoch": 1755} {"train_loss": -6.144573211669922, "global_step": 73713, "epoch": 1755} {"train_loss": -6.071639537811279, "global_step": 73714, "epoch": 1755} {"train_loss": -6.110318660736084, "global_step": 73715, "epoch": 1755} {"train_loss": -5.999058723449707, "global_step": 73716, "epoch": 1755} {"train_loss": -6.193902015686035, "global_step": 73717, "epoch": 1755} {"train_loss": -6.127625465393066, "global_step": 73718, "epoch": 1755} {"train_loss": -6.020408630371094, "global_step": 73719, "epoch": 1755} {"train_loss": -6.1682844161987305, "global_step": 73720, "epoch": 1755} {"train_loss": -6.071076393127441, "global_step": 73721, "epoch": 1755} {"train_loss": -5.996580123901367, "global_step": 73722, "epoch": 1755} {"train_loss": -6.121479034423828, "global_step": 73723, "epoch": 1755} {"train_loss": -6.066193580627441, "global_step": 73724, "epoch": 1755} {"train_loss": -6.1320390701293945, "global_step": 73725, "epoch": 1755} {"train_loss": -5.998834133148193, "global_step": 73726, "epoch": 1755} {"train_loss": -6.016999244689941, "global_step": 73727, "epoch": 1755} {"train_loss": -6.048216819763184, "global_step": 73728, "epoch": 1755} {"train_loss": -6.0222063064575195, "global_step": 73729, "epoch": 1755} {"train_loss": -6.093208312988281, "global_step": 73730, "epoch": 1755} {"train_loss": -6.0605010986328125, "global_step": 73731, "epoch": 1755} {"train_loss": -6.0250468254089355, "global_step": 73732, "epoch": 1755} {"train_loss": -6.0321245193481445, "global_step": 73733, "epoch": 1755} {"train_loss": -6.033914566040039, "global_step": 73734, "epoch": 1755} {"train_loss": -5.994597434997559, "global_step": 73735, "epoch": 1755} {"train_loss": -6.052427768707275, "global_step": 73736, "epoch": 1755} {"train_loss": -6.055973529815674, "global_step": 73737, "epoch": 1755} {"train_loss": -5.9842610359191895, "global_step": 73738, "epoch": 1755} {"train_loss": -6.001118183135986, "global_step": 73739, "epoch": 1755} {"train_loss": -6.063510894775391, "global_step": 73740, "epoch": 1755} {"train_loss": -5.941929817199707, "global_step": 73741, "epoch": 1755} {"train_loss": -6.180469989776611, "global_step": 73742, "epoch": 1755} {"train_loss": -6.044468879699707, "global_step": 73743, "epoch": 1755} {"train_loss": -6.035736083984375, "global_step": 73744, "epoch": 1755} {"train_loss": -6.149145126342773, "global_step": 73745, "epoch": 1755} {"train_loss": -6.110950946807861, "global_step": 73746, "epoch": 1755} {"train_loss": -6.020317077636719, "global_step": 73747, "epoch": 1755} {"train_loss": -6.065922737121582, "global_step": 73748, "epoch": 1755} {"train_loss": -6.0660624504089355, "global_step": 73749, "epoch": 1755} {"train_loss": -6.029515743255615, "global_step": 73750, "epoch": 1755} {"train_loss": -6.060705253056118, "global_step": 73751, "epoch": 1755, "val_loss": 61959.9453125} {"train_loss": -6.1012444496154785, "global_step": 73752, "epoch": 1756} {"train_loss": -6.130828380584717, "global_step": 73753, "epoch": 1756} {"train_loss": -6.056963920593262, "global_step": 73754, "epoch": 1756} {"train_loss": -6.035362720489502, "global_step": 73755, "epoch": 1756} {"train_loss": -6.016817092895508, "global_step": 73756, "epoch": 1756} {"train_loss": -5.972095966339111, "global_step": 73757, "epoch": 1756} {"train_loss": -5.998641014099121, "global_step": 73758, "epoch": 1756} {"train_loss": -5.979955673217773, "global_step": 73759, "epoch": 1756} {"train_loss": -6.039290904998779, "global_step": 73760, "epoch": 1756} {"train_loss": -6.100650787353516, "global_step": 73761, "epoch": 1756} {"train_loss": -5.979366779327393, "global_step": 73762, "epoch": 1756} {"train_loss": -6.047575950622559, "global_step": 73763, "epoch": 1756} {"train_loss": -6.206728935241699, "global_step": 73764, "epoch": 1756} {"train_loss": -6.116321563720703, "global_step": 73765, "epoch": 1756} {"train_loss": -6.018671989440918, "global_step": 73766, "epoch": 1756} {"train_loss": -6.204371452331543, "global_step": 73767, "epoch": 1756} {"train_loss": -6.171113967895508, "global_step": 73768, "epoch": 1756} {"train_loss": -6.154332637786865, "global_step": 73769, "epoch": 1756} {"train_loss": -6.125513076782227, "global_step": 73770, "epoch": 1756} {"train_loss": -6.080020904541016, "global_step": 73771, "epoch": 1756} {"train_loss": -5.985062122344971, "global_step": 73772, "epoch": 1756} {"train_loss": -6.11772346496582, "global_step": 73773, "epoch": 1756} {"train_loss": -6.05167293548584, "global_step": 73774, "epoch": 1756} {"train_loss": -6.098353385925293, "global_step": 73775, "epoch": 1756} {"train_loss": -6.177800178527832, "global_step": 73776, "epoch": 1756} {"train_loss": -6.049351215362549, "global_step": 73777, "epoch": 1756} {"train_loss": -6.044338703155518, "global_step": 73778, "epoch": 1756} {"train_loss": -6.1344194412231445, "global_step": 73779, "epoch": 1756} {"train_loss": -6.201082229614258, "global_step": 73780, "epoch": 1756} {"train_loss": -6.125536918640137, "global_step": 73781, "epoch": 1756} {"train_loss": -5.973871231079102, "global_step": 73782, "epoch": 1756} {"train_loss": -5.970385551452637, "global_step": 73783, "epoch": 1756} {"train_loss": -6.097979545593262, "global_step": 73784, "epoch": 1756} {"train_loss": -6.058581352233887, "global_step": 73785, "epoch": 1756} {"train_loss": -6.051394462585449, "global_step": 73786, "epoch": 1756} {"train_loss": -6.102015495300293, "global_step": 73787, "epoch": 1756} {"train_loss": -5.948235034942627, "global_step": 73788, "epoch": 1756} {"train_loss": -6.106931686401367, "global_step": 73789, "epoch": 1756} {"train_loss": -5.991177558898926, "global_step": 73790, "epoch": 1756} {"train_loss": -5.991399765014648, "global_step": 73791, "epoch": 1756} {"train_loss": -5.912447929382324, "global_step": 73792, "epoch": 1756} {"train_loss": -6.066094784509568, "global_step": 73793, "epoch": 1756, "val_loss": 61926.0} {"train_loss": -6.095694065093994, "global_step": 73794, "epoch": 1757} {"train_loss": -5.998709678649902, "global_step": 73795, "epoch": 1757} {"train_loss": -6.0778398513793945, "global_step": 73796, "epoch": 1757} {"train_loss": -5.989467144012451, "global_step": 73797, "epoch": 1757} {"train_loss": -5.983720779418945, "global_step": 73798, "epoch": 1757} {"train_loss": -6.0867109298706055, "global_step": 73799, "epoch": 1757} {"train_loss": -5.995842933654785, "global_step": 73800, "epoch": 1757} {"train_loss": -5.99101448059082, "global_step": 73801, "epoch": 1757} {"train_loss": -5.955937385559082, "global_step": 73802, "epoch": 1757} {"train_loss": -6.104555130004883, "global_step": 73803, "epoch": 1757} {"train_loss": -5.995675086975098, "global_step": 73804, "epoch": 1757} {"train_loss": -5.942770957946777, "global_step": 73805, "epoch": 1757} {"train_loss": -6.067018985748291, "global_step": 73806, "epoch": 1757} {"train_loss": -6.039037704467773, "global_step": 73807, "epoch": 1757} {"train_loss": -5.954403877258301, "global_step": 73808, "epoch": 1757} {"train_loss": -6.026083946228027, "global_step": 73809, "epoch": 1757} {"train_loss": -6.046050071716309, "global_step": 73810, "epoch": 1757} {"train_loss": -6.072078704833984, "global_step": 73811, "epoch": 1757} {"train_loss": -6.064810276031494, "global_step": 73812, "epoch": 1757} {"train_loss": -6.080612659454346, "global_step": 73813, "epoch": 1757} {"train_loss": -6.173000812530518, "global_step": 73814, "epoch": 1757} {"train_loss": -6.100033283233643, "global_step": 73815, "epoch": 1757} {"train_loss": -6.028372764587402, "global_step": 73816, "epoch": 1757} {"train_loss": -6.032079696655273, "global_step": 73817, "epoch": 1757} {"train_loss": -5.867410659790039, "global_step": 73818, "epoch": 1757} {"train_loss": -6.110994815826416, "global_step": 73819, "epoch": 1757} {"train_loss": -6.0371880531311035, "global_step": 73820, "epoch": 1757} {"train_loss": -6.04499626159668, "global_step": 73821, "epoch": 1757} {"train_loss": -6.1575469970703125, "global_step": 73822, "epoch": 1757} {"train_loss": -6.113101005554199, "global_step": 73823, "epoch": 1757} {"train_loss": -6.1518354415893555, "global_step": 73824, "epoch": 1757} {"train_loss": -6.037158012390137, "global_step": 73825, "epoch": 1757} {"train_loss": -6.118474006652832, "global_step": 73826, "epoch": 1757} {"train_loss": -6.114129543304443, "global_step": 73827, "epoch": 1757} {"train_loss": -6.100166320800781, "global_step": 73828, "epoch": 1757} {"train_loss": -6.060480117797852, "global_step": 73829, "epoch": 1757} {"train_loss": -5.979038238525391, "global_step": 73830, "epoch": 1757} {"train_loss": -5.987943172454834, "global_step": 73831, "epoch": 1757} {"train_loss": -5.974123001098633, "global_step": 73832, "epoch": 1757} {"train_loss": -6.107961654663086, "global_step": 73833, "epoch": 1757} {"train_loss": -5.933610916137695, "global_step": 73834, "epoch": 1757} {"train_loss": -6.044905810129075, "global_step": 73835, "epoch": 1757, "val_loss": 61871.6953125} {"train_loss": -6.11235237121582, "global_step": 73836, "epoch": 1758} {"train_loss": -6.04464054107666, "global_step": 73837, "epoch": 1758} {"train_loss": -6.019583225250244, "global_step": 73838, "epoch": 1758} {"train_loss": -6.108196258544922, "global_step": 73839, "epoch": 1758} {"train_loss": -6.025885581970215, "global_step": 73840, "epoch": 1758} {"train_loss": -6.265765190124512, "global_step": 73841, "epoch": 1758} {"train_loss": -6.009298324584961, "global_step": 73842, "epoch": 1758} {"train_loss": -6.117486953735352, "global_step": 73843, "epoch": 1758} {"train_loss": -6.148952484130859, "global_step": 73844, "epoch": 1758} {"train_loss": -6.049583911895752, "global_step": 73845, "epoch": 1758} {"train_loss": -6.068474292755127, "global_step": 73846, "epoch": 1758} {"train_loss": -5.9797468185424805, "global_step": 73847, "epoch": 1758} {"train_loss": -6.024109840393066, "global_step": 73848, "epoch": 1758} {"train_loss": -6.101519584655762, "global_step": 73849, "epoch": 1758} {"train_loss": -5.977583885192871, "global_step": 73850, "epoch": 1758} {"train_loss": -6.06669807434082, "global_step": 73851, "epoch": 1758} {"train_loss": -5.941807746887207, "global_step": 73852, "epoch": 1758} {"train_loss": -6.034107685089111, "global_step": 73853, "epoch": 1758} {"train_loss": -6.121770858764648, "global_step": 73854, "epoch": 1758} {"train_loss": -6.120743751525879, "global_step": 73855, "epoch": 1758} {"train_loss": -6.075586318969727, "global_step": 73856, "epoch": 1758} {"train_loss": -6.071798324584961, "global_step": 73857, "epoch": 1758} {"train_loss": -6.124677658081055, "global_step": 73858, "epoch": 1758} {"train_loss": -6.151742935180664, "global_step": 73859, "epoch": 1758} {"train_loss": -6.133633613586426, "global_step": 73860, "epoch": 1758} {"train_loss": -6.007205486297607, "global_step": 73861, "epoch": 1758} {"train_loss": -6.039849281311035, "global_step": 73862, "epoch": 1758} {"train_loss": -6.091241836547852, "global_step": 73863, "epoch": 1758} {"train_loss": -6.111428260803223, "global_step": 73864, "epoch": 1758} {"train_loss": -5.981659412384033, "global_step": 73865, "epoch": 1758} {"train_loss": -6.005130767822266, "global_step": 73866, "epoch": 1758} {"train_loss": -5.975554943084717, "global_step": 73867, "epoch": 1758} {"train_loss": -6.124175548553467, "global_step": 73868, "epoch": 1758} {"train_loss": -6.111529350280762, "global_step": 73869, "epoch": 1758} {"train_loss": -5.995487689971924, "global_step": 73870, "epoch": 1758} {"train_loss": -6.0348920822143555, "global_step": 73871, "epoch": 1758} {"train_loss": -6.053132057189941, "global_step": 73872, "epoch": 1758} {"train_loss": -6.063621520996094, "global_step": 73873, "epoch": 1758} {"train_loss": -6.237783432006836, "global_step": 73874, "epoch": 1758} {"train_loss": -6.014436721801758, "global_step": 73875, "epoch": 1758} {"train_loss": -6.104011535644531, "global_step": 73876, "epoch": 1758} {"train_loss": -6.0677381583622525, "global_step": 73877, "epoch": 1758, "val_loss": 61668.57421875} {"train_loss": -6.11862325668335, "global_step": 73878, "epoch": 1759} {"train_loss": -5.962375640869141, "global_step": 73879, "epoch": 1759} {"train_loss": -6.012331962585449, "global_step": 73880, "epoch": 1759} {"train_loss": -6.027830123901367, "global_step": 73881, "epoch": 1759} {"train_loss": -6.077523231506348, "global_step": 73882, "epoch": 1759} {"train_loss": -6.139041900634766, "global_step": 73883, "epoch": 1759} {"train_loss": -6.188518524169922, "global_step": 73884, "epoch": 1759} {"train_loss": -6.094682693481445, "global_step": 73885, "epoch": 1759} {"train_loss": -6.050298690795898, "global_step": 73886, "epoch": 1759} {"train_loss": -6.0358357429504395, "global_step": 73887, "epoch": 1759} {"train_loss": -6.124264717102051, "global_step": 73888, "epoch": 1759} {"train_loss": -6.108311653137207, "global_step": 73889, "epoch": 1759} {"train_loss": -6.131389141082764, "global_step": 73890, "epoch": 1759} {"train_loss": -6.096567630767822, "global_step": 73891, "epoch": 1759} {"train_loss": -6.12938117980957, "global_step": 73892, "epoch": 1759} {"train_loss": -5.9993414878845215, "global_step": 73893, "epoch": 1759} {"train_loss": -5.969565391540527, "global_step": 73894, "epoch": 1759} {"train_loss": -6.089803218841553, "global_step": 73895, "epoch": 1759} {"train_loss": -6.072966575622559, "global_step": 73896, "epoch": 1759} {"train_loss": -6.092043399810791, "global_step": 73897, "epoch": 1759} {"train_loss": -6.113736152648926, "global_step": 73898, "epoch": 1759} {"train_loss": -5.931729793548584, "global_step": 73899, "epoch": 1759} {"train_loss": -6.005251884460449, "global_step": 73900, "epoch": 1759} {"train_loss": -5.987861633300781, "global_step": 73901, "epoch": 1759} {"train_loss": -6.008262634277344, "global_step": 73902, "epoch": 1759} {"train_loss": -6.125443935394287, "global_step": 73903, "epoch": 1759} {"train_loss": -6.0620527267456055, "global_step": 73904, "epoch": 1759} {"train_loss": -6.069060802459717, "global_step": 73905, "epoch": 1759} {"train_loss": -6.042354106903076, "global_step": 73906, "epoch": 1759} {"train_loss": -6.085649490356445, "global_step": 73907, "epoch": 1759} {"train_loss": -6.014585971832275, "global_step": 73908, "epoch": 1759} {"train_loss": -6.103732109069824, "global_step": 73909, "epoch": 1759} {"train_loss": -6.0634050369262695, "global_step": 73910, "epoch": 1759} {"train_loss": -6.077390670776367, "global_step": 73911, "epoch": 1759} {"train_loss": -6.036702632904053, "global_step": 73912, "epoch": 1759} {"train_loss": -5.973447799682617, "global_step": 73913, "epoch": 1759} {"train_loss": -6.116223335266113, "global_step": 73914, "epoch": 1759} {"train_loss": -6.125107288360596, "global_step": 73915, "epoch": 1759} {"train_loss": -5.9993438720703125, "global_step": 73916, "epoch": 1759} {"train_loss": -6.110660552978516, "global_step": 73917, "epoch": 1759} {"train_loss": -6.134977340698242, "global_step": 73918, "epoch": 1759} {"train_loss": -6.067388409659976, "global_step": 73919, "epoch": 1759, "val_loss": 61969.45703125} {"train_loss": -6.053955554962158, "global_step": 73920, "epoch": 1760} {"train_loss": -6.201589584350586, "global_step": 73921, "epoch": 1760} {"train_loss": -6.081447601318359, "global_step": 73922, "epoch": 1760} {"train_loss": -5.952615737915039, "global_step": 73923, "epoch": 1760} {"train_loss": -6.1792311668396, "global_step": 73924, "epoch": 1760} {"train_loss": -6.02462100982666, "global_step": 73925, "epoch": 1760} {"train_loss": -6.01449728012085, "global_step": 73926, "epoch": 1760} {"train_loss": -6.028632164001465, "global_step": 73927, "epoch": 1760} {"train_loss": -6.014721870422363, "global_step": 73928, "epoch": 1760} {"train_loss": -6.0078325271606445, "global_step": 73929, "epoch": 1760} {"train_loss": -6.057449817657471, "global_step": 73930, "epoch": 1760} {"train_loss": -6.016318321228027, "global_step": 73931, "epoch": 1760} {"train_loss": -6.215333461761475, "global_step": 73932, "epoch": 1760} {"train_loss": -6.12524938583374, "global_step": 73933, "epoch": 1760} {"train_loss": -6.071494102478027, "global_step": 73934, "epoch": 1760} {"train_loss": -6.207705020904541, "global_step": 73935, "epoch": 1760} {"train_loss": -6.094289779663086, "global_step": 73936, "epoch": 1760} {"train_loss": -5.959628105163574, "global_step": 73937, "epoch": 1760} {"train_loss": -6.0297088623046875, "global_step": 73938, "epoch": 1760} {"train_loss": -5.919288158416748, "global_step": 73939, "epoch": 1760} {"train_loss": -6.021697044372559, "global_step": 73940, "epoch": 1760} {"train_loss": -6.005325794219971, "global_step": 73941, "epoch": 1760} {"train_loss": -6.189972400665283, "global_step": 73942, "epoch": 1760} {"train_loss": -6.10502815246582, "global_step": 73943, "epoch": 1760} {"train_loss": -5.892741680145264, "global_step": 73944, "epoch": 1760} {"train_loss": -5.9393157958984375, "global_step": 73945, "epoch": 1760} {"train_loss": -6.070402145385742, "global_step": 73946, "epoch": 1760} {"train_loss": -6.090669631958008, "global_step": 73947, "epoch": 1760} {"train_loss": -6.077024459838867, "global_step": 73948, "epoch": 1760} {"train_loss": -6.108123302459717, "global_step": 73949, "epoch": 1760} {"train_loss": -6.106619358062744, "global_step": 73950, "epoch": 1760} {"train_loss": -6.039724349975586, "global_step": 73951, "epoch": 1760} {"train_loss": -6.149001598358154, "global_step": 73952, "epoch": 1760} {"train_loss": -6.03533935546875, "global_step": 73953, "epoch": 1760} {"train_loss": -6.142854690551758, "global_step": 73954, "epoch": 1760} {"train_loss": -6.217802047729492, "global_step": 73955, "epoch": 1760} {"train_loss": -6.114554405212402, "global_step": 73956, "epoch": 1760} {"train_loss": -6.066540718078613, "global_step": 73957, "epoch": 1760} {"train_loss": -6.115413188934326, "global_step": 73958, "epoch": 1760} {"train_loss": -6.1143107414245605, "global_step": 73959, "epoch": 1760} {"train_loss": -6.078596115112305, "global_step": 73960, "epoch": 1760} {"train_loss": -6.071244205747332, "global_step": 73961, "epoch": 1760, "val_loss": 62009.71875} {"train_loss": -6.063720703125, "global_step": 73962, "epoch": 1761} {"train_loss": -5.947848320007324, "global_step": 73963, "epoch": 1761} {"train_loss": -6.101838111877441, "global_step": 73964, "epoch": 1761} {"train_loss": -5.974177360534668, "global_step": 73965, "epoch": 1761} {"train_loss": -6.185683250427246, "global_step": 73966, "epoch": 1761} {"train_loss": -6.129920959472656, "global_step": 73967, "epoch": 1761} {"train_loss": -6.099337577819824, "global_step": 73968, "epoch": 1761} {"train_loss": -6.1419572830200195, "global_step": 73969, "epoch": 1761} {"train_loss": -6.032891273498535, "global_step": 73970, "epoch": 1761} {"train_loss": -6.144172668457031, "global_step": 73971, "epoch": 1761} {"train_loss": -5.971810340881348, "global_step": 73972, "epoch": 1761} {"train_loss": -6.052399635314941, "global_step": 73973, "epoch": 1761} {"train_loss": -6.172330856323242, "global_step": 73974, "epoch": 1761} {"train_loss": -5.9231157302856445, "global_step": 73975, "epoch": 1761} {"train_loss": -6.019864082336426, "global_step": 73976, "epoch": 1761} {"train_loss": -5.943977355957031, "global_step": 73977, "epoch": 1761} {"train_loss": -5.874218940734863, "global_step": 73978, "epoch": 1761} {"train_loss": -6.0425310134887695, "global_step": 73979, "epoch": 1761} {"train_loss": -5.971714973449707, "global_step": 73980, "epoch": 1761} {"train_loss": -6.062437057495117, "global_step": 73981, "epoch": 1761} {"train_loss": -5.857561111450195, "global_step": 73982, "epoch": 1761} {"train_loss": -6.092500686645508, "global_step": 73983, "epoch": 1761} {"train_loss": -5.999436855316162, "global_step": 73984, "epoch": 1761} {"train_loss": -5.972118377685547, "global_step": 73985, "epoch": 1761} {"train_loss": -6.069403648376465, "global_step": 73986, "epoch": 1761} {"train_loss": -5.981999397277832, "global_step": 73987, "epoch": 1761} {"train_loss": -5.983255863189697, "global_step": 73988, "epoch": 1761} {"train_loss": -6.019622802734375, "global_step": 73989, "epoch": 1761} {"train_loss": -6.041114330291748, "global_step": 73990, "epoch": 1761} {"train_loss": -5.9443817138671875, "global_step": 73991, "epoch": 1761} {"train_loss": -5.937160491943359, "global_step": 73992, "epoch": 1761} {"train_loss": -6.155548095703125, "global_step": 73993, "epoch": 1761} {"train_loss": -5.991981506347656, "global_step": 73994, "epoch": 1761} {"train_loss": -5.988483428955078, "global_step": 73995, "epoch": 1761} {"train_loss": -5.986737251281738, "global_step": 73996, "epoch": 1761} {"train_loss": -6.103527545928955, "global_step": 73997, "epoch": 1761} {"train_loss": -6.059622764587402, "global_step": 73998, "epoch": 1761} {"train_loss": -6.108943462371826, "global_step": 73999, "epoch": 1761} {"train_loss": -6.112250328063965, "global_step": 74000, "epoch": 1761} {"train_loss": -6.129290580749512, "global_step": 74001, "epoch": 1761} {"train_loss": -6.119770050048828, "global_step": 74002, "epoch": 1761} {"train_loss": -6.038749320166452, "global_step": 74003, "epoch": 1761, "val_loss": 61729.7265625} {"train_loss": -6.182318687438965, "global_step": 74004, "epoch": 1762} {"train_loss": -6.075175762176514, "global_step": 74005, "epoch": 1762} {"train_loss": -6.086517333984375, "global_step": 74006, "epoch": 1762} {"train_loss": -6.167778015136719, "global_step": 74007, "epoch": 1762} {"train_loss": -6.100210666656494, "global_step": 74008, "epoch": 1762} {"train_loss": -6.061823844909668, "global_step": 74009, "epoch": 1762} {"train_loss": -6.103808879852295, "global_step": 74010, "epoch": 1762} {"train_loss": -6.32689094543457, "global_step": 74011, "epoch": 1762} {"train_loss": -6.0280914306640625, "global_step": 74012, "epoch": 1762} {"train_loss": -6.049997329711914, "global_step": 74013, "epoch": 1762} {"train_loss": -6.208172798156738, "global_step": 74014, "epoch": 1762} {"train_loss": -6.083330154418945, "global_step": 74015, "epoch": 1762} {"train_loss": -6.08041524887085, "global_step": 74016, "epoch": 1762} {"train_loss": -6.003683090209961, "global_step": 74017, "epoch": 1762} {"train_loss": -6.147934913635254, "global_step": 74018, "epoch": 1762} {"train_loss": -6.079654693603516, "global_step": 74019, "epoch": 1762} {"train_loss": -6.103960037231445, "global_step": 74020, "epoch": 1762} {"train_loss": -6.066921234130859, "global_step": 74021, "epoch": 1762} {"train_loss": -6.171138763427734, "global_step": 74022, "epoch": 1762} {"train_loss": -6.167150497436523, "global_step": 74023, "epoch": 1762} {"train_loss": -6.171178340911865, "global_step": 74024, "epoch": 1762} {"train_loss": -6.169199466705322, "global_step": 74025, "epoch": 1762} {"train_loss": -6.092167377471924, "global_step": 74026, "epoch": 1762} {"train_loss": -6.037557601928711, "global_step": 74027, "epoch": 1762} {"train_loss": -6.1144304275512695, "global_step": 74028, "epoch": 1762} {"train_loss": -6.092487335205078, "global_step": 74029, "epoch": 1762} {"train_loss": -6.072418689727783, "global_step": 74030, "epoch": 1762} {"train_loss": -6.091644287109375, "global_step": 74031, "epoch": 1762} {"train_loss": -6.156622886657715, "global_step": 74032, "epoch": 1762} {"train_loss": -6.131184101104736, "global_step": 74033, "epoch": 1762} {"train_loss": -6.151951789855957, "global_step": 74034, "epoch": 1762} {"train_loss": -6.209596633911133, "global_step": 74035, "epoch": 1762} {"train_loss": -6.05175256729126, "global_step": 74036, "epoch": 1762} {"train_loss": -6.061491966247559, "global_step": 74037, "epoch": 1762} {"train_loss": -5.954655647277832, "global_step": 74038, "epoch": 1762} {"train_loss": -6.148237228393555, "global_step": 74039, "epoch": 1762} {"train_loss": -6.1027045249938965, "global_step": 74040, "epoch": 1762} {"train_loss": -6.157462120056152, "global_step": 74041, "epoch": 1762} {"train_loss": -6.167787551879883, "global_step": 74042, "epoch": 1762} {"train_loss": -6.0626220703125, "global_step": 74043, "epoch": 1762} {"train_loss": -6.177979946136475, "global_step": 74044, "epoch": 1762} {"train_loss": -6.113461982636225, "global_step": 74045, "epoch": 1762, "val_loss": 61821.4296875} {"train_loss": -6.145838737487793, "global_step": 74046, "epoch": 1763} {"train_loss": -6.10651159286499, "global_step": 74047, "epoch": 1763} {"train_loss": -6.032173156738281, "global_step": 74048, "epoch": 1763} {"train_loss": -6.074435710906982, "global_step": 74049, "epoch": 1763} {"train_loss": -6.171699523925781, "global_step": 74050, "epoch": 1763} {"train_loss": -6.00506591796875, "global_step": 74051, "epoch": 1763} {"train_loss": -6.041097640991211, "global_step": 74052, "epoch": 1763} {"train_loss": -6.13922643661499, "global_step": 74053, "epoch": 1763} {"train_loss": -6.09104061126709, "global_step": 74054, "epoch": 1763} {"train_loss": -6.006372928619385, "global_step": 74055, "epoch": 1763} {"train_loss": -6.144493103027344, "global_step": 74056, "epoch": 1763} {"train_loss": -6.131059646606445, "global_step": 74057, "epoch": 1763} {"train_loss": -5.9950852394104, "global_step": 74058, "epoch": 1763} {"train_loss": -5.996791839599609, "global_step": 74059, "epoch": 1763} {"train_loss": -6.077753067016602, "global_step": 74060, "epoch": 1763} {"train_loss": -6.167817115783691, "global_step": 74061, "epoch": 1763} {"train_loss": -6.228843688964844, "global_step": 74062, "epoch": 1763} {"train_loss": -6.0018768310546875, "global_step": 74063, "epoch": 1763} {"train_loss": -6.193410873413086, "global_step": 74064, "epoch": 1763} {"train_loss": -6.0190839767456055, "global_step": 74065, "epoch": 1763} {"train_loss": -6.0777363777160645, "global_step": 74066, "epoch": 1763} {"train_loss": -6.090913772583008, "global_step": 74067, "epoch": 1763} {"train_loss": -6.121517181396484, "global_step": 74068, "epoch": 1763} {"train_loss": -6.09567928314209, "global_step": 74069, "epoch": 1763} {"train_loss": -6.076966285705566, "global_step": 74070, "epoch": 1763} {"train_loss": -6.113724708557129, "global_step": 74071, "epoch": 1763} {"train_loss": -6.168231010437012, "global_step": 74072, "epoch": 1763} {"train_loss": -6.180473327636719, "global_step": 74073, "epoch": 1763} {"train_loss": -6.116086006164551, "global_step": 74074, "epoch": 1763} {"train_loss": -6.115018844604492, "global_step": 74075, "epoch": 1763} {"train_loss": -6.1348114013671875, "global_step": 74076, "epoch": 1763} {"train_loss": -6.178564071655273, "global_step": 74077, "epoch": 1763} {"train_loss": -6.0935187339782715, "global_step": 74078, "epoch": 1763} {"train_loss": -6.112674713134766, "global_step": 74079, "epoch": 1763} {"train_loss": -6.130220413208008, "global_step": 74080, "epoch": 1763} {"train_loss": -6.187071323394775, "global_step": 74081, "epoch": 1763} {"train_loss": -6.144749641418457, "global_step": 74082, "epoch": 1763} {"train_loss": -6.127457141876221, "global_step": 74083, "epoch": 1763} {"train_loss": -6.100634574890137, "global_step": 74084, "epoch": 1763} {"train_loss": -6.048881530761719, "global_step": 74085, "epoch": 1763} {"train_loss": -6.108229160308838, "global_step": 74086, "epoch": 1763} {"train_loss": -6.106510446185157, "global_step": 74087, "epoch": 1763, "val_loss": 61900.71875} {"train_loss": -6.059345245361328, "global_step": 74088, "epoch": 1764} {"train_loss": -6.1897430419921875, "global_step": 74089, "epoch": 1764} {"train_loss": -5.9787983894348145, "global_step": 74090, "epoch": 1764} {"train_loss": -6.115070819854736, "global_step": 74091, "epoch": 1764} {"train_loss": -6.087040424346924, "global_step": 74092, "epoch": 1764} {"train_loss": -6.170111179351807, "global_step": 74093, "epoch": 1764} {"train_loss": -6.174284934997559, "global_step": 74094, "epoch": 1764} {"train_loss": -6.081578254699707, "global_step": 74095, "epoch": 1764} {"train_loss": -6.119555473327637, "global_step": 74096, "epoch": 1764} {"train_loss": -6.11321496963501, "global_step": 74097, "epoch": 1764} {"train_loss": -6.123753070831299, "global_step": 74098, "epoch": 1764} {"train_loss": -6.243308067321777, "global_step": 74099, "epoch": 1764} {"train_loss": -6.117605686187744, "global_step": 74100, "epoch": 1764} {"train_loss": -5.98585844039917, "global_step": 74101, "epoch": 1764} {"train_loss": -5.95657205581665, "global_step": 74102, "epoch": 1764} {"train_loss": -5.997926235198975, "global_step": 74103, "epoch": 1764} {"train_loss": -6.062610149383545, "global_step": 74104, "epoch": 1764} {"train_loss": -6.040802478790283, "global_step": 74105, "epoch": 1764} {"train_loss": -6.080300807952881, "global_step": 74106, "epoch": 1764} {"train_loss": -6.096142768859863, "global_step": 74107, "epoch": 1764} {"train_loss": -6.064384460449219, "global_step": 74108, "epoch": 1764} {"train_loss": -6.0912089347839355, "global_step": 74109, "epoch": 1764} {"train_loss": -6.058536529541016, "global_step": 74110, "epoch": 1764} {"train_loss": -6.009521484375, "global_step": 74111, "epoch": 1764} {"train_loss": -6.168387413024902, "global_step": 74112, "epoch": 1764} {"train_loss": -6.0249128341674805, "global_step": 74113, "epoch": 1764} {"train_loss": -6.156844139099121, "global_step": 74114, "epoch": 1764} {"train_loss": -6.0892486572265625, "global_step": 74115, "epoch": 1764} {"train_loss": -6.043172836303711, "global_step": 74116, "epoch": 1764} {"train_loss": -6.100528717041016, "global_step": 74117, "epoch": 1764} {"train_loss": -6.096401214599609, "global_step": 74118, "epoch": 1764} {"train_loss": -6.085181713104248, "global_step": 74119, "epoch": 1764} {"train_loss": -6.171766757965088, "global_step": 74120, "epoch": 1764} {"train_loss": -6.1038055419921875, "global_step": 74121, "epoch": 1764} {"train_loss": -6.005115032196045, "global_step": 74122, "epoch": 1764} {"train_loss": -6.07366418838501, "global_step": 74123, "epoch": 1764} {"train_loss": -6.0202813148498535, "global_step": 74124, "epoch": 1764} {"train_loss": -6.0357818603515625, "global_step": 74125, "epoch": 1764} {"train_loss": -6.103644371032715, "global_step": 74126, "epoch": 1764} {"train_loss": -6.028866291046143, "global_step": 74127, "epoch": 1764} {"train_loss": -6.0200653076171875, "global_step": 74128, "epoch": 1764} {"train_loss": -6.081391697838193, "global_step": 74129, "epoch": 1764, "val_loss": 61638.203125} {"train_loss": -5.955666542053223, "global_step": 74130, "epoch": 1765} {"train_loss": -6.130207538604736, "global_step": 74131, "epoch": 1765} {"train_loss": -6.105842590332031, "global_step": 74132, "epoch": 1765} {"train_loss": -6.010440826416016, "global_step": 74133, "epoch": 1765} {"train_loss": -6.003279685974121, "global_step": 74134, "epoch": 1765} {"train_loss": -6.224742412567139, "global_step": 74135, "epoch": 1765} {"train_loss": -6.003583908081055, "global_step": 74136, "epoch": 1765} {"train_loss": -5.949129104614258, "global_step": 74137, "epoch": 1765} {"train_loss": -6.084012985229492, "global_step": 74138, "epoch": 1765} {"train_loss": -6.0383219718933105, "global_step": 74139, "epoch": 1765} {"train_loss": -6.106191158294678, "global_step": 74140, "epoch": 1765} {"train_loss": -6.039855003356934, "global_step": 74141, "epoch": 1765} {"train_loss": -5.969799995422363, "global_step": 74142, "epoch": 1765} {"train_loss": -5.980074882507324, "global_step": 74143, "epoch": 1765} {"train_loss": -6.0353007316589355, "global_step": 74144, "epoch": 1765} {"train_loss": -5.970712184906006, "global_step": 74145, "epoch": 1765} {"train_loss": -6.028589725494385, "global_step": 74146, "epoch": 1765} {"train_loss": -6.106321334838867, "global_step": 74147, "epoch": 1765} {"train_loss": -6.066524982452393, "global_step": 74148, "epoch": 1765} {"train_loss": -6.0313401222229, "global_step": 74149, "epoch": 1765} {"train_loss": -6.091002464294434, "global_step": 74150, "epoch": 1765} {"train_loss": -6.145066261291504, "global_step": 74151, "epoch": 1765} {"train_loss": -6.125971794128418, "global_step": 74152, "epoch": 1765} {"train_loss": -6.102997779846191, "global_step": 74153, "epoch": 1765} {"train_loss": -6.043117523193359, "global_step": 74154, "epoch": 1765} {"train_loss": -6.0525689125061035, "global_step": 74155, "epoch": 1765} {"train_loss": -6.0910210609436035, "global_step": 74156, "epoch": 1765} {"train_loss": -6.104544162750244, "global_step": 74157, "epoch": 1765} {"train_loss": -6.113210678100586, "global_step": 74158, "epoch": 1765} {"train_loss": -6.02048921585083, "global_step": 74159, "epoch": 1765} {"train_loss": -6.103476524353027, "global_step": 74160, "epoch": 1765} {"train_loss": -6.067252159118652, "global_step": 74161, "epoch": 1765} {"train_loss": -6.076564788818359, "global_step": 74162, "epoch": 1765} {"train_loss": -6.128963947296143, "global_step": 74163, "epoch": 1765} {"train_loss": -6.189118385314941, "global_step": 74164, "epoch": 1765} {"train_loss": -6.092395782470703, "global_step": 74165, "epoch": 1765} {"train_loss": -6.150551795959473, "global_step": 74166, "epoch": 1765} {"train_loss": -6.092187404632568, "global_step": 74167, "epoch": 1765} {"train_loss": -5.974133491516113, "global_step": 74168, "epoch": 1765} {"train_loss": -6.089997291564941, "global_step": 74169, "epoch": 1765} {"train_loss": -5.949627876281738, "global_step": 74170, "epoch": 1765} {"train_loss": -6.065199954169137, "global_step": 74171, "epoch": 1765, "val_loss": 61800.234375} {"train_loss": -6.08814811706543, "global_step": 74172, "epoch": 1766} {"train_loss": -6.020051002502441, "global_step": 74173, "epoch": 1766} {"train_loss": -6.0019426345825195, "global_step": 74174, "epoch": 1766} {"train_loss": -6.184460639953613, "global_step": 74175, "epoch": 1766} {"train_loss": -6.047089576721191, "global_step": 74176, "epoch": 1766} {"train_loss": -6.056327819824219, "global_step": 74177, "epoch": 1766} {"train_loss": -5.988070487976074, "global_step": 74178, "epoch": 1766} {"train_loss": -6.046097755432129, "global_step": 74179, "epoch": 1766} {"train_loss": -6.154543876647949, "global_step": 74180, "epoch": 1766} {"train_loss": -6.025676727294922, "global_step": 74181, "epoch": 1766} {"train_loss": -5.971480846405029, "global_step": 74182, "epoch": 1766} {"train_loss": -6.01268196105957, "global_step": 74183, "epoch": 1766} {"train_loss": -6.1703267097473145, "global_step": 74184, "epoch": 1766} {"train_loss": -6.124506950378418, "global_step": 74185, "epoch": 1766} {"train_loss": -6.154953956604004, "global_step": 74186, "epoch": 1766} {"train_loss": -6.049668312072754, "global_step": 74187, "epoch": 1766} {"train_loss": -6.098153591156006, "global_step": 74188, "epoch": 1766} {"train_loss": -6.075085639953613, "global_step": 74189, "epoch": 1766} {"train_loss": -6.023645401000977, "global_step": 74190, "epoch": 1766} {"train_loss": -5.973415374755859, "global_step": 74191, "epoch": 1766} {"train_loss": -5.962902545928955, "global_step": 74192, "epoch": 1766} {"train_loss": -6.159283638000488, "global_step": 74193, "epoch": 1766} {"train_loss": -5.9995527267456055, "global_step": 74194, "epoch": 1766} {"train_loss": -6.064761161804199, "global_step": 74195, "epoch": 1766} {"train_loss": -5.9862775802612305, "global_step": 74196, "epoch": 1766} {"train_loss": -6.0990376472473145, "global_step": 74197, "epoch": 1766} {"train_loss": -6.1013994216918945, "global_step": 74198, "epoch": 1766} {"train_loss": -6.047287940979004, "global_step": 74199, "epoch": 1766} {"train_loss": -6.079377174377441, "global_step": 74200, "epoch": 1766} {"train_loss": -5.991296768188477, "global_step": 74201, "epoch": 1766} {"train_loss": -5.966730117797852, "global_step": 74202, "epoch": 1766} {"train_loss": -6.038180351257324, "global_step": 74203, "epoch": 1766} {"train_loss": -6.147106170654297, "global_step": 74204, "epoch": 1766} {"train_loss": -6.242018699645996, "global_step": 74205, "epoch": 1766} {"train_loss": -6.146276950836182, "global_step": 74206, "epoch": 1766} {"train_loss": -6.115269660949707, "global_step": 74207, "epoch": 1766} {"train_loss": -6.097599029541016, "global_step": 74208, "epoch": 1766} {"train_loss": -6.080845832824707, "global_step": 74209, "epoch": 1766} {"train_loss": -6.038816452026367, "global_step": 74210, "epoch": 1766} {"train_loss": -6.178073406219482, "global_step": 74211, "epoch": 1766} {"train_loss": -6.0594563484191895, "global_step": 74212, "epoch": 1766} {"train_loss": -6.068773167473929, "global_step": 74213, "epoch": 1766, "val_loss": 61887.12109375} {"train_loss": -6.084507942199707, "global_step": 74214, "epoch": 1767} {"train_loss": -6.08884334564209, "global_step": 74215, "epoch": 1767} {"train_loss": -6.08380651473999, "global_step": 74216, "epoch": 1767} {"train_loss": -5.956256866455078, "global_step": 74217, "epoch": 1767} {"train_loss": -6.137654781341553, "global_step": 74218, "epoch": 1767} {"train_loss": -6.0971269607543945, "global_step": 74219, "epoch": 1767} {"train_loss": -6.1110124588012695, "global_step": 74220, "epoch": 1767} {"train_loss": -6.06907844543457, "global_step": 74221, "epoch": 1767} {"train_loss": -6.116762638092041, "global_step": 74222, "epoch": 1767} {"train_loss": -6.039955139160156, "global_step": 74223, "epoch": 1767} {"train_loss": -6.147051811218262, "global_step": 74224, "epoch": 1767} {"train_loss": -6.153514862060547, "global_step": 74225, "epoch": 1767} {"train_loss": -6.137507438659668, "global_step": 74226, "epoch": 1767} {"train_loss": -6.1405487060546875, "global_step": 74227, "epoch": 1767} {"train_loss": -6.151411056518555, "global_step": 74228, "epoch": 1767} {"train_loss": -6.098455429077148, "global_step": 74229, "epoch": 1767} {"train_loss": -6.204751014709473, "global_step": 74230, "epoch": 1767} {"train_loss": -6.041719913482666, "global_step": 74231, "epoch": 1767} {"train_loss": -6.02117919921875, "global_step": 74232, "epoch": 1767} {"train_loss": -5.963595390319824, "global_step": 74233, "epoch": 1767} {"train_loss": -5.996276378631592, "global_step": 74234, "epoch": 1767} {"train_loss": -6.105078220367432, "global_step": 74235, "epoch": 1767} {"train_loss": -6.127527236938477, "global_step": 74236, "epoch": 1767} {"train_loss": -6.076192855834961, "global_step": 74237, "epoch": 1767} {"train_loss": -6.0453996658325195, "global_step": 74238, "epoch": 1767} {"train_loss": -6.173532009124756, "global_step": 74239, "epoch": 1767} {"train_loss": -6.111656665802002, "global_step": 74240, "epoch": 1767} {"train_loss": -6.07725715637207, "global_step": 74241, "epoch": 1767} {"train_loss": -5.994021415710449, "global_step": 74242, "epoch": 1767} {"train_loss": -6.089357852935791, "global_step": 74243, "epoch": 1767} {"train_loss": -6.096646308898926, "global_step": 74244, "epoch": 1767} {"train_loss": -6.086282253265381, "global_step": 74245, "epoch": 1767} {"train_loss": -6.109809875488281, "global_step": 74246, "epoch": 1767} {"train_loss": -6.180226802825928, "global_step": 74247, "epoch": 1767} {"train_loss": -6.125977516174316, "global_step": 74248, "epoch": 1767} {"train_loss": -6.135936737060547, "global_step": 74249, "epoch": 1767} {"train_loss": -5.993974685668945, "global_step": 74250, "epoch": 1767} {"train_loss": -6.0949249267578125, "global_step": 74251, "epoch": 1767} {"train_loss": -6.048636436462402, "global_step": 74252, "epoch": 1767} {"train_loss": -6.146434783935547, "global_step": 74253, "epoch": 1767} {"train_loss": -6.0952863693237305, "global_step": 74254, "epoch": 1767} {"train_loss": -6.091499056134905, "global_step": 74255, "epoch": 1767, "val_loss": 61884.81640625} {"train_loss": -6.082148551940918, "global_step": 74256, "epoch": 1768} {"train_loss": -6.239530563354492, "global_step": 74257, "epoch": 1768} {"train_loss": -6.069057464599609, "global_step": 74258, "epoch": 1768} {"train_loss": -6.151256084442139, "global_step": 74259, "epoch": 1768} {"train_loss": -6.050440788269043, "global_step": 74260, "epoch": 1768} {"train_loss": -6.031911373138428, "global_step": 74261, "epoch": 1768} {"train_loss": -6.140604496002197, "global_step": 74262, "epoch": 1768} {"train_loss": -6.001175403594971, "global_step": 74263, "epoch": 1768} {"train_loss": -6.011828899383545, "global_step": 74264, "epoch": 1768} {"train_loss": -6.1458845138549805, "global_step": 74265, "epoch": 1768} {"train_loss": -6.066925525665283, "global_step": 74266, "epoch": 1768} {"train_loss": -6.076861381530762, "global_step": 74267, "epoch": 1768} {"train_loss": -6.1642632484436035, "global_step": 74268, "epoch": 1768} {"train_loss": -6.088902473449707, "global_step": 74269, "epoch": 1768} {"train_loss": -6.1859283447265625, "global_step": 74270, "epoch": 1768} {"train_loss": -6.085227012634277, "global_step": 74271, "epoch": 1768} {"train_loss": -6.003082275390625, "global_step": 74272, "epoch": 1768} {"train_loss": -6.04746150970459, "global_step": 74273, "epoch": 1768} {"train_loss": -6.079514503479004, "global_step": 74274, "epoch": 1768} {"train_loss": -6.073259353637695, "global_step": 74275, "epoch": 1768} {"train_loss": -6.148314476013184, "global_step": 74276, "epoch": 1768} {"train_loss": -6.032210826873779, "global_step": 74277, "epoch": 1768} {"train_loss": -6.103607654571533, "global_step": 74278, "epoch": 1768} {"train_loss": -5.85152530670166, "global_step": 74279, "epoch": 1768} {"train_loss": -6.072806358337402, "global_step": 74280, "epoch": 1768} {"train_loss": -5.958417892456055, "global_step": 74281, "epoch": 1768} {"train_loss": -5.959317207336426, "global_step": 74282, "epoch": 1768} {"train_loss": -6.121640205383301, "global_step": 74283, "epoch": 1768} {"train_loss": -5.966353416442871, "global_step": 74284, "epoch": 1768} {"train_loss": -6.064870834350586, "global_step": 74285, "epoch": 1768} {"train_loss": -6.0382466316223145, "global_step": 74286, "epoch": 1768} {"train_loss": -6.001792907714844, "global_step": 74287, "epoch": 1768} {"train_loss": -6.19792366027832, "global_step": 74288, "epoch": 1768} {"train_loss": -6.088278293609619, "global_step": 74289, "epoch": 1768} {"train_loss": -6.063873291015625, "global_step": 74290, "epoch": 1768} {"train_loss": -6.010034084320068, "global_step": 74291, "epoch": 1768} {"train_loss": -5.990696907043457, "global_step": 74292, "epoch": 1768} {"train_loss": -6.070590972900391, "global_step": 74293, "epoch": 1768} {"train_loss": -6.15494441986084, "global_step": 74294, "epoch": 1768} {"train_loss": -6.124286651611328, "global_step": 74295, "epoch": 1768} {"train_loss": -6.115328311920166, "global_step": 74296, "epoch": 1768} {"train_loss": -6.073285488855271, "global_step": 74297, "epoch": 1768, "val_loss": 61774.51953125} {"train_loss": -6.269105434417725, "global_step": 74298, "epoch": 1769} {"train_loss": -6.167873382568359, "global_step": 74299, "epoch": 1769} {"train_loss": -6.169953346252441, "global_step": 74300, "epoch": 1769} {"train_loss": -6.051980018615723, "global_step": 74301, "epoch": 1769} {"train_loss": -6.079804420471191, "global_step": 74302, "epoch": 1769} {"train_loss": -6.0676398277282715, "global_step": 74303, "epoch": 1769} {"train_loss": -6.156909465789795, "global_step": 74304, "epoch": 1769} {"train_loss": -6.146251678466797, "global_step": 74305, "epoch": 1769} {"train_loss": -5.890120029449463, "global_step": 74306, "epoch": 1769} {"train_loss": -6.114474296569824, "global_step": 74307, "epoch": 1769} {"train_loss": -6.096581935882568, "global_step": 74308, "epoch": 1769} {"train_loss": -5.981244087219238, "global_step": 74309, "epoch": 1769} {"train_loss": -5.979101181030273, "global_step": 74310, "epoch": 1769} {"train_loss": -6.164312362670898, "global_step": 74311, "epoch": 1769} {"train_loss": -6.06242036819458, "global_step": 74312, "epoch": 1769} {"train_loss": -6.020413398742676, "global_step": 74313, "epoch": 1769} {"train_loss": -6.017180442810059, "global_step": 74314, "epoch": 1769} {"train_loss": -5.889289855957031, "global_step": 74315, "epoch": 1769} {"train_loss": -5.993544101715088, "global_step": 74316, "epoch": 1769} {"train_loss": -6.115848541259766, "global_step": 74317, "epoch": 1769} {"train_loss": -5.98513650894165, "global_step": 74318, "epoch": 1769} {"train_loss": -6.075715065002441, "global_step": 74319, "epoch": 1769} {"train_loss": -6.085247039794922, "global_step": 74320, "epoch": 1769} {"train_loss": -6.060097694396973, "global_step": 74321, "epoch": 1769} {"train_loss": -6.224911689758301, "global_step": 74322, "epoch": 1769} {"train_loss": -6.074351787567139, "global_step": 74323, "epoch": 1769} {"train_loss": -6.094639778137207, "global_step": 74324, "epoch": 1769} {"train_loss": -6.1784868240356445, "global_step": 74325, "epoch": 1769} {"train_loss": -6.133066177368164, "global_step": 74326, "epoch": 1769} {"train_loss": -6.022910118103027, "global_step": 74327, "epoch": 1769} {"train_loss": -6.148143768310547, "global_step": 74328, "epoch": 1769} {"train_loss": -5.9937334060668945, "global_step": 74329, "epoch": 1769} {"train_loss": -6.079751014709473, "global_step": 74330, "epoch": 1769} {"train_loss": -6.006508827209473, "global_step": 74331, "epoch": 1769} {"train_loss": -6.056577205657959, "global_step": 74332, "epoch": 1769} {"train_loss": -6.081048965454102, "global_step": 74333, "epoch": 1769} {"train_loss": -5.924284934997559, "global_step": 74334, "epoch": 1769} {"train_loss": -6.105312347412109, "global_step": 74335, "epoch": 1769} {"train_loss": -6.045304298400879, "global_step": 74336, "epoch": 1769} {"train_loss": -6.101997375488281, "global_step": 74337, "epoch": 1769} {"train_loss": -6.009513854980469, "global_step": 74338, "epoch": 1769} {"train_loss": -6.072602362859817, "global_step": 74339, "epoch": 1769, "val_loss": 62022.640625} {"train_loss": -6.035248279571533, "global_step": 74340, "epoch": 1770} {"train_loss": -6.117345809936523, "global_step": 74341, "epoch": 1770} {"train_loss": -6.0550360679626465, "global_step": 74342, "epoch": 1770} {"train_loss": -6.032688140869141, "global_step": 74343, "epoch": 1770} {"train_loss": -6.058494567871094, "global_step": 74344, "epoch": 1770} {"train_loss": -6.096724510192871, "global_step": 74345, "epoch": 1770} {"train_loss": -6.1365966796875, "global_step": 74346, "epoch": 1770} {"train_loss": -6.176691055297852, "global_step": 74347, "epoch": 1770} {"train_loss": -6.043906211853027, "global_step": 74348, "epoch": 1770} {"train_loss": -6.086737632751465, "global_step": 74349, "epoch": 1770} {"train_loss": -6.065125465393066, "global_step": 74350, "epoch": 1770} {"train_loss": -6.068552017211914, "global_step": 74351, "epoch": 1770} {"train_loss": -6.022644996643066, "global_step": 74352, "epoch": 1770} {"train_loss": -6.145809173583984, "global_step": 74353, "epoch": 1770} {"train_loss": -6.12447452545166, "global_step": 74354, "epoch": 1770} {"train_loss": -5.932276248931885, "global_step": 74355, "epoch": 1770} {"train_loss": -6.197081565856934, "global_step": 74356, "epoch": 1770} {"train_loss": -6.039541244506836, "global_step": 74357, "epoch": 1770} {"train_loss": -6.089936256408691, "global_step": 74358, "epoch": 1770} {"train_loss": -6.10566520690918, "global_step": 74359, "epoch": 1770} {"train_loss": -6.085630893707275, "global_step": 74360, "epoch": 1770} {"train_loss": -6.094629287719727, "global_step": 74361, "epoch": 1770} {"train_loss": -5.992069244384766, "global_step": 74362, "epoch": 1770} {"train_loss": -6.055517196655273, "global_step": 74363, "epoch": 1770} {"train_loss": -6.075921058654785, "global_step": 74364, "epoch": 1770} {"train_loss": -6.042232513427734, "global_step": 74365, "epoch": 1770} {"train_loss": -6.208514213562012, "global_step": 74366, "epoch": 1770} {"train_loss": -6.0231547355651855, "global_step": 74367, "epoch": 1770} {"train_loss": -6.047608375549316, "global_step": 74368, "epoch": 1770} {"train_loss": -6.120117664337158, "global_step": 74369, "epoch": 1770} {"train_loss": -6.111292362213135, "global_step": 74370, "epoch": 1770} {"train_loss": -6.163805961608887, "global_step": 74371, "epoch": 1770} {"train_loss": -6.110068321228027, "global_step": 74372, "epoch": 1770} {"train_loss": -6.138765335083008, "global_step": 74373, "epoch": 1770} {"train_loss": -6.017668724060059, "global_step": 74374, "epoch": 1770} {"train_loss": -6.108451843261719, "global_step": 74375, "epoch": 1770} {"train_loss": -6.124939441680908, "global_step": 74376, "epoch": 1770} {"train_loss": -6.166299819946289, "global_step": 74377, "epoch": 1770} {"train_loss": -6.079219818115234, "global_step": 74378, "epoch": 1770} {"train_loss": -5.959028244018555, "global_step": 74379, "epoch": 1770} {"train_loss": -6.064690113067627, "global_step": 74380, "epoch": 1770} {"train_loss": -6.084610291889736, "global_step": 74381, "epoch": 1770, "val_loss": 62041.90625} {"train_loss": -6.09129524230957, "global_step": 74382, "epoch": 1771} {"train_loss": -6.065974712371826, "global_step": 74383, "epoch": 1771} {"train_loss": -5.973730564117432, "global_step": 74384, "epoch": 1771} {"train_loss": -6.085232734680176, "global_step": 74385, "epoch": 1771} {"train_loss": -6.012328147888184, "global_step": 74386, "epoch": 1771} {"train_loss": -6.062261581420898, "global_step": 74387, "epoch": 1771} {"train_loss": -6.047236442565918, "global_step": 74388, "epoch": 1771} {"train_loss": -6.067338466644287, "global_step": 74389, "epoch": 1771} {"train_loss": -6.06893253326416, "global_step": 74390, "epoch": 1771} {"train_loss": -6.154921531677246, "global_step": 74391, "epoch": 1771} {"train_loss": -6.071621894836426, "global_step": 74392, "epoch": 1771} {"train_loss": -6.099513530731201, "global_step": 74393, "epoch": 1771} {"train_loss": -6.115830421447754, "global_step": 74394, "epoch": 1771} {"train_loss": -5.980644226074219, "global_step": 74395, "epoch": 1771} {"train_loss": -6.1909332275390625, "global_step": 74396, "epoch": 1771} {"train_loss": -6.049545764923096, "global_step": 74397, "epoch": 1771} {"train_loss": -6.001156330108643, "global_step": 74398, "epoch": 1771} {"train_loss": -6.0488200187683105, "global_step": 74399, "epoch": 1771} {"train_loss": -6.098024368286133, "global_step": 74400, "epoch": 1771} {"train_loss": -6.095109939575195, "global_step": 74401, "epoch": 1771} {"train_loss": -5.9908342361450195, "global_step": 74402, "epoch": 1771} {"train_loss": -6.052238941192627, "global_step": 74403, "epoch": 1771} {"train_loss": -6.119139671325684, "global_step": 74404, "epoch": 1771} {"train_loss": -6.190464019775391, "global_step": 74405, "epoch": 1771} {"train_loss": -5.943514823913574, "global_step": 74406, "epoch": 1771} {"train_loss": -6.133499622344971, "global_step": 74407, "epoch": 1771} {"train_loss": -5.990598678588867, "global_step": 74408, "epoch": 1771} {"train_loss": -5.915862560272217, "global_step": 74409, "epoch": 1771} {"train_loss": -6.063124656677246, "global_step": 74410, "epoch": 1771} {"train_loss": -6.023411750793457, "global_step": 74411, "epoch": 1771} {"train_loss": -6.0919880867004395, "global_step": 74412, "epoch": 1771} {"train_loss": -6.026400566101074, "global_step": 74413, "epoch": 1771} {"train_loss": -6.072417259216309, "global_step": 74414, "epoch": 1771} {"train_loss": -5.961184978485107, "global_step": 74415, "epoch": 1771} {"train_loss": -6.002810478210449, "global_step": 74416, "epoch": 1771} {"train_loss": -6.136433124542236, "global_step": 74417, "epoch": 1771} {"train_loss": -6.069550514221191, "global_step": 74418, "epoch": 1771} {"train_loss": -5.969849586486816, "global_step": 74419, "epoch": 1771} {"train_loss": -6.003748416900635, "global_step": 74420, "epoch": 1771} {"train_loss": -6.058643341064453, "global_step": 74421, "epoch": 1771} {"train_loss": -6.033407688140869, "global_step": 74422, "epoch": 1771} {"train_loss": -6.052981581006732, "global_step": 74423, "epoch": 1771, "val_loss": 61767.5234375} {"train_loss": -6.130559921264648, "global_step": 74424, "epoch": 1772} {"train_loss": -6.134071350097656, "global_step": 74425, "epoch": 1772} {"train_loss": -6.067136764526367, "global_step": 74426, "epoch": 1772} {"train_loss": -6.100261688232422, "global_step": 74427, "epoch": 1772} {"train_loss": -5.956608772277832, "global_step": 74428, "epoch": 1772} {"train_loss": -6.118374824523926, "global_step": 74429, "epoch": 1772} {"train_loss": -6.0592145919799805, "global_step": 74430, "epoch": 1772} {"train_loss": -6.01805305480957, "global_step": 74431, "epoch": 1772} {"train_loss": -6.058414459228516, "global_step": 74432, "epoch": 1772} {"train_loss": -6.1172990798950195, "global_step": 74433, "epoch": 1772} {"train_loss": -6.087406158447266, "global_step": 74434, "epoch": 1772} {"train_loss": -6.163844108581543, "global_step": 74435, "epoch": 1772} {"train_loss": -6.045156002044678, "global_step": 74436, "epoch": 1772} {"train_loss": -6.014690399169922, "global_step": 74437, "epoch": 1772} {"train_loss": -6.120619773864746, "global_step": 74438, "epoch": 1772} {"train_loss": -6.123966217041016, "global_step": 74439, "epoch": 1772} {"train_loss": -6.0660600662231445, "global_step": 74440, "epoch": 1772} {"train_loss": -6.148751258850098, "global_step": 74441, "epoch": 1772} {"train_loss": -5.979964256286621, "global_step": 74442, "epoch": 1772} {"train_loss": -6.110073089599609, "global_step": 74443, "epoch": 1772} {"train_loss": -6.095316410064697, "global_step": 74444, "epoch": 1772} {"train_loss": -6.043826103210449, "global_step": 74445, "epoch": 1772} {"train_loss": -6.043160915374756, "global_step": 74446, "epoch": 1772} {"train_loss": -6.116626739501953, "global_step": 74447, "epoch": 1772} {"train_loss": -6.040775299072266, "global_step": 74448, "epoch": 1772} {"train_loss": -5.893119812011719, "global_step": 74449, "epoch": 1772} {"train_loss": -6.0792236328125, "global_step": 74450, "epoch": 1772} {"train_loss": -6.070237159729004, "global_step": 74451, "epoch": 1772} {"train_loss": -6.101972579956055, "global_step": 74452, "epoch": 1772} {"train_loss": -6.155346393585205, "global_step": 74453, "epoch": 1772} {"train_loss": -5.997905254364014, "global_step": 74454, "epoch": 1772} {"train_loss": -6.139693260192871, "global_step": 74455, "epoch": 1772} {"train_loss": -6.080223083496094, "global_step": 74456, "epoch": 1772} {"train_loss": -6.1279120445251465, "global_step": 74457, "epoch": 1772} {"train_loss": -6.15148401260376, "global_step": 74458, "epoch": 1772} {"train_loss": -6.053972244262695, "global_step": 74459, "epoch": 1772} {"train_loss": -6.011455535888672, "global_step": 74460, "epoch": 1772} {"train_loss": -6.124205589294434, "global_step": 74461, "epoch": 1772} {"train_loss": -6.16215705871582, "global_step": 74462, "epoch": 1772} {"train_loss": -6.2160491943359375, "global_step": 74463, "epoch": 1772} {"train_loss": -6.184082984924316, "global_step": 74464, "epoch": 1772} {"train_loss": -6.086408013389224, "global_step": 74465, "epoch": 1772, "val_loss": 61787.22265625} {"train_loss": -6.080648422241211, "global_step": 74466, "epoch": 1773} {"train_loss": -6.0383758544921875, "global_step": 74467, "epoch": 1773} {"train_loss": -6.196916103363037, "global_step": 74468, "epoch": 1773} {"train_loss": -6.094160079956055, "global_step": 74469, "epoch": 1773} {"train_loss": -5.978133201599121, "global_step": 74470, "epoch": 1773} {"train_loss": -6.151906967163086, "global_step": 74471, "epoch": 1773} {"train_loss": -6.1118903160095215, "global_step": 74472, "epoch": 1773} {"train_loss": -6.0385026931762695, "global_step": 74473, "epoch": 1773} {"train_loss": -6.066193580627441, "global_step": 74474, "epoch": 1773} {"train_loss": -6.119612693786621, "global_step": 74475, "epoch": 1773} {"train_loss": -6.121950149536133, "global_step": 74476, "epoch": 1773} {"train_loss": -6.085322856903076, "global_step": 74477, "epoch": 1773} {"train_loss": -6.169185638427734, "global_step": 74478, "epoch": 1773} {"train_loss": -6.087776184082031, "global_step": 74479, "epoch": 1773} {"train_loss": -5.986826419830322, "global_step": 74480, "epoch": 1773} {"train_loss": -6.075474739074707, "global_step": 74481, "epoch": 1773} {"train_loss": -6.054811954498291, "global_step": 74482, "epoch": 1773} {"train_loss": -5.966383457183838, "global_step": 74483, "epoch": 1773} {"train_loss": -6.098767280578613, "global_step": 74484, "epoch": 1773} {"train_loss": -6.0394134521484375, "global_step": 74485, "epoch": 1773} {"train_loss": -6.146974563598633, "global_step": 74486, "epoch": 1773} {"train_loss": -6.083051681518555, "global_step": 74487, "epoch": 1773} {"train_loss": -6.076936721801758, "global_step": 74488, "epoch": 1773} {"train_loss": -6.102346420288086, "global_step": 74489, "epoch": 1773} {"train_loss": -6.0132646560668945, "global_step": 74490, "epoch": 1773} {"train_loss": -6.018701553344727, "global_step": 74491, "epoch": 1773} {"train_loss": -6.100715637207031, "global_step": 74492, "epoch": 1773} {"train_loss": -6.212264537811279, "global_step": 74493, "epoch": 1773} {"train_loss": -6.107856750488281, "global_step": 74494, "epoch": 1773} {"train_loss": -6.043708324432373, "global_step": 74495, "epoch": 1773} {"train_loss": -6.120089530944824, "global_step": 74496, "epoch": 1773} {"train_loss": -6.195914268493652, "global_step": 74497, "epoch": 1773} {"train_loss": -6.274819850921631, "global_step": 74498, "epoch": 1773} {"train_loss": -6.126064300537109, "global_step": 74499, "epoch": 1773} {"train_loss": -6.10776424407959, "global_step": 74500, "epoch": 1773} {"train_loss": -6.056353569030762, "global_step": 74501, "epoch": 1773} {"train_loss": -6.134990692138672, "global_step": 74502, "epoch": 1773} {"train_loss": -6.033559799194336, "global_step": 74503, "epoch": 1773} {"train_loss": -6.2131242752075195, "global_step": 74504, "epoch": 1773} {"train_loss": -6.049934387207031, "global_step": 74505, "epoch": 1773} {"train_loss": -6.213295936584473, "global_step": 74506, "epoch": 1773} {"train_loss": -6.09909116654169, "global_step": 74507, "epoch": 1773, "val_loss": 62065.11328125} {"train_loss": -6.006648540496826, "global_step": 74508, "epoch": 1774} {"train_loss": -6.109763145446777, "global_step": 74509, "epoch": 1774} {"train_loss": -6.099822044372559, "global_step": 74510, "epoch": 1774} {"train_loss": -6.03916072845459, "global_step": 74511, "epoch": 1774} {"train_loss": -6.059699058532715, "global_step": 74512, "epoch": 1774} {"train_loss": -6.08748722076416, "global_step": 74513, "epoch": 1774} {"train_loss": -6.165833473205566, "global_step": 74514, "epoch": 1774} {"train_loss": -6.072964668273926, "global_step": 74515, "epoch": 1774} {"train_loss": -6.051939964294434, "global_step": 74516, "epoch": 1774} {"train_loss": -6.109955787658691, "global_step": 74517, "epoch": 1774} {"train_loss": -6.087876796722412, "global_step": 74518, "epoch": 1774} {"train_loss": -6.123612880706787, "global_step": 74519, "epoch": 1774} {"train_loss": -6.090909004211426, "global_step": 74520, "epoch": 1774} {"train_loss": -5.946468353271484, "global_step": 74521, "epoch": 1774} {"train_loss": -6.08085823059082, "global_step": 74522, "epoch": 1774} {"train_loss": -6.0425004959106445, "global_step": 74523, "epoch": 1774} {"train_loss": -6.075921535491943, "global_step": 74524, "epoch": 1774} {"train_loss": -6.1788177490234375, "global_step": 74525, "epoch": 1774} {"train_loss": -6.179294109344482, "global_step": 74526, "epoch": 1774} {"train_loss": -6.11200475692749, "global_step": 74527, "epoch": 1774} {"train_loss": -6.046902179718018, "global_step": 74528, "epoch": 1774} {"train_loss": -6.197493553161621, "global_step": 74529, "epoch": 1774} {"train_loss": -6.039556503295898, "global_step": 74530, "epoch": 1774} {"train_loss": -6.132755756378174, "global_step": 74531, "epoch": 1774} {"train_loss": -5.904008865356445, "global_step": 74532, "epoch": 1774} {"train_loss": -5.955965995788574, "global_step": 74533, "epoch": 1774} {"train_loss": -5.949292182922363, "global_step": 74534, "epoch": 1774} {"train_loss": -6.104793548583984, "global_step": 74535, "epoch": 1774} {"train_loss": -6.041792869567871, "global_step": 74536, "epoch": 1774} {"train_loss": -6.181734085083008, "global_step": 74537, "epoch": 1774} {"train_loss": -5.976175308227539, "global_step": 74538, "epoch": 1774} {"train_loss": -5.945000648498535, "global_step": 74539, "epoch": 1774} {"train_loss": -6.025308609008789, "global_step": 74540, "epoch": 1774} {"train_loss": -6.026541233062744, "global_step": 74541, "epoch": 1774} {"train_loss": -6.065525054931641, "global_step": 74542, "epoch": 1774} {"train_loss": -6.121028900146484, "global_step": 74543, "epoch": 1774} {"train_loss": -5.995053768157959, "global_step": 74544, "epoch": 1774} {"train_loss": -6.050796031951904, "global_step": 74545, "epoch": 1774} {"train_loss": -5.976565361022949, "global_step": 74546, "epoch": 1774} {"train_loss": -6.095478057861328, "global_step": 74547, "epoch": 1774} {"train_loss": -5.94046688079834, "global_step": 74548, "epoch": 1774} {"train_loss": -6.058793522062755, "global_step": 74549, "epoch": 1774, "val_loss": 62184.5625} {"train_loss": -6.02866268157959, "global_step": 74550, "epoch": 1775} {"train_loss": -6.029971599578857, "global_step": 74551, "epoch": 1775} {"train_loss": -6.091024398803711, "global_step": 74552, "epoch": 1775} {"train_loss": -5.953758239746094, "global_step": 74553, "epoch": 1775} {"train_loss": -6.164820671081543, "global_step": 74554, "epoch": 1775} {"train_loss": -6.024752616882324, "global_step": 74555, "epoch": 1775} {"train_loss": -6.091161251068115, "global_step": 74556, "epoch": 1775} {"train_loss": -6.131960868835449, "global_step": 74557, "epoch": 1775} {"train_loss": -5.929858207702637, "global_step": 74558, "epoch": 1775} {"train_loss": -6.087160110473633, "global_step": 74559, "epoch": 1775} {"train_loss": -6.161466598510742, "global_step": 74560, "epoch": 1775} {"train_loss": -6.022038459777832, "global_step": 74561, "epoch": 1775} {"train_loss": -5.99560022354126, "global_step": 74562, "epoch": 1775} {"train_loss": -6.044848442077637, "global_step": 74563, "epoch": 1775} {"train_loss": -5.976017951965332, "global_step": 74564, "epoch": 1775} {"train_loss": -6.054924964904785, "global_step": 74565, "epoch": 1775} {"train_loss": -6.128396987915039, "global_step": 74566, "epoch": 1775} {"train_loss": -6.130215167999268, "global_step": 74567, "epoch": 1775} {"train_loss": -5.902829647064209, "global_step": 74568, "epoch": 1775} {"train_loss": -6.110752582550049, "global_step": 74569, "epoch": 1775} {"train_loss": -6.055300712585449, "global_step": 74570, "epoch": 1775} {"train_loss": -6.062767505645752, "global_step": 74571, "epoch": 1775} {"train_loss": -6.116335868835449, "global_step": 74572, "epoch": 1775} {"train_loss": -6.123561382293701, "global_step": 74573, "epoch": 1775} {"train_loss": -6.142526626586914, "global_step": 74574, "epoch": 1775} {"train_loss": -6.166400909423828, "global_step": 74575, "epoch": 1775} {"train_loss": -6.059156894683838, "global_step": 74576, "epoch": 1775} {"train_loss": -6.103330612182617, "global_step": 74577, "epoch": 1775} {"train_loss": -6.0350446701049805, "global_step": 74578, "epoch": 1775} {"train_loss": -6.071341514587402, "global_step": 74579, "epoch": 1775} {"train_loss": -6.048747539520264, "global_step": 74580, "epoch": 1775} {"train_loss": -6.057738304138184, "global_step": 74581, "epoch": 1775} {"train_loss": -6.125269889831543, "global_step": 74582, "epoch": 1775} {"train_loss": -6.1356611251831055, "global_step": 74583, "epoch": 1775} {"train_loss": -6.162028789520264, "global_step": 74584, "epoch": 1775} {"train_loss": -6.115177631378174, "global_step": 74585, "epoch": 1775} {"train_loss": -6.190566539764404, "global_step": 74586, "epoch": 1775} {"train_loss": -5.983034133911133, "global_step": 74587, "epoch": 1775} {"train_loss": -6.103075981140137, "global_step": 74588, "epoch": 1775} {"train_loss": -6.00200080871582, "global_step": 74589, "epoch": 1775} {"train_loss": -5.997503280639648, "global_step": 74590, "epoch": 1775} {"train_loss": -6.0698117188044955, "global_step": 74591, "epoch": 1775, "val_loss": 61908.14453125} {"train_loss": -6.072864055633545, "global_step": 74592, "epoch": 1776} {"train_loss": -6.030210971832275, "global_step": 74593, "epoch": 1776} {"train_loss": -6.042782783508301, "global_step": 74594, "epoch": 1776} {"train_loss": -6.0715789794921875, "global_step": 74595, "epoch": 1776} {"train_loss": -6.042741298675537, "global_step": 74596, "epoch": 1776} {"train_loss": -6.160105228424072, "global_step": 74597, "epoch": 1776} {"train_loss": -6.149342060089111, "global_step": 74598, "epoch": 1776} {"train_loss": -5.96364688873291, "global_step": 74599, "epoch": 1776} {"train_loss": -6.138664245605469, "global_step": 74600, "epoch": 1776} {"train_loss": -6.1796979904174805, "global_step": 74601, "epoch": 1776} {"train_loss": -6.084173202514648, "global_step": 74602, "epoch": 1776} {"train_loss": -6.061592102050781, "global_step": 74603, "epoch": 1776} {"train_loss": -6.138387680053711, "global_step": 74604, "epoch": 1776} {"train_loss": -6.138611316680908, "global_step": 74605, "epoch": 1776} {"train_loss": -6.136751174926758, "global_step": 74606, "epoch": 1776} {"train_loss": -6.119078636169434, "global_step": 74607, "epoch": 1776} {"train_loss": -6.122445106506348, "global_step": 74608, "epoch": 1776} {"train_loss": -6.104001998901367, "global_step": 74609, "epoch": 1776} {"train_loss": -6.073355197906494, "global_step": 74610, "epoch": 1776} {"train_loss": -6.070444107055664, "global_step": 74611, "epoch": 1776} {"train_loss": -6.112313270568848, "global_step": 74612, "epoch": 1776} {"train_loss": -6.065825462341309, "global_step": 74613, "epoch": 1776} {"train_loss": -6.1706390380859375, "global_step": 74614, "epoch": 1776} {"train_loss": -6.009517669677734, "global_step": 74615, "epoch": 1776} {"train_loss": -6.104381084442139, "global_step": 74616, "epoch": 1776} {"train_loss": -6.1916375160217285, "global_step": 74617, "epoch": 1776} {"train_loss": -5.985328674316406, "global_step": 74618, "epoch": 1776} {"train_loss": -6.267332077026367, "global_step": 74619, "epoch": 1776} {"train_loss": -6.22938871383667, "global_step": 74620, "epoch": 1776} {"train_loss": -6.278387069702148, "global_step": 74621, "epoch": 1776} {"train_loss": -5.933877944946289, "global_step": 74622, "epoch": 1776} {"train_loss": -6.107741355895996, "global_step": 74623, "epoch": 1776} {"train_loss": -6.0809831619262695, "global_step": 74624, "epoch": 1776} {"train_loss": -6.047122001647949, "global_step": 74625, "epoch": 1776} {"train_loss": -6.106122970581055, "global_step": 74626, "epoch": 1776} {"train_loss": -6.044576644897461, "global_step": 74627, "epoch": 1776} {"train_loss": -6.04231595993042, "global_step": 74628, "epoch": 1776} {"train_loss": -5.878996849060059, "global_step": 74629, "epoch": 1776} {"train_loss": -5.9518141746521, "global_step": 74630, "epoch": 1776} {"train_loss": -5.787044048309326, "global_step": 74631, "epoch": 1776} {"train_loss": -6.00400447845459, "global_step": 74632, "epoch": 1776} {"train_loss": -6.078501349403744, "global_step": 74633, "epoch": 1776, "val_loss": 61998.1953125} {"train_loss": -6.1222243309021, "global_step": 74634, "epoch": 1777} {"train_loss": -6.194300651550293, "global_step": 74635, "epoch": 1777} {"train_loss": -6.067910194396973, "global_step": 74636, "epoch": 1777} {"train_loss": -6.126678466796875, "global_step": 74637, "epoch": 1777} {"train_loss": -6.113404273986816, "global_step": 74638, "epoch": 1777} {"train_loss": -6.0330047607421875, "global_step": 74639, "epoch": 1777} {"train_loss": -6.0918660163879395, "global_step": 74640, "epoch": 1777} {"train_loss": -6.091164588928223, "global_step": 74641, "epoch": 1777} {"train_loss": -6.0308661460876465, "global_step": 74642, "epoch": 1777} {"train_loss": -6.305574893951416, "global_step": 74643, "epoch": 1777} {"train_loss": -6.082717418670654, "global_step": 74644, "epoch": 1777} {"train_loss": -6.156858444213867, "global_step": 74645, "epoch": 1777} {"train_loss": -6.269804000854492, "global_step": 74646, "epoch": 1777} {"train_loss": -6.042261123657227, "global_step": 74647, "epoch": 1777} {"train_loss": -6.083959102630615, "global_step": 74648, "epoch": 1777} {"train_loss": -6.0620880126953125, "global_step": 74649, "epoch": 1777} {"train_loss": -6.078160285949707, "global_step": 74650, "epoch": 1777} {"train_loss": -6.060988903045654, "global_step": 74651, "epoch": 1777} {"train_loss": -6.037322044372559, "global_step": 74652, "epoch": 1777} {"train_loss": -6.024257183074951, "global_step": 74653, "epoch": 1777} {"train_loss": -6.061149597167969, "global_step": 74654, "epoch": 1777} {"train_loss": -6.04498815536499, "global_step": 74655, "epoch": 1777} {"train_loss": -6.026034355163574, "global_step": 74656, "epoch": 1777} {"train_loss": -6.074615478515625, "global_step": 74657, "epoch": 1777} {"train_loss": -5.991127014160156, "global_step": 74658, "epoch": 1777} {"train_loss": -6.0290679931640625, "global_step": 74659, "epoch": 1777} {"train_loss": -6.005154132843018, "global_step": 74660, "epoch": 1777} {"train_loss": -5.987193584442139, "global_step": 74661, "epoch": 1777} {"train_loss": -6.03262996673584, "global_step": 74662, "epoch": 1777} {"train_loss": -5.920679569244385, "global_step": 74663, "epoch": 1777} {"train_loss": -6.034584045410156, "global_step": 74664, "epoch": 1777} {"train_loss": -6.102573394775391, "global_step": 74665, "epoch": 1777} {"train_loss": -6.130526542663574, "global_step": 74666, "epoch": 1777} {"train_loss": -6.116926193237305, "global_step": 74667, "epoch": 1777} {"train_loss": -6.013991832733154, "global_step": 74668, "epoch": 1777} {"train_loss": -6.037551403045654, "global_step": 74669, "epoch": 1777} {"train_loss": -6.031350135803223, "global_step": 74670, "epoch": 1777} {"train_loss": -6.10638427734375, "global_step": 74671, "epoch": 1777} {"train_loss": -6.194060325622559, "global_step": 74672, "epoch": 1777} {"train_loss": -5.980720520019531, "global_step": 74673, "epoch": 1777} {"train_loss": -6.136083602905273, "global_step": 74674, "epoch": 1777} {"train_loss": -6.076375620705741, "global_step": 74675, "epoch": 1777, "val_loss": 61929.98046875} {"train_loss": -6.033209323883057, "global_step": 74676, "epoch": 1778} {"train_loss": -6.1033735275268555, "global_step": 74677, "epoch": 1778} {"train_loss": -6.012594223022461, "global_step": 74678, "epoch": 1778} {"train_loss": -6.132465362548828, "global_step": 74679, "epoch": 1778} {"train_loss": -6.053699493408203, "global_step": 74680, "epoch": 1778} {"train_loss": -6.044088363647461, "global_step": 74681, "epoch": 1778} {"train_loss": -6.008201599121094, "global_step": 74682, "epoch": 1778} {"train_loss": -6.111635208129883, "global_step": 74683, "epoch": 1778} {"train_loss": -6.0237884521484375, "global_step": 74684, "epoch": 1778} {"train_loss": -6.006246566772461, "global_step": 74685, "epoch": 1778} {"train_loss": -6.033027172088623, "global_step": 74686, "epoch": 1778} {"train_loss": -6.030652046203613, "global_step": 74687, "epoch": 1778} {"train_loss": -6.055023193359375, "global_step": 74688, "epoch": 1778} {"train_loss": -6.0760087966918945, "global_step": 74689, "epoch": 1778} {"train_loss": -6.086373805999756, "global_step": 74690, "epoch": 1778} {"train_loss": -6.105353832244873, "global_step": 74691, "epoch": 1778} {"train_loss": -6.065914630889893, "global_step": 74692, "epoch": 1778} {"train_loss": -6.065873622894287, "global_step": 74693, "epoch": 1778} {"train_loss": -6.162449836730957, "global_step": 74694, "epoch": 1778} {"train_loss": -6.115018844604492, "global_step": 74695, "epoch": 1778} {"train_loss": -6.165829658508301, "global_step": 74696, "epoch": 1778} {"train_loss": -6.085656642913818, "global_step": 74697, "epoch": 1778} {"train_loss": -6.030374050140381, "global_step": 74698, "epoch": 1778} {"train_loss": -6.075555324554443, "global_step": 74699, "epoch": 1778} {"train_loss": -6.036004066467285, "global_step": 74700, "epoch": 1778} {"train_loss": -5.995547294616699, "global_step": 74701, "epoch": 1778} {"train_loss": -6.102548599243164, "global_step": 74702, "epoch": 1778} {"train_loss": -6.074150085449219, "global_step": 74703, "epoch": 1778} {"train_loss": -6.115335464477539, "global_step": 74704, "epoch": 1778} {"train_loss": -6.037199020385742, "global_step": 74705, "epoch": 1778} {"train_loss": -6.119288444519043, "global_step": 74706, "epoch": 1778} {"train_loss": -6.002313613891602, "global_step": 74707, "epoch": 1778} {"train_loss": -6.131875991821289, "global_step": 74708, "epoch": 1778} {"train_loss": -6.087993144989014, "global_step": 74709, "epoch": 1778} {"train_loss": -6.189727783203125, "global_step": 74710, "epoch": 1778} {"train_loss": -6.104206085205078, "global_step": 74711, "epoch": 1778} {"train_loss": -6.094347953796387, "global_step": 74712, "epoch": 1778} {"train_loss": -6.110851287841797, "global_step": 74713, "epoch": 1778} {"train_loss": -6.252286911010742, "global_step": 74714, "epoch": 1778} {"train_loss": -6.03194522857666, "global_step": 74715, "epoch": 1778} {"train_loss": -6.142367362976074, "global_step": 74716, "epoch": 1778} {"train_loss": -6.080094553175426, "global_step": 74717, "epoch": 1778, "val_loss": 61765.50390625} {"train_loss": -6.067714691162109, "global_step": 74718, "epoch": 1779} {"train_loss": -6.130217552185059, "global_step": 74719, "epoch": 1779} {"train_loss": -6.063694953918457, "global_step": 74720, "epoch": 1779} {"train_loss": -6.098324775695801, "global_step": 74721, "epoch": 1779} {"train_loss": -6.076347351074219, "global_step": 74722, "epoch": 1779} {"train_loss": -6.169844150543213, "global_step": 74723, "epoch": 1779} {"train_loss": -6.023561477661133, "global_step": 74724, "epoch": 1779} {"train_loss": -6.059028148651123, "global_step": 74725, "epoch": 1779} {"train_loss": -6.223094940185547, "global_step": 74726, "epoch": 1779} {"train_loss": -6.101263046264648, "global_step": 74727, "epoch": 1779} {"train_loss": -6.065894603729248, "global_step": 74728, "epoch": 1779} {"train_loss": -6.245532512664795, "global_step": 74729, "epoch": 1779} {"train_loss": -6.0575103759765625, "global_step": 74730, "epoch": 1779} {"train_loss": -6.110879898071289, "global_step": 74731, "epoch": 1779} {"train_loss": -6.126514434814453, "global_step": 74732, "epoch": 1779} {"train_loss": -6.091955184936523, "global_step": 74733, "epoch": 1779} {"train_loss": -6.064606189727783, "global_step": 74734, "epoch": 1779} {"train_loss": -6.1655073165893555, "global_step": 74735, "epoch": 1779} {"train_loss": -6.000158786773682, "global_step": 74736, "epoch": 1779} {"train_loss": -6.033573150634766, "global_step": 74737, "epoch": 1779} {"train_loss": -6.0246171951293945, "global_step": 74738, "epoch": 1779} {"train_loss": -6.0601630210876465, "global_step": 74739, "epoch": 1779} {"train_loss": -5.990301609039307, "global_step": 74740, "epoch": 1779} {"train_loss": -6.113216400146484, "global_step": 74741, "epoch": 1779} {"train_loss": -5.979938507080078, "global_step": 74742, "epoch": 1779} {"train_loss": -6.088626384735107, "global_step": 74743, "epoch": 1779} {"train_loss": -6.05401611328125, "global_step": 74744, "epoch": 1779} {"train_loss": -6.045557975769043, "global_step": 74745, "epoch": 1779} {"train_loss": -6.033209800720215, "global_step": 74746, "epoch": 1779} {"train_loss": -5.962380886077881, "global_step": 74747, "epoch": 1779} {"train_loss": -6.116871356964111, "global_step": 74748, "epoch": 1779} {"train_loss": -6.036782741546631, "global_step": 74749, "epoch": 1779} {"train_loss": -5.952147006988525, "global_step": 74750, "epoch": 1779} {"train_loss": -6.067608833312988, "global_step": 74751, "epoch": 1779} {"train_loss": -6.064302444458008, "global_step": 74752, "epoch": 1779} {"train_loss": -5.937586307525635, "global_step": 74753, "epoch": 1779} {"train_loss": -5.959893703460693, "global_step": 74754, "epoch": 1779} {"train_loss": -6.033815383911133, "global_step": 74755, "epoch": 1779} {"train_loss": -6.155007362365723, "global_step": 74756, "epoch": 1779} {"train_loss": -5.980985641479492, "global_step": 74757, "epoch": 1779} {"train_loss": -6.15617561340332, "global_step": 74758, "epoch": 1779} {"train_loss": -6.064108678272793, "global_step": 74759, "epoch": 1779, "val_loss": 61802.1796875} {"train_loss": -6.057392597198486, "global_step": 74760, "epoch": 1780} {"train_loss": -6.102712631225586, "global_step": 74761, "epoch": 1780} {"train_loss": -6.0997161865234375, "global_step": 74762, "epoch": 1780} {"train_loss": -6.121757507324219, "global_step": 74763, "epoch": 1780} {"train_loss": -6.049252510070801, "global_step": 74764, "epoch": 1780} {"train_loss": -6.0623579025268555, "global_step": 74765, "epoch": 1780} {"train_loss": -6.008772373199463, "global_step": 74766, "epoch": 1780} {"train_loss": -6.087640762329102, "global_step": 74767, "epoch": 1780} {"train_loss": -6.1257853507995605, "global_step": 74768, "epoch": 1780} {"train_loss": -6.089259147644043, "global_step": 74769, "epoch": 1780} {"train_loss": -6.0676798820495605, "global_step": 74770, "epoch": 1780} {"train_loss": -6.04203987121582, "global_step": 74771, "epoch": 1780} {"train_loss": -6.068840503692627, "global_step": 74772, "epoch": 1780} {"train_loss": -6.13968563079834, "global_step": 74773, "epoch": 1780} {"train_loss": -6.123719215393066, "global_step": 74774, "epoch": 1780} {"train_loss": -6.11092472076416, "global_step": 74775, "epoch": 1780} {"train_loss": -6.220240592956543, "global_step": 74776, "epoch": 1780} {"train_loss": -6.0778608322143555, "global_step": 74777, "epoch": 1780} {"train_loss": -5.91855001449585, "global_step": 74778, "epoch": 1780} {"train_loss": -6.110568523406982, "global_step": 74779, "epoch": 1780} {"train_loss": -5.963296890258789, "global_step": 74780, "epoch": 1780} {"train_loss": -6.033621311187744, "global_step": 74781, "epoch": 1780} {"train_loss": -6.034080505371094, "global_step": 74782, "epoch": 1780} {"train_loss": -6.0334320068359375, "global_step": 74783, "epoch": 1780} {"train_loss": -6.08989143371582, "global_step": 74784, "epoch": 1780} {"train_loss": -6.120419979095459, "global_step": 74785, "epoch": 1780} {"train_loss": -6.070470333099365, "global_step": 74786, "epoch": 1780} {"train_loss": -6.085104942321777, "global_step": 74787, "epoch": 1780} {"train_loss": -6.1406049728393555, "global_step": 74788, "epoch": 1780} {"train_loss": -6.179823875427246, "global_step": 74789, "epoch": 1780} {"train_loss": -6.078341484069824, "global_step": 74790, "epoch": 1780} {"train_loss": -6.167276382446289, "global_step": 74791, "epoch": 1780} {"train_loss": -6.141544342041016, "global_step": 74792, "epoch": 1780} {"train_loss": -6.069390296936035, "global_step": 74793, "epoch": 1780} {"train_loss": -6.113224983215332, "global_step": 74794, "epoch": 1780} {"train_loss": -6.027028560638428, "global_step": 74795, "epoch": 1780} {"train_loss": -6.083096504211426, "global_step": 74796, "epoch": 1780} {"train_loss": -6.132152557373047, "global_step": 74797, "epoch": 1780} {"train_loss": -6.168646335601807, "global_step": 74798, "epoch": 1780} {"train_loss": -6.133976936340332, "global_step": 74799, "epoch": 1780} {"train_loss": -6.031220436096191, "global_step": 74800, "epoch": 1780} {"train_loss": -6.086087465286255, "global_step": 74801, "epoch": 1780, "val_loss": 61815.58984375} {"train_loss": -6.135035037994385, "global_step": 74802, "epoch": 1781} {"train_loss": -6.036170959472656, "global_step": 74803, "epoch": 1781} {"train_loss": -6.021742343902588, "global_step": 74804, "epoch": 1781} {"train_loss": -6.099865913391113, "global_step": 74805, "epoch": 1781} {"train_loss": -6.124950885772705, "global_step": 74806, "epoch": 1781} {"train_loss": -6.013689994812012, "global_step": 74807, "epoch": 1781} {"train_loss": -6.056234359741211, "global_step": 74808, "epoch": 1781} {"train_loss": -5.966591835021973, "global_step": 74809, "epoch": 1781} {"train_loss": -6.037600517272949, "global_step": 74810, "epoch": 1781} {"train_loss": -6.107813835144043, "global_step": 74811, "epoch": 1781} {"train_loss": -5.965285301208496, "global_step": 74812, "epoch": 1781} {"train_loss": -6.054063320159912, "global_step": 74813, "epoch": 1781} {"train_loss": -6.080795764923096, "global_step": 74814, "epoch": 1781} {"train_loss": -6.009498596191406, "global_step": 74815, "epoch": 1781} {"train_loss": -6.04479455947876, "global_step": 74816, "epoch": 1781} {"train_loss": -6.067242622375488, "global_step": 74817, "epoch": 1781} {"train_loss": -6.017576694488525, "global_step": 74818, "epoch": 1781} {"train_loss": -6.144285678863525, "global_step": 74819, "epoch": 1781} {"train_loss": -6.111906051635742, "global_step": 74820, "epoch": 1781} {"train_loss": -6.052177429199219, "global_step": 74821, "epoch": 1781} {"train_loss": -6.089237213134766, "global_step": 74822, "epoch": 1781} {"train_loss": -6.121776103973389, "global_step": 74823, "epoch": 1781} {"train_loss": -6.059484481811523, "global_step": 74824, "epoch": 1781} {"train_loss": -5.966651916503906, "global_step": 74825, "epoch": 1781} {"train_loss": -6.053186893463135, "global_step": 74826, "epoch": 1781} {"train_loss": -6.051235675811768, "global_step": 74827, "epoch": 1781} {"train_loss": -5.939070701599121, "global_step": 74828, "epoch": 1781} {"train_loss": -5.923576354980469, "global_step": 74829, "epoch": 1781} {"train_loss": -6.037132263183594, "global_step": 74830, "epoch": 1781} {"train_loss": -6.079720497131348, "global_step": 74831, "epoch": 1781} {"train_loss": -6.02311372756958, "global_step": 74832, "epoch": 1781} {"train_loss": -6.059976577758789, "global_step": 74833, "epoch": 1781} {"train_loss": -6.009799003601074, "global_step": 74834, "epoch": 1781} {"train_loss": -6.065831184387207, "global_step": 74835, "epoch": 1781} {"train_loss": -6.124056339263916, "global_step": 74836, "epoch": 1781} {"train_loss": -6.005209922790527, "global_step": 74837, "epoch": 1781} {"train_loss": -6.086822509765625, "global_step": 74838, "epoch": 1781} {"train_loss": -6.186460494995117, "global_step": 74839, "epoch": 1781} {"train_loss": -6.067839622497559, "global_step": 74840, "epoch": 1781} {"train_loss": -6.0027689933776855, "global_step": 74841, "epoch": 1781} {"train_loss": -6.0760345458984375, "global_step": 74842, "epoch": 1781} {"train_loss": -6.052832705633981, "global_step": 74843, "epoch": 1781, "val_loss": 61666.07421875} {"train_loss": -6.0056257247924805, "global_step": 74844, "epoch": 1782} {"train_loss": -6.071502685546875, "global_step": 74845, "epoch": 1782} {"train_loss": -6.113523483276367, "global_step": 74846, "epoch": 1782} {"train_loss": -6.051523208618164, "global_step": 74847, "epoch": 1782} {"train_loss": -6.155237674713135, "global_step": 74848, "epoch": 1782} {"train_loss": -6.204148769378662, "global_step": 74849, "epoch": 1782} {"train_loss": -6.080265998840332, "global_step": 74850, "epoch": 1782} {"train_loss": -6.03382682800293, "global_step": 74851, "epoch": 1782} {"train_loss": -6.119002342224121, "global_step": 74852, "epoch": 1782} {"train_loss": -6.027705192565918, "global_step": 74853, "epoch": 1782} {"train_loss": -6.00008487701416, "global_step": 74854, "epoch": 1782} {"train_loss": -6.128657817840576, "global_step": 74855, "epoch": 1782} {"train_loss": -5.908168792724609, "global_step": 74856, "epoch": 1782} {"train_loss": -6.241321563720703, "global_step": 74857, "epoch": 1782} {"train_loss": -5.954473972320557, "global_step": 74858, "epoch": 1782} {"train_loss": -5.970599174499512, "global_step": 74859, "epoch": 1782} {"train_loss": -6.100088119506836, "global_step": 74860, "epoch": 1782} {"train_loss": -6.027148723602295, "global_step": 74861, "epoch": 1782} {"train_loss": -5.9938507080078125, "global_step": 74862, "epoch": 1782} {"train_loss": -6.000695705413818, "global_step": 74863, "epoch": 1782} {"train_loss": -6.118213653564453, "global_step": 74864, "epoch": 1782} {"train_loss": -6.053534507751465, "global_step": 74865, "epoch": 1782} {"train_loss": -6.158051490783691, "global_step": 74866, "epoch": 1782} {"train_loss": -6.010424613952637, "global_step": 74867, "epoch": 1782} {"train_loss": -6.0092058181762695, "global_step": 74868, "epoch": 1782} {"train_loss": -6.025623321533203, "global_step": 74869, "epoch": 1782} {"train_loss": -6.063721656799316, "global_step": 74870, "epoch": 1782} {"train_loss": -6.051386833190918, "global_step": 74871, "epoch": 1782} {"train_loss": -6.006413459777832, "global_step": 74872, "epoch": 1782} {"train_loss": -5.999000549316406, "global_step": 74873, "epoch": 1782} {"train_loss": -6.201015472412109, "global_step": 74874, "epoch": 1782} {"train_loss": -6.056238174438477, "global_step": 74875, "epoch": 1782} {"train_loss": -6.064468860626221, "global_step": 74876, "epoch": 1782} {"train_loss": -6.125533103942871, "global_step": 74877, "epoch": 1782} {"train_loss": -6.100091934204102, "global_step": 74878, "epoch": 1782} {"train_loss": -6.085044860839844, "global_step": 74879, "epoch": 1782} {"train_loss": -6.017283916473389, "global_step": 74880, "epoch": 1782} {"train_loss": -6.004541873931885, "global_step": 74881, "epoch": 1782} {"train_loss": -6.077620506286621, "global_step": 74882, "epoch": 1782} {"train_loss": -6.118870735168457, "global_step": 74883, "epoch": 1782} {"train_loss": -6.0101213455200195, "global_step": 74884, "epoch": 1782} {"train_loss": -6.064547936121623, "global_step": 74885, "epoch": 1782, "val_loss": 62029.59765625} {"train_loss": -6.013230323791504, "global_step": 74886, "epoch": 1783} {"train_loss": -6.092254638671875, "global_step": 74887, "epoch": 1783} {"train_loss": -6.183503150939941, "global_step": 74888, "epoch": 1783} {"train_loss": -6.141856670379639, "global_step": 74889, "epoch": 1783} {"train_loss": -6.014354705810547, "global_step": 74890, "epoch": 1783} {"train_loss": -6.051196098327637, "global_step": 74891, "epoch": 1783} {"train_loss": -6.100647449493408, "global_step": 74892, "epoch": 1783} {"train_loss": -6.097414970397949, "global_step": 74893, "epoch": 1783} {"train_loss": -6.0480194091796875, "global_step": 74894, "epoch": 1783} {"train_loss": -5.934047698974609, "global_step": 74895, "epoch": 1783} {"train_loss": -5.992815971374512, "global_step": 74896, "epoch": 1783} {"train_loss": -6.053049087524414, "global_step": 74897, "epoch": 1783} {"train_loss": -6.054344177246094, "global_step": 74898, "epoch": 1783} {"train_loss": -6.132540702819824, "global_step": 74899, "epoch": 1783} {"train_loss": -5.990853309631348, "global_step": 74900, "epoch": 1783} {"train_loss": -5.9519195556640625, "global_step": 74901, "epoch": 1783} {"train_loss": -6.165682792663574, "global_step": 74902, "epoch": 1783} {"train_loss": -5.916287899017334, "global_step": 74903, "epoch": 1783} {"train_loss": -5.937624931335449, "global_step": 74904, "epoch": 1783} {"train_loss": -6.088246822357178, "global_step": 74905, "epoch": 1783} {"train_loss": -6.041375160217285, "global_step": 74906, "epoch": 1783} {"train_loss": -6.033568859100342, "global_step": 74907, "epoch": 1783} {"train_loss": -6.117832183837891, "global_step": 74908, "epoch": 1783} {"train_loss": -6.08049201965332, "global_step": 74909, "epoch": 1783} {"train_loss": -6.078182697296143, "global_step": 74910, "epoch": 1783} {"train_loss": -6.168013095855713, "global_step": 74911, "epoch": 1783} {"train_loss": -6.134095668792725, "global_step": 74912, "epoch": 1783} {"train_loss": -6.010604381561279, "global_step": 74913, "epoch": 1783} {"train_loss": -6.059546947479248, "global_step": 74914, "epoch": 1783} {"train_loss": -6.203524589538574, "global_step": 74915, "epoch": 1783} {"train_loss": -6.140013217926025, "global_step": 74916, "epoch": 1783} {"train_loss": -6.124186038970947, "global_step": 74917, "epoch": 1783} {"train_loss": -6.103821754455566, "global_step": 74918, "epoch": 1783} {"train_loss": -6.134504795074463, "global_step": 74919, "epoch": 1783} {"train_loss": -6.192754745483398, "global_step": 74920, "epoch": 1783} {"train_loss": -6.148637771606445, "global_step": 74921, "epoch": 1783} {"train_loss": -6.06119966506958, "global_step": 74922, "epoch": 1783} {"train_loss": -6.090333938598633, "global_step": 74923, "epoch": 1783} {"train_loss": -6.13704776763916, "global_step": 74924, "epoch": 1783} {"train_loss": -6.107761383056641, "global_step": 74925, "epoch": 1783} {"train_loss": -6.191651344299316, "global_step": 74926, "epoch": 1783} {"train_loss": -6.080186117263067, "global_step": 74927, "epoch": 1783, "val_loss": 61999.37109375} {"train_loss": -6.096548080444336, "global_step": 74928, "epoch": 1784} {"train_loss": -6.154999732971191, "global_step": 74929, "epoch": 1784} {"train_loss": -6.0703630447387695, "global_step": 74930, "epoch": 1784} {"train_loss": -6.046045303344727, "global_step": 74931, "epoch": 1784} {"train_loss": -6.028541088104248, "global_step": 74932, "epoch": 1784} {"train_loss": -6.067378044128418, "global_step": 74933, "epoch": 1784} {"train_loss": -6.013381004333496, "global_step": 74934, "epoch": 1784} {"train_loss": -6.200259685516357, "global_step": 74935, "epoch": 1784} {"train_loss": -5.904430866241455, "global_step": 74936, "epoch": 1784} {"train_loss": -6.095800399780273, "global_step": 74937, "epoch": 1784} {"train_loss": -6.019386291503906, "global_step": 74938, "epoch": 1784} {"train_loss": -6.0746636390686035, "global_step": 74939, "epoch": 1784} {"train_loss": -5.992774963378906, "global_step": 74940, "epoch": 1784} {"train_loss": -6.046290397644043, "global_step": 74941, "epoch": 1784} {"train_loss": -6.1864190101623535, "global_step": 74942, "epoch": 1784} {"train_loss": -6.163495063781738, "global_step": 74943, "epoch": 1784} {"train_loss": -6.0226335525512695, "global_step": 74944, "epoch": 1784} {"train_loss": -6.077169418334961, "global_step": 74945, "epoch": 1784} {"train_loss": -6.053661346435547, "global_step": 74946, "epoch": 1784} {"train_loss": -6.173178195953369, "global_step": 74947, "epoch": 1784} {"train_loss": -6.153617858886719, "global_step": 74948, "epoch": 1784} {"train_loss": -6.187843322753906, "global_step": 74949, "epoch": 1784} {"train_loss": -6.097928047180176, "global_step": 74950, "epoch": 1784} {"train_loss": -6.131921768188477, "global_step": 74951, "epoch": 1784} {"train_loss": -6.019562721252441, "global_step": 74952, "epoch": 1784} {"train_loss": -6.097752571105957, "global_step": 74953, "epoch": 1784} {"train_loss": -5.998096942901611, "global_step": 74954, "epoch": 1784} {"train_loss": -5.966582775115967, "global_step": 74955, "epoch": 1784} {"train_loss": -6.072522163391113, "global_step": 74956, "epoch": 1784} {"train_loss": -6.157755374908447, "global_step": 74957, "epoch": 1784} {"train_loss": -6.063220977783203, "global_step": 74958, "epoch": 1784} {"train_loss": -6.242999076843262, "global_step": 74959, "epoch": 1784} {"train_loss": -5.923000335693359, "global_step": 74960, "epoch": 1784} {"train_loss": -6.0101213455200195, "global_step": 74961, "epoch": 1784} {"train_loss": -6.091923713684082, "global_step": 74962, "epoch": 1784} {"train_loss": -6.009068489074707, "global_step": 74963, "epoch": 1784} {"train_loss": -6.1051836013793945, "global_step": 74964, "epoch": 1784} {"train_loss": -6.055978775024414, "global_step": 74965, "epoch": 1784} {"train_loss": -6.0418548583984375, "global_step": 74966, "epoch": 1784} {"train_loss": -6.017794609069824, "global_step": 74967, "epoch": 1784} {"train_loss": -5.93474006652832, "global_step": 74968, "epoch": 1784} {"train_loss": -6.069949036552792, "global_step": 74969, "epoch": 1784, "val_loss": 62049.59375} {"train_loss": -6.022926330566406, "global_step": 74970, "epoch": 1785} {"train_loss": -5.978265762329102, "global_step": 74971, "epoch": 1785} {"train_loss": -6.087995529174805, "global_step": 74972, "epoch": 1785} {"train_loss": -6.079421520233154, "global_step": 74973, "epoch": 1785} {"train_loss": -6.1200971603393555, "global_step": 74974, "epoch": 1785} {"train_loss": -6.125531196594238, "global_step": 74975, "epoch": 1785} {"train_loss": -6.026583194732666, "global_step": 74976, "epoch": 1785} {"train_loss": -6.201718330383301, "global_step": 74977, "epoch": 1785} {"train_loss": -5.975426197052002, "global_step": 74978, "epoch": 1785} {"train_loss": -6.124736785888672, "global_step": 74979, "epoch": 1785} {"train_loss": -6.080437660217285, "global_step": 74980, "epoch": 1785} {"train_loss": -6.035167694091797, "global_step": 74981, "epoch": 1785} {"train_loss": -6.1785454750061035, "global_step": 74982, "epoch": 1785} {"train_loss": -6.149957656860352, "global_step": 74983, "epoch": 1785} {"train_loss": -6.000001430511475, "global_step": 74984, "epoch": 1785} {"train_loss": -6.052772045135498, "global_step": 74985, "epoch": 1785} {"train_loss": -6.147312164306641, "global_step": 74986, "epoch": 1785} {"train_loss": -6.177377700805664, "global_step": 74987, "epoch": 1785} {"train_loss": -6.02718448638916, "global_step": 74988, "epoch": 1785} {"train_loss": -6.223150253295898, "global_step": 74989, "epoch": 1785} {"train_loss": -6.031525611877441, "global_step": 74990, "epoch": 1785} {"train_loss": -6.158934116363525, "global_step": 74991, "epoch": 1785} {"train_loss": -6.1002607345581055, "global_step": 74992, "epoch": 1785} {"train_loss": -6.104081630706787, "global_step": 74993, "epoch": 1785} {"train_loss": -6.164652347564697, "global_step": 74994, "epoch": 1785} {"train_loss": -6.199095249176025, "global_step": 74995, "epoch": 1785} {"train_loss": -6.168337345123291, "global_step": 74996, "epoch": 1785} {"train_loss": -6.1775994300842285, "global_step": 74997, "epoch": 1785} {"train_loss": -6.100218296051025, "global_step": 74998, "epoch": 1785} {"train_loss": -6.052533149719238, "global_step": 74999, "epoch": 1785} {"train_loss": -6.156128406524658, "global_step": 75000, "epoch": 1785} {"train_loss": -6.0940093994140625, "global_step": 75001, "epoch": 1785} {"train_loss": -6.056780815124512, "global_step": 75002, "epoch": 1785} {"train_loss": -6.2027106285095215, "global_step": 75003, "epoch": 1785} {"train_loss": -5.900991439819336, "global_step": 75004, "epoch": 1785} {"train_loss": -6.040122985839844, "global_step": 75005, "epoch": 1785} {"train_loss": -6.081464767456055, "global_step": 75006, "epoch": 1785} {"train_loss": -6.010167121887207, "global_step": 75007, "epoch": 1785} {"train_loss": -5.9268059730529785, "global_step": 75008, "epoch": 1785} {"train_loss": -5.97426700592041, "global_step": 75009, "epoch": 1785} {"train_loss": -6.093300819396973, "global_step": 75010, "epoch": 1785} {"train_loss": -6.089519489379156, "global_step": 75011, "epoch": 1785, "val_loss": 62040.41015625} {"train_loss": -6.109297752380371, "global_step": 75012, "epoch": 1786} {"train_loss": -6.183419227600098, "global_step": 75013, "epoch": 1786} {"train_loss": -5.967171669006348, "global_step": 75014, "epoch": 1786} {"train_loss": -6.12457275390625, "global_step": 75015, "epoch": 1786} {"train_loss": -6.008687496185303, "global_step": 75016, "epoch": 1786} {"train_loss": -6.161873817443848, "global_step": 75017, "epoch": 1786} {"train_loss": -6.129590034484863, "global_step": 75018, "epoch": 1786} {"train_loss": -6.094013214111328, "global_step": 75019, "epoch": 1786} {"train_loss": -6.179914474487305, "global_step": 75020, "epoch": 1786} {"train_loss": -6.098759174346924, "global_step": 75021, "epoch": 1786} {"train_loss": -6.16562557220459, "global_step": 75022, "epoch": 1786} {"train_loss": -6.198158264160156, "global_step": 75023, "epoch": 1786} {"train_loss": -6.1787109375, "global_step": 75024, "epoch": 1786} {"train_loss": -6.125200271606445, "global_step": 75025, "epoch": 1786} {"train_loss": -6.131669998168945, "global_step": 75026, "epoch": 1786} {"train_loss": -6.187279224395752, "global_step": 75027, "epoch": 1786} {"train_loss": -6.1344685554504395, "global_step": 75028, "epoch": 1786} {"train_loss": -6.0605268478393555, "global_step": 75029, "epoch": 1786} {"train_loss": -6.129336357116699, "global_step": 75030, "epoch": 1786} {"train_loss": -6.1229963302612305, "global_step": 75031, "epoch": 1786} {"train_loss": -6.046274185180664, "global_step": 75032, "epoch": 1786} {"train_loss": -6.200326919555664, "global_step": 75033, "epoch": 1786} {"train_loss": -6.236454963684082, "global_step": 75034, "epoch": 1786} {"train_loss": -6.099646091461182, "global_step": 75035, "epoch": 1786} {"train_loss": -6.189597129821777, "global_step": 75036, "epoch": 1786} {"train_loss": -6.080591678619385, "global_step": 75037, "epoch": 1786} {"train_loss": -6.044921398162842, "global_step": 75038, "epoch": 1786} {"train_loss": -6.12326717376709, "global_step": 75039, "epoch": 1786} {"train_loss": -6.202101707458496, "global_step": 75040, "epoch": 1786} {"train_loss": -6.1092424392700195, "global_step": 75041, "epoch": 1786} {"train_loss": -6.087869644165039, "global_step": 75042, "epoch": 1786} {"train_loss": -6.089061260223389, "global_step": 75043, "epoch": 1786} {"train_loss": -6.107449054718018, "global_step": 75044, "epoch": 1786} {"train_loss": -6.072452545166016, "global_step": 75045, "epoch": 1786} {"train_loss": -6.01224422454834, "global_step": 75046, "epoch": 1786} {"train_loss": -6.185008525848389, "global_step": 75047, "epoch": 1786} {"train_loss": -5.963537216186523, "global_step": 75048, "epoch": 1786} {"train_loss": -6.078248023986816, "global_step": 75049, "epoch": 1786} {"train_loss": -6.021320819854736, "global_step": 75050, "epoch": 1786} {"train_loss": -5.998485088348389, "global_step": 75051, "epoch": 1786} {"train_loss": -6.0861921310424805, "global_step": 75052, "epoch": 1786} {"train_loss": -6.110985699154082, "global_step": 75053, "epoch": 1786, "val_loss": 62075.6640625} {"train_loss": -6.068429470062256, "global_step": 75054, "epoch": 1787} {"train_loss": -6.125205993652344, "global_step": 75055, "epoch": 1787} {"train_loss": -6.156335830688477, "global_step": 75056, "epoch": 1787} {"train_loss": -6.031850814819336, "global_step": 75057, "epoch": 1787} {"train_loss": -6.071222305297852, "global_step": 75058, "epoch": 1787} {"train_loss": -5.9906005859375, "global_step": 75059, "epoch": 1787} {"train_loss": -6.188482284545898, "global_step": 75060, "epoch": 1787} {"train_loss": -6.099423885345459, "global_step": 75061, "epoch": 1787} {"train_loss": -6.000072479248047, "global_step": 75062, "epoch": 1787} {"train_loss": -6.087469577789307, "global_step": 75063, "epoch": 1787} {"train_loss": -6.189411640167236, "global_step": 75064, "epoch": 1787} {"train_loss": -6.032415866851807, "global_step": 75065, "epoch": 1787} {"train_loss": -6.115681171417236, "global_step": 75066, "epoch": 1787} {"train_loss": -6.032559871673584, "global_step": 75067, "epoch": 1787} {"train_loss": -6.082596778869629, "global_step": 75068, "epoch": 1787} {"train_loss": -6.038297653198242, "global_step": 75069, "epoch": 1787} {"train_loss": -6.085366249084473, "global_step": 75070, "epoch": 1787} {"train_loss": -6.100157737731934, "global_step": 75071, "epoch": 1787} {"train_loss": -6.0593767166137695, "global_step": 75072, "epoch": 1787} {"train_loss": -6.120060920715332, "global_step": 75073, "epoch": 1787} {"train_loss": -6.06112813949585, "global_step": 75074, "epoch": 1787} {"train_loss": -6.080541610717773, "global_step": 75075, "epoch": 1787} {"train_loss": -6.207278251647949, "global_step": 75076, "epoch": 1787} {"train_loss": -6.184478759765625, "global_step": 75077, "epoch": 1787} {"train_loss": -6.14618444442749, "global_step": 75078, "epoch": 1787} {"train_loss": -6.088405609130859, "global_step": 75079, "epoch": 1787} {"train_loss": -5.976415634155273, "global_step": 75080, "epoch": 1787} {"train_loss": -6.149103164672852, "global_step": 75081, "epoch": 1787} {"train_loss": -6.12899112701416, "global_step": 75082, "epoch": 1787} {"train_loss": -6.092806816101074, "global_step": 75083, "epoch": 1787} {"train_loss": -6.1147308349609375, "global_step": 75084, "epoch": 1787} {"train_loss": -6.075203895568848, "global_step": 75085, "epoch": 1787} {"train_loss": -6.126956939697266, "global_step": 75086, "epoch": 1787} {"train_loss": -6.111091613769531, "global_step": 75087, "epoch": 1787} {"train_loss": -6.056778907775879, "global_step": 75088, "epoch": 1787} {"train_loss": -6.11263370513916, "global_step": 75089, "epoch": 1787} {"train_loss": -6.0429792404174805, "global_step": 75090, "epoch": 1787} {"train_loss": -6.260095596313477, "global_step": 75091, "epoch": 1787} {"train_loss": -6.0563435554504395, "global_step": 75092, "epoch": 1787} {"train_loss": -6.170888900756836, "global_step": 75093, "epoch": 1787} {"train_loss": -6.085905075073242, "global_step": 75094, "epoch": 1787} {"train_loss": -6.0968361014411565, "global_step": 75095, "epoch": 1787, "val_loss": 62040.38671875} {"train_loss": -6.107160568237305, "global_step": 75096, "epoch": 1788} {"train_loss": -6.0618181228637695, "global_step": 75097, "epoch": 1788} {"train_loss": -6.116819381713867, "global_step": 75098, "epoch": 1788} {"train_loss": -6.117159366607666, "global_step": 75099, "epoch": 1788} {"train_loss": -6.192287445068359, "global_step": 75100, "epoch": 1788} {"train_loss": -6.117396354675293, "global_step": 75101, "epoch": 1788} {"train_loss": -5.908443450927734, "global_step": 75102, "epoch": 1788} {"train_loss": -6.201298713684082, "global_step": 75103, "epoch": 1788} {"train_loss": -6.105950832366943, "global_step": 75104, "epoch": 1788} {"train_loss": -6.219211101531982, "global_step": 75105, "epoch": 1788} {"train_loss": -6.026704788208008, "global_step": 75106, "epoch": 1788} {"train_loss": -6.04814338684082, "global_step": 75107, "epoch": 1788} {"train_loss": -6.1704254150390625, "global_step": 75108, "epoch": 1788} {"train_loss": -6.102167129516602, "global_step": 75109, "epoch": 1788} {"train_loss": -6.104022026062012, "global_step": 75110, "epoch": 1788} {"train_loss": -6.109918594360352, "global_step": 75111, "epoch": 1788} {"train_loss": -5.987853527069092, "global_step": 75112, "epoch": 1788} {"train_loss": -6.0792236328125, "global_step": 75113, "epoch": 1788} {"train_loss": -6.121504783630371, "global_step": 75114, "epoch": 1788} {"train_loss": -6.055478096008301, "global_step": 75115, "epoch": 1788} {"train_loss": -6.041681289672852, "global_step": 75116, "epoch": 1788} {"train_loss": -6.182060241699219, "global_step": 75117, "epoch": 1788} {"train_loss": -6.031481742858887, "global_step": 75118, "epoch": 1788} {"train_loss": -6.085257530212402, "global_step": 75119, "epoch": 1788} {"train_loss": -6.075893402099609, "global_step": 75120, "epoch": 1788} {"train_loss": -6.053650856018066, "global_step": 75121, "epoch": 1788} {"train_loss": -6.12980318069458, "global_step": 75122, "epoch": 1788} {"train_loss": -6.256582260131836, "global_step": 75123, "epoch": 1788} {"train_loss": -6.071080207824707, "global_step": 75124, "epoch": 1788} {"train_loss": -6.116015911102295, "global_step": 75125, "epoch": 1788} {"train_loss": -6.1453351974487305, "global_step": 75126, "epoch": 1788} {"train_loss": -6.0506415367126465, "global_step": 75127, "epoch": 1788} {"train_loss": -6.188060760498047, "global_step": 75128, "epoch": 1788} {"train_loss": -6.050899505615234, "global_step": 75129, "epoch": 1788} {"train_loss": -6.047659397125244, "global_step": 75130, "epoch": 1788} {"train_loss": -6.011727333068848, "global_step": 75131, "epoch": 1788} {"train_loss": -6.103915214538574, "global_step": 75132, "epoch": 1788} {"train_loss": -6.1721110343933105, "global_step": 75133, "epoch": 1788} {"train_loss": -6.090414047241211, "global_step": 75134, "epoch": 1788} {"train_loss": -6.08197021484375, "global_step": 75135, "epoch": 1788} {"train_loss": -6.030328750610352, "global_step": 75136, "epoch": 1788} {"train_loss": -6.095517623992193, "global_step": 75137, "epoch": 1788, "val_loss": 61865.859375} {"train_loss": -6.039853096008301, "global_step": 75138, "epoch": 1789} {"train_loss": -6.168340682983398, "global_step": 75139, "epoch": 1789} {"train_loss": -6.164485931396484, "global_step": 75140, "epoch": 1789} {"train_loss": -6.190891265869141, "global_step": 75141, "epoch": 1789} {"train_loss": -6.050553798675537, "global_step": 75142, "epoch": 1789} {"train_loss": -6.017287731170654, "global_step": 75143, "epoch": 1789} {"train_loss": -6.057868957519531, "global_step": 75144, "epoch": 1789} {"train_loss": -5.9841790199279785, "global_step": 75145, "epoch": 1789} {"train_loss": -6.121338367462158, "global_step": 75146, "epoch": 1789} {"train_loss": -5.935421943664551, "global_step": 75147, "epoch": 1789} {"train_loss": -6.100748062133789, "global_step": 75148, "epoch": 1789} {"train_loss": -6.0171709060668945, "global_step": 75149, "epoch": 1789} {"train_loss": -6.085614204406738, "global_step": 75150, "epoch": 1789} {"train_loss": -6.049171447753906, "global_step": 75151, "epoch": 1789} {"train_loss": -6.003298282623291, "global_step": 75152, "epoch": 1789} {"train_loss": -6.076907634735107, "global_step": 75153, "epoch": 1789} {"train_loss": -6.125680923461914, "global_step": 75154, "epoch": 1789} {"train_loss": -6.015557289123535, "global_step": 75155, "epoch": 1789} {"train_loss": -6.105011463165283, "global_step": 75156, "epoch": 1789} {"train_loss": -6.153903007507324, "global_step": 75157, "epoch": 1789} {"train_loss": -6.025444030761719, "global_step": 75158, "epoch": 1789} {"train_loss": -6.086811065673828, "global_step": 75159, "epoch": 1789} {"train_loss": -6.108327865600586, "global_step": 75160, "epoch": 1789} {"train_loss": -6.11578893661499, "global_step": 75161, "epoch": 1789} {"train_loss": -6.078368186950684, "global_step": 75162, "epoch": 1789} {"train_loss": -6.168708801269531, "global_step": 75163, "epoch": 1789} {"train_loss": -6.167226791381836, "global_step": 75164, "epoch": 1789} {"train_loss": -6.11690616607666, "global_step": 75165, "epoch": 1789} {"train_loss": -6.071001052856445, "global_step": 75166, "epoch": 1789} {"train_loss": -6.050787925720215, "global_step": 75167, "epoch": 1789} {"train_loss": -6.10694694519043, "global_step": 75168, "epoch": 1789} {"train_loss": -6.11052131652832, "global_step": 75169, "epoch": 1789} {"train_loss": -6.1705217361450195, "global_step": 75170, "epoch": 1789} {"train_loss": -6.080497741699219, "global_step": 75171, "epoch": 1789} {"train_loss": -6.099489688873291, "global_step": 75172, "epoch": 1789} {"train_loss": -6.114445209503174, "global_step": 75173, "epoch": 1789} {"train_loss": -6.211126327514648, "global_step": 75174, "epoch": 1789} {"train_loss": -6.173884391784668, "global_step": 75175, "epoch": 1789} {"train_loss": -6.091446876525879, "global_step": 75176, "epoch": 1789} {"train_loss": -6.251218795776367, "global_step": 75177, "epoch": 1789} {"train_loss": -6.153902053833008, "global_step": 75178, "epoch": 1789} {"train_loss": -6.097359203156971, "global_step": 75179, "epoch": 1789, "val_loss": 62180.84765625} {"train_loss": -6.144170761108398, "global_step": 75180, "epoch": 1790} {"train_loss": -6.032130241394043, "global_step": 75181, "epoch": 1790} {"train_loss": -6.146507263183594, "global_step": 75182, "epoch": 1790} {"train_loss": -6.067582130432129, "global_step": 75183, "epoch": 1790} {"train_loss": -5.991710662841797, "global_step": 75184, "epoch": 1790} {"train_loss": -6.191766738891602, "global_step": 75185, "epoch": 1790} {"train_loss": -6.1309099197387695, "global_step": 75186, "epoch": 1790} {"train_loss": -6.140137672424316, "global_step": 75187, "epoch": 1790} {"train_loss": -6.022065162658691, "global_step": 75188, "epoch": 1790} {"train_loss": -6.077634811401367, "global_step": 75189, "epoch": 1790} {"train_loss": -6.098518371582031, "global_step": 75190, "epoch": 1790} {"train_loss": -6.105316638946533, "global_step": 75191, "epoch": 1790} {"train_loss": -6.182681083679199, "global_step": 75192, "epoch": 1790} {"train_loss": -6.094621658325195, "global_step": 75193, "epoch": 1790} {"train_loss": -6.136130332946777, "global_step": 75194, "epoch": 1790} {"train_loss": -6.078503131866455, "global_step": 75195, "epoch": 1790} {"train_loss": -6.098667621612549, "global_step": 75196, "epoch": 1790} {"train_loss": -6.089017868041992, "global_step": 75197, "epoch": 1790} {"train_loss": -6.154519081115723, "global_step": 75198, "epoch": 1790} {"train_loss": -6.184803009033203, "global_step": 75199, "epoch": 1790} {"train_loss": -6.010187149047852, "global_step": 75200, "epoch": 1790} {"train_loss": -6.064489841461182, "global_step": 75201, "epoch": 1790} {"train_loss": -6.08870792388916, "global_step": 75202, "epoch": 1790} {"train_loss": -6.1019287109375, "global_step": 75203, "epoch": 1790} {"train_loss": -6.090432167053223, "global_step": 75204, "epoch": 1790} {"train_loss": -6.006108283996582, "global_step": 75205, "epoch": 1790} {"train_loss": -6.080534934997559, "global_step": 75206, "epoch": 1790} {"train_loss": -6.089634895324707, "global_step": 75207, "epoch": 1790} {"train_loss": -6.012685775756836, "global_step": 75208, "epoch": 1790} {"train_loss": -6.100305080413818, "global_step": 75209, "epoch": 1790} {"train_loss": -6.16896915435791, "global_step": 75210, "epoch": 1790} {"train_loss": -6.034910202026367, "global_step": 75211, "epoch": 1790} {"train_loss": -6.052588939666748, "global_step": 75212, "epoch": 1790} {"train_loss": -6.0568742752075195, "global_step": 75213, "epoch": 1790} {"train_loss": -5.987239837646484, "global_step": 75214, "epoch": 1790} {"train_loss": -6.128162384033203, "global_step": 75215, "epoch": 1790} {"train_loss": -6.019972801208496, "global_step": 75216, "epoch": 1790} {"train_loss": -6.084467887878418, "global_step": 75217, "epoch": 1790} {"train_loss": -6.0550432205200195, "global_step": 75218, "epoch": 1790} {"train_loss": -6.203634262084961, "global_step": 75219, "epoch": 1790} {"train_loss": -6.006343364715576, "global_step": 75220, "epoch": 1790} {"train_loss": -6.08854543595087, "global_step": 75221, "epoch": 1790, "val_loss": 62134.1875} {"train_loss": -6.078067779541016, "global_step": 75222, "epoch": 1791} {"train_loss": -6.107719898223877, "global_step": 75223, "epoch": 1791} {"train_loss": -6.053244113922119, "global_step": 75224, "epoch": 1791} {"train_loss": -6.1092376708984375, "global_step": 75225, "epoch": 1791} {"train_loss": -6.070913314819336, "global_step": 75226, "epoch": 1791} {"train_loss": -6.1874775886535645, "global_step": 75227, "epoch": 1791} {"train_loss": -6.07655143737793, "global_step": 75228, "epoch": 1791} {"train_loss": -6.142063617706299, "global_step": 75229, "epoch": 1791} {"train_loss": -6.20211124420166, "global_step": 75230, "epoch": 1791} {"train_loss": -6.061205863952637, "global_step": 75231, "epoch": 1791} {"train_loss": -6.163800239562988, "global_step": 75232, "epoch": 1791} {"train_loss": -6.133569717407227, "global_step": 75233, "epoch": 1791} {"train_loss": -6.108564376831055, "global_step": 75234, "epoch": 1791} {"train_loss": -5.9482526779174805, "global_step": 75235, "epoch": 1791} {"train_loss": -6.068423748016357, "global_step": 75236, "epoch": 1791} {"train_loss": -5.970748424530029, "global_step": 75237, "epoch": 1791} {"train_loss": -6.210392951965332, "global_step": 75238, "epoch": 1791} {"train_loss": -6.109391212463379, "global_step": 75239, "epoch": 1791} {"train_loss": -6.156189918518066, "global_step": 75240, "epoch": 1791} {"train_loss": -6.12191104888916, "global_step": 75241, "epoch": 1791} {"train_loss": -6.1047139167785645, "global_step": 75242, "epoch": 1791} {"train_loss": -6.07427978515625, "global_step": 75243, "epoch": 1791} {"train_loss": -6.085488796234131, "global_step": 75244, "epoch": 1791} {"train_loss": -6.036719799041748, "global_step": 75245, "epoch": 1791} {"train_loss": -6.027905464172363, "global_step": 75246, "epoch": 1791} {"train_loss": -5.98991584777832, "global_step": 75247, "epoch": 1791} {"train_loss": -6.084177017211914, "global_step": 75248, "epoch": 1791} {"train_loss": -6.0789594650268555, "global_step": 75249, "epoch": 1791} {"train_loss": -5.975076198577881, "global_step": 75250, "epoch": 1791} {"train_loss": -6.080004692077637, "global_step": 75251, "epoch": 1791} {"train_loss": -5.9684529304504395, "global_step": 75252, "epoch": 1791} {"train_loss": -6.122415065765381, "global_step": 75253, "epoch": 1791} {"train_loss": -5.997235298156738, "global_step": 75254, "epoch": 1791} {"train_loss": -6.019284248352051, "global_step": 75255, "epoch": 1791} {"train_loss": -6.024446487426758, "global_step": 75256, "epoch": 1791} {"train_loss": -6.095035552978516, "global_step": 75257, "epoch": 1791} {"train_loss": -6.112407684326172, "global_step": 75258, "epoch": 1791} {"train_loss": -6.04957389831543, "global_step": 75259, "epoch": 1791} {"train_loss": -6.066994667053223, "global_step": 75260, "epoch": 1791} {"train_loss": -6.064614772796631, "global_step": 75261, "epoch": 1791} {"train_loss": -6.0792951583862305, "global_step": 75262, "epoch": 1791} {"train_loss": -6.076091868536813, "global_step": 75263, "epoch": 1791, "val_loss": 62007.97265625} {"train_loss": -6.027221202850342, "global_step": 75264, "epoch": 1792} {"train_loss": -6.153486251831055, "global_step": 75265, "epoch": 1792} {"train_loss": -6.109851837158203, "global_step": 75266, "epoch": 1792} {"train_loss": -6.0395097732543945, "global_step": 75267, "epoch": 1792} {"train_loss": -6.104216575622559, "global_step": 75268, "epoch": 1792} {"train_loss": -6.031852722167969, "global_step": 75269, "epoch": 1792} {"train_loss": -5.986266613006592, "global_step": 75270, "epoch": 1792} {"train_loss": -6.090057373046875, "global_step": 75271, "epoch": 1792} {"train_loss": -6.009966850280762, "global_step": 75272, "epoch": 1792} {"train_loss": -6.089786529541016, "global_step": 75273, "epoch": 1792} {"train_loss": -6.070817947387695, "global_step": 75274, "epoch": 1792} {"train_loss": -6.092856407165527, "global_step": 75275, "epoch": 1792} {"train_loss": -6.1255927085876465, "global_step": 75276, "epoch": 1792} {"train_loss": -6.016519546508789, "global_step": 75277, "epoch": 1792} {"train_loss": -6.136386394500732, "global_step": 75278, "epoch": 1792} {"train_loss": -6.029972553253174, "global_step": 75279, "epoch": 1792} {"train_loss": -6.015480041503906, "global_step": 75280, "epoch": 1792} {"train_loss": -6.032829761505127, "global_step": 75281, "epoch": 1792} {"train_loss": -6.0276384353637695, "global_step": 75282, "epoch": 1792} {"train_loss": -6.051609992980957, "global_step": 75283, "epoch": 1792} {"train_loss": -6.059515953063965, "global_step": 75284, "epoch": 1792} {"train_loss": -6.1122941970825195, "global_step": 75285, "epoch": 1792} {"train_loss": -6.031499862670898, "global_step": 75286, "epoch": 1792} {"train_loss": -6.1137495040893555, "global_step": 75287, "epoch": 1792} {"train_loss": -6.068172454833984, "global_step": 75288, "epoch": 1792} {"train_loss": -6.111671447753906, "global_step": 75289, "epoch": 1792} {"train_loss": -5.927207946777344, "global_step": 75290, "epoch": 1792} {"train_loss": -6.089778900146484, "global_step": 75291, "epoch": 1792} {"train_loss": -6.011531829833984, "global_step": 75292, "epoch": 1792} {"train_loss": -6.042145729064941, "global_step": 75293, "epoch": 1792} {"train_loss": -6.019126892089844, "global_step": 75294, "epoch": 1792} {"train_loss": -6.059985637664795, "global_step": 75295, "epoch": 1792} {"train_loss": -6.069286346435547, "global_step": 75296, "epoch": 1792} {"train_loss": -6.119692325592041, "global_step": 75297, "epoch": 1792} {"train_loss": -6.011068820953369, "global_step": 75298, "epoch": 1792} {"train_loss": -5.971000671386719, "global_step": 75299, "epoch": 1792} {"train_loss": -6.036818504333496, "global_step": 75300, "epoch": 1792} {"train_loss": -6.0903639793396, "global_step": 75301, "epoch": 1792} {"train_loss": -6.033495903015137, "global_step": 75302, "epoch": 1792} {"train_loss": -6.039730072021484, "global_step": 75303, "epoch": 1792} {"train_loss": -6.04066276550293, "global_step": 75304, "epoch": 1792} {"train_loss": -6.0553472609747026, "global_step": 75305, "epoch": 1792, "val_loss": 62134.04296875} {"train_loss": -6.170902252197266, "global_step": 75306, "epoch": 1793} {"train_loss": -6.022366523742676, "global_step": 75307, "epoch": 1793} {"train_loss": -6.02476692199707, "global_step": 75308, "epoch": 1793} {"train_loss": -6.092914581298828, "global_step": 75309, "epoch": 1793} {"train_loss": -5.969593048095703, "global_step": 75310, "epoch": 1793} {"train_loss": -6.016602516174316, "global_step": 75311, "epoch": 1793} {"train_loss": -6.108494758605957, "global_step": 75312, "epoch": 1793} {"train_loss": -5.987555027008057, "global_step": 75313, "epoch": 1793} {"train_loss": -6.071346282958984, "global_step": 75314, "epoch": 1793} {"train_loss": -5.944203853607178, "global_step": 75315, "epoch": 1793} {"train_loss": -6.093896865844727, "global_step": 75316, "epoch": 1793} {"train_loss": -5.981402397155762, "global_step": 75317, "epoch": 1793} {"train_loss": -6.149645805358887, "global_step": 75318, "epoch": 1793} {"train_loss": -6.088977336883545, "global_step": 75319, "epoch": 1793} {"train_loss": -6.076244354248047, "global_step": 75320, "epoch": 1793} {"train_loss": -5.960597038269043, "global_step": 75321, "epoch": 1793} {"train_loss": -5.923760890960693, "global_step": 75322, "epoch": 1793} {"train_loss": -6.0891594886779785, "global_step": 75323, "epoch": 1793} {"train_loss": -6.047889709472656, "global_step": 75324, "epoch": 1793} {"train_loss": -6.0224609375, "global_step": 75325, "epoch": 1793} {"train_loss": -5.955410480499268, "global_step": 75326, "epoch": 1793} {"train_loss": -6.0319743156433105, "global_step": 75327, "epoch": 1793} {"train_loss": -6.01589822769165, "global_step": 75328, "epoch": 1793} {"train_loss": -5.931766986846924, "global_step": 75329, "epoch": 1793} {"train_loss": -6.1241044998168945, "global_step": 75330, "epoch": 1793} {"train_loss": -5.999561309814453, "global_step": 75331, "epoch": 1793} {"train_loss": -6.050783157348633, "global_step": 75332, "epoch": 1793} {"train_loss": -6.106870174407959, "global_step": 75333, "epoch": 1793} {"train_loss": -6.0604119300842285, "global_step": 75334, "epoch": 1793} {"train_loss": -6.104032516479492, "global_step": 75335, "epoch": 1793} {"train_loss": -6.056843280792236, "global_step": 75336, "epoch": 1793} {"train_loss": -5.953762531280518, "global_step": 75337, "epoch": 1793} {"train_loss": -5.911223888397217, "global_step": 75338, "epoch": 1793} {"train_loss": -6.056393623352051, "global_step": 75339, "epoch": 1793} {"train_loss": -5.91333532333374, "global_step": 75340, "epoch": 1793} {"train_loss": -6.076332092285156, "global_step": 75341, "epoch": 1793} {"train_loss": -6.227567672729492, "global_step": 75342, "epoch": 1793} {"train_loss": -6.02366828918457, "global_step": 75343, "epoch": 1793} {"train_loss": -6.004764556884766, "global_step": 75344, "epoch": 1793} {"train_loss": -6.132852554321289, "global_step": 75345, "epoch": 1793} {"train_loss": -6.004304885864258, "global_step": 75346, "epoch": 1793} {"train_loss": -6.039744842620123, "global_step": 75347, "epoch": 1793, "val_loss": 62177.05078125} {"train_loss": -6.032676696777344, "global_step": 75348, "epoch": 1794} {"train_loss": -6.076642990112305, "global_step": 75349, "epoch": 1794} {"train_loss": -6.015933036804199, "global_step": 75350, "epoch": 1794} {"train_loss": -6.080880641937256, "global_step": 75351, "epoch": 1794} {"train_loss": -6.099732875823975, "global_step": 75352, "epoch": 1794} {"train_loss": -6.048266410827637, "global_step": 75353, "epoch": 1794} {"train_loss": -6.1472673416137695, "global_step": 75354, "epoch": 1794} {"train_loss": -6.123247146606445, "global_step": 75355, "epoch": 1794} {"train_loss": -6.240679740905762, "global_step": 75356, "epoch": 1794} {"train_loss": -6.026810646057129, "global_step": 75357, "epoch": 1794} {"train_loss": -6.102161884307861, "global_step": 75358, "epoch": 1794} {"train_loss": -5.990621566772461, "global_step": 75359, "epoch": 1794} {"train_loss": -6.172664642333984, "global_step": 75360, "epoch": 1794} {"train_loss": -5.989404678344727, "global_step": 75361, "epoch": 1794} {"train_loss": -6.115945339202881, "global_step": 75362, "epoch": 1794} {"train_loss": -6.128623962402344, "global_step": 75363, "epoch": 1794} {"train_loss": -6.192648410797119, "global_step": 75364, "epoch": 1794} {"train_loss": -6.103791236877441, "global_step": 75365, "epoch": 1794} {"train_loss": -6.130504608154297, "global_step": 75366, "epoch": 1794} {"train_loss": -6.173287391662598, "global_step": 75367, "epoch": 1794} {"train_loss": -6.053549766540527, "global_step": 75368, "epoch": 1794} {"train_loss": -6.061252593994141, "global_step": 75369, "epoch": 1794} {"train_loss": -5.9003167152404785, "global_step": 75370, "epoch": 1794} {"train_loss": -6.203706741333008, "global_step": 75371, "epoch": 1794} {"train_loss": -5.961676597595215, "global_step": 75372, "epoch": 1794} {"train_loss": -6.083045482635498, "global_step": 75373, "epoch": 1794} {"train_loss": -6.021703243255615, "global_step": 75374, "epoch": 1794} {"train_loss": -5.9868388175964355, "global_step": 75375, "epoch": 1794} {"train_loss": -6.154268264770508, "global_step": 75376, "epoch": 1794} {"train_loss": -6.073708534240723, "global_step": 75377, "epoch": 1794} {"train_loss": -6.153006076812744, "global_step": 75378, "epoch": 1794} {"train_loss": -6.152772903442383, "global_step": 75379, "epoch": 1794} {"train_loss": -5.9981303215026855, "global_step": 75380, "epoch": 1794} {"train_loss": -5.98251485824585, "global_step": 75381, "epoch": 1794} {"train_loss": -6.133630275726318, "global_step": 75382, "epoch": 1794} {"train_loss": -5.9443817138671875, "global_step": 75383, "epoch": 1794} {"train_loss": -5.995073318481445, "global_step": 75384, "epoch": 1794} {"train_loss": -6.079290390014648, "global_step": 75385, "epoch": 1794} {"train_loss": -6.120569229125977, "global_step": 75386, "epoch": 1794} {"train_loss": -5.9670867919921875, "global_step": 75387, "epoch": 1794} {"train_loss": -6.156468391418457, "global_step": 75388, "epoch": 1794} {"train_loss": -6.078577529816401, "global_step": 75389, "epoch": 1794, "val_loss": 62299.859375} {"train_loss": -5.919593811035156, "global_step": 75390, "epoch": 1795} {"train_loss": -6.109458923339844, "global_step": 75391, "epoch": 1795} {"train_loss": -6.010252952575684, "global_step": 75392, "epoch": 1795} {"train_loss": -6.012022018432617, "global_step": 75393, "epoch": 1795} {"train_loss": -6.0213942527771, "global_step": 75394, "epoch": 1795} {"train_loss": -6.026462554931641, "global_step": 75395, "epoch": 1795} {"train_loss": -6.111637592315674, "global_step": 75396, "epoch": 1795} {"train_loss": -6.017614364624023, "global_step": 75397, "epoch": 1795} {"train_loss": -6.058575630187988, "global_step": 75398, "epoch": 1795} {"train_loss": -6.254593849182129, "global_step": 75399, "epoch": 1795} {"train_loss": -6.169090270996094, "global_step": 75400, "epoch": 1795} {"train_loss": -6.167667388916016, "global_step": 75401, "epoch": 1795} {"train_loss": -6.120230674743652, "global_step": 75402, "epoch": 1795} {"train_loss": -6.0624847412109375, "global_step": 75403, "epoch": 1795} {"train_loss": -6.06689453125, "global_step": 75404, "epoch": 1795} {"train_loss": -6.060112476348877, "global_step": 75405, "epoch": 1795} {"train_loss": -5.9700117111206055, "global_step": 75406, "epoch": 1795} {"train_loss": -6.072525978088379, "global_step": 75407, "epoch": 1795} {"train_loss": -6.03727912902832, "global_step": 75408, "epoch": 1795} {"train_loss": -5.934370040893555, "global_step": 75409, "epoch": 1795} {"train_loss": -6.039898872375488, "global_step": 75410, "epoch": 1795} {"train_loss": -6.165063858032227, "global_step": 75411, "epoch": 1795} {"train_loss": -6.052297115325928, "global_step": 75412, "epoch": 1795} {"train_loss": -6.008734703063965, "global_step": 75413, "epoch": 1795} {"train_loss": -5.976570129394531, "global_step": 75414, "epoch": 1795} {"train_loss": -5.8182692527771, "global_step": 75415, "epoch": 1795} {"train_loss": -5.82806921005249, "global_step": 75416, "epoch": 1795} {"train_loss": -5.947518348693848, "global_step": 75417, "epoch": 1795} {"train_loss": -5.9877729415893555, "global_step": 75418, "epoch": 1795} {"train_loss": -5.88523530960083, "global_step": 75419, "epoch": 1795} {"train_loss": -5.999334335327148, "global_step": 75420, "epoch": 1795} {"train_loss": -5.962612152099609, "global_step": 75421, "epoch": 1795} {"train_loss": -6.036632061004639, "global_step": 75422, "epoch": 1795} {"train_loss": -6.096574783325195, "global_step": 75423, "epoch": 1795} {"train_loss": -5.990403175354004, "global_step": 75424, "epoch": 1795} {"train_loss": -6.089487075805664, "global_step": 75425, "epoch": 1795} {"train_loss": -6.052037239074707, "global_step": 75426, "epoch": 1795} {"train_loss": -6.009425640106201, "global_step": 75427, "epoch": 1795} {"train_loss": -5.920809745788574, "global_step": 75428, "epoch": 1795} {"train_loss": -6.0720038414001465, "global_step": 75429, "epoch": 1795} {"train_loss": -5.999286651611328, "global_step": 75430, "epoch": 1795} {"train_loss": -6.028256756918771, "global_step": 75431, "epoch": 1795, "val_loss": 62023.78125} {"train_loss": -6.061408519744873, "global_step": 75432, "epoch": 1796} {"train_loss": -5.990133285522461, "global_step": 75433, "epoch": 1796} {"train_loss": -6.105587959289551, "global_step": 75434, "epoch": 1796} {"train_loss": -6.000993728637695, "global_step": 75435, "epoch": 1796} {"train_loss": -6.105402946472168, "global_step": 75436, "epoch": 1796} {"train_loss": -6.17630672454834, "global_step": 75437, "epoch": 1796} {"train_loss": -6.1942596435546875, "global_step": 75438, "epoch": 1796} {"train_loss": -6.099922180175781, "global_step": 75439, "epoch": 1796} {"train_loss": -6.053792953491211, "global_step": 75440, "epoch": 1796} {"train_loss": -6.068366527557373, "global_step": 75441, "epoch": 1796} {"train_loss": -6.034091949462891, "global_step": 75442, "epoch": 1796} {"train_loss": -6.195666313171387, "global_step": 75443, "epoch": 1796} {"train_loss": -6.191201210021973, "global_step": 75444, "epoch": 1796} {"train_loss": -6.134160995483398, "global_step": 75445, "epoch": 1796} {"train_loss": -6.103200435638428, "global_step": 75446, "epoch": 1796} {"train_loss": -6.067718505859375, "global_step": 75447, "epoch": 1796} {"train_loss": -6.130510330200195, "global_step": 75448, "epoch": 1796} {"train_loss": -6.127452850341797, "global_step": 75449, "epoch": 1796} {"train_loss": -6.125699996948242, "global_step": 75450, "epoch": 1796} {"train_loss": -6.102662086486816, "global_step": 75451, "epoch": 1796} {"train_loss": -6.172969818115234, "global_step": 75452, "epoch": 1796} {"train_loss": -6.19776725769043, "global_step": 75453, "epoch": 1796} {"train_loss": -6.081028938293457, "global_step": 75454, "epoch": 1796} {"train_loss": -6.199337005615234, "global_step": 75455, "epoch": 1796} {"train_loss": -5.893659591674805, "global_step": 75456, "epoch": 1796} {"train_loss": -6.020102500915527, "global_step": 75457, "epoch": 1796} {"train_loss": -6.136103630065918, "global_step": 75458, "epoch": 1796} {"train_loss": -6.241670608520508, "global_step": 75459, "epoch": 1796} {"train_loss": -6.056841850280762, "global_step": 75460, "epoch": 1796} {"train_loss": -6.155737400054932, "global_step": 75461, "epoch": 1796} {"train_loss": -6.035490989685059, "global_step": 75462, "epoch": 1796} {"train_loss": -6.080061435699463, "global_step": 75463, "epoch": 1796} {"train_loss": -6.109935760498047, "global_step": 75464, "epoch": 1796} {"train_loss": -6.058563232421875, "global_step": 75465, "epoch": 1796} {"train_loss": -6.125931739807129, "global_step": 75466, "epoch": 1796} {"train_loss": -6.126672744750977, "global_step": 75467, "epoch": 1796} {"train_loss": -6.136013031005859, "global_step": 75468, "epoch": 1796} {"train_loss": -5.969860076904297, "global_step": 75469, "epoch": 1796} {"train_loss": -6.1429667472839355, "global_step": 75470, "epoch": 1796} {"train_loss": -6.086343288421631, "global_step": 75471, "epoch": 1796} {"train_loss": -6.026783466339111, "global_step": 75472, "epoch": 1796} {"train_loss": -6.098749319712321, "global_step": 75473, "epoch": 1796, "val_loss": 62052.1171875} {"train_loss": -5.999196529388428, "global_step": 75474, "epoch": 1797} {"train_loss": -6.050815582275391, "global_step": 75475, "epoch": 1797} {"train_loss": -6.167562961578369, "global_step": 75476, "epoch": 1797} {"train_loss": -6.0931596755981445, "global_step": 75477, "epoch": 1797} {"train_loss": -6.093090057373047, "global_step": 75478, "epoch": 1797} {"train_loss": -6.050293922424316, "global_step": 75479, "epoch": 1797} {"train_loss": -6.041191101074219, "global_step": 75480, "epoch": 1797} {"train_loss": -6.063085556030273, "global_step": 75481, "epoch": 1797} {"train_loss": -6.08845329284668, "global_step": 75482, "epoch": 1797} {"train_loss": -6.118447780609131, "global_step": 75483, "epoch": 1797} {"train_loss": -6.085347652435303, "global_step": 75484, "epoch": 1797} {"train_loss": -6.092486381530762, "global_step": 75485, "epoch": 1797} {"train_loss": -6.108046531677246, "global_step": 75486, "epoch": 1797} {"train_loss": -6.138923645019531, "global_step": 75487, "epoch": 1797} {"train_loss": -6.13880729675293, "global_step": 75488, "epoch": 1797} {"train_loss": -6.172909736633301, "global_step": 75489, "epoch": 1797} {"train_loss": -6.085162162780762, "global_step": 75490, "epoch": 1797} {"train_loss": -6.074868679046631, "global_step": 75491, "epoch": 1797} {"train_loss": -6.142575263977051, "global_step": 75492, "epoch": 1797} {"train_loss": -6.13018798828125, "global_step": 75493, "epoch": 1797} {"train_loss": -6.105777740478516, "global_step": 75494, "epoch": 1797} {"train_loss": -6.078214645385742, "global_step": 75495, "epoch": 1797} {"train_loss": -6.009943008422852, "global_step": 75496, "epoch": 1797} {"train_loss": -6.161101818084717, "global_step": 75497, "epoch": 1797} {"train_loss": -6.046252250671387, "global_step": 75498, "epoch": 1797} {"train_loss": -6.0042219161987305, "global_step": 75499, "epoch": 1797} {"train_loss": -6.140690803527832, "global_step": 75500, "epoch": 1797} {"train_loss": -6.1835737228393555, "global_step": 75501, "epoch": 1797} {"train_loss": -5.983097076416016, "global_step": 75502, "epoch": 1797} {"train_loss": -6.074703216552734, "global_step": 75503, "epoch": 1797} {"train_loss": -6.14784049987793, "global_step": 75504, "epoch": 1797} {"train_loss": -6.117554664611816, "global_step": 75505, "epoch": 1797} {"train_loss": -6.111057281494141, "global_step": 75506, "epoch": 1797} {"train_loss": -6.031803131103516, "global_step": 75507, "epoch": 1797} {"train_loss": -6.07105827331543, "global_step": 75508, "epoch": 1797} {"train_loss": -6.074222564697266, "global_step": 75509, "epoch": 1797} {"train_loss": -6.031501770019531, "global_step": 75510, "epoch": 1797} {"train_loss": -6.063166618347168, "global_step": 75511, "epoch": 1797} {"train_loss": -6.123142242431641, "global_step": 75512, "epoch": 1797} {"train_loss": -6.1122636795043945, "global_step": 75513, "epoch": 1797} {"train_loss": -5.922621250152588, "global_step": 75514, "epoch": 1797} {"train_loss": -6.089019729977562, "global_step": 75515, "epoch": 1797, "val_loss": 62004.99609375} {"train_loss": -6.030620574951172, "global_step": 75516, "epoch": 1798} {"train_loss": -6.18451452255249, "global_step": 75517, "epoch": 1798} {"train_loss": -6.071266174316406, "global_step": 75518, "epoch": 1798} {"train_loss": -6.023918151855469, "global_step": 75519, "epoch": 1798} {"train_loss": -6.075567245483398, "global_step": 75520, "epoch": 1798} {"train_loss": -6.001747131347656, "global_step": 75521, "epoch": 1798} {"train_loss": -6.084812164306641, "global_step": 75522, "epoch": 1798} {"train_loss": -6.1121506690979, "global_step": 75523, "epoch": 1798} {"train_loss": -6.217024803161621, "global_step": 75524, "epoch": 1798} {"train_loss": -6.059840202331543, "global_step": 75525, "epoch": 1798} {"train_loss": -6.183797836303711, "global_step": 75526, "epoch": 1798} {"train_loss": -6.073825836181641, "global_step": 75527, "epoch": 1798} {"train_loss": -6.236144065856934, "global_step": 75528, "epoch": 1798} {"train_loss": -6.0589399337768555, "global_step": 75529, "epoch": 1798} {"train_loss": -6.009420871734619, "global_step": 75530, "epoch": 1798} {"train_loss": -6.027463912963867, "global_step": 75531, "epoch": 1798} {"train_loss": -5.998657703399658, "global_step": 75532, "epoch": 1798} {"train_loss": -6.018734931945801, "global_step": 75533, "epoch": 1798} {"train_loss": -6.084207534790039, "global_step": 75534, "epoch": 1798} {"train_loss": -6.027736186981201, "global_step": 75535, "epoch": 1798} {"train_loss": -6.005051612854004, "global_step": 75536, "epoch": 1798} {"train_loss": -5.969949722290039, "global_step": 75537, "epoch": 1798} {"train_loss": -5.9774274826049805, "global_step": 75538, "epoch": 1798} {"train_loss": -6.184398651123047, "global_step": 75539, "epoch": 1798} {"train_loss": -5.938066482543945, "global_step": 75540, "epoch": 1798} {"train_loss": -6.096123695373535, "global_step": 75541, "epoch": 1798} {"train_loss": -6.0694146156311035, "global_step": 75542, "epoch": 1798} {"train_loss": -5.962862968444824, "global_step": 75543, "epoch": 1798} {"train_loss": -6.178732872009277, "global_step": 75544, "epoch": 1798} {"train_loss": -6.262624263763428, "global_step": 75545, "epoch": 1798} {"train_loss": -6.089278221130371, "global_step": 75546, "epoch": 1798} {"train_loss": -6.141819953918457, "global_step": 75547, "epoch": 1798} {"train_loss": -6.03135871887207, "global_step": 75548, "epoch": 1798} {"train_loss": -6.031350135803223, "global_step": 75549, "epoch": 1798} {"train_loss": -6.124904632568359, "global_step": 75550, "epoch": 1798} {"train_loss": -6.141048431396484, "global_step": 75551, "epoch": 1798} {"train_loss": -6.265899658203125, "global_step": 75552, "epoch": 1798} {"train_loss": -6.143838882446289, "global_step": 75553, "epoch": 1798} {"train_loss": -6.173226356506348, "global_step": 75554, "epoch": 1798} {"train_loss": -6.1678876876831055, "global_step": 75555, "epoch": 1798} {"train_loss": -6.037625312805176, "global_step": 75556, "epoch": 1798} {"train_loss": -6.08952031816755, "global_step": 75557, "epoch": 1798, "val_loss": 61848.28125} {"train_loss": -6.031508445739746, "global_step": 75558, "epoch": 1799} {"train_loss": -6.139065742492676, "global_step": 75559, "epoch": 1799} {"train_loss": -6.103946208953857, "global_step": 75560, "epoch": 1799} {"train_loss": -6.164785385131836, "global_step": 75561, "epoch": 1799} {"train_loss": -6.083154678344727, "global_step": 75562, "epoch": 1799} {"train_loss": -6.112719535827637, "global_step": 75563, "epoch": 1799} {"train_loss": -6.130669116973877, "global_step": 75564, "epoch": 1799} {"train_loss": -6.072356700897217, "global_step": 75565, "epoch": 1799} {"train_loss": -6.057896137237549, "global_step": 75566, "epoch": 1799} {"train_loss": -6.229544162750244, "global_step": 75567, "epoch": 1799} {"train_loss": -6.106153964996338, "global_step": 75568, "epoch": 1799} {"train_loss": -6.112720966339111, "global_step": 75569, "epoch": 1799} {"train_loss": -6.102241516113281, "global_step": 75570, "epoch": 1799} {"train_loss": -6.119485855102539, "global_step": 75571, "epoch": 1799} {"train_loss": -6.122893333435059, "global_step": 75572, "epoch": 1799} {"train_loss": -6.1219162940979, "global_step": 75573, "epoch": 1799} {"train_loss": -6.085242748260498, "global_step": 75574, "epoch": 1799} {"train_loss": -6.041785717010498, "global_step": 75575, "epoch": 1799} {"train_loss": -6.151060104370117, "global_step": 75576, "epoch": 1799} {"train_loss": -6.0583624839782715, "global_step": 75577, "epoch": 1799} {"train_loss": -6.062199592590332, "global_step": 75578, "epoch": 1799} {"train_loss": -6.11456823348999, "global_step": 75579, "epoch": 1799} {"train_loss": -5.969993591308594, "global_step": 75580, "epoch": 1799} {"train_loss": -6.081106185913086, "global_step": 75581, "epoch": 1799} {"train_loss": -6.182363986968994, "global_step": 75582, "epoch": 1799} {"train_loss": -6.146543502807617, "global_step": 75583, "epoch": 1799} {"train_loss": -6.1343183517456055, "global_step": 75584, "epoch": 1799} {"train_loss": -6.186921119689941, "global_step": 75585, "epoch": 1799} {"train_loss": -6.1312255859375, "global_step": 75586, "epoch": 1799} {"train_loss": -6.1669769287109375, "global_step": 75587, "epoch": 1799} {"train_loss": -6.172128677368164, "global_step": 75588, "epoch": 1799} {"train_loss": -6.011907577514648, "global_step": 75589, "epoch": 1799} {"train_loss": -6.074043273925781, "global_step": 75590, "epoch": 1799} {"train_loss": -5.935938358306885, "global_step": 75591, "epoch": 1799} {"train_loss": -6.085846424102783, "global_step": 75592, "epoch": 1799} {"train_loss": -6.1295166015625, "global_step": 75593, "epoch": 1799} {"train_loss": -6.057461738586426, "global_step": 75594, "epoch": 1799} {"train_loss": -6.196928977966309, "global_step": 75595, "epoch": 1799} {"train_loss": -6.116181373596191, "global_step": 75596, "epoch": 1799} {"train_loss": -6.007844924926758, "global_step": 75597, "epoch": 1799} {"train_loss": -6.145866394042969, "global_step": 75598, "epoch": 1799} {"train_loss": -6.104770467394874, "global_step": 75599, "epoch": 1799, "val_loss": 62031.1796875} {"train_loss": -6.122756004333496, "global_step": 75600, "epoch": 1800} {"train_loss": -6.130309104919434, "global_step": 75601, "epoch": 1800} {"train_loss": -6.177286148071289, "global_step": 75602, "epoch": 1800} {"train_loss": -6.181149005889893, "global_step": 75603, "epoch": 1800} {"train_loss": -6.174195766448975, "global_step": 75604, "epoch": 1800} {"train_loss": -6.099606513977051, "global_step": 75605, "epoch": 1800} {"train_loss": -6.171058654785156, "global_step": 75606, "epoch": 1800} {"train_loss": -6.096723556518555, "global_step": 75607, "epoch": 1800} {"train_loss": -6.1283698081970215, "global_step": 75608, "epoch": 1800} {"train_loss": -6.160761833190918, "global_step": 75609, "epoch": 1800} {"train_loss": -6.060756683349609, "global_step": 75610, "epoch": 1800} {"train_loss": -6.047321319580078, "global_step": 75611, "epoch": 1800} {"train_loss": -6.108080863952637, "global_step": 75612, "epoch": 1800} {"train_loss": -6.056971073150635, "global_step": 75613, "epoch": 1800} {"train_loss": -6.101752281188965, "global_step": 75614, "epoch": 1800} {"train_loss": -6.147982597351074, "global_step": 75615, "epoch": 1800} {"train_loss": -6.108145713806152, "global_step": 75616, "epoch": 1800} {"train_loss": -6.149504661560059, "global_step": 75617, "epoch": 1800} {"train_loss": -6.175907135009766, "global_step": 75618, "epoch": 1800} {"train_loss": -6.142220973968506, "global_step": 75619, "epoch": 1800} {"train_loss": -6.092825889587402, "global_step": 75620, "epoch": 1800} {"train_loss": -6.066973686218262, "global_step": 75621, "epoch": 1800} {"train_loss": -5.975922107696533, "global_step": 75622, "epoch": 1800} {"train_loss": -6.067028045654297, "global_step": 75623, "epoch": 1800} {"train_loss": -6.150859355926514, "global_step": 75624, "epoch": 1800} {"train_loss": -6.10090970993042, "global_step": 75625, "epoch": 1800} {"train_loss": -6.0431060791015625, "global_step": 75626, "epoch": 1800} {"train_loss": -6.180606842041016, "global_step": 75627, "epoch": 1800} {"train_loss": -6.020783424377441, "global_step": 75628, "epoch": 1800} {"train_loss": -6.198500633239746, "global_step": 75629, "epoch": 1800} {"train_loss": -6.167438507080078, "global_step": 75630, "epoch": 1800} {"train_loss": -5.978544235229492, "global_step": 75631, "epoch": 1800} {"train_loss": -6.040798187255859, "global_step": 75632, "epoch": 1800} {"train_loss": -6.086220741271973, "global_step": 75633, "epoch": 1800} {"train_loss": -6.0874176025390625, "global_step": 75634, "epoch": 1800} {"train_loss": -6.021430015563965, "global_step": 75635, "epoch": 1800} {"train_loss": -6.163905143737793, "global_step": 75636, "epoch": 1800} {"train_loss": -6.005768775939941, "global_step": 75637, "epoch": 1800} {"train_loss": -6.143453598022461, "global_step": 75638, "epoch": 1800} {"train_loss": -6.100876808166504, "global_step": 75639, "epoch": 1800} {"train_loss": -6.132715225219727, "global_step": 75640, "epoch": 1800} {"train_loss": -6.10472001348223, "global_step": 75641, "epoch": 1800, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.3043592915114877, "train/sim_max_reward_2": 0.7868777574924962, "train/sim_max_reward_3": 0.47537558705286825, "train/sim_max_reward_4": 0.9823376249262697, "train/sim_max_reward_5": 0.8241606116615502, "test/sim_max_reward_4300000": 0.8479571867999433, "test/sim_max_reward_4300001": 0.5845307240544758, "test/sim_max_reward_4300002": 0.9010122278986717, "test/sim_max_reward_4300003": 0.9472395919500712, "test/sim_max_reward_4300004": 0.36741015002646144, "test/sim_max_reward_4300005": 0.8652786859365623, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.8828264225030464, "test/sim_max_reward_4300008": 0.8013407309086068, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.8060305517996397, "test/sim_max_reward_4300011": 0.9533958235733901, "test/sim_max_reward_4300012": 0.8895092186086274, "test/sim_max_reward_4300013": 0.5228417492752052, "test/sim_max_reward_4300014": 0.875941001467983, "test/sim_max_reward_4300015": 0.9219307845982103, "test/sim_max_reward_4300016": 0.9893054158252312, "test/sim_max_reward_4300017": 0.9601457472430684, "test/sim_max_reward_4300018": 0.4010038972560649, "test/sim_max_reward_4300019": 0.18679412749776123, "test/sim_max_reward_4300020": 0.747369193594018, "test/sim_max_reward_4300021": 0.6392760529799834, "test/sim_max_reward_4300022": 0.4919072766281776, "test/sim_max_reward_4300023": 0.3573914436449905, "test/sim_max_reward_4300024": 0.4523653034943918, "test/sim_max_reward_4300025": 0.9132916421144428, "test/sim_max_reward_4300026": 0.16807002316778702, "test/sim_max_reward_4300027": 0.7969888961732566, "test/sim_max_reward_4300028": 0.8817402018400333, "test/sim_max_reward_4300029": 0.0001140197169269425, "test/sim_max_reward_4300030": 0.5364140939383588, "test/sim_max_reward_4300031": 0.8169204960943186, "test/sim_max_reward_4300032": 0.9657660231530992, "test/sim_max_reward_4300033": 0.6247438156706396, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9822025913186185, "test/sim_max_reward_4300038": 0.43541065943364454, "test/sim_max_reward_4300039": 0.9421212582128208, "test/sim_max_reward_4300040": 0.41770983358264097, "test/sim_max_reward_4300041": 0.9352302965515947, "test/sim_max_reward_4300042": 0.8289883540933, "test/sim_max_reward_4300043": 0.48691347266104773, "test/sim_max_reward_4300044": 0.7664879010989698, "test/sim_max_reward_4300045": 0.9117357531706735, "test/sim_max_reward_4300046": 0.8728762570039592, "test/sim_max_reward_4300047": 0.8914022928796216, "test/sim_max_reward_4300048": 0.3789972325315925, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.5939013948751207, "test/mean_score": 0.6429224507507082, "val_loss": 62066.06640625} {"train_loss": -6.135989189147949, "global_step": 75642, "epoch": 1801} {"train_loss": -6.163552284240723, "global_step": 75643, "epoch": 1801} {"train_loss": -6.172543525695801, "global_step": 75644, "epoch": 1801} {"train_loss": -6.247279167175293, "global_step": 75645, "epoch": 1801} {"train_loss": -6.156659126281738, "global_step": 75646, "epoch": 1801} {"train_loss": -6.096648216247559, "global_step": 75647, "epoch": 1801} {"train_loss": -6.163020610809326, "global_step": 75648, "epoch": 1801} {"train_loss": -6.159996032714844, "global_step": 75649, "epoch": 1801} {"train_loss": -6.034966468811035, "global_step": 75650, "epoch": 1801} {"train_loss": -6.082220554351807, "global_step": 75651, "epoch": 1801} {"train_loss": -6.076822280883789, "global_step": 75652, "epoch": 1801} {"train_loss": -6.027098655700684, "global_step": 75653, "epoch": 1801} {"train_loss": -6.126230239868164, "global_step": 75654, "epoch": 1801} {"train_loss": -5.996391773223877, "global_step": 75655, "epoch": 1801} {"train_loss": -6.208407878875732, "global_step": 75656, "epoch": 1801} {"train_loss": -6.191678047180176, "global_step": 75657, "epoch": 1801} {"train_loss": -6.127532005310059, "global_step": 75658, "epoch": 1801} {"train_loss": -6.080975532531738, "global_step": 75659, "epoch": 1801} {"train_loss": -6.041485786437988, "global_step": 75660, "epoch": 1801} {"train_loss": -6.160611152648926, "global_step": 75661, "epoch": 1801} {"train_loss": -6.139291763305664, "global_step": 75662, "epoch": 1801} {"train_loss": -6.142485618591309, "global_step": 75663, "epoch": 1801} {"train_loss": -6.181758880615234, "global_step": 75664, "epoch": 1801} {"train_loss": -6.095022201538086, "global_step": 75665, "epoch": 1801} {"train_loss": -6.140466213226318, "global_step": 75666, "epoch": 1801} {"train_loss": -6.145523548126221, "global_step": 75667, "epoch": 1801} {"train_loss": -6.114112854003906, "global_step": 75668, "epoch": 1801} {"train_loss": -6.123138427734375, "global_step": 75669, "epoch": 1801} {"train_loss": -6.175373077392578, "global_step": 75670, "epoch": 1801} {"train_loss": -6.096227169036865, "global_step": 75671, "epoch": 1801} {"train_loss": -6.151875019073486, "global_step": 75672, "epoch": 1801} {"train_loss": -6.071141719818115, "global_step": 75673, "epoch": 1801} {"train_loss": -6.145268440246582, "global_step": 75674, "epoch": 1801} {"train_loss": -6.089479923248291, "global_step": 75675, "epoch": 1801} {"train_loss": -6.022543907165527, "global_step": 75676, "epoch": 1801} {"train_loss": -6.015977382659912, "global_step": 75677, "epoch": 1801} {"train_loss": -6.074774742126465, "global_step": 75678, "epoch": 1801} {"train_loss": -6.114367485046387, "global_step": 75679, "epoch": 1801} {"train_loss": -6.1183271408081055, "global_step": 75680, "epoch": 1801} {"train_loss": -6.076252460479736, "global_step": 75681, "epoch": 1801} {"train_loss": -6.043907165527344, "global_step": 75682, "epoch": 1801} {"train_loss": -6.115994805381412, "global_step": 75683, "epoch": 1801, "val_loss": 61969.13671875} {"train_loss": -6.110437393188477, "global_step": 75684, "epoch": 1802} {"train_loss": -6.160944938659668, "global_step": 75685, "epoch": 1802} {"train_loss": -6.060704231262207, "global_step": 75686, "epoch": 1802} {"train_loss": -6.164200782775879, "global_step": 75687, "epoch": 1802} {"train_loss": -6.092766284942627, "global_step": 75688, "epoch": 1802} {"train_loss": -6.030575752258301, "global_step": 75689, "epoch": 1802} {"train_loss": -5.961173057556152, "global_step": 75690, "epoch": 1802} {"train_loss": -6.136387825012207, "global_step": 75691, "epoch": 1802} {"train_loss": -6.088374137878418, "global_step": 75692, "epoch": 1802} {"train_loss": -6.100416660308838, "global_step": 75693, "epoch": 1802} {"train_loss": -6.114095687866211, "global_step": 75694, "epoch": 1802} {"train_loss": -6.118380069732666, "global_step": 75695, "epoch": 1802} {"train_loss": -6.037229537963867, "global_step": 75696, "epoch": 1802} {"train_loss": -5.951354026794434, "global_step": 75697, "epoch": 1802} {"train_loss": -6.103270053863525, "global_step": 75698, "epoch": 1802} {"train_loss": -6.069927215576172, "global_step": 75699, "epoch": 1802} {"train_loss": -6.081414699554443, "global_step": 75700, "epoch": 1802} {"train_loss": -5.999977111816406, "global_step": 75701, "epoch": 1802} {"train_loss": -6.118142127990723, "global_step": 75702, "epoch": 1802} {"train_loss": -6.235158443450928, "global_step": 75703, "epoch": 1802} {"train_loss": -5.998417854309082, "global_step": 75704, "epoch": 1802} {"train_loss": -6.076025009155273, "global_step": 75705, "epoch": 1802} {"train_loss": -6.19809627532959, "global_step": 75706, "epoch": 1802} {"train_loss": -6.207493305206299, "global_step": 75707, "epoch": 1802} {"train_loss": -6.093132972717285, "global_step": 75708, "epoch": 1802} {"train_loss": -6.170623779296875, "global_step": 75709, "epoch": 1802} {"train_loss": -6.03562068939209, "global_step": 75710, "epoch": 1802} {"train_loss": -6.133865833282471, "global_step": 75711, "epoch": 1802} {"train_loss": -6.083329200744629, "global_step": 75712, "epoch": 1802} {"train_loss": -6.036118984222412, "global_step": 75713, "epoch": 1802} {"train_loss": -6.186522483825684, "global_step": 75714, "epoch": 1802} {"train_loss": -6.023249626159668, "global_step": 75715, "epoch": 1802} {"train_loss": -6.150687217712402, "global_step": 75716, "epoch": 1802} {"train_loss": -6.165311336517334, "global_step": 75717, "epoch": 1802} {"train_loss": -6.084563732147217, "global_step": 75718, "epoch": 1802} {"train_loss": -6.155926704406738, "global_step": 75719, "epoch": 1802} {"train_loss": -6.170998573303223, "global_step": 75720, "epoch": 1802} {"train_loss": -6.179523944854736, "global_step": 75721, "epoch": 1802} {"train_loss": -6.153695106506348, "global_step": 75722, "epoch": 1802} {"train_loss": -6.210912704467773, "global_step": 75723, "epoch": 1802} {"train_loss": -6.048604488372803, "global_step": 75724, "epoch": 1802} {"train_loss": -6.104186580294654, "global_step": 75725, "epoch": 1802, "val_loss": 61882.9140625} {"train_loss": -6.185049057006836, "global_step": 75726, "epoch": 1803} {"train_loss": -6.070998668670654, "global_step": 75727, "epoch": 1803} {"train_loss": -6.089527130126953, "global_step": 75728, "epoch": 1803} {"train_loss": -6.032280445098877, "global_step": 75729, "epoch": 1803} {"train_loss": -6.096322059631348, "global_step": 75730, "epoch": 1803} {"train_loss": -6.148376941680908, "global_step": 75731, "epoch": 1803} {"train_loss": -6.093310356140137, "global_step": 75732, "epoch": 1803} {"train_loss": -6.148200988769531, "global_step": 75733, "epoch": 1803} {"train_loss": -6.147429466247559, "global_step": 75734, "epoch": 1803} {"train_loss": -6.051192283630371, "global_step": 75735, "epoch": 1803} {"train_loss": -6.158486843109131, "global_step": 75736, "epoch": 1803} {"train_loss": -6.121466159820557, "global_step": 75737, "epoch": 1803} {"train_loss": -6.2322282791137695, "global_step": 75738, "epoch": 1803} {"train_loss": -6.018232345581055, "global_step": 75739, "epoch": 1803} {"train_loss": -6.016142845153809, "global_step": 75740, "epoch": 1803} {"train_loss": -6.129281044006348, "global_step": 75741, "epoch": 1803} {"train_loss": -6.018963813781738, "global_step": 75742, "epoch": 1803} {"train_loss": -6.026591777801514, "global_step": 75743, "epoch": 1803} {"train_loss": -6.005967140197754, "global_step": 75744, "epoch": 1803} {"train_loss": -6.092021942138672, "global_step": 75745, "epoch": 1803} {"train_loss": -6.002691268920898, "global_step": 75746, "epoch": 1803} {"train_loss": -5.995927810668945, "global_step": 75747, "epoch": 1803} {"train_loss": -6.0025129318237305, "global_step": 75748, "epoch": 1803} {"train_loss": -6.044519424438477, "global_step": 75749, "epoch": 1803} {"train_loss": -6.131373882293701, "global_step": 75750, "epoch": 1803} {"train_loss": -6.073406219482422, "global_step": 75751, "epoch": 1803} {"train_loss": -6.019806861877441, "global_step": 75752, "epoch": 1803} {"train_loss": -6.019837379455566, "global_step": 75753, "epoch": 1803} {"train_loss": -6.145453453063965, "global_step": 75754, "epoch": 1803} {"train_loss": -6.061003684997559, "global_step": 75755, "epoch": 1803} {"train_loss": -5.988572597503662, "global_step": 75756, "epoch": 1803} {"train_loss": -6.079308986663818, "global_step": 75757, "epoch": 1803} {"train_loss": -5.8534135818481445, "global_step": 75758, "epoch": 1803} {"train_loss": -6.097972869873047, "global_step": 75759, "epoch": 1803} {"train_loss": -5.848434925079346, "global_step": 75760, "epoch": 1803} {"train_loss": -5.978229522705078, "global_step": 75761, "epoch": 1803} {"train_loss": -5.9932098388671875, "global_step": 75762, "epoch": 1803} {"train_loss": -5.977170944213867, "global_step": 75763, "epoch": 1803} {"train_loss": -5.989017486572266, "global_step": 75764, "epoch": 1803} {"train_loss": -5.980116844177246, "global_step": 75765, "epoch": 1803} {"train_loss": -5.996260643005371, "global_step": 75766, "epoch": 1803} {"train_loss": -6.0486779099419, "global_step": 75767, "epoch": 1803, "val_loss": 61902.62109375} {"train_loss": -6.136084079742432, "global_step": 75768, "epoch": 1804} {"train_loss": -6.060426712036133, "global_step": 75769, "epoch": 1804} {"train_loss": -5.998763084411621, "global_step": 75770, "epoch": 1804} {"train_loss": -6.064337730407715, "global_step": 75771, "epoch": 1804} {"train_loss": -6.004524230957031, "global_step": 75772, "epoch": 1804} {"train_loss": -6.12273645401001, "global_step": 75773, "epoch": 1804} {"train_loss": -5.936988830566406, "global_step": 75774, "epoch": 1804} {"train_loss": -6.022702217102051, "global_step": 75775, "epoch": 1804} {"train_loss": -5.996828079223633, "global_step": 75776, "epoch": 1804} {"train_loss": -6.023077011108398, "global_step": 75777, "epoch": 1804} {"train_loss": -6.0845160484313965, "global_step": 75778, "epoch": 1804} {"train_loss": -5.967318534851074, "global_step": 75779, "epoch": 1804} {"train_loss": -6.096696853637695, "global_step": 75780, "epoch": 1804} {"train_loss": -6.071646213531494, "global_step": 75781, "epoch": 1804} {"train_loss": -6.126195907592773, "global_step": 75782, "epoch": 1804} {"train_loss": -6.113182544708252, "global_step": 75783, "epoch": 1804} {"train_loss": -6.059094429016113, "global_step": 75784, "epoch": 1804} {"train_loss": -6.20982551574707, "global_step": 75785, "epoch": 1804} {"train_loss": -6.140363693237305, "global_step": 75786, "epoch": 1804} {"train_loss": -6.060626029968262, "global_step": 75787, "epoch": 1804} {"train_loss": -6.054532051086426, "global_step": 75788, "epoch": 1804} {"train_loss": -6.031145095825195, "global_step": 75789, "epoch": 1804} {"train_loss": -6.12908935546875, "global_step": 75790, "epoch": 1804} {"train_loss": -6.14854097366333, "global_step": 75791, "epoch": 1804} {"train_loss": -6.108188152313232, "global_step": 75792, "epoch": 1804} {"train_loss": -6.193830490112305, "global_step": 75793, "epoch": 1804} {"train_loss": -6.196806907653809, "global_step": 75794, "epoch": 1804} {"train_loss": -6.103708267211914, "global_step": 75795, "epoch": 1804} {"train_loss": -6.098576545715332, "global_step": 75796, "epoch": 1804} {"train_loss": -6.188716888427734, "global_step": 75797, "epoch": 1804} {"train_loss": -6.1012749671936035, "global_step": 75798, "epoch": 1804} {"train_loss": -6.069372653961182, "global_step": 75799, "epoch": 1804} {"train_loss": -6.18044900894165, "global_step": 75800, "epoch": 1804} {"train_loss": -6.097555160522461, "global_step": 75801, "epoch": 1804} {"train_loss": -6.091325283050537, "global_step": 75802, "epoch": 1804} {"train_loss": -6.0909223556518555, "global_step": 75803, "epoch": 1804} {"train_loss": -6.030967712402344, "global_step": 75804, "epoch": 1804} {"train_loss": -6.019163131713867, "global_step": 75805, "epoch": 1804} {"train_loss": -6.156846523284912, "global_step": 75806, "epoch": 1804} {"train_loss": -6.167928695678711, "global_step": 75807, "epoch": 1804} {"train_loss": -6.076700687408447, "global_step": 75808, "epoch": 1804} {"train_loss": -6.086489983967373, "global_step": 75809, "epoch": 1804, "val_loss": 61999.234375} {"train_loss": -6.050140857696533, "global_step": 75810, "epoch": 1805} {"train_loss": -6.15568208694458, "global_step": 75811, "epoch": 1805} {"train_loss": -6.188158988952637, "global_step": 75812, "epoch": 1805} {"train_loss": -6.151501655578613, "global_step": 75813, "epoch": 1805} {"train_loss": -6.130517959594727, "global_step": 75814, "epoch": 1805} {"train_loss": -6.011693000793457, "global_step": 75815, "epoch": 1805} {"train_loss": -6.082289695739746, "global_step": 75816, "epoch": 1805} {"train_loss": -6.046360015869141, "global_step": 75817, "epoch": 1805} {"train_loss": -6.194797992706299, "global_step": 75818, "epoch": 1805} {"train_loss": -6.193078994750977, "global_step": 75819, "epoch": 1805} {"train_loss": -5.982108116149902, "global_step": 75820, "epoch": 1805} {"train_loss": -6.0667805671691895, "global_step": 75821, "epoch": 1805} {"train_loss": -6.0599141120910645, "global_step": 75822, "epoch": 1805} {"train_loss": -6.131027698516846, "global_step": 75823, "epoch": 1805} {"train_loss": -6.075865745544434, "global_step": 75824, "epoch": 1805} {"train_loss": -6.044772148132324, "global_step": 75825, "epoch": 1805} {"train_loss": -6.117992401123047, "global_step": 75826, "epoch": 1805} {"train_loss": -6.081415176391602, "global_step": 75827, "epoch": 1805} {"train_loss": -6.168221473693848, "global_step": 75828, "epoch": 1805} {"train_loss": -6.058047294616699, "global_step": 75829, "epoch": 1805} {"train_loss": -5.984788417816162, "global_step": 75830, "epoch": 1805} {"train_loss": -6.115986347198486, "global_step": 75831, "epoch": 1805} {"train_loss": -6.010632514953613, "global_step": 75832, "epoch": 1805} {"train_loss": -6.189382553100586, "global_step": 75833, "epoch": 1805} {"train_loss": -6.171405792236328, "global_step": 75834, "epoch": 1805} {"train_loss": -6.179943561553955, "global_step": 75835, "epoch": 1805} {"train_loss": -6.10577917098999, "global_step": 75836, "epoch": 1805} {"train_loss": -6.103226184844971, "global_step": 75837, "epoch": 1805} {"train_loss": -6.035287857055664, "global_step": 75838, "epoch": 1805} {"train_loss": -6.145444869995117, "global_step": 75839, "epoch": 1805} {"train_loss": -6.137993812561035, "global_step": 75840, "epoch": 1805} {"train_loss": -6.087790489196777, "global_step": 75841, "epoch": 1805} {"train_loss": -6.099251747131348, "global_step": 75842, "epoch": 1805} {"train_loss": -6.150385856628418, "global_step": 75843, "epoch": 1805} {"train_loss": -6.166120529174805, "global_step": 75844, "epoch": 1805} {"train_loss": -6.188204765319824, "global_step": 75845, "epoch": 1805} {"train_loss": -6.117955684661865, "global_step": 75846, "epoch": 1805} {"train_loss": -6.107692718505859, "global_step": 75847, "epoch": 1805} {"train_loss": -6.120655536651611, "global_step": 75848, "epoch": 1805} {"train_loss": -5.998147964477539, "global_step": 75849, "epoch": 1805} {"train_loss": -6.0338215827941895, "global_step": 75850, "epoch": 1805} {"train_loss": -6.10101960954212, "global_step": 75851, "epoch": 1805, "val_loss": 62186.79296875} {"train_loss": -6.132253646850586, "global_step": 75852, "epoch": 1806} {"train_loss": -5.951968669891357, "global_step": 75853, "epoch": 1806} {"train_loss": -5.989073753356934, "global_step": 75854, "epoch": 1806} {"train_loss": -5.926349639892578, "global_step": 75855, "epoch": 1806} {"train_loss": -6.016727447509766, "global_step": 75856, "epoch": 1806} {"train_loss": -6.043085098266602, "global_step": 75857, "epoch": 1806} {"train_loss": -6.06790018081665, "global_step": 75858, "epoch": 1806} {"train_loss": -6.084041595458984, "global_step": 75859, "epoch": 1806} {"train_loss": -6.091737747192383, "global_step": 75860, "epoch": 1806} {"train_loss": -5.99794864654541, "global_step": 75861, "epoch": 1806} {"train_loss": -6.0985612869262695, "global_step": 75862, "epoch": 1806} {"train_loss": -6.050050735473633, "global_step": 75863, "epoch": 1806} {"train_loss": -5.963268280029297, "global_step": 75864, "epoch": 1806} {"train_loss": -6.047263145446777, "global_step": 75865, "epoch": 1806} {"train_loss": -5.96579647064209, "global_step": 75866, "epoch": 1806} {"train_loss": -6.177066326141357, "global_step": 75867, "epoch": 1806} {"train_loss": -5.932979583740234, "global_step": 75868, "epoch": 1806} {"train_loss": -6.134754180908203, "global_step": 75869, "epoch": 1806} {"train_loss": -6.035897254943848, "global_step": 75870, "epoch": 1806} {"train_loss": -6.017402648925781, "global_step": 75871, "epoch": 1806} {"train_loss": -6.003710746765137, "global_step": 75872, "epoch": 1806} {"train_loss": -6.05571174621582, "global_step": 75873, "epoch": 1806} {"train_loss": -6.02005672454834, "global_step": 75874, "epoch": 1806} {"train_loss": -6.040491104125977, "global_step": 75875, "epoch": 1806} {"train_loss": -6.016040802001953, "global_step": 75876, "epoch": 1806} {"train_loss": -6.0879597663879395, "global_step": 75877, "epoch": 1806} {"train_loss": -6.129587173461914, "global_step": 75878, "epoch": 1806} {"train_loss": -6.213167667388916, "global_step": 75879, "epoch": 1806} {"train_loss": -6.013441562652588, "global_step": 75880, "epoch": 1806} {"train_loss": -6.069314479827881, "global_step": 75881, "epoch": 1806} {"train_loss": -6.193976402282715, "global_step": 75882, "epoch": 1806} {"train_loss": -6.12568473815918, "global_step": 75883, "epoch": 1806} {"train_loss": -6.126456260681152, "global_step": 75884, "epoch": 1806} {"train_loss": -6.193006992340088, "global_step": 75885, "epoch": 1806} {"train_loss": -6.092048645019531, "global_step": 75886, "epoch": 1806} {"train_loss": -6.066280364990234, "global_step": 75887, "epoch": 1806} {"train_loss": -5.979480743408203, "global_step": 75888, "epoch": 1806} {"train_loss": -6.10981559753418, "global_step": 75889, "epoch": 1806} {"train_loss": -6.148530960083008, "global_step": 75890, "epoch": 1806} {"train_loss": -5.98781681060791, "global_step": 75891, "epoch": 1806} {"train_loss": -6.087489128112793, "global_step": 75892, "epoch": 1806} {"train_loss": -6.061992713383266, "global_step": 75893, "epoch": 1806, "val_loss": 62168.40625} {"train_loss": -6.0293731689453125, "global_step": 75894, "epoch": 1807} {"train_loss": -5.996209144592285, "global_step": 75895, "epoch": 1807} {"train_loss": -6.068336486816406, "global_step": 75896, "epoch": 1807} {"train_loss": -6.0121002197265625, "global_step": 75897, "epoch": 1807} {"train_loss": -6.023970603942871, "global_step": 75898, "epoch": 1807} {"train_loss": -5.936075210571289, "global_step": 75899, "epoch": 1807} {"train_loss": -6.086939334869385, "global_step": 75900, "epoch": 1807} {"train_loss": -5.944409370422363, "global_step": 75901, "epoch": 1807} {"train_loss": -5.939068794250488, "global_step": 75902, "epoch": 1807} {"train_loss": -6.024392127990723, "global_step": 75903, "epoch": 1807} {"train_loss": -6.010361671447754, "global_step": 75904, "epoch": 1807} {"train_loss": -6.101061820983887, "global_step": 75905, "epoch": 1807} {"train_loss": -5.941122055053711, "global_step": 75906, "epoch": 1807} {"train_loss": -6.087963104248047, "global_step": 75907, "epoch": 1807} {"train_loss": -6.0996880531311035, "global_step": 75908, "epoch": 1807} {"train_loss": -6.027647018432617, "global_step": 75909, "epoch": 1807} {"train_loss": -6.088965892791748, "global_step": 75910, "epoch": 1807} {"train_loss": -6.044197082519531, "global_step": 75911, "epoch": 1807} {"train_loss": -6.057573318481445, "global_step": 75912, "epoch": 1807} {"train_loss": -6.066196918487549, "global_step": 75913, "epoch": 1807} {"train_loss": -6.093198776245117, "global_step": 75914, "epoch": 1807} {"train_loss": -6.044961452484131, "global_step": 75915, "epoch": 1807} {"train_loss": -6.041585922241211, "global_step": 75916, "epoch": 1807} {"train_loss": -5.918524265289307, "global_step": 75917, "epoch": 1807} {"train_loss": -5.935821056365967, "global_step": 75918, "epoch": 1807} {"train_loss": -6.108734130859375, "global_step": 75919, "epoch": 1807} {"train_loss": -6.04979944229126, "global_step": 75920, "epoch": 1807} {"train_loss": -5.965810298919678, "global_step": 75921, "epoch": 1807} {"train_loss": -6.047255039215088, "global_step": 75922, "epoch": 1807} {"train_loss": -6.089450836181641, "global_step": 75923, "epoch": 1807} {"train_loss": -6.172919750213623, "global_step": 75924, "epoch": 1807} {"train_loss": -6.158200740814209, "global_step": 75925, "epoch": 1807} {"train_loss": -6.179091453552246, "global_step": 75926, "epoch": 1807} {"train_loss": -6.174347877502441, "global_step": 75927, "epoch": 1807} {"train_loss": -6.154363632202148, "global_step": 75928, "epoch": 1807} {"train_loss": -6.0855536460876465, "global_step": 75929, "epoch": 1807} {"train_loss": -6.164536476135254, "global_step": 75930, "epoch": 1807} {"train_loss": -5.99620246887207, "global_step": 75931, "epoch": 1807} {"train_loss": -6.007469177246094, "global_step": 75932, "epoch": 1807} {"train_loss": -6.192656993865967, "global_step": 75933, "epoch": 1807} {"train_loss": -6.0810465812683105, "global_step": 75934, "epoch": 1807} {"train_loss": -6.055742195674351, "global_step": 75935, "epoch": 1807, "val_loss": 61878.9375} {"train_loss": -6.089398384094238, "global_step": 75936, "epoch": 1808} {"train_loss": -6.097005844116211, "global_step": 75937, "epoch": 1808} {"train_loss": -6.110134124755859, "global_step": 75938, "epoch": 1808} {"train_loss": -6.194812297821045, "global_step": 75939, "epoch": 1808} {"train_loss": -5.951394081115723, "global_step": 75940, "epoch": 1808} {"train_loss": -6.110537528991699, "global_step": 75941, "epoch": 1808} {"train_loss": -6.109094142913818, "global_step": 75942, "epoch": 1808} {"train_loss": -6.045773506164551, "global_step": 75943, "epoch": 1808} {"train_loss": -6.086878299713135, "global_step": 75944, "epoch": 1808} {"train_loss": -6.074472427368164, "global_step": 75945, "epoch": 1808} {"train_loss": -6.161297798156738, "global_step": 75946, "epoch": 1808} {"train_loss": -6.022326946258545, "global_step": 75947, "epoch": 1808} {"train_loss": -5.949574947357178, "global_step": 75948, "epoch": 1808} {"train_loss": -6.037508964538574, "global_step": 75949, "epoch": 1808} {"train_loss": -5.954931259155273, "global_step": 75950, "epoch": 1808} {"train_loss": -5.930657386779785, "global_step": 75951, "epoch": 1808} {"train_loss": -6.002328872680664, "global_step": 75952, "epoch": 1808} {"train_loss": -6.126987457275391, "global_step": 75953, "epoch": 1808} {"train_loss": -6.031100749969482, "global_step": 75954, "epoch": 1808} {"train_loss": -6.126345634460449, "global_step": 75955, "epoch": 1808} {"train_loss": -6.145662307739258, "global_step": 75956, "epoch": 1808} {"train_loss": -6.166278839111328, "global_step": 75957, "epoch": 1808} {"train_loss": -6.117289066314697, "global_step": 75958, "epoch": 1808} {"train_loss": -6.119770050048828, "global_step": 75959, "epoch": 1808} {"train_loss": -6.150905132293701, "global_step": 75960, "epoch": 1808} {"train_loss": -6.0806779861450195, "global_step": 75961, "epoch": 1808} {"train_loss": -6.021356582641602, "global_step": 75962, "epoch": 1808} {"train_loss": -6.172194480895996, "global_step": 75963, "epoch": 1808} {"train_loss": -6.0213823318481445, "global_step": 75964, "epoch": 1808} {"train_loss": -6.184642791748047, "global_step": 75965, "epoch": 1808} {"train_loss": -6.143319129943848, "global_step": 75966, "epoch": 1808} {"train_loss": -6.10993766784668, "global_step": 75967, "epoch": 1808} {"train_loss": -6.017838478088379, "global_step": 75968, "epoch": 1808} {"train_loss": -6.221011638641357, "global_step": 75969, "epoch": 1808} {"train_loss": -5.93454647064209, "global_step": 75970, "epoch": 1808} {"train_loss": -6.104007720947266, "global_step": 75971, "epoch": 1808} {"train_loss": -6.185026168823242, "global_step": 75972, "epoch": 1808} {"train_loss": -6.02876615524292, "global_step": 75973, "epoch": 1808} {"train_loss": -6.080944061279297, "global_step": 75974, "epoch": 1808} {"train_loss": -6.102360248565674, "global_step": 75975, "epoch": 1808} {"train_loss": -6.162405014038086, "global_step": 75976, "epoch": 1808} {"train_loss": -6.08459902945019, "global_step": 75977, "epoch": 1808, "val_loss": 62094.15234375} {"train_loss": -6.194392204284668, "global_step": 75978, "epoch": 1809} {"train_loss": -6.095468044281006, "global_step": 75979, "epoch": 1809} {"train_loss": -6.08790397644043, "global_step": 75980, "epoch": 1809} {"train_loss": -6.094610691070557, "global_step": 75981, "epoch": 1809} {"train_loss": -6.2018232345581055, "global_step": 75982, "epoch": 1809} {"train_loss": -6.165914535522461, "global_step": 75983, "epoch": 1809} {"train_loss": -6.232751846313477, "global_step": 75984, "epoch": 1809} {"train_loss": -6.235355377197266, "global_step": 75985, "epoch": 1809} {"train_loss": -6.2297515869140625, "global_step": 75986, "epoch": 1809} {"train_loss": -6.197505474090576, "global_step": 75987, "epoch": 1809} {"train_loss": -6.147881507873535, "global_step": 75988, "epoch": 1809} {"train_loss": -6.175820350646973, "global_step": 75989, "epoch": 1809} {"train_loss": -6.273655891418457, "global_step": 75990, "epoch": 1809} {"train_loss": -5.9923200607299805, "global_step": 75991, "epoch": 1809} {"train_loss": -6.128528594970703, "global_step": 75992, "epoch": 1809} {"train_loss": -6.085395812988281, "global_step": 75993, "epoch": 1809} {"train_loss": -6.037718772888184, "global_step": 75994, "epoch": 1809} {"train_loss": -6.123936653137207, "global_step": 75995, "epoch": 1809} {"train_loss": -6.01738166809082, "global_step": 75996, "epoch": 1809} {"train_loss": -6.121872901916504, "global_step": 75997, "epoch": 1809} {"train_loss": -6.184882164001465, "global_step": 75998, "epoch": 1809} {"train_loss": -6.102971076965332, "global_step": 75999, "epoch": 1809} {"train_loss": -6.1274824142456055, "global_step": 76000, "epoch": 1809} {"train_loss": -6.147795677185059, "global_step": 76001, "epoch": 1809} {"train_loss": -6.049734115600586, "global_step": 76002, "epoch": 1809} {"train_loss": -6.116209030151367, "global_step": 76003, "epoch": 1809} {"train_loss": -6.035577297210693, "global_step": 76004, "epoch": 1809} {"train_loss": -6.0337324142456055, "global_step": 76005, "epoch": 1809} {"train_loss": -6.210144996643066, "global_step": 76006, "epoch": 1809} {"train_loss": -6.066924095153809, "global_step": 76007, "epoch": 1809} {"train_loss": -5.996152877807617, "global_step": 76008, "epoch": 1809} {"train_loss": -6.2759246826171875, "global_step": 76009, "epoch": 1809} {"train_loss": -6.149822235107422, "global_step": 76010, "epoch": 1809} {"train_loss": -6.013937950134277, "global_step": 76011, "epoch": 1809} {"train_loss": -6.1340742111206055, "global_step": 76012, "epoch": 1809} {"train_loss": -6.041568756103516, "global_step": 76013, "epoch": 1809} {"train_loss": -6.09837532043457, "global_step": 76014, "epoch": 1809} {"train_loss": -6.088104724884033, "global_step": 76015, "epoch": 1809} {"train_loss": -6.033462047576904, "global_step": 76016, "epoch": 1809} {"train_loss": -6.197484970092773, "global_step": 76017, "epoch": 1809} {"train_loss": -6.163487434387207, "global_step": 76018, "epoch": 1809} {"train_loss": -6.123285395758493, "global_step": 76019, "epoch": 1809, "val_loss": 61935.1796875} {"train_loss": -6.124265193939209, "global_step": 76020, "epoch": 1810} {"train_loss": -6.13565731048584, "global_step": 76021, "epoch": 1810} {"train_loss": -6.1110687255859375, "global_step": 76022, "epoch": 1810} {"train_loss": -6.100763320922852, "global_step": 76023, "epoch": 1810} {"train_loss": -6.215570449829102, "global_step": 76024, "epoch": 1810} {"train_loss": -6.083547592163086, "global_step": 76025, "epoch": 1810} {"train_loss": -6.052879810333252, "global_step": 76026, "epoch": 1810} {"train_loss": -6.170503616333008, "global_step": 76027, "epoch": 1810} {"train_loss": -6.047399520874023, "global_step": 76028, "epoch": 1810} {"train_loss": -6.143251895904541, "global_step": 76029, "epoch": 1810} {"train_loss": -6.083129405975342, "global_step": 76030, "epoch": 1810} {"train_loss": -6.010553359985352, "global_step": 76031, "epoch": 1810} {"train_loss": -6.044106960296631, "global_step": 76032, "epoch": 1810} {"train_loss": -6.107439041137695, "global_step": 76033, "epoch": 1810} {"train_loss": -6.1136274337768555, "global_step": 76034, "epoch": 1810} {"train_loss": -6.112123966217041, "global_step": 76035, "epoch": 1810} {"train_loss": -6.136441230773926, "global_step": 76036, "epoch": 1810} {"train_loss": -6.032716751098633, "global_step": 76037, "epoch": 1810} {"train_loss": -6.197210311889648, "global_step": 76038, "epoch": 1810} {"train_loss": -6.173618316650391, "global_step": 76039, "epoch": 1810} {"train_loss": -6.018424034118652, "global_step": 76040, "epoch": 1810} {"train_loss": -6.1087141036987305, "global_step": 76041, "epoch": 1810} {"train_loss": -6.035918235778809, "global_step": 76042, "epoch": 1810} {"train_loss": -6.1648030281066895, "global_step": 76043, "epoch": 1810} {"train_loss": -6.179086685180664, "global_step": 76044, "epoch": 1810} {"train_loss": -6.192221641540527, "global_step": 76045, "epoch": 1810} {"train_loss": -6.047369003295898, "global_step": 76046, "epoch": 1810} {"train_loss": -6.16917610168457, "global_step": 76047, "epoch": 1810} {"train_loss": -6.216150760650635, "global_step": 76048, "epoch": 1810} {"train_loss": -6.167152404785156, "global_step": 76049, "epoch": 1810} {"train_loss": -6.037199020385742, "global_step": 76050, "epoch": 1810} {"train_loss": -6.294135093688965, "global_step": 76051, "epoch": 1810} {"train_loss": -6.211947917938232, "global_step": 76052, "epoch": 1810} {"train_loss": -6.17017126083374, "global_step": 76053, "epoch": 1810} {"train_loss": -6.154475212097168, "global_step": 76054, "epoch": 1810} {"train_loss": -6.078102111816406, "global_step": 76055, "epoch": 1810} {"train_loss": -6.084332466125488, "global_step": 76056, "epoch": 1810} {"train_loss": -5.955033779144287, "global_step": 76057, "epoch": 1810} {"train_loss": -6.073822021484375, "global_step": 76058, "epoch": 1810} {"train_loss": -5.943536281585693, "global_step": 76059, "epoch": 1810} {"train_loss": -6.1102614402771, "global_step": 76060, "epoch": 1810} {"train_loss": -6.1102210112980435, "global_step": 76061, "epoch": 1810, "val_loss": 61911.3671875} {"train_loss": -6.125502586364746, "global_step": 76062, "epoch": 1811} {"train_loss": -6.096921920776367, "global_step": 76063, "epoch": 1811} {"train_loss": -6.242169380187988, "global_step": 76064, "epoch": 1811} {"train_loss": -6.131329536437988, "global_step": 76065, "epoch": 1811} {"train_loss": -6.07732629776001, "global_step": 76066, "epoch": 1811} {"train_loss": -6.143179893493652, "global_step": 76067, "epoch": 1811} {"train_loss": -6.042843818664551, "global_step": 76068, "epoch": 1811} {"train_loss": -6.100891590118408, "global_step": 76069, "epoch": 1811} {"train_loss": -6.12943172454834, "global_step": 76070, "epoch": 1811} {"train_loss": -6.087732315063477, "global_step": 76071, "epoch": 1811} {"train_loss": -6.162473678588867, "global_step": 76072, "epoch": 1811} {"train_loss": -6.095307350158691, "global_step": 76073, "epoch": 1811} {"train_loss": -5.97935676574707, "global_step": 76074, "epoch": 1811} {"train_loss": -6.115168571472168, "global_step": 76075, "epoch": 1811} {"train_loss": -6.038552284240723, "global_step": 76076, "epoch": 1811} {"train_loss": -6.137054443359375, "global_step": 76077, "epoch": 1811} {"train_loss": -6.146622657775879, "global_step": 76078, "epoch": 1811} {"train_loss": -6.108501434326172, "global_step": 76079, "epoch": 1811} {"train_loss": -6.112444877624512, "global_step": 76080, "epoch": 1811} {"train_loss": -6.140229225158691, "global_step": 76081, "epoch": 1811} {"train_loss": -6.011908531188965, "global_step": 76082, "epoch": 1811} {"train_loss": -6.097606658935547, "global_step": 76083, "epoch": 1811} {"train_loss": -6.04878044128418, "global_step": 76084, "epoch": 1811} {"train_loss": -6.0477495193481445, "global_step": 76085, "epoch": 1811} {"train_loss": -6.104706764221191, "global_step": 76086, "epoch": 1811} {"train_loss": -6.10183048248291, "global_step": 76087, "epoch": 1811} {"train_loss": -5.90516471862793, "global_step": 76088, "epoch": 1811} {"train_loss": -6.0978803634643555, "global_step": 76089, "epoch": 1811} {"train_loss": -5.986867904663086, "global_step": 76090, "epoch": 1811} {"train_loss": -6.03728723526001, "global_step": 76091, "epoch": 1811} {"train_loss": -6.004461765289307, "global_step": 76092, "epoch": 1811} {"train_loss": -5.989916801452637, "global_step": 76093, "epoch": 1811} {"train_loss": -6.159267902374268, "global_step": 76094, "epoch": 1811} {"train_loss": -5.977875709533691, "global_step": 76095, "epoch": 1811} {"train_loss": -6.01231575012207, "global_step": 76096, "epoch": 1811} {"train_loss": -5.992388725280762, "global_step": 76097, "epoch": 1811} {"train_loss": -5.989898681640625, "global_step": 76098, "epoch": 1811} {"train_loss": -6.053255081176758, "global_step": 76099, "epoch": 1811} {"train_loss": -6.035879135131836, "global_step": 76100, "epoch": 1811} {"train_loss": -6.072574138641357, "global_step": 76101, "epoch": 1811} {"train_loss": -6.057807445526123, "global_step": 76102, "epoch": 1811} {"train_loss": -6.069989658537365, "global_step": 76103, "epoch": 1811, "val_loss": 62094.25390625} {"train_loss": -6.08848762512207, "global_step": 76104, "epoch": 1812} {"train_loss": -6.031312465667725, "global_step": 76105, "epoch": 1812} {"train_loss": -6.083894729614258, "global_step": 76106, "epoch": 1812} {"train_loss": -6.111905097961426, "global_step": 76107, "epoch": 1812} {"train_loss": -6.099856376647949, "global_step": 76108, "epoch": 1812} {"train_loss": -6.15134334564209, "global_step": 76109, "epoch": 1812} {"train_loss": -6.148179054260254, "global_step": 76110, "epoch": 1812} {"train_loss": -6.0933122634887695, "global_step": 76111, "epoch": 1812} {"train_loss": -6.077834129333496, "global_step": 76112, "epoch": 1812} {"train_loss": -6.107027053833008, "global_step": 76113, "epoch": 1812} {"train_loss": -6.129827976226807, "global_step": 76114, "epoch": 1812} {"train_loss": -6.129282474517822, "global_step": 76115, "epoch": 1812} {"train_loss": -6.202259063720703, "global_step": 76116, "epoch": 1812} {"train_loss": -6.105420112609863, "global_step": 76117, "epoch": 1812} {"train_loss": -6.095463275909424, "global_step": 76118, "epoch": 1812} {"train_loss": -6.095646858215332, "global_step": 76119, "epoch": 1812} {"train_loss": -6.110540866851807, "global_step": 76120, "epoch": 1812} {"train_loss": -6.064234256744385, "global_step": 76121, "epoch": 1812} {"train_loss": -6.004795074462891, "global_step": 76122, "epoch": 1812} {"train_loss": -6.149643898010254, "global_step": 76123, "epoch": 1812} {"train_loss": -6.257345199584961, "global_step": 76124, "epoch": 1812} {"train_loss": -6.136248588562012, "global_step": 76125, "epoch": 1812} {"train_loss": -6.174429893493652, "global_step": 76126, "epoch": 1812} {"train_loss": -6.156167507171631, "global_step": 76127, "epoch": 1812} {"train_loss": -6.072415828704834, "global_step": 76128, "epoch": 1812} {"train_loss": -6.087705612182617, "global_step": 76129, "epoch": 1812} {"train_loss": -6.110828399658203, "global_step": 76130, "epoch": 1812} {"train_loss": -6.119645595550537, "global_step": 76131, "epoch": 1812} {"train_loss": -6.068210124969482, "global_step": 76132, "epoch": 1812} {"train_loss": -6.205168724060059, "global_step": 76133, "epoch": 1812} {"train_loss": -6.148384094238281, "global_step": 76134, "epoch": 1812} {"train_loss": -5.969367504119873, "global_step": 76135, "epoch": 1812} {"train_loss": -5.941064834594727, "global_step": 76136, "epoch": 1812} {"train_loss": -6.0789384841918945, "global_step": 76137, "epoch": 1812} {"train_loss": -6.066904544830322, "global_step": 76138, "epoch": 1812} {"train_loss": -6.173099517822266, "global_step": 76139, "epoch": 1812} {"train_loss": -6.0689544677734375, "global_step": 76140, "epoch": 1812} {"train_loss": -6.0625, "global_step": 76141, "epoch": 1812} {"train_loss": -6.0264387130737305, "global_step": 76142, "epoch": 1812} {"train_loss": -6.098281383514404, "global_step": 76143, "epoch": 1812} {"train_loss": -6.157419204711914, "global_step": 76144, "epoch": 1812} {"train_loss": -6.105389095488048, "global_step": 76145, "epoch": 1812, "val_loss": 62373.40625} {"train_loss": -5.9575347900390625, "global_step": 76146, "epoch": 1813} {"train_loss": -6.092154502868652, "global_step": 76147, "epoch": 1813} {"train_loss": -6.053499221801758, "global_step": 76148, "epoch": 1813} {"train_loss": -6.137948513031006, "global_step": 76149, "epoch": 1813} {"train_loss": -6.04887580871582, "global_step": 76150, "epoch": 1813} {"train_loss": -6.124861717224121, "global_step": 76151, "epoch": 1813} {"train_loss": -6.076676368713379, "global_step": 76152, "epoch": 1813} {"train_loss": -5.956066131591797, "global_step": 76153, "epoch": 1813} {"train_loss": -6.126880168914795, "global_step": 76154, "epoch": 1813} {"train_loss": -5.9947028160095215, "global_step": 76155, "epoch": 1813} {"train_loss": -6.001359939575195, "global_step": 76156, "epoch": 1813} {"train_loss": -6.0948591232299805, "global_step": 76157, "epoch": 1813} {"train_loss": -6.088674545288086, "global_step": 76158, "epoch": 1813} {"train_loss": -6.126430988311768, "global_step": 76159, "epoch": 1813} {"train_loss": -6.035510540008545, "global_step": 76160, "epoch": 1813} {"train_loss": -6.056513786315918, "global_step": 76161, "epoch": 1813} {"train_loss": -6.013589382171631, "global_step": 76162, "epoch": 1813} {"train_loss": -6.228124141693115, "global_step": 76163, "epoch": 1813} {"train_loss": -6.117264747619629, "global_step": 76164, "epoch": 1813} {"train_loss": -6.037315845489502, "global_step": 76165, "epoch": 1813} {"train_loss": -6.096874713897705, "global_step": 76166, "epoch": 1813} {"train_loss": -6.070199012756348, "global_step": 76167, "epoch": 1813} {"train_loss": -6.0267229080200195, "global_step": 76168, "epoch": 1813} {"train_loss": -6.1544694900512695, "global_step": 76169, "epoch": 1813} {"train_loss": -6.100121021270752, "global_step": 76170, "epoch": 1813} {"train_loss": -6.201178550720215, "global_step": 76171, "epoch": 1813} {"train_loss": -6.030973434448242, "global_step": 76172, "epoch": 1813} {"train_loss": -6.2078657150268555, "global_step": 76173, "epoch": 1813} {"train_loss": -6.206712245941162, "global_step": 76174, "epoch": 1813} {"train_loss": -6.152250289916992, "global_step": 76175, "epoch": 1813} {"train_loss": -6.010132312774658, "global_step": 76176, "epoch": 1813} {"train_loss": -6.142698764801025, "global_step": 76177, "epoch": 1813} {"train_loss": -6.188992023468018, "global_step": 76178, "epoch": 1813} {"train_loss": -6.0366411209106445, "global_step": 76179, "epoch": 1813} {"train_loss": -6.10371208190918, "global_step": 76180, "epoch": 1813} {"train_loss": -6.0505266189575195, "global_step": 76181, "epoch": 1813} {"train_loss": -6.0493364334106445, "global_step": 76182, "epoch": 1813} {"train_loss": -6.0448431968688965, "global_step": 76183, "epoch": 1813} {"train_loss": -6.0704545974731445, "global_step": 76184, "epoch": 1813} {"train_loss": -5.96839714050293, "global_step": 76185, "epoch": 1813} {"train_loss": -6.0713582038879395, "global_step": 76186, "epoch": 1813} {"train_loss": -6.0756309032440186, "global_step": 76187, "epoch": 1813, "val_loss": 62215.4296875} {"train_loss": -6.048725128173828, "global_step": 76188, "epoch": 1814} {"train_loss": -6.071287155151367, "global_step": 76189, "epoch": 1814} {"train_loss": -6.056161880493164, "global_step": 76190, "epoch": 1814} {"train_loss": -6.1419782638549805, "global_step": 76191, "epoch": 1814} {"train_loss": -6.001099109649658, "global_step": 76192, "epoch": 1814} {"train_loss": -6.111330509185791, "global_step": 76193, "epoch": 1814} {"train_loss": -6.019554615020752, "global_step": 76194, "epoch": 1814} {"train_loss": -6.073524475097656, "global_step": 76195, "epoch": 1814} {"train_loss": -6.114206314086914, "global_step": 76196, "epoch": 1814} {"train_loss": -6.081015586853027, "global_step": 76197, "epoch": 1814} {"train_loss": -6.051840782165527, "global_step": 76198, "epoch": 1814} {"train_loss": -6.107484817504883, "global_step": 76199, "epoch": 1814} {"train_loss": -6.160489082336426, "global_step": 76200, "epoch": 1814} {"train_loss": -6.146850109100342, "global_step": 76201, "epoch": 1814} {"train_loss": -6.062098026275635, "global_step": 76202, "epoch": 1814} {"train_loss": -6.052917957305908, "global_step": 76203, "epoch": 1814} {"train_loss": -6.1737751960754395, "global_step": 76204, "epoch": 1814} {"train_loss": -6.072011947631836, "global_step": 76205, "epoch": 1814} {"train_loss": -6.093494415283203, "global_step": 76206, "epoch": 1814} {"train_loss": -6.196290969848633, "global_step": 76207, "epoch": 1814} {"train_loss": -6.128558158874512, "global_step": 76208, "epoch": 1814} {"train_loss": -6.168893337249756, "global_step": 76209, "epoch": 1814} {"train_loss": -6.013518810272217, "global_step": 76210, "epoch": 1814} {"train_loss": -6.06502628326416, "global_step": 76211, "epoch": 1814} {"train_loss": -6.107058525085449, "global_step": 76212, "epoch": 1814} {"train_loss": -6.111580848693848, "global_step": 76213, "epoch": 1814} {"train_loss": -6.06028413772583, "global_step": 76214, "epoch": 1814} {"train_loss": -6.117207050323486, "global_step": 76215, "epoch": 1814} {"train_loss": -6.13606595993042, "global_step": 76216, "epoch": 1814} {"train_loss": -6.070066452026367, "global_step": 76217, "epoch": 1814} {"train_loss": -6.102412223815918, "global_step": 76218, "epoch": 1814} {"train_loss": -6.117812156677246, "global_step": 76219, "epoch": 1814} {"train_loss": -6.088134765625, "global_step": 76220, "epoch": 1814} {"train_loss": -6.071386337280273, "global_step": 76221, "epoch": 1814} {"train_loss": -6.0591044425964355, "global_step": 76222, "epoch": 1814} {"train_loss": -6.036823272705078, "global_step": 76223, "epoch": 1814} {"train_loss": -6.040366172790527, "global_step": 76224, "epoch": 1814} {"train_loss": -5.983035087585449, "global_step": 76225, "epoch": 1814} {"train_loss": -6.116097450256348, "global_step": 76226, "epoch": 1814} {"train_loss": -6.0823163986206055, "global_step": 76227, "epoch": 1814} {"train_loss": -5.989405632019043, "global_step": 76228, "epoch": 1814} {"train_loss": -6.086675893692743, "global_step": 76229, "epoch": 1814, "val_loss": 62180.40625} {"train_loss": -6.060849189758301, "global_step": 76230, "epoch": 1815} {"train_loss": -6.131621360778809, "global_step": 76231, "epoch": 1815} {"train_loss": -5.993159294128418, "global_step": 76232, "epoch": 1815} {"train_loss": -6.136752605438232, "global_step": 76233, "epoch": 1815} {"train_loss": -6.086943626403809, "global_step": 76234, "epoch": 1815} {"train_loss": -6.087568283081055, "global_step": 76235, "epoch": 1815} {"train_loss": -6.083197593688965, "global_step": 76236, "epoch": 1815} {"train_loss": -6.085536956787109, "global_step": 76237, "epoch": 1815} {"train_loss": -6.1366496086120605, "global_step": 76238, "epoch": 1815} {"train_loss": -6.060860633850098, "global_step": 76239, "epoch": 1815} {"train_loss": -6.144286632537842, "global_step": 76240, "epoch": 1815} {"train_loss": -6.089022636413574, "global_step": 76241, "epoch": 1815} {"train_loss": -6.168379306793213, "global_step": 76242, "epoch": 1815} {"train_loss": -6.116188049316406, "global_step": 76243, "epoch": 1815} {"train_loss": -6.18222188949585, "global_step": 76244, "epoch": 1815} {"train_loss": -6.054448127746582, "global_step": 76245, "epoch": 1815} {"train_loss": -6.148966312408447, "global_step": 76246, "epoch": 1815} {"train_loss": -6.1044464111328125, "global_step": 76247, "epoch": 1815} {"train_loss": -6.121553421020508, "global_step": 76248, "epoch": 1815} {"train_loss": -6.105067253112793, "global_step": 76249, "epoch": 1815} {"train_loss": -6.084947109222412, "global_step": 76250, "epoch": 1815} {"train_loss": -6.025693416595459, "global_step": 76251, "epoch": 1815} {"train_loss": -5.990399360656738, "global_step": 76252, "epoch": 1815} {"train_loss": -6.040487289428711, "global_step": 76253, "epoch": 1815} {"train_loss": -6.131836891174316, "global_step": 76254, "epoch": 1815} {"train_loss": -6.120961666107178, "global_step": 76255, "epoch": 1815} {"train_loss": -6.036198616027832, "global_step": 76256, "epoch": 1815} {"train_loss": -6.151163578033447, "global_step": 76257, "epoch": 1815} {"train_loss": -5.9896135330200195, "global_step": 76258, "epoch": 1815} {"train_loss": -6.0085649490356445, "global_step": 76259, "epoch": 1815} {"train_loss": -6.101891994476318, "global_step": 76260, "epoch": 1815} {"train_loss": -5.990211486816406, "global_step": 76261, "epoch": 1815} {"train_loss": -6.044747352600098, "global_step": 76262, "epoch": 1815} {"train_loss": -5.988883018493652, "global_step": 76263, "epoch": 1815} {"train_loss": -6.069343090057373, "global_step": 76264, "epoch": 1815} {"train_loss": -6.101670742034912, "global_step": 76265, "epoch": 1815} {"train_loss": -6.054500579833984, "global_step": 76266, "epoch": 1815} {"train_loss": -5.984185218811035, "global_step": 76267, "epoch": 1815} {"train_loss": -6.076618194580078, "global_step": 76268, "epoch": 1815} {"train_loss": -6.091771125793457, "global_step": 76269, "epoch": 1815} {"train_loss": -6.075103282928467, "global_step": 76270, "epoch": 1815} {"train_loss": -6.080305916922433, "global_step": 76271, "epoch": 1815, "val_loss": 62065.10546875} {"train_loss": -6.043003082275391, "global_step": 76272, "epoch": 1816} {"train_loss": -6.043674468994141, "global_step": 76273, "epoch": 1816} {"train_loss": -6.1325788497924805, "global_step": 76274, "epoch": 1816} {"train_loss": -6.304389476776123, "global_step": 76275, "epoch": 1816} {"train_loss": -6.149738311767578, "global_step": 76276, "epoch": 1816} {"train_loss": -6.085353374481201, "global_step": 76277, "epoch": 1816} {"train_loss": -5.9239959716796875, "global_step": 76278, "epoch": 1816} {"train_loss": -6.119875907897949, "global_step": 76279, "epoch": 1816} {"train_loss": -6.107229232788086, "global_step": 76280, "epoch": 1816} {"train_loss": -6.083418846130371, "global_step": 76281, "epoch": 1816} {"train_loss": -6.102064609527588, "global_step": 76282, "epoch": 1816} {"train_loss": -6.050286293029785, "global_step": 76283, "epoch": 1816} {"train_loss": -6.037954807281494, "global_step": 76284, "epoch": 1816} {"train_loss": -6.223383903503418, "global_step": 76285, "epoch": 1816} {"train_loss": -6.061054706573486, "global_step": 76286, "epoch": 1816} {"train_loss": -6.0698137283325195, "global_step": 76287, "epoch": 1816} {"train_loss": -6.200837135314941, "global_step": 76288, "epoch": 1816} {"train_loss": -6.2223124504089355, "global_step": 76289, "epoch": 1816} {"train_loss": -6.167043685913086, "global_step": 76290, "epoch": 1816} {"train_loss": -6.199765205383301, "global_step": 76291, "epoch": 1816} {"train_loss": -6.144571781158447, "global_step": 76292, "epoch": 1816} {"train_loss": -6.123976707458496, "global_step": 76293, "epoch": 1816} {"train_loss": -6.076930046081543, "global_step": 76294, "epoch": 1816} {"train_loss": -6.106705188751221, "global_step": 76295, "epoch": 1816} {"train_loss": -6.124977111816406, "global_step": 76296, "epoch": 1816} {"train_loss": -6.184069633483887, "global_step": 76297, "epoch": 1816} {"train_loss": -6.123449325561523, "global_step": 76298, "epoch": 1816} {"train_loss": -6.189388275146484, "global_step": 76299, "epoch": 1816} {"train_loss": -6.138210296630859, "global_step": 76300, "epoch": 1816} {"train_loss": -6.056612968444824, "global_step": 76301, "epoch": 1816} {"train_loss": -6.131933212280273, "global_step": 76302, "epoch": 1816} {"train_loss": -6.082388401031494, "global_step": 76303, "epoch": 1816} {"train_loss": -5.980619430541992, "global_step": 76304, "epoch": 1816} {"train_loss": -6.012180805206299, "global_step": 76305, "epoch": 1816} {"train_loss": -6.127013683319092, "global_step": 76306, "epoch": 1816} {"train_loss": -5.956394195556641, "global_step": 76307, "epoch": 1816} {"train_loss": -6.009029388427734, "global_step": 76308, "epoch": 1816} {"train_loss": -6.253061294555664, "global_step": 76309, "epoch": 1816} {"train_loss": -6.195882320404053, "global_step": 76310, "epoch": 1816} {"train_loss": -6.128509998321533, "global_step": 76311, "epoch": 1816} {"train_loss": -6.073678016662598, "global_step": 76312, "epoch": 1816} {"train_loss": -6.107827288763864, "global_step": 76313, "epoch": 1816, "val_loss": 62086.7109375} {"train_loss": -6.025397300720215, "global_step": 76314, "epoch": 1817} {"train_loss": -5.954268932342529, "global_step": 76315, "epoch": 1817} {"train_loss": -6.110738754272461, "global_step": 76316, "epoch": 1817} {"train_loss": -5.9596357345581055, "global_step": 76317, "epoch": 1817} {"train_loss": -6.130929470062256, "global_step": 76318, "epoch": 1817} {"train_loss": -6.156431198120117, "global_step": 76319, "epoch": 1817} {"train_loss": -5.884145736694336, "global_step": 76320, "epoch": 1817} {"train_loss": -5.976081848144531, "global_step": 76321, "epoch": 1817} {"train_loss": -6.045353412628174, "global_step": 76322, "epoch": 1817} {"train_loss": -5.9863176345825195, "global_step": 76323, "epoch": 1817} {"train_loss": -6.034062385559082, "global_step": 76324, "epoch": 1817} {"train_loss": -5.958776473999023, "global_step": 76325, "epoch": 1817} {"train_loss": -6.116530418395996, "global_step": 76326, "epoch": 1817} {"train_loss": -6.012781143188477, "global_step": 76327, "epoch": 1817} {"train_loss": -6.076509475708008, "global_step": 76328, "epoch": 1817} {"train_loss": -6.147632122039795, "global_step": 76329, "epoch": 1817} {"train_loss": -6.0106964111328125, "global_step": 76330, "epoch": 1817} {"train_loss": -6.132885932922363, "global_step": 76331, "epoch": 1817} {"train_loss": -6.132658004760742, "global_step": 76332, "epoch": 1817} {"train_loss": -6.012483596801758, "global_step": 76333, "epoch": 1817} {"train_loss": -6.072770118713379, "global_step": 76334, "epoch": 1817} {"train_loss": -6.070406436920166, "global_step": 76335, "epoch": 1817} {"train_loss": -6.116886138916016, "global_step": 76336, "epoch": 1817} {"train_loss": -6.058194160461426, "global_step": 76337, "epoch": 1817} {"train_loss": -6.036736488342285, "global_step": 76338, "epoch": 1817} {"train_loss": -6.008594512939453, "global_step": 76339, "epoch": 1817} {"train_loss": -6.275219917297363, "global_step": 76340, "epoch": 1817} {"train_loss": -6.056763172149658, "global_step": 76341, "epoch": 1817} {"train_loss": -6.037606239318848, "global_step": 76342, "epoch": 1817} {"train_loss": -6.084413528442383, "global_step": 76343, "epoch": 1817} {"train_loss": -6.162132740020752, "global_step": 76344, "epoch": 1817} {"train_loss": -6.071378707885742, "global_step": 76345, "epoch": 1817} {"train_loss": -6.135223388671875, "global_step": 76346, "epoch": 1817} {"train_loss": -6.087246894836426, "global_step": 76347, "epoch": 1817} {"train_loss": -6.081182479858398, "global_step": 76348, "epoch": 1817} {"train_loss": -6.288952350616455, "global_step": 76349, "epoch": 1817} {"train_loss": -6.134367942810059, "global_step": 76350, "epoch": 1817} {"train_loss": -6.101795196533203, "global_step": 76351, "epoch": 1817} {"train_loss": -6.126605033874512, "global_step": 76352, "epoch": 1817} {"train_loss": -6.137322902679443, "global_step": 76353, "epoch": 1817} {"train_loss": -6.023019790649414, "global_step": 76354, "epoch": 1817} {"train_loss": -6.075206608999343, "global_step": 76355, "epoch": 1817, "val_loss": 61747.15234375} {"train_loss": -6.143157958984375, "global_step": 76356, "epoch": 1818} {"train_loss": -6.024506568908691, "global_step": 76357, "epoch": 1818} {"train_loss": -6.248887062072754, "global_step": 76358, "epoch": 1818} {"train_loss": -6.218704700469971, "global_step": 76359, "epoch": 1818} {"train_loss": -6.146690368652344, "global_step": 76360, "epoch": 1818} {"train_loss": -6.192928314208984, "global_step": 76361, "epoch": 1818} {"train_loss": -6.0623273849487305, "global_step": 76362, "epoch": 1818} {"train_loss": -6.155089855194092, "global_step": 76363, "epoch": 1818} {"train_loss": -6.13236141204834, "global_step": 76364, "epoch": 1818} {"train_loss": -6.124133110046387, "global_step": 76365, "epoch": 1818} {"train_loss": -6.138271331787109, "global_step": 76366, "epoch": 1818} {"train_loss": -6.269491195678711, "global_step": 76367, "epoch": 1818} {"train_loss": -6.1166863441467285, "global_step": 76368, "epoch": 1818} {"train_loss": -6.199675559997559, "global_step": 76369, "epoch": 1818} {"train_loss": -6.067082405090332, "global_step": 76370, "epoch": 1818} {"train_loss": -6.161257743835449, "global_step": 76371, "epoch": 1818} {"train_loss": -6.135087966918945, "global_step": 76372, "epoch": 1818} {"train_loss": -6.14137077331543, "global_step": 76373, "epoch": 1818} {"train_loss": -6.216211318969727, "global_step": 76374, "epoch": 1818} {"train_loss": -5.986550331115723, "global_step": 76375, "epoch": 1818} {"train_loss": -6.170048236846924, "global_step": 76376, "epoch": 1818} {"train_loss": -6.0950798988342285, "global_step": 76377, "epoch": 1818} {"train_loss": -6.089598178863525, "global_step": 76378, "epoch": 1818} {"train_loss": -6.112570762634277, "global_step": 76379, "epoch": 1818} {"train_loss": -6.144045352935791, "global_step": 76380, "epoch": 1818} {"train_loss": -6.057680130004883, "global_step": 76381, "epoch": 1818} {"train_loss": -6.163022994995117, "global_step": 76382, "epoch": 1818} {"train_loss": -6.097243785858154, "global_step": 76383, "epoch": 1818} {"train_loss": -6.164587497711182, "global_step": 76384, "epoch": 1818} {"train_loss": -6.189602851867676, "global_step": 76385, "epoch": 1818} {"train_loss": -6.1704206466674805, "global_step": 76386, "epoch": 1818} {"train_loss": -6.2272233963012695, "global_step": 76387, "epoch": 1818} {"train_loss": -6.147726058959961, "global_step": 76388, "epoch": 1818} {"train_loss": -6.051701545715332, "global_step": 76389, "epoch": 1818} {"train_loss": -6.108489990234375, "global_step": 76390, "epoch": 1818} {"train_loss": -6.022582054138184, "global_step": 76391, "epoch": 1818} {"train_loss": -6.124011993408203, "global_step": 76392, "epoch": 1818} {"train_loss": -6.1511149406433105, "global_step": 76393, "epoch": 1818} {"train_loss": -6.103360176086426, "global_step": 76394, "epoch": 1818} {"train_loss": -6.169157981872559, "global_step": 76395, "epoch": 1818} {"train_loss": -6.182760238647461, "global_step": 76396, "epoch": 1818} {"train_loss": -6.134304705120268, "global_step": 76397, "epoch": 1818, "val_loss": 62051.12109375} {"train_loss": -6.03498649597168, "global_step": 76398, "epoch": 1819} {"train_loss": -6.101357460021973, "global_step": 76399, "epoch": 1819} {"train_loss": -6.187990665435791, "global_step": 76400, "epoch": 1819} {"train_loss": -6.063656806945801, "global_step": 76401, "epoch": 1819} {"train_loss": -6.145463943481445, "global_step": 76402, "epoch": 1819} {"train_loss": -6.181601524353027, "global_step": 76403, "epoch": 1819} {"train_loss": -6.033079147338867, "global_step": 76404, "epoch": 1819} {"train_loss": -6.092881202697754, "global_step": 76405, "epoch": 1819} {"train_loss": -6.090065002441406, "global_step": 76406, "epoch": 1819} {"train_loss": -6.025370121002197, "global_step": 76407, "epoch": 1819} {"train_loss": -6.123261451721191, "global_step": 76408, "epoch": 1819} {"train_loss": -6.020174503326416, "global_step": 76409, "epoch": 1819} {"train_loss": -6.037544250488281, "global_step": 76410, "epoch": 1819} {"train_loss": -6.186865329742432, "global_step": 76411, "epoch": 1819} {"train_loss": -6.073269844055176, "global_step": 76412, "epoch": 1819} {"train_loss": -6.149158000946045, "global_step": 76413, "epoch": 1819} {"train_loss": -6.073875427246094, "global_step": 76414, "epoch": 1819} {"train_loss": -6.154184818267822, "global_step": 76415, "epoch": 1819} {"train_loss": -6.172362327575684, "global_step": 76416, "epoch": 1819} {"train_loss": -6.017734527587891, "global_step": 76417, "epoch": 1819} {"train_loss": -6.074820518493652, "global_step": 76418, "epoch": 1819} {"train_loss": -6.191399574279785, "global_step": 76419, "epoch": 1819} {"train_loss": -6.092149257659912, "global_step": 76420, "epoch": 1819} {"train_loss": -6.206338405609131, "global_step": 76421, "epoch": 1819} {"train_loss": -6.166126728057861, "global_step": 76422, "epoch": 1819} {"train_loss": -6.041871547698975, "global_step": 76423, "epoch": 1819} {"train_loss": -6.150622844696045, "global_step": 76424, "epoch": 1819} {"train_loss": -6.033853530883789, "global_step": 76425, "epoch": 1819} {"train_loss": -6.133573532104492, "global_step": 76426, "epoch": 1819} {"train_loss": -6.079144477844238, "global_step": 76427, "epoch": 1819} {"train_loss": -6.262170314788818, "global_step": 76428, "epoch": 1819} {"train_loss": -6.064965724945068, "global_step": 76429, "epoch": 1819} {"train_loss": -6.155117988586426, "global_step": 76430, "epoch": 1819} {"train_loss": -6.138011932373047, "global_step": 76431, "epoch": 1819} {"train_loss": -6.230433464050293, "global_step": 76432, "epoch": 1819} {"train_loss": -5.982377052307129, "global_step": 76433, "epoch": 1819} {"train_loss": -6.111072540283203, "global_step": 76434, "epoch": 1819} {"train_loss": -6.166932582855225, "global_step": 76435, "epoch": 1819} {"train_loss": -5.924805641174316, "global_step": 76436, "epoch": 1819} {"train_loss": -6.13261604309082, "global_step": 76437, "epoch": 1819} {"train_loss": -6.035289764404297, "global_step": 76438, "epoch": 1819} {"train_loss": -6.106367440450759, "global_step": 76439, "epoch": 1819, "val_loss": 61965.01953125} {"train_loss": -6.017199993133545, "global_step": 76440, "epoch": 1820} {"train_loss": -6.105620384216309, "global_step": 76441, "epoch": 1820} {"train_loss": -6.120247840881348, "global_step": 76442, "epoch": 1820} {"train_loss": -6.196393966674805, "global_step": 76443, "epoch": 1820} {"train_loss": -6.045320510864258, "global_step": 76444, "epoch": 1820} {"train_loss": -6.072498321533203, "global_step": 76445, "epoch": 1820} {"train_loss": -6.046050548553467, "global_step": 76446, "epoch": 1820} {"train_loss": -6.100496768951416, "global_step": 76447, "epoch": 1820} {"train_loss": -6.157154083251953, "global_step": 76448, "epoch": 1820} {"train_loss": -6.028789043426514, "global_step": 76449, "epoch": 1820} {"train_loss": -6.169478893280029, "global_step": 76450, "epoch": 1820} {"train_loss": -6.115548133850098, "global_step": 76451, "epoch": 1820} {"train_loss": -6.026790618896484, "global_step": 76452, "epoch": 1820} {"train_loss": -6.140970706939697, "global_step": 76453, "epoch": 1820} {"train_loss": -6.146173477172852, "global_step": 76454, "epoch": 1820} {"train_loss": -6.030444145202637, "global_step": 76455, "epoch": 1820} {"train_loss": -6.035017013549805, "global_step": 76456, "epoch": 1820} {"train_loss": -5.94456148147583, "global_step": 76457, "epoch": 1820} {"train_loss": -6.176272392272949, "global_step": 76458, "epoch": 1820} {"train_loss": -6.131124019622803, "global_step": 76459, "epoch": 1820} {"train_loss": -6.040396690368652, "global_step": 76460, "epoch": 1820} {"train_loss": -6.106244087219238, "global_step": 76461, "epoch": 1820} {"train_loss": -6.107723236083984, "global_step": 76462, "epoch": 1820} {"train_loss": -6.178535461425781, "global_step": 76463, "epoch": 1820} {"train_loss": -6.229373455047607, "global_step": 76464, "epoch": 1820} {"train_loss": -6.19310188293457, "global_step": 76465, "epoch": 1820} {"train_loss": -6.169535160064697, "global_step": 76466, "epoch": 1820} {"train_loss": -6.012764930725098, "global_step": 76467, "epoch": 1820} {"train_loss": -6.208345413208008, "global_step": 76468, "epoch": 1820} {"train_loss": -6.118332862854004, "global_step": 76469, "epoch": 1820} {"train_loss": -6.11375093460083, "global_step": 76470, "epoch": 1820} {"train_loss": -6.1444478034973145, "global_step": 76471, "epoch": 1820} {"train_loss": -6.094878196716309, "global_step": 76472, "epoch": 1820} {"train_loss": -5.996537208557129, "global_step": 76473, "epoch": 1820} {"train_loss": -5.994697570800781, "global_step": 76474, "epoch": 1820} {"train_loss": -6.198215484619141, "global_step": 76475, "epoch": 1820} {"train_loss": -6.057603359222412, "global_step": 76476, "epoch": 1820} {"train_loss": -6.109096050262451, "global_step": 76477, "epoch": 1820} {"train_loss": -6.038752555847168, "global_step": 76478, "epoch": 1820} {"train_loss": -6.05239200592041, "global_step": 76479, "epoch": 1820} {"train_loss": -6.118498802185059, "global_step": 76480, "epoch": 1820} {"train_loss": -6.100887639181955, "global_step": 76481, "epoch": 1820, "val_loss": 62192.5625} {"train_loss": -6.057838439941406, "global_step": 76482, "epoch": 1821} {"train_loss": -6.0504231452941895, "global_step": 76483, "epoch": 1821} {"train_loss": -6.116540908813477, "global_step": 76484, "epoch": 1821} {"train_loss": -6.196874618530273, "global_step": 76485, "epoch": 1821} {"train_loss": -5.9451069831848145, "global_step": 76486, "epoch": 1821} {"train_loss": -6.201780319213867, "global_step": 76487, "epoch": 1821} {"train_loss": -6.023423194885254, "global_step": 76488, "epoch": 1821} {"train_loss": -6.082695007324219, "global_step": 76489, "epoch": 1821} {"train_loss": -6.115544319152832, "global_step": 76490, "epoch": 1821} {"train_loss": -6.033079147338867, "global_step": 76491, "epoch": 1821} {"train_loss": -6.125565528869629, "global_step": 76492, "epoch": 1821} {"train_loss": -6.161871910095215, "global_step": 76493, "epoch": 1821} {"train_loss": -6.092162609100342, "global_step": 76494, "epoch": 1821} {"train_loss": -6.065174579620361, "global_step": 76495, "epoch": 1821} {"train_loss": -6.199853897094727, "global_step": 76496, "epoch": 1821} {"train_loss": -6.025406837463379, "global_step": 76497, "epoch": 1821} {"train_loss": -6.163976669311523, "global_step": 76498, "epoch": 1821} {"train_loss": -6.103703022003174, "global_step": 76499, "epoch": 1821} {"train_loss": -6.095151901245117, "global_step": 76500, "epoch": 1821} {"train_loss": -6.087157726287842, "global_step": 76501, "epoch": 1821} {"train_loss": -6.084831237792969, "global_step": 76502, "epoch": 1821} {"train_loss": -6.126953125, "global_step": 76503, "epoch": 1821} {"train_loss": -6.112992286682129, "global_step": 76504, "epoch": 1821} {"train_loss": -6.100431442260742, "global_step": 76505, "epoch": 1821} {"train_loss": -6.099036693572998, "global_step": 76506, "epoch": 1821} {"train_loss": -5.958587646484375, "global_step": 76507, "epoch": 1821} {"train_loss": -6.081072807312012, "global_step": 76508, "epoch": 1821} {"train_loss": -5.922100067138672, "global_step": 76509, "epoch": 1821} {"train_loss": -6.070084571838379, "global_step": 76510, "epoch": 1821} {"train_loss": -6.280989646911621, "global_step": 76511, "epoch": 1821} {"train_loss": -6.145142555236816, "global_step": 76512, "epoch": 1821} {"train_loss": -5.956517219543457, "global_step": 76513, "epoch": 1821} {"train_loss": -6.0996222496032715, "global_step": 76514, "epoch": 1821} {"train_loss": -5.956637382507324, "global_step": 76515, "epoch": 1821} {"train_loss": -6.108885288238525, "global_step": 76516, "epoch": 1821} {"train_loss": -6.085011005401611, "global_step": 76517, "epoch": 1821} {"train_loss": -6.027744293212891, "global_step": 76518, "epoch": 1821} {"train_loss": -6.152166366577148, "global_step": 76519, "epoch": 1821} {"train_loss": -6.1023054122924805, "global_step": 76520, "epoch": 1821} {"train_loss": -6.05049991607666, "global_step": 76521, "epoch": 1821} {"train_loss": -6.155513763427734, "global_step": 76522, "epoch": 1821} {"train_loss": -6.0886865456899, "global_step": 76523, "epoch": 1821, "val_loss": 62139.92578125} {"train_loss": -6.120377540588379, "global_step": 76524, "epoch": 1822} {"train_loss": -6.0687432289123535, "global_step": 76525, "epoch": 1822} {"train_loss": -6.09304141998291, "global_step": 76526, "epoch": 1822} {"train_loss": -6.139235496520996, "global_step": 76527, "epoch": 1822} {"train_loss": -6.2862725257873535, "global_step": 76528, "epoch": 1822} {"train_loss": -6.205986976623535, "global_step": 76529, "epoch": 1822} {"train_loss": -6.119088649749756, "global_step": 76530, "epoch": 1822} {"train_loss": -6.083117485046387, "global_step": 76531, "epoch": 1822} {"train_loss": -6.118536472320557, "global_step": 76532, "epoch": 1822} {"train_loss": -6.154233932495117, "global_step": 76533, "epoch": 1822} {"train_loss": -6.079440116882324, "global_step": 76534, "epoch": 1822} {"train_loss": -6.182570457458496, "global_step": 76535, "epoch": 1822} {"train_loss": -6.13627815246582, "global_step": 76536, "epoch": 1822} {"train_loss": -6.103221893310547, "global_step": 76537, "epoch": 1822} {"train_loss": -6.162635803222656, "global_step": 76538, "epoch": 1822} {"train_loss": -6.053071975708008, "global_step": 76539, "epoch": 1822} {"train_loss": -6.176398754119873, "global_step": 76540, "epoch": 1822} {"train_loss": -6.12902307510376, "global_step": 76541, "epoch": 1822} {"train_loss": -6.180958271026611, "global_step": 76542, "epoch": 1822} {"train_loss": -6.075925350189209, "global_step": 76543, "epoch": 1822} {"train_loss": -6.141322135925293, "global_step": 76544, "epoch": 1822} {"train_loss": -6.088167667388916, "global_step": 76545, "epoch": 1822} {"train_loss": -6.081783771514893, "global_step": 76546, "epoch": 1822} {"train_loss": -6.188641548156738, "global_step": 76547, "epoch": 1822} {"train_loss": -6.156068801879883, "global_step": 76548, "epoch": 1822} {"train_loss": -6.095663070678711, "global_step": 76549, "epoch": 1822} {"train_loss": -6.061065673828125, "global_step": 76550, "epoch": 1822} {"train_loss": -6.106096267700195, "global_step": 76551, "epoch": 1822} {"train_loss": -6.128477096557617, "global_step": 76552, "epoch": 1822} {"train_loss": -6.068939685821533, "global_step": 76553, "epoch": 1822} {"train_loss": -6.167771816253662, "global_step": 76554, "epoch": 1822} {"train_loss": -6.119635581970215, "global_step": 76555, "epoch": 1822} {"train_loss": -6.1200056076049805, "global_step": 76556, "epoch": 1822} {"train_loss": -6.080925464630127, "global_step": 76557, "epoch": 1822} {"train_loss": -6.0862884521484375, "global_step": 76558, "epoch": 1822} {"train_loss": -6.1836323738098145, "global_step": 76559, "epoch": 1822} {"train_loss": -6.190798282623291, "global_step": 76560, "epoch": 1822} {"train_loss": -6.013504981994629, "global_step": 76561, "epoch": 1822} {"train_loss": -6.061009883880615, "global_step": 76562, "epoch": 1822} {"train_loss": -6.0444231033325195, "global_step": 76563, "epoch": 1822} {"train_loss": -5.981884002685547, "global_step": 76564, "epoch": 1822} {"train_loss": -6.11748388835362, "global_step": 76565, "epoch": 1822, "val_loss": 62329.65625} {"train_loss": -6.125372886657715, "global_step": 76566, "epoch": 1823} {"train_loss": -6.158601760864258, "global_step": 76567, "epoch": 1823} {"train_loss": -5.999235153198242, "global_step": 76568, "epoch": 1823} {"train_loss": -6.180475234985352, "global_step": 76569, "epoch": 1823} {"train_loss": -6.189379692077637, "global_step": 76570, "epoch": 1823} {"train_loss": -5.982576370239258, "global_step": 76571, "epoch": 1823} {"train_loss": -6.187683582305908, "global_step": 76572, "epoch": 1823} {"train_loss": -6.05853271484375, "global_step": 76573, "epoch": 1823} {"train_loss": -5.997268199920654, "global_step": 76574, "epoch": 1823} {"train_loss": -6.1400346755981445, "global_step": 76575, "epoch": 1823} {"train_loss": -6.004724025726318, "global_step": 76576, "epoch": 1823} {"train_loss": -6.095937728881836, "global_step": 76577, "epoch": 1823} {"train_loss": -6.144369125366211, "global_step": 76578, "epoch": 1823} {"train_loss": -6.134959697723389, "global_step": 76579, "epoch": 1823} {"train_loss": -6.182043075561523, "global_step": 76580, "epoch": 1823} {"train_loss": -5.962467193603516, "global_step": 76581, "epoch": 1823} {"train_loss": -6.158050060272217, "global_step": 76582, "epoch": 1823} {"train_loss": -6.119945526123047, "global_step": 76583, "epoch": 1823} {"train_loss": -6.167559623718262, "global_step": 76584, "epoch": 1823} {"train_loss": -6.128351211547852, "global_step": 76585, "epoch": 1823} {"train_loss": -6.163717269897461, "global_step": 76586, "epoch": 1823} {"train_loss": -6.163274765014648, "global_step": 76587, "epoch": 1823} {"train_loss": -6.147709369659424, "global_step": 76588, "epoch": 1823} {"train_loss": -6.1171417236328125, "global_step": 76589, "epoch": 1823} {"train_loss": -6.128525733947754, "global_step": 76590, "epoch": 1823} {"train_loss": -6.079420566558838, "global_step": 76591, "epoch": 1823} {"train_loss": -6.175062656402588, "global_step": 76592, "epoch": 1823} {"train_loss": -6.06748104095459, "global_step": 76593, "epoch": 1823} {"train_loss": -6.028616905212402, "global_step": 76594, "epoch": 1823} {"train_loss": -6.096747398376465, "global_step": 76595, "epoch": 1823} {"train_loss": -6.157306671142578, "global_step": 76596, "epoch": 1823} {"train_loss": -6.183492660522461, "global_step": 76597, "epoch": 1823} {"train_loss": -6.015939235687256, "global_step": 76598, "epoch": 1823} {"train_loss": -6.058315277099609, "global_step": 76599, "epoch": 1823} {"train_loss": -6.118386268615723, "global_step": 76600, "epoch": 1823} {"train_loss": -6.060988903045654, "global_step": 76601, "epoch": 1823} {"train_loss": -6.012351989746094, "global_step": 76602, "epoch": 1823} {"train_loss": -6.17810583114624, "global_step": 76603, "epoch": 1823} {"train_loss": -6.032962322235107, "global_step": 76604, "epoch": 1823} {"train_loss": -6.00189208984375, "global_step": 76605, "epoch": 1823} {"train_loss": -6.034433364868164, "global_step": 76606, "epoch": 1823} {"train_loss": -6.096884682064965, "global_step": 76607, "epoch": 1823, "val_loss": 61906.5859375} {"train_loss": -6.097987651824951, "global_step": 76608, "epoch": 1824} {"train_loss": -5.996109485626221, "global_step": 76609, "epoch": 1824} {"train_loss": -6.068241119384766, "global_step": 76610, "epoch": 1824} {"train_loss": -6.070615291595459, "global_step": 76611, "epoch": 1824} {"train_loss": -5.853633880615234, "global_step": 76612, "epoch": 1824} {"train_loss": -6.042226791381836, "global_step": 76613, "epoch": 1824} {"train_loss": -6.141472816467285, "global_step": 76614, "epoch": 1824} {"train_loss": -6.104849815368652, "global_step": 76615, "epoch": 1824} {"train_loss": -6.03800106048584, "global_step": 76616, "epoch": 1824} {"train_loss": -6.068599700927734, "global_step": 76617, "epoch": 1824} {"train_loss": -6.012256622314453, "global_step": 76618, "epoch": 1824} {"train_loss": -5.976099967956543, "global_step": 76619, "epoch": 1824} {"train_loss": -6.048515319824219, "global_step": 76620, "epoch": 1824} {"train_loss": -5.899436950683594, "global_step": 76621, "epoch": 1824} {"train_loss": -6.148652076721191, "global_step": 76622, "epoch": 1824} {"train_loss": -6.003790855407715, "global_step": 76623, "epoch": 1824} {"train_loss": -6.119709014892578, "global_step": 76624, "epoch": 1824} {"train_loss": -6.04727840423584, "global_step": 76625, "epoch": 1824} {"train_loss": -6.142371654510498, "global_step": 76626, "epoch": 1824} {"train_loss": -6.071968078613281, "global_step": 76627, "epoch": 1824} {"train_loss": -6.1266632080078125, "global_step": 76628, "epoch": 1824} {"train_loss": -6.104940891265869, "global_step": 76629, "epoch": 1824} {"train_loss": -6.030879974365234, "global_step": 76630, "epoch": 1824} {"train_loss": -6.11649751663208, "global_step": 76631, "epoch": 1824} {"train_loss": -6.0943603515625, "global_step": 76632, "epoch": 1824} {"train_loss": -6.166478633880615, "global_step": 76633, "epoch": 1824} {"train_loss": -6.042571067810059, "global_step": 76634, "epoch": 1824} {"train_loss": -6.127606391906738, "global_step": 76635, "epoch": 1824} {"train_loss": -6.0483269691467285, "global_step": 76636, "epoch": 1824} {"train_loss": -6.061352252960205, "global_step": 76637, "epoch": 1824} {"train_loss": -5.996085166931152, "global_step": 76638, "epoch": 1824} {"train_loss": -6.07574987411499, "global_step": 76639, "epoch": 1824} {"train_loss": -6.142981052398682, "global_step": 76640, "epoch": 1824} {"train_loss": -6.112060070037842, "global_step": 76641, "epoch": 1824} {"train_loss": -6.0736083984375, "global_step": 76642, "epoch": 1824} {"train_loss": -6.167380332946777, "global_step": 76643, "epoch": 1824} {"train_loss": -5.868533134460449, "global_step": 76644, "epoch": 1824} {"train_loss": -6.186075687408447, "global_step": 76645, "epoch": 1824} {"train_loss": -6.02096700668335, "global_step": 76646, "epoch": 1824} {"train_loss": -5.97641658782959, "global_step": 76647, "epoch": 1824} {"train_loss": -6.142891883850098, "global_step": 76648, "epoch": 1824} {"train_loss": -6.065735794249035, "global_step": 76649, "epoch": 1824, "val_loss": 62170.953125} {"train_loss": -6.079603672027588, "global_step": 76650, "epoch": 1825} {"train_loss": -6.1465535163879395, "global_step": 76651, "epoch": 1825} {"train_loss": -6.131244659423828, "global_step": 76652, "epoch": 1825} {"train_loss": -6.115306854248047, "global_step": 76653, "epoch": 1825} {"train_loss": -6.057873725891113, "global_step": 76654, "epoch": 1825} {"train_loss": -6.070193290710449, "global_step": 76655, "epoch": 1825} {"train_loss": -6.191164016723633, "global_step": 76656, "epoch": 1825} {"train_loss": -6.1955437660217285, "global_step": 76657, "epoch": 1825} {"train_loss": -6.072725772857666, "global_step": 76658, "epoch": 1825} {"train_loss": -6.178281784057617, "global_step": 76659, "epoch": 1825} {"train_loss": -6.102908611297607, "global_step": 76660, "epoch": 1825} {"train_loss": -6.169240951538086, "global_step": 76661, "epoch": 1825} {"train_loss": -6.0347723960876465, "global_step": 76662, "epoch": 1825} {"train_loss": -5.999340057373047, "global_step": 76663, "epoch": 1825} {"train_loss": -6.07523775100708, "global_step": 76664, "epoch": 1825} {"train_loss": -6.032846927642822, "global_step": 76665, "epoch": 1825} {"train_loss": -6.029919624328613, "global_step": 76666, "epoch": 1825} {"train_loss": -6.124032020568848, "global_step": 76667, "epoch": 1825} {"train_loss": -6.115168571472168, "global_step": 76668, "epoch": 1825} {"train_loss": -6.193830490112305, "global_step": 76669, "epoch": 1825} {"train_loss": -6.097739219665527, "global_step": 76670, "epoch": 1825} {"train_loss": -6.064085006713867, "global_step": 76671, "epoch": 1825} {"train_loss": -6.1402082443237305, "global_step": 76672, "epoch": 1825} {"train_loss": -6.145855903625488, "global_step": 76673, "epoch": 1825} {"train_loss": -6.163429260253906, "global_step": 76674, "epoch": 1825} {"train_loss": -5.989948272705078, "global_step": 76675, "epoch": 1825} {"train_loss": -6.149139404296875, "global_step": 76676, "epoch": 1825} {"train_loss": -6.0554304122924805, "global_step": 76677, "epoch": 1825} {"train_loss": -6.190382480621338, "global_step": 76678, "epoch": 1825} {"train_loss": -6.015591621398926, "global_step": 76679, "epoch": 1825} {"train_loss": -6.011633396148682, "global_step": 76680, "epoch": 1825} {"train_loss": -6.066696643829346, "global_step": 76681, "epoch": 1825} {"train_loss": -5.97293758392334, "global_step": 76682, "epoch": 1825} {"train_loss": -6.111741065979004, "global_step": 76683, "epoch": 1825} {"train_loss": -6.1063385009765625, "global_step": 76684, "epoch": 1825} {"train_loss": -6.117718696594238, "global_step": 76685, "epoch": 1825} {"train_loss": -6.152422904968262, "global_step": 76686, "epoch": 1825} {"train_loss": -6.258586883544922, "global_step": 76687, "epoch": 1825} {"train_loss": -6.107428073883057, "global_step": 76688, "epoch": 1825} {"train_loss": -6.16762113571167, "global_step": 76689, "epoch": 1825} {"train_loss": -5.977016448974609, "global_step": 76690, "epoch": 1825} {"train_loss": -6.103171541577294, "global_step": 76691, "epoch": 1825, "val_loss": 62147.25390625} {"train_loss": -6.028839588165283, "global_step": 76692, "epoch": 1826} {"train_loss": -6.018993377685547, "global_step": 76693, "epoch": 1826} {"train_loss": -6.074084758758545, "global_step": 76694, "epoch": 1826} {"train_loss": -6.165724754333496, "global_step": 76695, "epoch": 1826} {"train_loss": -6.136599540710449, "global_step": 76696, "epoch": 1826} {"train_loss": -6.143340110778809, "global_step": 76697, "epoch": 1826} {"train_loss": -6.11322546005249, "global_step": 76698, "epoch": 1826} {"train_loss": -6.113901138305664, "global_step": 76699, "epoch": 1826} {"train_loss": -6.026512145996094, "global_step": 76700, "epoch": 1826} {"train_loss": -6.129981994628906, "global_step": 76701, "epoch": 1826} {"train_loss": -5.994596004486084, "global_step": 76702, "epoch": 1826} {"train_loss": -6.107810974121094, "global_step": 76703, "epoch": 1826} {"train_loss": -6.222476005554199, "global_step": 76704, "epoch": 1826} {"train_loss": -6.112200736999512, "global_step": 76705, "epoch": 1826} {"train_loss": -6.127817630767822, "global_step": 76706, "epoch": 1826} {"train_loss": -6.059919834136963, "global_step": 76707, "epoch": 1826} {"train_loss": -6.129495620727539, "global_step": 76708, "epoch": 1826} {"train_loss": -6.161563396453857, "global_step": 76709, "epoch": 1826} {"train_loss": -6.229276180267334, "global_step": 76710, "epoch": 1826} {"train_loss": -6.197023868560791, "global_step": 76711, "epoch": 1826} {"train_loss": -6.037722587585449, "global_step": 76712, "epoch": 1826} {"train_loss": -6.169261932373047, "global_step": 76713, "epoch": 1826} {"train_loss": -6.250845432281494, "global_step": 76714, "epoch": 1826} {"train_loss": -6.135320663452148, "global_step": 76715, "epoch": 1826} {"train_loss": -6.186953067779541, "global_step": 76716, "epoch": 1826} {"train_loss": -6.10234260559082, "global_step": 76717, "epoch": 1826} {"train_loss": -6.086609363555908, "global_step": 76718, "epoch": 1826} {"train_loss": -6.032042026519775, "global_step": 76719, "epoch": 1826} {"train_loss": -6.1461591720581055, "global_step": 76720, "epoch": 1826} {"train_loss": -6.134454727172852, "global_step": 76721, "epoch": 1826} {"train_loss": -6.103607177734375, "global_step": 76722, "epoch": 1826} {"train_loss": -6.201180458068848, "global_step": 76723, "epoch": 1826} {"train_loss": -6.201302528381348, "global_step": 76724, "epoch": 1826} {"train_loss": -6.1928253173828125, "global_step": 76725, "epoch": 1826} {"train_loss": -6.124399185180664, "global_step": 76726, "epoch": 1826} {"train_loss": -6.0801682472229, "global_step": 76727, "epoch": 1826} {"train_loss": -6.187085151672363, "global_step": 76728, "epoch": 1826} {"train_loss": -6.164176940917969, "global_step": 76729, "epoch": 1826} {"train_loss": -6.013578414916992, "global_step": 76730, "epoch": 1826} {"train_loss": -6.148629188537598, "global_step": 76731, "epoch": 1826} {"train_loss": -6.170855522155762, "global_step": 76732, "epoch": 1826} {"train_loss": -6.124090751012166, "global_step": 76733, "epoch": 1826, "val_loss": 61833.94921875} {"train_loss": -6.0701117515563965, "global_step": 76734, "epoch": 1827} {"train_loss": -6.1768927574157715, "global_step": 76735, "epoch": 1827} {"train_loss": -6.088399887084961, "global_step": 76736, "epoch": 1827} {"train_loss": -6.08515739440918, "global_step": 76737, "epoch": 1827} {"train_loss": -6.250888347625732, "global_step": 76738, "epoch": 1827} {"train_loss": -6.17110538482666, "global_step": 76739, "epoch": 1827} {"train_loss": -6.175983428955078, "global_step": 76740, "epoch": 1827} {"train_loss": -6.173447608947754, "global_step": 76741, "epoch": 1827} {"train_loss": -5.991827964782715, "global_step": 76742, "epoch": 1827} {"train_loss": -6.05135440826416, "global_step": 76743, "epoch": 1827} {"train_loss": -6.09632682800293, "global_step": 76744, "epoch": 1827} {"train_loss": -6.100100040435791, "global_step": 76745, "epoch": 1827} {"train_loss": -6.086451530456543, "global_step": 76746, "epoch": 1827} {"train_loss": -6.191839218139648, "global_step": 76747, "epoch": 1827} {"train_loss": -6.218167304992676, "global_step": 76748, "epoch": 1827} {"train_loss": -6.128944396972656, "global_step": 76749, "epoch": 1827} {"train_loss": -6.142427444458008, "global_step": 76750, "epoch": 1827} {"train_loss": -6.090216636657715, "global_step": 76751, "epoch": 1827} {"train_loss": -6.192707061767578, "global_step": 76752, "epoch": 1827} {"train_loss": -6.182541847229004, "global_step": 76753, "epoch": 1827} {"train_loss": -6.060492038726807, "global_step": 76754, "epoch": 1827} {"train_loss": -6.139991760253906, "global_step": 76755, "epoch": 1827} {"train_loss": -6.180294990539551, "global_step": 76756, "epoch": 1827} {"train_loss": -6.11381721496582, "global_step": 76757, "epoch": 1827} {"train_loss": -6.119792461395264, "global_step": 76758, "epoch": 1827} {"train_loss": -6.241063117980957, "global_step": 76759, "epoch": 1827} {"train_loss": -6.0720367431640625, "global_step": 76760, "epoch": 1827} {"train_loss": -6.173447608947754, "global_step": 76761, "epoch": 1827} {"train_loss": -6.042851448059082, "global_step": 76762, "epoch": 1827} {"train_loss": -6.139256954193115, "global_step": 76763, "epoch": 1827} {"train_loss": -6.067509651184082, "global_step": 76764, "epoch": 1827} {"train_loss": -6.009341716766357, "global_step": 76765, "epoch": 1827} {"train_loss": -6.050378799438477, "global_step": 76766, "epoch": 1827} {"train_loss": -6.131894111633301, "global_step": 76767, "epoch": 1827} {"train_loss": -6.013765811920166, "global_step": 76768, "epoch": 1827} {"train_loss": -6.163022041320801, "global_step": 76769, "epoch": 1827} {"train_loss": -6.102866172790527, "global_step": 76770, "epoch": 1827} {"train_loss": -6.100451469421387, "global_step": 76771, "epoch": 1827} {"train_loss": -6.143866062164307, "global_step": 76772, "epoch": 1827} {"train_loss": -6.167784690856934, "global_step": 76773, "epoch": 1827} {"train_loss": -6.024476051330566, "global_step": 76774, "epoch": 1827} {"train_loss": -6.119217622847784, "global_step": 76775, "epoch": 1827, "val_loss": 62126.33984375} {"train_loss": -6.129642009735107, "global_step": 76776, "epoch": 1828} {"train_loss": -6.000556945800781, "global_step": 76777, "epoch": 1828} {"train_loss": -6.175809860229492, "global_step": 76778, "epoch": 1828} {"train_loss": -6.038066387176514, "global_step": 76779, "epoch": 1828} {"train_loss": -6.086623191833496, "global_step": 76780, "epoch": 1828} {"train_loss": -6.186212539672852, "global_step": 76781, "epoch": 1828} {"train_loss": -6.061519145965576, "global_step": 76782, "epoch": 1828} {"train_loss": -6.059099197387695, "global_step": 76783, "epoch": 1828} {"train_loss": -5.989075660705566, "global_step": 76784, "epoch": 1828} {"train_loss": -6.348601818084717, "global_step": 76785, "epoch": 1828} {"train_loss": -6.080726623535156, "global_step": 76786, "epoch": 1828} {"train_loss": -6.127792835235596, "global_step": 76787, "epoch": 1828} {"train_loss": -6.229439735412598, "global_step": 76788, "epoch": 1828} {"train_loss": -6.140936851501465, "global_step": 76789, "epoch": 1828} {"train_loss": -6.183617115020752, "global_step": 76790, "epoch": 1828} {"train_loss": -6.197359561920166, "global_step": 76791, "epoch": 1828} {"train_loss": -6.044613838195801, "global_step": 76792, "epoch": 1828} {"train_loss": -6.156519889831543, "global_step": 76793, "epoch": 1828} {"train_loss": -6.183545112609863, "global_step": 76794, "epoch": 1828} {"train_loss": -5.965415000915527, "global_step": 76795, "epoch": 1828} {"train_loss": -6.150585174560547, "global_step": 76796, "epoch": 1828} {"train_loss": -5.9754109382629395, "global_step": 76797, "epoch": 1828} {"train_loss": -6.137290000915527, "global_step": 76798, "epoch": 1828} {"train_loss": -6.204817295074463, "global_step": 76799, "epoch": 1828} {"train_loss": -6.050124168395996, "global_step": 76800, "epoch": 1828} {"train_loss": -6.00416374206543, "global_step": 76801, "epoch": 1828} {"train_loss": -6.096745491027832, "global_step": 76802, "epoch": 1828} {"train_loss": -6.038517475128174, "global_step": 76803, "epoch": 1828} {"train_loss": -6.1777801513671875, "global_step": 76804, "epoch": 1828} {"train_loss": -6.147182464599609, "global_step": 76805, "epoch": 1828} {"train_loss": -6.034599304199219, "global_step": 76806, "epoch": 1828} {"train_loss": -6.203381061553955, "global_step": 76807, "epoch": 1828} {"train_loss": -5.906881809234619, "global_step": 76808, "epoch": 1828} {"train_loss": -6.138801574707031, "global_step": 76809, "epoch": 1828} {"train_loss": -6.042015075683594, "global_step": 76810, "epoch": 1828} {"train_loss": -6.070890426635742, "global_step": 76811, "epoch": 1828} {"train_loss": -6.094531059265137, "global_step": 76812, "epoch": 1828} {"train_loss": -6.091222286224365, "global_step": 76813, "epoch": 1828} {"train_loss": -6.112258434295654, "global_step": 76814, "epoch": 1828} {"train_loss": -6.114253044128418, "global_step": 76815, "epoch": 1828} {"train_loss": -6.001253128051758, "global_step": 76816, "epoch": 1828} {"train_loss": -6.099669694900513, "global_step": 76817, "epoch": 1828, "val_loss": 62171.0390625} {"train_loss": -6.131433486938477, "global_step": 76818, "epoch": 1829} {"train_loss": -6.047859191894531, "global_step": 76819, "epoch": 1829} {"train_loss": -6.034445762634277, "global_step": 76820, "epoch": 1829} {"train_loss": -6.256502151489258, "global_step": 76821, "epoch": 1829} {"train_loss": -6.08357048034668, "global_step": 76822, "epoch": 1829} {"train_loss": -6.027524948120117, "global_step": 76823, "epoch": 1829} {"train_loss": -6.19096565246582, "global_step": 76824, "epoch": 1829} {"train_loss": -5.988947868347168, "global_step": 76825, "epoch": 1829} {"train_loss": -6.122417449951172, "global_step": 76826, "epoch": 1829} {"train_loss": -5.99018669128418, "global_step": 76827, "epoch": 1829} {"train_loss": -6.10396671295166, "global_step": 76828, "epoch": 1829} {"train_loss": -5.990993022918701, "global_step": 76829, "epoch": 1829} {"train_loss": -6.06178617477417, "global_step": 76830, "epoch": 1829} {"train_loss": -5.939083099365234, "global_step": 76831, "epoch": 1829} {"train_loss": -6.077220916748047, "global_step": 76832, "epoch": 1829} {"train_loss": -6.052621364593506, "global_step": 76833, "epoch": 1829} {"train_loss": -6.113219261169434, "global_step": 76834, "epoch": 1829} {"train_loss": -6.098609924316406, "global_step": 76835, "epoch": 1829} {"train_loss": -6.127447605133057, "global_step": 76836, "epoch": 1829} {"train_loss": -6.032751083374023, "global_step": 76837, "epoch": 1829} {"train_loss": -6.135481834411621, "global_step": 76838, "epoch": 1829} {"train_loss": -6.224177360534668, "global_step": 76839, "epoch": 1829} {"train_loss": -6.1075592041015625, "global_step": 76840, "epoch": 1829} {"train_loss": -6.164935111999512, "global_step": 76841, "epoch": 1829} {"train_loss": -6.175195217132568, "global_step": 76842, "epoch": 1829} {"train_loss": -6.164188385009766, "global_step": 76843, "epoch": 1829} {"train_loss": -6.055595397949219, "global_step": 76844, "epoch": 1829} {"train_loss": -6.111259460449219, "global_step": 76845, "epoch": 1829} {"train_loss": -6.116203308105469, "global_step": 76846, "epoch": 1829} {"train_loss": -5.990438461303711, "global_step": 76847, "epoch": 1829} {"train_loss": -6.075651168823242, "global_step": 76848, "epoch": 1829} {"train_loss": -6.155489444732666, "global_step": 76849, "epoch": 1829} {"train_loss": -5.9481000900268555, "global_step": 76850, "epoch": 1829} {"train_loss": -6.119598388671875, "global_step": 76851, "epoch": 1829} {"train_loss": -6.217504501342773, "global_step": 76852, "epoch": 1829} {"train_loss": -6.106959342956543, "global_step": 76853, "epoch": 1829} {"train_loss": -6.0972137451171875, "global_step": 76854, "epoch": 1829} {"train_loss": -6.184542655944824, "global_step": 76855, "epoch": 1829} {"train_loss": -6.141287326812744, "global_step": 76856, "epoch": 1829} {"train_loss": -6.1674485206604, "global_step": 76857, "epoch": 1829} {"train_loss": -6.113392353057861, "global_step": 76858, "epoch": 1829} {"train_loss": -6.100531316938854, "global_step": 76859, "epoch": 1829, "val_loss": 62026.22265625} {"train_loss": -6.215716361999512, "global_step": 76860, "epoch": 1830} {"train_loss": -6.009114742279053, "global_step": 76861, "epoch": 1830} {"train_loss": -6.288082122802734, "global_step": 76862, "epoch": 1830} {"train_loss": -6.014526844024658, "global_step": 76863, "epoch": 1830} {"train_loss": -6.191410541534424, "global_step": 76864, "epoch": 1830} {"train_loss": -6.231845855712891, "global_step": 76865, "epoch": 1830} {"train_loss": -6.075481414794922, "global_step": 76866, "epoch": 1830} {"train_loss": -6.117032051086426, "global_step": 76867, "epoch": 1830} {"train_loss": -6.1450700759887695, "global_step": 76868, "epoch": 1830} {"train_loss": -6.0923590660095215, "global_step": 76869, "epoch": 1830} {"train_loss": -6.123302459716797, "global_step": 76870, "epoch": 1830} {"train_loss": -6.180960655212402, "global_step": 76871, "epoch": 1830} {"train_loss": -6.212133884429932, "global_step": 76872, "epoch": 1830} {"train_loss": -6.12972354888916, "global_step": 76873, "epoch": 1830} {"train_loss": -6.086300373077393, "global_step": 76874, "epoch": 1830} {"train_loss": -6.158137798309326, "global_step": 76875, "epoch": 1830} {"train_loss": -6.096253871917725, "global_step": 76876, "epoch": 1830} {"train_loss": -6.166780471801758, "global_step": 76877, "epoch": 1830} {"train_loss": -6.135815620422363, "global_step": 76878, "epoch": 1830} {"train_loss": -6.233929634094238, "global_step": 76879, "epoch": 1830} {"train_loss": -5.996450424194336, "global_step": 76880, "epoch": 1830} {"train_loss": -6.210860729217529, "global_step": 76881, "epoch": 1830} {"train_loss": -6.144708156585693, "global_step": 76882, "epoch": 1830} {"train_loss": -6.152266025543213, "global_step": 76883, "epoch": 1830} {"train_loss": -6.191476821899414, "global_step": 76884, "epoch": 1830} {"train_loss": -6.034460067749023, "global_step": 76885, "epoch": 1830} {"train_loss": -6.042764663696289, "global_step": 76886, "epoch": 1830} {"train_loss": -6.236288070678711, "global_step": 76887, "epoch": 1830} {"train_loss": -6.203402519226074, "global_step": 76888, "epoch": 1830} {"train_loss": -6.081485271453857, "global_step": 76889, "epoch": 1830} {"train_loss": -6.098286151885986, "global_step": 76890, "epoch": 1830} {"train_loss": -6.130002975463867, "global_step": 76891, "epoch": 1830} {"train_loss": -6.113644123077393, "global_step": 76892, "epoch": 1830} {"train_loss": -6.221737861633301, "global_step": 76893, "epoch": 1830} {"train_loss": -5.969701766967773, "global_step": 76894, "epoch": 1830} {"train_loss": -6.202535152435303, "global_step": 76895, "epoch": 1830} {"train_loss": -6.073451995849609, "global_step": 76896, "epoch": 1830} {"train_loss": -6.160172462463379, "global_step": 76897, "epoch": 1830} {"train_loss": -6.090090751647949, "global_step": 76898, "epoch": 1830} {"train_loss": -6.177734375, "global_step": 76899, "epoch": 1830} {"train_loss": -6.065596580505371, "global_step": 76900, "epoch": 1830} {"train_loss": -6.132957640148344, "global_step": 76901, "epoch": 1830, "val_loss": 62117.5703125} {"train_loss": -6.147132873535156, "global_step": 76902, "epoch": 1831} {"train_loss": -6.135410785675049, "global_step": 76903, "epoch": 1831} {"train_loss": -6.0231781005859375, "global_step": 76904, "epoch": 1831} {"train_loss": -6.112865447998047, "global_step": 76905, "epoch": 1831} {"train_loss": -6.129148006439209, "global_step": 76906, "epoch": 1831} {"train_loss": -6.265875816345215, "global_step": 76907, "epoch": 1831} {"train_loss": -6.174222469329834, "global_step": 76908, "epoch": 1831} {"train_loss": -6.075738906860352, "global_step": 76909, "epoch": 1831} {"train_loss": -6.259756565093994, "global_step": 76910, "epoch": 1831} {"train_loss": -6.110790252685547, "global_step": 76911, "epoch": 1831} {"train_loss": -6.133838176727295, "global_step": 76912, "epoch": 1831} {"train_loss": -6.099040985107422, "global_step": 76913, "epoch": 1831} {"train_loss": -6.139286041259766, "global_step": 76914, "epoch": 1831} {"train_loss": -6.089625358581543, "global_step": 76915, "epoch": 1831} {"train_loss": -6.098384857177734, "global_step": 76916, "epoch": 1831} {"train_loss": -6.057254791259766, "global_step": 76917, "epoch": 1831} {"train_loss": -6.104828357696533, "global_step": 76918, "epoch": 1831} {"train_loss": -6.1996660232543945, "global_step": 76919, "epoch": 1831} {"train_loss": -6.144283771514893, "global_step": 76920, "epoch": 1831} {"train_loss": -6.159876823425293, "global_step": 76921, "epoch": 1831} {"train_loss": -6.0825090408325195, "global_step": 76922, "epoch": 1831} {"train_loss": -6.063363552093506, "global_step": 76923, "epoch": 1831} {"train_loss": -6.113625526428223, "global_step": 76924, "epoch": 1831} {"train_loss": -5.975571632385254, "global_step": 76925, "epoch": 1831} {"train_loss": -6.053623676300049, "global_step": 76926, "epoch": 1831} {"train_loss": -5.995203971862793, "global_step": 76927, "epoch": 1831} {"train_loss": -6.001816272735596, "global_step": 76928, "epoch": 1831} {"train_loss": -6.183795928955078, "global_step": 76929, "epoch": 1831} {"train_loss": -6.014598846435547, "global_step": 76930, "epoch": 1831} {"train_loss": -6.079990386962891, "global_step": 76931, "epoch": 1831} {"train_loss": -6.105168342590332, "global_step": 76932, "epoch": 1831} {"train_loss": -6.065245628356934, "global_step": 76933, "epoch": 1831} {"train_loss": -6.040691375732422, "global_step": 76934, "epoch": 1831} {"train_loss": -6.0882978439331055, "global_step": 76935, "epoch": 1831} {"train_loss": -6.164302825927734, "global_step": 76936, "epoch": 1831} {"train_loss": -6.117547035217285, "global_step": 76937, "epoch": 1831} {"train_loss": -6.196019172668457, "global_step": 76938, "epoch": 1831} {"train_loss": -6.042628288269043, "global_step": 76939, "epoch": 1831} {"train_loss": -6.095550537109375, "global_step": 76940, "epoch": 1831} {"train_loss": -6.180309295654297, "global_step": 76941, "epoch": 1831} {"train_loss": -6.197610378265381, "global_step": 76942, "epoch": 1831} {"train_loss": -6.111316646848406, "global_step": 76943, "epoch": 1831, "val_loss": 61989.5} {"train_loss": -6.1986470222473145, "global_step": 76944, "epoch": 1832} {"train_loss": -6.139894962310791, "global_step": 76945, "epoch": 1832} {"train_loss": -6.028083801269531, "global_step": 76946, "epoch": 1832} {"train_loss": -6.194341659545898, "global_step": 76947, "epoch": 1832} {"train_loss": -6.108654499053955, "global_step": 76948, "epoch": 1832} {"train_loss": -6.185498237609863, "global_step": 76949, "epoch": 1832} {"train_loss": -6.1068220138549805, "global_step": 76950, "epoch": 1832} {"train_loss": -6.130214214324951, "global_step": 76951, "epoch": 1832} {"train_loss": -6.0109357833862305, "global_step": 76952, "epoch": 1832} {"train_loss": -6.206262588500977, "global_step": 76953, "epoch": 1832} {"train_loss": -6.081064701080322, "global_step": 76954, "epoch": 1832} {"train_loss": -6.124274253845215, "global_step": 76955, "epoch": 1832} {"train_loss": -6.102603912353516, "global_step": 76956, "epoch": 1832} {"train_loss": -5.963467597961426, "global_step": 76957, "epoch": 1832} {"train_loss": -6.134873390197754, "global_step": 76958, "epoch": 1832} {"train_loss": -6.093328952789307, "global_step": 76959, "epoch": 1832} {"train_loss": -6.039161682128906, "global_step": 76960, "epoch": 1832} {"train_loss": -6.078684329986572, "global_step": 76961, "epoch": 1832} {"train_loss": -6.059735298156738, "global_step": 76962, "epoch": 1832} {"train_loss": -6.042636394500732, "global_step": 76963, "epoch": 1832} {"train_loss": -5.984961032867432, "global_step": 76964, "epoch": 1832} {"train_loss": -5.974225997924805, "global_step": 76965, "epoch": 1832} {"train_loss": -6.1406097412109375, "global_step": 76966, "epoch": 1832} {"train_loss": -6.140619277954102, "global_step": 76967, "epoch": 1832} {"train_loss": -6.171631336212158, "global_step": 76968, "epoch": 1832} {"train_loss": -6.13511848449707, "global_step": 76969, "epoch": 1832} {"train_loss": -6.095739841461182, "global_step": 76970, "epoch": 1832} {"train_loss": -6.103752136230469, "global_step": 76971, "epoch": 1832} {"train_loss": -6.140469551086426, "global_step": 76972, "epoch": 1832} {"train_loss": -6.017223358154297, "global_step": 76973, "epoch": 1832} {"train_loss": -6.0274529457092285, "global_step": 76974, "epoch": 1832} {"train_loss": -6.013803005218506, "global_step": 76975, "epoch": 1832} {"train_loss": -5.994424819946289, "global_step": 76976, "epoch": 1832} {"train_loss": -6.137557029724121, "global_step": 76977, "epoch": 1832} {"train_loss": -6.085217475891113, "global_step": 76978, "epoch": 1832} {"train_loss": -6.038923740386963, "global_step": 76979, "epoch": 1832} {"train_loss": -6.074129104614258, "global_step": 76980, "epoch": 1832} {"train_loss": -6.037773132324219, "global_step": 76981, "epoch": 1832} {"train_loss": -5.985278606414795, "global_step": 76982, "epoch": 1832} {"train_loss": -6.080302715301514, "global_step": 76983, "epoch": 1832} {"train_loss": -6.020214557647705, "global_step": 76984, "epoch": 1832} {"train_loss": -6.082481804348173, "global_step": 76985, "epoch": 1832, "val_loss": 62156.5390625} {"train_loss": -6.170921325683594, "global_step": 76986, "epoch": 1833} {"train_loss": -6.0217695236206055, "global_step": 76987, "epoch": 1833} {"train_loss": -6.1245927810668945, "global_step": 76988, "epoch": 1833} {"train_loss": -6.067584991455078, "global_step": 76989, "epoch": 1833} {"train_loss": -6.114608287811279, "global_step": 76990, "epoch": 1833} {"train_loss": -6.064037322998047, "global_step": 76991, "epoch": 1833} {"train_loss": -6.066489219665527, "global_step": 76992, "epoch": 1833} {"train_loss": -6.095353126525879, "global_step": 76993, "epoch": 1833} {"train_loss": -6.057430267333984, "global_step": 76994, "epoch": 1833} {"train_loss": -6.113708019256592, "global_step": 76995, "epoch": 1833} {"train_loss": -6.152907848358154, "global_step": 76996, "epoch": 1833} {"train_loss": -6.010928153991699, "global_step": 76997, "epoch": 1833} {"train_loss": -6.017903804779053, "global_step": 76998, "epoch": 1833} {"train_loss": -6.13936710357666, "global_step": 76999, "epoch": 1833} {"train_loss": -5.998417377471924, "global_step": 77000, "epoch": 1833} {"train_loss": -6.162353515625, "global_step": 77001, "epoch": 1833} {"train_loss": -6.112847328186035, "global_step": 77002, "epoch": 1833} {"train_loss": -6.009953498840332, "global_step": 77003, "epoch": 1833} {"train_loss": -6.044219017028809, "global_step": 77004, "epoch": 1833} {"train_loss": -6.114691734313965, "global_step": 77005, "epoch": 1833} {"train_loss": -5.996702194213867, "global_step": 77006, "epoch": 1833} {"train_loss": -6.121334075927734, "global_step": 77007, "epoch": 1833} {"train_loss": -6.103266716003418, "global_step": 77008, "epoch": 1833} {"train_loss": -5.8981122970581055, "global_step": 77009, "epoch": 1833} {"train_loss": -6.056887626647949, "global_step": 77010, "epoch": 1833} {"train_loss": -6.067048072814941, "global_step": 77011, "epoch": 1833} {"train_loss": -5.973875045776367, "global_step": 77012, "epoch": 1833} {"train_loss": -6.117849349975586, "global_step": 77013, "epoch": 1833} {"train_loss": -6.0431108474731445, "global_step": 77014, "epoch": 1833} {"train_loss": -6.042813301086426, "global_step": 77015, "epoch": 1833} {"train_loss": -6.007268905639648, "global_step": 77016, "epoch": 1833} {"train_loss": -6.081158638000488, "global_step": 77017, "epoch": 1833} {"train_loss": -6.07096004486084, "global_step": 77018, "epoch": 1833} {"train_loss": -6.1954569816589355, "global_step": 77019, "epoch": 1833} {"train_loss": -6.101871490478516, "global_step": 77020, "epoch": 1833} {"train_loss": -6.094054222106934, "global_step": 77021, "epoch": 1833} {"train_loss": -6.022405624389648, "global_step": 77022, "epoch": 1833} {"train_loss": -6.126496315002441, "global_step": 77023, "epoch": 1833} {"train_loss": -6.213801383972168, "global_step": 77024, "epoch": 1833} {"train_loss": -5.971057891845703, "global_step": 77025, "epoch": 1833} {"train_loss": -6.140861511230469, "global_step": 77026, "epoch": 1833} {"train_loss": -6.078821976979573, "global_step": 77027, "epoch": 1833, "val_loss": 62208.1640625} {"train_loss": -6.114633560180664, "global_step": 77028, "epoch": 1834} {"train_loss": -5.959781646728516, "global_step": 77029, "epoch": 1834} {"train_loss": -6.03639030456543, "global_step": 77030, "epoch": 1834} {"train_loss": -6.051934242248535, "global_step": 77031, "epoch": 1834} {"train_loss": -6.172152996063232, "global_step": 77032, "epoch": 1834} {"train_loss": -6.163278579711914, "global_step": 77033, "epoch": 1834} {"train_loss": -6.058810234069824, "global_step": 77034, "epoch": 1834} {"train_loss": -6.009765148162842, "global_step": 77035, "epoch": 1834} {"train_loss": -6.024783611297607, "global_step": 77036, "epoch": 1834} {"train_loss": -6.095268726348877, "global_step": 77037, "epoch": 1834} {"train_loss": -6.051060199737549, "global_step": 77038, "epoch": 1834} {"train_loss": -6.070990085601807, "global_step": 77039, "epoch": 1834} {"train_loss": -6.090945243835449, "global_step": 77040, "epoch": 1834} {"train_loss": -5.993829250335693, "global_step": 77041, "epoch": 1834} {"train_loss": -6.026388645172119, "global_step": 77042, "epoch": 1834} {"train_loss": -5.935581207275391, "global_step": 77043, "epoch": 1834} {"train_loss": -6.182512283325195, "global_step": 77044, "epoch": 1834} {"train_loss": -5.935466289520264, "global_step": 77045, "epoch": 1834} {"train_loss": -6.109103679656982, "global_step": 77046, "epoch": 1834} {"train_loss": -6.052417278289795, "global_step": 77047, "epoch": 1834} {"train_loss": -6.0381269454956055, "global_step": 77048, "epoch": 1834} {"train_loss": -6.030511856079102, "global_step": 77049, "epoch": 1834} {"train_loss": -5.939931869506836, "global_step": 77050, "epoch": 1834} {"train_loss": -6.164361953735352, "global_step": 77051, "epoch": 1834} {"train_loss": -6.013452053070068, "global_step": 77052, "epoch": 1834} {"train_loss": -6.096435546875, "global_step": 77053, "epoch": 1834} {"train_loss": -6.061642646789551, "global_step": 77054, "epoch": 1834} {"train_loss": -6.093018531799316, "global_step": 77055, "epoch": 1834} {"train_loss": -6.210997581481934, "global_step": 77056, "epoch": 1834} {"train_loss": -5.962924957275391, "global_step": 77057, "epoch": 1834} {"train_loss": -6.089436054229736, "global_step": 77058, "epoch": 1834} {"train_loss": -6.081124305725098, "global_step": 77059, "epoch": 1834} {"train_loss": -6.0335774421691895, "global_step": 77060, "epoch": 1834} {"train_loss": -6.115524768829346, "global_step": 77061, "epoch": 1834} {"train_loss": -5.99237060546875, "global_step": 77062, "epoch": 1834} {"train_loss": -6.088018417358398, "global_step": 77063, "epoch": 1834} {"train_loss": -6.089693546295166, "global_step": 77064, "epoch": 1834} {"train_loss": -6.1238603591918945, "global_step": 77065, "epoch": 1834} {"train_loss": -6.212283134460449, "global_step": 77066, "epoch": 1834} {"train_loss": -6.00323486328125, "global_step": 77067, "epoch": 1834} {"train_loss": -5.993987560272217, "global_step": 77068, "epoch": 1834} {"train_loss": -6.060503880182902, "global_step": 77069, "epoch": 1834, "val_loss": 62395.80078125} {"train_loss": -6.108343124389648, "global_step": 77070, "epoch": 1835} {"train_loss": -6.113503456115723, "global_step": 77071, "epoch": 1835} {"train_loss": -6.0523176193237305, "global_step": 77072, "epoch": 1835} {"train_loss": -5.982267379760742, "global_step": 77073, "epoch": 1835} {"train_loss": -6.063988208770752, "global_step": 77074, "epoch": 1835} {"train_loss": -6.116098403930664, "global_step": 77075, "epoch": 1835} {"train_loss": -6.077994346618652, "global_step": 77076, "epoch": 1835} {"train_loss": -6.03420352935791, "global_step": 77077, "epoch": 1835} {"train_loss": -6.182400703430176, "global_step": 77078, "epoch": 1835} {"train_loss": -6.054888725280762, "global_step": 77079, "epoch": 1835} {"train_loss": -6.14273738861084, "global_step": 77080, "epoch": 1835} {"train_loss": -6.042557716369629, "global_step": 77081, "epoch": 1835} {"train_loss": -5.95326042175293, "global_step": 77082, "epoch": 1835} {"train_loss": -6.144792556762695, "global_step": 77083, "epoch": 1835} {"train_loss": -6.162952899932861, "global_step": 77084, "epoch": 1835} {"train_loss": -6.075153350830078, "global_step": 77085, "epoch": 1835} {"train_loss": -6.113862991333008, "global_step": 77086, "epoch": 1835} {"train_loss": -6.1831278800964355, "global_step": 77087, "epoch": 1835} {"train_loss": -6.080966949462891, "global_step": 77088, "epoch": 1835} {"train_loss": -6.099769115447998, "global_step": 77089, "epoch": 1835} {"train_loss": -6.115126609802246, "global_step": 77090, "epoch": 1835} {"train_loss": -6.111758232116699, "global_step": 77091, "epoch": 1835} {"train_loss": -6.082157135009766, "global_step": 77092, "epoch": 1835} {"train_loss": -6.083827972412109, "global_step": 77093, "epoch": 1835} {"train_loss": -6.076848030090332, "global_step": 77094, "epoch": 1835} {"train_loss": -6.094466209411621, "global_step": 77095, "epoch": 1835} {"train_loss": -6.019602298736572, "global_step": 77096, "epoch": 1835} {"train_loss": -5.987015724182129, "global_step": 77097, "epoch": 1835} {"train_loss": -6.110434532165527, "global_step": 77098, "epoch": 1835} {"train_loss": -6.111733913421631, "global_step": 77099, "epoch": 1835} {"train_loss": -5.999347686767578, "global_step": 77100, "epoch": 1835} {"train_loss": -6.206881523132324, "global_step": 77101, "epoch": 1835} {"train_loss": -6.07991886138916, "global_step": 77102, "epoch": 1835} {"train_loss": -6.077495574951172, "global_step": 77103, "epoch": 1835} {"train_loss": -6.125244140625, "global_step": 77104, "epoch": 1835} {"train_loss": -6.134544372558594, "global_step": 77105, "epoch": 1835} {"train_loss": -6.042879581451416, "global_step": 77106, "epoch": 1835} {"train_loss": -6.025390625, "global_step": 77107, "epoch": 1835} {"train_loss": -5.9280500411987305, "global_step": 77108, "epoch": 1835} {"train_loss": -6.088726997375488, "global_step": 77109, "epoch": 1835} {"train_loss": -6.137392997741699, "global_step": 77110, "epoch": 1835} {"train_loss": -6.0818237236567905, "global_step": 77111, "epoch": 1835, "val_loss": 61981.59375} {"train_loss": -5.994077205657959, "global_step": 77112, "epoch": 1836} {"train_loss": -6.13508415222168, "global_step": 77113, "epoch": 1836} {"train_loss": -6.043037414550781, "global_step": 77114, "epoch": 1836} {"train_loss": -6.2415666580200195, "global_step": 77115, "epoch": 1836} {"train_loss": -6.1052117347717285, "global_step": 77116, "epoch": 1836} {"train_loss": -6.173703670501709, "global_step": 77117, "epoch": 1836} {"train_loss": -6.161654472351074, "global_step": 77118, "epoch": 1836} {"train_loss": -6.057401657104492, "global_step": 77119, "epoch": 1836} {"train_loss": -6.077638626098633, "global_step": 77120, "epoch": 1836} {"train_loss": -6.018688201904297, "global_step": 77121, "epoch": 1836} {"train_loss": -6.0787248611450195, "global_step": 77122, "epoch": 1836} {"train_loss": -6.1531243324279785, "global_step": 77123, "epoch": 1836} {"train_loss": -6.181435585021973, "global_step": 77124, "epoch": 1836} {"train_loss": -6.082667827606201, "global_step": 77125, "epoch": 1836} {"train_loss": -6.106646537780762, "global_step": 77126, "epoch": 1836} {"train_loss": -6.121058464050293, "global_step": 77127, "epoch": 1836} {"train_loss": -6.0178680419921875, "global_step": 77128, "epoch": 1836} {"train_loss": -6.164125919342041, "global_step": 77129, "epoch": 1836} {"train_loss": -6.177962303161621, "global_step": 77130, "epoch": 1836} {"train_loss": -6.094378471374512, "global_step": 77131, "epoch": 1836} {"train_loss": -6.245569229125977, "global_step": 77132, "epoch": 1836} {"train_loss": -6.163771629333496, "global_step": 77133, "epoch": 1836} {"train_loss": -6.074199676513672, "global_step": 77134, "epoch": 1836} {"train_loss": -5.967962265014648, "global_step": 77135, "epoch": 1836} {"train_loss": -6.163003921508789, "global_step": 77136, "epoch": 1836} {"train_loss": -6.15908145904541, "global_step": 77137, "epoch": 1836} {"train_loss": -6.142406463623047, "global_step": 77138, "epoch": 1836} {"train_loss": -6.138338088989258, "global_step": 77139, "epoch": 1836} {"train_loss": -6.272265434265137, "global_step": 77140, "epoch": 1836} {"train_loss": -6.220432758331299, "global_step": 77141, "epoch": 1836} {"train_loss": -6.153155326843262, "global_step": 77142, "epoch": 1836} {"train_loss": -6.008892059326172, "global_step": 77143, "epoch": 1836} {"train_loss": -6.105162143707275, "global_step": 77144, "epoch": 1836} {"train_loss": -6.067956924438477, "global_step": 77145, "epoch": 1836} {"train_loss": -6.067649841308594, "global_step": 77146, "epoch": 1836} {"train_loss": -6.273467063903809, "global_step": 77147, "epoch": 1836} {"train_loss": -6.174497604370117, "global_step": 77148, "epoch": 1836} {"train_loss": -6.147407531738281, "global_step": 77149, "epoch": 1836} {"train_loss": -6.083729267120361, "global_step": 77150, "epoch": 1836} {"train_loss": -6.032705307006836, "global_step": 77151, "epoch": 1836} {"train_loss": -6.1042680740356445, "global_step": 77152, "epoch": 1836} {"train_loss": -6.119734151022775, "global_step": 77153, "epoch": 1836, "val_loss": 62084.9765625} {"train_loss": -6.175198554992676, "global_step": 77154, "epoch": 1837} {"train_loss": -6.096859931945801, "global_step": 77155, "epoch": 1837} {"train_loss": -6.203804016113281, "global_step": 77156, "epoch": 1837} {"train_loss": -5.947927474975586, "global_step": 77157, "epoch": 1837} {"train_loss": -6.105576038360596, "global_step": 77158, "epoch": 1837} {"train_loss": -6.021561145782471, "global_step": 77159, "epoch": 1837} {"train_loss": -6.183685779571533, "global_step": 77160, "epoch": 1837} {"train_loss": -6.100733280181885, "global_step": 77161, "epoch": 1837} {"train_loss": -6.2028985023498535, "global_step": 77162, "epoch": 1837} {"train_loss": -6.137426376342773, "global_step": 77163, "epoch": 1837} {"train_loss": -6.160927772521973, "global_step": 77164, "epoch": 1837} {"train_loss": -6.192694187164307, "global_step": 77165, "epoch": 1837} {"train_loss": -6.11585807800293, "global_step": 77166, "epoch": 1837} {"train_loss": -6.226088523864746, "global_step": 77167, "epoch": 1837} {"train_loss": -6.0590410232543945, "global_step": 77168, "epoch": 1837} {"train_loss": -6.163846969604492, "global_step": 77169, "epoch": 1837} {"train_loss": -6.0912933349609375, "global_step": 77170, "epoch": 1837} {"train_loss": -6.293509483337402, "global_step": 77171, "epoch": 1837} {"train_loss": -6.130063056945801, "global_step": 77172, "epoch": 1837} {"train_loss": -6.1168413162231445, "global_step": 77173, "epoch": 1837} {"train_loss": -6.028987884521484, "global_step": 77174, "epoch": 1837} {"train_loss": -6.08763313293457, "global_step": 77175, "epoch": 1837} {"train_loss": -6.035694122314453, "global_step": 77176, "epoch": 1837} {"train_loss": -6.097476005554199, "global_step": 77177, "epoch": 1837} {"train_loss": -6.207876682281494, "global_step": 77178, "epoch": 1837} {"train_loss": -6.237166404724121, "global_step": 77179, "epoch": 1837} {"train_loss": -6.166135311126709, "global_step": 77180, "epoch": 1837} {"train_loss": -6.10344123840332, "global_step": 77181, "epoch": 1837} {"train_loss": -6.188764572143555, "global_step": 77182, "epoch": 1837} {"train_loss": -6.1081438064575195, "global_step": 77183, "epoch": 1837} {"train_loss": -6.1513848304748535, "global_step": 77184, "epoch": 1837} {"train_loss": -6.047938346862793, "global_step": 77185, "epoch": 1837} {"train_loss": -6.021699905395508, "global_step": 77186, "epoch": 1837} {"train_loss": -6.1856689453125, "global_step": 77187, "epoch": 1837} {"train_loss": -6.024140357971191, "global_step": 77188, "epoch": 1837} {"train_loss": -6.072178840637207, "global_step": 77189, "epoch": 1837} {"train_loss": -6.037634372711182, "global_step": 77190, "epoch": 1837} {"train_loss": -6.118967056274414, "global_step": 77191, "epoch": 1837} {"train_loss": -6.074962615966797, "global_step": 77192, "epoch": 1837} {"train_loss": -6.107002258300781, "global_step": 77193, "epoch": 1837} {"train_loss": -6.142990589141846, "global_step": 77194, "epoch": 1837} {"train_loss": -6.121448301133656, "global_step": 77195, "epoch": 1837, "val_loss": 62203.5546875} {"train_loss": -6.211982727050781, "global_step": 77196, "epoch": 1838} {"train_loss": -6.140653610229492, "global_step": 77197, "epoch": 1838} {"train_loss": -6.141942977905273, "global_step": 77198, "epoch": 1838} {"train_loss": -6.013341426849365, "global_step": 77199, "epoch": 1838} {"train_loss": -6.240603446960449, "global_step": 77200, "epoch": 1838} {"train_loss": -6.045126914978027, "global_step": 77201, "epoch": 1838} {"train_loss": -6.122433185577393, "global_step": 77202, "epoch": 1838} {"train_loss": -6.064878463745117, "global_step": 77203, "epoch": 1838} {"train_loss": -6.13359260559082, "global_step": 77204, "epoch": 1838} {"train_loss": -6.214481353759766, "global_step": 77205, "epoch": 1838} {"train_loss": -6.093757152557373, "global_step": 77206, "epoch": 1838} {"train_loss": -6.132228851318359, "global_step": 77207, "epoch": 1838} {"train_loss": -6.0893707275390625, "global_step": 77208, "epoch": 1838} {"train_loss": -6.053580284118652, "global_step": 77209, "epoch": 1838} {"train_loss": -6.0351762771606445, "global_step": 77210, "epoch": 1838} {"train_loss": -6.0179524421691895, "global_step": 77211, "epoch": 1838} {"train_loss": -6.181330680847168, "global_step": 77212, "epoch": 1838} {"train_loss": -6.125893592834473, "global_step": 77213, "epoch": 1838} {"train_loss": -6.081627368927002, "global_step": 77214, "epoch": 1838} {"train_loss": -6.201587677001953, "global_step": 77215, "epoch": 1838} {"train_loss": -6.141201019287109, "global_step": 77216, "epoch": 1838} {"train_loss": -6.10736083984375, "global_step": 77217, "epoch": 1838} {"train_loss": -6.073429107666016, "global_step": 77218, "epoch": 1838} {"train_loss": -6.173836708068848, "global_step": 77219, "epoch": 1838} {"train_loss": -6.1279425621032715, "global_step": 77220, "epoch": 1838} {"train_loss": -5.995655059814453, "global_step": 77221, "epoch": 1838} {"train_loss": -6.167403221130371, "global_step": 77222, "epoch": 1838} {"train_loss": -5.925066947937012, "global_step": 77223, "epoch": 1838} {"train_loss": -5.984859466552734, "global_step": 77224, "epoch": 1838} {"train_loss": -6.148967266082764, "global_step": 77225, "epoch": 1838} {"train_loss": -6.010437965393066, "global_step": 77226, "epoch": 1838} {"train_loss": -6.179241180419922, "global_step": 77227, "epoch": 1838} {"train_loss": -6.068031311035156, "global_step": 77228, "epoch": 1838} {"train_loss": -6.019182205200195, "global_step": 77229, "epoch": 1838} {"train_loss": -6.10532808303833, "global_step": 77230, "epoch": 1838} {"train_loss": -6.043654918670654, "global_step": 77231, "epoch": 1838} {"train_loss": -6.048491954803467, "global_step": 77232, "epoch": 1838} {"train_loss": -6.076410293579102, "global_step": 77233, "epoch": 1838} {"train_loss": -6.0168046951293945, "global_step": 77234, "epoch": 1838} {"train_loss": -6.019232273101807, "global_step": 77235, "epoch": 1838} {"train_loss": -6.077609062194824, "global_step": 77236, "epoch": 1838} {"train_loss": -6.090991690045311, "global_step": 77237, "epoch": 1838, "val_loss": 62022.73046875} {"train_loss": -6.17459774017334, "global_step": 77238, "epoch": 1839} {"train_loss": -6.01568078994751, "global_step": 77239, "epoch": 1839} {"train_loss": -6.054257869720459, "global_step": 77240, "epoch": 1839} {"train_loss": -6.058206558227539, "global_step": 77241, "epoch": 1839} {"train_loss": -5.991995811462402, "global_step": 77242, "epoch": 1839} {"train_loss": -5.902291297912598, "global_step": 77243, "epoch": 1839} {"train_loss": -6.054271697998047, "global_step": 77244, "epoch": 1839} {"train_loss": -5.9452290534973145, "global_step": 77245, "epoch": 1839} {"train_loss": -5.977409839630127, "global_step": 77246, "epoch": 1839} {"train_loss": -5.902031421661377, "global_step": 77247, "epoch": 1839} {"train_loss": -5.97557258605957, "global_step": 77248, "epoch": 1839} {"train_loss": -6.100874900817871, "global_step": 77249, "epoch": 1839} {"train_loss": -6.126471519470215, "global_step": 77250, "epoch": 1839} {"train_loss": -6.10471248626709, "global_step": 77251, "epoch": 1839} {"train_loss": -6.077691078186035, "global_step": 77252, "epoch": 1839} {"train_loss": -6.125384330749512, "global_step": 77253, "epoch": 1839} {"train_loss": -6.087201118469238, "global_step": 77254, "epoch": 1839} {"train_loss": -6.002882480621338, "global_step": 77255, "epoch": 1839} {"train_loss": -6.079869747161865, "global_step": 77256, "epoch": 1839} {"train_loss": -6.114257335662842, "global_step": 77257, "epoch": 1839} {"train_loss": -6.036208152770996, "global_step": 77258, "epoch": 1839} {"train_loss": -6.045405387878418, "global_step": 77259, "epoch": 1839} {"train_loss": -6.1038312911987305, "global_step": 77260, "epoch": 1839} {"train_loss": -6.105757713317871, "global_step": 77261, "epoch": 1839} {"train_loss": -6.107857704162598, "global_step": 77262, "epoch": 1839} {"train_loss": -6.06995153427124, "global_step": 77263, "epoch": 1839} {"train_loss": -6.178330421447754, "global_step": 77264, "epoch": 1839} {"train_loss": -6.104128360748291, "global_step": 77265, "epoch": 1839} {"train_loss": -5.981827735900879, "global_step": 77266, "epoch": 1839} {"train_loss": -6.100244045257568, "global_step": 77267, "epoch": 1839} {"train_loss": -6.043329238891602, "global_step": 77268, "epoch": 1839} {"train_loss": -6.030539512634277, "global_step": 77269, "epoch": 1839} {"train_loss": -6.191742897033691, "global_step": 77270, "epoch": 1839} {"train_loss": -6.138947486877441, "global_step": 77271, "epoch": 1839} {"train_loss": -6.156389236450195, "global_step": 77272, "epoch": 1839} {"train_loss": -6.176785469055176, "global_step": 77273, "epoch": 1839} {"train_loss": -6.22314453125, "global_step": 77274, "epoch": 1839} {"train_loss": -6.095452785491943, "global_step": 77275, "epoch": 1839} {"train_loss": -6.170854091644287, "global_step": 77276, "epoch": 1839} {"train_loss": -6.153903007507324, "global_step": 77277, "epoch": 1839} {"train_loss": -6.090939521789551, "global_step": 77278, "epoch": 1839} {"train_loss": -6.078536294755482, "global_step": 77279, "epoch": 1839, "val_loss": 62037.03125} {"train_loss": -6.282769203186035, "global_step": 77280, "epoch": 1840} {"train_loss": -6.232814788818359, "global_step": 77281, "epoch": 1840} {"train_loss": -6.172894477844238, "global_step": 77282, "epoch": 1840} {"train_loss": -6.239872455596924, "global_step": 77283, "epoch": 1840} {"train_loss": -6.118593692779541, "global_step": 77284, "epoch": 1840} {"train_loss": -6.085559844970703, "global_step": 77285, "epoch": 1840} {"train_loss": -6.156668186187744, "global_step": 77286, "epoch": 1840} {"train_loss": -6.2119140625, "global_step": 77287, "epoch": 1840} {"train_loss": -6.047812461853027, "global_step": 77288, "epoch": 1840} {"train_loss": -6.304267883300781, "global_step": 77289, "epoch": 1840} {"train_loss": -6.190295219421387, "global_step": 77290, "epoch": 1840} {"train_loss": -6.133509635925293, "global_step": 77291, "epoch": 1840} {"train_loss": -6.147225379943848, "global_step": 77292, "epoch": 1840} {"train_loss": -6.050251007080078, "global_step": 77293, "epoch": 1840} {"train_loss": -6.151355266571045, "global_step": 77294, "epoch": 1840} {"train_loss": -6.118069648742676, "global_step": 77295, "epoch": 1840} {"train_loss": -6.2005839347839355, "global_step": 77296, "epoch": 1840} {"train_loss": -6.200712203979492, "global_step": 77297, "epoch": 1840} {"train_loss": -6.053118705749512, "global_step": 77298, "epoch": 1840} {"train_loss": -6.196478366851807, "global_step": 77299, "epoch": 1840} {"train_loss": -6.105960845947266, "global_step": 77300, "epoch": 1840} {"train_loss": -6.269457817077637, "global_step": 77301, "epoch": 1840} {"train_loss": -6.101320266723633, "global_step": 77302, "epoch": 1840} {"train_loss": -6.118132591247559, "global_step": 77303, "epoch": 1840} {"train_loss": -6.218051433563232, "global_step": 77304, "epoch": 1840} {"train_loss": -6.064359664916992, "global_step": 77305, "epoch": 1840} {"train_loss": -6.041703701019287, "global_step": 77306, "epoch": 1840} {"train_loss": -6.074807167053223, "global_step": 77307, "epoch": 1840} {"train_loss": -6.125339031219482, "global_step": 77308, "epoch": 1840} {"train_loss": -6.049911022186279, "global_step": 77309, "epoch": 1840} {"train_loss": -6.219437122344971, "global_step": 77310, "epoch": 1840} {"train_loss": -6.02472448348999, "global_step": 77311, "epoch": 1840} {"train_loss": -6.125029563903809, "global_step": 77312, "epoch": 1840} {"train_loss": -6.059835433959961, "global_step": 77313, "epoch": 1840} {"train_loss": -6.113053321838379, "global_step": 77314, "epoch": 1840} {"train_loss": -6.103757381439209, "global_step": 77315, "epoch": 1840} {"train_loss": -6.1138386726379395, "global_step": 77316, "epoch": 1840} {"train_loss": -6.154770374298096, "global_step": 77317, "epoch": 1840} {"train_loss": -6.124883651733398, "global_step": 77318, "epoch": 1840} {"train_loss": -6.147251129150391, "global_step": 77319, "epoch": 1840} {"train_loss": -6.039934158325195, "global_step": 77320, "epoch": 1840} {"train_loss": -6.14024821917216, "global_step": 77321, "epoch": 1840, "val_loss": 62026.203125} {"train_loss": -6.120887279510498, "global_step": 77322, "epoch": 1841} {"train_loss": -6.095963478088379, "global_step": 77323, "epoch": 1841} {"train_loss": -6.206799507141113, "global_step": 77324, "epoch": 1841} {"train_loss": -6.091416835784912, "global_step": 77325, "epoch": 1841} {"train_loss": -6.240697860717773, "global_step": 77326, "epoch": 1841} {"train_loss": -6.145565986633301, "global_step": 77327, "epoch": 1841} {"train_loss": -6.189785957336426, "global_step": 77328, "epoch": 1841} {"train_loss": -6.154308795928955, "global_step": 77329, "epoch": 1841} {"train_loss": -6.19079065322876, "global_step": 77330, "epoch": 1841} {"train_loss": -6.192580699920654, "global_step": 77331, "epoch": 1841} {"train_loss": -6.1097917556762695, "global_step": 77332, "epoch": 1841} {"train_loss": -6.100581169128418, "global_step": 77333, "epoch": 1841} {"train_loss": -6.1806511878967285, "global_step": 77334, "epoch": 1841} {"train_loss": -6.117103099822998, "global_step": 77335, "epoch": 1841} {"train_loss": -6.139365196228027, "global_step": 77336, "epoch": 1841} {"train_loss": -6.1305694580078125, "global_step": 77337, "epoch": 1841} {"train_loss": -6.077663898468018, "global_step": 77338, "epoch": 1841} {"train_loss": -6.160911560058594, "global_step": 77339, "epoch": 1841} {"train_loss": -6.207677841186523, "global_step": 77340, "epoch": 1841} {"train_loss": -6.20068359375, "global_step": 77341, "epoch": 1841} {"train_loss": -6.084415435791016, "global_step": 77342, "epoch": 1841} {"train_loss": -6.224869251251221, "global_step": 77343, "epoch": 1841} {"train_loss": -6.231844902038574, "global_step": 77344, "epoch": 1841} {"train_loss": -6.123967170715332, "global_step": 77345, "epoch": 1841} {"train_loss": -6.077156066894531, "global_step": 77346, "epoch": 1841} {"train_loss": -6.062529563903809, "global_step": 77347, "epoch": 1841} {"train_loss": -6.129004001617432, "global_step": 77348, "epoch": 1841} {"train_loss": -6.104142189025879, "global_step": 77349, "epoch": 1841} {"train_loss": -6.189474105834961, "global_step": 77350, "epoch": 1841} {"train_loss": -6.139307498931885, "global_step": 77351, "epoch": 1841} {"train_loss": -6.1468610763549805, "global_step": 77352, "epoch": 1841} {"train_loss": -6.191327095031738, "global_step": 77353, "epoch": 1841} {"train_loss": -6.130678176879883, "global_step": 77354, "epoch": 1841} {"train_loss": -6.1279168128967285, "global_step": 77355, "epoch": 1841} {"train_loss": -6.257664680480957, "global_step": 77356, "epoch": 1841} {"train_loss": -6.207616806030273, "global_step": 77357, "epoch": 1841} {"train_loss": -6.109923839569092, "global_step": 77358, "epoch": 1841} {"train_loss": -6.095362186431885, "global_step": 77359, "epoch": 1841} {"train_loss": -6.121289253234863, "global_step": 77360, "epoch": 1841} {"train_loss": -6.144845962524414, "global_step": 77361, "epoch": 1841} {"train_loss": -6.178536415100098, "global_step": 77362, "epoch": 1841} {"train_loss": -6.151418458847773, "global_step": 77363, "epoch": 1841, "val_loss": 61898.53125} {"train_loss": -6.056670188903809, "global_step": 77364, "epoch": 1842} {"train_loss": -6.219700813293457, "global_step": 77365, "epoch": 1842} {"train_loss": -6.169246196746826, "global_step": 77366, "epoch": 1842} {"train_loss": -6.136411666870117, "global_step": 77367, "epoch": 1842} {"train_loss": -6.168951034545898, "global_step": 77368, "epoch": 1842} {"train_loss": -6.110381126403809, "global_step": 77369, "epoch": 1842} {"train_loss": -6.250227928161621, "global_step": 77370, "epoch": 1842} {"train_loss": -6.115811347961426, "global_step": 77371, "epoch": 1842} {"train_loss": -6.045187950134277, "global_step": 77372, "epoch": 1842} {"train_loss": -6.187511444091797, "global_step": 77373, "epoch": 1842} {"train_loss": -6.154331207275391, "global_step": 77374, "epoch": 1842} {"train_loss": -6.06568717956543, "global_step": 77375, "epoch": 1842} {"train_loss": -6.105152606964111, "global_step": 77376, "epoch": 1842} {"train_loss": -6.173623561859131, "global_step": 77377, "epoch": 1842} {"train_loss": -6.1929450035095215, "global_step": 77378, "epoch": 1842} {"train_loss": -6.103024482727051, "global_step": 77379, "epoch": 1842} {"train_loss": -6.147021770477295, "global_step": 77380, "epoch": 1842} {"train_loss": -6.151945114135742, "global_step": 77381, "epoch": 1842} {"train_loss": -6.055233478546143, "global_step": 77382, "epoch": 1842} {"train_loss": -6.113650321960449, "global_step": 77383, "epoch": 1842} {"train_loss": -6.24428653717041, "global_step": 77384, "epoch": 1842} {"train_loss": -6.065009117126465, "global_step": 77385, "epoch": 1842} {"train_loss": -6.134790897369385, "global_step": 77386, "epoch": 1842} {"train_loss": -6.327341556549072, "global_step": 77387, "epoch": 1842} {"train_loss": -6.219036102294922, "global_step": 77388, "epoch": 1842} {"train_loss": -6.140100479125977, "global_step": 77389, "epoch": 1842} {"train_loss": -6.152754306793213, "global_step": 77390, "epoch": 1842} {"train_loss": -6.0955939292907715, "global_step": 77391, "epoch": 1842} {"train_loss": -6.122262954711914, "global_step": 77392, "epoch": 1842} {"train_loss": -6.271427154541016, "global_step": 77393, "epoch": 1842} {"train_loss": -6.111555099487305, "global_step": 77394, "epoch": 1842} {"train_loss": -6.002870559692383, "global_step": 77395, "epoch": 1842} {"train_loss": -5.991138458251953, "global_step": 77396, "epoch": 1842} {"train_loss": -6.040041446685791, "global_step": 77397, "epoch": 1842} {"train_loss": -6.038796424865723, "global_step": 77398, "epoch": 1842} {"train_loss": -6.019560813903809, "global_step": 77399, "epoch": 1842} {"train_loss": -6.099023818969727, "global_step": 77400, "epoch": 1842} {"train_loss": -6.063835144042969, "global_step": 77401, "epoch": 1842} {"train_loss": -6.009363651275635, "global_step": 77402, "epoch": 1842} {"train_loss": -6.092594623565674, "global_step": 77403, "epoch": 1842} {"train_loss": -6.069757461547852, "global_step": 77404, "epoch": 1842} {"train_loss": -6.120097296578543, "global_step": 77405, "epoch": 1842, "val_loss": 62425.5546875} {"train_loss": -6.134938716888428, "global_step": 77406, "epoch": 1843} {"train_loss": -6.165130615234375, "global_step": 77407, "epoch": 1843} {"train_loss": -5.978318214416504, "global_step": 77408, "epoch": 1843} {"train_loss": -6.086266994476318, "global_step": 77409, "epoch": 1843} {"train_loss": -6.002094268798828, "global_step": 77410, "epoch": 1843} {"train_loss": -6.088685989379883, "global_step": 77411, "epoch": 1843} {"train_loss": -5.9610419273376465, "global_step": 77412, "epoch": 1843} {"train_loss": -6.173938751220703, "global_step": 77413, "epoch": 1843} {"train_loss": -6.179335117340088, "global_step": 77414, "epoch": 1843} {"train_loss": -6.048254489898682, "global_step": 77415, "epoch": 1843} {"train_loss": -6.07707405090332, "global_step": 77416, "epoch": 1843} {"train_loss": -5.996094703674316, "global_step": 77417, "epoch": 1843} {"train_loss": -6.077802658081055, "global_step": 77418, "epoch": 1843} {"train_loss": -6.129995822906494, "global_step": 77419, "epoch": 1843} {"train_loss": -6.030463695526123, "global_step": 77420, "epoch": 1843} {"train_loss": -6.163481712341309, "global_step": 77421, "epoch": 1843} {"train_loss": -6.072129249572754, "global_step": 77422, "epoch": 1843} {"train_loss": -6.041196346282959, "global_step": 77423, "epoch": 1843} {"train_loss": -6.027101039886475, "global_step": 77424, "epoch": 1843} {"train_loss": -6.221096038818359, "global_step": 77425, "epoch": 1843} {"train_loss": -6.2610979080200195, "global_step": 77426, "epoch": 1843} {"train_loss": -6.137824058532715, "global_step": 77427, "epoch": 1843} {"train_loss": -6.0785112380981445, "global_step": 77428, "epoch": 1843} {"train_loss": -6.107692241668701, "global_step": 77429, "epoch": 1843} {"train_loss": -6.231288433074951, "global_step": 77430, "epoch": 1843} {"train_loss": -6.113885879516602, "global_step": 77431, "epoch": 1843} {"train_loss": -6.193443775177002, "global_step": 77432, "epoch": 1843} {"train_loss": -6.109764575958252, "global_step": 77433, "epoch": 1843} {"train_loss": -6.086061000823975, "global_step": 77434, "epoch": 1843} {"train_loss": -6.114654541015625, "global_step": 77435, "epoch": 1843} {"train_loss": -6.082723617553711, "global_step": 77436, "epoch": 1843} {"train_loss": -6.140678405761719, "global_step": 77437, "epoch": 1843} {"train_loss": -6.181816577911377, "global_step": 77438, "epoch": 1843} {"train_loss": -6.226720809936523, "global_step": 77439, "epoch": 1843} {"train_loss": -6.083512783050537, "global_step": 77440, "epoch": 1843} {"train_loss": -6.138699054718018, "global_step": 77441, "epoch": 1843} {"train_loss": -6.192372798919678, "global_step": 77442, "epoch": 1843} {"train_loss": -6.048742294311523, "global_step": 77443, "epoch": 1843} {"train_loss": -6.123740196228027, "global_step": 77444, "epoch": 1843} {"train_loss": -6.1719207763671875, "global_step": 77445, "epoch": 1843} {"train_loss": -5.9433393478393555, "global_step": 77446, "epoch": 1843} {"train_loss": -6.106821582430885, "global_step": 77447, "epoch": 1843, "val_loss": 62061.734375} {"train_loss": -6.0765299797058105, "global_step": 77448, "epoch": 1844} {"train_loss": -6.07257080078125, "global_step": 77449, "epoch": 1844} {"train_loss": -6.117584228515625, "global_step": 77450, "epoch": 1844} {"train_loss": -6.1570844650268555, "global_step": 77451, "epoch": 1844} {"train_loss": -6.171114921569824, "global_step": 77452, "epoch": 1844} {"train_loss": -6.18062686920166, "global_step": 77453, "epoch": 1844} {"train_loss": -6.117617607116699, "global_step": 77454, "epoch": 1844} {"train_loss": -6.110744953155518, "global_step": 77455, "epoch": 1844} {"train_loss": -6.172135353088379, "global_step": 77456, "epoch": 1844} {"train_loss": -6.15062141418457, "global_step": 77457, "epoch": 1844} {"train_loss": -6.10221529006958, "global_step": 77458, "epoch": 1844} {"train_loss": -6.023897171020508, "global_step": 77459, "epoch": 1844} {"train_loss": -6.162557601928711, "global_step": 77460, "epoch": 1844} {"train_loss": -6.0272111892700195, "global_step": 77461, "epoch": 1844} {"train_loss": -6.005455017089844, "global_step": 77462, "epoch": 1844} {"train_loss": -6.085951805114746, "global_step": 77463, "epoch": 1844} {"train_loss": -6.149292469024658, "global_step": 77464, "epoch": 1844} {"train_loss": -6.066136360168457, "global_step": 77465, "epoch": 1844} {"train_loss": -6.112569332122803, "global_step": 77466, "epoch": 1844} {"train_loss": -6.032705307006836, "global_step": 77467, "epoch": 1844} {"train_loss": -6.14631462097168, "global_step": 77468, "epoch": 1844} {"train_loss": -6.126576900482178, "global_step": 77469, "epoch": 1844} {"train_loss": -6.147965431213379, "global_step": 77470, "epoch": 1844} {"train_loss": -6.1022539138793945, "global_step": 77471, "epoch": 1844} {"train_loss": -6.090954780578613, "global_step": 77472, "epoch": 1844} {"train_loss": -6.042270660400391, "global_step": 77473, "epoch": 1844} {"train_loss": -6.125367164611816, "global_step": 77474, "epoch": 1844} {"train_loss": -6.038840293884277, "global_step": 77475, "epoch": 1844} {"train_loss": -6.065932750701904, "global_step": 77476, "epoch": 1844} {"train_loss": -6.045122146606445, "global_step": 77477, "epoch": 1844} {"train_loss": -6.1212592124938965, "global_step": 77478, "epoch": 1844} {"train_loss": -6.237269401550293, "global_step": 77479, "epoch": 1844} {"train_loss": -5.972639083862305, "global_step": 77480, "epoch": 1844} {"train_loss": -6.161819934844971, "global_step": 77481, "epoch": 1844} {"train_loss": -6.107264995574951, "global_step": 77482, "epoch": 1844} {"train_loss": -6.053644180297852, "global_step": 77483, "epoch": 1844} {"train_loss": -6.180000305175781, "global_step": 77484, "epoch": 1844} {"train_loss": -6.190728187561035, "global_step": 77485, "epoch": 1844} {"train_loss": -6.117329120635986, "global_step": 77486, "epoch": 1844} {"train_loss": -6.009685516357422, "global_step": 77487, "epoch": 1844} {"train_loss": -6.07520866394043, "global_step": 77488, "epoch": 1844} {"train_loss": -6.107103779202416, "global_step": 77489, "epoch": 1844, "val_loss": 62236.31640625} {"train_loss": -6.108829498291016, "global_step": 77490, "epoch": 1845} {"train_loss": -6.205387115478516, "global_step": 77491, "epoch": 1845} {"train_loss": -6.008631229400635, "global_step": 77492, "epoch": 1845} {"train_loss": -6.063928604125977, "global_step": 77493, "epoch": 1845} {"train_loss": -6.128867149353027, "global_step": 77494, "epoch": 1845} {"train_loss": -6.142853736877441, "global_step": 77495, "epoch": 1845} {"train_loss": -6.151777744293213, "global_step": 77496, "epoch": 1845} {"train_loss": -6.160583972930908, "global_step": 77497, "epoch": 1845} {"train_loss": -6.154184341430664, "global_step": 77498, "epoch": 1845} {"train_loss": -6.157932281494141, "global_step": 77499, "epoch": 1845} {"train_loss": -6.178708076477051, "global_step": 77500, "epoch": 1845} {"train_loss": -6.107774257659912, "global_step": 77501, "epoch": 1845} {"train_loss": -6.13615608215332, "global_step": 77502, "epoch": 1845} {"train_loss": -6.139648914337158, "global_step": 77503, "epoch": 1845} {"train_loss": -6.0497660636901855, "global_step": 77504, "epoch": 1845} {"train_loss": -6.1330389976501465, "global_step": 77505, "epoch": 1845} {"train_loss": -6.076781272888184, "global_step": 77506, "epoch": 1845} {"train_loss": -6.128443717956543, "global_step": 77507, "epoch": 1845} {"train_loss": -6.03121280670166, "global_step": 77508, "epoch": 1845} {"train_loss": -6.210497856140137, "global_step": 77509, "epoch": 1845} {"train_loss": -6.048954010009766, "global_step": 77510, "epoch": 1845} {"train_loss": -6.25737190246582, "global_step": 77511, "epoch": 1845} {"train_loss": -6.1352033615112305, "global_step": 77512, "epoch": 1845} {"train_loss": -6.136561870574951, "global_step": 77513, "epoch": 1845} {"train_loss": -6.22186279296875, "global_step": 77514, "epoch": 1845} {"train_loss": -6.052577972412109, "global_step": 77515, "epoch": 1845} {"train_loss": -6.055698394775391, "global_step": 77516, "epoch": 1845} {"train_loss": -6.0992350578308105, "global_step": 77517, "epoch": 1845} {"train_loss": -6.133657455444336, "global_step": 77518, "epoch": 1845} {"train_loss": -6.0785627365112305, "global_step": 77519, "epoch": 1845} {"train_loss": -6.049116611480713, "global_step": 77520, "epoch": 1845} {"train_loss": -6.006106853485107, "global_step": 77521, "epoch": 1845} {"train_loss": -6.112873554229736, "global_step": 77522, "epoch": 1845} {"train_loss": -6.0980682373046875, "global_step": 77523, "epoch": 1845} {"train_loss": -6.062433242797852, "global_step": 77524, "epoch": 1845} {"train_loss": -6.111460208892822, "global_step": 77525, "epoch": 1845} {"train_loss": -6.152891159057617, "global_step": 77526, "epoch": 1845} {"train_loss": -6.145801544189453, "global_step": 77527, "epoch": 1845} {"train_loss": -6.1611127853393555, "global_step": 77528, "epoch": 1845} {"train_loss": -6.079407215118408, "global_step": 77529, "epoch": 1845} {"train_loss": -6.052608489990234, "global_step": 77530, "epoch": 1845} {"train_loss": -6.115886177335467, "global_step": 77531, "epoch": 1845, "val_loss": 62112.140625} {"train_loss": -6.059830665588379, "global_step": 77532, "epoch": 1846} {"train_loss": -6.151398658752441, "global_step": 77533, "epoch": 1846} {"train_loss": -6.180837631225586, "global_step": 77534, "epoch": 1846} {"train_loss": -6.128834247589111, "global_step": 77535, "epoch": 1846} {"train_loss": -5.997428894042969, "global_step": 77536, "epoch": 1846} {"train_loss": -6.198980808258057, "global_step": 77537, "epoch": 1846} {"train_loss": -6.128016471862793, "global_step": 77538, "epoch": 1846} {"train_loss": -6.182380199432373, "global_step": 77539, "epoch": 1846} {"train_loss": -6.227353572845459, "global_step": 77540, "epoch": 1846} {"train_loss": -6.1832990646362305, "global_step": 77541, "epoch": 1846} {"train_loss": -6.182552337646484, "global_step": 77542, "epoch": 1846} {"train_loss": -6.143923282623291, "global_step": 77543, "epoch": 1846} {"train_loss": -6.097417831420898, "global_step": 77544, "epoch": 1846} {"train_loss": -6.014634609222412, "global_step": 77545, "epoch": 1846} {"train_loss": -6.003180503845215, "global_step": 77546, "epoch": 1846} {"train_loss": -6.079270362854004, "global_step": 77547, "epoch": 1846} {"train_loss": -6.051203727722168, "global_step": 77548, "epoch": 1846} {"train_loss": -6.190216064453125, "global_step": 77549, "epoch": 1846} {"train_loss": -6.182474136352539, "global_step": 77550, "epoch": 1846} {"train_loss": -6.1115875244140625, "global_step": 77551, "epoch": 1846} {"train_loss": -6.047439098358154, "global_step": 77552, "epoch": 1846} {"train_loss": -6.08543586730957, "global_step": 77553, "epoch": 1846} {"train_loss": -6.098325729370117, "global_step": 77554, "epoch": 1846} {"train_loss": -6.029778480529785, "global_step": 77555, "epoch": 1846} {"train_loss": -6.179123878479004, "global_step": 77556, "epoch": 1846} {"train_loss": -6.150327682495117, "global_step": 77557, "epoch": 1846} {"train_loss": -6.091228485107422, "global_step": 77558, "epoch": 1846} {"train_loss": -6.0756988525390625, "global_step": 77559, "epoch": 1846} {"train_loss": -6.1611785888671875, "global_step": 77560, "epoch": 1846} {"train_loss": -6.005545616149902, "global_step": 77561, "epoch": 1846} {"train_loss": -6.063774585723877, "global_step": 77562, "epoch": 1846} {"train_loss": -6.029650688171387, "global_step": 77563, "epoch": 1846} {"train_loss": -6.105639457702637, "global_step": 77564, "epoch": 1846} {"train_loss": -6.028566360473633, "global_step": 77565, "epoch": 1846} {"train_loss": -6.233523368835449, "global_step": 77566, "epoch": 1846} {"train_loss": -6.009039878845215, "global_step": 77567, "epoch": 1846} {"train_loss": -6.049438953399658, "global_step": 77568, "epoch": 1846} {"train_loss": -6.111593723297119, "global_step": 77569, "epoch": 1846} {"train_loss": -6.118338584899902, "global_step": 77570, "epoch": 1846} {"train_loss": -6.140486240386963, "global_step": 77571, "epoch": 1846} {"train_loss": -6.077692985534668, "global_step": 77572, "epoch": 1846} {"train_loss": -6.105771428062802, "global_step": 77573, "epoch": 1846, "val_loss": 62311.79296875} {"train_loss": -6.023733139038086, "global_step": 77574, "epoch": 1847} {"train_loss": -6.0627617835998535, "global_step": 77575, "epoch": 1847} {"train_loss": -6.171801567077637, "global_step": 77576, "epoch": 1847} {"train_loss": -6.142307281494141, "global_step": 77577, "epoch": 1847} {"train_loss": -6.050136089324951, "global_step": 77578, "epoch": 1847} {"train_loss": -6.137876987457275, "global_step": 77579, "epoch": 1847} {"train_loss": -6.2138671875, "global_step": 77580, "epoch": 1847} {"train_loss": -6.135576248168945, "global_step": 77581, "epoch": 1847} {"train_loss": -6.124828815460205, "global_step": 77582, "epoch": 1847} {"train_loss": -6.109100341796875, "global_step": 77583, "epoch": 1847} {"train_loss": -6.113936424255371, "global_step": 77584, "epoch": 1847} {"train_loss": -6.17249870300293, "global_step": 77585, "epoch": 1847} {"train_loss": -6.208067417144775, "global_step": 77586, "epoch": 1847} {"train_loss": -6.093868732452393, "global_step": 77587, "epoch": 1847} {"train_loss": -6.195148468017578, "global_step": 77588, "epoch": 1847} {"train_loss": -6.243217468261719, "global_step": 77589, "epoch": 1847} {"train_loss": -6.1219940185546875, "global_step": 77590, "epoch": 1847} {"train_loss": -6.020963191986084, "global_step": 77591, "epoch": 1847} {"train_loss": -6.20753288269043, "global_step": 77592, "epoch": 1847} {"train_loss": -6.235618591308594, "global_step": 77593, "epoch": 1847} {"train_loss": -6.056970596313477, "global_step": 77594, "epoch": 1847} {"train_loss": -6.073470115661621, "global_step": 77595, "epoch": 1847} {"train_loss": -6.311657428741455, "global_step": 77596, "epoch": 1847} {"train_loss": -6.021456718444824, "global_step": 77597, "epoch": 1847} {"train_loss": -5.994195938110352, "global_step": 77598, "epoch": 1847} {"train_loss": -6.120335578918457, "global_step": 77599, "epoch": 1847} {"train_loss": -6.083907127380371, "global_step": 77600, "epoch": 1847} {"train_loss": -6.081291198730469, "global_step": 77601, "epoch": 1847} {"train_loss": -6.037083625793457, "global_step": 77602, "epoch": 1847} {"train_loss": -6.004099369049072, "global_step": 77603, "epoch": 1847} {"train_loss": -6.075894355773926, "global_step": 77604, "epoch": 1847} {"train_loss": -6.148447036743164, "global_step": 77605, "epoch": 1847} {"train_loss": -6.004769802093506, "global_step": 77606, "epoch": 1847} {"train_loss": -6.104860305786133, "global_step": 77607, "epoch": 1847} {"train_loss": -6.150430202484131, "global_step": 77608, "epoch": 1847} {"train_loss": -6.069101333618164, "global_step": 77609, "epoch": 1847} {"train_loss": -6.118721008300781, "global_step": 77610, "epoch": 1847} {"train_loss": -6.1636152267456055, "global_step": 77611, "epoch": 1847} {"train_loss": -6.060241222381592, "global_step": 77612, "epoch": 1847} {"train_loss": -6.129410266876221, "global_step": 77613, "epoch": 1847} {"train_loss": -5.879030227661133, "global_step": 77614, "epoch": 1847} {"train_loss": -6.107946827298119, "global_step": 77615, "epoch": 1847, "val_loss": 62280.609375} {"train_loss": -6.005544662475586, "global_step": 77616, "epoch": 1848} {"train_loss": -6.064012050628662, "global_step": 77617, "epoch": 1848} {"train_loss": -6.212058067321777, "global_step": 77618, "epoch": 1848} {"train_loss": -6.179107666015625, "global_step": 77619, "epoch": 1848} {"train_loss": -6.118765830993652, "global_step": 77620, "epoch": 1848} {"train_loss": -6.168661594390869, "global_step": 77621, "epoch": 1848} {"train_loss": -6.1360764503479, "global_step": 77622, "epoch": 1848} {"train_loss": -6.063661575317383, "global_step": 77623, "epoch": 1848} {"train_loss": -6.016872882843018, "global_step": 77624, "epoch": 1848} {"train_loss": -6.2183403968811035, "global_step": 77625, "epoch": 1848} {"train_loss": -6.202686309814453, "global_step": 77626, "epoch": 1848} {"train_loss": -6.052555561065674, "global_step": 77627, "epoch": 1848} {"train_loss": -6.106926918029785, "global_step": 77628, "epoch": 1848} {"train_loss": -6.16221809387207, "global_step": 77629, "epoch": 1848} {"train_loss": -6.120120048522949, "global_step": 77630, "epoch": 1848} {"train_loss": -6.0586748123168945, "global_step": 77631, "epoch": 1848} {"train_loss": -6.103629112243652, "global_step": 77632, "epoch": 1848} {"train_loss": -6.2443742752075195, "global_step": 77633, "epoch": 1848} {"train_loss": -6.1751861572265625, "global_step": 77634, "epoch": 1848} {"train_loss": -6.095625877380371, "global_step": 77635, "epoch": 1848} {"train_loss": -6.176143169403076, "global_step": 77636, "epoch": 1848} {"train_loss": -6.0410356521606445, "global_step": 77637, "epoch": 1848} {"train_loss": -6.147186279296875, "global_step": 77638, "epoch": 1848} {"train_loss": -6.09022331237793, "global_step": 77639, "epoch": 1848} {"train_loss": -6.142757415771484, "global_step": 77640, "epoch": 1848} {"train_loss": -6.2186431884765625, "global_step": 77641, "epoch": 1848} {"train_loss": -6.107592582702637, "global_step": 77642, "epoch": 1848} {"train_loss": -6.042947769165039, "global_step": 77643, "epoch": 1848} {"train_loss": -6.203585147857666, "global_step": 77644, "epoch": 1848} {"train_loss": -6.204668998718262, "global_step": 77645, "epoch": 1848} {"train_loss": -6.1352362632751465, "global_step": 77646, "epoch": 1848} {"train_loss": -6.107764720916748, "global_step": 77647, "epoch": 1848} {"train_loss": -6.257952690124512, "global_step": 77648, "epoch": 1848} {"train_loss": -6.155673027038574, "global_step": 77649, "epoch": 1848} {"train_loss": -6.1605377197265625, "global_step": 77650, "epoch": 1848} {"train_loss": -6.121590614318848, "global_step": 77651, "epoch": 1848} {"train_loss": -6.281580924987793, "global_step": 77652, "epoch": 1848} {"train_loss": -6.210553169250488, "global_step": 77653, "epoch": 1848} {"train_loss": -6.018404006958008, "global_step": 77654, "epoch": 1848} {"train_loss": -6.212204933166504, "global_step": 77655, "epoch": 1848} {"train_loss": -6.049222946166992, "global_step": 77656, "epoch": 1848} {"train_loss": -6.137633391789028, "global_step": 77657, "epoch": 1848, "val_loss": 62109.3671875} {"train_loss": -6.202831268310547, "global_step": 77658, "epoch": 1849} {"train_loss": -6.09277868270874, "global_step": 77659, "epoch": 1849} {"train_loss": -6.0599493980407715, "global_step": 77660, "epoch": 1849} {"train_loss": -6.191254615783691, "global_step": 77661, "epoch": 1849} {"train_loss": -6.091683864593506, "global_step": 77662, "epoch": 1849} {"train_loss": -6.057704925537109, "global_step": 77663, "epoch": 1849} {"train_loss": -6.17975378036499, "global_step": 77664, "epoch": 1849} {"train_loss": -6.172822952270508, "global_step": 77665, "epoch": 1849} {"train_loss": -6.131879806518555, "global_step": 77666, "epoch": 1849} {"train_loss": -6.216245174407959, "global_step": 77667, "epoch": 1849} {"train_loss": -6.157700061798096, "global_step": 77668, "epoch": 1849} {"train_loss": -6.130020618438721, "global_step": 77669, "epoch": 1849} {"train_loss": -5.983105182647705, "global_step": 77670, "epoch": 1849} {"train_loss": -6.055936813354492, "global_step": 77671, "epoch": 1849} {"train_loss": -6.054192543029785, "global_step": 77672, "epoch": 1849} {"train_loss": -6.068180084228516, "global_step": 77673, "epoch": 1849} {"train_loss": -6.123485088348389, "global_step": 77674, "epoch": 1849} {"train_loss": -6.085165977478027, "global_step": 77675, "epoch": 1849} {"train_loss": -6.155762195587158, "global_step": 77676, "epoch": 1849} {"train_loss": -5.981148719787598, "global_step": 77677, "epoch": 1849} {"train_loss": -6.09123420715332, "global_step": 77678, "epoch": 1849} {"train_loss": -6.104170799255371, "global_step": 77679, "epoch": 1849} {"train_loss": -6.1378092765808105, "global_step": 77680, "epoch": 1849} {"train_loss": -5.9076008796691895, "global_step": 77681, "epoch": 1849} {"train_loss": -6.0475568771362305, "global_step": 77682, "epoch": 1849} {"train_loss": -5.937161445617676, "global_step": 77683, "epoch": 1849} {"train_loss": -6.16727876663208, "global_step": 77684, "epoch": 1849} {"train_loss": -6.0481085777282715, "global_step": 77685, "epoch": 1849} {"train_loss": -6.004602909088135, "global_step": 77686, "epoch": 1849} {"train_loss": -6.083808898925781, "global_step": 77687, "epoch": 1849} {"train_loss": -5.929940700531006, "global_step": 77688, "epoch": 1849} {"train_loss": -6.040833473205566, "global_step": 77689, "epoch": 1849} {"train_loss": -6.096993446350098, "global_step": 77690, "epoch": 1849} {"train_loss": -6.092532157897949, "global_step": 77691, "epoch": 1849} {"train_loss": -6.069881439208984, "global_step": 77692, "epoch": 1849} {"train_loss": -6.149003028869629, "global_step": 77693, "epoch": 1849} {"train_loss": -6.0965576171875, "global_step": 77694, "epoch": 1849} {"train_loss": -6.023714542388916, "global_step": 77695, "epoch": 1849} {"train_loss": -6.060042858123779, "global_step": 77696, "epoch": 1849} {"train_loss": -6.04517936706543, "global_step": 77697, "epoch": 1849} {"train_loss": -6.1341962814331055, "global_step": 77698, "epoch": 1849} {"train_loss": -6.082631769634428, "global_step": 77699, "epoch": 1849, "val_loss": 62231.71875} {"train_loss": -6.1729736328125, "global_step": 77700, "epoch": 1850} {"train_loss": -6.306710243225098, "global_step": 77701, "epoch": 1850} {"train_loss": -6.095545768737793, "global_step": 77702, "epoch": 1850} {"train_loss": -6.061344146728516, "global_step": 77703, "epoch": 1850} {"train_loss": -6.006453514099121, "global_step": 77704, "epoch": 1850} {"train_loss": -6.06048583984375, "global_step": 77705, "epoch": 1850} {"train_loss": -6.007282257080078, "global_step": 77706, "epoch": 1850} {"train_loss": -6.066953659057617, "global_step": 77707, "epoch": 1850} {"train_loss": -6.1755475997924805, "global_step": 77708, "epoch": 1850} {"train_loss": -6.038473129272461, "global_step": 77709, "epoch": 1850} {"train_loss": -6.081264495849609, "global_step": 77710, "epoch": 1850} {"train_loss": -6.085896015167236, "global_step": 77711, "epoch": 1850} {"train_loss": -6.2731781005859375, "global_step": 77712, "epoch": 1850} {"train_loss": -6.138212203979492, "global_step": 77713, "epoch": 1850} {"train_loss": -6.107043266296387, "global_step": 77714, "epoch": 1850} {"train_loss": -6.2000627517700195, "global_step": 77715, "epoch": 1850} {"train_loss": -6.0366058349609375, "global_step": 77716, "epoch": 1850} {"train_loss": -6.165701866149902, "global_step": 77717, "epoch": 1850} {"train_loss": -6.057340621948242, "global_step": 77718, "epoch": 1850} {"train_loss": -6.162322044372559, "global_step": 77719, "epoch": 1850} {"train_loss": -6.182572364807129, "global_step": 77720, "epoch": 1850} {"train_loss": -6.180013656616211, "global_step": 77721, "epoch": 1850} {"train_loss": -6.190604209899902, "global_step": 77722, "epoch": 1850} {"train_loss": -6.087679862976074, "global_step": 77723, "epoch": 1850} {"train_loss": -6.136422157287598, "global_step": 77724, "epoch": 1850} {"train_loss": -6.205979824066162, "global_step": 77725, "epoch": 1850} {"train_loss": -6.009426116943359, "global_step": 77726, "epoch": 1850} {"train_loss": -6.090404033660889, "global_step": 77727, "epoch": 1850} {"train_loss": -6.259546756744385, "global_step": 77728, "epoch": 1850} {"train_loss": -6.060069561004639, "global_step": 77729, "epoch": 1850} {"train_loss": -6.131037712097168, "global_step": 77730, "epoch": 1850} {"train_loss": -6.172394275665283, "global_step": 77731, "epoch": 1850} {"train_loss": -6.153863906860352, "global_step": 77732, "epoch": 1850} {"train_loss": -6.170385360717773, "global_step": 77733, "epoch": 1850} {"train_loss": -6.122533798217773, "global_step": 77734, "epoch": 1850} {"train_loss": -6.100176811218262, "global_step": 77735, "epoch": 1850} {"train_loss": -6.12020206451416, "global_step": 77736, "epoch": 1850} {"train_loss": -6.1017608642578125, "global_step": 77737, "epoch": 1850} {"train_loss": -6.171693801879883, "global_step": 77738, "epoch": 1850} {"train_loss": -6.069326400756836, "global_step": 77739, "epoch": 1850} {"train_loss": -6.150265216827393, "global_step": 77740, "epoch": 1850} {"train_loss": -6.125942128045218, "global_step": 77741, "epoch": 1850, "train/sim_max_reward_0": 0.6734656527246161, "train/sim_max_reward_1": 0.7244262615434661, "train/sim_max_reward_2": 0.8831468123151563, "train/sim_max_reward_3": 0.9346580403549934, "train/sim_max_reward_4": 0.8854857714523322, "train/sim_max_reward_5": 0.6866211028965384, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.9376633878015558, "test/sim_max_reward_4300002": 0.7862551189356591, "test/sim_max_reward_4300003": 0.9967556936225415, "test/sim_max_reward_4300004": 0.2761057103687821, "test/sim_max_reward_4300005": 0.7969200971196992, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9628247288955069, "test/sim_max_reward_4300008": 0.7380491270453535, "test/sim_max_reward_4300009": 0.8665073809467068, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.8269653174622511, "test/sim_max_reward_4300012": 0.6305723823632766, "test/sim_max_reward_4300013": 0.9964785831942217, "test/sim_max_reward_4300014": 0.8508944428991001, "test/sim_max_reward_4300015": 0.8893568505008727, "test/sim_max_reward_4300016": 0.7962862750579298, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.8746275559915904, "test/sim_max_reward_4300019": 0.18540362024748705, "test/sim_max_reward_4300020": 0.8900890864807732, "test/sim_max_reward_4300021": 0.765405335218248, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.34840543484504966, "test/sim_max_reward_4300024": 0.05737975128533643, "test/sim_max_reward_4300025": 0.9760924806462243, "test/sim_max_reward_4300026": 0.658665617897701, "test/sim_max_reward_4300027": 0.9863753316942699, "test/sim_max_reward_4300028": 0.0046851982405283505, "test/sim_max_reward_4300029": 0.0007411998238577134, "test/sim_max_reward_4300030": 0.11776389839125931, "test/sim_max_reward_4300031": 0.21649454219621356, "test/sim_max_reward_4300032": 0.8879888193418678, "test/sim_max_reward_4300033": 0.8404247007967675, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.3109686510717166, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.878690631711465, "test/sim_max_reward_4300038": 0.011142342833603323, "test/sim_max_reward_4300039": 0.8843103310762039, "test/sim_max_reward_4300040": 0.0, "test/sim_max_reward_4300041": 0.7576682208117238, "test/sim_max_reward_4300042": 0.8379341746775646, "test/sim_max_reward_4300043": 0.030682319031148337, "test/sim_max_reward_4300044": 0.4945192612154546, "test/sim_max_reward_4300045": 0.2973077333149933, "test/sim_max_reward_4300046": 0.027960517105728337, "test/sim_max_reward_4300047": 0.7410804032837627, "test/sim_max_reward_4300048": 0.02247908848174155, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.7979672735478504, "test/mean_score": 0.5331223091897843, "val_loss": 62047.9140625} {"train_loss": -6.108023643493652, "global_step": 77742, "epoch": 1851} {"train_loss": -6.1270294189453125, "global_step": 77743, "epoch": 1851} {"train_loss": -6.128109931945801, "global_step": 77744, "epoch": 1851} {"train_loss": -6.143693923950195, "global_step": 77745, "epoch": 1851} {"train_loss": -6.2385334968566895, "global_step": 77746, "epoch": 1851} {"train_loss": -6.090592861175537, "global_step": 77747, "epoch": 1851} {"train_loss": -6.1320600509643555, "global_step": 77748, "epoch": 1851} {"train_loss": -6.184012413024902, "global_step": 77749, "epoch": 1851} {"train_loss": -6.081938743591309, "global_step": 77750, "epoch": 1851} {"train_loss": -6.0882649421691895, "global_step": 77751, "epoch": 1851} {"train_loss": -6.11850118637085, "global_step": 77752, "epoch": 1851} {"train_loss": -6.0927581787109375, "global_step": 77753, "epoch": 1851} {"train_loss": -6.246539115905762, "global_step": 77754, "epoch": 1851} {"train_loss": -6.260998725891113, "global_step": 77755, "epoch": 1851} {"train_loss": -6.14404296875, "global_step": 77756, "epoch": 1851} {"train_loss": -6.100652694702148, "global_step": 77757, "epoch": 1851} {"train_loss": -6.121214866638184, "global_step": 77758, "epoch": 1851} {"train_loss": -6.07756233215332, "global_step": 77759, "epoch": 1851} {"train_loss": -6.232906341552734, "global_step": 77760, "epoch": 1851} {"train_loss": -6.1874847412109375, "global_step": 77761, "epoch": 1851} {"train_loss": -6.1146392822265625, "global_step": 77762, "epoch": 1851} {"train_loss": -6.018128395080566, "global_step": 77763, "epoch": 1851} {"train_loss": -6.154128551483154, "global_step": 77764, "epoch": 1851} {"train_loss": -6.1241374015808105, "global_step": 77765, "epoch": 1851} {"train_loss": -6.185333728790283, "global_step": 77766, "epoch": 1851} {"train_loss": -6.193243026733398, "global_step": 77767, "epoch": 1851} {"train_loss": -6.190898895263672, "global_step": 77768, "epoch": 1851} {"train_loss": -6.069735527038574, "global_step": 77769, "epoch": 1851} {"train_loss": -6.212302207946777, "global_step": 77770, "epoch": 1851} {"train_loss": -6.075504302978516, "global_step": 77771, "epoch": 1851} {"train_loss": -6.138525009155273, "global_step": 77772, "epoch": 1851} {"train_loss": -6.160455703735352, "global_step": 77773, "epoch": 1851} {"train_loss": -6.2060160636901855, "global_step": 77774, "epoch": 1851} {"train_loss": -6.0435943603515625, "global_step": 77775, "epoch": 1851} {"train_loss": -6.113897323608398, "global_step": 77776, "epoch": 1851} {"train_loss": -6.154397964477539, "global_step": 77777, "epoch": 1851} {"train_loss": -6.173396587371826, "global_step": 77778, "epoch": 1851} {"train_loss": -5.946719169616699, "global_step": 77779, "epoch": 1851} {"train_loss": -6.242980003356934, "global_step": 77780, "epoch": 1851} {"train_loss": -6.083462238311768, "global_step": 77781, "epoch": 1851} {"train_loss": -6.19934606552124, "global_step": 77782, "epoch": 1851} {"train_loss": -6.135287852514358, "global_step": 77783, "epoch": 1851, "val_loss": 61912.7421875} {"train_loss": -6.086353302001953, "global_step": 77784, "epoch": 1852} {"train_loss": -6.213044166564941, "global_step": 77785, "epoch": 1852} {"train_loss": -6.117712020874023, "global_step": 77786, "epoch": 1852} {"train_loss": -6.090826988220215, "global_step": 77787, "epoch": 1852} {"train_loss": -6.005430698394775, "global_step": 77788, "epoch": 1852} {"train_loss": -6.1114397048950195, "global_step": 77789, "epoch": 1852} {"train_loss": -6.163592338562012, "global_step": 77790, "epoch": 1852} {"train_loss": -6.2169189453125, "global_step": 77791, "epoch": 1852} {"train_loss": -6.186316013336182, "global_step": 77792, "epoch": 1852} {"train_loss": -6.174304962158203, "global_step": 77793, "epoch": 1852} {"train_loss": -6.203183174133301, "global_step": 77794, "epoch": 1852} {"train_loss": -6.205170154571533, "global_step": 77795, "epoch": 1852} {"train_loss": -6.118134498596191, "global_step": 77796, "epoch": 1852} {"train_loss": -6.310220718383789, "global_step": 77797, "epoch": 1852} {"train_loss": -6.0536370277404785, "global_step": 77798, "epoch": 1852} {"train_loss": -5.984217643737793, "global_step": 77799, "epoch": 1852} {"train_loss": -6.198814392089844, "global_step": 77800, "epoch": 1852} {"train_loss": -6.008274078369141, "global_step": 77801, "epoch": 1852} {"train_loss": -6.190566062927246, "global_step": 77802, "epoch": 1852} {"train_loss": -6.1519317626953125, "global_step": 77803, "epoch": 1852} {"train_loss": -6.106904029846191, "global_step": 77804, "epoch": 1852} {"train_loss": -6.117744445800781, "global_step": 77805, "epoch": 1852} {"train_loss": -6.053942680358887, "global_step": 77806, "epoch": 1852} {"train_loss": -6.097386837005615, "global_step": 77807, "epoch": 1852} {"train_loss": -6.146761894226074, "global_step": 77808, "epoch": 1852} {"train_loss": -6.124481201171875, "global_step": 77809, "epoch": 1852} {"train_loss": -6.138237953186035, "global_step": 77810, "epoch": 1852} {"train_loss": -6.208264350891113, "global_step": 77811, "epoch": 1852} {"train_loss": -6.166254043579102, "global_step": 77812, "epoch": 1852} {"train_loss": -6.124129295349121, "global_step": 77813, "epoch": 1852} {"train_loss": -6.098453998565674, "global_step": 77814, "epoch": 1852} {"train_loss": -6.0834808349609375, "global_step": 77815, "epoch": 1852} {"train_loss": -6.082278251647949, "global_step": 77816, "epoch": 1852} {"train_loss": -6.132419109344482, "global_step": 77817, "epoch": 1852} {"train_loss": -6.058060646057129, "global_step": 77818, "epoch": 1852} {"train_loss": -6.108178615570068, "global_step": 77819, "epoch": 1852} {"train_loss": -6.105020523071289, "global_step": 77820, "epoch": 1852} {"train_loss": -6.189648628234863, "global_step": 77821, "epoch": 1852} {"train_loss": -6.208719253540039, "global_step": 77822, "epoch": 1852} {"train_loss": -6.066709518432617, "global_step": 77823, "epoch": 1852} {"train_loss": -6.1336565017700195, "global_step": 77824, "epoch": 1852} {"train_loss": -6.128802027021136, "global_step": 77825, "epoch": 1852, "val_loss": 62190.69921875} {"train_loss": -6.031880855560303, "global_step": 77826, "epoch": 1853} {"train_loss": -6.047858715057373, "global_step": 77827, "epoch": 1853} {"train_loss": -6.16987419128418, "global_step": 77828, "epoch": 1853} {"train_loss": -6.176627159118652, "global_step": 77829, "epoch": 1853} {"train_loss": -6.021965980529785, "global_step": 77830, "epoch": 1853} {"train_loss": -6.21132230758667, "global_step": 77831, "epoch": 1853} {"train_loss": -6.054998397827148, "global_step": 77832, "epoch": 1853} {"train_loss": -6.12252140045166, "global_step": 77833, "epoch": 1853} {"train_loss": -6.128758430480957, "global_step": 77834, "epoch": 1853} {"train_loss": -6.100854396820068, "global_step": 77835, "epoch": 1853} {"train_loss": -6.184069633483887, "global_step": 77836, "epoch": 1853} {"train_loss": -6.154815673828125, "global_step": 77837, "epoch": 1853} {"train_loss": -6.169013500213623, "global_step": 77838, "epoch": 1853} {"train_loss": -6.105707168579102, "global_step": 77839, "epoch": 1853} {"train_loss": -6.1580352783203125, "global_step": 77840, "epoch": 1853} {"train_loss": -6.188553810119629, "global_step": 77841, "epoch": 1853} {"train_loss": -6.195030689239502, "global_step": 77842, "epoch": 1853} {"train_loss": -6.021356582641602, "global_step": 77843, "epoch": 1853} {"train_loss": -6.280285835266113, "global_step": 77844, "epoch": 1853} {"train_loss": -6.174320697784424, "global_step": 77845, "epoch": 1853} {"train_loss": -6.301302909851074, "global_step": 77846, "epoch": 1853} {"train_loss": -6.119204521179199, "global_step": 77847, "epoch": 1853} {"train_loss": -6.107651710510254, "global_step": 77848, "epoch": 1853} {"train_loss": -6.1775970458984375, "global_step": 77849, "epoch": 1853} {"train_loss": -6.072877883911133, "global_step": 77850, "epoch": 1853} {"train_loss": -6.1317338943481445, "global_step": 77851, "epoch": 1853} {"train_loss": -6.084564208984375, "global_step": 77852, "epoch": 1853} {"train_loss": -6.1249284744262695, "global_step": 77853, "epoch": 1853} {"train_loss": -6.053272724151611, "global_step": 77854, "epoch": 1853} {"train_loss": -6.085774898529053, "global_step": 77855, "epoch": 1853} {"train_loss": -6.102931976318359, "global_step": 77856, "epoch": 1853} {"train_loss": -6.08071231842041, "global_step": 77857, "epoch": 1853} {"train_loss": -6.124783992767334, "global_step": 77858, "epoch": 1853} {"train_loss": -6.036941051483154, "global_step": 77859, "epoch": 1853} {"train_loss": -6.188715934753418, "global_step": 77860, "epoch": 1853} {"train_loss": -6.22784423828125, "global_step": 77861, "epoch": 1853} {"train_loss": -6.022058963775635, "global_step": 77862, "epoch": 1853} {"train_loss": -6.300362586975098, "global_step": 77863, "epoch": 1853} {"train_loss": -6.14780330657959, "global_step": 77864, "epoch": 1853} {"train_loss": -6.0408244132995605, "global_step": 77865, "epoch": 1853} {"train_loss": -6.075325965881348, "global_step": 77866, "epoch": 1853} {"train_loss": -6.128055549803234, "global_step": 77867, "epoch": 1853, "val_loss": 62270.4375} {"train_loss": -6.065319061279297, "global_step": 77868, "epoch": 1854} {"train_loss": -6.171390533447266, "global_step": 77869, "epoch": 1854} {"train_loss": -6.0250349044799805, "global_step": 77870, "epoch": 1854} {"train_loss": -6.142693996429443, "global_step": 77871, "epoch": 1854} {"train_loss": -6.187863349914551, "global_step": 77872, "epoch": 1854} {"train_loss": -6.099944114685059, "global_step": 77873, "epoch": 1854} {"train_loss": -6.171879768371582, "global_step": 77874, "epoch": 1854} {"train_loss": -6.273146629333496, "global_step": 77875, "epoch": 1854} {"train_loss": -5.994219779968262, "global_step": 77876, "epoch": 1854} {"train_loss": -5.953311920166016, "global_step": 77877, "epoch": 1854} {"train_loss": -6.151754379272461, "global_step": 77878, "epoch": 1854} {"train_loss": -6.020478248596191, "global_step": 77879, "epoch": 1854} {"train_loss": -6.214912414550781, "global_step": 77880, "epoch": 1854} {"train_loss": -6.183932781219482, "global_step": 77881, "epoch": 1854} {"train_loss": -6.169874668121338, "global_step": 77882, "epoch": 1854} {"train_loss": -6.132643699645996, "global_step": 77883, "epoch": 1854} {"train_loss": -6.005255222320557, "global_step": 77884, "epoch": 1854} {"train_loss": -6.093136787414551, "global_step": 77885, "epoch": 1854} {"train_loss": -6.039887428283691, "global_step": 77886, "epoch": 1854} {"train_loss": -6.176483631134033, "global_step": 77887, "epoch": 1854} {"train_loss": -6.111441135406494, "global_step": 77888, "epoch": 1854} {"train_loss": -6.096726894378662, "global_step": 77889, "epoch": 1854} {"train_loss": -6.127630710601807, "global_step": 77890, "epoch": 1854} {"train_loss": -6.1742706298828125, "global_step": 77891, "epoch": 1854} {"train_loss": -6.085620880126953, "global_step": 77892, "epoch": 1854} {"train_loss": -6.030289649963379, "global_step": 77893, "epoch": 1854} {"train_loss": -6.126108169555664, "global_step": 77894, "epoch": 1854} {"train_loss": -6.144682884216309, "global_step": 77895, "epoch": 1854} {"train_loss": -6.227713108062744, "global_step": 77896, "epoch": 1854} {"train_loss": -6.075294017791748, "global_step": 77897, "epoch": 1854} {"train_loss": -6.090734958648682, "global_step": 77898, "epoch": 1854} {"train_loss": -6.149150371551514, "global_step": 77899, "epoch": 1854} {"train_loss": -6.228663444519043, "global_step": 77900, "epoch": 1854} {"train_loss": -6.10301399230957, "global_step": 77901, "epoch": 1854} {"train_loss": -6.162834644317627, "global_step": 77902, "epoch": 1854} {"train_loss": -6.1377458572387695, "global_step": 77903, "epoch": 1854} {"train_loss": -6.111493110656738, "global_step": 77904, "epoch": 1854} {"train_loss": -6.234235763549805, "global_step": 77905, "epoch": 1854} {"train_loss": -6.066531181335449, "global_step": 77906, "epoch": 1854} {"train_loss": -6.056451797485352, "global_step": 77907, "epoch": 1854} {"train_loss": -6.2383575439453125, "global_step": 77908, "epoch": 1854} {"train_loss": -6.120984974361601, "global_step": 77909, "epoch": 1854, "val_loss": 62279.98046875} {"train_loss": -6.088216781616211, "global_step": 77910, "epoch": 1855} {"train_loss": -6.190245628356934, "global_step": 77911, "epoch": 1855} {"train_loss": -6.151515007019043, "global_step": 77912, "epoch": 1855} {"train_loss": -6.09665584564209, "global_step": 77913, "epoch": 1855} {"train_loss": -6.1973114013671875, "global_step": 77914, "epoch": 1855} {"train_loss": -6.0910539627075195, "global_step": 77915, "epoch": 1855} {"train_loss": -6.091800689697266, "global_step": 77916, "epoch": 1855} {"train_loss": -6.229148864746094, "global_step": 77917, "epoch": 1855} {"train_loss": -6.160738945007324, "global_step": 77918, "epoch": 1855} {"train_loss": -6.2309465408325195, "global_step": 77919, "epoch": 1855} {"train_loss": -6.120386123657227, "global_step": 77920, "epoch": 1855} {"train_loss": -6.1339569091796875, "global_step": 77921, "epoch": 1855} {"train_loss": -6.258180618286133, "global_step": 77922, "epoch": 1855} {"train_loss": -6.148613929748535, "global_step": 77923, "epoch": 1855} {"train_loss": -6.141112804412842, "global_step": 77924, "epoch": 1855} {"train_loss": -6.175366401672363, "global_step": 77925, "epoch": 1855} {"train_loss": -6.113783836364746, "global_step": 77926, "epoch": 1855} {"train_loss": -6.220922946929932, "global_step": 77927, "epoch": 1855} {"train_loss": -6.093362331390381, "global_step": 77928, "epoch": 1855} {"train_loss": -6.142653465270996, "global_step": 77929, "epoch": 1855} {"train_loss": -6.132453918457031, "global_step": 77930, "epoch": 1855} {"train_loss": -6.091489791870117, "global_step": 77931, "epoch": 1855} {"train_loss": -6.220361709594727, "global_step": 77932, "epoch": 1855} {"train_loss": -6.048980712890625, "global_step": 77933, "epoch": 1855} {"train_loss": -6.2596940994262695, "global_step": 77934, "epoch": 1855} {"train_loss": -6.101651668548584, "global_step": 77935, "epoch": 1855} {"train_loss": -6.062183380126953, "global_step": 77936, "epoch": 1855} {"train_loss": -6.151392936706543, "global_step": 77937, "epoch": 1855} {"train_loss": -6.142283916473389, "global_step": 77938, "epoch": 1855} {"train_loss": -6.038407325744629, "global_step": 77939, "epoch": 1855} {"train_loss": -6.036003112792969, "global_step": 77940, "epoch": 1855} {"train_loss": -6.0590925216674805, "global_step": 77941, "epoch": 1855} {"train_loss": -6.102344512939453, "global_step": 77942, "epoch": 1855} {"train_loss": -6.054306983947754, "global_step": 77943, "epoch": 1855} {"train_loss": -6.191488742828369, "global_step": 77944, "epoch": 1855} {"train_loss": -6.019079208374023, "global_step": 77945, "epoch": 1855} {"train_loss": -6.120922565460205, "global_step": 77946, "epoch": 1855} {"train_loss": -5.984257698059082, "global_step": 77947, "epoch": 1855} {"train_loss": -5.981985092163086, "global_step": 77948, "epoch": 1855} {"train_loss": -6.0848388671875, "global_step": 77949, "epoch": 1855} {"train_loss": -6.0705389976501465, "global_step": 77950, "epoch": 1855} {"train_loss": -6.119676374253773, "global_step": 77951, "epoch": 1855, "val_loss": 62812.06640625} {"train_loss": -5.9454345703125, "global_step": 77952, "epoch": 1856} {"train_loss": -6.143610954284668, "global_step": 77953, "epoch": 1856} {"train_loss": -6.001233100891113, "global_step": 77954, "epoch": 1856} {"train_loss": -6.111550807952881, "global_step": 77955, "epoch": 1856} {"train_loss": -5.989727020263672, "global_step": 77956, "epoch": 1856} {"train_loss": -6.103372097015381, "global_step": 77957, "epoch": 1856} {"train_loss": -5.998520851135254, "global_step": 77958, "epoch": 1856} {"train_loss": -6.128554344177246, "global_step": 77959, "epoch": 1856} {"train_loss": -6.081941604614258, "global_step": 77960, "epoch": 1856} {"train_loss": -6.064513206481934, "global_step": 77961, "epoch": 1856} {"train_loss": -6.19295597076416, "global_step": 77962, "epoch": 1856} {"train_loss": -6.164968967437744, "global_step": 77963, "epoch": 1856} {"train_loss": -6.127407073974609, "global_step": 77964, "epoch": 1856} {"train_loss": -6.115869045257568, "global_step": 77965, "epoch": 1856} {"train_loss": -6.149716854095459, "global_step": 77966, "epoch": 1856} {"train_loss": -6.149304389953613, "global_step": 77967, "epoch": 1856} {"train_loss": -6.182464122772217, "global_step": 77968, "epoch": 1856} {"train_loss": -6.070833206176758, "global_step": 77969, "epoch": 1856} {"train_loss": -6.1418914794921875, "global_step": 77970, "epoch": 1856} {"train_loss": -6.01516056060791, "global_step": 77971, "epoch": 1856} {"train_loss": -6.1293439865112305, "global_step": 77972, "epoch": 1856} {"train_loss": -6.1105451583862305, "global_step": 77973, "epoch": 1856} {"train_loss": -6.136858940124512, "global_step": 77974, "epoch": 1856} {"train_loss": -5.972259998321533, "global_step": 77975, "epoch": 1856} {"train_loss": -6.111116409301758, "global_step": 77976, "epoch": 1856} {"train_loss": -5.9627766609191895, "global_step": 77977, "epoch": 1856} {"train_loss": -6.083934307098389, "global_step": 77978, "epoch": 1856} {"train_loss": -6.0447587966918945, "global_step": 77979, "epoch": 1856} {"train_loss": -6.054656028747559, "global_step": 77980, "epoch": 1856} {"train_loss": -6.03288459777832, "global_step": 77981, "epoch": 1856} {"train_loss": -6.089612007141113, "global_step": 77982, "epoch": 1856} {"train_loss": -6.053221225738525, "global_step": 77983, "epoch": 1856} {"train_loss": -6.172122955322266, "global_step": 77984, "epoch": 1856} {"train_loss": -6.078952789306641, "global_step": 77985, "epoch": 1856} {"train_loss": -6.10134220123291, "global_step": 77986, "epoch": 1856} {"train_loss": -6.2519001960754395, "global_step": 77987, "epoch": 1856} {"train_loss": -6.190211296081543, "global_step": 77988, "epoch": 1856} {"train_loss": -6.039684772491455, "global_step": 77989, "epoch": 1856} {"train_loss": -5.988759517669678, "global_step": 77990, "epoch": 1856} {"train_loss": -6.202114105224609, "global_step": 77991, "epoch": 1856} {"train_loss": -5.978557586669922, "global_step": 77992, "epoch": 1856} {"train_loss": -6.088786216009231, "global_step": 77993, "epoch": 1856, "val_loss": 62126.8359375} {"train_loss": -6.047356605529785, "global_step": 77994, "epoch": 1857} {"train_loss": -6.108206748962402, "global_step": 77995, "epoch": 1857} {"train_loss": -6.216395378112793, "global_step": 77996, "epoch": 1857} {"train_loss": -6.196566581726074, "global_step": 77997, "epoch": 1857} {"train_loss": -6.177759170532227, "global_step": 77998, "epoch": 1857} {"train_loss": -6.153114318847656, "global_step": 77999, "epoch": 1857} {"train_loss": -6.068316459655762, "global_step": 78000, "epoch": 1857} {"train_loss": -6.071551322937012, "global_step": 78001, "epoch": 1857} {"train_loss": -6.1217427253723145, "global_step": 78002, "epoch": 1857} {"train_loss": -6.205785751342773, "global_step": 78003, "epoch": 1857} {"train_loss": -6.133390426635742, "global_step": 78004, "epoch": 1857} {"train_loss": -6.160243988037109, "global_step": 78005, "epoch": 1857} {"train_loss": -6.0384063720703125, "global_step": 78006, "epoch": 1857} {"train_loss": -6.081502437591553, "global_step": 78007, "epoch": 1857} {"train_loss": -6.199013710021973, "global_step": 78008, "epoch": 1857} {"train_loss": -6.149140357971191, "global_step": 78009, "epoch": 1857} {"train_loss": -6.105353355407715, "global_step": 78010, "epoch": 1857} {"train_loss": -6.128252983093262, "global_step": 78011, "epoch": 1857} {"train_loss": -6.098451137542725, "global_step": 78012, "epoch": 1857} {"train_loss": -6.184676170349121, "global_step": 78013, "epoch": 1857} {"train_loss": -6.044365406036377, "global_step": 78014, "epoch": 1857} {"train_loss": -6.056468963623047, "global_step": 78015, "epoch": 1857} {"train_loss": -6.197391510009766, "global_step": 78016, "epoch": 1857} {"train_loss": -6.222935199737549, "global_step": 78017, "epoch": 1857} {"train_loss": -6.030719757080078, "global_step": 78018, "epoch": 1857} {"train_loss": -6.031111717224121, "global_step": 78019, "epoch": 1857} {"train_loss": -6.195734024047852, "global_step": 78020, "epoch": 1857} {"train_loss": -6.020536422729492, "global_step": 78021, "epoch": 1857} {"train_loss": -6.165278911590576, "global_step": 78022, "epoch": 1857} {"train_loss": -6.1792826652526855, "global_step": 78023, "epoch": 1857} {"train_loss": -6.226041316986084, "global_step": 78024, "epoch": 1857} {"train_loss": -6.161688804626465, "global_step": 78025, "epoch": 1857} {"train_loss": -6.148608207702637, "global_step": 78026, "epoch": 1857} {"train_loss": -6.058263778686523, "global_step": 78027, "epoch": 1857} {"train_loss": -6.1132965087890625, "global_step": 78028, "epoch": 1857} {"train_loss": -6.033812522888184, "global_step": 78029, "epoch": 1857} {"train_loss": -6.116259574890137, "global_step": 78030, "epoch": 1857} {"train_loss": -5.953385353088379, "global_step": 78031, "epoch": 1857} {"train_loss": -5.963494300842285, "global_step": 78032, "epoch": 1857} {"train_loss": -6.176841735839844, "global_step": 78033, "epoch": 1857} {"train_loss": -5.954341411590576, "global_step": 78034, "epoch": 1857} {"train_loss": -6.110718783878145, "global_step": 78035, "epoch": 1857, "val_loss": 62222.0625} {"train_loss": -5.990296363830566, "global_step": 78036, "epoch": 1858} {"train_loss": -6.11933708190918, "global_step": 78037, "epoch": 1858} {"train_loss": -6.116213321685791, "global_step": 78038, "epoch": 1858} {"train_loss": -6.067006587982178, "global_step": 78039, "epoch": 1858} {"train_loss": -6.085744857788086, "global_step": 78040, "epoch": 1858} {"train_loss": -5.89840030670166, "global_step": 78041, "epoch": 1858} {"train_loss": -6.166583061218262, "global_step": 78042, "epoch": 1858} {"train_loss": -6.079388618469238, "global_step": 78043, "epoch": 1858} {"train_loss": -5.974546432495117, "global_step": 78044, "epoch": 1858} {"train_loss": -6.049963474273682, "global_step": 78045, "epoch": 1858} {"train_loss": -6.203607559204102, "global_step": 78046, "epoch": 1858} {"train_loss": -6.060194969177246, "global_step": 78047, "epoch": 1858} {"train_loss": -6.113206386566162, "global_step": 78048, "epoch": 1858} {"train_loss": -6.112038612365723, "global_step": 78049, "epoch": 1858} {"train_loss": -6.2010040283203125, "global_step": 78050, "epoch": 1858} {"train_loss": -6.153118133544922, "global_step": 78051, "epoch": 1858} {"train_loss": -6.230811595916748, "global_step": 78052, "epoch": 1858} {"train_loss": -6.126375198364258, "global_step": 78053, "epoch": 1858} {"train_loss": -6.219357490539551, "global_step": 78054, "epoch": 1858} {"train_loss": -6.132526874542236, "global_step": 78055, "epoch": 1858} {"train_loss": -6.145526885986328, "global_step": 78056, "epoch": 1858} {"train_loss": -5.961417198181152, "global_step": 78057, "epoch": 1858} {"train_loss": -6.179379940032959, "global_step": 78058, "epoch": 1858} {"train_loss": -6.26848840713501, "global_step": 78059, "epoch": 1858} {"train_loss": -6.161347389221191, "global_step": 78060, "epoch": 1858} {"train_loss": -6.108151435852051, "global_step": 78061, "epoch": 1858} {"train_loss": -6.114297866821289, "global_step": 78062, "epoch": 1858} {"train_loss": -6.074316024780273, "global_step": 78063, "epoch": 1858} {"train_loss": -6.066829681396484, "global_step": 78064, "epoch": 1858} {"train_loss": -6.019321441650391, "global_step": 78065, "epoch": 1858} {"train_loss": -6.222738742828369, "global_step": 78066, "epoch": 1858} {"train_loss": -6.143748760223389, "global_step": 78067, "epoch": 1858} {"train_loss": -6.0705389976501465, "global_step": 78068, "epoch": 1858} {"train_loss": -6.078118324279785, "global_step": 78069, "epoch": 1858} {"train_loss": -6.058405876159668, "global_step": 78070, "epoch": 1858} {"train_loss": -6.197451591491699, "global_step": 78071, "epoch": 1858} {"train_loss": -6.138267517089844, "global_step": 78072, "epoch": 1858} {"train_loss": -6.095211982727051, "global_step": 78073, "epoch": 1858} {"train_loss": -6.072542190551758, "global_step": 78074, "epoch": 1858} {"train_loss": -6.197938919067383, "global_step": 78075, "epoch": 1858} {"train_loss": -6.006316184997559, "global_step": 78076, "epoch": 1858} {"train_loss": -6.1059702805110385, "global_step": 78077, "epoch": 1858, "val_loss": 62350.20703125} {"train_loss": -6.0154523849487305, "global_step": 78078, "epoch": 1859} {"train_loss": -6.178615570068359, "global_step": 78079, "epoch": 1859} {"train_loss": -6.148806095123291, "global_step": 78080, "epoch": 1859} {"train_loss": -6.145961284637451, "global_step": 78081, "epoch": 1859} {"train_loss": -6.178905487060547, "global_step": 78082, "epoch": 1859} {"train_loss": -6.018362045288086, "global_step": 78083, "epoch": 1859} {"train_loss": -6.177300453186035, "global_step": 78084, "epoch": 1859} {"train_loss": -6.212672233581543, "global_step": 78085, "epoch": 1859} {"train_loss": -6.002907752990723, "global_step": 78086, "epoch": 1859} {"train_loss": -6.059893608093262, "global_step": 78087, "epoch": 1859} {"train_loss": -6.1676225662231445, "global_step": 78088, "epoch": 1859} {"train_loss": -6.174703121185303, "global_step": 78089, "epoch": 1859} {"train_loss": -6.041226863861084, "global_step": 78090, "epoch": 1859} {"train_loss": -6.129523277282715, "global_step": 78091, "epoch": 1859} {"train_loss": -6.2433929443359375, "global_step": 78092, "epoch": 1859} {"train_loss": -6.091628551483154, "global_step": 78093, "epoch": 1859} {"train_loss": -6.107375621795654, "global_step": 78094, "epoch": 1859} {"train_loss": -6.2255778312683105, "global_step": 78095, "epoch": 1859} {"train_loss": -6.106192111968994, "global_step": 78096, "epoch": 1859} {"train_loss": -6.195767402648926, "global_step": 78097, "epoch": 1859} {"train_loss": -6.089958190917969, "global_step": 78098, "epoch": 1859} {"train_loss": -6.06120491027832, "global_step": 78099, "epoch": 1859} {"train_loss": -6.075333595275879, "global_step": 78100, "epoch": 1859} {"train_loss": -6.055795192718506, "global_step": 78101, "epoch": 1859} {"train_loss": -6.138633728027344, "global_step": 78102, "epoch": 1859} {"train_loss": -6.150352478027344, "global_step": 78103, "epoch": 1859} {"train_loss": -6.162411689758301, "global_step": 78104, "epoch": 1859} {"train_loss": -6.129222393035889, "global_step": 78105, "epoch": 1859} {"train_loss": -6.164034843444824, "global_step": 78106, "epoch": 1859} {"train_loss": -6.009329795837402, "global_step": 78107, "epoch": 1859} {"train_loss": -6.181591033935547, "global_step": 78108, "epoch": 1859} {"train_loss": -6.084190368652344, "global_step": 78109, "epoch": 1859} {"train_loss": -6.143644332885742, "global_step": 78110, "epoch": 1859} {"train_loss": -6.184391975402832, "global_step": 78111, "epoch": 1859} {"train_loss": -6.208441257476807, "global_step": 78112, "epoch": 1859} {"train_loss": -6.090697288513184, "global_step": 78113, "epoch": 1859} {"train_loss": -6.069236755371094, "global_step": 78114, "epoch": 1859} {"train_loss": -6.171220779418945, "global_step": 78115, "epoch": 1859} {"train_loss": -6.066000461578369, "global_step": 78116, "epoch": 1859} {"train_loss": -5.972733497619629, "global_step": 78117, "epoch": 1859} {"train_loss": -6.079760551452637, "global_step": 78118, "epoch": 1859} {"train_loss": -6.120819171269734, "global_step": 78119, "epoch": 1859, "val_loss": 62164.2265625} {"train_loss": -6.182992458343506, "global_step": 78120, "epoch": 1860} {"train_loss": -6.185603141784668, "global_step": 78121, "epoch": 1860} {"train_loss": -6.100037574768066, "global_step": 78122, "epoch": 1860} {"train_loss": -6.1654438972473145, "global_step": 78123, "epoch": 1860} {"train_loss": -6.086357593536377, "global_step": 78124, "epoch": 1860} {"train_loss": -6.131076812744141, "global_step": 78125, "epoch": 1860} {"train_loss": -6.182765483856201, "global_step": 78126, "epoch": 1860} {"train_loss": -6.124153137207031, "global_step": 78127, "epoch": 1860} {"train_loss": -6.133676528930664, "global_step": 78128, "epoch": 1860} {"train_loss": -6.195463180541992, "global_step": 78129, "epoch": 1860} {"train_loss": -6.174576759338379, "global_step": 78130, "epoch": 1860} {"train_loss": -6.134591579437256, "global_step": 78131, "epoch": 1860} {"train_loss": -6.096514701843262, "global_step": 78132, "epoch": 1860} {"train_loss": -6.06368350982666, "global_step": 78133, "epoch": 1860} {"train_loss": -6.055001735687256, "global_step": 78134, "epoch": 1860} {"train_loss": -6.052992820739746, "global_step": 78135, "epoch": 1860} {"train_loss": -6.066825866699219, "global_step": 78136, "epoch": 1860} {"train_loss": -6.060792922973633, "global_step": 78137, "epoch": 1860} {"train_loss": -6.183300971984863, "global_step": 78138, "epoch": 1860} {"train_loss": -6.213001251220703, "global_step": 78139, "epoch": 1860} {"train_loss": -6.081921100616455, "global_step": 78140, "epoch": 1860} {"train_loss": -6.149497032165527, "global_step": 78141, "epoch": 1860} {"train_loss": -6.074561595916748, "global_step": 78142, "epoch": 1860} {"train_loss": -6.212342262268066, "global_step": 78143, "epoch": 1860} {"train_loss": -6.175857067108154, "global_step": 78144, "epoch": 1860} {"train_loss": -6.086400985717773, "global_step": 78145, "epoch": 1860} {"train_loss": -6.07153844833374, "global_step": 78146, "epoch": 1860} {"train_loss": -6.163351535797119, "global_step": 78147, "epoch": 1860} {"train_loss": -6.158302307128906, "global_step": 78148, "epoch": 1860} {"train_loss": -6.137119293212891, "global_step": 78149, "epoch": 1860} {"train_loss": -6.245721817016602, "global_step": 78150, "epoch": 1860} {"train_loss": -6.142443656921387, "global_step": 78151, "epoch": 1860} {"train_loss": -6.16704797744751, "global_step": 78152, "epoch": 1860} {"train_loss": -6.224693298339844, "global_step": 78153, "epoch": 1860} {"train_loss": -6.033543586730957, "global_step": 78154, "epoch": 1860} {"train_loss": -6.200187683105469, "global_step": 78155, "epoch": 1860} {"train_loss": -6.0131425857543945, "global_step": 78156, "epoch": 1860} {"train_loss": -6.015722274780273, "global_step": 78157, "epoch": 1860} {"train_loss": -6.13494873046875, "global_step": 78158, "epoch": 1860} {"train_loss": -6.0232744216918945, "global_step": 78159, "epoch": 1860} {"train_loss": -6.107101917266846, "global_step": 78160, "epoch": 1860} {"train_loss": -6.1249691645304365, "global_step": 78161, "epoch": 1860, "val_loss": 62275.76953125} {"train_loss": -5.975775718688965, "global_step": 78162, "epoch": 1861} {"train_loss": -6.139763832092285, "global_step": 78163, "epoch": 1861} {"train_loss": -5.989683151245117, "global_step": 78164, "epoch": 1861} {"train_loss": -6.046604633331299, "global_step": 78165, "epoch": 1861} {"train_loss": -5.907460689544678, "global_step": 78166, "epoch": 1861} {"train_loss": -6.146266937255859, "global_step": 78167, "epoch": 1861} {"train_loss": -6.146803855895996, "global_step": 78168, "epoch": 1861} {"train_loss": -6.07125186920166, "global_step": 78169, "epoch": 1861} {"train_loss": -5.979393005371094, "global_step": 78170, "epoch": 1861} {"train_loss": -6.0753045082092285, "global_step": 78171, "epoch": 1861} {"train_loss": -6.276571273803711, "global_step": 78172, "epoch": 1861} {"train_loss": -6.162909984588623, "global_step": 78173, "epoch": 1861} {"train_loss": -6.176407337188721, "global_step": 78174, "epoch": 1861} {"train_loss": -6.10953426361084, "global_step": 78175, "epoch": 1861} {"train_loss": -6.15892219543457, "global_step": 78176, "epoch": 1861} {"train_loss": -6.237770080566406, "global_step": 78177, "epoch": 1861} {"train_loss": -6.116955757141113, "global_step": 78178, "epoch": 1861} {"train_loss": -6.146097183227539, "global_step": 78179, "epoch": 1861} {"train_loss": -6.094785690307617, "global_step": 78180, "epoch": 1861} {"train_loss": -6.1897783279418945, "global_step": 78181, "epoch": 1861} {"train_loss": -6.202569007873535, "global_step": 78182, "epoch": 1861} {"train_loss": -6.18347692489624, "global_step": 78183, "epoch": 1861} {"train_loss": -6.188472270965576, "global_step": 78184, "epoch": 1861} {"train_loss": -6.267266273498535, "global_step": 78185, "epoch": 1861} {"train_loss": -6.1305694580078125, "global_step": 78186, "epoch": 1861} {"train_loss": -6.06220817565918, "global_step": 78187, "epoch": 1861} {"train_loss": -6.172893524169922, "global_step": 78188, "epoch": 1861} {"train_loss": -6.119763374328613, "global_step": 78189, "epoch": 1861} {"train_loss": -6.206252098083496, "global_step": 78190, "epoch": 1861} {"train_loss": -6.1547417640686035, "global_step": 78191, "epoch": 1861} {"train_loss": -6.165676116943359, "global_step": 78192, "epoch": 1861} {"train_loss": -6.088974475860596, "global_step": 78193, "epoch": 1861} {"train_loss": -6.101426601409912, "global_step": 78194, "epoch": 1861} {"train_loss": -6.163966655731201, "global_step": 78195, "epoch": 1861} {"train_loss": -6.0130534172058105, "global_step": 78196, "epoch": 1861} {"train_loss": -6.1934099197387695, "global_step": 78197, "epoch": 1861} {"train_loss": -6.116843223571777, "global_step": 78198, "epoch": 1861} {"train_loss": -5.983964920043945, "global_step": 78199, "epoch": 1861} {"train_loss": -6.168900489807129, "global_step": 78200, "epoch": 1861} {"train_loss": -6.164628982543945, "global_step": 78201, "epoch": 1861} {"train_loss": -6.070379257202148, "global_step": 78202, "epoch": 1861} {"train_loss": -6.125113918667748, "global_step": 78203, "epoch": 1861, "val_loss": 62347.64453125} {"train_loss": -6.294369697570801, "global_step": 78204, "epoch": 1862} {"train_loss": -6.024899482727051, "global_step": 78205, "epoch": 1862} {"train_loss": -5.968515872955322, "global_step": 78206, "epoch": 1862} {"train_loss": -6.1174821853637695, "global_step": 78207, "epoch": 1862} {"train_loss": -6.153881072998047, "global_step": 78208, "epoch": 1862} {"train_loss": -6.109750747680664, "global_step": 78209, "epoch": 1862} {"train_loss": -6.098509788513184, "global_step": 78210, "epoch": 1862} {"train_loss": -6.090693473815918, "global_step": 78211, "epoch": 1862} {"train_loss": -6.06224250793457, "global_step": 78212, "epoch": 1862} {"train_loss": -6.184542655944824, "global_step": 78213, "epoch": 1862} {"train_loss": -6.125221252441406, "global_step": 78214, "epoch": 1862} {"train_loss": -6.019829750061035, "global_step": 78215, "epoch": 1862} {"train_loss": -6.06166410446167, "global_step": 78216, "epoch": 1862} {"train_loss": -6.05854606628418, "global_step": 78217, "epoch": 1862} {"train_loss": -6.153781414031982, "global_step": 78218, "epoch": 1862} {"train_loss": -6.055696964263916, "global_step": 78219, "epoch": 1862} {"train_loss": -6.003902912139893, "global_step": 78220, "epoch": 1862} {"train_loss": -6.115780830383301, "global_step": 78221, "epoch": 1862} {"train_loss": -6.025942802429199, "global_step": 78222, "epoch": 1862} {"train_loss": -6.0982465744018555, "global_step": 78223, "epoch": 1862} {"train_loss": -5.987701892852783, "global_step": 78224, "epoch": 1862} {"train_loss": -6.05299186706543, "global_step": 78225, "epoch": 1862} {"train_loss": -6.032597064971924, "global_step": 78226, "epoch": 1862} {"train_loss": -6.088884353637695, "global_step": 78227, "epoch": 1862} {"train_loss": -6.157253265380859, "global_step": 78228, "epoch": 1862} {"train_loss": -6.128392696380615, "global_step": 78229, "epoch": 1862} {"train_loss": -6.177903175354004, "global_step": 78230, "epoch": 1862} {"train_loss": -6.096018314361572, "global_step": 78231, "epoch": 1862} {"train_loss": -6.104341506958008, "global_step": 78232, "epoch": 1862} {"train_loss": -6.094355583190918, "global_step": 78233, "epoch": 1862} {"train_loss": -6.0617780685424805, "global_step": 78234, "epoch": 1862} {"train_loss": -5.915660858154297, "global_step": 78235, "epoch": 1862} {"train_loss": -6.128283977508545, "global_step": 78236, "epoch": 1862} {"train_loss": -6.26297664642334, "global_step": 78237, "epoch": 1862} {"train_loss": -5.9908294677734375, "global_step": 78238, "epoch": 1862} {"train_loss": -5.920001029968262, "global_step": 78239, "epoch": 1862} {"train_loss": -6.099380970001221, "global_step": 78240, "epoch": 1862} {"train_loss": -6.114171981811523, "global_step": 78241, "epoch": 1862} {"train_loss": -6.129122734069824, "global_step": 78242, "epoch": 1862} {"train_loss": -6.087523460388184, "global_step": 78243, "epoch": 1862} {"train_loss": -5.909120559692383, "global_step": 78244, "epoch": 1862} {"train_loss": -6.084385213397798, "global_step": 78245, "epoch": 1862, "val_loss": 61987.6796875} {"train_loss": -6.153966903686523, "global_step": 78246, "epoch": 1863} {"train_loss": -6.214242935180664, "global_step": 78247, "epoch": 1863} {"train_loss": -6.163752555847168, "global_step": 78248, "epoch": 1863} {"train_loss": -6.114697456359863, "global_step": 78249, "epoch": 1863} {"train_loss": -6.115303039550781, "global_step": 78250, "epoch": 1863} {"train_loss": -6.245273590087891, "global_step": 78251, "epoch": 1863} {"train_loss": -6.117182731628418, "global_step": 78252, "epoch": 1863} {"train_loss": -6.14894962310791, "global_step": 78253, "epoch": 1863} {"train_loss": -6.145263195037842, "global_step": 78254, "epoch": 1863} {"train_loss": -6.231301784515381, "global_step": 78255, "epoch": 1863} {"train_loss": -6.116066932678223, "global_step": 78256, "epoch": 1863} {"train_loss": -6.104144096374512, "global_step": 78257, "epoch": 1863} {"train_loss": -6.12086296081543, "global_step": 78258, "epoch": 1863} {"train_loss": -6.115849494934082, "global_step": 78259, "epoch": 1863} {"train_loss": -6.080746650695801, "global_step": 78260, "epoch": 1863} {"train_loss": -6.091886520385742, "global_step": 78261, "epoch": 1863} {"train_loss": -6.174958229064941, "global_step": 78262, "epoch": 1863} {"train_loss": -6.200480937957764, "global_step": 78263, "epoch": 1863} {"train_loss": -6.181547164916992, "global_step": 78264, "epoch": 1863} {"train_loss": -6.131875514984131, "global_step": 78265, "epoch": 1863} {"train_loss": -6.124831199645996, "global_step": 78266, "epoch": 1863} {"train_loss": -6.118200302124023, "global_step": 78267, "epoch": 1863} {"train_loss": -6.078853607177734, "global_step": 78268, "epoch": 1863} {"train_loss": -6.044859886169434, "global_step": 78269, "epoch": 1863} {"train_loss": -6.118721008300781, "global_step": 78270, "epoch": 1863} {"train_loss": -6.050239562988281, "global_step": 78271, "epoch": 1863} {"train_loss": -6.191595077514648, "global_step": 78272, "epoch": 1863} {"train_loss": -6.150139808654785, "global_step": 78273, "epoch": 1863} {"train_loss": -6.0524983406066895, "global_step": 78274, "epoch": 1863} {"train_loss": -6.082550048828125, "global_step": 78275, "epoch": 1863} {"train_loss": -6.050734519958496, "global_step": 78276, "epoch": 1863} {"train_loss": -6.03007173538208, "global_step": 78277, "epoch": 1863} {"train_loss": -6.153277397155762, "global_step": 78278, "epoch": 1863} {"train_loss": -6.198174476623535, "global_step": 78279, "epoch": 1863} {"train_loss": -6.0990071296691895, "global_step": 78280, "epoch": 1863} {"train_loss": -6.110228538513184, "global_step": 78281, "epoch": 1863} {"train_loss": -6.1545209884643555, "global_step": 78282, "epoch": 1863} {"train_loss": -6.215771675109863, "global_step": 78283, "epoch": 1863} {"train_loss": -6.139559268951416, "global_step": 78284, "epoch": 1863} {"train_loss": -6.033336639404297, "global_step": 78285, "epoch": 1863} {"train_loss": -6.137184143066406, "global_step": 78286, "epoch": 1863} {"train_loss": -6.128998688289097, "global_step": 78287, "epoch": 1863, "val_loss": 62069.703125} {"train_loss": -6.174821853637695, "global_step": 78288, "epoch": 1864} {"train_loss": -6.151845932006836, "global_step": 78289, "epoch": 1864} {"train_loss": -6.160823822021484, "global_step": 78290, "epoch": 1864} {"train_loss": -6.190177917480469, "global_step": 78291, "epoch": 1864} {"train_loss": -6.0682878494262695, "global_step": 78292, "epoch": 1864} {"train_loss": -6.234470367431641, "global_step": 78293, "epoch": 1864} {"train_loss": -6.261384010314941, "global_step": 78294, "epoch": 1864} {"train_loss": -6.088446617126465, "global_step": 78295, "epoch": 1864} {"train_loss": -6.149025917053223, "global_step": 78296, "epoch": 1864} {"train_loss": -6.102686882019043, "global_step": 78297, "epoch": 1864} {"train_loss": -6.15688419342041, "global_step": 78298, "epoch": 1864} {"train_loss": -6.029131889343262, "global_step": 78299, "epoch": 1864} {"train_loss": -6.173467636108398, "global_step": 78300, "epoch": 1864} {"train_loss": -6.219099998474121, "global_step": 78301, "epoch": 1864} {"train_loss": -6.1977128982543945, "global_step": 78302, "epoch": 1864} {"train_loss": -6.027456760406494, "global_step": 78303, "epoch": 1864} {"train_loss": -6.210150718688965, "global_step": 78304, "epoch": 1864} {"train_loss": -6.255440711975098, "global_step": 78305, "epoch": 1864} {"train_loss": -6.238681793212891, "global_step": 78306, "epoch": 1864} {"train_loss": -6.056535720825195, "global_step": 78307, "epoch": 1864} {"train_loss": -6.179775238037109, "global_step": 78308, "epoch": 1864} {"train_loss": -6.196255683898926, "global_step": 78309, "epoch": 1864} {"train_loss": -6.224202632904053, "global_step": 78310, "epoch": 1864} {"train_loss": -6.176999092102051, "global_step": 78311, "epoch": 1864} {"train_loss": -6.066244125366211, "global_step": 78312, "epoch": 1864} {"train_loss": -6.154800891876221, "global_step": 78313, "epoch": 1864} {"train_loss": -6.1437788009643555, "global_step": 78314, "epoch": 1864} {"train_loss": -6.15341854095459, "global_step": 78315, "epoch": 1864} {"train_loss": -6.1720871925354, "global_step": 78316, "epoch": 1864} {"train_loss": -6.223158836364746, "global_step": 78317, "epoch": 1864} {"train_loss": -6.253507614135742, "global_step": 78318, "epoch": 1864} {"train_loss": -6.143260955810547, "global_step": 78319, "epoch": 1864} {"train_loss": -6.068236351013184, "global_step": 78320, "epoch": 1864} {"train_loss": -6.107046127319336, "global_step": 78321, "epoch": 1864} {"train_loss": -6.0367889404296875, "global_step": 78322, "epoch": 1864} {"train_loss": -6.092410087585449, "global_step": 78323, "epoch": 1864} {"train_loss": -6.173272132873535, "global_step": 78324, "epoch": 1864} {"train_loss": -6.096217155456543, "global_step": 78325, "epoch": 1864} {"train_loss": -6.071784973144531, "global_step": 78326, "epoch": 1864} {"train_loss": -6.132308006286621, "global_step": 78327, "epoch": 1864} {"train_loss": -6.244465351104736, "global_step": 78328, "epoch": 1864} {"train_loss": -6.151715165092831, "global_step": 78329, "epoch": 1864, "val_loss": 62060.91796875} {"train_loss": -6.19926118850708, "global_step": 78330, "epoch": 1865} {"train_loss": -6.1991682052612305, "global_step": 78331, "epoch": 1865} {"train_loss": -6.26701021194458, "global_step": 78332, "epoch": 1865} {"train_loss": -6.255919933319092, "global_step": 78333, "epoch": 1865} {"train_loss": -6.068233489990234, "global_step": 78334, "epoch": 1865} {"train_loss": -6.1442365646362305, "global_step": 78335, "epoch": 1865} {"train_loss": -6.237350940704346, "global_step": 78336, "epoch": 1865} {"train_loss": -6.304718971252441, "global_step": 78337, "epoch": 1865} {"train_loss": -6.248556137084961, "global_step": 78338, "epoch": 1865} {"train_loss": -6.178625106811523, "global_step": 78339, "epoch": 1865} {"train_loss": -6.163975715637207, "global_step": 78340, "epoch": 1865} {"train_loss": -6.05790901184082, "global_step": 78341, "epoch": 1865} {"train_loss": -6.1522216796875, "global_step": 78342, "epoch": 1865} {"train_loss": -6.170571327209473, "global_step": 78343, "epoch": 1865} {"train_loss": -6.118823528289795, "global_step": 78344, "epoch": 1865} {"train_loss": -6.273837089538574, "global_step": 78345, "epoch": 1865} {"train_loss": -6.246116638183594, "global_step": 78346, "epoch": 1865} {"train_loss": -6.171248435974121, "global_step": 78347, "epoch": 1865} {"train_loss": -5.990658760070801, "global_step": 78348, "epoch": 1865} {"train_loss": -6.188333034515381, "global_step": 78349, "epoch": 1865} {"train_loss": -6.140232563018799, "global_step": 78350, "epoch": 1865} {"train_loss": -6.1425700187683105, "global_step": 78351, "epoch": 1865} {"train_loss": -6.149184226989746, "global_step": 78352, "epoch": 1865} {"train_loss": -6.172745227813721, "global_step": 78353, "epoch": 1865} {"train_loss": -6.131455421447754, "global_step": 78354, "epoch": 1865} {"train_loss": -6.129402160644531, "global_step": 78355, "epoch": 1865} {"train_loss": -5.954075813293457, "global_step": 78356, "epoch": 1865} {"train_loss": -6.018838882446289, "global_step": 78357, "epoch": 1865} {"train_loss": -6.057111740112305, "global_step": 78358, "epoch": 1865} {"train_loss": -5.961844444274902, "global_step": 78359, "epoch": 1865} {"train_loss": -5.99930477142334, "global_step": 78360, "epoch": 1865} {"train_loss": -6.081841468811035, "global_step": 78361, "epoch": 1865} {"train_loss": -5.965383529663086, "global_step": 78362, "epoch": 1865} {"train_loss": -6.079342365264893, "global_step": 78363, "epoch": 1865} {"train_loss": -6.093906402587891, "global_step": 78364, "epoch": 1865} {"train_loss": -6.16234827041626, "global_step": 78365, "epoch": 1865} {"train_loss": -6.1149702072143555, "global_step": 78366, "epoch": 1865} {"train_loss": -6.200688362121582, "global_step": 78367, "epoch": 1865} {"train_loss": -6.1486616134643555, "global_step": 78368, "epoch": 1865} {"train_loss": -6.22153902053833, "global_step": 78369, "epoch": 1865} {"train_loss": -6.105700492858887, "global_step": 78370, "epoch": 1865} {"train_loss": -6.135716052282424, "global_step": 78371, "epoch": 1865, "val_loss": 62347.80078125} {"train_loss": -6.1680588722229, "global_step": 78372, "epoch": 1866} {"train_loss": -6.133312225341797, "global_step": 78373, "epoch": 1866} {"train_loss": -6.179963111877441, "global_step": 78374, "epoch": 1866} {"train_loss": -6.183091640472412, "global_step": 78375, "epoch": 1866} {"train_loss": -6.22569465637207, "global_step": 78376, "epoch": 1866} {"train_loss": -6.084296703338623, "global_step": 78377, "epoch": 1866} {"train_loss": -6.086909294128418, "global_step": 78378, "epoch": 1866} {"train_loss": -6.173228740692139, "global_step": 78379, "epoch": 1866} {"train_loss": -6.153424263000488, "global_step": 78380, "epoch": 1866} {"train_loss": -6.092655181884766, "global_step": 78381, "epoch": 1866} {"train_loss": -6.174680709838867, "global_step": 78382, "epoch": 1866} {"train_loss": -6.287207126617432, "global_step": 78383, "epoch": 1866} {"train_loss": -6.134832382202148, "global_step": 78384, "epoch": 1866} {"train_loss": -6.157641410827637, "global_step": 78385, "epoch": 1866} {"train_loss": -6.069360256195068, "global_step": 78386, "epoch": 1866} {"train_loss": -6.185370922088623, "global_step": 78387, "epoch": 1866} {"train_loss": -6.31702184677124, "global_step": 78388, "epoch": 1866} {"train_loss": -6.23194694519043, "global_step": 78389, "epoch": 1866} {"train_loss": -6.110346794128418, "global_step": 78390, "epoch": 1866} {"train_loss": -6.187021732330322, "global_step": 78391, "epoch": 1866} {"train_loss": -6.136147499084473, "global_step": 78392, "epoch": 1866} {"train_loss": -6.097010612487793, "global_step": 78393, "epoch": 1866} {"train_loss": -6.188589572906494, "global_step": 78394, "epoch": 1866} {"train_loss": -6.220259189605713, "global_step": 78395, "epoch": 1866} {"train_loss": -6.154082775115967, "global_step": 78396, "epoch": 1866} {"train_loss": -6.110418796539307, "global_step": 78397, "epoch": 1866} {"train_loss": -6.159051895141602, "global_step": 78398, "epoch": 1866} {"train_loss": -6.0641632080078125, "global_step": 78399, "epoch": 1866} {"train_loss": -6.119498252868652, "global_step": 78400, "epoch": 1866} {"train_loss": -6.1642255783081055, "global_step": 78401, "epoch": 1866} {"train_loss": -6.0253682136535645, "global_step": 78402, "epoch": 1866} {"train_loss": -6.082375526428223, "global_step": 78403, "epoch": 1866} {"train_loss": -6.17537260055542, "global_step": 78404, "epoch": 1866} {"train_loss": -5.999820709228516, "global_step": 78405, "epoch": 1866} {"train_loss": -6.113090991973877, "global_step": 78406, "epoch": 1866} {"train_loss": -6.192420959472656, "global_step": 78407, "epoch": 1866} {"train_loss": -6.1927666664123535, "global_step": 78408, "epoch": 1866} {"train_loss": -6.165909767150879, "global_step": 78409, "epoch": 1866} {"train_loss": -6.039764404296875, "global_step": 78410, "epoch": 1866} {"train_loss": -6.041261672973633, "global_step": 78411, "epoch": 1866} {"train_loss": -6.124020576477051, "global_step": 78412, "epoch": 1866} {"train_loss": -6.144137836637951, "global_step": 78413, "epoch": 1866, "val_loss": 62171.60546875} {"train_loss": -6.082758903503418, "global_step": 78414, "epoch": 1867} {"train_loss": -6.089871406555176, "global_step": 78415, "epoch": 1867} {"train_loss": -6.2131266593933105, "global_step": 78416, "epoch": 1867} {"train_loss": -6.156965255737305, "global_step": 78417, "epoch": 1867} {"train_loss": -6.067601203918457, "global_step": 78418, "epoch": 1867} {"train_loss": -6.059700965881348, "global_step": 78419, "epoch": 1867} {"train_loss": -6.08705472946167, "global_step": 78420, "epoch": 1867} {"train_loss": -6.024060249328613, "global_step": 78421, "epoch": 1867} {"train_loss": -6.104308128356934, "global_step": 78422, "epoch": 1867} {"train_loss": -6.080792427062988, "global_step": 78423, "epoch": 1867} {"train_loss": -6.083706378936768, "global_step": 78424, "epoch": 1867} {"train_loss": -6.164037704467773, "global_step": 78425, "epoch": 1867} {"train_loss": -6.058027267456055, "global_step": 78426, "epoch": 1867} {"train_loss": -6.194559097290039, "global_step": 78427, "epoch": 1867} {"train_loss": -6.095888137817383, "global_step": 78428, "epoch": 1867} {"train_loss": -5.982150554656982, "global_step": 78429, "epoch": 1867} {"train_loss": -6.180837631225586, "global_step": 78430, "epoch": 1867} {"train_loss": -6.103006362915039, "global_step": 78431, "epoch": 1867} {"train_loss": -6.075074195861816, "global_step": 78432, "epoch": 1867} {"train_loss": -6.298216819763184, "global_step": 78433, "epoch": 1867} {"train_loss": -6.187283039093018, "global_step": 78434, "epoch": 1867} {"train_loss": -5.986950874328613, "global_step": 78435, "epoch": 1867} {"train_loss": -6.04848051071167, "global_step": 78436, "epoch": 1867} {"train_loss": -5.951613426208496, "global_step": 78437, "epoch": 1867} {"train_loss": -6.1096954345703125, "global_step": 78438, "epoch": 1867} {"train_loss": -6.134984970092773, "global_step": 78439, "epoch": 1867} {"train_loss": -6.1139044761657715, "global_step": 78440, "epoch": 1867} {"train_loss": -6.026185512542725, "global_step": 78441, "epoch": 1867} {"train_loss": -6.025392532348633, "global_step": 78442, "epoch": 1867} {"train_loss": -6.161701202392578, "global_step": 78443, "epoch": 1867} {"train_loss": -6.156745910644531, "global_step": 78444, "epoch": 1867} {"train_loss": -6.073729515075684, "global_step": 78445, "epoch": 1867} {"train_loss": -6.089400768280029, "global_step": 78446, "epoch": 1867} {"train_loss": -6.280524253845215, "global_step": 78447, "epoch": 1867} {"train_loss": -6.163317680358887, "global_step": 78448, "epoch": 1867} {"train_loss": -6.155206680297852, "global_step": 78449, "epoch": 1867} {"train_loss": -6.223013877868652, "global_step": 78450, "epoch": 1867} {"train_loss": -6.086591720581055, "global_step": 78451, "epoch": 1867} {"train_loss": -6.19154691696167, "global_step": 78452, "epoch": 1867} {"train_loss": -5.875393867492676, "global_step": 78453, "epoch": 1867} {"train_loss": -6.035247325897217, "global_step": 78454, "epoch": 1867} {"train_loss": -6.104393720626831, "global_step": 78455, "epoch": 1867, "val_loss": 62506.12109375} {"train_loss": -5.997978210449219, "global_step": 78456, "epoch": 1868} {"train_loss": -6.099836349487305, "global_step": 78457, "epoch": 1868} {"train_loss": -6.057286739349365, "global_step": 78458, "epoch": 1868} {"train_loss": -6.045411109924316, "global_step": 78459, "epoch": 1868} {"train_loss": -6.056550979614258, "global_step": 78460, "epoch": 1868} {"train_loss": -6.038455009460449, "global_step": 78461, "epoch": 1868} {"train_loss": -6.147707939147949, "global_step": 78462, "epoch": 1868} {"train_loss": -5.891079902648926, "global_step": 78463, "epoch": 1868} {"train_loss": -6.0380754470825195, "global_step": 78464, "epoch": 1868} {"train_loss": -6.0837602615356445, "global_step": 78465, "epoch": 1868} {"train_loss": -6.076462745666504, "global_step": 78466, "epoch": 1868} {"train_loss": -6.100711822509766, "global_step": 78467, "epoch": 1868} {"train_loss": -6.196329116821289, "global_step": 78468, "epoch": 1868} {"train_loss": -6.104025840759277, "global_step": 78469, "epoch": 1868} {"train_loss": -5.979541301727295, "global_step": 78470, "epoch": 1868} {"train_loss": -6.085303783416748, "global_step": 78471, "epoch": 1868} {"train_loss": -6.01561975479126, "global_step": 78472, "epoch": 1868} {"train_loss": -6.180899143218994, "global_step": 78473, "epoch": 1868} {"train_loss": -6.178910255432129, "global_step": 78474, "epoch": 1868} {"train_loss": -6.1831207275390625, "global_step": 78475, "epoch": 1868} {"train_loss": -6.12526798248291, "global_step": 78476, "epoch": 1868} {"train_loss": -6.036383628845215, "global_step": 78477, "epoch": 1868} {"train_loss": -6.160196781158447, "global_step": 78478, "epoch": 1868} {"train_loss": -6.132892608642578, "global_step": 78479, "epoch": 1868} {"train_loss": -6.152791500091553, "global_step": 78480, "epoch": 1868} {"train_loss": -6.1539716720581055, "global_step": 78481, "epoch": 1868} {"train_loss": -6.03444766998291, "global_step": 78482, "epoch": 1868} {"train_loss": -6.161543846130371, "global_step": 78483, "epoch": 1868} {"train_loss": -6.163876533508301, "global_step": 78484, "epoch": 1868} {"train_loss": -6.1182146072387695, "global_step": 78485, "epoch": 1868} {"train_loss": -6.161777973175049, "global_step": 78486, "epoch": 1868} {"train_loss": -6.186737060546875, "global_step": 78487, "epoch": 1868} {"train_loss": -6.093380928039551, "global_step": 78488, "epoch": 1868} {"train_loss": -6.133188724517822, "global_step": 78489, "epoch": 1868} {"train_loss": -5.998452663421631, "global_step": 78490, "epoch": 1868} {"train_loss": -6.108431816101074, "global_step": 78491, "epoch": 1868} {"train_loss": -6.200482368469238, "global_step": 78492, "epoch": 1868} {"train_loss": -6.028603553771973, "global_step": 78493, "epoch": 1868} {"train_loss": -6.215579986572266, "global_step": 78494, "epoch": 1868} {"train_loss": -5.969550609588623, "global_step": 78495, "epoch": 1868} {"train_loss": -5.97015380859375, "global_step": 78496, "epoch": 1868} {"train_loss": -6.095011529468355, "global_step": 78497, "epoch": 1868, "val_loss": 62097.765625} {"train_loss": -6.063776969909668, "global_step": 78498, "epoch": 1869} {"train_loss": -6.184223175048828, "global_step": 78499, "epoch": 1869} {"train_loss": -6.165807247161865, "global_step": 78500, "epoch": 1869} {"train_loss": -6.071619987487793, "global_step": 78501, "epoch": 1869} {"train_loss": -6.074359893798828, "global_step": 78502, "epoch": 1869} {"train_loss": -6.209012508392334, "global_step": 78503, "epoch": 1869} {"train_loss": -6.132988929748535, "global_step": 78504, "epoch": 1869} {"train_loss": -6.081963062286377, "global_step": 78505, "epoch": 1869} {"train_loss": -6.142958164215088, "global_step": 78506, "epoch": 1869} {"train_loss": -6.05272102355957, "global_step": 78507, "epoch": 1869} {"train_loss": -6.130321502685547, "global_step": 78508, "epoch": 1869} {"train_loss": -6.107451438903809, "global_step": 78509, "epoch": 1869} {"train_loss": -6.110797882080078, "global_step": 78510, "epoch": 1869} {"train_loss": -6.170730113983154, "global_step": 78511, "epoch": 1869} {"train_loss": -6.287539958953857, "global_step": 78512, "epoch": 1869} {"train_loss": -6.246231555938721, "global_step": 78513, "epoch": 1869} {"train_loss": -6.154847145080566, "global_step": 78514, "epoch": 1869} {"train_loss": -6.1354875564575195, "global_step": 78515, "epoch": 1869} {"train_loss": -6.278360366821289, "global_step": 78516, "epoch": 1869} {"train_loss": -6.217439651489258, "global_step": 78517, "epoch": 1869} {"train_loss": -6.010541915893555, "global_step": 78518, "epoch": 1869} {"train_loss": -6.115787506103516, "global_step": 78519, "epoch": 1869} {"train_loss": -6.102953910827637, "global_step": 78520, "epoch": 1869} {"train_loss": -6.124093055725098, "global_step": 78521, "epoch": 1869} {"train_loss": -6.203355312347412, "global_step": 78522, "epoch": 1869} {"train_loss": -6.112813949584961, "global_step": 78523, "epoch": 1869} {"train_loss": -6.077091217041016, "global_step": 78524, "epoch": 1869} {"train_loss": -6.17356014251709, "global_step": 78525, "epoch": 1869} {"train_loss": -6.010573387145996, "global_step": 78526, "epoch": 1869} {"train_loss": -6.065617561340332, "global_step": 78527, "epoch": 1869} {"train_loss": -6.0216264724731445, "global_step": 78528, "epoch": 1869} {"train_loss": -6.096780776977539, "global_step": 78529, "epoch": 1869} {"train_loss": -6.086732864379883, "global_step": 78530, "epoch": 1869} {"train_loss": -6.223892688751221, "global_step": 78531, "epoch": 1869} {"train_loss": -6.061824321746826, "global_step": 78532, "epoch": 1869} {"train_loss": -6.068511486053467, "global_step": 78533, "epoch": 1869} {"train_loss": -5.96028995513916, "global_step": 78534, "epoch": 1869} {"train_loss": -6.151309490203857, "global_step": 78535, "epoch": 1869} {"train_loss": -6.039280414581299, "global_step": 78536, "epoch": 1869} {"train_loss": -6.065309524536133, "global_step": 78537, "epoch": 1869} {"train_loss": -6.126877784729004, "global_step": 78538, "epoch": 1869} {"train_loss": -6.119935637428647, "global_step": 78539, "epoch": 1869, "val_loss": 62242.6875} {"train_loss": -6.075794219970703, "global_step": 78540, "epoch": 1870} {"train_loss": -6.030250549316406, "global_step": 78541, "epoch": 1870} {"train_loss": -6.157135963439941, "global_step": 78542, "epoch": 1870} {"train_loss": -6.134530067443848, "global_step": 78543, "epoch": 1870} {"train_loss": -6.1459503173828125, "global_step": 78544, "epoch": 1870} {"train_loss": -6.149993419647217, "global_step": 78545, "epoch": 1870} {"train_loss": -6.191318035125732, "global_step": 78546, "epoch": 1870} {"train_loss": -6.1209211349487305, "global_step": 78547, "epoch": 1870} {"train_loss": -6.131416320800781, "global_step": 78548, "epoch": 1870} {"train_loss": -6.245787620544434, "global_step": 78549, "epoch": 1870} {"train_loss": -6.098255157470703, "global_step": 78550, "epoch": 1870} {"train_loss": -6.100200176239014, "global_step": 78551, "epoch": 1870} {"train_loss": -6.097228050231934, "global_step": 78552, "epoch": 1870} {"train_loss": -6.004627227783203, "global_step": 78553, "epoch": 1870} {"train_loss": -6.044112682342529, "global_step": 78554, "epoch": 1870} {"train_loss": -6.095123291015625, "global_step": 78555, "epoch": 1870} {"train_loss": -6.071367263793945, "global_step": 78556, "epoch": 1870} {"train_loss": -6.142918586730957, "global_step": 78557, "epoch": 1870} {"train_loss": -6.151025772094727, "global_step": 78558, "epoch": 1870} {"train_loss": -6.154392719268799, "global_step": 78559, "epoch": 1870} {"train_loss": -6.197607040405273, "global_step": 78560, "epoch": 1870} {"train_loss": -6.220137596130371, "global_step": 78561, "epoch": 1870} {"train_loss": -6.204396724700928, "global_step": 78562, "epoch": 1870} {"train_loss": -6.159384727478027, "global_step": 78563, "epoch": 1870} {"train_loss": -6.141160011291504, "global_step": 78564, "epoch": 1870} {"train_loss": -6.105530738830566, "global_step": 78565, "epoch": 1870} {"train_loss": -6.056088447570801, "global_step": 78566, "epoch": 1870} {"train_loss": -6.23881196975708, "global_step": 78567, "epoch": 1870} {"train_loss": -6.152297019958496, "global_step": 78568, "epoch": 1870} {"train_loss": -6.227623462677002, "global_step": 78569, "epoch": 1870} {"train_loss": -6.151679039001465, "global_step": 78570, "epoch": 1870} {"train_loss": -6.124706268310547, "global_step": 78571, "epoch": 1870} {"train_loss": -6.152820587158203, "global_step": 78572, "epoch": 1870} {"train_loss": -6.081943035125732, "global_step": 78573, "epoch": 1870} {"train_loss": -6.153646469116211, "global_step": 78574, "epoch": 1870} {"train_loss": -6.071488380432129, "global_step": 78575, "epoch": 1870} {"train_loss": -6.134571552276611, "global_step": 78576, "epoch": 1870} {"train_loss": -6.258632659912109, "global_step": 78577, "epoch": 1870} {"train_loss": -6.100439071655273, "global_step": 78578, "epoch": 1870} {"train_loss": -6.124163627624512, "global_step": 78579, "epoch": 1870} {"train_loss": -6.216694355010986, "global_step": 78580, "epoch": 1870} {"train_loss": -6.138788132440476, "global_step": 78581, "epoch": 1870, "val_loss": 62299.59765625} {"train_loss": -6.156759262084961, "global_step": 78582, "epoch": 1871} {"train_loss": -6.106039524078369, "global_step": 78583, "epoch": 1871} {"train_loss": -6.296780586242676, "global_step": 78584, "epoch": 1871} {"train_loss": -6.067989349365234, "global_step": 78585, "epoch": 1871} {"train_loss": -6.045315742492676, "global_step": 78586, "epoch": 1871} {"train_loss": -6.141720771789551, "global_step": 78587, "epoch": 1871} {"train_loss": -6.1153483390808105, "global_step": 78588, "epoch": 1871} {"train_loss": -6.052010536193848, "global_step": 78589, "epoch": 1871} {"train_loss": -6.033992767333984, "global_step": 78590, "epoch": 1871} {"train_loss": -6.088475227355957, "global_step": 78591, "epoch": 1871} {"train_loss": -6.238058090209961, "global_step": 78592, "epoch": 1871} {"train_loss": -6.092499732971191, "global_step": 78593, "epoch": 1871} {"train_loss": -6.065314292907715, "global_step": 78594, "epoch": 1871} {"train_loss": -6.091042518615723, "global_step": 78595, "epoch": 1871} {"train_loss": -6.080208778381348, "global_step": 78596, "epoch": 1871} {"train_loss": -6.2237162590026855, "global_step": 78597, "epoch": 1871} {"train_loss": -6.216330528259277, "global_step": 78598, "epoch": 1871} {"train_loss": -6.107993125915527, "global_step": 78599, "epoch": 1871} {"train_loss": -6.121870994567871, "global_step": 78600, "epoch": 1871} {"train_loss": -6.193704605102539, "global_step": 78601, "epoch": 1871} {"train_loss": -6.166146278381348, "global_step": 78602, "epoch": 1871} {"train_loss": -6.140007495880127, "global_step": 78603, "epoch": 1871} {"train_loss": -6.015557765960693, "global_step": 78604, "epoch": 1871} {"train_loss": -6.082284450531006, "global_step": 78605, "epoch": 1871} {"train_loss": -6.100649833679199, "global_step": 78606, "epoch": 1871} {"train_loss": -6.051454544067383, "global_step": 78607, "epoch": 1871} {"train_loss": -6.121267795562744, "global_step": 78608, "epoch": 1871} {"train_loss": -6.051728248596191, "global_step": 78609, "epoch": 1871} {"train_loss": -6.2013959884643555, "global_step": 78610, "epoch": 1871} {"train_loss": -6.271005630493164, "global_step": 78611, "epoch": 1871} {"train_loss": -6.13459587097168, "global_step": 78612, "epoch": 1871} {"train_loss": -6.137822151184082, "global_step": 78613, "epoch": 1871} {"train_loss": -6.075708389282227, "global_step": 78614, "epoch": 1871} {"train_loss": -6.191365718841553, "global_step": 78615, "epoch": 1871} {"train_loss": -6.261204242706299, "global_step": 78616, "epoch": 1871} {"train_loss": -6.259490013122559, "global_step": 78617, "epoch": 1871} {"train_loss": -6.198122978210449, "global_step": 78618, "epoch": 1871} {"train_loss": -6.291250705718994, "global_step": 78619, "epoch": 1871} {"train_loss": -6.226450443267822, "global_step": 78620, "epoch": 1871} {"train_loss": -6.067536354064941, "global_step": 78621, "epoch": 1871} {"train_loss": -6.192909240722656, "global_step": 78622, "epoch": 1871} {"train_loss": -6.142036903472174, "global_step": 78623, "epoch": 1871, "val_loss": 62330.30078125} {"train_loss": -6.155803203582764, "global_step": 78624, "epoch": 1872} {"train_loss": -6.071459770202637, "global_step": 78625, "epoch": 1872} {"train_loss": -6.040773391723633, "global_step": 78626, "epoch": 1872} {"train_loss": -6.129764556884766, "global_step": 78627, "epoch": 1872} {"train_loss": -6.149655342102051, "global_step": 78628, "epoch": 1872} {"train_loss": -6.14202880859375, "global_step": 78629, "epoch": 1872} {"train_loss": -6.209667205810547, "global_step": 78630, "epoch": 1872} {"train_loss": -6.130257606506348, "global_step": 78631, "epoch": 1872} {"train_loss": -6.052935600280762, "global_step": 78632, "epoch": 1872} {"train_loss": -6.1452741622924805, "global_step": 78633, "epoch": 1872} {"train_loss": -6.069287300109863, "global_step": 78634, "epoch": 1872} {"train_loss": -6.079068183898926, "global_step": 78635, "epoch": 1872} {"train_loss": -6.1235551834106445, "global_step": 78636, "epoch": 1872} {"train_loss": -6.018095970153809, "global_step": 78637, "epoch": 1872} {"train_loss": -6.161777496337891, "global_step": 78638, "epoch": 1872} {"train_loss": -6.291975975036621, "global_step": 78639, "epoch": 1872} {"train_loss": -6.168819427490234, "global_step": 78640, "epoch": 1872} {"train_loss": -6.094011306762695, "global_step": 78641, "epoch": 1872} {"train_loss": -6.123495101928711, "global_step": 78642, "epoch": 1872} {"train_loss": -5.874797821044922, "global_step": 78643, "epoch": 1872} {"train_loss": -6.104282379150391, "global_step": 78644, "epoch": 1872} {"train_loss": -6.0634355545043945, "global_step": 78645, "epoch": 1872} {"train_loss": -6.098441123962402, "global_step": 78646, "epoch": 1872} {"train_loss": -6.087014198303223, "global_step": 78647, "epoch": 1872} {"train_loss": -5.9090576171875, "global_step": 78648, "epoch": 1872} {"train_loss": -6.058176040649414, "global_step": 78649, "epoch": 1872} {"train_loss": -6.040350914001465, "global_step": 78650, "epoch": 1872} {"train_loss": -6.130014896392822, "global_step": 78651, "epoch": 1872} {"train_loss": -6.031845569610596, "global_step": 78652, "epoch": 1872} {"train_loss": -6.079026222229004, "global_step": 78653, "epoch": 1872} {"train_loss": -6.044456481933594, "global_step": 78654, "epoch": 1872} {"train_loss": -6.0687456130981445, "global_step": 78655, "epoch": 1872} {"train_loss": -6.064116954803467, "global_step": 78656, "epoch": 1872} {"train_loss": -6.100102424621582, "global_step": 78657, "epoch": 1872} {"train_loss": -6.189059734344482, "global_step": 78658, "epoch": 1872} {"train_loss": -6.067776679992676, "global_step": 78659, "epoch": 1872} {"train_loss": -6.113391876220703, "global_step": 78660, "epoch": 1872} {"train_loss": -6.175534725189209, "global_step": 78661, "epoch": 1872} {"train_loss": -6.0826826095581055, "global_step": 78662, "epoch": 1872} {"train_loss": -6.182448863983154, "global_step": 78663, "epoch": 1872} {"train_loss": -6.147912979125977, "global_step": 78664, "epoch": 1872} {"train_loss": -6.09874829791841, "global_step": 78665, "epoch": 1872, "val_loss": 62031.0546875} {"train_loss": -6.183815956115723, "global_step": 78666, "epoch": 1873} {"train_loss": -6.107256889343262, "global_step": 78667, "epoch": 1873} {"train_loss": -6.223508834838867, "global_step": 78668, "epoch": 1873} {"train_loss": -6.164018630981445, "global_step": 78669, "epoch": 1873} {"train_loss": -6.143375396728516, "global_step": 78670, "epoch": 1873} {"train_loss": -6.112562656402588, "global_step": 78671, "epoch": 1873} {"train_loss": -6.143258094787598, "global_step": 78672, "epoch": 1873} {"train_loss": -6.091704368591309, "global_step": 78673, "epoch": 1873} {"train_loss": -6.085508823394775, "global_step": 78674, "epoch": 1873} {"train_loss": -6.14285945892334, "global_step": 78675, "epoch": 1873} {"train_loss": -6.063997268676758, "global_step": 78676, "epoch": 1873} {"train_loss": -6.08020544052124, "global_step": 78677, "epoch": 1873} {"train_loss": -6.124665260314941, "global_step": 78678, "epoch": 1873} {"train_loss": -6.007259845733643, "global_step": 78679, "epoch": 1873} {"train_loss": -6.124680519104004, "global_step": 78680, "epoch": 1873} {"train_loss": -6.0493879318237305, "global_step": 78681, "epoch": 1873} {"train_loss": -6.268703460693359, "global_step": 78682, "epoch": 1873} {"train_loss": -6.022438049316406, "global_step": 78683, "epoch": 1873} {"train_loss": -6.100374221801758, "global_step": 78684, "epoch": 1873} {"train_loss": -6.222452163696289, "global_step": 78685, "epoch": 1873} {"train_loss": -6.1941728591918945, "global_step": 78686, "epoch": 1873} {"train_loss": -6.135396957397461, "global_step": 78687, "epoch": 1873} {"train_loss": -6.176300525665283, "global_step": 78688, "epoch": 1873} {"train_loss": -6.14248514175415, "global_step": 78689, "epoch": 1873} {"train_loss": -6.117306709289551, "global_step": 78690, "epoch": 1873} {"train_loss": -6.0178022384643555, "global_step": 78691, "epoch": 1873} {"train_loss": -6.130142688751221, "global_step": 78692, "epoch": 1873} {"train_loss": -6.177951812744141, "global_step": 78693, "epoch": 1873} {"train_loss": -6.127647399902344, "global_step": 78694, "epoch": 1873} {"train_loss": -5.975391387939453, "global_step": 78695, "epoch": 1873} {"train_loss": -6.070535659790039, "global_step": 78696, "epoch": 1873} {"train_loss": -6.056934356689453, "global_step": 78697, "epoch": 1873} {"train_loss": -6.053745746612549, "global_step": 78698, "epoch": 1873} {"train_loss": -6.0765533447265625, "global_step": 78699, "epoch": 1873} {"train_loss": -6.171187400817871, "global_step": 78700, "epoch": 1873} {"train_loss": -6.1531829833984375, "global_step": 78701, "epoch": 1873} {"train_loss": -5.9878339767456055, "global_step": 78702, "epoch": 1873} {"train_loss": -6.046811580657959, "global_step": 78703, "epoch": 1873} {"train_loss": -6.010495185852051, "global_step": 78704, "epoch": 1873} {"train_loss": -6.169449806213379, "global_step": 78705, "epoch": 1873} {"train_loss": -6.105246543884277, "global_step": 78706, "epoch": 1873} {"train_loss": -6.110258374895368, "global_step": 78707, "epoch": 1873, "val_loss": 62075.37890625} {"train_loss": -6.210582733154297, "global_step": 78708, "epoch": 1874} {"train_loss": -6.044180393218994, "global_step": 78709, "epoch": 1874} {"train_loss": -6.186054229736328, "global_step": 78710, "epoch": 1874} {"train_loss": -6.099560737609863, "global_step": 78711, "epoch": 1874} {"train_loss": -6.037469863891602, "global_step": 78712, "epoch": 1874} {"train_loss": -6.122086524963379, "global_step": 78713, "epoch": 1874} {"train_loss": -6.195697784423828, "global_step": 78714, "epoch": 1874} {"train_loss": -6.158733367919922, "global_step": 78715, "epoch": 1874} {"train_loss": -6.146196365356445, "global_step": 78716, "epoch": 1874} {"train_loss": -6.087652683258057, "global_step": 78717, "epoch": 1874} {"train_loss": -6.0525078773498535, "global_step": 78718, "epoch": 1874} {"train_loss": -6.094088554382324, "global_step": 78719, "epoch": 1874} {"train_loss": -6.105247497558594, "global_step": 78720, "epoch": 1874} {"train_loss": -6.163118362426758, "global_step": 78721, "epoch": 1874} {"train_loss": -6.098245143890381, "global_step": 78722, "epoch": 1874} {"train_loss": -6.215143203735352, "global_step": 78723, "epoch": 1874} {"train_loss": -6.086434364318848, "global_step": 78724, "epoch": 1874} {"train_loss": -6.054399013519287, "global_step": 78725, "epoch": 1874} {"train_loss": -6.126713752746582, "global_step": 78726, "epoch": 1874} {"train_loss": -6.196859359741211, "global_step": 78727, "epoch": 1874} {"train_loss": -6.056637763977051, "global_step": 78728, "epoch": 1874} {"train_loss": -6.129719257354736, "global_step": 78729, "epoch": 1874} {"train_loss": -6.088343620300293, "global_step": 78730, "epoch": 1874} {"train_loss": -6.174736022949219, "global_step": 78731, "epoch": 1874} {"train_loss": -6.162067413330078, "global_step": 78732, "epoch": 1874} {"train_loss": -6.176352024078369, "global_step": 78733, "epoch": 1874} {"train_loss": -6.062243938446045, "global_step": 78734, "epoch": 1874} {"train_loss": -6.148496627807617, "global_step": 78735, "epoch": 1874} {"train_loss": -6.336827754974365, "global_step": 78736, "epoch": 1874} {"train_loss": -6.127399921417236, "global_step": 78737, "epoch": 1874} {"train_loss": -6.13369083404541, "global_step": 78738, "epoch": 1874} {"train_loss": -6.1927032470703125, "global_step": 78739, "epoch": 1874} {"train_loss": -6.053851127624512, "global_step": 78740, "epoch": 1874} {"train_loss": -6.046845436096191, "global_step": 78741, "epoch": 1874} {"train_loss": -6.145119667053223, "global_step": 78742, "epoch": 1874} {"train_loss": -6.136940956115723, "global_step": 78743, "epoch": 1874} {"train_loss": -6.199174880981445, "global_step": 78744, "epoch": 1874} {"train_loss": -6.239823341369629, "global_step": 78745, "epoch": 1874} {"train_loss": -6.216228485107422, "global_step": 78746, "epoch": 1874} {"train_loss": -6.077211380004883, "global_step": 78747, "epoch": 1874} {"train_loss": -6.150047302246094, "global_step": 78748, "epoch": 1874} {"train_loss": -6.132961670557658, "global_step": 78749, "epoch": 1874, "val_loss": 62282.15234375} {"train_loss": -6.201228141784668, "global_step": 78750, "epoch": 1875} {"train_loss": -6.101151466369629, "global_step": 78751, "epoch": 1875} {"train_loss": -6.159862518310547, "global_step": 78752, "epoch": 1875} {"train_loss": -6.139238357543945, "global_step": 78753, "epoch": 1875} {"train_loss": -6.119833946228027, "global_step": 78754, "epoch": 1875} {"train_loss": -6.120700836181641, "global_step": 78755, "epoch": 1875} {"train_loss": -6.076284885406494, "global_step": 78756, "epoch": 1875} {"train_loss": -6.137319087982178, "global_step": 78757, "epoch": 1875} {"train_loss": -6.034564971923828, "global_step": 78758, "epoch": 1875} {"train_loss": -5.900306701660156, "global_step": 78759, "epoch": 1875} {"train_loss": -6.055624008178711, "global_step": 78760, "epoch": 1875} {"train_loss": -6.0643205642700195, "global_step": 78761, "epoch": 1875} {"train_loss": -6.083605766296387, "global_step": 78762, "epoch": 1875} {"train_loss": -6.028373718261719, "global_step": 78763, "epoch": 1875} {"train_loss": -6.1107892990112305, "global_step": 78764, "epoch": 1875} {"train_loss": -6.096051216125488, "global_step": 78765, "epoch": 1875} {"train_loss": -6.087398052215576, "global_step": 78766, "epoch": 1875} {"train_loss": -6.141712665557861, "global_step": 78767, "epoch": 1875} {"train_loss": -6.100960731506348, "global_step": 78768, "epoch": 1875} {"train_loss": -5.9908905029296875, "global_step": 78769, "epoch": 1875} {"train_loss": -6.109757423400879, "global_step": 78770, "epoch": 1875} {"train_loss": -6.195334434509277, "global_step": 78771, "epoch": 1875} {"train_loss": -6.182849407196045, "global_step": 78772, "epoch": 1875} {"train_loss": -6.1797776222229, "global_step": 78773, "epoch": 1875} {"train_loss": -6.058615684509277, "global_step": 78774, "epoch": 1875} {"train_loss": -6.074972152709961, "global_step": 78775, "epoch": 1875} {"train_loss": -6.044193744659424, "global_step": 78776, "epoch": 1875} {"train_loss": -6.147183895111084, "global_step": 78777, "epoch": 1875} {"train_loss": -6.272322177886963, "global_step": 78778, "epoch": 1875} {"train_loss": -6.130367279052734, "global_step": 78779, "epoch": 1875} {"train_loss": -6.045987129211426, "global_step": 78780, "epoch": 1875} {"train_loss": -6.0827717781066895, "global_step": 78781, "epoch": 1875} {"train_loss": -6.060869216918945, "global_step": 78782, "epoch": 1875} {"train_loss": -6.031996726989746, "global_step": 78783, "epoch": 1875} {"train_loss": -6.05902624130249, "global_step": 78784, "epoch": 1875} {"train_loss": -6.131429672241211, "global_step": 78785, "epoch": 1875} {"train_loss": -6.086286544799805, "global_step": 78786, "epoch": 1875} {"train_loss": -6.262085914611816, "global_step": 78787, "epoch": 1875} {"train_loss": -6.103553771972656, "global_step": 78788, "epoch": 1875} {"train_loss": -6.131951808929443, "global_step": 78789, "epoch": 1875} {"train_loss": -6.130061149597168, "global_step": 78790, "epoch": 1875} {"train_loss": -6.1028809660956975, "global_step": 78791, "epoch": 1875, "val_loss": 62081.2421875} {"train_loss": -6.157731533050537, "global_step": 78792, "epoch": 1876} {"train_loss": -6.178176403045654, "global_step": 78793, "epoch": 1876} {"train_loss": -6.036962985992432, "global_step": 78794, "epoch": 1876} {"train_loss": -6.123213291168213, "global_step": 78795, "epoch": 1876} {"train_loss": -6.168476104736328, "global_step": 78796, "epoch": 1876} {"train_loss": -6.043485164642334, "global_step": 78797, "epoch": 1876} {"train_loss": -6.160972595214844, "global_step": 78798, "epoch": 1876} {"train_loss": -6.14593505859375, "global_step": 78799, "epoch": 1876} {"train_loss": -6.0369415283203125, "global_step": 78800, "epoch": 1876} {"train_loss": -6.218681335449219, "global_step": 78801, "epoch": 1876} {"train_loss": -6.099541664123535, "global_step": 78802, "epoch": 1876} {"train_loss": -6.050533771514893, "global_step": 78803, "epoch": 1876} {"train_loss": -6.204007148742676, "global_step": 78804, "epoch": 1876} {"train_loss": -6.130569934844971, "global_step": 78805, "epoch": 1876} {"train_loss": -6.150234222412109, "global_step": 78806, "epoch": 1876} {"train_loss": -6.15036678314209, "global_step": 78807, "epoch": 1876} {"train_loss": -6.00862455368042, "global_step": 78808, "epoch": 1876} {"train_loss": -6.079782962799072, "global_step": 78809, "epoch": 1876} {"train_loss": -6.098875999450684, "global_step": 78810, "epoch": 1876} {"train_loss": -6.066654205322266, "global_step": 78811, "epoch": 1876} {"train_loss": -6.182226657867432, "global_step": 78812, "epoch": 1876} {"train_loss": -6.154043197631836, "global_step": 78813, "epoch": 1876} {"train_loss": -6.081118583679199, "global_step": 78814, "epoch": 1876} {"train_loss": -6.182854652404785, "global_step": 78815, "epoch": 1876} {"train_loss": -6.232995510101318, "global_step": 78816, "epoch": 1876} {"train_loss": -6.0571370124816895, "global_step": 78817, "epoch": 1876} {"train_loss": -6.1721296310424805, "global_step": 78818, "epoch": 1876} {"train_loss": -6.049637794494629, "global_step": 78819, "epoch": 1876} {"train_loss": -6.208754539489746, "global_step": 78820, "epoch": 1876} {"train_loss": -6.013523101806641, "global_step": 78821, "epoch": 1876} {"train_loss": -6.179888725280762, "global_step": 78822, "epoch": 1876} {"train_loss": -6.259376525878906, "global_step": 78823, "epoch": 1876} {"train_loss": -6.079544544219971, "global_step": 78824, "epoch": 1876} {"train_loss": -6.177109718322754, "global_step": 78825, "epoch": 1876} {"train_loss": -6.075312614440918, "global_step": 78826, "epoch": 1876} {"train_loss": -5.999062538146973, "global_step": 78827, "epoch": 1876} {"train_loss": -6.099244594573975, "global_step": 78828, "epoch": 1876} {"train_loss": -6.068843841552734, "global_step": 78829, "epoch": 1876} {"train_loss": -6.137209415435791, "global_step": 78830, "epoch": 1876} {"train_loss": -6.147233486175537, "global_step": 78831, "epoch": 1876} {"train_loss": -6.216086387634277, "global_step": 78832, "epoch": 1876} {"train_loss": -6.122944570723034, "global_step": 78833, "epoch": 1876, "val_loss": 62286.390625} {"train_loss": -6.088992118835449, "global_step": 78834, "epoch": 1877} {"train_loss": -6.109572410583496, "global_step": 78835, "epoch": 1877} {"train_loss": -6.105775833129883, "global_step": 78836, "epoch": 1877} {"train_loss": -6.099316596984863, "global_step": 78837, "epoch": 1877} {"train_loss": -6.216524124145508, "global_step": 78838, "epoch": 1877} {"train_loss": -6.064284324645996, "global_step": 78839, "epoch": 1877} {"train_loss": -6.168985366821289, "global_step": 78840, "epoch": 1877} {"train_loss": -6.008813858032227, "global_step": 78841, "epoch": 1877} {"train_loss": -6.102639198303223, "global_step": 78842, "epoch": 1877} {"train_loss": -6.06378698348999, "global_step": 78843, "epoch": 1877} {"train_loss": -6.173493385314941, "global_step": 78844, "epoch": 1877} {"train_loss": -6.088164329528809, "global_step": 78845, "epoch": 1877} {"train_loss": -6.028935432434082, "global_step": 78846, "epoch": 1877} {"train_loss": -6.145511150360107, "global_step": 78847, "epoch": 1877} {"train_loss": -5.99969482421875, "global_step": 78848, "epoch": 1877} {"train_loss": -6.153879165649414, "global_step": 78849, "epoch": 1877} {"train_loss": -6.220676422119141, "global_step": 78850, "epoch": 1877} {"train_loss": -6.20078182220459, "global_step": 78851, "epoch": 1877} {"train_loss": -6.162961006164551, "global_step": 78852, "epoch": 1877} {"train_loss": -6.149598598480225, "global_step": 78853, "epoch": 1877} {"train_loss": -6.201857089996338, "global_step": 78854, "epoch": 1877} {"train_loss": -6.151543617248535, "global_step": 78855, "epoch": 1877} {"train_loss": -6.272978782653809, "global_step": 78856, "epoch": 1877} {"train_loss": -6.1994309425354, "global_step": 78857, "epoch": 1877} {"train_loss": -6.2080535888671875, "global_step": 78858, "epoch": 1877} {"train_loss": -6.177048206329346, "global_step": 78859, "epoch": 1877} {"train_loss": -6.171740531921387, "global_step": 78860, "epoch": 1877} {"train_loss": -6.239381790161133, "global_step": 78861, "epoch": 1877} {"train_loss": -6.245658874511719, "global_step": 78862, "epoch": 1877} {"train_loss": -6.2232561111450195, "global_step": 78863, "epoch": 1877} {"train_loss": -6.2054338455200195, "global_step": 78864, "epoch": 1877} {"train_loss": -6.13339900970459, "global_step": 78865, "epoch": 1877} {"train_loss": -6.148791313171387, "global_step": 78866, "epoch": 1877} {"train_loss": -6.248281955718994, "global_step": 78867, "epoch": 1877} {"train_loss": -6.188346862792969, "global_step": 78868, "epoch": 1877} {"train_loss": -6.107687473297119, "global_step": 78869, "epoch": 1877} {"train_loss": -6.131067752838135, "global_step": 78870, "epoch": 1877} {"train_loss": -6.064053058624268, "global_step": 78871, "epoch": 1877} {"train_loss": -6.136469841003418, "global_step": 78872, "epoch": 1877} {"train_loss": -6.109252452850342, "global_step": 78873, "epoch": 1877} {"train_loss": -6.083317756652832, "global_step": 78874, "epoch": 1877} {"train_loss": -6.143173705963862, "global_step": 78875, "epoch": 1877, "val_loss": 62126.640625} {"train_loss": -6.194240093231201, "global_step": 78876, "epoch": 1878} {"train_loss": -6.091526508331299, "global_step": 78877, "epoch": 1878} {"train_loss": -6.094564914703369, "global_step": 78878, "epoch": 1878} {"train_loss": -6.1481733322143555, "global_step": 78879, "epoch": 1878} {"train_loss": -6.129990577697754, "global_step": 78880, "epoch": 1878} {"train_loss": -6.240209579467773, "global_step": 78881, "epoch": 1878} {"train_loss": -6.182343482971191, "global_step": 78882, "epoch": 1878} {"train_loss": -6.079553127288818, "global_step": 78883, "epoch": 1878} {"train_loss": -6.027209281921387, "global_step": 78884, "epoch": 1878} {"train_loss": -6.153736114501953, "global_step": 78885, "epoch": 1878} {"train_loss": -6.1180219650268555, "global_step": 78886, "epoch": 1878} {"train_loss": -6.094482898712158, "global_step": 78887, "epoch": 1878} {"train_loss": -6.0149827003479, "global_step": 78888, "epoch": 1878} {"train_loss": -6.162447929382324, "global_step": 78889, "epoch": 1878} {"train_loss": -6.0471014976501465, "global_step": 78890, "epoch": 1878} {"train_loss": -6.135405540466309, "global_step": 78891, "epoch": 1878} {"train_loss": -6.159812927246094, "global_step": 78892, "epoch": 1878} {"train_loss": -6.070201396942139, "global_step": 78893, "epoch": 1878} {"train_loss": -6.095298767089844, "global_step": 78894, "epoch": 1878} {"train_loss": -6.126270771026611, "global_step": 78895, "epoch": 1878} {"train_loss": -6.102899074554443, "global_step": 78896, "epoch": 1878} {"train_loss": -6.129448413848877, "global_step": 78897, "epoch": 1878} {"train_loss": -6.159708023071289, "global_step": 78898, "epoch": 1878} {"train_loss": -6.214500427246094, "global_step": 78899, "epoch": 1878} {"train_loss": -6.206601142883301, "global_step": 78900, "epoch": 1878} {"train_loss": -6.005400657653809, "global_step": 78901, "epoch": 1878} {"train_loss": -6.210094451904297, "global_step": 78902, "epoch": 1878} {"train_loss": -6.062895774841309, "global_step": 78903, "epoch": 1878} {"train_loss": -6.210217475891113, "global_step": 78904, "epoch": 1878} {"train_loss": -6.183841705322266, "global_step": 78905, "epoch": 1878} {"train_loss": -6.092897415161133, "global_step": 78906, "epoch": 1878} {"train_loss": -6.069040298461914, "global_step": 78907, "epoch": 1878} {"train_loss": -6.235313415527344, "global_step": 78908, "epoch": 1878} {"train_loss": -6.022226333618164, "global_step": 78909, "epoch": 1878} {"train_loss": -5.994724750518799, "global_step": 78910, "epoch": 1878} {"train_loss": -6.1992034912109375, "global_step": 78911, "epoch": 1878} {"train_loss": -6.061916351318359, "global_step": 78912, "epoch": 1878} {"train_loss": -6.048564910888672, "global_step": 78913, "epoch": 1878} {"train_loss": -6.153709411621094, "global_step": 78914, "epoch": 1878} {"train_loss": -5.977105140686035, "global_step": 78915, "epoch": 1878} {"train_loss": -6.07232666015625, "global_step": 78916, "epoch": 1878} {"train_loss": -6.115302210762387, "global_step": 78917, "epoch": 1878, "val_loss": 62389.56640625} {"train_loss": -6.043599605560303, "global_step": 78918, "epoch": 1879} {"train_loss": -6.131114482879639, "global_step": 78919, "epoch": 1879} {"train_loss": -6.093164443969727, "global_step": 78920, "epoch": 1879} {"train_loss": -6.215359687805176, "global_step": 78921, "epoch": 1879} {"train_loss": -6.0173659324646, "global_step": 78922, "epoch": 1879} {"train_loss": -6.205954551696777, "global_step": 78923, "epoch": 1879} {"train_loss": -6.0293474197387695, "global_step": 78924, "epoch": 1879} {"train_loss": -6.0496063232421875, "global_step": 78925, "epoch": 1879} {"train_loss": -5.99383544921875, "global_step": 78926, "epoch": 1879} {"train_loss": -6.057453155517578, "global_step": 78927, "epoch": 1879} {"train_loss": -6.0775980949401855, "global_step": 78928, "epoch": 1879} {"train_loss": -6.18199348449707, "global_step": 78929, "epoch": 1879} {"train_loss": -6.090384483337402, "global_step": 78930, "epoch": 1879} {"train_loss": -6.09921932220459, "global_step": 78931, "epoch": 1879} {"train_loss": -5.956818580627441, "global_step": 78932, "epoch": 1879} {"train_loss": -6.166261672973633, "global_step": 78933, "epoch": 1879} {"train_loss": -6.049035549163818, "global_step": 78934, "epoch": 1879} {"train_loss": -6.191363334655762, "global_step": 78935, "epoch": 1879} {"train_loss": -6.107452392578125, "global_step": 78936, "epoch": 1879} {"train_loss": -6.021087169647217, "global_step": 78937, "epoch": 1879} {"train_loss": -6.100595474243164, "global_step": 78938, "epoch": 1879} {"train_loss": -6.15960693359375, "global_step": 78939, "epoch": 1879} {"train_loss": -6.108809471130371, "global_step": 78940, "epoch": 1879} {"train_loss": -6.161418914794922, "global_step": 78941, "epoch": 1879} {"train_loss": -5.985714912414551, "global_step": 78942, "epoch": 1879} {"train_loss": -6.156700134277344, "global_step": 78943, "epoch": 1879} {"train_loss": -5.9131999015808105, "global_step": 78944, "epoch": 1879} {"train_loss": -6.131371021270752, "global_step": 78945, "epoch": 1879} {"train_loss": -6.154240608215332, "global_step": 78946, "epoch": 1879} {"train_loss": -6.046854496002197, "global_step": 78947, "epoch": 1879} {"train_loss": -6.189565658569336, "global_step": 78948, "epoch": 1879} {"train_loss": -5.996848106384277, "global_step": 78949, "epoch": 1879} {"train_loss": -6.129253387451172, "global_step": 78950, "epoch": 1879} {"train_loss": -6.090818405151367, "global_step": 78951, "epoch": 1879} {"train_loss": -6.143896102905273, "global_step": 78952, "epoch": 1879} {"train_loss": -6.201202392578125, "global_step": 78953, "epoch": 1879} {"train_loss": -6.17839241027832, "global_step": 78954, "epoch": 1879} {"train_loss": -6.088715553283691, "global_step": 78955, "epoch": 1879} {"train_loss": -6.178467750549316, "global_step": 78956, "epoch": 1879} {"train_loss": -6.183708190917969, "global_step": 78957, "epoch": 1879} {"train_loss": -6.149071216583252, "global_step": 78958, "epoch": 1879} {"train_loss": -6.104511646997361, "global_step": 78959, "epoch": 1879, "val_loss": 61963.9296875} {"train_loss": -6.161868095397949, "global_step": 78960, "epoch": 1880} {"train_loss": -6.109364986419678, "global_step": 78961, "epoch": 1880} {"train_loss": -6.161264419555664, "global_step": 78962, "epoch": 1880} {"train_loss": -6.168346405029297, "global_step": 78963, "epoch": 1880} {"train_loss": -5.973790168762207, "global_step": 78964, "epoch": 1880} {"train_loss": -6.093706130981445, "global_step": 78965, "epoch": 1880} {"train_loss": -6.102791786193848, "global_step": 78966, "epoch": 1880} {"train_loss": -6.074958801269531, "global_step": 78967, "epoch": 1880} {"train_loss": -6.162111282348633, "global_step": 78968, "epoch": 1880} {"train_loss": -6.102304458618164, "global_step": 78969, "epoch": 1880} {"train_loss": -6.16342830657959, "global_step": 78970, "epoch": 1880} {"train_loss": -6.174894332885742, "global_step": 78971, "epoch": 1880} {"train_loss": -6.115058898925781, "global_step": 78972, "epoch": 1880} {"train_loss": -6.162168502807617, "global_step": 78973, "epoch": 1880} {"train_loss": -6.0264506340026855, "global_step": 78974, "epoch": 1880} {"train_loss": -5.998061656951904, "global_step": 78975, "epoch": 1880} {"train_loss": -6.163384437561035, "global_step": 78976, "epoch": 1880} {"train_loss": -6.141729354858398, "global_step": 78977, "epoch": 1880} {"train_loss": -6.158961296081543, "global_step": 78978, "epoch": 1880} {"train_loss": -6.069993019104004, "global_step": 78979, "epoch": 1880} {"train_loss": -6.21859073638916, "global_step": 78980, "epoch": 1880} {"train_loss": -6.018319129943848, "global_step": 78981, "epoch": 1880} {"train_loss": -6.2191362380981445, "global_step": 78982, "epoch": 1880} {"train_loss": -6.064720153808594, "global_step": 78983, "epoch": 1880} {"train_loss": -6.09159517288208, "global_step": 78984, "epoch": 1880} {"train_loss": -6.230939865112305, "global_step": 78985, "epoch": 1880} {"train_loss": -6.132779121398926, "global_step": 78986, "epoch": 1880} {"train_loss": -6.245347499847412, "global_step": 78987, "epoch": 1880} {"train_loss": -6.057552814483643, "global_step": 78988, "epoch": 1880} {"train_loss": -6.138850212097168, "global_step": 78989, "epoch": 1880} {"train_loss": -6.040062427520752, "global_step": 78990, "epoch": 1880} {"train_loss": -6.093972682952881, "global_step": 78991, "epoch": 1880} {"train_loss": -5.995368480682373, "global_step": 78992, "epoch": 1880} {"train_loss": -6.139091491699219, "global_step": 78993, "epoch": 1880} {"train_loss": -6.056881427764893, "global_step": 78994, "epoch": 1880} {"train_loss": -6.036696434020996, "global_step": 78995, "epoch": 1880} {"train_loss": -6.090089797973633, "global_step": 78996, "epoch": 1880} {"train_loss": -6.172361373901367, "global_step": 78997, "epoch": 1880} {"train_loss": -6.241586685180664, "global_step": 78998, "epoch": 1880} {"train_loss": -6.166084289550781, "global_step": 78999, "epoch": 1880} {"train_loss": -6.032853126525879, "global_step": 79000, "epoch": 1880} {"train_loss": -6.119004363105411, "global_step": 79001, "epoch": 1880, "val_loss": 62181.66796875} {"train_loss": -6.203617095947266, "global_step": 79002, "epoch": 1881} {"train_loss": -6.118623733520508, "global_step": 79003, "epoch": 1881} {"train_loss": -6.190716743469238, "global_step": 79004, "epoch": 1881} {"train_loss": -6.109281063079834, "global_step": 79005, "epoch": 1881} {"train_loss": -6.069270610809326, "global_step": 79006, "epoch": 1881} {"train_loss": -6.259675025939941, "global_step": 79007, "epoch": 1881} {"train_loss": -6.1024909019470215, "global_step": 79008, "epoch": 1881} {"train_loss": -6.1010284423828125, "global_step": 79009, "epoch": 1881} {"train_loss": -6.2416791915893555, "global_step": 79010, "epoch": 1881} {"train_loss": -6.031503677368164, "global_step": 79011, "epoch": 1881} {"train_loss": -6.058813571929932, "global_step": 79012, "epoch": 1881} {"train_loss": -6.043191432952881, "global_step": 79013, "epoch": 1881} {"train_loss": -6.146651268005371, "global_step": 79014, "epoch": 1881} {"train_loss": -6.058601379394531, "global_step": 79015, "epoch": 1881} {"train_loss": -6.126399040222168, "global_step": 79016, "epoch": 1881} {"train_loss": -6.138027191162109, "global_step": 79017, "epoch": 1881} {"train_loss": -6.052671432495117, "global_step": 79018, "epoch": 1881} {"train_loss": -6.051390171051025, "global_step": 79019, "epoch": 1881} {"train_loss": -6.199934482574463, "global_step": 79020, "epoch": 1881} {"train_loss": -6.052538871765137, "global_step": 79021, "epoch": 1881} {"train_loss": -6.165043354034424, "global_step": 79022, "epoch": 1881} {"train_loss": -6.078194618225098, "global_step": 79023, "epoch": 1881} {"train_loss": -5.990377426147461, "global_step": 79024, "epoch": 1881} {"train_loss": -5.999786376953125, "global_step": 79025, "epoch": 1881} {"train_loss": -5.955999374389648, "global_step": 79026, "epoch": 1881} {"train_loss": -6.0677080154418945, "global_step": 79027, "epoch": 1881} {"train_loss": -6.039395332336426, "global_step": 79028, "epoch": 1881} {"train_loss": -6.17716646194458, "global_step": 79029, "epoch": 1881} {"train_loss": -6.0596418380737305, "global_step": 79030, "epoch": 1881} {"train_loss": -6.058748722076416, "global_step": 79031, "epoch": 1881} {"train_loss": -6.084419250488281, "global_step": 79032, "epoch": 1881} {"train_loss": -6.119604110717773, "global_step": 79033, "epoch": 1881} {"train_loss": -6.083252906799316, "global_step": 79034, "epoch": 1881} {"train_loss": -6.097023963928223, "global_step": 79035, "epoch": 1881} {"train_loss": -6.155394554138184, "global_step": 79036, "epoch": 1881} {"train_loss": -6.063626289367676, "global_step": 79037, "epoch": 1881} {"train_loss": -6.124926567077637, "global_step": 79038, "epoch": 1881} {"train_loss": -6.067829132080078, "global_step": 79039, "epoch": 1881} {"train_loss": -6.118935585021973, "global_step": 79040, "epoch": 1881} {"train_loss": -6.190524578094482, "global_step": 79041, "epoch": 1881} {"train_loss": -6.200329303741455, "global_step": 79042, "epoch": 1881} {"train_loss": -6.105789786293393, "global_step": 79043, "epoch": 1881, "val_loss": 62111.265625} {"train_loss": -6.198334217071533, "global_step": 79044, "epoch": 1882} {"train_loss": -6.089794635772705, "global_step": 79045, "epoch": 1882} {"train_loss": -6.19913387298584, "global_step": 79046, "epoch": 1882} {"train_loss": -6.0577898025512695, "global_step": 79047, "epoch": 1882} {"train_loss": -6.134670734405518, "global_step": 79048, "epoch": 1882} {"train_loss": -6.10413932800293, "global_step": 79049, "epoch": 1882} {"train_loss": -6.101194858551025, "global_step": 79050, "epoch": 1882} {"train_loss": -6.166469097137451, "global_step": 79051, "epoch": 1882} {"train_loss": -6.1207594871521, "global_step": 79052, "epoch": 1882} {"train_loss": -6.1764421463012695, "global_step": 79053, "epoch": 1882} {"train_loss": -6.200664520263672, "global_step": 79054, "epoch": 1882} {"train_loss": -6.204113483428955, "global_step": 79055, "epoch": 1882} {"train_loss": -6.059841632843018, "global_step": 79056, "epoch": 1882} {"train_loss": -6.139168739318848, "global_step": 79057, "epoch": 1882} {"train_loss": -6.117227554321289, "global_step": 79058, "epoch": 1882} {"train_loss": -6.205867767333984, "global_step": 79059, "epoch": 1882} {"train_loss": -6.249460220336914, "global_step": 79060, "epoch": 1882} {"train_loss": -6.197330474853516, "global_step": 79061, "epoch": 1882} {"train_loss": -6.168646812438965, "global_step": 79062, "epoch": 1882} {"train_loss": -6.134245872497559, "global_step": 79063, "epoch": 1882} {"train_loss": -6.089934349060059, "global_step": 79064, "epoch": 1882} {"train_loss": -6.131511688232422, "global_step": 79065, "epoch": 1882} {"train_loss": -6.149683952331543, "global_step": 79066, "epoch": 1882} {"train_loss": -6.1225433349609375, "global_step": 79067, "epoch": 1882} {"train_loss": -6.133959770202637, "global_step": 79068, "epoch": 1882} {"train_loss": -6.158313274383545, "global_step": 79069, "epoch": 1882} {"train_loss": -6.161762714385986, "global_step": 79070, "epoch": 1882} {"train_loss": -6.156527042388916, "global_step": 79071, "epoch": 1882} {"train_loss": -6.160682678222656, "global_step": 79072, "epoch": 1882} {"train_loss": -6.104277610778809, "global_step": 79073, "epoch": 1882} {"train_loss": -6.171594142913818, "global_step": 79074, "epoch": 1882} {"train_loss": -6.118505001068115, "global_step": 79075, "epoch": 1882} {"train_loss": -6.179396152496338, "global_step": 79076, "epoch": 1882} {"train_loss": -6.182154178619385, "global_step": 79077, "epoch": 1882} {"train_loss": -6.075645923614502, "global_step": 79078, "epoch": 1882} {"train_loss": -6.113363742828369, "global_step": 79079, "epoch": 1882} {"train_loss": -6.0736494064331055, "global_step": 79080, "epoch": 1882} {"train_loss": -6.115467548370361, "global_step": 79081, "epoch": 1882} {"train_loss": -6.164427280426025, "global_step": 79082, "epoch": 1882} {"train_loss": -6.130733966827393, "global_step": 79083, "epoch": 1882} {"train_loss": -6.010495662689209, "global_step": 79084, "epoch": 1882} {"train_loss": -6.137825454984393, "global_step": 79085, "epoch": 1882, "val_loss": 62238.43359375} {"train_loss": -5.992556571960449, "global_step": 79086, "epoch": 1883} {"train_loss": -6.215000629425049, "global_step": 79087, "epoch": 1883} {"train_loss": -5.990799903869629, "global_step": 79088, "epoch": 1883} {"train_loss": -6.138968467712402, "global_step": 79089, "epoch": 1883} {"train_loss": -6.144705772399902, "global_step": 79090, "epoch": 1883} {"train_loss": -6.122223854064941, "global_step": 79091, "epoch": 1883} {"train_loss": -6.249328136444092, "global_step": 79092, "epoch": 1883} {"train_loss": -6.14089298248291, "global_step": 79093, "epoch": 1883} {"train_loss": -6.120715141296387, "global_step": 79094, "epoch": 1883} {"train_loss": -6.026525497436523, "global_step": 79095, "epoch": 1883} {"train_loss": -6.210183620452881, "global_step": 79096, "epoch": 1883} {"train_loss": -6.150869369506836, "global_step": 79097, "epoch": 1883} {"train_loss": -6.105831146240234, "global_step": 79098, "epoch": 1883} {"train_loss": -6.192638874053955, "global_step": 79099, "epoch": 1883} {"train_loss": -6.045016288757324, "global_step": 79100, "epoch": 1883} {"train_loss": -6.089376926422119, "global_step": 79101, "epoch": 1883} {"train_loss": -6.059441566467285, "global_step": 79102, "epoch": 1883} {"train_loss": -6.13737678527832, "global_step": 79103, "epoch": 1883} {"train_loss": -6.159308433532715, "global_step": 79104, "epoch": 1883} {"train_loss": -6.092574596405029, "global_step": 79105, "epoch": 1883} {"train_loss": -6.227394104003906, "global_step": 79106, "epoch": 1883} {"train_loss": -6.25330924987793, "global_step": 79107, "epoch": 1883} {"train_loss": -6.2049946784973145, "global_step": 79108, "epoch": 1883} {"train_loss": -6.151524066925049, "global_step": 79109, "epoch": 1883} {"train_loss": -6.153128147125244, "global_step": 79110, "epoch": 1883} {"train_loss": -6.185604095458984, "global_step": 79111, "epoch": 1883} {"train_loss": -6.167897701263428, "global_step": 79112, "epoch": 1883} {"train_loss": -6.135091781616211, "global_step": 79113, "epoch": 1883} {"train_loss": -6.211424827575684, "global_step": 79114, "epoch": 1883} {"train_loss": -6.1890387535095215, "global_step": 79115, "epoch": 1883} {"train_loss": -6.13340950012207, "global_step": 79116, "epoch": 1883} {"train_loss": -6.238252639770508, "global_step": 79117, "epoch": 1883} {"train_loss": -6.125942230224609, "global_step": 79118, "epoch": 1883} {"train_loss": -6.117867946624756, "global_step": 79119, "epoch": 1883} {"train_loss": -6.255309104919434, "global_step": 79120, "epoch": 1883} {"train_loss": -6.223697662353516, "global_step": 79121, "epoch": 1883} {"train_loss": -6.180336952209473, "global_step": 79122, "epoch": 1883} {"train_loss": -6.105103492736816, "global_step": 79123, "epoch": 1883} {"train_loss": -5.9571027755737305, "global_step": 79124, "epoch": 1883} {"train_loss": -6.110613822937012, "global_step": 79125, "epoch": 1883} {"train_loss": -6.235374450683594, "global_step": 79126, "epoch": 1883} {"train_loss": -6.140712329319546, "global_step": 79127, "epoch": 1883, "val_loss": 62186.1875} {"train_loss": -6.211821556091309, "global_step": 79128, "epoch": 1884} {"train_loss": -6.235996246337891, "global_step": 79129, "epoch": 1884} {"train_loss": -6.175037384033203, "global_step": 79130, "epoch": 1884} {"train_loss": -6.185258865356445, "global_step": 79131, "epoch": 1884} {"train_loss": -6.2149457931518555, "global_step": 79132, "epoch": 1884} {"train_loss": -6.037715911865234, "global_step": 79133, "epoch": 1884} {"train_loss": -6.2860541343688965, "global_step": 79134, "epoch": 1884} {"train_loss": -6.123056411743164, "global_step": 79135, "epoch": 1884} {"train_loss": -6.179129600524902, "global_step": 79136, "epoch": 1884} {"train_loss": -6.178382873535156, "global_step": 79137, "epoch": 1884} {"train_loss": -6.084359169006348, "global_step": 79138, "epoch": 1884} {"train_loss": -6.156440734863281, "global_step": 79139, "epoch": 1884} {"train_loss": -6.206782341003418, "global_step": 79140, "epoch": 1884} {"train_loss": -6.095366477966309, "global_step": 79141, "epoch": 1884} {"train_loss": -6.075530052185059, "global_step": 79142, "epoch": 1884} {"train_loss": -6.107999801635742, "global_step": 79143, "epoch": 1884} {"train_loss": -6.121767520904541, "global_step": 79144, "epoch": 1884} {"train_loss": -6.317923545837402, "global_step": 79145, "epoch": 1884} {"train_loss": -6.077291488647461, "global_step": 79146, "epoch": 1884} {"train_loss": -6.150026321411133, "global_step": 79147, "epoch": 1884} {"train_loss": -6.051197052001953, "global_step": 79148, "epoch": 1884} {"train_loss": -6.120102882385254, "global_step": 79149, "epoch": 1884} {"train_loss": -6.0892534255981445, "global_step": 79150, "epoch": 1884} {"train_loss": -6.150172710418701, "global_step": 79151, "epoch": 1884} {"train_loss": -6.117351531982422, "global_step": 79152, "epoch": 1884} {"train_loss": -6.159775257110596, "global_step": 79153, "epoch": 1884} {"train_loss": -6.158735275268555, "global_step": 79154, "epoch": 1884} {"train_loss": -6.039462566375732, "global_step": 79155, "epoch": 1884} {"train_loss": -6.074253082275391, "global_step": 79156, "epoch": 1884} {"train_loss": -6.146951675415039, "global_step": 79157, "epoch": 1884} {"train_loss": -6.01800012588501, "global_step": 79158, "epoch": 1884} {"train_loss": -6.043425559997559, "global_step": 79159, "epoch": 1884} {"train_loss": -6.177875518798828, "global_step": 79160, "epoch": 1884} {"train_loss": -6.093509674072266, "global_step": 79161, "epoch": 1884} {"train_loss": -6.161986351013184, "global_step": 79162, "epoch": 1884} {"train_loss": -6.058508396148682, "global_step": 79163, "epoch": 1884} {"train_loss": -6.048094749450684, "global_step": 79164, "epoch": 1884} {"train_loss": -6.178946495056152, "global_step": 79165, "epoch": 1884} {"train_loss": -6.278566360473633, "global_step": 79166, "epoch": 1884} {"train_loss": -6.157595634460449, "global_step": 79167, "epoch": 1884} {"train_loss": -6.105632781982422, "global_step": 79168, "epoch": 1884} {"train_loss": -6.134564638137817, "global_step": 79169, "epoch": 1884, "val_loss": 62017.61328125} {"train_loss": -6.178074836730957, "global_step": 79170, "epoch": 1885} {"train_loss": -6.038215637207031, "global_step": 79171, "epoch": 1885} {"train_loss": -6.066458702087402, "global_step": 79172, "epoch": 1885} {"train_loss": -6.2049078941345215, "global_step": 79173, "epoch": 1885} {"train_loss": -6.113785743713379, "global_step": 79174, "epoch": 1885} {"train_loss": -6.145291805267334, "global_step": 79175, "epoch": 1885} {"train_loss": -6.249926567077637, "global_step": 79176, "epoch": 1885} {"train_loss": -6.206570148468018, "global_step": 79177, "epoch": 1885} {"train_loss": -6.047956466674805, "global_step": 79178, "epoch": 1885} {"train_loss": -6.237018585205078, "global_step": 79179, "epoch": 1885} {"train_loss": -6.253787040710449, "global_step": 79180, "epoch": 1885} {"train_loss": -6.160233974456787, "global_step": 79181, "epoch": 1885} {"train_loss": -6.181936740875244, "global_step": 79182, "epoch": 1885} {"train_loss": -6.114971160888672, "global_step": 79183, "epoch": 1885} {"train_loss": -6.199324607849121, "global_step": 79184, "epoch": 1885} {"train_loss": -6.013763427734375, "global_step": 79185, "epoch": 1885} {"train_loss": -6.144791126251221, "global_step": 79186, "epoch": 1885} {"train_loss": -6.058779716491699, "global_step": 79187, "epoch": 1885} {"train_loss": -6.153315544128418, "global_step": 79188, "epoch": 1885} {"train_loss": -6.189634323120117, "global_step": 79189, "epoch": 1885} {"train_loss": -6.2928876876831055, "global_step": 79190, "epoch": 1885} {"train_loss": -6.12747859954834, "global_step": 79191, "epoch": 1885} {"train_loss": -6.183764457702637, "global_step": 79192, "epoch": 1885} {"train_loss": -6.257479667663574, "global_step": 79193, "epoch": 1885} {"train_loss": -6.30157470703125, "global_step": 79194, "epoch": 1885} {"train_loss": -6.16617488861084, "global_step": 79195, "epoch": 1885} {"train_loss": -6.250981330871582, "global_step": 79196, "epoch": 1885} {"train_loss": -6.143492221832275, "global_step": 79197, "epoch": 1885} {"train_loss": -6.076032638549805, "global_step": 79198, "epoch": 1885} {"train_loss": -6.166775703430176, "global_step": 79199, "epoch": 1885} {"train_loss": -6.125716686248779, "global_step": 79200, "epoch": 1885} {"train_loss": -6.120051383972168, "global_step": 79201, "epoch": 1885} {"train_loss": -6.284741401672363, "global_step": 79202, "epoch": 1885} {"train_loss": -6.286307334899902, "global_step": 79203, "epoch": 1885} {"train_loss": -6.196710586547852, "global_step": 79204, "epoch": 1885} {"train_loss": -6.018184661865234, "global_step": 79205, "epoch": 1885} {"train_loss": -6.118008613586426, "global_step": 79206, "epoch": 1885} {"train_loss": -6.175268650054932, "global_step": 79207, "epoch": 1885} {"train_loss": -6.076352119445801, "global_step": 79208, "epoch": 1885} {"train_loss": -6.045255661010742, "global_step": 79209, "epoch": 1885} {"train_loss": -6.159933090209961, "global_step": 79210, "epoch": 1885} {"train_loss": -6.158964770180838, "global_step": 79211, "epoch": 1885, "val_loss": 62094.3671875} {"train_loss": -6.200603008270264, "global_step": 79212, "epoch": 1886} {"train_loss": -6.084569454193115, "global_step": 79213, "epoch": 1886} {"train_loss": -6.207515716552734, "global_step": 79214, "epoch": 1886} {"train_loss": -6.181265830993652, "global_step": 79215, "epoch": 1886} {"train_loss": -6.000603675842285, "global_step": 79216, "epoch": 1886} {"train_loss": -6.194069862365723, "global_step": 79217, "epoch": 1886} {"train_loss": -6.081284523010254, "global_step": 79218, "epoch": 1886} {"train_loss": -6.061584949493408, "global_step": 79219, "epoch": 1886} {"train_loss": -6.092286109924316, "global_step": 79220, "epoch": 1886} {"train_loss": -6.101633071899414, "global_step": 79221, "epoch": 1886} {"train_loss": -6.16087007522583, "global_step": 79222, "epoch": 1886} {"train_loss": -6.18404483795166, "global_step": 79223, "epoch": 1886} {"train_loss": -6.210268020629883, "global_step": 79224, "epoch": 1886} {"train_loss": -6.199283123016357, "global_step": 79225, "epoch": 1886} {"train_loss": -6.073879718780518, "global_step": 79226, "epoch": 1886} {"train_loss": -6.213519096374512, "global_step": 79227, "epoch": 1886} {"train_loss": -6.173525333404541, "global_step": 79228, "epoch": 1886} {"train_loss": -6.093038558959961, "global_step": 79229, "epoch": 1886} {"train_loss": -6.142783164978027, "global_step": 79230, "epoch": 1886} {"train_loss": -6.072740077972412, "global_step": 79231, "epoch": 1886} {"train_loss": -6.137781143188477, "global_step": 79232, "epoch": 1886} {"train_loss": -6.198251724243164, "global_step": 79233, "epoch": 1886} {"train_loss": -6.1700215339660645, "global_step": 79234, "epoch": 1886} {"train_loss": -6.146571159362793, "global_step": 79235, "epoch": 1886} {"train_loss": -6.051692485809326, "global_step": 79236, "epoch": 1886} {"train_loss": -6.132444858551025, "global_step": 79237, "epoch": 1886} {"train_loss": -6.169766902923584, "global_step": 79238, "epoch": 1886} {"train_loss": -6.0812788009643555, "global_step": 79239, "epoch": 1886} {"train_loss": -6.164006233215332, "global_step": 79240, "epoch": 1886} {"train_loss": -6.174511909484863, "global_step": 79241, "epoch": 1886} {"train_loss": -6.090649604797363, "global_step": 79242, "epoch": 1886} {"train_loss": -6.231496810913086, "global_step": 79243, "epoch": 1886} {"train_loss": -6.1011128425598145, "global_step": 79244, "epoch": 1886} {"train_loss": -6.11369514465332, "global_step": 79245, "epoch": 1886} {"train_loss": -5.912320137023926, "global_step": 79246, "epoch": 1886} {"train_loss": -6.157666206359863, "global_step": 79247, "epoch": 1886} {"train_loss": -6.138309001922607, "global_step": 79248, "epoch": 1886} {"train_loss": -6.0781145095825195, "global_step": 79249, "epoch": 1886} {"train_loss": -6.029841423034668, "global_step": 79250, "epoch": 1886} {"train_loss": -6.225518226623535, "global_step": 79251, "epoch": 1886} {"train_loss": -6.068082809448242, "global_step": 79252, "epoch": 1886} {"train_loss": -6.1263906842186335, "global_step": 79253, "epoch": 1886, "val_loss": 62298.33203125} {"train_loss": -6.2112627029418945, "global_step": 79254, "epoch": 1887} {"train_loss": -6.090015888214111, "global_step": 79255, "epoch": 1887} {"train_loss": -6.1332197189331055, "global_step": 79256, "epoch": 1887} {"train_loss": -6.037128925323486, "global_step": 79257, "epoch": 1887} {"train_loss": -6.13909912109375, "global_step": 79258, "epoch": 1887} {"train_loss": -6.19364070892334, "global_step": 79259, "epoch": 1887} {"train_loss": -6.142206192016602, "global_step": 79260, "epoch": 1887} {"train_loss": -6.022899627685547, "global_step": 79261, "epoch": 1887} {"train_loss": -6.096922874450684, "global_step": 79262, "epoch": 1887} {"train_loss": -6.023454666137695, "global_step": 79263, "epoch": 1887} {"train_loss": -6.128748893737793, "global_step": 79264, "epoch": 1887} {"train_loss": -6.057503700256348, "global_step": 79265, "epoch": 1887} {"train_loss": -6.100262641906738, "global_step": 79266, "epoch": 1887} {"train_loss": -6.203950881958008, "global_step": 79267, "epoch": 1887} {"train_loss": -6.024292945861816, "global_step": 79268, "epoch": 1887} {"train_loss": -6.104317665100098, "global_step": 79269, "epoch": 1887} {"train_loss": -6.106637477874756, "global_step": 79270, "epoch": 1887} {"train_loss": -6.2709126472473145, "global_step": 79271, "epoch": 1887} {"train_loss": -6.0676727294921875, "global_step": 79272, "epoch": 1887} {"train_loss": -6.118616104125977, "global_step": 79273, "epoch": 1887} {"train_loss": -6.028596878051758, "global_step": 79274, "epoch": 1887} {"train_loss": -6.210330486297607, "global_step": 79275, "epoch": 1887} {"train_loss": -6.212900161743164, "global_step": 79276, "epoch": 1887} {"train_loss": -6.160434722900391, "global_step": 79277, "epoch": 1887} {"train_loss": -6.2992329597473145, "global_step": 79278, "epoch": 1887} {"train_loss": -6.097675323486328, "global_step": 79279, "epoch": 1887} {"train_loss": -6.207522869110107, "global_step": 79280, "epoch": 1887} {"train_loss": -6.169442653656006, "global_step": 79281, "epoch": 1887} {"train_loss": -6.060150623321533, "global_step": 79282, "epoch": 1887} {"train_loss": -6.140992164611816, "global_step": 79283, "epoch": 1887} {"train_loss": -6.139944076538086, "global_step": 79284, "epoch": 1887} {"train_loss": -6.1471147537231445, "global_step": 79285, "epoch": 1887} {"train_loss": -6.1616010665893555, "global_step": 79286, "epoch": 1887} {"train_loss": -6.071252822875977, "global_step": 79287, "epoch": 1887} {"train_loss": -6.157294273376465, "global_step": 79288, "epoch": 1887} {"train_loss": -6.11988639831543, "global_step": 79289, "epoch": 1887} {"train_loss": -6.196817398071289, "global_step": 79290, "epoch": 1887} {"train_loss": -6.163414001464844, "global_step": 79291, "epoch": 1887} {"train_loss": -6.142943859100342, "global_step": 79292, "epoch": 1887} {"train_loss": -6.150001525878906, "global_step": 79293, "epoch": 1887} {"train_loss": -6.195992946624756, "global_step": 79294, "epoch": 1887} {"train_loss": -6.136451403299968, "global_step": 79295, "epoch": 1887, "val_loss": 62448.703125} {"train_loss": -6.066501617431641, "global_step": 79296, "epoch": 1888} {"train_loss": -6.010370254516602, "global_step": 79297, "epoch": 1888} {"train_loss": -6.336847305297852, "global_step": 79298, "epoch": 1888} {"train_loss": -6.177826881408691, "global_step": 79299, "epoch": 1888} {"train_loss": -6.123507976531982, "global_step": 79300, "epoch": 1888} {"train_loss": -6.152608394622803, "global_step": 79301, "epoch": 1888} {"train_loss": -6.02146577835083, "global_step": 79302, "epoch": 1888} {"train_loss": -6.045620918273926, "global_step": 79303, "epoch": 1888} {"train_loss": -6.178700923919678, "global_step": 79304, "epoch": 1888} {"train_loss": -6.09354829788208, "global_step": 79305, "epoch": 1888} {"train_loss": -6.112452507019043, "global_step": 79306, "epoch": 1888} {"train_loss": -6.077877998352051, "global_step": 79307, "epoch": 1888} {"train_loss": -6.146433353424072, "global_step": 79308, "epoch": 1888} {"train_loss": -6.188442230224609, "global_step": 79309, "epoch": 1888} {"train_loss": -6.160294532775879, "global_step": 79310, "epoch": 1888} {"train_loss": -6.143813133239746, "global_step": 79311, "epoch": 1888} {"train_loss": -6.084813117980957, "global_step": 79312, "epoch": 1888} {"train_loss": -6.157835960388184, "global_step": 79313, "epoch": 1888} {"train_loss": -6.121480941772461, "global_step": 79314, "epoch": 1888} {"train_loss": -6.173399925231934, "global_step": 79315, "epoch": 1888} {"train_loss": -6.130988597869873, "global_step": 79316, "epoch": 1888} {"train_loss": -6.165126800537109, "global_step": 79317, "epoch": 1888} {"train_loss": -6.123663902282715, "global_step": 79318, "epoch": 1888} {"train_loss": -5.990819454193115, "global_step": 79319, "epoch": 1888} {"train_loss": -6.173714637756348, "global_step": 79320, "epoch": 1888} {"train_loss": -6.220009803771973, "global_step": 79321, "epoch": 1888} {"train_loss": -6.076956272125244, "global_step": 79322, "epoch": 1888} {"train_loss": -6.233433723449707, "global_step": 79323, "epoch": 1888} {"train_loss": -6.169363975524902, "global_step": 79324, "epoch": 1888} {"train_loss": -6.08449125289917, "global_step": 79325, "epoch": 1888} {"train_loss": -6.117776870727539, "global_step": 79326, "epoch": 1888} {"train_loss": -5.995728492736816, "global_step": 79327, "epoch": 1888} {"train_loss": -6.176612854003906, "global_step": 79328, "epoch": 1888} {"train_loss": -6.09598445892334, "global_step": 79329, "epoch": 1888} {"train_loss": -6.130824565887451, "global_step": 79330, "epoch": 1888} {"train_loss": -6.125775337219238, "global_step": 79331, "epoch": 1888} {"train_loss": -6.106986045837402, "global_step": 79332, "epoch": 1888} {"train_loss": -6.0789079666137695, "global_step": 79333, "epoch": 1888} {"train_loss": -6.125895977020264, "global_step": 79334, "epoch": 1888} {"train_loss": -6.0977091789245605, "global_step": 79335, "epoch": 1888} {"train_loss": -6.138009071350098, "global_step": 79336, "epoch": 1888} {"train_loss": -6.125105960028512, "global_step": 79337, "epoch": 1888, "val_loss": 62263.88671875} {"train_loss": -6.165215492248535, "global_step": 79338, "epoch": 1889} {"train_loss": -6.246954917907715, "global_step": 79339, "epoch": 1889} {"train_loss": -6.078673362731934, "global_step": 79340, "epoch": 1889} {"train_loss": -6.092245101928711, "global_step": 79341, "epoch": 1889} {"train_loss": -6.143864631652832, "global_step": 79342, "epoch": 1889} {"train_loss": -6.15731143951416, "global_step": 79343, "epoch": 1889} {"train_loss": -5.991892337799072, "global_step": 79344, "epoch": 1889} {"train_loss": -6.059493064880371, "global_step": 79345, "epoch": 1889} {"train_loss": -6.200869083404541, "global_step": 79346, "epoch": 1889} {"train_loss": -6.130337715148926, "global_step": 79347, "epoch": 1889} {"train_loss": -6.235857963562012, "global_step": 79348, "epoch": 1889} {"train_loss": -6.055406093597412, "global_step": 79349, "epoch": 1889} {"train_loss": -6.07362699508667, "global_step": 79350, "epoch": 1889} {"train_loss": -6.081818580627441, "global_step": 79351, "epoch": 1889} {"train_loss": -5.934233665466309, "global_step": 79352, "epoch": 1889} {"train_loss": -6.0953569412231445, "global_step": 79353, "epoch": 1889} {"train_loss": -5.98964262008667, "global_step": 79354, "epoch": 1889} {"train_loss": -6.0517683029174805, "global_step": 79355, "epoch": 1889} {"train_loss": -6.272073745727539, "global_step": 79356, "epoch": 1889} {"train_loss": -6.078949928283691, "global_step": 79357, "epoch": 1889} {"train_loss": -6.207779884338379, "global_step": 79358, "epoch": 1889} {"train_loss": -6.087184906005859, "global_step": 79359, "epoch": 1889} {"train_loss": -6.116488456726074, "global_step": 79360, "epoch": 1889} {"train_loss": -6.148077964782715, "global_step": 79361, "epoch": 1889} {"train_loss": -6.0354437828063965, "global_step": 79362, "epoch": 1889} {"train_loss": -6.134469032287598, "global_step": 79363, "epoch": 1889} {"train_loss": -6.099822044372559, "global_step": 79364, "epoch": 1889} {"train_loss": -6.0603485107421875, "global_step": 79365, "epoch": 1889} {"train_loss": -6.168840408325195, "global_step": 79366, "epoch": 1889} {"train_loss": -6.120490550994873, "global_step": 79367, "epoch": 1889} {"train_loss": -6.052663803100586, "global_step": 79368, "epoch": 1889} {"train_loss": -6.066038608551025, "global_step": 79369, "epoch": 1889} {"train_loss": -6.196208953857422, "global_step": 79370, "epoch": 1889} {"train_loss": -6.191265106201172, "global_step": 79371, "epoch": 1889} {"train_loss": -5.973318099975586, "global_step": 79372, "epoch": 1889} {"train_loss": -6.142829418182373, "global_step": 79373, "epoch": 1889} {"train_loss": -6.210291862487793, "global_step": 79374, "epoch": 1889} {"train_loss": -6.183643341064453, "global_step": 79375, "epoch": 1889} {"train_loss": -6.155559539794922, "global_step": 79376, "epoch": 1889} {"train_loss": -6.154181480407715, "global_step": 79377, "epoch": 1889} {"train_loss": -6.09202766418457, "global_step": 79378, "epoch": 1889} {"train_loss": -6.115567184629894, "global_step": 79379, "epoch": 1889, "val_loss": 62255.25} {"train_loss": -6.12629508972168, "global_step": 79380, "epoch": 1890} {"train_loss": -6.117963790893555, "global_step": 79381, "epoch": 1890} {"train_loss": -6.168099403381348, "global_step": 79382, "epoch": 1890} {"train_loss": -6.222368240356445, "global_step": 79383, "epoch": 1890} {"train_loss": -6.137887954711914, "global_step": 79384, "epoch": 1890} {"train_loss": -6.092895030975342, "global_step": 79385, "epoch": 1890} {"train_loss": -6.114924430847168, "global_step": 79386, "epoch": 1890} {"train_loss": -6.213870048522949, "global_step": 79387, "epoch": 1890} {"train_loss": -6.257377624511719, "global_step": 79388, "epoch": 1890} {"train_loss": -6.019838809967041, "global_step": 79389, "epoch": 1890} {"train_loss": -6.14586877822876, "global_step": 79390, "epoch": 1890} {"train_loss": -6.198579788208008, "global_step": 79391, "epoch": 1890} {"train_loss": -6.178628921508789, "global_step": 79392, "epoch": 1890} {"train_loss": -6.107789039611816, "global_step": 79393, "epoch": 1890} {"train_loss": -6.105064392089844, "global_step": 79394, "epoch": 1890} {"train_loss": -6.049569129943848, "global_step": 79395, "epoch": 1890} {"train_loss": -6.150655269622803, "global_step": 79396, "epoch": 1890} {"train_loss": -6.210407257080078, "global_step": 79397, "epoch": 1890} {"train_loss": -6.127866744995117, "global_step": 79398, "epoch": 1890} {"train_loss": -6.132462978363037, "global_step": 79399, "epoch": 1890} {"train_loss": -6.000925540924072, "global_step": 79400, "epoch": 1890} {"train_loss": -6.277525901794434, "global_step": 79401, "epoch": 1890} {"train_loss": -6.145979881286621, "global_step": 79402, "epoch": 1890} {"train_loss": -6.116361141204834, "global_step": 79403, "epoch": 1890} {"train_loss": -6.056342124938965, "global_step": 79404, "epoch": 1890} {"train_loss": -6.119052410125732, "global_step": 79405, "epoch": 1890} {"train_loss": -6.172153472900391, "global_step": 79406, "epoch": 1890} {"train_loss": -6.075349807739258, "global_step": 79407, "epoch": 1890} {"train_loss": -6.116178035736084, "global_step": 79408, "epoch": 1890} {"train_loss": -5.954224586486816, "global_step": 79409, "epoch": 1890} {"train_loss": -6.129136562347412, "global_step": 79410, "epoch": 1890} {"train_loss": -6.13299036026001, "global_step": 79411, "epoch": 1890} {"train_loss": -6.183111667633057, "global_step": 79412, "epoch": 1890} {"train_loss": -6.222587585449219, "global_step": 79413, "epoch": 1890} {"train_loss": -6.123902320861816, "global_step": 79414, "epoch": 1890} {"train_loss": -6.136277198791504, "global_step": 79415, "epoch": 1890} {"train_loss": -6.183193206787109, "global_step": 79416, "epoch": 1890} {"train_loss": -6.050309181213379, "global_step": 79417, "epoch": 1890} {"train_loss": -6.09654426574707, "global_step": 79418, "epoch": 1890} {"train_loss": -6.138419151306152, "global_step": 79419, "epoch": 1890} {"train_loss": -6.148225784301758, "global_step": 79420, "epoch": 1890} {"train_loss": -6.131787606648037, "global_step": 79421, "epoch": 1890, "val_loss": 62159.65234375} {"train_loss": -6.166232109069824, "global_step": 79422, "epoch": 1891} {"train_loss": -6.050003528594971, "global_step": 79423, "epoch": 1891} {"train_loss": -6.184172630310059, "global_step": 79424, "epoch": 1891} {"train_loss": -6.107694149017334, "global_step": 79425, "epoch": 1891} {"train_loss": -6.173752784729004, "global_step": 79426, "epoch": 1891} {"train_loss": -6.148617744445801, "global_step": 79427, "epoch": 1891} {"train_loss": -6.074873447418213, "global_step": 79428, "epoch": 1891} {"train_loss": -6.192353248596191, "global_step": 79429, "epoch": 1891} {"train_loss": -6.075463771820068, "global_step": 79430, "epoch": 1891} {"train_loss": -6.117582321166992, "global_step": 79431, "epoch": 1891} {"train_loss": -6.166137218475342, "global_step": 79432, "epoch": 1891} {"train_loss": -6.0592546463012695, "global_step": 79433, "epoch": 1891} {"train_loss": -6.133623123168945, "global_step": 79434, "epoch": 1891} {"train_loss": -6.146330833435059, "global_step": 79435, "epoch": 1891} {"train_loss": -6.210686683654785, "global_step": 79436, "epoch": 1891} {"train_loss": -6.027924060821533, "global_step": 79437, "epoch": 1891} {"train_loss": -6.097672939300537, "global_step": 79438, "epoch": 1891} {"train_loss": -6.056070804595947, "global_step": 79439, "epoch": 1891} {"train_loss": -5.9927978515625, "global_step": 79440, "epoch": 1891} {"train_loss": -6.080610275268555, "global_step": 79441, "epoch": 1891} {"train_loss": -6.015758991241455, "global_step": 79442, "epoch": 1891} {"train_loss": -5.965490818023682, "global_step": 79443, "epoch": 1891} {"train_loss": -6.106234550476074, "global_step": 79444, "epoch": 1891} {"train_loss": -5.939310550689697, "global_step": 79445, "epoch": 1891} {"train_loss": -6.0131330490112305, "global_step": 79446, "epoch": 1891} {"train_loss": -6.079204559326172, "global_step": 79447, "epoch": 1891} {"train_loss": -6.178299427032471, "global_step": 79448, "epoch": 1891} {"train_loss": -5.9452972412109375, "global_step": 79449, "epoch": 1891} {"train_loss": -6.185701370239258, "global_step": 79450, "epoch": 1891} {"train_loss": -6.036236763000488, "global_step": 79451, "epoch": 1891} {"train_loss": -6.196949481964111, "global_step": 79452, "epoch": 1891} {"train_loss": -6.05391788482666, "global_step": 79453, "epoch": 1891} {"train_loss": -6.07331657409668, "global_step": 79454, "epoch": 1891} {"train_loss": -5.9680914878845215, "global_step": 79455, "epoch": 1891} {"train_loss": -6.021718502044678, "global_step": 79456, "epoch": 1891} {"train_loss": -6.037571430206299, "global_step": 79457, "epoch": 1891} {"train_loss": -6.191460132598877, "global_step": 79458, "epoch": 1891} {"train_loss": -6.043335914611816, "global_step": 79459, "epoch": 1891} {"train_loss": -6.126867294311523, "global_step": 79460, "epoch": 1891} {"train_loss": -6.125988006591797, "global_step": 79461, "epoch": 1891} {"train_loss": -6.143771171569824, "global_step": 79462, "epoch": 1891} {"train_loss": -6.092891659055438, "global_step": 79463, "epoch": 1891, "val_loss": 62404.1953125} {"train_loss": -6.058912754058838, "global_step": 79464, "epoch": 1892} {"train_loss": -6.196077823638916, "global_step": 79465, "epoch": 1892} {"train_loss": -5.997990608215332, "global_step": 79466, "epoch": 1892} {"train_loss": -6.206974029541016, "global_step": 79467, "epoch": 1892} {"train_loss": -6.131330490112305, "global_step": 79468, "epoch": 1892} {"train_loss": -6.187058448791504, "global_step": 79469, "epoch": 1892} {"train_loss": -6.209639072418213, "global_step": 79470, "epoch": 1892} {"train_loss": -6.1790771484375, "global_step": 79471, "epoch": 1892} {"train_loss": -6.100806713104248, "global_step": 79472, "epoch": 1892} {"train_loss": -6.045258045196533, "global_step": 79473, "epoch": 1892} {"train_loss": -6.179853916168213, "global_step": 79474, "epoch": 1892} {"train_loss": -6.137272834777832, "global_step": 79475, "epoch": 1892} {"train_loss": -6.237974643707275, "global_step": 79476, "epoch": 1892} {"train_loss": -6.151793479919434, "global_step": 79477, "epoch": 1892} {"train_loss": -6.10465669631958, "global_step": 79478, "epoch": 1892} {"train_loss": -6.206186294555664, "global_step": 79479, "epoch": 1892} {"train_loss": -6.111629486083984, "global_step": 79480, "epoch": 1892} {"train_loss": -6.184293746948242, "global_step": 79481, "epoch": 1892} {"train_loss": -6.22958517074585, "global_step": 79482, "epoch": 1892} {"train_loss": -6.136875629425049, "global_step": 79483, "epoch": 1892} {"train_loss": -6.251673698425293, "global_step": 79484, "epoch": 1892} {"train_loss": -6.016483306884766, "global_step": 79485, "epoch": 1892} {"train_loss": -6.1316752433776855, "global_step": 79486, "epoch": 1892} {"train_loss": -6.083559513092041, "global_step": 79487, "epoch": 1892} {"train_loss": -5.963069915771484, "global_step": 79488, "epoch": 1892} {"train_loss": -6.238693714141846, "global_step": 79489, "epoch": 1892} {"train_loss": -5.9907450675964355, "global_step": 79490, "epoch": 1892} {"train_loss": -6.189013481140137, "global_step": 79491, "epoch": 1892} {"train_loss": -6.026015281677246, "global_step": 79492, "epoch": 1892} {"train_loss": -6.001804351806641, "global_step": 79493, "epoch": 1892} {"train_loss": -6.156466484069824, "global_step": 79494, "epoch": 1892} {"train_loss": -6.082102298736572, "global_step": 79495, "epoch": 1892} {"train_loss": -6.136613845825195, "global_step": 79496, "epoch": 1892} {"train_loss": -6.012633800506592, "global_step": 79497, "epoch": 1892} {"train_loss": -6.244233131408691, "global_step": 79498, "epoch": 1892} {"train_loss": -6.060184478759766, "global_step": 79499, "epoch": 1892} {"train_loss": -6.140210151672363, "global_step": 79500, "epoch": 1892} {"train_loss": -6.070908546447754, "global_step": 79501, "epoch": 1892} {"train_loss": -6.049651145935059, "global_step": 79502, "epoch": 1892} {"train_loss": -6.116689682006836, "global_step": 79503, "epoch": 1892} {"train_loss": -6.093773365020752, "global_step": 79504, "epoch": 1892} {"train_loss": -6.122103373209636, "global_step": 79505, "epoch": 1892, "val_loss": 62298.890625} {"train_loss": -6.101079940795898, "global_step": 79506, "epoch": 1893} {"train_loss": -5.994589805603027, "global_step": 79507, "epoch": 1893} {"train_loss": -6.109806060791016, "global_step": 79508, "epoch": 1893} {"train_loss": -6.159360885620117, "global_step": 79509, "epoch": 1893} {"train_loss": -6.126964092254639, "global_step": 79510, "epoch": 1893} {"train_loss": -6.180680274963379, "global_step": 79511, "epoch": 1893} {"train_loss": -6.282975196838379, "global_step": 79512, "epoch": 1893} {"train_loss": -6.096399784088135, "global_step": 79513, "epoch": 1893} {"train_loss": -6.013301849365234, "global_step": 79514, "epoch": 1893} {"train_loss": -6.096693992614746, "global_step": 79515, "epoch": 1893} {"train_loss": -5.974014759063721, "global_step": 79516, "epoch": 1893} {"train_loss": -6.10353946685791, "global_step": 79517, "epoch": 1893} {"train_loss": -6.299741744995117, "global_step": 79518, "epoch": 1893} {"train_loss": -6.075862884521484, "global_step": 79519, "epoch": 1893} {"train_loss": -6.1156511306762695, "global_step": 79520, "epoch": 1893} {"train_loss": -6.231032371520996, "global_step": 79521, "epoch": 1893} {"train_loss": -6.087916374206543, "global_step": 79522, "epoch": 1893} {"train_loss": -6.026506423950195, "global_step": 79523, "epoch": 1893} {"train_loss": -6.055103302001953, "global_step": 79524, "epoch": 1893} {"train_loss": -6.108670711517334, "global_step": 79525, "epoch": 1893} {"train_loss": -6.1441521644592285, "global_step": 79526, "epoch": 1893} {"train_loss": -6.055986404418945, "global_step": 79527, "epoch": 1893} {"train_loss": -6.181754112243652, "global_step": 79528, "epoch": 1893} {"train_loss": -6.075991630554199, "global_step": 79529, "epoch": 1893} {"train_loss": -6.13500452041626, "global_step": 79530, "epoch": 1893} {"train_loss": -6.125720024108887, "global_step": 79531, "epoch": 1893} {"train_loss": -6.152661323547363, "global_step": 79532, "epoch": 1893} {"train_loss": -6.088043212890625, "global_step": 79533, "epoch": 1893} {"train_loss": -6.045353889465332, "global_step": 79534, "epoch": 1893} {"train_loss": -6.042168617248535, "global_step": 79535, "epoch": 1893} {"train_loss": -6.217878818511963, "global_step": 79536, "epoch": 1893} {"train_loss": -6.275277137756348, "global_step": 79537, "epoch": 1893} {"train_loss": -6.079290866851807, "global_step": 79538, "epoch": 1893} {"train_loss": -6.051030158996582, "global_step": 79539, "epoch": 1893} {"train_loss": -6.163882732391357, "global_step": 79540, "epoch": 1893} {"train_loss": -6.163403034210205, "global_step": 79541, "epoch": 1893} {"train_loss": -6.146280288696289, "global_step": 79542, "epoch": 1893} {"train_loss": -6.061409950256348, "global_step": 79543, "epoch": 1893} {"train_loss": -6.081677436828613, "global_step": 79544, "epoch": 1893} {"train_loss": -6.134498596191406, "global_step": 79545, "epoch": 1893} {"train_loss": -6.195603370666504, "global_step": 79546, "epoch": 1893} {"train_loss": -6.119762000583467, "global_step": 79547, "epoch": 1893, "val_loss": 62293.94921875} {"train_loss": -6.1647844314575195, "global_step": 79548, "epoch": 1894} {"train_loss": -6.195244789123535, "global_step": 79549, "epoch": 1894} {"train_loss": -6.165706157684326, "global_step": 79550, "epoch": 1894} {"train_loss": -6.131032943725586, "global_step": 79551, "epoch": 1894} {"train_loss": -6.086193084716797, "global_step": 79552, "epoch": 1894} {"train_loss": -6.12028694152832, "global_step": 79553, "epoch": 1894} {"train_loss": -6.182372093200684, "global_step": 79554, "epoch": 1894} {"train_loss": -6.18170690536499, "global_step": 79555, "epoch": 1894} {"train_loss": -6.272253036499023, "global_step": 79556, "epoch": 1894} {"train_loss": -6.231211185455322, "global_step": 79557, "epoch": 1894} {"train_loss": -6.166337966918945, "global_step": 79558, "epoch": 1894} {"train_loss": -6.145316123962402, "global_step": 79559, "epoch": 1894} {"train_loss": -6.130611896514893, "global_step": 79560, "epoch": 1894} {"train_loss": -6.160331726074219, "global_step": 79561, "epoch": 1894} {"train_loss": -6.100279331207275, "global_step": 79562, "epoch": 1894} {"train_loss": -6.187331676483154, "global_step": 79563, "epoch": 1894} {"train_loss": -6.221343994140625, "global_step": 79564, "epoch": 1894} {"train_loss": -6.188765525817871, "global_step": 79565, "epoch": 1894} {"train_loss": -6.1776628494262695, "global_step": 79566, "epoch": 1894} {"train_loss": -6.1110639572143555, "global_step": 79567, "epoch": 1894} {"train_loss": -6.145594596862793, "global_step": 79568, "epoch": 1894} {"train_loss": -6.233088970184326, "global_step": 79569, "epoch": 1894} {"train_loss": -6.149211883544922, "global_step": 79570, "epoch": 1894} {"train_loss": -6.102382183074951, "global_step": 79571, "epoch": 1894} {"train_loss": -6.172569274902344, "global_step": 79572, "epoch": 1894} {"train_loss": -5.95319128036499, "global_step": 79573, "epoch": 1894} {"train_loss": -6.035189628601074, "global_step": 79574, "epoch": 1894} {"train_loss": -6.17885684967041, "global_step": 79575, "epoch": 1894} {"train_loss": -6.106497764587402, "global_step": 79576, "epoch": 1894} {"train_loss": -6.073374271392822, "global_step": 79577, "epoch": 1894} {"train_loss": -6.1362810134887695, "global_step": 79578, "epoch": 1894} {"train_loss": -6.023883819580078, "global_step": 79579, "epoch": 1894} {"train_loss": -6.0973615646362305, "global_step": 79580, "epoch": 1894} {"train_loss": -6.0045552253723145, "global_step": 79581, "epoch": 1894} {"train_loss": -6.138233184814453, "global_step": 79582, "epoch": 1894} {"train_loss": -6.019875526428223, "global_step": 79583, "epoch": 1894} {"train_loss": -6.0875654220581055, "global_step": 79584, "epoch": 1894} {"train_loss": -6.178132057189941, "global_step": 79585, "epoch": 1894} {"train_loss": -5.919374465942383, "global_step": 79586, "epoch": 1894} {"train_loss": -6.186187744140625, "global_step": 79587, "epoch": 1894} {"train_loss": -6.0449371337890625, "global_step": 79588, "epoch": 1894} {"train_loss": -6.130925258000691, "global_step": 79589, "epoch": 1894, "val_loss": 62163.21875} {"train_loss": -6.147751331329346, "global_step": 79590, "epoch": 1895} {"train_loss": -6.089405536651611, "global_step": 79591, "epoch": 1895} {"train_loss": -6.2307353019714355, "global_step": 79592, "epoch": 1895} {"train_loss": -6.21790075302124, "global_step": 79593, "epoch": 1895} {"train_loss": -6.0348615646362305, "global_step": 79594, "epoch": 1895} {"train_loss": -6.2305450439453125, "global_step": 79595, "epoch": 1895} {"train_loss": -6.111087799072266, "global_step": 79596, "epoch": 1895} {"train_loss": -6.07089376449585, "global_step": 79597, "epoch": 1895} {"train_loss": -6.061796188354492, "global_step": 79598, "epoch": 1895} {"train_loss": -6.061648368835449, "global_step": 79599, "epoch": 1895} {"train_loss": -6.004611015319824, "global_step": 79600, "epoch": 1895} {"train_loss": -6.096116065979004, "global_step": 79601, "epoch": 1895} {"train_loss": -6.085552215576172, "global_step": 79602, "epoch": 1895} {"train_loss": -6.022676467895508, "global_step": 79603, "epoch": 1895} {"train_loss": -6.109101295471191, "global_step": 79604, "epoch": 1895} {"train_loss": -6.137903213500977, "global_step": 79605, "epoch": 1895} {"train_loss": -6.194268226623535, "global_step": 79606, "epoch": 1895} {"train_loss": -6.087478160858154, "global_step": 79607, "epoch": 1895} {"train_loss": -6.130934715270996, "global_step": 79608, "epoch": 1895} {"train_loss": -6.136031627655029, "global_step": 79609, "epoch": 1895} {"train_loss": -6.156422138214111, "global_step": 79610, "epoch": 1895} {"train_loss": -6.138223648071289, "global_step": 79611, "epoch": 1895} {"train_loss": -5.998904228210449, "global_step": 79612, "epoch": 1895} {"train_loss": -6.175128936767578, "global_step": 79613, "epoch": 1895} {"train_loss": -6.226686477661133, "global_step": 79614, "epoch": 1895} {"train_loss": -6.073309898376465, "global_step": 79615, "epoch": 1895} {"train_loss": -6.135017395019531, "global_step": 79616, "epoch": 1895} {"train_loss": -6.2189764976501465, "global_step": 79617, "epoch": 1895} {"train_loss": -6.103978633880615, "global_step": 79618, "epoch": 1895} {"train_loss": -6.206021308898926, "global_step": 79619, "epoch": 1895} {"train_loss": -6.089846611022949, "global_step": 79620, "epoch": 1895} {"train_loss": -6.085145950317383, "global_step": 79621, "epoch": 1895} {"train_loss": -6.163887977600098, "global_step": 79622, "epoch": 1895} {"train_loss": -6.06151008605957, "global_step": 79623, "epoch": 1895} {"train_loss": -6.19694709777832, "global_step": 79624, "epoch": 1895} {"train_loss": -6.16376256942749, "global_step": 79625, "epoch": 1895} {"train_loss": -6.09446382522583, "global_step": 79626, "epoch": 1895} {"train_loss": -6.150214672088623, "global_step": 79627, "epoch": 1895} {"train_loss": -6.137660980224609, "global_step": 79628, "epoch": 1895} {"train_loss": -6.140574932098389, "global_step": 79629, "epoch": 1895} {"train_loss": -6.262505054473877, "global_step": 79630, "epoch": 1895} {"train_loss": -6.125771250043597, "global_step": 79631, "epoch": 1895, "val_loss": 62128.390625} {"train_loss": -6.1115827560424805, "global_step": 79632, "epoch": 1896} {"train_loss": -6.1422438621521, "global_step": 79633, "epoch": 1896} {"train_loss": -6.1088972091674805, "global_step": 79634, "epoch": 1896} {"train_loss": -6.131004810333252, "global_step": 79635, "epoch": 1896} {"train_loss": -6.126125335693359, "global_step": 79636, "epoch": 1896} {"train_loss": -6.172637462615967, "global_step": 79637, "epoch": 1896} {"train_loss": -6.17694616317749, "global_step": 79638, "epoch": 1896} {"train_loss": -6.199927806854248, "global_step": 79639, "epoch": 1896} {"train_loss": -6.148890495300293, "global_step": 79640, "epoch": 1896} {"train_loss": -6.141334533691406, "global_step": 79641, "epoch": 1896} {"train_loss": -6.1973347663879395, "global_step": 79642, "epoch": 1896} {"train_loss": -6.098142623901367, "global_step": 79643, "epoch": 1896} {"train_loss": -6.18160343170166, "global_step": 79644, "epoch": 1896} {"train_loss": -6.120358943939209, "global_step": 79645, "epoch": 1896} {"train_loss": -6.166796684265137, "global_step": 79646, "epoch": 1896} {"train_loss": -6.143257141113281, "global_step": 79647, "epoch": 1896} {"train_loss": -6.083055019378662, "global_step": 79648, "epoch": 1896} {"train_loss": -6.063685417175293, "global_step": 79649, "epoch": 1896} {"train_loss": -6.194180011749268, "global_step": 79650, "epoch": 1896} {"train_loss": -6.1305952072143555, "global_step": 79651, "epoch": 1896} {"train_loss": -6.237344741821289, "global_step": 79652, "epoch": 1896} {"train_loss": -6.2512431144714355, "global_step": 79653, "epoch": 1896} {"train_loss": -6.1282243728637695, "global_step": 79654, "epoch": 1896} {"train_loss": -6.103325366973877, "global_step": 79655, "epoch": 1896} {"train_loss": -6.174755096435547, "global_step": 79656, "epoch": 1896} {"train_loss": -6.241198539733887, "global_step": 79657, "epoch": 1896} {"train_loss": -6.330724239349365, "global_step": 79658, "epoch": 1896} {"train_loss": -6.218070030212402, "global_step": 79659, "epoch": 1896} {"train_loss": -6.244283199310303, "global_step": 79660, "epoch": 1896} {"train_loss": -6.050427436828613, "global_step": 79661, "epoch": 1896} {"train_loss": -6.165691375732422, "global_step": 79662, "epoch": 1896} {"train_loss": -6.16370964050293, "global_step": 79663, "epoch": 1896} {"train_loss": -6.230274200439453, "global_step": 79664, "epoch": 1896} {"train_loss": -6.197009563446045, "global_step": 79665, "epoch": 1896} {"train_loss": -6.262630462646484, "global_step": 79666, "epoch": 1896} {"train_loss": -6.078105926513672, "global_step": 79667, "epoch": 1896} {"train_loss": -6.198359966278076, "global_step": 79668, "epoch": 1896} {"train_loss": -6.262583255767822, "global_step": 79669, "epoch": 1896} {"train_loss": -6.187341690063477, "global_step": 79670, "epoch": 1896} {"train_loss": -6.072818756103516, "global_step": 79671, "epoch": 1896} {"train_loss": -6.24244499206543, "global_step": 79672, "epoch": 1896} {"train_loss": -6.166662443251837, "global_step": 79673, "epoch": 1896, "val_loss": 62531.0078125} {"train_loss": -6.080848217010498, "global_step": 79674, "epoch": 1897} {"train_loss": -6.244884490966797, "global_step": 79675, "epoch": 1897} {"train_loss": -6.253466606140137, "global_step": 79676, "epoch": 1897} {"train_loss": -6.112934589385986, "global_step": 79677, "epoch": 1897} {"train_loss": -6.090527534484863, "global_step": 79678, "epoch": 1897} {"train_loss": -6.2059454917907715, "global_step": 79679, "epoch": 1897} {"train_loss": -6.238081455230713, "global_step": 79680, "epoch": 1897} {"train_loss": -6.253969192504883, "global_step": 79681, "epoch": 1897} {"train_loss": -6.19587516784668, "global_step": 79682, "epoch": 1897} {"train_loss": -6.1549482345581055, "global_step": 79683, "epoch": 1897} {"train_loss": -6.1808905601501465, "global_step": 79684, "epoch": 1897} {"train_loss": -6.098605632781982, "global_step": 79685, "epoch": 1897} {"train_loss": -6.131113052368164, "global_step": 79686, "epoch": 1897} {"train_loss": -6.11732292175293, "global_step": 79687, "epoch": 1897} {"train_loss": -6.038403034210205, "global_step": 79688, "epoch": 1897} {"train_loss": -6.154720306396484, "global_step": 79689, "epoch": 1897} {"train_loss": -6.1255669593811035, "global_step": 79690, "epoch": 1897} {"train_loss": -6.0466108322143555, "global_step": 79691, "epoch": 1897} {"train_loss": -5.984128952026367, "global_step": 79692, "epoch": 1897} {"train_loss": -6.068431377410889, "global_step": 79693, "epoch": 1897} {"train_loss": -6.0036797523498535, "global_step": 79694, "epoch": 1897} {"train_loss": -6.164319038391113, "global_step": 79695, "epoch": 1897} {"train_loss": -6.177511215209961, "global_step": 79696, "epoch": 1897} {"train_loss": -6.108182430267334, "global_step": 79697, "epoch": 1897} {"train_loss": -5.993173122406006, "global_step": 79698, "epoch": 1897} {"train_loss": -6.1031365394592285, "global_step": 79699, "epoch": 1897} {"train_loss": -6.104819297790527, "global_step": 79700, "epoch": 1897} {"train_loss": -6.062740325927734, "global_step": 79701, "epoch": 1897} {"train_loss": -6.1981401443481445, "global_step": 79702, "epoch": 1897} {"train_loss": -6.066268444061279, "global_step": 79703, "epoch": 1897} {"train_loss": -6.08439826965332, "global_step": 79704, "epoch": 1897} {"train_loss": -6.083126068115234, "global_step": 79705, "epoch": 1897} {"train_loss": -6.156063079833984, "global_step": 79706, "epoch": 1897} {"train_loss": -6.163395881652832, "global_step": 79707, "epoch": 1897} {"train_loss": -6.133612632751465, "global_step": 79708, "epoch": 1897} {"train_loss": -6.2143707275390625, "global_step": 79709, "epoch": 1897} {"train_loss": -6.217560768127441, "global_step": 79710, "epoch": 1897} {"train_loss": -6.105628490447998, "global_step": 79711, "epoch": 1897} {"train_loss": -6.100715637207031, "global_step": 79712, "epoch": 1897} {"train_loss": -6.216988563537598, "global_step": 79713, "epoch": 1897} {"train_loss": -6.2780232429504395, "global_step": 79714, "epoch": 1897} {"train_loss": -6.1347605387369795, "global_step": 79715, "epoch": 1897, "val_loss": 62263.26953125} {"train_loss": -6.114768981933594, "global_step": 79716, "epoch": 1898} {"train_loss": -6.145709991455078, "global_step": 79717, "epoch": 1898} {"train_loss": -6.208623886108398, "global_step": 79718, "epoch": 1898} {"train_loss": -6.127906799316406, "global_step": 79719, "epoch": 1898} {"train_loss": -6.147871017456055, "global_step": 79720, "epoch": 1898} {"train_loss": -6.12052059173584, "global_step": 79721, "epoch": 1898} {"train_loss": -6.211154460906982, "global_step": 79722, "epoch": 1898} {"train_loss": -6.032534599304199, "global_step": 79723, "epoch": 1898} {"train_loss": -6.231813430786133, "global_step": 79724, "epoch": 1898} {"train_loss": -6.168728351593018, "global_step": 79725, "epoch": 1898} {"train_loss": -6.196916580200195, "global_step": 79726, "epoch": 1898} {"train_loss": -6.243435859680176, "global_step": 79727, "epoch": 1898} {"train_loss": -6.237642288208008, "global_step": 79728, "epoch": 1898} {"train_loss": -6.13948917388916, "global_step": 79729, "epoch": 1898} {"train_loss": -6.179172515869141, "global_step": 79730, "epoch": 1898} {"train_loss": -6.1508941650390625, "global_step": 79731, "epoch": 1898} {"train_loss": -6.188310623168945, "global_step": 79732, "epoch": 1898} {"train_loss": -6.130308151245117, "global_step": 79733, "epoch": 1898} {"train_loss": -6.156787872314453, "global_step": 79734, "epoch": 1898} {"train_loss": -6.199735641479492, "global_step": 79735, "epoch": 1898} {"train_loss": -6.069139003753662, "global_step": 79736, "epoch": 1898} {"train_loss": -6.1059250831604, "global_step": 79737, "epoch": 1898} {"train_loss": -6.092451095581055, "global_step": 79738, "epoch": 1898} {"train_loss": -6.117184162139893, "global_step": 79739, "epoch": 1898} {"train_loss": -6.107914924621582, "global_step": 79740, "epoch": 1898} {"train_loss": -6.180564880371094, "global_step": 79741, "epoch": 1898} {"train_loss": -6.029115200042725, "global_step": 79742, "epoch": 1898} {"train_loss": -6.123960018157959, "global_step": 79743, "epoch": 1898} {"train_loss": -6.089356899261475, "global_step": 79744, "epoch": 1898} {"train_loss": -6.169716835021973, "global_step": 79745, "epoch": 1898} {"train_loss": -6.1717753410339355, "global_step": 79746, "epoch": 1898} {"train_loss": -6.264554977416992, "global_step": 79747, "epoch": 1898} {"train_loss": -6.274039268493652, "global_step": 79748, "epoch": 1898} {"train_loss": -6.058921813964844, "global_step": 79749, "epoch": 1898} {"train_loss": -6.16161584854126, "global_step": 79750, "epoch": 1898} {"train_loss": -6.231513977050781, "global_step": 79751, "epoch": 1898} {"train_loss": -6.168045520782471, "global_step": 79752, "epoch": 1898} {"train_loss": -6.2390289306640625, "global_step": 79753, "epoch": 1898} {"train_loss": -6.111072063446045, "global_step": 79754, "epoch": 1898} {"train_loss": -6.107994079589844, "global_step": 79755, "epoch": 1898} {"train_loss": -6.104457855224609, "global_step": 79756, "epoch": 1898} {"train_loss": -6.154735428946359, "global_step": 79757, "epoch": 1898, "val_loss": 62203.1875} {"train_loss": -6.167210102081299, "global_step": 79758, "epoch": 1899} {"train_loss": -6.231861114501953, "global_step": 79759, "epoch": 1899} {"train_loss": -6.1218061447143555, "global_step": 79760, "epoch": 1899} {"train_loss": -5.9857072830200195, "global_step": 79761, "epoch": 1899} {"train_loss": -6.16807746887207, "global_step": 79762, "epoch": 1899} {"train_loss": -6.2584428787231445, "global_step": 79763, "epoch": 1899} {"train_loss": -6.211980819702148, "global_step": 79764, "epoch": 1899} {"train_loss": -6.208682060241699, "global_step": 79765, "epoch": 1899} {"train_loss": -6.083948135375977, "global_step": 79766, "epoch": 1899} {"train_loss": -6.156838417053223, "global_step": 79767, "epoch": 1899} {"train_loss": -6.273778915405273, "global_step": 79768, "epoch": 1899} {"train_loss": -6.190347194671631, "global_step": 79769, "epoch": 1899} {"train_loss": -6.175259590148926, "global_step": 79770, "epoch": 1899} {"train_loss": -6.044471740722656, "global_step": 79771, "epoch": 1899} {"train_loss": -6.203354358673096, "global_step": 79772, "epoch": 1899} {"train_loss": -6.143059253692627, "global_step": 79773, "epoch": 1899} {"train_loss": -6.03641414642334, "global_step": 79774, "epoch": 1899} {"train_loss": -6.119941711425781, "global_step": 79775, "epoch": 1899} {"train_loss": -6.138948440551758, "global_step": 79776, "epoch": 1899} {"train_loss": -6.249927997589111, "global_step": 79777, "epoch": 1899} {"train_loss": -6.289595603942871, "global_step": 79778, "epoch": 1899} {"train_loss": -6.204920768737793, "global_step": 79779, "epoch": 1899} {"train_loss": -6.064359664916992, "global_step": 79780, "epoch": 1899} {"train_loss": -6.211753845214844, "global_step": 79781, "epoch": 1899} {"train_loss": -6.019096851348877, "global_step": 79782, "epoch": 1899} {"train_loss": -6.122012138366699, "global_step": 79783, "epoch": 1899} {"train_loss": -6.096264362335205, "global_step": 79784, "epoch": 1899} {"train_loss": -6.056817054748535, "global_step": 79785, "epoch": 1899} {"train_loss": -6.150322914123535, "global_step": 79786, "epoch": 1899} {"train_loss": -6.1349077224731445, "global_step": 79787, "epoch": 1899} {"train_loss": -6.189404487609863, "global_step": 79788, "epoch": 1899} {"train_loss": -6.101069927215576, "global_step": 79789, "epoch": 1899} {"train_loss": -6.249124526977539, "global_step": 79790, "epoch": 1899} {"train_loss": -6.153314590454102, "global_step": 79791, "epoch": 1899} {"train_loss": -6.249037742614746, "global_step": 79792, "epoch": 1899} {"train_loss": -6.243611812591553, "global_step": 79793, "epoch": 1899} {"train_loss": -6.192093849182129, "global_step": 79794, "epoch": 1899} {"train_loss": -6.241368293762207, "global_step": 79795, "epoch": 1899} {"train_loss": -6.216664791107178, "global_step": 79796, "epoch": 1899} {"train_loss": -6.234917640686035, "global_step": 79797, "epoch": 1899} {"train_loss": -6.122648239135742, "global_step": 79798, "epoch": 1899} {"train_loss": -6.163185846237909, "global_step": 79799, "epoch": 1899, "val_loss": 62408.609375} {"train_loss": -6.141069412231445, "global_step": 79800, "epoch": 1900} {"train_loss": -6.228144645690918, "global_step": 79801, "epoch": 1900} {"train_loss": -6.173866271972656, "global_step": 79802, "epoch": 1900} {"train_loss": -6.153008937835693, "global_step": 79803, "epoch": 1900} {"train_loss": -6.219747066497803, "global_step": 79804, "epoch": 1900} {"train_loss": -6.2692461013793945, "global_step": 79805, "epoch": 1900} {"train_loss": -6.194700241088867, "global_step": 79806, "epoch": 1900} {"train_loss": -6.094871997833252, "global_step": 79807, "epoch": 1900} {"train_loss": -6.160715579986572, "global_step": 79808, "epoch": 1900} {"train_loss": -6.118890285491943, "global_step": 79809, "epoch": 1900} {"train_loss": -6.113910675048828, "global_step": 79810, "epoch": 1900} {"train_loss": -6.154482841491699, "global_step": 79811, "epoch": 1900} {"train_loss": -6.231934070587158, "global_step": 79812, "epoch": 1900} {"train_loss": -6.09752082824707, "global_step": 79813, "epoch": 1900} {"train_loss": -6.120938301086426, "global_step": 79814, "epoch": 1900} {"train_loss": -6.121910095214844, "global_step": 79815, "epoch": 1900} {"train_loss": -6.223183631896973, "global_step": 79816, "epoch": 1900} {"train_loss": -6.206428527832031, "global_step": 79817, "epoch": 1900} {"train_loss": -6.097229480743408, "global_step": 79818, "epoch": 1900} {"train_loss": -6.2298431396484375, "global_step": 79819, "epoch": 1900} {"train_loss": -6.063813209533691, "global_step": 79820, "epoch": 1900} {"train_loss": -6.05633544921875, "global_step": 79821, "epoch": 1900} {"train_loss": -6.144573211669922, "global_step": 79822, "epoch": 1900} {"train_loss": -6.109524250030518, "global_step": 79823, "epoch": 1900} {"train_loss": -6.155320167541504, "global_step": 79824, "epoch": 1900} {"train_loss": -6.128473281860352, "global_step": 79825, "epoch": 1900} {"train_loss": -6.221689224243164, "global_step": 79826, "epoch": 1900} {"train_loss": -6.119717597961426, "global_step": 79827, "epoch": 1900} {"train_loss": -6.236728668212891, "global_step": 79828, "epoch": 1900} {"train_loss": -6.076736927032471, "global_step": 79829, "epoch": 1900} {"train_loss": -6.188754558563232, "global_step": 79830, "epoch": 1900} {"train_loss": -6.253559112548828, "global_step": 79831, "epoch": 1900} {"train_loss": -6.06394100189209, "global_step": 79832, "epoch": 1900} {"train_loss": -6.123654842376709, "global_step": 79833, "epoch": 1900} {"train_loss": -6.0823211669921875, "global_step": 79834, "epoch": 1900} {"train_loss": -6.141699314117432, "global_step": 79835, "epoch": 1900} {"train_loss": -6.252071380615234, "global_step": 79836, "epoch": 1900} {"train_loss": -6.155910015106201, "global_step": 79837, "epoch": 1900} {"train_loss": -6.241249084472656, "global_step": 79838, "epoch": 1900} {"train_loss": -6.143653869628906, "global_step": 79839, "epoch": 1900} {"train_loss": -6.1173624992370605, "global_step": 79840, "epoch": 1900} {"train_loss": -6.157789593651181, "global_step": 79841, "epoch": 1900, "train/sim_max_reward_0": 0.2219532264532795, "train/sim_max_reward_1": 0.9424206327042368, "train/sim_max_reward_2": 0.9744788115937778, "train/sim_max_reward_3": 0.7863520295575042, "train/sim_max_reward_4": 0.9845684673385889, "train/sim_max_reward_5": 0.9861025591867689, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5510466326790653, "test/sim_max_reward_4300002": 0.7609762460942469, "test/sim_max_reward_4300003": 0.8572920725465737, "test/sim_max_reward_4300004": 0.33838248587035435, "test/sim_max_reward_4300005": 0.7798705540697187, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.6051011152580951, "test/sim_max_reward_4300008": 0.7671058321850669, "test/sim_max_reward_4300009": 0.9702178011697802, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.6336451473028739, "test/sim_max_reward_4300012": 0.6344040381843423, "test/sim_max_reward_4300013": 0.9362301152557791, "test/sim_max_reward_4300014": 0.8445807132985974, "test/sim_max_reward_4300015": 0.5112630317132876, "test/sim_max_reward_4300016": 0.16815810070338502, "test/sim_max_reward_4300017": 0.9619207408514552, "test/sim_max_reward_4300018": 0.8551550151711109, "test/sim_max_reward_4300019": 0.1850994362027303, "test/sim_max_reward_4300020": 0.8061104306001184, "test/sim_max_reward_4300021": 0.8182963142742462, "test/sim_max_reward_4300022": 0.8588520867986169, "test/sim_max_reward_4300023": 0.3465579913953398, "test/sim_max_reward_4300024": 0.0, "test/sim_max_reward_4300025": 0.9771861829684487, "test/sim_max_reward_4300026": 0.11947952971336823, "test/sim_max_reward_4300027": 0.9384026201087816, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.5797459210582071, "test/sim_max_reward_4300030": 0.3300228767166406, "test/sim_max_reward_4300031": 0.7761825394787258, "test/sim_max_reward_4300032": 0.9032123211334917, "test/sim_max_reward_4300033": 0.9674798946144377, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.2514591665023441, "test/sim_max_reward_4300036": 0.20072761425821564, "test/sim_max_reward_4300037": 0.6972079204280217, "test/sim_max_reward_4300038": 0.870814740615877, "test/sim_max_reward_4300039": 0.3922057295140946, "test/sim_max_reward_4300040": 0.34347145503406085, "test/sim_max_reward_4300041": 1.0, "test/sim_max_reward_4300042": 0.7266474171327076, "test/sim_max_reward_4300043": 0.13594594639644067, "test/sim_max_reward_4300044": 0.7029441377445277, "test/sim_max_reward_4300045": 0.49890461648473333, "test/sim_max_reward_4300046": 0.29500058472820795, "test/sim_max_reward_4300047": 0.12308685404527007, "test/sim_max_reward_4300048": 0.8978941144916989, "test/sim_max_reward_4300049": 0.1131726950866236, "train/mean_score": 0.8159792878056927, "test/mean_score": 0.5406292155975941, "val_loss": 62095.08203125} {"train_loss": -6.070455551147461, "global_step": 79842, "epoch": 1901} {"train_loss": -6.1641950607299805, "global_step": 79843, "epoch": 1901} {"train_loss": -6.149798393249512, "global_step": 79844, "epoch": 1901} {"train_loss": -6.247779846191406, "global_step": 79845, "epoch": 1901} {"train_loss": -6.179660320281982, "global_step": 79846, "epoch": 1901} {"train_loss": -6.124917030334473, "global_step": 79847, "epoch": 1901} {"train_loss": -6.111227989196777, "global_step": 79848, "epoch": 1901} {"train_loss": -6.112790107727051, "global_step": 79849, "epoch": 1901} {"train_loss": -6.131424427032471, "global_step": 79850, "epoch": 1901} {"train_loss": -6.182826042175293, "global_step": 79851, "epoch": 1901} {"train_loss": -6.075255870819092, "global_step": 79852, "epoch": 1901} {"train_loss": -6.199997901916504, "global_step": 79853, "epoch": 1901} {"train_loss": -6.11809778213501, "global_step": 79854, "epoch": 1901} {"train_loss": -6.159470081329346, "global_step": 79855, "epoch": 1901} {"train_loss": -6.069817543029785, "global_step": 79856, "epoch": 1901} {"train_loss": -6.208887577056885, "global_step": 79857, "epoch": 1901} {"train_loss": -6.141050338745117, "global_step": 79858, "epoch": 1901} {"train_loss": -6.175989627838135, "global_step": 79859, "epoch": 1901} {"train_loss": -6.219343662261963, "global_step": 79860, "epoch": 1901} {"train_loss": -6.0576958656311035, "global_step": 79861, "epoch": 1901} {"train_loss": -6.2484211921691895, "global_step": 79862, "epoch": 1901} {"train_loss": -6.189306735992432, "global_step": 79863, "epoch": 1901} {"train_loss": -6.156773567199707, "global_step": 79864, "epoch": 1901} {"train_loss": -6.197248458862305, "global_step": 79865, "epoch": 1901} {"train_loss": -6.137862205505371, "global_step": 79866, "epoch": 1901} {"train_loss": -6.208728313446045, "global_step": 79867, "epoch": 1901} {"train_loss": -6.288676738739014, "global_step": 79868, "epoch": 1901} {"train_loss": -6.222773551940918, "global_step": 79869, "epoch": 1901} {"train_loss": -6.217961311340332, "global_step": 79870, "epoch": 1901} {"train_loss": -6.151090621948242, "global_step": 79871, "epoch": 1901} {"train_loss": -6.229426860809326, "global_step": 79872, "epoch": 1901} {"train_loss": -6.14238166809082, "global_step": 79873, "epoch": 1901} {"train_loss": -6.031576633453369, "global_step": 79874, "epoch": 1901} {"train_loss": -6.13741397857666, "global_step": 79875, "epoch": 1901} {"train_loss": -6.199655055999756, "global_step": 79876, "epoch": 1901} {"train_loss": -6.167973518371582, "global_step": 79877, "epoch": 1901} {"train_loss": -6.15163516998291, "global_step": 79878, "epoch": 1901} {"train_loss": -6.1534104347229, "global_step": 79879, "epoch": 1901} {"train_loss": -6.209743022918701, "global_step": 79880, "epoch": 1901} {"train_loss": -6.168554306030273, "global_step": 79881, "epoch": 1901} {"train_loss": -6.2605743408203125, "global_step": 79882, "epoch": 1901} {"train_loss": -6.163418996901739, "global_step": 79883, "epoch": 1901, "val_loss": 62233.90625} {"train_loss": -6.239353179931641, "global_step": 79884, "epoch": 1902} {"train_loss": -6.165889263153076, "global_step": 79885, "epoch": 1902} {"train_loss": -6.147751808166504, "global_step": 79886, "epoch": 1902} {"train_loss": -6.149508476257324, "global_step": 79887, "epoch": 1902} {"train_loss": -5.931215763092041, "global_step": 79888, "epoch": 1902} {"train_loss": -5.9499406814575195, "global_step": 79889, "epoch": 1902} {"train_loss": -6.130486011505127, "global_step": 79890, "epoch": 1902} {"train_loss": -6.085792541503906, "global_step": 79891, "epoch": 1902} {"train_loss": -6.055292129516602, "global_step": 79892, "epoch": 1902} {"train_loss": -6.14244270324707, "global_step": 79893, "epoch": 1902} {"train_loss": -5.988211631774902, "global_step": 79894, "epoch": 1902} {"train_loss": -6.033984184265137, "global_step": 79895, "epoch": 1902} {"train_loss": -6.047264099121094, "global_step": 79896, "epoch": 1902} {"train_loss": -6.057805061340332, "global_step": 79897, "epoch": 1902} {"train_loss": -6.090642929077148, "global_step": 79898, "epoch": 1902} {"train_loss": -6.141609191894531, "global_step": 79899, "epoch": 1902} {"train_loss": -6.1808061599731445, "global_step": 79900, "epoch": 1902} {"train_loss": -6.16454553604126, "global_step": 79901, "epoch": 1902} {"train_loss": -6.235598564147949, "global_step": 79902, "epoch": 1902} {"train_loss": -6.1262736320495605, "global_step": 79903, "epoch": 1902} {"train_loss": -6.112351894378662, "global_step": 79904, "epoch": 1902} {"train_loss": -6.124615669250488, "global_step": 79905, "epoch": 1902} {"train_loss": -6.123204231262207, "global_step": 79906, "epoch": 1902} {"train_loss": -6.092397689819336, "global_step": 79907, "epoch": 1902} {"train_loss": -6.178189277648926, "global_step": 79908, "epoch": 1902} {"train_loss": -6.14984130859375, "global_step": 79909, "epoch": 1902} {"train_loss": -6.154754638671875, "global_step": 79910, "epoch": 1902} {"train_loss": -6.211206436157227, "global_step": 79911, "epoch": 1902} {"train_loss": -6.015374183654785, "global_step": 79912, "epoch": 1902} {"train_loss": -6.162407398223877, "global_step": 79913, "epoch": 1902} {"train_loss": -6.151376724243164, "global_step": 79914, "epoch": 1902} {"train_loss": -6.114885330200195, "global_step": 79915, "epoch": 1902} {"train_loss": -6.147741794586182, "global_step": 79916, "epoch": 1902} {"train_loss": -6.080440521240234, "global_step": 79917, "epoch": 1902} {"train_loss": -6.026174545288086, "global_step": 79918, "epoch": 1902} {"train_loss": -6.241778373718262, "global_step": 79919, "epoch": 1902} {"train_loss": -6.230739593505859, "global_step": 79920, "epoch": 1902} {"train_loss": -6.0219526290893555, "global_step": 79921, "epoch": 1902} {"train_loss": -6.224186897277832, "global_step": 79922, "epoch": 1902} {"train_loss": -6.180206298828125, "global_step": 79923, "epoch": 1902} {"train_loss": -6.107611656188965, "global_step": 79924, "epoch": 1902} {"train_loss": -6.120790402094523, "global_step": 79925, "epoch": 1902, "val_loss": 62223.13671875} {"train_loss": -6.061874866485596, "global_step": 79926, "epoch": 1903} {"train_loss": -6.160140037536621, "global_step": 79927, "epoch": 1903} {"train_loss": -5.987787246704102, "global_step": 79928, "epoch": 1903} {"train_loss": -6.095509052276611, "global_step": 79929, "epoch": 1903} {"train_loss": -6.198715686798096, "global_step": 79930, "epoch": 1903} {"train_loss": -6.118496417999268, "global_step": 79931, "epoch": 1903} {"train_loss": -6.021301746368408, "global_step": 79932, "epoch": 1903} {"train_loss": -6.134089469909668, "global_step": 79933, "epoch": 1903} {"train_loss": -6.169084548950195, "global_step": 79934, "epoch": 1903} {"train_loss": -6.109734058380127, "global_step": 79935, "epoch": 1903} {"train_loss": -6.2316389083862305, "global_step": 79936, "epoch": 1903} {"train_loss": -6.042941093444824, "global_step": 79937, "epoch": 1903} {"train_loss": -6.004232406616211, "global_step": 79938, "epoch": 1903} {"train_loss": -6.120659828186035, "global_step": 79939, "epoch": 1903} {"train_loss": -6.162148952484131, "global_step": 79940, "epoch": 1903} {"train_loss": -5.996675968170166, "global_step": 79941, "epoch": 1903} {"train_loss": -6.051284313201904, "global_step": 79942, "epoch": 1903} {"train_loss": -6.071140289306641, "global_step": 79943, "epoch": 1903} {"train_loss": -6.2311296463012695, "global_step": 79944, "epoch": 1903} {"train_loss": -6.2365875244140625, "global_step": 79945, "epoch": 1903} {"train_loss": -6.164615631103516, "global_step": 79946, "epoch": 1903} {"train_loss": -6.208227157592773, "global_step": 79947, "epoch": 1903} {"train_loss": -6.14085578918457, "global_step": 79948, "epoch": 1903} {"train_loss": -6.090723514556885, "global_step": 79949, "epoch": 1903} {"train_loss": -6.132355213165283, "global_step": 79950, "epoch": 1903} {"train_loss": -6.037306785583496, "global_step": 79951, "epoch": 1903} {"train_loss": -6.001859188079834, "global_step": 79952, "epoch": 1903} {"train_loss": -6.277285575866699, "global_step": 79953, "epoch": 1903} {"train_loss": -6.199487686157227, "global_step": 79954, "epoch": 1903} {"train_loss": -6.141635417938232, "global_step": 79955, "epoch": 1903} {"train_loss": -6.24571418762207, "global_step": 79956, "epoch": 1903} {"train_loss": -6.052098274230957, "global_step": 79957, "epoch": 1903} {"train_loss": -6.054862022399902, "global_step": 79958, "epoch": 1903} {"train_loss": -6.245636940002441, "global_step": 79959, "epoch": 1903} {"train_loss": -6.146575927734375, "global_step": 79960, "epoch": 1903} {"train_loss": -6.010035514831543, "global_step": 79961, "epoch": 1903} {"train_loss": -6.242334365844727, "global_step": 79962, "epoch": 1903} {"train_loss": -6.131704330444336, "global_step": 79963, "epoch": 1903} {"train_loss": -6.129524230957031, "global_step": 79964, "epoch": 1903} {"train_loss": -6.219904899597168, "global_step": 79965, "epoch": 1903} {"train_loss": -6.127847671508789, "global_step": 79966, "epoch": 1903} {"train_loss": -6.125738825116839, "global_step": 79967, "epoch": 1903, "val_loss": 62421.09375} {"train_loss": -6.096685409545898, "global_step": 79968, "epoch": 1904} {"train_loss": -6.08137321472168, "global_step": 79969, "epoch": 1904} {"train_loss": -6.123230934143066, "global_step": 79970, "epoch": 1904} {"train_loss": -6.042595863342285, "global_step": 79971, "epoch": 1904} {"train_loss": -6.093733787536621, "global_step": 79972, "epoch": 1904} {"train_loss": -6.056634426116943, "global_step": 79973, "epoch": 1904} {"train_loss": -6.127346515655518, "global_step": 79974, "epoch": 1904} {"train_loss": -6.106917381286621, "global_step": 79975, "epoch": 1904} {"train_loss": -6.174794673919678, "global_step": 79976, "epoch": 1904} {"train_loss": -6.146546840667725, "global_step": 79977, "epoch": 1904} {"train_loss": -6.179231643676758, "global_step": 79978, "epoch": 1904} {"train_loss": -6.149162769317627, "global_step": 79979, "epoch": 1904} {"train_loss": -6.086061000823975, "global_step": 79980, "epoch": 1904} {"train_loss": -6.1041460037231445, "global_step": 79981, "epoch": 1904} {"train_loss": -6.054966449737549, "global_step": 79982, "epoch": 1904} {"train_loss": -6.003871917724609, "global_step": 79983, "epoch": 1904} {"train_loss": -6.157636642456055, "global_step": 79984, "epoch": 1904} {"train_loss": -6.187097072601318, "global_step": 79985, "epoch": 1904} {"train_loss": -6.123891830444336, "global_step": 79986, "epoch": 1904} {"train_loss": -6.17009973526001, "global_step": 79987, "epoch": 1904} {"train_loss": -6.078685760498047, "global_step": 79988, "epoch": 1904} {"train_loss": -6.242264747619629, "global_step": 79989, "epoch": 1904} {"train_loss": -6.1859636306762695, "global_step": 79990, "epoch": 1904} {"train_loss": -6.214786529541016, "global_step": 79991, "epoch": 1904} {"train_loss": -6.203218460083008, "global_step": 79992, "epoch": 1904} {"train_loss": -6.143526077270508, "global_step": 79993, "epoch": 1904} {"train_loss": -6.078485488891602, "global_step": 79994, "epoch": 1904} {"train_loss": -6.0398335456848145, "global_step": 79995, "epoch": 1904} {"train_loss": -6.153894901275635, "global_step": 79996, "epoch": 1904} {"train_loss": -6.135165691375732, "global_step": 79997, "epoch": 1904} {"train_loss": -6.06127405166626, "global_step": 79998, "epoch": 1904} {"train_loss": -6.120240688323975, "global_step": 79999, "epoch": 1904} {"train_loss": -6.16990852355957, "global_step": 80000, "epoch": 1904} {"train_loss": -6.171419143676758, "global_step": 80001, "epoch": 1904} {"train_loss": -6.059854507446289, "global_step": 80002, "epoch": 1904} {"train_loss": -6.209011554718018, "global_step": 80003, "epoch": 1904} {"train_loss": -6.082090854644775, "global_step": 80004, "epoch": 1904} {"train_loss": -6.084446430206299, "global_step": 80005, "epoch": 1904} {"train_loss": -6.204323768615723, "global_step": 80006, "epoch": 1904} {"train_loss": -6.2101922035217285, "global_step": 80007, "epoch": 1904} {"train_loss": -6.107259273529053, "global_step": 80008, "epoch": 1904} {"train_loss": -6.128137168430147, "global_step": 80009, "epoch": 1904, "val_loss": 62184.05078125} {"train_loss": -6.129242420196533, "global_step": 80010, "epoch": 1905} {"train_loss": -6.110290050506592, "global_step": 80011, "epoch": 1905} {"train_loss": -6.222463607788086, "global_step": 80012, "epoch": 1905} {"train_loss": -6.134336948394775, "global_step": 80013, "epoch": 1905} {"train_loss": -6.082406997680664, "global_step": 80014, "epoch": 1905} {"train_loss": -6.185107231140137, "global_step": 80015, "epoch": 1905} {"train_loss": -6.133222579956055, "global_step": 80016, "epoch": 1905} {"train_loss": -6.192095756530762, "global_step": 80017, "epoch": 1905} {"train_loss": -6.080453872680664, "global_step": 80018, "epoch": 1905} {"train_loss": -6.1873674392700195, "global_step": 80019, "epoch": 1905} {"train_loss": -6.117005348205566, "global_step": 80020, "epoch": 1905} {"train_loss": -6.072346210479736, "global_step": 80021, "epoch": 1905} {"train_loss": -6.190800666809082, "global_step": 80022, "epoch": 1905} {"train_loss": -6.163536071777344, "global_step": 80023, "epoch": 1905} {"train_loss": -6.234647750854492, "global_step": 80024, "epoch": 1905} {"train_loss": -6.096066951751709, "global_step": 80025, "epoch": 1905} {"train_loss": -6.210201263427734, "global_step": 80026, "epoch": 1905} {"train_loss": -6.146414756774902, "global_step": 80027, "epoch": 1905} {"train_loss": -6.125237464904785, "global_step": 80028, "epoch": 1905} {"train_loss": -6.155233383178711, "global_step": 80029, "epoch": 1905} {"train_loss": -6.099028587341309, "global_step": 80030, "epoch": 1905} {"train_loss": -6.205615520477295, "global_step": 80031, "epoch": 1905} {"train_loss": -6.149385452270508, "global_step": 80032, "epoch": 1905} {"train_loss": -6.122705936431885, "global_step": 80033, "epoch": 1905} {"train_loss": -6.095728874206543, "global_step": 80034, "epoch": 1905} {"train_loss": -6.111350059509277, "global_step": 80035, "epoch": 1905} {"train_loss": -6.136162757873535, "global_step": 80036, "epoch": 1905} {"train_loss": -6.11962890625, "global_step": 80037, "epoch": 1905} {"train_loss": -6.154191493988037, "global_step": 80038, "epoch": 1905} {"train_loss": -5.847843170166016, "global_step": 80039, "epoch": 1905} {"train_loss": -6.029707431793213, "global_step": 80040, "epoch": 1905} {"train_loss": -6.105114936828613, "global_step": 80041, "epoch": 1905} {"train_loss": -6.0071492195129395, "global_step": 80042, "epoch": 1905} {"train_loss": -6.273852348327637, "global_step": 80043, "epoch": 1905} {"train_loss": -5.932355880737305, "global_step": 80044, "epoch": 1905} {"train_loss": -6.028781890869141, "global_step": 80045, "epoch": 1905} {"train_loss": -6.0774245262146, "global_step": 80046, "epoch": 1905} {"train_loss": -6.007648468017578, "global_step": 80047, "epoch": 1905} {"train_loss": -6.277591228485107, "global_step": 80048, "epoch": 1905} {"train_loss": -6.043055534362793, "global_step": 80049, "epoch": 1905} {"train_loss": -6.153014183044434, "global_step": 80050, "epoch": 1905} {"train_loss": -6.1202690941946845, "global_step": 80051, "epoch": 1905, "val_loss": 62740.6640625} {"train_loss": -6.005422592163086, "global_step": 80052, "epoch": 1906} {"train_loss": -6.2200846672058105, "global_step": 80053, "epoch": 1906} {"train_loss": -6.110415458679199, "global_step": 80054, "epoch": 1906} {"train_loss": -6.213611602783203, "global_step": 80055, "epoch": 1906} {"train_loss": -6.140201568603516, "global_step": 80056, "epoch": 1906} {"train_loss": -6.210623741149902, "global_step": 80057, "epoch": 1906} {"train_loss": -6.189686298370361, "global_step": 80058, "epoch": 1906} {"train_loss": -6.183816909790039, "global_step": 80059, "epoch": 1906} {"train_loss": -6.224614143371582, "global_step": 80060, "epoch": 1906} {"train_loss": -6.124128818511963, "global_step": 80061, "epoch": 1906} {"train_loss": -6.108739376068115, "global_step": 80062, "epoch": 1906} {"train_loss": -6.143824577331543, "global_step": 80063, "epoch": 1906} {"train_loss": -6.2657575607299805, "global_step": 80064, "epoch": 1906} {"train_loss": -6.078152656555176, "global_step": 80065, "epoch": 1906} {"train_loss": -6.206844329833984, "global_step": 80066, "epoch": 1906} {"train_loss": -6.179469108581543, "global_step": 80067, "epoch": 1906} {"train_loss": -6.121983528137207, "global_step": 80068, "epoch": 1906} {"train_loss": -6.054201126098633, "global_step": 80069, "epoch": 1906} {"train_loss": -6.116924285888672, "global_step": 80070, "epoch": 1906} {"train_loss": -6.104240417480469, "global_step": 80071, "epoch": 1906} {"train_loss": -6.295156955718994, "global_step": 80072, "epoch": 1906} {"train_loss": -6.089678764343262, "global_step": 80073, "epoch": 1906} {"train_loss": -5.995296955108643, "global_step": 80074, "epoch": 1906} {"train_loss": -6.158543586730957, "global_step": 80075, "epoch": 1906} {"train_loss": -6.073945999145508, "global_step": 80076, "epoch": 1906} {"train_loss": -6.172019958496094, "global_step": 80077, "epoch": 1906} {"train_loss": -6.046069145202637, "global_step": 80078, "epoch": 1906} {"train_loss": -6.122272968292236, "global_step": 80079, "epoch": 1906} {"train_loss": -6.1880269050598145, "global_step": 80080, "epoch": 1906} {"train_loss": -6.165705680847168, "global_step": 80081, "epoch": 1906} {"train_loss": -6.187773704528809, "global_step": 80082, "epoch": 1906} {"train_loss": -6.097830772399902, "global_step": 80083, "epoch": 1906} {"train_loss": -6.1444902420043945, "global_step": 80084, "epoch": 1906} {"train_loss": -6.129852294921875, "global_step": 80085, "epoch": 1906} {"train_loss": -6.122106552124023, "global_step": 80086, "epoch": 1906} {"train_loss": -6.179905414581299, "global_step": 80087, "epoch": 1906} {"train_loss": -6.109593391418457, "global_step": 80088, "epoch": 1906} {"train_loss": -6.207797050476074, "global_step": 80089, "epoch": 1906} {"train_loss": -6.190114498138428, "global_step": 80090, "epoch": 1906} {"train_loss": -6.107959747314453, "global_step": 80091, "epoch": 1906} {"train_loss": -6.209022045135498, "global_step": 80092, "epoch": 1906} {"train_loss": -6.145924556823004, "global_step": 80093, "epoch": 1906, "val_loss": 62574.84375} {"train_loss": -6.2652082443237305, "global_step": 80094, "epoch": 1907} {"train_loss": -6.193559169769287, "global_step": 80095, "epoch": 1907} {"train_loss": -6.325604438781738, "global_step": 80096, "epoch": 1907} {"train_loss": -6.1171393394470215, "global_step": 80097, "epoch": 1907} {"train_loss": -6.256384372711182, "global_step": 80098, "epoch": 1907} {"train_loss": -6.1495795249938965, "global_step": 80099, "epoch": 1907} {"train_loss": -6.149553298950195, "global_step": 80100, "epoch": 1907} {"train_loss": -6.170681953430176, "global_step": 80101, "epoch": 1907} {"train_loss": -6.167193412780762, "global_step": 80102, "epoch": 1907} {"train_loss": -6.147038459777832, "global_step": 80103, "epoch": 1907} {"train_loss": -6.17926025390625, "global_step": 80104, "epoch": 1907} {"train_loss": -6.171835899353027, "global_step": 80105, "epoch": 1907} {"train_loss": -6.194503307342529, "global_step": 80106, "epoch": 1907} {"train_loss": -6.1920247077941895, "global_step": 80107, "epoch": 1907} {"train_loss": -6.095772743225098, "global_step": 80108, "epoch": 1907} {"train_loss": -6.155716896057129, "global_step": 80109, "epoch": 1907} {"train_loss": -6.086074352264404, "global_step": 80110, "epoch": 1907} {"train_loss": -6.155294418334961, "global_step": 80111, "epoch": 1907} {"train_loss": -6.064912796020508, "global_step": 80112, "epoch": 1907} {"train_loss": -6.16603946685791, "global_step": 80113, "epoch": 1907} {"train_loss": -6.245525360107422, "global_step": 80114, "epoch": 1907} {"train_loss": -6.080662250518799, "global_step": 80115, "epoch": 1907} {"train_loss": -6.081880569458008, "global_step": 80116, "epoch": 1907} {"train_loss": -6.178954124450684, "global_step": 80117, "epoch": 1907} {"train_loss": -6.05137825012207, "global_step": 80118, "epoch": 1907} {"train_loss": -6.123068809509277, "global_step": 80119, "epoch": 1907} {"train_loss": -6.163791179656982, "global_step": 80120, "epoch": 1907} {"train_loss": -6.166473388671875, "global_step": 80121, "epoch": 1907} {"train_loss": -6.147304058074951, "global_step": 80122, "epoch": 1907} {"train_loss": -6.214538097381592, "global_step": 80123, "epoch": 1907} {"train_loss": -6.233339786529541, "global_step": 80124, "epoch": 1907} {"train_loss": -6.2385406494140625, "global_step": 80125, "epoch": 1907} {"train_loss": -6.079051971435547, "global_step": 80126, "epoch": 1907} {"train_loss": -6.124320030212402, "global_step": 80127, "epoch": 1907} {"train_loss": -6.128404140472412, "global_step": 80128, "epoch": 1907} {"train_loss": -6.087873458862305, "global_step": 80129, "epoch": 1907} {"train_loss": -6.163443565368652, "global_step": 80130, "epoch": 1907} {"train_loss": -6.106392860412598, "global_step": 80131, "epoch": 1907} {"train_loss": -6.2009663581848145, "global_step": 80132, "epoch": 1907} {"train_loss": -6.14932918548584, "global_step": 80133, "epoch": 1907} {"train_loss": -6.182123184204102, "global_step": 80134, "epoch": 1907} {"train_loss": -6.159434307189215, "global_step": 80135, "epoch": 1907, "val_loss": 62366.38671875} {"train_loss": -6.217812538146973, "global_step": 80136, "epoch": 1908} {"train_loss": -6.176290512084961, "global_step": 80137, "epoch": 1908} {"train_loss": -6.248526573181152, "global_step": 80138, "epoch": 1908} {"train_loss": -6.147490501403809, "global_step": 80139, "epoch": 1908} {"train_loss": -6.101572036743164, "global_step": 80140, "epoch": 1908} {"train_loss": -6.165687084197998, "global_step": 80141, "epoch": 1908} {"train_loss": -6.065007209777832, "global_step": 80142, "epoch": 1908} {"train_loss": -6.107148170471191, "global_step": 80143, "epoch": 1908} {"train_loss": -6.104861259460449, "global_step": 80144, "epoch": 1908} {"train_loss": -6.239738464355469, "global_step": 80145, "epoch": 1908} {"train_loss": -6.248619556427002, "global_step": 80146, "epoch": 1908} {"train_loss": -6.176604270935059, "global_step": 80147, "epoch": 1908} {"train_loss": -6.184146881103516, "global_step": 80148, "epoch": 1908} {"train_loss": -6.119877815246582, "global_step": 80149, "epoch": 1908} {"train_loss": -6.002051830291748, "global_step": 80150, "epoch": 1908} {"train_loss": -6.19286584854126, "global_step": 80151, "epoch": 1908} {"train_loss": -6.299919605255127, "global_step": 80152, "epoch": 1908} {"train_loss": -6.188078880310059, "global_step": 80153, "epoch": 1908} {"train_loss": -6.128544807434082, "global_step": 80154, "epoch": 1908} {"train_loss": -6.121594429016113, "global_step": 80155, "epoch": 1908} {"train_loss": -6.1377668380737305, "global_step": 80156, "epoch": 1908} {"train_loss": -6.2568206787109375, "global_step": 80157, "epoch": 1908} {"train_loss": -6.131416320800781, "global_step": 80158, "epoch": 1908} {"train_loss": -6.1411895751953125, "global_step": 80159, "epoch": 1908} {"train_loss": -6.112156391143799, "global_step": 80160, "epoch": 1908} {"train_loss": -6.157292366027832, "global_step": 80161, "epoch": 1908} {"train_loss": -6.108220100402832, "global_step": 80162, "epoch": 1908} {"train_loss": -6.125581741333008, "global_step": 80163, "epoch": 1908} {"train_loss": -6.171103477478027, "global_step": 80164, "epoch": 1908} {"train_loss": -6.224871635437012, "global_step": 80165, "epoch": 1908} {"train_loss": -6.104840278625488, "global_step": 80166, "epoch": 1908} {"train_loss": -6.186877250671387, "global_step": 80167, "epoch": 1908} {"train_loss": -6.114508628845215, "global_step": 80168, "epoch": 1908} {"train_loss": -6.181787014007568, "global_step": 80169, "epoch": 1908} {"train_loss": -6.136449337005615, "global_step": 80170, "epoch": 1908} {"train_loss": -6.248046875, "global_step": 80171, "epoch": 1908} {"train_loss": -6.143842697143555, "global_step": 80172, "epoch": 1908} {"train_loss": -6.262335777282715, "global_step": 80173, "epoch": 1908} {"train_loss": -6.135287761688232, "global_step": 80174, "epoch": 1908} {"train_loss": -6.15402364730835, "global_step": 80175, "epoch": 1908} {"train_loss": -6.115087985992432, "global_step": 80176, "epoch": 1908} {"train_loss": -6.160762162435622, "global_step": 80177, "epoch": 1908, "val_loss": 62462.46875} {"train_loss": -6.094032287597656, "global_step": 80178, "epoch": 1909} {"train_loss": -6.247915267944336, "global_step": 80179, "epoch": 1909} {"train_loss": -6.206911087036133, "global_step": 80180, "epoch": 1909} {"train_loss": -6.111619472503662, "global_step": 80181, "epoch": 1909} {"train_loss": -6.224221706390381, "global_step": 80182, "epoch": 1909} {"train_loss": -6.091304302215576, "global_step": 80183, "epoch": 1909} {"train_loss": -6.160172939300537, "global_step": 80184, "epoch": 1909} {"train_loss": -6.0818376541137695, "global_step": 80185, "epoch": 1909} {"train_loss": -6.085120677947998, "global_step": 80186, "epoch": 1909} {"train_loss": -6.137361526489258, "global_step": 80187, "epoch": 1909} {"train_loss": -6.152055740356445, "global_step": 80188, "epoch": 1909} {"train_loss": -6.126161575317383, "global_step": 80189, "epoch": 1909} {"train_loss": -6.191851615905762, "global_step": 80190, "epoch": 1909} {"train_loss": -6.215775489807129, "global_step": 80191, "epoch": 1909} {"train_loss": -5.976691722869873, "global_step": 80192, "epoch": 1909} {"train_loss": -6.153977870941162, "global_step": 80193, "epoch": 1909} {"train_loss": -6.330283164978027, "global_step": 80194, "epoch": 1909} {"train_loss": -6.146681785583496, "global_step": 80195, "epoch": 1909} {"train_loss": -6.186548233032227, "global_step": 80196, "epoch": 1909} {"train_loss": -6.106070518493652, "global_step": 80197, "epoch": 1909} {"train_loss": -6.077154159545898, "global_step": 80198, "epoch": 1909} {"train_loss": -6.141644477844238, "global_step": 80199, "epoch": 1909} {"train_loss": -6.2263946533203125, "global_step": 80200, "epoch": 1909} {"train_loss": -6.068728923797607, "global_step": 80201, "epoch": 1909} {"train_loss": -6.081707954406738, "global_step": 80202, "epoch": 1909} {"train_loss": -6.13712215423584, "global_step": 80203, "epoch": 1909} {"train_loss": -6.125615119934082, "global_step": 80204, "epoch": 1909} {"train_loss": -6.154677867889404, "global_step": 80205, "epoch": 1909} {"train_loss": -6.24839973449707, "global_step": 80206, "epoch": 1909} {"train_loss": -6.142094135284424, "global_step": 80207, "epoch": 1909} {"train_loss": -6.060408115386963, "global_step": 80208, "epoch": 1909} {"train_loss": -6.144193172454834, "global_step": 80209, "epoch": 1909} {"train_loss": -6.091347694396973, "global_step": 80210, "epoch": 1909} {"train_loss": -6.146252632141113, "global_step": 80211, "epoch": 1909} {"train_loss": -6.210984230041504, "global_step": 80212, "epoch": 1909} {"train_loss": -6.075096607208252, "global_step": 80213, "epoch": 1909} {"train_loss": -6.224279880523682, "global_step": 80214, "epoch": 1909} {"train_loss": -6.103287220001221, "global_step": 80215, "epoch": 1909} {"train_loss": -6.051178455352783, "global_step": 80216, "epoch": 1909} {"train_loss": -6.153043746948242, "global_step": 80217, "epoch": 1909} {"train_loss": -6.119631767272949, "global_step": 80218, "epoch": 1909} {"train_loss": -6.14339448156811, "global_step": 80219, "epoch": 1909, "val_loss": 62148.34765625} {"train_loss": -6.2404398918151855, "global_step": 80220, "epoch": 1910} {"train_loss": -6.179408550262451, "global_step": 80221, "epoch": 1910} {"train_loss": -6.206657409667969, "global_step": 80222, "epoch": 1910} {"train_loss": -6.255227565765381, "global_step": 80223, "epoch": 1910} {"train_loss": -6.18366003036499, "global_step": 80224, "epoch": 1910} {"train_loss": -6.155550003051758, "global_step": 80225, "epoch": 1910} {"train_loss": -6.106694221496582, "global_step": 80226, "epoch": 1910} {"train_loss": -6.143365859985352, "global_step": 80227, "epoch": 1910} {"train_loss": -6.102023124694824, "global_step": 80228, "epoch": 1910} {"train_loss": -6.270207405090332, "global_step": 80229, "epoch": 1910} {"train_loss": -6.146671295166016, "global_step": 80230, "epoch": 1910} {"train_loss": -6.090463638305664, "global_step": 80231, "epoch": 1910} {"train_loss": -6.2124857902526855, "global_step": 80232, "epoch": 1910} {"train_loss": -6.140957832336426, "global_step": 80233, "epoch": 1910} {"train_loss": -6.247755527496338, "global_step": 80234, "epoch": 1910} {"train_loss": -6.116469383239746, "global_step": 80235, "epoch": 1910} {"train_loss": -6.108960151672363, "global_step": 80236, "epoch": 1910} {"train_loss": -6.117465496063232, "global_step": 80237, "epoch": 1910} {"train_loss": -6.074499130249023, "global_step": 80238, "epoch": 1910} {"train_loss": -6.164253234863281, "global_step": 80239, "epoch": 1910} {"train_loss": -6.062393665313721, "global_step": 80240, "epoch": 1910} {"train_loss": -6.05792236328125, "global_step": 80241, "epoch": 1910} {"train_loss": -6.176326751708984, "global_step": 80242, "epoch": 1910} {"train_loss": -5.945943832397461, "global_step": 80243, "epoch": 1910} {"train_loss": -6.181297302246094, "global_step": 80244, "epoch": 1910} {"train_loss": -6.132491588592529, "global_step": 80245, "epoch": 1910} {"train_loss": -5.859947204589844, "global_step": 80246, "epoch": 1910} {"train_loss": -6.164637565612793, "global_step": 80247, "epoch": 1910} {"train_loss": -6.169823169708252, "global_step": 80248, "epoch": 1910} {"train_loss": -5.927321434020996, "global_step": 80249, "epoch": 1910} {"train_loss": -6.097026348114014, "global_step": 80250, "epoch": 1910} {"train_loss": -5.929325103759766, "global_step": 80251, "epoch": 1910} {"train_loss": -6.10420036315918, "global_step": 80252, "epoch": 1910} {"train_loss": -6.059727668762207, "global_step": 80253, "epoch": 1910} {"train_loss": -5.931244850158691, "global_step": 80254, "epoch": 1910} {"train_loss": -6.204379081726074, "global_step": 80255, "epoch": 1910} {"train_loss": -5.949934959411621, "global_step": 80256, "epoch": 1910} {"train_loss": -6.192410945892334, "global_step": 80257, "epoch": 1910} {"train_loss": -5.988593101501465, "global_step": 80258, "epoch": 1910} {"train_loss": -6.133599281311035, "global_step": 80259, "epoch": 1910} {"train_loss": -6.098247528076172, "global_step": 80260, "epoch": 1910} {"train_loss": -6.112164406549363, "global_step": 80261, "epoch": 1910, "val_loss": 62529.7265625} {"train_loss": -6.197510719299316, "global_step": 80262, "epoch": 1911} {"train_loss": -5.990509033203125, "global_step": 80263, "epoch": 1911} {"train_loss": -6.032262325286865, "global_step": 80264, "epoch": 1911} {"train_loss": -6.099851131439209, "global_step": 80265, "epoch": 1911} {"train_loss": -6.141768455505371, "global_step": 80266, "epoch": 1911} {"train_loss": -6.113217830657959, "global_step": 80267, "epoch": 1911} {"train_loss": -6.222221374511719, "global_step": 80268, "epoch": 1911} {"train_loss": -6.217223167419434, "global_step": 80269, "epoch": 1911} {"train_loss": -6.082494735717773, "global_step": 80270, "epoch": 1911} {"train_loss": -6.156250953674316, "global_step": 80271, "epoch": 1911} {"train_loss": -6.18472957611084, "global_step": 80272, "epoch": 1911} {"train_loss": -6.053993225097656, "global_step": 80273, "epoch": 1911} {"train_loss": -6.095709323883057, "global_step": 80274, "epoch": 1911} {"train_loss": -6.205641746520996, "global_step": 80275, "epoch": 1911} {"train_loss": -6.158585071563721, "global_step": 80276, "epoch": 1911} {"train_loss": -6.101949691772461, "global_step": 80277, "epoch": 1911} {"train_loss": -6.150511741638184, "global_step": 80278, "epoch": 1911} {"train_loss": -6.197648525238037, "global_step": 80279, "epoch": 1911} {"train_loss": -6.087762832641602, "global_step": 80280, "epoch": 1911} {"train_loss": -6.189536094665527, "global_step": 80281, "epoch": 1911} {"train_loss": -6.090075969696045, "global_step": 80282, "epoch": 1911} {"train_loss": -6.184123992919922, "global_step": 80283, "epoch": 1911} {"train_loss": -6.1588592529296875, "global_step": 80284, "epoch": 1911} {"train_loss": -6.101881980895996, "global_step": 80285, "epoch": 1911} {"train_loss": -6.143641471862793, "global_step": 80286, "epoch": 1911} {"train_loss": -6.103758335113525, "global_step": 80287, "epoch": 1911} {"train_loss": -6.039936065673828, "global_step": 80288, "epoch": 1911} {"train_loss": -6.006792068481445, "global_step": 80289, "epoch": 1911} {"train_loss": -6.120944023132324, "global_step": 80290, "epoch": 1911} {"train_loss": -6.076956748962402, "global_step": 80291, "epoch": 1911} {"train_loss": -6.087381362915039, "global_step": 80292, "epoch": 1911} {"train_loss": -6.028461456298828, "global_step": 80293, "epoch": 1911} {"train_loss": -6.038381576538086, "global_step": 80294, "epoch": 1911} {"train_loss": -6.214723587036133, "global_step": 80295, "epoch": 1911} {"train_loss": -6.149465560913086, "global_step": 80296, "epoch": 1911} {"train_loss": -6.022927284240723, "global_step": 80297, "epoch": 1911} {"train_loss": -6.131725788116455, "global_step": 80298, "epoch": 1911} {"train_loss": -6.132379055023193, "global_step": 80299, "epoch": 1911} {"train_loss": -5.975707530975342, "global_step": 80300, "epoch": 1911} {"train_loss": -5.988979339599609, "global_step": 80301, "epoch": 1911} {"train_loss": -6.034289360046387, "global_step": 80302, "epoch": 1911} {"train_loss": -6.108943519138155, "global_step": 80303, "epoch": 1911, "val_loss": 62367.89453125} {"train_loss": -6.098260402679443, "global_step": 80304, "epoch": 1912} {"train_loss": -6.084410667419434, "global_step": 80305, "epoch": 1912} {"train_loss": -6.136343002319336, "global_step": 80306, "epoch": 1912} {"train_loss": -6.0922160148620605, "global_step": 80307, "epoch": 1912} {"train_loss": -6.0956315994262695, "global_step": 80308, "epoch": 1912} {"train_loss": -6.110793113708496, "global_step": 80309, "epoch": 1912} {"train_loss": -6.136843681335449, "global_step": 80310, "epoch": 1912} {"train_loss": -6.048784255981445, "global_step": 80311, "epoch": 1912} {"train_loss": -6.123373985290527, "global_step": 80312, "epoch": 1912} {"train_loss": -6.147109031677246, "global_step": 80313, "epoch": 1912} {"train_loss": -6.071617126464844, "global_step": 80314, "epoch": 1912} {"train_loss": -6.168932914733887, "global_step": 80315, "epoch": 1912} {"train_loss": -5.907994747161865, "global_step": 80316, "epoch": 1912} {"train_loss": -6.059613227844238, "global_step": 80317, "epoch": 1912} {"train_loss": -6.015556335449219, "global_step": 80318, "epoch": 1912} {"train_loss": -6.229548931121826, "global_step": 80319, "epoch": 1912} {"train_loss": -6.113430023193359, "global_step": 80320, "epoch": 1912} {"train_loss": -6.104446887969971, "global_step": 80321, "epoch": 1912} {"train_loss": -6.134854316711426, "global_step": 80322, "epoch": 1912} {"train_loss": -6.110289573669434, "global_step": 80323, "epoch": 1912} {"train_loss": -6.228862762451172, "global_step": 80324, "epoch": 1912} {"train_loss": -6.141800880432129, "global_step": 80325, "epoch": 1912} {"train_loss": -6.252597808837891, "global_step": 80326, "epoch": 1912} {"train_loss": -6.223087310791016, "global_step": 80327, "epoch": 1912} {"train_loss": -6.043503761291504, "global_step": 80328, "epoch": 1912} {"train_loss": -6.187356948852539, "global_step": 80329, "epoch": 1912} {"train_loss": -6.132176399230957, "global_step": 80330, "epoch": 1912} {"train_loss": -6.137041091918945, "global_step": 80331, "epoch": 1912} {"train_loss": -6.180698394775391, "global_step": 80332, "epoch": 1912} {"train_loss": -6.160982131958008, "global_step": 80333, "epoch": 1912} {"train_loss": -6.189002990722656, "global_step": 80334, "epoch": 1912} {"train_loss": -6.099806785583496, "global_step": 80335, "epoch": 1912} {"train_loss": -6.2593841552734375, "global_step": 80336, "epoch": 1912} {"train_loss": -6.189105033874512, "global_step": 80337, "epoch": 1912} {"train_loss": -6.195932388305664, "global_step": 80338, "epoch": 1912} {"train_loss": -6.150258541107178, "global_step": 80339, "epoch": 1912} {"train_loss": -6.084444999694824, "global_step": 80340, "epoch": 1912} {"train_loss": -6.237817287445068, "global_step": 80341, "epoch": 1912} {"train_loss": -6.068248748779297, "global_step": 80342, "epoch": 1912} {"train_loss": -6.219760417938232, "global_step": 80343, "epoch": 1912} {"train_loss": -6.152199745178223, "global_step": 80344, "epoch": 1912} {"train_loss": -6.135501941045125, "global_step": 80345, "epoch": 1912, "val_loss": 62243.8359375} {"train_loss": -6.196871280670166, "global_step": 80346, "epoch": 1913} {"train_loss": -6.232540130615234, "global_step": 80347, "epoch": 1913} {"train_loss": -6.131626129150391, "global_step": 80348, "epoch": 1913} {"train_loss": -6.238122463226318, "global_step": 80349, "epoch": 1913} {"train_loss": -6.173669815063477, "global_step": 80350, "epoch": 1913} {"train_loss": -6.110246181488037, "global_step": 80351, "epoch": 1913} {"train_loss": -6.207786560058594, "global_step": 80352, "epoch": 1913} {"train_loss": -6.192914962768555, "global_step": 80353, "epoch": 1913} {"train_loss": -6.04643440246582, "global_step": 80354, "epoch": 1913} {"train_loss": -6.117107391357422, "global_step": 80355, "epoch": 1913} {"train_loss": -6.2086639404296875, "global_step": 80356, "epoch": 1913} {"train_loss": -6.116432189941406, "global_step": 80357, "epoch": 1913} {"train_loss": -6.257714748382568, "global_step": 80358, "epoch": 1913} {"train_loss": -6.055099010467529, "global_step": 80359, "epoch": 1913} {"train_loss": -6.184494972229004, "global_step": 80360, "epoch": 1913} {"train_loss": -6.085200309753418, "global_step": 80361, "epoch": 1913} {"train_loss": -5.986737251281738, "global_step": 80362, "epoch": 1913} {"train_loss": -6.065866470336914, "global_step": 80363, "epoch": 1913} {"train_loss": -6.161414623260498, "global_step": 80364, "epoch": 1913} {"train_loss": -6.0818634033203125, "global_step": 80365, "epoch": 1913} {"train_loss": -6.2099609375, "global_step": 80366, "epoch": 1913} {"train_loss": -6.281192779541016, "global_step": 80367, "epoch": 1913} {"train_loss": -6.147106647491455, "global_step": 80368, "epoch": 1913} {"train_loss": -6.11711311340332, "global_step": 80369, "epoch": 1913} {"train_loss": -6.108969688415527, "global_step": 80370, "epoch": 1913} {"train_loss": -5.94416618347168, "global_step": 80371, "epoch": 1913} {"train_loss": -6.047147750854492, "global_step": 80372, "epoch": 1913} {"train_loss": -5.968227386474609, "global_step": 80373, "epoch": 1913} {"train_loss": -6.037112236022949, "global_step": 80374, "epoch": 1913} {"train_loss": -6.299698352813721, "global_step": 80375, "epoch": 1913} {"train_loss": -5.983860015869141, "global_step": 80376, "epoch": 1913} {"train_loss": -6.2547383308410645, "global_step": 80377, "epoch": 1913} {"train_loss": -6.2136359214782715, "global_step": 80378, "epoch": 1913} {"train_loss": -6.0741777420043945, "global_step": 80379, "epoch": 1913} {"train_loss": -6.107516288757324, "global_step": 80380, "epoch": 1913} {"train_loss": -6.0537919998168945, "global_step": 80381, "epoch": 1913} {"train_loss": -6.070958137512207, "global_step": 80382, "epoch": 1913} {"train_loss": -6.144902229309082, "global_step": 80383, "epoch": 1913} {"train_loss": -6.032353401184082, "global_step": 80384, "epoch": 1913} {"train_loss": -6.142087936401367, "global_step": 80385, "epoch": 1913} {"train_loss": -6.07187032699585, "global_step": 80386, "epoch": 1913} {"train_loss": -6.127505257016137, "global_step": 80387, "epoch": 1913, "val_loss": 62332.36328125} {"train_loss": -6.136073112487793, "global_step": 80388, "epoch": 1914} {"train_loss": -6.185980796813965, "global_step": 80389, "epoch": 1914} {"train_loss": -6.209567070007324, "global_step": 80390, "epoch": 1914} {"train_loss": -6.270537376403809, "global_step": 80391, "epoch": 1914} {"train_loss": -6.258487701416016, "global_step": 80392, "epoch": 1914} {"train_loss": -6.309154033660889, "global_step": 80393, "epoch": 1914} {"train_loss": -6.085638046264648, "global_step": 80394, "epoch": 1914} {"train_loss": -6.049192905426025, "global_step": 80395, "epoch": 1914} {"train_loss": -6.15192985534668, "global_step": 80396, "epoch": 1914} {"train_loss": -6.215784072875977, "global_step": 80397, "epoch": 1914} {"train_loss": -6.150351047515869, "global_step": 80398, "epoch": 1914} {"train_loss": -6.236346244812012, "global_step": 80399, "epoch": 1914} {"train_loss": -6.2707648277282715, "global_step": 80400, "epoch": 1914} {"train_loss": -6.258652210235596, "global_step": 80401, "epoch": 1914} {"train_loss": -6.070996284484863, "global_step": 80402, "epoch": 1914} {"train_loss": -6.04068660736084, "global_step": 80403, "epoch": 1914} {"train_loss": -6.156440258026123, "global_step": 80404, "epoch": 1914} {"train_loss": -6.198700428009033, "global_step": 80405, "epoch": 1914} {"train_loss": -6.048006057739258, "global_step": 80406, "epoch": 1914} {"train_loss": -6.176670551300049, "global_step": 80407, "epoch": 1914} {"train_loss": -6.107846736907959, "global_step": 80408, "epoch": 1914} {"train_loss": -6.157622337341309, "global_step": 80409, "epoch": 1914} {"train_loss": -6.202122688293457, "global_step": 80410, "epoch": 1914} {"train_loss": -6.170166015625, "global_step": 80411, "epoch": 1914} {"train_loss": -6.104962348937988, "global_step": 80412, "epoch": 1914} {"train_loss": -6.230908393859863, "global_step": 80413, "epoch": 1914} {"train_loss": -6.052643775939941, "global_step": 80414, "epoch": 1914} {"train_loss": -6.138416290283203, "global_step": 80415, "epoch": 1914} {"train_loss": -6.252599239349365, "global_step": 80416, "epoch": 1914} {"train_loss": -6.210324287414551, "global_step": 80417, "epoch": 1914} {"train_loss": -6.153416633605957, "global_step": 80418, "epoch": 1914} {"train_loss": -6.127542495727539, "global_step": 80419, "epoch": 1914} {"train_loss": -6.151766777038574, "global_step": 80420, "epoch": 1914} {"train_loss": -6.252751350402832, "global_step": 80421, "epoch": 1914} {"train_loss": -6.174219131469727, "global_step": 80422, "epoch": 1914} {"train_loss": -6.118852138519287, "global_step": 80423, "epoch": 1914} {"train_loss": -6.10173225402832, "global_step": 80424, "epoch": 1914} {"train_loss": -6.228719234466553, "global_step": 80425, "epoch": 1914} {"train_loss": -6.140665054321289, "global_step": 80426, "epoch": 1914} {"train_loss": -6.150135040283203, "global_step": 80427, "epoch": 1914} {"train_loss": -6.213428497314453, "global_step": 80428, "epoch": 1914} {"train_loss": -6.165235201517741, "global_step": 80429, "epoch": 1914, "val_loss": 62410.4609375} {"train_loss": -6.06714391708374, "global_step": 80430, "epoch": 1915} {"train_loss": -6.145674705505371, "global_step": 80431, "epoch": 1915} {"train_loss": -6.116505146026611, "global_step": 80432, "epoch": 1915} {"train_loss": -6.1829023361206055, "global_step": 80433, "epoch": 1915} {"train_loss": -6.237064361572266, "global_step": 80434, "epoch": 1915} {"train_loss": -6.274111747741699, "global_step": 80435, "epoch": 1915} {"train_loss": -6.124176502227783, "global_step": 80436, "epoch": 1915} {"train_loss": -6.292791366577148, "global_step": 80437, "epoch": 1915} {"train_loss": -6.089454174041748, "global_step": 80438, "epoch": 1915} {"train_loss": -6.190836429595947, "global_step": 80439, "epoch": 1915} {"train_loss": -6.1102705001831055, "global_step": 80440, "epoch": 1915} {"train_loss": -6.073237419128418, "global_step": 80441, "epoch": 1915} {"train_loss": -6.10926628112793, "global_step": 80442, "epoch": 1915} {"train_loss": -6.245993614196777, "global_step": 80443, "epoch": 1915} {"train_loss": -6.148769378662109, "global_step": 80444, "epoch": 1915} {"train_loss": -6.1832170486450195, "global_step": 80445, "epoch": 1915} {"train_loss": -6.161427021026611, "global_step": 80446, "epoch": 1915} {"train_loss": -6.205951690673828, "global_step": 80447, "epoch": 1915} {"train_loss": -6.123192310333252, "global_step": 80448, "epoch": 1915} {"train_loss": -6.0718278884887695, "global_step": 80449, "epoch": 1915} {"train_loss": -6.164594650268555, "global_step": 80450, "epoch": 1915} {"train_loss": -6.2143449783325195, "global_step": 80451, "epoch": 1915} {"train_loss": -6.117463111877441, "global_step": 80452, "epoch": 1915} {"train_loss": -6.197795867919922, "global_step": 80453, "epoch": 1915} {"train_loss": -6.104995250701904, "global_step": 80454, "epoch": 1915} {"train_loss": -6.189383506774902, "global_step": 80455, "epoch": 1915} {"train_loss": -6.146231651306152, "global_step": 80456, "epoch": 1915} {"train_loss": -6.125813961029053, "global_step": 80457, "epoch": 1915} {"train_loss": -6.061983108520508, "global_step": 80458, "epoch": 1915} {"train_loss": -6.092691421508789, "global_step": 80459, "epoch": 1915} {"train_loss": -6.13458251953125, "global_step": 80460, "epoch": 1915} {"train_loss": -6.273074150085449, "global_step": 80461, "epoch": 1915} {"train_loss": -6.115697860717773, "global_step": 80462, "epoch": 1915} {"train_loss": -6.25155782699585, "global_step": 80463, "epoch": 1915} {"train_loss": -6.181920051574707, "global_step": 80464, "epoch": 1915} {"train_loss": -6.225908279418945, "global_step": 80465, "epoch": 1915} {"train_loss": -6.170377731323242, "global_step": 80466, "epoch": 1915} {"train_loss": -6.162097930908203, "global_step": 80467, "epoch": 1915} {"train_loss": -6.197945594787598, "global_step": 80468, "epoch": 1915} {"train_loss": -6.137369155883789, "global_step": 80469, "epoch": 1915} {"train_loss": -6.166745185852051, "global_step": 80470, "epoch": 1915} {"train_loss": -6.163522720336914, "global_step": 80471, "epoch": 1915, "val_loss": 62640.25390625} {"train_loss": -6.235625267028809, "global_step": 80472, "epoch": 1916} {"train_loss": -6.196313381195068, "global_step": 80473, "epoch": 1916} {"train_loss": -6.212718486785889, "global_step": 80474, "epoch": 1916} {"train_loss": -6.187297821044922, "global_step": 80475, "epoch": 1916} {"train_loss": -6.178399562835693, "global_step": 80476, "epoch": 1916} {"train_loss": -6.179065704345703, "global_step": 80477, "epoch": 1916} {"train_loss": -6.178891181945801, "global_step": 80478, "epoch": 1916} {"train_loss": -6.1386308670043945, "global_step": 80479, "epoch": 1916} {"train_loss": -6.308409690856934, "global_step": 80480, "epoch": 1916} {"train_loss": -6.199113368988037, "global_step": 80481, "epoch": 1916} {"train_loss": -6.204921722412109, "global_step": 80482, "epoch": 1916} {"train_loss": -6.224571704864502, "global_step": 80483, "epoch": 1916} {"train_loss": -6.264179229736328, "global_step": 80484, "epoch": 1916} {"train_loss": -6.0601396560668945, "global_step": 80485, "epoch": 1916} {"train_loss": -6.085052490234375, "global_step": 80486, "epoch": 1916} {"train_loss": -6.12891960144043, "global_step": 80487, "epoch": 1916} {"train_loss": -6.106451988220215, "global_step": 80488, "epoch": 1916} {"train_loss": -6.1619873046875, "global_step": 80489, "epoch": 1916} {"train_loss": -6.099180698394775, "global_step": 80490, "epoch": 1916} {"train_loss": -6.296921730041504, "global_step": 80491, "epoch": 1916} {"train_loss": -6.143880367279053, "global_step": 80492, "epoch": 1916} {"train_loss": -5.95753812789917, "global_step": 80493, "epoch": 1916} {"train_loss": -6.048882484436035, "global_step": 80494, "epoch": 1916} {"train_loss": -6.144346714019775, "global_step": 80495, "epoch": 1916} {"train_loss": -6.046520233154297, "global_step": 80496, "epoch": 1916} {"train_loss": -6.1331586837768555, "global_step": 80497, "epoch": 1916} {"train_loss": -6.122004985809326, "global_step": 80498, "epoch": 1916} {"train_loss": -6.204421043395996, "global_step": 80499, "epoch": 1916} {"train_loss": -6.2804388999938965, "global_step": 80500, "epoch": 1916} {"train_loss": -6.095535755157471, "global_step": 80501, "epoch": 1916} {"train_loss": -6.032347202301025, "global_step": 80502, "epoch": 1916} {"train_loss": -6.1057024002075195, "global_step": 80503, "epoch": 1916} {"train_loss": -6.142951488494873, "global_step": 80504, "epoch": 1916} {"train_loss": -6.046387672424316, "global_step": 80505, "epoch": 1916} {"train_loss": -6.111360549926758, "global_step": 80506, "epoch": 1916} {"train_loss": -6.150110721588135, "global_step": 80507, "epoch": 1916} {"train_loss": -6.082756996154785, "global_step": 80508, "epoch": 1916} {"train_loss": -6.208366394042969, "global_step": 80509, "epoch": 1916} {"train_loss": -6.041098594665527, "global_step": 80510, "epoch": 1916} {"train_loss": -6.235394477844238, "global_step": 80511, "epoch": 1916} {"train_loss": -6.100583553314209, "global_step": 80512, "epoch": 1916} {"train_loss": -6.1484442211332775, "global_step": 80513, "epoch": 1916, "val_loss": 62349.65234375} {"train_loss": -6.224149703979492, "global_step": 80514, "epoch": 1917} {"train_loss": -6.151600360870361, "global_step": 80515, "epoch": 1917} {"train_loss": -6.307490825653076, "global_step": 80516, "epoch": 1917} {"train_loss": -6.193595886230469, "global_step": 80517, "epoch": 1917} {"train_loss": -6.210042476654053, "global_step": 80518, "epoch": 1917} {"train_loss": -6.126402854919434, "global_step": 80519, "epoch": 1917} {"train_loss": -6.163785457611084, "global_step": 80520, "epoch": 1917} {"train_loss": -6.181235313415527, "global_step": 80521, "epoch": 1917} {"train_loss": -6.1065802574157715, "global_step": 80522, "epoch": 1917} {"train_loss": -6.137911796569824, "global_step": 80523, "epoch": 1917} {"train_loss": -6.131818771362305, "global_step": 80524, "epoch": 1917} {"train_loss": -6.14304256439209, "global_step": 80525, "epoch": 1917} {"train_loss": -6.194350242614746, "global_step": 80526, "epoch": 1917} {"train_loss": -6.2109270095825195, "global_step": 80527, "epoch": 1917} {"train_loss": -6.140810012817383, "global_step": 80528, "epoch": 1917} {"train_loss": -6.163036346435547, "global_step": 80529, "epoch": 1917} {"train_loss": -6.219242572784424, "global_step": 80530, "epoch": 1917} {"train_loss": -6.1941986083984375, "global_step": 80531, "epoch": 1917} {"train_loss": -6.213588714599609, "global_step": 80532, "epoch": 1917} {"train_loss": -6.183685779571533, "global_step": 80533, "epoch": 1917} {"train_loss": -6.123968601226807, "global_step": 80534, "epoch": 1917} {"train_loss": -6.161317825317383, "global_step": 80535, "epoch": 1917} {"train_loss": -6.204965114593506, "global_step": 80536, "epoch": 1917} {"train_loss": -6.197250843048096, "global_step": 80537, "epoch": 1917} {"train_loss": -6.176179885864258, "global_step": 80538, "epoch": 1917} {"train_loss": -6.268150806427002, "global_step": 80539, "epoch": 1917} {"train_loss": -6.239789962768555, "global_step": 80540, "epoch": 1917} {"train_loss": -6.225955009460449, "global_step": 80541, "epoch": 1917} {"train_loss": -6.3021087646484375, "global_step": 80542, "epoch": 1917} {"train_loss": -6.339532852172852, "global_step": 80543, "epoch": 1917} {"train_loss": -6.082802772521973, "global_step": 80544, "epoch": 1917} {"train_loss": -6.09000825881958, "global_step": 80545, "epoch": 1917} {"train_loss": -6.043363571166992, "global_step": 80546, "epoch": 1917} {"train_loss": -6.255010604858398, "global_step": 80547, "epoch": 1917} {"train_loss": -6.214944839477539, "global_step": 80548, "epoch": 1917} {"train_loss": -6.104280471801758, "global_step": 80549, "epoch": 1917} {"train_loss": -6.196393966674805, "global_step": 80550, "epoch": 1917} {"train_loss": -6.165224552154541, "global_step": 80551, "epoch": 1917} {"train_loss": -6.106764316558838, "global_step": 80552, "epoch": 1917} {"train_loss": -6.113307476043701, "global_step": 80553, "epoch": 1917} {"train_loss": -6.089306831359863, "global_step": 80554, "epoch": 1917} {"train_loss": -6.176410936173939, "global_step": 80555, "epoch": 1917, "val_loss": 62417.7109375} {"train_loss": -6.211916923522949, "global_step": 80556, "epoch": 1918} {"train_loss": -6.207510471343994, "global_step": 80557, "epoch": 1918} {"train_loss": -6.225348472595215, "global_step": 80558, "epoch": 1918} {"train_loss": -6.13535213470459, "global_step": 80559, "epoch": 1918} {"train_loss": -6.245571136474609, "global_step": 80560, "epoch": 1918} {"train_loss": -6.125064373016357, "global_step": 80561, "epoch": 1918} {"train_loss": -6.1050639152526855, "global_step": 80562, "epoch": 1918} {"train_loss": -6.135254383087158, "global_step": 80563, "epoch": 1918} {"train_loss": -6.220826148986816, "global_step": 80564, "epoch": 1918} {"train_loss": -6.153990745544434, "global_step": 80565, "epoch": 1918} {"train_loss": -6.128913402557373, "global_step": 80566, "epoch": 1918} {"train_loss": -6.037815093994141, "global_step": 80567, "epoch": 1918} {"train_loss": -6.097541332244873, "global_step": 80568, "epoch": 1918} {"train_loss": -6.120534896850586, "global_step": 80569, "epoch": 1918} {"train_loss": -6.205334186553955, "global_step": 80570, "epoch": 1918} {"train_loss": -6.136141777038574, "global_step": 80571, "epoch": 1918} {"train_loss": -6.222278594970703, "global_step": 80572, "epoch": 1918} {"train_loss": -6.179357051849365, "global_step": 80573, "epoch": 1918} {"train_loss": -6.2690582275390625, "global_step": 80574, "epoch": 1918} {"train_loss": -6.0982666015625, "global_step": 80575, "epoch": 1918} {"train_loss": -6.04482364654541, "global_step": 80576, "epoch": 1918} {"train_loss": -6.210507869720459, "global_step": 80577, "epoch": 1918} {"train_loss": -6.184334754943848, "global_step": 80578, "epoch": 1918} {"train_loss": -6.11994743347168, "global_step": 80579, "epoch": 1918} {"train_loss": -6.069642066955566, "global_step": 80580, "epoch": 1918} {"train_loss": -6.1176958084106445, "global_step": 80581, "epoch": 1918} {"train_loss": -6.116847991943359, "global_step": 80582, "epoch": 1918} {"train_loss": -6.133174419403076, "global_step": 80583, "epoch": 1918} {"train_loss": -6.146724700927734, "global_step": 80584, "epoch": 1918} {"train_loss": -6.068470478057861, "global_step": 80585, "epoch": 1918} {"train_loss": -6.115898609161377, "global_step": 80586, "epoch": 1918} {"train_loss": -6.099885940551758, "global_step": 80587, "epoch": 1918} {"train_loss": -6.083938121795654, "global_step": 80588, "epoch": 1918} {"train_loss": -6.161802291870117, "global_step": 80589, "epoch": 1918} {"train_loss": -6.248536586761475, "global_step": 80590, "epoch": 1918} {"train_loss": -6.25400447845459, "global_step": 80591, "epoch": 1918} {"train_loss": -6.091569423675537, "global_step": 80592, "epoch": 1918} {"train_loss": -6.127219200134277, "global_step": 80593, "epoch": 1918} {"train_loss": -6.153944492340088, "global_step": 80594, "epoch": 1918} {"train_loss": -6.07205867767334, "global_step": 80595, "epoch": 1918} {"train_loss": -6.191981792449951, "global_step": 80596, "epoch": 1918} {"train_loss": -6.148285343533471, "global_step": 80597, "epoch": 1918, "val_loss": 62309.9609375} {"train_loss": -6.120178699493408, "global_step": 80598, "epoch": 1919} {"train_loss": -6.105739116668701, "global_step": 80599, "epoch": 1919} {"train_loss": -6.113644123077393, "global_step": 80600, "epoch": 1919} {"train_loss": -6.157302379608154, "global_step": 80601, "epoch": 1919} {"train_loss": -6.115611553192139, "global_step": 80602, "epoch": 1919} {"train_loss": -6.169424057006836, "global_step": 80603, "epoch": 1919} {"train_loss": -6.139366149902344, "global_step": 80604, "epoch": 1919} {"train_loss": -5.902548313140869, "global_step": 80605, "epoch": 1919} {"train_loss": -6.123019695281982, "global_step": 80606, "epoch": 1919} {"train_loss": -6.064709186553955, "global_step": 80607, "epoch": 1919} {"train_loss": -6.035655498504639, "global_step": 80608, "epoch": 1919} {"train_loss": -6.116982460021973, "global_step": 80609, "epoch": 1919} {"train_loss": -6.0721635818481445, "global_step": 80610, "epoch": 1919} {"train_loss": -6.128696441650391, "global_step": 80611, "epoch": 1919} {"train_loss": -6.258427619934082, "global_step": 80612, "epoch": 1919} {"train_loss": -6.226733207702637, "global_step": 80613, "epoch": 1919} {"train_loss": -6.251850128173828, "global_step": 80614, "epoch": 1919} {"train_loss": -6.120363712310791, "global_step": 80615, "epoch": 1919} {"train_loss": -6.230879783630371, "global_step": 80616, "epoch": 1919} {"train_loss": -6.092776775360107, "global_step": 80617, "epoch": 1919} {"train_loss": -6.091925621032715, "global_step": 80618, "epoch": 1919} {"train_loss": -6.174543380737305, "global_step": 80619, "epoch": 1919} {"train_loss": -6.14679479598999, "global_step": 80620, "epoch": 1919} {"train_loss": -6.202640056610107, "global_step": 80621, "epoch": 1919} {"train_loss": -6.1765360832214355, "global_step": 80622, "epoch": 1919} {"train_loss": -6.087257385253906, "global_step": 80623, "epoch": 1919} {"train_loss": -6.152632236480713, "global_step": 80624, "epoch": 1919} {"train_loss": -6.183943748474121, "global_step": 80625, "epoch": 1919} {"train_loss": -6.257370948791504, "global_step": 80626, "epoch": 1919} {"train_loss": -6.107034683227539, "global_step": 80627, "epoch": 1919} {"train_loss": -6.23193883895874, "global_step": 80628, "epoch": 1919} {"train_loss": -6.164750576019287, "global_step": 80629, "epoch": 1919} {"train_loss": -6.199635028839111, "global_step": 80630, "epoch": 1919} {"train_loss": -6.128324508666992, "global_step": 80631, "epoch": 1919} {"train_loss": -6.10809326171875, "global_step": 80632, "epoch": 1919} {"train_loss": -6.055516719818115, "global_step": 80633, "epoch": 1919} {"train_loss": -6.247204780578613, "global_step": 80634, "epoch": 1919} {"train_loss": -6.037143707275391, "global_step": 80635, "epoch": 1919} {"train_loss": -6.197685241699219, "global_step": 80636, "epoch": 1919} {"train_loss": -6.146139144897461, "global_step": 80637, "epoch": 1919} {"train_loss": -6.037691116333008, "global_step": 80638, "epoch": 1919} {"train_loss": -6.139085213343303, "global_step": 80639, "epoch": 1919, "val_loss": 62388.44921875} {"train_loss": -6.018442630767822, "global_step": 80640, "epoch": 1920} {"train_loss": -6.161386013031006, "global_step": 80641, "epoch": 1920} {"train_loss": -6.19502067565918, "global_step": 80642, "epoch": 1920} {"train_loss": -6.058852195739746, "global_step": 80643, "epoch": 1920} {"train_loss": -6.0906500816345215, "global_step": 80644, "epoch": 1920} {"train_loss": -6.134624481201172, "global_step": 80645, "epoch": 1920} {"train_loss": -6.160517692565918, "global_step": 80646, "epoch": 1920} {"train_loss": -6.229767799377441, "global_step": 80647, "epoch": 1920} {"train_loss": -6.1441473960876465, "global_step": 80648, "epoch": 1920} {"train_loss": -5.947973728179932, "global_step": 80649, "epoch": 1920} {"train_loss": -6.213285446166992, "global_step": 80650, "epoch": 1920} {"train_loss": -6.155384063720703, "global_step": 80651, "epoch": 1920} {"train_loss": -6.013103485107422, "global_step": 80652, "epoch": 1920} {"train_loss": -6.070889472961426, "global_step": 80653, "epoch": 1920} {"train_loss": -6.203774452209473, "global_step": 80654, "epoch": 1920} {"train_loss": -6.134993553161621, "global_step": 80655, "epoch": 1920} {"train_loss": -6.0436506271362305, "global_step": 80656, "epoch": 1920} {"train_loss": -6.162138938903809, "global_step": 80657, "epoch": 1920} {"train_loss": -6.168143272399902, "global_step": 80658, "epoch": 1920} {"train_loss": -6.002835273742676, "global_step": 80659, "epoch": 1920} {"train_loss": -6.104158401489258, "global_step": 80660, "epoch": 1920} {"train_loss": -5.984597682952881, "global_step": 80661, "epoch": 1920} {"train_loss": -6.0850067138671875, "global_step": 80662, "epoch": 1920} {"train_loss": -6.140468597412109, "global_step": 80663, "epoch": 1920} {"train_loss": -6.066378593444824, "global_step": 80664, "epoch": 1920} {"train_loss": -6.072652816772461, "global_step": 80665, "epoch": 1920} {"train_loss": -6.212944984436035, "global_step": 80666, "epoch": 1920} {"train_loss": -6.0901665687561035, "global_step": 80667, "epoch": 1920} {"train_loss": -6.086899757385254, "global_step": 80668, "epoch": 1920} {"train_loss": -6.198419570922852, "global_step": 80669, "epoch": 1920} {"train_loss": -6.079346656799316, "global_step": 80670, "epoch": 1920} {"train_loss": -6.280706405639648, "global_step": 80671, "epoch": 1920} {"train_loss": -6.1552228927612305, "global_step": 80672, "epoch": 1920} {"train_loss": -6.0724029541015625, "global_step": 80673, "epoch": 1920} {"train_loss": -6.0784406661987305, "global_step": 80674, "epoch": 1920} {"train_loss": -6.171232223510742, "global_step": 80675, "epoch": 1920} {"train_loss": -6.177016258239746, "global_step": 80676, "epoch": 1920} {"train_loss": -6.080327033996582, "global_step": 80677, "epoch": 1920} {"train_loss": -6.201664924621582, "global_step": 80678, "epoch": 1920} {"train_loss": -6.161667346954346, "global_step": 80679, "epoch": 1920} {"train_loss": -6.0287699699401855, "global_step": 80680, "epoch": 1920} {"train_loss": -6.119460457847232, "global_step": 80681, "epoch": 1920, "val_loss": 62316.140625} {"train_loss": -6.226557731628418, "global_step": 80682, "epoch": 1921} {"train_loss": -6.239097595214844, "global_step": 80683, "epoch": 1921} {"train_loss": -6.100067138671875, "global_step": 80684, "epoch": 1921} {"train_loss": -6.125286102294922, "global_step": 80685, "epoch": 1921} {"train_loss": -6.121376991271973, "global_step": 80686, "epoch": 1921} {"train_loss": -6.243350028991699, "global_step": 80687, "epoch": 1921} {"train_loss": -6.0936384201049805, "global_step": 80688, "epoch": 1921} {"train_loss": -6.26137638092041, "global_step": 80689, "epoch": 1921} {"train_loss": -6.086034774780273, "global_step": 80690, "epoch": 1921} {"train_loss": -6.167290687561035, "global_step": 80691, "epoch": 1921} {"train_loss": -6.1249895095825195, "global_step": 80692, "epoch": 1921} {"train_loss": -6.155625343322754, "global_step": 80693, "epoch": 1921} {"train_loss": -6.097696781158447, "global_step": 80694, "epoch": 1921} {"train_loss": -6.080879211425781, "global_step": 80695, "epoch": 1921} {"train_loss": -6.127684593200684, "global_step": 80696, "epoch": 1921} {"train_loss": -6.21582555770874, "global_step": 80697, "epoch": 1921} {"train_loss": -6.097891807556152, "global_step": 80698, "epoch": 1921} {"train_loss": -6.163934230804443, "global_step": 80699, "epoch": 1921} {"train_loss": -6.086490631103516, "global_step": 80700, "epoch": 1921} {"train_loss": -6.180294036865234, "global_step": 80701, "epoch": 1921} {"train_loss": -6.236364841461182, "global_step": 80702, "epoch": 1921} {"train_loss": -6.11037015914917, "global_step": 80703, "epoch": 1921} {"train_loss": -6.132411956787109, "global_step": 80704, "epoch": 1921} {"train_loss": -6.188549518585205, "global_step": 80705, "epoch": 1921} {"train_loss": -6.062094688415527, "global_step": 80706, "epoch": 1921} {"train_loss": -6.047109127044678, "global_step": 80707, "epoch": 1921} {"train_loss": -6.138062000274658, "global_step": 80708, "epoch": 1921} {"train_loss": -6.11182975769043, "global_step": 80709, "epoch": 1921} {"train_loss": -6.225193023681641, "global_step": 80710, "epoch": 1921} {"train_loss": -6.2448015213012695, "global_step": 80711, "epoch": 1921} {"train_loss": -6.2428879737854, "global_step": 80712, "epoch": 1921} {"train_loss": -6.132762908935547, "global_step": 80713, "epoch": 1921} {"train_loss": -6.203261375427246, "global_step": 80714, "epoch": 1921} {"train_loss": -6.188790798187256, "global_step": 80715, "epoch": 1921} {"train_loss": -6.1438140869140625, "global_step": 80716, "epoch": 1921} {"train_loss": -6.0840301513671875, "global_step": 80717, "epoch": 1921} {"train_loss": -6.1737380027771, "global_step": 80718, "epoch": 1921} {"train_loss": -6.240487575531006, "global_step": 80719, "epoch": 1921} {"train_loss": -6.249495029449463, "global_step": 80720, "epoch": 1921} {"train_loss": -6.203060150146484, "global_step": 80721, "epoch": 1921} {"train_loss": -6.257195472717285, "global_step": 80722, "epoch": 1921} {"train_loss": -6.161883399600074, "global_step": 80723, "epoch": 1921, "val_loss": 62340.23046875} {"train_loss": -6.2670512199401855, "global_step": 80724, "epoch": 1922} {"train_loss": -6.213771820068359, "global_step": 80725, "epoch": 1922} {"train_loss": -6.134654998779297, "global_step": 80726, "epoch": 1922} {"train_loss": -6.114863872528076, "global_step": 80727, "epoch": 1922} {"train_loss": -6.092128753662109, "global_step": 80728, "epoch": 1922} {"train_loss": -6.171308994293213, "global_step": 80729, "epoch": 1922} {"train_loss": -6.208967685699463, "global_step": 80730, "epoch": 1922} {"train_loss": -6.228626251220703, "global_step": 80731, "epoch": 1922} {"train_loss": -6.302082061767578, "global_step": 80732, "epoch": 1922} {"train_loss": -6.19382381439209, "global_step": 80733, "epoch": 1922} {"train_loss": -6.228825092315674, "global_step": 80734, "epoch": 1922} {"train_loss": -6.290714740753174, "global_step": 80735, "epoch": 1922} {"train_loss": -6.274999618530273, "global_step": 80736, "epoch": 1922} {"train_loss": -6.261058807373047, "global_step": 80737, "epoch": 1922} {"train_loss": -6.081696510314941, "global_step": 80738, "epoch": 1922} {"train_loss": -6.160408020019531, "global_step": 80739, "epoch": 1922} {"train_loss": -6.0966033935546875, "global_step": 80740, "epoch": 1922} {"train_loss": -6.116395950317383, "global_step": 80741, "epoch": 1922} {"train_loss": -6.155917167663574, "global_step": 80742, "epoch": 1922} {"train_loss": -5.953068256378174, "global_step": 80743, "epoch": 1922} {"train_loss": -6.28771448135376, "global_step": 80744, "epoch": 1922} {"train_loss": -6.135213375091553, "global_step": 80745, "epoch": 1922} {"train_loss": -6.052121162414551, "global_step": 80746, "epoch": 1922} {"train_loss": -6.191082000732422, "global_step": 80747, "epoch": 1922} {"train_loss": -6.17040491104126, "global_step": 80748, "epoch": 1922} {"train_loss": -6.18171501159668, "global_step": 80749, "epoch": 1922} {"train_loss": -6.104691982269287, "global_step": 80750, "epoch": 1922} {"train_loss": -6.07281494140625, "global_step": 80751, "epoch": 1922} {"train_loss": -6.112797737121582, "global_step": 80752, "epoch": 1922} {"train_loss": -6.218147277832031, "global_step": 80753, "epoch": 1922} {"train_loss": -6.195934295654297, "global_step": 80754, "epoch": 1922} {"train_loss": -6.222104549407959, "global_step": 80755, "epoch": 1922} {"train_loss": -6.145909309387207, "global_step": 80756, "epoch": 1922} {"train_loss": -6.209874153137207, "global_step": 80757, "epoch": 1922} {"train_loss": -6.171976089477539, "global_step": 80758, "epoch": 1922} {"train_loss": -6.193202018737793, "global_step": 80759, "epoch": 1922} {"train_loss": -6.072903633117676, "global_step": 80760, "epoch": 1922} {"train_loss": -6.098236083984375, "global_step": 80761, "epoch": 1922} {"train_loss": -6.227302074432373, "global_step": 80762, "epoch": 1922} {"train_loss": -6.127915382385254, "global_step": 80763, "epoch": 1922} {"train_loss": -6.096357822418213, "global_step": 80764, "epoch": 1922} {"train_loss": -6.164337112790062, "global_step": 80765, "epoch": 1922, "val_loss": 62330.09375} {"train_loss": -6.143113136291504, "global_step": 80766, "epoch": 1923} {"train_loss": -6.133403778076172, "global_step": 80767, "epoch": 1923} {"train_loss": -6.2515950202941895, "global_step": 80768, "epoch": 1923} {"train_loss": -6.269471168518066, "global_step": 80769, "epoch": 1923} {"train_loss": -6.258697032928467, "global_step": 80770, "epoch": 1923} {"train_loss": -6.2053070068359375, "global_step": 80771, "epoch": 1923} {"train_loss": -6.078252792358398, "global_step": 80772, "epoch": 1923} {"train_loss": -6.102655410766602, "global_step": 80773, "epoch": 1923} {"train_loss": -6.178953647613525, "global_step": 80774, "epoch": 1923} {"train_loss": -6.2507429122924805, "global_step": 80775, "epoch": 1923} {"train_loss": -6.23305606842041, "global_step": 80776, "epoch": 1923} {"train_loss": -6.218087196350098, "global_step": 80777, "epoch": 1923} {"train_loss": -6.286155700683594, "global_step": 80778, "epoch": 1923} {"train_loss": -6.120275974273682, "global_step": 80779, "epoch": 1923} {"train_loss": -6.1981892585754395, "global_step": 80780, "epoch": 1923} {"train_loss": -6.085041046142578, "global_step": 80781, "epoch": 1923} {"train_loss": -6.171034336090088, "global_step": 80782, "epoch": 1923} {"train_loss": -6.276608467102051, "global_step": 80783, "epoch": 1923} {"train_loss": -6.149350166320801, "global_step": 80784, "epoch": 1923} {"train_loss": -6.144421577453613, "global_step": 80785, "epoch": 1923} {"train_loss": -6.146024227142334, "global_step": 80786, "epoch": 1923} {"train_loss": -6.141169548034668, "global_step": 80787, "epoch": 1923} {"train_loss": -6.240976810455322, "global_step": 80788, "epoch": 1923} {"train_loss": -6.110348701477051, "global_step": 80789, "epoch": 1923} {"train_loss": -6.266404151916504, "global_step": 80790, "epoch": 1923} {"train_loss": -6.214969158172607, "global_step": 80791, "epoch": 1923} {"train_loss": -6.163797855377197, "global_step": 80792, "epoch": 1923} {"train_loss": -6.151732921600342, "global_step": 80793, "epoch": 1923} {"train_loss": -6.170320987701416, "global_step": 80794, "epoch": 1923} {"train_loss": -6.157362937927246, "global_step": 80795, "epoch": 1923} {"train_loss": -6.168569087982178, "global_step": 80796, "epoch": 1923} {"train_loss": -6.171306610107422, "global_step": 80797, "epoch": 1923} {"train_loss": -6.144272804260254, "global_step": 80798, "epoch": 1923} {"train_loss": -6.227941989898682, "global_step": 80799, "epoch": 1923} {"train_loss": -6.077451705932617, "global_step": 80800, "epoch": 1923} {"train_loss": -6.130816459655762, "global_step": 80801, "epoch": 1923} {"train_loss": -6.0732574462890625, "global_step": 80802, "epoch": 1923} {"train_loss": -6.217774391174316, "global_step": 80803, "epoch": 1923} {"train_loss": -6.147886276245117, "global_step": 80804, "epoch": 1923} {"train_loss": -6.112185478210449, "global_step": 80805, "epoch": 1923} {"train_loss": -6.219249248504639, "global_step": 80806, "epoch": 1923} {"train_loss": -6.172403585343134, "global_step": 80807, "epoch": 1923, "val_loss": 62338.796875} {"train_loss": -6.101085662841797, "global_step": 80808, "epoch": 1924} {"train_loss": -6.130572319030762, "global_step": 80809, "epoch": 1924} {"train_loss": -6.0697736740112305, "global_step": 80810, "epoch": 1924} {"train_loss": -6.180109977722168, "global_step": 80811, "epoch": 1924} {"train_loss": -6.169631481170654, "global_step": 80812, "epoch": 1924} {"train_loss": -6.046241760253906, "global_step": 80813, "epoch": 1924} {"train_loss": -6.144245147705078, "global_step": 80814, "epoch": 1924} {"train_loss": -6.15210485458374, "global_step": 80815, "epoch": 1924} {"train_loss": -6.207094192504883, "global_step": 80816, "epoch": 1924} {"train_loss": -6.188050270080566, "global_step": 80817, "epoch": 1924} {"train_loss": -6.133705139160156, "global_step": 80818, "epoch": 1924} {"train_loss": -6.144039154052734, "global_step": 80819, "epoch": 1924} {"train_loss": -5.993701457977295, "global_step": 80820, "epoch": 1924} {"train_loss": -6.031206130981445, "global_step": 80821, "epoch": 1924} {"train_loss": -6.133397579193115, "global_step": 80822, "epoch": 1924} {"train_loss": -6.109818458557129, "global_step": 80823, "epoch": 1924} {"train_loss": -6.134087562561035, "global_step": 80824, "epoch": 1924} {"train_loss": -6.082633972167969, "global_step": 80825, "epoch": 1924} {"train_loss": -6.1817169189453125, "global_step": 80826, "epoch": 1924} {"train_loss": -6.1656646728515625, "global_step": 80827, "epoch": 1924} {"train_loss": -6.240727424621582, "global_step": 80828, "epoch": 1924} {"train_loss": -6.170074939727783, "global_step": 80829, "epoch": 1924} {"train_loss": -6.23325252532959, "global_step": 80830, "epoch": 1924} {"train_loss": -6.146020889282227, "global_step": 80831, "epoch": 1924} {"train_loss": -6.138740539550781, "global_step": 80832, "epoch": 1924} {"train_loss": -6.123801231384277, "global_step": 80833, "epoch": 1924} {"train_loss": -6.198431015014648, "global_step": 80834, "epoch": 1924} {"train_loss": -6.1744704246521, "global_step": 80835, "epoch": 1924} {"train_loss": -6.131516933441162, "global_step": 80836, "epoch": 1924} {"train_loss": -6.14376974105835, "global_step": 80837, "epoch": 1924} {"train_loss": -6.240946292877197, "global_step": 80838, "epoch": 1924} {"train_loss": -6.245232582092285, "global_step": 80839, "epoch": 1924} {"train_loss": -6.143370151519775, "global_step": 80840, "epoch": 1924} {"train_loss": -6.07499361038208, "global_step": 80841, "epoch": 1924} {"train_loss": -6.170842170715332, "global_step": 80842, "epoch": 1924} {"train_loss": -6.162763595581055, "global_step": 80843, "epoch": 1924} {"train_loss": -6.122086524963379, "global_step": 80844, "epoch": 1924} {"train_loss": -6.194717884063721, "global_step": 80845, "epoch": 1924} {"train_loss": -6.216825485229492, "global_step": 80846, "epoch": 1924} {"train_loss": -6.193978309631348, "global_step": 80847, "epoch": 1924} {"train_loss": -6.1756591796875, "global_step": 80848, "epoch": 1924} {"train_loss": -6.150189967382522, "global_step": 80849, "epoch": 1924, "val_loss": 62376.5546875} {"train_loss": -6.269608497619629, "global_step": 80850, "epoch": 1925} {"train_loss": -6.078056812286377, "global_step": 80851, "epoch": 1925} {"train_loss": -6.230845928192139, "global_step": 80852, "epoch": 1925} {"train_loss": -6.163400650024414, "global_step": 80853, "epoch": 1925} {"train_loss": -6.134770393371582, "global_step": 80854, "epoch": 1925} {"train_loss": -6.099673271179199, "global_step": 80855, "epoch": 1925} {"train_loss": -6.05404806137085, "global_step": 80856, "epoch": 1925} {"train_loss": -6.109375, "global_step": 80857, "epoch": 1925} {"train_loss": -6.057369709014893, "global_step": 80858, "epoch": 1925} {"train_loss": -5.994189262390137, "global_step": 80859, "epoch": 1925} {"train_loss": -6.089293003082275, "global_step": 80860, "epoch": 1925} {"train_loss": -5.8823347091674805, "global_step": 80861, "epoch": 1925} {"train_loss": -6.068132400512695, "global_step": 80862, "epoch": 1925} {"train_loss": -5.976071834564209, "global_step": 80863, "epoch": 1925} {"train_loss": -6.035901069641113, "global_step": 80864, "epoch": 1925} {"train_loss": -6.201948642730713, "global_step": 80865, "epoch": 1925} {"train_loss": -6.112583160400391, "global_step": 80866, "epoch": 1925} {"train_loss": -6.169618606567383, "global_step": 80867, "epoch": 1925} {"train_loss": -6.147481918334961, "global_step": 80868, "epoch": 1925} {"train_loss": -6.157798767089844, "global_step": 80869, "epoch": 1925} {"train_loss": -6.097575664520264, "global_step": 80870, "epoch": 1925} {"train_loss": -6.190899848937988, "global_step": 80871, "epoch": 1925} {"train_loss": -6.105389595031738, "global_step": 80872, "epoch": 1925} {"train_loss": -6.096682548522949, "global_step": 80873, "epoch": 1925} {"train_loss": -6.111155986785889, "global_step": 80874, "epoch": 1925} {"train_loss": -6.194426536560059, "global_step": 80875, "epoch": 1925} {"train_loss": -6.1218132972717285, "global_step": 80876, "epoch": 1925} {"train_loss": -6.129084587097168, "global_step": 80877, "epoch": 1925} {"train_loss": -6.179670810699463, "global_step": 80878, "epoch": 1925} {"train_loss": -6.115840911865234, "global_step": 80879, "epoch": 1925} {"train_loss": -6.189703941345215, "global_step": 80880, "epoch": 1925} {"train_loss": -6.258355140686035, "global_step": 80881, "epoch": 1925} {"train_loss": -6.158524036407471, "global_step": 80882, "epoch": 1925} {"train_loss": -6.146324157714844, "global_step": 80883, "epoch": 1925} {"train_loss": -6.210922718048096, "global_step": 80884, "epoch": 1925} {"train_loss": -6.157180309295654, "global_step": 80885, "epoch": 1925} {"train_loss": -6.1639180183410645, "global_step": 80886, "epoch": 1925} {"train_loss": -6.163079261779785, "global_step": 80887, "epoch": 1925} {"train_loss": -6.1977858543396, "global_step": 80888, "epoch": 1925} {"train_loss": -6.150160789489746, "global_step": 80889, "epoch": 1925} {"train_loss": -6.1389570236206055, "global_step": 80890, "epoch": 1925} {"train_loss": -6.130285319827852, "global_step": 80891, "epoch": 1925, "val_loss": 62362.3671875} {"train_loss": -6.074769020080566, "global_step": 80892, "epoch": 1926} {"train_loss": -6.262572288513184, "global_step": 80893, "epoch": 1926} {"train_loss": -6.052567481994629, "global_step": 80894, "epoch": 1926} {"train_loss": -6.1639180183410645, "global_step": 80895, "epoch": 1926} {"train_loss": -6.17998743057251, "global_step": 80896, "epoch": 1926} {"train_loss": -6.132377624511719, "global_step": 80897, "epoch": 1926} {"train_loss": -6.194088935852051, "global_step": 80898, "epoch": 1926} {"train_loss": -6.173989295959473, "global_step": 80899, "epoch": 1926} {"train_loss": -6.041032791137695, "global_step": 80900, "epoch": 1926} {"train_loss": -6.16472053527832, "global_step": 80901, "epoch": 1926} {"train_loss": -6.173152446746826, "global_step": 80902, "epoch": 1926} {"train_loss": -6.200078010559082, "global_step": 80903, "epoch": 1926} {"train_loss": -6.242694854736328, "global_step": 80904, "epoch": 1926} {"train_loss": -6.155897617340088, "global_step": 80905, "epoch": 1926} {"train_loss": -6.164287567138672, "global_step": 80906, "epoch": 1926} {"train_loss": -6.066826343536377, "global_step": 80907, "epoch": 1926} {"train_loss": -6.218797206878662, "global_step": 80908, "epoch": 1926} {"train_loss": -6.155516624450684, "global_step": 80909, "epoch": 1926} {"train_loss": -6.1737589836120605, "global_step": 80910, "epoch": 1926} {"train_loss": -6.113061428070068, "global_step": 80911, "epoch": 1926} {"train_loss": -6.200536727905273, "global_step": 80912, "epoch": 1926} {"train_loss": -6.239020347595215, "global_step": 80913, "epoch": 1926} {"train_loss": -6.00209379196167, "global_step": 80914, "epoch": 1926} {"train_loss": -6.1076979637146, "global_step": 80915, "epoch": 1926} {"train_loss": -6.0088067054748535, "global_step": 80916, "epoch": 1926} {"train_loss": -6.15352725982666, "global_step": 80917, "epoch": 1926} {"train_loss": -6.233441352844238, "global_step": 80918, "epoch": 1926} {"train_loss": -6.100721836090088, "global_step": 80919, "epoch": 1926} {"train_loss": -6.246665954589844, "global_step": 80920, "epoch": 1926} {"train_loss": -6.102109909057617, "global_step": 80921, "epoch": 1926} {"train_loss": -6.213840484619141, "global_step": 80922, "epoch": 1926} {"train_loss": -6.132692337036133, "global_step": 80923, "epoch": 1926} {"train_loss": -6.09602165222168, "global_step": 80924, "epoch": 1926} {"train_loss": -6.107548713684082, "global_step": 80925, "epoch": 1926} {"train_loss": -6.023502349853516, "global_step": 80926, "epoch": 1926} {"train_loss": -5.976073265075684, "global_step": 80927, "epoch": 1926} {"train_loss": -6.242512226104736, "global_step": 80928, "epoch": 1926} {"train_loss": -6.070366859436035, "global_step": 80929, "epoch": 1926} {"train_loss": -5.992576599121094, "global_step": 80930, "epoch": 1926} {"train_loss": -6.015901565551758, "global_step": 80931, "epoch": 1926} {"train_loss": -6.129842758178711, "global_step": 80932, "epoch": 1926} {"train_loss": -6.132520539419992, "global_step": 80933, "epoch": 1926, "val_loss": 62421.08203125} {"train_loss": -6.227763652801514, "global_step": 80934, "epoch": 1927} {"train_loss": -6.048603057861328, "global_step": 80935, "epoch": 1927} {"train_loss": -6.168461322784424, "global_step": 80936, "epoch": 1927} {"train_loss": -6.084726333618164, "global_step": 80937, "epoch": 1927} {"train_loss": -6.05312442779541, "global_step": 80938, "epoch": 1927} {"train_loss": -6.110755443572998, "global_step": 80939, "epoch": 1927} {"train_loss": -6.071495532989502, "global_step": 80940, "epoch": 1927} {"train_loss": -6.275148868560791, "global_step": 80941, "epoch": 1927} {"train_loss": -6.118162155151367, "global_step": 80942, "epoch": 1927} {"train_loss": -6.09602165222168, "global_step": 80943, "epoch": 1927} {"train_loss": -6.121918678283691, "global_step": 80944, "epoch": 1927} {"train_loss": -6.110581398010254, "global_step": 80945, "epoch": 1927} {"train_loss": -6.2117815017700195, "global_step": 80946, "epoch": 1927} {"train_loss": -6.220909118652344, "global_step": 80947, "epoch": 1927} {"train_loss": -6.024123191833496, "global_step": 80948, "epoch": 1927} {"train_loss": -6.147188663482666, "global_step": 80949, "epoch": 1927} {"train_loss": -6.103763580322266, "global_step": 80950, "epoch": 1927} {"train_loss": -6.159762382507324, "global_step": 80951, "epoch": 1927} {"train_loss": -6.129873275756836, "global_step": 80952, "epoch": 1927} {"train_loss": -6.170539855957031, "global_step": 80953, "epoch": 1927} {"train_loss": -6.0709638595581055, "global_step": 80954, "epoch": 1927} {"train_loss": -6.022711277008057, "global_step": 80955, "epoch": 1927} {"train_loss": -6.012209415435791, "global_step": 80956, "epoch": 1927} {"train_loss": -6.0756425857543945, "global_step": 80957, "epoch": 1927} {"train_loss": -6.076634407043457, "global_step": 80958, "epoch": 1927} {"train_loss": -6.107054710388184, "global_step": 80959, "epoch": 1927} {"train_loss": -6.050314903259277, "global_step": 80960, "epoch": 1927} {"train_loss": -6.173890113830566, "global_step": 80961, "epoch": 1927} {"train_loss": -6.163662433624268, "global_step": 80962, "epoch": 1927} {"train_loss": -6.195512771606445, "global_step": 80963, "epoch": 1927} {"train_loss": -6.102618217468262, "global_step": 80964, "epoch": 1927} {"train_loss": -6.124361038208008, "global_step": 80965, "epoch": 1927} {"train_loss": -6.108973503112793, "global_step": 80966, "epoch": 1927} {"train_loss": -6.185386657714844, "global_step": 80967, "epoch": 1927} {"train_loss": -6.213117599487305, "global_step": 80968, "epoch": 1927} {"train_loss": -6.220336437225342, "global_step": 80969, "epoch": 1927} {"train_loss": -6.147390842437744, "global_step": 80970, "epoch": 1927} {"train_loss": -6.1568193435668945, "global_step": 80971, "epoch": 1927} {"train_loss": -6.264638423919678, "global_step": 80972, "epoch": 1927} {"train_loss": -6.1398444175720215, "global_step": 80973, "epoch": 1927} {"train_loss": -6.281237602233887, "global_step": 80974, "epoch": 1927} {"train_loss": -6.136293399901617, "global_step": 80975, "epoch": 1927, "val_loss": 62333.5} {"train_loss": -6.232450485229492, "global_step": 80976, "epoch": 1928} {"train_loss": -6.141634941101074, "global_step": 80977, "epoch": 1928} {"train_loss": -6.216020584106445, "global_step": 80978, "epoch": 1928} {"train_loss": -6.138113021850586, "global_step": 80979, "epoch": 1928} {"train_loss": -6.186411380767822, "global_step": 80980, "epoch": 1928} {"train_loss": -6.206872940063477, "global_step": 80981, "epoch": 1928} {"train_loss": -6.2676262855529785, "global_step": 80982, "epoch": 1928} {"train_loss": -6.186798095703125, "global_step": 80983, "epoch": 1928} {"train_loss": -6.076401710510254, "global_step": 80984, "epoch": 1928} {"train_loss": -6.306668281555176, "global_step": 80985, "epoch": 1928} {"train_loss": -6.112674236297607, "global_step": 80986, "epoch": 1928} {"train_loss": -5.955924034118652, "global_step": 80987, "epoch": 1928} {"train_loss": -6.045658111572266, "global_step": 80988, "epoch": 1928} {"train_loss": -6.188301086425781, "global_step": 80989, "epoch": 1928} {"train_loss": -5.940760612487793, "global_step": 80990, "epoch": 1928} {"train_loss": -5.954679012298584, "global_step": 80991, "epoch": 1928} {"train_loss": -6.050013542175293, "global_step": 80992, "epoch": 1928} {"train_loss": -6.150658130645752, "global_step": 80993, "epoch": 1928} {"train_loss": -6.204257965087891, "global_step": 80994, "epoch": 1928} {"train_loss": -6.02493953704834, "global_step": 80995, "epoch": 1928} {"train_loss": -6.210111141204834, "global_step": 80996, "epoch": 1928} {"train_loss": -6.087423801422119, "global_step": 80997, "epoch": 1928} {"train_loss": -6.021806716918945, "global_step": 80998, "epoch": 1928} {"train_loss": -6.120199680328369, "global_step": 80999, "epoch": 1928} {"train_loss": -6.138987064361572, "global_step": 81000, "epoch": 1928} {"train_loss": -6.147091388702393, "global_step": 81001, "epoch": 1928} {"train_loss": -5.948085784912109, "global_step": 81002, "epoch": 1928} {"train_loss": -6.06440544128418, "global_step": 81003, "epoch": 1928} {"train_loss": -6.14622688293457, "global_step": 81004, "epoch": 1928} {"train_loss": -6.070213317871094, "global_step": 81005, "epoch": 1928} {"train_loss": -6.159191131591797, "global_step": 81006, "epoch": 1928} {"train_loss": -6.07984733581543, "global_step": 81007, "epoch": 1928} {"train_loss": -6.222209930419922, "global_step": 81008, "epoch": 1928} {"train_loss": -5.977036476135254, "global_step": 81009, "epoch": 1928} {"train_loss": -6.153079509735107, "global_step": 81010, "epoch": 1928} {"train_loss": -6.144806385040283, "global_step": 81011, "epoch": 1928} {"train_loss": -6.193235397338867, "global_step": 81012, "epoch": 1928} {"train_loss": -6.220918655395508, "global_step": 81013, "epoch": 1928} {"train_loss": -6.131399154663086, "global_step": 81014, "epoch": 1928} {"train_loss": -6.180663108825684, "global_step": 81015, "epoch": 1928} {"train_loss": -6.134045600891113, "global_step": 81016, "epoch": 1928} {"train_loss": -6.126426764896938, "global_step": 81017, "epoch": 1928, "val_loss": 62179.50390625} {"train_loss": -6.22652530670166, "global_step": 81018, "epoch": 1929} {"train_loss": -6.151176452636719, "global_step": 81019, "epoch": 1929} {"train_loss": -6.253438949584961, "global_step": 81020, "epoch": 1929} {"train_loss": -6.269632339477539, "global_step": 81021, "epoch": 1929} {"train_loss": -6.133079528808594, "global_step": 81022, "epoch": 1929} {"train_loss": -6.095096111297607, "global_step": 81023, "epoch": 1929} {"train_loss": -6.162736892700195, "global_step": 81024, "epoch": 1929} {"train_loss": -6.083155632019043, "global_step": 81025, "epoch": 1929} {"train_loss": -6.093520164489746, "global_step": 81026, "epoch": 1929} {"train_loss": -6.143594264984131, "global_step": 81027, "epoch": 1929} {"train_loss": -6.256192207336426, "global_step": 81028, "epoch": 1929} {"train_loss": -6.120486259460449, "global_step": 81029, "epoch": 1929} {"train_loss": -6.051770210266113, "global_step": 81030, "epoch": 1929} {"train_loss": -6.222358703613281, "global_step": 81031, "epoch": 1929} {"train_loss": -6.1086835861206055, "global_step": 81032, "epoch": 1929} {"train_loss": -6.136913299560547, "global_step": 81033, "epoch": 1929} {"train_loss": -6.1726226806640625, "global_step": 81034, "epoch": 1929} {"train_loss": -6.098926544189453, "global_step": 81035, "epoch": 1929} {"train_loss": -6.221777439117432, "global_step": 81036, "epoch": 1929} {"train_loss": -6.12095832824707, "global_step": 81037, "epoch": 1929} {"train_loss": -6.172600746154785, "global_step": 81038, "epoch": 1929} {"train_loss": -6.164722919464111, "global_step": 81039, "epoch": 1929} {"train_loss": -5.919942378997803, "global_step": 81040, "epoch": 1929} {"train_loss": -6.098767280578613, "global_step": 81041, "epoch": 1929} {"train_loss": -6.14646577835083, "global_step": 81042, "epoch": 1929} {"train_loss": -6.017324924468994, "global_step": 81043, "epoch": 1929} {"train_loss": -6.240413188934326, "global_step": 81044, "epoch": 1929} {"train_loss": -6.127997875213623, "global_step": 81045, "epoch": 1929} {"train_loss": -6.16409969329834, "global_step": 81046, "epoch": 1929} {"train_loss": -6.226226329803467, "global_step": 81047, "epoch": 1929} {"train_loss": -6.26950216293335, "global_step": 81048, "epoch": 1929} {"train_loss": -6.122957229614258, "global_step": 81049, "epoch": 1929} {"train_loss": -6.212989330291748, "global_step": 81050, "epoch": 1929} {"train_loss": -6.2420549392700195, "global_step": 81051, "epoch": 1929} {"train_loss": -6.216379642486572, "global_step": 81052, "epoch": 1929} {"train_loss": -6.197059154510498, "global_step": 81053, "epoch": 1929} {"train_loss": -6.118593692779541, "global_step": 81054, "epoch": 1929} {"train_loss": -6.078236103057861, "global_step": 81055, "epoch": 1929} {"train_loss": -6.305722236633301, "global_step": 81056, "epoch": 1929} {"train_loss": -6.280627250671387, "global_step": 81057, "epoch": 1929} {"train_loss": -6.004406929016113, "global_step": 81058, "epoch": 1929} {"train_loss": -6.157010725566319, "global_step": 81059, "epoch": 1929, "val_loss": 62543.80078125} {"train_loss": -6.159176826477051, "global_step": 81060, "epoch": 1930} {"train_loss": -6.054328918457031, "global_step": 81061, "epoch": 1930} {"train_loss": -6.2700910568237305, "global_step": 81062, "epoch": 1930} {"train_loss": -6.154789924621582, "global_step": 81063, "epoch": 1930} {"train_loss": -6.150073051452637, "global_step": 81064, "epoch": 1930} {"train_loss": -6.107829570770264, "global_step": 81065, "epoch": 1930} {"train_loss": -6.25956916809082, "global_step": 81066, "epoch": 1930} {"train_loss": -6.1582489013671875, "global_step": 81067, "epoch": 1930} {"train_loss": -6.287869453430176, "global_step": 81068, "epoch": 1930} {"train_loss": -6.040453910827637, "global_step": 81069, "epoch": 1930} {"train_loss": -6.240347385406494, "global_step": 81070, "epoch": 1930} {"train_loss": -6.179936408996582, "global_step": 81071, "epoch": 1930} {"train_loss": -6.2375898361206055, "global_step": 81072, "epoch": 1930} {"train_loss": -6.065526962280273, "global_step": 81073, "epoch": 1930} {"train_loss": -6.184294700622559, "global_step": 81074, "epoch": 1930} {"train_loss": -6.100824356079102, "global_step": 81075, "epoch": 1930} {"train_loss": -6.09230899810791, "global_step": 81076, "epoch": 1930} {"train_loss": -6.108698844909668, "global_step": 81077, "epoch": 1930} {"train_loss": -6.0102410316467285, "global_step": 81078, "epoch": 1930} {"train_loss": -6.2465972900390625, "global_step": 81079, "epoch": 1930} {"train_loss": -6.089108467102051, "global_step": 81080, "epoch": 1930} {"train_loss": -6.100339889526367, "global_step": 81081, "epoch": 1930} {"train_loss": -6.303249835968018, "global_step": 81082, "epoch": 1930} {"train_loss": -6.047809600830078, "global_step": 81083, "epoch": 1930} {"train_loss": -6.154193878173828, "global_step": 81084, "epoch": 1930} {"train_loss": -6.225984573364258, "global_step": 81085, "epoch": 1930} {"train_loss": -6.230982780456543, "global_step": 81086, "epoch": 1930} {"train_loss": -6.073891639709473, "global_step": 81087, "epoch": 1930} {"train_loss": -6.171561241149902, "global_step": 81088, "epoch": 1930} {"train_loss": -6.268239974975586, "global_step": 81089, "epoch": 1930} {"train_loss": -6.177367687225342, "global_step": 81090, "epoch": 1930} {"train_loss": -6.083415985107422, "global_step": 81091, "epoch": 1930} {"train_loss": -6.049465179443359, "global_step": 81092, "epoch": 1930} {"train_loss": -6.120586395263672, "global_step": 81093, "epoch": 1930} {"train_loss": -6.1128692626953125, "global_step": 81094, "epoch": 1930} {"train_loss": -6.268370628356934, "global_step": 81095, "epoch": 1930} {"train_loss": -6.181475639343262, "global_step": 81096, "epoch": 1930} {"train_loss": -6.127369403839111, "global_step": 81097, "epoch": 1930} {"train_loss": -6.122884750366211, "global_step": 81098, "epoch": 1930} {"train_loss": -6.247805595397949, "global_step": 81099, "epoch": 1930} {"train_loss": -6.170773029327393, "global_step": 81100, "epoch": 1930} {"train_loss": -6.155751375924973, "global_step": 81101, "epoch": 1930, "val_loss": 62366.40234375} {"train_loss": -6.177737236022949, "global_step": 81102, "epoch": 1931} {"train_loss": -6.215559959411621, "global_step": 81103, "epoch": 1931} {"train_loss": -6.2211127281188965, "global_step": 81104, "epoch": 1931} {"train_loss": -6.168063163757324, "global_step": 81105, "epoch": 1931} {"train_loss": -6.129058837890625, "global_step": 81106, "epoch": 1931} {"train_loss": -6.235895156860352, "global_step": 81107, "epoch": 1931} {"train_loss": -6.265538215637207, "global_step": 81108, "epoch": 1931} {"train_loss": -6.143641471862793, "global_step": 81109, "epoch": 1931} {"train_loss": -6.217138290405273, "global_step": 81110, "epoch": 1931} {"train_loss": -6.141523838043213, "global_step": 81111, "epoch": 1931} {"train_loss": -6.200831413269043, "global_step": 81112, "epoch": 1931} {"train_loss": -6.136262893676758, "global_step": 81113, "epoch": 1931} {"train_loss": -6.062640190124512, "global_step": 81114, "epoch": 1931} {"train_loss": -6.1856489181518555, "global_step": 81115, "epoch": 1931} {"train_loss": -6.124475479125977, "global_step": 81116, "epoch": 1931} {"train_loss": -6.180811405181885, "global_step": 81117, "epoch": 1931} {"train_loss": -6.153714179992676, "global_step": 81118, "epoch": 1931} {"train_loss": -6.229158878326416, "global_step": 81119, "epoch": 1931} {"train_loss": -6.18117618560791, "global_step": 81120, "epoch": 1931} {"train_loss": -6.192585468292236, "global_step": 81121, "epoch": 1931} {"train_loss": -6.188752174377441, "global_step": 81122, "epoch": 1931} {"train_loss": -6.204337120056152, "global_step": 81123, "epoch": 1931} {"train_loss": -6.114472389221191, "global_step": 81124, "epoch": 1931} {"train_loss": -6.282149314880371, "global_step": 81125, "epoch": 1931} {"train_loss": -6.1997270584106445, "global_step": 81126, "epoch": 1931} {"train_loss": -6.129460334777832, "global_step": 81127, "epoch": 1931} {"train_loss": -6.208821773529053, "global_step": 81128, "epoch": 1931} {"train_loss": -6.2100019454956055, "global_step": 81129, "epoch": 1931} {"train_loss": -6.157649040222168, "global_step": 81130, "epoch": 1931} {"train_loss": -6.211542129516602, "global_step": 81131, "epoch": 1931} {"train_loss": -6.004663467407227, "global_step": 81132, "epoch": 1931} {"train_loss": -6.192748546600342, "global_step": 81133, "epoch": 1931} {"train_loss": -6.082305908203125, "global_step": 81134, "epoch": 1931} {"train_loss": -6.18702507019043, "global_step": 81135, "epoch": 1931} {"train_loss": -6.1619086265563965, "global_step": 81136, "epoch": 1931} {"train_loss": -6.229798793792725, "global_step": 81137, "epoch": 1931} {"train_loss": -6.156818389892578, "global_step": 81138, "epoch": 1931} {"train_loss": -6.131032943725586, "global_step": 81139, "epoch": 1931} {"train_loss": -6.159801483154297, "global_step": 81140, "epoch": 1931} {"train_loss": -6.211149215698242, "global_step": 81141, "epoch": 1931} {"train_loss": -6.155159950256348, "global_step": 81142, "epoch": 1931} {"train_loss": -6.174221368063064, "global_step": 81143, "epoch": 1931, "val_loss": 62414.52734375} {"train_loss": -6.070983409881592, "global_step": 81144, "epoch": 1932} {"train_loss": -6.112608432769775, "global_step": 81145, "epoch": 1932} {"train_loss": -6.204592704772949, "global_step": 81146, "epoch": 1932} {"train_loss": -6.210526943206787, "global_step": 81147, "epoch": 1932} {"train_loss": -6.125400543212891, "global_step": 81148, "epoch": 1932} {"train_loss": -6.084080219268799, "global_step": 81149, "epoch": 1932} {"train_loss": -6.142824172973633, "global_step": 81150, "epoch": 1932} {"train_loss": -6.105146408081055, "global_step": 81151, "epoch": 1932} {"train_loss": -6.116858005523682, "global_step": 81152, "epoch": 1932} {"train_loss": -6.148481845855713, "global_step": 81153, "epoch": 1932} {"train_loss": -6.229879379272461, "global_step": 81154, "epoch": 1932} {"train_loss": -6.273808002471924, "global_step": 81155, "epoch": 1932} {"train_loss": -6.1414594650268555, "global_step": 81156, "epoch": 1932} {"train_loss": -6.2515058517456055, "global_step": 81157, "epoch": 1932} {"train_loss": -6.104438781738281, "global_step": 81158, "epoch": 1932} {"train_loss": -6.199844837188721, "global_step": 81159, "epoch": 1932} {"train_loss": -6.1486406326293945, "global_step": 81160, "epoch": 1932} {"train_loss": -6.1146955490112305, "global_step": 81161, "epoch": 1932} {"train_loss": -6.184442520141602, "global_step": 81162, "epoch": 1932} {"train_loss": -6.135475158691406, "global_step": 81163, "epoch": 1932} {"train_loss": -6.153739929199219, "global_step": 81164, "epoch": 1932} {"train_loss": -6.248315811157227, "global_step": 81165, "epoch": 1932} {"train_loss": -6.161023139953613, "global_step": 81166, "epoch": 1932} {"train_loss": -6.120121479034424, "global_step": 81167, "epoch": 1932} {"train_loss": -6.043394088745117, "global_step": 81168, "epoch": 1932} {"train_loss": -6.138216018676758, "global_step": 81169, "epoch": 1932} {"train_loss": -6.170138835906982, "global_step": 81170, "epoch": 1932} {"train_loss": -6.142004013061523, "global_step": 81171, "epoch": 1932} {"train_loss": -6.043103218078613, "global_step": 81172, "epoch": 1932} {"train_loss": -6.1430277824401855, "global_step": 81173, "epoch": 1932} {"train_loss": -6.219806671142578, "global_step": 81174, "epoch": 1932} {"train_loss": -6.1638031005859375, "global_step": 81175, "epoch": 1932} {"train_loss": -6.090743541717529, "global_step": 81176, "epoch": 1932} {"train_loss": -6.262866497039795, "global_step": 81177, "epoch": 1932} {"train_loss": -6.167506217956543, "global_step": 81178, "epoch": 1932} {"train_loss": -6.195849418640137, "global_step": 81179, "epoch": 1932} {"train_loss": -6.213293075561523, "global_step": 81180, "epoch": 1932} {"train_loss": -6.214053153991699, "global_step": 81181, "epoch": 1932} {"train_loss": -6.291488170623779, "global_step": 81182, "epoch": 1932} {"train_loss": -6.248769760131836, "global_step": 81183, "epoch": 1932} {"train_loss": -6.111474990844727, "global_step": 81184, "epoch": 1932} {"train_loss": -6.16238994825454, "global_step": 81185, "epoch": 1932, "val_loss": 62286.50390625} {"train_loss": -6.189159393310547, "global_step": 81186, "epoch": 1933} {"train_loss": -6.196537017822266, "global_step": 81187, "epoch": 1933} {"train_loss": -6.203261375427246, "global_step": 81188, "epoch": 1933} {"train_loss": -6.132509708404541, "global_step": 81189, "epoch": 1933} {"train_loss": -6.10719108581543, "global_step": 81190, "epoch": 1933} {"train_loss": -6.1757283210754395, "global_step": 81191, "epoch": 1933} {"train_loss": -6.119973659515381, "global_step": 81192, "epoch": 1933} {"train_loss": -6.220475673675537, "global_step": 81193, "epoch": 1933} {"train_loss": -6.19936466217041, "global_step": 81194, "epoch": 1933} {"train_loss": -6.153858184814453, "global_step": 81195, "epoch": 1933} {"train_loss": -6.129707336425781, "global_step": 81196, "epoch": 1933} {"train_loss": -6.18463134765625, "global_step": 81197, "epoch": 1933} {"train_loss": -6.016141414642334, "global_step": 81198, "epoch": 1933} {"train_loss": -6.192004680633545, "global_step": 81199, "epoch": 1933} {"train_loss": -6.123976707458496, "global_step": 81200, "epoch": 1933} {"train_loss": -6.2523651123046875, "global_step": 81201, "epoch": 1933} {"train_loss": -6.153719902038574, "global_step": 81202, "epoch": 1933} {"train_loss": -6.134777069091797, "global_step": 81203, "epoch": 1933} {"train_loss": -6.206666946411133, "global_step": 81204, "epoch": 1933} {"train_loss": -6.133944034576416, "global_step": 81205, "epoch": 1933} {"train_loss": -6.2321014404296875, "global_step": 81206, "epoch": 1933} {"train_loss": -6.158290863037109, "global_step": 81207, "epoch": 1933} {"train_loss": -6.161809921264648, "global_step": 81208, "epoch": 1933} {"train_loss": -6.205817699432373, "global_step": 81209, "epoch": 1933} {"train_loss": -6.139244556427002, "global_step": 81210, "epoch": 1933} {"train_loss": -6.221169948577881, "global_step": 81211, "epoch": 1933} {"train_loss": -6.095096588134766, "global_step": 81212, "epoch": 1933} {"train_loss": -6.17989444732666, "global_step": 81213, "epoch": 1933} {"train_loss": -6.22636604309082, "global_step": 81214, "epoch": 1933} {"train_loss": -6.109561920166016, "global_step": 81215, "epoch": 1933} {"train_loss": -6.112204074859619, "global_step": 81216, "epoch": 1933} {"train_loss": -6.177239418029785, "global_step": 81217, "epoch": 1933} {"train_loss": -6.133175849914551, "global_step": 81218, "epoch": 1933} {"train_loss": -6.167579174041748, "global_step": 81219, "epoch": 1933} {"train_loss": -6.080124378204346, "global_step": 81220, "epoch": 1933} {"train_loss": -6.128324508666992, "global_step": 81221, "epoch": 1933} {"train_loss": -6.261928081512451, "global_step": 81222, "epoch": 1933} {"train_loss": -6.153147220611572, "global_step": 81223, "epoch": 1933} {"train_loss": -6.09457540512085, "global_step": 81224, "epoch": 1933} {"train_loss": -6.09742546081543, "global_step": 81225, "epoch": 1933} {"train_loss": -6.097615718841553, "global_step": 81226, "epoch": 1933} {"train_loss": -6.157340061096918, "global_step": 81227, "epoch": 1933, "val_loss": 62397.0859375} {"train_loss": -6.188185691833496, "global_step": 81228, "epoch": 1934} {"train_loss": -6.153158187866211, "global_step": 81229, "epoch": 1934} {"train_loss": -6.2638654708862305, "global_step": 81230, "epoch": 1934} {"train_loss": -6.2139363288879395, "global_step": 81231, "epoch": 1934} {"train_loss": -6.233736515045166, "global_step": 81232, "epoch": 1934} {"train_loss": -6.135385513305664, "global_step": 81233, "epoch": 1934} {"train_loss": -6.3119916915893555, "global_step": 81234, "epoch": 1934} {"train_loss": -6.037846565246582, "global_step": 81235, "epoch": 1934} {"train_loss": -6.047854900360107, "global_step": 81236, "epoch": 1934} {"train_loss": -6.219416618347168, "global_step": 81237, "epoch": 1934} {"train_loss": -6.123530387878418, "global_step": 81238, "epoch": 1934} {"train_loss": -6.269799709320068, "global_step": 81239, "epoch": 1934} {"train_loss": -6.22542667388916, "global_step": 81240, "epoch": 1934} {"train_loss": -6.176799774169922, "global_step": 81241, "epoch": 1934} {"train_loss": -6.18619966506958, "global_step": 81242, "epoch": 1934} {"train_loss": -6.183465003967285, "global_step": 81243, "epoch": 1934} {"train_loss": -6.219964981079102, "global_step": 81244, "epoch": 1934} {"train_loss": -6.1997528076171875, "global_step": 81245, "epoch": 1934} {"train_loss": -6.209831237792969, "global_step": 81246, "epoch": 1934} {"train_loss": -6.155767917633057, "global_step": 81247, "epoch": 1934} {"train_loss": -6.181475639343262, "global_step": 81248, "epoch": 1934} {"train_loss": -6.229280471801758, "global_step": 81249, "epoch": 1934} {"train_loss": -6.160651206970215, "global_step": 81250, "epoch": 1934} {"train_loss": -6.210000991821289, "global_step": 81251, "epoch": 1934} {"train_loss": -6.095901012420654, "global_step": 81252, "epoch": 1934} {"train_loss": -5.979812145233154, "global_step": 81253, "epoch": 1934} {"train_loss": -6.116846084594727, "global_step": 81254, "epoch": 1934} {"train_loss": -6.029910087585449, "global_step": 81255, "epoch": 1934} {"train_loss": -6.002880096435547, "global_step": 81256, "epoch": 1934} {"train_loss": -6.164201736450195, "global_step": 81257, "epoch": 1934} {"train_loss": -6.054081439971924, "global_step": 81258, "epoch": 1934} {"train_loss": -6.166330337524414, "global_step": 81259, "epoch": 1934} {"train_loss": -6.1685004234313965, "global_step": 81260, "epoch": 1934} {"train_loss": -6.131892204284668, "global_step": 81261, "epoch": 1934} {"train_loss": -6.144178867340088, "global_step": 81262, "epoch": 1934} {"train_loss": -6.123926639556885, "global_step": 81263, "epoch": 1934} {"train_loss": -6.244986534118652, "global_step": 81264, "epoch": 1934} {"train_loss": -6.199388027191162, "global_step": 81265, "epoch": 1934} {"train_loss": -6.127962589263916, "global_step": 81266, "epoch": 1934} {"train_loss": -6.180809020996094, "global_step": 81267, "epoch": 1934} {"train_loss": -6.226849555969238, "global_step": 81268, "epoch": 1934} {"train_loss": -6.16218866620745, "global_step": 81269, "epoch": 1934, "val_loss": 62444.70703125} {"train_loss": -6.064251899719238, "global_step": 81270, "epoch": 1935} {"train_loss": -6.302980422973633, "global_step": 81271, "epoch": 1935} {"train_loss": -6.1031174659729, "global_step": 81272, "epoch": 1935} {"train_loss": -6.268211364746094, "global_step": 81273, "epoch": 1935} {"train_loss": -6.0965895652771, "global_step": 81274, "epoch": 1935} {"train_loss": -6.265575885772705, "global_step": 81275, "epoch": 1935} {"train_loss": -6.268609523773193, "global_step": 81276, "epoch": 1935} {"train_loss": -6.283843040466309, "global_step": 81277, "epoch": 1935} {"train_loss": -6.078000068664551, "global_step": 81278, "epoch": 1935} {"train_loss": -6.150461196899414, "global_step": 81279, "epoch": 1935} {"train_loss": -6.247736930847168, "global_step": 81280, "epoch": 1935} {"train_loss": -6.147424221038818, "global_step": 81281, "epoch": 1935} {"train_loss": -6.16119909286499, "global_step": 81282, "epoch": 1935} {"train_loss": -6.3358917236328125, "global_step": 81283, "epoch": 1935} {"train_loss": -6.073120594024658, "global_step": 81284, "epoch": 1935} {"train_loss": -6.137396812438965, "global_step": 81285, "epoch": 1935} {"train_loss": -6.1561737060546875, "global_step": 81286, "epoch": 1935} {"train_loss": -6.190962791442871, "global_step": 81287, "epoch": 1935} {"train_loss": -6.15668249130249, "global_step": 81288, "epoch": 1935} {"train_loss": -6.174692153930664, "global_step": 81289, "epoch": 1935} {"train_loss": -6.079789638519287, "global_step": 81290, "epoch": 1935} {"train_loss": -6.119050025939941, "global_step": 81291, "epoch": 1935} {"train_loss": -6.220643997192383, "global_step": 81292, "epoch": 1935} {"train_loss": -6.205172538757324, "global_step": 81293, "epoch": 1935} {"train_loss": -6.262203216552734, "global_step": 81294, "epoch": 1935} {"train_loss": -6.224315643310547, "global_step": 81295, "epoch": 1935} {"train_loss": -6.276707649230957, "global_step": 81296, "epoch": 1935} {"train_loss": -6.105372428894043, "global_step": 81297, "epoch": 1935} {"train_loss": -6.163039207458496, "global_step": 81298, "epoch": 1935} {"train_loss": -6.095427513122559, "global_step": 81299, "epoch": 1935} {"train_loss": -6.1607441902160645, "global_step": 81300, "epoch": 1935} {"train_loss": -6.235930442810059, "global_step": 81301, "epoch": 1935} {"train_loss": -6.005719184875488, "global_step": 81302, "epoch": 1935} {"train_loss": -5.958834648132324, "global_step": 81303, "epoch": 1935} {"train_loss": -6.175358772277832, "global_step": 81304, "epoch": 1935} {"train_loss": -6.094066619873047, "global_step": 81305, "epoch": 1935} {"train_loss": -6.046103477478027, "global_step": 81306, "epoch": 1935} {"train_loss": -6.088876724243164, "global_step": 81307, "epoch": 1935} {"train_loss": -6.056532382965088, "global_step": 81308, "epoch": 1935} {"train_loss": -6.12755823135376, "global_step": 81309, "epoch": 1935} {"train_loss": -6.196275234222412, "global_step": 81310, "epoch": 1935} {"train_loss": -6.156898793720064, "global_step": 81311, "epoch": 1935, "val_loss": 62417.0390625} {"train_loss": -6.017438888549805, "global_step": 81312, "epoch": 1936} {"train_loss": -6.183688163757324, "global_step": 81313, "epoch": 1936} {"train_loss": -6.156324863433838, "global_step": 81314, "epoch": 1936} {"train_loss": -6.242434501647949, "global_step": 81315, "epoch": 1936} {"train_loss": -6.219446659088135, "global_step": 81316, "epoch": 1936} {"train_loss": -6.047123908996582, "global_step": 81317, "epoch": 1936} {"train_loss": -6.225201606750488, "global_step": 81318, "epoch": 1936} {"train_loss": -6.066338539123535, "global_step": 81319, "epoch": 1936} {"train_loss": -6.106539249420166, "global_step": 81320, "epoch": 1936} {"train_loss": -6.1181721687316895, "global_step": 81321, "epoch": 1936} {"train_loss": -6.189894676208496, "global_step": 81322, "epoch": 1936} {"train_loss": -6.006168365478516, "global_step": 81323, "epoch": 1936} {"train_loss": -6.122907638549805, "global_step": 81324, "epoch": 1936} {"train_loss": -6.150547981262207, "global_step": 81325, "epoch": 1936} {"train_loss": -6.109836101531982, "global_step": 81326, "epoch": 1936} {"train_loss": -6.184414863586426, "global_step": 81327, "epoch": 1936} {"train_loss": -6.089023590087891, "global_step": 81328, "epoch": 1936} {"train_loss": -6.126378059387207, "global_step": 81329, "epoch": 1936} {"train_loss": -6.199770927429199, "global_step": 81330, "epoch": 1936} {"train_loss": -6.076565742492676, "global_step": 81331, "epoch": 1936} {"train_loss": -6.078472137451172, "global_step": 81332, "epoch": 1936} {"train_loss": -6.0248799324035645, "global_step": 81333, "epoch": 1936} {"train_loss": -6.173223495483398, "global_step": 81334, "epoch": 1936} {"train_loss": -6.115864276885986, "global_step": 81335, "epoch": 1936} {"train_loss": -6.204658508300781, "global_step": 81336, "epoch": 1936} {"train_loss": -6.191562175750732, "global_step": 81337, "epoch": 1936} {"train_loss": -6.2115278244018555, "global_step": 81338, "epoch": 1936} {"train_loss": -6.144082069396973, "global_step": 81339, "epoch": 1936} {"train_loss": -6.116686820983887, "global_step": 81340, "epoch": 1936} {"train_loss": -6.129288673400879, "global_step": 81341, "epoch": 1936} {"train_loss": -6.086220741271973, "global_step": 81342, "epoch": 1936} {"train_loss": -6.091876983642578, "global_step": 81343, "epoch": 1936} {"train_loss": -6.169088363647461, "global_step": 81344, "epoch": 1936} {"train_loss": -6.09548282623291, "global_step": 81345, "epoch": 1936} {"train_loss": -6.0426836013793945, "global_step": 81346, "epoch": 1936} {"train_loss": -6.033563613891602, "global_step": 81347, "epoch": 1936} {"train_loss": -6.146670341491699, "global_step": 81348, "epoch": 1936} {"train_loss": -6.140031814575195, "global_step": 81349, "epoch": 1936} {"train_loss": -6.18258810043335, "global_step": 81350, "epoch": 1936} {"train_loss": -6.171346664428711, "global_step": 81351, "epoch": 1936} {"train_loss": -6.124377250671387, "global_step": 81352, "epoch": 1936} {"train_loss": -6.127321231932867, "global_step": 81353, "epoch": 1936, "val_loss": 62572.8125} {"train_loss": -6.036053657531738, "global_step": 81354, "epoch": 1937} {"train_loss": -6.073291778564453, "global_step": 81355, "epoch": 1937} {"train_loss": -6.185009956359863, "global_step": 81356, "epoch": 1937} {"train_loss": -6.166132926940918, "global_step": 81357, "epoch": 1937} {"train_loss": -6.032849311828613, "global_step": 81358, "epoch": 1937} {"train_loss": -6.1768798828125, "global_step": 81359, "epoch": 1937} {"train_loss": -6.118894100189209, "global_step": 81360, "epoch": 1937} {"train_loss": -6.152924537658691, "global_step": 81361, "epoch": 1937} {"train_loss": -6.12693452835083, "global_step": 81362, "epoch": 1937} {"train_loss": -6.052845478057861, "global_step": 81363, "epoch": 1937} {"train_loss": -6.126087188720703, "global_step": 81364, "epoch": 1937} {"train_loss": -6.1208391189575195, "global_step": 81365, "epoch": 1937} {"train_loss": -6.142266273498535, "global_step": 81366, "epoch": 1937} {"train_loss": -6.078836917877197, "global_step": 81367, "epoch": 1937} {"train_loss": -6.077083110809326, "global_step": 81368, "epoch": 1937} {"train_loss": -6.156279563903809, "global_step": 81369, "epoch": 1937} {"train_loss": -6.120650291442871, "global_step": 81370, "epoch": 1937} {"train_loss": -6.15847110748291, "global_step": 81371, "epoch": 1937} {"train_loss": -6.047226905822754, "global_step": 81372, "epoch": 1937} {"train_loss": -6.123285293579102, "global_step": 81373, "epoch": 1937} {"train_loss": -6.1733622550964355, "global_step": 81374, "epoch": 1937} {"train_loss": -6.182893753051758, "global_step": 81375, "epoch": 1937} {"train_loss": -6.172763347625732, "global_step": 81376, "epoch": 1937} {"train_loss": -6.098837852478027, "global_step": 81377, "epoch": 1937} {"train_loss": -6.104787826538086, "global_step": 81378, "epoch": 1937} {"train_loss": -6.08633279800415, "global_step": 81379, "epoch": 1937} {"train_loss": -6.097330093383789, "global_step": 81380, "epoch": 1937} {"train_loss": -6.146720886230469, "global_step": 81381, "epoch": 1937} {"train_loss": -6.109282970428467, "global_step": 81382, "epoch": 1937} {"train_loss": -6.156838417053223, "global_step": 81383, "epoch": 1937} {"train_loss": -6.09914493560791, "global_step": 81384, "epoch": 1937} {"train_loss": -6.18226432800293, "global_step": 81385, "epoch": 1937} {"train_loss": -6.047963619232178, "global_step": 81386, "epoch": 1937} {"train_loss": -6.092339038848877, "global_step": 81387, "epoch": 1937} {"train_loss": -6.088572978973389, "global_step": 81388, "epoch": 1937} {"train_loss": -6.282899856567383, "global_step": 81389, "epoch": 1937} {"train_loss": -6.2123308181762695, "global_step": 81390, "epoch": 1937} {"train_loss": -6.119377613067627, "global_step": 81391, "epoch": 1937} {"train_loss": -6.162482738494873, "global_step": 81392, "epoch": 1937} {"train_loss": -6.260021209716797, "global_step": 81393, "epoch": 1937} {"train_loss": -6.168778896331787, "global_step": 81394, "epoch": 1937} {"train_loss": -6.131399097896757, "global_step": 81395, "epoch": 1937, "val_loss": 62588.2109375} {"train_loss": -6.040293216705322, "global_step": 81396, "epoch": 1938} {"train_loss": -6.215405464172363, "global_step": 81397, "epoch": 1938} {"train_loss": -6.105915069580078, "global_step": 81398, "epoch": 1938} {"train_loss": -6.245224952697754, "global_step": 81399, "epoch": 1938} {"train_loss": -6.242274284362793, "global_step": 81400, "epoch": 1938} {"train_loss": -6.114719390869141, "global_step": 81401, "epoch": 1938} {"train_loss": -6.109947204589844, "global_step": 81402, "epoch": 1938} {"train_loss": -6.205886363983154, "global_step": 81403, "epoch": 1938} {"train_loss": -6.27281379699707, "global_step": 81404, "epoch": 1938} {"train_loss": -6.195914268493652, "global_step": 81405, "epoch": 1938} {"train_loss": -6.143354892730713, "global_step": 81406, "epoch": 1938} {"train_loss": -6.155123233795166, "global_step": 81407, "epoch": 1938} {"train_loss": -6.170814514160156, "global_step": 81408, "epoch": 1938} {"train_loss": -6.076940536499023, "global_step": 81409, "epoch": 1938} {"train_loss": -6.224617004394531, "global_step": 81410, "epoch": 1938} {"train_loss": -6.139005184173584, "global_step": 81411, "epoch": 1938} {"train_loss": -6.142416000366211, "global_step": 81412, "epoch": 1938} {"train_loss": -6.222777366638184, "global_step": 81413, "epoch": 1938} {"train_loss": -6.229938507080078, "global_step": 81414, "epoch": 1938} {"train_loss": -6.156708240509033, "global_step": 81415, "epoch": 1938} {"train_loss": -6.100490570068359, "global_step": 81416, "epoch": 1938} {"train_loss": -6.252460479736328, "global_step": 81417, "epoch": 1938} {"train_loss": -6.165866851806641, "global_step": 81418, "epoch": 1938} {"train_loss": -6.230469703674316, "global_step": 81419, "epoch": 1938} {"train_loss": -6.15771484375, "global_step": 81420, "epoch": 1938} {"train_loss": -6.135985374450684, "global_step": 81421, "epoch": 1938} {"train_loss": -6.251613616943359, "global_step": 81422, "epoch": 1938} {"train_loss": -6.186454772949219, "global_step": 81423, "epoch": 1938} {"train_loss": -6.2420244216918945, "global_step": 81424, "epoch": 1938} {"train_loss": -6.208950996398926, "global_step": 81425, "epoch": 1938} {"train_loss": -6.0721917152404785, "global_step": 81426, "epoch": 1938} {"train_loss": -6.1646199226379395, "global_step": 81427, "epoch": 1938} {"train_loss": -6.224785327911377, "global_step": 81428, "epoch": 1938} {"train_loss": -6.158214092254639, "global_step": 81429, "epoch": 1938} {"train_loss": -6.23853874206543, "global_step": 81430, "epoch": 1938} {"train_loss": -6.184473514556885, "global_step": 81431, "epoch": 1938} {"train_loss": -6.168482780456543, "global_step": 81432, "epoch": 1938} {"train_loss": -6.204656600952148, "global_step": 81433, "epoch": 1938} {"train_loss": -6.194035053253174, "global_step": 81434, "epoch": 1938} {"train_loss": -6.106850624084473, "global_step": 81435, "epoch": 1938} {"train_loss": -6.041741847991943, "global_step": 81436, "epoch": 1938} {"train_loss": -6.173839818863642, "global_step": 81437, "epoch": 1938, "val_loss": 62499.58203125} {"train_loss": -6.123708248138428, "global_step": 81438, "epoch": 1939} {"train_loss": -6.063648700714111, "global_step": 81439, "epoch": 1939} {"train_loss": -6.196193218231201, "global_step": 81440, "epoch": 1939} {"train_loss": -6.160793304443359, "global_step": 81441, "epoch": 1939} {"train_loss": -6.188423156738281, "global_step": 81442, "epoch": 1939} {"train_loss": -6.0288615226745605, "global_step": 81443, "epoch": 1939} {"train_loss": -6.037375450134277, "global_step": 81444, "epoch": 1939} {"train_loss": -6.1281328201293945, "global_step": 81445, "epoch": 1939} {"train_loss": -6.165713310241699, "global_step": 81446, "epoch": 1939} {"train_loss": -6.123454570770264, "global_step": 81447, "epoch": 1939} {"train_loss": -6.106217861175537, "global_step": 81448, "epoch": 1939} {"train_loss": -6.2226457595825195, "global_step": 81449, "epoch": 1939} {"train_loss": -6.1250104904174805, "global_step": 81450, "epoch": 1939} {"train_loss": -6.069110870361328, "global_step": 81451, "epoch": 1939} {"train_loss": -6.187614440917969, "global_step": 81452, "epoch": 1939} {"train_loss": -6.173958778381348, "global_step": 81453, "epoch": 1939} {"train_loss": -6.1714582443237305, "global_step": 81454, "epoch": 1939} {"train_loss": -6.159494876861572, "global_step": 81455, "epoch": 1939} {"train_loss": -6.107150077819824, "global_step": 81456, "epoch": 1939} {"train_loss": -6.129632472991943, "global_step": 81457, "epoch": 1939} {"train_loss": -6.171934604644775, "global_step": 81458, "epoch": 1939} {"train_loss": -6.251222133636475, "global_step": 81459, "epoch": 1939} {"train_loss": -6.25330114364624, "global_step": 81460, "epoch": 1939} {"train_loss": -6.163897514343262, "global_step": 81461, "epoch": 1939} {"train_loss": -6.150311470031738, "global_step": 81462, "epoch": 1939} {"train_loss": -6.049704551696777, "global_step": 81463, "epoch": 1939} {"train_loss": -6.257053375244141, "global_step": 81464, "epoch": 1939} {"train_loss": -6.201807975769043, "global_step": 81465, "epoch": 1939} {"train_loss": -6.233677864074707, "global_step": 81466, "epoch": 1939} {"train_loss": -6.2121782302856445, "global_step": 81467, "epoch": 1939} {"train_loss": -6.164862155914307, "global_step": 81468, "epoch": 1939} {"train_loss": -6.174658298492432, "global_step": 81469, "epoch": 1939} {"train_loss": -6.224133491516113, "global_step": 81470, "epoch": 1939} {"train_loss": -6.260293483734131, "global_step": 81471, "epoch": 1939} {"train_loss": -6.243781566619873, "global_step": 81472, "epoch": 1939} {"train_loss": -6.2447662353515625, "global_step": 81473, "epoch": 1939} {"train_loss": -6.139588832855225, "global_step": 81474, "epoch": 1939} {"train_loss": -6.087457656860352, "global_step": 81475, "epoch": 1939} {"train_loss": -6.073448657989502, "global_step": 81476, "epoch": 1939} {"train_loss": -6.146462440490723, "global_step": 81477, "epoch": 1939} {"train_loss": -6.019561767578125, "global_step": 81478, "epoch": 1939} {"train_loss": -6.156555913743519, "global_step": 81479, "epoch": 1939, "val_loss": 62569.609375} {"train_loss": -6.196926116943359, "global_step": 81480, "epoch": 1940} {"train_loss": -6.041418075561523, "global_step": 81481, "epoch": 1940} {"train_loss": -6.132589340209961, "global_step": 81482, "epoch": 1940} {"train_loss": -6.182378768920898, "global_step": 81483, "epoch": 1940} {"train_loss": -6.0481743812561035, "global_step": 81484, "epoch": 1940} {"train_loss": -6.165431976318359, "global_step": 81485, "epoch": 1940} {"train_loss": -6.121927261352539, "global_step": 81486, "epoch": 1940} {"train_loss": -6.14653205871582, "global_step": 81487, "epoch": 1940} {"train_loss": -6.10010290145874, "global_step": 81488, "epoch": 1940} {"train_loss": -6.090663433074951, "global_step": 81489, "epoch": 1940} {"train_loss": -6.125036239624023, "global_step": 81490, "epoch": 1940} {"train_loss": -6.248255729675293, "global_step": 81491, "epoch": 1940} {"train_loss": -6.257338047027588, "global_step": 81492, "epoch": 1940} {"train_loss": -6.22797155380249, "global_step": 81493, "epoch": 1940} {"train_loss": -6.116659164428711, "global_step": 81494, "epoch": 1940} {"train_loss": -6.206865310668945, "global_step": 81495, "epoch": 1940} {"train_loss": -6.199909210205078, "global_step": 81496, "epoch": 1940} {"train_loss": -6.187227249145508, "global_step": 81497, "epoch": 1940} {"train_loss": -6.189024925231934, "global_step": 81498, "epoch": 1940} {"train_loss": -6.2273712158203125, "global_step": 81499, "epoch": 1940} {"train_loss": -6.159328460693359, "global_step": 81500, "epoch": 1940} {"train_loss": -6.181885719299316, "global_step": 81501, "epoch": 1940} {"train_loss": -6.168097496032715, "global_step": 81502, "epoch": 1940} {"train_loss": -6.209141731262207, "global_step": 81503, "epoch": 1940} {"train_loss": -6.2389068603515625, "global_step": 81504, "epoch": 1940} {"train_loss": -6.16641902923584, "global_step": 81505, "epoch": 1940} {"train_loss": -6.108667373657227, "global_step": 81506, "epoch": 1940} {"train_loss": -6.16792106628418, "global_step": 81507, "epoch": 1940} {"train_loss": -6.196608066558838, "global_step": 81508, "epoch": 1940} {"train_loss": -6.200583457946777, "global_step": 81509, "epoch": 1940} {"train_loss": -6.192468166351318, "global_step": 81510, "epoch": 1940} {"train_loss": -6.171475410461426, "global_step": 81511, "epoch": 1940} {"train_loss": -6.232416152954102, "global_step": 81512, "epoch": 1940} {"train_loss": -6.127101898193359, "global_step": 81513, "epoch": 1940} {"train_loss": -6.159440040588379, "global_step": 81514, "epoch": 1940} {"train_loss": -6.202350616455078, "global_step": 81515, "epoch": 1940} {"train_loss": -6.177148342132568, "global_step": 81516, "epoch": 1940} {"train_loss": -6.032711505889893, "global_step": 81517, "epoch": 1940} {"train_loss": -6.050534248352051, "global_step": 81518, "epoch": 1940} {"train_loss": -6.150263786315918, "global_step": 81519, "epoch": 1940} {"train_loss": -6.160966396331787, "global_step": 81520, "epoch": 1940} {"train_loss": -6.160541261945452, "global_step": 81521, "epoch": 1940, "val_loss": 62123.47265625} {"train_loss": -6.2031660079956055, "global_step": 81522, "epoch": 1941} {"train_loss": -6.191997528076172, "global_step": 81523, "epoch": 1941} {"train_loss": -6.1642165184021, "global_step": 81524, "epoch": 1941} {"train_loss": -6.102377891540527, "global_step": 81525, "epoch": 1941} {"train_loss": -6.115492343902588, "global_step": 81526, "epoch": 1941} {"train_loss": -6.224690914154053, "global_step": 81527, "epoch": 1941} {"train_loss": -6.257863521575928, "global_step": 81528, "epoch": 1941} {"train_loss": -6.123592376708984, "global_step": 81529, "epoch": 1941} {"train_loss": -6.096764087677002, "global_step": 81530, "epoch": 1941} {"train_loss": -6.026439189910889, "global_step": 81531, "epoch": 1941} {"train_loss": -6.186919212341309, "global_step": 81532, "epoch": 1941} {"train_loss": -6.22023868560791, "global_step": 81533, "epoch": 1941} {"train_loss": -6.093972206115723, "global_step": 81534, "epoch": 1941} {"train_loss": -6.126836776733398, "global_step": 81535, "epoch": 1941} {"train_loss": -6.080999374389648, "global_step": 81536, "epoch": 1941} {"train_loss": -6.102735996246338, "global_step": 81537, "epoch": 1941} {"train_loss": -6.0953898429870605, "global_step": 81538, "epoch": 1941} {"train_loss": -6.161916732788086, "global_step": 81539, "epoch": 1941} {"train_loss": -6.1758012771606445, "global_step": 81540, "epoch": 1941} {"train_loss": -6.179549694061279, "global_step": 81541, "epoch": 1941} {"train_loss": -6.235488414764404, "global_step": 81542, "epoch": 1941} {"train_loss": -6.212484836578369, "global_step": 81543, "epoch": 1941} {"train_loss": -6.253368377685547, "global_step": 81544, "epoch": 1941} {"train_loss": -6.309165000915527, "global_step": 81545, "epoch": 1941} {"train_loss": -6.102343559265137, "global_step": 81546, "epoch": 1941} {"train_loss": -6.283904075622559, "global_step": 81547, "epoch": 1941} {"train_loss": -6.205568313598633, "global_step": 81548, "epoch": 1941} {"train_loss": -6.188482284545898, "global_step": 81549, "epoch": 1941} {"train_loss": -6.190948963165283, "global_step": 81550, "epoch": 1941} {"train_loss": -6.186301231384277, "global_step": 81551, "epoch": 1941} {"train_loss": -6.168094635009766, "global_step": 81552, "epoch": 1941} {"train_loss": -6.154770851135254, "global_step": 81553, "epoch": 1941} {"train_loss": -6.146757125854492, "global_step": 81554, "epoch": 1941} {"train_loss": -6.195313453674316, "global_step": 81555, "epoch": 1941} {"train_loss": -6.086130142211914, "global_step": 81556, "epoch": 1941} {"train_loss": -6.1178297996521, "global_step": 81557, "epoch": 1941} {"train_loss": -6.245510101318359, "global_step": 81558, "epoch": 1941} {"train_loss": -6.154196739196777, "global_step": 81559, "epoch": 1941} {"train_loss": -6.209336280822754, "global_step": 81560, "epoch": 1941} {"train_loss": -6.083747863769531, "global_step": 81561, "epoch": 1941} {"train_loss": -6.1112775802612305, "global_step": 81562, "epoch": 1941} {"train_loss": -6.16547551609221, "global_step": 81563, "epoch": 1941, "val_loss": 62536.5390625} {"train_loss": -6.176974296569824, "global_step": 81564, "epoch": 1942} {"train_loss": -6.153894424438477, "global_step": 81565, "epoch": 1942} {"train_loss": -6.109803199768066, "global_step": 81566, "epoch": 1942} {"train_loss": -6.09903621673584, "global_step": 81567, "epoch": 1942} {"train_loss": -6.132667541503906, "global_step": 81568, "epoch": 1942} {"train_loss": -6.106592178344727, "global_step": 81569, "epoch": 1942} {"train_loss": -6.179506778717041, "global_step": 81570, "epoch": 1942} {"train_loss": -6.181734085083008, "global_step": 81571, "epoch": 1942} {"train_loss": -6.194418907165527, "global_step": 81572, "epoch": 1942} {"train_loss": -6.106925964355469, "global_step": 81573, "epoch": 1942} {"train_loss": -6.304429054260254, "global_step": 81574, "epoch": 1942} {"train_loss": -6.156650543212891, "global_step": 81575, "epoch": 1942} {"train_loss": -6.1203083992004395, "global_step": 81576, "epoch": 1942} {"train_loss": -6.115360260009766, "global_step": 81577, "epoch": 1942} {"train_loss": -6.141493797302246, "global_step": 81578, "epoch": 1942} {"train_loss": -6.193911075592041, "global_step": 81579, "epoch": 1942} {"train_loss": -6.129303932189941, "global_step": 81580, "epoch": 1942} {"train_loss": -6.179320335388184, "global_step": 81581, "epoch": 1942} {"train_loss": -6.0793046951293945, "global_step": 81582, "epoch": 1942} {"train_loss": -6.15128755569458, "global_step": 81583, "epoch": 1942} {"train_loss": -6.1044158935546875, "global_step": 81584, "epoch": 1942} {"train_loss": -6.111400604248047, "global_step": 81585, "epoch": 1942} {"train_loss": -6.104069709777832, "global_step": 81586, "epoch": 1942} {"train_loss": -6.064292907714844, "global_step": 81587, "epoch": 1942} {"train_loss": -6.144017219543457, "global_step": 81588, "epoch": 1942} {"train_loss": -6.142390251159668, "global_step": 81589, "epoch": 1942} {"train_loss": -6.141757965087891, "global_step": 81590, "epoch": 1942} {"train_loss": -6.142910003662109, "global_step": 81591, "epoch": 1942} {"train_loss": -6.165306568145752, "global_step": 81592, "epoch": 1942} {"train_loss": -5.953644752502441, "global_step": 81593, "epoch": 1942} {"train_loss": -6.184110641479492, "global_step": 81594, "epoch": 1942} {"train_loss": -5.947575092315674, "global_step": 81595, "epoch": 1942} {"train_loss": -6.069929599761963, "global_step": 81596, "epoch": 1942} {"train_loss": -6.1317033767700195, "global_step": 81597, "epoch": 1942} {"train_loss": -6.000466346740723, "global_step": 81598, "epoch": 1942} {"train_loss": -6.19785737991333, "global_step": 81599, "epoch": 1942} {"train_loss": -6.14013147354126, "global_step": 81600, "epoch": 1942} {"train_loss": -6.102459907531738, "global_step": 81601, "epoch": 1942} {"train_loss": -6.233756065368652, "global_step": 81602, "epoch": 1942} {"train_loss": -6.2066168785095215, "global_step": 81603, "epoch": 1942} {"train_loss": -6.042684555053711, "global_step": 81604, "epoch": 1942} {"train_loss": -6.129210903531029, "global_step": 81605, "epoch": 1942, "val_loss": 62262.234375} {"train_loss": -6.132137298583984, "global_step": 81606, "epoch": 1943} {"train_loss": -6.164403915405273, "global_step": 81607, "epoch": 1943} {"train_loss": -6.103268146514893, "global_step": 81608, "epoch": 1943} {"train_loss": -6.270748615264893, "global_step": 81609, "epoch": 1943} {"train_loss": -6.186651706695557, "global_step": 81610, "epoch": 1943} {"train_loss": -6.33759069442749, "global_step": 81611, "epoch": 1943} {"train_loss": -6.254024505615234, "global_step": 81612, "epoch": 1943} {"train_loss": -6.2118940353393555, "global_step": 81613, "epoch": 1943} {"train_loss": -6.1925048828125, "global_step": 81614, "epoch": 1943} {"train_loss": -6.061680793762207, "global_step": 81615, "epoch": 1943} {"train_loss": -6.190985202789307, "global_step": 81616, "epoch": 1943} {"train_loss": -6.058506965637207, "global_step": 81617, "epoch": 1943} {"train_loss": -6.24152946472168, "global_step": 81618, "epoch": 1943} {"train_loss": -6.1218156814575195, "global_step": 81619, "epoch": 1943} {"train_loss": -6.202195167541504, "global_step": 81620, "epoch": 1943} {"train_loss": -6.002259254455566, "global_step": 81621, "epoch": 1943} {"train_loss": -6.113903045654297, "global_step": 81622, "epoch": 1943} {"train_loss": -6.117722511291504, "global_step": 81623, "epoch": 1943} {"train_loss": -6.1672444343566895, "global_step": 81624, "epoch": 1943} {"train_loss": -6.091885089874268, "global_step": 81625, "epoch": 1943} {"train_loss": -6.231420516967773, "global_step": 81626, "epoch": 1943} {"train_loss": -6.111078262329102, "global_step": 81627, "epoch": 1943} {"train_loss": -6.260624885559082, "global_step": 81628, "epoch": 1943} {"train_loss": -6.187010765075684, "global_step": 81629, "epoch": 1943} {"train_loss": -6.086726188659668, "global_step": 81630, "epoch": 1943} {"train_loss": -6.198590278625488, "global_step": 81631, "epoch": 1943} {"train_loss": -6.212957382202148, "global_step": 81632, "epoch": 1943} {"train_loss": -6.013873100280762, "global_step": 81633, "epoch": 1943} {"train_loss": -6.264708042144775, "global_step": 81634, "epoch": 1943} {"train_loss": -5.986622333526611, "global_step": 81635, "epoch": 1943} {"train_loss": -6.226004600524902, "global_step": 81636, "epoch": 1943} {"train_loss": -6.090249061584473, "global_step": 81637, "epoch": 1943} {"train_loss": -6.186883926391602, "global_step": 81638, "epoch": 1943} {"train_loss": -6.184379577636719, "global_step": 81639, "epoch": 1943} {"train_loss": -6.200201034545898, "global_step": 81640, "epoch": 1943} {"train_loss": -6.074457168579102, "global_step": 81641, "epoch": 1943} {"train_loss": -6.242203235626221, "global_step": 81642, "epoch": 1943} {"train_loss": -6.140618801116943, "global_step": 81643, "epoch": 1943} {"train_loss": -6.110685348510742, "global_step": 81644, "epoch": 1943} {"train_loss": -6.203451156616211, "global_step": 81645, "epoch": 1943} {"train_loss": -6.157454013824463, "global_step": 81646, "epoch": 1943} {"train_loss": -6.160989715939476, "global_step": 81647, "epoch": 1943, "val_loss": 62240.5703125} {"train_loss": -6.225468635559082, "global_step": 81648, "epoch": 1944} {"train_loss": -6.282882213592529, "global_step": 81649, "epoch": 1944} {"train_loss": -6.1324896812438965, "global_step": 81650, "epoch": 1944} {"train_loss": -6.109981536865234, "global_step": 81651, "epoch": 1944} {"train_loss": -6.126025199890137, "global_step": 81652, "epoch": 1944} {"train_loss": -6.206385612487793, "global_step": 81653, "epoch": 1944} {"train_loss": -6.187573432922363, "global_step": 81654, "epoch": 1944} {"train_loss": -6.12548303604126, "global_step": 81655, "epoch": 1944} {"train_loss": -6.127679824829102, "global_step": 81656, "epoch": 1944} {"train_loss": -6.243819713592529, "global_step": 81657, "epoch": 1944} {"train_loss": -6.149288654327393, "global_step": 81658, "epoch": 1944} {"train_loss": -6.2173662185668945, "global_step": 81659, "epoch": 1944} {"train_loss": -6.130475997924805, "global_step": 81660, "epoch": 1944} {"train_loss": -6.113255023956299, "global_step": 81661, "epoch": 1944} {"train_loss": -6.242311477661133, "global_step": 81662, "epoch": 1944} {"train_loss": -6.208559513092041, "global_step": 81663, "epoch": 1944} {"train_loss": -6.124273777008057, "global_step": 81664, "epoch": 1944} {"train_loss": -6.134016990661621, "global_step": 81665, "epoch": 1944} {"train_loss": -6.036930084228516, "global_step": 81666, "epoch": 1944} {"train_loss": -6.033485412597656, "global_step": 81667, "epoch": 1944} {"train_loss": -6.138659477233887, "global_step": 81668, "epoch": 1944} {"train_loss": -6.15723991394043, "global_step": 81669, "epoch": 1944} {"train_loss": -6.087558269500732, "global_step": 81670, "epoch": 1944} {"train_loss": -6.194755554199219, "global_step": 81671, "epoch": 1944} {"train_loss": -6.108614921569824, "global_step": 81672, "epoch": 1944} {"train_loss": -6.064055919647217, "global_step": 81673, "epoch": 1944} {"train_loss": -6.099879741668701, "global_step": 81674, "epoch": 1944} {"train_loss": -6.194085121154785, "global_step": 81675, "epoch": 1944} {"train_loss": -6.232206344604492, "global_step": 81676, "epoch": 1944} {"train_loss": -6.120741367340088, "global_step": 81677, "epoch": 1944} {"train_loss": -6.160840034484863, "global_step": 81678, "epoch": 1944} {"train_loss": -6.207172393798828, "global_step": 81679, "epoch": 1944} {"train_loss": -6.1153364181518555, "global_step": 81680, "epoch": 1944} {"train_loss": -6.144129276275635, "global_step": 81681, "epoch": 1944} {"train_loss": -6.182905197143555, "global_step": 81682, "epoch": 1944} {"train_loss": -6.125470161437988, "global_step": 81683, "epoch": 1944} {"train_loss": -6.172188758850098, "global_step": 81684, "epoch": 1944} {"train_loss": -6.199892997741699, "global_step": 81685, "epoch": 1944} {"train_loss": -6.293457984924316, "global_step": 81686, "epoch": 1944} {"train_loss": -6.1864776611328125, "global_step": 81687, "epoch": 1944} {"train_loss": -6.093172073364258, "global_step": 81688, "epoch": 1944} {"train_loss": -6.157281307947068, "global_step": 81689, "epoch": 1944, "val_loss": 62452.2421875} {"train_loss": -6.180438995361328, "global_step": 81690, "epoch": 1945} {"train_loss": -6.119821548461914, "global_step": 81691, "epoch": 1945} {"train_loss": -6.246855735778809, "global_step": 81692, "epoch": 1945} {"train_loss": -6.1080098152160645, "global_step": 81693, "epoch": 1945} {"train_loss": -6.1492414474487305, "global_step": 81694, "epoch": 1945} {"train_loss": -6.2209601402282715, "global_step": 81695, "epoch": 1945} {"train_loss": -6.077792167663574, "global_step": 81696, "epoch": 1945} {"train_loss": -6.138126373291016, "global_step": 81697, "epoch": 1945} {"train_loss": -6.0593581199646, "global_step": 81698, "epoch": 1945} {"train_loss": -6.16865348815918, "global_step": 81699, "epoch": 1945} {"train_loss": -6.1468353271484375, "global_step": 81700, "epoch": 1945} {"train_loss": -6.118157386779785, "global_step": 81701, "epoch": 1945} {"train_loss": -6.08055305480957, "global_step": 81702, "epoch": 1945} {"train_loss": -6.222933769226074, "global_step": 81703, "epoch": 1945} {"train_loss": -6.032336235046387, "global_step": 81704, "epoch": 1945} {"train_loss": -6.167611122131348, "global_step": 81705, "epoch": 1945} {"train_loss": -6.072973251342773, "global_step": 81706, "epoch": 1945} {"train_loss": -5.979973316192627, "global_step": 81707, "epoch": 1945} {"train_loss": -6.301565647125244, "global_step": 81708, "epoch": 1945} {"train_loss": -6.084772109985352, "global_step": 81709, "epoch": 1945} {"train_loss": -6.28065299987793, "global_step": 81710, "epoch": 1945} {"train_loss": -6.136704444885254, "global_step": 81711, "epoch": 1945} {"train_loss": -6.190584659576416, "global_step": 81712, "epoch": 1945} {"train_loss": -6.163260459899902, "global_step": 81713, "epoch": 1945} {"train_loss": -6.03778600692749, "global_step": 81714, "epoch": 1945} {"train_loss": -6.08375358581543, "global_step": 81715, "epoch": 1945} {"train_loss": -6.194435119628906, "global_step": 81716, "epoch": 1945} {"train_loss": -6.161080360412598, "global_step": 81717, "epoch": 1945} {"train_loss": -6.1417059898376465, "global_step": 81718, "epoch": 1945} {"train_loss": -6.022931098937988, "global_step": 81719, "epoch": 1945} {"train_loss": -6.003956317901611, "global_step": 81720, "epoch": 1945} {"train_loss": -6.184849739074707, "global_step": 81721, "epoch": 1945} {"train_loss": -6.103598117828369, "global_step": 81722, "epoch": 1945} {"train_loss": -6.182069301605225, "global_step": 81723, "epoch": 1945} {"train_loss": -6.105865478515625, "global_step": 81724, "epoch": 1945} {"train_loss": -6.2174577713012695, "global_step": 81725, "epoch": 1945} {"train_loss": -6.099856376647949, "global_step": 81726, "epoch": 1945} {"train_loss": -6.131941795349121, "global_step": 81727, "epoch": 1945} {"train_loss": -6.125635147094727, "global_step": 81728, "epoch": 1945} {"train_loss": -6.263506889343262, "global_step": 81729, "epoch": 1945} {"train_loss": -6.185647964477539, "global_step": 81730, "epoch": 1945} {"train_loss": -6.1404005118778775, "global_step": 81731, "epoch": 1945, "val_loss": 62383.33984375} {"train_loss": -6.131418228149414, "global_step": 81732, "epoch": 1946} {"train_loss": -6.0269694328308105, "global_step": 81733, "epoch": 1946} {"train_loss": -6.188394546508789, "global_step": 81734, "epoch": 1946} {"train_loss": -6.241089344024658, "global_step": 81735, "epoch": 1946} {"train_loss": -6.0353684425354, "global_step": 81736, "epoch": 1946} {"train_loss": -6.23468542098999, "global_step": 81737, "epoch": 1946} {"train_loss": -6.197903633117676, "global_step": 81738, "epoch": 1946} {"train_loss": -6.170357704162598, "global_step": 81739, "epoch": 1946} {"train_loss": -6.098832130432129, "global_step": 81740, "epoch": 1946} {"train_loss": -6.040933609008789, "global_step": 81741, "epoch": 1946} {"train_loss": -6.152132987976074, "global_step": 81742, "epoch": 1946} {"train_loss": -6.265161991119385, "global_step": 81743, "epoch": 1946} {"train_loss": -6.153888702392578, "global_step": 81744, "epoch": 1946} {"train_loss": -6.3542680740356445, "global_step": 81745, "epoch": 1946} {"train_loss": -6.14984130859375, "global_step": 81746, "epoch": 1946} {"train_loss": -6.195298671722412, "global_step": 81747, "epoch": 1946} {"train_loss": -6.214351654052734, "global_step": 81748, "epoch": 1946} {"train_loss": -6.057559967041016, "global_step": 81749, "epoch": 1946} {"train_loss": -6.213265895843506, "global_step": 81750, "epoch": 1946} {"train_loss": -6.130027770996094, "global_step": 81751, "epoch": 1946} {"train_loss": -6.14996337890625, "global_step": 81752, "epoch": 1946} {"train_loss": -6.12168550491333, "global_step": 81753, "epoch": 1946} {"train_loss": -6.126481056213379, "global_step": 81754, "epoch": 1946} {"train_loss": -6.141383171081543, "global_step": 81755, "epoch": 1946} {"train_loss": -6.123434066772461, "global_step": 81756, "epoch": 1946} {"train_loss": -6.129865646362305, "global_step": 81757, "epoch": 1946} {"train_loss": -6.20612907409668, "global_step": 81758, "epoch": 1946} {"train_loss": -6.2241363525390625, "global_step": 81759, "epoch": 1946} {"train_loss": -6.219409942626953, "global_step": 81760, "epoch": 1946} {"train_loss": -6.273632049560547, "global_step": 81761, "epoch": 1946} {"train_loss": -6.231051921844482, "global_step": 81762, "epoch": 1946} {"train_loss": -6.135354995727539, "global_step": 81763, "epoch": 1946} {"train_loss": -6.168592929840088, "global_step": 81764, "epoch": 1946} {"train_loss": -6.222724914550781, "global_step": 81765, "epoch": 1946} {"train_loss": -6.206114292144775, "global_step": 81766, "epoch": 1946} {"train_loss": -6.182365417480469, "global_step": 81767, "epoch": 1946} {"train_loss": -6.098444938659668, "global_step": 81768, "epoch": 1946} {"train_loss": -6.091196060180664, "global_step": 81769, "epoch": 1946} {"train_loss": -6.171128749847412, "global_step": 81770, "epoch": 1946} {"train_loss": -6.173762321472168, "global_step": 81771, "epoch": 1946} {"train_loss": -6.130232810974121, "global_step": 81772, "epoch": 1946} {"train_loss": -6.163782993952434, "global_step": 81773, "epoch": 1946, "val_loss": 62528.92578125} {"train_loss": -6.258760452270508, "global_step": 81774, "epoch": 1947} {"train_loss": -6.247838020324707, "global_step": 81775, "epoch": 1947} {"train_loss": -6.071394920349121, "global_step": 81776, "epoch": 1947} {"train_loss": -6.1331377029418945, "global_step": 81777, "epoch": 1947} {"train_loss": -6.0758585929870605, "global_step": 81778, "epoch": 1947} {"train_loss": -6.1916608810424805, "global_step": 81779, "epoch": 1947} {"train_loss": -6.258220672607422, "global_step": 81780, "epoch": 1947} {"train_loss": -6.146435737609863, "global_step": 81781, "epoch": 1947} {"train_loss": -6.102142333984375, "global_step": 81782, "epoch": 1947} {"train_loss": -6.082867622375488, "global_step": 81783, "epoch": 1947} {"train_loss": -6.226747512817383, "global_step": 81784, "epoch": 1947} {"train_loss": -6.175887584686279, "global_step": 81785, "epoch": 1947} {"train_loss": -6.106480598449707, "global_step": 81786, "epoch": 1947} {"train_loss": -6.205713748931885, "global_step": 81787, "epoch": 1947} {"train_loss": -6.155411243438721, "global_step": 81788, "epoch": 1947} {"train_loss": -6.223674774169922, "global_step": 81789, "epoch": 1947} {"train_loss": -6.193661212921143, "global_step": 81790, "epoch": 1947} {"train_loss": -5.883378028869629, "global_step": 81791, "epoch": 1947} {"train_loss": -6.137406349182129, "global_step": 81792, "epoch": 1947} {"train_loss": -6.085562705993652, "global_step": 81793, "epoch": 1947} {"train_loss": -6.123317241668701, "global_step": 81794, "epoch": 1947} {"train_loss": -6.2942118644714355, "global_step": 81795, "epoch": 1947} {"train_loss": -6.213427543640137, "global_step": 81796, "epoch": 1947} {"train_loss": -6.1350555419921875, "global_step": 81797, "epoch": 1947} {"train_loss": -6.110172271728516, "global_step": 81798, "epoch": 1947} {"train_loss": -6.1583404541015625, "global_step": 81799, "epoch": 1947} {"train_loss": -6.03902530670166, "global_step": 81800, "epoch": 1947} {"train_loss": -6.143181324005127, "global_step": 81801, "epoch": 1947} {"train_loss": -6.074802875518799, "global_step": 81802, "epoch": 1947} {"train_loss": -6.163207530975342, "global_step": 81803, "epoch": 1947} {"train_loss": -6.13184118270874, "global_step": 81804, "epoch": 1947} {"train_loss": -6.245985984802246, "global_step": 81805, "epoch": 1947} {"train_loss": -6.082521915435791, "global_step": 81806, "epoch": 1947} {"train_loss": -6.156531810760498, "global_step": 81807, "epoch": 1947} {"train_loss": -6.195528030395508, "global_step": 81808, "epoch": 1947} {"train_loss": -6.049596309661865, "global_step": 81809, "epoch": 1947} {"train_loss": -6.171991348266602, "global_step": 81810, "epoch": 1947} {"train_loss": -6.115828514099121, "global_step": 81811, "epoch": 1947} {"train_loss": -6.0901103019714355, "global_step": 81812, "epoch": 1947} {"train_loss": -6.161542892456055, "global_step": 81813, "epoch": 1947} {"train_loss": -6.2495927810668945, "global_step": 81814, "epoch": 1947} {"train_loss": -6.147141172772362, "global_step": 81815, "epoch": 1947, "val_loss": 62665.54296875} {"train_loss": -6.092379093170166, "global_step": 81816, "epoch": 1948} {"train_loss": -6.223133087158203, "global_step": 81817, "epoch": 1948} {"train_loss": -6.2125654220581055, "global_step": 81818, "epoch": 1948} {"train_loss": -6.114189147949219, "global_step": 81819, "epoch": 1948} {"train_loss": -6.199087619781494, "global_step": 81820, "epoch": 1948} {"train_loss": -6.240571975708008, "global_step": 81821, "epoch": 1948} {"train_loss": -6.160380840301514, "global_step": 81822, "epoch": 1948} {"train_loss": -6.155813217163086, "global_step": 81823, "epoch": 1948} {"train_loss": -6.064831256866455, "global_step": 81824, "epoch": 1948} {"train_loss": -6.25473165512085, "global_step": 81825, "epoch": 1948} {"train_loss": -5.99638557434082, "global_step": 81826, "epoch": 1948} {"train_loss": -6.1542158126831055, "global_step": 81827, "epoch": 1948} {"train_loss": -6.110751152038574, "global_step": 81828, "epoch": 1948} {"train_loss": -6.201868057250977, "global_step": 81829, "epoch": 1948} {"train_loss": -6.232544898986816, "global_step": 81830, "epoch": 1948} {"train_loss": -6.087932586669922, "global_step": 81831, "epoch": 1948} {"train_loss": -6.220461368560791, "global_step": 81832, "epoch": 1948} {"train_loss": -6.174553394317627, "global_step": 81833, "epoch": 1948} {"train_loss": -6.268777847290039, "global_step": 81834, "epoch": 1948} {"train_loss": -6.09726619720459, "global_step": 81835, "epoch": 1948} {"train_loss": -6.175527095794678, "global_step": 81836, "epoch": 1948} {"train_loss": -6.140764236450195, "global_step": 81837, "epoch": 1948} {"train_loss": -6.154942512512207, "global_step": 81838, "epoch": 1948} {"train_loss": -6.202297687530518, "global_step": 81839, "epoch": 1948} {"train_loss": -6.194089889526367, "global_step": 81840, "epoch": 1948} {"train_loss": -6.213942527770996, "global_step": 81841, "epoch": 1948} {"train_loss": -6.294253826141357, "global_step": 81842, "epoch": 1948} {"train_loss": -6.15173864364624, "global_step": 81843, "epoch": 1948} {"train_loss": -6.350398540496826, "global_step": 81844, "epoch": 1948} {"train_loss": -6.246950149536133, "global_step": 81845, "epoch": 1948} {"train_loss": -6.132720470428467, "global_step": 81846, "epoch": 1948} {"train_loss": -6.210675239562988, "global_step": 81847, "epoch": 1948} {"train_loss": -6.148737907409668, "global_step": 81848, "epoch": 1948} {"train_loss": -6.027064323425293, "global_step": 81849, "epoch": 1948} {"train_loss": -6.141342639923096, "global_step": 81850, "epoch": 1948} {"train_loss": -6.0029497146606445, "global_step": 81851, "epoch": 1948} {"train_loss": -6.103371620178223, "global_step": 81852, "epoch": 1948} {"train_loss": -6.014614105224609, "global_step": 81853, "epoch": 1948} {"train_loss": -6.031706809997559, "global_step": 81854, "epoch": 1948} {"train_loss": -6.125566005706787, "global_step": 81855, "epoch": 1948} {"train_loss": -6.211614608764648, "global_step": 81856, "epoch": 1948} {"train_loss": -6.159894227981567, "global_step": 81857, "epoch": 1948, "val_loss": 62586.3359375} {"train_loss": -6.236758232116699, "global_step": 81858, "epoch": 1949} {"train_loss": -6.090023040771484, "global_step": 81859, "epoch": 1949} {"train_loss": -6.082925796508789, "global_step": 81860, "epoch": 1949} {"train_loss": -6.107734680175781, "global_step": 81861, "epoch": 1949} {"train_loss": -6.207579612731934, "global_step": 81862, "epoch": 1949} {"train_loss": -6.177533149719238, "global_step": 81863, "epoch": 1949} {"train_loss": -6.196984767913818, "global_step": 81864, "epoch": 1949} {"train_loss": -6.180203914642334, "global_step": 81865, "epoch": 1949} {"train_loss": -6.2221879959106445, "global_step": 81866, "epoch": 1949} {"train_loss": -6.2103962898254395, "global_step": 81867, "epoch": 1949} {"train_loss": -6.126958847045898, "global_step": 81868, "epoch": 1949} {"train_loss": -6.159511566162109, "global_step": 81869, "epoch": 1949} {"train_loss": -6.051052093505859, "global_step": 81870, "epoch": 1949} {"train_loss": -6.057765007019043, "global_step": 81871, "epoch": 1949} {"train_loss": -6.196068286895752, "global_step": 81872, "epoch": 1949} {"train_loss": -6.151020050048828, "global_step": 81873, "epoch": 1949} {"train_loss": -6.189491271972656, "global_step": 81874, "epoch": 1949} {"train_loss": -6.133089542388916, "global_step": 81875, "epoch": 1949} {"train_loss": -6.0720062255859375, "global_step": 81876, "epoch": 1949} {"train_loss": -6.247421741485596, "global_step": 81877, "epoch": 1949} {"train_loss": -6.1523237228393555, "global_step": 81878, "epoch": 1949} {"train_loss": -6.220076084136963, "global_step": 81879, "epoch": 1949} {"train_loss": -6.1272478103637695, "global_step": 81880, "epoch": 1949} {"train_loss": -6.048581600189209, "global_step": 81881, "epoch": 1949} {"train_loss": -6.27104377746582, "global_step": 81882, "epoch": 1949} {"train_loss": -6.0461297035217285, "global_step": 81883, "epoch": 1949} {"train_loss": -6.119095325469971, "global_step": 81884, "epoch": 1949} {"train_loss": -6.185507774353027, "global_step": 81885, "epoch": 1949} {"train_loss": -6.152250289916992, "global_step": 81886, "epoch": 1949} {"train_loss": -6.119551658630371, "global_step": 81887, "epoch": 1949} {"train_loss": -6.15549373626709, "global_step": 81888, "epoch": 1949} {"train_loss": -6.2008137702941895, "global_step": 81889, "epoch": 1949} {"train_loss": -6.020719528198242, "global_step": 81890, "epoch": 1949} {"train_loss": -6.232621192932129, "global_step": 81891, "epoch": 1949} {"train_loss": -6.254697799682617, "global_step": 81892, "epoch": 1949} {"train_loss": -6.186999320983887, "global_step": 81893, "epoch": 1949} {"train_loss": -6.1630120277404785, "global_step": 81894, "epoch": 1949} {"train_loss": -6.129614353179932, "global_step": 81895, "epoch": 1949} {"train_loss": -6.040021896362305, "global_step": 81896, "epoch": 1949} {"train_loss": -6.161049842834473, "global_step": 81897, "epoch": 1949} {"train_loss": -6.068255424499512, "global_step": 81898, "epoch": 1949} {"train_loss": -6.152119295937674, "global_step": 81899, "epoch": 1949, "val_loss": 62406.703125} {"train_loss": -6.12911319732666, "global_step": 81900, "epoch": 1950} {"train_loss": -5.9498291015625, "global_step": 81901, "epoch": 1950} {"train_loss": -6.117342472076416, "global_step": 81902, "epoch": 1950} {"train_loss": -6.12375545501709, "global_step": 81903, "epoch": 1950} {"train_loss": -6.170860767364502, "global_step": 81904, "epoch": 1950} {"train_loss": -6.102363586425781, "global_step": 81905, "epoch": 1950} {"train_loss": -6.179036617279053, "global_step": 81906, "epoch": 1950} {"train_loss": -6.073417663574219, "global_step": 81907, "epoch": 1950} {"train_loss": -6.227738380432129, "global_step": 81908, "epoch": 1950} {"train_loss": -6.051333904266357, "global_step": 81909, "epoch": 1950} {"train_loss": -6.079533100128174, "global_step": 81910, "epoch": 1950} {"train_loss": -6.136685371398926, "global_step": 81911, "epoch": 1950} {"train_loss": -6.191923141479492, "global_step": 81912, "epoch": 1950} {"train_loss": -6.173670768737793, "global_step": 81913, "epoch": 1950} {"train_loss": -6.231620788574219, "global_step": 81914, "epoch": 1950} {"train_loss": -6.050956726074219, "global_step": 81915, "epoch": 1950} {"train_loss": -6.132063865661621, "global_step": 81916, "epoch": 1950} {"train_loss": -6.069452285766602, "global_step": 81917, "epoch": 1950} {"train_loss": -6.274328708648682, "global_step": 81918, "epoch": 1950} {"train_loss": -6.280634880065918, "global_step": 81919, "epoch": 1950} {"train_loss": -6.152413368225098, "global_step": 81920, "epoch": 1950} {"train_loss": -6.178586006164551, "global_step": 81921, "epoch": 1950} {"train_loss": -6.210883140563965, "global_step": 81922, "epoch": 1950} {"train_loss": -6.237622261047363, "global_step": 81923, "epoch": 1950} {"train_loss": -6.1878981590271, "global_step": 81924, "epoch": 1950} {"train_loss": -6.061206817626953, "global_step": 81925, "epoch": 1950} {"train_loss": -6.20552921295166, "global_step": 81926, "epoch": 1950} {"train_loss": -6.089321136474609, "global_step": 81927, "epoch": 1950} {"train_loss": -6.086824893951416, "global_step": 81928, "epoch": 1950} {"train_loss": -6.209726333618164, "global_step": 81929, "epoch": 1950} {"train_loss": -6.073535442352295, "global_step": 81930, "epoch": 1950} {"train_loss": -6.290417671203613, "global_step": 81931, "epoch": 1950} {"train_loss": -6.239375114440918, "global_step": 81932, "epoch": 1950} {"train_loss": -6.098239421844482, "global_step": 81933, "epoch": 1950} {"train_loss": -6.205502510070801, "global_step": 81934, "epoch": 1950} {"train_loss": -6.226511001586914, "global_step": 81935, "epoch": 1950} {"train_loss": -6.192919731140137, "global_step": 81936, "epoch": 1950} {"train_loss": -6.148965835571289, "global_step": 81937, "epoch": 1950} {"train_loss": -6.260648250579834, "global_step": 81938, "epoch": 1950} {"train_loss": -6.232025146484375, "global_step": 81939, "epoch": 1950} {"train_loss": -6.12186336517334, "global_step": 81940, "epoch": 1950} {"train_loss": -6.157310349600656, "global_step": 81941, "epoch": 1950, "train/sim_max_reward_0": 0.37038637003307323, "train/sim_max_reward_1": 0.8338045662598779, "train/sim_max_reward_2": 0.1821453183840025, "train/sim_max_reward_3": 0.8313597581545246, "train/sim_max_reward_4": 0.850414327321744, "train/sim_max_reward_5": 0.3675389932556964, "test/sim_max_reward_4300000": 0.6771516564037645, "test/sim_max_reward_4300001": 0.4078773114463445, "test/sim_max_reward_4300002": 0.8528859569900699, "test/sim_max_reward_4300003": 0.6993095110157749, "test/sim_max_reward_4300004": 0.3551799958636364, "test/sim_max_reward_4300005": 0.995164668983194, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.5805836214787101, "test/sim_max_reward_4300008": 0.46889623479563797, "test/sim_max_reward_4300009": 0.8321911375051301, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.3979449839312887, "test/sim_max_reward_4300012": 0.8323075998168157, "test/sim_max_reward_4300013": 0.7124151934131217, "test/sim_max_reward_4300014": 0.8362384564576164, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.9032452419806092, "test/sim_max_reward_4300017": 0.9218300557812045, "test/sim_max_reward_4300018": 0.41202575032111566, "test/sim_max_reward_4300019": 0.18617245701319426, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.34949179205494985, "test/sim_max_reward_4300022": 0.9951619066693972, "test/sim_max_reward_4300023": 0.3395640680069691, "test/sim_max_reward_4300024": 0.14025808793549774, "test/sim_max_reward_4300025": 0.9505962353753998, "test/sim_max_reward_4300026": 0.050878423390650566, "test/sim_max_reward_4300027": 0.9293505665866576, "test/sim_max_reward_4300028": 0.0007426128997104187, "test/sim_max_reward_4300029": 0.013189627525790506, "test/sim_max_reward_4300030": 0.8779258067436618, "test/sim_max_reward_4300031": 0.9466644918696345, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.45634397310440594, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.3942713802076951, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9775730856747117, "test/sim_max_reward_4300038": 0.8266135097164358, "test/sim_max_reward_4300039": 0.43738117340736393, "test/sim_max_reward_4300040": 0.9259138784513624, "test/sim_max_reward_4300041": 0.5506631876772407, "test/sim_max_reward_4300042": 0.599009638721593, "test/sim_max_reward_4300043": 0.6158156516728539, "test/sim_max_reward_4300044": 0.942520890357802, "test/sim_max_reward_4300045": 0.18717567883950575, "test/sim_max_reward_4300046": 0.9294103202817489, "test/sim_max_reward_4300047": 0.3446890652120165, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.20890006901785874, "train/mean_score": 0.5726082222348198, "test/mean_score": 0.5452143814032324, "val_loss": 62513.02734375} {"train_loss": -6.033679008483887, "global_step": 81942, "epoch": 1951} {"train_loss": -6.278698921203613, "global_step": 81943, "epoch": 1951} {"train_loss": -6.136921405792236, "global_step": 81944, "epoch": 1951} {"train_loss": -6.081583023071289, "global_step": 81945, "epoch": 1951} {"train_loss": -6.137650012969971, "global_step": 81946, "epoch": 1951} {"train_loss": -6.266329288482666, "global_step": 81947, "epoch": 1951} {"train_loss": -6.1402764320373535, "global_step": 81948, "epoch": 1951} {"train_loss": -6.236754417419434, "global_step": 81949, "epoch": 1951} {"train_loss": -6.233057975769043, "global_step": 81950, "epoch": 1951} {"train_loss": -6.222454071044922, "global_step": 81951, "epoch": 1951} {"train_loss": -6.227118015289307, "global_step": 81952, "epoch": 1951} {"train_loss": -6.184666633605957, "global_step": 81953, "epoch": 1951} {"train_loss": -6.156792640686035, "global_step": 81954, "epoch": 1951} {"train_loss": -6.176013946533203, "global_step": 81955, "epoch": 1951} {"train_loss": -6.167250633239746, "global_step": 81956, "epoch": 1951} {"train_loss": -6.165252685546875, "global_step": 81957, "epoch": 1951} {"train_loss": -6.112079620361328, "global_step": 81958, "epoch": 1951} {"train_loss": -6.144428253173828, "global_step": 81959, "epoch": 1951} {"train_loss": -6.116151809692383, "global_step": 81960, "epoch": 1951} {"train_loss": -6.232007026672363, "global_step": 81961, "epoch": 1951} {"train_loss": -6.125582218170166, "global_step": 81962, "epoch": 1951} {"train_loss": -6.14537239074707, "global_step": 81963, "epoch": 1951} {"train_loss": -6.233861446380615, "global_step": 81964, "epoch": 1951} {"train_loss": -6.19523811340332, "global_step": 81965, "epoch": 1951} {"train_loss": -6.111325263977051, "global_step": 81966, "epoch": 1951} {"train_loss": -6.208271503448486, "global_step": 81967, "epoch": 1951} {"train_loss": -6.163404941558838, "global_step": 81968, "epoch": 1951} {"train_loss": -6.22636604309082, "global_step": 81969, "epoch": 1951} {"train_loss": -6.188724517822266, "global_step": 81970, "epoch": 1951} {"train_loss": -6.249141216278076, "global_step": 81971, "epoch": 1951} {"train_loss": -6.176882266998291, "global_step": 81972, "epoch": 1951} {"train_loss": -6.173595428466797, "global_step": 81973, "epoch": 1951} {"train_loss": -6.246759414672852, "global_step": 81974, "epoch": 1951} {"train_loss": -6.216597557067871, "global_step": 81975, "epoch": 1951} {"train_loss": -6.199061870574951, "global_step": 81976, "epoch": 1951} {"train_loss": -6.194573402404785, "global_step": 81977, "epoch": 1951} {"train_loss": -6.186791896820068, "global_step": 81978, "epoch": 1951} {"train_loss": -6.140622138977051, "global_step": 81979, "epoch": 1951} {"train_loss": -6.318916320800781, "global_step": 81980, "epoch": 1951} {"train_loss": -6.12890100479126, "global_step": 81981, "epoch": 1951} {"train_loss": -6.165318012237549, "global_step": 81982, "epoch": 1951} {"train_loss": -6.17773943855649, "global_step": 81983, "epoch": 1951, "val_loss": 62358.34765625} {"train_loss": -6.109852313995361, "global_step": 81984, "epoch": 1952} {"train_loss": -6.045516014099121, "global_step": 81985, "epoch": 1952} {"train_loss": -6.102787971496582, "global_step": 81986, "epoch": 1952} {"train_loss": -6.257053375244141, "global_step": 81987, "epoch": 1952} {"train_loss": -6.1582207679748535, "global_step": 81988, "epoch": 1952} {"train_loss": -6.215387344360352, "global_step": 81989, "epoch": 1952} {"train_loss": -6.202607154846191, "global_step": 81990, "epoch": 1952} {"train_loss": -6.221018314361572, "global_step": 81991, "epoch": 1952} {"train_loss": -6.126784801483154, "global_step": 81992, "epoch": 1952} {"train_loss": -6.247898101806641, "global_step": 81993, "epoch": 1952} {"train_loss": -6.11575174331665, "global_step": 81994, "epoch": 1952} {"train_loss": -6.3025360107421875, "global_step": 81995, "epoch": 1952} {"train_loss": -6.20463228225708, "global_step": 81996, "epoch": 1952} {"train_loss": -6.238924026489258, "global_step": 81997, "epoch": 1952} {"train_loss": -6.089067459106445, "global_step": 81998, "epoch": 1952} {"train_loss": -6.166367530822754, "global_step": 81999, "epoch": 1952} {"train_loss": -6.141112327575684, "global_step": 82000, "epoch": 1952} {"train_loss": -6.154565811157227, "global_step": 82001, "epoch": 1952} {"train_loss": -6.156397819519043, "global_step": 82002, "epoch": 1952} {"train_loss": -6.163679122924805, "global_step": 82003, "epoch": 1952} {"train_loss": -6.219362258911133, "global_step": 82004, "epoch": 1952} {"train_loss": -6.156420707702637, "global_step": 82005, "epoch": 1952} {"train_loss": -6.1798858642578125, "global_step": 82006, "epoch": 1952} {"train_loss": -6.104891777038574, "global_step": 82007, "epoch": 1952} {"train_loss": -6.246710300445557, "global_step": 82008, "epoch": 1952} {"train_loss": -6.209371566772461, "global_step": 82009, "epoch": 1952} {"train_loss": -6.180322170257568, "global_step": 82010, "epoch": 1952} {"train_loss": -6.118586540222168, "global_step": 82011, "epoch": 1952} {"train_loss": -6.088894367218018, "global_step": 82012, "epoch": 1952} {"train_loss": -6.209681034088135, "global_step": 82013, "epoch": 1952} {"train_loss": -6.225177764892578, "global_step": 82014, "epoch": 1952} {"train_loss": -6.041381359100342, "global_step": 82015, "epoch": 1952} {"train_loss": -6.2927446365356445, "global_step": 82016, "epoch": 1952} {"train_loss": -6.189447402954102, "global_step": 82017, "epoch": 1952} {"train_loss": -6.0853729248046875, "global_step": 82018, "epoch": 1952} {"train_loss": -6.227224826812744, "global_step": 82019, "epoch": 1952} {"train_loss": -6.193245887756348, "global_step": 82020, "epoch": 1952} {"train_loss": -6.1857805252075195, "global_step": 82021, "epoch": 1952} {"train_loss": -6.251087188720703, "global_step": 82022, "epoch": 1952} {"train_loss": -6.110028266906738, "global_step": 82023, "epoch": 1952} {"train_loss": -6.061832427978516, "global_step": 82024, "epoch": 1952} {"train_loss": -6.169533956618536, "global_step": 82025, "epoch": 1952, "val_loss": 62363.7890625} {"train_loss": -6.210470199584961, "global_step": 82026, "epoch": 1953} {"train_loss": -6.101893424987793, "global_step": 82027, "epoch": 1953} {"train_loss": -6.244060516357422, "global_step": 82028, "epoch": 1953} {"train_loss": -6.1391096115112305, "global_step": 82029, "epoch": 1953} {"train_loss": -6.208998680114746, "global_step": 82030, "epoch": 1953} {"train_loss": -6.280971527099609, "global_step": 82031, "epoch": 1953} {"train_loss": -6.165007591247559, "global_step": 82032, "epoch": 1953} {"train_loss": -6.28975248336792, "global_step": 82033, "epoch": 1953} {"train_loss": -6.1061601638793945, "global_step": 82034, "epoch": 1953} {"train_loss": -6.166774272918701, "global_step": 82035, "epoch": 1953} {"train_loss": -6.04030704498291, "global_step": 82036, "epoch": 1953} {"train_loss": -6.191554069519043, "global_step": 82037, "epoch": 1953} {"train_loss": -6.177276611328125, "global_step": 82038, "epoch": 1953} {"train_loss": -6.148789405822754, "global_step": 82039, "epoch": 1953} {"train_loss": -6.172916412353516, "global_step": 82040, "epoch": 1953} {"train_loss": -6.159095287322998, "global_step": 82041, "epoch": 1953} {"train_loss": -6.162734031677246, "global_step": 82042, "epoch": 1953} {"train_loss": -6.280591011047363, "global_step": 82043, "epoch": 1953} {"train_loss": -6.171234130859375, "global_step": 82044, "epoch": 1953} {"train_loss": -6.177236557006836, "global_step": 82045, "epoch": 1953} {"train_loss": -6.094638347625732, "global_step": 82046, "epoch": 1953} {"train_loss": -6.225934982299805, "global_step": 82047, "epoch": 1953} {"train_loss": -6.313591957092285, "global_step": 82048, "epoch": 1953} {"train_loss": -6.209834575653076, "global_step": 82049, "epoch": 1953} {"train_loss": -6.121132850646973, "global_step": 82050, "epoch": 1953} {"train_loss": -6.210034370422363, "global_step": 82051, "epoch": 1953} {"train_loss": -6.112394332885742, "global_step": 82052, "epoch": 1953} {"train_loss": -6.181819438934326, "global_step": 82053, "epoch": 1953} {"train_loss": -6.269791126251221, "global_step": 82054, "epoch": 1953} {"train_loss": -6.142300128936768, "global_step": 82055, "epoch": 1953} {"train_loss": -6.2355241775512695, "global_step": 82056, "epoch": 1953} {"train_loss": -6.052033424377441, "global_step": 82057, "epoch": 1953} {"train_loss": -6.164412498474121, "global_step": 82058, "epoch": 1953} {"train_loss": -6.250916481018066, "global_step": 82059, "epoch": 1953} {"train_loss": -6.045184135437012, "global_step": 82060, "epoch": 1953} {"train_loss": -6.187713146209717, "global_step": 82061, "epoch": 1953} {"train_loss": -6.176473617553711, "global_step": 82062, "epoch": 1953} {"train_loss": -6.286218643188477, "global_step": 82063, "epoch": 1953} {"train_loss": -6.202958106994629, "global_step": 82064, "epoch": 1953} {"train_loss": -6.293460845947266, "global_step": 82065, "epoch": 1953} {"train_loss": -6.326414108276367, "global_step": 82066, "epoch": 1953} {"train_loss": -6.189655621846517, "global_step": 82067, "epoch": 1953, "val_loss": 62602.42578125} {"train_loss": -6.189280986785889, "global_step": 82068, "epoch": 1954} {"train_loss": -6.2459259033203125, "global_step": 82069, "epoch": 1954} {"train_loss": -6.290072441101074, "global_step": 82070, "epoch": 1954} {"train_loss": -6.08991813659668, "global_step": 82071, "epoch": 1954} {"train_loss": -6.2230377197265625, "global_step": 82072, "epoch": 1954} {"train_loss": -6.2458176612854, "global_step": 82073, "epoch": 1954} {"train_loss": -6.053283214569092, "global_step": 82074, "epoch": 1954} {"train_loss": -6.247132301330566, "global_step": 82075, "epoch": 1954} {"train_loss": -6.049234867095947, "global_step": 82076, "epoch": 1954} {"train_loss": -6.050555229187012, "global_step": 82077, "epoch": 1954} {"train_loss": -6.335330009460449, "global_step": 82078, "epoch": 1954} {"train_loss": -6.122143745422363, "global_step": 82079, "epoch": 1954} {"train_loss": -6.142683506011963, "global_step": 82080, "epoch": 1954} {"train_loss": -6.182032585144043, "global_step": 82081, "epoch": 1954} {"train_loss": -6.139847755432129, "global_step": 82082, "epoch": 1954} {"train_loss": -6.258879661560059, "global_step": 82083, "epoch": 1954} {"train_loss": -6.237447738647461, "global_step": 82084, "epoch": 1954} {"train_loss": -6.255682945251465, "global_step": 82085, "epoch": 1954} {"train_loss": -6.183507919311523, "global_step": 82086, "epoch": 1954} {"train_loss": -6.186817169189453, "global_step": 82087, "epoch": 1954} {"train_loss": -6.189587593078613, "global_step": 82088, "epoch": 1954} {"train_loss": -6.199706077575684, "global_step": 82089, "epoch": 1954} {"train_loss": -6.1116862297058105, "global_step": 82090, "epoch": 1954} {"train_loss": -6.283037185668945, "global_step": 82091, "epoch": 1954} {"train_loss": -6.126794815063477, "global_step": 82092, "epoch": 1954} {"train_loss": -6.26458215713501, "global_step": 82093, "epoch": 1954} {"train_loss": -6.145650863647461, "global_step": 82094, "epoch": 1954} {"train_loss": -6.169094085693359, "global_step": 82095, "epoch": 1954} {"train_loss": -6.118304252624512, "global_step": 82096, "epoch": 1954} {"train_loss": -6.175018310546875, "global_step": 82097, "epoch": 1954} {"train_loss": -6.13709831237793, "global_step": 82098, "epoch": 1954} {"train_loss": -6.06511116027832, "global_step": 82099, "epoch": 1954} {"train_loss": -6.071206569671631, "global_step": 82100, "epoch": 1954} {"train_loss": -6.0760650634765625, "global_step": 82101, "epoch": 1954} {"train_loss": -6.1757965087890625, "global_step": 82102, "epoch": 1954} {"train_loss": -6.23054313659668, "global_step": 82103, "epoch": 1954} {"train_loss": -6.126458168029785, "global_step": 82104, "epoch": 1954} {"train_loss": -6.073795318603516, "global_step": 82105, "epoch": 1954} {"train_loss": -6.194576740264893, "global_step": 82106, "epoch": 1954} {"train_loss": -6.136539459228516, "global_step": 82107, "epoch": 1954} {"train_loss": -6.18556547164917, "global_step": 82108, "epoch": 1954} {"train_loss": -6.1695975462595625, "global_step": 82109, "epoch": 1954, "val_loss": 62559.1953125} {"train_loss": -6.178178787231445, "global_step": 82110, "epoch": 1955} {"train_loss": -6.202126502990723, "global_step": 82111, "epoch": 1955} {"train_loss": -6.2129597663879395, "global_step": 82112, "epoch": 1955} {"train_loss": -6.1585307121276855, "global_step": 82113, "epoch": 1955} {"train_loss": -6.138741493225098, "global_step": 82114, "epoch": 1955} {"train_loss": -6.057492256164551, "global_step": 82115, "epoch": 1955} {"train_loss": -6.189228057861328, "global_step": 82116, "epoch": 1955} {"train_loss": -6.291661739349365, "global_step": 82117, "epoch": 1955} {"train_loss": -6.302169322967529, "global_step": 82118, "epoch": 1955} {"train_loss": -6.122000694274902, "global_step": 82119, "epoch": 1955} {"train_loss": -6.2206525802612305, "global_step": 82120, "epoch": 1955} {"train_loss": -6.2480340003967285, "global_step": 82121, "epoch": 1955} {"train_loss": -6.1735053062438965, "global_step": 82122, "epoch": 1955} {"train_loss": -6.2148942947387695, "global_step": 82123, "epoch": 1955} {"train_loss": -6.130290985107422, "global_step": 82124, "epoch": 1955} {"train_loss": -6.096404075622559, "global_step": 82125, "epoch": 1955} {"train_loss": -6.223614692687988, "global_step": 82126, "epoch": 1955} {"train_loss": -6.152114391326904, "global_step": 82127, "epoch": 1955} {"train_loss": -6.197152137756348, "global_step": 82128, "epoch": 1955} {"train_loss": -6.23359489440918, "global_step": 82129, "epoch": 1955} {"train_loss": -6.160616874694824, "global_step": 82130, "epoch": 1955} {"train_loss": -6.239063262939453, "global_step": 82131, "epoch": 1955} {"train_loss": -6.144634246826172, "global_step": 82132, "epoch": 1955} {"train_loss": -6.131054878234863, "global_step": 82133, "epoch": 1955} {"train_loss": -6.193521022796631, "global_step": 82134, "epoch": 1955} {"train_loss": -6.257599830627441, "global_step": 82135, "epoch": 1955} {"train_loss": -6.187186241149902, "global_step": 82136, "epoch": 1955} {"train_loss": -6.230258464813232, "global_step": 82137, "epoch": 1955} {"train_loss": -6.049158096313477, "global_step": 82138, "epoch": 1955} {"train_loss": -6.088935852050781, "global_step": 82139, "epoch": 1955} {"train_loss": -6.2338690757751465, "global_step": 82140, "epoch": 1955} {"train_loss": -6.128298759460449, "global_step": 82141, "epoch": 1955} {"train_loss": -6.189702033996582, "global_step": 82142, "epoch": 1955} {"train_loss": -6.168829917907715, "global_step": 82143, "epoch": 1955} {"train_loss": -6.214363098144531, "global_step": 82144, "epoch": 1955} {"train_loss": -6.288113594055176, "global_step": 82145, "epoch": 1955} {"train_loss": -6.166495323181152, "global_step": 82146, "epoch": 1955} {"train_loss": -6.104158878326416, "global_step": 82147, "epoch": 1955} {"train_loss": -6.143822193145752, "global_step": 82148, "epoch": 1955} {"train_loss": -6.069759845733643, "global_step": 82149, "epoch": 1955} {"train_loss": -6.145261287689209, "global_step": 82150, "epoch": 1955} {"train_loss": -6.1790617761157804, "global_step": 82151, "epoch": 1955, "val_loss": 62652.91015625} {"train_loss": -6.011838912963867, "global_step": 82152, "epoch": 1956} {"train_loss": -6.183287620544434, "global_step": 82153, "epoch": 1956} {"train_loss": -6.106157302856445, "global_step": 82154, "epoch": 1956} {"train_loss": -6.112593650817871, "global_step": 82155, "epoch": 1956} {"train_loss": -6.140282154083252, "global_step": 82156, "epoch": 1956} {"train_loss": -6.041921138763428, "global_step": 82157, "epoch": 1956} {"train_loss": -6.072839260101318, "global_step": 82158, "epoch": 1956} {"train_loss": -6.051537036895752, "global_step": 82159, "epoch": 1956} {"train_loss": -6.150496959686279, "global_step": 82160, "epoch": 1956} {"train_loss": -6.048527240753174, "global_step": 82161, "epoch": 1956} {"train_loss": -6.1034417152404785, "global_step": 82162, "epoch": 1956} {"train_loss": -6.082499027252197, "global_step": 82163, "epoch": 1956} {"train_loss": -6.152100563049316, "global_step": 82164, "epoch": 1956} {"train_loss": -6.036191940307617, "global_step": 82165, "epoch": 1956} {"train_loss": -6.037382125854492, "global_step": 82166, "epoch": 1956} {"train_loss": -5.965731143951416, "global_step": 82167, "epoch": 1956} {"train_loss": -6.0508503913879395, "global_step": 82168, "epoch": 1956} {"train_loss": -6.091081619262695, "global_step": 82169, "epoch": 1956} {"train_loss": -6.160294532775879, "global_step": 82170, "epoch": 1956} {"train_loss": -6.078432083129883, "global_step": 82171, "epoch": 1956} {"train_loss": -6.089599609375, "global_step": 82172, "epoch": 1956} {"train_loss": -6.136697769165039, "global_step": 82173, "epoch": 1956} {"train_loss": -6.1055097579956055, "global_step": 82174, "epoch": 1956} {"train_loss": -6.05638313293457, "global_step": 82175, "epoch": 1956} {"train_loss": -6.086459159851074, "global_step": 82176, "epoch": 1956} {"train_loss": -6.168545722961426, "global_step": 82177, "epoch": 1956} {"train_loss": -6.14290714263916, "global_step": 82178, "epoch": 1956} {"train_loss": -6.305395126342773, "global_step": 82179, "epoch": 1956} {"train_loss": -6.171413421630859, "global_step": 82180, "epoch": 1956} {"train_loss": -6.200007915496826, "global_step": 82181, "epoch": 1956} {"train_loss": -6.135026931762695, "global_step": 82182, "epoch": 1956} {"train_loss": -6.153306007385254, "global_step": 82183, "epoch": 1956} {"train_loss": -6.080837249755859, "global_step": 82184, "epoch": 1956} {"train_loss": -6.036368370056152, "global_step": 82185, "epoch": 1956} {"train_loss": -6.038625717163086, "global_step": 82186, "epoch": 1956} {"train_loss": -6.2534379959106445, "global_step": 82187, "epoch": 1956} {"train_loss": -6.1358184814453125, "global_step": 82188, "epoch": 1956} {"train_loss": -6.077122688293457, "global_step": 82189, "epoch": 1956} {"train_loss": -6.190644264221191, "global_step": 82190, "epoch": 1956} {"train_loss": -6.15230131149292, "global_step": 82191, "epoch": 1956} {"train_loss": -6.0838775634765625, "global_step": 82192, "epoch": 1956} {"train_loss": -6.111905415852864, "global_step": 82193, "epoch": 1956, "val_loss": 62530.33203125} {"train_loss": -6.091886520385742, "global_step": 82194, "epoch": 1957} {"train_loss": -6.212822914123535, "global_step": 82195, "epoch": 1957} {"train_loss": -6.282384872436523, "global_step": 82196, "epoch": 1957} {"train_loss": -6.160795211791992, "global_step": 82197, "epoch": 1957} {"train_loss": -6.133964538574219, "global_step": 82198, "epoch": 1957} {"train_loss": -6.204231262207031, "global_step": 82199, "epoch": 1957} {"train_loss": -6.2808146476745605, "global_step": 82200, "epoch": 1957} {"train_loss": -6.224811553955078, "global_step": 82201, "epoch": 1957} {"train_loss": -6.234304904937744, "global_step": 82202, "epoch": 1957} {"train_loss": -6.2032084465026855, "global_step": 82203, "epoch": 1957} {"train_loss": -6.184523582458496, "global_step": 82204, "epoch": 1957} {"train_loss": -6.232639312744141, "global_step": 82205, "epoch": 1957} {"train_loss": -6.137935638427734, "global_step": 82206, "epoch": 1957} {"train_loss": -6.235702991485596, "global_step": 82207, "epoch": 1957} {"train_loss": -6.204331874847412, "global_step": 82208, "epoch": 1957} {"train_loss": -6.165356636047363, "global_step": 82209, "epoch": 1957} {"train_loss": -6.389484405517578, "global_step": 82210, "epoch": 1957} {"train_loss": -6.301194190979004, "global_step": 82211, "epoch": 1957} {"train_loss": -6.189481735229492, "global_step": 82212, "epoch": 1957} {"train_loss": -6.052473068237305, "global_step": 82213, "epoch": 1957} {"train_loss": -6.264399528503418, "global_step": 82214, "epoch": 1957} {"train_loss": -6.157745361328125, "global_step": 82215, "epoch": 1957} {"train_loss": -6.189723968505859, "global_step": 82216, "epoch": 1957} {"train_loss": -6.182268142700195, "global_step": 82217, "epoch": 1957} {"train_loss": -6.148911476135254, "global_step": 82218, "epoch": 1957} {"train_loss": -6.161525249481201, "global_step": 82219, "epoch": 1957} {"train_loss": -6.241157531738281, "global_step": 82220, "epoch": 1957} {"train_loss": -6.147101402282715, "global_step": 82221, "epoch": 1957} {"train_loss": -6.118000030517578, "global_step": 82222, "epoch": 1957} {"train_loss": -5.979787826538086, "global_step": 82223, "epoch": 1957} {"train_loss": -6.208931922912598, "global_step": 82224, "epoch": 1957} {"train_loss": -6.135185241699219, "global_step": 82225, "epoch": 1957} {"train_loss": -6.137264251708984, "global_step": 82226, "epoch": 1957} {"train_loss": -6.08416748046875, "global_step": 82227, "epoch": 1957} {"train_loss": -6.114501953125, "global_step": 82228, "epoch": 1957} {"train_loss": -6.0194292068481445, "global_step": 82229, "epoch": 1957} {"train_loss": -6.211870193481445, "global_step": 82230, "epoch": 1957} {"train_loss": -6.306881904602051, "global_step": 82231, "epoch": 1957} {"train_loss": -6.305296421051025, "global_step": 82232, "epoch": 1957} {"train_loss": -6.199127197265625, "global_step": 82233, "epoch": 1957} {"train_loss": -6.214069366455078, "global_step": 82234, "epoch": 1957} {"train_loss": -6.18608596211388, "global_step": 82235, "epoch": 1957, "val_loss": 62527.5078125} {"train_loss": -6.20533561706543, "global_step": 82236, "epoch": 1958} {"train_loss": -6.180230617523193, "global_step": 82237, "epoch": 1958} {"train_loss": -6.133597373962402, "global_step": 82238, "epoch": 1958} {"train_loss": -6.157166957855225, "global_step": 82239, "epoch": 1958} {"train_loss": -6.084294319152832, "global_step": 82240, "epoch": 1958} {"train_loss": -6.079511642456055, "global_step": 82241, "epoch": 1958} {"train_loss": -6.183979511260986, "global_step": 82242, "epoch": 1958} {"train_loss": -6.164273738861084, "global_step": 82243, "epoch": 1958} {"train_loss": -6.1182661056518555, "global_step": 82244, "epoch": 1958} {"train_loss": -6.169150352478027, "global_step": 82245, "epoch": 1958} {"train_loss": -6.121243476867676, "global_step": 82246, "epoch": 1958} {"train_loss": -6.099571228027344, "global_step": 82247, "epoch": 1958} {"train_loss": -6.115874290466309, "global_step": 82248, "epoch": 1958} {"train_loss": -6.180096626281738, "global_step": 82249, "epoch": 1958} {"train_loss": -6.237563133239746, "global_step": 82250, "epoch": 1958} {"train_loss": -6.20483922958374, "global_step": 82251, "epoch": 1958} {"train_loss": -6.1720380783081055, "global_step": 82252, "epoch": 1958} {"train_loss": -6.214568138122559, "global_step": 82253, "epoch": 1958} {"train_loss": -6.186342716217041, "global_step": 82254, "epoch": 1958} {"train_loss": -6.1573967933654785, "global_step": 82255, "epoch": 1958} {"train_loss": -6.346562385559082, "global_step": 82256, "epoch": 1958} {"train_loss": -6.244379997253418, "global_step": 82257, "epoch": 1958} {"train_loss": -6.0936384201049805, "global_step": 82258, "epoch": 1958} {"train_loss": -6.234288215637207, "global_step": 82259, "epoch": 1958} {"train_loss": -6.118933200836182, "global_step": 82260, "epoch": 1958} {"train_loss": -6.1286702156066895, "global_step": 82261, "epoch": 1958} {"train_loss": -6.235018253326416, "global_step": 82262, "epoch": 1958} {"train_loss": -6.078872203826904, "global_step": 82263, "epoch": 1958} {"train_loss": -6.203479766845703, "global_step": 82264, "epoch": 1958} {"train_loss": -6.138956069946289, "global_step": 82265, "epoch": 1958} {"train_loss": -6.194306373596191, "global_step": 82266, "epoch": 1958} {"train_loss": -6.186763286590576, "global_step": 82267, "epoch": 1958} {"train_loss": -6.186557769775391, "global_step": 82268, "epoch": 1958} {"train_loss": -6.174023151397705, "global_step": 82269, "epoch": 1958} {"train_loss": -6.164365768432617, "global_step": 82270, "epoch": 1958} {"train_loss": -6.145837783813477, "global_step": 82271, "epoch": 1958} {"train_loss": -6.007355213165283, "global_step": 82272, "epoch": 1958} {"train_loss": -6.161811828613281, "global_step": 82273, "epoch": 1958} {"train_loss": -6.09490966796875, "global_step": 82274, "epoch": 1958} {"train_loss": -6.13557243347168, "global_step": 82275, "epoch": 1958} {"train_loss": -6.2352375984191895, "global_step": 82276, "epoch": 1958} {"train_loss": -6.163137731097994, "global_step": 82277, "epoch": 1958, "val_loss": 62478.97265625} {"train_loss": -6.131556510925293, "global_step": 82278, "epoch": 1959} {"train_loss": -6.279090881347656, "global_step": 82279, "epoch": 1959} {"train_loss": -6.214690208435059, "global_step": 82280, "epoch": 1959} {"train_loss": -6.247088432312012, "global_step": 82281, "epoch": 1959} {"train_loss": -6.127083778381348, "global_step": 82282, "epoch": 1959} {"train_loss": -6.1123504638671875, "global_step": 82283, "epoch": 1959} {"train_loss": -6.258730888366699, "global_step": 82284, "epoch": 1959} {"train_loss": -6.152229309082031, "global_step": 82285, "epoch": 1959} {"train_loss": -6.129250526428223, "global_step": 82286, "epoch": 1959} {"train_loss": -6.171811580657959, "global_step": 82287, "epoch": 1959} {"train_loss": -6.119206428527832, "global_step": 82288, "epoch": 1959} {"train_loss": -6.167729377746582, "global_step": 82289, "epoch": 1959} {"train_loss": -6.203094482421875, "global_step": 82290, "epoch": 1959} {"train_loss": -6.317766189575195, "global_step": 82291, "epoch": 1959} {"train_loss": -6.202359199523926, "global_step": 82292, "epoch": 1959} {"train_loss": -6.130404472351074, "global_step": 82293, "epoch": 1959} {"train_loss": -6.137383460998535, "global_step": 82294, "epoch": 1959} {"train_loss": -6.17409610748291, "global_step": 82295, "epoch": 1959} {"train_loss": -6.165868282318115, "global_step": 82296, "epoch": 1959} {"train_loss": -6.17767333984375, "global_step": 82297, "epoch": 1959} {"train_loss": -6.191529273986816, "global_step": 82298, "epoch": 1959} {"train_loss": -6.13271427154541, "global_step": 82299, "epoch": 1959} {"train_loss": -6.24860954284668, "global_step": 82300, "epoch": 1959} {"train_loss": -6.134553909301758, "global_step": 82301, "epoch": 1959} {"train_loss": -6.126331329345703, "global_step": 82302, "epoch": 1959} {"train_loss": -6.055938720703125, "global_step": 82303, "epoch": 1959} {"train_loss": -6.152747631072998, "global_step": 82304, "epoch": 1959} {"train_loss": -6.214710235595703, "global_step": 82305, "epoch": 1959} {"train_loss": -6.17970085144043, "global_step": 82306, "epoch": 1959} {"train_loss": -6.094726085662842, "global_step": 82307, "epoch": 1959} {"train_loss": -6.22105598449707, "global_step": 82308, "epoch": 1959} {"train_loss": -6.1230926513671875, "global_step": 82309, "epoch": 1959} {"train_loss": -6.209842205047607, "global_step": 82310, "epoch": 1959} {"train_loss": -6.041556358337402, "global_step": 82311, "epoch": 1959} {"train_loss": -5.998382568359375, "global_step": 82312, "epoch": 1959} {"train_loss": -6.0704803466796875, "global_step": 82313, "epoch": 1959} {"train_loss": -6.0821943283081055, "global_step": 82314, "epoch": 1959} {"train_loss": -6.219526767730713, "global_step": 82315, "epoch": 1959} {"train_loss": -6.121899127960205, "global_step": 82316, "epoch": 1959} {"train_loss": -6.140548229217529, "global_step": 82317, "epoch": 1959} {"train_loss": -6.090882301330566, "global_step": 82318, "epoch": 1959} {"train_loss": -6.156021038691203, "global_step": 82319, "epoch": 1959, "val_loss": 62576.5625} {"train_loss": -6.032374858856201, "global_step": 82320, "epoch": 1960} {"train_loss": -6.291998863220215, "global_step": 82321, "epoch": 1960} {"train_loss": -6.091256141662598, "global_step": 82322, "epoch": 1960} {"train_loss": -6.129344940185547, "global_step": 82323, "epoch": 1960} {"train_loss": -6.060856819152832, "global_step": 82324, "epoch": 1960} {"train_loss": -6.187032699584961, "global_step": 82325, "epoch": 1960} {"train_loss": -6.050347805023193, "global_step": 82326, "epoch": 1960} {"train_loss": -6.0808868408203125, "global_step": 82327, "epoch": 1960} {"train_loss": -6.053888320922852, "global_step": 82328, "epoch": 1960} {"train_loss": -6.196107864379883, "global_step": 82329, "epoch": 1960} {"train_loss": -6.183707237243652, "global_step": 82330, "epoch": 1960} {"train_loss": -6.188103675842285, "global_step": 82331, "epoch": 1960} {"train_loss": -6.335502624511719, "global_step": 82332, "epoch": 1960} {"train_loss": -6.145655632019043, "global_step": 82333, "epoch": 1960} {"train_loss": -6.189691543579102, "global_step": 82334, "epoch": 1960} {"train_loss": -6.190457344055176, "global_step": 82335, "epoch": 1960} {"train_loss": -6.1897382736206055, "global_step": 82336, "epoch": 1960} {"train_loss": -6.236577033996582, "global_step": 82337, "epoch": 1960} {"train_loss": -6.105153560638428, "global_step": 82338, "epoch": 1960} {"train_loss": -6.190977573394775, "global_step": 82339, "epoch": 1960} {"train_loss": -6.135902404785156, "global_step": 82340, "epoch": 1960} {"train_loss": -6.162481307983398, "global_step": 82341, "epoch": 1960} {"train_loss": -6.137884140014648, "global_step": 82342, "epoch": 1960} {"train_loss": -6.263732433319092, "global_step": 82343, "epoch": 1960} {"train_loss": -6.205327033996582, "global_step": 82344, "epoch": 1960} {"train_loss": -6.160214900970459, "global_step": 82345, "epoch": 1960} {"train_loss": -6.166669845581055, "global_step": 82346, "epoch": 1960} {"train_loss": -6.133878231048584, "global_step": 82347, "epoch": 1960} {"train_loss": -6.237720012664795, "global_step": 82348, "epoch": 1960} {"train_loss": -6.196211814880371, "global_step": 82349, "epoch": 1960} {"train_loss": -6.128446102142334, "global_step": 82350, "epoch": 1960} {"train_loss": -6.251583099365234, "global_step": 82351, "epoch": 1960} {"train_loss": -6.238766670227051, "global_step": 82352, "epoch": 1960} {"train_loss": -6.241888523101807, "global_step": 82353, "epoch": 1960} {"train_loss": -6.196102142333984, "global_step": 82354, "epoch": 1960} {"train_loss": -6.14930534362793, "global_step": 82355, "epoch": 1960} {"train_loss": -6.183727264404297, "global_step": 82356, "epoch": 1960} {"train_loss": -6.194430828094482, "global_step": 82357, "epoch": 1960} {"train_loss": -6.182748794555664, "global_step": 82358, "epoch": 1960} {"train_loss": -6.189177513122559, "global_step": 82359, "epoch": 1960} {"train_loss": -6.202948570251465, "global_step": 82360, "epoch": 1960} {"train_loss": -6.1756880851019, "global_step": 82361, "epoch": 1960, "val_loss": 62399.0390625} {"train_loss": -6.250241756439209, "global_step": 82362, "epoch": 1961} {"train_loss": -6.241727828979492, "global_step": 82363, "epoch": 1961} {"train_loss": -6.2024431228637695, "global_step": 82364, "epoch": 1961} {"train_loss": -6.191426753997803, "global_step": 82365, "epoch": 1961} {"train_loss": -6.18580436706543, "global_step": 82366, "epoch": 1961} {"train_loss": -6.127415657043457, "global_step": 82367, "epoch": 1961} {"train_loss": -6.136890411376953, "global_step": 82368, "epoch": 1961} {"train_loss": -6.165733337402344, "global_step": 82369, "epoch": 1961} {"train_loss": -6.298181056976318, "global_step": 82370, "epoch": 1961} {"train_loss": -6.1751837730407715, "global_step": 82371, "epoch": 1961} {"train_loss": -6.261281967163086, "global_step": 82372, "epoch": 1961} {"train_loss": -6.235287666320801, "global_step": 82373, "epoch": 1961} {"train_loss": -6.098984718322754, "global_step": 82374, "epoch": 1961} {"train_loss": -6.213594436645508, "global_step": 82375, "epoch": 1961} {"train_loss": -6.285484790802002, "global_step": 82376, "epoch": 1961} {"train_loss": -6.279366493225098, "global_step": 82377, "epoch": 1961} {"train_loss": -6.250194549560547, "global_step": 82378, "epoch": 1961} {"train_loss": -6.151174545288086, "global_step": 82379, "epoch": 1961} {"train_loss": -6.202614784240723, "global_step": 82380, "epoch": 1961} {"train_loss": -6.047117233276367, "global_step": 82381, "epoch": 1961} {"train_loss": -6.177786350250244, "global_step": 82382, "epoch": 1961} {"train_loss": -6.084152698516846, "global_step": 82383, "epoch": 1961} {"train_loss": -6.262187957763672, "global_step": 82384, "epoch": 1961} {"train_loss": -6.169053077697754, "global_step": 82385, "epoch": 1961} {"train_loss": -6.05780029296875, "global_step": 82386, "epoch": 1961} {"train_loss": -6.194886207580566, "global_step": 82387, "epoch": 1961} {"train_loss": -6.083189964294434, "global_step": 82388, "epoch": 1961} {"train_loss": -6.156659126281738, "global_step": 82389, "epoch": 1961} {"train_loss": -6.1559834480285645, "global_step": 82390, "epoch": 1961} {"train_loss": -6.118763446807861, "global_step": 82391, "epoch": 1961} {"train_loss": -6.215801239013672, "global_step": 82392, "epoch": 1961} {"train_loss": -6.153229236602783, "global_step": 82393, "epoch": 1961} {"train_loss": -6.179194450378418, "global_step": 82394, "epoch": 1961} {"train_loss": -6.190813064575195, "global_step": 82395, "epoch": 1961} {"train_loss": -6.2662353515625, "global_step": 82396, "epoch": 1961} {"train_loss": -6.157214164733887, "global_step": 82397, "epoch": 1961} {"train_loss": -6.270107746124268, "global_step": 82398, "epoch": 1961} {"train_loss": -6.236156463623047, "global_step": 82399, "epoch": 1961} {"train_loss": -6.1602325439453125, "global_step": 82400, "epoch": 1961} {"train_loss": -6.2137837409973145, "global_step": 82401, "epoch": 1961} {"train_loss": -6.155886650085449, "global_step": 82402, "epoch": 1961} {"train_loss": -6.188511178607032, "global_step": 82403, "epoch": 1961, "val_loss": 62396.515625} {"train_loss": -6.156640529632568, "global_step": 82404, "epoch": 1962} {"train_loss": -6.1854658126831055, "global_step": 82405, "epoch": 1962} {"train_loss": -6.2627973556518555, "global_step": 82406, "epoch": 1962} {"train_loss": -6.2236857414245605, "global_step": 82407, "epoch": 1962} {"train_loss": -6.09805965423584, "global_step": 82408, "epoch": 1962} {"train_loss": -6.170965194702148, "global_step": 82409, "epoch": 1962} {"train_loss": -6.222643852233887, "global_step": 82410, "epoch": 1962} {"train_loss": -6.271826267242432, "global_step": 82411, "epoch": 1962} {"train_loss": -6.1947736740112305, "global_step": 82412, "epoch": 1962} {"train_loss": -6.180928707122803, "global_step": 82413, "epoch": 1962} {"train_loss": -6.168633460998535, "global_step": 82414, "epoch": 1962} {"train_loss": -6.181746482849121, "global_step": 82415, "epoch": 1962} {"train_loss": -6.273044109344482, "global_step": 82416, "epoch": 1962} {"train_loss": -6.21954870223999, "global_step": 82417, "epoch": 1962} {"train_loss": -6.186025142669678, "global_step": 82418, "epoch": 1962} {"train_loss": -6.163081645965576, "global_step": 82419, "epoch": 1962} {"train_loss": -6.174991607666016, "global_step": 82420, "epoch": 1962} {"train_loss": -6.171158313751221, "global_step": 82421, "epoch": 1962} {"train_loss": -6.158834934234619, "global_step": 82422, "epoch": 1962} {"train_loss": -6.234567165374756, "global_step": 82423, "epoch": 1962} {"train_loss": -6.056427955627441, "global_step": 82424, "epoch": 1962} {"train_loss": -6.176819801330566, "global_step": 82425, "epoch": 1962} {"train_loss": -6.169015884399414, "global_step": 82426, "epoch": 1962} {"train_loss": -6.27107572555542, "global_step": 82427, "epoch": 1962} {"train_loss": -6.19320011138916, "global_step": 82428, "epoch": 1962} {"train_loss": -6.11885929107666, "global_step": 82429, "epoch": 1962} {"train_loss": -6.1603498458862305, "global_step": 82430, "epoch": 1962} {"train_loss": -6.176485061645508, "global_step": 82431, "epoch": 1962} {"train_loss": -6.165308475494385, "global_step": 82432, "epoch": 1962} {"train_loss": -6.181652545928955, "global_step": 82433, "epoch": 1962} {"train_loss": -6.282529830932617, "global_step": 82434, "epoch": 1962} {"train_loss": -6.140655517578125, "global_step": 82435, "epoch": 1962} {"train_loss": -6.0786895751953125, "global_step": 82436, "epoch": 1962} {"train_loss": -6.192990303039551, "global_step": 82437, "epoch": 1962} {"train_loss": -6.132953643798828, "global_step": 82438, "epoch": 1962} {"train_loss": -6.0521087646484375, "global_step": 82439, "epoch": 1962} {"train_loss": -6.189474105834961, "global_step": 82440, "epoch": 1962} {"train_loss": -6.275423049926758, "global_step": 82441, "epoch": 1962} {"train_loss": -6.2672810554504395, "global_step": 82442, "epoch": 1962} {"train_loss": -6.118263244628906, "global_step": 82443, "epoch": 1962} {"train_loss": -6.187159538269043, "global_step": 82444, "epoch": 1962} {"train_loss": -6.179692302431379, "global_step": 82445, "epoch": 1962, "val_loss": 62593.96875} {"train_loss": -6.152899742126465, "global_step": 82446, "epoch": 1963} {"train_loss": -6.096343517303467, "global_step": 82447, "epoch": 1963} {"train_loss": -6.12300443649292, "global_step": 82448, "epoch": 1963} {"train_loss": -6.137117385864258, "global_step": 82449, "epoch": 1963} {"train_loss": -6.128513336181641, "global_step": 82450, "epoch": 1963} {"train_loss": -6.033783912658691, "global_step": 82451, "epoch": 1963} {"train_loss": -6.22745418548584, "global_step": 82452, "epoch": 1963} {"train_loss": -6.265567779541016, "global_step": 82453, "epoch": 1963} {"train_loss": -6.165587425231934, "global_step": 82454, "epoch": 1963} {"train_loss": -6.228815078735352, "global_step": 82455, "epoch": 1963} {"train_loss": -6.36818790435791, "global_step": 82456, "epoch": 1963} {"train_loss": -6.223319053649902, "global_step": 82457, "epoch": 1963} {"train_loss": -6.199827194213867, "global_step": 82458, "epoch": 1963} {"train_loss": -6.09598445892334, "global_step": 82459, "epoch": 1963} {"train_loss": -6.221580505371094, "global_step": 82460, "epoch": 1963} {"train_loss": -6.171160697937012, "global_step": 82461, "epoch": 1963} {"train_loss": -6.181921482086182, "global_step": 82462, "epoch": 1963} {"train_loss": -6.1710896492004395, "global_step": 82463, "epoch": 1963} {"train_loss": -6.066133499145508, "global_step": 82464, "epoch": 1963} {"train_loss": -6.212501049041748, "global_step": 82465, "epoch": 1963} {"train_loss": -5.913017272949219, "global_step": 82466, "epoch": 1963} {"train_loss": -5.970591068267822, "global_step": 82467, "epoch": 1963} {"train_loss": -6.270181655883789, "global_step": 82468, "epoch": 1963} {"train_loss": -5.987316131591797, "global_step": 82469, "epoch": 1963} {"train_loss": -6.009106636047363, "global_step": 82470, "epoch": 1963} {"train_loss": -5.980571746826172, "global_step": 82471, "epoch": 1963} {"train_loss": -6.102941513061523, "global_step": 82472, "epoch": 1963} {"train_loss": -6.098964214324951, "global_step": 82473, "epoch": 1963} {"train_loss": -6.1687188148498535, "global_step": 82474, "epoch": 1963} {"train_loss": -6.187391757965088, "global_step": 82475, "epoch": 1963} {"train_loss": -6.157443046569824, "global_step": 82476, "epoch": 1963} {"train_loss": -6.119027614593506, "global_step": 82477, "epoch": 1963} {"train_loss": -6.133430480957031, "global_step": 82478, "epoch": 1963} {"train_loss": -6.10001802444458, "global_step": 82479, "epoch": 1963} {"train_loss": -6.168442249298096, "global_step": 82480, "epoch": 1963} {"train_loss": -6.104554653167725, "global_step": 82481, "epoch": 1963} {"train_loss": -6.019924163818359, "global_step": 82482, "epoch": 1963} {"train_loss": -6.094758987426758, "global_step": 82483, "epoch": 1963} {"train_loss": -6.140317916870117, "global_step": 82484, "epoch": 1963} {"train_loss": -6.156980991363525, "global_step": 82485, "epoch": 1963} {"train_loss": -6.114279747009277, "global_step": 82486, "epoch": 1963} {"train_loss": -6.133313837505522, "global_step": 82487, "epoch": 1963, "val_loss": 62630.84375} {"train_loss": -6.16285514831543, "global_step": 82488, "epoch": 1964} {"train_loss": -6.16074275970459, "global_step": 82489, "epoch": 1964} {"train_loss": -6.122956275939941, "global_step": 82490, "epoch": 1964} {"train_loss": -6.1475372314453125, "global_step": 82491, "epoch": 1964} {"train_loss": -6.148001670837402, "global_step": 82492, "epoch": 1964} {"train_loss": -6.135524749755859, "global_step": 82493, "epoch": 1964} {"train_loss": -6.238711357116699, "global_step": 82494, "epoch": 1964} {"train_loss": -6.195908546447754, "global_step": 82495, "epoch": 1964} {"train_loss": -6.2737226486206055, "global_step": 82496, "epoch": 1964} {"train_loss": -6.028481960296631, "global_step": 82497, "epoch": 1964} {"train_loss": -6.176602363586426, "global_step": 82498, "epoch": 1964} {"train_loss": -6.196349143981934, "global_step": 82499, "epoch": 1964} {"train_loss": -6.172634124755859, "global_step": 82500, "epoch": 1964} {"train_loss": -6.181099891662598, "global_step": 82501, "epoch": 1964} {"train_loss": -6.206737995147705, "global_step": 82502, "epoch": 1964} {"train_loss": -6.2120819091796875, "global_step": 82503, "epoch": 1964} {"train_loss": -6.14637565612793, "global_step": 82504, "epoch": 1964} {"train_loss": -6.153552055358887, "global_step": 82505, "epoch": 1964} {"train_loss": -6.309229373931885, "global_step": 82506, "epoch": 1964} {"train_loss": -6.127765655517578, "global_step": 82507, "epoch": 1964} {"train_loss": -6.284687519073486, "global_step": 82508, "epoch": 1964} {"train_loss": -6.2273454666137695, "global_step": 82509, "epoch": 1964} {"train_loss": -6.186978340148926, "global_step": 82510, "epoch": 1964} {"train_loss": -6.05602502822876, "global_step": 82511, "epoch": 1964} {"train_loss": -6.255350589752197, "global_step": 82512, "epoch": 1964} {"train_loss": -6.241389274597168, "global_step": 82513, "epoch": 1964} {"train_loss": -6.140482425689697, "global_step": 82514, "epoch": 1964} {"train_loss": -6.226141929626465, "global_step": 82515, "epoch": 1964} {"train_loss": -6.156130313873291, "global_step": 82516, "epoch": 1964} {"train_loss": -6.131360054016113, "global_step": 82517, "epoch": 1964} {"train_loss": -6.229814529418945, "global_step": 82518, "epoch": 1964} {"train_loss": -6.296994686126709, "global_step": 82519, "epoch": 1964} {"train_loss": -6.240534782409668, "global_step": 82520, "epoch": 1964} {"train_loss": -6.23172664642334, "global_step": 82521, "epoch": 1964} {"train_loss": -6.1490044593811035, "global_step": 82522, "epoch": 1964} {"train_loss": -6.1945600509643555, "global_step": 82523, "epoch": 1964} {"train_loss": -6.301947593688965, "global_step": 82524, "epoch": 1964} {"train_loss": -6.241901874542236, "global_step": 82525, "epoch": 1964} {"train_loss": -6.144904613494873, "global_step": 82526, "epoch": 1964} {"train_loss": -6.289693832397461, "global_step": 82527, "epoch": 1964} {"train_loss": -6.235655784606934, "global_step": 82528, "epoch": 1964} {"train_loss": -6.194787456875756, "global_step": 82529, "epoch": 1964, "val_loss": 62542.2265625} {"train_loss": -6.267887592315674, "global_step": 82530, "epoch": 1965} {"train_loss": -6.277558326721191, "global_step": 82531, "epoch": 1965} {"train_loss": -6.172540664672852, "global_step": 82532, "epoch": 1965} {"train_loss": -6.203819274902344, "global_step": 82533, "epoch": 1965} {"train_loss": -6.338927268981934, "global_step": 82534, "epoch": 1965} {"train_loss": -6.115900993347168, "global_step": 82535, "epoch": 1965} {"train_loss": -6.14997673034668, "global_step": 82536, "epoch": 1965} {"train_loss": -6.183772087097168, "global_step": 82537, "epoch": 1965} {"train_loss": -6.2549333572387695, "global_step": 82538, "epoch": 1965} {"train_loss": -6.256821632385254, "global_step": 82539, "epoch": 1965} {"train_loss": -6.226587772369385, "global_step": 82540, "epoch": 1965} {"train_loss": -6.141822814941406, "global_step": 82541, "epoch": 1965} {"train_loss": -6.185030937194824, "global_step": 82542, "epoch": 1965} {"train_loss": -6.164882183074951, "global_step": 82543, "epoch": 1965} {"train_loss": -6.114621639251709, "global_step": 82544, "epoch": 1965} {"train_loss": -6.236294746398926, "global_step": 82545, "epoch": 1965} {"train_loss": -6.094181060791016, "global_step": 82546, "epoch": 1965} {"train_loss": -6.083095550537109, "global_step": 82547, "epoch": 1965} {"train_loss": -6.149681091308594, "global_step": 82548, "epoch": 1965} {"train_loss": -6.157928466796875, "global_step": 82549, "epoch": 1965} {"train_loss": -6.182459831237793, "global_step": 82550, "epoch": 1965} {"train_loss": -6.111128807067871, "global_step": 82551, "epoch": 1965} {"train_loss": -6.2558183670043945, "global_step": 82552, "epoch": 1965} {"train_loss": -6.135653018951416, "global_step": 82553, "epoch": 1965} {"train_loss": -6.208474159240723, "global_step": 82554, "epoch": 1965} {"train_loss": -6.244320869445801, "global_step": 82555, "epoch": 1965} {"train_loss": -6.202764511108398, "global_step": 82556, "epoch": 1965} {"train_loss": -6.1183881759643555, "global_step": 82557, "epoch": 1965} {"train_loss": -6.118256092071533, "global_step": 82558, "epoch": 1965} {"train_loss": -6.27773380279541, "global_step": 82559, "epoch": 1965} {"train_loss": -6.29580545425415, "global_step": 82560, "epoch": 1965} {"train_loss": -6.223111152648926, "global_step": 82561, "epoch": 1965} {"train_loss": -6.213149070739746, "global_step": 82562, "epoch": 1965} {"train_loss": -6.09906530380249, "global_step": 82563, "epoch": 1965} {"train_loss": -6.086138725280762, "global_step": 82564, "epoch": 1965} {"train_loss": -6.130887985229492, "global_step": 82565, "epoch": 1965} {"train_loss": -6.190517425537109, "global_step": 82566, "epoch": 1965} {"train_loss": -6.242648124694824, "global_step": 82567, "epoch": 1965} {"train_loss": -6.175509452819824, "global_step": 82568, "epoch": 1965} {"train_loss": -6.1893720626831055, "global_step": 82569, "epoch": 1965} {"train_loss": -6.07427978515625, "global_step": 82570, "epoch": 1965} {"train_loss": -6.181863807496571, "global_step": 82571, "epoch": 1965, "val_loss": 62626.80078125} {"train_loss": -6.196593284606934, "global_step": 82572, "epoch": 1966} {"train_loss": -6.342723369598389, "global_step": 82573, "epoch": 1966} {"train_loss": -6.066473960876465, "global_step": 82574, "epoch": 1966} {"train_loss": -6.093395233154297, "global_step": 82575, "epoch": 1966} {"train_loss": -6.00893497467041, "global_step": 82576, "epoch": 1966} {"train_loss": -6.225836277008057, "global_step": 82577, "epoch": 1966} {"train_loss": -5.981610298156738, "global_step": 82578, "epoch": 1966} {"train_loss": -6.052961349487305, "global_step": 82579, "epoch": 1966} {"train_loss": -6.145886421203613, "global_step": 82580, "epoch": 1966} {"train_loss": -6.043514251708984, "global_step": 82581, "epoch": 1966} {"train_loss": -6.0333099365234375, "global_step": 82582, "epoch": 1966} {"train_loss": -6.012537956237793, "global_step": 82583, "epoch": 1966} {"train_loss": -6.079148292541504, "global_step": 82584, "epoch": 1966} {"train_loss": -6.142322540283203, "global_step": 82585, "epoch": 1966} {"train_loss": -6.0260725021362305, "global_step": 82586, "epoch": 1966} {"train_loss": -6.196640491485596, "global_step": 82587, "epoch": 1966} {"train_loss": -6.062344551086426, "global_step": 82588, "epoch": 1966} {"train_loss": -6.1692094802856445, "global_step": 82589, "epoch": 1966} {"train_loss": -6.009735107421875, "global_step": 82590, "epoch": 1966} {"train_loss": -6.218409538269043, "global_step": 82591, "epoch": 1966} {"train_loss": -6.043081283569336, "global_step": 82592, "epoch": 1966} {"train_loss": -6.037337779998779, "global_step": 82593, "epoch": 1966} {"train_loss": -6.084015846252441, "global_step": 82594, "epoch": 1966} {"train_loss": -6.075098991394043, "global_step": 82595, "epoch": 1966} {"train_loss": -6.068581581115723, "global_step": 82596, "epoch": 1966} {"train_loss": -6.11232852935791, "global_step": 82597, "epoch": 1966} {"train_loss": -6.1648335456848145, "global_step": 82598, "epoch": 1966} {"train_loss": -6.064641952514648, "global_step": 82599, "epoch": 1966} {"train_loss": -6.171074390411377, "global_step": 82600, "epoch": 1966} {"train_loss": -6.219860076904297, "global_step": 82601, "epoch": 1966} {"train_loss": -6.099306106567383, "global_step": 82602, "epoch": 1966} {"train_loss": -6.117979049682617, "global_step": 82603, "epoch": 1966} {"train_loss": -6.183061122894287, "global_step": 82604, "epoch": 1966} {"train_loss": -6.098407745361328, "global_step": 82605, "epoch": 1966} {"train_loss": -6.248229026794434, "global_step": 82606, "epoch": 1966} {"train_loss": -6.242466926574707, "global_step": 82607, "epoch": 1966} {"train_loss": -6.121325969696045, "global_step": 82608, "epoch": 1966} {"train_loss": -6.146727561950684, "global_step": 82609, "epoch": 1966} {"train_loss": -6.172192573547363, "global_step": 82610, "epoch": 1966} {"train_loss": -6.175640106201172, "global_step": 82611, "epoch": 1966} {"train_loss": -6.135983467102051, "global_step": 82612, "epoch": 1966} {"train_loss": -6.118235133943104, "global_step": 82613, "epoch": 1966, "val_loss": 62653.0390625} {"train_loss": -6.227837562561035, "global_step": 82614, "epoch": 1967} {"train_loss": -6.163332939147949, "global_step": 82615, "epoch": 1967} {"train_loss": -6.119333267211914, "global_step": 82616, "epoch": 1967} {"train_loss": -6.276122093200684, "global_step": 82617, "epoch": 1967} {"train_loss": -6.10765266418457, "global_step": 82618, "epoch": 1967} {"train_loss": -6.216621398925781, "global_step": 82619, "epoch": 1967} {"train_loss": -6.210750579833984, "global_step": 82620, "epoch": 1967} {"train_loss": -6.1628570556640625, "global_step": 82621, "epoch": 1967} {"train_loss": -6.2083330154418945, "global_step": 82622, "epoch": 1967} {"train_loss": -6.140851020812988, "global_step": 82623, "epoch": 1967} {"train_loss": -6.206478118896484, "global_step": 82624, "epoch": 1967} {"train_loss": -6.219032287597656, "global_step": 82625, "epoch": 1967} {"train_loss": -6.068020343780518, "global_step": 82626, "epoch": 1967} {"train_loss": -6.226408004760742, "global_step": 82627, "epoch": 1967} {"train_loss": -6.063740253448486, "global_step": 82628, "epoch": 1967} {"train_loss": -6.2121262550354, "global_step": 82629, "epoch": 1967} {"train_loss": -6.100456237792969, "global_step": 82630, "epoch": 1967} {"train_loss": -6.09133243560791, "global_step": 82631, "epoch": 1967} {"train_loss": -6.0416717529296875, "global_step": 82632, "epoch": 1967} {"train_loss": -6.074756622314453, "global_step": 82633, "epoch": 1967} {"train_loss": -6.117317199707031, "global_step": 82634, "epoch": 1967} {"train_loss": -6.1594648361206055, "global_step": 82635, "epoch": 1967} {"train_loss": -6.188813209533691, "global_step": 82636, "epoch": 1967} {"train_loss": -6.212137222290039, "global_step": 82637, "epoch": 1967} {"train_loss": -6.0172858238220215, "global_step": 82638, "epoch": 1967} {"train_loss": -6.16811466217041, "global_step": 82639, "epoch": 1967} {"train_loss": -6.137444496154785, "global_step": 82640, "epoch": 1967} {"train_loss": -6.103046417236328, "global_step": 82641, "epoch": 1967} {"train_loss": -6.086997032165527, "global_step": 82642, "epoch": 1967} {"train_loss": -6.087535858154297, "global_step": 82643, "epoch": 1967} {"train_loss": -6.151759624481201, "global_step": 82644, "epoch": 1967} {"train_loss": -6.200139045715332, "global_step": 82645, "epoch": 1967} {"train_loss": -6.117059707641602, "global_step": 82646, "epoch": 1967} {"train_loss": -6.129251480102539, "global_step": 82647, "epoch": 1967} {"train_loss": -6.251550197601318, "global_step": 82648, "epoch": 1967} {"train_loss": -6.187579154968262, "global_step": 82649, "epoch": 1967} {"train_loss": -6.18732213973999, "global_step": 82650, "epoch": 1967} {"train_loss": -6.188490867614746, "global_step": 82651, "epoch": 1967} {"train_loss": -6.26963996887207, "global_step": 82652, "epoch": 1967} {"train_loss": -6.1523590087890625, "global_step": 82653, "epoch": 1967} {"train_loss": -6.212579250335693, "global_step": 82654, "epoch": 1967} {"train_loss": -6.157282136735462, "global_step": 82655, "epoch": 1967, "val_loss": 62620.453125} {"train_loss": -6.231195449829102, "global_step": 82656, "epoch": 1968} {"train_loss": -6.027434349060059, "global_step": 82657, "epoch": 1968} {"train_loss": -6.266478061676025, "global_step": 82658, "epoch": 1968} {"train_loss": -6.220644950866699, "global_step": 82659, "epoch": 1968} {"train_loss": -6.124154090881348, "global_step": 82660, "epoch": 1968} {"train_loss": -6.255622863769531, "global_step": 82661, "epoch": 1968} {"train_loss": -6.220066070556641, "global_step": 82662, "epoch": 1968} {"train_loss": -6.122672080993652, "global_step": 82663, "epoch": 1968} {"train_loss": -5.986081600189209, "global_step": 82664, "epoch": 1968} {"train_loss": -6.054078102111816, "global_step": 82665, "epoch": 1968} {"train_loss": -5.9590253829956055, "global_step": 82666, "epoch": 1968} {"train_loss": -6.050992965698242, "global_step": 82667, "epoch": 1968} {"train_loss": -5.980430603027344, "global_step": 82668, "epoch": 1968} {"train_loss": -6.108916759490967, "global_step": 82669, "epoch": 1968} {"train_loss": -6.095863342285156, "global_step": 82670, "epoch": 1968} {"train_loss": -6.018414497375488, "global_step": 82671, "epoch": 1968} {"train_loss": -6.219677925109863, "global_step": 82672, "epoch": 1968} {"train_loss": -6.231453895568848, "global_step": 82673, "epoch": 1968} {"train_loss": -6.188395023345947, "global_step": 82674, "epoch": 1968} {"train_loss": -6.164026260375977, "global_step": 82675, "epoch": 1968} {"train_loss": -6.203577041625977, "global_step": 82676, "epoch": 1968} {"train_loss": -6.221075057983398, "global_step": 82677, "epoch": 1968} {"train_loss": -6.233839988708496, "global_step": 82678, "epoch": 1968} {"train_loss": -6.110838890075684, "global_step": 82679, "epoch": 1968} {"train_loss": -6.153845310211182, "global_step": 82680, "epoch": 1968} {"train_loss": -6.165960311889648, "global_step": 82681, "epoch": 1968} {"train_loss": -6.14427375793457, "global_step": 82682, "epoch": 1968} {"train_loss": -6.083322525024414, "global_step": 82683, "epoch": 1968} {"train_loss": -6.199159622192383, "global_step": 82684, "epoch": 1968} {"train_loss": -6.204275131225586, "global_step": 82685, "epoch": 1968} {"train_loss": -6.245245933532715, "global_step": 82686, "epoch": 1968} {"train_loss": -6.151065826416016, "global_step": 82687, "epoch": 1968} {"train_loss": -6.240087509155273, "global_step": 82688, "epoch": 1968} {"train_loss": -6.175561428070068, "global_step": 82689, "epoch": 1968} {"train_loss": -6.052658557891846, "global_step": 82690, "epoch": 1968} {"train_loss": -6.104099273681641, "global_step": 82691, "epoch": 1968} {"train_loss": -6.262520790100098, "global_step": 82692, "epoch": 1968} {"train_loss": -6.215296745300293, "global_step": 82693, "epoch": 1968} {"train_loss": -6.284492492675781, "global_step": 82694, "epoch": 1968} {"train_loss": -6.207456588745117, "global_step": 82695, "epoch": 1968} {"train_loss": -6.163434028625488, "global_step": 82696, "epoch": 1968} {"train_loss": -6.157330319994972, "global_step": 82697, "epoch": 1968, "val_loss": 62359.01953125} {"train_loss": -6.2411088943481445, "global_step": 82698, "epoch": 1969} {"train_loss": -6.125359535217285, "global_step": 82699, "epoch": 1969} {"train_loss": -6.112979888916016, "global_step": 82700, "epoch": 1969} {"train_loss": -6.1838579177856445, "global_step": 82701, "epoch": 1969} {"train_loss": -6.11894416809082, "global_step": 82702, "epoch": 1969} {"train_loss": -6.245669364929199, "global_step": 82703, "epoch": 1969} {"train_loss": -6.223188400268555, "global_step": 82704, "epoch": 1969} {"train_loss": -6.01181697845459, "global_step": 82705, "epoch": 1969} {"train_loss": -6.228476524353027, "global_step": 82706, "epoch": 1969} {"train_loss": -6.236017227172852, "global_step": 82707, "epoch": 1969} {"train_loss": -6.181731700897217, "global_step": 82708, "epoch": 1969} {"train_loss": -6.242620468139648, "global_step": 82709, "epoch": 1969} {"train_loss": -6.167661190032959, "global_step": 82710, "epoch": 1969} {"train_loss": -6.3641533851623535, "global_step": 82711, "epoch": 1969} {"train_loss": -6.174064636230469, "global_step": 82712, "epoch": 1969} {"train_loss": -6.210609436035156, "global_step": 82713, "epoch": 1969} {"train_loss": -6.24373722076416, "global_step": 82714, "epoch": 1969} {"train_loss": -6.254387378692627, "global_step": 82715, "epoch": 1969} {"train_loss": -6.136677265167236, "global_step": 82716, "epoch": 1969} {"train_loss": -6.277345657348633, "global_step": 82717, "epoch": 1969} {"train_loss": -6.348443984985352, "global_step": 82718, "epoch": 1969} {"train_loss": -6.270355224609375, "global_step": 82719, "epoch": 1969} {"train_loss": -6.1089887619018555, "global_step": 82720, "epoch": 1969} {"train_loss": -6.141617774963379, "global_step": 82721, "epoch": 1969} {"train_loss": -6.180519104003906, "global_step": 82722, "epoch": 1969} {"train_loss": -6.202723979949951, "global_step": 82723, "epoch": 1969} {"train_loss": -6.219756126403809, "global_step": 82724, "epoch": 1969} {"train_loss": -6.236320495605469, "global_step": 82725, "epoch": 1969} {"train_loss": -6.228300094604492, "global_step": 82726, "epoch": 1969} {"train_loss": -6.149046897888184, "global_step": 82727, "epoch": 1969} {"train_loss": -6.218481063842773, "global_step": 82728, "epoch": 1969} {"train_loss": -6.107495307922363, "global_step": 82729, "epoch": 1969} {"train_loss": -6.354018211364746, "global_step": 82730, "epoch": 1969} {"train_loss": -6.2196044921875, "global_step": 82731, "epoch": 1969} {"train_loss": -6.131048679351807, "global_step": 82732, "epoch": 1969} {"train_loss": -6.165022373199463, "global_step": 82733, "epoch": 1969} {"train_loss": -6.171054840087891, "global_step": 82734, "epoch": 1969} {"train_loss": -6.295161247253418, "global_step": 82735, "epoch": 1969} {"train_loss": -6.187237739562988, "global_step": 82736, "epoch": 1969} {"train_loss": -6.245270252227783, "global_step": 82737, "epoch": 1969} {"train_loss": -6.08209228515625, "global_step": 82738, "epoch": 1969} {"train_loss": -6.201254992257981, "global_step": 82739, "epoch": 1969, "val_loss": 62604.046875} {"train_loss": -6.235208034515381, "global_step": 82740, "epoch": 1970} {"train_loss": -6.174747467041016, "global_step": 82741, "epoch": 1970} {"train_loss": -6.246197700500488, "global_step": 82742, "epoch": 1970} {"train_loss": -6.191323757171631, "global_step": 82743, "epoch": 1970} {"train_loss": -6.293237209320068, "global_step": 82744, "epoch": 1970} {"train_loss": -6.293385982513428, "global_step": 82745, "epoch": 1970} {"train_loss": -6.165493011474609, "global_step": 82746, "epoch": 1970} {"train_loss": -6.201990127563477, "global_step": 82747, "epoch": 1970} {"train_loss": -6.091372489929199, "global_step": 82748, "epoch": 1970} {"train_loss": -6.13134765625, "global_step": 82749, "epoch": 1970} {"train_loss": -6.220229148864746, "global_step": 82750, "epoch": 1970} {"train_loss": -6.0112104415893555, "global_step": 82751, "epoch": 1970} {"train_loss": -6.235615253448486, "global_step": 82752, "epoch": 1970} {"train_loss": -6.189693927764893, "global_step": 82753, "epoch": 1970} {"train_loss": -6.186765193939209, "global_step": 82754, "epoch": 1970} {"train_loss": -6.123058319091797, "global_step": 82755, "epoch": 1970} {"train_loss": -6.162173271179199, "global_step": 82756, "epoch": 1970} {"train_loss": -6.181778907775879, "global_step": 82757, "epoch": 1970} {"train_loss": -6.267026901245117, "global_step": 82758, "epoch": 1970} {"train_loss": -6.134026527404785, "global_step": 82759, "epoch": 1970} {"train_loss": -6.03236722946167, "global_step": 82760, "epoch": 1970} {"train_loss": -6.193397045135498, "global_step": 82761, "epoch": 1970} {"train_loss": -6.179512023925781, "global_step": 82762, "epoch": 1970} {"train_loss": -6.151409149169922, "global_step": 82763, "epoch": 1970} {"train_loss": -6.326432228088379, "global_step": 82764, "epoch": 1970} {"train_loss": -6.268057823181152, "global_step": 82765, "epoch": 1970} {"train_loss": -6.338874816894531, "global_step": 82766, "epoch": 1970} {"train_loss": -6.130234718322754, "global_step": 82767, "epoch": 1970} {"train_loss": -6.171896934509277, "global_step": 82768, "epoch": 1970} {"train_loss": -6.220850944519043, "global_step": 82769, "epoch": 1970} {"train_loss": -6.177480697631836, "global_step": 82770, "epoch": 1970} {"train_loss": -6.193572998046875, "global_step": 82771, "epoch": 1970} {"train_loss": -6.104996204376221, "global_step": 82772, "epoch": 1970} {"train_loss": -6.1419806480407715, "global_step": 82773, "epoch": 1970} {"train_loss": -6.198642730712891, "global_step": 82774, "epoch": 1970} {"train_loss": -6.197979927062988, "global_step": 82775, "epoch": 1970} {"train_loss": -6.196578025817871, "global_step": 82776, "epoch": 1970} {"train_loss": -6.137753963470459, "global_step": 82777, "epoch": 1970} {"train_loss": -6.191989898681641, "global_step": 82778, "epoch": 1970} {"train_loss": -6.07448673248291, "global_step": 82779, "epoch": 1970} {"train_loss": -6.172890663146973, "global_step": 82780, "epoch": 1970} {"train_loss": -6.183123838333857, "global_step": 82781, "epoch": 1970, "val_loss": 62435.3203125} {"train_loss": -6.2546892166137695, "global_step": 82782, "epoch": 1971} {"train_loss": -6.1787543296813965, "global_step": 82783, "epoch": 1971} {"train_loss": -6.228484153747559, "global_step": 82784, "epoch": 1971} {"train_loss": -6.205954551696777, "global_step": 82785, "epoch": 1971} {"train_loss": -6.227383136749268, "global_step": 82786, "epoch": 1971} {"train_loss": -6.19632625579834, "global_step": 82787, "epoch": 1971} {"train_loss": -6.215048789978027, "global_step": 82788, "epoch": 1971} {"train_loss": -6.039104461669922, "global_step": 82789, "epoch": 1971} {"train_loss": -6.173370361328125, "global_step": 82790, "epoch": 1971} {"train_loss": -6.102231025695801, "global_step": 82791, "epoch": 1971} {"train_loss": -6.045759201049805, "global_step": 82792, "epoch": 1971} {"train_loss": -6.2233428955078125, "global_step": 82793, "epoch": 1971} {"train_loss": -5.979920387268066, "global_step": 82794, "epoch": 1971} {"train_loss": -6.104628562927246, "global_step": 82795, "epoch": 1971} {"train_loss": -6.024290084838867, "global_step": 82796, "epoch": 1971} {"train_loss": -6.166805267333984, "global_step": 82797, "epoch": 1971} {"train_loss": -6.158385753631592, "global_step": 82798, "epoch": 1971} {"train_loss": -6.044729709625244, "global_step": 82799, "epoch": 1971} {"train_loss": -6.18355655670166, "global_step": 82800, "epoch": 1971} {"train_loss": -6.123044013977051, "global_step": 82801, "epoch": 1971} {"train_loss": -6.125970840454102, "global_step": 82802, "epoch": 1971} {"train_loss": -6.194888114929199, "global_step": 82803, "epoch": 1971} {"train_loss": -6.046603202819824, "global_step": 82804, "epoch": 1971} {"train_loss": -6.0514421463012695, "global_step": 82805, "epoch": 1971} {"train_loss": -6.0995893478393555, "global_step": 82806, "epoch": 1971} {"train_loss": -6.13460111618042, "global_step": 82807, "epoch": 1971} {"train_loss": -6.105291366577148, "global_step": 82808, "epoch": 1971} {"train_loss": -6.06543493270874, "global_step": 82809, "epoch": 1971} {"train_loss": -6.1908674240112305, "global_step": 82810, "epoch": 1971} {"train_loss": -6.108172416687012, "global_step": 82811, "epoch": 1971} {"train_loss": -6.088926315307617, "global_step": 82812, "epoch": 1971} {"train_loss": -6.12224817276001, "global_step": 82813, "epoch": 1971} {"train_loss": -6.143497943878174, "global_step": 82814, "epoch": 1971} {"train_loss": -6.285628318786621, "global_step": 82815, "epoch": 1971} {"train_loss": -6.2598876953125, "global_step": 82816, "epoch": 1971} {"train_loss": -6.291360855102539, "global_step": 82817, "epoch": 1971} {"train_loss": -6.211945056915283, "global_step": 82818, "epoch": 1971} {"train_loss": -6.139657497406006, "global_step": 82819, "epoch": 1971} {"train_loss": -6.19563627243042, "global_step": 82820, "epoch": 1971} {"train_loss": -6.256740570068359, "global_step": 82821, "epoch": 1971} {"train_loss": -6.1086273193359375, "global_step": 82822, "epoch": 1971} {"train_loss": -6.151144913264683, "global_step": 82823, "epoch": 1971, "val_loss": 62511.36328125} {"train_loss": -6.17673921585083, "global_step": 82824, "epoch": 1972} {"train_loss": -6.202109336853027, "global_step": 82825, "epoch": 1972} {"train_loss": -6.17708683013916, "global_step": 82826, "epoch": 1972} {"train_loss": -6.087763786315918, "global_step": 82827, "epoch": 1972} {"train_loss": -6.1639604568481445, "global_step": 82828, "epoch": 1972} {"train_loss": -6.177920341491699, "global_step": 82829, "epoch": 1972} {"train_loss": -6.101400852203369, "global_step": 82830, "epoch": 1972} {"train_loss": -6.121344566345215, "global_step": 82831, "epoch": 1972} {"train_loss": -6.156479835510254, "global_step": 82832, "epoch": 1972} {"train_loss": -6.144207954406738, "global_step": 82833, "epoch": 1972} {"train_loss": -6.144801139831543, "global_step": 82834, "epoch": 1972} {"train_loss": -6.178071975708008, "global_step": 82835, "epoch": 1972} {"train_loss": -6.36699104309082, "global_step": 82836, "epoch": 1972} {"train_loss": -6.292903900146484, "global_step": 82837, "epoch": 1972} {"train_loss": -6.230725288391113, "global_step": 82838, "epoch": 1972} {"train_loss": -6.204517841339111, "global_step": 82839, "epoch": 1972} {"train_loss": -6.272443771362305, "global_step": 82840, "epoch": 1972} {"train_loss": -6.181253433227539, "global_step": 82841, "epoch": 1972} {"train_loss": -6.10410213470459, "global_step": 82842, "epoch": 1972} {"train_loss": -6.137989044189453, "global_step": 82843, "epoch": 1972} {"train_loss": -6.103560924530029, "global_step": 82844, "epoch": 1972} {"train_loss": -6.208321571350098, "global_step": 82845, "epoch": 1972} {"train_loss": -6.148746967315674, "global_step": 82846, "epoch": 1972} {"train_loss": -6.153236389160156, "global_step": 82847, "epoch": 1972} {"train_loss": -6.191006183624268, "global_step": 82848, "epoch": 1972} {"train_loss": -6.164912223815918, "global_step": 82849, "epoch": 1972} {"train_loss": -6.237936973571777, "global_step": 82850, "epoch": 1972} {"train_loss": -6.058541774749756, "global_step": 82851, "epoch": 1972} {"train_loss": -6.21828556060791, "global_step": 82852, "epoch": 1972} {"train_loss": -6.148548603057861, "global_step": 82853, "epoch": 1972} {"train_loss": -6.219974517822266, "global_step": 82854, "epoch": 1972} {"train_loss": -6.131348609924316, "global_step": 82855, "epoch": 1972} {"train_loss": -6.152990341186523, "global_step": 82856, "epoch": 1972} {"train_loss": -6.217132568359375, "global_step": 82857, "epoch": 1972} {"train_loss": -6.245303630828857, "global_step": 82858, "epoch": 1972} {"train_loss": -6.295941352844238, "global_step": 82859, "epoch": 1972} {"train_loss": -6.176093101501465, "global_step": 82860, "epoch": 1972} {"train_loss": -6.302677154541016, "global_step": 82861, "epoch": 1972} {"train_loss": -6.160334587097168, "global_step": 82862, "epoch": 1972} {"train_loss": -6.238046169281006, "global_step": 82863, "epoch": 1972} {"train_loss": -6.13442325592041, "global_step": 82864, "epoch": 1972} {"train_loss": -6.180041403997512, "global_step": 82865, "epoch": 1972, "val_loss": 62596.89453125} {"train_loss": -6.160825252532959, "global_step": 82866, "epoch": 1973} {"train_loss": -6.167803764343262, "global_step": 82867, "epoch": 1973} {"train_loss": -6.266791820526123, "global_step": 82868, "epoch": 1973} {"train_loss": -6.145977020263672, "global_step": 82869, "epoch": 1973} {"train_loss": -6.2145185470581055, "global_step": 82870, "epoch": 1973} {"train_loss": -6.069768905639648, "global_step": 82871, "epoch": 1973} {"train_loss": -6.214573860168457, "global_step": 82872, "epoch": 1973} {"train_loss": -6.330191612243652, "global_step": 82873, "epoch": 1973} {"train_loss": -6.183468818664551, "global_step": 82874, "epoch": 1973} {"train_loss": -6.144418716430664, "global_step": 82875, "epoch": 1973} {"train_loss": -6.160975456237793, "global_step": 82876, "epoch": 1973} {"train_loss": -6.128091812133789, "global_step": 82877, "epoch": 1973} {"train_loss": -6.3215789794921875, "global_step": 82878, "epoch": 1973} {"train_loss": -6.118046760559082, "global_step": 82879, "epoch": 1973} {"train_loss": -6.265721797943115, "global_step": 82880, "epoch": 1973} {"train_loss": -6.233207702636719, "global_step": 82881, "epoch": 1973} {"train_loss": -6.0946807861328125, "global_step": 82882, "epoch": 1973} {"train_loss": -6.3080830574035645, "global_step": 82883, "epoch": 1973} {"train_loss": -6.181258678436279, "global_step": 82884, "epoch": 1973} {"train_loss": -6.223750114440918, "global_step": 82885, "epoch": 1973} {"train_loss": -6.13508415222168, "global_step": 82886, "epoch": 1973} {"train_loss": -6.0675249099731445, "global_step": 82887, "epoch": 1973} {"train_loss": -6.037792205810547, "global_step": 82888, "epoch": 1973} {"train_loss": -6.21504020690918, "global_step": 82889, "epoch": 1973} {"train_loss": -6.149384021759033, "global_step": 82890, "epoch": 1973} {"train_loss": -6.126819133758545, "global_step": 82891, "epoch": 1973} {"train_loss": -6.238771915435791, "global_step": 82892, "epoch": 1973} {"train_loss": -6.139298915863037, "global_step": 82893, "epoch": 1973} {"train_loss": -6.229894638061523, "global_step": 82894, "epoch": 1973} {"train_loss": -6.208479881286621, "global_step": 82895, "epoch": 1973} {"train_loss": -6.264963150024414, "global_step": 82896, "epoch": 1973} {"train_loss": -6.184144020080566, "global_step": 82897, "epoch": 1973} {"train_loss": -6.295393943786621, "global_step": 82898, "epoch": 1973} {"train_loss": -6.153841018676758, "global_step": 82899, "epoch": 1973} {"train_loss": -6.131787300109863, "global_step": 82900, "epoch": 1973} {"train_loss": -6.140395164489746, "global_step": 82901, "epoch": 1973} {"train_loss": -6.21745491027832, "global_step": 82902, "epoch": 1973} {"train_loss": -6.23089599609375, "global_step": 82903, "epoch": 1973} {"train_loss": -6.163226127624512, "global_step": 82904, "epoch": 1973} {"train_loss": -6.282427787780762, "global_step": 82905, "epoch": 1973} {"train_loss": -6.199141502380371, "global_step": 82906, "epoch": 1973} {"train_loss": -6.190893457049415, "global_step": 82907, "epoch": 1973, "val_loss": 62505.45703125} {"train_loss": -6.2216339111328125, "global_step": 82908, "epoch": 1974} {"train_loss": -6.111126899719238, "global_step": 82909, "epoch": 1974} {"train_loss": -6.180000305175781, "global_step": 82910, "epoch": 1974} {"train_loss": -6.1917524337768555, "global_step": 82911, "epoch": 1974} {"train_loss": -6.236173629760742, "global_step": 82912, "epoch": 1974} {"train_loss": -6.310375690460205, "global_step": 82913, "epoch": 1974} {"train_loss": -6.227537155151367, "global_step": 82914, "epoch": 1974} {"train_loss": -6.226232051849365, "global_step": 82915, "epoch": 1974} {"train_loss": -6.231663227081299, "global_step": 82916, "epoch": 1974} {"train_loss": -6.1945953369140625, "global_step": 82917, "epoch": 1974} {"train_loss": -6.23520565032959, "global_step": 82918, "epoch": 1974} {"train_loss": -6.169214248657227, "global_step": 82919, "epoch": 1974} {"train_loss": -6.210507392883301, "global_step": 82920, "epoch": 1974} {"train_loss": -6.236728191375732, "global_step": 82921, "epoch": 1974} {"train_loss": -6.123938083648682, "global_step": 82922, "epoch": 1974} {"train_loss": -6.034483432769775, "global_step": 82923, "epoch": 1974} {"train_loss": -6.2206220626831055, "global_step": 82924, "epoch": 1974} {"train_loss": -6.168773174285889, "global_step": 82925, "epoch": 1974} {"train_loss": -6.188325881958008, "global_step": 82926, "epoch": 1974} {"train_loss": -6.1110920906066895, "global_step": 82927, "epoch": 1974} {"train_loss": -6.149495601654053, "global_step": 82928, "epoch": 1974} {"train_loss": -6.332964897155762, "global_step": 82929, "epoch": 1974} {"train_loss": -6.186661720275879, "global_step": 82930, "epoch": 1974} {"train_loss": -6.0989580154418945, "global_step": 82931, "epoch": 1974} {"train_loss": -6.061515808105469, "global_step": 82932, "epoch": 1974} {"train_loss": -6.135242938995361, "global_step": 82933, "epoch": 1974} {"train_loss": -6.241747856140137, "global_step": 82934, "epoch": 1974} {"train_loss": -6.103025436401367, "global_step": 82935, "epoch": 1974} {"train_loss": -6.102090835571289, "global_step": 82936, "epoch": 1974} {"train_loss": -6.144096374511719, "global_step": 82937, "epoch": 1974} {"train_loss": -5.9898600578308105, "global_step": 82938, "epoch": 1974} {"train_loss": -6.19373893737793, "global_step": 82939, "epoch": 1974} {"train_loss": -6.2360639572143555, "global_step": 82940, "epoch": 1974} {"train_loss": -6.060586929321289, "global_step": 82941, "epoch": 1974} {"train_loss": -6.041317462921143, "global_step": 82942, "epoch": 1974} {"train_loss": -6.190945625305176, "global_step": 82943, "epoch": 1974} {"train_loss": -6.26015043258667, "global_step": 82944, "epoch": 1974} {"train_loss": -6.039766788482666, "global_step": 82945, "epoch": 1974} {"train_loss": -6.223755359649658, "global_step": 82946, "epoch": 1974} {"train_loss": -6.168179035186768, "global_step": 82947, "epoch": 1974} {"train_loss": -6.292318344116211, "global_step": 82948, "epoch": 1974} {"train_loss": -6.171897888183594, "global_step": 82949, "epoch": 1974, "val_loss": 62452.26953125} {"train_loss": -6.3170342445373535, "global_step": 82950, "epoch": 1975} {"train_loss": -6.268154144287109, "global_step": 82951, "epoch": 1975} {"train_loss": -6.115594863891602, "global_step": 82952, "epoch": 1975} {"train_loss": -6.224373817443848, "global_step": 82953, "epoch": 1975} {"train_loss": -6.337325096130371, "global_step": 82954, "epoch": 1975} {"train_loss": -6.1375627517700195, "global_step": 82955, "epoch": 1975} {"train_loss": -6.14375638961792, "global_step": 82956, "epoch": 1975} {"train_loss": -6.0814409255981445, "global_step": 82957, "epoch": 1975} {"train_loss": -6.227879524230957, "global_step": 82958, "epoch": 1975} {"train_loss": -6.095080852508545, "global_step": 82959, "epoch": 1975} {"train_loss": -6.163743019104004, "global_step": 82960, "epoch": 1975} {"train_loss": -6.108514785766602, "global_step": 82961, "epoch": 1975} {"train_loss": -6.153985023498535, "global_step": 82962, "epoch": 1975} {"train_loss": -6.079531669616699, "global_step": 82963, "epoch": 1975} {"train_loss": -6.185810565948486, "global_step": 82964, "epoch": 1975} {"train_loss": -6.194242477416992, "global_step": 82965, "epoch": 1975} {"train_loss": -6.156839370727539, "global_step": 82966, "epoch": 1975} {"train_loss": -6.224286079406738, "global_step": 82967, "epoch": 1975} {"train_loss": -6.092406272888184, "global_step": 82968, "epoch": 1975} {"train_loss": -6.113462924957275, "global_step": 82969, "epoch": 1975} {"train_loss": -6.1842522621154785, "global_step": 82970, "epoch": 1975} {"train_loss": -6.311326026916504, "global_step": 82971, "epoch": 1975} {"train_loss": -6.167068958282471, "global_step": 82972, "epoch": 1975} {"train_loss": -6.296089172363281, "global_step": 82973, "epoch": 1975} {"train_loss": -6.100125789642334, "global_step": 82974, "epoch": 1975} {"train_loss": -6.304010391235352, "global_step": 82975, "epoch": 1975} {"train_loss": -6.150640487670898, "global_step": 82976, "epoch": 1975} {"train_loss": -6.169504165649414, "global_step": 82977, "epoch": 1975} {"train_loss": -6.187960147857666, "global_step": 82978, "epoch": 1975} {"train_loss": -6.016587734222412, "global_step": 82979, "epoch": 1975} {"train_loss": -6.168327331542969, "global_step": 82980, "epoch": 1975} {"train_loss": -6.243946075439453, "global_step": 82981, "epoch": 1975} {"train_loss": -6.015896797180176, "global_step": 82982, "epoch": 1975} {"train_loss": -6.1403889656066895, "global_step": 82983, "epoch": 1975} {"train_loss": -6.122799396514893, "global_step": 82984, "epoch": 1975} {"train_loss": -6.164240837097168, "global_step": 82985, "epoch": 1975} {"train_loss": -6.233791351318359, "global_step": 82986, "epoch": 1975} {"train_loss": -6.324455738067627, "global_step": 82987, "epoch": 1975} {"train_loss": -6.127081394195557, "global_step": 82988, "epoch": 1975} {"train_loss": -6.243701457977295, "global_step": 82989, "epoch": 1975} {"train_loss": -6.183255195617676, "global_step": 82990, "epoch": 1975} {"train_loss": -6.1802335920788, "global_step": 82991, "epoch": 1975, "val_loss": 62562.37890625} {"train_loss": -6.214717864990234, "global_step": 82992, "epoch": 1976} {"train_loss": -6.331923961639404, "global_step": 82993, "epoch": 1976} {"train_loss": -6.330667972564697, "global_step": 82994, "epoch": 1976} {"train_loss": -6.189520835876465, "global_step": 82995, "epoch": 1976} {"train_loss": -6.244720458984375, "global_step": 82996, "epoch": 1976} {"train_loss": -6.295382499694824, "global_step": 82997, "epoch": 1976} {"train_loss": -6.094335556030273, "global_step": 82998, "epoch": 1976} {"train_loss": -6.28365421295166, "global_step": 82999, "epoch": 1976} {"train_loss": -6.263853073120117, "global_step": 83000, "epoch": 1976} {"train_loss": -6.178567409515381, "global_step": 83001, "epoch": 1976} {"train_loss": -6.1738176345825195, "global_step": 83002, "epoch": 1976} {"train_loss": -6.28460693359375, "global_step": 83003, "epoch": 1976} {"train_loss": -6.2165021896362305, "global_step": 83004, "epoch": 1976} {"train_loss": -6.169220924377441, "global_step": 83005, "epoch": 1976} {"train_loss": -6.199088096618652, "global_step": 83006, "epoch": 1976} {"train_loss": -6.048521041870117, "global_step": 83007, "epoch": 1976} {"train_loss": -6.146331787109375, "global_step": 83008, "epoch": 1976} {"train_loss": -6.2650933265686035, "global_step": 83009, "epoch": 1976} {"train_loss": -6.179904937744141, "global_step": 83010, "epoch": 1976} {"train_loss": -6.182888984680176, "global_step": 83011, "epoch": 1976} {"train_loss": -6.191723823547363, "global_step": 83012, "epoch": 1976} {"train_loss": -6.136892318725586, "global_step": 83013, "epoch": 1976} {"train_loss": -6.084336280822754, "global_step": 83014, "epoch": 1976} {"train_loss": -6.236285209655762, "global_step": 83015, "epoch": 1976} {"train_loss": -6.142462253570557, "global_step": 83016, "epoch": 1976} {"train_loss": -6.238317489624023, "global_step": 83017, "epoch": 1976} {"train_loss": -6.176290035247803, "global_step": 83018, "epoch": 1976} {"train_loss": -6.2059783935546875, "global_step": 83019, "epoch": 1976} {"train_loss": -6.125298500061035, "global_step": 83020, "epoch": 1976} {"train_loss": -6.2712578773498535, "global_step": 83021, "epoch": 1976} {"train_loss": -6.150300979614258, "global_step": 83022, "epoch": 1976} {"train_loss": -6.10923433303833, "global_step": 83023, "epoch": 1976} {"train_loss": -6.122551918029785, "global_step": 83024, "epoch": 1976} {"train_loss": -6.180842876434326, "global_step": 83025, "epoch": 1976} {"train_loss": -6.132061004638672, "global_step": 83026, "epoch": 1976} {"train_loss": -6.060958385467529, "global_step": 83027, "epoch": 1976} {"train_loss": -6.130265235900879, "global_step": 83028, "epoch": 1976} {"train_loss": -6.167726516723633, "global_step": 83029, "epoch": 1976} {"train_loss": -6.121471881866455, "global_step": 83030, "epoch": 1976} {"train_loss": -6.158317565917969, "global_step": 83031, "epoch": 1976} {"train_loss": -6.110725402832031, "global_step": 83032, "epoch": 1976} {"train_loss": -6.183730556851342, "global_step": 83033, "epoch": 1976, "val_loss": 62645.3828125} {"train_loss": -6.187229156494141, "global_step": 83034, "epoch": 1977} {"train_loss": -6.354510307312012, "global_step": 83035, "epoch": 1977} {"train_loss": -6.208001136779785, "global_step": 83036, "epoch": 1977} {"train_loss": -6.108365058898926, "global_step": 83037, "epoch": 1977} {"train_loss": -6.296196460723877, "global_step": 83038, "epoch": 1977} {"train_loss": -6.117539405822754, "global_step": 83039, "epoch": 1977} {"train_loss": -6.043212413787842, "global_step": 83040, "epoch": 1977} {"train_loss": -6.090865612030029, "global_step": 83041, "epoch": 1977} {"train_loss": -6.027338981628418, "global_step": 83042, "epoch": 1977} {"train_loss": -6.074748992919922, "global_step": 83043, "epoch": 1977} {"train_loss": -6.120110988616943, "global_step": 83044, "epoch": 1977} {"train_loss": -6.1262617111206055, "global_step": 83045, "epoch": 1977} {"train_loss": -6.1082258224487305, "global_step": 83046, "epoch": 1977} {"train_loss": -6.219535827636719, "global_step": 83047, "epoch": 1977} {"train_loss": -6.223207473754883, "global_step": 83048, "epoch": 1977} {"train_loss": -6.166543483734131, "global_step": 83049, "epoch": 1977} {"train_loss": -6.241686820983887, "global_step": 83050, "epoch": 1977} {"train_loss": -6.18892765045166, "global_step": 83051, "epoch": 1977} {"train_loss": -6.21822452545166, "global_step": 83052, "epoch": 1977} {"train_loss": -6.147375106811523, "global_step": 83053, "epoch": 1977} {"train_loss": -6.192461967468262, "global_step": 83054, "epoch": 1977} {"train_loss": -6.200500965118408, "global_step": 83055, "epoch": 1977} {"train_loss": -6.205353736877441, "global_step": 83056, "epoch": 1977} {"train_loss": -6.225307464599609, "global_step": 83057, "epoch": 1977} {"train_loss": -6.184637546539307, "global_step": 83058, "epoch": 1977} {"train_loss": -6.211142539978027, "global_step": 83059, "epoch": 1977} {"train_loss": -6.165107727050781, "global_step": 83060, "epoch": 1977} {"train_loss": -6.151313781738281, "global_step": 83061, "epoch": 1977} {"train_loss": -6.104395389556885, "global_step": 83062, "epoch": 1977} {"train_loss": -6.086264610290527, "global_step": 83063, "epoch": 1977} {"train_loss": -6.259284496307373, "global_step": 83064, "epoch": 1977} {"train_loss": -6.235840320587158, "global_step": 83065, "epoch": 1977} {"train_loss": -6.1033244132995605, "global_step": 83066, "epoch": 1977} {"train_loss": -6.160434722900391, "global_step": 83067, "epoch": 1977} {"train_loss": -6.062211513519287, "global_step": 83068, "epoch": 1977} {"train_loss": -6.234131813049316, "global_step": 83069, "epoch": 1977} {"train_loss": -6.161858081817627, "global_step": 83070, "epoch": 1977} {"train_loss": -6.167947769165039, "global_step": 83071, "epoch": 1977} {"train_loss": -6.107265472412109, "global_step": 83072, "epoch": 1977} {"train_loss": -6.002346992492676, "global_step": 83073, "epoch": 1977} {"train_loss": -6.075194358825684, "global_step": 83074, "epoch": 1977} {"train_loss": -6.155654010318575, "global_step": 83075, "epoch": 1977, "val_loss": 62492.55078125} {"train_loss": -6.2331132888793945, "global_step": 83076, "epoch": 1978} {"train_loss": -6.124905586242676, "global_step": 83077, "epoch": 1978} {"train_loss": -6.204456806182861, "global_step": 83078, "epoch": 1978} {"train_loss": -6.163124084472656, "global_step": 83079, "epoch": 1978} {"train_loss": -6.094862937927246, "global_step": 83080, "epoch": 1978} {"train_loss": -6.15882682800293, "global_step": 83081, "epoch": 1978} {"train_loss": -6.2913947105407715, "global_step": 83082, "epoch": 1978} {"train_loss": -6.128399848937988, "global_step": 83083, "epoch": 1978} {"train_loss": -6.155240058898926, "global_step": 83084, "epoch": 1978} {"train_loss": -6.268450736999512, "global_step": 83085, "epoch": 1978} {"train_loss": -6.107640743255615, "global_step": 83086, "epoch": 1978} {"train_loss": -6.131884574890137, "global_step": 83087, "epoch": 1978} {"train_loss": -6.039799690246582, "global_step": 83088, "epoch": 1978} {"train_loss": -6.006014347076416, "global_step": 83089, "epoch": 1978} {"train_loss": -6.037930488586426, "global_step": 83090, "epoch": 1978} {"train_loss": -5.981799125671387, "global_step": 83091, "epoch": 1978} {"train_loss": -5.982163429260254, "global_step": 83092, "epoch": 1978} {"train_loss": -6.042207717895508, "global_step": 83093, "epoch": 1978} {"train_loss": -6.124782562255859, "global_step": 83094, "epoch": 1978} {"train_loss": -6.123705863952637, "global_step": 83095, "epoch": 1978} {"train_loss": -6.138303756713867, "global_step": 83096, "epoch": 1978} {"train_loss": -6.14854621887207, "global_step": 83097, "epoch": 1978} {"train_loss": -6.059699058532715, "global_step": 83098, "epoch": 1978} {"train_loss": -6.068874359130859, "global_step": 83099, "epoch": 1978} {"train_loss": -6.260434627532959, "global_step": 83100, "epoch": 1978} {"train_loss": -6.0875115394592285, "global_step": 83101, "epoch": 1978} {"train_loss": -6.208899021148682, "global_step": 83102, "epoch": 1978} {"train_loss": -6.142813205718994, "global_step": 83103, "epoch": 1978} {"train_loss": -6.050492286682129, "global_step": 83104, "epoch": 1978} {"train_loss": -6.169321060180664, "global_step": 83105, "epoch": 1978} {"train_loss": -5.962672233581543, "global_step": 83106, "epoch": 1978} {"train_loss": -6.058293342590332, "global_step": 83107, "epoch": 1978} {"train_loss": -6.046058654785156, "global_step": 83108, "epoch": 1978} {"train_loss": -6.218987941741943, "global_step": 83109, "epoch": 1978} {"train_loss": -6.098178386688232, "global_step": 83110, "epoch": 1978} {"train_loss": -6.128430366516113, "global_step": 83111, "epoch": 1978} {"train_loss": -6.156937599182129, "global_step": 83112, "epoch": 1978} {"train_loss": -6.212605953216553, "global_step": 83113, "epoch": 1978} {"train_loss": -6.126028060913086, "global_step": 83114, "epoch": 1978} {"train_loss": -6.168395519256592, "global_step": 83115, "epoch": 1978} {"train_loss": -6.171531677246094, "global_step": 83116, "epoch": 1978} {"train_loss": -6.123713118689401, "global_step": 83117, "epoch": 1978, "val_loss": 62564.57421875} {"train_loss": -6.169317722320557, "global_step": 83118, "epoch": 1979} {"train_loss": -6.248186111450195, "global_step": 83119, "epoch": 1979} {"train_loss": -6.240682601928711, "global_step": 83120, "epoch": 1979} {"train_loss": -6.232074737548828, "global_step": 83121, "epoch": 1979} {"train_loss": -6.113354682922363, "global_step": 83122, "epoch": 1979} {"train_loss": -6.101327896118164, "global_step": 83123, "epoch": 1979} {"train_loss": -6.174948692321777, "global_step": 83124, "epoch": 1979} {"train_loss": -6.106162071228027, "global_step": 83125, "epoch": 1979} {"train_loss": -6.1860504150390625, "global_step": 83126, "epoch": 1979} {"train_loss": -6.129131317138672, "global_step": 83127, "epoch": 1979} {"train_loss": -6.101596355438232, "global_step": 83128, "epoch": 1979} {"train_loss": -6.101824760437012, "global_step": 83129, "epoch": 1979} {"train_loss": -6.202274322509766, "global_step": 83130, "epoch": 1979} {"train_loss": -6.154160499572754, "global_step": 83131, "epoch": 1979} {"train_loss": -6.187045574188232, "global_step": 83132, "epoch": 1979} {"train_loss": -6.166477680206299, "global_step": 83133, "epoch": 1979} {"train_loss": -6.159791946411133, "global_step": 83134, "epoch": 1979} {"train_loss": -6.242677688598633, "global_step": 83135, "epoch": 1979} {"train_loss": -6.223865509033203, "global_step": 83136, "epoch": 1979} {"train_loss": -6.166579723358154, "global_step": 83137, "epoch": 1979} {"train_loss": -6.270323753356934, "global_step": 83138, "epoch": 1979} {"train_loss": -6.267080783843994, "global_step": 83139, "epoch": 1979} {"train_loss": -6.199593544006348, "global_step": 83140, "epoch": 1979} {"train_loss": -6.192637920379639, "global_step": 83141, "epoch": 1979} {"train_loss": -6.12681770324707, "global_step": 83142, "epoch": 1979} {"train_loss": -6.150976181030273, "global_step": 83143, "epoch": 1979} {"train_loss": -6.170563697814941, "global_step": 83144, "epoch": 1979} {"train_loss": -6.16786003112793, "global_step": 83145, "epoch": 1979} {"train_loss": -6.188148021697998, "global_step": 83146, "epoch": 1979} {"train_loss": -6.191437721252441, "global_step": 83147, "epoch": 1979} {"train_loss": -6.208772659301758, "global_step": 83148, "epoch": 1979} {"train_loss": -6.204953193664551, "global_step": 83149, "epoch": 1979} {"train_loss": -6.060556411743164, "global_step": 83150, "epoch": 1979} {"train_loss": -6.229516983032227, "global_step": 83151, "epoch": 1979} {"train_loss": -6.036606788635254, "global_step": 83152, "epoch": 1979} {"train_loss": -6.173495292663574, "global_step": 83153, "epoch": 1979} {"train_loss": -6.177994728088379, "global_step": 83154, "epoch": 1979} {"train_loss": -6.0549468994140625, "global_step": 83155, "epoch": 1979} {"train_loss": -6.084134101867676, "global_step": 83156, "epoch": 1979} {"train_loss": -6.028992176055908, "global_step": 83157, "epoch": 1979} {"train_loss": -5.961860179901123, "global_step": 83158, "epoch": 1979} {"train_loss": -6.160081500098819, "global_step": 83159, "epoch": 1979, "val_loss": 62507.4921875} {"train_loss": -6.139556884765625, "global_step": 83160, "epoch": 1980} {"train_loss": -6.088879108428955, "global_step": 83161, "epoch": 1980} {"train_loss": -6.084802627563477, "global_step": 83162, "epoch": 1980} {"train_loss": -6.195945739746094, "global_step": 83163, "epoch": 1980} {"train_loss": -6.148650646209717, "global_step": 83164, "epoch": 1980} {"train_loss": -6.23885440826416, "global_step": 83165, "epoch": 1980} {"train_loss": -6.126695156097412, "global_step": 83166, "epoch": 1980} {"train_loss": -6.178919792175293, "global_step": 83167, "epoch": 1980} {"train_loss": -6.137660980224609, "global_step": 83168, "epoch": 1980} {"train_loss": -6.166604518890381, "global_step": 83169, "epoch": 1980} {"train_loss": -6.195392608642578, "global_step": 83170, "epoch": 1980} {"train_loss": -6.065852642059326, "global_step": 83171, "epoch": 1980} {"train_loss": -6.191819667816162, "global_step": 83172, "epoch": 1980} {"train_loss": -6.2486162185668945, "global_step": 83173, "epoch": 1980} {"train_loss": -6.280690670013428, "global_step": 83174, "epoch": 1980} {"train_loss": -6.093892574310303, "global_step": 83175, "epoch": 1980} {"train_loss": -6.109493732452393, "global_step": 83176, "epoch": 1980} {"train_loss": -6.1741485595703125, "global_step": 83177, "epoch": 1980} {"train_loss": -6.150076389312744, "global_step": 83178, "epoch": 1980} {"train_loss": -6.09015417098999, "global_step": 83179, "epoch": 1980} {"train_loss": -6.234572410583496, "global_step": 83180, "epoch": 1980} {"train_loss": -6.161890029907227, "global_step": 83181, "epoch": 1980} {"train_loss": -6.2348103523254395, "global_step": 83182, "epoch": 1980} {"train_loss": -6.127790451049805, "global_step": 83183, "epoch": 1980} {"train_loss": -6.154293060302734, "global_step": 83184, "epoch": 1980} {"train_loss": -6.172139644622803, "global_step": 83185, "epoch": 1980} {"train_loss": -6.108793258666992, "global_step": 83186, "epoch": 1980} {"train_loss": -6.203996181488037, "global_step": 83187, "epoch": 1980} {"train_loss": -6.388261795043945, "global_step": 83188, "epoch": 1980} {"train_loss": -6.224126815795898, "global_step": 83189, "epoch": 1980} {"train_loss": -6.232723712921143, "global_step": 83190, "epoch": 1980} {"train_loss": -6.2696661949157715, "global_step": 83191, "epoch": 1980} {"train_loss": -6.307470321655273, "global_step": 83192, "epoch": 1980} {"train_loss": -6.216011047363281, "global_step": 83193, "epoch": 1980} {"train_loss": -6.313873291015625, "global_step": 83194, "epoch": 1980} {"train_loss": -6.152688026428223, "global_step": 83195, "epoch": 1980} {"train_loss": -6.223074913024902, "global_step": 83196, "epoch": 1980} {"train_loss": -6.139049053192139, "global_step": 83197, "epoch": 1980} {"train_loss": -6.150504112243652, "global_step": 83198, "epoch": 1980} {"train_loss": -6.158400535583496, "global_step": 83199, "epoch": 1980} {"train_loss": -6.271073341369629, "global_step": 83200, "epoch": 1980} {"train_loss": -6.185276882989066, "global_step": 83201, "epoch": 1980, "val_loss": 62657.9921875} {"train_loss": -6.161832809448242, "global_step": 83202, "epoch": 1981} {"train_loss": -6.2170090675354, "global_step": 83203, "epoch": 1981} {"train_loss": -6.279390335083008, "global_step": 83204, "epoch": 1981} {"train_loss": -6.224267959594727, "global_step": 83205, "epoch": 1981} {"train_loss": -6.166996002197266, "global_step": 83206, "epoch": 1981} {"train_loss": -6.214862823486328, "global_step": 83207, "epoch": 1981} {"train_loss": -6.251824378967285, "global_step": 83208, "epoch": 1981} {"train_loss": -6.1171698570251465, "global_step": 83209, "epoch": 1981} {"train_loss": -6.107122898101807, "global_step": 83210, "epoch": 1981} {"train_loss": -6.236804962158203, "global_step": 83211, "epoch": 1981} {"train_loss": -6.248775482177734, "global_step": 83212, "epoch": 1981} {"train_loss": -6.1164164543151855, "global_step": 83213, "epoch": 1981} {"train_loss": -6.226203441619873, "global_step": 83214, "epoch": 1981} {"train_loss": -6.2463531494140625, "global_step": 83215, "epoch": 1981} {"train_loss": -6.184581756591797, "global_step": 83216, "epoch": 1981} {"train_loss": -6.326102256774902, "global_step": 83217, "epoch": 1981} {"train_loss": -6.075457572937012, "global_step": 83218, "epoch": 1981} {"train_loss": -6.1090312004089355, "global_step": 83219, "epoch": 1981} {"train_loss": -6.259671688079834, "global_step": 83220, "epoch": 1981} {"train_loss": -6.288980484008789, "global_step": 83221, "epoch": 1981} {"train_loss": -6.2156982421875, "global_step": 83222, "epoch": 1981} {"train_loss": -6.15408992767334, "global_step": 83223, "epoch": 1981} {"train_loss": -6.314268112182617, "global_step": 83224, "epoch": 1981} {"train_loss": -6.063013076782227, "global_step": 83225, "epoch": 1981} {"train_loss": -6.143272399902344, "global_step": 83226, "epoch": 1981} {"train_loss": -6.155145645141602, "global_step": 83227, "epoch": 1981} {"train_loss": -6.1517534255981445, "global_step": 83228, "epoch": 1981} {"train_loss": -6.225383758544922, "global_step": 83229, "epoch": 1981} {"train_loss": -6.264303684234619, "global_step": 83230, "epoch": 1981} {"train_loss": -6.078624248504639, "global_step": 83231, "epoch": 1981} {"train_loss": -6.136913776397705, "global_step": 83232, "epoch": 1981} {"train_loss": -6.3188700675964355, "global_step": 83233, "epoch": 1981} {"train_loss": -6.191832065582275, "global_step": 83234, "epoch": 1981} {"train_loss": -6.17501163482666, "global_step": 83235, "epoch": 1981} {"train_loss": -6.251806259155273, "global_step": 83236, "epoch": 1981} {"train_loss": -6.258439540863037, "global_step": 83237, "epoch": 1981} {"train_loss": -6.239171981811523, "global_step": 83238, "epoch": 1981} {"train_loss": -6.191816329956055, "global_step": 83239, "epoch": 1981} {"train_loss": -6.186855316162109, "global_step": 83240, "epoch": 1981} {"train_loss": -6.144990921020508, "global_step": 83241, "epoch": 1981} {"train_loss": -6.1186676025390625, "global_step": 83242, "epoch": 1981} {"train_loss": -6.197508721124558, "global_step": 83243, "epoch": 1981, "val_loss": 62344.32421875} {"train_loss": -6.23633337020874, "global_step": 83244, "epoch": 1982} {"train_loss": -6.215683937072754, "global_step": 83245, "epoch": 1982} {"train_loss": -6.019286155700684, "global_step": 83246, "epoch": 1982} {"train_loss": -6.237102508544922, "global_step": 83247, "epoch": 1982} {"train_loss": -6.10244083404541, "global_step": 83248, "epoch": 1982} {"train_loss": -6.1944990158081055, "global_step": 83249, "epoch": 1982} {"train_loss": -6.168615341186523, "global_step": 83250, "epoch": 1982} {"train_loss": -6.241391181945801, "global_step": 83251, "epoch": 1982} {"train_loss": -6.190090656280518, "global_step": 83252, "epoch": 1982} {"train_loss": -6.207598686218262, "global_step": 83253, "epoch": 1982} {"train_loss": -6.290292739868164, "global_step": 83254, "epoch": 1982} {"train_loss": -6.157845497131348, "global_step": 83255, "epoch": 1982} {"train_loss": -6.2458014488220215, "global_step": 83256, "epoch": 1982} {"train_loss": -6.131203651428223, "global_step": 83257, "epoch": 1982} {"train_loss": -6.251181602478027, "global_step": 83258, "epoch": 1982} {"train_loss": -6.167502403259277, "global_step": 83259, "epoch": 1982} {"train_loss": -6.369139671325684, "global_step": 83260, "epoch": 1982} {"train_loss": -6.120946884155273, "global_step": 83261, "epoch": 1982} {"train_loss": -6.099417686462402, "global_step": 83262, "epoch": 1982} {"train_loss": -6.284427642822266, "global_step": 83263, "epoch": 1982} {"train_loss": -6.090104103088379, "global_step": 83264, "epoch": 1982} {"train_loss": -6.090919494628906, "global_step": 83265, "epoch": 1982} {"train_loss": -6.257062911987305, "global_step": 83266, "epoch": 1982} {"train_loss": -6.272846698760986, "global_step": 83267, "epoch": 1982} {"train_loss": -6.306329727172852, "global_step": 83268, "epoch": 1982} {"train_loss": -6.17167329788208, "global_step": 83269, "epoch": 1982} {"train_loss": -6.135941982269287, "global_step": 83270, "epoch": 1982} {"train_loss": -6.202788352966309, "global_step": 83271, "epoch": 1982} {"train_loss": -6.22882080078125, "global_step": 83272, "epoch": 1982} {"train_loss": -6.04801607131958, "global_step": 83273, "epoch": 1982} {"train_loss": -6.21541690826416, "global_step": 83274, "epoch": 1982} {"train_loss": -6.156834602355957, "global_step": 83275, "epoch": 1982} {"train_loss": -6.2090044021606445, "global_step": 83276, "epoch": 1982} {"train_loss": -6.161827087402344, "global_step": 83277, "epoch": 1982} {"train_loss": -6.142443656921387, "global_step": 83278, "epoch": 1982} {"train_loss": -6.048967361450195, "global_step": 83279, "epoch": 1982} {"train_loss": -6.280359268188477, "global_step": 83280, "epoch": 1982} {"train_loss": -6.183690071105957, "global_step": 83281, "epoch": 1982} {"train_loss": -6.137716770172119, "global_step": 83282, "epoch": 1982} {"train_loss": -6.181385040283203, "global_step": 83283, "epoch": 1982} {"train_loss": -6.162226676940918, "global_step": 83284, "epoch": 1982} {"train_loss": -6.187049604597545, "global_step": 83285, "epoch": 1982, "val_loss": 62617.2265625} {"train_loss": -6.201569557189941, "global_step": 83286, "epoch": 1983} {"train_loss": -6.259180068969727, "global_step": 83287, "epoch": 1983} {"train_loss": -6.178206443786621, "global_step": 83288, "epoch": 1983} {"train_loss": -6.092082500457764, "global_step": 83289, "epoch": 1983} {"train_loss": -6.117544174194336, "global_step": 83290, "epoch": 1983} {"train_loss": -6.211609840393066, "global_step": 83291, "epoch": 1983} {"train_loss": -6.18544864654541, "global_step": 83292, "epoch": 1983} {"train_loss": -6.121351718902588, "global_step": 83293, "epoch": 1983} {"train_loss": -6.31418514251709, "global_step": 83294, "epoch": 1983} {"train_loss": -6.190296173095703, "global_step": 83295, "epoch": 1983} {"train_loss": -6.087735176086426, "global_step": 83296, "epoch": 1983} {"train_loss": -6.154317855834961, "global_step": 83297, "epoch": 1983} {"train_loss": -6.1190996170043945, "global_step": 83298, "epoch": 1983} {"train_loss": -6.1600341796875, "global_step": 83299, "epoch": 1983} {"train_loss": -6.32264518737793, "global_step": 83300, "epoch": 1983} {"train_loss": -6.112895965576172, "global_step": 83301, "epoch": 1983} {"train_loss": -6.103607654571533, "global_step": 83302, "epoch": 1983} {"train_loss": -6.197475433349609, "global_step": 83303, "epoch": 1983} {"train_loss": -6.235457420349121, "global_step": 83304, "epoch": 1983} {"train_loss": -5.998162269592285, "global_step": 83305, "epoch": 1983} {"train_loss": -6.12211799621582, "global_step": 83306, "epoch": 1983} {"train_loss": -6.095110893249512, "global_step": 83307, "epoch": 1983} {"train_loss": -6.0782790184021, "global_step": 83308, "epoch": 1983} {"train_loss": -6.18585205078125, "global_step": 83309, "epoch": 1983} {"train_loss": -6.196577072143555, "global_step": 83310, "epoch": 1983} {"train_loss": -6.19467830657959, "global_step": 83311, "epoch": 1983} {"train_loss": -6.125659465789795, "global_step": 83312, "epoch": 1983} {"train_loss": -6.13526725769043, "global_step": 83313, "epoch": 1983} {"train_loss": -6.154726028442383, "global_step": 83314, "epoch": 1983} {"train_loss": -6.125011920928955, "global_step": 83315, "epoch": 1983} {"train_loss": -6.112871170043945, "global_step": 83316, "epoch": 1983} {"train_loss": -6.169872283935547, "global_step": 83317, "epoch": 1983} {"train_loss": -6.277637004852295, "global_step": 83318, "epoch": 1983} {"train_loss": -6.243298053741455, "global_step": 83319, "epoch": 1983} {"train_loss": -6.314840316772461, "global_step": 83320, "epoch": 1983} {"train_loss": -6.147582530975342, "global_step": 83321, "epoch": 1983} {"train_loss": -6.12005615234375, "global_step": 83322, "epoch": 1983} {"train_loss": -6.184270858764648, "global_step": 83323, "epoch": 1983} {"train_loss": -6.237061500549316, "global_step": 83324, "epoch": 1983} {"train_loss": -6.208055019378662, "global_step": 83325, "epoch": 1983} {"train_loss": -6.173643589019775, "global_step": 83326, "epoch": 1983} {"train_loss": -6.172464779445103, "global_step": 83327, "epoch": 1983, "val_loss": 62735.48046875} {"train_loss": -6.223469257354736, "global_step": 83328, "epoch": 1984} {"train_loss": -6.152388572692871, "global_step": 83329, "epoch": 1984} {"train_loss": -6.215157985687256, "global_step": 83330, "epoch": 1984} {"train_loss": -6.1454315185546875, "global_step": 83331, "epoch": 1984} {"train_loss": -6.1595258712768555, "global_step": 83332, "epoch": 1984} {"train_loss": -6.151961326599121, "global_step": 83333, "epoch": 1984} {"train_loss": -6.333625316619873, "global_step": 83334, "epoch": 1984} {"train_loss": -6.103045463562012, "global_step": 83335, "epoch": 1984} {"train_loss": -6.147726058959961, "global_step": 83336, "epoch": 1984} {"train_loss": -6.187261581420898, "global_step": 83337, "epoch": 1984} {"train_loss": -6.191181182861328, "global_step": 83338, "epoch": 1984} {"train_loss": -6.214430332183838, "global_step": 83339, "epoch": 1984} {"train_loss": -6.113539695739746, "global_step": 83340, "epoch": 1984} {"train_loss": -6.266140937805176, "global_step": 83341, "epoch": 1984} {"train_loss": -6.185549736022949, "global_step": 83342, "epoch": 1984} {"train_loss": -6.203655242919922, "global_step": 83343, "epoch": 1984} {"train_loss": -6.162914276123047, "global_step": 83344, "epoch": 1984} {"train_loss": -6.181808948516846, "global_step": 83345, "epoch": 1984} {"train_loss": -6.099193096160889, "global_step": 83346, "epoch": 1984} {"train_loss": -6.160117149353027, "global_step": 83347, "epoch": 1984} {"train_loss": -6.200187683105469, "global_step": 83348, "epoch": 1984} {"train_loss": -6.170532703399658, "global_step": 83349, "epoch": 1984} {"train_loss": -6.271880149841309, "global_step": 83350, "epoch": 1984} {"train_loss": -6.1496405601501465, "global_step": 83351, "epoch": 1984} {"train_loss": -6.173921585083008, "global_step": 83352, "epoch": 1984} {"train_loss": -6.208159446716309, "global_step": 83353, "epoch": 1984} {"train_loss": -6.255824565887451, "global_step": 83354, "epoch": 1984} {"train_loss": -6.266476154327393, "global_step": 83355, "epoch": 1984} {"train_loss": -6.21180534362793, "global_step": 83356, "epoch": 1984} {"train_loss": -6.211618423461914, "global_step": 83357, "epoch": 1984} {"train_loss": -6.31080961227417, "global_step": 83358, "epoch": 1984} {"train_loss": -6.188647270202637, "global_step": 83359, "epoch": 1984} {"train_loss": -6.239561080932617, "global_step": 83360, "epoch": 1984} {"train_loss": -6.2136335372924805, "global_step": 83361, "epoch": 1984} {"train_loss": -6.202910423278809, "global_step": 83362, "epoch": 1984} {"train_loss": -6.205438613891602, "global_step": 83363, "epoch": 1984} {"train_loss": -6.152358055114746, "global_step": 83364, "epoch": 1984} {"train_loss": -6.201784133911133, "global_step": 83365, "epoch": 1984} {"train_loss": -6.2718329429626465, "global_step": 83366, "epoch": 1984} {"train_loss": -6.145711898803711, "global_step": 83367, "epoch": 1984} {"train_loss": -6.22712516784668, "global_step": 83368, "epoch": 1984} {"train_loss": -6.196260100319272, "global_step": 83369, "epoch": 1984, "val_loss": 62700.54296875} {"train_loss": -6.2186174392700195, "global_step": 83370, "epoch": 1985} {"train_loss": -6.154488563537598, "global_step": 83371, "epoch": 1985} {"train_loss": -6.237678527832031, "global_step": 83372, "epoch": 1985} {"train_loss": -6.151730537414551, "global_step": 83373, "epoch": 1985} {"train_loss": -6.22012996673584, "global_step": 83374, "epoch": 1985} {"train_loss": -6.080848693847656, "global_step": 83375, "epoch": 1985} {"train_loss": -6.163051128387451, "global_step": 83376, "epoch": 1985} {"train_loss": -6.168523788452148, "global_step": 83377, "epoch": 1985} {"train_loss": -6.14321231842041, "global_step": 83378, "epoch": 1985} {"train_loss": -6.230798721313477, "global_step": 83379, "epoch": 1985} {"train_loss": -6.223678112030029, "global_step": 83380, "epoch": 1985} {"train_loss": -6.188342094421387, "global_step": 83381, "epoch": 1985} {"train_loss": -6.074713230133057, "global_step": 83382, "epoch": 1985} {"train_loss": -6.169474124908447, "global_step": 83383, "epoch": 1985} {"train_loss": -6.098008155822754, "global_step": 83384, "epoch": 1985} {"train_loss": -6.053790092468262, "global_step": 83385, "epoch": 1985} {"train_loss": -6.146322250366211, "global_step": 83386, "epoch": 1985} {"train_loss": -5.967597961425781, "global_step": 83387, "epoch": 1985} {"train_loss": -6.212241172790527, "global_step": 83388, "epoch": 1985} {"train_loss": -6.1016082763671875, "global_step": 83389, "epoch": 1985} {"train_loss": -6.007037162780762, "global_step": 83390, "epoch": 1985} {"train_loss": -6.0862603187561035, "global_step": 83391, "epoch": 1985} {"train_loss": -6.1167192459106445, "global_step": 83392, "epoch": 1985} {"train_loss": -6.155783653259277, "global_step": 83393, "epoch": 1985} {"train_loss": -6.0836663246154785, "global_step": 83394, "epoch": 1985} {"train_loss": -6.214048385620117, "global_step": 83395, "epoch": 1985} {"train_loss": -6.203486919403076, "global_step": 83396, "epoch": 1985} {"train_loss": -6.140923500061035, "global_step": 83397, "epoch": 1985} {"train_loss": -6.432193279266357, "global_step": 83398, "epoch": 1985} {"train_loss": -6.193306922912598, "global_step": 83399, "epoch": 1985} {"train_loss": -6.143861770629883, "global_step": 83400, "epoch": 1985} {"train_loss": -6.1191086769104, "global_step": 83401, "epoch": 1985} {"train_loss": -6.143106937408447, "global_step": 83402, "epoch": 1985} {"train_loss": -6.309385299682617, "global_step": 83403, "epoch": 1985} {"train_loss": -6.2350616455078125, "global_step": 83404, "epoch": 1985} {"train_loss": -6.122696876525879, "global_step": 83405, "epoch": 1985} {"train_loss": -6.134316921234131, "global_step": 83406, "epoch": 1985} {"train_loss": -6.295358657836914, "global_step": 83407, "epoch": 1985} {"train_loss": -6.159217834472656, "global_step": 83408, "epoch": 1985} {"train_loss": -6.177052021026611, "global_step": 83409, "epoch": 1985} {"train_loss": -6.1991868019104, "global_step": 83410, "epoch": 1985} {"train_loss": -6.1594295388176326, "global_step": 83411, "epoch": 1985, "val_loss": 62453.8046875} {"train_loss": -6.195188522338867, "global_step": 83412, "epoch": 1986} {"train_loss": -6.1808929443359375, "global_step": 83413, "epoch": 1986} {"train_loss": -6.237370491027832, "global_step": 83414, "epoch": 1986} {"train_loss": -6.141773223876953, "global_step": 83415, "epoch": 1986} {"train_loss": -6.113434791564941, "global_step": 83416, "epoch": 1986} {"train_loss": -6.199168682098389, "global_step": 83417, "epoch": 1986} {"train_loss": -6.050046443939209, "global_step": 83418, "epoch": 1986} {"train_loss": -6.14967155456543, "global_step": 83419, "epoch": 1986} {"train_loss": -6.2287445068359375, "global_step": 83420, "epoch": 1986} {"train_loss": -6.234139919281006, "global_step": 83421, "epoch": 1986} {"train_loss": -6.12348747253418, "global_step": 83422, "epoch": 1986} {"train_loss": -6.274897575378418, "global_step": 83423, "epoch": 1986} {"train_loss": -6.16189432144165, "global_step": 83424, "epoch": 1986} {"train_loss": -6.228160858154297, "global_step": 83425, "epoch": 1986} {"train_loss": -6.214029312133789, "global_step": 83426, "epoch": 1986} {"train_loss": -6.239727973937988, "global_step": 83427, "epoch": 1986} {"train_loss": -6.18118953704834, "global_step": 83428, "epoch": 1986} {"train_loss": -6.168375015258789, "global_step": 83429, "epoch": 1986} {"train_loss": -6.11077880859375, "global_step": 83430, "epoch": 1986} {"train_loss": -6.080973148345947, "global_step": 83431, "epoch": 1986} {"train_loss": -6.218160629272461, "global_step": 83432, "epoch": 1986} {"train_loss": -6.171741485595703, "global_step": 83433, "epoch": 1986} {"train_loss": -6.181524276733398, "global_step": 83434, "epoch": 1986} {"train_loss": -6.275777816772461, "global_step": 83435, "epoch": 1986} {"train_loss": -6.281280994415283, "global_step": 83436, "epoch": 1986} {"train_loss": -6.252507209777832, "global_step": 83437, "epoch": 1986} {"train_loss": -6.178617000579834, "global_step": 83438, "epoch": 1986} {"train_loss": -6.189763069152832, "global_step": 83439, "epoch": 1986} {"train_loss": -6.148214817047119, "global_step": 83440, "epoch": 1986} {"train_loss": -6.266772270202637, "global_step": 83441, "epoch": 1986} {"train_loss": -6.206384181976318, "global_step": 83442, "epoch": 1986} {"train_loss": -6.159682273864746, "global_step": 83443, "epoch": 1986} {"train_loss": -6.202919006347656, "global_step": 83444, "epoch": 1986} {"train_loss": -6.159814834594727, "global_step": 83445, "epoch": 1986} {"train_loss": -6.2375946044921875, "global_step": 83446, "epoch": 1986} {"train_loss": -6.244904041290283, "global_step": 83447, "epoch": 1986} {"train_loss": -6.192034721374512, "global_step": 83448, "epoch": 1986} {"train_loss": -6.197086334228516, "global_step": 83449, "epoch": 1986} {"train_loss": -6.126193523406982, "global_step": 83450, "epoch": 1986} {"train_loss": -6.124192237854004, "global_step": 83451, "epoch": 1986} {"train_loss": -6.113641262054443, "global_step": 83452, "epoch": 1986} {"train_loss": -6.1853878157479425, "global_step": 83453, "epoch": 1986, "val_loss": 62459.99609375} {"train_loss": -6.212098121643066, "global_step": 83454, "epoch": 1987} {"train_loss": -6.135003566741943, "global_step": 83455, "epoch": 1987} {"train_loss": -6.158764362335205, "global_step": 83456, "epoch": 1987} {"train_loss": -6.182396411895752, "global_step": 83457, "epoch": 1987} {"train_loss": -6.071218490600586, "global_step": 83458, "epoch": 1987} {"train_loss": -6.176724433898926, "global_step": 83459, "epoch": 1987} {"train_loss": -6.120894432067871, "global_step": 83460, "epoch": 1987} {"train_loss": -6.189922332763672, "global_step": 83461, "epoch": 1987} {"train_loss": -6.1727824211120605, "global_step": 83462, "epoch": 1987} {"train_loss": -6.210190296173096, "global_step": 83463, "epoch": 1987} {"train_loss": -6.0854363441467285, "global_step": 83464, "epoch": 1987} {"train_loss": -6.258303642272949, "global_step": 83465, "epoch": 1987} {"train_loss": -6.3030476570129395, "global_step": 83466, "epoch": 1987} {"train_loss": -6.078072547912598, "global_step": 83467, "epoch": 1987} {"train_loss": -6.180974960327148, "global_step": 83468, "epoch": 1987} {"train_loss": -6.136487007141113, "global_step": 83469, "epoch": 1987} {"train_loss": -6.206732273101807, "global_step": 83470, "epoch": 1987} {"train_loss": -6.189986705780029, "global_step": 83471, "epoch": 1987} {"train_loss": -6.251432418823242, "global_step": 83472, "epoch": 1987} {"train_loss": -6.170429706573486, "global_step": 83473, "epoch": 1987} {"train_loss": -6.281355857849121, "global_step": 83474, "epoch": 1987} {"train_loss": -6.296511650085449, "global_step": 83475, "epoch": 1987} {"train_loss": -6.240200519561768, "global_step": 83476, "epoch": 1987} {"train_loss": -6.243777751922607, "global_step": 83477, "epoch": 1987} {"train_loss": -6.175925254821777, "global_step": 83478, "epoch": 1987} {"train_loss": -6.245818138122559, "global_step": 83479, "epoch": 1987} {"train_loss": -6.278140544891357, "global_step": 83480, "epoch": 1987} {"train_loss": -6.024872303009033, "global_step": 83481, "epoch": 1987} {"train_loss": -6.138503074645996, "global_step": 83482, "epoch": 1987} {"train_loss": -6.347023010253906, "global_step": 83483, "epoch": 1987} {"train_loss": -6.19407844543457, "global_step": 83484, "epoch": 1987} {"train_loss": -6.178635597229004, "global_step": 83485, "epoch": 1987} {"train_loss": -6.334066390991211, "global_step": 83486, "epoch": 1987} {"train_loss": -6.227688789367676, "global_step": 83487, "epoch": 1987} {"train_loss": -6.20869255065918, "global_step": 83488, "epoch": 1987} {"train_loss": -6.105010986328125, "global_step": 83489, "epoch": 1987} {"train_loss": -6.266917705535889, "global_step": 83490, "epoch": 1987} {"train_loss": -6.171326160430908, "global_step": 83491, "epoch": 1987} {"train_loss": -6.069159984588623, "global_step": 83492, "epoch": 1987} {"train_loss": -6.249650955200195, "global_step": 83493, "epoch": 1987} {"train_loss": -6.141271591186523, "global_step": 83494, "epoch": 1987} {"train_loss": -6.192141158240182, "global_step": 83495, "epoch": 1987, "val_loss": 62593.99609375} {"train_loss": -6.205052852630615, "global_step": 83496, "epoch": 1988} {"train_loss": -6.245365619659424, "global_step": 83497, "epoch": 1988} {"train_loss": -6.170665740966797, "global_step": 83498, "epoch": 1988} {"train_loss": -6.240353107452393, "global_step": 83499, "epoch": 1988} {"train_loss": -6.1001787185668945, "global_step": 83500, "epoch": 1988} {"train_loss": -6.253481864929199, "global_step": 83501, "epoch": 1988} {"train_loss": -6.128857135772705, "global_step": 83502, "epoch": 1988} {"train_loss": -6.144713878631592, "global_step": 83503, "epoch": 1988} {"train_loss": -6.180264472961426, "global_step": 83504, "epoch": 1988} {"train_loss": -6.092215538024902, "global_step": 83505, "epoch": 1988} {"train_loss": -6.174962043762207, "global_step": 83506, "epoch": 1988} {"train_loss": -6.143238544464111, "global_step": 83507, "epoch": 1988} {"train_loss": -6.131308555603027, "global_step": 83508, "epoch": 1988} {"train_loss": -6.184977054595947, "global_step": 83509, "epoch": 1988} {"train_loss": -6.062659740447998, "global_step": 83510, "epoch": 1988} {"train_loss": -6.096170425415039, "global_step": 83511, "epoch": 1988} {"train_loss": -6.154205322265625, "global_step": 83512, "epoch": 1988} {"train_loss": -6.208826541900635, "global_step": 83513, "epoch": 1988} {"train_loss": -6.132974147796631, "global_step": 83514, "epoch": 1988} {"train_loss": -6.164438247680664, "global_step": 83515, "epoch": 1988} {"train_loss": -6.00761604309082, "global_step": 83516, "epoch": 1988} {"train_loss": -6.290925025939941, "global_step": 83517, "epoch": 1988} {"train_loss": -6.067950248718262, "global_step": 83518, "epoch": 1988} {"train_loss": -6.25181245803833, "global_step": 83519, "epoch": 1988} {"train_loss": -6.081164360046387, "global_step": 83520, "epoch": 1988} {"train_loss": -6.065330505371094, "global_step": 83521, "epoch": 1988} {"train_loss": -6.115284442901611, "global_step": 83522, "epoch": 1988} {"train_loss": -6.126132011413574, "global_step": 83523, "epoch": 1988} {"train_loss": -6.124011039733887, "global_step": 83524, "epoch": 1988} {"train_loss": -6.083675384521484, "global_step": 83525, "epoch": 1988} {"train_loss": -6.285976886749268, "global_step": 83526, "epoch": 1988} {"train_loss": -6.1575026512146, "global_step": 83527, "epoch": 1988} {"train_loss": -6.17642879486084, "global_step": 83528, "epoch": 1988} {"train_loss": -6.150927543640137, "global_step": 83529, "epoch": 1988} {"train_loss": -6.331218242645264, "global_step": 83530, "epoch": 1988} {"train_loss": -6.259535312652588, "global_step": 83531, "epoch": 1988} {"train_loss": -6.259237766265869, "global_step": 83532, "epoch": 1988} {"train_loss": -6.24181604385376, "global_step": 83533, "epoch": 1988} {"train_loss": -6.208542823791504, "global_step": 83534, "epoch": 1988} {"train_loss": -6.329960823059082, "global_step": 83535, "epoch": 1988} {"train_loss": -6.145768165588379, "global_step": 83536, "epoch": 1988} {"train_loss": -6.169868003754389, "global_step": 83537, "epoch": 1988, "val_loss": 62651.78125} {"train_loss": -6.185952186584473, "global_step": 83538, "epoch": 1989} {"train_loss": -6.240309715270996, "global_step": 83539, "epoch": 1989} {"train_loss": -6.122211456298828, "global_step": 83540, "epoch": 1989} {"train_loss": -6.127768516540527, "global_step": 83541, "epoch": 1989} {"train_loss": -6.092909812927246, "global_step": 83542, "epoch": 1989} {"train_loss": -6.123908996582031, "global_step": 83543, "epoch": 1989} {"train_loss": -6.236726760864258, "global_step": 83544, "epoch": 1989} {"train_loss": -6.2051496505737305, "global_step": 83545, "epoch": 1989} {"train_loss": -6.167819023132324, "global_step": 83546, "epoch": 1989} {"train_loss": -6.241072654724121, "global_step": 83547, "epoch": 1989} {"train_loss": -6.232453346252441, "global_step": 83548, "epoch": 1989} {"train_loss": -6.142042636871338, "global_step": 83549, "epoch": 1989} {"train_loss": -6.0961408615112305, "global_step": 83550, "epoch": 1989} {"train_loss": -6.1231489181518555, "global_step": 83551, "epoch": 1989} {"train_loss": -6.167386054992676, "global_step": 83552, "epoch": 1989} {"train_loss": -6.233037948608398, "global_step": 83553, "epoch": 1989} {"train_loss": -6.218066692352295, "global_step": 83554, "epoch": 1989} {"train_loss": -6.182211875915527, "global_step": 83555, "epoch": 1989} {"train_loss": -6.262517929077148, "global_step": 83556, "epoch": 1989} {"train_loss": -6.062361717224121, "global_step": 83557, "epoch": 1989} {"train_loss": -6.2427473068237305, "global_step": 83558, "epoch": 1989} {"train_loss": -6.211075782775879, "global_step": 83559, "epoch": 1989} {"train_loss": -6.137989044189453, "global_step": 83560, "epoch": 1989} {"train_loss": -6.14762020111084, "global_step": 83561, "epoch": 1989} {"train_loss": -6.1669464111328125, "global_step": 83562, "epoch": 1989} {"train_loss": -6.2304487228393555, "global_step": 83563, "epoch": 1989} {"train_loss": -6.1732001304626465, "global_step": 83564, "epoch": 1989} {"train_loss": -6.155128002166748, "global_step": 83565, "epoch": 1989} {"train_loss": -6.121939182281494, "global_step": 83566, "epoch": 1989} {"train_loss": -6.235260963439941, "global_step": 83567, "epoch": 1989} {"train_loss": -6.0310869216918945, "global_step": 83568, "epoch": 1989} {"train_loss": -6.1020731925964355, "global_step": 83569, "epoch": 1989} {"train_loss": -6.056313514709473, "global_step": 83570, "epoch": 1989} {"train_loss": -6.040390968322754, "global_step": 83571, "epoch": 1989} {"train_loss": -6.113760471343994, "global_step": 83572, "epoch": 1989} {"train_loss": -6.194474220275879, "global_step": 83573, "epoch": 1989} {"train_loss": -6.027341365814209, "global_step": 83574, "epoch": 1989} {"train_loss": -6.1894636154174805, "global_step": 83575, "epoch": 1989} {"train_loss": -6.151519775390625, "global_step": 83576, "epoch": 1989} {"train_loss": -5.986949920654297, "global_step": 83577, "epoch": 1989} {"train_loss": -6.194602966308594, "global_step": 83578, "epoch": 1989} {"train_loss": -6.154689652579171, "global_step": 83579, "epoch": 1989, "val_loss": 62890.23046875} {"train_loss": -6.120304584503174, "global_step": 83580, "epoch": 1990} {"train_loss": -6.3050408363342285, "global_step": 83581, "epoch": 1990} {"train_loss": -6.166893005371094, "global_step": 83582, "epoch": 1990} {"train_loss": -6.17625617980957, "global_step": 83583, "epoch": 1990} {"train_loss": -6.220893859863281, "global_step": 83584, "epoch": 1990} {"train_loss": -6.216418266296387, "global_step": 83585, "epoch": 1990} {"train_loss": -6.178337097167969, "global_step": 83586, "epoch": 1990} {"train_loss": -6.161314010620117, "global_step": 83587, "epoch": 1990} {"train_loss": -6.213588714599609, "global_step": 83588, "epoch": 1990} {"train_loss": -6.103387832641602, "global_step": 83589, "epoch": 1990} {"train_loss": -6.233292579650879, "global_step": 83590, "epoch": 1990} {"train_loss": -6.223117351531982, "global_step": 83591, "epoch": 1990} {"train_loss": -6.1884284019470215, "global_step": 83592, "epoch": 1990} {"train_loss": -6.276148796081543, "global_step": 83593, "epoch": 1990} {"train_loss": -6.220341682434082, "global_step": 83594, "epoch": 1990} {"train_loss": -6.185196876525879, "global_step": 83595, "epoch": 1990} {"train_loss": -6.123377799987793, "global_step": 83596, "epoch": 1990} {"train_loss": -6.247962474822998, "global_step": 83597, "epoch": 1990} {"train_loss": -6.232132434844971, "global_step": 83598, "epoch": 1990} {"train_loss": -6.194725513458252, "global_step": 83599, "epoch": 1990} {"train_loss": -6.250563144683838, "global_step": 83600, "epoch": 1990} {"train_loss": -6.101720809936523, "global_step": 83601, "epoch": 1990} {"train_loss": -6.130040645599365, "global_step": 83602, "epoch": 1990} {"train_loss": -6.083446025848389, "global_step": 83603, "epoch": 1990} {"train_loss": -6.0703630447387695, "global_step": 83604, "epoch": 1990} {"train_loss": -6.041332244873047, "global_step": 83605, "epoch": 1990} {"train_loss": -6.196281909942627, "global_step": 83606, "epoch": 1990} {"train_loss": -6.069764614105225, "global_step": 83607, "epoch": 1990} {"train_loss": -6.147247314453125, "global_step": 83608, "epoch": 1990} {"train_loss": -6.150173187255859, "global_step": 83609, "epoch": 1990} {"train_loss": -6.125384330749512, "global_step": 83610, "epoch": 1990} {"train_loss": -6.144610404968262, "global_step": 83611, "epoch": 1990} {"train_loss": -6.145011901855469, "global_step": 83612, "epoch": 1990} {"train_loss": -6.254202842712402, "global_step": 83613, "epoch": 1990} {"train_loss": -6.285604000091553, "global_step": 83614, "epoch": 1990} {"train_loss": -6.131535053253174, "global_step": 83615, "epoch": 1990} {"train_loss": -6.077988624572754, "global_step": 83616, "epoch": 1990} {"train_loss": -6.164880275726318, "global_step": 83617, "epoch": 1990} {"train_loss": -6.167123317718506, "global_step": 83618, "epoch": 1990} {"train_loss": -6.264605522155762, "global_step": 83619, "epoch": 1990} {"train_loss": -6.138242721557617, "global_step": 83620, "epoch": 1990} {"train_loss": -6.172892831620716, "global_step": 83621, "epoch": 1990, "val_loss": 62449.2421875} {"train_loss": -6.180681228637695, "global_step": 83622, "epoch": 1991} {"train_loss": -6.251776695251465, "global_step": 83623, "epoch": 1991} {"train_loss": -6.180972576141357, "global_step": 83624, "epoch": 1991} {"train_loss": -6.27675724029541, "global_step": 83625, "epoch": 1991} {"train_loss": -6.29226541519165, "global_step": 83626, "epoch": 1991} {"train_loss": -6.116116523742676, "global_step": 83627, "epoch": 1991} {"train_loss": -6.212802410125732, "global_step": 83628, "epoch": 1991} {"train_loss": -6.227424621582031, "global_step": 83629, "epoch": 1991} {"train_loss": -6.153954982757568, "global_step": 83630, "epoch": 1991} {"train_loss": -6.233114242553711, "global_step": 83631, "epoch": 1991} {"train_loss": -6.250503063201904, "global_step": 83632, "epoch": 1991} {"train_loss": -6.101338863372803, "global_step": 83633, "epoch": 1991} {"train_loss": -6.109166145324707, "global_step": 83634, "epoch": 1991} {"train_loss": -6.264357566833496, "global_step": 83635, "epoch": 1991} {"train_loss": -6.155778884887695, "global_step": 83636, "epoch": 1991} {"train_loss": -6.202457427978516, "global_step": 83637, "epoch": 1991} {"train_loss": -6.262674331665039, "global_step": 83638, "epoch": 1991} {"train_loss": -6.248930931091309, "global_step": 83639, "epoch": 1991} {"train_loss": -6.199550628662109, "global_step": 83640, "epoch": 1991} {"train_loss": -6.242856025695801, "global_step": 83641, "epoch": 1991} {"train_loss": -6.184742450714111, "global_step": 83642, "epoch": 1991} {"train_loss": -6.253066062927246, "global_step": 83643, "epoch": 1991} {"train_loss": -6.2545366287231445, "global_step": 83644, "epoch": 1991} {"train_loss": -6.278042316436768, "global_step": 83645, "epoch": 1991} {"train_loss": -6.179051399230957, "global_step": 83646, "epoch": 1991} {"train_loss": -6.207040786743164, "global_step": 83647, "epoch": 1991} {"train_loss": -6.241349220275879, "global_step": 83648, "epoch": 1991} {"train_loss": -6.09987735748291, "global_step": 83649, "epoch": 1991} {"train_loss": -6.323348045349121, "global_step": 83650, "epoch": 1991} {"train_loss": -6.280719757080078, "global_step": 83651, "epoch": 1991} {"train_loss": -6.2542405128479, "global_step": 83652, "epoch": 1991} {"train_loss": -6.3189239501953125, "global_step": 83653, "epoch": 1991} {"train_loss": -6.229398727416992, "global_step": 83654, "epoch": 1991} {"train_loss": -6.148336410522461, "global_step": 83655, "epoch": 1991} {"train_loss": -6.200760841369629, "global_step": 83656, "epoch": 1991} {"train_loss": -6.178849220275879, "global_step": 83657, "epoch": 1991} {"train_loss": -6.207704544067383, "global_step": 83658, "epoch": 1991} {"train_loss": -6.21956729888916, "global_step": 83659, "epoch": 1991} {"train_loss": -6.111949920654297, "global_step": 83660, "epoch": 1991} {"train_loss": -6.335544586181641, "global_step": 83661, "epoch": 1991} {"train_loss": -6.3153581619262695, "global_step": 83662, "epoch": 1991} {"train_loss": -6.220520643960862, "global_step": 83663, "epoch": 1991, "val_loss": 62547.859375} {"train_loss": -6.262928009033203, "global_step": 83664, "epoch": 1992} {"train_loss": -6.31015682220459, "global_step": 83665, "epoch": 1992} {"train_loss": -6.228437423706055, "global_step": 83666, "epoch": 1992} {"train_loss": -6.286205291748047, "global_step": 83667, "epoch": 1992} {"train_loss": -6.286887168884277, "global_step": 83668, "epoch": 1992} {"train_loss": -6.096401214599609, "global_step": 83669, "epoch": 1992} {"train_loss": -6.090045928955078, "global_step": 83670, "epoch": 1992} {"train_loss": -6.206731796264648, "global_step": 83671, "epoch": 1992} {"train_loss": -6.143579006195068, "global_step": 83672, "epoch": 1992} {"train_loss": -6.214423179626465, "global_step": 83673, "epoch": 1992} {"train_loss": -6.19554328918457, "global_step": 83674, "epoch": 1992} {"train_loss": -6.184596061706543, "global_step": 83675, "epoch": 1992} {"train_loss": -6.163603782653809, "global_step": 83676, "epoch": 1992} {"train_loss": -6.124795436859131, "global_step": 83677, "epoch": 1992} {"train_loss": -6.203818321228027, "global_step": 83678, "epoch": 1992} {"train_loss": -6.195716381072998, "global_step": 83679, "epoch": 1992} {"train_loss": -6.145263671875, "global_step": 83680, "epoch": 1992} {"train_loss": -6.178105354309082, "global_step": 83681, "epoch": 1992} {"train_loss": -6.064755439758301, "global_step": 83682, "epoch": 1992} {"train_loss": -6.127892017364502, "global_step": 83683, "epoch": 1992} {"train_loss": -6.153409481048584, "global_step": 83684, "epoch": 1992} {"train_loss": -6.038229465484619, "global_step": 83685, "epoch": 1992} {"train_loss": -6.17075252532959, "global_step": 83686, "epoch": 1992} {"train_loss": -6.103848457336426, "global_step": 83687, "epoch": 1992} {"train_loss": -6.201986312866211, "global_step": 83688, "epoch": 1992} {"train_loss": -6.118398189544678, "global_step": 83689, "epoch": 1992} {"train_loss": -6.103546142578125, "global_step": 83690, "epoch": 1992} {"train_loss": -6.140995979309082, "global_step": 83691, "epoch": 1992} {"train_loss": -6.1169023513793945, "global_step": 83692, "epoch": 1992} {"train_loss": -6.124941825866699, "global_step": 83693, "epoch": 1992} {"train_loss": -6.1635589599609375, "global_step": 83694, "epoch": 1992} {"train_loss": -6.198237419128418, "global_step": 83695, "epoch": 1992} {"train_loss": -6.183499336242676, "global_step": 83696, "epoch": 1992} {"train_loss": -6.23746395111084, "global_step": 83697, "epoch": 1992} {"train_loss": -6.193674564361572, "global_step": 83698, "epoch": 1992} {"train_loss": -6.172548770904541, "global_step": 83699, "epoch": 1992} {"train_loss": -6.185600280761719, "global_step": 83700, "epoch": 1992} {"train_loss": -6.0873212814331055, "global_step": 83701, "epoch": 1992} {"train_loss": -6.113964080810547, "global_step": 83702, "epoch": 1992} {"train_loss": -6.2567057609558105, "global_step": 83703, "epoch": 1992} {"train_loss": -6.097895622253418, "global_step": 83704, "epoch": 1992} {"train_loss": -6.166832174573626, "global_step": 83705, "epoch": 1992, "val_loss": 62512.08203125} {"train_loss": -6.2837677001953125, "global_step": 83706, "epoch": 1993} {"train_loss": -6.106863975524902, "global_step": 83707, "epoch": 1993} {"train_loss": -6.214141845703125, "global_step": 83708, "epoch": 1993} {"train_loss": -6.2490339279174805, "global_step": 83709, "epoch": 1993} {"train_loss": -6.160411357879639, "global_step": 83710, "epoch": 1993} {"train_loss": -6.198922157287598, "global_step": 83711, "epoch": 1993} {"train_loss": -6.217885971069336, "global_step": 83712, "epoch": 1993} {"train_loss": -6.198225498199463, "global_step": 83713, "epoch": 1993} {"train_loss": -6.219353675842285, "global_step": 83714, "epoch": 1993} {"train_loss": -6.063697814941406, "global_step": 83715, "epoch": 1993} {"train_loss": -6.250147819519043, "global_step": 83716, "epoch": 1993} {"train_loss": -6.169892311096191, "global_step": 83717, "epoch": 1993} {"train_loss": -6.272335052490234, "global_step": 83718, "epoch": 1993} {"train_loss": -6.232789039611816, "global_step": 83719, "epoch": 1993} {"train_loss": -6.022650718688965, "global_step": 83720, "epoch": 1993} {"train_loss": -6.1132683753967285, "global_step": 83721, "epoch": 1993} {"train_loss": -6.116589069366455, "global_step": 83722, "epoch": 1993} {"train_loss": -6.27504301071167, "global_step": 83723, "epoch": 1993} {"train_loss": -6.244447708129883, "global_step": 83724, "epoch": 1993} {"train_loss": -6.2302350997924805, "global_step": 83725, "epoch": 1993} {"train_loss": -6.222309589385986, "global_step": 83726, "epoch": 1993} {"train_loss": -6.185339450836182, "global_step": 83727, "epoch": 1993} {"train_loss": -6.086197376251221, "global_step": 83728, "epoch": 1993} {"train_loss": -6.191405773162842, "global_step": 83729, "epoch": 1993} {"train_loss": -6.071238040924072, "global_step": 83730, "epoch": 1993} {"train_loss": -6.118111610412598, "global_step": 83731, "epoch": 1993} {"train_loss": -6.237592697143555, "global_step": 83732, "epoch": 1993} {"train_loss": -6.162102699279785, "global_step": 83733, "epoch": 1993} {"train_loss": -6.145489692687988, "global_step": 83734, "epoch": 1993} {"train_loss": -6.17120361328125, "global_step": 83735, "epoch": 1993} {"train_loss": -6.287115573883057, "global_step": 83736, "epoch": 1993} {"train_loss": -6.222263336181641, "global_step": 83737, "epoch": 1993} {"train_loss": -6.2071533203125, "global_step": 83738, "epoch": 1993} {"train_loss": -6.168327808380127, "global_step": 83739, "epoch": 1993} {"train_loss": -6.201319217681885, "global_step": 83740, "epoch": 1993} {"train_loss": -6.155972480773926, "global_step": 83741, "epoch": 1993} {"train_loss": -6.172277927398682, "global_step": 83742, "epoch": 1993} {"train_loss": -6.034262657165527, "global_step": 83743, "epoch": 1993} {"train_loss": -6.179629325866699, "global_step": 83744, "epoch": 1993} {"train_loss": -6.160750389099121, "global_step": 83745, "epoch": 1993} {"train_loss": -6.208327770233154, "global_step": 83746, "epoch": 1993} {"train_loss": -6.183715843019032, "global_step": 83747, "epoch": 1993, "val_loss": 62718.359375} {"train_loss": -6.18988561630249, "global_step": 83748, "epoch": 1994} {"train_loss": -6.271676063537598, "global_step": 83749, "epoch": 1994} {"train_loss": -6.146462440490723, "global_step": 83750, "epoch": 1994} {"train_loss": -6.276639938354492, "global_step": 83751, "epoch": 1994} {"train_loss": -6.0206451416015625, "global_step": 83752, "epoch": 1994} {"train_loss": -6.305085182189941, "global_step": 83753, "epoch": 1994} {"train_loss": -6.167214870452881, "global_step": 83754, "epoch": 1994} {"train_loss": -6.213848114013672, "global_step": 83755, "epoch": 1994} {"train_loss": -6.190781593322754, "global_step": 83756, "epoch": 1994} {"train_loss": -6.217564105987549, "global_step": 83757, "epoch": 1994} {"train_loss": -6.186562538146973, "global_step": 83758, "epoch": 1994} {"train_loss": -6.259146690368652, "global_step": 83759, "epoch": 1994} {"train_loss": -6.154195785522461, "global_step": 83760, "epoch": 1994} {"train_loss": -6.073781490325928, "global_step": 83761, "epoch": 1994} {"train_loss": -6.246290683746338, "global_step": 83762, "epoch": 1994} {"train_loss": -6.108298301696777, "global_step": 83763, "epoch": 1994} {"train_loss": -6.174093246459961, "global_step": 83764, "epoch": 1994} {"train_loss": -6.1341071128845215, "global_step": 83765, "epoch": 1994} {"train_loss": -6.303438186645508, "global_step": 83766, "epoch": 1994} {"train_loss": -6.2162017822265625, "global_step": 83767, "epoch": 1994} {"train_loss": -6.112806797027588, "global_step": 83768, "epoch": 1994} {"train_loss": -6.164767265319824, "global_step": 83769, "epoch": 1994} {"train_loss": -6.181550979614258, "global_step": 83770, "epoch": 1994} {"train_loss": -6.204946041107178, "global_step": 83771, "epoch": 1994} {"train_loss": -6.179849624633789, "global_step": 83772, "epoch": 1994} {"train_loss": -6.255545616149902, "global_step": 83773, "epoch": 1994} {"train_loss": -6.142443656921387, "global_step": 83774, "epoch": 1994} {"train_loss": -6.282558917999268, "global_step": 83775, "epoch": 1994} {"train_loss": -6.211794853210449, "global_step": 83776, "epoch": 1994} {"train_loss": -6.254824638366699, "global_step": 83777, "epoch": 1994} {"train_loss": -6.168687343597412, "global_step": 83778, "epoch": 1994} {"train_loss": -6.234644889831543, "global_step": 83779, "epoch": 1994} {"train_loss": -6.352283477783203, "global_step": 83780, "epoch": 1994} {"train_loss": -6.301403999328613, "global_step": 83781, "epoch": 1994} {"train_loss": -6.154102802276611, "global_step": 83782, "epoch": 1994} {"train_loss": -6.151542663574219, "global_step": 83783, "epoch": 1994} {"train_loss": -6.182448387145996, "global_step": 83784, "epoch": 1994} {"train_loss": -6.171319007873535, "global_step": 83785, "epoch": 1994} {"train_loss": -6.218680381774902, "global_step": 83786, "epoch": 1994} {"train_loss": -6.071879863739014, "global_step": 83787, "epoch": 1994} {"train_loss": -6.1821088790893555, "global_step": 83788, "epoch": 1994} {"train_loss": -6.19609987168085, "global_step": 83789, "epoch": 1994, "val_loss": 62494.11328125} {"train_loss": -6.204428672790527, "global_step": 83790, "epoch": 1995} {"train_loss": -6.2741570472717285, "global_step": 83791, "epoch": 1995} {"train_loss": -6.201314926147461, "global_step": 83792, "epoch": 1995} {"train_loss": -6.325815677642822, "global_step": 83793, "epoch": 1995} {"train_loss": -6.2422308921813965, "global_step": 83794, "epoch": 1995} {"train_loss": -6.248564720153809, "global_step": 83795, "epoch": 1995} {"train_loss": -6.279801368713379, "global_step": 83796, "epoch": 1995} {"train_loss": -6.1820173263549805, "global_step": 83797, "epoch": 1995} {"train_loss": -6.217449188232422, "global_step": 83798, "epoch": 1995} {"train_loss": -6.190956115722656, "global_step": 83799, "epoch": 1995} {"train_loss": -6.2021284103393555, "global_step": 83800, "epoch": 1995} {"train_loss": -6.105492115020752, "global_step": 83801, "epoch": 1995} {"train_loss": -6.227612495422363, "global_step": 83802, "epoch": 1995} {"train_loss": -6.108076095581055, "global_step": 83803, "epoch": 1995} {"train_loss": -6.022378921508789, "global_step": 83804, "epoch": 1995} {"train_loss": -6.139828681945801, "global_step": 83805, "epoch": 1995} {"train_loss": -6.34632682800293, "global_step": 83806, "epoch": 1995} {"train_loss": -6.047428131103516, "global_step": 83807, "epoch": 1995} {"train_loss": -6.086575508117676, "global_step": 83808, "epoch": 1995} {"train_loss": -6.151045799255371, "global_step": 83809, "epoch": 1995} {"train_loss": -6.225975036621094, "global_step": 83810, "epoch": 1995} {"train_loss": -6.182699680328369, "global_step": 83811, "epoch": 1995} {"train_loss": -6.240679740905762, "global_step": 83812, "epoch": 1995} {"train_loss": -6.056794166564941, "global_step": 83813, "epoch": 1995} {"train_loss": -6.1623334884643555, "global_step": 83814, "epoch": 1995} {"train_loss": -6.11072301864624, "global_step": 83815, "epoch": 1995} {"train_loss": -6.215810775756836, "global_step": 83816, "epoch": 1995} {"train_loss": -6.05394172668457, "global_step": 83817, "epoch": 1995} {"train_loss": -6.233335494995117, "global_step": 83818, "epoch": 1995} {"train_loss": -5.911567211151123, "global_step": 83819, "epoch": 1995} {"train_loss": -5.9187846183776855, "global_step": 83820, "epoch": 1995} {"train_loss": -6.272728443145752, "global_step": 83821, "epoch": 1995} {"train_loss": -6.010763168334961, "global_step": 83822, "epoch": 1995} {"train_loss": -6.148166179656982, "global_step": 83823, "epoch": 1995} {"train_loss": -6.209554195404053, "global_step": 83824, "epoch": 1995} {"train_loss": -6.161888122558594, "global_step": 83825, "epoch": 1995} {"train_loss": -6.111889362335205, "global_step": 83826, "epoch": 1995} {"train_loss": -6.0871992111206055, "global_step": 83827, "epoch": 1995} {"train_loss": -6.052313804626465, "global_step": 83828, "epoch": 1995} {"train_loss": -6.176487922668457, "global_step": 83829, "epoch": 1995} {"train_loss": -6.1837158203125, "global_step": 83830, "epoch": 1995} {"train_loss": -6.158525546391805, "global_step": 83831, "epoch": 1995, "val_loss": 62681.15234375} {"train_loss": -6.293386459350586, "global_step": 83832, "epoch": 1996} {"train_loss": -6.167207717895508, "global_step": 83833, "epoch": 1996} {"train_loss": -6.229635238647461, "global_step": 83834, "epoch": 1996} {"train_loss": -6.146988868713379, "global_step": 83835, "epoch": 1996} {"train_loss": -6.079333305358887, "global_step": 83836, "epoch": 1996} {"train_loss": -6.167010307312012, "global_step": 83837, "epoch": 1996} {"train_loss": -6.170668601989746, "global_step": 83838, "epoch": 1996} {"train_loss": -6.167891502380371, "global_step": 83839, "epoch": 1996} {"train_loss": -6.197854995727539, "global_step": 83840, "epoch": 1996} {"train_loss": -6.220444679260254, "global_step": 83841, "epoch": 1996} {"train_loss": -6.083619117736816, "global_step": 83842, "epoch": 1996} {"train_loss": -6.253979682922363, "global_step": 83843, "epoch": 1996} {"train_loss": -6.162520408630371, "global_step": 83844, "epoch": 1996} {"train_loss": -6.088629722595215, "global_step": 83845, "epoch": 1996} {"train_loss": -6.179315567016602, "global_step": 83846, "epoch": 1996} {"train_loss": -6.332505226135254, "global_step": 83847, "epoch": 1996} {"train_loss": -6.21831750869751, "global_step": 83848, "epoch": 1996} {"train_loss": -6.2472991943359375, "global_step": 83849, "epoch": 1996} {"train_loss": -6.221728324890137, "global_step": 83850, "epoch": 1996} {"train_loss": -6.2761945724487305, "global_step": 83851, "epoch": 1996} {"train_loss": -6.298797607421875, "global_step": 83852, "epoch": 1996} {"train_loss": -6.153194427490234, "global_step": 83853, "epoch": 1996} {"train_loss": -6.252170562744141, "global_step": 83854, "epoch": 1996} {"train_loss": -6.113768100738525, "global_step": 83855, "epoch": 1996} {"train_loss": -6.27573299407959, "global_step": 83856, "epoch": 1996} {"train_loss": -6.187283039093018, "global_step": 83857, "epoch": 1996} {"train_loss": -6.2192792892456055, "global_step": 83858, "epoch": 1996} {"train_loss": -6.323943614959717, "global_step": 83859, "epoch": 1996} {"train_loss": -6.203090667724609, "global_step": 83860, "epoch": 1996} {"train_loss": -6.153441429138184, "global_step": 83861, "epoch": 1996} {"train_loss": -6.138764381408691, "global_step": 83862, "epoch": 1996} {"train_loss": -6.160506248474121, "global_step": 83863, "epoch": 1996} {"train_loss": -6.197940826416016, "global_step": 83864, "epoch": 1996} {"train_loss": -6.176574230194092, "global_step": 83865, "epoch": 1996} {"train_loss": -6.189270973205566, "global_step": 83866, "epoch": 1996} {"train_loss": -6.124979019165039, "global_step": 83867, "epoch": 1996} {"train_loss": -6.190390586853027, "global_step": 83868, "epoch": 1996} {"train_loss": -6.174863815307617, "global_step": 83869, "epoch": 1996} {"train_loss": -6.048032760620117, "global_step": 83870, "epoch": 1996} {"train_loss": -6.144800186157227, "global_step": 83871, "epoch": 1996} {"train_loss": -6.064572811126709, "global_step": 83872, "epoch": 1996} {"train_loss": -6.188830443790981, "global_step": 83873, "epoch": 1996, "val_loss": 62601.41796875} {"train_loss": -6.150723457336426, "global_step": 83874, "epoch": 1997} {"train_loss": -6.156649589538574, "global_step": 83875, "epoch": 1997} {"train_loss": -6.270172119140625, "global_step": 83876, "epoch": 1997} {"train_loss": -6.161088466644287, "global_step": 83877, "epoch": 1997} {"train_loss": -6.164409637451172, "global_step": 83878, "epoch": 1997} {"train_loss": -6.177987575531006, "global_step": 83879, "epoch": 1997} {"train_loss": -6.31803035736084, "global_step": 83880, "epoch": 1997} {"train_loss": -6.330574989318848, "global_step": 83881, "epoch": 1997} {"train_loss": -6.232206344604492, "global_step": 83882, "epoch": 1997} {"train_loss": -6.231482028961182, "global_step": 83883, "epoch": 1997} {"train_loss": -6.272856712341309, "global_step": 83884, "epoch": 1997} {"train_loss": -6.2956342697143555, "global_step": 83885, "epoch": 1997} {"train_loss": -6.176891326904297, "global_step": 83886, "epoch": 1997} {"train_loss": -6.271245002746582, "global_step": 83887, "epoch": 1997} {"train_loss": -6.301299095153809, "global_step": 83888, "epoch": 1997} {"train_loss": -6.237373352050781, "global_step": 83889, "epoch": 1997} {"train_loss": -6.141108512878418, "global_step": 83890, "epoch": 1997} {"train_loss": -6.205753326416016, "global_step": 83891, "epoch": 1997} {"train_loss": -6.198814392089844, "global_step": 83892, "epoch": 1997} {"train_loss": -6.174679756164551, "global_step": 83893, "epoch": 1997} {"train_loss": -6.249765396118164, "global_step": 83894, "epoch": 1997} {"train_loss": -6.147495269775391, "global_step": 83895, "epoch": 1997} {"train_loss": -6.131784439086914, "global_step": 83896, "epoch": 1997} {"train_loss": -6.3656110763549805, "global_step": 83897, "epoch": 1997} {"train_loss": -6.371425151824951, "global_step": 83898, "epoch": 1997} {"train_loss": -6.169331073760986, "global_step": 83899, "epoch": 1997} {"train_loss": -6.326859474182129, "global_step": 83900, "epoch": 1997} {"train_loss": -6.299875259399414, "global_step": 83901, "epoch": 1997} {"train_loss": -6.313576698303223, "global_step": 83902, "epoch": 1997} {"train_loss": -6.26406192779541, "global_step": 83903, "epoch": 1997} {"train_loss": -6.273275375366211, "global_step": 83904, "epoch": 1997} {"train_loss": -6.2658796310424805, "global_step": 83905, "epoch": 1997} {"train_loss": -6.231158256530762, "global_step": 83906, "epoch": 1997} {"train_loss": -6.21369743347168, "global_step": 83907, "epoch": 1997} {"train_loss": -6.136569023132324, "global_step": 83908, "epoch": 1997} {"train_loss": -6.196874618530273, "global_step": 83909, "epoch": 1997} {"train_loss": -6.130369186401367, "global_step": 83910, "epoch": 1997} {"train_loss": -6.114677429199219, "global_step": 83911, "epoch": 1997} {"train_loss": -6.247566223144531, "global_step": 83912, "epoch": 1997} {"train_loss": -6.125927925109863, "global_step": 83913, "epoch": 1997} {"train_loss": -6.159764766693115, "global_step": 83914, "epoch": 1997} {"train_loss": -6.2186652932848245, "global_step": 83915, "epoch": 1997, "val_loss": 62628.41796875} {"train_loss": -6.187516212463379, "global_step": 83916, "epoch": 1998} {"train_loss": -6.141186714172363, "global_step": 83917, "epoch": 1998} {"train_loss": -6.232710838317871, "global_step": 83918, "epoch": 1998} {"train_loss": -6.2183356285095215, "global_step": 83919, "epoch": 1998} {"train_loss": -6.119095802307129, "global_step": 83920, "epoch": 1998} {"train_loss": -6.127747058868408, "global_step": 83921, "epoch": 1998} {"train_loss": -6.152635097503662, "global_step": 83922, "epoch": 1998} {"train_loss": -6.253768444061279, "global_step": 83923, "epoch": 1998} {"train_loss": -6.161618232727051, "global_step": 83924, "epoch": 1998} {"train_loss": -6.252044200897217, "global_step": 83925, "epoch": 1998} {"train_loss": -6.211021900177002, "global_step": 83926, "epoch": 1998} {"train_loss": -6.1884446144104, "global_step": 83927, "epoch": 1998} {"train_loss": -6.147319793701172, "global_step": 83928, "epoch": 1998} {"train_loss": -6.162307262420654, "global_step": 83929, "epoch": 1998} {"train_loss": -6.1659674644470215, "global_step": 83930, "epoch": 1998} {"train_loss": -6.206740379333496, "global_step": 83931, "epoch": 1998} {"train_loss": -6.306026458740234, "global_step": 83932, "epoch": 1998} {"train_loss": -6.087061405181885, "global_step": 83933, "epoch": 1998} {"train_loss": -6.122840404510498, "global_step": 83934, "epoch": 1998} {"train_loss": -6.287282943725586, "global_step": 83935, "epoch": 1998} {"train_loss": -6.1755876541137695, "global_step": 83936, "epoch": 1998} {"train_loss": -6.285029411315918, "global_step": 83937, "epoch": 1998} {"train_loss": -6.224884033203125, "global_step": 83938, "epoch": 1998} {"train_loss": -6.178834915161133, "global_step": 83939, "epoch": 1998} {"train_loss": -6.241207599639893, "global_step": 83940, "epoch": 1998} {"train_loss": -6.237586975097656, "global_step": 83941, "epoch": 1998} {"train_loss": -6.190126419067383, "global_step": 83942, "epoch": 1998} {"train_loss": -6.2216997146606445, "global_step": 83943, "epoch": 1998} {"train_loss": -6.183102607727051, "global_step": 83944, "epoch": 1998} {"train_loss": -6.274751663208008, "global_step": 83945, "epoch": 1998} {"train_loss": -6.260868549346924, "global_step": 83946, "epoch": 1998} {"train_loss": -6.238959789276123, "global_step": 83947, "epoch": 1998} {"train_loss": -6.156589508056641, "global_step": 83948, "epoch": 1998} {"train_loss": -6.216598987579346, "global_step": 83949, "epoch": 1998} {"train_loss": -6.126280784606934, "global_step": 83950, "epoch": 1998} {"train_loss": -6.201885223388672, "global_step": 83951, "epoch": 1998} {"train_loss": -6.275875568389893, "global_step": 83952, "epoch": 1998} {"train_loss": -6.179749488830566, "global_step": 83953, "epoch": 1998} {"train_loss": -6.1585516929626465, "global_step": 83954, "epoch": 1998} {"train_loss": -6.212869167327881, "global_step": 83955, "epoch": 1998} {"train_loss": -6.21773624420166, "global_step": 83956, "epoch": 1998} {"train_loss": -6.200256336302984, "global_step": 83957, "epoch": 1998, "val_loss": 62622.8828125} {"train_loss": -6.261285781860352, "global_step": 83958, "epoch": 1999} {"train_loss": -6.196308135986328, "global_step": 83959, "epoch": 1999} {"train_loss": -6.012826919555664, "global_step": 83960, "epoch": 1999} {"train_loss": -6.157522201538086, "global_step": 83961, "epoch": 1999} {"train_loss": -6.257786750793457, "global_step": 83962, "epoch": 1999} {"train_loss": -6.227513313293457, "global_step": 83963, "epoch": 1999} {"train_loss": -6.096089839935303, "global_step": 83964, "epoch": 1999} {"train_loss": -6.311832427978516, "global_step": 83965, "epoch": 1999} {"train_loss": -6.123015403747559, "global_step": 83966, "epoch": 1999} {"train_loss": -6.223084926605225, "global_step": 83967, "epoch": 1999} {"train_loss": -6.231992244720459, "global_step": 83968, "epoch": 1999} {"train_loss": -6.217772483825684, "global_step": 83969, "epoch": 1999} {"train_loss": -6.291373252868652, "global_step": 83970, "epoch": 1999} {"train_loss": -6.220048904418945, "global_step": 83971, "epoch": 1999} {"train_loss": -6.1523871421813965, "global_step": 83972, "epoch": 1999} {"train_loss": -6.080008506774902, "global_step": 83973, "epoch": 1999} {"train_loss": -6.2559404373168945, "global_step": 83974, "epoch": 1999} {"train_loss": -6.110373497009277, "global_step": 83975, "epoch": 1999} {"train_loss": -6.238597393035889, "global_step": 83976, "epoch": 1999} {"train_loss": -6.114195823669434, "global_step": 83977, "epoch": 1999} {"train_loss": -6.127023696899414, "global_step": 83978, "epoch": 1999} {"train_loss": -6.179305076599121, "global_step": 83979, "epoch": 1999} {"train_loss": -6.243446350097656, "global_step": 83980, "epoch": 1999} {"train_loss": -6.128852367401123, "global_step": 83981, "epoch": 1999} {"train_loss": -6.149553298950195, "global_step": 83982, "epoch": 1999} {"train_loss": -6.192829608917236, "global_step": 83983, "epoch": 1999} {"train_loss": -6.103525638580322, "global_step": 83984, "epoch": 1999} {"train_loss": -6.177030563354492, "global_step": 83985, "epoch": 1999} {"train_loss": -6.202810287475586, "global_step": 83986, "epoch": 1999} {"train_loss": -6.198718070983887, "global_step": 83987, "epoch": 1999} {"train_loss": -6.186136722564697, "global_step": 83988, "epoch": 1999} {"train_loss": -6.25955867767334, "global_step": 83989, "epoch": 1999} {"train_loss": -6.2994537353515625, "global_step": 83990, "epoch": 1999} {"train_loss": -6.245136737823486, "global_step": 83991, "epoch": 1999} {"train_loss": -6.230058670043945, "global_step": 83992, "epoch": 1999} {"train_loss": -6.317289352416992, "global_step": 83993, "epoch": 1999} {"train_loss": -6.086044788360596, "global_step": 83994, "epoch": 1999} {"train_loss": -6.142175674438477, "global_step": 83995, "epoch": 1999} {"train_loss": -6.256069183349609, "global_step": 83996, "epoch": 1999} {"train_loss": -6.135372161865234, "global_step": 83997, "epoch": 1999} {"train_loss": -6.204945087432861, "global_step": 83998, "epoch": 1999} {"train_loss": -6.191117161796207, "global_step": 83999, "epoch": 1999, "val_loss": 62645.14453125} {"train_loss": -6.164548873901367, "global_step": 84000, "epoch": 2000} {"train_loss": -6.223147392272949, "global_step": 84001, "epoch": 2000} {"train_loss": -6.163599014282227, "global_step": 84002, "epoch": 2000} {"train_loss": -6.139348030090332, "global_step": 84003, "epoch": 2000} {"train_loss": -6.302004814147949, "global_step": 84004, "epoch": 2000} {"train_loss": -6.159222602844238, "global_step": 84005, "epoch": 2000} {"train_loss": -6.188546180725098, "global_step": 84006, "epoch": 2000} {"train_loss": -6.216864585876465, "global_step": 84007, "epoch": 2000} {"train_loss": -6.125503063201904, "global_step": 84008, "epoch": 2000} {"train_loss": -6.1791510581970215, "global_step": 84009, "epoch": 2000} {"train_loss": -6.262618064880371, "global_step": 84010, "epoch": 2000} {"train_loss": -6.172852039337158, "global_step": 84011, "epoch": 2000} {"train_loss": -6.184490203857422, "global_step": 84012, "epoch": 2000} {"train_loss": -6.111019134521484, "global_step": 84013, "epoch": 2000} {"train_loss": -6.195563793182373, "global_step": 84014, "epoch": 2000} {"train_loss": -6.2022294998168945, "global_step": 84015, "epoch": 2000} {"train_loss": -6.165859222412109, "global_step": 84016, "epoch": 2000} {"train_loss": -6.187087059020996, "global_step": 84017, "epoch": 2000} {"train_loss": -6.211247444152832, "global_step": 84018, "epoch": 2000} {"train_loss": -6.262187957763672, "global_step": 84019, "epoch": 2000} {"train_loss": -6.149281978607178, "global_step": 84020, "epoch": 2000} {"train_loss": -6.335872650146484, "global_step": 84021, "epoch": 2000} {"train_loss": -6.331233024597168, "global_step": 84022, "epoch": 2000} {"train_loss": -6.166330337524414, "global_step": 84023, "epoch": 2000} {"train_loss": -6.010289192199707, "global_step": 84024, "epoch": 2000} {"train_loss": -6.049242973327637, "global_step": 84025, "epoch": 2000} {"train_loss": -6.244410514831543, "global_step": 84026, "epoch": 2000} {"train_loss": -6.239768028259277, "global_step": 84027, "epoch": 2000} {"train_loss": -6.117073059082031, "global_step": 84028, "epoch": 2000} {"train_loss": -6.1673994064331055, "global_step": 84029, "epoch": 2000} {"train_loss": -6.211401462554932, "global_step": 84030, "epoch": 2000} {"train_loss": -6.241909980773926, "global_step": 84031, "epoch": 2000} {"train_loss": -6.070993900299072, "global_step": 84032, "epoch": 2000} {"train_loss": -6.182631015777588, "global_step": 84033, "epoch": 2000} {"train_loss": -6.256705284118652, "global_step": 84034, "epoch": 2000} {"train_loss": -6.202784538269043, "global_step": 84035, "epoch": 2000} {"train_loss": -6.148571014404297, "global_step": 84036, "epoch": 2000} {"train_loss": -6.205446243286133, "global_step": 84037, "epoch": 2000} {"train_loss": -6.332303047180176, "global_step": 84038, "epoch": 2000} {"train_loss": -6.149681091308594, "global_step": 84039, "epoch": 2000} {"train_loss": -6.140225410461426, "global_step": 84040, "epoch": 2000} {"train_loss": -6.19067889168149, "global_step": 84041, "epoch": 2000, "train/sim_max_reward_0": 0.35789538565753964, "train/sim_max_reward_1": 0.970342800759528, "train/sim_max_reward_2": 0.8112058999332968, "train/sim_max_reward_3": 0.9391980321581702, "train/sim_max_reward_4": 0.9912337729208788, "train/sim_max_reward_5": 0.9317130956280771, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.3769433142186419, "test/sim_max_reward_4300002": 0.8476447926948074, "test/sim_max_reward_4300003": 0.9888123750803218, "test/sim_max_reward_4300004": 0.31060253101106694, "test/sim_max_reward_4300005": 0.6304633612827869, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3142168338662511, "test/sim_max_reward_4300008": 0.6906268316669422, "test/sim_max_reward_4300009": 0.9039699265059963, "test/sim_max_reward_4300010": 0.469890513034788, "test/sim_max_reward_4300011": 0.31428922900758915, "test/sim_max_reward_4300012": 0.964980477327148, "test/sim_max_reward_4300013": 0.9084237213914949, "test/sim_max_reward_4300014": 0.8852441271034982, "test/sim_max_reward_4300015": 0.9268627545839521, "test/sim_max_reward_4300016": 1.0, "test/sim_max_reward_4300017": 0.8808691541672384, "test/sim_max_reward_4300018": 0.45326605604972187, "test/sim_max_reward_4300019": 0.18630607903262786, "test/sim_max_reward_4300020": 0.9195745730173291, "test/sim_max_reward_4300021": 0.9417305518278442, "test/sim_max_reward_4300022": 0.9401810812821778, "test/sim_max_reward_4300023": 0.3333464722556291, "test/sim_max_reward_4300024": 0.8256632335352699, "test/sim_max_reward_4300025": 0.8864415649174601, "test/sim_max_reward_4300026": 0.06945070191384556, "test/sim_max_reward_4300027": 0.9518620164477565, "test/sim_max_reward_4300028": 0.8639515489020106, "test/sim_max_reward_4300029": 0.0052152194585360625, "test/sim_max_reward_4300030": 0.9706159310902498, "test/sim_max_reward_4300031": 0.9283589690145534, "test/sim_max_reward_4300032": 0.9460293790646894, "test/sim_max_reward_4300033": 0.9791475337740425, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.44352213666142437, "test/sim_max_reward_4300036": 0.20730390367851434, "test/sim_max_reward_4300037": 0.9372942221235686, "test/sim_max_reward_4300038": 0.9358500463943746, "test/sim_max_reward_4300039": 0.534245103653495, "test/sim_max_reward_4300040": 0.858817708782757, "test/sim_max_reward_4300041": 0.9355208632837929, "test/sim_max_reward_4300042": 0.9614178619674373, "test/sim_max_reward_4300043": 0.12142079123759829, "test/sim_max_reward_4300044": 0.7578392012744629, "test/sim_max_reward_4300045": 0.945593475894246, "test/sim_max_reward_4300046": 0.11797813880366959, "test/sim_max_reward_4300047": 1.0, "test/sim_max_reward_4300048": 0.2932547263883613, "test/sim_max_reward_4300049": 3.0594255423669716e-09, "train/mean_score": 0.8335981645095818, "test/mean_score": 0.633300780754588, "val_loss": 62539.42578125} {"train_loss": -6.153744697570801, "global_step": 84042, "epoch": 2001} {"train_loss": -6.201759338378906, "global_step": 84043, "epoch": 2001} {"train_loss": -6.166308403015137, "global_step": 84044, "epoch": 2001} {"train_loss": -6.277883529663086, "global_step": 84045, "epoch": 2001} {"train_loss": -6.225375652313232, "global_step": 84046, "epoch": 2001} {"train_loss": -6.269342422485352, "global_step": 84047, "epoch": 2001} {"train_loss": -6.144132614135742, "global_step": 84048, "epoch": 2001} {"train_loss": -6.169668197631836, "global_step": 84049, "epoch": 2001} {"train_loss": -6.2588911056518555, "global_step": 84050, "epoch": 2001} {"train_loss": -6.273382186889648, "global_step": 84051, "epoch": 2001} {"train_loss": -6.271245002746582, "global_step": 84052, "epoch": 2001} {"train_loss": -6.20950174331665, "global_step": 84053, "epoch": 2001} {"train_loss": -6.288030624389648, "global_step": 84054, "epoch": 2001} {"train_loss": -6.222318649291992, "global_step": 84055, "epoch": 2001} {"train_loss": -6.181709289550781, "global_step": 84056, "epoch": 2001} {"train_loss": -6.168695449829102, "global_step": 84057, "epoch": 2001} {"train_loss": -6.202192306518555, "global_step": 84058, "epoch": 2001} {"train_loss": -6.285050868988037, "global_step": 84059, "epoch": 2001} {"train_loss": -6.227362632751465, "global_step": 84060, "epoch": 2001} {"train_loss": -6.149561882019043, "global_step": 84061, "epoch": 2001} {"train_loss": -6.207370758056641, "global_step": 84062, "epoch": 2001} {"train_loss": -6.1852264404296875, "global_step": 84063, "epoch": 2001} {"train_loss": -6.049251556396484, "global_step": 84064, "epoch": 2001} {"train_loss": -6.240044593811035, "global_step": 84065, "epoch": 2001} {"train_loss": -6.137991905212402, "global_step": 84066, "epoch": 2001} {"train_loss": -6.144285202026367, "global_step": 84067, "epoch": 2001} {"train_loss": -6.216531753540039, "global_step": 84068, "epoch": 2001} {"train_loss": -6.236558437347412, "global_step": 84069, "epoch": 2001} {"train_loss": -6.188202857971191, "global_step": 84070, "epoch": 2001} {"train_loss": -6.154180526733398, "global_step": 84071, "epoch": 2001} {"train_loss": -6.1547088623046875, "global_step": 84072, "epoch": 2001} {"train_loss": -6.303616523742676, "global_step": 84073, "epoch": 2001} {"train_loss": -6.186560153961182, "global_step": 84074, "epoch": 2001} {"train_loss": -6.254648685455322, "global_step": 84075, "epoch": 2001} {"train_loss": -6.140145301818848, "global_step": 84076, "epoch": 2001} {"train_loss": -6.202362060546875, "global_step": 84077, "epoch": 2001} {"train_loss": -6.164698600769043, "global_step": 84078, "epoch": 2001} {"train_loss": -6.2025957107543945, "global_step": 84079, "epoch": 2001} {"train_loss": -6.207720756530762, "global_step": 84080, "epoch": 2001} {"train_loss": -6.133936882019043, "global_step": 84081, "epoch": 2001} {"train_loss": -6.245155334472656, "global_step": 84082, "epoch": 2001} {"train_loss": -6.2052787485576815, "global_step": 84083, "epoch": 2001, "val_loss": 62635.890625} {"train_loss": -6.2257981300354, "global_step": 84084, "epoch": 2002} {"train_loss": -6.185611724853516, "global_step": 84085, "epoch": 2002} {"train_loss": -6.09249210357666, "global_step": 84086, "epoch": 2002} {"train_loss": -6.295049667358398, "global_step": 84087, "epoch": 2002} {"train_loss": -6.268822193145752, "global_step": 84088, "epoch": 2002} {"train_loss": -6.339632034301758, "global_step": 84089, "epoch": 2002} {"train_loss": -6.2494330406188965, "global_step": 84090, "epoch": 2002} {"train_loss": -6.227627754211426, "global_step": 84091, "epoch": 2002} {"train_loss": -6.209104537963867, "global_step": 84092, "epoch": 2002} {"train_loss": -6.13374662399292, "global_step": 84093, "epoch": 2002} {"train_loss": -6.331652641296387, "global_step": 84094, "epoch": 2002} {"train_loss": -6.284192085266113, "global_step": 84095, "epoch": 2002} {"train_loss": -6.2314453125, "global_step": 84096, "epoch": 2002} {"train_loss": -6.183284282684326, "global_step": 84097, "epoch": 2002} {"train_loss": -6.212296485900879, "global_step": 84098, "epoch": 2002} {"train_loss": -6.27639102935791, "global_step": 84099, "epoch": 2002} {"train_loss": -6.238212585449219, "global_step": 84100, "epoch": 2002} {"train_loss": -6.2972307205200195, "global_step": 84101, "epoch": 2002} {"train_loss": -6.314096450805664, "global_step": 84102, "epoch": 2002} {"train_loss": -6.177178382873535, "global_step": 84103, "epoch": 2002} {"train_loss": -6.0955119132995605, "global_step": 84104, "epoch": 2002} {"train_loss": -6.2183637619018555, "global_step": 84105, "epoch": 2002} {"train_loss": -6.112334728240967, "global_step": 84106, "epoch": 2002} {"train_loss": -6.1656060218811035, "global_step": 84107, "epoch": 2002} {"train_loss": -6.331421852111816, "global_step": 84108, "epoch": 2002} {"train_loss": -5.999543190002441, "global_step": 84109, "epoch": 2002} {"train_loss": -6.093591690063477, "global_step": 84110, "epoch": 2002} {"train_loss": -6.099307060241699, "global_step": 84111, "epoch": 2002} {"train_loss": -6.099081993103027, "global_step": 84112, "epoch": 2002} {"train_loss": -6.059144496917725, "global_step": 84113, "epoch": 2002} {"train_loss": -5.987085819244385, "global_step": 84114, "epoch": 2002} {"train_loss": -6.0723114013671875, "global_step": 84115, "epoch": 2002} {"train_loss": -6.145281791687012, "global_step": 84116, "epoch": 2002} {"train_loss": -6.061056613922119, "global_step": 84117, "epoch": 2002} {"train_loss": -6.217409133911133, "global_step": 84118, "epoch": 2002} {"train_loss": -6.0817341804504395, "global_step": 84119, "epoch": 2002} {"train_loss": -6.116332530975342, "global_step": 84120, "epoch": 2002} {"train_loss": -6.081288814544678, "global_step": 84121, "epoch": 2002} {"train_loss": -6.109847068786621, "global_step": 84122, "epoch": 2002} {"train_loss": -6.06932258605957, "global_step": 84123, "epoch": 2002} {"train_loss": -6.0089006423950195, "global_step": 84124, "epoch": 2002} {"train_loss": -6.169657605034964, "global_step": 84125, "epoch": 2002, "val_loss": 63051.78125} {"train_loss": -6.095652103424072, "global_step": 84126, "epoch": 2003} {"train_loss": -6.200747013092041, "global_step": 84127, "epoch": 2003} {"train_loss": -5.975934028625488, "global_step": 84128, "epoch": 2003} {"train_loss": -6.13272762298584, "global_step": 84129, "epoch": 2003} {"train_loss": -6.020681381225586, "global_step": 84130, "epoch": 2003} {"train_loss": -6.148845672607422, "global_step": 84131, "epoch": 2003} {"train_loss": -6.106644630432129, "global_step": 84132, "epoch": 2003} {"train_loss": -6.109366416931152, "global_step": 84133, "epoch": 2003} {"train_loss": -6.122683525085449, "global_step": 84134, "epoch": 2003} {"train_loss": -6.218273162841797, "global_step": 84135, "epoch": 2003} {"train_loss": -6.213565826416016, "global_step": 84136, "epoch": 2003} {"train_loss": -6.222193717956543, "global_step": 84137, "epoch": 2003} {"train_loss": -6.12773323059082, "global_step": 84138, "epoch": 2003} {"train_loss": -6.216972827911377, "global_step": 84139, "epoch": 2003} {"train_loss": -6.155157089233398, "global_step": 84140, "epoch": 2003} {"train_loss": -6.094498634338379, "global_step": 84141, "epoch": 2003} {"train_loss": -6.181962013244629, "global_step": 84142, "epoch": 2003} {"train_loss": -6.173366546630859, "global_step": 84143, "epoch": 2003} {"train_loss": -6.046447277069092, "global_step": 84144, "epoch": 2003} {"train_loss": -6.151080131530762, "global_step": 84145, "epoch": 2003} {"train_loss": -6.210911273956299, "global_step": 84146, "epoch": 2003} {"train_loss": -6.103034973144531, "global_step": 84147, "epoch": 2003} {"train_loss": -6.165162563323975, "global_step": 84148, "epoch": 2003} {"train_loss": -6.192998886108398, "global_step": 84149, "epoch": 2003} {"train_loss": -6.106658935546875, "global_step": 84150, "epoch": 2003} {"train_loss": -6.074218273162842, "global_step": 84151, "epoch": 2003} {"train_loss": -6.2228899002075195, "global_step": 84152, "epoch": 2003} {"train_loss": -6.251433849334717, "global_step": 84153, "epoch": 2003} {"train_loss": -6.136853218078613, "global_step": 84154, "epoch": 2003} {"train_loss": -6.159639835357666, "global_step": 84155, "epoch": 2003} {"train_loss": -6.168773651123047, "global_step": 84156, "epoch": 2003} {"train_loss": -6.184736728668213, "global_step": 84157, "epoch": 2003} {"train_loss": -6.070062160491943, "global_step": 84158, "epoch": 2003} {"train_loss": -6.105134963989258, "global_step": 84159, "epoch": 2003} {"train_loss": -6.313248634338379, "global_step": 84160, "epoch": 2003} {"train_loss": -6.161264419555664, "global_step": 84161, "epoch": 2003} {"train_loss": -6.212202548980713, "global_step": 84162, "epoch": 2003} {"train_loss": -6.188969612121582, "global_step": 84163, "epoch": 2003} {"train_loss": -6.145988941192627, "global_step": 84164, "epoch": 2003} {"train_loss": -6.156228065490723, "global_step": 84165, "epoch": 2003} {"train_loss": -6.167430877685547, "global_step": 84166, "epoch": 2003} {"train_loss": -6.151477643421718, "global_step": 84167, "epoch": 2003, "val_loss": 62733.4453125} {"train_loss": -6.221134662628174, "global_step": 84168, "epoch": 2004} {"train_loss": -6.277108192443848, "global_step": 84169, "epoch": 2004} {"train_loss": -6.239898681640625, "global_step": 84170, "epoch": 2004} {"train_loss": -6.168233871459961, "global_step": 84171, "epoch": 2004} {"train_loss": -6.129734039306641, "global_step": 84172, "epoch": 2004} {"train_loss": -6.1958794593811035, "global_step": 84173, "epoch": 2004} {"train_loss": -6.282363414764404, "global_step": 84174, "epoch": 2004} {"train_loss": -6.236082077026367, "global_step": 84175, "epoch": 2004} {"train_loss": -6.162968635559082, "global_step": 84176, "epoch": 2004} {"train_loss": -6.247838497161865, "global_step": 84177, "epoch": 2004} {"train_loss": -6.267704010009766, "global_step": 84178, "epoch": 2004} {"train_loss": -6.2232255935668945, "global_step": 84179, "epoch": 2004} {"train_loss": -6.168679237365723, "global_step": 84180, "epoch": 2004} {"train_loss": -6.256328582763672, "global_step": 84181, "epoch": 2004} {"train_loss": -6.206615924835205, "global_step": 84182, "epoch": 2004} {"train_loss": -6.257123947143555, "global_step": 84183, "epoch": 2004} {"train_loss": -6.290087699890137, "global_step": 84184, "epoch": 2004} {"train_loss": -6.306041717529297, "global_step": 84185, "epoch": 2004} {"train_loss": -6.093109607696533, "global_step": 84186, "epoch": 2004} {"train_loss": -6.233623504638672, "global_step": 84187, "epoch": 2004} {"train_loss": -6.033398151397705, "global_step": 84188, "epoch": 2004} {"train_loss": -6.083003044128418, "global_step": 84189, "epoch": 2004} {"train_loss": -6.201043128967285, "global_step": 84190, "epoch": 2004} {"train_loss": -6.2533416748046875, "global_step": 84191, "epoch": 2004} {"train_loss": -6.127467632293701, "global_step": 84192, "epoch": 2004} {"train_loss": -6.0976433753967285, "global_step": 84193, "epoch": 2004} {"train_loss": -6.169754981994629, "global_step": 84194, "epoch": 2004} {"train_loss": -6.264230251312256, "global_step": 84195, "epoch": 2004} {"train_loss": -6.242042541503906, "global_step": 84196, "epoch": 2004} {"train_loss": -6.09938907623291, "global_step": 84197, "epoch": 2004} {"train_loss": -6.18876838684082, "global_step": 84198, "epoch": 2004} {"train_loss": -6.2348151206970215, "global_step": 84199, "epoch": 2004} {"train_loss": -6.207149505615234, "global_step": 84200, "epoch": 2004} {"train_loss": -6.253050804138184, "global_step": 84201, "epoch": 2004} {"train_loss": -6.190046787261963, "global_step": 84202, "epoch": 2004} {"train_loss": -6.174333095550537, "global_step": 84203, "epoch": 2004} {"train_loss": -6.171609878540039, "global_step": 84204, "epoch": 2004} {"train_loss": -6.269739151000977, "global_step": 84205, "epoch": 2004} {"train_loss": -6.282083511352539, "global_step": 84206, "epoch": 2004} {"train_loss": -6.137775421142578, "global_step": 84207, "epoch": 2004} {"train_loss": -6.328582763671875, "global_step": 84208, "epoch": 2004} {"train_loss": -6.204012280418759, "global_step": 84209, "epoch": 2004, "val_loss": 62499.33984375} {"train_loss": -6.202126502990723, "global_step": 84210, "epoch": 2005} {"train_loss": -6.18088436126709, "global_step": 84211, "epoch": 2005} {"train_loss": -6.26249361038208, "global_step": 84212, "epoch": 2005} {"train_loss": -6.381706237792969, "global_step": 84213, "epoch": 2005} {"train_loss": -6.246936798095703, "global_step": 84214, "epoch": 2005} {"train_loss": -6.302331924438477, "global_step": 84215, "epoch": 2005} {"train_loss": -6.207060813903809, "global_step": 84216, "epoch": 2005} {"train_loss": -6.167141437530518, "global_step": 84217, "epoch": 2005} {"train_loss": -6.203902721405029, "global_step": 84218, "epoch": 2005} {"train_loss": -6.20217227935791, "global_step": 84219, "epoch": 2005} {"train_loss": -6.359040260314941, "global_step": 84220, "epoch": 2005} {"train_loss": -6.200865745544434, "global_step": 84221, "epoch": 2005} {"train_loss": -6.17250919342041, "global_step": 84222, "epoch": 2005} {"train_loss": -6.263700485229492, "global_step": 84223, "epoch": 2005} {"train_loss": -6.097296714782715, "global_step": 84224, "epoch": 2005} {"train_loss": -6.142163276672363, "global_step": 84225, "epoch": 2005} {"train_loss": -6.168001174926758, "global_step": 84226, "epoch": 2005} {"train_loss": -6.120638847351074, "global_step": 84227, "epoch": 2005} {"train_loss": -6.242701530456543, "global_step": 84228, "epoch": 2005} {"train_loss": -6.247458457946777, "global_step": 84229, "epoch": 2005} {"train_loss": -6.023453712463379, "global_step": 84230, "epoch": 2005} {"train_loss": -6.199950218200684, "global_step": 84231, "epoch": 2005} {"train_loss": -6.33372688293457, "global_step": 84232, "epoch": 2005} {"train_loss": -6.169625282287598, "global_step": 84233, "epoch": 2005} {"train_loss": -6.094041347503662, "global_step": 84234, "epoch": 2005} {"train_loss": -6.271271228790283, "global_step": 84235, "epoch": 2005} {"train_loss": -6.113984107971191, "global_step": 84236, "epoch": 2005} {"train_loss": -6.244892597198486, "global_step": 84237, "epoch": 2005} {"train_loss": -6.2065935134887695, "global_step": 84238, "epoch": 2005} {"train_loss": -6.168728351593018, "global_step": 84239, "epoch": 2005} {"train_loss": -6.161616802215576, "global_step": 84240, "epoch": 2005} {"train_loss": -6.215733528137207, "global_step": 84241, "epoch": 2005} {"train_loss": -6.171725273132324, "global_step": 84242, "epoch": 2005} {"train_loss": -6.161731719970703, "global_step": 84243, "epoch": 2005} {"train_loss": -6.212804794311523, "global_step": 84244, "epoch": 2005} {"train_loss": -6.186836242675781, "global_step": 84245, "epoch": 2005} {"train_loss": -6.168096542358398, "global_step": 84246, "epoch": 2005} {"train_loss": -6.130908966064453, "global_step": 84247, "epoch": 2005} {"train_loss": -6.127623081207275, "global_step": 84248, "epoch": 2005} {"train_loss": -6.233609199523926, "global_step": 84249, "epoch": 2005} {"train_loss": -6.046950817108154, "global_step": 84250, "epoch": 2005} {"train_loss": -6.194943371273222, "global_step": 84251, "epoch": 2005, "val_loss": 62720.24609375} {"train_loss": -6.0365753173828125, "global_step": 84252, "epoch": 2006} {"train_loss": -6.126190185546875, "global_step": 84253, "epoch": 2006} {"train_loss": -6.071052074432373, "global_step": 84254, "epoch": 2006} {"train_loss": -6.2162652015686035, "global_step": 84255, "epoch": 2006} {"train_loss": -6.1609344482421875, "global_step": 84256, "epoch": 2006} {"train_loss": -6.170732498168945, "global_step": 84257, "epoch": 2006} {"train_loss": -6.168147087097168, "global_step": 84258, "epoch": 2006} {"train_loss": -6.187943458557129, "global_step": 84259, "epoch": 2006} {"train_loss": -6.0800371170043945, "global_step": 84260, "epoch": 2006} {"train_loss": -6.209716796875, "global_step": 84261, "epoch": 2006} {"train_loss": -6.307360649108887, "global_step": 84262, "epoch": 2006} {"train_loss": -6.1717705726623535, "global_step": 84263, "epoch": 2006} {"train_loss": -6.290260314941406, "global_step": 84264, "epoch": 2006} {"train_loss": -6.256861209869385, "global_step": 84265, "epoch": 2006} {"train_loss": -6.148560523986816, "global_step": 84266, "epoch": 2006} {"train_loss": -6.311250686645508, "global_step": 84267, "epoch": 2006} {"train_loss": -6.076355457305908, "global_step": 84268, "epoch": 2006} {"train_loss": -6.184584617614746, "global_step": 84269, "epoch": 2006} {"train_loss": -6.0980544090271, "global_step": 84270, "epoch": 2006} {"train_loss": -6.159830093383789, "global_step": 84271, "epoch": 2006} {"train_loss": -6.1759490966796875, "global_step": 84272, "epoch": 2006} {"train_loss": -6.310246467590332, "global_step": 84273, "epoch": 2006} {"train_loss": -6.1893310546875, "global_step": 84274, "epoch": 2006} {"train_loss": -6.270756244659424, "global_step": 84275, "epoch": 2006} {"train_loss": -6.135746002197266, "global_step": 84276, "epoch": 2006} {"train_loss": -6.224300384521484, "global_step": 84277, "epoch": 2006} {"train_loss": -6.22702693939209, "global_step": 84278, "epoch": 2006} {"train_loss": -6.31019926071167, "global_step": 84279, "epoch": 2006} {"train_loss": -6.253836631774902, "global_step": 84280, "epoch": 2006} {"train_loss": -6.224815368652344, "global_step": 84281, "epoch": 2006} {"train_loss": -6.196033954620361, "global_step": 84282, "epoch": 2006} {"train_loss": -6.184318542480469, "global_step": 84283, "epoch": 2006} {"train_loss": -6.15250301361084, "global_step": 84284, "epoch": 2006} {"train_loss": -6.286639213562012, "global_step": 84285, "epoch": 2006} {"train_loss": -6.275659084320068, "global_step": 84286, "epoch": 2006} {"train_loss": -6.190134525299072, "global_step": 84287, "epoch": 2006} {"train_loss": -6.247864723205566, "global_step": 84288, "epoch": 2006} {"train_loss": -6.078804016113281, "global_step": 84289, "epoch": 2006} {"train_loss": -6.092072010040283, "global_step": 84290, "epoch": 2006} {"train_loss": -6.2507195472717285, "global_step": 84291, "epoch": 2006} {"train_loss": -6.227982997894287, "global_step": 84292, "epoch": 2006} {"train_loss": -6.196889536721366, "global_step": 84293, "epoch": 2006, "val_loss": 62571.7734375} {"train_loss": -6.210256576538086, "global_step": 84294, "epoch": 2007} {"train_loss": -6.244022369384766, "global_step": 84295, "epoch": 2007} {"train_loss": -6.2103424072265625, "global_step": 84296, "epoch": 2007} {"train_loss": -6.140562534332275, "global_step": 84297, "epoch": 2007} {"train_loss": -6.20900821685791, "global_step": 84298, "epoch": 2007} {"train_loss": -6.166838645935059, "global_step": 84299, "epoch": 2007} {"train_loss": -6.246218681335449, "global_step": 84300, "epoch": 2007} {"train_loss": -6.24166202545166, "global_step": 84301, "epoch": 2007} {"train_loss": -6.217454433441162, "global_step": 84302, "epoch": 2007} {"train_loss": -6.1866631507873535, "global_step": 84303, "epoch": 2007} {"train_loss": -6.210365295410156, "global_step": 84304, "epoch": 2007} {"train_loss": -6.1733903884887695, "global_step": 84305, "epoch": 2007} {"train_loss": -6.239812850952148, "global_step": 84306, "epoch": 2007} {"train_loss": -6.186656951904297, "global_step": 84307, "epoch": 2007} {"train_loss": -6.36102819442749, "global_step": 84308, "epoch": 2007} {"train_loss": -6.248712062835693, "global_step": 84309, "epoch": 2007} {"train_loss": -6.222500801086426, "global_step": 84310, "epoch": 2007} {"train_loss": -6.206270217895508, "global_step": 84311, "epoch": 2007} {"train_loss": -6.226779937744141, "global_step": 84312, "epoch": 2007} {"train_loss": -6.134328842163086, "global_step": 84313, "epoch": 2007} {"train_loss": -6.15750789642334, "global_step": 84314, "epoch": 2007} {"train_loss": -6.316774368286133, "global_step": 84315, "epoch": 2007} {"train_loss": -6.183568954467773, "global_step": 84316, "epoch": 2007} {"train_loss": -6.131609916687012, "global_step": 84317, "epoch": 2007} {"train_loss": -6.14873743057251, "global_step": 84318, "epoch": 2007} {"train_loss": -6.206602096557617, "global_step": 84319, "epoch": 2007} {"train_loss": -6.159002304077148, "global_step": 84320, "epoch": 2007} {"train_loss": -6.213835716247559, "global_step": 84321, "epoch": 2007} {"train_loss": -6.170899391174316, "global_step": 84322, "epoch": 2007} {"train_loss": -6.2304887771606445, "global_step": 84323, "epoch": 2007} {"train_loss": -6.109535217285156, "global_step": 84324, "epoch": 2007} {"train_loss": -6.164600372314453, "global_step": 84325, "epoch": 2007} {"train_loss": -6.075005531311035, "global_step": 84326, "epoch": 2007} {"train_loss": -6.196361064910889, "global_step": 84327, "epoch": 2007} {"train_loss": -6.144049644470215, "global_step": 84328, "epoch": 2007} {"train_loss": -6.2828779220581055, "global_step": 84329, "epoch": 2007} {"train_loss": -6.1742377281188965, "global_step": 84330, "epoch": 2007} {"train_loss": -6.201279640197754, "global_step": 84331, "epoch": 2007} {"train_loss": -6.221787452697754, "global_step": 84332, "epoch": 2007} {"train_loss": -6.1621928215026855, "global_step": 84333, "epoch": 2007} {"train_loss": -6.288417816162109, "global_step": 84334, "epoch": 2007} {"train_loss": -6.2002699715750555, "global_step": 84335, "epoch": 2007, "val_loss": 62766.4375} {"train_loss": -6.1790571212768555, "global_step": 84336, "epoch": 2008} {"train_loss": -6.312934398651123, "global_step": 84337, "epoch": 2008} {"train_loss": -6.176445007324219, "global_step": 84338, "epoch": 2008} {"train_loss": -6.177469730377197, "global_step": 84339, "epoch": 2008} {"train_loss": -6.20690393447876, "global_step": 84340, "epoch": 2008} {"train_loss": -6.222473621368408, "global_step": 84341, "epoch": 2008} {"train_loss": -6.2241716384887695, "global_step": 84342, "epoch": 2008} {"train_loss": -6.228614807128906, "global_step": 84343, "epoch": 2008} {"train_loss": -6.1616621017456055, "global_step": 84344, "epoch": 2008} {"train_loss": -6.1578049659729, "global_step": 84345, "epoch": 2008} {"train_loss": -6.343944072723389, "global_step": 84346, "epoch": 2008} {"train_loss": -6.341904640197754, "global_step": 84347, "epoch": 2008} {"train_loss": -6.243446350097656, "global_step": 84348, "epoch": 2008} {"train_loss": -6.263589382171631, "global_step": 84349, "epoch": 2008} {"train_loss": -6.241639137268066, "global_step": 84350, "epoch": 2008} {"train_loss": -6.123381614685059, "global_step": 84351, "epoch": 2008} {"train_loss": -6.197933197021484, "global_step": 84352, "epoch": 2008} {"train_loss": -6.11583137512207, "global_step": 84353, "epoch": 2008} {"train_loss": -6.132687568664551, "global_step": 84354, "epoch": 2008} {"train_loss": -6.132463455200195, "global_step": 84355, "epoch": 2008} {"train_loss": -6.10040283203125, "global_step": 84356, "epoch": 2008} {"train_loss": -6.174171447753906, "global_step": 84357, "epoch": 2008} {"train_loss": -6.171186447143555, "global_step": 84358, "epoch": 2008} {"train_loss": -6.093290328979492, "global_step": 84359, "epoch": 2008} {"train_loss": -6.285573482513428, "global_step": 84360, "epoch": 2008} {"train_loss": -6.098978042602539, "global_step": 84361, "epoch": 2008} {"train_loss": -6.036715984344482, "global_step": 84362, "epoch": 2008} {"train_loss": -6.187494277954102, "global_step": 84363, "epoch": 2008} {"train_loss": -6.190273761749268, "global_step": 84364, "epoch": 2008} {"train_loss": -6.123592376708984, "global_step": 84365, "epoch": 2008} {"train_loss": -6.036314010620117, "global_step": 84366, "epoch": 2008} {"train_loss": -6.220191955566406, "global_step": 84367, "epoch": 2008} {"train_loss": -6.225955009460449, "global_step": 84368, "epoch": 2008} {"train_loss": -6.182371616363525, "global_step": 84369, "epoch": 2008} {"train_loss": -6.221793174743652, "global_step": 84370, "epoch": 2008} {"train_loss": -6.161581993103027, "global_step": 84371, "epoch": 2008} {"train_loss": -6.207157135009766, "global_step": 84372, "epoch": 2008} {"train_loss": -6.208812713623047, "global_step": 84373, "epoch": 2008} {"train_loss": -6.227166652679443, "global_step": 84374, "epoch": 2008} {"train_loss": -6.095405101776123, "global_step": 84375, "epoch": 2008} {"train_loss": -6.273220539093018, "global_step": 84376, "epoch": 2008} {"train_loss": -6.189268543606713, "global_step": 84377, "epoch": 2008, "val_loss": 62731.74609375} {"train_loss": -6.12786865234375, "global_step": 84378, "epoch": 2009} {"train_loss": -6.138497352600098, "global_step": 84379, "epoch": 2009} {"train_loss": -6.187690258026123, "global_step": 84380, "epoch": 2009} {"train_loss": -6.20058012008667, "global_step": 84381, "epoch": 2009} {"train_loss": -6.196027755737305, "global_step": 84382, "epoch": 2009} {"train_loss": -6.240285873413086, "global_step": 84383, "epoch": 2009} {"train_loss": -6.231561660766602, "global_step": 84384, "epoch": 2009} {"train_loss": -6.047516822814941, "global_step": 84385, "epoch": 2009} {"train_loss": -6.146080017089844, "global_step": 84386, "epoch": 2009} {"train_loss": -6.239799976348877, "global_step": 84387, "epoch": 2009} {"train_loss": -6.345241546630859, "global_step": 84388, "epoch": 2009} {"train_loss": -6.174163818359375, "global_step": 84389, "epoch": 2009} {"train_loss": -6.134150505065918, "global_step": 84390, "epoch": 2009} {"train_loss": -6.121150016784668, "global_step": 84391, "epoch": 2009} {"train_loss": -6.2043986320495605, "global_step": 84392, "epoch": 2009} {"train_loss": -6.224785327911377, "global_step": 84393, "epoch": 2009} {"train_loss": -6.235315322875977, "global_step": 84394, "epoch": 2009} {"train_loss": -6.278541088104248, "global_step": 84395, "epoch": 2009} {"train_loss": -6.192844390869141, "global_step": 84396, "epoch": 2009} {"train_loss": -6.244333744049072, "global_step": 84397, "epoch": 2009} {"train_loss": -6.2835893630981445, "global_step": 84398, "epoch": 2009} {"train_loss": -6.173277854919434, "global_step": 84399, "epoch": 2009} {"train_loss": -6.1303205490112305, "global_step": 84400, "epoch": 2009} {"train_loss": -6.173094749450684, "global_step": 84401, "epoch": 2009} {"train_loss": -6.084184646606445, "global_step": 84402, "epoch": 2009} {"train_loss": -6.291439533233643, "global_step": 84403, "epoch": 2009} {"train_loss": -6.151689529418945, "global_step": 84404, "epoch": 2009} {"train_loss": -6.0487518310546875, "global_step": 84405, "epoch": 2009} {"train_loss": -6.266287326812744, "global_step": 84406, "epoch": 2009} {"train_loss": -6.001745700836182, "global_step": 84407, "epoch": 2009} {"train_loss": -6.142520904541016, "global_step": 84408, "epoch": 2009} {"train_loss": -6.007053852081299, "global_step": 84409, "epoch": 2009} {"train_loss": -6.049531936645508, "global_step": 84410, "epoch": 2009} {"train_loss": -6.090865612030029, "global_step": 84411, "epoch": 2009} {"train_loss": -6.158608913421631, "global_step": 84412, "epoch": 2009} {"train_loss": -6.243816375732422, "global_step": 84413, "epoch": 2009} {"train_loss": -6.255731582641602, "global_step": 84414, "epoch": 2009} {"train_loss": -6.101683616638184, "global_step": 84415, "epoch": 2009} {"train_loss": -6.159323692321777, "global_step": 84416, "epoch": 2009} {"train_loss": -6.127203941345215, "global_step": 84417, "epoch": 2009} {"train_loss": -6.107482433319092, "global_step": 84418, "epoch": 2009} {"train_loss": -6.169074421837216, "global_step": 84419, "epoch": 2009, "val_loss": 62605.41796875} {"train_loss": -6.229754447937012, "global_step": 84420, "epoch": 2010} {"train_loss": -6.160268306732178, "global_step": 84421, "epoch": 2010} {"train_loss": -6.179149627685547, "global_step": 84422, "epoch": 2010} {"train_loss": -6.243541717529297, "global_step": 84423, "epoch": 2010} {"train_loss": -6.161670684814453, "global_step": 84424, "epoch": 2010} {"train_loss": -6.097605228424072, "global_step": 84425, "epoch": 2010} {"train_loss": -6.151528358459473, "global_step": 84426, "epoch": 2010} {"train_loss": -6.147186279296875, "global_step": 84427, "epoch": 2010} {"train_loss": -6.166352272033691, "global_step": 84428, "epoch": 2010} {"train_loss": -6.170969486236572, "global_step": 84429, "epoch": 2010} {"train_loss": -6.234316825866699, "global_step": 84430, "epoch": 2010} {"train_loss": -6.1675705909729, "global_step": 84431, "epoch": 2010} {"train_loss": -6.202611923217773, "global_step": 84432, "epoch": 2010} {"train_loss": -6.163339614868164, "global_step": 84433, "epoch": 2010} {"train_loss": -6.189786911010742, "global_step": 84434, "epoch": 2010} {"train_loss": -6.282050132751465, "global_step": 84435, "epoch": 2010} {"train_loss": -6.14154052734375, "global_step": 84436, "epoch": 2010} {"train_loss": -6.160578727722168, "global_step": 84437, "epoch": 2010} {"train_loss": -6.228274345397949, "global_step": 84438, "epoch": 2010} {"train_loss": -6.199773788452148, "global_step": 84439, "epoch": 2010} {"train_loss": -6.280270576477051, "global_step": 84440, "epoch": 2010} {"train_loss": -6.201159954071045, "global_step": 84441, "epoch": 2010} {"train_loss": -6.243474006652832, "global_step": 84442, "epoch": 2010} {"train_loss": -6.19783878326416, "global_step": 84443, "epoch": 2010} {"train_loss": -6.3015265464782715, "global_step": 84444, "epoch": 2010} {"train_loss": -6.250985622406006, "global_step": 84445, "epoch": 2010} {"train_loss": -6.102447509765625, "global_step": 84446, "epoch": 2010} {"train_loss": -6.293462753295898, "global_step": 84447, "epoch": 2010} {"train_loss": -6.168531894683838, "global_step": 84448, "epoch": 2010} {"train_loss": -6.196144104003906, "global_step": 84449, "epoch": 2010} {"train_loss": -6.214394569396973, "global_step": 84450, "epoch": 2010} {"train_loss": -6.1428914070129395, "global_step": 84451, "epoch": 2010} {"train_loss": -6.033873081207275, "global_step": 84452, "epoch": 2010} {"train_loss": -6.20357608795166, "global_step": 84453, "epoch": 2010} {"train_loss": -6.06302547454834, "global_step": 84454, "epoch": 2010} {"train_loss": -5.981484413146973, "global_step": 84455, "epoch": 2010} {"train_loss": -6.132161617279053, "global_step": 84456, "epoch": 2010} {"train_loss": -5.9994940757751465, "global_step": 84457, "epoch": 2010} {"train_loss": -6.271607398986816, "global_step": 84458, "epoch": 2010} {"train_loss": -6.132320880889893, "global_step": 84459, "epoch": 2010} {"train_loss": -6.196707725524902, "global_step": 84460, "epoch": 2010} {"train_loss": -6.174418472108387, "global_step": 84461, "epoch": 2010, "val_loss": 62540.5} {"train_loss": -6.206460952758789, "global_step": 84462, "epoch": 2011} {"train_loss": -6.1015119552612305, "global_step": 84463, "epoch": 2011} {"train_loss": -6.0476531982421875, "global_step": 84464, "epoch": 2011} {"train_loss": -6.178593635559082, "global_step": 84465, "epoch": 2011} {"train_loss": -6.170336723327637, "global_step": 84466, "epoch": 2011} {"train_loss": -6.168831825256348, "global_step": 84467, "epoch": 2011} {"train_loss": -6.116757392883301, "global_step": 84468, "epoch": 2011} {"train_loss": -6.238358974456787, "global_step": 84469, "epoch": 2011} {"train_loss": -6.149931907653809, "global_step": 84470, "epoch": 2011} {"train_loss": -6.1207427978515625, "global_step": 84471, "epoch": 2011} {"train_loss": -6.188689231872559, "global_step": 84472, "epoch": 2011} {"train_loss": -6.220383644104004, "global_step": 84473, "epoch": 2011} {"train_loss": -6.113079071044922, "global_step": 84474, "epoch": 2011} {"train_loss": -6.292516708374023, "global_step": 84475, "epoch": 2011} {"train_loss": -6.0510358810424805, "global_step": 84476, "epoch": 2011} {"train_loss": -6.178533554077148, "global_step": 84477, "epoch": 2011} {"train_loss": -6.15103006362915, "global_step": 84478, "epoch": 2011} {"train_loss": -6.050689220428467, "global_step": 84479, "epoch": 2011} {"train_loss": -6.060439586639404, "global_step": 84480, "epoch": 2011} {"train_loss": -6.1674981117248535, "global_step": 84481, "epoch": 2011} {"train_loss": -6.21612548828125, "global_step": 84482, "epoch": 2011} {"train_loss": -6.132157325744629, "global_step": 84483, "epoch": 2011} {"train_loss": -6.174675941467285, "global_step": 84484, "epoch": 2011} {"train_loss": -6.197020530700684, "global_step": 84485, "epoch": 2011} {"train_loss": -6.1817626953125, "global_step": 84486, "epoch": 2011} {"train_loss": -6.136824607849121, "global_step": 84487, "epoch": 2011} {"train_loss": -6.172812461853027, "global_step": 84488, "epoch": 2011} {"train_loss": -6.305293083190918, "global_step": 84489, "epoch": 2011} {"train_loss": -6.1675615310668945, "global_step": 84490, "epoch": 2011} {"train_loss": -6.336272239685059, "global_step": 84491, "epoch": 2011} {"train_loss": -6.267810344696045, "global_step": 84492, "epoch": 2011} {"train_loss": -6.2339887619018555, "global_step": 84493, "epoch": 2011} {"train_loss": -6.264996528625488, "global_step": 84494, "epoch": 2011} {"train_loss": -6.147578239440918, "global_step": 84495, "epoch": 2011} {"train_loss": -6.10251522064209, "global_step": 84496, "epoch": 2011} {"train_loss": -6.231071472167969, "global_step": 84497, "epoch": 2011} {"train_loss": -6.153456211090088, "global_step": 84498, "epoch": 2011} {"train_loss": -6.042898654937744, "global_step": 84499, "epoch": 2011} {"train_loss": -6.139996528625488, "global_step": 84500, "epoch": 2011} {"train_loss": -6.147939682006836, "global_step": 84501, "epoch": 2011} {"train_loss": -6.07951545715332, "global_step": 84502, "epoch": 2011} {"train_loss": -6.167279754366193, "global_step": 84503, "epoch": 2011, "val_loss": 62574.234375} {"train_loss": -6.1124958992004395, "global_step": 84504, "epoch": 2012} {"train_loss": -6.110123634338379, "global_step": 84505, "epoch": 2012} {"train_loss": -6.323916435241699, "global_step": 84506, "epoch": 2012} {"train_loss": -6.190371513366699, "global_step": 84507, "epoch": 2012} {"train_loss": -6.283761978149414, "global_step": 84508, "epoch": 2012} {"train_loss": -6.216705322265625, "global_step": 84509, "epoch": 2012} {"train_loss": -6.219283103942871, "global_step": 84510, "epoch": 2012} {"train_loss": -6.210935115814209, "global_step": 84511, "epoch": 2012} {"train_loss": -6.26829719543457, "global_step": 84512, "epoch": 2012} {"train_loss": -6.0859270095825195, "global_step": 84513, "epoch": 2012} {"train_loss": -6.157482147216797, "global_step": 84514, "epoch": 2012} {"train_loss": -6.277614593505859, "global_step": 84515, "epoch": 2012} {"train_loss": -6.101287841796875, "global_step": 84516, "epoch": 2012} {"train_loss": -6.143553733825684, "global_step": 84517, "epoch": 2012} {"train_loss": -6.1568732261657715, "global_step": 84518, "epoch": 2012} {"train_loss": -6.123255729675293, "global_step": 84519, "epoch": 2012} {"train_loss": -6.008528709411621, "global_step": 84520, "epoch": 2012} {"train_loss": -6.2109904289245605, "global_step": 84521, "epoch": 2012} {"train_loss": -6.244969367980957, "global_step": 84522, "epoch": 2012} {"train_loss": -6.196804046630859, "global_step": 84523, "epoch": 2012} {"train_loss": -6.217440128326416, "global_step": 84524, "epoch": 2012} {"train_loss": -6.099765300750732, "global_step": 84525, "epoch": 2012} {"train_loss": -6.187587261199951, "global_step": 84526, "epoch": 2012} {"train_loss": -6.240190505981445, "global_step": 84527, "epoch": 2012} {"train_loss": -6.182720184326172, "global_step": 84528, "epoch": 2012} {"train_loss": -6.173262119293213, "global_step": 84529, "epoch": 2012} {"train_loss": -6.271040916442871, "global_step": 84530, "epoch": 2012} {"train_loss": -6.184593200683594, "global_step": 84531, "epoch": 2012} {"train_loss": -6.228606224060059, "global_step": 84532, "epoch": 2012} {"train_loss": -6.26899528503418, "global_step": 84533, "epoch": 2012} {"train_loss": -6.173636436462402, "global_step": 84534, "epoch": 2012} {"train_loss": -6.099676132202148, "global_step": 84535, "epoch": 2012} {"train_loss": -6.249569892883301, "global_step": 84536, "epoch": 2012} {"train_loss": -6.100607872009277, "global_step": 84537, "epoch": 2012} {"train_loss": -6.230983734130859, "global_step": 84538, "epoch": 2012} {"train_loss": -6.228849411010742, "global_step": 84539, "epoch": 2012} {"train_loss": -6.122086524963379, "global_step": 84540, "epoch": 2012} {"train_loss": -6.233767032623291, "global_step": 84541, "epoch": 2012} {"train_loss": -6.187352180480957, "global_step": 84542, "epoch": 2012} {"train_loss": -6.226861953735352, "global_step": 84543, "epoch": 2012} {"train_loss": -6.382463455200195, "global_step": 84544, "epoch": 2012} {"train_loss": -6.192554723648798, "global_step": 84545, "epoch": 2012, "val_loss": 62735.7265625} {"train_loss": -6.164108753204346, "global_step": 84546, "epoch": 2013} {"train_loss": -6.2101240158081055, "global_step": 84547, "epoch": 2013} {"train_loss": -6.290781497955322, "global_step": 84548, "epoch": 2013} {"train_loss": -6.313021659851074, "global_step": 84549, "epoch": 2013} {"train_loss": -6.333015441894531, "global_step": 84550, "epoch": 2013} {"train_loss": -6.215143203735352, "global_step": 84551, "epoch": 2013} {"train_loss": -6.249734878540039, "global_step": 84552, "epoch": 2013} {"train_loss": -6.225162029266357, "global_step": 84553, "epoch": 2013} {"train_loss": -6.187002182006836, "global_step": 84554, "epoch": 2013} {"train_loss": -6.125884056091309, "global_step": 84555, "epoch": 2013} {"train_loss": -6.231470108032227, "global_step": 84556, "epoch": 2013} {"train_loss": -6.207973003387451, "global_step": 84557, "epoch": 2013} {"train_loss": -6.191298007965088, "global_step": 84558, "epoch": 2013} {"train_loss": -6.215048789978027, "global_step": 84559, "epoch": 2013} {"train_loss": -6.41273307800293, "global_step": 84560, "epoch": 2013} {"train_loss": -6.292030334472656, "global_step": 84561, "epoch": 2013} {"train_loss": -6.139533519744873, "global_step": 84562, "epoch": 2013} {"train_loss": -6.285408020019531, "global_step": 84563, "epoch": 2013} {"train_loss": -6.304802894592285, "global_step": 84564, "epoch": 2013} {"train_loss": -6.342065334320068, "global_step": 84565, "epoch": 2013} {"train_loss": -6.166210651397705, "global_step": 84566, "epoch": 2013} {"train_loss": -6.232479095458984, "global_step": 84567, "epoch": 2013} {"train_loss": -6.176380634307861, "global_step": 84568, "epoch": 2013} {"train_loss": -6.14154052734375, "global_step": 84569, "epoch": 2013} {"train_loss": -6.055382251739502, "global_step": 84570, "epoch": 2013} {"train_loss": -6.161638259887695, "global_step": 84571, "epoch": 2013} {"train_loss": -6.219903469085693, "global_step": 84572, "epoch": 2013} {"train_loss": -6.332898139953613, "global_step": 84573, "epoch": 2013} {"train_loss": -6.097590446472168, "global_step": 84574, "epoch": 2013} {"train_loss": -6.15015172958374, "global_step": 84575, "epoch": 2013} {"train_loss": -6.1584320068359375, "global_step": 84576, "epoch": 2013} {"train_loss": -6.062076568603516, "global_step": 84577, "epoch": 2013} {"train_loss": -6.097615718841553, "global_step": 84578, "epoch": 2013} {"train_loss": -6.140865325927734, "global_step": 84579, "epoch": 2013} {"train_loss": -6.136639595031738, "global_step": 84580, "epoch": 2013} {"train_loss": -6.126264572143555, "global_step": 84581, "epoch": 2013} {"train_loss": -6.051108360290527, "global_step": 84582, "epoch": 2013} {"train_loss": -6.047367095947266, "global_step": 84583, "epoch": 2013} {"train_loss": -6.205470561981201, "global_step": 84584, "epoch": 2013} {"train_loss": -6.233870029449463, "global_step": 84585, "epoch": 2013} {"train_loss": -6.093300819396973, "global_step": 84586, "epoch": 2013} {"train_loss": -6.19511942636399, "global_step": 84587, "epoch": 2013, "val_loss": 62857.84375} {"train_loss": -6.1611008644104, "global_step": 84588, "epoch": 2014} {"train_loss": -6.210366249084473, "global_step": 84589, "epoch": 2014} {"train_loss": -6.211402893066406, "global_step": 84590, "epoch": 2014} {"train_loss": -6.182900428771973, "global_step": 84591, "epoch": 2014} {"train_loss": -6.374566078186035, "global_step": 84592, "epoch": 2014} {"train_loss": -6.192110538482666, "global_step": 84593, "epoch": 2014} {"train_loss": -6.192771911621094, "global_step": 84594, "epoch": 2014} {"train_loss": -6.138700008392334, "global_step": 84595, "epoch": 2014} {"train_loss": -6.279224395751953, "global_step": 84596, "epoch": 2014} {"train_loss": -6.3196539878845215, "global_step": 84597, "epoch": 2014} {"train_loss": -6.160533905029297, "global_step": 84598, "epoch": 2014} {"train_loss": -6.258615016937256, "global_step": 84599, "epoch": 2014} {"train_loss": -6.229946136474609, "global_step": 84600, "epoch": 2014} {"train_loss": -6.283769607543945, "global_step": 84601, "epoch": 2014} {"train_loss": -6.085038185119629, "global_step": 84602, "epoch": 2014} {"train_loss": -6.242681503295898, "global_step": 84603, "epoch": 2014} {"train_loss": -6.314091682434082, "global_step": 84604, "epoch": 2014} {"train_loss": -6.200233459472656, "global_step": 84605, "epoch": 2014} {"train_loss": -6.141521453857422, "global_step": 84606, "epoch": 2014} {"train_loss": -6.1200270652771, "global_step": 84607, "epoch": 2014} {"train_loss": -6.168898582458496, "global_step": 84608, "epoch": 2014} {"train_loss": -6.190423011779785, "global_step": 84609, "epoch": 2014} {"train_loss": -6.256125450134277, "global_step": 84610, "epoch": 2014} {"train_loss": -6.20400333404541, "global_step": 84611, "epoch": 2014} {"train_loss": -6.247197151184082, "global_step": 84612, "epoch": 2014} {"train_loss": -6.189735412597656, "global_step": 84613, "epoch": 2014} {"train_loss": -6.190489768981934, "global_step": 84614, "epoch": 2014} {"train_loss": -6.165193557739258, "global_step": 84615, "epoch": 2014} {"train_loss": -6.1782965660095215, "global_step": 84616, "epoch": 2014} {"train_loss": -6.198971748352051, "global_step": 84617, "epoch": 2014} {"train_loss": -6.150934219360352, "global_step": 84618, "epoch": 2014} {"train_loss": -6.256224632263184, "global_step": 84619, "epoch": 2014} {"train_loss": -6.233635902404785, "global_step": 84620, "epoch": 2014} {"train_loss": -6.154214859008789, "global_step": 84621, "epoch": 2014} {"train_loss": -6.053839206695557, "global_step": 84622, "epoch": 2014} {"train_loss": -6.174777984619141, "global_step": 84623, "epoch": 2014} {"train_loss": -6.234476089477539, "global_step": 84624, "epoch": 2014} {"train_loss": -6.257616996765137, "global_step": 84625, "epoch": 2014} {"train_loss": -6.241721153259277, "global_step": 84626, "epoch": 2014} {"train_loss": -6.083025932312012, "global_step": 84627, "epoch": 2014} {"train_loss": -6.200493812561035, "global_step": 84628, "epoch": 2014} {"train_loss": -6.202301286515736, "global_step": 84629, "epoch": 2014, "val_loss": 62855.0} {"train_loss": -6.187168121337891, "global_step": 84630, "epoch": 2015} {"train_loss": -6.198692798614502, "global_step": 84631, "epoch": 2015} {"train_loss": -6.123837947845459, "global_step": 84632, "epoch": 2015} {"train_loss": -6.272939682006836, "global_step": 84633, "epoch": 2015} {"train_loss": -6.239331245422363, "global_step": 84634, "epoch": 2015} {"train_loss": -6.221645355224609, "global_step": 84635, "epoch": 2015} {"train_loss": -6.178323268890381, "global_step": 84636, "epoch": 2015} {"train_loss": -6.240966796875, "global_step": 84637, "epoch": 2015} {"train_loss": -6.197221279144287, "global_step": 84638, "epoch": 2015} {"train_loss": -6.286155700683594, "global_step": 84639, "epoch": 2015} {"train_loss": -6.2661662101745605, "global_step": 84640, "epoch": 2015} {"train_loss": -6.315525054931641, "global_step": 84641, "epoch": 2015} {"train_loss": -6.233679294586182, "global_step": 84642, "epoch": 2015} {"train_loss": -6.241800785064697, "global_step": 84643, "epoch": 2015} {"train_loss": -6.234787940979004, "global_step": 84644, "epoch": 2015} {"train_loss": -6.135924339294434, "global_step": 84645, "epoch": 2015} {"train_loss": -6.17238712310791, "global_step": 84646, "epoch": 2015} {"train_loss": -6.284228324890137, "global_step": 84647, "epoch": 2015} {"train_loss": -6.258899688720703, "global_step": 84648, "epoch": 2015} {"train_loss": -6.182825565338135, "global_step": 84649, "epoch": 2015} {"train_loss": -6.173690319061279, "global_step": 84650, "epoch": 2015} {"train_loss": -6.163762092590332, "global_step": 84651, "epoch": 2015} {"train_loss": -6.174613952636719, "global_step": 84652, "epoch": 2015} {"train_loss": -6.272008419036865, "global_step": 84653, "epoch": 2015} {"train_loss": -6.147322654724121, "global_step": 84654, "epoch": 2015} {"train_loss": -6.34409236907959, "global_step": 84655, "epoch": 2015} {"train_loss": -6.2300004959106445, "global_step": 84656, "epoch": 2015} {"train_loss": -6.3271164894104, "global_step": 84657, "epoch": 2015} {"train_loss": -6.161614418029785, "global_step": 84658, "epoch": 2015} {"train_loss": -6.175541400909424, "global_step": 84659, "epoch": 2015} {"train_loss": -6.018603324890137, "global_step": 84660, "epoch": 2015} {"train_loss": -6.181920528411865, "global_step": 84661, "epoch": 2015} {"train_loss": -6.160495281219482, "global_step": 84662, "epoch": 2015} {"train_loss": -6.1641998291015625, "global_step": 84663, "epoch": 2015} {"train_loss": -6.181324005126953, "global_step": 84664, "epoch": 2015} {"train_loss": -6.339080810546875, "global_step": 84665, "epoch": 2015} {"train_loss": -6.2082438468933105, "global_step": 84666, "epoch": 2015} {"train_loss": -6.254192352294922, "global_step": 84667, "epoch": 2015} {"train_loss": -6.192634582519531, "global_step": 84668, "epoch": 2015} {"train_loss": -6.266253471374512, "global_step": 84669, "epoch": 2015} {"train_loss": -6.266733646392822, "global_step": 84670, "epoch": 2015} {"train_loss": -6.217248848506382, "global_step": 84671, "epoch": 2015, "val_loss": 62676.66796875} {"train_loss": -6.22897481918335, "global_step": 84672, "epoch": 2016} {"train_loss": -6.300049781799316, "global_step": 84673, "epoch": 2016} {"train_loss": -6.269037246704102, "global_step": 84674, "epoch": 2016} {"train_loss": -6.241119861602783, "global_step": 84675, "epoch": 2016} {"train_loss": -6.198393821716309, "global_step": 84676, "epoch": 2016} {"train_loss": -6.144040107727051, "global_step": 84677, "epoch": 2016} {"train_loss": -6.238335609436035, "global_step": 84678, "epoch": 2016} {"train_loss": -6.268641948699951, "global_step": 84679, "epoch": 2016} {"train_loss": -6.260120391845703, "global_step": 84680, "epoch": 2016} {"train_loss": -6.257438659667969, "global_step": 84681, "epoch": 2016} {"train_loss": -6.171642303466797, "global_step": 84682, "epoch": 2016} {"train_loss": -6.188048362731934, "global_step": 84683, "epoch": 2016} {"train_loss": -6.195128440856934, "global_step": 84684, "epoch": 2016} {"train_loss": -6.359091758728027, "global_step": 84685, "epoch": 2016} {"train_loss": -6.255404949188232, "global_step": 84686, "epoch": 2016} {"train_loss": -6.207919597625732, "global_step": 84687, "epoch": 2016} {"train_loss": -6.302251815795898, "global_step": 84688, "epoch": 2016} {"train_loss": -6.261910438537598, "global_step": 84689, "epoch": 2016} {"train_loss": -6.204930782318115, "global_step": 84690, "epoch": 2016} {"train_loss": -6.312263488769531, "global_step": 84691, "epoch": 2016} {"train_loss": -6.259485244750977, "global_step": 84692, "epoch": 2016} {"train_loss": -6.264123439788818, "global_step": 84693, "epoch": 2016} {"train_loss": -6.359285831451416, "global_step": 84694, "epoch": 2016} {"train_loss": -6.190150260925293, "global_step": 84695, "epoch": 2016} {"train_loss": -6.2705278396606445, "global_step": 84696, "epoch": 2016} {"train_loss": -6.121380805969238, "global_step": 84697, "epoch": 2016} {"train_loss": -6.27811336517334, "global_step": 84698, "epoch": 2016} {"train_loss": -6.158168792724609, "global_step": 84699, "epoch": 2016} {"train_loss": -6.279646396636963, "global_step": 84700, "epoch": 2016} {"train_loss": -6.243474006652832, "global_step": 84701, "epoch": 2016} {"train_loss": -6.373597145080566, "global_step": 84702, "epoch": 2016} {"train_loss": -6.318812847137451, "global_step": 84703, "epoch": 2016} {"train_loss": -6.115312576293945, "global_step": 84704, "epoch": 2016} {"train_loss": -6.324686050415039, "global_step": 84705, "epoch": 2016} {"train_loss": -6.160935401916504, "global_step": 84706, "epoch": 2016} {"train_loss": -6.146753311157227, "global_step": 84707, "epoch": 2016} {"train_loss": -6.146385192871094, "global_step": 84708, "epoch": 2016} {"train_loss": -6.132443904876709, "global_step": 84709, "epoch": 2016} {"train_loss": -6.190269470214844, "global_step": 84710, "epoch": 2016} {"train_loss": -6.193622589111328, "global_step": 84711, "epoch": 2016} {"train_loss": -6.2706499099731445, "global_step": 84712, "epoch": 2016} {"train_loss": -6.234705062139602, "global_step": 84713, "epoch": 2016, "val_loss": 62753.11328125} {"train_loss": -6.306697845458984, "global_step": 84714, "epoch": 2017} {"train_loss": -6.249214172363281, "global_step": 84715, "epoch": 2017} {"train_loss": -6.281821250915527, "global_step": 84716, "epoch": 2017} {"train_loss": -6.302401542663574, "global_step": 84717, "epoch": 2017} {"train_loss": -6.3139262199401855, "global_step": 84718, "epoch": 2017} {"train_loss": -6.223987579345703, "global_step": 84719, "epoch": 2017} {"train_loss": -6.149551868438721, "global_step": 84720, "epoch": 2017} {"train_loss": -6.2622270584106445, "global_step": 84721, "epoch": 2017} {"train_loss": -6.2836151123046875, "global_step": 84722, "epoch": 2017} {"train_loss": -6.146834850311279, "global_step": 84723, "epoch": 2017} {"train_loss": -6.213974952697754, "global_step": 84724, "epoch": 2017} {"train_loss": -6.210709571838379, "global_step": 84725, "epoch": 2017} {"train_loss": -6.078620910644531, "global_step": 84726, "epoch": 2017} {"train_loss": -6.167377948760986, "global_step": 84727, "epoch": 2017} {"train_loss": -6.196178436279297, "global_step": 84728, "epoch": 2017} {"train_loss": -6.212479114532471, "global_step": 84729, "epoch": 2017} {"train_loss": -6.240220069885254, "global_step": 84730, "epoch": 2017} {"train_loss": -6.172337532043457, "global_step": 84731, "epoch": 2017} {"train_loss": -6.104778289794922, "global_step": 84732, "epoch": 2017} {"train_loss": -6.285004138946533, "global_step": 84733, "epoch": 2017} {"train_loss": -6.1948137283325195, "global_step": 84734, "epoch": 2017} {"train_loss": -6.0781569480896, "global_step": 84735, "epoch": 2017} {"train_loss": -6.1291937828063965, "global_step": 84736, "epoch": 2017} {"train_loss": -6.197883605957031, "global_step": 84737, "epoch": 2017} {"train_loss": -6.1557416915893555, "global_step": 84738, "epoch": 2017} {"train_loss": -6.094351291656494, "global_step": 84739, "epoch": 2017} {"train_loss": -6.241765022277832, "global_step": 84740, "epoch": 2017} {"train_loss": -6.222415924072266, "global_step": 84741, "epoch": 2017} {"train_loss": -6.13405704498291, "global_step": 84742, "epoch": 2017} {"train_loss": -6.076287269592285, "global_step": 84743, "epoch": 2017} {"train_loss": -6.135125160217285, "global_step": 84744, "epoch": 2017} {"train_loss": -6.193599224090576, "global_step": 84745, "epoch": 2017} {"train_loss": -6.2533345222473145, "global_step": 84746, "epoch": 2017} {"train_loss": -6.225823402404785, "global_step": 84747, "epoch": 2017} {"train_loss": -6.209061622619629, "global_step": 84748, "epoch": 2017} {"train_loss": -6.316886901855469, "global_step": 84749, "epoch": 2017} {"train_loss": -6.151632308959961, "global_step": 84750, "epoch": 2017} {"train_loss": -6.186802864074707, "global_step": 84751, "epoch": 2017} {"train_loss": -6.1347336769104, "global_step": 84752, "epoch": 2017} {"train_loss": -6.201381683349609, "global_step": 84753, "epoch": 2017} {"train_loss": -6.246002197265625, "global_step": 84754, "epoch": 2017} {"train_loss": -6.197410685675485, "global_step": 84755, "epoch": 2017, "val_loss": 62474.1875} {"train_loss": -6.211654186248779, "global_step": 84756, "epoch": 2018} {"train_loss": -6.211187839508057, "global_step": 84757, "epoch": 2018} {"train_loss": -6.222024917602539, "global_step": 84758, "epoch": 2018} {"train_loss": -6.1948137283325195, "global_step": 84759, "epoch": 2018} {"train_loss": -6.254269123077393, "global_step": 84760, "epoch": 2018} {"train_loss": -6.058346271514893, "global_step": 84761, "epoch": 2018} {"train_loss": -6.095129489898682, "global_step": 84762, "epoch": 2018} {"train_loss": -6.153712749481201, "global_step": 84763, "epoch": 2018} {"train_loss": -6.062139511108398, "global_step": 84764, "epoch": 2018} {"train_loss": -6.267738342285156, "global_step": 84765, "epoch": 2018} {"train_loss": -6.239049911499023, "global_step": 84766, "epoch": 2018} {"train_loss": -6.182221412658691, "global_step": 84767, "epoch": 2018} {"train_loss": -6.126816749572754, "global_step": 84768, "epoch": 2018} {"train_loss": -6.126769542694092, "global_step": 84769, "epoch": 2018} {"train_loss": -6.263788223266602, "global_step": 84770, "epoch": 2018} {"train_loss": -6.3294854164123535, "global_step": 84771, "epoch": 2018} {"train_loss": -6.313520431518555, "global_step": 84772, "epoch": 2018} {"train_loss": -6.186091423034668, "global_step": 84773, "epoch": 2018} {"train_loss": -6.081111907958984, "global_step": 84774, "epoch": 2018} {"train_loss": -6.241233825683594, "global_step": 84775, "epoch": 2018} {"train_loss": -6.140478610992432, "global_step": 84776, "epoch": 2018} {"train_loss": -6.265494346618652, "global_step": 84777, "epoch": 2018} {"train_loss": -6.076784133911133, "global_step": 84778, "epoch": 2018} {"train_loss": -6.32367467880249, "global_step": 84779, "epoch": 2018} {"train_loss": -6.2309770584106445, "global_step": 84780, "epoch": 2018} {"train_loss": -6.119341850280762, "global_step": 84781, "epoch": 2018} {"train_loss": -6.314033031463623, "global_step": 84782, "epoch": 2018} {"train_loss": -6.314115524291992, "global_step": 84783, "epoch": 2018} {"train_loss": -6.030591011047363, "global_step": 84784, "epoch": 2018} {"train_loss": -6.196488380432129, "global_step": 84785, "epoch": 2018} {"train_loss": -6.046525001525879, "global_step": 84786, "epoch": 2018} {"train_loss": -6.161578178405762, "global_step": 84787, "epoch": 2018} {"train_loss": -6.152796745300293, "global_step": 84788, "epoch": 2018} {"train_loss": -6.130751609802246, "global_step": 84789, "epoch": 2018} {"train_loss": -6.129360198974609, "global_step": 84790, "epoch": 2018} {"train_loss": -6.208559513092041, "global_step": 84791, "epoch": 2018} {"train_loss": -6.080269813537598, "global_step": 84792, "epoch": 2018} {"train_loss": -6.125619888305664, "global_step": 84793, "epoch": 2018} {"train_loss": -6.124917030334473, "global_step": 84794, "epoch": 2018} {"train_loss": -6.122078895568848, "global_step": 84795, "epoch": 2018} {"train_loss": -6.118404388427734, "global_step": 84796, "epoch": 2018} {"train_loss": -6.178074689138503, "global_step": 84797, "epoch": 2018, "val_loss": 62475.0234375} {"train_loss": -6.26530122756958, "global_step": 84798, "epoch": 2019} {"train_loss": -6.21496057510376, "global_step": 84799, "epoch": 2019} {"train_loss": -6.209936618804932, "global_step": 84800, "epoch": 2019} {"train_loss": -6.281028747558594, "global_step": 84801, "epoch": 2019} {"train_loss": -6.087568283081055, "global_step": 84802, "epoch": 2019} {"train_loss": -6.166022300720215, "global_step": 84803, "epoch": 2019} {"train_loss": -6.278258323669434, "global_step": 84804, "epoch": 2019} {"train_loss": -6.207918167114258, "global_step": 84805, "epoch": 2019} {"train_loss": -6.172598838806152, "global_step": 84806, "epoch": 2019} {"train_loss": -6.40922737121582, "global_step": 84807, "epoch": 2019} {"train_loss": -6.258833885192871, "global_step": 84808, "epoch": 2019} {"train_loss": -6.158224105834961, "global_step": 84809, "epoch": 2019} {"train_loss": -6.174491882324219, "global_step": 84810, "epoch": 2019} {"train_loss": -6.1896514892578125, "global_step": 84811, "epoch": 2019} {"train_loss": -6.266152381896973, "global_step": 84812, "epoch": 2019} {"train_loss": -6.294573783874512, "global_step": 84813, "epoch": 2019} {"train_loss": -6.409162521362305, "global_step": 84814, "epoch": 2019} {"train_loss": -6.217270851135254, "global_step": 84815, "epoch": 2019} {"train_loss": -6.1351494789123535, "global_step": 84816, "epoch": 2019} {"train_loss": -6.141564846038818, "global_step": 84817, "epoch": 2019} {"train_loss": -6.208384990692139, "global_step": 84818, "epoch": 2019} {"train_loss": -6.2642130851745605, "global_step": 84819, "epoch": 2019} {"train_loss": -6.2798848152160645, "global_step": 84820, "epoch": 2019} {"train_loss": -6.28196382522583, "global_step": 84821, "epoch": 2019} {"train_loss": -6.303690433502197, "global_step": 84822, "epoch": 2019} {"train_loss": -6.1657514572143555, "global_step": 84823, "epoch": 2019} {"train_loss": -6.123033046722412, "global_step": 84824, "epoch": 2019} {"train_loss": -6.1989006996154785, "global_step": 84825, "epoch": 2019} {"train_loss": -6.11519193649292, "global_step": 84826, "epoch": 2019} {"train_loss": -6.233802795410156, "global_step": 84827, "epoch": 2019} {"train_loss": -6.203344345092773, "global_step": 84828, "epoch": 2019} {"train_loss": -6.22530460357666, "global_step": 84829, "epoch": 2019} {"train_loss": -6.239519119262695, "global_step": 84830, "epoch": 2019} {"train_loss": -6.196333885192871, "global_step": 84831, "epoch": 2019} {"train_loss": -6.207032680511475, "global_step": 84832, "epoch": 2019} {"train_loss": -6.237980842590332, "global_step": 84833, "epoch": 2019} {"train_loss": -6.252508640289307, "global_step": 84834, "epoch": 2019} {"train_loss": -6.176159858703613, "global_step": 84835, "epoch": 2019} {"train_loss": -6.263098239898682, "global_step": 84836, "epoch": 2019} {"train_loss": -6.158918380737305, "global_step": 84837, "epoch": 2019} {"train_loss": -6.186147212982178, "global_step": 84838, "epoch": 2019} {"train_loss": -6.218939803895497, "global_step": 84839, "epoch": 2019, "val_loss": 62924.33203125} {"train_loss": -6.168769359588623, "global_step": 84840, "epoch": 2020} {"train_loss": -6.150038719177246, "global_step": 84841, "epoch": 2020} {"train_loss": -6.22637939453125, "global_step": 84842, "epoch": 2020} {"train_loss": -6.166436195373535, "global_step": 84843, "epoch": 2020} {"train_loss": -6.181052207946777, "global_step": 84844, "epoch": 2020} {"train_loss": -6.133666515350342, "global_step": 84845, "epoch": 2020} {"train_loss": -6.204965591430664, "global_step": 84846, "epoch": 2020} {"train_loss": -6.170017242431641, "global_step": 84847, "epoch": 2020} {"train_loss": -6.2272796630859375, "global_step": 84848, "epoch": 2020} {"train_loss": -6.174889087677002, "global_step": 84849, "epoch": 2020} {"train_loss": -6.099267482757568, "global_step": 84850, "epoch": 2020} {"train_loss": -6.1367621421813965, "global_step": 84851, "epoch": 2020} {"train_loss": -6.128209590911865, "global_step": 84852, "epoch": 2020} {"train_loss": -6.216526031494141, "global_step": 84853, "epoch": 2020} {"train_loss": -6.229681968688965, "global_step": 84854, "epoch": 2020} {"train_loss": -6.0899529457092285, "global_step": 84855, "epoch": 2020} {"train_loss": -6.320873260498047, "global_step": 84856, "epoch": 2020} {"train_loss": -6.157585144042969, "global_step": 84857, "epoch": 2020} {"train_loss": -6.197615623474121, "global_step": 84858, "epoch": 2020} {"train_loss": -6.228089809417725, "global_step": 84859, "epoch": 2020} {"train_loss": -6.239063262939453, "global_step": 84860, "epoch": 2020} {"train_loss": -6.151609897613525, "global_step": 84861, "epoch": 2020} {"train_loss": -6.284336566925049, "global_step": 84862, "epoch": 2020} {"train_loss": -6.170253276824951, "global_step": 84863, "epoch": 2020} {"train_loss": -6.182303428649902, "global_step": 84864, "epoch": 2020} {"train_loss": -6.265524864196777, "global_step": 84865, "epoch": 2020} {"train_loss": -6.247344017028809, "global_step": 84866, "epoch": 2020} {"train_loss": -6.233343124389648, "global_step": 84867, "epoch": 2020} {"train_loss": -6.204475402832031, "global_step": 84868, "epoch": 2020} {"train_loss": -6.049593448638916, "global_step": 84869, "epoch": 2020} {"train_loss": -6.259679317474365, "global_step": 84870, "epoch": 2020} {"train_loss": -6.280952453613281, "global_step": 84871, "epoch": 2020} {"train_loss": -6.062289237976074, "global_step": 84872, "epoch": 2020} {"train_loss": -6.12030029296875, "global_step": 84873, "epoch": 2020} {"train_loss": -6.114907741546631, "global_step": 84874, "epoch": 2020} {"train_loss": -6.19254732131958, "global_step": 84875, "epoch": 2020} {"train_loss": -6.217988014221191, "global_step": 84876, "epoch": 2020} {"train_loss": -6.175163269042969, "global_step": 84877, "epoch": 2020} {"train_loss": -6.239144802093506, "global_step": 84878, "epoch": 2020} {"train_loss": -6.218262672424316, "global_step": 84879, "epoch": 2020} {"train_loss": -6.170336723327637, "global_step": 84880, "epoch": 2020} {"train_loss": -6.186215400695801, "global_step": 84881, "epoch": 2020, "val_loss": 62656.25} {"train_loss": -6.265777587890625, "global_step": 84882, "epoch": 2021} {"train_loss": -6.27987003326416, "global_step": 84883, "epoch": 2021} {"train_loss": -6.247281074523926, "global_step": 84884, "epoch": 2021} {"train_loss": -6.198184967041016, "global_step": 84885, "epoch": 2021} {"train_loss": -6.275918483734131, "global_step": 84886, "epoch": 2021} {"train_loss": -6.269175052642822, "global_step": 84887, "epoch": 2021} {"train_loss": -6.322197437286377, "global_step": 84888, "epoch": 2021} {"train_loss": -6.1669206619262695, "global_step": 84889, "epoch": 2021} {"train_loss": -6.257369041442871, "global_step": 84890, "epoch": 2021} {"train_loss": -6.259328842163086, "global_step": 84891, "epoch": 2021} {"train_loss": -6.303672790527344, "global_step": 84892, "epoch": 2021} {"train_loss": -6.258378028869629, "global_step": 84893, "epoch": 2021} {"train_loss": -6.174641132354736, "global_step": 84894, "epoch": 2021} {"train_loss": -6.208099365234375, "global_step": 84895, "epoch": 2021} {"train_loss": -6.171319007873535, "global_step": 84896, "epoch": 2021} {"train_loss": -6.353253364562988, "global_step": 84897, "epoch": 2021} {"train_loss": -6.136102676391602, "global_step": 84898, "epoch": 2021} {"train_loss": -6.105417251586914, "global_step": 84899, "epoch": 2021} {"train_loss": -6.1444549560546875, "global_step": 84900, "epoch": 2021} {"train_loss": -6.068173408508301, "global_step": 84901, "epoch": 2021} {"train_loss": -6.103480815887451, "global_step": 84902, "epoch": 2021} {"train_loss": -6.184398651123047, "global_step": 84903, "epoch": 2021} {"train_loss": -6.202444553375244, "global_step": 84904, "epoch": 2021} {"train_loss": -6.173279762268066, "global_step": 84905, "epoch": 2021} {"train_loss": -6.241869926452637, "global_step": 84906, "epoch": 2021} {"train_loss": -6.143254280090332, "global_step": 84907, "epoch": 2021} {"train_loss": -6.290287971496582, "global_step": 84908, "epoch": 2021} {"train_loss": -6.2779693603515625, "global_step": 84909, "epoch": 2021} {"train_loss": -6.225136756896973, "global_step": 84910, "epoch": 2021} {"train_loss": -6.185357093811035, "global_step": 84911, "epoch": 2021} {"train_loss": -6.107444763183594, "global_step": 84912, "epoch": 2021} {"train_loss": -6.335599899291992, "global_step": 84913, "epoch": 2021} {"train_loss": -6.225171089172363, "global_step": 84914, "epoch": 2021} {"train_loss": -6.118334770202637, "global_step": 84915, "epoch": 2021} {"train_loss": -6.243817329406738, "global_step": 84916, "epoch": 2021} {"train_loss": -6.385262489318848, "global_step": 84917, "epoch": 2021} {"train_loss": -6.212750434875488, "global_step": 84918, "epoch": 2021} {"train_loss": -6.209166526794434, "global_step": 84919, "epoch": 2021} {"train_loss": -6.341202259063721, "global_step": 84920, "epoch": 2021} {"train_loss": -6.233563423156738, "global_step": 84921, "epoch": 2021} {"train_loss": -6.337145805358887, "global_step": 84922, "epoch": 2021} {"train_loss": -6.22674686568124, "global_step": 84923, "epoch": 2021, "val_loss": 62853.75390625} {"train_loss": -6.166265487670898, "global_step": 84924, "epoch": 2022} {"train_loss": -6.239514350891113, "global_step": 84925, "epoch": 2022} {"train_loss": -6.336874008178711, "global_step": 84926, "epoch": 2022} {"train_loss": -6.166232109069824, "global_step": 84927, "epoch": 2022} {"train_loss": -6.202312469482422, "global_step": 84928, "epoch": 2022} {"train_loss": -6.0117950439453125, "global_step": 84929, "epoch": 2022} {"train_loss": -6.065849304199219, "global_step": 84930, "epoch": 2022} {"train_loss": -6.240317344665527, "global_step": 84931, "epoch": 2022} {"train_loss": -6.147955417633057, "global_step": 84932, "epoch": 2022} {"train_loss": -6.203536033630371, "global_step": 84933, "epoch": 2022} {"train_loss": -6.219944000244141, "global_step": 84934, "epoch": 2022} {"train_loss": -6.198284149169922, "global_step": 84935, "epoch": 2022} {"train_loss": -6.305408477783203, "global_step": 84936, "epoch": 2022} {"train_loss": -6.323896408081055, "global_step": 84937, "epoch": 2022} {"train_loss": -6.293800354003906, "global_step": 84938, "epoch": 2022} {"train_loss": -6.30411958694458, "global_step": 84939, "epoch": 2022} {"train_loss": -6.317424774169922, "global_step": 84940, "epoch": 2022} {"train_loss": -6.182342052459717, "global_step": 84941, "epoch": 2022} {"train_loss": -6.25825834274292, "global_step": 84942, "epoch": 2022} {"train_loss": -6.241594314575195, "global_step": 84943, "epoch": 2022} {"train_loss": -6.1675872802734375, "global_step": 84944, "epoch": 2022} {"train_loss": -6.203982353210449, "global_step": 84945, "epoch": 2022} {"train_loss": -6.195997714996338, "global_step": 84946, "epoch": 2022} {"train_loss": -6.1792802810668945, "global_step": 84947, "epoch": 2022} {"train_loss": -6.144927024841309, "global_step": 84948, "epoch": 2022} {"train_loss": -6.189310073852539, "global_step": 84949, "epoch": 2022} {"train_loss": -6.132175922393799, "global_step": 84950, "epoch": 2022} {"train_loss": -6.195083141326904, "global_step": 84951, "epoch": 2022} {"train_loss": -6.175637722015381, "global_step": 84952, "epoch": 2022} {"train_loss": -6.316205024719238, "global_step": 84953, "epoch": 2022} {"train_loss": -6.21452522277832, "global_step": 84954, "epoch": 2022} {"train_loss": -6.103926658630371, "global_step": 84955, "epoch": 2022} {"train_loss": -6.214503765106201, "global_step": 84956, "epoch": 2022} {"train_loss": -6.143028736114502, "global_step": 84957, "epoch": 2022} {"train_loss": -6.122407913208008, "global_step": 84958, "epoch": 2022} {"train_loss": -6.312430381774902, "global_step": 84959, "epoch": 2022} {"train_loss": -6.157157897949219, "global_step": 84960, "epoch": 2022} {"train_loss": -6.211928367614746, "global_step": 84961, "epoch": 2022} {"train_loss": -6.181268215179443, "global_step": 84962, "epoch": 2022} {"train_loss": -6.158510208129883, "global_step": 84963, "epoch": 2022} {"train_loss": -6.2206525802612305, "global_step": 84964, "epoch": 2022} {"train_loss": -6.20700706754412, "global_step": 84965, "epoch": 2022, "val_loss": 62650.1171875} {"train_loss": -6.278791427612305, "global_step": 84966, "epoch": 2023} {"train_loss": -6.235526084899902, "global_step": 84967, "epoch": 2023} {"train_loss": -6.233399391174316, "global_step": 84968, "epoch": 2023} {"train_loss": -6.2252678871154785, "global_step": 84969, "epoch": 2023} {"train_loss": -6.202754020690918, "global_step": 84970, "epoch": 2023} {"train_loss": -6.125269889831543, "global_step": 84971, "epoch": 2023} {"train_loss": -6.374320983886719, "global_step": 84972, "epoch": 2023} {"train_loss": -6.303645133972168, "global_step": 84973, "epoch": 2023} {"train_loss": -6.276419162750244, "global_step": 84974, "epoch": 2023} {"train_loss": -6.135860919952393, "global_step": 84975, "epoch": 2023} {"train_loss": -6.292424201965332, "global_step": 84976, "epoch": 2023} {"train_loss": -6.232463836669922, "global_step": 84977, "epoch": 2023} {"train_loss": -6.203433990478516, "global_step": 84978, "epoch": 2023} {"train_loss": -6.1681318283081055, "global_step": 84979, "epoch": 2023} {"train_loss": -6.203887939453125, "global_step": 84980, "epoch": 2023} {"train_loss": -6.210277080535889, "global_step": 84981, "epoch": 2023} {"train_loss": -6.162133693695068, "global_step": 84982, "epoch": 2023} {"train_loss": -6.244117259979248, "global_step": 84983, "epoch": 2023} {"train_loss": -6.166247367858887, "global_step": 84984, "epoch": 2023} {"train_loss": -6.294947624206543, "global_step": 84985, "epoch": 2023} {"train_loss": -6.315431118011475, "global_step": 84986, "epoch": 2023} {"train_loss": -6.212812423706055, "global_step": 84987, "epoch": 2023} {"train_loss": -6.123551368713379, "global_step": 84988, "epoch": 2023} {"train_loss": -6.202695846557617, "global_step": 84989, "epoch": 2023} {"train_loss": -6.1630048751831055, "global_step": 84990, "epoch": 2023} {"train_loss": -6.2804999351501465, "global_step": 84991, "epoch": 2023} {"train_loss": -6.189997673034668, "global_step": 84992, "epoch": 2023} {"train_loss": -6.2189178466796875, "global_step": 84993, "epoch": 2023} {"train_loss": -6.179577827453613, "global_step": 84994, "epoch": 2023} {"train_loss": -6.2712907791137695, "global_step": 84995, "epoch": 2023} {"train_loss": -6.269206523895264, "global_step": 84996, "epoch": 2023} {"train_loss": -6.096384048461914, "global_step": 84997, "epoch": 2023} {"train_loss": -6.248825550079346, "global_step": 84998, "epoch": 2023} {"train_loss": -6.1862688064575195, "global_step": 84999, "epoch": 2023} {"train_loss": -6.173689842224121, "global_step": 85000, "epoch": 2023} {"train_loss": -6.21743106842041, "global_step": 85001, "epoch": 2023} {"train_loss": -6.227324962615967, "global_step": 85002, "epoch": 2023} {"train_loss": -6.256646156311035, "global_step": 85003, "epoch": 2023} {"train_loss": -6.192227363586426, "global_step": 85004, "epoch": 2023} {"train_loss": -6.180874824523926, "global_step": 85005, "epoch": 2023} {"train_loss": -6.138680934906006, "global_step": 85006, "epoch": 2023} {"train_loss": -6.218732039133708, "global_step": 85007, "epoch": 2023, "val_loss": 62740.27734375} {"train_loss": -6.265120029449463, "global_step": 85008, "epoch": 2024} {"train_loss": -6.202338695526123, "global_step": 85009, "epoch": 2024} {"train_loss": -6.370393753051758, "global_step": 85010, "epoch": 2024} {"train_loss": -6.127079010009766, "global_step": 85011, "epoch": 2024} {"train_loss": -6.255679130554199, "global_step": 85012, "epoch": 2024} {"train_loss": -6.259974479675293, "global_step": 85013, "epoch": 2024} {"train_loss": -6.229235649108887, "global_step": 85014, "epoch": 2024} {"train_loss": -6.234077453613281, "global_step": 85015, "epoch": 2024} {"train_loss": -6.188749313354492, "global_step": 85016, "epoch": 2024} {"train_loss": -6.247429847717285, "global_step": 85017, "epoch": 2024} {"train_loss": -6.172123432159424, "global_step": 85018, "epoch": 2024} {"train_loss": -6.240616321563721, "global_step": 85019, "epoch": 2024} {"train_loss": -6.228764057159424, "global_step": 85020, "epoch": 2024} {"train_loss": -6.28856086730957, "global_step": 85021, "epoch": 2024} {"train_loss": -6.243929386138916, "global_step": 85022, "epoch": 2024} {"train_loss": -6.281895160675049, "global_step": 85023, "epoch": 2024} {"train_loss": -6.226084232330322, "global_step": 85024, "epoch": 2024} {"train_loss": -6.087345123291016, "global_step": 85025, "epoch": 2024} {"train_loss": -6.2093505859375, "global_step": 85026, "epoch": 2024} {"train_loss": -6.156702995300293, "global_step": 85027, "epoch": 2024} {"train_loss": -6.10236930847168, "global_step": 85028, "epoch": 2024} {"train_loss": -6.2966485023498535, "global_step": 85029, "epoch": 2024} {"train_loss": -6.173510551452637, "global_step": 85030, "epoch": 2024} {"train_loss": -6.1794233322143555, "global_step": 85031, "epoch": 2024} {"train_loss": -6.258881092071533, "global_step": 85032, "epoch": 2024} {"train_loss": -6.163218021392822, "global_step": 85033, "epoch": 2024} {"train_loss": -6.218687057495117, "global_step": 85034, "epoch": 2024} {"train_loss": -6.1232500076293945, "global_step": 85035, "epoch": 2024} {"train_loss": -6.170707702636719, "global_step": 85036, "epoch": 2024} {"train_loss": -6.187603950500488, "global_step": 85037, "epoch": 2024} {"train_loss": -6.261654853820801, "global_step": 85038, "epoch": 2024} {"train_loss": -6.133244514465332, "global_step": 85039, "epoch": 2024} {"train_loss": -6.259311199188232, "global_step": 85040, "epoch": 2024} {"train_loss": -6.202980041503906, "global_step": 85041, "epoch": 2024} {"train_loss": -6.182412147521973, "global_step": 85042, "epoch": 2024} {"train_loss": -6.159529685974121, "global_step": 85043, "epoch": 2024} {"train_loss": -6.133140563964844, "global_step": 85044, "epoch": 2024} {"train_loss": -6.165990829467773, "global_step": 85045, "epoch": 2024} {"train_loss": -6.1057586669921875, "global_step": 85046, "epoch": 2024} {"train_loss": -6.221893787384033, "global_step": 85047, "epoch": 2024} {"train_loss": -6.226019859313965, "global_step": 85048, "epoch": 2024} {"train_loss": -6.20636096454802, "global_step": 85049, "epoch": 2024, "val_loss": 62500.24609375} {"train_loss": -6.21391487121582, "global_step": 85050, "epoch": 2025} {"train_loss": -6.205602169036865, "global_step": 85051, "epoch": 2025} {"train_loss": -6.20777702331543, "global_step": 85052, "epoch": 2025} {"train_loss": -6.252758026123047, "global_step": 85053, "epoch": 2025} {"train_loss": -6.090275764465332, "global_step": 85054, "epoch": 2025} {"train_loss": -6.127859592437744, "global_step": 85055, "epoch": 2025} {"train_loss": -6.214652061462402, "global_step": 85056, "epoch": 2025} {"train_loss": -6.16574764251709, "global_step": 85057, "epoch": 2025} {"train_loss": -6.263420104980469, "global_step": 85058, "epoch": 2025} {"train_loss": -6.179437160491943, "global_step": 85059, "epoch": 2025} {"train_loss": -6.055205345153809, "global_step": 85060, "epoch": 2025} {"train_loss": -6.2291646003723145, "global_step": 85061, "epoch": 2025} {"train_loss": -6.200688362121582, "global_step": 85062, "epoch": 2025} {"train_loss": -6.286081314086914, "global_step": 85063, "epoch": 2025} {"train_loss": -6.147983551025391, "global_step": 85064, "epoch": 2025} {"train_loss": -6.247718811035156, "global_step": 85065, "epoch": 2025} {"train_loss": -6.220261573791504, "global_step": 85066, "epoch": 2025} {"train_loss": -6.164172172546387, "global_step": 85067, "epoch": 2025} {"train_loss": -6.114995956420898, "global_step": 85068, "epoch": 2025} {"train_loss": -6.17838191986084, "global_step": 85069, "epoch": 2025} {"train_loss": -6.1833953857421875, "global_step": 85070, "epoch": 2025} {"train_loss": -6.1606364250183105, "global_step": 85071, "epoch": 2025} {"train_loss": -6.238189697265625, "global_step": 85072, "epoch": 2025} {"train_loss": -6.268926620483398, "global_step": 85073, "epoch": 2025} {"train_loss": -6.276640892028809, "global_step": 85074, "epoch": 2025} {"train_loss": -6.201053619384766, "global_step": 85075, "epoch": 2025} {"train_loss": -6.178235054016113, "global_step": 85076, "epoch": 2025} {"train_loss": -6.196859836578369, "global_step": 85077, "epoch": 2025} {"train_loss": -6.146780967712402, "global_step": 85078, "epoch": 2025} {"train_loss": -6.169443607330322, "global_step": 85079, "epoch": 2025} {"train_loss": -6.028905868530273, "global_step": 85080, "epoch": 2025} {"train_loss": -6.188921928405762, "global_step": 85081, "epoch": 2025} {"train_loss": -6.243762969970703, "global_step": 85082, "epoch": 2025} {"train_loss": -6.087630271911621, "global_step": 85083, "epoch": 2025} {"train_loss": -6.174879550933838, "global_step": 85084, "epoch": 2025} {"train_loss": -6.172863006591797, "global_step": 85085, "epoch": 2025} {"train_loss": -6.277070045471191, "global_step": 85086, "epoch": 2025} {"train_loss": -6.2168684005737305, "global_step": 85087, "epoch": 2025} {"train_loss": -6.162789344787598, "global_step": 85088, "epoch": 2025} {"train_loss": -6.24948263168335, "global_step": 85089, "epoch": 2025} {"train_loss": -6.182939529418945, "global_step": 85090, "epoch": 2025} {"train_loss": -6.189823593412127, "global_step": 85091, "epoch": 2025, "val_loss": 62550.22265625} {"train_loss": -6.288630962371826, "global_step": 85092, "epoch": 2026} {"train_loss": -6.240570068359375, "global_step": 85093, "epoch": 2026} {"train_loss": -6.151477336883545, "global_step": 85094, "epoch": 2026} {"train_loss": -6.265509605407715, "global_step": 85095, "epoch": 2026} {"train_loss": -6.288730621337891, "global_step": 85096, "epoch": 2026} {"train_loss": -6.193292140960693, "global_step": 85097, "epoch": 2026} {"train_loss": -6.107065200805664, "global_step": 85098, "epoch": 2026} {"train_loss": -6.26624059677124, "global_step": 85099, "epoch": 2026} {"train_loss": -6.211780548095703, "global_step": 85100, "epoch": 2026} {"train_loss": -6.247459411621094, "global_step": 85101, "epoch": 2026} {"train_loss": -6.152657508850098, "global_step": 85102, "epoch": 2026} {"train_loss": -6.264475345611572, "global_step": 85103, "epoch": 2026} {"train_loss": -6.166264057159424, "global_step": 85104, "epoch": 2026} {"train_loss": -6.096732139587402, "global_step": 85105, "epoch": 2026} {"train_loss": -6.251859188079834, "global_step": 85106, "epoch": 2026} {"train_loss": -6.097352981567383, "global_step": 85107, "epoch": 2026} {"train_loss": -6.07041597366333, "global_step": 85108, "epoch": 2026} {"train_loss": -6.2044997215271, "global_step": 85109, "epoch": 2026} {"train_loss": -6.268805027008057, "global_step": 85110, "epoch": 2026} {"train_loss": -6.2484025955200195, "global_step": 85111, "epoch": 2026} {"train_loss": -6.2665252685546875, "global_step": 85112, "epoch": 2026} {"train_loss": -6.294294357299805, "global_step": 85113, "epoch": 2026} {"train_loss": -6.14837646484375, "global_step": 85114, "epoch": 2026} {"train_loss": -6.210892677307129, "global_step": 85115, "epoch": 2026} {"train_loss": -6.309933185577393, "global_step": 85116, "epoch": 2026} {"train_loss": -6.313663482666016, "global_step": 85117, "epoch": 2026} {"train_loss": -6.26193904876709, "global_step": 85118, "epoch": 2026} {"train_loss": -6.23751974105835, "global_step": 85119, "epoch": 2026} {"train_loss": -6.284575462341309, "global_step": 85120, "epoch": 2026} {"train_loss": -6.269796371459961, "global_step": 85121, "epoch": 2026} {"train_loss": -6.240912437438965, "global_step": 85122, "epoch": 2026} {"train_loss": -6.236811637878418, "global_step": 85123, "epoch": 2026} {"train_loss": -6.200353145599365, "global_step": 85124, "epoch": 2026} {"train_loss": -6.232059955596924, "global_step": 85125, "epoch": 2026} {"train_loss": -6.238956451416016, "global_step": 85126, "epoch": 2026} {"train_loss": -6.153897285461426, "global_step": 85127, "epoch": 2026} {"train_loss": -6.20790433883667, "global_step": 85128, "epoch": 2026} {"train_loss": -6.280195236206055, "global_step": 85129, "epoch": 2026} {"train_loss": -6.205513000488281, "global_step": 85130, "epoch": 2026} {"train_loss": -6.1629133224487305, "global_step": 85131, "epoch": 2026} {"train_loss": -6.1395134925842285, "global_step": 85132, "epoch": 2026} {"train_loss": -6.216371547608149, "global_step": 85133, "epoch": 2026, "val_loss": 62564.1953125} {"train_loss": -6.243315696716309, "global_step": 85134, "epoch": 2027} {"train_loss": -6.266146659851074, "global_step": 85135, "epoch": 2027} {"train_loss": -6.050049781799316, "global_step": 85136, "epoch": 2027} {"train_loss": -6.108212471008301, "global_step": 85137, "epoch": 2027} {"train_loss": -6.282598495483398, "global_step": 85138, "epoch": 2027} {"train_loss": -6.250823497772217, "global_step": 85139, "epoch": 2027} {"train_loss": -6.176980018615723, "global_step": 85140, "epoch": 2027} {"train_loss": -6.24451208114624, "global_step": 85141, "epoch": 2027} {"train_loss": -6.256189346313477, "global_step": 85142, "epoch": 2027} {"train_loss": -6.193936347961426, "global_step": 85143, "epoch": 2027} {"train_loss": -6.280078887939453, "global_step": 85144, "epoch": 2027} {"train_loss": -6.185741424560547, "global_step": 85145, "epoch": 2027} {"train_loss": -6.22423791885376, "global_step": 85146, "epoch": 2027} {"train_loss": -6.188597679138184, "global_step": 85147, "epoch": 2027} {"train_loss": -6.140337944030762, "global_step": 85148, "epoch": 2027} {"train_loss": -6.24696683883667, "global_step": 85149, "epoch": 2027} {"train_loss": -6.245140075683594, "global_step": 85150, "epoch": 2027} {"train_loss": -6.331753730773926, "global_step": 85151, "epoch": 2027} {"train_loss": -6.223667144775391, "global_step": 85152, "epoch": 2027} {"train_loss": -6.242460250854492, "global_step": 85153, "epoch": 2027} {"train_loss": -6.08257532119751, "global_step": 85154, "epoch": 2027} {"train_loss": -6.302319526672363, "global_step": 85155, "epoch": 2027} {"train_loss": -6.246649742126465, "global_step": 85156, "epoch": 2027} {"train_loss": -6.225994110107422, "global_step": 85157, "epoch": 2027} {"train_loss": -6.175331115722656, "global_step": 85158, "epoch": 2027} {"train_loss": -6.179072856903076, "global_step": 85159, "epoch": 2027} {"train_loss": -6.143307209014893, "global_step": 85160, "epoch": 2027} {"train_loss": -6.26069450378418, "global_step": 85161, "epoch": 2027} {"train_loss": -6.20857048034668, "global_step": 85162, "epoch": 2027} {"train_loss": -6.179852485656738, "global_step": 85163, "epoch": 2027} {"train_loss": -6.243896484375, "global_step": 85164, "epoch": 2027} {"train_loss": -6.33189582824707, "global_step": 85165, "epoch": 2027} {"train_loss": -6.292377471923828, "global_step": 85166, "epoch": 2027} {"train_loss": -6.239529132843018, "global_step": 85167, "epoch": 2027} {"train_loss": -6.176848888397217, "global_step": 85168, "epoch": 2027} {"train_loss": -6.210864067077637, "global_step": 85169, "epoch": 2027} {"train_loss": -6.254385471343994, "global_step": 85170, "epoch": 2027} {"train_loss": -6.233546733856201, "global_step": 85171, "epoch": 2027} {"train_loss": -6.0753679275512695, "global_step": 85172, "epoch": 2027} {"train_loss": -6.152403831481934, "global_step": 85173, "epoch": 2027} {"train_loss": -6.220995903015137, "global_step": 85174, "epoch": 2027} {"train_loss": -6.213191531953358, "global_step": 85175, "epoch": 2027, "val_loss": 62919.8125} {"train_loss": -6.20401668548584, "global_step": 85176, "epoch": 2028} {"train_loss": -6.078455924987793, "global_step": 85177, "epoch": 2028} {"train_loss": -6.19036865234375, "global_step": 85178, "epoch": 2028} {"train_loss": -6.135049343109131, "global_step": 85179, "epoch": 2028} {"train_loss": -6.143640518188477, "global_step": 85180, "epoch": 2028} {"train_loss": -6.228836536407471, "global_step": 85181, "epoch": 2028} {"train_loss": -6.172013759613037, "global_step": 85182, "epoch": 2028} {"train_loss": -6.1449713706970215, "global_step": 85183, "epoch": 2028} {"train_loss": -6.337247848510742, "global_step": 85184, "epoch": 2028} {"train_loss": -6.092952728271484, "global_step": 85185, "epoch": 2028} {"train_loss": -6.065334796905518, "global_step": 85186, "epoch": 2028} {"train_loss": -6.191165447235107, "global_step": 85187, "epoch": 2028} {"train_loss": -5.994037628173828, "global_step": 85188, "epoch": 2028} {"train_loss": -6.178783893585205, "global_step": 85189, "epoch": 2028} {"train_loss": -6.232287883758545, "global_step": 85190, "epoch": 2028} {"train_loss": -6.079297065734863, "global_step": 85191, "epoch": 2028} {"train_loss": -6.227537631988525, "global_step": 85192, "epoch": 2028} {"train_loss": -6.216011047363281, "global_step": 85193, "epoch": 2028} {"train_loss": -6.164755344390869, "global_step": 85194, "epoch": 2028} {"train_loss": -6.189946174621582, "global_step": 85195, "epoch": 2028} {"train_loss": -6.1545562744140625, "global_step": 85196, "epoch": 2028} {"train_loss": -6.301566123962402, "global_step": 85197, "epoch": 2028} {"train_loss": -6.120660305023193, "global_step": 85198, "epoch": 2028} {"train_loss": -6.253565788269043, "global_step": 85199, "epoch": 2028} {"train_loss": -6.35379695892334, "global_step": 85200, "epoch": 2028} {"train_loss": -6.274264335632324, "global_step": 85201, "epoch": 2028} {"train_loss": -6.249786376953125, "global_step": 85202, "epoch": 2028} {"train_loss": -6.175448417663574, "global_step": 85203, "epoch": 2028} {"train_loss": -6.296097755432129, "global_step": 85204, "epoch": 2028} {"train_loss": -6.210367202758789, "global_step": 85205, "epoch": 2028} {"train_loss": -6.079545021057129, "global_step": 85206, "epoch": 2028} {"train_loss": -6.220373153686523, "global_step": 85207, "epoch": 2028} {"train_loss": -6.210497856140137, "global_step": 85208, "epoch": 2028} {"train_loss": -6.236219882965088, "global_step": 85209, "epoch": 2028} {"train_loss": -6.219327449798584, "global_step": 85210, "epoch": 2028} {"train_loss": -6.181567192077637, "global_step": 85211, "epoch": 2028} {"train_loss": -6.209445953369141, "global_step": 85212, "epoch": 2028} {"train_loss": -6.240041732788086, "global_step": 85213, "epoch": 2028} {"train_loss": -6.22672176361084, "global_step": 85214, "epoch": 2028} {"train_loss": -6.1508026123046875, "global_step": 85215, "epoch": 2028} {"train_loss": -6.200009346008301, "global_step": 85216, "epoch": 2028} {"train_loss": -6.192897172201247, "global_step": 85217, "epoch": 2028, "val_loss": 62606.65625} {"train_loss": -6.2572174072265625, "global_step": 85218, "epoch": 2029} {"train_loss": -6.2111592292785645, "global_step": 85219, "epoch": 2029} {"train_loss": -6.134620666503906, "global_step": 85220, "epoch": 2029} {"train_loss": -6.3221564292907715, "global_step": 85221, "epoch": 2029} {"train_loss": -6.284968376159668, "global_step": 85222, "epoch": 2029} {"train_loss": -6.155567169189453, "global_step": 85223, "epoch": 2029} {"train_loss": -6.31613826751709, "global_step": 85224, "epoch": 2029} {"train_loss": -6.334292888641357, "global_step": 85225, "epoch": 2029} {"train_loss": -6.314168930053711, "global_step": 85226, "epoch": 2029} {"train_loss": -6.1928253173828125, "global_step": 85227, "epoch": 2029} {"train_loss": -6.240095615386963, "global_step": 85228, "epoch": 2029} {"train_loss": -6.189374923706055, "global_step": 85229, "epoch": 2029} {"train_loss": -6.166003704071045, "global_step": 85230, "epoch": 2029} {"train_loss": -6.188368797302246, "global_step": 85231, "epoch": 2029} {"train_loss": -6.195519924163818, "global_step": 85232, "epoch": 2029} {"train_loss": -6.142143249511719, "global_step": 85233, "epoch": 2029} {"train_loss": -6.225513935089111, "global_step": 85234, "epoch": 2029} {"train_loss": -6.27714729309082, "global_step": 85235, "epoch": 2029} {"train_loss": -6.14605188369751, "global_step": 85236, "epoch": 2029} {"train_loss": -6.253497123718262, "global_step": 85237, "epoch": 2029} {"train_loss": -6.102898120880127, "global_step": 85238, "epoch": 2029} {"train_loss": -6.122185707092285, "global_step": 85239, "epoch": 2029} {"train_loss": -6.242450714111328, "global_step": 85240, "epoch": 2029} {"train_loss": -6.232694149017334, "global_step": 85241, "epoch": 2029} {"train_loss": -6.151691913604736, "global_step": 85242, "epoch": 2029} {"train_loss": -6.160881042480469, "global_step": 85243, "epoch": 2029} {"train_loss": -6.209535121917725, "global_step": 85244, "epoch": 2029} {"train_loss": -6.351668357849121, "global_step": 85245, "epoch": 2029} {"train_loss": -6.255342960357666, "global_step": 85246, "epoch": 2029} {"train_loss": -6.269929885864258, "global_step": 85247, "epoch": 2029} {"train_loss": -6.225491523742676, "global_step": 85248, "epoch": 2029} {"train_loss": -6.250975608825684, "global_step": 85249, "epoch": 2029} {"train_loss": -6.243481636047363, "global_step": 85250, "epoch": 2029} {"train_loss": -6.254647254943848, "global_step": 85251, "epoch": 2029} {"train_loss": -6.2062201499938965, "global_step": 85252, "epoch": 2029} {"train_loss": -6.178936958312988, "global_step": 85253, "epoch": 2029} {"train_loss": -6.339949131011963, "global_step": 85254, "epoch": 2029} {"train_loss": -6.19674825668335, "global_step": 85255, "epoch": 2029} {"train_loss": -6.117329120635986, "global_step": 85256, "epoch": 2029} {"train_loss": -6.105266571044922, "global_step": 85257, "epoch": 2029} {"train_loss": -6.222540855407715, "global_step": 85258, "epoch": 2029} {"train_loss": -6.217531930832636, "global_step": 85259, "epoch": 2029, "val_loss": 62758.83984375} {"train_loss": -6.1967926025390625, "global_step": 85260, "epoch": 2030} {"train_loss": -6.240496635437012, "global_step": 85261, "epoch": 2030} {"train_loss": -6.2823967933654785, "global_step": 85262, "epoch": 2030} {"train_loss": -6.155837535858154, "global_step": 85263, "epoch": 2030} {"train_loss": -6.152665138244629, "global_step": 85264, "epoch": 2030} {"train_loss": -6.27256441116333, "global_step": 85265, "epoch": 2030} {"train_loss": -6.287489414215088, "global_step": 85266, "epoch": 2030} {"train_loss": -6.176050186157227, "global_step": 85267, "epoch": 2030} {"train_loss": -6.191187858581543, "global_step": 85268, "epoch": 2030} {"train_loss": -6.1794891357421875, "global_step": 85269, "epoch": 2030} {"train_loss": -6.301271438598633, "global_step": 85270, "epoch": 2030} {"train_loss": -6.073095321655273, "global_step": 85271, "epoch": 2030} {"train_loss": -6.191723823547363, "global_step": 85272, "epoch": 2030} {"train_loss": -6.0885725021362305, "global_step": 85273, "epoch": 2030} {"train_loss": -6.1233673095703125, "global_step": 85274, "epoch": 2030} {"train_loss": -6.124384880065918, "global_step": 85275, "epoch": 2030} {"train_loss": -6.19973611831665, "global_step": 85276, "epoch": 2030} {"train_loss": -6.156467437744141, "global_step": 85277, "epoch": 2030} {"train_loss": -6.120861053466797, "global_step": 85278, "epoch": 2030} {"train_loss": -6.153194427490234, "global_step": 85279, "epoch": 2030} {"train_loss": -6.1504058837890625, "global_step": 85280, "epoch": 2030} {"train_loss": -6.2276835441589355, "global_step": 85281, "epoch": 2030} {"train_loss": -6.172763824462891, "global_step": 85282, "epoch": 2030} {"train_loss": -6.1542744636535645, "global_step": 85283, "epoch": 2030} {"train_loss": -6.23599100112915, "global_step": 85284, "epoch": 2030} {"train_loss": -6.284609794616699, "global_step": 85285, "epoch": 2030} {"train_loss": -6.191046714782715, "global_step": 85286, "epoch": 2030} {"train_loss": -6.183304309844971, "global_step": 85287, "epoch": 2030} {"train_loss": -6.14520788192749, "global_step": 85288, "epoch": 2030} {"train_loss": -6.1302642822265625, "global_step": 85289, "epoch": 2030} {"train_loss": -6.162411212921143, "global_step": 85290, "epoch": 2030} {"train_loss": -6.21462345123291, "global_step": 85291, "epoch": 2030} {"train_loss": -6.13635778427124, "global_step": 85292, "epoch": 2030} {"train_loss": -6.224452495574951, "global_step": 85293, "epoch": 2030} {"train_loss": -6.153097152709961, "global_step": 85294, "epoch": 2030} {"train_loss": -6.210622310638428, "global_step": 85295, "epoch": 2030} {"train_loss": -6.204497814178467, "global_step": 85296, "epoch": 2030} {"train_loss": -6.207466125488281, "global_step": 85297, "epoch": 2030} {"train_loss": -6.045919418334961, "global_step": 85298, "epoch": 2030} {"train_loss": -6.201676368713379, "global_step": 85299, "epoch": 2030} {"train_loss": -6.149703502655029, "global_step": 85300, "epoch": 2030} {"train_loss": -6.180716560000465, "global_step": 85301, "epoch": 2030, "val_loss": 62684.81640625} {"train_loss": -6.243309020996094, "global_step": 85302, "epoch": 2031} {"train_loss": -6.0883026123046875, "global_step": 85303, "epoch": 2031} {"train_loss": -6.080211162567139, "global_step": 85304, "epoch": 2031} {"train_loss": -6.203025817871094, "global_step": 85305, "epoch": 2031} {"train_loss": -6.015425682067871, "global_step": 85306, "epoch": 2031} {"train_loss": -6.11479377746582, "global_step": 85307, "epoch": 2031} {"train_loss": -6.193182945251465, "global_step": 85308, "epoch": 2031} {"train_loss": -6.081490993499756, "global_step": 85309, "epoch": 2031} {"train_loss": -6.084223747253418, "global_step": 85310, "epoch": 2031} {"train_loss": -6.124952793121338, "global_step": 85311, "epoch": 2031} {"train_loss": -6.076631546020508, "global_step": 85312, "epoch": 2031} {"train_loss": -6.120232582092285, "global_step": 85313, "epoch": 2031} {"train_loss": -6.163934707641602, "global_step": 85314, "epoch": 2031} {"train_loss": -6.070884704589844, "global_step": 85315, "epoch": 2031} {"train_loss": -6.115288257598877, "global_step": 85316, "epoch": 2031} {"train_loss": -6.267386436462402, "global_step": 85317, "epoch": 2031} {"train_loss": -6.119181156158447, "global_step": 85318, "epoch": 2031} {"train_loss": -6.194432258605957, "global_step": 85319, "epoch": 2031} {"train_loss": -6.217432975769043, "global_step": 85320, "epoch": 2031} {"train_loss": -6.133410930633545, "global_step": 85321, "epoch": 2031} {"train_loss": -6.220553398132324, "global_step": 85322, "epoch": 2031} {"train_loss": -6.233707904815674, "global_step": 85323, "epoch": 2031} {"train_loss": -6.1136369705200195, "global_step": 85324, "epoch": 2031} {"train_loss": -6.188736915588379, "global_step": 85325, "epoch": 2031} {"train_loss": -6.143088340759277, "global_step": 85326, "epoch": 2031} {"train_loss": -6.210809707641602, "global_step": 85327, "epoch": 2031} {"train_loss": -6.079619407653809, "global_step": 85328, "epoch": 2031} {"train_loss": -6.199469566345215, "global_step": 85329, "epoch": 2031} {"train_loss": -6.31076717376709, "global_step": 85330, "epoch": 2031} {"train_loss": -6.048164367675781, "global_step": 85331, "epoch": 2031} {"train_loss": -6.1578450202941895, "global_step": 85332, "epoch": 2031} {"train_loss": -6.121903896331787, "global_step": 85333, "epoch": 2031} {"train_loss": -6.088639259338379, "global_step": 85334, "epoch": 2031} {"train_loss": -6.1554155349731445, "global_step": 85335, "epoch": 2031} {"train_loss": -6.2699995040893555, "global_step": 85336, "epoch": 2031} {"train_loss": -6.219099521636963, "global_step": 85337, "epoch": 2031} {"train_loss": -6.183221817016602, "global_step": 85338, "epoch": 2031} {"train_loss": -6.158978462219238, "global_step": 85339, "epoch": 2031} {"train_loss": -6.31119966506958, "global_step": 85340, "epoch": 2031} {"train_loss": -6.1963791847229, "global_step": 85341, "epoch": 2031} {"train_loss": -6.2103352546691895, "global_step": 85342, "epoch": 2031} {"train_loss": -6.160703477405367, "global_step": 85343, "epoch": 2031, "val_loss": 62958.50390625} {"train_loss": -6.2045722007751465, "global_step": 85344, "epoch": 2032} {"train_loss": -6.238831520080566, "global_step": 85345, "epoch": 2032} {"train_loss": -6.172146797180176, "global_step": 85346, "epoch": 2032} {"train_loss": -6.081132411956787, "global_step": 85347, "epoch": 2032} {"train_loss": -6.267422199249268, "global_step": 85348, "epoch": 2032} {"train_loss": -6.133912086486816, "global_step": 85349, "epoch": 2032} {"train_loss": -6.107134819030762, "global_step": 85350, "epoch": 2032} {"train_loss": -6.148623466491699, "global_step": 85351, "epoch": 2032} {"train_loss": -6.198562145233154, "global_step": 85352, "epoch": 2032} {"train_loss": -6.129215240478516, "global_step": 85353, "epoch": 2032} {"train_loss": -6.240391731262207, "global_step": 85354, "epoch": 2032} {"train_loss": -6.197981357574463, "global_step": 85355, "epoch": 2032} {"train_loss": -6.150729179382324, "global_step": 85356, "epoch": 2032} {"train_loss": -6.243598937988281, "global_step": 85357, "epoch": 2032} {"train_loss": -6.207564353942871, "global_step": 85358, "epoch": 2032} {"train_loss": -6.122962951660156, "global_step": 85359, "epoch": 2032} {"train_loss": -6.0444440841674805, "global_step": 85360, "epoch": 2032} {"train_loss": -6.088772773742676, "global_step": 85361, "epoch": 2032} {"train_loss": -6.217446327209473, "global_step": 85362, "epoch": 2032} {"train_loss": -6.14514684677124, "global_step": 85363, "epoch": 2032} {"train_loss": -6.085012435913086, "global_step": 85364, "epoch": 2032} {"train_loss": -6.095247268676758, "global_step": 85365, "epoch": 2032} {"train_loss": -6.176000595092773, "global_step": 85366, "epoch": 2032} {"train_loss": -6.116823673248291, "global_step": 85367, "epoch": 2032} {"train_loss": -6.203376770019531, "global_step": 85368, "epoch": 2032} {"train_loss": -6.248450756072998, "global_step": 85369, "epoch": 2032} {"train_loss": -6.216960906982422, "global_step": 85370, "epoch": 2032} {"train_loss": -6.296658515930176, "global_step": 85371, "epoch": 2032} {"train_loss": -6.243170261383057, "global_step": 85372, "epoch": 2032} {"train_loss": -6.273727893829346, "global_step": 85373, "epoch": 2032} {"train_loss": -6.262429237365723, "global_step": 85374, "epoch": 2032} {"train_loss": -6.2675371170043945, "global_step": 85375, "epoch": 2032} {"train_loss": -6.128807544708252, "global_step": 85376, "epoch": 2032} {"train_loss": -6.223789215087891, "global_step": 85377, "epoch": 2032} {"train_loss": -6.256447792053223, "global_step": 85378, "epoch": 2032} {"train_loss": -6.201556205749512, "global_step": 85379, "epoch": 2032} {"train_loss": -6.179693698883057, "global_step": 85380, "epoch": 2032} {"train_loss": -6.212443828582764, "global_step": 85381, "epoch": 2032} {"train_loss": -6.313328742980957, "global_step": 85382, "epoch": 2032} {"train_loss": -6.314507484436035, "global_step": 85383, "epoch": 2032} {"train_loss": -6.1657304763793945, "global_step": 85384, "epoch": 2032} {"train_loss": -6.192527271452404, "global_step": 85385, "epoch": 2032, "val_loss": 62578.14453125} {"train_loss": -6.202152252197266, "global_step": 85386, "epoch": 2033} {"train_loss": -6.044652938842773, "global_step": 85387, "epoch": 2033} {"train_loss": -6.221987724304199, "global_step": 85388, "epoch": 2033} {"train_loss": -6.172280311584473, "global_step": 85389, "epoch": 2033} {"train_loss": -6.256077766418457, "global_step": 85390, "epoch": 2033} {"train_loss": -6.296459197998047, "global_step": 85391, "epoch": 2033} {"train_loss": -6.2334136962890625, "global_step": 85392, "epoch": 2033} {"train_loss": -6.356993675231934, "global_step": 85393, "epoch": 2033} {"train_loss": -6.29252815246582, "global_step": 85394, "epoch": 2033} {"train_loss": -6.098905563354492, "global_step": 85395, "epoch": 2033} {"train_loss": -6.1099853515625, "global_step": 85396, "epoch": 2033} {"train_loss": -6.246114730834961, "global_step": 85397, "epoch": 2033} {"train_loss": -6.181126594543457, "global_step": 85398, "epoch": 2033} {"train_loss": -6.195659637451172, "global_step": 85399, "epoch": 2033} {"train_loss": -6.203574180603027, "global_step": 85400, "epoch": 2033} {"train_loss": -6.276717185974121, "global_step": 85401, "epoch": 2033} {"train_loss": -6.150156021118164, "global_step": 85402, "epoch": 2033} {"train_loss": -6.031642913818359, "global_step": 85403, "epoch": 2033} {"train_loss": -6.297199249267578, "global_step": 85404, "epoch": 2033} {"train_loss": -6.165511131286621, "global_step": 85405, "epoch": 2033} {"train_loss": -6.246185779571533, "global_step": 85406, "epoch": 2033} {"train_loss": -6.087456226348877, "global_step": 85407, "epoch": 2033} {"train_loss": -6.1859564781188965, "global_step": 85408, "epoch": 2033} {"train_loss": -6.196139335632324, "global_step": 85409, "epoch": 2033} {"train_loss": -6.13114595413208, "global_step": 85410, "epoch": 2033} {"train_loss": -6.130546569824219, "global_step": 85411, "epoch": 2033} {"train_loss": -6.264646530151367, "global_step": 85412, "epoch": 2033} {"train_loss": -6.167479038238525, "global_step": 85413, "epoch": 2033} {"train_loss": -6.192777633666992, "global_step": 85414, "epoch": 2033} {"train_loss": -6.24120569229126, "global_step": 85415, "epoch": 2033} {"train_loss": -6.229556560516357, "global_step": 85416, "epoch": 2033} {"train_loss": -6.194693088531494, "global_step": 85417, "epoch": 2033} {"train_loss": -6.11370849609375, "global_step": 85418, "epoch": 2033} {"train_loss": -6.307963848114014, "global_step": 85419, "epoch": 2033} {"train_loss": -6.274978160858154, "global_step": 85420, "epoch": 2033} {"train_loss": -6.157112121582031, "global_step": 85421, "epoch": 2033} {"train_loss": -6.2114105224609375, "global_step": 85422, "epoch": 2033} {"train_loss": -6.096593379974365, "global_step": 85423, "epoch": 2033} {"train_loss": -6.228538990020752, "global_step": 85424, "epoch": 2033} {"train_loss": -6.169358253479004, "global_step": 85425, "epoch": 2033} {"train_loss": -6.2179059982299805, "global_step": 85426, "epoch": 2033} {"train_loss": -6.197696560905094, "global_step": 85427, "epoch": 2033, "val_loss": 62818.8828125} {"train_loss": -6.266661643981934, "global_step": 85428, "epoch": 2034} {"train_loss": -6.223446369171143, "global_step": 85429, "epoch": 2034} {"train_loss": -6.2110185623168945, "global_step": 85430, "epoch": 2034} {"train_loss": -6.195426940917969, "global_step": 85431, "epoch": 2034} {"train_loss": -6.1328229904174805, "global_step": 85432, "epoch": 2034} {"train_loss": -6.184520721435547, "global_step": 85433, "epoch": 2034} {"train_loss": -6.1468305587768555, "global_step": 85434, "epoch": 2034} {"train_loss": -6.366399765014648, "global_step": 85435, "epoch": 2034} {"train_loss": -6.181960105895996, "global_step": 85436, "epoch": 2034} {"train_loss": -6.205734729766846, "global_step": 85437, "epoch": 2034} {"train_loss": -6.274094581604004, "global_step": 85438, "epoch": 2034} {"train_loss": -6.185298919677734, "global_step": 85439, "epoch": 2034} {"train_loss": -6.195201873779297, "global_step": 85440, "epoch": 2034} {"train_loss": -6.1840362548828125, "global_step": 85441, "epoch": 2034} {"train_loss": -6.287409782409668, "global_step": 85442, "epoch": 2034} {"train_loss": -6.145401954650879, "global_step": 85443, "epoch": 2034} {"train_loss": -6.069618225097656, "global_step": 85444, "epoch": 2034} {"train_loss": -6.143797874450684, "global_step": 85445, "epoch": 2034} {"train_loss": -6.08833646774292, "global_step": 85446, "epoch": 2034} {"train_loss": -6.143650054931641, "global_step": 85447, "epoch": 2034} {"train_loss": -6.1583147048950195, "global_step": 85448, "epoch": 2034} {"train_loss": -6.064145088195801, "global_step": 85449, "epoch": 2034} {"train_loss": -6.29359245300293, "global_step": 85450, "epoch": 2034} {"train_loss": -6.280112266540527, "global_step": 85451, "epoch": 2034} {"train_loss": -6.217212677001953, "global_step": 85452, "epoch": 2034} {"train_loss": -6.18095588684082, "global_step": 85453, "epoch": 2034} {"train_loss": -6.1561689376831055, "global_step": 85454, "epoch": 2034} {"train_loss": -6.196283340454102, "global_step": 85455, "epoch": 2034} {"train_loss": -6.135770320892334, "global_step": 85456, "epoch": 2034} {"train_loss": -6.256365776062012, "global_step": 85457, "epoch": 2034} {"train_loss": -6.117283821105957, "global_step": 85458, "epoch": 2034} {"train_loss": -6.084864616394043, "global_step": 85459, "epoch": 2034} {"train_loss": -6.2207512855529785, "global_step": 85460, "epoch": 2034} {"train_loss": -6.172430515289307, "global_step": 85461, "epoch": 2034} {"train_loss": -6.224372863769531, "global_step": 85462, "epoch": 2034} {"train_loss": -6.182497978210449, "global_step": 85463, "epoch": 2034} {"train_loss": -6.217217445373535, "global_step": 85464, "epoch": 2034} {"train_loss": -6.240060806274414, "global_step": 85465, "epoch": 2034} {"train_loss": -6.258268356323242, "global_step": 85466, "epoch": 2034} {"train_loss": -6.22650146484375, "global_step": 85467, "epoch": 2034} {"train_loss": -6.196898460388184, "global_step": 85468, "epoch": 2034} {"train_loss": -6.192128749120803, "global_step": 85469, "epoch": 2034, "val_loss": 62779.97265625} {"train_loss": -6.2225260734558105, "global_step": 85470, "epoch": 2035} {"train_loss": -6.270041465759277, "global_step": 85471, "epoch": 2035} {"train_loss": -6.27985954284668, "global_step": 85472, "epoch": 2035} {"train_loss": -6.211334228515625, "global_step": 85473, "epoch": 2035} {"train_loss": -6.2734479904174805, "global_step": 85474, "epoch": 2035} {"train_loss": -6.149304389953613, "global_step": 85475, "epoch": 2035} {"train_loss": -6.2075514793396, "global_step": 85476, "epoch": 2035} {"train_loss": -6.235064506530762, "global_step": 85477, "epoch": 2035} {"train_loss": -6.256608009338379, "global_step": 85478, "epoch": 2035} {"train_loss": -6.237149715423584, "global_step": 85479, "epoch": 2035} {"train_loss": -6.340705871582031, "global_step": 85480, "epoch": 2035} {"train_loss": -6.284268379211426, "global_step": 85481, "epoch": 2035} {"train_loss": -6.264865875244141, "global_step": 85482, "epoch": 2035} {"train_loss": -6.266905307769775, "global_step": 85483, "epoch": 2035} {"train_loss": -6.282589435577393, "global_step": 85484, "epoch": 2035} {"train_loss": -6.127191066741943, "global_step": 85485, "epoch": 2035} {"train_loss": -6.343766212463379, "global_step": 85486, "epoch": 2035} {"train_loss": -6.180595397949219, "global_step": 85487, "epoch": 2035} {"train_loss": -6.170176029205322, "global_step": 85488, "epoch": 2035} {"train_loss": -6.145673751831055, "global_step": 85489, "epoch": 2035} {"train_loss": -6.303664207458496, "global_step": 85490, "epoch": 2035} {"train_loss": -6.160797119140625, "global_step": 85491, "epoch": 2035} {"train_loss": -6.2230424880981445, "global_step": 85492, "epoch": 2035} {"train_loss": -6.216659069061279, "global_step": 85493, "epoch": 2035} {"train_loss": -6.158425331115723, "global_step": 85494, "epoch": 2035} {"train_loss": -6.34761381149292, "global_step": 85495, "epoch": 2035} {"train_loss": -6.15669584274292, "global_step": 85496, "epoch": 2035} {"train_loss": -6.203699588775635, "global_step": 85497, "epoch": 2035} {"train_loss": -6.233038902282715, "global_step": 85498, "epoch": 2035} {"train_loss": -6.233499050140381, "global_step": 85499, "epoch": 2035} {"train_loss": -6.134442329406738, "global_step": 85500, "epoch": 2035} {"train_loss": -6.173583984375, "global_step": 85501, "epoch": 2035} {"train_loss": -6.113666534423828, "global_step": 85502, "epoch": 2035} {"train_loss": -6.203486442565918, "global_step": 85503, "epoch": 2035} {"train_loss": -6.281043529510498, "global_step": 85504, "epoch": 2035} {"train_loss": -6.077496528625488, "global_step": 85505, "epoch": 2035} {"train_loss": -6.161563873291016, "global_step": 85506, "epoch": 2035} {"train_loss": -6.1996870040893555, "global_step": 85507, "epoch": 2035} {"train_loss": -6.1535139083862305, "global_step": 85508, "epoch": 2035} {"train_loss": -6.244671821594238, "global_step": 85509, "epoch": 2035} {"train_loss": -6.130013465881348, "global_step": 85510, "epoch": 2035} {"train_loss": -6.212977772667294, "global_step": 85511, "epoch": 2035, "val_loss": 62813.76953125} {"train_loss": -6.175384521484375, "global_step": 85512, "epoch": 2036} {"train_loss": -6.11062479019165, "global_step": 85513, "epoch": 2036} {"train_loss": -6.1826982498168945, "global_step": 85514, "epoch": 2036} {"train_loss": -6.156517505645752, "global_step": 85515, "epoch": 2036} {"train_loss": -6.260251998901367, "global_step": 85516, "epoch": 2036} {"train_loss": -6.222406387329102, "global_step": 85517, "epoch": 2036} {"train_loss": -6.274658203125, "global_step": 85518, "epoch": 2036} {"train_loss": -6.175534248352051, "global_step": 85519, "epoch": 2036} {"train_loss": -6.22182559967041, "global_step": 85520, "epoch": 2036} {"train_loss": -6.092476844787598, "global_step": 85521, "epoch": 2036} {"train_loss": -6.228612899780273, "global_step": 85522, "epoch": 2036} {"train_loss": -6.262779235839844, "global_step": 85523, "epoch": 2036} {"train_loss": -6.2391157150268555, "global_step": 85524, "epoch": 2036} {"train_loss": -6.279265403747559, "global_step": 85525, "epoch": 2036} {"train_loss": -6.326898574829102, "global_step": 85526, "epoch": 2036} {"train_loss": -6.21236515045166, "global_step": 85527, "epoch": 2036} {"train_loss": -6.225622653961182, "global_step": 85528, "epoch": 2036} {"train_loss": -6.193334579467773, "global_step": 85529, "epoch": 2036} {"train_loss": -6.256989479064941, "global_step": 85530, "epoch": 2036} {"train_loss": -6.218642234802246, "global_step": 85531, "epoch": 2036} {"train_loss": -6.241777420043945, "global_step": 85532, "epoch": 2036} {"train_loss": -6.2523040771484375, "global_step": 85533, "epoch": 2036} {"train_loss": -6.251742839813232, "global_step": 85534, "epoch": 2036} {"train_loss": -6.11818790435791, "global_step": 85535, "epoch": 2036} {"train_loss": -6.25037145614624, "global_step": 85536, "epoch": 2036} {"train_loss": -6.224371433258057, "global_step": 85537, "epoch": 2036} {"train_loss": -6.114988803863525, "global_step": 85538, "epoch": 2036} {"train_loss": -6.251996040344238, "global_step": 85539, "epoch": 2036} {"train_loss": -6.299984931945801, "global_step": 85540, "epoch": 2036} {"train_loss": -6.2483625411987305, "global_step": 85541, "epoch": 2036} {"train_loss": -6.219337463378906, "global_step": 85542, "epoch": 2036} {"train_loss": -6.205106735229492, "global_step": 85543, "epoch": 2036} {"train_loss": -6.134282112121582, "global_step": 85544, "epoch": 2036} {"train_loss": -6.150759696960449, "global_step": 85545, "epoch": 2036} {"train_loss": -6.298859119415283, "global_step": 85546, "epoch": 2036} {"train_loss": -6.147398948669434, "global_step": 85547, "epoch": 2036} {"train_loss": -6.261090278625488, "global_step": 85548, "epoch": 2036} {"train_loss": -6.208902359008789, "global_step": 85549, "epoch": 2036} {"train_loss": -6.187838077545166, "global_step": 85550, "epoch": 2036} {"train_loss": -6.237718105316162, "global_step": 85551, "epoch": 2036} {"train_loss": -6.1601386070251465, "global_step": 85552, "epoch": 2036} {"train_loss": -6.216637577329363, "global_step": 85553, "epoch": 2036, "val_loss": 62655.06640625} {"train_loss": -6.260078430175781, "global_step": 85554, "epoch": 2037} {"train_loss": -6.193296432495117, "global_step": 85555, "epoch": 2037} {"train_loss": -6.2203288078308105, "global_step": 85556, "epoch": 2037} {"train_loss": -6.2501726150512695, "global_step": 85557, "epoch": 2037} {"train_loss": -6.202451705932617, "global_step": 85558, "epoch": 2037} {"train_loss": -6.283233642578125, "global_step": 85559, "epoch": 2037} {"train_loss": -6.276899337768555, "global_step": 85560, "epoch": 2037} {"train_loss": -6.103378772735596, "global_step": 85561, "epoch": 2037} {"train_loss": -6.278786659240723, "global_step": 85562, "epoch": 2037} {"train_loss": -6.153788089752197, "global_step": 85563, "epoch": 2037} {"train_loss": -6.173882484436035, "global_step": 85564, "epoch": 2037} {"train_loss": -6.183690547943115, "global_step": 85565, "epoch": 2037} {"train_loss": -6.033890724182129, "global_step": 85566, "epoch": 2037} {"train_loss": -6.061020851135254, "global_step": 85567, "epoch": 2037} {"train_loss": -6.222804069519043, "global_step": 85568, "epoch": 2037} {"train_loss": -6.053581237792969, "global_step": 85569, "epoch": 2037} {"train_loss": -6.083134174346924, "global_step": 85570, "epoch": 2037} {"train_loss": -6.077709674835205, "global_step": 85571, "epoch": 2037} {"train_loss": -6.034446716308594, "global_step": 85572, "epoch": 2037} {"train_loss": -6.08513069152832, "global_step": 85573, "epoch": 2037} {"train_loss": -6.00202751159668, "global_step": 85574, "epoch": 2037} {"train_loss": -6.06279182434082, "global_step": 85575, "epoch": 2037} {"train_loss": -5.952793121337891, "global_step": 85576, "epoch": 2037} {"train_loss": -6.143461227416992, "global_step": 85577, "epoch": 2037} {"train_loss": -5.973027229309082, "global_step": 85578, "epoch": 2037} {"train_loss": -6.227627754211426, "global_step": 85579, "epoch": 2037} {"train_loss": -6.092681407928467, "global_step": 85580, "epoch": 2037} {"train_loss": -6.1230316162109375, "global_step": 85581, "epoch": 2037} {"train_loss": -6.148931980133057, "global_step": 85582, "epoch": 2037} {"train_loss": -6.231656074523926, "global_step": 85583, "epoch": 2037} {"train_loss": -6.224503517150879, "global_step": 85584, "epoch": 2037} {"train_loss": -6.13248348236084, "global_step": 85585, "epoch": 2037} {"train_loss": -6.20020866394043, "global_step": 85586, "epoch": 2037} {"train_loss": -6.142201900482178, "global_step": 85587, "epoch": 2037} {"train_loss": -6.372054100036621, "global_step": 85588, "epoch": 2037} {"train_loss": -6.119738578796387, "global_step": 85589, "epoch": 2037} {"train_loss": -6.185249328613281, "global_step": 85590, "epoch": 2037} {"train_loss": -6.232357978820801, "global_step": 85591, "epoch": 2037} {"train_loss": -6.280758857727051, "global_step": 85592, "epoch": 2037} {"train_loss": -6.220346450805664, "global_step": 85593, "epoch": 2037} {"train_loss": -6.084781169891357, "global_step": 85594, "epoch": 2037} {"train_loss": -6.155990078335717, "global_step": 85595, "epoch": 2037, "val_loss": 62775.90625} {"train_loss": -6.202690601348877, "global_step": 85596, "epoch": 2038} {"train_loss": -6.2759294509887695, "global_step": 85597, "epoch": 2038} {"train_loss": -6.246132850646973, "global_step": 85598, "epoch": 2038} {"train_loss": -6.112393379211426, "global_step": 85599, "epoch": 2038} {"train_loss": -6.319873332977295, "global_step": 85600, "epoch": 2038} {"train_loss": -6.234402656555176, "global_step": 85601, "epoch": 2038} {"train_loss": -6.247006416320801, "global_step": 85602, "epoch": 2038} {"train_loss": -6.331710338592529, "global_step": 85603, "epoch": 2038} {"train_loss": -6.108373641967773, "global_step": 85604, "epoch": 2038} {"train_loss": -6.095635414123535, "global_step": 85605, "epoch": 2038} {"train_loss": -6.185633182525635, "global_step": 85606, "epoch": 2038} {"train_loss": -6.117104530334473, "global_step": 85607, "epoch": 2038} {"train_loss": -6.2021613121032715, "global_step": 85608, "epoch": 2038} {"train_loss": -6.298103332519531, "global_step": 85609, "epoch": 2038} {"train_loss": -6.183516979217529, "global_step": 85610, "epoch": 2038} {"train_loss": -6.176684856414795, "global_step": 85611, "epoch": 2038} {"train_loss": -6.143404006958008, "global_step": 85612, "epoch": 2038} {"train_loss": -6.256478786468506, "global_step": 85613, "epoch": 2038} {"train_loss": -6.201947212219238, "global_step": 85614, "epoch": 2038} {"train_loss": -6.218955993652344, "global_step": 85615, "epoch": 2038} {"train_loss": -6.227301597595215, "global_step": 85616, "epoch": 2038} {"train_loss": -6.228031158447266, "global_step": 85617, "epoch": 2038} {"train_loss": -6.10878849029541, "global_step": 85618, "epoch": 2038} {"train_loss": -6.212412357330322, "global_step": 85619, "epoch": 2038} {"train_loss": -6.261972427368164, "global_step": 85620, "epoch": 2038} {"train_loss": -6.250826835632324, "global_step": 85621, "epoch": 2038} {"train_loss": -6.249590873718262, "global_step": 85622, "epoch": 2038} {"train_loss": -6.20886754989624, "global_step": 85623, "epoch": 2038} {"train_loss": -6.330841064453125, "global_step": 85624, "epoch": 2038} {"train_loss": -6.305624008178711, "global_step": 85625, "epoch": 2038} {"train_loss": -6.319436073303223, "global_step": 85626, "epoch": 2038} {"train_loss": -6.360238552093506, "global_step": 85627, "epoch": 2038} {"train_loss": -6.2592573165893555, "global_step": 85628, "epoch": 2038} {"train_loss": -6.145565986633301, "global_step": 85629, "epoch": 2038} {"train_loss": -6.339140892028809, "global_step": 85630, "epoch": 2038} {"train_loss": -6.2506937980651855, "global_step": 85631, "epoch": 2038} {"train_loss": -6.193373680114746, "global_step": 85632, "epoch": 2038} {"train_loss": -6.194828987121582, "global_step": 85633, "epoch": 2038} {"train_loss": -6.370451927185059, "global_step": 85634, "epoch": 2038} {"train_loss": -6.120454788208008, "global_step": 85635, "epoch": 2038} {"train_loss": -6.184835433959961, "global_step": 85636, "epoch": 2038} {"train_loss": -6.226471469515846, "global_step": 85637, "epoch": 2038, "val_loss": 62650.21875} {"train_loss": -6.266103744506836, "global_step": 85638, "epoch": 2039} {"train_loss": -6.174846649169922, "global_step": 85639, "epoch": 2039} {"train_loss": -6.054091930389404, "global_step": 85640, "epoch": 2039} {"train_loss": -6.163229942321777, "global_step": 85641, "epoch": 2039} {"train_loss": -6.136233329772949, "global_step": 85642, "epoch": 2039} {"train_loss": -6.278630256652832, "global_step": 85643, "epoch": 2039} {"train_loss": -6.329553127288818, "global_step": 85644, "epoch": 2039} {"train_loss": -6.189844131469727, "global_step": 85645, "epoch": 2039} {"train_loss": -6.105567932128906, "global_step": 85646, "epoch": 2039} {"train_loss": -6.234152793884277, "global_step": 85647, "epoch": 2039} {"train_loss": -6.3531413078308105, "global_step": 85648, "epoch": 2039} {"train_loss": -6.131801605224609, "global_step": 85649, "epoch": 2039} {"train_loss": -6.286993980407715, "global_step": 85650, "epoch": 2039} {"train_loss": -6.203638076782227, "global_step": 85651, "epoch": 2039} {"train_loss": -6.269534111022949, "global_step": 85652, "epoch": 2039} {"train_loss": -6.270687580108643, "global_step": 85653, "epoch": 2039} {"train_loss": -6.220917224884033, "global_step": 85654, "epoch": 2039} {"train_loss": -6.295243740081787, "global_step": 85655, "epoch": 2039} {"train_loss": -6.2205424308776855, "global_step": 85656, "epoch": 2039} {"train_loss": -6.197930335998535, "global_step": 85657, "epoch": 2039} {"train_loss": -6.197636127471924, "global_step": 85658, "epoch": 2039} {"train_loss": -6.309077739715576, "global_step": 85659, "epoch": 2039} {"train_loss": -6.163219451904297, "global_step": 85660, "epoch": 2039} {"train_loss": -6.318533420562744, "global_step": 85661, "epoch": 2039} {"train_loss": -6.265447616577148, "global_step": 85662, "epoch": 2039} {"train_loss": -6.234131336212158, "global_step": 85663, "epoch": 2039} {"train_loss": -6.174284934997559, "global_step": 85664, "epoch": 2039} {"train_loss": -6.214336395263672, "global_step": 85665, "epoch": 2039} {"train_loss": -6.2678656578063965, "global_step": 85666, "epoch": 2039} {"train_loss": -6.189626693725586, "global_step": 85667, "epoch": 2039} {"train_loss": -6.249321460723877, "global_step": 85668, "epoch": 2039} {"train_loss": -6.232435703277588, "global_step": 85669, "epoch": 2039} {"train_loss": -6.2450785636901855, "global_step": 85670, "epoch": 2039} {"train_loss": -6.291617393493652, "global_step": 85671, "epoch": 2039} {"train_loss": -6.2327423095703125, "global_step": 85672, "epoch": 2039} {"train_loss": -6.242897987365723, "global_step": 85673, "epoch": 2039} {"train_loss": -6.261282920837402, "global_step": 85674, "epoch": 2039} {"train_loss": -6.194784164428711, "global_step": 85675, "epoch": 2039} {"train_loss": -6.15739107131958, "global_step": 85676, "epoch": 2039} {"train_loss": -6.14886474609375, "global_step": 85677, "epoch": 2039} {"train_loss": -6.133905410766602, "global_step": 85678, "epoch": 2039} {"train_loss": -6.219550791240874, "global_step": 85679, "epoch": 2039, "val_loss": 62846.3125} {"train_loss": -6.199821472167969, "global_step": 85680, "epoch": 2040} {"train_loss": -6.165879249572754, "global_step": 85681, "epoch": 2040} {"train_loss": -6.2010650634765625, "global_step": 85682, "epoch": 2040} {"train_loss": -6.238475799560547, "global_step": 85683, "epoch": 2040} {"train_loss": -6.235650062561035, "global_step": 85684, "epoch": 2040} {"train_loss": -6.224135398864746, "global_step": 85685, "epoch": 2040} {"train_loss": -6.232290267944336, "global_step": 85686, "epoch": 2040} {"train_loss": -6.1919660568237305, "global_step": 85687, "epoch": 2040} {"train_loss": -6.15821647644043, "global_step": 85688, "epoch": 2040} {"train_loss": -6.337320327758789, "global_step": 85689, "epoch": 2040} {"train_loss": -6.317561149597168, "global_step": 85690, "epoch": 2040} {"train_loss": -6.187335968017578, "global_step": 85691, "epoch": 2040} {"train_loss": -6.204892158508301, "global_step": 85692, "epoch": 2040} {"train_loss": -6.362752914428711, "global_step": 85693, "epoch": 2040} {"train_loss": -6.197659492492676, "global_step": 85694, "epoch": 2040} {"train_loss": -5.958156108856201, "global_step": 85695, "epoch": 2040} {"train_loss": -6.192558765411377, "global_step": 85696, "epoch": 2040} {"train_loss": -6.245486259460449, "global_step": 85697, "epoch": 2040} {"train_loss": -6.128018379211426, "global_step": 85698, "epoch": 2040} {"train_loss": -6.1189188957214355, "global_step": 85699, "epoch": 2040} {"train_loss": -6.196253776550293, "global_step": 85700, "epoch": 2040} {"train_loss": -6.076082706451416, "global_step": 85701, "epoch": 2040} {"train_loss": -6.150605201721191, "global_step": 85702, "epoch": 2040} {"train_loss": -6.141664981842041, "global_step": 85703, "epoch": 2040} {"train_loss": -6.064241886138916, "global_step": 85704, "epoch": 2040} {"train_loss": -6.229401588439941, "global_step": 85705, "epoch": 2040} {"train_loss": -6.211382865905762, "global_step": 85706, "epoch": 2040} {"train_loss": -6.158905029296875, "global_step": 85707, "epoch": 2040} {"train_loss": -6.209103584289551, "global_step": 85708, "epoch": 2040} {"train_loss": -6.182985782623291, "global_step": 85709, "epoch": 2040} {"train_loss": -6.192091941833496, "global_step": 85710, "epoch": 2040} {"train_loss": -6.213010787963867, "global_step": 85711, "epoch": 2040} {"train_loss": -6.076648712158203, "global_step": 85712, "epoch": 2040} {"train_loss": -6.282682418823242, "global_step": 85713, "epoch": 2040} {"train_loss": -6.16063117980957, "global_step": 85714, "epoch": 2040} {"train_loss": -6.2455620765686035, "global_step": 85715, "epoch": 2040} {"train_loss": -6.093809127807617, "global_step": 85716, "epoch": 2040} {"train_loss": -6.198894023895264, "global_step": 85717, "epoch": 2040} {"train_loss": -6.193617820739746, "global_step": 85718, "epoch": 2040} {"train_loss": -6.258547306060791, "global_step": 85719, "epoch": 2040} {"train_loss": -6.230317115783691, "global_step": 85720, "epoch": 2040} {"train_loss": -6.191932246798561, "global_step": 85721, "epoch": 2040, "val_loss": 63030.34375} {"train_loss": -6.226536273956299, "global_step": 85722, "epoch": 2041} {"train_loss": -6.241356372833252, "global_step": 85723, "epoch": 2041} {"train_loss": -6.294611930847168, "global_step": 85724, "epoch": 2041} {"train_loss": -6.19087028503418, "global_step": 85725, "epoch": 2041} {"train_loss": -6.182181358337402, "global_step": 85726, "epoch": 2041} {"train_loss": -6.306238174438477, "global_step": 85727, "epoch": 2041} {"train_loss": -6.198869228363037, "global_step": 85728, "epoch": 2041} {"train_loss": -6.004772663116455, "global_step": 85729, "epoch": 2041} {"train_loss": -6.191834449768066, "global_step": 85730, "epoch": 2041} {"train_loss": -6.188773155212402, "global_step": 85731, "epoch": 2041} {"train_loss": -6.088347434997559, "global_step": 85732, "epoch": 2041} {"train_loss": -6.24127197265625, "global_step": 85733, "epoch": 2041} {"train_loss": -6.161140441894531, "global_step": 85734, "epoch": 2041} {"train_loss": -6.221364974975586, "global_step": 85735, "epoch": 2041} {"train_loss": -6.258486270904541, "global_step": 85736, "epoch": 2041} {"train_loss": -6.129588603973389, "global_step": 85737, "epoch": 2041} {"train_loss": -6.244451999664307, "global_step": 85738, "epoch": 2041} {"train_loss": -6.141195297241211, "global_step": 85739, "epoch": 2041} {"train_loss": -6.175111293792725, "global_step": 85740, "epoch": 2041} {"train_loss": -6.194430351257324, "global_step": 85741, "epoch": 2041} {"train_loss": -6.318866729736328, "global_step": 85742, "epoch": 2041} {"train_loss": -6.176522254943848, "global_step": 85743, "epoch": 2041} {"train_loss": -6.243350505828857, "global_step": 85744, "epoch": 2041} {"train_loss": -6.163033485412598, "global_step": 85745, "epoch": 2041} {"train_loss": -6.175530433654785, "global_step": 85746, "epoch": 2041} {"train_loss": -6.159426689147949, "global_step": 85747, "epoch": 2041} {"train_loss": -6.195622444152832, "global_step": 85748, "epoch": 2041} {"train_loss": -6.227541923522949, "global_step": 85749, "epoch": 2041} {"train_loss": -6.200510025024414, "global_step": 85750, "epoch": 2041} {"train_loss": -6.308298110961914, "global_step": 85751, "epoch": 2041} {"train_loss": -6.248083114624023, "global_step": 85752, "epoch": 2041} {"train_loss": -6.256307125091553, "global_step": 85753, "epoch": 2041} {"train_loss": -6.227234840393066, "global_step": 85754, "epoch": 2041} {"train_loss": -6.3170623779296875, "global_step": 85755, "epoch": 2041} {"train_loss": -6.2527360916137695, "global_step": 85756, "epoch": 2041} {"train_loss": -6.186477184295654, "global_step": 85757, "epoch": 2041} {"train_loss": -6.13857889175415, "global_step": 85758, "epoch": 2041} {"train_loss": -6.2216386795043945, "global_step": 85759, "epoch": 2041} {"train_loss": -6.275933742523193, "global_step": 85760, "epoch": 2041} {"train_loss": -6.181523323059082, "global_step": 85761, "epoch": 2041} {"train_loss": -6.190516948699951, "global_step": 85762, "epoch": 2041} {"train_loss": -6.208605414345151, "global_step": 85763, "epoch": 2041, "val_loss": 62911.16015625} {"train_loss": -6.058443069458008, "global_step": 85764, "epoch": 2042} {"train_loss": -6.201079368591309, "global_step": 85765, "epoch": 2042} {"train_loss": -6.282094955444336, "global_step": 85766, "epoch": 2042} {"train_loss": -6.2387471199035645, "global_step": 85767, "epoch": 2042} {"train_loss": -6.182137489318848, "global_step": 85768, "epoch": 2042} {"train_loss": -6.223643779754639, "global_step": 85769, "epoch": 2042} {"train_loss": -6.177283763885498, "global_step": 85770, "epoch": 2042} {"train_loss": -6.242081642150879, "global_step": 85771, "epoch": 2042} {"train_loss": -6.221186637878418, "global_step": 85772, "epoch": 2042} {"train_loss": -6.1364359855651855, "global_step": 85773, "epoch": 2042} {"train_loss": -6.07000732421875, "global_step": 85774, "epoch": 2042} {"train_loss": -6.185758590698242, "global_step": 85775, "epoch": 2042} {"train_loss": -6.185937881469727, "global_step": 85776, "epoch": 2042} {"train_loss": -6.256896018981934, "global_step": 85777, "epoch": 2042} {"train_loss": -6.1647138595581055, "global_step": 85778, "epoch": 2042} {"train_loss": -6.1853861808776855, "global_step": 85779, "epoch": 2042} {"train_loss": -6.258996486663818, "global_step": 85780, "epoch": 2042} {"train_loss": -6.176456451416016, "global_step": 85781, "epoch": 2042} {"train_loss": -6.219422817230225, "global_step": 85782, "epoch": 2042} {"train_loss": -6.12124490737915, "global_step": 85783, "epoch": 2042} {"train_loss": -6.289244651794434, "global_step": 85784, "epoch": 2042} {"train_loss": -6.151317596435547, "global_step": 85785, "epoch": 2042} {"train_loss": -6.245218276977539, "global_step": 85786, "epoch": 2042} {"train_loss": -6.301925182342529, "global_step": 85787, "epoch": 2042} {"train_loss": -6.165968894958496, "global_step": 85788, "epoch": 2042} {"train_loss": -6.239690780639648, "global_step": 85789, "epoch": 2042} {"train_loss": -6.235874652862549, "global_step": 85790, "epoch": 2042} {"train_loss": -6.217103004455566, "global_step": 85791, "epoch": 2042} {"train_loss": -6.171154975891113, "global_step": 85792, "epoch": 2042} {"train_loss": -6.199769496917725, "global_step": 85793, "epoch": 2042} {"train_loss": -6.241495609283447, "global_step": 85794, "epoch": 2042} {"train_loss": -6.236227035522461, "global_step": 85795, "epoch": 2042} {"train_loss": -6.165545463562012, "global_step": 85796, "epoch": 2042} {"train_loss": -6.228153228759766, "global_step": 85797, "epoch": 2042} {"train_loss": -6.152393817901611, "global_step": 85798, "epoch": 2042} {"train_loss": -6.159324645996094, "global_step": 85799, "epoch": 2042} {"train_loss": -6.257238388061523, "global_step": 85800, "epoch": 2042} {"train_loss": -6.177020072937012, "global_step": 85801, "epoch": 2042} {"train_loss": -6.16109561920166, "global_step": 85802, "epoch": 2042} {"train_loss": -6.305214881896973, "global_step": 85803, "epoch": 2042} {"train_loss": -6.276931285858154, "global_step": 85804, "epoch": 2042} {"train_loss": -6.200739576703026, "global_step": 85805, "epoch": 2042, "val_loss": 62583.6640625} {"train_loss": -6.172768592834473, "global_step": 85806, "epoch": 2043} {"train_loss": -6.281538963317871, "global_step": 85807, "epoch": 2043} {"train_loss": -6.153963565826416, "global_step": 85808, "epoch": 2043} {"train_loss": -6.2141032218933105, "global_step": 85809, "epoch": 2043} {"train_loss": -6.302912712097168, "global_step": 85810, "epoch": 2043} {"train_loss": -6.273873329162598, "global_step": 85811, "epoch": 2043} {"train_loss": -6.2773237228393555, "global_step": 85812, "epoch": 2043} {"train_loss": -6.084802627563477, "global_step": 85813, "epoch": 2043} {"train_loss": -6.21746826171875, "global_step": 85814, "epoch": 2043} {"train_loss": -6.1161346435546875, "global_step": 85815, "epoch": 2043} {"train_loss": -6.174508094787598, "global_step": 85816, "epoch": 2043} {"train_loss": -6.0770792961120605, "global_step": 85817, "epoch": 2043} {"train_loss": -6.184186935424805, "global_step": 85818, "epoch": 2043} {"train_loss": -6.272641658782959, "global_step": 85819, "epoch": 2043} {"train_loss": -6.228080749511719, "global_step": 85820, "epoch": 2043} {"train_loss": -6.149075031280518, "global_step": 85821, "epoch": 2043} {"train_loss": -6.233898162841797, "global_step": 85822, "epoch": 2043} {"train_loss": -6.309311866760254, "global_step": 85823, "epoch": 2043} {"train_loss": -6.298033237457275, "global_step": 85824, "epoch": 2043} {"train_loss": -6.219369888305664, "global_step": 85825, "epoch": 2043} {"train_loss": -6.144075393676758, "global_step": 85826, "epoch": 2043} {"train_loss": -6.147601127624512, "global_step": 85827, "epoch": 2043} {"train_loss": -6.265340805053711, "global_step": 85828, "epoch": 2043} {"train_loss": -6.251919746398926, "global_step": 85829, "epoch": 2043} {"train_loss": -6.224971771240234, "global_step": 85830, "epoch": 2043} {"train_loss": -6.24123477935791, "global_step": 85831, "epoch": 2043} {"train_loss": -6.133920669555664, "global_step": 85832, "epoch": 2043} {"train_loss": -6.136560440063477, "global_step": 85833, "epoch": 2043} {"train_loss": -6.355538368225098, "global_step": 85834, "epoch": 2043} {"train_loss": -6.073729991912842, "global_step": 85835, "epoch": 2043} {"train_loss": -6.290202617645264, "global_step": 85836, "epoch": 2043} {"train_loss": -6.228740692138672, "global_step": 85837, "epoch": 2043} {"train_loss": -6.242908477783203, "global_step": 85838, "epoch": 2043} {"train_loss": -6.194923400878906, "global_step": 85839, "epoch": 2043} {"train_loss": -6.14014196395874, "global_step": 85840, "epoch": 2043} {"train_loss": -6.171356201171875, "global_step": 85841, "epoch": 2043} {"train_loss": -6.189823627471924, "global_step": 85842, "epoch": 2043} {"train_loss": -6.302292823791504, "global_step": 85843, "epoch": 2043} {"train_loss": -6.1946516036987305, "global_step": 85844, "epoch": 2043} {"train_loss": -6.237915515899658, "global_step": 85845, "epoch": 2043} {"train_loss": -6.138089179992676, "global_step": 85846, "epoch": 2043} {"train_loss": -6.210008575802758, "global_step": 85847, "epoch": 2043, "val_loss": 62637.96875} {"train_loss": -6.157299518585205, "global_step": 85848, "epoch": 2044} {"train_loss": -6.255439281463623, "global_step": 85849, "epoch": 2044} {"train_loss": -6.151127338409424, "global_step": 85850, "epoch": 2044} {"train_loss": -6.208004474639893, "global_step": 85851, "epoch": 2044} {"train_loss": -6.183040618896484, "global_step": 85852, "epoch": 2044} {"train_loss": -6.260685920715332, "global_step": 85853, "epoch": 2044} {"train_loss": -6.281293869018555, "global_step": 85854, "epoch": 2044} {"train_loss": -6.21524715423584, "global_step": 85855, "epoch": 2044} {"train_loss": -6.216610431671143, "global_step": 85856, "epoch": 2044} {"train_loss": -6.363228797912598, "global_step": 85857, "epoch": 2044} {"train_loss": -6.276592254638672, "global_step": 85858, "epoch": 2044} {"train_loss": -6.1078033447265625, "global_step": 85859, "epoch": 2044} {"train_loss": -6.199875354766846, "global_step": 85860, "epoch": 2044} {"train_loss": -6.164562702178955, "global_step": 85861, "epoch": 2044} {"train_loss": -6.295392036437988, "global_step": 85862, "epoch": 2044} {"train_loss": -6.2613043785095215, "global_step": 85863, "epoch": 2044} {"train_loss": -6.2281694412231445, "global_step": 85864, "epoch": 2044} {"train_loss": -6.10158634185791, "global_step": 85865, "epoch": 2044} {"train_loss": -6.230830669403076, "global_step": 85866, "epoch": 2044} {"train_loss": -6.325155258178711, "global_step": 85867, "epoch": 2044} {"train_loss": -6.227481842041016, "global_step": 85868, "epoch": 2044} {"train_loss": -6.223452091217041, "global_step": 85869, "epoch": 2044} {"train_loss": -6.126380443572998, "global_step": 85870, "epoch": 2044} {"train_loss": -6.306582450866699, "global_step": 85871, "epoch": 2044} {"train_loss": -6.219545841217041, "global_step": 85872, "epoch": 2044} {"train_loss": -6.132784843444824, "global_step": 85873, "epoch": 2044} {"train_loss": -6.27126932144165, "global_step": 85874, "epoch": 2044} {"train_loss": -6.210590362548828, "global_step": 85875, "epoch": 2044} {"train_loss": -6.233030319213867, "global_step": 85876, "epoch": 2044} {"train_loss": -6.1052775382995605, "global_step": 85877, "epoch": 2044} {"train_loss": -6.163642883300781, "global_step": 85878, "epoch": 2044} {"train_loss": -6.221054553985596, "global_step": 85879, "epoch": 2044} {"train_loss": -6.248465061187744, "global_step": 85880, "epoch": 2044} {"train_loss": -6.071018695831299, "global_step": 85881, "epoch": 2044} {"train_loss": -6.067929267883301, "global_step": 85882, "epoch": 2044} {"train_loss": -6.180593490600586, "global_step": 85883, "epoch": 2044} {"train_loss": -6.053332328796387, "global_step": 85884, "epoch": 2044} {"train_loss": -6.172295570373535, "global_step": 85885, "epoch": 2044} {"train_loss": -6.139364242553711, "global_step": 85886, "epoch": 2044} {"train_loss": -6.120391845703125, "global_step": 85887, "epoch": 2044} {"train_loss": -6.1500468254089355, "global_step": 85888, "epoch": 2044} {"train_loss": -6.199289548964727, "global_step": 85889, "epoch": 2044, "val_loss": 62985.28125} {"train_loss": -6.144224643707275, "global_step": 85890, "epoch": 2045} {"train_loss": -6.09342098236084, "global_step": 85891, "epoch": 2045} {"train_loss": -6.078579902648926, "global_step": 85892, "epoch": 2045} {"train_loss": -6.214751243591309, "global_step": 85893, "epoch": 2045} {"train_loss": -6.028177261352539, "global_step": 85894, "epoch": 2045} {"train_loss": -6.293199062347412, "global_step": 85895, "epoch": 2045} {"train_loss": -6.256634712219238, "global_step": 85896, "epoch": 2045} {"train_loss": -6.084550857543945, "global_step": 85897, "epoch": 2045} {"train_loss": -6.1508073806762695, "global_step": 85898, "epoch": 2045} {"train_loss": -6.254061222076416, "global_step": 85899, "epoch": 2045} {"train_loss": -6.2810540199279785, "global_step": 85900, "epoch": 2045} {"train_loss": -6.2816033363342285, "global_step": 85901, "epoch": 2045} {"train_loss": -6.285342216491699, "global_step": 85902, "epoch": 2045} {"train_loss": -6.175482273101807, "global_step": 85903, "epoch": 2045} {"train_loss": -6.218476295471191, "global_step": 85904, "epoch": 2045} {"train_loss": -6.202998161315918, "global_step": 85905, "epoch": 2045} {"train_loss": -6.277807235717773, "global_step": 85906, "epoch": 2045} {"train_loss": -6.200987815856934, "global_step": 85907, "epoch": 2045} {"train_loss": -6.217362403869629, "global_step": 85908, "epoch": 2045} {"train_loss": -6.240665912628174, "global_step": 85909, "epoch": 2045} {"train_loss": -6.144533634185791, "global_step": 85910, "epoch": 2045} {"train_loss": -6.310794353485107, "global_step": 85911, "epoch": 2045} {"train_loss": -6.213760852813721, "global_step": 85912, "epoch": 2045} {"train_loss": -6.226362228393555, "global_step": 85913, "epoch": 2045} {"train_loss": -6.183957576751709, "global_step": 85914, "epoch": 2045} {"train_loss": -6.1802825927734375, "global_step": 85915, "epoch": 2045} {"train_loss": -6.365558624267578, "global_step": 85916, "epoch": 2045} {"train_loss": -6.217531681060791, "global_step": 85917, "epoch": 2045} {"train_loss": -6.064761161804199, "global_step": 85918, "epoch": 2045} {"train_loss": -6.153019428253174, "global_step": 85919, "epoch": 2045} {"train_loss": -6.263660907745361, "global_step": 85920, "epoch": 2045} {"train_loss": -6.122952461242676, "global_step": 85921, "epoch": 2045} {"train_loss": -6.1966729164123535, "global_step": 85922, "epoch": 2045} {"train_loss": -6.144157409667969, "global_step": 85923, "epoch": 2045} {"train_loss": -6.137630462646484, "global_step": 85924, "epoch": 2045} {"train_loss": -6.208771705627441, "global_step": 85925, "epoch": 2045} {"train_loss": -6.220977783203125, "global_step": 85926, "epoch": 2045} {"train_loss": -6.186539173126221, "global_step": 85927, "epoch": 2045} {"train_loss": -6.332761764526367, "global_step": 85928, "epoch": 2045} {"train_loss": -6.220415115356445, "global_step": 85929, "epoch": 2045} {"train_loss": -6.236609935760498, "global_step": 85930, "epoch": 2045} {"train_loss": -6.202863034747896, "global_step": 85931, "epoch": 2045, "val_loss": 62761.0546875} {"train_loss": -6.213642120361328, "global_step": 85932, "epoch": 2046} {"train_loss": -6.207103729248047, "global_step": 85933, "epoch": 2046} {"train_loss": -6.269781112670898, "global_step": 85934, "epoch": 2046} {"train_loss": -6.166053295135498, "global_step": 85935, "epoch": 2046} {"train_loss": -6.203812599182129, "global_step": 85936, "epoch": 2046} {"train_loss": -6.151216506958008, "global_step": 85937, "epoch": 2046} {"train_loss": -6.1016387939453125, "global_step": 85938, "epoch": 2046} {"train_loss": -6.124707221984863, "global_step": 85939, "epoch": 2046} {"train_loss": -6.2721052169799805, "global_step": 85940, "epoch": 2046} {"train_loss": -6.265064239501953, "global_step": 85941, "epoch": 2046} {"train_loss": -6.2857770919799805, "global_step": 85942, "epoch": 2046} {"train_loss": -6.240588188171387, "global_step": 85943, "epoch": 2046} {"train_loss": -6.23602819442749, "global_step": 85944, "epoch": 2046} {"train_loss": -6.229496002197266, "global_step": 85945, "epoch": 2046} {"train_loss": -6.100920677185059, "global_step": 85946, "epoch": 2046} {"train_loss": -6.276110649108887, "global_step": 85947, "epoch": 2046} {"train_loss": -6.205454349517822, "global_step": 85948, "epoch": 2046} {"train_loss": -6.287547588348389, "global_step": 85949, "epoch": 2046} {"train_loss": -6.237570762634277, "global_step": 85950, "epoch": 2046} {"train_loss": -6.175976276397705, "global_step": 85951, "epoch": 2046} {"train_loss": -6.015817642211914, "global_step": 85952, "epoch": 2046} {"train_loss": -6.290152549743652, "global_step": 85953, "epoch": 2046} {"train_loss": -6.332905292510986, "global_step": 85954, "epoch": 2046} {"train_loss": -6.223854064941406, "global_step": 85955, "epoch": 2046} {"train_loss": -6.151695251464844, "global_step": 85956, "epoch": 2046} {"train_loss": -6.2974629402160645, "global_step": 85957, "epoch": 2046} {"train_loss": -6.1906819343566895, "global_step": 85958, "epoch": 2046} {"train_loss": -6.217601299285889, "global_step": 85959, "epoch": 2046} {"train_loss": -6.208799362182617, "global_step": 85960, "epoch": 2046} {"train_loss": -6.325454235076904, "global_step": 85961, "epoch": 2046} {"train_loss": -6.2188639640808105, "global_step": 85962, "epoch": 2046} {"train_loss": -6.220098495483398, "global_step": 85963, "epoch": 2046} {"train_loss": -6.234125137329102, "global_step": 85964, "epoch": 2046} {"train_loss": -6.177487850189209, "global_step": 85965, "epoch": 2046} {"train_loss": -6.084983825683594, "global_step": 85966, "epoch": 2046} {"train_loss": -6.227879524230957, "global_step": 85967, "epoch": 2046} {"train_loss": -6.245553016662598, "global_step": 85968, "epoch": 2046} {"train_loss": -6.114621639251709, "global_step": 85969, "epoch": 2046} {"train_loss": -6.177901268005371, "global_step": 85970, "epoch": 2046} {"train_loss": -6.077449798583984, "global_step": 85971, "epoch": 2046} {"train_loss": -6.106305122375488, "global_step": 85972, "epoch": 2046} {"train_loss": -6.202196257455008, "global_step": 85973, "epoch": 2046, "val_loss": 62804.08984375} {"train_loss": -6.221046447753906, "global_step": 85974, "epoch": 2047} {"train_loss": -6.10026741027832, "global_step": 85975, "epoch": 2047} {"train_loss": -6.232539176940918, "global_step": 85976, "epoch": 2047} {"train_loss": -6.211930274963379, "global_step": 85977, "epoch": 2047} {"train_loss": -6.13824462890625, "global_step": 85978, "epoch": 2047} {"train_loss": -6.138267993927002, "global_step": 85979, "epoch": 2047} {"train_loss": -6.238728046417236, "global_step": 85980, "epoch": 2047} {"train_loss": -6.197135925292969, "global_step": 85981, "epoch": 2047} {"train_loss": -6.354465007781982, "global_step": 85982, "epoch": 2047} {"train_loss": -6.182056903839111, "global_step": 85983, "epoch": 2047} {"train_loss": -6.3251237869262695, "global_step": 85984, "epoch": 2047} {"train_loss": -6.301534175872803, "global_step": 85985, "epoch": 2047} {"train_loss": -6.213505268096924, "global_step": 85986, "epoch": 2047} {"train_loss": -6.113267421722412, "global_step": 85987, "epoch": 2047} {"train_loss": -6.260568618774414, "global_step": 85988, "epoch": 2047} {"train_loss": -6.185009479522705, "global_step": 85989, "epoch": 2047} {"train_loss": -6.3456621170043945, "global_step": 85990, "epoch": 2047} {"train_loss": -6.272043228149414, "global_step": 85991, "epoch": 2047} {"train_loss": -6.12813663482666, "global_step": 85992, "epoch": 2047} {"train_loss": -6.232113838195801, "global_step": 85993, "epoch": 2047} {"train_loss": -6.159344673156738, "global_step": 85994, "epoch": 2047} {"train_loss": -6.114529132843018, "global_step": 85995, "epoch": 2047} {"train_loss": -6.161740303039551, "global_step": 85996, "epoch": 2047} {"train_loss": -6.248658180236816, "global_step": 85997, "epoch": 2047} {"train_loss": -6.187901496887207, "global_step": 85998, "epoch": 2047} {"train_loss": -6.1787238121032715, "global_step": 85999, "epoch": 2047} {"train_loss": -6.2417707443237305, "global_step": 86000, "epoch": 2047} {"train_loss": -6.211647987365723, "global_step": 86001, "epoch": 2047} {"train_loss": -6.307700157165527, "global_step": 86002, "epoch": 2047} {"train_loss": -6.17081880569458, "global_step": 86003, "epoch": 2047} {"train_loss": -6.213386535644531, "global_step": 86004, "epoch": 2047} {"train_loss": -6.163585186004639, "global_step": 86005, "epoch": 2047} {"train_loss": -6.1834235191345215, "global_step": 86006, "epoch": 2047} {"train_loss": -6.20778751373291, "global_step": 86007, "epoch": 2047} {"train_loss": -6.187824249267578, "global_step": 86008, "epoch": 2047} {"train_loss": -6.1555867195129395, "global_step": 86009, "epoch": 2047} {"train_loss": -6.148210048675537, "global_step": 86010, "epoch": 2047} {"train_loss": -6.296937942504883, "global_step": 86011, "epoch": 2047} {"train_loss": -6.145956039428711, "global_step": 86012, "epoch": 2047} {"train_loss": -6.067601203918457, "global_step": 86013, "epoch": 2047} {"train_loss": -6.1504340171813965, "global_step": 86014, "epoch": 2047} {"train_loss": -6.201721588770549, "global_step": 86015, "epoch": 2047, "val_loss": 62753.546875} {"train_loss": -6.255845069885254, "global_step": 86016, "epoch": 2048} {"train_loss": -6.128342628479004, "global_step": 86017, "epoch": 2048} {"train_loss": -6.257828235626221, "global_step": 86018, "epoch": 2048} {"train_loss": -6.227579116821289, "global_step": 86019, "epoch": 2048} {"train_loss": -6.202336311340332, "global_step": 86020, "epoch": 2048} {"train_loss": -6.21379280090332, "global_step": 86021, "epoch": 2048} {"train_loss": -6.181339263916016, "global_step": 86022, "epoch": 2048} {"train_loss": -6.287530899047852, "global_step": 86023, "epoch": 2048} {"train_loss": -6.1474809646606445, "global_step": 86024, "epoch": 2048} {"train_loss": -6.076657295227051, "global_step": 86025, "epoch": 2048} {"train_loss": -6.057002067565918, "global_step": 86026, "epoch": 2048} {"train_loss": -6.183495998382568, "global_step": 86027, "epoch": 2048} {"train_loss": -6.150433540344238, "global_step": 86028, "epoch": 2048} {"train_loss": -6.233663558959961, "global_step": 86029, "epoch": 2048} {"train_loss": -6.162961483001709, "global_step": 86030, "epoch": 2048} {"train_loss": -6.118814945220947, "global_step": 86031, "epoch": 2048} {"train_loss": -6.198594570159912, "global_step": 86032, "epoch": 2048} {"train_loss": -6.152876377105713, "global_step": 86033, "epoch": 2048} {"train_loss": -6.220808029174805, "global_step": 86034, "epoch": 2048} {"train_loss": -6.234136581420898, "global_step": 86035, "epoch": 2048} {"train_loss": -6.09476375579834, "global_step": 86036, "epoch": 2048} {"train_loss": -6.218851089477539, "global_step": 86037, "epoch": 2048} {"train_loss": -6.252649784088135, "global_step": 86038, "epoch": 2048} {"train_loss": -6.29941463470459, "global_step": 86039, "epoch": 2048} {"train_loss": -6.309218406677246, "global_step": 86040, "epoch": 2048} {"train_loss": -6.201572418212891, "global_step": 86041, "epoch": 2048} {"train_loss": -6.125308513641357, "global_step": 86042, "epoch": 2048} {"train_loss": -6.282412528991699, "global_step": 86043, "epoch": 2048} {"train_loss": -6.217770576477051, "global_step": 86044, "epoch": 2048} {"train_loss": -6.1923980712890625, "global_step": 86045, "epoch": 2048} {"train_loss": -6.230283737182617, "global_step": 86046, "epoch": 2048} {"train_loss": -6.312836647033691, "global_step": 86047, "epoch": 2048} {"train_loss": -6.1686859130859375, "global_step": 86048, "epoch": 2048} {"train_loss": -6.241275787353516, "global_step": 86049, "epoch": 2048} {"train_loss": -6.240923881530762, "global_step": 86050, "epoch": 2048} {"train_loss": -6.219057083129883, "global_step": 86051, "epoch": 2048} {"train_loss": -6.19651985168457, "global_step": 86052, "epoch": 2048} {"train_loss": -6.162743091583252, "global_step": 86053, "epoch": 2048} {"train_loss": -6.029651165008545, "global_step": 86054, "epoch": 2048} {"train_loss": -6.215025424957275, "global_step": 86055, "epoch": 2048} {"train_loss": -6.0842413902282715, "global_step": 86056, "epoch": 2048} {"train_loss": -6.192522162482852, "global_step": 86057, "epoch": 2048, "val_loss": 63070.54296875} {"train_loss": -6.179553031921387, "global_step": 86058, "epoch": 2049} {"train_loss": -6.109168529510498, "global_step": 86059, "epoch": 2049} {"train_loss": -6.07982063293457, "global_step": 86060, "epoch": 2049} {"train_loss": -6.1846160888671875, "global_step": 86061, "epoch": 2049} {"train_loss": -6.184233665466309, "global_step": 86062, "epoch": 2049} {"train_loss": -6.042020320892334, "global_step": 86063, "epoch": 2049} {"train_loss": -6.255934238433838, "global_step": 86064, "epoch": 2049} {"train_loss": -6.204951286315918, "global_step": 86065, "epoch": 2049} {"train_loss": -6.13397216796875, "global_step": 86066, "epoch": 2049} {"train_loss": -6.072606086730957, "global_step": 86067, "epoch": 2049} {"train_loss": -6.168788909912109, "global_step": 86068, "epoch": 2049} {"train_loss": -6.17615270614624, "global_step": 86069, "epoch": 2049} {"train_loss": -6.1563310623168945, "global_step": 86070, "epoch": 2049} {"train_loss": -6.051801681518555, "global_step": 86071, "epoch": 2049} {"train_loss": -6.146081447601318, "global_step": 86072, "epoch": 2049} {"train_loss": -6.100287437438965, "global_step": 86073, "epoch": 2049} {"train_loss": -6.200998306274414, "global_step": 86074, "epoch": 2049} {"train_loss": -6.261122703552246, "global_step": 86075, "epoch": 2049} {"train_loss": -6.2342848777771, "global_step": 86076, "epoch": 2049} {"train_loss": -6.153607368469238, "global_step": 86077, "epoch": 2049} {"train_loss": -6.215020656585693, "global_step": 86078, "epoch": 2049} {"train_loss": -6.296379089355469, "global_step": 86079, "epoch": 2049} {"train_loss": -6.208772659301758, "global_step": 86080, "epoch": 2049} {"train_loss": -6.127972602844238, "global_step": 86081, "epoch": 2049} {"train_loss": -6.3143391609191895, "global_step": 86082, "epoch": 2049} {"train_loss": -6.21610164642334, "global_step": 86083, "epoch": 2049} {"train_loss": -6.221192836761475, "global_step": 86084, "epoch": 2049} {"train_loss": -6.278080463409424, "global_step": 86085, "epoch": 2049} {"train_loss": -6.140983581542969, "global_step": 86086, "epoch": 2049} {"train_loss": -6.290802001953125, "global_step": 86087, "epoch": 2049} {"train_loss": -6.1890764236450195, "global_step": 86088, "epoch": 2049} {"train_loss": -6.223401069641113, "global_step": 86089, "epoch": 2049} {"train_loss": -6.195833206176758, "global_step": 86090, "epoch": 2049} {"train_loss": -6.212946891784668, "global_step": 86091, "epoch": 2049} {"train_loss": -6.27264928817749, "global_step": 86092, "epoch": 2049} {"train_loss": -6.226489543914795, "global_step": 86093, "epoch": 2049} {"train_loss": -6.3283843994140625, "global_step": 86094, "epoch": 2049} {"train_loss": -6.363283634185791, "global_step": 86095, "epoch": 2049} {"train_loss": -6.0755228996276855, "global_step": 86096, "epoch": 2049} {"train_loss": -6.285076141357422, "global_step": 86097, "epoch": 2049} {"train_loss": -6.201818943023682, "global_step": 86098, "epoch": 2049} {"train_loss": -6.1947320983523415, "global_step": 86099, "epoch": 2049, "val_loss": 62931.72265625} {"train_loss": -6.2383012771606445, "global_step": 86100, "epoch": 2050} {"train_loss": -6.226689338684082, "global_step": 86101, "epoch": 2050} {"train_loss": -6.255061149597168, "global_step": 86102, "epoch": 2050} {"train_loss": -6.2100605964660645, "global_step": 86103, "epoch": 2050} {"train_loss": -6.147848129272461, "global_step": 86104, "epoch": 2050} {"train_loss": -6.340534210205078, "global_step": 86105, "epoch": 2050} {"train_loss": -6.190235137939453, "global_step": 86106, "epoch": 2050} {"train_loss": -6.240691184997559, "global_step": 86107, "epoch": 2050} {"train_loss": -6.225401878356934, "global_step": 86108, "epoch": 2050} {"train_loss": -6.171015739440918, "global_step": 86109, "epoch": 2050} {"train_loss": -6.199364185333252, "global_step": 86110, "epoch": 2050} {"train_loss": -6.282011032104492, "global_step": 86111, "epoch": 2050} {"train_loss": -6.1243462562561035, "global_step": 86112, "epoch": 2050} {"train_loss": -6.133419036865234, "global_step": 86113, "epoch": 2050} {"train_loss": -6.173286437988281, "global_step": 86114, "epoch": 2050} {"train_loss": -6.155406951904297, "global_step": 86115, "epoch": 2050} {"train_loss": -6.179173469543457, "global_step": 86116, "epoch": 2050} {"train_loss": -6.210303783416748, "global_step": 86117, "epoch": 2050} {"train_loss": -6.198424339294434, "global_step": 86118, "epoch": 2050} {"train_loss": -6.158090591430664, "global_step": 86119, "epoch": 2050} {"train_loss": -6.323084831237793, "global_step": 86120, "epoch": 2050} {"train_loss": -6.302707672119141, "global_step": 86121, "epoch": 2050} {"train_loss": -6.271170616149902, "global_step": 86122, "epoch": 2050} {"train_loss": -6.21524715423584, "global_step": 86123, "epoch": 2050} {"train_loss": -6.085221290588379, "global_step": 86124, "epoch": 2050} {"train_loss": -6.134498596191406, "global_step": 86125, "epoch": 2050} {"train_loss": -6.21829080581665, "global_step": 86126, "epoch": 2050} {"train_loss": -6.256281852722168, "global_step": 86127, "epoch": 2050} {"train_loss": -6.194520950317383, "global_step": 86128, "epoch": 2050} {"train_loss": -6.315473556518555, "global_step": 86129, "epoch": 2050} {"train_loss": -6.129944801330566, "global_step": 86130, "epoch": 2050} {"train_loss": -6.1028218269348145, "global_step": 86131, "epoch": 2050} {"train_loss": -6.179306507110596, "global_step": 86132, "epoch": 2050} {"train_loss": -6.28629207611084, "global_step": 86133, "epoch": 2050} {"train_loss": -6.263430595397949, "global_step": 86134, "epoch": 2050} {"train_loss": -6.0610671043396, "global_step": 86135, "epoch": 2050} {"train_loss": -6.268026351928711, "global_step": 86136, "epoch": 2050} {"train_loss": -6.181046962738037, "global_step": 86137, "epoch": 2050} {"train_loss": -6.210361480712891, "global_step": 86138, "epoch": 2050} {"train_loss": -6.14669132232666, "global_step": 86139, "epoch": 2050} {"train_loss": -6.086103439331055, "global_step": 86140, "epoch": 2050} {"train_loss": -6.203292460668655, "global_step": 86141, "epoch": 2050, "train/sim_max_reward_0": 0.19788164756883553, "train/sim_max_reward_1": 0.8996800073324261, "train/sim_max_reward_2": 0.9131790524564043, "train/sim_max_reward_3": 0.6999041178935329, "train/sim_max_reward_4": 0.9459579734286987, "train/sim_max_reward_5": 0.9841143979617649, "test/sim_max_reward_4300000": 0.1384628391774553, "test/sim_max_reward_4300001": 0.5734091234600505, "test/sim_max_reward_4300002": 0.8829495130076248, "test/sim_max_reward_4300003": 0.886185283390145, "test/sim_max_reward_4300004": 0.23170503147064522, "test/sim_max_reward_4300005": 0.8898500387283115, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.46608396807067054, "test/sim_max_reward_4300008": 0.820177172209766, "test/sim_max_reward_4300009": 0.7950806327436173, "test/sim_max_reward_4300010": 1.0, "test/sim_max_reward_4300011": 0.38264552127569185, "test/sim_max_reward_4300012": 0.9310967739816017, "test/sim_max_reward_4300013": 0.41274078134881864, "test/sim_max_reward_4300014": 0.74114967312225, "test/sim_max_reward_4300015": 0.9581477133142845, "test/sim_max_reward_4300016": 0.9489850952595364, "test/sim_max_reward_4300017": 0.8926732664845635, "test/sim_max_reward_4300018": 0.3206750767483088, "test/sim_max_reward_4300019": 0.18556295056646327, "test/sim_max_reward_4300020": 0.9397399998111551, "test/sim_max_reward_4300021": 0.9854726176356193, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.34905033285669257, "test/sim_max_reward_4300024": 0.929419724485512, "test/sim_max_reward_4300025": 0.8508244281478778, "test/sim_max_reward_4300026": 0.08017986696628279, "test/sim_max_reward_4300027": 0.9036795698926341, "test/sim_max_reward_4300028": 0.8889378658851129, "test/sim_max_reward_4300029": 0.9146903319765943, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.3132899277726237, "test/sim_max_reward_4300032": 0.9244358396498136, "test/sim_max_reward_4300033": 0.8791632857740447, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.9028630740409999, "test/sim_max_reward_4300036": 0.20939569530483287, "test/sim_max_reward_4300037": 0.9888147389244492, "test/sim_max_reward_4300038": 0.39596930135789443, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.8215044835660216, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.9997296089442912, "test/sim_max_reward_4300043": 0.7133811350589703, "test/sim_max_reward_4300044": 0.7137327462978351, "test/sim_max_reward_4300045": 0.6123119416317903, "test/sim_max_reward_4300046": 0.09043882771687772, "test/sim_max_reward_4300047": 0.74151890576158, "test/sim_max_reward_4300048": 1.0, "test/sim_max_reward_4300049": 0.0, "train/mean_score": 0.7734528661069437, "test/mean_score": 0.6321224940763862, "val_loss": 62915.609375} {"train_loss": -6.200920104980469, "global_step": 86142, "epoch": 2051} {"train_loss": -6.10911750793457, "global_step": 86143, "epoch": 2051} {"train_loss": -6.228359222412109, "global_step": 86144, "epoch": 2051} {"train_loss": -6.178820610046387, "global_step": 86145, "epoch": 2051} {"train_loss": -6.212058067321777, "global_step": 86146, "epoch": 2051} {"train_loss": -6.243353843688965, "global_step": 86147, "epoch": 2051} {"train_loss": -6.207755088806152, "global_step": 86148, "epoch": 2051} {"train_loss": -6.251852512359619, "global_step": 86149, "epoch": 2051} {"train_loss": -6.2081708908081055, "global_step": 86150, "epoch": 2051} {"train_loss": -6.308135986328125, "global_step": 86151, "epoch": 2051} {"train_loss": -6.14943790435791, "global_step": 86152, "epoch": 2051} {"train_loss": -6.157602787017822, "global_step": 86153, "epoch": 2051} {"train_loss": -6.228097915649414, "global_step": 86154, "epoch": 2051} {"train_loss": -6.137495040893555, "global_step": 86155, "epoch": 2051} {"train_loss": -6.309056282043457, "global_step": 86156, "epoch": 2051} {"train_loss": -6.0681915283203125, "global_step": 86157, "epoch": 2051} {"train_loss": -6.320617198944092, "global_step": 86158, "epoch": 2051} {"train_loss": -6.330202579498291, "global_step": 86159, "epoch": 2051} {"train_loss": -6.228957176208496, "global_step": 86160, "epoch": 2051} {"train_loss": -6.230274200439453, "global_step": 86161, "epoch": 2051} {"train_loss": -6.220787048339844, "global_step": 86162, "epoch": 2051} {"train_loss": -6.219985008239746, "global_step": 86163, "epoch": 2051} {"train_loss": -6.128462314605713, "global_step": 86164, "epoch": 2051} {"train_loss": -6.281241416931152, "global_step": 86165, "epoch": 2051} {"train_loss": -6.2924909591674805, "global_step": 86166, "epoch": 2051} {"train_loss": -6.236793041229248, "global_step": 86167, "epoch": 2051} {"train_loss": -6.37397575378418, "global_step": 86168, "epoch": 2051} {"train_loss": -6.147446632385254, "global_step": 86169, "epoch": 2051} {"train_loss": -6.158435821533203, "global_step": 86170, "epoch": 2051} {"train_loss": -6.3951497077941895, "global_step": 86171, "epoch": 2051} {"train_loss": -6.238808631896973, "global_step": 86172, "epoch": 2051} {"train_loss": -6.170481204986572, "global_step": 86173, "epoch": 2051} {"train_loss": -6.29887580871582, "global_step": 86174, "epoch": 2051} {"train_loss": -6.31019401550293, "global_step": 86175, "epoch": 2051} {"train_loss": -6.175469398498535, "global_step": 86176, "epoch": 2051} {"train_loss": -6.1976189613342285, "global_step": 86177, "epoch": 2051} {"train_loss": -6.25124979019165, "global_step": 86178, "epoch": 2051} {"train_loss": -6.264674186706543, "global_step": 86179, "epoch": 2051} {"train_loss": -6.180431365966797, "global_step": 86180, "epoch": 2051} {"train_loss": -6.24199914932251, "global_step": 86181, "epoch": 2051} {"train_loss": -6.037569999694824, "global_step": 86182, "epoch": 2051} {"train_loss": -6.221642619087582, "global_step": 86183, "epoch": 2051, "val_loss": 62964.63671875} {"train_loss": -6.294322967529297, "global_step": 86184, "epoch": 2052} {"train_loss": -6.248246192932129, "global_step": 86185, "epoch": 2052} {"train_loss": -6.297912120819092, "global_step": 86186, "epoch": 2052} {"train_loss": -6.314387321472168, "global_step": 86187, "epoch": 2052} {"train_loss": -6.277398109436035, "global_step": 86188, "epoch": 2052} {"train_loss": -6.344027519226074, "global_step": 86189, "epoch": 2052} {"train_loss": -6.235074043273926, "global_step": 86190, "epoch": 2052} {"train_loss": -6.205055236816406, "global_step": 86191, "epoch": 2052} {"train_loss": -6.253073215484619, "global_step": 86192, "epoch": 2052} {"train_loss": -6.154248237609863, "global_step": 86193, "epoch": 2052} {"train_loss": -6.166098594665527, "global_step": 86194, "epoch": 2052} {"train_loss": -6.308259010314941, "global_step": 86195, "epoch": 2052} {"train_loss": -6.128177642822266, "global_step": 86196, "epoch": 2052} {"train_loss": -6.178830146789551, "global_step": 86197, "epoch": 2052} {"train_loss": -6.139532566070557, "global_step": 86198, "epoch": 2052} {"train_loss": -6.11830472946167, "global_step": 86199, "epoch": 2052} {"train_loss": -6.193178653717041, "global_step": 86200, "epoch": 2052} {"train_loss": -6.227661609649658, "global_step": 86201, "epoch": 2052} {"train_loss": -6.216772556304932, "global_step": 86202, "epoch": 2052} {"train_loss": -6.108019828796387, "global_step": 86203, "epoch": 2052} {"train_loss": -6.1682281494140625, "global_step": 86204, "epoch": 2052} {"train_loss": -6.183133602142334, "global_step": 86205, "epoch": 2052} {"train_loss": -6.201141357421875, "global_step": 86206, "epoch": 2052} {"train_loss": -6.08751106262207, "global_step": 86207, "epoch": 2052} {"train_loss": -6.212353706359863, "global_step": 86208, "epoch": 2052} {"train_loss": -6.240012168884277, "global_step": 86209, "epoch": 2052} {"train_loss": -6.100857734680176, "global_step": 86210, "epoch": 2052} {"train_loss": -6.234281539916992, "global_step": 86211, "epoch": 2052} {"train_loss": -6.187692165374756, "global_step": 86212, "epoch": 2052} {"train_loss": -6.222842216491699, "global_step": 86213, "epoch": 2052} {"train_loss": -6.127920150756836, "global_step": 86214, "epoch": 2052} {"train_loss": -6.245290279388428, "global_step": 86215, "epoch": 2052} {"train_loss": -6.210901737213135, "global_step": 86216, "epoch": 2052} {"train_loss": -6.208725929260254, "global_step": 86217, "epoch": 2052} {"train_loss": -6.233442306518555, "global_step": 86218, "epoch": 2052} {"train_loss": -6.060405731201172, "global_step": 86219, "epoch": 2052} {"train_loss": -6.2456231117248535, "global_step": 86220, "epoch": 2052} {"train_loss": -6.331542015075684, "global_step": 86221, "epoch": 2052} {"train_loss": -6.212357521057129, "global_step": 86222, "epoch": 2052} {"train_loss": -6.2477617263793945, "global_step": 86223, "epoch": 2052} {"train_loss": -6.216121673583984, "global_step": 86224, "epoch": 2052} {"train_loss": -6.207947708311535, "global_step": 86225, "epoch": 2052, "val_loss": 62744.21875} {"train_loss": -6.171417236328125, "global_step": 86226, "epoch": 2053} {"train_loss": -6.2434563636779785, "global_step": 86227, "epoch": 2053} {"train_loss": -6.252138137817383, "global_step": 86228, "epoch": 2053} {"train_loss": -6.179947853088379, "global_step": 86229, "epoch": 2053} {"train_loss": -6.275787353515625, "global_step": 86230, "epoch": 2053} {"train_loss": -6.198278427124023, "global_step": 86231, "epoch": 2053} {"train_loss": -6.265727996826172, "global_step": 86232, "epoch": 2053} {"train_loss": -6.416773796081543, "global_step": 86233, "epoch": 2053} {"train_loss": -6.2304558753967285, "global_step": 86234, "epoch": 2053} {"train_loss": -6.123147964477539, "global_step": 86235, "epoch": 2053} {"train_loss": -6.2443389892578125, "global_step": 86236, "epoch": 2053} {"train_loss": -6.249688148498535, "global_step": 86237, "epoch": 2053} {"train_loss": -6.126047134399414, "global_step": 86238, "epoch": 2053} {"train_loss": -6.283787250518799, "global_step": 86239, "epoch": 2053} {"train_loss": -6.27156925201416, "global_step": 86240, "epoch": 2053} {"train_loss": -6.0623979568481445, "global_step": 86241, "epoch": 2053} {"train_loss": -6.185406684875488, "global_step": 86242, "epoch": 2053} {"train_loss": -6.138452053070068, "global_step": 86243, "epoch": 2053} {"train_loss": -6.251339912414551, "global_step": 86244, "epoch": 2053} {"train_loss": -6.226015090942383, "global_step": 86245, "epoch": 2053} {"train_loss": -6.053330421447754, "global_step": 86246, "epoch": 2053} {"train_loss": -6.22312068939209, "global_step": 86247, "epoch": 2053} {"train_loss": -6.176642894744873, "global_step": 86248, "epoch": 2053} {"train_loss": -6.186018943786621, "global_step": 86249, "epoch": 2053} {"train_loss": -6.278144836425781, "global_step": 86250, "epoch": 2053} {"train_loss": -6.1092729568481445, "global_step": 86251, "epoch": 2053} {"train_loss": -6.210237503051758, "global_step": 86252, "epoch": 2053} {"train_loss": -6.14764404296875, "global_step": 86253, "epoch": 2053} {"train_loss": -6.230690002441406, "global_step": 86254, "epoch": 2053} {"train_loss": -6.197210311889648, "global_step": 86255, "epoch": 2053} {"train_loss": -6.194443702697754, "global_step": 86256, "epoch": 2053} {"train_loss": -6.204354286193848, "global_step": 86257, "epoch": 2053} {"train_loss": -6.240464210510254, "global_step": 86258, "epoch": 2053} {"train_loss": -6.191652774810791, "global_step": 86259, "epoch": 2053} {"train_loss": -6.236438274383545, "global_step": 86260, "epoch": 2053} {"train_loss": -6.319581985473633, "global_step": 86261, "epoch": 2053} {"train_loss": -6.241335391998291, "global_step": 86262, "epoch": 2053} {"train_loss": -6.1762871742248535, "global_step": 86263, "epoch": 2053} {"train_loss": -6.22781229019165, "global_step": 86264, "epoch": 2053} {"train_loss": -6.188284397125244, "global_step": 86265, "epoch": 2053} {"train_loss": -6.172689437866211, "global_step": 86266, "epoch": 2053} {"train_loss": -6.209630864007132, "global_step": 86267, "epoch": 2053, "val_loss": 62878.72265625} {"train_loss": -6.163880825042725, "global_step": 86268, "epoch": 2054} {"train_loss": -6.236151695251465, "global_step": 86269, "epoch": 2054} {"train_loss": -6.287501335144043, "global_step": 86270, "epoch": 2054} {"train_loss": -6.271940231323242, "global_step": 86271, "epoch": 2054} {"train_loss": -6.178708553314209, "global_step": 86272, "epoch": 2054} {"train_loss": -6.117624282836914, "global_step": 86273, "epoch": 2054} {"train_loss": -6.305298805236816, "global_step": 86274, "epoch": 2054} {"train_loss": -6.289026260375977, "global_step": 86275, "epoch": 2054} {"train_loss": -6.235008239746094, "global_step": 86276, "epoch": 2054} {"train_loss": -6.26112174987793, "global_step": 86277, "epoch": 2054} {"train_loss": -6.175564289093018, "global_step": 86278, "epoch": 2054} {"train_loss": -6.045569896697998, "global_step": 86279, "epoch": 2054} {"train_loss": -6.185253143310547, "global_step": 86280, "epoch": 2054} {"train_loss": -5.943601608276367, "global_step": 86281, "epoch": 2054} {"train_loss": -6.058470726013184, "global_step": 86282, "epoch": 2054} {"train_loss": -6.191023826599121, "global_step": 86283, "epoch": 2054} {"train_loss": -6.284101486206055, "global_step": 86284, "epoch": 2054} {"train_loss": -6.165721893310547, "global_step": 86285, "epoch": 2054} {"train_loss": -6.295198917388916, "global_step": 86286, "epoch": 2054} {"train_loss": -6.164243698120117, "global_step": 86287, "epoch": 2054} {"train_loss": -6.228224754333496, "global_step": 86288, "epoch": 2054} {"train_loss": -6.371071815490723, "global_step": 86289, "epoch": 2054} {"train_loss": -6.312278747558594, "global_step": 86290, "epoch": 2054} {"train_loss": -6.2780256271362305, "global_step": 86291, "epoch": 2054} {"train_loss": -6.22065544128418, "global_step": 86292, "epoch": 2054} {"train_loss": -6.286259651184082, "global_step": 86293, "epoch": 2054} {"train_loss": -6.183011054992676, "global_step": 86294, "epoch": 2054} {"train_loss": -6.206593990325928, "global_step": 86295, "epoch": 2054} {"train_loss": -6.326391220092773, "global_step": 86296, "epoch": 2054} {"train_loss": -6.25333833694458, "global_step": 86297, "epoch": 2054} {"train_loss": -6.257164001464844, "global_step": 86298, "epoch": 2054} {"train_loss": -6.2847700119018555, "global_step": 86299, "epoch": 2054} {"train_loss": -6.213512420654297, "global_step": 86300, "epoch": 2054} {"train_loss": -6.311374187469482, "global_step": 86301, "epoch": 2054} {"train_loss": -6.3674540519714355, "global_step": 86302, "epoch": 2054} {"train_loss": -6.341567039489746, "global_step": 86303, "epoch": 2054} {"train_loss": -6.225386619567871, "global_step": 86304, "epoch": 2054} {"train_loss": -6.178096294403076, "global_step": 86305, "epoch": 2054} {"train_loss": -6.231179237365723, "global_step": 86306, "epoch": 2054} {"train_loss": -6.260326385498047, "global_step": 86307, "epoch": 2054} {"train_loss": -6.30262565612793, "global_step": 86308, "epoch": 2054} {"train_loss": -6.231208982921782, "global_step": 86309, "epoch": 2054, "val_loss": 62910.51953125} {"train_loss": -6.277989387512207, "global_step": 86310, "epoch": 2055} {"train_loss": -6.250075340270996, "global_step": 86311, "epoch": 2055} {"train_loss": -6.202489852905273, "global_step": 86312, "epoch": 2055} {"train_loss": -6.245126724243164, "global_step": 86313, "epoch": 2055} {"train_loss": -6.204972267150879, "global_step": 86314, "epoch": 2055} {"train_loss": -6.294609069824219, "global_step": 86315, "epoch": 2055} {"train_loss": -6.270936965942383, "global_step": 86316, "epoch": 2055} {"train_loss": -6.221240043640137, "global_step": 86317, "epoch": 2055} {"train_loss": -6.2447509765625, "global_step": 86318, "epoch": 2055} {"train_loss": -6.2175822257995605, "global_step": 86319, "epoch": 2055} {"train_loss": -6.0784406661987305, "global_step": 86320, "epoch": 2055} {"train_loss": -6.22281551361084, "global_step": 86321, "epoch": 2055} {"train_loss": -6.148977279663086, "global_step": 86322, "epoch": 2055} {"train_loss": -6.2233123779296875, "global_step": 86323, "epoch": 2055} {"train_loss": -6.306954860687256, "global_step": 86324, "epoch": 2055} {"train_loss": -6.296773910522461, "global_step": 86325, "epoch": 2055} {"train_loss": -6.317961692810059, "global_step": 86326, "epoch": 2055} {"train_loss": -6.109315872192383, "global_step": 86327, "epoch": 2055} {"train_loss": -6.212603569030762, "global_step": 86328, "epoch": 2055} {"train_loss": -6.157303810119629, "global_step": 86329, "epoch": 2055} {"train_loss": -6.168485641479492, "global_step": 86330, "epoch": 2055} {"train_loss": -6.364631652832031, "global_step": 86331, "epoch": 2055} {"train_loss": -6.220987319946289, "global_step": 86332, "epoch": 2055} {"train_loss": -6.186142921447754, "global_step": 86333, "epoch": 2055} {"train_loss": -6.2380876541137695, "global_step": 86334, "epoch": 2055} {"train_loss": -6.257933616638184, "global_step": 86335, "epoch": 2055} {"train_loss": -6.217768669128418, "global_step": 86336, "epoch": 2055} {"train_loss": -6.30494499206543, "global_step": 86337, "epoch": 2055} {"train_loss": -6.119664192199707, "global_step": 86338, "epoch": 2055} {"train_loss": -6.076310157775879, "global_step": 86339, "epoch": 2055} {"train_loss": -6.3047285079956055, "global_step": 86340, "epoch": 2055} {"train_loss": -6.141425132751465, "global_step": 86341, "epoch": 2055} {"train_loss": -6.114306449890137, "global_step": 86342, "epoch": 2055} {"train_loss": -6.258642196655273, "global_step": 86343, "epoch": 2055} {"train_loss": -6.085962295532227, "global_step": 86344, "epoch": 2055} {"train_loss": -6.07547664642334, "global_step": 86345, "epoch": 2055} {"train_loss": -6.115259647369385, "global_step": 86346, "epoch": 2055} {"train_loss": -6.218747615814209, "global_step": 86347, "epoch": 2055} {"train_loss": -6.2094855308532715, "global_step": 86348, "epoch": 2055} {"train_loss": -6.241495132446289, "global_step": 86349, "epoch": 2055} {"train_loss": -6.2572479248046875, "global_step": 86350, "epoch": 2055} {"train_loss": -6.21186317716326, "global_step": 86351, "epoch": 2055, "val_loss": 62909.9609375} {"train_loss": -6.194694519042969, "global_step": 86352, "epoch": 2056} {"train_loss": -6.157051086425781, "global_step": 86353, "epoch": 2056} {"train_loss": -6.2296037673950195, "global_step": 86354, "epoch": 2056} {"train_loss": -6.125736236572266, "global_step": 86355, "epoch": 2056} {"train_loss": -6.18978214263916, "global_step": 86356, "epoch": 2056} {"train_loss": -6.141024589538574, "global_step": 86357, "epoch": 2056} {"train_loss": -6.082280158996582, "global_step": 86358, "epoch": 2056} {"train_loss": -6.2662553787231445, "global_step": 86359, "epoch": 2056} {"train_loss": -6.149850845336914, "global_step": 86360, "epoch": 2056} {"train_loss": -6.267223358154297, "global_step": 86361, "epoch": 2056} {"train_loss": -6.180979251861572, "global_step": 86362, "epoch": 2056} {"train_loss": -6.02536678314209, "global_step": 86363, "epoch": 2056} {"train_loss": -6.293571949005127, "global_step": 86364, "epoch": 2056} {"train_loss": -6.1926374435424805, "global_step": 86365, "epoch": 2056} {"train_loss": -6.130152702331543, "global_step": 86366, "epoch": 2056} {"train_loss": -6.135045051574707, "global_step": 86367, "epoch": 2056} {"train_loss": -6.061362266540527, "global_step": 86368, "epoch": 2056} {"train_loss": -6.136269569396973, "global_step": 86369, "epoch": 2056} {"train_loss": -6.242547988891602, "global_step": 86370, "epoch": 2056} {"train_loss": -6.065830707550049, "global_step": 86371, "epoch": 2056} {"train_loss": -6.157557487487793, "global_step": 86372, "epoch": 2056} {"train_loss": -6.271672248840332, "global_step": 86373, "epoch": 2056} {"train_loss": -6.18484354019165, "global_step": 86374, "epoch": 2056} {"train_loss": -6.269575595855713, "global_step": 86375, "epoch": 2056} {"train_loss": -6.212054252624512, "global_step": 86376, "epoch": 2056} {"train_loss": -6.13031005859375, "global_step": 86377, "epoch": 2056} {"train_loss": -6.277383804321289, "global_step": 86378, "epoch": 2056} {"train_loss": -6.08737850189209, "global_step": 86379, "epoch": 2056} {"train_loss": -6.234323024749756, "global_step": 86380, "epoch": 2056} {"train_loss": -6.167341232299805, "global_step": 86381, "epoch": 2056} {"train_loss": -6.1554670333862305, "global_step": 86382, "epoch": 2056} {"train_loss": -6.234015464782715, "global_step": 86383, "epoch": 2056} {"train_loss": -6.190077781677246, "global_step": 86384, "epoch": 2056} {"train_loss": -6.140225887298584, "global_step": 86385, "epoch": 2056} {"train_loss": -6.186841011047363, "global_step": 86386, "epoch": 2056} {"train_loss": -6.142867565155029, "global_step": 86387, "epoch": 2056} {"train_loss": -6.228900909423828, "global_step": 86388, "epoch": 2056} {"train_loss": -6.105027675628662, "global_step": 86389, "epoch": 2056} {"train_loss": -6.167802810668945, "global_step": 86390, "epoch": 2056} {"train_loss": -6.220386505126953, "global_step": 86391, "epoch": 2056} {"train_loss": -6.2188310623168945, "global_step": 86392, "epoch": 2056} {"train_loss": -6.174905322846913, "global_step": 86393, "epoch": 2056, "val_loss": 62996.08984375} {"train_loss": -6.071297645568848, "global_step": 86394, "epoch": 2057} {"train_loss": -6.338790416717529, "global_step": 86395, "epoch": 2057} {"train_loss": -6.253604888916016, "global_step": 86396, "epoch": 2057} {"train_loss": -6.255551815032959, "global_step": 86397, "epoch": 2057} {"train_loss": -6.292813301086426, "global_step": 86398, "epoch": 2057} {"train_loss": -6.311129570007324, "global_step": 86399, "epoch": 2057} {"train_loss": -6.286646842956543, "global_step": 86400, "epoch": 2057} {"train_loss": -6.237700462341309, "global_step": 86401, "epoch": 2057} {"train_loss": -6.139631271362305, "global_step": 86402, "epoch": 2057} {"train_loss": -6.259677410125732, "global_step": 86403, "epoch": 2057} {"train_loss": -6.213336944580078, "global_step": 86404, "epoch": 2057} {"train_loss": -6.308916091918945, "global_step": 86405, "epoch": 2057} {"train_loss": -6.184791564941406, "global_step": 86406, "epoch": 2057} {"train_loss": -6.091670036315918, "global_step": 86407, "epoch": 2057} {"train_loss": -6.176224708557129, "global_step": 86408, "epoch": 2057} {"train_loss": -6.359679222106934, "global_step": 86409, "epoch": 2057} {"train_loss": -6.251792907714844, "global_step": 86410, "epoch": 2057} {"train_loss": -6.137659549713135, "global_step": 86411, "epoch": 2057} {"train_loss": -6.227178573608398, "global_step": 86412, "epoch": 2057} {"train_loss": -6.1154937744140625, "global_step": 86413, "epoch": 2057} {"train_loss": -6.139104843139648, "global_step": 86414, "epoch": 2057} {"train_loss": -6.117274284362793, "global_step": 86415, "epoch": 2057} {"train_loss": -6.212447166442871, "global_step": 86416, "epoch": 2057} {"train_loss": -6.255985260009766, "global_step": 86417, "epoch": 2057} {"train_loss": -6.13517951965332, "global_step": 86418, "epoch": 2057} {"train_loss": -6.246964454650879, "global_step": 86419, "epoch": 2057} {"train_loss": -6.208863258361816, "global_step": 86420, "epoch": 2057} {"train_loss": -6.158364295959473, "global_step": 86421, "epoch": 2057} {"train_loss": -6.1102142333984375, "global_step": 86422, "epoch": 2057} {"train_loss": -6.1844635009765625, "global_step": 86423, "epoch": 2057} {"train_loss": -6.3326849937438965, "global_step": 86424, "epoch": 2057} {"train_loss": -6.198714733123779, "global_step": 86425, "epoch": 2057} {"train_loss": -6.245269775390625, "global_step": 86426, "epoch": 2057} {"train_loss": -6.118646144866943, "global_step": 86427, "epoch": 2057} {"train_loss": -6.2761454582214355, "global_step": 86428, "epoch": 2057} {"train_loss": -6.221095085144043, "global_step": 86429, "epoch": 2057} {"train_loss": -6.159395217895508, "global_step": 86430, "epoch": 2057} {"train_loss": -6.113363265991211, "global_step": 86431, "epoch": 2057} {"train_loss": -6.18276309967041, "global_step": 86432, "epoch": 2057} {"train_loss": -6.282609939575195, "global_step": 86433, "epoch": 2057} {"train_loss": -6.212982177734375, "global_step": 86434, "epoch": 2057} {"train_loss": -6.210559220541091, "global_step": 86435, "epoch": 2057, "val_loss": 62569.65234375} {"train_loss": -6.205173492431641, "global_step": 86436, "epoch": 2058} {"train_loss": -6.135031700134277, "global_step": 86437, "epoch": 2058} {"train_loss": -6.230485439300537, "global_step": 86438, "epoch": 2058} {"train_loss": -6.326167583465576, "global_step": 86439, "epoch": 2058} {"train_loss": -6.301654815673828, "global_step": 86440, "epoch": 2058} {"train_loss": -6.2225422859191895, "global_step": 86441, "epoch": 2058} {"train_loss": -6.191266059875488, "global_step": 86442, "epoch": 2058} {"train_loss": -6.2630767822265625, "global_step": 86443, "epoch": 2058} {"train_loss": -6.300046920776367, "global_step": 86444, "epoch": 2058} {"train_loss": -6.216279029846191, "global_step": 86445, "epoch": 2058} {"train_loss": -6.155889987945557, "global_step": 86446, "epoch": 2058} {"train_loss": -6.272749900817871, "global_step": 86447, "epoch": 2058} {"train_loss": -6.295234680175781, "global_step": 86448, "epoch": 2058} {"train_loss": -6.230075836181641, "global_step": 86449, "epoch": 2058} {"train_loss": -6.212100028991699, "global_step": 86450, "epoch": 2058} {"train_loss": -6.297074317932129, "global_step": 86451, "epoch": 2058} {"train_loss": -6.327060222625732, "global_step": 86452, "epoch": 2058} {"train_loss": -6.218326091766357, "global_step": 86453, "epoch": 2058} {"train_loss": -6.209019184112549, "global_step": 86454, "epoch": 2058} {"train_loss": -6.227977752685547, "global_step": 86455, "epoch": 2058} {"train_loss": -6.210224151611328, "global_step": 86456, "epoch": 2058} {"train_loss": -6.182889938354492, "global_step": 86457, "epoch": 2058} {"train_loss": -6.232051849365234, "global_step": 86458, "epoch": 2058} {"train_loss": -6.224275588989258, "global_step": 86459, "epoch": 2058} {"train_loss": -6.180872917175293, "global_step": 86460, "epoch": 2058} {"train_loss": -6.230882167816162, "global_step": 86461, "epoch": 2058} {"train_loss": -6.302115440368652, "global_step": 86462, "epoch": 2058} {"train_loss": -6.138725280761719, "global_step": 86463, "epoch": 2058} {"train_loss": -6.258732318878174, "global_step": 86464, "epoch": 2058} {"train_loss": -6.253519058227539, "global_step": 86465, "epoch": 2058} {"train_loss": -6.230412483215332, "global_step": 86466, "epoch": 2058} {"train_loss": -6.174023628234863, "global_step": 86467, "epoch": 2058} {"train_loss": -6.235605239868164, "global_step": 86468, "epoch": 2058} {"train_loss": -6.225632667541504, "global_step": 86469, "epoch": 2058} {"train_loss": -6.156798362731934, "global_step": 86470, "epoch": 2058} {"train_loss": -6.260285377502441, "global_step": 86471, "epoch": 2058} {"train_loss": -6.176248550415039, "global_step": 86472, "epoch": 2058} {"train_loss": -6.150306224822998, "global_step": 86473, "epoch": 2058} {"train_loss": -6.213214874267578, "global_step": 86474, "epoch": 2058} {"train_loss": -6.185311317443848, "global_step": 86475, "epoch": 2058} {"train_loss": -6.183506965637207, "global_step": 86476, "epoch": 2058} {"train_loss": -6.225196270715623, "global_step": 86477, "epoch": 2058, "val_loss": 62919.234375} {"train_loss": -6.102646827697754, "global_step": 86478, "epoch": 2059} {"train_loss": -6.130273818969727, "global_step": 86479, "epoch": 2059} {"train_loss": -6.1034345626831055, "global_step": 86480, "epoch": 2059} {"train_loss": -6.358495712280273, "global_step": 86481, "epoch": 2059} {"train_loss": -6.052939414978027, "global_step": 86482, "epoch": 2059} {"train_loss": -6.1687726974487305, "global_step": 86483, "epoch": 2059} {"train_loss": -6.129817962646484, "global_step": 86484, "epoch": 2059} {"train_loss": -6.033322334289551, "global_step": 86485, "epoch": 2059} {"train_loss": -6.215229511260986, "global_step": 86486, "epoch": 2059} {"train_loss": -6.213262557983398, "global_step": 86487, "epoch": 2059} {"train_loss": -6.101693630218506, "global_step": 86488, "epoch": 2059} {"train_loss": -6.178692817687988, "global_step": 86489, "epoch": 2059} {"train_loss": -6.202089309692383, "global_step": 86490, "epoch": 2059} {"train_loss": -6.069242477416992, "global_step": 86491, "epoch": 2059} {"train_loss": -6.2223381996154785, "global_step": 86492, "epoch": 2059} {"train_loss": -6.159379959106445, "global_step": 86493, "epoch": 2059} {"train_loss": -6.242420673370361, "global_step": 86494, "epoch": 2059} {"train_loss": -6.1840715408325195, "global_step": 86495, "epoch": 2059} {"train_loss": -6.1296281814575195, "global_step": 86496, "epoch": 2059} {"train_loss": -6.154642581939697, "global_step": 86497, "epoch": 2059} {"train_loss": -6.150200843811035, "global_step": 86498, "epoch": 2059} {"train_loss": -6.210991382598877, "global_step": 86499, "epoch": 2059} {"train_loss": -6.0581560134887695, "global_step": 86500, "epoch": 2059} {"train_loss": -6.247374534606934, "global_step": 86501, "epoch": 2059} {"train_loss": -6.028830051422119, "global_step": 86502, "epoch": 2059} {"train_loss": -6.108098983764648, "global_step": 86503, "epoch": 2059} {"train_loss": -6.198798656463623, "global_step": 86504, "epoch": 2059} {"train_loss": -6.07606840133667, "global_step": 86505, "epoch": 2059} {"train_loss": -6.095313549041748, "global_step": 86506, "epoch": 2059} {"train_loss": -5.981292724609375, "global_step": 86507, "epoch": 2059} {"train_loss": -6.075895309448242, "global_step": 86508, "epoch": 2059} {"train_loss": -6.171713829040527, "global_step": 86509, "epoch": 2059} {"train_loss": -6.162267684936523, "global_step": 86510, "epoch": 2059} {"train_loss": -6.154479503631592, "global_step": 86511, "epoch": 2059} {"train_loss": -6.262683391571045, "global_step": 86512, "epoch": 2059} {"train_loss": -6.281338691711426, "global_step": 86513, "epoch": 2059} {"train_loss": -6.359996795654297, "global_step": 86514, "epoch": 2059} {"train_loss": -6.1920928955078125, "global_step": 86515, "epoch": 2059} {"train_loss": -6.150117874145508, "global_step": 86516, "epoch": 2059} {"train_loss": -6.321189880371094, "global_step": 86517, "epoch": 2059} {"train_loss": -6.181164741516113, "global_step": 86518, "epoch": 2059} {"train_loss": -6.165843100774856, "global_step": 86519, "epoch": 2059, "val_loss": 62816.6328125} {"train_loss": -6.0878753662109375, "global_step": 86520, "epoch": 2060} {"train_loss": -6.267000675201416, "global_step": 86521, "epoch": 2060} {"train_loss": -6.269025802612305, "global_step": 86522, "epoch": 2060} {"train_loss": -6.187321662902832, "global_step": 86523, "epoch": 2060} {"train_loss": -6.292277812957764, "global_step": 86524, "epoch": 2060} {"train_loss": -6.217381477355957, "global_step": 86525, "epoch": 2060} {"train_loss": -6.167906761169434, "global_step": 86526, "epoch": 2060} {"train_loss": -6.268964767456055, "global_step": 86527, "epoch": 2060} {"train_loss": -6.1318535804748535, "global_step": 86528, "epoch": 2060} {"train_loss": -6.358444690704346, "global_step": 86529, "epoch": 2060} {"train_loss": -6.220691680908203, "global_step": 86530, "epoch": 2060} {"train_loss": -6.253809452056885, "global_step": 86531, "epoch": 2060} {"train_loss": -6.266180992126465, "global_step": 86532, "epoch": 2060} {"train_loss": -6.150069236755371, "global_step": 86533, "epoch": 2060} {"train_loss": -6.286384582519531, "global_step": 86534, "epoch": 2060} {"train_loss": -6.222517013549805, "global_step": 86535, "epoch": 2060} {"train_loss": -6.238442420959473, "global_step": 86536, "epoch": 2060} {"train_loss": -6.329709529876709, "global_step": 86537, "epoch": 2060} {"train_loss": -6.233575820922852, "global_step": 86538, "epoch": 2060} {"train_loss": -6.276806831359863, "global_step": 86539, "epoch": 2060} {"train_loss": -6.264734268188477, "global_step": 86540, "epoch": 2060} {"train_loss": -6.30955171585083, "global_step": 86541, "epoch": 2060} {"train_loss": -6.242209434509277, "global_step": 86542, "epoch": 2060} {"train_loss": -6.234312534332275, "global_step": 86543, "epoch": 2060} {"train_loss": -6.375954627990723, "global_step": 86544, "epoch": 2060} {"train_loss": -6.303857326507568, "global_step": 86545, "epoch": 2060} {"train_loss": -6.141790390014648, "global_step": 86546, "epoch": 2060} {"train_loss": -6.208291053771973, "global_step": 86547, "epoch": 2060} {"train_loss": -6.213421821594238, "global_step": 86548, "epoch": 2060} {"train_loss": -6.221269607543945, "global_step": 86549, "epoch": 2060} {"train_loss": -6.334699630737305, "global_step": 86550, "epoch": 2060} {"train_loss": -6.311460494995117, "global_step": 86551, "epoch": 2060} {"train_loss": -6.313281059265137, "global_step": 86552, "epoch": 2060} {"train_loss": -6.346189498901367, "global_step": 86553, "epoch": 2060} {"train_loss": -6.277122974395752, "global_step": 86554, "epoch": 2060} {"train_loss": -6.247627258300781, "global_step": 86555, "epoch": 2060} {"train_loss": -6.265576362609863, "global_step": 86556, "epoch": 2060} {"train_loss": -6.2393412590026855, "global_step": 86557, "epoch": 2060} {"train_loss": -6.174647331237793, "global_step": 86558, "epoch": 2060} {"train_loss": -6.417351722717285, "global_step": 86559, "epoch": 2060} {"train_loss": -6.259692668914795, "global_step": 86560, "epoch": 2060} {"train_loss": -6.252198855082194, "global_step": 86561, "epoch": 2060, "val_loss": 62699.1875} {"train_loss": -6.327004909515381, "global_step": 86562, "epoch": 2061} {"train_loss": -6.226569175720215, "global_step": 86563, "epoch": 2061} {"train_loss": -6.169848918914795, "global_step": 86564, "epoch": 2061} {"train_loss": -6.280703544616699, "global_step": 86565, "epoch": 2061} {"train_loss": -6.216670036315918, "global_step": 86566, "epoch": 2061} {"train_loss": -6.166914939880371, "global_step": 86567, "epoch": 2061} {"train_loss": -6.264422416687012, "global_step": 86568, "epoch": 2061} {"train_loss": -6.288580894470215, "global_step": 86569, "epoch": 2061} {"train_loss": -6.291770935058594, "global_step": 86570, "epoch": 2061} {"train_loss": -6.156768321990967, "global_step": 86571, "epoch": 2061} {"train_loss": -6.227993488311768, "global_step": 86572, "epoch": 2061} {"train_loss": -6.330077171325684, "global_step": 86573, "epoch": 2061} {"train_loss": -6.203880310058594, "global_step": 86574, "epoch": 2061} {"train_loss": -6.281440258026123, "global_step": 86575, "epoch": 2061} {"train_loss": -6.122157096862793, "global_step": 86576, "epoch": 2061} {"train_loss": -6.317078590393066, "global_step": 86577, "epoch": 2061} {"train_loss": -6.3081865310668945, "global_step": 86578, "epoch": 2061} {"train_loss": -6.183083534240723, "global_step": 86579, "epoch": 2061} {"train_loss": -6.188271999359131, "global_step": 86580, "epoch": 2061} {"train_loss": -6.168180465698242, "global_step": 86581, "epoch": 2061} {"train_loss": -6.151701927185059, "global_step": 86582, "epoch": 2061} {"train_loss": -6.287289142608643, "global_step": 86583, "epoch": 2061} {"train_loss": -6.083181381225586, "global_step": 86584, "epoch": 2061} {"train_loss": -6.249728202819824, "global_step": 86585, "epoch": 2061} {"train_loss": -6.19814395904541, "global_step": 86586, "epoch": 2061} {"train_loss": -6.1546430587768555, "global_step": 86587, "epoch": 2061} {"train_loss": -6.238786220550537, "global_step": 86588, "epoch": 2061} {"train_loss": -6.244442939758301, "global_step": 86589, "epoch": 2061} {"train_loss": -6.1918206214904785, "global_step": 86590, "epoch": 2061} {"train_loss": -6.292218208312988, "global_step": 86591, "epoch": 2061} {"train_loss": -6.2984209060668945, "global_step": 86592, "epoch": 2061} {"train_loss": -6.2389092445373535, "global_step": 86593, "epoch": 2061} {"train_loss": -6.1680684089660645, "global_step": 86594, "epoch": 2061} {"train_loss": -6.238772392272949, "global_step": 86595, "epoch": 2061} {"train_loss": -6.272634983062744, "global_step": 86596, "epoch": 2061} {"train_loss": -6.287471294403076, "global_step": 86597, "epoch": 2061} {"train_loss": -6.122068405151367, "global_step": 86598, "epoch": 2061} {"train_loss": -6.309665679931641, "global_step": 86599, "epoch": 2061} {"train_loss": -6.313379287719727, "global_step": 86600, "epoch": 2061} {"train_loss": -6.166147232055664, "global_step": 86601, "epoch": 2061} {"train_loss": -6.319363117218018, "global_step": 86602, "epoch": 2061} {"train_loss": -6.232874813533964, "global_step": 86603, "epoch": 2061, "val_loss": 62714.37109375} {"train_loss": -6.185046672821045, "global_step": 86604, "epoch": 2062} {"train_loss": -6.315347671508789, "global_step": 86605, "epoch": 2062} {"train_loss": -6.146446228027344, "global_step": 86606, "epoch": 2062} {"train_loss": -6.187047958374023, "global_step": 86607, "epoch": 2062} {"train_loss": -6.2920098304748535, "global_step": 86608, "epoch": 2062} {"train_loss": -6.206351280212402, "global_step": 86609, "epoch": 2062} {"train_loss": -6.235632419586182, "global_step": 86610, "epoch": 2062} {"train_loss": -6.136791229248047, "global_step": 86611, "epoch": 2062} {"train_loss": -6.154613018035889, "global_step": 86612, "epoch": 2062} {"train_loss": -6.200456619262695, "global_step": 86613, "epoch": 2062} {"train_loss": -6.191300392150879, "global_step": 86614, "epoch": 2062} {"train_loss": -6.312496185302734, "global_step": 86615, "epoch": 2062} {"train_loss": -6.154436111450195, "global_step": 86616, "epoch": 2062} {"train_loss": -6.237296104431152, "global_step": 86617, "epoch": 2062} {"train_loss": -6.280788898468018, "global_step": 86618, "epoch": 2062} {"train_loss": -6.099426746368408, "global_step": 86619, "epoch": 2062} {"train_loss": -6.289600372314453, "global_step": 86620, "epoch": 2062} {"train_loss": -6.260833740234375, "global_step": 86621, "epoch": 2062} {"train_loss": -6.2585129737854, "global_step": 86622, "epoch": 2062} {"train_loss": -6.06577730178833, "global_step": 86623, "epoch": 2062} {"train_loss": -6.21626615524292, "global_step": 86624, "epoch": 2062} {"train_loss": -6.287137031555176, "global_step": 86625, "epoch": 2062} {"train_loss": -6.201786041259766, "global_step": 86626, "epoch": 2062} {"train_loss": -6.262340545654297, "global_step": 86627, "epoch": 2062} {"train_loss": -6.321622371673584, "global_step": 86628, "epoch": 2062} {"train_loss": -6.223438739776611, "global_step": 86629, "epoch": 2062} {"train_loss": -6.198625564575195, "global_step": 86630, "epoch": 2062} {"train_loss": -6.210750579833984, "global_step": 86631, "epoch": 2062} {"train_loss": -6.237029075622559, "global_step": 86632, "epoch": 2062} {"train_loss": -6.266885757446289, "global_step": 86633, "epoch": 2062} {"train_loss": -6.160686016082764, "global_step": 86634, "epoch": 2062} {"train_loss": -6.220819473266602, "global_step": 86635, "epoch": 2062} {"train_loss": -6.286019325256348, "global_step": 86636, "epoch": 2062} {"train_loss": -6.067282199859619, "global_step": 86637, "epoch": 2062} {"train_loss": -6.1641693115234375, "global_step": 86638, "epoch": 2062} {"train_loss": -6.253866672515869, "global_step": 86639, "epoch": 2062} {"train_loss": -6.165637493133545, "global_step": 86640, "epoch": 2062} {"train_loss": -6.223685264587402, "global_step": 86641, "epoch": 2062} {"train_loss": -6.270753383636475, "global_step": 86642, "epoch": 2062} {"train_loss": -6.149924278259277, "global_step": 86643, "epoch": 2062} {"train_loss": -6.2942795753479, "global_step": 86644, "epoch": 2062} {"train_loss": -6.214504128410702, "global_step": 86645, "epoch": 2062, "val_loss": 62728.765625} {"train_loss": -6.341746807098389, "global_step": 86646, "epoch": 2063} {"train_loss": -6.303030967712402, "global_step": 86647, "epoch": 2063} {"train_loss": -6.094021320343018, "global_step": 86648, "epoch": 2063} {"train_loss": -6.249168872833252, "global_step": 86649, "epoch": 2063} {"train_loss": -6.217617988586426, "global_step": 86650, "epoch": 2063} {"train_loss": -6.233097076416016, "global_step": 86651, "epoch": 2063} {"train_loss": -6.163372039794922, "global_step": 86652, "epoch": 2063} {"train_loss": -6.091580867767334, "global_step": 86653, "epoch": 2063} {"train_loss": -6.08160924911499, "global_step": 86654, "epoch": 2063} {"train_loss": -6.097330570220947, "global_step": 86655, "epoch": 2063} {"train_loss": -6.124333381652832, "global_step": 86656, "epoch": 2063} {"train_loss": -6.086406707763672, "global_step": 86657, "epoch": 2063} {"train_loss": -6.089799404144287, "global_step": 86658, "epoch": 2063} {"train_loss": -6.230865478515625, "global_step": 86659, "epoch": 2063} {"train_loss": -6.081897735595703, "global_step": 86660, "epoch": 2063} {"train_loss": -6.159535884857178, "global_step": 86661, "epoch": 2063} {"train_loss": -6.182687759399414, "global_step": 86662, "epoch": 2063} {"train_loss": -6.24815559387207, "global_step": 86663, "epoch": 2063} {"train_loss": -6.11590576171875, "global_step": 86664, "epoch": 2063} {"train_loss": -6.244516372680664, "global_step": 86665, "epoch": 2063} {"train_loss": -6.184611797332764, "global_step": 86666, "epoch": 2063} {"train_loss": -6.2564473152160645, "global_step": 86667, "epoch": 2063} {"train_loss": -6.180763244628906, "global_step": 86668, "epoch": 2063} {"train_loss": -6.301156997680664, "global_step": 86669, "epoch": 2063} {"train_loss": -6.1840925216674805, "global_step": 86670, "epoch": 2063} {"train_loss": -6.314243316650391, "global_step": 86671, "epoch": 2063} {"train_loss": -6.165402889251709, "global_step": 86672, "epoch": 2063} {"train_loss": -6.18491268157959, "global_step": 86673, "epoch": 2063} {"train_loss": -6.221070766448975, "global_step": 86674, "epoch": 2063} {"train_loss": -6.156759738922119, "global_step": 86675, "epoch": 2063} {"train_loss": -6.276777267456055, "global_step": 86676, "epoch": 2063} {"train_loss": -6.2112135887146, "global_step": 86677, "epoch": 2063} {"train_loss": -6.205273628234863, "global_step": 86678, "epoch": 2063} {"train_loss": -6.276251316070557, "global_step": 86679, "epoch": 2063} {"train_loss": -6.154415607452393, "global_step": 86680, "epoch": 2063} {"train_loss": -6.286334991455078, "global_step": 86681, "epoch": 2063} {"train_loss": -6.190038204193115, "global_step": 86682, "epoch": 2063} {"train_loss": -6.145779609680176, "global_step": 86683, "epoch": 2063} {"train_loss": -6.151861190795898, "global_step": 86684, "epoch": 2063} {"train_loss": -6.233403205871582, "global_step": 86685, "epoch": 2063} {"train_loss": -6.091261863708496, "global_step": 86686, "epoch": 2063} {"train_loss": -6.189153886976696, "global_step": 86687, "epoch": 2063, "val_loss": 62734.890625} {"train_loss": -6.023216247558594, "global_step": 86688, "epoch": 2064} {"train_loss": -6.137307167053223, "global_step": 86689, "epoch": 2064} {"train_loss": -6.279320240020752, "global_step": 86690, "epoch": 2064} {"train_loss": -6.2844743728637695, "global_step": 86691, "epoch": 2064} {"train_loss": -6.185609340667725, "global_step": 86692, "epoch": 2064} {"train_loss": -6.222490310668945, "global_step": 86693, "epoch": 2064} {"train_loss": -6.185603141784668, "global_step": 86694, "epoch": 2064} {"train_loss": -6.168139457702637, "global_step": 86695, "epoch": 2064} {"train_loss": -6.200357913970947, "global_step": 86696, "epoch": 2064} {"train_loss": -6.32981538772583, "global_step": 86697, "epoch": 2064} {"train_loss": -6.283751487731934, "global_step": 86698, "epoch": 2064} {"train_loss": -6.239317893981934, "global_step": 86699, "epoch": 2064} {"train_loss": -6.222062110900879, "global_step": 86700, "epoch": 2064} {"train_loss": -6.0208539962768555, "global_step": 86701, "epoch": 2064} {"train_loss": -6.146931171417236, "global_step": 86702, "epoch": 2064} {"train_loss": -6.217853546142578, "global_step": 86703, "epoch": 2064} {"train_loss": -6.2057085037231445, "global_step": 86704, "epoch": 2064} {"train_loss": -6.283426284790039, "global_step": 86705, "epoch": 2064} {"train_loss": -6.240124702453613, "global_step": 86706, "epoch": 2064} {"train_loss": -6.077381134033203, "global_step": 86707, "epoch": 2064} {"train_loss": -6.1757001876831055, "global_step": 86708, "epoch": 2064} {"train_loss": -6.155406951904297, "global_step": 86709, "epoch": 2064} {"train_loss": -6.097059726715088, "global_step": 86710, "epoch": 2064} {"train_loss": -6.191742897033691, "global_step": 86711, "epoch": 2064} {"train_loss": -6.183470726013184, "global_step": 86712, "epoch": 2064} {"train_loss": -6.207178115844727, "global_step": 86713, "epoch": 2064} {"train_loss": -6.335304260253906, "global_step": 86714, "epoch": 2064} {"train_loss": -6.138967990875244, "global_step": 86715, "epoch": 2064} {"train_loss": -6.214154243469238, "global_step": 86716, "epoch": 2064} {"train_loss": -6.2322187423706055, "global_step": 86717, "epoch": 2064} {"train_loss": -6.271249771118164, "global_step": 86718, "epoch": 2064} {"train_loss": -6.209682941436768, "global_step": 86719, "epoch": 2064} {"train_loss": -6.171029567718506, "global_step": 86720, "epoch": 2064} {"train_loss": -6.114424705505371, "global_step": 86721, "epoch": 2064} {"train_loss": -6.272093772888184, "global_step": 86722, "epoch": 2064} {"train_loss": -6.171782493591309, "global_step": 86723, "epoch": 2064} {"train_loss": -6.13001823425293, "global_step": 86724, "epoch": 2064} {"train_loss": -6.278784275054932, "global_step": 86725, "epoch": 2064} {"train_loss": -6.211910247802734, "global_step": 86726, "epoch": 2064} {"train_loss": -6.270565032958984, "global_step": 86727, "epoch": 2064} {"train_loss": -6.2446112632751465, "global_step": 86728, "epoch": 2064} {"train_loss": -6.199996743883405, "global_step": 86729, "epoch": 2064, "val_loss": 62977.45703125} {"train_loss": -6.13559627532959, "global_step": 86730, "epoch": 2065} {"train_loss": -6.231894493103027, "global_step": 86731, "epoch": 2065} {"train_loss": -6.186460971832275, "global_step": 86732, "epoch": 2065} {"train_loss": -6.187066078186035, "global_step": 86733, "epoch": 2065} {"train_loss": -6.158049583435059, "global_step": 86734, "epoch": 2065} {"train_loss": -6.213751792907715, "global_step": 86735, "epoch": 2065} {"train_loss": -6.249621391296387, "global_step": 86736, "epoch": 2065} {"train_loss": -6.171028137207031, "global_step": 86737, "epoch": 2065} {"train_loss": -6.196451187133789, "global_step": 86738, "epoch": 2065} {"train_loss": -6.214081764221191, "global_step": 86739, "epoch": 2065} {"train_loss": -6.188525676727295, "global_step": 86740, "epoch": 2065} {"train_loss": -6.239282608032227, "global_step": 86741, "epoch": 2065} {"train_loss": -6.169029235839844, "global_step": 86742, "epoch": 2065} {"train_loss": -6.183990478515625, "global_step": 86743, "epoch": 2065} {"train_loss": -6.103890419006348, "global_step": 86744, "epoch": 2065} {"train_loss": -6.122692108154297, "global_step": 86745, "epoch": 2065} {"train_loss": -6.257266998291016, "global_step": 86746, "epoch": 2065} {"train_loss": -6.266007423400879, "global_step": 86747, "epoch": 2065} {"train_loss": -6.1940717697143555, "global_step": 86748, "epoch": 2065} {"train_loss": -6.234487533569336, "global_step": 86749, "epoch": 2065} {"train_loss": -6.175929069519043, "global_step": 86750, "epoch": 2065} {"train_loss": -6.1263933181762695, "global_step": 86751, "epoch": 2065} {"train_loss": -6.1372480392456055, "global_step": 86752, "epoch": 2065} {"train_loss": -6.223484992980957, "global_step": 86753, "epoch": 2065} {"train_loss": -6.26491641998291, "global_step": 86754, "epoch": 2065} {"train_loss": -6.1933488845825195, "global_step": 86755, "epoch": 2065} {"train_loss": -6.314942359924316, "global_step": 86756, "epoch": 2065} {"train_loss": -6.151375770568848, "global_step": 86757, "epoch": 2065} {"train_loss": -6.091762542724609, "global_step": 86758, "epoch": 2065} {"train_loss": -6.259149074554443, "global_step": 86759, "epoch": 2065} {"train_loss": -6.303798675537109, "global_step": 86760, "epoch": 2065} {"train_loss": -6.248321533203125, "global_step": 86761, "epoch": 2065} {"train_loss": -6.271036624908447, "global_step": 86762, "epoch": 2065} {"train_loss": -6.326766014099121, "global_step": 86763, "epoch": 2065} {"train_loss": -6.225905418395996, "global_step": 86764, "epoch": 2065} {"train_loss": -6.2103071212768555, "global_step": 86765, "epoch": 2065} {"train_loss": -6.2644147872924805, "global_step": 86766, "epoch": 2065} {"train_loss": -6.227729320526123, "global_step": 86767, "epoch": 2065} {"train_loss": -6.203478813171387, "global_step": 86768, "epoch": 2065} {"train_loss": -6.13160514831543, "global_step": 86769, "epoch": 2065} {"train_loss": -6.4006242752075195, "global_step": 86770, "epoch": 2065} {"train_loss": -6.212008862268357, "global_step": 86771, "epoch": 2065, "val_loss": 62686.859375} {"train_loss": -6.20468807220459, "global_step": 86772, "epoch": 2066} {"train_loss": -6.308010578155518, "global_step": 86773, "epoch": 2066} {"train_loss": -6.305397987365723, "global_step": 86774, "epoch": 2066} {"train_loss": -6.181805610656738, "global_step": 86775, "epoch": 2066} {"train_loss": -6.28551721572876, "global_step": 86776, "epoch": 2066} {"train_loss": -6.265056133270264, "global_step": 86777, "epoch": 2066} {"train_loss": -6.097403526306152, "global_step": 86778, "epoch": 2066} {"train_loss": -6.209724426269531, "global_step": 86779, "epoch": 2066} {"train_loss": -6.259516716003418, "global_step": 86780, "epoch": 2066} {"train_loss": -6.215916156768799, "global_step": 86781, "epoch": 2066} {"train_loss": -6.295831680297852, "global_step": 86782, "epoch": 2066} {"train_loss": -6.417477607727051, "global_step": 86783, "epoch": 2066} {"train_loss": -6.221574783325195, "global_step": 86784, "epoch": 2066} {"train_loss": -6.260405540466309, "global_step": 86785, "epoch": 2066} {"train_loss": -6.215559005737305, "global_step": 86786, "epoch": 2066} {"train_loss": -6.184878349304199, "global_step": 86787, "epoch": 2066} {"train_loss": -6.2027506828308105, "global_step": 86788, "epoch": 2066} {"train_loss": -6.216460227966309, "global_step": 86789, "epoch": 2066} {"train_loss": -6.354981422424316, "global_step": 86790, "epoch": 2066} {"train_loss": -6.198636531829834, "global_step": 86791, "epoch": 2066} {"train_loss": -6.239723205566406, "global_step": 86792, "epoch": 2066} {"train_loss": -6.177616596221924, "global_step": 86793, "epoch": 2066} {"train_loss": -6.251555919647217, "global_step": 86794, "epoch": 2066} {"train_loss": -6.133571624755859, "global_step": 86795, "epoch": 2066} {"train_loss": -6.35723876953125, "global_step": 86796, "epoch": 2066} {"train_loss": -6.212286472320557, "global_step": 86797, "epoch": 2066} {"train_loss": -6.322805404663086, "global_step": 86798, "epoch": 2066} {"train_loss": -6.188033103942871, "global_step": 86799, "epoch": 2066} {"train_loss": -6.327402591705322, "global_step": 86800, "epoch": 2066} {"train_loss": -6.3370161056518555, "global_step": 86801, "epoch": 2066} {"train_loss": -6.274893760681152, "global_step": 86802, "epoch": 2066} {"train_loss": -6.220733642578125, "global_step": 86803, "epoch": 2066} {"train_loss": -6.198519706726074, "global_step": 86804, "epoch": 2066} {"train_loss": -6.324361801147461, "global_step": 86805, "epoch": 2066} {"train_loss": -6.228611469268799, "global_step": 86806, "epoch": 2066} {"train_loss": -6.285550117492676, "global_step": 86807, "epoch": 2066} {"train_loss": -6.272076606750488, "global_step": 86808, "epoch": 2066} {"train_loss": -6.232755661010742, "global_step": 86809, "epoch": 2066} {"train_loss": -6.208495140075684, "global_step": 86810, "epoch": 2066} {"train_loss": -6.256691932678223, "global_step": 86811, "epoch": 2066} {"train_loss": -6.201995372772217, "global_step": 86812, "epoch": 2066} {"train_loss": -6.251102731341407, "global_step": 86813, "epoch": 2066, "val_loss": 62903.11328125} {"train_loss": -6.178950309753418, "global_step": 86814, "epoch": 2067} {"train_loss": -6.235261917114258, "global_step": 86815, "epoch": 2067} {"train_loss": -6.164771556854248, "global_step": 86816, "epoch": 2067} {"train_loss": -6.191725730895996, "global_step": 86817, "epoch": 2067} {"train_loss": -6.262633323669434, "global_step": 86818, "epoch": 2067} {"train_loss": -6.22627592086792, "global_step": 86819, "epoch": 2067} {"train_loss": -6.36746883392334, "global_step": 86820, "epoch": 2067} {"train_loss": -6.288431167602539, "global_step": 86821, "epoch": 2067} {"train_loss": -6.24323844909668, "global_step": 86822, "epoch": 2067} {"train_loss": -6.263755798339844, "global_step": 86823, "epoch": 2067} {"train_loss": -6.270819664001465, "global_step": 86824, "epoch": 2067} {"train_loss": -6.280058860778809, "global_step": 86825, "epoch": 2067} {"train_loss": -6.159430980682373, "global_step": 86826, "epoch": 2067} {"train_loss": -6.333617210388184, "global_step": 86827, "epoch": 2067} {"train_loss": -6.350492477416992, "global_step": 86828, "epoch": 2067} {"train_loss": -6.2985029220581055, "global_step": 86829, "epoch": 2067} {"train_loss": -6.23582649230957, "global_step": 86830, "epoch": 2067} {"train_loss": -6.209362983703613, "global_step": 86831, "epoch": 2067} {"train_loss": -6.2349700927734375, "global_step": 86832, "epoch": 2067} {"train_loss": -6.272148132324219, "global_step": 86833, "epoch": 2067} {"train_loss": -6.248049736022949, "global_step": 86834, "epoch": 2067} {"train_loss": -6.25473690032959, "global_step": 86835, "epoch": 2067} {"train_loss": -6.139588832855225, "global_step": 86836, "epoch": 2067} {"train_loss": -6.271943092346191, "global_step": 86837, "epoch": 2067} {"train_loss": -6.386876106262207, "global_step": 86838, "epoch": 2067} {"train_loss": -6.283736228942871, "global_step": 86839, "epoch": 2067} {"train_loss": -6.319449424743652, "global_step": 86840, "epoch": 2067} {"train_loss": -6.135970115661621, "global_step": 86841, "epoch": 2067} {"train_loss": -6.1828742027282715, "global_step": 86842, "epoch": 2067} {"train_loss": -6.1568684577941895, "global_step": 86843, "epoch": 2067} {"train_loss": -6.2627153396606445, "global_step": 86844, "epoch": 2067} {"train_loss": -6.249650001525879, "global_step": 86845, "epoch": 2067} {"train_loss": -6.188382625579834, "global_step": 86846, "epoch": 2067} {"train_loss": -6.3201165199279785, "global_step": 86847, "epoch": 2067} {"train_loss": -6.193465709686279, "global_step": 86848, "epoch": 2067} {"train_loss": -6.32304573059082, "global_step": 86849, "epoch": 2067} {"train_loss": -6.240851402282715, "global_step": 86850, "epoch": 2067} {"train_loss": -6.153317451477051, "global_step": 86851, "epoch": 2067} {"train_loss": -6.1660966873168945, "global_step": 86852, "epoch": 2067} {"train_loss": -6.30582332611084, "global_step": 86853, "epoch": 2067} {"train_loss": -6.294796943664551, "global_step": 86854, "epoch": 2067} {"train_loss": -6.247520673842657, "global_step": 86855, "epoch": 2067, "val_loss": 62832.0546875} {"train_loss": -6.352496147155762, "global_step": 86856, "epoch": 2068} {"train_loss": -6.359194755554199, "global_step": 86857, "epoch": 2068} {"train_loss": -6.324357986450195, "global_step": 86858, "epoch": 2068} {"train_loss": -6.263835430145264, "global_step": 86859, "epoch": 2068} {"train_loss": -6.21380090713501, "global_step": 86860, "epoch": 2068} {"train_loss": -6.182535171508789, "global_step": 86861, "epoch": 2068} {"train_loss": -6.269256591796875, "global_step": 86862, "epoch": 2068} {"train_loss": -6.202996253967285, "global_step": 86863, "epoch": 2068} {"train_loss": -6.1264543533325195, "global_step": 86864, "epoch": 2068} {"train_loss": -6.119738578796387, "global_step": 86865, "epoch": 2068} {"train_loss": -6.081086158752441, "global_step": 86866, "epoch": 2068} {"train_loss": -6.2871294021606445, "global_step": 86867, "epoch": 2068} {"train_loss": -6.15224552154541, "global_step": 86868, "epoch": 2068} {"train_loss": -5.98390007019043, "global_step": 86869, "epoch": 2068} {"train_loss": -6.144346237182617, "global_step": 86870, "epoch": 2068} {"train_loss": -5.989606857299805, "global_step": 86871, "epoch": 2068} {"train_loss": -6.068889141082764, "global_step": 86872, "epoch": 2068} {"train_loss": -6.134510040283203, "global_step": 86873, "epoch": 2068} {"train_loss": -5.981209754943848, "global_step": 86874, "epoch": 2068} {"train_loss": -6.0848541259765625, "global_step": 86875, "epoch": 2068} {"train_loss": -5.966897964477539, "global_step": 86876, "epoch": 2068} {"train_loss": -6.195683479309082, "global_step": 86877, "epoch": 2068} {"train_loss": -6.014496803283691, "global_step": 86878, "epoch": 2068} {"train_loss": -6.0266852378845215, "global_step": 86879, "epoch": 2068} {"train_loss": -6.215594291687012, "global_step": 86880, "epoch": 2068} {"train_loss": -6.122125148773193, "global_step": 86881, "epoch": 2068} {"train_loss": -6.170331001281738, "global_step": 86882, "epoch": 2068} {"train_loss": -6.083107948303223, "global_step": 86883, "epoch": 2068} {"train_loss": -6.08407735824585, "global_step": 86884, "epoch": 2068} {"train_loss": -6.175239562988281, "global_step": 86885, "epoch": 2068} {"train_loss": -6.198516845703125, "global_step": 86886, "epoch": 2068} {"train_loss": -6.119776248931885, "global_step": 86887, "epoch": 2068} {"train_loss": -6.205241680145264, "global_step": 86888, "epoch": 2068} {"train_loss": -6.144423484802246, "global_step": 86889, "epoch": 2068} {"train_loss": -6.195974349975586, "global_step": 86890, "epoch": 2068} {"train_loss": -6.1247782707214355, "global_step": 86891, "epoch": 2068} {"train_loss": -6.333812713623047, "global_step": 86892, "epoch": 2068} {"train_loss": -6.065330505371094, "global_step": 86893, "epoch": 2068} {"train_loss": -6.083712100982666, "global_step": 86894, "epoch": 2068} {"train_loss": -6.277819633483887, "global_step": 86895, "epoch": 2068} {"train_loss": -6.14877986907959, "global_step": 86896, "epoch": 2068} {"train_loss": -6.153853518622262, "global_step": 86897, "epoch": 2068, "val_loss": 62951.35546875} {"train_loss": -6.244518756866455, "global_step": 86898, "epoch": 2069} {"train_loss": -6.208963394165039, "global_step": 86899, "epoch": 2069} {"train_loss": -6.225264549255371, "global_step": 86900, "epoch": 2069} {"train_loss": -6.115616798400879, "global_step": 86901, "epoch": 2069} {"train_loss": -6.232616424560547, "global_step": 86902, "epoch": 2069} {"train_loss": -6.199637413024902, "global_step": 86903, "epoch": 2069} {"train_loss": -6.172163963317871, "global_step": 86904, "epoch": 2069} {"train_loss": -6.366177558898926, "global_step": 86905, "epoch": 2069} {"train_loss": -6.230449676513672, "global_step": 86906, "epoch": 2069} {"train_loss": -6.209650993347168, "global_step": 86907, "epoch": 2069} {"train_loss": -6.247285842895508, "global_step": 86908, "epoch": 2069} {"train_loss": -6.235039710998535, "global_step": 86909, "epoch": 2069} {"train_loss": -6.228097915649414, "global_step": 86910, "epoch": 2069} {"train_loss": -6.299751281738281, "global_step": 86911, "epoch": 2069} {"train_loss": -6.247828483581543, "global_step": 86912, "epoch": 2069} {"train_loss": -6.332073211669922, "global_step": 86913, "epoch": 2069} {"train_loss": -6.247265815734863, "global_step": 86914, "epoch": 2069} {"train_loss": -6.197759628295898, "global_step": 86915, "epoch": 2069} {"train_loss": -6.306527614593506, "global_step": 86916, "epoch": 2069} {"train_loss": -6.281414985656738, "global_step": 86917, "epoch": 2069} {"train_loss": -6.189048767089844, "global_step": 86918, "epoch": 2069} {"train_loss": -6.23758602142334, "global_step": 86919, "epoch": 2069} {"train_loss": -6.271266937255859, "global_step": 86920, "epoch": 2069} {"train_loss": -6.292812347412109, "global_step": 86921, "epoch": 2069} {"train_loss": -6.16110897064209, "global_step": 86922, "epoch": 2069} {"train_loss": -6.355770111083984, "global_step": 86923, "epoch": 2069} {"train_loss": -6.199745178222656, "global_step": 86924, "epoch": 2069} {"train_loss": -6.238150119781494, "global_step": 86925, "epoch": 2069} {"train_loss": -6.265544414520264, "global_step": 86926, "epoch": 2069} {"train_loss": -6.247899532318115, "global_step": 86927, "epoch": 2069} {"train_loss": -6.177439212799072, "global_step": 86928, "epoch": 2069} {"train_loss": -6.281829833984375, "global_step": 86929, "epoch": 2069} {"train_loss": -6.127175807952881, "global_step": 86930, "epoch": 2069} {"train_loss": -6.178845405578613, "global_step": 86931, "epoch": 2069} {"train_loss": -6.106699466705322, "global_step": 86932, "epoch": 2069} {"train_loss": -6.236171722412109, "global_step": 86933, "epoch": 2069} {"train_loss": -6.182211399078369, "global_step": 86934, "epoch": 2069} {"train_loss": -6.148708820343018, "global_step": 86935, "epoch": 2069} {"train_loss": -6.193533420562744, "global_step": 86936, "epoch": 2069} {"train_loss": -6.114903450012207, "global_step": 86937, "epoch": 2069} {"train_loss": -6.059108734130859, "global_step": 86938, "epoch": 2069} {"train_loss": -6.223055203755696, "global_step": 86939, "epoch": 2069, "val_loss": 62899.2265625} {"train_loss": -6.194437026977539, "global_step": 86940, "epoch": 2070} {"train_loss": -6.142979621887207, "global_step": 86941, "epoch": 2070} {"train_loss": -6.225095272064209, "global_step": 86942, "epoch": 2070} {"train_loss": -6.2970709800720215, "global_step": 86943, "epoch": 2070} {"train_loss": -6.289475440979004, "global_step": 86944, "epoch": 2070} {"train_loss": -6.2303924560546875, "global_step": 86945, "epoch": 2070} {"train_loss": -6.160702705383301, "global_step": 86946, "epoch": 2070} {"train_loss": -6.158201217651367, "global_step": 86947, "epoch": 2070} {"train_loss": -6.15626335144043, "global_step": 86948, "epoch": 2070} {"train_loss": -6.336167335510254, "global_step": 86949, "epoch": 2070} {"train_loss": -6.25362491607666, "global_step": 86950, "epoch": 2070} {"train_loss": -6.410656929016113, "global_step": 86951, "epoch": 2070} {"train_loss": -6.257236003875732, "global_step": 86952, "epoch": 2070} {"train_loss": -6.272915840148926, "global_step": 86953, "epoch": 2070} {"train_loss": -6.316959381103516, "global_step": 86954, "epoch": 2070} {"train_loss": -6.231637954711914, "global_step": 86955, "epoch": 2070} {"train_loss": -6.132198810577393, "global_step": 86956, "epoch": 2070} {"train_loss": -6.284276962280273, "global_step": 86957, "epoch": 2070} {"train_loss": -6.098913669586182, "global_step": 86958, "epoch": 2070} {"train_loss": -6.289875507354736, "global_step": 86959, "epoch": 2070} {"train_loss": -6.2304301261901855, "global_step": 86960, "epoch": 2070} {"train_loss": -6.31047248840332, "global_step": 86961, "epoch": 2070} {"train_loss": -6.218825340270996, "global_step": 86962, "epoch": 2070} {"train_loss": -6.245664596557617, "global_step": 86963, "epoch": 2070} {"train_loss": -6.251884460449219, "global_step": 86964, "epoch": 2070} {"train_loss": -6.178276062011719, "global_step": 86965, "epoch": 2070} {"train_loss": -6.193072319030762, "global_step": 86966, "epoch": 2070} {"train_loss": -6.245846748352051, "global_step": 86967, "epoch": 2070} {"train_loss": -6.236478805541992, "global_step": 86968, "epoch": 2070} {"train_loss": -6.182621002197266, "global_step": 86969, "epoch": 2070} {"train_loss": -6.2481889724731445, "global_step": 86970, "epoch": 2070} {"train_loss": -6.26776123046875, "global_step": 86971, "epoch": 2070} {"train_loss": -6.250329971313477, "global_step": 86972, "epoch": 2070} {"train_loss": -6.280324459075928, "global_step": 86973, "epoch": 2070} {"train_loss": -6.155783653259277, "global_step": 86974, "epoch": 2070} {"train_loss": -6.2016401290893555, "global_step": 86975, "epoch": 2070} {"train_loss": -6.20566987991333, "global_step": 86976, "epoch": 2070} {"train_loss": -6.228431224822998, "global_step": 86977, "epoch": 2070} {"train_loss": -6.267269134521484, "global_step": 86978, "epoch": 2070} {"train_loss": -6.317657470703125, "global_step": 86979, "epoch": 2070} {"train_loss": -6.327989101409912, "global_step": 86980, "epoch": 2070} {"train_loss": -6.239617892674038, "global_step": 86981, "epoch": 2070, "val_loss": 62920.7265625} {"train_loss": -6.200117111206055, "global_step": 86982, "epoch": 2071} {"train_loss": -6.247565746307373, "global_step": 86983, "epoch": 2071} {"train_loss": -6.235284805297852, "global_step": 86984, "epoch": 2071} {"train_loss": -6.277237415313721, "global_step": 86985, "epoch": 2071} {"train_loss": -6.157677173614502, "global_step": 86986, "epoch": 2071} {"train_loss": -6.152897834777832, "global_step": 86987, "epoch": 2071} {"train_loss": -6.410669326782227, "global_step": 86988, "epoch": 2071} {"train_loss": -6.074744701385498, "global_step": 86989, "epoch": 2071} {"train_loss": -6.157410621643066, "global_step": 86990, "epoch": 2071} {"train_loss": -6.090367317199707, "global_step": 86991, "epoch": 2071} {"train_loss": -6.219674110412598, "global_step": 86992, "epoch": 2071} {"train_loss": -6.096745491027832, "global_step": 86993, "epoch": 2071} {"train_loss": -6.194673538208008, "global_step": 86994, "epoch": 2071} {"train_loss": -6.1917595863342285, "global_step": 86995, "epoch": 2071} {"train_loss": -6.249444961547852, "global_step": 86996, "epoch": 2071} {"train_loss": -6.2089056968688965, "global_step": 86997, "epoch": 2071} {"train_loss": -6.330390930175781, "global_step": 86998, "epoch": 2071} {"train_loss": -6.33349084854126, "global_step": 86999, "epoch": 2071} {"train_loss": -6.1725592613220215, "global_step": 87000, "epoch": 2071} {"train_loss": -6.27217960357666, "global_step": 87001, "epoch": 2071} {"train_loss": -6.1862335205078125, "global_step": 87002, "epoch": 2071} {"train_loss": -6.267402648925781, "global_step": 87003, "epoch": 2071} {"train_loss": -6.290885925292969, "global_step": 87004, "epoch": 2071} {"train_loss": -6.1831865310668945, "global_step": 87005, "epoch": 2071} {"train_loss": -6.287200927734375, "global_step": 87006, "epoch": 2071} {"train_loss": -6.370424270629883, "global_step": 87007, "epoch": 2071} {"train_loss": -6.172394752502441, "global_step": 87008, "epoch": 2071} {"train_loss": -6.312191963195801, "global_step": 87009, "epoch": 2071} {"train_loss": -6.224601745605469, "global_step": 87010, "epoch": 2071} {"train_loss": -6.232146739959717, "global_step": 87011, "epoch": 2071} {"train_loss": -6.303670883178711, "global_step": 87012, "epoch": 2071} {"train_loss": -6.180340766906738, "global_step": 87013, "epoch": 2071} {"train_loss": -6.227910041809082, "global_step": 87014, "epoch": 2071} {"train_loss": -6.365601539611816, "global_step": 87015, "epoch": 2071} {"train_loss": -6.268012523651123, "global_step": 87016, "epoch": 2071} {"train_loss": -6.179859161376953, "global_step": 87017, "epoch": 2071} {"train_loss": -6.241333961486816, "global_step": 87018, "epoch": 2071} {"train_loss": -6.219460964202881, "global_step": 87019, "epoch": 2071} {"train_loss": -6.196596145629883, "global_step": 87020, "epoch": 2071} {"train_loss": -6.243538856506348, "global_step": 87021, "epoch": 2071} {"train_loss": -6.275184154510498, "global_step": 87022, "epoch": 2071} {"train_loss": -6.233020453225999, "global_step": 87023, "epoch": 2071, "val_loss": 62783.74609375} {"train_loss": -6.308941841125488, "global_step": 87024, "epoch": 2072} {"train_loss": -6.238947868347168, "global_step": 87025, "epoch": 2072} {"train_loss": -6.214874267578125, "global_step": 87026, "epoch": 2072} {"train_loss": -6.140964508056641, "global_step": 87027, "epoch": 2072} {"train_loss": -6.2216339111328125, "global_step": 87028, "epoch": 2072} {"train_loss": -6.19737434387207, "global_step": 87029, "epoch": 2072} {"train_loss": -6.1909966468811035, "global_step": 87030, "epoch": 2072} {"train_loss": -6.2028045654296875, "global_step": 87031, "epoch": 2072} {"train_loss": -6.257135391235352, "global_step": 87032, "epoch": 2072} {"train_loss": -6.151366710662842, "global_step": 87033, "epoch": 2072} {"train_loss": -6.241535186767578, "global_step": 87034, "epoch": 2072} {"train_loss": -6.246073246002197, "global_step": 87035, "epoch": 2072} {"train_loss": -6.306083679199219, "global_step": 87036, "epoch": 2072} {"train_loss": -6.349609375, "global_step": 87037, "epoch": 2072} {"train_loss": -6.252404689788818, "global_step": 87038, "epoch": 2072} {"train_loss": -6.254947662353516, "global_step": 87039, "epoch": 2072} {"train_loss": -6.254221439361572, "global_step": 87040, "epoch": 2072} {"train_loss": -6.207956314086914, "global_step": 87041, "epoch": 2072} {"train_loss": -6.129815101623535, "global_step": 87042, "epoch": 2072} {"train_loss": -6.346385955810547, "global_step": 87043, "epoch": 2072} {"train_loss": -6.258014678955078, "global_step": 87044, "epoch": 2072} {"train_loss": -6.264366149902344, "global_step": 87045, "epoch": 2072} {"train_loss": -6.322416305541992, "global_step": 87046, "epoch": 2072} {"train_loss": -6.2478508949279785, "global_step": 87047, "epoch": 2072} {"train_loss": -6.270298957824707, "global_step": 87048, "epoch": 2072} {"train_loss": -6.230316162109375, "global_step": 87049, "epoch": 2072} {"train_loss": -6.215353965759277, "global_step": 87050, "epoch": 2072} {"train_loss": -6.199939727783203, "global_step": 87051, "epoch": 2072} {"train_loss": -6.139777183532715, "global_step": 87052, "epoch": 2072} {"train_loss": -6.117028713226318, "global_step": 87053, "epoch": 2072} {"train_loss": -6.221424102783203, "global_step": 87054, "epoch": 2072} {"train_loss": -6.153153419494629, "global_step": 87055, "epoch": 2072} {"train_loss": -6.059425354003906, "global_step": 87056, "epoch": 2072} {"train_loss": -6.16285514831543, "global_step": 87057, "epoch": 2072} {"train_loss": -6.031093120574951, "global_step": 87058, "epoch": 2072} {"train_loss": -6.20161247253418, "global_step": 87059, "epoch": 2072} {"train_loss": -6.25607442855835, "global_step": 87060, "epoch": 2072} {"train_loss": -6.114646911621094, "global_step": 87061, "epoch": 2072} {"train_loss": -6.146123886108398, "global_step": 87062, "epoch": 2072} {"train_loss": -6.269726753234863, "global_step": 87063, "epoch": 2072} {"train_loss": -6.18034029006958, "global_step": 87064, "epoch": 2072} {"train_loss": -6.212905293419247, "global_step": 87065, "epoch": 2072, "val_loss": 63322.2421875} {"train_loss": -6.248311996459961, "global_step": 87066, "epoch": 2073} {"train_loss": -6.240734100341797, "global_step": 87067, "epoch": 2073} {"train_loss": -6.079327583312988, "global_step": 87068, "epoch": 2073} {"train_loss": -6.183626174926758, "global_step": 87069, "epoch": 2073} {"train_loss": -6.287332534790039, "global_step": 87070, "epoch": 2073} {"train_loss": -6.172822952270508, "global_step": 87071, "epoch": 2073} {"train_loss": -6.253129005432129, "global_step": 87072, "epoch": 2073} {"train_loss": -6.117959022521973, "global_step": 87073, "epoch": 2073} {"train_loss": -6.235550880432129, "global_step": 87074, "epoch": 2073} {"train_loss": -6.322026252746582, "global_step": 87075, "epoch": 2073} {"train_loss": -6.2877349853515625, "global_step": 87076, "epoch": 2073} {"train_loss": -6.297013282775879, "global_step": 87077, "epoch": 2073} {"train_loss": -6.274334907531738, "global_step": 87078, "epoch": 2073} {"train_loss": -6.1772918701171875, "global_step": 87079, "epoch": 2073} {"train_loss": -6.310815811157227, "global_step": 87080, "epoch": 2073} {"train_loss": -6.29216194152832, "global_step": 87081, "epoch": 2073} {"train_loss": -6.255611896514893, "global_step": 87082, "epoch": 2073} {"train_loss": -6.250191688537598, "global_step": 87083, "epoch": 2073} {"train_loss": -6.212747097015381, "global_step": 87084, "epoch": 2073} {"train_loss": -6.2486162185668945, "global_step": 87085, "epoch": 2073} {"train_loss": -6.215986251831055, "global_step": 87086, "epoch": 2073} {"train_loss": -6.287531852722168, "global_step": 87087, "epoch": 2073} {"train_loss": -6.259553909301758, "global_step": 87088, "epoch": 2073} {"train_loss": -6.0784101486206055, "global_step": 87089, "epoch": 2073} {"train_loss": -6.2879438400268555, "global_step": 87090, "epoch": 2073} {"train_loss": -6.334549903869629, "global_step": 87091, "epoch": 2073} {"train_loss": -6.296865463256836, "global_step": 87092, "epoch": 2073} {"train_loss": -6.204971790313721, "global_step": 87093, "epoch": 2073} {"train_loss": -6.258904457092285, "global_step": 87094, "epoch": 2073} {"train_loss": -6.246191024780273, "global_step": 87095, "epoch": 2073} {"train_loss": -6.367650032043457, "global_step": 87096, "epoch": 2073} {"train_loss": -6.199804306030273, "global_step": 87097, "epoch": 2073} {"train_loss": -6.217400074005127, "global_step": 87098, "epoch": 2073} {"train_loss": -6.344379901885986, "global_step": 87099, "epoch": 2073} {"train_loss": -6.153979301452637, "global_step": 87100, "epoch": 2073} {"train_loss": -6.161459922790527, "global_step": 87101, "epoch": 2073} {"train_loss": -6.2074384689331055, "global_step": 87102, "epoch": 2073} {"train_loss": -6.183401107788086, "global_step": 87103, "epoch": 2073} {"train_loss": -6.194613456726074, "global_step": 87104, "epoch": 2073} {"train_loss": -6.247443199157715, "global_step": 87105, "epoch": 2073} {"train_loss": -6.26304292678833, "global_step": 87106, "epoch": 2073} {"train_loss": -6.237182083584013, "global_step": 87107, "epoch": 2073, "val_loss": 62789.6796875} {"train_loss": -6.341095924377441, "global_step": 87108, "epoch": 2074} {"train_loss": -6.186311721801758, "global_step": 87109, "epoch": 2074} {"train_loss": -6.298947334289551, "global_step": 87110, "epoch": 2074} {"train_loss": -6.19467306137085, "global_step": 87111, "epoch": 2074} {"train_loss": -6.318930149078369, "global_step": 87112, "epoch": 2074} {"train_loss": -6.310258388519287, "global_step": 87113, "epoch": 2074} {"train_loss": -6.214686393737793, "global_step": 87114, "epoch": 2074} {"train_loss": -6.240034103393555, "global_step": 87115, "epoch": 2074} {"train_loss": -6.100217342376709, "global_step": 87116, "epoch": 2074} {"train_loss": -6.271862983703613, "global_step": 87117, "epoch": 2074} {"train_loss": -6.252623081207275, "global_step": 87118, "epoch": 2074} {"train_loss": -6.172493934631348, "global_step": 87119, "epoch": 2074} {"train_loss": -6.3402533531188965, "global_step": 87120, "epoch": 2074} {"train_loss": -6.294461727142334, "global_step": 87121, "epoch": 2074} {"train_loss": -6.130262851715088, "global_step": 87122, "epoch": 2074} {"train_loss": -6.267690658569336, "global_step": 87123, "epoch": 2074} {"train_loss": -6.21074914932251, "global_step": 87124, "epoch": 2074} {"train_loss": -6.283359527587891, "global_step": 87125, "epoch": 2074} {"train_loss": -6.263741493225098, "global_step": 87126, "epoch": 2074} {"train_loss": -6.219277381896973, "global_step": 87127, "epoch": 2074} {"train_loss": -6.085371971130371, "global_step": 87128, "epoch": 2074} {"train_loss": -6.217256546020508, "global_step": 87129, "epoch": 2074} {"train_loss": -6.251760482788086, "global_step": 87130, "epoch": 2074} {"train_loss": -6.099932670593262, "global_step": 87131, "epoch": 2074} {"train_loss": -6.249942779541016, "global_step": 87132, "epoch": 2074} {"train_loss": -6.057056427001953, "global_step": 87133, "epoch": 2074} {"train_loss": -6.059201240539551, "global_step": 87134, "epoch": 2074} {"train_loss": -6.19387674331665, "global_step": 87135, "epoch": 2074} {"train_loss": -6.13377571105957, "global_step": 87136, "epoch": 2074} {"train_loss": -6.302296161651611, "global_step": 87137, "epoch": 2074} {"train_loss": -6.060449600219727, "global_step": 87138, "epoch": 2074} {"train_loss": -6.20493221282959, "global_step": 87139, "epoch": 2074} {"train_loss": -6.204607963562012, "global_step": 87140, "epoch": 2074} {"train_loss": -6.176347732543945, "global_step": 87141, "epoch": 2074} {"train_loss": -6.136318683624268, "global_step": 87142, "epoch": 2074} {"train_loss": -6.028195381164551, "global_step": 87143, "epoch": 2074} {"train_loss": -6.236701965332031, "global_step": 87144, "epoch": 2074} {"train_loss": -6.242090225219727, "global_step": 87145, "epoch": 2074} {"train_loss": -6.105775833129883, "global_step": 87146, "epoch": 2074} {"train_loss": -6.108088493347168, "global_step": 87147, "epoch": 2074} {"train_loss": -6.1982879638671875, "global_step": 87148, "epoch": 2074} {"train_loss": -6.200974782307942, "global_step": 87149, "epoch": 2074, "val_loss": 62860.2265625} {"train_loss": -6.242572784423828, "global_step": 87150, "epoch": 2075} {"train_loss": -6.167080879211426, "global_step": 87151, "epoch": 2075} {"train_loss": -6.169135570526123, "global_step": 87152, "epoch": 2075} {"train_loss": -6.0900163650512695, "global_step": 87153, "epoch": 2075} {"train_loss": -6.22723388671875, "global_step": 87154, "epoch": 2075} {"train_loss": -6.115847587585449, "global_step": 87155, "epoch": 2075} {"train_loss": -6.17623233795166, "global_step": 87156, "epoch": 2075} {"train_loss": -6.283198356628418, "global_step": 87157, "epoch": 2075} {"train_loss": -6.261315822601318, "global_step": 87158, "epoch": 2075} {"train_loss": -6.209296703338623, "global_step": 87159, "epoch": 2075} {"train_loss": -6.184486389160156, "global_step": 87160, "epoch": 2075} {"train_loss": -6.23530387878418, "global_step": 87161, "epoch": 2075} {"train_loss": -6.223203659057617, "global_step": 87162, "epoch": 2075} {"train_loss": -6.2189202308654785, "global_step": 87163, "epoch": 2075} {"train_loss": -6.262391567230225, "global_step": 87164, "epoch": 2075} {"train_loss": -6.171447277069092, "global_step": 87165, "epoch": 2075} {"train_loss": -6.139660835266113, "global_step": 87166, "epoch": 2075} {"train_loss": -6.219510555267334, "global_step": 87167, "epoch": 2075} {"train_loss": -6.148258209228516, "global_step": 87168, "epoch": 2075} {"train_loss": -6.119397163391113, "global_step": 87169, "epoch": 2075} {"train_loss": -6.189416408538818, "global_step": 87170, "epoch": 2075} {"train_loss": -6.170507907867432, "global_step": 87171, "epoch": 2075} {"train_loss": -6.182880401611328, "global_step": 87172, "epoch": 2075} {"train_loss": -6.214125633239746, "global_step": 87173, "epoch": 2075} {"train_loss": -6.1143035888671875, "global_step": 87174, "epoch": 2075} {"train_loss": -6.0866899490356445, "global_step": 87175, "epoch": 2075} {"train_loss": -6.284420967102051, "global_step": 87176, "epoch": 2075} {"train_loss": -6.1707048416137695, "global_step": 87177, "epoch": 2075} {"train_loss": -6.120236396789551, "global_step": 87178, "epoch": 2075} {"train_loss": -6.225668907165527, "global_step": 87179, "epoch": 2075} {"train_loss": -6.044119834899902, "global_step": 87180, "epoch": 2075} {"train_loss": -6.267978191375732, "global_step": 87181, "epoch": 2075} {"train_loss": -5.9835205078125, "global_step": 87182, "epoch": 2075} {"train_loss": -6.0316667556762695, "global_step": 87183, "epoch": 2075} {"train_loss": -6.312224864959717, "global_step": 87184, "epoch": 2075} {"train_loss": -6.139176368713379, "global_step": 87185, "epoch": 2075} {"train_loss": -6.266229629516602, "global_step": 87186, "epoch": 2075} {"train_loss": -6.155381202697754, "global_step": 87187, "epoch": 2075} {"train_loss": -6.103054046630859, "global_step": 87188, "epoch": 2075} {"train_loss": -6.3392486572265625, "global_step": 87189, "epoch": 2075} {"train_loss": -6.09737491607666, "global_step": 87190, "epoch": 2075} {"train_loss": -6.1811889580317905, "global_step": 87191, "epoch": 2075, "val_loss": 62923.7734375} {"train_loss": -6.185543060302734, "global_step": 87192, "epoch": 2076} {"train_loss": -6.24105167388916, "global_step": 87193, "epoch": 2076} {"train_loss": -6.241006851196289, "global_step": 87194, "epoch": 2076} {"train_loss": -6.275205612182617, "global_step": 87195, "epoch": 2076} {"train_loss": -6.251126766204834, "global_step": 87196, "epoch": 2076} {"train_loss": -6.250653266906738, "global_step": 87197, "epoch": 2076} {"train_loss": -6.229362487792969, "global_step": 87198, "epoch": 2076} {"train_loss": -6.240767478942871, "global_step": 87199, "epoch": 2076} {"train_loss": -6.169036865234375, "global_step": 87200, "epoch": 2076} {"train_loss": -6.245275497436523, "global_step": 87201, "epoch": 2076} {"train_loss": -6.252786159515381, "global_step": 87202, "epoch": 2076} {"train_loss": -6.2753190994262695, "global_step": 87203, "epoch": 2076} {"train_loss": -6.125114440917969, "global_step": 87204, "epoch": 2076} {"train_loss": -6.296742916107178, "global_step": 87205, "epoch": 2076} {"train_loss": -6.320655822753906, "global_step": 87206, "epoch": 2076} {"train_loss": -6.251288414001465, "global_step": 87207, "epoch": 2076} {"train_loss": -6.185110092163086, "global_step": 87208, "epoch": 2076} {"train_loss": -6.314797878265381, "global_step": 87209, "epoch": 2076} {"train_loss": -6.334047794342041, "global_step": 87210, "epoch": 2076} {"train_loss": -6.206995010375977, "global_step": 87211, "epoch": 2076} {"train_loss": -6.1631622314453125, "global_step": 87212, "epoch": 2076} {"train_loss": -6.202759742736816, "global_step": 87213, "epoch": 2076} {"train_loss": -6.2588982582092285, "global_step": 87214, "epoch": 2076} {"train_loss": -6.357547760009766, "global_step": 87215, "epoch": 2076} {"train_loss": -6.252647399902344, "global_step": 87216, "epoch": 2076} {"train_loss": -6.304673194885254, "global_step": 87217, "epoch": 2076} {"train_loss": -6.291783332824707, "global_step": 87218, "epoch": 2076} {"train_loss": -6.15322208404541, "global_step": 87219, "epoch": 2076} {"train_loss": -6.295693874359131, "global_step": 87220, "epoch": 2076} {"train_loss": -6.21930456161499, "global_step": 87221, "epoch": 2076} {"train_loss": -6.226008415222168, "global_step": 87222, "epoch": 2076} {"train_loss": -6.152646541595459, "global_step": 87223, "epoch": 2076} {"train_loss": -6.2242631912231445, "global_step": 87224, "epoch": 2076} {"train_loss": -6.175512313842773, "global_step": 87225, "epoch": 2076} {"train_loss": -6.234603404998779, "global_step": 87226, "epoch": 2076} {"train_loss": -6.025969505310059, "global_step": 87227, "epoch": 2076} {"train_loss": -6.27631950378418, "global_step": 87228, "epoch": 2076} {"train_loss": -6.13340950012207, "global_step": 87229, "epoch": 2076} {"train_loss": -6.121477127075195, "global_step": 87230, "epoch": 2076} {"train_loss": -6.206981658935547, "global_step": 87231, "epoch": 2076} {"train_loss": -6.1768364906311035, "global_step": 87232, "epoch": 2076} {"train_loss": -6.2275664465768, "global_step": 87233, "epoch": 2076, "val_loss": 62871.265625} {"train_loss": -6.187388896942139, "global_step": 87234, "epoch": 2077} {"train_loss": -6.104644775390625, "global_step": 87235, "epoch": 2077} {"train_loss": -6.2111358642578125, "global_step": 87236, "epoch": 2077} {"train_loss": -6.116275787353516, "global_step": 87237, "epoch": 2077} {"train_loss": -6.204158782958984, "global_step": 87238, "epoch": 2077} {"train_loss": -6.2160420417785645, "global_step": 87239, "epoch": 2077} {"train_loss": -6.412592887878418, "global_step": 87240, "epoch": 2077} {"train_loss": -6.090976715087891, "global_step": 87241, "epoch": 2077} {"train_loss": -6.104101181030273, "global_step": 87242, "epoch": 2077} {"train_loss": -6.188744068145752, "global_step": 87243, "epoch": 2077} {"train_loss": -6.04429817199707, "global_step": 87244, "epoch": 2077} {"train_loss": -6.131351947784424, "global_step": 87245, "epoch": 2077} {"train_loss": -6.160332679748535, "global_step": 87246, "epoch": 2077} {"train_loss": -6.277305603027344, "global_step": 87247, "epoch": 2077} {"train_loss": -6.202305793762207, "global_step": 87248, "epoch": 2077} {"train_loss": -6.225334167480469, "global_step": 87249, "epoch": 2077} {"train_loss": -6.171011924743652, "global_step": 87250, "epoch": 2077} {"train_loss": -6.248081684112549, "global_step": 87251, "epoch": 2077} {"train_loss": -6.159623146057129, "global_step": 87252, "epoch": 2077} {"train_loss": -6.2327423095703125, "global_step": 87253, "epoch": 2077} {"train_loss": -6.212061882019043, "global_step": 87254, "epoch": 2077} {"train_loss": -6.294745445251465, "global_step": 87255, "epoch": 2077} {"train_loss": -6.217323303222656, "global_step": 87256, "epoch": 2077} {"train_loss": -6.176090717315674, "global_step": 87257, "epoch": 2077} {"train_loss": -6.229166030883789, "global_step": 87258, "epoch": 2077} {"train_loss": -6.201992511749268, "global_step": 87259, "epoch": 2077} {"train_loss": -6.222667217254639, "global_step": 87260, "epoch": 2077} {"train_loss": -6.346033573150635, "global_step": 87261, "epoch": 2077} {"train_loss": -6.143606662750244, "global_step": 87262, "epoch": 2077} {"train_loss": -6.115815162658691, "global_step": 87263, "epoch": 2077} {"train_loss": -6.194459915161133, "global_step": 87264, "epoch": 2077} {"train_loss": -6.178773403167725, "global_step": 87265, "epoch": 2077} {"train_loss": -6.1528778076171875, "global_step": 87266, "epoch": 2077} {"train_loss": -6.124991416931152, "global_step": 87267, "epoch": 2077} {"train_loss": -6.221792221069336, "global_step": 87268, "epoch": 2077} {"train_loss": -6.2497076988220215, "global_step": 87269, "epoch": 2077} {"train_loss": -6.2576823234558105, "global_step": 87270, "epoch": 2077} {"train_loss": -6.174999237060547, "global_step": 87271, "epoch": 2077} {"train_loss": -6.149538040161133, "global_step": 87272, "epoch": 2077} {"train_loss": -6.268959999084473, "global_step": 87273, "epoch": 2077} {"train_loss": -6.324251651763916, "global_step": 87274, "epoch": 2077} {"train_loss": -6.199339333034697, "global_step": 87275, "epoch": 2077, "val_loss": 62793.2109375} {"train_loss": -6.259524345397949, "global_step": 87276, "epoch": 2078} {"train_loss": -6.344906806945801, "global_step": 87277, "epoch": 2078} {"train_loss": -6.386168003082275, "global_step": 87278, "epoch": 2078} {"train_loss": -6.204779148101807, "global_step": 87279, "epoch": 2078} {"train_loss": -6.275923728942871, "global_step": 87280, "epoch": 2078} {"train_loss": -6.257048606872559, "global_step": 87281, "epoch": 2078} {"train_loss": -6.196448802947998, "global_step": 87282, "epoch": 2078} {"train_loss": -6.295982837677002, "global_step": 87283, "epoch": 2078} {"train_loss": -6.355132102966309, "global_step": 87284, "epoch": 2078} {"train_loss": -6.280338287353516, "global_step": 87285, "epoch": 2078} {"train_loss": -6.286057949066162, "global_step": 87286, "epoch": 2078} {"train_loss": -6.224968910217285, "global_step": 87287, "epoch": 2078} {"train_loss": -6.315171718597412, "global_step": 87288, "epoch": 2078} {"train_loss": -6.186239719390869, "global_step": 87289, "epoch": 2078} {"train_loss": -6.206888675689697, "global_step": 87290, "epoch": 2078} {"train_loss": -6.19244384765625, "global_step": 87291, "epoch": 2078} {"train_loss": -6.295411586761475, "global_step": 87292, "epoch": 2078} {"train_loss": -6.275201797485352, "global_step": 87293, "epoch": 2078} {"train_loss": -6.317408561706543, "global_step": 87294, "epoch": 2078} {"train_loss": -6.199004650115967, "global_step": 87295, "epoch": 2078} {"train_loss": -6.232186317443848, "global_step": 87296, "epoch": 2078} {"train_loss": -6.285536766052246, "global_step": 87297, "epoch": 2078} {"train_loss": -6.2853007316589355, "global_step": 87298, "epoch": 2078} {"train_loss": -6.297133445739746, "global_step": 87299, "epoch": 2078} {"train_loss": -6.114977836608887, "global_step": 87300, "epoch": 2078} {"train_loss": -6.200527667999268, "global_step": 87301, "epoch": 2078} {"train_loss": -6.226144313812256, "global_step": 87302, "epoch": 2078} {"train_loss": -6.209194183349609, "global_step": 87303, "epoch": 2078} {"train_loss": -6.2595014572143555, "global_step": 87304, "epoch": 2078} {"train_loss": -6.331112861633301, "global_step": 87305, "epoch": 2078} {"train_loss": -6.328588485717773, "global_step": 87306, "epoch": 2078} {"train_loss": -6.213860511779785, "global_step": 87307, "epoch": 2078} {"train_loss": -6.243520736694336, "global_step": 87308, "epoch": 2078} {"train_loss": -6.291091442108154, "global_step": 87309, "epoch": 2078} {"train_loss": -6.14614200592041, "global_step": 87310, "epoch": 2078} {"train_loss": -6.150215148925781, "global_step": 87311, "epoch": 2078} {"train_loss": -6.188948631286621, "global_step": 87312, "epoch": 2078} {"train_loss": -6.183841705322266, "global_step": 87313, "epoch": 2078} {"train_loss": -6.093662261962891, "global_step": 87314, "epoch": 2078} {"train_loss": -6.267928600311279, "global_step": 87315, "epoch": 2078} {"train_loss": -6.112893104553223, "global_step": 87316, "epoch": 2078} {"train_loss": -6.242073002315703, "global_step": 87317, "epoch": 2078, "val_loss": 62871.90625} {"train_loss": -6.208043098449707, "global_step": 87318, "epoch": 2079} {"train_loss": -6.256451606750488, "global_step": 87319, "epoch": 2079} {"train_loss": -6.188261032104492, "global_step": 87320, "epoch": 2079} {"train_loss": -6.273402214050293, "global_step": 87321, "epoch": 2079} {"train_loss": -6.313271522521973, "global_step": 87322, "epoch": 2079} {"train_loss": -6.203203201293945, "global_step": 87323, "epoch": 2079} {"train_loss": -6.2745890617370605, "global_step": 87324, "epoch": 2079} {"train_loss": -6.253734588623047, "global_step": 87325, "epoch": 2079} {"train_loss": -6.095335006713867, "global_step": 87326, "epoch": 2079} {"train_loss": -6.295950412750244, "global_step": 87327, "epoch": 2079} {"train_loss": -6.388845443725586, "global_step": 87328, "epoch": 2079} {"train_loss": -6.242942810058594, "global_step": 87329, "epoch": 2079} {"train_loss": -6.211394786834717, "global_step": 87330, "epoch": 2079} {"train_loss": -6.248986721038818, "global_step": 87331, "epoch": 2079} {"train_loss": -6.09724235534668, "global_step": 87332, "epoch": 2079} {"train_loss": -6.120151519775391, "global_step": 87333, "epoch": 2079} {"train_loss": -6.228553295135498, "global_step": 87334, "epoch": 2079} {"train_loss": -6.220303535461426, "global_step": 87335, "epoch": 2079} {"train_loss": -6.157528877258301, "global_step": 87336, "epoch": 2079} {"train_loss": -6.2597856521606445, "global_step": 87337, "epoch": 2079} {"train_loss": -6.182994842529297, "global_step": 87338, "epoch": 2079} {"train_loss": -6.217535972595215, "global_step": 87339, "epoch": 2079} {"train_loss": -6.338456630706787, "global_step": 87340, "epoch": 2079} {"train_loss": -6.198122024536133, "global_step": 87341, "epoch": 2079} {"train_loss": -6.183621406555176, "global_step": 87342, "epoch": 2079} {"train_loss": -6.277132987976074, "global_step": 87343, "epoch": 2079} {"train_loss": -6.251211166381836, "global_step": 87344, "epoch": 2079} {"train_loss": -6.346362113952637, "global_step": 87345, "epoch": 2079} {"train_loss": -6.089742660522461, "global_step": 87346, "epoch": 2079} {"train_loss": -6.316498279571533, "global_step": 87347, "epoch": 2079} {"train_loss": -6.301090240478516, "global_step": 87348, "epoch": 2079} {"train_loss": -6.30324125289917, "global_step": 87349, "epoch": 2079} {"train_loss": -6.1419148445129395, "global_step": 87350, "epoch": 2079} {"train_loss": -6.342053413391113, "global_step": 87351, "epoch": 2079} {"train_loss": -6.315302848815918, "global_step": 87352, "epoch": 2079} {"train_loss": -6.151788234710693, "global_step": 87353, "epoch": 2079} {"train_loss": -6.122879981994629, "global_step": 87354, "epoch": 2079} {"train_loss": -6.255538463592529, "global_step": 87355, "epoch": 2079} {"train_loss": -6.1758270263671875, "global_step": 87356, "epoch": 2079} {"train_loss": -6.155124664306641, "global_step": 87357, "epoch": 2079} {"train_loss": -6.175479888916016, "global_step": 87358, "epoch": 2079} {"train_loss": -6.226943186351231, "global_step": 87359, "epoch": 2079, "val_loss": 63120.390625} {"train_loss": -6.102169990539551, "global_step": 87360, "epoch": 2080} {"train_loss": -6.320975303649902, "global_step": 87361, "epoch": 2080} {"train_loss": -6.271985054016113, "global_step": 87362, "epoch": 2080} {"train_loss": -6.029630184173584, "global_step": 87363, "epoch": 2080} {"train_loss": -6.168229103088379, "global_step": 87364, "epoch": 2080} {"train_loss": -6.257894515991211, "global_step": 87365, "epoch": 2080} {"train_loss": -6.245682716369629, "global_step": 87366, "epoch": 2080} {"train_loss": -6.203851699829102, "global_step": 87367, "epoch": 2080} {"train_loss": -6.161624431610107, "global_step": 87368, "epoch": 2080} {"train_loss": -6.225329399108887, "global_step": 87369, "epoch": 2080} {"train_loss": -6.207449913024902, "global_step": 87370, "epoch": 2080} {"train_loss": -6.2148847579956055, "global_step": 87371, "epoch": 2080} {"train_loss": -6.284767150878906, "global_step": 87372, "epoch": 2080} {"train_loss": -6.156486511230469, "global_step": 87373, "epoch": 2080} {"train_loss": -6.240821361541748, "global_step": 87374, "epoch": 2080} {"train_loss": -6.233154296875, "global_step": 87375, "epoch": 2080} {"train_loss": -6.210807800292969, "global_step": 87376, "epoch": 2080} {"train_loss": -6.1997528076171875, "global_step": 87377, "epoch": 2080} {"train_loss": -6.233058452606201, "global_step": 87378, "epoch": 2080} {"train_loss": -6.327337741851807, "global_step": 87379, "epoch": 2080} {"train_loss": -6.1474409103393555, "global_step": 87380, "epoch": 2080} {"train_loss": -6.192526817321777, "global_step": 87381, "epoch": 2080} {"train_loss": -6.298067092895508, "global_step": 87382, "epoch": 2080} {"train_loss": -6.1822004318237305, "global_step": 87383, "epoch": 2080} {"train_loss": -6.190253257751465, "global_step": 87384, "epoch": 2080} {"train_loss": -6.21660041809082, "global_step": 87385, "epoch": 2080} {"train_loss": -6.282858848571777, "global_step": 87386, "epoch": 2080} {"train_loss": -6.108141899108887, "global_step": 87387, "epoch": 2080} {"train_loss": -6.137874603271484, "global_step": 87388, "epoch": 2080} {"train_loss": -6.265012741088867, "global_step": 87389, "epoch": 2080} {"train_loss": -6.132784366607666, "global_step": 87390, "epoch": 2080} {"train_loss": -6.238694190979004, "global_step": 87391, "epoch": 2080} {"train_loss": -6.1762614250183105, "global_step": 87392, "epoch": 2080} {"train_loss": -6.130295753479004, "global_step": 87393, "epoch": 2080} {"train_loss": -6.197483062744141, "global_step": 87394, "epoch": 2080} {"train_loss": -6.366080284118652, "global_step": 87395, "epoch": 2080} {"train_loss": -6.347076416015625, "global_step": 87396, "epoch": 2080} {"train_loss": -6.170910835266113, "global_step": 87397, "epoch": 2080} {"train_loss": -6.18846321105957, "global_step": 87398, "epoch": 2080} {"train_loss": -6.2510199546813965, "global_step": 87399, "epoch": 2080} {"train_loss": -6.240612506866455, "global_step": 87400, "epoch": 2080} {"train_loss": -6.211480924061367, "global_step": 87401, "epoch": 2080, "val_loss": 63017.0} {"train_loss": -6.152059555053711, "global_step": 87402, "epoch": 2081} {"train_loss": -6.205496311187744, "global_step": 87403, "epoch": 2081} {"train_loss": -6.335740089416504, "global_step": 87404, "epoch": 2081} {"train_loss": -6.232666015625, "global_step": 87405, "epoch": 2081} {"train_loss": -6.247244358062744, "global_step": 87406, "epoch": 2081} {"train_loss": -6.38817834854126, "global_step": 87407, "epoch": 2081} {"train_loss": -6.114819526672363, "global_step": 87408, "epoch": 2081} {"train_loss": -6.250273704528809, "global_step": 87409, "epoch": 2081} {"train_loss": -6.235039710998535, "global_step": 87410, "epoch": 2081} {"train_loss": -6.1863250732421875, "global_step": 87411, "epoch": 2081} {"train_loss": -6.208134174346924, "global_step": 87412, "epoch": 2081} {"train_loss": -6.3052897453308105, "global_step": 87413, "epoch": 2081} {"train_loss": -6.121192932128906, "global_step": 87414, "epoch": 2081} {"train_loss": -6.12132453918457, "global_step": 87415, "epoch": 2081} {"train_loss": -6.167865753173828, "global_step": 87416, "epoch": 2081} {"train_loss": -6.084269046783447, "global_step": 87417, "epoch": 2081} {"train_loss": -6.059172630310059, "global_step": 87418, "epoch": 2081} {"train_loss": -6.217691421508789, "global_step": 87419, "epoch": 2081} {"train_loss": -6.190000534057617, "global_step": 87420, "epoch": 2081} {"train_loss": -6.201909065246582, "global_step": 87421, "epoch": 2081} {"train_loss": -6.059656143188477, "global_step": 87422, "epoch": 2081} {"train_loss": -6.18673849105835, "global_step": 87423, "epoch": 2081} {"train_loss": -6.2491865158081055, "global_step": 87424, "epoch": 2081} {"train_loss": -6.162294387817383, "global_step": 87425, "epoch": 2081} {"train_loss": -6.236451625823975, "global_step": 87426, "epoch": 2081} {"train_loss": -6.0949859619140625, "global_step": 87427, "epoch": 2081} {"train_loss": -6.218229293823242, "global_step": 87428, "epoch": 2081} {"train_loss": -6.184525489807129, "global_step": 87429, "epoch": 2081} {"train_loss": -6.203485488891602, "global_step": 87430, "epoch": 2081} {"train_loss": -6.246678352355957, "global_step": 87431, "epoch": 2081} {"train_loss": -6.199692726135254, "global_step": 87432, "epoch": 2081} {"train_loss": -6.234652042388916, "global_step": 87433, "epoch": 2081} {"train_loss": -6.302212238311768, "global_step": 87434, "epoch": 2081} {"train_loss": -6.1923041343688965, "global_step": 87435, "epoch": 2081} {"train_loss": -6.277403831481934, "global_step": 87436, "epoch": 2081} {"train_loss": -6.171786308288574, "global_step": 87437, "epoch": 2081} {"train_loss": -6.277367115020752, "global_step": 87438, "epoch": 2081} {"train_loss": -6.345833778381348, "global_step": 87439, "epoch": 2081} {"train_loss": -6.282585620880127, "global_step": 87440, "epoch": 2081} {"train_loss": -6.131930351257324, "global_step": 87441, "epoch": 2081} {"train_loss": -6.283633232116699, "global_step": 87442, "epoch": 2081} {"train_loss": -6.2109772477831156, "global_step": 87443, "epoch": 2081, "val_loss": 62769.11328125} {"train_loss": -6.334807395935059, "global_step": 87444, "epoch": 2082} {"train_loss": -6.1763811111450195, "global_step": 87445, "epoch": 2082} {"train_loss": -6.334405422210693, "global_step": 87446, "epoch": 2082} {"train_loss": -6.266186714172363, "global_step": 87447, "epoch": 2082} {"train_loss": -6.2270379066467285, "global_step": 87448, "epoch": 2082} {"train_loss": -6.266898155212402, "global_step": 87449, "epoch": 2082} {"train_loss": -6.2972869873046875, "global_step": 87450, "epoch": 2082} {"train_loss": -6.125904083251953, "global_step": 87451, "epoch": 2082} {"train_loss": -6.22228479385376, "global_step": 87452, "epoch": 2082} {"train_loss": -6.330509185791016, "global_step": 87453, "epoch": 2082} {"train_loss": -6.24603271484375, "global_step": 87454, "epoch": 2082} {"train_loss": -6.1932244300842285, "global_step": 87455, "epoch": 2082} {"train_loss": -6.184624671936035, "global_step": 87456, "epoch": 2082} {"train_loss": -6.09338903427124, "global_step": 87457, "epoch": 2082} {"train_loss": -6.11494255065918, "global_step": 87458, "epoch": 2082} {"train_loss": -6.225772380828857, "global_step": 87459, "epoch": 2082} {"train_loss": -6.001901626586914, "global_step": 87460, "epoch": 2082} {"train_loss": -6.173698425292969, "global_step": 87461, "epoch": 2082} {"train_loss": -6.292871475219727, "global_step": 87462, "epoch": 2082} {"train_loss": -6.15816593170166, "global_step": 87463, "epoch": 2082} {"train_loss": -6.178507328033447, "global_step": 87464, "epoch": 2082} {"train_loss": -6.114219665527344, "global_step": 87465, "epoch": 2082} {"train_loss": -6.241807460784912, "global_step": 87466, "epoch": 2082} {"train_loss": -6.238929748535156, "global_step": 87467, "epoch": 2082} {"train_loss": -6.155860424041748, "global_step": 87468, "epoch": 2082} {"train_loss": -6.162505149841309, "global_step": 87469, "epoch": 2082} {"train_loss": -6.213273048400879, "global_step": 87470, "epoch": 2082} {"train_loss": -6.276549339294434, "global_step": 87471, "epoch": 2082} {"train_loss": -6.23573112487793, "global_step": 87472, "epoch": 2082} {"train_loss": -6.24403715133667, "global_step": 87473, "epoch": 2082} {"train_loss": -6.326545715332031, "global_step": 87474, "epoch": 2082} {"train_loss": -6.170090198516846, "global_step": 87475, "epoch": 2082} {"train_loss": -6.232437610626221, "global_step": 87476, "epoch": 2082} {"train_loss": -6.2565765380859375, "global_step": 87477, "epoch": 2082} {"train_loss": -6.249867916107178, "global_step": 87478, "epoch": 2082} {"train_loss": -6.258544921875, "global_step": 87479, "epoch": 2082} {"train_loss": -6.137545108795166, "global_step": 87480, "epoch": 2082} {"train_loss": -6.310810089111328, "global_step": 87481, "epoch": 2082} {"train_loss": -6.294957637786865, "global_step": 87482, "epoch": 2082} {"train_loss": -6.141109466552734, "global_step": 87483, "epoch": 2082} {"train_loss": -6.200805187225342, "global_step": 87484, "epoch": 2082} {"train_loss": -6.219119571504139, "global_step": 87485, "epoch": 2082, "val_loss": 62663.6875} {"train_loss": -6.363226890563965, "global_step": 87486, "epoch": 2083} {"train_loss": -6.174470901489258, "global_step": 87487, "epoch": 2083} {"train_loss": -6.321450233459473, "global_step": 87488, "epoch": 2083} {"train_loss": -6.162595748901367, "global_step": 87489, "epoch": 2083} {"train_loss": -6.289915561676025, "global_step": 87490, "epoch": 2083} {"train_loss": -6.316976547241211, "global_step": 87491, "epoch": 2083} {"train_loss": -6.262925148010254, "global_step": 87492, "epoch": 2083} {"train_loss": -6.459364891052246, "global_step": 87493, "epoch": 2083} {"train_loss": -6.310518264770508, "global_step": 87494, "epoch": 2083} {"train_loss": -6.30303955078125, "global_step": 87495, "epoch": 2083} {"train_loss": -6.1769256591796875, "global_step": 87496, "epoch": 2083} {"train_loss": -6.194262981414795, "global_step": 87497, "epoch": 2083} {"train_loss": -6.265311241149902, "global_step": 87498, "epoch": 2083} {"train_loss": -6.373930931091309, "global_step": 87499, "epoch": 2083} {"train_loss": -6.272437572479248, "global_step": 87500, "epoch": 2083} {"train_loss": -6.225913047790527, "global_step": 87501, "epoch": 2083} {"train_loss": -6.260765075683594, "global_step": 87502, "epoch": 2083} {"train_loss": -6.261419296264648, "global_step": 87503, "epoch": 2083} {"train_loss": -6.272708892822266, "global_step": 87504, "epoch": 2083} {"train_loss": -6.266819000244141, "global_step": 87505, "epoch": 2083} {"train_loss": -6.275715351104736, "global_step": 87506, "epoch": 2083} {"train_loss": -6.366549491882324, "global_step": 87507, "epoch": 2083} {"train_loss": -6.166191101074219, "global_step": 87508, "epoch": 2083} {"train_loss": -6.376565933227539, "global_step": 87509, "epoch": 2083} {"train_loss": -6.2513885498046875, "global_step": 87510, "epoch": 2083} {"train_loss": -6.1629414558410645, "global_step": 87511, "epoch": 2083} {"train_loss": -6.307027339935303, "global_step": 87512, "epoch": 2083} {"train_loss": -6.2861785888671875, "global_step": 87513, "epoch": 2083} {"train_loss": -6.258447647094727, "global_step": 87514, "epoch": 2083} {"train_loss": -6.2410888671875, "global_step": 87515, "epoch": 2083} {"train_loss": -6.312507629394531, "global_step": 87516, "epoch": 2083} {"train_loss": -6.3020830154418945, "global_step": 87517, "epoch": 2083} {"train_loss": -6.242455959320068, "global_step": 87518, "epoch": 2083} {"train_loss": -6.058719635009766, "global_step": 87519, "epoch": 2083} {"train_loss": -6.265906810760498, "global_step": 87520, "epoch": 2083} {"train_loss": -6.326728820800781, "global_step": 87521, "epoch": 2083} {"train_loss": -6.293934345245361, "global_step": 87522, "epoch": 2083} {"train_loss": -6.271538257598877, "global_step": 87523, "epoch": 2083} {"train_loss": -6.319290637969971, "global_step": 87524, "epoch": 2083} {"train_loss": -6.196288108825684, "global_step": 87525, "epoch": 2083} {"train_loss": -6.351539611816406, "global_step": 87526, "epoch": 2083} {"train_loss": -6.273673886344547, "global_step": 87527, "epoch": 2083, "val_loss": 62773.24609375} {"train_loss": -6.080445766448975, "global_step": 87528, "epoch": 2084} {"train_loss": -6.197515487670898, "global_step": 87529, "epoch": 2084} {"train_loss": -6.296134948730469, "global_step": 87530, "epoch": 2084} {"train_loss": -6.287498474121094, "global_step": 87531, "epoch": 2084} {"train_loss": -6.167128086090088, "global_step": 87532, "epoch": 2084} {"train_loss": -6.169126987457275, "global_step": 87533, "epoch": 2084} {"train_loss": -6.259234428405762, "global_step": 87534, "epoch": 2084} {"train_loss": -6.236146450042725, "global_step": 87535, "epoch": 2084} {"train_loss": -6.098843097686768, "global_step": 87536, "epoch": 2084} {"train_loss": -6.283509731292725, "global_step": 87537, "epoch": 2084} {"train_loss": -6.149537086486816, "global_step": 87538, "epoch": 2084} {"train_loss": -6.149774074554443, "global_step": 87539, "epoch": 2084} {"train_loss": -6.100424766540527, "global_step": 87540, "epoch": 2084} {"train_loss": -6.093439102172852, "global_step": 87541, "epoch": 2084} {"train_loss": -6.280828475952148, "global_step": 87542, "epoch": 2084} {"train_loss": -6.119410991668701, "global_step": 87543, "epoch": 2084} {"train_loss": -6.267444133758545, "global_step": 87544, "epoch": 2084} {"train_loss": -6.147136688232422, "global_step": 87545, "epoch": 2084} {"train_loss": -6.2156147956848145, "global_step": 87546, "epoch": 2084} {"train_loss": -6.220137596130371, "global_step": 87547, "epoch": 2084} {"train_loss": -6.209585189819336, "global_step": 87548, "epoch": 2084} {"train_loss": -6.265108108520508, "global_step": 87549, "epoch": 2084} {"train_loss": -6.236965179443359, "global_step": 87550, "epoch": 2084} {"train_loss": -6.170481204986572, "global_step": 87551, "epoch": 2084} {"train_loss": -6.3321685791015625, "global_step": 87552, "epoch": 2084} {"train_loss": -6.24254035949707, "global_step": 87553, "epoch": 2084} {"train_loss": -6.317739009857178, "global_step": 87554, "epoch": 2084} {"train_loss": -6.218025207519531, "global_step": 87555, "epoch": 2084} {"train_loss": -6.264101982116699, "global_step": 87556, "epoch": 2084} {"train_loss": -6.366101264953613, "global_step": 87557, "epoch": 2084} {"train_loss": -6.302410125732422, "global_step": 87558, "epoch": 2084} {"train_loss": -6.2874250411987305, "global_step": 87559, "epoch": 2084} {"train_loss": -6.357916831970215, "global_step": 87560, "epoch": 2084} {"train_loss": -6.288635730743408, "global_step": 87561, "epoch": 2084} {"train_loss": -6.247443675994873, "global_step": 87562, "epoch": 2084} {"train_loss": -6.299238204956055, "global_step": 87563, "epoch": 2084} {"train_loss": -6.348896026611328, "global_step": 87564, "epoch": 2084} {"train_loss": -6.1887102127075195, "global_step": 87565, "epoch": 2084} {"train_loss": -6.242610454559326, "global_step": 87566, "epoch": 2084} {"train_loss": -6.344081401824951, "global_step": 87567, "epoch": 2084} {"train_loss": -6.341681480407715, "global_step": 87568, "epoch": 2084} {"train_loss": -6.233772482190814, "global_step": 87569, "epoch": 2084, "val_loss": 62711.5078125} {"train_loss": -6.275341510772705, "global_step": 87570, "epoch": 2085} {"train_loss": -6.298619747161865, "global_step": 87571, "epoch": 2085} {"train_loss": -6.246048927307129, "global_step": 87572, "epoch": 2085} {"train_loss": -6.310147285461426, "global_step": 87573, "epoch": 2085} {"train_loss": -6.3029937744140625, "global_step": 87574, "epoch": 2085} {"train_loss": -6.135281562805176, "global_step": 87575, "epoch": 2085} {"train_loss": -6.422444820404053, "global_step": 87576, "epoch": 2085} {"train_loss": -6.215405464172363, "global_step": 87577, "epoch": 2085} {"train_loss": -6.133829593658447, "global_step": 87578, "epoch": 2085} {"train_loss": -6.279585838317871, "global_step": 87579, "epoch": 2085} {"train_loss": -6.218449592590332, "global_step": 87580, "epoch": 2085} {"train_loss": -6.141894817352295, "global_step": 87581, "epoch": 2085} {"train_loss": -6.113125801086426, "global_step": 87582, "epoch": 2085} {"train_loss": -6.17913293838501, "global_step": 87583, "epoch": 2085} {"train_loss": -6.295938014984131, "global_step": 87584, "epoch": 2085} {"train_loss": -6.197296142578125, "global_step": 87585, "epoch": 2085} {"train_loss": -6.253061771392822, "global_step": 87586, "epoch": 2085} {"train_loss": -6.129976272583008, "global_step": 87587, "epoch": 2085} {"train_loss": -6.1495442390441895, "global_step": 87588, "epoch": 2085} {"train_loss": -6.187789440155029, "global_step": 87589, "epoch": 2085} {"train_loss": -6.072832107543945, "global_step": 87590, "epoch": 2085} {"train_loss": -6.217291831970215, "global_step": 87591, "epoch": 2085} {"train_loss": -6.169520378112793, "global_step": 87592, "epoch": 2085} {"train_loss": -6.391380310058594, "global_step": 87593, "epoch": 2085} {"train_loss": -6.242749214172363, "global_step": 87594, "epoch": 2085} {"train_loss": -6.060463905334473, "global_step": 87595, "epoch": 2085} {"train_loss": -6.252772331237793, "global_step": 87596, "epoch": 2085} {"train_loss": -6.15513801574707, "global_step": 87597, "epoch": 2085} {"train_loss": -6.230508327484131, "global_step": 87598, "epoch": 2085} {"train_loss": -6.166158676147461, "global_step": 87599, "epoch": 2085} {"train_loss": -6.257755756378174, "global_step": 87600, "epoch": 2085} {"train_loss": -6.300457954406738, "global_step": 87601, "epoch": 2085} {"train_loss": -6.218055248260498, "global_step": 87602, "epoch": 2085} {"train_loss": -6.295655250549316, "global_step": 87603, "epoch": 2085} {"train_loss": -6.27119779586792, "global_step": 87604, "epoch": 2085} {"train_loss": -6.19136381149292, "global_step": 87605, "epoch": 2085} {"train_loss": -6.29255485534668, "global_step": 87606, "epoch": 2085} {"train_loss": -6.285778999328613, "global_step": 87607, "epoch": 2085} {"train_loss": -6.22614860534668, "global_step": 87608, "epoch": 2085} {"train_loss": -6.188937664031982, "global_step": 87609, "epoch": 2085} {"train_loss": -6.261028289794922, "global_step": 87610, "epoch": 2085} {"train_loss": -6.225811629068284, "global_step": 87611, "epoch": 2085, "val_loss": 62990.546875} {"train_loss": -6.200566291809082, "global_step": 87612, "epoch": 2086} {"train_loss": -6.295764923095703, "global_step": 87613, "epoch": 2086} {"train_loss": -6.267749309539795, "global_step": 87614, "epoch": 2086} {"train_loss": -6.2432732582092285, "global_step": 87615, "epoch": 2086} {"train_loss": -6.329827308654785, "global_step": 87616, "epoch": 2086} {"train_loss": -6.248983383178711, "global_step": 87617, "epoch": 2086} {"train_loss": -6.277677059173584, "global_step": 87618, "epoch": 2086} {"train_loss": -6.303580284118652, "global_step": 87619, "epoch": 2086} {"train_loss": -6.363872528076172, "global_step": 87620, "epoch": 2086} {"train_loss": -6.2548418045043945, "global_step": 87621, "epoch": 2086} {"train_loss": -6.200386047363281, "global_step": 87622, "epoch": 2086} {"train_loss": -6.251384735107422, "global_step": 87623, "epoch": 2086} {"train_loss": -6.291794776916504, "global_step": 87624, "epoch": 2086} {"train_loss": -6.292027473449707, "global_step": 87625, "epoch": 2086} {"train_loss": -6.179163932800293, "global_step": 87626, "epoch": 2086} {"train_loss": -6.193612098693848, "global_step": 87627, "epoch": 2086} {"train_loss": -6.21995735168457, "global_step": 87628, "epoch": 2086} {"train_loss": -6.261017799377441, "global_step": 87629, "epoch": 2086} {"train_loss": -6.28961706161499, "global_step": 87630, "epoch": 2086} {"train_loss": -6.316886901855469, "global_step": 87631, "epoch": 2086} {"train_loss": -6.301760673522949, "global_step": 87632, "epoch": 2086} {"train_loss": -6.209527492523193, "global_step": 87633, "epoch": 2086} {"train_loss": -6.186483383178711, "global_step": 87634, "epoch": 2086} {"train_loss": -6.291908264160156, "global_step": 87635, "epoch": 2086} {"train_loss": -6.221083641052246, "global_step": 87636, "epoch": 2086} {"train_loss": -6.3216047286987305, "global_step": 87637, "epoch": 2086} {"train_loss": -6.205643177032471, "global_step": 87638, "epoch": 2086} {"train_loss": -6.266429424285889, "global_step": 87639, "epoch": 2086} {"train_loss": -6.065933704376221, "global_step": 87640, "epoch": 2086} {"train_loss": -6.352075576782227, "global_step": 87641, "epoch": 2086} {"train_loss": -6.279743194580078, "global_step": 87642, "epoch": 2086} {"train_loss": -6.225998878479004, "global_step": 87643, "epoch": 2086} {"train_loss": -6.165916919708252, "global_step": 87644, "epoch": 2086} {"train_loss": -6.24343204498291, "global_step": 87645, "epoch": 2086} {"train_loss": -6.193417549133301, "global_step": 87646, "epoch": 2086} {"train_loss": -6.175692558288574, "global_step": 87647, "epoch": 2086} {"train_loss": -6.227688789367676, "global_step": 87648, "epoch": 2086} {"train_loss": -6.309764385223389, "global_step": 87649, "epoch": 2086} {"train_loss": -6.236594200134277, "global_step": 87650, "epoch": 2086} {"train_loss": -6.176364898681641, "global_step": 87651, "epoch": 2086} {"train_loss": -6.229650497436523, "global_step": 87652, "epoch": 2086} {"train_loss": -6.245282888412476, "global_step": 87653, "epoch": 2086, "val_loss": 62978.97265625} {"train_loss": -6.327370643615723, "global_step": 87654, "epoch": 2087} {"train_loss": -6.157756328582764, "global_step": 87655, "epoch": 2087} {"train_loss": -6.251734733581543, "global_step": 87656, "epoch": 2087} {"train_loss": -6.257214069366455, "global_step": 87657, "epoch": 2087} {"train_loss": -6.262884140014648, "global_step": 87658, "epoch": 2087} {"train_loss": -6.364336013793945, "global_step": 87659, "epoch": 2087} {"train_loss": -6.37471866607666, "global_step": 87660, "epoch": 2087} {"train_loss": -6.270491600036621, "global_step": 87661, "epoch": 2087} {"train_loss": -6.26738166809082, "global_step": 87662, "epoch": 2087} {"train_loss": -6.238266944885254, "global_step": 87663, "epoch": 2087} {"train_loss": -6.249265193939209, "global_step": 87664, "epoch": 2087} {"train_loss": -6.1368207931518555, "global_step": 87665, "epoch": 2087} {"train_loss": -6.208197593688965, "global_step": 87666, "epoch": 2087} {"train_loss": -6.268962860107422, "global_step": 87667, "epoch": 2087} {"train_loss": -6.217967510223389, "global_step": 87668, "epoch": 2087} {"train_loss": -6.347774505615234, "global_step": 87669, "epoch": 2087} {"train_loss": -6.129863739013672, "global_step": 87670, "epoch": 2087} {"train_loss": -6.260095596313477, "global_step": 87671, "epoch": 2087} {"train_loss": -6.186601638793945, "global_step": 87672, "epoch": 2087} {"train_loss": -6.15300178527832, "global_step": 87673, "epoch": 2087} {"train_loss": -6.280399322509766, "global_step": 87674, "epoch": 2087} {"train_loss": -6.107398986816406, "global_step": 87675, "epoch": 2087} {"train_loss": -6.1519036293029785, "global_step": 87676, "epoch": 2087} {"train_loss": -6.238792419433594, "global_step": 87677, "epoch": 2087} {"train_loss": -6.1476850509643555, "global_step": 87678, "epoch": 2087} {"train_loss": -6.152298450469971, "global_step": 87679, "epoch": 2087} {"train_loss": -6.162663459777832, "global_step": 87680, "epoch": 2087} {"train_loss": -6.269650936126709, "global_step": 87681, "epoch": 2087} {"train_loss": -6.294416427612305, "global_step": 87682, "epoch": 2087} {"train_loss": -6.117707252502441, "global_step": 87683, "epoch": 2087} {"train_loss": -6.266252517700195, "global_step": 87684, "epoch": 2087} {"train_loss": -6.2399749755859375, "global_step": 87685, "epoch": 2087} {"train_loss": -6.104538917541504, "global_step": 87686, "epoch": 2087} {"train_loss": -6.256971836090088, "global_step": 87687, "epoch": 2087} {"train_loss": -6.3079047203063965, "global_step": 87688, "epoch": 2087} {"train_loss": -6.190298080444336, "global_step": 87689, "epoch": 2087} {"train_loss": -6.187744140625, "global_step": 87690, "epoch": 2087} {"train_loss": -6.18005895614624, "global_step": 87691, "epoch": 2087} {"train_loss": -6.107479095458984, "global_step": 87692, "epoch": 2087} {"train_loss": -6.205639839172363, "global_step": 87693, "epoch": 2087} {"train_loss": -6.27036190032959, "global_step": 87694, "epoch": 2087} {"train_loss": -6.224226917539324, "global_step": 87695, "epoch": 2087, "val_loss": 62721.6328125} {"train_loss": -6.283841133117676, "global_step": 87696, "epoch": 2088} {"train_loss": -6.263206481933594, "global_step": 87697, "epoch": 2088} {"train_loss": -6.225431442260742, "global_step": 87698, "epoch": 2088} {"train_loss": -6.185795307159424, "global_step": 87699, "epoch": 2088} {"train_loss": -6.225261688232422, "global_step": 87700, "epoch": 2088} {"train_loss": -6.161245822906494, "global_step": 87701, "epoch": 2088} {"train_loss": -6.152708053588867, "global_step": 87702, "epoch": 2088} {"train_loss": -6.158447265625, "global_step": 87703, "epoch": 2088} {"train_loss": -6.104937553405762, "global_step": 87704, "epoch": 2088} {"train_loss": -6.256165504455566, "global_step": 87705, "epoch": 2088} {"train_loss": -6.077096939086914, "global_step": 87706, "epoch": 2088} {"train_loss": -6.2036452293396, "global_step": 87707, "epoch": 2088} {"train_loss": -6.084335803985596, "global_step": 87708, "epoch": 2088} {"train_loss": -6.133164882659912, "global_step": 87709, "epoch": 2088} {"train_loss": -6.234328746795654, "global_step": 87710, "epoch": 2088} {"train_loss": -6.181840419769287, "global_step": 87711, "epoch": 2088} {"train_loss": -6.087191581726074, "global_step": 87712, "epoch": 2088} {"train_loss": -6.299145698547363, "global_step": 87713, "epoch": 2088} {"train_loss": -6.324593544006348, "global_step": 87714, "epoch": 2088} {"train_loss": -6.163808345794678, "global_step": 87715, "epoch": 2088} {"train_loss": -6.221512794494629, "global_step": 87716, "epoch": 2088} {"train_loss": -6.141502857208252, "global_step": 87717, "epoch": 2088} {"train_loss": -6.18369197845459, "global_step": 87718, "epoch": 2088} {"train_loss": -6.148716926574707, "global_step": 87719, "epoch": 2088} {"train_loss": -6.3161845207214355, "global_step": 87720, "epoch": 2088} {"train_loss": -6.212806701660156, "global_step": 87721, "epoch": 2088} {"train_loss": -6.230830192565918, "global_step": 87722, "epoch": 2088} {"train_loss": -6.1399922370910645, "global_step": 87723, "epoch": 2088} {"train_loss": -6.212601661682129, "global_step": 87724, "epoch": 2088} {"train_loss": -6.364058494567871, "global_step": 87725, "epoch": 2088} {"train_loss": -6.267991065979004, "global_step": 87726, "epoch": 2088} {"train_loss": -6.365473747253418, "global_step": 87727, "epoch": 2088} {"train_loss": -6.228534698486328, "global_step": 87728, "epoch": 2088} {"train_loss": -6.257163047790527, "global_step": 87729, "epoch": 2088} {"train_loss": -6.212256908416748, "global_step": 87730, "epoch": 2088} {"train_loss": -6.1707940101623535, "global_step": 87731, "epoch": 2088} {"train_loss": -6.112668991088867, "global_step": 87732, "epoch": 2088} {"train_loss": -6.1985931396484375, "global_step": 87733, "epoch": 2088} {"train_loss": -6.283239364624023, "global_step": 87734, "epoch": 2088} {"train_loss": -6.213763236999512, "global_step": 87735, "epoch": 2088} {"train_loss": -6.191512107849121, "global_step": 87736, "epoch": 2088} {"train_loss": -6.202911274773734, "global_step": 87737, "epoch": 2088, "val_loss": 62966.87890625} {"train_loss": -6.239529609680176, "global_step": 87738, "epoch": 2089} {"train_loss": -6.19156551361084, "global_step": 87739, "epoch": 2089} {"train_loss": -6.163282871246338, "global_step": 87740, "epoch": 2089} {"train_loss": -6.32710599899292, "global_step": 87741, "epoch": 2089} {"train_loss": -6.169658660888672, "global_step": 87742, "epoch": 2089} {"train_loss": -6.279714584350586, "global_step": 87743, "epoch": 2089} {"train_loss": -6.219669818878174, "global_step": 87744, "epoch": 2089} {"train_loss": -6.30035400390625, "global_step": 87745, "epoch": 2089} {"train_loss": -6.236616611480713, "global_step": 87746, "epoch": 2089} {"train_loss": -6.229655742645264, "global_step": 87747, "epoch": 2089} {"train_loss": -6.2522149085998535, "global_step": 87748, "epoch": 2089} {"train_loss": -6.2906951904296875, "global_step": 87749, "epoch": 2089} {"train_loss": -6.259076118469238, "global_step": 87750, "epoch": 2089} {"train_loss": -6.2301836013793945, "global_step": 87751, "epoch": 2089} {"train_loss": -6.3222527503967285, "global_step": 87752, "epoch": 2089} {"train_loss": -6.16602897644043, "global_step": 87753, "epoch": 2089} {"train_loss": -6.189830780029297, "global_step": 87754, "epoch": 2089} {"train_loss": -6.154689788818359, "global_step": 87755, "epoch": 2089} {"train_loss": -6.284562110900879, "global_step": 87756, "epoch": 2089} {"train_loss": -6.245888710021973, "global_step": 87757, "epoch": 2089} {"train_loss": -6.251221179962158, "global_step": 87758, "epoch": 2089} {"train_loss": -6.157501220703125, "global_step": 87759, "epoch": 2089} {"train_loss": -6.220275402069092, "global_step": 87760, "epoch": 2089} {"train_loss": -6.286725997924805, "global_step": 87761, "epoch": 2089} {"train_loss": -6.291681289672852, "global_step": 87762, "epoch": 2089} {"train_loss": -6.25115442276001, "global_step": 87763, "epoch": 2089} {"train_loss": -6.244246482849121, "global_step": 87764, "epoch": 2089} {"train_loss": -6.141197681427002, "global_step": 87765, "epoch": 2089} {"train_loss": -6.3567585945129395, "global_step": 87766, "epoch": 2089} {"train_loss": -6.2655463218688965, "global_step": 87767, "epoch": 2089} {"train_loss": -6.313836574554443, "global_step": 87768, "epoch": 2089} {"train_loss": -6.225282669067383, "global_step": 87769, "epoch": 2089} {"train_loss": -6.178074836730957, "global_step": 87770, "epoch": 2089} {"train_loss": -6.24493932723999, "global_step": 87771, "epoch": 2089} {"train_loss": -6.233729362487793, "global_step": 87772, "epoch": 2089} {"train_loss": -6.263771057128906, "global_step": 87773, "epoch": 2089} {"train_loss": -6.180476665496826, "global_step": 87774, "epoch": 2089} {"train_loss": -6.209882736206055, "global_step": 87775, "epoch": 2089} {"train_loss": -6.416465759277344, "global_step": 87776, "epoch": 2089} {"train_loss": -6.198546409606934, "global_step": 87777, "epoch": 2089} {"train_loss": -6.146143436431885, "global_step": 87778, "epoch": 2089} {"train_loss": -6.24085259437561, "global_step": 87779, "epoch": 2089, "val_loss": 63120.18359375} {"train_loss": -6.0999274253845215, "global_step": 87780, "epoch": 2090} {"train_loss": -6.232851505279541, "global_step": 87781, "epoch": 2090} {"train_loss": -6.1886701583862305, "global_step": 87782, "epoch": 2090} {"train_loss": -6.112605571746826, "global_step": 87783, "epoch": 2090} {"train_loss": -6.262314796447754, "global_step": 87784, "epoch": 2090} {"train_loss": -6.2908172607421875, "global_step": 87785, "epoch": 2090} {"train_loss": -6.177102565765381, "global_step": 87786, "epoch": 2090} {"train_loss": -6.349893569946289, "global_step": 87787, "epoch": 2090} {"train_loss": -6.247659683227539, "global_step": 87788, "epoch": 2090} {"train_loss": -6.369598388671875, "global_step": 87789, "epoch": 2090} {"train_loss": -6.188380718231201, "global_step": 87790, "epoch": 2090} {"train_loss": -6.065953731536865, "global_step": 87791, "epoch": 2090} {"train_loss": -6.1178388595581055, "global_step": 87792, "epoch": 2090} {"train_loss": -6.2821044921875, "global_step": 87793, "epoch": 2090} {"train_loss": -6.135194778442383, "global_step": 87794, "epoch": 2090} {"train_loss": -6.2663397789001465, "global_step": 87795, "epoch": 2090} {"train_loss": -6.110722541809082, "global_step": 87796, "epoch": 2090} {"train_loss": -6.187023162841797, "global_step": 87797, "epoch": 2090} {"train_loss": -6.187177658081055, "global_step": 87798, "epoch": 2090} {"train_loss": -6.144629955291748, "global_step": 87799, "epoch": 2090} {"train_loss": -6.168160438537598, "global_step": 87800, "epoch": 2090} {"train_loss": -6.124082565307617, "global_step": 87801, "epoch": 2090} {"train_loss": -6.278313636779785, "global_step": 87802, "epoch": 2090} {"train_loss": -6.167746067047119, "global_step": 87803, "epoch": 2090} {"train_loss": -6.162954807281494, "global_step": 87804, "epoch": 2090} {"train_loss": -6.065154075622559, "global_step": 87805, "epoch": 2090} {"train_loss": -6.390746116638184, "global_step": 87806, "epoch": 2090} {"train_loss": -6.221154689788818, "global_step": 87807, "epoch": 2090} {"train_loss": -6.322708606719971, "global_step": 87808, "epoch": 2090} {"train_loss": -6.2526445388793945, "global_step": 87809, "epoch": 2090} {"train_loss": -6.357882976531982, "global_step": 87810, "epoch": 2090} {"train_loss": -6.315135478973389, "global_step": 87811, "epoch": 2090} {"train_loss": -6.331664562225342, "global_step": 87812, "epoch": 2090} {"train_loss": -6.168536186218262, "global_step": 87813, "epoch": 2090} {"train_loss": -6.261292457580566, "global_step": 87814, "epoch": 2090} {"train_loss": -6.235708236694336, "global_step": 87815, "epoch": 2090} {"train_loss": -6.242110252380371, "global_step": 87816, "epoch": 2090} {"train_loss": -6.319982528686523, "global_step": 87817, "epoch": 2090} {"train_loss": -6.196403503417969, "global_step": 87818, "epoch": 2090} {"train_loss": -6.22232723236084, "global_step": 87819, "epoch": 2090} {"train_loss": -6.2093963623046875, "global_step": 87820, "epoch": 2090} {"train_loss": -6.21991955666315, "global_step": 87821, "epoch": 2090, "val_loss": 63154.640625} {"train_loss": -6.293524742126465, "global_step": 87822, "epoch": 2091} {"train_loss": -6.215163230895996, "global_step": 87823, "epoch": 2091} {"train_loss": -6.189889907836914, "global_step": 87824, "epoch": 2091} {"train_loss": -6.2642621994018555, "global_step": 87825, "epoch": 2091} {"train_loss": -6.17324161529541, "global_step": 87826, "epoch": 2091} {"train_loss": -6.29168701171875, "global_step": 87827, "epoch": 2091} {"train_loss": -6.244781494140625, "global_step": 87828, "epoch": 2091} {"train_loss": -6.221693515777588, "global_step": 87829, "epoch": 2091} {"train_loss": -6.333374977111816, "global_step": 87830, "epoch": 2091} {"train_loss": -6.193375587463379, "global_step": 87831, "epoch": 2091} {"train_loss": -6.345126628875732, "global_step": 87832, "epoch": 2091} {"train_loss": -6.179012775421143, "global_step": 87833, "epoch": 2091} {"train_loss": -6.141418933868408, "global_step": 87834, "epoch": 2091} {"train_loss": -6.215860366821289, "global_step": 87835, "epoch": 2091} {"train_loss": -6.217693328857422, "global_step": 87836, "epoch": 2091} {"train_loss": -6.265429496765137, "global_step": 87837, "epoch": 2091} {"train_loss": -6.292780876159668, "global_step": 87838, "epoch": 2091} {"train_loss": -6.129145622253418, "global_step": 87839, "epoch": 2091} {"train_loss": -6.254889488220215, "global_step": 87840, "epoch": 2091} {"train_loss": -6.24049186706543, "global_step": 87841, "epoch": 2091} {"train_loss": -6.199105739593506, "global_step": 87842, "epoch": 2091} {"train_loss": -6.287075996398926, "global_step": 87843, "epoch": 2091} {"train_loss": -6.314306259155273, "global_step": 87844, "epoch": 2091} {"train_loss": -6.206479072570801, "global_step": 87845, "epoch": 2091} {"train_loss": -6.232194900512695, "global_step": 87846, "epoch": 2091} {"train_loss": -6.105558395385742, "global_step": 87847, "epoch": 2091} {"train_loss": -6.128816604614258, "global_step": 87848, "epoch": 2091} {"train_loss": -6.2567901611328125, "global_step": 87849, "epoch": 2091} {"train_loss": -6.122831344604492, "global_step": 87850, "epoch": 2091} {"train_loss": -6.2532806396484375, "global_step": 87851, "epoch": 2091} {"train_loss": -6.16309928894043, "global_step": 87852, "epoch": 2091} {"train_loss": -6.154824256896973, "global_step": 87853, "epoch": 2091} {"train_loss": -6.300532341003418, "global_step": 87854, "epoch": 2091} {"train_loss": -6.217748641967773, "global_step": 87855, "epoch": 2091} {"train_loss": -6.228734970092773, "global_step": 87856, "epoch": 2091} {"train_loss": -6.31231164932251, "global_step": 87857, "epoch": 2091} {"train_loss": -6.288405418395996, "global_step": 87858, "epoch": 2091} {"train_loss": -6.3059186935424805, "global_step": 87859, "epoch": 2091} {"train_loss": -6.198789596557617, "global_step": 87860, "epoch": 2091} {"train_loss": -6.250856399536133, "global_step": 87861, "epoch": 2091} {"train_loss": -6.118365287780762, "global_step": 87862, "epoch": 2091} {"train_loss": -6.22792861575172, "global_step": 87863, "epoch": 2091, "val_loss": 62923.63671875} {"train_loss": -6.315584182739258, "global_step": 87864, "epoch": 2092} {"train_loss": -6.197679042816162, "global_step": 87865, "epoch": 2092} {"train_loss": -6.269530296325684, "global_step": 87866, "epoch": 2092} {"train_loss": -6.146946907043457, "global_step": 87867, "epoch": 2092} {"train_loss": -6.174991607666016, "global_step": 87868, "epoch": 2092} {"train_loss": -6.252843379974365, "global_step": 87869, "epoch": 2092} {"train_loss": -6.182070732116699, "global_step": 87870, "epoch": 2092} {"train_loss": -6.170299053192139, "global_step": 87871, "epoch": 2092} {"train_loss": -6.156724452972412, "global_step": 87872, "epoch": 2092} {"train_loss": -6.119224548339844, "global_step": 87873, "epoch": 2092} {"train_loss": -6.114250183105469, "global_step": 87874, "epoch": 2092} {"train_loss": -6.186847686767578, "global_step": 87875, "epoch": 2092} {"train_loss": -6.038369178771973, "global_step": 87876, "epoch": 2092} {"train_loss": -6.234527587890625, "global_step": 87877, "epoch": 2092} {"train_loss": -6.3771586418151855, "global_step": 87878, "epoch": 2092} {"train_loss": -6.167809009552002, "global_step": 87879, "epoch": 2092} {"train_loss": -6.2419633865356445, "global_step": 87880, "epoch": 2092} {"train_loss": -6.16817045211792, "global_step": 87881, "epoch": 2092} {"train_loss": -6.219674587249756, "global_step": 87882, "epoch": 2092} {"train_loss": -6.230101585388184, "global_step": 87883, "epoch": 2092} {"train_loss": -6.2024126052856445, "global_step": 87884, "epoch": 2092} {"train_loss": -6.2003092765808105, "global_step": 87885, "epoch": 2092} {"train_loss": -5.999399662017822, "global_step": 87886, "epoch": 2092} {"train_loss": -6.2157416343688965, "global_step": 87887, "epoch": 2092} {"train_loss": -6.106889724731445, "global_step": 87888, "epoch": 2092} {"train_loss": -6.089914798736572, "global_step": 87889, "epoch": 2092} {"train_loss": -6.193221092224121, "global_step": 87890, "epoch": 2092} {"train_loss": -6.21630334854126, "global_step": 87891, "epoch": 2092} {"train_loss": -6.272129535675049, "global_step": 87892, "epoch": 2092} {"train_loss": -6.095653533935547, "global_step": 87893, "epoch": 2092} {"train_loss": -6.207840919494629, "global_step": 87894, "epoch": 2092} {"train_loss": -6.280407905578613, "global_step": 87895, "epoch": 2092} {"train_loss": -6.277007102966309, "global_step": 87896, "epoch": 2092} {"train_loss": -6.283880710601807, "global_step": 87897, "epoch": 2092} {"train_loss": -6.202767848968506, "global_step": 87898, "epoch": 2092} {"train_loss": -6.289853096008301, "global_step": 87899, "epoch": 2092} {"train_loss": -6.258913040161133, "global_step": 87900, "epoch": 2092} {"train_loss": -6.294379234313965, "global_step": 87901, "epoch": 2092} {"train_loss": -6.218256950378418, "global_step": 87902, "epoch": 2092} {"train_loss": -6.217942237854004, "global_step": 87903, "epoch": 2092} {"train_loss": -6.265005588531494, "global_step": 87904, "epoch": 2092} {"train_loss": -6.204467909676688, "global_step": 87905, "epoch": 2092, "val_loss": 63012.109375} {"train_loss": -6.1839189529418945, "global_step": 87906, "epoch": 2093} {"train_loss": -6.206735134124756, "global_step": 87907, "epoch": 2093} {"train_loss": -6.285155296325684, "global_step": 87908, "epoch": 2093} {"train_loss": -6.251537799835205, "global_step": 87909, "epoch": 2093} {"train_loss": -6.252650737762451, "global_step": 87910, "epoch": 2093} {"train_loss": -6.210254669189453, "global_step": 87911, "epoch": 2093} {"train_loss": -6.264335632324219, "global_step": 87912, "epoch": 2093} {"train_loss": -6.134825229644775, "global_step": 87913, "epoch": 2093} {"train_loss": -6.3030548095703125, "global_step": 87914, "epoch": 2093} {"train_loss": -6.344878673553467, "global_step": 87915, "epoch": 2093} {"train_loss": -6.094726085662842, "global_step": 87916, "epoch": 2093} {"train_loss": -6.222973823547363, "global_step": 87917, "epoch": 2093} {"train_loss": -6.3191328048706055, "global_step": 87918, "epoch": 2093} {"train_loss": -6.243127822875977, "global_step": 87919, "epoch": 2093} {"train_loss": -6.243864059448242, "global_step": 87920, "epoch": 2093} {"train_loss": -6.389372825622559, "global_step": 87921, "epoch": 2093} {"train_loss": -6.145963668823242, "global_step": 87922, "epoch": 2093} {"train_loss": -6.23328971862793, "global_step": 87923, "epoch": 2093} {"train_loss": -6.202475070953369, "global_step": 87924, "epoch": 2093} {"train_loss": -6.3724212646484375, "global_step": 87925, "epoch": 2093} {"train_loss": -6.200967311859131, "global_step": 87926, "epoch": 2093} {"train_loss": -6.279242038726807, "global_step": 87927, "epoch": 2093} {"train_loss": -6.206250190734863, "global_step": 87928, "epoch": 2093} {"train_loss": -6.217400550842285, "global_step": 87929, "epoch": 2093} {"train_loss": -6.202455520629883, "global_step": 87930, "epoch": 2093} {"train_loss": -6.20539665222168, "global_step": 87931, "epoch": 2093} {"train_loss": -6.239136695861816, "global_step": 87932, "epoch": 2093} {"train_loss": -6.250028133392334, "global_step": 87933, "epoch": 2093} {"train_loss": -6.226334571838379, "global_step": 87934, "epoch": 2093} {"train_loss": -6.157217979431152, "global_step": 87935, "epoch": 2093} {"train_loss": -6.08442497253418, "global_step": 87936, "epoch": 2093} {"train_loss": -6.246668815612793, "global_step": 87937, "epoch": 2093} {"train_loss": -6.1628522872924805, "global_step": 87938, "epoch": 2093} {"train_loss": -6.208980560302734, "global_step": 87939, "epoch": 2093} {"train_loss": -6.239377498626709, "global_step": 87940, "epoch": 2093} {"train_loss": -6.190143585205078, "global_step": 87941, "epoch": 2093} {"train_loss": -6.280055046081543, "global_step": 87942, "epoch": 2093} {"train_loss": -6.291023254394531, "global_step": 87943, "epoch": 2093} {"train_loss": -6.296566963195801, "global_step": 87944, "epoch": 2093} {"train_loss": -6.27459716796875, "global_step": 87945, "epoch": 2093} {"train_loss": -6.169971466064453, "global_step": 87946, "epoch": 2093} {"train_loss": -6.2283489136468795, "global_step": 87947, "epoch": 2093, "val_loss": 62789.703125} {"train_loss": -6.253484725952148, "global_step": 87948, "epoch": 2094} {"train_loss": -6.228742599487305, "global_step": 87949, "epoch": 2094} {"train_loss": -6.25297212600708, "global_step": 87950, "epoch": 2094} {"train_loss": -6.254373550415039, "global_step": 87951, "epoch": 2094} {"train_loss": -6.26076078414917, "global_step": 87952, "epoch": 2094} {"train_loss": -6.124734878540039, "global_step": 87953, "epoch": 2094} {"train_loss": -6.2158284187316895, "global_step": 87954, "epoch": 2094} {"train_loss": -6.352133750915527, "global_step": 87955, "epoch": 2094} {"train_loss": -6.221183776855469, "global_step": 87956, "epoch": 2094} {"train_loss": -6.166629791259766, "global_step": 87957, "epoch": 2094} {"train_loss": -6.080969333648682, "global_step": 87958, "epoch": 2094} {"train_loss": -6.214015960693359, "global_step": 87959, "epoch": 2094} {"train_loss": -6.271369457244873, "global_step": 87960, "epoch": 2094} {"train_loss": -6.249073505401611, "global_step": 87961, "epoch": 2094} {"train_loss": -6.242888450622559, "global_step": 87962, "epoch": 2094} {"train_loss": -6.226284980773926, "global_step": 87963, "epoch": 2094} {"train_loss": -6.1973748207092285, "global_step": 87964, "epoch": 2094} {"train_loss": -6.2946696281433105, "global_step": 87965, "epoch": 2094} {"train_loss": -6.24721097946167, "global_step": 87966, "epoch": 2094} {"train_loss": -6.259144306182861, "global_step": 87967, "epoch": 2094} {"train_loss": -6.258823394775391, "global_step": 87968, "epoch": 2094} {"train_loss": -6.261976718902588, "global_step": 87969, "epoch": 2094} {"train_loss": -6.249075889587402, "global_step": 87970, "epoch": 2094} {"train_loss": -6.247244834899902, "global_step": 87971, "epoch": 2094} {"train_loss": -6.296469688415527, "global_step": 87972, "epoch": 2094} {"train_loss": -6.3345160484313965, "global_step": 87973, "epoch": 2094} {"train_loss": -6.192049026489258, "global_step": 87974, "epoch": 2094} {"train_loss": -6.254579544067383, "global_step": 87975, "epoch": 2094} {"train_loss": -6.215017318725586, "global_step": 87976, "epoch": 2094} {"train_loss": -6.301965236663818, "global_step": 87977, "epoch": 2094} {"train_loss": -6.185758590698242, "global_step": 87978, "epoch": 2094} {"train_loss": -6.220925331115723, "global_step": 87979, "epoch": 2094} {"train_loss": -6.223625183105469, "global_step": 87980, "epoch": 2094} {"train_loss": -6.244075775146484, "global_step": 87981, "epoch": 2094} {"train_loss": -6.338578224182129, "global_step": 87982, "epoch": 2094} {"train_loss": -6.248739242553711, "global_step": 87983, "epoch": 2094} {"train_loss": -6.134549140930176, "global_step": 87984, "epoch": 2094} {"train_loss": -6.130422115325928, "global_step": 87985, "epoch": 2094} {"train_loss": -6.073726177215576, "global_step": 87986, "epoch": 2094} {"train_loss": -6.194327354431152, "global_step": 87987, "epoch": 2094} {"train_loss": -6.1198320388793945, "global_step": 87988, "epoch": 2094} {"train_loss": -6.23106913339524, "global_step": 87989, "epoch": 2094, "val_loss": 62900.44921875} {"train_loss": -6.192843437194824, "global_step": 87990, "epoch": 2095} {"train_loss": -6.2293524742126465, "global_step": 87991, "epoch": 2095} {"train_loss": -6.310677528381348, "global_step": 87992, "epoch": 2095} {"train_loss": -6.207437992095947, "global_step": 87993, "epoch": 2095} {"train_loss": -6.312094211578369, "global_step": 87994, "epoch": 2095} {"train_loss": -6.172098159790039, "global_step": 87995, "epoch": 2095} {"train_loss": -6.2028489112854, "global_step": 87996, "epoch": 2095} {"train_loss": -6.196254730224609, "global_step": 87997, "epoch": 2095} {"train_loss": -6.158213138580322, "global_step": 87998, "epoch": 2095} {"train_loss": -6.125268936157227, "global_step": 87999, "epoch": 2095} {"train_loss": -6.1556830406188965, "global_step": 88000, "epoch": 2095} {"train_loss": -6.2052507400512695, "global_step": 88001, "epoch": 2095} {"train_loss": -6.31710147857666, "global_step": 88002, "epoch": 2095} {"train_loss": -6.18656063079834, "global_step": 88003, "epoch": 2095} {"train_loss": -6.206693649291992, "global_step": 88004, "epoch": 2095} {"train_loss": -6.17429256439209, "global_step": 88005, "epoch": 2095} {"train_loss": -6.182986259460449, "global_step": 88006, "epoch": 2095} {"train_loss": -6.173833847045898, "global_step": 88007, "epoch": 2095} {"train_loss": -6.168487071990967, "global_step": 88008, "epoch": 2095} {"train_loss": -6.199304580688477, "global_step": 88009, "epoch": 2095} {"train_loss": -6.192140102386475, "global_step": 88010, "epoch": 2095} {"train_loss": -6.394231796264648, "global_step": 88011, "epoch": 2095} {"train_loss": -6.221043109893799, "global_step": 88012, "epoch": 2095} {"train_loss": -6.32531213760376, "global_step": 88013, "epoch": 2095} {"train_loss": -6.261409759521484, "global_step": 88014, "epoch": 2095} {"train_loss": -6.269364356994629, "global_step": 88015, "epoch": 2095} {"train_loss": -6.232341289520264, "global_step": 88016, "epoch": 2095} {"train_loss": -6.23846435546875, "global_step": 88017, "epoch": 2095} {"train_loss": -6.295398712158203, "global_step": 88018, "epoch": 2095} {"train_loss": -6.277540683746338, "global_step": 88019, "epoch": 2095} {"train_loss": -6.166396617889404, "global_step": 88020, "epoch": 2095} {"train_loss": -6.176009178161621, "global_step": 88021, "epoch": 2095} {"train_loss": -6.227968215942383, "global_step": 88022, "epoch": 2095} {"train_loss": -6.238200664520264, "global_step": 88023, "epoch": 2095} {"train_loss": -6.251782417297363, "global_step": 88024, "epoch": 2095} {"train_loss": -6.276432514190674, "global_step": 88025, "epoch": 2095} {"train_loss": -6.37894344329834, "global_step": 88026, "epoch": 2095} {"train_loss": -6.137843132019043, "global_step": 88027, "epoch": 2095} {"train_loss": -6.051060199737549, "global_step": 88028, "epoch": 2095} {"train_loss": -6.198125839233398, "global_step": 88029, "epoch": 2095} {"train_loss": -6.1773905754089355, "global_step": 88030, "epoch": 2095} {"train_loss": -6.220284768513271, "global_step": 88031, "epoch": 2095, "val_loss": 63155.49609375} {"train_loss": -6.33804178237915, "global_step": 88032, "epoch": 2096} {"train_loss": -6.185910701751709, "global_step": 88033, "epoch": 2096} {"train_loss": -6.239684581756592, "global_step": 88034, "epoch": 2096} {"train_loss": -6.310094833374023, "global_step": 88035, "epoch": 2096} {"train_loss": -6.219518184661865, "global_step": 88036, "epoch": 2096} {"train_loss": -6.14162540435791, "global_step": 88037, "epoch": 2096} {"train_loss": -6.175846576690674, "global_step": 88038, "epoch": 2096} {"train_loss": -6.144061088562012, "global_step": 88039, "epoch": 2096} {"train_loss": -6.205664157867432, "global_step": 88040, "epoch": 2096} {"train_loss": -6.302735328674316, "global_step": 88041, "epoch": 2096} {"train_loss": -6.147351264953613, "global_step": 88042, "epoch": 2096} {"train_loss": -6.09237003326416, "global_step": 88043, "epoch": 2096} {"train_loss": -6.1763434410095215, "global_step": 88044, "epoch": 2096} {"train_loss": -6.068596839904785, "global_step": 88045, "epoch": 2096} {"train_loss": -6.227090835571289, "global_step": 88046, "epoch": 2096} {"train_loss": -6.22398567199707, "global_step": 88047, "epoch": 2096} {"train_loss": -6.121176719665527, "global_step": 88048, "epoch": 2096} {"train_loss": -6.121427536010742, "global_step": 88049, "epoch": 2096} {"train_loss": -6.287168979644775, "global_step": 88050, "epoch": 2096} {"train_loss": -6.2029523849487305, "global_step": 88051, "epoch": 2096} {"train_loss": -6.097003936767578, "global_step": 88052, "epoch": 2096} {"train_loss": -6.275607109069824, "global_step": 88053, "epoch": 2096} {"train_loss": -6.077068328857422, "global_step": 88054, "epoch": 2096} {"train_loss": -6.201773643493652, "global_step": 88055, "epoch": 2096} {"train_loss": -6.178658485412598, "global_step": 88056, "epoch": 2096} {"train_loss": -6.167447090148926, "global_step": 88057, "epoch": 2096} {"train_loss": -6.2297515869140625, "global_step": 88058, "epoch": 2096} {"train_loss": -6.270375728607178, "global_step": 88059, "epoch": 2096} {"train_loss": -6.253912925720215, "global_step": 88060, "epoch": 2096} {"train_loss": -6.220664024353027, "global_step": 88061, "epoch": 2096} {"train_loss": -6.23477840423584, "global_step": 88062, "epoch": 2096} {"train_loss": -6.288187026977539, "global_step": 88063, "epoch": 2096} {"train_loss": -6.360084056854248, "global_step": 88064, "epoch": 2096} {"train_loss": -6.236658573150635, "global_step": 88065, "epoch": 2096} {"train_loss": -6.304600715637207, "global_step": 88066, "epoch": 2096} {"train_loss": -6.279888153076172, "global_step": 88067, "epoch": 2096} {"train_loss": -6.235199451446533, "global_step": 88068, "epoch": 2096} {"train_loss": -6.427455425262451, "global_step": 88069, "epoch": 2096} {"train_loss": -6.20449686050415, "global_step": 88070, "epoch": 2096} {"train_loss": -6.3240556716918945, "global_step": 88071, "epoch": 2096} {"train_loss": -6.2539825439453125, "global_step": 88072, "epoch": 2096} {"train_loss": -6.223567281450544, "global_step": 88073, "epoch": 2096, "val_loss": 62878.046875} {"train_loss": -6.178386688232422, "global_step": 88074, "epoch": 2097} {"train_loss": -6.068599700927734, "global_step": 88075, "epoch": 2097} {"train_loss": -6.297564506530762, "global_step": 88076, "epoch": 2097} {"train_loss": -6.175670623779297, "global_step": 88077, "epoch": 2097} {"train_loss": -6.356210708618164, "global_step": 88078, "epoch": 2097} {"train_loss": -6.3241868019104, "global_step": 88079, "epoch": 2097} {"train_loss": -6.342696189880371, "global_step": 88080, "epoch": 2097} {"train_loss": -6.304200172424316, "global_step": 88081, "epoch": 2097} {"train_loss": -6.235910415649414, "global_step": 88082, "epoch": 2097} {"train_loss": -6.2699198722839355, "global_step": 88083, "epoch": 2097} {"train_loss": -6.203123092651367, "global_step": 88084, "epoch": 2097} {"train_loss": -6.210139274597168, "global_step": 88085, "epoch": 2097} {"train_loss": -6.369869709014893, "global_step": 88086, "epoch": 2097} {"train_loss": -6.301529884338379, "global_step": 88087, "epoch": 2097} {"train_loss": -6.173064231872559, "global_step": 88088, "epoch": 2097} {"train_loss": -6.297962665557861, "global_step": 88089, "epoch": 2097} {"train_loss": -6.225620269775391, "global_step": 88090, "epoch": 2097} {"train_loss": -6.278641223907471, "global_step": 88091, "epoch": 2097} {"train_loss": -6.3061394691467285, "global_step": 88092, "epoch": 2097} {"train_loss": -6.2290143966674805, "global_step": 88093, "epoch": 2097} {"train_loss": -6.142199993133545, "global_step": 88094, "epoch": 2097} {"train_loss": -6.244792938232422, "global_step": 88095, "epoch": 2097} {"train_loss": -6.219170570373535, "global_step": 88096, "epoch": 2097} {"train_loss": -6.196531295776367, "global_step": 88097, "epoch": 2097} {"train_loss": -6.217141151428223, "global_step": 88098, "epoch": 2097} {"train_loss": -6.266397476196289, "global_step": 88099, "epoch": 2097} {"train_loss": -6.225335597991943, "global_step": 88100, "epoch": 2097} {"train_loss": -6.216616630554199, "global_step": 88101, "epoch": 2097} {"train_loss": -6.2047529220581055, "global_step": 88102, "epoch": 2097} {"train_loss": -6.284772872924805, "global_step": 88103, "epoch": 2097} {"train_loss": -6.181575775146484, "global_step": 88104, "epoch": 2097} {"train_loss": -6.217015266418457, "global_step": 88105, "epoch": 2097} {"train_loss": -6.275503635406494, "global_step": 88106, "epoch": 2097} {"train_loss": -6.336935997009277, "global_step": 88107, "epoch": 2097} {"train_loss": -6.187233924865723, "global_step": 88108, "epoch": 2097} {"train_loss": -6.302911281585693, "global_step": 88109, "epoch": 2097} {"train_loss": -6.240164279937744, "global_step": 88110, "epoch": 2097} {"train_loss": -6.203271389007568, "global_step": 88111, "epoch": 2097} {"train_loss": -6.2244415283203125, "global_step": 88112, "epoch": 2097} {"train_loss": -6.317282199859619, "global_step": 88113, "epoch": 2097} {"train_loss": -6.365490913391113, "global_step": 88114, "epoch": 2097} {"train_loss": -6.252313875016712, "global_step": 88115, "epoch": 2097, "val_loss": 62970.90234375} {"train_loss": -6.257834434509277, "global_step": 88116, "epoch": 2098} {"train_loss": -6.266322135925293, "global_step": 88117, "epoch": 2098} {"train_loss": -6.231204986572266, "global_step": 88118, "epoch": 2098} {"train_loss": -6.25651741027832, "global_step": 88119, "epoch": 2098} {"train_loss": -6.257612705230713, "global_step": 88120, "epoch": 2098} {"train_loss": -6.265565872192383, "global_step": 88121, "epoch": 2098} {"train_loss": -6.355228424072266, "global_step": 88122, "epoch": 2098} {"train_loss": -6.293254375457764, "global_step": 88123, "epoch": 2098} {"train_loss": -6.2389235496521, "global_step": 88124, "epoch": 2098} {"train_loss": -6.2228193283081055, "global_step": 88125, "epoch": 2098} {"train_loss": -6.190001487731934, "global_step": 88126, "epoch": 2098} {"train_loss": -6.204647541046143, "global_step": 88127, "epoch": 2098} {"train_loss": -6.237585067749023, "global_step": 88128, "epoch": 2098} {"train_loss": -6.239660263061523, "global_step": 88129, "epoch": 2098} {"train_loss": -6.124234199523926, "global_step": 88130, "epoch": 2098} {"train_loss": -6.230893135070801, "global_step": 88131, "epoch": 2098} {"train_loss": -6.346854209899902, "global_step": 88132, "epoch": 2098} {"train_loss": -6.321080207824707, "global_step": 88133, "epoch": 2098} {"train_loss": -6.2733917236328125, "global_step": 88134, "epoch": 2098} {"train_loss": -6.290395736694336, "global_step": 88135, "epoch": 2098} {"train_loss": -6.284938335418701, "global_step": 88136, "epoch": 2098} {"train_loss": -6.283718585968018, "global_step": 88137, "epoch": 2098} {"train_loss": -6.3359150886535645, "global_step": 88138, "epoch": 2098} {"train_loss": -6.182697296142578, "global_step": 88139, "epoch": 2098} {"train_loss": -6.237752914428711, "global_step": 88140, "epoch": 2098} {"train_loss": -6.174796104431152, "global_step": 88141, "epoch": 2098} {"train_loss": -6.270066261291504, "global_step": 88142, "epoch": 2098} {"train_loss": -6.20729923248291, "global_step": 88143, "epoch": 2098} {"train_loss": -6.276514530181885, "global_step": 88144, "epoch": 2098} {"train_loss": -6.327014923095703, "global_step": 88145, "epoch": 2098} {"train_loss": -6.210114479064941, "global_step": 88146, "epoch": 2098} {"train_loss": -6.236753463745117, "global_step": 88147, "epoch": 2098} {"train_loss": -6.286606788635254, "global_step": 88148, "epoch": 2098} {"train_loss": -6.186078071594238, "global_step": 88149, "epoch": 2098} {"train_loss": -6.274531841278076, "global_step": 88150, "epoch": 2098} {"train_loss": -6.263411521911621, "global_step": 88151, "epoch": 2098} {"train_loss": -6.274270534515381, "global_step": 88152, "epoch": 2098} {"train_loss": -6.272281646728516, "global_step": 88153, "epoch": 2098} {"train_loss": -6.377891540527344, "global_step": 88154, "epoch": 2098} {"train_loss": -6.197415351867676, "global_step": 88155, "epoch": 2098} {"train_loss": -6.1901535987854, "global_step": 88156, "epoch": 2098} {"train_loss": -6.254862467447917, "global_step": 88157, "epoch": 2098, "val_loss": 63044.6796875} {"train_loss": -6.252874374389648, "global_step": 88158, "epoch": 2099} {"train_loss": -6.187752723693848, "global_step": 88159, "epoch": 2099} {"train_loss": -6.297597885131836, "global_step": 88160, "epoch": 2099} {"train_loss": -6.230782985687256, "global_step": 88161, "epoch": 2099} {"train_loss": -6.182324409484863, "global_step": 88162, "epoch": 2099} {"train_loss": -6.2390007972717285, "global_step": 88163, "epoch": 2099} {"train_loss": -6.3859357833862305, "global_step": 88164, "epoch": 2099} {"train_loss": -6.213705062866211, "global_step": 88165, "epoch": 2099} {"train_loss": -6.258179664611816, "global_step": 88166, "epoch": 2099} {"train_loss": -6.198139667510986, "global_step": 88167, "epoch": 2099} {"train_loss": -6.322148323059082, "global_step": 88168, "epoch": 2099} {"train_loss": -6.294957160949707, "global_step": 88169, "epoch": 2099} {"train_loss": -6.218900680541992, "global_step": 88170, "epoch": 2099} {"train_loss": -6.188714504241943, "global_step": 88171, "epoch": 2099} {"train_loss": -6.2978973388671875, "global_step": 88172, "epoch": 2099} {"train_loss": -6.24948787689209, "global_step": 88173, "epoch": 2099} {"train_loss": -6.262795925140381, "global_step": 88174, "epoch": 2099} {"train_loss": -6.245030879974365, "global_step": 88175, "epoch": 2099} {"train_loss": -6.222754001617432, "global_step": 88176, "epoch": 2099} {"train_loss": -6.235529899597168, "global_step": 88177, "epoch": 2099} {"train_loss": -6.246641635894775, "global_step": 88178, "epoch": 2099} {"train_loss": -6.1960368156433105, "global_step": 88179, "epoch": 2099} {"train_loss": -6.1668195724487305, "global_step": 88180, "epoch": 2099} {"train_loss": -6.180705547332764, "global_step": 88181, "epoch": 2099} {"train_loss": -6.13824462890625, "global_step": 88182, "epoch": 2099} {"train_loss": -6.247320652008057, "global_step": 88183, "epoch": 2099} {"train_loss": -6.096197128295898, "global_step": 88184, "epoch": 2099} {"train_loss": -6.359749794006348, "global_step": 88185, "epoch": 2099} {"train_loss": -6.144855499267578, "global_step": 88186, "epoch": 2099} {"train_loss": -6.119416236877441, "global_step": 88187, "epoch": 2099} {"train_loss": -6.149385452270508, "global_step": 88188, "epoch": 2099} {"train_loss": -6.19373083114624, "global_step": 88189, "epoch": 2099} {"train_loss": -6.285490989685059, "global_step": 88190, "epoch": 2099} {"train_loss": -6.257397651672363, "global_step": 88191, "epoch": 2099} {"train_loss": -6.241937160491943, "global_step": 88192, "epoch": 2099} {"train_loss": -6.269199848175049, "global_step": 88193, "epoch": 2099} {"train_loss": -6.2075653076171875, "global_step": 88194, "epoch": 2099} {"train_loss": -6.280040740966797, "global_step": 88195, "epoch": 2099} {"train_loss": -6.186611175537109, "global_step": 88196, "epoch": 2099} {"train_loss": -6.203721046447754, "global_step": 88197, "epoch": 2099} {"train_loss": -6.341751575469971, "global_step": 88198, "epoch": 2099} {"train_loss": -6.23308751696632, "global_step": 88199, "epoch": 2099, "val_loss": 62956.4921875} {"train_loss": -6.25180196762085, "global_step": 88200, "epoch": 2100} {"train_loss": -6.35294246673584, "global_step": 88201, "epoch": 2100} {"train_loss": -6.289010047912598, "global_step": 88202, "epoch": 2100} {"train_loss": -6.248498916625977, "global_step": 88203, "epoch": 2100} {"train_loss": -6.29148006439209, "global_step": 88204, "epoch": 2100} {"train_loss": -6.21661376953125, "global_step": 88205, "epoch": 2100} {"train_loss": -6.122637748718262, "global_step": 88206, "epoch": 2100} {"train_loss": -6.253222942352295, "global_step": 88207, "epoch": 2100} {"train_loss": -6.194043159484863, "global_step": 88208, "epoch": 2100} {"train_loss": -6.2154083251953125, "global_step": 88209, "epoch": 2100} {"train_loss": -6.30488395690918, "global_step": 88210, "epoch": 2100} {"train_loss": -6.207067489624023, "global_step": 88211, "epoch": 2100} {"train_loss": -6.226167678833008, "global_step": 88212, "epoch": 2100} {"train_loss": -6.358633041381836, "global_step": 88213, "epoch": 2100} {"train_loss": -6.338035583496094, "global_step": 88214, "epoch": 2100} {"train_loss": -6.255488872528076, "global_step": 88215, "epoch": 2100} {"train_loss": -6.268436431884766, "global_step": 88216, "epoch": 2100} {"train_loss": -6.2183756828308105, "global_step": 88217, "epoch": 2100} {"train_loss": -6.212802886962891, "global_step": 88218, "epoch": 2100} {"train_loss": -6.196598052978516, "global_step": 88219, "epoch": 2100} {"train_loss": -6.294342041015625, "global_step": 88220, "epoch": 2100} {"train_loss": -6.232478141784668, "global_step": 88221, "epoch": 2100} {"train_loss": -6.183088302612305, "global_step": 88222, "epoch": 2100} {"train_loss": -6.275867462158203, "global_step": 88223, "epoch": 2100} {"train_loss": -6.3026323318481445, "global_step": 88224, "epoch": 2100} {"train_loss": -6.224952697753906, "global_step": 88225, "epoch": 2100} {"train_loss": -6.255222797393799, "global_step": 88226, "epoch": 2100} {"train_loss": -6.252986907958984, "global_step": 88227, "epoch": 2100} {"train_loss": -6.209355354309082, "global_step": 88228, "epoch": 2100} {"train_loss": -6.2102460861206055, "global_step": 88229, "epoch": 2100} {"train_loss": -6.217574119567871, "global_step": 88230, "epoch": 2100} {"train_loss": -6.190154075622559, "global_step": 88231, "epoch": 2100} {"train_loss": -6.273748397827148, "global_step": 88232, "epoch": 2100} {"train_loss": -6.2346954345703125, "global_step": 88233, "epoch": 2100} {"train_loss": -6.17468786239624, "global_step": 88234, "epoch": 2100} {"train_loss": -6.269392013549805, "global_step": 88235, "epoch": 2100} {"train_loss": -6.187282562255859, "global_step": 88236, "epoch": 2100} {"train_loss": -6.170691013336182, "global_step": 88237, "epoch": 2100} {"train_loss": -6.170249938964844, "global_step": 88238, "epoch": 2100} {"train_loss": -6.197256088256836, "global_step": 88239, "epoch": 2100} {"train_loss": -6.245152473449707, "global_step": 88240, "epoch": 2100} {"train_loss": -6.237841117949713, "global_step": 88241, "epoch": 2100, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.40300937490008953, "train/sim_max_reward_2": 0.9480466258514498, "train/sim_max_reward_3": 0.9472375491281937, "train/sim_max_reward_4": 0.8212499771387358, "train/sim_max_reward_5": 0.1998423264066568, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.9501152809109512, "test/sim_max_reward_4300002": 0.9137151685211218, "test/sim_max_reward_4300003": 0.91700837228848, "test/sim_max_reward_4300004": 0.18793354588734645, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9372647722214511, "test/sim_max_reward_4300008": 0.4456637494521126, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.4212483601526555, "test/sim_max_reward_4300011": 0.9601935327054892, "test/sim_max_reward_4300012": 0.8681850918458262, "test/sim_max_reward_4300013": 0.8664953407592753, "test/sim_max_reward_4300014": 0.977624127235803, "test/sim_max_reward_4300015": 0.8733043432554541, "test/sim_max_reward_4300016": 0.9358044787485896, "test/sim_max_reward_4300017": 0.8412184243005423, "test/sim_max_reward_4300018": 0.4120604711236146, "test/sim_max_reward_4300019": 0.18601973958037568, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9743124026555042, "test/sim_max_reward_4300022": 0.9241139734265739, "test/sim_max_reward_4300023": 0.8768681949616902, "test/sim_max_reward_4300024": 0.4798921529764748, "test/sim_max_reward_4300025": 0.9453687035224826, "test/sim_max_reward_4300026": 0.0902069506124957, "test/sim_max_reward_4300027": 0.10929573901510459, "test/sim_max_reward_4300028": 0.9602697848157568, "test/sim_max_reward_4300029": 0.8601448901465234, "test/sim_max_reward_4300030": 0.9123410735247188, "test/sim_max_reward_4300031": 0.22266942805763584, "test/sim_max_reward_4300032": 0.9523137054969992, "test/sim_max_reward_4300033": 0.7192546608898076, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.815484393442618, "test/sim_max_reward_4300036": 0.20897536147111911, "test/sim_max_reward_4300037": 0.818791097795105, "test/sim_max_reward_4300038": 0.9980421326823875, "test/sim_max_reward_4300039": 0.7728744778332436, "test/sim_max_reward_4300040": 0.4993058274555307, "test/sim_max_reward_4300041": 0.14226758816235333, "test/sim_max_reward_4300042": 0.7263049789468496, "test/sim_max_reward_4300043": 0.13220427815969626, "test/sim_max_reward_4300044": 0.616639043017383, "test/sim_max_reward_4300045": 0.9410013242158063, "test/sim_max_reward_4300046": 0.8276373716463398, "test/sim_max_reward_4300047": 0.9388214738523125, "test/sim_max_reward_4300048": 0.002766691393919552, "test/sim_max_reward_4300049": 0.05244250355798751, "train/mean_score": 0.5849472250051964, "test/mean_score": 0.6242893000544701, "val_loss": 62860.6796875} {"train_loss": -6.180328369140625, "global_step": 88242, "epoch": 2101} {"train_loss": -6.250890731811523, "global_step": 88243, "epoch": 2101} {"train_loss": -6.198232173919678, "global_step": 88244, "epoch": 2101} {"train_loss": -6.3375396728515625, "global_step": 88245, "epoch": 2101} {"train_loss": -6.203582763671875, "global_step": 88246, "epoch": 2101} {"train_loss": -6.263454914093018, "global_step": 88247, "epoch": 2101} {"train_loss": -6.266509532928467, "global_step": 88248, "epoch": 2101} {"train_loss": -6.191483020782471, "global_step": 88249, "epoch": 2101} {"train_loss": -6.153201103210449, "global_step": 88250, "epoch": 2101} {"train_loss": -6.350717544555664, "global_step": 88251, "epoch": 2101} {"train_loss": -6.221746444702148, "global_step": 88252, "epoch": 2101} {"train_loss": -6.206766128540039, "global_step": 88253, "epoch": 2101} {"train_loss": -6.160824775695801, "global_step": 88254, "epoch": 2101} {"train_loss": -6.273037910461426, "global_step": 88255, "epoch": 2101} {"train_loss": -6.23246955871582, "global_step": 88256, "epoch": 2101} {"train_loss": -6.240480422973633, "global_step": 88257, "epoch": 2101} {"train_loss": -6.221186637878418, "global_step": 88258, "epoch": 2101} {"train_loss": -6.2205071449279785, "global_step": 88259, "epoch": 2101} {"train_loss": -6.309029579162598, "global_step": 88260, "epoch": 2101} {"train_loss": -6.166957855224609, "global_step": 88261, "epoch": 2101} {"train_loss": -6.308982849121094, "global_step": 88262, "epoch": 2101} {"train_loss": -6.254855155944824, "global_step": 88263, "epoch": 2101} {"train_loss": -6.295475959777832, "global_step": 88264, "epoch": 2101} {"train_loss": -6.378465175628662, "global_step": 88265, "epoch": 2101} {"train_loss": -6.211421012878418, "global_step": 88266, "epoch": 2101} {"train_loss": -6.276919364929199, "global_step": 88267, "epoch": 2101} {"train_loss": -6.191124439239502, "global_step": 88268, "epoch": 2101} {"train_loss": -6.262120723724365, "global_step": 88269, "epoch": 2101} {"train_loss": -6.200963973999023, "global_step": 88270, "epoch": 2101} {"train_loss": -6.338062286376953, "global_step": 88271, "epoch": 2101} {"train_loss": -6.167455196380615, "global_step": 88272, "epoch": 2101} {"train_loss": -6.2038140296936035, "global_step": 88273, "epoch": 2101} {"train_loss": -6.245136260986328, "global_step": 88274, "epoch": 2101} {"train_loss": -6.264403820037842, "global_step": 88275, "epoch": 2101} {"train_loss": -6.209771156311035, "global_step": 88276, "epoch": 2101} {"train_loss": -6.218294143676758, "global_step": 88277, "epoch": 2101} {"train_loss": -6.15922737121582, "global_step": 88278, "epoch": 2101} {"train_loss": -6.246875762939453, "global_step": 88279, "epoch": 2101} {"train_loss": -6.322704315185547, "global_step": 88280, "epoch": 2101} {"train_loss": -6.197399616241455, "global_step": 88281, "epoch": 2101} {"train_loss": -6.244968414306641, "global_step": 88282, "epoch": 2101} {"train_loss": -6.2391070411318825, "global_step": 88283, "epoch": 2101, "val_loss": 63003.484375} {"train_loss": -6.27639102935791, "global_step": 88284, "epoch": 2102} {"train_loss": -6.2470221519470215, "global_step": 88285, "epoch": 2102} {"train_loss": -6.28901481628418, "global_step": 88286, "epoch": 2102} {"train_loss": -6.147502899169922, "global_step": 88287, "epoch": 2102} {"train_loss": -6.181608200073242, "global_step": 88288, "epoch": 2102} {"train_loss": -6.308002948760986, "global_step": 88289, "epoch": 2102} {"train_loss": -6.191278457641602, "global_step": 88290, "epoch": 2102} {"train_loss": -6.1660261154174805, "global_step": 88291, "epoch": 2102} {"train_loss": -6.2121052742004395, "global_step": 88292, "epoch": 2102} {"train_loss": -6.208736419677734, "global_step": 88293, "epoch": 2102} {"train_loss": -6.300188064575195, "global_step": 88294, "epoch": 2102} {"train_loss": -6.213283061981201, "global_step": 88295, "epoch": 2102} {"train_loss": -6.155505180358887, "global_step": 88296, "epoch": 2102} {"train_loss": -6.130669593811035, "global_step": 88297, "epoch": 2102} {"train_loss": -6.272123336791992, "global_step": 88298, "epoch": 2102} {"train_loss": -6.141316890716553, "global_step": 88299, "epoch": 2102} {"train_loss": -6.348609924316406, "global_step": 88300, "epoch": 2102} {"train_loss": -6.352943420410156, "global_step": 88301, "epoch": 2102} {"train_loss": -6.10807466506958, "global_step": 88302, "epoch": 2102} {"train_loss": -6.190031051635742, "global_step": 88303, "epoch": 2102} {"train_loss": -5.998691558837891, "global_step": 88304, "epoch": 2102} {"train_loss": -6.185920238494873, "global_step": 88305, "epoch": 2102} {"train_loss": -6.085224151611328, "global_step": 88306, "epoch": 2102} {"train_loss": -6.12247371673584, "global_step": 88307, "epoch": 2102} {"train_loss": -6.156029224395752, "global_step": 88308, "epoch": 2102} {"train_loss": -6.233855247497559, "global_step": 88309, "epoch": 2102} {"train_loss": -6.152743339538574, "global_step": 88310, "epoch": 2102} {"train_loss": -6.219407081604004, "global_step": 88311, "epoch": 2102} {"train_loss": -6.094134330749512, "global_step": 88312, "epoch": 2102} {"train_loss": -6.230489253997803, "global_step": 88313, "epoch": 2102} {"train_loss": -6.200152397155762, "global_step": 88314, "epoch": 2102} {"train_loss": -6.171486854553223, "global_step": 88315, "epoch": 2102} {"train_loss": -6.06648063659668, "global_step": 88316, "epoch": 2102} {"train_loss": -6.158565521240234, "global_step": 88317, "epoch": 2102} {"train_loss": -6.189714431762695, "global_step": 88318, "epoch": 2102} {"train_loss": -6.201936721801758, "global_step": 88319, "epoch": 2102} {"train_loss": -6.173614978790283, "global_step": 88320, "epoch": 2102} {"train_loss": -6.27883243560791, "global_step": 88321, "epoch": 2102} {"train_loss": -6.201345443725586, "global_step": 88322, "epoch": 2102} {"train_loss": -6.244275093078613, "global_step": 88323, "epoch": 2102} {"train_loss": -6.146727085113525, "global_step": 88324, "epoch": 2102} {"train_loss": -6.193099373862857, "global_step": 88325, "epoch": 2102, "val_loss": 62677.83203125} {"train_loss": -6.291089057922363, "global_step": 88326, "epoch": 2103} {"train_loss": -6.227625370025635, "global_step": 88327, "epoch": 2103} {"train_loss": -6.302309036254883, "global_step": 88328, "epoch": 2103} {"train_loss": -6.203132629394531, "global_step": 88329, "epoch": 2103} {"train_loss": -6.176993370056152, "global_step": 88330, "epoch": 2103} {"train_loss": -6.2882843017578125, "global_step": 88331, "epoch": 2103} {"train_loss": -6.199326515197754, "global_step": 88332, "epoch": 2103} {"train_loss": -6.193176746368408, "global_step": 88333, "epoch": 2103} {"train_loss": -6.125201225280762, "global_step": 88334, "epoch": 2103} {"train_loss": -6.167242050170898, "global_step": 88335, "epoch": 2103} {"train_loss": -6.250185489654541, "global_step": 88336, "epoch": 2103} {"train_loss": -6.212098121643066, "global_step": 88337, "epoch": 2103} {"train_loss": -6.254411220550537, "global_step": 88338, "epoch": 2103} {"train_loss": -6.176468849182129, "global_step": 88339, "epoch": 2103} {"train_loss": -6.3322858810424805, "global_step": 88340, "epoch": 2103} {"train_loss": -6.334089756011963, "global_step": 88341, "epoch": 2103} {"train_loss": -6.2263689041137695, "global_step": 88342, "epoch": 2103} {"train_loss": -6.356410980224609, "global_step": 88343, "epoch": 2103} {"train_loss": -6.258209228515625, "global_step": 88344, "epoch": 2103} {"train_loss": -6.222406387329102, "global_step": 88345, "epoch": 2103} {"train_loss": -6.180429458618164, "global_step": 88346, "epoch": 2103} {"train_loss": -6.143153190612793, "global_step": 88347, "epoch": 2103} {"train_loss": -6.244635581970215, "global_step": 88348, "epoch": 2103} {"train_loss": -6.27794885635376, "global_step": 88349, "epoch": 2103} {"train_loss": -6.192658424377441, "global_step": 88350, "epoch": 2103} {"train_loss": -6.266250133514404, "global_step": 88351, "epoch": 2103} {"train_loss": -6.339632034301758, "global_step": 88352, "epoch": 2103} {"train_loss": -6.304755687713623, "global_step": 88353, "epoch": 2103} {"train_loss": -6.287578582763672, "global_step": 88354, "epoch": 2103} {"train_loss": -6.328690528869629, "global_step": 88355, "epoch": 2103} {"train_loss": -6.179562568664551, "global_step": 88356, "epoch": 2103} {"train_loss": -6.3843488693237305, "global_step": 88357, "epoch": 2103} {"train_loss": -6.357998847961426, "global_step": 88358, "epoch": 2103} {"train_loss": -6.307509422302246, "global_step": 88359, "epoch": 2103} {"train_loss": -6.39369535446167, "global_step": 88360, "epoch": 2103} {"train_loss": -6.38102388381958, "global_step": 88361, "epoch": 2103} {"train_loss": -6.312915802001953, "global_step": 88362, "epoch": 2103} {"train_loss": -6.331976413726807, "global_step": 88363, "epoch": 2103} {"train_loss": -6.139670372009277, "global_step": 88364, "epoch": 2103} {"train_loss": -6.131256103515625, "global_step": 88365, "epoch": 2103} {"train_loss": -6.265923500061035, "global_step": 88366, "epoch": 2103} {"train_loss": -6.256621678670247, "global_step": 88367, "epoch": 2103, "val_loss": 62947.21875} {"train_loss": -6.266072750091553, "global_step": 88368, "epoch": 2104} {"train_loss": -6.199764251708984, "global_step": 88369, "epoch": 2104} {"train_loss": -6.213478088378906, "global_step": 88370, "epoch": 2104} {"train_loss": -6.198200702667236, "global_step": 88371, "epoch": 2104} {"train_loss": -6.227160453796387, "global_step": 88372, "epoch": 2104} {"train_loss": -6.20783805847168, "global_step": 88373, "epoch": 2104} {"train_loss": -6.134923934936523, "global_step": 88374, "epoch": 2104} {"train_loss": -6.221971035003662, "global_step": 88375, "epoch": 2104} {"train_loss": -6.296321868896484, "global_step": 88376, "epoch": 2104} {"train_loss": -6.159639835357666, "global_step": 88377, "epoch": 2104} {"train_loss": -6.302631378173828, "global_step": 88378, "epoch": 2104} {"train_loss": -6.210251808166504, "global_step": 88379, "epoch": 2104} {"train_loss": -6.2400970458984375, "global_step": 88380, "epoch": 2104} {"train_loss": -6.366522789001465, "global_step": 88381, "epoch": 2104} {"train_loss": -6.250008583068848, "global_step": 88382, "epoch": 2104} {"train_loss": -6.116071701049805, "global_step": 88383, "epoch": 2104} {"train_loss": -6.301565170288086, "global_step": 88384, "epoch": 2104} {"train_loss": -6.088956832885742, "global_step": 88385, "epoch": 2104} {"train_loss": -6.254828453063965, "global_step": 88386, "epoch": 2104} {"train_loss": -6.256622791290283, "global_step": 88387, "epoch": 2104} {"train_loss": -6.23160457611084, "global_step": 88388, "epoch": 2104} {"train_loss": -6.246302127838135, "global_step": 88389, "epoch": 2104} {"train_loss": -6.10058069229126, "global_step": 88390, "epoch": 2104} {"train_loss": -6.227839946746826, "global_step": 88391, "epoch": 2104} {"train_loss": -6.168633460998535, "global_step": 88392, "epoch": 2104} {"train_loss": -6.201731204986572, "global_step": 88393, "epoch": 2104} {"train_loss": -6.19123649597168, "global_step": 88394, "epoch": 2104} {"train_loss": -6.208353042602539, "global_step": 88395, "epoch": 2104} {"train_loss": -6.247732162475586, "global_step": 88396, "epoch": 2104} {"train_loss": -6.234369277954102, "global_step": 88397, "epoch": 2104} {"train_loss": -6.111915588378906, "global_step": 88398, "epoch": 2104} {"train_loss": -6.283685207366943, "global_step": 88399, "epoch": 2104} {"train_loss": -6.191492557525635, "global_step": 88400, "epoch": 2104} {"train_loss": -6.184900283813477, "global_step": 88401, "epoch": 2104} {"train_loss": -6.376694679260254, "global_step": 88402, "epoch": 2104} {"train_loss": -6.279499053955078, "global_step": 88403, "epoch": 2104} {"train_loss": -6.2257795333862305, "global_step": 88404, "epoch": 2104} {"train_loss": -6.34718132019043, "global_step": 88405, "epoch": 2104} {"train_loss": -6.232293128967285, "global_step": 88406, "epoch": 2104} {"train_loss": -6.408262252807617, "global_step": 88407, "epoch": 2104} {"train_loss": -6.253087520599365, "global_step": 88408, "epoch": 2104} {"train_loss": -6.229797124862671, "global_step": 88409, "epoch": 2104, "val_loss": 62939.35546875} {"train_loss": -6.083868026733398, "global_step": 88410, "epoch": 2105} {"train_loss": -6.191756248474121, "global_step": 88411, "epoch": 2105} {"train_loss": -6.291144371032715, "global_step": 88412, "epoch": 2105} {"train_loss": -6.171751022338867, "global_step": 88413, "epoch": 2105} {"train_loss": -6.288765907287598, "global_step": 88414, "epoch": 2105} {"train_loss": -6.2915544509887695, "global_step": 88415, "epoch": 2105} {"train_loss": -6.2412214279174805, "global_step": 88416, "epoch": 2105} {"train_loss": -6.245248794555664, "global_step": 88417, "epoch": 2105} {"train_loss": -6.238282203674316, "global_step": 88418, "epoch": 2105} {"train_loss": -6.3356804847717285, "global_step": 88419, "epoch": 2105} {"train_loss": -6.301468849182129, "global_step": 88420, "epoch": 2105} {"train_loss": -6.153545379638672, "global_step": 88421, "epoch": 2105} {"train_loss": -6.289839744567871, "global_step": 88422, "epoch": 2105} {"train_loss": -6.260753154754639, "global_step": 88423, "epoch": 2105} {"train_loss": -6.321651935577393, "global_step": 88424, "epoch": 2105} {"train_loss": -6.337363243103027, "global_step": 88425, "epoch": 2105} {"train_loss": -6.298931121826172, "global_step": 88426, "epoch": 2105} {"train_loss": -6.242574691772461, "global_step": 88427, "epoch": 2105} {"train_loss": -6.248682975769043, "global_step": 88428, "epoch": 2105} {"train_loss": -6.2758469581604, "global_step": 88429, "epoch": 2105} {"train_loss": -6.3680524826049805, "global_step": 88430, "epoch": 2105} {"train_loss": -6.213558673858643, "global_step": 88431, "epoch": 2105} {"train_loss": -6.307516098022461, "global_step": 88432, "epoch": 2105} {"train_loss": -6.214644908905029, "global_step": 88433, "epoch": 2105} {"train_loss": -6.303606033325195, "global_step": 88434, "epoch": 2105} {"train_loss": -6.259239673614502, "global_step": 88435, "epoch": 2105} {"train_loss": -6.215540409088135, "global_step": 88436, "epoch": 2105} {"train_loss": -6.247302055358887, "global_step": 88437, "epoch": 2105} {"train_loss": -6.185519218444824, "global_step": 88438, "epoch": 2105} {"train_loss": -6.238288402557373, "global_step": 88439, "epoch": 2105} {"train_loss": -6.418132781982422, "global_step": 88440, "epoch": 2105} {"train_loss": -6.09694766998291, "global_step": 88441, "epoch": 2105} {"train_loss": -6.228564262390137, "global_step": 88442, "epoch": 2105} {"train_loss": -6.244592666625977, "global_step": 88443, "epoch": 2105} {"train_loss": -6.231060981750488, "global_step": 88444, "epoch": 2105} {"train_loss": -6.157930850982666, "global_step": 88445, "epoch": 2105} {"train_loss": -6.345792770385742, "global_step": 88446, "epoch": 2105} {"train_loss": -6.1713056564331055, "global_step": 88447, "epoch": 2105} {"train_loss": -6.2468366622924805, "global_step": 88448, "epoch": 2105} {"train_loss": -6.184774398803711, "global_step": 88449, "epoch": 2105} {"train_loss": -6.273075580596924, "global_step": 88450, "epoch": 2105} {"train_loss": -6.24640755426316, "global_step": 88451, "epoch": 2105, "val_loss": 62890.515625} {"train_loss": -6.352120399475098, "global_step": 88452, "epoch": 2106} {"train_loss": -6.1722259521484375, "global_step": 88453, "epoch": 2106} {"train_loss": -6.150031566619873, "global_step": 88454, "epoch": 2106} {"train_loss": -6.239116668701172, "global_step": 88455, "epoch": 2106} {"train_loss": -6.149999618530273, "global_step": 88456, "epoch": 2106} {"train_loss": -6.301626205444336, "global_step": 88457, "epoch": 2106} {"train_loss": -6.116602897644043, "global_step": 88458, "epoch": 2106} {"train_loss": -6.2195539474487305, "global_step": 88459, "epoch": 2106} {"train_loss": -6.2491455078125, "global_step": 88460, "epoch": 2106} {"train_loss": -6.272230625152588, "global_step": 88461, "epoch": 2106} {"train_loss": -6.195296287536621, "global_step": 88462, "epoch": 2106} {"train_loss": -6.247422218322754, "global_step": 88463, "epoch": 2106} {"train_loss": -6.13674259185791, "global_step": 88464, "epoch": 2106} {"train_loss": -6.218579292297363, "global_step": 88465, "epoch": 2106} {"train_loss": -6.125489234924316, "global_step": 88466, "epoch": 2106} {"train_loss": -6.187900543212891, "global_step": 88467, "epoch": 2106} {"train_loss": -6.234048843383789, "global_step": 88468, "epoch": 2106} {"train_loss": -6.163400650024414, "global_step": 88469, "epoch": 2106} {"train_loss": -6.12197732925415, "global_step": 88470, "epoch": 2106} {"train_loss": -6.1999993324279785, "global_step": 88471, "epoch": 2106} {"train_loss": -6.223431587219238, "global_step": 88472, "epoch": 2106} {"train_loss": -6.178066253662109, "global_step": 88473, "epoch": 2106} {"train_loss": -6.108511924743652, "global_step": 88474, "epoch": 2106} {"train_loss": -6.281869888305664, "global_step": 88475, "epoch": 2106} {"train_loss": -6.108315944671631, "global_step": 88476, "epoch": 2106} {"train_loss": -6.077188968658447, "global_step": 88477, "epoch": 2106} {"train_loss": -6.297194480895996, "global_step": 88478, "epoch": 2106} {"train_loss": -6.19201135635376, "global_step": 88479, "epoch": 2106} {"train_loss": -6.267138481140137, "global_step": 88480, "epoch": 2106} {"train_loss": -6.062822341918945, "global_step": 88481, "epoch": 2106} {"train_loss": -6.2031755447387695, "global_step": 88482, "epoch": 2106} {"train_loss": -6.259129047393799, "global_step": 88483, "epoch": 2106} {"train_loss": -6.208017826080322, "global_step": 88484, "epoch": 2106} {"train_loss": -6.223077774047852, "global_step": 88485, "epoch": 2106} {"train_loss": -6.156448841094971, "global_step": 88486, "epoch": 2106} {"train_loss": -6.322395324707031, "global_step": 88487, "epoch": 2106} {"train_loss": -6.334626197814941, "global_step": 88488, "epoch": 2106} {"train_loss": -6.343902111053467, "global_step": 88489, "epoch": 2106} {"train_loss": -6.242842674255371, "global_step": 88490, "epoch": 2106} {"train_loss": -6.232759952545166, "global_step": 88491, "epoch": 2106} {"train_loss": -6.362320423126221, "global_step": 88492, "epoch": 2106} {"train_loss": -6.213118428275699, "global_step": 88493, "epoch": 2106, "val_loss": 62724.0078125} {"train_loss": -6.2205810546875, "global_step": 88494, "epoch": 2107} {"train_loss": -6.190125465393066, "global_step": 88495, "epoch": 2107} {"train_loss": -6.313358783721924, "global_step": 88496, "epoch": 2107} {"train_loss": -6.275197505950928, "global_step": 88497, "epoch": 2107} {"train_loss": -6.221359729766846, "global_step": 88498, "epoch": 2107} {"train_loss": -6.294449806213379, "global_step": 88499, "epoch": 2107} {"train_loss": -6.209864616394043, "global_step": 88500, "epoch": 2107} {"train_loss": -6.418595790863037, "global_step": 88501, "epoch": 2107} {"train_loss": -6.186378002166748, "global_step": 88502, "epoch": 2107} {"train_loss": -6.205348968505859, "global_step": 88503, "epoch": 2107} {"train_loss": -6.323421478271484, "global_step": 88504, "epoch": 2107} {"train_loss": -6.288908004760742, "global_step": 88505, "epoch": 2107} {"train_loss": -6.257370948791504, "global_step": 88506, "epoch": 2107} {"train_loss": -6.2453083992004395, "global_step": 88507, "epoch": 2107} {"train_loss": -6.217855930328369, "global_step": 88508, "epoch": 2107} {"train_loss": -6.126157760620117, "global_step": 88509, "epoch": 2107} {"train_loss": -6.275669574737549, "global_step": 88510, "epoch": 2107} {"train_loss": -6.269101619720459, "global_step": 88511, "epoch": 2107} {"train_loss": -6.226211071014404, "global_step": 88512, "epoch": 2107} {"train_loss": -6.195400238037109, "global_step": 88513, "epoch": 2107} {"train_loss": -6.158166885375977, "global_step": 88514, "epoch": 2107} {"train_loss": -6.17569637298584, "global_step": 88515, "epoch": 2107} {"train_loss": -6.272787094116211, "global_step": 88516, "epoch": 2107} {"train_loss": -6.139886856079102, "global_step": 88517, "epoch": 2107} {"train_loss": -6.1917219161987305, "global_step": 88518, "epoch": 2107} {"train_loss": -6.1952104568481445, "global_step": 88519, "epoch": 2107} {"train_loss": -6.18778657913208, "global_step": 88520, "epoch": 2107} {"train_loss": -6.274139881134033, "global_step": 88521, "epoch": 2107} {"train_loss": -6.375219345092773, "global_step": 88522, "epoch": 2107} {"train_loss": -6.278053283691406, "global_step": 88523, "epoch": 2107} {"train_loss": -6.291875839233398, "global_step": 88524, "epoch": 2107} {"train_loss": -6.191237449645996, "global_step": 88525, "epoch": 2107} {"train_loss": -6.2374701499938965, "global_step": 88526, "epoch": 2107} {"train_loss": -6.245320796966553, "global_step": 88527, "epoch": 2107} {"train_loss": -6.32612419128418, "global_step": 88528, "epoch": 2107} {"train_loss": -6.207697868347168, "global_step": 88529, "epoch": 2107} {"train_loss": -6.138718605041504, "global_step": 88530, "epoch": 2107} {"train_loss": -6.255062103271484, "global_step": 88531, "epoch": 2107} {"train_loss": -6.148306846618652, "global_step": 88532, "epoch": 2107} {"train_loss": -6.263470649719238, "global_step": 88533, "epoch": 2107} {"train_loss": -6.222983360290527, "global_step": 88534, "epoch": 2107} {"train_loss": -6.236944266727993, "global_step": 88535, "epoch": 2107, "val_loss": 63022.1796875} {"train_loss": -6.162779331207275, "global_step": 88536, "epoch": 2108} {"train_loss": -6.315282821655273, "global_step": 88537, "epoch": 2108} {"train_loss": -6.362301826477051, "global_step": 88538, "epoch": 2108} {"train_loss": -6.334342956542969, "global_step": 88539, "epoch": 2108} {"train_loss": -6.36888313293457, "global_step": 88540, "epoch": 2108} {"train_loss": -6.287538528442383, "global_step": 88541, "epoch": 2108} {"train_loss": -6.220733642578125, "global_step": 88542, "epoch": 2108} {"train_loss": -6.1351118087768555, "global_step": 88543, "epoch": 2108} {"train_loss": -6.234000205993652, "global_step": 88544, "epoch": 2108} {"train_loss": -6.184173583984375, "global_step": 88545, "epoch": 2108} {"train_loss": -6.15106725692749, "global_step": 88546, "epoch": 2108} {"train_loss": -6.20561408996582, "global_step": 88547, "epoch": 2108} {"train_loss": -6.246055603027344, "global_step": 88548, "epoch": 2108} {"train_loss": -6.173558235168457, "global_step": 88549, "epoch": 2108} {"train_loss": -6.156825542449951, "global_step": 88550, "epoch": 2108} {"train_loss": -6.178767204284668, "global_step": 88551, "epoch": 2108} {"train_loss": -6.184281826019287, "global_step": 88552, "epoch": 2108} {"train_loss": -6.235914707183838, "global_step": 88553, "epoch": 2108} {"train_loss": -6.174551963806152, "global_step": 88554, "epoch": 2108} {"train_loss": -6.171417236328125, "global_step": 88555, "epoch": 2108} {"train_loss": -6.202445030212402, "global_step": 88556, "epoch": 2108} {"train_loss": -6.240516662597656, "global_step": 88557, "epoch": 2108} {"train_loss": -6.22894287109375, "global_step": 88558, "epoch": 2108} {"train_loss": -6.121016025543213, "global_step": 88559, "epoch": 2108} {"train_loss": -6.15934419631958, "global_step": 88560, "epoch": 2108} {"train_loss": -6.114253997802734, "global_step": 88561, "epoch": 2108} {"train_loss": -6.198067665100098, "global_step": 88562, "epoch": 2108} {"train_loss": -6.237563133239746, "global_step": 88563, "epoch": 2108} {"train_loss": -6.180342674255371, "global_step": 88564, "epoch": 2108} {"train_loss": -6.275784492492676, "global_step": 88565, "epoch": 2108} {"train_loss": -6.237020015716553, "global_step": 88566, "epoch": 2108} {"train_loss": -6.260358810424805, "global_step": 88567, "epoch": 2108} {"train_loss": -6.32553768157959, "global_step": 88568, "epoch": 2108} {"train_loss": -6.27264404296875, "global_step": 88569, "epoch": 2108} {"train_loss": -6.179610252380371, "global_step": 88570, "epoch": 2108} {"train_loss": -6.2637038230896, "global_step": 88571, "epoch": 2108} {"train_loss": -6.264060020446777, "global_step": 88572, "epoch": 2108} {"train_loss": -6.274415016174316, "global_step": 88573, "epoch": 2108} {"train_loss": -6.205010414123535, "global_step": 88574, "epoch": 2108} {"train_loss": -6.316869735717773, "global_step": 88575, "epoch": 2108} {"train_loss": -6.317163467407227, "global_step": 88576, "epoch": 2108} {"train_loss": -6.230029242379325, "global_step": 88577, "epoch": 2108, "val_loss": 62931.50390625} {"train_loss": -6.4550580978393555, "global_step": 88578, "epoch": 2109} {"train_loss": -6.3079094886779785, "global_step": 88579, "epoch": 2109} {"train_loss": -6.195522785186768, "global_step": 88580, "epoch": 2109} {"train_loss": -6.247461318969727, "global_step": 88581, "epoch": 2109} {"train_loss": -6.215150833129883, "global_step": 88582, "epoch": 2109} {"train_loss": -6.271060943603516, "global_step": 88583, "epoch": 2109} {"train_loss": -6.294764995574951, "global_step": 88584, "epoch": 2109} {"train_loss": -6.343788146972656, "global_step": 88585, "epoch": 2109} {"train_loss": -6.369747161865234, "global_step": 88586, "epoch": 2109} {"train_loss": -6.110462188720703, "global_step": 88587, "epoch": 2109} {"train_loss": -6.245389938354492, "global_step": 88588, "epoch": 2109} {"train_loss": -6.237534046173096, "global_step": 88589, "epoch": 2109} {"train_loss": -6.217617034912109, "global_step": 88590, "epoch": 2109} {"train_loss": -6.264089584350586, "global_step": 88591, "epoch": 2109} {"train_loss": -6.305253028869629, "global_step": 88592, "epoch": 2109} {"train_loss": -6.164735794067383, "global_step": 88593, "epoch": 2109} {"train_loss": -6.301179885864258, "global_step": 88594, "epoch": 2109} {"train_loss": -6.227307319641113, "global_step": 88595, "epoch": 2109} {"train_loss": -6.208132743835449, "global_step": 88596, "epoch": 2109} {"train_loss": -6.228047847747803, "global_step": 88597, "epoch": 2109} {"train_loss": -6.22353458404541, "global_step": 88598, "epoch": 2109} {"train_loss": -6.18293571472168, "global_step": 88599, "epoch": 2109} {"train_loss": -6.130646705627441, "global_step": 88600, "epoch": 2109} {"train_loss": -6.285717010498047, "global_step": 88601, "epoch": 2109} {"train_loss": -6.118392467498779, "global_step": 88602, "epoch": 2109} {"train_loss": -6.162999153137207, "global_step": 88603, "epoch": 2109} {"train_loss": -6.243559837341309, "global_step": 88604, "epoch": 2109} {"train_loss": -6.219664573669434, "global_step": 88605, "epoch": 2109} {"train_loss": -6.220775604248047, "global_step": 88606, "epoch": 2109} {"train_loss": -6.238716125488281, "global_step": 88607, "epoch": 2109} {"train_loss": -6.233770847320557, "global_step": 88608, "epoch": 2109} {"train_loss": -6.198198318481445, "global_step": 88609, "epoch": 2109} {"train_loss": -6.244724273681641, "global_step": 88610, "epoch": 2109} {"train_loss": -6.26685905456543, "global_step": 88611, "epoch": 2109} {"train_loss": -6.3383684158325195, "global_step": 88612, "epoch": 2109} {"train_loss": -6.381011962890625, "global_step": 88613, "epoch": 2109} {"train_loss": -6.262468338012695, "global_step": 88614, "epoch": 2109} {"train_loss": -6.353780746459961, "global_step": 88615, "epoch": 2109} {"train_loss": -6.370399475097656, "global_step": 88616, "epoch": 2109} {"train_loss": -6.126713752746582, "global_step": 88617, "epoch": 2109} {"train_loss": -6.288820266723633, "global_step": 88618, "epoch": 2109} {"train_loss": -6.251718759536743, "global_step": 88619, "epoch": 2109, "val_loss": 62960.47265625} {"train_loss": -6.3087053298950195, "global_step": 88620, "epoch": 2110} {"train_loss": -6.219537734985352, "global_step": 88621, "epoch": 2110} {"train_loss": -6.273136138916016, "global_step": 88622, "epoch": 2110} {"train_loss": -6.283939361572266, "global_step": 88623, "epoch": 2110} {"train_loss": -6.241560935974121, "global_step": 88624, "epoch": 2110} {"train_loss": -6.324791431427002, "global_step": 88625, "epoch": 2110} {"train_loss": -6.390470027923584, "global_step": 88626, "epoch": 2110} {"train_loss": -6.238673210144043, "global_step": 88627, "epoch": 2110} {"train_loss": -6.228992462158203, "global_step": 88628, "epoch": 2110} {"train_loss": -6.246323585510254, "global_step": 88629, "epoch": 2110} {"train_loss": -6.354862213134766, "global_step": 88630, "epoch": 2110} {"train_loss": -6.261703014373779, "global_step": 88631, "epoch": 2110} {"train_loss": -6.256099224090576, "global_step": 88632, "epoch": 2110} {"train_loss": -6.234663486480713, "global_step": 88633, "epoch": 2110} {"train_loss": -6.240215301513672, "global_step": 88634, "epoch": 2110} {"train_loss": -6.274374008178711, "global_step": 88635, "epoch": 2110} {"train_loss": -6.198185443878174, "global_step": 88636, "epoch": 2110} {"train_loss": -6.231321811676025, "global_step": 88637, "epoch": 2110} {"train_loss": -6.179329872131348, "global_step": 88638, "epoch": 2110} {"train_loss": -6.296555995941162, "global_step": 88639, "epoch": 2110} {"train_loss": -6.363870143890381, "global_step": 88640, "epoch": 2110} {"train_loss": -6.173868179321289, "global_step": 88641, "epoch": 2110} {"train_loss": -6.276043891906738, "global_step": 88642, "epoch": 2110} {"train_loss": -6.225342750549316, "global_step": 88643, "epoch": 2110} {"train_loss": -6.236487865447998, "global_step": 88644, "epoch": 2110} {"train_loss": -6.318928241729736, "global_step": 88645, "epoch": 2110} {"train_loss": -6.210025787353516, "global_step": 88646, "epoch": 2110} {"train_loss": -6.172028064727783, "global_step": 88647, "epoch": 2110} {"train_loss": -6.232274055480957, "global_step": 88648, "epoch": 2110} {"train_loss": -6.262930393218994, "global_step": 88649, "epoch": 2110} {"train_loss": -6.137788772583008, "global_step": 88650, "epoch": 2110} {"train_loss": -6.194108009338379, "global_step": 88651, "epoch": 2110} {"train_loss": -6.2490739822387695, "global_step": 88652, "epoch": 2110} {"train_loss": -6.183366298675537, "global_step": 88653, "epoch": 2110} {"train_loss": -6.243671417236328, "global_step": 88654, "epoch": 2110} {"train_loss": -6.303676605224609, "global_step": 88655, "epoch": 2110} {"train_loss": -6.239714622497559, "global_step": 88656, "epoch": 2110} {"train_loss": -6.28226900100708, "global_step": 88657, "epoch": 2110} {"train_loss": -6.169980049133301, "global_step": 88658, "epoch": 2110} {"train_loss": -6.21901798248291, "global_step": 88659, "epoch": 2110} {"train_loss": -6.185328483581543, "global_step": 88660, "epoch": 2110} {"train_loss": -6.249262389682588, "global_step": 88661, "epoch": 2110, "val_loss": 63003.7734375} {"train_loss": -6.187440395355225, "global_step": 88662, "epoch": 2111} {"train_loss": -6.119521617889404, "global_step": 88663, "epoch": 2111} {"train_loss": -6.1398844718933105, "global_step": 88664, "epoch": 2111} {"train_loss": -6.165593147277832, "global_step": 88665, "epoch": 2111} {"train_loss": -6.222141265869141, "global_step": 88666, "epoch": 2111} {"train_loss": -6.228468418121338, "global_step": 88667, "epoch": 2111} {"train_loss": -6.143948554992676, "global_step": 88668, "epoch": 2111} {"train_loss": -6.194972515106201, "global_step": 88669, "epoch": 2111} {"train_loss": -6.3285231590271, "global_step": 88670, "epoch": 2111} {"train_loss": -6.287327766418457, "global_step": 88671, "epoch": 2111} {"train_loss": -6.223476886749268, "global_step": 88672, "epoch": 2111} {"train_loss": -6.238910675048828, "global_step": 88673, "epoch": 2111} {"train_loss": -6.332231521606445, "global_step": 88674, "epoch": 2111} {"train_loss": -6.279823303222656, "global_step": 88675, "epoch": 2111} {"train_loss": -6.271987438201904, "global_step": 88676, "epoch": 2111} {"train_loss": -6.274007320404053, "global_step": 88677, "epoch": 2111} {"train_loss": -6.27247953414917, "global_step": 88678, "epoch": 2111} {"train_loss": -6.2599711418151855, "global_step": 88679, "epoch": 2111} {"train_loss": -6.1950364112854, "global_step": 88680, "epoch": 2111} {"train_loss": -6.340208053588867, "global_step": 88681, "epoch": 2111} {"train_loss": -6.204375267028809, "global_step": 88682, "epoch": 2111} {"train_loss": -6.236110210418701, "global_step": 88683, "epoch": 2111} {"train_loss": -6.188731670379639, "global_step": 88684, "epoch": 2111} {"train_loss": -6.227221488952637, "global_step": 88685, "epoch": 2111} {"train_loss": -6.2343950271606445, "global_step": 88686, "epoch": 2111} {"train_loss": -6.269227981567383, "global_step": 88687, "epoch": 2111} {"train_loss": -6.275825023651123, "global_step": 88688, "epoch": 2111} {"train_loss": -6.207052230834961, "global_step": 88689, "epoch": 2111} {"train_loss": -6.191954612731934, "global_step": 88690, "epoch": 2111} {"train_loss": -6.218057632446289, "global_step": 88691, "epoch": 2111} {"train_loss": -6.306961536407471, "global_step": 88692, "epoch": 2111} {"train_loss": -6.283816337585449, "global_step": 88693, "epoch": 2111} {"train_loss": -6.28410530090332, "global_step": 88694, "epoch": 2111} {"train_loss": -6.220980167388916, "global_step": 88695, "epoch": 2111} {"train_loss": -6.2953782081604, "global_step": 88696, "epoch": 2111} {"train_loss": -6.246471405029297, "global_step": 88697, "epoch": 2111} {"train_loss": -6.212734699249268, "global_step": 88698, "epoch": 2111} {"train_loss": -6.325824737548828, "global_step": 88699, "epoch": 2111} {"train_loss": -6.120724201202393, "global_step": 88700, "epoch": 2111} {"train_loss": -6.196458339691162, "global_step": 88701, "epoch": 2111} {"train_loss": -6.395514488220215, "global_step": 88702, "epoch": 2111} {"train_loss": -6.23924385933649, "global_step": 88703, "epoch": 2111, "val_loss": 63000.10546875} {"train_loss": -6.179914474487305, "global_step": 88704, "epoch": 2112} {"train_loss": -6.248595237731934, "global_step": 88705, "epoch": 2112} {"train_loss": -6.006072998046875, "global_step": 88706, "epoch": 2112} {"train_loss": -6.1743927001953125, "global_step": 88707, "epoch": 2112} {"train_loss": -6.175477981567383, "global_step": 88708, "epoch": 2112} {"train_loss": -6.093271732330322, "global_step": 88709, "epoch": 2112} {"train_loss": -6.264606475830078, "global_step": 88710, "epoch": 2112} {"train_loss": -6.3136515617370605, "global_step": 88711, "epoch": 2112} {"train_loss": -6.2481842041015625, "global_step": 88712, "epoch": 2112} {"train_loss": -6.222995281219482, "global_step": 88713, "epoch": 2112} {"train_loss": -6.21425724029541, "global_step": 88714, "epoch": 2112} {"train_loss": -6.131680488586426, "global_step": 88715, "epoch": 2112} {"train_loss": -6.196150302886963, "global_step": 88716, "epoch": 2112} {"train_loss": -6.320658206939697, "global_step": 88717, "epoch": 2112} {"train_loss": -6.185187339782715, "global_step": 88718, "epoch": 2112} {"train_loss": -6.157754421234131, "global_step": 88719, "epoch": 2112} {"train_loss": -6.176856994628906, "global_step": 88720, "epoch": 2112} {"train_loss": -6.092807292938232, "global_step": 88721, "epoch": 2112} {"train_loss": -6.264471054077148, "global_step": 88722, "epoch": 2112} {"train_loss": -6.084848880767822, "global_step": 88723, "epoch": 2112} {"train_loss": -6.174464702606201, "global_step": 88724, "epoch": 2112} {"train_loss": -6.16089391708374, "global_step": 88725, "epoch": 2112} {"train_loss": -6.16174840927124, "global_step": 88726, "epoch": 2112} {"train_loss": -6.126074314117432, "global_step": 88727, "epoch": 2112} {"train_loss": -6.336973190307617, "global_step": 88728, "epoch": 2112} {"train_loss": -6.236018180847168, "global_step": 88729, "epoch": 2112} {"train_loss": -6.127567291259766, "global_step": 88730, "epoch": 2112} {"train_loss": -6.218358039855957, "global_step": 88731, "epoch": 2112} {"train_loss": -6.229541778564453, "global_step": 88732, "epoch": 2112} {"train_loss": -6.208037376403809, "global_step": 88733, "epoch": 2112} {"train_loss": -6.108836650848389, "global_step": 88734, "epoch": 2112} {"train_loss": -6.127467632293701, "global_step": 88735, "epoch": 2112} {"train_loss": -6.18403434753418, "global_step": 88736, "epoch": 2112} {"train_loss": -6.101546287536621, "global_step": 88737, "epoch": 2112} {"train_loss": -6.152987480163574, "global_step": 88738, "epoch": 2112} {"train_loss": -6.129489898681641, "global_step": 88739, "epoch": 2112} {"train_loss": -6.254031181335449, "global_step": 88740, "epoch": 2112} {"train_loss": -6.244417190551758, "global_step": 88741, "epoch": 2112} {"train_loss": -6.176191329956055, "global_step": 88742, "epoch": 2112} {"train_loss": -6.143497943878174, "global_step": 88743, "epoch": 2112} {"train_loss": -6.180325508117676, "global_step": 88744, "epoch": 2112} {"train_loss": -6.1818352199736095, "global_step": 88745, "epoch": 2112, "val_loss": 63056.1875} {"train_loss": -6.236394882202148, "global_step": 88746, "epoch": 2113} {"train_loss": -6.162192344665527, "global_step": 88747, "epoch": 2113} {"train_loss": -6.23330545425415, "global_step": 88748, "epoch": 2113} {"train_loss": -6.124858856201172, "global_step": 88749, "epoch": 2113} {"train_loss": -6.298251628875732, "global_step": 88750, "epoch": 2113} {"train_loss": -6.162779808044434, "global_step": 88751, "epoch": 2113} {"train_loss": -6.23599100112915, "global_step": 88752, "epoch": 2113} {"train_loss": -6.2017412185668945, "global_step": 88753, "epoch": 2113} {"train_loss": -6.171172142028809, "global_step": 88754, "epoch": 2113} {"train_loss": -6.278493881225586, "global_step": 88755, "epoch": 2113} {"train_loss": -6.342390060424805, "global_step": 88756, "epoch": 2113} {"train_loss": -6.229411602020264, "global_step": 88757, "epoch": 2113} {"train_loss": -6.347591400146484, "global_step": 88758, "epoch": 2113} {"train_loss": -6.33896541595459, "global_step": 88759, "epoch": 2113} {"train_loss": -6.222264289855957, "global_step": 88760, "epoch": 2113} {"train_loss": -6.201573371887207, "global_step": 88761, "epoch": 2113} {"train_loss": -6.383302211761475, "global_step": 88762, "epoch": 2113} {"train_loss": -6.189881324768066, "global_step": 88763, "epoch": 2113} {"train_loss": -6.293674468994141, "global_step": 88764, "epoch": 2113} {"train_loss": -6.292125225067139, "global_step": 88765, "epoch": 2113} {"train_loss": -6.2553887367248535, "global_step": 88766, "epoch": 2113} {"train_loss": -6.19985294342041, "global_step": 88767, "epoch": 2113} {"train_loss": -6.1871185302734375, "global_step": 88768, "epoch": 2113} {"train_loss": -6.264998435974121, "global_step": 88769, "epoch": 2113} {"train_loss": -6.209211349487305, "global_step": 88770, "epoch": 2113} {"train_loss": -6.22529935836792, "global_step": 88771, "epoch": 2113} {"train_loss": -6.315406799316406, "global_step": 88772, "epoch": 2113} {"train_loss": -6.222851276397705, "global_step": 88773, "epoch": 2113} {"train_loss": -6.165882110595703, "global_step": 88774, "epoch": 2113} {"train_loss": -6.228811740875244, "global_step": 88775, "epoch": 2113} {"train_loss": -6.144732475280762, "global_step": 88776, "epoch": 2113} {"train_loss": -6.316563129425049, "global_step": 88777, "epoch": 2113} {"train_loss": -6.191051006317139, "global_step": 88778, "epoch": 2113} {"train_loss": -6.277511119842529, "global_step": 88779, "epoch": 2113} {"train_loss": -6.232048034667969, "global_step": 88780, "epoch": 2113} {"train_loss": -6.260688781738281, "global_step": 88781, "epoch": 2113} {"train_loss": -6.374377727508545, "global_step": 88782, "epoch": 2113} {"train_loss": -6.2120866775512695, "global_step": 88783, "epoch": 2113} {"train_loss": -6.188712120056152, "global_step": 88784, "epoch": 2113} {"train_loss": -6.236786365509033, "global_step": 88785, "epoch": 2113} {"train_loss": -6.356473445892334, "global_step": 88786, "epoch": 2113} {"train_loss": -6.242857728685651, "global_step": 88787, "epoch": 2113, "val_loss": 62924.0390625} {"train_loss": -6.215305328369141, "global_step": 88788, "epoch": 2114} {"train_loss": -6.170607566833496, "global_step": 88789, "epoch": 2114} {"train_loss": -6.27495002746582, "global_step": 88790, "epoch": 2114} {"train_loss": -6.313218116760254, "global_step": 88791, "epoch": 2114} {"train_loss": -6.198177337646484, "global_step": 88792, "epoch": 2114} {"train_loss": -6.211729526519775, "global_step": 88793, "epoch": 2114} {"train_loss": -6.3480939865112305, "global_step": 88794, "epoch": 2114} {"train_loss": -6.207741737365723, "global_step": 88795, "epoch": 2114} {"train_loss": -6.163435935974121, "global_step": 88796, "epoch": 2114} {"train_loss": -6.251425743103027, "global_step": 88797, "epoch": 2114} {"train_loss": -6.193240165710449, "global_step": 88798, "epoch": 2114} {"train_loss": -6.225188255310059, "global_step": 88799, "epoch": 2114} {"train_loss": -6.2294440269470215, "global_step": 88800, "epoch": 2114} {"train_loss": -6.346927642822266, "global_step": 88801, "epoch": 2114} {"train_loss": -6.168395519256592, "global_step": 88802, "epoch": 2114} {"train_loss": -6.243867874145508, "global_step": 88803, "epoch": 2114} {"train_loss": -6.311493873596191, "global_step": 88804, "epoch": 2114} {"train_loss": -6.281144618988037, "global_step": 88805, "epoch": 2114} {"train_loss": -6.3456244468688965, "global_step": 88806, "epoch": 2114} {"train_loss": -6.310141563415527, "global_step": 88807, "epoch": 2114} {"train_loss": -6.1871337890625, "global_step": 88808, "epoch": 2114} {"train_loss": -6.199522018432617, "global_step": 88809, "epoch": 2114} {"train_loss": -6.310751914978027, "global_step": 88810, "epoch": 2114} {"train_loss": -6.247386932373047, "global_step": 88811, "epoch": 2114} {"train_loss": -6.2728471755981445, "global_step": 88812, "epoch": 2114} {"train_loss": -6.2874555587768555, "global_step": 88813, "epoch": 2114} {"train_loss": -6.1967620849609375, "global_step": 88814, "epoch": 2114} {"train_loss": -6.329129695892334, "global_step": 88815, "epoch": 2114} {"train_loss": -6.376833438873291, "global_step": 88816, "epoch": 2114} {"train_loss": -6.259807586669922, "global_step": 88817, "epoch": 2114} {"train_loss": -6.290469646453857, "global_step": 88818, "epoch": 2114} {"train_loss": -6.3273725509643555, "global_step": 88819, "epoch": 2114} {"train_loss": -6.213813781738281, "global_step": 88820, "epoch": 2114} {"train_loss": -6.17366886138916, "global_step": 88821, "epoch": 2114} {"train_loss": -6.226790428161621, "global_step": 88822, "epoch": 2114} {"train_loss": -6.323093414306641, "global_step": 88823, "epoch": 2114} {"train_loss": -6.2076263427734375, "global_step": 88824, "epoch": 2114} {"train_loss": -6.32415771484375, "global_step": 88825, "epoch": 2114} {"train_loss": -6.243427276611328, "global_step": 88826, "epoch": 2114} {"train_loss": -6.225522994995117, "global_step": 88827, "epoch": 2114} {"train_loss": -6.249462127685547, "global_step": 88828, "epoch": 2114} {"train_loss": -6.254470143999372, "global_step": 88829, "epoch": 2114, "val_loss": 62958.203125} {"train_loss": -6.317892074584961, "global_step": 88830, "epoch": 2115} {"train_loss": -6.213964462280273, "global_step": 88831, "epoch": 2115} {"train_loss": -6.2994489669799805, "global_step": 88832, "epoch": 2115} {"train_loss": -6.22456169128418, "global_step": 88833, "epoch": 2115} {"train_loss": -6.288675308227539, "global_step": 88834, "epoch": 2115} {"train_loss": -6.299752235412598, "global_step": 88835, "epoch": 2115} {"train_loss": -6.238033771514893, "global_step": 88836, "epoch": 2115} {"train_loss": -6.198576927185059, "global_step": 88837, "epoch": 2115} {"train_loss": -6.373015403747559, "global_step": 88838, "epoch": 2115} {"train_loss": -6.284929275512695, "global_step": 88839, "epoch": 2115} {"train_loss": -6.329742431640625, "global_step": 88840, "epoch": 2115} {"train_loss": -6.280161380767822, "global_step": 88841, "epoch": 2115} {"train_loss": -6.241039276123047, "global_step": 88842, "epoch": 2115} {"train_loss": -6.3314361572265625, "global_step": 88843, "epoch": 2115} {"train_loss": -6.15225887298584, "global_step": 88844, "epoch": 2115} {"train_loss": -6.375178337097168, "global_step": 88845, "epoch": 2115} {"train_loss": -6.305280685424805, "global_step": 88846, "epoch": 2115} {"train_loss": -6.366024494171143, "global_step": 88847, "epoch": 2115} {"train_loss": -6.381216049194336, "global_step": 88848, "epoch": 2115} {"train_loss": -6.25606632232666, "global_step": 88849, "epoch": 2115} {"train_loss": -6.316498756408691, "global_step": 88850, "epoch": 2115} {"train_loss": -6.2067131996154785, "global_step": 88851, "epoch": 2115} {"train_loss": -6.262204647064209, "global_step": 88852, "epoch": 2115} {"train_loss": -6.279231071472168, "global_step": 88853, "epoch": 2115} {"train_loss": -6.229696273803711, "global_step": 88854, "epoch": 2115} {"train_loss": -6.200013160705566, "global_step": 88855, "epoch": 2115} {"train_loss": -6.326167106628418, "global_step": 88856, "epoch": 2115} {"train_loss": -6.263153553009033, "global_step": 88857, "epoch": 2115} {"train_loss": -6.268915176391602, "global_step": 88858, "epoch": 2115} {"train_loss": -6.150524139404297, "global_step": 88859, "epoch": 2115} {"train_loss": -6.26035737991333, "global_step": 88860, "epoch": 2115} {"train_loss": -6.346944808959961, "global_step": 88861, "epoch": 2115} {"train_loss": -6.265292167663574, "global_step": 88862, "epoch": 2115} {"train_loss": -6.227236270904541, "global_step": 88863, "epoch": 2115} {"train_loss": -6.269327163696289, "global_step": 88864, "epoch": 2115} {"train_loss": -6.220760345458984, "global_step": 88865, "epoch": 2115} {"train_loss": -6.146042346954346, "global_step": 88866, "epoch": 2115} {"train_loss": -6.3539958000183105, "global_step": 88867, "epoch": 2115} {"train_loss": -6.147724151611328, "global_step": 88868, "epoch": 2115} {"train_loss": -6.188820838928223, "global_step": 88869, "epoch": 2115} {"train_loss": -6.250615119934082, "global_step": 88870, "epoch": 2115} {"train_loss": -6.262951487586612, "global_step": 88871, "epoch": 2115, "val_loss": 62984.6953125} {"train_loss": -6.250649452209473, "global_step": 88872, "epoch": 2116} {"train_loss": -6.261292457580566, "global_step": 88873, "epoch": 2116} {"train_loss": -6.079799652099609, "global_step": 88874, "epoch": 2116} {"train_loss": -6.1973090171813965, "global_step": 88875, "epoch": 2116} {"train_loss": -6.1421098709106445, "global_step": 88876, "epoch": 2116} {"train_loss": -6.2489728927612305, "global_step": 88877, "epoch": 2116} {"train_loss": -6.23158073425293, "global_step": 88878, "epoch": 2116} {"train_loss": -6.287955284118652, "global_step": 88879, "epoch": 2116} {"train_loss": -6.213932037353516, "global_step": 88880, "epoch": 2116} {"train_loss": -6.176472187042236, "global_step": 88881, "epoch": 2116} {"train_loss": -6.244086742401123, "global_step": 88882, "epoch": 2116} {"train_loss": -6.192016124725342, "global_step": 88883, "epoch": 2116} {"train_loss": -6.346388816833496, "global_step": 88884, "epoch": 2116} {"train_loss": -6.310791015625, "global_step": 88885, "epoch": 2116} {"train_loss": -6.223691940307617, "global_step": 88886, "epoch": 2116} {"train_loss": -6.2207489013671875, "global_step": 88887, "epoch": 2116} {"train_loss": -6.241950035095215, "global_step": 88888, "epoch": 2116} {"train_loss": -6.273519515991211, "global_step": 88889, "epoch": 2116} {"train_loss": -6.212261199951172, "global_step": 88890, "epoch": 2116} {"train_loss": -6.1904425621032715, "global_step": 88891, "epoch": 2116} {"train_loss": -6.118856906890869, "global_step": 88892, "epoch": 2116} {"train_loss": -6.103724002838135, "global_step": 88893, "epoch": 2116} {"train_loss": -6.078126430511475, "global_step": 88894, "epoch": 2116} {"train_loss": -6.17625617980957, "global_step": 88895, "epoch": 2116} {"train_loss": -6.191452980041504, "global_step": 88896, "epoch": 2116} {"train_loss": -6.284305095672607, "global_step": 88897, "epoch": 2116} {"train_loss": -6.24224853515625, "global_step": 88898, "epoch": 2116} {"train_loss": -6.150243759155273, "global_step": 88899, "epoch": 2116} {"train_loss": -6.239603042602539, "global_step": 88900, "epoch": 2116} {"train_loss": -6.2237114906311035, "global_step": 88901, "epoch": 2116} {"train_loss": -6.259376525878906, "global_step": 88902, "epoch": 2116} {"train_loss": -6.100332736968994, "global_step": 88903, "epoch": 2116} {"train_loss": -6.148551940917969, "global_step": 88904, "epoch": 2116} {"train_loss": -6.15980339050293, "global_step": 88905, "epoch": 2116} {"train_loss": -6.251863479614258, "global_step": 88906, "epoch": 2116} {"train_loss": -6.247568130493164, "global_step": 88907, "epoch": 2116} {"train_loss": -6.302640438079834, "global_step": 88908, "epoch": 2116} {"train_loss": -6.153067588806152, "global_step": 88909, "epoch": 2116} {"train_loss": -6.225946426391602, "global_step": 88910, "epoch": 2116} {"train_loss": -6.171316623687744, "global_step": 88911, "epoch": 2116} {"train_loss": -6.266049385070801, "global_step": 88912, "epoch": 2116} {"train_loss": -6.210889066968646, "global_step": 88913, "epoch": 2116, "val_loss": 63055.015625} {"train_loss": -6.302602291107178, "global_step": 88914, "epoch": 2117} {"train_loss": -6.2987060546875, "global_step": 88915, "epoch": 2117} {"train_loss": -6.265912055969238, "global_step": 88916, "epoch": 2117} {"train_loss": -6.165497779846191, "global_step": 88917, "epoch": 2117} {"train_loss": -6.173290252685547, "global_step": 88918, "epoch": 2117} {"train_loss": -6.21933650970459, "global_step": 88919, "epoch": 2117} {"train_loss": -6.243649959564209, "global_step": 88920, "epoch": 2117} {"train_loss": -6.238382339477539, "global_step": 88921, "epoch": 2117} {"train_loss": -6.252303123474121, "global_step": 88922, "epoch": 2117} {"train_loss": -6.24813985824585, "global_step": 88923, "epoch": 2117} {"train_loss": -6.291206359863281, "global_step": 88924, "epoch": 2117} {"train_loss": -6.268618583679199, "global_step": 88925, "epoch": 2117} {"train_loss": -6.160019874572754, "global_step": 88926, "epoch": 2117} {"train_loss": -6.284323692321777, "global_step": 88927, "epoch": 2117} {"train_loss": -6.326176643371582, "global_step": 88928, "epoch": 2117} {"train_loss": -6.188735485076904, "global_step": 88929, "epoch": 2117} {"train_loss": -6.337041854858398, "global_step": 88930, "epoch": 2117} {"train_loss": -6.2104620933532715, "global_step": 88931, "epoch": 2117} {"train_loss": -6.304307460784912, "global_step": 88932, "epoch": 2117} {"train_loss": -6.270003795623779, "global_step": 88933, "epoch": 2117} {"train_loss": -6.22509765625, "global_step": 88934, "epoch": 2117} {"train_loss": -6.273118495941162, "global_step": 88935, "epoch": 2117} {"train_loss": -6.290826797485352, "global_step": 88936, "epoch": 2117} {"train_loss": -6.115303039550781, "global_step": 88937, "epoch": 2117} {"train_loss": -6.166714668273926, "global_step": 88938, "epoch": 2117} {"train_loss": -6.267933368682861, "global_step": 88939, "epoch": 2117} {"train_loss": -6.233339309692383, "global_step": 88940, "epoch": 2117} {"train_loss": -6.216472625732422, "global_step": 88941, "epoch": 2117} {"train_loss": -6.3831281661987305, "global_step": 88942, "epoch": 2117} {"train_loss": -6.274507522583008, "global_step": 88943, "epoch": 2117} {"train_loss": -6.25621223449707, "global_step": 88944, "epoch": 2117} {"train_loss": -6.2688140869140625, "global_step": 88945, "epoch": 2117} {"train_loss": -6.1941118240356445, "global_step": 88946, "epoch": 2117} {"train_loss": -6.264243125915527, "global_step": 88947, "epoch": 2117} {"train_loss": -6.310220718383789, "global_step": 88948, "epoch": 2117} {"train_loss": -6.2887187004089355, "global_step": 88949, "epoch": 2117} {"train_loss": -6.255709648132324, "global_step": 88950, "epoch": 2117} {"train_loss": -6.414063453674316, "global_step": 88951, "epoch": 2117} {"train_loss": -6.211156845092773, "global_step": 88952, "epoch": 2117} {"train_loss": -6.108639240264893, "global_step": 88953, "epoch": 2117} {"train_loss": -6.301959991455078, "global_step": 88954, "epoch": 2117} {"train_loss": -6.249651590983073, "global_step": 88955, "epoch": 2117, "val_loss": 63078.984375} {"train_loss": -6.296797752380371, "global_step": 88956, "epoch": 2118} {"train_loss": -6.2554216384887695, "global_step": 88957, "epoch": 2118} {"train_loss": -6.200996398925781, "global_step": 88958, "epoch": 2118} {"train_loss": -6.222562789916992, "global_step": 88959, "epoch": 2118} {"train_loss": -6.108925819396973, "global_step": 88960, "epoch": 2118} {"train_loss": -6.247703552246094, "global_step": 88961, "epoch": 2118} {"train_loss": -6.2588300704956055, "global_step": 88962, "epoch": 2118} {"train_loss": -6.366745471954346, "global_step": 88963, "epoch": 2118} {"train_loss": -6.286561012268066, "global_step": 88964, "epoch": 2118} {"train_loss": -6.339599132537842, "global_step": 88965, "epoch": 2118} {"train_loss": -6.343474388122559, "global_step": 88966, "epoch": 2118} {"train_loss": -6.335541725158691, "global_step": 88967, "epoch": 2118} {"train_loss": -6.337296962738037, "global_step": 88968, "epoch": 2118} {"train_loss": -6.315274715423584, "global_step": 88969, "epoch": 2118} {"train_loss": -6.172127723693848, "global_step": 88970, "epoch": 2118} {"train_loss": -6.269165992736816, "global_step": 88971, "epoch": 2118} {"train_loss": -6.250091075897217, "global_step": 88972, "epoch": 2118} {"train_loss": -6.344595909118652, "global_step": 88973, "epoch": 2118} {"train_loss": -6.240627288818359, "global_step": 88974, "epoch": 2118} {"train_loss": -6.30476713180542, "global_step": 88975, "epoch": 2118} {"train_loss": -6.316313743591309, "global_step": 88976, "epoch": 2118} {"train_loss": -6.223907470703125, "global_step": 88977, "epoch": 2118} {"train_loss": -6.22947883605957, "global_step": 88978, "epoch": 2118} {"train_loss": -6.337270736694336, "global_step": 88979, "epoch": 2118} {"train_loss": -6.174627780914307, "global_step": 88980, "epoch": 2118} {"train_loss": -6.36152458190918, "global_step": 88981, "epoch": 2118} {"train_loss": -6.2948479652404785, "global_step": 88982, "epoch": 2118} {"train_loss": -6.19527530670166, "global_step": 88983, "epoch": 2118} {"train_loss": -6.281206130981445, "global_step": 88984, "epoch": 2118} {"train_loss": -6.252284049987793, "global_step": 88985, "epoch": 2118} {"train_loss": -6.224762439727783, "global_step": 88986, "epoch": 2118} {"train_loss": -6.154963970184326, "global_step": 88987, "epoch": 2118} {"train_loss": -6.239940166473389, "global_step": 88988, "epoch": 2118} {"train_loss": -6.268253803253174, "global_step": 88989, "epoch": 2118} {"train_loss": -6.261737823486328, "global_step": 88990, "epoch": 2118} {"train_loss": -6.271270751953125, "global_step": 88991, "epoch": 2118} {"train_loss": -6.210994243621826, "global_step": 88992, "epoch": 2118} {"train_loss": -6.180031776428223, "global_step": 88993, "epoch": 2118} {"train_loss": -6.265308380126953, "global_step": 88994, "epoch": 2118} {"train_loss": -6.27695894241333, "global_step": 88995, "epoch": 2118} {"train_loss": -6.211208820343018, "global_step": 88996, "epoch": 2118} {"train_loss": -6.261075224195208, "global_step": 88997, "epoch": 2118, "val_loss": 62887.703125} {"train_loss": -6.375223159790039, "global_step": 88998, "epoch": 2119} {"train_loss": -6.313324928283691, "global_step": 88999, "epoch": 2119} {"train_loss": -6.267005443572998, "global_step": 89000, "epoch": 2119} {"train_loss": -6.3463945388793945, "global_step": 89001, "epoch": 2119} {"train_loss": -6.2792816162109375, "global_step": 89002, "epoch": 2119} {"train_loss": -6.282290458679199, "global_step": 89003, "epoch": 2119} {"train_loss": -6.217297077178955, "global_step": 89004, "epoch": 2119} {"train_loss": -6.314615726470947, "global_step": 89005, "epoch": 2119} {"train_loss": -6.299036979675293, "global_step": 89006, "epoch": 2119} {"train_loss": -6.291986465454102, "global_step": 89007, "epoch": 2119} {"train_loss": -6.293083190917969, "global_step": 89008, "epoch": 2119} {"train_loss": -6.313408374786377, "global_step": 89009, "epoch": 2119} {"train_loss": -6.229403018951416, "global_step": 89010, "epoch": 2119} {"train_loss": -6.18458366394043, "global_step": 89011, "epoch": 2119} {"train_loss": -6.297027587890625, "global_step": 89012, "epoch": 2119} {"train_loss": -6.148409366607666, "global_step": 89013, "epoch": 2119} {"train_loss": -6.031787872314453, "global_step": 89014, "epoch": 2119} {"train_loss": -6.3361945152282715, "global_step": 89015, "epoch": 2119} {"train_loss": -6.232931613922119, "global_step": 89016, "epoch": 2119} {"train_loss": -6.312180519104004, "global_step": 89017, "epoch": 2119} {"train_loss": -6.170843124389648, "global_step": 89018, "epoch": 2119} {"train_loss": -6.147969722747803, "global_step": 89019, "epoch": 2119} {"train_loss": -6.264086723327637, "global_step": 89020, "epoch": 2119} {"train_loss": -6.289628028869629, "global_step": 89021, "epoch": 2119} {"train_loss": -6.248224258422852, "global_step": 89022, "epoch": 2119} {"train_loss": -6.24848747253418, "global_step": 89023, "epoch": 2119} {"train_loss": -6.23412561416626, "global_step": 89024, "epoch": 2119} {"train_loss": -6.1478753089904785, "global_step": 89025, "epoch": 2119} {"train_loss": -6.21620512008667, "global_step": 89026, "epoch": 2119} {"train_loss": -6.319787979125977, "global_step": 89027, "epoch": 2119} {"train_loss": -6.169186592102051, "global_step": 89028, "epoch": 2119} {"train_loss": -6.287814140319824, "global_step": 89029, "epoch": 2119} {"train_loss": -6.213646411895752, "global_step": 89030, "epoch": 2119} {"train_loss": -6.214097023010254, "global_step": 89031, "epoch": 2119} {"train_loss": -6.3128342628479, "global_step": 89032, "epoch": 2119} {"train_loss": -6.297090530395508, "global_step": 89033, "epoch": 2119} {"train_loss": -6.2696533203125, "global_step": 89034, "epoch": 2119} {"train_loss": -6.225428581237793, "global_step": 89035, "epoch": 2119} {"train_loss": -6.305496692657471, "global_step": 89036, "epoch": 2119} {"train_loss": -6.173070907592773, "global_step": 89037, "epoch": 2119} {"train_loss": -6.138045310974121, "global_step": 89038, "epoch": 2119} {"train_loss": -6.247764314923968, "global_step": 89039, "epoch": 2119, "val_loss": 63222.26953125} {"train_loss": -6.180173397064209, "global_step": 89040, "epoch": 2120} {"train_loss": -6.21955680847168, "global_step": 89041, "epoch": 2120} {"train_loss": -6.283116817474365, "global_step": 89042, "epoch": 2120} {"train_loss": -6.239534854888916, "global_step": 89043, "epoch": 2120} {"train_loss": -6.193005561828613, "global_step": 89044, "epoch": 2120} {"train_loss": -6.179041862487793, "global_step": 89045, "epoch": 2120} {"train_loss": -6.272048473358154, "global_step": 89046, "epoch": 2120} {"train_loss": -6.142260551452637, "global_step": 89047, "epoch": 2120} {"train_loss": -6.097594738006592, "global_step": 89048, "epoch": 2120} {"train_loss": -6.157321929931641, "global_step": 89049, "epoch": 2120} {"train_loss": -6.210183143615723, "global_step": 89050, "epoch": 2120} {"train_loss": -6.101010322570801, "global_step": 89051, "epoch": 2120} {"train_loss": -6.136562824249268, "global_step": 89052, "epoch": 2120} {"train_loss": -6.258758544921875, "global_step": 89053, "epoch": 2120} {"train_loss": -6.067086219787598, "global_step": 89054, "epoch": 2120} {"train_loss": -6.21243953704834, "global_step": 89055, "epoch": 2120} {"train_loss": -6.136051177978516, "global_step": 89056, "epoch": 2120} {"train_loss": -6.216178894042969, "global_step": 89057, "epoch": 2120} {"train_loss": -6.0961432456970215, "global_step": 89058, "epoch": 2120} {"train_loss": -6.2051591873168945, "global_step": 89059, "epoch": 2120} {"train_loss": -6.140489101409912, "global_step": 89060, "epoch": 2120} {"train_loss": -6.070354461669922, "global_step": 89061, "epoch": 2120} {"train_loss": -6.121441841125488, "global_step": 89062, "epoch": 2120} {"train_loss": -6.131422519683838, "global_step": 89063, "epoch": 2120} {"train_loss": -6.155417442321777, "global_step": 89064, "epoch": 2120} {"train_loss": -6.116087913513184, "global_step": 89065, "epoch": 2120} {"train_loss": -6.187263488769531, "global_step": 89066, "epoch": 2120} {"train_loss": -6.108758449554443, "global_step": 89067, "epoch": 2120} {"train_loss": -6.089916706085205, "global_step": 89068, "epoch": 2120} {"train_loss": -6.189120292663574, "global_step": 89069, "epoch": 2120} {"train_loss": -6.24532413482666, "global_step": 89070, "epoch": 2120} {"train_loss": -6.180865287780762, "global_step": 89071, "epoch": 2120} {"train_loss": -6.235054016113281, "global_step": 89072, "epoch": 2120} {"train_loss": -6.365139484405518, "global_step": 89073, "epoch": 2120} {"train_loss": -6.237607002258301, "global_step": 89074, "epoch": 2120} {"train_loss": -6.261795520782471, "global_step": 89075, "epoch": 2120} {"train_loss": -6.351150989532471, "global_step": 89076, "epoch": 2120} {"train_loss": -6.248781681060791, "global_step": 89077, "epoch": 2120} {"train_loss": -6.228522777557373, "global_step": 89078, "epoch": 2120} {"train_loss": -6.201738357543945, "global_step": 89079, "epoch": 2120} {"train_loss": -6.251067161560059, "global_step": 89080, "epoch": 2120} {"train_loss": -6.190359070187523, "global_step": 89081, "epoch": 2120, "val_loss": 62857.1171875} {"train_loss": -6.199989318847656, "global_step": 89082, "epoch": 2121} {"train_loss": -6.241088390350342, "global_step": 89083, "epoch": 2121} {"train_loss": -6.2040276527404785, "global_step": 89084, "epoch": 2121} {"train_loss": -6.146712779998779, "global_step": 89085, "epoch": 2121} {"train_loss": -6.29692268371582, "global_step": 89086, "epoch": 2121} {"train_loss": -6.239044666290283, "global_step": 89087, "epoch": 2121} {"train_loss": -6.353058815002441, "global_step": 89088, "epoch": 2121} {"train_loss": -6.148016929626465, "global_step": 89089, "epoch": 2121} {"train_loss": -6.158529758453369, "global_step": 89090, "epoch": 2121} {"train_loss": -6.203369140625, "global_step": 89091, "epoch": 2121} {"train_loss": -6.21858024597168, "global_step": 89092, "epoch": 2121} {"train_loss": -6.268836975097656, "global_step": 89093, "epoch": 2121} {"train_loss": -6.160520076751709, "global_step": 89094, "epoch": 2121} {"train_loss": -6.187461853027344, "global_step": 89095, "epoch": 2121} {"train_loss": -6.152499198913574, "global_step": 89096, "epoch": 2121} {"train_loss": -6.404745578765869, "global_step": 89097, "epoch": 2121} {"train_loss": -6.317599296569824, "global_step": 89098, "epoch": 2121} {"train_loss": -6.351379871368408, "global_step": 89099, "epoch": 2121} {"train_loss": -6.280762672424316, "global_step": 89100, "epoch": 2121} {"train_loss": -6.255676746368408, "global_step": 89101, "epoch": 2121} {"train_loss": -6.367565155029297, "global_step": 89102, "epoch": 2121} {"train_loss": -6.268543720245361, "global_step": 89103, "epoch": 2121} {"train_loss": -6.274617671966553, "global_step": 89104, "epoch": 2121} {"train_loss": -6.362060546875, "global_step": 89105, "epoch": 2121} {"train_loss": -6.305845260620117, "global_step": 89106, "epoch": 2121} {"train_loss": -6.204848289489746, "global_step": 89107, "epoch": 2121} {"train_loss": -6.227785110473633, "global_step": 89108, "epoch": 2121} {"train_loss": -6.287775039672852, "global_step": 89109, "epoch": 2121} {"train_loss": -6.29457950592041, "global_step": 89110, "epoch": 2121} {"train_loss": -6.312558174133301, "global_step": 89111, "epoch": 2121} {"train_loss": -6.280522346496582, "global_step": 89112, "epoch": 2121} {"train_loss": -6.374516487121582, "global_step": 89113, "epoch": 2121} {"train_loss": -6.253662109375, "global_step": 89114, "epoch": 2121} {"train_loss": -6.329830646514893, "global_step": 89115, "epoch": 2121} {"train_loss": -6.283248424530029, "global_step": 89116, "epoch": 2121} {"train_loss": -6.291097164154053, "global_step": 89117, "epoch": 2121} {"train_loss": -6.355817794799805, "global_step": 89118, "epoch": 2121} {"train_loss": -6.1967315673828125, "global_step": 89119, "epoch": 2121} {"train_loss": -6.220147609710693, "global_step": 89120, "epoch": 2121} {"train_loss": -6.322264671325684, "global_step": 89121, "epoch": 2121} {"train_loss": -6.198267459869385, "global_step": 89122, "epoch": 2121} {"train_loss": -6.26496274130685, "global_step": 89123, "epoch": 2121, "val_loss": 62999.0234375} {"train_loss": -6.28950834274292, "global_step": 89124, "epoch": 2122} {"train_loss": -6.250577926635742, "global_step": 89125, "epoch": 2122} {"train_loss": -6.281022071838379, "global_step": 89126, "epoch": 2122} {"train_loss": -6.197161674499512, "global_step": 89127, "epoch": 2122} {"train_loss": -6.295236587524414, "global_step": 89128, "epoch": 2122} {"train_loss": -6.350976467132568, "global_step": 89129, "epoch": 2122} {"train_loss": -6.225280284881592, "global_step": 89130, "epoch": 2122} {"train_loss": -6.226531028747559, "global_step": 89131, "epoch": 2122} {"train_loss": -6.1644134521484375, "global_step": 89132, "epoch": 2122} {"train_loss": -6.171063423156738, "global_step": 89133, "epoch": 2122} {"train_loss": -6.230206489562988, "global_step": 89134, "epoch": 2122} {"train_loss": -6.185966968536377, "global_step": 89135, "epoch": 2122} {"train_loss": -6.138128280639648, "global_step": 89136, "epoch": 2122} {"train_loss": -6.239317417144775, "global_step": 89137, "epoch": 2122} {"train_loss": -6.288952350616455, "global_step": 89138, "epoch": 2122} {"train_loss": -6.112038612365723, "global_step": 89139, "epoch": 2122} {"train_loss": -6.17573356628418, "global_step": 89140, "epoch": 2122} {"train_loss": -6.114221572875977, "global_step": 89141, "epoch": 2122} {"train_loss": -6.169866561889648, "global_step": 89142, "epoch": 2122} {"train_loss": -6.075589179992676, "global_step": 89143, "epoch": 2122} {"train_loss": -6.148329734802246, "global_step": 89144, "epoch": 2122} {"train_loss": -6.135599136352539, "global_step": 89145, "epoch": 2122} {"train_loss": -6.252133369445801, "global_step": 89146, "epoch": 2122} {"train_loss": -6.01718807220459, "global_step": 89147, "epoch": 2122} {"train_loss": -6.281593322753906, "global_step": 89148, "epoch": 2122} {"train_loss": -6.1758904457092285, "global_step": 89149, "epoch": 2122} {"train_loss": -6.138477325439453, "global_step": 89150, "epoch": 2122} {"train_loss": -6.246707439422607, "global_step": 89151, "epoch": 2122} {"train_loss": -6.212599754333496, "global_step": 89152, "epoch": 2122} {"train_loss": -6.150907516479492, "global_step": 89153, "epoch": 2122} {"train_loss": -6.15186882019043, "global_step": 89154, "epoch": 2122} {"train_loss": -6.237235069274902, "global_step": 89155, "epoch": 2122} {"train_loss": -6.2131805419921875, "global_step": 89156, "epoch": 2122} {"train_loss": -6.263174057006836, "global_step": 89157, "epoch": 2122} {"train_loss": -6.25154447555542, "global_step": 89158, "epoch": 2122} {"train_loss": -6.267117500305176, "global_step": 89159, "epoch": 2122} {"train_loss": -6.3042402267456055, "global_step": 89160, "epoch": 2122} {"train_loss": -6.175938606262207, "global_step": 89161, "epoch": 2122} {"train_loss": -6.351616859436035, "global_step": 89162, "epoch": 2122} {"train_loss": -6.219415187835693, "global_step": 89163, "epoch": 2122} {"train_loss": -6.342230796813965, "global_step": 89164, "epoch": 2122} {"train_loss": -6.214051314762661, "global_step": 89165, "epoch": 2122, "val_loss": 62900.67578125} {"train_loss": -6.306172847747803, "global_step": 89166, "epoch": 2123} {"train_loss": -6.297706604003906, "global_step": 89167, "epoch": 2123} {"train_loss": -6.259337425231934, "global_step": 89168, "epoch": 2123} {"train_loss": -6.182318687438965, "global_step": 89169, "epoch": 2123} {"train_loss": -6.330867767333984, "global_step": 89170, "epoch": 2123} {"train_loss": -6.275420188903809, "global_step": 89171, "epoch": 2123} {"train_loss": -6.198365211486816, "global_step": 89172, "epoch": 2123} {"train_loss": -6.259788513183594, "global_step": 89173, "epoch": 2123} {"train_loss": -6.22163200378418, "global_step": 89174, "epoch": 2123} {"train_loss": -6.328247547149658, "global_step": 89175, "epoch": 2123} {"train_loss": -6.134250640869141, "global_step": 89176, "epoch": 2123} {"train_loss": -6.264676094055176, "global_step": 89177, "epoch": 2123} {"train_loss": -6.178814888000488, "global_step": 89178, "epoch": 2123} {"train_loss": -6.309011936187744, "global_step": 89179, "epoch": 2123} {"train_loss": -6.323055267333984, "global_step": 89180, "epoch": 2123} {"train_loss": -6.28605318069458, "global_step": 89181, "epoch": 2123} {"train_loss": -6.209197998046875, "global_step": 89182, "epoch": 2123} {"train_loss": -6.194250583648682, "global_step": 89183, "epoch": 2123} {"train_loss": -6.200457572937012, "global_step": 89184, "epoch": 2123} {"train_loss": -6.230048179626465, "global_step": 89185, "epoch": 2123} {"train_loss": -6.158974647521973, "global_step": 89186, "epoch": 2123} {"train_loss": -6.165957450866699, "global_step": 89187, "epoch": 2123} {"train_loss": -6.1942338943481445, "global_step": 89188, "epoch": 2123} {"train_loss": -6.206064224243164, "global_step": 89189, "epoch": 2123} {"train_loss": -6.238988399505615, "global_step": 89190, "epoch": 2123} {"train_loss": -6.250079154968262, "global_step": 89191, "epoch": 2123} {"train_loss": -6.217596054077148, "global_step": 89192, "epoch": 2123} {"train_loss": -6.203815460205078, "global_step": 89193, "epoch": 2123} {"train_loss": -6.249875068664551, "global_step": 89194, "epoch": 2123} {"train_loss": -6.049084186553955, "global_step": 89195, "epoch": 2123} {"train_loss": -6.2559051513671875, "global_step": 89196, "epoch": 2123} {"train_loss": -6.166613578796387, "global_step": 89197, "epoch": 2123} {"train_loss": -6.201171875, "global_step": 89198, "epoch": 2123} {"train_loss": -6.201799392700195, "global_step": 89199, "epoch": 2123} {"train_loss": -6.213396072387695, "global_step": 89200, "epoch": 2123} {"train_loss": -6.251047611236572, "global_step": 89201, "epoch": 2123} {"train_loss": -6.307283401489258, "global_step": 89202, "epoch": 2123} {"train_loss": -6.303472518920898, "global_step": 89203, "epoch": 2123} {"train_loss": -6.148990631103516, "global_step": 89204, "epoch": 2123} {"train_loss": -6.1398162841796875, "global_step": 89205, "epoch": 2123} {"train_loss": -6.235947608947754, "global_step": 89206, "epoch": 2123} {"train_loss": -6.230921075457618, "global_step": 89207, "epoch": 2123, "val_loss": 63049.4296875} {"train_loss": -6.162357330322266, "global_step": 89208, "epoch": 2124} {"train_loss": -6.378534317016602, "global_step": 89209, "epoch": 2124} {"train_loss": -6.176178932189941, "global_step": 89210, "epoch": 2124} {"train_loss": -6.0918402671813965, "global_step": 89211, "epoch": 2124} {"train_loss": -6.374506950378418, "global_step": 89212, "epoch": 2124} {"train_loss": -6.0851616859436035, "global_step": 89213, "epoch": 2124} {"train_loss": -6.204334259033203, "global_step": 89214, "epoch": 2124} {"train_loss": -6.213793754577637, "global_step": 89215, "epoch": 2124} {"train_loss": -6.0466790199279785, "global_step": 89216, "epoch": 2124} {"train_loss": -6.297709941864014, "global_step": 89217, "epoch": 2124} {"train_loss": -6.110739707946777, "global_step": 89218, "epoch": 2124} {"train_loss": -6.133977890014648, "global_step": 89219, "epoch": 2124} {"train_loss": -6.127923011779785, "global_step": 89220, "epoch": 2124} {"train_loss": -6.230774879455566, "global_step": 89221, "epoch": 2124} {"train_loss": -6.128435134887695, "global_step": 89222, "epoch": 2124} {"train_loss": -6.1629486083984375, "global_step": 89223, "epoch": 2124} {"train_loss": -6.193944931030273, "global_step": 89224, "epoch": 2124} {"train_loss": -6.234859943389893, "global_step": 89225, "epoch": 2124} {"train_loss": -6.322687149047852, "global_step": 89226, "epoch": 2124} {"train_loss": -6.1792802810668945, "global_step": 89227, "epoch": 2124} {"train_loss": -6.311828136444092, "global_step": 89228, "epoch": 2124} {"train_loss": -6.1164679527282715, "global_step": 89229, "epoch": 2124} {"train_loss": -6.307723045349121, "global_step": 89230, "epoch": 2124} {"train_loss": -6.329434871673584, "global_step": 89231, "epoch": 2124} {"train_loss": -6.281284332275391, "global_step": 89232, "epoch": 2124} {"train_loss": -6.212176322937012, "global_step": 89233, "epoch": 2124} {"train_loss": -6.362749099731445, "global_step": 89234, "epoch": 2124} {"train_loss": -6.316835403442383, "global_step": 89235, "epoch": 2124} {"train_loss": -6.234612464904785, "global_step": 89236, "epoch": 2124} {"train_loss": -6.188133239746094, "global_step": 89237, "epoch": 2124} {"train_loss": -6.324799537658691, "global_step": 89238, "epoch": 2124} {"train_loss": -6.198883533477783, "global_step": 89239, "epoch": 2124} {"train_loss": -6.265575408935547, "global_step": 89240, "epoch": 2124} {"train_loss": -6.211927890777588, "global_step": 89241, "epoch": 2124} {"train_loss": -6.232179641723633, "global_step": 89242, "epoch": 2124} {"train_loss": -6.248612403869629, "global_step": 89243, "epoch": 2124} {"train_loss": -6.2218122482299805, "global_step": 89244, "epoch": 2124} {"train_loss": -6.303347587585449, "global_step": 89245, "epoch": 2124} {"train_loss": -6.197811603546143, "global_step": 89246, "epoch": 2124} {"train_loss": -6.313081741333008, "global_step": 89247, "epoch": 2124} {"train_loss": -6.228165149688721, "global_step": 89248, "epoch": 2124} {"train_loss": -6.227005935850597, "global_step": 89249, "epoch": 2124, "val_loss": 63050.4453125} {"train_loss": -6.350369453430176, "global_step": 89250, "epoch": 2125} {"train_loss": -6.278822898864746, "global_step": 89251, "epoch": 2125} {"train_loss": -6.337488174438477, "global_step": 89252, "epoch": 2125} {"train_loss": -6.185554504394531, "global_step": 89253, "epoch": 2125} {"train_loss": -6.293203353881836, "global_step": 89254, "epoch": 2125} {"train_loss": -6.275397300720215, "global_step": 89255, "epoch": 2125} {"train_loss": -6.094637870788574, "global_step": 89256, "epoch": 2125} {"train_loss": -6.347768783569336, "global_step": 89257, "epoch": 2125} {"train_loss": -6.176240921020508, "global_step": 89258, "epoch": 2125} {"train_loss": -6.0915913581848145, "global_step": 89259, "epoch": 2125} {"train_loss": -6.251386642456055, "global_step": 89260, "epoch": 2125} {"train_loss": -6.177549839019775, "global_step": 89261, "epoch": 2125} {"train_loss": -6.315467834472656, "global_step": 89262, "epoch": 2125} {"train_loss": -6.203675270080566, "global_step": 89263, "epoch": 2125} {"train_loss": -6.164920806884766, "global_step": 89264, "epoch": 2125} {"train_loss": -6.306008815765381, "global_step": 89265, "epoch": 2125} {"train_loss": -6.184764862060547, "global_step": 89266, "epoch": 2125} {"train_loss": -6.156027793884277, "global_step": 89267, "epoch": 2125} {"train_loss": -5.97702693939209, "global_step": 89268, "epoch": 2125} {"train_loss": -6.200916767120361, "global_step": 89269, "epoch": 2125} {"train_loss": -6.115296363830566, "global_step": 89270, "epoch": 2125} {"train_loss": -6.111063003540039, "global_step": 89271, "epoch": 2125} {"train_loss": -6.15907096862793, "global_step": 89272, "epoch": 2125} {"train_loss": -6.176277160644531, "global_step": 89273, "epoch": 2125} {"train_loss": -6.087717056274414, "global_step": 89274, "epoch": 2125} {"train_loss": -6.273809432983398, "global_step": 89275, "epoch": 2125} {"train_loss": -6.0999250411987305, "global_step": 89276, "epoch": 2125} {"train_loss": -6.079127311706543, "global_step": 89277, "epoch": 2125} {"train_loss": -6.068326473236084, "global_step": 89278, "epoch": 2125} {"train_loss": -6.243765830993652, "global_step": 89279, "epoch": 2125} {"train_loss": -6.141051292419434, "global_step": 89280, "epoch": 2125} {"train_loss": -6.185603141784668, "global_step": 89281, "epoch": 2125} {"train_loss": -6.048683166503906, "global_step": 89282, "epoch": 2125} {"train_loss": -6.179581642150879, "global_step": 89283, "epoch": 2125} {"train_loss": -6.187346935272217, "global_step": 89284, "epoch": 2125} {"train_loss": -6.178468227386475, "global_step": 89285, "epoch": 2125} {"train_loss": -5.964113235473633, "global_step": 89286, "epoch": 2125} {"train_loss": -6.233184814453125, "global_step": 89287, "epoch": 2125} {"train_loss": -6.182767868041992, "global_step": 89288, "epoch": 2125} {"train_loss": -6.263592720031738, "global_step": 89289, "epoch": 2125} {"train_loss": -6.0420451164245605, "global_step": 89290, "epoch": 2125} {"train_loss": -6.180081810270037, "global_step": 89291, "epoch": 2125, "val_loss": 63451.06640625} {"train_loss": -6.161597728729248, "global_step": 89292, "epoch": 2126} {"train_loss": -6.299150466918945, "global_step": 89293, "epoch": 2126} {"train_loss": -6.057703971862793, "global_step": 89294, "epoch": 2126} {"train_loss": -6.239556312561035, "global_step": 89295, "epoch": 2126} {"train_loss": -6.025117874145508, "global_step": 89296, "epoch": 2126} {"train_loss": -6.186716079711914, "global_step": 89297, "epoch": 2126} {"train_loss": -6.117325782775879, "global_step": 89298, "epoch": 2126} {"train_loss": -6.2567949295043945, "global_step": 89299, "epoch": 2126} {"train_loss": -6.177910804748535, "global_step": 89300, "epoch": 2126} {"train_loss": -6.237968444824219, "global_step": 89301, "epoch": 2126} {"train_loss": -6.248991966247559, "global_step": 89302, "epoch": 2126} {"train_loss": -6.104974746704102, "global_step": 89303, "epoch": 2126} {"train_loss": -6.155243396759033, "global_step": 89304, "epoch": 2126} {"train_loss": -6.128138542175293, "global_step": 89305, "epoch": 2126} {"train_loss": -6.187017440795898, "global_step": 89306, "epoch": 2126} {"train_loss": -6.159185409545898, "global_step": 89307, "epoch": 2126} {"train_loss": -6.158630847930908, "global_step": 89308, "epoch": 2126} {"train_loss": -6.205348968505859, "global_step": 89309, "epoch": 2126} {"train_loss": -6.179065704345703, "global_step": 89310, "epoch": 2126} {"train_loss": -6.302819728851318, "global_step": 89311, "epoch": 2126} {"train_loss": -6.400117874145508, "global_step": 89312, "epoch": 2126} {"train_loss": -6.280608177185059, "global_step": 89313, "epoch": 2126} {"train_loss": -6.338671684265137, "global_step": 89314, "epoch": 2126} {"train_loss": -6.299022674560547, "global_step": 89315, "epoch": 2126} {"train_loss": -6.342058181762695, "global_step": 89316, "epoch": 2126} {"train_loss": -6.294458389282227, "global_step": 89317, "epoch": 2126} {"train_loss": -6.2614850997924805, "global_step": 89318, "epoch": 2126} {"train_loss": -6.192543983459473, "global_step": 89319, "epoch": 2126} {"train_loss": -6.337132930755615, "global_step": 89320, "epoch": 2126} {"train_loss": -6.371786117553711, "global_step": 89321, "epoch": 2126} {"train_loss": -6.25546407699585, "global_step": 89322, "epoch": 2126} {"train_loss": -6.287776947021484, "global_step": 89323, "epoch": 2126} {"train_loss": -6.313667297363281, "global_step": 89324, "epoch": 2126} {"train_loss": -6.305622100830078, "global_step": 89325, "epoch": 2126} {"train_loss": -6.29414701461792, "global_step": 89326, "epoch": 2126} {"train_loss": -6.248831748962402, "global_step": 89327, "epoch": 2126} {"train_loss": -6.2906928062438965, "global_step": 89328, "epoch": 2126} {"train_loss": -6.222301483154297, "global_step": 89329, "epoch": 2126} {"train_loss": -6.2399492263793945, "global_step": 89330, "epoch": 2126} {"train_loss": -6.174108982086182, "global_step": 89331, "epoch": 2126} {"train_loss": -6.198670864105225, "global_step": 89332, "epoch": 2126} {"train_loss": -6.235207500911894, "global_step": 89333, "epoch": 2126, "val_loss": 63086.08984375} {"train_loss": -6.217336654663086, "global_step": 89334, "epoch": 2127} {"train_loss": -6.318507671356201, "global_step": 89335, "epoch": 2127} {"train_loss": -6.293185234069824, "global_step": 89336, "epoch": 2127} {"train_loss": -6.155004501342773, "global_step": 89337, "epoch": 2127} {"train_loss": -6.280412673950195, "global_step": 89338, "epoch": 2127} {"train_loss": -6.303401947021484, "global_step": 89339, "epoch": 2127} {"train_loss": -6.3065595626831055, "global_step": 89340, "epoch": 2127} {"train_loss": -6.291184425354004, "global_step": 89341, "epoch": 2127} {"train_loss": -6.237442970275879, "global_step": 89342, "epoch": 2127} {"train_loss": -6.3085832595825195, "global_step": 89343, "epoch": 2127} {"train_loss": -6.307185173034668, "global_step": 89344, "epoch": 2127} {"train_loss": -6.255782604217529, "global_step": 89345, "epoch": 2127} {"train_loss": -6.047649383544922, "global_step": 89346, "epoch": 2127} {"train_loss": -6.318324089050293, "global_step": 89347, "epoch": 2127} {"train_loss": -6.210437774658203, "global_step": 89348, "epoch": 2127} {"train_loss": -6.255397796630859, "global_step": 89349, "epoch": 2127} {"train_loss": -6.256025791168213, "global_step": 89350, "epoch": 2127} {"train_loss": -6.127187728881836, "global_step": 89351, "epoch": 2127} {"train_loss": -6.316347122192383, "global_step": 89352, "epoch": 2127} {"train_loss": -6.156400680541992, "global_step": 89353, "epoch": 2127} {"train_loss": -6.210744857788086, "global_step": 89354, "epoch": 2127} {"train_loss": -6.28623104095459, "global_step": 89355, "epoch": 2127} {"train_loss": -6.2356343269348145, "global_step": 89356, "epoch": 2127} {"train_loss": -6.203437805175781, "global_step": 89357, "epoch": 2127} {"train_loss": -6.212003707885742, "global_step": 89358, "epoch": 2127} {"train_loss": -6.3064470291137695, "global_step": 89359, "epoch": 2127} {"train_loss": -6.212814807891846, "global_step": 89360, "epoch": 2127} {"train_loss": -6.329580307006836, "global_step": 89361, "epoch": 2127} {"train_loss": -6.228128433227539, "global_step": 89362, "epoch": 2127} {"train_loss": -6.130038261413574, "global_step": 89363, "epoch": 2127} {"train_loss": -6.305347442626953, "global_step": 89364, "epoch": 2127} {"train_loss": -6.249168395996094, "global_step": 89365, "epoch": 2127} {"train_loss": -6.236321449279785, "global_step": 89366, "epoch": 2127} {"train_loss": -6.230259418487549, "global_step": 89367, "epoch": 2127} {"train_loss": -6.158820152282715, "global_step": 89368, "epoch": 2127} {"train_loss": -6.364453315734863, "global_step": 89369, "epoch": 2127} {"train_loss": -6.170009136199951, "global_step": 89370, "epoch": 2127} {"train_loss": -6.283557891845703, "global_step": 89371, "epoch": 2127} {"train_loss": -6.190811634063721, "global_step": 89372, "epoch": 2127} {"train_loss": -6.1697187423706055, "global_step": 89373, "epoch": 2127} {"train_loss": -6.208417892456055, "global_step": 89374, "epoch": 2127} {"train_loss": -6.237974303109305, "global_step": 89375, "epoch": 2127, "val_loss": 63090.15234375} {"train_loss": -6.21749210357666, "global_step": 89376, "epoch": 2128} {"train_loss": -6.32047176361084, "global_step": 89377, "epoch": 2128} {"train_loss": -6.194881916046143, "global_step": 89378, "epoch": 2128} {"train_loss": -6.223931789398193, "global_step": 89379, "epoch": 2128} {"train_loss": -6.255336761474609, "global_step": 89380, "epoch": 2128} {"train_loss": -6.258484840393066, "global_step": 89381, "epoch": 2128} {"train_loss": -6.311118125915527, "global_step": 89382, "epoch": 2128} {"train_loss": -6.371540069580078, "global_step": 89383, "epoch": 2128} {"train_loss": -6.218444347381592, "global_step": 89384, "epoch": 2128} {"train_loss": -6.2190327644348145, "global_step": 89385, "epoch": 2128} {"train_loss": -6.311248779296875, "global_step": 89386, "epoch": 2128} {"train_loss": -6.342109680175781, "global_step": 89387, "epoch": 2128} {"train_loss": -6.219291687011719, "global_step": 89388, "epoch": 2128} {"train_loss": -6.236781120300293, "global_step": 89389, "epoch": 2128} {"train_loss": -6.187021255493164, "global_step": 89390, "epoch": 2128} {"train_loss": -6.358868598937988, "global_step": 89391, "epoch": 2128} {"train_loss": -6.088278770446777, "global_step": 89392, "epoch": 2128} {"train_loss": -6.263400077819824, "global_step": 89393, "epoch": 2128} {"train_loss": -6.232011795043945, "global_step": 89394, "epoch": 2128} {"train_loss": -6.141726493835449, "global_step": 89395, "epoch": 2128} {"train_loss": -6.153217315673828, "global_step": 89396, "epoch": 2128} {"train_loss": -6.23654842376709, "global_step": 89397, "epoch": 2128} {"train_loss": -6.273171901702881, "global_step": 89398, "epoch": 2128} {"train_loss": -6.315179347991943, "global_step": 89399, "epoch": 2128} {"train_loss": -6.276922225952148, "global_step": 89400, "epoch": 2128} {"train_loss": -6.245298862457275, "global_step": 89401, "epoch": 2128} {"train_loss": -6.252704620361328, "global_step": 89402, "epoch": 2128} {"train_loss": -6.203685283660889, "global_step": 89403, "epoch": 2128} {"train_loss": -6.242008209228516, "global_step": 89404, "epoch": 2128} {"train_loss": -6.331406116485596, "global_step": 89405, "epoch": 2128} {"train_loss": -6.109139442443848, "global_step": 89406, "epoch": 2128} {"train_loss": -6.108798980712891, "global_step": 89407, "epoch": 2128} {"train_loss": -6.19287109375, "global_step": 89408, "epoch": 2128} {"train_loss": -6.180127143859863, "global_step": 89409, "epoch": 2128} {"train_loss": -6.184179306030273, "global_step": 89410, "epoch": 2128} {"train_loss": -6.072398662567139, "global_step": 89411, "epoch": 2128} {"train_loss": -6.213972091674805, "global_step": 89412, "epoch": 2128} {"train_loss": -6.0737810134887695, "global_step": 89413, "epoch": 2128} {"train_loss": -6.305424690246582, "global_step": 89414, "epoch": 2128} {"train_loss": -6.164440631866455, "global_step": 89415, "epoch": 2128} {"train_loss": -6.294126987457275, "global_step": 89416, "epoch": 2128} {"train_loss": -6.228023858297439, "global_step": 89417, "epoch": 2128, "val_loss": 63239.33203125} {"train_loss": -6.203179359436035, "global_step": 89418, "epoch": 2129} {"train_loss": -6.2096476554870605, "global_step": 89419, "epoch": 2129} {"train_loss": -6.1871867179870605, "global_step": 89420, "epoch": 2129} {"train_loss": -6.324283123016357, "global_step": 89421, "epoch": 2129} {"train_loss": -6.286594867706299, "global_step": 89422, "epoch": 2129} {"train_loss": -6.300958156585693, "global_step": 89423, "epoch": 2129} {"train_loss": -6.313319206237793, "global_step": 89424, "epoch": 2129} {"train_loss": -6.341895580291748, "global_step": 89425, "epoch": 2129} {"train_loss": -6.33327054977417, "global_step": 89426, "epoch": 2129} {"train_loss": -6.3996453285217285, "global_step": 89427, "epoch": 2129} {"train_loss": -6.234121322631836, "global_step": 89428, "epoch": 2129} {"train_loss": -6.309341907501221, "global_step": 89429, "epoch": 2129} {"train_loss": -6.29995059967041, "global_step": 89430, "epoch": 2129} {"train_loss": -6.323184013366699, "global_step": 89431, "epoch": 2129} {"train_loss": -6.3187150955200195, "global_step": 89432, "epoch": 2129} {"train_loss": -6.231451034545898, "global_step": 89433, "epoch": 2129} {"train_loss": -6.134164333343506, "global_step": 89434, "epoch": 2129} {"train_loss": -6.24372673034668, "global_step": 89435, "epoch": 2129} {"train_loss": -6.343845367431641, "global_step": 89436, "epoch": 2129} {"train_loss": -6.237238883972168, "global_step": 89437, "epoch": 2129} {"train_loss": -6.31508731842041, "global_step": 89438, "epoch": 2129} {"train_loss": -6.279995441436768, "global_step": 89439, "epoch": 2129} {"train_loss": -6.399317741394043, "global_step": 89440, "epoch": 2129} {"train_loss": -6.280020713806152, "global_step": 89441, "epoch": 2129} {"train_loss": -6.295840263366699, "global_step": 89442, "epoch": 2129} {"train_loss": -6.196112632751465, "global_step": 89443, "epoch": 2129} {"train_loss": -6.302971363067627, "global_step": 89444, "epoch": 2129} {"train_loss": -6.244441986083984, "global_step": 89445, "epoch": 2129} {"train_loss": -6.257671356201172, "global_step": 89446, "epoch": 2129} {"train_loss": -6.226263999938965, "global_step": 89447, "epoch": 2129} {"train_loss": -6.169739723205566, "global_step": 89448, "epoch": 2129} {"train_loss": -6.245668411254883, "global_step": 89449, "epoch": 2129} {"train_loss": -6.259890079498291, "global_step": 89450, "epoch": 2129} {"train_loss": -6.298284530639648, "global_step": 89451, "epoch": 2129} {"train_loss": -6.238615989685059, "global_step": 89452, "epoch": 2129} {"train_loss": -6.229714870452881, "global_step": 89453, "epoch": 2129} {"train_loss": -6.279766082763672, "global_step": 89454, "epoch": 2129} {"train_loss": -6.166834831237793, "global_step": 89455, "epoch": 2129} {"train_loss": -6.3608551025390625, "global_step": 89456, "epoch": 2129} {"train_loss": -6.267324447631836, "global_step": 89457, "epoch": 2129} {"train_loss": -6.200457572937012, "global_step": 89458, "epoch": 2129} {"train_loss": -6.2687725112551735, "global_step": 89459, "epoch": 2129, "val_loss": 63248.23046875} {"train_loss": -6.276733875274658, "global_step": 89460, "epoch": 2130} {"train_loss": -6.228668212890625, "global_step": 89461, "epoch": 2130} {"train_loss": -6.235302925109863, "global_step": 89462, "epoch": 2130} {"train_loss": -6.271049976348877, "global_step": 89463, "epoch": 2130} {"train_loss": -6.286498069763184, "global_step": 89464, "epoch": 2130} {"train_loss": -6.232973098754883, "global_step": 89465, "epoch": 2130} {"train_loss": -6.275539875030518, "global_step": 89466, "epoch": 2130} {"train_loss": -6.357269763946533, "global_step": 89467, "epoch": 2130} {"train_loss": -6.1665568351745605, "global_step": 89468, "epoch": 2130} {"train_loss": -6.219383716583252, "global_step": 89469, "epoch": 2130} {"train_loss": -6.321552276611328, "global_step": 89470, "epoch": 2130} {"train_loss": -6.211681842803955, "global_step": 89471, "epoch": 2130} {"train_loss": -6.256866931915283, "global_step": 89472, "epoch": 2130} {"train_loss": -6.190496921539307, "global_step": 89473, "epoch": 2130} {"train_loss": -6.184265613555908, "global_step": 89474, "epoch": 2130} {"train_loss": -6.303912162780762, "global_step": 89475, "epoch": 2130} {"train_loss": -6.3230719566345215, "global_step": 89476, "epoch": 2130} {"train_loss": -6.317273139953613, "global_step": 89477, "epoch": 2130} {"train_loss": -6.335622787475586, "global_step": 89478, "epoch": 2130} {"train_loss": -6.270451068878174, "global_step": 89479, "epoch": 2130} {"train_loss": -6.3082075119018555, "global_step": 89480, "epoch": 2130} {"train_loss": -6.282553672790527, "global_step": 89481, "epoch": 2130} {"train_loss": -6.187572479248047, "global_step": 89482, "epoch": 2130} {"train_loss": -6.3777923583984375, "global_step": 89483, "epoch": 2130} {"train_loss": -6.2493577003479, "global_step": 89484, "epoch": 2130} {"train_loss": -6.319305419921875, "global_step": 89485, "epoch": 2130} {"train_loss": -6.2447428703308105, "global_step": 89486, "epoch": 2130} {"train_loss": -6.237988471984863, "global_step": 89487, "epoch": 2130} {"train_loss": -6.270636081695557, "global_step": 89488, "epoch": 2130} {"train_loss": -6.271352767944336, "global_step": 89489, "epoch": 2130} {"train_loss": -6.279697418212891, "global_step": 89490, "epoch": 2130} {"train_loss": -6.23239278793335, "global_step": 89491, "epoch": 2130} {"train_loss": -6.210963249206543, "global_step": 89492, "epoch": 2130} {"train_loss": -6.332396507263184, "global_step": 89493, "epoch": 2130} {"train_loss": -6.236445426940918, "global_step": 89494, "epoch": 2130} {"train_loss": -6.196107864379883, "global_step": 89495, "epoch": 2130} {"train_loss": -6.319246292114258, "global_step": 89496, "epoch": 2130} {"train_loss": -6.344674110412598, "global_step": 89497, "epoch": 2130} {"train_loss": -6.318001747131348, "global_step": 89498, "epoch": 2130} {"train_loss": -6.179679870605469, "global_step": 89499, "epoch": 2130} {"train_loss": -6.319676399230957, "global_step": 89500, "epoch": 2130} {"train_loss": -6.268599930263701, "global_step": 89501, "epoch": 2130, "val_loss": 63071.83984375} {"train_loss": -6.288416862487793, "global_step": 89502, "epoch": 2131} {"train_loss": -6.236795425415039, "global_step": 89503, "epoch": 2131} {"train_loss": -6.283282279968262, "global_step": 89504, "epoch": 2131} {"train_loss": -6.273505210876465, "global_step": 89505, "epoch": 2131} {"train_loss": -6.27044677734375, "global_step": 89506, "epoch": 2131} {"train_loss": -6.185056686401367, "global_step": 89507, "epoch": 2131} {"train_loss": -6.234704971313477, "global_step": 89508, "epoch": 2131} {"train_loss": -6.322247505187988, "global_step": 89509, "epoch": 2131} {"train_loss": -6.260369777679443, "global_step": 89510, "epoch": 2131} {"train_loss": -6.195675849914551, "global_step": 89511, "epoch": 2131} {"train_loss": -6.265276908874512, "global_step": 89512, "epoch": 2131} {"train_loss": -6.222905158996582, "global_step": 89513, "epoch": 2131} {"train_loss": -6.204331398010254, "global_step": 89514, "epoch": 2131} {"train_loss": -6.388883590698242, "global_step": 89515, "epoch": 2131} {"train_loss": -6.181060791015625, "global_step": 89516, "epoch": 2131} {"train_loss": -6.272843837738037, "global_step": 89517, "epoch": 2131} {"train_loss": -6.241808891296387, "global_step": 89518, "epoch": 2131} {"train_loss": -6.349249839782715, "global_step": 89519, "epoch": 2131} {"train_loss": -6.058758735656738, "global_step": 89520, "epoch": 2131} {"train_loss": -6.270149230957031, "global_step": 89521, "epoch": 2131} {"train_loss": -6.261166572570801, "global_step": 89522, "epoch": 2131} {"train_loss": -6.091802597045898, "global_step": 89523, "epoch": 2131} {"train_loss": -6.326531887054443, "global_step": 89524, "epoch": 2131} {"train_loss": -6.283718109130859, "global_step": 89525, "epoch": 2131} {"train_loss": -6.166407108306885, "global_step": 89526, "epoch": 2131} {"train_loss": -6.16556453704834, "global_step": 89527, "epoch": 2131} {"train_loss": -6.230382919311523, "global_step": 89528, "epoch": 2131} {"train_loss": -6.231350898742676, "global_step": 89529, "epoch": 2131} {"train_loss": -6.129795551300049, "global_step": 89530, "epoch": 2131} {"train_loss": -6.161187171936035, "global_step": 89531, "epoch": 2131} {"train_loss": -6.200307846069336, "global_step": 89532, "epoch": 2131} {"train_loss": -6.280271530151367, "global_step": 89533, "epoch": 2131} {"train_loss": -6.143248558044434, "global_step": 89534, "epoch": 2131} {"train_loss": -6.281765937805176, "global_step": 89535, "epoch": 2131} {"train_loss": -6.266867637634277, "global_step": 89536, "epoch": 2131} {"train_loss": -6.277582168579102, "global_step": 89537, "epoch": 2131} {"train_loss": -6.291688919067383, "global_step": 89538, "epoch": 2131} {"train_loss": -6.238876819610596, "global_step": 89539, "epoch": 2131} {"train_loss": -6.221804618835449, "global_step": 89540, "epoch": 2131} {"train_loss": -6.282060623168945, "global_step": 89541, "epoch": 2131} {"train_loss": -6.282976150512695, "global_step": 89542, "epoch": 2131} {"train_loss": -6.240828900110154, "global_step": 89543, "epoch": 2131, "val_loss": 63084.27734375} {"train_loss": -6.310638427734375, "global_step": 89544, "epoch": 2132} {"train_loss": -6.262158393859863, "global_step": 89545, "epoch": 2132} {"train_loss": -6.244168758392334, "global_step": 89546, "epoch": 2132} {"train_loss": -6.2000579833984375, "global_step": 89547, "epoch": 2132} {"train_loss": -6.237364292144775, "global_step": 89548, "epoch": 2132} {"train_loss": -6.31998348236084, "global_step": 89549, "epoch": 2132} {"train_loss": -6.256987571716309, "global_step": 89550, "epoch": 2132} {"train_loss": -6.31771183013916, "global_step": 89551, "epoch": 2132} {"train_loss": -6.224767684936523, "global_step": 89552, "epoch": 2132} {"train_loss": -6.177875995635986, "global_step": 89553, "epoch": 2132} {"train_loss": -6.183337211608887, "global_step": 89554, "epoch": 2132} {"train_loss": -6.227298736572266, "global_step": 89555, "epoch": 2132} {"train_loss": -6.381110191345215, "global_step": 89556, "epoch": 2132} {"train_loss": -6.125028610229492, "global_step": 89557, "epoch": 2132} {"train_loss": -6.14997673034668, "global_step": 89558, "epoch": 2132} {"train_loss": -6.2041916847229, "global_step": 89559, "epoch": 2132} {"train_loss": -6.1701273918151855, "global_step": 89560, "epoch": 2132} {"train_loss": -6.188232421875, "global_step": 89561, "epoch": 2132} {"train_loss": -6.175997257232666, "global_step": 89562, "epoch": 2132} {"train_loss": -6.161359786987305, "global_step": 89563, "epoch": 2132} {"train_loss": -6.13348913192749, "global_step": 89564, "epoch": 2132} {"train_loss": -6.349079132080078, "global_step": 89565, "epoch": 2132} {"train_loss": -6.177825927734375, "global_step": 89566, "epoch": 2132} {"train_loss": -6.16976261138916, "global_step": 89567, "epoch": 2132} {"train_loss": -6.2631025314331055, "global_step": 89568, "epoch": 2132} {"train_loss": -6.112092018127441, "global_step": 89569, "epoch": 2132} {"train_loss": -6.153128623962402, "global_step": 89570, "epoch": 2132} {"train_loss": -6.129403114318848, "global_step": 89571, "epoch": 2132} {"train_loss": -6.276459217071533, "global_step": 89572, "epoch": 2132} {"train_loss": -6.2776079177856445, "global_step": 89573, "epoch": 2132} {"train_loss": -6.248618125915527, "global_step": 89574, "epoch": 2132} {"train_loss": -6.245739936828613, "global_step": 89575, "epoch": 2132} {"train_loss": -6.217535018920898, "global_step": 89576, "epoch": 2132} {"train_loss": -6.2660064697265625, "global_step": 89577, "epoch": 2132} {"train_loss": -6.209425926208496, "global_step": 89578, "epoch": 2132} {"train_loss": -6.213274002075195, "global_step": 89579, "epoch": 2132} {"train_loss": -6.3119916915893555, "global_step": 89580, "epoch": 2132} {"train_loss": -6.192389965057373, "global_step": 89581, "epoch": 2132} {"train_loss": -6.28825044631958, "global_step": 89582, "epoch": 2132} {"train_loss": -6.17573356628418, "global_step": 89583, "epoch": 2132} {"train_loss": -6.359182834625244, "global_step": 89584, "epoch": 2132} {"train_loss": -6.224362623123896, "global_step": 89585, "epoch": 2132, "val_loss": 63007.984375} {"train_loss": -6.315685272216797, "global_step": 89586, "epoch": 2133} {"train_loss": -6.1247758865356445, "global_step": 89587, "epoch": 2133} {"train_loss": -6.080785751342773, "global_step": 89588, "epoch": 2133} {"train_loss": -6.188014030456543, "global_step": 89589, "epoch": 2133} {"train_loss": -6.340410232543945, "global_step": 89590, "epoch": 2133} {"train_loss": -6.332447052001953, "global_step": 89591, "epoch": 2133} {"train_loss": -6.330482482910156, "global_step": 89592, "epoch": 2133} {"train_loss": -6.24940824508667, "global_step": 89593, "epoch": 2133} {"train_loss": -6.328124046325684, "global_step": 89594, "epoch": 2133} {"train_loss": -6.293306350708008, "global_step": 89595, "epoch": 2133} {"train_loss": -6.235522747039795, "global_step": 89596, "epoch": 2133} {"train_loss": -6.326253414154053, "global_step": 89597, "epoch": 2133} {"train_loss": -6.307085037231445, "global_step": 89598, "epoch": 2133} {"train_loss": -6.145125865936279, "global_step": 89599, "epoch": 2133} {"train_loss": -6.348446846008301, "global_step": 89600, "epoch": 2133} {"train_loss": -6.229249954223633, "global_step": 89601, "epoch": 2133} {"train_loss": -6.204555511474609, "global_step": 89602, "epoch": 2133} {"train_loss": -6.298122406005859, "global_step": 89603, "epoch": 2133} {"train_loss": -6.20061731338501, "global_step": 89604, "epoch": 2133} {"train_loss": -6.314434051513672, "global_step": 89605, "epoch": 2133} {"train_loss": -6.292543411254883, "global_step": 89606, "epoch": 2133} {"train_loss": -6.261162757873535, "global_step": 89607, "epoch": 2133} {"train_loss": -6.382375717163086, "global_step": 89608, "epoch": 2133} {"train_loss": -6.215973854064941, "global_step": 89609, "epoch": 2133} {"train_loss": -6.279454231262207, "global_step": 89610, "epoch": 2133} {"train_loss": -6.178098678588867, "global_step": 89611, "epoch": 2133} {"train_loss": -6.241143226623535, "global_step": 89612, "epoch": 2133} {"train_loss": -6.227791786193848, "global_step": 89613, "epoch": 2133} {"train_loss": -6.387854099273682, "global_step": 89614, "epoch": 2133} {"train_loss": -6.320265769958496, "global_step": 89615, "epoch": 2133} {"train_loss": -6.2744340896606445, "global_step": 89616, "epoch": 2133} {"train_loss": -6.3755950927734375, "global_step": 89617, "epoch": 2133} {"train_loss": -6.161660194396973, "global_step": 89618, "epoch": 2133} {"train_loss": -6.251180648803711, "global_step": 89619, "epoch": 2133} {"train_loss": -6.278998374938965, "global_step": 89620, "epoch": 2133} {"train_loss": -6.2893781661987305, "global_step": 89621, "epoch": 2133} {"train_loss": -6.184697151184082, "global_step": 89622, "epoch": 2133} {"train_loss": -6.341492176055908, "global_step": 89623, "epoch": 2133} {"train_loss": -6.200969696044922, "global_step": 89624, "epoch": 2133} {"train_loss": -6.2715840339660645, "global_step": 89625, "epoch": 2133} {"train_loss": -6.151470184326172, "global_step": 89626, "epoch": 2133} {"train_loss": -6.259994450069609, "global_step": 89627, "epoch": 2133, "val_loss": 63139.265625} {"train_loss": -6.292242050170898, "global_step": 89628, "epoch": 2134} {"train_loss": -6.3467583656311035, "global_step": 89629, "epoch": 2134} {"train_loss": -6.287256240844727, "global_step": 89630, "epoch": 2134} {"train_loss": -6.25392484664917, "global_step": 89631, "epoch": 2134} {"train_loss": -6.28260612487793, "global_step": 89632, "epoch": 2134} {"train_loss": -6.166667938232422, "global_step": 89633, "epoch": 2134} {"train_loss": -6.291085243225098, "global_step": 89634, "epoch": 2134} {"train_loss": -6.275335311889648, "global_step": 89635, "epoch": 2134} {"train_loss": -6.254528999328613, "global_step": 89636, "epoch": 2134} {"train_loss": -6.2981367111206055, "global_step": 89637, "epoch": 2134} {"train_loss": -6.152165412902832, "global_step": 89638, "epoch": 2134} {"train_loss": -6.194881916046143, "global_step": 89639, "epoch": 2134} {"train_loss": -6.158657550811768, "global_step": 89640, "epoch": 2134} {"train_loss": -6.200891971588135, "global_step": 89641, "epoch": 2134} {"train_loss": -6.209504127502441, "global_step": 89642, "epoch": 2134} {"train_loss": -6.1124067306518555, "global_step": 89643, "epoch": 2134} {"train_loss": -6.330412864685059, "global_step": 89644, "epoch": 2134} {"train_loss": -6.202628135681152, "global_step": 89645, "epoch": 2134} {"train_loss": -6.262657165527344, "global_step": 89646, "epoch": 2134} {"train_loss": -6.269711494445801, "global_step": 89647, "epoch": 2134} {"train_loss": -6.310878753662109, "global_step": 89648, "epoch": 2134} {"train_loss": -6.257313251495361, "global_step": 89649, "epoch": 2134} {"train_loss": -6.296648979187012, "global_step": 89650, "epoch": 2134} {"train_loss": -6.359508514404297, "global_step": 89651, "epoch": 2134} {"train_loss": -6.363663196563721, "global_step": 89652, "epoch": 2134} {"train_loss": -6.400335311889648, "global_step": 89653, "epoch": 2134} {"train_loss": -6.215636730194092, "global_step": 89654, "epoch": 2134} {"train_loss": -6.278182506561279, "global_step": 89655, "epoch": 2134} {"train_loss": -6.218329429626465, "global_step": 89656, "epoch": 2134} {"train_loss": -6.296011447906494, "global_step": 89657, "epoch": 2134} {"train_loss": -6.176438331604004, "global_step": 89658, "epoch": 2134} {"train_loss": -6.205879211425781, "global_step": 89659, "epoch": 2134} {"train_loss": -6.259286880493164, "global_step": 89660, "epoch": 2134} {"train_loss": -6.155648231506348, "global_step": 89661, "epoch": 2134} {"train_loss": -6.225131988525391, "global_step": 89662, "epoch": 2134} {"train_loss": -6.152790069580078, "global_step": 89663, "epoch": 2134} {"train_loss": -6.176807880401611, "global_step": 89664, "epoch": 2134} {"train_loss": -6.322527885437012, "global_step": 89665, "epoch": 2134} {"train_loss": -6.162202835083008, "global_step": 89666, "epoch": 2134} {"train_loss": -6.13641357421875, "global_step": 89667, "epoch": 2134} {"train_loss": -6.268858909606934, "global_step": 89668, "epoch": 2134} {"train_loss": -6.244842608769734, "global_step": 89669, "epoch": 2134, "val_loss": 63137.6171875} {"train_loss": -6.239871025085449, "global_step": 89670, "epoch": 2135} {"train_loss": -6.302549362182617, "global_step": 89671, "epoch": 2135} {"train_loss": -6.250019073486328, "global_step": 89672, "epoch": 2135} {"train_loss": -6.322208404541016, "global_step": 89673, "epoch": 2135} {"train_loss": -6.355907440185547, "global_step": 89674, "epoch": 2135} {"train_loss": -6.177978038787842, "global_step": 89675, "epoch": 2135} {"train_loss": -6.181789875030518, "global_step": 89676, "epoch": 2135} {"train_loss": -6.263208866119385, "global_step": 89677, "epoch": 2135} {"train_loss": -6.243804931640625, "global_step": 89678, "epoch": 2135} {"train_loss": -6.283869743347168, "global_step": 89679, "epoch": 2135} {"train_loss": -6.242692470550537, "global_step": 89680, "epoch": 2135} {"train_loss": -6.211664199829102, "global_step": 89681, "epoch": 2135} {"train_loss": -6.323034763336182, "global_step": 89682, "epoch": 2135} {"train_loss": -6.241410255432129, "global_step": 89683, "epoch": 2135} {"train_loss": -6.351596355438232, "global_step": 89684, "epoch": 2135} {"train_loss": -6.332446098327637, "global_step": 89685, "epoch": 2135} {"train_loss": -6.278213024139404, "global_step": 89686, "epoch": 2135} {"train_loss": -6.217430591583252, "global_step": 89687, "epoch": 2135} {"train_loss": -6.181800842285156, "global_step": 89688, "epoch": 2135} {"train_loss": -6.234064102172852, "global_step": 89689, "epoch": 2135} {"train_loss": -6.299510955810547, "global_step": 89690, "epoch": 2135} {"train_loss": -6.242711067199707, "global_step": 89691, "epoch": 2135} {"train_loss": -6.294650554656982, "global_step": 89692, "epoch": 2135} {"train_loss": -6.217531204223633, "global_step": 89693, "epoch": 2135} {"train_loss": -6.20650577545166, "global_step": 89694, "epoch": 2135} {"train_loss": -6.270913124084473, "global_step": 89695, "epoch": 2135} {"train_loss": -6.267557144165039, "global_step": 89696, "epoch": 2135} {"train_loss": -6.257155418395996, "global_step": 89697, "epoch": 2135} {"train_loss": -6.3515496253967285, "global_step": 89698, "epoch": 2135} {"train_loss": -6.298308372497559, "global_step": 89699, "epoch": 2135} {"train_loss": -6.342456817626953, "global_step": 89700, "epoch": 2135} {"train_loss": -6.164237022399902, "global_step": 89701, "epoch": 2135} {"train_loss": -6.233062267303467, "global_step": 89702, "epoch": 2135} {"train_loss": -6.2613091468811035, "global_step": 89703, "epoch": 2135} {"train_loss": -6.279502868652344, "global_step": 89704, "epoch": 2135} {"train_loss": -6.217811107635498, "global_step": 89705, "epoch": 2135} {"train_loss": -6.400968551635742, "global_step": 89706, "epoch": 2135} {"train_loss": -6.089111328125, "global_step": 89707, "epoch": 2135} {"train_loss": -6.232685089111328, "global_step": 89708, "epoch": 2135} {"train_loss": -6.263895034790039, "global_step": 89709, "epoch": 2135} {"train_loss": -6.114711761474609, "global_step": 89710, "epoch": 2135} {"train_loss": -6.260073684510731, "global_step": 89711, "epoch": 2135, "val_loss": 63286.9140625} {"train_loss": -6.287120819091797, "global_step": 89712, "epoch": 2136} {"train_loss": -6.250306129455566, "global_step": 89713, "epoch": 2136} {"train_loss": -6.211668014526367, "global_step": 89714, "epoch": 2136} {"train_loss": -6.28886604309082, "global_step": 89715, "epoch": 2136} {"train_loss": -6.350648403167725, "global_step": 89716, "epoch": 2136} {"train_loss": -6.244590759277344, "global_step": 89717, "epoch": 2136} {"train_loss": -6.326763153076172, "global_step": 89718, "epoch": 2136} {"train_loss": -6.233332633972168, "global_step": 89719, "epoch": 2136} {"train_loss": -6.2832465171813965, "global_step": 89720, "epoch": 2136} {"train_loss": -6.3484039306640625, "global_step": 89721, "epoch": 2136} {"train_loss": -6.267938613891602, "global_step": 89722, "epoch": 2136} {"train_loss": -6.142829895019531, "global_step": 89723, "epoch": 2136} {"train_loss": -6.384318828582764, "global_step": 89724, "epoch": 2136} {"train_loss": -6.3872480392456055, "global_step": 89725, "epoch": 2136} {"train_loss": -6.3004865646362305, "global_step": 89726, "epoch": 2136} {"train_loss": -6.28183126449585, "global_step": 89727, "epoch": 2136} {"train_loss": -6.255683422088623, "global_step": 89728, "epoch": 2136} {"train_loss": -6.187487602233887, "global_step": 89729, "epoch": 2136} {"train_loss": -6.1832709312438965, "global_step": 89730, "epoch": 2136} {"train_loss": -6.327732563018799, "global_step": 89731, "epoch": 2136} {"train_loss": -6.316278457641602, "global_step": 89732, "epoch": 2136} {"train_loss": -6.2574262619018555, "global_step": 89733, "epoch": 2136} {"train_loss": -6.249865531921387, "global_step": 89734, "epoch": 2136} {"train_loss": -6.24898099899292, "global_step": 89735, "epoch": 2136} {"train_loss": -6.146045684814453, "global_step": 89736, "epoch": 2136} {"train_loss": -6.374794960021973, "global_step": 89737, "epoch": 2136} {"train_loss": -6.3579487800598145, "global_step": 89738, "epoch": 2136} {"train_loss": -6.246417999267578, "global_step": 89739, "epoch": 2136} {"train_loss": -6.372988700866699, "global_step": 89740, "epoch": 2136} {"train_loss": -6.341506004333496, "global_step": 89741, "epoch": 2136} {"train_loss": -6.229372024536133, "global_step": 89742, "epoch": 2136} {"train_loss": -6.255141735076904, "global_step": 89743, "epoch": 2136} {"train_loss": -6.335197448730469, "global_step": 89744, "epoch": 2136} {"train_loss": -6.3417158126831055, "global_step": 89745, "epoch": 2136} {"train_loss": -6.390882968902588, "global_step": 89746, "epoch": 2136} {"train_loss": -6.260033130645752, "global_step": 89747, "epoch": 2136} {"train_loss": -6.317869186401367, "global_step": 89748, "epoch": 2136} {"train_loss": -6.283061504364014, "global_step": 89749, "epoch": 2136} {"train_loss": -6.287486553192139, "global_step": 89750, "epoch": 2136} {"train_loss": -6.202945232391357, "global_step": 89751, "epoch": 2136} {"train_loss": -6.379699230194092, "global_step": 89752, "epoch": 2136} {"train_loss": -6.283104567300706, "global_step": 89753, "epoch": 2136, "val_loss": 63020.9453125} {"train_loss": -6.229423522949219, "global_step": 89754, "epoch": 2137} {"train_loss": -6.292252063751221, "global_step": 89755, "epoch": 2137} {"train_loss": -6.132278919219971, "global_step": 89756, "epoch": 2137} {"train_loss": -6.284426212310791, "global_step": 89757, "epoch": 2137} {"train_loss": -6.255897521972656, "global_step": 89758, "epoch": 2137} {"train_loss": -6.337176322937012, "global_step": 89759, "epoch": 2137} {"train_loss": -6.236953258514404, "global_step": 89760, "epoch": 2137} {"train_loss": -6.317060470581055, "global_step": 89761, "epoch": 2137} {"train_loss": -6.289836406707764, "global_step": 89762, "epoch": 2137} {"train_loss": -6.266751289367676, "global_step": 89763, "epoch": 2137} {"train_loss": -6.249685287475586, "global_step": 89764, "epoch": 2137} {"train_loss": -6.133234977722168, "global_step": 89765, "epoch": 2137} {"train_loss": -6.1674652099609375, "global_step": 89766, "epoch": 2137} {"train_loss": -6.2214484214782715, "global_step": 89767, "epoch": 2137} {"train_loss": -6.205005645751953, "global_step": 89768, "epoch": 2137} {"train_loss": -6.322575569152832, "global_step": 89769, "epoch": 2137} {"train_loss": -6.336862087249756, "global_step": 89770, "epoch": 2137} {"train_loss": -6.27787971496582, "global_step": 89771, "epoch": 2137} {"train_loss": -6.285506248474121, "global_step": 89772, "epoch": 2137} {"train_loss": -6.399679183959961, "global_step": 89773, "epoch": 2137} {"train_loss": -6.259812831878662, "global_step": 89774, "epoch": 2137} {"train_loss": -6.261019706726074, "global_step": 89775, "epoch": 2137} {"train_loss": -6.361937522888184, "global_step": 89776, "epoch": 2137} {"train_loss": -6.193058967590332, "global_step": 89777, "epoch": 2137} {"train_loss": -6.281608581542969, "global_step": 89778, "epoch": 2137} {"train_loss": -6.223536491394043, "global_step": 89779, "epoch": 2137} {"train_loss": -6.16207218170166, "global_step": 89780, "epoch": 2137} {"train_loss": -6.215726852416992, "global_step": 89781, "epoch": 2137} {"train_loss": -6.149412155151367, "global_step": 89782, "epoch": 2137} {"train_loss": -6.245118141174316, "global_step": 89783, "epoch": 2137} {"train_loss": -6.286322593688965, "global_step": 89784, "epoch": 2137} {"train_loss": -6.3484930992126465, "global_step": 89785, "epoch": 2137} {"train_loss": -6.268221855163574, "global_step": 89786, "epoch": 2137} {"train_loss": -6.2512125968933105, "global_step": 89787, "epoch": 2137} {"train_loss": -6.154051303863525, "global_step": 89788, "epoch": 2137} {"train_loss": -6.270637035369873, "global_step": 89789, "epoch": 2137} {"train_loss": -6.346396446228027, "global_step": 89790, "epoch": 2137} {"train_loss": -6.337608337402344, "global_step": 89791, "epoch": 2137} {"train_loss": -6.395909309387207, "global_step": 89792, "epoch": 2137} {"train_loss": -6.368117332458496, "global_step": 89793, "epoch": 2137} {"train_loss": -6.186831474304199, "global_step": 89794, "epoch": 2137} {"train_loss": -6.26380941981361, "global_step": 89795, "epoch": 2137, "val_loss": 63079.5390625} {"train_loss": -6.3930463790893555, "global_step": 89796, "epoch": 2138} {"train_loss": -6.179129600524902, "global_step": 89797, "epoch": 2138} {"train_loss": -6.343161582946777, "global_step": 89798, "epoch": 2138} {"train_loss": -6.278209686279297, "global_step": 89799, "epoch": 2138} {"train_loss": -6.173295021057129, "global_step": 89800, "epoch": 2138} {"train_loss": -6.206038475036621, "global_step": 89801, "epoch": 2138} {"train_loss": -6.110517978668213, "global_step": 89802, "epoch": 2138} {"train_loss": -6.349218368530273, "global_step": 89803, "epoch": 2138} {"train_loss": -6.100077152252197, "global_step": 89804, "epoch": 2138} {"train_loss": -6.2790703773498535, "global_step": 89805, "epoch": 2138} {"train_loss": -6.25058126449585, "global_step": 89806, "epoch": 2138} {"train_loss": -6.323681831359863, "global_step": 89807, "epoch": 2138} {"train_loss": -6.326094627380371, "global_step": 89808, "epoch": 2138} {"train_loss": -6.288713455200195, "global_step": 89809, "epoch": 2138} {"train_loss": -6.2586469650268555, "global_step": 89810, "epoch": 2138} {"train_loss": -6.1956305503845215, "global_step": 89811, "epoch": 2138} {"train_loss": -6.188769340515137, "global_step": 89812, "epoch": 2138} {"train_loss": -6.1952433586120605, "global_step": 89813, "epoch": 2138} {"train_loss": -6.267599105834961, "global_step": 89814, "epoch": 2138} {"train_loss": -6.188570499420166, "global_step": 89815, "epoch": 2138} {"train_loss": -6.200305938720703, "global_step": 89816, "epoch": 2138} {"train_loss": -6.162482261657715, "global_step": 89817, "epoch": 2138} {"train_loss": -6.2284746170043945, "global_step": 89818, "epoch": 2138} {"train_loss": -6.181694030761719, "global_step": 89819, "epoch": 2138} {"train_loss": -6.309965133666992, "global_step": 89820, "epoch": 2138} {"train_loss": -6.1459245681762695, "global_step": 89821, "epoch": 2138} {"train_loss": -6.2566070556640625, "global_step": 89822, "epoch": 2138} {"train_loss": -6.276670455932617, "global_step": 89823, "epoch": 2138} {"train_loss": -6.129205226898193, "global_step": 89824, "epoch": 2138} {"train_loss": -6.280566215515137, "global_step": 89825, "epoch": 2138} {"train_loss": -6.198046684265137, "global_step": 89826, "epoch": 2138} {"train_loss": -6.185360908508301, "global_step": 89827, "epoch": 2138} {"train_loss": -6.24779748916626, "global_step": 89828, "epoch": 2138} {"train_loss": -6.196378707885742, "global_step": 89829, "epoch": 2138} {"train_loss": -6.261660575866699, "global_step": 89830, "epoch": 2138} {"train_loss": -6.341211795806885, "global_step": 89831, "epoch": 2138} {"train_loss": -6.228436470031738, "global_step": 89832, "epoch": 2138} {"train_loss": -6.256392002105713, "global_step": 89833, "epoch": 2138} {"train_loss": -6.253767013549805, "global_step": 89834, "epoch": 2138} {"train_loss": -6.155353546142578, "global_step": 89835, "epoch": 2138} {"train_loss": -6.222715377807617, "global_step": 89836, "epoch": 2138} {"train_loss": -6.233637900579543, "global_step": 89837, "epoch": 2138, "val_loss": 63381.23046875} {"train_loss": -6.102669715881348, "global_step": 89838, "epoch": 2139} {"train_loss": -6.33463716506958, "global_step": 89839, "epoch": 2139} {"train_loss": -6.274592399597168, "global_step": 89840, "epoch": 2139} {"train_loss": -6.241087913513184, "global_step": 89841, "epoch": 2139} {"train_loss": -6.3097686767578125, "global_step": 89842, "epoch": 2139} {"train_loss": -6.237592697143555, "global_step": 89843, "epoch": 2139} {"train_loss": -6.276567459106445, "global_step": 89844, "epoch": 2139} {"train_loss": -6.240941524505615, "global_step": 89845, "epoch": 2139} {"train_loss": -6.2201433181762695, "global_step": 89846, "epoch": 2139} {"train_loss": -6.376023292541504, "global_step": 89847, "epoch": 2139} {"train_loss": -6.303197860717773, "global_step": 89848, "epoch": 2139} {"train_loss": -6.222764015197754, "global_step": 89849, "epoch": 2139} {"train_loss": -6.342550277709961, "global_step": 89850, "epoch": 2139} {"train_loss": -6.345605850219727, "global_step": 89851, "epoch": 2139} {"train_loss": -6.1556291580200195, "global_step": 89852, "epoch": 2139} {"train_loss": -6.320801734924316, "global_step": 89853, "epoch": 2139} {"train_loss": -6.311076641082764, "global_step": 89854, "epoch": 2139} {"train_loss": -6.25862455368042, "global_step": 89855, "epoch": 2139} {"train_loss": -6.182436466217041, "global_step": 89856, "epoch": 2139} {"train_loss": -6.316474914550781, "global_step": 89857, "epoch": 2139} {"train_loss": -6.276910305023193, "global_step": 89858, "epoch": 2139} {"train_loss": -6.245984077453613, "global_step": 89859, "epoch": 2139} {"train_loss": -6.231626987457275, "global_step": 89860, "epoch": 2139} {"train_loss": -6.209820747375488, "global_step": 89861, "epoch": 2139} {"train_loss": -6.306874752044678, "global_step": 89862, "epoch": 2139} {"train_loss": -6.2167840003967285, "global_step": 89863, "epoch": 2139} {"train_loss": -6.207956314086914, "global_step": 89864, "epoch": 2139} {"train_loss": -6.35339879989624, "global_step": 89865, "epoch": 2139} {"train_loss": -6.322763919830322, "global_step": 89866, "epoch": 2139} {"train_loss": -6.361705780029297, "global_step": 89867, "epoch": 2139} {"train_loss": -6.345088481903076, "global_step": 89868, "epoch": 2139} {"train_loss": -6.257513999938965, "global_step": 89869, "epoch": 2139} {"train_loss": -6.336142539978027, "global_step": 89870, "epoch": 2139} {"train_loss": -6.279698371887207, "global_step": 89871, "epoch": 2139} {"train_loss": -6.244974136352539, "global_step": 89872, "epoch": 2139} {"train_loss": -6.275177955627441, "global_step": 89873, "epoch": 2139} {"train_loss": -6.3294267654418945, "global_step": 89874, "epoch": 2139} {"train_loss": -6.351172924041748, "global_step": 89875, "epoch": 2139} {"train_loss": -6.1549530029296875, "global_step": 89876, "epoch": 2139} {"train_loss": -6.249037265777588, "global_step": 89877, "epoch": 2139} {"train_loss": -6.217089653015137, "global_step": 89878, "epoch": 2139} {"train_loss": -6.271227961494809, "global_step": 89879, "epoch": 2139, "val_loss": 63251.5} {"train_loss": -6.292712211608887, "global_step": 89880, "epoch": 2140} {"train_loss": -6.247673034667969, "global_step": 89881, "epoch": 2140} {"train_loss": -6.296661376953125, "global_step": 89882, "epoch": 2140} {"train_loss": -6.358090400695801, "global_step": 89883, "epoch": 2140} {"train_loss": -6.260443687438965, "global_step": 89884, "epoch": 2140} {"train_loss": -6.235292434692383, "global_step": 89885, "epoch": 2140} {"train_loss": -6.299936294555664, "global_step": 89886, "epoch": 2140} {"train_loss": -6.240317344665527, "global_step": 89887, "epoch": 2140} {"train_loss": -6.1773881912231445, "global_step": 89888, "epoch": 2140} {"train_loss": -6.357677459716797, "global_step": 89889, "epoch": 2140} {"train_loss": -6.278006553649902, "global_step": 89890, "epoch": 2140} {"train_loss": -6.205410957336426, "global_step": 89891, "epoch": 2140} {"train_loss": -6.2530436515808105, "global_step": 89892, "epoch": 2140} {"train_loss": -6.3122406005859375, "global_step": 89893, "epoch": 2140} {"train_loss": -6.169295310974121, "global_step": 89894, "epoch": 2140} {"train_loss": -6.1352152824401855, "global_step": 89895, "epoch": 2140} {"train_loss": -6.42117977142334, "global_step": 89896, "epoch": 2140} {"train_loss": -6.187387466430664, "global_step": 89897, "epoch": 2140} {"train_loss": -6.267265796661377, "global_step": 89898, "epoch": 2140} {"train_loss": -6.30235481262207, "global_step": 89899, "epoch": 2140} {"train_loss": -6.32906436920166, "global_step": 89900, "epoch": 2140} {"train_loss": -6.22856330871582, "global_step": 89901, "epoch": 2140} {"train_loss": -6.327409267425537, "global_step": 89902, "epoch": 2140} {"train_loss": -6.237069129943848, "global_step": 89903, "epoch": 2140} {"train_loss": -6.367732048034668, "global_step": 89904, "epoch": 2140} {"train_loss": -6.304612159729004, "global_step": 89905, "epoch": 2140} {"train_loss": -6.259703636169434, "global_step": 89906, "epoch": 2140} {"train_loss": -6.3731584548950195, "global_step": 89907, "epoch": 2140} {"train_loss": -6.230569839477539, "global_step": 89908, "epoch": 2140} {"train_loss": -6.29215145111084, "global_step": 89909, "epoch": 2140} {"train_loss": -6.257330894470215, "global_step": 89910, "epoch": 2140} {"train_loss": -6.204002857208252, "global_step": 89911, "epoch": 2140} {"train_loss": -6.244332313537598, "global_step": 89912, "epoch": 2140} {"train_loss": -6.226693630218506, "global_step": 89913, "epoch": 2140} {"train_loss": -6.178348541259766, "global_step": 89914, "epoch": 2140} {"train_loss": -6.200556755065918, "global_step": 89915, "epoch": 2140} {"train_loss": -6.37932014465332, "global_step": 89916, "epoch": 2140} {"train_loss": -6.262728691101074, "global_step": 89917, "epoch": 2140} {"train_loss": -6.246778964996338, "global_step": 89918, "epoch": 2140} {"train_loss": -6.252654552459717, "global_step": 89919, "epoch": 2140} {"train_loss": -6.392568588256836, "global_step": 89920, "epoch": 2140} {"train_loss": -6.270912238529751, "global_step": 89921, "epoch": 2140, "val_loss": 63211.6875} {"train_loss": -6.278786659240723, "global_step": 89922, "epoch": 2141} {"train_loss": -6.312605857849121, "global_step": 89923, "epoch": 2141} {"train_loss": -6.281358242034912, "global_step": 89924, "epoch": 2141} {"train_loss": -6.259753227233887, "global_step": 89925, "epoch": 2141} {"train_loss": -6.249829292297363, "global_step": 89926, "epoch": 2141} {"train_loss": -6.21600341796875, "global_step": 89927, "epoch": 2141} {"train_loss": -6.244915008544922, "global_step": 89928, "epoch": 2141} {"train_loss": -6.34837007522583, "global_step": 89929, "epoch": 2141} {"train_loss": -6.26024866104126, "global_step": 89930, "epoch": 2141} {"train_loss": -6.18265962600708, "global_step": 89931, "epoch": 2141} {"train_loss": -6.217247009277344, "global_step": 89932, "epoch": 2141} {"train_loss": -6.258049488067627, "global_step": 89933, "epoch": 2141} {"train_loss": -6.154013633728027, "global_step": 89934, "epoch": 2141} {"train_loss": -6.348998546600342, "global_step": 89935, "epoch": 2141} {"train_loss": -6.324029922485352, "global_step": 89936, "epoch": 2141} {"train_loss": -6.162327766418457, "global_step": 89937, "epoch": 2141} {"train_loss": -6.148490905761719, "global_step": 89938, "epoch": 2141} {"train_loss": -6.292119979858398, "global_step": 89939, "epoch": 2141} {"train_loss": -6.138788223266602, "global_step": 89940, "epoch": 2141} {"train_loss": -6.192770957946777, "global_step": 89941, "epoch": 2141} {"train_loss": -6.23792839050293, "global_step": 89942, "epoch": 2141} {"train_loss": -6.214081287384033, "global_step": 89943, "epoch": 2141} {"train_loss": -6.305919170379639, "global_step": 89944, "epoch": 2141} {"train_loss": -6.2178473472595215, "global_step": 89945, "epoch": 2141} {"train_loss": -6.312206268310547, "global_step": 89946, "epoch": 2141} {"train_loss": -6.094875335693359, "global_step": 89947, "epoch": 2141} {"train_loss": -6.309274196624756, "global_step": 89948, "epoch": 2141} {"train_loss": -6.157708644866943, "global_step": 89949, "epoch": 2141} {"train_loss": -6.269286155700684, "global_step": 89950, "epoch": 2141} {"train_loss": -6.152198314666748, "global_step": 89951, "epoch": 2141} {"train_loss": -6.133412837982178, "global_step": 89952, "epoch": 2141} {"train_loss": -6.388149261474609, "global_step": 89953, "epoch": 2141} {"train_loss": -6.239702224731445, "global_step": 89954, "epoch": 2141} {"train_loss": -6.298990249633789, "global_step": 89955, "epoch": 2141} {"train_loss": -6.251900672912598, "global_step": 89956, "epoch": 2141} {"train_loss": -6.271770477294922, "global_step": 89957, "epoch": 2141} {"train_loss": -6.330379486083984, "global_step": 89958, "epoch": 2141} {"train_loss": -6.271727561950684, "global_step": 89959, "epoch": 2141} {"train_loss": -6.338150978088379, "global_step": 89960, "epoch": 2141} {"train_loss": -6.337498664855957, "global_step": 89961, "epoch": 2141} {"train_loss": -6.158404350280762, "global_step": 89962, "epoch": 2141} {"train_loss": -6.246269282840547, "global_step": 89963, "epoch": 2141, "val_loss": 63087.27734375} {"train_loss": -6.348067283630371, "global_step": 89964, "epoch": 2142} {"train_loss": -6.279779434204102, "global_step": 89965, "epoch": 2142} {"train_loss": -6.168966293334961, "global_step": 89966, "epoch": 2142} {"train_loss": -6.246493339538574, "global_step": 89967, "epoch": 2142} {"train_loss": -6.408840179443359, "global_step": 89968, "epoch": 2142} {"train_loss": -6.282393455505371, "global_step": 89969, "epoch": 2142} {"train_loss": -6.256167888641357, "global_step": 89970, "epoch": 2142} {"train_loss": -6.2715559005737305, "global_step": 89971, "epoch": 2142} {"train_loss": -6.265031814575195, "global_step": 89972, "epoch": 2142} {"train_loss": -6.205345630645752, "global_step": 89973, "epoch": 2142} {"train_loss": -6.088717937469482, "global_step": 89974, "epoch": 2142} {"train_loss": -6.254772663116455, "global_step": 89975, "epoch": 2142} {"train_loss": -6.363808631896973, "global_step": 89976, "epoch": 2142} {"train_loss": -6.3538007736206055, "global_step": 89977, "epoch": 2142} {"train_loss": -6.247719764709473, "global_step": 89978, "epoch": 2142} {"train_loss": -6.223618507385254, "global_step": 89979, "epoch": 2142} {"train_loss": -6.254107475280762, "global_step": 89980, "epoch": 2142} {"train_loss": -6.286404609680176, "global_step": 89981, "epoch": 2142} {"train_loss": -6.232813835144043, "global_step": 89982, "epoch": 2142} {"train_loss": -6.284687519073486, "global_step": 89983, "epoch": 2142} {"train_loss": -6.251559257507324, "global_step": 89984, "epoch": 2142} {"train_loss": -6.311107158660889, "global_step": 89985, "epoch": 2142} {"train_loss": -6.339632987976074, "global_step": 89986, "epoch": 2142} {"train_loss": -6.256536960601807, "global_step": 89987, "epoch": 2142} {"train_loss": -6.248603820800781, "global_step": 89988, "epoch": 2142} {"train_loss": -6.294544219970703, "global_step": 89989, "epoch": 2142} {"train_loss": -6.323764801025391, "global_step": 89990, "epoch": 2142} {"train_loss": -6.354254245758057, "global_step": 89991, "epoch": 2142} {"train_loss": -6.298029899597168, "global_step": 89992, "epoch": 2142} {"train_loss": -6.197158336639404, "global_step": 89993, "epoch": 2142} {"train_loss": -6.302107810974121, "global_step": 89994, "epoch": 2142} {"train_loss": -6.245491981506348, "global_step": 89995, "epoch": 2142} {"train_loss": -6.118771553039551, "global_step": 89996, "epoch": 2142} {"train_loss": -6.271730899810791, "global_step": 89997, "epoch": 2142} {"train_loss": -6.327547073364258, "global_step": 89998, "epoch": 2142} {"train_loss": -6.258864879608154, "global_step": 89999, "epoch": 2142} {"train_loss": -6.373693466186523, "global_step": 90000, "epoch": 2142} {"train_loss": -6.349145889282227, "global_step": 90001, "epoch": 2142} {"train_loss": -6.284074783325195, "global_step": 90002, "epoch": 2142} {"train_loss": -6.396816730499268, "global_step": 90003, "epoch": 2142} {"train_loss": -6.372217655181885, "global_step": 90004, "epoch": 2142} {"train_loss": -6.282756260463169, "global_step": 90005, "epoch": 2142, "val_loss": 63045.16015625} {"train_loss": -6.2944111824035645, "global_step": 90006, "epoch": 2143} {"train_loss": -6.358416557312012, "global_step": 90007, "epoch": 2143} {"train_loss": -6.375524997711182, "global_step": 90008, "epoch": 2143} {"train_loss": -6.268221855163574, "global_step": 90009, "epoch": 2143} {"train_loss": -6.22883939743042, "global_step": 90010, "epoch": 2143} {"train_loss": -6.3513593673706055, "global_step": 90011, "epoch": 2143} {"train_loss": -6.208150863647461, "global_step": 90012, "epoch": 2143} {"train_loss": -6.275452613830566, "global_step": 90013, "epoch": 2143} {"train_loss": -6.284639358520508, "global_step": 90014, "epoch": 2143} {"train_loss": -6.238966941833496, "global_step": 90015, "epoch": 2143} {"train_loss": -6.22739839553833, "global_step": 90016, "epoch": 2143} {"train_loss": -6.311033248901367, "global_step": 90017, "epoch": 2143} {"train_loss": -6.457449436187744, "global_step": 90018, "epoch": 2143} {"train_loss": -6.323405742645264, "global_step": 90019, "epoch": 2143} {"train_loss": -6.261421203613281, "global_step": 90020, "epoch": 2143} {"train_loss": -6.2552385330200195, "global_step": 90021, "epoch": 2143} {"train_loss": -6.263823509216309, "global_step": 90022, "epoch": 2143} {"train_loss": -6.341324806213379, "global_step": 90023, "epoch": 2143} {"train_loss": -6.3046064376831055, "global_step": 90024, "epoch": 2143} {"train_loss": -6.394342422485352, "global_step": 90025, "epoch": 2143} {"train_loss": -6.191824913024902, "global_step": 90026, "epoch": 2143} {"train_loss": -6.25120210647583, "global_step": 90027, "epoch": 2143} {"train_loss": -6.386213779449463, "global_step": 90028, "epoch": 2143} {"train_loss": -6.185304641723633, "global_step": 90029, "epoch": 2143} {"train_loss": -6.326343536376953, "global_step": 90030, "epoch": 2143} {"train_loss": -6.271757125854492, "global_step": 90031, "epoch": 2143} {"train_loss": -6.331491470336914, "global_step": 90032, "epoch": 2143} {"train_loss": -6.288298606872559, "global_step": 90033, "epoch": 2143} {"train_loss": -6.309685707092285, "global_step": 90034, "epoch": 2143} {"train_loss": -6.218371391296387, "global_step": 90035, "epoch": 2143} {"train_loss": -6.341218948364258, "global_step": 90036, "epoch": 2143} {"train_loss": -6.341495990753174, "global_step": 90037, "epoch": 2143} {"train_loss": -6.255988121032715, "global_step": 90038, "epoch": 2143} {"train_loss": -6.302646636962891, "global_step": 90039, "epoch": 2143} {"train_loss": -6.257383823394775, "global_step": 90040, "epoch": 2143} {"train_loss": -6.269634246826172, "global_step": 90041, "epoch": 2143} {"train_loss": -6.302215576171875, "global_step": 90042, "epoch": 2143} {"train_loss": -6.293030738830566, "global_step": 90043, "epoch": 2143} {"train_loss": -6.164615631103516, "global_step": 90044, "epoch": 2143} {"train_loss": -6.218940734863281, "global_step": 90045, "epoch": 2143} {"train_loss": -6.244928359985352, "global_step": 90046, "epoch": 2143} {"train_loss": -6.2842464333488826, "global_step": 90047, "epoch": 2143, "val_loss": 63165.9296875} {"train_loss": -6.214105129241943, "global_step": 90048, "epoch": 2144} {"train_loss": -6.316528797149658, "global_step": 90049, "epoch": 2144} {"train_loss": -6.190486907958984, "global_step": 90050, "epoch": 2144} {"train_loss": -6.203190803527832, "global_step": 90051, "epoch": 2144} {"train_loss": -6.232942581176758, "global_step": 90052, "epoch": 2144} {"train_loss": -6.284703254699707, "global_step": 90053, "epoch": 2144} {"train_loss": -6.202481746673584, "global_step": 90054, "epoch": 2144} {"train_loss": -6.219988822937012, "global_step": 90055, "epoch": 2144} {"train_loss": -6.18681526184082, "global_step": 90056, "epoch": 2144} {"train_loss": -6.268405914306641, "global_step": 90057, "epoch": 2144} {"train_loss": -6.275509834289551, "global_step": 90058, "epoch": 2144} {"train_loss": -6.225691795349121, "global_step": 90059, "epoch": 2144} {"train_loss": -6.26149845123291, "global_step": 90060, "epoch": 2144} {"train_loss": -6.337900161743164, "global_step": 90061, "epoch": 2144} {"train_loss": -6.18056583404541, "global_step": 90062, "epoch": 2144} {"train_loss": -6.380142688751221, "global_step": 90063, "epoch": 2144} {"train_loss": -6.333948135375977, "global_step": 90064, "epoch": 2144} {"train_loss": -6.227153778076172, "global_step": 90065, "epoch": 2144} {"train_loss": -6.29750394821167, "global_step": 90066, "epoch": 2144} {"train_loss": -6.312283515930176, "global_step": 90067, "epoch": 2144} {"train_loss": -6.295040607452393, "global_step": 90068, "epoch": 2144} {"train_loss": -6.251946449279785, "global_step": 90069, "epoch": 2144} {"train_loss": -6.119708061218262, "global_step": 90070, "epoch": 2144} {"train_loss": -6.295051574707031, "global_step": 90071, "epoch": 2144} {"train_loss": -6.213588237762451, "global_step": 90072, "epoch": 2144} {"train_loss": -6.03843879699707, "global_step": 90073, "epoch": 2144} {"train_loss": -6.3258161544799805, "global_step": 90074, "epoch": 2144} {"train_loss": -6.23769998550415, "global_step": 90075, "epoch": 2144} {"train_loss": -6.315410137176514, "global_step": 90076, "epoch": 2144} {"train_loss": -6.23032808303833, "global_step": 90077, "epoch": 2144} {"train_loss": -6.25521183013916, "global_step": 90078, "epoch": 2144} {"train_loss": -6.143706321716309, "global_step": 90079, "epoch": 2144} {"train_loss": -6.1914777755737305, "global_step": 90080, "epoch": 2144} {"train_loss": -6.153188228607178, "global_step": 90081, "epoch": 2144} {"train_loss": -6.248126029968262, "global_step": 90082, "epoch": 2144} {"train_loss": -6.302735805511475, "global_step": 90083, "epoch": 2144} {"train_loss": -6.119928359985352, "global_step": 90084, "epoch": 2144} {"train_loss": -6.202199935913086, "global_step": 90085, "epoch": 2144} {"train_loss": -6.078365325927734, "global_step": 90086, "epoch": 2144} {"train_loss": -6.281165599822998, "global_step": 90087, "epoch": 2144} {"train_loss": -6.261822700500488, "global_step": 90088, "epoch": 2144} {"train_loss": -6.238772959936233, "global_step": 90089, "epoch": 2144, "val_loss": 62933.9765625} {"train_loss": -6.327796936035156, "global_step": 90090, "epoch": 2145} {"train_loss": -6.226043224334717, "global_step": 90091, "epoch": 2145} {"train_loss": -6.228434085845947, "global_step": 90092, "epoch": 2145} {"train_loss": -6.275148391723633, "global_step": 90093, "epoch": 2145} {"train_loss": -6.116933822631836, "global_step": 90094, "epoch": 2145} {"train_loss": -6.180537700653076, "global_step": 90095, "epoch": 2145} {"train_loss": -6.274633884429932, "global_step": 90096, "epoch": 2145} {"train_loss": -6.142266273498535, "global_step": 90097, "epoch": 2145} {"train_loss": -6.20913028717041, "global_step": 90098, "epoch": 2145} {"train_loss": -6.297016143798828, "global_step": 90099, "epoch": 2145} {"train_loss": -6.301690101623535, "global_step": 90100, "epoch": 2145} {"train_loss": -6.229109287261963, "global_step": 90101, "epoch": 2145} {"train_loss": -6.276055335998535, "global_step": 90102, "epoch": 2145} {"train_loss": -6.249404430389404, "global_step": 90103, "epoch": 2145} {"train_loss": -6.137754440307617, "global_step": 90104, "epoch": 2145} {"train_loss": -6.212368011474609, "global_step": 90105, "epoch": 2145} {"train_loss": -6.1393256187438965, "global_step": 90106, "epoch": 2145} {"train_loss": -6.153222560882568, "global_step": 90107, "epoch": 2145} {"train_loss": -6.248050689697266, "global_step": 90108, "epoch": 2145} {"train_loss": -6.274406433105469, "global_step": 90109, "epoch": 2145} {"train_loss": -6.1767964363098145, "global_step": 90110, "epoch": 2145} {"train_loss": -6.245548725128174, "global_step": 90111, "epoch": 2145} {"train_loss": -6.268680572509766, "global_step": 90112, "epoch": 2145} {"train_loss": -6.153759002685547, "global_step": 90113, "epoch": 2145} {"train_loss": -6.253260612487793, "global_step": 90114, "epoch": 2145} {"train_loss": -6.165753364562988, "global_step": 90115, "epoch": 2145} {"train_loss": -6.246770858764648, "global_step": 90116, "epoch": 2145} {"train_loss": -6.23104190826416, "global_step": 90117, "epoch": 2145} {"train_loss": -6.095961570739746, "global_step": 90118, "epoch": 2145} {"train_loss": -6.223273277282715, "global_step": 90119, "epoch": 2145} {"train_loss": -6.274616718292236, "global_step": 90120, "epoch": 2145} {"train_loss": -6.315467834472656, "global_step": 90121, "epoch": 2145} {"train_loss": -6.309002876281738, "global_step": 90122, "epoch": 2145} {"train_loss": -6.289893627166748, "global_step": 90123, "epoch": 2145} {"train_loss": -6.259990692138672, "global_step": 90124, "epoch": 2145} {"train_loss": -6.225957870483398, "global_step": 90125, "epoch": 2145} {"train_loss": -6.33388614654541, "global_step": 90126, "epoch": 2145} {"train_loss": -6.354538917541504, "global_step": 90127, "epoch": 2145} {"train_loss": -6.294586181640625, "global_step": 90128, "epoch": 2145} {"train_loss": -6.143804550170898, "global_step": 90129, "epoch": 2145} {"train_loss": -6.243226051330566, "global_step": 90130, "epoch": 2145} {"train_loss": -6.234812146141415, "global_step": 90131, "epoch": 2145, "val_loss": 63151.5859375} {"train_loss": -6.270246505737305, "global_step": 90132, "epoch": 2146} {"train_loss": -6.223642349243164, "global_step": 90133, "epoch": 2146} {"train_loss": -6.277007579803467, "global_step": 90134, "epoch": 2146} {"train_loss": -6.1728515625, "global_step": 90135, "epoch": 2146} {"train_loss": -6.231540203094482, "global_step": 90136, "epoch": 2146} {"train_loss": -6.252001762390137, "global_step": 90137, "epoch": 2146} {"train_loss": -6.1432600021362305, "global_step": 90138, "epoch": 2146} {"train_loss": -6.352959632873535, "global_step": 90139, "epoch": 2146} {"train_loss": -6.21132230758667, "global_step": 90140, "epoch": 2146} {"train_loss": -6.254711151123047, "global_step": 90141, "epoch": 2146} {"train_loss": -6.191553115844727, "global_step": 90142, "epoch": 2146} {"train_loss": -6.246545791625977, "global_step": 90143, "epoch": 2146} {"train_loss": -6.301252365112305, "global_step": 90144, "epoch": 2146} {"train_loss": -6.274529457092285, "global_step": 90145, "epoch": 2146} {"train_loss": -6.217380523681641, "global_step": 90146, "epoch": 2146} {"train_loss": -6.29293155670166, "global_step": 90147, "epoch": 2146} {"train_loss": -6.242508888244629, "global_step": 90148, "epoch": 2146} {"train_loss": -6.28388786315918, "global_step": 90149, "epoch": 2146} {"train_loss": -6.313968658447266, "global_step": 90150, "epoch": 2146} {"train_loss": -6.182631969451904, "global_step": 90151, "epoch": 2146} {"train_loss": -6.190787315368652, "global_step": 90152, "epoch": 2146} {"train_loss": -6.223729610443115, "global_step": 90153, "epoch": 2146} {"train_loss": -6.26770544052124, "global_step": 90154, "epoch": 2146} {"train_loss": -6.345797061920166, "global_step": 90155, "epoch": 2146} {"train_loss": -6.252386569976807, "global_step": 90156, "epoch": 2146} {"train_loss": -6.306507110595703, "global_step": 90157, "epoch": 2146} {"train_loss": -6.349714756011963, "global_step": 90158, "epoch": 2146} {"train_loss": -6.308944225311279, "global_step": 90159, "epoch": 2146} {"train_loss": -6.308035373687744, "global_step": 90160, "epoch": 2146} {"train_loss": -6.230655670166016, "global_step": 90161, "epoch": 2146} {"train_loss": -6.248065948486328, "global_step": 90162, "epoch": 2146} {"train_loss": -6.294981956481934, "global_step": 90163, "epoch": 2146} {"train_loss": -6.294847011566162, "global_step": 90164, "epoch": 2146} {"train_loss": -6.305511474609375, "global_step": 90165, "epoch": 2146} {"train_loss": -6.289740562438965, "global_step": 90166, "epoch": 2146} {"train_loss": -6.378204345703125, "global_step": 90167, "epoch": 2146} {"train_loss": -6.239959239959717, "global_step": 90168, "epoch": 2146} {"train_loss": -6.102494239807129, "global_step": 90169, "epoch": 2146} {"train_loss": -6.361735820770264, "global_step": 90170, "epoch": 2146} {"train_loss": -6.297861099243164, "global_step": 90171, "epoch": 2146} {"train_loss": -6.233312129974365, "global_step": 90172, "epoch": 2146} {"train_loss": -6.261505501610892, "global_step": 90173, "epoch": 2146, "val_loss": 63192.203125} {"train_loss": -6.195954322814941, "global_step": 90174, "epoch": 2147} {"train_loss": -6.265615940093994, "global_step": 90175, "epoch": 2147} {"train_loss": -6.2827677726745605, "global_step": 90176, "epoch": 2147} {"train_loss": -6.1211442947387695, "global_step": 90177, "epoch": 2147} {"train_loss": -6.22917366027832, "global_step": 90178, "epoch": 2147} {"train_loss": -6.340121269226074, "global_step": 90179, "epoch": 2147} {"train_loss": -6.167636871337891, "global_step": 90180, "epoch": 2147} {"train_loss": -6.197354793548584, "global_step": 90181, "epoch": 2147} {"train_loss": -6.2969465255737305, "global_step": 90182, "epoch": 2147} {"train_loss": -6.286642551422119, "global_step": 90183, "epoch": 2147} {"train_loss": -6.3184356689453125, "global_step": 90184, "epoch": 2147} {"train_loss": -6.161511421203613, "global_step": 90185, "epoch": 2147} {"train_loss": -6.367051124572754, "global_step": 90186, "epoch": 2147} {"train_loss": -6.181861877441406, "global_step": 90187, "epoch": 2147} {"train_loss": -6.329400062561035, "global_step": 90188, "epoch": 2147} {"train_loss": -6.181864261627197, "global_step": 90189, "epoch": 2147} {"train_loss": -6.256424427032471, "global_step": 90190, "epoch": 2147} {"train_loss": -6.319319248199463, "global_step": 90191, "epoch": 2147} {"train_loss": -6.213749885559082, "global_step": 90192, "epoch": 2147} {"train_loss": -6.290323257446289, "global_step": 90193, "epoch": 2147} {"train_loss": -6.1964311599731445, "global_step": 90194, "epoch": 2147} {"train_loss": -6.13334321975708, "global_step": 90195, "epoch": 2147} {"train_loss": -6.189235687255859, "global_step": 90196, "epoch": 2147} {"train_loss": -6.257126331329346, "global_step": 90197, "epoch": 2147} {"train_loss": -6.214632987976074, "global_step": 90198, "epoch": 2147} {"train_loss": -6.234976768493652, "global_step": 90199, "epoch": 2147} {"train_loss": -6.195955276489258, "global_step": 90200, "epoch": 2147} {"train_loss": -6.2929887771606445, "global_step": 90201, "epoch": 2147} {"train_loss": -6.155272960662842, "global_step": 90202, "epoch": 2147} {"train_loss": -6.2036848068237305, "global_step": 90203, "epoch": 2147} {"train_loss": -6.246859550476074, "global_step": 90204, "epoch": 2147} {"train_loss": -6.171928405761719, "global_step": 90205, "epoch": 2147} {"train_loss": -6.1855573654174805, "global_step": 90206, "epoch": 2147} {"train_loss": -6.284549236297607, "global_step": 90207, "epoch": 2147} {"train_loss": -6.266968250274658, "global_step": 90208, "epoch": 2147} {"train_loss": -6.234208583831787, "global_step": 90209, "epoch": 2147} {"train_loss": -6.177700996398926, "global_step": 90210, "epoch": 2147} {"train_loss": -6.25098991394043, "global_step": 90211, "epoch": 2147} {"train_loss": -6.039584159851074, "global_step": 90212, "epoch": 2147} {"train_loss": -6.177553653717041, "global_step": 90213, "epoch": 2147} {"train_loss": -6.208072662353516, "global_step": 90214, "epoch": 2147} {"train_loss": -6.226583957672119, "global_step": 90215, "epoch": 2147, "val_loss": 63254.9453125} {"train_loss": -6.156172752380371, "global_step": 90216, "epoch": 2148} {"train_loss": -6.326369285583496, "global_step": 90217, "epoch": 2148} {"train_loss": -6.224328517913818, "global_step": 90218, "epoch": 2148} {"train_loss": -6.200301647186279, "global_step": 90219, "epoch": 2148} {"train_loss": -6.203631401062012, "global_step": 90220, "epoch": 2148} {"train_loss": -6.335890769958496, "global_step": 90221, "epoch": 2148} {"train_loss": -6.257568359375, "global_step": 90222, "epoch": 2148} {"train_loss": -6.3129801750183105, "global_step": 90223, "epoch": 2148} {"train_loss": -6.178702354431152, "global_step": 90224, "epoch": 2148} {"train_loss": -6.243564605712891, "global_step": 90225, "epoch": 2148} {"train_loss": -6.236320972442627, "global_step": 90226, "epoch": 2148} {"train_loss": -6.300985813140869, "global_step": 90227, "epoch": 2148} {"train_loss": -6.256178855895996, "global_step": 90228, "epoch": 2148} {"train_loss": -6.249238967895508, "global_step": 90229, "epoch": 2148} {"train_loss": -6.187788009643555, "global_step": 90230, "epoch": 2148} {"train_loss": -6.238188743591309, "global_step": 90231, "epoch": 2148} {"train_loss": -6.230923652648926, "global_step": 90232, "epoch": 2148} {"train_loss": -6.188493728637695, "global_step": 90233, "epoch": 2148} {"train_loss": -6.182599067687988, "global_step": 90234, "epoch": 2148} {"train_loss": -6.1794209480285645, "global_step": 90235, "epoch": 2148} {"train_loss": -6.242460250854492, "global_step": 90236, "epoch": 2148} {"train_loss": -6.228489875793457, "global_step": 90237, "epoch": 2148} {"train_loss": -6.305803298950195, "global_step": 90238, "epoch": 2148} {"train_loss": -6.294921875, "global_step": 90239, "epoch": 2148} {"train_loss": -6.234023094177246, "global_step": 90240, "epoch": 2148} {"train_loss": -6.3082122802734375, "global_step": 90241, "epoch": 2148} {"train_loss": -6.246757507324219, "global_step": 90242, "epoch": 2148} {"train_loss": -6.265444755554199, "global_step": 90243, "epoch": 2148} {"train_loss": -6.215737342834473, "global_step": 90244, "epoch": 2148} {"train_loss": -6.084747314453125, "global_step": 90245, "epoch": 2148} {"train_loss": -6.346443176269531, "global_step": 90246, "epoch": 2148} {"train_loss": -6.235024929046631, "global_step": 90247, "epoch": 2148} {"train_loss": -6.226602554321289, "global_step": 90248, "epoch": 2148} {"train_loss": -6.124669551849365, "global_step": 90249, "epoch": 2148} {"train_loss": -6.296372413635254, "global_step": 90250, "epoch": 2148} {"train_loss": -6.206408500671387, "global_step": 90251, "epoch": 2148} {"train_loss": -6.2873663902282715, "global_step": 90252, "epoch": 2148} {"train_loss": -6.229018688201904, "global_step": 90253, "epoch": 2148} {"train_loss": -6.206047058105469, "global_step": 90254, "epoch": 2148} {"train_loss": -6.194276809692383, "global_step": 90255, "epoch": 2148} {"train_loss": -6.010378837585449, "global_step": 90256, "epoch": 2148} {"train_loss": -6.233431736628215, "global_step": 90257, "epoch": 2148, "val_loss": 63221.19921875} {"train_loss": -6.21526575088501, "global_step": 90258, "epoch": 2149} {"train_loss": -6.076831817626953, "global_step": 90259, "epoch": 2149} {"train_loss": -6.256193161010742, "global_step": 90260, "epoch": 2149} {"train_loss": -6.09506893157959, "global_step": 90261, "epoch": 2149} {"train_loss": -6.118310928344727, "global_step": 90262, "epoch": 2149} {"train_loss": -6.249224662780762, "global_step": 90263, "epoch": 2149} {"train_loss": -6.065306663513184, "global_step": 90264, "epoch": 2149} {"train_loss": -6.102721214294434, "global_step": 90265, "epoch": 2149} {"train_loss": -6.112045764923096, "global_step": 90266, "epoch": 2149} {"train_loss": -6.232842445373535, "global_step": 90267, "epoch": 2149} {"train_loss": -6.142605781555176, "global_step": 90268, "epoch": 2149} {"train_loss": -6.189981460571289, "global_step": 90269, "epoch": 2149} {"train_loss": -6.078394412994385, "global_step": 90270, "epoch": 2149} {"train_loss": -6.168726444244385, "global_step": 90271, "epoch": 2149} {"train_loss": -6.180627822875977, "global_step": 90272, "epoch": 2149} {"train_loss": -6.2382965087890625, "global_step": 90273, "epoch": 2149} {"train_loss": -6.272833824157715, "global_step": 90274, "epoch": 2149} {"train_loss": -6.203086853027344, "global_step": 90275, "epoch": 2149} {"train_loss": -6.204859733581543, "global_step": 90276, "epoch": 2149} {"train_loss": -6.2840142250061035, "global_step": 90277, "epoch": 2149} {"train_loss": -6.3003458976745605, "global_step": 90278, "epoch": 2149} {"train_loss": -6.211191177368164, "global_step": 90279, "epoch": 2149} {"train_loss": -6.336507320404053, "global_step": 90280, "epoch": 2149} {"train_loss": -6.236359596252441, "global_step": 90281, "epoch": 2149} {"train_loss": -6.400155067443848, "global_step": 90282, "epoch": 2149} {"train_loss": -6.408877372741699, "global_step": 90283, "epoch": 2149} {"train_loss": -6.254260063171387, "global_step": 90284, "epoch": 2149} {"train_loss": -6.282671928405762, "global_step": 90285, "epoch": 2149} {"train_loss": -6.345278263092041, "global_step": 90286, "epoch": 2149} {"train_loss": -6.259090423583984, "global_step": 90287, "epoch": 2149} {"train_loss": -6.262370586395264, "global_step": 90288, "epoch": 2149} {"train_loss": -6.349703788757324, "global_step": 90289, "epoch": 2149} {"train_loss": -6.167046070098877, "global_step": 90290, "epoch": 2149} {"train_loss": -6.2483038902282715, "global_step": 90291, "epoch": 2149} {"train_loss": -6.252208709716797, "global_step": 90292, "epoch": 2149} {"train_loss": -6.248273849487305, "global_step": 90293, "epoch": 2149} {"train_loss": -6.349481582641602, "global_step": 90294, "epoch": 2149} {"train_loss": -6.328409194946289, "global_step": 90295, "epoch": 2149} {"train_loss": -6.243958473205566, "global_step": 90296, "epoch": 2149} {"train_loss": -6.334466934204102, "global_step": 90297, "epoch": 2149} {"train_loss": -6.288054466247559, "global_step": 90298, "epoch": 2149} {"train_loss": -6.2311374459947855, "global_step": 90299, "epoch": 2149, "val_loss": 62986.24609375} {"train_loss": -6.184761047363281, "global_step": 90300, "epoch": 2150} {"train_loss": -6.268101692199707, "global_step": 90301, "epoch": 2150} {"train_loss": -6.299762725830078, "global_step": 90302, "epoch": 2150} {"train_loss": -6.322318077087402, "global_step": 90303, "epoch": 2150} {"train_loss": -6.24925422668457, "global_step": 90304, "epoch": 2150} {"train_loss": -6.263125419616699, "global_step": 90305, "epoch": 2150} {"train_loss": -6.3037238121032715, "global_step": 90306, "epoch": 2150} {"train_loss": -6.155317306518555, "global_step": 90307, "epoch": 2150} {"train_loss": -6.2085161209106445, "global_step": 90308, "epoch": 2150} {"train_loss": -6.261773109436035, "global_step": 90309, "epoch": 2150} {"train_loss": -6.307933330535889, "global_step": 90310, "epoch": 2150} {"train_loss": -6.423321723937988, "global_step": 90311, "epoch": 2150} {"train_loss": -6.212946891784668, "global_step": 90312, "epoch": 2150} {"train_loss": -6.3657755851745605, "global_step": 90313, "epoch": 2150} {"train_loss": -6.254652976989746, "global_step": 90314, "epoch": 2150} {"train_loss": -6.2500410079956055, "global_step": 90315, "epoch": 2150} {"train_loss": -6.295499801635742, "global_step": 90316, "epoch": 2150} {"train_loss": -6.289859771728516, "global_step": 90317, "epoch": 2150} {"train_loss": -6.264847755432129, "global_step": 90318, "epoch": 2150} {"train_loss": -6.243488311767578, "global_step": 90319, "epoch": 2150} {"train_loss": -6.265857219696045, "global_step": 90320, "epoch": 2150} {"train_loss": -6.223781585693359, "global_step": 90321, "epoch": 2150} {"train_loss": -6.275393962860107, "global_step": 90322, "epoch": 2150} {"train_loss": -6.217001914978027, "global_step": 90323, "epoch": 2150} {"train_loss": -6.155045986175537, "global_step": 90324, "epoch": 2150} {"train_loss": -6.297303676605225, "global_step": 90325, "epoch": 2150} {"train_loss": -6.303732872009277, "global_step": 90326, "epoch": 2150} {"train_loss": -6.277509689331055, "global_step": 90327, "epoch": 2150} {"train_loss": -6.3046159744262695, "global_step": 90328, "epoch": 2150} {"train_loss": -6.251431465148926, "global_step": 90329, "epoch": 2150} {"train_loss": -6.292201042175293, "global_step": 90330, "epoch": 2150} {"train_loss": -6.3712286949157715, "global_step": 90331, "epoch": 2150} {"train_loss": -6.317098140716553, "global_step": 90332, "epoch": 2150} {"train_loss": -6.265901565551758, "global_step": 90333, "epoch": 2150} {"train_loss": -6.274707794189453, "global_step": 90334, "epoch": 2150} {"train_loss": -6.259111404418945, "global_step": 90335, "epoch": 2150} {"train_loss": -6.178023338317871, "global_step": 90336, "epoch": 2150} {"train_loss": -6.142746925354004, "global_step": 90337, "epoch": 2150} {"train_loss": -6.321690559387207, "global_step": 90338, "epoch": 2150} {"train_loss": -6.362094402313232, "global_step": 90339, "epoch": 2150} {"train_loss": -6.30721378326416, "global_step": 90340, "epoch": 2150} {"train_loss": -6.2663482938494, "global_step": 90341, "epoch": 2150, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.6959234015635173, "train/sim_max_reward_2": 0.5564735438849577, "train/sim_max_reward_3": 0.8900739739324064, "train/sim_max_reward_4": 0.8964526147654395, "train/sim_max_reward_5": 0.8568881336571068, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5346715181398239, "test/sim_max_reward_4300002": 0.7396772013687546, "test/sim_max_reward_4300003": 0.8383551714208906, "test/sim_max_reward_4300004": 0.33212107361957066, "test/sim_max_reward_4300005": 0.40727233294544013, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.8415448185558836, "test/sim_max_reward_4300008": 0.41967176841570114, "test/sim_max_reward_4300009": 0.9411141789207268, "test/sim_max_reward_4300010": 1.0, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.407894113014345, "test/sim_max_reward_4300014": 0.9773930473818382, "test/sim_max_reward_4300015": 0.9455256174668892, "test/sim_max_reward_4300016": 0.9901708182320155, "test/sim_max_reward_4300017": 0.7508538570132189, "test/sim_max_reward_4300018": 0.37233336905610764, "test/sim_max_reward_4300019": 0.186700697705285, "test/sim_max_reward_4300020": 0.900716680675871, "test/sim_max_reward_4300021": 0.9625982324981921, "test/sim_max_reward_4300022": 0.8712957571344339, "test/sim_max_reward_4300023": 0.33635255573637257, "test/sim_max_reward_4300024": 0.9610582630958187, "test/sim_max_reward_4300025": 0.9538134400404888, "test/sim_max_reward_4300026": 0.14923442192186204, "test/sim_max_reward_4300027": 0.0, "test/sim_max_reward_4300028": 0.788590797402764, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.35041853733253514, "test/sim_max_reward_4300031": 0.9539076757343093, "test/sim_max_reward_4300032": 0.9476377197167836, "test/sim_max_reward_4300033": 0.9584036254688061, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.378186432044245, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9081452812472024, "test/sim_max_reward_4300038": 0.8539532902330614, "test/sim_max_reward_4300039": 0.9948210726558626, "test/sim_max_reward_4300040": 0.2429841480905784, "test/sim_max_reward_4300041": 0.23515324676728236, "test/sim_max_reward_4300042": 0.6890730715666817, "test/sim_max_reward_4300043": 0.09003424390002039, "test/sim_max_reward_4300044": 0.7355771115387248, "test/sim_max_reward_4300045": 0.971174222658767, "test/sim_max_reward_4300046": 0.8696650969986993, "test/sim_max_reward_4300047": 0.9305504462786868, "test/sim_max_reward_4300048": 0.8322752993629019, "test/sim_max_reward_4300049": 0.14651517709765716, "train/mean_score": 0.6810181940682467, "test/mean_score": 0.6179325909203716, "val_loss": 63223.7734375} {"train_loss": -6.261188507080078, "global_step": 90342, "epoch": 2151} {"train_loss": -6.270401477813721, "global_step": 90343, "epoch": 2151} {"train_loss": -6.316755294799805, "global_step": 90344, "epoch": 2151} {"train_loss": -6.216177940368652, "global_step": 90345, "epoch": 2151} {"train_loss": -6.221774101257324, "global_step": 90346, "epoch": 2151} {"train_loss": -6.191034317016602, "global_step": 90347, "epoch": 2151} {"train_loss": -6.3335161209106445, "global_step": 90348, "epoch": 2151} {"train_loss": -6.252782821655273, "global_step": 90349, "epoch": 2151} {"train_loss": -6.2993693351745605, "global_step": 90350, "epoch": 2151} {"train_loss": -6.182263374328613, "global_step": 90351, "epoch": 2151} {"train_loss": -6.255414009094238, "global_step": 90352, "epoch": 2151} {"train_loss": -6.3676605224609375, "global_step": 90353, "epoch": 2151} {"train_loss": -6.2646379470825195, "global_step": 90354, "epoch": 2151} {"train_loss": -6.37913179397583, "global_step": 90355, "epoch": 2151} {"train_loss": -6.313688278198242, "global_step": 90356, "epoch": 2151} {"train_loss": -6.3445329666137695, "global_step": 90357, "epoch": 2151} {"train_loss": -6.332695007324219, "global_step": 90358, "epoch": 2151} {"train_loss": -6.2180280685424805, "global_step": 90359, "epoch": 2151} {"train_loss": -6.326687335968018, "global_step": 90360, "epoch": 2151} {"train_loss": -6.222658157348633, "global_step": 90361, "epoch": 2151} {"train_loss": -6.302955150604248, "global_step": 90362, "epoch": 2151} {"train_loss": -6.269433975219727, "global_step": 90363, "epoch": 2151} {"train_loss": -6.283439636230469, "global_step": 90364, "epoch": 2151} {"train_loss": -6.405393600463867, "global_step": 90365, "epoch": 2151} {"train_loss": -6.2732086181640625, "global_step": 90366, "epoch": 2151} {"train_loss": -6.301862716674805, "global_step": 90367, "epoch": 2151} {"train_loss": -6.242180824279785, "global_step": 90368, "epoch": 2151} {"train_loss": -6.306130409240723, "global_step": 90369, "epoch": 2151} {"train_loss": -6.308603763580322, "global_step": 90370, "epoch": 2151} {"train_loss": -6.270137310028076, "global_step": 90371, "epoch": 2151} {"train_loss": -6.225229740142822, "global_step": 90372, "epoch": 2151} {"train_loss": -6.2324371337890625, "global_step": 90373, "epoch": 2151} {"train_loss": -6.244563102722168, "global_step": 90374, "epoch": 2151} {"train_loss": -6.188998699188232, "global_step": 90375, "epoch": 2151} {"train_loss": -6.319700241088867, "global_step": 90376, "epoch": 2151} {"train_loss": -6.3333892822265625, "global_step": 90377, "epoch": 2151} {"train_loss": -6.244573593139648, "global_step": 90378, "epoch": 2151} {"train_loss": -6.292729377746582, "global_step": 90379, "epoch": 2151} {"train_loss": -6.235483169555664, "global_step": 90380, "epoch": 2151} {"train_loss": -6.290714263916016, "global_step": 90381, "epoch": 2151} {"train_loss": -6.2994585037231445, "global_step": 90382, "epoch": 2151} {"train_loss": -6.279566730771746, "global_step": 90383, "epoch": 2151, "val_loss": 63361.80078125} {"train_loss": -6.241995811462402, "global_step": 90384, "epoch": 2152} {"train_loss": -6.255027770996094, "global_step": 90385, "epoch": 2152} {"train_loss": -6.270279884338379, "global_step": 90386, "epoch": 2152} {"train_loss": -6.263923645019531, "global_step": 90387, "epoch": 2152} {"train_loss": -6.280642509460449, "global_step": 90388, "epoch": 2152} {"train_loss": -6.394355773925781, "global_step": 90389, "epoch": 2152} {"train_loss": -6.326667785644531, "global_step": 90390, "epoch": 2152} {"train_loss": -6.381224632263184, "global_step": 90391, "epoch": 2152} {"train_loss": -6.289844512939453, "global_step": 90392, "epoch": 2152} {"train_loss": -6.3815016746521, "global_step": 90393, "epoch": 2152} {"train_loss": -6.295558929443359, "global_step": 90394, "epoch": 2152} {"train_loss": -6.262697219848633, "global_step": 90395, "epoch": 2152} {"train_loss": -6.310062885284424, "global_step": 90396, "epoch": 2152} {"train_loss": -6.273249626159668, "global_step": 90397, "epoch": 2152} {"train_loss": -6.363052845001221, "global_step": 90398, "epoch": 2152} {"train_loss": -6.295838356018066, "global_step": 90399, "epoch": 2152} {"train_loss": -6.051372051239014, "global_step": 90400, "epoch": 2152} {"train_loss": -6.220362663269043, "global_step": 90401, "epoch": 2152} {"train_loss": -6.3508992195129395, "global_step": 90402, "epoch": 2152} {"train_loss": -6.223356246948242, "global_step": 90403, "epoch": 2152} {"train_loss": -6.096640586853027, "global_step": 90404, "epoch": 2152} {"train_loss": -6.154140949249268, "global_step": 90405, "epoch": 2152} {"train_loss": -6.17864465713501, "global_step": 90406, "epoch": 2152} {"train_loss": -6.265113830566406, "global_step": 90407, "epoch": 2152} {"train_loss": -6.098379135131836, "global_step": 90408, "epoch": 2152} {"train_loss": -6.173696517944336, "global_step": 90409, "epoch": 2152} {"train_loss": -6.112250328063965, "global_step": 90410, "epoch": 2152} {"train_loss": -6.178361415863037, "global_step": 90411, "epoch": 2152} {"train_loss": -6.190512180328369, "global_step": 90412, "epoch": 2152} {"train_loss": -6.167564868927002, "global_step": 90413, "epoch": 2152} {"train_loss": -6.2366943359375, "global_step": 90414, "epoch": 2152} {"train_loss": -6.166247367858887, "global_step": 90415, "epoch": 2152} {"train_loss": -6.330039024353027, "global_step": 90416, "epoch": 2152} {"train_loss": -6.216546058654785, "global_step": 90417, "epoch": 2152} {"train_loss": -6.223703861236572, "global_step": 90418, "epoch": 2152} {"train_loss": -6.283390045166016, "global_step": 90419, "epoch": 2152} {"train_loss": -6.202220916748047, "global_step": 90420, "epoch": 2152} {"train_loss": -6.266323089599609, "global_step": 90421, "epoch": 2152} {"train_loss": -6.250619888305664, "global_step": 90422, "epoch": 2152} {"train_loss": -6.248586654663086, "global_step": 90423, "epoch": 2152} {"train_loss": -6.200075626373291, "global_step": 90424, "epoch": 2152} {"train_loss": -6.241838409787133, "global_step": 90425, "epoch": 2152, "val_loss": 63066.1640625} {"train_loss": -6.315823078155518, "global_step": 90426, "epoch": 2153} {"train_loss": -6.245453834533691, "global_step": 90427, "epoch": 2153} {"train_loss": -6.153338432312012, "global_step": 90428, "epoch": 2153} {"train_loss": -6.189815044403076, "global_step": 90429, "epoch": 2153} {"train_loss": -6.190559387207031, "global_step": 90430, "epoch": 2153} {"train_loss": -6.215860843658447, "global_step": 90431, "epoch": 2153} {"train_loss": -6.13558292388916, "global_step": 90432, "epoch": 2153} {"train_loss": -6.314894199371338, "global_step": 90433, "epoch": 2153} {"train_loss": -6.3466620445251465, "global_step": 90434, "epoch": 2153} {"train_loss": -6.22802209854126, "global_step": 90435, "epoch": 2153} {"train_loss": -6.172949314117432, "global_step": 90436, "epoch": 2153} {"train_loss": -6.3481950759887695, "global_step": 90437, "epoch": 2153} {"train_loss": -6.21400260925293, "global_step": 90438, "epoch": 2153} {"train_loss": -6.15910530090332, "global_step": 90439, "epoch": 2153} {"train_loss": -6.244969844818115, "global_step": 90440, "epoch": 2153} {"train_loss": -6.203439712524414, "global_step": 90441, "epoch": 2153} {"train_loss": -6.306149482727051, "global_step": 90442, "epoch": 2153} {"train_loss": -6.273170471191406, "global_step": 90443, "epoch": 2153} {"train_loss": -6.182777404785156, "global_step": 90444, "epoch": 2153} {"train_loss": -6.327391624450684, "global_step": 90445, "epoch": 2153} {"train_loss": -6.154421806335449, "global_step": 90446, "epoch": 2153} {"train_loss": -6.263693809509277, "global_step": 90447, "epoch": 2153} {"train_loss": -6.266600608825684, "global_step": 90448, "epoch": 2153} {"train_loss": -6.30120849609375, "global_step": 90449, "epoch": 2153} {"train_loss": -6.133910179138184, "global_step": 90450, "epoch": 2153} {"train_loss": -6.248203754425049, "global_step": 90451, "epoch": 2153} {"train_loss": -6.29270076751709, "global_step": 90452, "epoch": 2153} {"train_loss": -6.071508407592773, "global_step": 90453, "epoch": 2153} {"train_loss": -6.249442100524902, "global_step": 90454, "epoch": 2153} {"train_loss": -6.189737319946289, "global_step": 90455, "epoch": 2153} {"train_loss": -6.18988561630249, "global_step": 90456, "epoch": 2153} {"train_loss": -6.21400260925293, "global_step": 90457, "epoch": 2153} {"train_loss": -6.3588175773620605, "global_step": 90458, "epoch": 2153} {"train_loss": -6.187572479248047, "global_step": 90459, "epoch": 2153} {"train_loss": -6.239254951477051, "global_step": 90460, "epoch": 2153} {"train_loss": -6.192544460296631, "global_step": 90461, "epoch": 2153} {"train_loss": -6.3018999099731445, "global_step": 90462, "epoch": 2153} {"train_loss": -6.361236572265625, "global_step": 90463, "epoch": 2153} {"train_loss": -6.408647537231445, "global_step": 90464, "epoch": 2153} {"train_loss": -6.184161186218262, "global_step": 90465, "epoch": 2153} {"train_loss": -6.114290237426758, "global_step": 90466, "epoch": 2153} {"train_loss": -6.236007906141735, "global_step": 90467, "epoch": 2153, "val_loss": 63196.11328125} {"train_loss": -6.1321539878845215, "global_step": 90468, "epoch": 2154} {"train_loss": -6.142428398132324, "global_step": 90469, "epoch": 2154} {"train_loss": -6.175992012023926, "global_step": 90470, "epoch": 2154} {"train_loss": -6.384142875671387, "global_step": 90471, "epoch": 2154} {"train_loss": -6.276356220245361, "global_step": 90472, "epoch": 2154} {"train_loss": -6.165983200073242, "global_step": 90473, "epoch": 2154} {"train_loss": -6.263033866882324, "global_step": 90474, "epoch": 2154} {"train_loss": -6.195653915405273, "global_step": 90475, "epoch": 2154} {"train_loss": -6.186346054077148, "global_step": 90476, "epoch": 2154} {"train_loss": -6.308743000030518, "global_step": 90477, "epoch": 2154} {"train_loss": -6.317130088806152, "global_step": 90478, "epoch": 2154} {"train_loss": -6.277247428894043, "global_step": 90479, "epoch": 2154} {"train_loss": -6.234318256378174, "global_step": 90480, "epoch": 2154} {"train_loss": -6.310628890991211, "global_step": 90481, "epoch": 2154} {"train_loss": -6.281494140625, "global_step": 90482, "epoch": 2154} {"train_loss": -6.322525978088379, "global_step": 90483, "epoch": 2154} {"train_loss": -6.227537155151367, "global_step": 90484, "epoch": 2154} {"train_loss": -6.286386966705322, "global_step": 90485, "epoch": 2154} {"train_loss": -6.308841705322266, "global_step": 90486, "epoch": 2154} {"train_loss": -6.2803425788879395, "global_step": 90487, "epoch": 2154} {"train_loss": -6.279412746429443, "global_step": 90488, "epoch": 2154} {"train_loss": -6.24788761138916, "global_step": 90489, "epoch": 2154} {"train_loss": -6.389376640319824, "global_step": 90490, "epoch": 2154} {"train_loss": -6.248183727264404, "global_step": 90491, "epoch": 2154} {"train_loss": -6.290169715881348, "global_step": 90492, "epoch": 2154} {"train_loss": -6.251304626464844, "global_step": 90493, "epoch": 2154} {"train_loss": -6.294880390167236, "global_step": 90494, "epoch": 2154} {"train_loss": -6.25785493850708, "global_step": 90495, "epoch": 2154} {"train_loss": -6.282858371734619, "global_step": 90496, "epoch": 2154} {"train_loss": -6.29785680770874, "global_step": 90497, "epoch": 2154} {"train_loss": -6.232795715332031, "global_step": 90498, "epoch": 2154} {"train_loss": -6.254796028137207, "global_step": 90499, "epoch": 2154} {"train_loss": -6.2701334953308105, "global_step": 90500, "epoch": 2154} {"train_loss": -6.193583011627197, "global_step": 90501, "epoch": 2154} {"train_loss": -6.223428726196289, "global_step": 90502, "epoch": 2154} {"train_loss": -6.167492866516113, "global_step": 90503, "epoch": 2154} {"train_loss": -6.313641548156738, "global_step": 90504, "epoch": 2154} {"train_loss": -6.224701881408691, "global_step": 90505, "epoch": 2154} {"train_loss": -6.271040916442871, "global_step": 90506, "epoch": 2154} {"train_loss": -6.225319862365723, "global_step": 90507, "epoch": 2154} {"train_loss": -6.134306907653809, "global_step": 90508, "epoch": 2154} {"train_loss": -6.254149402890887, "global_step": 90509, "epoch": 2154, "val_loss": 63288.3046875} {"train_loss": -6.261638641357422, "global_step": 90510, "epoch": 2155} {"train_loss": -6.319767475128174, "global_step": 90511, "epoch": 2155} {"train_loss": -6.298130989074707, "global_step": 90512, "epoch": 2155} {"train_loss": -6.2130045890808105, "global_step": 90513, "epoch": 2155} {"train_loss": -6.258064270019531, "global_step": 90514, "epoch": 2155} {"train_loss": -6.206615447998047, "global_step": 90515, "epoch": 2155} {"train_loss": -6.248881816864014, "global_step": 90516, "epoch": 2155} {"train_loss": -6.394048690795898, "global_step": 90517, "epoch": 2155} {"train_loss": -6.207803726196289, "global_step": 90518, "epoch": 2155} {"train_loss": -6.325674057006836, "global_step": 90519, "epoch": 2155} {"train_loss": -6.335936546325684, "global_step": 90520, "epoch": 2155} {"train_loss": -6.246532440185547, "global_step": 90521, "epoch": 2155} {"train_loss": -6.305174350738525, "global_step": 90522, "epoch": 2155} {"train_loss": -6.224247932434082, "global_step": 90523, "epoch": 2155} {"train_loss": -6.171310901641846, "global_step": 90524, "epoch": 2155} {"train_loss": -6.281989097595215, "global_step": 90525, "epoch": 2155} {"train_loss": -6.284772872924805, "global_step": 90526, "epoch": 2155} {"train_loss": -6.3544111251831055, "global_step": 90527, "epoch": 2155} {"train_loss": -6.393226623535156, "global_step": 90528, "epoch": 2155} {"train_loss": -6.36012077331543, "global_step": 90529, "epoch": 2155} {"train_loss": -6.311643600463867, "global_step": 90530, "epoch": 2155} {"train_loss": -6.348149299621582, "global_step": 90531, "epoch": 2155} {"train_loss": -6.157161712646484, "global_step": 90532, "epoch": 2155} {"train_loss": -6.224215030670166, "global_step": 90533, "epoch": 2155} {"train_loss": -6.263002395629883, "global_step": 90534, "epoch": 2155} {"train_loss": -6.2656097412109375, "global_step": 90535, "epoch": 2155} {"train_loss": -6.330120086669922, "global_step": 90536, "epoch": 2155} {"train_loss": -6.221879959106445, "global_step": 90537, "epoch": 2155} {"train_loss": -6.400974273681641, "global_step": 90538, "epoch": 2155} {"train_loss": -6.266812801361084, "global_step": 90539, "epoch": 2155} {"train_loss": -6.3225202560424805, "global_step": 90540, "epoch": 2155} {"train_loss": -6.347043037414551, "global_step": 90541, "epoch": 2155} {"train_loss": -6.20689058303833, "global_step": 90542, "epoch": 2155} {"train_loss": -6.263096809387207, "global_step": 90543, "epoch": 2155} {"train_loss": -6.202243804931641, "global_step": 90544, "epoch": 2155} {"train_loss": -6.360177993774414, "global_step": 90545, "epoch": 2155} {"train_loss": -6.163295745849609, "global_step": 90546, "epoch": 2155} {"train_loss": -6.368984222412109, "global_step": 90547, "epoch": 2155} {"train_loss": -6.257055282592773, "global_step": 90548, "epoch": 2155} {"train_loss": -6.333659648895264, "global_step": 90549, "epoch": 2155} {"train_loss": -6.330656051635742, "global_step": 90550, "epoch": 2155} {"train_loss": -6.285479239055088, "global_step": 90551, "epoch": 2155, "val_loss": 63109.01953125} {"train_loss": -6.307950019836426, "global_step": 90552, "epoch": 2156} {"train_loss": -6.275508403778076, "global_step": 90553, "epoch": 2156} {"train_loss": -6.250173568725586, "global_step": 90554, "epoch": 2156} {"train_loss": -6.214312553405762, "global_step": 90555, "epoch": 2156} {"train_loss": -6.29233455657959, "global_step": 90556, "epoch": 2156} {"train_loss": -6.375979900360107, "global_step": 90557, "epoch": 2156} {"train_loss": -6.241142272949219, "global_step": 90558, "epoch": 2156} {"train_loss": -6.319936752319336, "global_step": 90559, "epoch": 2156} {"train_loss": -6.357710838317871, "global_step": 90560, "epoch": 2156} {"train_loss": -6.263401031494141, "global_step": 90561, "epoch": 2156} {"train_loss": -6.205977916717529, "global_step": 90562, "epoch": 2156} {"train_loss": -6.192509174346924, "global_step": 90563, "epoch": 2156} {"train_loss": -6.281531810760498, "global_step": 90564, "epoch": 2156} {"train_loss": -6.287993431091309, "global_step": 90565, "epoch": 2156} {"train_loss": -6.237760543823242, "global_step": 90566, "epoch": 2156} {"train_loss": -6.2771782875061035, "global_step": 90567, "epoch": 2156} {"train_loss": -6.332379341125488, "global_step": 90568, "epoch": 2156} {"train_loss": -6.278835773468018, "global_step": 90569, "epoch": 2156} {"train_loss": -6.280584812164307, "global_step": 90570, "epoch": 2156} {"train_loss": -6.367785453796387, "global_step": 90571, "epoch": 2156} {"train_loss": -6.168732166290283, "global_step": 90572, "epoch": 2156} {"train_loss": -6.210114479064941, "global_step": 90573, "epoch": 2156} {"train_loss": -6.348031044006348, "global_step": 90574, "epoch": 2156} {"train_loss": -6.47249698638916, "global_step": 90575, "epoch": 2156} {"train_loss": -6.282773017883301, "global_step": 90576, "epoch": 2156} {"train_loss": -6.316149711608887, "global_step": 90577, "epoch": 2156} {"train_loss": -6.133700370788574, "global_step": 90578, "epoch": 2156} {"train_loss": -6.349737167358398, "global_step": 90579, "epoch": 2156} {"train_loss": -6.299307346343994, "global_step": 90580, "epoch": 2156} {"train_loss": -6.082657814025879, "global_step": 90581, "epoch": 2156} {"train_loss": -6.323978424072266, "global_step": 90582, "epoch": 2156} {"train_loss": -6.329911708831787, "global_step": 90583, "epoch": 2156} {"train_loss": -6.166778564453125, "global_step": 90584, "epoch": 2156} {"train_loss": -6.302666664123535, "global_step": 90585, "epoch": 2156} {"train_loss": -6.184511661529541, "global_step": 90586, "epoch": 2156} {"train_loss": -6.071102142333984, "global_step": 90587, "epoch": 2156} {"train_loss": -6.101019859313965, "global_step": 90588, "epoch": 2156} {"train_loss": -6.212223052978516, "global_step": 90589, "epoch": 2156} {"train_loss": -6.255246162414551, "global_step": 90590, "epoch": 2156} {"train_loss": -6.302604675292969, "global_step": 90591, "epoch": 2156} {"train_loss": -6.313811302185059, "global_step": 90592, "epoch": 2156} {"train_loss": -6.264381340571812, "global_step": 90593, "epoch": 2156, "val_loss": 63351.58203125} {"train_loss": -6.254550933837891, "global_step": 90594, "epoch": 2157} {"train_loss": -6.302148342132568, "global_step": 90595, "epoch": 2157} {"train_loss": -6.1219587326049805, "global_step": 90596, "epoch": 2157} {"train_loss": -6.269039154052734, "global_step": 90597, "epoch": 2157} {"train_loss": -6.3504486083984375, "global_step": 90598, "epoch": 2157} {"train_loss": -6.25872802734375, "global_step": 90599, "epoch": 2157} {"train_loss": -6.147714614868164, "global_step": 90600, "epoch": 2157} {"train_loss": -6.262613296508789, "global_step": 90601, "epoch": 2157} {"train_loss": -6.284881591796875, "global_step": 90602, "epoch": 2157} {"train_loss": -6.2489824295043945, "global_step": 90603, "epoch": 2157} {"train_loss": -6.308565139770508, "global_step": 90604, "epoch": 2157} {"train_loss": -6.234807014465332, "global_step": 90605, "epoch": 2157} {"train_loss": -6.219461441040039, "global_step": 90606, "epoch": 2157} {"train_loss": -6.378383636474609, "global_step": 90607, "epoch": 2157} {"train_loss": -6.408912658691406, "global_step": 90608, "epoch": 2157} {"train_loss": -6.304103851318359, "global_step": 90609, "epoch": 2157} {"train_loss": -6.225707054138184, "global_step": 90610, "epoch": 2157} {"train_loss": -6.391690254211426, "global_step": 90611, "epoch": 2157} {"train_loss": -6.34329891204834, "global_step": 90612, "epoch": 2157} {"train_loss": -6.206876754760742, "global_step": 90613, "epoch": 2157} {"train_loss": -6.375078201293945, "global_step": 90614, "epoch": 2157} {"train_loss": -6.234172821044922, "global_step": 90615, "epoch": 2157} {"train_loss": -6.2847161293029785, "global_step": 90616, "epoch": 2157} {"train_loss": -6.1768798828125, "global_step": 90617, "epoch": 2157} {"train_loss": -6.345088958740234, "global_step": 90618, "epoch": 2157} {"train_loss": -6.263577461242676, "global_step": 90619, "epoch": 2157} {"train_loss": -6.293188095092773, "global_step": 90620, "epoch": 2157} {"train_loss": -6.170536041259766, "global_step": 90621, "epoch": 2157} {"train_loss": -6.332164287567139, "global_step": 90622, "epoch": 2157} {"train_loss": -6.345978736877441, "global_step": 90623, "epoch": 2157} {"train_loss": -6.2728657722473145, "global_step": 90624, "epoch": 2157} {"train_loss": -6.269472122192383, "global_step": 90625, "epoch": 2157} {"train_loss": -6.271965026855469, "global_step": 90626, "epoch": 2157} {"train_loss": -6.2936015129089355, "global_step": 90627, "epoch": 2157} {"train_loss": -6.174271583557129, "global_step": 90628, "epoch": 2157} {"train_loss": -6.26027774810791, "global_step": 90629, "epoch": 2157} {"train_loss": -6.365461349487305, "global_step": 90630, "epoch": 2157} {"train_loss": -6.170289039611816, "global_step": 90631, "epoch": 2157} {"train_loss": -6.3343024253845215, "global_step": 90632, "epoch": 2157} {"train_loss": -6.247721195220947, "global_step": 90633, "epoch": 2157} {"train_loss": -6.341557502746582, "global_step": 90634, "epoch": 2157} {"train_loss": -6.275188309805734, "global_step": 90635, "epoch": 2157, "val_loss": 63060.93359375} {"train_loss": -6.3801751136779785, "global_step": 90636, "epoch": 2158} {"train_loss": -6.25321102142334, "global_step": 90637, "epoch": 2158} {"train_loss": -6.365799903869629, "global_step": 90638, "epoch": 2158} {"train_loss": -6.297580242156982, "global_step": 90639, "epoch": 2158} {"train_loss": -6.190361022949219, "global_step": 90640, "epoch": 2158} {"train_loss": -6.334968566894531, "global_step": 90641, "epoch": 2158} {"train_loss": -6.2682294845581055, "global_step": 90642, "epoch": 2158} {"train_loss": -6.284842014312744, "global_step": 90643, "epoch": 2158} {"train_loss": -6.320649147033691, "global_step": 90644, "epoch": 2158} {"train_loss": -6.196990013122559, "global_step": 90645, "epoch": 2158} {"train_loss": -6.220425605773926, "global_step": 90646, "epoch": 2158} {"train_loss": -6.214547157287598, "global_step": 90647, "epoch": 2158} {"train_loss": -6.27386474609375, "global_step": 90648, "epoch": 2158} {"train_loss": -6.142907619476318, "global_step": 90649, "epoch": 2158} {"train_loss": -6.219248294830322, "global_step": 90650, "epoch": 2158} {"train_loss": -6.3022685050964355, "global_step": 90651, "epoch": 2158} {"train_loss": -6.268171310424805, "global_step": 90652, "epoch": 2158} {"train_loss": -6.211735725402832, "global_step": 90653, "epoch": 2158} {"train_loss": -6.261855602264404, "global_step": 90654, "epoch": 2158} {"train_loss": -6.173162937164307, "global_step": 90655, "epoch": 2158} {"train_loss": -6.254477024078369, "global_step": 90656, "epoch": 2158} {"train_loss": -6.210110664367676, "global_step": 90657, "epoch": 2158} {"train_loss": -6.1652069091796875, "global_step": 90658, "epoch": 2158} {"train_loss": -6.115315914154053, "global_step": 90659, "epoch": 2158} {"train_loss": -6.188241958618164, "global_step": 90660, "epoch": 2158} {"train_loss": -6.156648635864258, "global_step": 90661, "epoch": 2158} {"train_loss": -5.983355522155762, "global_step": 90662, "epoch": 2158} {"train_loss": -6.286336898803711, "global_step": 90663, "epoch": 2158} {"train_loss": -6.259151458740234, "global_step": 90664, "epoch": 2158} {"train_loss": -6.14237642288208, "global_step": 90665, "epoch": 2158} {"train_loss": -6.108551502227783, "global_step": 90666, "epoch": 2158} {"train_loss": -6.2193145751953125, "global_step": 90667, "epoch": 2158} {"train_loss": -6.254754066467285, "global_step": 90668, "epoch": 2158} {"train_loss": -6.258071422576904, "global_step": 90669, "epoch": 2158} {"train_loss": -6.350751876831055, "global_step": 90670, "epoch": 2158} {"train_loss": -6.234123229980469, "global_step": 90671, "epoch": 2158} {"train_loss": -6.33525276184082, "global_step": 90672, "epoch": 2158} {"train_loss": -6.122160911560059, "global_step": 90673, "epoch": 2158} {"train_loss": -6.348343849182129, "global_step": 90674, "epoch": 2158} {"train_loss": -6.106903076171875, "global_step": 90675, "epoch": 2158} {"train_loss": -6.181150436401367, "global_step": 90676, "epoch": 2158} {"train_loss": -6.232257763544719, "global_step": 90677, "epoch": 2158, "val_loss": 63079.4921875} {"train_loss": -6.299530029296875, "global_step": 90678, "epoch": 2159} {"train_loss": -6.297267436981201, "global_step": 90679, "epoch": 2159} {"train_loss": -6.325711727142334, "global_step": 90680, "epoch": 2159} {"train_loss": -6.1887969970703125, "global_step": 90681, "epoch": 2159} {"train_loss": -6.365164756774902, "global_step": 90682, "epoch": 2159} {"train_loss": -6.339953899383545, "global_step": 90683, "epoch": 2159} {"train_loss": -6.447802543640137, "global_step": 90684, "epoch": 2159} {"train_loss": -6.27536678314209, "global_step": 90685, "epoch": 2159} {"train_loss": -6.144654750823975, "global_step": 90686, "epoch": 2159} {"train_loss": -6.365422248840332, "global_step": 90687, "epoch": 2159} {"train_loss": -6.251624584197998, "global_step": 90688, "epoch": 2159} {"train_loss": -6.204478740692139, "global_step": 90689, "epoch": 2159} {"train_loss": -6.3322248458862305, "global_step": 90690, "epoch": 2159} {"train_loss": -6.321857452392578, "global_step": 90691, "epoch": 2159} {"train_loss": -6.2198638916015625, "global_step": 90692, "epoch": 2159} {"train_loss": -6.168082237243652, "global_step": 90693, "epoch": 2159} {"train_loss": -6.365453243255615, "global_step": 90694, "epoch": 2159} {"train_loss": -6.194025039672852, "global_step": 90695, "epoch": 2159} {"train_loss": -6.059989929199219, "global_step": 90696, "epoch": 2159} {"train_loss": -6.3094964027404785, "global_step": 90697, "epoch": 2159} {"train_loss": -6.124247074127197, "global_step": 90698, "epoch": 2159} {"train_loss": -6.186437606811523, "global_step": 90699, "epoch": 2159} {"train_loss": -6.220047950744629, "global_step": 90700, "epoch": 2159} {"train_loss": -6.084562301635742, "global_step": 90701, "epoch": 2159} {"train_loss": -6.327826976776123, "global_step": 90702, "epoch": 2159} {"train_loss": -6.177944183349609, "global_step": 90703, "epoch": 2159} {"train_loss": -6.248955726623535, "global_step": 90704, "epoch": 2159} {"train_loss": -6.239047050476074, "global_step": 90705, "epoch": 2159} {"train_loss": -6.211462020874023, "global_step": 90706, "epoch": 2159} {"train_loss": -6.251461982727051, "global_step": 90707, "epoch": 2159} {"train_loss": -6.204099655151367, "global_step": 90708, "epoch": 2159} {"train_loss": -6.197196006774902, "global_step": 90709, "epoch": 2159} {"train_loss": -6.1092023849487305, "global_step": 90710, "epoch": 2159} {"train_loss": -6.213491439819336, "global_step": 90711, "epoch": 2159} {"train_loss": -6.377129077911377, "global_step": 90712, "epoch": 2159} {"train_loss": -6.217423439025879, "global_step": 90713, "epoch": 2159} {"train_loss": -6.293999671936035, "global_step": 90714, "epoch": 2159} {"train_loss": -6.262270927429199, "global_step": 90715, "epoch": 2159} {"train_loss": -6.179806709289551, "global_step": 90716, "epoch": 2159} {"train_loss": -6.234175205230713, "global_step": 90717, "epoch": 2159} {"train_loss": -6.321911334991455, "global_step": 90718, "epoch": 2159} {"train_loss": -6.249608891350882, "global_step": 90719, "epoch": 2159, "val_loss": 63294.30078125} {"train_loss": -6.200377464294434, "global_step": 90720, "epoch": 2160} {"train_loss": -6.283873558044434, "global_step": 90721, "epoch": 2160} {"train_loss": -6.376125335693359, "global_step": 90722, "epoch": 2160} {"train_loss": -6.32762336730957, "global_step": 90723, "epoch": 2160} {"train_loss": -6.165313720703125, "global_step": 90724, "epoch": 2160} {"train_loss": -6.19140625, "global_step": 90725, "epoch": 2160} {"train_loss": -6.291272163391113, "global_step": 90726, "epoch": 2160} {"train_loss": -6.113018989562988, "global_step": 90727, "epoch": 2160} {"train_loss": -6.221652030944824, "global_step": 90728, "epoch": 2160} {"train_loss": -6.214252471923828, "global_step": 90729, "epoch": 2160} {"train_loss": -6.311591148376465, "global_step": 90730, "epoch": 2160} {"train_loss": -6.2308669090271, "global_step": 90731, "epoch": 2160} {"train_loss": -6.327569961547852, "global_step": 90732, "epoch": 2160} {"train_loss": -6.248078346252441, "global_step": 90733, "epoch": 2160} {"train_loss": -6.3101606369018555, "global_step": 90734, "epoch": 2160} {"train_loss": -6.381608963012695, "global_step": 90735, "epoch": 2160} {"train_loss": -6.180136680603027, "global_step": 90736, "epoch": 2160} {"train_loss": -6.325685024261475, "global_step": 90737, "epoch": 2160} {"train_loss": -6.2603864669799805, "global_step": 90738, "epoch": 2160} {"train_loss": -6.228768348693848, "global_step": 90739, "epoch": 2160} {"train_loss": -6.352189064025879, "global_step": 90740, "epoch": 2160} {"train_loss": -6.202683925628662, "global_step": 90741, "epoch": 2160} {"train_loss": -6.307293891906738, "global_step": 90742, "epoch": 2160} {"train_loss": -6.342226028442383, "global_step": 90743, "epoch": 2160} {"train_loss": -6.228747367858887, "global_step": 90744, "epoch": 2160} {"train_loss": -6.2616448402404785, "global_step": 90745, "epoch": 2160} {"train_loss": -6.287372589111328, "global_step": 90746, "epoch": 2160} {"train_loss": -6.38588285446167, "global_step": 90747, "epoch": 2160} {"train_loss": -6.377386093139648, "global_step": 90748, "epoch": 2160} {"train_loss": -6.245771408081055, "global_step": 90749, "epoch": 2160} {"train_loss": -6.228332042694092, "global_step": 90750, "epoch": 2160} {"train_loss": -6.217987060546875, "global_step": 90751, "epoch": 2160} {"train_loss": -6.291007041931152, "global_step": 90752, "epoch": 2160} {"train_loss": -6.276449203491211, "global_step": 90753, "epoch": 2160} {"train_loss": -6.361849784851074, "global_step": 90754, "epoch": 2160} {"train_loss": -6.31507682800293, "global_step": 90755, "epoch": 2160} {"train_loss": -6.27284574508667, "global_step": 90756, "epoch": 2160} {"train_loss": -6.189974784851074, "global_step": 90757, "epoch": 2160} {"train_loss": -6.3767805099487305, "global_step": 90758, "epoch": 2160} {"train_loss": -6.2432050704956055, "global_step": 90759, "epoch": 2160} {"train_loss": -6.186611175537109, "global_step": 90760, "epoch": 2160} {"train_loss": -6.27478830019633, "global_step": 90761, "epoch": 2160, "val_loss": 63355.63671875} {"train_loss": -6.326412200927734, "global_step": 90762, "epoch": 2161} {"train_loss": -6.3333330154418945, "global_step": 90763, "epoch": 2161} {"train_loss": -6.319492340087891, "global_step": 90764, "epoch": 2161} {"train_loss": -6.363348960876465, "global_step": 90765, "epoch": 2161} {"train_loss": -6.14167594909668, "global_step": 90766, "epoch": 2161} {"train_loss": -6.233193874359131, "global_step": 90767, "epoch": 2161} {"train_loss": -6.1685004234313965, "global_step": 90768, "epoch": 2161} {"train_loss": -6.114009857177734, "global_step": 90769, "epoch": 2161} {"train_loss": -6.0747504234313965, "global_step": 90770, "epoch": 2161} {"train_loss": -6.2886152267456055, "global_step": 90771, "epoch": 2161} {"train_loss": -6.168499946594238, "global_step": 90772, "epoch": 2161} {"train_loss": -6.120932579040527, "global_step": 90773, "epoch": 2161} {"train_loss": -6.209952354431152, "global_step": 90774, "epoch": 2161} {"train_loss": -6.216466903686523, "global_step": 90775, "epoch": 2161} {"train_loss": -6.237269878387451, "global_step": 90776, "epoch": 2161} {"train_loss": -6.258340835571289, "global_step": 90777, "epoch": 2161} {"train_loss": -6.272939682006836, "global_step": 90778, "epoch": 2161} {"train_loss": -6.243165016174316, "global_step": 90779, "epoch": 2161} {"train_loss": -6.315694808959961, "global_step": 90780, "epoch": 2161} {"train_loss": -6.168217658996582, "global_step": 90781, "epoch": 2161} {"train_loss": -6.341914653778076, "global_step": 90782, "epoch": 2161} {"train_loss": -6.263638019561768, "global_step": 90783, "epoch": 2161} {"train_loss": -6.189692497253418, "global_step": 90784, "epoch": 2161} {"train_loss": -6.261379718780518, "global_step": 90785, "epoch": 2161} {"train_loss": -6.211717128753662, "global_step": 90786, "epoch": 2161} {"train_loss": -6.325222015380859, "global_step": 90787, "epoch": 2161} {"train_loss": -6.425474643707275, "global_step": 90788, "epoch": 2161} {"train_loss": -6.283321380615234, "global_step": 90789, "epoch": 2161} {"train_loss": -6.29567813873291, "global_step": 90790, "epoch": 2161} {"train_loss": -6.276522159576416, "global_step": 90791, "epoch": 2161} {"train_loss": -6.218031406402588, "global_step": 90792, "epoch": 2161} {"train_loss": -6.184453010559082, "global_step": 90793, "epoch": 2161} {"train_loss": -6.156221866607666, "global_step": 90794, "epoch": 2161} {"train_loss": -6.234642505645752, "global_step": 90795, "epoch": 2161} {"train_loss": -6.229979991912842, "global_step": 90796, "epoch": 2161} {"train_loss": -6.32225227355957, "global_step": 90797, "epoch": 2161} {"train_loss": -6.2064208984375, "global_step": 90798, "epoch": 2161} {"train_loss": -6.076204299926758, "global_step": 90799, "epoch": 2161} {"train_loss": -6.103602409362793, "global_step": 90800, "epoch": 2161} {"train_loss": -6.281107425689697, "global_step": 90801, "epoch": 2161} {"train_loss": -6.224513053894043, "global_step": 90802, "epoch": 2161} {"train_loss": -6.239022561482021, "global_step": 90803, "epoch": 2161, "val_loss": 63019.30078125} {"train_loss": -6.36553430557251, "global_step": 90804, "epoch": 2162} {"train_loss": -6.3594160079956055, "global_step": 90805, "epoch": 2162} {"train_loss": -6.260498046875, "global_step": 90806, "epoch": 2162} {"train_loss": -6.224997520446777, "global_step": 90807, "epoch": 2162} {"train_loss": -6.305020332336426, "global_step": 90808, "epoch": 2162} {"train_loss": -6.331592559814453, "global_step": 90809, "epoch": 2162} {"train_loss": -6.3319783210754395, "global_step": 90810, "epoch": 2162} {"train_loss": -6.2811689376831055, "global_step": 90811, "epoch": 2162} {"train_loss": -6.311699867248535, "global_step": 90812, "epoch": 2162} {"train_loss": -6.232561111450195, "global_step": 90813, "epoch": 2162} {"train_loss": -6.2816057205200195, "global_step": 90814, "epoch": 2162} {"train_loss": -6.194943904876709, "global_step": 90815, "epoch": 2162} {"train_loss": -6.276504039764404, "global_step": 90816, "epoch": 2162} {"train_loss": -6.3820929527282715, "global_step": 90817, "epoch": 2162} {"train_loss": -6.338076114654541, "global_step": 90818, "epoch": 2162} {"train_loss": -6.312678337097168, "global_step": 90819, "epoch": 2162} {"train_loss": -6.343051910400391, "global_step": 90820, "epoch": 2162} {"train_loss": -6.3831987380981445, "global_step": 90821, "epoch": 2162} {"train_loss": -6.2831292152404785, "global_step": 90822, "epoch": 2162} {"train_loss": -6.367937088012695, "global_step": 90823, "epoch": 2162} {"train_loss": -6.291837215423584, "global_step": 90824, "epoch": 2162} {"train_loss": -6.1860270500183105, "global_step": 90825, "epoch": 2162} {"train_loss": -6.229748725891113, "global_step": 90826, "epoch": 2162} {"train_loss": -6.426837921142578, "global_step": 90827, "epoch": 2162} {"train_loss": -6.070721626281738, "global_step": 90828, "epoch": 2162} {"train_loss": -6.1180524826049805, "global_step": 90829, "epoch": 2162} {"train_loss": -6.303075790405273, "global_step": 90830, "epoch": 2162} {"train_loss": -6.278408527374268, "global_step": 90831, "epoch": 2162} {"train_loss": -6.269518852233887, "global_step": 90832, "epoch": 2162} {"train_loss": -6.307541847229004, "global_step": 90833, "epoch": 2162} {"train_loss": -6.234445571899414, "global_step": 90834, "epoch": 2162} {"train_loss": -6.191343307495117, "global_step": 90835, "epoch": 2162} {"train_loss": -6.273092746734619, "global_step": 90836, "epoch": 2162} {"train_loss": -6.313690185546875, "global_step": 90837, "epoch": 2162} {"train_loss": -6.1401591300964355, "global_step": 90838, "epoch": 2162} {"train_loss": -6.245333194732666, "global_step": 90839, "epoch": 2162} {"train_loss": -6.208259105682373, "global_step": 90840, "epoch": 2162} {"train_loss": -6.164043426513672, "global_step": 90841, "epoch": 2162} {"train_loss": -6.211475372314453, "global_step": 90842, "epoch": 2162} {"train_loss": -6.241220951080322, "global_step": 90843, "epoch": 2162} {"train_loss": -6.0685834884643555, "global_step": 90844, "epoch": 2162} {"train_loss": -6.2662450813111805, "global_step": 90845, "epoch": 2162, "val_loss": 63261.31640625} {"train_loss": -6.207937240600586, "global_step": 90846, "epoch": 2163} {"train_loss": -6.238724708557129, "global_step": 90847, "epoch": 2163} {"train_loss": -6.272924423217773, "global_step": 90848, "epoch": 2163} {"train_loss": -6.225408554077148, "global_step": 90849, "epoch": 2163} {"train_loss": -6.168745040893555, "global_step": 90850, "epoch": 2163} {"train_loss": -6.186178684234619, "global_step": 90851, "epoch": 2163} {"train_loss": -6.17323112487793, "global_step": 90852, "epoch": 2163} {"train_loss": -6.241497993469238, "global_step": 90853, "epoch": 2163} {"train_loss": -6.310674667358398, "global_step": 90854, "epoch": 2163} {"train_loss": -6.145639419555664, "global_step": 90855, "epoch": 2163} {"train_loss": -6.392120838165283, "global_step": 90856, "epoch": 2163} {"train_loss": -6.037995338439941, "global_step": 90857, "epoch": 2163} {"train_loss": -6.332601070404053, "global_step": 90858, "epoch": 2163} {"train_loss": -6.028176307678223, "global_step": 90859, "epoch": 2163} {"train_loss": -6.210786819458008, "global_step": 90860, "epoch": 2163} {"train_loss": -6.128948211669922, "global_step": 90861, "epoch": 2163} {"train_loss": -6.206674575805664, "global_step": 90862, "epoch": 2163} {"train_loss": -6.204540252685547, "global_step": 90863, "epoch": 2163} {"train_loss": -6.176609992980957, "global_step": 90864, "epoch": 2163} {"train_loss": -6.237176418304443, "global_step": 90865, "epoch": 2163} {"train_loss": -6.124423027038574, "global_step": 90866, "epoch": 2163} {"train_loss": -6.370555877685547, "global_step": 90867, "epoch": 2163} {"train_loss": -6.250792503356934, "global_step": 90868, "epoch": 2163} {"train_loss": -6.286293029785156, "global_step": 90869, "epoch": 2163} {"train_loss": -6.244599342346191, "global_step": 90870, "epoch": 2163} {"train_loss": -6.170398712158203, "global_step": 90871, "epoch": 2163} {"train_loss": -6.206242561340332, "global_step": 90872, "epoch": 2163} {"train_loss": -6.190228462219238, "global_step": 90873, "epoch": 2163} {"train_loss": -6.219542980194092, "global_step": 90874, "epoch": 2163} {"train_loss": -6.275444030761719, "global_step": 90875, "epoch": 2163} {"train_loss": -6.330726146697998, "global_step": 90876, "epoch": 2163} {"train_loss": -6.314236640930176, "global_step": 90877, "epoch": 2163} {"train_loss": -6.337644577026367, "global_step": 90878, "epoch": 2163} {"train_loss": -6.233479022979736, "global_step": 90879, "epoch": 2163} {"train_loss": -6.27720832824707, "global_step": 90880, "epoch": 2163} {"train_loss": -6.177947998046875, "global_step": 90881, "epoch": 2163} {"train_loss": -6.209632873535156, "global_step": 90882, "epoch": 2163} {"train_loss": -6.261967182159424, "global_step": 90883, "epoch": 2163} {"train_loss": -6.098052978515625, "global_step": 90884, "epoch": 2163} {"train_loss": -6.233564376831055, "global_step": 90885, "epoch": 2163} {"train_loss": -6.238637924194336, "global_step": 90886, "epoch": 2163} {"train_loss": -6.222594317935762, "global_step": 90887, "epoch": 2163, "val_loss": 63176.19921875} {"train_loss": -6.218741416931152, "global_step": 90888, "epoch": 2164} {"train_loss": -6.224189281463623, "global_step": 90889, "epoch": 2164} {"train_loss": -6.3541669845581055, "global_step": 90890, "epoch": 2164} {"train_loss": -6.221933364868164, "global_step": 90891, "epoch": 2164} {"train_loss": -6.3214545249938965, "global_step": 90892, "epoch": 2164} {"train_loss": -6.2453718185424805, "global_step": 90893, "epoch": 2164} {"train_loss": -6.359286308288574, "global_step": 90894, "epoch": 2164} {"train_loss": -6.27591609954834, "global_step": 90895, "epoch": 2164} {"train_loss": -6.2835893630981445, "global_step": 90896, "epoch": 2164} {"train_loss": -6.196529388427734, "global_step": 90897, "epoch": 2164} {"train_loss": -6.157955169677734, "global_step": 90898, "epoch": 2164} {"train_loss": -6.348329544067383, "global_step": 90899, "epoch": 2164} {"train_loss": -6.278739929199219, "global_step": 90900, "epoch": 2164} {"train_loss": -6.246840476989746, "global_step": 90901, "epoch": 2164} {"train_loss": -6.312297821044922, "global_step": 90902, "epoch": 2164} {"train_loss": -6.255720138549805, "global_step": 90903, "epoch": 2164} {"train_loss": -6.269415855407715, "global_step": 90904, "epoch": 2164} {"train_loss": -6.3940205574035645, "global_step": 90905, "epoch": 2164} {"train_loss": -6.3240485191345215, "global_step": 90906, "epoch": 2164} {"train_loss": -6.4284539222717285, "global_step": 90907, "epoch": 2164} {"train_loss": -6.344083309173584, "global_step": 90908, "epoch": 2164} {"train_loss": -6.3062424659729, "global_step": 90909, "epoch": 2164} {"train_loss": -6.310973644256592, "global_step": 90910, "epoch": 2164} {"train_loss": -6.283486366271973, "global_step": 90911, "epoch": 2164} {"train_loss": -6.243232727050781, "global_step": 90912, "epoch": 2164} {"train_loss": -6.310347557067871, "global_step": 90913, "epoch": 2164} {"train_loss": -6.178177833557129, "global_step": 90914, "epoch": 2164} {"train_loss": -6.306340217590332, "global_step": 90915, "epoch": 2164} {"train_loss": -6.232420921325684, "global_step": 90916, "epoch": 2164} {"train_loss": -6.169363975524902, "global_step": 90917, "epoch": 2164} {"train_loss": -6.205084800720215, "global_step": 90918, "epoch": 2164} {"train_loss": -6.133792877197266, "global_step": 90919, "epoch": 2164} {"train_loss": -6.254844665527344, "global_step": 90920, "epoch": 2164} {"train_loss": -6.171379089355469, "global_step": 90921, "epoch": 2164} {"train_loss": -6.331499099731445, "global_step": 90922, "epoch": 2164} {"train_loss": -6.320555686950684, "global_step": 90923, "epoch": 2164} {"train_loss": -6.220742225646973, "global_step": 90924, "epoch": 2164} {"train_loss": -6.254067420959473, "global_step": 90925, "epoch": 2164} {"train_loss": -6.336577415466309, "global_step": 90926, "epoch": 2164} {"train_loss": -6.327550888061523, "global_step": 90927, "epoch": 2164} {"train_loss": -6.262378692626953, "global_step": 90928, "epoch": 2164} {"train_loss": -6.27378005073184, "global_step": 90929, "epoch": 2164, "val_loss": 63344.0546875} {"train_loss": -6.337625503540039, "global_step": 90930, "epoch": 2165} {"train_loss": -6.204926490783691, "global_step": 90931, "epoch": 2165} {"train_loss": -6.28093957901001, "global_step": 90932, "epoch": 2165} {"train_loss": -6.28257942199707, "global_step": 90933, "epoch": 2165} {"train_loss": -6.1443986892700195, "global_step": 90934, "epoch": 2165} {"train_loss": -6.1927995681762695, "global_step": 90935, "epoch": 2165} {"train_loss": -6.220679759979248, "global_step": 90936, "epoch": 2165} {"train_loss": -6.31353235244751, "global_step": 90937, "epoch": 2165} {"train_loss": -6.280559539794922, "global_step": 90938, "epoch": 2165} {"train_loss": -6.305304527282715, "global_step": 90939, "epoch": 2165} {"train_loss": -6.180129528045654, "global_step": 90940, "epoch": 2165} {"train_loss": -6.222395896911621, "global_step": 90941, "epoch": 2165} {"train_loss": -6.2309651374816895, "global_step": 90942, "epoch": 2165} {"train_loss": -6.238734245300293, "global_step": 90943, "epoch": 2165} {"train_loss": -6.276156425476074, "global_step": 90944, "epoch": 2165} {"train_loss": -6.2456254959106445, "global_step": 90945, "epoch": 2165} {"train_loss": -6.232453346252441, "global_step": 90946, "epoch": 2165} {"train_loss": -6.268355369567871, "global_step": 90947, "epoch": 2165} {"train_loss": -6.348240375518799, "global_step": 90948, "epoch": 2165} {"train_loss": -6.288366317749023, "global_step": 90949, "epoch": 2165} {"train_loss": -6.3159074783325195, "global_step": 90950, "epoch": 2165} {"train_loss": -6.184844017028809, "global_step": 90951, "epoch": 2165} {"train_loss": -6.233908653259277, "global_step": 90952, "epoch": 2165} {"train_loss": -6.29296875, "global_step": 90953, "epoch": 2165} {"train_loss": -6.230783462524414, "global_step": 90954, "epoch": 2165} {"train_loss": -6.141170024871826, "global_step": 90955, "epoch": 2165} {"train_loss": -6.242010116577148, "global_step": 90956, "epoch": 2165} {"train_loss": -6.193253993988037, "global_step": 90957, "epoch": 2165} {"train_loss": -6.278072834014893, "global_step": 90958, "epoch": 2165} {"train_loss": -6.1165008544921875, "global_step": 90959, "epoch": 2165} {"train_loss": -6.329809188842773, "global_step": 90960, "epoch": 2165} {"train_loss": -6.173293590545654, "global_step": 90961, "epoch": 2165} {"train_loss": -6.293806076049805, "global_step": 90962, "epoch": 2165} {"train_loss": -6.371482849121094, "global_step": 90963, "epoch": 2165} {"train_loss": -6.248748302459717, "global_step": 90964, "epoch": 2165} {"train_loss": -6.240805625915527, "global_step": 90965, "epoch": 2165} {"train_loss": -6.319550037384033, "global_step": 90966, "epoch": 2165} {"train_loss": -6.1912522315979, "global_step": 90967, "epoch": 2165} {"train_loss": -6.1349334716796875, "global_step": 90968, "epoch": 2165} {"train_loss": -6.339024543762207, "global_step": 90969, "epoch": 2165} {"train_loss": -6.199434757232666, "global_step": 90970, "epoch": 2165} {"train_loss": -6.249769142695835, "global_step": 90971, "epoch": 2165, "val_loss": 63169.9140625} {"train_loss": -6.317967414855957, "global_step": 90972, "epoch": 2166} {"train_loss": -6.29812479019165, "global_step": 90973, "epoch": 2166} {"train_loss": -6.294429302215576, "global_step": 90974, "epoch": 2166} {"train_loss": -6.331398963928223, "global_step": 90975, "epoch": 2166} {"train_loss": -6.3105149269104, "global_step": 90976, "epoch": 2166} {"train_loss": -6.274112701416016, "global_step": 90977, "epoch": 2166} {"train_loss": -6.310959339141846, "global_step": 90978, "epoch": 2166} {"train_loss": -6.193022727966309, "global_step": 90979, "epoch": 2166} {"train_loss": -6.324787139892578, "global_step": 90980, "epoch": 2166} {"train_loss": -6.19805908203125, "global_step": 90981, "epoch": 2166} {"train_loss": -6.311650276184082, "global_step": 90982, "epoch": 2166} {"train_loss": -6.254489898681641, "global_step": 90983, "epoch": 2166} {"train_loss": -6.097826957702637, "global_step": 90984, "epoch": 2166} {"train_loss": -6.240392684936523, "global_step": 90985, "epoch": 2166} {"train_loss": -6.290794372558594, "global_step": 90986, "epoch": 2166} {"train_loss": -6.251667022705078, "global_step": 90987, "epoch": 2166} {"train_loss": -6.302804946899414, "global_step": 90988, "epoch": 2166} {"train_loss": -6.348598480224609, "global_step": 90989, "epoch": 2166} {"train_loss": -6.281212329864502, "global_step": 90990, "epoch": 2166} {"train_loss": -6.309122085571289, "global_step": 90991, "epoch": 2166} {"train_loss": -6.3054609298706055, "global_step": 90992, "epoch": 2166} {"train_loss": -6.321101188659668, "global_step": 90993, "epoch": 2166} {"train_loss": -6.31962776184082, "global_step": 90994, "epoch": 2166} {"train_loss": -6.285682678222656, "global_step": 90995, "epoch": 2166} {"train_loss": -6.2467851638793945, "global_step": 90996, "epoch": 2166} {"train_loss": -6.3463544845581055, "global_step": 90997, "epoch": 2166} {"train_loss": -6.3017578125, "global_step": 90998, "epoch": 2166} {"train_loss": -6.303380966186523, "global_step": 90999, "epoch": 2166} {"train_loss": -6.237372875213623, "global_step": 91000, "epoch": 2166} {"train_loss": -6.402656555175781, "global_step": 91001, "epoch": 2166} {"train_loss": -6.3151702880859375, "global_step": 91002, "epoch": 2166} {"train_loss": -6.2459869384765625, "global_step": 91003, "epoch": 2166} {"train_loss": -6.343288421630859, "global_step": 91004, "epoch": 2166} {"train_loss": -6.284684181213379, "global_step": 91005, "epoch": 2166} {"train_loss": -6.198981761932373, "global_step": 91006, "epoch": 2166} {"train_loss": -6.209585189819336, "global_step": 91007, "epoch": 2166} {"train_loss": -6.308428764343262, "global_step": 91008, "epoch": 2166} {"train_loss": -6.3554205894470215, "global_step": 91009, "epoch": 2166} {"train_loss": -6.304043292999268, "global_step": 91010, "epoch": 2166} {"train_loss": -6.269369602203369, "global_step": 91011, "epoch": 2166} {"train_loss": -6.279854774475098, "global_step": 91012, "epoch": 2166} {"train_loss": -6.287095603488741, "global_step": 91013, "epoch": 2166, "val_loss": 63187.99609375} {"train_loss": -6.186630725860596, "global_step": 91014, "epoch": 2167} {"train_loss": -6.253241062164307, "global_step": 91015, "epoch": 2167} {"train_loss": -6.265811443328857, "global_step": 91016, "epoch": 2167} {"train_loss": -6.238493919372559, "global_step": 91017, "epoch": 2167} {"train_loss": -6.265105724334717, "global_step": 91018, "epoch": 2167} {"train_loss": -6.27353572845459, "global_step": 91019, "epoch": 2167} {"train_loss": -6.244219779968262, "global_step": 91020, "epoch": 2167} {"train_loss": -6.394023895263672, "global_step": 91021, "epoch": 2167} {"train_loss": -6.19877815246582, "global_step": 91022, "epoch": 2167} {"train_loss": -6.234919548034668, "global_step": 91023, "epoch": 2167} {"train_loss": -6.162412643432617, "global_step": 91024, "epoch": 2167} {"train_loss": -6.2008466720581055, "global_step": 91025, "epoch": 2167} {"train_loss": -6.218092918395996, "global_step": 91026, "epoch": 2167} {"train_loss": -6.3834428787231445, "global_step": 91027, "epoch": 2167} {"train_loss": -6.104421138763428, "global_step": 91028, "epoch": 2167} {"train_loss": -6.28613805770874, "global_step": 91029, "epoch": 2167} {"train_loss": -6.259552001953125, "global_step": 91030, "epoch": 2167} {"train_loss": -6.219486713409424, "global_step": 91031, "epoch": 2167} {"train_loss": -6.173351287841797, "global_step": 91032, "epoch": 2167} {"train_loss": -6.064556121826172, "global_step": 91033, "epoch": 2167} {"train_loss": -6.132090091705322, "global_step": 91034, "epoch": 2167} {"train_loss": -6.255931854248047, "global_step": 91035, "epoch": 2167} {"train_loss": -6.2157487869262695, "global_step": 91036, "epoch": 2167} {"train_loss": -6.14220666885376, "global_step": 91037, "epoch": 2167} {"train_loss": -6.268144607543945, "global_step": 91038, "epoch": 2167} {"train_loss": -6.138458251953125, "global_step": 91039, "epoch": 2167} {"train_loss": -6.271949768066406, "global_step": 91040, "epoch": 2167} {"train_loss": -6.261880397796631, "global_step": 91041, "epoch": 2167} {"train_loss": -6.12206506729126, "global_step": 91042, "epoch": 2167} {"train_loss": -6.258937835693359, "global_step": 91043, "epoch": 2167} {"train_loss": -6.259303092956543, "global_step": 91044, "epoch": 2167} {"train_loss": -6.309182167053223, "global_step": 91045, "epoch": 2167} {"train_loss": -6.261893272399902, "global_step": 91046, "epoch": 2167} {"train_loss": -6.32460880279541, "global_step": 91047, "epoch": 2167} {"train_loss": -6.283275604248047, "global_step": 91048, "epoch": 2167} {"train_loss": -6.304666519165039, "global_step": 91049, "epoch": 2167} {"train_loss": -6.26318359375, "global_step": 91050, "epoch": 2167} {"train_loss": -6.334808826446533, "global_step": 91051, "epoch": 2167} {"train_loss": -6.358888626098633, "global_step": 91052, "epoch": 2167} {"train_loss": -6.299405574798584, "global_step": 91053, "epoch": 2167} {"train_loss": -6.276816368103027, "global_step": 91054, "epoch": 2167} {"train_loss": -6.242784568241665, "global_step": 91055, "epoch": 2167, "val_loss": 63071.16015625} {"train_loss": -6.280148506164551, "global_step": 91056, "epoch": 2168} {"train_loss": -6.34387731552124, "global_step": 91057, "epoch": 2168} {"train_loss": -6.147380352020264, "global_step": 91058, "epoch": 2168} {"train_loss": -6.294206619262695, "global_step": 91059, "epoch": 2168} {"train_loss": -6.313134670257568, "global_step": 91060, "epoch": 2168} {"train_loss": -6.2950119972229, "global_step": 91061, "epoch": 2168} {"train_loss": -6.264594554901123, "global_step": 91062, "epoch": 2168} {"train_loss": -6.327151298522949, "global_step": 91063, "epoch": 2168} {"train_loss": -6.199720859527588, "global_step": 91064, "epoch": 2168} {"train_loss": -6.219870567321777, "global_step": 91065, "epoch": 2168} {"train_loss": -6.3378753662109375, "global_step": 91066, "epoch": 2168} {"train_loss": -6.200399398803711, "global_step": 91067, "epoch": 2168} {"train_loss": -6.229214191436768, "global_step": 91068, "epoch": 2168} {"train_loss": -6.183952808380127, "global_step": 91069, "epoch": 2168} {"train_loss": -6.317649841308594, "global_step": 91070, "epoch": 2168} {"train_loss": -6.304185390472412, "global_step": 91071, "epoch": 2168} {"train_loss": -6.354281902313232, "global_step": 91072, "epoch": 2168} {"train_loss": -6.196928977966309, "global_step": 91073, "epoch": 2168} {"train_loss": -6.260077476501465, "global_step": 91074, "epoch": 2168} {"train_loss": -6.263035774230957, "global_step": 91075, "epoch": 2168} {"train_loss": -6.279433727264404, "global_step": 91076, "epoch": 2168} {"train_loss": -6.297506332397461, "global_step": 91077, "epoch": 2168} {"train_loss": -6.207453727722168, "global_step": 91078, "epoch": 2168} {"train_loss": -6.422024726867676, "global_step": 91079, "epoch": 2168} {"train_loss": -6.200498580932617, "global_step": 91080, "epoch": 2168} {"train_loss": -6.26643705368042, "global_step": 91081, "epoch": 2168} {"train_loss": -6.355837821960449, "global_step": 91082, "epoch": 2168} {"train_loss": -6.287051677703857, "global_step": 91083, "epoch": 2168} {"train_loss": -6.255861759185791, "global_step": 91084, "epoch": 2168} {"train_loss": -6.212048530578613, "global_step": 91085, "epoch": 2168} {"train_loss": -6.441166400909424, "global_step": 91086, "epoch": 2168} {"train_loss": -6.384079933166504, "global_step": 91087, "epoch": 2168} {"train_loss": -6.248748779296875, "global_step": 91088, "epoch": 2168} {"train_loss": -6.286532402038574, "global_step": 91089, "epoch": 2168} {"train_loss": -6.354673385620117, "global_step": 91090, "epoch": 2168} {"train_loss": -6.375375270843506, "global_step": 91091, "epoch": 2168} {"train_loss": -6.378302574157715, "global_step": 91092, "epoch": 2168} {"train_loss": -6.30192756652832, "global_step": 91093, "epoch": 2168} {"train_loss": -6.322296142578125, "global_step": 91094, "epoch": 2168} {"train_loss": -6.478560447692871, "global_step": 91095, "epoch": 2168} {"train_loss": -6.214823246002197, "global_step": 91096, "epoch": 2168} {"train_loss": -6.289789733432588, "global_step": 91097, "epoch": 2168, "val_loss": 63205.71875} {"train_loss": -6.420097827911377, "global_step": 91098, "epoch": 2169} {"train_loss": -6.363987445831299, "global_step": 91099, "epoch": 2169} {"train_loss": -6.361988067626953, "global_step": 91100, "epoch": 2169} {"train_loss": -6.252007961273193, "global_step": 91101, "epoch": 2169} {"train_loss": -6.304018974304199, "global_step": 91102, "epoch": 2169} {"train_loss": -6.236806869506836, "global_step": 91103, "epoch": 2169} {"train_loss": -6.373106956481934, "global_step": 91104, "epoch": 2169} {"train_loss": -6.35491943359375, "global_step": 91105, "epoch": 2169} {"train_loss": -6.233782768249512, "global_step": 91106, "epoch": 2169} {"train_loss": -6.219959259033203, "global_step": 91107, "epoch": 2169} {"train_loss": -6.314027786254883, "global_step": 91108, "epoch": 2169} {"train_loss": -6.478402137756348, "global_step": 91109, "epoch": 2169} {"train_loss": -6.377167701721191, "global_step": 91110, "epoch": 2169} {"train_loss": -6.326614856719971, "global_step": 91111, "epoch": 2169} {"train_loss": -6.398604869842529, "global_step": 91112, "epoch": 2169} {"train_loss": -6.214970588684082, "global_step": 91113, "epoch": 2169} {"train_loss": -6.208703994750977, "global_step": 91114, "epoch": 2169} {"train_loss": -6.2720794677734375, "global_step": 91115, "epoch": 2169} {"train_loss": -6.31889009475708, "global_step": 91116, "epoch": 2169} {"train_loss": -6.193912982940674, "global_step": 91117, "epoch": 2169} {"train_loss": -6.230031490325928, "global_step": 91118, "epoch": 2169} {"train_loss": -6.380944728851318, "global_step": 91119, "epoch": 2169} {"train_loss": -6.361557960510254, "global_step": 91120, "epoch": 2169} {"train_loss": -6.191158771514893, "global_step": 91121, "epoch": 2169} {"train_loss": -6.345663070678711, "global_step": 91122, "epoch": 2169} {"train_loss": -6.186898708343506, "global_step": 91123, "epoch": 2169} {"train_loss": -6.257789134979248, "global_step": 91124, "epoch": 2169} {"train_loss": -6.192451477050781, "global_step": 91125, "epoch": 2169} {"train_loss": -6.24324369430542, "global_step": 91126, "epoch": 2169} {"train_loss": -6.290633201599121, "global_step": 91127, "epoch": 2169} {"train_loss": -6.239270210266113, "global_step": 91128, "epoch": 2169} {"train_loss": -6.226174354553223, "global_step": 91129, "epoch": 2169} {"train_loss": -6.2109270095825195, "global_step": 91130, "epoch": 2169} {"train_loss": -6.31522274017334, "global_step": 91131, "epoch": 2169} {"train_loss": -6.222583293914795, "global_step": 91132, "epoch": 2169} {"train_loss": -6.258349418640137, "global_step": 91133, "epoch": 2169} {"train_loss": -6.249037742614746, "global_step": 91134, "epoch": 2169} {"train_loss": -6.209883689880371, "global_step": 91135, "epoch": 2169} {"train_loss": -6.324201583862305, "global_step": 91136, "epoch": 2169} {"train_loss": -6.198957920074463, "global_step": 91137, "epoch": 2169} {"train_loss": -6.367937088012695, "global_step": 91138, "epoch": 2169} {"train_loss": -6.284051929201398, "global_step": 91139, "epoch": 2169, "val_loss": 63240.47265625} {"train_loss": -6.257208824157715, "global_step": 91140, "epoch": 2170} {"train_loss": -6.328798294067383, "global_step": 91141, "epoch": 2170} {"train_loss": -6.148489952087402, "global_step": 91142, "epoch": 2170} {"train_loss": -6.284634590148926, "global_step": 91143, "epoch": 2170} {"train_loss": -6.28816032409668, "global_step": 91144, "epoch": 2170} {"train_loss": -6.306883335113525, "global_step": 91145, "epoch": 2170} {"train_loss": -6.3310651779174805, "global_step": 91146, "epoch": 2170} {"train_loss": -6.2967915534973145, "global_step": 91147, "epoch": 2170} {"train_loss": -6.302879810333252, "global_step": 91148, "epoch": 2170} {"train_loss": -6.279027462005615, "global_step": 91149, "epoch": 2170} {"train_loss": -6.262197017669678, "global_step": 91150, "epoch": 2170} {"train_loss": -6.3495893478393555, "global_step": 91151, "epoch": 2170} {"train_loss": -6.279718399047852, "global_step": 91152, "epoch": 2170} {"train_loss": -6.268552780151367, "global_step": 91153, "epoch": 2170} {"train_loss": -6.23110294342041, "global_step": 91154, "epoch": 2170} {"train_loss": -6.156595706939697, "global_step": 91155, "epoch": 2170} {"train_loss": -6.246934413909912, "global_step": 91156, "epoch": 2170} {"train_loss": -6.366661548614502, "global_step": 91157, "epoch": 2170} {"train_loss": -6.3136749267578125, "global_step": 91158, "epoch": 2170} {"train_loss": -6.356617450714111, "global_step": 91159, "epoch": 2170} {"train_loss": -6.233739852905273, "global_step": 91160, "epoch": 2170} {"train_loss": -6.356756687164307, "global_step": 91161, "epoch": 2170} {"train_loss": -6.221126556396484, "global_step": 91162, "epoch": 2170} {"train_loss": -6.294207572937012, "global_step": 91163, "epoch": 2170} {"train_loss": -6.328864097595215, "global_step": 91164, "epoch": 2170} {"train_loss": -6.190888404846191, "global_step": 91165, "epoch": 2170} {"train_loss": -6.208222389221191, "global_step": 91166, "epoch": 2170} {"train_loss": -6.189808368682861, "global_step": 91167, "epoch": 2170} {"train_loss": -6.110013484954834, "global_step": 91168, "epoch": 2170} {"train_loss": -6.349183082580566, "global_step": 91169, "epoch": 2170} {"train_loss": -6.341094017028809, "global_step": 91170, "epoch": 2170} {"train_loss": -6.295798301696777, "global_step": 91171, "epoch": 2170} {"train_loss": -6.33823299407959, "global_step": 91172, "epoch": 2170} {"train_loss": -6.266523361206055, "global_step": 91173, "epoch": 2170} {"train_loss": -6.346405029296875, "global_step": 91174, "epoch": 2170} {"train_loss": -6.279681205749512, "global_step": 91175, "epoch": 2170} {"train_loss": -6.214723110198975, "global_step": 91176, "epoch": 2170} {"train_loss": -6.3490800857543945, "global_step": 91177, "epoch": 2170} {"train_loss": -6.28488826751709, "global_step": 91178, "epoch": 2170} {"train_loss": -6.266058444976807, "global_step": 91179, "epoch": 2170} {"train_loss": -6.31584358215332, "global_step": 91180, "epoch": 2170} {"train_loss": -6.279263269333613, "global_step": 91181, "epoch": 2170, "val_loss": 63251.47265625} {"train_loss": -6.2692742347717285, "global_step": 91182, "epoch": 2171} {"train_loss": -6.346691131591797, "global_step": 91183, "epoch": 2171} {"train_loss": -6.330817222595215, "global_step": 91184, "epoch": 2171} {"train_loss": -6.290802955627441, "global_step": 91185, "epoch": 2171} {"train_loss": -6.146672248840332, "global_step": 91186, "epoch": 2171} {"train_loss": -6.183869361877441, "global_step": 91187, "epoch": 2171} {"train_loss": -6.294339179992676, "global_step": 91188, "epoch": 2171} {"train_loss": -6.18666934967041, "global_step": 91189, "epoch": 2171} {"train_loss": -6.2621636390686035, "global_step": 91190, "epoch": 2171} {"train_loss": -6.18867301940918, "global_step": 91191, "epoch": 2171} {"train_loss": -6.271921157836914, "global_step": 91192, "epoch": 2171} {"train_loss": -6.2688798904418945, "global_step": 91193, "epoch": 2171} {"train_loss": -6.312323570251465, "global_step": 91194, "epoch": 2171} {"train_loss": -6.208261013031006, "global_step": 91195, "epoch": 2171} {"train_loss": -6.257076263427734, "global_step": 91196, "epoch": 2171} {"train_loss": -6.32494592666626, "global_step": 91197, "epoch": 2171} {"train_loss": -6.330819129943848, "global_step": 91198, "epoch": 2171} {"train_loss": -6.3041839599609375, "global_step": 91199, "epoch": 2171} {"train_loss": -6.321242332458496, "global_step": 91200, "epoch": 2171} {"train_loss": -6.36112117767334, "global_step": 91201, "epoch": 2171} {"train_loss": -6.316198348999023, "global_step": 91202, "epoch": 2171} {"train_loss": -6.168798923492432, "global_step": 91203, "epoch": 2171} {"train_loss": -6.321815013885498, "global_step": 91204, "epoch": 2171} {"train_loss": -6.321981430053711, "global_step": 91205, "epoch": 2171} {"train_loss": -6.2337446212768555, "global_step": 91206, "epoch": 2171} {"train_loss": -6.214235305786133, "global_step": 91207, "epoch": 2171} {"train_loss": -6.377772331237793, "global_step": 91208, "epoch": 2171} {"train_loss": -6.298310279846191, "global_step": 91209, "epoch": 2171} {"train_loss": -6.167382717132568, "global_step": 91210, "epoch": 2171} {"train_loss": -6.291405200958252, "global_step": 91211, "epoch": 2171} {"train_loss": -6.359709739685059, "global_step": 91212, "epoch": 2171} {"train_loss": -6.202854156494141, "global_step": 91213, "epoch": 2171} {"train_loss": -6.260998249053955, "global_step": 91214, "epoch": 2171} {"train_loss": -6.155769348144531, "global_step": 91215, "epoch": 2171} {"train_loss": -6.296634674072266, "global_step": 91216, "epoch": 2171} {"train_loss": -6.28924036026001, "global_step": 91217, "epoch": 2171} {"train_loss": -6.240285396575928, "global_step": 91218, "epoch": 2171} {"train_loss": -6.320993900299072, "global_step": 91219, "epoch": 2171} {"train_loss": -6.299384117126465, "global_step": 91220, "epoch": 2171} {"train_loss": -6.3727946281433105, "global_step": 91221, "epoch": 2171} {"train_loss": -6.3639020919799805, "global_step": 91222, "epoch": 2171} {"train_loss": -6.276725019727435, "global_step": 91223, "epoch": 2171, "val_loss": 63311.63671875} {"train_loss": -6.251074314117432, "global_step": 91224, "epoch": 2172} {"train_loss": -6.300080299377441, "global_step": 91225, "epoch": 2172} {"train_loss": -6.279147148132324, "global_step": 91226, "epoch": 2172} {"train_loss": -6.272950172424316, "global_step": 91227, "epoch": 2172} {"train_loss": -6.27140998840332, "global_step": 91228, "epoch": 2172} {"train_loss": -6.266678810119629, "global_step": 91229, "epoch": 2172} {"train_loss": -6.360452651977539, "global_step": 91230, "epoch": 2172} {"train_loss": -6.269664287567139, "global_step": 91231, "epoch": 2172} {"train_loss": -6.167102813720703, "global_step": 91232, "epoch": 2172} {"train_loss": -6.329506874084473, "global_step": 91233, "epoch": 2172} {"train_loss": -6.2513651847839355, "global_step": 91234, "epoch": 2172} {"train_loss": -6.351853370666504, "global_step": 91235, "epoch": 2172} {"train_loss": -6.284793853759766, "global_step": 91236, "epoch": 2172} {"train_loss": -6.214808464050293, "global_step": 91237, "epoch": 2172} {"train_loss": -6.313757419586182, "global_step": 91238, "epoch": 2172} {"train_loss": -6.267692565917969, "global_step": 91239, "epoch": 2172} {"train_loss": -6.367582321166992, "global_step": 91240, "epoch": 2172} {"train_loss": -6.40504789352417, "global_step": 91241, "epoch": 2172} {"train_loss": -6.263120651245117, "global_step": 91242, "epoch": 2172} {"train_loss": -6.339406967163086, "global_step": 91243, "epoch": 2172} {"train_loss": -6.391416072845459, "global_step": 91244, "epoch": 2172} {"train_loss": -6.4042439460754395, "global_step": 91245, "epoch": 2172} {"train_loss": -6.264241695404053, "global_step": 91246, "epoch": 2172} {"train_loss": -6.230587482452393, "global_step": 91247, "epoch": 2172} {"train_loss": -6.2981133460998535, "global_step": 91248, "epoch": 2172} {"train_loss": -6.311507225036621, "global_step": 91249, "epoch": 2172} {"train_loss": -6.298496246337891, "global_step": 91250, "epoch": 2172} {"train_loss": -6.207362174987793, "global_step": 91251, "epoch": 2172} {"train_loss": -6.398811340332031, "global_step": 91252, "epoch": 2172} {"train_loss": -6.283613204956055, "global_step": 91253, "epoch": 2172} {"train_loss": -6.216115951538086, "global_step": 91254, "epoch": 2172} {"train_loss": -6.1626081466674805, "global_step": 91255, "epoch": 2172} {"train_loss": -6.341486930847168, "global_step": 91256, "epoch": 2172} {"train_loss": -6.1700439453125, "global_step": 91257, "epoch": 2172} {"train_loss": -6.318061828613281, "global_step": 91258, "epoch": 2172} {"train_loss": -6.221568584442139, "global_step": 91259, "epoch": 2172} {"train_loss": -6.081147193908691, "global_step": 91260, "epoch": 2172} {"train_loss": -6.1636881828308105, "global_step": 91261, "epoch": 2172} {"train_loss": -6.256711483001709, "global_step": 91262, "epoch": 2172} {"train_loss": -6.209486961364746, "global_step": 91263, "epoch": 2172} {"train_loss": -6.24713659286499, "global_step": 91264, "epoch": 2172} {"train_loss": -6.272743645168486, "global_step": 91265, "epoch": 2172, "val_loss": 63066.4453125} {"train_loss": -6.248686790466309, "global_step": 91266, "epoch": 2173} {"train_loss": -6.226281642913818, "global_step": 91267, "epoch": 2173} {"train_loss": -6.352104187011719, "global_step": 91268, "epoch": 2173} {"train_loss": -6.291861057281494, "global_step": 91269, "epoch": 2173} {"train_loss": -6.25970458984375, "global_step": 91270, "epoch": 2173} {"train_loss": -6.204283714294434, "global_step": 91271, "epoch": 2173} {"train_loss": -6.083040237426758, "global_step": 91272, "epoch": 2173} {"train_loss": -6.308393478393555, "global_step": 91273, "epoch": 2173} {"train_loss": -6.362157821655273, "global_step": 91274, "epoch": 2173} {"train_loss": -6.214354038238525, "global_step": 91275, "epoch": 2173} {"train_loss": -6.287941932678223, "global_step": 91276, "epoch": 2173} {"train_loss": -6.279947757720947, "global_step": 91277, "epoch": 2173} {"train_loss": -6.318236351013184, "global_step": 91278, "epoch": 2173} {"train_loss": -6.203349590301514, "global_step": 91279, "epoch": 2173} {"train_loss": -6.250311851501465, "global_step": 91280, "epoch": 2173} {"train_loss": -6.276829719543457, "global_step": 91281, "epoch": 2173} {"train_loss": -6.130315780639648, "global_step": 91282, "epoch": 2173} {"train_loss": -6.229265213012695, "global_step": 91283, "epoch": 2173} {"train_loss": -6.345573425292969, "global_step": 91284, "epoch": 2173} {"train_loss": -6.282840728759766, "global_step": 91285, "epoch": 2173} {"train_loss": -6.268073558807373, "global_step": 91286, "epoch": 2173} {"train_loss": -6.427071571350098, "global_step": 91287, "epoch": 2173} {"train_loss": -6.339977741241455, "global_step": 91288, "epoch": 2173} {"train_loss": -6.308026313781738, "global_step": 91289, "epoch": 2173} {"train_loss": -6.312260150909424, "global_step": 91290, "epoch": 2173} {"train_loss": -6.303176403045654, "global_step": 91291, "epoch": 2173} {"train_loss": -6.138298034667969, "global_step": 91292, "epoch": 2173} {"train_loss": -6.206727027893066, "global_step": 91293, "epoch": 2173} {"train_loss": -6.231559753417969, "global_step": 91294, "epoch": 2173} {"train_loss": -6.277063369750977, "global_step": 91295, "epoch": 2173} {"train_loss": -6.400087356567383, "global_step": 91296, "epoch": 2173} {"train_loss": -6.257788181304932, "global_step": 91297, "epoch": 2173} {"train_loss": -6.273954391479492, "global_step": 91298, "epoch": 2173} {"train_loss": -6.234596252441406, "global_step": 91299, "epoch": 2173} {"train_loss": -6.168583869934082, "global_step": 91300, "epoch": 2173} {"train_loss": -6.155856132507324, "global_step": 91301, "epoch": 2173} {"train_loss": -6.110340595245361, "global_step": 91302, "epoch": 2173} {"train_loss": -6.387002944946289, "global_step": 91303, "epoch": 2173} {"train_loss": -6.25725793838501, "global_step": 91304, "epoch": 2173} {"train_loss": -6.408727645874023, "global_step": 91305, "epoch": 2173} {"train_loss": -6.217627048492432, "global_step": 91306, "epoch": 2173} {"train_loss": -6.262577908379691, "global_step": 91307, "epoch": 2173, "val_loss": 63203.55078125} {"train_loss": -6.399951457977295, "global_step": 91308, "epoch": 2174} {"train_loss": -6.145038604736328, "global_step": 91309, "epoch": 2174} {"train_loss": -6.2451629638671875, "global_step": 91310, "epoch": 2174} {"train_loss": -6.345361709594727, "global_step": 91311, "epoch": 2174} {"train_loss": -6.277329444885254, "global_step": 91312, "epoch": 2174} {"train_loss": -6.2173752784729, "global_step": 91313, "epoch": 2174} {"train_loss": -6.231361389160156, "global_step": 91314, "epoch": 2174} {"train_loss": -6.161260604858398, "global_step": 91315, "epoch": 2174} {"train_loss": -6.157589912414551, "global_step": 91316, "epoch": 2174} {"train_loss": -6.309237003326416, "global_step": 91317, "epoch": 2174} {"train_loss": -6.256239891052246, "global_step": 91318, "epoch": 2174} {"train_loss": -6.206560134887695, "global_step": 91319, "epoch": 2174} {"train_loss": -6.224442005157471, "global_step": 91320, "epoch": 2174} {"train_loss": -6.2166748046875, "global_step": 91321, "epoch": 2174} {"train_loss": -6.14532470703125, "global_step": 91322, "epoch": 2174} {"train_loss": -6.356000900268555, "global_step": 91323, "epoch": 2174} {"train_loss": -6.175112724304199, "global_step": 91324, "epoch": 2174} {"train_loss": -6.351163864135742, "global_step": 91325, "epoch": 2174} {"train_loss": -6.188632965087891, "global_step": 91326, "epoch": 2174} {"train_loss": -6.185206413269043, "global_step": 91327, "epoch": 2174} {"train_loss": -6.283698558807373, "global_step": 91328, "epoch": 2174} {"train_loss": -6.202124118804932, "global_step": 91329, "epoch": 2174} {"train_loss": -6.345917224884033, "global_step": 91330, "epoch": 2174} {"train_loss": -6.248439311981201, "global_step": 91331, "epoch": 2174} {"train_loss": -6.281069755554199, "global_step": 91332, "epoch": 2174} {"train_loss": -6.232058525085449, "global_step": 91333, "epoch": 2174} {"train_loss": -6.260166645050049, "global_step": 91334, "epoch": 2174} {"train_loss": -6.238431930541992, "global_step": 91335, "epoch": 2174} {"train_loss": -6.367776870727539, "global_step": 91336, "epoch": 2174} {"train_loss": -6.340038299560547, "global_step": 91337, "epoch": 2174} {"train_loss": -6.325462341308594, "global_step": 91338, "epoch": 2174} {"train_loss": -6.257645606994629, "global_step": 91339, "epoch": 2174} {"train_loss": -6.2912492752075195, "global_step": 91340, "epoch": 2174} {"train_loss": -6.207058906555176, "global_step": 91341, "epoch": 2174} {"train_loss": -6.411664962768555, "global_step": 91342, "epoch": 2174} {"train_loss": -6.34157657623291, "global_step": 91343, "epoch": 2174} {"train_loss": -6.367796421051025, "global_step": 91344, "epoch": 2174} {"train_loss": -6.349033355712891, "global_step": 91345, "epoch": 2174} {"train_loss": -6.3520307540893555, "global_step": 91346, "epoch": 2174} {"train_loss": -6.2342963218688965, "global_step": 91347, "epoch": 2174} {"train_loss": -6.307432174682617, "global_step": 91348, "epoch": 2174} {"train_loss": -6.26963852700733, "global_step": 91349, "epoch": 2174, "val_loss": 63144.515625} {"train_loss": -6.188713073730469, "global_step": 91350, "epoch": 2175} {"train_loss": -6.352736473083496, "global_step": 91351, "epoch": 2175} {"train_loss": -6.268945693969727, "global_step": 91352, "epoch": 2175} {"train_loss": -6.229344367980957, "global_step": 91353, "epoch": 2175} {"train_loss": -6.2829909324646, "global_step": 91354, "epoch": 2175} {"train_loss": -6.2590765953063965, "global_step": 91355, "epoch": 2175} {"train_loss": -6.260061740875244, "global_step": 91356, "epoch": 2175} {"train_loss": -6.297576904296875, "global_step": 91357, "epoch": 2175} {"train_loss": -6.365973472595215, "global_step": 91358, "epoch": 2175} {"train_loss": -6.274292945861816, "global_step": 91359, "epoch": 2175} {"train_loss": -6.218043327331543, "global_step": 91360, "epoch": 2175} {"train_loss": -6.279531478881836, "global_step": 91361, "epoch": 2175} {"train_loss": -6.287585258483887, "global_step": 91362, "epoch": 2175} {"train_loss": -6.2408647537231445, "global_step": 91363, "epoch": 2175} {"train_loss": -6.337536334991455, "global_step": 91364, "epoch": 2175} {"train_loss": -6.2722930908203125, "global_step": 91365, "epoch": 2175} {"train_loss": -6.157750129699707, "global_step": 91366, "epoch": 2175} {"train_loss": -6.283822059631348, "global_step": 91367, "epoch": 2175} {"train_loss": -6.193173408508301, "global_step": 91368, "epoch": 2175} {"train_loss": -6.211142539978027, "global_step": 91369, "epoch": 2175} {"train_loss": -6.229585647583008, "global_step": 91370, "epoch": 2175} {"train_loss": -6.248408317565918, "global_step": 91371, "epoch": 2175} {"train_loss": -6.2482404708862305, "global_step": 91372, "epoch": 2175} {"train_loss": -6.268040657043457, "global_step": 91373, "epoch": 2175} {"train_loss": -6.18719482421875, "global_step": 91374, "epoch": 2175} {"train_loss": -6.305365085601807, "global_step": 91375, "epoch": 2175} {"train_loss": -6.346829414367676, "global_step": 91376, "epoch": 2175} {"train_loss": -6.176468849182129, "global_step": 91377, "epoch": 2175} {"train_loss": -6.222756385803223, "global_step": 91378, "epoch": 2175} {"train_loss": -6.308186054229736, "global_step": 91379, "epoch": 2175} {"train_loss": -6.3243913650512695, "global_step": 91380, "epoch": 2175} {"train_loss": -6.303682327270508, "global_step": 91381, "epoch": 2175} {"train_loss": -6.2423014640808105, "global_step": 91382, "epoch": 2175} {"train_loss": -6.267574310302734, "global_step": 91383, "epoch": 2175} {"train_loss": -6.27944803237915, "global_step": 91384, "epoch": 2175} {"train_loss": -6.316195964813232, "global_step": 91385, "epoch": 2175} {"train_loss": -6.331683158874512, "global_step": 91386, "epoch": 2175} {"train_loss": -6.345340728759766, "global_step": 91387, "epoch": 2175} {"train_loss": -6.233298301696777, "global_step": 91388, "epoch": 2175} {"train_loss": -6.256775856018066, "global_step": 91389, "epoch": 2175} {"train_loss": -6.296928405761719, "global_step": 91390, "epoch": 2175} {"train_loss": -6.2681435971033, "global_step": 91391, "epoch": 2175, "val_loss": 63167.546875} {"train_loss": -6.293754577636719, "global_step": 91392, "epoch": 2176} {"train_loss": -6.3008012771606445, "global_step": 91393, "epoch": 2176} {"train_loss": -6.219062328338623, "global_step": 91394, "epoch": 2176} {"train_loss": -6.276279449462891, "global_step": 91395, "epoch": 2176} {"train_loss": -6.250365257263184, "global_step": 91396, "epoch": 2176} {"train_loss": -6.32451868057251, "global_step": 91397, "epoch": 2176} {"train_loss": -6.271332740783691, "global_step": 91398, "epoch": 2176} {"train_loss": -6.378105163574219, "global_step": 91399, "epoch": 2176} {"train_loss": -6.328063011169434, "global_step": 91400, "epoch": 2176} {"train_loss": -6.2969231605529785, "global_step": 91401, "epoch": 2176} {"train_loss": -6.264800071716309, "global_step": 91402, "epoch": 2176} {"train_loss": -6.222419738769531, "global_step": 91403, "epoch": 2176} {"train_loss": -6.295895576477051, "global_step": 91404, "epoch": 2176} {"train_loss": -6.366982460021973, "global_step": 91405, "epoch": 2176} {"train_loss": -6.398337364196777, "global_step": 91406, "epoch": 2176} {"train_loss": -6.294035911560059, "global_step": 91407, "epoch": 2176} {"train_loss": -6.275992393493652, "global_step": 91408, "epoch": 2176} {"train_loss": -6.157443523406982, "global_step": 91409, "epoch": 2176} {"train_loss": -6.138314247131348, "global_step": 91410, "epoch": 2176} {"train_loss": -6.351265907287598, "global_step": 91411, "epoch": 2176} {"train_loss": -6.253076553344727, "global_step": 91412, "epoch": 2176} {"train_loss": -6.1822333335876465, "global_step": 91413, "epoch": 2176} {"train_loss": -6.38985013961792, "global_step": 91414, "epoch": 2176} {"train_loss": -6.243321418762207, "global_step": 91415, "epoch": 2176} {"train_loss": -6.2321624755859375, "global_step": 91416, "epoch": 2176} {"train_loss": -6.37704610824585, "global_step": 91417, "epoch": 2176} {"train_loss": -6.267698287963867, "global_step": 91418, "epoch": 2176} {"train_loss": -6.178115367889404, "global_step": 91419, "epoch": 2176} {"train_loss": -6.246318340301514, "global_step": 91420, "epoch": 2176} {"train_loss": -6.212536811828613, "global_step": 91421, "epoch": 2176} {"train_loss": -6.204483985900879, "global_step": 91422, "epoch": 2176} {"train_loss": -6.28347635269165, "global_step": 91423, "epoch": 2176} {"train_loss": -6.081956386566162, "global_step": 91424, "epoch": 2176} {"train_loss": -6.279381275177002, "global_step": 91425, "epoch": 2176} {"train_loss": -6.279356002807617, "global_step": 91426, "epoch": 2176} {"train_loss": -6.197223663330078, "global_step": 91427, "epoch": 2176} {"train_loss": -6.308770656585693, "global_step": 91428, "epoch": 2176} {"train_loss": -6.210243225097656, "global_step": 91429, "epoch": 2176} {"train_loss": -6.145240783691406, "global_step": 91430, "epoch": 2176} {"train_loss": -6.171273231506348, "global_step": 91431, "epoch": 2176} {"train_loss": -6.229671001434326, "global_step": 91432, "epoch": 2176} {"train_loss": -6.259925944464547, "global_step": 91433, "epoch": 2176, "val_loss": 63256.87890625} {"train_loss": -6.125375747680664, "global_step": 91434, "epoch": 2177} {"train_loss": -6.2651262283325195, "global_step": 91435, "epoch": 2177} {"train_loss": -6.110064506530762, "global_step": 91436, "epoch": 2177} {"train_loss": -6.301344394683838, "global_step": 91437, "epoch": 2177} {"train_loss": -6.120533466339111, "global_step": 91438, "epoch": 2177} {"train_loss": -6.174739837646484, "global_step": 91439, "epoch": 2177} {"train_loss": -6.241995811462402, "global_step": 91440, "epoch": 2177} {"train_loss": -6.267369270324707, "global_step": 91441, "epoch": 2177} {"train_loss": -6.233963966369629, "global_step": 91442, "epoch": 2177} {"train_loss": -6.3329997062683105, "global_step": 91443, "epoch": 2177} {"train_loss": -6.250395774841309, "global_step": 91444, "epoch": 2177} {"train_loss": -6.174640655517578, "global_step": 91445, "epoch": 2177} {"train_loss": -6.109613418579102, "global_step": 91446, "epoch": 2177} {"train_loss": -6.178483009338379, "global_step": 91447, "epoch": 2177} {"train_loss": -6.21882963180542, "global_step": 91448, "epoch": 2177} {"train_loss": -6.193955421447754, "global_step": 91449, "epoch": 2177} {"train_loss": -6.188150405883789, "global_step": 91450, "epoch": 2177} {"train_loss": -6.208497047424316, "global_step": 91451, "epoch": 2177} {"train_loss": -6.335947036743164, "global_step": 91452, "epoch": 2177} {"train_loss": -6.231250286102295, "global_step": 91453, "epoch": 2177} {"train_loss": -6.2330780029296875, "global_step": 91454, "epoch": 2177} {"train_loss": -6.180418491363525, "global_step": 91455, "epoch": 2177} {"train_loss": -6.286497116088867, "global_step": 91456, "epoch": 2177} {"train_loss": -6.382486343383789, "global_step": 91457, "epoch": 2177} {"train_loss": -6.245434761047363, "global_step": 91458, "epoch": 2177} {"train_loss": -6.273865699768066, "global_step": 91459, "epoch": 2177} {"train_loss": -6.295206069946289, "global_step": 91460, "epoch": 2177} {"train_loss": -6.240120887756348, "global_step": 91461, "epoch": 2177} {"train_loss": -6.352975845336914, "global_step": 91462, "epoch": 2177} {"train_loss": -6.418572425842285, "global_step": 91463, "epoch": 2177} {"train_loss": -6.259392738342285, "global_step": 91464, "epoch": 2177} {"train_loss": -6.2522406578063965, "global_step": 91465, "epoch": 2177} {"train_loss": -6.258810043334961, "global_step": 91466, "epoch": 2177} {"train_loss": -6.266632080078125, "global_step": 91467, "epoch": 2177} {"train_loss": -6.348122596740723, "global_step": 91468, "epoch": 2177} {"train_loss": -6.1912665367126465, "global_step": 91469, "epoch": 2177} {"train_loss": -6.253340721130371, "global_step": 91470, "epoch": 2177} {"train_loss": -6.256087303161621, "global_step": 91471, "epoch": 2177} {"train_loss": -6.117447853088379, "global_step": 91472, "epoch": 2177} {"train_loss": -6.329504013061523, "global_step": 91473, "epoch": 2177} {"train_loss": -6.276124954223633, "global_step": 91474, "epoch": 2177} {"train_loss": -6.242488974616641, "global_step": 91475, "epoch": 2177, "val_loss": 63367.765625} {"train_loss": -6.274159908294678, "global_step": 91476, "epoch": 2178} {"train_loss": -6.1864190101623535, "global_step": 91477, "epoch": 2178} {"train_loss": -6.3224616050720215, "global_step": 91478, "epoch": 2178} {"train_loss": -6.26980447769165, "global_step": 91479, "epoch": 2178} {"train_loss": -6.263431549072266, "global_step": 91480, "epoch": 2178} {"train_loss": -6.235438346862793, "global_step": 91481, "epoch": 2178} {"train_loss": -6.2577805519104, "global_step": 91482, "epoch": 2178} {"train_loss": -6.305789947509766, "global_step": 91483, "epoch": 2178} {"train_loss": -6.218328475952148, "global_step": 91484, "epoch": 2178} {"train_loss": -6.274683475494385, "global_step": 91485, "epoch": 2178} {"train_loss": -6.314182281494141, "global_step": 91486, "epoch": 2178} {"train_loss": -6.227053165435791, "global_step": 91487, "epoch": 2178} {"train_loss": -6.294775009155273, "global_step": 91488, "epoch": 2178} {"train_loss": -6.195948600769043, "global_step": 91489, "epoch": 2178} {"train_loss": -6.293487071990967, "global_step": 91490, "epoch": 2178} {"train_loss": -6.300135612487793, "global_step": 91491, "epoch": 2178} {"train_loss": -6.252511501312256, "global_step": 91492, "epoch": 2178} {"train_loss": -6.262815475463867, "global_step": 91493, "epoch": 2178} {"train_loss": -6.419046401977539, "global_step": 91494, "epoch": 2178} {"train_loss": -6.29976749420166, "global_step": 91495, "epoch": 2178} {"train_loss": -6.326056957244873, "global_step": 91496, "epoch": 2178} {"train_loss": -6.338267803192139, "global_step": 91497, "epoch": 2178} {"train_loss": -6.430610656738281, "global_step": 91498, "epoch": 2178} {"train_loss": -6.285374641418457, "global_step": 91499, "epoch": 2178} {"train_loss": -6.312687397003174, "global_step": 91500, "epoch": 2178} {"train_loss": -6.325732707977295, "global_step": 91501, "epoch": 2178} {"train_loss": -6.2465667724609375, "global_step": 91502, "epoch": 2178} {"train_loss": -6.195699691772461, "global_step": 91503, "epoch": 2178} {"train_loss": -6.249020576477051, "global_step": 91504, "epoch": 2178} {"train_loss": -6.204146385192871, "global_step": 91505, "epoch": 2178} {"train_loss": -6.255332946777344, "global_step": 91506, "epoch": 2178} {"train_loss": -6.323979377746582, "global_step": 91507, "epoch": 2178} {"train_loss": -6.332938194274902, "global_step": 91508, "epoch": 2178} {"train_loss": -6.270541191101074, "global_step": 91509, "epoch": 2178} {"train_loss": -6.217169284820557, "global_step": 91510, "epoch": 2178} {"train_loss": -6.213431358337402, "global_step": 91511, "epoch": 2178} {"train_loss": -6.333505630493164, "global_step": 91512, "epoch": 2178} {"train_loss": -6.29890251159668, "global_step": 91513, "epoch": 2178} {"train_loss": -6.189140796661377, "global_step": 91514, "epoch": 2178} {"train_loss": -6.336034774780273, "global_step": 91515, "epoch": 2178} {"train_loss": -6.300107479095459, "global_step": 91516, "epoch": 2178} {"train_loss": -6.284204233260382, "global_step": 91517, "epoch": 2178, "val_loss": 63050.8671875} {"train_loss": -6.295438766479492, "global_step": 91518, "epoch": 2179} {"train_loss": -6.221131324768066, "global_step": 91519, "epoch": 2179} {"train_loss": -6.272769927978516, "global_step": 91520, "epoch": 2179} {"train_loss": -6.212510108947754, "global_step": 91521, "epoch": 2179} {"train_loss": -6.348354339599609, "global_step": 91522, "epoch": 2179} {"train_loss": -6.282168865203857, "global_step": 91523, "epoch": 2179} {"train_loss": -6.2043256759643555, "global_step": 91524, "epoch": 2179} {"train_loss": -6.3572492599487305, "global_step": 91525, "epoch": 2179} {"train_loss": -6.306977272033691, "global_step": 91526, "epoch": 2179} {"train_loss": -6.31437349319458, "global_step": 91527, "epoch": 2179} {"train_loss": -6.125899314880371, "global_step": 91528, "epoch": 2179} {"train_loss": -6.200350761413574, "global_step": 91529, "epoch": 2179} {"train_loss": -6.307685852050781, "global_step": 91530, "epoch": 2179} {"train_loss": -6.418320655822754, "global_step": 91531, "epoch": 2179} {"train_loss": -6.207837104797363, "global_step": 91532, "epoch": 2179} {"train_loss": -6.2045207023620605, "global_step": 91533, "epoch": 2179} {"train_loss": -6.339651107788086, "global_step": 91534, "epoch": 2179} {"train_loss": -6.167191505432129, "global_step": 91535, "epoch": 2179} {"train_loss": -6.184091567993164, "global_step": 91536, "epoch": 2179} {"train_loss": -6.3111653327941895, "global_step": 91537, "epoch": 2179} {"train_loss": -6.099764823913574, "global_step": 91538, "epoch": 2179} {"train_loss": -6.194753646850586, "global_step": 91539, "epoch": 2179} {"train_loss": -6.174556732177734, "global_step": 91540, "epoch": 2179} {"train_loss": -6.127632141113281, "global_step": 91541, "epoch": 2179} {"train_loss": -6.373288154602051, "global_step": 91542, "epoch": 2179} {"train_loss": -6.2048234939575195, "global_step": 91543, "epoch": 2179} {"train_loss": -6.271327495574951, "global_step": 91544, "epoch": 2179} {"train_loss": -6.187464714050293, "global_step": 91545, "epoch": 2179} {"train_loss": -6.21304988861084, "global_step": 91546, "epoch": 2179} {"train_loss": -6.203497886657715, "global_step": 91547, "epoch": 2179} {"train_loss": -6.2986650466918945, "global_step": 91548, "epoch": 2179} {"train_loss": -6.33964729309082, "global_step": 91549, "epoch": 2179} {"train_loss": -6.424944877624512, "global_step": 91550, "epoch": 2179} {"train_loss": -6.241244316101074, "global_step": 91551, "epoch": 2179} {"train_loss": -6.2042388916015625, "global_step": 91552, "epoch": 2179} {"train_loss": -6.2307024002075195, "global_step": 91553, "epoch": 2179} {"train_loss": -6.337357521057129, "global_step": 91554, "epoch": 2179} {"train_loss": -6.354395866394043, "global_step": 91555, "epoch": 2179} {"train_loss": -6.2959394454956055, "global_step": 91556, "epoch": 2179} {"train_loss": -6.243467330932617, "global_step": 91557, "epoch": 2179} {"train_loss": -6.278848648071289, "global_step": 91558, "epoch": 2179} {"train_loss": -6.259572835195632, "global_step": 91559, "epoch": 2179, "val_loss": 63206.0390625} {"train_loss": -6.3745222091674805, "global_step": 91560, "epoch": 2180} {"train_loss": -6.375744819641113, "global_step": 91561, "epoch": 2180} {"train_loss": -6.174747943878174, "global_step": 91562, "epoch": 2180} {"train_loss": -6.3173909187316895, "global_step": 91563, "epoch": 2180} {"train_loss": -6.302818775177002, "global_step": 91564, "epoch": 2180} {"train_loss": -6.4062299728393555, "global_step": 91565, "epoch": 2180} {"train_loss": -6.35784912109375, "global_step": 91566, "epoch": 2180} {"train_loss": -6.212715148925781, "global_step": 91567, "epoch": 2180} {"train_loss": -6.272686958312988, "global_step": 91568, "epoch": 2180} {"train_loss": -6.381962776184082, "global_step": 91569, "epoch": 2180} {"train_loss": -6.2183732986450195, "global_step": 91570, "epoch": 2180} {"train_loss": -6.293225288391113, "global_step": 91571, "epoch": 2180} {"train_loss": -6.2633843421936035, "global_step": 91572, "epoch": 2180} {"train_loss": -6.2259416580200195, "global_step": 91573, "epoch": 2180} {"train_loss": -6.366111755371094, "global_step": 91574, "epoch": 2180} {"train_loss": -6.331028938293457, "global_step": 91575, "epoch": 2180} {"train_loss": -6.31368350982666, "global_step": 91576, "epoch": 2180} {"train_loss": -6.342482089996338, "global_step": 91577, "epoch": 2180} {"train_loss": -6.373100757598877, "global_step": 91578, "epoch": 2180} {"train_loss": -6.309874057769775, "global_step": 91579, "epoch": 2180} {"train_loss": -6.2758917808532715, "global_step": 91580, "epoch": 2180} {"train_loss": -6.244807243347168, "global_step": 91581, "epoch": 2180} {"train_loss": -6.368366241455078, "global_step": 91582, "epoch": 2180} {"train_loss": -6.2760233879089355, "global_step": 91583, "epoch": 2180} {"train_loss": -6.294092655181885, "global_step": 91584, "epoch": 2180} {"train_loss": -6.228837966918945, "global_step": 91585, "epoch": 2180} {"train_loss": -6.310168743133545, "global_step": 91586, "epoch": 2180} {"train_loss": -6.331615924835205, "global_step": 91587, "epoch": 2180} {"train_loss": -6.273811340332031, "global_step": 91588, "epoch": 2180} {"train_loss": -6.241245269775391, "global_step": 91589, "epoch": 2180} {"train_loss": -6.26234245300293, "global_step": 91590, "epoch": 2180} {"train_loss": -6.282934188842773, "global_step": 91591, "epoch": 2180} {"train_loss": -6.257726669311523, "global_step": 91592, "epoch": 2180} {"train_loss": -6.302511215209961, "global_step": 91593, "epoch": 2180} {"train_loss": -6.285702228546143, "global_step": 91594, "epoch": 2180} {"train_loss": -6.340455055236816, "global_step": 91595, "epoch": 2180} {"train_loss": -6.353372573852539, "global_step": 91596, "epoch": 2180} {"train_loss": -6.1689133644104, "global_step": 91597, "epoch": 2180} {"train_loss": -6.223360061645508, "global_step": 91598, "epoch": 2180} {"train_loss": -6.252349376678467, "global_step": 91599, "epoch": 2180} {"train_loss": -6.155500888824463, "global_step": 91600, "epoch": 2180} {"train_loss": -6.287675142288208, "global_step": 91601, "epoch": 2180, "val_loss": 63453.02734375} {"train_loss": -6.222657680511475, "global_step": 91602, "epoch": 2181} {"train_loss": -6.244542598724365, "global_step": 91603, "epoch": 2181} {"train_loss": -6.300537109375, "global_step": 91604, "epoch": 2181} {"train_loss": -6.232324123382568, "global_step": 91605, "epoch": 2181} {"train_loss": -6.247926712036133, "global_step": 91606, "epoch": 2181} {"train_loss": -6.132540225982666, "global_step": 91607, "epoch": 2181} {"train_loss": -6.278191566467285, "global_step": 91608, "epoch": 2181} {"train_loss": -6.283237934112549, "global_step": 91609, "epoch": 2181} {"train_loss": -6.041698455810547, "global_step": 91610, "epoch": 2181} {"train_loss": -6.251729488372803, "global_step": 91611, "epoch": 2181} {"train_loss": -6.176409721374512, "global_step": 91612, "epoch": 2181} {"train_loss": -6.279308319091797, "global_step": 91613, "epoch": 2181} {"train_loss": -6.263258934020996, "global_step": 91614, "epoch": 2181} {"train_loss": -6.3011250495910645, "global_step": 91615, "epoch": 2181} {"train_loss": -6.26308536529541, "global_step": 91616, "epoch": 2181} {"train_loss": -6.284245014190674, "global_step": 91617, "epoch": 2181} {"train_loss": -6.2308478355407715, "global_step": 91618, "epoch": 2181} {"train_loss": -6.219202041625977, "global_step": 91619, "epoch": 2181} {"train_loss": -6.3101396560668945, "global_step": 91620, "epoch": 2181} {"train_loss": -6.183619499206543, "global_step": 91621, "epoch": 2181} {"train_loss": -6.338101387023926, "global_step": 91622, "epoch": 2181} {"train_loss": -6.312110424041748, "global_step": 91623, "epoch": 2181} {"train_loss": -6.309566497802734, "global_step": 91624, "epoch": 2181} {"train_loss": -6.270707130432129, "global_step": 91625, "epoch": 2181} {"train_loss": -6.094622611999512, "global_step": 91626, "epoch": 2181} {"train_loss": -6.2867112159729, "global_step": 91627, "epoch": 2181} {"train_loss": -6.174263954162598, "global_step": 91628, "epoch": 2181} {"train_loss": -6.127922058105469, "global_step": 91629, "epoch": 2181} {"train_loss": -6.229111194610596, "global_step": 91630, "epoch": 2181} {"train_loss": -6.189849853515625, "global_step": 91631, "epoch": 2181} {"train_loss": -6.287909507751465, "global_step": 91632, "epoch": 2181} {"train_loss": -6.16226863861084, "global_step": 91633, "epoch": 2181} {"train_loss": -6.276752471923828, "global_step": 91634, "epoch": 2181} {"train_loss": -6.090211868286133, "global_step": 91635, "epoch": 2181} {"train_loss": -6.340521812438965, "global_step": 91636, "epoch": 2181} {"train_loss": -6.303972244262695, "global_step": 91637, "epoch": 2181} {"train_loss": -6.211703300476074, "global_step": 91638, "epoch": 2181} {"train_loss": -6.326599597930908, "global_step": 91639, "epoch": 2181} {"train_loss": -6.2123494148254395, "global_step": 91640, "epoch": 2181} {"train_loss": -6.3830790519714355, "global_step": 91641, "epoch": 2181} {"train_loss": -6.26907205581665, "global_step": 91642, "epoch": 2181} {"train_loss": -6.241791929517474, "global_step": 91643, "epoch": 2181, "val_loss": 63336.31640625} {"train_loss": -6.136177062988281, "global_step": 91644, "epoch": 2182} {"train_loss": -6.251487731933594, "global_step": 91645, "epoch": 2182} {"train_loss": -6.427409648895264, "global_step": 91646, "epoch": 2182} {"train_loss": -6.275805473327637, "global_step": 91647, "epoch": 2182} {"train_loss": -6.173069000244141, "global_step": 91648, "epoch": 2182} {"train_loss": -6.294669151306152, "global_step": 91649, "epoch": 2182} {"train_loss": -6.330003261566162, "global_step": 91650, "epoch": 2182} {"train_loss": -6.281955718994141, "global_step": 91651, "epoch": 2182} {"train_loss": -6.255590438842773, "global_step": 91652, "epoch": 2182} {"train_loss": -6.17044734954834, "global_step": 91653, "epoch": 2182} {"train_loss": -6.259321212768555, "global_step": 91654, "epoch": 2182} {"train_loss": -6.237149715423584, "global_step": 91655, "epoch": 2182} {"train_loss": -6.259396553039551, "global_step": 91656, "epoch": 2182} {"train_loss": -6.275781154632568, "global_step": 91657, "epoch": 2182} {"train_loss": -6.190742492675781, "global_step": 91658, "epoch": 2182} {"train_loss": -6.293315887451172, "global_step": 91659, "epoch": 2182} {"train_loss": -6.201247215270996, "global_step": 91660, "epoch": 2182} {"train_loss": -6.319965839385986, "global_step": 91661, "epoch": 2182} {"train_loss": -6.385379791259766, "global_step": 91662, "epoch": 2182} {"train_loss": -6.256375312805176, "global_step": 91663, "epoch": 2182} {"train_loss": -6.256335258483887, "global_step": 91664, "epoch": 2182} {"train_loss": -6.197967529296875, "global_step": 91665, "epoch": 2182} {"train_loss": -6.324832916259766, "global_step": 91666, "epoch": 2182} {"train_loss": -6.303116798400879, "global_step": 91667, "epoch": 2182} {"train_loss": -6.350710868835449, "global_step": 91668, "epoch": 2182} {"train_loss": -6.28257942199707, "global_step": 91669, "epoch": 2182} {"train_loss": -6.340472221374512, "global_step": 91670, "epoch": 2182} {"train_loss": -6.356240749359131, "global_step": 91671, "epoch": 2182} {"train_loss": -6.418329238891602, "global_step": 91672, "epoch": 2182} {"train_loss": -6.278725624084473, "global_step": 91673, "epoch": 2182} {"train_loss": -6.370610237121582, "global_step": 91674, "epoch": 2182} {"train_loss": -6.233197212219238, "global_step": 91675, "epoch": 2182} {"train_loss": -6.333163261413574, "global_step": 91676, "epoch": 2182} {"train_loss": -6.234959602355957, "global_step": 91677, "epoch": 2182} {"train_loss": -6.262360572814941, "global_step": 91678, "epoch": 2182} {"train_loss": -6.351692199707031, "global_step": 91679, "epoch": 2182} {"train_loss": -6.403761863708496, "global_step": 91680, "epoch": 2182} {"train_loss": -6.330295085906982, "global_step": 91681, "epoch": 2182} {"train_loss": -6.344305992126465, "global_step": 91682, "epoch": 2182} {"train_loss": -6.229701995849609, "global_step": 91683, "epoch": 2182} {"train_loss": -6.108111381530762, "global_step": 91684, "epoch": 2182} {"train_loss": -6.281603688285465, "global_step": 91685, "epoch": 2182, "val_loss": 63243.88671875} {"train_loss": -6.267138957977295, "global_step": 91686, "epoch": 2183} {"train_loss": -6.364537715911865, "global_step": 91687, "epoch": 2183} {"train_loss": -6.320330619812012, "global_step": 91688, "epoch": 2183} {"train_loss": -6.191814422607422, "global_step": 91689, "epoch": 2183} {"train_loss": -6.197353363037109, "global_step": 91690, "epoch": 2183} {"train_loss": -6.216649055480957, "global_step": 91691, "epoch": 2183} {"train_loss": -6.275600433349609, "global_step": 91692, "epoch": 2183} {"train_loss": -6.407743453979492, "global_step": 91693, "epoch": 2183} {"train_loss": -6.26209831237793, "global_step": 91694, "epoch": 2183} {"train_loss": -6.207479000091553, "global_step": 91695, "epoch": 2183} {"train_loss": -6.345710754394531, "global_step": 91696, "epoch": 2183} {"train_loss": -6.237635612487793, "global_step": 91697, "epoch": 2183} {"train_loss": -6.361488342285156, "global_step": 91698, "epoch": 2183} {"train_loss": -6.197840690612793, "global_step": 91699, "epoch": 2183} {"train_loss": -6.304660797119141, "global_step": 91700, "epoch": 2183} {"train_loss": -6.3786187171936035, "global_step": 91701, "epoch": 2183} {"train_loss": -6.290927886962891, "global_step": 91702, "epoch": 2183} {"train_loss": -6.252623081207275, "global_step": 91703, "epoch": 2183} {"train_loss": -6.373377323150635, "global_step": 91704, "epoch": 2183} {"train_loss": -6.42779541015625, "global_step": 91705, "epoch": 2183} {"train_loss": -6.307239532470703, "global_step": 91706, "epoch": 2183} {"train_loss": -6.377788543701172, "global_step": 91707, "epoch": 2183} {"train_loss": -6.2812042236328125, "global_step": 91708, "epoch": 2183} {"train_loss": -6.3323869705200195, "global_step": 91709, "epoch": 2183} {"train_loss": -6.275330066680908, "global_step": 91710, "epoch": 2183} {"train_loss": -6.405017852783203, "global_step": 91711, "epoch": 2183} {"train_loss": -6.336208343505859, "global_step": 91712, "epoch": 2183} {"train_loss": -6.358490943908691, "global_step": 91713, "epoch": 2183} {"train_loss": -6.329867839813232, "global_step": 91714, "epoch": 2183} {"train_loss": -6.315906524658203, "global_step": 91715, "epoch": 2183} {"train_loss": -6.396201133728027, "global_step": 91716, "epoch": 2183} {"train_loss": -6.24917459487915, "global_step": 91717, "epoch": 2183} {"train_loss": -6.2705278396606445, "global_step": 91718, "epoch": 2183} {"train_loss": -6.191208839416504, "global_step": 91719, "epoch": 2183} {"train_loss": -6.235910415649414, "global_step": 91720, "epoch": 2183} {"train_loss": -6.213457107543945, "global_step": 91721, "epoch": 2183} {"train_loss": -6.337732315063477, "global_step": 91722, "epoch": 2183} {"train_loss": -6.185253143310547, "global_step": 91723, "epoch": 2183} {"train_loss": -6.229997158050537, "global_step": 91724, "epoch": 2183} {"train_loss": -6.372769355773926, "global_step": 91725, "epoch": 2183} {"train_loss": -6.180799961090088, "global_step": 91726, "epoch": 2183} {"train_loss": -6.2948548793792725, "global_step": 91727, "epoch": 2183, "val_loss": 63473.0} {"train_loss": -6.302384376525879, "global_step": 91728, "epoch": 2184} {"train_loss": -6.231592178344727, "global_step": 91729, "epoch": 2184} {"train_loss": -6.337027549743652, "global_step": 91730, "epoch": 2184} {"train_loss": -6.212303161621094, "global_step": 91731, "epoch": 2184} {"train_loss": -6.189937591552734, "global_step": 91732, "epoch": 2184} {"train_loss": -6.234954833984375, "global_step": 91733, "epoch": 2184} {"train_loss": -6.285168647766113, "global_step": 91734, "epoch": 2184} {"train_loss": -6.224289894104004, "global_step": 91735, "epoch": 2184} {"train_loss": -6.190816402435303, "global_step": 91736, "epoch": 2184} {"train_loss": -6.441903114318848, "global_step": 91737, "epoch": 2184} {"train_loss": -6.188657283782959, "global_step": 91738, "epoch": 2184} {"train_loss": -6.240424633026123, "global_step": 91739, "epoch": 2184} {"train_loss": -6.33145809173584, "global_step": 91740, "epoch": 2184} {"train_loss": -6.2432451248168945, "global_step": 91741, "epoch": 2184} {"train_loss": -6.251901626586914, "global_step": 91742, "epoch": 2184} {"train_loss": -6.297819137573242, "global_step": 91743, "epoch": 2184} {"train_loss": -6.177694320678711, "global_step": 91744, "epoch": 2184} {"train_loss": -6.330207824707031, "global_step": 91745, "epoch": 2184} {"train_loss": -6.239022731781006, "global_step": 91746, "epoch": 2184} {"train_loss": -6.303671836853027, "global_step": 91747, "epoch": 2184} {"train_loss": -6.331666946411133, "global_step": 91748, "epoch": 2184} {"train_loss": -6.279515266418457, "global_step": 91749, "epoch": 2184} {"train_loss": -6.357306957244873, "global_step": 91750, "epoch": 2184} {"train_loss": -6.377500534057617, "global_step": 91751, "epoch": 2184} {"train_loss": -6.27696418762207, "global_step": 91752, "epoch": 2184} {"train_loss": -6.314896583557129, "global_step": 91753, "epoch": 2184} {"train_loss": -6.351254463195801, "global_step": 91754, "epoch": 2184} {"train_loss": -6.216862678527832, "global_step": 91755, "epoch": 2184} {"train_loss": -6.2349419593811035, "global_step": 91756, "epoch": 2184} {"train_loss": -6.277731895446777, "global_step": 91757, "epoch": 2184} {"train_loss": -6.342901706695557, "global_step": 91758, "epoch": 2184} {"train_loss": -6.11826229095459, "global_step": 91759, "epoch": 2184} {"train_loss": -6.194417953491211, "global_step": 91760, "epoch": 2184} {"train_loss": -6.271367073059082, "global_step": 91761, "epoch": 2184} {"train_loss": -6.249906063079834, "global_step": 91762, "epoch": 2184} {"train_loss": -6.230541229248047, "global_step": 91763, "epoch": 2184} {"train_loss": -6.192933559417725, "global_step": 91764, "epoch": 2184} {"train_loss": -6.2685747146606445, "global_step": 91765, "epoch": 2184} {"train_loss": -6.203301429748535, "global_step": 91766, "epoch": 2184} {"train_loss": -6.12639045715332, "global_step": 91767, "epoch": 2184} {"train_loss": -6.162362098693848, "global_step": 91768, "epoch": 2184} {"train_loss": -6.260714065460932, "global_step": 91769, "epoch": 2184, "val_loss": 63405.234375} {"train_loss": -6.235664367675781, "global_step": 91770, "epoch": 2185} {"train_loss": -6.178281307220459, "global_step": 91771, "epoch": 2185} {"train_loss": -6.182165145874023, "global_step": 91772, "epoch": 2185} {"train_loss": -6.250720977783203, "global_step": 91773, "epoch": 2185} {"train_loss": -6.155575275421143, "global_step": 91774, "epoch": 2185} {"train_loss": -6.310214519500732, "global_step": 91775, "epoch": 2185} {"train_loss": -6.083481311798096, "global_step": 91776, "epoch": 2185} {"train_loss": -6.240535736083984, "global_step": 91777, "epoch": 2185} {"train_loss": -6.217522621154785, "global_step": 91778, "epoch": 2185} {"train_loss": -6.216050148010254, "global_step": 91779, "epoch": 2185} {"train_loss": -6.265950679779053, "global_step": 91780, "epoch": 2185} {"train_loss": -6.304461479187012, "global_step": 91781, "epoch": 2185} {"train_loss": -6.244600296020508, "global_step": 91782, "epoch": 2185} {"train_loss": -6.336698532104492, "global_step": 91783, "epoch": 2185} {"train_loss": -6.238629341125488, "global_step": 91784, "epoch": 2185} {"train_loss": -6.252898216247559, "global_step": 91785, "epoch": 2185} {"train_loss": -6.334635257720947, "global_step": 91786, "epoch": 2185} {"train_loss": -6.249463081359863, "global_step": 91787, "epoch": 2185} {"train_loss": -6.265416145324707, "global_step": 91788, "epoch": 2185} {"train_loss": -6.22408390045166, "global_step": 91789, "epoch": 2185} {"train_loss": -6.344674110412598, "global_step": 91790, "epoch": 2185} {"train_loss": -6.395878314971924, "global_step": 91791, "epoch": 2185} {"train_loss": -6.130005836486816, "global_step": 91792, "epoch": 2185} {"train_loss": -6.163050651550293, "global_step": 91793, "epoch": 2185} {"train_loss": -6.201555252075195, "global_step": 91794, "epoch": 2185} {"train_loss": -6.233642578125, "global_step": 91795, "epoch": 2185} {"train_loss": -6.312466621398926, "global_step": 91796, "epoch": 2185} {"train_loss": -6.139776229858398, "global_step": 91797, "epoch": 2185} {"train_loss": -6.235637664794922, "global_step": 91798, "epoch": 2185} {"train_loss": -6.246667861938477, "global_step": 91799, "epoch": 2185} {"train_loss": -6.154055118560791, "global_step": 91800, "epoch": 2185} {"train_loss": -6.2663726806640625, "global_step": 91801, "epoch": 2185} {"train_loss": -6.2774481773376465, "global_step": 91802, "epoch": 2185} {"train_loss": -6.173605918884277, "global_step": 91803, "epoch": 2185} {"train_loss": -6.1790313720703125, "global_step": 91804, "epoch": 2185} {"train_loss": -6.3182597160339355, "global_step": 91805, "epoch": 2185} {"train_loss": -6.207184791564941, "global_step": 91806, "epoch": 2185} {"train_loss": -6.27984619140625, "global_step": 91807, "epoch": 2185} {"train_loss": -6.199040412902832, "global_step": 91808, "epoch": 2185} {"train_loss": -6.203617095947266, "global_step": 91809, "epoch": 2185} {"train_loss": -6.174235820770264, "global_step": 91810, "epoch": 2185} {"train_loss": -6.235700368881226, "global_step": 91811, "epoch": 2185, "val_loss": 63383.6171875} {"train_loss": -6.325174331665039, "global_step": 91812, "epoch": 2186} {"train_loss": -6.191581726074219, "global_step": 91813, "epoch": 2186} {"train_loss": -6.196959495544434, "global_step": 91814, "epoch": 2186} {"train_loss": -6.236096382141113, "global_step": 91815, "epoch": 2186} {"train_loss": -6.294694900512695, "global_step": 91816, "epoch": 2186} {"train_loss": -6.147438049316406, "global_step": 91817, "epoch": 2186} {"train_loss": -6.342722415924072, "global_step": 91818, "epoch": 2186} {"train_loss": -6.2157087326049805, "global_step": 91819, "epoch": 2186} {"train_loss": -6.135698318481445, "global_step": 91820, "epoch": 2186} {"train_loss": -6.31617546081543, "global_step": 91821, "epoch": 2186} {"train_loss": -6.220293998718262, "global_step": 91822, "epoch": 2186} {"train_loss": -6.220716953277588, "global_step": 91823, "epoch": 2186} {"train_loss": -6.171994209289551, "global_step": 91824, "epoch": 2186} {"train_loss": -6.148207664489746, "global_step": 91825, "epoch": 2186} {"train_loss": -6.373181343078613, "global_step": 91826, "epoch": 2186} {"train_loss": -6.289850234985352, "global_step": 91827, "epoch": 2186} {"train_loss": -6.301884651184082, "global_step": 91828, "epoch": 2186} {"train_loss": -6.33499813079834, "global_step": 91829, "epoch": 2186} {"train_loss": -6.303071022033691, "global_step": 91830, "epoch": 2186} {"train_loss": -6.312143802642822, "global_step": 91831, "epoch": 2186} {"train_loss": -6.390148639678955, "global_step": 91832, "epoch": 2186} {"train_loss": -6.25904655456543, "global_step": 91833, "epoch": 2186} {"train_loss": -6.331483364105225, "global_step": 91834, "epoch": 2186} {"train_loss": -6.325678825378418, "global_step": 91835, "epoch": 2186} {"train_loss": -6.262442111968994, "global_step": 91836, "epoch": 2186} {"train_loss": -6.3332719802856445, "global_step": 91837, "epoch": 2186} {"train_loss": -6.272010803222656, "global_step": 91838, "epoch": 2186} {"train_loss": -6.352841854095459, "global_step": 91839, "epoch": 2186} {"train_loss": -6.346768379211426, "global_step": 91840, "epoch": 2186} {"train_loss": -6.247729301452637, "global_step": 91841, "epoch": 2186} {"train_loss": -6.292097091674805, "global_step": 91842, "epoch": 2186} {"train_loss": -6.30883264541626, "global_step": 91843, "epoch": 2186} {"train_loss": -6.346356391906738, "global_step": 91844, "epoch": 2186} {"train_loss": -6.309779167175293, "global_step": 91845, "epoch": 2186} {"train_loss": -6.394730567932129, "global_step": 91846, "epoch": 2186} {"train_loss": -6.310919761657715, "global_step": 91847, "epoch": 2186} {"train_loss": -6.314270973205566, "global_step": 91848, "epoch": 2186} {"train_loss": -6.353147029876709, "global_step": 91849, "epoch": 2186} {"train_loss": -6.3797221183776855, "global_step": 91850, "epoch": 2186} {"train_loss": -6.225057601928711, "global_step": 91851, "epoch": 2186} {"train_loss": -6.320849418640137, "global_step": 91852, "epoch": 2186} {"train_loss": -6.285797550564721, "global_step": 91853, "epoch": 2186, "val_loss": 63133.265625} {"train_loss": -6.297571182250977, "global_step": 91854, "epoch": 2187} {"train_loss": -6.261027812957764, "global_step": 91855, "epoch": 2187} {"train_loss": -6.221534729003906, "global_step": 91856, "epoch": 2187} {"train_loss": -6.319165229797363, "global_step": 91857, "epoch": 2187} {"train_loss": -6.328421592712402, "global_step": 91858, "epoch": 2187} {"train_loss": -6.285289287567139, "global_step": 91859, "epoch": 2187} {"train_loss": -6.341765403747559, "global_step": 91860, "epoch": 2187} {"train_loss": -6.246098518371582, "global_step": 91861, "epoch": 2187} {"train_loss": -6.332072734832764, "global_step": 91862, "epoch": 2187} {"train_loss": -6.269997596740723, "global_step": 91863, "epoch": 2187} {"train_loss": -6.2787065505981445, "global_step": 91864, "epoch": 2187} {"train_loss": -6.287349700927734, "global_step": 91865, "epoch": 2187} {"train_loss": -6.269773483276367, "global_step": 91866, "epoch": 2187} {"train_loss": -6.142279148101807, "global_step": 91867, "epoch": 2187} {"train_loss": -6.432965278625488, "global_step": 91868, "epoch": 2187} {"train_loss": -6.262733459472656, "global_step": 91869, "epoch": 2187} {"train_loss": -6.2501444816589355, "global_step": 91870, "epoch": 2187} {"train_loss": -6.342134475708008, "global_step": 91871, "epoch": 2187} {"train_loss": -6.222439765930176, "global_step": 91872, "epoch": 2187} {"train_loss": -6.396108150482178, "global_step": 91873, "epoch": 2187} {"train_loss": -6.314866065979004, "global_step": 91874, "epoch": 2187} {"train_loss": -6.250943183898926, "global_step": 91875, "epoch": 2187} {"train_loss": -6.223264217376709, "global_step": 91876, "epoch": 2187} {"train_loss": -6.35251522064209, "global_step": 91877, "epoch": 2187} {"train_loss": -6.2370805740356445, "global_step": 91878, "epoch": 2187} {"train_loss": -6.320703983306885, "global_step": 91879, "epoch": 2187} {"train_loss": -6.275314807891846, "global_step": 91880, "epoch": 2187} {"train_loss": -6.326177597045898, "global_step": 91881, "epoch": 2187} {"train_loss": -6.339313507080078, "global_step": 91882, "epoch": 2187} {"train_loss": -6.293639183044434, "global_step": 91883, "epoch": 2187} {"train_loss": -6.231182098388672, "global_step": 91884, "epoch": 2187} {"train_loss": -6.357269763946533, "global_step": 91885, "epoch": 2187} {"train_loss": -6.295065879821777, "global_step": 91886, "epoch": 2187} {"train_loss": -6.283777713775635, "global_step": 91887, "epoch": 2187} {"train_loss": -6.266716480255127, "global_step": 91888, "epoch": 2187} {"train_loss": -6.251317977905273, "global_step": 91889, "epoch": 2187} {"train_loss": -6.245817184448242, "global_step": 91890, "epoch": 2187} {"train_loss": -6.425691604614258, "global_step": 91891, "epoch": 2187} {"train_loss": -6.234006881713867, "global_step": 91892, "epoch": 2187} {"train_loss": -6.238593101501465, "global_step": 91893, "epoch": 2187} {"train_loss": -6.269227027893066, "global_step": 91894, "epoch": 2187} {"train_loss": -6.288581711905343, "global_step": 91895, "epoch": 2187, "val_loss": 63535.2890625} {"train_loss": -6.359129905700684, "global_step": 91896, "epoch": 2188} {"train_loss": -6.265852928161621, "global_step": 91897, "epoch": 2188} {"train_loss": -6.1574201583862305, "global_step": 91898, "epoch": 2188} {"train_loss": -6.286731243133545, "global_step": 91899, "epoch": 2188} {"train_loss": -6.155819416046143, "global_step": 91900, "epoch": 2188} {"train_loss": -6.301630020141602, "global_step": 91901, "epoch": 2188} {"train_loss": -6.319530010223389, "global_step": 91902, "epoch": 2188} {"train_loss": -6.40932559967041, "global_step": 91903, "epoch": 2188} {"train_loss": -6.30429744720459, "global_step": 91904, "epoch": 2188} {"train_loss": -6.229920387268066, "global_step": 91905, "epoch": 2188} {"train_loss": -6.350967884063721, "global_step": 91906, "epoch": 2188} {"train_loss": -6.352748870849609, "global_step": 91907, "epoch": 2188} {"train_loss": -6.297628402709961, "global_step": 91908, "epoch": 2188} {"train_loss": -6.296499729156494, "global_step": 91909, "epoch": 2188} {"train_loss": -6.221924781799316, "global_step": 91910, "epoch": 2188} {"train_loss": -6.196167945861816, "global_step": 91911, "epoch": 2188} {"train_loss": -6.3268351554870605, "global_step": 91912, "epoch": 2188} {"train_loss": -6.216196060180664, "global_step": 91913, "epoch": 2188} {"train_loss": -6.331734657287598, "global_step": 91914, "epoch": 2188} {"train_loss": -6.443657398223877, "global_step": 91915, "epoch": 2188} {"train_loss": -6.355504035949707, "global_step": 91916, "epoch": 2188} {"train_loss": -6.327070713043213, "global_step": 91917, "epoch": 2188} {"train_loss": -6.291017532348633, "global_step": 91918, "epoch": 2188} {"train_loss": -6.328730583190918, "global_step": 91919, "epoch": 2188} {"train_loss": -6.209906578063965, "global_step": 91920, "epoch": 2188} {"train_loss": -6.391550064086914, "global_step": 91921, "epoch": 2188} {"train_loss": -6.285851001739502, "global_step": 91922, "epoch": 2188} {"train_loss": -6.302448749542236, "global_step": 91923, "epoch": 2188} {"train_loss": -6.262945175170898, "global_step": 91924, "epoch": 2188} {"train_loss": -6.2117438316345215, "global_step": 91925, "epoch": 2188} {"train_loss": -6.2846479415893555, "global_step": 91926, "epoch": 2188} {"train_loss": -6.27253532409668, "global_step": 91927, "epoch": 2188} {"train_loss": -6.233515739440918, "global_step": 91928, "epoch": 2188} {"train_loss": -6.295342922210693, "global_step": 91929, "epoch": 2188} {"train_loss": -6.27814245223999, "global_step": 91930, "epoch": 2188} {"train_loss": -6.140039443969727, "global_step": 91931, "epoch": 2188} {"train_loss": -6.188168525695801, "global_step": 91932, "epoch": 2188} {"train_loss": -6.231205940246582, "global_step": 91933, "epoch": 2188} {"train_loss": -6.255638122558594, "global_step": 91934, "epoch": 2188} {"train_loss": -6.278613567352295, "global_step": 91935, "epoch": 2188} {"train_loss": -6.164000988006592, "global_step": 91936, "epoch": 2188} {"train_loss": -6.28010014125279, "global_step": 91937, "epoch": 2188, "val_loss": 63070.01953125} {"train_loss": -6.28783655166626, "global_step": 91938, "epoch": 2189} {"train_loss": -6.389325141906738, "global_step": 91939, "epoch": 2189} {"train_loss": -6.210152626037598, "global_step": 91940, "epoch": 2189} {"train_loss": -6.327959060668945, "global_step": 91941, "epoch": 2189} {"train_loss": -6.350055694580078, "global_step": 91942, "epoch": 2189} {"train_loss": -6.284061431884766, "global_step": 91943, "epoch": 2189} {"train_loss": -6.302883148193359, "global_step": 91944, "epoch": 2189} {"train_loss": -6.205620765686035, "global_step": 91945, "epoch": 2189} {"train_loss": -6.2767205238342285, "global_step": 91946, "epoch": 2189} {"train_loss": -6.4092559814453125, "global_step": 91947, "epoch": 2189} {"train_loss": -6.249917030334473, "global_step": 91948, "epoch": 2189} {"train_loss": -6.262265205383301, "global_step": 91949, "epoch": 2189} {"train_loss": -6.297750473022461, "global_step": 91950, "epoch": 2189} {"train_loss": -6.219658851623535, "global_step": 91951, "epoch": 2189} {"train_loss": -6.2511115074157715, "global_step": 91952, "epoch": 2189} {"train_loss": -6.246551513671875, "global_step": 91953, "epoch": 2189} {"train_loss": -6.312272071838379, "global_step": 91954, "epoch": 2189} {"train_loss": -6.2077813148498535, "global_step": 91955, "epoch": 2189} {"train_loss": -6.292726516723633, "global_step": 91956, "epoch": 2189} {"train_loss": -6.283030033111572, "global_step": 91957, "epoch": 2189} {"train_loss": -6.279392242431641, "global_step": 91958, "epoch": 2189} {"train_loss": -6.29954719543457, "global_step": 91959, "epoch": 2189} {"train_loss": -6.261134147644043, "global_step": 91960, "epoch": 2189} {"train_loss": -6.356348037719727, "global_step": 91961, "epoch": 2189} {"train_loss": -6.315365791320801, "global_step": 91962, "epoch": 2189} {"train_loss": -6.410163879394531, "global_step": 91963, "epoch": 2189} {"train_loss": -6.307440757751465, "global_step": 91964, "epoch": 2189} {"train_loss": -6.337746620178223, "global_step": 91965, "epoch": 2189} {"train_loss": -6.325267791748047, "global_step": 91966, "epoch": 2189} {"train_loss": -6.1872358322143555, "global_step": 91967, "epoch": 2189} {"train_loss": -6.408236503601074, "global_step": 91968, "epoch": 2189} {"train_loss": -6.166131973266602, "global_step": 91969, "epoch": 2189} {"train_loss": -6.282735824584961, "global_step": 91970, "epoch": 2189} {"train_loss": -6.243063926696777, "global_step": 91971, "epoch": 2189} {"train_loss": -6.289547443389893, "global_step": 91972, "epoch": 2189} {"train_loss": -6.3411478996276855, "global_step": 91973, "epoch": 2189} {"train_loss": -6.335776329040527, "global_step": 91974, "epoch": 2189} {"train_loss": -6.268272399902344, "global_step": 91975, "epoch": 2189} {"train_loss": -6.349161148071289, "global_step": 91976, "epoch": 2189} {"train_loss": -6.433139324188232, "global_step": 91977, "epoch": 2189} {"train_loss": -6.2662248611450195, "global_step": 91978, "epoch": 2189} {"train_loss": -6.29724661509196, "global_step": 91979, "epoch": 2189, "val_loss": 63489.65625} {"train_loss": -6.313342571258545, "global_step": 91980, "epoch": 2190} {"train_loss": -6.271977424621582, "global_step": 91981, "epoch": 2190} {"train_loss": -6.357497215270996, "global_step": 91982, "epoch": 2190} {"train_loss": -6.401661396026611, "global_step": 91983, "epoch": 2190} {"train_loss": -6.330441474914551, "global_step": 91984, "epoch": 2190} {"train_loss": -6.256444931030273, "global_step": 91985, "epoch": 2190} {"train_loss": -6.216826438903809, "global_step": 91986, "epoch": 2190} {"train_loss": -6.284289360046387, "global_step": 91987, "epoch": 2190} {"train_loss": -6.383420944213867, "global_step": 91988, "epoch": 2190} {"train_loss": -6.337719917297363, "global_step": 91989, "epoch": 2190} {"train_loss": -6.303224086761475, "global_step": 91990, "epoch": 2190} {"train_loss": -6.378256320953369, "global_step": 91991, "epoch": 2190} {"train_loss": -6.2123942375183105, "global_step": 91992, "epoch": 2190} {"train_loss": -6.39484977722168, "global_step": 91993, "epoch": 2190} {"train_loss": -6.2974395751953125, "global_step": 91994, "epoch": 2190} {"train_loss": -6.378507137298584, "global_step": 91995, "epoch": 2190} {"train_loss": -6.219620704650879, "global_step": 91996, "epoch": 2190} {"train_loss": -6.28803825378418, "global_step": 91997, "epoch": 2190} {"train_loss": -6.250371932983398, "global_step": 91998, "epoch": 2190} {"train_loss": -6.302424907684326, "global_step": 91999, "epoch": 2190} {"train_loss": -6.224674224853516, "global_step": 92000, "epoch": 2190} {"train_loss": -6.219278812408447, "global_step": 92001, "epoch": 2190} {"train_loss": -6.267753601074219, "global_step": 92002, "epoch": 2190} {"train_loss": -6.288412094116211, "global_step": 92003, "epoch": 2190} {"train_loss": -6.3386759757995605, "global_step": 92004, "epoch": 2190} {"train_loss": -6.237843990325928, "global_step": 92005, "epoch": 2190} {"train_loss": -6.2827372550964355, "global_step": 92006, "epoch": 2190} {"train_loss": -6.255159378051758, "global_step": 92007, "epoch": 2190} {"train_loss": -6.293416976928711, "global_step": 92008, "epoch": 2190} {"train_loss": -6.38759708404541, "global_step": 92009, "epoch": 2190} {"train_loss": -6.290430068969727, "global_step": 92010, "epoch": 2190} {"train_loss": -6.262874126434326, "global_step": 92011, "epoch": 2190} {"train_loss": -6.323908805847168, "global_step": 92012, "epoch": 2190} {"train_loss": -6.224244117736816, "global_step": 92013, "epoch": 2190} {"train_loss": -6.305729866027832, "global_step": 92014, "epoch": 2190} {"train_loss": -6.326557159423828, "global_step": 92015, "epoch": 2190} {"train_loss": -6.28054141998291, "global_step": 92016, "epoch": 2190} {"train_loss": -6.299407482147217, "global_step": 92017, "epoch": 2190} {"train_loss": -6.3141021728515625, "global_step": 92018, "epoch": 2190} {"train_loss": -6.34827184677124, "global_step": 92019, "epoch": 2190} {"train_loss": -6.287270545959473, "global_step": 92020, "epoch": 2190} {"train_loss": -6.299568619046893, "global_step": 92021, "epoch": 2190, "val_loss": 63263.5390625} {"train_loss": -6.437857627868652, "global_step": 92022, "epoch": 2191} {"train_loss": -6.32901668548584, "global_step": 92023, "epoch": 2191} {"train_loss": -6.411900997161865, "global_step": 92024, "epoch": 2191} {"train_loss": -6.354888439178467, "global_step": 92025, "epoch": 2191} {"train_loss": -6.4461283683776855, "global_step": 92026, "epoch": 2191} {"train_loss": -6.215664863586426, "global_step": 92027, "epoch": 2191} {"train_loss": -6.378636360168457, "global_step": 92028, "epoch": 2191} {"train_loss": -6.273001670837402, "global_step": 92029, "epoch": 2191} {"train_loss": -6.193000793457031, "global_step": 92030, "epoch": 2191} {"train_loss": -6.33428955078125, "global_step": 92031, "epoch": 2191} {"train_loss": -6.295537948608398, "global_step": 92032, "epoch": 2191} {"train_loss": -6.334527492523193, "global_step": 92033, "epoch": 2191} {"train_loss": -6.321063041687012, "global_step": 92034, "epoch": 2191} {"train_loss": -6.244782447814941, "global_step": 92035, "epoch": 2191} {"train_loss": -6.231071472167969, "global_step": 92036, "epoch": 2191} {"train_loss": -6.235857009887695, "global_step": 92037, "epoch": 2191} {"train_loss": -6.218985557556152, "global_step": 92038, "epoch": 2191} {"train_loss": -6.300896644592285, "global_step": 92039, "epoch": 2191} {"train_loss": -6.252660274505615, "global_step": 92040, "epoch": 2191} {"train_loss": -6.284452438354492, "global_step": 92041, "epoch": 2191} {"train_loss": -6.144824981689453, "global_step": 92042, "epoch": 2191} {"train_loss": -6.2685465812683105, "global_step": 92043, "epoch": 2191} {"train_loss": -6.329904556274414, "global_step": 92044, "epoch": 2191} {"train_loss": -6.206700325012207, "global_step": 92045, "epoch": 2191} {"train_loss": -6.210346221923828, "global_step": 92046, "epoch": 2191} {"train_loss": -6.284252643585205, "global_step": 92047, "epoch": 2191} {"train_loss": -6.231636047363281, "global_step": 92048, "epoch": 2191} {"train_loss": -6.314620018005371, "global_step": 92049, "epoch": 2191} {"train_loss": -6.251565933227539, "global_step": 92050, "epoch": 2191} {"train_loss": -6.396274089813232, "global_step": 92051, "epoch": 2191} {"train_loss": -6.245763301849365, "global_step": 92052, "epoch": 2191} {"train_loss": -6.305405616760254, "global_step": 92053, "epoch": 2191} {"train_loss": -6.198322296142578, "global_step": 92054, "epoch": 2191} {"train_loss": -6.19667387008667, "global_step": 92055, "epoch": 2191} {"train_loss": -6.2856645584106445, "global_step": 92056, "epoch": 2191} {"train_loss": -6.227242469787598, "global_step": 92057, "epoch": 2191} {"train_loss": -6.255607604980469, "global_step": 92058, "epoch": 2191} {"train_loss": -6.200682640075684, "global_step": 92059, "epoch": 2191} {"train_loss": -6.361041069030762, "global_step": 92060, "epoch": 2191} {"train_loss": -6.188309669494629, "global_step": 92061, "epoch": 2191} {"train_loss": -6.342633247375488, "global_step": 92062, "epoch": 2191} {"train_loss": -6.281945330756051, "global_step": 92063, "epoch": 2191, "val_loss": 63679.7265625} {"train_loss": -6.1948113441467285, "global_step": 92064, "epoch": 2192} {"train_loss": -6.255838871002197, "global_step": 92065, "epoch": 2192} {"train_loss": -6.259999752044678, "global_step": 92066, "epoch": 2192} {"train_loss": -6.327127456665039, "global_step": 92067, "epoch": 2192} {"train_loss": -6.278779029846191, "global_step": 92068, "epoch": 2192} {"train_loss": -6.322319507598877, "global_step": 92069, "epoch": 2192} {"train_loss": -6.160336017608643, "global_step": 92070, "epoch": 2192} {"train_loss": -6.327749252319336, "global_step": 92071, "epoch": 2192} {"train_loss": -6.2533721923828125, "global_step": 92072, "epoch": 2192} {"train_loss": -6.251052379608154, "global_step": 92073, "epoch": 2192} {"train_loss": -6.3238525390625, "global_step": 92074, "epoch": 2192} {"train_loss": -6.4270524978637695, "global_step": 92075, "epoch": 2192} {"train_loss": -6.444336891174316, "global_step": 92076, "epoch": 2192} {"train_loss": -6.330255508422852, "global_step": 92077, "epoch": 2192} {"train_loss": -6.3034162521362305, "global_step": 92078, "epoch": 2192} {"train_loss": -6.448147296905518, "global_step": 92079, "epoch": 2192} {"train_loss": -6.280001640319824, "global_step": 92080, "epoch": 2192} {"train_loss": -6.236922264099121, "global_step": 92081, "epoch": 2192} {"train_loss": -6.333451271057129, "global_step": 92082, "epoch": 2192} {"train_loss": -6.286072731018066, "global_step": 92083, "epoch": 2192} {"train_loss": -6.208215713500977, "global_step": 92084, "epoch": 2192} {"train_loss": -6.217901706695557, "global_step": 92085, "epoch": 2192} {"train_loss": -6.288867950439453, "global_step": 92086, "epoch": 2192} {"train_loss": -6.418697357177734, "global_step": 92087, "epoch": 2192} {"train_loss": -6.328474998474121, "global_step": 92088, "epoch": 2192} {"train_loss": -6.218011856079102, "global_step": 92089, "epoch": 2192} {"train_loss": -6.361185550689697, "global_step": 92090, "epoch": 2192} {"train_loss": -6.194004058837891, "global_step": 92091, "epoch": 2192} {"train_loss": -6.1722731590271, "global_step": 92092, "epoch": 2192} {"train_loss": -6.218514442443848, "global_step": 92093, "epoch": 2192} {"train_loss": -6.2720818519592285, "global_step": 92094, "epoch": 2192} {"train_loss": -6.330044746398926, "global_step": 92095, "epoch": 2192} {"train_loss": -6.250114440917969, "global_step": 92096, "epoch": 2192} {"train_loss": -6.201898574829102, "global_step": 92097, "epoch": 2192} {"train_loss": -6.29864501953125, "global_step": 92098, "epoch": 2192} {"train_loss": -6.2668538093566895, "global_step": 92099, "epoch": 2192} {"train_loss": -6.233809471130371, "global_step": 92100, "epoch": 2192} {"train_loss": -6.199826240539551, "global_step": 92101, "epoch": 2192} {"train_loss": -6.251404762268066, "global_step": 92102, "epoch": 2192} {"train_loss": -6.374135971069336, "global_step": 92103, "epoch": 2192} {"train_loss": -6.119510650634766, "global_step": 92104, "epoch": 2192} {"train_loss": -6.277705521810622, "global_step": 92105, "epoch": 2192, "val_loss": 63425.78125} {"train_loss": -6.358811378479004, "global_step": 92106, "epoch": 2193} {"train_loss": -6.233343601226807, "global_step": 92107, "epoch": 2193} {"train_loss": -6.3228607177734375, "global_step": 92108, "epoch": 2193} {"train_loss": -6.253590106964111, "global_step": 92109, "epoch": 2193} {"train_loss": -6.172419548034668, "global_step": 92110, "epoch": 2193} {"train_loss": -6.340417861938477, "global_step": 92111, "epoch": 2193} {"train_loss": -6.3078107833862305, "global_step": 92112, "epoch": 2193} {"train_loss": -6.310916423797607, "global_step": 92113, "epoch": 2193} {"train_loss": -6.382851600646973, "global_step": 92114, "epoch": 2193} {"train_loss": -6.248439788818359, "global_step": 92115, "epoch": 2193} {"train_loss": -6.300423622131348, "global_step": 92116, "epoch": 2193} {"train_loss": -6.276050090789795, "global_step": 92117, "epoch": 2193} {"train_loss": -6.333295822143555, "global_step": 92118, "epoch": 2193} {"train_loss": -6.3096184730529785, "global_step": 92119, "epoch": 2193} {"train_loss": -6.248137474060059, "global_step": 92120, "epoch": 2193} {"train_loss": -6.294232368469238, "global_step": 92121, "epoch": 2193} {"train_loss": -6.407743453979492, "global_step": 92122, "epoch": 2193} {"train_loss": -6.238897323608398, "global_step": 92123, "epoch": 2193} {"train_loss": -6.3944597244262695, "global_step": 92124, "epoch": 2193} {"train_loss": -6.357314109802246, "global_step": 92125, "epoch": 2193} {"train_loss": -6.363126277923584, "global_step": 92126, "epoch": 2193} {"train_loss": -6.299228668212891, "global_step": 92127, "epoch": 2193} {"train_loss": -6.1466064453125, "global_step": 92128, "epoch": 2193} {"train_loss": -6.168639183044434, "global_step": 92129, "epoch": 2193} {"train_loss": -6.296244144439697, "global_step": 92130, "epoch": 2193} {"train_loss": -6.2149763107299805, "global_step": 92131, "epoch": 2193} {"train_loss": -6.361855506896973, "global_step": 92132, "epoch": 2193} {"train_loss": -6.259852409362793, "global_step": 92133, "epoch": 2193} {"train_loss": -6.1961493492126465, "global_step": 92134, "epoch": 2193} {"train_loss": -6.305262088775635, "global_step": 92135, "epoch": 2193} {"train_loss": -6.2304768562316895, "global_step": 92136, "epoch": 2193} {"train_loss": -6.270159721374512, "global_step": 92137, "epoch": 2193} {"train_loss": -6.291563034057617, "global_step": 92138, "epoch": 2193} {"train_loss": -6.228435516357422, "global_step": 92139, "epoch": 2193} {"train_loss": -6.287588119506836, "global_step": 92140, "epoch": 2193} {"train_loss": -6.229489803314209, "global_step": 92141, "epoch": 2193} {"train_loss": -6.267359733581543, "global_step": 92142, "epoch": 2193} {"train_loss": -6.313656806945801, "global_step": 92143, "epoch": 2193} {"train_loss": -6.0903754234313965, "global_step": 92144, "epoch": 2193} {"train_loss": -6.2629852294921875, "global_step": 92145, "epoch": 2193} {"train_loss": -6.1840314865112305, "global_step": 92146, "epoch": 2193} {"train_loss": -6.276542016438076, "global_step": 92147, "epoch": 2193, "val_loss": 63455.16796875} {"train_loss": -6.297051906585693, "global_step": 92148, "epoch": 2194} {"train_loss": -6.221514701843262, "global_step": 92149, "epoch": 2194} {"train_loss": -6.310023307800293, "global_step": 92150, "epoch": 2194} {"train_loss": -6.343524932861328, "global_step": 92151, "epoch": 2194} {"train_loss": -6.350268363952637, "global_step": 92152, "epoch": 2194} {"train_loss": -6.3224334716796875, "global_step": 92153, "epoch": 2194} {"train_loss": -6.234315872192383, "global_step": 92154, "epoch": 2194} {"train_loss": -6.285513877868652, "global_step": 92155, "epoch": 2194} {"train_loss": -6.3092193603515625, "global_step": 92156, "epoch": 2194} {"train_loss": -6.153365135192871, "global_step": 92157, "epoch": 2194} {"train_loss": -6.252405166625977, "global_step": 92158, "epoch": 2194} {"train_loss": -6.2900800704956055, "global_step": 92159, "epoch": 2194} {"train_loss": -6.2609944343566895, "global_step": 92160, "epoch": 2194} {"train_loss": -6.385765075683594, "global_step": 92161, "epoch": 2194} {"train_loss": -6.334305286407471, "global_step": 92162, "epoch": 2194} {"train_loss": -6.236581325531006, "global_step": 92163, "epoch": 2194} {"train_loss": -6.417954921722412, "global_step": 92164, "epoch": 2194} {"train_loss": -6.22780704498291, "global_step": 92165, "epoch": 2194} {"train_loss": -6.2596025466918945, "global_step": 92166, "epoch": 2194} {"train_loss": -6.392838478088379, "global_step": 92167, "epoch": 2194} {"train_loss": -6.196587085723877, "global_step": 92168, "epoch": 2194} {"train_loss": -6.299372673034668, "global_step": 92169, "epoch": 2194} {"train_loss": -6.195943832397461, "global_step": 92170, "epoch": 2194} {"train_loss": -6.264138698577881, "global_step": 92171, "epoch": 2194} {"train_loss": -6.268599033355713, "global_step": 92172, "epoch": 2194} {"train_loss": -6.318110942840576, "global_step": 92173, "epoch": 2194} {"train_loss": -6.241098880767822, "global_step": 92174, "epoch": 2194} {"train_loss": -6.387199401855469, "global_step": 92175, "epoch": 2194} {"train_loss": -6.250415802001953, "global_step": 92176, "epoch": 2194} {"train_loss": -6.324494361877441, "global_step": 92177, "epoch": 2194} {"train_loss": -6.366241455078125, "global_step": 92178, "epoch": 2194} {"train_loss": -6.2967424392700195, "global_step": 92179, "epoch": 2194} {"train_loss": -6.335140228271484, "global_step": 92180, "epoch": 2194} {"train_loss": -6.336036205291748, "global_step": 92181, "epoch": 2194} {"train_loss": -6.384515762329102, "global_step": 92182, "epoch": 2194} {"train_loss": -6.358955383300781, "global_step": 92183, "epoch": 2194} {"train_loss": -6.126211166381836, "global_step": 92184, "epoch": 2194} {"train_loss": -6.358871936798096, "global_step": 92185, "epoch": 2194} {"train_loss": -6.40852689743042, "global_step": 92186, "epoch": 2194} {"train_loss": -6.224830627441406, "global_step": 92187, "epoch": 2194} {"train_loss": -6.260109901428223, "global_step": 92188, "epoch": 2194} {"train_loss": -6.29400186311631, "global_step": 92189, "epoch": 2194, "val_loss": 63379.09765625} {"train_loss": -6.309746742248535, "global_step": 92190, "epoch": 2195} {"train_loss": -6.375283718109131, "global_step": 92191, "epoch": 2195} {"train_loss": -6.280597686767578, "global_step": 92192, "epoch": 2195} {"train_loss": -6.239931106567383, "global_step": 92193, "epoch": 2195} {"train_loss": -6.29574728012085, "global_step": 92194, "epoch": 2195} {"train_loss": -6.214890480041504, "global_step": 92195, "epoch": 2195} {"train_loss": -6.225220680236816, "global_step": 92196, "epoch": 2195} {"train_loss": -6.332484722137451, "global_step": 92197, "epoch": 2195} {"train_loss": -6.293030738830566, "global_step": 92198, "epoch": 2195} {"train_loss": -6.368465423583984, "global_step": 92199, "epoch": 2195} {"train_loss": -6.236788272857666, "global_step": 92200, "epoch": 2195} {"train_loss": -6.287264823913574, "global_step": 92201, "epoch": 2195} {"train_loss": -6.363164901733398, "global_step": 92202, "epoch": 2195} {"train_loss": -6.304376602172852, "global_step": 92203, "epoch": 2195} {"train_loss": -6.305238246917725, "global_step": 92204, "epoch": 2195} {"train_loss": -6.265267372131348, "global_step": 92205, "epoch": 2195} {"train_loss": -6.2711005210876465, "global_step": 92206, "epoch": 2195} {"train_loss": -6.16458797454834, "global_step": 92207, "epoch": 2195} {"train_loss": -6.31512451171875, "global_step": 92208, "epoch": 2195} {"train_loss": -6.206835746765137, "global_step": 92209, "epoch": 2195} {"train_loss": -6.239336967468262, "global_step": 92210, "epoch": 2195} {"train_loss": -6.2434892654418945, "global_step": 92211, "epoch": 2195} {"train_loss": -6.36346960067749, "global_step": 92212, "epoch": 2195} {"train_loss": -6.259101867675781, "global_step": 92213, "epoch": 2195} {"train_loss": -6.261301517486572, "global_step": 92214, "epoch": 2195} {"train_loss": -6.30222225189209, "global_step": 92215, "epoch": 2195} {"train_loss": -6.372426986694336, "global_step": 92216, "epoch": 2195} {"train_loss": -6.336634635925293, "global_step": 92217, "epoch": 2195} {"train_loss": -6.4746551513671875, "global_step": 92218, "epoch": 2195} {"train_loss": -6.224864959716797, "global_step": 92219, "epoch": 2195} {"train_loss": -6.2749409675598145, "global_step": 92220, "epoch": 2195} {"train_loss": -6.367255210876465, "global_step": 92221, "epoch": 2195} {"train_loss": -6.290348052978516, "global_step": 92222, "epoch": 2195} {"train_loss": -6.326413631439209, "global_step": 92223, "epoch": 2195} {"train_loss": -6.390449047088623, "global_step": 92224, "epoch": 2195} {"train_loss": -6.2949371337890625, "global_step": 92225, "epoch": 2195} {"train_loss": -6.310260772705078, "global_step": 92226, "epoch": 2195} {"train_loss": -6.324747085571289, "global_step": 92227, "epoch": 2195} {"train_loss": -6.372124671936035, "global_step": 92228, "epoch": 2195} {"train_loss": -6.249789237976074, "global_step": 92229, "epoch": 2195} {"train_loss": -6.328556060791016, "global_step": 92230, "epoch": 2195} {"train_loss": -6.296877656664167, "global_step": 92231, "epoch": 2195, "val_loss": 63460.78125} {"train_loss": -6.2538557052612305, "global_step": 92232, "epoch": 2196} {"train_loss": -6.319052219390869, "global_step": 92233, "epoch": 2196} {"train_loss": -6.269961833953857, "global_step": 92234, "epoch": 2196} {"train_loss": -6.331450462341309, "global_step": 92235, "epoch": 2196} {"train_loss": -6.364217758178711, "global_step": 92236, "epoch": 2196} {"train_loss": -6.161716461181641, "global_step": 92237, "epoch": 2196} {"train_loss": -6.337327003479004, "global_step": 92238, "epoch": 2196} {"train_loss": -6.370256423950195, "global_step": 92239, "epoch": 2196} {"train_loss": -6.207972526550293, "global_step": 92240, "epoch": 2196} {"train_loss": -6.231019020080566, "global_step": 92241, "epoch": 2196} {"train_loss": -6.256420612335205, "global_step": 92242, "epoch": 2196} {"train_loss": -6.254855155944824, "global_step": 92243, "epoch": 2196} {"train_loss": -6.327377796173096, "global_step": 92244, "epoch": 2196} {"train_loss": -6.135341167449951, "global_step": 92245, "epoch": 2196} {"train_loss": -6.237119674682617, "global_step": 92246, "epoch": 2196} {"train_loss": -6.183796405792236, "global_step": 92247, "epoch": 2196} {"train_loss": -6.211550235748291, "global_step": 92248, "epoch": 2196} {"train_loss": -6.297829627990723, "global_step": 92249, "epoch": 2196} {"train_loss": -6.259688377380371, "global_step": 92250, "epoch": 2196} {"train_loss": -6.219582557678223, "global_step": 92251, "epoch": 2196} {"train_loss": -6.280884742736816, "global_step": 92252, "epoch": 2196} {"train_loss": -6.17283296585083, "global_step": 92253, "epoch": 2196} {"train_loss": -6.336864948272705, "global_step": 92254, "epoch": 2196} {"train_loss": -6.2239179611206055, "global_step": 92255, "epoch": 2196} {"train_loss": -6.286942005157471, "global_step": 92256, "epoch": 2196} {"train_loss": -6.413043975830078, "global_step": 92257, "epoch": 2196} {"train_loss": -6.219715118408203, "global_step": 92258, "epoch": 2196} {"train_loss": -6.293560028076172, "global_step": 92259, "epoch": 2196} {"train_loss": -6.2457275390625, "global_step": 92260, "epoch": 2196} {"train_loss": -6.2768707275390625, "global_step": 92261, "epoch": 2196} {"train_loss": -6.1355671882629395, "global_step": 92262, "epoch": 2196} {"train_loss": -6.171755790710449, "global_step": 92263, "epoch": 2196} {"train_loss": -6.249810218811035, "global_step": 92264, "epoch": 2196} {"train_loss": -6.239418029785156, "global_step": 92265, "epoch": 2196} {"train_loss": -6.396402835845947, "global_step": 92266, "epoch": 2196} {"train_loss": -6.269532680511475, "global_step": 92267, "epoch": 2196} {"train_loss": -6.213536262512207, "global_step": 92268, "epoch": 2196} {"train_loss": -6.2530903816223145, "global_step": 92269, "epoch": 2196} {"train_loss": -6.283790588378906, "global_step": 92270, "epoch": 2196} {"train_loss": -6.2881598472595215, "global_step": 92271, "epoch": 2196} {"train_loss": -6.2858171463012695, "global_step": 92272, "epoch": 2196} {"train_loss": -6.2635286422002885, "global_step": 92273, "epoch": 2196, "val_loss": 63351.90625} {"train_loss": -6.3293352127075195, "global_step": 92274, "epoch": 2197} {"train_loss": -6.2526421546936035, "global_step": 92275, "epoch": 2197} {"train_loss": -6.2298173904418945, "global_step": 92276, "epoch": 2197} {"train_loss": -6.313006401062012, "global_step": 92277, "epoch": 2197} {"train_loss": -6.2582011222839355, "global_step": 92278, "epoch": 2197} {"train_loss": -6.162213325500488, "global_step": 92279, "epoch": 2197} {"train_loss": -6.292402267456055, "global_step": 92280, "epoch": 2197} {"train_loss": -6.332582473754883, "global_step": 92281, "epoch": 2197} {"train_loss": -6.377655982971191, "global_step": 92282, "epoch": 2197} {"train_loss": -6.3044939041137695, "global_step": 92283, "epoch": 2197} {"train_loss": -6.318990230560303, "global_step": 92284, "epoch": 2197} {"train_loss": -6.239382743835449, "global_step": 92285, "epoch": 2197} {"train_loss": -6.233114242553711, "global_step": 92286, "epoch": 2197} {"train_loss": -6.260909080505371, "global_step": 92287, "epoch": 2197} {"train_loss": -6.365274429321289, "global_step": 92288, "epoch": 2197} {"train_loss": -6.091059684753418, "global_step": 92289, "epoch": 2197} {"train_loss": -6.171875953674316, "global_step": 92290, "epoch": 2197} {"train_loss": -6.339362621307373, "global_step": 92291, "epoch": 2197} {"train_loss": -6.344378471374512, "global_step": 92292, "epoch": 2197} {"train_loss": -6.128637313842773, "global_step": 92293, "epoch": 2197} {"train_loss": -6.31764030456543, "global_step": 92294, "epoch": 2197} {"train_loss": -6.240261077880859, "global_step": 92295, "epoch": 2197} {"train_loss": -6.20549201965332, "global_step": 92296, "epoch": 2197} {"train_loss": -6.295539855957031, "global_step": 92297, "epoch": 2197} {"train_loss": -6.224100112915039, "global_step": 92298, "epoch": 2197} {"train_loss": -6.25896692276001, "global_step": 92299, "epoch": 2197} {"train_loss": -6.32459020614624, "global_step": 92300, "epoch": 2197} {"train_loss": -6.340012550354004, "global_step": 92301, "epoch": 2197} {"train_loss": -6.299535274505615, "global_step": 92302, "epoch": 2197} {"train_loss": -6.259039878845215, "global_step": 92303, "epoch": 2197} {"train_loss": -6.326012134552002, "global_step": 92304, "epoch": 2197} {"train_loss": -6.342215061187744, "global_step": 92305, "epoch": 2197} {"train_loss": -6.201055526733398, "global_step": 92306, "epoch": 2197} {"train_loss": -6.199605941772461, "global_step": 92307, "epoch": 2197} {"train_loss": -6.253580093383789, "global_step": 92308, "epoch": 2197} {"train_loss": -6.204654216766357, "global_step": 92309, "epoch": 2197} {"train_loss": -6.232550621032715, "global_step": 92310, "epoch": 2197} {"train_loss": -6.320200443267822, "global_step": 92311, "epoch": 2197} {"train_loss": -6.322966575622559, "global_step": 92312, "epoch": 2197} {"train_loss": -6.119569778442383, "global_step": 92313, "epoch": 2197} {"train_loss": -6.3188958168029785, "global_step": 92314, "epoch": 2197} {"train_loss": -6.267632427669707, "global_step": 92315, "epoch": 2197, "val_loss": 63477.07421875} {"train_loss": -6.338247299194336, "global_step": 92316, "epoch": 2198} {"train_loss": -6.265408515930176, "global_step": 92317, "epoch": 2198} {"train_loss": -6.2470293045043945, "global_step": 92318, "epoch": 2198} {"train_loss": -6.358074188232422, "global_step": 92319, "epoch": 2198} {"train_loss": -6.395066261291504, "global_step": 92320, "epoch": 2198} {"train_loss": -6.278050899505615, "global_step": 92321, "epoch": 2198} {"train_loss": -6.144305229187012, "global_step": 92322, "epoch": 2198} {"train_loss": -6.259319305419922, "global_step": 92323, "epoch": 2198} {"train_loss": -6.259616374969482, "global_step": 92324, "epoch": 2198} {"train_loss": -6.317497730255127, "global_step": 92325, "epoch": 2198} {"train_loss": -6.187501907348633, "global_step": 92326, "epoch": 2198} {"train_loss": -6.292691230773926, "global_step": 92327, "epoch": 2198} {"train_loss": -6.208953857421875, "global_step": 92328, "epoch": 2198} {"train_loss": -6.344390869140625, "global_step": 92329, "epoch": 2198} {"train_loss": -6.312328338623047, "global_step": 92330, "epoch": 2198} {"train_loss": -6.138106346130371, "global_step": 92331, "epoch": 2198} {"train_loss": -6.249670028686523, "global_step": 92332, "epoch": 2198} {"train_loss": -6.242720603942871, "global_step": 92333, "epoch": 2198} {"train_loss": -6.311391830444336, "global_step": 92334, "epoch": 2198} {"train_loss": -6.258213043212891, "global_step": 92335, "epoch": 2198} {"train_loss": -6.2169084548950195, "global_step": 92336, "epoch": 2198} {"train_loss": -6.359727382659912, "global_step": 92337, "epoch": 2198} {"train_loss": -6.253817081451416, "global_step": 92338, "epoch": 2198} {"train_loss": -6.261936187744141, "global_step": 92339, "epoch": 2198} {"train_loss": -6.394412040710449, "global_step": 92340, "epoch": 2198} {"train_loss": -6.184534549713135, "global_step": 92341, "epoch": 2198} {"train_loss": -6.325505256652832, "global_step": 92342, "epoch": 2198} {"train_loss": -6.250946998596191, "global_step": 92343, "epoch": 2198} {"train_loss": -6.215871810913086, "global_step": 92344, "epoch": 2198} {"train_loss": -6.322054386138916, "global_step": 92345, "epoch": 2198} {"train_loss": -6.257838249206543, "global_step": 92346, "epoch": 2198} {"train_loss": -6.2315673828125, "global_step": 92347, "epoch": 2198} {"train_loss": -6.262239933013916, "global_step": 92348, "epoch": 2198} {"train_loss": -6.328326225280762, "global_step": 92349, "epoch": 2198} {"train_loss": -6.312649726867676, "global_step": 92350, "epoch": 2198} {"train_loss": -6.2556867599487305, "global_step": 92351, "epoch": 2198} {"train_loss": -6.233623504638672, "global_step": 92352, "epoch": 2198} {"train_loss": -6.23655891418457, "global_step": 92353, "epoch": 2198} {"train_loss": -6.285353660583496, "global_step": 92354, "epoch": 2198} {"train_loss": -6.290946960449219, "global_step": 92355, "epoch": 2198} {"train_loss": -6.203106880187988, "global_step": 92356, "epoch": 2198} {"train_loss": -6.269140084584554, "global_step": 92357, "epoch": 2198, "val_loss": 63217.9765625} {"train_loss": -6.244733810424805, "global_step": 92358, "epoch": 2199} {"train_loss": -6.38370418548584, "global_step": 92359, "epoch": 2199} {"train_loss": -6.181910514831543, "global_step": 92360, "epoch": 2199} {"train_loss": -6.22917366027832, "global_step": 92361, "epoch": 2199} {"train_loss": -6.279129981994629, "global_step": 92362, "epoch": 2199} {"train_loss": -6.200920104980469, "global_step": 92363, "epoch": 2199} {"train_loss": -6.330045700073242, "global_step": 92364, "epoch": 2199} {"train_loss": -6.351324081420898, "global_step": 92365, "epoch": 2199} {"train_loss": -6.186107158660889, "global_step": 92366, "epoch": 2199} {"train_loss": -6.341228485107422, "global_step": 92367, "epoch": 2199} {"train_loss": -6.240593910217285, "global_step": 92368, "epoch": 2199} {"train_loss": -6.237288951873779, "global_step": 92369, "epoch": 2199} {"train_loss": -6.291170120239258, "global_step": 92370, "epoch": 2199} {"train_loss": -6.263803482055664, "global_step": 92371, "epoch": 2199} {"train_loss": -6.157570838928223, "global_step": 92372, "epoch": 2199} {"train_loss": -6.2030110359191895, "global_step": 92373, "epoch": 2199} {"train_loss": -6.213695049285889, "global_step": 92374, "epoch": 2199} {"train_loss": -6.108595371246338, "global_step": 92375, "epoch": 2199} {"train_loss": -6.144593238830566, "global_step": 92376, "epoch": 2199} {"train_loss": -6.247377395629883, "global_step": 92377, "epoch": 2199} {"train_loss": -6.238498687744141, "global_step": 92378, "epoch": 2199} {"train_loss": -6.165260314941406, "global_step": 92379, "epoch": 2199} {"train_loss": -6.205597400665283, "global_step": 92380, "epoch": 2199} {"train_loss": -6.265485763549805, "global_step": 92381, "epoch": 2199} {"train_loss": -6.234190940856934, "global_step": 92382, "epoch": 2199} {"train_loss": -6.29279899597168, "global_step": 92383, "epoch": 2199} {"train_loss": -6.306092262268066, "global_step": 92384, "epoch": 2199} {"train_loss": -6.137951850891113, "global_step": 92385, "epoch": 2199} {"train_loss": -6.225236892700195, "global_step": 92386, "epoch": 2199} {"train_loss": -6.293444633483887, "global_step": 92387, "epoch": 2199} {"train_loss": -6.318430423736572, "global_step": 92388, "epoch": 2199} {"train_loss": -6.187483787536621, "global_step": 92389, "epoch": 2199} {"train_loss": -6.164419174194336, "global_step": 92390, "epoch": 2199} {"train_loss": -6.251481533050537, "global_step": 92391, "epoch": 2199} {"train_loss": -6.2441301345825195, "global_step": 92392, "epoch": 2199} {"train_loss": -6.279408931732178, "global_step": 92393, "epoch": 2199} {"train_loss": -6.349865913391113, "global_step": 92394, "epoch": 2199} {"train_loss": -6.316514015197754, "global_step": 92395, "epoch": 2199} {"train_loss": -6.35706901550293, "global_step": 92396, "epoch": 2199} {"train_loss": -6.308995723724365, "global_step": 92397, "epoch": 2199} {"train_loss": -6.237427711486816, "global_step": 92398, "epoch": 2199} {"train_loss": -6.249843892597017, "global_step": 92399, "epoch": 2199, "val_loss": 63160.75390625} {"train_loss": -6.210637092590332, "global_step": 92400, "epoch": 2200} {"train_loss": -6.3242902755737305, "global_step": 92401, "epoch": 2200} {"train_loss": -6.3722028732299805, "global_step": 92402, "epoch": 2200} {"train_loss": -6.29630708694458, "global_step": 92403, "epoch": 2200} {"train_loss": -6.3911261558532715, "global_step": 92404, "epoch": 2200} {"train_loss": -6.3581037521362305, "global_step": 92405, "epoch": 2200} {"train_loss": -6.259027481079102, "global_step": 92406, "epoch": 2200} {"train_loss": -6.3274455070495605, "global_step": 92407, "epoch": 2200} {"train_loss": -6.254950523376465, "global_step": 92408, "epoch": 2200} {"train_loss": -6.309921741485596, "global_step": 92409, "epoch": 2200} {"train_loss": -6.3376922607421875, "global_step": 92410, "epoch": 2200} {"train_loss": -6.2395710945129395, "global_step": 92411, "epoch": 2200} {"train_loss": -6.31114387512207, "global_step": 92412, "epoch": 2200} {"train_loss": -6.253866195678711, "global_step": 92413, "epoch": 2200} {"train_loss": -6.364879608154297, "global_step": 92414, "epoch": 2200} {"train_loss": -6.209780693054199, "global_step": 92415, "epoch": 2200} {"train_loss": -6.240628242492676, "global_step": 92416, "epoch": 2200} {"train_loss": -6.223586082458496, "global_step": 92417, "epoch": 2200} {"train_loss": -6.251257419586182, "global_step": 92418, "epoch": 2200} {"train_loss": -6.261717319488525, "global_step": 92419, "epoch": 2200} {"train_loss": -6.285887718200684, "global_step": 92420, "epoch": 2200} {"train_loss": -6.191746711730957, "global_step": 92421, "epoch": 2200} {"train_loss": -6.268563270568848, "global_step": 92422, "epoch": 2200} {"train_loss": -6.150949001312256, "global_step": 92423, "epoch": 2200} {"train_loss": -6.274930953979492, "global_step": 92424, "epoch": 2200} {"train_loss": -6.3398051261901855, "global_step": 92425, "epoch": 2200} {"train_loss": -6.280616283416748, "global_step": 92426, "epoch": 2200} {"train_loss": -6.366013050079346, "global_step": 92427, "epoch": 2200} {"train_loss": -6.348043441772461, "global_step": 92428, "epoch": 2200} {"train_loss": -6.3103814125061035, "global_step": 92429, "epoch": 2200} {"train_loss": -6.220367431640625, "global_step": 92430, "epoch": 2200} {"train_loss": -6.198299407958984, "global_step": 92431, "epoch": 2200} {"train_loss": -6.323076248168945, "global_step": 92432, "epoch": 2200} {"train_loss": -6.262932777404785, "global_step": 92433, "epoch": 2200} {"train_loss": -6.285637378692627, "global_step": 92434, "epoch": 2200} {"train_loss": -6.276264190673828, "global_step": 92435, "epoch": 2200} {"train_loss": -6.23250150680542, "global_step": 92436, "epoch": 2200} {"train_loss": -6.274977207183838, "global_step": 92437, "epoch": 2200} {"train_loss": -6.205417633056641, "global_step": 92438, "epoch": 2200} {"train_loss": -6.349175453186035, "global_step": 92439, "epoch": 2200} {"train_loss": -6.282312393188477, "global_step": 92440, "epoch": 2200} {"train_loss": -6.280322665259952, "global_step": 92441, "epoch": 2200, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.308412083937713, "train/sim_max_reward_2": 0.7845828171439228, "train/sim_max_reward_3": 0.4268609107647355, "train/sim_max_reward_4": 0.969505350385452, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.021047152400894463, "test/sim_max_reward_4300001": 0.5565661725766061, "test/sim_max_reward_4300002": 0.9852411379600496, "test/sim_max_reward_4300003": 0.958261892075495, "test/sim_max_reward_4300004": 0.2173013292395665, "test/sim_max_reward_4300005": 0.9638937361404047, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.6904943089457469, "test/sim_max_reward_4300008": 0.8390318075537441, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9760712363637792, "test/sim_max_reward_4300012": 0.8269342560960299, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.8891013274384282, "test/sim_max_reward_4300016": 0.5743867607018214, "test/sim_max_reward_4300017": 0.3060227962242664, "test/sim_max_reward_4300018": 0.3644006480414135, "test/sim_max_reward_4300019": 0.18668266039892828, "test/sim_max_reward_4300020": 0.9999106011961917, "test/sim_max_reward_4300021": 0.9371305919968017, "test/sim_max_reward_4300022": 0.9136002787230254, "test/sim_max_reward_4300023": 0.3297529980876195, "test/sim_max_reward_4300024": 0.9069838187087618, "test/sim_max_reward_4300025": 0.6744429781834156, "test/sim_max_reward_4300026": 0.13471692744510333, "test/sim_max_reward_4300027": 0.8106085642908483, "test/sim_max_reward_4300028": 0.7786831706100951, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.980686782722905, "test/sim_max_reward_4300031": 0.9089341991986345, "test/sim_max_reward_4300032": 0.9635523519614327, "test/sim_max_reward_4300033": 0.7854323437815097, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.3401259399681094, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.926165270561198, "test/sim_max_reward_4300038": 0.8239337300152064, "test/sim_max_reward_4300039": 0.9351593351884752, "test/sim_max_reward_4300040": 0.9459572209377929, "test/sim_max_reward_4300041": 0.9449262374146282, "test/sim_max_reward_4300042": 0.8407534071569034, "test/sim_max_reward_4300043": 0.5836647123887679, "test/sim_max_reward_4300044": 0.9589169599007493, "test/sim_max_reward_4300045": 0.19529554474234373, "test/sim_max_reward_4300046": 0.9667697838966609, "test/sim_max_reward_4300047": 0.6669184524057589, "test/sim_max_reward_4300048": 0.34897602493437047, "test/sim_max_reward_4300049": 0.3427161666498444, "train/mean_score": 0.4787739030333438, "test/mean_score": 0.6499869146157562, "val_loss": 63309.65625} {"train_loss": -6.220101356506348, "global_step": 92442, "epoch": 2201} {"train_loss": -6.196750640869141, "global_step": 92443, "epoch": 2201} {"train_loss": -6.275049686431885, "global_step": 92444, "epoch": 2201} {"train_loss": -6.319971561431885, "global_step": 92445, "epoch": 2201} {"train_loss": -6.294830322265625, "global_step": 92446, "epoch": 2201} {"train_loss": -6.243115425109863, "global_step": 92447, "epoch": 2201} {"train_loss": -6.340299606323242, "global_step": 92448, "epoch": 2201} {"train_loss": -6.3229899406433105, "global_step": 92449, "epoch": 2201} {"train_loss": -6.3020453453063965, "global_step": 92450, "epoch": 2201} {"train_loss": -6.2868266105651855, "global_step": 92451, "epoch": 2201} {"train_loss": -6.336417198181152, "global_step": 92452, "epoch": 2201} {"train_loss": -6.389153957366943, "global_step": 92453, "epoch": 2201} {"train_loss": -6.402128219604492, "global_step": 92454, "epoch": 2201} {"train_loss": -6.21060848236084, "global_step": 92455, "epoch": 2201} {"train_loss": -6.288455009460449, "global_step": 92456, "epoch": 2201} {"train_loss": -6.266665458679199, "global_step": 92457, "epoch": 2201} {"train_loss": -6.18880558013916, "global_step": 92458, "epoch": 2201} {"train_loss": -6.398650169372559, "global_step": 92459, "epoch": 2201} {"train_loss": -6.279474258422852, "global_step": 92460, "epoch": 2201} {"train_loss": -6.323385715484619, "global_step": 92461, "epoch": 2201} {"train_loss": -6.206287384033203, "global_step": 92462, "epoch": 2201} {"train_loss": -6.313422203063965, "global_step": 92463, "epoch": 2201} {"train_loss": -6.313745498657227, "global_step": 92464, "epoch": 2201} {"train_loss": -6.151344299316406, "global_step": 92465, "epoch": 2201} {"train_loss": -6.268660068511963, "global_step": 92466, "epoch": 2201} {"train_loss": -6.177515506744385, "global_step": 92467, "epoch": 2201} {"train_loss": -6.241155624389648, "global_step": 92468, "epoch": 2201} {"train_loss": -6.321070194244385, "global_step": 92469, "epoch": 2201} {"train_loss": -6.167444705963135, "global_step": 92470, "epoch": 2201} {"train_loss": -6.228849411010742, "global_step": 92471, "epoch": 2201} {"train_loss": -6.238272190093994, "global_step": 92472, "epoch": 2201} {"train_loss": -6.2730255126953125, "global_step": 92473, "epoch": 2201} {"train_loss": -6.230121612548828, "global_step": 92474, "epoch": 2201} {"train_loss": -6.282232761383057, "global_step": 92475, "epoch": 2201} {"train_loss": -6.219182968139648, "global_step": 92476, "epoch": 2201} {"train_loss": -6.210885524749756, "global_step": 92477, "epoch": 2201} {"train_loss": -6.277165412902832, "global_step": 92478, "epoch": 2201} {"train_loss": -6.269141674041748, "global_step": 92479, "epoch": 2201} {"train_loss": -6.254236221313477, "global_step": 92480, "epoch": 2201} {"train_loss": -6.268178939819336, "global_step": 92481, "epoch": 2201} {"train_loss": -6.394190311431885, "global_step": 92482, "epoch": 2201} {"train_loss": -6.275498549143474, "global_step": 92483, "epoch": 2201, "val_loss": 63333.58203125} {"train_loss": -6.277898788452148, "global_step": 92484, "epoch": 2202} {"train_loss": -6.2295451164245605, "global_step": 92485, "epoch": 2202} {"train_loss": -6.320666790008545, "global_step": 92486, "epoch": 2202} {"train_loss": -6.30515718460083, "global_step": 92487, "epoch": 2202} {"train_loss": -6.360485553741455, "global_step": 92488, "epoch": 2202} {"train_loss": -6.3026814460754395, "global_step": 92489, "epoch": 2202} {"train_loss": -6.312847137451172, "global_step": 92490, "epoch": 2202} {"train_loss": -6.265621185302734, "global_step": 92491, "epoch": 2202} {"train_loss": -6.335527420043945, "global_step": 92492, "epoch": 2202} {"train_loss": -6.268492221832275, "global_step": 92493, "epoch": 2202} {"train_loss": -6.393701553344727, "global_step": 92494, "epoch": 2202} {"train_loss": -6.305605888366699, "global_step": 92495, "epoch": 2202} {"train_loss": -6.169007301330566, "global_step": 92496, "epoch": 2202} {"train_loss": -6.24064826965332, "global_step": 92497, "epoch": 2202} {"train_loss": -6.40077018737793, "global_step": 92498, "epoch": 2202} {"train_loss": -6.182929515838623, "global_step": 92499, "epoch": 2202} {"train_loss": -6.2461371421813965, "global_step": 92500, "epoch": 2202} {"train_loss": -6.245849609375, "global_step": 92501, "epoch": 2202} {"train_loss": -6.303564071655273, "global_step": 92502, "epoch": 2202} {"train_loss": -6.233549118041992, "global_step": 92503, "epoch": 2202} {"train_loss": -6.241281509399414, "global_step": 92504, "epoch": 2202} {"train_loss": -6.396566390991211, "global_step": 92505, "epoch": 2202} {"train_loss": -6.433371543884277, "global_step": 92506, "epoch": 2202} {"train_loss": -6.204463005065918, "global_step": 92507, "epoch": 2202} {"train_loss": -6.320923328399658, "global_step": 92508, "epoch": 2202} {"train_loss": -6.188159942626953, "global_step": 92509, "epoch": 2202} {"train_loss": -6.191749095916748, "global_step": 92510, "epoch": 2202} {"train_loss": -6.332869529724121, "global_step": 92511, "epoch": 2202} {"train_loss": -6.293989181518555, "global_step": 92512, "epoch": 2202} {"train_loss": -6.262557029724121, "global_step": 92513, "epoch": 2202} {"train_loss": -6.284723281860352, "global_step": 92514, "epoch": 2202} {"train_loss": -6.28154182434082, "global_step": 92515, "epoch": 2202} {"train_loss": -6.247864246368408, "global_step": 92516, "epoch": 2202} {"train_loss": -6.390449523925781, "global_step": 92517, "epoch": 2202} {"train_loss": -6.3152666091918945, "global_step": 92518, "epoch": 2202} {"train_loss": -6.400372505187988, "global_step": 92519, "epoch": 2202} {"train_loss": -6.307412147521973, "global_step": 92520, "epoch": 2202} {"train_loss": -6.335930824279785, "global_step": 92521, "epoch": 2202} {"train_loss": -6.224275588989258, "global_step": 92522, "epoch": 2202} {"train_loss": -6.266389846801758, "global_step": 92523, "epoch": 2202} {"train_loss": -6.264627933502197, "global_step": 92524, "epoch": 2202} {"train_loss": -6.292497827893212, "global_step": 92525, "epoch": 2202, "val_loss": 63257.046875} {"train_loss": -6.33663272857666, "global_step": 92526, "epoch": 2203} {"train_loss": -6.343545913696289, "global_step": 92527, "epoch": 2203} {"train_loss": -6.236257553100586, "global_step": 92528, "epoch": 2203} {"train_loss": -6.249144554138184, "global_step": 92529, "epoch": 2203} {"train_loss": -6.344446182250977, "global_step": 92530, "epoch": 2203} {"train_loss": -6.245323181152344, "global_step": 92531, "epoch": 2203} {"train_loss": -6.310855388641357, "global_step": 92532, "epoch": 2203} {"train_loss": -6.2408037185668945, "global_step": 92533, "epoch": 2203} {"train_loss": -6.294975280761719, "global_step": 92534, "epoch": 2203} {"train_loss": -6.251699447631836, "global_step": 92535, "epoch": 2203} {"train_loss": -6.2457356452941895, "global_step": 92536, "epoch": 2203} {"train_loss": -6.307244300842285, "global_step": 92537, "epoch": 2203} {"train_loss": -6.350365161895752, "global_step": 92538, "epoch": 2203} {"train_loss": -6.2536091804504395, "global_step": 92539, "epoch": 2203} {"train_loss": -6.250147819519043, "global_step": 92540, "epoch": 2203} {"train_loss": -6.27000617980957, "global_step": 92541, "epoch": 2203} {"train_loss": -6.338254928588867, "global_step": 92542, "epoch": 2203} {"train_loss": -6.378270149230957, "global_step": 92543, "epoch": 2203} {"train_loss": -6.27419376373291, "global_step": 92544, "epoch": 2203} {"train_loss": -6.25257682800293, "global_step": 92545, "epoch": 2203} {"train_loss": -6.281041145324707, "global_step": 92546, "epoch": 2203} {"train_loss": -6.2592387199401855, "global_step": 92547, "epoch": 2203} {"train_loss": -6.404265403747559, "global_step": 92548, "epoch": 2203} {"train_loss": -6.211581707000732, "global_step": 92549, "epoch": 2203} {"train_loss": -6.265689849853516, "global_step": 92550, "epoch": 2203} {"train_loss": -6.333621978759766, "global_step": 92551, "epoch": 2203} {"train_loss": -6.258213996887207, "global_step": 92552, "epoch": 2203} {"train_loss": -6.334427833557129, "global_step": 92553, "epoch": 2203} {"train_loss": -6.226059913635254, "global_step": 92554, "epoch": 2203} {"train_loss": -6.215868949890137, "global_step": 92555, "epoch": 2203} {"train_loss": -6.297390937805176, "global_step": 92556, "epoch": 2203} {"train_loss": -6.210757255554199, "global_step": 92557, "epoch": 2203} {"train_loss": -6.3011369705200195, "global_step": 92558, "epoch": 2203} {"train_loss": -6.275812149047852, "global_step": 92559, "epoch": 2203} {"train_loss": -6.265130996704102, "global_step": 92560, "epoch": 2203} {"train_loss": -6.238747596740723, "global_step": 92561, "epoch": 2203} {"train_loss": -6.185395240783691, "global_step": 92562, "epoch": 2203} {"train_loss": -6.266087055206299, "global_step": 92563, "epoch": 2203} {"train_loss": -6.168910026550293, "global_step": 92564, "epoch": 2203} {"train_loss": -6.2524003982543945, "global_step": 92565, "epoch": 2203} {"train_loss": -6.2342610359191895, "global_step": 92566, "epoch": 2203} {"train_loss": -6.273278009323847, "global_step": 92567, "epoch": 2203, "val_loss": 63486.48046875} {"train_loss": -6.252508163452148, "global_step": 92568, "epoch": 2204} {"train_loss": -6.215243339538574, "global_step": 92569, "epoch": 2204} {"train_loss": -6.255982398986816, "global_step": 92570, "epoch": 2204} {"train_loss": -6.208409309387207, "global_step": 92571, "epoch": 2204} {"train_loss": -6.233239650726318, "global_step": 92572, "epoch": 2204} {"train_loss": -6.323982238769531, "global_step": 92573, "epoch": 2204} {"train_loss": -6.283262252807617, "global_step": 92574, "epoch": 2204} {"train_loss": -6.255073070526123, "global_step": 92575, "epoch": 2204} {"train_loss": -6.24267578125, "global_step": 92576, "epoch": 2204} {"train_loss": -6.224233150482178, "global_step": 92577, "epoch": 2204} {"train_loss": -6.179813385009766, "global_step": 92578, "epoch": 2204} {"train_loss": -6.248810768127441, "global_step": 92579, "epoch": 2204} {"train_loss": -6.425865173339844, "global_step": 92580, "epoch": 2204} {"train_loss": -6.270935535430908, "global_step": 92581, "epoch": 2204} {"train_loss": -6.286805152893066, "global_step": 92582, "epoch": 2204} {"train_loss": -6.312095642089844, "global_step": 92583, "epoch": 2204} {"train_loss": -6.339725494384766, "global_step": 92584, "epoch": 2204} {"train_loss": -6.276801586151123, "global_step": 92585, "epoch": 2204} {"train_loss": -6.264168739318848, "global_step": 92586, "epoch": 2204} {"train_loss": -6.252721786499023, "global_step": 92587, "epoch": 2204} {"train_loss": -6.261874198913574, "global_step": 92588, "epoch": 2204} {"train_loss": -6.337912559509277, "global_step": 92589, "epoch": 2204} {"train_loss": -6.292801856994629, "global_step": 92590, "epoch": 2204} {"train_loss": -6.31336784362793, "global_step": 92591, "epoch": 2204} {"train_loss": -6.233553409576416, "global_step": 92592, "epoch": 2204} {"train_loss": -6.24847936630249, "global_step": 92593, "epoch": 2204} {"train_loss": -6.383699893951416, "global_step": 92594, "epoch": 2204} {"train_loss": -6.333050727844238, "global_step": 92595, "epoch": 2204} {"train_loss": -6.251107692718506, "global_step": 92596, "epoch": 2204} {"train_loss": -6.231040000915527, "global_step": 92597, "epoch": 2204} {"train_loss": -6.3415327072143555, "global_step": 92598, "epoch": 2204} {"train_loss": -6.355591773986816, "global_step": 92599, "epoch": 2204} {"train_loss": -6.249732494354248, "global_step": 92600, "epoch": 2204} {"train_loss": -6.274303436279297, "global_step": 92601, "epoch": 2204} {"train_loss": -6.274792671203613, "global_step": 92602, "epoch": 2204} {"train_loss": -6.303617000579834, "global_step": 92603, "epoch": 2204} {"train_loss": -6.368281364440918, "global_step": 92604, "epoch": 2204} {"train_loss": -6.244867324829102, "global_step": 92605, "epoch": 2204} {"train_loss": -6.380020618438721, "global_step": 92606, "epoch": 2204} {"train_loss": -6.236367225646973, "global_step": 92607, "epoch": 2204} {"train_loss": -6.312434196472168, "global_step": 92608, "epoch": 2204} {"train_loss": -6.278766223362514, "global_step": 92609, "epoch": 2204, "val_loss": 63140.52734375} {"train_loss": -6.205692291259766, "global_step": 92610, "epoch": 2205} {"train_loss": -6.2935028076171875, "global_step": 92611, "epoch": 2205} {"train_loss": -6.315745830535889, "global_step": 92612, "epoch": 2205} {"train_loss": -6.202751636505127, "global_step": 92613, "epoch": 2205} {"train_loss": -6.285772323608398, "global_step": 92614, "epoch": 2205} {"train_loss": -6.394299030303955, "global_step": 92615, "epoch": 2205} {"train_loss": -6.352159023284912, "global_step": 92616, "epoch": 2205} {"train_loss": -6.284992218017578, "global_step": 92617, "epoch": 2205} {"train_loss": -6.355442047119141, "global_step": 92618, "epoch": 2205} {"train_loss": -6.260567665100098, "global_step": 92619, "epoch": 2205} {"train_loss": -6.244596481323242, "global_step": 92620, "epoch": 2205} {"train_loss": -6.136934280395508, "global_step": 92621, "epoch": 2205} {"train_loss": -6.259347438812256, "global_step": 92622, "epoch": 2205} {"train_loss": -6.294456958770752, "global_step": 92623, "epoch": 2205} {"train_loss": -6.219110012054443, "global_step": 92624, "epoch": 2205} {"train_loss": -6.30732536315918, "global_step": 92625, "epoch": 2205} {"train_loss": -6.271937370300293, "global_step": 92626, "epoch": 2205} {"train_loss": -6.2678632736206055, "global_step": 92627, "epoch": 2205} {"train_loss": -6.2145676612854, "global_step": 92628, "epoch": 2205} {"train_loss": -6.3071088790893555, "global_step": 92629, "epoch": 2205} {"train_loss": -6.252740383148193, "global_step": 92630, "epoch": 2205} {"train_loss": -6.212482452392578, "global_step": 92631, "epoch": 2205} {"train_loss": -6.333186626434326, "global_step": 92632, "epoch": 2205} {"train_loss": -6.378204345703125, "global_step": 92633, "epoch": 2205} {"train_loss": -6.263149261474609, "global_step": 92634, "epoch": 2205} {"train_loss": -6.1768035888671875, "global_step": 92635, "epoch": 2205} {"train_loss": -6.283527374267578, "global_step": 92636, "epoch": 2205} {"train_loss": -6.364115238189697, "global_step": 92637, "epoch": 2205} {"train_loss": -6.382013320922852, "global_step": 92638, "epoch": 2205} {"train_loss": -6.186140060424805, "global_step": 92639, "epoch": 2205} {"train_loss": -6.249837875366211, "global_step": 92640, "epoch": 2205} {"train_loss": -6.164562225341797, "global_step": 92641, "epoch": 2205} {"train_loss": -6.321168899536133, "global_step": 92642, "epoch": 2205} {"train_loss": -6.199644565582275, "global_step": 92643, "epoch": 2205} {"train_loss": -6.233180046081543, "global_step": 92644, "epoch": 2205} {"train_loss": -6.316065788269043, "global_step": 92645, "epoch": 2205} {"train_loss": -6.272643089294434, "global_step": 92646, "epoch": 2205} {"train_loss": -6.287353515625, "global_step": 92647, "epoch": 2205} {"train_loss": -6.293593883514404, "global_step": 92648, "epoch": 2205} {"train_loss": -6.187736511230469, "global_step": 92649, "epoch": 2205} {"train_loss": -6.283567428588867, "global_step": 92650, "epoch": 2205} {"train_loss": -6.270026649747576, "global_step": 92651, "epoch": 2205, "val_loss": 63417.6796875} {"train_loss": -6.273804664611816, "global_step": 92652, "epoch": 2206} {"train_loss": -6.25420618057251, "global_step": 92653, "epoch": 2206} {"train_loss": -6.268683433532715, "global_step": 92654, "epoch": 2206} {"train_loss": -6.316810131072998, "global_step": 92655, "epoch": 2206} {"train_loss": -6.241115570068359, "global_step": 92656, "epoch": 2206} {"train_loss": -6.27894401550293, "global_step": 92657, "epoch": 2206} {"train_loss": -6.219390869140625, "global_step": 92658, "epoch": 2206} {"train_loss": -6.221490383148193, "global_step": 92659, "epoch": 2206} {"train_loss": -6.385315895080566, "global_step": 92660, "epoch": 2206} {"train_loss": -6.279444694519043, "global_step": 92661, "epoch": 2206} {"train_loss": -6.256914138793945, "global_step": 92662, "epoch": 2206} {"train_loss": -6.342198371887207, "global_step": 92663, "epoch": 2206} {"train_loss": -6.317717552185059, "global_step": 92664, "epoch": 2206} {"train_loss": -6.2352752685546875, "global_step": 92665, "epoch": 2206} {"train_loss": -6.320003986358643, "global_step": 92666, "epoch": 2206} {"train_loss": -6.233458518981934, "global_step": 92667, "epoch": 2206} {"train_loss": -6.339916229248047, "global_step": 92668, "epoch": 2206} {"train_loss": -6.441742897033691, "global_step": 92669, "epoch": 2206} {"train_loss": -6.3211774826049805, "global_step": 92670, "epoch": 2206} {"train_loss": -6.412165641784668, "global_step": 92671, "epoch": 2206} {"train_loss": -6.319426536560059, "global_step": 92672, "epoch": 2206} {"train_loss": -6.320065498352051, "global_step": 92673, "epoch": 2206} {"train_loss": -6.316371917724609, "global_step": 92674, "epoch": 2206} {"train_loss": -6.186565399169922, "global_step": 92675, "epoch": 2206} {"train_loss": -6.247556209564209, "global_step": 92676, "epoch": 2206} {"train_loss": -6.298568248748779, "global_step": 92677, "epoch": 2206} {"train_loss": -6.3081135749816895, "global_step": 92678, "epoch": 2206} {"train_loss": -6.313398361206055, "global_step": 92679, "epoch": 2206} {"train_loss": -6.264509201049805, "global_step": 92680, "epoch": 2206} {"train_loss": -6.388364791870117, "global_step": 92681, "epoch": 2206} {"train_loss": -6.233280658721924, "global_step": 92682, "epoch": 2206} {"train_loss": -6.244570732116699, "global_step": 92683, "epoch": 2206} {"train_loss": -6.289957046508789, "global_step": 92684, "epoch": 2206} {"train_loss": -6.2248406410217285, "global_step": 92685, "epoch": 2206} {"train_loss": -6.4117279052734375, "global_step": 92686, "epoch": 2206} {"train_loss": -6.257528781890869, "global_step": 92687, "epoch": 2206} {"train_loss": -6.324155330657959, "global_step": 92688, "epoch": 2206} {"train_loss": -6.307041168212891, "global_step": 92689, "epoch": 2206} {"train_loss": -6.27508544921875, "global_step": 92690, "epoch": 2206} {"train_loss": -6.304337024688721, "global_step": 92691, "epoch": 2206} {"train_loss": -6.206273078918457, "global_step": 92692, "epoch": 2206} {"train_loss": -6.291798784619286, "global_step": 92693, "epoch": 2206, "val_loss": 63543.43359375} {"train_loss": -6.337047576904297, "global_step": 92694, "epoch": 2207} {"train_loss": -6.2387847900390625, "global_step": 92695, "epoch": 2207} {"train_loss": -6.255337715148926, "global_step": 92696, "epoch": 2207} {"train_loss": -6.327301025390625, "global_step": 92697, "epoch": 2207} {"train_loss": -6.259907245635986, "global_step": 92698, "epoch": 2207} {"train_loss": -6.171154022216797, "global_step": 92699, "epoch": 2207} {"train_loss": -6.120593547821045, "global_step": 92700, "epoch": 2207} {"train_loss": -6.351004123687744, "global_step": 92701, "epoch": 2207} {"train_loss": -6.329097747802734, "global_step": 92702, "epoch": 2207} {"train_loss": -6.29207706451416, "global_step": 92703, "epoch": 2207} {"train_loss": -6.311898231506348, "global_step": 92704, "epoch": 2207} {"train_loss": -6.282712936401367, "global_step": 92705, "epoch": 2207} {"train_loss": -6.396197319030762, "global_step": 92706, "epoch": 2207} {"train_loss": -6.369542598724365, "global_step": 92707, "epoch": 2207} {"train_loss": -6.373867988586426, "global_step": 92708, "epoch": 2207} {"train_loss": -6.253193378448486, "global_step": 92709, "epoch": 2207} {"train_loss": -6.271150588989258, "global_step": 92710, "epoch": 2207} {"train_loss": -6.241290092468262, "global_step": 92711, "epoch": 2207} {"train_loss": -6.207223892211914, "global_step": 92712, "epoch": 2207} {"train_loss": -6.343465805053711, "global_step": 92713, "epoch": 2207} {"train_loss": -6.29309606552124, "global_step": 92714, "epoch": 2207} {"train_loss": -6.216201305389404, "global_step": 92715, "epoch": 2207} {"train_loss": -6.162450313568115, "global_step": 92716, "epoch": 2207} {"train_loss": -6.212531089782715, "global_step": 92717, "epoch": 2207} {"train_loss": -6.186270236968994, "global_step": 92718, "epoch": 2207} {"train_loss": -6.277105808258057, "global_step": 92719, "epoch": 2207} {"train_loss": -6.191344738006592, "global_step": 92720, "epoch": 2207} {"train_loss": -6.202913761138916, "global_step": 92721, "epoch": 2207} {"train_loss": -6.208268165588379, "global_step": 92722, "epoch": 2207} {"train_loss": -6.286383152008057, "global_step": 92723, "epoch": 2207} {"train_loss": -6.255120277404785, "global_step": 92724, "epoch": 2207} {"train_loss": -6.306293487548828, "global_step": 92725, "epoch": 2207} {"train_loss": -6.1797990798950195, "global_step": 92726, "epoch": 2207} {"train_loss": -6.246507167816162, "global_step": 92727, "epoch": 2207} {"train_loss": -6.246938705444336, "global_step": 92728, "epoch": 2207} {"train_loss": -6.180905818939209, "global_step": 92729, "epoch": 2207} {"train_loss": -6.278757095336914, "global_step": 92730, "epoch": 2207} {"train_loss": -6.281445503234863, "global_step": 92731, "epoch": 2207} {"train_loss": -6.260387420654297, "global_step": 92732, "epoch": 2207} {"train_loss": -6.268834590911865, "global_step": 92733, "epoch": 2207} {"train_loss": -6.301275253295898, "global_step": 92734, "epoch": 2207} {"train_loss": -6.266083478927612, "global_step": 92735, "epoch": 2207, "val_loss": 63241.06640625} {"train_loss": -6.3277435302734375, "global_step": 92736, "epoch": 2208} {"train_loss": -6.171483993530273, "global_step": 92737, "epoch": 2208} {"train_loss": -6.25293493270874, "global_step": 92738, "epoch": 2208} {"train_loss": -6.33766508102417, "global_step": 92739, "epoch": 2208} {"train_loss": -6.44403076171875, "global_step": 92740, "epoch": 2208} {"train_loss": -6.344291687011719, "global_step": 92741, "epoch": 2208} {"train_loss": -6.375171661376953, "global_step": 92742, "epoch": 2208} {"train_loss": -6.229548454284668, "global_step": 92743, "epoch": 2208} {"train_loss": -6.340801239013672, "global_step": 92744, "epoch": 2208} {"train_loss": -6.165323734283447, "global_step": 92745, "epoch": 2208} {"train_loss": -6.234322547912598, "global_step": 92746, "epoch": 2208} {"train_loss": -6.279702186584473, "global_step": 92747, "epoch": 2208} {"train_loss": -6.248340129852295, "global_step": 92748, "epoch": 2208} {"train_loss": -6.219089031219482, "global_step": 92749, "epoch": 2208} {"train_loss": -6.217398643493652, "global_step": 92750, "epoch": 2208} {"train_loss": -6.245571136474609, "global_step": 92751, "epoch": 2208} {"train_loss": -6.273345947265625, "global_step": 92752, "epoch": 2208} {"train_loss": -6.1531572341918945, "global_step": 92753, "epoch": 2208} {"train_loss": -6.207759857177734, "global_step": 92754, "epoch": 2208} {"train_loss": -6.267112731933594, "global_step": 92755, "epoch": 2208} {"train_loss": -6.162503719329834, "global_step": 92756, "epoch": 2208} {"train_loss": -6.205197334289551, "global_step": 92757, "epoch": 2208} {"train_loss": -6.183925628662109, "global_step": 92758, "epoch": 2208} {"train_loss": -6.250456809997559, "global_step": 92759, "epoch": 2208} {"train_loss": -6.1431403160095215, "global_step": 92760, "epoch": 2208} {"train_loss": -6.248610973358154, "global_step": 92761, "epoch": 2208} {"train_loss": -6.147468566894531, "global_step": 92762, "epoch": 2208} {"train_loss": -6.309492111206055, "global_step": 92763, "epoch": 2208} {"train_loss": -6.239957332611084, "global_step": 92764, "epoch": 2208} {"train_loss": -6.306623458862305, "global_step": 92765, "epoch": 2208} {"train_loss": -6.329502105712891, "global_step": 92766, "epoch": 2208} {"train_loss": -6.2290191650390625, "global_step": 92767, "epoch": 2208} {"train_loss": -6.221151351928711, "global_step": 92768, "epoch": 2208} {"train_loss": -6.272505760192871, "global_step": 92769, "epoch": 2208} {"train_loss": -6.2906694412231445, "global_step": 92770, "epoch": 2208} {"train_loss": -6.309476852416992, "global_step": 92771, "epoch": 2208} {"train_loss": -6.287234306335449, "global_step": 92772, "epoch": 2208} {"train_loss": -6.239274024963379, "global_step": 92773, "epoch": 2208} {"train_loss": -6.352456092834473, "global_step": 92774, "epoch": 2208} {"train_loss": -6.271196365356445, "global_step": 92775, "epoch": 2208} {"train_loss": -6.328304290771484, "global_step": 92776, "epoch": 2208} {"train_loss": -6.259351321629116, "global_step": 92777, "epoch": 2208, "val_loss": 63570.81640625} {"train_loss": -6.27060079574585, "global_step": 92778, "epoch": 2209} {"train_loss": -6.30251407623291, "global_step": 92779, "epoch": 2209} {"train_loss": -6.261935234069824, "global_step": 92780, "epoch": 2209} {"train_loss": -6.296600341796875, "global_step": 92781, "epoch": 2209} {"train_loss": -6.310944557189941, "global_step": 92782, "epoch": 2209} {"train_loss": -6.324749946594238, "global_step": 92783, "epoch": 2209} {"train_loss": -6.315827369689941, "global_step": 92784, "epoch": 2209} {"train_loss": -6.270781993865967, "global_step": 92785, "epoch": 2209} {"train_loss": -6.379378795623779, "global_step": 92786, "epoch": 2209} {"train_loss": -6.296854496002197, "global_step": 92787, "epoch": 2209} {"train_loss": -6.232254981994629, "global_step": 92788, "epoch": 2209} {"train_loss": -6.291688919067383, "global_step": 92789, "epoch": 2209} {"train_loss": -6.301774024963379, "global_step": 92790, "epoch": 2209} {"train_loss": -6.345248222351074, "global_step": 92791, "epoch": 2209} {"train_loss": -6.2477240562438965, "global_step": 92792, "epoch": 2209} {"train_loss": -6.3994975090026855, "global_step": 92793, "epoch": 2209} {"train_loss": -6.2145514488220215, "global_step": 92794, "epoch": 2209} {"train_loss": -6.327630043029785, "global_step": 92795, "epoch": 2209} {"train_loss": -6.257859706878662, "global_step": 92796, "epoch": 2209} {"train_loss": -6.32558536529541, "global_step": 92797, "epoch": 2209} {"train_loss": -6.383376121520996, "global_step": 92798, "epoch": 2209} {"train_loss": -6.343405723571777, "global_step": 92799, "epoch": 2209} {"train_loss": -6.332108497619629, "global_step": 92800, "epoch": 2209} {"train_loss": -6.30760383605957, "global_step": 92801, "epoch": 2209} {"train_loss": -6.299981117248535, "global_step": 92802, "epoch": 2209} {"train_loss": -6.284587860107422, "global_step": 92803, "epoch": 2209} {"train_loss": -6.362204551696777, "global_step": 92804, "epoch": 2209} {"train_loss": -6.226720333099365, "global_step": 92805, "epoch": 2209} {"train_loss": -6.369776725769043, "global_step": 92806, "epoch": 2209} {"train_loss": -6.271656513214111, "global_step": 92807, "epoch": 2209} {"train_loss": -6.231508255004883, "global_step": 92808, "epoch": 2209} {"train_loss": -6.287034511566162, "global_step": 92809, "epoch": 2209} {"train_loss": -6.106801986694336, "global_step": 92810, "epoch": 2209} {"train_loss": -6.215211868286133, "global_step": 92811, "epoch": 2209} {"train_loss": -6.206075668334961, "global_step": 92812, "epoch": 2209} {"train_loss": -6.344789028167725, "global_step": 92813, "epoch": 2209} {"train_loss": -6.237721920013428, "global_step": 92814, "epoch": 2209} {"train_loss": -6.280930519104004, "global_step": 92815, "epoch": 2209} {"train_loss": -6.250493049621582, "global_step": 92816, "epoch": 2209} {"train_loss": -6.380914211273193, "global_step": 92817, "epoch": 2209} {"train_loss": -6.206685543060303, "global_step": 92818, "epoch": 2209} {"train_loss": -6.290962605249314, "global_step": 92819, "epoch": 2209, "val_loss": 63409.8359375} {"train_loss": -6.185003280639648, "global_step": 92820, "epoch": 2210} {"train_loss": -6.324419975280762, "global_step": 92821, "epoch": 2210} {"train_loss": -6.283022880554199, "global_step": 92822, "epoch": 2210} {"train_loss": -6.36093807220459, "global_step": 92823, "epoch": 2210} {"train_loss": -6.243137836456299, "global_step": 92824, "epoch": 2210} {"train_loss": -6.219028472900391, "global_step": 92825, "epoch": 2210} {"train_loss": -6.350388526916504, "global_step": 92826, "epoch": 2210} {"train_loss": -6.228773593902588, "global_step": 92827, "epoch": 2210} {"train_loss": -6.332851409912109, "global_step": 92828, "epoch": 2210} {"train_loss": -6.340280532836914, "global_step": 92829, "epoch": 2210} {"train_loss": -6.211726188659668, "global_step": 92830, "epoch": 2210} {"train_loss": -6.250083923339844, "global_step": 92831, "epoch": 2210} {"train_loss": -6.141427516937256, "global_step": 92832, "epoch": 2210} {"train_loss": -6.2129974365234375, "global_step": 92833, "epoch": 2210} {"train_loss": -6.171483993530273, "global_step": 92834, "epoch": 2210} {"train_loss": -6.1929497718811035, "global_step": 92835, "epoch": 2210} {"train_loss": -6.30567741394043, "global_step": 92836, "epoch": 2210} {"train_loss": -6.244900703430176, "global_step": 92837, "epoch": 2210} {"train_loss": -6.269266128540039, "global_step": 92838, "epoch": 2210} {"train_loss": -6.210865020751953, "global_step": 92839, "epoch": 2210} {"train_loss": -6.149388313293457, "global_step": 92840, "epoch": 2210} {"train_loss": -6.248640537261963, "global_step": 92841, "epoch": 2210} {"train_loss": -6.221426010131836, "global_step": 92842, "epoch": 2210} {"train_loss": -6.22507381439209, "global_step": 92843, "epoch": 2210} {"train_loss": -6.316242694854736, "global_step": 92844, "epoch": 2210} {"train_loss": -6.308650016784668, "global_step": 92845, "epoch": 2210} {"train_loss": -6.295799255371094, "global_step": 92846, "epoch": 2210} {"train_loss": -6.377768516540527, "global_step": 92847, "epoch": 2210} {"train_loss": -6.231549263000488, "global_step": 92848, "epoch": 2210} {"train_loss": -6.367351055145264, "global_step": 92849, "epoch": 2210} {"train_loss": -6.239850997924805, "global_step": 92850, "epoch": 2210} {"train_loss": -6.321996212005615, "global_step": 92851, "epoch": 2210} {"train_loss": -6.299581527709961, "global_step": 92852, "epoch": 2210} {"train_loss": -6.243563652038574, "global_step": 92853, "epoch": 2210} {"train_loss": -6.355226039886475, "global_step": 92854, "epoch": 2210} {"train_loss": -6.479623317718506, "global_step": 92855, "epoch": 2210} {"train_loss": -6.363249778747559, "global_step": 92856, "epoch": 2210} {"train_loss": -6.305512428283691, "global_step": 92857, "epoch": 2210} {"train_loss": -6.318864822387695, "global_step": 92858, "epoch": 2210} {"train_loss": -6.218132495880127, "global_step": 92859, "epoch": 2210} {"train_loss": -6.377909183502197, "global_step": 92860, "epoch": 2210} {"train_loss": -6.279603538059053, "global_step": 92861, "epoch": 2210, "val_loss": 63428.72265625} {"train_loss": -6.371580123901367, "global_step": 92862, "epoch": 2211} {"train_loss": -6.340606689453125, "global_step": 92863, "epoch": 2211} {"train_loss": -6.235835552215576, "global_step": 92864, "epoch": 2211} {"train_loss": -6.3792619705200195, "global_step": 92865, "epoch": 2211} {"train_loss": -6.291309356689453, "global_step": 92866, "epoch": 2211} {"train_loss": -6.288995265960693, "global_step": 92867, "epoch": 2211} {"train_loss": -6.328539848327637, "global_step": 92868, "epoch": 2211} {"train_loss": -6.348995208740234, "global_step": 92869, "epoch": 2211} {"train_loss": -6.377101898193359, "global_step": 92870, "epoch": 2211} {"train_loss": -6.389926433563232, "global_step": 92871, "epoch": 2211} {"train_loss": -6.267849922180176, "global_step": 92872, "epoch": 2211} {"train_loss": -6.374187469482422, "global_step": 92873, "epoch": 2211} {"train_loss": -6.263995170593262, "global_step": 92874, "epoch": 2211} {"train_loss": -6.314494609832764, "global_step": 92875, "epoch": 2211} {"train_loss": -6.380044460296631, "global_step": 92876, "epoch": 2211} {"train_loss": -6.294077396392822, "global_step": 92877, "epoch": 2211} {"train_loss": -6.379753589630127, "global_step": 92878, "epoch": 2211} {"train_loss": -6.33249044418335, "global_step": 92879, "epoch": 2211} {"train_loss": -6.17808723449707, "global_step": 92880, "epoch": 2211} {"train_loss": -6.310740947723389, "global_step": 92881, "epoch": 2211} {"train_loss": -6.272271633148193, "global_step": 92882, "epoch": 2211} {"train_loss": -6.174873352050781, "global_step": 92883, "epoch": 2211} {"train_loss": -6.368078231811523, "global_step": 92884, "epoch": 2211} {"train_loss": -6.187195777893066, "global_step": 92885, "epoch": 2211} {"train_loss": -6.43623161315918, "global_step": 92886, "epoch": 2211} {"train_loss": -6.40554666519165, "global_step": 92887, "epoch": 2211} {"train_loss": -6.318642616271973, "global_step": 92888, "epoch": 2211} {"train_loss": -6.270895957946777, "global_step": 92889, "epoch": 2211} {"train_loss": -6.161398887634277, "global_step": 92890, "epoch": 2211} {"train_loss": -6.2723894119262695, "global_step": 92891, "epoch": 2211} {"train_loss": -6.330377578735352, "global_step": 92892, "epoch": 2211} {"train_loss": -6.307643890380859, "global_step": 92893, "epoch": 2211} {"train_loss": -6.315262794494629, "global_step": 92894, "epoch": 2211} {"train_loss": -6.428426742553711, "global_step": 92895, "epoch": 2211} {"train_loss": -6.146882057189941, "global_step": 92896, "epoch": 2211} {"train_loss": -6.21727991104126, "global_step": 92897, "epoch": 2211} {"train_loss": -6.384772300720215, "global_step": 92898, "epoch": 2211} {"train_loss": -6.331786155700684, "global_step": 92899, "epoch": 2211} {"train_loss": -6.2860188484191895, "global_step": 92900, "epoch": 2211} {"train_loss": -6.312273979187012, "global_step": 92901, "epoch": 2211} {"train_loss": -6.293842315673828, "global_step": 92902, "epoch": 2211} {"train_loss": -6.312672762643723, "global_step": 92903, "epoch": 2211, "val_loss": 63357.00390625} {"train_loss": -6.2550153732299805, "global_step": 92904, "epoch": 2212} {"train_loss": -6.183658123016357, "global_step": 92905, "epoch": 2212} {"train_loss": -6.418332576751709, "global_step": 92906, "epoch": 2212} {"train_loss": -6.297869682312012, "global_step": 92907, "epoch": 2212} {"train_loss": -6.312127113342285, "global_step": 92908, "epoch": 2212} {"train_loss": -6.219764709472656, "global_step": 92909, "epoch": 2212} {"train_loss": -6.364691734313965, "global_step": 92910, "epoch": 2212} {"train_loss": -6.1408843994140625, "global_step": 92911, "epoch": 2212} {"train_loss": -6.345157623291016, "global_step": 92912, "epoch": 2212} {"train_loss": -6.0815229415893555, "global_step": 92913, "epoch": 2212} {"train_loss": -6.290634632110596, "global_step": 92914, "epoch": 2212} {"train_loss": -6.334097862243652, "global_step": 92915, "epoch": 2212} {"train_loss": -6.288986682891846, "global_step": 92916, "epoch": 2212} {"train_loss": -6.225236415863037, "global_step": 92917, "epoch": 2212} {"train_loss": -6.410196781158447, "global_step": 92918, "epoch": 2212} {"train_loss": -6.241433143615723, "global_step": 92919, "epoch": 2212} {"train_loss": -6.208972454071045, "global_step": 92920, "epoch": 2212} {"train_loss": -6.300395488739014, "global_step": 92921, "epoch": 2212} {"train_loss": -6.220990180969238, "global_step": 92922, "epoch": 2212} {"train_loss": -6.188508033752441, "global_step": 92923, "epoch": 2212} {"train_loss": -6.367928981781006, "global_step": 92924, "epoch": 2212} {"train_loss": -6.185852527618408, "global_step": 92925, "epoch": 2212} {"train_loss": -6.247488021850586, "global_step": 92926, "epoch": 2212} {"train_loss": -6.214029788970947, "global_step": 92927, "epoch": 2212} {"train_loss": -6.331377029418945, "global_step": 92928, "epoch": 2212} {"train_loss": -6.286669731140137, "global_step": 92929, "epoch": 2212} {"train_loss": -6.222372055053711, "global_step": 92930, "epoch": 2212} {"train_loss": -6.236516952514648, "global_step": 92931, "epoch": 2212} {"train_loss": -6.24901008605957, "global_step": 92932, "epoch": 2212} {"train_loss": -6.167860984802246, "global_step": 92933, "epoch": 2212} {"train_loss": -6.203062057495117, "global_step": 92934, "epoch": 2212} {"train_loss": -6.441461086273193, "global_step": 92935, "epoch": 2212} {"train_loss": -6.343209266662598, "global_step": 92936, "epoch": 2212} {"train_loss": -6.437071800231934, "global_step": 92937, "epoch": 2212} {"train_loss": -6.1941938400268555, "global_step": 92938, "epoch": 2212} {"train_loss": -6.2375030517578125, "global_step": 92939, "epoch": 2212} {"train_loss": -6.320436477661133, "global_step": 92940, "epoch": 2212} {"train_loss": -6.311714172363281, "global_step": 92941, "epoch": 2212} {"train_loss": -6.280828475952148, "global_step": 92942, "epoch": 2212} {"train_loss": -6.433215141296387, "global_step": 92943, "epoch": 2212} {"train_loss": -6.288774013519287, "global_step": 92944, "epoch": 2212} {"train_loss": -6.274568273907616, "global_step": 92945, "epoch": 2212, "val_loss": 63237.07421875} {"train_loss": -6.306547164916992, "global_step": 92946, "epoch": 2213} {"train_loss": -6.145895004272461, "global_step": 92947, "epoch": 2213} {"train_loss": -6.2351884841918945, "global_step": 92948, "epoch": 2213} {"train_loss": -6.319708824157715, "global_step": 92949, "epoch": 2213} {"train_loss": -6.259988784790039, "global_step": 92950, "epoch": 2213} {"train_loss": -6.128273963928223, "global_step": 92951, "epoch": 2213} {"train_loss": -6.370555400848389, "global_step": 92952, "epoch": 2213} {"train_loss": -6.26845645904541, "global_step": 92953, "epoch": 2213} {"train_loss": -6.237919807434082, "global_step": 92954, "epoch": 2213} {"train_loss": -6.274906635284424, "global_step": 92955, "epoch": 2213} {"train_loss": -6.108497142791748, "global_step": 92956, "epoch": 2213} {"train_loss": -6.356605529785156, "global_step": 92957, "epoch": 2213} {"train_loss": -6.225104331970215, "global_step": 92958, "epoch": 2213} {"train_loss": -6.224187850952148, "global_step": 92959, "epoch": 2213} {"train_loss": -6.279438018798828, "global_step": 92960, "epoch": 2213} {"train_loss": -6.16497802734375, "global_step": 92961, "epoch": 2213} {"train_loss": -6.336132049560547, "global_step": 92962, "epoch": 2213} {"train_loss": -6.208171844482422, "global_step": 92963, "epoch": 2213} {"train_loss": -6.302403450012207, "global_step": 92964, "epoch": 2213} {"train_loss": -6.171560287475586, "global_step": 92965, "epoch": 2213} {"train_loss": -6.378548622131348, "global_step": 92966, "epoch": 2213} {"train_loss": -6.305588722229004, "global_step": 92967, "epoch": 2213} {"train_loss": -6.292930603027344, "global_step": 92968, "epoch": 2213} {"train_loss": -6.233561038970947, "global_step": 92969, "epoch": 2213} {"train_loss": -6.292586326599121, "global_step": 92970, "epoch": 2213} {"train_loss": -6.336172103881836, "global_step": 92971, "epoch": 2213} {"train_loss": -6.172671318054199, "global_step": 92972, "epoch": 2213} {"train_loss": -6.1553730964660645, "global_step": 92973, "epoch": 2213} {"train_loss": -6.209774494171143, "global_step": 92974, "epoch": 2213} {"train_loss": -6.1958327293396, "global_step": 92975, "epoch": 2213} {"train_loss": -6.374847888946533, "global_step": 92976, "epoch": 2213} {"train_loss": -6.333741188049316, "global_step": 92977, "epoch": 2213} {"train_loss": -6.254472732543945, "global_step": 92978, "epoch": 2213} {"train_loss": -6.315181732177734, "global_step": 92979, "epoch": 2213} {"train_loss": -6.1300811767578125, "global_step": 92980, "epoch": 2213} {"train_loss": -6.356110572814941, "global_step": 92981, "epoch": 2213} {"train_loss": -6.33502197265625, "global_step": 92982, "epoch": 2213} {"train_loss": -6.291695594787598, "global_step": 92983, "epoch": 2213} {"train_loss": -6.322299957275391, "global_step": 92984, "epoch": 2213} {"train_loss": -6.201021194458008, "global_step": 92985, "epoch": 2213} {"train_loss": -6.3051300048828125, "global_step": 92986, "epoch": 2213} {"train_loss": -6.2605171998341875, "global_step": 92987, "epoch": 2213, "val_loss": 63420.90234375} {"train_loss": -6.136418342590332, "global_step": 92988, "epoch": 2214} {"train_loss": -6.355628967285156, "global_step": 92989, "epoch": 2214} {"train_loss": -6.198917388916016, "global_step": 92990, "epoch": 2214} {"train_loss": -6.229079246520996, "global_step": 92991, "epoch": 2214} {"train_loss": -6.083668231964111, "global_step": 92992, "epoch": 2214} {"train_loss": -6.326314449310303, "global_step": 92993, "epoch": 2214} {"train_loss": -6.125748634338379, "global_step": 92994, "epoch": 2214} {"train_loss": -6.211492538452148, "global_step": 92995, "epoch": 2214} {"train_loss": -6.318492889404297, "global_step": 92996, "epoch": 2214} {"train_loss": -6.251471042633057, "global_step": 92997, "epoch": 2214} {"train_loss": -6.276989936828613, "global_step": 92998, "epoch": 2214} {"train_loss": -6.148794174194336, "global_step": 92999, "epoch": 2214} {"train_loss": -6.2136616706848145, "global_step": 93000, "epoch": 2214} {"train_loss": -6.298340797424316, "global_step": 93001, "epoch": 2214} {"train_loss": -6.299522399902344, "global_step": 93002, "epoch": 2214} {"train_loss": -6.303746700286865, "global_step": 93003, "epoch": 2214} {"train_loss": -6.255943298339844, "global_step": 93004, "epoch": 2214} {"train_loss": -6.452639579772949, "global_step": 93005, "epoch": 2214} {"train_loss": -6.3981781005859375, "global_step": 93006, "epoch": 2214} {"train_loss": -6.394626617431641, "global_step": 93007, "epoch": 2214} {"train_loss": -6.216712951660156, "global_step": 93008, "epoch": 2214} {"train_loss": -6.376105308532715, "global_step": 93009, "epoch": 2214} {"train_loss": -6.312923431396484, "global_step": 93010, "epoch": 2214} {"train_loss": -6.212951183319092, "global_step": 93011, "epoch": 2214} {"train_loss": -6.356734275817871, "global_step": 93012, "epoch": 2214} {"train_loss": -6.3041839599609375, "global_step": 93013, "epoch": 2214} {"train_loss": -6.338646411895752, "global_step": 93014, "epoch": 2214} {"train_loss": -6.4005842208862305, "global_step": 93015, "epoch": 2214} {"train_loss": -6.313923358917236, "global_step": 93016, "epoch": 2214} {"train_loss": -6.357748985290527, "global_step": 93017, "epoch": 2214} {"train_loss": -6.231080532073975, "global_step": 93018, "epoch": 2214} {"train_loss": -6.235726833343506, "global_step": 93019, "epoch": 2214} {"train_loss": -6.246199607849121, "global_step": 93020, "epoch": 2214} {"train_loss": -6.2857465744018555, "global_step": 93021, "epoch": 2214} {"train_loss": -6.25919246673584, "global_step": 93022, "epoch": 2214} {"train_loss": -6.439267158508301, "global_step": 93023, "epoch": 2214} {"train_loss": -6.229765892028809, "global_step": 93024, "epoch": 2214} {"train_loss": -6.214054107666016, "global_step": 93025, "epoch": 2214} {"train_loss": -6.433367729187012, "global_step": 93026, "epoch": 2214} {"train_loss": -6.351204872131348, "global_step": 93027, "epoch": 2214} {"train_loss": -6.284309387207031, "global_step": 93028, "epoch": 2214} {"train_loss": -6.2867747488475985, "global_step": 93029, "epoch": 2214, "val_loss": 63783.8671875} {"train_loss": -6.217985153198242, "global_step": 93030, "epoch": 2215} {"train_loss": -6.211736679077148, "global_step": 93031, "epoch": 2215} {"train_loss": -6.222921371459961, "global_step": 93032, "epoch": 2215} {"train_loss": -6.24289608001709, "global_step": 93033, "epoch": 2215} {"train_loss": -6.312884330749512, "global_step": 93034, "epoch": 2215} {"train_loss": -6.2891035079956055, "global_step": 93035, "epoch": 2215} {"train_loss": -6.428505897521973, "global_step": 93036, "epoch": 2215} {"train_loss": -6.249884605407715, "global_step": 93037, "epoch": 2215} {"train_loss": -6.219710350036621, "global_step": 93038, "epoch": 2215} {"train_loss": -6.381012916564941, "global_step": 93039, "epoch": 2215} {"train_loss": -6.222749710083008, "global_step": 93040, "epoch": 2215} {"train_loss": -6.242989540100098, "global_step": 93041, "epoch": 2215} {"train_loss": -6.353734016418457, "global_step": 93042, "epoch": 2215} {"train_loss": -6.33534049987793, "global_step": 93043, "epoch": 2215} {"train_loss": -6.33116340637207, "global_step": 93044, "epoch": 2215} {"train_loss": -6.221858024597168, "global_step": 93045, "epoch": 2215} {"train_loss": -6.349183082580566, "global_step": 93046, "epoch": 2215} {"train_loss": -6.211693286895752, "global_step": 93047, "epoch": 2215} {"train_loss": -6.325126647949219, "global_step": 93048, "epoch": 2215} {"train_loss": -6.205172538757324, "global_step": 93049, "epoch": 2215} {"train_loss": -6.335644721984863, "global_step": 93050, "epoch": 2215} {"train_loss": -6.217517852783203, "global_step": 93051, "epoch": 2215} {"train_loss": -6.1907477378845215, "global_step": 93052, "epoch": 2215} {"train_loss": -6.2664337158203125, "global_step": 93053, "epoch": 2215} {"train_loss": -6.281791687011719, "global_step": 93054, "epoch": 2215} {"train_loss": -6.3459343910217285, "global_step": 93055, "epoch": 2215} {"train_loss": -6.201803207397461, "global_step": 93056, "epoch": 2215} {"train_loss": -6.173613548278809, "global_step": 93057, "epoch": 2215} {"train_loss": -6.232781410217285, "global_step": 93058, "epoch": 2215} {"train_loss": -6.279847621917725, "global_step": 93059, "epoch": 2215} {"train_loss": -6.293247222900391, "global_step": 93060, "epoch": 2215} {"train_loss": -6.243537902832031, "global_step": 93061, "epoch": 2215} {"train_loss": -6.348714351654053, "global_step": 93062, "epoch": 2215} {"train_loss": -6.287933826446533, "global_step": 93063, "epoch": 2215} {"train_loss": -6.259285926818848, "global_step": 93064, "epoch": 2215} {"train_loss": -6.25843620300293, "global_step": 93065, "epoch": 2215} {"train_loss": -6.280292987823486, "global_step": 93066, "epoch": 2215} {"train_loss": -6.214484691619873, "global_step": 93067, "epoch": 2215} {"train_loss": -6.268316268920898, "global_step": 93068, "epoch": 2215} {"train_loss": -6.274411678314209, "global_step": 93069, "epoch": 2215} {"train_loss": -6.275585651397705, "global_step": 93070, "epoch": 2215} {"train_loss": -6.270962681089129, "global_step": 93071, "epoch": 2215, "val_loss": 63584.15234375} {"train_loss": -6.377620220184326, "global_step": 93072, "epoch": 2216} {"train_loss": -6.209205627441406, "global_step": 93073, "epoch": 2216} {"train_loss": -6.327627658843994, "global_step": 93074, "epoch": 2216} {"train_loss": -6.27983283996582, "global_step": 93075, "epoch": 2216} {"train_loss": -6.263840675354004, "global_step": 93076, "epoch": 2216} {"train_loss": -6.362420082092285, "global_step": 93077, "epoch": 2216} {"train_loss": -6.25272274017334, "global_step": 93078, "epoch": 2216} {"train_loss": -6.266322135925293, "global_step": 93079, "epoch": 2216} {"train_loss": -6.368825912475586, "global_step": 93080, "epoch": 2216} {"train_loss": -6.264836311340332, "global_step": 93081, "epoch": 2216} {"train_loss": -6.4236836433410645, "global_step": 93082, "epoch": 2216} {"train_loss": -6.412219524383545, "global_step": 93083, "epoch": 2216} {"train_loss": -6.323512077331543, "global_step": 93084, "epoch": 2216} {"train_loss": -6.2499260902404785, "global_step": 93085, "epoch": 2216} {"train_loss": -6.256711483001709, "global_step": 93086, "epoch": 2216} {"train_loss": -6.336429119110107, "global_step": 93087, "epoch": 2216} {"train_loss": -6.255199432373047, "global_step": 93088, "epoch": 2216} {"train_loss": -6.345368385314941, "global_step": 93089, "epoch": 2216} {"train_loss": -6.343841552734375, "global_step": 93090, "epoch": 2216} {"train_loss": -6.417458534240723, "global_step": 93091, "epoch": 2216} {"train_loss": -6.315134048461914, "global_step": 93092, "epoch": 2216} {"train_loss": -6.177175521850586, "global_step": 93093, "epoch": 2216} {"train_loss": -6.370420455932617, "global_step": 93094, "epoch": 2216} {"train_loss": -6.336425304412842, "global_step": 93095, "epoch": 2216} {"train_loss": -6.309128761291504, "global_step": 93096, "epoch": 2216} {"train_loss": -6.3827409744262695, "global_step": 93097, "epoch": 2216} {"train_loss": -6.268573760986328, "global_step": 93098, "epoch": 2216} {"train_loss": -6.415923118591309, "global_step": 93099, "epoch": 2216} {"train_loss": -6.243317604064941, "global_step": 93100, "epoch": 2216} {"train_loss": -6.364394187927246, "global_step": 93101, "epoch": 2216} {"train_loss": -6.254810333251953, "global_step": 93102, "epoch": 2216} {"train_loss": -6.382532119750977, "global_step": 93103, "epoch": 2216} {"train_loss": -6.253935813903809, "global_step": 93104, "epoch": 2216} {"train_loss": -6.290450096130371, "global_step": 93105, "epoch": 2216} {"train_loss": -6.303609371185303, "global_step": 93106, "epoch": 2216} {"train_loss": -6.345759391784668, "global_step": 93107, "epoch": 2216} {"train_loss": -6.256732940673828, "global_step": 93108, "epoch": 2216} {"train_loss": -6.278676986694336, "global_step": 93109, "epoch": 2216} {"train_loss": -6.3302483558654785, "global_step": 93110, "epoch": 2216} {"train_loss": -6.408336639404297, "global_step": 93111, "epoch": 2216} {"train_loss": -6.376668930053711, "global_step": 93112, "epoch": 2216} {"train_loss": -6.316189970288958, "global_step": 93113, "epoch": 2216, "val_loss": 63304.22265625} {"train_loss": -6.289626121520996, "global_step": 93114, "epoch": 2217} {"train_loss": -6.456146717071533, "global_step": 93115, "epoch": 2217} {"train_loss": -6.320686340332031, "global_step": 93116, "epoch": 2217} {"train_loss": -6.404561996459961, "global_step": 93117, "epoch": 2217} {"train_loss": -6.205995559692383, "global_step": 93118, "epoch": 2217} {"train_loss": -6.249131202697754, "global_step": 93119, "epoch": 2217} {"train_loss": -6.419733047485352, "global_step": 93120, "epoch": 2217} {"train_loss": -6.351320266723633, "global_step": 93121, "epoch": 2217} {"train_loss": -6.2568039894104, "global_step": 93122, "epoch": 2217} {"train_loss": -6.161075115203857, "global_step": 93123, "epoch": 2217} {"train_loss": -6.0715250968933105, "global_step": 93124, "epoch": 2217} {"train_loss": -6.243021011352539, "global_step": 93125, "epoch": 2217} {"train_loss": -6.131957054138184, "global_step": 93126, "epoch": 2217} {"train_loss": -6.101712226867676, "global_step": 93127, "epoch": 2217} {"train_loss": -6.261981964111328, "global_step": 93128, "epoch": 2217} {"train_loss": -6.339172840118408, "global_step": 93129, "epoch": 2217} {"train_loss": -6.222698211669922, "global_step": 93130, "epoch": 2217} {"train_loss": -6.452485084533691, "global_step": 93131, "epoch": 2217} {"train_loss": -6.196725845336914, "global_step": 93132, "epoch": 2217} {"train_loss": -6.352053642272949, "global_step": 93133, "epoch": 2217} {"train_loss": -6.219901084899902, "global_step": 93134, "epoch": 2217} {"train_loss": -6.259703159332275, "global_step": 93135, "epoch": 2217} {"train_loss": -6.282701015472412, "global_step": 93136, "epoch": 2217} {"train_loss": -6.2320661544799805, "global_step": 93137, "epoch": 2217} {"train_loss": -6.297158241271973, "global_step": 93138, "epoch": 2217} {"train_loss": -6.225771903991699, "global_step": 93139, "epoch": 2217} {"train_loss": -6.415389060974121, "global_step": 93140, "epoch": 2217} {"train_loss": -6.2503790855407715, "global_step": 93141, "epoch": 2217} {"train_loss": -6.212652206420898, "global_step": 93142, "epoch": 2217} {"train_loss": -6.245561122894287, "global_step": 93143, "epoch": 2217} {"train_loss": -6.198851585388184, "global_step": 93144, "epoch": 2217} {"train_loss": -6.2072882652282715, "global_step": 93145, "epoch": 2217} {"train_loss": -6.255467414855957, "global_step": 93146, "epoch": 2217} {"train_loss": -6.274610996246338, "global_step": 93147, "epoch": 2217} {"train_loss": -6.192906379699707, "global_step": 93148, "epoch": 2217} {"train_loss": -6.180283546447754, "global_step": 93149, "epoch": 2217} {"train_loss": -6.263311386108398, "global_step": 93150, "epoch": 2217} {"train_loss": -6.290253639221191, "global_step": 93151, "epoch": 2217} {"train_loss": -6.249482154846191, "global_step": 93152, "epoch": 2217} {"train_loss": -6.296093940734863, "global_step": 93153, "epoch": 2217} {"train_loss": -6.30059814453125, "global_step": 93154, "epoch": 2217} {"train_loss": -6.263514007840838, "global_step": 93155, "epoch": 2217, "val_loss": 63307.953125} {"train_loss": -6.333026885986328, "global_step": 93156, "epoch": 2218} {"train_loss": -6.209468364715576, "global_step": 93157, "epoch": 2218} {"train_loss": -6.315609455108643, "global_step": 93158, "epoch": 2218} {"train_loss": -6.2148237228393555, "global_step": 93159, "epoch": 2218} {"train_loss": -6.319512367248535, "global_step": 93160, "epoch": 2218} {"train_loss": -6.333215713500977, "global_step": 93161, "epoch": 2218} {"train_loss": -6.164094924926758, "global_step": 93162, "epoch": 2218} {"train_loss": -6.375580787658691, "global_step": 93163, "epoch": 2218} {"train_loss": -6.421667575836182, "global_step": 93164, "epoch": 2218} {"train_loss": -6.215096473693848, "global_step": 93165, "epoch": 2218} {"train_loss": -6.286873817443848, "global_step": 93166, "epoch": 2218} {"train_loss": -6.246184349060059, "global_step": 93167, "epoch": 2218} {"train_loss": -6.3656768798828125, "global_step": 93168, "epoch": 2218} {"train_loss": -6.368556976318359, "global_step": 93169, "epoch": 2218} {"train_loss": -6.298776149749756, "global_step": 93170, "epoch": 2218} {"train_loss": -6.273062705993652, "global_step": 93171, "epoch": 2218} {"train_loss": -6.2109222412109375, "global_step": 93172, "epoch": 2218} {"train_loss": -6.42233943939209, "global_step": 93173, "epoch": 2218} {"train_loss": -6.2442121505737305, "global_step": 93174, "epoch": 2218} {"train_loss": -6.392409324645996, "global_step": 93175, "epoch": 2218} {"train_loss": -6.377708435058594, "global_step": 93176, "epoch": 2218} {"train_loss": -6.312495231628418, "global_step": 93177, "epoch": 2218} {"train_loss": -6.3437981605529785, "global_step": 93178, "epoch": 2218} {"train_loss": -6.33936882019043, "global_step": 93179, "epoch": 2218} {"train_loss": -6.397095680236816, "global_step": 93180, "epoch": 2218} {"train_loss": -6.350671768188477, "global_step": 93181, "epoch": 2218} {"train_loss": -6.361766815185547, "global_step": 93182, "epoch": 2218} {"train_loss": -6.2568464279174805, "global_step": 93183, "epoch": 2218} {"train_loss": -6.334743499755859, "global_step": 93184, "epoch": 2218} {"train_loss": -6.333008766174316, "global_step": 93185, "epoch": 2218} {"train_loss": -6.235638618469238, "global_step": 93186, "epoch": 2218} {"train_loss": -6.142169952392578, "global_step": 93187, "epoch": 2218} {"train_loss": -6.367525100708008, "global_step": 93188, "epoch": 2218} {"train_loss": -6.21660852432251, "global_step": 93189, "epoch": 2218} {"train_loss": -6.192705154418945, "global_step": 93190, "epoch": 2218} {"train_loss": -6.354075908660889, "global_step": 93191, "epoch": 2218} {"train_loss": -6.164801120758057, "global_step": 93192, "epoch": 2218} {"train_loss": -6.383796691894531, "global_step": 93193, "epoch": 2218} {"train_loss": -6.319990158081055, "global_step": 93194, "epoch": 2218} {"train_loss": -6.201735973358154, "global_step": 93195, "epoch": 2218} {"train_loss": -6.356499671936035, "global_step": 93196, "epoch": 2218} {"train_loss": -6.3004012789045065, "global_step": 93197, "epoch": 2218, "val_loss": 63450.7890625} {"train_loss": -6.32534122467041, "global_step": 93198, "epoch": 2219} {"train_loss": -6.198826789855957, "global_step": 93199, "epoch": 2219} {"train_loss": -6.215670585632324, "global_step": 93200, "epoch": 2219} {"train_loss": -6.230338096618652, "global_step": 93201, "epoch": 2219} {"train_loss": -6.272021770477295, "global_step": 93202, "epoch": 2219} {"train_loss": -6.309598922729492, "global_step": 93203, "epoch": 2219} {"train_loss": -6.319236755371094, "global_step": 93204, "epoch": 2219} {"train_loss": -6.300199508666992, "global_step": 93205, "epoch": 2219} {"train_loss": -6.336718559265137, "global_step": 93206, "epoch": 2219} {"train_loss": -6.310002326965332, "global_step": 93207, "epoch": 2219} {"train_loss": -6.172971248626709, "global_step": 93208, "epoch": 2219} {"train_loss": -6.193121910095215, "global_step": 93209, "epoch": 2219} {"train_loss": -6.304340362548828, "global_step": 93210, "epoch": 2219} {"train_loss": -6.34562873840332, "global_step": 93211, "epoch": 2219} {"train_loss": -6.32327938079834, "global_step": 93212, "epoch": 2219} {"train_loss": -6.263730049133301, "global_step": 93213, "epoch": 2219} {"train_loss": -6.2828569412231445, "global_step": 93214, "epoch": 2219} {"train_loss": -6.312567710876465, "global_step": 93215, "epoch": 2219} {"train_loss": -6.412187576293945, "global_step": 93216, "epoch": 2219} {"train_loss": -6.335133075714111, "global_step": 93217, "epoch": 2219} {"train_loss": -6.374824523925781, "global_step": 93218, "epoch": 2219} {"train_loss": -6.481595516204834, "global_step": 93219, "epoch": 2219} {"train_loss": -6.221673011779785, "global_step": 93220, "epoch": 2219} {"train_loss": -6.3831281661987305, "global_step": 93221, "epoch": 2219} {"train_loss": -6.385673999786377, "global_step": 93222, "epoch": 2219} {"train_loss": -6.4388322830200195, "global_step": 93223, "epoch": 2219} {"train_loss": -6.278326511383057, "global_step": 93224, "epoch": 2219} {"train_loss": -6.301485538482666, "global_step": 93225, "epoch": 2219} {"train_loss": -6.213974952697754, "global_step": 93226, "epoch": 2219} {"train_loss": -6.354836463928223, "global_step": 93227, "epoch": 2219} {"train_loss": -6.184369087219238, "global_step": 93228, "epoch": 2219} {"train_loss": -6.284793376922607, "global_step": 93229, "epoch": 2219} {"train_loss": -6.369830131530762, "global_step": 93230, "epoch": 2219} {"train_loss": -6.22994327545166, "global_step": 93231, "epoch": 2219} {"train_loss": -6.38431453704834, "global_step": 93232, "epoch": 2219} {"train_loss": -6.302756309509277, "global_step": 93233, "epoch": 2219} {"train_loss": -6.241294860839844, "global_step": 93234, "epoch": 2219} {"train_loss": -6.269557952880859, "global_step": 93235, "epoch": 2219} {"train_loss": -6.196258544921875, "global_step": 93236, "epoch": 2219} {"train_loss": -6.360653877258301, "global_step": 93237, "epoch": 2219} {"train_loss": -6.304694652557373, "global_step": 93238, "epoch": 2219} {"train_loss": -6.299713747841971, "global_step": 93239, "epoch": 2219, "val_loss": 63540.0078125} {"train_loss": -6.148013114929199, "global_step": 93240, "epoch": 2220} {"train_loss": -6.268893241882324, "global_step": 93241, "epoch": 2220} {"train_loss": -6.314796447753906, "global_step": 93242, "epoch": 2220} {"train_loss": -6.307121753692627, "global_step": 93243, "epoch": 2220} {"train_loss": -6.337313652038574, "global_step": 93244, "epoch": 2220} {"train_loss": -6.277498245239258, "global_step": 93245, "epoch": 2220} {"train_loss": -6.225284576416016, "global_step": 93246, "epoch": 2220} {"train_loss": -6.395359516143799, "global_step": 93247, "epoch": 2220} {"train_loss": -6.305069923400879, "global_step": 93248, "epoch": 2220} {"train_loss": -6.432326316833496, "global_step": 93249, "epoch": 2220} {"train_loss": -6.462252616882324, "global_step": 93250, "epoch": 2220} {"train_loss": -6.267683982849121, "global_step": 93251, "epoch": 2220} {"train_loss": -6.431708335876465, "global_step": 93252, "epoch": 2220} {"train_loss": -6.230429172515869, "global_step": 93253, "epoch": 2220} {"train_loss": -6.232669830322266, "global_step": 93254, "epoch": 2220} {"train_loss": -6.225425720214844, "global_step": 93255, "epoch": 2220} {"train_loss": -6.388724327087402, "global_step": 93256, "epoch": 2220} {"train_loss": -6.229870796203613, "global_step": 93257, "epoch": 2220} {"train_loss": -6.366771697998047, "global_step": 93258, "epoch": 2220} {"train_loss": -6.326877593994141, "global_step": 93259, "epoch": 2220} {"train_loss": -6.300172805786133, "global_step": 93260, "epoch": 2220} {"train_loss": -6.3047637939453125, "global_step": 93261, "epoch": 2220} {"train_loss": -6.212129592895508, "global_step": 93262, "epoch": 2220} {"train_loss": -6.262138366699219, "global_step": 93263, "epoch": 2220} {"train_loss": -6.305247783660889, "global_step": 93264, "epoch": 2220} {"train_loss": -6.245232105255127, "global_step": 93265, "epoch": 2220} {"train_loss": -6.328716278076172, "global_step": 93266, "epoch": 2220} {"train_loss": -6.320435523986816, "global_step": 93267, "epoch": 2220} {"train_loss": -6.345025539398193, "global_step": 93268, "epoch": 2220} {"train_loss": -6.3018341064453125, "global_step": 93269, "epoch": 2220} {"train_loss": -6.346200942993164, "global_step": 93270, "epoch": 2220} {"train_loss": -6.351418972015381, "global_step": 93271, "epoch": 2220} {"train_loss": -6.2054290771484375, "global_step": 93272, "epoch": 2220} {"train_loss": -6.319299221038818, "global_step": 93273, "epoch": 2220} {"train_loss": -6.406859397888184, "global_step": 93274, "epoch": 2220} {"train_loss": -6.266306400299072, "global_step": 93275, "epoch": 2220} {"train_loss": -6.229748249053955, "global_step": 93276, "epoch": 2220} {"train_loss": -6.221562385559082, "global_step": 93277, "epoch": 2220} {"train_loss": -6.217339992523193, "global_step": 93278, "epoch": 2220} {"train_loss": -6.328139305114746, "global_step": 93279, "epoch": 2220} {"train_loss": -6.241215705871582, "global_step": 93280, "epoch": 2220} {"train_loss": -6.299742165065947, "global_step": 93281, "epoch": 2220, "val_loss": 63407.890625} {"train_loss": -6.327482223510742, "global_step": 93282, "epoch": 2221} {"train_loss": -6.257505416870117, "global_step": 93283, "epoch": 2221} {"train_loss": -6.330389976501465, "global_step": 93284, "epoch": 2221} {"train_loss": -6.2529096603393555, "global_step": 93285, "epoch": 2221} {"train_loss": -6.211256980895996, "global_step": 93286, "epoch": 2221} {"train_loss": -6.252205848693848, "global_step": 93287, "epoch": 2221} {"train_loss": -6.219894886016846, "global_step": 93288, "epoch": 2221} {"train_loss": -6.272098064422607, "global_step": 93289, "epoch": 2221} {"train_loss": -6.277860641479492, "global_step": 93290, "epoch": 2221} {"train_loss": -6.366766929626465, "global_step": 93291, "epoch": 2221} {"train_loss": -6.359050273895264, "global_step": 93292, "epoch": 2221} {"train_loss": -6.342751502990723, "global_step": 93293, "epoch": 2221} {"train_loss": -6.25014591217041, "global_step": 93294, "epoch": 2221} {"train_loss": -6.426701068878174, "global_step": 93295, "epoch": 2221} {"train_loss": -6.305932998657227, "global_step": 93296, "epoch": 2221} {"train_loss": -6.383121967315674, "global_step": 93297, "epoch": 2221} {"train_loss": -6.325132369995117, "global_step": 93298, "epoch": 2221} {"train_loss": -6.25350284576416, "global_step": 93299, "epoch": 2221} {"train_loss": -6.379337310791016, "global_step": 93300, "epoch": 2221} {"train_loss": -6.206058502197266, "global_step": 93301, "epoch": 2221} {"train_loss": -6.324437141418457, "global_step": 93302, "epoch": 2221} {"train_loss": -6.421536445617676, "global_step": 93303, "epoch": 2221} {"train_loss": -6.212583541870117, "global_step": 93304, "epoch": 2221} {"train_loss": -6.277688980102539, "global_step": 93305, "epoch": 2221} {"train_loss": -6.304829120635986, "global_step": 93306, "epoch": 2221} {"train_loss": -6.317842483520508, "global_step": 93307, "epoch": 2221} {"train_loss": -6.310173034667969, "global_step": 93308, "epoch": 2221} {"train_loss": -6.2024245262146, "global_step": 93309, "epoch": 2221} {"train_loss": -6.247781753540039, "global_step": 93310, "epoch": 2221} {"train_loss": -6.1691694259643555, "global_step": 93311, "epoch": 2221} {"train_loss": -6.1454572677612305, "global_step": 93312, "epoch": 2221} {"train_loss": -6.138514518737793, "global_step": 93313, "epoch": 2221} {"train_loss": -6.262544631958008, "global_step": 93314, "epoch": 2221} {"train_loss": -6.3185625076293945, "global_step": 93315, "epoch": 2221} {"train_loss": -6.2946367263793945, "global_step": 93316, "epoch": 2221} {"train_loss": -6.2089619636535645, "global_step": 93317, "epoch": 2221} {"train_loss": -6.239166736602783, "global_step": 93318, "epoch": 2221} {"train_loss": -6.255231857299805, "global_step": 93319, "epoch": 2221} {"train_loss": -6.269365310668945, "global_step": 93320, "epoch": 2221} {"train_loss": -6.27316951751709, "global_step": 93321, "epoch": 2221} {"train_loss": -6.310854911804199, "global_step": 93322, "epoch": 2221} {"train_loss": -6.280296325683594, "global_step": 93323, "epoch": 2221, "val_loss": 63227.765625} {"train_loss": -6.353458404541016, "global_step": 93324, "epoch": 2222} {"train_loss": -6.318342208862305, "global_step": 93325, "epoch": 2222} {"train_loss": -6.236238479614258, "global_step": 93326, "epoch": 2222} {"train_loss": -6.332823753356934, "global_step": 93327, "epoch": 2222} {"train_loss": -6.220883369445801, "global_step": 93328, "epoch": 2222} {"train_loss": -6.291925430297852, "global_step": 93329, "epoch": 2222} {"train_loss": -6.312237739562988, "global_step": 93330, "epoch": 2222} {"train_loss": -6.322464466094971, "global_step": 93331, "epoch": 2222} {"train_loss": -6.386542320251465, "global_step": 93332, "epoch": 2222} {"train_loss": -6.336259841918945, "global_step": 93333, "epoch": 2222} {"train_loss": -6.258003234863281, "global_step": 93334, "epoch": 2222} {"train_loss": -6.283204078674316, "global_step": 93335, "epoch": 2222} {"train_loss": -6.395678520202637, "global_step": 93336, "epoch": 2222} {"train_loss": -6.376506805419922, "global_step": 93337, "epoch": 2222} {"train_loss": -6.313257217407227, "global_step": 93338, "epoch": 2222} {"train_loss": -6.318978309631348, "global_step": 93339, "epoch": 2222} {"train_loss": -6.335679054260254, "global_step": 93340, "epoch": 2222} {"train_loss": -6.193392753601074, "global_step": 93341, "epoch": 2222} {"train_loss": -6.22149658203125, "global_step": 93342, "epoch": 2222} {"train_loss": -6.348395347595215, "global_step": 93343, "epoch": 2222} {"train_loss": -6.257755279541016, "global_step": 93344, "epoch": 2222} {"train_loss": -6.271396636962891, "global_step": 93345, "epoch": 2222} {"train_loss": -6.25251579284668, "global_step": 93346, "epoch": 2222} {"train_loss": -6.267284393310547, "global_step": 93347, "epoch": 2222} {"train_loss": -6.330026149749756, "global_step": 93348, "epoch": 2222} {"train_loss": -6.192936897277832, "global_step": 93349, "epoch": 2222} {"train_loss": -6.375884056091309, "global_step": 93350, "epoch": 2222} {"train_loss": -6.325255393981934, "global_step": 93351, "epoch": 2222} {"train_loss": -6.276826858520508, "global_step": 93352, "epoch": 2222} {"train_loss": -6.282609939575195, "global_step": 93353, "epoch": 2222} {"train_loss": -6.289149284362793, "global_step": 93354, "epoch": 2222} {"train_loss": -6.294015884399414, "global_step": 93355, "epoch": 2222} {"train_loss": -6.350894927978516, "global_step": 93356, "epoch": 2222} {"train_loss": -6.317025661468506, "global_step": 93357, "epoch": 2222} {"train_loss": -6.308736324310303, "global_step": 93358, "epoch": 2222} {"train_loss": -6.32713508605957, "global_step": 93359, "epoch": 2222} {"train_loss": -6.274758815765381, "global_step": 93360, "epoch": 2222} {"train_loss": -6.359167098999023, "global_step": 93361, "epoch": 2222} {"train_loss": -6.4099836349487305, "global_step": 93362, "epoch": 2222} {"train_loss": -6.292840003967285, "global_step": 93363, "epoch": 2222} {"train_loss": -6.411355018615723, "global_step": 93364, "epoch": 2222} {"train_loss": -6.3117955185118175, "global_step": 93365, "epoch": 2222, "val_loss": 63348.69921875} {"train_loss": -6.35438871383667, "global_step": 93366, "epoch": 2223} {"train_loss": -6.341179370880127, "global_step": 93367, "epoch": 2223} {"train_loss": -6.359851360321045, "global_step": 93368, "epoch": 2223} {"train_loss": -6.398420810699463, "global_step": 93369, "epoch": 2223} {"train_loss": -6.494964122772217, "global_step": 93370, "epoch": 2223} {"train_loss": -6.34853458404541, "global_step": 93371, "epoch": 2223} {"train_loss": -6.219244003295898, "global_step": 93372, "epoch": 2223} {"train_loss": -6.384922981262207, "global_step": 93373, "epoch": 2223} {"train_loss": -6.332313537597656, "global_step": 93374, "epoch": 2223} {"train_loss": -6.4051713943481445, "global_step": 93375, "epoch": 2223} {"train_loss": -6.244067668914795, "global_step": 93376, "epoch": 2223} {"train_loss": -6.237172603607178, "global_step": 93377, "epoch": 2223} {"train_loss": -6.239627838134766, "global_step": 93378, "epoch": 2223} {"train_loss": -6.260942459106445, "global_step": 93379, "epoch": 2223} {"train_loss": -6.205351829528809, "global_step": 93380, "epoch": 2223} {"train_loss": -6.405660152435303, "global_step": 93381, "epoch": 2223} {"train_loss": -6.352215766906738, "global_step": 93382, "epoch": 2223} {"train_loss": -6.2843403816223145, "global_step": 93383, "epoch": 2223} {"train_loss": -6.273737907409668, "global_step": 93384, "epoch": 2223} {"train_loss": -6.318073749542236, "global_step": 93385, "epoch": 2223} {"train_loss": -6.308897018432617, "global_step": 93386, "epoch": 2223} {"train_loss": -6.300858974456787, "global_step": 93387, "epoch": 2223} {"train_loss": -6.286558628082275, "global_step": 93388, "epoch": 2223} {"train_loss": -6.338901042938232, "global_step": 93389, "epoch": 2223} {"train_loss": -6.090306282043457, "global_step": 93390, "epoch": 2223} {"train_loss": -6.2843098640441895, "global_step": 93391, "epoch": 2223} {"train_loss": -6.372043132781982, "global_step": 93392, "epoch": 2223} {"train_loss": -6.279748916625977, "global_step": 93393, "epoch": 2223} {"train_loss": -6.316906929016113, "global_step": 93394, "epoch": 2223} {"train_loss": -6.306109428405762, "global_step": 93395, "epoch": 2223} {"train_loss": -6.330842971801758, "global_step": 93396, "epoch": 2223} {"train_loss": -6.159177780151367, "global_step": 93397, "epoch": 2223} {"train_loss": -6.258955478668213, "global_step": 93398, "epoch": 2223} {"train_loss": -6.254322528839111, "global_step": 93399, "epoch": 2223} {"train_loss": -6.287685394287109, "global_step": 93400, "epoch": 2223} {"train_loss": -6.264294147491455, "global_step": 93401, "epoch": 2223} {"train_loss": -6.343855381011963, "global_step": 93402, "epoch": 2223} {"train_loss": -6.388832092285156, "global_step": 93403, "epoch": 2223} {"train_loss": -6.253058433532715, "global_step": 93404, "epoch": 2223} {"train_loss": -6.2888946533203125, "global_step": 93405, "epoch": 2223} {"train_loss": -6.279083251953125, "global_step": 93406, "epoch": 2223} {"train_loss": -6.305233626138596, "global_step": 93407, "epoch": 2223, "val_loss": 63622.890625} {"train_loss": -6.273690700531006, "global_step": 93408, "epoch": 2224} {"train_loss": -6.402563095092773, "global_step": 93409, "epoch": 2224} {"train_loss": -6.35997200012207, "global_step": 93410, "epoch": 2224} {"train_loss": -6.334414482116699, "global_step": 93411, "epoch": 2224} {"train_loss": -6.382026195526123, "global_step": 93412, "epoch": 2224} {"train_loss": -6.266294956207275, "global_step": 93413, "epoch": 2224} {"train_loss": -6.297826766967773, "global_step": 93414, "epoch": 2224} {"train_loss": -6.283913612365723, "global_step": 93415, "epoch": 2224} {"train_loss": -6.318941116333008, "global_step": 93416, "epoch": 2224} {"train_loss": -6.321028232574463, "global_step": 93417, "epoch": 2224} {"train_loss": -6.2487053871154785, "global_step": 93418, "epoch": 2224} {"train_loss": -6.301136016845703, "global_step": 93419, "epoch": 2224} {"train_loss": -6.310842990875244, "global_step": 93420, "epoch": 2224} {"train_loss": -6.348647117614746, "global_step": 93421, "epoch": 2224} {"train_loss": -6.354474067687988, "global_step": 93422, "epoch": 2224} {"train_loss": -6.368865966796875, "global_step": 93423, "epoch": 2224} {"train_loss": -6.193571090698242, "global_step": 93424, "epoch": 2224} {"train_loss": -6.29941463470459, "global_step": 93425, "epoch": 2224} {"train_loss": -6.310009956359863, "global_step": 93426, "epoch": 2224} {"train_loss": -6.3218092918396, "global_step": 93427, "epoch": 2224} {"train_loss": -6.197345733642578, "global_step": 93428, "epoch": 2224} {"train_loss": -6.285744667053223, "global_step": 93429, "epoch": 2224} {"train_loss": -6.208714485168457, "global_step": 93430, "epoch": 2224} {"train_loss": -6.173703193664551, "global_step": 93431, "epoch": 2224} {"train_loss": -6.258004665374756, "global_step": 93432, "epoch": 2224} {"train_loss": -6.140487194061279, "global_step": 93433, "epoch": 2224} {"train_loss": -6.386618614196777, "global_step": 93434, "epoch": 2224} {"train_loss": -6.300439834594727, "global_step": 93435, "epoch": 2224} {"train_loss": -6.195948600769043, "global_step": 93436, "epoch": 2224} {"train_loss": -6.271237373352051, "global_step": 93437, "epoch": 2224} {"train_loss": -6.298742771148682, "global_step": 93438, "epoch": 2224} {"train_loss": -6.24735689163208, "global_step": 93439, "epoch": 2224} {"train_loss": -6.287806987762451, "global_step": 93440, "epoch": 2224} {"train_loss": -6.31315803527832, "global_step": 93441, "epoch": 2224} {"train_loss": -6.299894332885742, "global_step": 93442, "epoch": 2224} {"train_loss": -6.336493492126465, "global_step": 93443, "epoch": 2224} {"train_loss": -6.291919231414795, "global_step": 93444, "epoch": 2224} {"train_loss": -6.361486434936523, "global_step": 93445, "epoch": 2224} {"train_loss": -6.293489933013916, "global_step": 93446, "epoch": 2224} {"train_loss": -6.33119010925293, "global_step": 93447, "epoch": 2224} {"train_loss": -6.3296403884887695, "global_step": 93448, "epoch": 2224} {"train_loss": -6.293544735227313, "global_step": 93449, "epoch": 2224, "val_loss": 63612.65234375} {"train_loss": -6.291497707366943, "global_step": 93450, "epoch": 2225} {"train_loss": -6.361560821533203, "global_step": 93451, "epoch": 2225} {"train_loss": -6.341044902801514, "global_step": 93452, "epoch": 2225} {"train_loss": -6.387157440185547, "global_step": 93453, "epoch": 2225} {"train_loss": -6.307015419006348, "global_step": 93454, "epoch": 2225} {"train_loss": -6.341989994049072, "global_step": 93455, "epoch": 2225} {"train_loss": -6.327184677124023, "global_step": 93456, "epoch": 2225} {"train_loss": -6.397034645080566, "global_step": 93457, "epoch": 2225} {"train_loss": -6.354536056518555, "global_step": 93458, "epoch": 2225} {"train_loss": -6.291021347045898, "global_step": 93459, "epoch": 2225} {"train_loss": -6.2451677322387695, "global_step": 93460, "epoch": 2225} {"train_loss": -6.307884216308594, "global_step": 93461, "epoch": 2225} {"train_loss": -6.21943998336792, "global_step": 93462, "epoch": 2225} {"train_loss": -6.267124652862549, "global_step": 93463, "epoch": 2225} {"train_loss": -6.351875305175781, "global_step": 93464, "epoch": 2225} {"train_loss": -6.286923408508301, "global_step": 93465, "epoch": 2225} {"train_loss": -6.376923561096191, "global_step": 93466, "epoch": 2225} {"train_loss": -6.4460248947143555, "global_step": 93467, "epoch": 2225} {"train_loss": -6.345888614654541, "global_step": 93468, "epoch": 2225} {"train_loss": -6.418218612670898, "global_step": 93469, "epoch": 2225} {"train_loss": -6.301553726196289, "global_step": 93470, "epoch": 2225} {"train_loss": -6.247861862182617, "global_step": 93471, "epoch": 2225} {"train_loss": -6.306734561920166, "global_step": 93472, "epoch": 2225} {"train_loss": -6.282434463500977, "global_step": 93473, "epoch": 2225} {"train_loss": -6.215676784515381, "global_step": 93474, "epoch": 2225} {"train_loss": -6.300304412841797, "global_step": 93475, "epoch": 2225} {"train_loss": -6.265716552734375, "global_step": 93476, "epoch": 2225} {"train_loss": -6.256588935852051, "global_step": 93477, "epoch": 2225} {"train_loss": -6.276228427886963, "global_step": 93478, "epoch": 2225} {"train_loss": -6.384434700012207, "global_step": 93479, "epoch": 2225} {"train_loss": -6.229648590087891, "global_step": 93480, "epoch": 2225} {"train_loss": -6.2992753982543945, "global_step": 93481, "epoch": 2225} {"train_loss": -6.333307266235352, "global_step": 93482, "epoch": 2225} {"train_loss": -6.251792907714844, "global_step": 93483, "epoch": 2225} {"train_loss": -6.337315082550049, "global_step": 93484, "epoch": 2225} {"train_loss": -6.31107234954834, "global_step": 93485, "epoch": 2225} {"train_loss": -6.364858627319336, "global_step": 93486, "epoch": 2225} {"train_loss": -6.341065406799316, "global_step": 93487, "epoch": 2225} {"train_loss": -6.302020072937012, "global_step": 93488, "epoch": 2225} {"train_loss": -6.27644157409668, "global_step": 93489, "epoch": 2225} {"train_loss": -6.2848310470581055, "global_step": 93490, "epoch": 2225} {"train_loss": -6.313183443886893, "global_step": 93491, "epoch": 2225, "val_loss": 63483.12109375} {"train_loss": -6.400952339172363, "global_step": 93492, "epoch": 2226} {"train_loss": -6.339332580566406, "global_step": 93493, "epoch": 2226} {"train_loss": -6.111932754516602, "global_step": 93494, "epoch": 2226} {"train_loss": -6.34735107421875, "global_step": 93495, "epoch": 2226} {"train_loss": -6.114444732666016, "global_step": 93496, "epoch": 2226} {"train_loss": -6.279660224914551, "global_step": 93497, "epoch": 2226} {"train_loss": -6.3106794357299805, "global_step": 93498, "epoch": 2226} {"train_loss": -6.183026313781738, "global_step": 93499, "epoch": 2226} {"train_loss": -6.317030906677246, "global_step": 93500, "epoch": 2226} {"train_loss": -6.356096267700195, "global_step": 93501, "epoch": 2226} {"train_loss": -6.236992835998535, "global_step": 93502, "epoch": 2226} {"train_loss": -6.319727897644043, "global_step": 93503, "epoch": 2226} {"train_loss": -6.288586139678955, "global_step": 93504, "epoch": 2226} {"train_loss": -6.260127067565918, "global_step": 93505, "epoch": 2226} {"train_loss": -6.248925685882568, "global_step": 93506, "epoch": 2226} {"train_loss": -6.256086349487305, "global_step": 93507, "epoch": 2226} {"train_loss": -6.3313446044921875, "global_step": 93508, "epoch": 2226} {"train_loss": -6.247886657714844, "global_step": 93509, "epoch": 2226} {"train_loss": -6.249783039093018, "global_step": 93510, "epoch": 2226} {"train_loss": -6.319609642028809, "global_step": 93511, "epoch": 2226} {"train_loss": -6.145123481750488, "global_step": 93512, "epoch": 2226} {"train_loss": -6.288026809692383, "global_step": 93513, "epoch": 2226} {"train_loss": -6.279059410095215, "global_step": 93514, "epoch": 2226} {"train_loss": -6.261557579040527, "global_step": 93515, "epoch": 2226} {"train_loss": -6.286576747894287, "global_step": 93516, "epoch": 2226} {"train_loss": -6.153725624084473, "global_step": 93517, "epoch": 2226} {"train_loss": -6.336173057556152, "global_step": 93518, "epoch": 2226} {"train_loss": -6.305888652801514, "global_step": 93519, "epoch": 2226} {"train_loss": -6.17885160446167, "global_step": 93520, "epoch": 2226} {"train_loss": -6.216492652893066, "global_step": 93521, "epoch": 2226} {"train_loss": -6.186409950256348, "global_step": 93522, "epoch": 2226} {"train_loss": -6.148347854614258, "global_step": 93523, "epoch": 2226} {"train_loss": -6.132948875427246, "global_step": 93524, "epoch": 2226} {"train_loss": -6.254067420959473, "global_step": 93525, "epoch": 2226} {"train_loss": -6.339852809906006, "global_step": 93526, "epoch": 2226} {"train_loss": -6.139413833618164, "global_step": 93527, "epoch": 2226} {"train_loss": -6.265862464904785, "global_step": 93528, "epoch": 2226} {"train_loss": -6.234519004821777, "global_step": 93529, "epoch": 2226} {"train_loss": -6.208840847015381, "global_step": 93530, "epoch": 2226} {"train_loss": -6.178299427032471, "global_step": 93531, "epoch": 2226} {"train_loss": -6.255219459533691, "global_step": 93532, "epoch": 2226} {"train_loss": -6.252101171584356, "global_step": 93533, "epoch": 2226, "val_loss": 63719.44921875} {"train_loss": -6.1396164894104, "global_step": 93534, "epoch": 2227} {"train_loss": -6.260896682739258, "global_step": 93535, "epoch": 2227} {"train_loss": -6.201505661010742, "global_step": 93536, "epoch": 2227} {"train_loss": -6.110162734985352, "global_step": 93537, "epoch": 2227} {"train_loss": -6.151386260986328, "global_step": 93538, "epoch": 2227} {"train_loss": -6.366927146911621, "global_step": 93539, "epoch": 2227} {"train_loss": -6.3131208419799805, "global_step": 93540, "epoch": 2227} {"train_loss": -6.204970836639404, "global_step": 93541, "epoch": 2227} {"train_loss": -6.162367343902588, "global_step": 93542, "epoch": 2227} {"train_loss": -6.117157936096191, "global_step": 93543, "epoch": 2227} {"train_loss": -6.343114852905273, "global_step": 93544, "epoch": 2227} {"train_loss": -6.3053741455078125, "global_step": 93545, "epoch": 2227} {"train_loss": -6.213334560394287, "global_step": 93546, "epoch": 2227} {"train_loss": -6.218401908874512, "global_step": 93547, "epoch": 2227} {"train_loss": -6.206544876098633, "global_step": 93548, "epoch": 2227} {"train_loss": -6.171003341674805, "global_step": 93549, "epoch": 2227} {"train_loss": -6.257223129272461, "global_step": 93550, "epoch": 2227} {"train_loss": -6.162158966064453, "global_step": 93551, "epoch": 2227} {"train_loss": -6.139224052429199, "global_step": 93552, "epoch": 2227} {"train_loss": -6.392928123474121, "global_step": 93553, "epoch": 2227} {"train_loss": -6.237834930419922, "global_step": 93554, "epoch": 2227} {"train_loss": -6.386754035949707, "global_step": 93555, "epoch": 2227} {"train_loss": -6.2579145431518555, "global_step": 93556, "epoch": 2227} {"train_loss": -6.274443626403809, "global_step": 93557, "epoch": 2227} {"train_loss": -6.35171365737915, "global_step": 93558, "epoch": 2227} {"train_loss": -6.278202533721924, "global_step": 93559, "epoch": 2227} {"train_loss": -6.2855424880981445, "global_step": 93560, "epoch": 2227} {"train_loss": -6.237165927886963, "global_step": 93561, "epoch": 2227} {"train_loss": -6.060977935791016, "global_step": 93562, "epoch": 2227} {"train_loss": -6.266479969024658, "global_step": 93563, "epoch": 2227} {"train_loss": -6.259877681732178, "global_step": 93564, "epoch": 2227} {"train_loss": -6.321592807769775, "global_step": 93565, "epoch": 2227} {"train_loss": -6.133182048797607, "global_step": 93566, "epoch": 2227} {"train_loss": -6.273161888122559, "global_step": 93567, "epoch": 2227} {"train_loss": -6.141736030578613, "global_step": 93568, "epoch": 2227} {"train_loss": -6.283898830413818, "global_step": 93569, "epoch": 2227} {"train_loss": -6.229391098022461, "global_step": 93570, "epoch": 2227} {"train_loss": -6.2007269859313965, "global_step": 93571, "epoch": 2227} {"train_loss": -6.294797420501709, "global_step": 93572, "epoch": 2227} {"train_loss": -6.179594039916992, "global_step": 93573, "epoch": 2227} {"train_loss": -6.246858596801758, "global_step": 93574, "epoch": 2227} {"train_loss": -6.236760003226144, "global_step": 93575, "epoch": 2227, "val_loss": 63481.47265625} {"train_loss": -6.2283735275268555, "global_step": 93576, "epoch": 2228} {"train_loss": -6.238875389099121, "global_step": 93577, "epoch": 2228} {"train_loss": -6.296882629394531, "global_step": 93578, "epoch": 2228} {"train_loss": -6.23206901550293, "global_step": 93579, "epoch": 2228} {"train_loss": -6.279801368713379, "global_step": 93580, "epoch": 2228} {"train_loss": -6.359264373779297, "global_step": 93581, "epoch": 2228} {"train_loss": -6.287600517272949, "global_step": 93582, "epoch": 2228} {"train_loss": -6.256804943084717, "global_step": 93583, "epoch": 2228} {"train_loss": -6.2960004806518555, "global_step": 93584, "epoch": 2228} {"train_loss": -6.170773983001709, "global_step": 93585, "epoch": 2228} {"train_loss": -6.369673252105713, "global_step": 93586, "epoch": 2228} {"train_loss": -6.319094181060791, "global_step": 93587, "epoch": 2228} {"train_loss": -6.361477851867676, "global_step": 93588, "epoch": 2228} {"train_loss": -6.218274116516113, "global_step": 93589, "epoch": 2228} {"train_loss": -6.379866600036621, "global_step": 93590, "epoch": 2228} {"train_loss": -6.316088676452637, "global_step": 93591, "epoch": 2228} {"train_loss": -6.321902275085449, "global_step": 93592, "epoch": 2228} {"train_loss": -6.397777080535889, "global_step": 93593, "epoch": 2228} {"train_loss": -6.287201881408691, "global_step": 93594, "epoch": 2228} {"train_loss": -6.345409393310547, "global_step": 93595, "epoch": 2228} {"train_loss": -6.368473052978516, "global_step": 93596, "epoch": 2228} {"train_loss": -6.391631126403809, "global_step": 93597, "epoch": 2228} {"train_loss": -6.262970924377441, "global_step": 93598, "epoch": 2228} {"train_loss": -6.367244243621826, "global_step": 93599, "epoch": 2228} {"train_loss": -6.387754440307617, "global_step": 93600, "epoch": 2228} {"train_loss": -6.318083763122559, "global_step": 93601, "epoch": 2228} {"train_loss": -6.317516326904297, "global_step": 93602, "epoch": 2228} {"train_loss": -6.3291473388671875, "global_step": 93603, "epoch": 2228} {"train_loss": -6.309939384460449, "global_step": 93604, "epoch": 2228} {"train_loss": -6.323853969573975, "global_step": 93605, "epoch": 2228} {"train_loss": -6.373811721801758, "global_step": 93606, "epoch": 2228} {"train_loss": -6.352621078491211, "global_step": 93607, "epoch": 2228} {"train_loss": -6.233370780944824, "global_step": 93608, "epoch": 2228} {"train_loss": -6.371660232543945, "global_step": 93609, "epoch": 2228} {"train_loss": -6.291844844818115, "global_step": 93610, "epoch": 2228} {"train_loss": -6.279412269592285, "global_step": 93611, "epoch": 2228} {"train_loss": -6.364389419555664, "global_step": 93612, "epoch": 2228} {"train_loss": -6.242834091186523, "global_step": 93613, "epoch": 2228} {"train_loss": -6.265283107757568, "global_step": 93614, "epoch": 2228} {"train_loss": -6.408236503601074, "global_step": 93615, "epoch": 2228} {"train_loss": -6.231762886047363, "global_step": 93616, "epoch": 2228} {"train_loss": -6.312435661043439, "global_step": 93617, "epoch": 2228, "val_loss": 63646.4296875} {"train_loss": -6.4043989181518555, "global_step": 93618, "epoch": 2229} {"train_loss": -6.352500915527344, "global_step": 93619, "epoch": 2229} {"train_loss": -6.432461261749268, "global_step": 93620, "epoch": 2229} {"train_loss": -6.307145118713379, "global_step": 93621, "epoch": 2229} {"train_loss": -6.267937183380127, "global_step": 93622, "epoch": 2229} {"train_loss": -6.349609375, "global_step": 93623, "epoch": 2229} {"train_loss": -6.196242332458496, "global_step": 93624, "epoch": 2229} {"train_loss": -6.214322566986084, "global_step": 93625, "epoch": 2229} {"train_loss": -6.263962745666504, "global_step": 93626, "epoch": 2229} {"train_loss": -6.205852508544922, "global_step": 93627, "epoch": 2229} {"train_loss": -6.283991813659668, "global_step": 93628, "epoch": 2229} {"train_loss": -6.2067365646362305, "global_step": 93629, "epoch": 2229} {"train_loss": -6.251662254333496, "global_step": 93630, "epoch": 2229} {"train_loss": -6.288100719451904, "global_step": 93631, "epoch": 2229} {"train_loss": -6.133862495422363, "global_step": 93632, "epoch": 2229} {"train_loss": -6.348622798919678, "global_step": 93633, "epoch": 2229} {"train_loss": -6.27463960647583, "global_step": 93634, "epoch": 2229} {"train_loss": -6.4112348556518555, "global_step": 93635, "epoch": 2229} {"train_loss": -6.2232513427734375, "global_step": 93636, "epoch": 2229} {"train_loss": -6.335171699523926, "global_step": 93637, "epoch": 2229} {"train_loss": -6.352495193481445, "global_step": 93638, "epoch": 2229} {"train_loss": -6.2678680419921875, "global_step": 93639, "epoch": 2229} {"train_loss": -6.272639274597168, "global_step": 93640, "epoch": 2229} {"train_loss": -6.399481296539307, "global_step": 93641, "epoch": 2229} {"train_loss": -6.343008041381836, "global_step": 93642, "epoch": 2229} {"train_loss": -6.354605674743652, "global_step": 93643, "epoch": 2229} {"train_loss": -6.246137619018555, "global_step": 93644, "epoch": 2229} {"train_loss": -6.2812089920043945, "global_step": 93645, "epoch": 2229} {"train_loss": -6.345427513122559, "global_step": 93646, "epoch": 2229} {"train_loss": -6.4112396240234375, "global_step": 93647, "epoch": 2229} {"train_loss": -6.326703071594238, "global_step": 93648, "epoch": 2229} {"train_loss": -6.304374694824219, "global_step": 93649, "epoch": 2229} {"train_loss": -6.261313438415527, "global_step": 93650, "epoch": 2229} {"train_loss": -6.306223392486572, "global_step": 93651, "epoch": 2229} {"train_loss": -6.404370307922363, "global_step": 93652, "epoch": 2229} {"train_loss": -6.299976348876953, "global_step": 93653, "epoch": 2229} {"train_loss": -6.25626277923584, "global_step": 93654, "epoch": 2229} {"train_loss": -6.282440185546875, "global_step": 93655, "epoch": 2229} {"train_loss": -6.326645374298096, "global_step": 93656, "epoch": 2229} {"train_loss": -6.206443786621094, "global_step": 93657, "epoch": 2229} {"train_loss": -6.248406410217285, "global_step": 93658, "epoch": 2229} {"train_loss": -6.296780279704502, "global_step": 93659, "epoch": 2229, "val_loss": 63483.8046875} {"train_loss": -6.336848735809326, "global_step": 93660, "epoch": 2230} {"train_loss": -6.23837947845459, "global_step": 93661, "epoch": 2230} {"train_loss": -6.250221252441406, "global_step": 93662, "epoch": 2230} {"train_loss": -6.353852272033691, "global_step": 93663, "epoch": 2230} {"train_loss": -6.3311309814453125, "global_step": 93664, "epoch": 2230} {"train_loss": -6.287806510925293, "global_step": 93665, "epoch": 2230} {"train_loss": -6.156710147857666, "global_step": 93666, "epoch": 2230} {"train_loss": -6.25261926651001, "global_step": 93667, "epoch": 2230} {"train_loss": -6.348200798034668, "global_step": 93668, "epoch": 2230} {"train_loss": -6.431346893310547, "global_step": 93669, "epoch": 2230} {"train_loss": -6.330545425415039, "global_step": 93670, "epoch": 2230} {"train_loss": -6.25034236907959, "global_step": 93671, "epoch": 2230} {"train_loss": -6.366825103759766, "global_step": 93672, "epoch": 2230} {"train_loss": -6.232571601867676, "global_step": 93673, "epoch": 2230} {"train_loss": -6.20781135559082, "global_step": 93674, "epoch": 2230} {"train_loss": -6.331808090209961, "global_step": 93675, "epoch": 2230} {"train_loss": -6.291727066040039, "global_step": 93676, "epoch": 2230} {"train_loss": -6.347278594970703, "global_step": 93677, "epoch": 2230} {"train_loss": -6.258798599243164, "global_step": 93678, "epoch": 2230} {"train_loss": -6.337310314178467, "global_step": 93679, "epoch": 2230} {"train_loss": -6.268870830535889, "global_step": 93680, "epoch": 2230} {"train_loss": -6.347395896911621, "global_step": 93681, "epoch": 2230} {"train_loss": -6.379551410675049, "global_step": 93682, "epoch": 2230} {"train_loss": -6.390568733215332, "global_step": 93683, "epoch": 2230} {"train_loss": -6.293403625488281, "global_step": 93684, "epoch": 2230} {"train_loss": -6.304664611816406, "global_step": 93685, "epoch": 2230} {"train_loss": -6.359577178955078, "global_step": 93686, "epoch": 2230} {"train_loss": -6.334630489349365, "global_step": 93687, "epoch": 2230} {"train_loss": -6.401081562042236, "global_step": 93688, "epoch": 2230} {"train_loss": -6.303432941436768, "global_step": 93689, "epoch": 2230} {"train_loss": -6.307216644287109, "global_step": 93690, "epoch": 2230} {"train_loss": -6.270742893218994, "global_step": 93691, "epoch": 2230} {"train_loss": -6.3594160079956055, "global_step": 93692, "epoch": 2230} {"train_loss": -6.3524489402771, "global_step": 93693, "epoch": 2230} {"train_loss": -6.314793109893799, "global_step": 93694, "epoch": 2230} {"train_loss": -6.358765602111816, "global_step": 93695, "epoch": 2230} {"train_loss": -6.337341785430908, "global_step": 93696, "epoch": 2230} {"train_loss": -6.376262664794922, "global_step": 93697, "epoch": 2230} {"train_loss": -6.304940223693848, "global_step": 93698, "epoch": 2230} {"train_loss": -6.278071880340576, "global_step": 93699, "epoch": 2230} {"train_loss": -6.273313999176025, "global_step": 93700, "epoch": 2230} {"train_loss": -6.314187753768194, "global_step": 93701, "epoch": 2230, "val_loss": 63379.22265625} {"train_loss": -6.342370510101318, "global_step": 93702, "epoch": 2231} {"train_loss": -6.402141094207764, "global_step": 93703, "epoch": 2231} {"train_loss": -6.357010841369629, "global_step": 93704, "epoch": 2231} {"train_loss": -6.456549644470215, "global_step": 93705, "epoch": 2231} {"train_loss": -6.31362247467041, "global_step": 93706, "epoch": 2231} {"train_loss": -6.125721454620361, "global_step": 93707, "epoch": 2231} {"train_loss": -6.261642932891846, "global_step": 93708, "epoch": 2231} {"train_loss": -6.304213523864746, "global_step": 93709, "epoch": 2231} {"train_loss": -6.2292022705078125, "global_step": 93710, "epoch": 2231} {"train_loss": -6.338476657867432, "global_step": 93711, "epoch": 2231} {"train_loss": -6.267660140991211, "global_step": 93712, "epoch": 2231} {"train_loss": -6.240653991699219, "global_step": 93713, "epoch": 2231} {"train_loss": -6.298826217651367, "global_step": 93714, "epoch": 2231} {"train_loss": -6.234546661376953, "global_step": 93715, "epoch": 2231} {"train_loss": -6.218064785003662, "global_step": 93716, "epoch": 2231} {"train_loss": -6.1872477531433105, "global_step": 93717, "epoch": 2231} {"train_loss": -6.277135848999023, "global_step": 93718, "epoch": 2231} {"train_loss": -6.284307479858398, "global_step": 93719, "epoch": 2231} {"train_loss": -6.2388153076171875, "global_step": 93720, "epoch": 2231} {"train_loss": -6.331085205078125, "global_step": 93721, "epoch": 2231} {"train_loss": -6.172869682312012, "global_step": 93722, "epoch": 2231} {"train_loss": -6.275945663452148, "global_step": 93723, "epoch": 2231} {"train_loss": -6.215280532836914, "global_step": 93724, "epoch": 2231} {"train_loss": -6.241674423217773, "global_step": 93725, "epoch": 2231} {"train_loss": -6.228884696960449, "global_step": 93726, "epoch": 2231} {"train_loss": -6.263845920562744, "global_step": 93727, "epoch": 2231} {"train_loss": -6.2061920166015625, "global_step": 93728, "epoch": 2231} {"train_loss": -6.233576774597168, "global_step": 93729, "epoch": 2231} {"train_loss": -6.263579368591309, "global_step": 93730, "epoch": 2231} {"train_loss": -6.217006206512451, "global_step": 93731, "epoch": 2231} {"train_loss": -6.252685546875, "global_step": 93732, "epoch": 2231} {"train_loss": -6.190274238586426, "global_step": 93733, "epoch": 2231} {"train_loss": -6.198721885681152, "global_step": 93734, "epoch": 2231} {"train_loss": -6.268150806427002, "global_step": 93735, "epoch": 2231} {"train_loss": -6.281543731689453, "global_step": 93736, "epoch": 2231} {"train_loss": -6.262233734130859, "global_step": 93737, "epoch": 2231} {"train_loss": -6.269937992095947, "global_step": 93738, "epoch": 2231} {"train_loss": -6.229927062988281, "global_step": 93739, "epoch": 2231} {"train_loss": -6.307975769042969, "global_step": 93740, "epoch": 2231} {"train_loss": -6.12591552734375, "global_step": 93741, "epoch": 2231} {"train_loss": -6.360826015472412, "global_step": 93742, "epoch": 2231} {"train_loss": -6.26352554275876, "global_step": 93743, "epoch": 2231, "val_loss": 63673.66796875} {"train_loss": -6.271042823791504, "global_step": 93744, "epoch": 2232} {"train_loss": -6.31646728515625, "global_step": 93745, "epoch": 2232} {"train_loss": -6.267566204071045, "global_step": 93746, "epoch": 2232} {"train_loss": -6.2441582679748535, "global_step": 93747, "epoch": 2232} {"train_loss": -6.261320114135742, "global_step": 93748, "epoch": 2232} {"train_loss": -6.284877777099609, "global_step": 93749, "epoch": 2232} {"train_loss": -6.277921676635742, "global_step": 93750, "epoch": 2232} {"train_loss": -6.281329154968262, "global_step": 93751, "epoch": 2232} {"train_loss": -6.337643623352051, "global_step": 93752, "epoch": 2232} {"train_loss": -6.295690536499023, "global_step": 93753, "epoch": 2232} {"train_loss": -6.3645172119140625, "global_step": 93754, "epoch": 2232} {"train_loss": -6.275412559509277, "global_step": 93755, "epoch": 2232} {"train_loss": -6.388726711273193, "global_step": 93756, "epoch": 2232} {"train_loss": -6.30472469329834, "global_step": 93757, "epoch": 2232} {"train_loss": -6.310910224914551, "global_step": 93758, "epoch": 2232} {"train_loss": -6.277203559875488, "global_step": 93759, "epoch": 2232} {"train_loss": -6.315224647521973, "global_step": 93760, "epoch": 2232} {"train_loss": -6.355109691619873, "global_step": 93761, "epoch": 2232} {"train_loss": -6.401902198791504, "global_step": 93762, "epoch": 2232} {"train_loss": -6.408053398132324, "global_step": 93763, "epoch": 2232} {"train_loss": -6.254273414611816, "global_step": 93764, "epoch": 2232} {"train_loss": -6.250901222229004, "global_step": 93765, "epoch": 2232} {"train_loss": -6.076230525970459, "global_step": 93766, "epoch": 2232} {"train_loss": -6.223418235778809, "global_step": 93767, "epoch": 2232} {"train_loss": -6.373068809509277, "global_step": 93768, "epoch": 2232} {"train_loss": -6.349405288696289, "global_step": 93769, "epoch": 2232} {"train_loss": -6.17082405090332, "global_step": 93770, "epoch": 2232} {"train_loss": -6.354439735412598, "global_step": 93771, "epoch": 2232} {"train_loss": -6.295830726623535, "global_step": 93772, "epoch": 2232} {"train_loss": -6.247175216674805, "global_step": 93773, "epoch": 2232} {"train_loss": -6.203935623168945, "global_step": 93774, "epoch": 2232} {"train_loss": -6.228263854980469, "global_step": 93775, "epoch": 2232} {"train_loss": -6.248706817626953, "global_step": 93776, "epoch": 2232} {"train_loss": -6.288082122802734, "global_step": 93777, "epoch": 2232} {"train_loss": -6.398088455200195, "global_step": 93778, "epoch": 2232} {"train_loss": -6.344235420227051, "global_step": 93779, "epoch": 2232} {"train_loss": -6.257508277893066, "global_step": 93780, "epoch": 2232} {"train_loss": -6.315217971801758, "global_step": 93781, "epoch": 2232} {"train_loss": -6.303483486175537, "global_step": 93782, "epoch": 2232} {"train_loss": -6.4233927726745605, "global_step": 93783, "epoch": 2232} {"train_loss": -6.236736297607422, "global_step": 93784, "epoch": 2232} {"train_loss": -6.293798367182414, "global_step": 93785, "epoch": 2232, "val_loss": 63412.0390625} {"train_loss": -6.2526445388793945, "global_step": 93786, "epoch": 2233} {"train_loss": -6.298386573791504, "global_step": 93787, "epoch": 2233} {"train_loss": -6.2345194816589355, "global_step": 93788, "epoch": 2233} {"train_loss": -6.219298362731934, "global_step": 93789, "epoch": 2233} {"train_loss": -6.355259895324707, "global_step": 93790, "epoch": 2233} {"train_loss": -6.3322296142578125, "global_step": 93791, "epoch": 2233} {"train_loss": -6.240067481994629, "global_step": 93792, "epoch": 2233} {"train_loss": -6.254927635192871, "global_step": 93793, "epoch": 2233} {"train_loss": -6.352214813232422, "global_step": 93794, "epoch": 2233} {"train_loss": -6.397858619689941, "global_step": 93795, "epoch": 2233} {"train_loss": -6.1967082023620605, "global_step": 93796, "epoch": 2233} {"train_loss": -6.338113784790039, "global_step": 93797, "epoch": 2233} {"train_loss": -6.228219032287598, "global_step": 93798, "epoch": 2233} {"train_loss": -6.359233379364014, "global_step": 93799, "epoch": 2233} {"train_loss": -6.327603340148926, "global_step": 93800, "epoch": 2233} {"train_loss": -6.164575099945068, "global_step": 93801, "epoch": 2233} {"train_loss": -6.240527153015137, "global_step": 93802, "epoch": 2233} {"train_loss": -6.347472667694092, "global_step": 93803, "epoch": 2233} {"train_loss": -6.254857063293457, "global_step": 93804, "epoch": 2233} {"train_loss": -6.345315933227539, "global_step": 93805, "epoch": 2233} {"train_loss": -6.360589027404785, "global_step": 93806, "epoch": 2233} {"train_loss": -6.41418981552124, "global_step": 93807, "epoch": 2233} {"train_loss": -6.25750732421875, "global_step": 93808, "epoch": 2233} {"train_loss": -6.344359397888184, "global_step": 93809, "epoch": 2233} {"train_loss": -6.340190887451172, "global_step": 93810, "epoch": 2233} {"train_loss": -6.312821388244629, "global_step": 93811, "epoch": 2233} {"train_loss": -6.250554084777832, "global_step": 93812, "epoch": 2233} {"train_loss": -6.3673553466796875, "global_step": 93813, "epoch": 2233} {"train_loss": -6.308012962341309, "global_step": 93814, "epoch": 2233} {"train_loss": -6.246167182922363, "global_step": 93815, "epoch": 2233} {"train_loss": -6.381386756896973, "global_step": 93816, "epoch": 2233} {"train_loss": -6.216574668884277, "global_step": 93817, "epoch": 2233} {"train_loss": -6.363107681274414, "global_step": 93818, "epoch": 2233} {"train_loss": -6.221889972686768, "global_step": 93819, "epoch": 2233} {"train_loss": -6.25441837310791, "global_step": 93820, "epoch": 2233} {"train_loss": -6.30757999420166, "global_step": 93821, "epoch": 2233} {"train_loss": -6.272017002105713, "global_step": 93822, "epoch": 2233} {"train_loss": -6.354004859924316, "global_step": 93823, "epoch": 2233} {"train_loss": -6.197635650634766, "global_step": 93824, "epoch": 2233} {"train_loss": -6.316976547241211, "global_step": 93825, "epoch": 2233} {"train_loss": -6.390966892242432, "global_step": 93826, "epoch": 2233} {"train_loss": -6.299111650103614, "global_step": 93827, "epoch": 2233, "val_loss": 63486.7890625} {"train_loss": -6.40485954284668, "global_step": 93828, "epoch": 2234} {"train_loss": -6.386480331420898, "global_step": 93829, "epoch": 2234} {"train_loss": -6.332331657409668, "global_step": 93830, "epoch": 2234} {"train_loss": -6.36869478225708, "global_step": 93831, "epoch": 2234} {"train_loss": -6.14808464050293, "global_step": 93832, "epoch": 2234} {"train_loss": -6.336688041687012, "global_step": 93833, "epoch": 2234} {"train_loss": -6.2572174072265625, "global_step": 93834, "epoch": 2234} {"train_loss": -6.294414520263672, "global_step": 93835, "epoch": 2234} {"train_loss": -6.226936340332031, "global_step": 93836, "epoch": 2234} {"train_loss": -6.242486953735352, "global_step": 93837, "epoch": 2234} {"train_loss": -6.31892204284668, "global_step": 93838, "epoch": 2234} {"train_loss": -6.212155342102051, "global_step": 93839, "epoch": 2234} {"train_loss": -6.323554515838623, "global_step": 93840, "epoch": 2234} {"train_loss": -6.317663669586182, "global_step": 93841, "epoch": 2234} {"train_loss": -6.395396709442139, "global_step": 93842, "epoch": 2234} {"train_loss": -6.384450912475586, "global_step": 93843, "epoch": 2234} {"train_loss": -6.392942428588867, "global_step": 93844, "epoch": 2234} {"train_loss": -6.391773223876953, "global_step": 93845, "epoch": 2234} {"train_loss": -6.211615562438965, "global_step": 93846, "epoch": 2234} {"train_loss": -6.375056266784668, "global_step": 93847, "epoch": 2234} {"train_loss": -6.360475063323975, "global_step": 93848, "epoch": 2234} {"train_loss": -6.2652740478515625, "global_step": 93849, "epoch": 2234} {"train_loss": -6.355892181396484, "global_step": 93850, "epoch": 2234} {"train_loss": -6.375523567199707, "global_step": 93851, "epoch": 2234} {"train_loss": -6.276311874389648, "global_step": 93852, "epoch": 2234} {"train_loss": -6.2620768547058105, "global_step": 93853, "epoch": 2234} {"train_loss": -6.429306983947754, "global_step": 93854, "epoch": 2234} {"train_loss": -6.31257438659668, "global_step": 93855, "epoch": 2234} {"train_loss": -6.306413173675537, "global_step": 93856, "epoch": 2234} {"train_loss": -6.302764892578125, "global_step": 93857, "epoch": 2234} {"train_loss": -6.279808044433594, "global_step": 93858, "epoch": 2234} {"train_loss": -6.305591583251953, "global_step": 93859, "epoch": 2234} {"train_loss": -6.2986369132995605, "global_step": 93860, "epoch": 2234} {"train_loss": -6.403002738952637, "global_step": 93861, "epoch": 2234} {"train_loss": -6.2875189781188965, "global_step": 93862, "epoch": 2234} {"train_loss": -6.309795379638672, "global_step": 93863, "epoch": 2234} {"train_loss": -6.275547027587891, "global_step": 93864, "epoch": 2234} {"train_loss": -6.333857536315918, "global_step": 93865, "epoch": 2234} {"train_loss": -6.260716438293457, "global_step": 93866, "epoch": 2234} {"train_loss": -6.273674011230469, "global_step": 93867, "epoch": 2234} {"train_loss": -6.3349714279174805, "global_step": 93868, "epoch": 2234} {"train_loss": -6.316223655428205, "global_step": 93869, "epoch": 2234, "val_loss": 63563.2734375} {"train_loss": -6.244617938995361, "global_step": 93870, "epoch": 2235} {"train_loss": -6.379961013793945, "global_step": 93871, "epoch": 2235} {"train_loss": -6.237775802612305, "global_step": 93872, "epoch": 2235} {"train_loss": -6.317115783691406, "global_step": 93873, "epoch": 2235} {"train_loss": -6.375458717346191, "global_step": 93874, "epoch": 2235} {"train_loss": -6.344040393829346, "global_step": 93875, "epoch": 2235} {"train_loss": -6.3157734870910645, "global_step": 93876, "epoch": 2235} {"train_loss": -6.277467250823975, "global_step": 93877, "epoch": 2235} {"train_loss": -6.353461265563965, "global_step": 93878, "epoch": 2235} {"train_loss": -6.212933540344238, "global_step": 93879, "epoch": 2235} {"train_loss": -6.3267998695373535, "global_step": 93880, "epoch": 2235} {"train_loss": -6.291512489318848, "global_step": 93881, "epoch": 2235} {"train_loss": -6.280835151672363, "global_step": 93882, "epoch": 2235} {"train_loss": -6.2614850997924805, "global_step": 93883, "epoch": 2235} {"train_loss": -6.284151077270508, "global_step": 93884, "epoch": 2235} {"train_loss": -6.319982528686523, "global_step": 93885, "epoch": 2235} {"train_loss": -6.376055717468262, "global_step": 93886, "epoch": 2235} {"train_loss": -6.37968635559082, "global_step": 93887, "epoch": 2235} {"train_loss": -6.229966640472412, "global_step": 93888, "epoch": 2235} {"train_loss": -6.317558288574219, "global_step": 93889, "epoch": 2235} {"train_loss": -6.269416332244873, "global_step": 93890, "epoch": 2235} {"train_loss": -6.264639377593994, "global_step": 93891, "epoch": 2235} {"train_loss": -6.2645368576049805, "global_step": 93892, "epoch": 2235} {"train_loss": -6.226696968078613, "global_step": 93893, "epoch": 2235} {"train_loss": -6.252437591552734, "global_step": 93894, "epoch": 2235} {"train_loss": -6.292034149169922, "global_step": 93895, "epoch": 2235} {"train_loss": -6.195409774780273, "global_step": 93896, "epoch": 2235} {"train_loss": -6.225343227386475, "global_step": 93897, "epoch": 2235} {"train_loss": -6.312989234924316, "global_step": 93898, "epoch": 2235} {"train_loss": -6.215386390686035, "global_step": 93899, "epoch": 2235} {"train_loss": -6.309671401977539, "global_step": 93900, "epoch": 2235} {"train_loss": -6.19528865814209, "global_step": 93901, "epoch": 2235} {"train_loss": -6.2338762283325195, "global_step": 93902, "epoch": 2235} {"train_loss": -6.118919372558594, "global_step": 93903, "epoch": 2235} {"train_loss": -6.278669357299805, "global_step": 93904, "epoch": 2235} {"train_loss": -6.338284969329834, "global_step": 93905, "epoch": 2235} {"train_loss": -6.333042621612549, "global_step": 93906, "epoch": 2235} {"train_loss": -6.230100631713867, "global_step": 93907, "epoch": 2235} {"train_loss": -6.230937957763672, "global_step": 93908, "epoch": 2235} {"train_loss": -6.288187026977539, "global_step": 93909, "epoch": 2235} {"train_loss": -6.26216983795166, "global_step": 93910, "epoch": 2235} {"train_loss": -6.28252074832008, "global_step": 93911, "epoch": 2235, "val_loss": 63453.953125} {"train_loss": -6.251397609710693, "global_step": 93912, "epoch": 2236} {"train_loss": -6.393523216247559, "global_step": 93913, "epoch": 2236} {"train_loss": -6.205595016479492, "global_step": 93914, "epoch": 2236} {"train_loss": -6.297569274902344, "global_step": 93915, "epoch": 2236} {"train_loss": -6.176565170288086, "global_step": 93916, "epoch": 2236} {"train_loss": -6.243279933929443, "global_step": 93917, "epoch": 2236} {"train_loss": -6.3755621910095215, "global_step": 93918, "epoch": 2236} {"train_loss": -6.196376323699951, "global_step": 93919, "epoch": 2236} {"train_loss": -6.220648288726807, "global_step": 93920, "epoch": 2236} {"train_loss": -6.329405784606934, "global_step": 93921, "epoch": 2236} {"train_loss": -6.309598445892334, "global_step": 93922, "epoch": 2236} {"train_loss": -6.35299015045166, "global_step": 93923, "epoch": 2236} {"train_loss": -6.347984313964844, "global_step": 93924, "epoch": 2236} {"train_loss": -6.324624061584473, "global_step": 93925, "epoch": 2236} {"train_loss": -6.212802410125732, "global_step": 93926, "epoch": 2236} {"train_loss": -6.344529628753662, "global_step": 93927, "epoch": 2236} {"train_loss": -6.372089385986328, "global_step": 93928, "epoch": 2236} {"train_loss": -6.336066246032715, "global_step": 93929, "epoch": 2236} {"train_loss": -6.383934020996094, "global_step": 93930, "epoch": 2236} {"train_loss": -6.256824016571045, "global_step": 93931, "epoch": 2236} {"train_loss": -6.333804130554199, "global_step": 93932, "epoch": 2236} {"train_loss": -6.243261337280273, "global_step": 93933, "epoch": 2236} {"train_loss": -6.2403035163879395, "global_step": 93934, "epoch": 2236} {"train_loss": -6.29997444152832, "global_step": 93935, "epoch": 2236} {"train_loss": -6.268887996673584, "global_step": 93936, "epoch": 2236} {"train_loss": -6.314525604248047, "global_step": 93937, "epoch": 2236} {"train_loss": -6.392600059509277, "global_step": 93938, "epoch": 2236} {"train_loss": -6.286306381225586, "global_step": 93939, "epoch": 2236} {"train_loss": -6.29659366607666, "global_step": 93940, "epoch": 2236} {"train_loss": -6.374227046966553, "global_step": 93941, "epoch": 2236} {"train_loss": -6.272696018218994, "global_step": 93942, "epoch": 2236} {"train_loss": -6.147611141204834, "global_step": 93943, "epoch": 2236} {"train_loss": -6.356323719024658, "global_step": 93944, "epoch": 2236} {"train_loss": -6.406332015991211, "global_step": 93945, "epoch": 2236} {"train_loss": -6.253350257873535, "global_step": 93946, "epoch": 2236} {"train_loss": -6.348616600036621, "global_step": 93947, "epoch": 2236} {"train_loss": -6.286469459533691, "global_step": 93948, "epoch": 2236} {"train_loss": -6.324733734130859, "global_step": 93949, "epoch": 2236} {"train_loss": -6.137811660766602, "global_step": 93950, "epoch": 2236} {"train_loss": -6.245124816894531, "global_step": 93951, "epoch": 2236} {"train_loss": -6.258646488189697, "global_step": 93952, "epoch": 2236} {"train_loss": -6.295904216312227, "global_step": 93953, "epoch": 2236, "val_loss": 63838.37890625} {"train_loss": -6.046326637268066, "global_step": 93954, "epoch": 2237} {"train_loss": -6.284024238586426, "global_step": 93955, "epoch": 2237} {"train_loss": -6.200593948364258, "global_step": 93956, "epoch": 2237} {"train_loss": -6.069438934326172, "global_step": 93957, "epoch": 2237} {"train_loss": -6.24070405960083, "global_step": 93958, "epoch": 2237} {"train_loss": -6.126120090484619, "global_step": 93959, "epoch": 2237} {"train_loss": -6.24498176574707, "global_step": 93960, "epoch": 2237} {"train_loss": -6.182499885559082, "global_step": 93961, "epoch": 2237} {"train_loss": -6.196216583251953, "global_step": 93962, "epoch": 2237} {"train_loss": -6.1455302238464355, "global_step": 93963, "epoch": 2237} {"train_loss": -6.231651306152344, "global_step": 93964, "epoch": 2237} {"train_loss": -6.3147478103637695, "global_step": 93965, "epoch": 2237} {"train_loss": -6.226390838623047, "global_step": 93966, "epoch": 2237} {"train_loss": -6.291341781616211, "global_step": 93967, "epoch": 2237} {"train_loss": -6.24862003326416, "global_step": 93968, "epoch": 2237} {"train_loss": -6.384974002838135, "global_step": 93969, "epoch": 2237} {"train_loss": -6.362366676330566, "global_step": 93970, "epoch": 2237} {"train_loss": -6.338788986206055, "global_step": 93971, "epoch": 2237} {"train_loss": -6.307553291320801, "global_step": 93972, "epoch": 2237} {"train_loss": -6.270057678222656, "global_step": 93973, "epoch": 2237} {"train_loss": -6.319394111633301, "global_step": 93974, "epoch": 2237} {"train_loss": -6.287042140960693, "global_step": 93975, "epoch": 2237} {"train_loss": -6.258636474609375, "global_step": 93976, "epoch": 2237} {"train_loss": -6.357921123504639, "global_step": 93977, "epoch": 2237} {"train_loss": -6.398465633392334, "global_step": 93978, "epoch": 2237} {"train_loss": -6.364358901977539, "global_step": 93979, "epoch": 2237} {"train_loss": -6.304929733276367, "global_step": 93980, "epoch": 2237} {"train_loss": -6.253483772277832, "global_step": 93981, "epoch": 2237} {"train_loss": -6.227994918823242, "global_step": 93982, "epoch": 2237} {"train_loss": -6.269066333770752, "global_step": 93983, "epoch": 2237} {"train_loss": -6.338276386260986, "global_step": 93984, "epoch": 2237} {"train_loss": -6.315328598022461, "global_step": 93985, "epoch": 2237} {"train_loss": -6.346145153045654, "global_step": 93986, "epoch": 2237} {"train_loss": -6.272342681884766, "global_step": 93987, "epoch": 2237} {"train_loss": -6.253101348876953, "global_step": 93988, "epoch": 2237} {"train_loss": -6.393697738647461, "global_step": 93989, "epoch": 2237} {"train_loss": -6.357879638671875, "global_step": 93990, "epoch": 2237} {"train_loss": -6.317024230957031, "global_step": 93991, "epoch": 2237} {"train_loss": -6.468200206756592, "global_step": 93992, "epoch": 2237} {"train_loss": -6.393941879272461, "global_step": 93993, "epoch": 2237} {"train_loss": -6.263553142547607, "global_step": 93994, "epoch": 2237} {"train_loss": -6.280705917449224, "global_step": 93995, "epoch": 2237, "val_loss": 63816.2421875} {"train_loss": -6.195092678070068, "global_step": 93996, "epoch": 2238} {"train_loss": -6.310946464538574, "global_step": 93997, "epoch": 2238} {"train_loss": -6.288381576538086, "global_step": 93998, "epoch": 2238} {"train_loss": -6.186394214630127, "global_step": 93999, "epoch": 2238} {"train_loss": -6.336769104003906, "global_step": 94000, "epoch": 2238} {"train_loss": -6.177523612976074, "global_step": 94001, "epoch": 2238} {"train_loss": -6.138791084289551, "global_step": 94002, "epoch": 2238} {"train_loss": -6.277912139892578, "global_step": 94003, "epoch": 2238} {"train_loss": -6.304359436035156, "global_step": 94004, "epoch": 2238} {"train_loss": -6.1922221183776855, "global_step": 94005, "epoch": 2238} {"train_loss": -6.234245300292969, "global_step": 94006, "epoch": 2238} {"train_loss": -6.359134674072266, "global_step": 94007, "epoch": 2238} {"train_loss": -6.291220664978027, "global_step": 94008, "epoch": 2238} {"train_loss": -6.3086090087890625, "global_step": 94009, "epoch": 2238} {"train_loss": -6.315202713012695, "global_step": 94010, "epoch": 2238} {"train_loss": -6.236233711242676, "global_step": 94011, "epoch": 2238} {"train_loss": -6.173851490020752, "global_step": 94012, "epoch": 2238} {"train_loss": -6.263911724090576, "global_step": 94013, "epoch": 2238} {"train_loss": -6.191079616546631, "global_step": 94014, "epoch": 2238} {"train_loss": -6.2368550300598145, "global_step": 94015, "epoch": 2238} {"train_loss": -6.17963981628418, "global_step": 94016, "epoch": 2238} {"train_loss": -6.349118232727051, "global_step": 94017, "epoch": 2238} {"train_loss": -6.25584602355957, "global_step": 94018, "epoch": 2238} {"train_loss": -6.325453758239746, "global_step": 94019, "epoch": 2238} {"train_loss": -6.232151031494141, "global_step": 94020, "epoch": 2238} {"train_loss": -6.208148956298828, "global_step": 94021, "epoch": 2238} {"train_loss": -6.239809036254883, "global_step": 94022, "epoch": 2238} {"train_loss": -6.2225494384765625, "global_step": 94023, "epoch": 2238} {"train_loss": -6.288003921508789, "global_step": 94024, "epoch": 2238} {"train_loss": -6.293422698974609, "global_step": 94025, "epoch": 2238} {"train_loss": -6.256740570068359, "global_step": 94026, "epoch": 2238} {"train_loss": -6.321191787719727, "global_step": 94027, "epoch": 2238} {"train_loss": -6.2204132080078125, "global_step": 94028, "epoch": 2238} {"train_loss": -6.393024921417236, "global_step": 94029, "epoch": 2238} {"train_loss": -6.236291408538818, "global_step": 94030, "epoch": 2238} {"train_loss": -6.246111869812012, "global_step": 94031, "epoch": 2238} {"train_loss": -6.29185676574707, "global_step": 94032, "epoch": 2238} {"train_loss": -6.376610279083252, "global_step": 94033, "epoch": 2238} {"train_loss": -6.357844352722168, "global_step": 94034, "epoch": 2238} {"train_loss": -6.264389514923096, "global_step": 94035, "epoch": 2238} {"train_loss": -6.324825286865234, "global_step": 94036, "epoch": 2238} {"train_loss": -6.270237161999657, "global_step": 94037, "epoch": 2238, "val_loss": 63528.5078125} {"train_loss": -6.379040718078613, "global_step": 94038, "epoch": 2239} {"train_loss": -6.265351295471191, "global_step": 94039, "epoch": 2239} {"train_loss": -6.246587753295898, "global_step": 94040, "epoch": 2239} {"train_loss": -6.354443550109863, "global_step": 94041, "epoch": 2239} {"train_loss": -6.467579364776611, "global_step": 94042, "epoch": 2239} {"train_loss": -6.365267276763916, "global_step": 94043, "epoch": 2239} {"train_loss": -6.299917221069336, "global_step": 94044, "epoch": 2239} {"train_loss": -6.438076019287109, "global_step": 94045, "epoch": 2239} {"train_loss": -6.440589904785156, "global_step": 94046, "epoch": 2239} {"train_loss": -6.349617958068848, "global_step": 94047, "epoch": 2239} {"train_loss": -6.298772811889648, "global_step": 94048, "epoch": 2239} {"train_loss": -6.277529716491699, "global_step": 94049, "epoch": 2239} {"train_loss": -6.335282325744629, "global_step": 94050, "epoch": 2239} {"train_loss": -6.342506408691406, "global_step": 94051, "epoch": 2239} {"train_loss": -6.217220306396484, "global_step": 94052, "epoch": 2239} {"train_loss": -6.325263023376465, "global_step": 94053, "epoch": 2239} {"train_loss": -6.314896583557129, "global_step": 94054, "epoch": 2239} {"train_loss": -6.272452354431152, "global_step": 94055, "epoch": 2239} {"train_loss": -6.257912635803223, "global_step": 94056, "epoch": 2239} {"train_loss": -6.335351943969727, "global_step": 94057, "epoch": 2239} {"train_loss": -6.360490322113037, "global_step": 94058, "epoch": 2239} {"train_loss": -6.2632527351379395, "global_step": 94059, "epoch": 2239} {"train_loss": -6.295446872711182, "global_step": 94060, "epoch": 2239} {"train_loss": -6.286444664001465, "global_step": 94061, "epoch": 2239} {"train_loss": -6.292572975158691, "global_step": 94062, "epoch": 2239} {"train_loss": -6.2396674156188965, "global_step": 94063, "epoch": 2239} {"train_loss": -6.309050559997559, "global_step": 94064, "epoch": 2239} {"train_loss": -6.38464879989624, "global_step": 94065, "epoch": 2239} {"train_loss": -6.119753837585449, "global_step": 94066, "epoch": 2239} {"train_loss": -6.4318389892578125, "global_step": 94067, "epoch": 2239} {"train_loss": -6.129639625549316, "global_step": 94068, "epoch": 2239} {"train_loss": -6.279853820800781, "global_step": 94069, "epoch": 2239} {"train_loss": -6.285343170166016, "global_step": 94070, "epoch": 2239} {"train_loss": -6.232146263122559, "global_step": 94071, "epoch": 2239} {"train_loss": -6.21757698059082, "global_step": 94072, "epoch": 2239} {"train_loss": -6.3311543464660645, "global_step": 94073, "epoch": 2239} {"train_loss": -6.183199882507324, "global_step": 94074, "epoch": 2239} {"train_loss": -6.323819637298584, "global_step": 94075, "epoch": 2239} {"train_loss": -6.333823204040527, "global_step": 94076, "epoch": 2239} {"train_loss": -6.299524784088135, "global_step": 94077, "epoch": 2239} {"train_loss": -6.26830530166626, "global_step": 94078, "epoch": 2239} {"train_loss": -6.302864233652751, "global_step": 94079, "epoch": 2239, "val_loss": 63580.09765625} {"train_loss": -6.160545349121094, "global_step": 94080, "epoch": 2240} {"train_loss": -6.222172737121582, "global_step": 94081, "epoch": 2240} {"train_loss": -6.358577728271484, "global_step": 94082, "epoch": 2240} {"train_loss": -6.245602607727051, "global_step": 94083, "epoch": 2240} {"train_loss": -6.415615081787109, "global_step": 94084, "epoch": 2240} {"train_loss": -6.223507881164551, "global_step": 94085, "epoch": 2240} {"train_loss": -6.292075157165527, "global_step": 94086, "epoch": 2240} {"train_loss": -6.41903018951416, "global_step": 94087, "epoch": 2240} {"train_loss": -6.286465644836426, "global_step": 94088, "epoch": 2240} {"train_loss": -6.402703762054443, "global_step": 94089, "epoch": 2240} {"train_loss": -6.2505645751953125, "global_step": 94090, "epoch": 2240} {"train_loss": -6.393036842346191, "global_step": 94091, "epoch": 2240} {"train_loss": -6.41751766204834, "global_step": 94092, "epoch": 2240} {"train_loss": -6.215089797973633, "global_step": 94093, "epoch": 2240} {"train_loss": -6.339866638183594, "global_step": 94094, "epoch": 2240} {"train_loss": -6.225615501403809, "global_step": 94095, "epoch": 2240} {"train_loss": -6.211239814758301, "global_step": 94096, "epoch": 2240} {"train_loss": -6.244865417480469, "global_step": 94097, "epoch": 2240} {"train_loss": -6.263975143432617, "global_step": 94098, "epoch": 2240} {"train_loss": -6.2439494132995605, "global_step": 94099, "epoch": 2240} {"train_loss": -6.188216209411621, "global_step": 94100, "epoch": 2240} {"train_loss": -6.306641101837158, "global_step": 94101, "epoch": 2240} {"train_loss": -6.340658187866211, "global_step": 94102, "epoch": 2240} {"train_loss": -6.198864936828613, "global_step": 94103, "epoch": 2240} {"train_loss": -6.258986473083496, "global_step": 94104, "epoch": 2240} {"train_loss": -6.393283843994141, "global_step": 94105, "epoch": 2240} {"train_loss": -6.328946113586426, "global_step": 94106, "epoch": 2240} {"train_loss": -6.37936544418335, "global_step": 94107, "epoch": 2240} {"train_loss": -6.363537311553955, "global_step": 94108, "epoch": 2240} {"train_loss": -6.253308296203613, "global_step": 94109, "epoch": 2240} {"train_loss": -6.307921409606934, "global_step": 94110, "epoch": 2240} {"train_loss": -6.2658586502075195, "global_step": 94111, "epoch": 2240} {"train_loss": -6.398375511169434, "global_step": 94112, "epoch": 2240} {"train_loss": -6.392551898956299, "global_step": 94113, "epoch": 2240} {"train_loss": -6.3238348960876465, "global_step": 94114, "epoch": 2240} {"train_loss": -6.3998517990112305, "global_step": 94115, "epoch": 2240} {"train_loss": -6.18886661529541, "global_step": 94116, "epoch": 2240} {"train_loss": -6.317697048187256, "global_step": 94117, "epoch": 2240} {"train_loss": -6.34962272644043, "global_step": 94118, "epoch": 2240} {"train_loss": -6.3504743576049805, "global_step": 94119, "epoch": 2240} {"train_loss": -6.32145357131958, "global_step": 94120, "epoch": 2240} {"train_loss": -6.304962771279471, "global_step": 94121, "epoch": 2240, "val_loss": 63522.0859375} {"train_loss": -6.238089561462402, "global_step": 94122, "epoch": 2241} {"train_loss": -6.303601264953613, "global_step": 94123, "epoch": 2241} {"train_loss": -6.335464954376221, "global_step": 94124, "epoch": 2241} {"train_loss": -6.367631435394287, "global_step": 94125, "epoch": 2241} {"train_loss": -6.39787483215332, "global_step": 94126, "epoch": 2241} {"train_loss": -6.331711769104004, "global_step": 94127, "epoch": 2241} {"train_loss": -6.249743461608887, "global_step": 94128, "epoch": 2241} {"train_loss": -6.263548851013184, "global_step": 94129, "epoch": 2241} {"train_loss": -6.39338493347168, "global_step": 94130, "epoch": 2241} {"train_loss": -6.32163143157959, "global_step": 94131, "epoch": 2241} {"train_loss": -6.352227210998535, "global_step": 94132, "epoch": 2241} {"train_loss": -6.189935207366943, "global_step": 94133, "epoch": 2241} {"train_loss": -6.288747787475586, "global_step": 94134, "epoch": 2241} {"train_loss": -6.28076696395874, "global_step": 94135, "epoch": 2241} {"train_loss": -6.147036075592041, "global_step": 94136, "epoch": 2241} {"train_loss": -6.3517656326293945, "global_step": 94137, "epoch": 2241} {"train_loss": -6.093260288238525, "global_step": 94138, "epoch": 2241} {"train_loss": -6.195346832275391, "global_step": 94139, "epoch": 2241} {"train_loss": -6.245237827301025, "global_step": 94140, "epoch": 2241} {"train_loss": -6.093569755554199, "global_step": 94141, "epoch": 2241} {"train_loss": -6.307775497436523, "global_step": 94142, "epoch": 2241} {"train_loss": -6.001225471496582, "global_step": 94143, "epoch": 2241} {"train_loss": -6.075928688049316, "global_step": 94144, "epoch": 2241} {"train_loss": -6.100886344909668, "global_step": 94145, "epoch": 2241} {"train_loss": -6.072617530822754, "global_step": 94146, "epoch": 2241} {"train_loss": -6.268784046173096, "global_step": 94147, "epoch": 2241} {"train_loss": -6.018150329589844, "global_step": 94148, "epoch": 2241} {"train_loss": -6.307809829711914, "global_step": 94149, "epoch": 2241} {"train_loss": -5.979928970336914, "global_step": 94150, "epoch": 2241} {"train_loss": -6.153045654296875, "global_step": 94151, "epoch": 2241} {"train_loss": -5.999871253967285, "global_step": 94152, "epoch": 2241} {"train_loss": -6.262540817260742, "global_step": 94153, "epoch": 2241} {"train_loss": -6.087061882019043, "global_step": 94154, "epoch": 2241} {"train_loss": -6.211944103240967, "global_step": 94155, "epoch": 2241} {"train_loss": -6.044215202331543, "global_step": 94156, "epoch": 2241} {"train_loss": -6.215807914733887, "global_step": 94157, "epoch": 2241} {"train_loss": -6.240602493286133, "global_step": 94158, "epoch": 2241} {"train_loss": -6.245450019836426, "global_step": 94159, "epoch": 2241} {"train_loss": -6.14317512512207, "global_step": 94160, "epoch": 2241} {"train_loss": -6.098261833190918, "global_step": 94161, "epoch": 2241} {"train_loss": -6.186358451843262, "global_step": 94162, "epoch": 2241} {"train_loss": -6.2014619168781095, "global_step": 94163, "epoch": 2241, "val_loss": 64010.55078125} {"train_loss": -6.163516044616699, "global_step": 94164, "epoch": 2242} {"train_loss": -6.1949663162231445, "global_step": 94165, "epoch": 2242} {"train_loss": -6.243330955505371, "global_step": 94166, "epoch": 2242} {"train_loss": -6.20670223236084, "global_step": 94167, "epoch": 2242} {"train_loss": -6.201929569244385, "global_step": 94168, "epoch": 2242} {"train_loss": -6.23138952255249, "global_step": 94169, "epoch": 2242} {"train_loss": -6.199272155761719, "global_step": 94170, "epoch": 2242} {"train_loss": -6.346330642700195, "global_step": 94171, "epoch": 2242} {"train_loss": -6.297969341278076, "global_step": 94172, "epoch": 2242} {"train_loss": -6.289175987243652, "global_step": 94173, "epoch": 2242} {"train_loss": -6.427680492401123, "global_step": 94174, "epoch": 2242} {"train_loss": -6.2522993087768555, "global_step": 94175, "epoch": 2242} {"train_loss": -6.202160835266113, "global_step": 94176, "epoch": 2242} {"train_loss": -6.286742210388184, "global_step": 94177, "epoch": 2242} {"train_loss": -6.198807239532471, "global_step": 94178, "epoch": 2242} {"train_loss": -6.2297868728637695, "global_step": 94179, "epoch": 2242} {"train_loss": -6.356150150299072, "global_step": 94180, "epoch": 2242} {"train_loss": -6.260570049285889, "global_step": 94181, "epoch": 2242} {"train_loss": -6.308951377868652, "global_step": 94182, "epoch": 2242} {"train_loss": -6.2557244300842285, "global_step": 94183, "epoch": 2242} {"train_loss": -6.3336992263793945, "global_step": 94184, "epoch": 2242} {"train_loss": -6.257959842681885, "global_step": 94185, "epoch": 2242} {"train_loss": -6.245627403259277, "global_step": 94186, "epoch": 2242} {"train_loss": -6.269779205322266, "global_step": 94187, "epoch": 2242} {"train_loss": -6.243461608886719, "global_step": 94188, "epoch": 2242} {"train_loss": -6.453380107879639, "global_step": 94189, "epoch": 2242} {"train_loss": -6.295462131500244, "global_step": 94190, "epoch": 2242} {"train_loss": -6.38527250289917, "global_step": 94191, "epoch": 2242} {"train_loss": -6.398904800415039, "global_step": 94192, "epoch": 2242} {"train_loss": -6.303753852844238, "global_step": 94193, "epoch": 2242} {"train_loss": -6.363221168518066, "global_step": 94194, "epoch": 2242} {"train_loss": -6.299540996551514, "global_step": 94195, "epoch": 2242} {"train_loss": -6.363372325897217, "global_step": 94196, "epoch": 2242} {"train_loss": -6.367315292358398, "global_step": 94197, "epoch": 2242} {"train_loss": -6.39363956451416, "global_step": 94198, "epoch": 2242} {"train_loss": -6.313058853149414, "global_step": 94199, "epoch": 2242} {"train_loss": -6.3465352058410645, "global_step": 94200, "epoch": 2242} {"train_loss": -6.389662742614746, "global_step": 94201, "epoch": 2242} {"train_loss": -6.208712577819824, "global_step": 94202, "epoch": 2242} {"train_loss": -6.2705841064453125, "global_step": 94203, "epoch": 2242} {"train_loss": -6.340155601501465, "global_step": 94204, "epoch": 2242} {"train_loss": -6.291993504478818, "global_step": 94205, "epoch": 2242, "val_loss": 63594.16015625} {"train_loss": -6.284246444702148, "global_step": 94206, "epoch": 2243} {"train_loss": -6.273188591003418, "global_step": 94207, "epoch": 2243} {"train_loss": -6.230302333831787, "global_step": 94208, "epoch": 2243} {"train_loss": -6.25968074798584, "global_step": 94209, "epoch": 2243} {"train_loss": -6.35146427154541, "global_step": 94210, "epoch": 2243} {"train_loss": -6.370821952819824, "global_step": 94211, "epoch": 2243} {"train_loss": -6.333051681518555, "global_step": 94212, "epoch": 2243} {"train_loss": -6.433239936828613, "global_step": 94213, "epoch": 2243} {"train_loss": -6.459026336669922, "global_step": 94214, "epoch": 2243} {"train_loss": -6.393255233764648, "global_step": 94215, "epoch": 2243} {"train_loss": -6.394377708435059, "global_step": 94216, "epoch": 2243} {"train_loss": -6.424825668334961, "global_step": 94217, "epoch": 2243} {"train_loss": -6.306048393249512, "global_step": 94218, "epoch": 2243} {"train_loss": -6.423872947692871, "global_step": 94219, "epoch": 2243} {"train_loss": -6.347314834594727, "global_step": 94220, "epoch": 2243} {"train_loss": -6.303398132324219, "global_step": 94221, "epoch": 2243} {"train_loss": -6.394308090209961, "global_step": 94222, "epoch": 2243} {"train_loss": -6.373029708862305, "global_step": 94223, "epoch": 2243} {"train_loss": -6.411988258361816, "global_step": 94224, "epoch": 2243} {"train_loss": -6.328792572021484, "global_step": 94225, "epoch": 2243} {"train_loss": -6.39093017578125, "global_step": 94226, "epoch": 2243} {"train_loss": -6.301121711730957, "global_step": 94227, "epoch": 2243} {"train_loss": -6.311568260192871, "global_step": 94228, "epoch": 2243} {"train_loss": -6.358445167541504, "global_step": 94229, "epoch": 2243} {"train_loss": -6.291975021362305, "global_step": 94230, "epoch": 2243} {"train_loss": -6.286581993103027, "global_step": 94231, "epoch": 2243} {"train_loss": -6.344480514526367, "global_step": 94232, "epoch": 2243} {"train_loss": -6.321262836456299, "global_step": 94233, "epoch": 2243} {"train_loss": -6.344356536865234, "global_step": 94234, "epoch": 2243} {"train_loss": -6.36749267578125, "global_step": 94235, "epoch": 2243} {"train_loss": -6.408857345581055, "global_step": 94236, "epoch": 2243} {"train_loss": -6.381547927856445, "global_step": 94237, "epoch": 2243} {"train_loss": -6.381856441497803, "global_step": 94238, "epoch": 2243} {"train_loss": -6.413052558898926, "global_step": 94239, "epoch": 2243} {"train_loss": -6.349129676818848, "global_step": 94240, "epoch": 2243} {"train_loss": -6.409862518310547, "global_step": 94241, "epoch": 2243} {"train_loss": -6.292304039001465, "global_step": 94242, "epoch": 2243} {"train_loss": -6.337470054626465, "global_step": 94243, "epoch": 2243} {"train_loss": -6.254662036895752, "global_step": 94244, "epoch": 2243} {"train_loss": -6.415236473083496, "global_step": 94245, "epoch": 2243} {"train_loss": -6.357842445373535, "global_step": 94246, "epoch": 2243} {"train_loss": -6.3542934485844205, "global_step": 94247, "epoch": 2243, "val_loss": 63433.45703125} {"train_loss": -6.480882167816162, "global_step": 94248, "epoch": 2244} {"train_loss": -6.38945198059082, "global_step": 94249, "epoch": 2244} {"train_loss": -6.391538619995117, "global_step": 94250, "epoch": 2244} {"train_loss": -6.291387557983398, "global_step": 94251, "epoch": 2244} {"train_loss": -6.139649391174316, "global_step": 94252, "epoch": 2244} {"train_loss": -6.292400360107422, "global_step": 94253, "epoch": 2244} {"train_loss": -6.308457851409912, "global_step": 94254, "epoch": 2244} {"train_loss": -6.278023719787598, "global_step": 94255, "epoch": 2244} {"train_loss": -6.3681416511535645, "global_step": 94256, "epoch": 2244} {"train_loss": -6.198664665222168, "global_step": 94257, "epoch": 2244} {"train_loss": -6.265949726104736, "global_step": 94258, "epoch": 2244} {"train_loss": -6.2838239669799805, "global_step": 94259, "epoch": 2244} {"train_loss": -6.250959873199463, "global_step": 94260, "epoch": 2244} {"train_loss": -6.2436418533325195, "global_step": 94261, "epoch": 2244} {"train_loss": -6.150599479675293, "global_step": 94262, "epoch": 2244} {"train_loss": -6.157116889953613, "global_step": 94263, "epoch": 2244} {"train_loss": -6.265223503112793, "global_step": 94264, "epoch": 2244} {"train_loss": -6.170770168304443, "global_step": 94265, "epoch": 2244} {"train_loss": -6.152667045593262, "global_step": 94266, "epoch": 2244} {"train_loss": -6.273725509643555, "global_step": 94267, "epoch": 2244} {"train_loss": -6.223443031311035, "global_step": 94268, "epoch": 2244} {"train_loss": -6.338436603546143, "global_step": 94269, "epoch": 2244} {"train_loss": -6.26052188873291, "global_step": 94270, "epoch": 2244} {"train_loss": -6.245628356933594, "global_step": 94271, "epoch": 2244} {"train_loss": -6.2772626876831055, "global_step": 94272, "epoch": 2244} {"train_loss": -6.28352165222168, "global_step": 94273, "epoch": 2244} {"train_loss": -6.193922996520996, "global_step": 94274, "epoch": 2244} {"train_loss": -6.293972969055176, "global_step": 94275, "epoch": 2244} {"train_loss": -6.119050979614258, "global_step": 94276, "epoch": 2244} {"train_loss": -6.28884220123291, "global_step": 94277, "epoch": 2244} {"train_loss": -6.243429660797119, "global_step": 94278, "epoch": 2244} {"train_loss": -6.126676559448242, "global_step": 94279, "epoch": 2244} {"train_loss": -6.294283390045166, "global_step": 94280, "epoch": 2244} {"train_loss": -6.182676315307617, "global_step": 94281, "epoch": 2244} {"train_loss": -6.406211853027344, "global_step": 94282, "epoch": 2244} {"train_loss": -6.392892837524414, "global_step": 94283, "epoch": 2244} {"train_loss": -6.347148895263672, "global_step": 94284, "epoch": 2244} {"train_loss": -6.237347602844238, "global_step": 94285, "epoch": 2244} {"train_loss": -6.334589004516602, "global_step": 94286, "epoch": 2244} {"train_loss": -6.223788738250732, "global_step": 94287, "epoch": 2244} {"train_loss": -6.295811653137207, "global_step": 94288, "epoch": 2244} {"train_loss": -6.26592907451448, "global_step": 94289, "epoch": 2244, "val_loss": 63730.484375} {"train_loss": -6.300001621246338, "global_step": 94290, "epoch": 2245} {"train_loss": -6.351532459259033, "global_step": 94291, "epoch": 2245} {"train_loss": -6.296697616577148, "global_step": 94292, "epoch": 2245} {"train_loss": -6.328897476196289, "global_step": 94293, "epoch": 2245} {"train_loss": -6.3202104568481445, "global_step": 94294, "epoch": 2245} {"train_loss": -6.255202770233154, "global_step": 94295, "epoch": 2245} {"train_loss": -6.206211090087891, "global_step": 94296, "epoch": 2245} {"train_loss": -6.267847061157227, "global_step": 94297, "epoch": 2245} {"train_loss": -6.212253570556641, "global_step": 94298, "epoch": 2245} {"train_loss": -6.423807144165039, "global_step": 94299, "epoch": 2245} {"train_loss": -6.248286247253418, "global_step": 94300, "epoch": 2245} {"train_loss": -6.376692771911621, "global_step": 94301, "epoch": 2245} {"train_loss": -6.298367977142334, "global_step": 94302, "epoch": 2245} {"train_loss": -6.230019569396973, "global_step": 94303, "epoch": 2245} {"train_loss": -6.336246967315674, "global_step": 94304, "epoch": 2245} {"train_loss": -6.179112434387207, "global_step": 94305, "epoch": 2245} {"train_loss": -6.345110893249512, "global_step": 94306, "epoch": 2245} {"train_loss": -6.23640251159668, "global_step": 94307, "epoch": 2245} {"train_loss": -6.171963691711426, "global_step": 94308, "epoch": 2245} {"train_loss": -6.244807720184326, "global_step": 94309, "epoch": 2245} {"train_loss": -6.138949871063232, "global_step": 94310, "epoch": 2245} {"train_loss": -6.221673488616943, "global_step": 94311, "epoch": 2245} {"train_loss": -6.359219551086426, "global_step": 94312, "epoch": 2245} {"train_loss": -6.254029273986816, "global_step": 94313, "epoch": 2245} {"train_loss": -6.353074073791504, "global_step": 94314, "epoch": 2245} {"train_loss": -6.27182674407959, "global_step": 94315, "epoch": 2245} {"train_loss": -6.2908196449279785, "global_step": 94316, "epoch": 2245} {"train_loss": -6.27879524230957, "global_step": 94317, "epoch": 2245} {"train_loss": -6.264923572540283, "global_step": 94318, "epoch": 2245} {"train_loss": -6.261037349700928, "global_step": 94319, "epoch": 2245} {"train_loss": -6.299717426300049, "global_step": 94320, "epoch": 2245} {"train_loss": -6.318830490112305, "global_step": 94321, "epoch": 2245} {"train_loss": -6.18848991394043, "global_step": 94322, "epoch": 2245} {"train_loss": -6.3064751625061035, "global_step": 94323, "epoch": 2245} {"train_loss": -6.302799224853516, "global_step": 94324, "epoch": 2245} {"train_loss": -6.302389621734619, "global_step": 94325, "epoch": 2245} {"train_loss": -6.3307785987854, "global_step": 94326, "epoch": 2245} {"train_loss": -6.413237571716309, "global_step": 94327, "epoch": 2245} {"train_loss": -6.216701030731201, "global_step": 94328, "epoch": 2245} {"train_loss": -6.413488864898682, "global_step": 94329, "epoch": 2245} {"train_loss": -6.346728324890137, "global_step": 94330, "epoch": 2245} {"train_loss": -6.2885707560039705, "global_step": 94331, "epoch": 2245, "val_loss": 63651.12890625} {"train_loss": -6.323247909545898, "global_step": 94332, "epoch": 2246} {"train_loss": -6.279506683349609, "global_step": 94333, "epoch": 2246} {"train_loss": -6.392533779144287, "global_step": 94334, "epoch": 2246} {"train_loss": -6.311725616455078, "global_step": 94335, "epoch": 2246} {"train_loss": -6.270198822021484, "global_step": 94336, "epoch": 2246} {"train_loss": -6.390545845031738, "global_step": 94337, "epoch": 2246} {"train_loss": -6.312319278717041, "global_step": 94338, "epoch": 2246} {"train_loss": -6.225318431854248, "global_step": 94339, "epoch": 2246} {"train_loss": -6.3537092208862305, "global_step": 94340, "epoch": 2246} {"train_loss": -6.33730411529541, "global_step": 94341, "epoch": 2246} {"train_loss": -6.265460014343262, "global_step": 94342, "epoch": 2246} {"train_loss": -6.268256664276123, "global_step": 94343, "epoch": 2246} {"train_loss": -6.25202751159668, "global_step": 94344, "epoch": 2246} {"train_loss": -6.333887100219727, "global_step": 94345, "epoch": 2246} {"train_loss": -6.320337295532227, "global_step": 94346, "epoch": 2246} {"train_loss": -6.322813987731934, "global_step": 94347, "epoch": 2246} {"train_loss": -6.296478271484375, "global_step": 94348, "epoch": 2246} {"train_loss": -6.232817649841309, "global_step": 94349, "epoch": 2246} {"train_loss": -6.213339805603027, "global_step": 94350, "epoch": 2246} {"train_loss": -6.276068687438965, "global_step": 94351, "epoch": 2246} {"train_loss": -6.272536277770996, "global_step": 94352, "epoch": 2246} {"train_loss": -6.236086845397949, "global_step": 94353, "epoch": 2246} {"train_loss": -6.385668754577637, "global_step": 94354, "epoch": 2246} {"train_loss": -6.191001892089844, "global_step": 94355, "epoch": 2246} {"train_loss": -6.261598587036133, "global_step": 94356, "epoch": 2246} {"train_loss": -6.2622575759887695, "global_step": 94357, "epoch": 2246} {"train_loss": -6.2910637855529785, "global_step": 94358, "epoch": 2246} {"train_loss": -6.3740129470825195, "global_step": 94359, "epoch": 2246} {"train_loss": -6.287442207336426, "global_step": 94360, "epoch": 2246} {"train_loss": -6.211608409881592, "global_step": 94361, "epoch": 2246} {"train_loss": -6.303854465484619, "global_step": 94362, "epoch": 2246} {"train_loss": -6.426907539367676, "global_step": 94363, "epoch": 2246} {"train_loss": -6.394200325012207, "global_step": 94364, "epoch": 2246} {"train_loss": -6.3079514503479, "global_step": 94365, "epoch": 2246} {"train_loss": -6.327005386352539, "global_step": 94366, "epoch": 2246} {"train_loss": -6.338701248168945, "global_step": 94367, "epoch": 2246} {"train_loss": -6.254265785217285, "global_step": 94368, "epoch": 2246} {"train_loss": -6.322449684143066, "global_step": 94369, "epoch": 2246} {"train_loss": -6.272007465362549, "global_step": 94370, "epoch": 2246} {"train_loss": -6.189513206481934, "global_step": 94371, "epoch": 2246} {"train_loss": -6.299109935760498, "global_step": 94372, "epoch": 2246} {"train_loss": -6.300953955877395, "global_step": 94373, "epoch": 2246, "val_loss": 63373.23046875} {"train_loss": -6.293513774871826, "global_step": 94374, "epoch": 2247} {"train_loss": -6.348999500274658, "global_step": 94375, "epoch": 2247} {"train_loss": -6.37303352355957, "global_step": 94376, "epoch": 2247} {"train_loss": -6.356663703918457, "global_step": 94377, "epoch": 2247} {"train_loss": -6.391445159912109, "global_step": 94378, "epoch": 2247} {"train_loss": -6.390541076660156, "global_step": 94379, "epoch": 2247} {"train_loss": -6.324355602264404, "global_step": 94380, "epoch": 2247} {"train_loss": -6.420356273651123, "global_step": 94381, "epoch": 2247} {"train_loss": -6.398252487182617, "global_step": 94382, "epoch": 2247} {"train_loss": -6.3889360427856445, "global_step": 94383, "epoch": 2247} {"train_loss": -6.305764675140381, "global_step": 94384, "epoch": 2247} {"train_loss": -6.331024169921875, "global_step": 94385, "epoch": 2247} {"train_loss": -6.302739143371582, "global_step": 94386, "epoch": 2247} {"train_loss": -6.354839324951172, "global_step": 94387, "epoch": 2247} {"train_loss": -6.289060115814209, "global_step": 94388, "epoch": 2247} {"train_loss": -6.348855018615723, "global_step": 94389, "epoch": 2247} {"train_loss": -6.278998851776123, "global_step": 94390, "epoch": 2247} {"train_loss": -6.3087921142578125, "global_step": 94391, "epoch": 2247} {"train_loss": -6.366832733154297, "global_step": 94392, "epoch": 2247} {"train_loss": -6.3420000076293945, "global_step": 94393, "epoch": 2247} {"train_loss": -6.282238006591797, "global_step": 94394, "epoch": 2247} {"train_loss": -6.235232830047607, "global_step": 94395, "epoch": 2247} {"train_loss": -6.268135070800781, "global_step": 94396, "epoch": 2247} {"train_loss": -6.195222854614258, "global_step": 94397, "epoch": 2247} {"train_loss": -6.349810600280762, "global_step": 94398, "epoch": 2247} {"train_loss": -6.291139602661133, "global_step": 94399, "epoch": 2247} {"train_loss": -6.385071754455566, "global_step": 94400, "epoch": 2247} {"train_loss": -6.317482948303223, "global_step": 94401, "epoch": 2247} {"train_loss": -6.308206558227539, "global_step": 94402, "epoch": 2247} {"train_loss": -6.350088119506836, "global_step": 94403, "epoch": 2247} {"train_loss": -6.274690628051758, "global_step": 94404, "epoch": 2247} {"train_loss": -6.344230651855469, "global_step": 94405, "epoch": 2247} {"train_loss": -6.24320125579834, "global_step": 94406, "epoch": 2247} {"train_loss": -6.290365695953369, "global_step": 94407, "epoch": 2247} {"train_loss": -6.272095680236816, "global_step": 94408, "epoch": 2247} {"train_loss": -6.226590156555176, "global_step": 94409, "epoch": 2247} {"train_loss": -6.353402614593506, "global_step": 94410, "epoch": 2247} {"train_loss": -6.236696243286133, "global_step": 94411, "epoch": 2247} {"train_loss": -6.2994279861450195, "global_step": 94412, "epoch": 2247} {"train_loss": -6.227130889892578, "global_step": 94413, "epoch": 2247} {"train_loss": -6.354123115539551, "global_step": 94414, "epoch": 2247} {"train_loss": -6.316785142535255, "global_step": 94415, "epoch": 2247, "val_loss": 63441.73046875} {"train_loss": -6.310241222381592, "global_step": 94416, "epoch": 2248} {"train_loss": -6.347653388977051, "global_step": 94417, "epoch": 2248} {"train_loss": -6.357852458953857, "global_step": 94418, "epoch": 2248} {"train_loss": -6.402229309082031, "global_step": 94419, "epoch": 2248} {"train_loss": -6.101166725158691, "global_step": 94420, "epoch": 2248} {"train_loss": -6.317259311676025, "global_step": 94421, "epoch": 2248} {"train_loss": -6.352376937866211, "global_step": 94422, "epoch": 2248} {"train_loss": -6.285202980041504, "global_step": 94423, "epoch": 2248} {"train_loss": -6.378030776977539, "global_step": 94424, "epoch": 2248} {"train_loss": -6.28509521484375, "global_step": 94425, "epoch": 2248} {"train_loss": -6.370582580566406, "global_step": 94426, "epoch": 2248} {"train_loss": -6.321239948272705, "global_step": 94427, "epoch": 2248} {"train_loss": -6.403714179992676, "global_step": 94428, "epoch": 2248} {"train_loss": -6.321538925170898, "global_step": 94429, "epoch": 2248} {"train_loss": -6.429658889770508, "global_step": 94430, "epoch": 2248} {"train_loss": -6.376199722290039, "global_step": 94431, "epoch": 2248} {"train_loss": -6.32225227355957, "global_step": 94432, "epoch": 2248} {"train_loss": -6.359601020812988, "global_step": 94433, "epoch": 2248} {"train_loss": -6.408256530761719, "global_step": 94434, "epoch": 2248} {"train_loss": -6.305699348449707, "global_step": 94435, "epoch": 2248} {"train_loss": -6.317520618438721, "global_step": 94436, "epoch": 2248} {"train_loss": -6.177323818206787, "global_step": 94437, "epoch": 2248} {"train_loss": -6.24135684967041, "global_step": 94438, "epoch": 2248} {"train_loss": -6.273379325866699, "global_step": 94439, "epoch": 2248} {"train_loss": -6.33143949508667, "global_step": 94440, "epoch": 2248} {"train_loss": -6.393759727478027, "global_step": 94441, "epoch": 2248} {"train_loss": -6.241039276123047, "global_step": 94442, "epoch": 2248} {"train_loss": -6.383231163024902, "global_step": 94443, "epoch": 2248} {"train_loss": -6.215530872344971, "global_step": 94444, "epoch": 2248} {"train_loss": -6.274979591369629, "global_step": 94445, "epoch": 2248} {"train_loss": -6.205695152282715, "global_step": 94446, "epoch": 2248} {"train_loss": -6.329108715057373, "global_step": 94447, "epoch": 2248} {"train_loss": -6.388790607452393, "global_step": 94448, "epoch": 2248} {"train_loss": -6.200368404388428, "global_step": 94449, "epoch": 2248} {"train_loss": -6.323175430297852, "global_step": 94450, "epoch": 2248} {"train_loss": -6.2506818771362305, "global_step": 94451, "epoch": 2248} {"train_loss": -6.286581039428711, "global_step": 94452, "epoch": 2248} {"train_loss": -6.2829084396362305, "global_step": 94453, "epoch": 2248} {"train_loss": -6.07084846496582, "global_step": 94454, "epoch": 2248} {"train_loss": -6.131925582885742, "global_step": 94455, "epoch": 2248} {"train_loss": -6.14748477935791, "global_step": 94456, "epoch": 2248} {"train_loss": -6.298444918223789, "global_step": 94457, "epoch": 2248, "val_loss": 63669.61328125} {"train_loss": -6.286621570587158, "global_step": 94458, "epoch": 2249} {"train_loss": -6.275577068328857, "global_step": 94459, "epoch": 2249} {"train_loss": -6.237329483032227, "global_step": 94460, "epoch": 2249} {"train_loss": -6.156060218811035, "global_step": 94461, "epoch": 2249} {"train_loss": -6.290131092071533, "global_step": 94462, "epoch": 2249} {"train_loss": -6.2790985107421875, "global_step": 94463, "epoch": 2249} {"train_loss": -6.341196060180664, "global_step": 94464, "epoch": 2249} {"train_loss": -6.229036331176758, "global_step": 94465, "epoch": 2249} {"train_loss": -6.286067485809326, "global_step": 94466, "epoch": 2249} {"train_loss": -6.40592622756958, "global_step": 94467, "epoch": 2249} {"train_loss": -6.361597061157227, "global_step": 94468, "epoch": 2249} {"train_loss": -6.436983108520508, "global_step": 94469, "epoch": 2249} {"train_loss": -6.432894706726074, "global_step": 94470, "epoch": 2249} {"train_loss": -6.304930686950684, "global_step": 94471, "epoch": 2249} {"train_loss": -6.28658390045166, "global_step": 94472, "epoch": 2249} {"train_loss": -6.270374298095703, "global_step": 94473, "epoch": 2249} {"train_loss": -6.258517265319824, "global_step": 94474, "epoch": 2249} {"train_loss": -6.3465576171875, "global_step": 94475, "epoch": 2249} {"train_loss": -6.374611854553223, "global_step": 94476, "epoch": 2249} {"train_loss": -6.327930450439453, "global_step": 94477, "epoch": 2249} {"train_loss": -6.284120559692383, "global_step": 94478, "epoch": 2249} {"train_loss": -6.342645645141602, "global_step": 94479, "epoch": 2249} {"train_loss": -6.280702590942383, "global_step": 94480, "epoch": 2249} {"train_loss": -6.308154106140137, "global_step": 94481, "epoch": 2249} {"train_loss": -6.34096622467041, "global_step": 94482, "epoch": 2249} {"train_loss": -6.306882858276367, "global_step": 94483, "epoch": 2249} {"train_loss": -6.324612617492676, "global_step": 94484, "epoch": 2249} {"train_loss": -6.323314666748047, "global_step": 94485, "epoch": 2249} {"train_loss": -6.41123104095459, "global_step": 94486, "epoch": 2249} {"train_loss": -6.256353378295898, "global_step": 94487, "epoch": 2249} {"train_loss": -6.368988513946533, "global_step": 94488, "epoch": 2249} {"train_loss": -6.418880462646484, "global_step": 94489, "epoch": 2249} {"train_loss": -6.485692977905273, "global_step": 94490, "epoch": 2249} {"train_loss": -6.3318634033203125, "global_step": 94491, "epoch": 2249} {"train_loss": -6.361015796661377, "global_step": 94492, "epoch": 2249} {"train_loss": -6.2973175048828125, "global_step": 94493, "epoch": 2249} {"train_loss": -6.31121826171875, "global_step": 94494, "epoch": 2249} {"train_loss": -6.2380218505859375, "global_step": 94495, "epoch": 2249} {"train_loss": -6.286034107208252, "global_step": 94496, "epoch": 2249} {"train_loss": -6.293304920196533, "global_step": 94497, "epoch": 2249} {"train_loss": -6.100133419036865, "global_step": 94498, "epoch": 2249} {"train_loss": -6.312053203582764, "global_step": 94499, "epoch": 2249, "val_loss": 63484.296875} {"train_loss": -6.350805282592773, "global_step": 94500, "epoch": 2250} {"train_loss": -6.355540752410889, "global_step": 94501, "epoch": 2250} {"train_loss": -6.271965980529785, "global_step": 94502, "epoch": 2250} {"train_loss": -6.299380302429199, "global_step": 94503, "epoch": 2250} {"train_loss": -6.32391881942749, "global_step": 94504, "epoch": 2250} {"train_loss": -6.2455596923828125, "global_step": 94505, "epoch": 2250} {"train_loss": -6.335654258728027, "global_step": 94506, "epoch": 2250} {"train_loss": -6.274245738983154, "global_step": 94507, "epoch": 2250} {"train_loss": -6.226090908050537, "global_step": 94508, "epoch": 2250} {"train_loss": -6.255173683166504, "global_step": 94509, "epoch": 2250} {"train_loss": -6.207420349121094, "global_step": 94510, "epoch": 2250} {"train_loss": -6.392274856567383, "global_step": 94511, "epoch": 2250} {"train_loss": -6.362260818481445, "global_step": 94512, "epoch": 2250} {"train_loss": -6.282793998718262, "global_step": 94513, "epoch": 2250} {"train_loss": -6.444665908813477, "global_step": 94514, "epoch": 2250} {"train_loss": -6.391282558441162, "global_step": 94515, "epoch": 2250} {"train_loss": -6.399677276611328, "global_step": 94516, "epoch": 2250} {"train_loss": -6.385429382324219, "global_step": 94517, "epoch": 2250} {"train_loss": -6.3674092292785645, "global_step": 94518, "epoch": 2250} {"train_loss": -6.388026237487793, "global_step": 94519, "epoch": 2250} {"train_loss": -6.326135635375977, "global_step": 94520, "epoch": 2250} {"train_loss": -6.233973979949951, "global_step": 94521, "epoch": 2250} {"train_loss": -6.336859226226807, "global_step": 94522, "epoch": 2250} {"train_loss": -6.38019323348999, "global_step": 94523, "epoch": 2250} {"train_loss": -6.392116069793701, "global_step": 94524, "epoch": 2250} {"train_loss": -6.423252105712891, "global_step": 94525, "epoch": 2250} {"train_loss": -6.43374490737915, "global_step": 94526, "epoch": 2250} {"train_loss": -6.286099433898926, "global_step": 94527, "epoch": 2250} {"train_loss": -6.342957496643066, "global_step": 94528, "epoch": 2250} {"train_loss": -6.241748809814453, "global_step": 94529, "epoch": 2250} {"train_loss": -6.341562747955322, "global_step": 94530, "epoch": 2250} {"train_loss": -6.260720252990723, "global_step": 94531, "epoch": 2250} {"train_loss": -6.298693656921387, "global_step": 94532, "epoch": 2250} {"train_loss": -6.27918815612793, "global_step": 94533, "epoch": 2250} {"train_loss": -6.288779258728027, "global_step": 94534, "epoch": 2250} {"train_loss": -6.361582279205322, "global_step": 94535, "epoch": 2250} {"train_loss": -6.2492475509643555, "global_step": 94536, "epoch": 2250} {"train_loss": -6.366292953491211, "global_step": 94537, "epoch": 2250} {"train_loss": -6.292659759521484, "global_step": 94538, "epoch": 2250} {"train_loss": -6.177033424377441, "global_step": 94539, "epoch": 2250} {"train_loss": -6.274881362915039, "global_step": 94540, "epoch": 2250} {"train_loss": -6.316660949162075, "global_step": 94541, "epoch": 2250, "train/sim_max_reward_0": 0.22875401829971423, "train/sim_max_reward_1": 0.8266322232763185, "train/sim_max_reward_2": 0.5910700676922536, "train/sim_max_reward_3": 0.9879519292607563, "train/sim_max_reward_4": 0.7122561350716042, "train/sim_max_reward_5": 0.9868436475979916, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5589876925272299, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.8310355040670976, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.460815135627413, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.8136095243747287, "test/sim_max_reward_4300008": 0.9051420892880834, "test/sim_max_reward_4300009": 0.9790774871339725, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.2917274646330866, "test/sim_max_reward_4300012": 0.7612134376655982, "test/sim_max_reward_4300013": 0.3087005263470075, "test/sim_max_reward_4300014": 0.9625462641945561, "test/sim_max_reward_4300015": 0.9756492459985342, "test/sim_max_reward_4300016": 0.9103162944176785, "test/sim_max_reward_4300017": 0.8461371342592583, "test/sim_max_reward_4300018": 0.4662291554835666, "test/sim_max_reward_4300019": 0.18485269589615302, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9559264881266962, "test/sim_max_reward_4300022": 0.8713274283070961, "test/sim_max_reward_4300023": 0.3368870598510916, "test/sim_max_reward_4300024": 0.9367180149749176, "test/sim_max_reward_4300025": 0.9388080916140356, "test/sim_max_reward_4300026": 0.8544580056829286, "test/sim_max_reward_4300027": 0.8555830504703099, "test/sim_max_reward_4300028": 0.9495286335611889, "test/sim_max_reward_4300029": 0.97936855137637, "test/sim_max_reward_4300030": 0.7263814218727496, "test/sim_max_reward_4300031": 0.190319631426957, "test/sim_max_reward_4300032": 0.9340442494130055, "test/sim_max_reward_4300033": 0.521728272362302, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.5886646414344059, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8729479695394651, "test/sim_max_reward_4300038": 0.4471958087642955, "test/sim_max_reward_4300039": 0.9061543256327252, "test/sim_max_reward_4300040": 0.34544491004799577, "test/sim_max_reward_4300041": 0.22048617413324836, "test/sim_max_reward_4300042": 0.5564069248835336, "test/sim_max_reward_4300043": 0.1340049938624912, "test/sim_max_reward_4300044": 0.6214164601352201, "test/sim_max_reward_4300045": 0.671816615965786, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.9680389677887423, "test/sim_max_reward_4300048": 0.7688104845105983, "test/sim_max_reward_4300049": 0.2934448153333973, "train/mean_score": 0.7222513368664396, "test/mean_score": 0.5983395972671657, "val_loss": 63607.2109375} {"train_loss": -6.271475315093994, "global_step": 94542, "epoch": 2251} {"train_loss": -6.272438049316406, "global_step": 94543, "epoch": 2251} {"train_loss": -6.171255588531494, "global_step": 94544, "epoch": 2251} {"train_loss": -6.307796955108643, "global_step": 94545, "epoch": 2251} {"train_loss": -6.269353866577148, "global_step": 94546, "epoch": 2251} {"train_loss": -6.243466854095459, "global_step": 94547, "epoch": 2251} {"train_loss": -6.481619834899902, "global_step": 94548, "epoch": 2251} {"train_loss": -6.3137922286987305, "global_step": 94549, "epoch": 2251} {"train_loss": -6.251406669616699, "global_step": 94550, "epoch": 2251} {"train_loss": -6.308950424194336, "global_step": 94551, "epoch": 2251} {"train_loss": -6.3890228271484375, "global_step": 94552, "epoch": 2251} {"train_loss": -6.208125591278076, "global_step": 94553, "epoch": 2251} {"train_loss": -6.390519142150879, "global_step": 94554, "epoch": 2251} {"train_loss": -6.301458835601807, "global_step": 94555, "epoch": 2251} {"train_loss": -6.273488998413086, "global_step": 94556, "epoch": 2251} {"train_loss": -6.405948162078857, "global_step": 94557, "epoch": 2251} {"train_loss": -6.416628837585449, "global_step": 94558, "epoch": 2251} {"train_loss": -6.354508399963379, "global_step": 94559, "epoch": 2251} {"train_loss": -6.278617858886719, "global_step": 94560, "epoch": 2251} {"train_loss": -6.3141937255859375, "global_step": 94561, "epoch": 2251} {"train_loss": -6.381899833679199, "global_step": 94562, "epoch": 2251} {"train_loss": -6.278463363647461, "global_step": 94563, "epoch": 2251} {"train_loss": -6.276928901672363, "global_step": 94564, "epoch": 2251} {"train_loss": -6.230144500732422, "global_step": 94565, "epoch": 2251} {"train_loss": -6.314193248748779, "global_step": 94566, "epoch": 2251} {"train_loss": -6.112612724304199, "global_step": 94567, "epoch": 2251} {"train_loss": -6.310663223266602, "global_step": 94568, "epoch": 2251} {"train_loss": -6.291513442993164, "global_step": 94569, "epoch": 2251} {"train_loss": -6.147466659545898, "global_step": 94570, "epoch": 2251} {"train_loss": -6.339771270751953, "global_step": 94571, "epoch": 2251} {"train_loss": -6.375383377075195, "global_step": 94572, "epoch": 2251} {"train_loss": -6.273501396179199, "global_step": 94573, "epoch": 2251} {"train_loss": -6.263934135437012, "global_step": 94574, "epoch": 2251} {"train_loss": -6.282444000244141, "global_step": 94575, "epoch": 2251} {"train_loss": -6.27918815612793, "global_step": 94576, "epoch": 2251} {"train_loss": -6.342004776000977, "global_step": 94577, "epoch": 2251} {"train_loss": -6.208425045013428, "global_step": 94578, "epoch": 2251} {"train_loss": -6.367629528045654, "global_step": 94579, "epoch": 2251} {"train_loss": -6.277861595153809, "global_step": 94580, "epoch": 2251} {"train_loss": -6.348280429840088, "global_step": 94581, "epoch": 2251} {"train_loss": -6.285587310791016, "global_step": 94582, "epoch": 2251} {"train_loss": -6.29845792906625, "global_step": 94583, "epoch": 2251, "val_loss": 63589.55078125} {"train_loss": -6.345258712768555, "global_step": 94584, "epoch": 2252} {"train_loss": -6.357526779174805, "global_step": 94585, "epoch": 2252} {"train_loss": -6.393517017364502, "global_step": 94586, "epoch": 2252} {"train_loss": -6.3546881675720215, "global_step": 94587, "epoch": 2252} {"train_loss": -6.366337299346924, "global_step": 94588, "epoch": 2252} {"train_loss": -6.375049591064453, "global_step": 94589, "epoch": 2252} {"train_loss": -6.3941850662231445, "global_step": 94590, "epoch": 2252} {"train_loss": -6.264043807983398, "global_step": 94591, "epoch": 2252} {"train_loss": -6.3981828689575195, "global_step": 94592, "epoch": 2252} {"train_loss": -6.320446014404297, "global_step": 94593, "epoch": 2252} {"train_loss": -6.3658270835876465, "global_step": 94594, "epoch": 2252} {"train_loss": -6.4777750968933105, "global_step": 94595, "epoch": 2252} {"train_loss": -6.391731262207031, "global_step": 94596, "epoch": 2252} {"train_loss": -6.31837272644043, "global_step": 94597, "epoch": 2252} {"train_loss": -6.3198699951171875, "global_step": 94598, "epoch": 2252} {"train_loss": -6.3835601806640625, "global_step": 94599, "epoch": 2252} {"train_loss": -6.174448013305664, "global_step": 94600, "epoch": 2252} {"train_loss": -6.363001823425293, "global_step": 94601, "epoch": 2252} {"train_loss": -6.333034515380859, "global_step": 94602, "epoch": 2252} {"train_loss": -6.277729034423828, "global_step": 94603, "epoch": 2252} {"train_loss": -6.34794807434082, "global_step": 94604, "epoch": 2252} {"train_loss": -6.428288459777832, "global_step": 94605, "epoch": 2252} {"train_loss": -6.316930294036865, "global_step": 94606, "epoch": 2252} {"train_loss": -6.311727523803711, "global_step": 94607, "epoch": 2252} {"train_loss": -6.3081278800964355, "global_step": 94608, "epoch": 2252} {"train_loss": -6.345270156860352, "global_step": 94609, "epoch": 2252} {"train_loss": -6.3230204582214355, "global_step": 94610, "epoch": 2252} {"train_loss": -6.281519889831543, "global_step": 94611, "epoch": 2252} {"train_loss": -6.26784610748291, "global_step": 94612, "epoch": 2252} {"train_loss": -6.16713809967041, "global_step": 94613, "epoch": 2252} {"train_loss": -6.380438804626465, "global_step": 94614, "epoch": 2252} {"train_loss": -6.196619033813477, "global_step": 94615, "epoch": 2252} {"train_loss": -6.243261337280273, "global_step": 94616, "epoch": 2252} {"train_loss": -6.297630310058594, "global_step": 94617, "epoch": 2252} {"train_loss": -6.235987186431885, "global_step": 94618, "epoch": 2252} {"train_loss": -6.378307342529297, "global_step": 94619, "epoch": 2252} {"train_loss": -6.266315460205078, "global_step": 94620, "epoch": 2252} {"train_loss": -6.307748317718506, "global_step": 94621, "epoch": 2252} {"train_loss": -6.386050701141357, "global_step": 94622, "epoch": 2252} {"train_loss": -6.309122085571289, "global_step": 94623, "epoch": 2252} {"train_loss": -6.166304588317871, "global_step": 94624, "epoch": 2252} {"train_loss": -6.3208710466112406, "global_step": 94625, "epoch": 2252, "val_loss": 63512.8671875} {"train_loss": -6.412684440612793, "global_step": 94626, "epoch": 2253} {"train_loss": -6.322627067565918, "global_step": 94627, "epoch": 2253} {"train_loss": -6.311066627502441, "global_step": 94628, "epoch": 2253} {"train_loss": -6.173583984375, "global_step": 94629, "epoch": 2253} {"train_loss": -6.2765607833862305, "global_step": 94630, "epoch": 2253} {"train_loss": -6.330389022827148, "global_step": 94631, "epoch": 2253} {"train_loss": -6.2565460205078125, "global_step": 94632, "epoch": 2253} {"train_loss": -6.268987655639648, "global_step": 94633, "epoch": 2253} {"train_loss": -6.167520999908447, "global_step": 94634, "epoch": 2253} {"train_loss": -6.260644912719727, "global_step": 94635, "epoch": 2253} {"train_loss": -6.181880950927734, "global_step": 94636, "epoch": 2253} {"train_loss": -6.39298152923584, "global_step": 94637, "epoch": 2253} {"train_loss": -6.270806312561035, "global_step": 94638, "epoch": 2253} {"train_loss": -6.150995254516602, "global_step": 94639, "epoch": 2253} {"train_loss": -6.308635711669922, "global_step": 94640, "epoch": 2253} {"train_loss": -6.254167556762695, "global_step": 94641, "epoch": 2253} {"train_loss": -6.2312822341918945, "global_step": 94642, "epoch": 2253} {"train_loss": -6.375437259674072, "global_step": 94643, "epoch": 2253} {"train_loss": -6.264405250549316, "global_step": 94644, "epoch": 2253} {"train_loss": -6.241521835327148, "global_step": 94645, "epoch": 2253} {"train_loss": -6.270569801330566, "global_step": 94646, "epoch": 2253} {"train_loss": -6.071768760681152, "global_step": 94647, "epoch": 2253} {"train_loss": -6.253129005432129, "global_step": 94648, "epoch": 2253} {"train_loss": -6.2025041580200195, "global_step": 94649, "epoch": 2253} {"train_loss": -6.327093601226807, "global_step": 94650, "epoch": 2253} {"train_loss": -6.168109893798828, "global_step": 94651, "epoch": 2253} {"train_loss": -6.146503448486328, "global_step": 94652, "epoch": 2253} {"train_loss": -6.383426666259766, "global_step": 94653, "epoch": 2253} {"train_loss": -6.153998374938965, "global_step": 94654, "epoch": 2253} {"train_loss": -6.397439956665039, "global_step": 94655, "epoch": 2253} {"train_loss": -6.13336181640625, "global_step": 94656, "epoch": 2253} {"train_loss": -6.2597455978393555, "global_step": 94657, "epoch": 2253} {"train_loss": -6.1798319816589355, "global_step": 94658, "epoch": 2253} {"train_loss": -6.2762908935546875, "global_step": 94659, "epoch": 2253} {"train_loss": -6.390554428100586, "global_step": 94660, "epoch": 2253} {"train_loss": -6.177181243896484, "global_step": 94661, "epoch": 2253} {"train_loss": -6.2889909744262695, "global_step": 94662, "epoch": 2253} {"train_loss": -6.256203651428223, "global_step": 94663, "epoch": 2253} {"train_loss": -6.343172073364258, "global_step": 94664, "epoch": 2253} {"train_loss": -6.3307881355285645, "global_step": 94665, "epoch": 2253} {"train_loss": -6.296426296234131, "global_step": 94666, "epoch": 2253} {"train_loss": -6.264940409433274, "global_step": 94667, "epoch": 2253, "val_loss": 63571.66015625} {"train_loss": -6.38064432144165, "global_step": 94668, "epoch": 2254} {"train_loss": -6.223083972930908, "global_step": 94669, "epoch": 2254} {"train_loss": -6.3181681632995605, "global_step": 94670, "epoch": 2254} {"train_loss": -6.352794647216797, "global_step": 94671, "epoch": 2254} {"train_loss": -6.247196197509766, "global_step": 94672, "epoch": 2254} {"train_loss": -6.29782772064209, "global_step": 94673, "epoch": 2254} {"train_loss": -6.287147521972656, "global_step": 94674, "epoch": 2254} {"train_loss": -6.322118759155273, "global_step": 94675, "epoch": 2254} {"train_loss": -6.38649845123291, "global_step": 94676, "epoch": 2254} {"train_loss": -6.256527900695801, "global_step": 94677, "epoch": 2254} {"train_loss": -6.243293762207031, "global_step": 94678, "epoch": 2254} {"train_loss": -6.248541355133057, "global_step": 94679, "epoch": 2254} {"train_loss": -6.333616256713867, "global_step": 94680, "epoch": 2254} {"train_loss": -6.34630012512207, "global_step": 94681, "epoch": 2254} {"train_loss": -6.224522590637207, "global_step": 94682, "epoch": 2254} {"train_loss": -6.355714321136475, "global_step": 94683, "epoch": 2254} {"train_loss": -6.440109729766846, "global_step": 94684, "epoch": 2254} {"train_loss": -6.436339378356934, "global_step": 94685, "epoch": 2254} {"train_loss": -6.357479095458984, "global_step": 94686, "epoch": 2254} {"train_loss": -6.362799644470215, "global_step": 94687, "epoch": 2254} {"train_loss": -6.348775863647461, "global_step": 94688, "epoch": 2254} {"train_loss": -6.318150520324707, "global_step": 94689, "epoch": 2254} {"train_loss": -6.327393531799316, "global_step": 94690, "epoch": 2254} {"train_loss": -6.307961463928223, "global_step": 94691, "epoch": 2254} {"train_loss": -6.329900741577148, "global_step": 94692, "epoch": 2254} {"train_loss": -6.377815246582031, "global_step": 94693, "epoch": 2254} {"train_loss": -6.39845609664917, "global_step": 94694, "epoch": 2254} {"train_loss": -6.358625888824463, "global_step": 94695, "epoch": 2254} {"train_loss": -6.46750545501709, "global_step": 94696, "epoch": 2254} {"train_loss": -6.335451602935791, "global_step": 94697, "epoch": 2254} {"train_loss": -6.301970481872559, "global_step": 94698, "epoch": 2254} {"train_loss": -6.415474891662598, "global_step": 94699, "epoch": 2254} {"train_loss": -6.349479675292969, "global_step": 94700, "epoch": 2254} {"train_loss": -6.401411056518555, "global_step": 94701, "epoch": 2254} {"train_loss": -6.358410835266113, "global_step": 94702, "epoch": 2254} {"train_loss": -6.402011871337891, "global_step": 94703, "epoch": 2254} {"train_loss": -6.321000099182129, "global_step": 94704, "epoch": 2254} {"train_loss": -6.37461519241333, "global_step": 94705, "epoch": 2254} {"train_loss": -6.2927703857421875, "global_step": 94706, "epoch": 2254} {"train_loss": -6.334659576416016, "global_step": 94707, "epoch": 2254} {"train_loss": -6.3660502433776855, "global_step": 94708, "epoch": 2254} {"train_loss": -6.338162717365083, "global_step": 94709, "epoch": 2254, "val_loss": 63591.01953125} {"train_loss": -6.308477878570557, "global_step": 94710, "epoch": 2255} {"train_loss": -6.310702323913574, "global_step": 94711, "epoch": 2255} {"train_loss": -6.419855117797852, "global_step": 94712, "epoch": 2255} {"train_loss": -6.416898727416992, "global_step": 94713, "epoch": 2255} {"train_loss": -6.321389198303223, "global_step": 94714, "epoch": 2255} {"train_loss": -6.387539863586426, "global_step": 94715, "epoch": 2255} {"train_loss": -6.227958679199219, "global_step": 94716, "epoch": 2255} {"train_loss": -6.356439590454102, "global_step": 94717, "epoch": 2255} {"train_loss": -6.2494215965271, "global_step": 94718, "epoch": 2255} {"train_loss": -6.234382152557373, "global_step": 94719, "epoch": 2255} {"train_loss": -6.199591636657715, "global_step": 94720, "epoch": 2255} {"train_loss": -6.296414375305176, "global_step": 94721, "epoch": 2255} {"train_loss": -6.3207244873046875, "global_step": 94722, "epoch": 2255} {"train_loss": -6.185760974884033, "global_step": 94723, "epoch": 2255} {"train_loss": -6.275042533874512, "global_step": 94724, "epoch": 2255} {"train_loss": -6.258734703063965, "global_step": 94725, "epoch": 2255} {"train_loss": -6.312270164489746, "global_step": 94726, "epoch": 2255} {"train_loss": -6.2644362449646, "global_step": 94727, "epoch": 2255} {"train_loss": -6.278446197509766, "global_step": 94728, "epoch": 2255} {"train_loss": -6.362348556518555, "global_step": 94729, "epoch": 2255} {"train_loss": -6.351767063140869, "global_step": 94730, "epoch": 2255} {"train_loss": -6.199420928955078, "global_step": 94731, "epoch": 2255} {"train_loss": -6.311347007751465, "global_step": 94732, "epoch": 2255} {"train_loss": -6.221179008483887, "global_step": 94733, "epoch": 2255} {"train_loss": -6.415044784545898, "global_step": 94734, "epoch": 2255} {"train_loss": -6.301481246948242, "global_step": 94735, "epoch": 2255} {"train_loss": -6.226839065551758, "global_step": 94736, "epoch": 2255} {"train_loss": -6.343112945556641, "global_step": 94737, "epoch": 2255} {"train_loss": -6.246303558349609, "global_step": 94738, "epoch": 2255} {"train_loss": -6.2533769607543945, "global_step": 94739, "epoch": 2255} {"train_loss": -6.419269561767578, "global_step": 94740, "epoch": 2255} {"train_loss": -6.270917892456055, "global_step": 94741, "epoch": 2255} {"train_loss": -6.3028717041015625, "global_step": 94742, "epoch": 2255} {"train_loss": -6.341529369354248, "global_step": 94743, "epoch": 2255} {"train_loss": -6.177175045013428, "global_step": 94744, "epoch": 2255} {"train_loss": -6.311083793640137, "global_step": 94745, "epoch": 2255} {"train_loss": -6.153687477111816, "global_step": 94746, "epoch": 2255} {"train_loss": -6.286789894104004, "global_step": 94747, "epoch": 2255} {"train_loss": -6.17477560043335, "global_step": 94748, "epoch": 2255} {"train_loss": -6.254364013671875, "global_step": 94749, "epoch": 2255} {"train_loss": -6.286138534545898, "global_step": 94750, "epoch": 2255} {"train_loss": -6.285738490876698, "global_step": 94751, "epoch": 2255, "val_loss": 63673.0390625} {"train_loss": -6.222770690917969, "global_step": 94752, "epoch": 2256} {"train_loss": -6.186646461486816, "global_step": 94753, "epoch": 2256} {"train_loss": -6.267271518707275, "global_step": 94754, "epoch": 2256} {"train_loss": -6.246458053588867, "global_step": 94755, "epoch": 2256} {"train_loss": -6.258295059204102, "global_step": 94756, "epoch": 2256} {"train_loss": -6.220346927642822, "global_step": 94757, "epoch": 2256} {"train_loss": -6.361507415771484, "global_step": 94758, "epoch": 2256} {"train_loss": -6.239418029785156, "global_step": 94759, "epoch": 2256} {"train_loss": -6.312692642211914, "global_step": 94760, "epoch": 2256} {"train_loss": -6.244585990905762, "global_step": 94761, "epoch": 2256} {"train_loss": -6.350653648376465, "global_step": 94762, "epoch": 2256} {"train_loss": -6.310032844543457, "global_step": 94763, "epoch": 2256} {"train_loss": -6.187743663787842, "global_step": 94764, "epoch": 2256} {"train_loss": -6.371337413787842, "global_step": 94765, "epoch": 2256} {"train_loss": -6.221327781677246, "global_step": 94766, "epoch": 2256} {"train_loss": -6.3200154304504395, "global_step": 94767, "epoch": 2256} {"train_loss": -6.32808780670166, "global_step": 94768, "epoch": 2256} {"train_loss": -6.324803829193115, "global_step": 94769, "epoch": 2256} {"train_loss": -6.3501787185668945, "global_step": 94770, "epoch": 2256} {"train_loss": -6.299161911010742, "global_step": 94771, "epoch": 2256} {"train_loss": -6.319458484649658, "global_step": 94772, "epoch": 2256} {"train_loss": -6.306108474731445, "global_step": 94773, "epoch": 2256} {"train_loss": -6.216691017150879, "global_step": 94774, "epoch": 2256} {"train_loss": -6.281303405761719, "global_step": 94775, "epoch": 2256} {"train_loss": -6.288642883300781, "global_step": 94776, "epoch": 2256} {"train_loss": -6.391018867492676, "global_step": 94777, "epoch": 2256} {"train_loss": -6.413025379180908, "global_step": 94778, "epoch": 2256} {"train_loss": -6.336096286773682, "global_step": 94779, "epoch": 2256} {"train_loss": -6.278548240661621, "global_step": 94780, "epoch": 2256} {"train_loss": -6.383127212524414, "global_step": 94781, "epoch": 2256} {"train_loss": -6.386136054992676, "global_step": 94782, "epoch": 2256} {"train_loss": -6.328984260559082, "global_step": 94783, "epoch": 2256} {"train_loss": -6.318803787231445, "global_step": 94784, "epoch": 2256} {"train_loss": -6.389547348022461, "global_step": 94785, "epoch": 2256} {"train_loss": -6.307478904724121, "global_step": 94786, "epoch": 2256} {"train_loss": -6.393413543701172, "global_step": 94787, "epoch": 2256} {"train_loss": -6.3815717697143555, "global_step": 94788, "epoch": 2256} {"train_loss": -6.286604404449463, "global_step": 94789, "epoch": 2256} {"train_loss": -6.345589637756348, "global_step": 94790, "epoch": 2256} {"train_loss": -6.282007217407227, "global_step": 94791, "epoch": 2256} {"train_loss": -6.335545539855957, "global_step": 94792, "epoch": 2256} {"train_loss": -6.308596315838042, "global_step": 94793, "epoch": 2256, "val_loss": 63552.20703125} {"train_loss": -6.301753520965576, "global_step": 94794, "epoch": 2257} {"train_loss": -6.372129917144775, "global_step": 94795, "epoch": 2257} {"train_loss": -6.332710266113281, "global_step": 94796, "epoch": 2257} {"train_loss": -6.247283935546875, "global_step": 94797, "epoch": 2257} {"train_loss": -6.330296993255615, "global_step": 94798, "epoch": 2257} {"train_loss": -6.477209091186523, "global_step": 94799, "epoch": 2257} {"train_loss": -6.277254581451416, "global_step": 94800, "epoch": 2257} {"train_loss": -6.292162895202637, "global_step": 94801, "epoch": 2257} {"train_loss": -6.308289527893066, "global_step": 94802, "epoch": 2257} {"train_loss": -6.240717887878418, "global_step": 94803, "epoch": 2257} {"train_loss": -6.287210464477539, "global_step": 94804, "epoch": 2257} {"train_loss": -6.286412715911865, "global_step": 94805, "epoch": 2257} {"train_loss": -6.354221343994141, "global_step": 94806, "epoch": 2257} {"train_loss": -6.354837417602539, "global_step": 94807, "epoch": 2257} {"train_loss": -6.205330848693848, "global_step": 94808, "epoch": 2257} {"train_loss": -6.300715923309326, "global_step": 94809, "epoch": 2257} {"train_loss": -6.319052696228027, "global_step": 94810, "epoch": 2257} {"train_loss": -6.281294822692871, "global_step": 94811, "epoch": 2257} {"train_loss": -6.398661136627197, "global_step": 94812, "epoch": 2257} {"train_loss": -6.413728713989258, "global_step": 94813, "epoch": 2257} {"train_loss": -6.424687385559082, "global_step": 94814, "epoch": 2257} {"train_loss": -6.404707431793213, "global_step": 94815, "epoch": 2257} {"train_loss": -6.379964828491211, "global_step": 94816, "epoch": 2257} {"train_loss": -6.382818222045898, "global_step": 94817, "epoch": 2257} {"train_loss": -6.361458778381348, "global_step": 94818, "epoch": 2257} {"train_loss": -6.345545768737793, "global_step": 94819, "epoch": 2257} {"train_loss": -6.351256370544434, "global_step": 94820, "epoch": 2257} {"train_loss": -6.3759942054748535, "global_step": 94821, "epoch": 2257} {"train_loss": -6.369582176208496, "global_step": 94822, "epoch": 2257} {"train_loss": -6.467852592468262, "global_step": 94823, "epoch": 2257} {"train_loss": -6.294519424438477, "global_step": 94824, "epoch": 2257} {"train_loss": -6.347540855407715, "global_step": 94825, "epoch": 2257} {"train_loss": -6.252198219299316, "global_step": 94826, "epoch": 2257} {"train_loss": -6.369998455047607, "global_step": 94827, "epoch": 2257} {"train_loss": -6.341795921325684, "global_step": 94828, "epoch": 2257} {"train_loss": -6.360622406005859, "global_step": 94829, "epoch": 2257} {"train_loss": -6.270733833312988, "global_step": 94830, "epoch": 2257} {"train_loss": -6.355118751525879, "global_step": 94831, "epoch": 2257} {"train_loss": -6.2562432289123535, "global_step": 94832, "epoch": 2257} {"train_loss": -6.350952625274658, "global_step": 94833, "epoch": 2257} {"train_loss": -6.357816696166992, "global_step": 94834, "epoch": 2257} {"train_loss": -6.334747359866188, "global_step": 94835, "epoch": 2257, "val_loss": 63655.6171875} {"train_loss": -6.3381853103637695, "global_step": 94836, "epoch": 2258} {"train_loss": -6.485894203186035, "global_step": 94837, "epoch": 2258} {"train_loss": -6.298338413238525, "global_step": 94838, "epoch": 2258} {"train_loss": -6.428416728973389, "global_step": 94839, "epoch": 2258} {"train_loss": -6.315036773681641, "global_step": 94840, "epoch": 2258} {"train_loss": -6.389785289764404, "global_step": 94841, "epoch": 2258} {"train_loss": -6.230887413024902, "global_step": 94842, "epoch": 2258} {"train_loss": -6.287770748138428, "global_step": 94843, "epoch": 2258} {"train_loss": -6.266059875488281, "global_step": 94844, "epoch": 2258} {"train_loss": -6.2245683670043945, "global_step": 94845, "epoch": 2258} {"train_loss": -6.430971145629883, "global_step": 94846, "epoch": 2258} {"train_loss": -6.31337833404541, "global_step": 94847, "epoch": 2258} {"train_loss": -6.320054054260254, "global_step": 94848, "epoch": 2258} {"train_loss": -6.329067230224609, "global_step": 94849, "epoch": 2258} {"train_loss": -6.313199043273926, "global_step": 94850, "epoch": 2258} {"train_loss": -6.264711380004883, "global_step": 94851, "epoch": 2258} {"train_loss": -6.243160247802734, "global_step": 94852, "epoch": 2258} {"train_loss": -6.214072227478027, "global_step": 94853, "epoch": 2258} {"train_loss": -6.272640228271484, "global_step": 94854, "epoch": 2258} {"train_loss": -6.396149158477783, "global_step": 94855, "epoch": 2258} {"train_loss": -6.325652599334717, "global_step": 94856, "epoch": 2258} {"train_loss": -6.335994720458984, "global_step": 94857, "epoch": 2258} {"train_loss": -6.245577812194824, "global_step": 94858, "epoch": 2258} {"train_loss": -6.419378757476807, "global_step": 94859, "epoch": 2258} {"train_loss": -6.362789630889893, "global_step": 94860, "epoch": 2258} {"train_loss": -6.288334369659424, "global_step": 94861, "epoch": 2258} {"train_loss": -6.244097709655762, "global_step": 94862, "epoch": 2258} {"train_loss": -6.118133068084717, "global_step": 94863, "epoch": 2258} {"train_loss": -6.299107074737549, "global_step": 94864, "epoch": 2258} {"train_loss": -6.25068473815918, "global_step": 94865, "epoch": 2258} {"train_loss": -6.286018371582031, "global_step": 94866, "epoch": 2258} {"train_loss": -6.232911109924316, "global_step": 94867, "epoch": 2258} {"train_loss": -6.192934036254883, "global_step": 94868, "epoch": 2258} {"train_loss": -6.350244045257568, "global_step": 94869, "epoch": 2258} {"train_loss": -6.224004745483398, "global_step": 94870, "epoch": 2258} {"train_loss": -6.371604919433594, "global_step": 94871, "epoch": 2258} {"train_loss": -6.237061500549316, "global_step": 94872, "epoch": 2258} {"train_loss": -6.211982727050781, "global_step": 94873, "epoch": 2258} {"train_loss": -6.287978172302246, "global_step": 94874, "epoch": 2258} {"train_loss": -6.254500389099121, "global_step": 94875, "epoch": 2258} {"train_loss": -6.352845191955566, "global_step": 94876, "epoch": 2258} {"train_loss": -6.296858004161289, "global_step": 94877, "epoch": 2258, "val_loss": 63394.64453125} {"train_loss": -6.211712837219238, "global_step": 94878, "epoch": 2259} {"train_loss": -6.1418914794921875, "global_step": 94879, "epoch": 2259} {"train_loss": -6.305155277252197, "global_step": 94880, "epoch": 2259} {"train_loss": -6.202859878540039, "global_step": 94881, "epoch": 2259} {"train_loss": -6.3357319831848145, "global_step": 94882, "epoch": 2259} {"train_loss": -6.2608842849731445, "global_step": 94883, "epoch": 2259} {"train_loss": -6.3727216720581055, "global_step": 94884, "epoch": 2259} {"train_loss": -6.271766662597656, "global_step": 94885, "epoch": 2259} {"train_loss": -6.144343376159668, "global_step": 94886, "epoch": 2259} {"train_loss": -6.33128547668457, "global_step": 94887, "epoch": 2259} {"train_loss": -6.167360782623291, "global_step": 94888, "epoch": 2259} {"train_loss": -6.135431289672852, "global_step": 94889, "epoch": 2259} {"train_loss": -6.240220069885254, "global_step": 94890, "epoch": 2259} {"train_loss": -5.987966537475586, "global_step": 94891, "epoch": 2259} {"train_loss": -6.180330276489258, "global_step": 94892, "epoch": 2259} {"train_loss": -6.336297035217285, "global_step": 94893, "epoch": 2259} {"train_loss": -6.238640308380127, "global_step": 94894, "epoch": 2259} {"train_loss": -6.2184529304504395, "global_step": 94895, "epoch": 2259} {"train_loss": -6.201077461242676, "global_step": 94896, "epoch": 2259} {"train_loss": -6.354535102844238, "global_step": 94897, "epoch": 2259} {"train_loss": -6.177789211273193, "global_step": 94898, "epoch": 2259} {"train_loss": -6.263096809387207, "global_step": 94899, "epoch": 2259} {"train_loss": -6.215254306793213, "global_step": 94900, "epoch": 2259} {"train_loss": -6.29679012298584, "global_step": 94901, "epoch": 2259} {"train_loss": -6.288408279418945, "global_step": 94902, "epoch": 2259} {"train_loss": -6.274473190307617, "global_step": 94903, "epoch": 2259} {"train_loss": -6.216004848480225, "global_step": 94904, "epoch": 2259} {"train_loss": -6.331568241119385, "global_step": 94905, "epoch": 2259} {"train_loss": -6.2173051834106445, "global_step": 94906, "epoch": 2259} {"train_loss": -6.317018508911133, "global_step": 94907, "epoch": 2259} {"train_loss": -6.194350719451904, "global_step": 94908, "epoch": 2259} {"train_loss": -6.282978057861328, "global_step": 94909, "epoch": 2259} {"train_loss": -6.423811912536621, "global_step": 94910, "epoch": 2259} {"train_loss": -6.339323997497559, "global_step": 94911, "epoch": 2259} {"train_loss": -6.3383870124816895, "global_step": 94912, "epoch": 2259} {"train_loss": -6.3040666580200195, "global_step": 94913, "epoch": 2259} {"train_loss": -6.406038284301758, "global_step": 94914, "epoch": 2259} {"train_loss": -6.369041442871094, "global_step": 94915, "epoch": 2259} {"train_loss": -6.383779525756836, "global_step": 94916, "epoch": 2259} {"train_loss": -6.324339866638184, "global_step": 94917, "epoch": 2259} {"train_loss": -6.341960430145264, "global_step": 94918, "epoch": 2259} {"train_loss": -6.271013657251994, "global_step": 94919, "epoch": 2259, "val_loss": 63535.6796875} {"train_loss": -6.331876754760742, "global_step": 94920, "epoch": 2260} {"train_loss": -6.3466033935546875, "global_step": 94921, "epoch": 2260} {"train_loss": -6.408599853515625, "global_step": 94922, "epoch": 2260} {"train_loss": -6.3315229415893555, "global_step": 94923, "epoch": 2260} {"train_loss": -6.26164436340332, "global_step": 94924, "epoch": 2260} {"train_loss": -6.319799423217773, "global_step": 94925, "epoch": 2260} {"train_loss": -6.259947776794434, "global_step": 94926, "epoch": 2260} {"train_loss": -6.406328201293945, "global_step": 94927, "epoch": 2260} {"train_loss": -6.381813049316406, "global_step": 94928, "epoch": 2260} {"train_loss": -6.237057685852051, "global_step": 94929, "epoch": 2260} {"train_loss": -6.277951717376709, "global_step": 94930, "epoch": 2260} {"train_loss": -6.370476722717285, "global_step": 94931, "epoch": 2260} {"train_loss": -6.253852367401123, "global_step": 94932, "epoch": 2260} {"train_loss": -6.265942573547363, "global_step": 94933, "epoch": 2260} {"train_loss": -6.351552963256836, "global_step": 94934, "epoch": 2260} {"train_loss": -6.171143054962158, "global_step": 94935, "epoch": 2260} {"train_loss": -6.284267425537109, "global_step": 94936, "epoch": 2260} {"train_loss": -6.229833602905273, "global_step": 94937, "epoch": 2260} {"train_loss": -6.134969711303711, "global_step": 94938, "epoch": 2260} {"train_loss": -6.396658897399902, "global_step": 94939, "epoch": 2260} {"train_loss": -6.2649078369140625, "global_step": 94940, "epoch": 2260} {"train_loss": -6.315577507019043, "global_step": 94941, "epoch": 2260} {"train_loss": -6.331095218658447, "global_step": 94942, "epoch": 2260} {"train_loss": -6.215455055236816, "global_step": 94943, "epoch": 2260} {"train_loss": -6.268002033233643, "global_step": 94944, "epoch": 2260} {"train_loss": -6.343837738037109, "global_step": 94945, "epoch": 2260} {"train_loss": -6.264331817626953, "global_step": 94946, "epoch": 2260} {"train_loss": -6.36983585357666, "global_step": 94947, "epoch": 2260} {"train_loss": -6.273141860961914, "global_step": 94948, "epoch": 2260} {"train_loss": -6.284555435180664, "global_step": 94949, "epoch": 2260} {"train_loss": -6.309194564819336, "global_step": 94950, "epoch": 2260} {"train_loss": -6.311897277832031, "global_step": 94951, "epoch": 2260} {"train_loss": -6.348044395446777, "global_step": 94952, "epoch": 2260} {"train_loss": -6.379034519195557, "global_step": 94953, "epoch": 2260} {"train_loss": -6.427910327911377, "global_step": 94954, "epoch": 2260} {"train_loss": -6.257850170135498, "global_step": 94955, "epoch": 2260} {"train_loss": -6.346138000488281, "global_step": 94956, "epoch": 2260} {"train_loss": -6.349021911621094, "global_step": 94957, "epoch": 2260} {"train_loss": -6.374266624450684, "global_step": 94958, "epoch": 2260} {"train_loss": -6.322465896606445, "global_step": 94959, "epoch": 2260} {"train_loss": -6.3571624755859375, "global_step": 94960, "epoch": 2260} {"train_loss": -6.310687371662685, "global_step": 94961, "epoch": 2260, "val_loss": 63854.75390625} {"train_loss": -6.315759181976318, "global_step": 94962, "epoch": 2261} {"train_loss": -6.2767486572265625, "global_step": 94963, "epoch": 2261} {"train_loss": -6.484540939331055, "global_step": 94964, "epoch": 2261} {"train_loss": -6.300822734832764, "global_step": 94965, "epoch": 2261} {"train_loss": -6.288931846618652, "global_step": 94966, "epoch": 2261} {"train_loss": -6.327909469604492, "global_step": 94967, "epoch": 2261} {"train_loss": -6.362210273742676, "global_step": 94968, "epoch": 2261} {"train_loss": -6.2776384353637695, "global_step": 94969, "epoch": 2261} {"train_loss": -6.185336589813232, "global_step": 94970, "epoch": 2261} {"train_loss": -6.273573398590088, "global_step": 94971, "epoch": 2261} {"train_loss": -6.244023323059082, "global_step": 94972, "epoch": 2261} {"train_loss": -6.371323585510254, "global_step": 94973, "epoch": 2261} {"train_loss": -6.11874532699585, "global_step": 94974, "epoch": 2261} {"train_loss": -6.24684476852417, "global_step": 94975, "epoch": 2261} {"train_loss": -6.176751613616943, "global_step": 94976, "epoch": 2261} {"train_loss": -6.288646697998047, "global_step": 94977, "epoch": 2261} {"train_loss": -6.264078140258789, "global_step": 94978, "epoch": 2261} {"train_loss": -6.3179850578308105, "global_step": 94979, "epoch": 2261} {"train_loss": -6.414437294006348, "global_step": 94980, "epoch": 2261} {"train_loss": -6.253604412078857, "global_step": 94981, "epoch": 2261} {"train_loss": -6.427804946899414, "global_step": 94982, "epoch": 2261} {"train_loss": -6.26264762878418, "global_step": 94983, "epoch": 2261} {"train_loss": -6.375482082366943, "global_step": 94984, "epoch": 2261} {"train_loss": -6.4269819259643555, "global_step": 94985, "epoch": 2261} {"train_loss": -6.23392391204834, "global_step": 94986, "epoch": 2261} {"train_loss": -6.3617377281188965, "global_step": 94987, "epoch": 2261} {"train_loss": -6.304757118225098, "global_step": 94988, "epoch": 2261} {"train_loss": -6.350367069244385, "global_step": 94989, "epoch": 2261} {"train_loss": -6.12646484375, "global_step": 94990, "epoch": 2261} {"train_loss": -6.235741138458252, "global_step": 94991, "epoch": 2261} {"train_loss": -6.3212738037109375, "global_step": 94992, "epoch": 2261} {"train_loss": -6.312991142272949, "global_step": 94993, "epoch": 2261} {"train_loss": -6.303226470947266, "global_step": 94994, "epoch": 2261} {"train_loss": -6.326956272125244, "global_step": 94995, "epoch": 2261} {"train_loss": -6.228143692016602, "global_step": 94996, "epoch": 2261} {"train_loss": -6.34425687789917, "global_step": 94997, "epoch": 2261} {"train_loss": -6.197267532348633, "global_step": 94998, "epoch": 2261} {"train_loss": -6.239039421081543, "global_step": 94999, "epoch": 2261} {"train_loss": -6.3160719871521, "global_step": 95000, "epoch": 2261} {"train_loss": -6.160486221313477, "global_step": 95001, "epoch": 2261} {"train_loss": -6.221615791320801, "global_step": 95002, "epoch": 2261} {"train_loss": -6.291502032961164, "global_step": 95003, "epoch": 2261, "val_loss": 63542.54296875} {"train_loss": -6.158858299255371, "global_step": 95004, "epoch": 2262} {"train_loss": -6.282392501831055, "global_step": 95005, "epoch": 2262} {"train_loss": -6.167063236236572, "global_step": 95006, "epoch": 2262} {"train_loss": -6.286928176879883, "global_step": 95007, "epoch": 2262} {"train_loss": -6.239025592803955, "global_step": 95008, "epoch": 2262} {"train_loss": -6.321424961090088, "global_step": 95009, "epoch": 2262} {"train_loss": -6.409250259399414, "global_step": 95010, "epoch": 2262} {"train_loss": -6.152942657470703, "global_step": 95011, "epoch": 2262} {"train_loss": -6.371173858642578, "global_step": 95012, "epoch": 2262} {"train_loss": -6.245774269104004, "global_step": 95013, "epoch": 2262} {"train_loss": -6.253627777099609, "global_step": 95014, "epoch": 2262} {"train_loss": -6.307526111602783, "global_step": 95015, "epoch": 2262} {"train_loss": -6.303091526031494, "global_step": 95016, "epoch": 2262} {"train_loss": -6.347870826721191, "global_step": 95017, "epoch": 2262} {"train_loss": -6.222358703613281, "global_step": 95018, "epoch": 2262} {"train_loss": -6.338925361633301, "global_step": 95019, "epoch": 2262} {"train_loss": -6.27977991104126, "global_step": 95020, "epoch": 2262} {"train_loss": -6.269810199737549, "global_step": 95021, "epoch": 2262} {"train_loss": -6.307720184326172, "global_step": 95022, "epoch": 2262} {"train_loss": -6.302873134613037, "global_step": 95023, "epoch": 2262} {"train_loss": -6.305379867553711, "global_step": 95024, "epoch": 2262} {"train_loss": -6.2783074378967285, "global_step": 95025, "epoch": 2262} {"train_loss": -6.269303321838379, "global_step": 95026, "epoch": 2262} {"train_loss": -6.1992292404174805, "global_step": 95027, "epoch": 2262} {"train_loss": -6.354097843170166, "global_step": 95028, "epoch": 2262} {"train_loss": -6.29293155670166, "global_step": 95029, "epoch": 2262} {"train_loss": -6.244053840637207, "global_step": 95030, "epoch": 2262} {"train_loss": -6.267704010009766, "global_step": 95031, "epoch": 2262} {"train_loss": -6.375979423522949, "global_step": 95032, "epoch": 2262} {"train_loss": -6.1878509521484375, "global_step": 95033, "epoch": 2262} {"train_loss": -6.187340259552002, "global_step": 95034, "epoch": 2262} {"train_loss": -6.295571327209473, "global_step": 95035, "epoch": 2262} {"train_loss": -6.192470073699951, "global_step": 95036, "epoch": 2262} {"train_loss": -6.299186706542969, "global_step": 95037, "epoch": 2262} {"train_loss": -6.308926582336426, "global_step": 95038, "epoch": 2262} {"train_loss": -6.278903007507324, "global_step": 95039, "epoch": 2262} {"train_loss": -6.386159896850586, "global_step": 95040, "epoch": 2262} {"train_loss": -6.292239189147949, "global_step": 95041, "epoch": 2262} {"train_loss": -6.339140892028809, "global_step": 95042, "epoch": 2262} {"train_loss": -6.290805816650391, "global_step": 95043, "epoch": 2262} {"train_loss": -6.257772922515869, "global_step": 95044, "epoch": 2262} {"train_loss": -6.28032770610991, "global_step": 95045, "epoch": 2262, "val_loss": 63497.6953125} {"train_loss": -6.336110591888428, "global_step": 95046, "epoch": 2263} {"train_loss": -6.469592571258545, "global_step": 95047, "epoch": 2263} {"train_loss": -6.137353897094727, "global_step": 95048, "epoch": 2263} {"train_loss": -6.265271186828613, "global_step": 95049, "epoch": 2263} {"train_loss": -6.30155611038208, "global_step": 95050, "epoch": 2263} {"train_loss": -6.299942493438721, "global_step": 95051, "epoch": 2263} {"train_loss": -6.305437088012695, "global_step": 95052, "epoch": 2263} {"train_loss": -6.321805000305176, "global_step": 95053, "epoch": 2263} {"train_loss": -6.257380485534668, "global_step": 95054, "epoch": 2263} {"train_loss": -6.385883808135986, "global_step": 95055, "epoch": 2263} {"train_loss": -6.279552936553955, "global_step": 95056, "epoch": 2263} {"train_loss": -6.336747169494629, "global_step": 95057, "epoch": 2263} {"train_loss": -6.374629497528076, "global_step": 95058, "epoch": 2263} {"train_loss": -6.322943210601807, "global_step": 95059, "epoch": 2263} {"train_loss": -6.237727165222168, "global_step": 95060, "epoch": 2263} {"train_loss": -6.320130348205566, "global_step": 95061, "epoch": 2263} {"train_loss": -6.311062812805176, "global_step": 95062, "epoch": 2263} {"train_loss": -6.348343849182129, "global_step": 95063, "epoch": 2263} {"train_loss": -6.315838813781738, "global_step": 95064, "epoch": 2263} {"train_loss": -6.382889747619629, "global_step": 95065, "epoch": 2263} {"train_loss": -6.208379745483398, "global_step": 95066, "epoch": 2263} {"train_loss": -6.269033432006836, "global_step": 95067, "epoch": 2263} {"train_loss": -6.271445274353027, "global_step": 95068, "epoch": 2263} {"train_loss": -6.336047649383545, "global_step": 95069, "epoch": 2263} {"train_loss": -6.27689266204834, "global_step": 95070, "epoch": 2263} {"train_loss": -6.324507713317871, "global_step": 95071, "epoch": 2263} {"train_loss": -6.349303245544434, "global_step": 95072, "epoch": 2263} {"train_loss": -6.256045341491699, "global_step": 95073, "epoch": 2263} {"train_loss": -6.347765922546387, "global_step": 95074, "epoch": 2263} {"train_loss": -6.339171409606934, "global_step": 95075, "epoch": 2263} {"train_loss": -6.410139083862305, "global_step": 95076, "epoch": 2263} {"train_loss": -6.269631385803223, "global_step": 95077, "epoch": 2263} {"train_loss": -6.334900856018066, "global_step": 95078, "epoch": 2263} {"train_loss": -6.450244903564453, "global_step": 95079, "epoch": 2263} {"train_loss": -6.343122482299805, "global_step": 95080, "epoch": 2263} {"train_loss": -6.300124645233154, "global_step": 95081, "epoch": 2263} {"train_loss": -6.381415367126465, "global_step": 95082, "epoch": 2263} {"train_loss": -6.311890602111816, "global_step": 95083, "epoch": 2263} {"train_loss": -6.388481140136719, "global_step": 95084, "epoch": 2263} {"train_loss": -6.5125908851623535, "global_step": 95085, "epoch": 2263} {"train_loss": -6.324618339538574, "global_step": 95086, "epoch": 2263} {"train_loss": -6.326833327611287, "global_step": 95087, "epoch": 2263, "val_loss": 63616.546875} {"train_loss": -6.363768577575684, "global_step": 95088, "epoch": 2264} {"train_loss": -6.296274662017822, "global_step": 95089, "epoch": 2264} {"train_loss": -6.402179718017578, "global_step": 95090, "epoch": 2264} {"train_loss": -6.427139759063721, "global_step": 95091, "epoch": 2264} {"train_loss": -6.327645778656006, "global_step": 95092, "epoch": 2264} {"train_loss": -6.427196502685547, "global_step": 95093, "epoch": 2264} {"train_loss": -6.35260009765625, "global_step": 95094, "epoch": 2264} {"train_loss": -6.136499404907227, "global_step": 95095, "epoch": 2264} {"train_loss": -6.3688225746154785, "global_step": 95096, "epoch": 2264} {"train_loss": -6.23630952835083, "global_step": 95097, "epoch": 2264} {"train_loss": -6.256617546081543, "global_step": 95098, "epoch": 2264} {"train_loss": -6.341639518737793, "global_step": 95099, "epoch": 2264} {"train_loss": -6.30753231048584, "global_step": 95100, "epoch": 2264} {"train_loss": -6.257213592529297, "global_step": 95101, "epoch": 2264} {"train_loss": -6.3463897705078125, "global_step": 95102, "epoch": 2264} {"train_loss": -6.345889091491699, "global_step": 95103, "epoch": 2264} {"train_loss": -6.322267055511475, "global_step": 95104, "epoch": 2264} {"train_loss": -6.398184776306152, "global_step": 95105, "epoch": 2264} {"train_loss": -6.357851028442383, "global_step": 95106, "epoch": 2264} {"train_loss": -6.344744682312012, "global_step": 95107, "epoch": 2264} {"train_loss": -6.2695722579956055, "global_step": 95108, "epoch": 2264} {"train_loss": -6.287372589111328, "global_step": 95109, "epoch": 2264} {"train_loss": -6.3985490798950195, "global_step": 95110, "epoch": 2264} {"train_loss": -6.2675886154174805, "global_step": 95111, "epoch": 2264} {"train_loss": -6.328559875488281, "global_step": 95112, "epoch": 2264} {"train_loss": -6.20882511138916, "global_step": 95113, "epoch": 2264} {"train_loss": -6.288018226623535, "global_step": 95114, "epoch": 2264} {"train_loss": -6.27735710144043, "global_step": 95115, "epoch": 2264} {"train_loss": -6.308599472045898, "global_step": 95116, "epoch": 2264} {"train_loss": -6.386441230773926, "global_step": 95117, "epoch": 2264} {"train_loss": -6.346800804138184, "global_step": 95118, "epoch": 2264} {"train_loss": -6.327205657958984, "global_step": 95119, "epoch": 2264} {"train_loss": -6.308073997497559, "global_step": 95120, "epoch": 2264} {"train_loss": -6.2153120040893555, "global_step": 95121, "epoch": 2264} {"train_loss": -6.251359939575195, "global_step": 95122, "epoch": 2264} {"train_loss": -6.322943210601807, "global_step": 95123, "epoch": 2264} {"train_loss": -6.213710308074951, "global_step": 95124, "epoch": 2264} {"train_loss": -6.276358604431152, "global_step": 95125, "epoch": 2264} {"train_loss": -6.325492858886719, "global_step": 95126, "epoch": 2264} {"train_loss": -6.322117328643799, "global_step": 95127, "epoch": 2264} {"train_loss": -6.222431182861328, "global_step": 95128, "epoch": 2264} {"train_loss": -6.310047637848627, "global_step": 95129, "epoch": 2264, "val_loss": 63709.08203125} {"train_loss": -6.282615661621094, "global_step": 95130, "epoch": 2265} {"train_loss": -6.389540672302246, "global_step": 95131, "epoch": 2265} {"train_loss": -6.284952163696289, "global_step": 95132, "epoch": 2265} {"train_loss": -6.329468727111816, "global_step": 95133, "epoch": 2265} {"train_loss": -6.3983659744262695, "global_step": 95134, "epoch": 2265} {"train_loss": -6.272578239440918, "global_step": 95135, "epoch": 2265} {"train_loss": -6.46893310546875, "global_step": 95136, "epoch": 2265} {"train_loss": -6.336806297302246, "global_step": 95137, "epoch": 2265} {"train_loss": -6.286874771118164, "global_step": 95138, "epoch": 2265} {"train_loss": -6.195135116577148, "global_step": 95139, "epoch": 2265} {"train_loss": -6.309994697570801, "global_step": 95140, "epoch": 2265} {"train_loss": -6.272773265838623, "global_step": 95141, "epoch": 2265} {"train_loss": -6.304195404052734, "global_step": 95142, "epoch": 2265} {"train_loss": -6.31126070022583, "global_step": 95143, "epoch": 2265} {"train_loss": -6.326199531555176, "global_step": 95144, "epoch": 2265} {"train_loss": -6.400179386138916, "global_step": 95145, "epoch": 2265} {"train_loss": -6.259189605712891, "global_step": 95146, "epoch": 2265} {"train_loss": -6.349759101867676, "global_step": 95147, "epoch": 2265} {"train_loss": -6.384411811828613, "global_step": 95148, "epoch": 2265} {"train_loss": -6.22247838973999, "global_step": 95149, "epoch": 2265} {"train_loss": -6.287535190582275, "global_step": 95150, "epoch": 2265} {"train_loss": -6.354588985443115, "global_step": 95151, "epoch": 2265} {"train_loss": -6.338915824890137, "global_step": 95152, "epoch": 2265} {"train_loss": -6.424456596374512, "global_step": 95153, "epoch": 2265} {"train_loss": -6.186136245727539, "global_step": 95154, "epoch": 2265} {"train_loss": -6.350318908691406, "global_step": 95155, "epoch": 2265} {"train_loss": -6.311598300933838, "global_step": 95156, "epoch": 2265} {"train_loss": -6.362085342407227, "global_step": 95157, "epoch": 2265} {"train_loss": -6.2960405349731445, "global_step": 95158, "epoch": 2265} {"train_loss": -6.3155517578125, "global_step": 95159, "epoch": 2265} {"train_loss": -6.251152992248535, "global_step": 95160, "epoch": 2265} {"train_loss": -6.306532859802246, "global_step": 95161, "epoch": 2265} {"train_loss": -6.306714057922363, "global_step": 95162, "epoch": 2265} {"train_loss": -6.249793529510498, "global_step": 95163, "epoch": 2265} {"train_loss": -6.3951215744018555, "global_step": 95164, "epoch": 2265} {"train_loss": -6.337297439575195, "global_step": 95165, "epoch": 2265} {"train_loss": -6.261292457580566, "global_step": 95166, "epoch": 2265} {"train_loss": -6.3830766677856445, "global_step": 95167, "epoch": 2265} {"train_loss": -6.292754650115967, "global_step": 95168, "epoch": 2265} {"train_loss": -6.331022262573242, "global_step": 95169, "epoch": 2265} {"train_loss": -6.353634834289551, "global_step": 95170, "epoch": 2265} {"train_loss": -6.320384615943546, "global_step": 95171, "epoch": 2265, "val_loss": 63573.74609375} {"train_loss": -6.401980400085449, "global_step": 95172, "epoch": 2266} {"train_loss": -6.371799945831299, "global_step": 95173, "epoch": 2266} {"train_loss": -6.287492752075195, "global_step": 95174, "epoch": 2266} {"train_loss": -6.361007213592529, "global_step": 95175, "epoch": 2266} {"train_loss": -6.283646583557129, "global_step": 95176, "epoch": 2266} {"train_loss": -6.285533428192139, "global_step": 95177, "epoch": 2266} {"train_loss": -6.38950252532959, "global_step": 95178, "epoch": 2266} {"train_loss": -6.308224201202393, "global_step": 95179, "epoch": 2266} {"train_loss": -6.438657760620117, "global_step": 95180, "epoch": 2266} {"train_loss": -6.440237045288086, "global_step": 95181, "epoch": 2266} {"train_loss": -6.364357948303223, "global_step": 95182, "epoch": 2266} {"train_loss": -6.325522422790527, "global_step": 95183, "epoch": 2266} {"train_loss": -6.323023319244385, "global_step": 95184, "epoch": 2266} {"train_loss": -6.336879730224609, "global_step": 95185, "epoch": 2266} {"train_loss": -6.3461785316467285, "global_step": 95186, "epoch": 2266} {"train_loss": -6.323166370391846, "global_step": 95187, "epoch": 2266} {"train_loss": -6.3925347328186035, "global_step": 95188, "epoch": 2266} {"train_loss": -6.334606170654297, "global_step": 95189, "epoch": 2266} {"train_loss": -6.2775726318359375, "global_step": 95190, "epoch": 2266} {"train_loss": -6.397983551025391, "global_step": 95191, "epoch": 2266} {"train_loss": -6.327824592590332, "global_step": 95192, "epoch": 2266} {"train_loss": -6.284629821777344, "global_step": 95193, "epoch": 2266} {"train_loss": -6.371333122253418, "global_step": 95194, "epoch": 2266} {"train_loss": -6.285321235656738, "global_step": 95195, "epoch": 2266} {"train_loss": -6.3020172119140625, "global_step": 95196, "epoch": 2266} {"train_loss": -6.267356872558594, "global_step": 95197, "epoch": 2266} {"train_loss": -6.365515232086182, "global_step": 95198, "epoch": 2266} {"train_loss": -6.283101558685303, "global_step": 95199, "epoch": 2266} {"train_loss": -6.24561882019043, "global_step": 95200, "epoch": 2266} {"train_loss": -6.374842166900635, "global_step": 95201, "epoch": 2266} {"train_loss": -6.3412628173828125, "global_step": 95202, "epoch": 2266} {"train_loss": -6.353854179382324, "global_step": 95203, "epoch": 2266} {"train_loss": -6.275844573974609, "global_step": 95204, "epoch": 2266} {"train_loss": -6.392351150512695, "global_step": 95205, "epoch": 2266} {"train_loss": -6.308703422546387, "global_step": 95206, "epoch": 2266} {"train_loss": -6.357513427734375, "global_step": 95207, "epoch": 2266} {"train_loss": -6.323955535888672, "global_step": 95208, "epoch": 2266} {"train_loss": -6.453893184661865, "global_step": 95209, "epoch": 2266} {"train_loss": -6.281038761138916, "global_step": 95210, "epoch": 2266} {"train_loss": -6.440223217010498, "global_step": 95211, "epoch": 2266} {"train_loss": -6.366434574127197, "global_step": 95212, "epoch": 2266} {"train_loss": -6.338625431060791, "global_step": 95213, "epoch": 2266, "val_loss": 63481.01953125} {"train_loss": -6.4057183265686035, "global_step": 95214, "epoch": 2267} {"train_loss": -6.326637268066406, "global_step": 95215, "epoch": 2267} {"train_loss": -6.313343524932861, "global_step": 95216, "epoch": 2267} {"train_loss": -6.333295822143555, "global_step": 95217, "epoch": 2267} {"train_loss": -6.363250255584717, "global_step": 95218, "epoch": 2267} {"train_loss": -6.249146461486816, "global_step": 95219, "epoch": 2267} {"train_loss": -6.289507865905762, "global_step": 95220, "epoch": 2267} {"train_loss": -6.286232948303223, "global_step": 95221, "epoch": 2267} {"train_loss": -6.28018856048584, "global_step": 95222, "epoch": 2267} {"train_loss": -6.321509838104248, "global_step": 95223, "epoch": 2267} {"train_loss": -6.366094589233398, "global_step": 95224, "epoch": 2267} {"train_loss": -6.4515461921691895, "global_step": 95225, "epoch": 2267} {"train_loss": -6.3662428855896, "global_step": 95226, "epoch": 2267} {"train_loss": -6.278575897216797, "global_step": 95227, "epoch": 2267} {"train_loss": -6.4215898513793945, "global_step": 95228, "epoch": 2267} {"train_loss": -6.301016807556152, "global_step": 95229, "epoch": 2267} {"train_loss": -6.269959449768066, "global_step": 95230, "epoch": 2267} {"train_loss": -6.306822776794434, "global_step": 95231, "epoch": 2267} {"train_loss": -6.266496658325195, "global_step": 95232, "epoch": 2267} {"train_loss": -6.274999618530273, "global_step": 95233, "epoch": 2267} {"train_loss": -6.257237911224365, "global_step": 95234, "epoch": 2267} {"train_loss": -6.284308910369873, "global_step": 95235, "epoch": 2267} {"train_loss": -6.301901817321777, "global_step": 95236, "epoch": 2267} {"train_loss": -6.29181432723999, "global_step": 95237, "epoch": 2267} {"train_loss": -6.407191276550293, "global_step": 95238, "epoch": 2267} {"train_loss": -6.355903625488281, "global_step": 95239, "epoch": 2267} {"train_loss": -6.363283157348633, "global_step": 95240, "epoch": 2267} {"train_loss": -6.310251235961914, "global_step": 95241, "epoch": 2267} {"train_loss": -6.340001106262207, "global_step": 95242, "epoch": 2267} {"train_loss": -6.218201637268066, "global_step": 95243, "epoch": 2267} {"train_loss": -6.259071350097656, "global_step": 95244, "epoch": 2267} {"train_loss": -6.3169732093811035, "global_step": 95245, "epoch": 2267} {"train_loss": -6.274654865264893, "global_step": 95246, "epoch": 2267} {"train_loss": -6.364909648895264, "global_step": 95247, "epoch": 2267} {"train_loss": -6.256509780883789, "global_step": 95248, "epoch": 2267} {"train_loss": -6.3780341148376465, "global_step": 95249, "epoch": 2267} {"train_loss": -6.275943756103516, "global_step": 95250, "epoch": 2267} {"train_loss": -6.193655967712402, "global_step": 95251, "epoch": 2267} {"train_loss": -6.20551872253418, "global_step": 95252, "epoch": 2267} {"train_loss": -6.2015886306762695, "global_step": 95253, "epoch": 2267} {"train_loss": -6.352028846740723, "global_step": 95254, "epoch": 2267} {"train_loss": -6.305191993713379, "global_step": 95255, "epoch": 2267, "val_loss": 63809.83203125} {"train_loss": -6.341284275054932, "global_step": 95256, "epoch": 2268} {"train_loss": -6.371024131774902, "global_step": 95257, "epoch": 2268} {"train_loss": -6.311254024505615, "global_step": 95258, "epoch": 2268} {"train_loss": -6.2413434982299805, "global_step": 95259, "epoch": 2268} {"train_loss": -6.259527683258057, "global_step": 95260, "epoch": 2268} {"train_loss": -6.265730857849121, "global_step": 95261, "epoch": 2268} {"train_loss": -6.236868381500244, "global_step": 95262, "epoch": 2268} {"train_loss": -6.327083110809326, "global_step": 95263, "epoch": 2268} {"train_loss": -6.277926445007324, "global_step": 95264, "epoch": 2268} {"train_loss": -6.297737121582031, "global_step": 95265, "epoch": 2268} {"train_loss": -6.335945129394531, "global_step": 95266, "epoch": 2268} {"train_loss": -6.221011161804199, "global_step": 95267, "epoch": 2268} {"train_loss": -6.305781364440918, "global_step": 95268, "epoch": 2268} {"train_loss": -6.249451637268066, "global_step": 95269, "epoch": 2268} {"train_loss": -6.299081802368164, "global_step": 95270, "epoch": 2268} {"train_loss": -6.117785453796387, "global_step": 95271, "epoch": 2268} {"train_loss": -6.115833759307861, "global_step": 95272, "epoch": 2268} {"train_loss": -6.263796806335449, "global_step": 95273, "epoch": 2268} {"train_loss": -6.205547332763672, "global_step": 95274, "epoch": 2268} {"train_loss": -6.31014347076416, "global_step": 95275, "epoch": 2268} {"train_loss": -6.257296562194824, "global_step": 95276, "epoch": 2268} {"train_loss": -6.324645042419434, "global_step": 95277, "epoch": 2268} {"train_loss": -6.324135780334473, "global_step": 95278, "epoch": 2268} {"train_loss": -6.221298694610596, "global_step": 95279, "epoch": 2268} {"train_loss": -6.27388334274292, "global_step": 95280, "epoch": 2268} {"train_loss": -6.247864723205566, "global_step": 95281, "epoch": 2268} {"train_loss": -6.40142297744751, "global_step": 95282, "epoch": 2268} {"train_loss": -6.164818286895752, "global_step": 95283, "epoch": 2268} {"train_loss": -6.220293998718262, "global_step": 95284, "epoch": 2268} {"train_loss": -6.332208156585693, "global_step": 95285, "epoch": 2268} {"train_loss": -6.236453056335449, "global_step": 95286, "epoch": 2268} {"train_loss": -6.308820724487305, "global_step": 95287, "epoch": 2268} {"train_loss": -6.1940507888793945, "global_step": 95288, "epoch": 2268} {"train_loss": -6.328675270080566, "global_step": 95289, "epoch": 2268} {"train_loss": -6.383325576782227, "global_step": 95290, "epoch": 2268} {"train_loss": -6.3970947265625, "global_step": 95291, "epoch": 2268} {"train_loss": -6.272818565368652, "global_step": 95292, "epoch": 2268} {"train_loss": -6.2616376876831055, "global_step": 95293, "epoch": 2268} {"train_loss": -6.329928398132324, "global_step": 95294, "epoch": 2268} {"train_loss": -6.317016124725342, "global_step": 95295, "epoch": 2268} {"train_loss": -6.425942420959473, "global_step": 95296, "epoch": 2268} {"train_loss": -6.282453582400367, "global_step": 95297, "epoch": 2268, "val_loss": 63676.2265625} {"train_loss": -6.3038530349731445, "global_step": 95298, "epoch": 2269} {"train_loss": -6.350334167480469, "global_step": 95299, "epoch": 2269} {"train_loss": -6.335409164428711, "global_step": 95300, "epoch": 2269} {"train_loss": -6.4245285987854, "global_step": 95301, "epoch": 2269} {"train_loss": -6.359950542449951, "global_step": 95302, "epoch": 2269} {"train_loss": -6.307060241699219, "global_step": 95303, "epoch": 2269} {"train_loss": -6.380310535430908, "global_step": 95304, "epoch": 2269} {"train_loss": -6.3300604820251465, "global_step": 95305, "epoch": 2269} {"train_loss": -6.286220550537109, "global_step": 95306, "epoch": 2269} {"train_loss": -6.298069953918457, "global_step": 95307, "epoch": 2269} {"train_loss": -6.2378668785095215, "global_step": 95308, "epoch": 2269} {"train_loss": -6.328784942626953, "global_step": 95309, "epoch": 2269} {"train_loss": -6.248032569885254, "global_step": 95310, "epoch": 2269} {"train_loss": -6.32032585144043, "global_step": 95311, "epoch": 2269} {"train_loss": -6.382264614105225, "global_step": 95312, "epoch": 2269} {"train_loss": -6.3599348068237305, "global_step": 95313, "epoch": 2269} {"train_loss": -6.3348388671875, "global_step": 95314, "epoch": 2269} {"train_loss": -6.2774457931518555, "global_step": 95315, "epoch": 2269} {"train_loss": -6.354247093200684, "global_step": 95316, "epoch": 2269} {"train_loss": -6.276153564453125, "global_step": 95317, "epoch": 2269} {"train_loss": -6.298387050628662, "global_step": 95318, "epoch": 2269} {"train_loss": -6.290277481079102, "global_step": 95319, "epoch": 2269} {"train_loss": -6.361001014709473, "global_step": 95320, "epoch": 2269} {"train_loss": -6.334495544433594, "global_step": 95321, "epoch": 2269} {"train_loss": -6.214200019836426, "global_step": 95322, "epoch": 2269} {"train_loss": -6.388851165771484, "global_step": 95323, "epoch": 2269} {"train_loss": -6.303170204162598, "global_step": 95324, "epoch": 2269} {"train_loss": -6.270439147949219, "global_step": 95325, "epoch": 2269} {"train_loss": -6.348178863525391, "global_step": 95326, "epoch": 2269} {"train_loss": -6.234738826751709, "global_step": 95327, "epoch": 2269} {"train_loss": -6.334891319274902, "global_step": 95328, "epoch": 2269} {"train_loss": -6.339743614196777, "global_step": 95329, "epoch": 2269} {"train_loss": -6.345627784729004, "global_step": 95330, "epoch": 2269} {"train_loss": -6.381792068481445, "global_step": 95331, "epoch": 2269} {"train_loss": -6.358462810516357, "global_step": 95332, "epoch": 2269} {"train_loss": -6.3736467361450195, "global_step": 95333, "epoch": 2269} {"train_loss": -6.356872081756592, "global_step": 95334, "epoch": 2269} {"train_loss": -6.284477710723877, "global_step": 95335, "epoch": 2269} {"train_loss": -6.367636203765869, "global_step": 95336, "epoch": 2269} {"train_loss": -6.270198822021484, "global_step": 95337, "epoch": 2269} {"train_loss": -6.404726505279541, "global_step": 95338, "epoch": 2269} {"train_loss": -6.325806890215192, "global_step": 95339, "epoch": 2269, "val_loss": 63637.046875} {"train_loss": -6.314115524291992, "global_step": 95340, "epoch": 2270} {"train_loss": -6.245643615722656, "global_step": 95341, "epoch": 2270} {"train_loss": -6.391978740692139, "global_step": 95342, "epoch": 2270} {"train_loss": -6.3393168449401855, "global_step": 95343, "epoch": 2270} {"train_loss": -6.36221981048584, "global_step": 95344, "epoch": 2270} {"train_loss": -6.238903045654297, "global_step": 95345, "epoch": 2270} {"train_loss": -6.309761047363281, "global_step": 95346, "epoch": 2270} {"train_loss": -6.301693916320801, "global_step": 95347, "epoch": 2270} {"train_loss": -6.271697044372559, "global_step": 95348, "epoch": 2270} {"train_loss": -6.306982517242432, "global_step": 95349, "epoch": 2270} {"train_loss": -6.24510383605957, "global_step": 95350, "epoch": 2270} {"train_loss": -6.356899261474609, "global_step": 95351, "epoch": 2270} {"train_loss": -6.327525615692139, "global_step": 95352, "epoch": 2270} {"train_loss": -6.289034843444824, "global_step": 95353, "epoch": 2270} {"train_loss": -6.31892204284668, "global_step": 95354, "epoch": 2270} {"train_loss": -6.310003280639648, "global_step": 95355, "epoch": 2270} {"train_loss": -6.380784511566162, "global_step": 95356, "epoch": 2270} {"train_loss": -6.292219161987305, "global_step": 95357, "epoch": 2270} {"train_loss": -6.397599220275879, "global_step": 95358, "epoch": 2270} {"train_loss": -6.24272346496582, "global_step": 95359, "epoch": 2270} {"train_loss": -6.3488616943359375, "global_step": 95360, "epoch": 2270} {"train_loss": -6.362049579620361, "global_step": 95361, "epoch": 2270} {"train_loss": -6.299370288848877, "global_step": 95362, "epoch": 2270} {"train_loss": -6.417243480682373, "global_step": 95363, "epoch": 2270} {"train_loss": -6.329311370849609, "global_step": 95364, "epoch": 2270} {"train_loss": -6.3573808670043945, "global_step": 95365, "epoch": 2270} {"train_loss": -6.286132335662842, "global_step": 95366, "epoch": 2270} {"train_loss": -6.367669105529785, "global_step": 95367, "epoch": 2270} {"train_loss": -6.354119300842285, "global_step": 95368, "epoch": 2270} {"train_loss": -6.2606072425842285, "global_step": 95369, "epoch": 2270} {"train_loss": -6.419451713562012, "global_step": 95370, "epoch": 2270} {"train_loss": -6.304995536804199, "global_step": 95371, "epoch": 2270} {"train_loss": -6.170833587646484, "global_step": 95372, "epoch": 2270} {"train_loss": -6.391087532043457, "global_step": 95373, "epoch": 2270} {"train_loss": -6.264554977416992, "global_step": 95374, "epoch": 2270} {"train_loss": -6.353928089141846, "global_step": 95375, "epoch": 2270} {"train_loss": -6.310005187988281, "global_step": 95376, "epoch": 2270} {"train_loss": -6.263882637023926, "global_step": 95377, "epoch": 2270} {"train_loss": -6.391013145446777, "global_step": 95378, "epoch": 2270} {"train_loss": -6.353928089141846, "global_step": 95379, "epoch": 2270} {"train_loss": -6.282964706420898, "global_step": 95380, "epoch": 2270} {"train_loss": -6.320661987577166, "global_step": 95381, "epoch": 2270, "val_loss": 63291.07421875} {"train_loss": -6.283536434173584, "global_step": 95382, "epoch": 2271} {"train_loss": -6.33162260055542, "global_step": 95383, "epoch": 2271} {"train_loss": -6.246766090393066, "global_step": 95384, "epoch": 2271} {"train_loss": -6.364194869995117, "global_step": 95385, "epoch": 2271} {"train_loss": -6.368603706359863, "global_step": 95386, "epoch": 2271} {"train_loss": -6.381797790527344, "global_step": 95387, "epoch": 2271} {"train_loss": -6.233388900756836, "global_step": 95388, "epoch": 2271} {"train_loss": -6.2758636474609375, "global_step": 95389, "epoch": 2271} {"train_loss": -6.3556671142578125, "global_step": 95390, "epoch": 2271} {"train_loss": -6.180952072143555, "global_step": 95391, "epoch": 2271} {"train_loss": -6.3629961013793945, "global_step": 95392, "epoch": 2271} {"train_loss": -6.307304382324219, "global_step": 95393, "epoch": 2271} {"train_loss": -6.259121894836426, "global_step": 95394, "epoch": 2271} {"train_loss": -6.365088939666748, "global_step": 95395, "epoch": 2271} {"train_loss": -6.38031005859375, "global_step": 95396, "epoch": 2271} {"train_loss": -6.367621421813965, "global_step": 95397, "epoch": 2271} {"train_loss": -6.49336051940918, "global_step": 95398, "epoch": 2271} {"train_loss": -6.338397979736328, "global_step": 95399, "epoch": 2271} {"train_loss": -6.401933193206787, "global_step": 95400, "epoch": 2271} {"train_loss": -6.324183464050293, "global_step": 95401, "epoch": 2271} {"train_loss": -6.346893310546875, "global_step": 95402, "epoch": 2271} {"train_loss": -6.345058441162109, "global_step": 95403, "epoch": 2271} {"train_loss": -6.401162147521973, "global_step": 95404, "epoch": 2271} {"train_loss": -6.350412368774414, "global_step": 95405, "epoch": 2271} {"train_loss": -6.369803428649902, "global_step": 95406, "epoch": 2271} {"train_loss": -6.285344123840332, "global_step": 95407, "epoch": 2271} {"train_loss": -6.412136077880859, "global_step": 95408, "epoch": 2271} {"train_loss": -6.410083770751953, "global_step": 95409, "epoch": 2271} {"train_loss": -6.415970802307129, "global_step": 95410, "epoch": 2271} {"train_loss": -6.3263678550720215, "global_step": 95411, "epoch": 2271} {"train_loss": -6.277688026428223, "global_step": 95412, "epoch": 2271} {"train_loss": -6.258559226989746, "global_step": 95413, "epoch": 2271} {"train_loss": -6.2829999923706055, "global_step": 95414, "epoch": 2271} {"train_loss": -6.382698059082031, "global_step": 95415, "epoch": 2271} {"train_loss": -6.319149494171143, "global_step": 95416, "epoch": 2271} {"train_loss": -6.2495317459106445, "global_step": 95417, "epoch": 2271} {"train_loss": -6.373729705810547, "global_step": 95418, "epoch": 2271} {"train_loss": -6.171683311462402, "global_step": 95419, "epoch": 2271} {"train_loss": -6.268558502197266, "global_step": 95420, "epoch": 2271} {"train_loss": -6.300281047821045, "global_step": 95421, "epoch": 2271} {"train_loss": -6.2628254890441895, "global_step": 95422, "epoch": 2271} {"train_loss": -6.327757210958572, "global_step": 95423, "epoch": 2271, "val_loss": 63763.5390625} {"train_loss": -6.341649055480957, "global_step": 95424, "epoch": 2272} {"train_loss": -6.3148016929626465, "global_step": 95425, "epoch": 2272} {"train_loss": -6.336261749267578, "global_step": 95426, "epoch": 2272} {"train_loss": -6.322874069213867, "global_step": 95427, "epoch": 2272} {"train_loss": -6.2768778800964355, "global_step": 95428, "epoch": 2272} {"train_loss": -6.235655784606934, "global_step": 95429, "epoch": 2272} {"train_loss": -6.36879301071167, "global_step": 95430, "epoch": 2272} {"train_loss": -6.373197555541992, "global_step": 95431, "epoch": 2272} {"train_loss": -6.139640808105469, "global_step": 95432, "epoch": 2272} {"train_loss": -6.366144180297852, "global_step": 95433, "epoch": 2272} {"train_loss": -6.321385860443115, "global_step": 95434, "epoch": 2272} {"train_loss": -6.374235153198242, "global_step": 95435, "epoch": 2272} {"train_loss": -6.349835395812988, "global_step": 95436, "epoch": 2272} {"train_loss": -6.307384490966797, "global_step": 95437, "epoch": 2272} {"train_loss": -6.486824989318848, "global_step": 95438, "epoch": 2272} {"train_loss": -6.243538856506348, "global_step": 95439, "epoch": 2272} {"train_loss": -6.338944435119629, "global_step": 95440, "epoch": 2272} {"train_loss": -6.286740303039551, "global_step": 95441, "epoch": 2272} {"train_loss": -6.236178398132324, "global_step": 95442, "epoch": 2272} {"train_loss": -6.283451080322266, "global_step": 95443, "epoch": 2272} {"train_loss": -6.343920707702637, "global_step": 95444, "epoch": 2272} {"train_loss": -6.323762893676758, "global_step": 95445, "epoch": 2272} {"train_loss": -6.245131015777588, "global_step": 95446, "epoch": 2272} {"train_loss": -6.402559280395508, "global_step": 95447, "epoch": 2272} {"train_loss": -6.339922904968262, "global_step": 95448, "epoch": 2272} {"train_loss": -6.308307647705078, "global_step": 95449, "epoch": 2272} {"train_loss": -6.302168369293213, "global_step": 95450, "epoch": 2272} {"train_loss": -6.353965759277344, "global_step": 95451, "epoch": 2272} {"train_loss": -6.454872131347656, "global_step": 95452, "epoch": 2272} {"train_loss": -6.248478889465332, "global_step": 95453, "epoch": 2272} {"train_loss": -6.47037410736084, "global_step": 95454, "epoch": 2272} {"train_loss": -6.170285224914551, "global_step": 95455, "epoch": 2272} {"train_loss": -6.440515518188477, "global_step": 95456, "epoch": 2272} {"train_loss": -6.302574157714844, "global_step": 95457, "epoch": 2272} {"train_loss": -6.276058673858643, "global_step": 95458, "epoch": 2272} {"train_loss": -6.357677936553955, "global_step": 95459, "epoch": 2272} {"train_loss": -6.321471214294434, "global_step": 95460, "epoch": 2272} {"train_loss": -6.265835762023926, "global_step": 95461, "epoch": 2272} {"train_loss": -6.217414855957031, "global_step": 95462, "epoch": 2272} {"train_loss": -6.328205108642578, "global_step": 95463, "epoch": 2272} {"train_loss": -6.288993835449219, "global_step": 95464, "epoch": 2272} {"train_loss": -6.317568143208821, "global_step": 95465, "epoch": 2272, "val_loss": 63653.44921875} {"train_loss": -6.32784366607666, "global_step": 95466, "epoch": 2273} {"train_loss": -6.362868785858154, "global_step": 95467, "epoch": 2273} {"train_loss": -6.33073616027832, "global_step": 95468, "epoch": 2273} {"train_loss": -6.358922481536865, "global_step": 95469, "epoch": 2273} {"train_loss": -6.3648881912231445, "global_step": 95470, "epoch": 2273} {"train_loss": -6.320345878601074, "global_step": 95471, "epoch": 2273} {"train_loss": -6.383207321166992, "global_step": 95472, "epoch": 2273} {"train_loss": -6.4169230461120605, "global_step": 95473, "epoch": 2273} {"train_loss": -6.348885536193848, "global_step": 95474, "epoch": 2273} {"train_loss": -6.352032661437988, "global_step": 95475, "epoch": 2273} {"train_loss": -6.1641364097595215, "global_step": 95476, "epoch": 2273} {"train_loss": -6.386396408081055, "global_step": 95477, "epoch": 2273} {"train_loss": -6.3044586181640625, "global_step": 95478, "epoch": 2273} {"train_loss": -6.224408149719238, "global_step": 95479, "epoch": 2273} {"train_loss": -6.340090274810791, "global_step": 95480, "epoch": 2273} {"train_loss": -6.375154495239258, "global_step": 95481, "epoch": 2273} {"train_loss": -6.375598907470703, "global_step": 95482, "epoch": 2273} {"train_loss": -6.273009777069092, "global_step": 95483, "epoch": 2273} {"train_loss": -6.409972190856934, "global_step": 95484, "epoch": 2273} {"train_loss": -6.130468368530273, "global_step": 95485, "epoch": 2273} {"train_loss": -6.306808948516846, "global_step": 95486, "epoch": 2273} {"train_loss": -6.279077529907227, "global_step": 95487, "epoch": 2273} {"train_loss": -6.229668617248535, "global_step": 95488, "epoch": 2273} {"train_loss": -6.360065460205078, "global_step": 95489, "epoch": 2273} {"train_loss": -6.239863395690918, "global_step": 95490, "epoch": 2273} {"train_loss": -6.331188201904297, "global_step": 95491, "epoch": 2273} {"train_loss": -6.260549068450928, "global_step": 95492, "epoch": 2273} {"train_loss": -6.2390007972717285, "global_step": 95493, "epoch": 2273} {"train_loss": -6.26552152633667, "global_step": 95494, "epoch": 2273} {"train_loss": -6.2675347328186035, "global_step": 95495, "epoch": 2273} {"train_loss": -6.156333923339844, "global_step": 95496, "epoch": 2273} {"train_loss": -6.2246174812316895, "global_step": 95497, "epoch": 2273} {"train_loss": -6.230967998504639, "global_step": 95498, "epoch": 2273} {"train_loss": -6.368198394775391, "global_step": 95499, "epoch": 2273} {"train_loss": -6.22369384765625, "global_step": 95500, "epoch": 2273} {"train_loss": -6.281259059906006, "global_step": 95501, "epoch": 2273} {"train_loss": -6.3165483474731445, "global_step": 95502, "epoch": 2273} {"train_loss": -6.1490092277526855, "global_step": 95503, "epoch": 2273} {"train_loss": -6.304230690002441, "global_step": 95504, "epoch": 2273} {"train_loss": -6.1568756103515625, "global_step": 95505, "epoch": 2273} {"train_loss": -6.310044765472412, "global_step": 95506, "epoch": 2273} {"train_loss": -6.294197230111985, "global_step": 95507, "epoch": 2273, "val_loss": 63803.09375} {"train_loss": -6.335504531860352, "global_step": 95508, "epoch": 2274} {"train_loss": -6.2530364990234375, "global_step": 95509, "epoch": 2274} {"train_loss": -6.261263847351074, "global_step": 95510, "epoch": 2274} {"train_loss": -6.3639116287231445, "global_step": 95511, "epoch": 2274} {"train_loss": -6.2555646896362305, "global_step": 95512, "epoch": 2274} {"train_loss": -6.350793838500977, "global_step": 95513, "epoch": 2274} {"train_loss": -6.291540145874023, "global_step": 95514, "epoch": 2274} {"train_loss": -6.2636284828186035, "global_step": 95515, "epoch": 2274} {"train_loss": -6.407365322113037, "global_step": 95516, "epoch": 2274} {"train_loss": -6.264222145080566, "global_step": 95517, "epoch": 2274} {"train_loss": -6.36187744140625, "global_step": 95518, "epoch": 2274} {"train_loss": -6.504580497741699, "global_step": 95519, "epoch": 2274} {"train_loss": -6.378011703491211, "global_step": 95520, "epoch": 2274} {"train_loss": -6.3982133865356445, "global_step": 95521, "epoch": 2274} {"train_loss": -6.4102678298950195, "global_step": 95522, "epoch": 2274} {"train_loss": -6.358171463012695, "global_step": 95523, "epoch": 2274} {"train_loss": -6.3047685623168945, "global_step": 95524, "epoch": 2274} {"train_loss": -6.435666561126709, "global_step": 95525, "epoch": 2274} {"train_loss": -6.241790771484375, "global_step": 95526, "epoch": 2274} {"train_loss": -6.438209533691406, "global_step": 95527, "epoch": 2274} {"train_loss": -6.24997615814209, "global_step": 95528, "epoch": 2274} {"train_loss": -6.347983360290527, "global_step": 95529, "epoch": 2274} {"train_loss": -6.344633102416992, "global_step": 95530, "epoch": 2274} {"train_loss": -6.3875885009765625, "global_step": 95531, "epoch": 2274} {"train_loss": -6.4320387840271, "global_step": 95532, "epoch": 2274} {"train_loss": -6.318018913269043, "global_step": 95533, "epoch": 2274} {"train_loss": -6.359550476074219, "global_step": 95534, "epoch": 2274} {"train_loss": -6.230637073516846, "global_step": 95535, "epoch": 2274} {"train_loss": -6.40650749206543, "global_step": 95536, "epoch": 2274} {"train_loss": -6.270103931427002, "global_step": 95537, "epoch": 2274} {"train_loss": -6.390720367431641, "global_step": 95538, "epoch": 2274} {"train_loss": -6.3948211669921875, "global_step": 95539, "epoch": 2274} {"train_loss": -6.277494430541992, "global_step": 95540, "epoch": 2274} {"train_loss": -6.254538059234619, "global_step": 95541, "epoch": 2274} {"train_loss": -6.261971473693848, "global_step": 95542, "epoch": 2274} {"train_loss": -6.323838233947754, "global_step": 95543, "epoch": 2274} {"train_loss": -6.34814453125, "global_step": 95544, "epoch": 2274} {"train_loss": -6.252420902252197, "global_step": 95545, "epoch": 2274} {"train_loss": -6.33476448059082, "global_step": 95546, "epoch": 2274} {"train_loss": -6.408026218414307, "global_step": 95547, "epoch": 2274} {"train_loss": -6.1345953941345215, "global_step": 95548, "epoch": 2274} {"train_loss": -6.33027340116955, "global_step": 95549, "epoch": 2274, "val_loss": 63765.68359375} {"train_loss": -6.301916599273682, "global_step": 95550, "epoch": 2275} {"train_loss": -6.269736289978027, "global_step": 95551, "epoch": 2275} {"train_loss": -6.271693229675293, "global_step": 95552, "epoch": 2275} {"train_loss": -6.362298011779785, "global_step": 95553, "epoch": 2275} {"train_loss": -6.306816101074219, "global_step": 95554, "epoch": 2275} {"train_loss": -6.243367671966553, "global_step": 95555, "epoch": 2275} {"train_loss": -6.241504669189453, "global_step": 95556, "epoch": 2275} {"train_loss": -6.18203067779541, "global_step": 95557, "epoch": 2275} {"train_loss": -6.317214012145996, "global_step": 95558, "epoch": 2275} {"train_loss": -6.288843154907227, "global_step": 95559, "epoch": 2275} {"train_loss": -6.246249198913574, "global_step": 95560, "epoch": 2275} {"train_loss": -6.393723487854004, "global_step": 95561, "epoch": 2275} {"train_loss": -6.296076774597168, "global_step": 95562, "epoch": 2275} {"train_loss": -6.267128944396973, "global_step": 95563, "epoch": 2275} {"train_loss": -6.35591983795166, "global_step": 95564, "epoch": 2275} {"train_loss": -6.348126411437988, "global_step": 95565, "epoch": 2275} {"train_loss": -6.259637355804443, "global_step": 95566, "epoch": 2275} {"train_loss": -6.408153057098389, "global_step": 95567, "epoch": 2275} {"train_loss": -6.274660110473633, "global_step": 95568, "epoch": 2275} {"train_loss": -6.226895332336426, "global_step": 95569, "epoch": 2275} {"train_loss": -6.215913772583008, "global_step": 95570, "epoch": 2275} {"train_loss": -6.43977165222168, "global_step": 95571, "epoch": 2275} {"train_loss": -6.323885917663574, "global_step": 95572, "epoch": 2275} {"train_loss": -6.369439125061035, "global_step": 95573, "epoch": 2275} {"train_loss": -6.325562000274658, "global_step": 95574, "epoch": 2275} {"train_loss": -6.333561897277832, "global_step": 95575, "epoch": 2275} {"train_loss": -6.3172807693481445, "global_step": 95576, "epoch": 2275} {"train_loss": -6.32731819152832, "global_step": 95577, "epoch": 2275} {"train_loss": -6.3908233642578125, "global_step": 95578, "epoch": 2275} {"train_loss": -6.338927745819092, "global_step": 95579, "epoch": 2275} {"train_loss": -6.344820976257324, "global_step": 95580, "epoch": 2275} {"train_loss": -6.431147575378418, "global_step": 95581, "epoch": 2275} {"train_loss": -6.437745571136475, "global_step": 95582, "epoch": 2275} {"train_loss": -6.29866886138916, "global_step": 95583, "epoch": 2275} {"train_loss": -6.431059837341309, "global_step": 95584, "epoch": 2275} {"train_loss": -6.335613250732422, "global_step": 95585, "epoch": 2275} {"train_loss": -6.346750259399414, "global_step": 95586, "epoch": 2275} {"train_loss": -6.35056209564209, "global_step": 95587, "epoch": 2275} {"train_loss": -6.24990177154541, "global_step": 95588, "epoch": 2275} {"train_loss": -6.17958402633667, "global_step": 95589, "epoch": 2275} {"train_loss": -6.305099010467529, "global_step": 95590, "epoch": 2275} {"train_loss": -6.314933617909749, "global_step": 95591, "epoch": 2275, "val_loss": 63665.88671875} {"train_loss": -6.394829750061035, "global_step": 95592, "epoch": 2276} {"train_loss": -6.274900436401367, "global_step": 95593, "epoch": 2276} {"train_loss": -6.154475688934326, "global_step": 95594, "epoch": 2276} {"train_loss": -6.323343276977539, "global_step": 95595, "epoch": 2276} {"train_loss": -6.2822771072387695, "global_step": 95596, "epoch": 2276} {"train_loss": -6.284136772155762, "global_step": 95597, "epoch": 2276} {"train_loss": -6.18879508972168, "global_step": 95598, "epoch": 2276} {"train_loss": -6.183623313903809, "global_step": 95599, "epoch": 2276} {"train_loss": -6.218211650848389, "global_step": 95600, "epoch": 2276} {"train_loss": -6.253615379333496, "global_step": 95601, "epoch": 2276} {"train_loss": -6.227864742279053, "global_step": 95602, "epoch": 2276} {"train_loss": -6.236371040344238, "global_step": 95603, "epoch": 2276} {"train_loss": -6.17825984954834, "global_step": 95604, "epoch": 2276} {"train_loss": -6.252930164337158, "global_step": 95605, "epoch": 2276} {"train_loss": -6.350799083709717, "global_step": 95606, "epoch": 2276} {"train_loss": -6.317322731018066, "global_step": 95607, "epoch": 2276} {"train_loss": -6.364149570465088, "global_step": 95608, "epoch": 2276} {"train_loss": -6.317499160766602, "global_step": 95609, "epoch": 2276} {"train_loss": -6.403053283691406, "global_step": 95610, "epoch": 2276} {"train_loss": -6.401178359985352, "global_step": 95611, "epoch": 2276} {"train_loss": -6.367532730102539, "global_step": 95612, "epoch": 2276} {"train_loss": -6.368442535400391, "global_step": 95613, "epoch": 2276} {"train_loss": -6.3329644203186035, "global_step": 95614, "epoch": 2276} {"train_loss": -6.372148513793945, "global_step": 95615, "epoch": 2276} {"train_loss": -6.457456111907959, "global_step": 95616, "epoch": 2276} {"train_loss": -6.254538536071777, "global_step": 95617, "epoch": 2276} {"train_loss": -6.3722639083862305, "global_step": 95618, "epoch": 2276} {"train_loss": -6.396129608154297, "global_step": 95619, "epoch": 2276} {"train_loss": -6.361865997314453, "global_step": 95620, "epoch": 2276} {"train_loss": -6.343416213989258, "global_step": 95621, "epoch": 2276} {"train_loss": -6.291715621948242, "global_step": 95622, "epoch": 2276} {"train_loss": -6.365573883056641, "global_step": 95623, "epoch": 2276} {"train_loss": -6.415422439575195, "global_step": 95624, "epoch": 2276} {"train_loss": -6.314853191375732, "global_step": 95625, "epoch": 2276} {"train_loss": -6.390822410583496, "global_step": 95626, "epoch": 2276} {"train_loss": -6.316460609436035, "global_step": 95627, "epoch": 2276} {"train_loss": -6.24139404296875, "global_step": 95628, "epoch": 2276} {"train_loss": -6.346426486968994, "global_step": 95629, "epoch": 2276} {"train_loss": -6.440542221069336, "global_step": 95630, "epoch": 2276} {"train_loss": -6.354574680328369, "global_step": 95631, "epoch": 2276} {"train_loss": -6.3624467849731445, "global_step": 95632, "epoch": 2276} {"train_loss": -6.31941522870745, "global_step": 95633, "epoch": 2276, "val_loss": 63734.81640625} {"train_loss": -6.3358612060546875, "global_step": 95634, "epoch": 2277} {"train_loss": -6.431713581085205, "global_step": 95635, "epoch": 2277} {"train_loss": -6.35107421875, "global_step": 95636, "epoch": 2277} {"train_loss": -6.386105060577393, "global_step": 95637, "epoch": 2277} {"train_loss": -6.32620906829834, "global_step": 95638, "epoch": 2277} {"train_loss": -6.246931552886963, "global_step": 95639, "epoch": 2277} {"train_loss": -6.302649974822998, "global_step": 95640, "epoch": 2277} {"train_loss": -6.332784175872803, "global_step": 95641, "epoch": 2277} {"train_loss": -6.312971115112305, "global_step": 95642, "epoch": 2277} {"train_loss": -6.3613505363464355, "global_step": 95643, "epoch": 2277} {"train_loss": -6.338050842285156, "global_step": 95644, "epoch": 2277} {"train_loss": -6.487915992736816, "global_step": 95645, "epoch": 2277} {"train_loss": -6.409065246582031, "global_step": 95646, "epoch": 2277} {"train_loss": -6.453221321105957, "global_step": 95647, "epoch": 2277} {"train_loss": -6.440450668334961, "global_step": 95648, "epoch": 2277} {"train_loss": -6.342983245849609, "global_step": 95649, "epoch": 2277} {"train_loss": -6.358137130737305, "global_step": 95650, "epoch": 2277} {"train_loss": -6.232900619506836, "global_step": 95651, "epoch": 2277} {"train_loss": -6.3206939697265625, "global_step": 95652, "epoch": 2277} {"train_loss": -6.366215705871582, "global_step": 95653, "epoch": 2277} {"train_loss": -6.3670973777771, "global_step": 95654, "epoch": 2277} {"train_loss": -6.400277137756348, "global_step": 95655, "epoch": 2277} {"train_loss": -6.330103397369385, "global_step": 95656, "epoch": 2277} {"train_loss": -6.372410297393799, "global_step": 95657, "epoch": 2277} {"train_loss": -6.388236045837402, "global_step": 95658, "epoch": 2277} {"train_loss": -6.442349433898926, "global_step": 95659, "epoch": 2277} {"train_loss": -6.174650192260742, "global_step": 95660, "epoch": 2277} {"train_loss": -6.294061660766602, "global_step": 95661, "epoch": 2277} {"train_loss": -6.292299270629883, "global_step": 95662, "epoch": 2277} {"train_loss": -6.270899772644043, "global_step": 95663, "epoch": 2277} {"train_loss": -6.483916282653809, "global_step": 95664, "epoch": 2277} {"train_loss": -6.305320739746094, "global_step": 95665, "epoch": 2277} {"train_loss": -6.31109619140625, "global_step": 95666, "epoch": 2277} {"train_loss": -6.37983512878418, "global_step": 95667, "epoch": 2277} {"train_loss": -6.304871082305908, "global_step": 95668, "epoch": 2277} {"train_loss": -6.113481521606445, "global_step": 95669, "epoch": 2277} {"train_loss": -6.259199619293213, "global_step": 95670, "epoch": 2277} {"train_loss": -6.255651473999023, "global_step": 95671, "epoch": 2277} {"train_loss": -6.281444549560547, "global_step": 95672, "epoch": 2277} {"train_loss": -6.410804271697998, "global_step": 95673, "epoch": 2277} {"train_loss": -6.294059753417969, "global_step": 95674, "epoch": 2277} {"train_loss": -6.339226620537894, "global_step": 95675, "epoch": 2277, "val_loss": 64010.16015625} {"train_loss": -6.372262954711914, "global_step": 95676, "epoch": 2278} {"train_loss": -6.248916149139404, "global_step": 95677, "epoch": 2278} {"train_loss": -6.2478179931640625, "global_step": 95678, "epoch": 2278} {"train_loss": -6.408374786376953, "global_step": 95679, "epoch": 2278} {"train_loss": -6.395364761352539, "global_step": 95680, "epoch": 2278} {"train_loss": -6.3161749839782715, "global_step": 95681, "epoch": 2278} {"train_loss": -6.318286895751953, "global_step": 95682, "epoch": 2278} {"train_loss": -6.333364486694336, "global_step": 95683, "epoch": 2278} {"train_loss": -6.270008087158203, "global_step": 95684, "epoch": 2278} {"train_loss": -6.363400459289551, "global_step": 95685, "epoch": 2278} {"train_loss": -6.3160529136657715, "global_step": 95686, "epoch": 2278} {"train_loss": -6.328533172607422, "global_step": 95687, "epoch": 2278} {"train_loss": -6.238486289978027, "global_step": 95688, "epoch": 2278} {"train_loss": -6.338055610656738, "global_step": 95689, "epoch": 2278} {"train_loss": -6.3438544273376465, "global_step": 95690, "epoch": 2278} {"train_loss": -6.358569145202637, "global_step": 95691, "epoch": 2278} {"train_loss": -6.3564019203186035, "global_step": 95692, "epoch": 2278} {"train_loss": -6.2840166091918945, "global_step": 95693, "epoch": 2278} {"train_loss": -6.382389068603516, "global_step": 95694, "epoch": 2278} {"train_loss": -6.361459255218506, "global_step": 95695, "epoch": 2278} {"train_loss": -6.279480934143066, "global_step": 95696, "epoch": 2278} {"train_loss": -6.228425025939941, "global_step": 95697, "epoch": 2278} {"train_loss": -6.332752227783203, "global_step": 95698, "epoch": 2278} {"train_loss": -6.227864742279053, "global_step": 95699, "epoch": 2278} {"train_loss": -6.288965225219727, "global_step": 95700, "epoch": 2278} {"train_loss": -6.302433490753174, "global_step": 95701, "epoch": 2278} {"train_loss": -6.213869571685791, "global_step": 95702, "epoch": 2278} {"train_loss": -6.353399753570557, "global_step": 95703, "epoch": 2278} {"train_loss": -6.339479446411133, "global_step": 95704, "epoch": 2278} {"train_loss": -6.223569869995117, "global_step": 95705, "epoch": 2278} {"train_loss": -6.295288562774658, "global_step": 95706, "epoch": 2278} {"train_loss": -6.3020148277282715, "global_step": 95707, "epoch": 2278} {"train_loss": -6.300575256347656, "global_step": 95708, "epoch": 2278} {"train_loss": -6.305180549621582, "global_step": 95709, "epoch": 2278} {"train_loss": -6.40623140335083, "global_step": 95710, "epoch": 2278} {"train_loss": -6.228672981262207, "global_step": 95711, "epoch": 2278} {"train_loss": -6.324341773986816, "global_step": 95712, "epoch": 2278} {"train_loss": -6.194141387939453, "global_step": 95713, "epoch": 2278} {"train_loss": -6.314502716064453, "global_step": 95714, "epoch": 2278} {"train_loss": -6.314007759094238, "global_step": 95715, "epoch": 2278} {"train_loss": -6.390964508056641, "global_step": 95716, "epoch": 2278} {"train_loss": -6.308613731747582, "global_step": 95717, "epoch": 2278, "val_loss": 63755.03125} {"train_loss": -6.2290143966674805, "global_step": 95718, "epoch": 2279} {"train_loss": -6.269865036010742, "global_step": 95719, "epoch": 2279} {"train_loss": -6.305166244506836, "global_step": 95720, "epoch": 2279} {"train_loss": -6.178210735321045, "global_step": 95721, "epoch": 2279} {"train_loss": -6.225152015686035, "global_step": 95722, "epoch": 2279} {"train_loss": -6.28622579574585, "global_step": 95723, "epoch": 2279} {"train_loss": -6.246706962585449, "global_step": 95724, "epoch": 2279} {"train_loss": -6.26116418838501, "global_step": 95725, "epoch": 2279} {"train_loss": -6.331515312194824, "global_step": 95726, "epoch": 2279} {"train_loss": -6.1894917488098145, "global_step": 95727, "epoch": 2279} {"train_loss": -6.292189121246338, "global_step": 95728, "epoch": 2279} {"train_loss": -6.272157669067383, "global_step": 95729, "epoch": 2279} {"train_loss": -6.291978359222412, "global_step": 95730, "epoch": 2279} {"train_loss": -6.466160774230957, "global_step": 95731, "epoch": 2279} {"train_loss": -6.27995491027832, "global_step": 95732, "epoch": 2279} {"train_loss": -6.133847236633301, "global_step": 95733, "epoch": 2279} {"train_loss": -6.348685264587402, "global_step": 95734, "epoch": 2279} {"train_loss": -6.307337760925293, "global_step": 95735, "epoch": 2279} {"train_loss": -6.198139190673828, "global_step": 95736, "epoch": 2279} {"train_loss": -6.3257365226745605, "global_step": 95737, "epoch": 2279} {"train_loss": -6.235524654388428, "global_step": 95738, "epoch": 2279} {"train_loss": -6.297282695770264, "global_step": 95739, "epoch": 2279} {"train_loss": -6.301910400390625, "global_step": 95740, "epoch": 2279} {"train_loss": -6.221250057220459, "global_step": 95741, "epoch": 2279} {"train_loss": -6.305082321166992, "global_step": 95742, "epoch": 2279} {"train_loss": -6.23353385925293, "global_step": 95743, "epoch": 2279} {"train_loss": -6.343877792358398, "global_step": 95744, "epoch": 2279} {"train_loss": -6.415249347686768, "global_step": 95745, "epoch": 2279} {"train_loss": -6.369657516479492, "global_step": 95746, "epoch": 2279} {"train_loss": -6.261076927185059, "global_step": 95747, "epoch": 2279} {"train_loss": -6.183207988739014, "global_step": 95748, "epoch": 2279} {"train_loss": -6.207788467407227, "global_step": 95749, "epoch": 2279} {"train_loss": -6.259817123413086, "global_step": 95750, "epoch": 2279} {"train_loss": -6.2441020011901855, "global_step": 95751, "epoch": 2279} {"train_loss": -6.265069961547852, "global_step": 95752, "epoch": 2279} {"train_loss": -6.353275299072266, "global_step": 95753, "epoch": 2279} {"train_loss": -6.260527610778809, "global_step": 95754, "epoch": 2279} {"train_loss": -6.296586990356445, "global_step": 95755, "epoch": 2279} {"train_loss": -6.325573921203613, "global_step": 95756, "epoch": 2279} {"train_loss": -6.246091842651367, "global_step": 95757, "epoch": 2279} {"train_loss": -6.215236663818359, "global_step": 95758, "epoch": 2279} {"train_loss": -6.276037534077962, "global_step": 95759, "epoch": 2279, "val_loss": 63887.60546875} {"train_loss": -6.408943176269531, "global_step": 95760, "epoch": 2280} {"train_loss": -6.191568374633789, "global_step": 95761, "epoch": 2280} {"train_loss": -6.281556129455566, "global_step": 95762, "epoch": 2280} {"train_loss": -6.318289756774902, "global_step": 95763, "epoch": 2280} {"train_loss": -6.313861846923828, "global_step": 95764, "epoch": 2280} {"train_loss": -6.270012855529785, "global_step": 95765, "epoch": 2280} {"train_loss": -6.293386936187744, "global_step": 95766, "epoch": 2280} {"train_loss": -6.388425827026367, "global_step": 95767, "epoch": 2280} {"train_loss": -6.313103675842285, "global_step": 95768, "epoch": 2280} {"train_loss": -6.313698768615723, "global_step": 95769, "epoch": 2280} {"train_loss": -6.343522548675537, "global_step": 95770, "epoch": 2280} {"train_loss": -6.334245681762695, "global_step": 95771, "epoch": 2280} {"train_loss": -6.400199890136719, "global_step": 95772, "epoch": 2280} {"train_loss": -6.358111381530762, "global_step": 95773, "epoch": 2280} {"train_loss": -6.4088029861450195, "global_step": 95774, "epoch": 2280} {"train_loss": -6.388584136962891, "global_step": 95775, "epoch": 2280} {"train_loss": -6.222635746002197, "global_step": 95776, "epoch": 2280} {"train_loss": -6.371062278747559, "global_step": 95777, "epoch": 2280} {"train_loss": -6.392299652099609, "global_step": 95778, "epoch": 2280} {"train_loss": -6.43386173248291, "global_step": 95779, "epoch": 2280} {"train_loss": -6.326973915100098, "global_step": 95780, "epoch": 2280} {"train_loss": -6.4032135009765625, "global_step": 95781, "epoch": 2280} {"train_loss": -6.338462829589844, "global_step": 95782, "epoch": 2280} {"train_loss": -6.363895416259766, "global_step": 95783, "epoch": 2280} {"train_loss": -6.471468448638916, "global_step": 95784, "epoch": 2280} {"train_loss": -6.405828952789307, "global_step": 95785, "epoch": 2280} {"train_loss": -6.38530969619751, "global_step": 95786, "epoch": 2280} {"train_loss": -6.3427300453186035, "global_step": 95787, "epoch": 2280} {"train_loss": -6.40519380569458, "global_step": 95788, "epoch": 2280} {"train_loss": -6.363909721374512, "global_step": 95789, "epoch": 2280} {"train_loss": -6.338741779327393, "global_step": 95790, "epoch": 2280} {"train_loss": -6.340046405792236, "global_step": 95791, "epoch": 2280} {"train_loss": -6.245847702026367, "global_step": 95792, "epoch": 2280} {"train_loss": -6.392580986022949, "global_step": 95793, "epoch": 2280} {"train_loss": -6.355320930480957, "global_step": 95794, "epoch": 2280} {"train_loss": -6.3262763023376465, "global_step": 95795, "epoch": 2280} {"train_loss": -6.3605241775512695, "global_step": 95796, "epoch": 2280} {"train_loss": -6.219511032104492, "global_step": 95797, "epoch": 2280} {"train_loss": -6.283545970916748, "global_step": 95798, "epoch": 2280} {"train_loss": -6.329174518585205, "global_step": 95799, "epoch": 2280} {"train_loss": -6.204742908477783, "global_step": 95800, "epoch": 2280} {"train_loss": -6.342407192502703, "global_step": 95801, "epoch": 2280, "val_loss": 63559.015625} {"train_loss": -6.406505584716797, "global_step": 95802, "epoch": 2281} {"train_loss": -6.425185203552246, "global_step": 95803, "epoch": 2281} {"train_loss": -6.2987775802612305, "global_step": 95804, "epoch": 2281} {"train_loss": -6.368242263793945, "global_step": 95805, "epoch": 2281} {"train_loss": -6.447978496551514, "global_step": 95806, "epoch": 2281} {"train_loss": -6.306431770324707, "global_step": 95807, "epoch": 2281} {"train_loss": -6.277096271514893, "global_step": 95808, "epoch": 2281} {"train_loss": -6.219629287719727, "global_step": 95809, "epoch": 2281} {"train_loss": -6.425881385803223, "global_step": 95810, "epoch": 2281} {"train_loss": -6.322719573974609, "global_step": 95811, "epoch": 2281} {"train_loss": -6.327085494995117, "global_step": 95812, "epoch": 2281} {"train_loss": -6.381791114807129, "global_step": 95813, "epoch": 2281} {"train_loss": -6.426567077636719, "global_step": 95814, "epoch": 2281} {"train_loss": -6.244841575622559, "global_step": 95815, "epoch": 2281} {"train_loss": -6.359615325927734, "global_step": 95816, "epoch": 2281} {"train_loss": -6.346377372741699, "global_step": 95817, "epoch": 2281} {"train_loss": -6.380745887756348, "global_step": 95818, "epoch": 2281} {"train_loss": -6.228843688964844, "global_step": 95819, "epoch": 2281} {"train_loss": -6.280123710632324, "global_step": 95820, "epoch": 2281} {"train_loss": -6.303855895996094, "global_step": 95821, "epoch": 2281} {"train_loss": -6.2896575927734375, "global_step": 95822, "epoch": 2281} {"train_loss": -6.387629508972168, "global_step": 95823, "epoch": 2281} {"train_loss": -6.419607162475586, "global_step": 95824, "epoch": 2281} {"train_loss": -6.385106086730957, "global_step": 95825, "epoch": 2281} {"train_loss": -6.377105712890625, "global_step": 95826, "epoch": 2281} {"train_loss": -6.2185564041137695, "global_step": 95827, "epoch": 2281} {"train_loss": -6.368866920471191, "global_step": 95828, "epoch": 2281} {"train_loss": -6.353523254394531, "global_step": 95829, "epoch": 2281} {"train_loss": -6.300827980041504, "global_step": 95830, "epoch": 2281} {"train_loss": -6.2229814529418945, "global_step": 95831, "epoch": 2281} {"train_loss": -6.305466175079346, "global_step": 95832, "epoch": 2281} {"train_loss": -6.348334789276123, "global_step": 95833, "epoch": 2281} {"train_loss": -6.2920732498168945, "global_step": 95834, "epoch": 2281} {"train_loss": -6.321335315704346, "global_step": 95835, "epoch": 2281} {"train_loss": -6.316417694091797, "global_step": 95836, "epoch": 2281} {"train_loss": -6.267739295959473, "global_step": 95837, "epoch": 2281} {"train_loss": -6.375218391418457, "global_step": 95838, "epoch": 2281} {"train_loss": -6.305373191833496, "global_step": 95839, "epoch": 2281} {"train_loss": -6.388188362121582, "global_step": 95840, "epoch": 2281} {"train_loss": -6.323200225830078, "global_step": 95841, "epoch": 2281} {"train_loss": -6.336562156677246, "global_step": 95842, "epoch": 2281} {"train_loss": -6.334329253151303, "global_step": 95843, "epoch": 2281, "val_loss": 63787.12109375} {"train_loss": -6.391834259033203, "global_step": 95844, "epoch": 2282} {"train_loss": -6.299706935882568, "global_step": 95845, "epoch": 2282} {"train_loss": -6.320417881011963, "global_step": 95846, "epoch": 2282} {"train_loss": -6.452391147613525, "global_step": 95847, "epoch": 2282} {"train_loss": -6.4073381423950195, "global_step": 95848, "epoch": 2282} {"train_loss": -6.409420013427734, "global_step": 95849, "epoch": 2282} {"train_loss": -6.385034561157227, "global_step": 95850, "epoch": 2282} {"train_loss": -6.30126953125, "global_step": 95851, "epoch": 2282} {"train_loss": -6.316087245941162, "global_step": 95852, "epoch": 2282} {"train_loss": -6.310647964477539, "global_step": 95853, "epoch": 2282} {"train_loss": -6.274711608886719, "global_step": 95854, "epoch": 2282} {"train_loss": -6.248879432678223, "global_step": 95855, "epoch": 2282} {"train_loss": -6.451184272766113, "global_step": 95856, "epoch": 2282} {"train_loss": -6.417792320251465, "global_step": 95857, "epoch": 2282} {"train_loss": -6.143303871154785, "global_step": 95858, "epoch": 2282} {"train_loss": -6.275449275970459, "global_step": 95859, "epoch": 2282} {"train_loss": -6.374967575073242, "global_step": 95860, "epoch": 2282} {"train_loss": -6.374818801879883, "global_step": 95861, "epoch": 2282} {"train_loss": -6.264206886291504, "global_step": 95862, "epoch": 2282} {"train_loss": -6.298784255981445, "global_step": 95863, "epoch": 2282} {"train_loss": -6.4723005294799805, "global_step": 95864, "epoch": 2282} {"train_loss": -6.287322044372559, "global_step": 95865, "epoch": 2282} {"train_loss": -6.341525077819824, "global_step": 95866, "epoch": 2282} {"train_loss": -6.312849044799805, "global_step": 95867, "epoch": 2282} {"train_loss": -6.230804443359375, "global_step": 95868, "epoch": 2282} {"train_loss": -6.331322193145752, "global_step": 95869, "epoch": 2282} {"train_loss": -6.3027825355529785, "global_step": 95870, "epoch": 2282} {"train_loss": -6.25753116607666, "global_step": 95871, "epoch": 2282} {"train_loss": -6.162344932556152, "global_step": 95872, "epoch": 2282} {"train_loss": -6.2150373458862305, "global_step": 95873, "epoch": 2282} {"train_loss": -6.354544162750244, "global_step": 95874, "epoch": 2282} {"train_loss": -6.3449296951293945, "global_step": 95875, "epoch": 2282} {"train_loss": -6.364859580993652, "global_step": 95876, "epoch": 2282} {"train_loss": -6.416398525238037, "global_step": 95877, "epoch": 2282} {"train_loss": -6.247955322265625, "global_step": 95878, "epoch": 2282} {"train_loss": -6.371356964111328, "global_step": 95879, "epoch": 2282} {"train_loss": -6.382820129394531, "global_step": 95880, "epoch": 2282} {"train_loss": -6.392403602600098, "global_step": 95881, "epoch": 2282} {"train_loss": -6.337802886962891, "global_step": 95882, "epoch": 2282} {"train_loss": -6.45710563659668, "global_step": 95883, "epoch": 2282} {"train_loss": -6.330780506134033, "global_step": 95884, "epoch": 2282} {"train_loss": -6.3347767648242765, "global_step": 95885, "epoch": 2282, "val_loss": 63738.20703125} {"train_loss": -6.313312530517578, "global_step": 95886, "epoch": 2283} {"train_loss": -6.377355575561523, "global_step": 95887, "epoch": 2283} {"train_loss": -6.245244026184082, "global_step": 95888, "epoch": 2283} {"train_loss": -6.412108421325684, "global_step": 95889, "epoch": 2283} {"train_loss": -6.235910415649414, "global_step": 95890, "epoch": 2283} {"train_loss": -6.276719093322754, "global_step": 95891, "epoch": 2283} {"train_loss": -6.227609634399414, "global_step": 95892, "epoch": 2283} {"train_loss": -6.309998989105225, "global_step": 95893, "epoch": 2283} {"train_loss": -6.293795585632324, "global_step": 95894, "epoch": 2283} {"train_loss": -6.260790824890137, "global_step": 95895, "epoch": 2283} {"train_loss": -6.414482116699219, "global_step": 95896, "epoch": 2283} {"train_loss": -6.2832183837890625, "global_step": 95897, "epoch": 2283} {"train_loss": -6.422244071960449, "global_step": 95898, "epoch": 2283} {"train_loss": -6.343640327453613, "global_step": 95899, "epoch": 2283} {"train_loss": -6.364809989929199, "global_step": 95900, "epoch": 2283} {"train_loss": -6.310554504394531, "global_step": 95901, "epoch": 2283} {"train_loss": -6.335119247436523, "global_step": 95902, "epoch": 2283} {"train_loss": -6.254321575164795, "global_step": 95903, "epoch": 2283} {"train_loss": -6.265070915222168, "global_step": 95904, "epoch": 2283} {"train_loss": -6.332815170288086, "global_step": 95905, "epoch": 2283} {"train_loss": -6.275673866271973, "global_step": 95906, "epoch": 2283} {"train_loss": -6.372939586639404, "global_step": 95907, "epoch": 2283} {"train_loss": -6.341268539428711, "global_step": 95908, "epoch": 2283} {"train_loss": -6.320465087890625, "global_step": 95909, "epoch": 2283} {"train_loss": -6.349309921264648, "global_step": 95910, "epoch": 2283} {"train_loss": -6.201031684875488, "global_step": 95911, "epoch": 2283} {"train_loss": -6.422289848327637, "global_step": 95912, "epoch": 2283} {"train_loss": -6.394383907318115, "global_step": 95913, "epoch": 2283} {"train_loss": -6.408788681030273, "global_step": 95914, "epoch": 2283} {"train_loss": -6.332056999206543, "global_step": 95915, "epoch": 2283} {"train_loss": -6.33286714553833, "global_step": 95916, "epoch": 2283} {"train_loss": -6.261063575744629, "global_step": 95917, "epoch": 2283} {"train_loss": -6.300520896911621, "global_step": 95918, "epoch": 2283} {"train_loss": -6.31891393661499, "global_step": 95919, "epoch": 2283} {"train_loss": -6.3573784828186035, "global_step": 95920, "epoch": 2283} {"train_loss": -6.35252046585083, "global_step": 95921, "epoch": 2283} {"train_loss": -6.330305576324463, "global_step": 95922, "epoch": 2283} {"train_loss": -6.329784393310547, "global_step": 95923, "epoch": 2283} {"train_loss": -6.2878947257995605, "global_step": 95924, "epoch": 2283} {"train_loss": -6.299773693084717, "global_step": 95925, "epoch": 2283} {"train_loss": -6.235587120056152, "global_step": 95926, "epoch": 2283} {"train_loss": -6.317449308577038, "global_step": 95927, "epoch": 2283, "val_loss": 63902.77734375} {"train_loss": -6.283856391906738, "global_step": 95928, "epoch": 2284} {"train_loss": -6.407357215881348, "global_step": 95929, "epoch": 2284} {"train_loss": -6.232736587524414, "global_step": 95930, "epoch": 2284} {"train_loss": -6.177982330322266, "global_step": 95931, "epoch": 2284} {"train_loss": -6.425835609436035, "global_step": 95932, "epoch": 2284} {"train_loss": -6.142853736877441, "global_step": 95933, "epoch": 2284} {"train_loss": -6.381105899810791, "global_step": 95934, "epoch": 2284} {"train_loss": -6.319405555725098, "global_step": 95935, "epoch": 2284} {"train_loss": -6.288246154785156, "global_step": 95936, "epoch": 2284} {"train_loss": -6.211057662963867, "global_step": 95937, "epoch": 2284} {"train_loss": -6.334903717041016, "global_step": 95938, "epoch": 2284} {"train_loss": -6.338214874267578, "global_step": 95939, "epoch": 2284} {"train_loss": -6.30269718170166, "global_step": 95940, "epoch": 2284} {"train_loss": -6.310439109802246, "global_step": 95941, "epoch": 2284} {"train_loss": -6.505353927612305, "global_step": 95942, "epoch": 2284} {"train_loss": -6.268790245056152, "global_step": 95943, "epoch": 2284} {"train_loss": -6.315770149230957, "global_step": 95944, "epoch": 2284} {"train_loss": -6.359305381774902, "global_step": 95945, "epoch": 2284} {"train_loss": -6.425478458404541, "global_step": 95946, "epoch": 2284} {"train_loss": -6.32819128036499, "global_step": 95947, "epoch": 2284} {"train_loss": -6.213527679443359, "global_step": 95948, "epoch": 2284} {"train_loss": -6.337658882141113, "global_step": 95949, "epoch": 2284} {"train_loss": -6.3752641677856445, "global_step": 95950, "epoch": 2284} {"train_loss": -6.305230140686035, "global_step": 95951, "epoch": 2284} {"train_loss": -6.353455066680908, "global_step": 95952, "epoch": 2284} {"train_loss": -6.335478782653809, "global_step": 95953, "epoch": 2284} {"train_loss": -6.296199798583984, "global_step": 95954, "epoch": 2284} {"train_loss": -6.327301502227783, "global_step": 95955, "epoch": 2284} {"train_loss": -6.197466850280762, "global_step": 95956, "epoch": 2284} {"train_loss": -6.314918518066406, "global_step": 95957, "epoch": 2284} {"train_loss": -6.272947788238525, "global_step": 95958, "epoch": 2284} {"train_loss": -6.376424789428711, "global_step": 95959, "epoch": 2284} {"train_loss": -6.386996746063232, "global_step": 95960, "epoch": 2284} {"train_loss": -6.35987663269043, "global_step": 95961, "epoch": 2284} {"train_loss": -6.3055620193481445, "global_step": 95962, "epoch": 2284} {"train_loss": -6.33106803894043, "global_step": 95963, "epoch": 2284} {"train_loss": -6.349435806274414, "global_step": 95964, "epoch": 2284} {"train_loss": -6.385444641113281, "global_step": 95965, "epoch": 2284} {"train_loss": -6.28790283203125, "global_step": 95966, "epoch": 2284} {"train_loss": -6.289941310882568, "global_step": 95967, "epoch": 2284} {"train_loss": -6.330589294433594, "global_step": 95968, "epoch": 2284} {"train_loss": -6.319214321318126, "global_step": 95969, "epoch": 2284, "val_loss": 63665.15625} {"train_loss": -6.277128219604492, "global_step": 95970, "epoch": 2285} {"train_loss": -6.316134452819824, "global_step": 95971, "epoch": 2285} {"train_loss": -6.267918586730957, "global_step": 95972, "epoch": 2285} {"train_loss": -6.253807067871094, "global_step": 95973, "epoch": 2285} {"train_loss": -6.27987813949585, "global_step": 95974, "epoch": 2285} {"train_loss": -6.270936012268066, "global_step": 95975, "epoch": 2285} {"train_loss": -6.138550758361816, "global_step": 95976, "epoch": 2285} {"train_loss": -6.28441047668457, "global_step": 95977, "epoch": 2285} {"train_loss": -6.425195693969727, "global_step": 95978, "epoch": 2285} {"train_loss": -6.300748348236084, "global_step": 95979, "epoch": 2285} {"train_loss": -6.337891578674316, "global_step": 95980, "epoch": 2285} {"train_loss": -6.359629154205322, "global_step": 95981, "epoch": 2285} {"train_loss": -6.41580867767334, "global_step": 95982, "epoch": 2285} {"train_loss": -6.406556129455566, "global_step": 95983, "epoch": 2285} {"train_loss": -6.387720584869385, "global_step": 95984, "epoch": 2285} {"train_loss": -6.413978576660156, "global_step": 95985, "epoch": 2285} {"train_loss": -6.4557647705078125, "global_step": 95986, "epoch": 2285} {"train_loss": -6.322583198547363, "global_step": 95987, "epoch": 2285} {"train_loss": -6.411929130554199, "global_step": 95988, "epoch": 2285} {"train_loss": -6.347024440765381, "global_step": 95989, "epoch": 2285} {"train_loss": -6.402798652648926, "global_step": 95990, "epoch": 2285} {"train_loss": -6.350441932678223, "global_step": 95991, "epoch": 2285} {"train_loss": -6.337813377380371, "global_step": 95992, "epoch": 2285} {"train_loss": -6.411272048950195, "global_step": 95993, "epoch": 2285} {"train_loss": -6.313652038574219, "global_step": 95994, "epoch": 2285} {"train_loss": -6.411640167236328, "global_step": 95995, "epoch": 2285} {"train_loss": -6.207314491271973, "global_step": 95996, "epoch": 2285} {"train_loss": -6.299934387207031, "global_step": 95997, "epoch": 2285} {"train_loss": -6.341184616088867, "global_step": 95998, "epoch": 2285} {"train_loss": -6.257190704345703, "global_step": 95999, "epoch": 2285} {"train_loss": -6.31032657623291, "global_step": 96000, "epoch": 2285} {"train_loss": -6.2327680587768555, "global_step": 96001, "epoch": 2285} {"train_loss": -6.26066780090332, "global_step": 96002, "epoch": 2285} {"train_loss": -6.323400497436523, "global_step": 96003, "epoch": 2285} {"train_loss": -6.259832382202148, "global_step": 96004, "epoch": 2285} {"train_loss": -6.298830509185791, "global_step": 96005, "epoch": 2285} {"train_loss": -6.271468162536621, "global_step": 96006, "epoch": 2285} {"train_loss": -6.300720691680908, "global_step": 96007, "epoch": 2285} {"train_loss": -6.327335834503174, "global_step": 96008, "epoch": 2285} {"train_loss": -6.3057169914245605, "global_step": 96009, "epoch": 2285} {"train_loss": -6.37607479095459, "global_step": 96010, "epoch": 2285} {"train_loss": -6.322374514171055, "global_step": 96011, "epoch": 2285, "val_loss": 64073.39453125} {"train_loss": -6.207069396972656, "global_step": 96012, "epoch": 2286} {"train_loss": -6.382379531860352, "global_step": 96013, "epoch": 2286} {"train_loss": -6.248867034912109, "global_step": 96014, "epoch": 2286} {"train_loss": -6.380925178527832, "global_step": 96015, "epoch": 2286} {"train_loss": -6.323359966278076, "global_step": 96016, "epoch": 2286} {"train_loss": -6.428848743438721, "global_step": 96017, "epoch": 2286} {"train_loss": -6.354729652404785, "global_step": 96018, "epoch": 2286} {"train_loss": -6.392604827880859, "global_step": 96019, "epoch": 2286} {"train_loss": -6.330479621887207, "global_step": 96020, "epoch": 2286} {"train_loss": -6.252535343170166, "global_step": 96021, "epoch": 2286} {"train_loss": -6.300492286682129, "global_step": 96022, "epoch": 2286} {"train_loss": -6.320978164672852, "global_step": 96023, "epoch": 2286} {"train_loss": -6.344300270080566, "global_step": 96024, "epoch": 2286} {"train_loss": -6.333477020263672, "global_step": 96025, "epoch": 2286} {"train_loss": -6.396261215209961, "global_step": 96026, "epoch": 2286} {"train_loss": -6.350429058074951, "global_step": 96027, "epoch": 2286} {"train_loss": -6.460721969604492, "global_step": 96028, "epoch": 2286} {"train_loss": -6.394669055938721, "global_step": 96029, "epoch": 2286} {"train_loss": -6.410618782043457, "global_step": 96030, "epoch": 2286} {"train_loss": -6.329451560974121, "global_step": 96031, "epoch": 2286} {"train_loss": -6.381114959716797, "global_step": 96032, "epoch": 2286} {"train_loss": -6.3556013107299805, "global_step": 96033, "epoch": 2286} {"train_loss": -6.346526145935059, "global_step": 96034, "epoch": 2286} {"train_loss": -6.376282215118408, "global_step": 96035, "epoch": 2286} {"train_loss": -6.3039116859436035, "global_step": 96036, "epoch": 2286} {"train_loss": -6.429241180419922, "global_step": 96037, "epoch": 2286} {"train_loss": -6.399064064025879, "global_step": 96038, "epoch": 2286} {"train_loss": -6.307019233703613, "global_step": 96039, "epoch": 2286} {"train_loss": -6.330155849456787, "global_step": 96040, "epoch": 2286} {"train_loss": -6.398086071014404, "global_step": 96041, "epoch": 2286} {"train_loss": -6.416382789611816, "global_step": 96042, "epoch": 2286} {"train_loss": -6.473266124725342, "global_step": 96043, "epoch": 2286} {"train_loss": -6.2618818283081055, "global_step": 96044, "epoch": 2286} {"train_loss": -6.43204402923584, "global_step": 96045, "epoch": 2286} {"train_loss": -6.371781826019287, "global_step": 96046, "epoch": 2286} {"train_loss": -6.408177375793457, "global_step": 96047, "epoch": 2286} {"train_loss": -6.428651809692383, "global_step": 96048, "epoch": 2286} {"train_loss": -6.381575584411621, "global_step": 96049, "epoch": 2286} {"train_loss": -6.365955829620361, "global_step": 96050, "epoch": 2286} {"train_loss": -6.3383307456970215, "global_step": 96051, "epoch": 2286} {"train_loss": -6.279387474060059, "global_step": 96052, "epoch": 2286} {"train_loss": -6.3583036831447055, "global_step": 96053, "epoch": 2286, "val_loss": 63722.0625} {"train_loss": -6.368145942687988, "global_step": 96054, "epoch": 2287} {"train_loss": -6.446517467498779, "global_step": 96055, "epoch": 2287} {"train_loss": -6.509200096130371, "global_step": 96056, "epoch": 2287} {"train_loss": -6.378596782684326, "global_step": 96057, "epoch": 2287} {"train_loss": -6.407161712646484, "global_step": 96058, "epoch": 2287} {"train_loss": -6.300953388214111, "global_step": 96059, "epoch": 2287} {"train_loss": -6.351634979248047, "global_step": 96060, "epoch": 2287} {"train_loss": -6.506221771240234, "global_step": 96061, "epoch": 2287} {"train_loss": -6.231543064117432, "global_step": 96062, "epoch": 2287} {"train_loss": -6.302870273590088, "global_step": 96063, "epoch": 2287} {"train_loss": -6.379639625549316, "global_step": 96064, "epoch": 2287} {"train_loss": -6.387314796447754, "global_step": 96065, "epoch": 2287} {"train_loss": -6.401952743530273, "global_step": 96066, "epoch": 2287} {"train_loss": -6.397481918334961, "global_step": 96067, "epoch": 2287} {"train_loss": -6.391932010650635, "global_step": 96068, "epoch": 2287} {"train_loss": -6.308966636657715, "global_step": 96069, "epoch": 2287} {"train_loss": -6.385047912597656, "global_step": 96070, "epoch": 2287} {"train_loss": -6.431990623474121, "global_step": 96071, "epoch": 2287} {"train_loss": -6.337424278259277, "global_step": 96072, "epoch": 2287} {"train_loss": -6.365394592285156, "global_step": 96073, "epoch": 2287} {"train_loss": -6.36873197555542, "global_step": 96074, "epoch": 2287} {"train_loss": -6.360639572143555, "global_step": 96075, "epoch": 2287} {"train_loss": -6.2537736892700195, "global_step": 96076, "epoch": 2287} {"train_loss": -6.354164123535156, "global_step": 96077, "epoch": 2287} {"train_loss": -6.349789619445801, "global_step": 96078, "epoch": 2287} {"train_loss": -6.244877815246582, "global_step": 96079, "epoch": 2287} {"train_loss": -6.244494915008545, "global_step": 96080, "epoch": 2287} {"train_loss": -6.353066444396973, "global_step": 96081, "epoch": 2287} {"train_loss": -6.263273239135742, "global_step": 96082, "epoch": 2287} {"train_loss": -6.209836959838867, "global_step": 96083, "epoch": 2287} {"train_loss": -6.2402119636535645, "global_step": 96084, "epoch": 2287} {"train_loss": -6.14846658706665, "global_step": 96085, "epoch": 2287} {"train_loss": -6.302223205566406, "global_step": 96086, "epoch": 2287} {"train_loss": -6.17418098449707, "global_step": 96087, "epoch": 2287} {"train_loss": -6.214706897735596, "global_step": 96088, "epoch": 2287} {"train_loss": -6.096856594085693, "global_step": 96089, "epoch": 2287} {"train_loss": -6.132732391357422, "global_step": 96090, "epoch": 2287} {"train_loss": -6.362504959106445, "global_step": 96091, "epoch": 2287} {"train_loss": -6.160909652709961, "global_step": 96092, "epoch": 2287} {"train_loss": -6.358964920043945, "global_step": 96093, "epoch": 2287} {"train_loss": -6.275783061981201, "global_step": 96094, "epoch": 2287} {"train_loss": -6.319938886733282, "global_step": 96095, "epoch": 2287, "val_loss": 63697.15234375} {"train_loss": -6.350778579711914, "global_step": 96096, "epoch": 2288} {"train_loss": -6.181039333343506, "global_step": 96097, "epoch": 2288} {"train_loss": -6.327603816986084, "global_step": 96098, "epoch": 2288} {"train_loss": -5.978111267089844, "global_step": 96099, "epoch": 2288} {"train_loss": -6.260137557983398, "global_step": 96100, "epoch": 2288} {"train_loss": -6.139994144439697, "global_step": 96101, "epoch": 2288} {"train_loss": -6.267070770263672, "global_step": 96102, "epoch": 2288} {"train_loss": -6.1464667320251465, "global_step": 96103, "epoch": 2288} {"train_loss": -6.229851722717285, "global_step": 96104, "epoch": 2288} {"train_loss": -6.23256778717041, "global_step": 96105, "epoch": 2288} {"train_loss": -6.138965606689453, "global_step": 96106, "epoch": 2288} {"train_loss": -6.17996883392334, "global_step": 96107, "epoch": 2288} {"train_loss": -6.141717433929443, "global_step": 96108, "epoch": 2288} {"train_loss": -6.362476348876953, "global_step": 96109, "epoch": 2288} {"train_loss": -6.180037021636963, "global_step": 96110, "epoch": 2288} {"train_loss": -6.410006999969482, "global_step": 96111, "epoch": 2288} {"train_loss": -6.037795066833496, "global_step": 96112, "epoch": 2288} {"train_loss": -6.229269981384277, "global_step": 96113, "epoch": 2288} {"train_loss": -6.2929534912109375, "global_step": 96114, "epoch": 2288} {"train_loss": -6.213775634765625, "global_step": 96115, "epoch": 2288} {"train_loss": -6.230491638183594, "global_step": 96116, "epoch": 2288} {"train_loss": -6.253717422485352, "global_step": 96117, "epoch": 2288} {"train_loss": -6.3093743324279785, "global_step": 96118, "epoch": 2288} {"train_loss": -6.3654303550720215, "global_step": 96119, "epoch": 2288} {"train_loss": -6.2750244140625, "global_step": 96120, "epoch": 2288} {"train_loss": -6.203352928161621, "global_step": 96121, "epoch": 2288} {"train_loss": -6.315038681030273, "global_step": 96122, "epoch": 2288} {"train_loss": -6.198076248168945, "global_step": 96123, "epoch": 2288} {"train_loss": -6.316412448883057, "global_step": 96124, "epoch": 2288} {"train_loss": -6.3139753341674805, "global_step": 96125, "epoch": 2288} {"train_loss": -6.30367374420166, "global_step": 96126, "epoch": 2288} {"train_loss": -6.344583034515381, "global_step": 96127, "epoch": 2288} {"train_loss": -6.337271690368652, "global_step": 96128, "epoch": 2288} {"train_loss": -6.276578903198242, "global_step": 96129, "epoch": 2288} {"train_loss": -6.314816474914551, "global_step": 96130, "epoch": 2288} {"train_loss": -6.339722633361816, "global_step": 96131, "epoch": 2288} {"train_loss": -6.318584442138672, "global_step": 96132, "epoch": 2288} {"train_loss": -6.337689399719238, "global_step": 96133, "epoch": 2288} {"train_loss": -6.302792072296143, "global_step": 96134, "epoch": 2288} {"train_loss": -6.388667106628418, "global_step": 96135, "epoch": 2288} {"train_loss": -6.295262813568115, "global_step": 96136, "epoch": 2288} {"train_loss": -6.25963815053304, "global_step": 96137, "epoch": 2288, "val_loss": 63482.8046875} {"train_loss": -6.339727878570557, "global_step": 96138, "epoch": 2289} {"train_loss": -6.308943748474121, "global_step": 96139, "epoch": 2289} {"train_loss": -6.282099723815918, "global_step": 96140, "epoch": 2289} {"train_loss": -6.256453514099121, "global_step": 96141, "epoch": 2289} {"train_loss": -6.3012895584106445, "global_step": 96142, "epoch": 2289} {"train_loss": -6.429018974304199, "global_step": 96143, "epoch": 2289} {"train_loss": -6.287924766540527, "global_step": 96144, "epoch": 2289} {"train_loss": -6.236650466918945, "global_step": 96145, "epoch": 2289} {"train_loss": -6.284828186035156, "global_step": 96146, "epoch": 2289} {"train_loss": -6.22722053527832, "global_step": 96147, "epoch": 2289} {"train_loss": -6.333022117614746, "global_step": 96148, "epoch": 2289} {"train_loss": -6.257171630859375, "global_step": 96149, "epoch": 2289} {"train_loss": -6.172237873077393, "global_step": 96150, "epoch": 2289} {"train_loss": -6.253740310668945, "global_step": 96151, "epoch": 2289} {"train_loss": -6.349583148956299, "global_step": 96152, "epoch": 2289} {"train_loss": -6.215002059936523, "global_step": 96153, "epoch": 2289} {"train_loss": -6.391027927398682, "global_step": 96154, "epoch": 2289} {"train_loss": -6.3092875480651855, "global_step": 96155, "epoch": 2289} {"train_loss": -6.251227855682373, "global_step": 96156, "epoch": 2289} {"train_loss": -6.319192409515381, "global_step": 96157, "epoch": 2289} {"train_loss": -6.3621344566345215, "global_step": 96158, "epoch": 2289} {"train_loss": -6.296470642089844, "global_step": 96159, "epoch": 2289} {"train_loss": -6.4809675216674805, "global_step": 96160, "epoch": 2289} {"train_loss": -6.391354084014893, "global_step": 96161, "epoch": 2289} {"train_loss": -6.18405818939209, "global_step": 96162, "epoch": 2289} {"train_loss": -6.344062805175781, "global_step": 96163, "epoch": 2289} {"train_loss": -6.327856063842773, "global_step": 96164, "epoch": 2289} {"train_loss": -6.342409133911133, "global_step": 96165, "epoch": 2289} {"train_loss": -6.321377277374268, "global_step": 96166, "epoch": 2289} {"train_loss": -6.267576217651367, "global_step": 96167, "epoch": 2289} {"train_loss": -6.309118270874023, "global_step": 96168, "epoch": 2289} {"train_loss": -6.428535461425781, "global_step": 96169, "epoch": 2289} {"train_loss": -6.363574981689453, "global_step": 96170, "epoch": 2289} {"train_loss": -6.37639045715332, "global_step": 96171, "epoch": 2289} {"train_loss": -6.385112762451172, "global_step": 96172, "epoch": 2289} {"train_loss": -6.349875450134277, "global_step": 96173, "epoch": 2289} {"train_loss": -6.404382705688477, "global_step": 96174, "epoch": 2289} {"train_loss": -6.326107025146484, "global_step": 96175, "epoch": 2289} {"train_loss": -6.3167724609375, "global_step": 96176, "epoch": 2289} {"train_loss": -6.310318946838379, "global_step": 96177, "epoch": 2289} {"train_loss": -6.503861904144287, "global_step": 96178, "epoch": 2289} {"train_loss": -6.32103875705174, "global_step": 96179, "epoch": 2289, "val_loss": 63623.4140625} {"train_loss": -6.331120491027832, "global_step": 96180, "epoch": 2290} {"train_loss": -6.36555290222168, "global_step": 96181, "epoch": 2290} {"train_loss": -6.432920932769775, "global_step": 96182, "epoch": 2290} {"train_loss": -6.318737983703613, "global_step": 96183, "epoch": 2290} {"train_loss": -6.2927045822143555, "global_step": 96184, "epoch": 2290} {"train_loss": -6.224688529968262, "global_step": 96185, "epoch": 2290} {"train_loss": -6.34577751159668, "global_step": 96186, "epoch": 2290} {"train_loss": -6.300465106964111, "global_step": 96187, "epoch": 2290} {"train_loss": -6.349419116973877, "global_step": 96188, "epoch": 2290} {"train_loss": -6.453434944152832, "global_step": 96189, "epoch": 2290} {"train_loss": -6.28035831451416, "global_step": 96190, "epoch": 2290} {"train_loss": -6.374241352081299, "global_step": 96191, "epoch": 2290} {"train_loss": -6.319496154785156, "global_step": 96192, "epoch": 2290} {"train_loss": -6.30650520324707, "global_step": 96193, "epoch": 2290} {"train_loss": -6.362391948699951, "global_step": 96194, "epoch": 2290} {"train_loss": -6.325067520141602, "global_step": 96195, "epoch": 2290} {"train_loss": -6.441176414489746, "global_step": 96196, "epoch": 2290} {"train_loss": -6.434667587280273, "global_step": 96197, "epoch": 2290} {"train_loss": -6.38887357711792, "global_step": 96198, "epoch": 2290} {"train_loss": -6.251522541046143, "global_step": 96199, "epoch": 2290} {"train_loss": -6.4432373046875, "global_step": 96200, "epoch": 2290} {"train_loss": -6.295260429382324, "global_step": 96201, "epoch": 2290} {"train_loss": -6.278755187988281, "global_step": 96202, "epoch": 2290} {"train_loss": -6.401562213897705, "global_step": 96203, "epoch": 2290} {"train_loss": -6.41825008392334, "global_step": 96204, "epoch": 2290} {"train_loss": -6.217077732086182, "global_step": 96205, "epoch": 2290} {"train_loss": -6.36836051940918, "global_step": 96206, "epoch": 2290} {"train_loss": -6.361428260803223, "global_step": 96207, "epoch": 2290} {"train_loss": -6.179047584533691, "global_step": 96208, "epoch": 2290} {"train_loss": -6.393487930297852, "global_step": 96209, "epoch": 2290} {"train_loss": -6.222508430480957, "global_step": 96210, "epoch": 2290} {"train_loss": -6.356904029846191, "global_step": 96211, "epoch": 2290} {"train_loss": -6.258344650268555, "global_step": 96212, "epoch": 2290} {"train_loss": -6.405965805053711, "global_step": 96213, "epoch": 2290} {"train_loss": -6.248648166656494, "global_step": 96214, "epoch": 2290} {"train_loss": -6.379040718078613, "global_step": 96215, "epoch": 2290} {"train_loss": -6.270956993103027, "global_step": 96216, "epoch": 2290} {"train_loss": -6.2624921798706055, "global_step": 96217, "epoch": 2290} {"train_loss": -6.231356620788574, "global_step": 96218, "epoch": 2290} {"train_loss": -6.270158767700195, "global_step": 96219, "epoch": 2290} {"train_loss": -6.196201324462891, "global_step": 96220, "epoch": 2290} {"train_loss": -6.324724855877104, "global_step": 96221, "epoch": 2290, "val_loss": 63875.84765625} {"train_loss": -6.202442646026611, "global_step": 96222, "epoch": 2291} {"train_loss": -6.286797046661377, "global_step": 96223, "epoch": 2291} {"train_loss": -6.313966274261475, "global_step": 96224, "epoch": 2291} {"train_loss": -6.135978698730469, "global_step": 96225, "epoch": 2291} {"train_loss": -6.211130142211914, "global_step": 96226, "epoch": 2291} {"train_loss": -6.405023574829102, "global_step": 96227, "epoch": 2291} {"train_loss": -6.252011775970459, "global_step": 96228, "epoch": 2291} {"train_loss": -6.421520233154297, "global_step": 96229, "epoch": 2291} {"train_loss": -6.2656731605529785, "global_step": 96230, "epoch": 2291} {"train_loss": -6.317540168762207, "global_step": 96231, "epoch": 2291} {"train_loss": -6.402675628662109, "global_step": 96232, "epoch": 2291} {"train_loss": -6.169903755187988, "global_step": 96233, "epoch": 2291} {"train_loss": -6.349092960357666, "global_step": 96234, "epoch": 2291} {"train_loss": -6.404543399810791, "global_step": 96235, "epoch": 2291} {"train_loss": -6.317719459533691, "global_step": 96236, "epoch": 2291} {"train_loss": -6.289034843444824, "global_step": 96237, "epoch": 2291} {"train_loss": -6.389638900756836, "global_step": 96238, "epoch": 2291} {"train_loss": -6.286357402801514, "global_step": 96239, "epoch": 2291} {"train_loss": -6.330286026000977, "global_step": 96240, "epoch": 2291} {"train_loss": -6.338663101196289, "global_step": 96241, "epoch": 2291} {"train_loss": -6.327099800109863, "global_step": 96242, "epoch": 2291} {"train_loss": -6.272381782531738, "global_step": 96243, "epoch": 2291} {"train_loss": -6.277763366699219, "global_step": 96244, "epoch": 2291} {"train_loss": -6.268054962158203, "global_step": 96245, "epoch": 2291} {"train_loss": -6.325706481933594, "global_step": 96246, "epoch": 2291} {"train_loss": -6.315214157104492, "global_step": 96247, "epoch": 2291} {"train_loss": -6.259716987609863, "global_step": 96248, "epoch": 2291} {"train_loss": -6.401275634765625, "global_step": 96249, "epoch": 2291} {"train_loss": -6.286986351013184, "global_step": 96250, "epoch": 2291} {"train_loss": -6.273096084594727, "global_step": 96251, "epoch": 2291} {"train_loss": -6.224827289581299, "global_step": 96252, "epoch": 2291} {"train_loss": -6.239751815795898, "global_step": 96253, "epoch": 2291} {"train_loss": -6.316835880279541, "global_step": 96254, "epoch": 2291} {"train_loss": -6.295464515686035, "global_step": 96255, "epoch": 2291} {"train_loss": -6.391419410705566, "global_step": 96256, "epoch": 2291} {"train_loss": -6.270698547363281, "global_step": 96257, "epoch": 2291} {"train_loss": -6.224614143371582, "global_step": 96258, "epoch": 2291} {"train_loss": -6.253453254699707, "global_step": 96259, "epoch": 2291} {"train_loss": -6.275378704071045, "global_step": 96260, "epoch": 2291} {"train_loss": -6.324225425720215, "global_step": 96261, "epoch": 2291} {"train_loss": -6.381366729736328, "global_step": 96262, "epoch": 2291} {"train_loss": -6.3003533113570445, "global_step": 96263, "epoch": 2291, "val_loss": 63918.73046875} {"train_loss": -6.189844131469727, "global_step": 96264, "epoch": 2292} {"train_loss": -6.241474628448486, "global_step": 96265, "epoch": 2292} {"train_loss": -6.209145545959473, "global_step": 96266, "epoch": 2292} {"train_loss": -6.225518226623535, "global_step": 96267, "epoch": 2292} {"train_loss": -6.3760905265808105, "global_step": 96268, "epoch": 2292} {"train_loss": -6.346095085144043, "global_step": 96269, "epoch": 2292} {"train_loss": -6.330356121063232, "global_step": 96270, "epoch": 2292} {"train_loss": -6.302755355834961, "global_step": 96271, "epoch": 2292} {"train_loss": -6.220735549926758, "global_step": 96272, "epoch": 2292} {"train_loss": -6.385400772094727, "global_step": 96273, "epoch": 2292} {"train_loss": -6.2211833000183105, "global_step": 96274, "epoch": 2292} {"train_loss": -6.3837480545043945, "global_step": 96275, "epoch": 2292} {"train_loss": -6.283414840698242, "global_step": 96276, "epoch": 2292} {"train_loss": -6.26857852935791, "global_step": 96277, "epoch": 2292} {"train_loss": -6.14267635345459, "global_step": 96278, "epoch": 2292} {"train_loss": -6.327808856964111, "global_step": 96279, "epoch": 2292} {"train_loss": -6.348017692565918, "global_step": 96280, "epoch": 2292} {"train_loss": -6.196602821350098, "global_step": 96281, "epoch": 2292} {"train_loss": -6.3322553634643555, "global_step": 96282, "epoch": 2292} {"train_loss": -6.25693941116333, "global_step": 96283, "epoch": 2292} {"train_loss": -6.172097206115723, "global_step": 96284, "epoch": 2292} {"train_loss": -6.319964408874512, "global_step": 96285, "epoch": 2292} {"train_loss": -6.239025115966797, "global_step": 96286, "epoch": 2292} {"train_loss": -6.407336235046387, "global_step": 96287, "epoch": 2292} {"train_loss": -6.22298526763916, "global_step": 96288, "epoch": 2292} {"train_loss": -6.400990009307861, "global_step": 96289, "epoch": 2292} {"train_loss": -6.203037261962891, "global_step": 96290, "epoch": 2292} {"train_loss": -6.382596015930176, "global_step": 96291, "epoch": 2292} {"train_loss": -6.28818416595459, "global_step": 96292, "epoch": 2292} {"train_loss": -6.359249114990234, "global_step": 96293, "epoch": 2292} {"train_loss": -6.384214878082275, "global_step": 96294, "epoch": 2292} {"train_loss": -6.329282760620117, "global_step": 96295, "epoch": 2292} {"train_loss": -6.323361396789551, "global_step": 96296, "epoch": 2292} {"train_loss": -6.258448123931885, "global_step": 96297, "epoch": 2292} {"train_loss": -6.123751640319824, "global_step": 96298, "epoch": 2292} {"train_loss": -6.368503093719482, "global_step": 96299, "epoch": 2292} {"train_loss": -6.243415355682373, "global_step": 96300, "epoch": 2292} {"train_loss": -6.21702766418457, "global_step": 96301, "epoch": 2292} {"train_loss": -6.2813029289245605, "global_step": 96302, "epoch": 2292} {"train_loss": -6.281156539916992, "global_step": 96303, "epoch": 2292} {"train_loss": -6.258265018463135, "global_step": 96304, "epoch": 2292} {"train_loss": -6.284151837939308, "global_step": 96305, "epoch": 2292, "val_loss": 63798.9140625} {"train_loss": -6.3723955154418945, "global_step": 96306, "epoch": 2293} {"train_loss": -6.303823471069336, "global_step": 96307, "epoch": 2293} {"train_loss": -6.224161148071289, "global_step": 96308, "epoch": 2293} {"train_loss": -6.29315185546875, "global_step": 96309, "epoch": 2293} {"train_loss": -6.2729997634887695, "global_step": 96310, "epoch": 2293} {"train_loss": -6.336529731750488, "global_step": 96311, "epoch": 2293} {"train_loss": -6.440500259399414, "global_step": 96312, "epoch": 2293} {"train_loss": -6.292085647583008, "global_step": 96313, "epoch": 2293} {"train_loss": -6.39011287689209, "global_step": 96314, "epoch": 2293} {"train_loss": -6.361326217651367, "global_step": 96315, "epoch": 2293} {"train_loss": -6.319831848144531, "global_step": 96316, "epoch": 2293} {"train_loss": -6.317126274108887, "global_step": 96317, "epoch": 2293} {"train_loss": -6.374831676483154, "global_step": 96318, "epoch": 2293} {"train_loss": -6.471302509307861, "global_step": 96319, "epoch": 2293} {"train_loss": -6.378479957580566, "global_step": 96320, "epoch": 2293} {"train_loss": -6.32719087600708, "global_step": 96321, "epoch": 2293} {"train_loss": -6.33098030090332, "global_step": 96322, "epoch": 2293} {"train_loss": -6.396474361419678, "global_step": 96323, "epoch": 2293} {"train_loss": -6.24647331237793, "global_step": 96324, "epoch": 2293} {"train_loss": -6.366044998168945, "global_step": 96325, "epoch": 2293} {"train_loss": -6.322174549102783, "global_step": 96326, "epoch": 2293} {"train_loss": -6.333773612976074, "global_step": 96327, "epoch": 2293} {"train_loss": -6.263485908508301, "global_step": 96328, "epoch": 2293} {"train_loss": -6.416266441345215, "global_step": 96329, "epoch": 2293} {"train_loss": -6.330236911773682, "global_step": 96330, "epoch": 2293} {"train_loss": -6.3613739013671875, "global_step": 96331, "epoch": 2293} {"train_loss": -6.278201103210449, "global_step": 96332, "epoch": 2293} {"train_loss": -6.383734703063965, "global_step": 96333, "epoch": 2293} {"train_loss": -6.287060260772705, "global_step": 96334, "epoch": 2293} {"train_loss": -6.3714189529418945, "global_step": 96335, "epoch": 2293} {"train_loss": -6.303231239318848, "global_step": 96336, "epoch": 2293} {"train_loss": -6.351683616638184, "global_step": 96337, "epoch": 2293} {"train_loss": -6.2805633544921875, "global_step": 96338, "epoch": 2293} {"train_loss": -6.255849838256836, "global_step": 96339, "epoch": 2293} {"train_loss": -6.357220649719238, "global_step": 96340, "epoch": 2293} {"train_loss": -6.398115158081055, "global_step": 96341, "epoch": 2293} {"train_loss": -6.347104072570801, "global_step": 96342, "epoch": 2293} {"train_loss": -6.313755989074707, "global_step": 96343, "epoch": 2293} {"train_loss": -6.390336513519287, "global_step": 96344, "epoch": 2293} {"train_loss": -6.361879348754883, "global_step": 96345, "epoch": 2293} {"train_loss": -6.423449993133545, "global_step": 96346, "epoch": 2293} {"train_loss": -6.341378268741426, "global_step": 96347, "epoch": 2293, "val_loss": 63632.05078125} {"train_loss": -6.4596476554870605, "global_step": 96348, "epoch": 2294} {"train_loss": -6.328807830810547, "global_step": 96349, "epoch": 2294} {"train_loss": -6.326798439025879, "global_step": 96350, "epoch": 2294} {"train_loss": -6.438527584075928, "global_step": 96351, "epoch": 2294} {"train_loss": -6.363842010498047, "global_step": 96352, "epoch": 2294} {"train_loss": -6.333641529083252, "global_step": 96353, "epoch": 2294} {"train_loss": -6.269323348999023, "global_step": 96354, "epoch": 2294} {"train_loss": -6.3527679443359375, "global_step": 96355, "epoch": 2294} {"train_loss": -6.381131172180176, "global_step": 96356, "epoch": 2294} {"train_loss": -6.338817596435547, "global_step": 96357, "epoch": 2294} {"train_loss": -6.320172309875488, "global_step": 96358, "epoch": 2294} {"train_loss": -6.282027244567871, "global_step": 96359, "epoch": 2294} {"train_loss": -6.30090856552124, "global_step": 96360, "epoch": 2294} {"train_loss": -6.364221572875977, "global_step": 96361, "epoch": 2294} {"train_loss": -6.244290351867676, "global_step": 96362, "epoch": 2294} {"train_loss": -6.376778602600098, "global_step": 96363, "epoch": 2294} {"train_loss": -6.289043426513672, "global_step": 96364, "epoch": 2294} {"train_loss": -6.29656982421875, "global_step": 96365, "epoch": 2294} {"train_loss": -6.2646484375, "global_step": 96366, "epoch": 2294} {"train_loss": -6.374478340148926, "global_step": 96367, "epoch": 2294} {"train_loss": -6.351832389831543, "global_step": 96368, "epoch": 2294} {"train_loss": -6.370223045349121, "global_step": 96369, "epoch": 2294} {"train_loss": -6.491215229034424, "global_step": 96370, "epoch": 2294} {"train_loss": -6.428086757659912, "global_step": 96371, "epoch": 2294} {"train_loss": -6.441074371337891, "global_step": 96372, "epoch": 2294} {"train_loss": -6.358743667602539, "global_step": 96373, "epoch": 2294} {"train_loss": -6.4131269454956055, "global_step": 96374, "epoch": 2294} {"train_loss": -6.481143474578857, "global_step": 96375, "epoch": 2294} {"train_loss": -6.345973491668701, "global_step": 96376, "epoch": 2294} {"train_loss": -6.396857261657715, "global_step": 96377, "epoch": 2294} {"train_loss": -6.445117473602295, "global_step": 96378, "epoch": 2294} {"train_loss": -6.301754951477051, "global_step": 96379, "epoch": 2294} {"train_loss": -6.373919486999512, "global_step": 96380, "epoch": 2294} {"train_loss": -6.352504730224609, "global_step": 96381, "epoch": 2294} {"train_loss": -6.32611083984375, "global_step": 96382, "epoch": 2294} {"train_loss": -6.340719699859619, "global_step": 96383, "epoch": 2294} {"train_loss": -6.345202922821045, "global_step": 96384, "epoch": 2294} {"train_loss": -6.364123821258545, "global_step": 96385, "epoch": 2294} {"train_loss": -6.330750465393066, "global_step": 96386, "epoch": 2294} {"train_loss": -6.331653594970703, "global_step": 96387, "epoch": 2294} {"train_loss": -6.407508373260498, "global_step": 96388, "epoch": 2294} {"train_loss": -6.356918857211158, "global_step": 96389, "epoch": 2294, "val_loss": 63620.66015625} {"train_loss": -6.43412971496582, "global_step": 96390, "epoch": 2295} {"train_loss": -6.3847455978393555, "global_step": 96391, "epoch": 2295} {"train_loss": -6.299187660217285, "global_step": 96392, "epoch": 2295} {"train_loss": -6.3431854248046875, "global_step": 96393, "epoch": 2295} {"train_loss": -6.392947673797607, "global_step": 96394, "epoch": 2295} {"train_loss": -6.334640979766846, "global_step": 96395, "epoch": 2295} {"train_loss": -6.439974308013916, "global_step": 96396, "epoch": 2295} {"train_loss": -6.385614395141602, "global_step": 96397, "epoch": 2295} {"train_loss": -6.290199279785156, "global_step": 96398, "epoch": 2295} {"train_loss": -6.413276672363281, "global_step": 96399, "epoch": 2295} {"train_loss": -6.346563339233398, "global_step": 96400, "epoch": 2295} {"train_loss": -6.401853561401367, "global_step": 96401, "epoch": 2295} {"train_loss": -6.360091686248779, "global_step": 96402, "epoch": 2295} {"train_loss": -6.30296516418457, "global_step": 96403, "epoch": 2295} {"train_loss": -6.361865043640137, "global_step": 96404, "epoch": 2295} {"train_loss": -6.337131977081299, "global_step": 96405, "epoch": 2295} {"train_loss": -6.43398380279541, "global_step": 96406, "epoch": 2295} {"train_loss": -6.215476989746094, "global_step": 96407, "epoch": 2295} {"train_loss": -6.358284950256348, "global_step": 96408, "epoch": 2295} {"train_loss": -6.426946640014648, "global_step": 96409, "epoch": 2295} {"train_loss": -6.272782325744629, "global_step": 96410, "epoch": 2295} {"train_loss": -6.35866641998291, "global_step": 96411, "epoch": 2295} {"train_loss": -6.367569923400879, "global_step": 96412, "epoch": 2295} {"train_loss": -6.382909297943115, "global_step": 96413, "epoch": 2295} {"train_loss": -6.554764270782471, "global_step": 96414, "epoch": 2295} {"train_loss": -6.376444339752197, "global_step": 96415, "epoch": 2295} {"train_loss": -6.22641134262085, "global_step": 96416, "epoch": 2295} {"train_loss": -6.4194536209106445, "global_step": 96417, "epoch": 2295} {"train_loss": -6.315788269042969, "global_step": 96418, "epoch": 2295} {"train_loss": -6.273178577423096, "global_step": 96419, "epoch": 2295} {"train_loss": -6.344359397888184, "global_step": 96420, "epoch": 2295} {"train_loss": -6.421233654022217, "global_step": 96421, "epoch": 2295} {"train_loss": -6.345867156982422, "global_step": 96422, "epoch": 2295} {"train_loss": -6.3133440017700195, "global_step": 96423, "epoch": 2295} {"train_loss": -6.456889629364014, "global_step": 96424, "epoch": 2295} {"train_loss": -6.436347961425781, "global_step": 96425, "epoch": 2295} {"train_loss": -6.290922164916992, "global_step": 96426, "epoch": 2295} {"train_loss": -6.364750862121582, "global_step": 96427, "epoch": 2295} {"train_loss": -6.4061970710754395, "global_step": 96428, "epoch": 2295} {"train_loss": -6.377201557159424, "global_step": 96429, "epoch": 2295} {"train_loss": -6.412153244018555, "global_step": 96430, "epoch": 2295} {"train_loss": -6.367701678048997, "global_step": 96431, "epoch": 2295, "val_loss": 63816.5625} {"train_loss": -6.352965354919434, "global_step": 96432, "epoch": 2296} {"train_loss": -6.390725135803223, "global_step": 96433, "epoch": 2296} {"train_loss": -6.365198135375977, "global_step": 96434, "epoch": 2296} {"train_loss": -6.506288528442383, "global_step": 96435, "epoch": 2296} {"train_loss": -6.390114784240723, "global_step": 96436, "epoch": 2296} {"train_loss": -6.374695777893066, "global_step": 96437, "epoch": 2296} {"train_loss": -6.354554176330566, "global_step": 96438, "epoch": 2296} {"train_loss": -6.293294906616211, "global_step": 96439, "epoch": 2296} {"train_loss": -6.255609512329102, "global_step": 96440, "epoch": 2296} {"train_loss": -6.408171653747559, "global_step": 96441, "epoch": 2296} {"train_loss": -6.3602399826049805, "global_step": 96442, "epoch": 2296} {"train_loss": -6.212933540344238, "global_step": 96443, "epoch": 2296} {"train_loss": -6.328957557678223, "global_step": 96444, "epoch": 2296} {"train_loss": -6.222575664520264, "global_step": 96445, "epoch": 2296} {"train_loss": -6.324199676513672, "global_step": 96446, "epoch": 2296} {"train_loss": -6.314154148101807, "global_step": 96447, "epoch": 2296} {"train_loss": -6.228889465332031, "global_step": 96448, "epoch": 2296} {"train_loss": -6.390268325805664, "global_step": 96449, "epoch": 2296} {"train_loss": -6.331088066101074, "global_step": 96450, "epoch": 2296} {"train_loss": -6.426446914672852, "global_step": 96451, "epoch": 2296} {"train_loss": -6.311717510223389, "global_step": 96452, "epoch": 2296} {"train_loss": -6.4013261795043945, "global_step": 96453, "epoch": 2296} {"train_loss": -6.371798515319824, "global_step": 96454, "epoch": 2296} {"train_loss": -6.521215438842773, "global_step": 96455, "epoch": 2296} {"train_loss": -6.332231521606445, "global_step": 96456, "epoch": 2296} {"train_loss": -6.401390075683594, "global_step": 96457, "epoch": 2296} {"train_loss": -6.3707594871521, "global_step": 96458, "epoch": 2296} {"train_loss": -6.338430404663086, "global_step": 96459, "epoch": 2296} {"train_loss": -6.3505964279174805, "global_step": 96460, "epoch": 2296} {"train_loss": -6.342718601226807, "global_step": 96461, "epoch": 2296} {"train_loss": -6.306128025054932, "global_step": 96462, "epoch": 2296} {"train_loss": -6.170328140258789, "global_step": 96463, "epoch": 2296} {"train_loss": -6.2754411697387695, "global_step": 96464, "epoch": 2296} {"train_loss": -6.118305206298828, "global_step": 96465, "epoch": 2296} {"train_loss": -6.333776950836182, "global_step": 96466, "epoch": 2296} {"train_loss": -6.13936710357666, "global_step": 96467, "epoch": 2296} {"train_loss": -6.150035381317139, "global_step": 96468, "epoch": 2296} {"train_loss": -6.258492469787598, "global_step": 96469, "epoch": 2296} {"train_loss": -6.234215259552002, "global_step": 96470, "epoch": 2296} {"train_loss": -6.266315937042236, "global_step": 96471, "epoch": 2296} {"train_loss": -6.151186466217041, "global_step": 96472, "epoch": 2296} {"train_loss": -6.3162299905504495, "global_step": 96473, "epoch": 2296, "val_loss": 63830.109375} {"train_loss": -6.289011001586914, "global_step": 96474, "epoch": 2297} {"train_loss": -6.17875862121582, "global_step": 96475, "epoch": 2297} {"train_loss": -6.261113166809082, "global_step": 96476, "epoch": 2297} {"train_loss": -6.195864677429199, "global_step": 96477, "epoch": 2297} {"train_loss": -6.208713531494141, "global_step": 96478, "epoch": 2297} {"train_loss": -6.19808292388916, "global_step": 96479, "epoch": 2297} {"train_loss": -6.42382287979126, "global_step": 96480, "epoch": 2297} {"train_loss": -6.330057144165039, "global_step": 96481, "epoch": 2297} {"train_loss": -6.340407848358154, "global_step": 96482, "epoch": 2297} {"train_loss": -6.1707611083984375, "global_step": 96483, "epoch": 2297} {"train_loss": -6.234618663787842, "global_step": 96484, "epoch": 2297} {"train_loss": -6.337322235107422, "global_step": 96485, "epoch": 2297} {"train_loss": -6.2802839279174805, "global_step": 96486, "epoch": 2297} {"train_loss": -6.284934043884277, "global_step": 96487, "epoch": 2297} {"train_loss": -6.457015037536621, "global_step": 96488, "epoch": 2297} {"train_loss": -6.363880157470703, "global_step": 96489, "epoch": 2297} {"train_loss": -6.382925987243652, "global_step": 96490, "epoch": 2297} {"train_loss": -6.261204719543457, "global_step": 96491, "epoch": 2297} {"train_loss": -6.326138019561768, "global_step": 96492, "epoch": 2297} {"train_loss": -6.299839496612549, "global_step": 96493, "epoch": 2297} {"train_loss": -6.270386695861816, "global_step": 96494, "epoch": 2297} {"train_loss": -6.3294219970703125, "global_step": 96495, "epoch": 2297} {"train_loss": -6.325617790222168, "global_step": 96496, "epoch": 2297} {"train_loss": -6.273503303527832, "global_step": 96497, "epoch": 2297} {"train_loss": -6.3017168045043945, "global_step": 96498, "epoch": 2297} {"train_loss": -6.274904251098633, "global_step": 96499, "epoch": 2297} {"train_loss": -6.219043731689453, "global_step": 96500, "epoch": 2297} {"train_loss": -6.277935028076172, "global_step": 96501, "epoch": 2297} {"train_loss": -6.318803310394287, "global_step": 96502, "epoch": 2297} {"train_loss": -6.33613395690918, "global_step": 96503, "epoch": 2297} {"train_loss": -6.349420547485352, "global_step": 96504, "epoch": 2297} {"train_loss": -6.344474792480469, "global_step": 96505, "epoch": 2297} {"train_loss": -6.362015724182129, "global_step": 96506, "epoch": 2297} {"train_loss": -6.233679294586182, "global_step": 96507, "epoch": 2297} {"train_loss": -6.36848258972168, "global_step": 96508, "epoch": 2297} {"train_loss": -6.276741027832031, "global_step": 96509, "epoch": 2297} {"train_loss": -6.366229057312012, "global_step": 96510, "epoch": 2297} {"train_loss": -6.311123847961426, "global_step": 96511, "epoch": 2297} {"train_loss": -6.4325995445251465, "global_step": 96512, "epoch": 2297} {"train_loss": -6.405828952789307, "global_step": 96513, "epoch": 2297} {"train_loss": -6.454939842224121, "global_step": 96514, "epoch": 2297} {"train_loss": -6.311588525772095, "global_step": 96515, "epoch": 2297, "val_loss": 63515.1875} {"train_loss": -6.296473026275635, "global_step": 96516, "epoch": 2298} {"train_loss": -6.323133945465088, "global_step": 96517, "epoch": 2298} {"train_loss": -6.337532043457031, "global_step": 96518, "epoch": 2298} {"train_loss": -6.303531646728516, "global_step": 96519, "epoch": 2298} {"train_loss": -6.436747074127197, "global_step": 96520, "epoch": 2298} {"train_loss": -6.343341827392578, "global_step": 96521, "epoch": 2298} {"train_loss": -6.351325035095215, "global_step": 96522, "epoch": 2298} {"train_loss": -6.442913055419922, "global_step": 96523, "epoch": 2298} {"train_loss": -6.378657341003418, "global_step": 96524, "epoch": 2298} {"train_loss": -6.368363380432129, "global_step": 96525, "epoch": 2298} {"train_loss": -6.291441440582275, "global_step": 96526, "epoch": 2298} {"train_loss": -6.218658447265625, "global_step": 96527, "epoch": 2298} {"train_loss": -6.308689117431641, "global_step": 96528, "epoch": 2298} {"train_loss": -6.314210414886475, "global_step": 96529, "epoch": 2298} {"train_loss": -6.311676502227783, "global_step": 96530, "epoch": 2298} {"train_loss": -6.399694442749023, "global_step": 96531, "epoch": 2298} {"train_loss": -6.274831295013428, "global_step": 96532, "epoch": 2298} {"train_loss": -6.409242630004883, "global_step": 96533, "epoch": 2298} {"train_loss": -6.29056453704834, "global_step": 96534, "epoch": 2298} {"train_loss": -6.324932098388672, "global_step": 96535, "epoch": 2298} {"train_loss": -6.306834697723389, "global_step": 96536, "epoch": 2298} {"train_loss": -6.442276954650879, "global_step": 96537, "epoch": 2298} {"train_loss": -6.358007431030273, "global_step": 96538, "epoch": 2298} {"train_loss": -6.366595268249512, "global_step": 96539, "epoch": 2298} {"train_loss": -6.15683126449585, "global_step": 96540, "epoch": 2298} {"train_loss": -6.294308662414551, "global_step": 96541, "epoch": 2298} {"train_loss": -6.234633445739746, "global_step": 96542, "epoch": 2298} {"train_loss": -6.349032878875732, "global_step": 96543, "epoch": 2298} {"train_loss": -6.436413764953613, "global_step": 96544, "epoch": 2298} {"train_loss": -6.3729400634765625, "global_step": 96545, "epoch": 2298} {"train_loss": -6.259573936462402, "global_step": 96546, "epoch": 2298} {"train_loss": -6.297970771789551, "global_step": 96547, "epoch": 2298} {"train_loss": -6.3939337730407715, "global_step": 96548, "epoch": 2298} {"train_loss": -6.412506580352783, "global_step": 96549, "epoch": 2298} {"train_loss": -6.3251190185546875, "global_step": 96550, "epoch": 2298} {"train_loss": -6.323676586151123, "global_step": 96551, "epoch": 2298} {"train_loss": -6.264034271240234, "global_step": 96552, "epoch": 2298} {"train_loss": -6.377091407775879, "global_step": 96553, "epoch": 2298} {"train_loss": -6.252127647399902, "global_step": 96554, "epoch": 2298} {"train_loss": -6.385754585266113, "global_step": 96555, "epoch": 2298} {"train_loss": -6.314177513122559, "global_step": 96556, "epoch": 2298} {"train_loss": -6.331583715620495, "global_step": 96557, "epoch": 2298, "val_loss": 63712.7265625} {"train_loss": -6.390467643737793, "global_step": 96558, "epoch": 2299} {"train_loss": -6.279452323913574, "global_step": 96559, "epoch": 2299} {"train_loss": -6.308475494384766, "global_step": 96560, "epoch": 2299} {"train_loss": -6.225613117218018, "global_step": 96561, "epoch": 2299} {"train_loss": -6.172578811645508, "global_step": 96562, "epoch": 2299} {"train_loss": -6.278308391571045, "global_step": 96563, "epoch": 2299} {"train_loss": -6.209632873535156, "global_step": 96564, "epoch": 2299} {"train_loss": -6.326635360717773, "global_step": 96565, "epoch": 2299} {"train_loss": -6.367765426635742, "global_step": 96566, "epoch": 2299} {"train_loss": -6.297484874725342, "global_step": 96567, "epoch": 2299} {"train_loss": -6.311473846435547, "global_step": 96568, "epoch": 2299} {"train_loss": -6.250120162963867, "global_step": 96569, "epoch": 2299} {"train_loss": -6.388322830200195, "global_step": 96570, "epoch": 2299} {"train_loss": -6.290818691253662, "global_step": 96571, "epoch": 2299} {"train_loss": -6.204939365386963, "global_step": 96572, "epoch": 2299} {"train_loss": -6.326575756072998, "global_step": 96573, "epoch": 2299} {"train_loss": -6.390226364135742, "global_step": 96574, "epoch": 2299} {"train_loss": -6.198389053344727, "global_step": 96575, "epoch": 2299} {"train_loss": -6.330333232879639, "global_step": 96576, "epoch": 2299} {"train_loss": -6.190803527832031, "global_step": 96577, "epoch": 2299} {"train_loss": -6.322663307189941, "global_step": 96578, "epoch": 2299} {"train_loss": -6.353089332580566, "global_step": 96579, "epoch": 2299} {"train_loss": -6.345699310302734, "global_step": 96580, "epoch": 2299} {"train_loss": -6.167911529541016, "global_step": 96581, "epoch": 2299} {"train_loss": -6.34519100189209, "global_step": 96582, "epoch": 2299} {"train_loss": -6.3580322265625, "global_step": 96583, "epoch": 2299} {"train_loss": -6.258718967437744, "global_step": 96584, "epoch": 2299} {"train_loss": -6.305613994598389, "global_step": 96585, "epoch": 2299} {"train_loss": -6.416299819946289, "global_step": 96586, "epoch": 2299} {"train_loss": -6.3881635665893555, "global_step": 96587, "epoch": 2299} {"train_loss": -6.367114067077637, "global_step": 96588, "epoch": 2299} {"train_loss": -6.332406997680664, "global_step": 96589, "epoch": 2299} {"train_loss": -6.1965436935424805, "global_step": 96590, "epoch": 2299} {"train_loss": -6.279095649719238, "global_step": 96591, "epoch": 2299} {"train_loss": -6.303040504455566, "global_step": 96592, "epoch": 2299} {"train_loss": -6.309557914733887, "global_step": 96593, "epoch": 2299} {"train_loss": -6.385549545288086, "global_step": 96594, "epoch": 2299} {"train_loss": -6.365803241729736, "global_step": 96595, "epoch": 2299} {"train_loss": -6.301823616027832, "global_step": 96596, "epoch": 2299} {"train_loss": -6.228433609008789, "global_step": 96597, "epoch": 2299} {"train_loss": -6.281002044677734, "global_step": 96598, "epoch": 2299} {"train_loss": -6.297198522658575, "global_step": 96599, "epoch": 2299, "val_loss": 63667.70703125} {"train_loss": -6.287755966186523, "global_step": 96600, "epoch": 2300} {"train_loss": -6.300661563873291, "global_step": 96601, "epoch": 2300} {"train_loss": -6.2657084465026855, "global_step": 96602, "epoch": 2300} {"train_loss": -6.338079452514648, "global_step": 96603, "epoch": 2300} {"train_loss": -6.349954605102539, "global_step": 96604, "epoch": 2300} {"train_loss": -6.284102439880371, "global_step": 96605, "epoch": 2300} {"train_loss": -6.2166523933410645, "global_step": 96606, "epoch": 2300} {"train_loss": -6.325615406036377, "global_step": 96607, "epoch": 2300} {"train_loss": -6.338195323944092, "global_step": 96608, "epoch": 2300} {"train_loss": -6.39385986328125, "global_step": 96609, "epoch": 2300} {"train_loss": -6.2238616943359375, "global_step": 96610, "epoch": 2300} {"train_loss": -6.327706336975098, "global_step": 96611, "epoch": 2300} {"train_loss": -6.131965637207031, "global_step": 96612, "epoch": 2300} {"train_loss": -6.2444915771484375, "global_step": 96613, "epoch": 2300} {"train_loss": -6.189716339111328, "global_step": 96614, "epoch": 2300} {"train_loss": -6.283280849456787, "global_step": 96615, "epoch": 2300} {"train_loss": -6.327652931213379, "global_step": 96616, "epoch": 2300} {"train_loss": -6.312525272369385, "global_step": 96617, "epoch": 2300} {"train_loss": -6.338291168212891, "global_step": 96618, "epoch": 2300} {"train_loss": -6.283381462097168, "global_step": 96619, "epoch": 2300} {"train_loss": -6.28040885925293, "global_step": 96620, "epoch": 2300} {"train_loss": -6.314193248748779, "global_step": 96621, "epoch": 2300} {"train_loss": -6.294306755065918, "global_step": 96622, "epoch": 2300} {"train_loss": -6.379702568054199, "global_step": 96623, "epoch": 2300} {"train_loss": -6.308098316192627, "global_step": 96624, "epoch": 2300} {"train_loss": -6.425081253051758, "global_step": 96625, "epoch": 2300} {"train_loss": -6.318421840667725, "global_step": 96626, "epoch": 2300} {"train_loss": -6.29702091217041, "global_step": 96627, "epoch": 2300} {"train_loss": -6.282599449157715, "global_step": 96628, "epoch": 2300} {"train_loss": -6.265519142150879, "global_step": 96629, "epoch": 2300} {"train_loss": -6.335744857788086, "global_step": 96630, "epoch": 2300} {"train_loss": -6.219160556793213, "global_step": 96631, "epoch": 2300} {"train_loss": -6.40349817276001, "global_step": 96632, "epoch": 2300} {"train_loss": -6.275994300842285, "global_step": 96633, "epoch": 2300} {"train_loss": -6.3187384605407715, "global_step": 96634, "epoch": 2300} {"train_loss": -6.324676513671875, "global_step": 96635, "epoch": 2300} {"train_loss": -6.349234104156494, "global_step": 96636, "epoch": 2300} {"train_loss": -6.3367228507995605, "global_step": 96637, "epoch": 2300} {"train_loss": -6.381804466247559, "global_step": 96638, "epoch": 2300} {"train_loss": -6.319197654724121, "global_step": 96639, "epoch": 2300} {"train_loss": -6.339956283569336, "global_step": 96640, "epoch": 2300} {"train_loss": -6.305930148987543, "global_step": 96641, "epoch": 2300, "train/sim_max_reward_0": 0.1954843083584081, "train/sim_max_reward_1": 0.799053383596171, "train/sim_max_reward_2": 0.79462819896227, "train/sim_max_reward_3": 0.36902606197038695, "train/sim_max_reward_4": 0.9458841640345467, "train/sim_max_reward_5": 0.7786701457442778, "test/sim_max_reward_4300000": 0.19719661186391346, "test/sim_max_reward_4300001": 0.5384298923490244, "test/sim_max_reward_4300002": 0.9148462940766927, "test/sim_max_reward_4300003": 0.8973244237747575, "test/sim_max_reward_4300004": 0.3015456391363297, "test/sim_max_reward_4300005": 0.9368990578337145, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9760176086875095, "test/sim_max_reward_4300008": 0.9703917649951507, "test/sim_max_reward_4300009": 0.9982611496484369, "test/sim_max_reward_4300010": 0.28125130269226045, "test/sim_max_reward_4300011": 0.8760515151655538, "test/sim_max_reward_4300012": 0.9859227688199121, "test/sim_max_reward_4300013": 0.4053656290695427, "test/sim_max_reward_4300014": 0.9293023537473457, "test/sim_max_reward_4300015": 0.9252926797291128, "test/sim_max_reward_4300016": 0.10185736333821549, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.427876257591976, "test/sim_max_reward_4300019": 0.18562395343918173, "test/sim_max_reward_4300020": 0.1561771986047126, "test/sim_max_reward_4300021": 0.9822297578039465, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.33706509441267585, "test/sim_max_reward_4300024": 0.9695738703706248, "test/sim_max_reward_4300025": 0.9238382218791743, "test/sim_max_reward_4300026": 0.1546711427826813, "test/sim_max_reward_4300027": 0.894514147004192, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.00753689997903318, "test/sim_max_reward_4300030": 0.37400988665767, "test/sim_max_reward_4300031": 0.18666852990529853, "test/sim_max_reward_4300032": 0.996090190050786, "test/sim_max_reward_4300033": 0.6098787618122125, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.8015478971067301, "test/sim_max_reward_4300036": 0.21183021573807032, "test/sim_max_reward_4300037": 0.7800354916594548, "test/sim_max_reward_4300038": 0.8239080981117424, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.31557370632690424, "test/sim_max_reward_4300041": 0.8927614521057171, "test/sim_max_reward_4300042": 0.7148198842581799, "test/sim_max_reward_4300043": 0.12759509945021055, "test/sim_max_reward_4300044": 0.7535790265837315, "test/sim_max_reward_4300045": 0.9039144905714035, "test/sim_max_reward_4300046": 0.30426822140335674, "test/sim_max_reward_4300047": 0.8838618228787508, "test/sim_max_reward_4300048": 0.7168835530751112, "test/sim_max_reward_4300049": 0.10525278714803774, "train/mean_score": 0.6471243771110101, "test/mean_score": 0.5955508342727808, "val_loss": 63827.1953125} {"train_loss": -6.352578163146973, "global_step": 96642, "epoch": 2301} {"train_loss": -6.290065765380859, "global_step": 96643, "epoch": 2301} {"train_loss": -6.355255126953125, "global_step": 96644, "epoch": 2301} {"train_loss": -6.425773620605469, "global_step": 96645, "epoch": 2301} {"train_loss": -6.340994834899902, "global_step": 96646, "epoch": 2301} {"train_loss": -6.348650932312012, "global_step": 96647, "epoch": 2301} {"train_loss": -6.349062919616699, "global_step": 96648, "epoch": 2301} {"train_loss": -6.442580223083496, "global_step": 96649, "epoch": 2301} {"train_loss": -6.338556289672852, "global_step": 96650, "epoch": 2301} {"train_loss": -6.458914756774902, "global_step": 96651, "epoch": 2301} {"train_loss": -6.293003559112549, "global_step": 96652, "epoch": 2301} {"train_loss": -6.33392858505249, "global_step": 96653, "epoch": 2301} {"train_loss": -6.34358549118042, "global_step": 96654, "epoch": 2301} {"train_loss": -6.316900730133057, "global_step": 96655, "epoch": 2301} {"train_loss": -6.358147621154785, "global_step": 96656, "epoch": 2301} {"train_loss": -6.28964900970459, "global_step": 96657, "epoch": 2301} {"train_loss": -6.487076759338379, "global_step": 96658, "epoch": 2301} {"train_loss": -6.451040267944336, "global_step": 96659, "epoch": 2301} {"train_loss": -6.491605281829834, "global_step": 96660, "epoch": 2301} {"train_loss": -6.365097999572754, "global_step": 96661, "epoch": 2301} {"train_loss": -6.376166820526123, "global_step": 96662, "epoch": 2301} {"train_loss": -6.2886176109313965, "global_step": 96663, "epoch": 2301} {"train_loss": -6.336814880371094, "global_step": 96664, "epoch": 2301} {"train_loss": -6.303768634796143, "global_step": 96665, "epoch": 2301} {"train_loss": -6.41657829284668, "global_step": 96666, "epoch": 2301} {"train_loss": -6.398617744445801, "global_step": 96667, "epoch": 2301} {"train_loss": -6.298224449157715, "global_step": 96668, "epoch": 2301} {"train_loss": -6.361977577209473, "global_step": 96669, "epoch": 2301} {"train_loss": -6.3669328689575195, "global_step": 96670, "epoch": 2301} {"train_loss": -6.262160778045654, "global_step": 96671, "epoch": 2301} {"train_loss": -6.402195930480957, "global_step": 96672, "epoch": 2301} {"train_loss": -6.302097797393799, "global_step": 96673, "epoch": 2301} {"train_loss": -6.410637855529785, "global_step": 96674, "epoch": 2301} {"train_loss": -6.2598795890808105, "global_step": 96675, "epoch": 2301} {"train_loss": -6.323683261871338, "global_step": 96676, "epoch": 2301} {"train_loss": -6.2722578048706055, "global_step": 96677, "epoch": 2301} {"train_loss": -6.431093215942383, "global_step": 96678, "epoch": 2301} {"train_loss": -6.325160980224609, "global_step": 96679, "epoch": 2301} {"train_loss": -6.234854698181152, "global_step": 96680, "epoch": 2301} {"train_loss": -6.319540977478027, "global_step": 96681, "epoch": 2301} {"train_loss": -6.343490123748779, "global_step": 96682, "epoch": 2301} {"train_loss": -6.351010277157738, "global_step": 96683, "epoch": 2301, "val_loss": 63705.203125} {"train_loss": -6.458597183227539, "global_step": 96684, "epoch": 2302} {"train_loss": -6.334605693817139, "global_step": 96685, "epoch": 2302} {"train_loss": -6.367951393127441, "global_step": 96686, "epoch": 2302} {"train_loss": -6.455087661743164, "global_step": 96687, "epoch": 2302} {"train_loss": -6.435866355895996, "global_step": 96688, "epoch": 2302} {"train_loss": -6.300233364105225, "global_step": 96689, "epoch": 2302} {"train_loss": -6.349815368652344, "global_step": 96690, "epoch": 2302} {"train_loss": -6.387997627258301, "global_step": 96691, "epoch": 2302} {"train_loss": -6.4660420417785645, "global_step": 96692, "epoch": 2302} {"train_loss": -6.403170108795166, "global_step": 96693, "epoch": 2302} {"train_loss": -6.380092620849609, "global_step": 96694, "epoch": 2302} {"train_loss": -6.419261932373047, "global_step": 96695, "epoch": 2302} {"train_loss": -6.295158863067627, "global_step": 96696, "epoch": 2302} {"train_loss": -6.397879600524902, "global_step": 96697, "epoch": 2302} {"train_loss": -6.30761194229126, "global_step": 96698, "epoch": 2302} {"train_loss": -6.291295051574707, "global_step": 96699, "epoch": 2302} {"train_loss": -6.394724369049072, "global_step": 96700, "epoch": 2302} {"train_loss": -6.36887264251709, "global_step": 96701, "epoch": 2302} {"train_loss": -6.408675193786621, "global_step": 96702, "epoch": 2302} {"train_loss": -6.292942047119141, "global_step": 96703, "epoch": 2302} {"train_loss": -6.301630020141602, "global_step": 96704, "epoch": 2302} {"train_loss": -6.281050205230713, "global_step": 96705, "epoch": 2302} {"train_loss": -6.368654251098633, "global_step": 96706, "epoch": 2302} {"train_loss": -6.332301139831543, "global_step": 96707, "epoch": 2302} {"train_loss": -6.314952373504639, "global_step": 96708, "epoch": 2302} {"train_loss": -6.235265731811523, "global_step": 96709, "epoch": 2302} {"train_loss": -6.350021839141846, "global_step": 96710, "epoch": 2302} {"train_loss": -6.238784313201904, "global_step": 96711, "epoch": 2302} {"train_loss": -6.378874778747559, "global_step": 96712, "epoch": 2302} {"train_loss": -6.381162643432617, "global_step": 96713, "epoch": 2302} {"train_loss": -6.329626560211182, "global_step": 96714, "epoch": 2302} {"train_loss": -6.381624221801758, "global_step": 96715, "epoch": 2302} {"train_loss": -6.275221824645996, "global_step": 96716, "epoch": 2302} {"train_loss": -6.34175968170166, "global_step": 96717, "epoch": 2302} {"train_loss": -6.356235980987549, "global_step": 96718, "epoch": 2302} {"train_loss": -6.298580646514893, "global_step": 96719, "epoch": 2302} {"train_loss": -6.325643539428711, "global_step": 96720, "epoch": 2302} {"train_loss": -6.377954483032227, "global_step": 96721, "epoch": 2302} {"train_loss": -6.18569803237915, "global_step": 96722, "epoch": 2302} {"train_loss": -6.354048728942871, "global_step": 96723, "epoch": 2302} {"train_loss": -6.287820816040039, "global_step": 96724, "epoch": 2302} {"train_loss": -6.3451048873719715, "global_step": 96725, "epoch": 2302, "val_loss": 63728.83984375} {"train_loss": -6.423556327819824, "global_step": 96726, "epoch": 2303} {"train_loss": -6.41383171081543, "global_step": 96727, "epoch": 2303} {"train_loss": -6.356668472290039, "global_step": 96728, "epoch": 2303} {"train_loss": -6.285341262817383, "global_step": 96729, "epoch": 2303} {"train_loss": -6.2905426025390625, "global_step": 96730, "epoch": 2303} {"train_loss": -6.341241836547852, "global_step": 96731, "epoch": 2303} {"train_loss": -6.360715866088867, "global_step": 96732, "epoch": 2303} {"train_loss": -6.263293266296387, "global_step": 96733, "epoch": 2303} {"train_loss": -6.3977508544921875, "global_step": 96734, "epoch": 2303} {"train_loss": -6.347370147705078, "global_step": 96735, "epoch": 2303} {"train_loss": -6.342493057250977, "global_step": 96736, "epoch": 2303} {"train_loss": -6.364523410797119, "global_step": 96737, "epoch": 2303} {"train_loss": -6.383183479309082, "global_step": 96738, "epoch": 2303} {"train_loss": -6.287729263305664, "global_step": 96739, "epoch": 2303} {"train_loss": -6.294976711273193, "global_step": 96740, "epoch": 2303} {"train_loss": -6.463617324829102, "global_step": 96741, "epoch": 2303} {"train_loss": -6.402985572814941, "global_step": 96742, "epoch": 2303} {"train_loss": -6.401094436645508, "global_step": 96743, "epoch": 2303} {"train_loss": -6.388954162597656, "global_step": 96744, "epoch": 2303} {"train_loss": -6.218972206115723, "global_step": 96745, "epoch": 2303} {"train_loss": -6.314289093017578, "global_step": 96746, "epoch": 2303} {"train_loss": -6.313380718231201, "global_step": 96747, "epoch": 2303} {"train_loss": -6.361999034881592, "global_step": 96748, "epoch": 2303} {"train_loss": -6.336843490600586, "global_step": 96749, "epoch": 2303} {"train_loss": -6.322668075561523, "global_step": 96750, "epoch": 2303} {"train_loss": -6.316313743591309, "global_step": 96751, "epoch": 2303} {"train_loss": -6.24967098236084, "global_step": 96752, "epoch": 2303} {"train_loss": -6.289973258972168, "global_step": 96753, "epoch": 2303} {"train_loss": -6.267244815826416, "global_step": 96754, "epoch": 2303} {"train_loss": -6.283452033996582, "global_step": 96755, "epoch": 2303} {"train_loss": -6.2559099197387695, "global_step": 96756, "epoch": 2303} {"train_loss": -6.285126686096191, "global_step": 96757, "epoch": 2303} {"train_loss": -6.440186977386475, "global_step": 96758, "epoch": 2303} {"train_loss": -6.2973456382751465, "global_step": 96759, "epoch": 2303} {"train_loss": -6.37604284286499, "global_step": 96760, "epoch": 2303} {"train_loss": -6.341021537780762, "global_step": 96761, "epoch": 2303} {"train_loss": -6.392496109008789, "global_step": 96762, "epoch": 2303} {"train_loss": -6.217432975769043, "global_step": 96763, "epoch": 2303} {"train_loss": -6.358024597167969, "global_step": 96764, "epoch": 2303} {"train_loss": -6.445291519165039, "global_step": 96765, "epoch": 2303} {"train_loss": -6.366683006286621, "global_step": 96766, "epoch": 2303} {"train_loss": -6.337576684497652, "global_step": 96767, "epoch": 2303, "val_loss": 63804.49609375} {"train_loss": -6.151925563812256, "global_step": 96768, "epoch": 2304} {"train_loss": -6.35926628112793, "global_step": 96769, "epoch": 2304} {"train_loss": -6.229527473449707, "global_step": 96770, "epoch": 2304} {"train_loss": -6.23545503616333, "global_step": 96771, "epoch": 2304} {"train_loss": -6.330295562744141, "global_step": 96772, "epoch": 2304} {"train_loss": -6.1907854080200195, "global_step": 96773, "epoch": 2304} {"train_loss": -6.281970977783203, "global_step": 96774, "epoch": 2304} {"train_loss": -6.352900505065918, "global_step": 96775, "epoch": 2304} {"train_loss": -6.309090614318848, "global_step": 96776, "epoch": 2304} {"train_loss": -6.224390983581543, "global_step": 96777, "epoch": 2304} {"train_loss": -6.365949630737305, "global_step": 96778, "epoch": 2304} {"train_loss": -6.2508721351623535, "global_step": 96779, "epoch": 2304} {"train_loss": -6.408931732177734, "global_step": 96780, "epoch": 2304} {"train_loss": -6.262645244598389, "global_step": 96781, "epoch": 2304} {"train_loss": -6.33719539642334, "global_step": 96782, "epoch": 2304} {"train_loss": -6.3025383949279785, "global_step": 96783, "epoch": 2304} {"train_loss": -6.3973236083984375, "global_step": 96784, "epoch": 2304} {"train_loss": -6.406769275665283, "global_step": 96785, "epoch": 2304} {"train_loss": -6.292104721069336, "global_step": 96786, "epoch": 2304} {"train_loss": -6.323551177978516, "global_step": 96787, "epoch": 2304} {"train_loss": -6.30069637298584, "global_step": 96788, "epoch": 2304} {"train_loss": -6.39324951171875, "global_step": 96789, "epoch": 2304} {"train_loss": -6.417977809906006, "global_step": 96790, "epoch": 2304} {"train_loss": -6.408405303955078, "global_step": 96791, "epoch": 2304} {"train_loss": -6.448116302490234, "global_step": 96792, "epoch": 2304} {"train_loss": -6.311774253845215, "global_step": 96793, "epoch": 2304} {"train_loss": -6.413883686065674, "global_step": 96794, "epoch": 2304} {"train_loss": -6.452190399169922, "global_step": 96795, "epoch": 2304} {"train_loss": -6.464107990264893, "global_step": 96796, "epoch": 2304} {"train_loss": -6.344297409057617, "global_step": 96797, "epoch": 2304} {"train_loss": -6.418188095092773, "global_step": 96798, "epoch": 2304} {"train_loss": -6.39992618560791, "global_step": 96799, "epoch": 2304} {"train_loss": -6.4544758796691895, "global_step": 96800, "epoch": 2304} {"train_loss": -6.355734348297119, "global_step": 96801, "epoch": 2304} {"train_loss": -6.346249580383301, "global_step": 96802, "epoch": 2304} {"train_loss": -6.3853759765625, "global_step": 96803, "epoch": 2304} {"train_loss": -6.3669819831848145, "global_step": 96804, "epoch": 2304} {"train_loss": -6.290770530700684, "global_step": 96805, "epoch": 2304} {"train_loss": -6.237395286560059, "global_step": 96806, "epoch": 2304} {"train_loss": -6.449714183807373, "global_step": 96807, "epoch": 2304} {"train_loss": -6.16270637512207, "global_step": 96808, "epoch": 2304} {"train_loss": -6.334199632917132, "global_step": 96809, "epoch": 2304, "val_loss": 63859.42578125} {"train_loss": -6.28611946105957, "global_step": 96810, "epoch": 2305} {"train_loss": -6.236727237701416, "global_step": 96811, "epoch": 2305} {"train_loss": -6.318320274353027, "global_step": 96812, "epoch": 2305} {"train_loss": -6.215448379516602, "global_step": 96813, "epoch": 2305} {"train_loss": -6.362735271453857, "global_step": 96814, "epoch": 2305} {"train_loss": -6.353185653686523, "global_step": 96815, "epoch": 2305} {"train_loss": -6.244011878967285, "global_step": 96816, "epoch": 2305} {"train_loss": -6.235019683837891, "global_step": 96817, "epoch": 2305} {"train_loss": -6.386373519897461, "global_step": 96818, "epoch": 2305} {"train_loss": -6.356834411621094, "global_step": 96819, "epoch": 2305} {"train_loss": -6.353134632110596, "global_step": 96820, "epoch": 2305} {"train_loss": -6.290412902832031, "global_step": 96821, "epoch": 2305} {"train_loss": -6.269975185394287, "global_step": 96822, "epoch": 2305} {"train_loss": -6.258089065551758, "global_step": 96823, "epoch": 2305} {"train_loss": -6.369855880737305, "global_step": 96824, "epoch": 2305} {"train_loss": -6.403530120849609, "global_step": 96825, "epoch": 2305} {"train_loss": -6.329668998718262, "global_step": 96826, "epoch": 2305} {"train_loss": -6.336225509643555, "global_step": 96827, "epoch": 2305} {"train_loss": -6.2982563972473145, "global_step": 96828, "epoch": 2305} {"train_loss": -6.37322998046875, "global_step": 96829, "epoch": 2305} {"train_loss": -6.302975654602051, "global_step": 96830, "epoch": 2305} {"train_loss": -6.230778694152832, "global_step": 96831, "epoch": 2305} {"train_loss": -6.414571762084961, "global_step": 96832, "epoch": 2305} {"train_loss": -6.324227333068848, "global_step": 96833, "epoch": 2305} {"train_loss": -6.2721147537231445, "global_step": 96834, "epoch": 2305} {"train_loss": -6.410457611083984, "global_step": 96835, "epoch": 2305} {"train_loss": -6.369126319885254, "global_step": 96836, "epoch": 2305} {"train_loss": -6.290696144104004, "global_step": 96837, "epoch": 2305} {"train_loss": -6.357585906982422, "global_step": 96838, "epoch": 2305} {"train_loss": -6.201444625854492, "global_step": 96839, "epoch": 2305} {"train_loss": -6.320046901702881, "global_step": 96840, "epoch": 2305} {"train_loss": -6.3612284660339355, "global_step": 96841, "epoch": 2305} {"train_loss": -6.287837028503418, "global_step": 96842, "epoch": 2305} {"train_loss": -6.30966854095459, "global_step": 96843, "epoch": 2305} {"train_loss": -6.235682010650635, "global_step": 96844, "epoch": 2305} {"train_loss": -6.335287570953369, "global_step": 96845, "epoch": 2305} {"train_loss": -6.316283702850342, "global_step": 96846, "epoch": 2305} {"train_loss": -6.336518287658691, "global_step": 96847, "epoch": 2305} {"train_loss": -6.273017406463623, "global_step": 96848, "epoch": 2305} {"train_loss": -6.34797477722168, "global_step": 96849, "epoch": 2305} {"train_loss": -6.3747429847717285, "global_step": 96850, "epoch": 2305} {"train_loss": -6.313401426587786, "global_step": 96851, "epoch": 2305, "val_loss": 63830.80078125} {"train_loss": -6.421151638031006, "global_step": 96852, "epoch": 2306} {"train_loss": -6.283013343811035, "global_step": 96853, "epoch": 2306} {"train_loss": -6.371352195739746, "global_step": 96854, "epoch": 2306} {"train_loss": -6.39198112487793, "global_step": 96855, "epoch": 2306} {"train_loss": -6.349985122680664, "global_step": 96856, "epoch": 2306} {"train_loss": -6.372593402862549, "global_step": 96857, "epoch": 2306} {"train_loss": -6.145538330078125, "global_step": 96858, "epoch": 2306} {"train_loss": -6.347094535827637, "global_step": 96859, "epoch": 2306} {"train_loss": -6.24636173248291, "global_step": 96860, "epoch": 2306} {"train_loss": -6.3272905349731445, "global_step": 96861, "epoch": 2306} {"train_loss": -6.386724948883057, "global_step": 96862, "epoch": 2306} {"train_loss": -6.083839416503906, "global_step": 96863, "epoch": 2306} {"train_loss": -6.495201110839844, "global_step": 96864, "epoch": 2306} {"train_loss": -6.383570671081543, "global_step": 96865, "epoch": 2306} {"train_loss": -6.238303184509277, "global_step": 96866, "epoch": 2306} {"train_loss": -6.390045642852783, "global_step": 96867, "epoch": 2306} {"train_loss": -6.291313171386719, "global_step": 96868, "epoch": 2306} {"train_loss": -6.391826629638672, "global_step": 96869, "epoch": 2306} {"train_loss": -6.2865118980407715, "global_step": 96870, "epoch": 2306} {"train_loss": -6.429636478424072, "global_step": 96871, "epoch": 2306} {"train_loss": -6.283689975738525, "global_step": 96872, "epoch": 2306} {"train_loss": -6.353020668029785, "global_step": 96873, "epoch": 2306} {"train_loss": -6.38114070892334, "global_step": 96874, "epoch": 2306} {"train_loss": -6.398968696594238, "global_step": 96875, "epoch": 2306} {"train_loss": -6.277422904968262, "global_step": 96876, "epoch": 2306} {"train_loss": -6.289527893066406, "global_step": 96877, "epoch": 2306} {"train_loss": -6.389580249786377, "global_step": 96878, "epoch": 2306} {"train_loss": -6.328307628631592, "global_step": 96879, "epoch": 2306} {"train_loss": -6.339165687561035, "global_step": 96880, "epoch": 2306} {"train_loss": -6.164201259613037, "global_step": 96881, "epoch": 2306} {"train_loss": -6.43602180480957, "global_step": 96882, "epoch": 2306} {"train_loss": -6.3595123291015625, "global_step": 96883, "epoch": 2306} {"train_loss": -6.32800817489624, "global_step": 96884, "epoch": 2306} {"train_loss": -6.462927341461182, "global_step": 96885, "epoch": 2306} {"train_loss": -6.407278060913086, "global_step": 96886, "epoch": 2306} {"train_loss": -6.350564956665039, "global_step": 96887, "epoch": 2306} {"train_loss": -6.451533317565918, "global_step": 96888, "epoch": 2306} {"train_loss": -6.395655632019043, "global_step": 96889, "epoch": 2306} {"train_loss": -6.331846237182617, "global_step": 96890, "epoch": 2306} {"train_loss": -6.364716529846191, "global_step": 96891, "epoch": 2306} {"train_loss": -6.2397918701171875, "global_step": 96892, "epoch": 2306} {"train_loss": -6.344235363460722, "global_step": 96893, "epoch": 2306, "val_loss": 63677.1875} {"train_loss": -6.453370094299316, "global_step": 96894, "epoch": 2307} {"train_loss": -6.293268203735352, "global_step": 96895, "epoch": 2307} {"train_loss": -6.369354248046875, "global_step": 96896, "epoch": 2307} {"train_loss": -6.379655838012695, "global_step": 96897, "epoch": 2307} {"train_loss": -6.439360618591309, "global_step": 96898, "epoch": 2307} {"train_loss": -6.425749778747559, "global_step": 96899, "epoch": 2307} {"train_loss": -6.405187129974365, "global_step": 96900, "epoch": 2307} {"train_loss": -6.326962947845459, "global_step": 96901, "epoch": 2307} {"train_loss": -6.378513813018799, "global_step": 96902, "epoch": 2307} {"train_loss": -6.262330532073975, "global_step": 96903, "epoch": 2307} {"train_loss": -6.229303359985352, "global_step": 96904, "epoch": 2307} {"train_loss": -6.324154376983643, "global_step": 96905, "epoch": 2307} {"train_loss": -6.339554786682129, "global_step": 96906, "epoch": 2307} {"train_loss": -6.279130935668945, "global_step": 96907, "epoch": 2307} {"train_loss": -6.315580368041992, "global_step": 96908, "epoch": 2307} {"train_loss": -6.132319927215576, "global_step": 96909, "epoch": 2307} {"train_loss": -6.175113677978516, "global_step": 96910, "epoch": 2307} {"train_loss": -6.16070556640625, "global_step": 96911, "epoch": 2307} {"train_loss": -6.247204780578613, "global_step": 96912, "epoch": 2307} {"train_loss": -6.176163673400879, "global_step": 96913, "epoch": 2307} {"train_loss": -6.147269248962402, "global_step": 96914, "epoch": 2307} {"train_loss": -6.2225871086120605, "global_step": 96915, "epoch": 2307} {"train_loss": -6.185116767883301, "global_step": 96916, "epoch": 2307} {"train_loss": -6.108628273010254, "global_step": 96917, "epoch": 2307} {"train_loss": -6.177717208862305, "global_step": 96918, "epoch": 2307} {"train_loss": -6.292799472808838, "global_step": 96919, "epoch": 2307} {"train_loss": -6.236218452453613, "global_step": 96920, "epoch": 2307} {"train_loss": -6.319467544555664, "global_step": 96921, "epoch": 2307} {"train_loss": -6.151147365570068, "global_step": 96922, "epoch": 2307} {"train_loss": -6.205777645111084, "global_step": 96923, "epoch": 2307} {"train_loss": -6.360444068908691, "global_step": 96924, "epoch": 2307} {"train_loss": -6.201780319213867, "global_step": 96925, "epoch": 2307} {"train_loss": -6.302190780639648, "global_step": 96926, "epoch": 2307} {"train_loss": -6.235683441162109, "global_step": 96927, "epoch": 2307} {"train_loss": -6.306175231933594, "global_step": 96928, "epoch": 2307} {"train_loss": -6.3681840896606445, "global_step": 96929, "epoch": 2307} {"train_loss": -6.36597204208374, "global_step": 96930, "epoch": 2307} {"train_loss": -6.3384599685668945, "global_step": 96931, "epoch": 2307} {"train_loss": -6.318817138671875, "global_step": 96932, "epoch": 2307} {"train_loss": -6.4521403312683105, "global_step": 96933, "epoch": 2307} {"train_loss": -6.383644104003906, "global_step": 96934, "epoch": 2307} {"train_loss": -6.288402137302217, "global_step": 96935, "epoch": 2307, "val_loss": 63836.3671875} {"train_loss": -6.342445373535156, "global_step": 96936, "epoch": 2308} {"train_loss": -6.290962219238281, "global_step": 96937, "epoch": 2308} {"train_loss": -6.301114082336426, "global_step": 96938, "epoch": 2308} {"train_loss": -6.290159225463867, "global_step": 96939, "epoch": 2308} {"train_loss": -6.336200714111328, "global_step": 96940, "epoch": 2308} {"train_loss": -6.446652412414551, "global_step": 96941, "epoch": 2308} {"train_loss": -6.230391979217529, "global_step": 96942, "epoch": 2308} {"train_loss": -6.236650466918945, "global_step": 96943, "epoch": 2308} {"train_loss": -6.453306674957275, "global_step": 96944, "epoch": 2308} {"train_loss": -6.243316650390625, "global_step": 96945, "epoch": 2308} {"train_loss": -6.185777187347412, "global_step": 96946, "epoch": 2308} {"train_loss": -6.347214698791504, "global_step": 96947, "epoch": 2308} {"train_loss": -6.112990856170654, "global_step": 96948, "epoch": 2308} {"train_loss": -6.242467403411865, "global_step": 96949, "epoch": 2308} {"train_loss": -6.205430030822754, "global_step": 96950, "epoch": 2308} {"train_loss": -6.226116180419922, "global_step": 96951, "epoch": 2308} {"train_loss": -6.3174028396606445, "global_step": 96952, "epoch": 2308} {"train_loss": -6.303216934204102, "global_step": 96953, "epoch": 2308} {"train_loss": -6.292260646820068, "global_step": 96954, "epoch": 2308} {"train_loss": -6.237340927124023, "global_step": 96955, "epoch": 2308} {"train_loss": -6.3044939041137695, "global_step": 96956, "epoch": 2308} {"train_loss": -6.2613935470581055, "global_step": 96957, "epoch": 2308} {"train_loss": -6.271093368530273, "global_step": 96958, "epoch": 2308} {"train_loss": -6.151131629943848, "global_step": 96959, "epoch": 2308} {"train_loss": -6.2665605545043945, "global_step": 96960, "epoch": 2308} {"train_loss": -6.384330749511719, "global_step": 96961, "epoch": 2308} {"train_loss": -6.291808605194092, "global_step": 96962, "epoch": 2308} {"train_loss": -6.342277526855469, "global_step": 96963, "epoch": 2308} {"train_loss": -6.383149147033691, "global_step": 96964, "epoch": 2308} {"train_loss": -6.345641136169434, "global_step": 96965, "epoch": 2308} {"train_loss": -6.341745376586914, "global_step": 96966, "epoch": 2308} {"train_loss": -6.279747486114502, "global_step": 96967, "epoch": 2308} {"train_loss": -6.3461127281188965, "global_step": 96968, "epoch": 2308} {"train_loss": -6.397615432739258, "global_step": 96969, "epoch": 2308} {"train_loss": -6.305813789367676, "global_step": 96970, "epoch": 2308} {"train_loss": -6.386548042297363, "global_step": 96971, "epoch": 2308} {"train_loss": -6.321659088134766, "global_step": 96972, "epoch": 2308} {"train_loss": -6.428035736083984, "global_step": 96973, "epoch": 2308} {"train_loss": -6.3090009689331055, "global_step": 96974, "epoch": 2308} {"train_loss": -6.370368003845215, "global_step": 96975, "epoch": 2308} {"train_loss": -6.371685981750488, "global_step": 96976, "epoch": 2308} {"train_loss": -6.30674317904881, "global_step": 96977, "epoch": 2308, "val_loss": 63744.1328125} {"train_loss": -6.387386322021484, "global_step": 96978, "epoch": 2309} {"train_loss": -6.342942237854004, "global_step": 96979, "epoch": 2309} {"train_loss": -6.339268684387207, "global_step": 96980, "epoch": 2309} {"train_loss": -6.3715338706970215, "global_step": 96981, "epoch": 2309} {"train_loss": -6.412138938903809, "global_step": 96982, "epoch": 2309} {"train_loss": -6.341047286987305, "global_step": 96983, "epoch": 2309} {"train_loss": -6.364041328430176, "global_step": 96984, "epoch": 2309} {"train_loss": -6.343015670776367, "global_step": 96985, "epoch": 2309} {"train_loss": -6.346186637878418, "global_step": 96986, "epoch": 2309} {"train_loss": -6.3170270919799805, "global_step": 96987, "epoch": 2309} {"train_loss": -6.1549906730651855, "global_step": 96988, "epoch": 2309} {"train_loss": -6.317063331604004, "global_step": 96989, "epoch": 2309} {"train_loss": -6.114197731018066, "global_step": 96990, "epoch": 2309} {"train_loss": -6.259232997894287, "global_step": 96991, "epoch": 2309} {"train_loss": -6.248682975769043, "global_step": 96992, "epoch": 2309} {"train_loss": -6.305294990539551, "global_step": 96993, "epoch": 2309} {"train_loss": -6.2026777267456055, "global_step": 96994, "epoch": 2309} {"train_loss": -6.374102592468262, "global_step": 96995, "epoch": 2309} {"train_loss": -6.238577842712402, "global_step": 96996, "epoch": 2309} {"train_loss": -6.294430732727051, "global_step": 96997, "epoch": 2309} {"train_loss": -6.239408016204834, "global_step": 96998, "epoch": 2309} {"train_loss": -6.380784034729004, "global_step": 96999, "epoch": 2309} {"train_loss": -6.382448196411133, "global_step": 97000, "epoch": 2309} {"train_loss": -6.458661079406738, "global_step": 97001, "epoch": 2309} {"train_loss": -6.31711483001709, "global_step": 97002, "epoch": 2309} {"train_loss": -6.243512153625488, "global_step": 97003, "epoch": 2309} {"train_loss": -6.3250956535339355, "global_step": 97004, "epoch": 2309} {"train_loss": -6.261066436767578, "global_step": 97005, "epoch": 2309} {"train_loss": -6.347234725952148, "global_step": 97006, "epoch": 2309} {"train_loss": -6.274460792541504, "global_step": 97007, "epoch": 2309} {"train_loss": -6.366636753082275, "global_step": 97008, "epoch": 2309} {"train_loss": -6.182164192199707, "global_step": 97009, "epoch": 2309} {"train_loss": -6.321646690368652, "global_step": 97010, "epoch": 2309} {"train_loss": -6.235386371612549, "global_step": 97011, "epoch": 2309} {"train_loss": -6.373711109161377, "global_step": 97012, "epoch": 2309} {"train_loss": -6.3312859535217285, "global_step": 97013, "epoch": 2309} {"train_loss": -6.315834999084473, "global_step": 97014, "epoch": 2309} {"train_loss": -6.309874534606934, "global_step": 97015, "epoch": 2309} {"train_loss": -6.363080978393555, "global_step": 97016, "epoch": 2309} {"train_loss": -6.366296768188477, "global_step": 97017, "epoch": 2309} {"train_loss": -6.304034233093262, "global_step": 97018, "epoch": 2309} {"train_loss": -6.311304909842355, "global_step": 97019, "epoch": 2309, "val_loss": 63865.75390625} {"train_loss": -6.27650785446167, "global_step": 97020, "epoch": 2310} {"train_loss": -6.323673248291016, "global_step": 97021, "epoch": 2310} {"train_loss": -6.417210578918457, "global_step": 97022, "epoch": 2310} {"train_loss": -6.331019401550293, "global_step": 97023, "epoch": 2310} {"train_loss": -6.298905372619629, "global_step": 97024, "epoch": 2310} {"train_loss": -6.295511245727539, "global_step": 97025, "epoch": 2310} {"train_loss": -6.406174182891846, "global_step": 97026, "epoch": 2310} {"train_loss": -6.392823219299316, "global_step": 97027, "epoch": 2310} {"train_loss": -6.3301310539245605, "global_step": 97028, "epoch": 2310} {"train_loss": -6.450238227844238, "global_step": 97029, "epoch": 2310} {"train_loss": -6.457566261291504, "global_step": 97030, "epoch": 2310} {"train_loss": -6.3796539306640625, "global_step": 97031, "epoch": 2310} {"train_loss": -6.361539840698242, "global_step": 97032, "epoch": 2310} {"train_loss": -6.387775897979736, "global_step": 97033, "epoch": 2310} {"train_loss": -6.385274887084961, "global_step": 97034, "epoch": 2310} {"train_loss": -6.440915584564209, "global_step": 97035, "epoch": 2310} {"train_loss": -6.389313220977783, "global_step": 97036, "epoch": 2310} {"train_loss": -6.441493511199951, "global_step": 97037, "epoch": 2310} {"train_loss": -6.3736958503723145, "global_step": 97038, "epoch": 2310} {"train_loss": -6.282900810241699, "global_step": 97039, "epoch": 2310} {"train_loss": -6.303397178649902, "global_step": 97040, "epoch": 2310} {"train_loss": -6.335343837738037, "global_step": 97041, "epoch": 2310} {"train_loss": -6.410389423370361, "global_step": 97042, "epoch": 2310} {"train_loss": -6.245425224304199, "global_step": 97043, "epoch": 2310} {"train_loss": -6.375482559204102, "global_step": 97044, "epoch": 2310} {"train_loss": -6.36995267868042, "global_step": 97045, "epoch": 2310} {"train_loss": -6.360445499420166, "global_step": 97046, "epoch": 2310} {"train_loss": -6.429819107055664, "global_step": 97047, "epoch": 2310} {"train_loss": -6.215210914611816, "global_step": 97048, "epoch": 2310} {"train_loss": -6.298165798187256, "global_step": 97049, "epoch": 2310} {"train_loss": -6.365725517272949, "global_step": 97050, "epoch": 2310} {"train_loss": -6.2225189208984375, "global_step": 97051, "epoch": 2310} {"train_loss": -6.3856730461120605, "global_step": 97052, "epoch": 2310} {"train_loss": -6.29521369934082, "global_step": 97053, "epoch": 2310} {"train_loss": -6.412139892578125, "global_step": 97054, "epoch": 2310} {"train_loss": -6.235248565673828, "global_step": 97055, "epoch": 2310} {"train_loss": -6.3986992835998535, "global_step": 97056, "epoch": 2310} {"train_loss": -6.432461738586426, "global_step": 97057, "epoch": 2310} {"train_loss": -6.397480010986328, "global_step": 97058, "epoch": 2310} {"train_loss": -6.368417739868164, "global_step": 97059, "epoch": 2310} {"train_loss": -6.240499019622803, "global_step": 97060, "epoch": 2310} {"train_loss": -6.3546194803147085, "global_step": 97061, "epoch": 2310, "val_loss": 63660.47265625} {"train_loss": -6.374197006225586, "global_step": 97062, "epoch": 2311} {"train_loss": -6.412212371826172, "global_step": 97063, "epoch": 2311} {"train_loss": -6.304129600524902, "global_step": 97064, "epoch": 2311} {"train_loss": -6.348736763000488, "global_step": 97065, "epoch": 2311} {"train_loss": -6.472327709197998, "global_step": 97066, "epoch": 2311} {"train_loss": -6.307490348815918, "global_step": 97067, "epoch": 2311} {"train_loss": -6.414017677307129, "global_step": 97068, "epoch": 2311} {"train_loss": -6.321157455444336, "global_step": 97069, "epoch": 2311} {"train_loss": -6.331937789916992, "global_step": 97070, "epoch": 2311} {"train_loss": -6.244244575500488, "global_step": 97071, "epoch": 2311} {"train_loss": -6.232564926147461, "global_step": 97072, "epoch": 2311} {"train_loss": -6.443365097045898, "global_step": 97073, "epoch": 2311} {"train_loss": -6.345104217529297, "global_step": 97074, "epoch": 2311} {"train_loss": -6.441076278686523, "global_step": 97075, "epoch": 2311} {"train_loss": -6.334998607635498, "global_step": 97076, "epoch": 2311} {"train_loss": -6.236176490783691, "global_step": 97077, "epoch": 2311} {"train_loss": -6.328462600708008, "global_step": 97078, "epoch": 2311} {"train_loss": -6.4110493659973145, "global_step": 97079, "epoch": 2311} {"train_loss": -6.4132585525512695, "global_step": 97080, "epoch": 2311} {"train_loss": -6.228785514831543, "global_step": 97081, "epoch": 2311} {"train_loss": -6.396762847900391, "global_step": 97082, "epoch": 2311} {"train_loss": -6.5244364738464355, "global_step": 97083, "epoch": 2311} {"train_loss": -6.337721824645996, "global_step": 97084, "epoch": 2311} {"train_loss": -6.461549758911133, "global_step": 97085, "epoch": 2311} {"train_loss": -6.331181049346924, "global_step": 97086, "epoch": 2311} {"train_loss": -6.373246669769287, "global_step": 97087, "epoch": 2311} {"train_loss": -6.351393699645996, "global_step": 97088, "epoch": 2311} {"train_loss": -6.316773414611816, "global_step": 97089, "epoch": 2311} {"train_loss": -6.3917388916015625, "global_step": 97090, "epoch": 2311} {"train_loss": -6.3868608474731445, "global_step": 97091, "epoch": 2311} {"train_loss": -6.365009307861328, "global_step": 97092, "epoch": 2311} {"train_loss": -6.285180568695068, "global_step": 97093, "epoch": 2311} {"train_loss": -6.5271220207214355, "global_step": 97094, "epoch": 2311} {"train_loss": -6.361514091491699, "global_step": 97095, "epoch": 2311} {"train_loss": -6.524140357971191, "global_step": 97096, "epoch": 2311} {"train_loss": -6.341437816619873, "global_step": 97097, "epoch": 2311} {"train_loss": -6.429774761199951, "global_step": 97098, "epoch": 2311} {"train_loss": -6.40311861038208, "global_step": 97099, "epoch": 2311} {"train_loss": -6.3111677169799805, "global_step": 97100, "epoch": 2311} {"train_loss": -6.40378475189209, "global_step": 97101, "epoch": 2311} {"train_loss": -6.322585105895996, "global_step": 97102, "epoch": 2311} {"train_loss": -6.370032333192372, "global_step": 97103, "epoch": 2311, "val_loss": 63891.47265625} {"train_loss": -6.41953182220459, "global_step": 97104, "epoch": 2312} {"train_loss": -6.385249137878418, "global_step": 97105, "epoch": 2312} {"train_loss": -6.428707122802734, "global_step": 97106, "epoch": 2312} {"train_loss": -6.415789604187012, "global_step": 97107, "epoch": 2312} {"train_loss": -6.320394515991211, "global_step": 97108, "epoch": 2312} {"train_loss": -6.322256565093994, "global_step": 97109, "epoch": 2312} {"train_loss": -6.366356372833252, "global_step": 97110, "epoch": 2312} {"train_loss": -6.298835754394531, "global_step": 97111, "epoch": 2312} {"train_loss": -6.332427978515625, "global_step": 97112, "epoch": 2312} {"train_loss": -6.396352767944336, "global_step": 97113, "epoch": 2312} {"train_loss": -6.4056525230407715, "global_step": 97114, "epoch": 2312} {"train_loss": -6.354108810424805, "global_step": 97115, "epoch": 2312} {"train_loss": -6.5291924476623535, "global_step": 97116, "epoch": 2312} {"train_loss": -6.229668140411377, "global_step": 97117, "epoch": 2312} {"train_loss": -6.388755798339844, "global_step": 97118, "epoch": 2312} {"train_loss": -6.247605323791504, "global_step": 97119, "epoch": 2312} {"train_loss": -6.182546138763428, "global_step": 97120, "epoch": 2312} {"train_loss": -6.463193893432617, "global_step": 97121, "epoch": 2312} {"train_loss": -6.232193470001221, "global_step": 97122, "epoch": 2312} {"train_loss": -6.2287726402282715, "global_step": 97123, "epoch": 2312} {"train_loss": -6.274145126342773, "global_step": 97124, "epoch": 2312} {"train_loss": -6.308403968811035, "global_step": 97125, "epoch": 2312} {"train_loss": -6.310277938842773, "global_step": 97126, "epoch": 2312} {"train_loss": -6.242971897125244, "global_step": 97127, "epoch": 2312} {"train_loss": -6.496953010559082, "global_step": 97128, "epoch": 2312} {"train_loss": -6.3425703048706055, "global_step": 97129, "epoch": 2312} {"train_loss": -6.412369728088379, "global_step": 97130, "epoch": 2312} {"train_loss": -6.299246788024902, "global_step": 97131, "epoch": 2312} {"train_loss": -6.48115348815918, "global_step": 97132, "epoch": 2312} {"train_loss": -6.466976642608643, "global_step": 97133, "epoch": 2312} {"train_loss": -6.404196262359619, "global_step": 97134, "epoch": 2312} {"train_loss": -6.26993465423584, "global_step": 97135, "epoch": 2312} {"train_loss": -6.378430366516113, "global_step": 97136, "epoch": 2312} {"train_loss": -6.415958404541016, "global_step": 97137, "epoch": 2312} {"train_loss": -6.361303329467773, "global_step": 97138, "epoch": 2312} {"train_loss": -6.295206546783447, "global_step": 97139, "epoch": 2312} {"train_loss": -6.288364410400391, "global_step": 97140, "epoch": 2312} {"train_loss": -6.371411323547363, "global_step": 97141, "epoch": 2312} {"train_loss": -6.197810649871826, "global_step": 97142, "epoch": 2312} {"train_loss": -6.386743068695068, "global_step": 97143, "epoch": 2312} {"train_loss": -6.371629238128662, "global_step": 97144, "epoch": 2312} {"train_loss": -6.346884727478027, "global_step": 97145, "epoch": 2312, "val_loss": 63760.90234375} {"train_loss": -6.323448657989502, "global_step": 97146, "epoch": 2313} {"train_loss": -6.237131118774414, "global_step": 97147, "epoch": 2313} {"train_loss": -6.314281463623047, "global_step": 97148, "epoch": 2313} {"train_loss": -6.304147720336914, "global_step": 97149, "epoch": 2313} {"train_loss": -6.396875381469727, "global_step": 97150, "epoch": 2313} {"train_loss": -6.364452362060547, "global_step": 97151, "epoch": 2313} {"train_loss": -6.354428291320801, "global_step": 97152, "epoch": 2313} {"train_loss": -6.342333793640137, "global_step": 97153, "epoch": 2313} {"train_loss": -6.194479942321777, "global_step": 97154, "epoch": 2313} {"train_loss": -6.316576957702637, "global_step": 97155, "epoch": 2313} {"train_loss": -6.352148056030273, "global_step": 97156, "epoch": 2313} {"train_loss": -6.297616481781006, "global_step": 97157, "epoch": 2313} {"train_loss": -6.372784614562988, "global_step": 97158, "epoch": 2313} {"train_loss": -6.285283088684082, "global_step": 97159, "epoch": 2313} {"train_loss": -6.235354423522949, "global_step": 97160, "epoch": 2313} {"train_loss": -6.263641357421875, "global_step": 97161, "epoch": 2313} {"train_loss": -6.403267860412598, "global_step": 97162, "epoch": 2313} {"train_loss": -6.290671348571777, "global_step": 97163, "epoch": 2313} {"train_loss": -6.252675533294678, "global_step": 97164, "epoch": 2313} {"train_loss": -6.340024948120117, "global_step": 97165, "epoch": 2313} {"train_loss": -6.410574913024902, "global_step": 97166, "epoch": 2313} {"train_loss": -6.396377086639404, "global_step": 97167, "epoch": 2313} {"train_loss": -6.378654479980469, "global_step": 97168, "epoch": 2313} {"train_loss": -6.3488359451293945, "global_step": 97169, "epoch": 2313} {"train_loss": -6.333187103271484, "global_step": 97170, "epoch": 2313} {"train_loss": -6.308942794799805, "global_step": 97171, "epoch": 2313} {"train_loss": -6.391822814941406, "global_step": 97172, "epoch": 2313} {"train_loss": -6.190303802490234, "global_step": 97173, "epoch": 2313} {"train_loss": -6.336267471313477, "global_step": 97174, "epoch": 2313} {"train_loss": -6.284189224243164, "global_step": 97175, "epoch": 2313} {"train_loss": -6.224979400634766, "global_step": 97176, "epoch": 2313} {"train_loss": -6.273874282836914, "global_step": 97177, "epoch": 2313} {"train_loss": -6.388916969299316, "global_step": 97178, "epoch": 2313} {"train_loss": -6.454401016235352, "global_step": 97179, "epoch": 2313} {"train_loss": -6.322917938232422, "global_step": 97180, "epoch": 2313} {"train_loss": -6.383283615112305, "global_step": 97181, "epoch": 2313} {"train_loss": -6.353243350982666, "global_step": 97182, "epoch": 2313} {"train_loss": -6.375301837921143, "global_step": 97183, "epoch": 2313} {"train_loss": -6.351479530334473, "global_step": 97184, "epoch": 2313} {"train_loss": -6.366312026977539, "global_step": 97185, "epoch": 2313} {"train_loss": -6.302051067352295, "global_step": 97186, "epoch": 2313} {"train_loss": -6.326812403542655, "global_step": 97187, "epoch": 2313, "val_loss": 63645.11328125} {"train_loss": -6.361905574798584, "global_step": 97188, "epoch": 2314} {"train_loss": -6.294411659240723, "global_step": 97189, "epoch": 2314} {"train_loss": -6.4060282707214355, "global_step": 97190, "epoch": 2314} {"train_loss": -6.291839599609375, "global_step": 97191, "epoch": 2314} {"train_loss": -6.382633209228516, "global_step": 97192, "epoch": 2314} {"train_loss": -6.270810127258301, "global_step": 97193, "epoch": 2314} {"train_loss": -6.337748050689697, "global_step": 97194, "epoch": 2314} {"train_loss": -6.303937911987305, "global_step": 97195, "epoch": 2314} {"train_loss": -6.310751914978027, "global_step": 97196, "epoch": 2314} {"train_loss": -6.3715314865112305, "global_step": 97197, "epoch": 2314} {"train_loss": -6.378880500793457, "global_step": 97198, "epoch": 2314} {"train_loss": -6.276628494262695, "global_step": 97199, "epoch": 2314} {"train_loss": -6.324688911437988, "global_step": 97200, "epoch": 2314} {"train_loss": -6.288601398468018, "global_step": 97201, "epoch": 2314} {"train_loss": -6.2338666915893555, "global_step": 97202, "epoch": 2314} {"train_loss": -6.322476387023926, "global_step": 97203, "epoch": 2314} {"train_loss": -6.410099983215332, "global_step": 97204, "epoch": 2314} {"train_loss": -6.235134124755859, "global_step": 97205, "epoch": 2314} {"train_loss": -6.345985412597656, "global_step": 97206, "epoch": 2314} {"train_loss": -6.3126678466796875, "global_step": 97207, "epoch": 2314} {"train_loss": -6.2878499031066895, "global_step": 97208, "epoch": 2314} {"train_loss": -6.381490230560303, "global_step": 97209, "epoch": 2314} {"train_loss": -6.362814903259277, "global_step": 97210, "epoch": 2314} {"train_loss": -6.306117534637451, "global_step": 97211, "epoch": 2314} {"train_loss": -6.318739891052246, "global_step": 97212, "epoch": 2314} {"train_loss": -6.188945770263672, "global_step": 97213, "epoch": 2314} {"train_loss": -6.361189842224121, "global_step": 97214, "epoch": 2314} {"train_loss": -6.322681427001953, "global_step": 97215, "epoch": 2314} {"train_loss": -6.272800445556641, "global_step": 97216, "epoch": 2314} {"train_loss": -6.359813690185547, "global_step": 97217, "epoch": 2314} {"train_loss": -6.260706901550293, "global_step": 97218, "epoch": 2314} {"train_loss": -6.299186706542969, "global_step": 97219, "epoch": 2314} {"train_loss": -6.339702606201172, "global_step": 97220, "epoch": 2314} {"train_loss": -6.362130165100098, "global_step": 97221, "epoch": 2314} {"train_loss": -6.201868057250977, "global_step": 97222, "epoch": 2314} {"train_loss": -6.4002532958984375, "global_step": 97223, "epoch": 2314} {"train_loss": -6.388993263244629, "global_step": 97224, "epoch": 2314} {"train_loss": -6.2309393882751465, "global_step": 97225, "epoch": 2314} {"train_loss": -6.297406196594238, "global_step": 97226, "epoch": 2314} {"train_loss": -6.452622413635254, "global_step": 97227, "epoch": 2314} {"train_loss": -6.195496082305908, "global_step": 97228, "epoch": 2314} {"train_loss": -6.320088023231143, "global_step": 97229, "epoch": 2314, "val_loss": 63824.0390625} {"train_loss": -6.322276592254639, "global_step": 97230, "epoch": 2315} {"train_loss": -6.240819931030273, "global_step": 97231, "epoch": 2315} {"train_loss": -6.461393356323242, "global_step": 97232, "epoch": 2315} {"train_loss": -6.3918585777282715, "global_step": 97233, "epoch": 2315} {"train_loss": -6.368190765380859, "global_step": 97234, "epoch": 2315} {"train_loss": -6.404741287231445, "global_step": 97235, "epoch": 2315} {"train_loss": -6.246224403381348, "global_step": 97236, "epoch": 2315} {"train_loss": -6.164262294769287, "global_step": 97237, "epoch": 2315} {"train_loss": -6.273954391479492, "global_step": 97238, "epoch": 2315} {"train_loss": -6.263073921203613, "global_step": 97239, "epoch": 2315} {"train_loss": -6.139520168304443, "global_step": 97240, "epoch": 2315} {"train_loss": -6.163146018981934, "global_step": 97241, "epoch": 2315} {"train_loss": -6.323816776275635, "global_step": 97242, "epoch": 2315} {"train_loss": -6.234626770019531, "global_step": 97243, "epoch": 2315} {"train_loss": -6.3208818435668945, "global_step": 97244, "epoch": 2315} {"train_loss": -6.3832268714904785, "global_step": 97245, "epoch": 2315} {"train_loss": -6.212061405181885, "global_step": 97246, "epoch": 2315} {"train_loss": -6.329023361206055, "global_step": 97247, "epoch": 2315} {"train_loss": -6.414810657501221, "global_step": 97248, "epoch": 2315} {"train_loss": -6.3010406494140625, "global_step": 97249, "epoch": 2315} {"train_loss": -6.430520534515381, "global_step": 97250, "epoch": 2315} {"train_loss": -6.375306606292725, "global_step": 97251, "epoch": 2315} {"train_loss": -6.369065761566162, "global_step": 97252, "epoch": 2315} {"train_loss": -6.281533718109131, "global_step": 97253, "epoch": 2315} {"train_loss": -6.364266872406006, "global_step": 97254, "epoch": 2315} {"train_loss": -6.342405319213867, "global_step": 97255, "epoch": 2315} {"train_loss": -6.31767463684082, "global_step": 97256, "epoch": 2315} {"train_loss": -6.353782653808594, "global_step": 97257, "epoch": 2315} {"train_loss": -6.266289710998535, "global_step": 97258, "epoch": 2315} {"train_loss": -6.365218639373779, "global_step": 97259, "epoch": 2315} {"train_loss": -6.207118034362793, "global_step": 97260, "epoch": 2315} {"train_loss": -6.336530685424805, "global_step": 97261, "epoch": 2315} {"train_loss": -6.353208541870117, "global_step": 97262, "epoch": 2315} {"train_loss": -6.160924434661865, "global_step": 97263, "epoch": 2315} {"train_loss": -6.244839668273926, "global_step": 97264, "epoch": 2315} {"train_loss": -6.29010534286499, "global_step": 97265, "epoch": 2315} {"train_loss": -6.2581281661987305, "global_step": 97266, "epoch": 2315} {"train_loss": -6.23307991027832, "global_step": 97267, "epoch": 2315} {"train_loss": -6.261728286743164, "global_step": 97268, "epoch": 2315} {"train_loss": -6.249386787414551, "global_step": 97269, "epoch": 2315} {"train_loss": -6.296276569366455, "global_step": 97270, "epoch": 2315} {"train_loss": -6.302274352028256, "global_step": 97271, "epoch": 2315, "val_loss": 63875.17578125} {"train_loss": -6.174181938171387, "global_step": 97272, "epoch": 2316} {"train_loss": -6.3772125244140625, "global_step": 97273, "epoch": 2316} {"train_loss": -6.349462032318115, "global_step": 97274, "epoch": 2316} {"train_loss": -6.278368949890137, "global_step": 97275, "epoch": 2316} {"train_loss": -6.233948707580566, "global_step": 97276, "epoch": 2316} {"train_loss": -6.314901351928711, "global_step": 97277, "epoch": 2316} {"train_loss": -6.276683330535889, "global_step": 97278, "epoch": 2316} {"train_loss": -6.283842086791992, "global_step": 97279, "epoch": 2316} {"train_loss": -6.30153751373291, "global_step": 97280, "epoch": 2316} {"train_loss": -6.32042932510376, "global_step": 97281, "epoch": 2316} {"train_loss": -6.308358669281006, "global_step": 97282, "epoch": 2316} {"train_loss": -6.38300085067749, "global_step": 97283, "epoch": 2316} {"train_loss": -6.361490249633789, "global_step": 97284, "epoch": 2316} {"train_loss": -6.3874616622924805, "global_step": 97285, "epoch": 2316} {"train_loss": -6.423641204833984, "global_step": 97286, "epoch": 2316} {"train_loss": -6.373555660247803, "global_step": 97287, "epoch": 2316} {"train_loss": -6.2463908195495605, "global_step": 97288, "epoch": 2316} {"train_loss": -6.256938457489014, "global_step": 97289, "epoch": 2316} {"train_loss": -6.29140043258667, "global_step": 97290, "epoch": 2316} {"train_loss": -6.548457622528076, "global_step": 97291, "epoch": 2316} {"train_loss": -6.347944259643555, "global_step": 97292, "epoch": 2316} {"train_loss": -6.3390092849731445, "global_step": 97293, "epoch": 2316} {"train_loss": -6.396416664123535, "global_step": 97294, "epoch": 2316} {"train_loss": -6.33638334274292, "global_step": 97295, "epoch": 2316} {"train_loss": -6.444934844970703, "global_step": 97296, "epoch": 2316} {"train_loss": -6.307506084442139, "global_step": 97297, "epoch": 2316} {"train_loss": -6.294122695922852, "global_step": 97298, "epoch": 2316} {"train_loss": -6.327348709106445, "global_step": 97299, "epoch": 2316} {"train_loss": -6.4450459480285645, "global_step": 97300, "epoch": 2316} {"train_loss": -6.422493934631348, "global_step": 97301, "epoch": 2316} {"train_loss": -6.290346622467041, "global_step": 97302, "epoch": 2316} {"train_loss": -6.417450904846191, "global_step": 97303, "epoch": 2316} {"train_loss": -6.30087947845459, "global_step": 97304, "epoch": 2316} {"train_loss": -6.338283538818359, "global_step": 97305, "epoch": 2316} {"train_loss": -6.3662333488464355, "global_step": 97306, "epoch": 2316} {"train_loss": -6.375025272369385, "global_step": 97307, "epoch": 2316} {"train_loss": -6.3210320472717285, "global_step": 97308, "epoch": 2316} {"train_loss": -6.431122779846191, "global_step": 97309, "epoch": 2316} {"train_loss": -6.464084148406982, "global_step": 97310, "epoch": 2316} {"train_loss": -6.4304423332214355, "global_step": 97311, "epoch": 2316} {"train_loss": -6.522675514221191, "global_step": 97312, "epoch": 2316} {"train_loss": -6.351775328318278, "global_step": 97313, "epoch": 2316, "val_loss": 63673.7265625} {"train_loss": -6.371183395385742, "global_step": 97314, "epoch": 2317} {"train_loss": -6.282057762145996, "global_step": 97315, "epoch": 2317} {"train_loss": -6.407815456390381, "global_step": 97316, "epoch": 2317} {"train_loss": -6.433945655822754, "global_step": 97317, "epoch": 2317} {"train_loss": -6.3372392654418945, "global_step": 97318, "epoch": 2317} {"train_loss": -6.303905487060547, "global_step": 97319, "epoch": 2317} {"train_loss": -6.384000778198242, "global_step": 97320, "epoch": 2317} {"train_loss": -6.378264427185059, "global_step": 97321, "epoch": 2317} {"train_loss": -6.383021354675293, "global_step": 97322, "epoch": 2317} {"train_loss": -6.415804386138916, "global_step": 97323, "epoch": 2317} {"train_loss": -6.434037208557129, "global_step": 97324, "epoch": 2317} {"train_loss": -6.421713829040527, "global_step": 97325, "epoch": 2317} {"train_loss": -6.336235523223877, "global_step": 97326, "epoch": 2317} {"train_loss": -6.3267822265625, "global_step": 97327, "epoch": 2317} {"train_loss": -6.338860511779785, "global_step": 97328, "epoch": 2317} {"train_loss": -6.328863143920898, "global_step": 97329, "epoch": 2317} {"train_loss": -6.329185485839844, "global_step": 97330, "epoch": 2317} {"train_loss": -6.504993915557861, "global_step": 97331, "epoch": 2317} {"train_loss": -6.439286708831787, "global_step": 97332, "epoch": 2317} {"train_loss": -6.471778869628906, "global_step": 97333, "epoch": 2317} {"train_loss": -6.405549049377441, "global_step": 97334, "epoch": 2317} {"train_loss": -6.374137878417969, "global_step": 97335, "epoch": 2317} {"train_loss": -6.361064910888672, "global_step": 97336, "epoch": 2317} {"train_loss": -6.406854629516602, "global_step": 97337, "epoch": 2317} {"train_loss": -6.251107215881348, "global_step": 97338, "epoch": 2317} {"train_loss": -6.374515533447266, "global_step": 97339, "epoch": 2317} {"train_loss": -6.412188529968262, "global_step": 97340, "epoch": 2317} {"train_loss": -6.283312797546387, "global_step": 97341, "epoch": 2317} {"train_loss": -6.290683746337891, "global_step": 97342, "epoch": 2317} {"train_loss": -6.299630641937256, "global_step": 97343, "epoch": 2317} {"train_loss": -6.2917799949646, "global_step": 97344, "epoch": 2317} {"train_loss": -6.304564476013184, "global_step": 97345, "epoch": 2317} {"train_loss": -6.336156368255615, "global_step": 97346, "epoch": 2317} {"train_loss": -6.28891658782959, "global_step": 97347, "epoch": 2317} {"train_loss": -6.233234405517578, "global_step": 97348, "epoch": 2317} {"train_loss": -6.407818794250488, "global_step": 97349, "epoch": 2317} {"train_loss": -6.352050304412842, "global_step": 97350, "epoch": 2317} {"train_loss": -6.4304094314575195, "global_step": 97351, "epoch": 2317} {"train_loss": -6.359807968139648, "global_step": 97352, "epoch": 2317} {"train_loss": -6.35277795791626, "global_step": 97353, "epoch": 2317} {"train_loss": -6.2733988761901855, "global_step": 97354, "epoch": 2317} {"train_loss": -6.358103649956839, "global_step": 97355, "epoch": 2317, "val_loss": 63987.6640625} {"train_loss": -6.34253454208374, "global_step": 97356, "epoch": 2318} {"train_loss": -6.5096540451049805, "global_step": 97357, "epoch": 2318} {"train_loss": -6.386505126953125, "global_step": 97358, "epoch": 2318} {"train_loss": -6.337863922119141, "global_step": 97359, "epoch": 2318} {"train_loss": -6.362213611602783, "global_step": 97360, "epoch": 2318} {"train_loss": -6.320806503295898, "global_step": 97361, "epoch": 2318} {"train_loss": -6.439413547515869, "global_step": 97362, "epoch": 2318} {"train_loss": -6.340421676635742, "global_step": 97363, "epoch": 2318} {"train_loss": -6.445891380310059, "global_step": 97364, "epoch": 2318} {"train_loss": -6.566512107849121, "global_step": 97365, "epoch": 2318} {"train_loss": -6.343515872955322, "global_step": 97366, "epoch": 2318} {"train_loss": -6.391822338104248, "global_step": 97367, "epoch": 2318} {"train_loss": -6.370354652404785, "global_step": 97368, "epoch": 2318} {"train_loss": -6.346061706542969, "global_step": 97369, "epoch": 2318} {"train_loss": -6.206723213195801, "global_step": 97370, "epoch": 2318} {"train_loss": -6.352835655212402, "global_step": 97371, "epoch": 2318} {"train_loss": -6.253779411315918, "global_step": 97372, "epoch": 2318} {"train_loss": -6.405388832092285, "global_step": 97373, "epoch": 2318} {"train_loss": -6.353012561798096, "global_step": 97374, "epoch": 2318} {"train_loss": -6.266633987426758, "global_step": 97375, "epoch": 2318} {"train_loss": -6.1804518699646, "global_step": 97376, "epoch": 2318} {"train_loss": -6.379815578460693, "global_step": 97377, "epoch": 2318} {"train_loss": -6.146501541137695, "global_step": 97378, "epoch": 2318} {"train_loss": -6.196475982666016, "global_step": 97379, "epoch": 2318} {"train_loss": -6.484116554260254, "global_step": 97380, "epoch": 2318} {"train_loss": -6.252960681915283, "global_step": 97381, "epoch": 2318} {"train_loss": -6.246025085449219, "global_step": 97382, "epoch": 2318} {"train_loss": -6.324095726013184, "global_step": 97383, "epoch": 2318} {"train_loss": -6.22877311706543, "global_step": 97384, "epoch": 2318} {"train_loss": -6.327610969543457, "global_step": 97385, "epoch": 2318} {"train_loss": -6.335172653198242, "global_step": 97386, "epoch": 2318} {"train_loss": -6.26480770111084, "global_step": 97387, "epoch": 2318} {"train_loss": -6.254626750946045, "global_step": 97388, "epoch": 2318} {"train_loss": -6.18394660949707, "global_step": 97389, "epoch": 2318} {"train_loss": -6.263882160186768, "global_step": 97390, "epoch": 2318} {"train_loss": -6.3213791847229, "global_step": 97391, "epoch": 2318} {"train_loss": -6.2636213302612305, "global_step": 97392, "epoch": 2318} {"train_loss": -6.239801406860352, "global_step": 97393, "epoch": 2318} {"train_loss": -6.386923789978027, "global_step": 97394, "epoch": 2318} {"train_loss": -6.320805549621582, "global_step": 97395, "epoch": 2318} {"train_loss": -6.270003318786621, "global_step": 97396, "epoch": 2318} {"train_loss": -6.323364587057204, "global_step": 97397, "epoch": 2318, "val_loss": 63824.265625} {"train_loss": -6.368690490722656, "global_step": 97398, "epoch": 2319} {"train_loss": -6.401505470275879, "global_step": 97399, "epoch": 2319} {"train_loss": -6.311992645263672, "global_step": 97400, "epoch": 2319} {"train_loss": -6.319128513336182, "global_step": 97401, "epoch": 2319} {"train_loss": -6.368250370025635, "global_step": 97402, "epoch": 2319} {"train_loss": -6.3193464279174805, "global_step": 97403, "epoch": 2319} {"train_loss": -6.405162811279297, "global_step": 97404, "epoch": 2319} {"train_loss": -6.3187785148620605, "global_step": 97405, "epoch": 2319} {"train_loss": -6.342782974243164, "global_step": 97406, "epoch": 2319} {"train_loss": -6.336177825927734, "global_step": 97407, "epoch": 2319} {"train_loss": -6.319616317749023, "global_step": 97408, "epoch": 2319} {"train_loss": -6.381223678588867, "global_step": 97409, "epoch": 2319} {"train_loss": -6.353314399719238, "global_step": 97410, "epoch": 2319} {"train_loss": -6.2953081130981445, "global_step": 97411, "epoch": 2319} {"train_loss": -6.362157821655273, "global_step": 97412, "epoch": 2319} {"train_loss": -6.354274272918701, "global_step": 97413, "epoch": 2319} {"train_loss": -6.327966213226318, "global_step": 97414, "epoch": 2319} {"train_loss": -6.183050632476807, "global_step": 97415, "epoch": 2319} {"train_loss": -6.2799906730651855, "global_step": 97416, "epoch": 2319} {"train_loss": -6.398892402648926, "global_step": 97417, "epoch": 2319} {"train_loss": -6.394076347351074, "global_step": 97418, "epoch": 2319} {"train_loss": -6.2625041007995605, "global_step": 97419, "epoch": 2319} {"train_loss": -6.3922343254089355, "global_step": 97420, "epoch": 2319} {"train_loss": -6.318961143493652, "global_step": 97421, "epoch": 2319} {"train_loss": -6.320964813232422, "global_step": 97422, "epoch": 2319} {"train_loss": -6.310348987579346, "global_step": 97423, "epoch": 2319} {"train_loss": -6.358877658843994, "global_step": 97424, "epoch": 2319} {"train_loss": -6.437870025634766, "global_step": 97425, "epoch": 2319} {"train_loss": -6.423614501953125, "global_step": 97426, "epoch": 2319} {"train_loss": -6.379250526428223, "global_step": 97427, "epoch": 2319} {"train_loss": -6.3863372802734375, "global_step": 97428, "epoch": 2319} {"train_loss": -6.341546058654785, "global_step": 97429, "epoch": 2319} {"train_loss": -6.312930107116699, "global_step": 97430, "epoch": 2319} {"train_loss": -6.378013610839844, "global_step": 97431, "epoch": 2319} {"train_loss": -6.381817817687988, "global_step": 97432, "epoch": 2319} {"train_loss": -6.3231706619262695, "global_step": 97433, "epoch": 2319} {"train_loss": -6.334835052490234, "global_step": 97434, "epoch": 2319} {"train_loss": -6.2366414070129395, "global_step": 97435, "epoch": 2319} {"train_loss": -6.460324287414551, "global_step": 97436, "epoch": 2319} {"train_loss": -6.322654724121094, "global_step": 97437, "epoch": 2319} {"train_loss": -6.435965538024902, "global_step": 97438, "epoch": 2319} {"train_loss": -6.347933269682384, "global_step": 97439, "epoch": 2319, "val_loss": 63679.88671875} {"train_loss": -6.323479652404785, "global_step": 97440, "epoch": 2320} {"train_loss": -6.395278453826904, "global_step": 97441, "epoch": 2320} {"train_loss": -6.410316467285156, "global_step": 97442, "epoch": 2320} {"train_loss": -6.39047908782959, "global_step": 97443, "epoch": 2320} {"train_loss": -6.363262176513672, "global_step": 97444, "epoch": 2320} {"train_loss": -6.4595184326171875, "global_step": 97445, "epoch": 2320} {"train_loss": -6.164313316345215, "global_step": 97446, "epoch": 2320} {"train_loss": -6.309436798095703, "global_step": 97447, "epoch": 2320} {"train_loss": -6.259139537811279, "global_step": 97448, "epoch": 2320} {"train_loss": -6.297977447509766, "global_step": 97449, "epoch": 2320} {"train_loss": -6.238714218139648, "global_step": 97450, "epoch": 2320} {"train_loss": -6.391971588134766, "global_step": 97451, "epoch": 2320} {"train_loss": -6.400228023529053, "global_step": 97452, "epoch": 2320} {"train_loss": -6.31375789642334, "global_step": 97453, "epoch": 2320} {"train_loss": -6.22622537612915, "global_step": 97454, "epoch": 2320} {"train_loss": -6.2972564697265625, "global_step": 97455, "epoch": 2320} {"train_loss": -6.339062213897705, "global_step": 97456, "epoch": 2320} {"train_loss": -6.243912696838379, "global_step": 97457, "epoch": 2320} {"train_loss": -6.244182586669922, "global_step": 97458, "epoch": 2320} {"train_loss": -6.138978004455566, "global_step": 97459, "epoch": 2320} {"train_loss": -6.25300931930542, "global_step": 97460, "epoch": 2320} {"train_loss": -6.3062028884887695, "global_step": 97461, "epoch": 2320} {"train_loss": -6.261872291564941, "global_step": 97462, "epoch": 2320} {"train_loss": -6.416786193847656, "global_step": 97463, "epoch": 2320} {"train_loss": -6.226485729217529, "global_step": 97464, "epoch": 2320} {"train_loss": -6.19163703918457, "global_step": 97465, "epoch": 2320} {"train_loss": -6.41826868057251, "global_step": 97466, "epoch": 2320} {"train_loss": -6.22227668762207, "global_step": 97467, "epoch": 2320} {"train_loss": -6.247818946838379, "global_step": 97468, "epoch": 2320} {"train_loss": -6.233828067779541, "global_step": 97469, "epoch": 2320} {"train_loss": -6.234732627868652, "global_step": 97470, "epoch": 2320} {"train_loss": -6.26665735244751, "global_step": 97471, "epoch": 2320} {"train_loss": -6.302441596984863, "global_step": 97472, "epoch": 2320} {"train_loss": -6.218287467956543, "global_step": 97473, "epoch": 2320} {"train_loss": -6.184144973754883, "global_step": 97474, "epoch": 2320} {"train_loss": -6.27915096282959, "global_step": 97475, "epoch": 2320} {"train_loss": -6.228592872619629, "global_step": 97476, "epoch": 2320} {"train_loss": -6.290294647216797, "global_step": 97477, "epoch": 2320} {"train_loss": -6.248877048492432, "global_step": 97478, "epoch": 2320} {"train_loss": -6.3843302726745605, "global_step": 97479, "epoch": 2320} {"train_loss": -6.264835357666016, "global_step": 97480, "epoch": 2320} {"train_loss": -6.288389217285883, "global_step": 97481, "epoch": 2320, "val_loss": 63775.33203125} {"train_loss": -6.368880271911621, "global_step": 97482, "epoch": 2321} {"train_loss": -6.285634994506836, "global_step": 97483, "epoch": 2321} {"train_loss": -6.371845722198486, "global_step": 97484, "epoch": 2321} {"train_loss": -6.321210861206055, "global_step": 97485, "epoch": 2321} {"train_loss": -6.347958087921143, "global_step": 97486, "epoch": 2321} {"train_loss": -6.294975757598877, "global_step": 97487, "epoch": 2321} {"train_loss": -6.328577518463135, "global_step": 97488, "epoch": 2321} {"train_loss": -6.298468589782715, "global_step": 97489, "epoch": 2321} {"train_loss": -6.326541900634766, "global_step": 97490, "epoch": 2321} {"train_loss": -6.264097213745117, "global_step": 97491, "epoch": 2321} {"train_loss": -6.35738468170166, "global_step": 97492, "epoch": 2321} {"train_loss": -6.2809929847717285, "global_step": 97493, "epoch": 2321} {"train_loss": -6.39279317855835, "global_step": 97494, "epoch": 2321} {"train_loss": -6.4332404136657715, "global_step": 97495, "epoch": 2321} {"train_loss": -6.279785633087158, "global_step": 97496, "epoch": 2321} {"train_loss": -6.241940021514893, "global_step": 97497, "epoch": 2321} {"train_loss": -6.382206916809082, "global_step": 97498, "epoch": 2321} {"train_loss": -6.317471027374268, "global_step": 97499, "epoch": 2321} {"train_loss": -6.3343400955200195, "global_step": 97500, "epoch": 2321} {"train_loss": -6.405943870544434, "global_step": 97501, "epoch": 2321} {"train_loss": -6.402721881866455, "global_step": 97502, "epoch": 2321} {"train_loss": -6.285933494567871, "global_step": 97503, "epoch": 2321} {"train_loss": -6.317079544067383, "global_step": 97504, "epoch": 2321} {"train_loss": -6.368152618408203, "global_step": 97505, "epoch": 2321} {"train_loss": -6.337752819061279, "global_step": 97506, "epoch": 2321} {"train_loss": -6.337156295776367, "global_step": 97507, "epoch": 2321} {"train_loss": -6.38648796081543, "global_step": 97508, "epoch": 2321} {"train_loss": -6.267972946166992, "global_step": 97509, "epoch": 2321} {"train_loss": -6.4145402908325195, "global_step": 97510, "epoch": 2321} {"train_loss": -6.425396919250488, "global_step": 97511, "epoch": 2321} {"train_loss": -6.3631157875061035, "global_step": 97512, "epoch": 2321} {"train_loss": -6.28456974029541, "global_step": 97513, "epoch": 2321} {"train_loss": -6.411219120025635, "global_step": 97514, "epoch": 2321} {"train_loss": -6.334484577178955, "global_step": 97515, "epoch": 2321} {"train_loss": -6.396032333374023, "global_step": 97516, "epoch": 2321} {"train_loss": -6.206886291503906, "global_step": 97517, "epoch": 2321} {"train_loss": -6.446580410003662, "global_step": 97518, "epoch": 2321} {"train_loss": -6.329922676086426, "global_step": 97519, "epoch": 2321} {"train_loss": -6.369551658630371, "global_step": 97520, "epoch": 2321} {"train_loss": -6.38887357711792, "global_step": 97521, "epoch": 2321} {"train_loss": -6.304415702819824, "global_step": 97522, "epoch": 2321} {"train_loss": -6.340852998551869, "global_step": 97523, "epoch": 2321, "val_loss": 63995.60546875} {"train_loss": -6.317568778991699, "global_step": 97524, "epoch": 2322} {"train_loss": -6.282304763793945, "global_step": 97525, "epoch": 2322} {"train_loss": -6.3191680908203125, "global_step": 97526, "epoch": 2322} {"train_loss": -6.155149459838867, "global_step": 97527, "epoch": 2322} {"train_loss": -6.31514310836792, "global_step": 97528, "epoch": 2322} {"train_loss": -6.2916083335876465, "global_step": 97529, "epoch": 2322} {"train_loss": -6.2422332763671875, "global_step": 97530, "epoch": 2322} {"train_loss": -6.29464864730835, "global_step": 97531, "epoch": 2322} {"train_loss": -6.267828941345215, "global_step": 97532, "epoch": 2322} {"train_loss": -6.333366394042969, "global_step": 97533, "epoch": 2322} {"train_loss": -6.429895401000977, "global_step": 97534, "epoch": 2322} {"train_loss": -6.347733497619629, "global_step": 97535, "epoch": 2322} {"train_loss": -6.308862209320068, "global_step": 97536, "epoch": 2322} {"train_loss": -6.172746658325195, "global_step": 97537, "epoch": 2322} {"train_loss": -6.34140682220459, "global_step": 97538, "epoch": 2322} {"train_loss": -6.299984931945801, "global_step": 97539, "epoch": 2322} {"train_loss": -6.2403740882873535, "global_step": 97540, "epoch": 2322} {"train_loss": -6.380563735961914, "global_step": 97541, "epoch": 2322} {"train_loss": -6.325295925140381, "global_step": 97542, "epoch": 2322} {"train_loss": -6.3090314865112305, "global_step": 97543, "epoch": 2322} {"train_loss": -6.277973175048828, "global_step": 97544, "epoch": 2322} {"train_loss": -6.3777241706848145, "global_step": 97545, "epoch": 2322} {"train_loss": -6.29814338684082, "global_step": 97546, "epoch": 2322} {"train_loss": -6.339498996734619, "global_step": 97547, "epoch": 2322} {"train_loss": -6.290914535522461, "global_step": 97548, "epoch": 2322} {"train_loss": -6.496071815490723, "global_step": 97549, "epoch": 2322} {"train_loss": -6.3065996170043945, "global_step": 97550, "epoch": 2322} {"train_loss": -6.367551803588867, "global_step": 97551, "epoch": 2322} {"train_loss": -6.385621070861816, "global_step": 97552, "epoch": 2322} {"train_loss": -6.324437618255615, "global_step": 97553, "epoch": 2322} {"train_loss": -6.438846588134766, "global_step": 97554, "epoch": 2322} {"train_loss": -6.316781044006348, "global_step": 97555, "epoch": 2322} {"train_loss": -6.342477798461914, "global_step": 97556, "epoch": 2322} {"train_loss": -6.214260101318359, "global_step": 97557, "epoch": 2322} {"train_loss": -6.3639349937438965, "global_step": 97558, "epoch": 2322} {"train_loss": -6.360050201416016, "global_step": 97559, "epoch": 2322} {"train_loss": -6.362565994262695, "global_step": 97560, "epoch": 2322} {"train_loss": -6.486668586730957, "global_step": 97561, "epoch": 2322} {"train_loss": -6.427142143249512, "global_step": 97562, "epoch": 2322} {"train_loss": -6.348511695861816, "global_step": 97563, "epoch": 2322} {"train_loss": -6.446016311645508, "global_step": 97564, "epoch": 2322} {"train_loss": -6.333156086149669, "global_step": 97565, "epoch": 2322, "val_loss": 63912.3671875} {"train_loss": -6.4225664138793945, "global_step": 97566, "epoch": 2323} {"train_loss": -6.347513198852539, "global_step": 97567, "epoch": 2323} {"train_loss": -6.352691173553467, "global_step": 97568, "epoch": 2323} {"train_loss": -6.375824928283691, "global_step": 97569, "epoch": 2323} {"train_loss": -6.271171569824219, "global_step": 97570, "epoch": 2323} {"train_loss": -6.431859016418457, "global_step": 97571, "epoch": 2323} {"train_loss": -6.358147621154785, "global_step": 97572, "epoch": 2323} {"train_loss": -6.307558536529541, "global_step": 97573, "epoch": 2323} {"train_loss": -6.3098907470703125, "global_step": 97574, "epoch": 2323} {"train_loss": -6.391249179840088, "global_step": 97575, "epoch": 2323} {"train_loss": -6.275062561035156, "global_step": 97576, "epoch": 2323} {"train_loss": -6.349954605102539, "global_step": 97577, "epoch": 2323} {"train_loss": -6.272046089172363, "global_step": 97578, "epoch": 2323} {"train_loss": -6.318007469177246, "global_step": 97579, "epoch": 2323} {"train_loss": -6.2560224533081055, "global_step": 97580, "epoch": 2323} {"train_loss": -6.378398895263672, "global_step": 97581, "epoch": 2323} {"train_loss": -6.35296630859375, "global_step": 97582, "epoch": 2323} {"train_loss": -6.312673568725586, "global_step": 97583, "epoch": 2323} {"train_loss": -6.385721206665039, "global_step": 97584, "epoch": 2323} {"train_loss": -6.26617431640625, "global_step": 97585, "epoch": 2323} {"train_loss": -6.275892734527588, "global_step": 97586, "epoch": 2323} {"train_loss": -6.276881217956543, "global_step": 97587, "epoch": 2323} {"train_loss": -6.296512603759766, "global_step": 97588, "epoch": 2323} {"train_loss": -6.257844924926758, "global_step": 97589, "epoch": 2323} {"train_loss": -6.2685627937316895, "global_step": 97590, "epoch": 2323} {"train_loss": -6.458146095275879, "global_step": 97591, "epoch": 2323} {"train_loss": -6.266024112701416, "global_step": 97592, "epoch": 2323} {"train_loss": -6.274131774902344, "global_step": 97593, "epoch": 2323} {"train_loss": -6.314453601837158, "global_step": 97594, "epoch": 2323} {"train_loss": -6.158996105194092, "global_step": 97595, "epoch": 2323} {"train_loss": -6.28926944732666, "global_step": 97596, "epoch": 2323} {"train_loss": -6.304634094238281, "global_step": 97597, "epoch": 2323} {"train_loss": -6.211929798126221, "global_step": 97598, "epoch": 2323} {"train_loss": -6.315525054931641, "global_step": 97599, "epoch": 2323} {"train_loss": -6.222765922546387, "global_step": 97600, "epoch": 2323} {"train_loss": -6.267324447631836, "global_step": 97601, "epoch": 2323} {"train_loss": -6.164281368255615, "global_step": 97602, "epoch": 2323} {"train_loss": -6.167364120483398, "global_step": 97603, "epoch": 2323} {"train_loss": -6.3251471519470215, "global_step": 97604, "epoch": 2323} {"train_loss": -6.2254815101623535, "global_step": 97605, "epoch": 2323} {"train_loss": -6.3381147384643555, "global_step": 97606, "epoch": 2323} {"train_loss": -6.302053792136056, "global_step": 97607, "epoch": 2323, "val_loss": 64154.41796875} {"train_loss": -6.281275272369385, "global_step": 97608, "epoch": 2324} {"train_loss": -6.244419574737549, "global_step": 97609, "epoch": 2324} {"train_loss": -6.322055816650391, "global_step": 97610, "epoch": 2324} {"train_loss": -6.384607315063477, "global_step": 97611, "epoch": 2324} {"train_loss": -6.23433256149292, "global_step": 97612, "epoch": 2324} {"train_loss": -6.2569732666015625, "global_step": 97613, "epoch": 2324} {"train_loss": -6.360781669616699, "global_step": 97614, "epoch": 2324} {"train_loss": -6.341342926025391, "global_step": 97615, "epoch": 2324} {"train_loss": -6.353026390075684, "global_step": 97616, "epoch": 2324} {"train_loss": -6.333125114440918, "global_step": 97617, "epoch": 2324} {"train_loss": -6.309295654296875, "global_step": 97618, "epoch": 2324} {"train_loss": -6.20931339263916, "global_step": 97619, "epoch": 2324} {"train_loss": -6.238368034362793, "global_step": 97620, "epoch": 2324} {"train_loss": -6.3412184715271, "global_step": 97621, "epoch": 2324} {"train_loss": -6.20197057723999, "global_step": 97622, "epoch": 2324} {"train_loss": -6.3460235595703125, "global_step": 97623, "epoch": 2324} {"train_loss": -6.297380447387695, "global_step": 97624, "epoch": 2324} {"train_loss": -6.421334266662598, "global_step": 97625, "epoch": 2324} {"train_loss": -6.424056053161621, "global_step": 97626, "epoch": 2324} {"train_loss": -6.238916397094727, "global_step": 97627, "epoch": 2324} {"train_loss": -6.282081127166748, "global_step": 97628, "epoch": 2324} {"train_loss": -6.313104629516602, "global_step": 97629, "epoch": 2324} {"train_loss": -6.250414848327637, "global_step": 97630, "epoch": 2324} {"train_loss": -6.359832763671875, "global_step": 97631, "epoch": 2324} {"train_loss": -6.303808212280273, "global_step": 97632, "epoch": 2324} {"train_loss": -6.341114044189453, "global_step": 97633, "epoch": 2324} {"train_loss": -6.499879837036133, "global_step": 97634, "epoch": 2324} {"train_loss": -6.414414405822754, "global_step": 97635, "epoch": 2324} {"train_loss": -6.391898155212402, "global_step": 97636, "epoch": 2324} {"train_loss": -6.311387062072754, "global_step": 97637, "epoch": 2324} {"train_loss": -6.4543046951293945, "global_step": 97638, "epoch": 2324} {"train_loss": -6.361424446105957, "global_step": 97639, "epoch": 2324} {"train_loss": -6.375813961029053, "global_step": 97640, "epoch": 2324} {"train_loss": -6.425558090209961, "global_step": 97641, "epoch": 2324} {"train_loss": -6.173071384429932, "global_step": 97642, "epoch": 2324} {"train_loss": -6.273602485656738, "global_step": 97643, "epoch": 2324} {"train_loss": -6.372803211212158, "global_step": 97644, "epoch": 2324} {"train_loss": -6.355997562408447, "global_step": 97645, "epoch": 2324} {"train_loss": -6.286945343017578, "global_step": 97646, "epoch": 2324} {"train_loss": -6.308582782745361, "global_step": 97647, "epoch": 2324} {"train_loss": -6.244749069213867, "global_step": 97648, "epoch": 2324} {"train_loss": -6.326164461317516, "global_step": 97649, "epoch": 2324, "val_loss": 63839.1875} {"train_loss": -6.203405380249023, "global_step": 97650, "epoch": 2325} {"train_loss": -6.348997116088867, "global_step": 97651, "epoch": 2325} {"train_loss": -6.316454887390137, "global_step": 97652, "epoch": 2325} {"train_loss": -6.351357936859131, "global_step": 97653, "epoch": 2325} {"train_loss": -6.402968883514404, "global_step": 97654, "epoch": 2325} {"train_loss": -6.441773414611816, "global_step": 97655, "epoch": 2325} {"train_loss": -6.234480857849121, "global_step": 97656, "epoch": 2325} {"train_loss": -6.295445919036865, "global_step": 97657, "epoch": 2325} {"train_loss": -6.296781539916992, "global_step": 97658, "epoch": 2325} {"train_loss": -6.3951873779296875, "global_step": 97659, "epoch": 2325} {"train_loss": -6.284679412841797, "global_step": 97660, "epoch": 2325} {"train_loss": -6.282607555389404, "global_step": 97661, "epoch": 2325} {"train_loss": -6.358275890350342, "global_step": 97662, "epoch": 2325} {"train_loss": -6.352320671081543, "global_step": 97663, "epoch": 2325} {"train_loss": -6.317108631134033, "global_step": 97664, "epoch": 2325} {"train_loss": -6.333576202392578, "global_step": 97665, "epoch": 2325} {"train_loss": -6.374799728393555, "global_step": 97666, "epoch": 2325} {"train_loss": -6.36434268951416, "global_step": 97667, "epoch": 2325} {"train_loss": -6.347104072570801, "global_step": 97668, "epoch": 2325} {"train_loss": -6.226108551025391, "global_step": 97669, "epoch": 2325} {"train_loss": -6.434143543243408, "global_step": 97670, "epoch": 2325} {"train_loss": -6.385401248931885, "global_step": 97671, "epoch": 2325} {"train_loss": -6.466451644897461, "global_step": 97672, "epoch": 2325} {"train_loss": -6.467253684997559, "global_step": 97673, "epoch": 2325} {"train_loss": -6.265207290649414, "global_step": 97674, "epoch": 2325} {"train_loss": -6.490483283996582, "global_step": 97675, "epoch": 2325} {"train_loss": -6.41684627532959, "global_step": 97676, "epoch": 2325} {"train_loss": -6.335353851318359, "global_step": 97677, "epoch": 2325} {"train_loss": -6.464202404022217, "global_step": 97678, "epoch": 2325} {"train_loss": -6.465578079223633, "global_step": 97679, "epoch": 2325} {"train_loss": -6.45184850692749, "global_step": 97680, "epoch": 2325} {"train_loss": -6.283443927764893, "global_step": 97681, "epoch": 2325} {"train_loss": -6.402599334716797, "global_step": 97682, "epoch": 2325} {"train_loss": -6.396719932556152, "global_step": 97683, "epoch": 2325} {"train_loss": -6.3380560874938965, "global_step": 97684, "epoch": 2325} {"train_loss": -6.43039608001709, "global_step": 97685, "epoch": 2325} {"train_loss": -6.404711723327637, "global_step": 97686, "epoch": 2325} {"train_loss": -6.441195964813232, "global_step": 97687, "epoch": 2325} {"train_loss": -6.351637840270996, "global_step": 97688, "epoch": 2325} {"train_loss": -6.39506721496582, "global_step": 97689, "epoch": 2325} {"train_loss": -6.409575462341309, "global_step": 97690, "epoch": 2325} {"train_loss": -6.368645940508161, "global_step": 97691, "epoch": 2325, "val_loss": 63661.17578125} {"train_loss": -6.447355270385742, "global_step": 97692, "epoch": 2326} {"train_loss": -6.35599946975708, "global_step": 97693, "epoch": 2326} {"train_loss": -6.363377094268799, "global_step": 97694, "epoch": 2326} {"train_loss": -6.3289475440979, "global_step": 97695, "epoch": 2326} {"train_loss": -6.468889236450195, "global_step": 97696, "epoch": 2326} {"train_loss": -6.38840913772583, "global_step": 97697, "epoch": 2326} {"train_loss": -6.382140159606934, "global_step": 97698, "epoch": 2326} {"train_loss": -6.420541763305664, "global_step": 97699, "epoch": 2326} {"train_loss": -6.3871259689331055, "global_step": 97700, "epoch": 2326} {"train_loss": -6.308656692504883, "global_step": 97701, "epoch": 2326} {"train_loss": -6.300197601318359, "global_step": 97702, "epoch": 2326} {"train_loss": -6.390728950500488, "global_step": 97703, "epoch": 2326} {"train_loss": -6.300374984741211, "global_step": 97704, "epoch": 2326} {"train_loss": -6.330564498901367, "global_step": 97705, "epoch": 2326} {"train_loss": -6.335911273956299, "global_step": 97706, "epoch": 2326} {"train_loss": -6.3770904541015625, "global_step": 97707, "epoch": 2326} {"train_loss": -6.44415807723999, "global_step": 97708, "epoch": 2326} {"train_loss": -6.358945846557617, "global_step": 97709, "epoch": 2326} {"train_loss": -6.376613616943359, "global_step": 97710, "epoch": 2326} {"train_loss": -6.422461032867432, "global_step": 97711, "epoch": 2326} {"train_loss": -6.318795680999756, "global_step": 97712, "epoch": 2326} {"train_loss": -6.310262680053711, "global_step": 97713, "epoch": 2326} {"train_loss": -6.2813873291015625, "global_step": 97714, "epoch": 2326} {"train_loss": -6.281506538391113, "global_step": 97715, "epoch": 2326} {"train_loss": -6.3817901611328125, "global_step": 97716, "epoch": 2326} {"train_loss": -6.3786492347717285, "global_step": 97717, "epoch": 2326} {"train_loss": -6.345429420471191, "global_step": 97718, "epoch": 2326} {"train_loss": -6.238935470581055, "global_step": 97719, "epoch": 2326} {"train_loss": -6.411373138427734, "global_step": 97720, "epoch": 2326} {"train_loss": -6.430816173553467, "global_step": 97721, "epoch": 2326} {"train_loss": -6.369175910949707, "global_step": 97722, "epoch": 2326} {"train_loss": -6.216037750244141, "global_step": 97723, "epoch": 2326} {"train_loss": -6.3779497146606445, "global_step": 97724, "epoch": 2326} {"train_loss": -6.35300350189209, "global_step": 97725, "epoch": 2326} {"train_loss": -6.34765625, "global_step": 97726, "epoch": 2326} {"train_loss": -6.306900978088379, "global_step": 97727, "epoch": 2326} {"train_loss": -6.29123592376709, "global_step": 97728, "epoch": 2326} {"train_loss": -6.262934684753418, "global_step": 97729, "epoch": 2326} {"train_loss": -6.342884540557861, "global_step": 97730, "epoch": 2326} {"train_loss": -6.394346237182617, "global_step": 97731, "epoch": 2326} {"train_loss": -6.452760219573975, "global_step": 97732, "epoch": 2326} {"train_loss": -6.353766588937669, "global_step": 97733, "epoch": 2326, "val_loss": 63968.06640625} {"train_loss": -6.384892463684082, "global_step": 97734, "epoch": 2327} {"train_loss": -6.28394079208374, "global_step": 97735, "epoch": 2327} {"train_loss": -6.3124589920043945, "global_step": 97736, "epoch": 2327} {"train_loss": -6.293753623962402, "global_step": 97737, "epoch": 2327} {"train_loss": -6.257537841796875, "global_step": 97738, "epoch": 2327} {"train_loss": -6.421804904937744, "global_step": 97739, "epoch": 2327} {"train_loss": -6.344725608825684, "global_step": 97740, "epoch": 2327} {"train_loss": -6.4081830978393555, "global_step": 97741, "epoch": 2327} {"train_loss": -6.3477911949157715, "global_step": 97742, "epoch": 2327} {"train_loss": -6.2870612144470215, "global_step": 97743, "epoch": 2327} {"train_loss": -6.3310651779174805, "global_step": 97744, "epoch": 2327} {"train_loss": -6.287596702575684, "global_step": 97745, "epoch": 2327} {"train_loss": -6.264723300933838, "global_step": 97746, "epoch": 2327} {"train_loss": -6.375006675720215, "global_step": 97747, "epoch": 2327} {"train_loss": -6.289828300476074, "global_step": 97748, "epoch": 2327} {"train_loss": -6.2995734214782715, "global_step": 97749, "epoch": 2327} {"train_loss": -6.351840019226074, "global_step": 97750, "epoch": 2327} {"train_loss": -6.352633953094482, "global_step": 97751, "epoch": 2327} {"train_loss": -6.44025993347168, "global_step": 97752, "epoch": 2327} {"train_loss": -6.296696662902832, "global_step": 97753, "epoch": 2327} {"train_loss": -6.372008323669434, "global_step": 97754, "epoch": 2327} {"train_loss": -6.389862537384033, "global_step": 97755, "epoch": 2327} {"train_loss": -6.335230350494385, "global_step": 97756, "epoch": 2327} {"train_loss": -6.2904052734375, "global_step": 97757, "epoch": 2327} {"train_loss": -6.30987548828125, "global_step": 97758, "epoch": 2327} {"train_loss": -6.342570781707764, "global_step": 97759, "epoch": 2327} {"train_loss": -6.3471198081970215, "global_step": 97760, "epoch": 2327} {"train_loss": -6.401895523071289, "global_step": 97761, "epoch": 2327} {"train_loss": -6.454171180725098, "global_step": 97762, "epoch": 2327} {"train_loss": -6.418513298034668, "global_step": 97763, "epoch": 2327} {"train_loss": -6.313577175140381, "global_step": 97764, "epoch": 2327} {"train_loss": -6.343339920043945, "global_step": 97765, "epoch": 2327} {"train_loss": -6.1974639892578125, "global_step": 97766, "epoch": 2327} {"train_loss": -6.349149227142334, "global_step": 97767, "epoch": 2327} {"train_loss": -6.398595809936523, "global_step": 97768, "epoch": 2327} {"train_loss": -6.309881210327148, "global_step": 97769, "epoch": 2327} {"train_loss": -6.342787742614746, "global_step": 97770, "epoch": 2327} {"train_loss": -6.3450927734375, "global_step": 97771, "epoch": 2327} {"train_loss": -6.193826675415039, "global_step": 97772, "epoch": 2327} {"train_loss": -6.234336853027344, "global_step": 97773, "epoch": 2327} {"train_loss": -6.263294696807861, "global_step": 97774, "epoch": 2327} {"train_loss": -6.330524251574562, "global_step": 97775, "epoch": 2327, "val_loss": 64031.6328125} {"train_loss": -6.178443908691406, "global_step": 97776, "epoch": 2328} {"train_loss": -6.438849449157715, "global_step": 97777, "epoch": 2328} {"train_loss": -6.23390531539917, "global_step": 97778, "epoch": 2328} {"train_loss": -6.278137683868408, "global_step": 97779, "epoch": 2328} {"train_loss": -6.339560508728027, "global_step": 97780, "epoch": 2328} {"train_loss": -6.359440803527832, "global_step": 97781, "epoch": 2328} {"train_loss": -6.239912033081055, "global_step": 97782, "epoch": 2328} {"train_loss": -6.295372009277344, "global_step": 97783, "epoch": 2328} {"train_loss": -6.254574775695801, "global_step": 97784, "epoch": 2328} {"train_loss": -6.185443878173828, "global_step": 97785, "epoch": 2328} {"train_loss": -6.3006086349487305, "global_step": 97786, "epoch": 2328} {"train_loss": -6.307718276977539, "global_step": 97787, "epoch": 2328} {"train_loss": -6.299211502075195, "global_step": 97788, "epoch": 2328} {"train_loss": -6.235922813415527, "global_step": 97789, "epoch": 2328} {"train_loss": -6.302863597869873, "global_step": 97790, "epoch": 2328} {"train_loss": -6.259737968444824, "global_step": 97791, "epoch": 2328} {"train_loss": -6.245818138122559, "global_step": 97792, "epoch": 2328} {"train_loss": -6.269495964050293, "global_step": 97793, "epoch": 2328} {"train_loss": -6.332020282745361, "global_step": 97794, "epoch": 2328} {"train_loss": -6.215888023376465, "global_step": 97795, "epoch": 2328} {"train_loss": -6.358870506286621, "global_step": 97796, "epoch": 2328} {"train_loss": -6.366430282592773, "global_step": 97797, "epoch": 2328} {"train_loss": -6.415698051452637, "global_step": 97798, "epoch": 2328} {"train_loss": -6.329680919647217, "global_step": 97799, "epoch": 2328} {"train_loss": -6.408771514892578, "global_step": 97800, "epoch": 2328} {"train_loss": -6.403357028961182, "global_step": 97801, "epoch": 2328} {"train_loss": -6.331332206726074, "global_step": 97802, "epoch": 2328} {"train_loss": -6.197235107421875, "global_step": 97803, "epoch": 2328} {"train_loss": -6.249361991882324, "global_step": 97804, "epoch": 2328} {"train_loss": -6.3678178787231445, "global_step": 97805, "epoch": 2328} {"train_loss": -6.337486743927002, "global_step": 97806, "epoch": 2328} {"train_loss": -6.431894302368164, "global_step": 97807, "epoch": 2328} {"train_loss": -6.325075149536133, "global_step": 97808, "epoch": 2328} {"train_loss": -6.264944076538086, "global_step": 97809, "epoch": 2328} {"train_loss": -6.419406890869141, "global_step": 97810, "epoch": 2328} {"train_loss": -6.274540901184082, "global_step": 97811, "epoch": 2328} {"train_loss": -6.441594123840332, "global_step": 97812, "epoch": 2328} {"train_loss": -6.313654899597168, "global_step": 97813, "epoch": 2328} {"train_loss": -6.418723106384277, "global_step": 97814, "epoch": 2328} {"train_loss": -6.170082092285156, "global_step": 97815, "epoch": 2328} {"train_loss": -6.199509620666504, "global_step": 97816, "epoch": 2328} {"train_loss": -6.305494297118414, "global_step": 97817, "epoch": 2328, "val_loss": 63886.40234375} {"train_loss": -6.280999183654785, "global_step": 97818, "epoch": 2329} {"train_loss": -6.315103530883789, "global_step": 97819, "epoch": 2329} {"train_loss": -6.329026222229004, "global_step": 97820, "epoch": 2329} {"train_loss": -6.444775104522705, "global_step": 97821, "epoch": 2329} {"train_loss": -6.521839618682861, "global_step": 97822, "epoch": 2329} {"train_loss": -6.273037910461426, "global_step": 97823, "epoch": 2329} {"train_loss": -6.259260654449463, "global_step": 97824, "epoch": 2329} {"train_loss": -6.379127502441406, "global_step": 97825, "epoch": 2329} {"train_loss": -6.486377239227295, "global_step": 97826, "epoch": 2329} {"train_loss": -6.163064002990723, "global_step": 97827, "epoch": 2329} {"train_loss": -6.359619140625, "global_step": 97828, "epoch": 2329} {"train_loss": -6.3841729164123535, "global_step": 97829, "epoch": 2329} {"train_loss": -6.258567810058594, "global_step": 97830, "epoch": 2329} {"train_loss": -6.365707874298096, "global_step": 97831, "epoch": 2329} {"train_loss": -6.3287034034729, "global_step": 97832, "epoch": 2329} {"train_loss": -6.315805912017822, "global_step": 97833, "epoch": 2329} {"train_loss": -6.409030914306641, "global_step": 97834, "epoch": 2329} {"train_loss": -6.301239490509033, "global_step": 97835, "epoch": 2329} {"train_loss": -6.380437850952148, "global_step": 97836, "epoch": 2329} {"train_loss": -6.100035667419434, "global_step": 97837, "epoch": 2329} {"train_loss": -6.360118865966797, "global_step": 97838, "epoch": 2329} {"train_loss": -6.398914813995361, "global_step": 97839, "epoch": 2329} {"train_loss": -6.162402153015137, "global_step": 97840, "epoch": 2329} {"train_loss": -6.3253254890441895, "global_step": 97841, "epoch": 2329} {"train_loss": -6.3628411293029785, "global_step": 97842, "epoch": 2329} {"train_loss": -6.2434401512146, "global_step": 97843, "epoch": 2329} {"train_loss": -6.3501081466674805, "global_step": 97844, "epoch": 2329} {"train_loss": -6.328816890716553, "global_step": 97845, "epoch": 2329} {"train_loss": -6.386263847351074, "global_step": 97846, "epoch": 2329} {"train_loss": -6.289027214050293, "global_step": 97847, "epoch": 2329} {"train_loss": -6.309230327606201, "global_step": 97848, "epoch": 2329} {"train_loss": -6.495841979980469, "global_step": 97849, "epoch": 2329} {"train_loss": -6.295767784118652, "global_step": 97850, "epoch": 2329} {"train_loss": -6.222092628479004, "global_step": 97851, "epoch": 2329} {"train_loss": -6.384418487548828, "global_step": 97852, "epoch": 2329} {"train_loss": -6.323232173919678, "global_step": 97853, "epoch": 2329} {"train_loss": -6.39408540725708, "global_step": 97854, "epoch": 2329} {"train_loss": -6.366940021514893, "global_step": 97855, "epoch": 2329} {"train_loss": -6.396261215209961, "global_step": 97856, "epoch": 2329} {"train_loss": -6.2435503005981445, "global_step": 97857, "epoch": 2329} {"train_loss": -6.3318400382995605, "global_step": 97858, "epoch": 2329} {"train_loss": -6.329676196688697, "global_step": 97859, "epoch": 2329, "val_loss": 63802.8203125} {"train_loss": -6.321710586547852, "global_step": 97860, "epoch": 2330} {"train_loss": -6.270183086395264, "global_step": 97861, "epoch": 2330} {"train_loss": -6.482924461364746, "global_step": 97862, "epoch": 2330} {"train_loss": -6.3083906173706055, "global_step": 97863, "epoch": 2330} {"train_loss": -6.244068145751953, "global_step": 97864, "epoch": 2330} {"train_loss": -6.3589959144592285, "global_step": 97865, "epoch": 2330} {"train_loss": -6.241155624389648, "global_step": 97866, "epoch": 2330} {"train_loss": -6.247127532958984, "global_step": 97867, "epoch": 2330} {"train_loss": -6.402742862701416, "global_step": 97868, "epoch": 2330} {"train_loss": -6.327339172363281, "global_step": 97869, "epoch": 2330} {"train_loss": -6.37183952331543, "global_step": 97870, "epoch": 2330} {"train_loss": -6.230889320373535, "global_step": 97871, "epoch": 2330} {"train_loss": -6.3890838623046875, "global_step": 97872, "epoch": 2330} {"train_loss": -6.367584228515625, "global_step": 97873, "epoch": 2330} {"train_loss": -6.36775016784668, "global_step": 97874, "epoch": 2330} {"train_loss": -6.343205451965332, "global_step": 97875, "epoch": 2330} {"train_loss": -6.365631103515625, "global_step": 97876, "epoch": 2330} {"train_loss": -6.406198501586914, "global_step": 97877, "epoch": 2330} {"train_loss": -6.389145851135254, "global_step": 97878, "epoch": 2330} {"train_loss": -6.442464828491211, "global_step": 97879, "epoch": 2330} {"train_loss": -6.413021087646484, "global_step": 97880, "epoch": 2330} {"train_loss": -6.481841564178467, "global_step": 97881, "epoch": 2330} {"train_loss": -6.351342678070068, "global_step": 97882, "epoch": 2330} {"train_loss": -6.30474328994751, "global_step": 97883, "epoch": 2330} {"train_loss": -6.398307800292969, "global_step": 97884, "epoch": 2330} {"train_loss": -6.25963020324707, "global_step": 97885, "epoch": 2330} {"train_loss": -6.385642051696777, "global_step": 97886, "epoch": 2330} {"train_loss": -6.19655704498291, "global_step": 97887, "epoch": 2330} {"train_loss": -6.357922554016113, "global_step": 97888, "epoch": 2330} {"train_loss": -6.390255451202393, "global_step": 97889, "epoch": 2330} {"train_loss": -6.366812705993652, "global_step": 97890, "epoch": 2330} {"train_loss": -6.290650367736816, "global_step": 97891, "epoch": 2330} {"train_loss": -6.3093061447143555, "global_step": 97892, "epoch": 2330} {"train_loss": -6.325174331665039, "global_step": 97893, "epoch": 2330} {"train_loss": -6.337867736816406, "global_step": 97894, "epoch": 2330} {"train_loss": -6.3713860511779785, "global_step": 97895, "epoch": 2330} {"train_loss": -6.357305526733398, "global_step": 97896, "epoch": 2330} {"train_loss": -6.273719787597656, "global_step": 97897, "epoch": 2330} {"train_loss": -6.311164855957031, "global_step": 97898, "epoch": 2330} {"train_loss": -6.393214225769043, "global_step": 97899, "epoch": 2330} {"train_loss": -6.4517340660095215, "global_step": 97900, "epoch": 2330} {"train_loss": -6.346224955150059, "global_step": 97901, "epoch": 2330, "val_loss": 63840.64453125} {"train_loss": -6.245250225067139, "global_step": 97902, "epoch": 2331} {"train_loss": -6.370646953582764, "global_step": 97903, "epoch": 2331} {"train_loss": -6.366667747497559, "global_step": 97904, "epoch": 2331} {"train_loss": -6.3925886154174805, "global_step": 97905, "epoch": 2331} {"train_loss": -6.338130950927734, "global_step": 97906, "epoch": 2331} {"train_loss": -6.294735908508301, "global_step": 97907, "epoch": 2331} {"train_loss": -6.461146354675293, "global_step": 97908, "epoch": 2331} {"train_loss": -6.269779205322266, "global_step": 97909, "epoch": 2331} {"train_loss": -6.241761684417725, "global_step": 97910, "epoch": 2331} {"train_loss": -6.296783924102783, "global_step": 97911, "epoch": 2331} {"train_loss": -6.181693077087402, "global_step": 97912, "epoch": 2331} {"train_loss": -6.279061317443848, "global_step": 97913, "epoch": 2331} {"train_loss": -6.233870506286621, "global_step": 97914, "epoch": 2331} {"train_loss": -6.368114471435547, "global_step": 97915, "epoch": 2331} {"train_loss": -6.430066108703613, "global_step": 97916, "epoch": 2331} {"train_loss": -6.239534854888916, "global_step": 97917, "epoch": 2331} {"train_loss": -6.1455488204956055, "global_step": 97918, "epoch": 2331} {"train_loss": -6.316477298736572, "global_step": 97919, "epoch": 2331} {"train_loss": -6.435638427734375, "global_step": 97920, "epoch": 2331} {"train_loss": -6.227678298950195, "global_step": 97921, "epoch": 2331} {"train_loss": -6.272892951965332, "global_step": 97922, "epoch": 2331} {"train_loss": -6.216771125793457, "global_step": 97923, "epoch": 2331} {"train_loss": -6.352011203765869, "global_step": 97924, "epoch": 2331} {"train_loss": -6.267524719238281, "global_step": 97925, "epoch": 2331} {"train_loss": -6.198009490966797, "global_step": 97926, "epoch": 2331} {"train_loss": -6.270351886749268, "global_step": 97927, "epoch": 2331} {"train_loss": -6.246517181396484, "global_step": 97928, "epoch": 2331} {"train_loss": -6.379255294799805, "global_step": 97929, "epoch": 2331} {"train_loss": -6.4134111404418945, "global_step": 97930, "epoch": 2331} {"train_loss": -6.308183193206787, "global_step": 97931, "epoch": 2331} {"train_loss": -6.2253007888793945, "global_step": 97932, "epoch": 2331} {"train_loss": -6.3959550857543945, "global_step": 97933, "epoch": 2331} {"train_loss": -6.331150531768799, "global_step": 97934, "epoch": 2331} {"train_loss": -6.407870292663574, "global_step": 97935, "epoch": 2331} {"train_loss": -6.3152055740356445, "global_step": 97936, "epoch": 2331} {"train_loss": -6.315451145172119, "global_step": 97937, "epoch": 2331} {"train_loss": -6.302281856536865, "global_step": 97938, "epoch": 2331} {"train_loss": -6.357994556427002, "global_step": 97939, "epoch": 2331} {"train_loss": -6.261273384094238, "global_step": 97940, "epoch": 2331} {"train_loss": -6.493246078491211, "global_step": 97941, "epoch": 2331} {"train_loss": -6.228238582611084, "global_step": 97942, "epoch": 2331} {"train_loss": -6.308028993152437, "global_step": 97943, "epoch": 2331, "val_loss": 63784.33984375} {"train_loss": -6.275875091552734, "global_step": 97944, "epoch": 2332} {"train_loss": -6.358574867248535, "global_step": 97945, "epoch": 2332} {"train_loss": -6.446096420288086, "global_step": 97946, "epoch": 2332} {"train_loss": -6.375274181365967, "global_step": 97947, "epoch": 2332} {"train_loss": -6.272597312927246, "global_step": 97948, "epoch": 2332} {"train_loss": -6.420280933380127, "global_step": 97949, "epoch": 2332} {"train_loss": -6.3645734786987305, "global_step": 97950, "epoch": 2332} {"train_loss": -6.453696250915527, "global_step": 97951, "epoch": 2332} {"train_loss": -6.333394527435303, "global_step": 97952, "epoch": 2332} {"train_loss": -6.448114395141602, "global_step": 97953, "epoch": 2332} {"train_loss": -6.459173202514648, "global_step": 97954, "epoch": 2332} {"train_loss": -6.329909801483154, "global_step": 97955, "epoch": 2332} {"train_loss": -6.299572467803955, "global_step": 97956, "epoch": 2332} {"train_loss": -6.231818199157715, "global_step": 97957, "epoch": 2332} {"train_loss": -6.359678268432617, "global_step": 97958, "epoch": 2332} {"train_loss": -6.397955417633057, "global_step": 97959, "epoch": 2332} {"train_loss": -6.369560241699219, "global_step": 97960, "epoch": 2332} {"train_loss": -6.364857196807861, "global_step": 97961, "epoch": 2332} {"train_loss": -6.378442764282227, "global_step": 97962, "epoch": 2332} {"train_loss": -6.205313682556152, "global_step": 97963, "epoch": 2332} {"train_loss": -6.37783145904541, "global_step": 97964, "epoch": 2332} {"train_loss": -6.225994110107422, "global_step": 97965, "epoch": 2332} {"train_loss": -6.280939102172852, "global_step": 97966, "epoch": 2332} {"train_loss": -6.268856525421143, "global_step": 97967, "epoch": 2332} {"train_loss": -6.1951494216918945, "global_step": 97968, "epoch": 2332} {"train_loss": -6.48784065246582, "global_step": 97969, "epoch": 2332} {"train_loss": -6.300985813140869, "global_step": 97970, "epoch": 2332} {"train_loss": -6.153156280517578, "global_step": 97971, "epoch": 2332} {"train_loss": -6.438830375671387, "global_step": 97972, "epoch": 2332} {"train_loss": -6.258023738861084, "global_step": 97973, "epoch": 2332} {"train_loss": -6.302826881408691, "global_step": 97974, "epoch": 2332} {"train_loss": -6.370881080627441, "global_step": 97975, "epoch": 2332} {"train_loss": -6.283347129821777, "global_step": 97976, "epoch": 2332} {"train_loss": -6.434454441070557, "global_step": 97977, "epoch": 2332} {"train_loss": -6.339078426361084, "global_step": 97978, "epoch": 2332} {"train_loss": -6.316671371459961, "global_step": 97979, "epoch": 2332} {"train_loss": -6.286120891571045, "global_step": 97980, "epoch": 2332} {"train_loss": -6.412844657897949, "global_step": 97981, "epoch": 2332} {"train_loss": -6.288138389587402, "global_step": 97982, "epoch": 2332} {"train_loss": -6.319025039672852, "global_step": 97983, "epoch": 2332} {"train_loss": -6.321950912475586, "global_step": 97984, "epoch": 2332} {"train_loss": -6.335315431867327, "global_step": 97985, "epoch": 2332, "val_loss": 63911.57421875} {"train_loss": -6.2113189697265625, "global_step": 97986, "epoch": 2333} {"train_loss": -6.335129737854004, "global_step": 97987, "epoch": 2333} {"train_loss": -6.30620813369751, "global_step": 97988, "epoch": 2333} {"train_loss": -6.29983377456665, "global_step": 97989, "epoch": 2333} {"train_loss": -6.3455986976623535, "global_step": 97990, "epoch": 2333} {"train_loss": -6.346963882446289, "global_step": 97991, "epoch": 2333} {"train_loss": -6.442468643188477, "global_step": 97992, "epoch": 2333} {"train_loss": -6.286837100982666, "global_step": 97993, "epoch": 2333} {"train_loss": -6.222458362579346, "global_step": 97994, "epoch": 2333} {"train_loss": -6.38775634765625, "global_step": 97995, "epoch": 2333} {"train_loss": -6.402000904083252, "global_step": 97996, "epoch": 2333} {"train_loss": -6.476227283477783, "global_step": 97997, "epoch": 2333} {"train_loss": -6.4181013107299805, "global_step": 97998, "epoch": 2333} {"train_loss": -6.373279094696045, "global_step": 97999, "epoch": 2333} {"train_loss": -6.329134941101074, "global_step": 98000, "epoch": 2333} {"train_loss": -6.410064697265625, "global_step": 98001, "epoch": 2333} {"train_loss": -6.3472137451171875, "global_step": 98002, "epoch": 2333} {"train_loss": -6.338030815124512, "global_step": 98003, "epoch": 2333} {"train_loss": -6.296263217926025, "global_step": 98004, "epoch": 2333} {"train_loss": -6.370711326599121, "global_step": 98005, "epoch": 2333} {"train_loss": -6.34029483795166, "global_step": 98006, "epoch": 2333} {"train_loss": -6.35690975189209, "global_step": 98007, "epoch": 2333} {"train_loss": -6.381466388702393, "global_step": 98008, "epoch": 2333} {"train_loss": -6.269232749938965, "global_step": 98009, "epoch": 2333} {"train_loss": -6.445624351501465, "global_step": 98010, "epoch": 2333} {"train_loss": -6.3577799797058105, "global_step": 98011, "epoch": 2333} {"train_loss": -6.2896952629089355, "global_step": 98012, "epoch": 2333} {"train_loss": -6.296541213989258, "global_step": 98013, "epoch": 2333} {"train_loss": -6.366353988647461, "global_step": 98014, "epoch": 2333} {"train_loss": -6.445079803466797, "global_step": 98015, "epoch": 2333} {"train_loss": -6.31883430480957, "global_step": 98016, "epoch": 2333} {"train_loss": -6.342654228210449, "global_step": 98017, "epoch": 2333} {"train_loss": -6.2654290199279785, "global_step": 98018, "epoch": 2333} {"train_loss": -6.1949334144592285, "global_step": 98019, "epoch": 2333} {"train_loss": -6.383108139038086, "global_step": 98020, "epoch": 2333} {"train_loss": -6.252103328704834, "global_step": 98021, "epoch": 2333} {"train_loss": -6.184429168701172, "global_step": 98022, "epoch": 2333} {"train_loss": -6.3202924728393555, "global_step": 98023, "epoch": 2333} {"train_loss": -6.449831008911133, "global_step": 98024, "epoch": 2333} {"train_loss": -6.329651832580566, "global_step": 98025, "epoch": 2333} {"train_loss": -6.370916366577148, "global_step": 98026, "epoch": 2333} {"train_loss": -6.340108530861991, "global_step": 98027, "epoch": 2333, "val_loss": 63973.1796875} {"train_loss": -6.290541648864746, "global_step": 98028, "epoch": 2334} {"train_loss": -6.484980583190918, "global_step": 98029, "epoch": 2334} {"train_loss": -6.353266716003418, "global_step": 98030, "epoch": 2334} {"train_loss": -6.384682655334473, "global_step": 98031, "epoch": 2334} {"train_loss": -6.384346008300781, "global_step": 98032, "epoch": 2334} {"train_loss": -6.362658500671387, "global_step": 98033, "epoch": 2334} {"train_loss": -6.3219404220581055, "global_step": 98034, "epoch": 2334} {"train_loss": -6.272533416748047, "global_step": 98035, "epoch": 2334} {"train_loss": -6.239492416381836, "global_step": 98036, "epoch": 2334} {"train_loss": -6.356415271759033, "global_step": 98037, "epoch": 2334} {"train_loss": -6.370866775512695, "global_step": 98038, "epoch": 2334} {"train_loss": -6.260114669799805, "global_step": 98039, "epoch": 2334} {"train_loss": -6.265785217285156, "global_step": 98040, "epoch": 2334} {"train_loss": -6.393585205078125, "global_step": 98041, "epoch": 2334} {"train_loss": -6.29946231842041, "global_step": 98042, "epoch": 2334} {"train_loss": -6.253881454467773, "global_step": 98043, "epoch": 2334} {"train_loss": -6.45408821105957, "global_step": 98044, "epoch": 2334} {"train_loss": -6.300029754638672, "global_step": 98045, "epoch": 2334} {"train_loss": -6.425583839416504, "global_step": 98046, "epoch": 2334} {"train_loss": -6.432419776916504, "global_step": 98047, "epoch": 2334} {"train_loss": -6.317609786987305, "global_step": 98048, "epoch": 2334} {"train_loss": -6.385821342468262, "global_step": 98049, "epoch": 2334} {"train_loss": -6.371186256408691, "global_step": 98050, "epoch": 2334} {"train_loss": -6.355914115905762, "global_step": 98051, "epoch": 2334} {"train_loss": -6.481242656707764, "global_step": 98052, "epoch": 2334} {"train_loss": -6.210966110229492, "global_step": 98053, "epoch": 2334} {"train_loss": -6.245868682861328, "global_step": 98054, "epoch": 2334} {"train_loss": -6.297147750854492, "global_step": 98055, "epoch": 2334} {"train_loss": -6.313436985015869, "global_step": 98056, "epoch": 2334} {"train_loss": -6.288212299346924, "global_step": 98057, "epoch": 2334} {"train_loss": -6.422999858856201, "global_step": 98058, "epoch": 2334} {"train_loss": -6.3516998291015625, "global_step": 98059, "epoch": 2334} {"train_loss": -6.524753093719482, "global_step": 98060, "epoch": 2334} {"train_loss": -6.3908371925354, "global_step": 98061, "epoch": 2334} {"train_loss": -6.365616798400879, "global_step": 98062, "epoch": 2334} {"train_loss": -6.242386341094971, "global_step": 98063, "epoch": 2334} {"train_loss": -6.361102104187012, "global_step": 98064, "epoch": 2334} {"train_loss": -6.385610580444336, "global_step": 98065, "epoch": 2334} {"train_loss": -6.315722465515137, "global_step": 98066, "epoch": 2334} {"train_loss": -6.342371940612793, "global_step": 98067, "epoch": 2334} {"train_loss": -6.322535037994385, "global_step": 98068, "epoch": 2334} {"train_loss": -6.348065784999302, "global_step": 98069, "epoch": 2334, "val_loss": 63889.43359375} {"train_loss": -6.281528472900391, "global_step": 98070, "epoch": 2335} {"train_loss": -6.276092529296875, "global_step": 98071, "epoch": 2335} {"train_loss": -6.321439266204834, "global_step": 98072, "epoch": 2335} {"train_loss": -6.373290061950684, "global_step": 98073, "epoch": 2335} {"train_loss": -6.422410011291504, "global_step": 98074, "epoch": 2335} {"train_loss": -6.354963779449463, "global_step": 98075, "epoch": 2335} {"train_loss": -6.443626880645752, "global_step": 98076, "epoch": 2335} {"train_loss": -6.495197772979736, "global_step": 98077, "epoch": 2335} {"train_loss": -6.404683589935303, "global_step": 98078, "epoch": 2335} {"train_loss": -6.341287612915039, "global_step": 98079, "epoch": 2335} {"train_loss": -6.313671112060547, "global_step": 98080, "epoch": 2335} {"train_loss": -6.391347885131836, "global_step": 98081, "epoch": 2335} {"train_loss": -6.439806938171387, "global_step": 98082, "epoch": 2335} {"train_loss": -6.437005043029785, "global_step": 98083, "epoch": 2335} {"train_loss": -6.263727188110352, "global_step": 98084, "epoch": 2335} {"train_loss": -6.2561445236206055, "global_step": 98085, "epoch": 2335} {"train_loss": -6.424610614776611, "global_step": 98086, "epoch": 2335} {"train_loss": -6.324626445770264, "global_step": 98087, "epoch": 2335} {"train_loss": -6.467221736907959, "global_step": 98088, "epoch": 2335} {"train_loss": -6.452737808227539, "global_step": 98089, "epoch": 2335} {"train_loss": -6.3388824462890625, "global_step": 98090, "epoch": 2335} {"train_loss": -6.309983253479004, "global_step": 98091, "epoch": 2335} {"train_loss": -6.347965717315674, "global_step": 98092, "epoch": 2335} {"train_loss": -6.361983299255371, "global_step": 98093, "epoch": 2335} {"train_loss": -6.333359718322754, "global_step": 98094, "epoch": 2335} {"train_loss": -6.322537422180176, "global_step": 98095, "epoch": 2335} {"train_loss": -6.400723457336426, "global_step": 98096, "epoch": 2335} {"train_loss": -6.414505958557129, "global_step": 98097, "epoch": 2335} {"train_loss": -6.4212236404418945, "global_step": 98098, "epoch": 2335} {"train_loss": -6.344094276428223, "global_step": 98099, "epoch": 2335} {"train_loss": -6.368730545043945, "global_step": 98100, "epoch": 2335} {"train_loss": -6.318142890930176, "global_step": 98101, "epoch": 2335} {"train_loss": -6.4040021896362305, "global_step": 98102, "epoch": 2335} {"train_loss": -6.328426837921143, "global_step": 98103, "epoch": 2335} {"train_loss": -6.272275447845459, "global_step": 98104, "epoch": 2335} {"train_loss": -6.32759952545166, "global_step": 98105, "epoch": 2335} {"train_loss": -6.286379814147949, "global_step": 98106, "epoch": 2335} {"train_loss": -6.3427886962890625, "global_step": 98107, "epoch": 2335} {"train_loss": -6.301596164703369, "global_step": 98108, "epoch": 2335} {"train_loss": -6.338128089904785, "global_step": 98109, "epoch": 2335} {"train_loss": -6.258485794067383, "global_step": 98110, "epoch": 2335} {"train_loss": -6.356924079713368, "global_step": 98111, "epoch": 2335, "val_loss": 64228.0546875} {"train_loss": -6.4118757247924805, "global_step": 98112, "epoch": 2336} {"train_loss": -6.364844799041748, "global_step": 98113, "epoch": 2336} {"train_loss": -6.332832336425781, "global_step": 98114, "epoch": 2336} {"train_loss": -6.183104991912842, "global_step": 98115, "epoch": 2336} {"train_loss": -6.458316802978516, "global_step": 98116, "epoch": 2336} {"train_loss": -6.325325965881348, "global_step": 98117, "epoch": 2336} {"train_loss": -6.329939842224121, "global_step": 98118, "epoch": 2336} {"train_loss": -6.3811235427856445, "global_step": 98119, "epoch": 2336} {"train_loss": -6.251288414001465, "global_step": 98120, "epoch": 2336} {"train_loss": -6.455974578857422, "global_step": 98121, "epoch": 2336} {"train_loss": -6.219383239746094, "global_step": 98122, "epoch": 2336} {"train_loss": -6.308196067810059, "global_step": 98123, "epoch": 2336} {"train_loss": -6.444216728210449, "global_step": 98124, "epoch": 2336} {"train_loss": -6.32396125793457, "global_step": 98125, "epoch": 2336} {"train_loss": -6.275799751281738, "global_step": 98126, "epoch": 2336} {"train_loss": -6.328645706176758, "global_step": 98127, "epoch": 2336} {"train_loss": -6.127122402191162, "global_step": 98128, "epoch": 2336} {"train_loss": -6.216727256774902, "global_step": 98129, "epoch": 2336} {"train_loss": -6.3998188972473145, "global_step": 98130, "epoch": 2336} {"train_loss": -6.287265777587891, "global_step": 98131, "epoch": 2336} {"train_loss": -6.323022842407227, "global_step": 98132, "epoch": 2336} {"train_loss": -6.25286865234375, "global_step": 98133, "epoch": 2336} {"train_loss": -6.4405975341796875, "global_step": 98134, "epoch": 2336} {"train_loss": -6.39525032043457, "global_step": 98135, "epoch": 2336} {"train_loss": -6.3194122314453125, "global_step": 98136, "epoch": 2336} {"train_loss": -6.360594749450684, "global_step": 98137, "epoch": 2336} {"train_loss": -6.23928689956665, "global_step": 98138, "epoch": 2336} {"train_loss": -6.4425249099731445, "global_step": 98139, "epoch": 2336} {"train_loss": -6.355316638946533, "global_step": 98140, "epoch": 2336} {"train_loss": -6.429089546203613, "global_step": 98141, "epoch": 2336} {"train_loss": -6.393479347229004, "global_step": 98142, "epoch": 2336} {"train_loss": -6.357822418212891, "global_step": 98143, "epoch": 2336} {"train_loss": -6.368659019470215, "global_step": 98144, "epoch": 2336} {"train_loss": -6.365134239196777, "global_step": 98145, "epoch": 2336} {"train_loss": -6.232036113739014, "global_step": 98146, "epoch": 2336} {"train_loss": -6.438838005065918, "global_step": 98147, "epoch": 2336} {"train_loss": -6.366003036499023, "global_step": 98148, "epoch": 2336} {"train_loss": -6.356661796569824, "global_step": 98149, "epoch": 2336} {"train_loss": -6.373632431030273, "global_step": 98150, "epoch": 2336} {"train_loss": -6.282681465148926, "global_step": 98151, "epoch": 2336} {"train_loss": -6.359896659851074, "global_step": 98152, "epoch": 2336} {"train_loss": -6.339203414462862, "global_step": 98153, "epoch": 2336, "val_loss": 64008.140625} {"train_loss": -6.372973442077637, "global_step": 98154, "epoch": 2337} {"train_loss": -6.312295913696289, "global_step": 98155, "epoch": 2337} {"train_loss": -6.526541709899902, "global_step": 98156, "epoch": 2337} {"train_loss": -6.390917778015137, "global_step": 98157, "epoch": 2337} {"train_loss": -6.362783432006836, "global_step": 98158, "epoch": 2337} {"train_loss": -6.374680042266846, "global_step": 98159, "epoch": 2337} {"train_loss": -6.344959259033203, "global_step": 98160, "epoch": 2337} {"train_loss": -6.33304500579834, "global_step": 98161, "epoch": 2337} {"train_loss": -6.370851516723633, "global_step": 98162, "epoch": 2337} {"train_loss": -6.261015892028809, "global_step": 98163, "epoch": 2337} {"train_loss": -6.452172756195068, "global_step": 98164, "epoch": 2337} {"train_loss": -6.31194543838501, "global_step": 98165, "epoch": 2337} {"train_loss": -6.345637321472168, "global_step": 98166, "epoch": 2337} {"train_loss": -6.200098991394043, "global_step": 98167, "epoch": 2337} {"train_loss": -6.332571029663086, "global_step": 98168, "epoch": 2337} {"train_loss": -6.299139022827148, "global_step": 98169, "epoch": 2337} {"train_loss": -6.200203895568848, "global_step": 98170, "epoch": 2337} {"train_loss": -6.31758451461792, "global_step": 98171, "epoch": 2337} {"train_loss": -6.433620452880859, "global_step": 98172, "epoch": 2337} {"train_loss": -6.406171798706055, "global_step": 98173, "epoch": 2337} {"train_loss": -6.406477928161621, "global_step": 98174, "epoch": 2337} {"train_loss": -6.394488334655762, "global_step": 98175, "epoch": 2337} {"train_loss": -6.29788875579834, "global_step": 98176, "epoch": 2337} {"train_loss": -6.275055885314941, "global_step": 98177, "epoch": 2337} {"train_loss": -6.363862037658691, "global_step": 98178, "epoch": 2337} {"train_loss": -6.458599090576172, "global_step": 98179, "epoch": 2337} {"train_loss": -6.250419616699219, "global_step": 98180, "epoch": 2337} {"train_loss": -6.362561225891113, "global_step": 98181, "epoch": 2337} {"train_loss": -6.189050674438477, "global_step": 98182, "epoch": 2337} {"train_loss": -6.385468482971191, "global_step": 98183, "epoch": 2337} {"train_loss": -6.302000045776367, "global_step": 98184, "epoch": 2337} {"train_loss": -6.278205394744873, "global_step": 98185, "epoch": 2337} {"train_loss": -6.483983516693115, "global_step": 98186, "epoch": 2337} {"train_loss": -6.229654312133789, "global_step": 98187, "epoch": 2337} {"train_loss": -6.39811897277832, "global_step": 98188, "epoch": 2337} {"train_loss": -6.37306022644043, "global_step": 98189, "epoch": 2337} {"train_loss": -6.342177867889404, "global_step": 98190, "epoch": 2337} {"train_loss": -6.414239883422852, "global_step": 98191, "epoch": 2337} {"train_loss": -6.334558963775635, "global_step": 98192, "epoch": 2337} {"train_loss": -6.394900321960449, "global_step": 98193, "epoch": 2337} {"train_loss": -6.432931423187256, "global_step": 98194, "epoch": 2337} {"train_loss": -6.347007365453811, "global_step": 98195, "epoch": 2337, "val_loss": 63892.0625} {"train_loss": -6.339851379394531, "global_step": 98196, "epoch": 2338} {"train_loss": -6.373252868652344, "global_step": 98197, "epoch": 2338} {"train_loss": -6.344047546386719, "global_step": 98198, "epoch": 2338} {"train_loss": -6.324355125427246, "global_step": 98199, "epoch": 2338} {"train_loss": -6.367447376251221, "global_step": 98200, "epoch": 2338} {"train_loss": -6.371420860290527, "global_step": 98201, "epoch": 2338} {"train_loss": -6.245677471160889, "global_step": 98202, "epoch": 2338} {"train_loss": -6.371711730957031, "global_step": 98203, "epoch": 2338} {"train_loss": -6.2582011222839355, "global_step": 98204, "epoch": 2338} {"train_loss": -6.311408042907715, "global_step": 98205, "epoch": 2338} {"train_loss": -6.365773677825928, "global_step": 98206, "epoch": 2338} {"train_loss": -6.331523418426514, "global_step": 98207, "epoch": 2338} {"train_loss": -6.417677879333496, "global_step": 98208, "epoch": 2338} {"train_loss": -6.319691181182861, "global_step": 98209, "epoch": 2338} {"train_loss": -6.253380298614502, "global_step": 98210, "epoch": 2338} {"train_loss": -6.331099510192871, "global_step": 98211, "epoch": 2338} {"train_loss": -6.391998291015625, "global_step": 98212, "epoch": 2338} {"train_loss": -6.4561767578125, "global_step": 98213, "epoch": 2338} {"train_loss": -6.360113143920898, "global_step": 98214, "epoch": 2338} {"train_loss": -6.367142677307129, "global_step": 98215, "epoch": 2338} {"train_loss": -6.3714599609375, "global_step": 98216, "epoch": 2338} {"train_loss": -6.332950592041016, "global_step": 98217, "epoch": 2338} {"train_loss": -6.27424430847168, "global_step": 98218, "epoch": 2338} {"train_loss": -6.273549556732178, "global_step": 98219, "epoch": 2338} {"train_loss": -6.41121768951416, "global_step": 98220, "epoch": 2338} {"train_loss": -6.363338470458984, "global_step": 98221, "epoch": 2338} {"train_loss": -6.518560409545898, "global_step": 98222, "epoch": 2338} {"train_loss": -6.379030227661133, "global_step": 98223, "epoch": 2338} {"train_loss": -6.454878807067871, "global_step": 98224, "epoch": 2338} {"train_loss": -6.405313968658447, "global_step": 98225, "epoch": 2338} {"train_loss": -6.400226593017578, "global_step": 98226, "epoch": 2338} {"train_loss": -6.3600544929504395, "global_step": 98227, "epoch": 2338} {"train_loss": -6.402190208435059, "global_step": 98228, "epoch": 2338} {"train_loss": -6.291010856628418, "global_step": 98229, "epoch": 2338} {"train_loss": -6.420557022094727, "global_step": 98230, "epoch": 2338} {"train_loss": -6.304143905639648, "global_step": 98231, "epoch": 2338} {"train_loss": -6.333372116088867, "global_step": 98232, "epoch": 2338} {"train_loss": -6.491795063018799, "global_step": 98233, "epoch": 2338} {"train_loss": -6.255338191986084, "global_step": 98234, "epoch": 2338} {"train_loss": -6.397099494934082, "global_step": 98235, "epoch": 2338} {"train_loss": -6.289265155792236, "global_step": 98236, "epoch": 2338} {"train_loss": -6.359574283872332, "global_step": 98237, "epoch": 2338, "val_loss": 63913.8828125} {"train_loss": -6.332399368286133, "global_step": 98238, "epoch": 2339} {"train_loss": -6.2483344078063965, "global_step": 98239, "epoch": 2339} {"train_loss": -6.3342390060424805, "global_step": 98240, "epoch": 2339} {"train_loss": -6.298543930053711, "global_step": 98241, "epoch": 2339} {"train_loss": -6.4281840324401855, "global_step": 98242, "epoch": 2339} {"train_loss": -6.360223293304443, "global_step": 98243, "epoch": 2339} {"train_loss": -6.434232711791992, "global_step": 98244, "epoch": 2339} {"train_loss": -6.348575592041016, "global_step": 98245, "epoch": 2339} {"train_loss": -6.356983184814453, "global_step": 98246, "epoch": 2339} {"train_loss": -6.345474720001221, "global_step": 98247, "epoch": 2339} {"train_loss": -6.428210735321045, "global_step": 98248, "epoch": 2339} {"train_loss": -6.477701187133789, "global_step": 98249, "epoch": 2339} {"train_loss": -6.3726725578308105, "global_step": 98250, "epoch": 2339} {"train_loss": -6.327938079833984, "global_step": 98251, "epoch": 2339} {"train_loss": -6.389111518859863, "global_step": 98252, "epoch": 2339} {"train_loss": -6.485038757324219, "global_step": 98253, "epoch": 2339} {"train_loss": -6.292054176330566, "global_step": 98254, "epoch": 2339} {"train_loss": -6.399076461791992, "global_step": 98255, "epoch": 2339} {"train_loss": -6.338212490081787, "global_step": 98256, "epoch": 2339} {"train_loss": -6.369937419891357, "global_step": 98257, "epoch": 2339} {"train_loss": -6.322689056396484, "global_step": 98258, "epoch": 2339} {"train_loss": -6.506734848022461, "global_step": 98259, "epoch": 2339} {"train_loss": -6.298614501953125, "global_step": 98260, "epoch": 2339} {"train_loss": -6.328279495239258, "global_step": 98261, "epoch": 2339} {"train_loss": -6.236346244812012, "global_step": 98262, "epoch": 2339} {"train_loss": -6.282670021057129, "global_step": 98263, "epoch": 2339} {"train_loss": -6.305739879608154, "global_step": 98264, "epoch": 2339} {"train_loss": -6.392431735992432, "global_step": 98265, "epoch": 2339} {"train_loss": -6.346747398376465, "global_step": 98266, "epoch": 2339} {"train_loss": -6.503192901611328, "global_step": 98267, "epoch": 2339} {"train_loss": -6.352762222290039, "global_step": 98268, "epoch": 2339} {"train_loss": -6.306037902832031, "global_step": 98269, "epoch": 2339} {"train_loss": -6.264171123504639, "global_step": 98270, "epoch": 2339} {"train_loss": -6.308006286621094, "global_step": 98271, "epoch": 2339} {"train_loss": -6.432175636291504, "global_step": 98272, "epoch": 2339} {"train_loss": -6.295815467834473, "global_step": 98273, "epoch": 2339} {"train_loss": -6.358136177062988, "global_step": 98274, "epoch": 2339} {"train_loss": -6.400646209716797, "global_step": 98275, "epoch": 2339} {"train_loss": -6.337390899658203, "global_step": 98276, "epoch": 2339} {"train_loss": -6.40020751953125, "global_step": 98277, "epoch": 2339} {"train_loss": -6.3845624923706055, "global_step": 98278, "epoch": 2339} {"train_loss": -6.358624878383818, "global_step": 98279, "epoch": 2339, "val_loss": 63917.64453125} {"train_loss": -6.44330358505249, "global_step": 98280, "epoch": 2340} {"train_loss": -6.348890781402588, "global_step": 98281, "epoch": 2340} {"train_loss": -6.389229774475098, "global_step": 98282, "epoch": 2340} {"train_loss": -6.398358345031738, "global_step": 98283, "epoch": 2340} {"train_loss": -6.418855667114258, "global_step": 98284, "epoch": 2340} {"train_loss": -6.426632881164551, "global_step": 98285, "epoch": 2340} {"train_loss": -6.465057373046875, "global_step": 98286, "epoch": 2340} {"train_loss": -6.311822414398193, "global_step": 98287, "epoch": 2340} {"train_loss": -6.347841262817383, "global_step": 98288, "epoch": 2340} {"train_loss": -6.342731475830078, "global_step": 98289, "epoch": 2340} {"train_loss": -6.310866832733154, "global_step": 98290, "epoch": 2340} {"train_loss": -6.420332908630371, "global_step": 98291, "epoch": 2340} {"train_loss": -6.3183746337890625, "global_step": 98292, "epoch": 2340} {"train_loss": -6.266543388366699, "global_step": 98293, "epoch": 2340} {"train_loss": -6.330038070678711, "global_step": 98294, "epoch": 2340} {"train_loss": -6.42484188079834, "global_step": 98295, "epoch": 2340} {"train_loss": -6.364105224609375, "global_step": 98296, "epoch": 2340} {"train_loss": -6.357450485229492, "global_step": 98297, "epoch": 2340} {"train_loss": -6.277589321136475, "global_step": 98298, "epoch": 2340} {"train_loss": -6.3753252029418945, "global_step": 98299, "epoch": 2340} {"train_loss": -6.307530403137207, "global_step": 98300, "epoch": 2340} {"train_loss": -6.349570274353027, "global_step": 98301, "epoch": 2340} {"train_loss": -6.406910419464111, "global_step": 98302, "epoch": 2340} {"train_loss": -6.357611656188965, "global_step": 98303, "epoch": 2340} {"train_loss": -6.222813129425049, "global_step": 98304, "epoch": 2340} {"train_loss": -6.465303421020508, "global_step": 98305, "epoch": 2340} {"train_loss": -6.348583221435547, "global_step": 98306, "epoch": 2340} {"train_loss": -6.26975679397583, "global_step": 98307, "epoch": 2340} {"train_loss": -6.2214860916137695, "global_step": 98308, "epoch": 2340} {"train_loss": -6.265013694763184, "global_step": 98309, "epoch": 2340} {"train_loss": -6.335223197937012, "global_step": 98310, "epoch": 2340} {"train_loss": -6.217893600463867, "global_step": 98311, "epoch": 2340} {"train_loss": -6.392733573913574, "global_step": 98312, "epoch": 2340} {"train_loss": -6.288829803466797, "global_step": 98313, "epoch": 2340} {"train_loss": -6.145434379577637, "global_step": 98314, "epoch": 2340} {"train_loss": -6.364715576171875, "global_step": 98315, "epoch": 2340} {"train_loss": -6.236985683441162, "global_step": 98316, "epoch": 2340} {"train_loss": -6.305806636810303, "global_step": 98317, "epoch": 2340} {"train_loss": -6.317392349243164, "global_step": 98318, "epoch": 2340} {"train_loss": -6.319338321685791, "global_step": 98319, "epoch": 2340} {"train_loss": -6.3462114334106445, "global_step": 98320, "epoch": 2340} {"train_loss": -6.337751956213088, "global_step": 98321, "epoch": 2340, "val_loss": 64062.046875} {"train_loss": -6.321684837341309, "global_step": 98322, "epoch": 2341} {"train_loss": -6.289935111999512, "global_step": 98323, "epoch": 2341} {"train_loss": -6.387773513793945, "global_step": 98324, "epoch": 2341} {"train_loss": -6.473255157470703, "global_step": 98325, "epoch": 2341} {"train_loss": -6.308732986450195, "global_step": 98326, "epoch": 2341} {"train_loss": -6.463150978088379, "global_step": 98327, "epoch": 2341} {"train_loss": -6.290993690490723, "global_step": 98328, "epoch": 2341} {"train_loss": -6.3463287353515625, "global_step": 98329, "epoch": 2341} {"train_loss": -6.2229509353637695, "global_step": 98330, "epoch": 2341} {"train_loss": -6.279574871063232, "global_step": 98331, "epoch": 2341} {"train_loss": -6.316481590270996, "global_step": 98332, "epoch": 2341} {"train_loss": -6.26704216003418, "global_step": 98333, "epoch": 2341} {"train_loss": -6.245741367340088, "global_step": 98334, "epoch": 2341} {"train_loss": -6.378827095031738, "global_step": 98335, "epoch": 2341} {"train_loss": -6.270451068878174, "global_step": 98336, "epoch": 2341} {"train_loss": -6.257927894592285, "global_step": 98337, "epoch": 2341} {"train_loss": -6.3676676750183105, "global_step": 98338, "epoch": 2341} {"train_loss": -6.2952985763549805, "global_step": 98339, "epoch": 2341} {"train_loss": -6.372019290924072, "global_step": 98340, "epoch": 2341} {"train_loss": -6.379950523376465, "global_step": 98341, "epoch": 2341} {"train_loss": -6.5015082359313965, "global_step": 98342, "epoch": 2341} {"train_loss": -6.27453088760376, "global_step": 98343, "epoch": 2341} {"train_loss": -6.328315734863281, "global_step": 98344, "epoch": 2341} {"train_loss": -6.286659240722656, "global_step": 98345, "epoch": 2341} {"train_loss": -6.343742370605469, "global_step": 98346, "epoch": 2341} {"train_loss": -6.408401012420654, "global_step": 98347, "epoch": 2341} {"train_loss": -6.340577125549316, "global_step": 98348, "epoch": 2341} {"train_loss": -6.323245048522949, "global_step": 98349, "epoch": 2341} {"train_loss": -6.488279819488525, "global_step": 98350, "epoch": 2341} {"train_loss": -6.36810827255249, "global_step": 98351, "epoch": 2341} {"train_loss": -6.274257183074951, "global_step": 98352, "epoch": 2341} {"train_loss": -6.360245227813721, "global_step": 98353, "epoch": 2341} {"train_loss": -6.353374481201172, "global_step": 98354, "epoch": 2341} {"train_loss": -6.4424824714660645, "global_step": 98355, "epoch": 2341} {"train_loss": -6.400187969207764, "global_step": 98356, "epoch": 2341} {"train_loss": -6.377687454223633, "global_step": 98357, "epoch": 2341} {"train_loss": -6.386687755584717, "global_step": 98358, "epoch": 2341} {"train_loss": -6.3635969161987305, "global_step": 98359, "epoch": 2341} {"train_loss": -6.453657150268555, "global_step": 98360, "epoch": 2341} {"train_loss": -6.440604209899902, "global_step": 98361, "epoch": 2341} {"train_loss": -6.278120994567871, "global_step": 98362, "epoch": 2341} {"train_loss": -6.349930967603411, "global_step": 98363, "epoch": 2341, "val_loss": 63977.1328125} {"train_loss": -6.336524486541748, "global_step": 98364, "epoch": 2342} {"train_loss": -6.3035807609558105, "global_step": 98365, "epoch": 2342} {"train_loss": -6.348308563232422, "global_step": 98366, "epoch": 2342} {"train_loss": -6.312161445617676, "global_step": 98367, "epoch": 2342} {"train_loss": -6.398075103759766, "global_step": 98368, "epoch": 2342} {"train_loss": -6.304853439331055, "global_step": 98369, "epoch": 2342} {"train_loss": -6.520171165466309, "global_step": 98370, "epoch": 2342} {"train_loss": -6.412869453430176, "global_step": 98371, "epoch": 2342} {"train_loss": -6.151520252227783, "global_step": 98372, "epoch": 2342} {"train_loss": -6.310580730438232, "global_step": 98373, "epoch": 2342} {"train_loss": -6.441289901733398, "global_step": 98374, "epoch": 2342} {"train_loss": -6.325814247131348, "global_step": 98375, "epoch": 2342} {"train_loss": -6.328641891479492, "global_step": 98376, "epoch": 2342} {"train_loss": -6.297298431396484, "global_step": 98377, "epoch": 2342} {"train_loss": -6.149314880371094, "global_step": 98378, "epoch": 2342} {"train_loss": -6.298898696899414, "global_step": 98379, "epoch": 2342} {"train_loss": -6.326502323150635, "global_step": 98380, "epoch": 2342} {"train_loss": -6.310264587402344, "global_step": 98381, "epoch": 2342} {"train_loss": -6.187069416046143, "global_step": 98382, "epoch": 2342} {"train_loss": -6.371369361877441, "global_step": 98383, "epoch": 2342} {"train_loss": -6.325356483459473, "global_step": 98384, "epoch": 2342} {"train_loss": -6.19539737701416, "global_step": 98385, "epoch": 2342} {"train_loss": -6.294912338256836, "global_step": 98386, "epoch": 2342} {"train_loss": -6.265859603881836, "global_step": 98387, "epoch": 2342} {"train_loss": -6.293696403503418, "global_step": 98388, "epoch": 2342} {"train_loss": -6.352729797363281, "global_step": 98389, "epoch": 2342} {"train_loss": -6.356696128845215, "global_step": 98390, "epoch": 2342} {"train_loss": -6.431456089019775, "global_step": 98391, "epoch": 2342} {"train_loss": -6.316022872924805, "global_step": 98392, "epoch": 2342} {"train_loss": -6.336478233337402, "global_step": 98393, "epoch": 2342} {"train_loss": -6.342196941375732, "global_step": 98394, "epoch": 2342} {"train_loss": -6.259968280792236, "global_step": 98395, "epoch": 2342} {"train_loss": -6.376832962036133, "global_step": 98396, "epoch": 2342} {"train_loss": -6.388936996459961, "global_step": 98397, "epoch": 2342} {"train_loss": -6.454287528991699, "global_step": 98398, "epoch": 2342} {"train_loss": -6.384700775146484, "global_step": 98399, "epoch": 2342} {"train_loss": -6.3039960861206055, "global_step": 98400, "epoch": 2342} {"train_loss": -6.298316478729248, "global_step": 98401, "epoch": 2342} {"train_loss": -6.32332181930542, "global_step": 98402, "epoch": 2342} {"train_loss": -6.477607727050781, "global_step": 98403, "epoch": 2342} {"train_loss": -6.439906597137451, "global_step": 98404, "epoch": 2342} {"train_loss": -6.33514454251244, "global_step": 98405, "epoch": 2342, "val_loss": 63894.09765625} {"train_loss": -6.33345890045166, "global_step": 98406, "epoch": 2343} {"train_loss": -6.360151290893555, "global_step": 98407, "epoch": 2343} {"train_loss": -6.442661762237549, "global_step": 98408, "epoch": 2343} {"train_loss": -6.49952507019043, "global_step": 98409, "epoch": 2343} {"train_loss": -6.419366359710693, "global_step": 98410, "epoch": 2343} {"train_loss": -6.410554885864258, "global_step": 98411, "epoch": 2343} {"train_loss": -6.423781871795654, "global_step": 98412, "epoch": 2343} {"train_loss": -6.480959892272949, "global_step": 98413, "epoch": 2343} {"train_loss": -6.358028411865234, "global_step": 98414, "epoch": 2343} {"train_loss": -6.317875862121582, "global_step": 98415, "epoch": 2343} {"train_loss": -6.425058364868164, "global_step": 98416, "epoch": 2343} {"train_loss": -6.388754844665527, "global_step": 98417, "epoch": 2343} {"train_loss": -6.374701023101807, "global_step": 98418, "epoch": 2343} {"train_loss": -6.380966663360596, "global_step": 98419, "epoch": 2343} {"train_loss": -6.305400371551514, "global_step": 98420, "epoch": 2343} {"train_loss": -6.403872966766357, "global_step": 98421, "epoch": 2343} {"train_loss": -6.4474334716796875, "global_step": 98422, "epoch": 2343} {"train_loss": -6.231429100036621, "global_step": 98423, "epoch": 2343} {"train_loss": -6.325320720672607, "global_step": 98424, "epoch": 2343} {"train_loss": -6.31386661529541, "global_step": 98425, "epoch": 2343} {"train_loss": -6.207009792327881, "global_step": 98426, "epoch": 2343} {"train_loss": -6.329261779785156, "global_step": 98427, "epoch": 2343} {"train_loss": -6.341439247131348, "global_step": 98428, "epoch": 2343} {"train_loss": -6.3154449462890625, "global_step": 98429, "epoch": 2343} {"train_loss": -6.350531101226807, "global_step": 98430, "epoch": 2343} {"train_loss": -6.2587785720825195, "global_step": 98431, "epoch": 2343} {"train_loss": -6.2853899002075195, "global_step": 98432, "epoch": 2343} {"train_loss": -6.310296058654785, "global_step": 98433, "epoch": 2343} {"train_loss": -6.420122146606445, "global_step": 98434, "epoch": 2343} {"train_loss": -6.355685710906982, "global_step": 98435, "epoch": 2343} {"train_loss": -6.4163103103637695, "global_step": 98436, "epoch": 2343} {"train_loss": -6.215692520141602, "global_step": 98437, "epoch": 2343} {"train_loss": -6.437878608703613, "global_step": 98438, "epoch": 2343} {"train_loss": -6.294795989990234, "global_step": 98439, "epoch": 2343} {"train_loss": -6.314064979553223, "global_step": 98440, "epoch": 2343} {"train_loss": -6.486423492431641, "global_step": 98441, "epoch": 2343} {"train_loss": -6.26377010345459, "global_step": 98442, "epoch": 2343} {"train_loss": -6.32970666885376, "global_step": 98443, "epoch": 2343} {"train_loss": -6.42604923248291, "global_step": 98444, "epoch": 2343} {"train_loss": -6.395337104797363, "global_step": 98445, "epoch": 2343} {"train_loss": -6.2584381103515625, "global_step": 98446, "epoch": 2343} {"train_loss": -6.358122541790917, "global_step": 98447, "epoch": 2343, "val_loss": 63768.0078125} {"train_loss": -6.347145080566406, "global_step": 98448, "epoch": 2344} {"train_loss": -6.315917015075684, "global_step": 98449, "epoch": 2344} {"train_loss": -6.489050388336182, "global_step": 98450, "epoch": 2344} {"train_loss": -6.420162200927734, "global_step": 98451, "epoch": 2344} {"train_loss": -6.386673927307129, "global_step": 98452, "epoch": 2344} {"train_loss": -6.305708885192871, "global_step": 98453, "epoch": 2344} {"train_loss": -6.507269382476807, "global_step": 98454, "epoch": 2344} {"train_loss": -6.365509986877441, "global_step": 98455, "epoch": 2344} {"train_loss": -6.352829456329346, "global_step": 98456, "epoch": 2344} {"train_loss": -6.457937717437744, "global_step": 98457, "epoch": 2344} {"train_loss": -6.331918239593506, "global_step": 98458, "epoch": 2344} {"train_loss": -6.186841011047363, "global_step": 98459, "epoch": 2344} {"train_loss": -6.479540824890137, "global_step": 98460, "epoch": 2344} {"train_loss": -6.331067085266113, "global_step": 98461, "epoch": 2344} {"train_loss": -6.493315696716309, "global_step": 98462, "epoch": 2344} {"train_loss": -6.400176525115967, "global_step": 98463, "epoch": 2344} {"train_loss": -6.38714599609375, "global_step": 98464, "epoch": 2344} {"train_loss": -6.330078601837158, "global_step": 98465, "epoch": 2344} {"train_loss": -6.452177047729492, "global_step": 98466, "epoch": 2344} {"train_loss": -6.238866329193115, "global_step": 98467, "epoch": 2344} {"train_loss": -6.399819374084473, "global_step": 98468, "epoch": 2344} {"train_loss": -6.3365254402160645, "global_step": 98469, "epoch": 2344} {"train_loss": -6.302628993988037, "global_step": 98470, "epoch": 2344} {"train_loss": -6.305314540863037, "global_step": 98471, "epoch": 2344} {"train_loss": -6.294882774353027, "global_step": 98472, "epoch": 2344} {"train_loss": -6.3758015632629395, "global_step": 98473, "epoch": 2344} {"train_loss": -6.240350723266602, "global_step": 98474, "epoch": 2344} {"train_loss": -6.321986675262451, "global_step": 98475, "epoch": 2344} {"train_loss": -6.27896785736084, "global_step": 98476, "epoch": 2344} {"train_loss": -6.267454147338867, "global_step": 98477, "epoch": 2344} {"train_loss": -6.176928520202637, "global_step": 98478, "epoch": 2344} {"train_loss": -6.348358154296875, "global_step": 98479, "epoch": 2344} {"train_loss": -6.277734756469727, "global_step": 98480, "epoch": 2344} {"train_loss": -6.310769557952881, "global_step": 98481, "epoch": 2344} {"train_loss": -6.253787517547607, "global_step": 98482, "epoch": 2344} {"train_loss": -6.304600715637207, "global_step": 98483, "epoch": 2344} {"train_loss": -6.270565509796143, "global_step": 98484, "epoch": 2344} {"train_loss": -6.379822731018066, "global_step": 98485, "epoch": 2344} {"train_loss": -6.35679817199707, "global_step": 98486, "epoch": 2344} {"train_loss": -6.281154155731201, "global_step": 98487, "epoch": 2344} {"train_loss": -6.246636390686035, "global_step": 98488, "epoch": 2344} {"train_loss": -6.33969927969433, "global_step": 98489, "epoch": 2344, "val_loss": 63847.12109375} {"train_loss": -6.217824459075928, "global_step": 98490, "epoch": 2345} {"train_loss": -6.381983757019043, "global_step": 98491, "epoch": 2345} {"train_loss": -6.239977836608887, "global_step": 98492, "epoch": 2345} {"train_loss": -6.381606101989746, "global_step": 98493, "epoch": 2345} {"train_loss": -6.256225109100342, "global_step": 98494, "epoch": 2345} {"train_loss": -6.2750773429870605, "global_step": 98495, "epoch": 2345} {"train_loss": -6.268132209777832, "global_step": 98496, "epoch": 2345} {"train_loss": -6.2812652587890625, "global_step": 98497, "epoch": 2345} {"train_loss": -6.308746814727783, "global_step": 98498, "epoch": 2345} {"train_loss": -6.329237937927246, "global_step": 98499, "epoch": 2345} {"train_loss": -6.333378791809082, "global_step": 98500, "epoch": 2345} {"train_loss": -6.378839015960693, "global_step": 98501, "epoch": 2345} {"train_loss": -6.37382698059082, "global_step": 98502, "epoch": 2345} {"train_loss": -6.293092250823975, "global_step": 98503, "epoch": 2345} {"train_loss": -6.3951520919799805, "global_step": 98504, "epoch": 2345} {"train_loss": -6.3669352531433105, "global_step": 98505, "epoch": 2345} {"train_loss": -6.441679000854492, "global_step": 98506, "epoch": 2345} {"train_loss": -6.308717727661133, "global_step": 98507, "epoch": 2345} {"train_loss": -6.420409202575684, "global_step": 98508, "epoch": 2345} {"train_loss": -6.3277587890625, "global_step": 98509, "epoch": 2345} {"train_loss": -6.344836711883545, "global_step": 98510, "epoch": 2345} {"train_loss": -6.400082111358643, "global_step": 98511, "epoch": 2345} {"train_loss": -6.278603553771973, "global_step": 98512, "epoch": 2345} {"train_loss": -6.385916709899902, "global_step": 98513, "epoch": 2345} {"train_loss": -6.4148783683776855, "global_step": 98514, "epoch": 2345} {"train_loss": -6.370023727416992, "global_step": 98515, "epoch": 2345} {"train_loss": -6.433633804321289, "global_step": 98516, "epoch": 2345} {"train_loss": -6.362203121185303, "global_step": 98517, "epoch": 2345} {"train_loss": -6.352712631225586, "global_step": 98518, "epoch": 2345} {"train_loss": -6.4033308029174805, "global_step": 98519, "epoch": 2345} {"train_loss": -6.27146053314209, "global_step": 98520, "epoch": 2345} {"train_loss": -6.282232761383057, "global_step": 98521, "epoch": 2345} {"train_loss": -6.344639301300049, "global_step": 98522, "epoch": 2345} {"train_loss": -6.338505744934082, "global_step": 98523, "epoch": 2345} {"train_loss": -6.466948509216309, "global_step": 98524, "epoch": 2345} {"train_loss": -6.260245323181152, "global_step": 98525, "epoch": 2345} {"train_loss": -6.324061393737793, "global_step": 98526, "epoch": 2345} {"train_loss": -6.221840858459473, "global_step": 98527, "epoch": 2345} {"train_loss": -6.402065277099609, "global_step": 98528, "epoch": 2345} {"train_loss": -6.428134918212891, "global_step": 98529, "epoch": 2345} {"train_loss": -6.321230888366699, "global_step": 98530, "epoch": 2345} {"train_loss": -6.341636839367094, "global_step": 98531, "epoch": 2345, "val_loss": 63902.5390625} {"train_loss": -6.33396577835083, "global_step": 98532, "epoch": 2346} {"train_loss": -6.2847580909729, "global_step": 98533, "epoch": 2346} {"train_loss": -6.34641170501709, "global_step": 98534, "epoch": 2346} {"train_loss": -6.448722839355469, "global_step": 98535, "epoch": 2346} {"train_loss": -6.310133934020996, "global_step": 98536, "epoch": 2346} {"train_loss": -6.472929000854492, "global_step": 98537, "epoch": 2346} {"train_loss": -6.3304853439331055, "global_step": 98538, "epoch": 2346} {"train_loss": -6.434930801391602, "global_step": 98539, "epoch": 2346} {"train_loss": -6.3221211433410645, "global_step": 98540, "epoch": 2346} {"train_loss": -6.38167667388916, "global_step": 98541, "epoch": 2346} {"train_loss": -6.451088905334473, "global_step": 98542, "epoch": 2346} {"train_loss": -6.328722953796387, "global_step": 98543, "epoch": 2346} {"train_loss": -6.341821193695068, "global_step": 98544, "epoch": 2346} {"train_loss": -6.273001670837402, "global_step": 98545, "epoch": 2346} {"train_loss": -6.223869323730469, "global_step": 98546, "epoch": 2346} {"train_loss": -6.214239597320557, "global_step": 98547, "epoch": 2346} {"train_loss": -6.426820755004883, "global_step": 98548, "epoch": 2346} {"train_loss": -6.187464714050293, "global_step": 98549, "epoch": 2346} {"train_loss": -6.258430004119873, "global_step": 98550, "epoch": 2346} {"train_loss": -6.147843837738037, "global_step": 98551, "epoch": 2346} {"train_loss": -6.101985931396484, "global_step": 98552, "epoch": 2346} {"train_loss": -6.118412971496582, "global_step": 98553, "epoch": 2346} {"train_loss": -6.31611442565918, "global_step": 98554, "epoch": 2346} {"train_loss": -6.279901027679443, "global_step": 98555, "epoch": 2346} {"train_loss": -6.22895622253418, "global_step": 98556, "epoch": 2346} {"train_loss": -6.2746405601501465, "global_step": 98557, "epoch": 2346} {"train_loss": -6.441804885864258, "global_step": 98558, "epoch": 2346} {"train_loss": -6.3314924240112305, "global_step": 98559, "epoch": 2346} {"train_loss": -6.227889060974121, "global_step": 98560, "epoch": 2346} {"train_loss": -6.209598541259766, "global_step": 98561, "epoch": 2346} {"train_loss": -6.266978740692139, "global_step": 98562, "epoch": 2346} {"train_loss": -6.286435127258301, "global_step": 98563, "epoch": 2346} {"train_loss": -6.401257038116455, "global_step": 98564, "epoch": 2346} {"train_loss": -6.337751388549805, "global_step": 98565, "epoch": 2346} {"train_loss": -6.256847381591797, "global_step": 98566, "epoch": 2346} {"train_loss": -6.299405097961426, "global_step": 98567, "epoch": 2346} {"train_loss": -6.4051713943481445, "global_step": 98568, "epoch": 2346} {"train_loss": -6.421773910522461, "global_step": 98569, "epoch": 2346} {"train_loss": -6.430312156677246, "global_step": 98570, "epoch": 2346} {"train_loss": -6.383949279785156, "global_step": 98571, "epoch": 2346} {"train_loss": -6.338836669921875, "global_step": 98572, "epoch": 2346} {"train_loss": -6.314557915642148, "global_step": 98573, "epoch": 2346, "val_loss": 63625.38671875} {"train_loss": -6.32835578918457, "global_step": 98574, "epoch": 2347} {"train_loss": -6.374861717224121, "global_step": 98575, "epoch": 2347} {"train_loss": -6.407693862915039, "global_step": 98576, "epoch": 2347} {"train_loss": -6.396087169647217, "global_step": 98577, "epoch": 2347} {"train_loss": -6.296957015991211, "global_step": 98578, "epoch": 2347} {"train_loss": -6.322248458862305, "global_step": 98579, "epoch": 2347} {"train_loss": -6.330286979675293, "global_step": 98580, "epoch": 2347} {"train_loss": -6.319576263427734, "global_step": 98581, "epoch": 2347} {"train_loss": -6.363428115844727, "global_step": 98582, "epoch": 2347} {"train_loss": -6.423299789428711, "global_step": 98583, "epoch": 2347} {"train_loss": -6.334776878356934, "global_step": 98584, "epoch": 2347} {"train_loss": -6.2537713050842285, "global_step": 98585, "epoch": 2347} {"train_loss": -6.328179836273193, "global_step": 98586, "epoch": 2347} {"train_loss": -6.53474235534668, "global_step": 98587, "epoch": 2347} {"train_loss": -6.412909507751465, "global_step": 98588, "epoch": 2347} {"train_loss": -6.319336891174316, "global_step": 98589, "epoch": 2347} {"train_loss": -6.489215850830078, "global_step": 98590, "epoch": 2347} {"train_loss": -6.438357353210449, "global_step": 98591, "epoch": 2347} {"train_loss": -6.43326473236084, "global_step": 98592, "epoch": 2347} {"train_loss": -6.337973594665527, "global_step": 98593, "epoch": 2347} {"train_loss": -6.4468913078308105, "global_step": 98594, "epoch": 2347} {"train_loss": -6.481192111968994, "global_step": 98595, "epoch": 2347} {"train_loss": -6.259974956512451, "global_step": 98596, "epoch": 2347} {"train_loss": -6.429640293121338, "global_step": 98597, "epoch": 2347} {"train_loss": -6.337277412414551, "global_step": 98598, "epoch": 2347} {"train_loss": -6.362237930297852, "global_step": 98599, "epoch": 2347} {"train_loss": -6.4404215812683105, "global_step": 98600, "epoch": 2347} {"train_loss": -6.3333563804626465, "global_step": 98601, "epoch": 2347} {"train_loss": -6.263369560241699, "global_step": 98602, "epoch": 2347} {"train_loss": -6.419360160827637, "global_step": 98603, "epoch": 2347} {"train_loss": -6.382570266723633, "global_step": 98604, "epoch": 2347} {"train_loss": -6.307610034942627, "global_step": 98605, "epoch": 2347} {"train_loss": -6.3854827880859375, "global_step": 98606, "epoch": 2347} {"train_loss": -6.370328426361084, "global_step": 98607, "epoch": 2347} {"train_loss": -6.336918354034424, "global_step": 98608, "epoch": 2347} {"train_loss": -6.448803901672363, "global_step": 98609, "epoch": 2347} {"train_loss": -6.4193549156188965, "global_step": 98610, "epoch": 2347} {"train_loss": -6.368572235107422, "global_step": 98611, "epoch": 2347} {"train_loss": -6.358316421508789, "global_step": 98612, "epoch": 2347} {"train_loss": -6.3373589515686035, "global_step": 98613, "epoch": 2347} {"train_loss": -6.4097771644592285, "global_step": 98614, "epoch": 2347} {"train_loss": -6.375967184702556, "global_step": 98615, "epoch": 2347, "val_loss": 63909.16796875} {"train_loss": -6.3677239418029785, "global_step": 98616, "epoch": 2348} {"train_loss": -6.374381065368652, "global_step": 98617, "epoch": 2348} {"train_loss": -6.426369667053223, "global_step": 98618, "epoch": 2348} {"train_loss": -6.444892406463623, "global_step": 98619, "epoch": 2348} {"train_loss": -6.2878570556640625, "global_step": 98620, "epoch": 2348} {"train_loss": -6.366009712219238, "global_step": 98621, "epoch": 2348} {"train_loss": -6.454597473144531, "global_step": 98622, "epoch": 2348} {"train_loss": -6.369244575500488, "global_step": 98623, "epoch": 2348} {"train_loss": -6.440976142883301, "global_step": 98624, "epoch": 2348} {"train_loss": -6.443048477172852, "global_step": 98625, "epoch": 2348} {"train_loss": -6.355774402618408, "global_step": 98626, "epoch": 2348} {"train_loss": -6.3254594802856445, "global_step": 98627, "epoch": 2348} {"train_loss": -6.329068183898926, "global_step": 98628, "epoch": 2348} {"train_loss": -6.343474388122559, "global_step": 98629, "epoch": 2348} {"train_loss": -6.450204372406006, "global_step": 98630, "epoch": 2348} {"train_loss": -6.313195705413818, "global_step": 98631, "epoch": 2348} {"train_loss": -6.360121726989746, "global_step": 98632, "epoch": 2348} {"train_loss": -6.357662200927734, "global_step": 98633, "epoch": 2348} {"train_loss": -6.271302223205566, "global_step": 98634, "epoch": 2348} {"train_loss": -6.340336799621582, "global_step": 98635, "epoch": 2348} {"train_loss": -6.389229774475098, "global_step": 98636, "epoch": 2348} {"train_loss": -6.329074382781982, "global_step": 98637, "epoch": 2348} {"train_loss": -6.437231063842773, "global_step": 98638, "epoch": 2348} {"train_loss": -6.367180824279785, "global_step": 98639, "epoch": 2348} {"train_loss": -6.329652309417725, "global_step": 98640, "epoch": 2348} {"train_loss": -6.209071159362793, "global_step": 98641, "epoch": 2348} {"train_loss": -6.357634544372559, "global_step": 98642, "epoch": 2348} {"train_loss": -6.2648820877075195, "global_step": 98643, "epoch": 2348} {"train_loss": -6.304047584533691, "global_step": 98644, "epoch": 2348} {"train_loss": -6.351505279541016, "global_step": 98645, "epoch": 2348} {"train_loss": -6.25953483581543, "global_step": 98646, "epoch": 2348} {"train_loss": -6.252763748168945, "global_step": 98647, "epoch": 2348} {"train_loss": -6.335561752319336, "global_step": 98648, "epoch": 2348} {"train_loss": -6.240400791168213, "global_step": 98649, "epoch": 2348} {"train_loss": -6.348561763763428, "global_step": 98650, "epoch": 2348} {"train_loss": -6.229227066040039, "global_step": 98651, "epoch": 2348} {"train_loss": -6.267453193664551, "global_step": 98652, "epoch": 2348} {"train_loss": -6.355197906494141, "global_step": 98653, "epoch": 2348} {"train_loss": -6.188170909881592, "global_step": 98654, "epoch": 2348} {"train_loss": -6.359126091003418, "global_step": 98655, "epoch": 2348} {"train_loss": -6.386876583099365, "global_step": 98656, "epoch": 2348} {"train_loss": -6.3392270519619895, "global_step": 98657, "epoch": 2348, "val_loss": 63817.92578125} {"train_loss": -6.3796000480651855, "global_step": 98658, "epoch": 2349} {"train_loss": -6.311288833618164, "global_step": 98659, "epoch": 2349} {"train_loss": -6.297695159912109, "global_step": 98660, "epoch": 2349} {"train_loss": -6.303858280181885, "global_step": 98661, "epoch": 2349} {"train_loss": -6.251720428466797, "global_step": 98662, "epoch": 2349} {"train_loss": -6.281132698059082, "global_step": 98663, "epoch": 2349} {"train_loss": -6.41007137298584, "global_step": 98664, "epoch": 2349} {"train_loss": -6.44512414932251, "global_step": 98665, "epoch": 2349} {"train_loss": -6.311374664306641, "global_step": 98666, "epoch": 2349} {"train_loss": -6.261399269104004, "global_step": 98667, "epoch": 2349} {"train_loss": -6.239197731018066, "global_step": 98668, "epoch": 2349} {"train_loss": -6.397188663482666, "global_step": 98669, "epoch": 2349} {"train_loss": -6.336670875549316, "global_step": 98670, "epoch": 2349} {"train_loss": -6.283527851104736, "global_step": 98671, "epoch": 2349} {"train_loss": -6.296723365783691, "global_step": 98672, "epoch": 2349} {"train_loss": -6.284820079803467, "global_step": 98673, "epoch": 2349} {"train_loss": -6.319921493530273, "global_step": 98674, "epoch": 2349} {"train_loss": -6.276787757873535, "global_step": 98675, "epoch": 2349} {"train_loss": -6.306112289428711, "global_step": 98676, "epoch": 2349} {"train_loss": -6.381072044372559, "global_step": 98677, "epoch": 2349} {"train_loss": -6.222988128662109, "global_step": 98678, "epoch": 2349} {"train_loss": -6.171164512634277, "global_step": 98679, "epoch": 2349} {"train_loss": -6.3842010498046875, "global_step": 98680, "epoch": 2349} {"train_loss": -6.206470012664795, "global_step": 98681, "epoch": 2349} {"train_loss": -6.2627058029174805, "global_step": 98682, "epoch": 2349} {"train_loss": -6.379785537719727, "global_step": 98683, "epoch": 2349} {"train_loss": -6.238219738006592, "global_step": 98684, "epoch": 2349} {"train_loss": -6.393429756164551, "global_step": 98685, "epoch": 2349} {"train_loss": -6.238696098327637, "global_step": 98686, "epoch": 2349} {"train_loss": -6.377089023590088, "global_step": 98687, "epoch": 2349} {"train_loss": -6.173595428466797, "global_step": 98688, "epoch": 2349} {"train_loss": -6.384390830993652, "global_step": 98689, "epoch": 2349} {"train_loss": -6.156678676605225, "global_step": 98690, "epoch": 2349} {"train_loss": -6.383024215698242, "global_step": 98691, "epoch": 2349} {"train_loss": -6.368165969848633, "global_step": 98692, "epoch": 2349} {"train_loss": -6.381970405578613, "global_step": 98693, "epoch": 2349} {"train_loss": -6.404081344604492, "global_step": 98694, "epoch": 2349} {"train_loss": -6.337306022644043, "global_step": 98695, "epoch": 2349} {"train_loss": -6.279313564300537, "global_step": 98696, "epoch": 2349} {"train_loss": -6.21605110168457, "global_step": 98697, "epoch": 2349} {"train_loss": -6.350905418395996, "global_step": 98698, "epoch": 2349} {"train_loss": -6.307319947651455, "global_step": 98699, "epoch": 2349, "val_loss": 63916.61328125} {"train_loss": -6.3866987228393555, "global_step": 98700, "epoch": 2350} {"train_loss": -6.328823089599609, "global_step": 98701, "epoch": 2350} {"train_loss": -6.352646827697754, "global_step": 98702, "epoch": 2350} {"train_loss": -6.257627964019775, "global_step": 98703, "epoch": 2350} {"train_loss": -6.389801025390625, "global_step": 98704, "epoch": 2350} {"train_loss": -6.422232151031494, "global_step": 98705, "epoch": 2350} {"train_loss": -6.254848480224609, "global_step": 98706, "epoch": 2350} {"train_loss": -6.2797465324401855, "global_step": 98707, "epoch": 2350} {"train_loss": -6.225369453430176, "global_step": 98708, "epoch": 2350} {"train_loss": -6.2924981117248535, "global_step": 98709, "epoch": 2350} {"train_loss": -6.28818416595459, "global_step": 98710, "epoch": 2350} {"train_loss": -6.436301231384277, "global_step": 98711, "epoch": 2350} {"train_loss": -6.31394100189209, "global_step": 98712, "epoch": 2350} {"train_loss": -6.313979148864746, "global_step": 98713, "epoch": 2350} {"train_loss": -6.432412624359131, "global_step": 98714, "epoch": 2350} {"train_loss": -6.314615726470947, "global_step": 98715, "epoch": 2350} {"train_loss": -6.418931007385254, "global_step": 98716, "epoch": 2350} {"train_loss": -6.314475059509277, "global_step": 98717, "epoch": 2350} {"train_loss": -6.279854774475098, "global_step": 98718, "epoch": 2350} {"train_loss": -6.442872047424316, "global_step": 98719, "epoch": 2350} {"train_loss": -6.372108459472656, "global_step": 98720, "epoch": 2350} {"train_loss": -6.294480800628662, "global_step": 98721, "epoch": 2350} {"train_loss": -6.375136852264404, "global_step": 98722, "epoch": 2350} {"train_loss": -6.307901382446289, "global_step": 98723, "epoch": 2350} {"train_loss": -6.332571029663086, "global_step": 98724, "epoch": 2350} {"train_loss": -6.344234466552734, "global_step": 98725, "epoch": 2350} {"train_loss": -6.370725631713867, "global_step": 98726, "epoch": 2350} {"train_loss": -6.352606773376465, "global_step": 98727, "epoch": 2350} {"train_loss": -6.269554138183594, "global_step": 98728, "epoch": 2350} {"train_loss": -6.434252738952637, "global_step": 98729, "epoch": 2350} {"train_loss": -6.300775527954102, "global_step": 98730, "epoch": 2350} {"train_loss": -6.468387603759766, "global_step": 98731, "epoch": 2350} {"train_loss": -6.279211521148682, "global_step": 98732, "epoch": 2350} {"train_loss": -6.31027889251709, "global_step": 98733, "epoch": 2350} {"train_loss": -6.229599475860596, "global_step": 98734, "epoch": 2350} {"train_loss": -6.287177085876465, "global_step": 98735, "epoch": 2350} {"train_loss": -6.229005813598633, "global_step": 98736, "epoch": 2350} {"train_loss": -6.314435005187988, "global_step": 98737, "epoch": 2350} {"train_loss": -6.409267425537109, "global_step": 98738, "epoch": 2350} {"train_loss": -6.333898544311523, "global_step": 98739, "epoch": 2350} {"train_loss": -6.262081146240234, "global_step": 98740, "epoch": 2350} {"train_loss": -6.335104397365025, "global_step": 98741, "epoch": 2350, "train/sim_max_reward_0": 0.193914672423072, "train/sim_max_reward_1": 0.7439632630563929, "train/sim_max_reward_2": 0.9686541669783005, "train/sim_max_reward_3": 0.15735980324804372, "train/sim_max_reward_4": 0.9576763024845929, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.927338929145573, "test/sim_max_reward_4300001": 0.16928462517578735, "test/sim_max_reward_4300002": 0.8198015099799528, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.7006779782822034, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.40037301221658667, "test/sim_max_reward_4300008": 0.912844107573803, "test/sim_max_reward_4300009": 0.9423169664108468, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9982945364232779, "test/sim_max_reward_4300012": 0.9195586267455202, "test/sim_max_reward_4300013": 0.4031297127386631, "test/sim_max_reward_4300014": 0.8759083879817107, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.14291828515719596, "test/sim_max_reward_4300017": 0.9109517502897604, "test/sim_max_reward_4300018": 0.4222216174280053, "test/sim_max_reward_4300019": 0.18390711570839133, "test/sim_max_reward_4300020": 0.18261138778187844, "test/sim_max_reward_4300021": 0.9842142473140859, "test/sim_max_reward_4300022": 0.9429640938098932, "test/sim_max_reward_4300023": 0.9571925560330629, "test/sim_max_reward_4300024": 1.0, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.050878423390650566, "test/sim_max_reward_4300027": 0.8769925413806963, "test/sim_max_reward_4300028": 1.0, "test/sim_max_reward_4300029": 0.8051093893997727, "test/sim_max_reward_4300030": 0.5070795155400659, "test/sim_max_reward_4300031": 0.2353773333799473, "test/sim_max_reward_4300032": 0.9398042296463133, "test/sim_max_reward_4300033": 0.8448474808412161, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.3439795876543174, "test/sim_max_reward_4300036": 0.20817863776355444, "test/sim_max_reward_4300037": 0.7944401816372717, "test/sim_max_reward_4300038": 0.8840307964953704, "test/sim_max_reward_4300039": 0.9074383424908681, "test/sim_max_reward_4300040": 0.9734370149611867, "test/sim_max_reward_4300041": 0.909692583035985, "test/sim_max_reward_4300042": 0.7061774859144526, "test/sim_max_reward_4300043": 0.1708662104293933, "test/sim_max_reward_4300044": 0.9154962679456873, "test/sim_max_reward_4300045": 0.17410012766550395, "test/sim_max_reward_4300046": 0.23559431078409557, "test/sim_max_reward_4300047": 0.10297633145125701, "test/sim_max_reward_4300048": 0.9926511183140858, "test/sim_max_reward_4300049": 0.5472377623883906, "train/mean_score": 0.5357588279254316, "test/mean_score": 0.6187745844703113, "val_loss": 64076.44921875} {"train_loss": -6.3322649002075195, "global_step": 98742, "epoch": 2351} {"train_loss": -6.345738887786865, "global_step": 98743, "epoch": 2351} {"train_loss": -6.354593276977539, "global_step": 98744, "epoch": 2351} {"train_loss": -6.35753059387207, "global_step": 98745, "epoch": 2351} {"train_loss": -6.29821252822876, "global_step": 98746, "epoch": 2351} {"train_loss": -6.320583820343018, "global_step": 98747, "epoch": 2351} {"train_loss": -6.263760566711426, "global_step": 98748, "epoch": 2351} {"train_loss": -6.344921112060547, "global_step": 98749, "epoch": 2351} {"train_loss": -6.3739728927612305, "global_step": 98750, "epoch": 2351} {"train_loss": -6.285019397735596, "global_step": 98751, "epoch": 2351} {"train_loss": -6.417126655578613, "global_step": 98752, "epoch": 2351} {"train_loss": -6.380784034729004, "global_step": 98753, "epoch": 2351} {"train_loss": -6.338230133056641, "global_step": 98754, "epoch": 2351} {"train_loss": -6.370619297027588, "global_step": 98755, "epoch": 2351} {"train_loss": -6.43516731262207, "global_step": 98756, "epoch": 2351} {"train_loss": -6.39957857131958, "global_step": 98757, "epoch": 2351} {"train_loss": -6.340395927429199, "global_step": 98758, "epoch": 2351} {"train_loss": -6.207459449768066, "global_step": 98759, "epoch": 2351} {"train_loss": -6.311868667602539, "global_step": 98760, "epoch": 2351} {"train_loss": -6.281832695007324, "global_step": 98761, "epoch": 2351} {"train_loss": -6.222453594207764, "global_step": 98762, "epoch": 2351} {"train_loss": -6.444559097290039, "global_step": 98763, "epoch": 2351} {"train_loss": -6.26072359085083, "global_step": 98764, "epoch": 2351} {"train_loss": -6.233558654785156, "global_step": 98765, "epoch": 2351} {"train_loss": -6.424164772033691, "global_step": 98766, "epoch": 2351} {"train_loss": -6.2767510414123535, "global_step": 98767, "epoch": 2351} {"train_loss": -6.350018501281738, "global_step": 98768, "epoch": 2351} {"train_loss": -6.405170440673828, "global_step": 98769, "epoch": 2351} {"train_loss": -6.3091230392456055, "global_step": 98770, "epoch": 2351} {"train_loss": -6.44785213470459, "global_step": 98771, "epoch": 2351} {"train_loss": -6.383538722991943, "global_step": 98772, "epoch": 2351} {"train_loss": -6.273077964782715, "global_step": 98773, "epoch": 2351} {"train_loss": -6.318550109863281, "global_step": 98774, "epoch": 2351} {"train_loss": -6.391807556152344, "global_step": 98775, "epoch": 2351} {"train_loss": -6.319902420043945, "global_step": 98776, "epoch": 2351} {"train_loss": -6.45773983001709, "global_step": 98777, "epoch": 2351} {"train_loss": -6.349940299987793, "global_step": 98778, "epoch": 2351} {"train_loss": -6.368101119995117, "global_step": 98779, "epoch": 2351} {"train_loss": -6.389184951782227, "global_step": 98780, "epoch": 2351} {"train_loss": -6.44241189956665, "global_step": 98781, "epoch": 2351} {"train_loss": -6.339344024658203, "global_step": 98782, "epoch": 2351} {"train_loss": -6.345463355382283, "global_step": 98783, "epoch": 2351, "val_loss": 64073.08984375} {"train_loss": -6.284177780151367, "global_step": 98784, "epoch": 2352} {"train_loss": -6.3400115966796875, "global_step": 98785, "epoch": 2352} {"train_loss": -6.255404472351074, "global_step": 98786, "epoch": 2352} {"train_loss": -6.322225570678711, "global_step": 98787, "epoch": 2352} {"train_loss": -6.363908767700195, "global_step": 98788, "epoch": 2352} {"train_loss": -6.22274112701416, "global_step": 98789, "epoch": 2352} {"train_loss": -6.350183010101318, "global_step": 98790, "epoch": 2352} {"train_loss": -6.2460808753967285, "global_step": 98791, "epoch": 2352} {"train_loss": -6.435558319091797, "global_step": 98792, "epoch": 2352} {"train_loss": -6.293398857116699, "global_step": 98793, "epoch": 2352} {"train_loss": -6.29146671295166, "global_step": 98794, "epoch": 2352} {"train_loss": -6.420476913452148, "global_step": 98795, "epoch": 2352} {"train_loss": -6.3720383644104, "global_step": 98796, "epoch": 2352} {"train_loss": -6.239648818969727, "global_step": 98797, "epoch": 2352} {"train_loss": -6.362444877624512, "global_step": 98798, "epoch": 2352} {"train_loss": -6.417873859405518, "global_step": 98799, "epoch": 2352} {"train_loss": -6.379246711730957, "global_step": 98800, "epoch": 2352} {"train_loss": -6.2439470291137695, "global_step": 98801, "epoch": 2352} {"train_loss": -6.389966011047363, "global_step": 98802, "epoch": 2352} {"train_loss": -6.305332660675049, "global_step": 98803, "epoch": 2352} {"train_loss": -6.411808013916016, "global_step": 98804, "epoch": 2352} {"train_loss": -6.324698448181152, "global_step": 98805, "epoch": 2352} {"train_loss": -6.314158916473389, "global_step": 98806, "epoch": 2352} {"train_loss": -6.369924068450928, "global_step": 98807, "epoch": 2352} {"train_loss": -6.524632930755615, "global_step": 98808, "epoch": 2352} {"train_loss": -6.354495048522949, "global_step": 98809, "epoch": 2352} {"train_loss": -6.479816913604736, "global_step": 98810, "epoch": 2352} {"train_loss": -6.308742046356201, "global_step": 98811, "epoch": 2352} {"train_loss": -6.277088165283203, "global_step": 98812, "epoch": 2352} {"train_loss": -6.441332817077637, "global_step": 98813, "epoch": 2352} {"train_loss": -6.1957621574401855, "global_step": 98814, "epoch": 2352} {"train_loss": -6.26737642288208, "global_step": 98815, "epoch": 2352} {"train_loss": -6.225627899169922, "global_step": 98816, "epoch": 2352} {"train_loss": -6.312746047973633, "global_step": 98817, "epoch": 2352} {"train_loss": -6.30340576171875, "global_step": 98818, "epoch": 2352} {"train_loss": -6.255714416503906, "global_step": 98819, "epoch": 2352} {"train_loss": -6.3582844734191895, "global_step": 98820, "epoch": 2352} {"train_loss": -6.415467262268066, "global_step": 98821, "epoch": 2352} {"train_loss": -6.334344863891602, "global_step": 98822, "epoch": 2352} {"train_loss": -6.278640270233154, "global_step": 98823, "epoch": 2352} {"train_loss": -6.240053653717041, "global_step": 98824, "epoch": 2352} {"train_loss": -6.330466860816593, "global_step": 98825, "epoch": 2352, "val_loss": 64122.53125} {"train_loss": -6.137478828430176, "global_step": 98826, "epoch": 2353} {"train_loss": -6.387099266052246, "global_step": 98827, "epoch": 2353} {"train_loss": -6.262725830078125, "global_step": 98828, "epoch": 2353} {"train_loss": -6.424554824829102, "global_step": 98829, "epoch": 2353} {"train_loss": -6.37625789642334, "global_step": 98830, "epoch": 2353} {"train_loss": -6.406213760375977, "global_step": 98831, "epoch": 2353} {"train_loss": -6.370575428009033, "global_step": 98832, "epoch": 2353} {"train_loss": -6.40777587890625, "global_step": 98833, "epoch": 2353} {"train_loss": -6.382598876953125, "global_step": 98834, "epoch": 2353} {"train_loss": -6.343480110168457, "global_step": 98835, "epoch": 2353} {"train_loss": -6.5356550216674805, "global_step": 98836, "epoch": 2353} {"train_loss": -6.322138786315918, "global_step": 98837, "epoch": 2353} {"train_loss": -6.408115386962891, "global_step": 98838, "epoch": 2353} {"train_loss": -6.299753189086914, "global_step": 98839, "epoch": 2353} {"train_loss": -6.3859710693359375, "global_step": 98840, "epoch": 2353} {"train_loss": -6.327445983886719, "global_step": 98841, "epoch": 2353} {"train_loss": -6.430030822753906, "global_step": 98842, "epoch": 2353} {"train_loss": -6.44066858291626, "global_step": 98843, "epoch": 2353} {"train_loss": -6.332518577575684, "global_step": 98844, "epoch": 2353} {"train_loss": -6.3770575523376465, "global_step": 98845, "epoch": 2353} {"train_loss": -6.350844383239746, "global_step": 98846, "epoch": 2353} {"train_loss": -6.260604381561279, "global_step": 98847, "epoch": 2353} {"train_loss": -6.358633518218994, "global_step": 98848, "epoch": 2353} {"train_loss": -6.337362766265869, "global_step": 98849, "epoch": 2353} {"train_loss": -6.4554443359375, "global_step": 98850, "epoch": 2353} {"train_loss": -6.3411545753479, "global_step": 98851, "epoch": 2353} {"train_loss": -6.448924541473389, "global_step": 98852, "epoch": 2353} {"train_loss": -6.369998931884766, "global_step": 98853, "epoch": 2353} {"train_loss": -6.365237712860107, "global_step": 98854, "epoch": 2353} {"train_loss": -6.345877647399902, "global_step": 98855, "epoch": 2353} {"train_loss": -6.239352226257324, "global_step": 98856, "epoch": 2353} {"train_loss": -6.3350958824157715, "global_step": 98857, "epoch": 2353} {"train_loss": -6.404655456542969, "global_step": 98858, "epoch": 2353} {"train_loss": -6.3180437088012695, "global_step": 98859, "epoch": 2353} {"train_loss": -6.323860168457031, "global_step": 98860, "epoch": 2353} {"train_loss": -6.293045997619629, "global_step": 98861, "epoch": 2353} {"train_loss": -6.364941596984863, "global_step": 98862, "epoch": 2353} {"train_loss": -6.12647819519043, "global_step": 98863, "epoch": 2353} {"train_loss": -6.267866611480713, "global_step": 98864, "epoch": 2353} {"train_loss": -6.312412261962891, "global_step": 98865, "epoch": 2353} {"train_loss": -6.227553367614746, "global_step": 98866, "epoch": 2353} {"train_loss": -6.348898002079555, "global_step": 98867, "epoch": 2353, "val_loss": 64031.93359375} {"train_loss": -6.271350860595703, "global_step": 98868, "epoch": 2354} {"train_loss": -6.309779167175293, "global_step": 98869, "epoch": 2354} {"train_loss": -6.312494277954102, "global_step": 98870, "epoch": 2354} {"train_loss": -6.331539630889893, "global_step": 98871, "epoch": 2354} {"train_loss": -6.374336242675781, "global_step": 98872, "epoch": 2354} {"train_loss": -6.3182783126831055, "global_step": 98873, "epoch": 2354} {"train_loss": -6.407177448272705, "global_step": 98874, "epoch": 2354} {"train_loss": -6.314366817474365, "global_step": 98875, "epoch": 2354} {"train_loss": -6.3650007247924805, "global_step": 98876, "epoch": 2354} {"train_loss": -6.316204071044922, "global_step": 98877, "epoch": 2354} {"train_loss": -6.289997100830078, "global_step": 98878, "epoch": 2354} {"train_loss": -6.218296051025391, "global_step": 98879, "epoch": 2354} {"train_loss": -6.342004776000977, "global_step": 98880, "epoch": 2354} {"train_loss": -6.322231292724609, "global_step": 98881, "epoch": 2354} {"train_loss": -6.350133895874023, "global_step": 98882, "epoch": 2354} {"train_loss": -6.449822425842285, "global_step": 98883, "epoch": 2354} {"train_loss": -6.37325382232666, "global_step": 98884, "epoch": 2354} {"train_loss": -6.2754807472229, "global_step": 98885, "epoch": 2354} {"train_loss": -6.47694206237793, "global_step": 98886, "epoch": 2354} {"train_loss": -6.310251712799072, "global_step": 98887, "epoch": 2354} {"train_loss": -6.3147687911987305, "global_step": 98888, "epoch": 2354} {"train_loss": -6.402520656585693, "global_step": 98889, "epoch": 2354} {"train_loss": -6.371413230895996, "global_step": 98890, "epoch": 2354} {"train_loss": -6.429871559143066, "global_step": 98891, "epoch": 2354} {"train_loss": -6.399822235107422, "global_step": 98892, "epoch": 2354} {"train_loss": -6.391877174377441, "global_step": 98893, "epoch": 2354} {"train_loss": -6.300512790679932, "global_step": 98894, "epoch": 2354} {"train_loss": -6.344216823577881, "global_step": 98895, "epoch": 2354} {"train_loss": -6.41873025894165, "global_step": 98896, "epoch": 2354} {"train_loss": -6.390933036804199, "global_step": 98897, "epoch": 2354} {"train_loss": -6.387042999267578, "global_step": 98898, "epoch": 2354} {"train_loss": -6.365607738494873, "global_step": 98899, "epoch": 2354} {"train_loss": -6.397745132446289, "global_step": 98900, "epoch": 2354} {"train_loss": -6.3676066398620605, "global_step": 98901, "epoch": 2354} {"train_loss": -6.295393943786621, "global_step": 98902, "epoch": 2354} {"train_loss": -6.390140533447266, "global_step": 98903, "epoch": 2354} {"train_loss": -6.39698600769043, "global_step": 98904, "epoch": 2354} {"train_loss": -6.361763954162598, "global_step": 98905, "epoch": 2354} {"train_loss": -6.260769367218018, "global_step": 98906, "epoch": 2354} {"train_loss": -6.449979782104492, "global_step": 98907, "epoch": 2354} {"train_loss": -6.396686553955078, "global_step": 98908, "epoch": 2354} {"train_loss": -6.354625361306327, "global_step": 98909, "epoch": 2354, "val_loss": 63854.29296875} {"train_loss": -6.4338507652282715, "global_step": 98910, "epoch": 2355} {"train_loss": -6.307159423828125, "global_step": 98911, "epoch": 2355} {"train_loss": -6.325362682342529, "global_step": 98912, "epoch": 2355} {"train_loss": -6.383634090423584, "global_step": 98913, "epoch": 2355} {"train_loss": -6.443855285644531, "global_step": 98914, "epoch": 2355} {"train_loss": -6.345973491668701, "global_step": 98915, "epoch": 2355} {"train_loss": -6.402810573577881, "global_step": 98916, "epoch": 2355} {"train_loss": -6.209134101867676, "global_step": 98917, "epoch": 2355} {"train_loss": -6.366897106170654, "global_step": 98918, "epoch": 2355} {"train_loss": -6.274672508239746, "global_step": 98919, "epoch": 2355} {"train_loss": -6.442587852478027, "global_step": 98920, "epoch": 2355} {"train_loss": -6.307747840881348, "global_step": 98921, "epoch": 2355} {"train_loss": -6.374248504638672, "global_step": 98922, "epoch": 2355} {"train_loss": -6.272118091583252, "global_step": 98923, "epoch": 2355} {"train_loss": -6.314148902893066, "global_step": 98924, "epoch": 2355} {"train_loss": -6.384533882141113, "global_step": 98925, "epoch": 2355} {"train_loss": -6.401088714599609, "global_step": 98926, "epoch": 2355} {"train_loss": -6.258806228637695, "global_step": 98927, "epoch": 2355} {"train_loss": -6.337839603424072, "global_step": 98928, "epoch": 2355} {"train_loss": -6.4257426261901855, "global_step": 98929, "epoch": 2355} {"train_loss": -6.419499397277832, "global_step": 98930, "epoch": 2355} {"train_loss": -6.2947797775268555, "global_step": 98931, "epoch": 2355} {"train_loss": -6.412666320800781, "global_step": 98932, "epoch": 2355} {"train_loss": -6.382943153381348, "global_step": 98933, "epoch": 2355} {"train_loss": -6.418754577636719, "global_step": 98934, "epoch": 2355} {"train_loss": -6.302803039550781, "global_step": 98935, "epoch": 2355} {"train_loss": -6.369821548461914, "global_step": 98936, "epoch": 2355} {"train_loss": -6.372387886047363, "global_step": 98937, "epoch": 2355} {"train_loss": -6.185324668884277, "global_step": 98938, "epoch": 2355} {"train_loss": -6.312893867492676, "global_step": 98939, "epoch": 2355} {"train_loss": -6.3411946296691895, "global_step": 98940, "epoch": 2355} {"train_loss": -6.340851783752441, "global_step": 98941, "epoch": 2355} {"train_loss": -6.384864807128906, "global_step": 98942, "epoch": 2355} {"train_loss": -6.207697868347168, "global_step": 98943, "epoch": 2355} {"train_loss": -6.3269500732421875, "global_step": 98944, "epoch": 2355} {"train_loss": -6.41181755065918, "global_step": 98945, "epoch": 2355} {"train_loss": -6.496433734893799, "global_step": 98946, "epoch": 2355} {"train_loss": -6.340043067932129, "global_step": 98947, "epoch": 2355} {"train_loss": -6.440585613250732, "global_step": 98948, "epoch": 2355} {"train_loss": -6.371477127075195, "global_step": 98949, "epoch": 2355} {"train_loss": -6.353725433349609, "global_step": 98950, "epoch": 2355} {"train_loss": -6.352193945930118, "global_step": 98951, "epoch": 2355, "val_loss": 63916.69921875} {"train_loss": -6.365509986877441, "global_step": 98952, "epoch": 2356} {"train_loss": -6.267183303833008, "global_step": 98953, "epoch": 2356} {"train_loss": -6.424891948699951, "global_step": 98954, "epoch": 2356} {"train_loss": -6.3944854736328125, "global_step": 98955, "epoch": 2356} {"train_loss": -6.301675796508789, "global_step": 98956, "epoch": 2356} {"train_loss": -6.218390464782715, "global_step": 98957, "epoch": 2356} {"train_loss": -6.382470607757568, "global_step": 98958, "epoch": 2356} {"train_loss": -6.294040679931641, "global_step": 98959, "epoch": 2356} {"train_loss": -6.249886512756348, "global_step": 98960, "epoch": 2356} {"train_loss": -6.416303634643555, "global_step": 98961, "epoch": 2356} {"train_loss": -6.330574989318848, "global_step": 98962, "epoch": 2356} {"train_loss": -6.340844631195068, "global_step": 98963, "epoch": 2356} {"train_loss": -6.419835567474365, "global_step": 98964, "epoch": 2356} {"train_loss": -6.235412120819092, "global_step": 98965, "epoch": 2356} {"train_loss": -6.292119979858398, "global_step": 98966, "epoch": 2356} {"train_loss": -6.426548004150391, "global_step": 98967, "epoch": 2356} {"train_loss": -6.365625858306885, "global_step": 98968, "epoch": 2356} {"train_loss": -6.227660179138184, "global_step": 98969, "epoch": 2356} {"train_loss": -6.254636287689209, "global_step": 98970, "epoch": 2356} {"train_loss": -6.391576766967773, "global_step": 98971, "epoch": 2356} {"train_loss": -6.362188339233398, "global_step": 98972, "epoch": 2356} {"train_loss": -6.393484592437744, "global_step": 98973, "epoch": 2356} {"train_loss": -6.298191070556641, "global_step": 98974, "epoch": 2356} {"train_loss": -6.372946739196777, "global_step": 98975, "epoch": 2356} {"train_loss": -6.38194465637207, "global_step": 98976, "epoch": 2356} {"train_loss": -6.424223899841309, "global_step": 98977, "epoch": 2356} {"train_loss": -6.381608009338379, "global_step": 98978, "epoch": 2356} {"train_loss": -6.454350471496582, "global_step": 98979, "epoch": 2356} {"train_loss": -6.384471893310547, "global_step": 98980, "epoch": 2356} {"train_loss": -6.330767631530762, "global_step": 98981, "epoch": 2356} {"train_loss": -6.33960485458374, "global_step": 98982, "epoch": 2356} {"train_loss": -6.3307905197143555, "global_step": 98983, "epoch": 2356} {"train_loss": -6.373098373413086, "global_step": 98984, "epoch": 2356} {"train_loss": -6.355280876159668, "global_step": 98985, "epoch": 2356} {"train_loss": -6.333745002746582, "global_step": 98986, "epoch": 2356} {"train_loss": -6.403020858764648, "global_step": 98987, "epoch": 2356} {"train_loss": -6.411240100860596, "global_step": 98988, "epoch": 2356} {"train_loss": -6.409605026245117, "global_step": 98989, "epoch": 2356} {"train_loss": -6.4468207359313965, "global_step": 98990, "epoch": 2356} {"train_loss": -6.411794185638428, "global_step": 98991, "epoch": 2356} {"train_loss": -6.404532432556152, "global_step": 98992, "epoch": 2356} {"train_loss": -6.359372116270519, "global_step": 98993, "epoch": 2356, "val_loss": 63892.18359375} {"train_loss": -6.4437456130981445, "global_step": 98994, "epoch": 2357} {"train_loss": -6.3724565505981445, "global_step": 98995, "epoch": 2357} {"train_loss": -6.426759243011475, "global_step": 98996, "epoch": 2357} {"train_loss": -6.485618591308594, "global_step": 98997, "epoch": 2357} {"train_loss": -6.320682525634766, "global_step": 98998, "epoch": 2357} {"train_loss": -6.330059051513672, "global_step": 98999, "epoch": 2357} {"train_loss": -6.287010192871094, "global_step": 99000, "epoch": 2357} {"train_loss": -6.387587070465088, "global_step": 99001, "epoch": 2357} {"train_loss": -6.437192916870117, "global_step": 99002, "epoch": 2357} {"train_loss": -6.310808181762695, "global_step": 99003, "epoch": 2357} {"train_loss": -6.458404541015625, "global_step": 99004, "epoch": 2357} {"train_loss": -6.397091865539551, "global_step": 99005, "epoch": 2357} {"train_loss": -6.390761375427246, "global_step": 99006, "epoch": 2357} {"train_loss": -6.358261585235596, "global_step": 99007, "epoch": 2357} {"train_loss": -6.349591255187988, "global_step": 99008, "epoch": 2357} {"train_loss": -6.308907508850098, "global_step": 99009, "epoch": 2357} {"train_loss": -6.410284996032715, "global_step": 99010, "epoch": 2357} {"train_loss": -6.305483818054199, "global_step": 99011, "epoch": 2357} {"train_loss": -6.193820476531982, "global_step": 99012, "epoch": 2357} {"train_loss": -6.4243621826171875, "global_step": 99013, "epoch": 2357} {"train_loss": -6.326384544372559, "global_step": 99014, "epoch": 2357} {"train_loss": -6.172699928283691, "global_step": 99015, "epoch": 2357} {"train_loss": -6.318539619445801, "global_step": 99016, "epoch": 2357} {"train_loss": -6.31667947769165, "global_step": 99017, "epoch": 2357} {"train_loss": -6.320463180541992, "global_step": 99018, "epoch": 2357} {"train_loss": -6.306756973266602, "global_step": 99019, "epoch": 2357} {"train_loss": -6.3894548416137695, "global_step": 99020, "epoch": 2357} {"train_loss": -6.267492294311523, "global_step": 99021, "epoch": 2357} {"train_loss": -6.338468551635742, "global_step": 99022, "epoch": 2357} {"train_loss": -6.372835159301758, "global_step": 99023, "epoch": 2357} {"train_loss": -6.322783470153809, "global_step": 99024, "epoch": 2357} {"train_loss": -6.283670425415039, "global_step": 99025, "epoch": 2357} {"train_loss": -6.364080429077148, "global_step": 99026, "epoch": 2357} {"train_loss": -6.35884952545166, "global_step": 99027, "epoch": 2357} {"train_loss": -6.455692291259766, "global_step": 99028, "epoch": 2357} {"train_loss": -6.4749274253845215, "global_step": 99029, "epoch": 2357} {"train_loss": -6.3831353187561035, "global_step": 99030, "epoch": 2357} {"train_loss": -6.332439422607422, "global_step": 99031, "epoch": 2357} {"train_loss": -6.318427085876465, "global_step": 99032, "epoch": 2357} {"train_loss": -6.354676246643066, "global_step": 99033, "epoch": 2357} {"train_loss": -6.414793968200684, "global_step": 99034, "epoch": 2357} {"train_loss": -6.356273469470796, "global_step": 99035, "epoch": 2357, "val_loss": 63907.6953125} {"train_loss": -6.358463764190674, "global_step": 99036, "epoch": 2358} {"train_loss": -6.413994312286377, "global_step": 99037, "epoch": 2358} {"train_loss": -6.414732933044434, "global_step": 99038, "epoch": 2358} {"train_loss": -6.416338920593262, "global_step": 99039, "epoch": 2358} {"train_loss": -6.398223876953125, "global_step": 99040, "epoch": 2358} {"train_loss": -6.34965705871582, "global_step": 99041, "epoch": 2358} {"train_loss": -6.424949645996094, "global_step": 99042, "epoch": 2358} {"train_loss": -6.341830253601074, "global_step": 99043, "epoch": 2358} {"train_loss": -6.356236457824707, "global_step": 99044, "epoch": 2358} {"train_loss": -6.397556304931641, "global_step": 99045, "epoch": 2358} {"train_loss": -6.399848937988281, "global_step": 99046, "epoch": 2358} {"train_loss": -6.377546310424805, "global_step": 99047, "epoch": 2358} {"train_loss": -6.410935878753662, "global_step": 99048, "epoch": 2358} {"train_loss": -6.364230155944824, "global_step": 99049, "epoch": 2358} {"train_loss": -6.3173723220825195, "global_step": 99050, "epoch": 2358} {"train_loss": -6.475931167602539, "global_step": 99051, "epoch": 2358} {"train_loss": -6.456804275512695, "global_step": 99052, "epoch": 2358} {"train_loss": -6.375308990478516, "global_step": 99053, "epoch": 2358} {"train_loss": -6.40982723236084, "global_step": 99054, "epoch": 2358} {"train_loss": -6.501087665557861, "global_step": 99055, "epoch": 2358} {"train_loss": -6.382763862609863, "global_step": 99056, "epoch": 2358} {"train_loss": -6.343488693237305, "global_step": 99057, "epoch": 2358} {"train_loss": -6.32210636138916, "global_step": 99058, "epoch": 2358} {"train_loss": -6.2562103271484375, "global_step": 99059, "epoch": 2358} {"train_loss": -6.255867004394531, "global_step": 99060, "epoch": 2358} {"train_loss": -6.417463302612305, "global_step": 99061, "epoch": 2358} {"train_loss": -6.324603080749512, "global_step": 99062, "epoch": 2358} {"train_loss": -6.418729782104492, "global_step": 99063, "epoch": 2358} {"train_loss": -6.279064655303955, "global_step": 99064, "epoch": 2358} {"train_loss": -6.195981025695801, "global_step": 99065, "epoch": 2358} {"train_loss": -6.284058570861816, "global_step": 99066, "epoch": 2358} {"train_loss": -6.364309787750244, "global_step": 99067, "epoch": 2358} {"train_loss": -6.416828155517578, "global_step": 99068, "epoch": 2358} {"train_loss": -6.396031379699707, "global_step": 99069, "epoch": 2358} {"train_loss": -6.292459487915039, "global_step": 99070, "epoch": 2358} {"train_loss": -6.286184787750244, "global_step": 99071, "epoch": 2358} {"train_loss": -6.385871887207031, "global_step": 99072, "epoch": 2358} {"train_loss": -6.445106506347656, "global_step": 99073, "epoch": 2358} {"train_loss": -6.344646453857422, "global_step": 99074, "epoch": 2358} {"train_loss": -6.379970550537109, "global_step": 99075, "epoch": 2358} {"train_loss": -6.381200790405273, "global_step": 99076, "epoch": 2358} {"train_loss": -6.367479574112665, "global_step": 99077, "epoch": 2358, "val_loss": 64142.6875} {"train_loss": -6.393359184265137, "global_step": 99078, "epoch": 2359} {"train_loss": -6.299964904785156, "global_step": 99079, "epoch": 2359} {"train_loss": -6.415464878082275, "global_step": 99080, "epoch": 2359} {"train_loss": -6.315190315246582, "global_step": 99081, "epoch": 2359} {"train_loss": -6.415444374084473, "global_step": 99082, "epoch": 2359} {"train_loss": -6.446769714355469, "global_step": 99083, "epoch": 2359} {"train_loss": -6.396795272827148, "global_step": 99084, "epoch": 2359} {"train_loss": -6.4410014152526855, "global_step": 99085, "epoch": 2359} {"train_loss": -6.270326137542725, "global_step": 99086, "epoch": 2359} {"train_loss": -6.4962615966796875, "global_step": 99087, "epoch": 2359} {"train_loss": -6.370432376861572, "global_step": 99088, "epoch": 2359} {"train_loss": -6.415215492248535, "global_step": 99089, "epoch": 2359} {"train_loss": -6.377263069152832, "global_step": 99090, "epoch": 2359} {"train_loss": -6.385228633880615, "global_step": 99091, "epoch": 2359} {"train_loss": -6.444808483123779, "global_step": 99092, "epoch": 2359} {"train_loss": -6.258424758911133, "global_step": 99093, "epoch": 2359} {"train_loss": -6.4106035232543945, "global_step": 99094, "epoch": 2359} {"train_loss": -6.365194797515869, "global_step": 99095, "epoch": 2359} {"train_loss": -6.371612548828125, "global_step": 99096, "epoch": 2359} {"train_loss": -6.372045516967773, "global_step": 99097, "epoch": 2359} {"train_loss": -6.400202751159668, "global_step": 99098, "epoch": 2359} {"train_loss": -6.415563583374023, "global_step": 99099, "epoch": 2359} {"train_loss": -6.335465431213379, "global_step": 99100, "epoch": 2359} {"train_loss": -6.342698574066162, "global_step": 99101, "epoch": 2359} {"train_loss": -6.470288276672363, "global_step": 99102, "epoch": 2359} {"train_loss": -6.4428253173828125, "global_step": 99103, "epoch": 2359} {"train_loss": -6.246051788330078, "global_step": 99104, "epoch": 2359} {"train_loss": -6.208324909210205, "global_step": 99105, "epoch": 2359} {"train_loss": -6.285490989685059, "global_step": 99106, "epoch": 2359} {"train_loss": -6.375477313995361, "global_step": 99107, "epoch": 2359} {"train_loss": -6.382672309875488, "global_step": 99108, "epoch": 2359} {"train_loss": -6.4558000564575195, "global_step": 99109, "epoch": 2359} {"train_loss": -6.470828533172607, "global_step": 99110, "epoch": 2359} {"train_loss": -6.321560859680176, "global_step": 99111, "epoch": 2359} {"train_loss": -6.36698579788208, "global_step": 99112, "epoch": 2359} {"train_loss": -6.390614032745361, "global_step": 99113, "epoch": 2359} {"train_loss": -6.2214508056640625, "global_step": 99114, "epoch": 2359} {"train_loss": -6.350948333740234, "global_step": 99115, "epoch": 2359} {"train_loss": -6.259025573730469, "global_step": 99116, "epoch": 2359} {"train_loss": -6.3719482421875, "global_step": 99117, "epoch": 2359} {"train_loss": -6.381424427032471, "global_step": 99118, "epoch": 2359} {"train_loss": -6.370600552785964, "global_step": 99119, "epoch": 2359, "val_loss": 64043.2265625} {"train_loss": -6.458600044250488, "global_step": 99120, "epoch": 2360} {"train_loss": -6.446495532989502, "global_step": 99121, "epoch": 2360} {"train_loss": -6.355280876159668, "global_step": 99122, "epoch": 2360} {"train_loss": -6.360994338989258, "global_step": 99123, "epoch": 2360} {"train_loss": -6.359300136566162, "global_step": 99124, "epoch": 2360} {"train_loss": -6.444587707519531, "global_step": 99125, "epoch": 2360} {"train_loss": -6.340427398681641, "global_step": 99126, "epoch": 2360} {"train_loss": -6.407855987548828, "global_step": 99127, "epoch": 2360} {"train_loss": -6.399367809295654, "global_step": 99128, "epoch": 2360} {"train_loss": -6.406583309173584, "global_step": 99129, "epoch": 2360} {"train_loss": -6.462330341339111, "global_step": 99130, "epoch": 2360} {"train_loss": -6.520715713500977, "global_step": 99131, "epoch": 2360} {"train_loss": -6.412064552307129, "global_step": 99132, "epoch": 2360} {"train_loss": -6.45460319519043, "global_step": 99133, "epoch": 2360} {"train_loss": -6.3415117263793945, "global_step": 99134, "epoch": 2360} {"train_loss": -6.364333629608154, "global_step": 99135, "epoch": 2360} {"train_loss": -6.356425762176514, "global_step": 99136, "epoch": 2360} {"train_loss": -6.281709671020508, "global_step": 99137, "epoch": 2360} {"train_loss": -6.351110935211182, "global_step": 99138, "epoch": 2360} {"train_loss": -6.417787075042725, "global_step": 99139, "epoch": 2360} {"train_loss": -6.331869125366211, "global_step": 99140, "epoch": 2360} {"train_loss": -6.353304862976074, "global_step": 99141, "epoch": 2360} {"train_loss": -6.433185577392578, "global_step": 99142, "epoch": 2360} {"train_loss": -6.329646587371826, "global_step": 99143, "epoch": 2360} {"train_loss": -6.328577518463135, "global_step": 99144, "epoch": 2360} {"train_loss": -6.383862495422363, "global_step": 99145, "epoch": 2360} {"train_loss": -6.235162734985352, "global_step": 99146, "epoch": 2360} {"train_loss": -6.403400897979736, "global_step": 99147, "epoch": 2360} {"train_loss": -6.443826675415039, "global_step": 99148, "epoch": 2360} {"train_loss": -6.362587928771973, "global_step": 99149, "epoch": 2360} {"train_loss": -6.440642356872559, "global_step": 99150, "epoch": 2360} {"train_loss": -6.433979034423828, "global_step": 99151, "epoch": 2360} {"train_loss": -6.454585075378418, "global_step": 99152, "epoch": 2360} {"train_loss": -6.324280738830566, "global_step": 99153, "epoch": 2360} {"train_loss": -6.32574462890625, "global_step": 99154, "epoch": 2360} {"train_loss": -6.333406925201416, "global_step": 99155, "epoch": 2360} {"train_loss": -6.3740644454956055, "global_step": 99156, "epoch": 2360} {"train_loss": -6.414361476898193, "global_step": 99157, "epoch": 2360} {"train_loss": -6.333920478820801, "global_step": 99158, "epoch": 2360} {"train_loss": -6.381216049194336, "global_step": 99159, "epoch": 2360} {"train_loss": -6.365842342376709, "global_step": 99160, "epoch": 2360} {"train_loss": -6.38187100773766, "global_step": 99161, "epoch": 2360, "val_loss": 64053.89453125} {"train_loss": -6.412971496582031, "global_step": 99162, "epoch": 2361} {"train_loss": -6.382104873657227, "global_step": 99163, "epoch": 2361} {"train_loss": -6.400036811828613, "global_step": 99164, "epoch": 2361} {"train_loss": -6.213499069213867, "global_step": 99165, "epoch": 2361} {"train_loss": -6.416722297668457, "global_step": 99166, "epoch": 2361} {"train_loss": -6.342662811279297, "global_step": 99167, "epoch": 2361} {"train_loss": -6.459075450897217, "global_step": 99168, "epoch": 2361} {"train_loss": -6.271810531616211, "global_step": 99169, "epoch": 2361} {"train_loss": -6.4114227294921875, "global_step": 99170, "epoch": 2361} {"train_loss": -6.346166133880615, "global_step": 99171, "epoch": 2361} {"train_loss": -6.374751567840576, "global_step": 99172, "epoch": 2361} {"train_loss": -6.295261383056641, "global_step": 99173, "epoch": 2361} {"train_loss": -6.405109882354736, "global_step": 99174, "epoch": 2361} {"train_loss": -6.410229206085205, "global_step": 99175, "epoch": 2361} {"train_loss": -6.28539514541626, "global_step": 99176, "epoch": 2361} {"train_loss": -6.403098106384277, "global_step": 99177, "epoch": 2361} {"train_loss": -6.454634666442871, "global_step": 99178, "epoch": 2361} {"train_loss": -6.238332748413086, "global_step": 99179, "epoch": 2361} {"train_loss": -6.503442764282227, "global_step": 99180, "epoch": 2361} {"train_loss": -6.301520347595215, "global_step": 99181, "epoch": 2361} {"train_loss": -6.47644567489624, "global_step": 99182, "epoch": 2361} {"train_loss": -6.364951133728027, "global_step": 99183, "epoch": 2361} {"train_loss": -6.350644111633301, "global_step": 99184, "epoch": 2361} {"train_loss": -6.3800249099731445, "global_step": 99185, "epoch": 2361} {"train_loss": -6.440423488616943, "global_step": 99186, "epoch": 2361} {"train_loss": -6.333590030670166, "global_step": 99187, "epoch": 2361} {"train_loss": -6.323835372924805, "global_step": 99188, "epoch": 2361} {"train_loss": -6.481220245361328, "global_step": 99189, "epoch": 2361} {"train_loss": -6.39595890045166, "global_step": 99190, "epoch": 2361} {"train_loss": -6.426502704620361, "global_step": 99191, "epoch": 2361} {"train_loss": -6.466923713684082, "global_step": 99192, "epoch": 2361} {"train_loss": -6.357548713684082, "global_step": 99193, "epoch": 2361} {"train_loss": -6.388934135437012, "global_step": 99194, "epoch": 2361} {"train_loss": -6.367610931396484, "global_step": 99195, "epoch": 2361} {"train_loss": -6.497513294219971, "global_step": 99196, "epoch": 2361} {"train_loss": -6.294720649719238, "global_step": 99197, "epoch": 2361} {"train_loss": -6.439018249511719, "global_step": 99198, "epoch": 2361} {"train_loss": -6.2596282958984375, "global_step": 99199, "epoch": 2361} {"train_loss": -6.445021629333496, "global_step": 99200, "epoch": 2361} {"train_loss": -6.369526386260986, "global_step": 99201, "epoch": 2361} {"train_loss": -6.43118143081665, "global_step": 99202, "epoch": 2361} {"train_loss": -6.382680223101661, "global_step": 99203, "epoch": 2361, "val_loss": 64295.9140625} {"train_loss": -6.312366485595703, "global_step": 99204, "epoch": 2362} {"train_loss": -6.283386707305908, "global_step": 99205, "epoch": 2362} {"train_loss": -6.390866279602051, "global_step": 99206, "epoch": 2362} {"train_loss": -6.356969356536865, "global_step": 99207, "epoch": 2362} {"train_loss": -6.32688045501709, "global_step": 99208, "epoch": 2362} {"train_loss": -6.382589340209961, "global_step": 99209, "epoch": 2362} {"train_loss": -6.409931182861328, "global_step": 99210, "epoch": 2362} {"train_loss": -6.400363445281982, "global_step": 99211, "epoch": 2362} {"train_loss": -6.386270523071289, "global_step": 99212, "epoch": 2362} {"train_loss": -6.352684497833252, "global_step": 99213, "epoch": 2362} {"train_loss": -6.418672561645508, "global_step": 99214, "epoch": 2362} {"train_loss": -6.264809608459473, "global_step": 99215, "epoch": 2362} {"train_loss": -6.371642112731934, "global_step": 99216, "epoch": 2362} {"train_loss": -6.380850791931152, "global_step": 99217, "epoch": 2362} {"train_loss": -6.328899383544922, "global_step": 99218, "epoch": 2362} {"train_loss": -6.350471496582031, "global_step": 99219, "epoch": 2362} {"train_loss": -6.348024368286133, "global_step": 99220, "epoch": 2362} {"train_loss": -6.4317240715026855, "global_step": 99221, "epoch": 2362} {"train_loss": -6.381863117218018, "global_step": 99222, "epoch": 2362} {"train_loss": -6.4428534507751465, "global_step": 99223, "epoch": 2362} {"train_loss": -6.310492038726807, "global_step": 99224, "epoch": 2362} {"train_loss": -6.2466020584106445, "global_step": 99225, "epoch": 2362} {"train_loss": -6.223970413208008, "global_step": 99226, "epoch": 2362} {"train_loss": -6.504321098327637, "global_step": 99227, "epoch": 2362} {"train_loss": -6.3064422607421875, "global_step": 99228, "epoch": 2362} {"train_loss": -6.381593704223633, "global_step": 99229, "epoch": 2362} {"train_loss": -6.394589424133301, "global_step": 99230, "epoch": 2362} {"train_loss": -6.219444274902344, "global_step": 99231, "epoch": 2362} {"train_loss": -6.205127239227295, "global_step": 99232, "epoch": 2362} {"train_loss": -6.47370719909668, "global_step": 99233, "epoch": 2362} {"train_loss": -6.26591682434082, "global_step": 99234, "epoch": 2362} {"train_loss": -6.283101558685303, "global_step": 99235, "epoch": 2362} {"train_loss": -6.239999771118164, "global_step": 99236, "epoch": 2362} {"train_loss": -6.322945594787598, "global_step": 99237, "epoch": 2362} {"train_loss": -6.271032333374023, "global_step": 99238, "epoch": 2362} {"train_loss": -6.295519828796387, "global_step": 99239, "epoch": 2362} {"train_loss": -6.243375301361084, "global_step": 99240, "epoch": 2362} {"train_loss": -6.283231735229492, "global_step": 99241, "epoch": 2362} {"train_loss": -6.262660980224609, "global_step": 99242, "epoch": 2362} {"train_loss": -6.3240509033203125, "global_step": 99243, "epoch": 2362} {"train_loss": -6.191932678222656, "global_step": 99244, "epoch": 2362} {"train_loss": -6.327998774392264, "global_step": 99245, "epoch": 2362, "val_loss": 64174.77734375} {"train_loss": -6.234362602233887, "global_step": 99246, "epoch": 2363} {"train_loss": -6.37630033493042, "global_step": 99247, "epoch": 2363} {"train_loss": -6.219869613647461, "global_step": 99248, "epoch": 2363} {"train_loss": -6.325780868530273, "global_step": 99249, "epoch": 2363} {"train_loss": -6.262238025665283, "global_step": 99250, "epoch": 2363} {"train_loss": -6.241455554962158, "global_step": 99251, "epoch": 2363} {"train_loss": -6.336163520812988, "global_step": 99252, "epoch": 2363} {"train_loss": -6.298078536987305, "global_step": 99253, "epoch": 2363} {"train_loss": -6.24387264251709, "global_step": 99254, "epoch": 2363} {"train_loss": -6.286417007446289, "global_step": 99255, "epoch": 2363} {"train_loss": -6.196254730224609, "global_step": 99256, "epoch": 2363} {"train_loss": -6.243180751800537, "global_step": 99257, "epoch": 2363} {"train_loss": -6.360757827758789, "global_step": 99258, "epoch": 2363} {"train_loss": -6.326105117797852, "global_step": 99259, "epoch": 2363} {"train_loss": -6.225653648376465, "global_step": 99260, "epoch": 2363} {"train_loss": -6.294138431549072, "global_step": 99261, "epoch": 2363} {"train_loss": -6.281805038452148, "global_step": 99262, "epoch": 2363} {"train_loss": -6.293623924255371, "global_step": 99263, "epoch": 2363} {"train_loss": -6.271478652954102, "global_step": 99264, "epoch": 2363} {"train_loss": -6.334951400756836, "global_step": 99265, "epoch": 2363} {"train_loss": -6.302176475524902, "global_step": 99266, "epoch": 2363} {"train_loss": -6.215105056762695, "global_step": 99267, "epoch": 2363} {"train_loss": -6.341801643371582, "global_step": 99268, "epoch": 2363} {"train_loss": -6.2585530281066895, "global_step": 99269, "epoch": 2363} {"train_loss": -6.480804443359375, "global_step": 99270, "epoch": 2363} {"train_loss": -6.308190822601318, "global_step": 99271, "epoch": 2363} {"train_loss": -6.453021049499512, "global_step": 99272, "epoch": 2363} {"train_loss": -6.328372955322266, "global_step": 99273, "epoch": 2363} {"train_loss": -6.492926597595215, "global_step": 99274, "epoch": 2363} {"train_loss": -6.340816497802734, "global_step": 99275, "epoch": 2363} {"train_loss": -6.457737922668457, "global_step": 99276, "epoch": 2363} {"train_loss": -6.425082206726074, "global_step": 99277, "epoch": 2363} {"train_loss": -6.48454475402832, "global_step": 99278, "epoch": 2363} {"train_loss": -6.401946067810059, "global_step": 99279, "epoch": 2363} {"train_loss": -6.418804168701172, "global_step": 99280, "epoch": 2363} {"train_loss": -6.39912223815918, "global_step": 99281, "epoch": 2363} {"train_loss": -6.540837287902832, "global_step": 99282, "epoch": 2363} {"train_loss": -6.416505813598633, "global_step": 99283, "epoch": 2363} {"train_loss": -6.285507678985596, "global_step": 99284, "epoch": 2363} {"train_loss": -6.349100112915039, "global_step": 99285, "epoch": 2363} {"train_loss": -6.391888618469238, "global_step": 99286, "epoch": 2363} {"train_loss": -6.336068391799927, "global_step": 99287, "epoch": 2363, "val_loss": 64053.5390625} {"train_loss": -6.376385688781738, "global_step": 99288, "epoch": 2364} {"train_loss": -6.488536834716797, "global_step": 99289, "epoch": 2364} {"train_loss": -6.4029645919799805, "global_step": 99290, "epoch": 2364} {"train_loss": -6.333879470825195, "global_step": 99291, "epoch": 2364} {"train_loss": -6.398586273193359, "global_step": 99292, "epoch": 2364} {"train_loss": -6.322846412658691, "global_step": 99293, "epoch": 2364} {"train_loss": -6.434565544128418, "global_step": 99294, "epoch": 2364} {"train_loss": -6.5254740715026855, "global_step": 99295, "epoch": 2364} {"train_loss": -6.313389301300049, "global_step": 99296, "epoch": 2364} {"train_loss": -6.384420394897461, "global_step": 99297, "epoch": 2364} {"train_loss": -6.361965179443359, "global_step": 99298, "epoch": 2364} {"train_loss": -6.313087463378906, "global_step": 99299, "epoch": 2364} {"train_loss": -6.2997145652771, "global_step": 99300, "epoch": 2364} {"train_loss": -6.4231085777282715, "global_step": 99301, "epoch": 2364} {"train_loss": -6.404435634613037, "global_step": 99302, "epoch": 2364} {"train_loss": -6.459415912628174, "global_step": 99303, "epoch": 2364} {"train_loss": -6.407547950744629, "global_step": 99304, "epoch": 2364} {"train_loss": -6.357268333435059, "global_step": 99305, "epoch": 2364} {"train_loss": -6.430143356323242, "global_step": 99306, "epoch": 2364} {"train_loss": -6.401052951812744, "global_step": 99307, "epoch": 2364} {"train_loss": -6.3877763748168945, "global_step": 99308, "epoch": 2364} {"train_loss": -6.355774402618408, "global_step": 99309, "epoch": 2364} {"train_loss": -6.487082004547119, "global_step": 99310, "epoch": 2364} {"train_loss": -6.293668746948242, "global_step": 99311, "epoch": 2364} {"train_loss": -6.258330345153809, "global_step": 99312, "epoch": 2364} {"train_loss": -6.252779483795166, "global_step": 99313, "epoch": 2364} {"train_loss": -6.196785926818848, "global_step": 99314, "epoch": 2364} {"train_loss": -6.304897308349609, "global_step": 99315, "epoch": 2364} {"train_loss": -6.274679660797119, "global_step": 99316, "epoch": 2364} {"train_loss": -6.332514762878418, "global_step": 99317, "epoch": 2364} {"train_loss": -6.352321147918701, "global_step": 99318, "epoch": 2364} {"train_loss": -6.207867622375488, "global_step": 99319, "epoch": 2364} {"train_loss": -6.2298054695129395, "global_step": 99320, "epoch": 2364} {"train_loss": -6.314263820648193, "global_step": 99321, "epoch": 2364} {"train_loss": -6.352982997894287, "global_step": 99322, "epoch": 2364} {"train_loss": -6.195040225982666, "global_step": 99323, "epoch": 2364} {"train_loss": -6.412724018096924, "global_step": 99324, "epoch": 2364} {"train_loss": -6.285089492797852, "global_step": 99325, "epoch": 2364} {"train_loss": -6.2781219482421875, "global_step": 99326, "epoch": 2364} {"train_loss": -6.400706768035889, "global_step": 99327, "epoch": 2364} {"train_loss": -6.228856086730957, "global_step": 99328, "epoch": 2364} {"train_loss": -6.344771998269217, "global_step": 99329, "epoch": 2364, "val_loss": 63856.9609375} {"train_loss": -6.325806617736816, "global_step": 99330, "epoch": 2365} {"train_loss": -6.362971782684326, "global_step": 99331, "epoch": 2365} {"train_loss": -6.466692924499512, "global_step": 99332, "epoch": 2365} {"train_loss": -6.374240875244141, "global_step": 99333, "epoch": 2365} {"train_loss": -6.3036675453186035, "global_step": 99334, "epoch": 2365} {"train_loss": -6.299840927124023, "global_step": 99335, "epoch": 2365} {"train_loss": -6.245054244995117, "global_step": 99336, "epoch": 2365} {"train_loss": -6.361512184143066, "global_step": 99337, "epoch": 2365} {"train_loss": -6.2272491455078125, "global_step": 99338, "epoch": 2365} {"train_loss": -6.305593013763428, "global_step": 99339, "epoch": 2365} {"train_loss": -6.436492443084717, "global_step": 99340, "epoch": 2365} {"train_loss": -6.425300121307373, "global_step": 99341, "epoch": 2365} {"train_loss": -6.3149566650390625, "global_step": 99342, "epoch": 2365} {"train_loss": -6.408435821533203, "global_step": 99343, "epoch": 2365} {"train_loss": -6.306809425354004, "global_step": 99344, "epoch": 2365} {"train_loss": -6.245104789733887, "global_step": 99345, "epoch": 2365} {"train_loss": -6.424406051635742, "global_step": 99346, "epoch": 2365} {"train_loss": -6.298642158508301, "global_step": 99347, "epoch": 2365} {"train_loss": -6.258554458618164, "global_step": 99348, "epoch": 2365} {"train_loss": -6.380675315856934, "global_step": 99349, "epoch": 2365} {"train_loss": -6.369574546813965, "global_step": 99350, "epoch": 2365} {"train_loss": -6.382518768310547, "global_step": 99351, "epoch": 2365} {"train_loss": -6.339863300323486, "global_step": 99352, "epoch": 2365} {"train_loss": -6.294254779815674, "global_step": 99353, "epoch": 2365} {"train_loss": -6.432836055755615, "global_step": 99354, "epoch": 2365} {"train_loss": -6.350285530090332, "global_step": 99355, "epoch": 2365} {"train_loss": -6.357693195343018, "global_step": 99356, "epoch": 2365} {"train_loss": -6.267045974731445, "global_step": 99357, "epoch": 2365} {"train_loss": -6.307722091674805, "global_step": 99358, "epoch": 2365} {"train_loss": -6.4268927574157715, "global_step": 99359, "epoch": 2365} {"train_loss": -6.371551990509033, "global_step": 99360, "epoch": 2365} {"train_loss": -6.379157543182373, "global_step": 99361, "epoch": 2365} {"train_loss": -6.230786323547363, "global_step": 99362, "epoch": 2365} {"train_loss": -6.423426151275635, "global_step": 99363, "epoch": 2365} {"train_loss": -6.435657501220703, "global_step": 99364, "epoch": 2365} {"train_loss": -6.470498085021973, "global_step": 99365, "epoch": 2365} {"train_loss": -6.277024269104004, "global_step": 99366, "epoch": 2365} {"train_loss": -6.35053825378418, "global_step": 99367, "epoch": 2365} {"train_loss": -6.286299228668213, "global_step": 99368, "epoch": 2365} {"train_loss": -6.346592903137207, "global_step": 99369, "epoch": 2365} {"train_loss": -6.398156642913818, "global_step": 99370, "epoch": 2365} {"train_loss": -6.348135039919899, "global_step": 99371, "epoch": 2365, "val_loss": 63945.51953125} {"train_loss": -6.3946027755737305, "global_step": 99372, "epoch": 2366} {"train_loss": -6.392341136932373, "global_step": 99373, "epoch": 2366} {"train_loss": -6.398083686828613, "global_step": 99374, "epoch": 2366} {"train_loss": -6.500955581665039, "global_step": 99375, "epoch": 2366} {"train_loss": -6.319057464599609, "global_step": 99376, "epoch": 2366} {"train_loss": -6.382074356079102, "global_step": 99377, "epoch": 2366} {"train_loss": -6.43848991394043, "global_step": 99378, "epoch": 2366} {"train_loss": -6.46083927154541, "global_step": 99379, "epoch": 2366} {"train_loss": -6.257658004760742, "global_step": 99380, "epoch": 2366} {"train_loss": -6.47442626953125, "global_step": 99381, "epoch": 2366} {"train_loss": -6.374025821685791, "global_step": 99382, "epoch": 2366} {"train_loss": -6.274393081665039, "global_step": 99383, "epoch": 2366} {"train_loss": -6.3298869132995605, "global_step": 99384, "epoch": 2366} {"train_loss": -6.231003761291504, "global_step": 99385, "epoch": 2366} {"train_loss": -6.378795623779297, "global_step": 99386, "epoch": 2366} {"train_loss": -6.347434997558594, "global_step": 99387, "epoch": 2366} {"train_loss": -6.379354953765869, "global_step": 99388, "epoch": 2366} {"train_loss": -6.357438087463379, "global_step": 99389, "epoch": 2366} {"train_loss": -6.437551975250244, "global_step": 99390, "epoch": 2366} {"train_loss": -6.385382652282715, "global_step": 99391, "epoch": 2366} {"train_loss": -6.435063362121582, "global_step": 99392, "epoch": 2366} {"train_loss": -6.360502243041992, "global_step": 99393, "epoch": 2366} {"train_loss": -6.392449378967285, "global_step": 99394, "epoch": 2366} {"train_loss": -6.430149078369141, "global_step": 99395, "epoch": 2366} {"train_loss": -6.305678367614746, "global_step": 99396, "epoch": 2366} {"train_loss": -6.399747848510742, "global_step": 99397, "epoch": 2366} {"train_loss": -6.30941104888916, "global_step": 99398, "epoch": 2366} {"train_loss": -6.399209976196289, "global_step": 99399, "epoch": 2366} {"train_loss": -6.2998247146606445, "global_step": 99400, "epoch": 2366} {"train_loss": -6.291959762573242, "global_step": 99401, "epoch": 2366} {"train_loss": -6.363551616668701, "global_step": 99402, "epoch": 2366} {"train_loss": -6.476894378662109, "global_step": 99403, "epoch": 2366} {"train_loss": -6.256812572479248, "global_step": 99404, "epoch": 2366} {"train_loss": -6.363438129425049, "global_step": 99405, "epoch": 2366} {"train_loss": -6.208130359649658, "global_step": 99406, "epoch": 2366} {"train_loss": -6.233567237854004, "global_step": 99407, "epoch": 2366} {"train_loss": -6.321432590484619, "global_step": 99408, "epoch": 2366} {"train_loss": -6.31272029876709, "global_step": 99409, "epoch": 2366} {"train_loss": -6.282985687255859, "global_step": 99410, "epoch": 2366} {"train_loss": -6.319845199584961, "global_step": 99411, "epoch": 2366} {"train_loss": -6.315774917602539, "global_step": 99412, "epoch": 2366} {"train_loss": -6.356213694527035, "global_step": 99413, "epoch": 2366, "val_loss": 64102.6171875} {"train_loss": -6.402253150939941, "global_step": 99414, "epoch": 2367} {"train_loss": -6.333136558532715, "global_step": 99415, "epoch": 2367} {"train_loss": -6.380070686340332, "global_step": 99416, "epoch": 2367} {"train_loss": -6.430260181427002, "global_step": 99417, "epoch": 2367} {"train_loss": -6.31690788269043, "global_step": 99418, "epoch": 2367} {"train_loss": -6.340702056884766, "global_step": 99419, "epoch": 2367} {"train_loss": -6.293079853057861, "global_step": 99420, "epoch": 2367} {"train_loss": -6.291810989379883, "global_step": 99421, "epoch": 2367} {"train_loss": -6.431441783905029, "global_step": 99422, "epoch": 2367} {"train_loss": -6.326176643371582, "global_step": 99423, "epoch": 2367} {"train_loss": -6.3660407066345215, "global_step": 99424, "epoch": 2367} {"train_loss": -6.373774528503418, "global_step": 99425, "epoch": 2367} {"train_loss": -6.276503562927246, "global_step": 99426, "epoch": 2367} {"train_loss": -6.237165927886963, "global_step": 99427, "epoch": 2367} {"train_loss": -6.405492305755615, "global_step": 99428, "epoch": 2367} {"train_loss": -6.214443683624268, "global_step": 99429, "epoch": 2367} {"train_loss": -6.347133159637451, "global_step": 99430, "epoch": 2367} {"train_loss": -6.385128021240234, "global_step": 99431, "epoch": 2367} {"train_loss": -6.323299407958984, "global_step": 99432, "epoch": 2367} {"train_loss": -6.3065185546875, "global_step": 99433, "epoch": 2367} {"train_loss": -6.233250617980957, "global_step": 99434, "epoch": 2367} {"train_loss": -6.388471603393555, "global_step": 99435, "epoch": 2367} {"train_loss": -6.330097675323486, "global_step": 99436, "epoch": 2367} {"train_loss": -6.346702575683594, "global_step": 99437, "epoch": 2367} {"train_loss": -6.28666877746582, "global_step": 99438, "epoch": 2367} {"train_loss": -6.258867263793945, "global_step": 99439, "epoch": 2367} {"train_loss": -6.331467628479004, "global_step": 99440, "epoch": 2367} {"train_loss": -6.350008964538574, "global_step": 99441, "epoch": 2367} {"train_loss": -6.439704895019531, "global_step": 99442, "epoch": 2367} {"train_loss": -6.242116928100586, "global_step": 99443, "epoch": 2367} {"train_loss": -6.376763343811035, "global_step": 99444, "epoch": 2367} {"train_loss": -6.317327976226807, "global_step": 99445, "epoch": 2367} {"train_loss": -6.329834938049316, "global_step": 99446, "epoch": 2367} {"train_loss": -6.232314109802246, "global_step": 99447, "epoch": 2367} {"train_loss": -6.222918510437012, "global_step": 99448, "epoch": 2367} {"train_loss": -6.357831954956055, "global_step": 99449, "epoch": 2367} {"train_loss": -6.291214942932129, "global_step": 99450, "epoch": 2367} {"train_loss": -6.374127388000488, "global_step": 99451, "epoch": 2367} {"train_loss": -6.366037368774414, "global_step": 99452, "epoch": 2367} {"train_loss": -6.302600383758545, "global_step": 99453, "epoch": 2367} {"train_loss": -6.347569465637207, "global_step": 99454, "epoch": 2367} {"train_loss": -6.328832353864398, "global_step": 99455, "epoch": 2367, "val_loss": 63904.5859375} {"train_loss": -6.366087913513184, "global_step": 99456, "epoch": 2368} {"train_loss": -6.291338920593262, "global_step": 99457, "epoch": 2368} {"train_loss": -6.387914657592773, "global_step": 99458, "epoch": 2368} {"train_loss": -6.319744110107422, "global_step": 99459, "epoch": 2368} {"train_loss": -6.390950679779053, "global_step": 99460, "epoch": 2368} {"train_loss": -6.3275909423828125, "global_step": 99461, "epoch": 2368} {"train_loss": -6.533092975616455, "global_step": 99462, "epoch": 2368} {"train_loss": -6.316364765167236, "global_step": 99463, "epoch": 2368} {"train_loss": -6.311309814453125, "global_step": 99464, "epoch": 2368} {"train_loss": -6.262360095977783, "global_step": 99465, "epoch": 2368} {"train_loss": -6.358194351196289, "global_step": 99466, "epoch": 2368} {"train_loss": -6.393736362457275, "global_step": 99467, "epoch": 2368} {"train_loss": -6.337563514709473, "global_step": 99468, "epoch": 2368} {"train_loss": -6.3890700340271, "global_step": 99469, "epoch": 2368} {"train_loss": -6.4514288902282715, "global_step": 99470, "epoch": 2368} {"train_loss": -6.372910022735596, "global_step": 99471, "epoch": 2368} {"train_loss": -6.379620552062988, "global_step": 99472, "epoch": 2368} {"train_loss": -6.352046012878418, "global_step": 99473, "epoch": 2368} {"train_loss": -6.408890724182129, "global_step": 99474, "epoch": 2368} {"train_loss": -6.3817901611328125, "global_step": 99475, "epoch": 2368} {"train_loss": -6.344827651977539, "global_step": 99476, "epoch": 2368} {"train_loss": -6.279418468475342, "global_step": 99477, "epoch": 2368} {"train_loss": -6.39345645904541, "global_step": 99478, "epoch": 2368} {"train_loss": -6.435859680175781, "global_step": 99479, "epoch": 2368} {"train_loss": -6.324648857116699, "global_step": 99480, "epoch": 2368} {"train_loss": -6.4069719314575195, "global_step": 99481, "epoch": 2368} {"train_loss": -6.417006492614746, "global_step": 99482, "epoch": 2368} {"train_loss": -6.399174213409424, "global_step": 99483, "epoch": 2368} {"train_loss": -6.386331558227539, "global_step": 99484, "epoch": 2368} {"train_loss": -6.280035972595215, "global_step": 99485, "epoch": 2368} {"train_loss": -6.355748176574707, "global_step": 99486, "epoch": 2368} {"train_loss": -6.298127174377441, "global_step": 99487, "epoch": 2368} {"train_loss": -6.362466812133789, "global_step": 99488, "epoch": 2368} {"train_loss": -6.332352638244629, "global_step": 99489, "epoch": 2368} {"train_loss": -6.31013822555542, "global_step": 99490, "epoch": 2368} {"train_loss": -6.283204078674316, "global_step": 99491, "epoch": 2368} {"train_loss": -6.3381547927856445, "global_step": 99492, "epoch": 2368} {"train_loss": -6.314682960510254, "global_step": 99493, "epoch": 2368} {"train_loss": -6.458429336547852, "global_step": 99494, "epoch": 2368} {"train_loss": -6.287775039672852, "global_step": 99495, "epoch": 2368} {"train_loss": -6.299929618835449, "global_step": 99496, "epoch": 2368} {"train_loss": -6.359886237553188, "global_step": 99497, "epoch": 2368, "val_loss": 64034.3046875} {"train_loss": -6.456773281097412, "global_step": 99498, "epoch": 2369} {"train_loss": -6.380666732788086, "global_step": 99499, "epoch": 2369} {"train_loss": -6.416672706604004, "global_step": 99500, "epoch": 2369} {"train_loss": -6.459821701049805, "global_step": 99501, "epoch": 2369} {"train_loss": -6.365893363952637, "global_step": 99502, "epoch": 2369} {"train_loss": -6.363602638244629, "global_step": 99503, "epoch": 2369} {"train_loss": -6.387338638305664, "global_step": 99504, "epoch": 2369} {"train_loss": -6.41917085647583, "global_step": 99505, "epoch": 2369} {"train_loss": -6.30516242980957, "global_step": 99506, "epoch": 2369} {"train_loss": -6.515122890472412, "global_step": 99507, "epoch": 2369} {"train_loss": -6.35814094543457, "global_step": 99508, "epoch": 2369} {"train_loss": -6.302114486694336, "global_step": 99509, "epoch": 2369} {"train_loss": -6.477967262268066, "global_step": 99510, "epoch": 2369} {"train_loss": -6.401144027709961, "global_step": 99511, "epoch": 2369} {"train_loss": -6.471323490142822, "global_step": 99512, "epoch": 2369} {"train_loss": -6.4648332595825195, "global_step": 99513, "epoch": 2369} {"train_loss": -6.3842267990112305, "global_step": 99514, "epoch": 2369} {"train_loss": -6.242908000946045, "global_step": 99515, "epoch": 2369} {"train_loss": -6.355806827545166, "global_step": 99516, "epoch": 2369} {"train_loss": -6.471599578857422, "global_step": 99517, "epoch": 2369} {"train_loss": -6.340368270874023, "global_step": 99518, "epoch": 2369} {"train_loss": -6.344597816467285, "global_step": 99519, "epoch": 2369} {"train_loss": -6.454902648925781, "global_step": 99520, "epoch": 2369} {"train_loss": -6.363802909851074, "global_step": 99521, "epoch": 2369} {"train_loss": -6.33026123046875, "global_step": 99522, "epoch": 2369} {"train_loss": -6.403365135192871, "global_step": 99523, "epoch": 2369} {"train_loss": -6.348827362060547, "global_step": 99524, "epoch": 2369} {"train_loss": -6.411991596221924, "global_step": 99525, "epoch": 2369} {"train_loss": -6.4940080642700195, "global_step": 99526, "epoch": 2369} {"train_loss": -6.283907413482666, "global_step": 99527, "epoch": 2369} {"train_loss": -6.306722640991211, "global_step": 99528, "epoch": 2369} {"train_loss": -6.202042579650879, "global_step": 99529, "epoch": 2369} {"train_loss": -6.28087043762207, "global_step": 99530, "epoch": 2369} {"train_loss": -6.312110424041748, "global_step": 99531, "epoch": 2369} {"train_loss": -6.515357971191406, "global_step": 99532, "epoch": 2369} {"train_loss": -6.403109073638916, "global_step": 99533, "epoch": 2369} {"train_loss": -6.431746482849121, "global_step": 99534, "epoch": 2369} {"train_loss": -6.369985580444336, "global_step": 99535, "epoch": 2369} {"train_loss": -6.391761779785156, "global_step": 99536, "epoch": 2369} {"train_loss": -6.411039352416992, "global_step": 99537, "epoch": 2369} {"train_loss": -6.322554111480713, "global_step": 99538, "epoch": 2369} {"train_loss": -6.386170148849487, "global_step": 99539, "epoch": 2369, "val_loss": 64115.33984375} {"train_loss": -6.3348188400268555, "global_step": 99540, "epoch": 2370} {"train_loss": -6.2532758712768555, "global_step": 99541, "epoch": 2370} {"train_loss": -6.422595024108887, "global_step": 99542, "epoch": 2370} {"train_loss": -6.413179874420166, "global_step": 99543, "epoch": 2370} {"train_loss": -6.4463324546813965, "global_step": 99544, "epoch": 2370} {"train_loss": -6.33601188659668, "global_step": 99545, "epoch": 2370} {"train_loss": -6.182615280151367, "global_step": 99546, "epoch": 2370} {"train_loss": -6.387843132019043, "global_step": 99547, "epoch": 2370} {"train_loss": -6.402862548828125, "global_step": 99548, "epoch": 2370} {"train_loss": -6.375429153442383, "global_step": 99549, "epoch": 2370} {"train_loss": -6.340380668640137, "global_step": 99550, "epoch": 2370} {"train_loss": -6.388095855712891, "global_step": 99551, "epoch": 2370} {"train_loss": -6.404485702514648, "global_step": 99552, "epoch": 2370} {"train_loss": -6.391798973083496, "global_step": 99553, "epoch": 2370} {"train_loss": -6.301405429840088, "global_step": 99554, "epoch": 2370} {"train_loss": -6.482616901397705, "global_step": 99555, "epoch": 2370} {"train_loss": -6.418816089630127, "global_step": 99556, "epoch": 2370} {"train_loss": -6.405490875244141, "global_step": 99557, "epoch": 2370} {"train_loss": -6.2071380615234375, "global_step": 99558, "epoch": 2370} {"train_loss": -6.392669200897217, "global_step": 99559, "epoch": 2370} {"train_loss": -6.481106281280518, "global_step": 99560, "epoch": 2370} {"train_loss": -6.394135475158691, "global_step": 99561, "epoch": 2370} {"train_loss": -6.382709980010986, "global_step": 99562, "epoch": 2370} {"train_loss": -6.386898994445801, "global_step": 99563, "epoch": 2370} {"train_loss": -6.324791431427002, "global_step": 99564, "epoch": 2370} {"train_loss": -6.435006141662598, "global_step": 99565, "epoch": 2370} {"train_loss": -6.522942066192627, "global_step": 99566, "epoch": 2370} {"train_loss": -6.297455310821533, "global_step": 99567, "epoch": 2370} {"train_loss": -6.3912200927734375, "global_step": 99568, "epoch": 2370} {"train_loss": -6.2617621421813965, "global_step": 99569, "epoch": 2370} {"train_loss": -6.373263359069824, "global_step": 99570, "epoch": 2370} {"train_loss": -6.4268341064453125, "global_step": 99571, "epoch": 2370} {"train_loss": -6.3650689125061035, "global_step": 99572, "epoch": 2370} {"train_loss": -6.42627477645874, "global_step": 99573, "epoch": 2370} {"train_loss": -6.373660087585449, "global_step": 99574, "epoch": 2370} {"train_loss": -6.457787990570068, "global_step": 99575, "epoch": 2370} {"train_loss": -6.462285041809082, "global_step": 99576, "epoch": 2370} {"train_loss": -6.398088455200195, "global_step": 99577, "epoch": 2370} {"train_loss": -6.388436794281006, "global_step": 99578, "epoch": 2370} {"train_loss": -6.470591068267822, "global_step": 99579, "epoch": 2370} {"train_loss": -6.356855392456055, "global_step": 99580, "epoch": 2370} {"train_loss": -6.3782862935747415, "global_step": 99581, "epoch": 2370, "val_loss": 64081.60546875} {"train_loss": -6.469203472137451, "global_step": 99582, "epoch": 2371} {"train_loss": -6.34119987487793, "global_step": 99583, "epoch": 2371} {"train_loss": -6.276104927062988, "global_step": 99584, "epoch": 2371} {"train_loss": -6.408458232879639, "global_step": 99585, "epoch": 2371} {"train_loss": -6.406403541564941, "global_step": 99586, "epoch": 2371} {"train_loss": -6.34175968170166, "global_step": 99587, "epoch": 2371} {"train_loss": -6.39083194732666, "global_step": 99588, "epoch": 2371} {"train_loss": -6.3556718826293945, "global_step": 99589, "epoch": 2371} {"train_loss": -6.371965408325195, "global_step": 99590, "epoch": 2371} {"train_loss": -6.36445426940918, "global_step": 99591, "epoch": 2371} {"train_loss": -6.354753494262695, "global_step": 99592, "epoch": 2371} {"train_loss": -6.419049263000488, "global_step": 99593, "epoch": 2371} {"train_loss": -6.305875778198242, "global_step": 99594, "epoch": 2371} {"train_loss": -6.321086883544922, "global_step": 99595, "epoch": 2371} {"train_loss": -6.329567909240723, "global_step": 99596, "epoch": 2371} {"train_loss": -6.294493675231934, "global_step": 99597, "epoch": 2371} {"train_loss": -6.23728084564209, "global_step": 99598, "epoch": 2371} {"train_loss": -6.3602375984191895, "global_step": 99599, "epoch": 2371} {"train_loss": -6.375261306762695, "global_step": 99600, "epoch": 2371} {"train_loss": -6.332907676696777, "global_step": 99601, "epoch": 2371} {"train_loss": -6.330760955810547, "global_step": 99602, "epoch": 2371} {"train_loss": -6.312070846557617, "global_step": 99603, "epoch": 2371} {"train_loss": -6.30061149597168, "global_step": 99604, "epoch": 2371} {"train_loss": -6.272853851318359, "global_step": 99605, "epoch": 2371} {"train_loss": -6.401910781860352, "global_step": 99606, "epoch": 2371} {"train_loss": -6.292623519897461, "global_step": 99607, "epoch": 2371} {"train_loss": -6.422666549682617, "global_step": 99608, "epoch": 2371} {"train_loss": -6.243188858032227, "global_step": 99609, "epoch": 2371} {"train_loss": -6.290778160095215, "global_step": 99610, "epoch": 2371} {"train_loss": -6.386844635009766, "global_step": 99611, "epoch": 2371} {"train_loss": -6.376772880554199, "global_step": 99612, "epoch": 2371} {"train_loss": -6.274521827697754, "global_step": 99613, "epoch": 2371} {"train_loss": -6.271878719329834, "global_step": 99614, "epoch": 2371} {"train_loss": -6.30046272277832, "global_step": 99615, "epoch": 2371} {"train_loss": -6.407051086425781, "global_step": 99616, "epoch": 2371} {"train_loss": -6.3309807777404785, "global_step": 99617, "epoch": 2371} {"train_loss": -6.307941436767578, "global_step": 99618, "epoch": 2371} {"train_loss": -6.261623382568359, "global_step": 99619, "epoch": 2371} {"train_loss": -6.329730987548828, "global_step": 99620, "epoch": 2371} {"train_loss": -6.395162582397461, "global_step": 99621, "epoch": 2371} {"train_loss": -6.284211158752441, "global_step": 99622, "epoch": 2371} {"train_loss": -6.336041143962315, "global_step": 99623, "epoch": 2371, "val_loss": 63973.81640625} {"train_loss": -6.360220909118652, "global_step": 99624, "epoch": 2372} {"train_loss": -6.3272905349731445, "global_step": 99625, "epoch": 2372} {"train_loss": -6.274156093597412, "global_step": 99626, "epoch": 2372} {"train_loss": -6.310031414031982, "global_step": 99627, "epoch": 2372} {"train_loss": -6.275986671447754, "global_step": 99628, "epoch": 2372} {"train_loss": -6.3455915451049805, "global_step": 99629, "epoch": 2372} {"train_loss": -6.339907169342041, "global_step": 99630, "epoch": 2372} {"train_loss": -6.383486270904541, "global_step": 99631, "epoch": 2372} {"train_loss": -6.517682075500488, "global_step": 99632, "epoch": 2372} {"train_loss": -6.32319974899292, "global_step": 99633, "epoch": 2372} {"train_loss": -6.458959579467773, "global_step": 99634, "epoch": 2372} {"train_loss": -6.41957950592041, "global_step": 99635, "epoch": 2372} {"train_loss": -6.377220153808594, "global_step": 99636, "epoch": 2372} {"train_loss": -6.362650394439697, "global_step": 99637, "epoch": 2372} {"train_loss": -6.334433078765869, "global_step": 99638, "epoch": 2372} {"train_loss": -6.387179374694824, "global_step": 99639, "epoch": 2372} {"train_loss": -6.374739646911621, "global_step": 99640, "epoch": 2372} {"train_loss": -6.4557294845581055, "global_step": 99641, "epoch": 2372} {"train_loss": -6.271933555603027, "global_step": 99642, "epoch": 2372} {"train_loss": -6.355023384094238, "global_step": 99643, "epoch": 2372} {"train_loss": -6.39829158782959, "global_step": 99644, "epoch": 2372} {"train_loss": -6.311405658721924, "global_step": 99645, "epoch": 2372} {"train_loss": -6.404024124145508, "global_step": 99646, "epoch": 2372} {"train_loss": -6.454834938049316, "global_step": 99647, "epoch": 2372} {"train_loss": -6.3977556228637695, "global_step": 99648, "epoch": 2372} {"train_loss": -6.423537254333496, "global_step": 99649, "epoch": 2372} {"train_loss": -6.375671863555908, "global_step": 99650, "epoch": 2372} {"train_loss": -6.316860198974609, "global_step": 99651, "epoch": 2372} {"train_loss": -6.28074836730957, "global_step": 99652, "epoch": 2372} {"train_loss": -6.3414459228515625, "global_step": 99653, "epoch": 2372} {"train_loss": -6.317155361175537, "global_step": 99654, "epoch": 2372} {"train_loss": -6.343568801879883, "global_step": 99655, "epoch": 2372} {"train_loss": -6.27834415435791, "global_step": 99656, "epoch": 2372} {"train_loss": -6.389789581298828, "global_step": 99657, "epoch": 2372} {"train_loss": -6.425826072692871, "global_step": 99658, "epoch": 2372} {"train_loss": -6.432313919067383, "global_step": 99659, "epoch": 2372} {"train_loss": -6.442525863647461, "global_step": 99660, "epoch": 2372} {"train_loss": -6.288513660430908, "global_step": 99661, "epoch": 2372} {"train_loss": -6.20074462890625, "global_step": 99662, "epoch": 2372} {"train_loss": -6.344381809234619, "global_step": 99663, "epoch": 2372} {"train_loss": -6.393950939178467, "global_step": 99664, "epoch": 2372} {"train_loss": -6.362107878639584, "global_step": 99665, "epoch": 2372, "val_loss": 64155.54296875} {"train_loss": -6.40233850479126, "global_step": 99666, "epoch": 2373} {"train_loss": -6.322436332702637, "global_step": 99667, "epoch": 2373} {"train_loss": -6.313149929046631, "global_step": 99668, "epoch": 2373} {"train_loss": -6.444140911102295, "global_step": 99669, "epoch": 2373} {"train_loss": -6.403017520904541, "global_step": 99670, "epoch": 2373} {"train_loss": -6.364040851593018, "global_step": 99671, "epoch": 2373} {"train_loss": -6.380551338195801, "global_step": 99672, "epoch": 2373} {"train_loss": -6.4976725578308105, "global_step": 99673, "epoch": 2373} {"train_loss": -6.433285236358643, "global_step": 99674, "epoch": 2373} {"train_loss": -6.3217363357543945, "global_step": 99675, "epoch": 2373} {"train_loss": -6.243632793426514, "global_step": 99676, "epoch": 2373} {"train_loss": -6.4323835372924805, "global_step": 99677, "epoch": 2373} {"train_loss": -6.346628189086914, "global_step": 99678, "epoch": 2373} {"train_loss": -6.304080486297607, "global_step": 99679, "epoch": 2373} {"train_loss": -6.3946733474731445, "global_step": 99680, "epoch": 2373} {"train_loss": -6.441250801086426, "global_step": 99681, "epoch": 2373} {"train_loss": -6.439923286437988, "global_step": 99682, "epoch": 2373} {"train_loss": -6.424132347106934, "global_step": 99683, "epoch": 2373} {"train_loss": -6.395293712615967, "global_step": 99684, "epoch": 2373} {"train_loss": -6.333106994628906, "global_step": 99685, "epoch": 2373} {"train_loss": -6.4520978927612305, "global_step": 99686, "epoch": 2373} {"train_loss": -6.323090553283691, "global_step": 99687, "epoch": 2373} {"train_loss": -6.408206939697266, "global_step": 99688, "epoch": 2373} {"train_loss": -6.39412784576416, "global_step": 99689, "epoch": 2373} {"train_loss": -6.436160087585449, "global_step": 99690, "epoch": 2373} {"train_loss": -6.315112113952637, "global_step": 99691, "epoch": 2373} {"train_loss": -6.341579437255859, "global_step": 99692, "epoch": 2373} {"train_loss": -6.432222366333008, "global_step": 99693, "epoch": 2373} {"train_loss": -6.435550689697266, "global_step": 99694, "epoch": 2373} {"train_loss": -6.308047294616699, "global_step": 99695, "epoch": 2373} {"train_loss": -6.388619422912598, "global_step": 99696, "epoch": 2373} {"train_loss": -6.302325248718262, "global_step": 99697, "epoch": 2373} {"train_loss": -6.088850975036621, "global_step": 99698, "epoch": 2373} {"train_loss": -6.435305118560791, "global_step": 99699, "epoch": 2373} {"train_loss": -6.237438201904297, "global_step": 99700, "epoch": 2373} {"train_loss": -6.3181915283203125, "global_step": 99701, "epoch": 2373} {"train_loss": -6.396548271179199, "global_step": 99702, "epoch": 2373} {"train_loss": -6.315977573394775, "global_step": 99703, "epoch": 2373} {"train_loss": -6.365556716918945, "global_step": 99704, "epoch": 2373} {"train_loss": -6.368692398071289, "global_step": 99705, "epoch": 2373} {"train_loss": -6.276678085327148, "global_step": 99706, "epoch": 2373} {"train_loss": -6.3664964607783725, "global_step": 99707, "epoch": 2373, "val_loss": 64109.296875} {"train_loss": -6.430620193481445, "global_step": 99708, "epoch": 2374} {"train_loss": -6.287215232849121, "global_step": 99709, "epoch": 2374} {"train_loss": -6.3753252029418945, "global_step": 99710, "epoch": 2374} {"train_loss": -6.257536888122559, "global_step": 99711, "epoch": 2374} {"train_loss": -6.385778427124023, "global_step": 99712, "epoch": 2374} {"train_loss": -6.3975510597229, "global_step": 99713, "epoch": 2374} {"train_loss": -6.340453624725342, "global_step": 99714, "epoch": 2374} {"train_loss": -6.257699966430664, "global_step": 99715, "epoch": 2374} {"train_loss": -6.348549842834473, "global_step": 99716, "epoch": 2374} {"train_loss": -6.418003559112549, "global_step": 99717, "epoch": 2374} {"train_loss": -6.432448387145996, "global_step": 99718, "epoch": 2374} {"train_loss": -6.373810768127441, "global_step": 99719, "epoch": 2374} {"train_loss": -6.277897834777832, "global_step": 99720, "epoch": 2374} {"train_loss": -6.326141357421875, "global_step": 99721, "epoch": 2374} {"train_loss": -6.39315128326416, "global_step": 99722, "epoch": 2374} {"train_loss": -6.398716926574707, "global_step": 99723, "epoch": 2374} {"train_loss": -6.271790981292725, "global_step": 99724, "epoch": 2374} {"train_loss": -6.383167266845703, "global_step": 99725, "epoch": 2374} {"train_loss": -6.292464256286621, "global_step": 99726, "epoch": 2374} {"train_loss": -6.339305877685547, "global_step": 99727, "epoch": 2374} {"train_loss": -6.396369457244873, "global_step": 99728, "epoch": 2374} {"train_loss": -6.299172401428223, "global_step": 99729, "epoch": 2374} {"train_loss": -6.371310234069824, "global_step": 99730, "epoch": 2374} {"train_loss": -6.250433444976807, "global_step": 99731, "epoch": 2374} {"train_loss": -6.302973747253418, "global_step": 99732, "epoch": 2374} {"train_loss": -6.303011894226074, "global_step": 99733, "epoch": 2374} {"train_loss": -6.341348648071289, "global_step": 99734, "epoch": 2374} {"train_loss": -6.2690653800964355, "global_step": 99735, "epoch": 2374} {"train_loss": -6.32015323638916, "global_step": 99736, "epoch": 2374} {"train_loss": -6.303038597106934, "global_step": 99737, "epoch": 2374} {"train_loss": -6.356770992279053, "global_step": 99738, "epoch": 2374} {"train_loss": -6.334390163421631, "global_step": 99739, "epoch": 2374} {"train_loss": -6.327567100524902, "global_step": 99740, "epoch": 2374} {"train_loss": -6.35883903503418, "global_step": 99741, "epoch": 2374} {"train_loss": -6.336480140686035, "global_step": 99742, "epoch": 2374} {"train_loss": -6.3932647705078125, "global_step": 99743, "epoch": 2374} {"train_loss": -6.353011131286621, "global_step": 99744, "epoch": 2374} {"train_loss": -6.442114353179932, "global_step": 99745, "epoch": 2374} {"train_loss": -6.483466625213623, "global_step": 99746, "epoch": 2374} {"train_loss": -6.381403923034668, "global_step": 99747, "epoch": 2374} {"train_loss": -6.366021156311035, "global_step": 99748, "epoch": 2374} {"train_loss": -6.351002522877285, "global_step": 99749, "epoch": 2374, "val_loss": 64206.796875} {"train_loss": -6.342574119567871, "global_step": 99750, "epoch": 2375} {"train_loss": -6.2711944580078125, "global_step": 99751, "epoch": 2375} {"train_loss": -6.446328163146973, "global_step": 99752, "epoch": 2375} {"train_loss": -6.358436107635498, "global_step": 99753, "epoch": 2375} {"train_loss": -6.294356822967529, "global_step": 99754, "epoch": 2375} {"train_loss": -6.3997931480407715, "global_step": 99755, "epoch": 2375} {"train_loss": -6.3662638664245605, "global_step": 99756, "epoch": 2375} {"train_loss": -6.352120399475098, "global_step": 99757, "epoch": 2375} {"train_loss": -6.3936920166015625, "global_step": 99758, "epoch": 2375} {"train_loss": -6.345545768737793, "global_step": 99759, "epoch": 2375} {"train_loss": -6.425774097442627, "global_step": 99760, "epoch": 2375} {"train_loss": -6.3514018058776855, "global_step": 99761, "epoch": 2375} {"train_loss": -6.261386871337891, "global_step": 99762, "epoch": 2375} {"train_loss": -6.252507209777832, "global_step": 99763, "epoch": 2375} {"train_loss": -6.386949062347412, "global_step": 99764, "epoch": 2375} {"train_loss": -6.372737884521484, "global_step": 99765, "epoch": 2375} {"train_loss": -6.315805435180664, "global_step": 99766, "epoch": 2375} {"train_loss": -6.344614028930664, "global_step": 99767, "epoch": 2375} {"train_loss": -6.297983169555664, "global_step": 99768, "epoch": 2375} {"train_loss": -6.375662803649902, "global_step": 99769, "epoch": 2375} {"train_loss": -6.418989658355713, "global_step": 99770, "epoch": 2375} {"train_loss": -6.484793663024902, "global_step": 99771, "epoch": 2375} {"train_loss": -6.40107536315918, "global_step": 99772, "epoch": 2375} {"train_loss": -6.408317565917969, "global_step": 99773, "epoch": 2375} {"train_loss": -6.45789098739624, "global_step": 99774, "epoch": 2375} {"train_loss": -6.318396091461182, "global_step": 99775, "epoch": 2375} {"train_loss": -6.316350936889648, "global_step": 99776, "epoch": 2375} {"train_loss": -6.393349647521973, "global_step": 99777, "epoch": 2375} {"train_loss": -6.345617294311523, "global_step": 99778, "epoch": 2375} {"train_loss": -6.49259090423584, "global_step": 99779, "epoch": 2375} {"train_loss": -6.324021339416504, "global_step": 99780, "epoch": 2375} {"train_loss": -6.446370601654053, "global_step": 99781, "epoch": 2375} {"train_loss": -6.4809722900390625, "global_step": 99782, "epoch": 2375} {"train_loss": -6.374111175537109, "global_step": 99783, "epoch": 2375} {"train_loss": -6.291323661804199, "global_step": 99784, "epoch": 2375} {"train_loss": -6.2589263916015625, "global_step": 99785, "epoch": 2375} {"train_loss": -6.340595245361328, "global_step": 99786, "epoch": 2375} {"train_loss": -6.343916416168213, "global_step": 99787, "epoch": 2375} {"train_loss": -6.316985130310059, "global_step": 99788, "epoch": 2375} {"train_loss": -6.353473663330078, "global_step": 99789, "epoch": 2375} {"train_loss": -6.208907127380371, "global_step": 99790, "epoch": 2375} {"train_loss": -6.35709361802964, "global_step": 99791, "epoch": 2375, "val_loss": 64346.07421875} {"train_loss": -6.395866870880127, "global_step": 99792, "epoch": 2376} {"train_loss": -6.323824882507324, "global_step": 99793, "epoch": 2376} {"train_loss": -6.387709617614746, "global_step": 99794, "epoch": 2376} {"train_loss": -6.347957134246826, "global_step": 99795, "epoch": 2376} {"train_loss": -6.352435111999512, "global_step": 99796, "epoch": 2376} {"train_loss": -6.329588890075684, "global_step": 99797, "epoch": 2376} {"train_loss": -6.33117151260376, "global_step": 99798, "epoch": 2376} {"train_loss": -6.3660125732421875, "global_step": 99799, "epoch": 2376} {"train_loss": -6.3800578117370605, "global_step": 99800, "epoch": 2376} {"train_loss": -6.407204627990723, "global_step": 99801, "epoch": 2376} {"train_loss": -6.344156265258789, "global_step": 99802, "epoch": 2376} {"train_loss": -6.336467742919922, "global_step": 99803, "epoch": 2376} {"train_loss": -6.429800987243652, "global_step": 99804, "epoch": 2376} {"train_loss": -6.232046127319336, "global_step": 99805, "epoch": 2376} {"train_loss": -6.271489143371582, "global_step": 99806, "epoch": 2376} {"train_loss": -6.391448497772217, "global_step": 99807, "epoch": 2376} {"train_loss": -6.334017753601074, "global_step": 99808, "epoch": 2376} {"train_loss": -6.365771293640137, "global_step": 99809, "epoch": 2376} {"train_loss": -6.24445104598999, "global_step": 99810, "epoch": 2376} {"train_loss": -6.440732002258301, "global_step": 99811, "epoch": 2376} {"train_loss": -6.367746829986572, "global_step": 99812, "epoch": 2376} {"train_loss": -6.356627464294434, "global_step": 99813, "epoch": 2376} {"train_loss": -6.323023796081543, "global_step": 99814, "epoch": 2376} {"train_loss": -6.389254570007324, "global_step": 99815, "epoch": 2376} {"train_loss": -6.349778175354004, "global_step": 99816, "epoch": 2376} {"train_loss": -6.420734405517578, "global_step": 99817, "epoch": 2376} {"train_loss": -6.486060619354248, "global_step": 99818, "epoch": 2376} {"train_loss": -6.304706573486328, "global_step": 99819, "epoch": 2376} {"train_loss": -6.461045265197754, "global_step": 99820, "epoch": 2376} {"train_loss": -6.3155412673950195, "global_step": 99821, "epoch": 2376} {"train_loss": -6.50167179107666, "global_step": 99822, "epoch": 2376} {"train_loss": -6.3711347579956055, "global_step": 99823, "epoch": 2376} {"train_loss": -6.2969465255737305, "global_step": 99824, "epoch": 2376} {"train_loss": -6.256918907165527, "global_step": 99825, "epoch": 2376} {"train_loss": -6.367592811584473, "global_step": 99826, "epoch": 2376} {"train_loss": -6.454103469848633, "global_step": 99827, "epoch": 2376} {"train_loss": -6.2926530838012695, "global_step": 99828, "epoch": 2376} {"train_loss": -6.330240249633789, "global_step": 99829, "epoch": 2376} {"train_loss": -6.267751693725586, "global_step": 99830, "epoch": 2376} {"train_loss": -6.371679306030273, "global_step": 99831, "epoch": 2376} {"train_loss": -6.317042350769043, "global_step": 99832, "epoch": 2376} {"train_loss": -6.356705688294911, "global_step": 99833, "epoch": 2376, "val_loss": 64139.1875} {"train_loss": -6.362178802490234, "global_step": 99834, "epoch": 2377} {"train_loss": -6.436954498291016, "global_step": 99835, "epoch": 2377} {"train_loss": -6.427618980407715, "global_step": 99836, "epoch": 2377} {"train_loss": -6.303410530090332, "global_step": 99837, "epoch": 2377} {"train_loss": -6.396389961242676, "global_step": 99838, "epoch": 2377} {"train_loss": -6.360372543334961, "global_step": 99839, "epoch": 2377} {"train_loss": -6.338174343109131, "global_step": 99840, "epoch": 2377} {"train_loss": -6.428045272827148, "global_step": 99841, "epoch": 2377} {"train_loss": -6.316153526306152, "global_step": 99842, "epoch": 2377} {"train_loss": -6.430019378662109, "global_step": 99843, "epoch": 2377} {"train_loss": -6.343530654907227, "global_step": 99844, "epoch": 2377} {"train_loss": -6.5150885581970215, "global_step": 99845, "epoch": 2377} {"train_loss": -6.445127487182617, "global_step": 99846, "epoch": 2377} {"train_loss": -6.54276704788208, "global_step": 99847, "epoch": 2377} {"train_loss": -6.39101505279541, "global_step": 99848, "epoch": 2377} {"train_loss": -6.4238176345825195, "global_step": 99849, "epoch": 2377} {"train_loss": -6.462084770202637, "global_step": 99850, "epoch": 2377} {"train_loss": -6.361813545227051, "global_step": 99851, "epoch": 2377} {"train_loss": -6.427458763122559, "global_step": 99852, "epoch": 2377} {"train_loss": -6.371581077575684, "global_step": 99853, "epoch": 2377} {"train_loss": -6.374427795410156, "global_step": 99854, "epoch": 2377} {"train_loss": -6.358304977416992, "global_step": 99855, "epoch": 2377} {"train_loss": -6.327001571655273, "global_step": 99856, "epoch": 2377} {"train_loss": -6.2877278327941895, "global_step": 99857, "epoch": 2377} {"train_loss": -6.407927513122559, "global_step": 99858, "epoch": 2377} {"train_loss": -6.268591403961182, "global_step": 99859, "epoch": 2377} {"train_loss": -6.344391345977783, "global_step": 99860, "epoch": 2377} {"train_loss": -6.387302398681641, "global_step": 99861, "epoch": 2377} {"train_loss": -6.368955135345459, "global_step": 99862, "epoch": 2377} {"train_loss": -6.426102638244629, "global_step": 99863, "epoch": 2377} {"train_loss": -6.350975036621094, "global_step": 99864, "epoch": 2377} {"train_loss": -6.351917266845703, "global_step": 99865, "epoch": 2377} {"train_loss": -6.4437150955200195, "global_step": 99866, "epoch": 2377} {"train_loss": -6.514995574951172, "global_step": 99867, "epoch": 2377} {"train_loss": -6.337197303771973, "global_step": 99868, "epoch": 2377} {"train_loss": -6.344283103942871, "global_step": 99869, "epoch": 2377} {"train_loss": -6.368379592895508, "global_step": 99870, "epoch": 2377} {"train_loss": -6.28397274017334, "global_step": 99871, "epoch": 2377} {"train_loss": -6.251352787017822, "global_step": 99872, "epoch": 2377} {"train_loss": -6.317035675048828, "global_step": 99873, "epoch": 2377} {"train_loss": -6.287774562835693, "global_step": 99874, "epoch": 2377} {"train_loss": -6.376045181637719, "global_step": 99875, "epoch": 2377, "val_loss": 64315.5078125} {"train_loss": -6.27173376083374, "global_step": 99876, "epoch": 2378} {"train_loss": -6.334097385406494, "global_step": 99877, "epoch": 2378} {"train_loss": -6.394507884979248, "global_step": 99878, "epoch": 2378} {"train_loss": -6.337737083435059, "global_step": 99879, "epoch": 2378} {"train_loss": -6.346064567565918, "global_step": 99880, "epoch": 2378} {"train_loss": -6.171579360961914, "global_step": 99881, "epoch": 2378} {"train_loss": -6.3721184730529785, "global_step": 99882, "epoch": 2378} {"train_loss": -6.308286666870117, "global_step": 99883, "epoch": 2378} {"train_loss": -6.227698802947998, "global_step": 99884, "epoch": 2378} {"train_loss": -6.299103736877441, "global_step": 99885, "epoch": 2378} {"train_loss": -6.168478965759277, "global_step": 99886, "epoch": 2378} {"train_loss": -6.242038726806641, "global_step": 99887, "epoch": 2378} {"train_loss": -6.449976921081543, "global_step": 99888, "epoch": 2378} {"train_loss": -6.224062919616699, "global_step": 99889, "epoch": 2378} {"train_loss": -6.267168045043945, "global_step": 99890, "epoch": 2378} {"train_loss": -6.255958557128906, "global_step": 99891, "epoch": 2378} {"train_loss": -6.154933929443359, "global_step": 99892, "epoch": 2378} {"train_loss": -6.33751106262207, "global_step": 99893, "epoch": 2378} {"train_loss": -6.3548784255981445, "global_step": 99894, "epoch": 2378} {"train_loss": -6.2190704345703125, "global_step": 99895, "epoch": 2378} {"train_loss": -6.257651329040527, "global_step": 99896, "epoch": 2378} {"train_loss": -6.245275974273682, "global_step": 99897, "epoch": 2378} {"train_loss": -6.288729667663574, "global_step": 99898, "epoch": 2378} {"train_loss": -6.309636116027832, "global_step": 99899, "epoch": 2378} {"train_loss": -6.335967540740967, "global_step": 99900, "epoch": 2378} {"train_loss": -6.276200771331787, "global_step": 99901, "epoch": 2378} {"train_loss": -6.355879783630371, "global_step": 99902, "epoch": 2378} {"train_loss": -6.509644031524658, "global_step": 99903, "epoch": 2378} {"train_loss": -6.321748733520508, "global_step": 99904, "epoch": 2378} {"train_loss": -6.333696365356445, "global_step": 99905, "epoch": 2378} {"train_loss": -6.371984958648682, "global_step": 99906, "epoch": 2378} {"train_loss": -6.523397445678711, "global_step": 99907, "epoch": 2378} {"train_loss": -6.382937431335449, "global_step": 99908, "epoch": 2378} {"train_loss": -6.359931468963623, "global_step": 99909, "epoch": 2378} {"train_loss": -6.3939971923828125, "global_step": 99910, "epoch": 2378} {"train_loss": -6.406765460968018, "global_step": 99911, "epoch": 2378} {"train_loss": -6.39858341217041, "global_step": 99912, "epoch": 2378} {"train_loss": -6.394961357116699, "global_step": 99913, "epoch": 2378} {"train_loss": -6.3140869140625, "global_step": 99914, "epoch": 2378} {"train_loss": -6.453344821929932, "global_step": 99915, "epoch": 2378} {"train_loss": -6.363153457641602, "global_step": 99916, "epoch": 2378} {"train_loss": -6.327369099571591, "global_step": 99917, "epoch": 2378, "val_loss": 64020.01953125} {"train_loss": -6.364470481872559, "global_step": 99918, "epoch": 2379} {"train_loss": -6.366846561431885, "global_step": 99919, "epoch": 2379} {"train_loss": -6.4270734786987305, "global_step": 99920, "epoch": 2379} {"train_loss": -6.438681602478027, "global_step": 99921, "epoch": 2379} {"train_loss": -6.374608993530273, "global_step": 99922, "epoch": 2379} {"train_loss": -6.382630348205566, "global_step": 99923, "epoch": 2379} {"train_loss": -6.4880571365356445, "global_step": 99924, "epoch": 2379} {"train_loss": -6.337334632873535, "global_step": 99925, "epoch": 2379} {"train_loss": -6.253311634063721, "global_step": 99926, "epoch": 2379} {"train_loss": -6.358022689819336, "global_step": 99927, "epoch": 2379} {"train_loss": -6.313991546630859, "global_step": 99928, "epoch": 2379} {"train_loss": -6.308464050292969, "global_step": 99929, "epoch": 2379} {"train_loss": -6.353708744049072, "global_step": 99930, "epoch": 2379} {"train_loss": -6.460208415985107, "global_step": 99931, "epoch": 2379} {"train_loss": -6.367274284362793, "global_step": 99932, "epoch": 2379} {"train_loss": -6.363381862640381, "global_step": 99933, "epoch": 2379} {"train_loss": -6.373716354370117, "global_step": 99934, "epoch": 2379} {"train_loss": -6.471837520599365, "global_step": 99935, "epoch": 2379} {"train_loss": -6.312136173248291, "global_step": 99936, "epoch": 2379} {"train_loss": -6.452392101287842, "global_step": 99937, "epoch": 2379} {"train_loss": -6.405202388763428, "global_step": 99938, "epoch": 2379} {"train_loss": -6.399250507354736, "global_step": 99939, "epoch": 2379} {"train_loss": -6.332178115844727, "global_step": 99940, "epoch": 2379} {"train_loss": -6.347907066345215, "global_step": 99941, "epoch": 2379} {"train_loss": -6.368640899658203, "global_step": 99942, "epoch": 2379} {"train_loss": -6.3904218673706055, "global_step": 99943, "epoch": 2379} {"train_loss": -6.19326114654541, "global_step": 99944, "epoch": 2379} {"train_loss": -6.424616813659668, "global_step": 99945, "epoch": 2379} {"train_loss": -6.454801082611084, "global_step": 99946, "epoch": 2379} {"train_loss": -6.414886474609375, "global_step": 99947, "epoch": 2379} {"train_loss": -6.342707633972168, "global_step": 99948, "epoch": 2379} {"train_loss": -6.47628116607666, "global_step": 99949, "epoch": 2379} {"train_loss": -6.322378158569336, "global_step": 99950, "epoch": 2379} {"train_loss": -6.430203437805176, "global_step": 99951, "epoch": 2379} {"train_loss": -6.377795219421387, "global_step": 99952, "epoch": 2379} {"train_loss": -6.289117813110352, "global_step": 99953, "epoch": 2379} {"train_loss": -6.369483947753906, "global_step": 99954, "epoch": 2379} {"train_loss": -6.415921211242676, "global_step": 99955, "epoch": 2379} {"train_loss": -6.394883632659912, "global_step": 99956, "epoch": 2379} {"train_loss": -6.385323524475098, "global_step": 99957, "epoch": 2379} {"train_loss": -6.44486141204834, "global_step": 99958, "epoch": 2379} {"train_loss": -6.380159514290946, "global_step": 99959, "epoch": 2379, "val_loss": 63956.37109375} {"train_loss": -6.381847381591797, "global_step": 99960, "epoch": 2380} {"train_loss": -6.409800052642822, "global_step": 99961, "epoch": 2380} {"train_loss": -6.365670204162598, "global_step": 99962, "epoch": 2380} {"train_loss": -6.371535301208496, "global_step": 99963, "epoch": 2380} {"train_loss": -6.335546493530273, "global_step": 99964, "epoch": 2380} {"train_loss": -6.347609519958496, "global_step": 99965, "epoch": 2380} {"train_loss": -6.215413570404053, "global_step": 99966, "epoch": 2380} {"train_loss": -6.323948860168457, "global_step": 99967, "epoch": 2380} {"train_loss": -6.200613975524902, "global_step": 99968, "epoch": 2380} {"train_loss": -6.29551362991333, "global_step": 99969, "epoch": 2380} {"train_loss": -6.487028121948242, "global_step": 99970, "epoch": 2380} {"train_loss": -6.419967174530029, "global_step": 99971, "epoch": 2380} {"train_loss": -6.252529621124268, "global_step": 99972, "epoch": 2380} {"train_loss": -6.413686752319336, "global_step": 99973, "epoch": 2380} {"train_loss": -6.411680221557617, "global_step": 99974, "epoch": 2380} {"train_loss": -6.370163440704346, "global_step": 99975, "epoch": 2380} {"train_loss": -6.418032646179199, "global_step": 99976, "epoch": 2380} {"train_loss": -6.364819526672363, "global_step": 99977, "epoch": 2380} {"train_loss": -6.3506975173950195, "global_step": 99978, "epoch": 2380} {"train_loss": -6.306661128997803, "global_step": 99979, "epoch": 2380} {"train_loss": -6.193704605102539, "global_step": 99980, "epoch": 2380} {"train_loss": -6.2990803718566895, "global_step": 99981, "epoch": 2380} {"train_loss": -6.38205099105835, "global_step": 99982, "epoch": 2380} {"train_loss": -6.282626152038574, "global_step": 99983, "epoch": 2380} {"train_loss": -6.317166328430176, "global_step": 99984, "epoch": 2380} {"train_loss": -6.3164777755737305, "global_step": 99985, "epoch": 2380} {"train_loss": -6.39777946472168, "global_step": 99986, "epoch": 2380} {"train_loss": -6.295772552490234, "global_step": 99987, "epoch": 2380} {"train_loss": -6.168615818023682, "global_step": 99988, "epoch": 2380} {"train_loss": -6.303279399871826, "global_step": 99989, "epoch": 2380} {"train_loss": -6.231348037719727, "global_step": 99990, "epoch": 2380} {"train_loss": -6.433582305908203, "global_step": 99991, "epoch": 2380} {"train_loss": -6.246397972106934, "global_step": 99992, "epoch": 2380} {"train_loss": -6.321557998657227, "global_step": 99993, "epoch": 2380} {"train_loss": -6.246334552764893, "global_step": 99994, "epoch": 2380} {"train_loss": -6.230269432067871, "global_step": 99995, "epoch": 2380} {"train_loss": -6.327291488647461, "global_step": 99996, "epoch": 2380} {"train_loss": -6.3198137283325195, "global_step": 99997, "epoch": 2380} {"train_loss": -6.31986141204834, "global_step": 99998, "epoch": 2380} {"train_loss": -6.326589584350586, "global_step": 99999, "epoch": 2380} {"train_loss": -6.422978401184082, "global_step": 100000, "epoch": 2380} {"train_loss": -6.328184752237229, "global_step": 100001, "epoch": 2380, "val_loss": 63922.109375} {"train_loss": -6.379781723022461, "global_step": 100002, "epoch": 2381} {"train_loss": -6.249258995056152, "global_step": 100003, "epoch": 2381} {"train_loss": -6.293455123901367, "global_step": 100004, "epoch": 2381} {"train_loss": -6.301064491271973, "global_step": 100005, "epoch": 2381} {"train_loss": -6.450863838195801, "global_step": 100006, "epoch": 2381} {"train_loss": -6.363773345947266, "global_step": 100007, "epoch": 2381} {"train_loss": -6.394008159637451, "global_step": 100008, "epoch": 2381} {"train_loss": -6.411843299865723, "global_step": 100009, "epoch": 2381} {"train_loss": -6.409646034240723, "global_step": 100010, "epoch": 2381} {"train_loss": -6.48782205581665, "global_step": 100011, "epoch": 2381} {"train_loss": -6.434116363525391, "global_step": 100012, "epoch": 2381} {"train_loss": -6.513375759124756, "global_step": 100013, "epoch": 2381} {"train_loss": -6.397040367126465, "global_step": 100014, "epoch": 2381} {"train_loss": -6.295859336853027, "global_step": 100015, "epoch": 2381} {"train_loss": -6.237974166870117, "global_step": 100016, "epoch": 2381} {"train_loss": -6.275676727294922, "global_step": 100017, "epoch": 2381} {"train_loss": -6.3245673179626465, "global_step": 100018, "epoch": 2381} {"train_loss": -6.349978446960449, "global_step": 100019, "epoch": 2381} {"train_loss": -6.326351642608643, "global_step": 100020, "epoch": 2381} {"train_loss": -6.451388359069824, "global_step": 100021, "epoch": 2381} {"train_loss": -6.410998344421387, "global_step": 100022, "epoch": 2381} {"train_loss": -6.254850387573242, "global_step": 100023, "epoch": 2381} {"train_loss": -6.275253772735596, "global_step": 100024, "epoch": 2381} {"train_loss": -6.356888771057129, "global_step": 100025, "epoch": 2381} {"train_loss": -6.2762627601623535, "global_step": 100026, "epoch": 2381} {"train_loss": -6.255495071411133, "global_step": 100027, "epoch": 2381} {"train_loss": -6.284347057342529, "global_step": 100028, "epoch": 2381} {"train_loss": -6.2508225440979, "global_step": 100029, "epoch": 2381} {"train_loss": -6.324845314025879, "global_step": 100030, "epoch": 2381} {"train_loss": -6.445205211639404, "global_step": 100031, "epoch": 2381} {"train_loss": -6.26485013961792, "global_step": 100032, "epoch": 2381} {"train_loss": -6.5017194747924805, "global_step": 100033, "epoch": 2381} {"train_loss": -6.288384437561035, "global_step": 100034, "epoch": 2381} {"train_loss": -6.353997230529785, "global_step": 100035, "epoch": 2381} {"train_loss": -6.397706985473633, "global_step": 100036, "epoch": 2381} {"train_loss": -6.420106410980225, "global_step": 100037, "epoch": 2381} {"train_loss": -6.404753684997559, "global_step": 100038, "epoch": 2381} {"train_loss": -6.2992143630981445, "global_step": 100039, "epoch": 2381} {"train_loss": -6.209959030151367, "global_step": 100040, "epoch": 2381} {"train_loss": -6.442407131195068, "global_step": 100041, "epoch": 2381} {"train_loss": -6.344831466674805, "global_step": 100042, "epoch": 2381} {"train_loss": -6.350957654771351, "global_step": 100043, "epoch": 2381, "val_loss": 64047.6171875} {"train_loss": -6.4150614738464355, "global_step": 100044, "epoch": 2382} {"train_loss": -6.2306718826293945, "global_step": 100045, "epoch": 2382} {"train_loss": -6.448681831359863, "global_step": 100046, "epoch": 2382} {"train_loss": -6.248347759246826, "global_step": 100047, "epoch": 2382} {"train_loss": -6.45947265625, "global_step": 100048, "epoch": 2382} {"train_loss": -6.30853271484375, "global_step": 100049, "epoch": 2382} {"train_loss": -6.403791427612305, "global_step": 100050, "epoch": 2382} {"train_loss": -6.410398483276367, "global_step": 100051, "epoch": 2382} {"train_loss": -6.411687850952148, "global_step": 100052, "epoch": 2382} {"train_loss": -6.339653968811035, "global_step": 100053, "epoch": 2382} {"train_loss": -6.437445640563965, "global_step": 100054, "epoch": 2382} {"train_loss": -6.32124137878418, "global_step": 100055, "epoch": 2382} {"train_loss": -6.342604637145996, "global_step": 100056, "epoch": 2382} {"train_loss": -6.280671119689941, "global_step": 100057, "epoch": 2382} {"train_loss": -6.434137344360352, "global_step": 100058, "epoch": 2382} {"train_loss": -6.3623857498168945, "global_step": 100059, "epoch": 2382} {"train_loss": -6.323146820068359, "global_step": 100060, "epoch": 2382} {"train_loss": -6.345104217529297, "global_step": 100061, "epoch": 2382} {"train_loss": -6.253237724304199, "global_step": 100062, "epoch": 2382} {"train_loss": -6.2973175048828125, "global_step": 100063, "epoch": 2382} {"train_loss": -6.260499000549316, "global_step": 100064, "epoch": 2382} {"train_loss": -6.247727394104004, "global_step": 100065, "epoch": 2382} {"train_loss": -6.245509147644043, "global_step": 100066, "epoch": 2382} {"train_loss": -6.265149116516113, "global_step": 100067, "epoch": 2382} {"train_loss": -6.241670608520508, "global_step": 100068, "epoch": 2382} {"train_loss": -6.32196044921875, "global_step": 100069, "epoch": 2382} {"train_loss": -6.048464298248291, "global_step": 100070, "epoch": 2382} {"train_loss": -6.44952917098999, "global_step": 100071, "epoch": 2382} {"train_loss": -6.264350891113281, "global_step": 100072, "epoch": 2382} {"train_loss": -6.2826762199401855, "global_step": 100073, "epoch": 2382} {"train_loss": -6.33203125, "global_step": 100074, "epoch": 2382} {"train_loss": -6.384433746337891, "global_step": 100075, "epoch": 2382} {"train_loss": -6.322948932647705, "global_step": 100076, "epoch": 2382} {"train_loss": -6.296770095825195, "global_step": 100077, "epoch": 2382} {"train_loss": -6.313138961791992, "global_step": 100078, "epoch": 2382} {"train_loss": -6.438652992248535, "global_step": 100079, "epoch": 2382} {"train_loss": -6.3241119384765625, "global_step": 100080, "epoch": 2382} {"train_loss": -6.338733673095703, "global_step": 100081, "epoch": 2382} {"train_loss": -6.319720268249512, "global_step": 100082, "epoch": 2382} {"train_loss": -6.319645404815674, "global_step": 100083, "epoch": 2382} {"train_loss": -6.392552852630615, "global_step": 100084, "epoch": 2382} {"train_loss": -6.328360739208403, "global_step": 100085, "epoch": 2382, "val_loss": 64156.34375} {"train_loss": -6.367265701293945, "global_step": 100086, "epoch": 2383} {"train_loss": -6.2604475021362305, "global_step": 100087, "epoch": 2383} {"train_loss": -6.26115608215332, "global_step": 100088, "epoch": 2383} {"train_loss": -6.436635971069336, "global_step": 100089, "epoch": 2383} {"train_loss": -6.206625938415527, "global_step": 100090, "epoch": 2383} {"train_loss": -6.267241954803467, "global_step": 100091, "epoch": 2383} {"train_loss": -6.361106872558594, "global_step": 100092, "epoch": 2383} {"train_loss": -6.264893054962158, "global_step": 100093, "epoch": 2383} {"train_loss": -6.348080158233643, "global_step": 100094, "epoch": 2383} {"train_loss": -6.314455032348633, "global_step": 100095, "epoch": 2383} {"train_loss": -6.331623077392578, "global_step": 100096, "epoch": 2383} {"train_loss": -6.347552299499512, "global_step": 100097, "epoch": 2383} {"train_loss": -6.357516288757324, "global_step": 100098, "epoch": 2383} {"train_loss": -6.313892364501953, "global_step": 100099, "epoch": 2383} {"train_loss": -6.471697807312012, "global_step": 100100, "epoch": 2383} {"train_loss": -6.249146461486816, "global_step": 100101, "epoch": 2383} {"train_loss": -6.269893169403076, "global_step": 100102, "epoch": 2383} {"train_loss": -6.332244873046875, "global_step": 100103, "epoch": 2383} {"train_loss": -6.282194137573242, "global_step": 100104, "epoch": 2383} {"train_loss": -6.481276035308838, "global_step": 100105, "epoch": 2383} {"train_loss": -6.440709114074707, "global_step": 100106, "epoch": 2383} {"train_loss": -6.305244445800781, "global_step": 100107, "epoch": 2383} {"train_loss": -6.232617378234863, "global_step": 100108, "epoch": 2383} {"train_loss": -6.329302787780762, "global_step": 100109, "epoch": 2383} {"train_loss": -6.2727227210998535, "global_step": 100110, "epoch": 2383} {"train_loss": -6.320473670959473, "global_step": 100111, "epoch": 2383} {"train_loss": -6.379511833190918, "global_step": 100112, "epoch": 2383} {"train_loss": -6.257350921630859, "global_step": 100113, "epoch": 2383} {"train_loss": -6.324657440185547, "global_step": 100114, "epoch": 2383} {"train_loss": -6.29189395904541, "global_step": 100115, "epoch": 2383} {"train_loss": -6.322980880737305, "global_step": 100116, "epoch": 2383} {"train_loss": -6.344246864318848, "global_step": 100117, "epoch": 2383} {"train_loss": -6.267940521240234, "global_step": 100118, "epoch": 2383} {"train_loss": -6.278355598449707, "global_step": 100119, "epoch": 2383} {"train_loss": -6.451830863952637, "global_step": 100120, "epoch": 2383} {"train_loss": -6.311875820159912, "global_step": 100121, "epoch": 2383} {"train_loss": -6.260947227478027, "global_step": 100122, "epoch": 2383} {"train_loss": -6.255377769470215, "global_step": 100123, "epoch": 2383} {"train_loss": -6.276918411254883, "global_step": 100124, "epoch": 2383} {"train_loss": -6.239615440368652, "global_step": 100125, "epoch": 2383} {"train_loss": -6.217495918273926, "global_step": 100126, "epoch": 2383} {"train_loss": -6.314778804779053, "global_step": 100127, "epoch": 2383, "val_loss": 64056.4921875} {"train_loss": -6.2576704025268555, "global_step": 100128, "epoch": 2384} {"train_loss": -6.296267509460449, "global_step": 100129, "epoch": 2384} {"train_loss": -6.329148769378662, "global_step": 100130, "epoch": 2384} {"train_loss": -6.283023834228516, "global_step": 100131, "epoch": 2384} {"train_loss": -6.361981391906738, "global_step": 100132, "epoch": 2384} {"train_loss": -6.410633087158203, "global_step": 100133, "epoch": 2384} {"train_loss": -6.421891689300537, "global_step": 100134, "epoch": 2384} {"train_loss": -6.507716178894043, "global_step": 100135, "epoch": 2384} {"train_loss": -6.303317546844482, "global_step": 100136, "epoch": 2384} {"train_loss": -6.417359352111816, "global_step": 100137, "epoch": 2384} {"train_loss": -6.389992713928223, "global_step": 100138, "epoch": 2384} {"train_loss": -6.3092803955078125, "global_step": 100139, "epoch": 2384} {"train_loss": -6.375457286834717, "global_step": 100140, "epoch": 2384} {"train_loss": -6.338623046875, "global_step": 100141, "epoch": 2384} {"train_loss": -6.4733052253723145, "global_step": 100142, "epoch": 2384} {"train_loss": -6.429110527038574, "global_step": 100143, "epoch": 2384} {"train_loss": -6.328118324279785, "global_step": 100144, "epoch": 2384} {"train_loss": -6.285887718200684, "global_step": 100145, "epoch": 2384} {"train_loss": -6.301743507385254, "global_step": 100146, "epoch": 2384} {"train_loss": -6.279275417327881, "global_step": 100147, "epoch": 2384} {"train_loss": -6.37607479095459, "global_step": 100148, "epoch": 2384} {"train_loss": -6.295856952667236, "global_step": 100149, "epoch": 2384} {"train_loss": -6.406853675842285, "global_step": 100150, "epoch": 2384} {"train_loss": -6.281939506530762, "global_step": 100151, "epoch": 2384} {"train_loss": -6.310473442077637, "global_step": 100152, "epoch": 2384} {"train_loss": -6.403722763061523, "global_step": 100153, "epoch": 2384} {"train_loss": -6.366693019866943, "global_step": 100154, "epoch": 2384} {"train_loss": -6.305405616760254, "global_step": 100155, "epoch": 2384} {"train_loss": -6.375552654266357, "global_step": 100156, "epoch": 2384} {"train_loss": -6.473038673400879, "global_step": 100157, "epoch": 2384} {"train_loss": -6.3211212158203125, "global_step": 100158, "epoch": 2384} {"train_loss": -6.317178726196289, "global_step": 100159, "epoch": 2384} {"train_loss": -6.260446071624756, "global_step": 100160, "epoch": 2384} {"train_loss": -6.434634208679199, "global_step": 100161, "epoch": 2384} {"train_loss": -6.36269998550415, "global_step": 100162, "epoch": 2384} {"train_loss": -6.368076324462891, "global_step": 100163, "epoch": 2384} {"train_loss": -6.331230640411377, "global_step": 100164, "epoch": 2384} {"train_loss": -6.412598609924316, "global_step": 100165, "epoch": 2384} {"train_loss": -6.309298515319824, "global_step": 100166, "epoch": 2384} {"train_loss": -6.355720520019531, "global_step": 100167, "epoch": 2384} {"train_loss": -6.4632368087768555, "global_step": 100168, "epoch": 2384} {"train_loss": -6.356853848411923, "global_step": 100169, "epoch": 2384, "val_loss": 64133.9375} {"train_loss": -6.3485236167907715, "global_step": 100170, "epoch": 2385} {"train_loss": -6.4120988845825195, "global_step": 100171, "epoch": 2385} {"train_loss": -6.395362854003906, "global_step": 100172, "epoch": 2385} {"train_loss": -6.310962677001953, "global_step": 100173, "epoch": 2385} {"train_loss": -6.302065849304199, "global_step": 100174, "epoch": 2385} {"train_loss": -6.41719388961792, "global_step": 100175, "epoch": 2385} {"train_loss": -6.413926124572754, "global_step": 100176, "epoch": 2385} {"train_loss": -6.341867446899414, "global_step": 100177, "epoch": 2385} {"train_loss": -6.382843971252441, "global_step": 100178, "epoch": 2385} {"train_loss": -6.4222564697265625, "global_step": 100179, "epoch": 2385} {"train_loss": -6.388117790222168, "global_step": 100180, "epoch": 2385} {"train_loss": -6.442690849304199, "global_step": 100181, "epoch": 2385} {"train_loss": -6.40953254699707, "global_step": 100182, "epoch": 2385} {"train_loss": -6.272418022155762, "global_step": 100183, "epoch": 2385} {"train_loss": -6.342379093170166, "global_step": 100184, "epoch": 2385} {"train_loss": -6.497087478637695, "global_step": 100185, "epoch": 2385} {"train_loss": -6.371789932250977, "global_step": 100186, "epoch": 2385} {"train_loss": -6.359379768371582, "global_step": 100187, "epoch": 2385} {"train_loss": -6.4012250900268555, "global_step": 100188, "epoch": 2385} {"train_loss": -6.399350166320801, "global_step": 100189, "epoch": 2385} {"train_loss": -6.419907569885254, "global_step": 100190, "epoch": 2385} {"train_loss": -6.329930305480957, "global_step": 100191, "epoch": 2385} {"train_loss": -6.240408897399902, "global_step": 100192, "epoch": 2385} {"train_loss": -6.4637274742126465, "global_step": 100193, "epoch": 2385} {"train_loss": -6.407243728637695, "global_step": 100194, "epoch": 2385} {"train_loss": -6.353849411010742, "global_step": 100195, "epoch": 2385} {"train_loss": -6.428219318389893, "global_step": 100196, "epoch": 2385} {"train_loss": -6.301487445831299, "global_step": 100197, "epoch": 2385} {"train_loss": -6.364950180053711, "global_step": 100198, "epoch": 2385} {"train_loss": -6.221911430358887, "global_step": 100199, "epoch": 2385} {"train_loss": -6.355083465576172, "global_step": 100200, "epoch": 2385} {"train_loss": -6.281412124633789, "global_step": 100201, "epoch": 2385} {"train_loss": -6.378530979156494, "global_step": 100202, "epoch": 2385} {"train_loss": -6.37966251373291, "global_step": 100203, "epoch": 2385} {"train_loss": -6.385625839233398, "global_step": 100204, "epoch": 2385} {"train_loss": -6.445396423339844, "global_step": 100205, "epoch": 2385} {"train_loss": -6.408539772033691, "global_step": 100206, "epoch": 2385} {"train_loss": -6.289249420166016, "global_step": 100207, "epoch": 2385} {"train_loss": -6.447991371154785, "global_step": 100208, "epoch": 2385} {"train_loss": -6.3379693031311035, "global_step": 100209, "epoch": 2385} {"train_loss": -6.390323638916016, "global_step": 100210, "epoch": 2385} {"train_loss": -6.370772077923729, "global_step": 100211, "epoch": 2385, "val_loss": 64016.76953125} {"train_loss": -6.3607892990112305, "global_step": 100212, "epoch": 2386} {"train_loss": -6.3699517250061035, "global_step": 100213, "epoch": 2386} {"train_loss": -6.40048360824585, "global_step": 100214, "epoch": 2386} {"train_loss": -6.444563865661621, "global_step": 100215, "epoch": 2386} {"train_loss": -6.427910804748535, "global_step": 100216, "epoch": 2386} {"train_loss": -6.406006336212158, "global_step": 100217, "epoch": 2386} {"train_loss": -6.347954273223877, "global_step": 100218, "epoch": 2386} {"train_loss": -6.507693290710449, "global_step": 100219, "epoch": 2386} {"train_loss": -6.454379558563232, "global_step": 100220, "epoch": 2386} {"train_loss": -6.354386329650879, "global_step": 100221, "epoch": 2386} {"train_loss": -6.324535369873047, "global_step": 100222, "epoch": 2386} {"train_loss": -6.4823384284973145, "global_step": 100223, "epoch": 2386} {"train_loss": -6.394940376281738, "global_step": 100224, "epoch": 2386} {"train_loss": -6.5021653175354, "global_step": 100225, "epoch": 2386} {"train_loss": -6.237600803375244, "global_step": 100226, "epoch": 2386} {"train_loss": -6.3380351066589355, "global_step": 100227, "epoch": 2386} {"train_loss": -6.483280181884766, "global_step": 100228, "epoch": 2386} {"train_loss": -6.323977947235107, "global_step": 100229, "epoch": 2386} {"train_loss": -6.284128189086914, "global_step": 100230, "epoch": 2386} {"train_loss": -6.496263027191162, "global_step": 100231, "epoch": 2386} {"train_loss": -6.380560874938965, "global_step": 100232, "epoch": 2386} {"train_loss": -6.266233444213867, "global_step": 100233, "epoch": 2386} {"train_loss": -6.436918258666992, "global_step": 100234, "epoch": 2386} {"train_loss": -6.407008647918701, "global_step": 100235, "epoch": 2386} {"train_loss": -6.33366060256958, "global_step": 100236, "epoch": 2386} {"train_loss": -6.316235065460205, "global_step": 100237, "epoch": 2386} {"train_loss": -6.212147235870361, "global_step": 100238, "epoch": 2386} {"train_loss": -6.411738872528076, "global_step": 100239, "epoch": 2386} {"train_loss": -6.416575908660889, "global_step": 100240, "epoch": 2386} {"train_loss": -6.43796443939209, "global_step": 100241, "epoch": 2386} {"train_loss": -6.34785795211792, "global_step": 100242, "epoch": 2386} {"train_loss": -6.339173316955566, "global_step": 100243, "epoch": 2386} {"train_loss": -6.369602680206299, "global_step": 100244, "epoch": 2386} {"train_loss": -6.268453598022461, "global_step": 100245, "epoch": 2386} {"train_loss": -6.2896270751953125, "global_step": 100246, "epoch": 2386} {"train_loss": -6.432071208953857, "global_step": 100247, "epoch": 2386} {"train_loss": -6.310523986816406, "global_step": 100248, "epoch": 2386} {"train_loss": -6.363068580627441, "global_step": 100249, "epoch": 2386} {"train_loss": -6.433612823486328, "global_step": 100250, "epoch": 2386} {"train_loss": -6.302487373352051, "global_step": 100251, "epoch": 2386} {"train_loss": -6.375193119049072, "global_step": 100252, "epoch": 2386} {"train_loss": -6.372219914481754, "global_step": 100253, "epoch": 2386, "val_loss": 64195.0546875} {"train_loss": -6.438302040100098, "global_step": 100254, "epoch": 2387} {"train_loss": -6.286667823791504, "global_step": 100255, "epoch": 2387} {"train_loss": -6.224851131439209, "global_step": 100256, "epoch": 2387} {"train_loss": -6.439715385437012, "global_step": 100257, "epoch": 2387} {"train_loss": -6.286474227905273, "global_step": 100258, "epoch": 2387} {"train_loss": -6.418944835662842, "global_step": 100259, "epoch": 2387} {"train_loss": -6.283780574798584, "global_step": 100260, "epoch": 2387} {"train_loss": -6.250258922576904, "global_step": 100261, "epoch": 2387} {"train_loss": -6.293749809265137, "global_step": 100262, "epoch": 2387} {"train_loss": -6.451555252075195, "global_step": 100263, "epoch": 2387} {"train_loss": -6.341752529144287, "global_step": 100264, "epoch": 2387} {"train_loss": -6.380906105041504, "global_step": 100265, "epoch": 2387} {"train_loss": -6.320690155029297, "global_step": 100266, "epoch": 2387} {"train_loss": -6.3681182861328125, "global_step": 100267, "epoch": 2387} {"train_loss": -6.316795349121094, "global_step": 100268, "epoch": 2387} {"train_loss": -6.416160583496094, "global_step": 100269, "epoch": 2387} {"train_loss": -6.441135406494141, "global_step": 100270, "epoch": 2387} {"train_loss": -6.381772518157959, "global_step": 100271, "epoch": 2387} {"train_loss": -6.369490146636963, "global_step": 100272, "epoch": 2387} {"train_loss": -6.369612693786621, "global_step": 100273, "epoch": 2387} {"train_loss": -6.471738815307617, "global_step": 100274, "epoch": 2387} {"train_loss": -6.507332801818848, "global_step": 100275, "epoch": 2387} {"train_loss": -6.477227210998535, "global_step": 100276, "epoch": 2387} {"train_loss": -6.442142486572266, "global_step": 100277, "epoch": 2387} {"train_loss": -6.286999225616455, "global_step": 100278, "epoch": 2387} {"train_loss": -6.469141960144043, "global_step": 100279, "epoch": 2387} {"train_loss": -6.384241580963135, "global_step": 100280, "epoch": 2387} {"train_loss": -6.349682807922363, "global_step": 100281, "epoch": 2387} {"train_loss": -6.47203254699707, "global_step": 100282, "epoch": 2387} {"train_loss": -6.329404830932617, "global_step": 100283, "epoch": 2387} {"train_loss": -6.424239158630371, "global_step": 100284, "epoch": 2387} {"train_loss": -6.3637566566467285, "global_step": 100285, "epoch": 2387} {"train_loss": -6.226024627685547, "global_step": 100286, "epoch": 2387} {"train_loss": -6.3117899894714355, "global_step": 100287, "epoch": 2387} {"train_loss": -6.4084153175354, "global_step": 100288, "epoch": 2387} {"train_loss": -6.458274841308594, "global_step": 100289, "epoch": 2387} {"train_loss": -6.374419212341309, "global_step": 100290, "epoch": 2387} {"train_loss": -6.46065616607666, "global_step": 100291, "epoch": 2387} {"train_loss": -6.240206718444824, "global_step": 100292, "epoch": 2387} {"train_loss": -6.440194606781006, "global_step": 100293, "epoch": 2387} {"train_loss": -6.350522994995117, "global_step": 100294, "epoch": 2387} {"train_loss": -6.373925526936849, "global_step": 100295, "epoch": 2387, "val_loss": 64155.08203125} {"train_loss": -6.342840194702148, "global_step": 100296, "epoch": 2388} {"train_loss": -6.247115135192871, "global_step": 100297, "epoch": 2388} {"train_loss": -6.3771514892578125, "global_step": 100298, "epoch": 2388} {"train_loss": -6.365105152130127, "global_step": 100299, "epoch": 2388} {"train_loss": -6.524362087249756, "global_step": 100300, "epoch": 2388} {"train_loss": -6.385869026184082, "global_step": 100301, "epoch": 2388} {"train_loss": -6.362083911895752, "global_step": 100302, "epoch": 2388} {"train_loss": -6.4409499168396, "global_step": 100303, "epoch": 2388} {"train_loss": -6.40345573425293, "global_step": 100304, "epoch": 2388} {"train_loss": -6.3250017166137695, "global_step": 100305, "epoch": 2388} {"train_loss": -6.517263412475586, "global_step": 100306, "epoch": 2388} {"train_loss": -6.29424524307251, "global_step": 100307, "epoch": 2388} {"train_loss": -6.407783031463623, "global_step": 100308, "epoch": 2388} {"train_loss": -6.496710777282715, "global_step": 100309, "epoch": 2388} {"train_loss": -6.536172389984131, "global_step": 100310, "epoch": 2388} {"train_loss": -6.424684047698975, "global_step": 100311, "epoch": 2388} {"train_loss": -6.3868408203125, "global_step": 100312, "epoch": 2388} {"train_loss": -6.470154285430908, "global_step": 100313, "epoch": 2388} {"train_loss": -6.327445983886719, "global_step": 100314, "epoch": 2388} {"train_loss": -6.464944839477539, "global_step": 100315, "epoch": 2388} {"train_loss": -6.435915946960449, "global_step": 100316, "epoch": 2388} {"train_loss": -6.426120281219482, "global_step": 100317, "epoch": 2388} {"train_loss": -6.4883131980896, "global_step": 100318, "epoch": 2388} {"train_loss": -6.485716342926025, "global_step": 100319, "epoch": 2388} {"train_loss": -6.278680324554443, "global_step": 100320, "epoch": 2388} {"train_loss": -6.372031211853027, "global_step": 100321, "epoch": 2388} {"train_loss": -6.372561454772949, "global_step": 100322, "epoch": 2388} {"train_loss": -6.401004314422607, "global_step": 100323, "epoch": 2388} {"train_loss": -6.345905303955078, "global_step": 100324, "epoch": 2388} {"train_loss": -6.2643537521362305, "global_step": 100325, "epoch": 2388} {"train_loss": -6.350153923034668, "global_step": 100326, "epoch": 2388} {"train_loss": -6.536755561828613, "global_step": 100327, "epoch": 2388} {"train_loss": -6.3756866455078125, "global_step": 100328, "epoch": 2388} {"train_loss": -6.35925817489624, "global_step": 100329, "epoch": 2388} {"train_loss": -6.446402549743652, "global_step": 100330, "epoch": 2388} {"train_loss": -6.391565322875977, "global_step": 100331, "epoch": 2388} {"train_loss": -6.381078720092773, "global_step": 100332, "epoch": 2388} {"train_loss": -6.423871040344238, "global_step": 100333, "epoch": 2388} {"train_loss": -6.345357418060303, "global_step": 100334, "epoch": 2388} {"train_loss": -6.32161808013916, "global_step": 100335, "epoch": 2388} {"train_loss": -6.319512367248535, "global_step": 100336, "epoch": 2388} {"train_loss": -6.393992344538371, "global_step": 100337, "epoch": 2388, "val_loss": 64094.9609375} {"train_loss": -6.356468677520752, "global_step": 100338, "epoch": 2389} {"train_loss": -6.323920726776123, "global_step": 100339, "epoch": 2389} {"train_loss": -6.293983459472656, "global_step": 100340, "epoch": 2389} {"train_loss": -6.440004348754883, "global_step": 100341, "epoch": 2389} {"train_loss": -6.359763145446777, "global_step": 100342, "epoch": 2389} {"train_loss": -6.423266410827637, "global_step": 100343, "epoch": 2389} {"train_loss": -6.366838455200195, "global_step": 100344, "epoch": 2389} {"train_loss": -6.373076915740967, "global_step": 100345, "epoch": 2389} {"train_loss": -6.3288726806640625, "global_step": 100346, "epoch": 2389} {"train_loss": -6.510487079620361, "global_step": 100347, "epoch": 2389} {"train_loss": -6.3318891525268555, "global_step": 100348, "epoch": 2389} {"train_loss": -6.348248481750488, "global_step": 100349, "epoch": 2389} {"train_loss": -6.45296573638916, "global_step": 100350, "epoch": 2389} {"train_loss": -6.31402587890625, "global_step": 100351, "epoch": 2389} {"train_loss": -6.3490400314331055, "global_step": 100352, "epoch": 2389} {"train_loss": -6.53118371963501, "global_step": 100353, "epoch": 2389} {"train_loss": -6.417956352233887, "global_step": 100354, "epoch": 2389} {"train_loss": -6.430999279022217, "global_step": 100355, "epoch": 2389} {"train_loss": -6.407496452331543, "global_step": 100356, "epoch": 2389} {"train_loss": -6.244706153869629, "global_step": 100357, "epoch": 2389} {"train_loss": -6.3927412033081055, "global_step": 100358, "epoch": 2389} {"train_loss": -6.24793815612793, "global_step": 100359, "epoch": 2389} {"train_loss": -6.437807559967041, "global_step": 100360, "epoch": 2389} {"train_loss": -6.429930686950684, "global_step": 100361, "epoch": 2389} {"train_loss": -6.346922874450684, "global_step": 100362, "epoch": 2389} {"train_loss": -6.325937747955322, "global_step": 100363, "epoch": 2389} {"train_loss": -6.289322853088379, "global_step": 100364, "epoch": 2389} {"train_loss": -6.398143291473389, "global_step": 100365, "epoch": 2389} {"train_loss": -6.363185882568359, "global_step": 100366, "epoch": 2389} {"train_loss": -6.384293079376221, "global_step": 100367, "epoch": 2389} {"train_loss": -6.334863662719727, "global_step": 100368, "epoch": 2389} {"train_loss": -6.277122497558594, "global_step": 100369, "epoch": 2389} {"train_loss": -6.3454132080078125, "global_step": 100370, "epoch": 2389} {"train_loss": -6.3021955490112305, "global_step": 100371, "epoch": 2389} {"train_loss": -6.297695159912109, "global_step": 100372, "epoch": 2389} {"train_loss": -6.344207763671875, "global_step": 100373, "epoch": 2389} {"train_loss": -6.320022106170654, "global_step": 100374, "epoch": 2389} {"train_loss": -6.403936862945557, "global_step": 100375, "epoch": 2389} {"train_loss": -6.430748462677002, "global_step": 100376, "epoch": 2389} {"train_loss": -6.2540106773376465, "global_step": 100377, "epoch": 2389} {"train_loss": -6.41523551940918, "global_step": 100378, "epoch": 2389} {"train_loss": -6.364087116150629, "global_step": 100379, "epoch": 2389, "val_loss": 64110.86328125} {"train_loss": -6.405237197875977, "global_step": 100380, "epoch": 2390} {"train_loss": -6.316159248352051, "global_step": 100381, "epoch": 2390} {"train_loss": -6.269559860229492, "global_step": 100382, "epoch": 2390} {"train_loss": -6.290728569030762, "global_step": 100383, "epoch": 2390} {"train_loss": -6.34588623046875, "global_step": 100384, "epoch": 2390} {"train_loss": -6.280055522918701, "global_step": 100385, "epoch": 2390} {"train_loss": -6.266190052032471, "global_step": 100386, "epoch": 2390} {"train_loss": -6.439270496368408, "global_step": 100387, "epoch": 2390} {"train_loss": -6.355936050415039, "global_step": 100388, "epoch": 2390} {"train_loss": -6.384897232055664, "global_step": 100389, "epoch": 2390} {"train_loss": -6.3039960861206055, "global_step": 100390, "epoch": 2390} {"train_loss": -6.401844024658203, "global_step": 100391, "epoch": 2390} {"train_loss": -6.294793605804443, "global_step": 100392, "epoch": 2390} {"train_loss": -6.295329570770264, "global_step": 100393, "epoch": 2390} {"train_loss": -6.391518592834473, "global_step": 100394, "epoch": 2390} {"train_loss": -6.36521053314209, "global_step": 100395, "epoch": 2390} {"train_loss": -6.363612174987793, "global_step": 100396, "epoch": 2390} {"train_loss": -6.303544044494629, "global_step": 100397, "epoch": 2390} {"train_loss": -6.462602615356445, "global_step": 100398, "epoch": 2390} {"train_loss": -6.376956939697266, "global_step": 100399, "epoch": 2390} {"train_loss": -6.374632358551025, "global_step": 100400, "epoch": 2390} {"train_loss": -6.36729621887207, "global_step": 100401, "epoch": 2390} {"train_loss": -6.483186721801758, "global_step": 100402, "epoch": 2390} {"train_loss": -6.350584983825684, "global_step": 100403, "epoch": 2390} {"train_loss": -6.534239768981934, "global_step": 100404, "epoch": 2390} {"train_loss": -6.385430335998535, "global_step": 100405, "epoch": 2390} {"train_loss": -6.342217922210693, "global_step": 100406, "epoch": 2390} {"train_loss": -6.274782657623291, "global_step": 100407, "epoch": 2390} {"train_loss": -6.358003616333008, "global_step": 100408, "epoch": 2390} {"train_loss": -6.259552478790283, "global_step": 100409, "epoch": 2390} {"train_loss": -6.496272087097168, "global_step": 100410, "epoch": 2390} {"train_loss": -6.436007022857666, "global_step": 100411, "epoch": 2390} {"train_loss": -6.464409828186035, "global_step": 100412, "epoch": 2390} {"train_loss": -6.4403486251831055, "global_step": 100413, "epoch": 2390} {"train_loss": -6.293335914611816, "global_step": 100414, "epoch": 2390} {"train_loss": -6.383937358856201, "global_step": 100415, "epoch": 2390} {"train_loss": -6.354323387145996, "global_step": 100416, "epoch": 2390} {"train_loss": -6.22111701965332, "global_step": 100417, "epoch": 2390} {"train_loss": -6.379768371582031, "global_step": 100418, "epoch": 2390} {"train_loss": -6.47919225692749, "global_step": 100419, "epoch": 2390} {"train_loss": -6.364119529724121, "global_step": 100420, "epoch": 2390} {"train_loss": -6.365030345462618, "global_step": 100421, "epoch": 2390, "val_loss": 64097.06640625} {"train_loss": -6.4430999755859375, "global_step": 100422, "epoch": 2391} {"train_loss": -6.320815563201904, "global_step": 100423, "epoch": 2391} {"train_loss": -6.362059116363525, "global_step": 100424, "epoch": 2391} {"train_loss": -6.391098976135254, "global_step": 100425, "epoch": 2391} {"train_loss": -6.497957229614258, "global_step": 100426, "epoch": 2391} {"train_loss": -6.328064441680908, "global_step": 100427, "epoch": 2391} {"train_loss": -6.442911148071289, "global_step": 100428, "epoch": 2391} {"train_loss": -6.401891708374023, "global_step": 100429, "epoch": 2391} {"train_loss": -6.358034133911133, "global_step": 100430, "epoch": 2391} {"train_loss": -6.3647260665893555, "global_step": 100431, "epoch": 2391} {"train_loss": -6.425391674041748, "global_step": 100432, "epoch": 2391} {"train_loss": -6.31089973449707, "global_step": 100433, "epoch": 2391} {"train_loss": -6.31601619720459, "global_step": 100434, "epoch": 2391} {"train_loss": -6.411572456359863, "global_step": 100435, "epoch": 2391} {"train_loss": -6.425743103027344, "global_step": 100436, "epoch": 2391} {"train_loss": -6.381296634674072, "global_step": 100437, "epoch": 2391} {"train_loss": -6.40669059753418, "global_step": 100438, "epoch": 2391} {"train_loss": -6.442238807678223, "global_step": 100439, "epoch": 2391} {"train_loss": -6.319936752319336, "global_step": 100440, "epoch": 2391} {"train_loss": -6.220021724700928, "global_step": 100441, "epoch": 2391} {"train_loss": -6.3935041427612305, "global_step": 100442, "epoch": 2391} {"train_loss": -6.366537094116211, "global_step": 100443, "epoch": 2391} {"train_loss": -6.361257553100586, "global_step": 100444, "epoch": 2391} {"train_loss": -6.376482963562012, "global_step": 100445, "epoch": 2391} {"train_loss": -6.305769443511963, "global_step": 100446, "epoch": 2391} {"train_loss": -6.357820510864258, "global_step": 100447, "epoch": 2391} {"train_loss": -6.366311073303223, "global_step": 100448, "epoch": 2391} {"train_loss": -6.387805938720703, "global_step": 100449, "epoch": 2391} {"train_loss": -6.340837478637695, "global_step": 100450, "epoch": 2391} {"train_loss": -6.426197052001953, "global_step": 100451, "epoch": 2391} {"train_loss": -6.392797470092773, "global_step": 100452, "epoch": 2391} {"train_loss": -6.409205436706543, "global_step": 100453, "epoch": 2391} {"train_loss": -6.463075160980225, "global_step": 100454, "epoch": 2391} {"train_loss": -6.313882827758789, "global_step": 100455, "epoch": 2391} {"train_loss": -6.356128692626953, "global_step": 100456, "epoch": 2391} {"train_loss": -6.395790100097656, "global_step": 100457, "epoch": 2391} {"train_loss": -6.514510154724121, "global_step": 100458, "epoch": 2391} {"train_loss": -6.4846086502075195, "global_step": 100459, "epoch": 2391} {"train_loss": -6.471285343170166, "global_step": 100460, "epoch": 2391} {"train_loss": -6.355447769165039, "global_step": 100461, "epoch": 2391} {"train_loss": -6.3700714111328125, "global_step": 100462, "epoch": 2391} {"train_loss": -6.386613391694569, "global_step": 100463, "epoch": 2391, "val_loss": 64164.90234375} {"train_loss": -6.445779323577881, "global_step": 100464, "epoch": 2392} {"train_loss": -6.4435577392578125, "global_step": 100465, "epoch": 2392} {"train_loss": -6.552859306335449, "global_step": 100466, "epoch": 2392} {"train_loss": -6.476734161376953, "global_step": 100467, "epoch": 2392} {"train_loss": -6.386865139007568, "global_step": 100468, "epoch": 2392} {"train_loss": -6.436175346374512, "global_step": 100469, "epoch": 2392} {"train_loss": -6.398782730102539, "global_step": 100470, "epoch": 2392} {"train_loss": -6.479722023010254, "global_step": 100471, "epoch": 2392} {"train_loss": -6.318819046020508, "global_step": 100472, "epoch": 2392} {"train_loss": -6.402286529541016, "global_step": 100473, "epoch": 2392} {"train_loss": -6.371894836425781, "global_step": 100474, "epoch": 2392} {"train_loss": -6.320523262023926, "global_step": 100475, "epoch": 2392} {"train_loss": -6.4151506423950195, "global_step": 100476, "epoch": 2392} {"train_loss": -6.471671104431152, "global_step": 100477, "epoch": 2392} {"train_loss": -6.402461528778076, "global_step": 100478, "epoch": 2392} {"train_loss": -6.23974609375, "global_step": 100479, "epoch": 2392} {"train_loss": -6.346606254577637, "global_step": 100480, "epoch": 2392} {"train_loss": -6.305360794067383, "global_step": 100481, "epoch": 2392} {"train_loss": -6.297073841094971, "global_step": 100482, "epoch": 2392} {"train_loss": -6.312062740325928, "global_step": 100483, "epoch": 2392} {"train_loss": -6.396397590637207, "global_step": 100484, "epoch": 2392} {"train_loss": -6.430802345275879, "global_step": 100485, "epoch": 2392} {"train_loss": -6.420378684997559, "global_step": 100486, "epoch": 2392} {"train_loss": -6.316388130187988, "global_step": 100487, "epoch": 2392} {"train_loss": -6.367064476013184, "global_step": 100488, "epoch": 2392} {"train_loss": -6.303976535797119, "global_step": 100489, "epoch": 2392} {"train_loss": -6.325946807861328, "global_step": 100490, "epoch": 2392} {"train_loss": -6.419676303863525, "global_step": 100491, "epoch": 2392} {"train_loss": -6.354200839996338, "global_step": 100492, "epoch": 2392} {"train_loss": -6.381213665008545, "global_step": 100493, "epoch": 2392} {"train_loss": -6.386286735534668, "global_step": 100494, "epoch": 2392} {"train_loss": -6.4120941162109375, "global_step": 100495, "epoch": 2392} {"train_loss": -6.505599498748779, "global_step": 100496, "epoch": 2392} {"train_loss": -6.329971790313721, "global_step": 100497, "epoch": 2392} {"train_loss": -6.259994983673096, "global_step": 100498, "epoch": 2392} {"train_loss": -6.465839385986328, "global_step": 100499, "epoch": 2392} {"train_loss": -6.281911849975586, "global_step": 100500, "epoch": 2392} {"train_loss": -6.342648506164551, "global_step": 100501, "epoch": 2392} {"train_loss": -6.339072227478027, "global_step": 100502, "epoch": 2392} {"train_loss": -6.313844680786133, "global_step": 100503, "epoch": 2392} {"train_loss": -6.412836074829102, "global_step": 100504, "epoch": 2392} {"train_loss": -6.382001104808989, "global_step": 100505, "epoch": 2392, "val_loss": 63992.99609375} {"train_loss": -6.380012512207031, "global_step": 100506, "epoch": 2393} {"train_loss": -6.396330833435059, "global_step": 100507, "epoch": 2393} {"train_loss": -6.5338335037231445, "global_step": 100508, "epoch": 2393} {"train_loss": -6.206551551818848, "global_step": 100509, "epoch": 2393} {"train_loss": -6.375068664550781, "global_step": 100510, "epoch": 2393} {"train_loss": -6.436107635498047, "global_step": 100511, "epoch": 2393} {"train_loss": -6.320184230804443, "global_step": 100512, "epoch": 2393} {"train_loss": -6.287147045135498, "global_step": 100513, "epoch": 2393} {"train_loss": -6.426522254943848, "global_step": 100514, "epoch": 2393} {"train_loss": -6.2970170974731445, "global_step": 100515, "epoch": 2393} {"train_loss": -6.402052879333496, "global_step": 100516, "epoch": 2393} {"train_loss": -6.1794562339782715, "global_step": 100517, "epoch": 2393} {"train_loss": -6.395120143890381, "global_step": 100518, "epoch": 2393} {"train_loss": -6.412957668304443, "global_step": 100519, "epoch": 2393} {"train_loss": -6.435379981994629, "global_step": 100520, "epoch": 2393} {"train_loss": -6.37714958190918, "global_step": 100521, "epoch": 2393} {"train_loss": -6.401085376739502, "global_step": 100522, "epoch": 2393} {"train_loss": -6.373874664306641, "global_step": 100523, "epoch": 2393} {"train_loss": -6.42263650894165, "global_step": 100524, "epoch": 2393} {"train_loss": -6.360095024108887, "global_step": 100525, "epoch": 2393} {"train_loss": -6.435741424560547, "global_step": 100526, "epoch": 2393} {"train_loss": -6.388561248779297, "global_step": 100527, "epoch": 2393} {"train_loss": -6.545499801635742, "global_step": 100528, "epoch": 2393} {"train_loss": -6.439755916595459, "global_step": 100529, "epoch": 2393} {"train_loss": -6.26646614074707, "global_step": 100530, "epoch": 2393} {"train_loss": -6.354031562805176, "global_step": 100531, "epoch": 2393} {"train_loss": -6.360925674438477, "global_step": 100532, "epoch": 2393} {"train_loss": -6.401832580566406, "global_step": 100533, "epoch": 2393} {"train_loss": -6.369194984436035, "global_step": 100534, "epoch": 2393} {"train_loss": -6.447375297546387, "global_step": 100535, "epoch": 2393} {"train_loss": -6.393560409545898, "global_step": 100536, "epoch": 2393} {"train_loss": -6.427367210388184, "global_step": 100537, "epoch": 2393} {"train_loss": -6.432267189025879, "global_step": 100538, "epoch": 2393} {"train_loss": -6.3217926025390625, "global_step": 100539, "epoch": 2393} {"train_loss": -6.468776226043701, "global_step": 100540, "epoch": 2393} {"train_loss": -6.335183143615723, "global_step": 100541, "epoch": 2393} {"train_loss": -6.343093395233154, "global_step": 100542, "epoch": 2393} {"train_loss": -6.410397052764893, "global_step": 100543, "epoch": 2393} {"train_loss": -6.445919990539551, "global_step": 100544, "epoch": 2393} {"train_loss": -6.302173614501953, "global_step": 100545, "epoch": 2393} {"train_loss": -6.282949924468994, "global_step": 100546, "epoch": 2393} {"train_loss": -6.377060958317348, "global_step": 100547, "epoch": 2393, "val_loss": 64259.49609375} {"train_loss": -6.444419860839844, "global_step": 100548, "epoch": 2394} {"train_loss": -6.355659008026123, "global_step": 100549, "epoch": 2394} {"train_loss": -6.301806926727295, "global_step": 100550, "epoch": 2394} {"train_loss": -6.512533664703369, "global_step": 100551, "epoch": 2394} {"train_loss": -6.368656158447266, "global_step": 100552, "epoch": 2394} {"train_loss": -6.380045413970947, "global_step": 100553, "epoch": 2394} {"train_loss": -6.376128196716309, "global_step": 100554, "epoch": 2394} {"train_loss": -6.358546257019043, "global_step": 100555, "epoch": 2394} {"train_loss": -6.433032989501953, "global_step": 100556, "epoch": 2394} {"train_loss": -6.3274054527282715, "global_step": 100557, "epoch": 2394} {"train_loss": -6.363311767578125, "global_step": 100558, "epoch": 2394} {"train_loss": -6.376531600952148, "global_step": 100559, "epoch": 2394} {"train_loss": -6.470317840576172, "global_step": 100560, "epoch": 2394} {"train_loss": -6.418107986450195, "global_step": 100561, "epoch": 2394} {"train_loss": -6.372596740722656, "global_step": 100562, "epoch": 2394} {"train_loss": -6.483933448791504, "global_step": 100563, "epoch": 2394} {"train_loss": -6.407113552093506, "global_step": 100564, "epoch": 2394} {"train_loss": -6.418523788452148, "global_step": 100565, "epoch": 2394} {"train_loss": -6.200794219970703, "global_step": 100566, "epoch": 2394} {"train_loss": -6.460417747497559, "global_step": 100567, "epoch": 2394} {"train_loss": -6.376997947692871, "global_step": 100568, "epoch": 2394} {"train_loss": -6.346484661102295, "global_step": 100569, "epoch": 2394} {"train_loss": -6.423095226287842, "global_step": 100570, "epoch": 2394} {"train_loss": -6.2787346839904785, "global_step": 100571, "epoch": 2394} {"train_loss": -6.412640571594238, "global_step": 100572, "epoch": 2394} {"train_loss": -6.428651332855225, "global_step": 100573, "epoch": 2394} {"train_loss": -6.288484573364258, "global_step": 100574, "epoch": 2394} {"train_loss": -6.357831001281738, "global_step": 100575, "epoch": 2394} {"train_loss": -6.300490379333496, "global_step": 100576, "epoch": 2394} {"train_loss": -6.3001484870910645, "global_step": 100577, "epoch": 2394} {"train_loss": -6.273143768310547, "global_step": 100578, "epoch": 2394} {"train_loss": -6.391599178314209, "global_step": 100579, "epoch": 2394} {"train_loss": -6.416667461395264, "global_step": 100580, "epoch": 2394} {"train_loss": -6.3350749015808105, "global_step": 100581, "epoch": 2394} {"train_loss": -6.3688812255859375, "global_step": 100582, "epoch": 2394} {"train_loss": -6.354146957397461, "global_step": 100583, "epoch": 2394} {"train_loss": -6.380596160888672, "global_step": 100584, "epoch": 2394} {"train_loss": -6.19393253326416, "global_step": 100585, "epoch": 2394} {"train_loss": -6.340423583984375, "global_step": 100586, "epoch": 2394} {"train_loss": -6.366327285766602, "global_step": 100587, "epoch": 2394} {"train_loss": -6.236530780792236, "global_step": 100588, "epoch": 2394} {"train_loss": -6.362106084823608, "global_step": 100589, "epoch": 2394, "val_loss": 64346.984375} {"train_loss": -6.329197883605957, "global_step": 100590, "epoch": 2395} {"train_loss": -6.282415390014648, "global_step": 100591, "epoch": 2395} {"train_loss": -6.184561729431152, "global_step": 100592, "epoch": 2395} {"train_loss": -6.380438804626465, "global_step": 100593, "epoch": 2395} {"train_loss": -6.248854637145996, "global_step": 100594, "epoch": 2395} {"train_loss": -6.3195061683654785, "global_step": 100595, "epoch": 2395} {"train_loss": -6.403767108917236, "global_step": 100596, "epoch": 2395} {"train_loss": -6.2277631759643555, "global_step": 100597, "epoch": 2395} {"train_loss": -6.272941589355469, "global_step": 100598, "epoch": 2395} {"train_loss": -6.348201751708984, "global_step": 100599, "epoch": 2395} {"train_loss": -6.384422779083252, "global_step": 100600, "epoch": 2395} {"train_loss": -6.334227561950684, "global_step": 100601, "epoch": 2395} {"train_loss": -6.340023040771484, "global_step": 100602, "epoch": 2395} {"train_loss": -6.44998836517334, "global_step": 100603, "epoch": 2395} {"train_loss": -6.436093807220459, "global_step": 100604, "epoch": 2395} {"train_loss": -6.311653137207031, "global_step": 100605, "epoch": 2395} {"train_loss": -6.388040542602539, "global_step": 100606, "epoch": 2395} {"train_loss": -6.41972017288208, "global_step": 100607, "epoch": 2395} {"train_loss": -6.378861427307129, "global_step": 100608, "epoch": 2395} {"train_loss": -6.408831596374512, "global_step": 100609, "epoch": 2395} {"train_loss": -6.280706882476807, "global_step": 100610, "epoch": 2395} {"train_loss": -6.3497514724731445, "global_step": 100611, "epoch": 2395} {"train_loss": -6.289220809936523, "global_step": 100612, "epoch": 2395} {"train_loss": -6.364941596984863, "global_step": 100613, "epoch": 2395} {"train_loss": -6.353703498840332, "global_step": 100614, "epoch": 2395} {"train_loss": -6.500998020172119, "global_step": 100615, "epoch": 2395} {"train_loss": -6.431613922119141, "global_step": 100616, "epoch": 2395} {"train_loss": -6.28237247467041, "global_step": 100617, "epoch": 2395} {"train_loss": -6.353250980377197, "global_step": 100618, "epoch": 2395} {"train_loss": -6.334670066833496, "global_step": 100619, "epoch": 2395} {"train_loss": -6.194761276245117, "global_step": 100620, "epoch": 2395} {"train_loss": -6.416267395019531, "global_step": 100621, "epoch": 2395} {"train_loss": -6.343953609466553, "global_step": 100622, "epoch": 2395} {"train_loss": -6.264274597167969, "global_step": 100623, "epoch": 2395} {"train_loss": -6.398228168487549, "global_step": 100624, "epoch": 2395} {"train_loss": -6.466380596160889, "global_step": 100625, "epoch": 2395} {"train_loss": -6.323925971984863, "global_step": 100626, "epoch": 2395} {"train_loss": -6.390398979187012, "global_step": 100627, "epoch": 2395} {"train_loss": -6.425520420074463, "global_step": 100628, "epoch": 2395} {"train_loss": -6.429945468902588, "global_step": 100629, "epoch": 2395} {"train_loss": -6.343602180480957, "global_step": 100630, "epoch": 2395} {"train_loss": -6.352273941040039, "global_step": 100631, "epoch": 2395, "val_loss": 63964.109375} {"train_loss": -6.385705471038818, "global_step": 100632, "epoch": 2396} {"train_loss": -6.399008750915527, "global_step": 100633, "epoch": 2396} {"train_loss": -6.442987442016602, "global_step": 100634, "epoch": 2396} {"train_loss": -6.471005916595459, "global_step": 100635, "epoch": 2396} {"train_loss": -6.341386795043945, "global_step": 100636, "epoch": 2396} {"train_loss": -6.420829772949219, "global_step": 100637, "epoch": 2396} {"train_loss": -6.401827335357666, "global_step": 100638, "epoch": 2396} {"train_loss": -6.319138526916504, "global_step": 100639, "epoch": 2396} {"train_loss": -6.221744537353516, "global_step": 100640, "epoch": 2396} {"train_loss": -6.388859748840332, "global_step": 100641, "epoch": 2396} {"train_loss": -6.322479724884033, "global_step": 100642, "epoch": 2396} {"train_loss": -6.516112327575684, "global_step": 100643, "epoch": 2396} {"train_loss": -6.306468963623047, "global_step": 100644, "epoch": 2396} {"train_loss": -6.411871910095215, "global_step": 100645, "epoch": 2396} {"train_loss": -6.397470951080322, "global_step": 100646, "epoch": 2396} {"train_loss": -6.369500637054443, "global_step": 100647, "epoch": 2396} {"train_loss": -6.328778266906738, "global_step": 100648, "epoch": 2396} {"train_loss": -6.384676933288574, "global_step": 100649, "epoch": 2396} {"train_loss": -6.419987201690674, "global_step": 100650, "epoch": 2396} {"train_loss": -6.377903938293457, "global_step": 100651, "epoch": 2396} {"train_loss": -6.406031608581543, "global_step": 100652, "epoch": 2396} {"train_loss": -6.36248779296875, "global_step": 100653, "epoch": 2396} {"train_loss": -6.356364727020264, "global_step": 100654, "epoch": 2396} {"train_loss": -6.292845726013184, "global_step": 100655, "epoch": 2396} {"train_loss": -6.325385093688965, "global_step": 100656, "epoch": 2396} {"train_loss": -6.335899353027344, "global_step": 100657, "epoch": 2396} {"train_loss": -6.371084213256836, "global_step": 100658, "epoch": 2396} {"train_loss": -6.416907787322998, "global_step": 100659, "epoch": 2396} {"train_loss": -6.442268371582031, "global_step": 100660, "epoch": 2396} {"train_loss": -6.38070011138916, "global_step": 100661, "epoch": 2396} {"train_loss": -6.438238620758057, "global_step": 100662, "epoch": 2396} {"train_loss": -6.19360876083374, "global_step": 100663, "epoch": 2396} {"train_loss": -6.3275146484375, "global_step": 100664, "epoch": 2396} {"train_loss": -6.484196186065674, "global_step": 100665, "epoch": 2396} {"train_loss": -6.267960071563721, "global_step": 100666, "epoch": 2396} {"train_loss": -6.328784942626953, "global_step": 100667, "epoch": 2396} {"train_loss": -6.471253395080566, "global_step": 100668, "epoch": 2396} {"train_loss": -6.343481063842773, "global_step": 100669, "epoch": 2396} {"train_loss": -6.411806583404541, "global_step": 100670, "epoch": 2396} {"train_loss": -6.26052188873291, "global_step": 100671, "epoch": 2396} {"train_loss": -6.221142292022705, "global_step": 100672, "epoch": 2396} {"train_loss": -6.3659510271889825, "global_step": 100673, "epoch": 2396, "val_loss": 64381.64453125} {"train_loss": -6.394523620605469, "global_step": 100674, "epoch": 2397} {"train_loss": -6.3777852058410645, "global_step": 100675, "epoch": 2397} {"train_loss": -6.161273002624512, "global_step": 100676, "epoch": 2397} {"train_loss": -6.241930961608887, "global_step": 100677, "epoch": 2397} {"train_loss": -6.355128765106201, "global_step": 100678, "epoch": 2397} {"train_loss": -6.349016189575195, "global_step": 100679, "epoch": 2397} {"train_loss": -6.379943370819092, "global_step": 100680, "epoch": 2397} {"train_loss": -6.341875076293945, "global_step": 100681, "epoch": 2397} {"train_loss": -6.43714714050293, "global_step": 100682, "epoch": 2397} {"train_loss": -6.44735050201416, "global_step": 100683, "epoch": 2397} {"train_loss": -6.323565483093262, "global_step": 100684, "epoch": 2397} {"train_loss": -6.397944450378418, "global_step": 100685, "epoch": 2397} {"train_loss": -6.400599479675293, "global_step": 100686, "epoch": 2397} {"train_loss": -6.392451286315918, "global_step": 100687, "epoch": 2397} {"train_loss": -6.271201133728027, "global_step": 100688, "epoch": 2397} {"train_loss": -6.273024559020996, "global_step": 100689, "epoch": 2397} {"train_loss": -6.338647842407227, "global_step": 100690, "epoch": 2397} {"train_loss": -6.400531768798828, "global_step": 100691, "epoch": 2397} {"train_loss": -6.504156589508057, "global_step": 100692, "epoch": 2397} {"train_loss": -6.3492231369018555, "global_step": 100693, "epoch": 2397} {"train_loss": -6.360987186431885, "global_step": 100694, "epoch": 2397} {"train_loss": -6.359301567077637, "global_step": 100695, "epoch": 2397} {"train_loss": -6.381171226501465, "global_step": 100696, "epoch": 2397} {"train_loss": -6.400047779083252, "global_step": 100697, "epoch": 2397} {"train_loss": -6.29401159286499, "global_step": 100698, "epoch": 2397} {"train_loss": -6.294668674468994, "global_step": 100699, "epoch": 2397} {"train_loss": -6.387189865112305, "global_step": 100700, "epoch": 2397} {"train_loss": -6.359521865844727, "global_step": 100701, "epoch": 2397} {"train_loss": -6.325058937072754, "global_step": 100702, "epoch": 2397} {"train_loss": -6.434237480163574, "global_step": 100703, "epoch": 2397} {"train_loss": -6.363445281982422, "global_step": 100704, "epoch": 2397} {"train_loss": -6.434126377105713, "global_step": 100705, "epoch": 2397} {"train_loss": -6.387228012084961, "global_step": 100706, "epoch": 2397} {"train_loss": -6.328498840332031, "global_step": 100707, "epoch": 2397} {"train_loss": -6.281496047973633, "global_step": 100708, "epoch": 2397} {"train_loss": -6.36810302734375, "global_step": 100709, "epoch": 2397} {"train_loss": -6.407039642333984, "global_step": 100710, "epoch": 2397} {"train_loss": -6.4006500244140625, "global_step": 100711, "epoch": 2397} {"train_loss": -6.337953567504883, "global_step": 100712, "epoch": 2397} {"train_loss": -6.411577224731445, "global_step": 100713, "epoch": 2397} {"train_loss": -6.4497175216674805, "global_step": 100714, "epoch": 2397} {"train_loss": -6.3623667898632235, "global_step": 100715, "epoch": 2397, "val_loss": 64225.8359375} {"train_loss": -6.371255874633789, "global_step": 100716, "epoch": 2398} {"train_loss": -6.36192512512207, "global_step": 100717, "epoch": 2398} {"train_loss": -6.438688278198242, "global_step": 100718, "epoch": 2398} {"train_loss": -6.367641448974609, "global_step": 100719, "epoch": 2398} {"train_loss": -6.351161003112793, "global_step": 100720, "epoch": 2398} {"train_loss": -6.451522350311279, "global_step": 100721, "epoch": 2398} {"train_loss": -6.433070182800293, "global_step": 100722, "epoch": 2398} {"train_loss": -6.354369163513184, "global_step": 100723, "epoch": 2398} {"train_loss": -6.402156829833984, "global_step": 100724, "epoch": 2398} {"train_loss": -6.482453346252441, "global_step": 100725, "epoch": 2398} {"train_loss": -6.4019341468811035, "global_step": 100726, "epoch": 2398} {"train_loss": -6.344318866729736, "global_step": 100727, "epoch": 2398} {"train_loss": -6.45989990234375, "global_step": 100728, "epoch": 2398} {"train_loss": -6.44658088684082, "global_step": 100729, "epoch": 2398} {"train_loss": -6.469106674194336, "global_step": 100730, "epoch": 2398} {"train_loss": -6.423317909240723, "global_step": 100731, "epoch": 2398} {"train_loss": -6.335463047027588, "global_step": 100732, "epoch": 2398} {"train_loss": -6.416545867919922, "global_step": 100733, "epoch": 2398} {"train_loss": -6.357722282409668, "global_step": 100734, "epoch": 2398} {"train_loss": -6.313906669616699, "global_step": 100735, "epoch": 2398} {"train_loss": -6.362432479858398, "global_step": 100736, "epoch": 2398} {"train_loss": -6.324854850769043, "global_step": 100737, "epoch": 2398} {"train_loss": -6.421296119689941, "global_step": 100738, "epoch": 2398} {"train_loss": -6.4204301834106445, "global_step": 100739, "epoch": 2398} {"train_loss": -6.448946475982666, "global_step": 100740, "epoch": 2398} {"train_loss": -6.411225318908691, "global_step": 100741, "epoch": 2398} {"train_loss": -6.321845054626465, "global_step": 100742, "epoch": 2398} {"train_loss": -6.391919136047363, "global_step": 100743, "epoch": 2398} {"train_loss": -6.329791069030762, "global_step": 100744, "epoch": 2398} {"train_loss": -6.403567314147949, "global_step": 100745, "epoch": 2398} {"train_loss": -6.431809902191162, "global_step": 100746, "epoch": 2398} {"train_loss": -6.404664516448975, "global_step": 100747, "epoch": 2398} {"train_loss": -6.3394365310668945, "global_step": 100748, "epoch": 2398} {"train_loss": -6.4596099853515625, "global_step": 100749, "epoch": 2398} {"train_loss": -6.319819927215576, "global_step": 100750, "epoch": 2398} {"train_loss": -6.358255386352539, "global_step": 100751, "epoch": 2398} {"train_loss": -6.422786235809326, "global_step": 100752, "epoch": 2398} {"train_loss": -6.31341552734375, "global_step": 100753, "epoch": 2398} {"train_loss": -6.331510066986084, "global_step": 100754, "epoch": 2398} {"train_loss": -6.3914384841918945, "global_step": 100755, "epoch": 2398} {"train_loss": -6.402035713195801, "global_step": 100756, "epoch": 2398} {"train_loss": -6.3908371925354, "global_step": 100757, "epoch": 2398, "val_loss": 64227.5859375} {"train_loss": -6.384098052978516, "global_step": 100758, "epoch": 2399} {"train_loss": -6.456930160522461, "global_step": 100759, "epoch": 2399} {"train_loss": -6.384683132171631, "global_step": 100760, "epoch": 2399} {"train_loss": -6.35382604598999, "global_step": 100761, "epoch": 2399} {"train_loss": -6.417280197143555, "global_step": 100762, "epoch": 2399} {"train_loss": -6.370870113372803, "global_step": 100763, "epoch": 2399} {"train_loss": -6.420526504516602, "global_step": 100764, "epoch": 2399} {"train_loss": -6.292562961578369, "global_step": 100765, "epoch": 2399} {"train_loss": -6.30815315246582, "global_step": 100766, "epoch": 2399} {"train_loss": -6.340238571166992, "global_step": 100767, "epoch": 2399} {"train_loss": -6.343958854675293, "global_step": 100768, "epoch": 2399} {"train_loss": -6.3195695877075195, "global_step": 100769, "epoch": 2399} {"train_loss": -6.304013252258301, "global_step": 100770, "epoch": 2399} {"train_loss": -6.390689849853516, "global_step": 100771, "epoch": 2399} {"train_loss": -6.363646984100342, "global_step": 100772, "epoch": 2399} {"train_loss": -6.30178165435791, "global_step": 100773, "epoch": 2399} {"train_loss": -6.352320194244385, "global_step": 100774, "epoch": 2399} {"train_loss": -6.394035816192627, "global_step": 100775, "epoch": 2399} {"train_loss": -6.309608459472656, "global_step": 100776, "epoch": 2399} {"train_loss": -6.37548303604126, "global_step": 100777, "epoch": 2399} {"train_loss": -6.2522406578063965, "global_step": 100778, "epoch": 2399} {"train_loss": -6.337375164031982, "global_step": 100779, "epoch": 2399} {"train_loss": -6.214982032775879, "global_step": 100780, "epoch": 2399} {"train_loss": -6.358349323272705, "global_step": 100781, "epoch": 2399} {"train_loss": -6.420206069946289, "global_step": 100782, "epoch": 2399} {"train_loss": -6.308372974395752, "global_step": 100783, "epoch": 2399} {"train_loss": -6.435076713562012, "global_step": 100784, "epoch": 2399} {"train_loss": -6.386581897735596, "global_step": 100785, "epoch": 2399} {"train_loss": -6.422020435333252, "global_step": 100786, "epoch": 2399} {"train_loss": -6.426430702209473, "global_step": 100787, "epoch": 2399} {"train_loss": -6.351580619812012, "global_step": 100788, "epoch": 2399} {"train_loss": -6.4815778732299805, "global_step": 100789, "epoch": 2399} {"train_loss": -6.488888263702393, "global_step": 100790, "epoch": 2399} {"train_loss": -6.380876064300537, "global_step": 100791, "epoch": 2399} {"train_loss": -6.393139839172363, "global_step": 100792, "epoch": 2399} {"train_loss": -6.331792831420898, "global_step": 100793, "epoch": 2399} {"train_loss": -6.336230754852295, "global_step": 100794, "epoch": 2399} {"train_loss": -6.406305313110352, "global_step": 100795, "epoch": 2399} {"train_loss": -6.554188251495361, "global_step": 100796, "epoch": 2399} {"train_loss": -6.411370754241943, "global_step": 100797, "epoch": 2399} {"train_loss": -6.513967990875244, "global_step": 100798, "epoch": 2399} {"train_loss": -6.374406837281727, "global_step": 100799, "epoch": 2399, "val_loss": 64214.98046875} {"train_loss": -6.482666969299316, "global_step": 100800, "epoch": 2400} {"train_loss": -6.495319366455078, "global_step": 100801, "epoch": 2400} {"train_loss": -6.371935844421387, "global_step": 100802, "epoch": 2400} {"train_loss": -6.302210807800293, "global_step": 100803, "epoch": 2400} {"train_loss": -6.523744583129883, "global_step": 100804, "epoch": 2400} {"train_loss": -6.324798583984375, "global_step": 100805, "epoch": 2400} {"train_loss": -6.285196304321289, "global_step": 100806, "epoch": 2400} {"train_loss": -6.314716339111328, "global_step": 100807, "epoch": 2400} {"train_loss": -6.3069610595703125, "global_step": 100808, "epoch": 2400} {"train_loss": -6.271718502044678, "global_step": 100809, "epoch": 2400} {"train_loss": -6.03928804397583, "global_step": 100810, "epoch": 2400} {"train_loss": -6.211557388305664, "global_step": 100811, "epoch": 2400} {"train_loss": -6.1899895668029785, "global_step": 100812, "epoch": 2400} {"train_loss": -6.128899097442627, "global_step": 100813, "epoch": 2400} {"train_loss": -6.322007656097412, "global_step": 100814, "epoch": 2400} {"train_loss": -6.1335906982421875, "global_step": 100815, "epoch": 2400} {"train_loss": -6.230186462402344, "global_step": 100816, "epoch": 2400} {"train_loss": -6.288025856018066, "global_step": 100817, "epoch": 2400} {"train_loss": -6.117698669433594, "global_step": 100818, "epoch": 2400} {"train_loss": -6.074819564819336, "global_step": 100819, "epoch": 2400} {"train_loss": -6.178096771240234, "global_step": 100820, "epoch": 2400} {"train_loss": -6.268415451049805, "global_step": 100821, "epoch": 2400} {"train_loss": -6.094099044799805, "global_step": 100822, "epoch": 2400} {"train_loss": -6.244372367858887, "global_step": 100823, "epoch": 2400} {"train_loss": -6.1714887619018555, "global_step": 100824, "epoch": 2400} {"train_loss": -6.277470111846924, "global_step": 100825, "epoch": 2400} {"train_loss": -6.1670331954956055, "global_step": 100826, "epoch": 2400} {"train_loss": -6.370146751403809, "global_step": 100827, "epoch": 2400} {"train_loss": -6.336696624755859, "global_step": 100828, "epoch": 2400} {"train_loss": -6.322685718536377, "global_step": 100829, "epoch": 2400} {"train_loss": -6.4064226150512695, "global_step": 100830, "epoch": 2400} {"train_loss": -6.3222222328186035, "global_step": 100831, "epoch": 2400} {"train_loss": -6.264979362487793, "global_step": 100832, "epoch": 2400} {"train_loss": -6.333978176116943, "global_step": 100833, "epoch": 2400} {"train_loss": -6.120820045471191, "global_step": 100834, "epoch": 2400} {"train_loss": -6.472443103790283, "global_step": 100835, "epoch": 2400} {"train_loss": -6.320772171020508, "global_step": 100836, "epoch": 2400} {"train_loss": -6.357463359832764, "global_step": 100837, "epoch": 2400} {"train_loss": -6.361973285675049, "global_step": 100838, "epoch": 2400} {"train_loss": -6.379830837249756, "global_step": 100839, "epoch": 2400} {"train_loss": -6.358936309814453, "global_step": 100840, "epoch": 2400} {"train_loss": -6.282402220226469, "global_step": 100841, "epoch": 2400, "train/sim_max_reward_0": 0.2002524574240264, "train/sim_max_reward_1": 0.42672764436552224, "train/sim_max_reward_2": 0.5871450533670717, "train/sim_max_reward_3": 0.14268539874841843, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5302863108979905, "test/sim_max_reward_4300002": 0.9926630108744683, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9597088053958841, "test/sim_max_reward_4300006": 0.8631860667996208, "test/sim_max_reward_4300007": 0.31962974068531597, "test/sim_max_reward_4300008": 0.949945412157292, "test/sim_max_reward_4300009": 0.9027205922298316, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.3117560237656531, "test/sim_max_reward_4300012": 0.9778509737137134, "test/sim_max_reward_4300013": 0.8576484508240798, "test/sim_max_reward_4300014": 0.9804988281259769, "test/sim_max_reward_4300015": 0.938079289787822, "test/sim_max_reward_4300016": 0.5238304399086409, "test/sim_max_reward_4300017": 0.9289012189944926, "test/sim_max_reward_4300018": 0.989997351204947, "test/sim_max_reward_4300019": 0.185604979353344, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8028010724749424, "test/sim_max_reward_4300022": 0.5571055046630686, "test/sim_max_reward_4300023": 0.8769698918536005, "test/sim_max_reward_4300024": 0.983044711486975, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.36727148630880163, "test/sim_max_reward_4300027": 0.9510629815357292, "test/sim_max_reward_4300028": 0.8759201079436109, "test/sim_max_reward_4300029": 0.6759283826830604, "test/sim_max_reward_4300030": 0.3305034289197607, "test/sim_max_reward_4300031": 0.40325285059630317, "test/sim_max_reward_4300032": 0.9836714054615114, "test/sim_max_reward_4300033": 0.932922214867278, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.7859859615830126, "test/sim_max_reward_4300036": 0.202378356603296, "test/sim_max_reward_4300037": 0.875747125469047, "test/sim_max_reward_4300038": 0.8293044940761622, "test/sim_max_reward_4300039": 0.9599017527751824, "test/sim_max_reward_4300040": 0.9831432743867246, "test/sim_max_reward_4300041": 0.5936014172564037, "test/sim_max_reward_4300042": 0.9310363805219136, "test/sim_max_reward_4300043": 0.08628527634233162, "test/sim_max_reward_4300044": 0.9814512657484716, "test/sim_max_reward_4300045": 0.9677448023975325, "test/sim_max_reward_4300046": 0.8818292660786943, "test/sim_max_reward_4300047": 0.16619332304925047, "test/sim_max_reward_4300048": 0.01621067913468921, "test/sim_max_reward_4300049": 0.2302895727191951, "train/mean_score": 0.4249658855445377, "test/mean_score": 0.649193971729298, "val_loss": 64078.34765625} {"train_loss": -6.43941068649292, "global_step": 100842, "epoch": 2401} {"train_loss": -6.329158782958984, "global_step": 100843, "epoch": 2401} {"train_loss": -6.346307754516602, "global_step": 100844, "epoch": 2401} {"train_loss": -6.306667327880859, "global_step": 100845, "epoch": 2401} {"train_loss": -6.363515853881836, "global_step": 100846, "epoch": 2401} {"train_loss": -6.346311569213867, "global_step": 100847, "epoch": 2401} {"train_loss": -6.4061174392700195, "global_step": 100848, "epoch": 2401} {"train_loss": -6.333559513092041, "global_step": 100849, "epoch": 2401} {"train_loss": -6.4199137687683105, "global_step": 100850, "epoch": 2401} {"train_loss": -6.434728622436523, "global_step": 100851, "epoch": 2401} {"train_loss": -6.370761871337891, "global_step": 100852, "epoch": 2401} {"train_loss": -6.267181396484375, "global_step": 100853, "epoch": 2401} {"train_loss": -6.321591854095459, "global_step": 100854, "epoch": 2401} {"train_loss": -6.280965805053711, "global_step": 100855, "epoch": 2401} {"train_loss": -6.329067230224609, "global_step": 100856, "epoch": 2401} {"train_loss": -6.4870452880859375, "global_step": 100857, "epoch": 2401} {"train_loss": -6.2962822914123535, "global_step": 100858, "epoch": 2401} {"train_loss": -6.372039794921875, "global_step": 100859, "epoch": 2401} {"train_loss": -6.390462875366211, "global_step": 100860, "epoch": 2401} {"train_loss": -6.2482733726501465, "global_step": 100861, "epoch": 2401} {"train_loss": -6.332439422607422, "global_step": 100862, "epoch": 2401} {"train_loss": -6.244981288909912, "global_step": 100863, "epoch": 2401} {"train_loss": -6.171795845031738, "global_step": 100864, "epoch": 2401} {"train_loss": -6.395280838012695, "global_step": 100865, "epoch": 2401} {"train_loss": -6.137859344482422, "global_step": 100866, "epoch": 2401} {"train_loss": -6.399685382843018, "global_step": 100867, "epoch": 2401} {"train_loss": -6.31644344329834, "global_step": 100868, "epoch": 2401} {"train_loss": -6.199620246887207, "global_step": 100869, "epoch": 2401} {"train_loss": -6.376314163208008, "global_step": 100870, "epoch": 2401} {"train_loss": -6.321475028991699, "global_step": 100871, "epoch": 2401} {"train_loss": -6.353389739990234, "global_step": 100872, "epoch": 2401} {"train_loss": -6.339583396911621, "global_step": 100873, "epoch": 2401} {"train_loss": -6.308934211730957, "global_step": 100874, "epoch": 2401} {"train_loss": -6.337984561920166, "global_step": 100875, "epoch": 2401} {"train_loss": -6.255758285522461, "global_step": 100876, "epoch": 2401} {"train_loss": -6.437007904052734, "global_step": 100877, "epoch": 2401} {"train_loss": -6.484510898590088, "global_step": 100878, "epoch": 2401} {"train_loss": -6.306861877441406, "global_step": 100879, "epoch": 2401} {"train_loss": -6.403205871582031, "global_step": 100880, "epoch": 2401} {"train_loss": -6.557780742645264, "global_step": 100881, "epoch": 2401} {"train_loss": -6.361212730407715, "global_step": 100882, "epoch": 2401} {"train_loss": -6.344444093250093, "global_step": 100883, "epoch": 2401, "val_loss": 64032.98046875} {"train_loss": -6.383527755737305, "global_step": 100884, "epoch": 2402} {"train_loss": -6.225468158721924, "global_step": 100885, "epoch": 2402} {"train_loss": -6.443027496337891, "global_step": 100886, "epoch": 2402} {"train_loss": -6.440911769866943, "global_step": 100887, "epoch": 2402} {"train_loss": -6.403953552246094, "global_step": 100888, "epoch": 2402} {"train_loss": -6.401011943817139, "global_step": 100889, "epoch": 2402} {"train_loss": -6.406303405761719, "global_step": 100890, "epoch": 2402} {"train_loss": -6.342985153198242, "global_step": 100891, "epoch": 2402} {"train_loss": -6.433686256408691, "global_step": 100892, "epoch": 2402} {"train_loss": -6.414329528808594, "global_step": 100893, "epoch": 2402} {"train_loss": -6.452817916870117, "global_step": 100894, "epoch": 2402} {"train_loss": -6.37385368347168, "global_step": 100895, "epoch": 2402} {"train_loss": -6.349681854248047, "global_step": 100896, "epoch": 2402} {"train_loss": -6.418949127197266, "global_step": 100897, "epoch": 2402} {"train_loss": -6.3806633949279785, "global_step": 100898, "epoch": 2402} {"train_loss": -6.371435165405273, "global_step": 100899, "epoch": 2402} {"train_loss": -6.548130989074707, "global_step": 100900, "epoch": 2402} {"train_loss": -6.462653160095215, "global_step": 100901, "epoch": 2402} {"train_loss": -6.3703155517578125, "global_step": 100902, "epoch": 2402} {"train_loss": -6.452561378479004, "global_step": 100903, "epoch": 2402} {"train_loss": -6.371677875518799, "global_step": 100904, "epoch": 2402} {"train_loss": -6.399051666259766, "global_step": 100905, "epoch": 2402} {"train_loss": -6.4029622077941895, "global_step": 100906, "epoch": 2402} {"train_loss": -6.293295860290527, "global_step": 100907, "epoch": 2402} {"train_loss": -6.437564849853516, "global_step": 100908, "epoch": 2402} {"train_loss": -6.416614055633545, "global_step": 100909, "epoch": 2402} {"train_loss": -6.399999618530273, "global_step": 100910, "epoch": 2402} {"train_loss": -6.374941349029541, "global_step": 100911, "epoch": 2402} {"train_loss": -6.3211798667907715, "global_step": 100912, "epoch": 2402} {"train_loss": -6.33511209487915, "global_step": 100913, "epoch": 2402} {"train_loss": -6.404028415679932, "global_step": 100914, "epoch": 2402} {"train_loss": -6.375737190246582, "global_step": 100915, "epoch": 2402} {"train_loss": -6.396912574768066, "global_step": 100916, "epoch": 2402} {"train_loss": -6.4878387451171875, "global_step": 100917, "epoch": 2402} {"train_loss": -6.390480995178223, "global_step": 100918, "epoch": 2402} {"train_loss": -6.390146732330322, "global_step": 100919, "epoch": 2402} {"train_loss": -6.3925371170043945, "global_step": 100920, "epoch": 2402} {"train_loss": -6.30106782913208, "global_step": 100921, "epoch": 2402} {"train_loss": -6.408937454223633, "global_step": 100922, "epoch": 2402} {"train_loss": -6.344425201416016, "global_step": 100923, "epoch": 2402} {"train_loss": -6.401758193969727, "global_step": 100924, "epoch": 2402} {"train_loss": -6.392488513674055, "global_step": 100925, "epoch": 2402, "val_loss": 64258.7109375} {"train_loss": -6.331518173217773, "global_step": 100926, "epoch": 2403} {"train_loss": -6.416671276092529, "global_step": 100927, "epoch": 2403} {"train_loss": -6.306523323059082, "global_step": 100928, "epoch": 2403} {"train_loss": -6.409304618835449, "global_step": 100929, "epoch": 2403} {"train_loss": -6.386421203613281, "global_step": 100930, "epoch": 2403} {"train_loss": -6.33426570892334, "global_step": 100931, "epoch": 2403} {"train_loss": -6.3757405281066895, "global_step": 100932, "epoch": 2403} {"train_loss": -6.3749098777771, "global_step": 100933, "epoch": 2403} {"train_loss": -6.233544826507568, "global_step": 100934, "epoch": 2403} {"train_loss": -6.359062194824219, "global_step": 100935, "epoch": 2403} {"train_loss": -6.343707084655762, "global_step": 100936, "epoch": 2403} {"train_loss": -6.282288551330566, "global_step": 100937, "epoch": 2403} {"train_loss": -6.388307094573975, "global_step": 100938, "epoch": 2403} {"train_loss": -6.397146224975586, "global_step": 100939, "epoch": 2403} {"train_loss": -6.298056125640869, "global_step": 100940, "epoch": 2403} {"train_loss": -6.310443878173828, "global_step": 100941, "epoch": 2403} {"train_loss": -6.341696739196777, "global_step": 100942, "epoch": 2403} {"train_loss": -6.406739234924316, "global_step": 100943, "epoch": 2403} {"train_loss": -6.257625579833984, "global_step": 100944, "epoch": 2403} {"train_loss": -6.448661804199219, "global_step": 100945, "epoch": 2403} {"train_loss": -6.192455291748047, "global_step": 100946, "epoch": 2403} {"train_loss": -6.336339950561523, "global_step": 100947, "epoch": 2403} {"train_loss": -6.47336483001709, "global_step": 100948, "epoch": 2403} {"train_loss": -6.32102108001709, "global_step": 100949, "epoch": 2403} {"train_loss": -6.376071929931641, "global_step": 100950, "epoch": 2403} {"train_loss": -6.373570442199707, "global_step": 100951, "epoch": 2403} {"train_loss": -6.346963882446289, "global_step": 100952, "epoch": 2403} {"train_loss": -6.298647403717041, "global_step": 100953, "epoch": 2403} {"train_loss": -6.360812187194824, "global_step": 100954, "epoch": 2403} {"train_loss": -6.398553371429443, "global_step": 100955, "epoch": 2403} {"train_loss": -6.461017608642578, "global_step": 100956, "epoch": 2403} {"train_loss": -6.34676456451416, "global_step": 100957, "epoch": 2403} {"train_loss": -6.377777099609375, "global_step": 100958, "epoch": 2403} {"train_loss": -6.423550128936768, "global_step": 100959, "epoch": 2403} {"train_loss": -6.284236431121826, "global_step": 100960, "epoch": 2403} {"train_loss": -6.513193130493164, "global_step": 100961, "epoch": 2403} {"train_loss": -6.350581169128418, "global_step": 100962, "epoch": 2403} {"train_loss": -6.3987016677856445, "global_step": 100963, "epoch": 2403} {"train_loss": -6.367331504821777, "global_step": 100964, "epoch": 2403} {"train_loss": -6.354874610900879, "global_step": 100965, "epoch": 2403} {"train_loss": -6.404745578765869, "global_step": 100966, "epoch": 2403} {"train_loss": -6.36055638676598, "global_step": 100967, "epoch": 2403, "val_loss": 64178.0} {"train_loss": -6.390192031860352, "global_step": 100968, "epoch": 2404} {"train_loss": -6.427307605743408, "global_step": 100969, "epoch": 2404} {"train_loss": -6.411915302276611, "global_step": 100970, "epoch": 2404} {"train_loss": -6.3524322509765625, "global_step": 100971, "epoch": 2404} {"train_loss": -6.354419708251953, "global_step": 100972, "epoch": 2404} {"train_loss": -6.420248985290527, "global_step": 100973, "epoch": 2404} {"train_loss": -6.372610569000244, "global_step": 100974, "epoch": 2404} {"train_loss": -6.355921268463135, "global_step": 100975, "epoch": 2404} {"train_loss": -6.325757026672363, "global_step": 100976, "epoch": 2404} {"train_loss": -6.4121503829956055, "global_step": 100977, "epoch": 2404} {"train_loss": -6.366879463195801, "global_step": 100978, "epoch": 2404} {"train_loss": -6.346881866455078, "global_step": 100979, "epoch": 2404} {"train_loss": -6.287483215332031, "global_step": 100980, "epoch": 2404} {"train_loss": -6.420752048492432, "global_step": 100981, "epoch": 2404} {"train_loss": -6.382693290710449, "global_step": 100982, "epoch": 2404} {"train_loss": -6.3626251220703125, "global_step": 100983, "epoch": 2404} {"train_loss": -6.3885416984558105, "global_step": 100984, "epoch": 2404} {"train_loss": -6.442661285400391, "global_step": 100985, "epoch": 2404} {"train_loss": -6.454666614532471, "global_step": 100986, "epoch": 2404} {"train_loss": -6.308196544647217, "global_step": 100987, "epoch": 2404} {"train_loss": -6.373445987701416, "global_step": 100988, "epoch": 2404} {"train_loss": -6.304652214050293, "global_step": 100989, "epoch": 2404} {"train_loss": -6.322007179260254, "global_step": 100990, "epoch": 2404} {"train_loss": -6.303427696228027, "global_step": 100991, "epoch": 2404} {"train_loss": -6.283083915710449, "global_step": 100992, "epoch": 2404} {"train_loss": -6.376468658447266, "global_step": 100993, "epoch": 2404} {"train_loss": -6.496707916259766, "global_step": 100994, "epoch": 2404} {"train_loss": -6.431272506713867, "global_step": 100995, "epoch": 2404} {"train_loss": -6.305896759033203, "global_step": 100996, "epoch": 2404} {"train_loss": -6.3666558265686035, "global_step": 100997, "epoch": 2404} {"train_loss": -6.321279525756836, "global_step": 100998, "epoch": 2404} {"train_loss": -6.436654567718506, "global_step": 100999, "epoch": 2404} {"train_loss": -6.489899635314941, "global_step": 101000, "epoch": 2404} {"train_loss": -6.270308494567871, "global_step": 101001, "epoch": 2404} {"train_loss": -6.265386581420898, "global_step": 101002, "epoch": 2404} {"train_loss": -6.3865509033203125, "global_step": 101003, "epoch": 2404} {"train_loss": -6.2879557609558105, "global_step": 101004, "epoch": 2404} {"train_loss": -6.372739791870117, "global_step": 101005, "epoch": 2404} {"train_loss": -6.275951862335205, "global_step": 101006, "epoch": 2404} {"train_loss": -6.334352493286133, "global_step": 101007, "epoch": 2404} {"train_loss": -6.40939474105835, "global_step": 101008, "epoch": 2404} {"train_loss": -6.367603483654204, "global_step": 101009, "epoch": 2404, "val_loss": 64142.109375} {"train_loss": -6.354554176330566, "global_step": 101010, "epoch": 2405} {"train_loss": -6.408046722412109, "global_step": 101011, "epoch": 2405} {"train_loss": -6.4187912940979, "global_step": 101012, "epoch": 2405} {"train_loss": -6.422533988952637, "global_step": 101013, "epoch": 2405} {"train_loss": -6.456966876983643, "global_step": 101014, "epoch": 2405} {"train_loss": -6.38136100769043, "global_step": 101015, "epoch": 2405} {"train_loss": -6.463977813720703, "global_step": 101016, "epoch": 2405} {"train_loss": -6.391969203948975, "global_step": 101017, "epoch": 2405} {"train_loss": -6.360245704650879, "global_step": 101018, "epoch": 2405} {"train_loss": -6.25424861907959, "global_step": 101019, "epoch": 2405} {"train_loss": -6.3351545333862305, "global_step": 101020, "epoch": 2405} {"train_loss": -6.333935737609863, "global_step": 101021, "epoch": 2405} {"train_loss": -6.347189426422119, "global_step": 101022, "epoch": 2405} {"train_loss": -6.364144802093506, "global_step": 101023, "epoch": 2405} {"train_loss": -6.4126410484313965, "global_step": 101024, "epoch": 2405} {"train_loss": -6.288883686065674, "global_step": 101025, "epoch": 2405} {"train_loss": -6.384329795837402, "global_step": 101026, "epoch": 2405} {"train_loss": -6.36635684967041, "global_step": 101027, "epoch": 2405} {"train_loss": -6.218340873718262, "global_step": 101028, "epoch": 2405} {"train_loss": -6.294589042663574, "global_step": 101029, "epoch": 2405} {"train_loss": -6.291304111480713, "global_step": 101030, "epoch": 2405} {"train_loss": -6.39809513092041, "global_step": 101031, "epoch": 2405} {"train_loss": -6.425063133239746, "global_step": 101032, "epoch": 2405} {"train_loss": -6.402876853942871, "global_step": 101033, "epoch": 2405} {"train_loss": -6.318899631500244, "global_step": 101034, "epoch": 2405} {"train_loss": -6.377256870269775, "global_step": 101035, "epoch": 2405} {"train_loss": -6.428017616271973, "global_step": 101036, "epoch": 2405} {"train_loss": -6.500913619995117, "global_step": 101037, "epoch": 2405} {"train_loss": -6.251115798950195, "global_step": 101038, "epoch": 2405} {"train_loss": -6.352616310119629, "global_step": 101039, "epoch": 2405} {"train_loss": -6.41854190826416, "global_step": 101040, "epoch": 2405} {"train_loss": -6.429879665374756, "global_step": 101041, "epoch": 2405} {"train_loss": -6.234198570251465, "global_step": 101042, "epoch": 2405} {"train_loss": -6.3758931159973145, "global_step": 101043, "epoch": 2405} {"train_loss": -6.330046653747559, "global_step": 101044, "epoch": 2405} {"train_loss": -6.454069137573242, "global_step": 101045, "epoch": 2405} {"train_loss": -6.323668479919434, "global_step": 101046, "epoch": 2405} {"train_loss": -6.383110046386719, "global_step": 101047, "epoch": 2405} {"train_loss": -6.551372051239014, "global_step": 101048, "epoch": 2405} {"train_loss": -6.315881729125977, "global_step": 101049, "epoch": 2405} {"train_loss": -6.35035514831543, "global_step": 101050, "epoch": 2405} {"train_loss": -6.368264243716285, "global_step": 101051, "epoch": 2405, "val_loss": 64135.70703125} {"train_loss": -6.42842960357666, "global_step": 101052, "epoch": 2406} {"train_loss": -6.480344772338867, "global_step": 101053, "epoch": 2406} {"train_loss": -6.359267234802246, "global_step": 101054, "epoch": 2406} {"train_loss": -6.467568874359131, "global_step": 101055, "epoch": 2406} {"train_loss": -6.476888656616211, "global_step": 101056, "epoch": 2406} {"train_loss": -6.435262680053711, "global_step": 101057, "epoch": 2406} {"train_loss": -6.458690643310547, "global_step": 101058, "epoch": 2406} {"train_loss": -6.358840465545654, "global_step": 101059, "epoch": 2406} {"train_loss": -6.436185836791992, "global_step": 101060, "epoch": 2406} {"train_loss": -6.3899383544921875, "global_step": 101061, "epoch": 2406} {"train_loss": -6.368911266326904, "global_step": 101062, "epoch": 2406} {"train_loss": -6.436476707458496, "global_step": 101063, "epoch": 2406} {"train_loss": -6.397540092468262, "global_step": 101064, "epoch": 2406} {"train_loss": -6.3442702293396, "global_step": 101065, "epoch": 2406} {"train_loss": -6.38770866394043, "global_step": 101066, "epoch": 2406} {"train_loss": -6.311999320983887, "global_step": 101067, "epoch": 2406} {"train_loss": -6.33099889755249, "global_step": 101068, "epoch": 2406} {"train_loss": -6.398220539093018, "global_step": 101069, "epoch": 2406} {"train_loss": -6.402371883392334, "global_step": 101070, "epoch": 2406} {"train_loss": -6.499837398529053, "global_step": 101071, "epoch": 2406} {"train_loss": -6.325192928314209, "global_step": 101072, "epoch": 2406} {"train_loss": -6.430290222167969, "global_step": 101073, "epoch": 2406} {"train_loss": -6.362779140472412, "global_step": 101074, "epoch": 2406} {"train_loss": -6.316551208496094, "global_step": 101075, "epoch": 2406} {"train_loss": -6.40125846862793, "global_step": 101076, "epoch": 2406} {"train_loss": -6.226675033569336, "global_step": 101077, "epoch": 2406} {"train_loss": -6.3239850997924805, "global_step": 101078, "epoch": 2406} {"train_loss": -6.529239654541016, "global_step": 101079, "epoch": 2406} {"train_loss": -6.238237380981445, "global_step": 101080, "epoch": 2406} {"train_loss": -6.373272895812988, "global_step": 101081, "epoch": 2406} {"train_loss": -6.3080735206604, "global_step": 101082, "epoch": 2406} {"train_loss": -6.310390949249268, "global_step": 101083, "epoch": 2406} {"train_loss": -6.3868632316589355, "global_step": 101084, "epoch": 2406} {"train_loss": -6.4295148849487305, "global_step": 101085, "epoch": 2406} {"train_loss": -6.315658092498779, "global_step": 101086, "epoch": 2406} {"train_loss": -6.339075088500977, "global_step": 101087, "epoch": 2406} {"train_loss": -6.406420707702637, "global_step": 101088, "epoch": 2406} {"train_loss": -6.245786666870117, "global_step": 101089, "epoch": 2406} {"train_loss": -6.338911533355713, "global_step": 101090, "epoch": 2406} {"train_loss": -6.350438594818115, "global_step": 101091, "epoch": 2406} {"train_loss": -6.393239974975586, "global_step": 101092, "epoch": 2406} {"train_loss": -6.380480414345151, "global_step": 101093, "epoch": 2406, "val_loss": 64199.0} {"train_loss": -6.251730918884277, "global_step": 101094, "epoch": 2407} {"train_loss": -6.430021286010742, "global_step": 101095, "epoch": 2407} {"train_loss": -6.450929641723633, "global_step": 101096, "epoch": 2407} {"train_loss": -6.310698509216309, "global_step": 101097, "epoch": 2407} {"train_loss": -6.312390327453613, "global_step": 101098, "epoch": 2407} {"train_loss": -6.305456161499023, "global_step": 101099, "epoch": 2407} {"train_loss": -6.3889360427856445, "global_step": 101100, "epoch": 2407} {"train_loss": -6.321934700012207, "global_step": 101101, "epoch": 2407} {"train_loss": -6.401261806488037, "global_step": 101102, "epoch": 2407} {"train_loss": -6.334619522094727, "global_step": 101103, "epoch": 2407} {"train_loss": -6.377633094787598, "global_step": 101104, "epoch": 2407} {"train_loss": -6.327777862548828, "global_step": 101105, "epoch": 2407} {"train_loss": -6.399361610412598, "global_step": 101106, "epoch": 2407} {"train_loss": -6.3718953132629395, "global_step": 101107, "epoch": 2407} {"train_loss": -6.304401397705078, "global_step": 101108, "epoch": 2407} {"train_loss": -6.380416393280029, "global_step": 101109, "epoch": 2407} {"train_loss": -6.264487266540527, "global_step": 101110, "epoch": 2407} {"train_loss": -6.233728408813477, "global_step": 101111, "epoch": 2407} {"train_loss": -6.36090087890625, "global_step": 101112, "epoch": 2407} {"train_loss": -6.108702182769775, "global_step": 101113, "epoch": 2407} {"train_loss": -6.223237991333008, "global_step": 101114, "epoch": 2407} {"train_loss": -6.402462959289551, "global_step": 101115, "epoch": 2407} {"train_loss": -6.220792770385742, "global_step": 101116, "epoch": 2407} {"train_loss": -6.30276346206665, "global_step": 101117, "epoch": 2407} {"train_loss": -6.334528923034668, "global_step": 101118, "epoch": 2407} {"train_loss": -6.264863967895508, "global_step": 101119, "epoch": 2407} {"train_loss": -6.382517337799072, "global_step": 101120, "epoch": 2407} {"train_loss": -6.213635444641113, "global_step": 101121, "epoch": 2407} {"train_loss": -6.405040264129639, "global_step": 101122, "epoch": 2407} {"train_loss": -6.222939491271973, "global_step": 101123, "epoch": 2407} {"train_loss": -6.224212646484375, "global_step": 101124, "epoch": 2407} {"train_loss": -6.274683952331543, "global_step": 101125, "epoch": 2407} {"train_loss": -6.232706069946289, "global_step": 101126, "epoch": 2407} {"train_loss": -6.347336292266846, "global_step": 101127, "epoch": 2407} {"train_loss": -6.129613399505615, "global_step": 101128, "epoch": 2407} {"train_loss": -6.45362663269043, "global_step": 101129, "epoch": 2407} {"train_loss": -6.285549640655518, "global_step": 101130, "epoch": 2407} {"train_loss": -6.394844055175781, "global_step": 101131, "epoch": 2407} {"train_loss": -6.191946983337402, "global_step": 101132, "epoch": 2407} {"train_loss": -6.332233428955078, "global_step": 101133, "epoch": 2407} {"train_loss": -6.389476776123047, "global_step": 101134, "epoch": 2407} {"train_loss": -6.315041962124052, "global_step": 101135, "epoch": 2407, "val_loss": 64158.2734375} {"train_loss": -6.367631912231445, "global_step": 101136, "epoch": 2408} {"train_loss": -6.371347427368164, "global_step": 101137, "epoch": 2408} {"train_loss": -6.297892093658447, "global_step": 101138, "epoch": 2408} {"train_loss": -6.390623092651367, "global_step": 101139, "epoch": 2408} {"train_loss": -6.358114242553711, "global_step": 101140, "epoch": 2408} {"train_loss": -6.458456039428711, "global_step": 101141, "epoch": 2408} {"train_loss": -6.37214994430542, "global_step": 101142, "epoch": 2408} {"train_loss": -6.4176249504089355, "global_step": 101143, "epoch": 2408} {"train_loss": -6.293450355529785, "global_step": 101144, "epoch": 2408} {"train_loss": -6.373668670654297, "global_step": 101145, "epoch": 2408} {"train_loss": -6.464977264404297, "global_step": 101146, "epoch": 2408} {"train_loss": -6.451513290405273, "global_step": 101147, "epoch": 2408} {"train_loss": -6.365408897399902, "global_step": 101148, "epoch": 2408} {"train_loss": -6.3843278884887695, "global_step": 101149, "epoch": 2408} {"train_loss": -6.427183151245117, "global_step": 101150, "epoch": 2408} {"train_loss": -6.343565940856934, "global_step": 101151, "epoch": 2408} {"train_loss": -6.384470462799072, "global_step": 101152, "epoch": 2408} {"train_loss": -6.324081897735596, "global_step": 101153, "epoch": 2408} {"train_loss": -6.436261177062988, "global_step": 101154, "epoch": 2408} {"train_loss": -6.371110439300537, "global_step": 101155, "epoch": 2408} {"train_loss": -6.431786060333252, "global_step": 101156, "epoch": 2408} {"train_loss": -6.370909214019775, "global_step": 101157, "epoch": 2408} {"train_loss": -6.3802876472473145, "global_step": 101158, "epoch": 2408} {"train_loss": -6.30985164642334, "global_step": 101159, "epoch": 2408} {"train_loss": -6.44992733001709, "global_step": 101160, "epoch": 2408} {"train_loss": -6.3332037925720215, "global_step": 101161, "epoch": 2408} {"train_loss": -6.290783882141113, "global_step": 101162, "epoch": 2408} {"train_loss": -6.3890533447265625, "global_step": 101163, "epoch": 2408} {"train_loss": -6.254520416259766, "global_step": 101164, "epoch": 2408} {"train_loss": -6.343463897705078, "global_step": 101165, "epoch": 2408} {"train_loss": -6.362269878387451, "global_step": 101166, "epoch": 2408} {"train_loss": -6.360348701477051, "global_step": 101167, "epoch": 2408} {"train_loss": -6.307806015014648, "global_step": 101168, "epoch": 2408} {"train_loss": -6.2884063720703125, "global_step": 101169, "epoch": 2408} {"train_loss": -6.2814788818359375, "global_step": 101170, "epoch": 2408} {"train_loss": -6.4156036376953125, "global_step": 101171, "epoch": 2408} {"train_loss": -6.322502613067627, "global_step": 101172, "epoch": 2408} {"train_loss": -6.510876655578613, "global_step": 101173, "epoch": 2408} {"train_loss": -6.377711772918701, "global_step": 101174, "epoch": 2408} {"train_loss": -6.368928909301758, "global_step": 101175, "epoch": 2408} {"train_loss": -6.3073930740356445, "global_step": 101176, "epoch": 2408} {"train_loss": -6.36821114449274, "global_step": 101177, "epoch": 2408, "val_loss": 64050.890625} {"train_loss": -6.292098045349121, "global_step": 101178, "epoch": 2409} {"train_loss": -6.390322685241699, "global_step": 101179, "epoch": 2409} {"train_loss": -6.466554641723633, "global_step": 101180, "epoch": 2409} {"train_loss": -6.372315406799316, "global_step": 101181, "epoch": 2409} {"train_loss": -6.3443756103515625, "global_step": 101182, "epoch": 2409} {"train_loss": -6.307929992675781, "global_step": 101183, "epoch": 2409} {"train_loss": -6.278191089630127, "global_step": 101184, "epoch": 2409} {"train_loss": -6.453321933746338, "global_step": 101185, "epoch": 2409} {"train_loss": -6.210536479949951, "global_step": 101186, "epoch": 2409} {"train_loss": -6.302077293395996, "global_step": 101187, "epoch": 2409} {"train_loss": -6.374899864196777, "global_step": 101188, "epoch": 2409} {"train_loss": -6.361183166503906, "global_step": 101189, "epoch": 2409} {"train_loss": -6.416619777679443, "global_step": 101190, "epoch": 2409} {"train_loss": -6.345582008361816, "global_step": 101191, "epoch": 2409} {"train_loss": -6.430018424987793, "global_step": 101192, "epoch": 2409} {"train_loss": -6.43283224105835, "global_step": 101193, "epoch": 2409} {"train_loss": -6.509073257446289, "global_step": 101194, "epoch": 2409} {"train_loss": -6.358222007751465, "global_step": 101195, "epoch": 2409} {"train_loss": -6.370102882385254, "global_step": 101196, "epoch": 2409} {"train_loss": -6.479233741760254, "global_step": 101197, "epoch": 2409} {"train_loss": -6.379774570465088, "global_step": 101198, "epoch": 2409} {"train_loss": -6.368000030517578, "global_step": 101199, "epoch": 2409} {"train_loss": -6.357769966125488, "global_step": 101200, "epoch": 2409} {"train_loss": -6.439619541168213, "global_step": 101201, "epoch": 2409} {"train_loss": -6.428677082061768, "global_step": 101202, "epoch": 2409} {"train_loss": -6.39870023727417, "global_step": 101203, "epoch": 2409} {"train_loss": -6.336954116821289, "global_step": 101204, "epoch": 2409} {"train_loss": -6.270318984985352, "global_step": 101205, "epoch": 2409} {"train_loss": -6.388692378997803, "global_step": 101206, "epoch": 2409} {"train_loss": -6.36483097076416, "global_step": 101207, "epoch": 2409} {"train_loss": -6.387500762939453, "global_step": 101208, "epoch": 2409} {"train_loss": -6.453573226928711, "global_step": 101209, "epoch": 2409} {"train_loss": -6.289557456970215, "global_step": 101210, "epoch": 2409} {"train_loss": -6.474247932434082, "global_step": 101211, "epoch": 2409} {"train_loss": -6.344679832458496, "global_step": 101212, "epoch": 2409} {"train_loss": -6.360410690307617, "global_step": 101213, "epoch": 2409} {"train_loss": -6.506631851196289, "global_step": 101214, "epoch": 2409} {"train_loss": -6.371423244476318, "global_step": 101215, "epoch": 2409} {"train_loss": -6.386955261230469, "global_step": 101216, "epoch": 2409} {"train_loss": -6.371201992034912, "global_step": 101217, "epoch": 2409} {"train_loss": -6.2875895500183105, "global_step": 101218, "epoch": 2409} {"train_loss": -6.374844596499488, "global_step": 101219, "epoch": 2409, "val_loss": 64366.64453125} {"train_loss": -6.4139251708984375, "global_step": 101220, "epoch": 2410} {"train_loss": -6.382935523986816, "global_step": 101221, "epoch": 2410} {"train_loss": -6.227981090545654, "global_step": 101222, "epoch": 2410} {"train_loss": -6.288842678070068, "global_step": 101223, "epoch": 2410} {"train_loss": -6.38932466506958, "global_step": 101224, "epoch": 2410} {"train_loss": -6.327369689941406, "global_step": 101225, "epoch": 2410} {"train_loss": -6.517831802368164, "global_step": 101226, "epoch": 2410} {"train_loss": -6.290872573852539, "global_step": 101227, "epoch": 2410} {"train_loss": -6.351670742034912, "global_step": 101228, "epoch": 2410} {"train_loss": -6.3723297119140625, "global_step": 101229, "epoch": 2410} {"train_loss": -6.207891464233398, "global_step": 101230, "epoch": 2410} {"train_loss": -6.470164775848389, "global_step": 101231, "epoch": 2410} {"train_loss": -6.177031517028809, "global_step": 101232, "epoch": 2410} {"train_loss": -6.3929219245910645, "global_step": 101233, "epoch": 2410} {"train_loss": -6.373322486877441, "global_step": 101234, "epoch": 2410} {"train_loss": -6.374421119689941, "global_step": 101235, "epoch": 2410} {"train_loss": -6.385481834411621, "global_step": 101236, "epoch": 2410} {"train_loss": -6.392157077789307, "global_step": 101237, "epoch": 2410} {"train_loss": -6.339077472686768, "global_step": 101238, "epoch": 2410} {"train_loss": -6.433429718017578, "global_step": 101239, "epoch": 2410} {"train_loss": -6.344120979309082, "global_step": 101240, "epoch": 2410} {"train_loss": -6.454599857330322, "global_step": 101241, "epoch": 2410} {"train_loss": -6.369462490081787, "global_step": 101242, "epoch": 2410} {"train_loss": -6.404130935668945, "global_step": 101243, "epoch": 2410} {"train_loss": -6.299973011016846, "global_step": 101244, "epoch": 2410} {"train_loss": -6.483631610870361, "global_step": 101245, "epoch": 2410} {"train_loss": -6.337428092956543, "global_step": 101246, "epoch": 2410} {"train_loss": -6.377984523773193, "global_step": 101247, "epoch": 2410} {"train_loss": -6.516425132751465, "global_step": 101248, "epoch": 2410} {"train_loss": -6.26377534866333, "global_step": 101249, "epoch": 2410} {"train_loss": -6.405726432800293, "global_step": 101250, "epoch": 2410} {"train_loss": -6.399530410766602, "global_step": 101251, "epoch": 2410} {"train_loss": -6.3331499099731445, "global_step": 101252, "epoch": 2410} {"train_loss": -6.308239936828613, "global_step": 101253, "epoch": 2410} {"train_loss": -6.462103843688965, "global_step": 101254, "epoch": 2410} {"train_loss": -6.292140483856201, "global_step": 101255, "epoch": 2410} {"train_loss": -6.230311870574951, "global_step": 101256, "epoch": 2410} {"train_loss": -6.343437671661377, "global_step": 101257, "epoch": 2410} {"train_loss": -6.338888168334961, "global_step": 101258, "epoch": 2410} {"train_loss": -6.386587142944336, "global_step": 101259, "epoch": 2410} {"train_loss": -6.438148498535156, "global_step": 101260, "epoch": 2410} {"train_loss": -6.362161182221913, "global_step": 101261, "epoch": 2410, "val_loss": 64284.15625} {"train_loss": -6.238109111785889, "global_step": 101262, "epoch": 2411} {"train_loss": -6.458243370056152, "global_step": 101263, "epoch": 2411} {"train_loss": -6.3025407791137695, "global_step": 101264, "epoch": 2411} {"train_loss": -6.322495460510254, "global_step": 101265, "epoch": 2411} {"train_loss": -6.334141731262207, "global_step": 101266, "epoch": 2411} {"train_loss": -6.294041633605957, "global_step": 101267, "epoch": 2411} {"train_loss": -6.329181671142578, "global_step": 101268, "epoch": 2411} {"train_loss": -6.379447937011719, "global_step": 101269, "epoch": 2411} {"train_loss": -6.3022260665893555, "global_step": 101270, "epoch": 2411} {"train_loss": -6.393766403198242, "global_step": 101271, "epoch": 2411} {"train_loss": -6.306568622589111, "global_step": 101272, "epoch": 2411} {"train_loss": -6.362473964691162, "global_step": 101273, "epoch": 2411} {"train_loss": -6.3199076652526855, "global_step": 101274, "epoch": 2411} {"train_loss": -6.397538185119629, "global_step": 101275, "epoch": 2411} {"train_loss": -6.428127765655518, "global_step": 101276, "epoch": 2411} {"train_loss": -6.300564289093018, "global_step": 101277, "epoch": 2411} {"train_loss": -6.458273887634277, "global_step": 101278, "epoch": 2411} {"train_loss": -6.440840721130371, "global_step": 101279, "epoch": 2411} {"train_loss": -6.479182243347168, "global_step": 101280, "epoch": 2411} {"train_loss": -6.329278469085693, "global_step": 101281, "epoch": 2411} {"train_loss": -6.396701335906982, "global_step": 101282, "epoch": 2411} {"train_loss": -6.422213554382324, "global_step": 101283, "epoch": 2411} {"train_loss": -6.462357521057129, "global_step": 101284, "epoch": 2411} {"train_loss": -6.434874534606934, "global_step": 101285, "epoch": 2411} {"train_loss": -6.422696590423584, "global_step": 101286, "epoch": 2411} {"train_loss": -6.367721080780029, "global_step": 101287, "epoch": 2411} {"train_loss": -6.379991054534912, "global_step": 101288, "epoch": 2411} {"train_loss": -6.336028575897217, "global_step": 101289, "epoch": 2411} {"train_loss": -6.338206768035889, "global_step": 101290, "epoch": 2411} {"train_loss": -6.247751712799072, "global_step": 101291, "epoch": 2411} {"train_loss": -6.486947059631348, "global_step": 101292, "epoch": 2411} {"train_loss": -6.512078285217285, "global_step": 101293, "epoch": 2411} {"train_loss": -6.396958351135254, "global_step": 101294, "epoch": 2411} {"train_loss": -6.386701583862305, "global_step": 101295, "epoch": 2411} {"train_loss": -6.429337978363037, "global_step": 101296, "epoch": 2411} {"train_loss": -6.461802005767822, "global_step": 101297, "epoch": 2411} {"train_loss": -6.402767658233643, "global_step": 101298, "epoch": 2411} {"train_loss": -6.274077892303467, "global_step": 101299, "epoch": 2411} {"train_loss": -6.453732490539551, "global_step": 101300, "epoch": 2411} {"train_loss": -6.463822364807129, "global_step": 101301, "epoch": 2411} {"train_loss": -6.444792747497559, "global_step": 101302, "epoch": 2411} {"train_loss": -6.3820875485738116, "global_step": 101303, "epoch": 2411, "val_loss": 64094.44921875} {"train_loss": -6.3220672607421875, "global_step": 101304, "epoch": 2412} {"train_loss": -6.468897819519043, "global_step": 101305, "epoch": 2412} {"train_loss": -6.483551979064941, "global_step": 101306, "epoch": 2412} {"train_loss": -6.383369445800781, "global_step": 101307, "epoch": 2412} {"train_loss": -6.365426540374756, "global_step": 101308, "epoch": 2412} {"train_loss": -6.442227363586426, "global_step": 101309, "epoch": 2412} {"train_loss": -6.4654107093811035, "global_step": 101310, "epoch": 2412} {"train_loss": -6.409046173095703, "global_step": 101311, "epoch": 2412} {"train_loss": -6.377006530761719, "global_step": 101312, "epoch": 2412} {"train_loss": -6.390649795532227, "global_step": 101313, "epoch": 2412} {"train_loss": -6.573886871337891, "global_step": 101314, "epoch": 2412} {"train_loss": -6.58483362197876, "global_step": 101315, "epoch": 2412} {"train_loss": -6.385904312133789, "global_step": 101316, "epoch": 2412} {"train_loss": -6.407337665557861, "global_step": 101317, "epoch": 2412} {"train_loss": -6.365141868591309, "global_step": 101318, "epoch": 2412} {"train_loss": -6.3345842361450195, "global_step": 101319, "epoch": 2412} {"train_loss": -6.445402145385742, "global_step": 101320, "epoch": 2412} {"train_loss": -6.491497039794922, "global_step": 101321, "epoch": 2412} {"train_loss": -6.341734886169434, "global_step": 101322, "epoch": 2412} {"train_loss": -6.437748908996582, "global_step": 101323, "epoch": 2412} {"train_loss": -6.537393093109131, "global_step": 101324, "epoch": 2412} {"train_loss": -6.441701889038086, "global_step": 101325, "epoch": 2412} {"train_loss": -6.31866455078125, "global_step": 101326, "epoch": 2412} {"train_loss": -6.575186729431152, "global_step": 101327, "epoch": 2412} {"train_loss": -6.4433746337890625, "global_step": 101328, "epoch": 2412} {"train_loss": -6.424924373626709, "global_step": 101329, "epoch": 2412} {"train_loss": -6.422582626342773, "global_step": 101330, "epoch": 2412} {"train_loss": -6.401093482971191, "global_step": 101331, "epoch": 2412} {"train_loss": -6.338550567626953, "global_step": 101332, "epoch": 2412} {"train_loss": -6.295071125030518, "global_step": 101333, "epoch": 2412} {"train_loss": -6.356457710266113, "global_step": 101334, "epoch": 2412} {"train_loss": -6.435299873352051, "global_step": 101335, "epoch": 2412} {"train_loss": -6.400468826293945, "global_step": 101336, "epoch": 2412} {"train_loss": -6.499523162841797, "global_step": 101337, "epoch": 2412} {"train_loss": -6.494726181030273, "global_step": 101338, "epoch": 2412} {"train_loss": -6.362431049346924, "global_step": 101339, "epoch": 2412} {"train_loss": -6.404311180114746, "global_step": 101340, "epoch": 2412} {"train_loss": -6.546359062194824, "global_step": 101341, "epoch": 2412} {"train_loss": -6.349726676940918, "global_step": 101342, "epoch": 2412} {"train_loss": -6.443149089813232, "global_step": 101343, "epoch": 2412} {"train_loss": -6.39998197555542, "global_step": 101344, "epoch": 2412} {"train_loss": -6.424419051124936, "global_step": 101345, "epoch": 2412, "val_loss": 64217.62109375} {"train_loss": -6.378347873687744, "global_step": 101346, "epoch": 2413} {"train_loss": -6.454592704772949, "global_step": 101347, "epoch": 2413} {"train_loss": -6.34758996963501, "global_step": 101348, "epoch": 2413} {"train_loss": -6.3792877197265625, "global_step": 101349, "epoch": 2413} {"train_loss": -6.516110420227051, "global_step": 101350, "epoch": 2413} {"train_loss": -6.500314712524414, "global_step": 101351, "epoch": 2413} {"train_loss": -6.527507781982422, "global_step": 101352, "epoch": 2413} {"train_loss": -6.462300777435303, "global_step": 101353, "epoch": 2413} {"train_loss": -6.439897060394287, "global_step": 101354, "epoch": 2413} {"train_loss": -6.40824031829834, "global_step": 101355, "epoch": 2413} {"train_loss": -6.412336349487305, "global_step": 101356, "epoch": 2413} {"train_loss": -6.369926929473877, "global_step": 101357, "epoch": 2413} {"train_loss": -6.383012771606445, "global_step": 101358, "epoch": 2413} {"train_loss": -6.348358154296875, "global_step": 101359, "epoch": 2413} {"train_loss": -6.310884952545166, "global_step": 101360, "epoch": 2413} {"train_loss": -6.432855606079102, "global_step": 101361, "epoch": 2413} {"train_loss": -6.318887710571289, "global_step": 101362, "epoch": 2413} {"train_loss": -6.31178617477417, "global_step": 101363, "epoch": 2413} {"train_loss": -6.317682266235352, "global_step": 101364, "epoch": 2413} {"train_loss": -6.429316520690918, "global_step": 101365, "epoch": 2413} {"train_loss": -6.343453884124756, "global_step": 101366, "epoch": 2413} {"train_loss": -6.331048011779785, "global_step": 101367, "epoch": 2413} {"train_loss": -6.363920211791992, "global_step": 101368, "epoch": 2413} {"train_loss": -6.320677757263184, "global_step": 101369, "epoch": 2413} {"train_loss": -6.388918876647949, "global_step": 101370, "epoch": 2413} {"train_loss": -6.226004600524902, "global_step": 101371, "epoch": 2413} {"train_loss": -6.3585286140441895, "global_step": 101372, "epoch": 2413} {"train_loss": -6.361480712890625, "global_step": 101373, "epoch": 2413} {"train_loss": -6.283709526062012, "global_step": 101374, "epoch": 2413} {"train_loss": -6.516814231872559, "global_step": 101375, "epoch": 2413} {"train_loss": -6.3711161613464355, "global_step": 101376, "epoch": 2413} {"train_loss": -6.360631942749023, "global_step": 101377, "epoch": 2413} {"train_loss": -6.399622917175293, "global_step": 101378, "epoch": 2413} {"train_loss": -6.3377766609191895, "global_step": 101379, "epoch": 2413} {"train_loss": -6.358272552490234, "global_step": 101380, "epoch": 2413} {"train_loss": -6.437273025512695, "global_step": 101381, "epoch": 2413} {"train_loss": -6.337136745452881, "global_step": 101382, "epoch": 2413} {"train_loss": -6.353265285491943, "global_step": 101383, "epoch": 2413} {"train_loss": -6.476408004760742, "global_step": 101384, "epoch": 2413} {"train_loss": -6.368813514709473, "global_step": 101385, "epoch": 2413} {"train_loss": -6.368338584899902, "global_step": 101386, "epoch": 2413} {"train_loss": -6.384423267273676, "global_step": 101387, "epoch": 2413, "val_loss": 64192.33984375} {"train_loss": -6.425637245178223, "global_step": 101388, "epoch": 2414} {"train_loss": -6.427767753601074, "global_step": 101389, "epoch": 2414} {"train_loss": -6.439912796020508, "global_step": 101390, "epoch": 2414} {"train_loss": -6.357175350189209, "global_step": 101391, "epoch": 2414} {"train_loss": -6.420926570892334, "global_step": 101392, "epoch": 2414} {"train_loss": -6.373993396759033, "global_step": 101393, "epoch": 2414} {"train_loss": -6.345439910888672, "global_step": 101394, "epoch": 2414} {"train_loss": -6.3922200202941895, "global_step": 101395, "epoch": 2414} {"train_loss": -6.340195655822754, "global_step": 101396, "epoch": 2414} {"train_loss": -6.294696807861328, "global_step": 101397, "epoch": 2414} {"train_loss": -6.411012172698975, "global_step": 101398, "epoch": 2414} {"train_loss": -6.403669834136963, "global_step": 101399, "epoch": 2414} {"train_loss": -6.338258743286133, "global_step": 101400, "epoch": 2414} {"train_loss": -6.540550231933594, "global_step": 101401, "epoch": 2414} {"train_loss": -6.326178550720215, "global_step": 101402, "epoch": 2414} {"train_loss": -6.333998680114746, "global_step": 101403, "epoch": 2414} {"train_loss": -6.386051654815674, "global_step": 101404, "epoch": 2414} {"train_loss": -6.306118965148926, "global_step": 101405, "epoch": 2414} {"train_loss": -6.3312530517578125, "global_step": 101406, "epoch": 2414} {"train_loss": -6.401492595672607, "global_step": 101407, "epoch": 2414} {"train_loss": -6.291516304016113, "global_step": 101408, "epoch": 2414} {"train_loss": -6.352126121520996, "global_step": 101409, "epoch": 2414} {"train_loss": -6.392321586608887, "global_step": 101410, "epoch": 2414} {"train_loss": -6.409006118774414, "global_step": 101411, "epoch": 2414} {"train_loss": -6.325078964233398, "global_step": 101412, "epoch": 2414} {"train_loss": -6.314157485961914, "global_step": 101413, "epoch": 2414} {"train_loss": -6.293942451477051, "global_step": 101414, "epoch": 2414} {"train_loss": -6.219325542449951, "global_step": 101415, "epoch": 2414} {"train_loss": -6.391991138458252, "global_step": 101416, "epoch": 2414} {"train_loss": -6.359435081481934, "global_step": 101417, "epoch": 2414} {"train_loss": -6.293010234832764, "global_step": 101418, "epoch": 2414} {"train_loss": -6.385412216186523, "global_step": 101419, "epoch": 2414} {"train_loss": -6.326926231384277, "global_step": 101420, "epoch": 2414} {"train_loss": -6.231586456298828, "global_step": 101421, "epoch": 2414} {"train_loss": -6.421365261077881, "global_step": 101422, "epoch": 2414} {"train_loss": -6.214273452758789, "global_step": 101423, "epoch": 2414} {"train_loss": -6.297936916351318, "global_step": 101424, "epoch": 2414} {"train_loss": -6.3172502517700195, "global_step": 101425, "epoch": 2414} {"train_loss": -6.346798419952393, "global_step": 101426, "epoch": 2414} {"train_loss": -6.252758979797363, "global_step": 101427, "epoch": 2414} {"train_loss": -6.250925064086914, "global_step": 101428, "epoch": 2414} {"train_loss": -6.347696542739868, "global_step": 101429, "epoch": 2414, "val_loss": 64098.90234375} {"train_loss": -6.340061187744141, "global_step": 101430, "epoch": 2415} {"train_loss": -6.399694442749023, "global_step": 101431, "epoch": 2415} {"train_loss": -6.3912434577941895, "global_step": 101432, "epoch": 2415} {"train_loss": -6.365370273590088, "global_step": 101433, "epoch": 2415} {"train_loss": -6.355992794036865, "global_step": 101434, "epoch": 2415} {"train_loss": -6.370203971862793, "global_step": 101435, "epoch": 2415} {"train_loss": -6.297964572906494, "global_step": 101436, "epoch": 2415} {"train_loss": -6.331357002258301, "global_step": 101437, "epoch": 2415} {"train_loss": -6.216215133666992, "global_step": 101438, "epoch": 2415} {"train_loss": -6.396999359130859, "global_step": 101439, "epoch": 2415} {"train_loss": -6.372344970703125, "global_step": 101440, "epoch": 2415} {"train_loss": -6.287635803222656, "global_step": 101441, "epoch": 2415} {"train_loss": -6.421590805053711, "global_step": 101442, "epoch": 2415} {"train_loss": -6.434576988220215, "global_step": 101443, "epoch": 2415} {"train_loss": -6.218834400177002, "global_step": 101444, "epoch": 2415} {"train_loss": -6.334489822387695, "global_step": 101445, "epoch": 2415} {"train_loss": -6.400808811187744, "global_step": 101446, "epoch": 2415} {"train_loss": -6.397090435028076, "global_step": 101447, "epoch": 2415} {"train_loss": -6.380768775939941, "global_step": 101448, "epoch": 2415} {"train_loss": -6.34807014465332, "global_step": 101449, "epoch": 2415} {"train_loss": -6.222857475280762, "global_step": 101450, "epoch": 2415} {"train_loss": -6.271995544433594, "global_step": 101451, "epoch": 2415} {"train_loss": -6.384855270385742, "global_step": 101452, "epoch": 2415} {"train_loss": -6.340090751647949, "global_step": 101453, "epoch": 2415} {"train_loss": -6.328556060791016, "global_step": 101454, "epoch": 2415} {"train_loss": -6.320042133331299, "global_step": 101455, "epoch": 2415} {"train_loss": -6.321144104003906, "global_step": 101456, "epoch": 2415} {"train_loss": -6.434840679168701, "global_step": 101457, "epoch": 2415} {"train_loss": -6.276092529296875, "global_step": 101458, "epoch": 2415} {"train_loss": -6.467371940612793, "global_step": 101459, "epoch": 2415} {"train_loss": -6.410733222961426, "global_step": 101460, "epoch": 2415} {"train_loss": -6.4544291496276855, "global_step": 101461, "epoch": 2415} {"train_loss": -6.442100524902344, "global_step": 101462, "epoch": 2415} {"train_loss": -6.422469139099121, "global_step": 101463, "epoch": 2415} {"train_loss": -6.281986236572266, "global_step": 101464, "epoch": 2415} {"train_loss": -6.431175231933594, "global_step": 101465, "epoch": 2415} {"train_loss": -6.278243064880371, "global_step": 101466, "epoch": 2415} {"train_loss": -6.267038345336914, "global_step": 101467, "epoch": 2415} {"train_loss": -6.471428871154785, "global_step": 101468, "epoch": 2415} {"train_loss": -6.21217155456543, "global_step": 101469, "epoch": 2415} {"train_loss": -6.483456134796143, "global_step": 101470, "epoch": 2415} {"train_loss": -6.356476045790172, "global_step": 101471, "epoch": 2415, "val_loss": 64510.734375} {"train_loss": -6.354247093200684, "global_step": 101472, "epoch": 2416} {"train_loss": -6.374326229095459, "global_step": 101473, "epoch": 2416} {"train_loss": -6.31912088394165, "global_step": 101474, "epoch": 2416} {"train_loss": -6.398988723754883, "global_step": 101475, "epoch": 2416} {"train_loss": -6.381926536560059, "global_step": 101476, "epoch": 2416} {"train_loss": -6.364930152893066, "global_step": 101477, "epoch": 2416} {"train_loss": -6.355696678161621, "global_step": 101478, "epoch": 2416} {"train_loss": -6.331293106079102, "global_step": 101479, "epoch": 2416} {"train_loss": -6.325554370880127, "global_step": 101480, "epoch": 2416} {"train_loss": -6.283882141113281, "global_step": 101481, "epoch": 2416} {"train_loss": -6.427632808685303, "global_step": 101482, "epoch": 2416} {"train_loss": -6.314759731292725, "global_step": 101483, "epoch": 2416} {"train_loss": -6.391179084777832, "global_step": 101484, "epoch": 2416} {"train_loss": -6.391823768615723, "global_step": 101485, "epoch": 2416} {"train_loss": -6.384406089782715, "global_step": 101486, "epoch": 2416} {"train_loss": -6.316314220428467, "global_step": 101487, "epoch": 2416} {"train_loss": -6.3031086921691895, "global_step": 101488, "epoch": 2416} {"train_loss": -6.445094585418701, "global_step": 101489, "epoch": 2416} {"train_loss": -6.270743370056152, "global_step": 101490, "epoch": 2416} {"train_loss": -6.266473293304443, "global_step": 101491, "epoch": 2416} {"train_loss": -6.370380878448486, "global_step": 101492, "epoch": 2416} {"train_loss": -6.391522407531738, "global_step": 101493, "epoch": 2416} {"train_loss": -6.510255813598633, "global_step": 101494, "epoch": 2416} {"train_loss": -6.408289909362793, "global_step": 101495, "epoch": 2416} {"train_loss": -6.392307758331299, "global_step": 101496, "epoch": 2416} {"train_loss": -6.421435356140137, "global_step": 101497, "epoch": 2416} {"train_loss": -6.459170341491699, "global_step": 101498, "epoch": 2416} {"train_loss": -6.4102020263671875, "global_step": 101499, "epoch": 2416} {"train_loss": -6.394624710083008, "global_step": 101500, "epoch": 2416} {"train_loss": -6.369747638702393, "global_step": 101501, "epoch": 2416} {"train_loss": -6.48358154296875, "global_step": 101502, "epoch": 2416} {"train_loss": -6.401109218597412, "global_step": 101503, "epoch": 2416} {"train_loss": -6.3635711669921875, "global_step": 101504, "epoch": 2416} {"train_loss": -6.454572677612305, "global_step": 101505, "epoch": 2416} {"train_loss": -6.415498733520508, "global_step": 101506, "epoch": 2416} {"train_loss": -6.396247863769531, "global_step": 101507, "epoch": 2416} {"train_loss": -6.372657775878906, "global_step": 101508, "epoch": 2416} {"train_loss": -6.356178283691406, "global_step": 101509, "epoch": 2416} {"train_loss": -6.50313138961792, "global_step": 101510, "epoch": 2416} {"train_loss": -6.3339996337890625, "global_step": 101511, "epoch": 2416} {"train_loss": -6.4467453956604, "global_step": 101512, "epoch": 2416} {"train_loss": -6.382002603440058, "global_step": 101513, "epoch": 2416, "val_loss": 64175.97265625} {"train_loss": -6.44663667678833, "global_step": 101514, "epoch": 2417} {"train_loss": -6.414252281188965, "global_step": 101515, "epoch": 2417} {"train_loss": -6.349038124084473, "global_step": 101516, "epoch": 2417} {"train_loss": -6.413444995880127, "global_step": 101517, "epoch": 2417} {"train_loss": -6.3164825439453125, "global_step": 101518, "epoch": 2417} {"train_loss": -6.426445960998535, "global_step": 101519, "epoch": 2417} {"train_loss": -6.554211616516113, "global_step": 101520, "epoch": 2417} {"train_loss": -6.34121036529541, "global_step": 101521, "epoch": 2417} {"train_loss": -6.364995002746582, "global_step": 101522, "epoch": 2417} {"train_loss": -6.305119037628174, "global_step": 101523, "epoch": 2417} {"train_loss": -6.500987529754639, "global_step": 101524, "epoch": 2417} {"train_loss": -6.347169876098633, "global_step": 101525, "epoch": 2417} {"train_loss": -6.375212669372559, "global_step": 101526, "epoch": 2417} {"train_loss": -6.348067760467529, "global_step": 101527, "epoch": 2417} {"train_loss": -6.479762077331543, "global_step": 101528, "epoch": 2417} {"train_loss": -6.3753557205200195, "global_step": 101529, "epoch": 2417} {"train_loss": -6.399712562561035, "global_step": 101530, "epoch": 2417} {"train_loss": -6.4534173011779785, "global_step": 101531, "epoch": 2417} {"train_loss": -6.308442115783691, "global_step": 101532, "epoch": 2417} {"train_loss": -6.528586387634277, "global_step": 101533, "epoch": 2417} {"train_loss": -6.448166370391846, "global_step": 101534, "epoch": 2417} {"train_loss": -6.338212966918945, "global_step": 101535, "epoch": 2417} {"train_loss": -6.296726703643799, "global_step": 101536, "epoch": 2417} {"train_loss": -6.417538642883301, "global_step": 101537, "epoch": 2417} {"train_loss": -6.380638122558594, "global_step": 101538, "epoch": 2417} {"train_loss": -6.456933975219727, "global_step": 101539, "epoch": 2417} {"train_loss": -6.315461158752441, "global_step": 101540, "epoch": 2417} {"train_loss": -6.469766139984131, "global_step": 101541, "epoch": 2417} {"train_loss": -6.383208274841309, "global_step": 101542, "epoch": 2417} {"train_loss": -6.510900020599365, "global_step": 101543, "epoch": 2417} {"train_loss": -6.28610897064209, "global_step": 101544, "epoch": 2417} {"train_loss": -6.2873358726501465, "global_step": 101545, "epoch": 2417} {"train_loss": -6.444174289703369, "global_step": 101546, "epoch": 2417} {"train_loss": -6.463356971740723, "global_step": 101547, "epoch": 2417} {"train_loss": -6.4782562255859375, "global_step": 101548, "epoch": 2417} {"train_loss": -6.35980224609375, "global_step": 101549, "epoch": 2417} {"train_loss": -6.414285659790039, "global_step": 101550, "epoch": 2417} {"train_loss": -6.421724796295166, "global_step": 101551, "epoch": 2417} {"train_loss": -6.342967987060547, "global_step": 101552, "epoch": 2417} {"train_loss": -6.36311149597168, "global_step": 101553, "epoch": 2417} {"train_loss": -6.450414180755615, "global_step": 101554, "epoch": 2417} {"train_loss": -6.400963374546596, "global_step": 101555, "epoch": 2417, "val_loss": 64169.12890625} {"train_loss": -6.389963150024414, "global_step": 101556, "epoch": 2418} {"train_loss": -6.438426971435547, "global_step": 101557, "epoch": 2418} {"train_loss": -6.394900321960449, "global_step": 101558, "epoch": 2418} {"train_loss": -6.4828643798828125, "global_step": 101559, "epoch": 2418} {"train_loss": -6.43850040435791, "global_step": 101560, "epoch": 2418} {"train_loss": -6.318656921386719, "global_step": 101561, "epoch": 2418} {"train_loss": -6.570617198944092, "global_step": 101562, "epoch": 2418} {"train_loss": -6.4025163650512695, "global_step": 101563, "epoch": 2418} {"train_loss": -6.2701544761657715, "global_step": 101564, "epoch": 2418} {"train_loss": -6.334550857543945, "global_step": 101565, "epoch": 2418} {"train_loss": -6.513161659240723, "global_step": 101566, "epoch": 2418} {"train_loss": -6.416741371154785, "global_step": 101567, "epoch": 2418} {"train_loss": -6.26048469543457, "global_step": 101568, "epoch": 2418} {"train_loss": -6.3391289710998535, "global_step": 101569, "epoch": 2418} {"train_loss": -6.417411804199219, "global_step": 101570, "epoch": 2418} {"train_loss": -6.218306064605713, "global_step": 101571, "epoch": 2418} {"train_loss": -6.313685417175293, "global_step": 101572, "epoch": 2418} {"train_loss": -6.22594690322876, "global_step": 101573, "epoch": 2418} {"train_loss": -6.218017578125, "global_step": 101574, "epoch": 2418} {"train_loss": -6.270812034606934, "global_step": 101575, "epoch": 2418} {"train_loss": -6.2869343757629395, "global_step": 101576, "epoch": 2418} {"train_loss": -6.259500980377197, "global_step": 101577, "epoch": 2418} {"train_loss": -6.303318023681641, "global_step": 101578, "epoch": 2418} {"train_loss": -6.392962455749512, "global_step": 101579, "epoch": 2418} {"train_loss": -6.301372051239014, "global_step": 101580, "epoch": 2418} {"train_loss": -6.38121223449707, "global_step": 101581, "epoch": 2418} {"train_loss": -6.398613929748535, "global_step": 101582, "epoch": 2418} {"train_loss": -6.2433905601501465, "global_step": 101583, "epoch": 2418} {"train_loss": -6.350763320922852, "global_step": 101584, "epoch": 2418} {"train_loss": -6.287415027618408, "global_step": 101585, "epoch": 2418} {"train_loss": -6.393553733825684, "global_step": 101586, "epoch": 2418} {"train_loss": -6.283949375152588, "global_step": 101587, "epoch": 2418} {"train_loss": -6.3502912521362305, "global_step": 101588, "epoch": 2418} {"train_loss": -6.294278144836426, "global_step": 101589, "epoch": 2418} {"train_loss": -6.31999397277832, "global_step": 101590, "epoch": 2418} {"train_loss": -6.385331153869629, "global_step": 101591, "epoch": 2418} {"train_loss": -6.393793106079102, "global_step": 101592, "epoch": 2418} {"train_loss": -6.5080647468566895, "global_step": 101593, "epoch": 2418} {"train_loss": -6.289227485656738, "global_step": 101594, "epoch": 2418} {"train_loss": -6.385685920715332, "global_step": 101595, "epoch": 2418} {"train_loss": -6.248002052307129, "global_step": 101596, "epoch": 2418} {"train_loss": -6.353153035754249, "global_step": 101597, "epoch": 2418, "val_loss": 64086.09765625} {"train_loss": -6.356950759887695, "global_step": 101598, "epoch": 2419} {"train_loss": -6.375174522399902, "global_step": 101599, "epoch": 2419} {"train_loss": -6.283870220184326, "global_step": 101600, "epoch": 2419} {"train_loss": -6.382232666015625, "global_step": 101601, "epoch": 2419} {"train_loss": -6.3786773681640625, "global_step": 101602, "epoch": 2419} {"train_loss": -6.462707042694092, "global_step": 101603, "epoch": 2419} {"train_loss": -6.338421821594238, "global_step": 101604, "epoch": 2419} {"train_loss": -6.4862165451049805, "global_step": 101605, "epoch": 2419} {"train_loss": -6.365961074829102, "global_step": 101606, "epoch": 2419} {"train_loss": -6.378552436828613, "global_step": 101607, "epoch": 2419} {"train_loss": -6.424422740936279, "global_step": 101608, "epoch": 2419} {"train_loss": -6.544788360595703, "global_step": 101609, "epoch": 2419} {"train_loss": -6.467394828796387, "global_step": 101610, "epoch": 2419} {"train_loss": -6.484168529510498, "global_step": 101611, "epoch": 2419} {"train_loss": -6.290305137634277, "global_step": 101612, "epoch": 2419} {"train_loss": -6.379352569580078, "global_step": 101613, "epoch": 2419} {"train_loss": -6.368268013000488, "global_step": 101614, "epoch": 2419} {"train_loss": -6.5025248527526855, "global_step": 101615, "epoch": 2419} {"train_loss": -6.390070915222168, "global_step": 101616, "epoch": 2419} {"train_loss": -6.355823516845703, "global_step": 101617, "epoch": 2419} {"train_loss": -6.28782320022583, "global_step": 101618, "epoch": 2419} {"train_loss": -6.376811981201172, "global_step": 101619, "epoch": 2419} {"train_loss": -6.303200721740723, "global_step": 101620, "epoch": 2419} {"train_loss": -6.494610786437988, "global_step": 101621, "epoch": 2419} {"train_loss": -6.476311683654785, "global_step": 101622, "epoch": 2419} {"train_loss": -6.580140113830566, "global_step": 101623, "epoch": 2419} {"train_loss": -6.281834602355957, "global_step": 101624, "epoch": 2419} {"train_loss": -6.429922103881836, "global_step": 101625, "epoch": 2419} {"train_loss": -6.362149238586426, "global_step": 101626, "epoch": 2419} {"train_loss": -6.4109578132629395, "global_step": 101627, "epoch": 2419} {"train_loss": -6.403834819793701, "global_step": 101628, "epoch": 2419} {"train_loss": -6.451958656311035, "global_step": 101629, "epoch": 2419} {"train_loss": -6.41398811340332, "global_step": 101630, "epoch": 2419} {"train_loss": -6.298755168914795, "global_step": 101631, "epoch": 2419} {"train_loss": -6.540963649749756, "global_step": 101632, "epoch": 2419} {"train_loss": -6.395919322967529, "global_step": 101633, "epoch": 2419} {"train_loss": -6.480917930603027, "global_step": 101634, "epoch": 2419} {"train_loss": -6.448916435241699, "global_step": 101635, "epoch": 2419} {"train_loss": -6.409314155578613, "global_step": 101636, "epoch": 2419} {"train_loss": -6.368110656738281, "global_step": 101637, "epoch": 2419} {"train_loss": -6.435155868530273, "global_step": 101638, "epoch": 2419} {"train_loss": -6.405979122434344, "global_step": 101639, "epoch": 2419, "val_loss": 64332.74609375} {"train_loss": -6.417113304138184, "global_step": 101640, "epoch": 2420} {"train_loss": -6.427303314208984, "global_step": 101641, "epoch": 2420} {"train_loss": -6.3720703125, "global_step": 101642, "epoch": 2420} {"train_loss": -6.379302978515625, "global_step": 101643, "epoch": 2420} {"train_loss": -6.407801628112793, "global_step": 101644, "epoch": 2420} {"train_loss": -6.393298149108887, "global_step": 101645, "epoch": 2420} {"train_loss": -6.393759727478027, "global_step": 101646, "epoch": 2420} {"train_loss": -6.235278606414795, "global_step": 101647, "epoch": 2420} {"train_loss": -6.288286209106445, "global_step": 101648, "epoch": 2420} {"train_loss": -6.369019985198975, "global_step": 101649, "epoch": 2420} {"train_loss": -6.404565334320068, "global_step": 101650, "epoch": 2420} {"train_loss": -6.3165435791015625, "global_step": 101651, "epoch": 2420} {"train_loss": -6.283403396606445, "global_step": 101652, "epoch": 2420} {"train_loss": -6.40507173538208, "global_step": 101653, "epoch": 2420} {"train_loss": -6.28533411026001, "global_step": 101654, "epoch": 2420} {"train_loss": -6.378410816192627, "global_step": 101655, "epoch": 2420} {"train_loss": -6.319729804992676, "global_step": 101656, "epoch": 2420} {"train_loss": -6.329371452331543, "global_step": 101657, "epoch": 2420} {"train_loss": -6.419168949127197, "global_step": 101658, "epoch": 2420} {"train_loss": -6.2690958976745605, "global_step": 101659, "epoch": 2420} {"train_loss": -6.266812801361084, "global_step": 101660, "epoch": 2420} {"train_loss": -6.395847320556641, "global_step": 101661, "epoch": 2420} {"train_loss": -6.434228420257568, "global_step": 101662, "epoch": 2420} {"train_loss": -6.334700584411621, "global_step": 101663, "epoch": 2420} {"train_loss": -6.429159164428711, "global_step": 101664, "epoch": 2420} {"train_loss": -6.342947483062744, "global_step": 101665, "epoch": 2420} {"train_loss": -6.383274078369141, "global_step": 101666, "epoch": 2420} {"train_loss": -6.347933769226074, "global_step": 101667, "epoch": 2420} {"train_loss": -6.354318618774414, "global_step": 101668, "epoch": 2420} {"train_loss": -6.380592346191406, "global_step": 101669, "epoch": 2420} {"train_loss": -6.392943382263184, "global_step": 101670, "epoch": 2420} {"train_loss": -6.353207111358643, "global_step": 101671, "epoch": 2420} {"train_loss": -6.377705097198486, "global_step": 101672, "epoch": 2420} {"train_loss": -6.301219940185547, "global_step": 101673, "epoch": 2420} {"train_loss": -6.541233062744141, "global_step": 101674, "epoch": 2420} {"train_loss": -6.391938209533691, "global_step": 101675, "epoch": 2420} {"train_loss": -6.345445156097412, "global_step": 101676, "epoch": 2420} {"train_loss": -6.394023418426514, "global_step": 101677, "epoch": 2420} {"train_loss": -6.3754401206970215, "global_step": 101678, "epoch": 2420} {"train_loss": -6.402900695800781, "global_step": 101679, "epoch": 2420} {"train_loss": -6.297282695770264, "global_step": 101680, "epoch": 2420} {"train_loss": -6.363626253037226, "global_step": 101681, "epoch": 2420, "val_loss": 64157.6171875} {"train_loss": -6.405333995819092, "global_step": 101682, "epoch": 2421} {"train_loss": -6.393314838409424, "global_step": 101683, "epoch": 2421} {"train_loss": -6.365605354309082, "global_step": 101684, "epoch": 2421} {"train_loss": -6.4339799880981445, "global_step": 101685, "epoch": 2421} {"train_loss": -6.480687141418457, "global_step": 101686, "epoch": 2421} {"train_loss": -6.453553676605225, "global_step": 101687, "epoch": 2421} {"train_loss": -6.36328125, "global_step": 101688, "epoch": 2421} {"train_loss": -6.236132621765137, "global_step": 101689, "epoch": 2421} {"train_loss": -6.392210006713867, "global_step": 101690, "epoch": 2421} {"train_loss": -6.3931565284729, "global_step": 101691, "epoch": 2421} {"train_loss": -6.363767623901367, "global_step": 101692, "epoch": 2421} {"train_loss": -6.416006565093994, "global_step": 101693, "epoch": 2421} {"train_loss": -6.460926055908203, "global_step": 101694, "epoch": 2421} {"train_loss": -6.397032260894775, "global_step": 101695, "epoch": 2421} {"train_loss": -6.4029221534729, "global_step": 101696, "epoch": 2421} {"train_loss": -6.415400505065918, "global_step": 101697, "epoch": 2421} {"train_loss": -6.3868889808654785, "global_step": 101698, "epoch": 2421} {"train_loss": -6.493391513824463, "global_step": 101699, "epoch": 2421} {"train_loss": -6.306858062744141, "global_step": 101700, "epoch": 2421} {"train_loss": -6.314945697784424, "global_step": 101701, "epoch": 2421} {"train_loss": -6.41261100769043, "global_step": 101702, "epoch": 2421} {"train_loss": -6.353640556335449, "global_step": 101703, "epoch": 2421} {"train_loss": -6.448788166046143, "global_step": 101704, "epoch": 2421} {"train_loss": -6.358137130737305, "global_step": 101705, "epoch": 2421} {"train_loss": -6.441777229309082, "global_step": 101706, "epoch": 2421} {"train_loss": -6.329805374145508, "global_step": 101707, "epoch": 2421} {"train_loss": -6.346026420593262, "global_step": 101708, "epoch": 2421} {"train_loss": -6.391155242919922, "global_step": 101709, "epoch": 2421} {"train_loss": -6.425461769104004, "global_step": 101710, "epoch": 2421} {"train_loss": -6.42580509185791, "global_step": 101711, "epoch": 2421} {"train_loss": -6.4074506759643555, "global_step": 101712, "epoch": 2421} {"train_loss": -6.406442165374756, "global_step": 101713, "epoch": 2421} {"train_loss": -6.408481121063232, "global_step": 101714, "epoch": 2421} {"train_loss": -6.457479953765869, "global_step": 101715, "epoch": 2421} {"train_loss": -6.422183990478516, "global_step": 101716, "epoch": 2421} {"train_loss": -6.474190711975098, "global_step": 101717, "epoch": 2421} {"train_loss": -6.473363876342773, "global_step": 101718, "epoch": 2421} {"train_loss": -6.3327531814575195, "global_step": 101719, "epoch": 2421} {"train_loss": -6.431632041931152, "global_step": 101720, "epoch": 2421} {"train_loss": -6.341437816619873, "global_step": 101721, "epoch": 2421} {"train_loss": -6.402682304382324, "global_step": 101722, "epoch": 2421} {"train_loss": -6.402318102972848, "global_step": 101723, "epoch": 2421, "val_loss": 64433.65234375} {"train_loss": -6.3772454261779785, "global_step": 101724, "epoch": 2422} {"train_loss": -6.33405065536499, "global_step": 101725, "epoch": 2422} {"train_loss": -6.264795303344727, "global_step": 101726, "epoch": 2422} {"train_loss": -6.374261856079102, "global_step": 101727, "epoch": 2422} {"train_loss": -6.547266960144043, "global_step": 101728, "epoch": 2422} {"train_loss": -6.3269758224487305, "global_step": 101729, "epoch": 2422} {"train_loss": -6.473038196563721, "global_step": 101730, "epoch": 2422} {"train_loss": -6.359523773193359, "global_step": 101731, "epoch": 2422} {"train_loss": -6.467874526977539, "global_step": 101732, "epoch": 2422} {"train_loss": -6.531979560852051, "global_step": 101733, "epoch": 2422} {"train_loss": -6.500949859619141, "global_step": 101734, "epoch": 2422} {"train_loss": -6.4392924308776855, "global_step": 101735, "epoch": 2422} {"train_loss": -6.483402729034424, "global_step": 101736, "epoch": 2422} {"train_loss": -6.517603874206543, "global_step": 101737, "epoch": 2422} {"train_loss": -6.307693004608154, "global_step": 101738, "epoch": 2422} {"train_loss": -6.38840389251709, "global_step": 101739, "epoch": 2422} {"train_loss": -6.427623748779297, "global_step": 101740, "epoch": 2422} {"train_loss": -6.37131929397583, "global_step": 101741, "epoch": 2422} {"train_loss": -6.389091968536377, "global_step": 101742, "epoch": 2422} {"train_loss": -6.517385482788086, "global_step": 101743, "epoch": 2422} {"train_loss": -6.367693901062012, "global_step": 101744, "epoch": 2422} {"train_loss": -6.3194475173950195, "global_step": 101745, "epoch": 2422} {"train_loss": -6.43296480178833, "global_step": 101746, "epoch": 2422} {"train_loss": -6.332310676574707, "global_step": 101747, "epoch": 2422} {"train_loss": -6.265546798706055, "global_step": 101748, "epoch": 2422} {"train_loss": -6.390237808227539, "global_step": 101749, "epoch": 2422} {"train_loss": -6.378866672515869, "global_step": 101750, "epoch": 2422} {"train_loss": -6.315561771392822, "global_step": 101751, "epoch": 2422} {"train_loss": -6.369938850402832, "global_step": 101752, "epoch": 2422} {"train_loss": -6.389411926269531, "global_step": 101753, "epoch": 2422} {"train_loss": -6.315549373626709, "global_step": 101754, "epoch": 2422} {"train_loss": -6.34147834777832, "global_step": 101755, "epoch": 2422} {"train_loss": -6.46143913269043, "global_step": 101756, "epoch": 2422} {"train_loss": -6.274444580078125, "global_step": 101757, "epoch": 2422} {"train_loss": -6.394137382507324, "global_step": 101758, "epoch": 2422} {"train_loss": -6.192320823669434, "global_step": 101759, "epoch": 2422} {"train_loss": -6.326362609863281, "global_step": 101760, "epoch": 2422} {"train_loss": -6.168450355529785, "global_step": 101761, "epoch": 2422} {"train_loss": -6.412517547607422, "global_step": 101762, "epoch": 2422} {"train_loss": -6.267514705657959, "global_step": 101763, "epoch": 2422} {"train_loss": -6.23258638381958, "global_step": 101764, "epoch": 2422} {"train_loss": -6.370444524855841, "global_step": 101765, "epoch": 2422, "val_loss": 64243.75390625} {"train_loss": -6.257807731628418, "global_step": 101766, "epoch": 2423} {"train_loss": -6.290156364440918, "global_step": 101767, "epoch": 2423} {"train_loss": -6.245104789733887, "global_step": 101768, "epoch": 2423} {"train_loss": -6.3108601570129395, "global_step": 101769, "epoch": 2423} {"train_loss": -6.188136100769043, "global_step": 101770, "epoch": 2423} {"train_loss": -6.352019786834717, "global_step": 101771, "epoch": 2423} {"train_loss": -6.1204328536987305, "global_step": 101772, "epoch": 2423} {"train_loss": -6.387188911437988, "global_step": 101773, "epoch": 2423} {"train_loss": -6.297680377960205, "global_step": 101774, "epoch": 2423} {"train_loss": -6.403690338134766, "global_step": 101775, "epoch": 2423} {"train_loss": -6.3149919509887695, "global_step": 101776, "epoch": 2423} {"train_loss": -6.27208137512207, "global_step": 101777, "epoch": 2423} {"train_loss": -6.295975685119629, "global_step": 101778, "epoch": 2423} {"train_loss": -6.300365447998047, "global_step": 101779, "epoch": 2423} {"train_loss": -6.389434337615967, "global_step": 101780, "epoch": 2423} {"train_loss": -6.256705284118652, "global_step": 101781, "epoch": 2423} {"train_loss": -6.263373374938965, "global_step": 101782, "epoch": 2423} {"train_loss": -6.278660774230957, "global_step": 101783, "epoch": 2423} {"train_loss": -6.252110004425049, "global_step": 101784, "epoch": 2423} {"train_loss": -6.372366905212402, "global_step": 101785, "epoch": 2423} {"train_loss": -6.41171932220459, "global_step": 101786, "epoch": 2423} {"train_loss": -6.297679901123047, "global_step": 101787, "epoch": 2423} {"train_loss": -6.233743190765381, "global_step": 101788, "epoch": 2423} {"train_loss": -6.4165802001953125, "global_step": 101789, "epoch": 2423} {"train_loss": -6.348705291748047, "global_step": 101790, "epoch": 2423} {"train_loss": -6.376851558685303, "global_step": 101791, "epoch": 2423} {"train_loss": -6.363354206085205, "global_step": 101792, "epoch": 2423} {"train_loss": -6.38667106628418, "global_step": 101793, "epoch": 2423} {"train_loss": -6.379619598388672, "global_step": 101794, "epoch": 2423} {"train_loss": -6.31000280380249, "global_step": 101795, "epoch": 2423} {"train_loss": -6.404784202575684, "global_step": 101796, "epoch": 2423} {"train_loss": -6.459142208099365, "global_step": 101797, "epoch": 2423} {"train_loss": -6.410340309143066, "global_step": 101798, "epoch": 2423} {"train_loss": -6.383342742919922, "global_step": 101799, "epoch": 2423} {"train_loss": -6.330626487731934, "global_step": 101800, "epoch": 2423} {"train_loss": -6.480976104736328, "global_step": 101801, "epoch": 2423} {"train_loss": -6.384191513061523, "global_step": 101802, "epoch": 2423} {"train_loss": -6.332696914672852, "global_step": 101803, "epoch": 2423} {"train_loss": -6.366398334503174, "global_step": 101804, "epoch": 2423} {"train_loss": -6.427994251251221, "global_step": 101805, "epoch": 2423} {"train_loss": -6.247076034545898, "global_step": 101806, "epoch": 2423} {"train_loss": -6.334160407384236, "global_step": 101807, "epoch": 2423, "val_loss": 64433.31640625} {"train_loss": -6.356407165527344, "global_step": 101808, "epoch": 2424} {"train_loss": -6.413869857788086, "global_step": 101809, "epoch": 2424} {"train_loss": -6.348026752471924, "global_step": 101810, "epoch": 2424} {"train_loss": -6.277177810668945, "global_step": 101811, "epoch": 2424} {"train_loss": -6.433145046234131, "global_step": 101812, "epoch": 2424} {"train_loss": -6.341997146606445, "global_step": 101813, "epoch": 2424} {"train_loss": -6.419868469238281, "global_step": 101814, "epoch": 2424} {"train_loss": -6.441694259643555, "global_step": 101815, "epoch": 2424} {"train_loss": -6.370171546936035, "global_step": 101816, "epoch": 2424} {"train_loss": -6.439487934112549, "global_step": 101817, "epoch": 2424} {"train_loss": -6.392904281616211, "global_step": 101818, "epoch": 2424} {"train_loss": -6.380471229553223, "global_step": 101819, "epoch": 2424} {"train_loss": -6.330686569213867, "global_step": 101820, "epoch": 2424} {"train_loss": -6.364565849304199, "global_step": 101821, "epoch": 2424} {"train_loss": -6.368650913238525, "global_step": 101822, "epoch": 2424} {"train_loss": -6.432336807250977, "global_step": 101823, "epoch": 2424} {"train_loss": -6.238173484802246, "global_step": 101824, "epoch": 2424} {"train_loss": -6.400608062744141, "global_step": 101825, "epoch": 2424} {"train_loss": -6.395652770996094, "global_step": 101826, "epoch": 2424} {"train_loss": -6.339212894439697, "global_step": 101827, "epoch": 2424} {"train_loss": -6.44231653213501, "global_step": 101828, "epoch": 2424} {"train_loss": -6.3719162940979, "global_step": 101829, "epoch": 2424} {"train_loss": -6.5715742111206055, "global_step": 101830, "epoch": 2424} {"train_loss": -6.390049934387207, "global_step": 101831, "epoch": 2424} {"train_loss": -6.417754650115967, "global_step": 101832, "epoch": 2424} {"train_loss": -6.466274738311768, "global_step": 101833, "epoch": 2424} {"train_loss": -6.385893821716309, "global_step": 101834, "epoch": 2424} {"train_loss": -6.6097612380981445, "global_step": 101835, "epoch": 2424} {"train_loss": -6.41438627243042, "global_step": 101836, "epoch": 2424} {"train_loss": -6.4674458503723145, "global_step": 101837, "epoch": 2424} {"train_loss": -6.439421653747559, "global_step": 101838, "epoch": 2424} {"train_loss": -6.51821231842041, "global_step": 101839, "epoch": 2424} {"train_loss": -6.5343451499938965, "global_step": 101840, "epoch": 2424} {"train_loss": -6.407255172729492, "global_step": 101841, "epoch": 2424} {"train_loss": -6.340811252593994, "global_step": 101842, "epoch": 2424} {"train_loss": -6.320030212402344, "global_step": 101843, "epoch": 2424} {"train_loss": -6.316775798797607, "global_step": 101844, "epoch": 2424} {"train_loss": -6.3817291259765625, "global_step": 101845, "epoch": 2424} {"train_loss": -6.41593074798584, "global_step": 101846, "epoch": 2424} {"train_loss": -6.380231857299805, "global_step": 101847, "epoch": 2424} {"train_loss": -6.3754682540893555, "global_step": 101848, "epoch": 2424} {"train_loss": -6.401630753562564, "global_step": 101849, "epoch": 2424, "val_loss": 64319.5703125} {"train_loss": -6.2218403816223145, "global_step": 101850, "epoch": 2425} {"train_loss": -6.382601261138916, "global_step": 101851, "epoch": 2425} {"train_loss": -6.309724807739258, "global_step": 101852, "epoch": 2425} {"train_loss": -6.32816219329834, "global_step": 101853, "epoch": 2425} {"train_loss": -6.35497522354126, "global_step": 101854, "epoch": 2425} {"train_loss": -6.319801330566406, "global_step": 101855, "epoch": 2425} {"train_loss": -6.408935546875, "global_step": 101856, "epoch": 2425} {"train_loss": -6.471194267272949, "global_step": 101857, "epoch": 2425} {"train_loss": -6.224451541900635, "global_step": 101858, "epoch": 2425} {"train_loss": -6.24617862701416, "global_step": 101859, "epoch": 2425} {"train_loss": -6.358905792236328, "global_step": 101860, "epoch": 2425} {"train_loss": -6.310129165649414, "global_step": 101861, "epoch": 2425} {"train_loss": -6.344935417175293, "global_step": 101862, "epoch": 2425} {"train_loss": -6.250511169433594, "global_step": 101863, "epoch": 2425} {"train_loss": -6.2828826904296875, "global_step": 101864, "epoch": 2425} {"train_loss": -6.325721740722656, "global_step": 101865, "epoch": 2425} {"train_loss": -6.231961250305176, "global_step": 101866, "epoch": 2425} {"train_loss": -6.4535017013549805, "global_step": 101867, "epoch": 2425} {"train_loss": -6.327692031860352, "global_step": 101868, "epoch": 2425} {"train_loss": -6.357144355773926, "global_step": 101869, "epoch": 2425} {"train_loss": -6.251517295837402, "global_step": 101870, "epoch": 2425} {"train_loss": -6.416781902313232, "global_step": 101871, "epoch": 2425} {"train_loss": -6.355989933013916, "global_step": 101872, "epoch": 2425} {"train_loss": -6.350894451141357, "global_step": 101873, "epoch": 2425} {"train_loss": -6.303772449493408, "global_step": 101874, "epoch": 2425} {"train_loss": -6.3624114990234375, "global_step": 101875, "epoch": 2425} {"train_loss": -6.555538177490234, "global_step": 101876, "epoch": 2425} {"train_loss": -6.29688024520874, "global_step": 101877, "epoch": 2425} {"train_loss": -6.408555507659912, "global_step": 101878, "epoch": 2425} {"train_loss": -6.324429512023926, "global_step": 101879, "epoch": 2425} {"train_loss": -6.466042995452881, "global_step": 101880, "epoch": 2425} {"train_loss": -6.4370222091674805, "global_step": 101881, "epoch": 2425} {"train_loss": -6.431816577911377, "global_step": 101882, "epoch": 2425} {"train_loss": -6.329506874084473, "global_step": 101883, "epoch": 2425} {"train_loss": -6.515859603881836, "global_step": 101884, "epoch": 2425} {"train_loss": -6.237026214599609, "global_step": 101885, "epoch": 2425} {"train_loss": -6.310498237609863, "global_step": 101886, "epoch": 2425} {"train_loss": -6.285722255706787, "global_step": 101887, "epoch": 2425} {"train_loss": -6.405335903167725, "global_step": 101888, "epoch": 2425} {"train_loss": -6.230617523193359, "global_step": 101889, "epoch": 2425} {"train_loss": -6.371480941772461, "global_step": 101890, "epoch": 2425} {"train_loss": -6.347836846397037, "global_step": 101891, "epoch": 2425, "val_loss": 64232.78125} {"train_loss": -6.300083160400391, "global_step": 101892, "epoch": 2426} {"train_loss": -6.382299423217773, "global_step": 101893, "epoch": 2426} {"train_loss": -6.327106475830078, "global_step": 101894, "epoch": 2426} {"train_loss": -6.498917579650879, "global_step": 101895, "epoch": 2426} {"train_loss": -6.4103779792785645, "global_step": 101896, "epoch": 2426} {"train_loss": -6.3381781578063965, "global_step": 101897, "epoch": 2426} {"train_loss": -6.2854814529418945, "global_step": 101898, "epoch": 2426} {"train_loss": -6.4195332527160645, "global_step": 101899, "epoch": 2426} {"train_loss": -6.392074108123779, "global_step": 101900, "epoch": 2426} {"train_loss": -6.519982814788818, "global_step": 101901, "epoch": 2426} {"train_loss": -6.348764419555664, "global_step": 101902, "epoch": 2426} {"train_loss": -6.432668685913086, "global_step": 101903, "epoch": 2426} {"train_loss": -6.432084083557129, "global_step": 101904, "epoch": 2426} {"train_loss": -6.429165363311768, "global_step": 101905, "epoch": 2426} {"train_loss": -6.329527854919434, "global_step": 101906, "epoch": 2426} {"train_loss": -6.3888936042785645, "global_step": 101907, "epoch": 2426} {"train_loss": -6.581217288970947, "global_step": 101908, "epoch": 2426} {"train_loss": -6.436034679412842, "global_step": 101909, "epoch": 2426} {"train_loss": -6.42119026184082, "global_step": 101910, "epoch": 2426} {"train_loss": -6.352667331695557, "global_step": 101911, "epoch": 2426} {"train_loss": -6.324963569641113, "global_step": 101912, "epoch": 2426} {"train_loss": -6.539344787597656, "global_step": 101913, "epoch": 2426} {"train_loss": -6.363922119140625, "global_step": 101914, "epoch": 2426} {"train_loss": -6.3431267738342285, "global_step": 101915, "epoch": 2426} {"train_loss": -6.331012725830078, "global_step": 101916, "epoch": 2426} {"train_loss": -6.337211608886719, "global_step": 101917, "epoch": 2426} {"train_loss": -6.341012001037598, "global_step": 101918, "epoch": 2426} {"train_loss": -6.366472244262695, "global_step": 101919, "epoch": 2426} {"train_loss": -6.335183620452881, "global_step": 101920, "epoch": 2426} {"train_loss": -6.359171390533447, "global_step": 101921, "epoch": 2426} {"train_loss": -6.238312721252441, "global_step": 101922, "epoch": 2426} {"train_loss": -6.36358642578125, "global_step": 101923, "epoch": 2426} {"train_loss": -6.273709774017334, "global_step": 101924, "epoch": 2426} {"train_loss": -6.370314121246338, "global_step": 101925, "epoch": 2426} {"train_loss": -6.319402694702148, "global_step": 101926, "epoch": 2426} {"train_loss": -6.254950046539307, "global_step": 101927, "epoch": 2426} {"train_loss": -6.266529083251953, "global_step": 101928, "epoch": 2426} {"train_loss": -6.201390266418457, "global_step": 101929, "epoch": 2426} {"train_loss": -6.482539176940918, "global_step": 101930, "epoch": 2426} {"train_loss": -6.290137767791748, "global_step": 101931, "epoch": 2426} {"train_loss": -6.337169170379639, "global_step": 101932, "epoch": 2426} {"train_loss": -6.368052868616013, "global_step": 101933, "epoch": 2426, "val_loss": 64215.80078125} {"train_loss": -6.26120662689209, "global_step": 101934, "epoch": 2427} {"train_loss": -6.352595329284668, "global_step": 101935, "epoch": 2427} {"train_loss": -6.435629844665527, "global_step": 101936, "epoch": 2427} {"train_loss": -6.369227409362793, "global_step": 101937, "epoch": 2427} {"train_loss": -6.491927146911621, "global_step": 101938, "epoch": 2427} {"train_loss": -6.323196887969971, "global_step": 101939, "epoch": 2427} {"train_loss": -6.285015106201172, "global_step": 101940, "epoch": 2427} {"train_loss": -6.359487533569336, "global_step": 101941, "epoch": 2427} {"train_loss": -6.335921764373779, "global_step": 101942, "epoch": 2427} {"train_loss": -6.397796154022217, "global_step": 101943, "epoch": 2427} {"train_loss": -6.437963962554932, "global_step": 101944, "epoch": 2427} {"train_loss": -6.34495735168457, "global_step": 101945, "epoch": 2427} {"train_loss": -6.407100200653076, "global_step": 101946, "epoch": 2427} {"train_loss": -6.397314548492432, "global_step": 101947, "epoch": 2427} {"train_loss": -6.38646936416626, "global_step": 101948, "epoch": 2427} {"train_loss": -6.479361534118652, "global_step": 101949, "epoch": 2427} {"train_loss": -6.384876728057861, "global_step": 101950, "epoch": 2427} {"train_loss": -6.463754177093506, "global_step": 101951, "epoch": 2427} {"train_loss": -6.383721351623535, "global_step": 101952, "epoch": 2427} {"train_loss": -6.441161155700684, "global_step": 101953, "epoch": 2427} {"train_loss": -6.372366428375244, "global_step": 101954, "epoch": 2427} {"train_loss": -6.381141662597656, "global_step": 101955, "epoch": 2427} {"train_loss": -6.406577110290527, "global_step": 101956, "epoch": 2427} {"train_loss": -6.356192111968994, "global_step": 101957, "epoch": 2427} {"train_loss": -6.365055084228516, "global_step": 101958, "epoch": 2427} {"train_loss": -6.431122779846191, "global_step": 101959, "epoch": 2427} {"train_loss": -6.346292018890381, "global_step": 101960, "epoch": 2427} {"train_loss": -6.479940891265869, "global_step": 101961, "epoch": 2427} {"train_loss": -6.348482131958008, "global_step": 101962, "epoch": 2427} {"train_loss": -6.336549758911133, "global_step": 101963, "epoch": 2427} {"train_loss": -6.535280227661133, "global_step": 101964, "epoch": 2427} {"train_loss": -6.3168487548828125, "global_step": 101965, "epoch": 2427} {"train_loss": -6.391400337219238, "global_step": 101966, "epoch": 2427} {"train_loss": -6.432260036468506, "global_step": 101967, "epoch": 2427} {"train_loss": -6.385227203369141, "global_step": 101968, "epoch": 2427} {"train_loss": -6.318382263183594, "global_step": 101969, "epoch": 2427} {"train_loss": -6.36108922958374, "global_step": 101970, "epoch": 2427} {"train_loss": -6.311903953552246, "global_step": 101971, "epoch": 2427} {"train_loss": -6.258140563964844, "global_step": 101972, "epoch": 2427} {"train_loss": -6.499472618103027, "global_step": 101973, "epoch": 2427} {"train_loss": -6.322563171386719, "global_step": 101974, "epoch": 2427} {"train_loss": -6.380262181872413, "global_step": 101975, "epoch": 2427, "val_loss": 64165.40234375} {"train_loss": -6.4039106369018555, "global_step": 101976, "epoch": 2428} {"train_loss": -6.427666664123535, "global_step": 101977, "epoch": 2428} {"train_loss": -6.432803153991699, "global_step": 101978, "epoch": 2428} {"train_loss": -6.40935754776001, "global_step": 101979, "epoch": 2428} {"train_loss": -6.382391452789307, "global_step": 101980, "epoch": 2428} {"train_loss": -6.384076118469238, "global_step": 101981, "epoch": 2428} {"train_loss": -6.469298839569092, "global_step": 101982, "epoch": 2428} {"train_loss": -6.250698089599609, "global_step": 101983, "epoch": 2428} {"train_loss": -6.298317909240723, "global_step": 101984, "epoch": 2428} {"train_loss": -6.366262912750244, "global_step": 101985, "epoch": 2428} {"train_loss": -6.344511032104492, "global_step": 101986, "epoch": 2428} {"train_loss": -6.360319137573242, "global_step": 101987, "epoch": 2428} {"train_loss": -6.363428115844727, "global_step": 101988, "epoch": 2428} {"train_loss": -6.376469612121582, "global_step": 101989, "epoch": 2428} {"train_loss": -6.547675132751465, "global_step": 101990, "epoch": 2428} {"train_loss": -6.409867763519287, "global_step": 101991, "epoch": 2428} {"train_loss": -6.377248764038086, "global_step": 101992, "epoch": 2428} {"train_loss": -6.531589508056641, "global_step": 101993, "epoch": 2428} {"train_loss": -6.344782829284668, "global_step": 101994, "epoch": 2428} {"train_loss": -6.3184638023376465, "global_step": 101995, "epoch": 2428} {"train_loss": -6.392145156860352, "global_step": 101996, "epoch": 2428} {"train_loss": -6.440664291381836, "global_step": 101997, "epoch": 2428} {"train_loss": -6.365505218505859, "global_step": 101998, "epoch": 2428} {"train_loss": -6.436906814575195, "global_step": 101999, "epoch": 2428} {"train_loss": -6.401674270629883, "global_step": 102000, "epoch": 2428} {"train_loss": -6.502504825592041, "global_step": 102001, "epoch": 2428} {"train_loss": -6.290438652038574, "global_step": 102002, "epoch": 2428} {"train_loss": -6.3998847007751465, "global_step": 102003, "epoch": 2428} {"train_loss": -6.489743232727051, "global_step": 102004, "epoch": 2428} {"train_loss": -6.514788627624512, "global_step": 102005, "epoch": 2428} {"train_loss": -6.376224517822266, "global_step": 102006, "epoch": 2428} {"train_loss": -6.4948930740356445, "global_step": 102007, "epoch": 2428} {"train_loss": -6.438594818115234, "global_step": 102008, "epoch": 2428} {"train_loss": -6.337490081787109, "global_step": 102009, "epoch": 2428} {"train_loss": -6.388819694519043, "global_step": 102010, "epoch": 2428} {"train_loss": -6.346399307250977, "global_step": 102011, "epoch": 2428} {"train_loss": -6.338720321655273, "global_step": 102012, "epoch": 2428} {"train_loss": -6.375107765197754, "global_step": 102013, "epoch": 2428} {"train_loss": -6.279537677764893, "global_step": 102014, "epoch": 2428} {"train_loss": -6.444300174713135, "global_step": 102015, "epoch": 2428} {"train_loss": -6.311393737792969, "global_step": 102016, "epoch": 2428} {"train_loss": -6.393748181206839, "global_step": 102017, "epoch": 2428, "val_loss": 64227.32421875} {"train_loss": -6.370215892791748, "global_step": 102018, "epoch": 2429} {"train_loss": -6.303312301635742, "global_step": 102019, "epoch": 2429} {"train_loss": -6.414475440979004, "global_step": 102020, "epoch": 2429} {"train_loss": -6.235172748565674, "global_step": 102021, "epoch": 2429} {"train_loss": -6.446208953857422, "global_step": 102022, "epoch": 2429} {"train_loss": -6.29166841506958, "global_step": 102023, "epoch": 2429} {"train_loss": -6.315684795379639, "global_step": 102024, "epoch": 2429} {"train_loss": -6.384587287902832, "global_step": 102025, "epoch": 2429} {"train_loss": -6.382041931152344, "global_step": 102026, "epoch": 2429} {"train_loss": -6.345755577087402, "global_step": 102027, "epoch": 2429} {"train_loss": -6.436705112457275, "global_step": 102028, "epoch": 2429} {"train_loss": -6.313821792602539, "global_step": 102029, "epoch": 2429} {"train_loss": -6.29664945602417, "global_step": 102030, "epoch": 2429} {"train_loss": -6.398317337036133, "global_step": 102031, "epoch": 2429} {"train_loss": -6.431820869445801, "global_step": 102032, "epoch": 2429} {"train_loss": -6.333390235900879, "global_step": 102033, "epoch": 2429} {"train_loss": -6.363725185394287, "global_step": 102034, "epoch": 2429} {"train_loss": -6.456462383270264, "global_step": 102035, "epoch": 2429} {"train_loss": -6.4264726638793945, "global_step": 102036, "epoch": 2429} {"train_loss": -6.3637895584106445, "global_step": 102037, "epoch": 2429} {"train_loss": -6.434000492095947, "global_step": 102038, "epoch": 2429} {"train_loss": -6.414012908935547, "global_step": 102039, "epoch": 2429} {"train_loss": -6.387341022491455, "global_step": 102040, "epoch": 2429} {"train_loss": -6.497898578643799, "global_step": 102041, "epoch": 2429} {"train_loss": -6.411345481872559, "global_step": 102042, "epoch": 2429} {"train_loss": -6.373723983764648, "global_step": 102043, "epoch": 2429} {"train_loss": -6.428290367126465, "global_step": 102044, "epoch": 2429} {"train_loss": -6.467568397521973, "global_step": 102045, "epoch": 2429} {"train_loss": -6.364575386047363, "global_step": 102046, "epoch": 2429} {"train_loss": -6.479048728942871, "global_step": 102047, "epoch": 2429} {"train_loss": -6.338578224182129, "global_step": 102048, "epoch": 2429} {"train_loss": -6.324487686157227, "global_step": 102049, "epoch": 2429} {"train_loss": -6.377593040466309, "global_step": 102050, "epoch": 2429} {"train_loss": -6.429594993591309, "global_step": 102051, "epoch": 2429} {"train_loss": -6.3353271484375, "global_step": 102052, "epoch": 2429} {"train_loss": -6.367373466491699, "global_step": 102053, "epoch": 2429} {"train_loss": -6.409536361694336, "global_step": 102054, "epoch": 2429} {"train_loss": -6.37107515335083, "global_step": 102055, "epoch": 2429} {"train_loss": -6.3708038330078125, "global_step": 102056, "epoch": 2429} {"train_loss": -6.303033828735352, "global_step": 102057, "epoch": 2429} {"train_loss": -6.408590793609619, "global_step": 102058, "epoch": 2429} {"train_loss": -6.3778816518329435, "global_step": 102059, "epoch": 2429, "val_loss": 64173.94921875} {"train_loss": -6.354640960693359, "global_step": 102060, "epoch": 2430} {"train_loss": -6.465534210205078, "global_step": 102061, "epoch": 2430} {"train_loss": -6.3128557205200195, "global_step": 102062, "epoch": 2430} {"train_loss": -6.331232070922852, "global_step": 102063, "epoch": 2430} {"train_loss": -6.4322004318237305, "global_step": 102064, "epoch": 2430} {"train_loss": -6.304556846618652, "global_step": 102065, "epoch": 2430} {"train_loss": -6.390482425689697, "global_step": 102066, "epoch": 2430} {"train_loss": -6.43485689163208, "global_step": 102067, "epoch": 2430} {"train_loss": -6.330997467041016, "global_step": 102068, "epoch": 2430} {"train_loss": -6.3815178871154785, "global_step": 102069, "epoch": 2430} {"train_loss": -6.419271469116211, "global_step": 102070, "epoch": 2430} {"train_loss": -6.472645282745361, "global_step": 102071, "epoch": 2430} {"train_loss": -6.399104118347168, "global_step": 102072, "epoch": 2430} {"train_loss": -6.369061470031738, "global_step": 102073, "epoch": 2430} {"train_loss": -6.471631050109863, "global_step": 102074, "epoch": 2430} {"train_loss": -6.468437194824219, "global_step": 102075, "epoch": 2430} {"train_loss": -6.383587837219238, "global_step": 102076, "epoch": 2430} {"train_loss": -6.449828147888184, "global_step": 102077, "epoch": 2430} {"train_loss": -6.452362537384033, "global_step": 102078, "epoch": 2430} {"train_loss": -6.331596374511719, "global_step": 102079, "epoch": 2430} {"train_loss": -6.30210542678833, "global_step": 102080, "epoch": 2430} {"train_loss": -6.507702350616455, "global_step": 102081, "epoch": 2430} {"train_loss": -6.340933799743652, "global_step": 102082, "epoch": 2430} {"train_loss": -6.398968696594238, "global_step": 102083, "epoch": 2430} {"train_loss": -6.380054473876953, "global_step": 102084, "epoch": 2430} {"train_loss": -6.351587295532227, "global_step": 102085, "epoch": 2430} {"train_loss": -6.312416076660156, "global_step": 102086, "epoch": 2430} {"train_loss": -6.344777584075928, "global_step": 102087, "epoch": 2430} {"train_loss": -6.396803379058838, "global_step": 102088, "epoch": 2430} {"train_loss": -6.315667152404785, "global_step": 102089, "epoch": 2430} {"train_loss": -6.305440902709961, "global_step": 102090, "epoch": 2430} {"train_loss": -6.4215922355651855, "global_step": 102091, "epoch": 2430} {"train_loss": -6.361948013305664, "global_step": 102092, "epoch": 2430} {"train_loss": -6.391149520874023, "global_step": 102093, "epoch": 2430} {"train_loss": -6.397372245788574, "global_step": 102094, "epoch": 2430} {"train_loss": -6.396071910858154, "global_step": 102095, "epoch": 2430} {"train_loss": -6.345945835113525, "global_step": 102096, "epoch": 2430} {"train_loss": -6.398443698883057, "global_step": 102097, "epoch": 2430} {"train_loss": -6.379746913909912, "global_step": 102098, "epoch": 2430} {"train_loss": -6.405979156494141, "global_step": 102099, "epoch": 2430} {"train_loss": -6.476863384246826, "global_step": 102100, "epoch": 2430} {"train_loss": -6.388777165185838, "global_step": 102101, "epoch": 2430, "val_loss": 63967.69921875} {"train_loss": -6.385991096496582, "global_step": 102102, "epoch": 2431} {"train_loss": -6.418511390686035, "global_step": 102103, "epoch": 2431} {"train_loss": -6.3246235847473145, "global_step": 102104, "epoch": 2431} {"train_loss": -6.340709686279297, "global_step": 102105, "epoch": 2431} {"train_loss": -6.3670268058776855, "global_step": 102106, "epoch": 2431} {"train_loss": -6.295085906982422, "global_step": 102107, "epoch": 2431} {"train_loss": -6.390404224395752, "global_step": 102108, "epoch": 2431} {"train_loss": -6.348085880279541, "global_step": 102109, "epoch": 2431} {"train_loss": -6.360220432281494, "global_step": 102110, "epoch": 2431} {"train_loss": -6.435514450073242, "global_step": 102111, "epoch": 2431} {"train_loss": -6.371677875518799, "global_step": 102112, "epoch": 2431} {"train_loss": -6.399358749389648, "global_step": 102113, "epoch": 2431} {"train_loss": -6.443763256072998, "global_step": 102114, "epoch": 2431} {"train_loss": -6.335012435913086, "global_step": 102115, "epoch": 2431} {"train_loss": -6.381627559661865, "global_step": 102116, "epoch": 2431} {"train_loss": -6.376952171325684, "global_step": 102117, "epoch": 2431} {"train_loss": -6.360475540161133, "global_step": 102118, "epoch": 2431} {"train_loss": -6.425711631774902, "global_step": 102119, "epoch": 2431} {"train_loss": -6.482593536376953, "global_step": 102120, "epoch": 2431} {"train_loss": -6.38443660736084, "global_step": 102121, "epoch": 2431} {"train_loss": -6.571427345275879, "global_step": 102122, "epoch": 2431} {"train_loss": -6.388360977172852, "global_step": 102123, "epoch": 2431} {"train_loss": -6.24398946762085, "global_step": 102124, "epoch": 2431} {"train_loss": -6.439812660217285, "global_step": 102125, "epoch": 2431} {"train_loss": -6.326499938964844, "global_step": 102126, "epoch": 2431} {"train_loss": -6.334560871124268, "global_step": 102127, "epoch": 2431} {"train_loss": -6.303600311279297, "global_step": 102128, "epoch": 2431} {"train_loss": -6.314929485321045, "global_step": 102129, "epoch": 2431} {"train_loss": -6.426111698150635, "global_step": 102130, "epoch": 2431} {"train_loss": -6.344104766845703, "global_step": 102131, "epoch": 2431} {"train_loss": -6.303203582763672, "global_step": 102132, "epoch": 2431} {"train_loss": -6.35441780090332, "global_step": 102133, "epoch": 2431} {"train_loss": -6.291449069976807, "global_step": 102134, "epoch": 2431} {"train_loss": -6.334989070892334, "global_step": 102135, "epoch": 2431} {"train_loss": -6.305310249328613, "global_step": 102136, "epoch": 2431} {"train_loss": -6.421125411987305, "global_step": 102137, "epoch": 2431} {"train_loss": -6.399246692657471, "global_step": 102138, "epoch": 2431} {"train_loss": -6.435300350189209, "global_step": 102139, "epoch": 2431} {"train_loss": -6.291508197784424, "global_step": 102140, "epoch": 2431} {"train_loss": -6.313343048095703, "global_step": 102141, "epoch": 2431} {"train_loss": -6.320044994354248, "global_step": 102142, "epoch": 2431} {"train_loss": -6.367809500013079, "global_step": 102143, "epoch": 2431, "val_loss": 64125.2109375} {"train_loss": -6.374544143676758, "global_step": 102144, "epoch": 2432} {"train_loss": -6.312931537628174, "global_step": 102145, "epoch": 2432} {"train_loss": -6.381191730499268, "global_step": 102146, "epoch": 2432} {"train_loss": -6.426566123962402, "global_step": 102147, "epoch": 2432} {"train_loss": -6.41575288772583, "global_step": 102148, "epoch": 2432} {"train_loss": -6.507761001586914, "global_step": 102149, "epoch": 2432} {"train_loss": -6.474695205688477, "global_step": 102150, "epoch": 2432} {"train_loss": -6.384860515594482, "global_step": 102151, "epoch": 2432} {"train_loss": -6.412661552429199, "global_step": 102152, "epoch": 2432} {"train_loss": -6.465025901794434, "global_step": 102153, "epoch": 2432} {"train_loss": -6.420942306518555, "global_step": 102154, "epoch": 2432} {"train_loss": -6.349859237670898, "global_step": 102155, "epoch": 2432} {"train_loss": -6.302347183227539, "global_step": 102156, "epoch": 2432} {"train_loss": -6.412900924682617, "global_step": 102157, "epoch": 2432} {"train_loss": -6.361112117767334, "global_step": 102158, "epoch": 2432} {"train_loss": -6.426178932189941, "global_step": 102159, "epoch": 2432} {"train_loss": -6.457211971282959, "global_step": 102160, "epoch": 2432} {"train_loss": -6.33565616607666, "global_step": 102161, "epoch": 2432} {"train_loss": -6.41210412979126, "global_step": 102162, "epoch": 2432} {"train_loss": -6.377135753631592, "global_step": 102163, "epoch": 2432} {"train_loss": -6.439652442932129, "global_step": 102164, "epoch": 2432} {"train_loss": -6.277503967285156, "global_step": 102165, "epoch": 2432} {"train_loss": -6.370547294616699, "global_step": 102166, "epoch": 2432} {"train_loss": -6.412510395050049, "global_step": 102167, "epoch": 2432} {"train_loss": -6.4523725509643555, "global_step": 102168, "epoch": 2432} {"train_loss": -6.401979446411133, "global_step": 102169, "epoch": 2432} {"train_loss": -6.383152008056641, "global_step": 102170, "epoch": 2432} {"train_loss": -6.451735973358154, "global_step": 102171, "epoch": 2432} {"train_loss": -6.4215192794799805, "global_step": 102172, "epoch": 2432} {"train_loss": -6.365833759307861, "global_step": 102173, "epoch": 2432} {"train_loss": -6.421303749084473, "global_step": 102174, "epoch": 2432} {"train_loss": -6.413458347320557, "global_step": 102175, "epoch": 2432} {"train_loss": -6.272414207458496, "global_step": 102176, "epoch": 2432} {"train_loss": -6.4394707679748535, "global_step": 102177, "epoch": 2432} {"train_loss": -6.443429946899414, "global_step": 102178, "epoch": 2432} {"train_loss": -6.328526020050049, "global_step": 102179, "epoch": 2432} {"train_loss": -6.364336013793945, "global_step": 102180, "epoch": 2432} {"train_loss": -6.363016128540039, "global_step": 102181, "epoch": 2432} {"train_loss": -6.473899841308594, "global_step": 102182, "epoch": 2432} {"train_loss": -6.412077903747559, "global_step": 102183, "epoch": 2432} {"train_loss": -6.323591709136963, "global_step": 102184, "epoch": 2432} {"train_loss": -6.397543748219808, "global_step": 102185, "epoch": 2432, "val_loss": 64265.7578125} {"train_loss": -6.391911506652832, "global_step": 102186, "epoch": 2433} {"train_loss": -6.536323547363281, "global_step": 102187, "epoch": 2433} {"train_loss": -6.2417378425598145, "global_step": 102188, "epoch": 2433} {"train_loss": -6.425518035888672, "global_step": 102189, "epoch": 2433} {"train_loss": -6.477789878845215, "global_step": 102190, "epoch": 2433} {"train_loss": -6.410071849822998, "global_step": 102191, "epoch": 2433} {"train_loss": -6.371918201446533, "global_step": 102192, "epoch": 2433} {"train_loss": -6.329379081726074, "global_step": 102193, "epoch": 2433} {"train_loss": -6.218269348144531, "global_step": 102194, "epoch": 2433} {"train_loss": -6.3407487869262695, "global_step": 102195, "epoch": 2433} {"train_loss": -6.4945068359375, "global_step": 102196, "epoch": 2433} {"train_loss": -6.379096984863281, "global_step": 102197, "epoch": 2433} {"train_loss": -6.495877265930176, "global_step": 102198, "epoch": 2433} {"train_loss": -6.393319129943848, "global_step": 102199, "epoch": 2433} {"train_loss": -6.400381088256836, "global_step": 102200, "epoch": 2433} {"train_loss": -6.410198211669922, "global_step": 102201, "epoch": 2433} {"train_loss": -6.4073166847229, "global_step": 102202, "epoch": 2433} {"train_loss": -6.464685440063477, "global_step": 102203, "epoch": 2433} {"train_loss": -6.464590072631836, "global_step": 102204, "epoch": 2433} {"train_loss": -6.39961051940918, "global_step": 102205, "epoch": 2433} {"train_loss": -6.403234481811523, "global_step": 102206, "epoch": 2433} {"train_loss": -6.357023239135742, "global_step": 102207, "epoch": 2433} {"train_loss": -6.323124408721924, "global_step": 102208, "epoch": 2433} {"train_loss": -6.28597354888916, "global_step": 102209, "epoch": 2433} {"train_loss": -6.451455593109131, "global_step": 102210, "epoch": 2433} {"train_loss": -6.417006969451904, "global_step": 102211, "epoch": 2433} {"train_loss": -6.452303886413574, "global_step": 102212, "epoch": 2433} {"train_loss": -6.397410869598389, "global_step": 102213, "epoch": 2433} {"train_loss": -6.367912769317627, "global_step": 102214, "epoch": 2433} {"train_loss": -6.470736026763916, "global_step": 102215, "epoch": 2433} {"train_loss": -6.467073440551758, "global_step": 102216, "epoch": 2433} {"train_loss": -6.394382476806641, "global_step": 102217, "epoch": 2433} {"train_loss": -6.391406059265137, "global_step": 102218, "epoch": 2433} {"train_loss": -6.3950042724609375, "global_step": 102219, "epoch": 2433} {"train_loss": -6.4400787353515625, "global_step": 102220, "epoch": 2433} {"train_loss": -6.455132484436035, "global_step": 102221, "epoch": 2433} {"train_loss": -6.169124603271484, "global_step": 102222, "epoch": 2433} {"train_loss": -6.492593288421631, "global_step": 102223, "epoch": 2433} {"train_loss": -6.263161659240723, "global_step": 102224, "epoch": 2433} {"train_loss": -6.275251388549805, "global_step": 102225, "epoch": 2433} {"train_loss": -6.394405364990234, "global_step": 102226, "epoch": 2433} {"train_loss": -6.394304831822713, "global_step": 102227, "epoch": 2433, "val_loss": 64463.1328125} {"train_loss": -6.371316432952881, "global_step": 102228, "epoch": 2434} {"train_loss": -6.4619035720825195, "global_step": 102229, "epoch": 2434} {"train_loss": -6.364725112915039, "global_step": 102230, "epoch": 2434} {"train_loss": -6.463001251220703, "global_step": 102231, "epoch": 2434} {"train_loss": -6.383716583251953, "global_step": 102232, "epoch": 2434} {"train_loss": -6.264405250549316, "global_step": 102233, "epoch": 2434} {"train_loss": -6.403554916381836, "global_step": 102234, "epoch": 2434} {"train_loss": -6.159776210784912, "global_step": 102235, "epoch": 2434} {"train_loss": -6.4164299964904785, "global_step": 102236, "epoch": 2434} {"train_loss": -6.2729949951171875, "global_step": 102237, "epoch": 2434} {"train_loss": -6.381538391113281, "global_step": 102238, "epoch": 2434} {"train_loss": -6.293058395385742, "global_step": 102239, "epoch": 2434} {"train_loss": -6.355573654174805, "global_step": 102240, "epoch": 2434} {"train_loss": -6.379303932189941, "global_step": 102241, "epoch": 2434} {"train_loss": -6.289313316345215, "global_step": 102242, "epoch": 2434} {"train_loss": -6.288207054138184, "global_step": 102243, "epoch": 2434} {"train_loss": -6.458196640014648, "global_step": 102244, "epoch": 2434} {"train_loss": -6.439769744873047, "global_step": 102245, "epoch": 2434} {"train_loss": -6.415228843688965, "global_step": 102246, "epoch": 2434} {"train_loss": -6.427253246307373, "global_step": 102247, "epoch": 2434} {"train_loss": -6.454505920410156, "global_step": 102248, "epoch": 2434} {"train_loss": -6.386376857757568, "global_step": 102249, "epoch": 2434} {"train_loss": -6.316333770751953, "global_step": 102250, "epoch": 2434} {"train_loss": -6.340112209320068, "global_step": 102251, "epoch": 2434} {"train_loss": -6.390648365020752, "global_step": 102252, "epoch": 2434} {"train_loss": -6.341893196105957, "global_step": 102253, "epoch": 2434} {"train_loss": -6.386894702911377, "global_step": 102254, "epoch": 2434} {"train_loss": -6.3450846672058105, "global_step": 102255, "epoch": 2434} {"train_loss": -6.280953407287598, "global_step": 102256, "epoch": 2434} {"train_loss": -6.305685043334961, "global_step": 102257, "epoch": 2434} {"train_loss": -6.404661178588867, "global_step": 102258, "epoch": 2434} {"train_loss": -6.351945400238037, "global_step": 102259, "epoch": 2434} {"train_loss": -6.4524431228637695, "global_step": 102260, "epoch": 2434} {"train_loss": -6.37442684173584, "global_step": 102261, "epoch": 2434} {"train_loss": -6.40859317779541, "global_step": 102262, "epoch": 2434} {"train_loss": -6.325997352600098, "global_step": 102263, "epoch": 2434} {"train_loss": -6.430422782897949, "global_step": 102264, "epoch": 2434} {"train_loss": -6.329371929168701, "global_step": 102265, "epoch": 2434} {"train_loss": -6.451892852783203, "global_step": 102266, "epoch": 2434} {"train_loss": -6.409318447113037, "global_step": 102267, "epoch": 2434} {"train_loss": -6.315390586853027, "global_step": 102268, "epoch": 2434} {"train_loss": -6.3710714521862215, "global_step": 102269, "epoch": 2434, "val_loss": 64185.80078125} {"train_loss": -6.4789533615112305, "global_step": 102270, "epoch": 2435} {"train_loss": -6.339971542358398, "global_step": 102271, "epoch": 2435} {"train_loss": -6.350127220153809, "global_step": 102272, "epoch": 2435} {"train_loss": -6.463730812072754, "global_step": 102273, "epoch": 2435} {"train_loss": -6.47617244720459, "global_step": 102274, "epoch": 2435} {"train_loss": -6.3923797607421875, "global_step": 102275, "epoch": 2435} {"train_loss": -6.395532608032227, "global_step": 102276, "epoch": 2435} {"train_loss": -6.364431381225586, "global_step": 102277, "epoch": 2435} {"train_loss": -6.399417877197266, "global_step": 102278, "epoch": 2435} {"train_loss": -6.4190497398376465, "global_step": 102279, "epoch": 2435} {"train_loss": -6.281343936920166, "global_step": 102280, "epoch": 2435} {"train_loss": -6.4647321701049805, "global_step": 102281, "epoch": 2435} {"train_loss": -6.410639762878418, "global_step": 102282, "epoch": 2435} {"train_loss": -6.4337158203125, "global_step": 102283, "epoch": 2435} {"train_loss": -6.443802833557129, "global_step": 102284, "epoch": 2435} {"train_loss": -6.5434112548828125, "global_step": 102285, "epoch": 2435} {"train_loss": -6.464764595031738, "global_step": 102286, "epoch": 2435} {"train_loss": -6.3948445320129395, "global_step": 102287, "epoch": 2435} {"train_loss": -6.528875350952148, "global_step": 102288, "epoch": 2435} {"train_loss": -6.399474143981934, "global_step": 102289, "epoch": 2435} {"train_loss": -6.312650680541992, "global_step": 102290, "epoch": 2435} {"train_loss": -6.455011367797852, "global_step": 102291, "epoch": 2435} {"train_loss": -6.397979736328125, "global_step": 102292, "epoch": 2435} {"train_loss": -6.370704650878906, "global_step": 102293, "epoch": 2435} {"train_loss": -6.4088850021362305, "global_step": 102294, "epoch": 2435} {"train_loss": -6.375596046447754, "global_step": 102295, "epoch": 2435} {"train_loss": -6.371427536010742, "global_step": 102296, "epoch": 2435} {"train_loss": -6.454324722290039, "global_step": 102297, "epoch": 2435} {"train_loss": -6.375297546386719, "global_step": 102298, "epoch": 2435} {"train_loss": -6.420647621154785, "global_step": 102299, "epoch": 2435} {"train_loss": -6.498795509338379, "global_step": 102300, "epoch": 2435} {"train_loss": -6.354287624359131, "global_step": 102301, "epoch": 2435} {"train_loss": -6.274299621582031, "global_step": 102302, "epoch": 2435} {"train_loss": -6.45815372467041, "global_step": 102303, "epoch": 2435} {"train_loss": -6.2306671142578125, "global_step": 102304, "epoch": 2435} {"train_loss": -6.451598167419434, "global_step": 102305, "epoch": 2435} {"train_loss": -6.290511131286621, "global_step": 102306, "epoch": 2435} {"train_loss": -6.3687615394592285, "global_step": 102307, "epoch": 2435} {"train_loss": -6.449512004852295, "global_step": 102308, "epoch": 2435} {"train_loss": -6.416659355163574, "global_step": 102309, "epoch": 2435} {"train_loss": -6.337772369384766, "global_step": 102310, "epoch": 2435} {"train_loss": -6.4021547975994295, "global_step": 102311, "epoch": 2435, "val_loss": 64383.25390625} {"train_loss": -6.256534576416016, "global_step": 102312, "epoch": 2436} {"train_loss": -6.420538425445557, "global_step": 102313, "epoch": 2436} {"train_loss": -6.294976711273193, "global_step": 102314, "epoch": 2436} {"train_loss": -6.265059947967529, "global_step": 102315, "epoch": 2436} {"train_loss": -6.301370143890381, "global_step": 102316, "epoch": 2436} {"train_loss": -6.339814186096191, "global_step": 102317, "epoch": 2436} {"train_loss": -6.426795959472656, "global_step": 102318, "epoch": 2436} {"train_loss": -6.463224411010742, "global_step": 102319, "epoch": 2436} {"train_loss": -6.386849403381348, "global_step": 102320, "epoch": 2436} {"train_loss": -6.355422019958496, "global_step": 102321, "epoch": 2436} {"train_loss": -6.229283332824707, "global_step": 102322, "epoch": 2436} {"train_loss": -6.424921035766602, "global_step": 102323, "epoch": 2436} {"train_loss": -6.259765625, "global_step": 102324, "epoch": 2436} {"train_loss": -6.373587608337402, "global_step": 102325, "epoch": 2436} {"train_loss": -6.418734550476074, "global_step": 102326, "epoch": 2436} {"train_loss": -6.395821571350098, "global_step": 102327, "epoch": 2436} {"train_loss": -6.438882827758789, "global_step": 102328, "epoch": 2436} {"train_loss": -6.330809593200684, "global_step": 102329, "epoch": 2436} {"train_loss": -6.405194282531738, "global_step": 102330, "epoch": 2436} {"train_loss": -6.372061252593994, "global_step": 102331, "epoch": 2436} {"train_loss": -6.430941581726074, "global_step": 102332, "epoch": 2436} {"train_loss": -6.440277099609375, "global_step": 102333, "epoch": 2436} {"train_loss": -6.410619735717773, "global_step": 102334, "epoch": 2436} {"train_loss": -6.4827728271484375, "global_step": 102335, "epoch": 2436} {"train_loss": -6.32606315612793, "global_step": 102336, "epoch": 2436} {"train_loss": -6.383511543273926, "global_step": 102337, "epoch": 2436} {"train_loss": -6.429171085357666, "global_step": 102338, "epoch": 2436} {"train_loss": -6.320219039916992, "global_step": 102339, "epoch": 2436} {"train_loss": -6.42668342590332, "global_step": 102340, "epoch": 2436} {"train_loss": -6.427329063415527, "global_step": 102341, "epoch": 2436} {"train_loss": -6.485138416290283, "global_step": 102342, "epoch": 2436} {"train_loss": -6.384218215942383, "global_step": 102343, "epoch": 2436} {"train_loss": -6.378978729248047, "global_step": 102344, "epoch": 2436} {"train_loss": -6.400211334228516, "global_step": 102345, "epoch": 2436} {"train_loss": -6.458003044128418, "global_step": 102346, "epoch": 2436} {"train_loss": -6.447697162628174, "global_step": 102347, "epoch": 2436} {"train_loss": -6.3786516189575195, "global_step": 102348, "epoch": 2436} {"train_loss": -6.390228271484375, "global_step": 102349, "epoch": 2436} {"train_loss": -6.400743007659912, "global_step": 102350, "epoch": 2436} {"train_loss": -6.336704254150391, "global_step": 102351, "epoch": 2436} {"train_loss": -6.454869270324707, "global_step": 102352, "epoch": 2436} {"train_loss": -6.381362336022513, "global_step": 102353, "epoch": 2436, "val_loss": 64607.5078125} {"train_loss": -6.394402980804443, "global_step": 102354, "epoch": 2437} {"train_loss": -6.346707344055176, "global_step": 102355, "epoch": 2437} {"train_loss": -6.408376216888428, "global_step": 102356, "epoch": 2437} {"train_loss": -6.454595565795898, "global_step": 102357, "epoch": 2437} {"train_loss": -6.394670486450195, "global_step": 102358, "epoch": 2437} {"train_loss": -6.354785919189453, "global_step": 102359, "epoch": 2437} {"train_loss": -6.439020156860352, "global_step": 102360, "epoch": 2437} {"train_loss": -6.403967380523682, "global_step": 102361, "epoch": 2437} {"train_loss": -6.395126819610596, "global_step": 102362, "epoch": 2437} {"train_loss": -6.378718852996826, "global_step": 102363, "epoch": 2437} {"train_loss": -6.348020076751709, "global_step": 102364, "epoch": 2437} {"train_loss": -6.444879531860352, "global_step": 102365, "epoch": 2437} {"train_loss": -6.286002159118652, "global_step": 102366, "epoch": 2437} {"train_loss": -6.364345550537109, "global_step": 102367, "epoch": 2437} {"train_loss": -6.371528625488281, "global_step": 102368, "epoch": 2437} {"train_loss": -6.419125556945801, "global_step": 102369, "epoch": 2437} {"train_loss": -6.495972633361816, "global_step": 102370, "epoch": 2437} {"train_loss": -6.390593528747559, "global_step": 102371, "epoch": 2437} {"train_loss": -6.377006530761719, "global_step": 102372, "epoch": 2437} {"train_loss": -6.259716510772705, "global_step": 102373, "epoch": 2437} {"train_loss": -6.34689474105835, "global_step": 102374, "epoch": 2437} {"train_loss": -6.49854850769043, "global_step": 102375, "epoch": 2437} {"train_loss": -6.352269172668457, "global_step": 102376, "epoch": 2437} {"train_loss": -6.364537239074707, "global_step": 102377, "epoch": 2437} {"train_loss": -6.157800197601318, "global_step": 102378, "epoch": 2437} {"train_loss": -6.3544020652771, "global_step": 102379, "epoch": 2437} {"train_loss": -6.317140102386475, "global_step": 102380, "epoch": 2437} {"train_loss": -6.333834648132324, "global_step": 102381, "epoch": 2437} {"train_loss": -6.387696743011475, "global_step": 102382, "epoch": 2437} {"train_loss": -6.477477550506592, "global_step": 102383, "epoch": 2437} {"train_loss": -6.476195335388184, "global_step": 102384, "epoch": 2437} {"train_loss": -6.428390979766846, "global_step": 102385, "epoch": 2437} {"train_loss": -6.483767032623291, "global_step": 102386, "epoch": 2437} {"train_loss": -6.353105545043945, "global_step": 102387, "epoch": 2437} {"train_loss": -6.333747863769531, "global_step": 102388, "epoch": 2437} {"train_loss": -6.4742631912231445, "global_step": 102389, "epoch": 2437} {"train_loss": -6.431461334228516, "global_step": 102390, "epoch": 2437} {"train_loss": -6.506397247314453, "global_step": 102391, "epoch": 2437} {"train_loss": -6.464106559753418, "global_step": 102392, "epoch": 2437} {"train_loss": -6.410195350646973, "global_step": 102393, "epoch": 2437} {"train_loss": -6.397315979003906, "global_step": 102394, "epoch": 2437} {"train_loss": -6.391230832962763, "global_step": 102395, "epoch": 2437, "val_loss": 64300.79296875} {"train_loss": -6.331454753875732, "global_step": 102396, "epoch": 2438} {"train_loss": -6.382966041564941, "global_step": 102397, "epoch": 2438} {"train_loss": -6.247127532958984, "global_step": 102398, "epoch": 2438} {"train_loss": -6.463933944702148, "global_step": 102399, "epoch": 2438} {"train_loss": -6.346250534057617, "global_step": 102400, "epoch": 2438} {"train_loss": -6.438605785369873, "global_step": 102401, "epoch": 2438} {"train_loss": -6.500491142272949, "global_step": 102402, "epoch": 2438} {"train_loss": -6.458549499511719, "global_step": 102403, "epoch": 2438} {"train_loss": -6.452413082122803, "global_step": 102404, "epoch": 2438} {"train_loss": -6.560004711151123, "global_step": 102405, "epoch": 2438} {"train_loss": -6.344236373901367, "global_step": 102406, "epoch": 2438} {"train_loss": -6.297192573547363, "global_step": 102407, "epoch": 2438} {"train_loss": -6.400363922119141, "global_step": 102408, "epoch": 2438} {"train_loss": -6.350592613220215, "global_step": 102409, "epoch": 2438} {"train_loss": -6.249291896820068, "global_step": 102410, "epoch": 2438} {"train_loss": -6.4324445724487305, "global_step": 102411, "epoch": 2438} {"train_loss": -6.3933844566345215, "global_step": 102412, "epoch": 2438} {"train_loss": -6.293455123901367, "global_step": 102413, "epoch": 2438} {"train_loss": -6.415642738342285, "global_step": 102414, "epoch": 2438} {"train_loss": -6.36837100982666, "global_step": 102415, "epoch": 2438} {"train_loss": -6.443280220031738, "global_step": 102416, "epoch": 2438} {"train_loss": -6.457902431488037, "global_step": 102417, "epoch": 2438} {"train_loss": -6.389266014099121, "global_step": 102418, "epoch": 2438} {"train_loss": -6.362540245056152, "global_step": 102419, "epoch": 2438} {"train_loss": -6.427152633666992, "global_step": 102420, "epoch": 2438} {"train_loss": -6.487680912017822, "global_step": 102421, "epoch": 2438} {"train_loss": -6.447359561920166, "global_step": 102422, "epoch": 2438} {"train_loss": -6.336352348327637, "global_step": 102423, "epoch": 2438} {"train_loss": -6.339093208312988, "global_step": 102424, "epoch": 2438} {"train_loss": -6.483959197998047, "global_step": 102425, "epoch": 2438} {"train_loss": -6.362611770629883, "global_step": 102426, "epoch": 2438} {"train_loss": -6.418715476989746, "global_step": 102427, "epoch": 2438} {"train_loss": -6.385000705718994, "global_step": 102428, "epoch": 2438} {"train_loss": -6.461008548736572, "global_step": 102429, "epoch": 2438} {"train_loss": -6.414371490478516, "global_step": 102430, "epoch": 2438} {"train_loss": -6.322597026824951, "global_step": 102431, "epoch": 2438} {"train_loss": -6.361580848693848, "global_step": 102432, "epoch": 2438} {"train_loss": -6.436309814453125, "global_step": 102433, "epoch": 2438} {"train_loss": -6.433041572570801, "global_step": 102434, "epoch": 2438} {"train_loss": -6.376485824584961, "global_step": 102435, "epoch": 2438} {"train_loss": -6.339701175689697, "global_step": 102436, "epoch": 2438} {"train_loss": -6.393661078952608, "global_step": 102437, "epoch": 2438, "val_loss": 64207.6640625} {"train_loss": -6.477014541625977, "global_step": 102438, "epoch": 2439} {"train_loss": -6.409727573394775, "global_step": 102439, "epoch": 2439} {"train_loss": -6.36950159072876, "global_step": 102440, "epoch": 2439} {"train_loss": -6.502165794372559, "global_step": 102441, "epoch": 2439} {"train_loss": -6.321002006530762, "global_step": 102442, "epoch": 2439} {"train_loss": -6.27946138381958, "global_step": 102443, "epoch": 2439} {"train_loss": -6.4868550300598145, "global_step": 102444, "epoch": 2439} {"train_loss": -6.234020233154297, "global_step": 102445, "epoch": 2439} {"train_loss": -6.437641143798828, "global_step": 102446, "epoch": 2439} {"train_loss": -6.399595260620117, "global_step": 102447, "epoch": 2439} {"train_loss": -6.448443412780762, "global_step": 102448, "epoch": 2439} {"train_loss": -6.385200500488281, "global_step": 102449, "epoch": 2439} {"train_loss": -6.413330078125, "global_step": 102450, "epoch": 2439} {"train_loss": -6.436694145202637, "global_step": 102451, "epoch": 2439} {"train_loss": -6.30916690826416, "global_step": 102452, "epoch": 2439} {"train_loss": -6.375557899475098, "global_step": 102453, "epoch": 2439} {"train_loss": -6.468328475952148, "global_step": 102454, "epoch": 2439} {"train_loss": -6.452693939208984, "global_step": 102455, "epoch": 2439} {"train_loss": -6.408442497253418, "global_step": 102456, "epoch": 2439} {"train_loss": -6.392560958862305, "global_step": 102457, "epoch": 2439} {"train_loss": -6.381069660186768, "global_step": 102458, "epoch": 2439} {"train_loss": -6.397645950317383, "global_step": 102459, "epoch": 2439} {"train_loss": -6.412932872772217, "global_step": 102460, "epoch": 2439} {"train_loss": -6.4466142654418945, "global_step": 102461, "epoch": 2439} {"train_loss": -6.360576629638672, "global_step": 102462, "epoch": 2439} {"train_loss": -6.3578596115112305, "global_step": 102463, "epoch": 2439} {"train_loss": -6.297027587890625, "global_step": 102464, "epoch": 2439} {"train_loss": -6.357852935791016, "global_step": 102465, "epoch": 2439} {"train_loss": -6.2905659675598145, "global_step": 102466, "epoch": 2439} {"train_loss": -6.217953681945801, "global_step": 102467, "epoch": 2439} {"train_loss": -6.418872356414795, "global_step": 102468, "epoch": 2439} {"train_loss": -6.247569561004639, "global_step": 102469, "epoch": 2439} {"train_loss": -6.207550048828125, "global_step": 102470, "epoch": 2439} {"train_loss": -6.378439903259277, "global_step": 102471, "epoch": 2439} {"train_loss": -6.253775596618652, "global_step": 102472, "epoch": 2439} {"train_loss": -6.241706848144531, "global_step": 102473, "epoch": 2439} {"train_loss": -6.417922019958496, "global_step": 102474, "epoch": 2439} {"train_loss": -6.3247785568237305, "global_step": 102475, "epoch": 2439} {"train_loss": -6.31492805480957, "global_step": 102476, "epoch": 2439} {"train_loss": -6.3676910400390625, "global_step": 102477, "epoch": 2439} {"train_loss": -6.298081398010254, "global_step": 102478, "epoch": 2439} {"train_loss": -6.367469957896641, "global_step": 102479, "epoch": 2439, "val_loss": 64623.20703125} {"train_loss": -6.391547203063965, "global_step": 102480, "epoch": 2440} {"train_loss": -6.279359817504883, "global_step": 102481, "epoch": 2440} {"train_loss": -6.357321739196777, "global_step": 102482, "epoch": 2440} {"train_loss": -6.308653831481934, "global_step": 102483, "epoch": 2440} {"train_loss": -6.233922958374023, "global_step": 102484, "epoch": 2440} {"train_loss": -6.360838890075684, "global_step": 102485, "epoch": 2440} {"train_loss": -6.36023473739624, "global_step": 102486, "epoch": 2440} {"train_loss": -6.4346466064453125, "global_step": 102487, "epoch": 2440} {"train_loss": -6.426537036895752, "global_step": 102488, "epoch": 2440} {"train_loss": -6.35653018951416, "global_step": 102489, "epoch": 2440} {"train_loss": -6.315151691436768, "global_step": 102490, "epoch": 2440} {"train_loss": -6.523024082183838, "global_step": 102491, "epoch": 2440} {"train_loss": -6.3756022453308105, "global_step": 102492, "epoch": 2440} {"train_loss": -6.298234462738037, "global_step": 102493, "epoch": 2440} {"train_loss": -6.384436130523682, "global_step": 102494, "epoch": 2440} {"train_loss": -6.2695159912109375, "global_step": 102495, "epoch": 2440} {"train_loss": -6.391039848327637, "global_step": 102496, "epoch": 2440} {"train_loss": -6.458215236663818, "global_step": 102497, "epoch": 2440} {"train_loss": -6.2543044090271, "global_step": 102498, "epoch": 2440} {"train_loss": -6.440121173858643, "global_step": 102499, "epoch": 2440} {"train_loss": -6.417097568511963, "global_step": 102500, "epoch": 2440} {"train_loss": -6.320282936096191, "global_step": 102501, "epoch": 2440} {"train_loss": -6.3390398025512695, "global_step": 102502, "epoch": 2440} {"train_loss": -6.326155662536621, "global_step": 102503, "epoch": 2440} {"train_loss": -6.346139430999756, "global_step": 102504, "epoch": 2440} {"train_loss": -6.404953956604004, "global_step": 102505, "epoch": 2440} {"train_loss": -6.3358283042907715, "global_step": 102506, "epoch": 2440} {"train_loss": -6.455505847930908, "global_step": 102507, "epoch": 2440} {"train_loss": -6.321534633636475, "global_step": 102508, "epoch": 2440} {"train_loss": -6.482675075531006, "global_step": 102509, "epoch": 2440} {"train_loss": -6.399888038635254, "global_step": 102510, "epoch": 2440} {"train_loss": -6.3334856033325195, "global_step": 102511, "epoch": 2440} {"train_loss": -6.342468738555908, "global_step": 102512, "epoch": 2440} {"train_loss": -6.382405757904053, "global_step": 102513, "epoch": 2440} {"train_loss": -6.303249835968018, "global_step": 102514, "epoch": 2440} {"train_loss": -6.378301620483398, "global_step": 102515, "epoch": 2440} {"train_loss": -6.247084617614746, "global_step": 102516, "epoch": 2440} {"train_loss": -6.371212005615234, "global_step": 102517, "epoch": 2440} {"train_loss": -6.46146297454834, "global_step": 102518, "epoch": 2440} {"train_loss": -6.426068305969238, "global_step": 102519, "epoch": 2440} {"train_loss": -6.436040878295898, "global_step": 102520, "epoch": 2440} {"train_loss": -6.370975460324969, "global_step": 102521, "epoch": 2440, "val_loss": 64382.97265625} {"train_loss": -6.415059566497803, "global_step": 102522, "epoch": 2441} {"train_loss": -6.324613094329834, "global_step": 102523, "epoch": 2441} {"train_loss": -6.3260884284973145, "global_step": 102524, "epoch": 2441} {"train_loss": -6.483861923217773, "global_step": 102525, "epoch": 2441} {"train_loss": -6.461519241333008, "global_step": 102526, "epoch": 2441} {"train_loss": -6.4937663078308105, "global_step": 102527, "epoch": 2441} {"train_loss": -6.37067985534668, "global_step": 102528, "epoch": 2441} {"train_loss": -6.430124759674072, "global_step": 102529, "epoch": 2441} {"train_loss": -6.342896938323975, "global_step": 102530, "epoch": 2441} {"train_loss": -6.386442184448242, "global_step": 102531, "epoch": 2441} {"train_loss": -6.408883094787598, "global_step": 102532, "epoch": 2441} {"train_loss": -6.429006099700928, "global_step": 102533, "epoch": 2441} {"train_loss": -6.248499870300293, "global_step": 102534, "epoch": 2441} {"train_loss": -6.393287658691406, "global_step": 102535, "epoch": 2441} {"train_loss": -6.334179401397705, "global_step": 102536, "epoch": 2441} {"train_loss": -6.443408012390137, "global_step": 102537, "epoch": 2441} {"train_loss": -6.289732933044434, "global_step": 102538, "epoch": 2441} {"train_loss": -6.336514949798584, "global_step": 102539, "epoch": 2441} {"train_loss": -6.392289161682129, "global_step": 102540, "epoch": 2441} {"train_loss": -6.405055522918701, "global_step": 102541, "epoch": 2441} {"train_loss": -6.485867500305176, "global_step": 102542, "epoch": 2441} {"train_loss": -6.384250164031982, "global_step": 102543, "epoch": 2441} {"train_loss": -6.2537384033203125, "global_step": 102544, "epoch": 2441} {"train_loss": -6.386293411254883, "global_step": 102545, "epoch": 2441} {"train_loss": -6.437008857727051, "global_step": 102546, "epoch": 2441} {"train_loss": -6.433461666107178, "global_step": 102547, "epoch": 2441} {"train_loss": -6.495216369628906, "global_step": 102548, "epoch": 2441} {"train_loss": -6.389761447906494, "global_step": 102549, "epoch": 2441} {"train_loss": -6.249422073364258, "global_step": 102550, "epoch": 2441} {"train_loss": -6.4840779304504395, "global_step": 102551, "epoch": 2441} {"train_loss": -6.252031326293945, "global_step": 102552, "epoch": 2441} {"train_loss": -6.469804286956787, "global_step": 102553, "epoch": 2441} {"train_loss": -6.507245063781738, "global_step": 102554, "epoch": 2441} {"train_loss": -6.401111602783203, "global_step": 102555, "epoch": 2441} {"train_loss": -6.483605861663818, "global_step": 102556, "epoch": 2441} {"train_loss": -6.516143798828125, "global_step": 102557, "epoch": 2441} {"train_loss": -6.2422332763671875, "global_step": 102558, "epoch": 2441} {"train_loss": -6.300536632537842, "global_step": 102559, "epoch": 2441} {"train_loss": -6.486568450927734, "global_step": 102560, "epoch": 2441} {"train_loss": -6.334247589111328, "global_step": 102561, "epoch": 2441} {"train_loss": -6.35490083694458, "global_step": 102562, "epoch": 2441} {"train_loss": -6.393399919782366, "global_step": 102563, "epoch": 2441, "val_loss": 64551.35546875} {"train_loss": -6.256368160247803, "global_step": 102564, "epoch": 2442} {"train_loss": -6.4371442794799805, "global_step": 102565, "epoch": 2442} {"train_loss": -6.343805313110352, "global_step": 102566, "epoch": 2442} {"train_loss": -6.3579301834106445, "global_step": 102567, "epoch": 2442} {"train_loss": -6.508806228637695, "global_step": 102568, "epoch": 2442} {"train_loss": -6.399887561798096, "global_step": 102569, "epoch": 2442} {"train_loss": -6.4071125984191895, "global_step": 102570, "epoch": 2442} {"train_loss": -6.439492225646973, "global_step": 102571, "epoch": 2442} {"train_loss": -6.336422920227051, "global_step": 102572, "epoch": 2442} {"train_loss": -6.395294666290283, "global_step": 102573, "epoch": 2442} {"train_loss": -6.380220413208008, "global_step": 102574, "epoch": 2442} {"train_loss": -6.4762420654296875, "global_step": 102575, "epoch": 2442} {"train_loss": -6.405335426330566, "global_step": 102576, "epoch": 2442} {"train_loss": -6.308032989501953, "global_step": 102577, "epoch": 2442} {"train_loss": -6.442568302154541, "global_step": 102578, "epoch": 2442} {"train_loss": -6.374174118041992, "global_step": 102579, "epoch": 2442} {"train_loss": -6.293369293212891, "global_step": 102580, "epoch": 2442} {"train_loss": -6.383431911468506, "global_step": 102581, "epoch": 2442} {"train_loss": -6.350440979003906, "global_step": 102582, "epoch": 2442} {"train_loss": -6.236078262329102, "global_step": 102583, "epoch": 2442} {"train_loss": -6.3453779220581055, "global_step": 102584, "epoch": 2442} {"train_loss": -6.330061912536621, "global_step": 102585, "epoch": 2442} {"train_loss": -6.31673526763916, "global_step": 102586, "epoch": 2442} {"train_loss": -6.299311637878418, "global_step": 102587, "epoch": 2442} {"train_loss": -6.287428379058838, "global_step": 102588, "epoch": 2442} {"train_loss": -6.470141410827637, "global_step": 102589, "epoch": 2442} {"train_loss": -6.267133712768555, "global_step": 102590, "epoch": 2442} {"train_loss": -6.3150835037231445, "global_step": 102591, "epoch": 2442} {"train_loss": -6.426418304443359, "global_step": 102592, "epoch": 2442} {"train_loss": -6.1978912353515625, "global_step": 102593, "epoch": 2442} {"train_loss": -6.346197128295898, "global_step": 102594, "epoch": 2442} {"train_loss": -6.400899887084961, "global_step": 102595, "epoch": 2442} {"train_loss": -6.406550884246826, "global_step": 102596, "epoch": 2442} {"train_loss": -6.310358047485352, "global_step": 102597, "epoch": 2442} {"train_loss": -6.320043563842773, "global_step": 102598, "epoch": 2442} {"train_loss": -6.370976448059082, "global_step": 102599, "epoch": 2442} {"train_loss": -6.38749361038208, "global_step": 102600, "epoch": 2442} {"train_loss": -6.526719570159912, "global_step": 102601, "epoch": 2442} {"train_loss": -6.419001579284668, "global_step": 102602, "epoch": 2442} {"train_loss": -6.291409492492676, "global_step": 102603, "epoch": 2442} {"train_loss": -6.516965866088867, "global_step": 102604, "epoch": 2442} {"train_loss": -6.3697232859475275, "global_step": 102605, "epoch": 2442, "val_loss": 64537.80078125} {"train_loss": -6.412455081939697, "global_step": 102606, "epoch": 2443} {"train_loss": -6.449334144592285, "global_step": 102607, "epoch": 2443} {"train_loss": -6.517936706542969, "global_step": 102608, "epoch": 2443} {"train_loss": -6.4171857833862305, "global_step": 102609, "epoch": 2443} {"train_loss": -6.356926918029785, "global_step": 102610, "epoch": 2443} {"train_loss": -6.383217811584473, "global_step": 102611, "epoch": 2443} {"train_loss": -6.440683841705322, "global_step": 102612, "epoch": 2443} {"train_loss": -6.456550598144531, "global_step": 102613, "epoch": 2443} {"train_loss": -6.3589396476745605, "global_step": 102614, "epoch": 2443} {"train_loss": -6.386933326721191, "global_step": 102615, "epoch": 2443} {"train_loss": -6.4645490646362305, "global_step": 102616, "epoch": 2443} {"train_loss": -6.377002239227295, "global_step": 102617, "epoch": 2443} {"train_loss": -6.461071491241455, "global_step": 102618, "epoch": 2443} {"train_loss": -6.169123649597168, "global_step": 102619, "epoch": 2443} {"train_loss": -6.407552242279053, "global_step": 102620, "epoch": 2443} {"train_loss": -6.3189826011657715, "global_step": 102621, "epoch": 2443} {"train_loss": -6.376394271850586, "global_step": 102622, "epoch": 2443} {"train_loss": -6.344974994659424, "global_step": 102623, "epoch": 2443} {"train_loss": -6.291500568389893, "global_step": 102624, "epoch": 2443} {"train_loss": -6.312917709350586, "global_step": 102625, "epoch": 2443} {"train_loss": -6.419398307800293, "global_step": 102626, "epoch": 2443} {"train_loss": -6.36904764175415, "global_step": 102627, "epoch": 2443} {"train_loss": -6.401546478271484, "global_step": 102628, "epoch": 2443} {"train_loss": -6.424483299255371, "global_step": 102629, "epoch": 2443} {"train_loss": -6.356504440307617, "global_step": 102630, "epoch": 2443} {"train_loss": -6.453581809997559, "global_step": 102631, "epoch": 2443} {"train_loss": -6.336908340454102, "global_step": 102632, "epoch": 2443} {"train_loss": -6.3990397453308105, "global_step": 102633, "epoch": 2443} {"train_loss": -6.336113929748535, "global_step": 102634, "epoch": 2443} {"train_loss": -6.344779014587402, "global_step": 102635, "epoch": 2443} {"train_loss": -6.396429061889648, "global_step": 102636, "epoch": 2443} {"train_loss": -6.452186584472656, "global_step": 102637, "epoch": 2443} {"train_loss": -6.414878845214844, "global_step": 102638, "epoch": 2443} {"train_loss": -6.435133934020996, "global_step": 102639, "epoch": 2443} {"train_loss": -6.432957649230957, "global_step": 102640, "epoch": 2443} {"train_loss": -6.5277910232543945, "global_step": 102641, "epoch": 2443} {"train_loss": -6.430324554443359, "global_step": 102642, "epoch": 2443} {"train_loss": -6.428818702697754, "global_step": 102643, "epoch": 2443} {"train_loss": -6.397922992706299, "global_step": 102644, "epoch": 2443} {"train_loss": -6.358659744262695, "global_step": 102645, "epoch": 2443} {"train_loss": -6.472717761993408, "global_step": 102646, "epoch": 2443} {"train_loss": -6.396275622504098, "global_step": 102647, "epoch": 2443, "val_loss": 64431.04296875} {"train_loss": -6.57427978515625, "global_step": 102648, "epoch": 2444} {"train_loss": -6.5025739669799805, "global_step": 102649, "epoch": 2444} {"train_loss": -6.430188179016113, "global_step": 102650, "epoch": 2444} {"train_loss": -6.475279808044434, "global_step": 102651, "epoch": 2444} {"train_loss": -6.384228706359863, "global_step": 102652, "epoch": 2444} {"train_loss": -6.457503318786621, "global_step": 102653, "epoch": 2444} {"train_loss": -6.369632244110107, "global_step": 102654, "epoch": 2444} {"train_loss": -6.4373064041137695, "global_step": 102655, "epoch": 2444} {"train_loss": -6.453891754150391, "global_step": 102656, "epoch": 2444} {"train_loss": -6.2149200439453125, "global_step": 102657, "epoch": 2444} {"train_loss": -6.362148761749268, "global_step": 102658, "epoch": 2444} {"train_loss": -6.4452314376831055, "global_step": 102659, "epoch": 2444} {"train_loss": -6.362712860107422, "global_step": 102660, "epoch": 2444} {"train_loss": -6.4061994552612305, "global_step": 102661, "epoch": 2444} {"train_loss": -6.423473358154297, "global_step": 102662, "epoch": 2444} {"train_loss": -6.389066696166992, "global_step": 102663, "epoch": 2444} {"train_loss": -6.409951210021973, "global_step": 102664, "epoch": 2444} {"train_loss": -6.370635986328125, "global_step": 102665, "epoch": 2444} {"train_loss": -6.487391471862793, "global_step": 102666, "epoch": 2444} {"train_loss": -6.406048774719238, "global_step": 102667, "epoch": 2444} {"train_loss": -6.361517906188965, "global_step": 102668, "epoch": 2444} {"train_loss": -6.470576286315918, "global_step": 102669, "epoch": 2444} {"train_loss": -6.389065742492676, "global_step": 102670, "epoch": 2444} {"train_loss": -6.442067623138428, "global_step": 102671, "epoch": 2444} {"train_loss": -6.330001354217529, "global_step": 102672, "epoch": 2444} {"train_loss": -6.475815773010254, "global_step": 102673, "epoch": 2444} {"train_loss": -6.349729537963867, "global_step": 102674, "epoch": 2444} {"train_loss": -6.518294811248779, "global_step": 102675, "epoch": 2444} {"train_loss": -6.419844150543213, "global_step": 102676, "epoch": 2444} {"train_loss": -6.428691864013672, "global_step": 102677, "epoch": 2444} {"train_loss": -6.225074291229248, "global_step": 102678, "epoch": 2444} {"train_loss": -6.428032875061035, "global_step": 102679, "epoch": 2444} {"train_loss": -6.260174751281738, "global_step": 102680, "epoch": 2444} {"train_loss": -6.397229194641113, "global_step": 102681, "epoch": 2444} {"train_loss": -6.364171981811523, "global_step": 102682, "epoch": 2444} {"train_loss": -6.3504157066345215, "global_step": 102683, "epoch": 2444} {"train_loss": -6.364950180053711, "global_step": 102684, "epoch": 2444} {"train_loss": -6.391153335571289, "global_step": 102685, "epoch": 2444} {"train_loss": -6.313695907592773, "global_step": 102686, "epoch": 2444} {"train_loss": -6.392465114593506, "global_step": 102687, "epoch": 2444} {"train_loss": -6.147819519042969, "global_step": 102688, "epoch": 2444} {"train_loss": -6.3921287059783936, "global_step": 102689, "epoch": 2444, "val_loss": 64302.8125} {"train_loss": -6.335309982299805, "global_step": 102690, "epoch": 2445} {"train_loss": -6.365958213806152, "global_step": 102691, "epoch": 2445} {"train_loss": -6.328789234161377, "global_step": 102692, "epoch": 2445} {"train_loss": -6.30898904800415, "global_step": 102693, "epoch": 2445} {"train_loss": -6.21005916595459, "global_step": 102694, "epoch": 2445} {"train_loss": -6.315145015716553, "global_step": 102695, "epoch": 2445} {"train_loss": -6.316089630126953, "global_step": 102696, "epoch": 2445} {"train_loss": -6.388009071350098, "global_step": 102697, "epoch": 2445} {"train_loss": -6.340198516845703, "global_step": 102698, "epoch": 2445} {"train_loss": -6.207221984863281, "global_step": 102699, "epoch": 2445} {"train_loss": -6.325428009033203, "global_step": 102700, "epoch": 2445} {"train_loss": -6.420398712158203, "global_step": 102701, "epoch": 2445} {"train_loss": -6.258163928985596, "global_step": 102702, "epoch": 2445} {"train_loss": -6.365195274353027, "global_step": 102703, "epoch": 2445} {"train_loss": -6.350790977478027, "global_step": 102704, "epoch": 2445} {"train_loss": -6.268810272216797, "global_step": 102705, "epoch": 2445} {"train_loss": -6.313530445098877, "global_step": 102706, "epoch": 2445} {"train_loss": -6.2926764488220215, "global_step": 102707, "epoch": 2445} {"train_loss": -6.274706840515137, "global_step": 102708, "epoch": 2445} {"train_loss": -6.171401023864746, "global_step": 102709, "epoch": 2445} {"train_loss": -6.344065189361572, "global_step": 102710, "epoch": 2445} {"train_loss": -6.22899055480957, "global_step": 102711, "epoch": 2445} {"train_loss": -6.2708845138549805, "global_step": 102712, "epoch": 2445} {"train_loss": -6.3822221755981445, "global_step": 102713, "epoch": 2445} {"train_loss": -6.288827419281006, "global_step": 102714, "epoch": 2445} {"train_loss": -6.341844081878662, "global_step": 102715, "epoch": 2445} {"train_loss": -6.2367658615112305, "global_step": 102716, "epoch": 2445} {"train_loss": -6.2271881103515625, "global_step": 102717, "epoch": 2445} {"train_loss": -6.2715606689453125, "global_step": 102718, "epoch": 2445} {"train_loss": -6.237682342529297, "global_step": 102719, "epoch": 2445} {"train_loss": -6.301060676574707, "global_step": 102720, "epoch": 2445} {"train_loss": -6.240726470947266, "global_step": 102721, "epoch": 2445} {"train_loss": -6.324028015136719, "global_step": 102722, "epoch": 2445} {"train_loss": -6.398375511169434, "global_step": 102723, "epoch": 2445} {"train_loss": -6.378361225128174, "global_step": 102724, "epoch": 2445} {"train_loss": -6.3428120613098145, "global_step": 102725, "epoch": 2445} {"train_loss": -6.346460342407227, "global_step": 102726, "epoch": 2445} {"train_loss": -6.362368583679199, "global_step": 102727, "epoch": 2445} {"train_loss": -6.437060356140137, "global_step": 102728, "epoch": 2445} {"train_loss": -6.301485061645508, "global_step": 102729, "epoch": 2445} {"train_loss": -6.365890979766846, "global_step": 102730, "epoch": 2445} {"train_loss": -6.314528238205683, "global_step": 102731, "epoch": 2445, "val_loss": 64284.76953125} {"train_loss": -6.441717624664307, "global_step": 102732, "epoch": 2446} {"train_loss": -6.338069915771484, "global_step": 102733, "epoch": 2446} {"train_loss": -6.319441795349121, "global_step": 102734, "epoch": 2446} {"train_loss": -6.510264873504639, "global_step": 102735, "epoch": 2446} {"train_loss": -6.380711555480957, "global_step": 102736, "epoch": 2446} {"train_loss": -6.350926876068115, "global_step": 102737, "epoch": 2446} {"train_loss": -6.430971145629883, "global_step": 102738, "epoch": 2446} {"train_loss": -6.384692192077637, "global_step": 102739, "epoch": 2446} {"train_loss": -6.475949287414551, "global_step": 102740, "epoch": 2446} {"train_loss": -6.360464572906494, "global_step": 102741, "epoch": 2446} {"train_loss": -6.315892219543457, "global_step": 102742, "epoch": 2446} {"train_loss": -6.429882049560547, "global_step": 102743, "epoch": 2446} {"train_loss": -6.407729148864746, "global_step": 102744, "epoch": 2446} {"train_loss": -6.293169975280762, "global_step": 102745, "epoch": 2446} {"train_loss": -6.290274620056152, "global_step": 102746, "epoch": 2446} {"train_loss": -6.325812339782715, "global_step": 102747, "epoch": 2446} {"train_loss": -6.490786552429199, "global_step": 102748, "epoch": 2446} {"train_loss": -6.349357604980469, "global_step": 102749, "epoch": 2446} {"train_loss": -6.41550350189209, "global_step": 102750, "epoch": 2446} {"train_loss": -6.30803108215332, "global_step": 102751, "epoch": 2446} {"train_loss": -6.359193801879883, "global_step": 102752, "epoch": 2446} {"train_loss": -6.367644786834717, "global_step": 102753, "epoch": 2446} {"train_loss": -6.337566375732422, "global_step": 102754, "epoch": 2446} {"train_loss": -6.353341102600098, "global_step": 102755, "epoch": 2446} {"train_loss": -6.2973456382751465, "global_step": 102756, "epoch": 2446} {"train_loss": -6.312641143798828, "global_step": 102757, "epoch": 2446} {"train_loss": -6.332461357116699, "global_step": 102758, "epoch": 2446} {"train_loss": -6.387088775634766, "global_step": 102759, "epoch": 2446} {"train_loss": -6.384344577789307, "global_step": 102760, "epoch": 2446} {"train_loss": -6.241872787475586, "global_step": 102761, "epoch": 2446} {"train_loss": -6.424917221069336, "global_step": 102762, "epoch": 2446} {"train_loss": -6.4696855545043945, "global_step": 102763, "epoch": 2446} {"train_loss": -6.362560272216797, "global_step": 102764, "epoch": 2446} {"train_loss": -6.55810022354126, "global_step": 102765, "epoch": 2446} {"train_loss": -6.388584136962891, "global_step": 102766, "epoch": 2446} {"train_loss": -6.471774578094482, "global_step": 102767, "epoch": 2446} {"train_loss": -6.473791122436523, "global_step": 102768, "epoch": 2446} {"train_loss": -6.463221549987793, "global_step": 102769, "epoch": 2446} {"train_loss": -6.423637866973877, "global_step": 102770, "epoch": 2446} {"train_loss": -6.256814956665039, "global_step": 102771, "epoch": 2446} {"train_loss": -6.452760696411133, "global_step": 102772, "epoch": 2446} {"train_loss": -6.384547097342355, "global_step": 102773, "epoch": 2446, "val_loss": 64183.3671875} {"train_loss": -6.424458026885986, "global_step": 102774, "epoch": 2447} {"train_loss": -6.481101036071777, "global_step": 102775, "epoch": 2447} {"train_loss": -6.4453864097595215, "global_step": 102776, "epoch": 2447} {"train_loss": -6.434188365936279, "global_step": 102777, "epoch": 2447} {"train_loss": -6.400629043579102, "global_step": 102778, "epoch": 2447} {"train_loss": -6.355740547180176, "global_step": 102779, "epoch": 2447} {"train_loss": -6.47646427154541, "global_step": 102780, "epoch": 2447} {"train_loss": -6.439748764038086, "global_step": 102781, "epoch": 2447} {"train_loss": -6.275732040405273, "global_step": 102782, "epoch": 2447} {"train_loss": -6.471251487731934, "global_step": 102783, "epoch": 2447} {"train_loss": -6.455538272857666, "global_step": 102784, "epoch": 2447} {"train_loss": -6.284575462341309, "global_step": 102785, "epoch": 2447} {"train_loss": -6.453952789306641, "global_step": 102786, "epoch": 2447} {"train_loss": -6.3687944412231445, "global_step": 102787, "epoch": 2447} {"train_loss": -6.301310062408447, "global_step": 102788, "epoch": 2447} {"train_loss": -6.44704532623291, "global_step": 102789, "epoch": 2447} {"train_loss": -6.438327312469482, "global_step": 102790, "epoch": 2447} {"train_loss": -6.4361114501953125, "global_step": 102791, "epoch": 2447} {"train_loss": -6.423247337341309, "global_step": 102792, "epoch": 2447} {"train_loss": -6.47243595123291, "global_step": 102793, "epoch": 2447} {"train_loss": -6.426562309265137, "global_step": 102794, "epoch": 2447} {"train_loss": -6.34919548034668, "global_step": 102795, "epoch": 2447} {"train_loss": -6.366302490234375, "global_step": 102796, "epoch": 2447} {"train_loss": -6.325571537017822, "global_step": 102797, "epoch": 2447} {"train_loss": -6.382445335388184, "global_step": 102798, "epoch": 2447} {"train_loss": -6.429714679718018, "global_step": 102799, "epoch": 2447} {"train_loss": -6.4346723556518555, "global_step": 102800, "epoch": 2447} {"train_loss": -6.279608726501465, "global_step": 102801, "epoch": 2447} {"train_loss": -6.420042991638184, "global_step": 102802, "epoch": 2447} {"train_loss": -6.420867919921875, "global_step": 102803, "epoch": 2447} {"train_loss": -6.381313323974609, "global_step": 102804, "epoch": 2447} {"train_loss": -6.469154357910156, "global_step": 102805, "epoch": 2447} {"train_loss": -6.416788101196289, "global_step": 102806, "epoch": 2447} {"train_loss": -6.42698335647583, "global_step": 102807, "epoch": 2447} {"train_loss": -6.378564834594727, "global_step": 102808, "epoch": 2447} {"train_loss": -6.333704471588135, "global_step": 102809, "epoch": 2447} {"train_loss": -6.441690444946289, "global_step": 102810, "epoch": 2447} {"train_loss": -6.523305416107178, "global_step": 102811, "epoch": 2447} {"train_loss": -6.328225135803223, "global_step": 102812, "epoch": 2447} {"train_loss": -6.38804292678833, "global_step": 102813, "epoch": 2447} {"train_loss": -6.530930519104004, "global_step": 102814, "epoch": 2447} {"train_loss": -6.407819100788662, "global_step": 102815, "epoch": 2447, "val_loss": 64460.0859375} {"train_loss": -6.424160957336426, "global_step": 102816, "epoch": 2448} {"train_loss": -6.467573165893555, "global_step": 102817, "epoch": 2448} {"train_loss": -6.345348834991455, "global_step": 102818, "epoch": 2448} {"train_loss": -6.371016502380371, "global_step": 102819, "epoch": 2448} {"train_loss": -6.480852127075195, "global_step": 102820, "epoch": 2448} {"train_loss": -6.366774559020996, "global_step": 102821, "epoch": 2448} {"train_loss": -6.393988132476807, "global_step": 102822, "epoch": 2448} {"train_loss": -6.366315841674805, "global_step": 102823, "epoch": 2448} {"train_loss": -6.440759181976318, "global_step": 102824, "epoch": 2448} {"train_loss": -6.475905418395996, "global_step": 102825, "epoch": 2448} {"train_loss": -6.441130638122559, "global_step": 102826, "epoch": 2448} {"train_loss": -6.369269847869873, "global_step": 102827, "epoch": 2448} {"train_loss": -6.384275913238525, "global_step": 102828, "epoch": 2448} {"train_loss": -6.476194381713867, "global_step": 102829, "epoch": 2448} {"train_loss": -6.452538967132568, "global_step": 102830, "epoch": 2448} {"train_loss": -6.4906744956970215, "global_step": 102831, "epoch": 2448} {"train_loss": -6.358234882354736, "global_step": 102832, "epoch": 2448} {"train_loss": -6.371854782104492, "global_step": 102833, "epoch": 2448} {"train_loss": -6.4929351806640625, "global_step": 102834, "epoch": 2448} {"train_loss": -6.570952892303467, "global_step": 102835, "epoch": 2448} {"train_loss": -6.462352275848389, "global_step": 102836, "epoch": 2448} {"train_loss": -6.425624847412109, "global_step": 102837, "epoch": 2448} {"train_loss": -6.46461296081543, "global_step": 102838, "epoch": 2448} {"train_loss": -6.424106121063232, "global_step": 102839, "epoch": 2448} {"train_loss": -6.415724277496338, "global_step": 102840, "epoch": 2448} {"train_loss": -6.430720806121826, "global_step": 102841, "epoch": 2448} {"train_loss": -6.3809404373168945, "global_step": 102842, "epoch": 2448} {"train_loss": -6.4511213302612305, "global_step": 102843, "epoch": 2448} {"train_loss": -6.385988712310791, "global_step": 102844, "epoch": 2448} {"train_loss": -6.449160575866699, "global_step": 102845, "epoch": 2448} {"train_loss": -6.399888515472412, "global_step": 102846, "epoch": 2448} {"train_loss": -6.451211452484131, "global_step": 102847, "epoch": 2448} {"train_loss": -6.370750427246094, "global_step": 102848, "epoch": 2448} {"train_loss": -6.447831153869629, "global_step": 102849, "epoch": 2448} {"train_loss": -6.497773170471191, "global_step": 102850, "epoch": 2448} {"train_loss": -6.343975067138672, "global_step": 102851, "epoch": 2448} {"train_loss": -6.352982044219971, "global_step": 102852, "epoch": 2448} {"train_loss": -6.4057159423828125, "global_step": 102853, "epoch": 2448} {"train_loss": -6.328351974487305, "global_step": 102854, "epoch": 2448} {"train_loss": -6.626571178436279, "global_step": 102855, "epoch": 2448} {"train_loss": -6.438088417053223, "global_step": 102856, "epoch": 2448} {"train_loss": -6.427353382110596, "global_step": 102857, "epoch": 2448, "val_loss": 64389.05078125} {"train_loss": -6.368817329406738, "global_step": 102858, "epoch": 2449} {"train_loss": -6.476405143737793, "global_step": 102859, "epoch": 2449} {"train_loss": -6.496724605560303, "global_step": 102860, "epoch": 2449} {"train_loss": -6.533444404602051, "global_step": 102861, "epoch": 2449} {"train_loss": -6.344448089599609, "global_step": 102862, "epoch": 2449} {"train_loss": -6.520673751831055, "global_step": 102863, "epoch": 2449} {"train_loss": -6.547447204589844, "global_step": 102864, "epoch": 2449} {"train_loss": -6.52894926071167, "global_step": 102865, "epoch": 2449} {"train_loss": -6.425395965576172, "global_step": 102866, "epoch": 2449} {"train_loss": -6.426314353942871, "global_step": 102867, "epoch": 2449} {"train_loss": -6.527456283569336, "global_step": 102868, "epoch": 2449} {"train_loss": -6.3243303298950195, "global_step": 102869, "epoch": 2449} {"train_loss": -6.288931369781494, "global_step": 102870, "epoch": 2449} {"train_loss": -6.376880168914795, "global_step": 102871, "epoch": 2449} {"train_loss": -6.376697540283203, "global_step": 102872, "epoch": 2449} {"train_loss": -6.367293357849121, "global_step": 102873, "epoch": 2449} {"train_loss": -6.484088897705078, "global_step": 102874, "epoch": 2449} {"train_loss": -6.289724349975586, "global_step": 102875, "epoch": 2449} {"train_loss": -6.278707504272461, "global_step": 102876, "epoch": 2449} {"train_loss": -6.376127243041992, "global_step": 102877, "epoch": 2449} {"train_loss": -6.303491592407227, "global_step": 102878, "epoch": 2449} {"train_loss": -6.198731899261475, "global_step": 102879, "epoch": 2449} {"train_loss": -6.355010986328125, "global_step": 102880, "epoch": 2449} {"train_loss": -6.208049774169922, "global_step": 102881, "epoch": 2449} {"train_loss": -6.364352226257324, "global_step": 102882, "epoch": 2449} {"train_loss": -6.266813278198242, "global_step": 102883, "epoch": 2449} {"train_loss": -6.349921226501465, "global_step": 102884, "epoch": 2449} {"train_loss": -6.3939008712768555, "global_step": 102885, "epoch": 2449} {"train_loss": -6.346817493438721, "global_step": 102886, "epoch": 2449} {"train_loss": -6.461536884307861, "global_step": 102887, "epoch": 2449} {"train_loss": -6.422025203704834, "global_step": 102888, "epoch": 2449} {"train_loss": -6.367673873901367, "global_step": 102889, "epoch": 2449} {"train_loss": -6.32503604888916, "global_step": 102890, "epoch": 2449} {"train_loss": -6.411020278930664, "global_step": 102891, "epoch": 2449} {"train_loss": -6.362390518188477, "global_step": 102892, "epoch": 2449} {"train_loss": -6.365182399749756, "global_step": 102893, "epoch": 2449} {"train_loss": -6.394371032714844, "global_step": 102894, "epoch": 2449} {"train_loss": -6.458188056945801, "global_step": 102895, "epoch": 2449} {"train_loss": -6.373562812805176, "global_step": 102896, "epoch": 2449} {"train_loss": -6.367542266845703, "global_step": 102897, "epoch": 2449} {"train_loss": -6.392287731170654, "global_step": 102898, "epoch": 2449} {"train_loss": -6.386957577296665, "global_step": 102899, "epoch": 2449, "val_loss": 64412.92578125} {"train_loss": -6.470737934112549, "global_step": 102900, "epoch": 2450} {"train_loss": -6.436136722564697, "global_step": 102901, "epoch": 2450} {"train_loss": -6.321206092834473, "global_step": 102902, "epoch": 2450} {"train_loss": -6.478105545043945, "global_step": 102903, "epoch": 2450} {"train_loss": -6.417150020599365, "global_step": 102904, "epoch": 2450} {"train_loss": -6.385078430175781, "global_step": 102905, "epoch": 2450} {"train_loss": -6.440460681915283, "global_step": 102906, "epoch": 2450} {"train_loss": -6.496112823486328, "global_step": 102907, "epoch": 2450} {"train_loss": -6.403214454650879, "global_step": 102908, "epoch": 2450} {"train_loss": -6.458954811096191, "global_step": 102909, "epoch": 2450} {"train_loss": -6.37818717956543, "global_step": 102910, "epoch": 2450} {"train_loss": -6.377817153930664, "global_step": 102911, "epoch": 2450} {"train_loss": -6.487859725952148, "global_step": 102912, "epoch": 2450} {"train_loss": -6.459907054901123, "global_step": 102913, "epoch": 2450} {"train_loss": -6.532101631164551, "global_step": 102914, "epoch": 2450} {"train_loss": -6.402931213378906, "global_step": 102915, "epoch": 2450} {"train_loss": -6.378063678741455, "global_step": 102916, "epoch": 2450} {"train_loss": -6.312005996704102, "global_step": 102917, "epoch": 2450} {"train_loss": -6.295269966125488, "global_step": 102918, "epoch": 2450} {"train_loss": -6.384042739868164, "global_step": 102919, "epoch": 2450} {"train_loss": -6.425005912780762, "global_step": 102920, "epoch": 2450} {"train_loss": -6.489780902862549, "global_step": 102921, "epoch": 2450} {"train_loss": -6.345768928527832, "global_step": 102922, "epoch": 2450} {"train_loss": -6.246875762939453, "global_step": 102923, "epoch": 2450} {"train_loss": -6.442307949066162, "global_step": 102924, "epoch": 2450} {"train_loss": -6.401349067687988, "global_step": 102925, "epoch": 2450} {"train_loss": -6.422094821929932, "global_step": 102926, "epoch": 2450} {"train_loss": -6.385639190673828, "global_step": 102927, "epoch": 2450} {"train_loss": -6.3890156745910645, "global_step": 102928, "epoch": 2450} {"train_loss": -6.3547468185424805, "global_step": 102929, "epoch": 2450} {"train_loss": -6.438719749450684, "global_step": 102930, "epoch": 2450} {"train_loss": -6.451791763305664, "global_step": 102931, "epoch": 2450} {"train_loss": -6.365668296813965, "global_step": 102932, "epoch": 2450} {"train_loss": -6.300666809082031, "global_step": 102933, "epoch": 2450} {"train_loss": -6.356110095977783, "global_step": 102934, "epoch": 2450} {"train_loss": -6.310125827789307, "global_step": 102935, "epoch": 2450} {"train_loss": -6.369991302490234, "global_step": 102936, "epoch": 2450} {"train_loss": -6.400836944580078, "global_step": 102937, "epoch": 2450} {"train_loss": -6.341791152954102, "global_step": 102938, "epoch": 2450} {"train_loss": -6.354142189025879, "global_step": 102939, "epoch": 2450} {"train_loss": -6.226157188415527, "global_step": 102940, "epoch": 2450} {"train_loss": -6.3938977264222645, "global_step": 102941, "epoch": 2450, "train/sim_max_reward_0": 0.19369788050148218, "train/sim_max_reward_1": 0.8130088836199486, "train/sim_max_reward_2": 0.8285933770824708, "train/sim_max_reward_3": 0.9795645245485267, "train/sim_max_reward_4": 0.9334240649282894, "train/sim_max_reward_5": 0.839443111465618, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.39582529539337685, "test/sim_max_reward_4300002": 0.9209885865622253, "test/sim_max_reward_4300003": 0.893580335743714, "test/sim_max_reward_4300004": 0.32038477572476104, "test/sim_max_reward_4300005": 0.5929618470180373, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.853526505632724, "test/sim_max_reward_4300008": 0.9875324779167924, "test/sim_max_reward_4300009": 0.9394984421307961, "test/sim_max_reward_4300010": 0.2651600047277854, "test/sim_max_reward_4300011": 0.30274546890242543, "test/sim_max_reward_4300012": 0.9492166927792306, "test/sim_max_reward_4300013": 0.411741732728802, "test/sim_max_reward_4300014": 0.9973692280083897, "test/sim_max_reward_4300015": 0.937464320393974, "test/sim_max_reward_4300016": 0.9563947976070648, "test/sim_max_reward_4300017": 0.6153538367465877, "test/sim_max_reward_4300018": 0.4393153143158452, "test/sim_max_reward_4300019": 0.1859560878829494, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8989190518833051, "test/sim_max_reward_4300022": 0.8950540585115276, "test/sim_max_reward_4300023": 0.3425770695882814, "test/sim_max_reward_4300024": 0.6082231846250628, "test/sim_max_reward_4300025": 0.6815360903339618, "test/sim_max_reward_4300026": 0.14667561306317067, "test/sim_max_reward_4300027": 0.9045879591006306, "test/sim_max_reward_4300028": 0.0135356799870151, "test/sim_max_reward_4300029": 0.6105955649292535, "test/sim_max_reward_4300030": 1.0, "test/sim_max_reward_4300031": 0.3870836043022726, "test/sim_max_reward_4300032": 0.9442084791738742, "test/sim_max_reward_4300033": 0.7580505531661762, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.42046137511566173, "test/sim_max_reward_4300036": 0.2022331595084727, "test/sim_max_reward_4300037": 1.0, "test/sim_max_reward_4300038": 0.6296824442497821, "test/sim_max_reward_4300039": 0.17192477318134766, "test/sim_max_reward_4300040": 0.36377367631356794, "test/sim_max_reward_4300041": 1.0, "test/sim_max_reward_4300042": 0.6124876334789066, "test/sim_max_reward_4300043": 0.994543828629462, "test/sim_max_reward_4300044": 0.6352568696368506, "test/sim_max_reward_4300045": 0.19193358387063633, "test/sim_max_reward_4300046": 0.8348682969024939, "test/sim_max_reward_4300047": 0.9206437199089713, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.06714009445518898, "train/mean_score": 0.7646219736910559, "test/mean_score": 0.564020242282627, "val_loss": 64630.22265625} {"train_loss": -6.4234418869018555, "global_step": 102942, "epoch": 2451} {"train_loss": -6.3443074226379395, "global_step": 102943, "epoch": 2451} {"train_loss": -6.342520236968994, "global_step": 102944, "epoch": 2451} {"train_loss": -6.282861709594727, "global_step": 102945, "epoch": 2451} {"train_loss": -6.5115203857421875, "global_step": 102946, "epoch": 2451} {"train_loss": -6.3376030921936035, "global_step": 102947, "epoch": 2451} {"train_loss": -6.2870330810546875, "global_step": 102948, "epoch": 2451} {"train_loss": -6.372923851013184, "global_step": 102949, "epoch": 2451} {"train_loss": -6.302369117736816, "global_step": 102950, "epoch": 2451} {"train_loss": -6.390058517456055, "global_step": 102951, "epoch": 2451} {"train_loss": -6.316438674926758, "global_step": 102952, "epoch": 2451} {"train_loss": -6.4285173416137695, "global_step": 102953, "epoch": 2451} {"train_loss": -6.357421875, "global_step": 102954, "epoch": 2451} {"train_loss": -6.32014799118042, "global_step": 102955, "epoch": 2451} {"train_loss": -6.455488204956055, "global_step": 102956, "epoch": 2451} {"train_loss": -6.361461162567139, "global_step": 102957, "epoch": 2451} {"train_loss": -6.345690727233887, "global_step": 102958, "epoch": 2451} {"train_loss": -6.341242790222168, "global_step": 102959, "epoch": 2451} {"train_loss": -6.482251167297363, "global_step": 102960, "epoch": 2451} {"train_loss": -6.380451202392578, "global_step": 102961, "epoch": 2451} {"train_loss": -6.362895965576172, "global_step": 102962, "epoch": 2451} {"train_loss": -6.474381446838379, "global_step": 102963, "epoch": 2451} {"train_loss": -6.2819108963012695, "global_step": 102964, "epoch": 2451} {"train_loss": -6.377805233001709, "global_step": 102965, "epoch": 2451} {"train_loss": -6.335227966308594, "global_step": 102966, "epoch": 2451} {"train_loss": -6.429792881011963, "global_step": 102967, "epoch": 2451} {"train_loss": -6.358330726623535, "global_step": 102968, "epoch": 2451} {"train_loss": -6.33723783493042, "global_step": 102969, "epoch": 2451} {"train_loss": -6.453660488128662, "global_step": 102970, "epoch": 2451} {"train_loss": -6.30562686920166, "global_step": 102971, "epoch": 2451} {"train_loss": -6.428377151489258, "global_step": 102972, "epoch": 2451} {"train_loss": -6.338953018188477, "global_step": 102973, "epoch": 2451} {"train_loss": -6.387462615966797, "global_step": 102974, "epoch": 2451} {"train_loss": -6.426782608032227, "global_step": 102975, "epoch": 2451} {"train_loss": -6.478023529052734, "global_step": 102976, "epoch": 2451} {"train_loss": -6.409337043762207, "global_step": 102977, "epoch": 2451} {"train_loss": -6.341923713684082, "global_step": 102978, "epoch": 2451} {"train_loss": -6.2723164558410645, "global_step": 102979, "epoch": 2451} {"train_loss": -6.323042869567871, "global_step": 102980, "epoch": 2451} {"train_loss": -6.331037521362305, "global_step": 102981, "epoch": 2451} {"train_loss": -6.354445457458496, "global_step": 102982, "epoch": 2451} {"train_loss": -6.370378868920462, "global_step": 102983, "epoch": 2451, "val_loss": 64594.48046875} {"train_loss": -6.390920162200928, "global_step": 102984, "epoch": 2452} {"train_loss": -6.284702777862549, "global_step": 102985, "epoch": 2452} {"train_loss": -6.410575866699219, "global_step": 102986, "epoch": 2452} {"train_loss": -6.346805572509766, "global_step": 102987, "epoch": 2452} {"train_loss": -6.389012336730957, "global_step": 102988, "epoch": 2452} {"train_loss": -6.394309997558594, "global_step": 102989, "epoch": 2452} {"train_loss": -6.360475540161133, "global_step": 102990, "epoch": 2452} {"train_loss": -6.4959917068481445, "global_step": 102991, "epoch": 2452} {"train_loss": -6.289595603942871, "global_step": 102992, "epoch": 2452} {"train_loss": -6.393089294433594, "global_step": 102993, "epoch": 2452} {"train_loss": -6.413584232330322, "global_step": 102994, "epoch": 2452} {"train_loss": -6.360311031341553, "global_step": 102995, "epoch": 2452} {"train_loss": -6.499239921569824, "global_step": 102996, "epoch": 2452} {"train_loss": -6.507012367248535, "global_step": 102997, "epoch": 2452} {"train_loss": -6.372092247009277, "global_step": 102998, "epoch": 2452} {"train_loss": -6.355910778045654, "global_step": 102999, "epoch": 2452} {"train_loss": -6.426059246063232, "global_step": 103000, "epoch": 2452} {"train_loss": -6.42603874206543, "global_step": 103001, "epoch": 2452} {"train_loss": -6.560223579406738, "global_step": 103002, "epoch": 2452} {"train_loss": -6.472573280334473, "global_step": 103003, "epoch": 2452} {"train_loss": -6.4978766441345215, "global_step": 103004, "epoch": 2452} {"train_loss": -6.493068695068359, "global_step": 103005, "epoch": 2452} {"train_loss": -6.424285888671875, "global_step": 103006, "epoch": 2452} {"train_loss": -6.407312393188477, "global_step": 103007, "epoch": 2452} {"train_loss": -6.524423122406006, "global_step": 103008, "epoch": 2452} {"train_loss": -6.326449394226074, "global_step": 103009, "epoch": 2452} {"train_loss": -6.392141342163086, "global_step": 103010, "epoch": 2452} {"train_loss": -6.385376930236816, "global_step": 103011, "epoch": 2452} {"train_loss": -6.389191627502441, "global_step": 103012, "epoch": 2452} {"train_loss": -6.490666389465332, "global_step": 103013, "epoch": 2452} {"train_loss": -6.3821258544921875, "global_step": 103014, "epoch": 2452} {"train_loss": -6.252289772033691, "global_step": 103015, "epoch": 2452} {"train_loss": -6.40511417388916, "global_step": 103016, "epoch": 2452} {"train_loss": -6.355975151062012, "global_step": 103017, "epoch": 2452} {"train_loss": -6.396496295928955, "global_step": 103018, "epoch": 2452} {"train_loss": -6.449183464050293, "global_step": 103019, "epoch": 2452} {"train_loss": -6.427348613739014, "global_step": 103020, "epoch": 2452} {"train_loss": -6.494104862213135, "global_step": 103021, "epoch": 2452} {"train_loss": -6.422217845916748, "global_step": 103022, "epoch": 2452} {"train_loss": -6.441712856292725, "global_step": 103023, "epoch": 2452} {"train_loss": -6.488862037658691, "global_step": 103024, "epoch": 2452} {"train_loss": -6.412657669612339, "global_step": 103025, "epoch": 2452, "val_loss": 64403.78125} {"train_loss": -6.4323835372924805, "global_step": 103026, "epoch": 2453} {"train_loss": -6.412459373474121, "global_step": 103027, "epoch": 2453} {"train_loss": -6.399112224578857, "global_step": 103028, "epoch": 2453} {"train_loss": -6.4651665687561035, "global_step": 103029, "epoch": 2453} {"train_loss": -6.422550201416016, "global_step": 103030, "epoch": 2453} {"train_loss": -6.343332290649414, "global_step": 103031, "epoch": 2453} {"train_loss": -6.374695301055908, "global_step": 103032, "epoch": 2453} {"train_loss": -6.432508945465088, "global_step": 103033, "epoch": 2453} {"train_loss": -6.390350341796875, "global_step": 103034, "epoch": 2453} {"train_loss": -6.349289894104004, "global_step": 103035, "epoch": 2453} {"train_loss": -6.307477951049805, "global_step": 103036, "epoch": 2453} {"train_loss": -6.418824195861816, "global_step": 103037, "epoch": 2453} {"train_loss": -6.314339637756348, "global_step": 103038, "epoch": 2453} {"train_loss": -6.31887149810791, "global_step": 103039, "epoch": 2453} {"train_loss": -6.308444976806641, "global_step": 103040, "epoch": 2453} {"train_loss": -6.387827396392822, "global_step": 103041, "epoch": 2453} {"train_loss": -6.3528876304626465, "global_step": 103042, "epoch": 2453} {"train_loss": -6.49272346496582, "global_step": 103043, "epoch": 2453} {"train_loss": -6.367610931396484, "global_step": 103044, "epoch": 2453} {"train_loss": -6.319535255432129, "global_step": 103045, "epoch": 2453} {"train_loss": -6.419661045074463, "global_step": 103046, "epoch": 2453} {"train_loss": -6.399361610412598, "global_step": 103047, "epoch": 2453} {"train_loss": -6.433083534240723, "global_step": 103048, "epoch": 2453} {"train_loss": -6.400446891784668, "global_step": 103049, "epoch": 2453} {"train_loss": -6.4435882568359375, "global_step": 103050, "epoch": 2453} {"train_loss": -6.479464530944824, "global_step": 103051, "epoch": 2453} {"train_loss": -6.497590065002441, "global_step": 103052, "epoch": 2453} {"train_loss": -6.503522872924805, "global_step": 103053, "epoch": 2453} {"train_loss": -6.384110450744629, "global_step": 103054, "epoch": 2453} {"train_loss": -6.440844535827637, "global_step": 103055, "epoch": 2453} {"train_loss": -6.3339104652404785, "global_step": 103056, "epoch": 2453} {"train_loss": -6.375506401062012, "global_step": 103057, "epoch": 2453} {"train_loss": -6.355195045471191, "global_step": 103058, "epoch": 2453} {"train_loss": -6.217896938323975, "global_step": 103059, "epoch": 2453} {"train_loss": -6.404555320739746, "global_step": 103060, "epoch": 2453} {"train_loss": -6.425081253051758, "global_step": 103061, "epoch": 2453} {"train_loss": -6.468733787536621, "global_step": 103062, "epoch": 2453} {"train_loss": -6.454634666442871, "global_step": 103063, "epoch": 2453} {"train_loss": -6.4600958824157715, "global_step": 103064, "epoch": 2453} {"train_loss": -6.344199180603027, "global_step": 103065, "epoch": 2453} {"train_loss": -6.438518524169922, "global_step": 103066, "epoch": 2453} {"train_loss": -6.399586041768392, "global_step": 103067, "epoch": 2453, "val_loss": 64339.12109375} {"train_loss": -6.427485466003418, "global_step": 103068, "epoch": 2454} {"train_loss": -6.404326438903809, "global_step": 103069, "epoch": 2454} {"train_loss": -6.392335891723633, "global_step": 103070, "epoch": 2454} {"train_loss": -6.516919136047363, "global_step": 103071, "epoch": 2454} {"train_loss": -6.416444778442383, "global_step": 103072, "epoch": 2454} {"train_loss": -6.488694190979004, "global_step": 103073, "epoch": 2454} {"train_loss": -6.515064239501953, "global_step": 103074, "epoch": 2454} {"train_loss": -6.516640663146973, "global_step": 103075, "epoch": 2454} {"train_loss": -6.402741432189941, "global_step": 103076, "epoch": 2454} {"train_loss": -6.372923851013184, "global_step": 103077, "epoch": 2454} {"train_loss": -6.37162971496582, "global_step": 103078, "epoch": 2454} {"train_loss": -6.472538948059082, "global_step": 103079, "epoch": 2454} {"train_loss": -6.47725772857666, "global_step": 103080, "epoch": 2454} {"train_loss": -6.407018661499023, "global_step": 103081, "epoch": 2454} {"train_loss": -6.4771504402160645, "global_step": 103082, "epoch": 2454} {"train_loss": -6.543027400970459, "global_step": 103083, "epoch": 2454} {"train_loss": -6.295856952667236, "global_step": 103084, "epoch": 2454} {"train_loss": -6.308881759643555, "global_step": 103085, "epoch": 2454} {"train_loss": -6.339064598083496, "global_step": 103086, "epoch": 2454} {"train_loss": -6.465631484985352, "global_step": 103087, "epoch": 2454} {"train_loss": -6.485918998718262, "global_step": 103088, "epoch": 2454} {"train_loss": -6.5624823570251465, "global_step": 103089, "epoch": 2454} {"train_loss": -6.489567279815674, "global_step": 103090, "epoch": 2454} {"train_loss": -6.409609794616699, "global_step": 103091, "epoch": 2454} {"train_loss": -6.428574562072754, "global_step": 103092, "epoch": 2454} {"train_loss": -6.427912712097168, "global_step": 103093, "epoch": 2454} {"train_loss": -6.531624794006348, "global_step": 103094, "epoch": 2454} {"train_loss": -6.4158453941345215, "global_step": 103095, "epoch": 2454} {"train_loss": -6.404814720153809, "global_step": 103096, "epoch": 2454} {"train_loss": -6.392844200134277, "global_step": 103097, "epoch": 2454} {"train_loss": -6.395914077758789, "global_step": 103098, "epoch": 2454} {"train_loss": -6.359451770782471, "global_step": 103099, "epoch": 2454} {"train_loss": -6.414246559143066, "global_step": 103100, "epoch": 2454} {"train_loss": -6.268510818481445, "global_step": 103101, "epoch": 2454} {"train_loss": -6.431735038757324, "global_step": 103102, "epoch": 2454} {"train_loss": -6.3712873458862305, "global_step": 103103, "epoch": 2454} {"train_loss": -6.376698970794678, "global_step": 103104, "epoch": 2454} {"train_loss": -6.491680145263672, "global_step": 103105, "epoch": 2454} {"train_loss": -6.408134937286377, "global_step": 103106, "epoch": 2454} {"train_loss": -6.517530918121338, "global_step": 103107, "epoch": 2454} {"train_loss": -6.358892917633057, "global_step": 103108, "epoch": 2454} {"train_loss": -6.422452960695539, "global_step": 103109, "epoch": 2454, "val_loss": 64279.18359375} {"train_loss": -6.320634365081787, "global_step": 103110, "epoch": 2455} {"train_loss": -6.440113067626953, "global_step": 103111, "epoch": 2455} {"train_loss": -6.356348991394043, "global_step": 103112, "epoch": 2455} {"train_loss": -6.4279327392578125, "global_step": 103113, "epoch": 2455} {"train_loss": -6.483260631561279, "global_step": 103114, "epoch": 2455} {"train_loss": -6.524226188659668, "global_step": 103115, "epoch": 2455} {"train_loss": -6.433292388916016, "global_step": 103116, "epoch": 2455} {"train_loss": -6.5245795249938965, "global_step": 103117, "epoch": 2455} {"train_loss": -6.434383869171143, "global_step": 103118, "epoch": 2455} {"train_loss": -6.451739311218262, "global_step": 103119, "epoch": 2455} {"train_loss": -6.422440528869629, "global_step": 103120, "epoch": 2455} {"train_loss": -6.457249164581299, "global_step": 103121, "epoch": 2455} {"train_loss": -6.319418907165527, "global_step": 103122, "epoch": 2455} {"train_loss": -6.3866095542907715, "global_step": 103123, "epoch": 2455} {"train_loss": -6.516111850738525, "global_step": 103124, "epoch": 2455} {"train_loss": -6.42921257019043, "global_step": 103125, "epoch": 2455} {"train_loss": -6.418715476989746, "global_step": 103126, "epoch": 2455} {"train_loss": -6.365565299987793, "global_step": 103127, "epoch": 2455} {"train_loss": -6.385250568389893, "global_step": 103128, "epoch": 2455} {"train_loss": -6.523597240447998, "global_step": 103129, "epoch": 2455} {"train_loss": -6.436740875244141, "global_step": 103130, "epoch": 2455} {"train_loss": -6.4313812255859375, "global_step": 103131, "epoch": 2455} {"train_loss": -6.410452842712402, "global_step": 103132, "epoch": 2455} {"train_loss": -6.378865718841553, "global_step": 103133, "epoch": 2455} {"train_loss": -6.431060791015625, "global_step": 103134, "epoch": 2455} {"train_loss": -6.372553825378418, "global_step": 103135, "epoch": 2455} {"train_loss": -6.491229057312012, "global_step": 103136, "epoch": 2455} {"train_loss": -6.39732551574707, "global_step": 103137, "epoch": 2455} {"train_loss": -6.428611755371094, "global_step": 103138, "epoch": 2455} {"train_loss": -6.425265312194824, "global_step": 103139, "epoch": 2455} {"train_loss": -6.435739517211914, "global_step": 103140, "epoch": 2455} {"train_loss": -6.3924455642700195, "global_step": 103141, "epoch": 2455} {"train_loss": -6.334653854370117, "global_step": 103142, "epoch": 2455} {"train_loss": -6.364145278930664, "global_step": 103143, "epoch": 2455} {"train_loss": -6.345717906951904, "global_step": 103144, "epoch": 2455} {"train_loss": -6.333998680114746, "global_step": 103145, "epoch": 2455} {"train_loss": -6.5152788162231445, "global_step": 103146, "epoch": 2455} {"train_loss": -6.420698642730713, "global_step": 103147, "epoch": 2455} {"train_loss": -6.4805908203125, "global_step": 103148, "epoch": 2455} {"train_loss": -6.34654426574707, "global_step": 103149, "epoch": 2455} {"train_loss": -6.354034423828125, "global_step": 103150, "epoch": 2455} {"train_loss": -6.418800649188814, "global_step": 103151, "epoch": 2455, "val_loss": 64320.25390625} {"train_loss": -6.440059661865234, "global_step": 103152, "epoch": 2456} {"train_loss": -6.434804439544678, "global_step": 103153, "epoch": 2456} {"train_loss": -6.341928482055664, "global_step": 103154, "epoch": 2456} {"train_loss": -6.3127946853637695, "global_step": 103155, "epoch": 2456} {"train_loss": -6.41806697845459, "global_step": 103156, "epoch": 2456} {"train_loss": -6.443154335021973, "global_step": 103157, "epoch": 2456} {"train_loss": -6.319032192230225, "global_step": 103158, "epoch": 2456} {"train_loss": -6.372747421264648, "global_step": 103159, "epoch": 2456} {"train_loss": -6.412430763244629, "global_step": 103160, "epoch": 2456} {"train_loss": -6.574973106384277, "global_step": 103161, "epoch": 2456} {"train_loss": -6.452967166900635, "global_step": 103162, "epoch": 2456} {"train_loss": -6.491343021392822, "global_step": 103163, "epoch": 2456} {"train_loss": -6.49992036819458, "global_step": 103164, "epoch": 2456} {"train_loss": -6.338750839233398, "global_step": 103165, "epoch": 2456} {"train_loss": -6.304441452026367, "global_step": 103166, "epoch": 2456} {"train_loss": -6.369207382202148, "global_step": 103167, "epoch": 2456} {"train_loss": -6.342313766479492, "global_step": 103168, "epoch": 2456} {"train_loss": -6.2069091796875, "global_step": 103169, "epoch": 2456} {"train_loss": -6.427030563354492, "global_step": 103170, "epoch": 2456} {"train_loss": -6.390205383300781, "global_step": 103171, "epoch": 2456} {"train_loss": -6.380823612213135, "global_step": 103172, "epoch": 2456} {"train_loss": -6.407337188720703, "global_step": 103173, "epoch": 2456} {"train_loss": -6.436631679534912, "global_step": 103174, "epoch": 2456} {"train_loss": -6.419011116027832, "global_step": 103175, "epoch": 2456} {"train_loss": -6.446916580200195, "global_step": 103176, "epoch": 2456} {"train_loss": -6.535404205322266, "global_step": 103177, "epoch": 2456} {"train_loss": -6.446219444274902, "global_step": 103178, "epoch": 2456} {"train_loss": -6.484671592712402, "global_step": 103179, "epoch": 2456} {"train_loss": -6.49333381652832, "global_step": 103180, "epoch": 2456} {"train_loss": -6.574384689331055, "global_step": 103181, "epoch": 2456} {"train_loss": -6.40666389465332, "global_step": 103182, "epoch": 2456} {"train_loss": -6.445427894592285, "global_step": 103183, "epoch": 2456} {"train_loss": -6.403243064880371, "global_step": 103184, "epoch": 2456} {"train_loss": -6.538974761962891, "global_step": 103185, "epoch": 2456} {"train_loss": -6.405501842498779, "global_step": 103186, "epoch": 2456} {"train_loss": -6.451066017150879, "global_step": 103187, "epoch": 2456} {"train_loss": -6.423451900482178, "global_step": 103188, "epoch": 2456} {"train_loss": -6.409322738647461, "global_step": 103189, "epoch": 2456} {"train_loss": -6.47260856628418, "global_step": 103190, "epoch": 2456} {"train_loss": -6.314586639404297, "global_step": 103191, "epoch": 2456} {"train_loss": -6.512768745422363, "global_step": 103192, "epoch": 2456} {"train_loss": -6.422611440931048, "global_step": 103193, "epoch": 2456, "val_loss": 64295.15234375} {"train_loss": -6.462085723876953, "global_step": 103194, "epoch": 2457} {"train_loss": -6.461197853088379, "global_step": 103195, "epoch": 2457} {"train_loss": -6.314425468444824, "global_step": 103196, "epoch": 2457} {"train_loss": -6.487783432006836, "global_step": 103197, "epoch": 2457} {"train_loss": -6.367599010467529, "global_step": 103198, "epoch": 2457} {"train_loss": -6.409271240234375, "global_step": 103199, "epoch": 2457} {"train_loss": -6.327340602874756, "global_step": 103200, "epoch": 2457} {"train_loss": -6.430411338806152, "global_step": 103201, "epoch": 2457} {"train_loss": -6.388157844543457, "global_step": 103202, "epoch": 2457} {"train_loss": -6.482455253601074, "global_step": 103203, "epoch": 2457} {"train_loss": -6.321718692779541, "global_step": 103204, "epoch": 2457} {"train_loss": -6.37691593170166, "global_step": 103205, "epoch": 2457} {"train_loss": -6.335719585418701, "global_step": 103206, "epoch": 2457} {"train_loss": -6.431240558624268, "global_step": 103207, "epoch": 2457} {"train_loss": -6.443645477294922, "global_step": 103208, "epoch": 2457} {"train_loss": -6.416767120361328, "global_step": 103209, "epoch": 2457} {"train_loss": -6.291453838348389, "global_step": 103210, "epoch": 2457} {"train_loss": -6.284477233886719, "global_step": 103211, "epoch": 2457} {"train_loss": -6.358621597290039, "global_step": 103212, "epoch": 2457} {"train_loss": -6.387786865234375, "global_step": 103213, "epoch": 2457} {"train_loss": -6.3148603439331055, "global_step": 103214, "epoch": 2457} {"train_loss": -6.306638717651367, "global_step": 103215, "epoch": 2457} {"train_loss": -6.343473434448242, "global_step": 103216, "epoch": 2457} {"train_loss": -6.294527053833008, "global_step": 103217, "epoch": 2457} {"train_loss": -6.386911869049072, "global_step": 103218, "epoch": 2457} {"train_loss": -6.382512092590332, "global_step": 103219, "epoch": 2457} {"train_loss": -6.307291030883789, "global_step": 103220, "epoch": 2457} {"train_loss": -6.253072738647461, "global_step": 103221, "epoch": 2457} {"train_loss": -6.2310333251953125, "global_step": 103222, "epoch": 2457} {"train_loss": -6.348634719848633, "global_step": 103223, "epoch": 2457} {"train_loss": -6.279532432556152, "global_step": 103224, "epoch": 2457} {"train_loss": -6.32935905456543, "global_step": 103225, "epoch": 2457} {"train_loss": -6.367988586425781, "global_step": 103226, "epoch": 2457} {"train_loss": -6.361078262329102, "global_step": 103227, "epoch": 2457} {"train_loss": -6.26304817199707, "global_step": 103228, "epoch": 2457} {"train_loss": -6.373417854309082, "global_step": 103229, "epoch": 2457} {"train_loss": -6.322216510772705, "global_step": 103230, "epoch": 2457} {"train_loss": -6.288381576538086, "global_step": 103231, "epoch": 2457} {"train_loss": -6.488614559173584, "global_step": 103232, "epoch": 2457} {"train_loss": -6.376686096191406, "global_step": 103233, "epoch": 2457} {"train_loss": -6.367005348205566, "global_step": 103234, "epoch": 2457} {"train_loss": -6.359403280984788, "global_step": 103235, "epoch": 2457, "val_loss": 64415.10546875} {"train_loss": -6.304056167602539, "global_step": 103236, "epoch": 2458} {"train_loss": -6.28945779800415, "global_step": 103237, "epoch": 2458} {"train_loss": -6.427356719970703, "global_step": 103238, "epoch": 2458} {"train_loss": -6.378596305847168, "global_step": 103239, "epoch": 2458} {"train_loss": -6.343298435211182, "global_step": 103240, "epoch": 2458} {"train_loss": -6.440924167633057, "global_step": 103241, "epoch": 2458} {"train_loss": -6.403717994689941, "global_step": 103242, "epoch": 2458} {"train_loss": -6.357407569885254, "global_step": 103243, "epoch": 2458} {"train_loss": -6.348639488220215, "global_step": 103244, "epoch": 2458} {"train_loss": -6.4307146072387695, "global_step": 103245, "epoch": 2458} {"train_loss": -6.498633861541748, "global_step": 103246, "epoch": 2458} {"train_loss": -6.519193172454834, "global_step": 103247, "epoch": 2458} {"train_loss": -6.477176666259766, "global_step": 103248, "epoch": 2458} {"train_loss": -6.466947078704834, "global_step": 103249, "epoch": 2458} {"train_loss": -6.475072860717773, "global_step": 103250, "epoch": 2458} {"train_loss": -6.4320068359375, "global_step": 103251, "epoch": 2458} {"train_loss": -6.4838032722473145, "global_step": 103252, "epoch": 2458} {"train_loss": -6.429957389831543, "global_step": 103253, "epoch": 2458} {"train_loss": -6.523730278015137, "global_step": 103254, "epoch": 2458} {"train_loss": -6.476650714874268, "global_step": 103255, "epoch": 2458} {"train_loss": -6.383033752441406, "global_step": 103256, "epoch": 2458} {"train_loss": -6.477316856384277, "global_step": 103257, "epoch": 2458} {"train_loss": -6.436680793762207, "global_step": 103258, "epoch": 2458} {"train_loss": -6.510534286499023, "global_step": 103259, "epoch": 2458} {"train_loss": -6.384551048278809, "global_step": 103260, "epoch": 2458} {"train_loss": -6.420663833618164, "global_step": 103261, "epoch": 2458} {"train_loss": -6.387948513031006, "global_step": 103262, "epoch": 2458} {"train_loss": -6.525559425354004, "global_step": 103263, "epoch": 2458} {"train_loss": -6.376518249511719, "global_step": 103264, "epoch": 2458} {"train_loss": -6.411069393157959, "global_step": 103265, "epoch": 2458} {"train_loss": -6.38355827331543, "global_step": 103266, "epoch": 2458} {"train_loss": -6.330401420593262, "global_step": 103267, "epoch": 2458} {"train_loss": -6.302358627319336, "global_step": 103268, "epoch": 2458} {"train_loss": -6.321022987365723, "global_step": 103269, "epoch": 2458} {"train_loss": -6.478010654449463, "global_step": 103270, "epoch": 2458} {"train_loss": -6.325070858001709, "global_step": 103271, "epoch": 2458} {"train_loss": -6.409732818603516, "global_step": 103272, "epoch": 2458} {"train_loss": -6.36171817779541, "global_step": 103273, "epoch": 2458} {"train_loss": -6.358750343322754, "global_step": 103274, "epoch": 2458} {"train_loss": -6.478005409240723, "global_step": 103275, "epoch": 2458} {"train_loss": -6.329504013061523, "global_step": 103276, "epoch": 2458} {"train_loss": -6.413746856507801, "global_step": 103277, "epoch": 2458, "val_loss": 64414.09375} {"train_loss": -6.500576019287109, "global_step": 103278, "epoch": 2459} {"train_loss": -6.390692710876465, "global_step": 103279, "epoch": 2459} {"train_loss": -6.479486465454102, "global_step": 103280, "epoch": 2459} {"train_loss": -6.445069789886475, "global_step": 103281, "epoch": 2459} {"train_loss": -6.546594619750977, "global_step": 103282, "epoch": 2459} {"train_loss": -6.4833984375, "global_step": 103283, "epoch": 2459} {"train_loss": -6.317380905151367, "global_step": 103284, "epoch": 2459} {"train_loss": -6.382631778717041, "global_step": 103285, "epoch": 2459} {"train_loss": -6.486728191375732, "global_step": 103286, "epoch": 2459} {"train_loss": -6.463345527648926, "global_step": 103287, "epoch": 2459} {"train_loss": -6.496546745300293, "global_step": 103288, "epoch": 2459} {"train_loss": -6.433253288269043, "global_step": 103289, "epoch": 2459} {"train_loss": -6.443885326385498, "global_step": 103290, "epoch": 2459} {"train_loss": -6.392386436462402, "global_step": 103291, "epoch": 2459} {"train_loss": -6.40763521194458, "global_step": 103292, "epoch": 2459} {"train_loss": -6.422967433929443, "global_step": 103293, "epoch": 2459} {"train_loss": -6.376148223876953, "global_step": 103294, "epoch": 2459} {"train_loss": -6.307494640350342, "global_step": 103295, "epoch": 2459} {"train_loss": -6.512777805328369, "global_step": 103296, "epoch": 2459} {"train_loss": -6.357534408569336, "global_step": 103297, "epoch": 2459} {"train_loss": -6.32074499130249, "global_step": 103298, "epoch": 2459} {"train_loss": -6.409809112548828, "global_step": 103299, "epoch": 2459} {"train_loss": -6.405824184417725, "global_step": 103300, "epoch": 2459} {"train_loss": -6.326670169830322, "global_step": 103301, "epoch": 2459} {"train_loss": -6.372365951538086, "global_step": 103302, "epoch": 2459} {"train_loss": -6.3503098487854, "global_step": 103303, "epoch": 2459} {"train_loss": -6.408105850219727, "global_step": 103304, "epoch": 2459} {"train_loss": -6.376367568969727, "global_step": 103305, "epoch": 2459} {"train_loss": -6.377132415771484, "global_step": 103306, "epoch": 2459} {"train_loss": -6.439141273498535, "global_step": 103307, "epoch": 2459} {"train_loss": -6.473069190979004, "global_step": 103308, "epoch": 2459} {"train_loss": -6.536571979522705, "global_step": 103309, "epoch": 2459} {"train_loss": -6.278326988220215, "global_step": 103310, "epoch": 2459} {"train_loss": -6.470174789428711, "global_step": 103311, "epoch": 2459} {"train_loss": -6.336008548736572, "global_step": 103312, "epoch": 2459} {"train_loss": -6.460214138031006, "global_step": 103313, "epoch": 2459} {"train_loss": -6.419633865356445, "global_step": 103314, "epoch": 2459} {"train_loss": -6.339591026306152, "global_step": 103315, "epoch": 2459} {"train_loss": -6.462983131408691, "global_step": 103316, "epoch": 2459} {"train_loss": -6.5472822189331055, "global_step": 103317, "epoch": 2459} {"train_loss": -6.425880432128906, "global_step": 103318, "epoch": 2459} {"train_loss": -6.420672518866403, "global_step": 103319, "epoch": 2459, "val_loss": 64287.859375} {"train_loss": -6.442801475524902, "global_step": 103320, "epoch": 2460} {"train_loss": -6.5578083992004395, "global_step": 103321, "epoch": 2460} {"train_loss": -6.257788181304932, "global_step": 103322, "epoch": 2460} {"train_loss": -6.33494758605957, "global_step": 103323, "epoch": 2460} {"train_loss": -6.29269552230835, "global_step": 103324, "epoch": 2460} {"train_loss": -6.357755184173584, "global_step": 103325, "epoch": 2460} {"train_loss": -6.426170349121094, "global_step": 103326, "epoch": 2460} {"train_loss": -6.394749641418457, "global_step": 103327, "epoch": 2460} {"train_loss": -6.312340259552002, "global_step": 103328, "epoch": 2460} {"train_loss": -6.508190155029297, "global_step": 103329, "epoch": 2460} {"train_loss": -6.453685760498047, "global_step": 103330, "epoch": 2460} {"train_loss": -6.487826824188232, "global_step": 103331, "epoch": 2460} {"train_loss": -6.321556568145752, "global_step": 103332, "epoch": 2460} {"train_loss": -6.40549373626709, "global_step": 103333, "epoch": 2460} {"train_loss": -6.473669052124023, "global_step": 103334, "epoch": 2460} {"train_loss": -6.375502586364746, "global_step": 103335, "epoch": 2460} {"train_loss": -6.453309059143066, "global_step": 103336, "epoch": 2460} {"train_loss": -6.529477119445801, "global_step": 103337, "epoch": 2460} {"train_loss": -6.2927751541137695, "global_step": 103338, "epoch": 2460} {"train_loss": -6.638542175292969, "global_step": 103339, "epoch": 2460} {"train_loss": -6.250449180603027, "global_step": 103340, "epoch": 2460} {"train_loss": -6.332149028778076, "global_step": 103341, "epoch": 2460} {"train_loss": -6.438510894775391, "global_step": 103342, "epoch": 2460} {"train_loss": -6.249654769897461, "global_step": 103343, "epoch": 2460} {"train_loss": -6.400389671325684, "global_step": 103344, "epoch": 2460} {"train_loss": -6.452134132385254, "global_step": 103345, "epoch": 2460} {"train_loss": -6.469747543334961, "global_step": 103346, "epoch": 2460} {"train_loss": -6.309605598449707, "global_step": 103347, "epoch": 2460} {"train_loss": -6.295539855957031, "global_step": 103348, "epoch": 2460} {"train_loss": -6.306362628936768, "global_step": 103349, "epoch": 2460} {"train_loss": -6.323925971984863, "global_step": 103350, "epoch": 2460} {"train_loss": -6.33480978012085, "global_step": 103351, "epoch": 2460} {"train_loss": -6.313873291015625, "global_step": 103352, "epoch": 2460} {"train_loss": -6.265069007873535, "global_step": 103353, "epoch": 2460} {"train_loss": -6.329317092895508, "global_step": 103354, "epoch": 2460} {"train_loss": -6.337263584136963, "global_step": 103355, "epoch": 2460} {"train_loss": -6.3911237716674805, "global_step": 103356, "epoch": 2460} {"train_loss": -6.360966205596924, "global_step": 103357, "epoch": 2460} {"train_loss": -6.444437026977539, "global_step": 103358, "epoch": 2460} {"train_loss": -6.466376304626465, "global_step": 103359, "epoch": 2460} {"train_loss": -6.349369049072266, "global_step": 103360, "epoch": 2460} {"train_loss": -6.384307373137701, "global_step": 103361, "epoch": 2460, "val_loss": 64368.9921875} {"train_loss": -6.407452583312988, "global_step": 103362, "epoch": 2461} {"train_loss": -6.506838798522949, "global_step": 103363, "epoch": 2461} {"train_loss": -6.262743949890137, "global_step": 103364, "epoch": 2461} {"train_loss": -6.465116500854492, "global_step": 103365, "epoch": 2461} {"train_loss": -6.486931324005127, "global_step": 103366, "epoch": 2461} {"train_loss": -6.3242011070251465, "global_step": 103367, "epoch": 2461} {"train_loss": -6.297936916351318, "global_step": 103368, "epoch": 2461} {"train_loss": -6.408292770385742, "global_step": 103369, "epoch": 2461} {"train_loss": -6.3927106857299805, "global_step": 103370, "epoch": 2461} {"train_loss": -6.44296407699585, "global_step": 103371, "epoch": 2461} {"train_loss": -6.321541786193848, "global_step": 103372, "epoch": 2461} {"train_loss": -6.386361122131348, "global_step": 103373, "epoch": 2461} {"train_loss": -6.307451248168945, "global_step": 103374, "epoch": 2461} {"train_loss": -6.4202094078063965, "global_step": 103375, "epoch": 2461} {"train_loss": -6.477450370788574, "global_step": 103376, "epoch": 2461} {"train_loss": -6.514402389526367, "global_step": 103377, "epoch": 2461} {"train_loss": -6.34977388381958, "global_step": 103378, "epoch": 2461} {"train_loss": -6.414041042327881, "global_step": 103379, "epoch": 2461} {"train_loss": -6.401575088500977, "global_step": 103380, "epoch": 2461} {"train_loss": -6.450108528137207, "global_step": 103381, "epoch": 2461} {"train_loss": -6.45341682434082, "global_step": 103382, "epoch": 2461} {"train_loss": -6.518801689147949, "global_step": 103383, "epoch": 2461} {"train_loss": -6.479864597320557, "global_step": 103384, "epoch": 2461} {"train_loss": -6.49429178237915, "global_step": 103385, "epoch": 2461} {"train_loss": -6.504612445831299, "global_step": 103386, "epoch": 2461} {"train_loss": -6.504332542419434, "global_step": 103387, "epoch": 2461} {"train_loss": -6.490606307983398, "global_step": 103388, "epoch": 2461} {"train_loss": -6.402015686035156, "global_step": 103389, "epoch": 2461} {"train_loss": -6.41426944732666, "global_step": 103390, "epoch": 2461} {"train_loss": -6.344686031341553, "global_step": 103391, "epoch": 2461} {"train_loss": -6.333662986755371, "global_step": 103392, "epoch": 2461} {"train_loss": -6.421154975891113, "global_step": 103393, "epoch": 2461} {"train_loss": -6.4425554275512695, "global_step": 103394, "epoch": 2461} {"train_loss": -6.495870590209961, "global_step": 103395, "epoch": 2461} {"train_loss": -6.422850608825684, "global_step": 103396, "epoch": 2461} {"train_loss": -6.413200855255127, "global_step": 103397, "epoch": 2461} {"train_loss": -6.432130813598633, "global_step": 103398, "epoch": 2461} {"train_loss": -6.442326545715332, "global_step": 103399, "epoch": 2461} {"train_loss": -6.457649230957031, "global_step": 103400, "epoch": 2461} {"train_loss": -6.455080032348633, "global_step": 103401, "epoch": 2461} {"train_loss": -6.402467727661133, "global_step": 103402, "epoch": 2461} {"train_loss": -6.421614238194057, "global_step": 103403, "epoch": 2461, "val_loss": 64328.5859375} {"train_loss": -6.498544216156006, "global_step": 103404, "epoch": 2462} {"train_loss": -6.55418586730957, "global_step": 103405, "epoch": 2462} {"train_loss": -6.45558500289917, "global_step": 103406, "epoch": 2462} {"train_loss": -6.407044410705566, "global_step": 103407, "epoch": 2462} {"train_loss": -6.364315986633301, "global_step": 103408, "epoch": 2462} {"train_loss": -6.447333335876465, "global_step": 103409, "epoch": 2462} {"train_loss": -6.402610778808594, "global_step": 103410, "epoch": 2462} {"train_loss": -6.436600685119629, "global_step": 103411, "epoch": 2462} {"train_loss": -6.442422389984131, "global_step": 103412, "epoch": 2462} {"train_loss": -6.387942314147949, "global_step": 103413, "epoch": 2462} {"train_loss": -6.436497688293457, "global_step": 103414, "epoch": 2462} {"train_loss": -6.5493483543396, "global_step": 103415, "epoch": 2462} {"train_loss": -6.416567802429199, "global_step": 103416, "epoch": 2462} {"train_loss": -6.25839900970459, "global_step": 103417, "epoch": 2462} {"train_loss": -6.422068119049072, "global_step": 103418, "epoch": 2462} {"train_loss": -6.331384658813477, "global_step": 103419, "epoch": 2462} {"train_loss": -6.471224784851074, "global_step": 103420, "epoch": 2462} {"train_loss": -6.5029706954956055, "global_step": 103421, "epoch": 2462} {"train_loss": -6.275946617126465, "global_step": 103422, "epoch": 2462} {"train_loss": -6.43224573135376, "global_step": 103423, "epoch": 2462} {"train_loss": -6.454645156860352, "global_step": 103424, "epoch": 2462} {"train_loss": -6.328564167022705, "global_step": 103425, "epoch": 2462} {"train_loss": -6.344045639038086, "global_step": 103426, "epoch": 2462} {"train_loss": -6.405216693878174, "global_step": 103427, "epoch": 2462} {"train_loss": -6.311047554016113, "global_step": 103428, "epoch": 2462} {"train_loss": -6.388609886169434, "global_step": 103429, "epoch": 2462} {"train_loss": -6.323562145233154, "global_step": 103430, "epoch": 2462} {"train_loss": -6.457187175750732, "global_step": 103431, "epoch": 2462} {"train_loss": -6.398563385009766, "global_step": 103432, "epoch": 2462} {"train_loss": -6.275341510772705, "global_step": 103433, "epoch": 2462} {"train_loss": -6.268341064453125, "global_step": 103434, "epoch": 2462} {"train_loss": -6.325651168823242, "global_step": 103435, "epoch": 2462} {"train_loss": -6.433290958404541, "global_step": 103436, "epoch": 2462} {"train_loss": -6.212497711181641, "global_step": 103437, "epoch": 2462} {"train_loss": -6.514420509338379, "global_step": 103438, "epoch": 2462} {"train_loss": -6.098959922790527, "global_step": 103439, "epoch": 2462} {"train_loss": -6.35845947265625, "global_step": 103440, "epoch": 2462} {"train_loss": -6.419178485870361, "global_step": 103441, "epoch": 2462} {"train_loss": -6.295413017272949, "global_step": 103442, "epoch": 2462} {"train_loss": -6.4110846519470215, "global_step": 103443, "epoch": 2462} {"train_loss": -6.394092559814453, "global_step": 103444, "epoch": 2462} {"train_loss": -6.386773245675223, "global_step": 103445, "epoch": 2462, "val_loss": 64471.81640625} {"train_loss": -6.391823768615723, "global_step": 103446, "epoch": 2463} {"train_loss": -6.459720611572266, "global_step": 103447, "epoch": 2463} {"train_loss": -6.462829113006592, "global_step": 103448, "epoch": 2463} {"train_loss": -6.443395614624023, "global_step": 103449, "epoch": 2463} {"train_loss": -6.298045635223389, "global_step": 103450, "epoch": 2463} {"train_loss": -6.4743242263793945, "global_step": 103451, "epoch": 2463} {"train_loss": -6.483877658843994, "global_step": 103452, "epoch": 2463} {"train_loss": -6.46865177154541, "global_step": 103453, "epoch": 2463} {"train_loss": -6.378856182098389, "global_step": 103454, "epoch": 2463} {"train_loss": -6.3968329429626465, "global_step": 103455, "epoch": 2463} {"train_loss": -6.394883632659912, "global_step": 103456, "epoch": 2463} {"train_loss": -6.478076934814453, "global_step": 103457, "epoch": 2463} {"train_loss": -6.307989597320557, "global_step": 103458, "epoch": 2463} {"train_loss": -6.387581825256348, "global_step": 103459, "epoch": 2463} {"train_loss": -6.356878280639648, "global_step": 103460, "epoch": 2463} {"train_loss": -6.233522891998291, "global_step": 103461, "epoch": 2463} {"train_loss": -6.36016845703125, "global_step": 103462, "epoch": 2463} {"train_loss": -6.426204681396484, "global_step": 103463, "epoch": 2463} {"train_loss": -6.459957122802734, "global_step": 103464, "epoch": 2463} {"train_loss": -6.372713088989258, "global_step": 103465, "epoch": 2463} {"train_loss": -6.473989486694336, "global_step": 103466, "epoch": 2463} {"train_loss": -6.473529815673828, "global_step": 103467, "epoch": 2463} {"train_loss": -6.404871463775635, "global_step": 103468, "epoch": 2463} {"train_loss": -6.247147560119629, "global_step": 103469, "epoch": 2463} {"train_loss": -6.398950576782227, "global_step": 103470, "epoch": 2463} {"train_loss": -6.285815715789795, "global_step": 103471, "epoch": 2463} {"train_loss": -6.422911643981934, "global_step": 103472, "epoch": 2463} {"train_loss": -6.359170913696289, "global_step": 103473, "epoch": 2463} {"train_loss": -6.358406066894531, "global_step": 103474, "epoch": 2463} {"train_loss": -6.48796272277832, "global_step": 103475, "epoch": 2463} {"train_loss": -6.382062911987305, "global_step": 103476, "epoch": 2463} {"train_loss": -6.370586395263672, "global_step": 103477, "epoch": 2463} {"train_loss": -6.348878383636475, "global_step": 103478, "epoch": 2463} {"train_loss": -6.39222526550293, "global_step": 103479, "epoch": 2463} {"train_loss": -6.42610502243042, "global_step": 103480, "epoch": 2463} {"train_loss": -6.2345709800720215, "global_step": 103481, "epoch": 2463} {"train_loss": -6.386103630065918, "global_step": 103482, "epoch": 2463} {"train_loss": -6.37954044342041, "global_step": 103483, "epoch": 2463} {"train_loss": -6.461265563964844, "global_step": 103484, "epoch": 2463} {"train_loss": -6.385675430297852, "global_step": 103485, "epoch": 2463} {"train_loss": -6.344762802124023, "global_step": 103486, "epoch": 2463} {"train_loss": -6.393507753099714, "global_step": 103487, "epoch": 2463, "val_loss": 64536.7109375} {"train_loss": -6.407277584075928, "global_step": 103488, "epoch": 2464} {"train_loss": -6.415433883666992, "global_step": 103489, "epoch": 2464} {"train_loss": -6.385488033294678, "global_step": 103490, "epoch": 2464} {"train_loss": -6.371110439300537, "global_step": 103491, "epoch": 2464} {"train_loss": -6.331387519836426, "global_step": 103492, "epoch": 2464} {"train_loss": -6.36573600769043, "global_step": 103493, "epoch": 2464} {"train_loss": -6.3410234451293945, "global_step": 103494, "epoch": 2464} {"train_loss": -6.414073944091797, "global_step": 103495, "epoch": 2464} {"train_loss": -6.4087724685668945, "global_step": 103496, "epoch": 2464} {"train_loss": -6.369314193725586, "global_step": 103497, "epoch": 2464} {"train_loss": -6.4616289138793945, "global_step": 103498, "epoch": 2464} {"train_loss": -6.395138263702393, "global_step": 103499, "epoch": 2464} {"train_loss": -6.498377799987793, "global_step": 103500, "epoch": 2464} {"train_loss": -6.311421871185303, "global_step": 103501, "epoch": 2464} {"train_loss": -6.453590393066406, "global_step": 103502, "epoch": 2464} {"train_loss": -6.271076202392578, "global_step": 103503, "epoch": 2464} {"train_loss": -6.38477897644043, "global_step": 103504, "epoch": 2464} {"train_loss": -6.376850128173828, "global_step": 103505, "epoch": 2464} {"train_loss": -6.2689127922058105, "global_step": 103506, "epoch": 2464} {"train_loss": -6.412239074707031, "global_step": 103507, "epoch": 2464} {"train_loss": -6.424833297729492, "global_step": 103508, "epoch": 2464} {"train_loss": -6.341461181640625, "global_step": 103509, "epoch": 2464} {"train_loss": -6.331573486328125, "global_step": 103510, "epoch": 2464} {"train_loss": -6.508344650268555, "global_step": 103511, "epoch": 2464} {"train_loss": -6.318181991577148, "global_step": 103512, "epoch": 2464} {"train_loss": -6.351645469665527, "global_step": 103513, "epoch": 2464} {"train_loss": -6.253293037414551, "global_step": 103514, "epoch": 2464} {"train_loss": -6.401638031005859, "global_step": 103515, "epoch": 2464} {"train_loss": -6.46571159362793, "global_step": 103516, "epoch": 2464} {"train_loss": -6.348175048828125, "global_step": 103517, "epoch": 2464} {"train_loss": -6.325349807739258, "global_step": 103518, "epoch": 2464} {"train_loss": -6.427510738372803, "global_step": 103519, "epoch": 2464} {"train_loss": -6.466571807861328, "global_step": 103520, "epoch": 2464} {"train_loss": -6.370762348175049, "global_step": 103521, "epoch": 2464} {"train_loss": -6.426743507385254, "global_step": 103522, "epoch": 2464} {"train_loss": -6.390861511230469, "global_step": 103523, "epoch": 2464} {"train_loss": -6.474875450134277, "global_step": 103524, "epoch": 2464} {"train_loss": -6.395368576049805, "global_step": 103525, "epoch": 2464} {"train_loss": -6.3890380859375, "global_step": 103526, "epoch": 2464} {"train_loss": -6.42012357711792, "global_step": 103527, "epoch": 2464} {"train_loss": -6.347317218780518, "global_step": 103528, "epoch": 2464} {"train_loss": -6.389240923381987, "global_step": 103529, "epoch": 2464, "val_loss": 64638.65234375} {"train_loss": -6.466450214385986, "global_step": 103530, "epoch": 2465} {"train_loss": -6.555647373199463, "global_step": 103531, "epoch": 2465} {"train_loss": -6.566684246063232, "global_step": 103532, "epoch": 2465} {"train_loss": -6.4126129150390625, "global_step": 103533, "epoch": 2465} {"train_loss": -6.367588520050049, "global_step": 103534, "epoch": 2465} {"train_loss": -6.3736572265625, "global_step": 103535, "epoch": 2465} {"train_loss": -6.580559253692627, "global_step": 103536, "epoch": 2465} {"train_loss": -6.45318078994751, "global_step": 103537, "epoch": 2465} {"train_loss": -6.442748069763184, "global_step": 103538, "epoch": 2465} {"train_loss": -6.546664237976074, "global_step": 103539, "epoch": 2465} {"train_loss": -6.458036422729492, "global_step": 103540, "epoch": 2465} {"train_loss": -6.518162250518799, "global_step": 103541, "epoch": 2465} {"train_loss": -6.430985450744629, "global_step": 103542, "epoch": 2465} {"train_loss": -6.477095127105713, "global_step": 103543, "epoch": 2465} {"train_loss": -6.395511150360107, "global_step": 103544, "epoch": 2465} {"train_loss": -6.3789262771606445, "global_step": 103545, "epoch": 2465} {"train_loss": -6.414109230041504, "global_step": 103546, "epoch": 2465} {"train_loss": -6.383523464202881, "global_step": 103547, "epoch": 2465} {"train_loss": -6.439697742462158, "global_step": 103548, "epoch": 2465} {"train_loss": -6.459792137145996, "global_step": 103549, "epoch": 2465} {"train_loss": -6.423585891723633, "global_step": 103550, "epoch": 2465} {"train_loss": -6.434447288513184, "global_step": 103551, "epoch": 2465} {"train_loss": -6.332235336303711, "global_step": 103552, "epoch": 2465} {"train_loss": -6.484729766845703, "global_step": 103553, "epoch": 2465} {"train_loss": -6.4845051765441895, "global_step": 103554, "epoch": 2465} {"train_loss": -6.390862464904785, "global_step": 103555, "epoch": 2465} {"train_loss": -6.4293646812438965, "global_step": 103556, "epoch": 2465} {"train_loss": -6.580535888671875, "global_step": 103557, "epoch": 2465} {"train_loss": -6.423552989959717, "global_step": 103558, "epoch": 2465} {"train_loss": -6.367009162902832, "global_step": 103559, "epoch": 2465} {"train_loss": -6.428264141082764, "global_step": 103560, "epoch": 2465} {"train_loss": -6.348135948181152, "global_step": 103561, "epoch": 2465} {"train_loss": -6.330119609832764, "global_step": 103562, "epoch": 2465} {"train_loss": -6.3818864822387695, "global_step": 103563, "epoch": 2465} {"train_loss": -6.4172210693359375, "global_step": 103564, "epoch": 2465} {"train_loss": -6.388397216796875, "global_step": 103565, "epoch": 2465} {"train_loss": -6.480903148651123, "global_step": 103566, "epoch": 2465} {"train_loss": -6.310047149658203, "global_step": 103567, "epoch": 2465} {"train_loss": -6.326826572418213, "global_step": 103568, "epoch": 2465} {"train_loss": -6.352089881896973, "global_step": 103569, "epoch": 2465} {"train_loss": -6.35697078704834, "global_step": 103570, "epoch": 2465} {"train_loss": -6.422802686691284, "global_step": 103571, "epoch": 2465, "val_loss": 64683.4765625} {"train_loss": -6.398869514465332, "global_step": 103572, "epoch": 2466} {"train_loss": -6.174862861633301, "global_step": 103573, "epoch": 2466} {"train_loss": -6.2196149826049805, "global_step": 103574, "epoch": 2466} {"train_loss": -6.329891204833984, "global_step": 103575, "epoch": 2466} {"train_loss": -6.324333190917969, "global_step": 103576, "epoch": 2466} {"train_loss": -6.122453689575195, "global_step": 103577, "epoch": 2466} {"train_loss": -6.103863716125488, "global_step": 103578, "epoch": 2466} {"train_loss": -6.182985305786133, "global_step": 103579, "epoch": 2466} {"train_loss": -6.247902870178223, "global_step": 103580, "epoch": 2466} {"train_loss": -6.183525562286377, "global_step": 103581, "epoch": 2466} {"train_loss": -6.323624610900879, "global_step": 103582, "epoch": 2466} {"train_loss": -6.291285991668701, "global_step": 103583, "epoch": 2466} {"train_loss": -6.289979934692383, "global_step": 103584, "epoch": 2466} {"train_loss": -6.110774993896484, "global_step": 103585, "epoch": 2466} {"train_loss": -6.28696870803833, "global_step": 103586, "epoch": 2466} {"train_loss": -6.245614051818848, "global_step": 103587, "epoch": 2466} {"train_loss": -6.294343948364258, "global_step": 103588, "epoch": 2466} {"train_loss": -6.2333292961120605, "global_step": 103589, "epoch": 2466} {"train_loss": -6.3913445472717285, "global_step": 103590, "epoch": 2466} {"train_loss": -6.339885711669922, "global_step": 103591, "epoch": 2466} {"train_loss": -6.391794204711914, "global_step": 103592, "epoch": 2466} {"train_loss": -6.316318511962891, "global_step": 103593, "epoch": 2466} {"train_loss": -6.355208873748779, "global_step": 103594, "epoch": 2466} {"train_loss": -6.392180442810059, "global_step": 103595, "epoch": 2466} {"train_loss": -6.2464823722839355, "global_step": 103596, "epoch": 2466} {"train_loss": -6.427119255065918, "global_step": 103597, "epoch": 2466} {"train_loss": -6.28914737701416, "global_step": 103598, "epoch": 2466} {"train_loss": -6.399955749511719, "global_step": 103599, "epoch": 2466} {"train_loss": -6.396679401397705, "global_step": 103600, "epoch": 2466} {"train_loss": -6.374256610870361, "global_step": 103601, "epoch": 2466} {"train_loss": -6.437148571014404, "global_step": 103602, "epoch": 2466} {"train_loss": -6.276139259338379, "global_step": 103603, "epoch": 2466} {"train_loss": -6.360240459442139, "global_step": 103604, "epoch": 2466} {"train_loss": -6.405694961547852, "global_step": 103605, "epoch": 2466} {"train_loss": -6.331270217895508, "global_step": 103606, "epoch": 2466} {"train_loss": -6.344690322875977, "global_step": 103607, "epoch": 2466} {"train_loss": -6.404335975646973, "global_step": 103608, "epoch": 2466} {"train_loss": -6.349678039550781, "global_step": 103609, "epoch": 2466} {"train_loss": -6.355107307434082, "global_step": 103610, "epoch": 2466} {"train_loss": -6.3422746658325195, "global_step": 103611, "epoch": 2466} {"train_loss": -6.262765407562256, "global_step": 103612, "epoch": 2466} {"train_loss": -6.309397038959322, "global_step": 103613, "epoch": 2466, "val_loss": 64661.57421875} {"train_loss": -6.429757118225098, "global_step": 103614, "epoch": 2467} {"train_loss": -6.239785194396973, "global_step": 103615, "epoch": 2467} {"train_loss": -6.346329212188721, "global_step": 103616, "epoch": 2467} {"train_loss": -6.320389747619629, "global_step": 103617, "epoch": 2467} {"train_loss": -6.374994277954102, "global_step": 103618, "epoch": 2467} {"train_loss": -6.271361351013184, "global_step": 103619, "epoch": 2467} {"train_loss": -6.39854621887207, "global_step": 103620, "epoch": 2467} {"train_loss": -6.342503547668457, "global_step": 103621, "epoch": 2467} {"train_loss": -6.376681327819824, "global_step": 103622, "epoch": 2467} {"train_loss": -6.332250595092773, "global_step": 103623, "epoch": 2467} {"train_loss": -6.327909469604492, "global_step": 103624, "epoch": 2467} {"train_loss": -6.3891143798828125, "global_step": 103625, "epoch": 2467} {"train_loss": -6.4077911376953125, "global_step": 103626, "epoch": 2467} {"train_loss": -6.41059684753418, "global_step": 103627, "epoch": 2467} {"train_loss": -6.383250713348389, "global_step": 103628, "epoch": 2467} {"train_loss": -6.418816566467285, "global_step": 103629, "epoch": 2467} {"train_loss": -6.386407375335693, "global_step": 103630, "epoch": 2467} {"train_loss": -6.445887565612793, "global_step": 103631, "epoch": 2467} {"train_loss": -6.311650276184082, "global_step": 103632, "epoch": 2467} {"train_loss": -6.269804000854492, "global_step": 103633, "epoch": 2467} {"train_loss": -6.441493988037109, "global_step": 103634, "epoch": 2467} {"train_loss": -6.4333672523498535, "global_step": 103635, "epoch": 2467} {"train_loss": -6.359331130981445, "global_step": 103636, "epoch": 2467} {"train_loss": -6.413015365600586, "global_step": 103637, "epoch": 2467} {"train_loss": -6.37840461730957, "global_step": 103638, "epoch": 2467} {"train_loss": -6.4778828620910645, "global_step": 103639, "epoch": 2467} {"train_loss": -6.362490653991699, "global_step": 103640, "epoch": 2467} {"train_loss": -6.2692179679870605, "global_step": 103641, "epoch": 2467} {"train_loss": -6.411123275756836, "global_step": 103642, "epoch": 2467} {"train_loss": -6.303902626037598, "global_step": 103643, "epoch": 2467} {"train_loss": -6.251096248626709, "global_step": 103644, "epoch": 2467} {"train_loss": -6.3175506591796875, "global_step": 103645, "epoch": 2467} {"train_loss": -6.3175835609436035, "global_step": 103646, "epoch": 2467} {"train_loss": -6.381128787994385, "global_step": 103647, "epoch": 2467} {"train_loss": -6.407632827758789, "global_step": 103648, "epoch": 2467} {"train_loss": -6.452598571777344, "global_step": 103649, "epoch": 2467} {"train_loss": -6.451801776885986, "global_step": 103650, "epoch": 2467} {"train_loss": -6.441640853881836, "global_step": 103651, "epoch": 2467} {"train_loss": -6.417198181152344, "global_step": 103652, "epoch": 2467} {"train_loss": -6.473297119140625, "global_step": 103653, "epoch": 2467} {"train_loss": -6.3886284828186035, "global_step": 103654, "epoch": 2467} {"train_loss": -6.374087685630435, "global_step": 103655, "epoch": 2467, "val_loss": 64391.7421875} {"train_loss": -6.407109260559082, "global_step": 103656, "epoch": 2468} {"train_loss": -6.490893840789795, "global_step": 103657, "epoch": 2468} {"train_loss": -6.301724433898926, "global_step": 103658, "epoch": 2468} {"train_loss": -6.449936866760254, "global_step": 103659, "epoch": 2468} {"train_loss": -6.428808212280273, "global_step": 103660, "epoch": 2468} {"train_loss": -6.416287899017334, "global_step": 103661, "epoch": 2468} {"train_loss": -6.536785125732422, "global_step": 103662, "epoch": 2468} {"train_loss": -6.423098564147949, "global_step": 103663, "epoch": 2468} {"train_loss": -6.414189338684082, "global_step": 103664, "epoch": 2468} {"train_loss": -6.383969306945801, "global_step": 103665, "epoch": 2468} {"train_loss": -6.379555702209473, "global_step": 103666, "epoch": 2468} {"train_loss": -6.4303812980651855, "global_step": 103667, "epoch": 2468} {"train_loss": -6.514796733856201, "global_step": 103668, "epoch": 2468} {"train_loss": -6.302387714385986, "global_step": 103669, "epoch": 2468} {"train_loss": -6.3777031898498535, "global_step": 103670, "epoch": 2468} {"train_loss": -6.355998516082764, "global_step": 103671, "epoch": 2468} {"train_loss": -6.338055610656738, "global_step": 103672, "epoch": 2468} {"train_loss": -6.413496017456055, "global_step": 103673, "epoch": 2468} {"train_loss": -6.4673614501953125, "global_step": 103674, "epoch": 2468} {"train_loss": -6.510763168334961, "global_step": 103675, "epoch": 2468} {"train_loss": -6.504228591918945, "global_step": 103676, "epoch": 2468} {"train_loss": -6.438333511352539, "global_step": 103677, "epoch": 2468} {"train_loss": -6.4346418380737305, "global_step": 103678, "epoch": 2468} {"train_loss": -6.377708435058594, "global_step": 103679, "epoch": 2468} {"train_loss": -6.35297966003418, "global_step": 103680, "epoch": 2468} {"train_loss": -6.399880409240723, "global_step": 103681, "epoch": 2468} {"train_loss": -6.380795955657959, "global_step": 103682, "epoch": 2468} {"train_loss": -6.501928329467773, "global_step": 103683, "epoch": 2468} {"train_loss": -6.364940643310547, "global_step": 103684, "epoch": 2468} {"train_loss": -6.4541239738464355, "global_step": 103685, "epoch": 2468} {"train_loss": -6.411767959594727, "global_step": 103686, "epoch": 2468} {"train_loss": -6.457610130310059, "global_step": 103687, "epoch": 2468} {"train_loss": -6.490944862365723, "global_step": 103688, "epoch": 2468} {"train_loss": -6.414017677307129, "global_step": 103689, "epoch": 2468} {"train_loss": -6.579409599304199, "global_step": 103690, "epoch": 2468} {"train_loss": -6.536330223083496, "global_step": 103691, "epoch": 2468} {"train_loss": -6.477671146392822, "global_step": 103692, "epoch": 2468} {"train_loss": -6.362333297729492, "global_step": 103693, "epoch": 2468} {"train_loss": -6.470550537109375, "global_step": 103694, "epoch": 2468} {"train_loss": -6.476941108703613, "global_step": 103695, "epoch": 2468} {"train_loss": -6.480633735656738, "global_step": 103696, "epoch": 2468} {"train_loss": -6.4338918299902055, "global_step": 103697, "epoch": 2468, "val_loss": 64365.79296875} {"train_loss": -6.451735496520996, "global_step": 103698, "epoch": 2469} {"train_loss": -6.382594585418701, "global_step": 103699, "epoch": 2469} {"train_loss": -6.405040740966797, "global_step": 103700, "epoch": 2469} {"train_loss": -6.536563396453857, "global_step": 103701, "epoch": 2469} {"train_loss": -6.45731258392334, "global_step": 103702, "epoch": 2469} {"train_loss": -6.354216575622559, "global_step": 103703, "epoch": 2469} {"train_loss": -6.435314178466797, "global_step": 103704, "epoch": 2469} {"train_loss": -6.386045932769775, "global_step": 103705, "epoch": 2469} {"train_loss": -6.393720626831055, "global_step": 103706, "epoch": 2469} {"train_loss": -6.598393440246582, "global_step": 103707, "epoch": 2469} {"train_loss": -6.4341278076171875, "global_step": 103708, "epoch": 2469} {"train_loss": -6.525943279266357, "global_step": 103709, "epoch": 2469} {"train_loss": -6.464098930358887, "global_step": 103710, "epoch": 2469} {"train_loss": -6.409409523010254, "global_step": 103711, "epoch": 2469} {"train_loss": -6.468142509460449, "global_step": 103712, "epoch": 2469} {"train_loss": -6.568514347076416, "global_step": 103713, "epoch": 2469} {"train_loss": -6.4270219802856445, "global_step": 103714, "epoch": 2469} {"train_loss": -6.509067058563232, "global_step": 103715, "epoch": 2469} {"train_loss": -6.494986057281494, "global_step": 103716, "epoch": 2469} {"train_loss": -6.47857666015625, "global_step": 103717, "epoch": 2469} {"train_loss": -6.445066928863525, "global_step": 103718, "epoch": 2469} {"train_loss": -6.40132999420166, "global_step": 103719, "epoch": 2469} {"train_loss": -6.460768699645996, "global_step": 103720, "epoch": 2469} {"train_loss": -6.397739410400391, "global_step": 103721, "epoch": 2469} {"train_loss": -6.386577129364014, "global_step": 103722, "epoch": 2469} {"train_loss": -6.321675777435303, "global_step": 103723, "epoch": 2469} {"train_loss": -6.379976272583008, "global_step": 103724, "epoch": 2469} {"train_loss": -6.402207851409912, "global_step": 103725, "epoch": 2469} {"train_loss": -6.34355354309082, "global_step": 103726, "epoch": 2469} {"train_loss": -6.423444747924805, "global_step": 103727, "epoch": 2469} {"train_loss": -6.244901657104492, "global_step": 103728, "epoch": 2469} {"train_loss": -6.259355545043945, "global_step": 103729, "epoch": 2469} {"train_loss": -6.399777412414551, "global_step": 103730, "epoch": 2469} {"train_loss": -6.340298652648926, "global_step": 103731, "epoch": 2469} {"train_loss": -6.3188581466674805, "global_step": 103732, "epoch": 2469} {"train_loss": -6.311829566955566, "global_step": 103733, "epoch": 2469} {"train_loss": -6.332111358642578, "global_step": 103734, "epoch": 2469} {"train_loss": -6.332764625549316, "global_step": 103735, "epoch": 2469} {"train_loss": -6.245586395263672, "global_step": 103736, "epoch": 2469} {"train_loss": -6.390551567077637, "global_step": 103737, "epoch": 2469} {"train_loss": -6.309348106384277, "global_step": 103738, "epoch": 2469} {"train_loss": -6.405019442240397, "global_step": 103739, "epoch": 2469, "val_loss": 64247.5078125} {"train_loss": -6.437403678894043, "global_step": 103740, "epoch": 2470} {"train_loss": -6.50142240524292, "global_step": 103741, "epoch": 2470} {"train_loss": -6.49341344833374, "global_step": 103742, "epoch": 2470} {"train_loss": -6.453099250793457, "global_step": 103743, "epoch": 2470} {"train_loss": -6.328693866729736, "global_step": 103744, "epoch": 2470} {"train_loss": -6.433196544647217, "global_step": 103745, "epoch": 2470} {"train_loss": -6.275068759918213, "global_step": 103746, "epoch": 2470} {"train_loss": -6.476274013519287, "global_step": 103747, "epoch": 2470} {"train_loss": -6.3996171951293945, "global_step": 103748, "epoch": 2470} {"train_loss": -6.460119247436523, "global_step": 103749, "epoch": 2470} {"train_loss": -6.302684307098389, "global_step": 103750, "epoch": 2470} {"train_loss": -6.399685859680176, "global_step": 103751, "epoch": 2470} {"train_loss": -6.587170600891113, "global_step": 103752, "epoch": 2470} {"train_loss": -6.482048988342285, "global_step": 103753, "epoch": 2470} {"train_loss": -6.487974166870117, "global_step": 103754, "epoch": 2470} {"train_loss": -6.434389114379883, "global_step": 103755, "epoch": 2470} {"train_loss": -6.470276832580566, "global_step": 103756, "epoch": 2470} {"train_loss": -6.332322120666504, "global_step": 103757, "epoch": 2470} {"train_loss": -6.429923057556152, "global_step": 103758, "epoch": 2470} {"train_loss": -6.531775951385498, "global_step": 103759, "epoch": 2470} {"train_loss": -6.542768955230713, "global_step": 103760, "epoch": 2470} {"train_loss": -6.384047031402588, "global_step": 103761, "epoch": 2470} {"train_loss": -6.485121726989746, "global_step": 103762, "epoch": 2470} {"train_loss": -6.378815174102783, "global_step": 103763, "epoch": 2470} {"train_loss": -6.3112382888793945, "global_step": 103764, "epoch": 2470} {"train_loss": -6.462376594543457, "global_step": 103765, "epoch": 2470} {"train_loss": -6.50399112701416, "global_step": 103766, "epoch": 2470} {"train_loss": -6.5400495529174805, "global_step": 103767, "epoch": 2470} {"train_loss": -6.4811320304870605, "global_step": 103768, "epoch": 2470} {"train_loss": -6.383286476135254, "global_step": 103769, "epoch": 2470} {"train_loss": -6.373047351837158, "global_step": 103770, "epoch": 2470} {"train_loss": -6.420071125030518, "global_step": 103771, "epoch": 2470} {"train_loss": -6.343282699584961, "global_step": 103772, "epoch": 2470} {"train_loss": -6.427586555480957, "global_step": 103773, "epoch": 2470} {"train_loss": -6.377322196960449, "global_step": 103774, "epoch": 2470} {"train_loss": -6.4723310470581055, "global_step": 103775, "epoch": 2470} {"train_loss": -6.453981399536133, "global_step": 103776, "epoch": 2470} {"train_loss": -6.3607354164123535, "global_step": 103777, "epoch": 2470} {"train_loss": -6.454381942749023, "global_step": 103778, "epoch": 2470} {"train_loss": -6.261475563049316, "global_step": 103779, "epoch": 2470} {"train_loss": -6.454827308654785, "global_step": 103780, "epoch": 2470} {"train_loss": -6.429793539501372, "global_step": 103781, "epoch": 2470, "val_loss": 64431.6328125} {"train_loss": -6.480525970458984, "global_step": 103782, "epoch": 2471} {"train_loss": -6.442502975463867, "global_step": 103783, "epoch": 2471} {"train_loss": -6.462261199951172, "global_step": 103784, "epoch": 2471} {"train_loss": -6.446772575378418, "global_step": 103785, "epoch": 2471} {"train_loss": -6.462649345397949, "global_step": 103786, "epoch": 2471} {"train_loss": -6.348973274230957, "global_step": 103787, "epoch": 2471} {"train_loss": -6.440264701843262, "global_step": 103788, "epoch": 2471} {"train_loss": -6.467460632324219, "global_step": 103789, "epoch": 2471} {"train_loss": -6.33527946472168, "global_step": 103790, "epoch": 2471} {"train_loss": -6.410701274871826, "global_step": 103791, "epoch": 2471} {"train_loss": -6.414159297943115, "global_step": 103792, "epoch": 2471} {"train_loss": -6.505838871002197, "global_step": 103793, "epoch": 2471} {"train_loss": -6.395808219909668, "global_step": 103794, "epoch": 2471} {"train_loss": -6.436378479003906, "global_step": 103795, "epoch": 2471} {"train_loss": -6.364619731903076, "global_step": 103796, "epoch": 2471} {"train_loss": -6.30637264251709, "global_step": 103797, "epoch": 2471} {"train_loss": -6.331196308135986, "global_step": 103798, "epoch": 2471} {"train_loss": -6.282540321350098, "global_step": 103799, "epoch": 2471} {"train_loss": -6.301769256591797, "global_step": 103800, "epoch": 2471} {"train_loss": -6.393023490905762, "global_step": 103801, "epoch": 2471} {"train_loss": -6.482595443725586, "global_step": 103802, "epoch": 2471} {"train_loss": -6.498252868652344, "global_step": 103803, "epoch": 2471} {"train_loss": -6.399567127227783, "global_step": 103804, "epoch": 2471} {"train_loss": -6.419647216796875, "global_step": 103805, "epoch": 2471} {"train_loss": -6.315878868103027, "global_step": 103806, "epoch": 2471} {"train_loss": -6.443029403686523, "global_step": 103807, "epoch": 2471} {"train_loss": -6.371923446655273, "global_step": 103808, "epoch": 2471} {"train_loss": -6.420222282409668, "global_step": 103809, "epoch": 2471} {"train_loss": -6.417947769165039, "global_step": 103810, "epoch": 2471} {"train_loss": -6.445208549499512, "global_step": 103811, "epoch": 2471} {"train_loss": -6.431802749633789, "global_step": 103812, "epoch": 2471} {"train_loss": -6.432939052581787, "global_step": 103813, "epoch": 2471} {"train_loss": -6.3681721687316895, "global_step": 103814, "epoch": 2471} {"train_loss": -6.350772380828857, "global_step": 103815, "epoch": 2471} {"train_loss": -6.294852256774902, "global_step": 103816, "epoch": 2471} {"train_loss": -6.350149154663086, "global_step": 103817, "epoch": 2471} {"train_loss": -6.296106338500977, "global_step": 103818, "epoch": 2471} {"train_loss": -6.381522178649902, "global_step": 103819, "epoch": 2471} {"train_loss": -6.325827598571777, "global_step": 103820, "epoch": 2471} {"train_loss": -6.297776222229004, "global_step": 103821, "epoch": 2471} {"train_loss": -6.348907947540283, "global_step": 103822, "epoch": 2471} {"train_loss": -6.393533638545445, "global_step": 103823, "epoch": 2471, "val_loss": 64598.96875} {"train_loss": -6.4270477294921875, "global_step": 103824, "epoch": 2472} {"train_loss": -6.473333358764648, "global_step": 103825, "epoch": 2472} {"train_loss": -6.396726131439209, "global_step": 103826, "epoch": 2472} {"train_loss": -6.468722343444824, "global_step": 103827, "epoch": 2472} {"train_loss": -6.273282051086426, "global_step": 103828, "epoch": 2472} {"train_loss": -6.425806045532227, "global_step": 103829, "epoch": 2472} {"train_loss": -6.379916191101074, "global_step": 103830, "epoch": 2472} {"train_loss": -6.459348678588867, "global_step": 103831, "epoch": 2472} {"train_loss": -6.504378318786621, "global_step": 103832, "epoch": 2472} {"train_loss": -6.396145820617676, "global_step": 103833, "epoch": 2472} {"train_loss": -6.441990852355957, "global_step": 103834, "epoch": 2472} {"train_loss": -6.46139669418335, "global_step": 103835, "epoch": 2472} {"train_loss": -6.351751327514648, "global_step": 103836, "epoch": 2472} {"train_loss": -6.411924839019775, "global_step": 103837, "epoch": 2472} {"train_loss": -6.430678367614746, "global_step": 103838, "epoch": 2472} {"train_loss": -6.356372833251953, "global_step": 103839, "epoch": 2472} {"train_loss": -6.441864967346191, "global_step": 103840, "epoch": 2472} {"train_loss": -6.443835258483887, "global_step": 103841, "epoch": 2472} {"train_loss": -6.3758416175842285, "global_step": 103842, "epoch": 2472} {"train_loss": -6.3483123779296875, "global_step": 103843, "epoch": 2472} {"train_loss": -6.549753665924072, "global_step": 103844, "epoch": 2472} {"train_loss": -6.515749931335449, "global_step": 103845, "epoch": 2472} {"train_loss": -6.480803489685059, "global_step": 103846, "epoch": 2472} {"train_loss": -6.477665901184082, "global_step": 103847, "epoch": 2472} {"train_loss": -6.475910186767578, "global_step": 103848, "epoch": 2472} {"train_loss": -6.483470439910889, "global_step": 103849, "epoch": 2472} {"train_loss": -6.33476448059082, "global_step": 103850, "epoch": 2472} {"train_loss": -6.39547061920166, "global_step": 103851, "epoch": 2472} {"train_loss": -6.577635288238525, "global_step": 103852, "epoch": 2472} {"train_loss": -6.444599151611328, "global_step": 103853, "epoch": 2472} {"train_loss": -6.27717399597168, "global_step": 103854, "epoch": 2472} {"train_loss": -6.37167501449585, "global_step": 103855, "epoch": 2472} {"train_loss": -6.373064994812012, "global_step": 103856, "epoch": 2472} {"train_loss": -6.447197914123535, "global_step": 103857, "epoch": 2472} {"train_loss": -6.477508544921875, "global_step": 103858, "epoch": 2472} {"train_loss": -6.358164310455322, "global_step": 103859, "epoch": 2472} {"train_loss": -6.3577117919921875, "global_step": 103860, "epoch": 2472} {"train_loss": -6.437511920928955, "global_step": 103861, "epoch": 2472} {"train_loss": -6.473808765411377, "global_step": 103862, "epoch": 2472} {"train_loss": -6.291328430175781, "global_step": 103863, "epoch": 2472} {"train_loss": -6.359278202056885, "global_step": 103864, "epoch": 2472} {"train_loss": -6.417456059228806, "global_step": 103865, "epoch": 2472, "val_loss": 64586.77734375} {"train_loss": -6.281999111175537, "global_step": 103866, "epoch": 2473} {"train_loss": -6.414552688598633, "global_step": 103867, "epoch": 2473} {"train_loss": -6.436539649963379, "global_step": 103868, "epoch": 2473} {"train_loss": -6.397251129150391, "global_step": 103869, "epoch": 2473} {"train_loss": -6.468851089477539, "global_step": 103870, "epoch": 2473} {"train_loss": -6.436945915222168, "global_step": 103871, "epoch": 2473} {"train_loss": -6.292444229125977, "global_step": 103872, "epoch": 2473} {"train_loss": -6.491125106811523, "global_step": 103873, "epoch": 2473} {"train_loss": -6.416801452636719, "global_step": 103874, "epoch": 2473} {"train_loss": -6.355393409729004, "global_step": 103875, "epoch": 2473} {"train_loss": -6.362971305847168, "global_step": 103876, "epoch": 2473} {"train_loss": -6.403626441955566, "global_step": 103877, "epoch": 2473} {"train_loss": -6.402288436889648, "global_step": 103878, "epoch": 2473} {"train_loss": -6.351258277893066, "global_step": 103879, "epoch": 2473} {"train_loss": -6.362932205200195, "global_step": 103880, "epoch": 2473} {"train_loss": -6.377342224121094, "global_step": 103881, "epoch": 2473} {"train_loss": -6.360296249389648, "global_step": 103882, "epoch": 2473} {"train_loss": -6.503338813781738, "global_step": 103883, "epoch": 2473} {"train_loss": -6.297835350036621, "global_step": 103884, "epoch": 2473} {"train_loss": -6.385617256164551, "global_step": 103885, "epoch": 2473} {"train_loss": -6.297889709472656, "global_step": 103886, "epoch": 2473} {"train_loss": -6.314515113830566, "global_step": 103887, "epoch": 2473} {"train_loss": -6.344718933105469, "global_step": 103888, "epoch": 2473} {"train_loss": -6.411991119384766, "global_step": 103889, "epoch": 2473} {"train_loss": -6.410369873046875, "global_step": 103890, "epoch": 2473} {"train_loss": -6.39730167388916, "global_step": 103891, "epoch": 2473} {"train_loss": -6.440193176269531, "global_step": 103892, "epoch": 2473} {"train_loss": -6.275025367736816, "global_step": 103893, "epoch": 2473} {"train_loss": -6.3993330001831055, "global_step": 103894, "epoch": 2473} {"train_loss": -6.429878234863281, "global_step": 103895, "epoch": 2473} {"train_loss": -6.501467227935791, "global_step": 103896, "epoch": 2473} {"train_loss": -6.459738731384277, "global_step": 103897, "epoch": 2473} {"train_loss": -6.45021915435791, "global_step": 103898, "epoch": 2473} {"train_loss": -6.376400947570801, "global_step": 103899, "epoch": 2473} {"train_loss": -6.4538397789001465, "global_step": 103900, "epoch": 2473} {"train_loss": -6.478428840637207, "global_step": 103901, "epoch": 2473} {"train_loss": -6.318062782287598, "global_step": 103902, "epoch": 2473} {"train_loss": -6.350404739379883, "global_step": 103903, "epoch": 2473} {"train_loss": -6.321913242340088, "global_step": 103904, "epoch": 2473} {"train_loss": -6.398996353149414, "global_step": 103905, "epoch": 2473} {"train_loss": -6.416903495788574, "global_step": 103906, "epoch": 2473} {"train_loss": -6.390628780637469, "global_step": 103907, "epoch": 2473, "val_loss": 64315.0546875} {"train_loss": -6.385438919067383, "global_step": 103908, "epoch": 2474} {"train_loss": -6.4356207847595215, "global_step": 103909, "epoch": 2474} {"train_loss": -6.364948749542236, "global_step": 103910, "epoch": 2474} {"train_loss": -6.410204887390137, "global_step": 103911, "epoch": 2474} {"train_loss": -6.357531547546387, "global_step": 103912, "epoch": 2474} {"train_loss": -6.433340072631836, "global_step": 103913, "epoch": 2474} {"train_loss": -6.368402481079102, "global_step": 103914, "epoch": 2474} {"train_loss": -6.446372032165527, "global_step": 103915, "epoch": 2474} {"train_loss": -6.369083404541016, "global_step": 103916, "epoch": 2474} {"train_loss": -6.391385078430176, "global_step": 103917, "epoch": 2474} {"train_loss": -6.383524417877197, "global_step": 103918, "epoch": 2474} {"train_loss": -6.268171310424805, "global_step": 103919, "epoch": 2474} {"train_loss": -6.337444305419922, "global_step": 103920, "epoch": 2474} {"train_loss": -6.444145679473877, "global_step": 103921, "epoch": 2474} {"train_loss": -6.503549098968506, "global_step": 103922, "epoch": 2474} {"train_loss": -6.308432579040527, "global_step": 103923, "epoch": 2474} {"train_loss": -6.4227495193481445, "global_step": 103924, "epoch": 2474} {"train_loss": -6.399651527404785, "global_step": 103925, "epoch": 2474} {"train_loss": -6.3988037109375, "global_step": 103926, "epoch": 2474} {"train_loss": -6.395317077636719, "global_step": 103927, "epoch": 2474} {"train_loss": -6.396561622619629, "global_step": 103928, "epoch": 2474} {"train_loss": -6.383879661560059, "global_step": 103929, "epoch": 2474} {"train_loss": -6.38992166519165, "global_step": 103930, "epoch": 2474} {"train_loss": -6.478635311126709, "global_step": 103931, "epoch": 2474} {"train_loss": -6.445016860961914, "global_step": 103932, "epoch": 2474} {"train_loss": -6.389212131500244, "global_step": 103933, "epoch": 2474} {"train_loss": -6.455171585083008, "global_step": 103934, "epoch": 2474} {"train_loss": -6.502962589263916, "global_step": 103935, "epoch": 2474} {"train_loss": -6.318513870239258, "global_step": 103936, "epoch": 2474} {"train_loss": -6.486672401428223, "global_step": 103937, "epoch": 2474} {"train_loss": -6.299009323120117, "global_step": 103938, "epoch": 2474} {"train_loss": -6.375812530517578, "global_step": 103939, "epoch": 2474} {"train_loss": -6.37790584564209, "global_step": 103940, "epoch": 2474} {"train_loss": -6.428536415100098, "global_step": 103941, "epoch": 2474} {"train_loss": -6.379337787628174, "global_step": 103942, "epoch": 2474} {"train_loss": -6.300765514373779, "global_step": 103943, "epoch": 2474} {"train_loss": -6.362811088562012, "global_step": 103944, "epoch": 2474} {"train_loss": -6.4307861328125, "global_step": 103945, "epoch": 2474} {"train_loss": -6.332094192504883, "global_step": 103946, "epoch": 2474} {"train_loss": -6.299498558044434, "global_step": 103947, "epoch": 2474} {"train_loss": -6.440218448638916, "global_step": 103948, "epoch": 2474} {"train_loss": -6.394107943489438, "global_step": 103949, "epoch": 2474, "val_loss": 64424.3046875} {"train_loss": -6.348877429962158, "global_step": 103950, "epoch": 2475} {"train_loss": -6.343913555145264, "global_step": 103951, "epoch": 2475} {"train_loss": -6.467116832733154, "global_step": 103952, "epoch": 2475} {"train_loss": -6.532655715942383, "global_step": 103953, "epoch": 2475} {"train_loss": -6.43665885925293, "global_step": 103954, "epoch": 2475} {"train_loss": -6.413764953613281, "global_step": 103955, "epoch": 2475} {"train_loss": -6.461392879486084, "global_step": 103956, "epoch": 2475} {"train_loss": -6.376751899719238, "global_step": 103957, "epoch": 2475} {"train_loss": -6.41893196105957, "global_step": 103958, "epoch": 2475} {"train_loss": -6.525594711303711, "global_step": 103959, "epoch": 2475} {"train_loss": -6.320457458496094, "global_step": 103960, "epoch": 2475} {"train_loss": -6.3123602867126465, "global_step": 103961, "epoch": 2475} {"train_loss": -6.282036781311035, "global_step": 103962, "epoch": 2475} {"train_loss": -6.518723487854004, "global_step": 103963, "epoch": 2475} {"train_loss": -6.445978164672852, "global_step": 103964, "epoch": 2475} {"train_loss": -6.434244632720947, "global_step": 103965, "epoch": 2475} {"train_loss": -6.399806976318359, "global_step": 103966, "epoch": 2475} {"train_loss": -6.400045394897461, "global_step": 103967, "epoch": 2475} {"train_loss": -6.403775691986084, "global_step": 103968, "epoch": 2475} {"train_loss": -6.4591755867004395, "global_step": 103969, "epoch": 2475} {"train_loss": -6.479434013366699, "global_step": 103970, "epoch": 2475} {"train_loss": -6.430364608764648, "global_step": 103971, "epoch": 2475} {"train_loss": -6.254428863525391, "global_step": 103972, "epoch": 2475} {"train_loss": -6.4111433029174805, "global_step": 103973, "epoch": 2475} {"train_loss": -6.4937639236450195, "global_step": 103974, "epoch": 2475} {"train_loss": -6.610270023345947, "global_step": 103975, "epoch": 2475} {"train_loss": -6.454794406890869, "global_step": 103976, "epoch": 2475} {"train_loss": -6.486868381500244, "global_step": 103977, "epoch": 2475} {"train_loss": -6.314400672912598, "global_step": 103978, "epoch": 2475} {"train_loss": -6.4216156005859375, "global_step": 103979, "epoch": 2475} {"train_loss": -6.378628730773926, "global_step": 103980, "epoch": 2475} {"train_loss": -6.230792999267578, "global_step": 103981, "epoch": 2475} {"train_loss": -6.400974273681641, "global_step": 103982, "epoch": 2475} {"train_loss": -6.353937149047852, "global_step": 103983, "epoch": 2475} {"train_loss": -6.229918479919434, "global_step": 103984, "epoch": 2475} {"train_loss": -6.402408599853516, "global_step": 103985, "epoch": 2475} {"train_loss": -6.335472583770752, "global_step": 103986, "epoch": 2475} {"train_loss": -6.362423896789551, "global_step": 103987, "epoch": 2475} {"train_loss": -6.467164993286133, "global_step": 103988, "epoch": 2475} {"train_loss": -6.352578163146973, "global_step": 103989, "epoch": 2475} {"train_loss": -6.373413562774658, "global_step": 103990, "epoch": 2475} {"train_loss": -6.4028759343283514, "global_step": 103991, "epoch": 2475, "val_loss": 64328.83203125} {"train_loss": -6.4389848709106445, "global_step": 103992, "epoch": 2476} {"train_loss": -6.46807336807251, "global_step": 103993, "epoch": 2476} {"train_loss": -6.47900915145874, "global_step": 103994, "epoch": 2476} {"train_loss": -6.346559524536133, "global_step": 103995, "epoch": 2476} {"train_loss": -6.415632247924805, "global_step": 103996, "epoch": 2476} {"train_loss": -6.372931480407715, "global_step": 103997, "epoch": 2476} {"train_loss": -6.456569194793701, "global_step": 103998, "epoch": 2476} {"train_loss": -6.521360874176025, "global_step": 103999, "epoch": 2476} {"train_loss": -6.506467819213867, "global_step": 104000, "epoch": 2476} {"train_loss": -6.418735504150391, "global_step": 104001, "epoch": 2476} {"train_loss": -6.494997978210449, "global_step": 104002, "epoch": 2476} {"train_loss": -6.394822120666504, "global_step": 104003, "epoch": 2476} {"train_loss": -6.417932987213135, "global_step": 104004, "epoch": 2476} {"train_loss": -6.482165813446045, "global_step": 104005, "epoch": 2476} {"train_loss": -6.348814964294434, "global_step": 104006, "epoch": 2476} {"train_loss": -6.381876468658447, "global_step": 104007, "epoch": 2476} {"train_loss": -6.470005989074707, "global_step": 104008, "epoch": 2476} {"train_loss": -6.330680847167969, "global_step": 104009, "epoch": 2476} {"train_loss": -6.445583820343018, "global_step": 104010, "epoch": 2476} {"train_loss": -6.396735191345215, "global_step": 104011, "epoch": 2476} {"train_loss": -6.38308048248291, "global_step": 104012, "epoch": 2476} {"train_loss": -6.470524787902832, "global_step": 104013, "epoch": 2476} {"train_loss": -6.395002365112305, "global_step": 104014, "epoch": 2476} {"train_loss": -6.360646724700928, "global_step": 104015, "epoch": 2476} {"train_loss": -6.375730991363525, "global_step": 104016, "epoch": 2476} {"train_loss": -6.344237804412842, "global_step": 104017, "epoch": 2476} {"train_loss": -6.485915660858154, "global_step": 104018, "epoch": 2476} {"train_loss": -6.40203857421875, "global_step": 104019, "epoch": 2476} {"train_loss": -6.37407112121582, "global_step": 104020, "epoch": 2476} {"train_loss": -6.447755813598633, "global_step": 104021, "epoch": 2476} {"train_loss": -6.433208465576172, "global_step": 104022, "epoch": 2476} {"train_loss": -6.465792179107666, "global_step": 104023, "epoch": 2476} {"train_loss": -6.399709701538086, "global_step": 104024, "epoch": 2476} {"train_loss": -6.371339321136475, "global_step": 104025, "epoch": 2476} {"train_loss": -6.410130023956299, "global_step": 104026, "epoch": 2476} {"train_loss": -6.38131046295166, "global_step": 104027, "epoch": 2476} {"train_loss": -6.464687824249268, "global_step": 104028, "epoch": 2476} {"train_loss": -6.498902320861816, "global_step": 104029, "epoch": 2476} {"train_loss": -6.3361430168151855, "global_step": 104030, "epoch": 2476} {"train_loss": -6.3399810791015625, "global_step": 104031, "epoch": 2476} {"train_loss": -6.413402557373047, "global_step": 104032, "epoch": 2476} {"train_loss": -6.414224942525228, "global_step": 104033, "epoch": 2476, "val_loss": 64363.12890625} {"train_loss": -6.407990455627441, "global_step": 104034, "epoch": 2477} {"train_loss": -6.309348106384277, "global_step": 104035, "epoch": 2477} {"train_loss": -6.413435459136963, "global_step": 104036, "epoch": 2477} {"train_loss": -6.473782539367676, "global_step": 104037, "epoch": 2477} {"train_loss": -6.3097639083862305, "global_step": 104038, "epoch": 2477} {"train_loss": -6.3857502937316895, "global_step": 104039, "epoch": 2477} {"train_loss": -6.388083457946777, "global_step": 104040, "epoch": 2477} {"train_loss": -6.445921897888184, "global_step": 104041, "epoch": 2477} {"train_loss": -6.410329341888428, "global_step": 104042, "epoch": 2477} {"train_loss": -6.363109111785889, "global_step": 104043, "epoch": 2477} {"train_loss": -6.261111259460449, "global_step": 104044, "epoch": 2477} {"train_loss": -6.301294326782227, "global_step": 104045, "epoch": 2477} {"train_loss": -6.489975452423096, "global_step": 104046, "epoch": 2477} {"train_loss": -6.4603376388549805, "global_step": 104047, "epoch": 2477} {"train_loss": -6.490257263183594, "global_step": 104048, "epoch": 2477} {"train_loss": -6.41499137878418, "global_step": 104049, "epoch": 2477} {"train_loss": -6.436732292175293, "global_step": 104050, "epoch": 2477} {"train_loss": -6.403223037719727, "global_step": 104051, "epoch": 2477} {"train_loss": -6.386074066162109, "global_step": 104052, "epoch": 2477} {"train_loss": -6.345491409301758, "global_step": 104053, "epoch": 2477} {"train_loss": -6.36452579498291, "global_step": 104054, "epoch": 2477} {"train_loss": -6.407923698425293, "global_step": 104055, "epoch": 2477} {"train_loss": -6.310431003570557, "global_step": 104056, "epoch": 2477} {"train_loss": -6.390810012817383, "global_step": 104057, "epoch": 2477} {"train_loss": -6.446846008300781, "global_step": 104058, "epoch": 2477} {"train_loss": -6.314939022064209, "global_step": 104059, "epoch": 2477} {"train_loss": -6.459084510803223, "global_step": 104060, "epoch": 2477} {"train_loss": -6.438366413116455, "global_step": 104061, "epoch": 2477} {"train_loss": -6.451564788818359, "global_step": 104062, "epoch": 2477} {"train_loss": -6.335855484008789, "global_step": 104063, "epoch": 2477} {"train_loss": -6.459881782531738, "global_step": 104064, "epoch": 2477} {"train_loss": -6.244966983795166, "global_step": 104065, "epoch": 2477} {"train_loss": -6.409726619720459, "global_step": 104066, "epoch": 2477} {"train_loss": -6.250901222229004, "global_step": 104067, "epoch": 2477} {"train_loss": -6.39925479888916, "global_step": 104068, "epoch": 2477} {"train_loss": -6.402570724487305, "global_step": 104069, "epoch": 2477} {"train_loss": -6.425979137420654, "global_step": 104070, "epoch": 2477} {"train_loss": -6.457489013671875, "global_step": 104071, "epoch": 2477} {"train_loss": -6.406402587890625, "global_step": 104072, "epoch": 2477} {"train_loss": -6.292000770568848, "global_step": 104073, "epoch": 2477} {"train_loss": -6.559287071228027, "global_step": 104074, "epoch": 2477} {"train_loss": -6.388733682178316, "global_step": 104075, "epoch": 2477, "val_loss": 64444.7109375} {"train_loss": -6.4414825439453125, "global_step": 104076, "epoch": 2478} {"train_loss": -6.4757184982299805, "global_step": 104077, "epoch": 2478} {"train_loss": -6.43975830078125, "global_step": 104078, "epoch": 2478} {"train_loss": -6.468083381652832, "global_step": 104079, "epoch": 2478} {"train_loss": -6.300739288330078, "global_step": 104080, "epoch": 2478} {"train_loss": -6.443852424621582, "global_step": 104081, "epoch": 2478} {"train_loss": -6.333388805389404, "global_step": 104082, "epoch": 2478} {"train_loss": -6.401737213134766, "global_step": 104083, "epoch": 2478} {"train_loss": -6.371977806091309, "global_step": 104084, "epoch": 2478} {"train_loss": -6.394041061401367, "global_step": 104085, "epoch": 2478} {"train_loss": -6.423642158508301, "global_step": 104086, "epoch": 2478} {"train_loss": -6.313180923461914, "global_step": 104087, "epoch": 2478} {"train_loss": -6.467035293579102, "global_step": 104088, "epoch": 2478} {"train_loss": -6.360343933105469, "global_step": 104089, "epoch": 2478} {"train_loss": -6.419008255004883, "global_step": 104090, "epoch": 2478} {"train_loss": -6.455295085906982, "global_step": 104091, "epoch": 2478} {"train_loss": -6.416877746582031, "global_step": 104092, "epoch": 2478} {"train_loss": -6.376750946044922, "global_step": 104093, "epoch": 2478} {"train_loss": -6.435573577880859, "global_step": 104094, "epoch": 2478} {"train_loss": -6.432289123535156, "global_step": 104095, "epoch": 2478} {"train_loss": -6.451066493988037, "global_step": 104096, "epoch": 2478} {"train_loss": -6.398758888244629, "global_step": 104097, "epoch": 2478} {"train_loss": -6.427866458892822, "global_step": 104098, "epoch": 2478} {"train_loss": -6.397366523742676, "global_step": 104099, "epoch": 2478} {"train_loss": -6.415327072143555, "global_step": 104100, "epoch": 2478} {"train_loss": -6.459339141845703, "global_step": 104101, "epoch": 2478} {"train_loss": -6.2966413497924805, "global_step": 104102, "epoch": 2478} {"train_loss": -6.520181179046631, "global_step": 104103, "epoch": 2478} {"train_loss": -6.497864246368408, "global_step": 104104, "epoch": 2478} {"train_loss": -6.402345657348633, "global_step": 104105, "epoch": 2478} {"train_loss": -6.586198806762695, "global_step": 104106, "epoch": 2478} {"train_loss": -6.504434585571289, "global_step": 104107, "epoch": 2478} {"train_loss": -6.4841179847717285, "global_step": 104108, "epoch": 2478} {"train_loss": -6.35504674911499, "global_step": 104109, "epoch": 2478} {"train_loss": -6.413299560546875, "global_step": 104110, "epoch": 2478} {"train_loss": -6.388293266296387, "global_step": 104111, "epoch": 2478} {"train_loss": -6.511508941650391, "global_step": 104112, "epoch": 2478} {"train_loss": -6.369369029998779, "global_step": 104113, "epoch": 2478} {"train_loss": -6.416008949279785, "global_step": 104114, "epoch": 2478} {"train_loss": -6.398724555969238, "global_step": 104115, "epoch": 2478} {"train_loss": -6.541995048522949, "global_step": 104116, "epoch": 2478} {"train_loss": -6.424871842066447, "global_step": 104117, "epoch": 2478, "val_loss": 64428.41015625} {"train_loss": -6.527156829833984, "global_step": 104118, "epoch": 2479} {"train_loss": -6.368332862854004, "global_step": 104119, "epoch": 2479} {"train_loss": -6.463053226470947, "global_step": 104120, "epoch": 2479} {"train_loss": -6.522804260253906, "global_step": 104121, "epoch": 2479} {"train_loss": -6.340444087982178, "global_step": 104122, "epoch": 2479} {"train_loss": -6.502967834472656, "global_step": 104123, "epoch": 2479} {"train_loss": -6.461890697479248, "global_step": 104124, "epoch": 2479} {"train_loss": -6.430445194244385, "global_step": 104125, "epoch": 2479} {"train_loss": -6.500105381011963, "global_step": 104126, "epoch": 2479} {"train_loss": -6.370607852935791, "global_step": 104127, "epoch": 2479} {"train_loss": -6.417300701141357, "global_step": 104128, "epoch": 2479} {"train_loss": -6.4982452392578125, "global_step": 104129, "epoch": 2479} {"train_loss": -6.333007335662842, "global_step": 104130, "epoch": 2479} {"train_loss": -6.3808698654174805, "global_step": 104131, "epoch": 2479} {"train_loss": -6.459357261657715, "global_step": 104132, "epoch": 2479} {"train_loss": -6.340950012207031, "global_step": 104133, "epoch": 2479} {"train_loss": -6.3200531005859375, "global_step": 104134, "epoch": 2479} {"train_loss": -6.461935997009277, "global_step": 104135, "epoch": 2479} {"train_loss": -6.337463855743408, "global_step": 104136, "epoch": 2479} {"train_loss": -6.344585418701172, "global_step": 104137, "epoch": 2479} {"train_loss": -6.414491653442383, "global_step": 104138, "epoch": 2479} {"train_loss": -6.337193965911865, "global_step": 104139, "epoch": 2479} {"train_loss": -6.27640962600708, "global_step": 104140, "epoch": 2479} {"train_loss": -6.489512920379639, "global_step": 104141, "epoch": 2479} {"train_loss": -6.288112640380859, "global_step": 104142, "epoch": 2479} {"train_loss": -6.363143444061279, "global_step": 104143, "epoch": 2479} {"train_loss": -6.439188480377197, "global_step": 104144, "epoch": 2479} {"train_loss": -6.225313186645508, "global_step": 104145, "epoch": 2479} {"train_loss": -6.41103458404541, "global_step": 104146, "epoch": 2479} {"train_loss": -6.360060691833496, "global_step": 104147, "epoch": 2479} {"train_loss": -6.450165748596191, "global_step": 104148, "epoch": 2479} {"train_loss": -6.576285362243652, "global_step": 104149, "epoch": 2479} {"train_loss": -6.42868709564209, "global_step": 104150, "epoch": 2479} {"train_loss": -6.35042667388916, "global_step": 104151, "epoch": 2479} {"train_loss": -6.428030967712402, "global_step": 104152, "epoch": 2479} {"train_loss": -6.31742000579834, "global_step": 104153, "epoch": 2479} {"train_loss": -6.313617706298828, "global_step": 104154, "epoch": 2479} {"train_loss": -6.380963325500488, "global_step": 104155, "epoch": 2479} {"train_loss": -6.394003391265869, "global_step": 104156, "epoch": 2479} {"train_loss": -6.455598831176758, "global_step": 104157, "epoch": 2479} {"train_loss": -6.377205848693848, "global_step": 104158, "epoch": 2479} {"train_loss": -6.399592240651448, "global_step": 104159, "epoch": 2479, "val_loss": 64577.9921875} {"train_loss": -6.485483646392822, "global_step": 104160, "epoch": 2480} {"train_loss": -6.427036285400391, "global_step": 104161, "epoch": 2480} {"train_loss": -6.452298164367676, "global_step": 104162, "epoch": 2480} {"train_loss": -6.36236047744751, "global_step": 104163, "epoch": 2480} {"train_loss": -6.376527786254883, "global_step": 104164, "epoch": 2480} {"train_loss": -6.328558444976807, "global_step": 104165, "epoch": 2480} {"train_loss": -6.43510103225708, "global_step": 104166, "epoch": 2480} {"train_loss": -6.5334062576293945, "global_step": 104167, "epoch": 2480} {"train_loss": -6.262203216552734, "global_step": 104168, "epoch": 2480} {"train_loss": -6.555081367492676, "global_step": 104169, "epoch": 2480} {"train_loss": -6.427236557006836, "global_step": 104170, "epoch": 2480} {"train_loss": -6.4343791007995605, "global_step": 104171, "epoch": 2480} {"train_loss": -6.429644584655762, "global_step": 104172, "epoch": 2480} {"train_loss": -6.451296806335449, "global_step": 104173, "epoch": 2480} {"train_loss": -6.440413475036621, "global_step": 104174, "epoch": 2480} {"train_loss": -6.492441654205322, "global_step": 104175, "epoch": 2480} {"train_loss": -6.48738431930542, "global_step": 104176, "epoch": 2480} {"train_loss": -6.261962890625, "global_step": 104177, "epoch": 2480} {"train_loss": -6.459310054779053, "global_step": 104178, "epoch": 2480} {"train_loss": -6.500102996826172, "global_step": 104179, "epoch": 2480} {"train_loss": -6.412869453430176, "global_step": 104180, "epoch": 2480} {"train_loss": -6.441339492797852, "global_step": 104181, "epoch": 2480} {"train_loss": -6.417593955993652, "global_step": 104182, "epoch": 2480} {"train_loss": -6.466763496398926, "global_step": 104183, "epoch": 2480} {"train_loss": -6.466653823852539, "global_step": 104184, "epoch": 2480} {"train_loss": -6.468743324279785, "global_step": 104185, "epoch": 2480} {"train_loss": -6.45189094543457, "global_step": 104186, "epoch": 2480} {"train_loss": -6.497861862182617, "global_step": 104187, "epoch": 2480} {"train_loss": -6.415637016296387, "global_step": 104188, "epoch": 2480} {"train_loss": -6.452273368835449, "global_step": 104189, "epoch": 2480} {"train_loss": -6.457221031188965, "global_step": 104190, "epoch": 2480} {"train_loss": -6.433831214904785, "global_step": 104191, "epoch": 2480} {"train_loss": -6.391520023345947, "global_step": 104192, "epoch": 2480} {"train_loss": -6.4424591064453125, "global_step": 104193, "epoch": 2480} {"train_loss": -6.424056529998779, "global_step": 104194, "epoch": 2480} {"train_loss": -6.33616828918457, "global_step": 104195, "epoch": 2480} {"train_loss": -6.435819625854492, "global_step": 104196, "epoch": 2480} {"train_loss": -6.397215366363525, "global_step": 104197, "epoch": 2480} {"train_loss": -6.330698013305664, "global_step": 104198, "epoch": 2480} {"train_loss": -6.490573883056641, "global_step": 104199, "epoch": 2480} {"train_loss": -6.203629970550537, "global_step": 104200, "epoch": 2480} {"train_loss": -6.425277119591122, "global_step": 104201, "epoch": 2480, "val_loss": 64392.12109375} {"train_loss": -6.367620468139648, "global_step": 104202, "epoch": 2481} {"train_loss": -6.34735631942749, "global_step": 104203, "epoch": 2481} {"train_loss": -6.405086517333984, "global_step": 104204, "epoch": 2481} {"train_loss": -6.475733280181885, "global_step": 104205, "epoch": 2481} {"train_loss": -6.39792537689209, "global_step": 104206, "epoch": 2481} {"train_loss": -6.397609233856201, "global_step": 104207, "epoch": 2481} {"train_loss": -6.441653251647949, "global_step": 104208, "epoch": 2481} {"train_loss": -6.286096572875977, "global_step": 104209, "epoch": 2481} {"train_loss": -6.463088035583496, "global_step": 104210, "epoch": 2481} {"train_loss": -6.35148811340332, "global_step": 104211, "epoch": 2481} {"train_loss": -6.415494441986084, "global_step": 104212, "epoch": 2481} {"train_loss": -6.416496753692627, "global_step": 104213, "epoch": 2481} {"train_loss": -6.45684814453125, "global_step": 104214, "epoch": 2481} {"train_loss": -6.512810707092285, "global_step": 104215, "epoch": 2481} {"train_loss": -6.306461334228516, "global_step": 104216, "epoch": 2481} {"train_loss": -6.426887512207031, "global_step": 104217, "epoch": 2481} {"train_loss": -6.316767692565918, "global_step": 104218, "epoch": 2481} {"train_loss": -6.364209175109863, "global_step": 104219, "epoch": 2481} {"train_loss": -6.391510963439941, "global_step": 104220, "epoch": 2481} {"train_loss": -6.335867881774902, "global_step": 104221, "epoch": 2481} {"train_loss": -6.3258209228515625, "global_step": 104222, "epoch": 2481} {"train_loss": -6.361728668212891, "global_step": 104223, "epoch": 2481} {"train_loss": -6.209339141845703, "global_step": 104224, "epoch": 2481} {"train_loss": -6.3890485763549805, "global_step": 104225, "epoch": 2481} {"train_loss": -6.376997470855713, "global_step": 104226, "epoch": 2481} {"train_loss": -6.2407426834106445, "global_step": 104227, "epoch": 2481} {"train_loss": -6.2979960441589355, "global_step": 104228, "epoch": 2481} {"train_loss": -6.355031967163086, "global_step": 104229, "epoch": 2481} {"train_loss": -6.342508792877197, "global_step": 104230, "epoch": 2481} {"train_loss": -6.421647071838379, "global_step": 104231, "epoch": 2481} {"train_loss": -6.291446685791016, "global_step": 104232, "epoch": 2481} {"train_loss": -6.309835910797119, "global_step": 104233, "epoch": 2481} {"train_loss": -6.422904968261719, "global_step": 104234, "epoch": 2481} {"train_loss": -6.300238609313965, "global_step": 104235, "epoch": 2481} {"train_loss": -6.381960391998291, "global_step": 104236, "epoch": 2481} {"train_loss": -6.34241247177124, "global_step": 104237, "epoch": 2481} {"train_loss": -6.328478813171387, "global_step": 104238, "epoch": 2481} {"train_loss": -6.424020767211914, "global_step": 104239, "epoch": 2481} {"train_loss": -6.406184196472168, "global_step": 104240, "epoch": 2481} {"train_loss": -6.395453453063965, "global_step": 104241, "epoch": 2481} {"train_loss": -6.3524861335754395, "global_step": 104242, "epoch": 2481} {"train_loss": -6.369383528119042, "global_step": 104243, "epoch": 2481, "val_loss": 64508.26953125} {"train_loss": -6.46718168258667, "global_step": 104244, "epoch": 2482} {"train_loss": -6.488309860229492, "global_step": 104245, "epoch": 2482} {"train_loss": -6.348836421966553, "global_step": 104246, "epoch": 2482} {"train_loss": -6.500818252563477, "global_step": 104247, "epoch": 2482} {"train_loss": -6.408261299133301, "global_step": 104248, "epoch": 2482} {"train_loss": -6.406412601470947, "global_step": 104249, "epoch": 2482} {"train_loss": -6.332243919372559, "global_step": 104250, "epoch": 2482} {"train_loss": -6.219695091247559, "global_step": 104251, "epoch": 2482} {"train_loss": -6.384817123413086, "global_step": 104252, "epoch": 2482} {"train_loss": -6.415485382080078, "global_step": 104253, "epoch": 2482} {"train_loss": -6.391704082489014, "global_step": 104254, "epoch": 2482} {"train_loss": -6.273334503173828, "global_step": 104255, "epoch": 2482} {"train_loss": -6.393198013305664, "global_step": 104256, "epoch": 2482} {"train_loss": -6.42884635925293, "global_step": 104257, "epoch": 2482} {"train_loss": -6.249350547790527, "global_step": 104258, "epoch": 2482} {"train_loss": -6.427319049835205, "global_step": 104259, "epoch": 2482} {"train_loss": -6.432432174682617, "global_step": 104260, "epoch": 2482} {"train_loss": -6.3795695304870605, "global_step": 104261, "epoch": 2482} {"train_loss": -6.319381237030029, "global_step": 104262, "epoch": 2482} {"train_loss": -6.351776123046875, "global_step": 104263, "epoch": 2482} {"train_loss": -6.327605247497559, "global_step": 104264, "epoch": 2482} {"train_loss": -6.362809658050537, "global_step": 104265, "epoch": 2482} {"train_loss": -6.358447551727295, "global_step": 104266, "epoch": 2482} {"train_loss": -6.3580827713012695, "global_step": 104267, "epoch": 2482} {"train_loss": -6.3896918296813965, "global_step": 104268, "epoch": 2482} {"train_loss": -6.349084854125977, "global_step": 104269, "epoch": 2482} {"train_loss": -6.380722999572754, "global_step": 104270, "epoch": 2482} {"train_loss": -6.383870601654053, "global_step": 104271, "epoch": 2482} {"train_loss": -6.399847984313965, "global_step": 104272, "epoch": 2482} {"train_loss": -6.360620498657227, "global_step": 104273, "epoch": 2482} {"train_loss": -6.37269926071167, "global_step": 104274, "epoch": 2482} {"train_loss": -6.484511375427246, "global_step": 104275, "epoch": 2482} {"train_loss": -6.382159233093262, "global_step": 104276, "epoch": 2482} {"train_loss": -6.325909614562988, "global_step": 104277, "epoch": 2482} {"train_loss": -6.317529201507568, "global_step": 104278, "epoch": 2482} {"train_loss": -6.4279632568359375, "global_step": 104279, "epoch": 2482} {"train_loss": -6.387015342712402, "global_step": 104280, "epoch": 2482} {"train_loss": -6.450474262237549, "global_step": 104281, "epoch": 2482} {"train_loss": -6.363686561584473, "global_step": 104282, "epoch": 2482} {"train_loss": -6.453812599182129, "global_step": 104283, "epoch": 2482} {"train_loss": -6.487778663635254, "global_step": 104284, "epoch": 2482} {"train_loss": -6.386604502087548, "global_step": 104285, "epoch": 2482, "val_loss": 64422.75390625} {"train_loss": -6.433747291564941, "global_step": 104286, "epoch": 2483} {"train_loss": -6.434656620025635, "global_step": 104287, "epoch": 2483} {"train_loss": -6.456191062927246, "global_step": 104288, "epoch": 2483} {"train_loss": -6.427000045776367, "global_step": 104289, "epoch": 2483} {"train_loss": -6.386654853820801, "global_step": 104290, "epoch": 2483} {"train_loss": -6.448313236236572, "global_step": 104291, "epoch": 2483} {"train_loss": -6.364170551300049, "global_step": 104292, "epoch": 2483} {"train_loss": -6.372003078460693, "global_step": 104293, "epoch": 2483} {"train_loss": -6.476906776428223, "global_step": 104294, "epoch": 2483} {"train_loss": -6.451959609985352, "global_step": 104295, "epoch": 2483} {"train_loss": -6.479703903198242, "global_step": 104296, "epoch": 2483} {"train_loss": -6.425918102264404, "global_step": 104297, "epoch": 2483} {"train_loss": -6.430622100830078, "global_step": 104298, "epoch": 2483} {"train_loss": -6.467691421508789, "global_step": 104299, "epoch": 2483} {"train_loss": -6.399213790893555, "global_step": 104300, "epoch": 2483} {"train_loss": -6.424749374389648, "global_step": 104301, "epoch": 2483} {"train_loss": -6.407317161560059, "global_step": 104302, "epoch": 2483} {"train_loss": -6.418893337249756, "global_step": 104303, "epoch": 2483} {"train_loss": -6.382688999176025, "global_step": 104304, "epoch": 2483} {"train_loss": -6.334200859069824, "global_step": 104305, "epoch": 2483} {"train_loss": -6.383162021636963, "global_step": 104306, "epoch": 2483} {"train_loss": -6.312443733215332, "global_step": 104307, "epoch": 2483} {"train_loss": -6.445186614990234, "global_step": 104308, "epoch": 2483} {"train_loss": -6.383101940155029, "global_step": 104309, "epoch": 2483} {"train_loss": -6.403789043426514, "global_step": 104310, "epoch": 2483} {"train_loss": -6.306926250457764, "global_step": 104311, "epoch": 2483} {"train_loss": -6.288976192474365, "global_step": 104312, "epoch": 2483} {"train_loss": -6.542987823486328, "global_step": 104313, "epoch": 2483} {"train_loss": -6.435673713684082, "global_step": 104314, "epoch": 2483} {"train_loss": -6.342627048492432, "global_step": 104315, "epoch": 2483} {"train_loss": -6.413771629333496, "global_step": 104316, "epoch": 2483} {"train_loss": -6.500883102416992, "global_step": 104317, "epoch": 2483} {"train_loss": -6.490311622619629, "global_step": 104318, "epoch": 2483} {"train_loss": -6.364800453186035, "global_step": 104319, "epoch": 2483} {"train_loss": -6.441936492919922, "global_step": 104320, "epoch": 2483} {"train_loss": -6.444216251373291, "global_step": 104321, "epoch": 2483} {"train_loss": -6.423303604125977, "global_step": 104322, "epoch": 2483} {"train_loss": -6.401152610778809, "global_step": 104323, "epoch": 2483} {"train_loss": -6.379066467285156, "global_step": 104324, "epoch": 2483} {"train_loss": -6.458522796630859, "global_step": 104325, "epoch": 2483} {"train_loss": -6.396632194519043, "global_step": 104326, "epoch": 2483} {"train_loss": -6.412186599913097, "global_step": 104327, "epoch": 2483, "val_loss": 64596.3125} {"train_loss": -6.358675003051758, "global_step": 104328, "epoch": 2484} {"train_loss": -6.492268085479736, "global_step": 104329, "epoch": 2484} {"train_loss": -6.229677677154541, "global_step": 104330, "epoch": 2484} {"train_loss": -6.389761924743652, "global_step": 104331, "epoch": 2484} {"train_loss": -6.297060489654541, "global_step": 104332, "epoch": 2484} {"train_loss": -6.454826354980469, "global_step": 104333, "epoch": 2484} {"train_loss": -6.452798366546631, "global_step": 104334, "epoch": 2484} {"train_loss": -6.3602423667907715, "global_step": 104335, "epoch": 2484} {"train_loss": -6.451915264129639, "global_step": 104336, "epoch": 2484} {"train_loss": -6.443695068359375, "global_step": 104337, "epoch": 2484} {"train_loss": -6.346819877624512, "global_step": 104338, "epoch": 2484} {"train_loss": -6.456576824188232, "global_step": 104339, "epoch": 2484} {"train_loss": -6.442988395690918, "global_step": 104340, "epoch": 2484} {"train_loss": -6.4741950035095215, "global_step": 104341, "epoch": 2484} {"train_loss": -6.453567028045654, "global_step": 104342, "epoch": 2484} {"train_loss": -6.431911468505859, "global_step": 104343, "epoch": 2484} {"train_loss": -6.450812816619873, "global_step": 104344, "epoch": 2484} {"train_loss": -6.428485870361328, "global_step": 104345, "epoch": 2484} {"train_loss": -6.473113059997559, "global_step": 104346, "epoch": 2484} {"train_loss": -6.404209136962891, "global_step": 104347, "epoch": 2484} {"train_loss": -6.258203506469727, "global_step": 104348, "epoch": 2484} {"train_loss": -6.475946426391602, "global_step": 104349, "epoch": 2484} {"train_loss": -6.390998840332031, "global_step": 104350, "epoch": 2484} {"train_loss": -6.398550033569336, "global_step": 104351, "epoch": 2484} {"train_loss": -6.415897369384766, "global_step": 104352, "epoch": 2484} {"train_loss": -6.373098373413086, "global_step": 104353, "epoch": 2484} {"train_loss": -6.432226181030273, "global_step": 104354, "epoch": 2484} {"train_loss": -6.417830467224121, "global_step": 104355, "epoch": 2484} {"train_loss": -6.421257972717285, "global_step": 104356, "epoch": 2484} {"train_loss": -6.513788223266602, "global_step": 104357, "epoch": 2484} {"train_loss": -6.35836124420166, "global_step": 104358, "epoch": 2484} {"train_loss": -6.3468780517578125, "global_step": 104359, "epoch": 2484} {"train_loss": -6.330707550048828, "global_step": 104360, "epoch": 2484} {"train_loss": -6.527690887451172, "global_step": 104361, "epoch": 2484} {"train_loss": -6.498380661010742, "global_step": 104362, "epoch": 2484} {"train_loss": -6.3979597091674805, "global_step": 104363, "epoch": 2484} {"train_loss": -6.4441962242126465, "global_step": 104364, "epoch": 2484} {"train_loss": -6.358863830566406, "global_step": 104365, "epoch": 2484} {"train_loss": -6.450643062591553, "global_step": 104366, "epoch": 2484} {"train_loss": -6.437219619750977, "global_step": 104367, "epoch": 2484} {"train_loss": -6.323942184448242, "global_step": 104368, "epoch": 2484} {"train_loss": -6.41143140338716, "global_step": 104369, "epoch": 2484, "val_loss": 64599.0859375} {"train_loss": -6.440520286560059, "global_step": 104370, "epoch": 2485} {"train_loss": -6.385695457458496, "global_step": 104371, "epoch": 2485} {"train_loss": -6.359416961669922, "global_step": 104372, "epoch": 2485} {"train_loss": -6.371977806091309, "global_step": 104373, "epoch": 2485} {"train_loss": -6.25230598449707, "global_step": 104374, "epoch": 2485} {"train_loss": -6.473283767700195, "global_step": 104375, "epoch": 2485} {"train_loss": -6.319869041442871, "global_step": 104376, "epoch": 2485} {"train_loss": -6.347774505615234, "global_step": 104377, "epoch": 2485} {"train_loss": -6.252838134765625, "global_step": 104378, "epoch": 2485} {"train_loss": -6.3110270500183105, "global_step": 104379, "epoch": 2485} {"train_loss": -6.380887031555176, "global_step": 104380, "epoch": 2485} {"train_loss": -6.304123401641846, "global_step": 104381, "epoch": 2485} {"train_loss": -6.509550094604492, "global_step": 104382, "epoch": 2485} {"train_loss": -6.254619598388672, "global_step": 104383, "epoch": 2485} {"train_loss": -6.3983612060546875, "global_step": 104384, "epoch": 2485} {"train_loss": -6.237768650054932, "global_step": 104385, "epoch": 2485} {"train_loss": -6.30418062210083, "global_step": 104386, "epoch": 2485} {"train_loss": -6.43288516998291, "global_step": 104387, "epoch": 2485} {"train_loss": -6.371725082397461, "global_step": 104388, "epoch": 2485} {"train_loss": -6.412060737609863, "global_step": 104389, "epoch": 2485} {"train_loss": -6.177084922790527, "global_step": 104390, "epoch": 2485} {"train_loss": -6.344693183898926, "global_step": 104391, "epoch": 2485} {"train_loss": -6.390480995178223, "global_step": 104392, "epoch": 2485} {"train_loss": -6.3019232749938965, "global_step": 104393, "epoch": 2485} {"train_loss": -6.294482231140137, "global_step": 104394, "epoch": 2485} {"train_loss": -6.40188455581665, "global_step": 104395, "epoch": 2485} {"train_loss": -6.437048435211182, "global_step": 104396, "epoch": 2485} {"train_loss": -6.411749362945557, "global_step": 104397, "epoch": 2485} {"train_loss": -6.362109184265137, "global_step": 104398, "epoch": 2485} {"train_loss": -6.381056785583496, "global_step": 104399, "epoch": 2485} {"train_loss": -6.384235382080078, "global_step": 104400, "epoch": 2485} {"train_loss": -6.375496864318848, "global_step": 104401, "epoch": 2485} {"train_loss": -6.498401165008545, "global_step": 104402, "epoch": 2485} {"train_loss": -6.2774858474731445, "global_step": 104403, "epoch": 2485} {"train_loss": -6.416656494140625, "global_step": 104404, "epoch": 2485} {"train_loss": -6.386911392211914, "global_step": 104405, "epoch": 2485} {"train_loss": -6.437359809875488, "global_step": 104406, "epoch": 2485} {"train_loss": -6.398207187652588, "global_step": 104407, "epoch": 2485} {"train_loss": -6.469030380249023, "global_step": 104408, "epoch": 2485} {"train_loss": -6.415003776550293, "global_step": 104409, "epoch": 2485} {"train_loss": -6.403180122375488, "global_step": 104410, "epoch": 2485} {"train_loss": -6.36875749769665, "global_step": 104411, "epoch": 2485, "val_loss": 64410.86328125} {"train_loss": -6.444700717926025, "global_step": 104412, "epoch": 2486} {"train_loss": -6.329773426055908, "global_step": 104413, "epoch": 2486} {"train_loss": -6.405368804931641, "global_step": 104414, "epoch": 2486} {"train_loss": -6.375996112823486, "global_step": 104415, "epoch": 2486} {"train_loss": -6.535973072052002, "global_step": 104416, "epoch": 2486} {"train_loss": -6.383762359619141, "global_step": 104417, "epoch": 2486} {"train_loss": -6.426313400268555, "global_step": 104418, "epoch": 2486} {"train_loss": -6.34648323059082, "global_step": 104419, "epoch": 2486} {"train_loss": -6.458205223083496, "global_step": 104420, "epoch": 2486} {"train_loss": -6.508660316467285, "global_step": 104421, "epoch": 2486} {"train_loss": -6.369445323944092, "global_step": 104422, "epoch": 2486} {"train_loss": -6.4647698402404785, "global_step": 104423, "epoch": 2486} {"train_loss": -6.42621374130249, "global_step": 104424, "epoch": 2486} {"train_loss": -6.444272994995117, "global_step": 104425, "epoch": 2486} {"train_loss": -6.331974029541016, "global_step": 104426, "epoch": 2486} {"train_loss": -6.444808006286621, "global_step": 104427, "epoch": 2486} {"train_loss": -6.343342304229736, "global_step": 104428, "epoch": 2486} {"train_loss": -6.379453182220459, "global_step": 104429, "epoch": 2486} {"train_loss": -6.523332118988037, "global_step": 104430, "epoch": 2486} {"train_loss": -6.358482360839844, "global_step": 104431, "epoch": 2486} {"train_loss": -6.377777576446533, "global_step": 104432, "epoch": 2486} {"train_loss": -6.427083969116211, "global_step": 104433, "epoch": 2486} {"train_loss": -6.365312576293945, "global_step": 104434, "epoch": 2486} {"train_loss": -6.4316182136535645, "global_step": 104435, "epoch": 2486} {"train_loss": -6.444275856018066, "global_step": 104436, "epoch": 2486} {"train_loss": -6.415136337280273, "global_step": 104437, "epoch": 2486} {"train_loss": -6.383275985717773, "global_step": 104438, "epoch": 2486} {"train_loss": -6.501652717590332, "global_step": 104439, "epoch": 2486} {"train_loss": -6.465872287750244, "global_step": 104440, "epoch": 2486} {"train_loss": -6.493649959564209, "global_step": 104441, "epoch": 2486} {"train_loss": -6.473822593688965, "global_step": 104442, "epoch": 2486} {"train_loss": -6.431502342224121, "global_step": 104443, "epoch": 2486} {"train_loss": -6.423248767852783, "global_step": 104444, "epoch": 2486} {"train_loss": -6.393185138702393, "global_step": 104445, "epoch": 2486} {"train_loss": -6.576147079467773, "global_step": 104446, "epoch": 2486} {"train_loss": -6.49759578704834, "global_step": 104447, "epoch": 2486} {"train_loss": -6.324493885040283, "global_step": 104448, "epoch": 2486} {"train_loss": -6.383594512939453, "global_step": 104449, "epoch": 2486} {"train_loss": -6.520928859710693, "global_step": 104450, "epoch": 2486} {"train_loss": -6.407781600952148, "global_step": 104451, "epoch": 2486} {"train_loss": -6.540896892547607, "global_step": 104452, "epoch": 2486} {"train_loss": -6.43246374811445, "global_step": 104453, "epoch": 2486, "val_loss": 64236.68359375} {"train_loss": -6.384655952453613, "global_step": 104454, "epoch": 2487} {"train_loss": -6.517181396484375, "global_step": 104455, "epoch": 2487} {"train_loss": -6.482856273651123, "global_step": 104456, "epoch": 2487} {"train_loss": -6.434492588043213, "global_step": 104457, "epoch": 2487} {"train_loss": -6.366175651550293, "global_step": 104458, "epoch": 2487} {"train_loss": -6.353936195373535, "global_step": 104459, "epoch": 2487} {"train_loss": -6.4246907234191895, "global_step": 104460, "epoch": 2487} {"train_loss": -6.365939140319824, "global_step": 104461, "epoch": 2487} {"train_loss": -6.379058837890625, "global_step": 104462, "epoch": 2487} {"train_loss": -6.473512649536133, "global_step": 104463, "epoch": 2487} {"train_loss": -6.417171955108643, "global_step": 104464, "epoch": 2487} {"train_loss": -6.288784027099609, "global_step": 104465, "epoch": 2487} {"train_loss": -6.389998435974121, "global_step": 104466, "epoch": 2487} {"train_loss": -6.268819808959961, "global_step": 104467, "epoch": 2487} {"train_loss": -6.390050888061523, "global_step": 104468, "epoch": 2487} {"train_loss": -6.310111999511719, "global_step": 104469, "epoch": 2487} {"train_loss": -6.40932035446167, "global_step": 104470, "epoch": 2487} {"train_loss": -6.268362998962402, "global_step": 104471, "epoch": 2487} {"train_loss": -6.359318256378174, "global_step": 104472, "epoch": 2487} {"train_loss": -6.3963212966918945, "global_step": 104473, "epoch": 2487} {"train_loss": -6.308752059936523, "global_step": 104474, "epoch": 2487} {"train_loss": -6.331018447875977, "global_step": 104475, "epoch": 2487} {"train_loss": -6.293155193328857, "global_step": 104476, "epoch": 2487} {"train_loss": -6.185061454772949, "global_step": 104477, "epoch": 2487} {"train_loss": -6.331867694854736, "global_step": 104478, "epoch": 2487} {"train_loss": -6.360454082489014, "global_step": 104479, "epoch": 2487} {"train_loss": -6.458913803100586, "global_step": 104480, "epoch": 2487} {"train_loss": -6.453939437866211, "global_step": 104481, "epoch": 2487} {"train_loss": -6.367379188537598, "global_step": 104482, "epoch": 2487} {"train_loss": -6.40559196472168, "global_step": 104483, "epoch": 2487} {"train_loss": -6.399204254150391, "global_step": 104484, "epoch": 2487} {"train_loss": -6.331240653991699, "global_step": 104485, "epoch": 2487} {"train_loss": -6.458045959472656, "global_step": 104486, "epoch": 2487} {"train_loss": -6.488183975219727, "global_step": 104487, "epoch": 2487} {"train_loss": -6.3444294929504395, "global_step": 104488, "epoch": 2487} {"train_loss": -6.4149370193481445, "global_step": 104489, "epoch": 2487} {"train_loss": -6.457583427429199, "global_step": 104490, "epoch": 2487} {"train_loss": -6.517608642578125, "global_step": 104491, "epoch": 2487} {"train_loss": -6.466643333435059, "global_step": 104492, "epoch": 2487} {"train_loss": -6.305469036102295, "global_step": 104493, "epoch": 2487} {"train_loss": -6.467748165130615, "global_step": 104494, "epoch": 2487} {"train_loss": -6.38646445955549, "global_step": 104495, "epoch": 2487, "val_loss": 64536.52734375} {"train_loss": -6.433557510375977, "global_step": 104496, "epoch": 2488} {"train_loss": -6.359932899475098, "global_step": 104497, "epoch": 2488} {"train_loss": -6.399035930633545, "global_step": 104498, "epoch": 2488} {"train_loss": -6.46253776550293, "global_step": 104499, "epoch": 2488} {"train_loss": -6.4400129318237305, "global_step": 104500, "epoch": 2488} {"train_loss": -6.420047283172607, "global_step": 104501, "epoch": 2488} {"train_loss": -6.420467376708984, "global_step": 104502, "epoch": 2488} {"train_loss": -6.55582332611084, "global_step": 104503, "epoch": 2488} {"train_loss": -6.389838218688965, "global_step": 104504, "epoch": 2488} {"train_loss": -6.37248420715332, "global_step": 104505, "epoch": 2488} {"train_loss": -6.419405937194824, "global_step": 104506, "epoch": 2488} {"train_loss": -6.326035499572754, "global_step": 104507, "epoch": 2488} {"train_loss": -6.528229713439941, "global_step": 104508, "epoch": 2488} {"train_loss": -6.529018402099609, "global_step": 104509, "epoch": 2488} {"train_loss": -6.398756980895996, "global_step": 104510, "epoch": 2488} {"train_loss": -6.518088340759277, "global_step": 104511, "epoch": 2488} {"train_loss": -6.413395881652832, "global_step": 104512, "epoch": 2488} {"train_loss": -6.382433891296387, "global_step": 104513, "epoch": 2488} {"train_loss": -6.436200141906738, "global_step": 104514, "epoch": 2488} {"train_loss": -6.317559242248535, "global_step": 104515, "epoch": 2488} {"train_loss": -6.376711845397949, "global_step": 104516, "epoch": 2488} {"train_loss": -6.330584526062012, "global_step": 104517, "epoch": 2488} {"train_loss": -6.4771270751953125, "global_step": 104518, "epoch": 2488} {"train_loss": -6.3401031494140625, "global_step": 104519, "epoch": 2488} {"train_loss": -6.300925254821777, "global_step": 104520, "epoch": 2488} {"train_loss": -6.327967643737793, "global_step": 104521, "epoch": 2488} {"train_loss": -6.333540916442871, "global_step": 104522, "epoch": 2488} {"train_loss": -6.2957963943481445, "global_step": 104523, "epoch": 2488} {"train_loss": -6.42430305480957, "global_step": 104524, "epoch": 2488} {"train_loss": -6.306881427764893, "global_step": 104525, "epoch": 2488} {"train_loss": -6.492979526519775, "global_step": 104526, "epoch": 2488} {"train_loss": -6.478574752807617, "global_step": 104527, "epoch": 2488} {"train_loss": -6.431668758392334, "global_step": 104528, "epoch": 2488} {"train_loss": -6.424654960632324, "global_step": 104529, "epoch": 2488} {"train_loss": -6.379942893981934, "global_step": 104530, "epoch": 2488} {"train_loss": -6.426136016845703, "global_step": 104531, "epoch": 2488} {"train_loss": -6.468136787414551, "global_step": 104532, "epoch": 2488} {"train_loss": -6.385103702545166, "global_step": 104533, "epoch": 2488} {"train_loss": -6.4608917236328125, "global_step": 104534, "epoch": 2488} {"train_loss": -6.393400192260742, "global_step": 104535, "epoch": 2488} {"train_loss": -6.401331901550293, "global_step": 104536, "epoch": 2488} {"train_loss": -6.411683411825271, "global_step": 104537, "epoch": 2488, "val_loss": 64382.953125} {"train_loss": -6.574167728424072, "global_step": 104538, "epoch": 2489} {"train_loss": -6.426363468170166, "global_step": 104539, "epoch": 2489} {"train_loss": -6.494059085845947, "global_step": 104540, "epoch": 2489} {"train_loss": -6.4149017333984375, "global_step": 104541, "epoch": 2489} {"train_loss": -6.523789882659912, "global_step": 104542, "epoch": 2489} {"train_loss": -6.468573093414307, "global_step": 104543, "epoch": 2489} {"train_loss": -6.481119155883789, "global_step": 104544, "epoch": 2489} {"train_loss": -6.470661640167236, "global_step": 104545, "epoch": 2489} {"train_loss": -6.429896354675293, "global_step": 104546, "epoch": 2489} {"train_loss": -6.52521276473999, "global_step": 104547, "epoch": 2489} {"train_loss": -6.47312068939209, "global_step": 104548, "epoch": 2489} {"train_loss": -6.392486572265625, "global_step": 104549, "epoch": 2489} {"train_loss": -6.408444404602051, "global_step": 104550, "epoch": 2489} {"train_loss": -6.412415981292725, "global_step": 104551, "epoch": 2489} {"train_loss": -6.401674747467041, "global_step": 104552, "epoch": 2489} {"train_loss": -6.460085868835449, "global_step": 104553, "epoch": 2489} {"train_loss": -6.452145576477051, "global_step": 104554, "epoch": 2489} {"train_loss": -6.479970455169678, "global_step": 104555, "epoch": 2489} {"train_loss": -6.220226764678955, "global_step": 104556, "epoch": 2489} {"train_loss": -6.429815292358398, "global_step": 104557, "epoch": 2489} {"train_loss": -6.555652618408203, "global_step": 104558, "epoch": 2489} {"train_loss": -6.4785356521606445, "global_step": 104559, "epoch": 2489} {"train_loss": -6.574092864990234, "global_step": 104560, "epoch": 2489} {"train_loss": -6.383151054382324, "global_step": 104561, "epoch": 2489} {"train_loss": -6.4734930992126465, "global_step": 104562, "epoch": 2489} {"train_loss": -6.54062557220459, "global_step": 104563, "epoch": 2489} {"train_loss": -6.510982513427734, "global_step": 104564, "epoch": 2489} {"train_loss": -6.4662628173828125, "global_step": 104565, "epoch": 2489} {"train_loss": -6.471879005432129, "global_step": 104566, "epoch": 2489} {"train_loss": -6.321895599365234, "global_step": 104567, "epoch": 2489} {"train_loss": -6.383286952972412, "global_step": 104568, "epoch": 2489} {"train_loss": -6.277870178222656, "global_step": 104569, "epoch": 2489} {"train_loss": -6.422071933746338, "global_step": 104570, "epoch": 2489} {"train_loss": -6.307301044464111, "global_step": 104571, "epoch": 2489} {"train_loss": -6.455211639404297, "global_step": 104572, "epoch": 2489} {"train_loss": -6.366052627563477, "global_step": 104573, "epoch": 2489} {"train_loss": -6.357451915740967, "global_step": 104574, "epoch": 2489} {"train_loss": -6.529541492462158, "global_step": 104575, "epoch": 2489} {"train_loss": -6.3576273918151855, "global_step": 104576, "epoch": 2489} {"train_loss": -6.354212760925293, "global_step": 104577, "epoch": 2489} {"train_loss": -6.377140522003174, "global_step": 104578, "epoch": 2489} {"train_loss": -6.434948228654408, "global_step": 104579, "epoch": 2489, "val_loss": 64649.91796875} {"train_loss": -6.291379928588867, "global_step": 104580, "epoch": 2490} {"train_loss": -6.408299446105957, "global_step": 104581, "epoch": 2490} {"train_loss": -6.389182090759277, "global_step": 104582, "epoch": 2490} {"train_loss": -6.2939066886901855, "global_step": 104583, "epoch": 2490} {"train_loss": -6.436295986175537, "global_step": 104584, "epoch": 2490} {"train_loss": -6.3935627937316895, "global_step": 104585, "epoch": 2490} {"train_loss": -6.342075347900391, "global_step": 104586, "epoch": 2490} {"train_loss": -6.46307373046875, "global_step": 104587, "epoch": 2490} {"train_loss": -6.4471306800842285, "global_step": 104588, "epoch": 2490} {"train_loss": -6.415423393249512, "global_step": 104589, "epoch": 2490} {"train_loss": -6.3069047927856445, "global_step": 104590, "epoch": 2490} {"train_loss": -6.408505439758301, "global_step": 104591, "epoch": 2490} {"train_loss": -6.292215347290039, "global_step": 104592, "epoch": 2490} {"train_loss": -6.449104309082031, "global_step": 104593, "epoch": 2490} {"train_loss": -6.371418476104736, "global_step": 104594, "epoch": 2490} {"train_loss": -6.3652801513671875, "global_step": 104595, "epoch": 2490} {"train_loss": -6.318082809448242, "global_step": 104596, "epoch": 2490} {"train_loss": -6.344459533691406, "global_step": 104597, "epoch": 2490} {"train_loss": -6.36620569229126, "global_step": 104598, "epoch": 2490} {"train_loss": -6.533472537994385, "global_step": 104599, "epoch": 2490} {"train_loss": -6.374205589294434, "global_step": 104600, "epoch": 2490} {"train_loss": -6.4155120849609375, "global_step": 104601, "epoch": 2490} {"train_loss": -6.5181498527526855, "global_step": 104602, "epoch": 2490} {"train_loss": -6.212175369262695, "global_step": 104603, "epoch": 2490} {"train_loss": -6.413158893585205, "global_step": 104604, "epoch": 2490} {"train_loss": -6.456617832183838, "global_step": 104605, "epoch": 2490} {"train_loss": -6.408715724945068, "global_step": 104606, "epoch": 2490} {"train_loss": -6.496452331542969, "global_step": 104607, "epoch": 2490} {"train_loss": -6.466470718383789, "global_step": 104608, "epoch": 2490} {"train_loss": -6.273229598999023, "global_step": 104609, "epoch": 2490} {"train_loss": -6.420381546020508, "global_step": 104610, "epoch": 2490} {"train_loss": -6.271647930145264, "global_step": 104611, "epoch": 2490} {"train_loss": -6.34207820892334, "global_step": 104612, "epoch": 2490} {"train_loss": -6.445500373840332, "global_step": 104613, "epoch": 2490} {"train_loss": -6.33093786239624, "global_step": 104614, "epoch": 2490} {"train_loss": -6.313577651977539, "global_step": 104615, "epoch": 2490} {"train_loss": -6.45550537109375, "global_step": 104616, "epoch": 2490} {"train_loss": -6.3497490882873535, "global_step": 104617, "epoch": 2490} {"train_loss": -6.415565490722656, "global_step": 104618, "epoch": 2490} {"train_loss": -6.419600963592529, "global_step": 104619, "epoch": 2490} {"train_loss": -6.424177169799805, "global_step": 104620, "epoch": 2490} {"train_loss": -6.388463292803083, "global_step": 104621, "epoch": 2490, "val_loss": 64299.27734375} {"train_loss": -6.455778121948242, "global_step": 104622, "epoch": 2491} {"train_loss": -6.337205410003662, "global_step": 104623, "epoch": 2491} {"train_loss": -6.3629961013793945, "global_step": 104624, "epoch": 2491} {"train_loss": -6.312106132507324, "global_step": 104625, "epoch": 2491} {"train_loss": -6.236634254455566, "global_step": 104626, "epoch": 2491} {"train_loss": -6.402736663818359, "global_step": 104627, "epoch": 2491} {"train_loss": -6.4796977043151855, "global_step": 104628, "epoch": 2491} {"train_loss": -6.28639554977417, "global_step": 104629, "epoch": 2491} {"train_loss": -6.388782501220703, "global_step": 104630, "epoch": 2491} {"train_loss": -6.462395191192627, "global_step": 104631, "epoch": 2491} {"train_loss": -6.383375644683838, "global_step": 104632, "epoch": 2491} {"train_loss": -6.328341960906982, "global_step": 104633, "epoch": 2491} {"train_loss": -6.282548904418945, "global_step": 104634, "epoch": 2491} {"train_loss": -6.457337379455566, "global_step": 104635, "epoch": 2491} {"train_loss": -6.427562713623047, "global_step": 104636, "epoch": 2491} {"train_loss": -6.26008939743042, "global_step": 104637, "epoch": 2491} {"train_loss": -6.3788347244262695, "global_step": 104638, "epoch": 2491} {"train_loss": -6.232855796813965, "global_step": 104639, "epoch": 2491} {"train_loss": -6.465959072113037, "global_step": 104640, "epoch": 2491} {"train_loss": -6.397361755371094, "global_step": 104641, "epoch": 2491} {"train_loss": -6.3406081199646, "global_step": 104642, "epoch": 2491} {"train_loss": -6.443092346191406, "global_step": 104643, "epoch": 2491} {"train_loss": -6.3546037673950195, "global_step": 104644, "epoch": 2491} {"train_loss": -6.3960795402526855, "global_step": 104645, "epoch": 2491} {"train_loss": -6.4248576164245605, "global_step": 104646, "epoch": 2491} {"train_loss": -6.433474540710449, "global_step": 104647, "epoch": 2491} {"train_loss": -6.329975128173828, "global_step": 104648, "epoch": 2491} {"train_loss": -6.318662166595459, "global_step": 104649, "epoch": 2491} {"train_loss": -6.497791767120361, "global_step": 104650, "epoch": 2491} {"train_loss": -6.360875129699707, "global_step": 104651, "epoch": 2491} {"train_loss": -6.408292293548584, "global_step": 104652, "epoch": 2491} {"train_loss": -6.3455023765563965, "global_step": 104653, "epoch": 2491} {"train_loss": -6.504620552062988, "global_step": 104654, "epoch": 2491} {"train_loss": -6.4049763679504395, "global_step": 104655, "epoch": 2491} {"train_loss": -6.369055271148682, "global_step": 104656, "epoch": 2491} {"train_loss": -6.467134475708008, "global_step": 104657, "epoch": 2491} {"train_loss": -6.404646873474121, "global_step": 104658, "epoch": 2491} {"train_loss": -6.365945816040039, "global_step": 104659, "epoch": 2491} {"train_loss": -6.497821807861328, "global_step": 104660, "epoch": 2491} {"train_loss": -6.456661224365234, "global_step": 104661, "epoch": 2491} {"train_loss": -6.292430400848389, "global_step": 104662, "epoch": 2491} {"train_loss": -6.385211059025356, "global_step": 104663, "epoch": 2491, "val_loss": 64559.25} {"train_loss": -6.4293928146362305, "global_step": 104664, "epoch": 2492} {"train_loss": -6.272743225097656, "global_step": 104665, "epoch": 2492} {"train_loss": -6.264157295227051, "global_step": 104666, "epoch": 2492} {"train_loss": -6.308710098266602, "global_step": 104667, "epoch": 2492} {"train_loss": -6.039039134979248, "global_step": 104668, "epoch": 2492} {"train_loss": -6.359066963195801, "global_step": 104669, "epoch": 2492} {"train_loss": -5.9423723220825195, "global_step": 104670, "epoch": 2492} {"train_loss": -6.226578712463379, "global_step": 104671, "epoch": 2492} {"train_loss": -6.1572041511535645, "global_step": 104672, "epoch": 2492} {"train_loss": -6.262007713317871, "global_step": 104673, "epoch": 2492} {"train_loss": -6.235490322113037, "global_step": 104674, "epoch": 2492} {"train_loss": -6.305801868438721, "global_step": 104675, "epoch": 2492} {"train_loss": -6.222723960876465, "global_step": 104676, "epoch": 2492} {"train_loss": -6.389427185058594, "global_step": 104677, "epoch": 2492} {"train_loss": -6.192876815795898, "global_step": 104678, "epoch": 2492} {"train_loss": -6.317430019378662, "global_step": 104679, "epoch": 2492} {"train_loss": -6.234886169433594, "global_step": 104680, "epoch": 2492} {"train_loss": -6.315069675445557, "global_step": 104681, "epoch": 2492} {"train_loss": -6.327747344970703, "global_step": 104682, "epoch": 2492} {"train_loss": -6.276108741760254, "global_step": 104683, "epoch": 2492} {"train_loss": -6.299203872680664, "global_step": 104684, "epoch": 2492} {"train_loss": -6.241377830505371, "global_step": 104685, "epoch": 2492} {"train_loss": -6.251148223876953, "global_step": 104686, "epoch": 2492} {"train_loss": -6.338733196258545, "global_step": 104687, "epoch": 2492} {"train_loss": -6.3240814208984375, "global_step": 104688, "epoch": 2492} {"train_loss": -6.342819690704346, "global_step": 104689, "epoch": 2492} {"train_loss": -6.465115547180176, "global_step": 104690, "epoch": 2492} {"train_loss": -6.2839555740356445, "global_step": 104691, "epoch": 2492} {"train_loss": -6.335768222808838, "global_step": 104692, "epoch": 2492} {"train_loss": -6.435506343841553, "global_step": 104693, "epoch": 2492} {"train_loss": -6.407268524169922, "global_step": 104694, "epoch": 2492} {"train_loss": -6.378471374511719, "global_step": 104695, "epoch": 2492} {"train_loss": -6.489133358001709, "global_step": 104696, "epoch": 2492} {"train_loss": -6.251799583435059, "global_step": 104697, "epoch": 2492} {"train_loss": -6.434704780578613, "global_step": 104698, "epoch": 2492} {"train_loss": -6.432552814483643, "global_step": 104699, "epoch": 2492} {"train_loss": -6.4053730964660645, "global_step": 104700, "epoch": 2492} {"train_loss": -6.45222282409668, "global_step": 104701, "epoch": 2492} {"train_loss": -6.367196083068848, "global_step": 104702, "epoch": 2492} {"train_loss": -6.4711809158325195, "global_step": 104703, "epoch": 2492} {"train_loss": -6.4554266929626465, "global_step": 104704, "epoch": 2492} {"train_loss": -6.318507796242123, "global_step": 104705, "epoch": 2492, "val_loss": 64478.0703125} {"train_loss": -6.420503616333008, "global_step": 104706, "epoch": 2493} {"train_loss": -6.378085136413574, "global_step": 104707, "epoch": 2493} {"train_loss": -6.450368404388428, "global_step": 104708, "epoch": 2493} {"train_loss": -6.431388854980469, "global_step": 104709, "epoch": 2493} {"train_loss": -6.343279838562012, "global_step": 104710, "epoch": 2493} {"train_loss": -6.438819885253906, "global_step": 104711, "epoch": 2493} {"train_loss": -6.389429092407227, "global_step": 104712, "epoch": 2493} {"train_loss": -6.315823554992676, "global_step": 104713, "epoch": 2493} {"train_loss": -6.439583778381348, "global_step": 104714, "epoch": 2493} {"train_loss": -6.228997230529785, "global_step": 104715, "epoch": 2493} {"train_loss": -6.468595027923584, "global_step": 104716, "epoch": 2493} {"train_loss": -6.400909900665283, "global_step": 104717, "epoch": 2493} {"train_loss": -6.502265930175781, "global_step": 104718, "epoch": 2493} {"train_loss": -6.380168914794922, "global_step": 104719, "epoch": 2493} {"train_loss": -6.39816951751709, "global_step": 104720, "epoch": 2493} {"train_loss": -6.456870079040527, "global_step": 104721, "epoch": 2493} {"train_loss": -6.414760112762451, "global_step": 104722, "epoch": 2493} {"train_loss": -6.367879867553711, "global_step": 104723, "epoch": 2493} {"train_loss": -6.44462251663208, "global_step": 104724, "epoch": 2493} {"train_loss": -6.477240562438965, "global_step": 104725, "epoch": 2493} {"train_loss": -6.430563926696777, "global_step": 104726, "epoch": 2493} {"train_loss": -6.38893985748291, "global_step": 104727, "epoch": 2493} {"train_loss": -6.467720031738281, "global_step": 104728, "epoch": 2493} {"train_loss": -6.450489044189453, "global_step": 104729, "epoch": 2493} {"train_loss": -6.407174110412598, "global_step": 104730, "epoch": 2493} {"train_loss": -6.372311592102051, "global_step": 104731, "epoch": 2493} {"train_loss": -6.457019805908203, "global_step": 104732, "epoch": 2493} {"train_loss": -6.401596546173096, "global_step": 104733, "epoch": 2493} {"train_loss": -6.369993209838867, "global_step": 104734, "epoch": 2493} {"train_loss": -6.2884392738342285, "global_step": 104735, "epoch": 2493} {"train_loss": -6.364470481872559, "global_step": 104736, "epoch": 2493} {"train_loss": -6.362888336181641, "global_step": 104737, "epoch": 2493} {"train_loss": -6.446284770965576, "global_step": 104738, "epoch": 2493} {"train_loss": -6.4282636642456055, "global_step": 104739, "epoch": 2493} {"train_loss": -6.350054740905762, "global_step": 104740, "epoch": 2493} {"train_loss": -6.438761234283447, "global_step": 104741, "epoch": 2493} {"train_loss": -6.311681270599365, "global_step": 104742, "epoch": 2493} {"train_loss": -6.407539367675781, "global_step": 104743, "epoch": 2493} {"train_loss": -6.295993328094482, "global_step": 104744, "epoch": 2493} {"train_loss": -6.449501991271973, "global_step": 104745, "epoch": 2493} {"train_loss": -6.434264183044434, "global_step": 104746, "epoch": 2493} {"train_loss": -6.399316424415225, "global_step": 104747, "epoch": 2493, "val_loss": 64406.46875} {"train_loss": -6.342212200164795, "global_step": 104748, "epoch": 2494} {"train_loss": -6.329165458679199, "global_step": 104749, "epoch": 2494} {"train_loss": -6.39051628112793, "global_step": 104750, "epoch": 2494} {"train_loss": -6.482342720031738, "global_step": 104751, "epoch": 2494} {"train_loss": -6.311724662780762, "global_step": 104752, "epoch": 2494} {"train_loss": -6.411283493041992, "global_step": 104753, "epoch": 2494} {"train_loss": -6.504667282104492, "global_step": 104754, "epoch": 2494} {"train_loss": -6.307121753692627, "global_step": 104755, "epoch": 2494} {"train_loss": -6.314101219177246, "global_step": 104756, "epoch": 2494} {"train_loss": -6.536341190338135, "global_step": 104757, "epoch": 2494} {"train_loss": -6.4452104568481445, "global_step": 104758, "epoch": 2494} {"train_loss": -6.387650966644287, "global_step": 104759, "epoch": 2494} {"train_loss": -6.362925052642822, "global_step": 104760, "epoch": 2494} {"train_loss": -6.324540138244629, "global_step": 104761, "epoch": 2494} {"train_loss": -6.384426116943359, "global_step": 104762, "epoch": 2494} {"train_loss": -6.391324043273926, "global_step": 104763, "epoch": 2494} {"train_loss": -6.423428535461426, "global_step": 104764, "epoch": 2494} {"train_loss": -6.466573715209961, "global_step": 104765, "epoch": 2494} {"train_loss": -6.353081703186035, "global_step": 104766, "epoch": 2494} {"train_loss": -6.415970325469971, "global_step": 104767, "epoch": 2494} {"train_loss": -6.489814758300781, "global_step": 104768, "epoch": 2494} {"train_loss": -6.42183256149292, "global_step": 104769, "epoch": 2494} {"train_loss": -6.369508743286133, "global_step": 104770, "epoch": 2494} {"train_loss": -6.483757019042969, "global_step": 104771, "epoch": 2494} {"train_loss": -6.452021598815918, "global_step": 104772, "epoch": 2494} {"train_loss": -6.449689865112305, "global_step": 104773, "epoch": 2494} {"train_loss": -6.556312084197998, "global_step": 104774, "epoch": 2494} {"train_loss": -6.461450099945068, "global_step": 104775, "epoch": 2494} {"train_loss": -6.524324417114258, "global_step": 104776, "epoch": 2494} {"train_loss": -6.4653120040893555, "global_step": 104777, "epoch": 2494} {"train_loss": -6.48052453994751, "global_step": 104778, "epoch": 2494} {"train_loss": -6.472180366516113, "global_step": 104779, "epoch": 2494} {"train_loss": -6.459237575531006, "global_step": 104780, "epoch": 2494} {"train_loss": -6.4862446784973145, "global_step": 104781, "epoch": 2494} {"train_loss": -6.4824323654174805, "global_step": 104782, "epoch": 2494} {"train_loss": -6.368454933166504, "global_step": 104783, "epoch": 2494} {"train_loss": -6.459888935089111, "global_step": 104784, "epoch": 2494} {"train_loss": -6.4593610763549805, "global_step": 104785, "epoch": 2494} {"train_loss": -6.367304801940918, "global_step": 104786, "epoch": 2494} {"train_loss": -6.379238128662109, "global_step": 104787, "epoch": 2494} {"train_loss": -6.312480926513672, "global_step": 104788, "epoch": 2494} {"train_loss": -6.424382573082333, "global_step": 104789, "epoch": 2494, "val_loss": 64319.12109375} {"train_loss": -6.542352676391602, "global_step": 104790, "epoch": 2495} {"train_loss": -6.491297245025635, "global_step": 104791, "epoch": 2495} {"train_loss": -6.460931301116943, "global_step": 104792, "epoch": 2495} {"train_loss": -6.409980773925781, "global_step": 104793, "epoch": 2495} {"train_loss": -6.446333885192871, "global_step": 104794, "epoch": 2495} {"train_loss": -6.451681137084961, "global_step": 104795, "epoch": 2495} {"train_loss": -6.430948257446289, "global_step": 104796, "epoch": 2495} {"train_loss": -6.438408851623535, "global_step": 104797, "epoch": 2495} {"train_loss": -6.342887878417969, "global_step": 104798, "epoch": 2495} {"train_loss": -6.555102348327637, "global_step": 104799, "epoch": 2495} {"train_loss": -6.358180046081543, "global_step": 104800, "epoch": 2495} {"train_loss": -6.424476623535156, "global_step": 104801, "epoch": 2495} {"train_loss": -6.479985237121582, "global_step": 104802, "epoch": 2495} {"train_loss": -6.4150872230529785, "global_step": 104803, "epoch": 2495} {"train_loss": -6.466930389404297, "global_step": 104804, "epoch": 2495} {"train_loss": -6.34112548828125, "global_step": 104805, "epoch": 2495} {"train_loss": -6.342516899108887, "global_step": 104806, "epoch": 2495} {"train_loss": -6.513444423675537, "global_step": 104807, "epoch": 2495} {"train_loss": -6.305197238922119, "global_step": 104808, "epoch": 2495} {"train_loss": -6.4633073806762695, "global_step": 104809, "epoch": 2495} {"train_loss": -6.499148368835449, "global_step": 104810, "epoch": 2495} {"train_loss": -6.479866981506348, "global_step": 104811, "epoch": 2495} {"train_loss": -6.430419445037842, "global_step": 104812, "epoch": 2495} {"train_loss": -6.445516109466553, "global_step": 104813, "epoch": 2495} {"train_loss": -6.528354644775391, "global_step": 104814, "epoch": 2495} {"train_loss": -6.407777786254883, "global_step": 104815, "epoch": 2495} {"train_loss": -6.458355903625488, "global_step": 104816, "epoch": 2495} {"train_loss": -6.382089614868164, "global_step": 104817, "epoch": 2495} {"train_loss": -6.486665725708008, "global_step": 104818, "epoch": 2495} {"train_loss": -6.595628261566162, "global_step": 104819, "epoch": 2495} {"train_loss": -6.37751579284668, "global_step": 104820, "epoch": 2495} {"train_loss": -6.421415328979492, "global_step": 104821, "epoch": 2495} {"train_loss": -6.5372748374938965, "global_step": 104822, "epoch": 2495} {"train_loss": -6.436184883117676, "global_step": 104823, "epoch": 2495} {"train_loss": -6.491957187652588, "global_step": 104824, "epoch": 2495} {"train_loss": -6.426676273345947, "global_step": 104825, "epoch": 2495} {"train_loss": -6.411961078643799, "global_step": 104826, "epoch": 2495} {"train_loss": -6.4240217208862305, "global_step": 104827, "epoch": 2495} {"train_loss": -6.333089828491211, "global_step": 104828, "epoch": 2495} {"train_loss": -6.40794563293457, "global_step": 104829, "epoch": 2495} {"train_loss": -6.413338661193848, "global_step": 104830, "epoch": 2495} {"train_loss": -6.435885134197417, "global_step": 104831, "epoch": 2495, "val_loss": 64510.390625} {"train_loss": -6.502806663513184, "global_step": 104832, "epoch": 2496} {"train_loss": -6.467463970184326, "global_step": 104833, "epoch": 2496} {"train_loss": -6.261541366577148, "global_step": 104834, "epoch": 2496} {"train_loss": -6.386140823364258, "global_step": 104835, "epoch": 2496} {"train_loss": -6.280528545379639, "global_step": 104836, "epoch": 2496} {"train_loss": -6.511873722076416, "global_step": 104837, "epoch": 2496} {"train_loss": -6.543615341186523, "global_step": 104838, "epoch": 2496} {"train_loss": -6.356550216674805, "global_step": 104839, "epoch": 2496} {"train_loss": -6.480236053466797, "global_step": 104840, "epoch": 2496} {"train_loss": -6.34266471862793, "global_step": 104841, "epoch": 2496} {"train_loss": -6.484571933746338, "global_step": 104842, "epoch": 2496} {"train_loss": -6.4296417236328125, "global_step": 104843, "epoch": 2496} {"train_loss": -6.388434410095215, "global_step": 104844, "epoch": 2496} {"train_loss": -6.422313213348389, "global_step": 104845, "epoch": 2496} {"train_loss": -6.485644340515137, "global_step": 104846, "epoch": 2496} {"train_loss": -6.440675735473633, "global_step": 104847, "epoch": 2496} {"train_loss": -6.523158073425293, "global_step": 104848, "epoch": 2496} {"train_loss": -6.476780414581299, "global_step": 104849, "epoch": 2496} {"train_loss": -6.592355728149414, "global_step": 104850, "epoch": 2496} {"train_loss": -6.416726112365723, "global_step": 104851, "epoch": 2496} {"train_loss": -6.426220417022705, "global_step": 104852, "epoch": 2496} {"train_loss": -6.470804691314697, "global_step": 104853, "epoch": 2496} {"train_loss": -6.407268524169922, "global_step": 104854, "epoch": 2496} {"train_loss": -6.421335220336914, "global_step": 104855, "epoch": 2496} {"train_loss": -6.376967430114746, "global_step": 104856, "epoch": 2496} {"train_loss": -6.417563438415527, "global_step": 104857, "epoch": 2496} {"train_loss": -6.399517059326172, "global_step": 104858, "epoch": 2496} {"train_loss": -6.5558247566223145, "global_step": 104859, "epoch": 2496} {"train_loss": -6.4168806076049805, "global_step": 104860, "epoch": 2496} {"train_loss": -6.400421619415283, "global_step": 104861, "epoch": 2496} {"train_loss": -6.450366973876953, "global_step": 104862, "epoch": 2496} {"train_loss": -6.439714431762695, "global_step": 104863, "epoch": 2496} {"train_loss": -6.384312629699707, "global_step": 104864, "epoch": 2496} {"train_loss": -6.357306957244873, "global_step": 104865, "epoch": 2496} {"train_loss": -6.430896759033203, "global_step": 104866, "epoch": 2496} {"train_loss": -6.439407825469971, "global_step": 104867, "epoch": 2496} {"train_loss": -6.355851173400879, "global_step": 104868, "epoch": 2496} {"train_loss": -6.39922571182251, "global_step": 104869, "epoch": 2496} {"train_loss": -6.419174671173096, "global_step": 104870, "epoch": 2496} {"train_loss": -6.470633506774902, "global_step": 104871, "epoch": 2496} {"train_loss": -6.448639869689941, "global_step": 104872, "epoch": 2496} {"train_loss": -6.431397222337269, "global_step": 104873, "epoch": 2496, "val_loss": 64376.00390625} {"train_loss": -6.45864200592041, "global_step": 104874, "epoch": 2497} {"train_loss": -6.470328330993652, "global_step": 104875, "epoch": 2497} {"train_loss": -6.503557205200195, "global_step": 104876, "epoch": 2497} {"train_loss": -6.516115665435791, "global_step": 104877, "epoch": 2497} {"train_loss": -6.424637317657471, "global_step": 104878, "epoch": 2497} {"train_loss": -6.474998474121094, "global_step": 104879, "epoch": 2497} {"train_loss": -6.446368217468262, "global_step": 104880, "epoch": 2497} {"train_loss": -6.418856620788574, "global_step": 104881, "epoch": 2497} {"train_loss": -6.5313920974731445, "global_step": 104882, "epoch": 2497} {"train_loss": -6.333738803863525, "global_step": 104883, "epoch": 2497} {"train_loss": -6.465109825134277, "global_step": 104884, "epoch": 2497} {"train_loss": -6.359201431274414, "global_step": 104885, "epoch": 2497} {"train_loss": -6.505216598510742, "global_step": 104886, "epoch": 2497} {"train_loss": -6.451329231262207, "global_step": 104887, "epoch": 2497} {"train_loss": -6.453264236450195, "global_step": 104888, "epoch": 2497} {"train_loss": -6.429991245269775, "global_step": 104889, "epoch": 2497} {"train_loss": -6.435817718505859, "global_step": 104890, "epoch": 2497} {"train_loss": -6.488329887390137, "global_step": 104891, "epoch": 2497} {"train_loss": -6.451709270477295, "global_step": 104892, "epoch": 2497} {"train_loss": -6.404476165771484, "global_step": 104893, "epoch": 2497} {"train_loss": -6.499481678009033, "global_step": 104894, "epoch": 2497} {"train_loss": -6.405426025390625, "global_step": 104895, "epoch": 2497} {"train_loss": -6.440639019012451, "global_step": 104896, "epoch": 2497} {"train_loss": -6.364583969116211, "global_step": 104897, "epoch": 2497} {"train_loss": -6.427740097045898, "global_step": 104898, "epoch": 2497} {"train_loss": -6.376908302307129, "global_step": 104899, "epoch": 2497} {"train_loss": -6.41644811630249, "global_step": 104900, "epoch": 2497} {"train_loss": -6.579174995422363, "global_step": 104901, "epoch": 2497} {"train_loss": -6.527910232543945, "global_step": 104902, "epoch": 2497} {"train_loss": -6.375271797180176, "global_step": 104903, "epoch": 2497} {"train_loss": -6.407112121582031, "global_step": 104904, "epoch": 2497} {"train_loss": -6.3789381980896, "global_step": 104905, "epoch": 2497} {"train_loss": -6.491373538970947, "global_step": 104906, "epoch": 2497} {"train_loss": -6.455779552459717, "global_step": 104907, "epoch": 2497} {"train_loss": -6.478302955627441, "global_step": 104908, "epoch": 2497} {"train_loss": -6.44066858291626, "global_step": 104909, "epoch": 2497} {"train_loss": -6.40669584274292, "global_step": 104910, "epoch": 2497} {"train_loss": -6.429523468017578, "global_step": 104911, "epoch": 2497} {"train_loss": -6.359508514404297, "global_step": 104912, "epoch": 2497} {"train_loss": -6.400590896606445, "global_step": 104913, "epoch": 2497} {"train_loss": -6.5110602378845215, "global_step": 104914, "epoch": 2497} {"train_loss": -6.446878728412447, "global_step": 104915, "epoch": 2497, "val_loss": 64492.546875} {"train_loss": -6.491336345672607, "global_step": 104916, "epoch": 2498} {"train_loss": -6.366045951843262, "global_step": 104917, "epoch": 2498} {"train_loss": -6.474059581756592, "global_step": 104918, "epoch": 2498} {"train_loss": -6.333126068115234, "global_step": 104919, "epoch": 2498} {"train_loss": -6.436860084533691, "global_step": 104920, "epoch": 2498} {"train_loss": -6.544183731079102, "global_step": 104921, "epoch": 2498} {"train_loss": -6.435964584350586, "global_step": 104922, "epoch": 2498} {"train_loss": -6.372140407562256, "global_step": 104923, "epoch": 2498} {"train_loss": -6.475161075592041, "global_step": 104924, "epoch": 2498} {"train_loss": -6.260594367980957, "global_step": 104925, "epoch": 2498} {"train_loss": -6.383294105529785, "global_step": 104926, "epoch": 2498} {"train_loss": -6.383172035217285, "global_step": 104927, "epoch": 2498} {"train_loss": -6.314138412475586, "global_step": 104928, "epoch": 2498} {"train_loss": -6.5085296630859375, "global_step": 104929, "epoch": 2498} {"train_loss": -6.281889915466309, "global_step": 104930, "epoch": 2498} {"train_loss": -6.437571048736572, "global_step": 104931, "epoch": 2498} {"train_loss": -6.408308982849121, "global_step": 104932, "epoch": 2498} {"train_loss": -6.282100677490234, "global_step": 104933, "epoch": 2498} {"train_loss": -6.504541397094727, "global_step": 104934, "epoch": 2498} {"train_loss": -6.367824554443359, "global_step": 104935, "epoch": 2498} {"train_loss": -6.417287826538086, "global_step": 104936, "epoch": 2498} {"train_loss": -6.451311111450195, "global_step": 104937, "epoch": 2498} {"train_loss": -6.32972526550293, "global_step": 104938, "epoch": 2498} {"train_loss": -6.422529220581055, "global_step": 104939, "epoch": 2498} {"train_loss": -6.3782453536987305, "global_step": 104940, "epoch": 2498} {"train_loss": -6.4127068519592285, "global_step": 104941, "epoch": 2498} {"train_loss": -6.432308197021484, "global_step": 104942, "epoch": 2498} {"train_loss": -6.291444778442383, "global_step": 104943, "epoch": 2498} {"train_loss": -6.501888275146484, "global_step": 104944, "epoch": 2498} {"train_loss": -6.390246391296387, "global_step": 104945, "epoch": 2498} {"train_loss": -6.453022003173828, "global_step": 104946, "epoch": 2498} {"train_loss": -6.390888214111328, "global_step": 104947, "epoch": 2498} {"train_loss": -6.334403991699219, "global_step": 104948, "epoch": 2498} {"train_loss": -6.395318984985352, "global_step": 104949, "epoch": 2498} {"train_loss": -6.47570276260376, "global_step": 104950, "epoch": 2498} {"train_loss": -6.348093032836914, "global_step": 104951, "epoch": 2498} {"train_loss": -6.293241024017334, "global_step": 104952, "epoch": 2498} {"train_loss": -6.367361068725586, "global_step": 104953, "epoch": 2498} {"train_loss": -6.4582672119140625, "global_step": 104954, "epoch": 2498} {"train_loss": -6.56691837310791, "global_step": 104955, "epoch": 2498} {"train_loss": -6.398298263549805, "global_step": 104956, "epoch": 2498} {"train_loss": -6.404187531698318, "global_step": 104957, "epoch": 2498, "val_loss": 64568.234375} {"train_loss": -6.448528289794922, "global_step": 104958, "epoch": 2499} {"train_loss": -6.456277370452881, "global_step": 104959, "epoch": 2499} {"train_loss": -6.405426025390625, "global_step": 104960, "epoch": 2499} {"train_loss": -6.374351501464844, "global_step": 104961, "epoch": 2499} {"train_loss": -6.493847370147705, "global_step": 104962, "epoch": 2499} {"train_loss": -6.296866416931152, "global_step": 104963, "epoch": 2499} {"train_loss": -6.418037414550781, "global_step": 104964, "epoch": 2499} {"train_loss": -6.4350762367248535, "global_step": 104965, "epoch": 2499} {"train_loss": -6.332913398742676, "global_step": 104966, "epoch": 2499} {"train_loss": -6.416719913482666, "global_step": 104967, "epoch": 2499} {"train_loss": -6.459238052368164, "global_step": 104968, "epoch": 2499} {"train_loss": -6.308023929595947, "global_step": 104969, "epoch": 2499} {"train_loss": -6.363354682922363, "global_step": 104970, "epoch": 2499} {"train_loss": -6.448356628417969, "global_step": 104971, "epoch": 2499} {"train_loss": -6.375483989715576, "global_step": 104972, "epoch": 2499} {"train_loss": -6.343987464904785, "global_step": 104973, "epoch": 2499} {"train_loss": -6.334621429443359, "global_step": 104974, "epoch": 2499} {"train_loss": -6.406084060668945, "global_step": 104975, "epoch": 2499} {"train_loss": -6.335475921630859, "global_step": 104976, "epoch": 2499} {"train_loss": -6.391380310058594, "global_step": 104977, "epoch": 2499} {"train_loss": -6.390069961547852, "global_step": 104978, "epoch": 2499} {"train_loss": -6.417006492614746, "global_step": 104979, "epoch": 2499} {"train_loss": -6.327203750610352, "global_step": 104980, "epoch": 2499} {"train_loss": -6.3860039710998535, "global_step": 104981, "epoch": 2499} {"train_loss": -6.456449031829834, "global_step": 104982, "epoch": 2499} {"train_loss": -6.450339317321777, "global_step": 104983, "epoch": 2499} {"train_loss": -6.337784767150879, "global_step": 104984, "epoch": 2499} {"train_loss": -6.4199323654174805, "global_step": 104985, "epoch": 2499} {"train_loss": -6.379757881164551, "global_step": 104986, "epoch": 2499} {"train_loss": -6.294510841369629, "global_step": 104987, "epoch": 2499} {"train_loss": -6.500409126281738, "global_step": 104988, "epoch": 2499} {"train_loss": -6.419081211090088, "global_step": 104989, "epoch": 2499} {"train_loss": -6.477640151977539, "global_step": 104990, "epoch": 2499} {"train_loss": -6.394369125366211, "global_step": 104991, "epoch": 2499} {"train_loss": -6.4868083000183105, "global_step": 104992, "epoch": 2499} {"train_loss": -6.497847080230713, "global_step": 104993, "epoch": 2499} {"train_loss": -6.513936996459961, "global_step": 104994, "epoch": 2499} {"train_loss": -6.434816360473633, "global_step": 104995, "epoch": 2499} {"train_loss": -6.370514869689941, "global_step": 104996, "epoch": 2499} {"train_loss": -6.520252227783203, "global_step": 104997, "epoch": 2499} {"train_loss": -6.446290493011475, "global_step": 104998, "epoch": 2499} {"train_loss": -6.409824870881581, "global_step": 104999, "epoch": 2499, "val_loss": 64393.63671875} {"train_loss": -6.353299140930176, "global_step": 105000, "epoch": 2500} {"train_loss": -6.46268892288208, "global_step": 105001, "epoch": 2500} {"train_loss": -6.513291835784912, "global_step": 105002, "epoch": 2500} {"train_loss": -6.420424461364746, "global_step": 105003, "epoch": 2500} {"train_loss": -6.435966968536377, "global_step": 105004, "epoch": 2500} {"train_loss": -6.514777183532715, "global_step": 105005, "epoch": 2500} {"train_loss": -6.551887512207031, "global_step": 105006, "epoch": 2500} {"train_loss": -6.492435455322266, "global_step": 105007, "epoch": 2500} {"train_loss": -6.336463928222656, "global_step": 105008, "epoch": 2500} {"train_loss": -6.557019233703613, "global_step": 105009, "epoch": 2500} {"train_loss": -6.3929924964904785, "global_step": 105010, "epoch": 2500} {"train_loss": -6.465707302093506, "global_step": 105011, "epoch": 2500} {"train_loss": -6.405444145202637, "global_step": 105012, "epoch": 2500} {"train_loss": -6.423929214477539, "global_step": 105013, "epoch": 2500} {"train_loss": -6.314352035522461, "global_step": 105014, "epoch": 2500} {"train_loss": -6.433378219604492, "global_step": 105015, "epoch": 2500} {"train_loss": -6.521270275115967, "global_step": 105016, "epoch": 2500} {"train_loss": -6.398180961608887, "global_step": 105017, "epoch": 2500} {"train_loss": -6.424449920654297, "global_step": 105018, "epoch": 2500} {"train_loss": -6.563751697540283, "global_step": 105019, "epoch": 2500} {"train_loss": -6.485211372375488, "global_step": 105020, "epoch": 2500} {"train_loss": -6.45577335357666, "global_step": 105021, "epoch": 2500} {"train_loss": -6.559499263763428, "global_step": 105022, "epoch": 2500} {"train_loss": -6.374011993408203, "global_step": 105023, "epoch": 2500} {"train_loss": -6.5005598068237305, "global_step": 105024, "epoch": 2500} {"train_loss": -6.517885208129883, "global_step": 105025, "epoch": 2500} {"train_loss": -6.428930759429932, "global_step": 105026, "epoch": 2500} {"train_loss": -6.536983966827393, "global_step": 105027, "epoch": 2500} {"train_loss": -6.41216516494751, "global_step": 105028, "epoch": 2500} {"train_loss": -6.425068378448486, "global_step": 105029, "epoch": 2500} {"train_loss": -6.401976108551025, "global_step": 105030, "epoch": 2500} {"train_loss": -6.462152481079102, "global_step": 105031, "epoch": 2500} {"train_loss": -6.457576751708984, "global_step": 105032, "epoch": 2500} {"train_loss": -6.439627647399902, "global_step": 105033, "epoch": 2500} {"train_loss": -6.347243309020996, "global_step": 105034, "epoch": 2500} {"train_loss": -6.4336934089660645, "global_step": 105035, "epoch": 2500} {"train_loss": -6.357051372528076, "global_step": 105036, "epoch": 2500} {"train_loss": -6.4947428703308105, "global_step": 105037, "epoch": 2500} {"train_loss": -6.419751167297363, "global_step": 105038, "epoch": 2500} {"train_loss": -6.366264343261719, "global_step": 105039, "epoch": 2500} {"train_loss": -6.362654685974121, "global_step": 105040, "epoch": 2500} {"train_loss": -6.445463600612822, "global_step": 105041, "epoch": 2500, "train/sim_max_reward_0": 0.9270446293427806, "train/sim_max_reward_1": 0.8286763611615577, "train/sim_max_reward_2": 0.9507233649512076, "train/sim_max_reward_3": 0.12837326463869955, "train/sim_max_reward_4": 0.9670554917352957, "train/sim_max_reward_5": 0.7939620468090356, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5739192660856793, "test/sim_max_reward_4300002": 0.8658894310521126, "test/sim_max_reward_4300003": 0.7890788696762641, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8921991983807264, "test/sim_max_reward_4300006": 0.8464728869768314, "test/sim_max_reward_4300007": 0.3129914357330199, "test/sim_max_reward_4300008": 0.8189109429318866, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9191394474942546, "test/sim_max_reward_4300012": 0.8624262651056179, "test/sim_max_reward_4300013": 0.6667042701135352, "test/sim_max_reward_4300014": 0.8385412688613917, "test/sim_max_reward_4300015": 0.970036761831589, "test/sim_max_reward_4300016": 0.1391373186854413, "test/sim_max_reward_4300017": 0.9482414221054868, "test/sim_max_reward_4300018": 0.43985683120822267, "test/sim_max_reward_4300019": 0.18609689689466002, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9805710912207909, "test/sim_max_reward_4300022": 0.9390790485605397, "test/sim_max_reward_4300023": 0.9551791675124275, "test/sim_max_reward_4300024": 0.9081651892656716, "test/sim_max_reward_4300025": 0.8932453876122642, "test/sim_max_reward_4300026": 0.841024288491635, "test/sim_max_reward_4300027": 0.8036681614848017, "test/sim_max_reward_4300028": 0.010368216231651878, "test/sim_max_reward_4300029": 0.4217019129234963, "test/sim_max_reward_4300030": 0.8396851193073052, "test/sim_max_reward_4300031": 0.20909778579984895, "test/sim_max_reward_4300032": 0.8661677307664108, "test/sim_max_reward_4300033": 0.9010288821716493, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.16566042171927603, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8830511757411867, "test/sim_max_reward_4300038": 0.5583696678990017, "test/sim_max_reward_4300039": 0.9796420912780585, "test/sim_max_reward_4300040": 0.869292425009698, "test/sim_max_reward_4300041": 0.9870500370575789, "test/sim_max_reward_4300042": 0.7224871273546764, "test/sim_max_reward_4300043": 0.18602001185721495, "test/sim_max_reward_4300044": 0.9847515630841479, "test/sim_max_reward_4300045": 0.17831054915096228, "test/sim_max_reward_4300046": 0.9544516345708939, "test/sim_max_reward_4300047": 0.9572099360229834, "test/sim_max_reward_4300048": 0.0014947158102293532, "test/sim_max_reward_4300049": 0.25833978796887325, "train/mean_score": 0.7659725264397629, "test/mean_score": 0.6107956771876552, "val_loss": 64560.33203125} {"train_loss": -6.496939659118652, "global_step": 105042, "epoch": 2501} {"train_loss": -6.499393939971924, "global_step": 105043, "epoch": 2501} {"train_loss": -6.419687271118164, "global_step": 105044, "epoch": 2501} {"train_loss": -6.484280109405518, "global_step": 105045, "epoch": 2501} {"train_loss": -6.373312950134277, "global_step": 105046, "epoch": 2501} {"train_loss": -6.571981430053711, "global_step": 105047, "epoch": 2501} {"train_loss": -6.4058122634887695, "global_step": 105048, "epoch": 2501} {"train_loss": -6.3976030349731445, "global_step": 105049, "epoch": 2501} {"train_loss": -6.485062599182129, "global_step": 105050, "epoch": 2501} {"train_loss": -6.280113697052002, "global_step": 105051, "epoch": 2501} {"train_loss": -6.484733581542969, "global_step": 105052, "epoch": 2501} {"train_loss": -6.360453128814697, "global_step": 105053, "epoch": 2501} {"train_loss": -6.225313186645508, "global_step": 105054, "epoch": 2501} {"train_loss": -6.332803249359131, "global_step": 105055, "epoch": 2501} {"train_loss": -6.263216972351074, "global_step": 105056, "epoch": 2501} {"train_loss": -6.393950462341309, "global_step": 105057, "epoch": 2501} {"train_loss": -6.271856307983398, "global_step": 105058, "epoch": 2501} {"train_loss": -6.336088180541992, "global_step": 105059, "epoch": 2501} {"train_loss": -6.424831867218018, "global_step": 105060, "epoch": 2501} {"train_loss": -6.183535099029541, "global_step": 105061, "epoch": 2501} {"train_loss": -6.419360160827637, "global_step": 105062, "epoch": 2501} {"train_loss": -6.345478057861328, "global_step": 105063, "epoch": 2501} {"train_loss": -6.562893867492676, "global_step": 105064, "epoch": 2501} {"train_loss": -6.378368377685547, "global_step": 105065, "epoch": 2501} {"train_loss": -6.434221267700195, "global_step": 105066, "epoch": 2501} {"train_loss": -6.442678928375244, "global_step": 105067, "epoch": 2501} {"train_loss": -6.380135536193848, "global_step": 105068, "epoch": 2501} {"train_loss": -6.419314861297607, "global_step": 105069, "epoch": 2501} {"train_loss": -6.32003116607666, "global_step": 105070, "epoch": 2501} {"train_loss": -6.354296684265137, "global_step": 105071, "epoch": 2501} {"train_loss": -6.377925872802734, "global_step": 105072, "epoch": 2501} {"train_loss": -6.2553534507751465, "global_step": 105073, "epoch": 2501} {"train_loss": -6.426840782165527, "global_step": 105074, "epoch": 2501} {"train_loss": -6.347588062286377, "global_step": 105075, "epoch": 2501} {"train_loss": -6.416651725769043, "global_step": 105076, "epoch": 2501} {"train_loss": -6.384866237640381, "global_step": 105077, "epoch": 2501} {"train_loss": -6.41347599029541, "global_step": 105078, "epoch": 2501} {"train_loss": -6.36379337310791, "global_step": 105079, "epoch": 2501} {"train_loss": -6.1920976638793945, "global_step": 105080, "epoch": 2501} {"train_loss": -6.565208435058594, "global_step": 105081, "epoch": 2501} {"train_loss": -6.38652229309082, "global_step": 105082, "epoch": 2501} {"train_loss": -6.3885044029780795, "global_step": 105083, "epoch": 2501, "val_loss": 64451.90625} {"train_loss": -6.5079665184021, "global_step": 105084, "epoch": 2502} {"train_loss": -6.394020080566406, "global_step": 105085, "epoch": 2502} {"train_loss": -6.376328468322754, "global_step": 105086, "epoch": 2502} {"train_loss": -6.313258171081543, "global_step": 105087, "epoch": 2502} {"train_loss": -6.417396068572998, "global_step": 105088, "epoch": 2502} {"train_loss": -6.408141613006592, "global_step": 105089, "epoch": 2502} {"train_loss": -6.356572151184082, "global_step": 105090, "epoch": 2502} {"train_loss": -6.469599723815918, "global_step": 105091, "epoch": 2502} {"train_loss": -6.437527179718018, "global_step": 105092, "epoch": 2502} {"train_loss": -6.450928688049316, "global_step": 105093, "epoch": 2502} {"train_loss": -6.446722030639648, "global_step": 105094, "epoch": 2502} {"train_loss": -6.238591194152832, "global_step": 105095, "epoch": 2502} {"train_loss": -6.380181789398193, "global_step": 105096, "epoch": 2502} {"train_loss": -6.340500831604004, "global_step": 105097, "epoch": 2502} {"train_loss": -6.411563873291016, "global_step": 105098, "epoch": 2502} {"train_loss": -6.440179347991943, "global_step": 105099, "epoch": 2502} {"train_loss": -6.445937156677246, "global_step": 105100, "epoch": 2502} {"train_loss": -6.523344993591309, "global_step": 105101, "epoch": 2502} {"train_loss": -6.471747398376465, "global_step": 105102, "epoch": 2502} {"train_loss": -6.525866985321045, "global_step": 105103, "epoch": 2502} {"train_loss": -6.400785446166992, "global_step": 105104, "epoch": 2502} {"train_loss": -6.482316970825195, "global_step": 105105, "epoch": 2502} {"train_loss": -6.417392730712891, "global_step": 105106, "epoch": 2502} {"train_loss": -6.457648277282715, "global_step": 105107, "epoch": 2502} {"train_loss": -6.3871073722839355, "global_step": 105108, "epoch": 2502} {"train_loss": -6.418089389801025, "global_step": 105109, "epoch": 2502} {"train_loss": -6.4741973876953125, "global_step": 105110, "epoch": 2502} {"train_loss": -6.547889232635498, "global_step": 105111, "epoch": 2502} {"train_loss": -6.559320449829102, "global_step": 105112, "epoch": 2502} {"train_loss": -6.408503532409668, "global_step": 105113, "epoch": 2502} {"train_loss": -6.458954811096191, "global_step": 105114, "epoch": 2502} {"train_loss": -6.409637451171875, "global_step": 105115, "epoch": 2502} {"train_loss": -6.403824806213379, "global_step": 105116, "epoch": 2502} {"train_loss": -6.455382823944092, "global_step": 105117, "epoch": 2502} {"train_loss": -6.503523826599121, "global_step": 105118, "epoch": 2502} {"train_loss": -6.177053451538086, "global_step": 105119, "epoch": 2502} {"train_loss": -6.28169059753418, "global_step": 105120, "epoch": 2502} {"train_loss": -6.33908748626709, "global_step": 105121, "epoch": 2502} {"train_loss": -6.239066123962402, "global_step": 105122, "epoch": 2502} {"train_loss": -6.323240280151367, "global_step": 105123, "epoch": 2502} {"train_loss": -6.300332069396973, "global_step": 105124, "epoch": 2502} {"train_loss": -6.406959579104469, "global_step": 105125, "epoch": 2502, "val_loss": 64407.6875} {"train_loss": -6.414695739746094, "global_step": 105126, "epoch": 2503} {"train_loss": -6.308119773864746, "global_step": 105127, "epoch": 2503} {"train_loss": -6.249838829040527, "global_step": 105128, "epoch": 2503} {"train_loss": -6.352145671844482, "global_step": 105129, "epoch": 2503} {"train_loss": -6.391903877258301, "global_step": 105130, "epoch": 2503} {"train_loss": -6.347251892089844, "global_step": 105131, "epoch": 2503} {"train_loss": -6.366920471191406, "global_step": 105132, "epoch": 2503} {"train_loss": -6.540297985076904, "global_step": 105133, "epoch": 2503} {"train_loss": -6.42970609664917, "global_step": 105134, "epoch": 2503} {"train_loss": -6.402839660644531, "global_step": 105135, "epoch": 2503} {"train_loss": -6.453680038452148, "global_step": 105136, "epoch": 2503} {"train_loss": -6.44660758972168, "global_step": 105137, "epoch": 2503} {"train_loss": -6.406881809234619, "global_step": 105138, "epoch": 2503} {"train_loss": -6.3952484130859375, "global_step": 105139, "epoch": 2503} {"train_loss": -6.578788757324219, "global_step": 105140, "epoch": 2503} {"train_loss": -6.378890037536621, "global_step": 105141, "epoch": 2503} {"train_loss": -6.39414119720459, "global_step": 105142, "epoch": 2503} {"train_loss": -6.515634536743164, "global_step": 105143, "epoch": 2503} {"train_loss": -6.42972469329834, "global_step": 105144, "epoch": 2503} {"train_loss": -6.443432807922363, "global_step": 105145, "epoch": 2503} {"train_loss": -6.436481952667236, "global_step": 105146, "epoch": 2503} {"train_loss": -6.443631172180176, "global_step": 105147, "epoch": 2503} {"train_loss": -6.546034812927246, "global_step": 105148, "epoch": 2503} {"train_loss": -6.396882057189941, "global_step": 105149, "epoch": 2503} {"train_loss": -6.568841934204102, "global_step": 105150, "epoch": 2503} {"train_loss": -6.463295936584473, "global_step": 105151, "epoch": 2503} {"train_loss": -6.437016487121582, "global_step": 105152, "epoch": 2503} {"train_loss": -6.392494201660156, "global_step": 105153, "epoch": 2503} {"train_loss": -6.399975776672363, "global_step": 105154, "epoch": 2503} {"train_loss": -6.581155776977539, "global_step": 105155, "epoch": 2503} {"train_loss": -6.299901485443115, "global_step": 105156, "epoch": 2503} {"train_loss": -6.3659257888793945, "global_step": 105157, "epoch": 2503} {"train_loss": -6.503155708312988, "global_step": 105158, "epoch": 2503} {"train_loss": -6.357273101806641, "global_step": 105159, "epoch": 2503} {"train_loss": -6.3784990310668945, "global_step": 105160, "epoch": 2503} {"train_loss": -6.4290995597839355, "global_step": 105161, "epoch": 2503} {"train_loss": -6.2428741455078125, "global_step": 105162, "epoch": 2503} {"train_loss": -6.360706329345703, "global_step": 105163, "epoch": 2503} {"train_loss": -6.527606010437012, "global_step": 105164, "epoch": 2503} {"train_loss": -6.289131164550781, "global_step": 105165, "epoch": 2503} {"train_loss": -6.362017631530762, "global_step": 105166, "epoch": 2503} {"train_loss": -6.4145106588091165, "global_step": 105167, "epoch": 2503, "val_loss": 64648.24609375} {"train_loss": -6.45733642578125, "global_step": 105168, "epoch": 2504} {"train_loss": -6.380273818969727, "global_step": 105169, "epoch": 2504} {"train_loss": -6.495495796203613, "global_step": 105170, "epoch": 2504} {"train_loss": -6.47570276260376, "global_step": 105171, "epoch": 2504} {"train_loss": -6.349382400512695, "global_step": 105172, "epoch": 2504} {"train_loss": -6.449103355407715, "global_step": 105173, "epoch": 2504} {"train_loss": -6.488081932067871, "global_step": 105174, "epoch": 2504} {"train_loss": -6.52882194519043, "global_step": 105175, "epoch": 2504} {"train_loss": -6.453003406524658, "global_step": 105176, "epoch": 2504} {"train_loss": -6.423757553100586, "global_step": 105177, "epoch": 2504} {"train_loss": -6.441352367401123, "global_step": 105178, "epoch": 2504} {"train_loss": -6.393477916717529, "global_step": 105179, "epoch": 2504} {"train_loss": -6.505581378936768, "global_step": 105180, "epoch": 2504} {"train_loss": -6.383423805236816, "global_step": 105181, "epoch": 2504} {"train_loss": -6.444897651672363, "global_step": 105182, "epoch": 2504} {"train_loss": -6.477959632873535, "global_step": 105183, "epoch": 2504} {"train_loss": -6.41653299331665, "global_step": 105184, "epoch": 2504} {"train_loss": -6.444136619567871, "global_step": 105185, "epoch": 2504} {"train_loss": -6.355711936950684, "global_step": 105186, "epoch": 2504} {"train_loss": -6.415511131286621, "global_step": 105187, "epoch": 2504} {"train_loss": -6.524350643157959, "global_step": 105188, "epoch": 2504} {"train_loss": -6.409507751464844, "global_step": 105189, "epoch": 2504} {"train_loss": -6.422231674194336, "global_step": 105190, "epoch": 2504} {"train_loss": -6.3564653396606445, "global_step": 105191, "epoch": 2504} {"train_loss": -6.4456987380981445, "global_step": 105192, "epoch": 2504} {"train_loss": -6.454470634460449, "global_step": 105193, "epoch": 2504} {"train_loss": -6.431612968444824, "global_step": 105194, "epoch": 2504} {"train_loss": -6.419337272644043, "global_step": 105195, "epoch": 2504} {"train_loss": -6.468596458435059, "global_step": 105196, "epoch": 2504} {"train_loss": -6.3824896812438965, "global_step": 105197, "epoch": 2504} {"train_loss": -6.5412187576293945, "global_step": 105198, "epoch": 2504} {"train_loss": -6.44760799407959, "global_step": 105199, "epoch": 2504} {"train_loss": -6.368326663970947, "global_step": 105200, "epoch": 2504} {"train_loss": -6.342336177825928, "global_step": 105201, "epoch": 2504} {"train_loss": -6.379140853881836, "global_step": 105202, "epoch": 2504} {"train_loss": -6.449530124664307, "global_step": 105203, "epoch": 2504} {"train_loss": -6.445729732513428, "global_step": 105204, "epoch": 2504} {"train_loss": -6.353701591491699, "global_step": 105205, "epoch": 2504} {"train_loss": -6.422922134399414, "global_step": 105206, "epoch": 2504} {"train_loss": -6.563838005065918, "global_step": 105207, "epoch": 2504} {"train_loss": -6.425711154937744, "global_step": 105208, "epoch": 2504} {"train_loss": -6.435126361392793, "global_step": 105209, "epoch": 2504, "val_loss": 64533.9140625} {"train_loss": -6.4656901359558105, "global_step": 105210, "epoch": 2505} {"train_loss": -6.530848503112793, "global_step": 105211, "epoch": 2505} {"train_loss": -6.400642395019531, "global_step": 105212, "epoch": 2505} {"train_loss": -6.453934669494629, "global_step": 105213, "epoch": 2505} {"train_loss": -6.379532337188721, "global_step": 105214, "epoch": 2505} {"train_loss": -6.395292282104492, "global_step": 105215, "epoch": 2505} {"train_loss": -6.394847393035889, "global_step": 105216, "epoch": 2505} {"train_loss": -6.459908485412598, "global_step": 105217, "epoch": 2505} {"train_loss": -6.447244167327881, "global_step": 105218, "epoch": 2505} {"train_loss": -6.489263534545898, "global_step": 105219, "epoch": 2505} {"train_loss": -6.342258930206299, "global_step": 105220, "epoch": 2505} {"train_loss": -6.414030075073242, "global_step": 105221, "epoch": 2505} {"train_loss": -6.323410987854004, "global_step": 105222, "epoch": 2505} {"train_loss": -6.423105239868164, "global_step": 105223, "epoch": 2505} {"train_loss": -6.4280853271484375, "global_step": 105224, "epoch": 2505} {"train_loss": -6.388706684112549, "global_step": 105225, "epoch": 2505} {"train_loss": -6.44782829284668, "global_step": 105226, "epoch": 2505} {"train_loss": -6.3944854736328125, "global_step": 105227, "epoch": 2505} {"train_loss": -6.483647346496582, "global_step": 105228, "epoch": 2505} {"train_loss": -6.419771194458008, "global_step": 105229, "epoch": 2505} {"train_loss": -6.414036750793457, "global_step": 105230, "epoch": 2505} {"train_loss": -6.3141679763793945, "global_step": 105231, "epoch": 2505} {"train_loss": -6.452180862426758, "global_step": 105232, "epoch": 2505} {"train_loss": -6.211153984069824, "global_step": 105233, "epoch": 2505} {"train_loss": -6.393387317657471, "global_step": 105234, "epoch": 2505} {"train_loss": -6.4253621101379395, "global_step": 105235, "epoch": 2505} {"train_loss": -6.425048828125, "global_step": 105236, "epoch": 2505} {"train_loss": -6.354368209838867, "global_step": 105237, "epoch": 2505} {"train_loss": -6.412193298339844, "global_step": 105238, "epoch": 2505} {"train_loss": -6.369007587432861, "global_step": 105239, "epoch": 2505} {"train_loss": -6.4170989990234375, "global_step": 105240, "epoch": 2505} {"train_loss": -6.430832386016846, "global_step": 105241, "epoch": 2505} {"train_loss": -6.465446949005127, "global_step": 105242, "epoch": 2505} {"train_loss": -6.388748645782471, "global_step": 105243, "epoch": 2505} {"train_loss": -6.435758113861084, "global_step": 105244, "epoch": 2505} {"train_loss": -6.272387504577637, "global_step": 105245, "epoch": 2505} {"train_loss": -6.401879787445068, "global_step": 105246, "epoch": 2505} {"train_loss": -6.296006202697754, "global_step": 105247, "epoch": 2505} {"train_loss": -6.3461503982543945, "global_step": 105248, "epoch": 2505} {"train_loss": -6.3933610916137695, "global_step": 105249, "epoch": 2505} {"train_loss": -6.526874542236328, "global_step": 105250, "epoch": 2505} {"train_loss": -6.405709981918335, "global_step": 105251, "epoch": 2505, "val_loss": 64472.2109375} {"train_loss": -6.491628646850586, "global_step": 105252, "epoch": 2506} {"train_loss": -6.35534143447876, "global_step": 105253, "epoch": 2506} {"train_loss": -6.377063274383545, "global_step": 105254, "epoch": 2506} {"train_loss": -6.460575103759766, "global_step": 105255, "epoch": 2506} {"train_loss": -6.3675336837768555, "global_step": 105256, "epoch": 2506} {"train_loss": -6.383139610290527, "global_step": 105257, "epoch": 2506} {"train_loss": -6.474915504455566, "global_step": 105258, "epoch": 2506} {"train_loss": -6.463666915893555, "global_step": 105259, "epoch": 2506} {"train_loss": -6.423398971557617, "global_step": 105260, "epoch": 2506} {"train_loss": -6.3871660232543945, "global_step": 105261, "epoch": 2506} {"train_loss": -6.4755754470825195, "global_step": 105262, "epoch": 2506} {"train_loss": -6.382218360900879, "global_step": 105263, "epoch": 2506} {"train_loss": -6.495898246765137, "global_step": 105264, "epoch": 2506} {"train_loss": -6.493832588195801, "global_step": 105265, "epoch": 2506} {"train_loss": -6.449710369110107, "global_step": 105266, "epoch": 2506} {"train_loss": -6.529671669006348, "global_step": 105267, "epoch": 2506} {"train_loss": -6.3987135887146, "global_step": 105268, "epoch": 2506} {"train_loss": -6.327444076538086, "global_step": 105269, "epoch": 2506} {"train_loss": -6.460754871368408, "global_step": 105270, "epoch": 2506} {"train_loss": -6.370020866394043, "global_step": 105271, "epoch": 2506} {"train_loss": -6.442167282104492, "global_step": 105272, "epoch": 2506} {"train_loss": -6.5116729736328125, "global_step": 105273, "epoch": 2506} {"train_loss": -6.543543815612793, "global_step": 105274, "epoch": 2506} {"train_loss": -6.289196968078613, "global_step": 105275, "epoch": 2506} {"train_loss": -6.386364459991455, "global_step": 105276, "epoch": 2506} {"train_loss": -6.412573337554932, "global_step": 105277, "epoch": 2506} {"train_loss": -6.417994499206543, "global_step": 105278, "epoch": 2506} {"train_loss": -6.390851974487305, "global_step": 105279, "epoch": 2506} {"train_loss": -6.480653762817383, "global_step": 105280, "epoch": 2506} {"train_loss": -6.369199752807617, "global_step": 105281, "epoch": 2506} {"train_loss": -6.355365753173828, "global_step": 105282, "epoch": 2506} {"train_loss": -6.589846611022949, "global_step": 105283, "epoch": 2506} {"train_loss": -6.253550052642822, "global_step": 105284, "epoch": 2506} {"train_loss": -6.284501075744629, "global_step": 105285, "epoch": 2506} {"train_loss": -6.477608680725098, "global_step": 105286, "epoch": 2506} {"train_loss": -6.3429412841796875, "global_step": 105287, "epoch": 2506} {"train_loss": -6.3633551597595215, "global_step": 105288, "epoch": 2506} {"train_loss": -6.468743324279785, "global_step": 105289, "epoch": 2506} {"train_loss": -6.429013252258301, "global_step": 105290, "epoch": 2506} {"train_loss": -6.484260559082031, "global_step": 105291, "epoch": 2506} {"train_loss": -6.278351306915283, "global_step": 105292, "epoch": 2506} {"train_loss": -6.420030627931867, "global_step": 105293, "epoch": 2506, "val_loss": 64522.37890625} {"train_loss": -6.297119140625, "global_step": 105294, "epoch": 2507} {"train_loss": -6.503856182098389, "global_step": 105295, "epoch": 2507} {"train_loss": -6.397552490234375, "global_step": 105296, "epoch": 2507} {"train_loss": -6.398968696594238, "global_step": 105297, "epoch": 2507} {"train_loss": -6.380145072937012, "global_step": 105298, "epoch": 2507} {"train_loss": -6.5078935623168945, "global_step": 105299, "epoch": 2507} {"train_loss": -6.477091312408447, "global_step": 105300, "epoch": 2507} {"train_loss": -6.387426376342773, "global_step": 105301, "epoch": 2507} {"train_loss": -6.482542991638184, "global_step": 105302, "epoch": 2507} {"train_loss": -6.423708915710449, "global_step": 105303, "epoch": 2507} {"train_loss": -6.403791427612305, "global_step": 105304, "epoch": 2507} {"train_loss": -6.42726993560791, "global_step": 105305, "epoch": 2507} {"train_loss": -6.477317810058594, "global_step": 105306, "epoch": 2507} {"train_loss": -6.46922492980957, "global_step": 105307, "epoch": 2507} {"train_loss": -6.3498992919921875, "global_step": 105308, "epoch": 2507} {"train_loss": -6.451162338256836, "global_step": 105309, "epoch": 2507} {"train_loss": -6.4247727394104, "global_step": 105310, "epoch": 2507} {"train_loss": -6.707289695739746, "global_step": 105311, "epoch": 2507} {"train_loss": -6.445422649383545, "global_step": 105312, "epoch": 2507} {"train_loss": -6.484989166259766, "global_step": 105313, "epoch": 2507} {"train_loss": -6.516306400299072, "global_step": 105314, "epoch": 2507} {"train_loss": -6.474090576171875, "global_step": 105315, "epoch": 2507} {"train_loss": -6.3433427810668945, "global_step": 105316, "epoch": 2507} {"train_loss": -6.518832206726074, "global_step": 105317, "epoch": 2507} {"train_loss": -6.406577110290527, "global_step": 105318, "epoch": 2507} {"train_loss": -6.441514015197754, "global_step": 105319, "epoch": 2507} {"train_loss": -6.491086959838867, "global_step": 105320, "epoch": 2507} {"train_loss": -6.463962078094482, "global_step": 105321, "epoch": 2507} {"train_loss": -6.429035186767578, "global_step": 105322, "epoch": 2507} {"train_loss": -6.424368858337402, "global_step": 105323, "epoch": 2507} {"train_loss": -6.512422561645508, "global_step": 105324, "epoch": 2507} {"train_loss": -6.416499614715576, "global_step": 105325, "epoch": 2507} {"train_loss": -6.476014137268066, "global_step": 105326, "epoch": 2507} {"train_loss": -6.550856590270996, "global_step": 105327, "epoch": 2507} {"train_loss": -6.5289130210876465, "global_step": 105328, "epoch": 2507} {"train_loss": -6.423264026641846, "global_step": 105329, "epoch": 2507} {"train_loss": -6.472240447998047, "global_step": 105330, "epoch": 2507} {"train_loss": -6.485273838043213, "global_step": 105331, "epoch": 2507} {"train_loss": -6.307647705078125, "global_step": 105332, "epoch": 2507} {"train_loss": -6.417794227600098, "global_step": 105333, "epoch": 2507} {"train_loss": -6.446883201599121, "global_step": 105334, "epoch": 2507} {"train_loss": -6.450019711539859, "global_step": 105335, "epoch": 2507, "val_loss": 64751.84375} {"train_loss": -6.362884998321533, "global_step": 105336, "epoch": 2508} {"train_loss": -6.329009056091309, "global_step": 105337, "epoch": 2508} {"train_loss": -6.478604316711426, "global_step": 105338, "epoch": 2508} {"train_loss": -6.453246593475342, "global_step": 105339, "epoch": 2508} {"train_loss": -6.414734840393066, "global_step": 105340, "epoch": 2508} {"train_loss": -6.504327774047852, "global_step": 105341, "epoch": 2508} {"train_loss": -6.67597770690918, "global_step": 105342, "epoch": 2508} {"train_loss": -6.520546913146973, "global_step": 105343, "epoch": 2508} {"train_loss": -6.413763523101807, "global_step": 105344, "epoch": 2508} {"train_loss": -6.452118873596191, "global_step": 105345, "epoch": 2508} {"train_loss": -6.389832019805908, "global_step": 105346, "epoch": 2508} {"train_loss": -6.414498329162598, "global_step": 105347, "epoch": 2508} {"train_loss": -6.416712760925293, "global_step": 105348, "epoch": 2508} {"train_loss": -6.3715715408325195, "global_step": 105349, "epoch": 2508} {"train_loss": -6.339044094085693, "global_step": 105350, "epoch": 2508} {"train_loss": -6.4529619216918945, "global_step": 105351, "epoch": 2508} {"train_loss": -6.482913017272949, "global_step": 105352, "epoch": 2508} {"train_loss": -6.405335426330566, "global_step": 105353, "epoch": 2508} {"train_loss": -6.349054336547852, "global_step": 105354, "epoch": 2508} {"train_loss": -6.388640403747559, "global_step": 105355, "epoch": 2508} {"train_loss": -6.350625038146973, "global_step": 105356, "epoch": 2508} {"train_loss": -6.445009231567383, "global_step": 105357, "epoch": 2508} {"train_loss": -6.447660446166992, "global_step": 105358, "epoch": 2508} {"train_loss": -6.290500164031982, "global_step": 105359, "epoch": 2508} {"train_loss": -6.431191444396973, "global_step": 105360, "epoch": 2508} {"train_loss": -6.488105773925781, "global_step": 105361, "epoch": 2508} {"train_loss": -6.4256391525268555, "global_step": 105362, "epoch": 2508} {"train_loss": -6.455643653869629, "global_step": 105363, "epoch": 2508} {"train_loss": -6.359742164611816, "global_step": 105364, "epoch": 2508} {"train_loss": -6.463162422180176, "global_step": 105365, "epoch": 2508} {"train_loss": -6.4031853675842285, "global_step": 105366, "epoch": 2508} {"train_loss": -6.466901779174805, "global_step": 105367, "epoch": 2508} {"train_loss": -6.34242057800293, "global_step": 105368, "epoch": 2508} {"train_loss": -6.505892753601074, "global_step": 105369, "epoch": 2508} {"train_loss": -6.388239860534668, "global_step": 105370, "epoch": 2508} {"train_loss": -6.403120994567871, "global_step": 105371, "epoch": 2508} {"train_loss": -6.43193244934082, "global_step": 105372, "epoch": 2508} {"train_loss": -6.481667518615723, "global_step": 105373, "epoch": 2508} {"train_loss": -6.5063934326171875, "global_step": 105374, "epoch": 2508} {"train_loss": -6.402332305908203, "global_step": 105375, "epoch": 2508} {"train_loss": -6.411919593811035, "global_step": 105376, "epoch": 2508} {"train_loss": -6.42706096739996, "global_step": 105377, "epoch": 2508, "val_loss": 64571.65625} {"train_loss": -6.414367198944092, "global_step": 105378, "epoch": 2509} {"train_loss": -6.379603385925293, "global_step": 105379, "epoch": 2509} {"train_loss": -6.448606491088867, "global_step": 105380, "epoch": 2509} {"train_loss": -6.401073455810547, "global_step": 105381, "epoch": 2509} {"train_loss": -6.423624038696289, "global_step": 105382, "epoch": 2509} {"train_loss": -6.417978286743164, "global_step": 105383, "epoch": 2509} {"train_loss": -6.408432960510254, "global_step": 105384, "epoch": 2509} {"train_loss": -6.394036293029785, "global_step": 105385, "epoch": 2509} {"train_loss": -6.463175296783447, "global_step": 105386, "epoch": 2509} {"train_loss": -6.496028423309326, "global_step": 105387, "epoch": 2509} {"train_loss": -6.479538917541504, "global_step": 105388, "epoch": 2509} {"train_loss": -6.503933429718018, "global_step": 105389, "epoch": 2509} {"train_loss": -6.473940849304199, "global_step": 105390, "epoch": 2509} {"train_loss": -6.438540458679199, "global_step": 105391, "epoch": 2509} {"train_loss": -6.43532133102417, "global_step": 105392, "epoch": 2509} {"train_loss": -6.478259086608887, "global_step": 105393, "epoch": 2509} {"train_loss": -6.481734752655029, "global_step": 105394, "epoch": 2509} {"train_loss": -6.39658260345459, "global_step": 105395, "epoch": 2509} {"train_loss": -6.476156711578369, "global_step": 105396, "epoch": 2509} {"train_loss": -6.380832195281982, "global_step": 105397, "epoch": 2509} {"train_loss": -6.38349723815918, "global_step": 105398, "epoch": 2509} {"train_loss": -6.3224778175354, "global_step": 105399, "epoch": 2509} {"train_loss": -6.403278350830078, "global_step": 105400, "epoch": 2509} {"train_loss": -6.416516304016113, "global_step": 105401, "epoch": 2509} {"train_loss": -6.336143493652344, "global_step": 105402, "epoch": 2509} {"train_loss": -6.564476013183594, "global_step": 105403, "epoch": 2509} {"train_loss": -6.474147796630859, "global_step": 105404, "epoch": 2509} {"train_loss": -6.400891304016113, "global_step": 105405, "epoch": 2509} {"train_loss": -6.392603874206543, "global_step": 105406, "epoch": 2509} {"train_loss": -6.388225555419922, "global_step": 105407, "epoch": 2509} {"train_loss": -6.424455642700195, "global_step": 105408, "epoch": 2509} {"train_loss": -6.292565822601318, "global_step": 105409, "epoch": 2509} {"train_loss": -6.462629318237305, "global_step": 105410, "epoch": 2509} {"train_loss": -6.463259696960449, "global_step": 105411, "epoch": 2509} {"train_loss": -6.484606742858887, "global_step": 105412, "epoch": 2509} {"train_loss": -6.4750213623046875, "global_step": 105413, "epoch": 2509} {"train_loss": -6.461840629577637, "global_step": 105414, "epoch": 2509} {"train_loss": -6.433365821838379, "global_step": 105415, "epoch": 2509} {"train_loss": -6.46819543838501, "global_step": 105416, "epoch": 2509} {"train_loss": -6.366532802581787, "global_step": 105417, "epoch": 2509} {"train_loss": -6.413318634033203, "global_step": 105418, "epoch": 2509} {"train_loss": -6.4296611831301735, "global_step": 105419, "epoch": 2509, "val_loss": 64615.46875} {"train_loss": -6.441972732543945, "global_step": 105420, "epoch": 2510} {"train_loss": -6.4261474609375, "global_step": 105421, "epoch": 2510} {"train_loss": -6.471958160400391, "global_step": 105422, "epoch": 2510} {"train_loss": -6.486965179443359, "global_step": 105423, "epoch": 2510} {"train_loss": -6.300682067871094, "global_step": 105424, "epoch": 2510} {"train_loss": -6.436498165130615, "global_step": 105425, "epoch": 2510} {"train_loss": -6.495630264282227, "global_step": 105426, "epoch": 2510} {"train_loss": -6.468639373779297, "global_step": 105427, "epoch": 2510} {"train_loss": -6.501153945922852, "global_step": 105428, "epoch": 2510} {"train_loss": -6.398153781890869, "global_step": 105429, "epoch": 2510} {"train_loss": -6.479933738708496, "global_step": 105430, "epoch": 2510} {"train_loss": -6.420355796813965, "global_step": 105431, "epoch": 2510} {"train_loss": -6.380002498626709, "global_step": 105432, "epoch": 2510} {"train_loss": -6.4207072257995605, "global_step": 105433, "epoch": 2510} {"train_loss": -6.490857124328613, "global_step": 105434, "epoch": 2510} {"train_loss": -6.3384857177734375, "global_step": 105435, "epoch": 2510} {"train_loss": -6.330821990966797, "global_step": 105436, "epoch": 2510} {"train_loss": -6.476480484008789, "global_step": 105437, "epoch": 2510} {"train_loss": -6.233077526092529, "global_step": 105438, "epoch": 2510} {"train_loss": -6.358280181884766, "global_step": 105439, "epoch": 2510} {"train_loss": -6.463212490081787, "global_step": 105440, "epoch": 2510} {"train_loss": -6.4113569259643555, "global_step": 105441, "epoch": 2510} {"train_loss": -6.416408538818359, "global_step": 105442, "epoch": 2510} {"train_loss": -6.446678638458252, "global_step": 105443, "epoch": 2510} {"train_loss": -6.470391273498535, "global_step": 105444, "epoch": 2510} {"train_loss": -6.503468990325928, "global_step": 105445, "epoch": 2510} {"train_loss": -6.3293352127075195, "global_step": 105446, "epoch": 2510} {"train_loss": -6.4381103515625, "global_step": 105447, "epoch": 2510} {"train_loss": -6.4616804122924805, "global_step": 105448, "epoch": 2510} {"train_loss": -6.326909065246582, "global_step": 105449, "epoch": 2510} {"train_loss": -6.502385139465332, "global_step": 105450, "epoch": 2510} {"train_loss": -6.3908796310424805, "global_step": 105451, "epoch": 2510} {"train_loss": -6.3414306640625, "global_step": 105452, "epoch": 2510} {"train_loss": -6.455364227294922, "global_step": 105453, "epoch": 2510} {"train_loss": -6.452620506286621, "global_step": 105454, "epoch": 2510} {"train_loss": -6.355058670043945, "global_step": 105455, "epoch": 2510} {"train_loss": -6.464802265167236, "global_step": 105456, "epoch": 2510} {"train_loss": -6.511018753051758, "global_step": 105457, "epoch": 2510} {"train_loss": -6.381436347961426, "global_step": 105458, "epoch": 2510} {"train_loss": -6.394850730895996, "global_step": 105459, "epoch": 2510} {"train_loss": -6.372208595275879, "global_step": 105460, "epoch": 2510} {"train_loss": -6.421967608588083, "global_step": 105461, "epoch": 2510, "val_loss": 64675.76953125} {"train_loss": -6.3697991371154785, "global_step": 105462, "epoch": 2511} {"train_loss": -6.388235092163086, "global_step": 105463, "epoch": 2511} {"train_loss": -6.542693138122559, "global_step": 105464, "epoch": 2511} {"train_loss": -6.425152778625488, "global_step": 105465, "epoch": 2511} {"train_loss": -6.495648384094238, "global_step": 105466, "epoch": 2511} {"train_loss": -6.486265659332275, "global_step": 105467, "epoch": 2511} {"train_loss": -6.4866204261779785, "global_step": 105468, "epoch": 2511} {"train_loss": -6.519460678100586, "global_step": 105469, "epoch": 2511} {"train_loss": -6.563499927520752, "global_step": 105470, "epoch": 2511} {"train_loss": -6.346109867095947, "global_step": 105471, "epoch": 2511} {"train_loss": -6.433398246765137, "global_step": 105472, "epoch": 2511} {"train_loss": -6.444645881652832, "global_step": 105473, "epoch": 2511} {"train_loss": -6.352636814117432, "global_step": 105474, "epoch": 2511} {"train_loss": -6.350246906280518, "global_step": 105475, "epoch": 2511} {"train_loss": -6.353002548217773, "global_step": 105476, "epoch": 2511} {"train_loss": -6.4603166580200195, "global_step": 105477, "epoch": 2511} {"train_loss": -6.429900169372559, "global_step": 105478, "epoch": 2511} {"train_loss": -6.406501293182373, "global_step": 105479, "epoch": 2511} {"train_loss": -6.436644554138184, "global_step": 105480, "epoch": 2511} {"train_loss": -6.45188045501709, "global_step": 105481, "epoch": 2511} {"train_loss": -6.2975897789001465, "global_step": 105482, "epoch": 2511} {"train_loss": -6.379887580871582, "global_step": 105483, "epoch": 2511} {"train_loss": -6.3958740234375, "global_step": 105484, "epoch": 2511} {"train_loss": -6.408819675445557, "global_step": 105485, "epoch": 2511} {"train_loss": -6.457798004150391, "global_step": 105486, "epoch": 2511} {"train_loss": -6.537721633911133, "global_step": 105487, "epoch": 2511} {"train_loss": -6.390205383300781, "global_step": 105488, "epoch": 2511} {"train_loss": -6.371102333068848, "global_step": 105489, "epoch": 2511} {"train_loss": -6.440181732177734, "global_step": 105490, "epoch": 2511} {"train_loss": -6.5225749015808105, "global_step": 105491, "epoch": 2511} {"train_loss": -6.470231533050537, "global_step": 105492, "epoch": 2511} {"train_loss": -6.409389972686768, "global_step": 105493, "epoch": 2511} {"train_loss": -6.4654541015625, "global_step": 105494, "epoch": 2511} {"train_loss": -6.34483528137207, "global_step": 105495, "epoch": 2511} {"train_loss": -6.517325401306152, "global_step": 105496, "epoch": 2511} {"train_loss": -6.363077163696289, "global_step": 105497, "epoch": 2511} {"train_loss": -6.43265962600708, "global_step": 105498, "epoch": 2511} {"train_loss": -6.531789779663086, "global_step": 105499, "epoch": 2511} {"train_loss": -6.395855903625488, "global_step": 105500, "epoch": 2511} {"train_loss": -6.421228408813477, "global_step": 105501, "epoch": 2511} {"train_loss": -6.375441551208496, "global_step": 105502, "epoch": 2511} {"train_loss": -6.431550321124849, "global_step": 105503, "epoch": 2511, "val_loss": 64559.39453125} {"train_loss": -6.511207103729248, "global_step": 105504, "epoch": 2512} {"train_loss": -6.342462539672852, "global_step": 105505, "epoch": 2512} {"train_loss": -6.507232666015625, "global_step": 105506, "epoch": 2512} {"train_loss": -6.433516025543213, "global_step": 105507, "epoch": 2512} {"train_loss": -6.442337989807129, "global_step": 105508, "epoch": 2512} {"train_loss": -6.455676078796387, "global_step": 105509, "epoch": 2512} {"train_loss": -6.429995059967041, "global_step": 105510, "epoch": 2512} {"train_loss": -6.418896675109863, "global_step": 105511, "epoch": 2512} {"train_loss": -6.481288909912109, "global_step": 105512, "epoch": 2512} {"train_loss": -6.423133850097656, "global_step": 105513, "epoch": 2512} {"train_loss": -6.323118209838867, "global_step": 105514, "epoch": 2512} {"train_loss": -6.438579559326172, "global_step": 105515, "epoch": 2512} {"train_loss": -6.520024299621582, "global_step": 105516, "epoch": 2512} {"train_loss": -6.428093433380127, "global_step": 105517, "epoch": 2512} {"train_loss": -6.365528583526611, "global_step": 105518, "epoch": 2512} {"train_loss": -6.372530937194824, "global_step": 105519, "epoch": 2512} {"train_loss": -6.409701824188232, "global_step": 105520, "epoch": 2512} {"train_loss": -6.415870666503906, "global_step": 105521, "epoch": 2512} {"train_loss": -6.409829139709473, "global_step": 105522, "epoch": 2512} {"train_loss": -6.399194240570068, "global_step": 105523, "epoch": 2512} {"train_loss": -6.295083045959473, "global_step": 105524, "epoch": 2512} {"train_loss": -6.435379981994629, "global_step": 105525, "epoch": 2512} {"train_loss": -6.427480697631836, "global_step": 105526, "epoch": 2512} {"train_loss": -6.521120071411133, "global_step": 105527, "epoch": 2512} {"train_loss": -6.519570350646973, "global_step": 105528, "epoch": 2512} {"train_loss": -6.405426025390625, "global_step": 105529, "epoch": 2512} {"train_loss": -6.555181503295898, "global_step": 105530, "epoch": 2512} {"train_loss": -6.477303504943848, "global_step": 105531, "epoch": 2512} {"train_loss": -6.436106204986572, "global_step": 105532, "epoch": 2512} {"train_loss": -6.4219160079956055, "global_step": 105533, "epoch": 2512} {"train_loss": -6.4630208015441895, "global_step": 105534, "epoch": 2512} {"train_loss": -6.4058003425598145, "global_step": 105535, "epoch": 2512} {"train_loss": -6.397538185119629, "global_step": 105536, "epoch": 2512} {"train_loss": -6.4832563400268555, "global_step": 105537, "epoch": 2512} {"train_loss": -6.493520259857178, "global_step": 105538, "epoch": 2512} {"train_loss": -6.484958171844482, "global_step": 105539, "epoch": 2512} {"train_loss": -6.397585868835449, "global_step": 105540, "epoch": 2512} {"train_loss": -6.49947452545166, "global_step": 105541, "epoch": 2512} {"train_loss": -6.483880519866943, "global_step": 105542, "epoch": 2512} {"train_loss": -6.429513454437256, "global_step": 105543, "epoch": 2512} {"train_loss": -6.470705986022949, "global_step": 105544, "epoch": 2512} {"train_loss": -6.440695126851399, "global_step": 105545, "epoch": 2512, "val_loss": 64649.54296875} {"train_loss": -6.498682022094727, "global_step": 105546, "epoch": 2513} {"train_loss": -6.506880283355713, "global_step": 105547, "epoch": 2513} {"train_loss": -6.338748931884766, "global_step": 105548, "epoch": 2513} {"train_loss": -6.406696319580078, "global_step": 105549, "epoch": 2513} {"train_loss": -6.424726486206055, "global_step": 105550, "epoch": 2513} {"train_loss": -6.453534126281738, "global_step": 105551, "epoch": 2513} {"train_loss": -6.401819229125977, "global_step": 105552, "epoch": 2513} {"train_loss": -6.539712905883789, "global_step": 105553, "epoch": 2513} {"train_loss": -6.506828308105469, "global_step": 105554, "epoch": 2513} {"train_loss": -6.4312286376953125, "global_step": 105555, "epoch": 2513} {"train_loss": -6.5083489418029785, "global_step": 105556, "epoch": 2513} {"train_loss": -6.490696907043457, "global_step": 105557, "epoch": 2513} {"train_loss": -6.4176130294799805, "global_step": 105558, "epoch": 2513} {"train_loss": -6.3955488204956055, "global_step": 105559, "epoch": 2513} {"train_loss": -6.418830871582031, "global_step": 105560, "epoch": 2513} {"train_loss": -6.520930290222168, "global_step": 105561, "epoch": 2513} {"train_loss": -6.433381080627441, "global_step": 105562, "epoch": 2513} {"train_loss": -6.4711503982543945, "global_step": 105563, "epoch": 2513} {"train_loss": -6.5091753005981445, "global_step": 105564, "epoch": 2513} {"train_loss": -6.400640487670898, "global_step": 105565, "epoch": 2513} {"train_loss": -6.429745197296143, "global_step": 105566, "epoch": 2513} {"train_loss": -6.442256450653076, "global_step": 105567, "epoch": 2513} {"train_loss": -6.549768447875977, "global_step": 105568, "epoch": 2513} {"train_loss": -6.438724517822266, "global_step": 105569, "epoch": 2513} {"train_loss": -6.530941009521484, "global_step": 105570, "epoch": 2513} {"train_loss": -6.523431777954102, "global_step": 105571, "epoch": 2513} {"train_loss": -6.387474060058594, "global_step": 105572, "epoch": 2513} {"train_loss": -6.4882402420043945, "global_step": 105573, "epoch": 2513} {"train_loss": -6.568902015686035, "global_step": 105574, "epoch": 2513} {"train_loss": -6.507913589477539, "global_step": 105575, "epoch": 2513} {"train_loss": -6.364058971405029, "global_step": 105576, "epoch": 2513} {"train_loss": -6.38109016418457, "global_step": 105577, "epoch": 2513} {"train_loss": -6.346526622772217, "global_step": 105578, "epoch": 2513} {"train_loss": -6.449596881866455, "global_step": 105579, "epoch": 2513} {"train_loss": -6.381718635559082, "global_step": 105580, "epoch": 2513} {"train_loss": -6.493941783905029, "global_step": 105581, "epoch": 2513} {"train_loss": -6.350935935974121, "global_step": 105582, "epoch": 2513} {"train_loss": -6.409884929656982, "global_step": 105583, "epoch": 2513} {"train_loss": -6.323276519775391, "global_step": 105584, "epoch": 2513} {"train_loss": -6.431301116943359, "global_step": 105585, "epoch": 2513} {"train_loss": -6.196708679199219, "global_step": 105586, "epoch": 2513} {"train_loss": -6.4372467313494, "global_step": 105587, "epoch": 2513, "val_loss": 64625.0} {"train_loss": -6.3687286376953125, "global_step": 105588, "epoch": 2514} {"train_loss": -6.174953460693359, "global_step": 105589, "epoch": 2514} {"train_loss": -6.388545989990234, "global_step": 105590, "epoch": 2514} {"train_loss": -6.436287879943848, "global_step": 105591, "epoch": 2514} {"train_loss": -6.405217170715332, "global_step": 105592, "epoch": 2514} {"train_loss": -6.512679576873779, "global_step": 105593, "epoch": 2514} {"train_loss": -6.338757514953613, "global_step": 105594, "epoch": 2514} {"train_loss": -6.392985820770264, "global_step": 105595, "epoch": 2514} {"train_loss": -6.386363983154297, "global_step": 105596, "epoch": 2514} {"train_loss": -6.365054607391357, "global_step": 105597, "epoch": 2514} {"train_loss": -6.362873554229736, "global_step": 105598, "epoch": 2514} {"train_loss": -6.47087287902832, "global_step": 105599, "epoch": 2514} {"train_loss": -6.351541996002197, "global_step": 105600, "epoch": 2514} {"train_loss": -6.434967994689941, "global_step": 105601, "epoch": 2514} {"train_loss": -6.332513809204102, "global_step": 105602, "epoch": 2514} {"train_loss": -6.415185928344727, "global_step": 105603, "epoch": 2514} {"train_loss": -6.275006294250488, "global_step": 105604, "epoch": 2514} {"train_loss": -6.3202996253967285, "global_step": 105605, "epoch": 2514} {"train_loss": -6.435453414916992, "global_step": 105606, "epoch": 2514} {"train_loss": -6.401942253112793, "global_step": 105607, "epoch": 2514} {"train_loss": -6.453034400939941, "global_step": 105608, "epoch": 2514} {"train_loss": -6.356237411499023, "global_step": 105609, "epoch": 2514} {"train_loss": -6.4139404296875, "global_step": 105610, "epoch": 2514} {"train_loss": -6.496560096740723, "global_step": 105611, "epoch": 2514} {"train_loss": -6.284106254577637, "global_step": 105612, "epoch": 2514} {"train_loss": -6.482321739196777, "global_step": 105613, "epoch": 2514} {"train_loss": -6.404473304748535, "global_step": 105614, "epoch": 2514} {"train_loss": -6.396019458770752, "global_step": 105615, "epoch": 2514} {"train_loss": -6.408190727233887, "global_step": 105616, "epoch": 2514} {"train_loss": -6.3471879959106445, "global_step": 105617, "epoch": 2514} {"train_loss": -6.4644975662231445, "global_step": 105618, "epoch": 2514} {"train_loss": -6.451155662536621, "global_step": 105619, "epoch": 2514} {"train_loss": -6.455649375915527, "global_step": 105620, "epoch": 2514} {"train_loss": -6.306910991668701, "global_step": 105621, "epoch": 2514} {"train_loss": -6.477545738220215, "global_step": 105622, "epoch": 2514} {"train_loss": -6.324209213256836, "global_step": 105623, "epoch": 2514} {"train_loss": -6.3608293533325195, "global_step": 105624, "epoch": 2514} {"train_loss": -6.4155731201171875, "global_step": 105625, "epoch": 2514} {"train_loss": -6.450061321258545, "global_step": 105626, "epoch": 2514} {"train_loss": -6.46996545791626, "global_step": 105627, "epoch": 2514} {"train_loss": -6.439506530761719, "global_step": 105628, "epoch": 2514} {"train_loss": -6.398428054082961, "global_step": 105629, "epoch": 2514, "val_loss": 64732.8125} {"train_loss": -6.464572906494141, "global_step": 105630, "epoch": 2515} {"train_loss": -6.344198703765869, "global_step": 105631, "epoch": 2515} {"train_loss": -6.425199508666992, "global_step": 105632, "epoch": 2515} {"train_loss": -6.373703956604004, "global_step": 105633, "epoch": 2515} {"train_loss": -6.309715270996094, "global_step": 105634, "epoch": 2515} {"train_loss": -6.4286417961120605, "global_step": 105635, "epoch": 2515} {"train_loss": -6.431163787841797, "global_step": 105636, "epoch": 2515} {"train_loss": -6.395557880401611, "global_step": 105637, "epoch": 2515} {"train_loss": -6.465810775756836, "global_step": 105638, "epoch": 2515} {"train_loss": -6.304535865783691, "global_step": 105639, "epoch": 2515} {"train_loss": -6.336377143859863, "global_step": 105640, "epoch": 2515} {"train_loss": -6.415552139282227, "global_step": 105641, "epoch": 2515} {"train_loss": -6.461426734924316, "global_step": 105642, "epoch": 2515} {"train_loss": -6.359613418579102, "global_step": 105643, "epoch": 2515} {"train_loss": -6.410483360290527, "global_step": 105644, "epoch": 2515} {"train_loss": -6.4337568283081055, "global_step": 105645, "epoch": 2515} {"train_loss": -6.3997273445129395, "global_step": 105646, "epoch": 2515} {"train_loss": -6.340062618255615, "global_step": 105647, "epoch": 2515} {"train_loss": -6.410539150238037, "global_step": 105648, "epoch": 2515} {"train_loss": -6.394610404968262, "global_step": 105649, "epoch": 2515} {"train_loss": -6.409479141235352, "global_step": 105650, "epoch": 2515} {"train_loss": -6.40674352645874, "global_step": 105651, "epoch": 2515} {"train_loss": -6.318912506103516, "global_step": 105652, "epoch": 2515} {"train_loss": -6.435676574707031, "global_step": 105653, "epoch": 2515} {"train_loss": -6.340207099914551, "global_step": 105654, "epoch": 2515} {"train_loss": -6.368527412414551, "global_step": 105655, "epoch": 2515} {"train_loss": -6.392311096191406, "global_step": 105656, "epoch": 2515} {"train_loss": -6.458581447601318, "global_step": 105657, "epoch": 2515} {"train_loss": -6.431671142578125, "global_step": 105658, "epoch": 2515} {"train_loss": -6.38834285736084, "global_step": 105659, "epoch": 2515} {"train_loss": -6.492609977722168, "global_step": 105660, "epoch": 2515} {"train_loss": -6.46637487411499, "global_step": 105661, "epoch": 2515} {"train_loss": -6.493019104003906, "global_step": 105662, "epoch": 2515} {"train_loss": -6.407124042510986, "global_step": 105663, "epoch": 2515} {"train_loss": -6.449034690856934, "global_step": 105664, "epoch": 2515} {"train_loss": -6.544558525085449, "global_step": 105665, "epoch": 2515} {"train_loss": -6.3625922203063965, "global_step": 105666, "epoch": 2515} {"train_loss": -6.462078094482422, "global_step": 105667, "epoch": 2515} {"train_loss": -6.560003280639648, "global_step": 105668, "epoch": 2515} {"train_loss": -6.406700611114502, "global_step": 105669, "epoch": 2515} {"train_loss": -6.461025238037109, "global_step": 105670, "epoch": 2515} {"train_loss": -6.415172236306327, "global_step": 105671, "epoch": 2515, "val_loss": 64616.6875} {"train_loss": -6.482892990112305, "global_step": 105672, "epoch": 2516} {"train_loss": -6.5214457511901855, "global_step": 105673, "epoch": 2516} {"train_loss": -6.5128068923950195, "global_step": 105674, "epoch": 2516} {"train_loss": -6.534335136413574, "global_step": 105675, "epoch": 2516} {"train_loss": -6.486828804016113, "global_step": 105676, "epoch": 2516} {"train_loss": -6.456851959228516, "global_step": 105677, "epoch": 2516} {"train_loss": -6.488824844360352, "global_step": 105678, "epoch": 2516} {"train_loss": -6.548261642456055, "global_step": 105679, "epoch": 2516} {"train_loss": -6.424978256225586, "global_step": 105680, "epoch": 2516} {"train_loss": -6.35914421081543, "global_step": 105681, "epoch": 2516} {"train_loss": -6.533076286315918, "global_step": 105682, "epoch": 2516} {"train_loss": -6.435577392578125, "global_step": 105683, "epoch": 2516} {"train_loss": -6.455674171447754, "global_step": 105684, "epoch": 2516} {"train_loss": -6.531427383422852, "global_step": 105685, "epoch": 2516} {"train_loss": -6.427042007446289, "global_step": 105686, "epoch": 2516} {"train_loss": -6.497478485107422, "global_step": 105687, "epoch": 2516} {"train_loss": -6.392723560333252, "global_step": 105688, "epoch": 2516} {"train_loss": -6.355016708374023, "global_step": 105689, "epoch": 2516} {"train_loss": -6.243816375732422, "global_step": 105690, "epoch": 2516} {"train_loss": -6.439908027648926, "global_step": 105691, "epoch": 2516} {"train_loss": -6.387574195861816, "global_step": 105692, "epoch": 2516} {"train_loss": -6.368289947509766, "global_step": 105693, "epoch": 2516} {"train_loss": -6.515894889831543, "global_step": 105694, "epoch": 2516} {"train_loss": -6.342463970184326, "global_step": 105695, "epoch": 2516} {"train_loss": -6.426652431488037, "global_step": 105696, "epoch": 2516} {"train_loss": -6.36494255065918, "global_step": 105697, "epoch": 2516} {"train_loss": -6.36083459854126, "global_step": 105698, "epoch": 2516} {"train_loss": -6.281065940856934, "global_step": 105699, "epoch": 2516} {"train_loss": -6.365483283996582, "global_step": 105700, "epoch": 2516} {"train_loss": -6.351568698883057, "global_step": 105701, "epoch": 2516} {"train_loss": -6.316340446472168, "global_step": 105702, "epoch": 2516} {"train_loss": -6.4704909324646, "global_step": 105703, "epoch": 2516} {"train_loss": -6.370602607727051, "global_step": 105704, "epoch": 2516} {"train_loss": -6.477638244628906, "global_step": 105705, "epoch": 2516} {"train_loss": -6.376151084899902, "global_step": 105706, "epoch": 2516} {"train_loss": -6.394571304321289, "global_step": 105707, "epoch": 2516} {"train_loss": -6.508522987365723, "global_step": 105708, "epoch": 2516} {"train_loss": -6.47292423248291, "global_step": 105709, "epoch": 2516} {"train_loss": -6.353534698486328, "global_step": 105710, "epoch": 2516} {"train_loss": -6.399570465087891, "global_step": 105711, "epoch": 2516} {"train_loss": -6.5463972091674805, "global_step": 105712, "epoch": 2516} {"train_loss": -6.429174672989618, "global_step": 105713, "epoch": 2516, "val_loss": 64669.87890625} {"train_loss": -6.456655502319336, "global_step": 105714, "epoch": 2517} {"train_loss": -6.4734907150268555, "global_step": 105715, "epoch": 2517} {"train_loss": -6.496551513671875, "global_step": 105716, "epoch": 2517} {"train_loss": -6.3666582107543945, "global_step": 105717, "epoch": 2517} {"train_loss": -6.5526347160339355, "global_step": 105718, "epoch": 2517} {"train_loss": -6.430642604827881, "global_step": 105719, "epoch": 2517} {"train_loss": -6.362523555755615, "global_step": 105720, "epoch": 2517} {"train_loss": -6.449468612670898, "global_step": 105721, "epoch": 2517} {"train_loss": -6.427316188812256, "global_step": 105722, "epoch": 2517} {"train_loss": -6.5311079025268555, "global_step": 105723, "epoch": 2517} {"train_loss": -6.463420391082764, "global_step": 105724, "epoch": 2517} {"train_loss": -6.327031135559082, "global_step": 105725, "epoch": 2517} {"train_loss": -6.336574554443359, "global_step": 105726, "epoch": 2517} {"train_loss": -6.557136058807373, "global_step": 105727, "epoch": 2517} {"train_loss": -6.408254623413086, "global_step": 105728, "epoch": 2517} {"train_loss": -6.487331390380859, "global_step": 105729, "epoch": 2517} {"train_loss": -6.388660430908203, "global_step": 105730, "epoch": 2517} {"train_loss": -6.458078384399414, "global_step": 105731, "epoch": 2517} {"train_loss": -6.515385150909424, "global_step": 105732, "epoch": 2517} {"train_loss": -6.419218063354492, "global_step": 105733, "epoch": 2517} {"train_loss": -6.4560747146606445, "global_step": 105734, "epoch": 2517} {"train_loss": -6.489698886871338, "global_step": 105735, "epoch": 2517} {"train_loss": -6.463232517242432, "global_step": 105736, "epoch": 2517} {"train_loss": -6.502713203430176, "global_step": 105737, "epoch": 2517} {"train_loss": -6.451869010925293, "global_step": 105738, "epoch": 2517} {"train_loss": -6.399819850921631, "global_step": 105739, "epoch": 2517} {"train_loss": -6.410192489624023, "global_step": 105740, "epoch": 2517} {"train_loss": -6.50926399230957, "global_step": 105741, "epoch": 2517} {"train_loss": -6.523967266082764, "global_step": 105742, "epoch": 2517} {"train_loss": -6.495295524597168, "global_step": 105743, "epoch": 2517} {"train_loss": -6.530363082885742, "global_step": 105744, "epoch": 2517} {"train_loss": -6.425759315490723, "global_step": 105745, "epoch": 2517} {"train_loss": -6.3949995040893555, "global_step": 105746, "epoch": 2517} {"train_loss": -6.401793479919434, "global_step": 105747, "epoch": 2517} {"train_loss": -6.530622482299805, "global_step": 105748, "epoch": 2517} {"train_loss": -6.426482200622559, "global_step": 105749, "epoch": 2517} {"train_loss": -6.494383335113525, "global_step": 105750, "epoch": 2517} {"train_loss": -6.482903480529785, "global_step": 105751, "epoch": 2517} {"train_loss": -6.33204460144043, "global_step": 105752, "epoch": 2517} {"train_loss": -6.389029502868652, "global_step": 105753, "epoch": 2517} {"train_loss": -6.40755558013916, "global_step": 105754, "epoch": 2517} {"train_loss": -6.4488645281110495, "global_step": 105755, "epoch": 2517, "val_loss": 64716.91796875} {"train_loss": -6.453420639038086, "global_step": 105756, "epoch": 2518} {"train_loss": -6.411802768707275, "global_step": 105757, "epoch": 2518} {"train_loss": -6.3606977462768555, "global_step": 105758, "epoch": 2518} {"train_loss": -6.379461765289307, "global_step": 105759, "epoch": 2518} {"train_loss": -6.482998847961426, "global_step": 105760, "epoch": 2518} {"train_loss": -6.413760185241699, "global_step": 105761, "epoch": 2518} {"train_loss": -6.437877655029297, "global_step": 105762, "epoch": 2518} {"train_loss": -6.395574569702148, "global_step": 105763, "epoch": 2518} {"train_loss": -6.467598915100098, "global_step": 105764, "epoch": 2518} {"train_loss": -6.427110195159912, "global_step": 105765, "epoch": 2518} {"train_loss": -6.459156513214111, "global_step": 105766, "epoch": 2518} {"train_loss": -6.439599514007568, "global_step": 105767, "epoch": 2518} {"train_loss": -6.446382522583008, "global_step": 105768, "epoch": 2518} {"train_loss": -6.401466369628906, "global_step": 105769, "epoch": 2518} {"train_loss": -6.355502128601074, "global_step": 105770, "epoch": 2518} {"train_loss": -6.368715763092041, "global_step": 105771, "epoch": 2518} {"train_loss": -6.369616508483887, "global_step": 105772, "epoch": 2518} {"train_loss": -6.51873254776001, "global_step": 105773, "epoch": 2518} {"train_loss": -6.451696395874023, "global_step": 105774, "epoch": 2518} {"train_loss": -6.548205375671387, "global_step": 105775, "epoch": 2518} {"train_loss": -6.36505651473999, "global_step": 105776, "epoch": 2518} {"train_loss": -6.44480562210083, "global_step": 105777, "epoch": 2518} {"train_loss": -6.448538780212402, "global_step": 105778, "epoch": 2518} {"train_loss": -6.5330400466918945, "global_step": 105779, "epoch": 2518} {"train_loss": -6.491064071655273, "global_step": 105780, "epoch": 2518} {"train_loss": -6.521876335144043, "global_step": 105781, "epoch": 2518} {"train_loss": -6.329459190368652, "global_step": 105782, "epoch": 2518} {"train_loss": -6.517002105712891, "global_step": 105783, "epoch": 2518} {"train_loss": -6.4270524978637695, "global_step": 105784, "epoch": 2518} {"train_loss": -6.441848278045654, "global_step": 105785, "epoch": 2518} {"train_loss": -6.442323684692383, "global_step": 105786, "epoch": 2518} {"train_loss": -6.426881313323975, "global_step": 105787, "epoch": 2518} {"train_loss": -6.521475315093994, "global_step": 105788, "epoch": 2518} {"train_loss": -6.482536315917969, "global_step": 105789, "epoch": 2518} {"train_loss": -6.418439865112305, "global_step": 105790, "epoch": 2518} {"train_loss": -6.4599151611328125, "global_step": 105791, "epoch": 2518} {"train_loss": -6.5060038566589355, "global_step": 105792, "epoch": 2518} {"train_loss": -6.461770057678223, "global_step": 105793, "epoch": 2518} {"train_loss": -6.406435966491699, "global_step": 105794, "epoch": 2518} {"train_loss": -6.495755195617676, "global_step": 105795, "epoch": 2518} {"train_loss": -6.348637580871582, "global_step": 105796, "epoch": 2518} {"train_loss": -6.439609448115031, "global_step": 105797, "epoch": 2518, "val_loss": 64434.21875} {"train_loss": -6.488718032836914, "global_step": 105798, "epoch": 2519} {"train_loss": -6.430694103240967, "global_step": 105799, "epoch": 2519} {"train_loss": -6.376963138580322, "global_step": 105800, "epoch": 2519} {"train_loss": -6.313262939453125, "global_step": 105801, "epoch": 2519} {"train_loss": -6.381940841674805, "global_step": 105802, "epoch": 2519} {"train_loss": -6.304283142089844, "global_step": 105803, "epoch": 2519} {"train_loss": -6.302873134613037, "global_step": 105804, "epoch": 2519} {"train_loss": -6.406224250793457, "global_step": 105805, "epoch": 2519} {"train_loss": -6.400352478027344, "global_step": 105806, "epoch": 2519} {"train_loss": -6.367225646972656, "global_step": 105807, "epoch": 2519} {"train_loss": -6.473479747772217, "global_step": 105808, "epoch": 2519} {"train_loss": -6.346607685089111, "global_step": 105809, "epoch": 2519} {"train_loss": -6.350381851196289, "global_step": 105810, "epoch": 2519} {"train_loss": -6.3405442237854, "global_step": 105811, "epoch": 2519} {"train_loss": -6.3423614501953125, "global_step": 105812, "epoch": 2519} {"train_loss": -6.386075973510742, "global_step": 105813, "epoch": 2519} {"train_loss": -6.407581329345703, "global_step": 105814, "epoch": 2519} {"train_loss": -6.353384494781494, "global_step": 105815, "epoch": 2519} {"train_loss": -6.365488529205322, "global_step": 105816, "epoch": 2519} {"train_loss": -6.446141242980957, "global_step": 105817, "epoch": 2519} {"train_loss": -6.472002983093262, "global_step": 105818, "epoch": 2519} {"train_loss": -6.508297920227051, "global_step": 105819, "epoch": 2519} {"train_loss": -6.356681823730469, "global_step": 105820, "epoch": 2519} {"train_loss": -6.405187606811523, "global_step": 105821, "epoch": 2519} {"train_loss": -6.278017997741699, "global_step": 105822, "epoch": 2519} {"train_loss": -6.475539684295654, "global_step": 105823, "epoch": 2519} {"train_loss": -6.369541168212891, "global_step": 105824, "epoch": 2519} {"train_loss": -6.471700191497803, "global_step": 105825, "epoch": 2519} {"train_loss": -6.364826679229736, "global_step": 105826, "epoch": 2519} {"train_loss": -6.401244640350342, "global_step": 105827, "epoch": 2519} {"train_loss": -6.414028644561768, "global_step": 105828, "epoch": 2519} {"train_loss": -6.295807361602783, "global_step": 105829, "epoch": 2519} {"train_loss": -6.3460893630981445, "global_step": 105830, "epoch": 2519} {"train_loss": -6.396924018859863, "global_step": 105831, "epoch": 2519} {"train_loss": -6.427662372589111, "global_step": 105832, "epoch": 2519} {"train_loss": -6.364666938781738, "global_step": 105833, "epoch": 2519} {"train_loss": -6.379877090454102, "global_step": 105834, "epoch": 2519} {"train_loss": -6.438109874725342, "global_step": 105835, "epoch": 2519} {"train_loss": -6.174447059631348, "global_step": 105836, "epoch": 2519} {"train_loss": -6.372063159942627, "global_step": 105837, "epoch": 2519} {"train_loss": -6.408578395843506, "global_step": 105838, "epoch": 2519} {"train_loss": -6.37911581993103, "global_step": 105839, "epoch": 2519, "val_loss": 64711.65234375} {"train_loss": -6.360782623291016, "global_step": 105840, "epoch": 2520} {"train_loss": -6.309638977050781, "global_step": 105841, "epoch": 2520} {"train_loss": -6.4199042320251465, "global_step": 105842, "epoch": 2520} {"train_loss": -6.437046051025391, "global_step": 105843, "epoch": 2520} {"train_loss": -6.2078938484191895, "global_step": 105844, "epoch": 2520} {"train_loss": -6.437008857727051, "global_step": 105845, "epoch": 2520} {"train_loss": -6.297908782958984, "global_step": 105846, "epoch": 2520} {"train_loss": -6.416031837463379, "global_step": 105847, "epoch": 2520} {"train_loss": -6.335948944091797, "global_step": 105848, "epoch": 2520} {"train_loss": -6.311877250671387, "global_step": 105849, "epoch": 2520} {"train_loss": -6.285511016845703, "global_step": 105850, "epoch": 2520} {"train_loss": -6.399455547332764, "global_step": 105851, "epoch": 2520} {"train_loss": -6.458487033843994, "global_step": 105852, "epoch": 2520} {"train_loss": -6.388894081115723, "global_step": 105853, "epoch": 2520} {"train_loss": -6.524903297424316, "global_step": 105854, "epoch": 2520} {"train_loss": -6.3413987159729, "global_step": 105855, "epoch": 2520} {"train_loss": -6.399967670440674, "global_step": 105856, "epoch": 2520} {"train_loss": -6.481746673583984, "global_step": 105857, "epoch": 2520} {"train_loss": -6.545859336853027, "global_step": 105858, "epoch": 2520} {"train_loss": -6.490538120269775, "global_step": 105859, "epoch": 2520} {"train_loss": -6.427057266235352, "global_step": 105860, "epoch": 2520} {"train_loss": -6.457510948181152, "global_step": 105861, "epoch": 2520} {"train_loss": -6.449461460113525, "global_step": 105862, "epoch": 2520} {"train_loss": -6.367478847503662, "global_step": 105863, "epoch": 2520} {"train_loss": -6.38485050201416, "global_step": 105864, "epoch": 2520} {"train_loss": -6.469599723815918, "global_step": 105865, "epoch": 2520} {"train_loss": -6.40877628326416, "global_step": 105866, "epoch": 2520} {"train_loss": -6.407083511352539, "global_step": 105867, "epoch": 2520} {"train_loss": -6.398920059204102, "global_step": 105868, "epoch": 2520} {"train_loss": -6.369636535644531, "global_step": 105869, "epoch": 2520} {"train_loss": -6.3681640625, "global_step": 105870, "epoch": 2520} {"train_loss": -6.4126482009887695, "global_step": 105871, "epoch": 2520} {"train_loss": -6.4095048904418945, "global_step": 105872, "epoch": 2520} {"train_loss": -6.508941650390625, "global_step": 105873, "epoch": 2520} {"train_loss": -6.336615562438965, "global_step": 105874, "epoch": 2520} {"train_loss": -6.512700080871582, "global_step": 105875, "epoch": 2520} {"train_loss": -6.342566967010498, "global_step": 105876, "epoch": 2520} {"train_loss": -6.424250602722168, "global_step": 105877, "epoch": 2520} {"train_loss": -6.470076084136963, "global_step": 105878, "epoch": 2520} {"train_loss": -6.485350608825684, "global_step": 105879, "epoch": 2520} {"train_loss": -6.474042892456055, "global_step": 105880, "epoch": 2520} {"train_loss": -6.41072694460551, "global_step": 105881, "epoch": 2520, "val_loss": 64621.7890625} {"train_loss": -6.432818412780762, "global_step": 105882, "epoch": 2521} {"train_loss": -6.548619747161865, "global_step": 105883, "epoch": 2521} {"train_loss": -6.465919494628906, "global_step": 105884, "epoch": 2521} {"train_loss": -6.472806930541992, "global_step": 105885, "epoch": 2521} {"train_loss": -6.511962890625, "global_step": 105886, "epoch": 2521} {"train_loss": -6.486970901489258, "global_step": 105887, "epoch": 2521} {"train_loss": -6.470076560974121, "global_step": 105888, "epoch": 2521} {"train_loss": -6.509045124053955, "global_step": 105889, "epoch": 2521} {"train_loss": -6.514948844909668, "global_step": 105890, "epoch": 2521} {"train_loss": -6.446135997772217, "global_step": 105891, "epoch": 2521} {"train_loss": -6.417200088500977, "global_step": 105892, "epoch": 2521} {"train_loss": -6.435817718505859, "global_step": 105893, "epoch": 2521} {"train_loss": -6.416302680969238, "global_step": 105894, "epoch": 2521} {"train_loss": -6.406993865966797, "global_step": 105895, "epoch": 2521} {"train_loss": -6.208903789520264, "global_step": 105896, "epoch": 2521} {"train_loss": -6.379180908203125, "global_step": 105897, "epoch": 2521} {"train_loss": -6.4163737297058105, "global_step": 105898, "epoch": 2521} {"train_loss": -6.400564193725586, "global_step": 105899, "epoch": 2521} {"train_loss": -6.486210823059082, "global_step": 105900, "epoch": 2521} {"train_loss": -6.33418083190918, "global_step": 105901, "epoch": 2521} {"train_loss": -6.21042537689209, "global_step": 105902, "epoch": 2521} {"train_loss": -6.488397598266602, "global_step": 105903, "epoch": 2521} {"train_loss": -6.328960418701172, "global_step": 105904, "epoch": 2521} {"train_loss": -6.312173843383789, "global_step": 105905, "epoch": 2521} {"train_loss": -6.4538469314575195, "global_step": 105906, "epoch": 2521} {"train_loss": -6.339962959289551, "global_step": 105907, "epoch": 2521} {"train_loss": -6.464023113250732, "global_step": 105908, "epoch": 2521} {"train_loss": -6.423083305358887, "global_step": 105909, "epoch": 2521} {"train_loss": -6.486104488372803, "global_step": 105910, "epoch": 2521} {"train_loss": -6.4671101570129395, "global_step": 105911, "epoch": 2521} {"train_loss": -6.477080345153809, "global_step": 105912, "epoch": 2521} {"train_loss": -6.518476486206055, "global_step": 105913, "epoch": 2521} {"train_loss": -6.325819969177246, "global_step": 105914, "epoch": 2521} {"train_loss": -6.367000102996826, "global_step": 105915, "epoch": 2521} {"train_loss": -6.391302108764648, "global_step": 105916, "epoch": 2521} {"train_loss": -6.325167179107666, "global_step": 105917, "epoch": 2521} {"train_loss": -6.316831111907959, "global_step": 105918, "epoch": 2521} {"train_loss": -6.453238010406494, "global_step": 105919, "epoch": 2521} {"train_loss": -6.393464088439941, "global_step": 105920, "epoch": 2521} {"train_loss": -6.40810489654541, "global_step": 105921, "epoch": 2521} {"train_loss": -6.34444522857666, "global_step": 105922, "epoch": 2521} {"train_loss": -6.416771616254534, "global_step": 105923, "epoch": 2521, "val_loss": 64835.22265625} {"train_loss": -6.332088470458984, "global_step": 105924, "epoch": 2522} {"train_loss": -6.322036266326904, "global_step": 105925, "epoch": 2522} {"train_loss": -6.55964469909668, "global_step": 105926, "epoch": 2522} {"train_loss": -6.386371612548828, "global_step": 105927, "epoch": 2522} {"train_loss": -6.503539085388184, "global_step": 105928, "epoch": 2522} {"train_loss": -6.427772045135498, "global_step": 105929, "epoch": 2522} {"train_loss": -6.3579182624816895, "global_step": 105930, "epoch": 2522} {"train_loss": -6.503316402435303, "global_step": 105931, "epoch": 2522} {"train_loss": -6.324174880981445, "global_step": 105932, "epoch": 2522} {"train_loss": -6.374058723449707, "global_step": 105933, "epoch": 2522} {"train_loss": -6.361019134521484, "global_step": 105934, "epoch": 2522} {"train_loss": -6.395702838897705, "global_step": 105935, "epoch": 2522} {"train_loss": -6.387529373168945, "global_step": 105936, "epoch": 2522} {"train_loss": -6.42042350769043, "global_step": 105937, "epoch": 2522} {"train_loss": -6.388556480407715, "global_step": 105938, "epoch": 2522} {"train_loss": -6.299617767333984, "global_step": 105939, "epoch": 2522} {"train_loss": -6.439998626708984, "global_step": 105940, "epoch": 2522} {"train_loss": -6.293875694274902, "global_step": 105941, "epoch": 2522} {"train_loss": -6.2327351570129395, "global_step": 105942, "epoch": 2522} {"train_loss": -6.314151287078857, "global_step": 105943, "epoch": 2522} {"train_loss": -6.280295372009277, "global_step": 105944, "epoch": 2522} {"train_loss": -6.435544013977051, "global_step": 105945, "epoch": 2522} {"train_loss": -6.411425590515137, "global_step": 105946, "epoch": 2522} {"train_loss": -6.291539192199707, "global_step": 105947, "epoch": 2522} {"train_loss": -6.273967742919922, "global_step": 105948, "epoch": 2522} {"train_loss": -6.25017786026001, "global_step": 105949, "epoch": 2522} {"train_loss": -6.395658493041992, "global_step": 105950, "epoch": 2522} {"train_loss": -6.310643196105957, "global_step": 105951, "epoch": 2522} {"train_loss": -6.427888870239258, "global_step": 105952, "epoch": 2522} {"train_loss": -6.392051696777344, "global_step": 105953, "epoch": 2522} {"train_loss": -6.429584980010986, "global_step": 105954, "epoch": 2522} {"train_loss": -6.353081226348877, "global_step": 105955, "epoch": 2522} {"train_loss": -6.358914852142334, "global_step": 105956, "epoch": 2522} {"train_loss": -6.306169509887695, "global_step": 105957, "epoch": 2522} {"train_loss": -6.405238151550293, "global_step": 105958, "epoch": 2522} {"train_loss": -6.523359775543213, "global_step": 105959, "epoch": 2522} {"train_loss": -6.483160018920898, "global_step": 105960, "epoch": 2522} {"train_loss": -6.375891208648682, "global_step": 105961, "epoch": 2522} {"train_loss": -6.366866588592529, "global_step": 105962, "epoch": 2522} {"train_loss": -6.438612937927246, "global_step": 105963, "epoch": 2522} {"train_loss": -6.442038536071777, "global_step": 105964, "epoch": 2522} {"train_loss": -6.3808064460754395, "global_step": 105965, "epoch": 2522, "val_loss": 64433.76953125} {"train_loss": -6.511009216308594, "global_step": 105966, "epoch": 2523} {"train_loss": -6.472522735595703, "global_step": 105967, "epoch": 2523} {"train_loss": -6.408886432647705, "global_step": 105968, "epoch": 2523} {"train_loss": -6.458641052246094, "global_step": 105969, "epoch": 2523} {"train_loss": -6.564157485961914, "global_step": 105970, "epoch": 2523} {"train_loss": -6.370525360107422, "global_step": 105971, "epoch": 2523} {"train_loss": -6.423330783843994, "global_step": 105972, "epoch": 2523} {"train_loss": -6.460234642028809, "global_step": 105973, "epoch": 2523} {"train_loss": -6.53646183013916, "global_step": 105974, "epoch": 2523} {"train_loss": -6.554281234741211, "global_step": 105975, "epoch": 2523} {"train_loss": -6.528994560241699, "global_step": 105976, "epoch": 2523} {"train_loss": -6.485512733459473, "global_step": 105977, "epoch": 2523} {"train_loss": -6.365808486938477, "global_step": 105978, "epoch": 2523} {"train_loss": -6.433795928955078, "global_step": 105979, "epoch": 2523} {"train_loss": -6.440697193145752, "global_step": 105980, "epoch": 2523} {"train_loss": -6.605101108551025, "global_step": 105981, "epoch": 2523} {"train_loss": -6.4217915534973145, "global_step": 105982, "epoch": 2523} {"train_loss": -6.447397708892822, "global_step": 105983, "epoch": 2523} {"train_loss": -6.52665901184082, "global_step": 105984, "epoch": 2523} {"train_loss": -6.524764060974121, "global_step": 105985, "epoch": 2523} {"train_loss": -6.459565162658691, "global_step": 105986, "epoch": 2523} {"train_loss": -6.372298717498779, "global_step": 105987, "epoch": 2523} {"train_loss": -6.320614337921143, "global_step": 105988, "epoch": 2523} {"train_loss": -6.443169593811035, "global_step": 105989, "epoch": 2523} {"train_loss": -6.5402326583862305, "global_step": 105990, "epoch": 2523} {"train_loss": -6.46647834777832, "global_step": 105991, "epoch": 2523} {"train_loss": -6.3089470863342285, "global_step": 105992, "epoch": 2523} {"train_loss": -6.446922302246094, "global_step": 105993, "epoch": 2523} {"train_loss": -6.4735565185546875, "global_step": 105994, "epoch": 2523} {"train_loss": -6.420185089111328, "global_step": 105995, "epoch": 2523} {"train_loss": -6.404297351837158, "global_step": 105996, "epoch": 2523} {"train_loss": -6.431647777557373, "global_step": 105997, "epoch": 2523} {"train_loss": -6.55189323425293, "global_step": 105998, "epoch": 2523} {"train_loss": -6.366621971130371, "global_step": 105999, "epoch": 2523} {"train_loss": -6.4486083984375, "global_step": 106000, "epoch": 2523} {"train_loss": -6.355921268463135, "global_step": 106001, "epoch": 2523} {"train_loss": -6.473295211791992, "global_step": 106002, "epoch": 2523} {"train_loss": -6.346268653869629, "global_step": 106003, "epoch": 2523} {"train_loss": -6.321798801422119, "global_step": 106004, "epoch": 2523} {"train_loss": -6.422598838806152, "global_step": 106005, "epoch": 2523} {"train_loss": -6.466390609741211, "global_step": 106006, "epoch": 2523} {"train_loss": -6.443501006989252, "global_step": 106007, "epoch": 2523, "val_loss": 64790.45703125} {"train_loss": -6.35596227645874, "global_step": 106008, "epoch": 2524} {"train_loss": -6.408789157867432, "global_step": 106009, "epoch": 2524} {"train_loss": -6.419437885284424, "global_step": 106010, "epoch": 2524} {"train_loss": -6.277527809143066, "global_step": 106011, "epoch": 2524} {"train_loss": -6.419989109039307, "global_step": 106012, "epoch": 2524} {"train_loss": -6.390740394592285, "global_step": 106013, "epoch": 2524} {"train_loss": -6.289651870727539, "global_step": 106014, "epoch": 2524} {"train_loss": -6.4870405197143555, "global_step": 106015, "epoch": 2524} {"train_loss": -6.357276916503906, "global_step": 106016, "epoch": 2524} {"train_loss": -6.431203365325928, "global_step": 106017, "epoch": 2524} {"train_loss": -6.529661178588867, "global_step": 106018, "epoch": 2524} {"train_loss": -6.422908306121826, "global_step": 106019, "epoch": 2524} {"train_loss": -6.462594032287598, "global_step": 106020, "epoch": 2524} {"train_loss": -6.374585151672363, "global_step": 106021, "epoch": 2524} {"train_loss": -6.4219512939453125, "global_step": 106022, "epoch": 2524} {"train_loss": -6.358665466308594, "global_step": 106023, "epoch": 2524} {"train_loss": -6.3743438720703125, "global_step": 106024, "epoch": 2524} {"train_loss": -6.398021221160889, "global_step": 106025, "epoch": 2524} {"train_loss": -6.390966415405273, "global_step": 106026, "epoch": 2524} {"train_loss": -6.337141990661621, "global_step": 106027, "epoch": 2524} {"train_loss": -6.43547248840332, "global_step": 106028, "epoch": 2524} {"train_loss": -6.401673316955566, "global_step": 106029, "epoch": 2524} {"train_loss": -6.37680721282959, "global_step": 106030, "epoch": 2524} {"train_loss": -6.356558322906494, "global_step": 106031, "epoch": 2524} {"train_loss": -6.440116882324219, "global_step": 106032, "epoch": 2524} {"train_loss": -6.336483001708984, "global_step": 106033, "epoch": 2524} {"train_loss": -6.308599472045898, "global_step": 106034, "epoch": 2524} {"train_loss": -6.310338973999023, "global_step": 106035, "epoch": 2524} {"train_loss": -6.245197296142578, "global_step": 106036, "epoch": 2524} {"train_loss": -6.425358772277832, "global_step": 106037, "epoch": 2524} {"train_loss": -6.258500099182129, "global_step": 106038, "epoch": 2524} {"train_loss": -6.418344020843506, "global_step": 106039, "epoch": 2524} {"train_loss": -6.42024040222168, "global_step": 106040, "epoch": 2524} {"train_loss": -6.444929122924805, "global_step": 106041, "epoch": 2524} {"train_loss": -6.428711414337158, "global_step": 106042, "epoch": 2524} {"train_loss": -6.221437454223633, "global_step": 106043, "epoch": 2524} {"train_loss": -6.444822311401367, "global_step": 106044, "epoch": 2524} {"train_loss": -6.375922679901123, "global_step": 106045, "epoch": 2524} {"train_loss": -6.305138111114502, "global_step": 106046, "epoch": 2524} {"train_loss": -6.488993167877197, "global_step": 106047, "epoch": 2524} {"train_loss": -6.42487096786499, "global_step": 106048, "epoch": 2524} {"train_loss": -6.386997291019985, "global_step": 106049, "epoch": 2524, "val_loss": 64561.11328125} {"train_loss": -6.368147850036621, "global_step": 106050, "epoch": 2525} {"train_loss": -6.452915668487549, "global_step": 106051, "epoch": 2525} {"train_loss": -6.564962387084961, "global_step": 106052, "epoch": 2525} {"train_loss": -6.431941986083984, "global_step": 106053, "epoch": 2525} {"train_loss": -6.413536548614502, "global_step": 106054, "epoch": 2525} {"train_loss": -6.3198442459106445, "global_step": 106055, "epoch": 2525} {"train_loss": -6.402011871337891, "global_step": 106056, "epoch": 2525} {"train_loss": -6.452122211456299, "global_step": 106057, "epoch": 2525} {"train_loss": -6.480367183685303, "global_step": 106058, "epoch": 2525} {"train_loss": -6.447514533996582, "global_step": 106059, "epoch": 2525} {"train_loss": -6.36110258102417, "global_step": 106060, "epoch": 2525} {"train_loss": -6.450098514556885, "global_step": 106061, "epoch": 2525} {"train_loss": -6.425922870635986, "global_step": 106062, "epoch": 2525} {"train_loss": -6.396655559539795, "global_step": 106063, "epoch": 2525} {"train_loss": -6.529373645782471, "global_step": 106064, "epoch": 2525} {"train_loss": -6.404334545135498, "global_step": 106065, "epoch": 2525} {"train_loss": -6.515213966369629, "global_step": 106066, "epoch": 2525} {"train_loss": -6.319999694824219, "global_step": 106067, "epoch": 2525} {"train_loss": -6.452183723449707, "global_step": 106068, "epoch": 2525} {"train_loss": -6.398780345916748, "global_step": 106069, "epoch": 2525} {"train_loss": -6.443038463592529, "global_step": 106070, "epoch": 2525} {"train_loss": -6.349155426025391, "global_step": 106071, "epoch": 2525} {"train_loss": -6.300509452819824, "global_step": 106072, "epoch": 2525} {"train_loss": -6.483773231506348, "global_step": 106073, "epoch": 2525} {"train_loss": -6.46385383605957, "global_step": 106074, "epoch": 2525} {"train_loss": -6.401547431945801, "global_step": 106075, "epoch": 2525} {"train_loss": -6.321428298950195, "global_step": 106076, "epoch": 2525} {"train_loss": -6.424817085266113, "global_step": 106077, "epoch": 2525} {"train_loss": -6.400461196899414, "global_step": 106078, "epoch": 2525} {"train_loss": -6.511539459228516, "global_step": 106079, "epoch": 2525} {"train_loss": -6.435377597808838, "global_step": 106080, "epoch": 2525} {"train_loss": -6.362237930297852, "global_step": 106081, "epoch": 2525} {"train_loss": -6.389111042022705, "global_step": 106082, "epoch": 2525} {"train_loss": -6.393206596374512, "global_step": 106083, "epoch": 2525} {"train_loss": -6.425821781158447, "global_step": 106084, "epoch": 2525} {"train_loss": -6.428703308105469, "global_step": 106085, "epoch": 2525} {"train_loss": -6.2480669021606445, "global_step": 106086, "epoch": 2525} {"train_loss": -6.345853805541992, "global_step": 106087, "epoch": 2525} {"train_loss": -6.374286651611328, "global_step": 106088, "epoch": 2525} {"train_loss": -6.332752227783203, "global_step": 106089, "epoch": 2525} {"train_loss": -6.326284408569336, "global_step": 106090, "epoch": 2525} {"train_loss": -6.405998354866391, "global_step": 106091, "epoch": 2525, "val_loss": 64480.60546875} {"train_loss": -6.425427436828613, "global_step": 106092, "epoch": 2526} {"train_loss": -6.256987571716309, "global_step": 106093, "epoch": 2526} {"train_loss": -6.424751281738281, "global_step": 106094, "epoch": 2526} {"train_loss": -6.337007522583008, "global_step": 106095, "epoch": 2526} {"train_loss": -6.298367500305176, "global_step": 106096, "epoch": 2526} {"train_loss": -6.310395240783691, "global_step": 106097, "epoch": 2526} {"train_loss": -6.306453704833984, "global_step": 106098, "epoch": 2526} {"train_loss": -6.337723731994629, "global_step": 106099, "epoch": 2526} {"train_loss": -6.3929314613342285, "global_step": 106100, "epoch": 2526} {"train_loss": -6.3997907638549805, "global_step": 106101, "epoch": 2526} {"train_loss": -6.336713790893555, "global_step": 106102, "epoch": 2526} {"train_loss": -6.232424736022949, "global_step": 106103, "epoch": 2526} {"train_loss": -6.270014762878418, "global_step": 106104, "epoch": 2526} {"train_loss": -6.415765762329102, "global_step": 106105, "epoch": 2526} {"train_loss": -6.363369464874268, "global_step": 106106, "epoch": 2526} {"train_loss": -6.428471088409424, "global_step": 106107, "epoch": 2526} {"train_loss": -6.414571762084961, "global_step": 106108, "epoch": 2526} {"train_loss": -6.476980209350586, "global_step": 106109, "epoch": 2526} {"train_loss": -6.540037631988525, "global_step": 106110, "epoch": 2526} {"train_loss": -6.432608604431152, "global_step": 106111, "epoch": 2526} {"train_loss": -6.480852127075195, "global_step": 106112, "epoch": 2526} {"train_loss": -6.390565872192383, "global_step": 106113, "epoch": 2526} {"train_loss": -6.319990634918213, "global_step": 106114, "epoch": 2526} {"train_loss": -6.279059410095215, "global_step": 106115, "epoch": 2526} {"train_loss": -6.463257312774658, "global_step": 106116, "epoch": 2526} {"train_loss": -6.434415817260742, "global_step": 106117, "epoch": 2526} {"train_loss": -6.474292755126953, "global_step": 106118, "epoch": 2526} {"train_loss": -6.48250675201416, "global_step": 106119, "epoch": 2526} {"train_loss": -6.4740190505981445, "global_step": 106120, "epoch": 2526} {"train_loss": -6.431103229522705, "global_step": 106121, "epoch": 2526} {"train_loss": -6.390044212341309, "global_step": 106122, "epoch": 2526} {"train_loss": -6.5400238037109375, "global_step": 106123, "epoch": 2526} {"train_loss": -6.389721870422363, "global_step": 106124, "epoch": 2526} {"train_loss": -6.500093460083008, "global_step": 106125, "epoch": 2526} {"train_loss": -6.5201416015625, "global_step": 106126, "epoch": 2526} {"train_loss": -6.4912614822387695, "global_step": 106127, "epoch": 2526} {"train_loss": -6.4491753578186035, "global_step": 106128, "epoch": 2526} {"train_loss": -6.443526268005371, "global_step": 106129, "epoch": 2526} {"train_loss": -6.493614196777344, "global_step": 106130, "epoch": 2526} {"train_loss": -6.519926071166992, "global_step": 106131, "epoch": 2526} {"train_loss": -6.487975597381592, "global_step": 106132, "epoch": 2526} {"train_loss": -6.412954023906162, "global_step": 106133, "epoch": 2526, "val_loss": 64709.26953125} {"train_loss": -6.464936256408691, "global_step": 106134, "epoch": 2527} {"train_loss": -6.477262496948242, "global_step": 106135, "epoch": 2527} {"train_loss": -6.360199928283691, "global_step": 106136, "epoch": 2527} {"train_loss": -6.346724510192871, "global_step": 106137, "epoch": 2527} {"train_loss": -6.4547905921936035, "global_step": 106138, "epoch": 2527} {"train_loss": -6.434462547302246, "global_step": 106139, "epoch": 2527} {"train_loss": -6.446104526519775, "global_step": 106140, "epoch": 2527} {"train_loss": -6.583871841430664, "global_step": 106141, "epoch": 2527} {"train_loss": -6.400986671447754, "global_step": 106142, "epoch": 2527} {"train_loss": -6.361528396606445, "global_step": 106143, "epoch": 2527} {"train_loss": -6.467599868774414, "global_step": 106144, "epoch": 2527} {"train_loss": -6.448122024536133, "global_step": 106145, "epoch": 2527} {"train_loss": -6.424976348876953, "global_step": 106146, "epoch": 2527} {"train_loss": -6.530519485473633, "global_step": 106147, "epoch": 2527} {"train_loss": -6.3438401222229, "global_step": 106148, "epoch": 2527} {"train_loss": -6.395642280578613, "global_step": 106149, "epoch": 2527} {"train_loss": -6.402823448181152, "global_step": 106150, "epoch": 2527} {"train_loss": -6.482378959655762, "global_step": 106151, "epoch": 2527} {"train_loss": -6.426852226257324, "global_step": 106152, "epoch": 2527} {"train_loss": -6.541053771972656, "global_step": 106153, "epoch": 2527} {"train_loss": -6.387312412261963, "global_step": 106154, "epoch": 2527} {"train_loss": -6.329687595367432, "global_step": 106155, "epoch": 2527} {"train_loss": -6.352875709533691, "global_step": 106156, "epoch": 2527} {"train_loss": -6.3134002685546875, "global_step": 106157, "epoch": 2527} {"train_loss": -6.331925392150879, "global_step": 106158, "epoch": 2527} {"train_loss": -6.332981109619141, "global_step": 106159, "epoch": 2527} {"train_loss": -6.456455230712891, "global_step": 106160, "epoch": 2527} {"train_loss": -6.291346549987793, "global_step": 106161, "epoch": 2527} {"train_loss": -6.500425815582275, "global_step": 106162, "epoch": 2527} {"train_loss": -6.338502883911133, "global_step": 106163, "epoch": 2527} {"train_loss": -6.414467811584473, "global_step": 106164, "epoch": 2527} {"train_loss": -6.490017890930176, "global_step": 106165, "epoch": 2527} {"train_loss": -6.402681350708008, "global_step": 106166, "epoch": 2527} {"train_loss": -6.462255954742432, "global_step": 106167, "epoch": 2527} {"train_loss": -6.538605690002441, "global_step": 106168, "epoch": 2527} {"train_loss": -6.389287948608398, "global_step": 106169, "epoch": 2527} {"train_loss": -6.376916885375977, "global_step": 106170, "epoch": 2527} {"train_loss": -6.549073696136475, "global_step": 106171, "epoch": 2527} {"train_loss": -6.442646026611328, "global_step": 106172, "epoch": 2527} {"train_loss": -6.473780632019043, "global_step": 106173, "epoch": 2527} {"train_loss": -6.3534722328186035, "global_step": 106174, "epoch": 2527} {"train_loss": -6.421073243731544, "global_step": 106175, "epoch": 2527, "val_loss": 64623.62109375} {"train_loss": -6.506281852722168, "global_step": 106176, "epoch": 2528} {"train_loss": -6.408648490905762, "global_step": 106177, "epoch": 2528} {"train_loss": -6.452084541320801, "global_step": 106178, "epoch": 2528} {"train_loss": -6.322420120239258, "global_step": 106179, "epoch": 2528} {"train_loss": -6.510715961456299, "global_step": 106180, "epoch": 2528} {"train_loss": -6.514253616333008, "global_step": 106181, "epoch": 2528} {"train_loss": -6.465610980987549, "global_step": 106182, "epoch": 2528} {"train_loss": -6.513665676116943, "global_step": 106183, "epoch": 2528} {"train_loss": -6.41605806350708, "global_step": 106184, "epoch": 2528} {"train_loss": -6.440417289733887, "global_step": 106185, "epoch": 2528} {"train_loss": -6.550136566162109, "global_step": 106186, "epoch": 2528} {"train_loss": -6.37338399887085, "global_step": 106187, "epoch": 2528} {"train_loss": -6.437032699584961, "global_step": 106188, "epoch": 2528} {"train_loss": -6.3639302253723145, "global_step": 106189, "epoch": 2528} {"train_loss": -6.331879615783691, "global_step": 106190, "epoch": 2528} {"train_loss": -6.494378089904785, "global_step": 106191, "epoch": 2528} {"train_loss": -6.398337364196777, "global_step": 106192, "epoch": 2528} {"train_loss": -6.509154319763184, "global_step": 106193, "epoch": 2528} {"train_loss": -6.378814697265625, "global_step": 106194, "epoch": 2528} {"train_loss": -6.48372220993042, "global_step": 106195, "epoch": 2528} {"train_loss": -6.41717529296875, "global_step": 106196, "epoch": 2528} {"train_loss": -6.401909828186035, "global_step": 106197, "epoch": 2528} {"train_loss": -6.41648006439209, "global_step": 106198, "epoch": 2528} {"train_loss": -6.493136405944824, "global_step": 106199, "epoch": 2528} {"train_loss": -6.375380516052246, "global_step": 106200, "epoch": 2528} {"train_loss": -6.394100189208984, "global_step": 106201, "epoch": 2528} {"train_loss": -6.517523765563965, "global_step": 106202, "epoch": 2528} {"train_loss": -6.473284721374512, "global_step": 106203, "epoch": 2528} {"train_loss": -6.452031135559082, "global_step": 106204, "epoch": 2528} {"train_loss": -6.459442138671875, "global_step": 106205, "epoch": 2528} {"train_loss": -6.383922576904297, "global_step": 106206, "epoch": 2528} {"train_loss": -6.285039901733398, "global_step": 106207, "epoch": 2528} {"train_loss": -6.465524196624756, "global_step": 106208, "epoch": 2528} {"train_loss": -6.5552778244018555, "global_step": 106209, "epoch": 2528} {"train_loss": -6.4309468269348145, "global_step": 106210, "epoch": 2528} {"train_loss": -6.509589195251465, "global_step": 106211, "epoch": 2528} {"train_loss": -6.447554111480713, "global_step": 106212, "epoch": 2528} {"train_loss": -6.475407600402832, "global_step": 106213, "epoch": 2528} {"train_loss": -6.447046756744385, "global_step": 106214, "epoch": 2528} {"train_loss": -6.437831878662109, "global_step": 106215, "epoch": 2528} {"train_loss": -6.423685550689697, "global_step": 106216, "epoch": 2528} {"train_loss": -6.4417156264895485, "global_step": 106217, "epoch": 2528, "val_loss": 64626.65234375} {"train_loss": -6.483642578125, "global_step": 106218, "epoch": 2529} {"train_loss": -6.415679454803467, "global_step": 106219, "epoch": 2529} {"train_loss": -6.389291763305664, "global_step": 106220, "epoch": 2529} {"train_loss": -6.417261600494385, "global_step": 106221, "epoch": 2529} {"train_loss": -6.401362419128418, "global_step": 106222, "epoch": 2529} {"train_loss": -6.449298858642578, "global_step": 106223, "epoch": 2529} {"train_loss": -6.43082857131958, "global_step": 106224, "epoch": 2529} {"train_loss": -6.376222610473633, "global_step": 106225, "epoch": 2529} {"train_loss": -6.459489345550537, "global_step": 106226, "epoch": 2529} {"train_loss": -6.406818389892578, "global_step": 106227, "epoch": 2529} {"train_loss": -6.242086410522461, "global_step": 106228, "epoch": 2529} {"train_loss": -6.3477678298950195, "global_step": 106229, "epoch": 2529} {"train_loss": -6.455521583557129, "global_step": 106230, "epoch": 2529} {"train_loss": -6.319558143615723, "global_step": 106231, "epoch": 2529} {"train_loss": -6.407341957092285, "global_step": 106232, "epoch": 2529} {"train_loss": -6.3848114013671875, "global_step": 106233, "epoch": 2529} {"train_loss": -6.208797931671143, "global_step": 106234, "epoch": 2529} {"train_loss": -6.501958847045898, "global_step": 106235, "epoch": 2529} {"train_loss": -6.296792030334473, "global_step": 106236, "epoch": 2529} {"train_loss": -6.350545406341553, "global_step": 106237, "epoch": 2529} {"train_loss": -6.439917087554932, "global_step": 106238, "epoch": 2529} {"train_loss": -6.182614326477051, "global_step": 106239, "epoch": 2529} {"train_loss": -6.353900909423828, "global_step": 106240, "epoch": 2529} {"train_loss": -6.251651763916016, "global_step": 106241, "epoch": 2529} {"train_loss": -6.4177045822143555, "global_step": 106242, "epoch": 2529} {"train_loss": -6.327146530151367, "global_step": 106243, "epoch": 2529} {"train_loss": -6.250729084014893, "global_step": 106244, "epoch": 2529} {"train_loss": -6.256118297576904, "global_step": 106245, "epoch": 2529} {"train_loss": -6.377159118652344, "global_step": 106246, "epoch": 2529} {"train_loss": -6.3559675216674805, "global_step": 106247, "epoch": 2529} {"train_loss": -6.440685272216797, "global_step": 106248, "epoch": 2529} {"train_loss": -6.472938537597656, "global_step": 106249, "epoch": 2529} {"train_loss": -6.418708801269531, "global_step": 106250, "epoch": 2529} {"train_loss": -6.547581672668457, "global_step": 106251, "epoch": 2529} {"train_loss": -6.434447765350342, "global_step": 106252, "epoch": 2529} {"train_loss": -6.427731990814209, "global_step": 106253, "epoch": 2529} {"train_loss": -6.380674362182617, "global_step": 106254, "epoch": 2529} {"train_loss": -6.357307434082031, "global_step": 106255, "epoch": 2529} {"train_loss": -6.3802385330200195, "global_step": 106256, "epoch": 2529} {"train_loss": -6.361418724060059, "global_step": 106257, "epoch": 2529} {"train_loss": -6.4542555809021, "global_step": 106258, "epoch": 2529} {"train_loss": -6.381140084493728, "global_step": 106259, "epoch": 2529, "val_loss": 64514.390625} {"train_loss": -6.430291175842285, "global_step": 106260, "epoch": 2530} {"train_loss": -6.438294410705566, "global_step": 106261, "epoch": 2530} {"train_loss": -6.465099334716797, "global_step": 106262, "epoch": 2530} {"train_loss": -6.447393894195557, "global_step": 106263, "epoch": 2530} {"train_loss": -6.412036418914795, "global_step": 106264, "epoch": 2530} {"train_loss": -6.458462238311768, "global_step": 106265, "epoch": 2530} {"train_loss": -6.434950828552246, "global_step": 106266, "epoch": 2530} {"train_loss": -6.431765556335449, "global_step": 106267, "epoch": 2530} {"train_loss": -6.357571125030518, "global_step": 106268, "epoch": 2530} {"train_loss": -6.379931449890137, "global_step": 106269, "epoch": 2530} {"train_loss": -6.5653181076049805, "global_step": 106270, "epoch": 2530} {"train_loss": -6.400168418884277, "global_step": 106271, "epoch": 2530} {"train_loss": -6.458514213562012, "global_step": 106272, "epoch": 2530} {"train_loss": -6.4325761795043945, "global_step": 106273, "epoch": 2530} {"train_loss": -6.475649833679199, "global_step": 106274, "epoch": 2530} {"train_loss": -6.525490760803223, "global_step": 106275, "epoch": 2530} {"train_loss": -6.47551965713501, "global_step": 106276, "epoch": 2530} {"train_loss": -6.441850662231445, "global_step": 106277, "epoch": 2530} {"train_loss": -6.576138496398926, "global_step": 106278, "epoch": 2530} {"train_loss": -6.3972063064575195, "global_step": 106279, "epoch": 2530} {"train_loss": -6.5444488525390625, "global_step": 106280, "epoch": 2530} {"train_loss": -6.426387786865234, "global_step": 106281, "epoch": 2530} {"train_loss": -6.4184112548828125, "global_step": 106282, "epoch": 2530} {"train_loss": -6.399506568908691, "global_step": 106283, "epoch": 2530} {"train_loss": -6.329260349273682, "global_step": 106284, "epoch": 2530} {"train_loss": -6.479625225067139, "global_step": 106285, "epoch": 2530} {"train_loss": -6.3600969314575195, "global_step": 106286, "epoch": 2530} {"train_loss": -6.445662498474121, "global_step": 106287, "epoch": 2530} {"train_loss": -6.3308515548706055, "global_step": 106288, "epoch": 2530} {"train_loss": -6.352701663970947, "global_step": 106289, "epoch": 2530} {"train_loss": -6.389440059661865, "global_step": 106290, "epoch": 2530} {"train_loss": -6.5052809715271, "global_step": 106291, "epoch": 2530} {"train_loss": -6.469707489013672, "global_step": 106292, "epoch": 2530} {"train_loss": -6.42059326171875, "global_step": 106293, "epoch": 2530} {"train_loss": -6.42191743850708, "global_step": 106294, "epoch": 2530} {"train_loss": -6.450554370880127, "global_step": 106295, "epoch": 2530} {"train_loss": -6.429345607757568, "global_step": 106296, "epoch": 2530} {"train_loss": -6.434441566467285, "global_step": 106297, "epoch": 2530} {"train_loss": -6.533946990966797, "global_step": 106298, "epoch": 2530} {"train_loss": -6.389639377593994, "global_step": 106299, "epoch": 2530} {"train_loss": -6.482419013977051, "global_step": 106300, "epoch": 2530} {"train_loss": -6.441714593342373, "global_step": 106301, "epoch": 2530, "val_loss": 64797.57421875} {"train_loss": -6.4592204093933105, "global_step": 106302, "epoch": 2531} {"train_loss": -6.485865592956543, "global_step": 106303, "epoch": 2531} {"train_loss": -6.40573787689209, "global_step": 106304, "epoch": 2531} {"train_loss": -6.382746696472168, "global_step": 106305, "epoch": 2531} {"train_loss": -6.459540843963623, "global_step": 106306, "epoch": 2531} {"train_loss": -6.41082763671875, "global_step": 106307, "epoch": 2531} {"train_loss": -6.3847174644470215, "global_step": 106308, "epoch": 2531} {"train_loss": -6.377121925354004, "global_step": 106309, "epoch": 2531} {"train_loss": -6.448746681213379, "global_step": 106310, "epoch": 2531} {"train_loss": -6.38842248916626, "global_step": 106311, "epoch": 2531} {"train_loss": -6.334501266479492, "global_step": 106312, "epoch": 2531} {"train_loss": -6.378507614135742, "global_step": 106313, "epoch": 2531} {"train_loss": -6.413730621337891, "global_step": 106314, "epoch": 2531} {"train_loss": -6.375613212585449, "global_step": 106315, "epoch": 2531} {"train_loss": -6.597146987915039, "global_step": 106316, "epoch": 2531} {"train_loss": -6.499268531799316, "global_step": 106317, "epoch": 2531} {"train_loss": -6.495001792907715, "global_step": 106318, "epoch": 2531} {"train_loss": -6.585148334503174, "global_step": 106319, "epoch": 2531} {"train_loss": -6.486875057220459, "global_step": 106320, "epoch": 2531} {"train_loss": -6.3613386154174805, "global_step": 106321, "epoch": 2531} {"train_loss": -6.489272117614746, "global_step": 106322, "epoch": 2531} {"train_loss": -6.429368019104004, "global_step": 106323, "epoch": 2531} {"train_loss": -6.33594274520874, "global_step": 106324, "epoch": 2531} {"train_loss": -6.50782585144043, "global_step": 106325, "epoch": 2531} {"train_loss": -6.520206451416016, "global_step": 106326, "epoch": 2531} {"train_loss": -6.360384941101074, "global_step": 106327, "epoch": 2531} {"train_loss": -6.401012420654297, "global_step": 106328, "epoch": 2531} {"train_loss": -6.428548812866211, "global_step": 106329, "epoch": 2531} {"train_loss": -6.360340595245361, "global_step": 106330, "epoch": 2531} {"train_loss": -6.456715106964111, "global_step": 106331, "epoch": 2531} {"train_loss": -6.317267894744873, "global_step": 106332, "epoch": 2531} {"train_loss": -6.396912574768066, "global_step": 106333, "epoch": 2531} {"train_loss": -6.426242828369141, "global_step": 106334, "epoch": 2531} {"train_loss": -6.345222473144531, "global_step": 106335, "epoch": 2531} {"train_loss": -6.286752223968506, "global_step": 106336, "epoch": 2531} {"train_loss": -6.463671684265137, "global_step": 106337, "epoch": 2531} {"train_loss": -6.227487564086914, "global_step": 106338, "epoch": 2531} {"train_loss": -6.464822292327881, "global_step": 106339, "epoch": 2531} {"train_loss": -6.4212965965271, "global_step": 106340, "epoch": 2531} {"train_loss": -6.370296478271484, "global_step": 106341, "epoch": 2531} {"train_loss": -6.346285820007324, "global_step": 106342, "epoch": 2531} {"train_loss": -6.414230414799282, "global_step": 106343, "epoch": 2531, "val_loss": 64609.7734375} {"train_loss": -6.379693508148193, "global_step": 106344, "epoch": 2532} {"train_loss": -6.335634231567383, "global_step": 106345, "epoch": 2532} {"train_loss": -6.286691665649414, "global_step": 106346, "epoch": 2532} {"train_loss": -6.303405284881592, "global_step": 106347, "epoch": 2532} {"train_loss": -6.368154525756836, "global_step": 106348, "epoch": 2532} {"train_loss": -6.309988975524902, "global_step": 106349, "epoch": 2532} {"train_loss": -6.400903701782227, "global_step": 106350, "epoch": 2532} {"train_loss": -6.4575066566467285, "global_step": 106351, "epoch": 2532} {"train_loss": -6.434725761413574, "global_step": 106352, "epoch": 2532} {"train_loss": -6.354804039001465, "global_step": 106353, "epoch": 2532} {"train_loss": -6.467784404754639, "global_step": 106354, "epoch": 2532} {"train_loss": -6.444576740264893, "global_step": 106355, "epoch": 2532} {"train_loss": -6.335354328155518, "global_step": 106356, "epoch": 2532} {"train_loss": -6.372813701629639, "global_step": 106357, "epoch": 2532} {"train_loss": -6.471845626831055, "global_step": 106358, "epoch": 2532} {"train_loss": -6.471134185791016, "global_step": 106359, "epoch": 2532} {"train_loss": -6.39570951461792, "global_step": 106360, "epoch": 2532} {"train_loss": -6.476980686187744, "global_step": 106361, "epoch": 2532} {"train_loss": -6.494643211364746, "global_step": 106362, "epoch": 2532} {"train_loss": -6.499506950378418, "global_step": 106363, "epoch": 2532} {"train_loss": -6.54121208190918, "global_step": 106364, "epoch": 2532} {"train_loss": -6.368378639221191, "global_step": 106365, "epoch": 2532} {"train_loss": -6.3610029220581055, "global_step": 106366, "epoch": 2532} {"train_loss": -6.454922676086426, "global_step": 106367, "epoch": 2532} {"train_loss": -6.3888349533081055, "global_step": 106368, "epoch": 2532} {"train_loss": -6.406653881072998, "global_step": 106369, "epoch": 2532} {"train_loss": -6.42633581161499, "global_step": 106370, "epoch": 2532} {"train_loss": -6.381381988525391, "global_step": 106371, "epoch": 2532} {"train_loss": -6.453174114227295, "global_step": 106372, "epoch": 2532} {"train_loss": -6.486509323120117, "global_step": 106373, "epoch": 2532} {"train_loss": -6.513993740081787, "global_step": 106374, "epoch": 2532} {"train_loss": -6.550396919250488, "global_step": 106375, "epoch": 2532} {"train_loss": -6.448272228240967, "global_step": 106376, "epoch": 2532} {"train_loss": -6.382746696472168, "global_step": 106377, "epoch": 2532} {"train_loss": -6.374346733093262, "global_step": 106378, "epoch": 2532} {"train_loss": -6.559466361999512, "global_step": 106379, "epoch": 2532} {"train_loss": -6.410947799682617, "global_step": 106380, "epoch": 2532} {"train_loss": -6.497369766235352, "global_step": 106381, "epoch": 2532} {"train_loss": -6.423453330993652, "global_step": 106382, "epoch": 2532} {"train_loss": -6.360592842102051, "global_step": 106383, "epoch": 2532} {"train_loss": -6.407366752624512, "global_step": 106384, "epoch": 2532} {"train_loss": -6.4198549929119295, "global_step": 106385, "epoch": 2532, "val_loss": 64708.12109375} {"train_loss": -6.446667671203613, "global_step": 106386, "epoch": 2533} {"train_loss": -6.504817485809326, "global_step": 106387, "epoch": 2533} {"train_loss": -6.463588714599609, "global_step": 106388, "epoch": 2533} {"train_loss": -6.468320846557617, "global_step": 106389, "epoch": 2533} {"train_loss": -6.503035545349121, "global_step": 106390, "epoch": 2533} {"train_loss": -6.546726703643799, "global_step": 106391, "epoch": 2533} {"train_loss": -6.32211971282959, "global_step": 106392, "epoch": 2533} {"train_loss": -6.466695308685303, "global_step": 106393, "epoch": 2533} {"train_loss": -6.429408073425293, "global_step": 106394, "epoch": 2533} {"train_loss": -6.483193874359131, "global_step": 106395, "epoch": 2533} {"train_loss": -6.521523475646973, "global_step": 106396, "epoch": 2533} {"train_loss": -6.4340105056762695, "global_step": 106397, "epoch": 2533} {"train_loss": -6.419758319854736, "global_step": 106398, "epoch": 2533} {"train_loss": -6.507240295410156, "global_step": 106399, "epoch": 2533} {"train_loss": -6.410419464111328, "global_step": 106400, "epoch": 2533} {"train_loss": -6.332477569580078, "global_step": 106401, "epoch": 2533} {"train_loss": -6.464541912078857, "global_step": 106402, "epoch": 2533} {"train_loss": -6.458708763122559, "global_step": 106403, "epoch": 2533} {"train_loss": -6.313323020935059, "global_step": 106404, "epoch": 2533} {"train_loss": -6.484663963317871, "global_step": 106405, "epoch": 2533} {"train_loss": -6.489136695861816, "global_step": 106406, "epoch": 2533} {"train_loss": -6.453921318054199, "global_step": 106407, "epoch": 2533} {"train_loss": -6.336831092834473, "global_step": 106408, "epoch": 2533} {"train_loss": -6.342245578765869, "global_step": 106409, "epoch": 2533} {"train_loss": -6.492245674133301, "global_step": 106410, "epoch": 2533} {"train_loss": -6.197319984436035, "global_step": 106411, "epoch": 2533} {"train_loss": -6.362829208374023, "global_step": 106412, "epoch": 2533} {"train_loss": -6.396550178527832, "global_step": 106413, "epoch": 2533} {"train_loss": -6.28190803527832, "global_step": 106414, "epoch": 2533} {"train_loss": -6.464160919189453, "global_step": 106415, "epoch": 2533} {"train_loss": -6.396854400634766, "global_step": 106416, "epoch": 2533} {"train_loss": -6.475770950317383, "global_step": 106417, "epoch": 2533} {"train_loss": -6.4513349533081055, "global_step": 106418, "epoch": 2533} {"train_loss": -6.470785617828369, "global_step": 106419, "epoch": 2533} {"train_loss": -6.447318077087402, "global_step": 106420, "epoch": 2533} {"train_loss": -6.561217784881592, "global_step": 106421, "epoch": 2533} {"train_loss": -6.407443046569824, "global_step": 106422, "epoch": 2533} {"train_loss": -6.408964157104492, "global_step": 106423, "epoch": 2533} {"train_loss": -6.3942389488220215, "global_step": 106424, "epoch": 2533} {"train_loss": -6.420660495758057, "global_step": 106425, "epoch": 2533} {"train_loss": -6.395613670349121, "global_step": 106426, "epoch": 2533} {"train_loss": -6.430006833303542, "global_step": 106427, "epoch": 2533, "val_loss": 64521.4609375} {"train_loss": -6.412603378295898, "global_step": 106428, "epoch": 2534} {"train_loss": -6.518964767456055, "global_step": 106429, "epoch": 2534} {"train_loss": -6.360719203948975, "global_step": 106430, "epoch": 2534} {"train_loss": -6.487786769866943, "global_step": 106431, "epoch": 2534} {"train_loss": -6.376856803894043, "global_step": 106432, "epoch": 2534} {"train_loss": -6.322340965270996, "global_step": 106433, "epoch": 2534} {"train_loss": -6.487934112548828, "global_step": 106434, "epoch": 2534} {"train_loss": -6.51408052444458, "global_step": 106435, "epoch": 2534} {"train_loss": -6.400849342346191, "global_step": 106436, "epoch": 2534} {"train_loss": -6.4236860275268555, "global_step": 106437, "epoch": 2534} {"train_loss": -6.37833833694458, "global_step": 106438, "epoch": 2534} {"train_loss": -6.526904582977295, "global_step": 106439, "epoch": 2534} {"train_loss": -6.452121734619141, "global_step": 106440, "epoch": 2534} {"train_loss": -6.632963180541992, "global_step": 106441, "epoch": 2534} {"train_loss": -6.4362993240356445, "global_step": 106442, "epoch": 2534} {"train_loss": -6.47662878036499, "global_step": 106443, "epoch": 2534} {"train_loss": -6.617517948150635, "global_step": 106444, "epoch": 2534} {"train_loss": -6.492018699645996, "global_step": 106445, "epoch": 2534} {"train_loss": -6.438700199127197, "global_step": 106446, "epoch": 2534} {"train_loss": -6.523967742919922, "global_step": 106447, "epoch": 2534} {"train_loss": -6.543068885803223, "global_step": 106448, "epoch": 2534} {"train_loss": -6.379354953765869, "global_step": 106449, "epoch": 2534} {"train_loss": -6.387439727783203, "global_step": 106450, "epoch": 2534} {"train_loss": -6.522709846496582, "global_step": 106451, "epoch": 2534} {"train_loss": -6.4474945068359375, "global_step": 106452, "epoch": 2534} {"train_loss": -6.492495536804199, "global_step": 106453, "epoch": 2534} {"train_loss": -6.426699638366699, "global_step": 106454, "epoch": 2534} {"train_loss": -6.317333221435547, "global_step": 106455, "epoch": 2534} {"train_loss": -6.5144524574279785, "global_step": 106456, "epoch": 2534} {"train_loss": -6.4701738357543945, "global_step": 106457, "epoch": 2534} {"train_loss": -6.417396545410156, "global_step": 106458, "epoch": 2534} {"train_loss": -6.571603775024414, "global_step": 106459, "epoch": 2534} {"train_loss": -6.5011796951293945, "global_step": 106460, "epoch": 2534} {"train_loss": -6.47237491607666, "global_step": 106461, "epoch": 2534} {"train_loss": -6.514517784118652, "global_step": 106462, "epoch": 2534} {"train_loss": -6.464272499084473, "global_step": 106463, "epoch": 2534} {"train_loss": -6.512955665588379, "global_step": 106464, "epoch": 2534} {"train_loss": -6.446498394012451, "global_step": 106465, "epoch": 2534} {"train_loss": -6.4065046310424805, "global_step": 106466, "epoch": 2534} {"train_loss": -6.591988563537598, "global_step": 106467, "epoch": 2534} {"train_loss": -6.48320198059082, "global_step": 106468, "epoch": 2534} {"train_loss": -6.4640519959586005, "global_step": 106469, "epoch": 2534, "val_loss": 64662.56640625} {"train_loss": -6.5024518966674805, "global_step": 106470, "epoch": 2535} {"train_loss": -6.400312423706055, "global_step": 106471, "epoch": 2535} {"train_loss": -6.379666328430176, "global_step": 106472, "epoch": 2535} {"train_loss": -6.48774528503418, "global_step": 106473, "epoch": 2535} {"train_loss": -6.230779647827148, "global_step": 106474, "epoch": 2535} {"train_loss": -6.2380146980285645, "global_step": 106475, "epoch": 2535} {"train_loss": -6.3730549812316895, "global_step": 106476, "epoch": 2535} {"train_loss": -6.38143253326416, "global_step": 106477, "epoch": 2535} {"train_loss": -6.427942276000977, "global_step": 106478, "epoch": 2535} {"train_loss": -6.497808456420898, "global_step": 106479, "epoch": 2535} {"train_loss": -6.518427848815918, "global_step": 106480, "epoch": 2535} {"train_loss": -6.5001373291015625, "global_step": 106481, "epoch": 2535} {"train_loss": -6.44851016998291, "global_step": 106482, "epoch": 2535} {"train_loss": -6.423923492431641, "global_step": 106483, "epoch": 2535} {"train_loss": -6.493387222290039, "global_step": 106484, "epoch": 2535} {"train_loss": -6.500950813293457, "global_step": 106485, "epoch": 2535} {"train_loss": -6.545774936676025, "global_step": 106486, "epoch": 2535} {"train_loss": -6.447403430938721, "global_step": 106487, "epoch": 2535} {"train_loss": -6.461447715759277, "global_step": 106488, "epoch": 2535} {"train_loss": -6.409284591674805, "global_step": 106489, "epoch": 2535} {"train_loss": -6.405975818634033, "global_step": 106490, "epoch": 2535} {"train_loss": -6.438107490539551, "global_step": 106491, "epoch": 2535} {"train_loss": -6.4780120849609375, "global_step": 106492, "epoch": 2535} {"train_loss": -6.560995101928711, "global_step": 106493, "epoch": 2535} {"train_loss": -6.582324028015137, "global_step": 106494, "epoch": 2535} {"train_loss": -6.453896999359131, "global_step": 106495, "epoch": 2535} {"train_loss": -6.36240291595459, "global_step": 106496, "epoch": 2535} {"train_loss": -6.518095970153809, "global_step": 106497, "epoch": 2535} {"train_loss": -6.351667404174805, "global_step": 106498, "epoch": 2535} {"train_loss": -6.558150768280029, "global_step": 106499, "epoch": 2535} {"train_loss": -6.460432529449463, "global_step": 106500, "epoch": 2535} {"train_loss": -6.400511741638184, "global_step": 106501, "epoch": 2535} {"train_loss": -6.532561302185059, "global_step": 106502, "epoch": 2535} {"train_loss": -6.360348701477051, "global_step": 106503, "epoch": 2535} {"train_loss": -6.275723457336426, "global_step": 106504, "epoch": 2535} {"train_loss": -6.4477620124816895, "global_step": 106505, "epoch": 2535} {"train_loss": -6.326990604400635, "global_step": 106506, "epoch": 2535} {"train_loss": -6.435715675354004, "global_step": 106507, "epoch": 2535} {"train_loss": -6.518792152404785, "global_step": 106508, "epoch": 2535} {"train_loss": -6.323455810546875, "global_step": 106509, "epoch": 2535} {"train_loss": -6.311444282531738, "global_step": 106510, "epoch": 2535} {"train_loss": -6.433385417574928, "global_step": 106511, "epoch": 2535, "val_loss": 64767.7265625} {"train_loss": -6.406703948974609, "global_step": 106512, "epoch": 2536} {"train_loss": -6.34425163269043, "global_step": 106513, "epoch": 2536} {"train_loss": -6.364871025085449, "global_step": 106514, "epoch": 2536} {"train_loss": -6.350769519805908, "global_step": 106515, "epoch": 2536} {"train_loss": -6.492541313171387, "global_step": 106516, "epoch": 2536} {"train_loss": -6.376928806304932, "global_step": 106517, "epoch": 2536} {"train_loss": -6.355539321899414, "global_step": 106518, "epoch": 2536} {"train_loss": -6.516986846923828, "global_step": 106519, "epoch": 2536} {"train_loss": -6.441620826721191, "global_step": 106520, "epoch": 2536} {"train_loss": -6.343278884887695, "global_step": 106521, "epoch": 2536} {"train_loss": -6.482336521148682, "global_step": 106522, "epoch": 2536} {"train_loss": -6.380193710327148, "global_step": 106523, "epoch": 2536} {"train_loss": -6.4087677001953125, "global_step": 106524, "epoch": 2536} {"train_loss": -6.407885551452637, "global_step": 106525, "epoch": 2536} {"train_loss": -6.497585296630859, "global_step": 106526, "epoch": 2536} {"train_loss": -6.427463531494141, "global_step": 106527, "epoch": 2536} {"train_loss": -6.409858226776123, "global_step": 106528, "epoch": 2536} {"train_loss": -6.438871383666992, "global_step": 106529, "epoch": 2536} {"train_loss": -6.429538726806641, "global_step": 106530, "epoch": 2536} {"train_loss": -6.428982734680176, "global_step": 106531, "epoch": 2536} {"train_loss": -6.48343563079834, "global_step": 106532, "epoch": 2536} {"train_loss": -6.3218584060668945, "global_step": 106533, "epoch": 2536} {"train_loss": -6.357997894287109, "global_step": 106534, "epoch": 2536} {"train_loss": -6.461244583129883, "global_step": 106535, "epoch": 2536} {"train_loss": -6.446048736572266, "global_step": 106536, "epoch": 2536} {"train_loss": -6.490550518035889, "global_step": 106537, "epoch": 2536} {"train_loss": -6.349832534790039, "global_step": 106538, "epoch": 2536} {"train_loss": -6.38641881942749, "global_step": 106539, "epoch": 2536} {"train_loss": -6.293160438537598, "global_step": 106540, "epoch": 2536} {"train_loss": -6.442197799682617, "global_step": 106541, "epoch": 2536} {"train_loss": -6.419887542724609, "global_step": 106542, "epoch": 2536} {"train_loss": -6.404933452606201, "global_step": 106543, "epoch": 2536} {"train_loss": -6.4981818199157715, "global_step": 106544, "epoch": 2536} {"train_loss": -6.481698989868164, "global_step": 106545, "epoch": 2536} {"train_loss": -6.463872909545898, "global_step": 106546, "epoch": 2536} {"train_loss": -6.490785598754883, "global_step": 106547, "epoch": 2536} {"train_loss": -6.235315322875977, "global_step": 106548, "epoch": 2536} {"train_loss": -6.475100994110107, "global_step": 106549, "epoch": 2536} {"train_loss": -6.445162773132324, "global_step": 106550, "epoch": 2536} {"train_loss": -6.436807632446289, "global_step": 106551, "epoch": 2536} {"train_loss": -6.393979072570801, "global_step": 106552, "epoch": 2536} {"train_loss": -6.41833818526495, "global_step": 106553, "epoch": 2536, "val_loss": 64683.20703125} {"train_loss": -6.378767967224121, "global_step": 106554, "epoch": 2537} {"train_loss": -6.513284206390381, "global_step": 106555, "epoch": 2537} {"train_loss": -6.3637285232543945, "global_step": 106556, "epoch": 2537} {"train_loss": -6.487360954284668, "global_step": 106557, "epoch": 2537} {"train_loss": -6.429233551025391, "global_step": 106558, "epoch": 2537} {"train_loss": -6.364473819732666, "global_step": 106559, "epoch": 2537} {"train_loss": -6.454019546508789, "global_step": 106560, "epoch": 2537} {"train_loss": -6.339138031005859, "global_step": 106561, "epoch": 2537} {"train_loss": -6.475488662719727, "global_step": 106562, "epoch": 2537} {"train_loss": -6.522211074829102, "global_step": 106563, "epoch": 2537} {"train_loss": -6.456120491027832, "global_step": 106564, "epoch": 2537} {"train_loss": -6.4519453048706055, "global_step": 106565, "epoch": 2537} {"train_loss": -6.499972343444824, "global_step": 106566, "epoch": 2537} {"train_loss": -6.458506107330322, "global_step": 106567, "epoch": 2537} {"train_loss": -6.3910441398620605, "global_step": 106568, "epoch": 2537} {"train_loss": -6.5731964111328125, "global_step": 106569, "epoch": 2537} {"train_loss": -6.422740936279297, "global_step": 106570, "epoch": 2537} {"train_loss": -6.521915912628174, "global_step": 106571, "epoch": 2537} {"train_loss": -6.4889421463012695, "global_step": 106572, "epoch": 2537} {"train_loss": -6.382905006408691, "global_step": 106573, "epoch": 2537} {"train_loss": -6.4226837158203125, "global_step": 106574, "epoch": 2537} {"train_loss": -6.384779930114746, "global_step": 106575, "epoch": 2537} {"train_loss": -6.3659515380859375, "global_step": 106576, "epoch": 2537} {"train_loss": -6.374174118041992, "global_step": 106577, "epoch": 2537} {"train_loss": -6.457680702209473, "global_step": 106578, "epoch": 2537} {"train_loss": -6.3880133628845215, "global_step": 106579, "epoch": 2537} {"train_loss": -6.399946689605713, "global_step": 106580, "epoch": 2537} {"train_loss": -6.442657470703125, "global_step": 106581, "epoch": 2537} {"train_loss": -6.5391340255737305, "global_step": 106582, "epoch": 2537} {"train_loss": -6.344525337219238, "global_step": 106583, "epoch": 2537} {"train_loss": -6.3951334953308105, "global_step": 106584, "epoch": 2537} {"train_loss": -6.478739261627197, "global_step": 106585, "epoch": 2537} {"train_loss": -6.485755920410156, "global_step": 106586, "epoch": 2537} {"train_loss": -6.536651611328125, "global_step": 106587, "epoch": 2537} {"train_loss": -6.493048667907715, "global_step": 106588, "epoch": 2537} {"train_loss": -6.528595924377441, "global_step": 106589, "epoch": 2537} {"train_loss": -6.5114569664001465, "global_step": 106590, "epoch": 2537} {"train_loss": -6.473362922668457, "global_step": 106591, "epoch": 2537} {"train_loss": -6.525541305541992, "global_step": 106592, "epoch": 2537} {"train_loss": -6.489314079284668, "global_step": 106593, "epoch": 2537} {"train_loss": -6.491792678833008, "global_step": 106594, "epoch": 2537} {"train_loss": -6.450285355250041, "global_step": 106595, "epoch": 2537, "val_loss": 64605.24609375} {"train_loss": -6.569087028503418, "global_step": 106596, "epoch": 2538} {"train_loss": -6.468513488769531, "global_step": 106597, "epoch": 2538} {"train_loss": -6.428843021392822, "global_step": 106598, "epoch": 2538} {"train_loss": -6.56564998626709, "global_step": 106599, "epoch": 2538} {"train_loss": -6.466493606567383, "global_step": 106600, "epoch": 2538} {"train_loss": -6.405570983886719, "global_step": 106601, "epoch": 2538} {"train_loss": -6.354008674621582, "global_step": 106602, "epoch": 2538} {"train_loss": -6.4694671630859375, "global_step": 106603, "epoch": 2538} {"train_loss": -6.526376724243164, "global_step": 106604, "epoch": 2538} {"train_loss": -6.461605548858643, "global_step": 106605, "epoch": 2538} {"train_loss": -6.395895957946777, "global_step": 106606, "epoch": 2538} {"train_loss": -6.396603584289551, "global_step": 106607, "epoch": 2538} {"train_loss": -6.392321586608887, "global_step": 106608, "epoch": 2538} {"train_loss": -6.508628845214844, "global_step": 106609, "epoch": 2538} {"train_loss": -6.415873050689697, "global_step": 106610, "epoch": 2538} {"train_loss": -6.397355556488037, "global_step": 106611, "epoch": 2538} {"train_loss": -6.417090892791748, "global_step": 106612, "epoch": 2538} {"train_loss": -6.407915115356445, "global_step": 106613, "epoch": 2538} {"train_loss": -6.460052490234375, "global_step": 106614, "epoch": 2538} {"train_loss": -6.410905361175537, "global_step": 106615, "epoch": 2538} {"train_loss": -6.3255109786987305, "global_step": 106616, "epoch": 2538} {"train_loss": -6.519130229949951, "global_step": 106617, "epoch": 2538} {"train_loss": -6.320544242858887, "global_step": 106618, "epoch": 2538} {"train_loss": -6.393275737762451, "global_step": 106619, "epoch": 2538} {"train_loss": -6.30555534362793, "global_step": 106620, "epoch": 2538} {"train_loss": -6.365965366363525, "global_step": 106621, "epoch": 2538} {"train_loss": -6.323172569274902, "global_step": 106622, "epoch": 2538} {"train_loss": -6.297645568847656, "global_step": 106623, "epoch": 2538} {"train_loss": -6.448728561401367, "global_step": 106624, "epoch": 2538} {"train_loss": -6.396965503692627, "global_step": 106625, "epoch": 2538} {"train_loss": -6.411798477172852, "global_step": 106626, "epoch": 2538} {"train_loss": -6.297191143035889, "global_step": 106627, "epoch": 2538} {"train_loss": -6.451770782470703, "global_step": 106628, "epoch": 2538} {"train_loss": -6.40952205657959, "global_step": 106629, "epoch": 2538} {"train_loss": -6.4241743087768555, "global_step": 106630, "epoch": 2538} {"train_loss": -6.360507965087891, "global_step": 106631, "epoch": 2538} {"train_loss": -6.2710089683532715, "global_step": 106632, "epoch": 2538} {"train_loss": -6.339386940002441, "global_step": 106633, "epoch": 2538} {"train_loss": -6.318880558013916, "global_step": 106634, "epoch": 2538} {"train_loss": -6.431063652038574, "global_step": 106635, "epoch": 2538} {"train_loss": -6.373882293701172, "global_step": 106636, "epoch": 2538} {"train_loss": -6.408198402041481, "global_step": 106637, "epoch": 2538, "val_loss": 64440.8046875} {"train_loss": -6.3618927001953125, "global_step": 106638, "epoch": 2539} {"train_loss": -6.483832359313965, "global_step": 106639, "epoch": 2539} {"train_loss": -6.480224132537842, "global_step": 106640, "epoch": 2539} {"train_loss": -6.4135823249816895, "global_step": 106641, "epoch": 2539} {"train_loss": -6.376781463623047, "global_step": 106642, "epoch": 2539} {"train_loss": -6.553661346435547, "global_step": 106643, "epoch": 2539} {"train_loss": -6.323315143585205, "global_step": 106644, "epoch": 2539} {"train_loss": -6.404759407043457, "global_step": 106645, "epoch": 2539} {"train_loss": -6.517265319824219, "global_step": 106646, "epoch": 2539} {"train_loss": -6.481685161590576, "global_step": 106647, "epoch": 2539} {"train_loss": -6.385239124298096, "global_step": 106648, "epoch": 2539} {"train_loss": -6.316183090209961, "global_step": 106649, "epoch": 2539} {"train_loss": -6.577866554260254, "global_step": 106650, "epoch": 2539} {"train_loss": -6.447038650512695, "global_step": 106651, "epoch": 2539} {"train_loss": -6.337845802307129, "global_step": 106652, "epoch": 2539} {"train_loss": -6.491153717041016, "global_step": 106653, "epoch": 2539} {"train_loss": -6.38829231262207, "global_step": 106654, "epoch": 2539} {"train_loss": -6.395051002502441, "global_step": 106655, "epoch": 2539} {"train_loss": -6.408517360687256, "global_step": 106656, "epoch": 2539} {"train_loss": -6.539977073669434, "global_step": 106657, "epoch": 2539} {"train_loss": -6.539177417755127, "global_step": 106658, "epoch": 2539} {"train_loss": -6.554306983947754, "global_step": 106659, "epoch": 2539} {"train_loss": -6.362085342407227, "global_step": 106660, "epoch": 2539} {"train_loss": -6.4637651443481445, "global_step": 106661, "epoch": 2539} {"train_loss": -6.4204936027526855, "global_step": 106662, "epoch": 2539} {"train_loss": -6.500080108642578, "global_step": 106663, "epoch": 2539} {"train_loss": -6.4697489738464355, "global_step": 106664, "epoch": 2539} {"train_loss": -6.402726650238037, "global_step": 106665, "epoch": 2539} {"train_loss": -6.356874465942383, "global_step": 106666, "epoch": 2539} {"train_loss": -6.48972225189209, "global_step": 106667, "epoch": 2539} {"train_loss": -6.474799156188965, "global_step": 106668, "epoch": 2539} {"train_loss": -6.430009841918945, "global_step": 106669, "epoch": 2539} {"train_loss": -6.4486083984375, "global_step": 106670, "epoch": 2539} {"train_loss": -6.3719987869262695, "global_step": 106671, "epoch": 2539} {"train_loss": -6.431547164916992, "global_step": 106672, "epoch": 2539} {"train_loss": -6.454914569854736, "global_step": 106673, "epoch": 2539} {"train_loss": -6.356556415557861, "global_step": 106674, "epoch": 2539} {"train_loss": -6.46665096282959, "global_step": 106675, "epoch": 2539} {"train_loss": -6.323427200317383, "global_step": 106676, "epoch": 2539} {"train_loss": -6.514537334442139, "global_step": 106677, "epoch": 2539} {"train_loss": -6.3988423347473145, "global_step": 106678, "epoch": 2539} {"train_loss": -6.43567088672093, "global_step": 106679, "epoch": 2539, "val_loss": 64744.86328125} {"train_loss": -6.464944839477539, "global_step": 106680, "epoch": 2540} {"train_loss": -6.407071113586426, "global_step": 106681, "epoch": 2540} {"train_loss": -6.351635932922363, "global_step": 106682, "epoch": 2540} {"train_loss": -6.371153831481934, "global_step": 106683, "epoch": 2540} {"train_loss": -6.3901448249816895, "global_step": 106684, "epoch": 2540} {"train_loss": -6.240604400634766, "global_step": 106685, "epoch": 2540} {"train_loss": -6.470497131347656, "global_step": 106686, "epoch": 2540} {"train_loss": -6.357182025909424, "global_step": 106687, "epoch": 2540} {"train_loss": -6.425207138061523, "global_step": 106688, "epoch": 2540} {"train_loss": -6.362490653991699, "global_step": 106689, "epoch": 2540} {"train_loss": -6.365569114685059, "global_step": 106690, "epoch": 2540} {"train_loss": -6.345029830932617, "global_step": 106691, "epoch": 2540} {"train_loss": -6.297210216522217, "global_step": 106692, "epoch": 2540} {"train_loss": -6.435378074645996, "global_step": 106693, "epoch": 2540} {"train_loss": -6.3012237548828125, "global_step": 106694, "epoch": 2540} {"train_loss": -6.288605690002441, "global_step": 106695, "epoch": 2540} {"train_loss": -6.422687530517578, "global_step": 106696, "epoch": 2540} {"train_loss": -6.370606422424316, "global_step": 106697, "epoch": 2540} {"train_loss": -6.457693576812744, "global_step": 106698, "epoch": 2540} {"train_loss": -6.487321853637695, "global_step": 106699, "epoch": 2540} {"train_loss": -6.381303310394287, "global_step": 106700, "epoch": 2540} {"train_loss": -6.500125408172607, "global_step": 106701, "epoch": 2540} {"train_loss": -6.403749465942383, "global_step": 106702, "epoch": 2540} {"train_loss": -6.532968997955322, "global_step": 106703, "epoch": 2540} {"train_loss": -6.455109119415283, "global_step": 106704, "epoch": 2540} {"train_loss": -6.487147331237793, "global_step": 106705, "epoch": 2540} {"train_loss": -6.484720230102539, "global_step": 106706, "epoch": 2540} {"train_loss": -6.362783432006836, "global_step": 106707, "epoch": 2540} {"train_loss": -6.422711372375488, "global_step": 106708, "epoch": 2540} {"train_loss": -6.355562210083008, "global_step": 106709, "epoch": 2540} {"train_loss": -6.460273742675781, "global_step": 106710, "epoch": 2540} {"train_loss": -6.379755973815918, "global_step": 106711, "epoch": 2540} {"train_loss": -6.5388336181640625, "global_step": 106712, "epoch": 2540} {"train_loss": -6.414438724517822, "global_step": 106713, "epoch": 2540} {"train_loss": -6.494924545288086, "global_step": 106714, "epoch": 2540} {"train_loss": -6.450778961181641, "global_step": 106715, "epoch": 2540} {"train_loss": -6.507783889770508, "global_step": 106716, "epoch": 2540} {"train_loss": -6.390084266662598, "global_step": 106717, "epoch": 2540} {"train_loss": -6.402867317199707, "global_step": 106718, "epoch": 2540} {"train_loss": -6.385451316833496, "global_step": 106719, "epoch": 2540} {"train_loss": -6.415958404541016, "global_step": 106720, "epoch": 2540} {"train_loss": -6.409713642937796, "global_step": 106721, "epoch": 2540, "val_loss": 64757.5390625} {"train_loss": -6.434043884277344, "global_step": 106722, "epoch": 2541} {"train_loss": -6.309107303619385, "global_step": 106723, "epoch": 2541} {"train_loss": -6.485547065734863, "global_step": 106724, "epoch": 2541} {"train_loss": -6.425776958465576, "global_step": 106725, "epoch": 2541} {"train_loss": -6.476701736450195, "global_step": 106726, "epoch": 2541} {"train_loss": -6.409248352050781, "global_step": 106727, "epoch": 2541} {"train_loss": -6.565345764160156, "global_step": 106728, "epoch": 2541} {"train_loss": -6.45424747467041, "global_step": 106729, "epoch": 2541} {"train_loss": -6.527782440185547, "global_step": 106730, "epoch": 2541} {"train_loss": -6.415097713470459, "global_step": 106731, "epoch": 2541} {"train_loss": -6.46051025390625, "global_step": 106732, "epoch": 2541} {"train_loss": -6.401932239532471, "global_step": 106733, "epoch": 2541} {"train_loss": -6.45497465133667, "global_step": 106734, "epoch": 2541} {"train_loss": -6.5507307052612305, "global_step": 106735, "epoch": 2541} {"train_loss": -6.595686912536621, "global_step": 106736, "epoch": 2541} {"train_loss": -6.485743045806885, "global_step": 106737, "epoch": 2541} {"train_loss": -6.372729301452637, "global_step": 106738, "epoch": 2541} {"train_loss": -6.544386863708496, "global_step": 106739, "epoch": 2541} {"train_loss": -6.563177108764648, "global_step": 106740, "epoch": 2541} {"train_loss": -6.424737930297852, "global_step": 106741, "epoch": 2541} {"train_loss": -6.423912525177002, "global_step": 106742, "epoch": 2541} {"train_loss": -6.422405242919922, "global_step": 106743, "epoch": 2541} {"train_loss": -6.437860488891602, "global_step": 106744, "epoch": 2541} {"train_loss": -6.418305397033691, "global_step": 106745, "epoch": 2541} {"train_loss": -6.487555027008057, "global_step": 106746, "epoch": 2541} {"train_loss": -6.298813819885254, "global_step": 106747, "epoch": 2541} {"train_loss": -6.517490386962891, "global_step": 106748, "epoch": 2541} {"train_loss": -6.44078254699707, "global_step": 106749, "epoch": 2541} {"train_loss": -6.350833892822266, "global_step": 106750, "epoch": 2541} {"train_loss": -6.464824676513672, "global_step": 106751, "epoch": 2541} {"train_loss": -6.433582305908203, "global_step": 106752, "epoch": 2541} {"train_loss": -6.385544300079346, "global_step": 106753, "epoch": 2541} {"train_loss": -6.520708084106445, "global_step": 106754, "epoch": 2541} {"train_loss": -6.483048439025879, "global_step": 106755, "epoch": 2541} {"train_loss": -6.444140434265137, "global_step": 106756, "epoch": 2541} {"train_loss": -6.402839660644531, "global_step": 106757, "epoch": 2541} {"train_loss": -6.3531341552734375, "global_step": 106758, "epoch": 2541} {"train_loss": -6.44634485244751, "global_step": 106759, "epoch": 2541} {"train_loss": -6.526537895202637, "global_step": 106760, "epoch": 2541} {"train_loss": -6.436508655548096, "global_step": 106761, "epoch": 2541} {"train_loss": -6.438798904418945, "global_step": 106762, "epoch": 2541} {"train_loss": -6.453400975181943, "global_step": 106763, "epoch": 2541, "val_loss": 64559.06640625} {"train_loss": -6.493786811828613, "global_step": 106764, "epoch": 2542} {"train_loss": -6.529916763305664, "global_step": 106765, "epoch": 2542} {"train_loss": -6.439614295959473, "global_step": 106766, "epoch": 2542} {"train_loss": -6.49162483215332, "global_step": 106767, "epoch": 2542} {"train_loss": -6.474150657653809, "global_step": 106768, "epoch": 2542} {"train_loss": -6.541523456573486, "global_step": 106769, "epoch": 2542} {"train_loss": -6.409887313842773, "global_step": 106770, "epoch": 2542} {"train_loss": -6.445134162902832, "global_step": 106771, "epoch": 2542} {"train_loss": -6.616393089294434, "global_step": 106772, "epoch": 2542} {"train_loss": -6.527895927429199, "global_step": 106773, "epoch": 2542} {"train_loss": -6.395933628082275, "global_step": 106774, "epoch": 2542} {"train_loss": -6.457900524139404, "global_step": 106775, "epoch": 2542} {"train_loss": -6.57170295715332, "global_step": 106776, "epoch": 2542} {"train_loss": -6.501543045043945, "global_step": 106777, "epoch": 2542} {"train_loss": -6.396104335784912, "global_step": 106778, "epoch": 2542} {"train_loss": -6.333715915679932, "global_step": 106779, "epoch": 2542} {"train_loss": -6.363237380981445, "global_step": 106780, "epoch": 2542} {"train_loss": -6.440506935119629, "global_step": 106781, "epoch": 2542} {"train_loss": -6.397890090942383, "global_step": 106782, "epoch": 2542} {"train_loss": -6.322380065917969, "global_step": 106783, "epoch": 2542} {"train_loss": -6.478188514709473, "global_step": 106784, "epoch": 2542} {"train_loss": -6.506717681884766, "global_step": 106785, "epoch": 2542} {"train_loss": -6.393048286437988, "global_step": 106786, "epoch": 2542} {"train_loss": -6.486184120178223, "global_step": 106787, "epoch": 2542} {"train_loss": -6.461897850036621, "global_step": 106788, "epoch": 2542} {"train_loss": -6.448185443878174, "global_step": 106789, "epoch": 2542} {"train_loss": -6.342168807983398, "global_step": 106790, "epoch": 2542} {"train_loss": -6.4285688400268555, "global_step": 106791, "epoch": 2542} {"train_loss": -6.482143878936768, "global_step": 106792, "epoch": 2542} {"train_loss": -6.390591621398926, "global_step": 106793, "epoch": 2542} {"train_loss": -6.411066055297852, "global_step": 106794, "epoch": 2542} {"train_loss": -6.381942272186279, "global_step": 106795, "epoch": 2542} {"train_loss": -6.4232587814331055, "global_step": 106796, "epoch": 2542} {"train_loss": -6.505526065826416, "global_step": 106797, "epoch": 2542} {"train_loss": -6.3820037841796875, "global_step": 106798, "epoch": 2542} {"train_loss": -6.432263374328613, "global_step": 106799, "epoch": 2542} {"train_loss": -6.527866363525391, "global_step": 106800, "epoch": 2542} {"train_loss": -6.4217000007629395, "global_step": 106801, "epoch": 2542} {"train_loss": -6.415982246398926, "global_step": 106802, "epoch": 2542} {"train_loss": -6.466253280639648, "global_step": 106803, "epoch": 2542} {"train_loss": -6.461215972900391, "global_step": 106804, "epoch": 2542} {"train_loss": -6.451808861323765, "global_step": 106805, "epoch": 2542, "val_loss": 64714.203125} {"train_loss": -6.414217472076416, "global_step": 106806, "epoch": 2543} {"train_loss": -6.437771797180176, "global_step": 106807, "epoch": 2543} {"train_loss": -6.471219062805176, "global_step": 106808, "epoch": 2543} {"train_loss": -6.497302055358887, "global_step": 106809, "epoch": 2543} {"train_loss": -6.511469841003418, "global_step": 106810, "epoch": 2543} {"train_loss": -6.429159641265869, "global_step": 106811, "epoch": 2543} {"train_loss": -6.534555435180664, "global_step": 106812, "epoch": 2543} {"train_loss": -6.409736633300781, "global_step": 106813, "epoch": 2543} {"train_loss": -6.41616153717041, "global_step": 106814, "epoch": 2543} {"train_loss": -6.456829071044922, "global_step": 106815, "epoch": 2543} {"train_loss": -6.443446159362793, "global_step": 106816, "epoch": 2543} {"train_loss": -6.4152140617370605, "global_step": 106817, "epoch": 2543} {"train_loss": -6.455900192260742, "global_step": 106818, "epoch": 2543} {"train_loss": -6.505810737609863, "global_step": 106819, "epoch": 2543} {"train_loss": -6.408639907836914, "global_step": 106820, "epoch": 2543} {"train_loss": -6.449470520019531, "global_step": 106821, "epoch": 2543} {"train_loss": -6.4697184562683105, "global_step": 106822, "epoch": 2543} {"train_loss": -6.616763114929199, "global_step": 106823, "epoch": 2543} {"train_loss": -6.424751281738281, "global_step": 106824, "epoch": 2543} {"train_loss": -6.5095415115356445, "global_step": 106825, "epoch": 2543} {"train_loss": -6.394588470458984, "global_step": 106826, "epoch": 2543} {"train_loss": -6.354343414306641, "global_step": 106827, "epoch": 2543} {"train_loss": -6.4254608154296875, "global_step": 106828, "epoch": 2543} {"train_loss": -6.326667308807373, "global_step": 106829, "epoch": 2543} {"train_loss": -6.370144844055176, "global_step": 106830, "epoch": 2543} {"train_loss": -6.481161594390869, "global_step": 106831, "epoch": 2543} {"train_loss": -6.286097049713135, "global_step": 106832, "epoch": 2543} {"train_loss": -6.512548446655273, "global_step": 106833, "epoch": 2543} {"train_loss": -6.466891288757324, "global_step": 106834, "epoch": 2543} {"train_loss": -6.387016773223877, "global_step": 106835, "epoch": 2543} {"train_loss": -6.435790061950684, "global_step": 106836, "epoch": 2543} {"train_loss": -6.372859954833984, "global_step": 106837, "epoch": 2543} {"train_loss": -6.503725051879883, "global_step": 106838, "epoch": 2543} {"train_loss": -6.468411445617676, "global_step": 106839, "epoch": 2543} {"train_loss": -6.338459014892578, "global_step": 106840, "epoch": 2543} {"train_loss": -6.442511558532715, "global_step": 106841, "epoch": 2543} {"train_loss": -6.396291732788086, "global_step": 106842, "epoch": 2543} {"train_loss": -6.47470235824585, "global_step": 106843, "epoch": 2543} {"train_loss": -6.339959621429443, "global_step": 106844, "epoch": 2543} {"train_loss": -6.248035430908203, "global_step": 106845, "epoch": 2543} {"train_loss": -6.483155250549316, "global_step": 106846, "epoch": 2543} {"train_loss": -6.433853626251221, "global_step": 106847, "epoch": 2543, "val_loss": 64986.18359375} {"train_loss": -6.320539951324463, "global_step": 106848, "epoch": 2544} {"train_loss": -6.361382484436035, "global_step": 106849, "epoch": 2544} {"train_loss": -6.359800338745117, "global_step": 106850, "epoch": 2544} {"train_loss": -6.471993446350098, "global_step": 106851, "epoch": 2544} {"train_loss": -6.281347751617432, "global_step": 106852, "epoch": 2544} {"train_loss": -6.315975189208984, "global_step": 106853, "epoch": 2544} {"train_loss": -6.46779727935791, "global_step": 106854, "epoch": 2544} {"train_loss": -6.2341203689575195, "global_step": 106855, "epoch": 2544} {"train_loss": -6.363409996032715, "global_step": 106856, "epoch": 2544} {"train_loss": -6.333732604980469, "global_step": 106857, "epoch": 2544} {"train_loss": -6.368518829345703, "global_step": 106858, "epoch": 2544} {"train_loss": -6.425729751586914, "global_step": 106859, "epoch": 2544} {"train_loss": -6.369552135467529, "global_step": 106860, "epoch": 2544} {"train_loss": -6.437127113342285, "global_step": 106861, "epoch": 2544} {"train_loss": -6.401941776275635, "global_step": 106862, "epoch": 2544} {"train_loss": -6.487885475158691, "global_step": 106863, "epoch": 2544} {"train_loss": -6.318297863006592, "global_step": 106864, "epoch": 2544} {"train_loss": -6.3620100021362305, "global_step": 106865, "epoch": 2544} {"train_loss": -6.410747528076172, "global_step": 106866, "epoch": 2544} {"train_loss": -6.301809787750244, "global_step": 106867, "epoch": 2544} {"train_loss": -6.450078964233398, "global_step": 106868, "epoch": 2544} {"train_loss": -6.414454460144043, "global_step": 106869, "epoch": 2544} {"train_loss": -6.376562595367432, "global_step": 106870, "epoch": 2544} {"train_loss": -6.341868877410889, "global_step": 106871, "epoch": 2544} {"train_loss": -6.45681095123291, "global_step": 106872, "epoch": 2544} {"train_loss": -6.439054489135742, "global_step": 106873, "epoch": 2544} {"train_loss": -6.479447364807129, "global_step": 106874, "epoch": 2544} {"train_loss": -6.370128154754639, "global_step": 106875, "epoch": 2544} {"train_loss": -6.479022026062012, "global_step": 106876, "epoch": 2544} {"train_loss": -6.3733415603637695, "global_step": 106877, "epoch": 2544} {"train_loss": -6.346000671386719, "global_step": 106878, "epoch": 2544} {"train_loss": -6.438510894775391, "global_step": 106879, "epoch": 2544} {"train_loss": -6.382808685302734, "global_step": 106880, "epoch": 2544} {"train_loss": -6.328232765197754, "global_step": 106881, "epoch": 2544} {"train_loss": -6.470829963684082, "global_step": 106882, "epoch": 2544} {"train_loss": -6.381069183349609, "global_step": 106883, "epoch": 2544} {"train_loss": -6.43058967590332, "global_step": 106884, "epoch": 2544} {"train_loss": -6.504891395568848, "global_step": 106885, "epoch": 2544} {"train_loss": -6.412805557250977, "global_step": 106886, "epoch": 2544} {"train_loss": -6.397197246551514, "global_step": 106887, "epoch": 2544} {"train_loss": -6.346959590911865, "global_step": 106888, "epoch": 2544} {"train_loss": -6.391867172150385, "global_step": 106889, "epoch": 2544, "val_loss": 64811.1328125} {"train_loss": -6.385591983795166, "global_step": 106890, "epoch": 2545} {"train_loss": -6.445416450500488, "global_step": 106891, "epoch": 2545} {"train_loss": -6.42460298538208, "global_step": 106892, "epoch": 2545} {"train_loss": -6.369788646697998, "global_step": 106893, "epoch": 2545} {"train_loss": -6.4514946937561035, "global_step": 106894, "epoch": 2545} {"train_loss": -6.441272735595703, "global_step": 106895, "epoch": 2545} {"train_loss": -6.509666442871094, "global_step": 106896, "epoch": 2545} {"train_loss": -6.420524597167969, "global_step": 106897, "epoch": 2545} {"train_loss": -6.399054527282715, "global_step": 106898, "epoch": 2545} {"train_loss": -6.42080020904541, "global_step": 106899, "epoch": 2545} {"train_loss": -6.423858642578125, "global_step": 106900, "epoch": 2545} {"train_loss": -6.3165483474731445, "global_step": 106901, "epoch": 2545} {"train_loss": -6.338099956512451, "global_step": 106902, "epoch": 2545} {"train_loss": -6.407813549041748, "global_step": 106903, "epoch": 2545} {"train_loss": -6.399476528167725, "global_step": 106904, "epoch": 2545} {"train_loss": -6.418542861938477, "global_step": 106905, "epoch": 2545} {"train_loss": -6.393085479736328, "global_step": 106906, "epoch": 2545} {"train_loss": -6.522069931030273, "global_step": 106907, "epoch": 2545} {"train_loss": -6.4612717628479, "global_step": 106908, "epoch": 2545} {"train_loss": -6.485819339752197, "global_step": 106909, "epoch": 2545} {"train_loss": -6.459898948669434, "global_step": 106910, "epoch": 2545} {"train_loss": -6.443588733673096, "global_step": 106911, "epoch": 2545} {"train_loss": -6.4686055183410645, "global_step": 106912, "epoch": 2545} {"train_loss": -6.34542179107666, "global_step": 106913, "epoch": 2545} {"train_loss": -6.42624568939209, "global_step": 106914, "epoch": 2545} {"train_loss": -6.418590068817139, "global_step": 106915, "epoch": 2545} {"train_loss": -6.400521278381348, "global_step": 106916, "epoch": 2545} {"train_loss": -6.296152114868164, "global_step": 106917, "epoch": 2545} {"train_loss": -6.509387016296387, "global_step": 106918, "epoch": 2545} {"train_loss": -6.441878318786621, "global_step": 106919, "epoch": 2545} {"train_loss": -6.292810440063477, "global_step": 106920, "epoch": 2545} {"train_loss": -6.367830276489258, "global_step": 106921, "epoch": 2545} {"train_loss": -6.24235725402832, "global_step": 106922, "epoch": 2545} {"train_loss": -6.444659233093262, "global_step": 106923, "epoch": 2545} {"train_loss": -6.353724479675293, "global_step": 106924, "epoch": 2545} {"train_loss": -6.344781875610352, "global_step": 106925, "epoch": 2545} {"train_loss": -6.434836387634277, "global_step": 106926, "epoch": 2545} {"train_loss": -6.3494110107421875, "global_step": 106927, "epoch": 2545} {"train_loss": -6.530160903930664, "global_step": 106928, "epoch": 2545} {"train_loss": -6.327310562133789, "global_step": 106929, "epoch": 2545} {"train_loss": -6.401589393615723, "global_step": 106930, "epoch": 2545} {"train_loss": -6.406890312830607, "global_step": 106931, "epoch": 2545, "val_loss": 64742.7109375} {"train_loss": -6.4031758308410645, "global_step": 106932, "epoch": 2546} {"train_loss": -6.230804920196533, "global_step": 106933, "epoch": 2546} {"train_loss": -6.471420764923096, "global_step": 106934, "epoch": 2546} {"train_loss": -6.360466480255127, "global_step": 106935, "epoch": 2546} {"train_loss": -6.48869514465332, "global_step": 106936, "epoch": 2546} {"train_loss": -6.348359107971191, "global_step": 106937, "epoch": 2546} {"train_loss": -6.382399559020996, "global_step": 106938, "epoch": 2546} {"train_loss": -6.3785834312438965, "global_step": 106939, "epoch": 2546} {"train_loss": -6.3874077796936035, "global_step": 106940, "epoch": 2546} {"train_loss": -6.38480806350708, "global_step": 106941, "epoch": 2546} {"train_loss": -6.420248985290527, "global_step": 106942, "epoch": 2546} {"train_loss": -6.422269344329834, "global_step": 106943, "epoch": 2546} {"train_loss": -6.4769816398620605, "global_step": 106944, "epoch": 2546} {"train_loss": -6.482998847961426, "global_step": 106945, "epoch": 2546} {"train_loss": -6.541173458099365, "global_step": 106946, "epoch": 2546} {"train_loss": -6.40099573135376, "global_step": 106947, "epoch": 2546} {"train_loss": -6.309234142303467, "global_step": 106948, "epoch": 2546} {"train_loss": -6.379214286804199, "global_step": 106949, "epoch": 2546} {"train_loss": -6.398556232452393, "global_step": 106950, "epoch": 2546} {"train_loss": -6.489693641662598, "global_step": 106951, "epoch": 2546} {"train_loss": -6.528858184814453, "global_step": 106952, "epoch": 2546} {"train_loss": -6.4276862144470215, "global_step": 106953, "epoch": 2546} {"train_loss": -6.417014122009277, "global_step": 106954, "epoch": 2546} {"train_loss": -6.52436637878418, "global_step": 106955, "epoch": 2546} {"train_loss": -6.428840637207031, "global_step": 106956, "epoch": 2546} {"train_loss": -6.392085075378418, "global_step": 106957, "epoch": 2546} {"train_loss": -6.418000221252441, "global_step": 106958, "epoch": 2546} {"train_loss": -6.460647106170654, "global_step": 106959, "epoch": 2546} {"train_loss": -6.415259838104248, "global_step": 106960, "epoch": 2546} {"train_loss": -6.466986656188965, "global_step": 106961, "epoch": 2546} {"train_loss": -6.374924659729004, "global_step": 106962, "epoch": 2546} {"train_loss": -6.421922206878662, "global_step": 106963, "epoch": 2546} {"train_loss": -6.460459232330322, "global_step": 106964, "epoch": 2546} {"train_loss": -6.394277572631836, "global_step": 106965, "epoch": 2546} {"train_loss": -6.40660285949707, "global_step": 106966, "epoch": 2546} {"train_loss": -6.434221267700195, "global_step": 106967, "epoch": 2546} {"train_loss": -6.439665794372559, "global_step": 106968, "epoch": 2546} {"train_loss": -6.3814849853515625, "global_step": 106969, "epoch": 2546} {"train_loss": -6.392495155334473, "global_step": 106970, "epoch": 2546} {"train_loss": -6.449904441833496, "global_step": 106971, "epoch": 2546} {"train_loss": -6.444568157196045, "global_step": 106972, "epoch": 2546} {"train_loss": -6.419924985794794, "global_step": 106973, "epoch": 2546, "val_loss": 64640.11328125} {"train_loss": -6.483048915863037, "global_step": 106974, "epoch": 2547} {"train_loss": -6.601111888885498, "global_step": 106975, "epoch": 2547} {"train_loss": -6.403532028198242, "global_step": 106976, "epoch": 2547} {"train_loss": -6.492339134216309, "global_step": 106977, "epoch": 2547} {"train_loss": -6.474699974060059, "global_step": 106978, "epoch": 2547} {"train_loss": -6.393538475036621, "global_step": 106979, "epoch": 2547} {"train_loss": -6.477219104766846, "global_step": 106980, "epoch": 2547} {"train_loss": -6.628650188446045, "global_step": 106981, "epoch": 2547} {"train_loss": -6.423008918762207, "global_step": 106982, "epoch": 2547} {"train_loss": -6.5892791748046875, "global_step": 106983, "epoch": 2547} {"train_loss": -6.461997985839844, "global_step": 106984, "epoch": 2547} {"train_loss": -6.484703063964844, "global_step": 106985, "epoch": 2547} {"train_loss": -6.441030979156494, "global_step": 106986, "epoch": 2547} {"train_loss": -6.463939666748047, "global_step": 106987, "epoch": 2547} {"train_loss": -6.467386245727539, "global_step": 106988, "epoch": 2547} {"train_loss": -6.437880039215088, "global_step": 106989, "epoch": 2547} {"train_loss": -6.511019706726074, "global_step": 106990, "epoch": 2547} {"train_loss": -6.4020280838012695, "global_step": 106991, "epoch": 2547} {"train_loss": -6.595813751220703, "global_step": 106992, "epoch": 2547} {"train_loss": -6.5596232414245605, "global_step": 106993, "epoch": 2547} {"train_loss": -6.421918869018555, "global_step": 106994, "epoch": 2547} {"train_loss": -6.56894588470459, "global_step": 106995, "epoch": 2547} {"train_loss": -6.563390731811523, "global_step": 106996, "epoch": 2547} {"train_loss": -6.552711486816406, "global_step": 106997, "epoch": 2547} {"train_loss": -6.507661819458008, "global_step": 106998, "epoch": 2547} {"train_loss": -6.410037994384766, "global_step": 106999, "epoch": 2547} {"train_loss": -6.505838871002197, "global_step": 107000, "epoch": 2547} {"train_loss": -6.5003132820129395, "global_step": 107001, "epoch": 2547} {"train_loss": -6.425589561462402, "global_step": 107002, "epoch": 2547} {"train_loss": -6.545773983001709, "global_step": 107003, "epoch": 2547} {"train_loss": -6.364828109741211, "global_step": 107004, "epoch": 2547} {"train_loss": -6.475617408752441, "global_step": 107005, "epoch": 2547} {"train_loss": -6.538677215576172, "global_step": 107006, "epoch": 2547} {"train_loss": -6.409704208374023, "global_step": 107007, "epoch": 2547} {"train_loss": -6.544447898864746, "global_step": 107008, "epoch": 2547} {"train_loss": -6.439900875091553, "global_step": 107009, "epoch": 2547} {"train_loss": -6.492469310760498, "global_step": 107010, "epoch": 2547} {"train_loss": -6.473241806030273, "global_step": 107011, "epoch": 2547} {"train_loss": -6.502050399780273, "global_step": 107012, "epoch": 2547} {"train_loss": -6.551601409912109, "global_step": 107013, "epoch": 2547} {"train_loss": -6.411399841308594, "global_step": 107014, "epoch": 2547} {"train_loss": -6.488120601290748, "global_step": 107015, "epoch": 2547, "val_loss": 64668.046875} {"train_loss": -6.417956352233887, "global_step": 107016, "epoch": 2548} {"train_loss": -6.516744136810303, "global_step": 107017, "epoch": 2548} {"train_loss": -6.561468124389648, "global_step": 107018, "epoch": 2548} {"train_loss": -6.4776763916015625, "global_step": 107019, "epoch": 2548} {"train_loss": -6.437762260437012, "global_step": 107020, "epoch": 2548} {"train_loss": -6.562475204467773, "global_step": 107021, "epoch": 2548} {"train_loss": -6.49705696105957, "global_step": 107022, "epoch": 2548} {"train_loss": -6.466882705688477, "global_step": 107023, "epoch": 2548} {"train_loss": -6.430768966674805, "global_step": 107024, "epoch": 2548} {"train_loss": -6.424732685089111, "global_step": 107025, "epoch": 2548} {"train_loss": -6.50463342666626, "global_step": 107026, "epoch": 2548} {"train_loss": -6.486993312835693, "global_step": 107027, "epoch": 2548} {"train_loss": -6.470398426055908, "global_step": 107028, "epoch": 2548} {"train_loss": -6.380547523498535, "global_step": 107029, "epoch": 2548} {"train_loss": -6.575181484222412, "global_step": 107030, "epoch": 2548} {"train_loss": -6.447420120239258, "global_step": 107031, "epoch": 2548} {"train_loss": -6.4458394050598145, "global_step": 107032, "epoch": 2548} {"train_loss": -6.437899589538574, "global_step": 107033, "epoch": 2548} {"train_loss": -6.435473442077637, "global_step": 107034, "epoch": 2548} {"train_loss": -6.492612838745117, "global_step": 107035, "epoch": 2548} {"train_loss": -6.418660640716553, "global_step": 107036, "epoch": 2548} {"train_loss": -6.4236297607421875, "global_step": 107037, "epoch": 2548} {"train_loss": -6.45088005065918, "global_step": 107038, "epoch": 2548} {"train_loss": -6.455327987670898, "global_step": 107039, "epoch": 2548} {"train_loss": -6.4886369705200195, "global_step": 107040, "epoch": 2548} {"train_loss": -6.439499855041504, "global_step": 107041, "epoch": 2548} {"train_loss": -6.520488739013672, "global_step": 107042, "epoch": 2548} {"train_loss": -6.438054084777832, "global_step": 107043, "epoch": 2548} {"train_loss": -6.553164482116699, "global_step": 107044, "epoch": 2548} {"train_loss": -6.536169052124023, "global_step": 107045, "epoch": 2548} {"train_loss": -6.486878395080566, "global_step": 107046, "epoch": 2548} {"train_loss": -6.400582313537598, "global_step": 107047, "epoch": 2548} {"train_loss": -6.389307975769043, "global_step": 107048, "epoch": 2548} {"train_loss": -6.504147052764893, "global_step": 107049, "epoch": 2548} {"train_loss": -6.454991340637207, "global_step": 107050, "epoch": 2548} {"train_loss": -6.4844770431518555, "global_step": 107051, "epoch": 2548} {"train_loss": -6.342517375946045, "global_step": 107052, "epoch": 2548} {"train_loss": -6.472918510437012, "global_step": 107053, "epoch": 2548} {"train_loss": -6.471327781677246, "global_step": 107054, "epoch": 2548} {"train_loss": -6.587759971618652, "global_step": 107055, "epoch": 2548} {"train_loss": -6.440720081329346, "global_step": 107056, "epoch": 2548} {"train_loss": -6.468638976414998, "global_step": 107057, "epoch": 2548, "val_loss": 64760.62109375} {"train_loss": -6.5170063972473145, "global_step": 107058, "epoch": 2549} {"train_loss": -6.439345359802246, "global_step": 107059, "epoch": 2549} {"train_loss": -6.535099029541016, "global_step": 107060, "epoch": 2549} {"train_loss": -6.478017807006836, "global_step": 107061, "epoch": 2549} {"train_loss": -6.518860816955566, "global_step": 107062, "epoch": 2549} {"train_loss": -6.484318733215332, "global_step": 107063, "epoch": 2549} {"train_loss": -6.543916702270508, "global_step": 107064, "epoch": 2549} {"train_loss": -6.479796409606934, "global_step": 107065, "epoch": 2549} {"train_loss": -6.449276924133301, "global_step": 107066, "epoch": 2549} {"train_loss": -6.435269355773926, "global_step": 107067, "epoch": 2549} {"train_loss": -6.413127899169922, "global_step": 107068, "epoch": 2549} {"train_loss": -6.461337089538574, "global_step": 107069, "epoch": 2549} {"train_loss": -6.505917549133301, "global_step": 107070, "epoch": 2549} {"train_loss": -6.441137313842773, "global_step": 107071, "epoch": 2549} {"train_loss": -6.469877243041992, "global_step": 107072, "epoch": 2549} {"train_loss": -6.3430328369140625, "global_step": 107073, "epoch": 2549} {"train_loss": -6.4730119705200195, "global_step": 107074, "epoch": 2549} {"train_loss": -6.515190124511719, "global_step": 107075, "epoch": 2549} {"train_loss": -6.515763282775879, "global_step": 107076, "epoch": 2549} {"train_loss": -6.408144950866699, "global_step": 107077, "epoch": 2549} {"train_loss": -6.479631423950195, "global_step": 107078, "epoch": 2549} {"train_loss": -6.465900421142578, "global_step": 107079, "epoch": 2549} {"train_loss": -6.413933277130127, "global_step": 107080, "epoch": 2549} {"train_loss": -6.422290802001953, "global_step": 107081, "epoch": 2549} {"train_loss": -6.335296630859375, "global_step": 107082, "epoch": 2549} {"train_loss": -6.275890350341797, "global_step": 107083, "epoch": 2549} {"train_loss": -6.28478479385376, "global_step": 107084, "epoch": 2549} {"train_loss": -6.387693405151367, "global_step": 107085, "epoch": 2549} {"train_loss": -6.375738620758057, "global_step": 107086, "epoch": 2549} {"train_loss": -6.415253639221191, "global_step": 107087, "epoch": 2549} {"train_loss": -6.334615230560303, "global_step": 107088, "epoch": 2549} {"train_loss": -6.399974822998047, "global_step": 107089, "epoch": 2549} {"train_loss": -6.34576416015625, "global_step": 107090, "epoch": 2549} {"train_loss": -6.340032577514648, "global_step": 107091, "epoch": 2549} {"train_loss": -6.357308864593506, "global_step": 107092, "epoch": 2549} {"train_loss": -6.351367473602295, "global_step": 107093, "epoch": 2549} {"train_loss": -6.347529411315918, "global_step": 107094, "epoch": 2549} {"train_loss": -6.340821743011475, "global_step": 107095, "epoch": 2549} {"train_loss": -6.451661586761475, "global_step": 107096, "epoch": 2549} {"train_loss": -6.379068374633789, "global_step": 107097, "epoch": 2549} {"train_loss": -6.427079677581787, "global_step": 107098, "epoch": 2549} {"train_loss": -6.424534525190081, "global_step": 107099, "epoch": 2549, "val_loss": 65085.7109375} {"train_loss": -6.413583755493164, "global_step": 107100, "epoch": 2550} {"train_loss": -6.383162021636963, "global_step": 107101, "epoch": 2550} {"train_loss": -6.498035907745361, "global_step": 107102, "epoch": 2550} {"train_loss": -6.453641414642334, "global_step": 107103, "epoch": 2550} {"train_loss": -6.4991936683654785, "global_step": 107104, "epoch": 2550} {"train_loss": -6.287240028381348, "global_step": 107105, "epoch": 2550} {"train_loss": -6.3894243240356445, "global_step": 107106, "epoch": 2550} {"train_loss": -6.386305809020996, "global_step": 107107, "epoch": 2550} {"train_loss": -6.4556779861450195, "global_step": 107108, "epoch": 2550} {"train_loss": -6.274608612060547, "global_step": 107109, "epoch": 2550} {"train_loss": -6.385004997253418, "global_step": 107110, "epoch": 2550} {"train_loss": -6.506071090698242, "global_step": 107111, "epoch": 2550} {"train_loss": -6.318500518798828, "global_step": 107112, "epoch": 2550} {"train_loss": -6.292216777801514, "global_step": 107113, "epoch": 2550} {"train_loss": -6.368952751159668, "global_step": 107114, "epoch": 2550} {"train_loss": -6.309122085571289, "global_step": 107115, "epoch": 2550} {"train_loss": -6.417544364929199, "global_step": 107116, "epoch": 2550} {"train_loss": -6.322422027587891, "global_step": 107117, "epoch": 2550} {"train_loss": -6.309466361999512, "global_step": 107118, "epoch": 2550} {"train_loss": -6.4121270179748535, "global_step": 107119, "epoch": 2550} {"train_loss": -6.367722511291504, "global_step": 107120, "epoch": 2550} {"train_loss": -6.344013690948486, "global_step": 107121, "epoch": 2550} {"train_loss": -6.396894454956055, "global_step": 107122, "epoch": 2550} {"train_loss": -6.451958179473877, "global_step": 107123, "epoch": 2550} {"train_loss": -6.5329484939575195, "global_step": 107124, "epoch": 2550} {"train_loss": -6.397958755493164, "global_step": 107125, "epoch": 2550} {"train_loss": -6.327387809753418, "global_step": 107126, "epoch": 2550} {"train_loss": -6.443846702575684, "global_step": 107127, "epoch": 2550} {"train_loss": -6.331754684448242, "global_step": 107128, "epoch": 2550} {"train_loss": -6.314944744110107, "global_step": 107129, "epoch": 2550} {"train_loss": -6.400264739990234, "global_step": 107130, "epoch": 2550} {"train_loss": -6.401785850524902, "global_step": 107131, "epoch": 2550} {"train_loss": -6.473672866821289, "global_step": 107132, "epoch": 2550} {"train_loss": -6.521563529968262, "global_step": 107133, "epoch": 2550} {"train_loss": -6.4471869468688965, "global_step": 107134, "epoch": 2550} {"train_loss": -6.592358589172363, "global_step": 107135, "epoch": 2550} {"train_loss": -6.483870029449463, "global_step": 107136, "epoch": 2550} {"train_loss": -6.495694160461426, "global_step": 107137, "epoch": 2550} {"train_loss": -6.392030715942383, "global_step": 107138, "epoch": 2550} {"train_loss": -6.42061185836792, "global_step": 107139, "epoch": 2550} {"train_loss": -6.372071743011475, "global_step": 107140, "epoch": 2550} {"train_loss": -6.4031214486984975, "global_step": 107141, "epoch": 2550, "train/sim_max_reward_0": 0.19868765511341854, "train/sim_max_reward_1": 0.3404817814427169, "train/sim_max_reward_2": 0.2513251528723951, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.9596948891704477, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.16728468496085802, "test/sim_max_reward_4300001": 0.6612757024354092, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.8116309237128706, "test/sim_max_reward_4300004": 0.2794289634073585, "test/sim_max_reward_4300005": 0.7407889988468563, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.602198522469132, "test/sim_max_reward_4300008": 0.9330331934451971, "test/sim_max_reward_4300009": 0.909734934824126, "test/sim_max_reward_4300010": 0.9140242264986826, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.9737729876526191, "test/sim_max_reward_4300013": 0.9878011876702265, "test/sim_max_reward_4300014": 0.9871999694475478, "test/sim_max_reward_4300015": 0.974637715057875, "test/sim_max_reward_4300016": 0.9593759477836482, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.3944740204031552, "test/sim_max_reward_4300019": 0.18806271942120417, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8868116321907047, "test/sim_max_reward_4300022": 0.9682974786211397, "test/sim_max_reward_4300023": 0.4217248366850533, "test/sim_max_reward_4300024": 0.32609463275106104, "test/sim_max_reward_4300025": 0.34006500255556965, "test/sim_max_reward_4300026": 0.18321907219848627, "test/sim_max_reward_4300027": 0.9015649458949498, "test/sim_max_reward_4300028": 0.004232253590618785, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.1589448297325597, "test/sim_max_reward_4300031": 0.21265363329572856, "test/sim_max_reward_4300032": 0.8660572125279274, "test/sim_max_reward_4300033": 1.0, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.3039539033731744, "test/sim_max_reward_4300036": 0.1999799473227696, "test/sim_max_reward_4300037": 0.8463465217886442, "test/sim_max_reward_4300038": 0.0, "test/sim_max_reward_4300039": 0.7643303376894777, "test/sim_max_reward_4300040": 0.6677840055291009, "test/sim_max_reward_4300041": 0.9423121193134986, "test/sim_max_reward_4300042": 0.9760510790998825, "test/sim_max_reward_4300043": 0.02508858726066159, "test/sim_max_reward_4300044": 0.9724064783031987, "test/sim_max_reward_4300045": 0.1863667832688025, "test/sim_max_reward_4300046": 0.9779857917167262, "test/sim_max_reward_4300047": 0.8960181130641557, "test/sim_max_reward_4300048": 0.8494086645771094, "test/sim_max_reward_4300049": 0.15362857068160063, "train/mean_score": 0.4905290396601943, "test/mean_score": 0.5903210226213873, "val_loss": 64622.39453125} {"train_loss": -6.413485527038574, "global_step": 107142, "epoch": 2551} {"train_loss": -6.506434440612793, "global_step": 107143, "epoch": 2551} {"train_loss": -6.413218021392822, "global_step": 107144, "epoch": 2551} {"train_loss": -6.4678473472595215, "global_step": 107145, "epoch": 2551} {"train_loss": -6.358532905578613, "global_step": 107146, "epoch": 2551} {"train_loss": -6.468681335449219, "global_step": 107147, "epoch": 2551} {"train_loss": -6.448945999145508, "global_step": 107148, "epoch": 2551} {"train_loss": -6.453459739685059, "global_step": 107149, "epoch": 2551} {"train_loss": -6.371905326843262, "global_step": 107150, "epoch": 2551} {"train_loss": -6.388510227203369, "global_step": 107151, "epoch": 2551} {"train_loss": -6.492358207702637, "global_step": 107152, "epoch": 2551} {"train_loss": -6.542842864990234, "global_step": 107153, "epoch": 2551} {"train_loss": -6.490749359130859, "global_step": 107154, "epoch": 2551} {"train_loss": -6.377919673919678, "global_step": 107155, "epoch": 2551} {"train_loss": -6.448929309844971, "global_step": 107156, "epoch": 2551} {"train_loss": -6.570473670959473, "global_step": 107157, "epoch": 2551} {"train_loss": -6.211672782897949, "global_step": 107158, "epoch": 2551} {"train_loss": -6.422917366027832, "global_step": 107159, "epoch": 2551} {"train_loss": -6.494615077972412, "global_step": 107160, "epoch": 2551} {"train_loss": -6.332265853881836, "global_step": 107161, "epoch": 2551} {"train_loss": -6.453084945678711, "global_step": 107162, "epoch": 2551} {"train_loss": -6.303068161010742, "global_step": 107163, "epoch": 2551} {"train_loss": -6.325771331787109, "global_step": 107164, "epoch": 2551} {"train_loss": -6.417265892028809, "global_step": 107165, "epoch": 2551} {"train_loss": -6.455880165100098, "global_step": 107166, "epoch": 2551} {"train_loss": -6.308382511138916, "global_step": 107167, "epoch": 2551} {"train_loss": -6.4934539794921875, "global_step": 107168, "epoch": 2551} {"train_loss": -6.266549110412598, "global_step": 107169, "epoch": 2551} {"train_loss": -6.414483070373535, "global_step": 107170, "epoch": 2551} {"train_loss": -6.371551036834717, "global_step": 107171, "epoch": 2551} {"train_loss": -6.271486282348633, "global_step": 107172, "epoch": 2551} {"train_loss": -6.4491071701049805, "global_step": 107173, "epoch": 2551} {"train_loss": -6.294365882873535, "global_step": 107174, "epoch": 2551} {"train_loss": -6.414082050323486, "global_step": 107175, "epoch": 2551} {"train_loss": -6.307740211486816, "global_step": 107176, "epoch": 2551} {"train_loss": -6.40308141708374, "global_step": 107177, "epoch": 2551} {"train_loss": -6.332742691040039, "global_step": 107178, "epoch": 2551} {"train_loss": -6.387899875640869, "global_step": 107179, "epoch": 2551} {"train_loss": -6.42097282409668, "global_step": 107180, "epoch": 2551} {"train_loss": -6.351323127746582, "global_step": 107181, "epoch": 2551} {"train_loss": -6.3134918212890625, "global_step": 107182, "epoch": 2551} {"train_loss": -6.398929573240734, "global_step": 107183, "epoch": 2551, "val_loss": 64575.72265625} {"train_loss": -6.3361358642578125, "global_step": 107184, "epoch": 2552} {"train_loss": -6.381185531616211, "global_step": 107185, "epoch": 2552} {"train_loss": -6.450510025024414, "global_step": 107186, "epoch": 2552} {"train_loss": -6.323984146118164, "global_step": 107187, "epoch": 2552} {"train_loss": -6.432516574859619, "global_step": 107188, "epoch": 2552} {"train_loss": -6.423732280731201, "global_step": 107189, "epoch": 2552} {"train_loss": -6.429858207702637, "global_step": 107190, "epoch": 2552} {"train_loss": -6.41159200668335, "global_step": 107191, "epoch": 2552} {"train_loss": -6.459259033203125, "global_step": 107192, "epoch": 2552} {"train_loss": -6.411660194396973, "global_step": 107193, "epoch": 2552} {"train_loss": -6.5073347091674805, "global_step": 107194, "epoch": 2552} {"train_loss": -6.471748352050781, "global_step": 107195, "epoch": 2552} {"train_loss": -6.532392978668213, "global_step": 107196, "epoch": 2552} {"train_loss": -6.405597686767578, "global_step": 107197, "epoch": 2552} {"train_loss": -6.516654968261719, "global_step": 107198, "epoch": 2552} {"train_loss": -6.472631454467773, "global_step": 107199, "epoch": 2552} {"train_loss": -6.363415718078613, "global_step": 107200, "epoch": 2552} {"train_loss": -6.409418106079102, "global_step": 107201, "epoch": 2552} {"train_loss": -6.365618705749512, "global_step": 107202, "epoch": 2552} {"train_loss": -6.483863830566406, "global_step": 107203, "epoch": 2552} {"train_loss": -6.339922904968262, "global_step": 107204, "epoch": 2552} {"train_loss": -6.407691955566406, "global_step": 107205, "epoch": 2552} {"train_loss": -6.429262161254883, "global_step": 107206, "epoch": 2552} {"train_loss": -6.394263744354248, "global_step": 107207, "epoch": 2552} {"train_loss": -6.428745746612549, "global_step": 107208, "epoch": 2552} {"train_loss": -6.3354363441467285, "global_step": 107209, "epoch": 2552} {"train_loss": -6.541836738586426, "global_step": 107210, "epoch": 2552} {"train_loss": -6.508338928222656, "global_step": 107211, "epoch": 2552} {"train_loss": -6.409738540649414, "global_step": 107212, "epoch": 2552} {"train_loss": -6.428411483764648, "global_step": 107213, "epoch": 2552} {"train_loss": -6.4148712158203125, "global_step": 107214, "epoch": 2552} {"train_loss": -6.411136627197266, "global_step": 107215, "epoch": 2552} {"train_loss": -6.500030517578125, "global_step": 107216, "epoch": 2552} {"train_loss": -6.42294979095459, "global_step": 107217, "epoch": 2552} {"train_loss": -6.475054740905762, "global_step": 107218, "epoch": 2552} {"train_loss": -6.35003137588501, "global_step": 107219, "epoch": 2552} {"train_loss": -6.497862815856934, "global_step": 107220, "epoch": 2552} {"train_loss": -6.381526947021484, "global_step": 107221, "epoch": 2552} {"train_loss": -6.5495405197143555, "global_step": 107222, "epoch": 2552} {"train_loss": -6.293661594390869, "global_step": 107223, "epoch": 2552} {"train_loss": -6.48013973236084, "global_step": 107224, "epoch": 2552} {"train_loss": -6.427796216238113, "global_step": 107225, "epoch": 2552, "val_loss": 64932.7734375} {"train_loss": -6.395527362823486, "global_step": 107226, "epoch": 2553} {"train_loss": -6.422922134399414, "global_step": 107227, "epoch": 2553} {"train_loss": -6.500782012939453, "global_step": 107228, "epoch": 2553} {"train_loss": -6.4366559982299805, "global_step": 107229, "epoch": 2553} {"train_loss": -6.418133735656738, "global_step": 107230, "epoch": 2553} {"train_loss": -6.467157363891602, "global_step": 107231, "epoch": 2553} {"train_loss": -6.42159366607666, "global_step": 107232, "epoch": 2553} {"train_loss": -6.336439609527588, "global_step": 107233, "epoch": 2553} {"train_loss": -6.471336364746094, "global_step": 107234, "epoch": 2553} {"train_loss": -6.458793640136719, "global_step": 107235, "epoch": 2553} {"train_loss": -6.3879899978637695, "global_step": 107236, "epoch": 2553} {"train_loss": -6.365548133850098, "global_step": 107237, "epoch": 2553} {"train_loss": -6.347036361694336, "global_step": 107238, "epoch": 2553} {"train_loss": -6.302910327911377, "global_step": 107239, "epoch": 2553} {"train_loss": -6.304287433624268, "global_step": 107240, "epoch": 2553} {"train_loss": -6.405631065368652, "global_step": 107241, "epoch": 2553} {"train_loss": -6.3538031578063965, "global_step": 107242, "epoch": 2553} {"train_loss": -6.476390838623047, "global_step": 107243, "epoch": 2553} {"train_loss": -6.397904396057129, "global_step": 107244, "epoch": 2553} {"train_loss": -6.330216407775879, "global_step": 107245, "epoch": 2553} {"train_loss": -6.503262042999268, "global_step": 107246, "epoch": 2553} {"train_loss": -6.354760646820068, "global_step": 107247, "epoch": 2553} {"train_loss": -6.422016143798828, "global_step": 107248, "epoch": 2553} {"train_loss": -6.26637077331543, "global_step": 107249, "epoch": 2553} {"train_loss": -6.337250709533691, "global_step": 107250, "epoch": 2553} {"train_loss": -6.447694301605225, "global_step": 107251, "epoch": 2553} {"train_loss": -6.376100063323975, "global_step": 107252, "epoch": 2553} {"train_loss": -6.5091986656188965, "global_step": 107253, "epoch": 2553} {"train_loss": -6.3178629875183105, "global_step": 107254, "epoch": 2553} {"train_loss": -6.521648406982422, "global_step": 107255, "epoch": 2553} {"train_loss": -6.310117721557617, "global_step": 107256, "epoch": 2553} {"train_loss": -6.3431854248046875, "global_step": 107257, "epoch": 2553} {"train_loss": -6.413177490234375, "global_step": 107258, "epoch": 2553} {"train_loss": -6.412451267242432, "global_step": 107259, "epoch": 2553} {"train_loss": -6.531612396240234, "global_step": 107260, "epoch": 2553} {"train_loss": -6.371699333190918, "global_step": 107261, "epoch": 2553} {"train_loss": -6.436432838439941, "global_step": 107262, "epoch": 2553} {"train_loss": -6.44649600982666, "global_step": 107263, "epoch": 2553} {"train_loss": -6.428885459899902, "global_step": 107264, "epoch": 2553} {"train_loss": -6.454115867614746, "global_step": 107265, "epoch": 2553} {"train_loss": -6.5254740715026855, "global_step": 107266, "epoch": 2553} {"train_loss": -6.409262157621837, "global_step": 107267, "epoch": 2553, "val_loss": 64502.25} {"train_loss": -6.500783443450928, "global_step": 107268, "epoch": 2554} {"train_loss": -6.4290080070495605, "global_step": 107269, "epoch": 2554} {"train_loss": -6.480599403381348, "global_step": 107270, "epoch": 2554} {"train_loss": -6.463920593261719, "global_step": 107271, "epoch": 2554} {"train_loss": -6.340662956237793, "global_step": 107272, "epoch": 2554} {"train_loss": -6.522717475891113, "global_step": 107273, "epoch": 2554} {"train_loss": -6.461676120758057, "global_step": 107274, "epoch": 2554} {"train_loss": -6.528635025024414, "global_step": 107275, "epoch": 2554} {"train_loss": -6.605462074279785, "global_step": 107276, "epoch": 2554} {"train_loss": -6.52010440826416, "global_step": 107277, "epoch": 2554} {"train_loss": -6.515416145324707, "global_step": 107278, "epoch": 2554} {"train_loss": -6.395259857177734, "global_step": 107279, "epoch": 2554} {"train_loss": -6.461038589477539, "global_step": 107280, "epoch": 2554} {"train_loss": -6.473857879638672, "global_step": 107281, "epoch": 2554} {"train_loss": -6.313385009765625, "global_step": 107282, "epoch": 2554} {"train_loss": -6.523373603820801, "global_step": 107283, "epoch": 2554} {"train_loss": -6.520310401916504, "global_step": 107284, "epoch": 2554} {"train_loss": -6.358456611633301, "global_step": 107285, "epoch": 2554} {"train_loss": -6.349071025848389, "global_step": 107286, "epoch": 2554} {"train_loss": -6.500693321228027, "global_step": 107287, "epoch": 2554} {"train_loss": -6.452345371246338, "global_step": 107288, "epoch": 2554} {"train_loss": -6.427796840667725, "global_step": 107289, "epoch": 2554} {"train_loss": -6.454908847808838, "global_step": 107290, "epoch": 2554} {"train_loss": -6.468857765197754, "global_step": 107291, "epoch": 2554} {"train_loss": -6.45180606842041, "global_step": 107292, "epoch": 2554} {"train_loss": -6.542949199676514, "global_step": 107293, "epoch": 2554} {"train_loss": -6.462039947509766, "global_step": 107294, "epoch": 2554} {"train_loss": -6.511730194091797, "global_step": 107295, "epoch": 2554} {"train_loss": -6.427073955535889, "global_step": 107296, "epoch": 2554} {"train_loss": -6.511138916015625, "global_step": 107297, "epoch": 2554} {"train_loss": -6.457414627075195, "global_step": 107298, "epoch": 2554} {"train_loss": -6.500247478485107, "global_step": 107299, "epoch": 2554} {"train_loss": -6.412574768066406, "global_step": 107300, "epoch": 2554} {"train_loss": -6.530320644378662, "global_step": 107301, "epoch": 2554} {"train_loss": -6.371733665466309, "global_step": 107302, "epoch": 2554} {"train_loss": -6.412321090698242, "global_step": 107303, "epoch": 2554} {"train_loss": -6.318552017211914, "global_step": 107304, "epoch": 2554} {"train_loss": -6.368799686431885, "global_step": 107305, "epoch": 2554} {"train_loss": -6.35329532623291, "global_step": 107306, "epoch": 2554} {"train_loss": -6.289950370788574, "global_step": 107307, "epoch": 2554} {"train_loss": -6.4350128173828125, "global_step": 107308, "epoch": 2554} {"train_loss": -6.450731163933163, "global_step": 107309, "epoch": 2554, "val_loss": 64781.1875} {"train_loss": -6.46815299987793, "global_step": 107310, "epoch": 2555} {"train_loss": -6.44879150390625, "global_step": 107311, "epoch": 2555} {"train_loss": -6.415402412414551, "global_step": 107312, "epoch": 2555} {"train_loss": -6.527291297912598, "global_step": 107313, "epoch": 2555} {"train_loss": -6.448648452758789, "global_step": 107314, "epoch": 2555} {"train_loss": -6.3993449211120605, "global_step": 107315, "epoch": 2555} {"train_loss": -6.465986251831055, "global_step": 107316, "epoch": 2555} {"train_loss": -6.470624923706055, "global_step": 107317, "epoch": 2555} {"train_loss": -6.462296009063721, "global_step": 107318, "epoch": 2555} {"train_loss": -6.5843505859375, "global_step": 107319, "epoch": 2555} {"train_loss": -6.360494613647461, "global_step": 107320, "epoch": 2555} {"train_loss": -6.335982799530029, "global_step": 107321, "epoch": 2555} {"train_loss": -6.438929557800293, "global_step": 107322, "epoch": 2555} {"train_loss": -6.486288070678711, "global_step": 107323, "epoch": 2555} {"train_loss": -6.372777938842773, "global_step": 107324, "epoch": 2555} {"train_loss": -6.423343658447266, "global_step": 107325, "epoch": 2555} {"train_loss": -6.41856050491333, "global_step": 107326, "epoch": 2555} {"train_loss": -6.393469333648682, "global_step": 107327, "epoch": 2555} {"train_loss": -6.4182610511779785, "global_step": 107328, "epoch": 2555} {"train_loss": -6.451170444488525, "global_step": 107329, "epoch": 2555} {"train_loss": -6.435927391052246, "global_step": 107330, "epoch": 2555} {"train_loss": -6.288570404052734, "global_step": 107331, "epoch": 2555} {"train_loss": -6.399370193481445, "global_step": 107332, "epoch": 2555} {"train_loss": -6.430531978607178, "global_step": 107333, "epoch": 2555} {"train_loss": -6.395135879516602, "global_step": 107334, "epoch": 2555} {"train_loss": -6.398908615112305, "global_step": 107335, "epoch": 2555} {"train_loss": -6.4937028884887695, "global_step": 107336, "epoch": 2555} {"train_loss": -6.4554219245910645, "global_step": 107337, "epoch": 2555} {"train_loss": -6.310864448547363, "global_step": 107338, "epoch": 2555} {"train_loss": -6.476728439331055, "global_step": 107339, "epoch": 2555} {"train_loss": -6.468598365783691, "global_step": 107340, "epoch": 2555} {"train_loss": -6.496212005615234, "global_step": 107341, "epoch": 2555} {"train_loss": -6.437165260314941, "global_step": 107342, "epoch": 2555} {"train_loss": -6.489928245544434, "global_step": 107343, "epoch": 2555} {"train_loss": -6.49256706237793, "global_step": 107344, "epoch": 2555} {"train_loss": -6.401234149932861, "global_step": 107345, "epoch": 2555} {"train_loss": -6.392242908477783, "global_step": 107346, "epoch": 2555} {"train_loss": -6.508528709411621, "global_step": 107347, "epoch": 2555} {"train_loss": -6.567244052886963, "global_step": 107348, "epoch": 2555} {"train_loss": -6.47819709777832, "global_step": 107349, "epoch": 2555} {"train_loss": -6.440520286560059, "global_step": 107350, "epoch": 2555} {"train_loss": -6.442640315918696, "global_step": 107351, "epoch": 2555, "val_loss": 64855.88671875} {"train_loss": -6.537179946899414, "global_step": 107352, "epoch": 2556} {"train_loss": -6.527736663818359, "global_step": 107353, "epoch": 2556} {"train_loss": -6.399507522583008, "global_step": 107354, "epoch": 2556} {"train_loss": -6.498767852783203, "global_step": 107355, "epoch": 2556} {"train_loss": -6.43228816986084, "global_step": 107356, "epoch": 2556} {"train_loss": -6.517542362213135, "global_step": 107357, "epoch": 2556} {"train_loss": -6.473971366882324, "global_step": 107358, "epoch": 2556} {"train_loss": -6.327393531799316, "global_step": 107359, "epoch": 2556} {"train_loss": -6.4005045890808105, "global_step": 107360, "epoch": 2556} {"train_loss": -6.440850257873535, "global_step": 107361, "epoch": 2556} {"train_loss": -6.423394203186035, "global_step": 107362, "epoch": 2556} {"train_loss": -6.376666069030762, "global_step": 107363, "epoch": 2556} {"train_loss": -6.410281658172607, "global_step": 107364, "epoch": 2556} {"train_loss": -6.383477687835693, "global_step": 107365, "epoch": 2556} {"train_loss": -6.494359970092773, "global_step": 107366, "epoch": 2556} {"train_loss": -6.475278854370117, "global_step": 107367, "epoch": 2556} {"train_loss": -6.294303894042969, "global_step": 107368, "epoch": 2556} {"train_loss": -6.496831893920898, "global_step": 107369, "epoch": 2556} {"train_loss": -6.373175621032715, "global_step": 107370, "epoch": 2556} {"train_loss": -6.323276996612549, "global_step": 107371, "epoch": 2556} {"train_loss": -6.451140403747559, "global_step": 107372, "epoch": 2556} {"train_loss": -6.4696784019470215, "global_step": 107373, "epoch": 2556} {"train_loss": -6.323919296264648, "global_step": 107374, "epoch": 2556} {"train_loss": -6.4186177253723145, "global_step": 107375, "epoch": 2556} {"train_loss": -6.2917327880859375, "global_step": 107376, "epoch": 2556} {"train_loss": -6.527682304382324, "global_step": 107377, "epoch": 2556} {"train_loss": -6.364953994750977, "global_step": 107378, "epoch": 2556} {"train_loss": -6.414945602416992, "global_step": 107379, "epoch": 2556} {"train_loss": -6.437158584594727, "global_step": 107380, "epoch": 2556} {"train_loss": -6.464334964752197, "global_step": 107381, "epoch": 2556} {"train_loss": -6.3124542236328125, "global_step": 107382, "epoch": 2556} {"train_loss": -6.352566719055176, "global_step": 107383, "epoch": 2556} {"train_loss": -6.292015075683594, "global_step": 107384, "epoch": 2556} {"train_loss": -6.317671775817871, "global_step": 107385, "epoch": 2556} {"train_loss": -6.41448974609375, "global_step": 107386, "epoch": 2556} {"train_loss": -6.355839729309082, "global_step": 107387, "epoch": 2556} {"train_loss": -6.486220359802246, "global_step": 107388, "epoch": 2556} {"train_loss": -6.410614967346191, "global_step": 107389, "epoch": 2556} {"train_loss": -6.408010959625244, "global_step": 107390, "epoch": 2556} {"train_loss": -6.425642013549805, "global_step": 107391, "epoch": 2556} {"train_loss": -6.452581405639648, "global_step": 107392, "epoch": 2556} {"train_loss": -6.4165818350655695, "global_step": 107393, "epoch": 2556, "val_loss": 64682.05078125} {"train_loss": -6.547238826751709, "global_step": 107394, "epoch": 2557} {"train_loss": -6.572164535522461, "global_step": 107395, "epoch": 2557} {"train_loss": -6.538010597229004, "global_step": 107396, "epoch": 2557} {"train_loss": -6.467979907989502, "global_step": 107397, "epoch": 2557} {"train_loss": -6.609840393066406, "global_step": 107398, "epoch": 2557} {"train_loss": -6.448478698730469, "global_step": 107399, "epoch": 2557} {"train_loss": -6.4983110427856445, "global_step": 107400, "epoch": 2557} {"train_loss": -6.520163536071777, "global_step": 107401, "epoch": 2557} {"train_loss": -6.487874984741211, "global_step": 107402, "epoch": 2557} {"train_loss": -6.460914611816406, "global_step": 107403, "epoch": 2557} {"train_loss": -6.4233856201171875, "global_step": 107404, "epoch": 2557} {"train_loss": -6.391808032989502, "global_step": 107405, "epoch": 2557} {"train_loss": -6.476567268371582, "global_step": 107406, "epoch": 2557} {"train_loss": -6.402132511138916, "global_step": 107407, "epoch": 2557} {"train_loss": -6.443891525268555, "global_step": 107408, "epoch": 2557} {"train_loss": -6.500208377838135, "global_step": 107409, "epoch": 2557} {"train_loss": -6.441723823547363, "global_step": 107410, "epoch": 2557} {"train_loss": -6.518808364868164, "global_step": 107411, "epoch": 2557} {"train_loss": -6.439840316772461, "global_step": 107412, "epoch": 2557} {"train_loss": -6.490413188934326, "global_step": 107413, "epoch": 2557} {"train_loss": -6.439704895019531, "global_step": 107414, "epoch": 2557} {"train_loss": -6.464176654815674, "global_step": 107415, "epoch": 2557} {"train_loss": -6.490917205810547, "global_step": 107416, "epoch": 2557} {"train_loss": -6.405643463134766, "global_step": 107417, "epoch": 2557} {"train_loss": -6.453683853149414, "global_step": 107418, "epoch": 2557} {"train_loss": -6.580346584320068, "global_step": 107419, "epoch": 2557} {"train_loss": -6.481771469116211, "global_step": 107420, "epoch": 2557} {"train_loss": -6.557559967041016, "global_step": 107421, "epoch": 2557} {"train_loss": -6.532896041870117, "global_step": 107422, "epoch": 2557} {"train_loss": -6.494617462158203, "global_step": 107423, "epoch": 2557} {"train_loss": -6.435859680175781, "global_step": 107424, "epoch": 2557} {"train_loss": -6.5634565353393555, "global_step": 107425, "epoch": 2557} {"train_loss": -6.478565216064453, "global_step": 107426, "epoch": 2557} {"train_loss": -6.565722465515137, "global_step": 107427, "epoch": 2557} {"train_loss": -6.32259464263916, "global_step": 107428, "epoch": 2557} {"train_loss": -6.521810054779053, "global_step": 107429, "epoch": 2557} {"train_loss": -6.383939266204834, "global_step": 107430, "epoch": 2557} {"train_loss": -6.263095855712891, "global_step": 107431, "epoch": 2557} {"train_loss": -6.364562034606934, "global_step": 107432, "epoch": 2557} {"train_loss": -6.392746925354004, "global_step": 107433, "epoch": 2557} {"train_loss": -6.375073432922363, "global_step": 107434, "epoch": 2557} {"train_loss": -6.471025500978742, "global_step": 107435, "epoch": 2557, "val_loss": 64723.4140625} {"train_loss": -6.50179386138916, "global_step": 107436, "epoch": 2558} {"train_loss": -6.421095848083496, "global_step": 107437, "epoch": 2558} {"train_loss": -6.458282470703125, "global_step": 107438, "epoch": 2558} {"train_loss": -6.444311141967773, "global_step": 107439, "epoch": 2558} {"train_loss": -6.389894485473633, "global_step": 107440, "epoch": 2558} {"train_loss": -6.416624069213867, "global_step": 107441, "epoch": 2558} {"train_loss": -6.414708614349365, "global_step": 107442, "epoch": 2558} {"train_loss": -6.409415245056152, "global_step": 107443, "epoch": 2558} {"train_loss": -6.345768928527832, "global_step": 107444, "epoch": 2558} {"train_loss": -6.400841236114502, "global_step": 107445, "epoch": 2558} {"train_loss": -6.481947898864746, "global_step": 107446, "epoch": 2558} {"train_loss": -6.343291759490967, "global_step": 107447, "epoch": 2558} {"train_loss": -6.380006313323975, "global_step": 107448, "epoch": 2558} {"train_loss": -6.49318790435791, "global_step": 107449, "epoch": 2558} {"train_loss": -6.377213478088379, "global_step": 107450, "epoch": 2558} {"train_loss": -6.51606559753418, "global_step": 107451, "epoch": 2558} {"train_loss": -6.478352069854736, "global_step": 107452, "epoch": 2558} {"train_loss": -6.4370880126953125, "global_step": 107453, "epoch": 2558} {"train_loss": -6.451842784881592, "global_step": 107454, "epoch": 2558} {"train_loss": -6.423382759094238, "global_step": 107455, "epoch": 2558} {"train_loss": -6.297968864440918, "global_step": 107456, "epoch": 2558} {"train_loss": -6.394426345825195, "global_step": 107457, "epoch": 2558} {"train_loss": -6.378966808319092, "global_step": 107458, "epoch": 2558} {"train_loss": -6.328327178955078, "global_step": 107459, "epoch": 2558} {"train_loss": -6.424102306365967, "global_step": 107460, "epoch": 2558} {"train_loss": -6.44223690032959, "global_step": 107461, "epoch": 2558} {"train_loss": -6.434969902038574, "global_step": 107462, "epoch": 2558} {"train_loss": -6.434793472290039, "global_step": 107463, "epoch": 2558} {"train_loss": -6.330700874328613, "global_step": 107464, "epoch": 2558} {"train_loss": -6.5090131759643555, "global_step": 107465, "epoch": 2558} {"train_loss": -6.643466949462891, "global_step": 107466, "epoch": 2558} {"train_loss": -6.522819519042969, "global_step": 107467, "epoch": 2558} {"train_loss": -6.414342880249023, "global_step": 107468, "epoch": 2558} {"train_loss": -6.431801795959473, "global_step": 107469, "epoch": 2558} {"train_loss": -6.554068565368652, "global_step": 107470, "epoch": 2558} {"train_loss": -6.4611968994140625, "global_step": 107471, "epoch": 2558} {"train_loss": -6.54304313659668, "global_step": 107472, "epoch": 2558} {"train_loss": -6.5426249504089355, "global_step": 107473, "epoch": 2558} {"train_loss": -6.520986557006836, "global_step": 107474, "epoch": 2558} {"train_loss": -6.445016860961914, "global_step": 107475, "epoch": 2558} {"train_loss": -6.525002479553223, "global_step": 107476, "epoch": 2558} {"train_loss": -6.444076821917579, "global_step": 107477, "epoch": 2558, "val_loss": 64619.7265625} {"train_loss": -6.457947731018066, "global_step": 107478, "epoch": 2559} {"train_loss": -6.53421688079834, "global_step": 107479, "epoch": 2559} {"train_loss": -6.543642044067383, "global_step": 107480, "epoch": 2559} {"train_loss": -6.438377380371094, "global_step": 107481, "epoch": 2559} {"train_loss": -6.325366973876953, "global_step": 107482, "epoch": 2559} {"train_loss": -6.48427152633667, "global_step": 107483, "epoch": 2559} {"train_loss": -6.505025863647461, "global_step": 107484, "epoch": 2559} {"train_loss": -6.555011749267578, "global_step": 107485, "epoch": 2559} {"train_loss": -6.4765753746032715, "global_step": 107486, "epoch": 2559} {"train_loss": -6.53214168548584, "global_step": 107487, "epoch": 2559} {"train_loss": -6.482639312744141, "global_step": 107488, "epoch": 2559} {"train_loss": -6.507546424865723, "global_step": 107489, "epoch": 2559} {"train_loss": -6.5207366943359375, "global_step": 107490, "epoch": 2559} {"train_loss": -6.460589408874512, "global_step": 107491, "epoch": 2559} {"train_loss": -6.41244649887085, "global_step": 107492, "epoch": 2559} {"train_loss": -6.480754852294922, "global_step": 107493, "epoch": 2559} {"train_loss": -6.494017124176025, "global_step": 107494, "epoch": 2559} {"train_loss": -6.586448669433594, "global_step": 107495, "epoch": 2559} {"train_loss": -6.567541122436523, "global_step": 107496, "epoch": 2559} {"train_loss": -6.386375427246094, "global_step": 107497, "epoch": 2559} {"train_loss": -6.396018028259277, "global_step": 107498, "epoch": 2559} {"train_loss": -6.593730926513672, "global_step": 107499, "epoch": 2559} {"train_loss": -6.486812591552734, "global_step": 107500, "epoch": 2559} {"train_loss": -6.460050582885742, "global_step": 107501, "epoch": 2559} {"train_loss": -6.449417591094971, "global_step": 107502, "epoch": 2559} {"train_loss": -6.362697124481201, "global_step": 107503, "epoch": 2559} {"train_loss": -6.389833450317383, "global_step": 107504, "epoch": 2559} {"train_loss": -6.406206130981445, "global_step": 107505, "epoch": 2559} {"train_loss": -6.495121955871582, "global_step": 107506, "epoch": 2559} {"train_loss": -6.57033634185791, "global_step": 107507, "epoch": 2559} {"train_loss": -6.433887958526611, "global_step": 107508, "epoch": 2559} {"train_loss": -6.490443706512451, "global_step": 107509, "epoch": 2559} {"train_loss": -6.499790191650391, "global_step": 107510, "epoch": 2559} {"train_loss": -6.43553352355957, "global_step": 107511, "epoch": 2559} {"train_loss": -6.467380523681641, "global_step": 107512, "epoch": 2559} {"train_loss": -6.385183811187744, "global_step": 107513, "epoch": 2559} {"train_loss": -6.483813285827637, "global_step": 107514, "epoch": 2559} {"train_loss": -6.311977386474609, "global_step": 107515, "epoch": 2559} {"train_loss": -6.3524980545043945, "global_step": 107516, "epoch": 2559} {"train_loss": -6.462611198425293, "global_step": 107517, "epoch": 2559} {"train_loss": -6.520359039306641, "global_step": 107518, "epoch": 2559} {"train_loss": -6.464834440322149, "global_step": 107519, "epoch": 2559, "val_loss": 64800.6328125} {"train_loss": -6.4090576171875, "global_step": 107520, "epoch": 2560} {"train_loss": -6.539532661437988, "global_step": 107521, "epoch": 2560} {"train_loss": -6.494041442871094, "global_step": 107522, "epoch": 2560} {"train_loss": -6.416995525360107, "global_step": 107523, "epoch": 2560} {"train_loss": -6.385441303253174, "global_step": 107524, "epoch": 2560} {"train_loss": -6.56183385848999, "global_step": 107525, "epoch": 2560} {"train_loss": -6.427055358886719, "global_step": 107526, "epoch": 2560} {"train_loss": -6.475522994995117, "global_step": 107527, "epoch": 2560} {"train_loss": -6.392142295837402, "global_step": 107528, "epoch": 2560} {"train_loss": -6.3769683837890625, "global_step": 107529, "epoch": 2560} {"train_loss": -6.46384859085083, "global_step": 107530, "epoch": 2560} {"train_loss": -6.469358921051025, "global_step": 107531, "epoch": 2560} {"train_loss": -6.476036548614502, "global_step": 107532, "epoch": 2560} {"train_loss": -6.363725662231445, "global_step": 107533, "epoch": 2560} {"train_loss": -6.472640514373779, "global_step": 107534, "epoch": 2560} {"train_loss": -6.4452338218688965, "global_step": 107535, "epoch": 2560} {"train_loss": -6.4391398429870605, "global_step": 107536, "epoch": 2560} {"train_loss": -6.497169017791748, "global_step": 107537, "epoch": 2560} {"train_loss": -6.328302383422852, "global_step": 107538, "epoch": 2560} {"train_loss": -6.441075325012207, "global_step": 107539, "epoch": 2560} {"train_loss": -6.43450927734375, "global_step": 107540, "epoch": 2560} {"train_loss": -6.586938858032227, "global_step": 107541, "epoch": 2560} {"train_loss": -6.4647603034973145, "global_step": 107542, "epoch": 2560} {"train_loss": -6.445744514465332, "global_step": 107543, "epoch": 2560} {"train_loss": -6.4065728187561035, "global_step": 107544, "epoch": 2560} {"train_loss": -6.574707984924316, "global_step": 107545, "epoch": 2560} {"train_loss": -6.455795764923096, "global_step": 107546, "epoch": 2560} {"train_loss": -6.4848480224609375, "global_step": 107547, "epoch": 2560} {"train_loss": -6.4395551681518555, "global_step": 107548, "epoch": 2560} {"train_loss": -6.412132263183594, "global_step": 107549, "epoch": 2560} {"train_loss": -6.446812629699707, "global_step": 107550, "epoch": 2560} {"train_loss": -6.538122177124023, "global_step": 107551, "epoch": 2560} {"train_loss": -6.372585296630859, "global_step": 107552, "epoch": 2560} {"train_loss": -6.454305648803711, "global_step": 107553, "epoch": 2560} {"train_loss": -6.50563907623291, "global_step": 107554, "epoch": 2560} {"train_loss": -6.485500812530518, "global_step": 107555, "epoch": 2560} {"train_loss": -6.419923305511475, "global_step": 107556, "epoch": 2560} {"train_loss": -6.433154106140137, "global_step": 107557, "epoch": 2560} {"train_loss": -6.492154121398926, "global_step": 107558, "epoch": 2560} {"train_loss": -6.528085708618164, "global_step": 107559, "epoch": 2560} {"train_loss": -6.479609489440918, "global_step": 107560, "epoch": 2560} {"train_loss": -6.457884459268479, "global_step": 107561, "epoch": 2560, "val_loss": 64637.1953125} {"train_loss": -6.492091178894043, "global_step": 107562, "epoch": 2561} {"train_loss": -6.47782039642334, "global_step": 107563, "epoch": 2561} {"train_loss": -6.4932861328125, "global_step": 107564, "epoch": 2561} {"train_loss": -6.4193525314331055, "global_step": 107565, "epoch": 2561} {"train_loss": -6.445230007171631, "global_step": 107566, "epoch": 2561} {"train_loss": -6.458654403686523, "global_step": 107567, "epoch": 2561} {"train_loss": -6.514101982116699, "global_step": 107568, "epoch": 2561} {"train_loss": -6.4927568435668945, "global_step": 107569, "epoch": 2561} {"train_loss": -6.450460433959961, "global_step": 107570, "epoch": 2561} {"train_loss": -6.532201766967773, "global_step": 107571, "epoch": 2561} {"train_loss": -6.410296440124512, "global_step": 107572, "epoch": 2561} {"train_loss": -6.457741737365723, "global_step": 107573, "epoch": 2561} {"train_loss": -6.461186408996582, "global_step": 107574, "epoch": 2561} {"train_loss": -6.446681976318359, "global_step": 107575, "epoch": 2561} {"train_loss": -6.48463249206543, "global_step": 107576, "epoch": 2561} {"train_loss": -6.415800094604492, "global_step": 107577, "epoch": 2561} {"train_loss": -6.505654811859131, "global_step": 107578, "epoch": 2561} {"train_loss": -6.581568717956543, "global_step": 107579, "epoch": 2561} {"train_loss": -6.473034858703613, "global_step": 107580, "epoch": 2561} {"train_loss": -6.25777530670166, "global_step": 107581, "epoch": 2561} {"train_loss": -6.410863399505615, "global_step": 107582, "epoch": 2561} {"train_loss": -6.584524631500244, "global_step": 107583, "epoch": 2561} {"train_loss": -6.428706169128418, "global_step": 107584, "epoch": 2561} {"train_loss": -6.572132110595703, "global_step": 107585, "epoch": 2561} {"train_loss": -6.4633469581604, "global_step": 107586, "epoch": 2561} {"train_loss": -6.496054172515869, "global_step": 107587, "epoch": 2561} {"train_loss": -6.521474838256836, "global_step": 107588, "epoch": 2561} {"train_loss": -6.3817458152771, "global_step": 107589, "epoch": 2561} {"train_loss": -6.385757923126221, "global_step": 107590, "epoch": 2561} {"train_loss": -6.4521403312683105, "global_step": 107591, "epoch": 2561} {"train_loss": -6.50449275970459, "global_step": 107592, "epoch": 2561} {"train_loss": -6.374317169189453, "global_step": 107593, "epoch": 2561} {"train_loss": -6.455436706542969, "global_step": 107594, "epoch": 2561} {"train_loss": -6.544317722320557, "global_step": 107595, "epoch": 2561} {"train_loss": -6.446353912353516, "global_step": 107596, "epoch": 2561} {"train_loss": -6.456843852996826, "global_step": 107597, "epoch": 2561} {"train_loss": -6.462136745452881, "global_step": 107598, "epoch": 2561} {"train_loss": -6.45699405670166, "global_step": 107599, "epoch": 2561} {"train_loss": -6.48441219329834, "global_step": 107600, "epoch": 2561} {"train_loss": -6.40679407119751, "global_step": 107601, "epoch": 2561} {"train_loss": -6.457396507263184, "global_step": 107602, "epoch": 2561} {"train_loss": -6.465324674333845, "global_step": 107603, "epoch": 2561, "val_loss": 64689.60546875} {"train_loss": -6.526325225830078, "global_step": 107604, "epoch": 2562} {"train_loss": -6.441310882568359, "global_step": 107605, "epoch": 2562} {"train_loss": -6.352535247802734, "global_step": 107606, "epoch": 2562} {"train_loss": -6.495075225830078, "global_step": 107607, "epoch": 2562} {"train_loss": -6.416847229003906, "global_step": 107608, "epoch": 2562} {"train_loss": -6.41897439956665, "global_step": 107609, "epoch": 2562} {"train_loss": -6.432493209838867, "global_step": 107610, "epoch": 2562} {"train_loss": -6.415014266967773, "global_step": 107611, "epoch": 2562} {"train_loss": -6.574018478393555, "global_step": 107612, "epoch": 2562} {"train_loss": -6.389997959136963, "global_step": 107613, "epoch": 2562} {"train_loss": -6.411060333251953, "global_step": 107614, "epoch": 2562} {"train_loss": -6.414242267608643, "global_step": 107615, "epoch": 2562} {"train_loss": -6.401071548461914, "global_step": 107616, "epoch": 2562} {"train_loss": -6.323797702789307, "global_step": 107617, "epoch": 2562} {"train_loss": -6.428563117980957, "global_step": 107618, "epoch": 2562} {"train_loss": -6.463216781616211, "global_step": 107619, "epoch": 2562} {"train_loss": -6.374098777770996, "global_step": 107620, "epoch": 2562} {"train_loss": -6.396076202392578, "global_step": 107621, "epoch": 2562} {"train_loss": -6.448215484619141, "global_step": 107622, "epoch": 2562} {"train_loss": -6.453304290771484, "global_step": 107623, "epoch": 2562} {"train_loss": -6.538004398345947, "global_step": 107624, "epoch": 2562} {"train_loss": -6.4753336906433105, "global_step": 107625, "epoch": 2562} {"train_loss": -6.444247245788574, "global_step": 107626, "epoch": 2562} {"train_loss": -6.514834880828857, "global_step": 107627, "epoch": 2562} {"train_loss": -6.451277732849121, "global_step": 107628, "epoch": 2562} {"train_loss": -6.4901838302612305, "global_step": 107629, "epoch": 2562} {"train_loss": -6.412235736846924, "global_step": 107630, "epoch": 2562} {"train_loss": -6.499968528747559, "global_step": 107631, "epoch": 2562} {"train_loss": -6.444397926330566, "global_step": 107632, "epoch": 2562} {"train_loss": -6.550280570983887, "global_step": 107633, "epoch": 2562} {"train_loss": -6.527059078216553, "global_step": 107634, "epoch": 2562} {"train_loss": -6.454475402832031, "global_step": 107635, "epoch": 2562} {"train_loss": -6.353238582611084, "global_step": 107636, "epoch": 2562} {"train_loss": -6.485723495483398, "global_step": 107637, "epoch": 2562} {"train_loss": -6.567808151245117, "global_step": 107638, "epoch": 2562} {"train_loss": -6.439812660217285, "global_step": 107639, "epoch": 2562} {"train_loss": -6.457940578460693, "global_step": 107640, "epoch": 2562} {"train_loss": -6.451740741729736, "global_step": 107641, "epoch": 2562} {"train_loss": -6.513352394104004, "global_step": 107642, "epoch": 2562} {"train_loss": -6.322783470153809, "global_step": 107643, "epoch": 2562} {"train_loss": -6.379361152648926, "global_step": 107644, "epoch": 2562} {"train_loss": -6.4464891865139915, "global_step": 107645, "epoch": 2562, "val_loss": 64965.37109375} {"train_loss": -6.402872085571289, "global_step": 107646, "epoch": 2563} {"train_loss": -6.393222332000732, "global_step": 107647, "epoch": 2563} {"train_loss": -6.473964691162109, "global_step": 107648, "epoch": 2563} {"train_loss": -6.506990909576416, "global_step": 107649, "epoch": 2563} {"train_loss": -6.433926105499268, "global_step": 107650, "epoch": 2563} {"train_loss": -6.400199890136719, "global_step": 107651, "epoch": 2563} {"train_loss": -6.4509782791137695, "global_step": 107652, "epoch": 2563} {"train_loss": -6.275900363922119, "global_step": 107653, "epoch": 2563} {"train_loss": -6.420969009399414, "global_step": 107654, "epoch": 2563} {"train_loss": -6.514545440673828, "global_step": 107655, "epoch": 2563} {"train_loss": -6.384339809417725, "global_step": 107656, "epoch": 2563} {"train_loss": -6.509950160980225, "global_step": 107657, "epoch": 2563} {"train_loss": -6.400570869445801, "global_step": 107658, "epoch": 2563} {"train_loss": -6.341650009155273, "global_step": 107659, "epoch": 2563} {"train_loss": -6.418628692626953, "global_step": 107660, "epoch": 2563} {"train_loss": -6.511081218719482, "global_step": 107661, "epoch": 2563} {"train_loss": -6.356614112854004, "global_step": 107662, "epoch": 2563} {"train_loss": -6.48974609375, "global_step": 107663, "epoch": 2563} {"train_loss": -6.459745407104492, "global_step": 107664, "epoch": 2563} {"train_loss": -6.327846527099609, "global_step": 107665, "epoch": 2563} {"train_loss": -6.335540771484375, "global_step": 107666, "epoch": 2563} {"train_loss": -6.456170558929443, "global_step": 107667, "epoch": 2563} {"train_loss": -6.362377166748047, "global_step": 107668, "epoch": 2563} {"train_loss": -6.346792221069336, "global_step": 107669, "epoch": 2563} {"train_loss": -6.521913528442383, "global_step": 107670, "epoch": 2563} {"train_loss": -6.438372611999512, "global_step": 107671, "epoch": 2563} {"train_loss": -6.463090419769287, "global_step": 107672, "epoch": 2563} {"train_loss": -6.36074161529541, "global_step": 107673, "epoch": 2563} {"train_loss": -6.427920341491699, "global_step": 107674, "epoch": 2563} {"train_loss": -6.444282531738281, "global_step": 107675, "epoch": 2563} {"train_loss": -6.357761383056641, "global_step": 107676, "epoch": 2563} {"train_loss": -6.336877822875977, "global_step": 107677, "epoch": 2563} {"train_loss": -6.2344279289245605, "global_step": 107678, "epoch": 2563} {"train_loss": -6.3808207511901855, "global_step": 107679, "epoch": 2563} {"train_loss": -6.2818403244018555, "global_step": 107680, "epoch": 2563} {"train_loss": -6.431813716888428, "global_step": 107681, "epoch": 2563} {"train_loss": -6.483297348022461, "global_step": 107682, "epoch": 2563} {"train_loss": -6.295184135437012, "global_step": 107683, "epoch": 2563} {"train_loss": -6.445199966430664, "global_step": 107684, "epoch": 2563} {"train_loss": -6.306435585021973, "global_step": 107685, "epoch": 2563} {"train_loss": -6.33519983291626, "global_step": 107686, "epoch": 2563} {"train_loss": -6.403706720897129, "global_step": 107687, "epoch": 2563, "val_loss": 65002.234375} {"train_loss": -6.466797351837158, "global_step": 107688, "epoch": 2564} {"train_loss": -6.365550518035889, "global_step": 107689, "epoch": 2564} {"train_loss": -6.488160610198975, "global_step": 107690, "epoch": 2564} {"train_loss": -6.371194362640381, "global_step": 107691, "epoch": 2564} {"train_loss": -6.335647106170654, "global_step": 107692, "epoch": 2564} {"train_loss": -6.466866493225098, "global_step": 107693, "epoch": 2564} {"train_loss": -6.3844218254089355, "global_step": 107694, "epoch": 2564} {"train_loss": -6.528439044952393, "global_step": 107695, "epoch": 2564} {"train_loss": -6.532437324523926, "global_step": 107696, "epoch": 2564} {"train_loss": -6.347166538238525, "global_step": 107697, "epoch": 2564} {"train_loss": -6.595032215118408, "global_step": 107698, "epoch": 2564} {"train_loss": -6.327488899230957, "global_step": 107699, "epoch": 2564} {"train_loss": -6.458287239074707, "global_step": 107700, "epoch": 2564} {"train_loss": -6.497605800628662, "global_step": 107701, "epoch": 2564} {"train_loss": -6.463875770568848, "global_step": 107702, "epoch": 2564} {"train_loss": -6.541184425354004, "global_step": 107703, "epoch": 2564} {"train_loss": -6.436004638671875, "global_step": 107704, "epoch": 2564} {"train_loss": -6.4300761222839355, "global_step": 107705, "epoch": 2564} {"train_loss": -6.383906364440918, "global_step": 107706, "epoch": 2564} {"train_loss": -6.213762283325195, "global_step": 107707, "epoch": 2564} {"train_loss": -6.448949813842773, "global_step": 107708, "epoch": 2564} {"train_loss": -6.439091205596924, "global_step": 107709, "epoch": 2564} {"train_loss": -6.408849716186523, "global_step": 107710, "epoch": 2564} {"train_loss": -6.4652509689331055, "global_step": 107711, "epoch": 2564} {"train_loss": -6.504469394683838, "global_step": 107712, "epoch": 2564} {"train_loss": -6.5109477043151855, "global_step": 107713, "epoch": 2564} {"train_loss": -6.4684882164001465, "global_step": 107714, "epoch": 2564} {"train_loss": -6.478861331939697, "global_step": 107715, "epoch": 2564} {"train_loss": -6.38232421875, "global_step": 107716, "epoch": 2564} {"train_loss": -6.460997581481934, "global_step": 107717, "epoch": 2564} {"train_loss": -6.424868583679199, "global_step": 107718, "epoch": 2564} {"train_loss": -6.372048377990723, "global_step": 107719, "epoch": 2564} {"train_loss": -6.390995502471924, "global_step": 107720, "epoch": 2564} {"train_loss": -6.48196268081665, "global_step": 107721, "epoch": 2564} {"train_loss": -6.4302473068237305, "global_step": 107722, "epoch": 2564} {"train_loss": -6.453464508056641, "global_step": 107723, "epoch": 2564} {"train_loss": -6.419624328613281, "global_step": 107724, "epoch": 2564} {"train_loss": -6.427825927734375, "global_step": 107725, "epoch": 2564} {"train_loss": -6.499629020690918, "global_step": 107726, "epoch": 2564} {"train_loss": -6.534155368804932, "global_step": 107727, "epoch": 2564} {"train_loss": -6.478107929229736, "global_step": 107728, "epoch": 2564} {"train_loss": -6.442592371077764, "global_step": 107729, "epoch": 2564, "val_loss": 64623.0390625} {"train_loss": -6.552277565002441, "global_step": 107730, "epoch": 2565} {"train_loss": -6.362085342407227, "global_step": 107731, "epoch": 2565} {"train_loss": -6.582273006439209, "global_step": 107732, "epoch": 2565} {"train_loss": -6.489445209503174, "global_step": 107733, "epoch": 2565} {"train_loss": -6.500521183013916, "global_step": 107734, "epoch": 2565} {"train_loss": -6.3315629959106445, "global_step": 107735, "epoch": 2565} {"train_loss": -6.497328758239746, "global_step": 107736, "epoch": 2565} {"train_loss": -6.320225715637207, "global_step": 107737, "epoch": 2565} {"train_loss": -6.427603721618652, "global_step": 107738, "epoch": 2565} {"train_loss": -6.3410797119140625, "global_step": 107739, "epoch": 2565} {"train_loss": -6.518510818481445, "global_step": 107740, "epoch": 2565} {"train_loss": -6.54604434967041, "global_step": 107741, "epoch": 2565} {"train_loss": -6.438312530517578, "global_step": 107742, "epoch": 2565} {"train_loss": -6.550908088684082, "global_step": 107743, "epoch": 2565} {"train_loss": -6.449145317077637, "global_step": 107744, "epoch": 2565} {"train_loss": -6.525538444519043, "global_step": 107745, "epoch": 2565} {"train_loss": -6.468076229095459, "global_step": 107746, "epoch": 2565} {"train_loss": -6.457469463348389, "global_step": 107747, "epoch": 2565} {"train_loss": -6.486867904663086, "global_step": 107748, "epoch": 2565} {"train_loss": -6.429743766784668, "global_step": 107749, "epoch": 2565} {"train_loss": -6.428606986999512, "global_step": 107750, "epoch": 2565} {"train_loss": -6.436616897583008, "global_step": 107751, "epoch": 2565} {"train_loss": -6.499762535095215, "global_step": 107752, "epoch": 2565} {"train_loss": -6.4853835105896, "global_step": 107753, "epoch": 2565} {"train_loss": -6.505222320556641, "global_step": 107754, "epoch": 2565} {"train_loss": -6.412548065185547, "global_step": 107755, "epoch": 2565} {"train_loss": -6.352046966552734, "global_step": 107756, "epoch": 2565} {"train_loss": -6.489670276641846, "global_step": 107757, "epoch": 2565} {"train_loss": -6.408435344696045, "global_step": 107758, "epoch": 2565} {"train_loss": -6.361674785614014, "global_step": 107759, "epoch": 2565} {"train_loss": -6.386031150817871, "global_step": 107760, "epoch": 2565} {"train_loss": -6.498920440673828, "global_step": 107761, "epoch": 2565} {"train_loss": -6.389324188232422, "global_step": 107762, "epoch": 2565} {"train_loss": -6.413793087005615, "global_step": 107763, "epoch": 2565} {"train_loss": -6.497221946716309, "global_step": 107764, "epoch": 2565} {"train_loss": -6.503056526184082, "global_step": 107765, "epoch": 2565} {"train_loss": -6.444573402404785, "global_step": 107766, "epoch": 2565} {"train_loss": -6.461196422576904, "global_step": 107767, "epoch": 2565} {"train_loss": -6.387253761291504, "global_step": 107768, "epoch": 2565} {"train_loss": -6.491977691650391, "global_step": 107769, "epoch": 2565} {"train_loss": -6.45434045791626, "global_step": 107770, "epoch": 2565} {"train_loss": -6.455184732164655, "global_step": 107771, "epoch": 2565, "val_loss": 64583.53125} {"train_loss": -6.4665207862854, "global_step": 107772, "epoch": 2566} {"train_loss": -6.437195777893066, "global_step": 107773, "epoch": 2566} {"train_loss": -6.422143936157227, "global_step": 107774, "epoch": 2566} {"train_loss": -6.475818634033203, "global_step": 107775, "epoch": 2566} {"train_loss": -6.497384071350098, "global_step": 107776, "epoch": 2566} {"train_loss": -6.442483901977539, "global_step": 107777, "epoch": 2566} {"train_loss": -6.474081993103027, "global_step": 107778, "epoch": 2566} {"train_loss": -6.532397270202637, "global_step": 107779, "epoch": 2566} {"train_loss": -6.278449058532715, "global_step": 107780, "epoch": 2566} {"train_loss": -6.417564392089844, "global_step": 107781, "epoch": 2566} {"train_loss": -6.499617576599121, "global_step": 107782, "epoch": 2566} {"train_loss": -6.518043518066406, "global_step": 107783, "epoch": 2566} {"train_loss": -6.342036247253418, "global_step": 107784, "epoch": 2566} {"train_loss": -6.365004539489746, "global_step": 107785, "epoch": 2566} {"train_loss": -6.462349891662598, "global_step": 107786, "epoch": 2566} {"train_loss": -6.447015762329102, "global_step": 107787, "epoch": 2566} {"train_loss": -6.353806018829346, "global_step": 107788, "epoch": 2566} {"train_loss": -6.412360191345215, "global_step": 107789, "epoch": 2566} {"train_loss": -6.450629234313965, "global_step": 107790, "epoch": 2566} {"train_loss": -6.412910461425781, "global_step": 107791, "epoch": 2566} {"train_loss": -6.344429016113281, "global_step": 107792, "epoch": 2566} {"train_loss": -6.3525190353393555, "global_step": 107793, "epoch": 2566} {"train_loss": -6.387057304382324, "global_step": 107794, "epoch": 2566} {"train_loss": -6.444467067718506, "global_step": 107795, "epoch": 2566} {"train_loss": -6.369163513183594, "global_step": 107796, "epoch": 2566} {"train_loss": -6.519354820251465, "global_step": 107797, "epoch": 2566} {"train_loss": -6.346336364746094, "global_step": 107798, "epoch": 2566} {"train_loss": -6.42607307434082, "global_step": 107799, "epoch": 2566} {"train_loss": -6.407149791717529, "global_step": 107800, "epoch": 2566} {"train_loss": -6.53529167175293, "global_step": 107801, "epoch": 2566} {"train_loss": -6.444157123565674, "global_step": 107802, "epoch": 2566} {"train_loss": -6.462512493133545, "global_step": 107803, "epoch": 2566} {"train_loss": -6.380666255950928, "global_step": 107804, "epoch": 2566} {"train_loss": -6.547586441040039, "global_step": 107805, "epoch": 2566} {"train_loss": -6.472552299499512, "global_step": 107806, "epoch": 2566} {"train_loss": -6.456264972686768, "global_step": 107807, "epoch": 2566} {"train_loss": -6.343411922454834, "global_step": 107808, "epoch": 2566} {"train_loss": -6.540365219116211, "global_step": 107809, "epoch": 2566} {"train_loss": -6.368548393249512, "global_step": 107810, "epoch": 2566} {"train_loss": -6.439563751220703, "global_step": 107811, "epoch": 2566} {"train_loss": -6.469992637634277, "global_step": 107812, "epoch": 2566} {"train_loss": -6.431858119510469, "global_step": 107813, "epoch": 2566, "val_loss": 64700.58203125} {"train_loss": -6.326692581176758, "global_step": 107814, "epoch": 2567} {"train_loss": -6.353941917419434, "global_step": 107815, "epoch": 2567} {"train_loss": -6.377445220947266, "global_step": 107816, "epoch": 2567} {"train_loss": -6.452498912811279, "global_step": 107817, "epoch": 2567} {"train_loss": -6.4852705001831055, "global_step": 107818, "epoch": 2567} {"train_loss": -6.47752571105957, "global_step": 107819, "epoch": 2567} {"train_loss": -6.404253959655762, "global_step": 107820, "epoch": 2567} {"train_loss": -6.495281219482422, "global_step": 107821, "epoch": 2567} {"train_loss": -6.328485012054443, "global_step": 107822, "epoch": 2567} {"train_loss": -6.473264694213867, "global_step": 107823, "epoch": 2567} {"train_loss": -6.357307434082031, "global_step": 107824, "epoch": 2567} {"train_loss": -6.4771623611450195, "global_step": 107825, "epoch": 2567} {"train_loss": -6.455999851226807, "global_step": 107826, "epoch": 2567} {"train_loss": -6.392148494720459, "global_step": 107827, "epoch": 2567} {"train_loss": -6.483160018920898, "global_step": 107828, "epoch": 2567} {"train_loss": -6.486720085144043, "global_step": 107829, "epoch": 2567} {"train_loss": -6.489794731140137, "global_step": 107830, "epoch": 2567} {"train_loss": -6.436020851135254, "global_step": 107831, "epoch": 2567} {"train_loss": -6.457179546356201, "global_step": 107832, "epoch": 2567} {"train_loss": -6.480397701263428, "global_step": 107833, "epoch": 2567} {"train_loss": -6.419676780700684, "global_step": 107834, "epoch": 2567} {"train_loss": -6.46299934387207, "global_step": 107835, "epoch": 2567} {"train_loss": -6.395138740539551, "global_step": 107836, "epoch": 2567} {"train_loss": -6.350556373596191, "global_step": 107837, "epoch": 2567} {"train_loss": -6.539386749267578, "global_step": 107838, "epoch": 2567} {"train_loss": -6.525619029998779, "global_step": 107839, "epoch": 2567} {"train_loss": -6.405821800231934, "global_step": 107840, "epoch": 2567} {"train_loss": -6.589106559753418, "global_step": 107841, "epoch": 2567} {"train_loss": -6.540752410888672, "global_step": 107842, "epoch": 2567} {"train_loss": -6.432046890258789, "global_step": 107843, "epoch": 2567} {"train_loss": -6.444860935211182, "global_step": 107844, "epoch": 2567} {"train_loss": -6.484630107879639, "global_step": 107845, "epoch": 2567} {"train_loss": -6.451076507568359, "global_step": 107846, "epoch": 2567} {"train_loss": -6.398501873016357, "global_step": 107847, "epoch": 2567} {"train_loss": -6.491072654724121, "global_step": 107848, "epoch": 2567} {"train_loss": -6.487497806549072, "global_step": 107849, "epoch": 2567} {"train_loss": -6.419636249542236, "global_step": 107850, "epoch": 2567} {"train_loss": -6.408975601196289, "global_step": 107851, "epoch": 2567} {"train_loss": -6.590271949768066, "global_step": 107852, "epoch": 2567} {"train_loss": -6.486654281616211, "global_step": 107853, "epoch": 2567} {"train_loss": -6.449715614318848, "global_step": 107854, "epoch": 2567} {"train_loss": -6.450182506016323, "global_step": 107855, "epoch": 2567, "val_loss": 64738.140625} {"train_loss": -6.455063819885254, "global_step": 107856, "epoch": 2568} {"train_loss": -6.535216331481934, "global_step": 107857, "epoch": 2568} {"train_loss": -6.547048091888428, "global_step": 107858, "epoch": 2568} {"train_loss": -6.482850074768066, "global_step": 107859, "epoch": 2568} {"train_loss": -6.544902801513672, "global_step": 107860, "epoch": 2568} {"train_loss": -6.4025983810424805, "global_step": 107861, "epoch": 2568} {"train_loss": -6.4394378662109375, "global_step": 107862, "epoch": 2568} {"train_loss": -6.410275459289551, "global_step": 107863, "epoch": 2568} {"train_loss": -6.501482009887695, "global_step": 107864, "epoch": 2568} {"train_loss": -6.432033538818359, "global_step": 107865, "epoch": 2568} {"train_loss": -6.547316551208496, "global_step": 107866, "epoch": 2568} {"train_loss": -6.299766540527344, "global_step": 107867, "epoch": 2568} {"train_loss": -6.507494926452637, "global_step": 107868, "epoch": 2568} {"train_loss": -6.436895370483398, "global_step": 107869, "epoch": 2568} {"train_loss": -6.381688117980957, "global_step": 107870, "epoch": 2568} {"train_loss": -6.472320556640625, "global_step": 107871, "epoch": 2568} {"train_loss": -6.554811477661133, "global_step": 107872, "epoch": 2568} {"train_loss": -6.598678112030029, "global_step": 107873, "epoch": 2568} {"train_loss": -6.486630439758301, "global_step": 107874, "epoch": 2568} {"train_loss": -6.481842041015625, "global_step": 107875, "epoch": 2568} {"train_loss": -6.490416526794434, "global_step": 107876, "epoch": 2568} {"train_loss": -6.4061126708984375, "global_step": 107877, "epoch": 2568} {"train_loss": -6.4106364250183105, "global_step": 107878, "epoch": 2568} {"train_loss": -6.590211868286133, "global_step": 107879, "epoch": 2568} {"train_loss": -6.44061279296875, "global_step": 107880, "epoch": 2568} {"train_loss": -6.484648704528809, "global_step": 107881, "epoch": 2568} {"train_loss": -6.4869303703308105, "global_step": 107882, "epoch": 2568} {"train_loss": -6.412965774536133, "global_step": 107883, "epoch": 2568} {"train_loss": -6.4328837394714355, "global_step": 107884, "epoch": 2568} {"train_loss": -6.47208833694458, "global_step": 107885, "epoch": 2568} {"train_loss": -6.426913261413574, "global_step": 107886, "epoch": 2568} {"train_loss": -6.5460309982299805, "global_step": 107887, "epoch": 2568} {"train_loss": -6.46665096282959, "global_step": 107888, "epoch": 2568} {"train_loss": -6.410613059997559, "global_step": 107889, "epoch": 2568} {"train_loss": -6.362640380859375, "global_step": 107890, "epoch": 2568} {"train_loss": -6.4114508628845215, "global_step": 107891, "epoch": 2568} {"train_loss": -6.481536388397217, "global_step": 107892, "epoch": 2568} {"train_loss": -6.435230255126953, "global_step": 107893, "epoch": 2568} {"train_loss": -6.346726417541504, "global_step": 107894, "epoch": 2568} {"train_loss": -6.443903923034668, "global_step": 107895, "epoch": 2568} {"train_loss": -6.390167713165283, "global_step": 107896, "epoch": 2568} {"train_loss": -6.459499870027814, "global_step": 107897, "epoch": 2568, "val_loss": 64633.75390625} {"train_loss": -6.564958095550537, "global_step": 107898, "epoch": 2569} {"train_loss": -6.44071102142334, "global_step": 107899, "epoch": 2569} {"train_loss": -6.41888427734375, "global_step": 107900, "epoch": 2569} {"train_loss": -6.531543731689453, "global_step": 107901, "epoch": 2569} {"train_loss": -6.448456287384033, "global_step": 107902, "epoch": 2569} {"train_loss": -6.624502182006836, "global_step": 107903, "epoch": 2569} {"train_loss": -6.5180816650390625, "global_step": 107904, "epoch": 2569} {"train_loss": -6.458425521850586, "global_step": 107905, "epoch": 2569} {"train_loss": -6.481956481933594, "global_step": 107906, "epoch": 2569} {"train_loss": -6.451278209686279, "global_step": 107907, "epoch": 2569} {"train_loss": -6.456958293914795, "global_step": 107908, "epoch": 2569} {"train_loss": -6.496245861053467, "global_step": 107909, "epoch": 2569} {"train_loss": -6.465822219848633, "global_step": 107910, "epoch": 2569} {"train_loss": -6.385781288146973, "global_step": 107911, "epoch": 2569} {"train_loss": -6.549802780151367, "global_step": 107912, "epoch": 2569} {"train_loss": -6.5257158279418945, "global_step": 107913, "epoch": 2569} {"train_loss": -6.420510292053223, "global_step": 107914, "epoch": 2569} {"train_loss": -6.447969913482666, "global_step": 107915, "epoch": 2569} {"train_loss": -6.373693466186523, "global_step": 107916, "epoch": 2569} {"train_loss": -6.463079452514648, "global_step": 107917, "epoch": 2569} {"train_loss": -6.459756851196289, "global_step": 107918, "epoch": 2569} {"train_loss": -6.4689154624938965, "global_step": 107919, "epoch": 2569} {"train_loss": -6.462364196777344, "global_step": 107920, "epoch": 2569} {"train_loss": -6.397789001464844, "global_step": 107921, "epoch": 2569} {"train_loss": -6.443518161773682, "global_step": 107922, "epoch": 2569} {"train_loss": -6.410496711730957, "global_step": 107923, "epoch": 2569} {"train_loss": -6.490780830383301, "global_step": 107924, "epoch": 2569} {"train_loss": -6.521936416625977, "global_step": 107925, "epoch": 2569} {"train_loss": -6.375335216522217, "global_step": 107926, "epoch": 2569} {"train_loss": -6.373446464538574, "global_step": 107927, "epoch": 2569} {"train_loss": -6.41188907623291, "global_step": 107928, "epoch": 2569} {"train_loss": -6.362773895263672, "global_step": 107929, "epoch": 2569} {"train_loss": -6.428701877593994, "global_step": 107930, "epoch": 2569} {"train_loss": -6.4539337158203125, "global_step": 107931, "epoch": 2569} {"train_loss": -6.379899978637695, "global_step": 107932, "epoch": 2569} {"train_loss": -6.403087615966797, "global_step": 107933, "epoch": 2569} {"train_loss": -6.556976318359375, "global_step": 107934, "epoch": 2569} {"train_loss": -6.404191017150879, "global_step": 107935, "epoch": 2569} {"train_loss": -6.423243999481201, "global_step": 107936, "epoch": 2569} {"train_loss": -6.513017654418945, "global_step": 107937, "epoch": 2569} {"train_loss": -6.3680315017700195, "global_step": 107938, "epoch": 2569} {"train_loss": -6.453261965797061, "global_step": 107939, "epoch": 2569, "val_loss": 64747.5625} {"train_loss": -6.368007659912109, "global_step": 107940, "epoch": 2570} {"train_loss": -6.455305099487305, "global_step": 107941, "epoch": 2570} {"train_loss": -6.39323616027832, "global_step": 107942, "epoch": 2570} {"train_loss": -6.256420135498047, "global_step": 107943, "epoch": 2570} {"train_loss": -6.465394973754883, "global_step": 107944, "epoch": 2570} {"train_loss": -6.432215690612793, "global_step": 107945, "epoch": 2570} {"train_loss": -6.438617706298828, "global_step": 107946, "epoch": 2570} {"train_loss": -6.495095252990723, "global_step": 107947, "epoch": 2570} {"train_loss": -6.456177711486816, "global_step": 107948, "epoch": 2570} {"train_loss": -6.428000450134277, "global_step": 107949, "epoch": 2570} {"train_loss": -6.443801403045654, "global_step": 107950, "epoch": 2570} {"train_loss": -6.39137601852417, "global_step": 107951, "epoch": 2570} {"train_loss": -6.530290126800537, "global_step": 107952, "epoch": 2570} {"train_loss": -6.414068698883057, "global_step": 107953, "epoch": 2570} {"train_loss": -6.432580471038818, "global_step": 107954, "epoch": 2570} {"train_loss": -6.3229827880859375, "global_step": 107955, "epoch": 2570} {"train_loss": -6.277605056762695, "global_step": 107956, "epoch": 2570} {"train_loss": -6.470262050628662, "global_step": 107957, "epoch": 2570} {"train_loss": -6.279123306274414, "global_step": 107958, "epoch": 2570} {"train_loss": -6.4518351554870605, "global_step": 107959, "epoch": 2570} {"train_loss": -6.3621110916137695, "global_step": 107960, "epoch": 2570} {"train_loss": -6.51942253112793, "global_step": 107961, "epoch": 2570} {"train_loss": -6.490255832672119, "global_step": 107962, "epoch": 2570} {"train_loss": -6.381582260131836, "global_step": 107963, "epoch": 2570} {"train_loss": -6.488837242126465, "global_step": 107964, "epoch": 2570} {"train_loss": -6.350893020629883, "global_step": 107965, "epoch": 2570} {"train_loss": -6.413456916809082, "global_step": 107966, "epoch": 2570} {"train_loss": -6.469799995422363, "global_step": 107967, "epoch": 2570} {"train_loss": -6.31114387512207, "global_step": 107968, "epoch": 2570} {"train_loss": -6.424033164978027, "global_step": 107969, "epoch": 2570} {"train_loss": -6.4732160568237305, "global_step": 107970, "epoch": 2570} {"train_loss": -6.356250762939453, "global_step": 107971, "epoch": 2570} {"train_loss": -6.438702583312988, "global_step": 107972, "epoch": 2570} {"train_loss": -6.3289899826049805, "global_step": 107973, "epoch": 2570} {"train_loss": -6.430628776550293, "global_step": 107974, "epoch": 2570} {"train_loss": -6.373345375061035, "global_step": 107975, "epoch": 2570} {"train_loss": -6.52210807800293, "global_step": 107976, "epoch": 2570} {"train_loss": -6.463653564453125, "global_step": 107977, "epoch": 2570} {"train_loss": -6.391157150268555, "global_step": 107978, "epoch": 2570} {"train_loss": -6.467240810394287, "global_step": 107979, "epoch": 2570} {"train_loss": -6.318513870239258, "global_step": 107980, "epoch": 2570} {"train_loss": -6.412512461344401, "global_step": 107981, "epoch": 2570, "val_loss": 64980.48046875} {"train_loss": -6.533846378326416, "global_step": 107982, "epoch": 2571} {"train_loss": -6.343170166015625, "global_step": 107983, "epoch": 2571} {"train_loss": -6.4995856285095215, "global_step": 107984, "epoch": 2571} {"train_loss": -6.3674187660217285, "global_step": 107985, "epoch": 2571} {"train_loss": -6.554828643798828, "global_step": 107986, "epoch": 2571} {"train_loss": -6.393816947937012, "global_step": 107987, "epoch": 2571} {"train_loss": -6.381402015686035, "global_step": 107988, "epoch": 2571} {"train_loss": -6.431384086608887, "global_step": 107989, "epoch": 2571} {"train_loss": -6.443553924560547, "global_step": 107990, "epoch": 2571} {"train_loss": -6.463305950164795, "global_step": 107991, "epoch": 2571} {"train_loss": -6.292232513427734, "global_step": 107992, "epoch": 2571} {"train_loss": -6.488819122314453, "global_step": 107993, "epoch": 2571} {"train_loss": -6.341653823852539, "global_step": 107994, "epoch": 2571} {"train_loss": -6.379185676574707, "global_step": 107995, "epoch": 2571} {"train_loss": -6.4599127769470215, "global_step": 107996, "epoch": 2571} {"train_loss": -6.447079658508301, "global_step": 107997, "epoch": 2571} {"train_loss": -6.46060037612915, "global_step": 107998, "epoch": 2571} {"train_loss": -6.3436279296875, "global_step": 107999, "epoch": 2571} {"train_loss": -6.436489582061768, "global_step": 108000, "epoch": 2571} {"train_loss": -6.477795600891113, "global_step": 108001, "epoch": 2571} {"train_loss": -6.405622482299805, "global_step": 108002, "epoch": 2571} {"train_loss": -6.496213912963867, "global_step": 108003, "epoch": 2571} {"train_loss": -6.420559883117676, "global_step": 108004, "epoch": 2571} {"train_loss": -6.429224014282227, "global_step": 108005, "epoch": 2571} {"train_loss": -6.258964538574219, "global_step": 108006, "epoch": 2571} {"train_loss": -6.482060432434082, "global_step": 108007, "epoch": 2571} {"train_loss": -6.416965484619141, "global_step": 108008, "epoch": 2571} {"train_loss": -6.26640510559082, "global_step": 108009, "epoch": 2571} {"train_loss": -6.448741912841797, "global_step": 108010, "epoch": 2571} {"train_loss": -6.474220275878906, "global_step": 108011, "epoch": 2571} {"train_loss": -6.332531452178955, "global_step": 108012, "epoch": 2571} {"train_loss": -6.3385233879089355, "global_step": 108013, "epoch": 2571} {"train_loss": -6.34542179107666, "global_step": 108014, "epoch": 2571} {"train_loss": -6.4613494873046875, "global_step": 108015, "epoch": 2571} {"train_loss": -6.3184967041015625, "global_step": 108016, "epoch": 2571} {"train_loss": -6.479320526123047, "global_step": 108017, "epoch": 2571} {"train_loss": -6.4582672119140625, "global_step": 108018, "epoch": 2571} {"train_loss": -6.428889274597168, "global_step": 108019, "epoch": 2571} {"train_loss": -6.397818565368652, "global_step": 108020, "epoch": 2571} {"train_loss": -6.391254425048828, "global_step": 108021, "epoch": 2571} {"train_loss": -6.538669586181641, "global_step": 108022, "epoch": 2571} {"train_loss": -6.419342574619112, "global_step": 108023, "epoch": 2571, "val_loss": 64663.5234375} {"train_loss": -6.461618900299072, "global_step": 108024, "epoch": 2572} {"train_loss": -6.423923492431641, "global_step": 108025, "epoch": 2572} {"train_loss": -6.3295207023620605, "global_step": 108026, "epoch": 2572} {"train_loss": -6.358147621154785, "global_step": 108027, "epoch": 2572} {"train_loss": -6.4373250007629395, "global_step": 108028, "epoch": 2572} {"train_loss": -6.374141693115234, "global_step": 108029, "epoch": 2572} {"train_loss": -6.511530876159668, "global_step": 108030, "epoch": 2572} {"train_loss": -6.451821327209473, "global_step": 108031, "epoch": 2572} {"train_loss": -6.507299423217773, "global_step": 108032, "epoch": 2572} {"train_loss": -6.501400947570801, "global_step": 108033, "epoch": 2572} {"train_loss": -6.339976787567139, "global_step": 108034, "epoch": 2572} {"train_loss": -6.440965175628662, "global_step": 108035, "epoch": 2572} {"train_loss": -6.390081405639648, "global_step": 108036, "epoch": 2572} {"train_loss": -6.346905708312988, "global_step": 108037, "epoch": 2572} {"train_loss": -6.448687553405762, "global_step": 108038, "epoch": 2572} {"train_loss": -6.471791744232178, "global_step": 108039, "epoch": 2572} {"train_loss": -6.484199523925781, "global_step": 108040, "epoch": 2572} {"train_loss": -6.389949798583984, "global_step": 108041, "epoch": 2572} {"train_loss": -6.411386966705322, "global_step": 108042, "epoch": 2572} {"train_loss": -6.410959243774414, "global_step": 108043, "epoch": 2572} {"train_loss": -6.380992412567139, "global_step": 108044, "epoch": 2572} {"train_loss": -6.490297317504883, "global_step": 108045, "epoch": 2572} {"train_loss": -6.39545202255249, "global_step": 108046, "epoch": 2572} {"train_loss": -6.485410690307617, "global_step": 108047, "epoch": 2572} {"train_loss": -6.429776191711426, "global_step": 108048, "epoch": 2572} {"train_loss": -6.309775352478027, "global_step": 108049, "epoch": 2572} {"train_loss": -6.397305488586426, "global_step": 108050, "epoch": 2572} {"train_loss": -6.384693145751953, "global_step": 108051, "epoch": 2572} {"train_loss": -6.364936828613281, "global_step": 108052, "epoch": 2572} {"train_loss": -6.571704387664795, "global_step": 108053, "epoch": 2572} {"train_loss": -6.432405471801758, "global_step": 108054, "epoch": 2572} {"train_loss": -6.399855136871338, "global_step": 108055, "epoch": 2572} {"train_loss": -6.522709846496582, "global_step": 108056, "epoch": 2572} {"train_loss": -6.4106950759887695, "global_step": 108057, "epoch": 2572} {"train_loss": -6.486767768859863, "global_step": 108058, "epoch": 2572} {"train_loss": -6.44462776184082, "global_step": 108059, "epoch": 2572} {"train_loss": -6.47591495513916, "global_step": 108060, "epoch": 2572} {"train_loss": -6.50064754486084, "global_step": 108061, "epoch": 2572} {"train_loss": -6.459746360778809, "global_step": 108062, "epoch": 2572} {"train_loss": -6.571849346160889, "global_step": 108063, "epoch": 2572} {"train_loss": -6.396843433380127, "global_step": 108064, "epoch": 2572} {"train_loss": -6.436101039250691, "global_step": 108065, "epoch": 2572, "val_loss": 64790.5859375} {"train_loss": -6.458703517913818, "global_step": 108066, "epoch": 2573} {"train_loss": -6.393840789794922, "global_step": 108067, "epoch": 2573} {"train_loss": -6.4653143882751465, "global_step": 108068, "epoch": 2573} {"train_loss": -6.535537242889404, "global_step": 108069, "epoch": 2573} {"train_loss": -6.474294662475586, "global_step": 108070, "epoch": 2573} {"train_loss": -6.406190872192383, "global_step": 108071, "epoch": 2573} {"train_loss": -6.467565059661865, "global_step": 108072, "epoch": 2573} {"train_loss": -6.403532028198242, "global_step": 108073, "epoch": 2573} {"train_loss": -6.3491387367248535, "global_step": 108074, "epoch": 2573} {"train_loss": -6.493542671203613, "global_step": 108075, "epoch": 2573} {"train_loss": -6.4359025955200195, "global_step": 108076, "epoch": 2573} {"train_loss": -6.466558456420898, "global_step": 108077, "epoch": 2573} {"train_loss": -6.473453521728516, "global_step": 108078, "epoch": 2573} {"train_loss": -6.4469451904296875, "global_step": 108079, "epoch": 2573} {"train_loss": -6.390712738037109, "global_step": 108080, "epoch": 2573} {"train_loss": -6.530488967895508, "global_step": 108081, "epoch": 2573} {"train_loss": -6.485115051269531, "global_step": 108082, "epoch": 2573} {"train_loss": -6.44207763671875, "global_step": 108083, "epoch": 2573} {"train_loss": -6.520097732543945, "global_step": 108084, "epoch": 2573} {"train_loss": -6.485151290893555, "global_step": 108085, "epoch": 2573} {"train_loss": -6.472844123840332, "global_step": 108086, "epoch": 2573} {"train_loss": -6.516750335693359, "global_step": 108087, "epoch": 2573} {"train_loss": -6.4078874588012695, "global_step": 108088, "epoch": 2573} {"train_loss": -6.46547794342041, "global_step": 108089, "epoch": 2573} {"train_loss": -6.490687370300293, "global_step": 108090, "epoch": 2573} {"train_loss": -6.499768257141113, "global_step": 108091, "epoch": 2573} {"train_loss": -6.431639671325684, "global_step": 108092, "epoch": 2573} {"train_loss": -6.5753326416015625, "global_step": 108093, "epoch": 2573} {"train_loss": -6.496626853942871, "global_step": 108094, "epoch": 2573} {"train_loss": -6.456104755401611, "global_step": 108095, "epoch": 2573} {"train_loss": -6.453065395355225, "global_step": 108096, "epoch": 2573} {"train_loss": -6.487560272216797, "global_step": 108097, "epoch": 2573} {"train_loss": -6.470796585083008, "global_step": 108098, "epoch": 2573} {"train_loss": -6.441218376159668, "global_step": 108099, "epoch": 2573} {"train_loss": -6.4963274002075195, "global_step": 108100, "epoch": 2573} {"train_loss": -6.427937030792236, "global_step": 108101, "epoch": 2573} {"train_loss": -6.484320640563965, "global_step": 108102, "epoch": 2573} {"train_loss": -6.397299289703369, "global_step": 108103, "epoch": 2573} {"train_loss": -6.4675374031066895, "global_step": 108104, "epoch": 2573} {"train_loss": -6.365962982177734, "global_step": 108105, "epoch": 2573} {"train_loss": -6.430215835571289, "global_step": 108106, "epoch": 2573} {"train_loss": -6.458357152484712, "global_step": 108107, "epoch": 2573, "val_loss": 64731.0} {"train_loss": -6.431783676147461, "global_step": 108108, "epoch": 2574} {"train_loss": -6.460881233215332, "global_step": 108109, "epoch": 2574} {"train_loss": -6.539074897766113, "global_step": 108110, "epoch": 2574} {"train_loss": -6.517019748687744, "global_step": 108111, "epoch": 2574} {"train_loss": -6.4900312423706055, "global_step": 108112, "epoch": 2574} {"train_loss": -6.385412216186523, "global_step": 108113, "epoch": 2574} {"train_loss": -6.586273193359375, "global_step": 108114, "epoch": 2574} {"train_loss": -6.649348735809326, "global_step": 108115, "epoch": 2574} {"train_loss": -6.421013832092285, "global_step": 108116, "epoch": 2574} {"train_loss": -6.40662145614624, "global_step": 108117, "epoch": 2574} {"train_loss": -6.388395309448242, "global_step": 108118, "epoch": 2574} {"train_loss": -6.504228115081787, "global_step": 108119, "epoch": 2574} {"train_loss": -6.488508224487305, "global_step": 108120, "epoch": 2574} {"train_loss": -6.456529140472412, "global_step": 108121, "epoch": 2574} {"train_loss": -6.517338752746582, "global_step": 108122, "epoch": 2574} {"train_loss": -6.415813446044922, "global_step": 108123, "epoch": 2574} {"train_loss": -6.49201774597168, "global_step": 108124, "epoch": 2574} {"train_loss": -6.586493492126465, "global_step": 108125, "epoch": 2574} {"train_loss": -6.5927300453186035, "global_step": 108126, "epoch": 2574} {"train_loss": -6.46191930770874, "global_step": 108127, "epoch": 2574} {"train_loss": -6.533852577209473, "global_step": 108128, "epoch": 2574} {"train_loss": -6.521366119384766, "global_step": 108129, "epoch": 2574} {"train_loss": -6.515318870544434, "global_step": 108130, "epoch": 2574} {"train_loss": -6.536273002624512, "global_step": 108131, "epoch": 2574} {"train_loss": -6.3847246170043945, "global_step": 108132, "epoch": 2574} {"train_loss": -6.549587726593018, "global_step": 108133, "epoch": 2574} {"train_loss": -6.445122718811035, "global_step": 108134, "epoch": 2574} {"train_loss": -6.466835021972656, "global_step": 108135, "epoch": 2574} {"train_loss": -6.391824722290039, "global_step": 108136, "epoch": 2574} {"train_loss": -6.553014755249023, "global_step": 108137, "epoch": 2574} {"train_loss": -6.4964213371276855, "global_step": 108138, "epoch": 2574} {"train_loss": -6.509223937988281, "global_step": 108139, "epoch": 2574} {"train_loss": -6.486643314361572, "global_step": 108140, "epoch": 2574} {"train_loss": -6.425046443939209, "global_step": 108141, "epoch": 2574} {"train_loss": -6.463229179382324, "global_step": 108142, "epoch": 2574} {"train_loss": -6.481203079223633, "global_step": 108143, "epoch": 2574} {"train_loss": -6.374626159667969, "global_step": 108144, "epoch": 2574} {"train_loss": -6.439333438873291, "global_step": 108145, "epoch": 2574} {"train_loss": -6.525028705596924, "global_step": 108146, "epoch": 2574} {"train_loss": -6.49420166015625, "global_step": 108147, "epoch": 2574} {"train_loss": -6.4558820724487305, "global_step": 108148, "epoch": 2574} {"train_loss": -6.484575214840117, "global_step": 108149, "epoch": 2574, "val_loss": 64742.0078125} {"train_loss": -6.504814147949219, "global_step": 108150, "epoch": 2575} {"train_loss": -6.409335136413574, "global_step": 108151, "epoch": 2575} {"train_loss": -6.5314435958862305, "global_step": 108152, "epoch": 2575} {"train_loss": -6.5405473709106445, "global_step": 108153, "epoch": 2575} {"train_loss": -6.566643714904785, "global_step": 108154, "epoch": 2575} {"train_loss": -6.421328067779541, "global_step": 108155, "epoch": 2575} {"train_loss": -6.537990093231201, "global_step": 108156, "epoch": 2575} {"train_loss": -6.396575927734375, "global_step": 108157, "epoch": 2575} {"train_loss": -6.452645301818848, "global_step": 108158, "epoch": 2575} {"train_loss": -6.331414222717285, "global_step": 108159, "epoch": 2575} {"train_loss": -6.334752082824707, "global_step": 108160, "epoch": 2575} {"train_loss": -6.425991058349609, "global_step": 108161, "epoch": 2575} {"train_loss": -6.403774261474609, "global_step": 108162, "epoch": 2575} {"train_loss": -6.206292629241943, "global_step": 108163, "epoch": 2575} {"train_loss": -6.296114444732666, "global_step": 108164, "epoch": 2575} {"train_loss": -6.2536516189575195, "global_step": 108165, "epoch": 2575} {"train_loss": -6.4094696044921875, "global_step": 108166, "epoch": 2575} {"train_loss": -6.395053386688232, "global_step": 108167, "epoch": 2575} {"train_loss": -6.308481216430664, "global_step": 108168, "epoch": 2575} {"train_loss": -6.354487419128418, "global_step": 108169, "epoch": 2575} {"train_loss": -6.329944133758545, "global_step": 108170, "epoch": 2575} {"train_loss": -6.199204444885254, "global_step": 108171, "epoch": 2575} {"train_loss": -6.285248279571533, "global_step": 108172, "epoch": 2575} {"train_loss": -6.354787349700928, "global_step": 108173, "epoch": 2575} {"train_loss": -6.35165548324585, "global_step": 108174, "epoch": 2575} {"train_loss": -6.213046073913574, "global_step": 108175, "epoch": 2575} {"train_loss": -6.302207946777344, "global_step": 108176, "epoch": 2575} {"train_loss": -6.375261306762695, "global_step": 108177, "epoch": 2575} {"train_loss": -6.362468719482422, "global_step": 108178, "epoch": 2575} {"train_loss": -6.384164810180664, "global_step": 108179, "epoch": 2575} {"train_loss": -6.430367469787598, "global_step": 108180, "epoch": 2575} {"train_loss": -6.382911682128906, "global_step": 108181, "epoch": 2575} {"train_loss": -6.359602928161621, "global_step": 108182, "epoch": 2575} {"train_loss": -6.308876037597656, "global_step": 108183, "epoch": 2575} {"train_loss": -6.403743267059326, "global_step": 108184, "epoch": 2575} {"train_loss": -6.405886650085449, "global_step": 108185, "epoch": 2575} {"train_loss": -6.401022911071777, "global_step": 108186, "epoch": 2575} {"train_loss": -6.500666618347168, "global_step": 108187, "epoch": 2575} {"train_loss": -6.292422771453857, "global_step": 108188, "epoch": 2575} {"train_loss": -6.477052211761475, "global_step": 108189, "epoch": 2575} {"train_loss": -6.323405742645264, "global_step": 108190, "epoch": 2575} {"train_loss": -6.379070384161813, "global_step": 108191, "epoch": 2575, "val_loss": 64764.89453125} {"train_loss": -6.370261192321777, "global_step": 108192, "epoch": 2576} {"train_loss": -6.437806606292725, "global_step": 108193, "epoch": 2576} {"train_loss": -6.3932414054870605, "global_step": 108194, "epoch": 2576} {"train_loss": -6.317960262298584, "global_step": 108195, "epoch": 2576} {"train_loss": -6.319443702697754, "global_step": 108196, "epoch": 2576} {"train_loss": -6.415010452270508, "global_step": 108197, "epoch": 2576} {"train_loss": -6.458837509155273, "global_step": 108198, "epoch": 2576} {"train_loss": -6.333840370178223, "global_step": 108199, "epoch": 2576} {"train_loss": -6.503736972808838, "global_step": 108200, "epoch": 2576} {"train_loss": -6.339459419250488, "global_step": 108201, "epoch": 2576} {"train_loss": -6.456322193145752, "global_step": 108202, "epoch": 2576} {"train_loss": -6.386852264404297, "global_step": 108203, "epoch": 2576} {"train_loss": -6.46916389465332, "global_step": 108204, "epoch": 2576} {"train_loss": -6.489080905914307, "global_step": 108205, "epoch": 2576} {"train_loss": -6.3996124267578125, "global_step": 108206, "epoch": 2576} {"train_loss": -6.430203914642334, "global_step": 108207, "epoch": 2576} {"train_loss": -6.437854290008545, "global_step": 108208, "epoch": 2576} {"train_loss": -6.436095237731934, "global_step": 108209, "epoch": 2576} {"train_loss": -6.493487358093262, "global_step": 108210, "epoch": 2576} {"train_loss": -6.376475811004639, "global_step": 108211, "epoch": 2576} {"train_loss": -6.482687950134277, "global_step": 108212, "epoch": 2576} {"train_loss": -6.477924346923828, "global_step": 108213, "epoch": 2576} {"train_loss": -6.378881454467773, "global_step": 108214, "epoch": 2576} {"train_loss": -6.551241874694824, "global_step": 108215, "epoch": 2576} {"train_loss": -6.40394926071167, "global_step": 108216, "epoch": 2576} {"train_loss": -6.565299987792969, "global_step": 108217, "epoch": 2576} {"train_loss": -6.423572540283203, "global_step": 108218, "epoch": 2576} {"train_loss": -6.3297438621521, "global_step": 108219, "epoch": 2576} {"train_loss": -6.380209922790527, "global_step": 108220, "epoch": 2576} {"train_loss": -6.392289161682129, "global_step": 108221, "epoch": 2576} {"train_loss": -6.38839054107666, "global_step": 108222, "epoch": 2576} {"train_loss": -6.527176856994629, "global_step": 108223, "epoch": 2576} {"train_loss": -6.32435941696167, "global_step": 108224, "epoch": 2576} {"train_loss": -6.479282855987549, "global_step": 108225, "epoch": 2576} {"train_loss": -6.414389610290527, "global_step": 108226, "epoch": 2576} {"train_loss": -6.481432914733887, "global_step": 108227, "epoch": 2576} {"train_loss": -6.469429016113281, "global_step": 108228, "epoch": 2576} {"train_loss": -6.471316814422607, "global_step": 108229, "epoch": 2576} {"train_loss": -6.484665393829346, "global_step": 108230, "epoch": 2576} {"train_loss": -6.368626117706299, "global_step": 108231, "epoch": 2576} {"train_loss": -6.4476318359375, "global_step": 108232, "epoch": 2576} {"train_loss": -6.428484008425758, "global_step": 108233, "epoch": 2576, "val_loss": 64851.57421875} {"train_loss": -6.333675384521484, "global_step": 108234, "epoch": 2577} {"train_loss": -6.451420307159424, "global_step": 108235, "epoch": 2577} {"train_loss": -6.446188449859619, "global_step": 108236, "epoch": 2577} {"train_loss": -6.462702751159668, "global_step": 108237, "epoch": 2577} {"train_loss": -6.478989601135254, "global_step": 108238, "epoch": 2577} {"train_loss": -6.521636962890625, "global_step": 108239, "epoch": 2577} {"train_loss": -6.472254753112793, "global_step": 108240, "epoch": 2577} {"train_loss": -6.547314643859863, "global_step": 108241, "epoch": 2577} {"train_loss": -6.374917507171631, "global_step": 108242, "epoch": 2577} {"train_loss": -6.4674272537231445, "global_step": 108243, "epoch": 2577} {"train_loss": -6.4598283767700195, "global_step": 108244, "epoch": 2577} {"train_loss": -6.401950359344482, "global_step": 108245, "epoch": 2577} {"train_loss": -6.361184597015381, "global_step": 108246, "epoch": 2577} {"train_loss": -6.383855819702148, "global_step": 108247, "epoch": 2577} {"train_loss": -6.4313273429870605, "global_step": 108248, "epoch": 2577} {"train_loss": -6.562066555023193, "global_step": 108249, "epoch": 2577} {"train_loss": -6.350732326507568, "global_step": 108250, "epoch": 2577} {"train_loss": -6.445446968078613, "global_step": 108251, "epoch": 2577} {"train_loss": -6.476104736328125, "global_step": 108252, "epoch": 2577} {"train_loss": -6.4695024490356445, "global_step": 108253, "epoch": 2577} {"train_loss": -6.396907806396484, "global_step": 108254, "epoch": 2577} {"train_loss": -6.482166767120361, "global_step": 108255, "epoch": 2577} {"train_loss": -6.5500946044921875, "global_step": 108256, "epoch": 2577} {"train_loss": -6.546097755432129, "global_step": 108257, "epoch": 2577} {"train_loss": -6.411035537719727, "global_step": 108258, "epoch": 2577} {"train_loss": -6.460391998291016, "global_step": 108259, "epoch": 2577} {"train_loss": -6.5605669021606445, "global_step": 108260, "epoch": 2577} {"train_loss": -6.503185272216797, "global_step": 108261, "epoch": 2577} {"train_loss": -6.498830795288086, "global_step": 108262, "epoch": 2577} {"train_loss": -6.474780559539795, "global_step": 108263, "epoch": 2577} {"train_loss": -6.531858444213867, "global_step": 108264, "epoch": 2577} {"train_loss": -6.360620498657227, "global_step": 108265, "epoch": 2577} {"train_loss": -6.355208396911621, "global_step": 108266, "epoch": 2577} {"train_loss": -6.338832855224609, "global_step": 108267, "epoch": 2577} {"train_loss": -6.443888187408447, "global_step": 108268, "epoch": 2577} {"train_loss": -6.4687089920043945, "global_step": 108269, "epoch": 2577} {"train_loss": -6.341294288635254, "global_step": 108270, "epoch": 2577} {"train_loss": -6.405645847320557, "global_step": 108271, "epoch": 2577} {"train_loss": -6.412723541259766, "global_step": 108272, "epoch": 2577} {"train_loss": -6.510860443115234, "global_step": 108273, "epoch": 2577} {"train_loss": -6.436567306518555, "global_step": 108274, "epoch": 2577} {"train_loss": -6.444627773194086, "global_step": 108275, "epoch": 2577, "val_loss": 64859.703125} {"train_loss": -6.515442848205566, "global_step": 108276, "epoch": 2578} {"train_loss": -6.444306373596191, "global_step": 108277, "epoch": 2578} {"train_loss": -6.3099493980407715, "global_step": 108278, "epoch": 2578} {"train_loss": -6.489152431488037, "global_step": 108279, "epoch": 2578} {"train_loss": -6.322055816650391, "global_step": 108280, "epoch": 2578} {"train_loss": -6.469444274902344, "global_step": 108281, "epoch": 2578} {"train_loss": -6.351522445678711, "global_step": 108282, "epoch": 2578} {"train_loss": -6.390700340270996, "global_step": 108283, "epoch": 2578} {"train_loss": -6.434905529022217, "global_step": 108284, "epoch": 2578} {"train_loss": -6.443299770355225, "global_step": 108285, "epoch": 2578} {"train_loss": -6.4820051193237305, "global_step": 108286, "epoch": 2578} {"train_loss": -6.304079055786133, "global_step": 108287, "epoch": 2578} {"train_loss": -6.3943963050842285, "global_step": 108288, "epoch": 2578} {"train_loss": -6.497516632080078, "global_step": 108289, "epoch": 2578} {"train_loss": -6.331549644470215, "global_step": 108290, "epoch": 2578} {"train_loss": -6.2654595375061035, "global_step": 108291, "epoch": 2578} {"train_loss": -6.439112663269043, "global_step": 108292, "epoch": 2578} {"train_loss": -6.416854381561279, "global_step": 108293, "epoch": 2578} {"train_loss": -6.426922798156738, "global_step": 108294, "epoch": 2578} {"train_loss": -6.45162296295166, "global_step": 108295, "epoch": 2578} {"train_loss": -6.378363609313965, "global_step": 108296, "epoch": 2578} {"train_loss": -6.428030967712402, "global_step": 108297, "epoch": 2578} {"train_loss": -6.324718475341797, "global_step": 108298, "epoch": 2578} {"train_loss": -6.470701217651367, "global_step": 108299, "epoch": 2578} {"train_loss": -6.453963279724121, "global_step": 108300, "epoch": 2578} {"train_loss": -6.432915687561035, "global_step": 108301, "epoch": 2578} {"train_loss": -6.418067932128906, "global_step": 108302, "epoch": 2578} {"train_loss": -6.391468048095703, "global_step": 108303, "epoch": 2578} {"train_loss": -6.435993194580078, "global_step": 108304, "epoch": 2578} {"train_loss": -6.3665289878845215, "global_step": 108305, "epoch": 2578} {"train_loss": -6.540937423706055, "global_step": 108306, "epoch": 2578} {"train_loss": -6.398099899291992, "global_step": 108307, "epoch": 2578} {"train_loss": -6.591916561126709, "global_step": 108308, "epoch": 2578} {"train_loss": -6.4262847900390625, "global_step": 108309, "epoch": 2578} {"train_loss": -6.336321830749512, "global_step": 108310, "epoch": 2578} {"train_loss": -6.498006820678711, "global_step": 108311, "epoch": 2578} {"train_loss": -6.4643940925598145, "global_step": 108312, "epoch": 2578} {"train_loss": -6.462907314300537, "global_step": 108313, "epoch": 2578} {"train_loss": -6.47250509262085, "global_step": 108314, "epoch": 2578} {"train_loss": -6.54726505279541, "global_step": 108315, "epoch": 2578} {"train_loss": -6.5387115478515625, "global_step": 108316, "epoch": 2578} {"train_loss": -6.427436817260015, "global_step": 108317, "epoch": 2578, "val_loss": 64663.34375} {"train_loss": -6.54349422454834, "global_step": 108318, "epoch": 2579} {"train_loss": -6.518804550170898, "global_step": 108319, "epoch": 2579} {"train_loss": -6.486083507537842, "global_step": 108320, "epoch": 2579} {"train_loss": -6.446537494659424, "global_step": 108321, "epoch": 2579} {"train_loss": -6.3891143798828125, "global_step": 108322, "epoch": 2579} {"train_loss": -6.494650840759277, "global_step": 108323, "epoch": 2579} {"train_loss": -6.392481803894043, "global_step": 108324, "epoch": 2579} {"train_loss": -6.465580940246582, "global_step": 108325, "epoch": 2579} {"train_loss": -6.529962062835693, "global_step": 108326, "epoch": 2579} {"train_loss": -6.3963799476623535, "global_step": 108327, "epoch": 2579} {"train_loss": -6.388897895812988, "global_step": 108328, "epoch": 2579} {"train_loss": -6.52458381652832, "global_step": 108329, "epoch": 2579} {"train_loss": -6.407691478729248, "global_step": 108330, "epoch": 2579} {"train_loss": -6.545319080352783, "global_step": 108331, "epoch": 2579} {"train_loss": -6.370718955993652, "global_step": 108332, "epoch": 2579} {"train_loss": -6.480771064758301, "global_step": 108333, "epoch": 2579} {"train_loss": -6.497085094451904, "global_step": 108334, "epoch": 2579} {"train_loss": -6.471010208129883, "global_step": 108335, "epoch": 2579} {"train_loss": -6.514122009277344, "global_step": 108336, "epoch": 2579} {"train_loss": -6.474664211273193, "global_step": 108337, "epoch": 2579} {"train_loss": -6.434963226318359, "global_step": 108338, "epoch": 2579} {"train_loss": -6.480175971984863, "global_step": 108339, "epoch": 2579} {"train_loss": -6.4835615158081055, "global_step": 108340, "epoch": 2579} {"train_loss": -6.514455795288086, "global_step": 108341, "epoch": 2579} {"train_loss": -6.446889877319336, "global_step": 108342, "epoch": 2579} {"train_loss": -6.499292373657227, "global_step": 108343, "epoch": 2579} {"train_loss": -6.492118835449219, "global_step": 108344, "epoch": 2579} {"train_loss": -6.445248126983643, "global_step": 108345, "epoch": 2579} {"train_loss": -6.495772361755371, "global_step": 108346, "epoch": 2579} {"train_loss": -6.581984519958496, "global_step": 108347, "epoch": 2579} {"train_loss": -6.472253799438477, "global_step": 108348, "epoch": 2579} {"train_loss": -6.503432273864746, "global_step": 108349, "epoch": 2579} {"train_loss": -6.473141670227051, "global_step": 108350, "epoch": 2579} {"train_loss": -6.572714805603027, "global_step": 108351, "epoch": 2579} {"train_loss": -6.488720417022705, "global_step": 108352, "epoch": 2579} {"train_loss": -6.543631076812744, "global_step": 108353, "epoch": 2579} {"train_loss": -6.596795558929443, "global_step": 108354, "epoch": 2579} {"train_loss": -6.34187650680542, "global_step": 108355, "epoch": 2579} {"train_loss": -6.516119003295898, "global_step": 108356, "epoch": 2579} {"train_loss": -6.554173469543457, "global_step": 108357, "epoch": 2579} {"train_loss": -6.5141987800598145, "global_step": 108358, "epoch": 2579} {"train_loss": -6.484308151971726, "global_step": 108359, "epoch": 2579, "val_loss": 64683.6796875} {"train_loss": -6.552829742431641, "global_step": 108360, "epoch": 2580} {"train_loss": -6.556851387023926, "global_step": 108361, "epoch": 2580} {"train_loss": -6.555098056793213, "global_step": 108362, "epoch": 2580} {"train_loss": -6.509680271148682, "global_step": 108363, "epoch": 2580} {"train_loss": -6.499882698059082, "global_step": 108364, "epoch": 2580} {"train_loss": -6.585150718688965, "global_step": 108365, "epoch": 2580} {"train_loss": -6.587888240814209, "global_step": 108366, "epoch": 2580} {"train_loss": -6.485316753387451, "global_step": 108367, "epoch": 2580} {"train_loss": -6.469945907592773, "global_step": 108368, "epoch": 2580} {"train_loss": -6.555674076080322, "global_step": 108369, "epoch": 2580} {"train_loss": -6.4047136306762695, "global_step": 108370, "epoch": 2580} {"train_loss": -6.513995170593262, "global_step": 108371, "epoch": 2580} {"train_loss": -6.454876899719238, "global_step": 108372, "epoch": 2580} {"train_loss": -6.435612678527832, "global_step": 108373, "epoch": 2580} {"train_loss": -6.514852046966553, "global_step": 108374, "epoch": 2580} {"train_loss": -6.575525283813477, "global_step": 108375, "epoch": 2580} {"train_loss": -6.499359130859375, "global_step": 108376, "epoch": 2580} {"train_loss": -6.48098087310791, "global_step": 108377, "epoch": 2580} {"train_loss": -6.518715858459473, "global_step": 108378, "epoch": 2580} {"train_loss": -6.53997802734375, "global_step": 108379, "epoch": 2580} {"train_loss": -6.550795555114746, "global_step": 108380, "epoch": 2580} {"train_loss": -6.613587379455566, "global_step": 108381, "epoch": 2580} {"train_loss": -6.566859245300293, "global_step": 108382, "epoch": 2580} {"train_loss": -6.530936241149902, "global_step": 108383, "epoch": 2580} {"train_loss": -6.521510124206543, "global_step": 108384, "epoch": 2580} {"train_loss": -6.4058732986450195, "global_step": 108385, "epoch": 2580} {"train_loss": -6.44542121887207, "global_step": 108386, "epoch": 2580} {"train_loss": -6.349948406219482, "global_step": 108387, "epoch": 2580} {"train_loss": -6.497514724731445, "global_step": 108388, "epoch": 2580} {"train_loss": -6.366395473480225, "global_step": 108389, "epoch": 2580} {"train_loss": -6.488070011138916, "global_step": 108390, "epoch": 2580} {"train_loss": -6.546919822692871, "global_step": 108391, "epoch": 2580} {"train_loss": -6.3808722496032715, "global_step": 108392, "epoch": 2580} {"train_loss": -6.4233808517456055, "global_step": 108393, "epoch": 2580} {"train_loss": -6.472476482391357, "global_step": 108394, "epoch": 2580} {"train_loss": -6.459131717681885, "global_step": 108395, "epoch": 2580} {"train_loss": -6.4722185134887695, "global_step": 108396, "epoch": 2580} {"train_loss": -6.528512954711914, "global_step": 108397, "epoch": 2580} {"train_loss": -6.433022499084473, "global_step": 108398, "epoch": 2580} {"train_loss": -6.340597152709961, "global_step": 108399, "epoch": 2580} {"train_loss": -6.502279281616211, "global_step": 108400, "epoch": 2580} {"train_loss": -6.491925546101162, "global_step": 108401, "epoch": 2580, "val_loss": 64839.16015625} {"train_loss": -6.4506611824035645, "global_step": 108402, "epoch": 2581} {"train_loss": -6.490659713745117, "global_step": 108403, "epoch": 2581} {"train_loss": -6.5257463455200195, "global_step": 108404, "epoch": 2581} {"train_loss": -6.552829742431641, "global_step": 108405, "epoch": 2581} {"train_loss": -6.641310691833496, "global_step": 108406, "epoch": 2581} {"train_loss": -6.527200698852539, "global_step": 108407, "epoch": 2581} {"train_loss": -6.307214736938477, "global_step": 108408, "epoch": 2581} {"train_loss": -6.445234298706055, "global_step": 108409, "epoch": 2581} {"train_loss": -6.420502185821533, "global_step": 108410, "epoch": 2581} {"train_loss": -6.463052272796631, "global_step": 108411, "epoch": 2581} {"train_loss": -6.385781288146973, "global_step": 108412, "epoch": 2581} {"train_loss": -6.287662029266357, "global_step": 108413, "epoch": 2581} {"train_loss": -6.429015159606934, "global_step": 108414, "epoch": 2581} {"train_loss": -6.359264373779297, "global_step": 108415, "epoch": 2581} {"train_loss": -6.33518648147583, "global_step": 108416, "epoch": 2581} {"train_loss": -6.4415669441223145, "global_step": 108417, "epoch": 2581} {"train_loss": -6.323313236236572, "global_step": 108418, "epoch": 2581} {"train_loss": -6.446044921875, "global_step": 108419, "epoch": 2581} {"train_loss": -6.427024841308594, "global_step": 108420, "epoch": 2581} {"train_loss": -6.262575626373291, "global_step": 108421, "epoch": 2581} {"train_loss": -6.346771717071533, "global_step": 108422, "epoch": 2581} {"train_loss": -6.377147674560547, "global_step": 108423, "epoch": 2581} {"train_loss": -6.36602258682251, "global_step": 108424, "epoch": 2581} {"train_loss": -6.402008056640625, "global_step": 108425, "epoch": 2581} {"train_loss": -6.388840675354004, "global_step": 108426, "epoch": 2581} {"train_loss": -6.310430526733398, "global_step": 108427, "epoch": 2581} {"train_loss": -6.231593608856201, "global_step": 108428, "epoch": 2581} {"train_loss": -6.499960899353027, "global_step": 108429, "epoch": 2581} {"train_loss": -6.366644382476807, "global_step": 108430, "epoch": 2581} {"train_loss": -6.313693046569824, "global_step": 108431, "epoch": 2581} {"train_loss": -6.318861961364746, "global_step": 108432, "epoch": 2581} {"train_loss": -6.3256001472473145, "global_step": 108433, "epoch": 2581} {"train_loss": -6.345213413238525, "global_step": 108434, "epoch": 2581} {"train_loss": -6.345630645751953, "global_step": 108435, "epoch": 2581} {"train_loss": -6.511970520019531, "global_step": 108436, "epoch": 2581} {"train_loss": -6.377517223358154, "global_step": 108437, "epoch": 2581} {"train_loss": -6.356382369995117, "global_step": 108438, "epoch": 2581} {"train_loss": -6.419670104980469, "global_step": 108439, "epoch": 2581} {"train_loss": -6.401279926300049, "global_step": 108440, "epoch": 2581} {"train_loss": -6.478513240814209, "global_step": 108441, "epoch": 2581} {"train_loss": -6.3929338455200195, "global_step": 108442, "epoch": 2581} {"train_loss": -6.398807571047828, "global_step": 108443, "epoch": 2581, "val_loss": 64981.4296875} {"train_loss": -6.31855583190918, "global_step": 108444, "epoch": 2582} {"train_loss": -6.54006814956665, "global_step": 108445, "epoch": 2582} {"train_loss": -6.447556018829346, "global_step": 108446, "epoch": 2582} {"train_loss": -6.505357265472412, "global_step": 108447, "epoch": 2582} {"train_loss": -6.435286521911621, "global_step": 108448, "epoch": 2582} {"train_loss": -6.4176926612854, "global_step": 108449, "epoch": 2582} {"train_loss": -6.47003173828125, "global_step": 108450, "epoch": 2582} {"train_loss": -6.539752006530762, "global_step": 108451, "epoch": 2582} {"train_loss": -6.406726837158203, "global_step": 108452, "epoch": 2582} {"train_loss": -6.498634338378906, "global_step": 108453, "epoch": 2582} {"train_loss": -6.49355411529541, "global_step": 108454, "epoch": 2582} {"train_loss": -6.412771224975586, "global_step": 108455, "epoch": 2582} {"train_loss": -6.515106201171875, "global_step": 108456, "epoch": 2582} {"train_loss": -6.354175567626953, "global_step": 108457, "epoch": 2582} {"train_loss": -6.426192283630371, "global_step": 108458, "epoch": 2582} {"train_loss": -6.405965805053711, "global_step": 108459, "epoch": 2582} {"train_loss": -6.4465155601501465, "global_step": 108460, "epoch": 2582} {"train_loss": -6.483669281005859, "global_step": 108461, "epoch": 2582} {"train_loss": -6.2877516746521, "global_step": 108462, "epoch": 2582} {"train_loss": -6.422183513641357, "global_step": 108463, "epoch": 2582} {"train_loss": -6.45695686340332, "global_step": 108464, "epoch": 2582} {"train_loss": -6.290925025939941, "global_step": 108465, "epoch": 2582} {"train_loss": -6.511590957641602, "global_step": 108466, "epoch": 2582} {"train_loss": -6.434642791748047, "global_step": 108467, "epoch": 2582} {"train_loss": -6.360830307006836, "global_step": 108468, "epoch": 2582} {"train_loss": -6.550879955291748, "global_step": 108469, "epoch": 2582} {"train_loss": -6.393226623535156, "global_step": 108470, "epoch": 2582} {"train_loss": -6.493587493896484, "global_step": 108471, "epoch": 2582} {"train_loss": -6.376327991485596, "global_step": 108472, "epoch": 2582} {"train_loss": -6.453728675842285, "global_step": 108473, "epoch": 2582} {"train_loss": -6.456831932067871, "global_step": 108474, "epoch": 2582} {"train_loss": -6.52653169631958, "global_step": 108475, "epoch": 2582} {"train_loss": -6.535661697387695, "global_step": 108476, "epoch": 2582} {"train_loss": -6.392920017242432, "global_step": 108477, "epoch": 2582} {"train_loss": -6.286736011505127, "global_step": 108478, "epoch": 2582} {"train_loss": -6.475923538208008, "global_step": 108479, "epoch": 2582} {"train_loss": -6.573017120361328, "global_step": 108480, "epoch": 2582} {"train_loss": -6.533320426940918, "global_step": 108481, "epoch": 2582} {"train_loss": -6.558037757873535, "global_step": 108482, "epoch": 2582} {"train_loss": -6.423239707946777, "global_step": 108483, "epoch": 2582} {"train_loss": -6.448781490325928, "global_step": 108484, "epoch": 2582} {"train_loss": -6.4474809396834605, "global_step": 108485, "epoch": 2582, "val_loss": 64823.109375} {"train_loss": -6.548221111297607, "global_step": 108486, "epoch": 2583} {"train_loss": -6.518914699554443, "global_step": 108487, "epoch": 2583} {"train_loss": -6.565800189971924, "global_step": 108488, "epoch": 2583} {"train_loss": -6.435833930969238, "global_step": 108489, "epoch": 2583} {"train_loss": -6.557456016540527, "global_step": 108490, "epoch": 2583} {"train_loss": -6.468465805053711, "global_step": 108491, "epoch": 2583} {"train_loss": -6.514078140258789, "global_step": 108492, "epoch": 2583} {"train_loss": -6.340005874633789, "global_step": 108493, "epoch": 2583} {"train_loss": -6.376113414764404, "global_step": 108494, "epoch": 2583} {"train_loss": -6.463548183441162, "global_step": 108495, "epoch": 2583} {"train_loss": -6.4775004386901855, "global_step": 108496, "epoch": 2583} {"train_loss": -6.422861099243164, "global_step": 108497, "epoch": 2583} {"train_loss": -6.440458297729492, "global_step": 108498, "epoch": 2583} {"train_loss": -6.529528617858887, "global_step": 108499, "epoch": 2583} {"train_loss": -6.452605247497559, "global_step": 108500, "epoch": 2583} {"train_loss": -6.463621139526367, "global_step": 108501, "epoch": 2583} {"train_loss": -6.560365676879883, "global_step": 108502, "epoch": 2583} {"train_loss": -6.443734645843506, "global_step": 108503, "epoch": 2583} {"train_loss": -6.505478382110596, "global_step": 108504, "epoch": 2583} {"train_loss": -6.464816570281982, "global_step": 108505, "epoch": 2583} {"train_loss": -6.438304424285889, "global_step": 108506, "epoch": 2583} {"train_loss": -6.51285982131958, "global_step": 108507, "epoch": 2583} {"train_loss": -6.477513313293457, "global_step": 108508, "epoch": 2583} {"train_loss": -6.346908092498779, "global_step": 108509, "epoch": 2583} {"train_loss": -6.479519844055176, "global_step": 108510, "epoch": 2583} {"train_loss": -6.438271522521973, "global_step": 108511, "epoch": 2583} {"train_loss": -6.586259841918945, "global_step": 108512, "epoch": 2583} {"train_loss": -6.353188514709473, "global_step": 108513, "epoch": 2583} {"train_loss": -6.3585710525512695, "global_step": 108514, "epoch": 2583} {"train_loss": -6.471567153930664, "global_step": 108515, "epoch": 2583} {"train_loss": -6.418367385864258, "global_step": 108516, "epoch": 2583} {"train_loss": -6.371933937072754, "global_step": 108517, "epoch": 2583} {"train_loss": -6.40049409866333, "global_step": 108518, "epoch": 2583} {"train_loss": -6.531493663787842, "global_step": 108519, "epoch": 2583} {"train_loss": -6.514764785766602, "global_step": 108520, "epoch": 2583} {"train_loss": -6.4808502197265625, "global_step": 108521, "epoch": 2583} {"train_loss": -6.415119647979736, "global_step": 108522, "epoch": 2583} {"train_loss": -6.395257949829102, "global_step": 108523, "epoch": 2583} {"train_loss": -6.445220947265625, "global_step": 108524, "epoch": 2583} {"train_loss": -6.391204833984375, "global_step": 108525, "epoch": 2583} {"train_loss": -6.530613899230957, "global_step": 108526, "epoch": 2583} {"train_loss": -6.458251215162731, "global_step": 108527, "epoch": 2583, "val_loss": 64751.75390625} {"train_loss": -6.586894989013672, "global_step": 108528, "epoch": 2584} {"train_loss": -6.468694686889648, "global_step": 108529, "epoch": 2584} {"train_loss": -6.59445858001709, "global_step": 108530, "epoch": 2584} {"train_loss": -6.470770835876465, "global_step": 108531, "epoch": 2584} {"train_loss": -6.431129455566406, "global_step": 108532, "epoch": 2584} {"train_loss": -6.600521564483643, "global_step": 108533, "epoch": 2584} {"train_loss": -6.4238176345825195, "global_step": 108534, "epoch": 2584} {"train_loss": -6.480651378631592, "global_step": 108535, "epoch": 2584} {"train_loss": -6.5136799812316895, "global_step": 108536, "epoch": 2584} {"train_loss": -6.587282180786133, "global_step": 108537, "epoch": 2584} {"train_loss": -6.461560249328613, "global_step": 108538, "epoch": 2584} {"train_loss": -6.463772773742676, "global_step": 108539, "epoch": 2584} {"train_loss": -6.447128772735596, "global_step": 108540, "epoch": 2584} {"train_loss": -6.582784652709961, "global_step": 108541, "epoch": 2584} {"train_loss": -6.4806294441223145, "global_step": 108542, "epoch": 2584} {"train_loss": -6.556697845458984, "global_step": 108543, "epoch": 2584} {"train_loss": -6.347508430480957, "global_step": 108544, "epoch": 2584} {"train_loss": -6.423070907592773, "global_step": 108545, "epoch": 2584} {"train_loss": -6.420907974243164, "global_step": 108546, "epoch": 2584} {"train_loss": -6.521207809448242, "global_step": 108547, "epoch": 2584} {"train_loss": -6.425705909729004, "global_step": 108548, "epoch": 2584} {"train_loss": -6.59407377243042, "global_step": 108549, "epoch": 2584} {"train_loss": -6.455625534057617, "global_step": 108550, "epoch": 2584} {"train_loss": -6.451879501342773, "global_step": 108551, "epoch": 2584} {"train_loss": -6.415866374969482, "global_step": 108552, "epoch": 2584} {"train_loss": -6.54149055480957, "global_step": 108553, "epoch": 2584} {"train_loss": -6.640840530395508, "global_step": 108554, "epoch": 2584} {"train_loss": -6.548046112060547, "global_step": 108555, "epoch": 2584} {"train_loss": -6.534571647644043, "global_step": 108556, "epoch": 2584} {"train_loss": -6.489333152770996, "global_step": 108557, "epoch": 2584} {"train_loss": -6.46602725982666, "global_step": 108558, "epoch": 2584} {"train_loss": -6.5340375900268555, "global_step": 108559, "epoch": 2584} {"train_loss": -6.340099334716797, "global_step": 108560, "epoch": 2584} {"train_loss": -6.559507846832275, "global_step": 108561, "epoch": 2584} {"train_loss": -6.512463569641113, "global_step": 108562, "epoch": 2584} {"train_loss": -6.525062084197998, "global_step": 108563, "epoch": 2584} {"train_loss": -6.424568176269531, "global_step": 108564, "epoch": 2584} {"train_loss": -6.563923358917236, "global_step": 108565, "epoch": 2584} {"train_loss": -6.382535934448242, "global_step": 108566, "epoch": 2584} {"train_loss": -6.362676620483398, "global_step": 108567, "epoch": 2584} {"train_loss": -6.507485389709473, "global_step": 108568, "epoch": 2584} {"train_loss": -6.490287417457218, "global_step": 108569, "epoch": 2584, "val_loss": 64903.83984375} {"train_loss": -6.454349994659424, "global_step": 108570, "epoch": 2585} {"train_loss": -6.497405529022217, "global_step": 108571, "epoch": 2585} {"train_loss": -6.338805198669434, "global_step": 108572, "epoch": 2585} {"train_loss": -6.476655960083008, "global_step": 108573, "epoch": 2585} {"train_loss": -6.58988094329834, "global_step": 108574, "epoch": 2585} {"train_loss": -6.539548873901367, "global_step": 108575, "epoch": 2585} {"train_loss": -6.402607440948486, "global_step": 108576, "epoch": 2585} {"train_loss": -6.539796829223633, "global_step": 108577, "epoch": 2585} {"train_loss": -6.348686695098877, "global_step": 108578, "epoch": 2585} {"train_loss": -6.450261116027832, "global_step": 108579, "epoch": 2585} {"train_loss": -6.562228202819824, "global_step": 108580, "epoch": 2585} {"train_loss": -6.372422695159912, "global_step": 108581, "epoch": 2585} {"train_loss": -6.366529941558838, "global_step": 108582, "epoch": 2585} {"train_loss": -6.631738662719727, "global_step": 108583, "epoch": 2585} {"train_loss": -6.484426021575928, "global_step": 108584, "epoch": 2585} {"train_loss": -6.497620582580566, "global_step": 108585, "epoch": 2585} {"train_loss": -6.42894172668457, "global_step": 108586, "epoch": 2585} {"train_loss": -6.499856948852539, "global_step": 108587, "epoch": 2585} {"train_loss": -6.392460346221924, "global_step": 108588, "epoch": 2585} {"train_loss": -6.444948196411133, "global_step": 108589, "epoch": 2585} {"train_loss": -6.4756340980529785, "global_step": 108590, "epoch": 2585} {"train_loss": -6.355844497680664, "global_step": 108591, "epoch": 2585} {"train_loss": -6.384086608886719, "global_step": 108592, "epoch": 2585} {"train_loss": -6.3637895584106445, "global_step": 108593, "epoch": 2585} {"train_loss": -6.339882850646973, "global_step": 108594, "epoch": 2585} {"train_loss": -6.383947372436523, "global_step": 108595, "epoch": 2585} {"train_loss": -6.406693458557129, "global_step": 108596, "epoch": 2585} {"train_loss": -6.4302287101745605, "global_step": 108597, "epoch": 2585} {"train_loss": -6.435915946960449, "global_step": 108598, "epoch": 2585} {"train_loss": -6.35366153717041, "global_step": 108599, "epoch": 2585} {"train_loss": -6.438889503479004, "global_step": 108600, "epoch": 2585} {"train_loss": -6.375067710876465, "global_step": 108601, "epoch": 2585} {"train_loss": -6.413436412811279, "global_step": 108602, "epoch": 2585} {"train_loss": -6.460383892059326, "global_step": 108603, "epoch": 2585} {"train_loss": -6.497682094573975, "global_step": 108604, "epoch": 2585} {"train_loss": -6.458391189575195, "global_step": 108605, "epoch": 2585} {"train_loss": -6.424938201904297, "global_step": 108606, "epoch": 2585} {"train_loss": -6.42526912689209, "global_step": 108607, "epoch": 2585} {"train_loss": -6.521247386932373, "global_step": 108608, "epoch": 2585} {"train_loss": -6.399369716644287, "global_step": 108609, "epoch": 2585} {"train_loss": -6.533743381500244, "global_step": 108610, "epoch": 2585} {"train_loss": -6.445871534801665, "global_step": 108611, "epoch": 2585, "val_loss": 64888.0859375} {"train_loss": -6.465974807739258, "global_step": 108612, "epoch": 2586} {"train_loss": -6.533581733703613, "global_step": 108613, "epoch": 2586} {"train_loss": -6.532495498657227, "global_step": 108614, "epoch": 2586} {"train_loss": -6.599100112915039, "global_step": 108615, "epoch": 2586} {"train_loss": -6.493832588195801, "global_step": 108616, "epoch": 2586} {"train_loss": -6.410407543182373, "global_step": 108617, "epoch": 2586} {"train_loss": -6.414908409118652, "global_step": 108618, "epoch": 2586} {"train_loss": -6.495145320892334, "global_step": 108619, "epoch": 2586} {"train_loss": -6.638047695159912, "global_step": 108620, "epoch": 2586} {"train_loss": -6.4091033935546875, "global_step": 108621, "epoch": 2586} {"train_loss": -6.478365898132324, "global_step": 108622, "epoch": 2586} {"train_loss": -6.586174011230469, "global_step": 108623, "epoch": 2586} {"train_loss": -6.469602584838867, "global_step": 108624, "epoch": 2586} {"train_loss": -6.4829535484313965, "global_step": 108625, "epoch": 2586} {"train_loss": -6.427664279937744, "global_step": 108626, "epoch": 2586} {"train_loss": -6.468578338623047, "global_step": 108627, "epoch": 2586} {"train_loss": -6.47031831741333, "global_step": 108628, "epoch": 2586} {"train_loss": -6.461714744567871, "global_step": 108629, "epoch": 2586} {"train_loss": -6.505853176116943, "global_step": 108630, "epoch": 2586} {"train_loss": -6.555611610412598, "global_step": 108631, "epoch": 2586} {"train_loss": -6.464550971984863, "global_step": 108632, "epoch": 2586} {"train_loss": -6.403438568115234, "global_step": 108633, "epoch": 2586} {"train_loss": -6.511126518249512, "global_step": 108634, "epoch": 2586} {"train_loss": -6.389193534851074, "global_step": 108635, "epoch": 2586} {"train_loss": -6.518390655517578, "global_step": 108636, "epoch": 2586} {"train_loss": -6.465169906616211, "global_step": 108637, "epoch": 2586} {"train_loss": -6.502857208251953, "global_step": 108638, "epoch": 2586} {"train_loss": -6.433645248413086, "global_step": 108639, "epoch": 2586} {"train_loss": -6.449251651763916, "global_step": 108640, "epoch": 2586} {"train_loss": -6.594762325286865, "global_step": 108641, "epoch": 2586} {"train_loss": -6.501920700073242, "global_step": 108642, "epoch": 2586} {"train_loss": -6.475769996643066, "global_step": 108643, "epoch": 2586} {"train_loss": -6.59904146194458, "global_step": 108644, "epoch": 2586} {"train_loss": -6.506167411804199, "global_step": 108645, "epoch": 2586} {"train_loss": -6.567922592163086, "global_step": 108646, "epoch": 2586} {"train_loss": -6.383123397827148, "global_step": 108647, "epoch": 2586} {"train_loss": -6.391651153564453, "global_step": 108648, "epoch": 2586} {"train_loss": -6.4754743576049805, "global_step": 108649, "epoch": 2586} {"train_loss": -6.498884201049805, "global_step": 108650, "epoch": 2586} {"train_loss": -6.540119647979736, "global_step": 108651, "epoch": 2586} {"train_loss": -6.4382195472717285, "global_step": 108652, "epoch": 2586} {"train_loss": -6.487854208265032, "global_step": 108653, "epoch": 2586, "val_loss": 64879.60546875} {"train_loss": -6.471912860870361, "global_step": 108654, "epoch": 2587} {"train_loss": -6.524333953857422, "global_step": 108655, "epoch": 2587} {"train_loss": -6.4259796142578125, "global_step": 108656, "epoch": 2587} {"train_loss": -6.487788677215576, "global_step": 108657, "epoch": 2587} {"train_loss": -6.464641094207764, "global_step": 108658, "epoch": 2587} {"train_loss": -6.515089988708496, "global_step": 108659, "epoch": 2587} {"train_loss": -6.482616424560547, "global_step": 108660, "epoch": 2587} {"train_loss": -6.5256171226501465, "global_step": 108661, "epoch": 2587} {"train_loss": -6.4674601554870605, "global_step": 108662, "epoch": 2587} {"train_loss": -6.351798057556152, "global_step": 108663, "epoch": 2587} {"train_loss": -6.426459312438965, "global_step": 108664, "epoch": 2587} {"train_loss": -6.474411964416504, "global_step": 108665, "epoch": 2587} {"train_loss": -6.352212429046631, "global_step": 108666, "epoch": 2587} {"train_loss": -6.28928279876709, "global_step": 108667, "epoch": 2587} {"train_loss": -6.323535919189453, "global_step": 108668, "epoch": 2587} {"train_loss": -6.438450813293457, "global_step": 108669, "epoch": 2587} {"train_loss": -6.282019138336182, "global_step": 108670, "epoch": 2587} {"train_loss": -6.266507148742676, "global_step": 108671, "epoch": 2587} {"train_loss": -6.490418910980225, "global_step": 108672, "epoch": 2587} {"train_loss": -6.3908162117004395, "global_step": 108673, "epoch": 2587} {"train_loss": -6.308825492858887, "global_step": 108674, "epoch": 2587} {"train_loss": -6.388173580169678, "global_step": 108675, "epoch": 2587} {"train_loss": -6.32882022857666, "global_step": 108676, "epoch": 2587} {"train_loss": -6.331196308135986, "global_step": 108677, "epoch": 2587} {"train_loss": -6.282265663146973, "global_step": 108678, "epoch": 2587} {"train_loss": -6.387172698974609, "global_step": 108679, "epoch": 2587} {"train_loss": -6.37484073638916, "global_step": 108680, "epoch": 2587} {"train_loss": -6.357470512390137, "global_step": 108681, "epoch": 2587} {"train_loss": -6.379255294799805, "global_step": 108682, "epoch": 2587} {"train_loss": -6.265847206115723, "global_step": 108683, "epoch": 2587} {"train_loss": -6.38755464553833, "global_step": 108684, "epoch": 2587} {"train_loss": -6.323920249938965, "global_step": 108685, "epoch": 2587} {"train_loss": -6.424347877502441, "global_step": 108686, "epoch": 2587} {"train_loss": -6.378718376159668, "global_step": 108687, "epoch": 2587} {"train_loss": -6.4822187423706055, "global_step": 108688, "epoch": 2587} {"train_loss": -6.40993595123291, "global_step": 108689, "epoch": 2587} {"train_loss": -6.362541198730469, "global_step": 108690, "epoch": 2587} {"train_loss": -6.409299850463867, "global_step": 108691, "epoch": 2587} {"train_loss": -6.235152244567871, "global_step": 108692, "epoch": 2587} {"train_loss": -6.427028179168701, "global_step": 108693, "epoch": 2587} {"train_loss": -6.321788787841797, "global_step": 108694, "epoch": 2587} {"train_loss": -6.3916440804799395, "global_step": 108695, "epoch": 2587, "val_loss": 64628.08203125} {"train_loss": -6.326357841491699, "global_step": 108696, "epoch": 2588} {"train_loss": -6.440317630767822, "global_step": 108697, "epoch": 2588} {"train_loss": -6.329363822937012, "global_step": 108698, "epoch": 2588} {"train_loss": -6.297768592834473, "global_step": 108699, "epoch": 2588} {"train_loss": -6.361597061157227, "global_step": 108700, "epoch": 2588} {"train_loss": -6.399641990661621, "global_step": 108701, "epoch": 2588} {"train_loss": -6.3615522384643555, "global_step": 108702, "epoch": 2588} {"train_loss": -6.269587993621826, "global_step": 108703, "epoch": 2588} {"train_loss": -6.428427696228027, "global_step": 108704, "epoch": 2588} {"train_loss": -6.41663932800293, "global_step": 108705, "epoch": 2588} {"train_loss": -6.43120813369751, "global_step": 108706, "epoch": 2588} {"train_loss": -6.479576110839844, "global_step": 108707, "epoch": 2588} {"train_loss": -6.356274604797363, "global_step": 108708, "epoch": 2588} {"train_loss": -6.451463222503662, "global_step": 108709, "epoch": 2588} {"train_loss": -6.36509895324707, "global_step": 108710, "epoch": 2588} {"train_loss": -6.394272804260254, "global_step": 108711, "epoch": 2588} {"train_loss": -6.434499740600586, "global_step": 108712, "epoch": 2588} {"train_loss": -6.312959671020508, "global_step": 108713, "epoch": 2588} {"train_loss": -6.510415077209473, "global_step": 108714, "epoch": 2588} {"train_loss": -6.377832412719727, "global_step": 108715, "epoch": 2588} {"train_loss": -6.453540802001953, "global_step": 108716, "epoch": 2588} {"train_loss": -6.415003776550293, "global_step": 108717, "epoch": 2588} {"train_loss": -6.3550214767456055, "global_step": 108718, "epoch": 2588} {"train_loss": -6.359251022338867, "global_step": 108719, "epoch": 2588} {"train_loss": -6.430885314941406, "global_step": 108720, "epoch": 2588} {"train_loss": -6.480251312255859, "global_step": 108721, "epoch": 2588} {"train_loss": -6.484963417053223, "global_step": 108722, "epoch": 2588} {"train_loss": -6.422390937805176, "global_step": 108723, "epoch": 2588} {"train_loss": -6.383240222930908, "global_step": 108724, "epoch": 2588} {"train_loss": -6.461297035217285, "global_step": 108725, "epoch": 2588} {"train_loss": -6.527901649475098, "global_step": 108726, "epoch": 2588} {"train_loss": -6.474885940551758, "global_step": 108727, "epoch": 2588} {"train_loss": -6.603944778442383, "global_step": 108728, "epoch": 2588} {"train_loss": -6.388920783996582, "global_step": 108729, "epoch": 2588} {"train_loss": -6.447904586791992, "global_step": 108730, "epoch": 2588} {"train_loss": -6.514216899871826, "global_step": 108731, "epoch": 2588} {"train_loss": -6.452960014343262, "global_step": 108732, "epoch": 2588} {"train_loss": -6.511165618896484, "global_step": 108733, "epoch": 2588} {"train_loss": -6.407010078430176, "global_step": 108734, "epoch": 2588} {"train_loss": -6.433379650115967, "global_step": 108735, "epoch": 2588} {"train_loss": -6.396740913391113, "global_step": 108736, "epoch": 2588} {"train_loss": -6.420251244590396, "global_step": 108737, "epoch": 2588, "val_loss": 64703.77734375} {"train_loss": -6.5632524490356445, "global_step": 108738, "epoch": 2589} {"train_loss": -6.452983856201172, "global_step": 108739, "epoch": 2589} {"train_loss": -6.4845685958862305, "global_step": 108740, "epoch": 2589} {"train_loss": -6.581439018249512, "global_step": 108741, "epoch": 2589} {"train_loss": -6.463762283325195, "global_step": 108742, "epoch": 2589} {"train_loss": -6.299333572387695, "global_step": 108743, "epoch": 2589} {"train_loss": -6.4638471603393555, "global_step": 108744, "epoch": 2589} {"train_loss": -6.489785194396973, "global_step": 108745, "epoch": 2589} {"train_loss": -6.54251766204834, "global_step": 108746, "epoch": 2589} {"train_loss": -6.582726955413818, "global_step": 108747, "epoch": 2589} {"train_loss": -6.528109550476074, "global_step": 108748, "epoch": 2589} {"train_loss": -6.392728328704834, "global_step": 108749, "epoch": 2589} {"train_loss": -6.448383808135986, "global_step": 108750, "epoch": 2589} {"train_loss": -6.417781829833984, "global_step": 108751, "epoch": 2589} {"train_loss": -6.4331841468811035, "global_step": 108752, "epoch": 2589} {"train_loss": -6.255916595458984, "global_step": 108753, "epoch": 2589} {"train_loss": -6.311105251312256, "global_step": 108754, "epoch": 2589} {"train_loss": -6.428983688354492, "global_step": 108755, "epoch": 2589} {"train_loss": -6.302657604217529, "global_step": 108756, "epoch": 2589} {"train_loss": -6.47120475769043, "global_step": 108757, "epoch": 2589} {"train_loss": -6.458122253417969, "global_step": 108758, "epoch": 2589} {"train_loss": -6.342612266540527, "global_step": 108759, "epoch": 2589} {"train_loss": -6.494095325469971, "global_step": 108760, "epoch": 2589} {"train_loss": -6.348995208740234, "global_step": 108761, "epoch": 2589} {"train_loss": -6.349900722503662, "global_step": 108762, "epoch": 2589} {"train_loss": -6.423321723937988, "global_step": 108763, "epoch": 2589} {"train_loss": -6.30842924118042, "global_step": 108764, "epoch": 2589} {"train_loss": -6.419488906860352, "global_step": 108765, "epoch": 2589} {"train_loss": -6.389520168304443, "global_step": 108766, "epoch": 2589} {"train_loss": -6.473598480224609, "global_step": 108767, "epoch": 2589} {"train_loss": -6.3183135986328125, "global_step": 108768, "epoch": 2589} {"train_loss": -6.326236724853516, "global_step": 108769, "epoch": 2589} {"train_loss": -6.446794033050537, "global_step": 108770, "epoch": 2589} {"train_loss": -6.392049789428711, "global_step": 108771, "epoch": 2589} {"train_loss": -6.373317718505859, "global_step": 108772, "epoch": 2589} {"train_loss": -6.372565269470215, "global_step": 108773, "epoch": 2589} {"train_loss": -6.435859680175781, "global_step": 108774, "epoch": 2589} {"train_loss": -6.335456371307373, "global_step": 108775, "epoch": 2589} {"train_loss": -6.470739841461182, "global_step": 108776, "epoch": 2589} {"train_loss": -6.566293716430664, "global_step": 108777, "epoch": 2589} {"train_loss": -6.419511795043945, "global_step": 108778, "epoch": 2589} {"train_loss": -6.425103380566552, "global_step": 108779, "epoch": 2589, "val_loss": 64789.3359375} {"train_loss": -6.430718421936035, "global_step": 108780, "epoch": 2590} {"train_loss": -6.377706527709961, "global_step": 108781, "epoch": 2590} {"train_loss": -6.430607795715332, "global_step": 108782, "epoch": 2590} {"train_loss": -6.404971599578857, "global_step": 108783, "epoch": 2590} {"train_loss": -6.379133224487305, "global_step": 108784, "epoch": 2590} {"train_loss": -6.36480712890625, "global_step": 108785, "epoch": 2590} {"train_loss": -6.489854335784912, "global_step": 108786, "epoch": 2590} {"train_loss": -6.552906036376953, "global_step": 108787, "epoch": 2590} {"train_loss": -6.444250583648682, "global_step": 108788, "epoch": 2590} {"train_loss": -6.572071075439453, "global_step": 108789, "epoch": 2590} {"train_loss": -6.415106296539307, "global_step": 108790, "epoch": 2590} {"train_loss": -6.50237512588501, "global_step": 108791, "epoch": 2590} {"train_loss": -6.575760364532471, "global_step": 108792, "epoch": 2590} {"train_loss": -6.45867919921875, "global_step": 108793, "epoch": 2590} {"train_loss": -6.502330303192139, "global_step": 108794, "epoch": 2590} {"train_loss": -6.477567672729492, "global_step": 108795, "epoch": 2590} {"train_loss": -6.4264655113220215, "global_step": 108796, "epoch": 2590} {"train_loss": -6.385807037353516, "global_step": 108797, "epoch": 2590} {"train_loss": -6.557778358459473, "global_step": 108798, "epoch": 2590} {"train_loss": -6.4706950187683105, "global_step": 108799, "epoch": 2590} {"train_loss": -6.44185209274292, "global_step": 108800, "epoch": 2590} {"train_loss": -6.450323104858398, "global_step": 108801, "epoch": 2590} {"train_loss": -6.4982171058654785, "global_step": 108802, "epoch": 2590} {"train_loss": -6.547152519226074, "global_step": 108803, "epoch": 2590} {"train_loss": -6.432708740234375, "global_step": 108804, "epoch": 2590} {"train_loss": -6.481825828552246, "global_step": 108805, "epoch": 2590} {"train_loss": -6.503672122955322, "global_step": 108806, "epoch": 2590} {"train_loss": -6.455939769744873, "global_step": 108807, "epoch": 2590} {"train_loss": -6.507301330566406, "global_step": 108808, "epoch": 2590} {"train_loss": -6.417207717895508, "global_step": 108809, "epoch": 2590} {"train_loss": -6.414175510406494, "global_step": 108810, "epoch": 2590} {"train_loss": -6.5704522132873535, "global_step": 108811, "epoch": 2590} {"train_loss": -6.521205425262451, "global_step": 108812, "epoch": 2590} {"train_loss": -6.411090850830078, "global_step": 108813, "epoch": 2590} {"train_loss": -6.503229141235352, "global_step": 108814, "epoch": 2590} {"train_loss": -6.4014692306518555, "global_step": 108815, "epoch": 2590} {"train_loss": -6.526894569396973, "global_step": 108816, "epoch": 2590} {"train_loss": -6.418814659118652, "global_step": 108817, "epoch": 2590} {"train_loss": -6.524918556213379, "global_step": 108818, "epoch": 2590} {"train_loss": -6.45616340637207, "global_step": 108819, "epoch": 2590} {"train_loss": -6.462349891662598, "global_step": 108820, "epoch": 2590} {"train_loss": -6.466611589704241, "global_step": 108821, "epoch": 2590, "val_loss": 64866.359375} {"train_loss": -6.521857738494873, "global_step": 108822, "epoch": 2591} {"train_loss": -6.514265060424805, "global_step": 108823, "epoch": 2591} {"train_loss": -6.556476593017578, "global_step": 108824, "epoch": 2591} {"train_loss": -6.554088592529297, "global_step": 108825, "epoch": 2591} {"train_loss": -6.4228057861328125, "global_step": 108826, "epoch": 2591} {"train_loss": -6.437138080596924, "global_step": 108827, "epoch": 2591} {"train_loss": -6.385151386260986, "global_step": 108828, "epoch": 2591} {"train_loss": -6.377811908721924, "global_step": 108829, "epoch": 2591} {"train_loss": -6.447220802307129, "global_step": 108830, "epoch": 2591} {"train_loss": -6.464012145996094, "global_step": 108831, "epoch": 2591} {"train_loss": -6.515658378601074, "global_step": 108832, "epoch": 2591} {"train_loss": -6.425745010375977, "global_step": 108833, "epoch": 2591} {"train_loss": -6.427252769470215, "global_step": 108834, "epoch": 2591} {"train_loss": -6.542649269104004, "global_step": 108835, "epoch": 2591} {"train_loss": -6.366613388061523, "global_step": 108836, "epoch": 2591} {"train_loss": -6.465949058532715, "global_step": 108837, "epoch": 2591} {"train_loss": -6.435796737670898, "global_step": 108838, "epoch": 2591} {"train_loss": -6.319721221923828, "global_step": 108839, "epoch": 2591} {"train_loss": -6.552204608917236, "global_step": 108840, "epoch": 2591} {"train_loss": -6.459568023681641, "global_step": 108841, "epoch": 2591} {"train_loss": -6.524191856384277, "global_step": 108842, "epoch": 2591} {"train_loss": -6.503105640411377, "global_step": 108843, "epoch": 2591} {"train_loss": -6.486085891723633, "global_step": 108844, "epoch": 2591} {"train_loss": -6.462185859680176, "global_step": 108845, "epoch": 2591} {"train_loss": -6.46142578125, "global_step": 108846, "epoch": 2591} {"train_loss": -6.4661054611206055, "global_step": 108847, "epoch": 2591} {"train_loss": -6.547601222991943, "global_step": 108848, "epoch": 2591} {"train_loss": -6.493361473083496, "global_step": 108849, "epoch": 2591} {"train_loss": -6.579918384552002, "global_step": 108850, "epoch": 2591} {"train_loss": -6.421657085418701, "global_step": 108851, "epoch": 2591} {"train_loss": -6.537441730499268, "global_step": 108852, "epoch": 2591} {"train_loss": -6.416770935058594, "global_step": 108853, "epoch": 2591} {"train_loss": -6.4153971672058105, "global_step": 108854, "epoch": 2591} {"train_loss": -6.268451690673828, "global_step": 108855, "epoch": 2591} {"train_loss": -6.473252296447754, "global_step": 108856, "epoch": 2591} {"train_loss": -6.393479347229004, "global_step": 108857, "epoch": 2591} {"train_loss": -6.202241897583008, "global_step": 108858, "epoch": 2591} {"train_loss": -6.529520511627197, "global_step": 108859, "epoch": 2591} {"train_loss": -6.383439064025879, "global_step": 108860, "epoch": 2591} {"train_loss": -6.343520164489746, "global_step": 108861, "epoch": 2591} {"train_loss": -6.517274856567383, "global_step": 108862, "epoch": 2591} {"train_loss": -6.4476489680153986, "global_step": 108863, "epoch": 2591, "val_loss": 64925.3203125} {"train_loss": -6.5272417068481445, "global_step": 108864, "epoch": 2592} {"train_loss": -6.411838531494141, "global_step": 108865, "epoch": 2592} {"train_loss": -6.378366470336914, "global_step": 108866, "epoch": 2592} {"train_loss": -6.429551601409912, "global_step": 108867, "epoch": 2592} {"train_loss": -6.387819766998291, "global_step": 108868, "epoch": 2592} {"train_loss": -6.469823360443115, "global_step": 108869, "epoch": 2592} {"train_loss": -6.4046478271484375, "global_step": 108870, "epoch": 2592} {"train_loss": -6.49697208404541, "global_step": 108871, "epoch": 2592} {"train_loss": -6.518899440765381, "global_step": 108872, "epoch": 2592} {"train_loss": -6.475439071655273, "global_step": 108873, "epoch": 2592} {"train_loss": -6.453366756439209, "global_step": 108874, "epoch": 2592} {"train_loss": -6.432010650634766, "global_step": 108875, "epoch": 2592} {"train_loss": -6.488504886627197, "global_step": 108876, "epoch": 2592} {"train_loss": -6.515685081481934, "global_step": 108877, "epoch": 2592} {"train_loss": -6.439913272857666, "global_step": 108878, "epoch": 2592} {"train_loss": -6.396496772766113, "global_step": 108879, "epoch": 2592} {"train_loss": -6.575547695159912, "global_step": 108880, "epoch": 2592} {"train_loss": -6.44623327255249, "global_step": 108881, "epoch": 2592} {"train_loss": -6.4002814292907715, "global_step": 108882, "epoch": 2592} {"train_loss": -6.508406639099121, "global_step": 108883, "epoch": 2592} {"train_loss": -6.369243144989014, "global_step": 108884, "epoch": 2592} {"train_loss": -6.407824516296387, "global_step": 108885, "epoch": 2592} {"train_loss": -6.451790809631348, "global_step": 108886, "epoch": 2592} {"train_loss": -6.3292155265808105, "global_step": 108887, "epoch": 2592} {"train_loss": -6.341896057128906, "global_step": 108888, "epoch": 2592} {"train_loss": -6.457643508911133, "global_step": 108889, "epoch": 2592} {"train_loss": -6.398285865783691, "global_step": 108890, "epoch": 2592} {"train_loss": -6.590765953063965, "global_step": 108891, "epoch": 2592} {"train_loss": -6.413626194000244, "global_step": 108892, "epoch": 2592} {"train_loss": -6.454398155212402, "global_step": 108893, "epoch": 2592} {"train_loss": -6.453782081604004, "global_step": 108894, "epoch": 2592} {"train_loss": -6.382133483886719, "global_step": 108895, "epoch": 2592} {"train_loss": -6.5957865715026855, "global_step": 108896, "epoch": 2592} {"train_loss": -6.470822334289551, "global_step": 108897, "epoch": 2592} {"train_loss": -6.43875789642334, "global_step": 108898, "epoch": 2592} {"train_loss": -6.43379020690918, "global_step": 108899, "epoch": 2592} {"train_loss": -6.483845233917236, "global_step": 108900, "epoch": 2592} {"train_loss": -6.585829257965088, "global_step": 108901, "epoch": 2592} {"train_loss": -6.455462455749512, "global_step": 108902, "epoch": 2592} {"train_loss": -6.4638519287109375, "global_step": 108903, "epoch": 2592} {"train_loss": -6.402172088623047, "global_step": 108904, "epoch": 2592} {"train_loss": -6.452296393258231, "global_step": 108905, "epoch": 2592, "val_loss": 64647.46875} {"train_loss": -6.540093898773193, "global_step": 108906, "epoch": 2593} {"train_loss": -6.353501796722412, "global_step": 108907, "epoch": 2593} {"train_loss": -6.402270317077637, "global_step": 108908, "epoch": 2593} {"train_loss": -6.57050895690918, "global_step": 108909, "epoch": 2593} {"train_loss": -6.42329740524292, "global_step": 108910, "epoch": 2593} {"train_loss": -6.332342147827148, "global_step": 108911, "epoch": 2593} {"train_loss": -6.515037536621094, "global_step": 108912, "epoch": 2593} {"train_loss": -6.409942150115967, "global_step": 108913, "epoch": 2593} {"train_loss": -6.359053611755371, "global_step": 108914, "epoch": 2593} {"train_loss": -6.46563720703125, "global_step": 108915, "epoch": 2593} {"train_loss": -6.4569573402404785, "global_step": 108916, "epoch": 2593} {"train_loss": -6.472578048706055, "global_step": 108917, "epoch": 2593} {"train_loss": -6.4323530197143555, "global_step": 108918, "epoch": 2593} {"train_loss": -6.463954925537109, "global_step": 108919, "epoch": 2593} {"train_loss": -6.485481262207031, "global_step": 108920, "epoch": 2593} {"train_loss": -6.399566650390625, "global_step": 108921, "epoch": 2593} {"train_loss": -6.343829154968262, "global_step": 108922, "epoch": 2593} {"train_loss": -6.450541973114014, "global_step": 108923, "epoch": 2593} {"train_loss": -6.509741306304932, "global_step": 108924, "epoch": 2593} {"train_loss": -6.450592041015625, "global_step": 108925, "epoch": 2593} {"train_loss": -6.411574363708496, "global_step": 108926, "epoch": 2593} {"train_loss": -6.482618808746338, "global_step": 108927, "epoch": 2593} {"train_loss": -6.4438910484313965, "global_step": 108928, "epoch": 2593} {"train_loss": -6.477533340454102, "global_step": 108929, "epoch": 2593} {"train_loss": -6.397162437438965, "global_step": 108930, "epoch": 2593} {"train_loss": -6.394840717315674, "global_step": 108931, "epoch": 2593} {"train_loss": -6.483536243438721, "global_step": 108932, "epoch": 2593} {"train_loss": -6.3518571853637695, "global_step": 108933, "epoch": 2593} {"train_loss": -6.295624256134033, "global_step": 108934, "epoch": 2593} {"train_loss": -6.534686088562012, "global_step": 108935, "epoch": 2593} {"train_loss": -6.305386543273926, "global_step": 108936, "epoch": 2593} {"train_loss": -6.519708633422852, "global_step": 108937, "epoch": 2593} {"train_loss": -6.534002304077148, "global_step": 108938, "epoch": 2593} {"train_loss": -6.195962905883789, "global_step": 108939, "epoch": 2593} {"train_loss": -6.4690327644348145, "global_step": 108940, "epoch": 2593} {"train_loss": -6.4191789627075195, "global_step": 108941, "epoch": 2593} {"train_loss": -6.3539018630981445, "global_step": 108942, "epoch": 2593} {"train_loss": -6.4862260818481445, "global_step": 108943, "epoch": 2593} {"train_loss": -6.388236045837402, "global_step": 108944, "epoch": 2593} {"train_loss": -6.393415451049805, "global_step": 108945, "epoch": 2593} {"train_loss": -6.322175979614258, "global_step": 108946, "epoch": 2593} {"train_loss": -6.424759376616705, "global_step": 108947, "epoch": 2593, "val_loss": 64720.1875} {"train_loss": -6.386700630187988, "global_step": 108948, "epoch": 2594} {"train_loss": -6.390828609466553, "global_step": 108949, "epoch": 2594} {"train_loss": -6.528940677642822, "global_step": 108950, "epoch": 2594} {"train_loss": -6.526172637939453, "global_step": 108951, "epoch": 2594} {"train_loss": -6.441376686096191, "global_step": 108952, "epoch": 2594} {"train_loss": -6.409773826599121, "global_step": 108953, "epoch": 2594} {"train_loss": -6.465987205505371, "global_step": 108954, "epoch": 2594} {"train_loss": -6.443752288818359, "global_step": 108955, "epoch": 2594} {"train_loss": -6.4755473136901855, "global_step": 108956, "epoch": 2594} {"train_loss": -6.411330223083496, "global_step": 108957, "epoch": 2594} {"train_loss": -6.445324897766113, "global_step": 108958, "epoch": 2594} {"train_loss": -6.64896821975708, "global_step": 108959, "epoch": 2594} {"train_loss": -6.345868110656738, "global_step": 108960, "epoch": 2594} {"train_loss": -6.410037040710449, "global_step": 108961, "epoch": 2594} {"train_loss": -6.40740966796875, "global_step": 108962, "epoch": 2594} {"train_loss": -6.285183429718018, "global_step": 108963, "epoch": 2594} {"train_loss": -6.550618648529053, "global_step": 108964, "epoch": 2594} {"train_loss": -6.373074531555176, "global_step": 108965, "epoch": 2594} {"train_loss": -6.533308029174805, "global_step": 108966, "epoch": 2594} {"train_loss": -6.441232681274414, "global_step": 108967, "epoch": 2594} {"train_loss": -6.410210609436035, "global_step": 108968, "epoch": 2594} {"train_loss": -6.428044319152832, "global_step": 108969, "epoch": 2594} {"train_loss": -6.365543842315674, "global_step": 108970, "epoch": 2594} {"train_loss": -6.349341869354248, "global_step": 108971, "epoch": 2594} {"train_loss": -6.3839287757873535, "global_step": 108972, "epoch": 2594} {"train_loss": -6.482098579406738, "global_step": 108973, "epoch": 2594} {"train_loss": -6.450984001159668, "global_step": 108974, "epoch": 2594} {"train_loss": -6.478925704956055, "global_step": 108975, "epoch": 2594} {"train_loss": -6.495755672454834, "global_step": 108976, "epoch": 2594} {"train_loss": -6.459298610687256, "global_step": 108977, "epoch": 2594} {"train_loss": -6.479888439178467, "global_step": 108978, "epoch": 2594} {"train_loss": -6.391695022583008, "global_step": 108979, "epoch": 2594} {"train_loss": -6.427391529083252, "global_step": 108980, "epoch": 2594} {"train_loss": -6.461723327636719, "global_step": 108981, "epoch": 2594} {"train_loss": -6.334616661071777, "global_step": 108982, "epoch": 2594} {"train_loss": -6.495889186859131, "global_step": 108983, "epoch": 2594} {"train_loss": -6.305153846740723, "global_step": 108984, "epoch": 2594} {"train_loss": -6.398685455322266, "global_step": 108985, "epoch": 2594} {"train_loss": -6.44204044342041, "global_step": 108986, "epoch": 2594} {"train_loss": -6.4614787101745605, "global_step": 108987, "epoch": 2594} {"train_loss": -6.438821315765381, "global_step": 108988, "epoch": 2594} {"train_loss": -6.4322469007401235, "global_step": 108989, "epoch": 2594, "val_loss": 65026.5390625} {"train_loss": -6.456203460693359, "global_step": 108990, "epoch": 2595} {"train_loss": -6.395273208618164, "global_step": 108991, "epoch": 2595} {"train_loss": -6.511837005615234, "global_step": 108992, "epoch": 2595} {"train_loss": -6.40109395980835, "global_step": 108993, "epoch": 2595} {"train_loss": -6.370316028594971, "global_step": 108994, "epoch": 2595} {"train_loss": -6.440051078796387, "global_step": 108995, "epoch": 2595} {"train_loss": -6.3209428787231445, "global_step": 108996, "epoch": 2595} {"train_loss": -6.279178619384766, "global_step": 108997, "epoch": 2595} {"train_loss": -6.465911388397217, "global_step": 108998, "epoch": 2595} {"train_loss": -6.287047386169434, "global_step": 108999, "epoch": 2595} {"train_loss": -6.328492641448975, "global_step": 109000, "epoch": 2595} {"train_loss": -6.481922149658203, "global_step": 109001, "epoch": 2595} {"train_loss": -6.379094123840332, "global_step": 109002, "epoch": 2595} {"train_loss": -6.467935562133789, "global_step": 109003, "epoch": 2595} {"train_loss": -6.249695777893066, "global_step": 109004, "epoch": 2595} {"train_loss": -6.411054611206055, "global_step": 109005, "epoch": 2595} {"train_loss": -6.354918956756592, "global_step": 109006, "epoch": 2595} {"train_loss": -6.3825483322143555, "global_step": 109007, "epoch": 2595} {"train_loss": -6.378037452697754, "global_step": 109008, "epoch": 2595} {"train_loss": -6.490956783294678, "global_step": 109009, "epoch": 2595} {"train_loss": -6.280726432800293, "global_step": 109010, "epoch": 2595} {"train_loss": -6.4772491455078125, "global_step": 109011, "epoch": 2595} {"train_loss": -6.365750789642334, "global_step": 109012, "epoch": 2595} {"train_loss": -6.4528303146362305, "global_step": 109013, "epoch": 2595} {"train_loss": -6.491735458374023, "global_step": 109014, "epoch": 2595} {"train_loss": -6.445119857788086, "global_step": 109015, "epoch": 2595} {"train_loss": -6.298440933227539, "global_step": 109016, "epoch": 2595} {"train_loss": -6.425535202026367, "global_step": 109017, "epoch": 2595} {"train_loss": -6.424622535705566, "global_step": 109018, "epoch": 2595} {"train_loss": -6.350028991699219, "global_step": 109019, "epoch": 2595} {"train_loss": -6.4824628829956055, "global_step": 109020, "epoch": 2595} {"train_loss": -6.471722602844238, "global_step": 109021, "epoch": 2595} {"train_loss": -6.373341083526611, "global_step": 109022, "epoch": 2595} {"train_loss": -6.336568355560303, "global_step": 109023, "epoch": 2595} {"train_loss": -6.477145195007324, "global_step": 109024, "epoch": 2595} {"train_loss": -6.39537239074707, "global_step": 109025, "epoch": 2595} {"train_loss": -6.391397476196289, "global_step": 109026, "epoch": 2595} {"train_loss": -6.520175933837891, "global_step": 109027, "epoch": 2595} {"train_loss": -6.583621978759766, "global_step": 109028, "epoch": 2595} {"train_loss": -6.514122009277344, "global_step": 109029, "epoch": 2595} {"train_loss": -6.427163124084473, "global_step": 109030, "epoch": 2595} {"train_loss": -6.413683085214524, "global_step": 109031, "epoch": 2595, "val_loss": 65023.640625} {"train_loss": -6.5422563552856445, "global_step": 109032, "epoch": 2596} {"train_loss": -6.49100399017334, "global_step": 109033, "epoch": 2596} {"train_loss": -6.520050048828125, "global_step": 109034, "epoch": 2596} {"train_loss": -6.44102668762207, "global_step": 109035, "epoch": 2596} {"train_loss": -6.442498683929443, "global_step": 109036, "epoch": 2596} {"train_loss": -6.416337013244629, "global_step": 109037, "epoch": 2596} {"train_loss": -6.56733512878418, "global_step": 109038, "epoch": 2596} {"train_loss": -6.505547523498535, "global_step": 109039, "epoch": 2596} {"train_loss": -6.323604106903076, "global_step": 109040, "epoch": 2596} {"train_loss": -6.5097432136535645, "global_step": 109041, "epoch": 2596} {"train_loss": -6.4770827293396, "global_step": 109042, "epoch": 2596} {"train_loss": -6.4880452156066895, "global_step": 109043, "epoch": 2596} {"train_loss": -6.474870204925537, "global_step": 109044, "epoch": 2596} {"train_loss": -6.3741350173950195, "global_step": 109045, "epoch": 2596} {"train_loss": -6.535493850708008, "global_step": 109046, "epoch": 2596} {"train_loss": -6.4396491050720215, "global_step": 109047, "epoch": 2596} {"train_loss": -6.4328765869140625, "global_step": 109048, "epoch": 2596} {"train_loss": -6.495491981506348, "global_step": 109049, "epoch": 2596} {"train_loss": -6.377349853515625, "global_step": 109050, "epoch": 2596} {"train_loss": -6.396002769470215, "global_step": 109051, "epoch": 2596} {"train_loss": -6.457561492919922, "global_step": 109052, "epoch": 2596} {"train_loss": -6.514074802398682, "global_step": 109053, "epoch": 2596} {"train_loss": -6.443933486938477, "global_step": 109054, "epoch": 2596} {"train_loss": -6.588992118835449, "global_step": 109055, "epoch": 2596} {"train_loss": -6.525657653808594, "global_step": 109056, "epoch": 2596} {"train_loss": -6.545131206512451, "global_step": 109057, "epoch": 2596} {"train_loss": -6.621280670166016, "global_step": 109058, "epoch": 2596} {"train_loss": -6.428463459014893, "global_step": 109059, "epoch": 2596} {"train_loss": -6.468705177307129, "global_step": 109060, "epoch": 2596} {"train_loss": -6.422573089599609, "global_step": 109061, "epoch": 2596} {"train_loss": -6.4554595947265625, "global_step": 109062, "epoch": 2596} {"train_loss": -6.483526229858398, "global_step": 109063, "epoch": 2596} {"train_loss": -6.51746940612793, "global_step": 109064, "epoch": 2596} {"train_loss": -6.496694564819336, "global_step": 109065, "epoch": 2596} {"train_loss": -6.534809112548828, "global_step": 109066, "epoch": 2596} {"train_loss": -6.465873718261719, "global_step": 109067, "epoch": 2596} {"train_loss": -6.559844017028809, "global_step": 109068, "epoch": 2596} {"train_loss": -6.495400905609131, "global_step": 109069, "epoch": 2596} {"train_loss": -6.51538610458374, "global_step": 109070, "epoch": 2596} {"train_loss": -6.494229316711426, "global_step": 109071, "epoch": 2596} {"train_loss": -6.534761905670166, "global_step": 109072, "epoch": 2596} {"train_loss": -6.484686351957775, "global_step": 109073, "epoch": 2596, "val_loss": 64755.21875} {"train_loss": -6.439621925354004, "global_step": 109074, "epoch": 2597} {"train_loss": -6.53776741027832, "global_step": 109075, "epoch": 2597} {"train_loss": -6.482945919036865, "global_step": 109076, "epoch": 2597} {"train_loss": -6.563216209411621, "global_step": 109077, "epoch": 2597} {"train_loss": -6.436139106750488, "global_step": 109078, "epoch": 2597} {"train_loss": -6.482426643371582, "global_step": 109079, "epoch": 2597} {"train_loss": -6.558495044708252, "global_step": 109080, "epoch": 2597} {"train_loss": -6.509308815002441, "global_step": 109081, "epoch": 2597} {"train_loss": -6.502985954284668, "global_step": 109082, "epoch": 2597} {"train_loss": -6.570509910583496, "global_step": 109083, "epoch": 2597} {"train_loss": -6.649064064025879, "global_step": 109084, "epoch": 2597} {"train_loss": -6.592101097106934, "global_step": 109085, "epoch": 2597} {"train_loss": -6.544194221496582, "global_step": 109086, "epoch": 2597} {"train_loss": -6.536327362060547, "global_step": 109087, "epoch": 2597} {"train_loss": -6.529730319976807, "global_step": 109088, "epoch": 2597} {"train_loss": -6.601191520690918, "global_step": 109089, "epoch": 2597} {"train_loss": -6.373086452484131, "global_step": 109090, "epoch": 2597} {"train_loss": -6.4874725341796875, "global_step": 109091, "epoch": 2597} {"train_loss": -6.581953048706055, "global_step": 109092, "epoch": 2597} {"train_loss": -6.542069911956787, "global_step": 109093, "epoch": 2597} {"train_loss": -6.455285549163818, "global_step": 109094, "epoch": 2597} {"train_loss": -6.553285598754883, "global_step": 109095, "epoch": 2597} {"train_loss": -6.479351043701172, "global_step": 109096, "epoch": 2597} {"train_loss": -6.504272937774658, "global_step": 109097, "epoch": 2597} {"train_loss": -6.419646263122559, "global_step": 109098, "epoch": 2597} {"train_loss": -6.499431610107422, "global_step": 109099, "epoch": 2597} {"train_loss": -6.462726593017578, "global_step": 109100, "epoch": 2597} {"train_loss": -6.459397315979004, "global_step": 109101, "epoch": 2597} {"train_loss": -6.52306604385376, "global_step": 109102, "epoch": 2597} {"train_loss": -6.453892230987549, "global_step": 109103, "epoch": 2597} {"train_loss": -6.463245391845703, "global_step": 109104, "epoch": 2597} {"train_loss": -6.48862361907959, "global_step": 109105, "epoch": 2597} {"train_loss": -6.543017387390137, "global_step": 109106, "epoch": 2597} {"train_loss": -6.384214401245117, "global_step": 109107, "epoch": 2597} {"train_loss": -6.573553085327148, "global_step": 109108, "epoch": 2597} {"train_loss": -6.479709148406982, "global_step": 109109, "epoch": 2597} {"train_loss": -6.420988082885742, "global_step": 109110, "epoch": 2597} {"train_loss": -6.60588264465332, "global_step": 109111, "epoch": 2597} {"train_loss": -6.436676025390625, "global_step": 109112, "epoch": 2597} {"train_loss": -6.480170249938965, "global_step": 109113, "epoch": 2597} {"train_loss": -6.470867156982422, "global_step": 109114, "epoch": 2597} {"train_loss": -6.501816431681315, "global_step": 109115, "epoch": 2597, "val_loss": 64827.26953125} {"train_loss": -6.5019145011901855, "global_step": 109116, "epoch": 2598} {"train_loss": -6.4388628005981445, "global_step": 109117, "epoch": 2598} {"train_loss": -6.476102828979492, "global_step": 109118, "epoch": 2598} {"train_loss": -6.456349849700928, "global_step": 109119, "epoch": 2598} {"train_loss": -6.5421037673950195, "global_step": 109120, "epoch": 2598} {"train_loss": -6.367208957672119, "global_step": 109121, "epoch": 2598} {"train_loss": -6.441648483276367, "global_step": 109122, "epoch": 2598} {"train_loss": -6.5627946853637695, "global_step": 109123, "epoch": 2598} {"train_loss": -6.504878997802734, "global_step": 109124, "epoch": 2598} {"train_loss": -6.502878189086914, "global_step": 109125, "epoch": 2598} {"train_loss": -6.518242835998535, "global_step": 109126, "epoch": 2598} {"train_loss": -6.486094951629639, "global_step": 109127, "epoch": 2598} {"train_loss": -6.420127868652344, "global_step": 109128, "epoch": 2598} {"train_loss": -6.543346881866455, "global_step": 109129, "epoch": 2598} {"train_loss": -6.4057841300964355, "global_step": 109130, "epoch": 2598} {"train_loss": -6.515273094177246, "global_step": 109131, "epoch": 2598} {"train_loss": -6.618834495544434, "global_step": 109132, "epoch": 2598} {"train_loss": -6.5364251136779785, "global_step": 109133, "epoch": 2598} {"train_loss": -6.5179948806762695, "global_step": 109134, "epoch": 2598} {"train_loss": -6.375593185424805, "global_step": 109135, "epoch": 2598} {"train_loss": -6.521810531616211, "global_step": 109136, "epoch": 2598} {"train_loss": -6.399563789367676, "global_step": 109137, "epoch": 2598} {"train_loss": -6.390256404876709, "global_step": 109138, "epoch": 2598} {"train_loss": -6.4112958908081055, "global_step": 109139, "epoch": 2598} {"train_loss": -6.495578289031982, "global_step": 109140, "epoch": 2598} {"train_loss": -6.435145854949951, "global_step": 109141, "epoch": 2598} {"train_loss": -6.530055046081543, "global_step": 109142, "epoch": 2598} {"train_loss": -6.6056623458862305, "global_step": 109143, "epoch": 2598} {"train_loss": -6.411224842071533, "global_step": 109144, "epoch": 2598} {"train_loss": -6.438913822174072, "global_step": 109145, "epoch": 2598} {"train_loss": -6.441429615020752, "global_step": 109146, "epoch": 2598} {"train_loss": -6.516156196594238, "global_step": 109147, "epoch": 2598} {"train_loss": -6.477473258972168, "global_step": 109148, "epoch": 2598} {"train_loss": -6.394108295440674, "global_step": 109149, "epoch": 2598} {"train_loss": -6.451554775238037, "global_step": 109150, "epoch": 2598} {"train_loss": -6.4595441818237305, "global_step": 109151, "epoch": 2598} {"train_loss": -6.567358016967773, "global_step": 109152, "epoch": 2598} {"train_loss": -6.438570976257324, "global_step": 109153, "epoch": 2598} {"train_loss": -6.3781585693359375, "global_step": 109154, "epoch": 2598} {"train_loss": -6.541365623474121, "global_step": 109155, "epoch": 2598} {"train_loss": -6.405964374542236, "global_step": 109156, "epoch": 2598} {"train_loss": -6.472523814155942, "global_step": 109157, "epoch": 2598, "val_loss": 64972.26953125} {"train_loss": -6.45551872253418, "global_step": 109158, "epoch": 2599} {"train_loss": -6.391781806945801, "global_step": 109159, "epoch": 2599} {"train_loss": -6.372656345367432, "global_step": 109160, "epoch": 2599} {"train_loss": -6.441819190979004, "global_step": 109161, "epoch": 2599} {"train_loss": -6.392788887023926, "global_step": 109162, "epoch": 2599} {"train_loss": -6.520185947418213, "global_step": 109163, "epoch": 2599} {"train_loss": -6.401980876922607, "global_step": 109164, "epoch": 2599} {"train_loss": -6.443785667419434, "global_step": 109165, "epoch": 2599} {"train_loss": -6.4911909103393555, "global_step": 109166, "epoch": 2599} {"train_loss": -6.329909801483154, "global_step": 109167, "epoch": 2599} {"train_loss": -6.472229957580566, "global_step": 109168, "epoch": 2599} {"train_loss": -6.453256607055664, "global_step": 109169, "epoch": 2599} {"train_loss": -6.457189559936523, "global_step": 109170, "epoch": 2599} {"train_loss": -6.461434364318848, "global_step": 109171, "epoch": 2599} {"train_loss": -6.472593307495117, "global_step": 109172, "epoch": 2599} {"train_loss": -6.568763732910156, "global_step": 109173, "epoch": 2599} {"train_loss": -6.546225547790527, "global_step": 109174, "epoch": 2599} {"train_loss": -6.535300254821777, "global_step": 109175, "epoch": 2599} {"train_loss": -6.471303939819336, "global_step": 109176, "epoch": 2599} {"train_loss": -6.475390434265137, "global_step": 109177, "epoch": 2599} {"train_loss": -6.460476875305176, "global_step": 109178, "epoch": 2599} {"train_loss": -6.464532375335693, "global_step": 109179, "epoch": 2599} {"train_loss": -6.459157943725586, "global_step": 109180, "epoch": 2599} {"train_loss": -6.4992523193359375, "global_step": 109181, "epoch": 2599} {"train_loss": -6.407290935516357, "global_step": 109182, "epoch": 2599} {"train_loss": -6.240569114685059, "global_step": 109183, "epoch": 2599} {"train_loss": -6.45003604888916, "global_step": 109184, "epoch": 2599} {"train_loss": -6.5034637451171875, "global_step": 109185, "epoch": 2599} {"train_loss": -6.470950603485107, "global_step": 109186, "epoch": 2599} {"train_loss": -6.394162654876709, "global_step": 109187, "epoch": 2599} {"train_loss": -6.3868088722229, "global_step": 109188, "epoch": 2599} {"train_loss": -6.398775100708008, "global_step": 109189, "epoch": 2599} {"train_loss": -6.413787841796875, "global_step": 109190, "epoch": 2599} {"train_loss": -6.453026294708252, "global_step": 109191, "epoch": 2599} {"train_loss": -6.531662464141846, "global_step": 109192, "epoch": 2599} {"train_loss": -6.344788551330566, "global_step": 109193, "epoch": 2599} {"train_loss": -6.394179821014404, "global_step": 109194, "epoch": 2599} {"train_loss": -6.366343975067139, "global_step": 109195, "epoch": 2599} {"train_loss": -6.438383102416992, "global_step": 109196, "epoch": 2599} {"train_loss": -6.531421661376953, "global_step": 109197, "epoch": 2599} {"train_loss": -6.530336380004883, "global_step": 109198, "epoch": 2599} {"train_loss": -6.446714957555135, "global_step": 109199, "epoch": 2599, "val_loss": 65221.76953125} {"train_loss": -6.444385051727295, "global_step": 109200, "epoch": 2600} {"train_loss": -6.475116729736328, "global_step": 109201, "epoch": 2600} {"train_loss": -6.3307342529296875, "global_step": 109202, "epoch": 2600} {"train_loss": -6.4867448806762695, "global_step": 109203, "epoch": 2600} {"train_loss": -6.4899067878723145, "global_step": 109204, "epoch": 2600} {"train_loss": -6.449026107788086, "global_step": 109205, "epoch": 2600} {"train_loss": -6.401410102844238, "global_step": 109206, "epoch": 2600} {"train_loss": -6.398128986358643, "global_step": 109207, "epoch": 2600} {"train_loss": -6.540994167327881, "global_step": 109208, "epoch": 2600} {"train_loss": -6.435122489929199, "global_step": 109209, "epoch": 2600} {"train_loss": -6.505788803100586, "global_step": 109210, "epoch": 2600} {"train_loss": -6.468628883361816, "global_step": 109211, "epoch": 2600} {"train_loss": -6.456595420837402, "global_step": 109212, "epoch": 2600} {"train_loss": -6.51097297668457, "global_step": 109213, "epoch": 2600} {"train_loss": -6.4936394691467285, "global_step": 109214, "epoch": 2600} {"train_loss": -6.390070915222168, "global_step": 109215, "epoch": 2600} {"train_loss": -6.485854148864746, "global_step": 109216, "epoch": 2600} {"train_loss": -6.498254776000977, "global_step": 109217, "epoch": 2600} {"train_loss": -6.511696815490723, "global_step": 109218, "epoch": 2600} {"train_loss": -6.472705841064453, "global_step": 109219, "epoch": 2600} {"train_loss": -6.475422382354736, "global_step": 109220, "epoch": 2600} {"train_loss": -6.47891902923584, "global_step": 109221, "epoch": 2600} {"train_loss": -6.469438076019287, "global_step": 109222, "epoch": 2600} {"train_loss": -6.4372429847717285, "global_step": 109223, "epoch": 2600} {"train_loss": -6.528312683105469, "global_step": 109224, "epoch": 2600} {"train_loss": -6.411794662475586, "global_step": 109225, "epoch": 2600} {"train_loss": -6.430697441101074, "global_step": 109226, "epoch": 2600} {"train_loss": -6.425942420959473, "global_step": 109227, "epoch": 2600} {"train_loss": -6.473573207855225, "global_step": 109228, "epoch": 2600} {"train_loss": -6.423327445983887, "global_step": 109229, "epoch": 2600} {"train_loss": -6.471208572387695, "global_step": 109230, "epoch": 2600} {"train_loss": -6.198702812194824, "global_step": 109231, "epoch": 2600} {"train_loss": -6.488912105560303, "global_step": 109232, "epoch": 2600} {"train_loss": -6.445008277893066, "global_step": 109233, "epoch": 2600} {"train_loss": -6.364612579345703, "global_step": 109234, "epoch": 2600} {"train_loss": -6.454366683959961, "global_step": 109235, "epoch": 2600} {"train_loss": -6.457577705383301, "global_step": 109236, "epoch": 2600} {"train_loss": -6.4879961013793945, "global_step": 109237, "epoch": 2600} {"train_loss": -6.53952693939209, "global_step": 109238, "epoch": 2600} {"train_loss": -6.464329719543457, "global_step": 109239, "epoch": 2600} {"train_loss": -6.458484172821045, "global_step": 109240, "epoch": 2600} {"train_loss": -6.456629071916852, "global_step": 109241, "epoch": 2600, "train/sim_max_reward_0": 0.1991785506736286, "train/sim_max_reward_1": 0.8637593776070972, "train/sim_max_reward_2": 0.9608119971583656, "train/sim_max_reward_3": 0.13795058176248118, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.8955658453742819, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5865143669308673, "test/sim_max_reward_4300002": 0.9612279829464985, "test/sim_max_reward_4300003": 0.9949761197747982, "test/sim_max_reward_4300004": 0.3332162275941879, "test/sim_max_reward_4300005": 0.9984709019986708, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.29389785563994514, "test/sim_max_reward_4300008": 0.9257020856024085, "test/sim_max_reward_4300009": 0.9887347520114103, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9708103775095278, "test/sim_max_reward_4300012": 0.9104198858304609, "test/sim_max_reward_4300013": 0.40576652993233037, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9830018230762636, "test/sim_max_reward_4300016": 1.0, "test/sim_max_reward_4300017": 0.9722452596971026, "test/sim_max_reward_4300018": 0.9326322227989536, "test/sim_max_reward_4300019": 0.18336971762867632, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.948118859297155, "test/sim_max_reward_4300022": 0.8913244985208486, "test/sim_max_reward_4300023": 0.886793879942847, "test/sim_max_reward_4300024": 0.8202038291034255, "test/sim_max_reward_4300025": 0.9099020674718621, "test/sim_max_reward_4300026": 0.9768726050154585, "test/sim_max_reward_4300027": 0.9394816208948188, "test/sim_max_reward_4300028": 0.9088913133081823, "test/sim_max_reward_4300029": 0.8065323597385553, "test/sim_max_reward_4300030": 0.09423920333453928, "test/sim_max_reward_4300031": 0.2204106801328182, "test/sim_max_reward_4300032": 0.9128837980219141, "test/sim_max_reward_4300033": 0.6949975964558234, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.8966622957019599, "test/sim_max_reward_4300036": 0.19920139830616873, "test/sim_max_reward_4300037": 0.9188260022044605, "test/sim_max_reward_4300038": 0.5656280224232354, "test/sim_max_reward_4300039": 0.9368102422642756, "test/sim_max_reward_4300040": 0.9231004211348017, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.9577951692138752, "test/sim_max_reward_4300043": 0.1401048407555109, "test/sim_max_reward_4300044": 0.9194331918745945, "test/sim_max_reward_4300045": 0.9533786804260176, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.14257641390813647, "test/sim_max_reward_4300048": 1.0, "test/sim_max_reward_4300049": 0.2550843332625472, "train/mean_score": 0.6762110587626425, "test/mean_score": 0.6652047886337187, "val_loss": 64819.140625} {"train_loss": -6.3982744216918945, "global_step": 109242, "epoch": 2601} {"train_loss": -6.501121997833252, "global_step": 109243, "epoch": 2601} {"train_loss": -6.435483455657959, "global_step": 109244, "epoch": 2601} {"train_loss": -6.486485004425049, "global_step": 109245, "epoch": 2601} {"train_loss": -6.497663497924805, "global_step": 109246, "epoch": 2601} {"train_loss": -6.460538864135742, "global_step": 109247, "epoch": 2601} {"train_loss": -6.455824375152588, "global_step": 109248, "epoch": 2601} {"train_loss": -6.452199935913086, "global_step": 109249, "epoch": 2601} {"train_loss": -6.50652551651001, "global_step": 109250, "epoch": 2601} {"train_loss": -6.5598859786987305, "global_step": 109251, "epoch": 2601} {"train_loss": -6.513376712799072, "global_step": 109252, "epoch": 2601} {"train_loss": -6.487130641937256, "global_step": 109253, "epoch": 2601} {"train_loss": -6.485149383544922, "global_step": 109254, "epoch": 2601} {"train_loss": -6.443417072296143, "global_step": 109255, "epoch": 2601} {"train_loss": -6.5086350440979, "global_step": 109256, "epoch": 2601} {"train_loss": -6.484119415283203, "global_step": 109257, "epoch": 2601} {"train_loss": -6.480412483215332, "global_step": 109258, "epoch": 2601} {"train_loss": -6.430712699890137, "global_step": 109259, "epoch": 2601} {"train_loss": -6.5547380447387695, "global_step": 109260, "epoch": 2601} {"train_loss": -6.546838283538818, "global_step": 109261, "epoch": 2601} {"train_loss": -6.407801151275635, "global_step": 109262, "epoch": 2601} {"train_loss": -6.538697242736816, "global_step": 109263, "epoch": 2601} {"train_loss": -6.484140872955322, "global_step": 109264, "epoch": 2601} {"train_loss": -6.428037643432617, "global_step": 109265, "epoch": 2601} {"train_loss": -6.457525253295898, "global_step": 109266, "epoch": 2601} {"train_loss": -6.501378059387207, "global_step": 109267, "epoch": 2601} {"train_loss": -6.512696266174316, "global_step": 109268, "epoch": 2601} {"train_loss": -6.537568092346191, "global_step": 109269, "epoch": 2601} {"train_loss": -6.498715400695801, "global_step": 109270, "epoch": 2601} {"train_loss": -6.478034019470215, "global_step": 109271, "epoch": 2601} {"train_loss": -6.53288459777832, "global_step": 109272, "epoch": 2601} {"train_loss": -6.313169479370117, "global_step": 109273, "epoch": 2601} {"train_loss": -6.568099021911621, "global_step": 109274, "epoch": 2601} {"train_loss": -6.5317816734313965, "global_step": 109275, "epoch": 2601} {"train_loss": -6.51035213470459, "global_step": 109276, "epoch": 2601} {"train_loss": -6.44218635559082, "global_step": 109277, "epoch": 2601} {"train_loss": -6.454866886138916, "global_step": 109278, "epoch": 2601} {"train_loss": -6.53288459777832, "global_step": 109279, "epoch": 2601} {"train_loss": -6.551592826843262, "global_step": 109280, "epoch": 2601} {"train_loss": -6.490743637084961, "global_step": 109281, "epoch": 2601} {"train_loss": -6.468223571777344, "global_step": 109282, "epoch": 2601} {"train_loss": -6.486019861130488, "global_step": 109283, "epoch": 2601, "val_loss": 64863.28125} {"train_loss": -6.539755821228027, "global_step": 109284, "epoch": 2602} {"train_loss": -6.408997058868408, "global_step": 109285, "epoch": 2602} {"train_loss": -6.355340003967285, "global_step": 109286, "epoch": 2602} {"train_loss": -6.302638053894043, "global_step": 109287, "epoch": 2602} {"train_loss": -6.422610282897949, "global_step": 109288, "epoch": 2602} {"train_loss": -6.480986595153809, "global_step": 109289, "epoch": 2602} {"train_loss": -6.502871513366699, "global_step": 109290, "epoch": 2602} {"train_loss": -6.340289115905762, "global_step": 109291, "epoch": 2602} {"train_loss": -6.42172908782959, "global_step": 109292, "epoch": 2602} {"train_loss": -6.479009628295898, "global_step": 109293, "epoch": 2602} {"train_loss": -6.376613616943359, "global_step": 109294, "epoch": 2602} {"train_loss": -6.449096202850342, "global_step": 109295, "epoch": 2602} {"train_loss": -6.438155174255371, "global_step": 109296, "epoch": 2602} {"train_loss": -6.515264511108398, "global_step": 109297, "epoch": 2602} {"train_loss": -6.43607234954834, "global_step": 109298, "epoch": 2602} {"train_loss": -6.47041130065918, "global_step": 109299, "epoch": 2602} {"train_loss": -6.543278217315674, "global_step": 109300, "epoch": 2602} {"train_loss": -6.487888336181641, "global_step": 109301, "epoch": 2602} {"train_loss": -6.517492294311523, "global_step": 109302, "epoch": 2602} {"train_loss": -6.515925407409668, "global_step": 109303, "epoch": 2602} {"train_loss": -6.507305145263672, "global_step": 109304, "epoch": 2602} {"train_loss": -6.578771591186523, "global_step": 109305, "epoch": 2602} {"train_loss": -6.498450756072998, "global_step": 109306, "epoch": 2602} {"train_loss": -6.534126281738281, "global_step": 109307, "epoch": 2602} {"train_loss": -6.50437593460083, "global_step": 109308, "epoch": 2602} {"train_loss": -6.51170539855957, "global_step": 109309, "epoch": 2602} {"train_loss": -6.476998329162598, "global_step": 109310, "epoch": 2602} {"train_loss": -6.3934326171875, "global_step": 109311, "epoch": 2602} {"train_loss": -6.408500671386719, "global_step": 109312, "epoch": 2602} {"train_loss": -6.473939418792725, "global_step": 109313, "epoch": 2602} {"train_loss": -6.567008972167969, "global_step": 109314, "epoch": 2602} {"train_loss": -6.572073936462402, "global_step": 109315, "epoch": 2602} {"train_loss": -6.425271987915039, "global_step": 109316, "epoch": 2602} {"train_loss": -6.491533279418945, "global_step": 109317, "epoch": 2602} {"train_loss": -6.373430252075195, "global_step": 109318, "epoch": 2602} {"train_loss": -6.516990661621094, "global_step": 109319, "epoch": 2602} {"train_loss": -6.441810607910156, "global_step": 109320, "epoch": 2602} {"train_loss": -6.531771659851074, "global_step": 109321, "epoch": 2602} {"train_loss": -6.439711570739746, "global_step": 109322, "epoch": 2602} {"train_loss": -6.459189414978027, "global_step": 109323, "epoch": 2602} {"train_loss": -6.470660209655762, "global_step": 109324, "epoch": 2602} {"train_loss": -6.470272563752674, "global_step": 109325, "epoch": 2602, "val_loss": 64879.47265625} {"train_loss": -6.528076171875, "global_step": 109326, "epoch": 2603} {"train_loss": -6.367031574249268, "global_step": 109327, "epoch": 2603} {"train_loss": -6.599428653717041, "global_step": 109328, "epoch": 2603} {"train_loss": -6.435380458831787, "global_step": 109329, "epoch": 2603} {"train_loss": -6.522025108337402, "global_step": 109330, "epoch": 2603} {"train_loss": -6.641086578369141, "global_step": 109331, "epoch": 2603} {"train_loss": -6.494274616241455, "global_step": 109332, "epoch": 2603} {"train_loss": -6.464210510253906, "global_step": 109333, "epoch": 2603} {"train_loss": -6.561567306518555, "global_step": 109334, "epoch": 2603} {"train_loss": -6.442022323608398, "global_step": 109335, "epoch": 2603} {"train_loss": -6.497308731079102, "global_step": 109336, "epoch": 2603} {"train_loss": -6.595919609069824, "global_step": 109337, "epoch": 2603} {"train_loss": -6.511634826660156, "global_step": 109338, "epoch": 2603} {"train_loss": -6.427222728729248, "global_step": 109339, "epoch": 2603} {"train_loss": -6.557031631469727, "global_step": 109340, "epoch": 2603} {"train_loss": -6.503754615783691, "global_step": 109341, "epoch": 2603} {"train_loss": -6.440434455871582, "global_step": 109342, "epoch": 2603} {"train_loss": -6.51563835144043, "global_step": 109343, "epoch": 2603} {"train_loss": -6.388178825378418, "global_step": 109344, "epoch": 2603} {"train_loss": -6.556428909301758, "global_step": 109345, "epoch": 2603} {"train_loss": -6.374256610870361, "global_step": 109346, "epoch": 2603} {"train_loss": -6.394924640655518, "global_step": 109347, "epoch": 2603} {"train_loss": -6.381918430328369, "global_step": 109348, "epoch": 2603} {"train_loss": -6.419835567474365, "global_step": 109349, "epoch": 2603} {"train_loss": -6.505138397216797, "global_step": 109350, "epoch": 2603} {"train_loss": -6.645412445068359, "global_step": 109351, "epoch": 2603} {"train_loss": -6.493216514587402, "global_step": 109352, "epoch": 2603} {"train_loss": -6.486312389373779, "global_step": 109353, "epoch": 2603} {"train_loss": -6.523371696472168, "global_step": 109354, "epoch": 2603} {"train_loss": -6.563567638397217, "global_step": 109355, "epoch": 2603} {"train_loss": -6.525118350982666, "global_step": 109356, "epoch": 2603} {"train_loss": -6.582681655883789, "global_step": 109357, "epoch": 2603} {"train_loss": -6.469602584838867, "global_step": 109358, "epoch": 2603} {"train_loss": -6.524331092834473, "global_step": 109359, "epoch": 2603} {"train_loss": -6.495283126831055, "global_step": 109360, "epoch": 2603} {"train_loss": -6.460930347442627, "global_step": 109361, "epoch": 2603} {"train_loss": -6.5155181884765625, "global_step": 109362, "epoch": 2603} {"train_loss": -6.461203098297119, "global_step": 109363, "epoch": 2603} {"train_loss": -6.433378219604492, "global_step": 109364, "epoch": 2603} {"train_loss": -6.340400218963623, "global_step": 109365, "epoch": 2603} {"train_loss": -6.479756832122803, "global_step": 109366, "epoch": 2603} {"train_loss": -6.4877148015158514, "global_step": 109367, "epoch": 2603, "val_loss": 64890.34375} {"train_loss": -6.41367769241333, "global_step": 109368, "epoch": 2604} {"train_loss": -6.504506587982178, "global_step": 109369, "epoch": 2604} {"train_loss": -6.394223213195801, "global_step": 109370, "epoch": 2604} {"train_loss": -6.424149513244629, "global_step": 109371, "epoch": 2604} {"train_loss": -6.475445747375488, "global_step": 109372, "epoch": 2604} {"train_loss": -6.497133255004883, "global_step": 109373, "epoch": 2604} {"train_loss": -6.398900032043457, "global_step": 109374, "epoch": 2604} {"train_loss": -6.397729873657227, "global_step": 109375, "epoch": 2604} {"train_loss": -6.436709403991699, "global_step": 109376, "epoch": 2604} {"train_loss": -6.500878810882568, "global_step": 109377, "epoch": 2604} {"train_loss": -6.451231956481934, "global_step": 109378, "epoch": 2604} {"train_loss": -6.402459144592285, "global_step": 109379, "epoch": 2604} {"train_loss": -6.536609649658203, "global_step": 109380, "epoch": 2604} {"train_loss": -6.41803503036499, "global_step": 109381, "epoch": 2604} {"train_loss": -6.461780548095703, "global_step": 109382, "epoch": 2604} {"train_loss": -6.475337982177734, "global_step": 109383, "epoch": 2604} {"train_loss": -6.467935562133789, "global_step": 109384, "epoch": 2604} {"train_loss": -6.446778297424316, "global_step": 109385, "epoch": 2604} {"train_loss": -6.549715995788574, "global_step": 109386, "epoch": 2604} {"train_loss": -6.495357513427734, "global_step": 109387, "epoch": 2604} {"train_loss": -6.406856536865234, "global_step": 109388, "epoch": 2604} {"train_loss": -6.458723068237305, "global_step": 109389, "epoch": 2604} {"train_loss": -6.444314002990723, "global_step": 109390, "epoch": 2604} {"train_loss": -6.562758445739746, "global_step": 109391, "epoch": 2604} {"train_loss": -6.568844795227051, "global_step": 109392, "epoch": 2604} {"train_loss": -6.468177795410156, "global_step": 109393, "epoch": 2604} {"train_loss": -6.484017372131348, "global_step": 109394, "epoch": 2604} {"train_loss": -6.434015274047852, "global_step": 109395, "epoch": 2604} {"train_loss": -6.574673175811768, "global_step": 109396, "epoch": 2604} {"train_loss": -6.502377510070801, "global_step": 109397, "epoch": 2604} {"train_loss": -6.437380313873291, "global_step": 109398, "epoch": 2604} {"train_loss": -6.390423774719238, "global_step": 109399, "epoch": 2604} {"train_loss": -6.414356231689453, "global_step": 109400, "epoch": 2604} {"train_loss": -6.39150333404541, "global_step": 109401, "epoch": 2604} {"train_loss": -6.439873695373535, "global_step": 109402, "epoch": 2604} {"train_loss": -6.347298622131348, "global_step": 109403, "epoch": 2604} {"train_loss": -6.469582557678223, "global_step": 109404, "epoch": 2604} {"train_loss": -6.427187442779541, "global_step": 109405, "epoch": 2604} {"train_loss": -6.544547080993652, "global_step": 109406, "epoch": 2604} {"train_loss": -6.435968399047852, "global_step": 109407, "epoch": 2604} {"train_loss": -6.451555252075195, "global_step": 109408, "epoch": 2604} {"train_loss": -6.457844790958223, "global_step": 109409, "epoch": 2604, "val_loss": 64809.62109375} {"train_loss": -6.434016704559326, "global_step": 109410, "epoch": 2605} {"train_loss": -6.38958740234375, "global_step": 109411, "epoch": 2605} {"train_loss": -6.42398738861084, "global_step": 109412, "epoch": 2605} {"train_loss": -6.498212814331055, "global_step": 109413, "epoch": 2605} {"train_loss": -6.433980464935303, "global_step": 109414, "epoch": 2605} {"train_loss": -6.50931453704834, "global_step": 109415, "epoch": 2605} {"train_loss": -6.585320949554443, "global_step": 109416, "epoch": 2605} {"train_loss": -6.581860542297363, "global_step": 109417, "epoch": 2605} {"train_loss": -6.400422096252441, "global_step": 109418, "epoch": 2605} {"train_loss": -6.5193681716918945, "global_step": 109419, "epoch": 2605} {"train_loss": -6.506825923919678, "global_step": 109420, "epoch": 2605} {"train_loss": -6.401819705963135, "global_step": 109421, "epoch": 2605} {"train_loss": -6.503763198852539, "global_step": 109422, "epoch": 2605} {"train_loss": -6.42580509185791, "global_step": 109423, "epoch": 2605} {"train_loss": -6.465740203857422, "global_step": 109424, "epoch": 2605} {"train_loss": -6.383086681365967, "global_step": 109425, "epoch": 2605} {"train_loss": -6.237584114074707, "global_step": 109426, "epoch": 2605} {"train_loss": -6.504328727722168, "global_step": 109427, "epoch": 2605} {"train_loss": -6.305426597595215, "global_step": 109428, "epoch": 2605} {"train_loss": -6.361108303070068, "global_step": 109429, "epoch": 2605} {"train_loss": -6.370992183685303, "global_step": 109430, "epoch": 2605} {"train_loss": -6.2563323974609375, "global_step": 109431, "epoch": 2605} {"train_loss": -6.368792533874512, "global_step": 109432, "epoch": 2605} {"train_loss": -6.349156379699707, "global_step": 109433, "epoch": 2605} {"train_loss": -6.35225248336792, "global_step": 109434, "epoch": 2605} {"train_loss": -6.377353668212891, "global_step": 109435, "epoch": 2605} {"train_loss": -6.293665885925293, "global_step": 109436, "epoch": 2605} {"train_loss": -6.3069047927856445, "global_step": 109437, "epoch": 2605} {"train_loss": -6.388161659240723, "global_step": 109438, "epoch": 2605} {"train_loss": -6.374406814575195, "global_step": 109439, "epoch": 2605} {"train_loss": -6.243617057800293, "global_step": 109440, "epoch": 2605} {"train_loss": -6.453107833862305, "global_step": 109441, "epoch": 2605} {"train_loss": -6.3958821296691895, "global_step": 109442, "epoch": 2605} {"train_loss": -6.279053688049316, "global_step": 109443, "epoch": 2605} {"train_loss": -6.34197998046875, "global_step": 109444, "epoch": 2605} {"train_loss": -6.38087797164917, "global_step": 109445, "epoch": 2605} {"train_loss": -6.480161666870117, "global_step": 109446, "epoch": 2605} {"train_loss": -6.360417366027832, "global_step": 109447, "epoch": 2605} {"train_loss": -6.366672515869141, "global_step": 109448, "epoch": 2605} {"train_loss": -6.304686546325684, "global_step": 109449, "epoch": 2605} {"train_loss": -6.361138820648193, "global_step": 109450, "epoch": 2605} {"train_loss": -6.395621583575294, "global_step": 109451, "epoch": 2605, "val_loss": 64961.98046875} {"train_loss": -6.4353227615356445, "global_step": 109452, "epoch": 2606} {"train_loss": -6.435820579528809, "global_step": 109453, "epoch": 2606} {"train_loss": -6.465907096862793, "global_step": 109454, "epoch": 2606} {"train_loss": -6.3961286544799805, "global_step": 109455, "epoch": 2606} {"train_loss": -6.411961078643799, "global_step": 109456, "epoch": 2606} {"train_loss": -6.462104320526123, "global_step": 109457, "epoch": 2606} {"train_loss": -6.464240074157715, "global_step": 109458, "epoch": 2606} {"train_loss": -6.435835838317871, "global_step": 109459, "epoch": 2606} {"train_loss": -6.418295860290527, "global_step": 109460, "epoch": 2606} {"train_loss": -6.463850498199463, "global_step": 109461, "epoch": 2606} {"train_loss": -6.518680572509766, "global_step": 109462, "epoch": 2606} {"train_loss": -6.593350410461426, "global_step": 109463, "epoch": 2606} {"train_loss": -6.5190205574035645, "global_step": 109464, "epoch": 2606} {"train_loss": -6.3925981521606445, "global_step": 109465, "epoch": 2606} {"train_loss": -6.438839435577393, "global_step": 109466, "epoch": 2606} {"train_loss": -6.322579860687256, "global_step": 109467, "epoch": 2606} {"train_loss": -6.503907203674316, "global_step": 109468, "epoch": 2606} {"train_loss": -6.417731285095215, "global_step": 109469, "epoch": 2606} {"train_loss": -6.448758125305176, "global_step": 109470, "epoch": 2606} {"train_loss": -6.451447486877441, "global_step": 109471, "epoch": 2606} {"train_loss": -6.3104448318481445, "global_step": 109472, "epoch": 2606} {"train_loss": -6.394838809967041, "global_step": 109473, "epoch": 2606} {"train_loss": -6.508349895477295, "global_step": 109474, "epoch": 2606} {"train_loss": -6.424994468688965, "global_step": 109475, "epoch": 2606} {"train_loss": -6.498249053955078, "global_step": 109476, "epoch": 2606} {"train_loss": -6.4416046142578125, "global_step": 109477, "epoch": 2606} {"train_loss": -6.477906703948975, "global_step": 109478, "epoch": 2606} {"train_loss": -6.5433759689331055, "global_step": 109479, "epoch": 2606} {"train_loss": -6.554535388946533, "global_step": 109480, "epoch": 2606} {"train_loss": -6.547461986541748, "global_step": 109481, "epoch": 2606} {"train_loss": -6.432344436645508, "global_step": 109482, "epoch": 2606} {"train_loss": -6.58970308303833, "global_step": 109483, "epoch": 2606} {"train_loss": -6.459074020385742, "global_step": 109484, "epoch": 2606} {"train_loss": -6.445392608642578, "global_step": 109485, "epoch": 2606} {"train_loss": -6.550571441650391, "global_step": 109486, "epoch": 2606} {"train_loss": -6.549217700958252, "global_step": 109487, "epoch": 2606} {"train_loss": -6.501230239868164, "global_step": 109488, "epoch": 2606} {"train_loss": -6.506547927856445, "global_step": 109489, "epoch": 2606} {"train_loss": -6.673112869262695, "global_step": 109490, "epoch": 2606} {"train_loss": -6.595965385437012, "global_step": 109491, "epoch": 2606} {"train_loss": -6.550703048706055, "global_step": 109492, "epoch": 2606} {"train_loss": -6.480853262401762, "global_step": 109493, "epoch": 2606, "val_loss": 64872.3046875} {"train_loss": -6.452724456787109, "global_step": 109494, "epoch": 2607} {"train_loss": -6.537911415100098, "global_step": 109495, "epoch": 2607} {"train_loss": -6.491686820983887, "global_step": 109496, "epoch": 2607} {"train_loss": -6.406950950622559, "global_step": 109497, "epoch": 2607} {"train_loss": -6.5924224853515625, "global_step": 109498, "epoch": 2607} {"train_loss": -6.436413764953613, "global_step": 109499, "epoch": 2607} {"train_loss": -6.565803527832031, "global_step": 109500, "epoch": 2607} {"train_loss": -6.517403602600098, "global_step": 109501, "epoch": 2607} {"train_loss": -6.474401473999023, "global_step": 109502, "epoch": 2607} {"train_loss": -6.534601211547852, "global_step": 109503, "epoch": 2607} {"train_loss": -6.555986404418945, "global_step": 109504, "epoch": 2607} {"train_loss": -6.399313449859619, "global_step": 109505, "epoch": 2607} {"train_loss": -6.459296226501465, "global_step": 109506, "epoch": 2607} {"train_loss": -6.512503623962402, "global_step": 109507, "epoch": 2607} {"train_loss": -6.420948505401611, "global_step": 109508, "epoch": 2607} {"train_loss": -6.457645416259766, "global_step": 109509, "epoch": 2607} {"train_loss": -6.395516395568848, "global_step": 109510, "epoch": 2607} {"train_loss": -6.379751205444336, "global_step": 109511, "epoch": 2607} {"train_loss": -6.489874839782715, "global_step": 109512, "epoch": 2607} {"train_loss": -6.416633129119873, "global_step": 109513, "epoch": 2607} {"train_loss": -6.339939594268799, "global_step": 109514, "epoch": 2607} {"train_loss": -6.529058933258057, "global_step": 109515, "epoch": 2607} {"train_loss": -6.268660068511963, "global_step": 109516, "epoch": 2607} {"train_loss": -6.522987365722656, "global_step": 109517, "epoch": 2607} {"train_loss": -6.491718292236328, "global_step": 109518, "epoch": 2607} {"train_loss": -6.454848289489746, "global_step": 109519, "epoch": 2607} {"train_loss": -6.414928913116455, "global_step": 109520, "epoch": 2607} {"train_loss": -6.386063098907471, "global_step": 109521, "epoch": 2607} {"train_loss": -6.488842964172363, "global_step": 109522, "epoch": 2607} {"train_loss": -6.4237060546875, "global_step": 109523, "epoch": 2607} {"train_loss": -6.3299431800842285, "global_step": 109524, "epoch": 2607} {"train_loss": -6.406457901000977, "global_step": 109525, "epoch": 2607} {"train_loss": -6.465415000915527, "global_step": 109526, "epoch": 2607} {"train_loss": -6.3692121505737305, "global_step": 109527, "epoch": 2607} {"train_loss": -6.405500411987305, "global_step": 109528, "epoch": 2607} {"train_loss": -6.5579423904418945, "global_step": 109529, "epoch": 2607} {"train_loss": -6.496676921844482, "global_step": 109530, "epoch": 2607} {"train_loss": -6.5109357833862305, "global_step": 109531, "epoch": 2607} {"train_loss": -6.453119277954102, "global_step": 109532, "epoch": 2607} {"train_loss": -6.4581708908081055, "global_step": 109533, "epoch": 2607} {"train_loss": -6.634949684143066, "global_step": 109534, "epoch": 2607} {"train_loss": -6.459680920555478, "global_step": 109535, "epoch": 2607, "val_loss": 65017.4453125} {"train_loss": -6.490169525146484, "global_step": 109536, "epoch": 2608} {"train_loss": -6.450371742248535, "global_step": 109537, "epoch": 2608} {"train_loss": -6.468935012817383, "global_step": 109538, "epoch": 2608} {"train_loss": -6.411669731140137, "global_step": 109539, "epoch": 2608} {"train_loss": -6.422748565673828, "global_step": 109540, "epoch": 2608} {"train_loss": -6.4175519943237305, "global_step": 109541, "epoch": 2608} {"train_loss": -6.541982650756836, "global_step": 109542, "epoch": 2608} {"train_loss": -6.495844841003418, "global_step": 109543, "epoch": 2608} {"train_loss": -6.505974292755127, "global_step": 109544, "epoch": 2608} {"train_loss": -6.490621566772461, "global_step": 109545, "epoch": 2608} {"train_loss": -6.422998905181885, "global_step": 109546, "epoch": 2608} {"train_loss": -6.4505720138549805, "global_step": 109547, "epoch": 2608} {"train_loss": -6.4950127601623535, "global_step": 109548, "epoch": 2608} {"train_loss": -6.4626288414001465, "global_step": 109549, "epoch": 2608} {"train_loss": -6.523512840270996, "global_step": 109550, "epoch": 2608} {"train_loss": -6.658027648925781, "global_step": 109551, "epoch": 2608} {"train_loss": -6.664346694946289, "global_step": 109552, "epoch": 2608} {"train_loss": -6.428651809692383, "global_step": 109553, "epoch": 2608} {"train_loss": -6.521278381347656, "global_step": 109554, "epoch": 2608} {"train_loss": -6.48426628112793, "global_step": 109555, "epoch": 2608} {"train_loss": -6.495877265930176, "global_step": 109556, "epoch": 2608} {"train_loss": -6.461756706237793, "global_step": 109557, "epoch": 2608} {"train_loss": -6.4931793212890625, "global_step": 109558, "epoch": 2608} {"train_loss": -6.508759021759033, "global_step": 109559, "epoch": 2608} {"train_loss": -6.453705787658691, "global_step": 109560, "epoch": 2608} {"train_loss": -6.555244445800781, "global_step": 109561, "epoch": 2608} {"train_loss": -6.414000511169434, "global_step": 109562, "epoch": 2608} {"train_loss": -6.577378273010254, "global_step": 109563, "epoch": 2608} {"train_loss": -6.430882453918457, "global_step": 109564, "epoch": 2608} {"train_loss": -6.490825176239014, "global_step": 109565, "epoch": 2608} {"train_loss": -6.447430610656738, "global_step": 109566, "epoch": 2608} {"train_loss": -6.457977294921875, "global_step": 109567, "epoch": 2608} {"train_loss": -6.456925392150879, "global_step": 109568, "epoch": 2608} {"train_loss": -6.456880569458008, "global_step": 109569, "epoch": 2608} {"train_loss": -6.5917558670043945, "global_step": 109570, "epoch": 2608} {"train_loss": -6.508261680603027, "global_step": 109571, "epoch": 2608} {"train_loss": -6.455758571624756, "global_step": 109572, "epoch": 2608} {"train_loss": -6.5303754806518555, "global_step": 109573, "epoch": 2608} {"train_loss": -6.396282196044922, "global_step": 109574, "epoch": 2608} {"train_loss": -6.41709566116333, "global_step": 109575, "epoch": 2608} {"train_loss": -6.407658100128174, "global_step": 109576, "epoch": 2608} {"train_loss": -6.482141188212803, "global_step": 109577, "epoch": 2608, "val_loss": 64823.0625} {"train_loss": -6.513485908508301, "global_step": 109578, "epoch": 2609} {"train_loss": -6.49929666519165, "global_step": 109579, "epoch": 2609} {"train_loss": -6.484981536865234, "global_step": 109580, "epoch": 2609} {"train_loss": -6.4028730392456055, "global_step": 109581, "epoch": 2609} {"train_loss": -6.415355682373047, "global_step": 109582, "epoch": 2609} {"train_loss": -6.506363868713379, "global_step": 109583, "epoch": 2609} {"train_loss": -6.414620876312256, "global_step": 109584, "epoch": 2609} {"train_loss": -6.494702339172363, "global_step": 109585, "epoch": 2609} {"train_loss": -6.636557579040527, "global_step": 109586, "epoch": 2609} {"train_loss": -6.480746746063232, "global_step": 109587, "epoch": 2609} {"train_loss": -6.5051984786987305, "global_step": 109588, "epoch": 2609} {"train_loss": -6.5238356590271, "global_step": 109589, "epoch": 2609} {"train_loss": -6.405460357666016, "global_step": 109590, "epoch": 2609} {"train_loss": -6.682394504547119, "global_step": 109591, "epoch": 2609} {"train_loss": -6.483578681945801, "global_step": 109592, "epoch": 2609} {"train_loss": -6.4303364753723145, "global_step": 109593, "epoch": 2609} {"train_loss": -6.496115207672119, "global_step": 109594, "epoch": 2609} {"train_loss": -6.498189449310303, "global_step": 109595, "epoch": 2609} {"train_loss": -6.453374862670898, "global_step": 109596, "epoch": 2609} {"train_loss": -6.490144729614258, "global_step": 109597, "epoch": 2609} {"train_loss": -6.575593948364258, "global_step": 109598, "epoch": 2609} {"train_loss": -6.4008684158325195, "global_step": 109599, "epoch": 2609} {"train_loss": -6.501302242279053, "global_step": 109600, "epoch": 2609} {"train_loss": -6.5638108253479, "global_step": 109601, "epoch": 2609} {"train_loss": -6.476891040802002, "global_step": 109602, "epoch": 2609} {"train_loss": -6.495366096496582, "global_step": 109603, "epoch": 2609} {"train_loss": -6.457982063293457, "global_step": 109604, "epoch": 2609} {"train_loss": -6.45913553237915, "global_step": 109605, "epoch": 2609} {"train_loss": -6.492345809936523, "global_step": 109606, "epoch": 2609} {"train_loss": -6.530356407165527, "global_step": 109607, "epoch": 2609} {"train_loss": -6.412332534790039, "global_step": 109608, "epoch": 2609} {"train_loss": -6.563065528869629, "global_step": 109609, "epoch": 2609} {"train_loss": -6.566349029541016, "global_step": 109610, "epoch": 2609} {"train_loss": -6.53961181640625, "global_step": 109611, "epoch": 2609} {"train_loss": -6.526350498199463, "global_step": 109612, "epoch": 2609} {"train_loss": -6.439815521240234, "global_step": 109613, "epoch": 2609} {"train_loss": -6.506366729736328, "global_step": 109614, "epoch": 2609} {"train_loss": -6.491147994995117, "global_step": 109615, "epoch": 2609} {"train_loss": -6.613992691040039, "global_step": 109616, "epoch": 2609} {"train_loss": -6.582523822784424, "global_step": 109617, "epoch": 2609} {"train_loss": -6.472333908081055, "global_step": 109618, "epoch": 2609} {"train_loss": -6.49924651781718, "global_step": 109619, "epoch": 2609, "val_loss": 64960.8203125} {"train_loss": -6.547721862792969, "global_step": 109620, "epoch": 2610} {"train_loss": -6.445863246917725, "global_step": 109621, "epoch": 2610} {"train_loss": -6.370040416717529, "global_step": 109622, "epoch": 2610} {"train_loss": -6.574398994445801, "global_step": 109623, "epoch": 2610} {"train_loss": -6.516812324523926, "global_step": 109624, "epoch": 2610} {"train_loss": -6.475903034210205, "global_step": 109625, "epoch": 2610} {"train_loss": -6.451858043670654, "global_step": 109626, "epoch": 2610} {"train_loss": -6.502190589904785, "global_step": 109627, "epoch": 2610} {"train_loss": -6.470280647277832, "global_step": 109628, "epoch": 2610} {"train_loss": -6.3852362632751465, "global_step": 109629, "epoch": 2610} {"train_loss": -6.541623115539551, "global_step": 109630, "epoch": 2610} {"train_loss": -6.4913434982299805, "global_step": 109631, "epoch": 2610} {"train_loss": -6.355278968811035, "global_step": 109632, "epoch": 2610} {"train_loss": -6.528229236602783, "global_step": 109633, "epoch": 2610} {"train_loss": -6.317812919616699, "global_step": 109634, "epoch": 2610} {"train_loss": -6.400995254516602, "global_step": 109635, "epoch": 2610} {"train_loss": -6.497068405151367, "global_step": 109636, "epoch": 2610} {"train_loss": -6.384124755859375, "global_step": 109637, "epoch": 2610} {"train_loss": -6.424991607666016, "global_step": 109638, "epoch": 2610} {"train_loss": -6.455011367797852, "global_step": 109639, "epoch": 2610} {"train_loss": -6.41459846496582, "global_step": 109640, "epoch": 2610} {"train_loss": -6.4241557121276855, "global_step": 109641, "epoch": 2610} {"train_loss": -6.471951007843018, "global_step": 109642, "epoch": 2610} {"train_loss": -6.518477916717529, "global_step": 109643, "epoch": 2610} {"train_loss": -6.425230026245117, "global_step": 109644, "epoch": 2610} {"train_loss": -6.529797554016113, "global_step": 109645, "epoch": 2610} {"train_loss": -6.469405651092529, "global_step": 109646, "epoch": 2610} {"train_loss": -6.5177106857299805, "global_step": 109647, "epoch": 2610} {"train_loss": -6.569387912750244, "global_step": 109648, "epoch": 2610} {"train_loss": -6.428296089172363, "global_step": 109649, "epoch": 2610} {"train_loss": -6.4628143310546875, "global_step": 109650, "epoch": 2610} {"train_loss": -6.557466983795166, "global_step": 109651, "epoch": 2610} {"train_loss": -6.419042587280273, "global_step": 109652, "epoch": 2610} {"train_loss": -6.478677749633789, "global_step": 109653, "epoch": 2610} {"train_loss": -6.370465278625488, "global_step": 109654, "epoch": 2610} {"train_loss": -6.484450340270996, "global_step": 109655, "epoch": 2610} {"train_loss": -6.4287872314453125, "global_step": 109656, "epoch": 2610} {"train_loss": -6.321210861206055, "global_step": 109657, "epoch": 2610} {"train_loss": -6.459585666656494, "global_step": 109658, "epoch": 2610} {"train_loss": -6.490772247314453, "global_step": 109659, "epoch": 2610} {"train_loss": -6.366218090057373, "global_step": 109660, "epoch": 2610} {"train_loss": -6.459345442908151, "global_step": 109661, "epoch": 2610, "val_loss": 65040.65234375} {"train_loss": -6.573391914367676, "global_step": 109662, "epoch": 2611} {"train_loss": -6.510266304016113, "global_step": 109663, "epoch": 2611} {"train_loss": -6.489452362060547, "global_step": 109664, "epoch": 2611} {"train_loss": -6.516848564147949, "global_step": 109665, "epoch": 2611} {"train_loss": -6.51260232925415, "global_step": 109666, "epoch": 2611} {"train_loss": -6.422633647918701, "global_step": 109667, "epoch": 2611} {"train_loss": -6.562994956970215, "global_step": 109668, "epoch": 2611} {"train_loss": -6.542176246643066, "global_step": 109669, "epoch": 2611} {"train_loss": -6.436147689819336, "global_step": 109670, "epoch": 2611} {"train_loss": -6.432468891143799, "global_step": 109671, "epoch": 2611} {"train_loss": -6.50439453125, "global_step": 109672, "epoch": 2611} {"train_loss": -6.341753005981445, "global_step": 109673, "epoch": 2611} {"train_loss": -6.4343414306640625, "global_step": 109674, "epoch": 2611} {"train_loss": -6.545684337615967, "global_step": 109675, "epoch": 2611} {"train_loss": -6.504094123840332, "global_step": 109676, "epoch": 2611} {"train_loss": -6.381648540496826, "global_step": 109677, "epoch": 2611} {"train_loss": -6.466245651245117, "global_step": 109678, "epoch": 2611} {"train_loss": -6.5224714279174805, "global_step": 109679, "epoch": 2611} {"train_loss": -6.510091781616211, "global_step": 109680, "epoch": 2611} {"train_loss": -6.363850116729736, "global_step": 109681, "epoch": 2611} {"train_loss": -6.385544776916504, "global_step": 109682, "epoch": 2611} {"train_loss": -6.498534202575684, "global_step": 109683, "epoch": 2611} {"train_loss": -6.484604835510254, "global_step": 109684, "epoch": 2611} {"train_loss": -6.492236137390137, "global_step": 109685, "epoch": 2611} {"train_loss": -6.480129718780518, "global_step": 109686, "epoch": 2611} {"train_loss": -6.37045955657959, "global_step": 109687, "epoch": 2611} {"train_loss": -6.377575397491455, "global_step": 109688, "epoch": 2611} {"train_loss": -6.372530937194824, "global_step": 109689, "epoch": 2611} {"train_loss": -6.3730926513671875, "global_step": 109690, "epoch": 2611} {"train_loss": -6.407983303070068, "global_step": 109691, "epoch": 2611} {"train_loss": -6.559972763061523, "global_step": 109692, "epoch": 2611} {"train_loss": -6.3599958419799805, "global_step": 109693, "epoch": 2611} {"train_loss": -6.4484148025512695, "global_step": 109694, "epoch": 2611} {"train_loss": -6.53498649597168, "global_step": 109695, "epoch": 2611} {"train_loss": -6.441539764404297, "global_step": 109696, "epoch": 2611} {"train_loss": -6.426748275756836, "global_step": 109697, "epoch": 2611} {"train_loss": -6.378090858459473, "global_step": 109698, "epoch": 2611} {"train_loss": -6.484898567199707, "global_step": 109699, "epoch": 2611} {"train_loss": -6.377276420593262, "global_step": 109700, "epoch": 2611} {"train_loss": -6.461161136627197, "global_step": 109701, "epoch": 2611} {"train_loss": -6.325597763061523, "global_step": 109702, "epoch": 2611} {"train_loss": -6.4555009092603415, "global_step": 109703, "epoch": 2611, "val_loss": 64879.95703125} {"train_loss": -6.555889129638672, "global_step": 109704, "epoch": 2612} {"train_loss": -6.352068901062012, "global_step": 109705, "epoch": 2612} {"train_loss": -6.502081871032715, "global_step": 109706, "epoch": 2612} {"train_loss": -6.46547794342041, "global_step": 109707, "epoch": 2612} {"train_loss": -6.462034225463867, "global_step": 109708, "epoch": 2612} {"train_loss": -6.501477241516113, "global_step": 109709, "epoch": 2612} {"train_loss": -6.518062114715576, "global_step": 109710, "epoch": 2612} {"train_loss": -6.399072170257568, "global_step": 109711, "epoch": 2612} {"train_loss": -6.5342583656311035, "global_step": 109712, "epoch": 2612} {"train_loss": -6.384793281555176, "global_step": 109713, "epoch": 2612} {"train_loss": -6.480364799499512, "global_step": 109714, "epoch": 2612} {"train_loss": -6.443984031677246, "global_step": 109715, "epoch": 2612} {"train_loss": -6.4346537590026855, "global_step": 109716, "epoch": 2612} {"train_loss": -6.564305305480957, "global_step": 109717, "epoch": 2612} {"train_loss": -6.4627299308776855, "global_step": 109718, "epoch": 2612} {"train_loss": -6.525739669799805, "global_step": 109719, "epoch": 2612} {"train_loss": -6.419075965881348, "global_step": 109720, "epoch": 2612} {"train_loss": -6.5723981857299805, "global_step": 109721, "epoch": 2612} {"train_loss": -6.563145637512207, "global_step": 109722, "epoch": 2612} {"train_loss": -6.452846527099609, "global_step": 109723, "epoch": 2612} {"train_loss": -6.391952037811279, "global_step": 109724, "epoch": 2612} {"train_loss": -6.525489807128906, "global_step": 109725, "epoch": 2612} {"train_loss": -6.53571081161499, "global_step": 109726, "epoch": 2612} {"train_loss": -6.443820476531982, "global_step": 109727, "epoch": 2612} {"train_loss": -6.589076995849609, "global_step": 109728, "epoch": 2612} {"train_loss": -6.538657188415527, "global_step": 109729, "epoch": 2612} {"train_loss": -6.504309177398682, "global_step": 109730, "epoch": 2612} {"train_loss": -6.5179901123046875, "global_step": 109731, "epoch": 2612} {"train_loss": -6.440450191497803, "global_step": 109732, "epoch": 2612} {"train_loss": -6.275831699371338, "global_step": 109733, "epoch": 2612} {"train_loss": -6.428091049194336, "global_step": 109734, "epoch": 2612} {"train_loss": -6.495664596557617, "global_step": 109735, "epoch": 2612} {"train_loss": -6.453445911407471, "global_step": 109736, "epoch": 2612} {"train_loss": -6.369086742401123, "global_step": 109737, "epoch": 2612} {"train_loss": -6.410064697265625, "global_step": 109738, "epoch": 2612} {"train_loss": -6.476543426513672, "global_step": 109739, "epoch": 2612} {"train_loss": -6.350625991821289, "global_step": 109740, "epoch": 2612} {"train_loss": -6.411679267883301, "global_step": 109741, "epoch": 2612} {"train_loss": -6.451827526092529, "global_step": 109742, "epoch": 2612} {"train_loss": -6.346256732940674, "global_step": 109743, "epoch": 2612} {"train_loss": -6.485273361206055, "global_step": 109744, "epoch": 2612} {"train_loss": -6.462204308736892, "global_step": 109745, "epoch": 2612, "val_loss": 64921.25} {"train_loss": -6.49990177154541, "global_step": 109746, "epoch": 2613} {"train_loss": -6.418561935424805, "global_step": 109747, "epoch": 2613} {"train_loss": -6.428441524505615, "global_step": 109748, "epoch": 2613} {"train_loss": -6.479172229766846, "global_step": 109749, "epoch": 2613} {"train_loss": -6.414735317230225, "global_step": 109750, "epoch": 2613} {"train_loss": -6.338757514953613, "global_step": 109751, "epoch": 2613} {"train_loss": -6.449470520019531, "global_step": 109752, "epoch": 2613} {"train_loss": -6.3614912033081055, "global_step": 109753, "epoch": 2613} {"train_loss": -6.437306880950928, "global_step": 109754, "epoch": 2613} {"train_loss": -6.355220794677734, "global_step": 109755, "epoch": 2613} {"train_loss": -6.519381523132324, "global_step": 109756, "epoch": 2613} {"train_loss": -6.478373050689697, "global_step": 109757, "epoch": 2613} {"train_loss": -6.481455326080322, "global_step": 109758, "epoch": 2613} {"train_loss": -6.420964241027832, "global_step": 109759, "epoch": 2613} {"train_loss": -6.438362121582031, "global_step": 109760, "epoch": 2613} {"train_loss": -6.469447135925293, "global_step": 109761, "epoch": 2613} {"train_loss": -6.579390525817871, "global_step": 109762, "epoch": 2613} {"train_loss": -6.523400783538818, "global_step": 109763, "epoch": 2613} {"train_loss": -6.3803205490112305, "global_step": 109764, "epoch": 2613} {"train_loss": -6.4361982345581055, "global_step": 109765, "epoch": 2613} {"train_loss": -6.605589866638184, "global_step": 109766, "epoch": 2613} {"train_loss": -6.411190032958984, "global_step": 109767, "epoch": 2613} {"train_loss": -6.420304298400879, "global_step": 109768, "epoch": 2613} {"train_loss": -6.388462543487549, "global_step": 109769, "epoch": 2613} {"train_loss": -6.391110420227051, "global_step": 109770, "epoch": 2613} {"train_loss": -6.471172332763672, "global_step": 109771, "epoch": 2613} {"train_loss": -6.44903564453125, "global_step": 109772, "epoch": 2613} {"train_loss": -6.44420051574707, "global_step": 109773, "epoch": 2613} {"train_loss": -6.500589370727539, "global_step": 109774, "epoch": 2613} {"train_loss": -6.39508056640625, "global_step": 109775, "epoch": 2613} {"train_loss": -6.4938812255859375, "global_step": 109776, "epoch": 2613} {"train_loss": -6.470117568969727, "global_step": 109777, "epoch": 2613} {"train_loss": -6.4785475730896, "global_step": 109778, "epoch": 2613} {"train_loss": -6.457876205444336, "global_step": 109779, "epoch": 2613} {"train_loss": -6.475557804107666, "global_step": 109780, "epoch": 2613} {"train_loss": -6.450549125671387, "global_step": 109781, "epoch": 2613} {"train_loss": -6.526777267456055, "global_step": 109782, "epoch": 2613} {"train_loss": -6.3960676193237305, "global_step": 109783, "epoch": 2613} {"train_loss": -6.536761283874512, "global_step": 109784, "epoch": 2613} {"train_loss": -6.422881126403809, "global_step": 109785, "epoch": 2613} {"train_loss": -6.458582878112793, "global_step": 109786, "epoch": 2613} {"train_loss": -6.4528102193559915, "global_step": 109787, "epoch": 2613, "val_loss": 64966.66015625} {"train_loss": -6.381962776184082, "global_step": 109788, "epoch": 2614} {"train_loss": -6.368938446044922, "global_step": 109789, "epoch": 2614} {"train_loss": -6.51032829284668, "global_step": 109790, "epoch": 2614} {"train_loss": -6.382173538208008, "global_step": 109791, "epoch": 2614} {"train_loss": -6.6033806800842285, "global_step": 109792, "epoch": 2614} {"train_loss": -6.331419467926025, "global_step": 109793, "epoch": 2614} {"train_loss": -6.263100624084473, "global_step": 109794, "epoch": 2614} {"train_loss": -6.428794860839844, "global_step": 109795, "epoch": 2614} {"train_loss": -6.266393184661865, "global_step": 109796, "epoch": 2614} {"train_loss": -6.384864807128906, "global_step": 109797, "epoch": 2614} {"train_loss": -6.205366611480713, "global_step": 109798, "epoch": 2614} {"train_loss": -6.260279178619385, "global_step": 109799, "epoch": 2614} {"train_loss": -6.455738067626953, "global_step": 109800, "epoch": 2614} {"train_loss": -6.381000518798828, "global_step": 109801, "epoch": 2614} {"train_loss": -6.265295505523682, "global_step": 109802, "epoch": 2614} {"train_loss": -6.268647193908691, "global_step": 109803, "epoch": 2614} {"train_loss": -6.433046340942383, "global_step": 109804, "epoch": 2614} {"train_loss": -6.295619010925293, "global_step": 109805, "epoch": 2614} {"train_loss": -6.314160346984863, "global_step": 109806, "epoch": 2614} {"train_loss": -6.418826103210449, "global_step": 109807, "epoch": 2614} {"train_loss": -6.287027359008789, "global_step": 109808, "epoch": 2614} {"train_loss": -6.395838260650635, "global_step": 109809, "epoch": 2614} {"train_loss": -6.324336051940918, "global_step": 109810, "epoch": 2614} {"train_loss": -6.467606544494629, "global_step": 109811, "epoch": 2614} {"train_loss": -6.339942932128906, "global_step": 109812, "epoch": 2614} {"train_loss": -6.371252536773682, "global_step": 109813, "epoch": 2614} {"train_loss": -6.40316104888916, "global_step": 109814, "epoch": 2614} {"train_loss": -6.381142616271973, "global_step": 109815, "epoch": 2614} {"train_loss": -6.325153350830078, "global_step": 109816, "epoch": 2614} {"train_loss": -6.458727836608887, "global_step": 109817, "epoch": 2614} {"train_loss": -6.440038681030273, "global_step": 109818, "epoch": 2614} {"train_loss": -6.479240417480469, "global_step": 109819, "epoch": 2614} {"train_loss": -6.371844291687012, "global_step": 109820, "epoch": 2614} {"train_loss": -6.499311447143555, "global_step": 109821, "epoch": 2614} {"train_loss": -6.455446243286133, "global_step": 109822, "epoch": 2614} {"train_loss": -6.424856185913086, "global_step": 109823, "epoch": 2614} {"train_loss": -6.476255416870117, "global_step": 109824, "epoch": 2614} {"train_loss": -6.49620246887207, "global_step": 109825, "epoch": 2614} {"train_loss": -6.430951118469238, "global_step": 109826, "epoch": 2614} {"train_loss": -6.457232475280762, "global_step": 109827, "epoch": 2614} {"train_loss": -6.3331146240234375, "global_step": 109828, "epoch": 2614} {"train_loss": -6.389148235321045, "global_step": 109829, "epoch": 2614, "val_loss": 64866.0} {"train_loss": -6.426824569702148, "global_step": 109830, "epoch": 2615} {"train_loss": -6.514103889465332, "global_step": 109831, "epoch": 2615} {"train_loss": -6.402451038360596, "global_step": 109832, "epoch": 2615} {"train_loss": -6.385464191436768, "global_step": 109833, "epoch": 2615} {"train_loss": -6.4470014572143555, "global_step": 109834, "epoch": 2615} {"train_loss": -6.33900260925293, "global_step": 109835, "epoch": 2615} {"train_loss": -6.465517044067383, "global_step": 109836, "epoch": 2615} {"train_loss": -6.439576625823975, "global_step": 109837, "epoch": 2615} {"train_loss": -6.5386152267456055, "global_step": 109838, "epoch": 2615} {"train_loss": -6.460996627807617, "global_step": 109839, "epoch": 2615} {"train_loss": -6.369123935699463, "global_step": 109840, "epoch": 2615} {"train_loss": -6.447494983673096, "global_step": 109841, "epoch": 2615} {"train_loss": -6.506336688995361, "global_step": 109842, "epoch": 2615} {"train_loss": -6.462166786193848, "global_step": 109843, "epoch": 2615} {"train_loss": -6.497325897216797, "global_step": 109844, "epoch": 2615} {"train_loss": -6.357048988342285, "global_step": 109845, "epoch": 2615} {"train_loss": -6.414011478424072, "global_step": 109846, "epoch": 2615} {"train_loss": -6.370821475982666, "global_step": 109847, "epoch": 2615} {"train_loss": -6.359176158905029, "global_step": 109848, "epoch": 2615} {"train_loss": -6.442478656768799, "global_step": 109849, "epoch": 2615} {"train_loss": -6.396574974060059, "global_step": 109850, "epoch": 2615} {"train_loss": -6.4284281730651855, "global_step": 109851, "epoch": 2615} {"train_loss": -6.4466657638549805, "global_step": 109852, "epoch": 2615} {"train_loss": -6.355260848999023, "global_step": 109853, "epoch": 2615} {"train_loss": -6.418789863586426, "global_step": 109854, "epoch": 2615} {"train_loss": -6.414417743682861, "global_step": 109855, "epoch": 2615} {"train_loss": -6.469507217407227, "global_step": 109856, "epoch": 2615} {"train_loss": -6.320580005645752, "global_step": 109857, "epoch": 2615} {"train_loss": -6.461520195007324, "global_step": 109858, "epoch": 2615} {"train_loss": -6.44081449508667, "global_step": 109859, "epoch": 2615} {"train_loss": -6.447628021240234, "global_step": 109860, "epoch": 2615} {"train_loss": -6.402927398681641, "global_step": 109861, "epoch": 2615} {"train_loss": -6.351690292358398, "global_step": 109862, "epoch": 2615} {"train_loss": -6.570262908935547, "global_step": 109863, "epoch": 2615} {"train_loss": -6.467687129974365, "global_step": 109864, "epoch": 2615} {"train_loss": -6.473392486572266, "global_step": 109865, "epoch": 2615} {"train_loss": -6.469377040863037, "global_step": 109866, "epoch": 2615} {"train_loss": -6.405272006988525, "global_step": 109867, "epoch": 2615} {"train_loss": -6.366239547729492, "global_step": 109868, "epoch": 2615} {"train_loss": -6.408953666687012, "global_step": 109869, "epoch": 2615} {"train_loss": -6.395380020141602, "global_step": 109870, "epoch": 2615} {"train_loss": -6.426929099219186, "global_step": 109871, "epoch": 2615, "val_loss": 64883.9921875} {"train_loss": -6.50338888168335, "global_step": 109872, "epoch": 2616} {"train_loss": -6.441032886505127, "global_step": 109873, "epoch": 2616} {"train_loss": -6.4174323081970215, "global_step": 109874, "epoch": 2616} {"train_loss": -6.565485954284668, "global_step": 109875, "epoch": 2616} {"train_loss": -6.404794692993164, "global_step": 109876, "epoch": 2616} {"train_loss": -6.500814914703369, "global_step": 109877, "epoch": 2616} {"train_loss": -6.281192302703857, "global_step": 109878, "epoch": 2616} {"train_loss": -6.449240684509277, "global_step": 109879, "epoch": 2616} {"train_loss": -6.388021469116211, "global_step": 109880, "epoch": 2616} {"train_loss": -6.266812801361084, "global_step": 109881, "epoch": 2616} {"train_loss": -6.377608299255371, "global_step": 109882, "epoch": 2616} {"train_loss": -6.4112701416015625, "global_step": 109883, "epoch": 2616} {"train_loss": -6.462356090545654, "global_step": 109884, "epoch": 2616} {"train_loss": -6.485517501831055, "global_step": 109885, "epoch": 2616} {"train_loss": -6.335426330566406, "global_step": 109886, "epoch": 2616} {"train_loss": -6.421614646911621, "global_step": 109887, "epoch": 2616} {"train_loss": -6.377924919128418, "global_step": 109888, "epoch": 2616} {"train_loss": -6.5253520011901855, "global_step": 109889, "epoch": 2616} {"train_loss": -6.391532897949219, "global_step": 109890, "epoch": 2616} {"train_loss": -6.516423225402832, "global_step": 109891, "epoch": 2616} {"train_loss": -6.488008499145508, "global_step": 109892, "epoch": 2616} {"train_loss": -6.519443511962891, "global_step": 109893, "epoch": 2616} {"train_loss": -6.42282247543335, "global_step": 109894, "epoch": 2616} {"train_loss": -6.500076770782471, "global_step": 109895, "epoch": 2616} {"train_loss": -6.4646759033203125, "global_step": 109896, "epoch": 2616} {"train_loss": -6.58327054977417, "global_step": 109897, "epoch": 2616} {"train_loss": -6.538231372833252, "global_step": 109898, "epoch": 2616} {"train_loss": -6.420660972595215, "global_step": 109899, "epoch": 2616} {"train_loss": -6.463923931121826, "global_step": 109900, "epoch": 2616} {"train_loss": -6.454092025756836, "global_step": 109901, "epoch": 2616} {"train_loss": -6.495962142944336, "global_step": 109902, "epoch": 2616} {"train_loss": -6.400146007537842, "global_step": 109903, "epoch": 2616} {"train_loss": -6.488238334655762, "global_step": 109904, "epoch": 2616} {"train_loss": -6.5439958572387695, "global_step": 109905, "epoch": 2616} {"train_loss": -6.5013861656188965, "global_step": 109906, "epoch": 2616} {"train_loss": -6.434497833251953, "global_step": 109907, "epoch": 2616} {"train_loss": -6.412985801696777, "global_step": 109908, "epoch": 2616} {"train_loss": -6.4905805587768555, "global_step": 109909, "epoch": 2616} {"train_loss": -6.407120227813721, "global_step": 109910, "epoch": 2616} {"train_loss": -6.5752739906311035, "global_step": 109911, "epoch": 2616} {"train_loss": -6.489902496337891, "global_step": 109912, "epoch": 2616} {"train_loss": -6.454136428378877, "global_step": 109913, "epoch": 2616, "val_loss": 64876.87109375} {"train_loss": -6.4542555809021, "global_step": 109914, "epoch": 2617} {"train_loss": -6.571150302886963, "global_step": 109915, "epoch": 2617} {"train_loss": -6.562811374664307, "global_step": 109916, "epoch": 2617} {"train_loss": -6.384516716003418, "global_step": 109917, "epoch": 2617} {"train_loss": -6.598649501800537, "global_step": 109918, "epoch": 2617} {"train_loss": -6.541028022766113, "global_step": 109919, "epoch": 2617} {"train_loss": -6.403546333312988, "global_step": 109920, "epoch": 2617} {"train_loss": -6.376171112060547, "global_step": 109921, "epoch": 2617} {"train_loss": -6.444957733154297, "global_step": 109922, "epoch": 2617} {"train_loss": -6.50982666015625, "global_step": 109923, "epoch": 2617} {"train_loss": -6.533713340759277, "global_step": 109924, "epoch": 2617} {"train_loss": -6.599031925201416, "global_step": 109925, "epoch": 2617} {"train_loss": -6.576720714569092, "global_step": 109926, "epoch": 2617} {"train_loss": -6.504919052124023, "global_step": 109927, "epoch": 2617} {"train_loss": -6.557201385498047, "global_step": 109928, "epoch": 2617} {"train_loss": -6.421998977661133, "global_step": 109929, "epoch": 2617} {"train_loss": -6.4497294425964355, "global_step": 109930, "epoch": 2617} {"train_loss": -6.518465042114258, "global_step": 109931, "epoch": 2617} {"train_loss": -6.509757041931152, "global_step": 109932, "epoch": 2617} {"train_loss": -6.483133316040039, "global_step": 109933, "epoch": 2617} {"train_loss": -6.563942909240723, "global_step": 109934, "epoch": 2617} {"train_loss": -6.509794235229492, "global_step": 109935, "epoch": 2617} {"train_loss": -6.523276329040527, "global_step": 109936, "epoch": 2617} {"train_loss": -6.552838325500488, "global_step": 109937, "epoch": 2617} {"train_loss": -6.580946445465088, "global_step": 109938, "epoch": 2617} {"train_loss": -6.409969329833984, "global_step": 109939, "epoch": 2617} {"train_loss": -6.516414642333984, "global_step": 109940, "epoch": 2617} {"train_loss": -6.393044471740723, "global_step": 109941, "epoch": 2617} {"train_loss": -6.428548812866211, "global_step": 109942, "epoch": 2617} {"train_loss": -6.450017929077148, "global_step": 109943, "epoch": 2617} {"train_loss": -6.472053050994873, "global_step": 109944, "epoch": 2617} {"train_loss": -6.37324333190918, "global_step": 109945, "epoch": 2617} {"train_loss": -6.508577346801758, "global_step": 109946, "epoch": 2617} {"train_loss": -6.407912731170654, "global_step": 109947, "epoch": 2617} {"train_loss": -6.451587200164795, "global_step": 109948, "epoch": 2617} {"train_loss": -6.600034713745117, "global_step": 109949, "epoch": 2617} {"train_loss": -6.4898505210876465, "global_step": 109950, "epoch": 2617} {"train_loss": -6.485648155212402, "global_step": 109951, "epoch": 2617} {"train_loss": -6.326001167297363, "global_step": 109952, "epoch": 2617} {"train_loss": -6.440662384033203, "global_step": 109953, "epoch": 2617} {"train_loss": -6.522169589996338, "global_step": 109954, "epoch": 2617} {"train_loss": -6.48781570934114, "global_step": 109955, "epoch": 2617, "val_loss": 65056.6640625} {"train_loss": -6.583812236785889, "global_step": 109956, "epoch": 2618} {"train_loss": -6.388698577880859, "global_step": 109957, "epoch": 2618} {"train_loss": -6.52873420715332, "global_step": 109958, "epoch": 2618} {"train_loss": -6.375783920288086, "global_step": 109959, "epoch": 2618} {"train_loss": -6.452897071838379, "global_step": 109960, "epoch": 2618} {"train_loss": -6.38004207611084, "global_step": 109961, "epoch": 2618} {"train_loss": -6.535418510437012, "global_step": 109962, "epoch": 2618} {"train_loss": -6.520460605621338, "global_step": 109963, "epoch": 2618} {"train_loss": -6.580221176147461, "global_step": 109964, "epoch": 2618} {"train_loss": -6.573453903198242, "global_step": 109965, "epoch": 2618} {"train_loss": -6.571720600128174, "global_step": 109966, "epoch": 2618} {"train_loss": -6.530414581298828, "global_step": 109967, "epoch": 2618} {"train_loss": -6.431031703948975, "global_step": 109968, "epoch": 2618} {"train_loss": -6.547365188598633, "global_step": 109969, "epoch": 2618} {"train_loss": -6.603022575378418, "global_step": 109970, "epoch": 2618} {"train_loss": -6.455376625061035, "global_step": 109971, "epoch": 2618} {"train_loss": -6.533087730407715, "global_step": 109972, "epoch": 2618} {"train_loss": -6.536134243011475, "global_step": 109973, "epoch": 2618} {"train_loss": -6.456752777099609, "global_step": 109974, "epoch": 2618} {"train_loss": -6.420472145080566, "global_step": 109975, "epoch": 2618} {"train_loss": -6.407573223114014, "global_step": 109976, "epoch": 2618} {"train_loss": -6.439160346984863, "global_step": 109977, "epoch": 2618} {"train_loss": -6.485060691833496, "global_step": 109978, "epoch": 2618} {"train_loss": -6.5250244140625, "global_step": 109979, "epoch": 2618} {"train_loss": -6.4413933753967285, "global_step": 109980, "epoch": 2618} {"train_loss": -6.509348392486572, "global_step": 109981, "epoch": 2618} {"train_loss": -6.51644229888916, "global_step": 109982, "epoch": 2618} {"train_loss": -6.5972900390625, "global_step": 109983, "epoch": 2618} {"train_loss": -6.520886421203613, "global_step": 109984, "epoch": 2618} {"train_loss": -6.567223072052002, "global_step": 109985, "epoch": 2618} {"train_loss": -6.52117395401001, "global_step": 109986, "epoch": 2618} {"train_loss": -6.4036078453063965, "global_step": 109987, "epoch": 2618} {"train_loss": -6.433145046234131, "global_step": 109988, "epoch": 2618} {"train_loss": -6.51484489440918, "global_step": 109989, "epoch": 2618} {"train_loss": -6.454322814941406, "global_step": 109990, "epoch": 2618} {"train_loss": -6.559878349304199, "global_step": 109991, "epoch": 2618} {"train_loss": -6.457685470581055, "global_step": 109992, "epoch": 2618} {"train_loss": -6.462142467498779, "global_step": 109993, "epoch": 2618} {"train_loss": -6.527743339538574, "global_step": 109994, "epoch": 2618} {"train_loss": -6.432408809661865, "global_step": 109995, "epoch": 2618} {"train_loss": -6.444187164306641, "global_step": 109996, "epoch": 2618} {"train_loss": -6.490569069271996, "global_step": 109997, "epoch": 2618, "val_loss": 64822.734375} {"train_loss": -6.4676923751831055, "global_step": 109998, "epoch": 2619} {"train_loss": -6.534664154052734, "global_step": 109999, "epoch": 2619} {"train_loss": -6.513514041900635, "global_step": 110000, "epoch": 2619} {"train_loss": -6.5049824714660645, "global_step": 110001, "epoch": 2619} {"train_loss": -6.4838972091674805, "global_step": 110002, "epoch": 2619} {"train_loss": -6.377668857574463, "global_step": 110003, "epoch": 2619} {"train_loss": -6.540979862213135, "global_step": 110004, "epoch": 2619} {"train_loss": -6.386451721191406, "global_step": 110005, "epoch": 2619} {"train_loss": -6.404787063598633, "global_step": 110006, "epoch": 2619} {"train_loss": -6.411634922027588, "global_step": 110007, "epoch": 2619} {"train_loss": -6.365655422210693, "global_step": 110008, "epoch": 2619} {"train_loss": -6.57719612121582, "global_step": 110009, "epoch": 2619} {"train_loss": -6.501585960388184, "global_step": 110010, "epoch": 2619} {"train_loss": -6.433121681213379, "global_step": 110011, "epoch": 2619} {"train_loss": -6.538888931274414, "global_step": 110012, "epoch": 2619} {"train_loss": -6.423921585083008, "global_step": 110013, "epoch": 2619} {"train_loss": -6.5548529624938965, "global_step": 110014, "epoch": 2619} {"train_loss": -6.4411516189575195, "global_step": 110015, "epoch": 2619} {"train_loss": -6.459342956542969, "global_step": 110016, "epoch": 2619} {"train_loss": -6.3930463790893555, "global_step": 110017, "epoch": 2619} {"train_loss": -6.455829620361328, "global_step": 110018, "epoch": 2619} {"train_loss": -6.529172420501709, "global_step": 110019, "epoch": 2619} {"train_loss": -6.484140396118164, "global_step": 110020, "epoch": 2619} {"train_loss": -6.452110290527344, "global_step": 110021, "epoch": 2619} {"train_loss": -6.450046062469482, "global_step": 110022, "epoch": 2619} {"train_loss": -6.381264686584473, "global_step": 110023, "epoch": 2619} {"train_loss": -6.534090042114258, "global_step": 110024, "epoch": 2619} {"train_loss": -6.541831016540527, "global_step": 110025, "epoch": 2619} {"train_loss": -6.5299272537231445, "global_step": 110026, "epoch": 2619} {"train_loss": -6.411371231079102, "global_step": 110027, "epoch": 2619} {"train_loss": -6.342095851898193, "global_step": 110028, "epoch": 2619} {"train_loss": -6.433786392211914, "global_step": 110029, "epoch": 2619} {"train_loss": -6.493019104003906, "global_step": 110030, "epoch": 2619} {"train_loss": -6.43798303604126, "global_step": 110031, "epoch": 2619} {"train_loss": -6.391709804534912, "global_step": 110032, "epoch": 2619} {"train_loss": -6.5569562911987305, "global_step": 110033, "epoch": 2619} {"train_loss": -6.412178039550781, "global_step": 110034, "epoch": 2619} {"train_loss": -6.417837142944336, "global_step": 110035, "epoch": 2619} {"train_loss": -6.486040115356445, "global_step": 110036, "epoch": 2619} {"train_loss": -6.437201976776123, "global_step": 110037, "epoch": 2619} {"train_loss": -6.357576370239258, "global_step": 110038, "epoch": 2619} {"train_loss": -6.456614778155372, "global_step": 110039, "epoch": 2619, "val_loss": 65124.92578125} {"train_loss": -6.496248245239258, "global_step": 110040, "epoch": 2620} {"train_loss": -6.349365234375, "global_step": 110041, "epoch": 2620} {"train_loss": -6.314150810241699, "global_step": 110042, "epoch": 2620} {"train_loss": -6.481891632080078, "global_step": 110043, "epoch": 2620} {"train_loss": -6.450135707855225, "global_step": 110044, "epoch": 2620} {"train_loss": -6.529010772705078, "global_step": 110045, "epoch": 2620} {"train_loss": -6.539318084716797, "global_step": 110046, "epoch": 2620} {"train_loss": -6.520245552062988, "global_step": 110047, "epoch": 2620} {"train_loss": -6.457269668579102, "global_step": 110048, "epoch": 2620} {"train_loss": -6.406673908233643, "global_step": 110049, "epoch": 2620} {"train_loss": -6.321539402008057, "global_step": 110050, "epoch": 2620} {"train_loss": -6.359753131866455, "global_step": 110051, "epoch": 2620} {"train_loss": -6.434711933135986, "global_step": 110052, "epoch": 2620} {"train_loss": -6.346564769744873, "global_step": 110053, "epoch": 2620} {"train_loss": -6.509684085845947, "global_step": 110054, "epoch": 2620} {"train_loss": -6.30073881149292, "global_step": 110055, "epoch": 2620} {"train_loss": -6.411821365356445, "global_step": 110056, "epoch": 2620} {"train_loss": -6.474891662597656, "global_step": 110057, "epoch": 2620} {"train_loss": -6.422194957733154, "global_step": 110058, "epoch": 2620} {"train_loss": -6.393212795257568, "global_step": 110059, "epoch": 2620} {"train_loss": -6.462808609008789, "global_step": 110060, "epoch": 2620} {"train_loss": -6.378954887390137, "global_step": 110061, "epoch": 2620} {"train_loss": -6.416589736938477, "global_step": 110062, "epoch": 2620} {"train_loss": -6.441056728363037, "global_step": 110063, "epoch": 2620} {"train_loss": -6.493411064147949, "global_step": 110064, "epoch": 2620} {"train_loss": -6.366416931152344, "global_step": 110065, "epoch": 2620} {"train_loss": -6.3890180587768555, "global_step": 110066, "epoch": 2620} {"train_loss": -6.422296047210693, "global_step": 110067, "epoch": 2620} {"train_loss": -6.461215972900391, "global_step": 110068, "epoch": 2620} {"train_loss": -6.392665863037109, "global_step": 110069, "epoch": 2620} {"train_loss": -6.397319793701172, "global_step": 110070, "epoch": 2620} {"train_loss": -6.468364715576172, "global_step": 110071, "epoch": 2620} {"train_loss": -6.502366065979004, "global_step": 110072, "epoch": 2620} {"train_loss": -6.59174919128418, "global_step": 110073, "epoch": 2620} {"train_loss": -6.537670612335205, "global_step": 110074, "epoch": 2620} {"train_loss": -6.434579849243164, "global_step": 110075, "epoch": 2620} {"train_loss": -6.373719215393066, "global_step": 110076, "epoch": 2620} {"train_loss": -6.337355613708496, "global_step": 110077, "epoch": 2620} {"train_loss": -6.435502052307129, "global_step": 110078, "epoch": 2620} {"train_loss": -6.454704761505127, "global_step": 110079, "epoch": 2620} {"train_loss": -6.584325790405273, "global_step": 110080, "epoch": 2620} {"train_loss": -6.438423156738281, "global_step": 110081, "epoch": 2620, "val_loss": 64883.99609375} {"train_loss": -6.554204940795898, "global_step": 110082, "epoch": 2621} {"train_loss": -6.569622993469238, "global_step": 110083, "epoch": 2621} {"train_loss": -6.568701267242432, "global_step": 110084, "epoch": 2621} {"train_loss": -6.494336128234863, "global_step": 110085, "epoch": 2621} {"train_loss": -6.600712776184082, "global_step": 110086, "epoch": 2621} {"train_loss": -6.405712604522705, "global_step": 110087, "epoch": 2621} {"train_loss": -6.505525588989258, "global_step": 110088, "epoch": 2621} {"train_loss": -6.46919584274292, "global_step": 110089, "epoch": 2621} {"train_loss": -6.53938102722168, "global_step": 110090, "epoch": 2621} {"train_loss": -6.442647457122803, "global_step": 110091, "epoch": 2621} {"train_loss": -6.5371785163879395, "global_step": 110092, "epoch": 2621} {"train_loss": -6.513378620147705, "global_step": 110093, "epoch": 2621} {"train_loss": -6.51186466217041, "global_step": 110094, "epoch": 2621} {"train_loss": -6.684627056121826, "global_step": 110095, "epoch": 2621} {"train_loss": -6.52464485168457, "global_step": 110096, "epoch": 2621} {"train_loss": -6.44941520690918, "global_step": 110097, "epoch": 2621} {"train_loss": -6.490495681762695, "global_step": 110098, "epoch": 2621} {"train_loss": -6.4706878662109375, "global_step": 110099, "epoch": 2621} {"train_loss": -6.485698699951172, "global_step": 110100, "epoch": 2621} {"train_loss": -6.6335530281066895, "global_step": 110101, "epoch": 2621} {"train_loss": -6.488557815551758, "global_step": 110102, "epoch": 2621} {"train_loss": -6.6233062744140625, "global_step": 110103, "epoch": 2621} {"train_loss": -6.530045509338379, "global_step": 110104, "epoch": 2621} {"train_loss": -6.549533843994141, "global_step": 110105, "epoch": 2621} {"train_loss": -6.61644172668457, "global_step": 110106, "epoch": 2621} {"train_loss": -6.430901527404785, "global_step": 110107, "epoch": 2621} {"train_loss": -6.452031135559082, "global_step": 110108, "epoch": 2621} {"train_loss": -6.498147964477539, "global_step": 110109, "epoch": 2621} {"train_loss": -6.463683605194092, "global_step": 110110, "epoch": 2621} {"train_loss": -6.49008846282959, "global_step": 110111, "epoch": 2621} {"train_loss": -6.621376991271973, "global_step": 110112, "epoch": 2621} {"train_loss": -6.536277770996094, "global_step": 110113, "epoch": 2621} {"train_loss": -6.431065082550049, "global_step": 110114, "epoch": 2621} {"train_loss": -6.46324348449707, "global_step": 110115, "epoch": 2621} {"train_loss": -6.432060241699219, "global_step": 110116, "epoch": 2621} {"train_loss": -6.544255256652832, "global_step": 110117, "epoch": 2621} {"train_loss": -6.57222843170166, "global_step": 110118, "epoch": 2621} {"train_loss": -6.478891372680664, "global_step": 110119, "epoch": 2621} {"train_loss": -6.523367881774902, "global_step": 110120, "epoch": 2621} {"train_loss": -6.493935585021973, "global_step": 110121, "epoch": 2621} {"train_loss": -6.465363502502441, "global_step": 110122, "epoch": 2621} {"train_loss": -6.516862630844116, "global_step": 110123, "epoch": 2621, "val_loss": 64932.5234375} {"train_loss": -6.557504177093506, "global_step": 110124, "epoch": 2622} {"train_loss": -6.4205169677734375, "global_step": 110125, "epoch": 2622} {"train_loss": -6.542422294616699, "global_step": 110126, "epoch": 2622} {"train_loss": -6.508476734161377, "global_step": 110127, "epoch": 2622} {"train_loss": -6.4652204513549805, "global_step": 110128, "epoch": 2622} {"train_loss": -6.484441757202148, "global_step": 110129, "epoch": 2622} {"train_loss": -6.496255397796631, "global_step": 110130, "epoch": 2622} {"train_loss": -6.390557289123535, "global_step": 110131, "epoch": 2622} {"train_loss": -6.516290664672852, "global_step": 110132, "epoch": 2622} {"train_loss": -6.4871134757995605, "global_step": 110133, "epoch": 2622} {"train_loss": -6.583431720733643, "global_step": 110134, "epoch": 2622} {"train_loss": -6.364286422729492, "global_step": 110135, "epoch": 2622} {"train_loss": -6.532008171081543, "global_step": 110136, "epoch": 2622} {"train_loss": -6.522187232971191, "global_step": 110137, "epoch": 2622} {"train_loss": -6.489682674407959, "global_step": 110138, "epoch": 2622} {"train_loss": -6.45652437210083, "global_step": 110139, "epoch": 2622} {"train_loss": -6.411403656005859, "global_step": 110140, "epoch": 2622} {"train_loss": -6.454869747161865, "global_step": 110141, "epoch": 2622} {"train_loss": -6.491912841796875, "global_step": 110142, "epoch": 2622} {"train_loss": -6.606869697570801, "global_step": 110143, "epoch": 2622} {"train_loss": -6.4296345710754395, "global_step": 110144, "epoch": 2622} {"train_loss": -6.454240798950195, "global_step": 110145, "epoch": 2622} {"train_loss": -6.4469146728515625, "global_step": 110146, "epoch": 2622} {"train_loss": -6.400897979736328, "global_step": 110147, "epoch": 2622} {"train_loss": -6.3256964683532715, "global_step": 110148, "epoch": 2622} {"train_loss": -6.51933479309082, "global_step": 110149, "epoch": 2622} {"train_loss": -6.498889923095703, "global_step": 110150, "epoch": 2622} {"train_loss": -6.398900508880615, "global_step": 110151, "epoch": 2622} {"train_loss": -6.466133117675781, "global_step": 110152, "epoch": 2622} {"train_loss": -6.340677738189697, "global_step": 110153, "epoch": 2622} {"train_loss": -6.404674530029297, "global_step": 110154, "epoch": 2622} {"train_loss": -6.403988838195801, "global_step": 110155, "epoch": 2622} {"train_loss": -6.470422744750977, "global_step": 110156, "epoch": 2622} {"train_loss": -6.440439224243164, "global_step": 110157, "epoch": 2622} {"train_loss": -6.492873191833496, "global_step": 110158, "epoch": 2622} {"train_loss": -6.502837657928467, "global_step": 110159, "epoch": 2622} {"train_loss": -6.476137161254883, "global_step": 110160, "epoch": 2622} {"train_loss": -6.449640274047852, "global_step": 110161, "epoch": 2622} {"train_loss": -6.349272727966309, "global_step": 110162, "epoch": 2622} {"train_loss": -6.485461235046387, "global_step": 110163, "epoch": 2622} {"train_loss": -6.504438400268555, "global_step": 110164, "epoch": 2622} {"train_loss": -6.46376421338036, "global_step": 110165, "epoch": 2622, "val_loss": 64902.61328125} {"train_loss": -6.559892654418945, "global_step": 110166, "epoch": 2623} {"train_loss": -6.445904731750488, "global_step": 110167, "epoch": 2623} {"train_loss": -6.484308242797852, "global_step": 110168, "epoch": 2623} {"train_loss": -6.594486236572266, "global_step": 110169, "epoch": 2623} {"train_loss": -6.560235023498535, "global_step": 110170, "epoch": 2623} {"train_loss": -6.455660343170166, "global_step": 110171, "epoch": 2623} {"train_loss": -6.468766212463379, "global_step": 110172, "epoch": 2623} {"train_loss": -6.434154987335205, "global_step": 110173, "epoch": 2623} {"train_loss": -6.488964557647705, "global_step": 110174, "epoch": 2623} {"train_loss": -6.476572513580322, "global_step": 110175, "epoch": 2623} {"train_loss": -6.480096340179443, "global_step": 110176, "epoch": 2623} {"train_loss": -6.4957685470581055, "global_step": 110177, "epoch": 2623} {"train_loss": -6.446734428405762, "global_step": 110178, "epoch": 2623} {"train_loss": -6.507407188415527, "global_step": 110179, "epoch": 2623} {"train_loss": -6.395521640777588, "global_step": 110180, "epoch": 2623} {"train_loss": -6.386833667755127, "global_step": 110181, "epoch": 2623} {"train_loss": -6.40362024307251, "global_step": 110182, "epoch": 2623} {"train_loss": -6.524609565734863, "global_step": 110183, "epoch": 2623} {"train_loss": -6.39609432220459, "global_step": 110184, "epoch": 2623} {"train_loss": -6.462515830993652, "global_step": 110185, "epoch": 2623} {"train_loss": -6.419698715209961, "global_step": 110186, "epoch": 2623} {"train_loss": -6.429050445556641, "global_step": 110187, "epoch": 2623} {"train_loss": -6.545785903930664, "global_step": 110188, "epoch": 2623} {"train_loss": -6.4550251960754395, "global_step": 110189, "epoch": 2623} {"train_loss": -6.33261775970459, "global_step": 110190, "epoch": 2623} {"train_loss": -6.460460186004639, "global_step": 110191, "epoch": 2623} {"train_loss": -6.319129943847656, "global_step": 110192, "epoch": 2623} {"train_loss": -6.419856548309326, "global_step": 110193, "epoch": 2623} {"train_loss": -6.5090179443359375, "global_step": 110194, "epoch": 2623} {"train_loss": -6.507556915283203, "global_step": 110195, "epoch": 2623} {"train_loss": -6.447796821594238, "global_step": 110196, "epoch": 2623} {"train_loss": -6.455718994140625, "global_step": 110197, "epoch": 2623} {"train_loss": -6.285772800445557, "global_step": 110198, "epoch": 2623} {"train_loss": -6.472064018249512, "global_step": 110199, "epoch": 2623} {"train_loss": -6.502246856689453, "global_step": 110200, "epoch": 2623} {"train_loss": -6.3430585861206055, "global_step": 110201, "epoch": 2623} {"train_loss": -6.474477291107178, "global_step": 110202, "epoch": 2623} {"train_loss": -6.487276077270508, "global_step": 110203, "epoch": 2623} {"train_loss": -6.3977437019348145, "global_step": 110204, "epoch": 2623} {"train_loss": -6.490993499755859, "global_step": 110205, "epoch": 2623} {"train_loss": -6.424273490905762, "global_step": 110206, "epoch": 2623} {"train_loss": -6.455096585409982, "global_step": 110207, "epoch": 2623, "val_loss": 65055.66015625} {"train_loss": -6.500873565673828, "global_step": 110208, "epoch": 2624} {"train_loss": -6.414339065551758, "global_step": 110209, "epoch": 2624} {"train_loss": -6.506717681884766, "global_step": 110210, "epoch": 2624} {"train_loss": -6.5814995765686035, "global_step": 110211, "epoch": 2624} {"train_loss": -6.419180870056152, "global_step": 110212, "epoch": 2624} {"train_loss": -6.410351276397705, "global_step": 110213, "epoch": 2624} {"train_loss": -6.414119720458984, "global_step": 110214, "epoch": 2624} {"train_loss": -6.3278045654296875, "global_step": 110215, "epoch": 2624} {"train_loss": -6.470095157623291, "global_step": 110216, "epoch": 2624} {"train_loss": -6.487990379333496, "global_step": 110217, "epoch": 2624} {"train_loss": -6.591143608093262, "global_step": 110218, "epoch": 2624} {"train_loss": -6.514883041381836, "global_step": 110219, "epoch": 2624} {"train_loss": -6.494138717651367, "global_step": 110220, "epoch": 2624} {"train_loss": -6.459277153015137, "global_step": 110221, "epoch": 2624} {"train_loss": -6.471565246582031, "global_step": 110222, "epoch": 2624} {"train_loss": -6.537687301635742, "global_step": 110223, "epoch": 2624} {"train_loss": -6.398622512817383, "global_step": 110224, "epoch": 2624} {"train_loss": -6.449480056762695, "global_step": 110225, "epoch": 2624} {"train_loss": -6.4937028884887695, "global_step": 110226, "epoch": 2624} {"train_loss": -6.526856899261475, "global_step": 110227, "epoch": 2624} {"train_loss": -6.55662202835083, "global_step": 110228, "epoch": 2624} {"train_loss": -6.536629676818848, "global_step": 110229, "epoch": 2624} {"train_loss": -6.452004909515381, "global_step": 110230, "epoch": 2624} {"train_loss": -6.5312299728393555, "global_step": 110231, "epoch": 2624} {"train_loss": -6.540746688842773, "global_step": 110232, "epoch": 2624} {"train_loss": -6.52778434753418, "global_step": 110233, "epoch": 2624} {"train_loss": -6.466297149658203, "global_step": 110234, "epoch": 2624} {"train_loss": -6.587771415710449, "global_step": 110235, "epoch": 2624} {"train_loss": -6.475685119628906, "global_step": 110236, "epoch": 2624} {"train_loss": -6.527819633483887, "global_step": 110237, "epoch": 2624} {"train_loss": -6.424350738525391, "global_step": 110238, "epoch": 2624} {"train_loss": -6.448975563049316, "global_step": 110239, "epoch": 2624} {"train_loss": -6.504275798797607, "global_step": 110240, "epoch": 2624} {"train_loss": -6.423308372497559, "global_step": 110241, "epoch": 2624} {"train_loss": -6.435892105102539, "global_step": 110242, "epoch": 2624} {"train_loss": -6.4306182861328125, "global_step": 110243, "epoch": 2624} {"train_loss": -6.42877197265625, "global_step": 110244, "epoch": 2624} {"train_loss": -6.540252208709717, "global_step": 110245, "epoch": 2624} {"train_loss": -6.30556583404541, "global_step": 110246, "epoch": 2624} {"train_loss": -6.340676307678223, "global_step": 110247, "epoch": 2624} {"train_loss": -6.266524314880371, "global_step": 110248, "epoch": 2624} {"train_loss": -6.466662406921387, "global_step": 110249, "epoch": 2624, "val_loss": 65400.015625} {"train_loss": -6.359709739685059, "global_step": 110250, "epoch": 2625} {"train_loss": -6.274350166320801, "global_step": 110251, "epoch": 2625} {"train_loss": -6.383896827697754, "global_step": 110252, "epoch": 2625} {"train_loss": -6.463624954223633, "global_step": 110253, "epoch": 2625} {"train_loss": -6.313775062561035, "global_step": 110254, "epoch": 2625} {"train_loss": -6.442307472229004, "global_step": 110255, "epoch": 2625} {"train_loss": -6.522272109985352, "global_step": 110256, "epoch": 2625} {"train_loss": -6.359907150268555, "global_step": 110257, "epoch": 2625} {"train_loss": -6.364814758300781, "global_step": 110258, "epoch": 2625} {"train_loss": -6.479595184326172, "global_step": 110259, "epoch": 2625} {"train_loss": -6.415774345397949, "global_step": 110260, "epoch": 2625} {"train_loss": -6.491580486297607, "global_step": 110261, "epoch": 2625} {"train_loss": -6.414945125579834, "global_step": 110262, "epoch": 2625} {"train_loss": -6.377796173095703, "global_step": 110263, "epoch": 2625} {"train_loss": -6.312021732330322, "global_step": 110264, "epoch": 2625} {"train_loss": -6.370275020599365, "global_step": 110265, "epoch": 2625} {"train_loss": -6.387115478515625, "global_step": 110266, "epoch": 2625} {"train_loss": -6.508009910583496, "global_step": 110267, "epoch": 2625} {"train_loss": -6.436741828918457, "global_step": 110268, "epoch": 2625} {"train_loss": -6.460358142852783, "global_step": 110269, "epoch": 2625} {"train_loss": -6.476804256439209, "global_step": 110270, "epoch": 2625} {"train_loss": -6.404944896697998, "global_step": 110271, "epoch": 2625} {"train_loss": -6.421543121337891, "global_step": 110272, "epoch": 2625} {"train_loss": -6.477865219116211, "global_step": 110273, "epoch": 2625} {"train_loss": -6.4524455070495605, "global_step": 110274, "epoch": 2625} {"train_loss": -6.431784152984619, "global_step": 110275, "epoch": 2625} {"train_loss": -6.476681709289551, "global_step": 110276, "epoch": 2625} {"train_loss": -6.511054515838623, "global_step": 110277, "epoch": 2625} {"train_loss": -6.380989074707031, "global_step": 110278, "epoch": 2625} {"train_loss": -6.424959182739258, "global_step": 110279, "epoch": 2625} {"train_loss": -6.434855937957764, "global_step": 110280, "epoch": 2625} {"train_loss": -6.454398155212402, "global_step": 110281, "epoch": 2625} {"train_loss": -6.408315658569336, "global_step": 110282, "epoch": 2625} {"train_loss": -6.51536750793457, "global_step": 110283, "epoch": 2625} {"train_loss": -6.511982440948486, "global_step": 110284, "epoch": 2625} {"train_loss": -6.327836036682129, "global_step": 110285, "epoch": 2625} {"train_loss": -6.424314022064209, "global_step": 110286, "epoch": 2625} {"train_loss": -6.566265106201172, "global_step": 110287, "epoch": 2625} {"train_loss": -6.359227657318115, "global_step": 110288, "epoch": 2625} {"train_loss": -6.515637397766113, "global_step": 110289, "epoch": 2625} {"train_loss": -6.443612098693848, "global_step": 110290, "epoch": 2625} {"train_loss": -6.428368863605318, "global_step": 110291, "epoch": 2625, "val_loss": 64991.4296875} {"train_loss": -6.5239577293396, "global_step": 110292, "epoch": 2626} {"train_loss": -6.493213653564453, "global_step": 110293, "epoch": 2626} {"train_loss": -6.471660614013672, "global_step": 110294, "epoch": 2626} {"train_loss": -6.401657581329346, "global_step": 110295, "epoch": 2626} {"train_loss": -6.4903669357299805, "global_step": 110296, "epoch": 2626} {"train_loss": -6.4603271484375, "global_step": 110297, "epoch": 2626} {"train_loss": -6.419864654541016, "global_step": 110298, "epoch": 2626} {"train_loss": -6.688505172729492, "global_step": 110299, "epoch": 2626} {"train_loss": -6.481393814086914, "global_step": 110300, "epoch": 2626} {"train_loss": -6.352391242980957, "global_step": 110301, "epoch": 2626} {"train_loss": -6.380119323730469, "global_step": 110302, "epoch": 2626} {"train_loss": -6.457557678222656, "global_step": 110303, "epoch": 2626} {"train_loss": -6.402005195617676, "global_step": 110304, "epoch": 2626} {"train_loss": -6.44699764251709, "global_step": 110305, "epoch": 2626} {"train_loss": -6.4407057762146, "global_step": 110306, "epoch": 2626} {"train_loss": -6.515017509460449, "global_step": 110307, "epoch": 2626} {"train_loss": -6.5383100509643555, "global_step": 110308, "epoch": 2626} {"train_loss": -6.478546142578125, "global_step": 110309, "epoch": 2626} {"train_loss": -6.495684623718262, "global_step": 110310, "epoch": 2626} {"train_loss": -6.475230693817139, "global_step": 110311, "epoch": 2626} {"train_loss": -6.428900718688965, "global_step": 110312, "epoch": 2626} {"train_loss": -6.523233890533447, "global_step": 110313, "epoch": 2626} {"train_loss": -6.422179222106934, "global_step": 110314, "epoch": 2626} {"train_loss": -6.488654136657715, "global_step": 110315, "epoch": 2626} {"train_loss": -6.519062042236328, "global_step": 110316, "epoch": 2626} {"train_loss": -6.443774223327637, "global_step": 110317, "epoch": 2626} {"train_loss": -6.485321044921875, "global_step": 110318, "epoch": 2626} {"train_loss": -6.482987403869629, "global_step": 110319, "epoch": 2626} {"train_loss": -6.409875392913818, "global_step": 110320, "epoch": 2626} {"train_loss": -6.493771553039551, "global_step": 110321, "epoch": 2626} {"train_loss": -6.346055030822754, "global_step": 110322, "epoch": 2626} {"train_loss": -6.36262321472168, "global_step": 110323, "epoch": 2626} {"train_loss": -6.4700422286987305, "global_step": 110324, "epoch": 2626} {"train_loss": -6.406298637390137, "global_step": 110325, "epoch": 2626} {"train_loss": -6.489462852478027, "global_step": 110326, "epoch": 2626} {"train_loss": -6.371116638183594, "global_step": 110327, "epoch": 2626} {"train_loss": -6.3578104972839355, "global_step": 110328, "epoch": 2626} {"train_loss": -6.558659553527832, "global_step": 110329, "epoch": 2626} {"train_loss": -6.375759124755859, "global_step": 110330, "epoch": 2626} {"train_loss": -6.331671714782715, "global_step": 110331, "epoch": 2626} {"train_loss": -6.49254846572876, "global_step": 110332, "epoch": 2626} {"train_loss": -6.453720126833234, "global_step": 110333, "epoch": 2626, "val_loss": 65148.60546875} {"train_loss": -6.493746757507324, "global_step": 110334, "epoch": 2627} {"train_loss": -6.469852447509766, "global_step": 110335, "epoch": 2627} {"train_loss": -6.393831253051758, "global_step": 110336, "epoch": 2627} {"train_loss": -6.402556896209717, "global_step": 110337, "epoch": 2627} {"train_loss": -6.43322229385376, "global_step": 110338, "epoch": 2627} {"train_loss": -6.443344593048096, "global_step": 110339, "epoch": 2627} {"train_loss": -6.446435928344727, "global_step": 110340, "epoch": 2627} {"train_loss": -6.447587013244629, "global_step": 110341, "epoch": 2627} {"train_loss": -6.509937286376953, "global_step": 110342, "epoch": 2627} {"train_loss": -6.505146026611328, "global_step": 110343, "epoch": 2627} {"train_loss": -6.450374603271484, "global_step": 110344, "epoch": 2627} {"train_loss": -6.522775650024414, "global_step": 110345, "epoch": 2627} {"train_loss": -6.471269607543945, "global_step": 110346, "epoch": 2627} {"train_loss": -6.517134666442871, "global_step": 110347, "epoch": 2627} {"train_loss": -6.477399826049805, "global_step": 110348, "epoch": 2627} {"train_loss": -6.486078262329102, "global_step": 110349, "epoch": 2627} {"train_loss": -6.627911567687988, "global_step": 110350, "epoch": 2627} {"train_loss": -6.5409746170043945, "global_step": 110351, "epoch": 2627} {"train_loss": -6.54266881942749, "global_step": 110352, "epoch": 2627} {"train_loss": -6.4180707931518555, "global_step": 110353, "epoch": 2627} {"train_loss": -6.457025051116943, "global_step": 110354, "epoch": 2627} {"train_loss": -6.459553241729736, "global_step": 110355, "epoch": 2627} {"train_loss": -6.62744140625, "global_step": 110356, "epoch": 2627} {"train_loss": -6.471489906311035, "global_step": 110357, "epoch": 2627} {"train_loss": -6.38471794128418, "global_step": 110358, "epoch": 2627} {"train_loss": -6.538500785827637, "global_step": 110359, "epoch": 2627} {"train_loss": -6.489541053771973, "global_step": 110360, "epoch": 2627} {"train_loss": -6.4307355880737305, "global_step": 110361, "epoch": 2627} {"train_loss": -6.526537895202637, "global_step": 110362, "epoch": 2627} {"train_loss": -6.264691352844238, "global_step": 110363, "epoch": 2627} {"train_loss": -6.39362907409668, "global_step": 110364, "epoch": 2627} {"train_loss": -6.44182014465332, "global_step": 110365, "epoch": 2627} {"train_loss": -6.490018367767334, "global_step": 110366, "epoch": 2627} {"train_loss": -6.434843063354492, "global_step": 110367, "epoch": 2627} {"train_loss": -6.461542129516602, "global_step": 110368, "epoch": 2627} {"train_loss": -6.539794921875, "global_step": 110369, "epoch": 2627} {"train_loss": -6.56036376953125, "global_step": 110370, "epoch": 2627} {"train_loss": -6.496157169342041, "global_step": 110371, "epoch": 2627} {"train_loss": -6.399039268493652, "global_step": 110372, "epoch": 2627} {"train_loss": -6.502175331115723, "global_step": 110373, "epoch": 2627} {"train_loss": -6.482217788696289, "global_step": 110374, "epoch": 2627} {"train_loss": -6.474325350352696, "global_step": 110375, "epoch": 2627, "val_loss": 65059.38671875} {"train_loss": -6.3818535804748535, "global_step": 110376, "epoch": 2628} {"train_loss": -6.549322128295898, "global_step": 110377, "epoch": 2628} {"train_loss": -6.517536163330078, "global_step": 110378, "epoch": 2628} {"train_loss": -6.420572280883789, "global_step": 110379, "epoch": 2628} {"train_loss": -6.44467830657959, "global_step": 110380, "epoch": 2628} {"train_loss": -6.501053810119629, "global_step": 110381, "epoch": 2628} {"train_loss": -6.486358642578125, "global_step": 110382, "epoch": 2628} {"train_loss": -6.455146312713623, "global_step": 110383, "epoch": 2628} {"train_loss": -6.506718158721924, "global_step": 110384, "epoch": 2628} {"train_loss": -6.269356727600098, "global_step": 110385, "epoch": 2628} {"train_loss": -6.472153663635254, "global_step": 110386, "epoch": 2628} {"train_loss": -6.532845973968506, "global_step": 110387, "epoch": 2628} {"train_loss": -6.441363334655762, "global_step": 110388, "epoch": 2628} {"train_loss": -6.392160415649414, "global_step": 110389, "epoch": 2628} {"train_loss": -6.456418037414551, "global_step": 110390, "epoch": 2628} {"train_loss": -6.523307800292969, "global_step": 110391, "epoch": 2628} {"train_loss": -6.489321231842041, "global_step": 110392, "epoch": 2628} {"train_loss": -6.378653049468994, "global_step": 110393, "epoch": 2628} {"train_loss": -6.454348564147949, "global_step": 110394, "epoch": 2628} {"train_loss": -6.334092140197754, "global_step": 110395, "epoch": 2628} {"train_loss": -6.542201995849609, "global_step": 110396, "epoch": 2628} {"train_loss": -6.389179229736328, "global_step": 110397, "epoch": 2628} {"train_loss": -6.48000955581665, "global_step": 110398, "epoch": 2628} {"train_loss": -6.447877883911133, "global_step": 110399, "epoch": 2628} {"train_loss": -6.42204475402832, "global_step": 110400, "epoch": 2628} {"train_loss": -6.410773277282715, "global_step": 110401, "epoch": 2628} {"train_loss": -6.247262001037598, "global_step": 110402, "epoch": 2628} {"train_loss": -6.340766906738281, "global_step": 110403, "epoch": 2628} {"train_loss": -6.353355407714844, "global_step": 110404, "epoch": 2628} {"train_loss": -6.314911842346191, "global_step": 110405, "epoch": 2628} {"train_loss": -6.506643295288086, "global_step": 110406, "epoch": 2628} {"train_loss": -6.337519645690918, "global_step": 110407, "epoch": 2628} {"train_loss": -6.4075775146484375, "global_step": 110408, "epoch": 2628} {"train_loss": -6.367929458618164, "global_step": 110409, "epoch": 2628} {"train_loss": -6.370657444000244, "global_step": 110410, "epoch": 2628} {"train_loss": -6.307572841644287, "global_step": 110411, "epoch": 2628} {"train_loss": -6.382770538330078, "global_step": 110412, "epoch": 2628} {"train_loss": -6.385715484619141, "global_step": 110413, "epoch": 2628} {"train_loss": -6.280814170837402, "global_step": 110414, "epoch": 2628} {"train_loss": -6.466764450073242, "global_step": 110415, "epoch": 2628} {"train_loss": -6.3436431884765625, "global_step": 110416, "epoch": 2628} {"train_loss": -6.421534050078619, "global_step": 110417, "epoch": 2628, "val_loss": 64932.09375} {"train_loss": -6.281552791595459, "global_step": 110418, "epoch": 2629} {"train_loss": -6.385196685791016, "global_step": 110419, "epoch": 2629} {"train_loss": -6.391869068145752, "global_step": 110420, "epoch": 2629} {"train_loss": -6.536460876464844, "global_step": 110421, "epoch": 2629} {"train_loss": -6.4228515625, "global_step": 110422, "epoch": 2629} {"train_loss": -6.478350639343262, "global_step": 110423, "epoch": 2629} {"train_loss": -6.51301383972168, "global_step": 110424, "epoch": 2629} {"train_loss": -6.4508819580078125, "global_step": 110425, "epoch": 2629} {"train_loss": -6.5058135986328125, "global_step": 110426, "epoch": 2629} {"train_loss": -6.427987098693848, "global_step": 110427, "epoch": 2629} {"train_loss": -6.401741027832031, "global_step": 110428, "epoch": 2629} {"train_loss": -6.494670391082764, "global_step": 110429, "epoch": 2629} {"train_loss": -6.412071228027344, "global_step": 110430, "epoch": 2629} {"train_loss": -6.363836288452148, "global_step": 110431, "epoch": 2629} {"train_loss": -6.444504261016846, "global_step": 110432, "epoch": 2629} {"train_loss": -6.375983238220215, "global_step": 110433, "epoch": 2629} {"train_loss": -6.4724836349487305, "global_step": 110434, "epoch": 2629} {"train_loss": -6.432466506958008, "global_step": 110435, "epoch": 2629} {"train_loss": -6.572682857513428, "global_step": 110436, "epoch": 2629} {"train_loss": -6.558403968811035, "global_step": 110437, "epoch": 2629} {"train_loss": -6.485350608825684, "global_step": 110438, "epoch": 2629} {"train_loss": -6.5157060623168945, "global_step": 110439, "epoch": 2629} {"train_loss": -6.47028112411499, "global_step": 110440, "epoch": 2629} {"train_loss": -6.382387638092041, "global_step": 110441, "epoch": 2629} {"train_loss": -6.4153056144714355, "global_step": 110442, "epoch": 2629} {"train_loss": -6.532950401306152, "global_step": 110443, "epoch": 2629} {"train_loss": -6.505936622619629, "global_step": 110444, "epoch": 2629} {"train_loss": -6.348609924316406, "global_step": 110445, "epoch": 2629} {"train_loss": -6.593849182128906, "global_step": 110446, "epoch": 2629} {"train_loss": -6.546780586242676, "global_step": 110447, "epoch": 2629} {"train_loss": -6.603282451629639, "global_step": 110448, "epoch": 2629} {"train_loss": -6.547916412353516, "global_step": 110449, "epoch": 2629} {"train_loss": -6.341438293457031, "global_step": 110450, "epoch": 2629} {"train_loss": -6.561221599578857, "global_step": 110451, "epoch": 2629} {"train_loss": -6.477026462554932, "global_step": 110452, "epoch": 2629} {"train_loss": -6.469883918762207, "global_step": 110453, "epoch": 2629} {"train_loss": -6.498993873596191, "global_step": 110454, "epoch": 2629} {"train_loss": -6.477664947509766, "global_step": 110455, "epoch": 2629} {"train_loss": -6.554774284362793, "global_step": 110456, "epoch": 2629} {"train_loss": -6.464597225189209, "global_step": 110457, "epoch": 2629} {"train_loss": -6.588421821594238, "global_step": 110458, "epoch": 2629} {"train_loss": -6.469184864135015, "global_step": 110459, "epoch": 2629, "val_loss": 65003.16015625} {"train_loss": -6.472655773162842, "global_step": 110460, "epoch": 2630} {"train_loss": -6.500244140625, "global_step": 110461, "epoch": 2630} {"train_loss": -6.592449188232422, "global_step": 110462, "epoch": 2630} {"train_loss": -6.584481239318848, "global_step": 110463, "epoch": 2630} {"train_loss": -6.566704273223877, "global_step": 110464, "epoch": 2630} {"train_loss": -6.604721546173096, "global_step": 110465, "epoch": 2630} {"train_loss": -6.465747356414795, "global_step": 110466, "epoch": 2630} {"train_loss": -6.49988317489624, "global_step": 110467, "epoch": 2630} {"train_loss": -6.52448844909668, "global_step": 110468, "epoch": 2630} {"train_loss": -6.516080856323242, "global_step": 110469, "epoch": 2630} {"train_loss": -6.5756635665893555, "global_step": 110470, "epoch": 2630} {"train_loss": -6.608978271484375, "global_step": 110471, "epoch": 2630} {"train_loss": -6.572509765625, "global_step": 110472, "epoch": 2630} {"train_loss": -6.5453386306762695, "global_step": 110473, "epoch": 2630} {"train_loss": -6.637964725494385, "global_step": 110474, "epoch": 2630} {"train_loss": -6.481123924255371, "global_step": 110475, "epoch": 2630} {"train_loss": -6.599428176879883, "global_step": 110476, "epoch": 2630} {"train_loss": -6.484938621520996, "global_step": 110477, "epoch": 2630} {"train_loss": -6.591169357299805, "global_step": 110478, "epoch": 2630} {"train_loss": -6.50921106338501, "global_step": 110479, "epoch": 2630} {"train_loss": -6.455214500427246, "global_step": 110480, "epoch": 2630} {"train_loss": -6.60451602935791, "global_step": 110481, "epoch": 2630} {"train_loss": -6.441705226898193, "global_step": 110482, "epoch": 2630} {"train_loss": -6.546082496643066, "global_step": 110483, "epoch": 2630} {"train_loss": -6.5021538734436035, "global_step": 110484, "epoch": 2630} {"train_loss": -6.568930625915527, "global_step": 110485, "epoch": 2630} {"train_loss": -6.5939621925354, "global_step": 110486, "epoch": 2630} {"train_loss": -6.527279376983643, "global_step": 110487, "epoch": 2630} {"train_loss": -6.446819305419922, "global_step": 110488, "epoch": 2630} {"train_loss": -6.569733619689941, "global_step": 110489, "epoch": 2630} {"train_loss": -6.593760013580322, "global_step": 110490, "epoch": 2630} {"train_loss": -6.340195655822754, "global_step": 110491, "epoch": 2630} {"train_loss": -6.47241735458374, "global_step": 110492, "epoch": 2630} {"train_loss": -6.568591117858887, "global_step": 110493, "epoch": 2630} {"train_loss": -6.47777795791626, "global_step": 110494, "epoch": 2630} {"train_loss": -6.531787872314453, "global_step": 110495, "epoch": 2630} {"train_loss": -6.531001567840576, "global_step": 110496, "epoch": 2630} {"train_loss": -6.466277122497559, "global_step": 110497, "epoch": 2630} {"train_loss": -6.470077037811279, "global_step": 110498, "epoch": 2630} {"train_loss": -6.483498573303223, "global_step": 110499, "epoch": 2630} {"train_loss": -6.508847713470459, "global_step": 110500, "epoch": 2630} {"train_loss": -6.530784436634609, "global_step": 110501, "epoch": 2630, "val_loss": 65133.60546875} {"train_loss": -6.379659175872803, "global_step": 110502, "epoch": 2631} {"train_loss": -6.409125328063965, "global_step": 110503, "epoch": 2631} {"train_loss": -6.526250839233398, "global_step": 110504, "epoch": 2631} {"train_loss": -6.482558250427246, "global_step": 110505, "epoch": 2631} {"train_loss": -6.554804801940918, "global_step": 110506, "epoch": 2631} {"train_loss": -6.537252426147461, "global_step": 110507, "epoch": 2631} {"train_loss": -6.535313129425049, "global_step": 110508, "epoch": 2631} {"train_loss": -6.479204177856445, "global_step": 110509, "epoch": 2631} {"train_loss": -6.5184712409973145, "global_step": 110510, "epoch": 2631} {"train_loss": -6.53419303894043, "global_step": 110511, "epoch": 2631} {"train_loss": -6.464851379394531, "global_step": 110512, "epoch": 2631} {"train_loss": -6.435708045959473, "global_step": 110513, "epoch": 2631} {"train_loss": -6.513836860656738, "global_step": 110514, "epoch": 2631} {"train_loss": -6.344812393188477, "global_step": 110515, "epoch": 2631} {"train_loss": -6.545924186706543, "global_step": 110516, "epoch": 2631} {"train_loss": -6.497404098510742, "global_step": 110517, "epoch": 2631} {"train_loss": -6.545546054840088, "global_step": 110518, "epoch": 2631} {"train_loss": -6.484748363494873, "global_step": 110519, "epoch": 2631} {"train_loss": -6.430893898010254, "global_step": 110520, "epoch": 2631} {"train_loss": -6.494992256164551, "global_step": 110521, "epoch": 2631} {"train_loss": -6.427539825439453, "global_step": 110522, "epoch": 2631} {"train_loss": -6.490644454956055, "global_step": 110523, "epoch": 2631} {"train_loss": -6.548827171325684, "global_step": 110524, "epoch": 2631} {"train_loss": -6.484355926513672, "global_step": 110525, "epoch": 2631} {"train_loss": -6.5069427490234375, "global_step": 110526, "epoch": 2631} {"train_loss": -6.555566787719727, "global_step": 110527, "epoch": 2631} {"train_loss": -6.386911392211914, "global_step": 110528, "epoch": 2631} {"train_loss": -6.595473289489746, "global_step": 110529, "epoch": 2631} {"train_loss": -6.461733818054199, "global_step": 110530, "epoch": 2631} {"train_loss": -6.618009567260742, "global_step": 110531, "epoch": 2631} {"train_loss": -6.646790504455566, "global_step": 110532, "epoch": 2631} {"train_loss": -6.542342185974121, "global_step": 110533, "epoch": 2631} {"train_loss": -6.554994583129883, "global_step": 110534, "epoch": 2631} {"train_loss": -6.500903129577637, "global_step": 110535, "epoch": 2631} {"train_loss": -6.510315418243408, "global_step": 110536, "epoch": 2631} {"train_loss": -6.362539291381836, "global_step": 110537, "epoch": 2631} {"train_loss": -6.396790504455566, "global_step": 110538, "epoch": 2631} {"train_loss": -6.554694175720215, "global_step": 110539, "epoch": 2631} {"train_loss": -6.497892379760742, "global_step": 110540, "epoch": 2631} {"train_loss": -6.465057373046875, "global_step": 110541, "epoch": 2631} {"train_loss": -6.528965950012207, "global_step": 110542, "epoch": 2631} {"train_loss": -6.496704532986596, "global_step": 110543, "epoch": 2631, "val_loss": 65179.046875} {"train_loss": -6.456467151641846, "global_step": 110544, "epoch": 2632} {"train_loss": -6.547024726867676, "global_step": 110545, "epoch": 2632} {"train_loss": -6.572133541107178, "global_step": 110546, "epoch": 2632} {"train_loss": -6.447824001312256, "global_step": 110547, "epoch": 2632} {"train_loss": -6.4267706871032715, "global_step": 110548, "epoch": 2632} {"train_loss": -6.532601833343506, "global_step": 110549, "epoch": 2632} {"train_loss": -6.422083377838135, "global_step": 110550, "epoch": 2632} {"train_loss": -6.529776573181152, "global_step": 110551, "epoch": 2632} {"train_loss": -6.47629451751709, "global_step": 110552, "epoch": 2632} {"train_loss": -6.519522190093994, "global_step": 110553, "epoch": 2632} {"train_loss": -6.476051330566406, "global_step": 110554, "epoch": 2632} {"train_loss": -6.472200393676758, "global_step": 110555, "epoch": 2632} {"train_loss": -6.477110385894775, "global_step": 110556, "epoch": 2632} {"train_loss": -6.414504051208496, "global_step": 110557, "epoch": 2632} {"train_loss": -6.565701961517334, "global_step": 110558, "epoch": 2632} {"train_loss": -6.529380798339844, "global_step": 110559, "epoch": 2632} {"train_loss": -6.368229866027832, "global_step": 110560, "epoch": 2632} {"train_loss": -6.483970642089844, "global_step": 110561, "epoch": 2632} {"train_loss": -6.33087158203125, "global_step": 110562, "epoch": 2632} {"train_loss": -6.346958160400391, "global_step": 110563, "epoch": 2632} {"train_loss": -6.483782768249512, "global_step": 110564, "epoch": 2632} {"train_loss": -6.396805286407471, "global_step": 110565, "epoch": 2632} {"train_loss": -6.344631195068359, "global_step": 110566, "epoch": 2632} {"train_loss": -6.523754596710205, "global_step": 110567, "epoch": 2632} {"train_loss": -6.473402500152588, "global_step": 110568, "epoch": 2632} {"train_loss": -6.4236321449279785, "global_step": 110569, "epoch": 2632} {"train_loss": -6.501059532165527, "global_step": 110570, "epoch": 2632} {"train_loss": -6.454308986663818, "global_step": 110571, "epoch": 2632} {"train_loss": -6.5115556716918945, "global_step": 110572, "epoch": 2632} {"train_loss": -6.467921257019043, "global_step": 110573, "epoch": 2632} {"train_loss": -6.432138442993164, "global_step": 110574, "epoch": 2632} {"train_loss": -6.4249043464660645, "global_step": 110575, "epoch": 2632} {"train_loss": -6.4292707443237305, "global_step": 110576, "epoch": 2632} {"train_loss": -6.462189197540283, "global_step": 110577, "epoch": 2632} {"train_loss": -6.375732421875, "global_step": 110578, "epoch": 2632} {"train_loss": -6.484745025634766, "global_step": 110579, "epoch": 2632} {"train_loss": -6.412583827972412, "global_step": 110580, "epoch": 2632} {"train_loss": -6.500983238220215, "global_step": 110581, "epoch": 2632} {"train_loss": -6.555539131164551, "global_step": 110582, "epoch": 2632} {"train_loss": -6.40020751953125, "global_step": 110583, "epoch": 2632} {"train_loss": -6.291427135467529, "global_step": 110584, "epoch": 2632} {"train_loss": -6.45759441739037, "global_step": 110585, "epoch": 2632, "val_loss": 65079.98046875} {"train_loss": -6.457191467285156, "global_step": 110586, "epoch": 2633} {"train_loss": -6.493830680847168, "global_step": 110587, "epoch": 2633} {"train_loss": -6.494032859802246, "global_step": 110588, "epoch": 2633} {"train_loss": -6.463178634643555, "global_step": 110589, "epoch": 2633} {"train_loss": -6.43044376373291, "global_step": 110590, "epoch": 2633} {"train_loss": -6.416377544403076, "global_step": 110591, "epoch": 2633} {"train_loss": -6.447169780731201, "global_step": 110592, "epoch": 2633} {"train_loss": -6.535880088806152, "global_step": 110593, "epoch": 2633} {"train_loss": -6.4361982345581055, "global_step": 110594, "epoch": 2633} {"train_loss": -6.417284965515137, "global_step": 110595, "epoch": 2633} {"train_loss": -6.465399742126465, "global_step": 110596, "epoch": 2633} {"train_loss": -6.545442581176758, "global_step": 110597, "epoch": 2633} {"train_loss": -6.416642665863037, "global_step": 110598, "epoch": 2633} {"train_loss": -6.403608322143555, "global_step": 110599, "epoch": 2633} {"train_loss": -6.450902938842773, "global_step": 110600, "epoch": 2633} {"train_loss": -6.552317142486572, "global_step": 110601, "epoch": 2633} {"train_loss": -6.5111589431762695, "global_step": 110602, "epoch": 2633} {"train_loss": -6.510173797607422, "global_step": 110603, "epoch": 2633} {"train_loss": -6.524812698364258, "global_step": 110604, "epoch": 2633} {"train_loss": -6.541813373565674, "global_step": 110605, "epoch": 2633} {"train_loss": -6.52391242980957, "global_step": 110606, "epoch": 2633} {"train_loss": -6.3972673416137695, "global_step": 110607, "epoch": 2633} {"train_loss": -6.5867109298706055, "global_step": 110608, "epoch": 2633} {"train_loss": -6.472524166107178, "global_step": 110609, "epoch": 2633} {"train_loss": -6.450963020324707, "global_step": 110610, "epoch": 2633} {"train_loss": -6.590077877044678, "global_step": 110611, "epoch": 2633} {"train_loss": -6.4092512130737305, "global_step": 110612, "epoch": 2633} {"train_loss": -6.49791955947876, "global_step": 110613, "epoch": 2633} {"train_loss": -6.391765117645264, "global_step": 110614, "epoch": 2633} {"train_loss": -6.478124141693115, "global_step": 110615, "epoch": 2633} {"train_loss": -6.475841522216797, "global_step": 110616, "epoch": 2633} {"train_loss": -6.430903434753418, "global_step": 110617, "epoch": 2633} {"train_loss": -6.509387016296387, "global_step": 110618, "epoch": 2633} {"train_loss": -6.576138973236084, "global_step": 110619, "epoch": 2633} {"train_loss": -6.504117965698242, "global_step": 110620, "epoch": 2633} {"train_loss": -6.4822235107421875, "global_step": 110621, "epoch": 2633} {"train_loss": -6.35260534286499, "global_step": 110622, "epoch": 2633} {"train_loss": -6.410572052001953, "global_step": 110623, "epoch": 2633} {"train_loss": -6.508669853210449, "global_step": 110624, "epoch": 2633} {"train_loss": -6.511108875274658, "global_step": 110625, "epoch": 2633} {"train_loss": -6.534798622131348, "global_step": 110626, "epoch": 2633} {"train_loss": -6.479210705984206, "global_step": 110627, "epoch": 2633, "val_loss": 65036.33203125} {"train_loss": -6.49700927734375, "global_step": 110628, "epoch": 2634} {"train_loss": -6.589850425720215, "global_step": 110629, "epoch": 2634} {"train_loss": -6.4671125411987305, "global_step": 110630, "epoch": 2634} {"train_loss": -6.455630779266357, "global_step": 110631, "epoch": 2634} {"train_loss": -6.543485641479492, "global_step": 110632, "epoch": 2634} {"train_loss": -6.533661842346191, "global_step": 110633, "epoch": 2634} {"train_loss": -6.5637006759643555, "global_step": 110634, "epoch": 2634} {"train_loss": -6.542422771453857, "global_step": 110635, "epoch": 2634} {"train_loss": -6.518443584442139, "global_step": 110636, "epoch": 2634} {"train_loss": -6.591630935668945, "global_step": 110637, "epoch": 2634} {"train_loss": -6.543123245239258, "global_step": 110638, "epoch": 2634} {"train_loss": -6.5111565589904785, "global_step": 110639, "epoch": 2634} {"train_loss": -6.486212730407715, "global_step": 110640, "epoch": 2634} {"train_loss": -6.553747177124023, "global_step": 110641, "epoch": 2634} {"train_loss": -6.524569511413574, "global_step": 110642, "epoch": 2634} {"train_loss": -6.401904106140137, "global_step": 110643, "epoch": 2634} {"train_loss": -6.470834255218506, "global_step": 110644, "epoch": 2634} {"train_loss": -6.516369819641113, "global_step": 110645, "epoch": 2634} {"train_loss": -6.4526472091674805, "global_step": 110646, "epoch": 2634} {"train_loss": -6.450748920440674, "global_step": 110647, "epoch": 2634} {"train_loss": -6.541650772094727, "global_step": 110648, "epoch": 2634} {"train_loss": -6.449270725250244, "global_step": 110649, "epoch": 2634} {"train_loss": -6.324814796447754, "global_step": 110650, "epoch": 2634} {"train_loss": -6.415435791015625, "global_step": 110651, "epoch": 2634} {"train_loss": -6.47805643081665, "global_step": 110652, "epoch": 2634} {"train_loss": -6.352010726928711, "global_step": 110653, "epoch": 2634} {"train_loss": -6.520109176635742, "global_step": 110654, "epoch": 2634} {"train_loss": -6.366333484649658, "global_step": 110655, "epoch": 2634} {"train_loss": -6.528756141662598, "global_step": 110656, "epoch": 2634} {"train_loss": -6.429146766662598, "global_step": 110657, "epoch": 2634} {"train_loss": -6.5458173751831055, "global_step": 110658, "epoch": 2634} {"train_loss": -6.376614093780518, "global_step": 110659, "epoch": 2634} {"train_loss": -6.506801128387451, "global_step": 110660, "epoch": 2634} {"train_loss": -6.430600166320801, "global_step": 110661, "epoch": 2634} {"train_loss": -6.4713239669799805, "global_step": 110662, "epoch": 2634} {"train_loss": -6.493011474609375, "global_step": 110663, "epoch": 2634} {"train_loss": -6.495218276977539, "global_step": 110664, "epoch": 2634} {"train_loss": -6.443554878234863, "global_step": 110665, "epoch": 2634} {"train_loss": -6.574502944946289, "global_step": 110666, "epoch": 2634} {"train_loss": -6.376772403717041, "global_step": 110667, "epoch": 2634} {"train_loss": -6.551313400268555, "global_step": 110668, "epoch": 2634} {"train_loss": -6.48318946929205, "global_step": 110669, "epoch": 2634, "val_loss": 64823.16015625} {"train_loss": -6.486870765686035, "global_step": 110670, "epoch": 2635} {"train_loss": -6.4907331466674805, "global_step": 110671, "epoch": 2635} {"train_loss": -6.52195930480957, "global_step": 110672, "epoch": 2635} {"train_loss": -6.447998523712158, "global_step": 110673, "epoch": 2635} {"train_loss": -6.364076614379883, "global_step": 110674, "epoch": 2635} {"train_loss": -6.550950527191162, "global_step": 110675, "epoch": 2635} {"train_loss": -6.447568416595459, "global_step": 110676, "epoch": 2635} {"train_loss": -6.400860786437988, "global_step": 110677, "epoch": 2635} {"train_loss": -6.423539638519287, "global_step": 110678, "epoch": 2635} {"train_loss": -6.535399913787842, "global_step": 110679, "epoch": 2635} {"train_loss": -6.422712326049805, "global_step": 110680, "epoch": 2635} {"train_loss": -6.450830459594727, "global_step": 110681, "epoch": 2635} {"train_loss": -6.498255729675293, "global_step": 110682, "epoch": 2635} {"train_loss": -6.33827018737793, "global_step": 110683, "epoch": 2635} {"train_loss": -6.390274524688721, "global_step": 110684, "epoch": 2635} {"train_loss": -6.387991905212402, "global_step": 110685, "epoch": 2635} {"train_loss": -6.544492721557617, "global_step": 110686, "epoch": 2635} {"train_loss": -6.417757511138916, "global_step": 110687, "epoch": 2635} {"train_loss": -6.539304733276367, "global_step": 110688, "epoch": 2635} {"train_loss": -6.481215476989746, "global_step": 110689, "epoch": 2635} {"train_loss": -6.481092929840088, "global_step": 110690, "epoch": 2635} {"train_loss": -6.52023983001709, "global_step": 110691, "epoch": 2635} {"train_loss": -6.576974868774414, "global_step": 110692, "epoch": 2635} {"train_loss": -6.478642463684082, "global_step": 110693, "epoch": 2635} {"train_loss": -6.2980875968933105, "global_step": 110694, "epoch": 2635} {"train_loss": -6.502073287963867, "global_step": 110695, "epoch": 2635} {"train_loss": -6.495863914489746, "global_step": 110696, "epoch": 2635} {"train_loss": -6.559286117553711, "global_step": 110697, "epoch": 2635} {"train_loss": -6.5505781173706055, "global_step": 110698, "epoch": 2635} {"train_loss": -6.397833824157715, "global_step": 110699, "epoch": 2635} {"train_loss": -6.439321041107178, "global_step": 110700, "epoch": 2635} {"train_loss": -6.331975936889648, "global_step": 110701, "epoch": 2635} {"train_loss": -6.473143577575684, "global_step": 110702, "epoch": 2635} {"train_loss": -6.459822177886963, "global_step": 110703, "epoch": 2635} {"train_loss": -6.50274133682251, "global_step": 110704, "epoch": 2635} {"train_loss": -6.458215713500977, "global_step": 110705, "epoch": 2635} {"train_loss": -6.398721218109131, "global_step": 110706, "epoch": 2635} {"train_loss": -6.488445281982422, "global_step": 110707, "epoch": 2635} {"train_loss": -6.445882320404053, "global_step": 110708, "epoch": 2635} {"train_loss": -6.483360290527344, "global_step": 110709, "epoch": 2635} {"train_loss": -6.457169532775879, "global_step": 110710, "epoch": 2635} {"train_loss": -6.4609925746917725, "global_step": 110711, "epoch": 2635, "val_loss": 65036.65625} {"train_loss": -6.510526657104492, "global_step": 110712, "epoch": 2636} {"train_loss": -6.46120548248291, "global_step": 110713, "epoch": 2636} {"train_loss": -6.471014976501465, "global_step": 110714, "epoch": 2636} {"train_loss": -6.41770076751709, "global_step": 110715, "epoch": 2636} {"train_loss": -6.3935160636901855, "global_step": 110716, "epoch": 2636} {"train_loss": -6.456018924713135, "global_step": 110717, "epoch": 2636} {"train_loss": -6.4661455154418945, "global_step": 110718, "epoch": 2636} {"train_loss": -6.445215702056885, "global_step": 110719, "epoch": 2636} {"train_loss": -6.538480281829834, "global_step": 110720, "epoch": 2636} {"train_loss": -6.424471855163574, "global_step": 110721, "epoch": 2636} {"train_loss": -6.446556091308594, "global_step": 110722, "epoch": 2636} {"train_loss": -6.4169158935546875, "global_step": 110723, "epoch": 2636} {"train_loss": -6.539175033569336, "global_step": 110724, "epoch": 2636} {"train_loss": -6.441596031188965, "global_step": 110725, "epoch": 2636} {"train_loss": -6.463170528411865, "global_step": 110726, "epoch": 2636} {"train_loss": -6.48998498916626, "global_step": 110727, "epoch": 2636} {"train_loss": -6.431849956512451, "global_step": 110728, "epoch": 2636} {"train_loss": -6.594335556030273, "global_step": 110729, "epoch": 2636} {"train_loss": -6.503996849060059, "global_step": 110730, "epoch": 2636} {"train_loss": -6.3775787353515625, "global_step": 110731, "epoch": 2636} {"train_loss": -6.436522960662842, "global_step": 110732, "epoch": 2636} {"train_loss": -6.360012054443359, "global_step": 110733, "epoch": 2636} {"train_loss": -6.450375556945801, "global_step": 110734, "epoch": 2636} {"train_loss": -6.453667640686035, "global_step": 110735, "epoch": 2636} {"train_loss": -6.390669822692871, "global_step": 110736, "epoch": 2636} {"train_loss": -6.522487640380859, "global_step": 110737, "epoch": 2636} {"train_loss": -6.524347305297852, "global_step": 110738, "epoch": 2636} {"train_loss": -6.547133445739746, "global_step": 110739, "epoch": 2636} {"train_loss": -6.488253593444824, "global_step": 110740, "epoch": 2636} {"train_loss": -6.359029769897461, "global_step": 110741, "epoch": 2636} {"train_loss": -6.554513931274414, "global_step": 110742, "epoch": 2636} {"train_loss": -6.482444763183594, "global_step": 110743, "epoch": 2636} {"train_loss": -6.418427467346191, "global_step": 110744, "epoch": 2636} {"train_loss": -6.460517883300781, "global_step": 110745, "epoch": 2636} {"train_loss": -6.48846960067749, "global_step": 110746, "epoch": 2636} {"train_loss": -6.473971366882324, "global_step": 110747, "epoch": 2636} {"train_loss": -6.431826114654541, "global_step": 110748, "epoch": 2636} {"train_loss": -6.414595603942871, "global_step": 110749, "epoch": 2636} {"train_loss": -6.442229270935059, "global_step": 110750, "epoch": 2636} {"train_loss": -6.557167053222656, "global_step": 110751, "epoch": 2636} {"train_loss": -6.52543306350708, "global_step": 110752, "epoch": 2636} {"train_loss": -6.463327657608759, "global_step": 110753, "epoch": 2636, "val_loss": 65109.80078125} {"train_loss": -6.461393356323242, "global_step": 110754, "epoch": 2637} {"train_loss": -6.469606399536133, "global_step": 110755, "epoch": 2637} {"train_loss": -6.396655082702637, "global_step": 110756, "epoch": 2637} {"train_loss": -6.445614337921143, "global_step": 110757, "epoch": 2637} {"train_loss": -6.520643711090088, "global_step": 110758, "epoch": 2637} {"train_loss": -6.413195610046387, "global_step": 110759, "epoch": 2637} {"train_loss": -6.46869421005249, "global_step": 110760, "epoch": 2637} {"train_loss": -6.4095354080200195, "global_step": 110761, "epoch": 2637} {"train_loss": -6.330344200134277, "global_step": 110762, "epoch": 2637} {"train_loss": -6.378641128540039, "global_step": 110763, "epoch": 2637} {"train_loss": -6.485867977142334, "global_step": 110764, "epoch": 2637} {"train_loss": -6.5118889808654785, "global_step": 110765, "epoch": 2637} {"train_loss": -6.534036636352539, "global_step": 110766, "epoch": 2637} {"train_loss": -6.633565902709961, "global_step": 110767, "epoch": 2637} {"train_loss": -6.5055036544799805, "global_step": 110768, "epoch": 2637} {"train_loss": -6.468321800231934, "global_step": 110769, "epoch": 2637} {"train_loss": -6.517843246459961, "global_step": 110770, "epoch": 2637} {"train_loss": -6.411888122558594, "global_step": 110771, "epoch": 2637} {"train_loss": -6.528289318084717, "global_step": 110772, "epoch": 2637} {"train_loss": -6.62984561920166, "global_step": 110773, "epoch": 2637} {"train_loss": -6.576937198638916, "global_step": 110774, "epoch": 2637} {"train_loss": -6.537133693695068, "global_step": 110775, "epoch": 2637} {"train_loss": -6.5752997398376465, "global_step": 110776, "epoch": 2637} {"train_loss": -6.524242401123047, "global_step": 110777, "epoch": 2637} {"train_loss": -6.406943321228027, "global_step": 110778, "epoch": 2637} {"train_loss": -6.565398693084717, "global_step": 110779, "epoch": 2637} {"train_loss": -6.478072166442871, "global_step": 110780, "epoch": 2637} {"train_loss": -6.469603538513184, "global_step": 110781, "epoch": 2637} {"train_loss": -6.433211326599121, "global_step": 110782, "epoch": 2637} {"train_loss": -6.48577880859375, "global_step": 110783, "epoch": 2637} {"train_loss": -6.573047637939453, "global_step": 110784, "epoch": 2637} {"train_loss": -6.457772254943848, "global_step": 110785, "epoch": 2637} {"train_loss": -6.544492244720459, "global_step": 110786, "epoch": 2637} {"train_loss": -6.469745635986328, "global_step": 110787, "epoch": 2637} {"train_loss": -6.193320274353027, "global_step": 110788, "epoch": 2637} {"train_loss": -6.45207405090332, "global_step": 110789, "epoch": 2637} {"train_loss": -6.405708312988281, "global_step": 110790, "epoch": 2637} {"train_loss": -6.356328964233398, "global_step": 110791, "epoch": 2637} {"train_loss": -6.484867095947266, "global_step": 110792, "epoch": 2637} {"train_loss": -6.531375408172607, "global_step": 110793, "epoch": 2637} {"train_loss": -6.529600143432617, "global_step": 110794, "epoch": 2637} {"train_loss": -6.477803627649943, "global_step": 110795, "epoch": 2637, "val_loss": 64994.90234375} {"train_loss": -6.495785713195801, "global_step": 110796, "epoch": 2638} {"train_loss": -6.582470893859863, "global_step": 110797, "epoch": 2638} {"train_loss": -6.541559219360352, "global_step": 110798, "epoch": 2638} {"train_loss": -6.502419471740723, "global_step": 110799, "epoch": 2638} {"train_loss": -6.515204429626465, "global_step": 110800, "epoch": 2638} {"train_loss": -6.5856170654296875, "global_step": 110801, "epoch": 2638} {"train_loss": -6.553552627563477, "global_step": 110802, "epoch": 2638} {"train_loss": -6.555653095245361, "global_step": 110803, "epoch": 2638} {"train_loss": -6.624004364013672, "global_step": 110804, "epoch": 2638} {"train_loss": -6.491981506347656, "global_step": 110805, "epoch": 2638} {"train_loss": -6.462165832519531, "global_step": 110806, "epoch": 2638} {"train_loss": -6.481573581695557, "global_step": 110807, "epoch": 2638} {"train_loss": -6.422231674194336, "global_step": 110808, "epoch": 2638} {"train_loss": -6.519322395324707, "global_step": 110809, "epoch": 2638} {"train_loss": -6.518914222717285, "global_step": 110810, "epoch": 2638} {"train_loss": -6.481876373291016, "global_step": 110811, "epoch": 2638} {"train_loss": -6.491943836212158, "global_step": 110812, "epoch": 2638} {"train_loss": -6.376491546630859, "global_step": 110813, "epoch": 2638} {"train_loss": -6.642867088317871, "global_step": 110814, "epoch": 2638} {"train_loss": -6.534458160400391, "global_step": 110815, "epoch": 2638} {"train_loss": -6.375284194946289, "global_step": 110816, "epoch": 2638} {"train_loss": -6.603395462036133, "global_step": 110817, "epoch": 2638} {"train_loss": -6.5483293533325195, "global_step": 110818, "epoch": 2638} {"train_loss": -6.51466178894043, "global_step": 110819, "epoch": 2638} {"train_loss": -6.492955684661865, "global_step": 110820, "epoch": 2638} {"train_loss": -6.491698265075684, "global_step": 110821, "epoch": 2638} {"train_loss": -6.378549575805664, "global_step": 110822, "epoch": 2638} {"train_loss": -6.412529945373535, "global_step": 110823, "epoch": 2638} {"train_loss": -6.450572967529297, "global_step": 110824, "epoch": 2638} {"train_loss": -6.384448528289795, "global_step": 110825, "epoch": 2638} {"train_loss": -6.449094772338867, "global_step": 110826, "epoch": 2638} {"train_loss": -6.547560214996338, "global_step": 110827, "epoch": 2638} {"train_loss": -6.447840690612793, "global_step": 110828, "epoch": 2638} {"train_loss": -6.366055011749268, "global_step": 110829, "epoch": 2638} {"train_loss": -6.580611228942871, "global_step": 110830, "epoch": 2638} {"train_loss": -6.441642761230469, "global_step": 110831, "epoch": 2638} {"train_loss": -6.464205741882324, "global_step": 110832, "epoch": 2638} {"train_loss": -6.562224388122559, "global_step": 110833, "epoch": 2638} {"train_loss": -6.461350440979004, "global_step": 110834, "epoch": 2638} {"train_loss": -6.294404029846191, "global_step": 110835, "epoch": 2638} {"train_loss": -6.490766525268555, "global_step": 110836, "epoch": 2638} {"train_loss": -6.488489241827102, "global_step": 110837, "epoch": 2638, "val_loss": 64979.54296875} {"train_loss": -6.27633810043335, "global_step": 110838, "epoch": 2639} {"train_loss": -6.519301414489746, "global_step": 110839, "epoch": 2639} {"train_loss": -6.390886306762695, "global_step": 110840, "epoch": 2639} {"train_loss": -6.468799591064453, "global_step": 110841, "epoch": 2639} {"train_loss": -6.478156089782715, "global_step": 110842, "epoch": 2639} {"train_loss": -6.598047256469727, "global_step": 110843, "epoch": 2639} {"train_loss": -6.508711814880371, "global_step": 110844, "epoch": 2639} {"train_loss": -6.459966659545898, "global_step": 110845, "epoch": 2639} {"train_loss": -6.566544532775879, "global_step": 110846, "epoch": 2639} {"train_loss": -6.44670295715332, "global_step": 110847, "epoch": 2639} {"train_loss": -6.559708118438721, "global_step": 110848, "epoch": 2639} {"train_loss": -6.602518558502197, "global_step": 110849, "epoch": 2639} {"train_loss": -6.4380035400390625, "global_step": 110850, "epoch": 2639} {"train_loss": -6.5275750160217285, "global_step": 110851, "epoch": 2639} {"train_loss": -6.37966251373291, "global_step": 110852, "epoch": 2639} {"train_loss": -6.470216274261475, "global_step": 110853, "epoch": 2639} {"train_loss": -6.512617111206055, "global_step": 110854, "epoch": 2639} {"train_loss": -6.40103816986084, "global_step": 110855, "epoch": 2639} {"train_loss": -6.4640302658081055, "global_step": 110856, "epoch": 2639} {"train_loss": -6.475134372711182, "global_step": 110857, "epoch": 2639} {"train_loss": -6.406994342803955, "global_step": 110858, "epoch": 2639} {"train_loss": -6.570539474487305, "global_step": 110859, "epoch": 2639} {"train_loss": -6.517568111419678, "global_step": 110860, "epoch": 2639} {"train_loss": -6.469719409942627, "global_step": 110861, "epoch": 2639} {"train_loss": -6.544055461883545, "global_step": 110862, "epoch": 2639} {"train_loss": -6.475951194763184, "global_step": 110863, "epoch": 2639} {"train_loss": -6.42214822769165, "global_step": 110864, "epoch": 2639} {"train_loss": -6.413712978363037, "global_step": 110865, "epoch": 2639} {"train_loss": -6.439123153686523, "global_step": 110866, "epoch": 2639} {"train_loss": -6.566860198974609, "global_step": 110867, "epoch": 2639} {"train_loss": -6.411625862121582, "global_step": 110868, "epoch": 2639} {"train_loss": -6.503261089324951, "global_step": 110869, "epoch": 2639} {"train_loss": -6.4852800369262695, "global_step": 110870, "epoch": 2639} {"train_loss": -6.508566856384277, "global_step": 110871, "epoch": 2639} {"train_loss": -6.520076751708984, "global_step": 110872, "epoch": 2639} {"train_loss": -6.348464012145996, "global_step": 110873, "epoch": 2639} {"train_loss": -6.5810394287109375, "global_step": 110874, "epoch": 2639} {"train_loss": -6.473269939422607, "global_step": 110875, "epoch": 2639} {"train_loss": -6.550683498382568, "global_step": 110876, "epoch": 2639} {"train_loss": -6.522903919219971, "global_step": 110877, "epoch": 2639} {"train_loss": -6.491174221038818, "global_step": 110878, "epoch": 2639} {"train_loss": -6.483603046053932, "global_step": 110879, "epoch": 2639, "val_loss": 65090.56640625} {"train_loss": -6.603510856628418, "global_step": 110880, "epoch": 2640} {"train_loss": -6.540976047515869, "global_step": 110881, "epoch": 2640} {"train_loss": -6.570683479309082, "global_step": 110882, "epoch": 2640} {"train_loss": -6.5329670906066895, "global_step": 110883, "epoch": 2640} {"train_loss": -6.480799674987793, "global_step": 110884, "epoch": 2640} {"train_loss": -6.58595085144043, "global_step": 110885, "epoch": 2640} {"train_loss": -6.522334575653076, "global_step": 110886, "epoch": 2640} {"train_loss": -6.490592956542969, "global_step": 110887, "epoch": 2640} {"train_loss": -6.552037715911865, "global_step": 110888, "epoch": 2640} {"train_loss": -6.34886360168457, "global_step": 110889, "epoch": 2640} {"train_loss": -6.567818641662598, "global_step": 110890, "epoch": 2640} {"train_loss": -6.48000955581665, "global_step": 110891, "epoch": 2640} {"train_loss": -6.3746232986450195, "global_step": 110892, "epoch": 2640} {"train_loss": -6.4799909591674805, "global_step": 110893, "epoch": 2640} {"train_loss": -6.526650428771973, "global_step": 110894, "epoch": 2640} {"train_loss": -6.3969926834106445, "global_step": 110895, "epoch": 2640} {"train_loss": -6.4228339195251465, "global_step": 110896, "epoch": 2640} {"train_loss": -6.443326473236084, "global_step": 110897, "epoch": 2640} {"train_loss": -6.516368865966797, "global_step": 110898, "epoch": 2640} {"train_loss": -6.509222984313965, "global_step": 110899, "epoch": 2640} {"train_loss": -6.495347023010254, "global_step": 110900, "epoch": 2640} {"train_loss": -6.473174095153809, "global_step": 110901, "epoch": 2640} {"train_loss": -6.503447532653809, "global_step": 110902, "epoch": 2640} {"train_loss": -6.491434097290039, "global_step": 110903, "epoch": 2640} {"train_loss": -6.388751029968262, "global_step": 110904, "epoch": 2640} {"train_loss": -6.46293830871582, "global_step": 110905, "epoch": 2640} {"train_loss": -6.573760509490967, "global_step": 110906, "epoch": 2640} {"train_loss": -6.459140777587891, "global_step": 110907, "epoch": 2640} {"train_loss": -6.500072956085205, "global_step": 110908, "epoch": 2640} {"train_loss": -6.51918363571167, "global_step": 110909, "epoch": 2640} {"train_loss": -6.413418769836426, "global_step": 110910, "epoch": 2640} {"train_loss": -6.484053611755371, "global_step": 110911, "epoch": 2640} {"train_loss": -6.552696704864502, "global_step": 110912, "epoch": 2640} {"train_loss": -6.496494293212891, "global_step": 110913, "epoch": 2640} {"train_loss": -6.476680278778076, "global_step": 110914, "epoch": 2640} {"train_loss": -6.508805751800537, "global_step": 110915, "epoch": 2640} {"train_loss": -6.433464050292969, "global_step": 110916, "epoch": 2640} {"train_loss": -6.415038585662842, "global_step": 110917, "epoch": 2640} {"train_loss": -6.565950870513916, "global_step": 110918, "epoch": 2640} {"train_loss": -6.514415740966797, "global_step": 110919, "epoch": 2640} {"train_loss": -6.266945838928223, "global_step": 110920, "epoch": 2640} {"train_loss": -6.487391517275856, "global_step": 110921, "epoch": 2640, "val_loss": 64933.7421875} {"train_loss": -6.598362922668457, "global_step": 110922, "epoch": 2641} {"train_loss": -6.469742298126221, "global_step": 110923, "epoch": 2641} {"train_loss": -6.592525482177734, "global_step": 110924, "epoch": 2641} {"train_loss": -6.422151565551758, "global_step": 110925, "epoch": 2641} {"train_loss": -6.420839309692383, "global_step": 110926, "epoch": 2641} {"train_loss": -6.559810638427734, "global_step": 110927, "epoch": 2641} {"train_loss": -6.435116291046143, "global_step": 110928, "epoch": 2641} {"train_loss": -6.526025772094727, "global_step": 110929, "epoch": 2641} {"train_loss": -6.416520118713379, "global_step": 110930, "epoch": 2641} {"train_loss": -6.480228424072266, "global_step": 110931, "epoch": 2641} {"train_loss": -6.479880332946777, "global_step": 110932, "epoch": 2641} {"train_loss": -6.554986000061035, "global_step": 110933, "epoch": 2641} {"train_loss": -6.468448638916016, "global_step": 110934, "epoch": 2641} {"train_loss": -6.604218482971191, "global_step": 110935, "epoch": 2641} {"train_loss": -6.555758953094482, "global_step": 110936, "epoch": 2641} {"train_loss": -6.461195945739746, "global_step": 110937, "epoch": 2641} {"train_loss": -6.36431884765625, "global_step": 110938, "epoch": 2641} {"train_loss": -6.567686080932617, "global_step": 110939, "epoch": 2641} {"train_loss": -6.4209136962890625, "global_step": 110940, "epoch": 2641} {"train_loss": -6.391471862792969, "global_step": 110941, "epoch": 2641} {"train_loss": -6.443626880645752, "global_step": 110942, "epoch": 2641} {"train_loss": -6.3444013595581055, "global_step": 110943, "epoch": 2641} {"train_loss": -6.450773239135742, "global_step": 110944, "epoch": 2641} {"train_loss": -6.456249713897705, "global_step": 110945, "epoch": 2641} {"train_loss": -6.465878486633301, "global_step": 110946, "epoch": 2641} {"train_loss": -6.5774335861206055, "global_step": 110947, "epoch": 2641} {"train_loss": -6.544595718383789, "global_step": 110948, "epoch": 2641} {"train_loss": -6.572470664978027, "global_step": 110949, "epoch": 2641} {"train_loss": -6.469348907470703, "global_step": 110950, "epoch": 2641} {"train_loss": -6.527056694030762, "global_step": 110951, "epoch": 2641} {"train_loss": -6.583550453186035, "global_step": 110952, "epoch": 2641} {"train_loss": -6.434321403503418, "global_step": 110953, "epoch": 2641} {"train_loss": -6.581682205200195, "global_step": 110954, "epoch": 2641} {"train_loss": -6.553955554962158, "global_step": 110955, "epoch": 2641} {"train_loss": -6.449216365814209, "global_step": 110956, "epoch": 2641} {"train_loss": -6.518469333648682, "global_step": 110957, "epoch": 2641} {"train_loss": -6.533907890319824, "global_step": 110958, "epoch": 2641} {"train_loss": -6.472731590270996, "global_step": 110959, "epoch": 2641} {"train_loss": -6.4696736335754395, "global_step": 110960, "epoch": 2641} {"train_loss": -6.591596603393555, "global_step": 110961, "epoch": 2641} {"train_loss": -6.482420921325684, "global_step": 110962, "epoch": 2641} {"train_loss": -6.497648012070429, "global_step": 110963, "epoch": 2641, "val_loss": 65084.4609375} {"train_loss": -6.488018989562988, "global_step": 110964, "epoch": 2642} {"train_loss": -6.536300182342529, "global_step": 110965, "epoch": 2642} {"train_loss": -6.583017349243164, "global_step": 110966, "epoch": 2642} {"train_loss": -6.490549087524414, "global_step": 110967, "epoch": 2642} {"train_loss": -6.665702819824219, "global_step": 110968, "epoch": 2642} {"train_loss": -6.540002346038818, "global_step": 110969, "epoch": 2642} {"train_loss": -6.4849162101745605, "global_step": 110970, "epoch": 2642} {"train_loss": -6.514078617095947, "global_step": 110971, "epoch": 2642} {"train_loss": -6.619651794433594, "global_step": 110972, "epoch": 2642} {"train_loss": -6.379978179931641, "global_step": 110973, "epoch": 2642} {"train_loss": -6.313637733459473, "global_step": 110974, "epoch": 2642} {"train_loss": -6.520462989807129, "global_step": 110975, "epoch": 2642} {"train_loss": -6.439069747924805, "global_step": 110976, "epoch": 2642} {"train_loss": -6.550528049468994, "global_step": 110977, "epoch": 2642} {"train_loss": -6.589742183685303, "global_step": 110978, "epoch": 2642} {"train_loss": -6.526066780090332, "global_step": 110979, "epoch": 2642} {"train_loss": -6.608311653137207, "global_step": 110980, "epoch": 2642} {"train_loss": -6.5209808349609375, "global_step": 110981, "epoch": 2642} {"train_loss": -6.466591835021973, "global_step": 110982, "epoch": 2642} {"train_loss": -6.5758867263793945, "global_step": 110983, "epoch": 2642} {"train_loss": -6.555471420288086, "global_step": 110984, "epoch": 2642} {"train_loss": -6.461450099945068, "global_step": 110985, "epoch": 2642} {"train_loss": -6.566807746887207, "global_step": 110986, "epoch": 2642} {"train_loss": -6.431084632873535, "global_step": 110987, "epoch": 2642} {"train_loss": -6.457530975341797, "global_step": 110988, "epoch": 2642} {"train_loss": -6.517327308654785, "global_step": 110989, "epoch": 2642} {"train_loss": -6.570436000823975, "global_step": 110990, "epoch": 2642} {"train_loss": -6.557321548461914, "global_step": 110991, "epoch": 2642} {"train_loss": -6.543766021728516, "global_step": 110992, "epoch": 2642} {"train_loss": -6.56983757019043, "global_step": 110993, "epoch": 2642} {"train_loss": -6.462479114532471, "global_step": 110994, "epoch": 2642} {"train_loss": -6.521384239196777, "global_step": 110995, "epoch": 2642} {"train_loss": -6.422018051147461, "global_step": 110996, "epoch": 2642} {"train_loss": -6.401134490966797, "global_step": 110997, "epoch": 2642} {"train_loss": -6.48916482925415, "global_step": 110998, "epoch": 2642} {"train_loss": -6.455140113830566, "global_step": 110999, "epoch": 2642} {"train_loss": -6.572760581970215, "global_step": 111000, "epoch": 2642} {"train_loss": -6.421706199645996, "global_step": 111001, "epoch": 2642} {"train_loss": -6.4991865158081055, "global_step": 111002, "epoch": 2642} {"train_loss": -6.44561767578125, "global_step": 111003, "epoch": 2642} {"train_loss": -6.457469463348389, "global_step": 111004, "epoch": 2642} {"train_loss": -6.504500775110154, "global_step": 111005, "epoch": 2642, "val_loss": 64985.60546875} {"train_loss": -6.5055389404296875, "global_step": 111006, "epoch": 2643} {"train_loss": -6.566545009613037, "global_step": 111007, "epoch": 2643} {"train_loss": -6.415035247802734, "global_step": 111008, "epoch": 2643} {"train_loss": -6.5402913093566895, "global_step": 111009, "epoch": 2643} {"train_loss": -6.480025768280029, "global_step": 111010, "epoch": 2643} {"train_loss": -6.432958602905273, "global_step": 111011, "epoch": 2643} {"train_loss": -6.46844482421875, "global_step": 111012, "epoch": 2643} {"train_loss": -6.55719518661499, "global_step": 111013, "epoch": 2643} {"train_loss": -6.499841690063477, "global_step": 111014, "epoch": 2643} {"train_loss": -6.422639846801758, "global_step": 111015, "epoch": 2643} {"train_loss": -6.525168418884277, "global_step": 111016, "epoch": 2643} {"train_loss": -6.514797687530518, "global_step": 111017, "epoch": 2643} {"train_loss": -6.566139221191406, "global_step": 111018, "epoch": 2643} {"train_loss": -6.517688751220703, "global_step": 111019, "epoch": 2643} {"train_loss": -6.558310508728027, "global_step": 111020, "epoch": 2643} {"train_loss": -6.460348129272461, "global_step": 111021, "epoch": 2643} {"train_loss": -6.559952735900879, "global_step": 111022, "epoch": 2643} {"train_loss": -6.515941619873047, "global_step": 111023, "epoch": 2643} {"train_loss": -6.429274559020996, "global_step": 111024, "epoch": 2643} {"train_loss": -6.4589972496032715, "global_step": 111025, "epoch": 2643} {"train_loss": -6.442483901977539, "global_step": 111026, "epoch": 2643} {"train_loss": -6.409297466278076, "global_step": 111027, "epoch": 2643} {"train_loss": -6.413751125335693, "global_step": 111028, "epoch": 2643} {"train_loss": -6.422496318817139, "global_step": 111029, "epoch": 2643} {"train_loss": -6.436850547790527, "global_step": 111030, "epoch": 2643} {"train_loss": -6.544408798217773, "global_step": 111031, "epoch": 2643} {"train_loss": -6.390978813171387, "global_step": 111032, "epoch": 2643} {"train_loss": -6.315918445587158, "global_step": 111033, "epoch": 2643} {"train_loss": -6.310184478759766, "global_step": 111034, "epoch": 2643} {"train_loss": -6.429176330566406, "global_step": 111035, "epoch": 2643} {"train_loss": -6.4532341957092285, "global_step": 111036, "epoch": 2643} {"train_loss": -6.480799674987793, "global_step": 111037, "epoch": 2643} {"train_loss": -6.377521514892578, "global_step": 111038, "epoch": 2643} {"train_loss": -6.529899597167969, "global_step": 111039, "epoch": 2643} {"train_loss": -6.419430732727051, "global_step": 111040, "epoch": 2643} {"train_loss": -6.302959442138672, "global_step": 111041, "epoch": 2643} {"train_loss": -6.392314910888672, "global_step": 111042, "epoch": 2643} {"train_loss": -6.404631614685059, "global_step": 111043, "epoch": 2643} {"train_loss": -6.465212821960449, "global_step": 111044, "epoch": 2643} {"train_loss": -6.413705825805664, "global_step": 111045, "epoch": 2643} {"train_loss": -6.347990989685059, "global_step": 111046, "epoch": 2643} {"train_loss": -6.455391338893345, "global_step": 111047, "epoch": 2643, "val_loss": 65201.8046875} {"train_loss": -6.450946807861328, "global_step": 111048, "epoch": 2644} {"train_loss": -6.411159515380859, "global_step": 111049, "epoch": 2644} {"train_loss": -6.437062740325928, "global_step": 111050, "epoch": 2644} {"train_loss": -6.542565822601318, "global_step": 111051, "epoch": 2644} {"train_loss": -6.559073448181152, "global_step": 111052, "epoch": 2644} {"train_loss": -6.457866191864014, "global_step": 111053, "epoch": 2644} {"train_loss": -6.361366271972656, "global_step": 111054, "epoch": 2644} {"train_loss": -6.462468147277832, "global_step": 111055, "epoch": 2644} {"train_loss": -6.4574432373046875, "global_step": 111056, "epoch": 2644} {"train_loss": -6.5443644523620605, "global_step": 111057, "epoch": 2644} {"train_loss": -6.510315895080566, "global_step": 111058, "epoch": 2644} {"train_loss": -6.4240007400512695, "global_step": 111059, "epoch": 2644} {"train_loss": -6.550504207611084, "global_step": 111060, "epoch": 2644} {"train_loss": -6.559514045715332, "global_step": 111061, "epoch": 2644} {"train_loss": -6.499667167663574, "global_step": 111062, "epoch": 2644} {"train_loss": -6.611968517303467, "global_step": 111063, "epoch": 2644} {"train_loss": -6.540489196777344, "global_step": 111064, "epoch": 2644} {"train_loss": -6.523709297180176, "global_step": 111065, "epoch": 2644} {"train_loss": -6.370934963226318, "global_step": 111066, "epoch": 2644} {"train_loss": -6.45566463470459, "global_step": 111067, "epoch": 2644} {"train_loss": -6.501936435699463, "global_step": 111068, "epoch": 2644} {"train_loss": -6.459024429321289, "global_step": 111069, "epoch": 2644} {"train_loss": -6.513491153717041, "global_step": 111070, "epoch": 2644} {"train_loss": -6.442168712615967, "global_step": 111071, "epoch": 2644} {"train_loss": -6.460962295532227, "global_step": 111072, "epoch": 2644} {"train_loss": -6.4751691818237305, "global_step": 111073, "epoch": 2644} {"train_loss": -6.388056755065918, "global_step": 111074, "epoch": 2644} {"train_loss": -6.489285945892334, "global_step": 111075, "epoch": 2644} {"train_loss": -6.4469475746154785, "global_step": 111076, "epoch": 2644} {"train_loss": -6.528079509735107, "global_step": 111077, "epoch": 2644} {"train_loss": -6.399619102478027, "global_step": 111078, "epoch": 2644} {"train_loss": -6.4239044189453125, "global_step": 111079, "epoch": 2644} {"train_loss": -6.549393653869629, "global_step": 111080, "epoch": 2644} {"train_loss": -6.433272361755371, "global_step": 111081, "epoch": 2644} {"train_loss": -6.515310287475586, "global_step": 111082, "epoch": 2644} {"train_loss": -6.455020427703857, "global_step": 111083, "epoch": 2644} {"train_loss": -6.515625476837158, "global_step": 111084, "epoch": 2644} {"train_loss": -6.46989631652832, "global_step": 111085, "epoch": 2644} {"train_loss": -6.539547920227051, "global_step": 111086, "epoch": 2644} {"train_loss": -6.447577476501465, "global_step": 111087, "epoch": 2644} {"train_loss": -6.398223876953125, "global_step": 111088, "epoch": 2644} {"train_loss": -6.477963878994896, "global_step": 111089, "epoch": 2644, "val_loss": 64704.046875} {"train_loss": -6.392613887786865, "global_step": 111090, "epoch": 2645} {"train_loss": -6.537154674530029, "global_step": 111091, "epoch": 2645} {"train_loss": -6.461086750030518, "global_step": 111092, "epoch": 2645} {"train_loss": -6.429156303405762, "global_step": 111093, "epoch": 2645} {"train_loss": -6.542865753173828, "global_step": 111094, "epoch": 2645} {"train_loss": -6.467151165008545, "global_step": 111095, "epoch": 2645} {"train_loss": -6.464591979980469, "global_step": 111096, "epoch": 2645} {"train_loss": -6.511658668518066, "global_step": 111097, "epoch": 2645} {"train_loss": -6.500668525695801, "global_step": 111098, "epoch": 2645} {"train_loss": -6.419387340545654, "global_step": 111099, "epoch": 2645} {"train_loss": -6.481128692626953, "global_step": 111100, "epoch": 2645} {"train_loss": -6.3602142333984375, "global_step": 111101, "epoch": 2645} {"train_loss": -6.462379455566406, "global_step": 111102, "epoch": 2645} {"train_loss": -6.440276145935059, "global_step": 111103, "epoch": 2645} {"train_loss": -6.434360980987549, "global_step": 111104, "epoch": 2645} {"train_loss": -6.488650798797607, "global_step": 111105, "epoch": 2645} {"train_loss": -6.454905033111572, "global_step": 111106, "epoch": 2645} {"train_loss": -6.450803756713867, "global_step": 111107, "epoch": 2645} {"train_loss": -6.418789386749268, "global_step": 111108, "epoch": 2645} {"train_loss": -6.453171253204346, "global_step": 111109, "epoch": 2645} {"train_loss": -6.423580646514893, "global_step": 111110, "epoch": 2645} {"train_loss": -6.603819370269775, "global_step": 111111, "epoch": 2645} {"train_loss": -6.493314743041992, "global_step": 111112, "epoch": 2645} {"train_loss": -6.4352874755859375, "global_step": 111113, "epoch": 2645} {"train_loss": -6.520369529724121, "global_step": 111114, "epoch": 2645} {"train_loss": -6.441580295562744, "global_step": 111115, "epoch": 2645} {"train_loss": -6.434289455413818, "global_step": 111116, "epoch": 2645} {"train_loss": -6.577071189880371, "global_step": 111117, "epoch": 2645} {"train_loss": -6.493728160858154, "global_step": 111118, "epoch": 2645} {"train_loss": -6.476046562194824, "global_step": 111119, "epoch": 2645} {"train_loss": -6.54127836227417, "global_step": 111120, "epoch": 2645} {"train_loss": -6.564546585083008, "global_step": 111121, "epoch": 2645} {"train_loss": -6.41457986831665, "global_step": 111122, "epoch": 2645} {"train_loss": -6.431918144226074, "global_step": 111123, "epoch": 2645} {"train_loss": -6.429525375366211, "global_step": 111124, "epoch": 2645} {"train_loss": -6.436145782470703, "global_step": 111125, "epoch": 2645} {"train_loss": -6.387693881988525, "global_step": 111126, "epoch": 2645} {"train_loss": -6.330621719360352, "global_step": 111127, "epoch": 2645} {"train_loss": -6.4372758865356445, "global_step": 111128, "epoch": 2645} {"train_loss": -6.503548622131348, "global_step": 111129, "epoch": 2645} {"train_loss": -6.568142890930176, "global_step": 111130, "epoch": 2645} {"train_loss": -6.468591849009196, "global_step": 111131, "epoch": 2645, "val_loss": 64895.140625} {"train_loss": -6.480558395385742, "global_step": 111132, "epoch": 2646} {"train_loss": -6.470176696777344, "global_step": 111133, "epoch": 2646} {"train_loss": -6.448210716247559, "global_step": 111134, "epoch": 2646} {"train_loss": -6.531740665435791, "global_step": 111135, "epoch": 2646} {"train_loss": -6.482466697692871, "global_step": 111136, "epoch": 2646} {"train_loss": -6.535645008087158, "global_step": 111137, "epoch": 2646} {"train_loss": -6.411577224731445, "global_step": 111138, "epoch": 2646} {"train_loss": -6.481867790222168, "global_step": 111139, "epoch": 2646} {"train_loss": -6.627374172210693, "global_step": 111140, "epoch": 2646} {"train_loss": -6.407393455505371, "global_step": 111141, "epoch": 2646} {"train_loss": -6.55808162689209, "global_step": 111142, "epoch": 2646} {"train_loss": -6.4406867027282715, "global_step": 111143, "epoch": 2646} {"train_loss": -6.43763542175293, "global_step": 111144, "epoch": 2646} {"train_loss": -6.428493499755859, "global_step": 111145, "epoch": 2646} {"train_loss": -6.485848426818848, "global_step": 111146, "epoch": 2646} {"train_loss": -6.471549987792969, "global_step": 111147, "epoch": 2646} {"train_loss": -6.4840407371521, "global_step": 111148, "epoch": 2646} {"train_loss": -6.51849365234375, "global_step": 111149, "epoch": 2646} {"train_loss": -6.422684669494629, "global_step": 111150, "epoch": 2646} {"train_loss": -6.460808753967285, "global_step": 111151, "epoch": 2646} {"train_loss": -6.4952239990234375, "global_step": 111152, "epoch": 2646} {"train_loss": -6.5571980476379395, "global_step": 111153, "epoch": 2646} {"train_loss": -6.411052703857422, "global_step": 111154, "epoch": 2646} {"train_loss": -6.592511177062988, "global_step": 111155, "epoch": 2646} {"train_loss": -6.575120449066162, "global_step": 111156, "epoch": 2646} {"train_loss": -6.53218412399292, "global_step": 111157, "epoch": 2646} {"train_loss": -6.481971740722656, "global_step": 111158, "epoch": 2646} {"train_loss": -6.4820661544799805, "global_step": 111159, "epoch": 2646} {"train_loss": -6.391213893890381, "global_step": 111160, "epoch": 2646} {"train_loss": -6.472644805908203, "global_step": 111161, "epoch": 2646} {"train_loss": -6.491955757141113, "global_step": 111162, "epoch": 2646} {"train_loss": -6.374839782714844, "global_step": 111163, "epoch": 2646} {"train_loss": -6.294416427612305, "global_step": 111164, "epoch": 2646} {"train_loss": -6.3583903312683105, "global_step": 111165, "epoch": 2646} {"train_loss": -6.618859767913818, "global_step": 111166, "epoch": 2646} {"train_loss": -6.378837585449219, "global_step": 111167, "epoch": 2646} {"train_loss": -6.537580490112305, "global_step": 111168, "epoch": 2646} {"train_loss": -6.497990608215332, "global_step": 111169, "epoch": 2646} {"train_loss": -6.414846420288086, "global_step": 111170, "epoch": 2646} {"train_loss": -6.610136985778809, "global_step": 111171, "epoch": 2646} {"train_loss": -6.538018703460693, "global_step": 111172, "epoch": 2646} {"train_loss": -6.479724747794015, "global_step": 111173, "epoch": 2646, "val_loss": 65025.25390625} {"train_loss": -6.431440830230713, "global_step": 111174, "epoch": 2647} {"train_loss": -6.516765594482422, "global_step": 111175, "epoch": 2647} {"train_loss": -6.603792667388916, "global_step": 111176, "epoch": 2647} {"train_loss": -6.490570068359375, "global_step": 111177, "epoch": 2647} {"train_loss": -6.4678239822387695, "global_step": 111178, "epoch": 2647} {"train_loss": -6.474703788757324, "global_step": 111179, "epoch": 2647} {"train_loss": -6.512199878692627, "global_step": 111180, "epoch": 2647} {"train_loss": -6.396352767944336, "global_step": 111181, "epoch": 2647} {"train_loss": -6.430490970611572, "global_step": 111182, "epoch": 2647} {"train_loss": -6.440614700317383, "global_step": 111183, "epoch": 2647} {"train_loss": -6.560280799865723, "global_step": 111184, "epoch": 2647} {"train_loss": -6.460789680480957, "global_step": 111185, "epoch": 2647} {"train_loss": -6.381208896636963, "global_step": 111186, "epoch": 2647} {"train_loss": -6.518136978149414, "global_step": 111187, "epoch": 2647} {"train_loss": -6.471867561340332, "global_step": 111188, "epoch": 2647} {"train_loss": -6.5331573486328125, "global_step": 111189, "epoch": 2647} {"train_loss": -6.4576263427734375, "global_step": 111190, "epoch": 2647} {"train_loss": -6.424045562744141, "global_step": 111191, "epoch": 2647} {"train_loss": -6.50724983215332, "global_step": 111192, "epoch": 2647} {"train_loss": -6.465996265411377, "global_step": 111193, "epoch": 2647} {"train_loss": -6.529029369354248, "global_step": 111194, "epoch": 2647} {"train_loss": -6.496214866638184, "global_step": 111195, "epoch": 2647} {"train_loss": -6.514026165008545, "global_step": 111196, "epoch": 2647} {"train_loss": -6.560372352600098, "global_step": 111197, "epoch": 2647} {"train_loss": -6.451877593994141, "global_step": 111198, "epoch": 2647} {"train_loss": -6.397197723388672, "global_step": 111199, "epoch": 2647} {"train_loss": -6.4964141845703125, "global_step": 111200, "epoch": 2647} {"train_loss": -6.575841903686523, "global_step": 111201, "epoch": 2647} {"train_loss": -6.298398494720459, "global_step": 111202, "epoch": 2647} {"train_loss": -6.504762649536133, "global_step": 111203, "epoch": 2647} {"train_loss": -6.3785176277160645, "global_step": 111204, "epoch": 2647} {"train_loss": -6.512414932250977, "global_step": 111205, "epoch": 2647} {"train_loss": -6.298059463500977, "global_step": 111206, "epoch": 2647} {"train_loss": -6.361946105957031, "global_step": 111207, "epoch": 2647} {"train_loss": -6.504319667816162, "global_step": 111208, "epoch": 2647} {"train_loss": -6.406526565551758, "global_step": 111209, "epoch": 2647} {"train_loss": -6.423321723937988, "global_step": 111210, "epoch": 2647} {"train_loss": -6.368074417114258, "global_step": 111211, "epoch": 2647} {"train_loss": -6.379258155822754, "global_step": 111212, "epoch": 2647} {"train_loss": -6.485662460327148, "global_step": 111213, "epoch": 2647} {"train_loss": -6.470909118652344, "global_step": 111214, "epoch": 2647} {"train_loss": -6.463023878279186, "global_step": 111215, "epoch": 2647, "val_loss": 64980.87890625} {"train_loss": -6.4925689697265625, "global_step": 111216, "epoch": 2648} {"train_loss": -6.487651824951172, "global_step": 111217, "epoch": 2648} {"train_loss": -6.461540222167969, "global_step": 111218, "epoch": 2648} {"train_loss": -6.339717864990234, "global_step": 111219, "epoch": 2648} {"train_loss": -6.446523666381836, "global_step": 111220, "epoch": 2648} {"train_loss": -6.588171482086182, "global_step": 111221, "epoch": 2648} {"train_loss": -6.313126564025879, "global_step": 111222, "epoch": 2648} {"train_loss": -6.457897186279297, "global_step": 111223, "epoch": 2648} {"train_loss": -6.4820051193237305, "global_step": 111224, "epoch": 2648} {"train_loss": -6.337435245513916, "global_step": 111225, "epoch": 2648} {"train_loss": -6.414011001586914, "global_step": 111226, "epoch": 2648} {"train_loss": -6.507513046264648, "global_step": 111227, "epoch": 2648} {"train_loss": -6.469564437866211, "global_step": 111228, "epoch": 2648} {"train_loss": -6.406390190124512, "global_step": 111229, "epoch": 2648} {"train_loss": -6.476713180541992, "global_step": 111230, "epoch": 2648} {"train_loss": -6.329566478729248, "global_step": 111231, "epoch": 2648} {"train_loss": -6.427565574645996, "global_step": 111232, "epoch": 2648} {"train_loss": -6.383768081665039, "global_step": 111233, "epoch": 2648} {"train_loss": -6.423901557922363, "global_step": 111234, "epoch": 2648} {"train_loss": -6.3798418045043945, "global_step": 111235, "epoch": 2648} {"train_loss": -6.460308074951172, "global_step": 111236, "epoch": 2648} {"train_loss": -6.387679100036621, "global_step": 111237, "epoch": 2648} {"train_loss": -6.485791206359863, "global_step": 111238, "epoch": 2648} {"train_loss": -6.443044662475586, "global_step": 111239, "epoch": 2648} {"train_loss": -6.626263618469238, "global_step": 111240, "epoch": 2648} {"train_loss": -6.414978981018066, "global_step": 111241, "epoch": 2648} {"train_loss": -6.42203426361084, "global_step": 111242, "epoch": 2648} {"train_loss": -6.333676338195801, "global_step": 111243, "epoch": 2648} {"train_loss": -6.437291145324707, "global_step": 111244, "epoch": 2648} {"train_loss": -6.3676557540893555, "global_step": 111245, "epoch": 2648} {"train_loss": -6.37739372253418, "global_step": 111246, "epoch": 2648} {"train_loss": -6.37436056137085, "global_step": 111247, "epoch": 2648} {"train_loss": -6.496909141540527, "global_step": 111248, "epoch": 2648} {"train_loss": -6.439334869384766, "global_step": 111249, "epoch": 2648} {"train_loss": -6.431282997131348, "global_step": 111250, "epoch": 2648} {"train_loss": -6.409915924072266, "global_step": 111251, "epoch": 2648} {"train_loss": -6.359308242797852, "global_step": 111252, "epoch": 2648} {"train_loss": -6.379635810852051, "global_step": 111253, "epoch": 2648} {"train_loss": -6.445014953613281, "global_step": 111254, "epoch": 2648} {"train_loss": -6.474085330963135, "global_step": 111255, "epoch": 2648} {"train_loss": -6.513110637664795, "global_step": 111256, "epoch": 2648} {"train_loss": -6.431375003996349, "global_step": 111257, "epoch": 2648, "val_loss": 64899.890625} {"train_loss": -6.580397605895996, "global_step": 111258, "epoch": 2649} {"train_loss": -6.475641250610352, "global_step": 111259, "epoch": 2649} {"train_loss": -6.496652126312256, "global_step": 111260, "epoch": 2649} {"train_loss": -6.529952049255371, "global_step": 111261, "epoch": 2649} {"train_loss": -6.542878150939941, "global_step": 111262, "epoch": 2649} {"train_loss": -6.426074028015137, "global_step": 111263, "epoch": 2649} {"train_loss": -6.625821113586426, "global_step": 111264, "epoch": 2649} {"train_loss": -6.516887187957764, "global_step": 111265, "epoch": 2649} {"train_loss": -6.557778358459473, "global_step": 111266, "epoch": 2649} {"train_loss": -6.484223365783691, "global_step": 111267, "epoch": 2649} {"train_loss": -6.563595771789551, "global_step": 111268, "epoch": 2649} {"train_loss": -6.493673801422119, "global_step": 111269, "epoch": 2649} {"train_loss": -6.571800231933594, "global_step": 111270, "epoch": 2649} {"train_loss": -6.3184099197387695, "global_step": 111271, "epoch": 2649} {"train_loss": -6.48073673248291, "global_step": 111272, "epoch": 2649} {"train_loss": -6.627965927124023, "global_step": 111273, "epoch": 2649} {"train_loss": -6.46273136138916, "global_step": 111274, "epoch": 2649} {"train_loss": -6.463088035583496, "global_step": 111275, "epoch": 2649} {"train_loss": -6.431811332702637, "global_step": 111276, "epoch": 2649} {"train_loss": -6.519251823425293, "global_step": 111277, "epoch": 2649} {"train_loss": -6.548465728759766, "global_step": 111278, "epoch": 2649} {"train_loss": -6.384518623352051, "global_step": 111279, "epoch": 2649} {"train_loss": -6.223507404327393, "global_step": 111280, "epoch": 2649} {"train_loss": -6.445425510406494, "global_step": 111281, "epoch": 2649} {"train_loss": -6.4431304931640625, "global_step": 111282, "epoch": 2649} {"train_loss": -6.510655403137207, "global_step": 111283, "epoch": 2649} {"train_loss": -6.434671878814697, "global_step": 111284, "epoch": 2649} {"train_loss": -6.478878974914551, "global_step": 111285, "epoch": 2649} {"train_loss": -6.3852996826171875, "global_step": 111286, "epoch": 2649} {"train_loss": -6.422989845275879, "global_step": 111287, "epoch": 2649} {"train_loss": -6.430990695953369, "global_step": 111288, "epoch": 2649} {"train_loss": -6.496603012084961, "global_step": 111289, "epoch": 2649} {"train_loss": -6.562745094299316, "global_step": 111290, "epoch": 2649} {"train_loss": -6.455859184265137, "global_step": 111291, "epoch": 2649} {"train_loss": -6.468698501586914, "global_step": 111292, "epoch": 2649} {"train_loss": -6.603594779968262, "global_step": 111293, "epoch": 2649} {"train_loss": -6.520665168762207, "global_step": 111294, "epoch": 2649} {"train_loss": -6.519759178161621, "global_step": 111295, "epoch": 2649} {"train_loss": -6.459393501281738, "global_step": 111296, "epoch": 2649} {"train_loss": -6.436286926269531, "global_step": 111297, "epoch": 2649} {"train_loss": -6.456414699554443, "global_step": 111298, "epoch": 2649} {"train_loss": -6.48353860491798, "global_step": 111299, "epoch": 2649, "val_loss": 65028.16796875} {"train_loss": -6.458097457885742, "global_step": 111300, "epoch": 2650} {"train_loss": -6.504491806030273, "global_step": 111301, "epoch": 2650} {"train_loss": -6.355437278747559, "global_step": 111302, "epoch": 2650} {"train_loss": -6.5236968994140625, "global_step": 111303, "epoch": 2650} {"train_loss": -6.4573211669921875, "global_step": 111304, "epoch": 2650} {"train_loss": -6.446833610534668, "global_step": 111305, "epoch": 2650} {"train_loss": -6.435365200042725, "global_step": 111306, "epoch": 2650} {"train_loss": -6.417060852050781, "global_step": 111307, "epoch": 2650} {"train_loss": -6.341207027435303, "global_step": 111308, "epoch": 2650} {"train_loss": -6.527501106262207, "global_step": 111309, "epoch": 2650} {"train_loss": -6.436811923980713, "global_step": 111310, "epoch": 2650} {"train_loss": -6.532212734222412, "global_step": 111311, "epoch": 2650} {"train_loss": -6.419768333435059, "global_step": 111312, "epoch": 2650} {"train_loss": -6.404299736022949, "global_step": 111313, "epoch": 2650} {"train_loss": -6.312481880187988, "global_step": 111314, "epoch": 2650} {"train_loss": -6.447880744934082, "global_step": 111315, "epoch": 2650} {"train_loss": -6.389262676239014, "global_step": 111316, "epoch": 2650} {"train_loss": -6.445905685424805, "global_step": 111317, "epoch": 2650} {"train_loss": -6.4737629890441895, "global_step": 111318, "epoch": 2650} {"train_loss": -6.405597686767578, "global_step": 111319, "epoch": 2650} {"train_loss": -6.490335464477539, "global_step": 111320, "epoch": 2650} {"train_loss": -6.605803489685059, "global_step": 111321, "epoch": 2650} {"train_loss": -6.427961349487305, "global_step": 111322, "epoch": 2650} {"train_loss": -6.447987079620361, "global_step": 111323, "epoch": 2650} {"train_loss": -6.510312080383301, "global_step": 111324, "epoch": 2650} {"train_loss": -6.390223026275635, "global_step": 111325, "epoch": 2650} {"train_loss": -6.547773838043213, "global_step": 111326, "epoch": 2650} {"train_loss": -6.290016174316406, "global_step": 111327, "epoch": 2650} {"train_loss": -6.37058162689209, "global_step": 111328, "epoch": 2650} {"train_loss": -6.522336006164551, "global_step": 111329, "epoch": 2650} {"train_loss": -6.459586143493652, "global_step": 111330, "epoch": 2650} {"train_loss": -6.473684310913086, "global_step": 111331, "epoch": 2650} {"train_loss": -6.374264717102051, "global_step": 111332, "epoch": 2650} {"train_loss": -6.391142845153809, "global_step": 111333, "epoch": 2650} {"train_loss": -6.345619201660156, "global_step": 111334, "epoch": 2650} {"train_loss": -6.341784954071045, "global_step": 111335, "epoch": 2650} {"train_loss": -6.508305549621582, "global_step": 111336, "epoch": 2650} {"train_loss": -6.45210075378418, "global_step": 111337, "epoch": 2650} {"train_loss": -6.477514266967773, "global_step": 111338, "epoch": 2650} {"train_loss": -6.51975154876709, "global_step": 111339, "epoch": 2650} {"train_loss": -6.419304847717285, "global_step": 111340, "epoch": 2650} {"train_loss": -6.439459789366949, "global_step": 111341, "epoch": 2650, "train/sim_max_reward_0": 0.19225697441426964, "train/sim_max_reward_1": 0.9674657580572893, "train/sim_max_reward_2": 0.8039084673124899, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.9086933175352289, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5446122240480569, "test/sim_max_reward_4300002": 0.8316465773563197, "test/sim_max_reward_4300003": 0.9842288005464023, "test/sim_max_reward_4300004": 0.3347853046752913, "test/sim_max_reward_4300005": 0.9741658818744562, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3211785082082945, "test/sim_max_reward_4300008": 0.9294085406970638, "test/sim_max_reward_4300009": 0.9417173579301916, "test/sim_max_reward_4300010": 0.7720533248723136, "test/sim_max_reward_4300011": 0.8758345910924156, "test/sim_max_reward_4300012": 0.16123959756641615, "test/sim_max_reward_4300013": 0.9976895169981123, "test/sim_max_reward_4300014": 0.9037102318881184, "test/sim_max_reward_4300015": 0.9883638314419511, "test/sim_max_reward_4300016": 0.9773562576949275, "test/sim_max_reward_4300017": 0.43592342385634014, "test/sim_max_reward_4300018": 0.4181668574384324, "test/sim_max_reward_4300019": 0.18621035510814127, "test/sim_max_reward_4300020": 0.8637039287767274, "test/sim_max_reward_4300021": 0.9629669737685628, "test/sim_max_reward_4300022": 0.8949357753728127, "test/sim_max_reward_4300023": 0.9683248547766106, "test/sim_max_reward_4300024": 0.8666510102624152, "test/sim_max_reward_4300025": 0.8677878468163632, "test/sim_max_reward_4300026": 0.1652572872195134, "test/sim_max_reward_4300027": 0.8776985520088499, "test/sim_max_reward_4300028": 0.972889113088392, "test/sim_max_reward_4300029": 0.9043587353352297, "test/sim_max_reward_4300030": 0.005935462985564976, "test/sim_max_reward_4300031": 0.22307625287047061, "test/sim_max_reward_4300032": 0.9325471720122859, "test/sim_max_reward_4300033": 0.9888048626971372, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.6778154813971248, "test/sim_max_reward_4300036": 0.24807957898739671, "test/sim_max_reward_4300037": 0.9921914188813861, "test/sim_max_reward_4300038": 0.7839402375675111, "test/sim_max_reward_4300039": 0.5754129864473434, "test/sim_max_reward_4300040": 0.831622990195404, "test/sim_max_reward_4300041": 1.0, "test/sim_max_reward_4300042": 0.7077542559997554, "test/sim_max_reward_4300043": 0.8138862129295292, "test/sim_max_reward_4300044": 0.9451428529338158, "test/sim_max_reward_4300045": 0.18556059355113658, "test/sim_max_reward_4300046": 0.9249928650931643, "test/sim_max_reward_4300047": 0.14814976719922152, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.015521381329440871, "train/mean_score": 0.6775515461135776, "test/mean_score": 0.6384659926759282, "val_loss": 65355.203125} {"train_loss": -6.377436637878418, "global_step": 111342, "epoch": 2651} {"train_loss": -6.467862606048584, "global_step": 111343, "epoch": 2651} {"train_loss": -6.532455921173096, "global_step": 111344, "epoch": 2651} {"train_loss": -6.523401260375977, "global_step": 111345, "epoch": 2651} {"train_loss": -6.494592666625977, "global_step": 111346, "epoch": 2651} {"train_loss": -6.412440299987793, "global_step": 111347, "epoch": 2651} {"train_loss": -6.436155796051025, "global_step": 111348, "epoch": 2651} {"train_loss": -6.50446891784668, "global_step": 111349, "epoch": 2651} {"train_loss": -6.529118537902832, "global_step": 111350, "epoch": 2651} {"train_loss": -6.443560600280762, "global_step": 111351, "epoch": 2651} {"train_loss": -6.492232322692871, "global_step": 111352, "epoch": 2651} {"train_loss": -6.432077407836914, "global_step": 111353, "epoch": 2651} {"train_loss": -6.605642318725586, "global_step": 111354, "epoch": 2651} {"train_loss": -6.447168350219727, "global_step": 111355, "epoch": 2651} {"train_loss": -6.505664825439453, "global_step": 111356, "epoch": 2651} {"train_loss": -6.504055976867676, "global_step": 111357, "epoch": 2651} {"train_loss": -6.492565155029297, "global_step": 111358, "epoch": 2651} {"train_loss": -6.464594841003418, "global_step": 111359, "epoch": 2651} {"train_loss": -6.4876708984375, "global_step": 111360, "epoch": 2651} {"train_loss": -6.596846580505371, "global_step": 111361, "epoch": 2651} {"train_loss": -6.572977066040039, "global_step": 111362, "epoch": 2651} {"train_loss": -6.462672233581543, "global_step": 111363, "epoch": 2651} {"train_loss": -6.576026916503906, "global_step": 111364, "epoch": 2651} {"train_loss": -6.493569374084473, "global_step": 111365, "epoch": 2651} {"train_loss": -6.465939521789551, "global_step": 111366, "epoch": 2651} {"train_loss": -6.469193935394287, "global_step": 111367, "epoch": 2651} {"train_loss": -6.400967121124268, "global_step": 111368, "epoch": 2651} {"train_loss": -6.569032192230225, "global_step": 111369, "epoch": 2651} {"train_loss": -6.537226676940918, "global_step": 111370, "epoch": 2651} {"train_loss": -6.463022232055664, "global_step": 111371, "epoch": 2651} {"train_loss": -6.565738677978516, "global_step": 111372, "epoch": 2651} {"train_loss": -6.513558387756348, "global_step": 111373, "epoch": 2651} {"train_loss": -6.51332426071167, "global_step": 111374, "epoch": 2651} {"train_loss": -6.543923377990723, "global_step": 111375, "epoch": 2651} {"train_loss": -6.508038520812988, "global_step": 111376, "epoch": 2651} {"train_loss": -6.450806617736816, "global_step": 111377, "epoch": 2651} {"train_loss": -6.5106282234191895, "global_step": 111378, "epoch": 2651} {"train_loss": -6.518402099609375, "global_step": 111379, "epoch": 2651} {"train_loss": -6.516911506652832, "global_step": 111380, "epoch": 2651} {"train_loss": -6.4172682762146, "global_step": 111381, "epoch": 2651} {"train_loss": -6.433856964111328, "global_step": 111382, "epoch": 2651} {"train_loss": -6.494199764160883, "global_step": 111383, "epoch": 2651, "val_loss": 65355.6953125} {"train_loss": -6.370676517486572, "global_step": 111384, "epoch": 2652} {"train_loss": -6.490224838256836, "global_step": 111385, "epoch": 2652} {"train_loss": -6.5485076904296875, "global_step": 111386, "epoch": 2652} {"train_loss": -6.390846252441406, "global_step": 111387, "epoch": 2652} {"train_loss": -6.395281791687012, "global_step": 111388, "epoch": 2652} {"train_loss": -6.443911075592041, "global_step": 111389, "epoch": 2652} {"train_loss": -6.425537586212158, "global_step": 111390, "epoch": 2652} {"train_loss": -6.561444282531738, "global_step": 111391, "epoch": 2652} {"train_loss": -6.404582977294922, "global_step": 111392, "epoch": 2652} {"train_loss": -6.529677391052246, "global_step": 111393, "epoch": 2652} {"train_loss": -6.505235195159912, "global_step": 111394, "epoch": 2652} {"train_loss": -6.453563690185547, "global_step": 111395, "epoch": 2652} {"train_loss": -6.41865348815918, "global_step": 111396, "epoch": 2652} {"train_loss": -6.454765319824219, "global_step": 111397, "epoch": 2652} {"train_loss": -6.4318013191223145, "global_step": 111398, "epoch": 2652} {"train_loss": -6.520753383636475, "global_step": 111399, "epoch": 2652} {"train_loss": -6.41031551361084, "global_step": 111400, "epoch": 2652} {"train_loss": -6.516837120056152, "global_step": 111401, "epoch": 2652} {"train_loss": -6.459578990936279, "global_step": 111402, "epoch": 2652} {"train_loss": -6.524080276489258, "global_step": 111403, "epoch": 2652} {"train_loss": -6.498100280761719, "global_step": 111404, "epoch": 2652} {"train_loss": -6.493456840515137, "global_step": 111405, "epoch": 2652} {"train_loss": -6.637286186218262, "global_step": 111406, "epoch": 2652} {"train_loss": -6.5634260177612305, "global_step": 111407, "epoch": 2652} {"train_loss": -6.481829643249512, "global_step": 111408, "epoch": 2652} {"train_loss": -6.545154571533203, "global_step": 111409, "epoch": 2652} {"train_loss": -6.519299507141113, "global_step": 111410, "epoch": 2652} {"train_loss": -6.43949031829834, "global_step": 111411, "epoch": 2652} {"train_loss": -6.499612808227539, "global_step": 111412, "epoch": 2652} {"train_loss": -6.414187431335449, "global_step": 111413, "epoch": 2652} {"train_loss": -6.535428047180176, "global_step": 111414, "epoch": 2652} {"train_loss": -6.546316623687744, "global_step": 111415, "epoch": 2652} {"train_loss": -6.403038501739502, "global_step": 111416, "epoch": 2652} {"train_loss": -6.5724663734436035, "global_step": 111417, "epoch": 2652} {"train_loss": -6.476052284240723, "global_step": 111418, "epoch": 2652} {"train_loss": -6.542901992797852, "global_step": 111419, "epoch": 2652} {"train_loss": -6.501553535461426, "global_step": 111420, "epoch": 2652} {"train_loss": -6.44914436340332, "global_step": 111421, "epoch": 2652} {"train_loss": -6.508999347686768, "global_step": 111422, "epoch": 2652} {"train_loss": -6.463206768035889, "global_step": 111423, "epoch": 2652} {"train_loss": -6.5449981689453125, "global_step": 111424, "epoch": 2652} {"train_loss": -6.4851719084240145, "global_step": 111425, "epoch": 2652, "val_loss": 64887.546875} {"train_loss": -6.5684380531311035, "global_step": 111426, "epoch": 2653} {"train_loss": -6.44047737121582, "global_step": 111427, "epoch": 2653} {"train_loss": -6.55715799331665, "global_step": 111428, "epoch": 2653} {"train_loss": -6.479343891143799, "global_step": 111429, "epoch": 2653} {"train_loss": -6.417997360229492, "global_step": 111430, "epoch": 2653} {"train_loss": -6.41963005065918, "global_step": 111431, "epoch": 2653} {"train_loss": -6.459197521209717, "global_step": 111432, "epoch": 2653} {"train_loss": -6.545655250549316, "global_step": 111433, "epoch": 2653} {"train_loss": -6.550750732421875, "global_step": 111434, "epoch": 2653} {"train_loss": -6.406103134155273, "global_step": 111435, "epoch": 2653} {"train_loss": -6.501694679260254, "global_step": 111436, "epoch": 2653} {"train_loss": -6.587285041809082, "global_step": 111437, "epoch": 2653} {"train_loss": -6.476883888244629, "global_step": 111438, "epoch": 2653} {"train_loss": -6.498309135437012, "global_step": 111439, "epoch": 2653} {"train_loss": -6.502427577972412, "global_step": 111440, "epoch": 2653} {"train_loss": -6.509266376495361, "global_step": 111441, "epoch": 2653} {"train_loss": -6.4675374031066895, "global_step": 111442, "epoch": 2653} {"train_loss": -6.528120994567871, "global_step": 111443, "epoch": 2653} {"train_loss": -6.54710578918457, "global_step": 111444, "epoch": 2653} {"train_loss": -6.507846355438232, "global_step": 111445, "epoch": 2653} {"train_loss": -6.46616268157959, "global_step": 111446, "epoch": 2653} {"train_loss": -6.352377891540527, "global_step": 111447, "epoch": 2653} {"train_loss": -6.567173957824707, "global_step": 111448, "epoch": 2653} {"train_loss": -6.392189979553223, "global_step": 111449, "epoch": 2653} {"train_loss": -6.41154670715332, "global_step": 111450, "epoch": 2653} {"train_loss": -6.453460693359375, "global_step": 111451, "epoch": 2653} {"train_loss": -6.3282976150512695, "global_step": 111452, "epoch": 2653} {"train_loss": -6.349994659423828, "global_step": 111453, "epoch": 2653} {"train_loss": -6.430262565612793, "global_step": 111454, "epoch": 2653} {"train_loss": -6.398577690124512, "global_step": 111455, "epoch": 2653} {"train_loss": -6.361650466918945, "global_step": 111456, "epoch": 2653} {"train_loss": -6.376420974731445, "global_step": 111457, "epoch": 2653} {"train_loss": -6.464373588562012, "global_step": 111458, "epoch": 2653} {"train_loss": -6.433656692504883, "global_step": 111459, "epoch": 2653} {"train_loss": -6.353573799133301, "global_step": 111460, "epoch": 2653} {"train_loss": -6.4662675857543945, "global_step": 111461, "epoch": 2653} {"train_loss": -6.351814270019531, "global_step": 111462, "epoch": 2653} {"train_loss": -6.483855247497559, "global_step": 111463, "epoch": 2653} {"train_loss": -6.426236152648926, "global_step": 111464, "epoch": 2653} {"train_loss": -6.384064674377441, "global_step": 111465, "epoch": 2653} {"train_loss": -6.464031219482422, "global_step": 111466, "epoch": 2653} {"train_loss": -6.455895333063035, "global_step": 111467, "epoch": 2653, "val_loss": 65069.56640625} {"train_loss": -6.488221645355225, "global_step": 111468, "epoch": 2654} {"train_loss": -6.34641695022583, "global_step": 111469, "epoch": 2654} {"train_loss": -6.437560558319092, "global_step": 111470, "epoch": 2654} {"train_loss": -6.505417346954346, "global_step": 111471, "epoch": 2654} {"train_loss": -6.376883506774902, "global_step": 111472, "epoch": 2654} {"train_loss": -6.535386085510254, "global_step": 111473, "epoch": 2654} {"train_loss": -6.559491157531738, "global_step": 111474, "epoch": 2654} {"train_loss": -6.380806922912598, "global_step": 111475, "epoch": 2654} {"train_loss": -6.505434513092041, "global_step": 111476, "epoch": 2654} {"train_loss": -6.597656726837158, "global_step": 111477, "epoch": 2654} {"train_loss": -6.438417434692383, "global_step": 111478, "epoch": 2654} {"train_loss": -6.6347784996032715, "global_step": 111479, "epoch": 2654} {"train_loss": -6.365744113922119, "global_step": 111480, "epoch": 2654} {"train_loss": -6.399619102478027, "global_step": 111481, "epoch": 2654} {"train_loss": -6.509216785430908, "global_step": 111482, "epoch": 2654} {"train_loss": -6.497166633605957, "global_step": 111483, "epoch": 2654} {"train_loss": -6.5636186599731445, "global_step": 111484, "epoch": 2654} {"train_loss": -6.436333656311035, "global_step": 111485, "epoch": 2654} {"train_loss": -6.51169490814209, "global_step": 111486, "epoch": 2654} {"train_loss": -6.481132507324219, "global_step": 111487, "epoch": 2654} {"train_loss": -6.507330417633057, "global_step": 111488, "epoch": 2654} {"train_loss": -6.510125160217285, "global_step": 111489, "epoch": 2654} {"train_loss": -6.50039529800415, "global_step": 111490, "epoch": 2654} {"train_loss": -6.47661018371582, "global_step": 111491, "epoch": 2654} {"train_loss": -6.496481418609619, "global_step": 111492, "epoch": 2654} {"train_loss": -6.515104293823242, "global_step": 111493, "epoch": 2654} {"train_loss": -6.50309944152832, "global_step": 111494, "epoch": 2654} {"train_loss": -6.452224254608154, "global_step": 111495, "epoch": 2654} {"train_loss": -6.455982208251953, "global_step": 111496, "epoch": 2654} {"train_loss": -6.429660797119141, "global_step": 111497, "epoch": 2654} {"train_loss": -6.459012031555176, "global_step": 111498, "epoch": 2654} {"train_loss": -6.52030086517334, "global_step": 111499, "epoch": 2654} {"train_loss": -6.463811874389648, "global_step": 111500, "epoch": 2654} {"train_loss": -6.353669166564941, "global_step": 111501, "epoch": 2654} {"train_loss": -6.565331935882568, "global_step": 111502, "epoch": 2654} {"train_loss": -6.455733776092529, "global_step": 111503, "epoch": 2654} {"train_loss": -6.40458869934082, "global_step": 111504, "epoch": 2654} {"train_loss": -6.541745185852051, "global_step": 111505, "epoch": 2654} {"train_loss": -6.4908952713012695, "global_step": 111506, "epoch": 2654} {"train_loss": -6.405360221862793, "global_step": 111507, "epoch": 2654} {"train_loss": -6.528104305267334, "global_step": 111508, "epoch": 2654} {"train_loss": -6.476910738717942, "global_step": 111509, "epoch": 2654, "val_loss": 64989.5390625} {"train_loss": -6.552544593811035, "global_step": 111510, "epoch": 2655} {"train_loss": -6.511016368865967, "global_step": 111511, "epoch": 2655} {"train_loss": -6.490706920623779, "global_step": 111512, "epoch": 2655} {"train_loss": -6.562077522277832, "global_step": 111513, "epoch": 2655} {"train_loss": -6.546894550323486, "global_step": 111514, "epoch": 2655} {"train_loss": -6.612584114074707, "global_step": 111515, "epoch": 2655} {"train_loss": -6.448537826538086, "global_step": 111516, "epoch": 2655} {"train_loss": -6.558238983154297, "global_step": 111517, "epoch": 2655} {"train_loss": -6.5324931144714355, "global_step": 111518, "epoch": 2655} {"train_loss": -6.414450645446777, "global_step": 111519, "epoch": 2655} {"train_loss": -6.394824981689453, "global_step": 111520, "epoch": 2655} {"train_loss": -6.619932174682617, "global_step": 111521, "epoch": 2655} {"train_loss": -6.459621429443359, "global_step": 111522, "epoch": 2655} {"train_loss": -6.627753257751465, "global_step": 111523, "epoch": 2655} {"train_loss": -6.408059120178223, "global_step": 111524, "epoch": 2655} {"train_loss": -6.5346293449401855, "global_step": 111525, "epoch": 2655} {"train_loss": -6.5440216064453125, "global_step": 111526, "epoch": 2655} {"train_loss": -6.452035903930664, "global_step": 111527, "epoch": 2655} {"train_loss": -6.525733947753906, "global_step": 111528, "epoch": 2655} {"train_loss": -6.501871585845947, "global_step": 111529, "epoch": 2655} {"train_loss": -6.510721206665039, "global_step": 111530, "epoch": 2655} {"train_loss": -6.484346389770508, "global_step": 111531, "epoch": 2655} {"train_loss": -6.505335330963135, "global_step": 111532, "epoch": 2655} {"train_loss": -6.5321245193481445, "global_step": 111533, "epoch": 2655} {"train_loss": -6.463837623596191, "global_step": 111534, "epoch": 2655} {"train_loss": -6.514995574951172, "global_step": 111535, "epoch": 2655} {"train_loss": -6.564885139465332, "global_step": 111536, "epoch": 2655} {"train_loss": -6.505882263183594, "global_step": 111537, "epoch": 2655} {"train_loss": -6.499713897705078, "global_step": 111538, "epoch": 2655} {"train_loss": -6.425575256347656, "global_step": 111539, "epoch": 2655} {"train_loss": -6.448033332824707, "global_step": 111540, "epoch": 2655} {"train_loss": -6.488858699798584, "global_step": 111541, "epoch": 2655} {"train_loss": -6.580694675445557, "global_step": 111542, "epoch": 2655} {"train_loss": -6.48985481262207, "global_step": 111543, "epoch": 2655} {"train_loss": -6.51409912109375, "global_step": 111544, "epoch": 2655} {"train_loss": -6.446076393127441, "global_step": 111545, "epoch": 2655} {"train_loss": -6.564098358154297, "global_step": 111546, "epoch": 2655} {"train_loss": -6.461259365081787, "global_step": 111547, "epoch": 2655} {"train_loss": -6.548712730407715, "global_step": 111548, "epoch": 2655} {"train_loss": -6.5979719161987305, "global_step": 111549, "epoch": 2655} {"train_loss": -6.574974060058594, "global_step": 111550, "epoch": 2655} {"train_loss": -6.5127762499309725, "global_step": 111551, "epoch": 2655, "val_loss": 65132.77734375} {"train_loss": -6.531477451324463, "global_step": 111552, "epoch": 2656} {"train_loss": -6.5328474044799805, "global_step": 111553, "epoch": 2656} {"train_loss": -6.338588714599609, "global_step": 111554, "epoch": 2656} {"train_loss": -6.564489364624023, "global_step": 111555, "epoch": 2656} {"train_loss": -6.287444114685059, "global_step": 111556, "epoch": 2656} {"train_loss": -6.448673248291016, "global_step": 111557, "epoch": 2656} {"train_loss": -6.5410990715026855, "global_step": 111558, "epoch": 2656} {"train_loss": -6.316534042358398, "global_step": 111559, "epoch": 2656} {"train_loss": -6.502615928649902, "global_step": 111560, "epoch": 2656} {"train_loss": -6.4720001220703125, "global_step": 111561, "epoch": 2656} {"train_loss": -6.445842266082764, "global_step": 111562, "epoch": 2656} {"train_loss": -6.524292469024658, "global_step": 111563, "epoch": 2656} {"train_loss": -6.428767204284668, "global_step": 111564, "epoch": 2656} {"train_loss": -6.402274131774902, "global_step": 111565, "epoch": 2656} {"train_loss": -6.4686970710754395, "global_step": 111566, "epoch": 2656} {"train_loss": -6.325715065002441, "global_step": 111567, "epoch": 2656} {"train_loss": -6.444982528686523, "global_step": 111568, "epoch": 2656} {"train_loss": -6.434277057647705, "global_step": 111569, "epoch": 2656} {"train_loss": -6.304913520812988, "global_step": 111570, "epoch": 2656} {"train_loss": -6.521584987640381, "global_step": 111571, "epoch": 2656} {"train_loss": -6.485177040100098, "global_step": 111572, "epoch": 2656} {"train_loss": -6.443512916564941, "global_step": 111573, "epoch": 2656} {"train_loss": -6.333643913269043, "global_step": 111574, "epoch": 2656} {"train_loss": -6.44886589050293, "global_step": 111575, "epoch": 2656} {"train_loss": -6.567214012145996, "global_step": 111576, "epoch": 2656} {"train_loss": -6.442587852478027, "global_step": 111577, "epoch": 2656} {"train_loss": -6.4203081130981445, "global_step": 111578, "epoch": 2656} {"train_loss": -6.4931640625, "global_step": 111579, "epoch": 2656} {"train_loss": -6.482842445373535, "global_step": 111580, "epoch": 2656} {"train_loss": -6.523530960083008, "global_step": 111581, "epoch": 2656} {"train_loss": -6.520530700683594, "global_step": 111582, "epoch": 2656} {"train_loss": -6.494104385375977, "global_step": 111583, "epoch": 2656} {"train_loss": -6.3875412940979, "global_step": 111584, "epoch": 2656} {"train_loss": -6.6142897605896, "global_step": 111585, "epoch": 2656} {"train_loss": -6.399771690368652, "global_step": 111586, "epoch": 2656} {"train_loss": -6.5727691650390625, "global_step": 111587, "epoch": 2656} {"train_loss": -6.4629106521606445, "global_step": 111588, "epoch": 2656} {"train_loss": -6.48539400100708, "global_step": 111589, "epoch": 2656} {"train_loss": -6.416131973266602, "global_step": 111590, "epoch": 2656} {"train_loss": -6.5085906982421875, "global_step": 111591, "epoch": 2656} {"train_loss": -6.592766284942627, "global_step": 111592, "epoch": 2656} {"train_loss": -6.461054427283151, "global_step": 111593, "epoch": 2656, "val_loss": 64993.03125} {"train_loss": -6.544750213623047, "global_step": 111594, "epoch": 2657} {"train_loss": -6.484926700592041, "global_step": 111595, "epoch": 2657} {"train_loss": -6.573847770690918, "global_step": 111596, "epoch": 2657} {"train_loss": -6.532956600189209, "global_step": 111597, "epoch": 2657} {"train_loss": -6.432165145874023, "global_step": 111598, "epoch": 2657} {"train_loss": -6.386011600494385, "global_step": 111599, "epoch": 2657} {"train_loss": -6.510285377502441, "global_step": 111600, "epoch": 2657} {"train_loss": -6.491870880126953, "global_step": 111601, "epoch": 2657} {"train_loss": -6.607584476470947, "global_step": 111602, "epoch": 2657} {"train_loss": -6.552888870239258, "global_step": 111603, "epoch": 2657} {"train_loss": -6.555752754211426, "global_step": 111604, "epoch": 2657} {"train_loss": -6.503692150115967, "global_step": 111605, "epoch": 2657} {"train_loss": -6.5023369789123535, "global_step": 111606, "epoch": 2657} {"train_loss": -6.537125110626221, "global_step": 111607, "epoch": 2657} {"train_loss": -6.443314552307129, "global_step": 111608, "epoch": 2657} {"train_loss": -6.494812965393066, "global_step": 111609, "epoch": 2657} {"train_loss": -6.549233913421631, "global_step": 111610, "epoch": 2657} {"train_loss": -6.535963535308838, "global_step": 111611, "epoch": 2657} {"train_loss": -6.379181861877441, "global_step": 111612, "epoch": 2657} {"train_loss": -6.502083778381348, "global_step": 111613, "epoch": 2657} {"train_loss": -6.465483665466309, "global_step": 111614, "epoch": 2657} {"train_loss": -6.65031623840332, "global_step": 111615, "epoch": 2657} {"train_loss": -6.532981872558594, "global_step": 111616, "epoch": 2657} {"train_loss": -6.561679840087891, "global_step": 111617, "epoch": 2657} {"train_loss": -6.493529796600342, "global_step": 111618, "epoch": 2657} {"train_loss": -6.612903594970703, "global_step": 111619, "epoch": 2657} {"train_loss": -6.545535087585449, "global_step": 111620, "epoch": 2657} {"train_loss": -6.569218635559082, "global_step": 111621, "epoch": 2657} {"train_loss": -6.508787155151367, "global_step": 111622, "epoch": 2657} {"train_loss": -6.433653354644775, "global_step": 111623, "epoch": 2657} {"train_loss": -6.422145366668701, "global_step": 111624, "epoch": 2657} {"train_loss": -6.436451435089111, "global_step": 111625, "epoch": 2657} {"train_loss": -6.57923698425293, "global_step": 111626, "epoch": 2657} {"train_loss": -6.492323875427246, "global_step": 111627, "epoch": 2657} {"train_loss": -6.607710838317871, "global_step": 111628, "epoch": 2657} {"train_loss": -6.461889743804932, "global_step": 111629, "epoch": 2657} {"train_loss": -6.4766845703125, "global_step": 111630, "epoch": 2657} {"train_loss": -6.53481388092041, "global_step": 111631, "epoch": 2657} {"train_loss": -6.472445964813232, "global_step": 111632, "epoch": 2657} {"train_loss": -6.465309143066406, "global_step": 111633, "epoch": 2657} {"train_loss": -6.424470901489258, "global_step": 111634, "epoch": 2657} {"train_loss": -6.507656301770892, "global_step": 111635, "epoch": 2657, "val_loss": 64932.7890625} {"train_loss": -6.633060455322266, "global_step": 111636, "epoch": 2658} {"train_loss": -6.534764289855957, "global_step": 111637, "epoch": 2658} {"train_loss": -6.51620626449585, "global_step": 111638, "epoch": 2658} {"train_loss": -6.572964668273926, "global_step": 111639, "epoch": 2658} {"train_loss": -6.339821815490723, "global_step": 111640, "epoch": 2658} {"train_loss": -6.375024795532227, "global_step": 111641, "epoch": 2658} {"train_loss": -6.481574058532715, "global_step": 111642, "epoch": 2658} {"train_loss": -6.509073257446289, "global_step": 111643, "epoch": 2658} {"train_loss": -6.498136520385742, "global_step": 111644, "epoch": 2658} {"train_loss": -6.443247318267822, "global_step": 111645, "epoch": 2658} {"train_loss": -6.520228385925293, "global_step": 111646, "epoch": 2658} {"train_loss": -6.441725254058838, "global_step": 111647, "epoch": 2658} {"train_loss": -6.460691452026367, "global_step": 111648, "epoch": 2658} {"train_loss": -6.504176139831543, "global_step": 111649, "epoch": 2658} {"train_loss": -6.54361629486084, "global_step": 111650, "epoch": 2658} {"train_loss": -6.476310729980469, "global_step": 111651, "epoch": 2658} {"train_loss": -6.521422863006592, "global_step": 111652, "epoch": 2658} {"train_loss": -6.453782081604004, "global_step": 111653, "epoch": 2658} {"train_loss": -6.436176776885986, "global_step": 111654, "epoch": 2658} {"train_loss": -6.341658592224121, "global_step": 111655, "epoch": 2658} {"train_loss": -6.391085624694824, "global_step": 111656, "epoch": 2658} {"train_loss": -6.362069606781006, "global_step": 111657, "epoch": 2658} {"train_loss": -6.266331672668457, "global_step": 111658, "epoch": 2658} {"train_loss": -6.415633201599121, "global_step": 111659, "epoch": 2658} {"train_loss": -6.410429954528809, "global_step": 111660, "epoch": 2658} {"train_loss": -6.463588714599609, "global_step": 111661, "epoch": 2658} {"train_loss": -6.523794174194336, "global_step": 111662, "epoch": 2658} {"train_loss": -6.459747314453125, "global_step": 111663, "epoch": 2658} {"train_loss": -6.485472679138184, "global_step": 111664, "epoch": 2658} {"train_loss": -6.443690299987793, "global_step": 111665, "epoch": 2658} {"train_loss": -6.514289855957031, "global_step": 111666, "epoch": 2658} {"train_loss": -6.437006950378418, "global_step": 111667, "epoch": 2658} {"train_loss": -6.4922027587890625, "global_step": 111668, "epoch": 2658} {"train_loss": -6.493313312530518, "global_step": 111669, "epoch": 2658} {"train_loss": -6.518692970275879, "global_step": 111670, "epoch": 2658} {"train_loss": -6.495473384857178, "global_step": 111671, "epoch": 2658} {"train_loss": -6.414588451385498, "global_step": 111672, "epoch": 2658} {"train_loss": -6.472677230834961, "global_step": 111673, "epoch": 2658} {"train_loss": -6.490269660949707, "global_step": 111674, "epoch": 2658} {"train_loss": -6.559433937072754, "global_step": 111675, "epoch": 2658} {"train_loss": -6.4478349685668945, "global_step": 111676, "epoch": 2658} {"train_loss": -6.468333607628232, "global_step": 111677, "epoch": 2658, "val_loss": 65218.74609375} {"train_loss": -6.446646213531494, "global_step": 111678, "epoch": 2659} {"train_loss": -6.496685028076172, "global_step": 111679, "epoch": 2659} {"train_loss": -6.511335372924805, "global_step": 111680, "epoch": 2659} {"train_loss": -6.367882251739502, "global_step": 111681, "epoch": 2659} {"train_loss": -6.575015068054199, "global_step": 111682, "epoch": 2659} {"train_loss": -6.465433120727539, "global_step": 111683, "epoch": 2659} {"train_loss": -6.495303153991699, "global_step": 111684, "epoch": 2659} {"train_loss": -6.532867431640625, "global_step": 111685, "epoch": 2659} {"train_loss": -6.506453037261963, "global_step": 111686, "epoch": 2659} {"train_loss": -6.533450603485107, "global_step": 111687, "epoch": 2659} {"train_loss": -6.437760353088379, "global_step": 111688, "epoch": 2659} {"train_loss": -6.519725799560547, "global_step": 111689, "epoch": 2659} {"train_loss": -6.484500885009766, "global_step": 111690, "epoch": 2659} {"train_loss": -6.408827781677246, "global_step": 111691, "epoch": 2659} {"train_loss": -6.546502113342285, "global_step": 111692, "epoch": 2659} {"train_loss": -6.564145088195801, "global_step": 111693, "epoch": 2659} {"train_loss": -6.434900283813477, "global_step": 111694, "epoch": 2659} {"train_loss": -6.528151512145996, "global_step": 111695, "epoch": 2659} {"train_loss": -6.479239463806152, "global_step": 111696, "epoch": 2659} {"train_loss": -6.483455657958984, "global_step": 111697, "epoch": 2659} {"train_loss": -6.576040267944336, "global_step": 111698, "epoch": 2659} {"train_loss": -6.485138416290283, "global_step": 111699, "epoch": 2659} {"train_loss": -6.510109901428223, "global_step": 111700, "epoch": 2659} {"train_loss": -6.437164306640625, "global_step": 111701, "epoch": 2659} {"train_loss": -6.378252029418945, "global_step": 111702, "epoch": 2659} {"train_loss": -6.432528495788574, "global_step": 111703, "epoch": 2659} {"train_loss": -6.483031749725342, "global_step": 111704, "epoch": 2659} {"train_loss": -6.390040874481201, "global_step": 111705, "epoch": 2659} {"train_loss": -6.484901428222656, "global_step": 111706, "epoch": 2659} {"train_loss": -6.441736698150635, "global_step": 111707, "epoch": 2659} {"train_loss": -6.467507362365723, "global_step": 111708, "epoch": 2659} {"train_loss": -6.576311111450195, "global_step": 111709, "epoch": 2659} {"train_loss": -6.486062526702881, "global_step": 111710, "epoch": 2659} {"train_loss": -6.528285980224609, "global_step": 111711, "epoch": 2659} {"train_loss": -6.4108991622924805, "global_step": 111712, "epoch": 2659} {"train_loss": -6.48999547958374, "global_step": 111713, "epoch": 2659} {"train_loss": -6.5097455978393555, "global_step": 111714, "epoch": 2659} {"train_loss": -6.345706939697266, "global_step": 111715, "epoch": 2659} {"train_loss": -6.464101791381836, "global_step": 111716, "epoch": 2659} {"train_loss": -6.464890956878662, "global_step": 111717, "epoch": 2659} {"train_loss": -6.509128570556641, "global_step": 111718, "epoch": 2659} {"train_loss": -6.4799010299500965, "global_step": 111719, "epoch": 2659, "val_loss": 65166.39453125} {"train_loss": -6.586031436920166, "global_step": 111720, "epoch": 2660} {"train_loss": -6.473739147186279, "global_step": 111721, "epoch": 2660} {"train_loss": -6.42502498626709, "global_step": 111722, "epoch": 2660} {"train_loss": -6.500912189483643, "global_step": 111723, "epoch": 2660} {"train_loss": -6.5256757736206055, "global_step": 111724, "epoch": 2660} {"train_loss": -6.525683879852295, "global_step": 111725, "epoch": 2660} {"train_loss": -6.523754119873047, "global_step": 111726, "epoch": 2660} {"train_loss": -6.485033988952637, "global_step": 111727, "epoch": 2660} {"train_loss": -6.449976444244385, "global_step": 111728, "epoch": 2660} {"train_loss": -6.31716251373291, "global_step": 111729, "epoch": 2660} {"train_loss": -6.476268291473389, "global_step": 111730, "epoch": 2660} {"train_loss": -6.492240905761719, "global_step": 111731, "epoch": 2660} {"train_loss": -6.449204444885254, "global_step": 111732, "epoch": 2660} {"train_loss": -6.527655601501465, "global_step": 111733, "epoch": 2660} {"train_loss": -6.441099643707275, "global_step": 111734, "epoch": 2660} {"train_loss": -6.555220127105713, "global_step": 111735, "epoch": 2660} {"train_loss": -6.4756550788879395, "global_step": 111736, "epoch": 2660} {"train_loss": -6.619366645812988, "global_step": 111737, "epoch": 2660} {"train_loss": -6.456357955932617, "global_step": 111738, "epoch": 2660} {"train_loss": -6.479363441467285, "global_step": 111739, "epoch": 2660} {"train_loss": -6.526148796081543, "global_step": 111740, "epoch": 2660} {"train_loss": -6.528965950012207, "global_step": 111741, "epoch": 2660} {"train_loss": -6.408493995666504, "global_step": 111742, "epoch": 2660} {"train_loss": -6.500876426696777, "global_step": 111743, "epoch": 2660} {"train_loss": -6.605401039123535, "global_step": 111744, "epoch": 2660} {"train_loss": -6.574063301086426, "global_step": 111745, "epoch": 2660} {"train_loss": -6.395882606506348, "global_step": 111746, "epoch": 2660} {"train_loss": -6.437857151031494, "global_step": 111747, "epoch": 2660} {"train_loss": -6.474747657775879, "global_step": 111748, "epoch": 2660} {"train_loss": -6.503391265869141, "global_step": 111749, "epoch": 2660} {"train_loss": -6.578114986419678, "global_step": 111750, "epoch": 2660} {"train_loss": -6.5940351486206055, "global_step": 111751, "epoch": 2660} {"train_loss": -6.4677886962890625, "global_step": 111752, "epoch": 2660} {"train_loss": -6.53038215637207, "global_step": 111753, "epoch": 2660} {"train_loss": -6.495664119720459, "global_step": 111754, "epoch": 2660} {"train_loss": -6.56883430480957, "global_step": 111755, "epoch": 2660} {"train_loss": -6.493272304534912, "global_step": 111756, "epoch": 2660} {"train_loss": -6.58671760559082, "global_step": 111757, "epoch": 2660} {"train_loss": -6.431042671203613, "global_step": 111758, "epoch": 2660} {"train_loss": -6.489424705505371, "global_step": 111759, "epoch": 2660} {"train_loss": -6.461574077606201, "global_step": 111760, "epoch": 2660} {"train_loss": -6.497606765656244, "global_step": 111761, "epoch": 2660, "val_loss": 65018.47265625} {"train_loss": -6.636580467224121, "global_step": 111762, "epoch": 2661} {"train_loss": -6.52458381652832, "global_step": 111763, "epoch": 2661} {"train_loss": -6.4438958168029785, "global_step": 111764, "epoch": 2661} {"train_loss": -6.478896141052246, "global_step": 111765, "epoch": 2661} {"train_loss": -6.505880355834961, "global_step": 111766, "epoch": 2661} {"train_loss": -6.423141002655029, "global_step": 111767, "epoch": 2661} {"train_loss": -6.43825626373291, "global_step": 111768, "epoch": 2661} {"train_loss": -6.499730110168457, "global_step": 111769, "epoch": 2661} {"train_loss": -6.5951313972473145, "global_step": 111770, "epoch": 2661} {"train_loss": -6.5067949295043945, "global_step": 111771, "epoch": 2661} {"train_loss": -6.697577476501465, "global_step": 111772, "epoch": 2661} {"train_loss": -6.579937934875488, "global_step": 111773, "epoch": 2661} {"train_loss": -6.450277328491211, "global_step": 111774, "epoch": 2661} {"train_loss": -6.616496562957764, "global_step": 111775, "epoch": 2661} {"train_loss": -6.3657073974609375, "global_step": 111776, "epoch": 2661} {"train_loss": -6.588961124420166, "global_step": 111777, "epoch": 2661} {"train_loss": -6.512373924255371, "global_step": 111778, "epoch": 2661} {"train_loss": -6.459898948669434, "global_step": 111779, "epoch": 2661} {"train_loss": -6.518692493438721, "global_step": 111780, "epoch": 2661} {"train_loss": -6.428842544555664, "global_step": 111781, "epoch": 2661} {"train_loss": -6.470888137817383, "global_step": 111782, "epoch": 2661} {"train_loss": -6.542860507965088, "global_step": 111783, "epoch": 2661} {"train_loss": -6.631702423095703, "global_step": 111784, "epoch": 2661} {"train_loss": -6.413336753845215, "global_step": 111785, "epoch": 2661} {"train_loss": -6.490387439727783, "global_step": 111786, "epoch": 2661} {"train_loss": -6.503040313720703, "global_step": 111787, "epoch": 2661} {"train_loss": -6.645142555236816, "global_step": 111788, "epoch": 2661} {"train_loss": -6.506083965301514, "global_step": 111789, "epoch": 2661} {"train_loss": -6.588509559631348, "global_step": 111790, "epoch": 2661} {"train_loss": -6.493488311767578, "global_step": 111791, "epoch": 2661} {"train_loss": -6.457294464111328, "global_step": 111792, "epoch": 2661} {"train_loss": -6.493579864501953, "global_step": 111793, "epoch": 2661} {"train_loss": -6.443447113037109, "global_step": 111794, "epoch": 2661} {"train_loss": -6.398107051849365, "global_step": 111795, "epoch": 2661} {"train_loss": -6.541351318359375, "global_step": 111796, "epoch": 2661} {"train_loss": -6.360352516174316, "global_step": 111797, "epoch": 2661} {"train_loss": -6.453153610229492, "global_step": 111798, "epoch": 2661} {"train_loss": -6.701038360595703, "global_step": 111799, "epoch": 2661} {"train_loss": -6.262585163116455, "global_step": 111800, "epoch": 2661} {"train_loss": -6.31735897064209, "global_step": 111801, "epoch": 2661} {"train_loss": -6.545353889465332, "global_step": 111802, "epoch": 2661} {"train_loss": -6.496485358192807, "global_step": 111803, "epoch": 2661, "val_loss": 65165.92578125} {"train_loss": -6.591483116149902, "global_step": 111804, "epoch": 2662} {"train_loss": -6.387192726135254, "global_step": 111805, "epoch": 2662} {"train_loss": -6.488302230834961, "global_step": 111806, "epoch": 2662} {"train_loss": -6.539134979248047, "global_step": 111807, "epoch": 2662} {"train_loss": -6.521429538726807, "global_step": 111808, "epoch": 2662} {"train_loss": -6.392185211181641, "global_step": 111809, "epoch": 2662} {"train_loss": -6.520740509033203, "global_step": 111810, "epoch": 2662} {"train_loss": -6.43073844909668, "global_step": 111811, "epoch": 2662} {"train_loss": -6.388591766357422, "global_step": 111812, "epoch": 2662} {"train_loss": -6.576576232910156, "global_step": 111813, "epoch": 2662} {"train_loss": -6.522843360900879, "global_step": 111814, "epoch": 2662} {"train_loss": -6.597765922546387, "global_step": 111815, "epoch": 2662} {"train_loss": -6.434381008148193, "global_step": 111816, "epoch": 2662} {"train_loss": -6.5819597244262695, "global_step": 111817, "epoch": 2662} {"train_loss": -6.509990215301514, "global_step": 111818, "epoch": 2662} {"train_loss": -6.403730869293213, "global_step": 111819, "epoch": 2662} {"train_loss": -6.583339214324951, "global_step": 111820, "epoch": 2662} {"train_loss": -6.476413726806641, "global_step": 111821, "epoch": 2662} {"train_loss": -6.487040042877197, "global_step": 111822, "epoch": 2662} {"train_loss": -6.5190324783325195, "global_step": 111823, "epoch": 2662} {"train_loss": -6.439972877502441, "global_step": 111824, "epoch": 2662} {"train_loss": -6.5444488525390625, "global_step": 111825, "epoch": 2662} {"train_loss": -6.558987617492676, "global_step": 111826, "epoch": 2662} {"train_loss": -6.557010650634766, "global_step": 111827, "epoch": 2662} {"train_loss": -6.4822235107421875, "global_step": 111828, "epoch": 2662} {"train_loss": -6.526519775390625, "global_step": 111829, "epoch": 2662} {"train_loss": -6.491249084472656, "global_step": 111830, "epoch": 2662} {"train_loss": -6.404783725738525, "global_step": 111831, "epoch": 2662} {"train_loss": -6.604569911956787, "global_step": 111832, "epoch": 2662} {"train_loss": -6.4446821212768555, "global_step": 111833, "epoch": 2662} {"train_loss": -6.404772758483887, "global_step": 111834, "epoch": 2662} {"train_loss": -6.435654163360596, "global_step": 111835, "epoch": 2662} {"train_loss": -6.6591033935546875, "global_step": 111836, "epoch": 2662} {"train_loss": -6.532624244689941, "global_step": 111837, "epoch": 2662} {"train_loss": -6.446440696716309, "global_step": 111838, "epoch": 2662} {"train_loss": -6.471978187561035, "global_step": 111839, "epoch": 2662} {"train_loss": -6.4108567237854, "global_step": 111840, "epoch": 2662} {"train_loss": -6.3834075927734375, "global_step": 111841, "epoch": 2662} {"train_loss": -6.446847915649414, "global_step": 111842, "epoch": 2662} {"train_loss": -6.408506393432617, "global_step": 111843, "epoch": 2662} {"train_loss": -6.52784538269043, "global_step": 111844, "epoch": 2662} {"train_loss": -6.493402310780117, "global_step": 111845, "epoch": 2662, "val_loss": 65244.07421875} {"train_loss": -6.359522342681885, "global_step": 111846, "epoch": 2663} {"train_loss": -6.586182594299316, "global_step": 111847, "epoch": 2663} {"train_loss": -6.494395732879639, "global_step": 111848, "epoch": 2663} {"train_loss": -6.467187881469727, "global_step": 111849, "epoch": 2663} {"train_loss": -6.593038558959961, "global_step": 111850, "epoch": 2663} {"train_loss": -6.505829811096191, "global_step": 111851, "epoch": 2663} {"train_loss": -6.568284511566162, "global_step": 111852, "epoch": 2663} {"train_loss": -6.538674354553223, "global_step": 111853, "epoch": 2663} {"train_loss": -6.54064416885376, "global_step": 111854, "epoch": 2663} {"train_loss": -6.504927158355713, "global_step": 111855, "epoch": 2663} {"train_loss": -6.574390411376953, "global_step": 111856, "epoch": 2663} {"train_loss": -6.516752243041992, "global_step": 111857, "epoch": 2663} {"train_loss": -6.573504447937012, "global_step": 111858, "epoch": 2663} {"train_loss": -6.501240253448486, "global_step": 111859, "epoch": 2663} {"train_loss": -6.581907272338867, "global_step": 111860, "epoch": 2663} {"train_loss": -6.499882698059082, "global_step": 111861, "epoch": 2663} {"train_loss": -6.59022331237793, "global_step": 111862, "epoch": 2663} {"train_loss": -6.580499649047852, "global_step": 111863, "epoch": 2663} {"train_loss": -6.477140426635742, "global_step": 111864, "epoch": 2663} {"train_loss": -6.599955081939697, "global_step": 111865, "epoch": 2663} {"train_loss": -6.605983734130859, "global_step": 111866, "epoch": 2663} {"train_loss": -6.4715118408203125, "global_step": 111867, "epoch": 2663} {"train_loss": -6.425060272216797, "global_step": 111868, "epoch": 2663} {"train_loss": -6.463685035705566, "global_step": 111869, "epoch": 2663} {"train_loss": -6.551362991333008, "global_step": 111870, "epoch": 2663} {"train_loss": -6.5983195304870605, "global_step": 111871, "epoch": 2663} {"train_loss": -6.395090579986572, "global_step": 111872, "epoch": 2663} {"train_loss": -6.491969585418701, "global_step": 111873, "epoch": 2663} {"train_loss": -6.575553894042969, "global_step": 111874, "epoch": 2663} {"train_loss": -6.432226181030273, "global_step": 111875, "epoch": 2663} {"train_loss": -6.597855567932129, "global_step": 111876, "epoch": 2663} {"train_loss": -6.5547709465026855, "global_step": 111877, "epoch": 2663} {"train_loss": -6.58098030090332, "global_step": 111878, "epoch": 2663} {"train_loss": -6.497649192810059, "global_step": 111879, "epoch": 2663} {"train_loss": -6.422204494476318, "global_step": 111880, "epoch": 2663} {"train_loss": -6.533969879150391, "global_step": 111881, "epoch": 2663} {"train_loss": -6.442468643188477, "global_step": 111882, "epoch": 2663} {"train_loss": -6.505472660064697, "global_step": 111883, "epoch": 2663} {"train_loss": -6.419074535369873, "global_step": 111884, "epoch": 2663} {"train_loss": -6.487719535827637, "global_step": 111885, "epoch": 2663} {"train_loss": -6.564420223236084, "global_step": 111886, "epoch": 2663} {"train_loss": -6.517703430993216, "global_step": 111887, "epoch": 2663, "val_loss": 65065.89453125} {"train_loss": -6.578883171081543, "global_step": 111888, "epoch": 2664} {"train_loss": -6.490149974822998, "global_step": 111889, "epoch": 2664} {"train_loss": -6.432374000549316, "global_step": 111890, "epoch": 2664} {"train_loss": -6.599521160125732, "global_step": 111891, "epoch": 2664} {"train_loss": -6.451422214508057, "global_step": 111892, "epoch": 2664} {"train_loss": -6.485870361328125, "global_step": 111893, "epoch": 2664} {"train_loss": -6.458312034606934, "global_step": 111894, "epoch": 2664} {"train_loss": -6.423415184020996, "global_step": 111895, "epoch": 2664} {"train_loss": -6.517841339111328, "global_step": 111896, "epoch": 2664} {"train_loss": -6.576811790466309, "global_step": 111897, "epoch": 2664} {"train_loss": -6.490262031555176, "global_step": 111898, "epoch": 2664} {"train_loss": -6.519144058227539, "global_step": 111899, "epoch": 2664} {"train_loss": -6.42362117767334, "global_step": 111900, "epoch": 2664} {"train_loss": -6.42547607421875, "global_step": 111901, "epoch": 2664} {"train_loss": -6.535243034362793, "global_step": 111902, "epoch": 2664} {"train_loss": -6.671726226806641, "global_step": 111903, "epoch": 2664} {"train_loss": -6.587899684906006, "global_step": 111904, "epoch": 2664} {"train_loss": -6.555214881896973, "global_step": 111905, "epoch": 2664} {"train_loss": -6.632530212402344, "global_step": 111906, "epoch": 2664} {"train_loss": -6.509463310241699, "global_step": 111907, "epoch": 2664} {"train_loss": -6.503376007080078, "global_step": 111908, "epoch": 2664} {"train_loss": -6.6377058029174805, "global_step": 111909, "epoch": 2664} {"train_loss": -6.639464378356934, "global_step": 111910, "epoch": 2664} {"train_loss": -6.511804580688477, "global_step": 111911, "epoch": 2664} {"train_loss": -6.519774913787842, "global_step": 111912, "epoch": 2664} {"train_loss": -6.4045867919921875, "global_step": 111913, "epoch": 2664} {"train_loss": -6.366460800170898, "global_step": 111914, "epoch": 2664} {"train_loss": -6.386868476867676, "global_step": 111915, "epoch": 2664} {"train_loss": -6.446791648864746, "global_step": 111916, "epoch": 2664} {"train_loss": -6.590278625488281, "global_step": 111917, "epoch": 2664} {"train_loss": -6.5499467849731445, "global_step": 111918, "epoch": 2664} {"train_loss": -6.446813106536865, "global_step": 111919, "epoch": 2664} {"train_loss": -6.4685869216918945, "global_step": 111920, "epoch": 2664} {"train_loss": -6.483956813812256, "global_step": 111921, "epoch": 2664} {"train_loss": -6.478919982910156, "global_step": 111922, "epoch": 2664} {"train_loss": -6.5193610191345215, "global_step": 111923, "epoch": 2664} {"train_loss": -6.391712188720703, "global_step": 111924, "epoch": 2664} {"train_loss": -6.4420623779296875, "global_step": 111925, "epoch": 2664} {"train_loss": -6.475449085235596, "global_step": 111926, "epoch": 2664} {"train_loss": -6.3954243659973145, "global_step": 111927, "epoch": 2664} {"train_loss": -6.477565765380859, "global_step": 111928, "epoch": 2664} {"train_loss": -6.499835843131656, "global_step": 111929, "epoch": 2664, "val_loss": 65033.10546875} {"train_loss": -6.477530479431152, "global_step": 111930, "epoch": 2665} {"train_loss": -6.574048042297363, "global_step": 111931, "epoch": 2665} {"train_loss": -6.526622295379639, "global_step": 111932, "epoch": 2665} {"train_loss": -6.509435653686523, "global_step": 111933, "epoch": 2665} {"train_loss": -6.445866107940674, "global_step": 111934, "epoch": 2665} {"train_loss": -6.466072082519531, "global_step": 111935, "epoch": 2665} {"train_loss": -6.511582374572754, "global_step": 111936, "epoch": 2665} {"train_loss": -6.601117134094238, "global_step": 111937, "epoch": 2665} {"train_loss": -6.4789228439331055, "global_step": 111938, "epoch": 2665} {"train_loss": -6.503389358520508, "global_step": 111939, "epoch": 2665} {"train_loss": -6.447812557220459, "global_step": 111940, "epoch": 2665} {"train_loss": -6.443241119384766, "global_step": 111941, "epoch": 2665} {"train_loss": -6.576513290405273, "global_step": 111942, "epoch": 2665} {"train_loss": -6.594560623168945, "global_step": 111943, "epoch": 2665} {"train_loss": -6.364442825317383, "global_step": 111944, "epoch": 2665} {"train_loss": -6.536612510681152, "global_step": 111945, "epoch": 2665} {"train_loss": -6.422706604003906, "global_step": 111946, "epoch": 2665} {"train_loss": -6.554883003234863, "global_step": 111947, "epoch": 2665} {"train_loss": -6.643327713012695, "global_step": 111948, "epoch": 2665} {"train_loss": -6.5565290451049805, "global_step": 111949, "epoch": 2665} {"train_loss": -6.413608074188232, "global_step": 111950, "epoch": 2665} {"train_loss": -6.509716033935547, "global_step": 111951, "epoch": 2665} {"train_loss": -6.542357921600342, "global_step": 111952, "epoch": 2665} {"train_loss": -6.475657939910889, "global_step": 111953, "epoch": 2665} {"train_loss": -6.562906265258789, "global_step": 111954, "epoch": 2665} {"train_loss": -6.509836196899414, "global_step": 111955, "epoch": 2665} {"train_loss": -6.491349697113037, "global_step": 111956, "epoch": 2665} {"train_loss": -6.510098457336426, "global_step": 111957, "epoch": 2665} {"train_loss": -6.4061279296875, "global_step": 111958, "epoch": 2665} {"train_loss": -6.460037708282471, "global_step": 111959, "epoch": 2665} {"train_loss": -6.549865245819092, "global_step": 111960, "epoch": 2665} {"train_loss": -6.497246265411377, "global_step": 111961, "epoch": 2665} {"train_loss": -6.417891502380371, "global_step": 111962, "epoch": 2665} {"train_loss": -6.495708465576172, "global_step": 111963, "epoch": 2665} {"train_loss": -6.371565341949463, "global_step": 111964, "epoch": 2665} {"train_loss": -6.371009826660156, "global_step": 111965, "epoch": 2665} {"train_loss": -6.5129499435424805, "global_step": 111966, "epoch": 2665} {"train_loss": -6.529773712158203, "global_step": 111967, "epoch": 2665} {"train_loss": -6.352029323577881, "global_step": 111968, "epoch": 2665} {"train_loss": -6.594536781311035, "global_step": 111969, "epoch": 2665} {"train_loss": -6.428008079528809, "global_step": 111970, "epoch": 2665} {"train_loss": -6.489523467563448, "global_step": 111971, "epoch": 2665, "val_loss": 65127.78125} {"train_loss": -6.518895149230957, "global_step": 111972, "epoch": 2666} {"train_loss": -6.446763515472412, "global_step": 111973, "epoch": 2666} {"train_loss": -6.451446056365967, "global_step": 111974, "epoch": 2666} {"train_loss": -6.417236328125, "global_step": 111975, "epoch": 2666} {"train_loss": -6.4948344230651855, "global_step": 111976, "epoch": 2666} {"train_loss": -6.41420841217041, "global_step": 111977, "epoch": 2666} {"train_loss": -6.418981075286865, "global_step": 111978, "epoch": 2666} {"train_loss": -6.490583896636963, "global_step": 111979, "epoch": 2666} {"train_loss": -6.397664546966553, "global_step": 111980, "epoch": 2666} {"train_loss": -6.569701194763184, "global_step": 111981, "epoch": 2666} {"train_loss": -6.379640579223633, "global_step": 111982, "epoch": 2666} {"train_loss": -6.588292121887207, "global_step": 111983, "epoch": 2666} {"train_loss": -6.526050567626953, "global_step": 111984, "epoch": 2666} {"train_loss": -6.424500942230225, "global_step": 111985, "epoch": 2666} {"train_loss": -6.526467323303223, "global_step": 111986, "epoch": 2666} {"train_loss": -6.429856300354004, "global_step": 111987, "epoch": 2666} {"train_loss": -6.4641194343566895, "global_step": 111988, "epoch": 2666} {"train_loss": -6.476465702056885, "global_step": 111989, "epoch": 2666} {"train_loss": -6.442155838012695, "global_step": 111990, "epoch": 2666} {"train_loss": -6.526860237121582, "global_step": 111991, "epoch": 2666} {"train_loss": -6.488979339599609, "global_step": 111992, "epoch": 2666} {"train_loss": -6.507610321044922, "global_step": 111993, "epoch": 2666} {"train_loss": -6.521991729736328, "global_step": 111994, "epoch": 2666} {"train_loss": -6.39107084274292, "global_step": 111995, "epoch": 2666} {"train_loss": -6.465747356414795, "global_step": 111996, "epoch": 2666} {"train_loss": -6.5193634033203125, "global_step": 111997, "epoch": 2666} {"train_loss": -6.499356746673584, "global_step": 111998, "epoch": 2666} {"train_loss": -6.590193271636963, "global_step": 111999, "epoch": 2666} {"train_loss": -6.572360992431641, "global_step": 112000, "epoch": 2666} {"train_loss": -6.4990081787109375, "global_step": 112001, "epoch": 2666} {"train_loss": -6.5623979568481445, "global_step": 112002, "epoch": 2666} {"train_loss": -6.583622455596924, "global_step": 112003, "epoch": 2666} {"train_loss": -6.531711578369141, "global_step": 112004, "epoch": 2666} {"train_loss": -6.522784233093262, "global_step": 112005, "epoch": 2666} {"train_loss": -6.593413352966309, "global_step": 112006, "epoch": 2666} {"train_loss": -6.502196788787842, "global_step": 112007, "epoch": 2666} {"train_loss": -6.47961950302124, "global_step": 112008, "epoch": 2666} {"train_loss": -6.438337802886963, "global_step": 112009, "epoch": 2666} {"train_loss": -6.578672409057617, "global_step": 112010, "epoch": 2666} {"train_loss": -6.446244239807129, "global_step": 112011, "epoch": 2666} {"train_loss": -6.554154396057129, "global_step": 112012, "epoch": 2666} {"train_loss": -6.491390773228237, "global_step": 112013, "epoch": 2666, "val_loss": 65089.33984375} {"train_loss": -6.527464389801025, "global_step": 112014, "epoch": 2667} {"train_loss": -6.4267191886901855, "global_step": 112015, "epoch": 2667} {"train_loss": -6.420755386352539, "global_step": 112016, "epoch": 2667} {"train_loss": -6.529597282409668, "global_step": 112017, "epoch": 2667} {"train_loss": -6.462165832519531, "global_step": 112018, "epoch": 2667} {"train_loss": -6.4859843254089355, "global_step": 112019, "epoch": 2667} {"train_loss": -6.417350769042969, "global_step": 112020, "epoch": 2667} {"train_loss": -6.540499687194824, "global_step": 112021, "epoch": 2667} {"train_loss": -6.498472213745117, "global_step": 112022, "epoch": 2667} {"train_loss": -6.513335227966309, "global_step": 112023, "epoch": 2667} {"train_loss": -6.465519428253174, "global_step": 112024, "epoch": 2667} {"train_loss": -6.580989837646484, "global_step": 112025, "epoch": 2667} {"train_loss": -6.421233654022217, "global_step": 112026, "epoch": 2667} {"train_loss": -6.522796630859375, "global_step": 112027, "epoch": 2667} {"train_loss": -6.510701656341553, "global_step": 112028, "epoch": 2667} {"train_loss": -6.391500473022461, "global_step": 112029, "epoch": 2667} {"train_loss": -6.551297187805176, "global_step": 112030, "epoch": 2667} {"train_loss": -6.5432586669921875, "global_step": 112031, "epoch": 2667} {"train_loss": -6.384579658508301, "global_step": 112032, "epoch": 2667} {"train_loss": -6.558318138122559, "global_step": 112033, "epoch": 2667} {"train_loss": -6.534870147705078, "global_step": 112034, "epoch": 2667} {"train_loss": -6.505551338195801, "global_step": 112035, "epoch": 2667} {"train_loss": -6.4457244873046875, "global_step": 112036, "epoch": 2667} {"train_loss": -6.500489234924316, "global_step": 112037, "epoch": 2667} {"train_loss": -6.570690631866455, "global_step": 112038, "epoch": 2667} {"train_loss": -6.556734085083008, "global_step": 112039, "epoch": 2667} {"train_loss": -6.574582576751709, "global_step": 112040, "epoch": 2667} {"train_loss": -6.434600830078125, "global_step": 112041, "epoch": 2667} {"train_loss": -6.622985363006592, "global_step": 112042, "epoch": 2667} {"train_loss": -6.4727325439453125, "global_step": 112043, "epoch": 2667} {"train_loss": -6.426743984222412, "global_step": 112044, "epoch": 2667} {"train_loss": -6.521755218505859, "global_step": 112045, "epoch": 2667} {"train_loss": -6.491372108459473, "global_step": 112046, "epoch": 2667} {"train_loss": -6.399155616760254, "global_step": 112047, "epoch": 2667} {"train_loss": -6.466477394104004, "global_step": 112048, "epoch": 2667} {"train_loss": -6.555258274078369, "global_step": 112049, "epoch": 2667} {"train_loss": -6.427090644836426, "global_step": 112050, "epoch": 2667} {"train_loss": -6.552407264709473, "global_step": 112051, "epoch": 2667} {"train_loss": -6.658731460571289, "global_step": 112052, "epoch": 2667} {"train_loss": -6.516767501831055, "global_step": 112053, "epoch": 2667} {"train_loss": -6.466927528381348, "global_step": 112054, "epoch": 2667} {"train_loss": -6.497940812792097, "global_step": 112055, "epoch": 2667, "val_loss": 65128.51953125} {"train_loss": -6.598250389099121, "global_step": 112056, "epoch": 2668} {"train_loss": -6.518156051635742, "global_step": 112057, "epoch": 2668} {"train_loss": -6.502966403961182, "global_step": 112058, "epoch": 2668} {"train_loss": -6.506920337677002, "global_step": 112059, "epoch": 2668} {"train_loss": -6.400084018707275, "global_step": 112060, "epoch": 2668} {"train_loss": -6.572150230407715, "global_step": 112061, "epoch": 2668} {"train_loss": -6.352225303649902, "global_step": 112062, "epoch": 2668} {"train_loss": -6.2303032875061035, "global_step": 112063, "epoch": 2668} {"train_loss": -6.465094566345215, "global_step": 112064, "epoch": 2668} {"train_loss": -6.42630672454834, "global_step": 112065, "epoch": 2668} {"train_loss": -6.333575248718262, "global_step": 112066, "epoch": 2668} {"train_loss": -6.38603401184082, "global_step": 112067, "epoch": 2668} {"train_loss": -6.409186840057373, "global_step": 112068, "epoch": 2668} {"train_loss": -6.369536399841309, "global_step": 112069, "epoch": 2668} {"train_loss": -6.294773101806641, "global_step": 112070, "epoch": 2668} {"train_loss": -6.3978962898254395, "global_step": 112071, "epoch": 2668} {"train_loss": -6.298280715942383, "global_step": 112072, "epoch": 2668} {"train_loss": -6.41609001159668, "global_step": 112073, "epoch": 2668} {"train_loss": -6.362238883972168, "global_step": 112074, "epoch": 2668} {"train_loss": -6.3452582359313965, "global_step": 112075, "epoch": 2668} {"train_loss": -6.365607738494873, "global_step": 112076, "epoch": 2668} {"train_loss": -6.515326023101807, "global_step": 112077, "epoch": 2668} {"train_loss": -6.426482677459717, "global_step": 112078, "epoch": 2668} {"train_loss": -6.486370086669922, "global_step": 112079, "epoch": 2668} {"train_loss": -6.538643836975098, "global_step": 112080, "epoch": 2668} {"train_loss": -6.460580825805664, "global_step": 112081, "epoch": 2668} {"train_loss": -6.470974922180176, "global_step": 112082, "epoch": 2668} {"train_loss": -6.424774169921875, "global_step": 112083, "epoch": 2668} {"train_loss": -6.459012508392334, "global_step": 112084, "epoch": 2668} {"train_loss": -6.426761150360107, "global_step": 112085, "epoch": 2668} {"train_loss": -6.4913859367370605, "global_step": 112086, "epoch": 2668} {"train_loss": -6.421490669250488, "global_step": 112087, "epoch": 2668} {"train_loss": -6.499471664428711, "global_step": 112088, "epoch": 2668} {"train_loss": -6.470152854919434, "global_step": 112089, "epoch": 2668} {"train_loss": -6.402711868286133, "global_step": 112090, "epoch": 2668} {"train_loss": -6.604310035705566, "global_step": 112091, "epoch": 2668} {"train_loss": -6.437241554260254, "global_step": 112092, "epoch": 2668} {"train_loss": -6.484536170959473, "global_step": 112093, "epoch": 2668} {"train_loss": -6.501062870025635, "global_step": 112094, "epoch": 2668} {"train_loss": -6.439958572387695, "global_step": 112095, "epoch": 2668} {"train_loss": -6.467337608337402, "global_step": 112096, "epoch": 2668} {"train_loss": -6.440790846234276, "global_step": 112097, "epoch": 2668, "val_loss": 65156.37890625} {"train_loss": -6.474791049957275, "global_step": 112098, "epoch": 2669} {"train_loss": -6.354445457458496, "global_step": 112099, "epoch": 2669} {"train_loss": -6.478529453277588, "global_step": 112100, "epoch": 2669} {"train_loss": -6.360012054443359, "global_step": 112101, "epoch": 2669} {"train_loss": -6.417654991149902, "global_step": 112102, "epoch": 2669} {"train_loss": -6.543709754943848, "global_step": 112103, "epoch": 2669} {"train_loss": -6.468586444854736, "global_step": 112104, "epoch": 2669} {"train_loss": -6.378411293029785, "global_step": 112105, "epoch": 2669} {"train_loss": -6.464716911315918, "global_step": 112106, "epoch": 2669} {"train_loss": -6.382684230804443, "global_step": 112107, "epoch": 2669} {"train_loss": -6.502486705780029, "global_step": 112108, "epoch": 2669} {"train_loss": -6.286581993103027, "global_step": 112109, "epoch": 2669} {"train_loss": -6.385225296020508, "global_step": 112110, "epoch": 2669} {"train_loss": -6.486847400665283, "global_step": 112111, "epoch": 2669} {"train_loss": -6.298893928527832, "global_step": 112112, "epoch": 2669} {"train_loss": -6.492623329162598, "global_step": 112113, "epoch": 2669} {"train_loss": -6.426150321960449, "global_step": 112114, "epoch": 2669} {"train_loss": -6.473274230957031, "global_step": 112115, "epoch": 2669} {"train_loss": -6.288697242736816, "global_step": 112116, "epoch": 2669} {"train_loss": -6.412093639373779, "global_step": 112117, "epoch": 2669} {"train_loss": -6.2940449714660645, "global_step": 112118, "epoch": 2669} {"train_loss": -6.356390953063965, "global_step": 112119, "epoch": 2669} {"train_loss": -6.363171100616455, "global_step": 112120, "epoch": 2669} {"train_loss": -6.442905902862549, "global_step": 112121, "epoch": 2669} {"train_loss": -6.449298858642578, "global_step": 112122, "epoch": 2669} {"train_loss": -6.5116472244262695, "global_step": 112123, "epoch": 2669} {"train_loss": -6.556632041931152, "global_step": 112124, "epoch": 2669} {"train_loss": -6.512866020202637, "global_step": 112125, "epoch": 2669} {"train_loss": -6.4755859375, "global_step": 112126, "epoch": 2669} {"train_loss": -6.567914009094238, "global_step": 112127, "epoch": 2669} {"train_loss": -6.56645393371582, "global_step": 112128, "epoch": 2669} {"train_loss": -6.622491359710693, "global_step": 112129, "epoch": 2669} {"train_loss": -6.521783828735352, "global_step": 112130, "epoch": 2669} {"train_loss": -6.565501689910889, "global_step": 112131, "epoch": 2669} {"train_loss": -6.518025875091553, "global_step": 112132, "epoch": 2669} {"train_loss": -6.586519241333008, "global_step": 112133, "epoch": 2669} {"train_loss": -6.5906171798706055, "global_step": 112134, "epoch": 2669} {"train_loss": -6.424266815185547, "global_step": 112135, "epoch": 2669} {"train_loss": -6.524816513061523, "global_step": 112136, "epoch": 2669} {"train_loss": -6.564484596252441, "global_step": 112137, "epoch": 2669} {"train_loss": -6.492547512054443, "global_step": 112138, "epoch": 2669} {"train_loss": -6.462597086316063, "global_step": 112139, "epoch": 2669, "val_loss": 65101.87109375} {"train_loss": -6.580893516540527, "global_step": 112140, "epoch": 2670} {"train_loss": -6.47518253326416, "global_step": 112141, "epoch": 2670} {"train_loss": -6.436080455780029, "global_step": 112142, "epoch": 2670} {"train_loss": -6.5215277671813965, "global_step": 112143, "epoch": 2670} {"train_loss": -6.504578113555908, "global_step": 112144, "epoch": 2670} {"train_loss": -6.5209503173828125, "global_step": 112145, "epoch": 2670} {"train_loss": -6.571494102478027, "global_step": 112146, "epoch": 2670} {"train_loss": -6.51409387588501, "global_step": 112147, "epoch": 2670} {"train_loss": -6.512929439544678, "global_step": 112148, "epoch": 2670} {"train_loss": -6.594735145568848, "global_step": 112149, "epoch": 2670} {"train_loss": -6.501389503479004, "global_step": 112150, "epoch": 2670} {"train_loss": -6.536245346069336, "global_step": 112151, "epoch": 2670} {"train_loss": -6.58908224105835, "global_step": 112152, "epoch": 2670} {"train_loss": -6.5034027099609375, "global_step": 112153, "epoch": 2670} {"train_loss": -6.578133583068848, "global_step": 112154, "epoch": 2670} {"train_loss": -6.488946914672852, "global_step": 112155, "epoch": 2670} {"train_loss": -6.522989273071289, "global_step": 112156, "epoch": 2670} {"train_loss": -6.507546424865723, "global_step": 112157, "epoch": 2670} {"train_loss": -6.528240203857422, "global_step": 112158, "epoch": 2670} {"train_loss": -6.594548225402832, "global_step": 112159, "epoch": 2670} {"train_loss": -6.6300554275512695, "global_step": 112160, "epoch": 2670} {"train_loss": -6.533182144165039, "global_step": 112161, "epoch": 2670} {"train_loss": -6.544906139373779, "global_step": 112162, "epoch": 2670} {"train_loss": -6.53732442855835, "global_step": 112163, "epoch": 2670} {"train_loss": -6.472648620605469, "global_step": 112164, "epoch": 2670} {"train_loss": -6.515844345092773, "global_step": 112165, "epoch": 2670} {"train_loss": -6.594823837280273, "global_step": 112166, "epoch": 2670} {"train_loss": -6.392685890197754, "global_step": 112167, "epoch": 2670} {"train_loss": -6.532657623291016, "global_step": 112168, "epoch": 2670} {"train_loss": -6.501226425170898, "global_step": 112169, "epoch": 2670} {"train_loss": -6.510693550109863, "global_step": 112170, "epoch": 2670} {"train_loss": -6.587480545043945, "global_step": 112171, "epoch": 2670} {"train_loss": -6.340662002563477, "global_step": 112172, "epoch": 2670} {"train_loss": -6.609166622161865, "global_step": 112173, "epoch": 2670} {"train_loss": -6.419034004211426, "global_step": 112174, "epoch": 2670} {"train_loss": -6.35272216796875, "global_step": 112175, "epoch": 2670} {"train_loss": -6.400567531585693, "global_step": 112176, "epoch": 2670} {"train_loss": -6.3427300453186035, "global_step": 112177, "epoch": 2670} {"train_loss": -6.4929375648498535, "global_step": 112178, "epoch": 2670} {"train_loss": -6.294180870056152, "global_step": 112179, "epoch": 2670} {"train_loss": -6.182038307189941, "global_step": 112180, "epoch": 2670} {"train_loss": -6.49672532081604, "global_step": 112181, "epoch": 2670, "val_loss": 65241.69921875} {"train_loss": -6.349251747131348, "global_step": 112182, "epoch": 2671} {"train_loss": -6.405251502990723, "global_step": 112183, "epoch": 2671} {"train_loss": -6.407033443450928, "global_step": 112184, "epoch": 2671} {"train_loss": -6.397665977478027, "global_step": 112185, "epoch": 2671} {"train_loss": -6.349615573883057, "global_step": 112186, "epoch": 2671} {"train_loss": -6.245914459228516, "global_step": 112187, "epoch": 2671} {"train_loss": -6.518929958343506, "global_step": 112188, "epoch": 2671} {"train_loss": -6.541513919830322, "global_step": 112189, "epoch": 2671} {"train_loss": -6.357553958892822, "global_step": 112190, "epoch": 2671} {"train_loss": -6.468240261077881, "global_step": 112191, "epoch": 2671} {"train_loss": -6.423752784729004, "global_step": 112192, "epoch": 2671} {"train_loss": -6.349510192871094, "global_step": 112193, "epoch": 2671} {"train_loss": -6.4382476806640625, "global_step": 112194, "epoch": 2671} {"train_loss": -6.424013137817383, "global_step": 112195, "epoch": 2671} {"train_loss": -6.561104774475098, "global_step": 112196, "epoch": 2671} {"train_loss": -6.421142578125, "global_step": 112197, "epoch": 2671} {"train_loss": -6.482028961181641, "global_step": 112198, "epoch": 2671} {"train_loss": -6.569766044616699, "global_step": 112199, "epoch": 2671} {"train_loss": -6.502365589141846, "global_step": 112200, "epoch": 2671} {"train_loss": -6.478174209594727, "global_step": 112201, "epoch": 2671} {"train_loss": -6.571159362792969, "global_step": 112202, "epoch": 2671} {"train_loss": -6.587725639343262, "global_step": 112203, "epoch": 2671} {"train_loss": -6.503544807434082, "global_step": 112204, "epoch": 2671} {"train_loss": -6.393985748291016, "global_step": 112205, "epoch": 2671} {"train_loss": -6.574531078338623, "global_step": 112206, "epoch": 2671} {"train_loss": -6.470461368560791, "global_step": 112207, "epoch": 2671} {"train_loss": -6.472242832183838, "global_step": 112208, "epoch": 2671} {"train_loss": -6.460213661193848, "global_step": 112209, "epoch": 2671} {"train_loss": -6.564809799194336, "global_step": 112210, "epoch": 2671} {"train_loss": -6.544705390930176, "global_step": 112211, "epoch": 2671} {"train_loss": -6.412785530090332, "global_step": 112212, "epoch": 2671} {"train_loss": -6.540469169616699, "global_step": 112213, "epoch": 2671} {"train_loss": -6.496750831604004, "global_step": 112214, "epoch": 2671} {"train_loss": -6.444975852966309, "global_step": 112215, "epoch": 2671} {"train_loss": -6.543647766113281, "global_step": 112216, "epoch": 2671} {"train_loss": -6.461015224456787, "global_step": 112217, "epoch": 2671} {"train_loss": -6.505496501922607, "global_step": 112218, "epoch": 2671} {"train_loss": -6.57059907913208, "global_step": 112219, "epoch": 2671} {"train_loss": -6.539593696594238, "global_step": 112220, "epoch": 2671} {"train_loss": -6.544948577880859, "global_step": 112221, "epoch": 2671} {"train_loss": -6.536466121673584, "global_step": 112222, "epoch": 2671} {"train_loss": -6.476637692678542, "global_step": 112223, "epoch": 2671, "val_loss": 65170.6875} {"train_loss": -6.524264812469482, "global_step": 112224, "epoch": 2672} {"train_loss": -6.480952262878418, "global_step": 112225, "epoch": 2672} {"train_loss": -6.614614486694336, "global_step": 112226, "epoch": 2672} {"train_loss": -6.419413089752197, "global_step": 112227, "epoch": 2672} {"train_loss": -6.494838714599609, "global_step": 112228, "epoch": 2672} {"train_loss": -6.631083965301514, "global_step": 112229, "epoch": 2672} {"train_loss": -6.466828346252441, "global_step": 112230, "epoch": 2672} {"train_loss": -6.514431476593018, "global_step": 112231, "epoch": 2672} {"train_loss": -6.564357757568359, "global_step": 112232, "epoch": 2672} {"train_loss": -6.567106246948242, "global_step": 112233, "epoch": 2672} {"train_loss": -6.563145160675049, "global_step": 112234, "epoch": 2672} {"train_loss": -6.48836088180542, "global_step": 112235, "epoch": 2672} {"train_loss": -6.420676231384277, "global_step": 112236, "epoch": 2672} {"train_loss": -6.479173183441162, "global_step": 112237, "epoch": 2672} {"train_loss": -6.442558765411377, "global_step": 112238, "epoch": 2672} {"train_loss": -6.43218994140625, "global_step": 112239, "epoch": 2672} {"train_loss": -6.491292953491211, "global_step": 112240, "epoch": 2672} {"train_loss": -6.410256385803223, "global_step": 112241, "epoch": 2672} {"train_loss": -6.591533660888672, "global_step": 112242, "epoch": 2672} {"train_loss": -6.370200157165527, "global_step": 112243, "epoch": 2672} {"train_loss": -6.539328575134277, "global_step": 112244, "epoch": 2672} {"train_loss": -6.455618858337402, "global_step": 112245, "epoch": 2672} {"train_loss": -6.448413372039795, "global_step": 112246, "epoch": 2672} {"train_loss": -6.456260681152344, "global_step": 112247, "epoch": 2672} {"train_loss": -6.5422492027282715, "global_step": 112248, "epoch": 2672} {"train_loss": -6.47991943359375, "global_step": 112249, "epoch": 2672} {"train_loss": -6.432931423187256, "global_step": 112250, "epoch": 2672} {"train_loss": -6.503440856933594, "global_step": 112251, "epoch": 2672} {"train_loss": -6.348845481872559, "global_step": 112252, "epoch": 2672} {"train_loss": -6.326198577880859, "global_step": 112253, "epoch": 2672} {"train_loss": -6.486533164978027, "global_step": 112254, "epoch": 2672} {"train_loss": -6.46588134765625, "global_step": 112255, "epoch": 2672} {"train_loss": -6.378097057342529, "global_step": 112256, "epoch": 2672} {"train_loss": -6.436097145080566, "global_step": 112257, "epoch": 2672} {"train_loss": -6.406930923461914, "global_step": 112258, "epoch": 2672} {"train_loss": -6.461452960968018, "global_step": 112259, "epoch": 2672} {"train_loss": -6.506504535675049, "global_step": 112260, "epoch": 2672} {"train_loss": -6.379397392272949, "global_step": 112261, "epoch": 2672} {"train_loss": -6.358604431152344, "global_step": 112262, "epoch": 2672} {"train_loss": -6.481165885925293, "global_step": 112263, "epoch": 2672} {"train_loss": -6.3694329261779785, "global_step": 112264, "epoch": 2672} {"train_loss": -6.466824588321504, "global_step": 112265, "epoch": 2672, "val_loss": 65567.34375} {"train_loss": -6.384631156921387, "global_step": 112266, "epoch": 2673} {"train_loss": -6.402154922485352, "global_step": 112267, "epoch": 2673} {"train_loss": -6.446996688842773, "global_step": 112268, "epoch": 2673} {"train_loss": -6.333558082580566, "global_step": 112269, "epoch": 2673} {"train_loss": -6.297067165374756, "global_step": 112270, "epoch": 2673} {"train_loss": -6.42807149887085, "global_step": 112271, "epoch": 2673} {"train_loss": -6.411827087402344, "global_step": 112272, "epoch": 2673} {"train_loss": -6.368860721588135, "global_step": 112273, "epoch": 2673} {"train_loss": -6.459495544433594, "global_step": 112274, "epoch": 2673} {"train_loss": -6.3118815422058105, "global_step": 112275, "epoch": 2673} {"train_loss": -6.43892240524292, "global_step": 112276, "epoch": 2673} {"train_loss": -6.383312702178955, "global_step": 112277, "epoch": 2673} {"train_loss": -6.2493510246276855, "global_step": 112278, "epoch": 2673} {"train_loss": -6.310680389404297, "global_step": 112279, "epoch": 2673} {"train_loss": -6.39903450012207, "global_step": 112280, "epoch": 2673} {"train_loss": -6.556095123291016, "global_step": 112281, "epoch": 2673} {"train_loss": -6.313116073608398, "global_step": 112282, "epoch": 2673} {"train_loss": -6.333519458770752, "global_step": 112283, "epoch": 2673} {"train_loss": -6.30727481842041, "global_step": 112284, "epoch": 2673} {"train_loss": -6.287585258483887, "global_step": 112285, "epoch": 2673} {"train_loss": -6.430078983306885, "global_step": 112286, "epoch": 2673} {"train_loss": -6.423505783081055, "global_step": 112287, "epoch": 2673} {"train_loss": -6.313831329345703, "global_step": 112288, "epoch": 2673} {"train_loss": -6.477550506591797, "global_step": 112289, "epoch": 2673} {"train_loss": -6.290705680847168, "global_step": 112290, "epoch": 2673} {"train_loss": -6.41829776763916, "global_step": 112291, "epoch": 2673} {"train_loss": -6.347119331359863, "global_step": 112292, "epoch": 2673} {"train_loss": -6.3674774169921875, "global_step": 112293, "epoch": 2673} {"train_loss": -6.465156555175781, "global_step": 112294, "epoch": 2673} {"train_loss": -6.508011817932129, "global_step": 112295, "epoch": 2673} {"train_loss": -6.322323799133301, "global_step": 112296, "epoch": 2673} {"train_loss": -6.4124755859375, "global_step": 112297, "epoch": 2673} {"train_loss": -6.497962951660156, "global_step": 112298, "epoch": 2673} {"train_loss": -6.406870365142822, "global_step": 112299, "epoch": 2673} {"train_loss": -6.484180927276611, "global_step": 112300, "epoch": 2673} {"train_loss": -6.371993541717529, "global_step": 112301, "epoch": 2673} {"train_loss": -6.414113998413086, "global_step": 112302, "epoch": 2673} {"train_loss": -6.411759853363037, "global_step": 112303, "epoch": 2673} {"train_loss": -6.465953826904297, "global_step": 112304, "epoch": 2673} {"train_loss": -6.4546308517456055, "global_step": 112305, "epoch": 2673} {"train_loss": -6.4729461669921875, "global_step": 112306, "epoch": 2673} {"train_loss": -6.397013698305402, "global_step": 112307, "epoch": 2673, "val_loss": 65391.35546875} {"train_loss": -6.425492763519287, "global_step": 112308, "epoch": 2674} {"train_loss": -6.317287445068359, "global_step": 112309, "epoch": 2674} {"train_loss": -6.351036071777344, "global_step": 112310, "epoch": 2674} {"train_loss": -6.49691915512085, "global_step": 112311, "epoch": 2674} {"train_loss": -6.495631217956543, "global_step": 112312, "epoch": 2674} {"train_loss": -6.456007957458496, "global_step": 112313, "epoch": 2674} {"train_loss": -6.3610029220581055, "global_step": 112314, "epoch": 2674} {"train_loss": -6.408019065856934, "global_step": 112315, "epoch": 2674} {"train_loss": -6.558011531829834, "global_step": 112316, "epoch": 2674} {"train_loss": -6.454407691955566, "global_step": 112317, "epoch": 2674} {"train_loss": -6.480185031890869, "global_step": 112318, "epoch": 2674} {"train_loss": -6.388845443725586, "global_step": 112319, "epoch": 2674} {"train_loss": -6.438056945800781, "global_step": 112320, "epoch": 2674} {"train_loss": -6.432544231414795, "global_step": 112321, "epoch": 2674} {"train_loss": -6.407425880432129, "global_step": 112322, "epoch": 2674} {"train_loss": -6.47039270401001, "global_step": 112323, "epoch": 2674} {"train_loss": -6.485724449157715, "global_step": 112324, "epoch": 2674} {"train_loss": -6.455822944641113, "global_step": 112325, "epoch": 2674} {"train_loss": -6.512259483337402, "global_step": 112326, "epoch": 2674} {"train_loss": -6.4788103103637695, "global_step": 112327, "epoch": 2674} {"train_loss": -6.432467937469482, "global_step": 112328, "epoch": 2674} {"train_loss": -6.409389019012451, "global_step": 112329, "epoch": 2674} {"train_loss": -6.4123687744140625, "global_step": 112330, "epoch": 2674} {"train_loss": -6.417849540710449, "global_step": 112331, "epoch": 2674} {"train_loss": -6.450617790222168, "global_step": 112332, "epoch": 2674} {"train_loss": -6.421590805053711, "global_step": 112333, "epoch": 2674} {"train_loss": -6.532958984375, "global_step": 112334, "epoch": 2674} {"train_loss": -6.399683952331543, "global_step": 112335, "epoch": 2674} {"train_loss": -6.544280052185059, "global_step": 112336, "epoch": 2674} {"train_loss": -6.430392265319824, "global_step": 112337, "epoch": 2674} {"train_loss": -6.552419662475586, "global_step": 112338, "epoch": 2674} {"train_loss": -6.454890251159668, "global_step": 112339, "epoch": 2674} {"train_loss": -6.545961380004883, "global_step": 112340, "epoch": 2674} {"train_loss": -6.592507362365723, "global_step": 112341, "epoch": 2674} {"train_loss": -6.48185920715332, "global_step": 112342, "epoch": 2674} {"train_loss": -6.530508041381836, "global_step": 112343, "epoch": 2674} {"train_loss": -6.510317325592041, "global_step": 112344, "epoch": 2674} {"train_loss": -6.524374008178711, "global_step": 112345, "epoch": 2674} {"train_loss": -6.5989813804626465, "global_step": 112346, "epoch": 2674} {"train_loss": -6.593601703643799, "global_step": 112347, "epoch": 2674} {"train_loss": -6.531292915344238, "global_step": 112348, "epoch": 2674} {"train_loss": -6.4725241888137095, "global_step": 112349, "epoch": 2674, "val_loss": 65016.0625} {"train_loss": -6.407157897949219, "global_step": 112350, "epoch": 2675} {"train_loss": -6.60998010635376, "global_step": 112351, "epoch": 2675} {"train_loss": -6.6945271492004395, "global_step": 112352, "epoch": 2675} {"train_loss": -6.440051078796387, "global_step": 112353, "epoch": 2675} {"train_loss": -6.521272659301758, "global_step": 112354, "epoch": 2675} {"train_loss": -6.487016677856445, "global_step": 112355, "epoch": 2675} {"train_loss": -6.567534923553467, "global_step": 112356, "epoch": 2675} {"train_loss": -6.61655330657959, "global_step": 112357, "epoch": 2675} {"train_loss": -6.46481466293335, "global_step": 112358, "epoch": 2675} {"train_loss": -6.443377494812012, "global_step": 112359, "epoch": 2675} {"train_loss": -6.470625400543213, "global_step": 112360, "epoch": 2675} {"train_loss": -6.502838611602783, "global_step": 112361, "epoch": 2675} {"train_loss": -6.464283466339111, "global_step": 112362, "epoch": 2675} {"train_loss": -6.464145660400391, "global_step": 112363, "epoch": 2675} {"train_loss": -6.486235618591309, "global_step": 112364, "epoch": 2675} {"train_loss": -6.384543418884277, "global_step": 112365, "epoch": 2675} {"train_loss": -6.4597320556640625, "global_step": 112366, "epoch": 2675} {"train_loss": -6.548419952392578, "global_step": 112367, "epoch": 2675} {"train_loss": -6.519532203674316, "global_step": 112368, "epoch": 2675} {"train_loss": -6.440912246704102, "global_step": 112369, "epoch": 2675} {"train_loss": -6.575893878936768, "global_step": 112370, "epoch": 2675} {"train_loss": -6.540735244750977, "global_step": 112371, "epoch": 2675} {"train_loss": -6.505619525909424, "global_step": 112372, "epoch": 2675} {"train_loss": -6.379497528076172, "global_step": 112373, "epoch": 2675} {"train_loss": -6.4828290939331055, "global_step": 112374, "epoch": 2675} {"train_loss": -6.478783130645752, "global_step": 112375, "epoch": 2675} {"train_loss": -6.507183074951172, "global_step": 112376, "epoch": 2675} {"train_loss": -6.499628067016602, "global_step": 112377, "epoch": 2675} {"train_loss": -6.48476505279541, "global_step": 112378, "epoch": 2675} {"train_loss": -6.553686141967773, "global_step": 112379, "epoch": 2675} {"train_loss": -6.516737937927246, "global_step": 112380, "epoch": 2675} {"train_loss": -6.543156623840332, "global_step": 112381, "epoch": 2675} {"train_loss": -6.365977764129639, "global_step": 112382, "epoch": 2675} {"train_loss": -6.586033344268799, "global_step": 112383, "epoch": 2675} {"train_loss": -6.586256980895996, "global_step": 112384, "epoch": 2675} {"train_loss": -6.526487827301025, "global_step": 112385, "epoch": 2675} {"train_loss": -6.547469139099121, "global_step": 112386, "epoch": 2675} {"train_loss": -6.53564453125, "global_step": 112387, "epoch": 2675} {"train_loss": -6.420242786407471, "global_step": 112388, "epoch": 2675} {"train_loss": -6.494932174682617, "global_step": 112389, "epoch": 2675} {"train_loss": -6.561554908752441, "global_step": 112390, "epoch": 2675} {"train_loss": -6.503605751764207, "global_step": 112391, "epoch": 2675, "val_loss": 65337.27734375} {"train_loss": -6.498008728027344, "global_step": 112392, "epoch": 2676} {"train_loss": -6.538932800292969, "global_step": 112393, "epoch": 2676} {"train_loss": -6.462222576141357, "global_step": 112394, "epoch": 2676} {"train_loss": -6.567221641540527, "global_step": 112395, "epoch": 2676} {"train_loss": -6.520961761474609, "global_step": 112396, "epoch": 2676} {"train_loss": -6.601584434509277, "global_step": 112397, "epoch": 2676} {"train_loss": -6.38818359375, "global_step": 112398, "epoch": 2676} {"train_loss": -6.486296653747559, "global_step": 112399, "epoch": 2676} {"train_loss": -6.562245845794678, "global_step": 112400, "epoch": 2676} {"train_loss": -6.3296637535095215, "global_step": 112401, "epoch": 2676} {"train_loss": -6.344509124755859, "global_step": 112402, "epoch": 2676} {"train_loss": -6.614654541015625, "global_step": 112403, "epoch": 2676} {"train_loss": -6.397736549377441, "global_step": 112404, "epoch": 2676} {"train_loss": -6.436516284942627, "global_step": 112405, "epoch": 2676} {"train_loss": -6.478260517120361, "global_step": 112406, "epoch": 2676} {"train_loss": -6.385419845581055, "global_step": 112407, "epoch": 2676} {"train_loss": -6.5143232345581055, "global_step": 112408, "epoch": 2676} {"train_loss": -6.439712047576904, "global_step": 112409, "epoch": 2676} {"train_loss": -6.420956611633301, "global_step": 112410, "epoch": 2676} {"train_loss": -6.54559326171875, "global_step": 112411, "epoch": 2676} {"train_loss": -6.415735721588135, "global_step": 112412, "epoch": 2676} {"train_loss": -6.501712799072266, "global_step": 112413, "epoch": 2676} {"train_loss": -6.412016868591309, "global_step": 112414, "epoch": 2676} {"train_loss": -6.579632759094238, "global_step": 112415, "epoch": 2676} {"train_loss": -6.503526210784912, "global_step": 112416, "epoch": 2676} {"train_loss": -6.467933654785156, "global_step": 112417, "epoch": 2676} {"train_loss": -6.5536603927612305, "global_step": 112418, "epoch": 2676} {"train_loss": -6.535055160522461, "global_step": 112419, "epoch": 2676} {"train_loss": -6.5228729248046875, "global_step": 112420, "epoch": 2676} {"train_loss": -6.44405460357666, "global_step": 112421, "epoch": 2676} {"train_loss": -6.549040794372559, "global_step": 112422, "epoch": 2676} {"train_loss": -6.5033063888549805, "global_step": 112423, "epoch": 2676} {"train_loss": -6.4790568351745605, "global_step": 112424, "epoch": 2676} {"train_loss": -6.46616268157959, "global_step": 112425, "epoch": 2676} {"train_loss": -6.485870838165283, "global_step": 112426, "epoch": 2676} {"train_loss": -6.496987342834473, "global_step": 112427, "epoch": 2676} {"train_loss": -6.444179058074951, "global_step": 112428, "epoch": 2676} {"train_loss": -6.317052364349365, "global_step": 112429, "epoch": 2676} {"train_loss": -6.521781921386719, "global_step": 112430, "epoch": 2676} {"train_loss": -6.4692230224609375, "global_step": 112431, "epoch": 2676} {"train_loss": -6.423871040344238, "global_step": 112432, "epoch": 2676} {"train_loss": -6.482785837990897, "global_step": 112433, "epoch": 2676, "val_loss": 65198.859375} {"train_loss": -6.523135185241699, "global_step": 112434, "epoch": 2677} {"train_loss": -6.519831657409668, "global_step": 112435, "epoch": 2677} {"train_loss": -6.397902965545654, "global_step": 112436, "epoch": 2677} {"train_loss": -6.605339050292969, "global_step": 112437, "epoch": 2677} {"train_loss": -6.362297058105469, "global_step": 112438, "epoch": 2677} {"train_loss": -6.427362442016602, "global_step": 112439, "epoch": 2677} {"train_loss": -6.515228748321533, "global_step": 112440, "epoch": 2677} {"train_loss": -6.5555901527404785, "global_step": 112441, "epoch": 2677} {"train_loss": -6.572371006011963, "global_step": 112442, "epoch": 2677} {"train_loss": -6.3628950119018555, "global_step": 112443, "epoch": 2677} {"train_loss": -6.522643089294434, "global_step": 112444, "epoch": 2677} {"train_loss": -6.4602580070495605, "global_step": 112445, "epoch": 2677} {"train_loss": -6.4442291259765625, "global_step": 112446, "epoch": 2677} {"train_loss": -6.533365249633789, "global_step": 112447, "epoch": 2677} {"train_loss": -6.596318244934082, "global_step": 112448, "epoch": 2677} {"train_loss": -6.548614501953125, "global_step": 112449, "epoch": 2677} {"train_loss": -6.511235237121582, "global_step": 112450, "epoch": 2677} {"train_loss": -6.378236293792725, "global_step": 112451, "epoch": 2677} {"train_loss": -6.598979949951172, "global_step": 112452, "epoch": 2677} {"train_loss": -6.494504451751709, "global_step": 112453, "epoch": 2677} {"train_loss": -6.619745254516602, "global_step": 112454, "epoch": 2677} {"train_loss": -6.58589506149292, "global_step": 112455, "epoch": 2677} {"train_loss": -6.555237770080566, "global_step": 112456, "epoch": 2677} {"train_loss": -6.544419765472412, "global_step": 112457, "epoch": 2677} {"train_loss": -6.530265808105469, "global_step": 112458, "epoch": 2677} {"train_loss": -6.550034999847412, "global_step": 112459, "epoch": 2677} {"train_loss": -6.540318489074707, "global_step": 112460, "epoch": 2677} {"train_loss": -6.657281875610352, "global_step": 112461, "epoch": 2677} {"train_loss": -6.441346168518066, "global_step": 112462, "epoch": 2677} {"train_loss": -6.423964023590088, "global_step": 112463, "epoch": 2677} {"train_loss": -6.405875205993652, "global_step": 112464, "epoch": 2677} {"train_loss": -6.497385501861572, "global_step": 112465, "epoch": 2677} {"train_loss": -6.460587501525879, "global_step": 112466, "epoch": 2677} {"train_loss": -6.529050827026367, "global_step": 112467, "epoch": 2677} {"train_loss": -6.3350725173950195, "global_step": 112468, "epoch": 2677} {"train_loss": -6.566361904144287, "global_step": 112469, "epoch": 2677} {"train_loss": -6.549527168273926, "global_step": 112470, "epoch": 2677} {"train_loss": -6.458725929260254, "global_step": 112471, "epoch": 2677} {"train_loss": -6.4654645919799805, "global_step": 112472, "epoch": 2677} {"train_loss": -6.565154075622559, "global_step": 112473, "epoch": 2677} {"train_loss": -6.478588104248047, "global_step": 112474, "epoch": 2677} {"train_loss": -6.505149977547782, "global_step": 112475, "epoch": 2677, "val_loss": 65112.015625} {"train_loss": -6.584066390991211, "global_step": 112476, "epoch": 2678} {"train_loss": -6.444180965423584, "global_step": 112477, "epoch": 2678} {"train_loss": -6.53176736831665, "global_step": 112478, "epoch": 2678} {"train_loss": -6.408175468444824, "global_step": 112479, "epoch": 2678} {"train_loss": -6.579201698303223, "global_step": 112480, "epoch": 2678} {"train_loss": -6.434315204620361, "global_step": 112481, "epoch": 2678} {"train_loss": -6.470211505889893, "global_step": 112482, "epoch": 2678} {"train_loss": -6.593803405761719, "global_step": 112483, "epoch": 2678} {"train_loss": -6.462087631225586, "global_step": 112484, "epoch": 2678} {"train_loss": -6.539147853851318, "global_step": 112485, "epoch": 2678} {"train_loss": -6.411548614501953, "global_step": 112486, "epoch": 2678} {"train_loss": -6.339961051940918, "global_step": 112487, "epoch": 2678} {"train_loss": -6.452461242675781, "global_step": 112488, "epoch": 2678} {"train_loss": -6.429819583892822, "global_step": 112489, "epoch": 2678} {"train_loss": -6.3780927658081055, "global_step": 112490, "epoch": 2678} {"train_loss": -6.297135353088379, "global_step": 112491, "epoch": 2678} {"train_loss": -6.51878547668457, "global_step": 112492, "epoch": 2678} {"train_loss": -6.458299160003662, "global_step": 112493, "epoch": 2678} {"train_loss": -6.368190765380859, "global_step": 112494, "epoch": 2678} {"train_loss": -6.470171928405762, "global_step": 112495, "epoch": 2678} {"train_loss": -6.253936767578125, "global_step": 112496, "epoch": 2678} {"train_loss": -6.395752906799316, "global_step": 112497, "epoch": 2678} {"train_loss": -6.337331771850586, "global_step": 112498, "epoch": 2678} {"train_loss": -6.534863471984863, "global_step": 112499, "epoch": 2678} {"train_loss": -6.321904182434082, "global_step": 112500, "epoch": 2678} {"train_loss": -6.526330947875977, "global_step": 112501, "epoch": 2678} {"train_loss": -6.352663040161133, "global_step": 112502, "epoch": 2678} {"train_loss": -6.409679412841797, "global_step": 112503, "epoch": 2678} {"train_loss": -6.430336952209473, "global_step": 112504, "epoch": 2678} {"train_loss": -6.466034889221191, "global_step": 112505, "epoch": 2678} {"train_loss": -6.34321403503418, "global_step": 112506, "epoch": 2678} {"train_loss": -6.445589065551758, "global_step": 112507, "epoch": 2678} {"train_loss": -6.482854843139648, "global_step": 112508, "epoch": 2678} {"train_loss": -6.521125316619873, "global_step": 112509, "epoch": 2678} {"train_loss": -6.263670921325684, "global_step": 112510, "epoch": 2678} {"train_loss": -6.476828098297119, "global_step": 112511, "epoch": 2678} {"train_loss": -6.462676525115967, "global_step": 112512, "epoch": 2678} {"train_loss": -6.410562515258789, "global_step": 112513, "epoch": 2678} {"train_loss": -6.464841842651367, "global_step": 112514, "epoch": 2678} {"train_loss": -6.494547367095947, "global_step": 112515, "epoch": 2678} {"train_loss": -6.415543556213379, "global_step": 112516, "epoch": 2678} {"train_loss": -6.441034339723133, "global_step": 112517, "epoch": 2678, "val_loss": 65176.6796875} {"train_loss": -6.5368428230285645, "global_step": 112518, "epoch": 2679} {"train_loss": -6.437996864318848, "global_step": 112519, "epoch": 2679} {"train_loss": -6.455291748046875, "global_step": 112520, "epoch": 2679} {"train_loss": -6.470449924468994, "global_step": 112521, "epoch": 2679} {"train_loss": -6.499783039093018, "global_step": 112522, "epoch": 2679} {"train_loss": -6.521266937255859, "global_step": 112523, "epoch": 2679} {"train_loss": -6.552132606506348, "global_step": 112524, "epoch": 2679} {"train_loss": -6.621540069580078, "global_step": 112525, "epoch": 2679} {"train_loss": -6.506054878234863, "global_step": 112526, "epoch": 2679} {"train_loss": -6.523837089538574, "global_step": 112527, "epoch": 2679} {"train_loss": -6.543261528015137, "global_step": 112528, "epoch": 2679} {"train_loss": -6.422016143798828, "global_step": 112529, "epoch": 2679} {"train_loss": -6.517383098602295, "global_step": 112530, "epoch": 2679} {"train_loss": -6.564264297485352, "global_step": 112531, "epoch": 2679} {"train_loss": -6.501585483551025, "global_step": 112532, "epoch": 2679} {"train_loss": -6.439573287963867, "global_step": 112533, "epoch": 2679} {"train_loss": -6.591777801513672, "global_step": 112534, "epoch": 2679} {"train_loss": -6.366860389709473, "global_step": 112535, "epoch": 2679} {"train_loss": -6.559993743896484, "global_step": 112536, "epoch": 2679} {"train_loss": -6.595155715942383, "global_step": 112537, "epoch": 2679} {"train_loss": -6.44663143157959, "global_step": 112538, "epoch": 2679} {"train_loss": -6.557061195373535, "global_step": 112539, "epoch": 2679} {"train_loss": -6.459850311279297, "global_step": 112540, "epoch": 2679} {"train_loss": -6.542557716369629, "global_step": 112541, "epoch": 2679} {"train_loss": -6.522373199462891, "global_step": 112542, "epoch": 2679} {"train_loss": -6.541949272155762, "global_step": 112543, "epoch": 2679} {"train_loss": -6.526124954223633, "global_step": 112544, "epoch": 2679} {"train_loss": -6.5143327713012695, "global_step": 112545, "epoch": 2679} {"train_loss": -6.509690284729004, "global_step": 112546, "epoch": 2679} {"train_loss": -6.5037994384765625, "global_step": 112547, "epoch": 2679} {"train_loss": -6.423405647277832, "global_step": 112548, "epoch": 2679} {"train_loss": -6.44924783706665, "global_step": 112549, "epoch": 2679} {"train_loss": -6.524711608886719, "global_step": 112550, "epoch": 2679} {"train_loss": -6.372674465179443, "global_step": 112551, "epoch": 2679} {"train_loss": -6.510677337646484, "global_step": 112552, "epoch": 2679} {"train_loss": -6.568106651306152, "global_step": 112553, "epoch": 2679} {"train_loss": -6.573328495025635, "global_step": 112554, "epoch": 2679} {"train_loss": -6.533203125, "global_step": 112555, "epoch": 2679} {"train_loss": -6.505438804626465, "global_step": 112556, "epoch": 2679} {"train_loss": -6.597329616546631, "global_step": 112557, "epoch": 2679} {"train_loss": -6.381495475769043, "global_step": 112558, "epoch": 2679} {"train_loss": -6.5070854028066, "global_step": 112559, "epoch": 2679, "val_loss": 64974.6171875} {"train_loss": -6.414459228515625, "global_step": 112560, "epoch": 2680} {"train_loss": -6.586064338684082, "global_step": 112561, "epoch": 2680} {"train_loss": -6.553380966186523, "global_step": 112562, "epoch": 2680} {"train_loss": -6.539379119873047, "global_step": 112563, "epoch": 2680} {"train_loss": -6.476771354675293, "global_step": 112564, "epoch": 2680} {"train_loss": -6.518346786499023, "global_step": 112565, "epoch": 2680} {"train_loss": -6.461673736572266, "global_step": 112566, "epoch": 2680} {"train_loss": -6.515885353088379, "global_step": 112567, "epoch": 2680} {"train_loss": -6.568846225738525, "global_step": 112568, "epoch": 2680} {"train_loss": -6.422975540161133, "global_step": 112569, "epoch": 2680} {"train_loss": -6.419356346130371, "global_step": 112570, "epoch": 2680} {"train_loss": -6.682007789611816, "global_step": 112571, "epoch": 2680} {"train_loss": -6.526188850402832, "global_step": 112572, "epoch": 2680} {"train_loss": -6.554437160491943, "global_step": 112573, "epoch": 2680} {"train_loss": -6.46714973449707, "global_step": 112574, "epoch": 2680} {"train_loss": -6.515773773193359, "global_step": 112575, "epoch": 2680} {"train_loss": -6.589792728424072, "global_step": 112576, "epoch": 2680} {"train_loss": -6.4599175453186035, "global_step": 112577, "epoch": 2680} {"train_loss": -6.529946327209473, "global_step": 112578, "epoch": 2680} {"train_loss": -6.502566337585449, "global_step": 112579, "epoch": 2680} {"train_loss": -6.47593355178833, "global_step": 112580, "epoch": 2680} {"train_loss": -6.470175743103027, "global_step": 112581, "epoch": 2680} {"train_loss": -6.521821975708008, "global_step": 112582, "epoch": 2680} {"train_loss": -6.490884304046631, "global_step": 112583, "epoch": 2680} {"train_loss": -6.572125434875488, "global_step": 112584, "epoch": 2680} {"train_loss": -6.5089216232299805, "global_step": 112585, "epoch": 2680} {"train_loss": -6.5045166015625, "global_step": 112586, "epoch": 2680} {"train_loss": -6.559979438781738, "global_step": 112587, "epoch": 2680} {"train_loss": -6.670567035675049, "global_step": 112588, "epoch": 2680} {"train_loss": -6.559108257293701, "global_step": 112589, "epoch": 2680} {"train_loss": -6.478734016418457, "global_step": 112590, "epoch": 2680} {"train_loss": -6.608904838562012, "global_step": 112591, "epoch": 2680} {"train_loss": -6.568307876586914, "global_step": 112592, "epoch": 2680} {"train_loss": -6.502721786499023, "global_step": 112593, "epoch": 2680} {"train_loss": -6.378812789916992, "global_step": 112594, "epoch": 2680} {"train_loss": -6.493060111999512, "global_step": 112595, "epoch": 2680} {"train_loss": -6.64525032043457, "global_step": 112596, "epoch": 2680} {"train_loss": -6.586045265197754, "global_step": 112597, "epoch": 2680} {"train_loss": -6.556523323059082, "global_step": 112598, "epoch": 2680} {"train_loss": -6.591372013092041, "global_step": 112599, "epoch": 2680} {"train_loss": -6.638064384460449, "global_step": 112600, "epoch": 2680} {"train_loss": -6.529403970355079, "global_step": 112601, "epoch": 2680, "val_loss": 65105.69921875} {"train_loss": -6.536541938781738, "global_step": 112602, "epoch": 2681} {"train_loss": -6.454089164733887, "global_step": 112603, "epoch": 2681} {"train_loss": -6.556824684143066, "global_step": 112604, "epoch": 2681} {"train_loss": -6.4849348068237305, "global_step": 112605, "epoch": 2681} {"train_loss": -6.403172492980957, "global_step": 112606, "epoch": 2681} {"train_loss": -6.487207889556885, "global_step": 112607, "epoch": 2681} {"train_loss": -6.567927837371826, "global_step": 112608, "epoch": 2681} {"train_loss": -6.532672882080078, "global_step": 112609, "epoch": 2681} {"train_loss": -6.593855857849121, "global_step": 112610, "epoch": 2681} {"train_loss": -6.530891418457031, "global_step": 112611, "epoch": 2681} {"train_loss": -6.59684944152832, "global_step": 112612, "epoch": 2681} {"train_loss": -6.60115385055542, "global_step": 112613, "epoch": 2681} {"train_loss": -6.488696575164795, "global_step": 112614, "epoch": 2681} {"train_loss": -6.514470100402832, "global_step": 112615, "epoch": 2681} {"train_loss": -6.572120666503906, "global_step": 112616, "epoch": 2681} {"train_loss": -6.562982559204102, "global_step": 112617, "epoch": 2681} {"train_loss": -6.529707908630371, "global_step": 112618, "epoch": 2681} {"train_loss": -6.419710636138916, "global_step": 112619, "epoch": 2681} {"train_loss": -6.511363983154297, "global_step": 112620, "epoch": 2681} {"train_loss": -6.402915000915527, "global_step": 112621, "epoch": 2681} {"train_loss": -6.5306291580200195, "global_step": 112622, "epoch": 2681} {"train_loss": -6.456212997436523, "global_step": 112623, "epoch": 2681} {"train_loss": -6.4028825759887695, "global_step": 112624, "epoch": 2681} {"train_loss": -6.56309700012207, "global_step": 112625, "epoch": 2681} {"train_loss": -6.52158260345459, "global_step": 112626, "epoch": 2681} {"train_loss": -6.557591438293457, "global_step": 112627, "epoch": 2681} {"train_loss": -6.541574478149414, "global_step": 112628, "epoch": 2681} {"train_loss": -6.559967994689941, "global_step": 112629, "epoch": 2681} {"train_loss": -6.547635078430176, "global_step": 112630, "epoch": 2681} {"train_loss": -6.555138111114502, "global_step": 112631, "epoch": 2681} {"train_loss": -6.427446365356445, "global_step": 112632, "epoch": 2681} {"train_loss": -6.601401329040527, "global_step": 112633, "epoch": 2681} {"train_loss": -6.611912250518799, "global_step": 112634, "epoch": 2681} {"train_loss": -6.454532146453857, "global_step": 112635, "epoch": 2681} {"train_loss": -6.443028450012207, "global_step": 112636, "epoch": 2681} {"train_loss": -6.5325927734375, "global_step": 112637, "epoch": 2681} {"train_loss": -6.433712482452393, "global_step": 112638, "epoch": 2681} {"train_loss": -6.439055442810059, "global_step": 112639, "epoch": 2681} {"train_loss": -6.489325523376465, "global_step": 112640, "epoch": 2681} {"train_loss": -6.470808506011963, "global_step": 112641, "epoch": 2681} {"train_loss": -6.414694786071777, "global_step": 112642, "epoch": 2681} {"train_loss": -6.510245981670561, "global_step": 112643, "epoch": 2681, "val_loss": 65454.4140625} {"train_loss": -6.378434658050537, "global_step": 112644, "epoch": 2682} {"train_loss": -6.605951309204102, "global_step": 112645, "epoch": 2682} {"train_loss": -6.4112396240234375, "global_step": 112646, "epoch": 2682} {"train_loss": -6.547820091247559, "global_step": 112647, "epoch": 2682} {"train_loss": -6.50587272644043, "global_step": 112648, "epoch": 2682} {"train_loss": -6.437385559082031, "global_step": 112649, "epoch": 2682} {"train_loss": -6.481864929199219, "global_step": 112650, "epoch": 2682} {"train_loss": -6.39724063873291, "global_step": 112651, "epoch": 2682} {"train_loss": -6.448059558868408, "global_step": 112652, "epoch": 2682} {"train_loss": -6.480836868286133, "global_step": 112653, "epoch": 2682} {"train_loss": -6.4645538330078125, "global_step": 112654, "epoch": 2682} {"train_loss": -6.508770942687988, "global_step": 112655, "epoch": 2682} {"train_loss": -6.432349681854248, "global_step": 112656, "epoch": 2682} {"train_loss": -6.516032695770264, "global_step": 112657, "epoch": 2682} {"train_loss": -6.507023811340332, "global_step": 112658, "epoch": 2682} {"train_loss": -6.496712684631348, "global_step": 112659, "epoch": 2682} {"train_loss": -6.41013765335083, "global_step": 112660, "epoch": 2682} {"train_loss": -6.610048294067383, "global_step": 112661, "epoch": 2682} {"train_loss": -6.368369102478027, "global_step": 112662, "epoch": 2682} {"train_loss": -6.505343437194824, "global_step": 112663, "epoch": 2682} {"train_loss": -6.463618278503418, "global_step": 112664, "epoch": 2682} {"train_loss": -6.502154350280762, "global_step": 112665, "epoch": 2682} {"train_loss": -6.555635452270508, "global_step": 112666, "epoch": 2682} {"train_loss": -6.619316101074219, "global_step": 112667, "epoch": 2682} {"train_loss": -6.56973934173584, "global_step": 112668, "epoch": 2682} {"train_loss": -6.4566755294799805, "global_step": 112669, "epoch": 2682} {"train_loss": -6.4991984367370605, "global_step": 112670, "epoch": 2682} {"train_loss": -6.538963317871094, "global_step": 112671, "epoch": 2682} {"train_loss": -6.479203224182129, "global_step": 112672, "epoch": 2682} {"train_loss": -6.569894790649414, "global_step": 112673, "epoch": 2682} {"train_loss": -6.702401161193848, "global_step": 112674, "epoch": 2682} {"train_loss": -6.593542098999023, "global_step": 112675, "epoch": 2682} {"train_loss": -6.455508232116699, "global_step": 112676, "epoch": 2682} {"train_loss": -6.49837589263916, "global_step": 112677, "epoch": 2682} {"train_loss": -6.443785667419434, "global_step": 112678, "epoch": 2682} {"train_loss": -6.501026630401611, "global_step": 112679, "epoch": 2682} {"train_loss": -6.489987850189209, "global_step": 112680, "epoch": 2682} {"train_loss": -6.506043434143066, "global_step": 112681, "epoch": 2682} {"train_loss": -6.390023231506348, "global_step": 112682, "epoch": 2682} {"train_loss": -6.424098014831543, "global_step": 112683, "epoch": 2682} {"train_loss": -6.443872451782227, "global_step": 112684, "epoch": 2682} {"train_loss": -6.492193267458961, "global_step": 112685, "epoch": 2682, "val_loss": 65209.7734375} {"train_loss": -6.392571449279785, "global_step": 112686, "epoch": 2683} {"train_loss": -6.50518274307251, "global_step": 112687, "epoch": 2683} {"train_loss": -6.48175048828125, "global_step": 112688, "epoch": 2683} {"train_loss": -6.52147102355957, "global_step": 112689, "epoch": 2683} {"train_loss": -6.542054653167725, "global_step": 112690, "epoch": 2683} {"train_loss": -6.510830402374268, "global_step": 112691, "epoch": 2683} {"train_loss": -6.39655876159668, "global_step": 112692, "epoch": 2683} {"train_loss": -6.567470550537109, "global_step": 112693, "epoch": 2683} {"train_loss": -6.470615863800049, "global_step": 112694, "epoch": 2683} {"train_loss": -6.497635841369629, "global_step": 112695, "epoch": 2683} {"train_loss": -6.443221569061279, "global_step": 112696, "epoch": 2683} {"train_loss": -6.428256511688232, "global_step": 112697, "epoch": 2683} {"train_loss": -6.49672794342041, "global_step": 112698, "epoch": 2683} {"train_loss": -6.4539008140563965, "global_step": 112699, "epoch": 2683} {"train_loss": -6.448726654052734, "global_step": 112700, "epoch": 2683} {"train_loss": -6.560841083526611, "global_step": 112701, "epoch": 2683} {"train_loss": -6.65569543838501, "global_step": 112702, "epoch": 2683} {"train_loss": -6.530636787414551, "global_step": 112703, "epoch": 2683} {"train_loss": -6.510209083557129, "global_step": 112704, "epoch": 2683} {"train_loss": -6.501100540161133, "global_step": 112705, "epoch": 2683} {"train_loss": -6.4526872634887695, "global_step": 112706, "epoch": 2683} {"train_loss": -6.596413612365723, "global_step": 112707, "epoch": 2683} {"train_loss": -6.6198930740356445, "global_step": 112708, "epoch": 2683} {"train_loss": -6.627660751342773, "global_step": 112709, "epoch": 2683} {"train_loss": -6.5086517333984375, "global_step": 112710, "epoch": 2683} {"train_loss": -6.508864402770996, "global_step": 112711, "epoch": 2683} {"train_loss": -6.46671199798584, "global_step": 112712, "epoch": 2683} {"train_loss": -6.46641206741333, "global_step": 112713, "epoch": 2683} {"train_loss": -6.539775848388672, "global_step": 112714, "epoch": 2683} {"train_loss": -6.627248764038086, "global_step": 112715, "epoch": 2683} {"train_loss": -6.460220813751221, "global_step": 112716, "epoch": 2683} {"train_loss": -6.4982757568359375, "global_step": 112717, "epoch": 2683} {"train_loss": -6.546926498413086, "global_step": 112718, "epoch": 2683} {"train_loss": -6.470354080200195, "global_step": 112719, "epoch": 2683} {"train_loss": -6.429624080657959, "global_step": 112720, "epoch": 2683} {"train_loss": -6.345771312713623, "global_step": 112721, "epoch": 2683} {"train_loss": -6.364833831787109, "global_step": 112722, "epoch": 2683} {"train_loss": -6.512895584106445, "global_step": 112723, "epoch": 2683} {"train_loss": -6.432397842407227, "global_step": 112724, "epoch": 2683} {"train_loss": -6.4679718017578125, "global_step": 112725, "epoch": 2683} {"train_loss": -6.459141731262207, "global_step": 112726, "epoch": 2683} {"train_loss": -6.495142312276931, "global_step": 112727, "epoch": 2683, "val_loss": 64999.734375} {"train_loss": -6.482891082763672, "global_step": 112728, "epoch": 2684} {"train_loss": -6.545358180999756, "global_step": 112729, "epoch": 2684} {"train_loss": -6.447390556335449, "global_step": 112730, "epoch": 2684} {"train_loss": -6.375267028808594, "global_step": 112731, "epoch": 2684} {"train_loss": -6.421771049499512, "global_step": 112732, "epoch": 2684} {"train_loss": -6.530169486999512, "global_step": 112733, "epoch": 2684} {"train_loss": -6.431853294372559, "global_step": 112734, "epoch": 2684} {"train_loss": -6.51229190826416, "global_step": 112735, "epoch": 2684} {"train_loss": -6.423711776733398, "global_step": 112736, "epoch": 2684} {"train_loss": -6.565826416015625, "global_step": 112737, "epoch": 2684} {"train_loss": -6.4527716636657715, "global_step": 112738, "epoch": 2684} {"train_loss": -6.597177505493164, "global_step": 112739, "epoch": 2684} {"train_loss": -6.497536659240723, "global_step": 112740, "epoch": 2684} {"train_loss": -6.496260166168213, "global_step": 112741, "epoch": 2684} {"train_loss": -6.527675628662109, "global_step": 112742, "epoch": 2684} {"train_loss": -6.563086032867432, "global_step": 112743, "epoch": 2684} {"train_loss": -6.519647121429443, "global_step": 112744, "epoch": 2684} {"train_loss": -6.511568546295166, "global_step": 112745, "epoch": 2684} {"train_loss": -6.426504611968994, "global_step": 112746, "epoch": 2684} {"train_loss": -6.513710975646973, "global_step": 112747, "epoch": 2684} {"train_loss": -6.605457782745361, "global_step": 112748, "epoch": 2684} {"train_loss": -6.462502479553223, "global_step": 112749, "epoch": 2684} {"train_loss": -6.589811325073242, "global_step": 112750, "epoch": 2684} {"train_loss": -6.466711521148682, "global_step": 112751, "epoch": 2684} {"train_loss": -6.400167465209961, "global_step": 112752, "epoch": 2684} {"train_loss": -6.565650463104248, "global_step": 112753, "epoch": 2684} {"train_loss": -6.300658226013184, "global_step": 112754, "epoch": 2684} {"train_loss": -6.483295440673828, "global_step": 112755, "epoch": 2684} {"train_loss": -6.5968523025512695, "global_step": 112756, "epoch": 2684} {"train_loss": -6.381156921386719, "global_step": 112757, "epoch": 2684} {"train_loss": -6.5272536277771, "global_step": 112758, "epoch": 2684} {"train_loss": -6.305237770080566, "global_step": 112759, "epoch": 2684} {"train_loss": -6.450188159942627, "global_step": 112760, "epoch": 2684} {"train_loss": -6.467274188995361, "global_step": 112761, "epoch": 2684} {"train_loss": -6.44654655456543, "global_step": 112762, "epoch": 2684} {"train_loss": -6.545543193817139, "global_step": 112763, "epoch": 2684} {"train_loss": -6.54258394241333, "global_step": 112764, "epoch": 2684} {"train_loss": -6.380704402923584, "global_step": 112765, "epoch": 2684} {"train_loss": -6.5607709884643555, "global_step": 112766, "epoch": 2684} {"train_loss": -6.443081855773926, "global_step": 112767, "epoch": 2684} {"train_loss": -6.487740993499756, "global_step": 112768, "epoch": 2684} {"train_loss": -6.483866350991385, "global_step": 112769, "epoch": 2684, "val_loss": 65337.56640625} {"train_loss": -6.397650718688965, "global_step": 112770, "epoch": 2685} {"train_loss": -6.46596622467041, "global_step": 112771, "epoch": 2685} {"train_loss": -6.526244163513184, "global_step": 112772, "epoch": 2685} {"train_loss": -6.413189888000488, "global_step": 112773, "epoch": 2685} {"train_loss": -6.452526569366455, "global_step": 112774, "epoch": 2685} {"train_loss": -6.580512046813965, "global_step": 112775, "epoch": 2685} {"train_loss": -6.433181285858154, "global_step": 112776, "epoch": 2685} {"train_loss": -6.467688083648682, "global_step": 112777, "epoch": 2685} {"train_loss": -6.571231842041016, "global_step": 112778, "epoch": 2685} {"train_loss": -6.616665363311768, "global_step": 112779, "epoch": 2685} {"train_loss": -6.606329441070557, "global_step": 112780, "epoch": 2685} {"train_loss": -6.522944927215576, "global_step": 112781, "epoch": 2685} {"train_loss": -6.556232452392578, "global_step": 112782, "epoch": 2685} {"train_loss": -6.471139907836914, "global_step": 112783, "epoch": 2685} {"train_loss": -6.38104772567749, "global_step": 112784, "epoch": 2685} {"train_loss": -6.502971649169922, "global_step": 112785, "epoch": 2685} {"train_loss": -6.598184108734131, "global_step": 112786, "epoch": 2685} {"train_loss": -6.5075836181640625, "global_step": 112787, "epoch": 2685} {"train_loss": -6.624658584594727, "global_step": 112788, "epoch": 2685} {"train_loss": -6.483511924743652, "global_step": 112789, "epoch": 2685} {"train_loss": -6.489973545074463, "global_step": 112790, "epoch": 2685} {"train_loss": -6.594620227813721, "global_step": 112791, "epoch": 2685} {"train_loss": -6.545435428619385, "global_step": 112792, "epoch": 2685} {"train_loss": -6.388332366943359, "global_step": 112793, "epoch": 2685} {"train_loss": -6.47274112701416, "global_step": 112794, "epoch": 2685} {"train_loss": -6.470625877380371, "global_step": 112795, "epoch": 2685} {"train_loss": -6.536378383636475, "global_step": 112796, "epoch": 2685} {"train_loss": -6.517482757568359, "global_step": 112797, "epoch": 2685} {"train_loss": -6.467217922210693, "global_step": 112798, "epoch": 2685} {"train_loss": -6.534836292266846, "global_step": 112799, "epoch": 2685} {"train_loss": -6.555692672729492, "global_step": 112800, "epoch": 2685} {"train_loss": -6.479526042938232, "global_step": 112801, "epoch": 2685} {"train_loss": -6.512027740478516, "global_step": 112802, "epoch": 2685} {"train_loss": -6.359881401062012, "global_step": 112803, "epoch": 2685} {"train_loss": -6.5598273277282715, "global_step": 112804, "epoch": 2685} {"train_loss": -6.4844136238098145, "global_step": 112805, "epoch": 2685} {"train_loss": -6.528897762298584, "global_step": 112806, "epoch": 2685} {"train_loss": -6.54658317565918, "global_step": 112807, "epoch": 2685} {"train_loss": -6.431180953979492, "global_step": 112808, "epoch": 2685} {"train_loss": -6.60176420211792, "global_step": 112809, "epoch": 2685} {"train_loss": -6.566990375518799, "global_step": 112810, "epoch": 2685} {"train_loss": -6.506070579801287, "global_step": 112811, "epoch": 2685, "val_loss": 65168.37890625} {"train_loss": -6.6155500411987305, "global_step": 112812, "epoch": 2686} {"train_loss": -6.629278659820557, "global_step": 112813, "epoch": 2686} {"train_loss": -6.383149147033691, "global_step": 112814, "epoch": 2686} {"train_loss": -6.532609939575195, "global_step": 112815, "epoch": 2686} {"train_loss": -6.5384931564331055, "global_step": 112816, "epoch": 2686} {"train_loss": -6.422928333282471, "global_step": 112817, "epoch": 2686} {"train_loss": -6.457656383514404, "global_step": 112818, "epoch": 2686} {"train_loss": -6.489158630371094, "global_step": 112819, "epoch": 2686} {"train_loss": -6.426505088806152, "global_step": 112820, "epoch": 2686} {"train_loss": -6.620710372924805, "global_step": 112821, "epoch": 2686} {"train_loss": -6.466952323913574, "global_step": 112822, "epoch": 2686} {"train_loss": -6.466273307800293, "global_step": 112823, "epoch": 2686} {"train_loss": -6.584410667419434, "global_step": 112824, "epoch": 2686} {"train_loss": -6.4605913162231445, "global_step": 112825, "epoch": 2686} {"train_loss": -6.396986961364746, "global_step": 112826, "epoch": 2686} {"train_loss": -6.52086877822876, "global_step": 112827, "epoch": 2686} {"train_loss": -6.360799789428711, "global_step": 112828, "epoch": 2686} {"train_loss": -6.379335403442383, "global_step": 112829, "epoch": 2686} {"train_loss": -6.406662940979004, "global_step": 112830, "epoch": 2686} {"train_loss": -6.438867568969727, "global_step": 112831, "epoch": 2686} {"train_loss": -6.292430877685547, "global_step": 112832, "epoch": 2686} {"train_loss": -6.347565650939941, "global_step": 112833, "epoch": 2686} {"train_loss": -6.4973368644714355, "global_step": 112834, "epoch": 2686} {"train_loss": -6.349768161773682, "global_step": 112835, "epoch": 2686} {"train_loss": -6.473822593688965, "global_step": 112836, "epoch": 2686} {"train_loss": -6.399568557739258, "global_step": 112837, "epoch": 2686} {"train_loss": -6.438929080963135, "global_step": 112838, "epoch": 2686} {"train_loss": -6.353433609008789, "global_step": 112839, "epoch": 2686} {"train_loss": -6.473346710205078, "global_step": 112840, "epoch": 2686} {"train_loss": -6.50476598739624, "global_step": 112841, "epoch": 2686} {"train_loss": -6.55996561050415, "global_step": 112842, "epoch": 2686} {"train_loss": -6.588627338409424, "global_step": 112843, "epoch": 2686} {"train_loss": -6.3739519119262695, "global_step": 112844, "epoch": 2686} {"train_loss": -6.554831504821777, "global_step": 112845, "epoch": 2686} {"train_loss": -6.412160873413086, "global_step": 112846, "epoch": 2686} {"train_loss": -6.517531394958496, "global_step": 112847, "epoch": 2686} {"train_loss": -6.424500465393066, "global_step": 112848, "epoch": 2686} {"train_loss": -6.461133003234863, "global_step": 112849, "epoch": 2686} {"train_loss": -6.486840724945068, "global_step": 112850, "epoch": 2686} {"train_loss": -6.545903205871582, "global_step": 112851, "epoch": 2686} {"train_loss": -6.4861297607421875, "global_step": 112852, "epoch": 2686} {"train_loss": -6.469288212912423, "global_step": 112853, "epoch": 2686, "val_loss": 65069.22265625} {"train_loss": -6.52657413482666, "global_step": 112854, "epoch": 2687} {"train_loss": -6.500815391540527, "global_step": 112855, "epoch": 2687} {"train_loss": -6.439652919769287, "global_step": 112856, "epoch": 2687} {"train_loss": -6.446009635925293, "global_step": 112857, "epoch": 2687} {"train_loss": -6.37383508682251, "global_step": 112858, "epoch": 2687} {"train_loss": -6.5440168380737305, "global_step": 112859, "epoch": 2687} {"train_loss": -6.383472442626953, "global_step": 112860, "epoch": 2687} {"train_loss": -6.4499101638793945, "global_step": 112861, "epoch": 2687} {"train_loss": -6.374506950378418, "global_step": 112862, "epoch": 2687} {"train_loss": -6.311382293701172, "global_step": 112863, "epoch": 2687} {"train_loss": -6.493503570556641, "global_step": 112864, "epoch": 2687} {"train_loss": -6.487037658691406, "global_step": 112865, "epoch": 2687} {"train_loss": -6.412149429321289, "global_step": 112866, "epoch": 2687} {"train_loss": -6.565267562866211, "global_step": 112867, "epoch": 2687} {"train_loss": -6.5147480964660645, "global_step": 112868, "epoch": 2687} {"train_loss": -6.608105659484863, "global_step": 112869, "epoch": 2687} {"train_loss": -6.483828067779541, "global_step": 112870, "epoch": 2687} {"train_loss": -6.532235622406006, "global_step": 112871, "epoch": 2687} {"train_loss": -6.4344329833984375, "global_step": 112872, "epoch": 2687} {"train_loss": -6.443213939666748, "global_step": 112873, "epoch": 2687} {"train_loss": -6.398242950439453, "global_step": 112874, "epoch": 2687} {"train_loss": -6.402055740356445, "global_step": 112875, "epoch": 2687} {"train_loss": -6.462226390838623, "global_step": 112876, "epoch": 2687} {"train_loss": -6.4278035163879395, "global_step": 112877, "epoch": 2687} {"train_loss": -6.430641174316406, "global_step": 112878, "epoch": 2687} {"train_loss": -6.426760673522949, "global_step": 112879, "epoch": 2687} {"train_loss": -6.473427772521973, "global_step": 112880, "epoch": 2687} {"train_loss": -6.51414680480957, "global_step": 112881, "epoch": 2687} {"train_loss": -6.4996538162231445, "global_step": 112882, "epoch": 2687} {"train_loss": -6.408485412597656, "global_step": 112883, "epoch": 2687} {"train_loss": -6.498538494110107, "global_step": 112884, "epoch": 2687} {"train_loss": -6.415859222412109, "global_step": 112885, "epoch": 2687} {"train_loss": -6.458182334899902, "global_step": 112886, "epoch": 2687} {"train_loss": -6.365540504455566, "global_step": 112887, "epoch": 2687} {"train_loss": -6.515300750732422, "global_step": 112888, "epoch": 2687} {"train_loss": -6.307884693145752, "global_step": 112889, "epoch": 2687} {"train_loss": -6.415969371795654, "global_step": 112890, "epoch": 2687} {"train_loss": -6.4204864501953125, "global_step": 112891, "epoch": 2687} {"train_loss": -6.4537835121154785, "global_step": 112892, "epoch": 2687} {"train_loss": -6.453995227813721, "global_step": 112893, "epoch": 2687} {"train_loss": -6.431354522705078, "global_step": 112894, "epoch": 2687} {"train_loss": -6.453887212844122, "global_step": 112895, "epoch": 2687, "val_loss": 65189.33984375} {"train_loss": -6.4269561767578125, "global_step": 112896, "epoch": 2688} {"train_loss": -6.4366865158081055, "global_step": 112897, "epoch": 2688} {"train_loss": -6.557631492614746, "global_step": 112898, "epoch": 2688} {"train_loss": -6.511425018310547, "global_step": 112899, "epoch": 2688} {"train_loss": -6.460083961486816, "global_step": 112900, "epoch": 2688} {"train_loss": -6.421152114868164, "global_step": 112901, "epoch": 2688} {"train_loss": -6.47872257232666, "global_step": 112902, "epoch": 2688} {"train_loss": -6.447420120239258, "global_step": 112903, "epoch": 2688} {"train_loss": -6.397795677185059, "global_step": 112904, "epoch": 2688} {"train_loss": -6.494134902954102, "global_step": 112905, "epoch": 2688} {"train_loss": -6.547314167022705, "global_step": 112906, "epoch": 2688} {"train_loss": -6.453190803527832, "global_step": 112907, "epoch": 2688} {"train_loss": -6.58903169631958, "global_step": 112908, "epoch": 2688} {"train_loss": -6.444222450256348, "global_step": 112909, "epoch": 2688} {"train_loss": -6.516022682189941, "global_step": 112910, "epoch": 2688} {"train_loss": -6.494797706604004, "global_step": 112911, "epoch": 2688} {"train_loss": -6.403153419494629, "global_step": 112912, "epoch": 2688} {"train_loss": -6.4492034912109375, "global_step": 112913, "epoch": 2688} {"train_loss": -6.537951469421387, "global_step": 112914, "epoch": 2688} {"train_loss": -6.545660972595215, "global_step": 112915, "epoch": 2688} {"train_loss": -6.486757755279541, "global_step": 112916, "epoch": 2688} {"train_loss": -6.55230712890625, "global_step": 112917, "epoch": 2688} {"train_loss": -6.451227188110352, "global_step": 112918, "epoch": 2688} {"train_loss": -6.4587297439575195, "global_step": 112919, "epoch": 2688} {"train_loss": -6.512050628662109, "global_step": 112920, "epoch": 2688} {"train_loss": -6.595821380615234, "global_step": 112921, "epoch": 2688} {"train_loss": -6.406223297119141, "global_step": 112922, "epoch": 2688} {"train_loss": -6.5087504386901855, "global_step": 112923, "epoch": 2688} {"train_loss": -6.462532997131348, "global_step": 112924, "epoch": 2688} {"train_loss": -6.385261058807373, "global_step": 112925, "epoch": 2688} {"train_loss": -6.547521114349365, "global_step": 112926, "epoch": 2688} {"train_loss": -6.353153228759766, "global_step": 112927, "epoch": 2688} {"train_loss": -6.448580741882324, "global_step": 112928, "epoch": 2688} {"train_loss": -6.437965393066406, "global_step": 112929, "epoch": 2688} {"train_loss": -6.558374881744385, "global_step": 112930, "epoch": 2688} {"train_loss": -6.463407516479492, "global_step": 112931, "epoch": 2688} {"train_loss": -6.62817907333374, "global_step": 112932, "epoch": 2688} {"train_loss": -6.546148300170898, "global_step": 112933, "epoch": 2688} {"train_loss": -6.493380546569824, "global_step": 112934, "epoch": 2688} {"train_loss": -6.510669708251953, "global_step": 112935, "epoch": 2688} {"train_loss": -6.515573978424072, "global_step": 112936, "epoch": 2688} {"train_loss": -6.489887873331706, "global_step": 112937, "epoch": 2688, "val_loss": 65163.046875} {"train_loss": -6.514753341674805, "global_step": 112938, "epoch": 2689} {"train_loss": -6.517153739929199, "global_step": 112939, "epoch": 2689} {"train_loss": -6.556159973144531, "global_step": 112940, "epoch": 2689} {"train_loss": -6.566068172454834, "global_step": 112941, "epoch": 2689} {"train_loss": -6.57369327545166, "global_step": 112942, "epoch": 2689} {"train_loss": -6.586535930633545, "global_step": 112943, "epoch": 2689} {"train_loss": -6.464468002319336, "global_step": 112944, "epoch": 2689} {"train_loss": -6.61064338684082, "global_step": 112945, "epoch": 2689} {"train_loss": -6.608734607696533, "global_step": 112946, "epoch": 2689} {"train_loss": -6.538146018981934, "global_step": 112947, "epoch": 2689} {"train_loss": -6.560449123382568, "global_step": 112948, "epoch": 2689} {"train_loss": -6.535506248474121, "global_step": 112949, "epoch": 2689} {"train_loss": -6.558566570281982, "global_step": 112950, "epoch": 2689} {"train_loss": -6.518695831298828, "global_step": 112951, "epoch": 2689} {"train_loss": -6.698766708374023, "global_step": 112952, "epoch": 2689} {"train_loss": -6.52325963973999, "global_step": 112953, "epoch": 2689} {"train_loss": -6.660010814666748, "global_step": 112954, "epoch": 2689} {"train_loss": -6.417324066162109, "global_step": 112955, "epoch": 2689} {"train_loss": -6.395495414733887, "global_step": 112956, "epoch": 2689} {"train_loss": -6.4982757568359375, "global_step": 112957, "epoch": 2689} {"train_loss": -6.377849102020264, "global_step": 112958, "epoch": 2689} {"train_loss": -6.417267322540283, "global_step": 112959, "epoch": 2689} {"train_loss": -6.476230621337891, "global_step": 112960, "epoch": 2689} {"train_loss": -6.531861782073975, "global_step": 112961, "epoch": 2689} {"train_loss": -6.405759811401367, "global_step": 112962, "epoch": 2689} {"train_loss": -6.438920974731445, "global_step": 112963, "epoch": 2689} {"train_loss": -6.393630027770996, "global_step": 112964, "epoch": 2689} {"train_loss": -6.479109764099121, "global_step": 112965, "epoch": 2689} {"train_loss": -6.433663368225098, "global_step": 112966, "epoch": 2689} {"train_loss": -6.395944595336914, "global_step": 112967, "epoch": 2689} {"train_loss": -6.423316955566406, "global_step": 112968, "epoch": 2689} {"train_loss": -6.465313911437988, "global_step": 112969, "epoch": 2689} {"train_loss": -6.468143939971924, "global_step": 112970, "epoch": 2689} {"train_loss": -6.502762794494629, "global_step": 112971, "epoch": 2689} {"train_loss": -6.456918716430664, "global_step": 112972, "epoch": 2689} {"train_loss": -6.434471130371094, "global_step": 112973, "epoch": 2689} {"train_loss": -6.425357341766357, "global_step": 112974, "epoch": 2689} {"train_loss": -6.512999057769775, "global_step": 112975, "epoch": 2689} {"train_loss": -6.461589813232422, "global_step": 112976, "epoch": 2689} {"train_loss": -6.462547779083252, "global_step": 112977, "epoch": 2689} {"train_loss": -6.439797401428223, "global_step": 112978, "epoch": 2689} {"train_loss": -6.494164569037301, "global_step": 112979, "epoch": 2689, "val_loss": 65371.17578125} {"train_loss": -6.431645393371582, "global_step": 112980, "epoch": 2690} {"train_loss": -6.494256973266602, "global_step": 112981, "epoch": 2690} {"train_loss": -6.390178680419922, "global_step": 112982, "epoch": 2690} {"train_loss": -6.402087211608887, "global_step": 112983, "epoch": 2690} {"train_loss": -6.376430511474609, "global_step": 112984, "epoch": 2690} {"train_loss": -6.5962114334106445, "global_step": 112985, "epoch": 2690} {"train_loss": -6.549111366271973, "global_step": 112986, "epoch": 2690} {"train_loss": -6.548974990844727, "global_step": 112987, "epoch": 2690} {"train_loss": -6.5135040283203125, "global_step": 112988, "epoch": 2690} {"train_loss": -6.564728736877441, "global_step": 112989, "epoch": 2690} {"train_loss": -6.481597423553467, "global_step": 112990, "epoch": 2690} {"train_loss": -6.574195861816406, "global_step": 112991, "epoch": 2690} {"train_loss": -6.46088171005249, "global_step": 112992, "epoch": 2690} {"train_loss": -6.572118759155273, "global_step": 112993, "epoch": 2690} {"train_loss": -6.5000715255737305, "global_step": 112994, "epoch": 2690} {"train_loss": -6.543575286865234, "global_step": 112995, "epoch": 2690} {"train_loss": -6.498904228210449, "global_step": 112996, "epoch": 2690} {"train_loss": -6.47395133972168, "global_step": 112997, "epoch": 2690} {"train_loss": -6.584095001220703, "global_step": 112998, "epoch": 2690} {"train_loss": -6.495599269866943, "global_step": 112999, "epoch": 2690} {"train_loss": -6.566206932067871, "global_step": 113000, "epoch": 2690} {"train_loss": -6.4936842918396, "global_step": 113001, "epoch": 2690} {"train_loss": -6.457695960998535, "global_step": 113002, "epoch": 2690} {"train_loss": -6.543975830078125, "global_step": 113003, "epoch": 2690} {"train_loss": -6.47022008895874, "global_step": 113004, "epoch": 2690} {"train_loss": -6.58184814453125, "global_step": 113005, "epoch": 2690} {"train_loss": -6.482898712158203, "global_step": 113006, "epoch": 2690} {"train_loss": -6.526630401611328, "global_step": 113007, "epoch": 2690} {"train_loss": -6.452165603637695, "global_step": 113008, "epoch": 2690} {"train_loss": -6.389820098876953, "global_step": 113009, "epoch": 2690} {"train_loss": -6.480243682861328, "global_step": 113010, "epoch": 2690} {"train_loss": -6.4319844245910645, "global_step": 113011, "epoch": 2690} {"train_loss": -6.518560409545898, "global_step": 113012, "epoch": 2690} {"train_loss": -6.424338340759277, "global_step": 113013, "epoch": 2690} {"train_loss": -6.577669143676758, "global_step": 113014, "epoch": 2690} {"train_loss": -6.44801664352417, "global_step": 113015, "epoch": 2690} {"train_loss": -6.426177978515625, "global_step": 113016, "epoch": 2690} {"train_loss": -6.433070182800293, "global_step": 113017, "epoch": 2690} {"train_loss": -6.461002349853516, "global_step": 113018, "epoch": 2690} {"train_loss": -6.461897850036621, "global_step": 113019, "epoch": 2690} {"train_loss": -6.438163757324219, "global_step": 113020, "epoch": 2690} {"train_loss": -6.4893641244797475, "global_step": 113021, "epoch": 2690, "val_loss": 65088.00390625} {"train_loss": -6.555702209472656, "global_step": 113022, "epoch": 2691} {"train_loss": -6.445392608642578, "global_step": 113023, "epoch": 2691} {"train_loss": -6.541751384735107, "global_step": 113024, "epoch": 2691} {"train_loss": -6.4284210205078125, "global_step": 113025, "epoch": 2691} {"train_loss": -6.5112504959106445, "global_step": 113026, "epoch": 2691} {"train_loss": -6.515789031982422, "global_step": 113027, "epoch": 2691} {"train_loss": -6.459375381469727, "global_step": 113028, "epoch": 2691} {"train_loss": -6.448179244995117, "global_step": 113029, "epoch": 2691} {"train_loss": -6.494132995605469, "global_step": 113030, "epoch": 2691} {"train_loss": -6.5153021812438965, "global_step": 113031, "epoch": 2691} {"train_loss": -6.427702903747559, "global_step": 113032, "epoch": 2691} {"train_loss": -6.580071926116943, "global_step": 113033, "epoch": 2691} {"train_loss": -6.548274993896484, "global_step": 113034, "epoch": 2691} {"train_loss": -6.274878025054932, "global_step": 113035, "epoch": 2691} {"train_loss": -6.507497787475586, "global_step": 113036, "epoch": 2691} {"train_loss": -6.450926303863525, "global_step": 113037, "epoch": 2691} {"train_loss": -6.530712127685547, "global_step": 113038, "epoch": 2691} {"train_loss": -6.473596572875977, "global_step": 113039, "epoch": 2691} {"train_loss": -6.575659275054932, "global_step": 113040, "epoch": 2691} {"train_loss": -6.516404151916504, "global_step": 113041, "epoch": 2691} {"train_loss": -6.414778232574463, "global_step": 113042, "epoch": 2691} {"train_loss": -6.566472053527832, "global_step": 113043, "epoch": 2691} {"train_loss": -6.507546424865723, "global_step": 113044, "epoch": 2691} {"train_loss": -6.533756256103516, "global_step": 113045, "epoch": 2691} {"train_loss": -6.545652389526367, "global_step": 113046, "epoch": 2691} {"train_loss": -6.5275678634643555, "global_step": 113047, "epoch": 2691} {"train_loss": -6.513049125671387, "global_step": 113048, "epoch": 2691} {"train_loss": -6.548513412475586, "global_step": 113049, "epoch": 2691} {"train_loss": -6.5862836837768555, "global_step": 113050, "epoch": 2691} {"train_loss": -6.586188316345215, "global_step": 113051, "epoch": 2691} {"train_loss": -6.449568748474121, "global_step": 113052, "epoch": 2691} {"train_loss": -6.564642429351807, "global_step": 113053, "epoch": 2691} {"train_loss": -6.478122711181641, "global_step": 113054, "epoch": 2691} {"train_loss": -6.567632675170898, "global_step": 113055, "epoch": 2691} {"train_loss": -6.477038383483887, "global_step": 113056, "epoch": 2691} {"train_loss": -6.558952331542969, "global_step": 113057, "epoch": 2691} {"train_loss": -6.506420612335205, "global_step": 113058, "epoch": 2691} {"train_loss": -6.515758991241455, "global_step": 113059, "epoch": 2691} {"train_loss": -6.598230361938477, "global_step": 113060, "epoch": 2691} {"train_loss": -6.572005271911621, "global_step": 113061, "epoch": 2691} {"train_loss": -6.534158706665039, "global_step": 113062, "epoch": 2691} {"train_loss": -6.512146586463565, "global_step": 113063, "epoch": 2691, "val_loss": 65070.5546875} {"train_loss": -6.611120223999023, "global_step": 113064, "epoch": 2692} {"train_loss": -6.507662296295166, "global_step": 113065, "epoch": 2692} {"train_loss": -6.576228618621826, "global_step": 113066, "epoch": 2692} {"train_loss": -6.573733329772949, "global_step": 113067, "epoch": 2692} {"train_loss": -6.537461757659912, "global_step": 113068, "epoch": 2692} {"train_loss": -6.678423881530762, "global_step": 113069, "epoch": 2692} {"train_loss": -6.529343605041504, "global_step": 113070, "epoch": 2692} {"train_loss": -6.63087272644043, "global_step": 113071, "epoch": 2692} {"train_loss": -6.483470916748047, "global_step": 113072, "epoch": 2692} {"train_loss": -6.533475875854492, "global_step": 113073, "epoch": 2692} {"train_loss": -6.619483470916748, "global_step": 113074, "epoch": 2692} {"train_loss": -6.730032920837402, "global_step": 113075, "epoch": 2692} {"train_loss": -6.595951080322266, "global_step": 113076, "epoch": 2692} {"train_loss": -6.42080545425415, "global_step": 113077, "epoch": 2692} {"train_loss": -6.635819435119629, "global_step": 113078, "epoch": 2692} {"train_loss": -6.46929931640625, "global_step": 113079, "epoch": 2692} {"train_loss": -6.509617805480957, "global_step": 113080, "epoch": 2692} {"train_loss": -6.614948749542236, "global_step": 113081, "epoch": 2692} {"train_loss": -6.490632057189941, "global_step": 113082, "epoch": 2692} {"train_loss": -6.519775390625, "global_step": 113083, "epoch": 2692} {"train_loss": -6.548510551452637, "global_step": 113084, "epoch": 2692} {"train_loss": -6.480404853820801, "global_step": 113085, "epoch": 2692} {"train_loss": -6.643502235412598, "global_step": 113086, "epoch": 2692} {"train_loss": -6.4325761795043945, "global_step": 113087, "epoch": 2692} {"train_loss": -6.54967737197876, "global_step": 113088, "epoch": 2692} {"train_loss": -6.439000129699707, "global_step": 113089, "epoch": 2692} {"train_loss": -6.514543533325195, "global_step": 113090, "epoch": 2692} {"train_loss": -6.524410247802734, "global_step": 113091, "epoch": 2692} {"train_loss": -6.495168685913086, "global_step": 113092, "epoch": 2692} {"train_loss": -6.461711883544922, "global_step": 113093, "epoch": 2692} {"train_loss": -6.508465766906738, "global_step": 113094, "epoch": 2692} {"train_loss": -6.539936542510986, "global_step": 113095, "epoch": 2692} {"train_loss": -6.511449813842773, "global_step": 113096, "epoch": 2692} {"train_loss": -6.603580951690674, "global_step": 113097, "epoch": 2692} {"train_loss": -6.518580913543701, "global_step": 113098, "epoch": 2692} {"train_loss": -6.585221767425537, "global_step": 113099, "epoch": 2692} {"train_loss": -6.574739456176758, "global_step": 113100, "epoch": 2692} {"train_loss": -6.523348808288574, "global_step": 113101, "epoch": 2692} {"train_loss": -6.523924827575684, "global_step": 113102, "epoch": 2692} {"train_loss": -6.405447959899902, "global_step": 113103, "epoch": 2692} {"train_loss": -6.475949764251709, "global_step": 113104, "epoch": 2692} {"train_loss": -6.539451962425595, "global_step": 113105, "epoch": 2692, "val_loss": 65297.7109375} {"train_loss": -6.354002952575684, "global_step": 113106, "epoch": 2693} {"train_loss": -6.576939582824707, "global_step": 113107, "epoch": 2693} {"train_loss": -6.542902946472168, "global_step": 113108, "epoch": 2693} {"train_loss": -6.4250264167785645, "global_step": 113109, "epoch": 2693} {"train_loss": -6.40486478805542, "global_step": 113110, "epoch": 2693} {"train_loss": -6.485057830810547, "global_step": 113111, "epoch": 2693} {"train_loss": -6.501656532287598, "global_step": 113112, "epoch": 2693} {"train_loss": -6.387749671936035, "global_step": 113113, "epoch": 2693} {"train_loss": -6.338249683380127, "global_step": 113114, "epoch": 2693} {"train_loss": -6.521151542663574, "global_step": 113115, "epoch": 2693} {"train_loss": -6.46921443939209, "global_step": 113116, "epoch": 2693} {"train_loss": -6.342497825622559, "global_step": 113117, "epoch": 2693} {"train_loss": -6.505472183227539, "global_step": 113118, "epoch": 2693} {"train_loss": -6.385309219360352, "global_step": 113119, "epoch": 2693} {"train_loss": -6.570794105529785, "global_step": 113120, "epoch": 2693} {"train_loss": -6.539339542388916, "global_step": 113121, "epoch": 2693} {"train_loss": -6.3860321044921875, "global_step": 113122, "epoch": 2693} {"train_loss": -6.465784072875977, "global_step": 113123, "epoch": 2693} {"train_loss": -6.44471549987793, "global_step": 113124, "epoch": 2693} {"train_loss": -6.44944953918457, "global_step": 113125, "epoch": 2693} {"train_loss": -6.631404876708984, "global_step": 113126, "epoch": 2693} {"train_loss": -6.558215141296387, "global_step": 113127, "epoch": 2693} {"train_loss": -6.5245819091796875, "global_step": 113128, "epoch": 2693} {"train_loss": -6.518521308898926, "global_step": 113129, "epoch": 2693} {"train_loss": -6.489899635314941, "global_step": 113130, "epoch": 2693} {"train_loss": -6.521830081939697, "global_step": 113131, "epoch": 2693} {"train_loss": -6.45177698135376, "global_step": 113132, "epoch": 2693} {"train_loss": -6.665282249450684, "global_step": 113133, "epoch": 2693} {"train_loss": -6.3810133934021, "global_step": 113134, "epoch": 2693} {"train_loss": -6.449343204498291, "global_step": 113135, "epoch": 2693} {"train_loss": -6.4771037101745605, "global_step": 113136, "epoch": 2693} {"train_loss": -6.347458362579346, "global_step": 113137, "epoch": 2693} {"train_loss": -6.627832412719727, "global_step": 113138, "epoch": 2693} {"train_loss": -6.523886680603027, "global_step": 113139, "epoch": 2693} {"train_loss": -6.473465919494629, "global_step": 113140, "epoch": 2693} {"train_loss": -6.456247806549072, "global_step": 113141, "epoch": 2693} {"train_loss": -6.523403167724609, "global_step": 113142, "epoch": 2693} {"train_loss": -6.498195648193359, "global_step": 113143, "epoch": 2693} {"train_loss": -6.509670734405518, "global_step": 113144, "epoch": 2693} {"train_loss": -6.506498336791992, "global_step": 113145, "epoch": 2693} {"train_loss": -6.390054702758789, "global_step": 113146, "epoch": 2693} {"train_loss": -6.477136782237461, "global_step": 113147, "epoch": 2693, "val_loss": 65485.5390625} {"train_loss": -6.52994966506958, "global_step": 113148, "epoch": 2694} {"train_loss": -6.526087284088135, "global_step": 113149, "epoch": 2694} {"train_loss": -6.459078788757324, "global_step": 113150, "epoch": 2694} {"train_loss": -6.4797163009643555, "global_step": 113151, "epoch": 2694} {"train_loss": -6.505348205566406, "global_step": 113152, "epoch": 2694} {"train_loss": -6.539731979370117, "global_step": 113153, "epoch": 2694} {"train_loss": -6.426002025604248, "global_step": 113154, "epoch": 2694} {"train_loss": -6.508563041687012, "global_step": 113155, "epoch": 2694} {"train_loss": -6.530887126922607, "global_step": 113156, "epoch": 2694} {"train_loss": -6.532686710357666, "global_step": 113157, "epoch": 2694} {"train_loss": -6.44178581237793, "global_step": 113158, "epoch": 2694} {"train_loss": -6.497533321380615, "global_step": 113159, "epoch": 2694} {"train_loss": -6.521373748779297, "global_step": 113160, "epoch": 2694} {"train_loss": -6.4712324142456055, "global_step": 113161, "epoch": 2694} {"train_loss": -6.517594337463379, "global_step": 113162, "epoch": 2694} {"train_loss": -6.478557586669922, "global_step": 113163, "epoch": 2694} {"train_loss": -6.5389323234558105, "global_step": 113164, "epoch": 2694} {"train_loss": -6.530609607696533, "global_step": 113165, "epoch": 2694} {"train_loss": -6.458329200744629, "global_step": 113166, "epoch": 2694} {"train_loss": -6.416625022888184, "global_step": 113167, "epoch": 2694} {"train_loss": -6.462868690490723, "global_step": 113168, "epoch": 2694} {"train_loss": -6.412478446960449, "global_step": 113169, "epoch": 2694} {"train_loss": -6.621441841125488, "global_step": 113170, "epoch": 2694} {"train_loss": -6.513830661773682, "global_step": 113171, "epoch": 2694} {"train_loss": -6.3979973793029785, "global_step": 113172, "epoch": 2694} {"train_loss": -6.59657096862793, "global_step": 113173, "epoch": 2694} {"train_loss": -6.373811721801758, "global_step": 113174, "epoch": 2694} {"train_loss": -6.43446159362793, "global_step": 113175, "epoch": 2694} {"train_loss": -6.482013702392578, "global_step": 113176, "epoch": 2694} {"train_loss": -6.410091876983643, "global_step": 113177, "epoch": 2694} {"train_loss": -6.546019077301025, "global_step": 113178, "epoch": 2694} {"train_loss": -6.421858787536621, "global_step": 113179, "epoch": 2694} {"train_loss": -6.55795955657959, "global_step": 113180, "epoch": 2694} {"train_loss": -6.53154993057251, "global_step": 113181, "epoch": 2694} {"train_loss": -6.583249092102051, "global_step": 113182, "epoch": 2694} {"train_loss": -6.438221454620361, "global_step": 113183, "epoch": 2694} {"train_loss": -6.496251106262207, "global_step": 113184, "epoch": 2694} {"train_loss": -6.453134536743164, "global_step": 113185, "epoch": 2694} {"train_loss": -6.386293411254883, "global_step": 113186, "epoch": 2694} {"train_loss": -6.61358642578125, "global_step": 113187, "epoch": 2694} {"train_loss": -6.561954975128174, "global_step": 113188, "epoch": 2694} {"train_loss": -6.492972601027716, "global_step": 113189, "epoch": 2694, "val_loss": 65351.67578125} {"train_loss": -6.478063583374023, "global_step": 113190, "epoch": 2695} {"train_loss": -6.542506217956543, "global_step": 113191, "epoch": 2695} {"train_loss": -6.47952938079834, "global_step": 113192, "epoch": 2695} {"train_loss": -6.461236953735352, "global_step": 113193, "epoch": 2695} {"train_loss": -6.598210334777832, "global_step": 113194, "epoch": 2695} {"train_loss": -6.559453010559082, "global_step": 113195, "epoch": 2695} {"train_loss": -6.53788948059082, "global_step": 113196, "epoch": 2695} {"train_loss": -6.46684455871582, "global_step": 113197, "epoch": 2695} {"train_loss": -6.582549095153809, "global_step": 113198, "epoch": 2695} {"train_loss": -6.496120452880859, "global_step": 113199, "epoch": 2695} {"train_loss": -6.505374431610107, "global_step": 113200, "epoch": 2695} {"train_loss": -6.510946273803711, "global_step": 113201, "epoch": 2695} {"train_loss": -6.398939609527588, "global_step": 113202, "epoch": 2695} {"train_loss": -6.515151023864746, "global_step": 113203, "epoch": 2695} {"train_loss": -6.476790428161621, "global_step": 113204, "epoch": 2695} {"train_loss": -6.58195161819458, "global_step": 113205, "epoch": 2695} {"train_loss": -6.547926902770996, "global_step": 113206, "epoch": 2695} {"train_loss": -6.459354400634766, "global_step": 113207, "epoch": 2695} {"train_loss": -6.382287979125977, "global_step": 113208, "epoch": 2695} {"train_loss": -6.457917213439941, "global_step": 113209, "epoch": 2695} {"train_loss": -6.411168098449707, "global_step": 113210, "epoch": 2695} {"train_loss": -6.342766761779785, "global_step": 113211, "epoch": 2695} {"train_loss": -6.52400016784668, "global_step": 113212, "epoch": 2695} {"train_loss": -6.4865522384643555, "global_step": 113213, "epoch": 2695} {"train_loss": -6.531713962554932, "global_step": 113214, "epoch": 2695} {"train_loss": -6.364633560180664, "global_step": 113215, "epoch": 2695} {"train_loss": -6.512186050415039, "global_step": 113216, "epoch": 2695} {"train_loss": -6.427657127380371, "global_step": 113217, "epoch": 2695} {"train_loss": -6.499035358428955, "global_step": 113218, "epoch": 2695} {"train_loss": -6.3888840675354, "global_step": 113219, "epoch": 2695} {"train_loss": -6.510385036468506, "global_step": 113220, "epoch": 2695} {"train_loss": -6.490090370178223, "global_step": 113221, "epoch": 2695} {"train_loss": -6.390049934387207, "global_step": 113222, "epoch": 2695} {"train_loss": -6.41656494140625, "global_step": 113223, "epoch": 2695} {"train_loss": -6.536664009094238, "global_step": 113224, "epoch": 2695} {"train_loss": -6.50876522064209, "global_step": 113225, "epoch": 2695} {"train_loss": -6.547739028930664, "global_step": 113226, "epoch": 2695} {"train_loss": -6.4042816162109375, "global_step": 113227, "epoch": 2695} {"train_loss": -6.460984230041504, "global_step": 113228, "epoch": 2695} {"train_loss": -6.570040702819824, "global_step": 113229, "epoch": 2695} {"train_loss": -6.292560577392578, "global_step": 113230, "epoch": 2695} {"train_loss": -6.480153129214332, "global_step": 113231, "epoch": 2695, "val_loss": 65147.6328125} {"train_loss": -6.638274669647217, "global_step": 113232, "epoch": 2696} {"train_loss": -6.553708076477051, "global_step": 113233, "epoch": 2696} {"train_loss": -6.469534873962402, "global_step": 113234, "epoch": 2696} {"train_loss": -6.383254528045654, "global_step": 113235, "epoch": 2696} {"train_loss": -6.469499588012695, "global_step": 113236, "epoch": 2696} {"train_loss": -6.314640045166016, "global_step": 113237, "epoch": 2696} {"train_loss": -6.493051052093506, "global_step": 113238, "epoch": 2696} {"train_loss": -6.347963809967041, "global_step": 113239, "epoch": 2696} {"train_loss": -6.375950813293457, "global_step": 113240, "epoch": 2696} {"train_loss": -6.402288436889648, "global_step": 113241, "epoch": 2696} {"train_loss": -6.168347358703613, "global_step": 113242, "epoch": 2696} {"train_loss": -6.492751598358154, "global_step": 113243, "epoch": 2696} {"train_loss": -6.3252410888671875, "global_step": 113244, "epoch": 2696} {"train_loss": -6.389042854309082, "global_step": 113245, "epoch": 2696} {"train_loss": -6.474826812744141, "global_step": 113246, "epoch": 2696} {"train_loss": -6.392053604125977, "global_step": 113247, "epoch": 2696} {"train_loss": -6.46129035949707, "global_step": 113248, "epoch": 2696} {"train_loss": -6.428685188293457, "global_step": 113249, "epoch": 2696} {"train_loss": -6.509864330291748, "global_step": 113250, "epoch": 2696} {"train_loss": -6.486584186553955, "global_step": 113251, "epoch": 2696} {"train_loss": -6.517358779907227, "global_step": 113252, "epoch": 2696} {"train_loss": -6.471792221069336, "global_step": 113253, "epoch": 2696} {"train_loss": -6.45759916305542, "global_step": 113254, "epoch": 2696} {"train_loss": -6.346274375915527, "global_step": 113255, "epoch": 2696} {"train_loss": -6.527039527893066, "global_step": 113256, "epoch": 2696} {"train_loss": -6.382173538208008, "global_step": 113257, "epoch": 2696} {"train_loss": -6.473610877990723, "global_step": 113258, "epoch": 2696} {"train_loss": -6.505532741546631, "global_step": 113259, "epoch": 2696} {"train_loss": -6.4367265701293945, "global_step": 113260, "epoch": 2696} {"train_loss": -6.484273910522461, "global_step": 113261, "epoch": 2696} {"train_loss": -6.355393886566162, "global_step": 113262, "epoch": 2696} {"train_loss": -6.511996269226074, "global_step": 113263, "epoch": 2696} {"train_loss": -6.404815673828125, "global_step": 113264, "epoch": 2696} {"train_loss": -6.395899772644043, "global_step": 113265, "epoch": 2696} {"train_loss": -6.385842800140381, "global_step": 113266, "epoch": 2696} {"train_loss": -6.629075050354004, "global_step": 113267, "epoch": 2696} {"train_loss": -6.537781238555908, "global_step": 113268, "epoch": 2696} {"train_loss": -6.581228256225586, "global_step": 113269, "epoch": 2696} {"train_loss": -6.42926025390625, "global_step": 113270, "epoch": 2696} {"train_loss": -6.519680976867676, "global_step": 113271, "epoch": 2696} {"train_loss": -6.43632698059082, "global_step": 113272, "epoch": 2696} {"train_loss": -6.449917804627192, "global_step": 113273, "epoch": 2696, "val_loss": 65266.0625} {"train_loss": -6.538210868835449, "global_step": 113274, "epoch": 2697} {"train_loss": -6.475305080413818, "global_step": 113275, "epoch": 2697} {"train_loss": -6.536629676818848, "global_step": 113276, "epoch": 2697} {"train_loss": -6.50390625, "global_step": 113277, "epoch": 2697} {"train_loss": -6.560227870941162, "global_step": 113278, "epoch": 2697} {"train_loss": -6.560248851776123, "global_step": 113279, "epoch": 2697} {"train_loss": -6.673681259155273, "global_step": 113280, "epoch": 2697} {"train_loss": -6.513675689697266, "global_step": 113281, "epoch": 2697} {"train_loss": -6.566440582275391, "global_step": 113282, "epoch": 2697} {"train_loss": -6.516548156738281, "global_step": 113283, "epoch": 2697} {"train_loss": -6.577789783477783, "global_step": 113284, "epoch": 2697} {"train_loss": -6.457137107849121, "global_step": 113285, "epoch": 2697} {"train_loss": -6.4480719566345215, "global_step": 113286, "epoch": 2697} {"train_loss": -6.502309322357178, "global_step": 113287, "epoch": 2697} {"train_loss": -6.411556243896484, "global_step": 113288, "epoch": 2697} {"train_loss": -6.513448715209961, "global_step": 113289, "epoch": 2697} {"train_loss": -6.299685478210449, "global_step": 113290, "epoch": 2697} {"train_loss": -6.577807903289795, "global_step": 113291, "epoch": 2697} {"train_loss": -6.420122146606445, "global_step": 113292, "epoch": 2697} {"train_loss": -6.515040397644043, "global_step": 113293, "epoch": 2697} {"train_loss": -6.390239715576172, "global_step": 113294, "epoch": 2697} {"train_loss": -6.402789115905762, "global_step": 113295, "epoch": 2697} {"train_loss": -6.450035095214844, "global_step": 113296, "epoch": 2697} {"train_loss": -6.641960144042969, "global_step": 113297, "epoch": 2697} {"train_loss": -6.45941162109375, "global_step": 113298, "epoch": 2697} {"train_loss": -6.512790679931641, "global_step": 113299, "epoch": 2697} {"train_loss": -6.486374855041504, "global_step": 113300, "epoch": 2697} {"train_loss": -6.448814868927002, "global_step": 113301, "epoch": 2697} {"train_loss": -6.630239963531494, "global_step": 113302, "epoch": 2697} {"train_loss": -6.456536293029785, "global_step": 113303, "epoch": 2697} {"train_loss": -6.324196815490723, "global_step": 113304, "epoch": 2697} {"train_loss": -6.410982131958008, "global_step": 113305, "epoch": 2697} {"train_loss": -6.425601959228516, "global_step": 113306, "epoch": 2697} {"train_loss": -6.273127555847168, "global_step": 113307, "epoch": 2697} {"train_loss": -6.385592460632324, "global_step": 113308, "epoch": 2697} {"train_loss": -6.499617576599121, "global_step": 113309, "epoch": 2697} {"train_loss": -6.372237682342529, "global_step": 113310, "epoch": 2697} {"train_loss": -6.297603607177734, "global_step": 113311, "epoch": 2697} {"train_loss": -6.523804664611816, "global_step": 113312, "epoch": 2697} {"train_loss": -6.3177809715271, "global_step": 113313, "epoch": 2697} {"train_loss": -6.524318695068359, "global_step": 113314, "epoch": 2697} {"train_loss": -6.469477880568731, "global_step": 113315, "epoch": 2697, "val_loss": 65303.10546875} {"train_loss": -6.487210750579834, "global_step": 113316, "epoch": 2698} {"train_loss": -6.477299690246582, "global_step": 113317, "epoch": 2698} {"train_loss": -6.521337509155273, "global_step": 113318, "epoch": 2698} {"train_loss": -6.484509468078613, "global_step": 113319, "epoch": 2698} {"train_loss": -6.356736660003662, "global_step": 113320, "epoch": 2698} {"train_loss": -6.572343826293945, "global_step": 113321, "epoch": 2698} {"train_loss": -6.434681415557861, "global_step": 113322, "epoch": 2698} {"train_loss": -6.433344841003418, "global_step": 113323, "epoch": 2698} {"train_loss": -6.436368465423584, "global_step": 113324, "epoch": 2698} {"train_loss": -6.418540954589844, "global_step": 113325, "epoch": 2698} {"train_loss": -6.413286209106445, "global_step": 113326, "epoch": 2698} {"train_loss": -6.335150241851807, "global_step": 113327, "epoch": 2698} {"train_loss": -6.491652488708496, "global_step": 113328, "epoch": 2698} {"train_loss": -6.418222427368164, "global_step": 113329, "epoch": 2698} {"train_loss": -6.337690353393555, "global_step": 113330, "epoch": 2698} {"train_loss": -6.530362129211426, "global_step": 113331, "epoch": 2698} {"train_loss": -6.5604143142700195, "global_step": 113332, "epoch": 2698} {"train_loss": -6.4749064445495605, "global_step": 113333, "epoch": 2698} {"train_loss": -6.438533782958984, "global_step": 113334, "epoch": 2698} {"train_loss": -6.43035364151001, "global_step": 113335, "epoch": 2698} {"train_loss": -6.4293742179870605, "global_step": 113336, "epoch": 2698} {"train_loss": -6.416526794433594, "global_step": 113337, "epoch": 2698} {"train_loss": -6.453187942504883, "global_step": 113338, "epoch": 2698} {"train_loss": -6.394660472869873, "global_step": 113339, "epoch": 2698} {"train_loss": -6.595078945159912, "global_step": 113340, "epoch": 2698} {"train_loss": -6.422708511352539, "global_step": 113341, "epoch": 2698} {"train_loss": -6.531091213226318, "global_step": 113342, "epoch": 2698} {"train_loss": -6.542950630187988, "global_step": 113343, "epoch": 2698} {"train_loss": -6.512951850891113, "global_step": 113344, "epoch": 2698} {"train_loss": -6.564028263092041, "global_step": 113345, "epoch": 2698} {"train_loss": -6.529228687286377, "global_step": 113346, "epoch": 2698} {"train_loss": -6.373349189758301, "global_step": 113347, "epoch": 2698} {"train_loss": -6.538840293884277, "global_step": 113348, "epoch": 2698} {"train_loss": -6.5396857261657715, "global_step": 113349, "epoch": 2698} {"train_loss": -6.546095848083496, "global_step": 113350, "epoch": 2698} {"train_loss": -6.480554103851318, "global_step": 113351, "epoch": 2698} {"train_loss": -6.498048782348633, "global_step": 113352, "epoch": 2698} {"train_loss": -6.569745063781738, "global_step": 113353, "epoch": 2698} {"train_loss": -6.541319370269775, "global_step": 113354, "epoch": 2698} {"train_loss": -6.475125789642334, "global_step": 113355, "epoch": 2698} {"train_loss": -6.50192928314209, "global_step": 113356, "epoch": 2698} {"train_loss": -6.477687233970279, "global_step": 113357, "epoch": 2698, "val_loss": 65098.34375} {"train_loss": -6.503818035125732, "global_step": 113358, "epoch": 2699} {"train_loss": -6.539969444274902, "global_step": 113359, "epoch": 2699} {"train_loss": -6.590756893157959, "global_step": 113360, "epoch": 2699} {"train_loss": -6.506319046020508, "global_step": 113361, "epoch": 2699} {"train_loss": -6.600971698760986, "global_step": 113362, "epoch": 2699} {"train_loss": -6.6101393699646, "global_step": 113363, "epoch": 2699} {"train_loss": -6.476733207702637, "global_step": 113364, "epoch": 2699} {"train_loss": -6.5012311935424805, "global_step": 113365, "epoch": 2699} {"train_loss": -6.505174160003662, "global_step": 113366, "epoch": 2699} {"train_loss": -6.448328971862793, "global_step": 113367, "epoch": 2699} {"train_loss": -6.624894618988037, "global_step": 113368, "epoch": 2699} {"train_loss": -6.477087497711182, "global_step": 113369, "epoch": 2699} {"train_loss": -6.582235336303711, "global_step": 113370, "epoch": 2699} {"train_loss": -6.518407821655273, "global_step": 113371, "epoch": 2699} {"train_loss": -6.528870582580566, "global_step": 113372, "epoch": 2699} {"train_loss": -6.469722747802734, "global_step": 113373, "epoch": 2699} {"train_loss": -6.593707084655762, "global_step": 113374, "epoch": 2699} {"train_loss": -6.424497604370117, "global_step": 113375, "epoch": 2699} {"train_loss": -6.561273574829102, "global_step": 113376, "epoch": 2699} {"train_loss": -6.58954381942749, "global_step": 113377, "epoch": 2699} {"train_loss": -6.554156303405762, "global_step": 113378, "epoch": 2699} {"train_loss": -6.475419998168945, "global_step": 113379, "epoch": 2699} {"train_loss": -6.536980152130127, "global_step": 113380, "epoch": 2699} {"train_loss": -6.489269256591797, "global_step": 113381, "epoch": 2699} {"train_loss": -6.431802749633789, "global_step": 113382, "epoch": 2699} {"train_loss": -6.544013977050781, "global_step": 113383, "epoch": 2699} {"train_loss": -6.604935646057129, "global_step": 113384, "epoch": 2699} {"train_loss": -6.457096099853516, "global_step": 113385, "epoch": 2699} {"train_loss": -6.584086894989014, "global_step": 113386, "epoch": 2699} {"train_loss": -6.5951008796691895, "global_step": 113387, "epoch": 2699} {"train_loss": -6.515007972717285, "global_step": 113388, "epoch": 2699} {"train_loss": -6.342099189758301, "global_step": 113389, "epoch": 2699} {"train_loss": -6.521256446838379, "global_step": 113390, "epoch": 2699} {"train_loss": -6.470876216888428, "global_step": 113391, "epoch": 2699} {"train_loss": -6.57852029800415, "global_step": 113392, "epoch": 2699} {"train_loss": -6.495459079742432, "global_step": 113393, "epoch": 2699} {"train_loss": -6.467601776123047, "global_step": 113394, "epoch": 2699} {"train_loss": -6.560320854187012, "global_step": 113395, "epoch": 2699} {"train_loss": -6.530702590942383, "global_step": 113396, "epoch": 2699} {"train_loss": -6.519090175628662, "global_step": 113397, "epoch": 2699} {"train_loss": -6.579972743988037, "global_step": 113398, "epoch": 2699} {"train_loss": -6.525448481241862, "global_step": 113399, "epoch": 2699, "val_loss": 65477.24609375} {"train_loss": -6.51276159286499, "global_step": 113400, "epoch": 2700} {"train_loss": -6.427402973175049, "global_step": 113401, "epoch": 2700} {"train_loss": -6.600007057189941, "global_step": 113402, "epoch": 2700} {"train_loss": -6.545060157775879, "global_step": 113403, "epoch": 2700} {"train_loss": -6.568965911865234, "global_step": 113404, "epoch": 2700} {"train_loss": -6.471665859222412, "global_step": 113405, "epoch": 2700} {"train_loss": -6.516493797302246, "global_step": 113406, "epoch": 2700} {"train_loss": -6.436846733093262, "global_step": 113407, "epoch": 2700} {"train_loss": -6.544641971588135, "global_step": 113408, "epoch": 2700} {"train_loss": -6.495933532714844, "global_step": 113409, "epoch": 2700} {"train_loss": -6.648128509521484, "global_step": 113410, "epoch": 2700} {"train_loss": -6.54769229888916, "global_step": 113411, "epoch": 2700} {"train_loss": -6.537310600280762, "global_step": 113412, "epoch": 2700} {"train_loss": -6.550044059753418, "global_step": 113413, "epoch": 2700} {"train_loss": -6.493129730224609, "global_step": 113414, "epoch": 2700} {"train_loss": -6.567343235015869, "global_step": 113415, "epoch": 2700} {"train_loss": -6.557180404663086, "global_step": 113416, "epoch": 2700} {"train_loss": -6.570256233215332, "global_step": 113417, "epoch": 2700} {"train_loss": -6.552679061889648, "global_step": 113418, "epoch": 2700} {"train_loss": -6.5188775062561035, "global_step": 113419, "epoch": 2700} {"train_loss": -6.546984672546387, "global_step": 113420, "epoch": 2700} {"train_loss": -6.585463523864746, "global_step": 113421, "epoch": 2700} {"train_loss": -6.565580368041992, "global_step": 113422, "epoch": 2700} {"train_loss": -6.630214214324951, "global_step": 113423, "epoch": 2700} {"train_loss": -6.637017726898193, "global_step": 113424, "epoch": 2700} {"train_loss": -6.487794876098633, "global_step": 113425, "epoch": 2700} {"train_loss": -6.45512580871582, "global_step": 113426, "epoch": 2700} {"train_loss": -6.484967231750488, "global_step": 113427, "epoch": 2700} {"train_loss": -6.532278537750244, "global_step": 113428, "epoch": 2700} {"train_loss": -6.495901584625244, "global_step": 113429, "epoch": 2700} {"train_loss": -6.530370712280273, "global_step": 113430, "epoch": 2700} {"train_loss": -6.577220916748047, "global_step": 113431, "epoch": 2700} {"train_loss": -6.509483337402344, "global_step": 113432, "epoch": 2700} {"train_loss": -6.471339225769043, "global_step": 113433, "epoch": 2700} {"train_loss": -6.536380767822266, "global_step": 113434, "epoch": 2700} {"train_loss": -6.478970527648926, "global_step": 113435, "epoch": 2700} {"train_loss": -6.447970390319824, "global_step": 113436, "epoch": 2700} {"train_loss": -6.514109134674072, "global_step": 113437, "epoch": 2700} {"train_loss": -6.487142562866211, "global_step": 113438, "epoch": 2700} {"train_loss": -6.461145401000977, "global_step": 113439, "epoch": 2700} {"train_loss": -6.4153056144714355, "global_step": 113440, "epoch": 2700} {"train_loss": -6.524878365652902, "global_step": 113441, "epoch": 2700, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.7048061260831229, "train/sim_max_reward_3": 0.3965775330383614, "train/sim_max_reward_4": 0.8838802162536873, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.33854905246479616, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.7807630849296149, "test/sim_max_reward_4300004": 0.553906357071529, "test/sim_max_reward_4300005": 0.6568659036256179, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.37563899647637705, "test/sim_max_reward_4300008": 0.9604729135129065, "test/sim_max_reward_4300009": 0.9677352582422213, "test/sim_max_reward_4300010": 1.0, "test/sim_max_reward_4300011": 0.30410265293833333, "test/sim_max_reward_4300012": 0.8531595576131965, "test/sim_max_reward_4300013": 0.4041469708694105, "test/sim_max_reward_4300014": 0.9842461089028604, "test/sim_max_reward_4300015": 0.976052917150763, "test/sim_max_reward_4300016": 0.9796093210050835, "test/sim_max_reward_4300017": 0.4195916572077244, "test/sim_max_reward_4300018": 0.4441527319640529, "test/sim_max_reward_4300019": 0.18590665793764194, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 1.0, "test/sim_max_reward_4300022": 0.9553706203806867, "test/sim_max_reward_4300023": 0.3305436891307625, "test/sim_max_reward_4300024": 1.0, "test/sim_max_reward_4300025": 0.4701821708298385, "test/sim_max_reward_4300026": 0.9719212773004801, "test/sim_max_reward_4300027": 1.0, "test/sim_max_reward_4300028": 0.8636889585839101, "test/sim_max_reward_4300029": 0.8233146187523839, "test/sim_max_reward_4300030": 0.9511252700768978, "test/sim_max_reward_4300031": 0.3497790947530539, "test/sim_max_reward_4300032": 0.8766950513918209, "test/sim_max_reward_4300033": 0.711231995698612, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.780973489680214, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8189554959751946, "test/sim_max_reward_4300038": 0.8592824023036921, "test/sim_max_reward_4300039": 0.5042312042954179, "test/sim_max_reward_4300040": 0.866810911826698, "test/sim_max_reward_4300041": 0.9941942013380655, "test/sim_max_reward_4300042": 0.3639241355027848, "test/sim_max_reward_4300043": 0.09358960564622605, "test/sim_max_reward_4300044": 0.9190753166669792, "test/sim_max_reward_4300045": 0.9535523546208754, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.13657524919774633, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.19326239279626828, "train/mean_score": 0.5614243552239019, "test/mean_score": 0.6234474752844843, "val_loss": 65188.74609375} {"train_loss": -6.601230621337891, "global_step": 113442, "epoch": 2701} {"train_loss": -6.474166393280029, "global_step": 113443, "epoch": 2701} {"train_loss": -6.581510543823242, "global_step": 113444, "epoch": 2701} {"train_loss": -6.551481246948242, "global_step": 113445, "epoch": 2701} {"train_loss": -6.545280933380127, "global_step": 113446, "epoch": 2701} {"train_loss": -6.543941497802734, "global_step": 113447, "epoch": 2701} {"train_loss": -6.46034574508667, "global_step": 113448, "epoch": 2701} {"train_loss": -6.593053340911865, "global_step": 113449, "epoch": 2701} {"train_loss": -6.658655166625977, "global_step": 113450, "epoch": 2701} {"train_loss": -6.604583740234375, "global_step": 113451, "epoch": 2701} {"train_loss": -6.532126426696777, "global_step": 113452, "epoch": 2701} {"train_loss": -6.497628211975098, "global_step": 113453, "epoch": 2701} {"train_loss": -6.502933025360107, "global_step": 113454, "epoch": 2701} {"train_loss": -6.619507789611816, "global_step": 113455, "epoch": 2701} {"train_loss": -6.489007949829102, "global_step": 113456, "epoch": 2701} {"train_loss": -6.555071830749512, "global_step": 113457, "epoch": 2701} {"train_loss": -6.492883682250977, "global_step": 113458, "epoch": 2701} {"train_loss": -6.4902663230896, "global_step": 113459, "epoch": 2701} {"train_loss": -6.554054260253906, "global_step": 113460, "epoch": 2701} {"train_loss": -6.490583419799805, "global_step": 113461, "epoch": 2701} {"train_loss": -6.390198707580566, "global_step": 113462, "epoch": 2701} {"train_loss": -6.384222030639648, "global_step": 113463, "epoch": 2701} {"train_loss": -6.525254249572754, "global_step": 113464, "epoch": 2701} {"train_loss": -6.459634780883789, "global_step": 113465, "epoch": 2701} {"train_loss": -6.329467296600342, "global_step": 113466, "epoch": 2701} {"train_loss": -6.495711326599121, "global_step": 113467, "epoch": 2701} {"train_loss": -6.427364349365234, "global_step": 113468, "epoch": 2701} {"train_loss": -6.4184160232543945, "global_step": 113469, "epoch": 2701} {"train_loss": -6.495031356811523, "global_step": 113470, "epoch": 2701} {"train_loss": -6.468885898590088, "global_step": 113471, "epoch": 2701} {"train_loss": -6.53597354888916, "global_step": 113472, "epoch": 2701} {"train_loss": -6.530302047729492, "global_step": 113473, "epoch": 2701} {"train_loss": -6.558009147644043, "global_step": 113474, "epoch": 2701} {"train_loss": -6.415005683898926, "global_step": 113475, "epoch": 2701} {"train_loss": -6.459499359130859, "global_step": 113476, "epoch": 2701} {"train_loss": -6.500199317932129, "global_step": 113477, "epoch": 2701} {"train_loss": -6.485225677490234, "global_step": 113478, "epoch": 2701} {"train_loss": -6.549355983734131, "global_step": 113479, "epoch": 2701} {"train_loss": -6.478117942810059, "global_step": 113480, "epoch": 2701} {"train_loss": -6.481372833251953, "global_step": 113481, "epoch": 2701} {"train_loss": -6.559291362762451, "global_step": 113482, "epoch": 2701} {"train_loss": -6.506572450910296, "global_step": 113483, "epoch": 2701, "val_loss": 65045.37109375} {"train_loss": -6.570860862731934, "global_step": 113484, "epoch": 2702} {"train_loss": -6.5880537033081055, "global_step": 113485, "epoch": 2702} {"train_loss": -6.375985145568848, "global_step": 113486, "epoch": 2702} {"train_loss": -6.445107460021973, "global_step": 113487, "epoch": 2702} {"train_loss": -6.493666648864746, "global_step": 113488, "epoch": 2702} {"train_loss": -6.531381607055664, "global_step": 113489, "epoch": 2702} {"train_loss": -6.484574317932129, "global_step": 113490, "epoch": 2702} {"train_loss": -6.451700687408447, "global_step": 113491, "epoch": 2702} {"train_loss": -6.570246696472168, "global_step": 113492, "epoch": 2702} {"train_loss": -6.5884552001953125, "global_step": 113493, "epoch": 2702} {"train_loss": -6.4502387046813965, "global_step": 113494, "epoch": 2702} {"train_loss": -6.424929618835449, "global_step": 113495, "epoch": 2702} {"train_loss": -6.607256889343262, "global_step": 113496, "epoch": 2702} {"train_loss": -6.421020030975342, "global_step": 113497, "epoch": 2702} {"train_loss": -6.495003700256348, "global_step": 113498, "epoch": 2702} {"train_loss": -6.500298023223877, "global_step": 113499, "epoch": 2702} {"train_loss": -6.620941162109375, "global_step": 113500, "epoch": 2702} {"train_loss": -6.5031232833862305, "global_step": 113501, "epoch": 2702} {"train_loss": -6.464451789855957, "global_step": 113502, "epoch": 2702} {"train_loss": -6.415986061096191, "global_step": 113503, "epoch": 2702} {"train_loss": -6.559606552124023, "global_step": 113504, "epoch": 2702} {"train_loss": -6.526648044586182, "global_step": 113505, "epoch": 2702} {"train_loss": -6.437021255493164, "global_step": 113506, "epoch": 2702} {"train_loss": -6.50260066986084, "global_step": 113507, "epoch": 2702} {"train_loss": -6.43468713760376, "global_step": 113508, "epoch": 2702} {"train_loss": -6.455536842346191, "global_step": 113509, "epoch": 2702} {"train_loss": -6.43501091003418, "global_step": 113510, "epoch": 2702} {"train_loss": -6.394045829772949, "global_step": 113511, "epoch": 2702} {"train_loss": -6.425654888153076, "global_step": 113512, "epoch": 2702} {"train_loss": -6.400117874145508, "global_step": 113513, "epoch": 2702} {"train_loss": -6.4762468338012695, "global_step": 113514, "epoch": 2702} {"train_loss": -6.5146565437316895, "global_step": 113515, "epoch": 2702} {"train_loss": -6.438685417175293, "global_step": 113516, "epoch": 2702} {"train_loss": -6.613335609436035, "global_step": 113517, "epoch": 2702} {"train_loss": -6.527740478515625, "global_step": 113518, "epoch": 2702} {"train_loss": -6.532156944274902, "global_step": 113519, "epoch": 2702} {"train_loss": -6.567911624908447, "global_step": 113520, "epoch": 2702} {"train_loss": -6.532407760620117, "global_step": 113521, "epoch": 2702} {"train_loss": -6.6082000732421875, "global_step": 113522, "epoch": 2702} {"train_loss": -6.610290050506592, "global_step": 113523, "epoch": 2702} {"train_loss": -6.509035587310791, "global_step": 113524, "epoch": 2702} {"train_loss": -6.5046733901614235, "global_step": 113525, "epoch": 2702, "val_loss": 65144.8046875} {"train_loss": -6.493093967437744, "global_step": 113526, "epoch": 2703} {"train_loss": -6.518304347991943, "global_step": 113527, "epoch": 2703} {"train_loss": -6.674711227416992, "global_step": 113528, "epoch": 2703} {"train_loss": -6.437771797180176, "global_step": 113529, "epoch": 2703} {"train_loss": -6.4908294677734375, "global_step": 113530, "epoch": 2703} {"train_loss": -6.622401714324951, "global_step": 113531, "epoch": 2703} {"train_loss": -6.551468372344971, "global_step": 113532, "epoch": 2703} {"train_loss": -6.515149116516113, "global_step": 113533, "epoch": 2703} {"train_loss": -6.642152309417725, "global_step": 113534, "epoch": 2703} {"train_loss": -6.588615417480469, "global_step": 113535, "epoch": 2703} {"train_loss": -6.562314987182617, "global_step": 113536, "epoch": 2703} {"train_loss": -6.604171276092529, "global_step": 113537, "epoch": 2703} {"train_loss": -6.525489330291748, "global_step": 113538, "epoch": 2703} {"train_loss": -6.526468753814697, "global_step": 113539, "epoch": 2703} {"train_loss": -6.528191089630127, "global_step": 113540, "epoch": 2703} {"train_loss": -6.548758506774902, "global_step": 113541, "epoch": 2703} {"train_loss": -6.5433759689331055, "global_step": 113542, "epoch": 2703} {"train_loss": -6.527307510375977, "global_step": 113543, "epoch": 2703} {"train_loss": -6.534379959106445, "global_step": 113544, "epoch": 2703} {"train_loss": -6.612203598022461, "global_step": 113545, "epoch": 2703} {"train_loss": -6.515417098999023, "global_step": 113546, "epoch": 2703} {"train_loss": -6.57986307144165, "global_step": 113547, "epoch": 2703} {"train_loss": -6.517795562744141, "global_step": 113548, "epoch": 2703} {"train_loss": -6.514800548553467, "global_step": 113549, "epoch": 2703} {"train_loss": -6.525781154632568, "global_step": 113550, "epoch": 2703} {"train_loss": -6.402339935302734, "global_step": 113551, "epoch": 2703} {"train_loss": -6.483305931091309, "global_step": 113552, "epoch": 2703} {"train_loss": -6.531225204467773, "global_step": 113553, "epoch": 2703} {"train_loss": -6.461256504058838, "global_step": 113554, "epoch": 2703} {"train_loss": -6.529727458953857, "global_step": 113555, "epoch": 2703} {"train_loss": -6.586174964904785, "global_step": 113556, "epoch": 2703} {"train_loss": -6.456742286682129, "global_step": 113557, "epoch": 2703} {"train_loss": -6.551506996154785, "global_step": 113558, "epoch": 2703} {"train_loss": -6.52407169342041, "global_step": 113559, "epoch": 2703} {"train_loss": -6.50520658493042, "global_step": 113560, "epoch": 2703} {"train_loss": -6.564882755279541, "global_step": 113561, "epoch": 2703} {"train_loss": -6.495491027832031, "global_step": 113562, "epoch": 2703} {"train_loss": -6.378190040588379, "global_step": 113563, "epoch": 2703} {"train_loss": -6.583810329437256, "global_step": 113564, "epoch": 2703} {"train_loss": -6.392068386077881, "global_step": 113565, "epoch": 2703} {"train_loss": -6.469362735748291, "global_step": 113566, "epoch": 2703} {"train_loss": -6.526785555339995, "global_step": 113567, "epoch": 2703, "val_loss": 65263.37109375} {"train_loss": -6.603054523468018, "global_step": 113568, "epoch": 2704} {"train_loss": -6.495708465576172, "global_step": 113569, "epoch": 2704} {"train_loss": -6.472796440124512, "global_step": 113570, "epoch": 2704} {"train_loss": -6.447879791259766, "global_step": 113571, "epoch": 2704} {"train_loss": -6.537731170654297, "global_step": 113572, "epoch": 2704} {"train_loss": -6.449467658996582, "global_step": 113573, "epoch": 2704} {"train_loss": -6.4100494384765625, "global_step": 113574, "epoch": 2704} {"train_loss": -6.538674354553223, "global_step": 113575, "epoch": 2704} {"train_loss": -6.467316627502441, "global_step": 113576, "epoch": 2704} {"train_loss": -6.542980194091797, "global_step": 113577, "epoch": 2704} {"train_loss": -6.565121650695801, "global_step": 113578, "epoch": 2704} {"train_loss": -6.559148788452148, "global_step": 113579, "epoch": 2704} {"train_loss": -6.479567527770996, "global_step": 113580, "epoch": 2704} {"train_loss": -6.495715141296387, "global_step": 113581, "epoch": 2704} {"train_loss": -6.544726371765137, "global_step": 113582, "epoch": 2704} {"train_loss": -6.510538101196289, "global_step": 113583, "epoch": 2704} {"train_loss": -6.5460357666015625, "global_step": 113584, "epoch": 2704} {"train_loss": -6.6417555809021, "global_step": 113585, "epoch": 2704} {"train_loss": -6.606168746948242, "global_step": 113586, "epoch": 2704} {"train_loss": -6.554344654083252, "global_step": 113587, "epoch": 2704} {"train_loss": -6.503908157348633, "global_step": 113588, "epoch": 2704} {"train_loss": -6.459653854370117, "global_step": 113589, "epoch": 2704} {"train_loss": -6.595956802368164, "global_step": 113590, "epoch": 2704} {"train_loss": -6.512016296386719, "global_step": 113591, "epoch": 2704} {"train_loss": -6.487884521484375, "global_step": 113592, "epoch": 2704} {"train_loss": -6.652228355407715, "global_step": 113593, "epoch": 2704} {"train_loss": -6.5529069900512695, "global_step": 113594, "epoch": 2704} {"train_loss": -6.612588882446289, "global_step": 113595, "epoch": 2704} {"train_loss": -6.51460599899292, "global_step": 113596, "epoch": 2704} {"train_loss": -6.453874588012695, "global_step": 113597, "epoch": 2704} {"train_loss": -6.574243545532227, "global_step": 113598, "epoch": 2704} {"train_loss": -6.4404754638671875, "global_step": 113599, "epoch": 2704} {"train_loss": -6.601273536682129, "global_step": 113600, "epoch": 2704} {"train_loss": -6.615989685058594, "global_step": 113601, "epoch": 2704} {"train_loss": -6.495959758758545, "global_step": 113602, "epoch": 2704} {"train_loss": -6.550860404968262, "global_step": 113603, "epoch": 2704} {"train_loss": -6.625456809997559, "global_step": 113604, "epoch": 2704} {"train_loss": -6.444432735443115, "global_step": 113605, "epoch": 2704} {"train_loss": -6.598355293273926, "global_step": 113606, "epoch": 2704} {"train_loss": -6.5252685546875, "global_step": 113607, "epoch": 2704} {"train_loss": -6.4919657707214355, "global_step": 113608, "epoch": 2704} {"train_loss": -6.5303333940960115, "global_step": 113609, "epoch": 2704, "val_loss": 65245.34375} {"train_loss": -6.5496416091918945, "global_step": 113610, "epoch": 2705} {"train_loss": -6.404885292053223, "global_step": 113611, "epoch": 2705} {"train_loss": -6.456811428070068, "global_step": 113612, "epoch": 2705} {"train_loss": -6.495501518249512, "global_step": 113613, "epoch": 2705} {"train_loss": -6.549973487854004, "global_step": 113614, "epoch": 2705} {"train_loss": -6.442046642303467, "global_step": 113615, "epoch": 2705} {"train_loss": -6.578902244567871, "global_step": 113616, "epoch": 2705} {"train_loss": -6.394378662109375, "global_step": 113617, "epoch": 2705} {"train_loss": -6.5668439865112305, "global_step": 113618, "epoch": 2705} {"train_loss": -6.402843475341797, "global_step": 113619, "epoch": 2705} {"train_loss": -6.4891486167907715, "global_step": 113620, "epoch": 2705} {"train_loss": -6.5048370361328125, "global_step": 113621, "epoch": 2705} {"train_loss": -6.367659091949463, "global_step": 113622, "epoch": 2705} {"train_loss": -6.431646347045898, "global_step": 113623, "epoch": 2705} {"train_loss": -6.497361183166504, "global_step": 113624, "epoch": 2705} {"train_loss": -6.396322250366211, "global_step": 113625, "epoch": 2705} {"train_loss": -6.542901992797852, "global_step": 113626, "epoch": 2705} {"train_loss": -6.544560432434082, "global_step": 113627, "epoch": 2705} {"train_loss": -6.415785789489746, "global_step": 113628, "epoch": 2705} {"train_loss": -6.372274398803711, "global_step": 113629, "epoch": 2705} {"train_loss": -6.346856594085693, "global_step": 113630, "epoch": 2705} {"train_loss": -6.383367538452148, "global_step": 113631, "epoch": 2705} {"train_loss": -6.351769924163818, "global_step": 113632, "epoch": 2705} {"train_loss": -6.527009963989258, "global_step": 113633, "epoch": 2705} {"train_loss": -6.286074638366699, "global_step": 113634, "epoch": 2705} {"train_loss": -6.468344211578369, "global_step": 113635, "epoch": 2705} {"train_loss": -6.457277297973633, "global_step": 113636, "epoch": 2705} {"train_loss": -6.44062614440918, "global_step": 113637, "epoch": 2705} {"train_loss": -6.382290840148926, "global_step": 113638, "epoch": 2705} {"train_loss": -6.416280746459961, "global_step": 113639, "epoch": 2705} {"train_loss": -6.384970664978027, "global_step": 113640, "epoch": 2705} {"train_loss": -6.423853874206543, "global_step": 113641, "epoch": 2705} {"train_loss": -6.530750274658203, "global_step": 113642, "epoch": 2705} {"train_loss": -6.543857097625732, "global_step": 113643, "epoch": 2705} {"train_loss": -6.5477294921875, "global_step": 113644, "epoch": 2705} {"train_loss": -6.533041477203369, "global_step": 113645, "epoch": 2705} {"train_loss": -6.4300007820129395, "global_step": 113646, "epoch": 2705} {"train_loss": -6.556928634643555, "global_step": 113647, "epoch": 2705} {"train_loss": -6.512052059173584, "global_step": 113648, "epoch": 2705} {"train_loss": -6.585076332092285, "global_step": 113649, "epoch": 2705} {"train_loss": -6.578787803649902, "global_step": 113650, "epoch": 2705} {"train_loss": -6.466813621066866, "global_step": 113651, "epoch": 2705, "val_loss": 65116.13671875} {"train_loss": -6.517398834228516, "global_step": 113652, "epoch": 2706} {"train_loss": -6.665740013122559, "global_step": 113653, "epoch": 2706} {"train_loss": -6.412789344787598, "global_step": 113654, "epoch": 2706} {"train_loss": -6.5025458335876465, "global_step": 113655, "epoch": 2706} {"train_loss": -6.473241329193115, "global_step": 113656, "epoch": 2706} {"train_loss": -6.536656856536865, "global_step": 113657, "epoch": 2706} {"train_loss": -6.525914192199707, "global_step": 113658, "epoch": 2706} {"train_loss": -6.540692329406738, "global_step": 113659, "epoch": 2706} {"train_loss": -6.581355094909668, "global_step": 113660, "epoch": 2706} {"train_loss": -6.515198707580566, "global_step": 113661, "epoch": 2706} {"train_loss": -6.481287479400635, "global_step": 113662, "epoch": 2706} {"train_loss": -6.551177024841309, "global_step": 113663, "epoch": 2706} {"train_loss": -6.61588191986084, "global_step": 113664, "epoch": 2706} {"train_loss": -6.355421543121338, "global_step": 113665, "epoch": 2706} {"train_loss": -6.6074628829956055, "global_step": 113666, "epoch": 2706} {"train_loss": -6.582571029663086, "global_step": 113667, "epoch": 2706} {"train_loss": -6.53111457824707, "global_step": 113668, "epoch": 2706} {"train_loss": -6.462490081787109, "global_step": 113669, "epoch": 2706} {"train_loss": -6.439291000366211, "global_step": 113670, "epoch": 2706} {"train_loss": -6.563836574554443, "global_step": 113671, "epoch": 2706} {"train_loss": -6.558719635009766, "global_step": 113672, "epoch": 2706} {"train_loss": -6.600693225860596, "global_step": 113673, "epoch": 2706} {"train_loss": -6.5814337730407715, "global_step": 113674, "epoch": 2706} {"train_loss": -6.369324684143066, "global_step": 113675, "epoch": 2706} {"train_loss": -6.515300750732422, "global_step": 113676, "epoch": 2706} {"train_loss": -6.390770435333252, "global_step": 113677, "epoch": 2706} {"train_loss": -6.554555892944336, "global_step": 113678, "epoch": 2706} {"train_loss": -6.56734037399292, "global_step": 113679, "epoch": 2706} {"train_loss": -6.390664100646973, "global_step": 113680, "epoch": 2706} {"train_loss": -6.631753444671631, "global_step": 113681, "epoch": 2706} {"train_loss": -6.466767311096191, "global_step": 113682, "epoch": 2706} {"train_loss": -6.58054256439209, "global_step": 113683, "epoch": 2706} {"train_loss": -6.35457181930542, "global_step": 113684, "epoch": 2706} {"train_loss": -6.539673805236816, "global_step": 113685, "epoch": 2706} {"train_loss": -6.515546798706055, "global_step": 113686, "epoch": 2706} {"train_loss": -6.406063556671143, "global_step": 113687, "epoch": 2706} {"train_loss": -6.467883110046387, "global_step": 113688, "epoch": 2706} {"train_loss": -6.420200824737549, "global_step": 113689, "epoch": 2706} {"train_loss": -6.436495304107666, "global_step": 113690, "epoch": 2706} {"train_loss": -6.520388126373291, "global_step": 113691, "epoch": 2706} {"train_loss": -6.462103843688965, "global_step": 113692, "epoch": 2706} {"train_loss": -6.507097005844116, "global_step": 113693, "epoch": 2706, "val_loss": 65286.5859375} {"train_loss": -6.39212703704834, "global_step": 113694, "epoch": 2707} {"train_loss": -6.591175079345703, "global_step": 113695, "epoch": 2707} {"train_loss": -6.5970458984375, "global_step": 113696, "epoch": 2707} {"train_loss": -6.534228324890137, "global_step": 113697, "epoch": 2707} {"train_loss": -6.477026462554932, "global_step": 113698, "epoch": 2707} {"train_loss": -6.503080368041992, "global_step": 113699, "epoch": 2707} {"train_loss": -6.477228164672852, "global_step": 113700, "epoch": 2707} {"train_loss": -6.599652290344238, "global_step": 113701, "epoch": 2707} {"train_loss": -6.418015956878662, "global_step": 113702, "epoch": 2707} {"train_loss": -6.5382795333862305, "global_step": 113703, "epoch": 2707} {"train_loss": -6.504837989807129, "global_step": 113704, "epoch": 2707} {"train_loss": -6.435617446899414, "global_step": 113705, "epoch": 2707} {"train_loss": -6.576806545257568, "global_step": 113706, "epoch": 2707} {"train_loss": -6.520209312438965, "global_step": 113707, "epoch": 2707} {"train_loss": -6.526487827301025, "global_step": 113708, "epoch": 2707} {"train_loss": -6.576834678649902, "global_step": 113709, "epoch": 2707} {"train_loss": -6.474440097808838, "global_step": 113710, "epoch": 2707} {"train_loss": -6.526371002197266, "global_step": 113711, "epoch": 2707} {"train_loss": -6.529774188995361, "global_step": 113712, "epoch": 2707} {"train_loss": -6.618804931640625, "global_step": 113713, "epoch": 2707} {"train_loss": -6.524126052856445, "global_step": 113714, "epoch": 2707} {"train_loss": -6.497006416320801, "global_step": 113715, "epoch": 2707} {"train_loss": -6.635134696960449, "global_step": 113716, "epoch": 2707} {"train_loss": -6.6041646003723145, "global_step": 113717, "epoch": 2707} {"train_loss": -6.562353134155273, "global_step": 113718, "epoch": 2707} {"train_loss": -6.47310733795166, "global_step": 113719, "epoch": 2707} {"train_loss": -6.5226569175720215, "global_step": 113720, "epoch": 2707} {"train_loss": -6.418889999389648, "global_step": 113721, "epoch": 2707} {"train_loss": -6.594073295593262, "global_step": 113722, "epoch": 2707} {"train_loss": -6.553402900695801, "global_step": 113723, "epoch": 2707} {"train_loss": -6.580791473388672, "global_step": 113724, "epoch": 2707} {"train_loss": -6.522472858428955, "global_step": 113725, "epoch": 2707} {"train_loss": -6.6036272048950195, "global_step": 113726, "epoch": 2707} {"train_loss": -6.511599063873291, "global_step": 113727, "epoch": 2707} {"train_loss": -6.642153739929199, "global_step": 113728, "epoch": 2707} {"train_loss": -6.397477626800537, "global_step": 113729, "epoch": 2707} {"train_loss": -6.572486400604248, "global_step": 113730, "epoch": 2707} {"train_loss": -6.490746021270752, "global_step": 113731, "epoch": 2707} {"train_loss": -6.5901689529418945, "global_step": 113732, "epoch": 2707} {"train_loss": -6.4915056228637695, "global_step": 113733, "epoch": 2707} {"train_loss": -6.500323295593262, "global_step": 113734, "epoch": 2707} {"train_loss": -6.528867380959647, "global_step": 113735, "epoch": 2707, "val_loss": 65285.8671875} {"train_loss": -6.540408134460449, "global_step": 113736, "epoch": 2708} {"train_loss": -6.622441291809082, "global_step": 113737, "epoch": 2708} {"train_loss": -6.515108108520508, "global_step": 113738, "epoch": 2708} {"train_loss": -6.520745277404785, "global_step": 113739, "epoch": 2708} {"train_loss": -6.509160995483398, "global_step": 113740, "epoch": 2708} {"train_loss": -6.44291877746582, "global_step": 113741, "epoch": 2708} {"train_loss": -6.465060710906982, "global_step": 113742, "epoch": 2708} {"train_loss": -6.345700263977051, "global_step": 113743, "epoch": 2708} {"train_loss": -6.465044975280762, "global_step": 113744, "epoch": 2708} {"train_loss": -6.466739654541016, "global_step": 113745, "epoch": 2708} {"train_loss": -6.447898864746094, "global_step": 113746, "epoch": 2708} {"train_loss": -6.485813140869141, "global_step": 113747, "epoch": 2708} {"train_loss": -6.452901840209961, "global_step": 113748, "epoch": 2708} {"train_loss": -6.568454265594482, "global_step": 113749, "epoch": 2708} {"train_loss": -6.541498184204102, "global_step": 113750, "epoch": 2708} {"train_loss": -6.470559120178223, "global_step": 113751, "epoch": 2708} {"train_loss": -6.434542655944824, "global_step": 113752, "epoch": 2708} {"train_loss": -6.526126384735107, "global_step": 113753, "epoch": 2708} {"train_loss": -6.322112083435059, "global_step": 113754, "epoch": 2708} {"train_loss": -6.423497200012207, "global_step": 113755, "epoch": 2708} {"train_loss": -6.265552520751953, "global_step": 113756, "epoch": 2708} {"train_loss": -6.501936912536621, "global_step": 113757, "epoch": 2708} {"train_loss": -6.476093292236328, "global_step": 113758, "epoch": 2708} {"train_loss": -6.419156074523926, "global_step": 113759, "epoch": 2708} {"train_loss": -6.442235946655273, "global_step": 113760, "epoch": 2708} {"train_loss": -6.368183612823486, "global_step": 113761, "epoch": 2708} {"train_loss": -6.330803871154785, "global_step": 113762, "epoch": 2708} {"train_loss": -6.465343475341797, "global_step": 113763, "epoch": 2708} {"train_loss": -6.544003486633301, "global_step": 113764, "epoch": 2708} {"train_loss": -6.450106620788574, "global_step": 113765, "epoch": 2708} {"train_loss": -6.419460296630859, "global_step": 113766, "epoch": 2708} {"train_loss": -6.610775947570801, "global_step": 113767, "epoch": 2708} {"train_loss": -6.475805282592773, "global_step": 113768, "epoch": 2708} {"train_loss": -6.433859348297119, "global_step": 113769, "epoch": 2708} {"train_loss": -6.477308750152588, "global_step": 113770, "epoch": 2708} {"train_loss": -6.479020118713379, "global_step": 113771, "epoch": 2708} {"train_loss": -6.518650054931641, "global_step": 113772, "epoch": 2708} {"train_loss": -6.538348197937012, "global_step": 113773, "epoch": 2708} {"train_loss": -6.607939720153809, "global_step": 113774, "epoch": 2708} {"train_loss": -6.488367080688477, "global_step": 113775, "epoch": 2708} {"train_loss": -6.52531099319458, "global_step": 113776, "epoch": 2708} {"train_loss": -6.476967981883457, "global_step": 113777, "epoch": 2708, "val_loss": 65091.296875} {"train_loss": -6.592041015625, "global_step": 113778, "epoch": 2709} {"train_loss": -6.4827189445495605, "global_step": 113779, "epoch": 2709} {"train_loss": -6.456232070922852, "global_step": 113780, "epoch": 2709} {"train_loss": -6.5516533851623535, "global_step": 113781, "epoch": 2709} {"train_loss": -6.553244590759277, "global_step": 113782, "epoch": 2709} {"train_loss": -6.519314289093018, "global_step": 113783, "epoch": 2709} {"train_loss": -6.502336502075195, "global_step": 113784, "epoch": 2709} {"train_loss": -6.539821624755859, "global_step": 113785, "epoch": 2709} {"train_loss": -6.536814212799072, "global_step": 113786, "epoch": 2709} {"train_loss": -6.494663238525391, "global_step": 113787, "epoch": 2709} {"train_loss": -6.476093769073486, "global_step": 113788, "epoch": 2709} {"train_loss": -6.502128601074219, "global_step": 113789, "epoch": 2709} {"train_loss": -6.602476119995117, "global_step": 113790, "epoch": 2709} {"train_loss": -6.519010543823242, "global_step": 113791, "epoch": 2709} {"train_loss": -6.5370097160339355, "global_step": 113792, "epoch": 2709} {"train_loss": -6.481271743774414, "global_step": 113793, "epoch": 2709} {"train_loss": -6.610058784484863, "global_step": 113794, "epoch": 2709} {"train_loss": -6.589796543121338, "global_step": 113795, "epoch": 2709} {"train_loss": -6.509173393249512, "global_step": 113796, "epoch": 2709} {"train_loss": -6.581775665283203, "global_step": 113797, "epoch": 2709} {"train_loss": -6.479692459106445, "global_step": 113798, "epoch": 2709} {"train_loss": -6.509129524230957, "global_step": 113799, "epoch": 2709} {"train_loss": -6.50007963180542, "global_step": 113800, "epoch": 2709} {"train_loss": -6.440491676330566, "global_step": 113801, "epoch": 2709} {"train_loss": -6.592704772949219, "global_step": 113802, "epoch": 2709} {"train_loss": -6.553617000579834, "global_step": 113803, "epoch": 2709} {"train_loss": -6.491162300109863, "global_step": 113804, "epoch": 2709} {"train_loss": -6.617271423339844, "global_step": 113805, "epoch": 2709} {"train_loss": -6.559517860412598, "global_step": 113806, "epoch": 2709} {"train_loss": -6.438535213470459, "global_step": 113807, "epoch": 2709} {"train_loss": -6.671497344970703, "global_step": 113808, "epoch": 2709} {"train_loss": -6.483199119567871, "global_step": 113809, "epoch": 2709} {"train_loss": -6.515834808349609, "global_step": 113810, "epoch": 2709} {"train_loss": -6.532085418701172, "global_step": 113811, "epoch": 2709} {"train_loss": -6.467612266540527, "global_step": 113812, "epoch": 2709} {"train_loss": -6.481961250305176, "global_step": 113813, "epoch": 2709} {"train_loss": -6.553914546966553, "global_step": 113814, "epoch": 2709} {"train_loss": -6.5211405754089355, "global_step": 113815, "epoch": 2709} {"train_loss": -6.553433418273926, "global_step": 113816, "epoch": 2709} {"train_loss": -6.490797996520996, "global_step": 113817, "epoch": 2709} {"train_loss": -6.43182897567749, "global_step": 113818, "epoch": 2709} {"train_loss": -6.524389948163714, "global_step": 113819, "epoch": 2709, "val_loss": 65384.015625} {"train_loss": -6.516783714294434, "global_step": 113820, "epoch": 2710} {"train_loss": -6.556761264801025, "global_step": 113821, "epoch": 2710} {"train_loss": -6.546213150024414, "global_step": 113822, "epoch": 2710} {"train_loss": -6.560979843139648, "global_step": 113823, "epoch": 2710} {"train_loss": -6.573791027069092, "global_step": 113824, "epoch": 2710} {"train_loss": -6.496194839477539, "global_step": 113825, "epoch": 2710} {"train_loss": -6.575564384460449, "global_step": 113826, "epoch": 2710} {"train_loss": -6.439758777618408, "global_step": 113827, "epoch": 2710} {"train_loss": -6.468280792236328, "global_step": 113828, "epoch": 2710} {"train_loss": -6.50977897644043, "global_step": 113829, "epoch": 2710} {"train_loss": -6.523326396942139, "global_step": 113830, "epoch": 2710} {"train_loss": -6.542572975158691, "global_step": 113831, "epoch": 2710} {"train_loss": -6.584327697753906, "global_step": 113832, "epoch": 2710} {"train_loss": -6.4651079177856445, "global_step": 113833, "epoch": 2710} {"train_loss": -6.659079074859619, "global_step": 113834, "epoch": 2710} {"train_loss": -6.546062469482422, "global_step": 113835, "epoch": 2710} {"train_loss": -6.512636661529541, "global_step": 113836, "epoch": 2710} {"train_loss": -6.53157901763916, "global_step": 113837, "epoch": 2710} {"train_loss": -6.46754264831543, "global_step": 113838, "epoch": 2710} {"train_loss": -6.482572555541992, "global_step": 113839, "epoch": 2710} {"train_loss": -6.435723304748535, "global_step": 113840, "epoch": 2710} {"train_loss": -6.504284858703613, "global_step": 113841, "epoch": 2710} {"train_loss": -6.535816669464111, "global_step": 113842, "epoch": 2710} {"train_loss": -6.352614879608154, "global_step": 113843, "epoch": 2710} {"train_loss": -6.401987552642822, "global_step": 113844, "epoch": 2710} {"train_loss": -6.515590190887451, "global_step": 113845, "epoch": 2710} {"train_loss": -6.352344036102295, "global_step": 113846, "epoch": 2710} {"train_loss": -6.414068698883057, "global_step": 113847, "epoch": 2710} {"train_loss": -6.537371635437012, "global_step": 113848, "epoch": 2710} {"train_loss": -6.491726875305176, "global_step": 113849, "epoch": 2710} {"train_loss": -6.587904930114746, "global_step": 113850, "epoch": 2710} {"train_loss": -6.490455627441406, "global_step": 113851, "epoch": 2710} {"train_loss": -6.402943134307861, "global_step": 113852, "epoch": 2710} {"train_loss": -6.565458297729492, "global_step": 113853, "epoch": 2710} {"train_loss": -6.382536888122559, "global_step": 113854, "epoch": 2710} {"train_loss": -6.450638294219971, "global_step": 113855, "epoch": 2710} {"train_loss": -6.534768104553223, "global_step": 113856, "epoch": 2710} {"train_loss": -6.535826683044434, "global_step": 113857, "epoch": 2710} {"train_loss": -6.3987717628479, "global_step": 113858, "epoch": 2710} {"train_loss": -6.602447509765625, "global_step": 113859, "epoch": 2710} {"train_loss": -6.37196159362793, "global_step": 113860, "epoch": 2710} {"train_loss": -6.498709701356434, "global_step": 113861, "epoch": 2710, "val_loss": 65167.390625} {"train_loss": -6.553780555725098, "global_step": 113862, "epoch": 2711} {"train_loss": -6.393155097961426, "global_step": 113863, "epoch": 2711} {"train_loss": -6.541375637054443, "global_step": 113864, "epoch": 2711} {"train_loss": -6.534924507141113, "global_step": 113865, "epoch": 2711} {"train_loss": -6.506951332092285, "global_step": 113866, "epoch": 2711} {"train_loss": -6.529904842376709, "global_step": 113867, "epoch": 2711} {"train_loss": -6.4212846755981445, "global_step": 113868, "epoch": 2711} {"train_loss": -6.478509902954102, "global_step": 113869, "epoch": 2711} {"train_loss": -6.580728530883789, "global_step": 113870, "epoch": 2711} {"train_loss": -6.4849348068237305, "global_step": 113871, "epoch": 2711} {"train_loss": -6.583556175231934, "global_step": 113872, "epoch": 2711} {"train_loss": -6.524748802185059, "global_step": 113873, "epoch": 2711} {"train_loss": -6.399110317230225, "global_step": 113874, "epoch": 2711} {"train_loss": -6.4822845458984375, "global_step": 113875, "epoch": 2711} {"train_loss": -6.470810890197754, "global_step": 113876, "epoch": 2711} {"train_loss": -6.534640312194824, "global_step": 113877, "epoch": 2711} {"train_loss": -6.5169572830200195, "global_step": 113878, "epoch": 2711} {"train_loss": -6.440919876098633, "global_step": 113879, "epoch": 2711} {"train_loss": -6.548309326171875, "global_step": 113880, "epoch": 2711} {"train_loss": -6.459037780761719, "global_step": 113881, "epoch": 2711} {"train_loss": -6.493059158325195, "global_step": 113882, "epoch": 2711} {"train_loss": -6.439248085021973, "global_step": 113883, "epoch": 2711} {"train_loss": -6.4516096115112305, "global_step": 113884, "epoch": 2711} {"train_loss": -6.445711135864258, "global_step": 113885, "epoch": 2711} {"train_loss": -6.504514217376709, "global_step": 113886, "epoch": 2711} {"train_loss": -6.570315361022949, "global_step": 113887, "epoch": 2711} {"train_loss": -6.550514221191406, "global_step": 113888, "epoch": 2711} {"train_loss": -6.4195404052734375, "global_step": 113889, "epoch": 2711} {"train_loss": -6.569729328155518, "global_step": 113890, "epoch": 2711} {"train_loss": -6.558627128601074, "global_step": 113891, "epoch": 2711} {"train_loss": -6.489855766296387, "global_step": 113892, "epoch": 2711} {"train_loss": -6.640528678894043, "global_step": 113893, "epoch": 2711} {"train_loss": -6.638162612915039, "global_step": 113894, "epoch": 2711} {"train_loss": -6.45985746383667, "global_step": 113895, "epoch": 2711} {"train_loss": -6.565121650695801, "global_step": 113896, "epoch": 2711} {"train_loss": -6.420539379119873, "global_step": 113897, "epoch": 2711} {"train_loss": -6.533425331115723, "global_step": 113898, "epoch": 2711} {"train_loss": -6.60053825378418, "global_step": 113899, "epoch": 2711} {"train_loss": -6.567605018615723, "global_step": 113900, "epoch": 2711} {"train_loss": -6.427083492279053, "global_step": 113901, "epoch": 2711} {"train_loss": -6.439816474914551, "global_step": 113902, "epoch": 2711} {"train_loss": -6.508468230565389, "global_step": 113903, "epoch": 2711, "val_loss": 65284.28125} {"train_loss": -6.498363494873047, "global_step": 113904, "epoch": 2712} {"train_loss": -6.620591163635254, "global_step": 113905, "epoch": 2712} {"train_loss": -6.436862945556641, "global_step": 113906, "epoch": 2712} {"train_loss": -6.550246238708496, "global_step": 113907, "epoch": 2712} {"train_loss": -6.582097053527832, "global_step": 113908, "epoch": 2712} {"train_loss": -6.685025215148926, "global_step": 113909, "epoch": 2712} {"train_loss": -6.621948719024658, "global_step": 113910, "epoch": 2712} {"train_loss": -6.56282377243042, "global_step": 113911, "epoch": 2712} {"train_loss": -6.576398849487305, "global_step": 113912, "epoch": 2712} {"train_loss": -6.535880088806152, "global_step": 113913, "epoch": 2712} {"train_loss": -6.491811752319336, "global_step": 113914, "epoch": 2712} {"train_loss": -6.511885643005371, "global_step": 113915, "epoch": 2712} {"train_loss": -6.454672336578369, "global_step": 113916, "epoch": 2712} {"train_loss": -6.502014636993408, "global_step": 113917, "epoch": 2712} {"train_loss": -6.475231170654297, "global_step": 113918, "epoch": 2712} {"train_loss": -6.396496772766113, "global_step": 113919, "epoch": 2712} {"train_loss": -6.607176780700684, "global_step": 113920, "epoch": 2712} {"train_loss": -6.524796009063721, "global_step": 113921, "epoch": 2712} {"train_loss": -6.391219615936279, "global_step": 113922, "epoch": 2712} {"train_loss": -6.5500168800354, "global_step": 113923, "epoch": 2712} {"train_loss": -6.381078720092773, "global_step": 113924, "epoch": 2712} {"train_loss": -6.615445613861084, "global_step": 113925, "epoch": 2712} {"train_loss": -6.391422748565674, "global_step": 113926, "epoch": 2712} {"train_loss": -6.552933216094971, "global_step": 113927, "epoch": 2712} {"train_loss": -6.4706645011901855, "global_step": 113928, "epoch": 2712} {"train_loss": -6.562318801879883, "global_step": 113929, "epoch": 2712} {"train_loss": -6.56911563873291, "global_step": 113930, "epoch": 2712} {"train_loss": -6.575483322143555, "global_step": 113931, "epoch": 2712} {"train_loss": -6.514594078063965, "global_step": 113932, "epoch": 2712} {"train_loss": -6.679643154144287, "global_step": 113933, "epoch": 2712} {"train_loss": -6.557073593139648, "global_step": 113934, "epoch": 2712} {"train_loss": -6.4932966232299805, "global_step": 113935, "epoch": 2712} {"train_loss": -6.38651180267334, "global_step": 113936, "epoch": 2712} {"train_loss": -6.650622367858887, "global_step": 113937, "epoch": 2712} {"train_loss": -6.411892890930176, "global_step": 113938, "epoch": 2712} {"train_loss": -6.600076675415039, "global_step": 113939, "epoch": 2712} {"train_loss": -6.492840766906738, "global_step": 113940, "epoch": 2712} {"train_loss": -6.4910759925842285, "global_step": 113941, "epoch": 2712} {"train_loss": -6.453006267547607, "global_step": 113942, "epoch": 2712} {"train_loss": -6.56541109085083, "global_step": 113943, "epoch": 2712} {"train_loss": -6.422267913818359, "global_step": 113944, "epoch": 2712} {"train_loss": -6.51776697522118, "global_step": 113945, "epoch": 2712, "val_loss": 65182.6640625} {"train_loss": -6.4998860359191895, "global_step": 113946, "epoch": 2713} {"train_loss": -6.496761798858643, "global_step": 113947, "epoch": 2713} {"train_loss": -6.417958736419678, "global_step": 113948, "epoch": 2713} {"train_loss": -6.4832000732421875, "global_step": 113949, "epoch": 2713} {"train_loss": -6.4841203689575195, "global_step": 113950, "epoch": 2713} {"train_loss": -6.522810459136963, "global_step": 113951, "epoch": 2713} {"train_loss": -6.4051313400268555, "global_step": 113952, "epoch": 2713} {"train_loss": -6.493306636810303, "global_step": 113953, "epoch": 2713} {"train_loss": -6.507223606109619, "global_step": 113954, "epoch": 2713} {"train_loss": -6.426609039306641, "global_step": 113955, "epoch": 2713} {"train_loss": -6.362284183502197, "global_step": 113956, "epoch": 2713} {"train_loss": -6.5544023513793945, "global_step": 113957, "epoch": 2713} {"train_loss": -6.502560615539551, "global_step": 113958, "epoch": 2713} {"train_loss": -6.384159088134766, "global_step": 113959, "epoch": 2713} {"train_loss": -6.491865158081055, "global_step": 113960, "epoch": 2713} {"train_loss": -6.5772600173950195, "global_step": 113961, "epoch": 2713} {"train_loss": -6.593987941741943, "global_step": 113962, "epoch": 2713} {"train_loss": -6.39920711517334, "global_step": 113963, "epoch": 2713} {"train_loss": -6.441367149353027, "global_step": 113964, "epoch": 2713} {"train_loss": -6.3541669845581055, "global_step": 113965, "epoch": 2713} {"train_loss": -6.493599891662598, "global_step": 113966, "epoch": 2713} {"train_loss": -6.500516891479492, "global_step": 113967, "epoch": 2713} {"train_loss": -6.340022087097168, "global_step": 113968, "epoch": 2713} {"train_loss": -6.4539031982421875, "global_step": 113969, "epoch": 2713} {"train_loss": -6.286055564880371, "global_step": 113970, "epoch": 2713} {"train_loss": -6.28136682510376, "global_step": 113971, "epoch": 2713} {"train_loss": -6.503360748291016, "global_step": 113972, "epoch": 2713} {"train_loss": -6.6182732582092285, "global_step": 113973, "epoch": 2713} {"train_loss": -6.54102087020874, "global_step": 113974, "epoch": 2713} {"train_loss": -6.478033065795898, "global_step": 113975, "epoch": 2713} {"train_loss": -6.565683841705322, "global_step": 113976, "epoch": 2713} {"train_loss": -6.412249565124512, "global_step": 113977, "epoch": 2713} {"train_loss": -6.5198493003845215, "global_step": 113978, "epoch": 2713} {"train_loss": -6.519431114196777, "global_step": 113979, "epoch": 2713} {"train_loss": -6.584569454193115, "global_step": 113980, "epoch": 2713} {"train_loss": -6.555377006530762, "global_step": 113981, "epoch": 2713} {"train_loss": -6.420770168304443, "global_step": 113982, "epoch": 2713} {"train_loss": -6.524720191955566, "global_step": 113983, "epoch": 2713} {"train_loss": -6.473109245300293, "global_step": 113984, "epoch": 2713} {"train_loss": -6.558203220367432, "global_step": 113985, "epoch": 2713} {"train_loss": -6.571106910705566, "global_step": 113986, "epoch": 2713} {"train_loss": -6.478758278347197, "global_step": 113987, "epoch": 2713, "val_loss": 65113.10546875} {"train_loss": -6.55001163482666, "global_step": 113988, "epoch": 2714} {"train_loss": -6.5578227043151855, "global_step": 113989, "epoch": 2714} {"train_loss": -6.536289215087891, "global_step": 113990, "epoch": 2714} {"train_loss": -6.5875749588012695, "global_step": 113991, "epoch": 2714} {"train_loss": -6.477816104888916, "global_step": 113992, "epoch": 2714} {"train_loss": -6.629531383514404, "global_step": 113993, "epoch": 2714} {"train_loss": -6.597525596618652, "global_step": 113994, "epoch": 2714} {"train_loss": -6.540248870849609, "global_step": 113995, "epoch": 2714} {"train_loss": -6.509905815124512, "global_step": 113996, "epoch": 2714} {"train_loss": -6.5718584060668945, "global_step": 113997, "epoch": 2714} {"train_loss": -6.592622756958008, "global_step": 113998, "epoch": 2714} {"train_loss": -6.422264099121094, "global_step": 113999, "epoch": 2714} {"train_loss": -6.537564277648926, "global_step": 114000, "epoch": 2714} {"train_loss": -6.54764461517334, "global_step": 114001, "epoch": 2714} {"train_loss": -6.554759979248047, "global_step": 114002, "epoch": 2714} {"train_loss": -6.564772605895996, "global_step": 114003, "epoch": 2714} {"train_loss": -6.539497375488281, "global_step": 114004, "epoch": 2714} {"train_loss": -6.502966403961182, "global_step": 114005, "epoch": 2714} {"train_loss": -6.68349552154541, "global_step": 114006, "epoch": 2714} {"train_loss": -6.543665885925293, "global_step": 114007, "epoch": 2714} {"train_loss": -6.537977695465088, "global_step": 114008, "epoch": 2714} {"train_loss": -6.484169006347656, "global_step": 114009, "epoch": 2714} {"train_loss": -6.4754838943481445, "global_step": 114010, "epoch": 2714} {"train_loss": -6.296390533447266, "global_step": 114011, "epoch": 2714} {"train_loss": -6.586848258972168, "global_step": 114012, "epoch": 2714} {"train_loss": -6.449776649475098, "global_step": 114013, "epoch": 2714} {"train_loss": -6.524396896362305, "global_step": 114014, "epoch": 2714} {"train_loss": -6.483621597290039, "global_step": 114015, "epoch": 2714} {"train_loss": -6.515470027923584, "global_step": 114016, "epoch": 2714} {"train_loss": -6.478562831878662, "global_step": 114017, "epoch": 2714} {"train_loss": -6.487062931060791, "global_step": 114018, "epoch": 2714} {"train_loss": -6.528903007507324, "global_step": 114019, "epoch": 2714} {"train_loss": -6.458357334136963, "global_step": 114020, "epoch": 2714} {"train_loss": -6.385331153869629, "global_step": 114021, "epoch": 2714} {"train_loss": -6.400646209716797, "global_step": 114022, "epoch": 2714} {"train_loss": -6.474742889404297, "global_step": 114023, "epoch": 2714} {"train_loss": -6.487192153930664, "global_step": 114024, "epoch": 2714} {"train_loss": -6.634675979614258, "global_step": 114025, "epoch": 2714} {"train_loss": -6.5027079582214355, "global_step": 114026, "epoch": 2714} {"train_loss": -6.572771072387695, "global_step": 114027, "epoch": 2714} {"train_loss": -6.513602256774902, "global_step": 114028, "epoch": 2714} {"train_loss": -6.517920425959995, "global_step": 114029, "epoch": 2714, "val_loss": 65415.16796875} {"train_loss": -6.513966083526611, "global_step": 114030, "epoch": 2715} {"train_loss": -6.4564666748046875, "global_step": 114031, "epoch": 2715} {"train_loss": -6.443963527679443, "global_step": 114032, "epoch": 2715} {"train_loss": -6.415417671203613, "global_step": 114033, "epoch": 2715} {"train_loss": -6.604608535766602, "global_step": 114034, "epoch": 2715} {"train_loss": -6.562648773193359, "global_step": 114035, "epoch": 2715} {"train_loss": -6.580254077911377, "global_step": 114036, "epoch": 2715} {"train_loss": -6.532529830932617, "global_step": 114037, "epoch": 2715} {"train_loss": -6.507075309753418, "global_step": 114038, "epoch": 2715} {"train_loss": -6.566956520080566, "global_step": 114039, "epoch": 2715} {"train_loss": -6.579294204711914, "global_step": 114040, "epoch": 2715} {"train_loss": -6.562525749206543, "global_step": 114041, "epoch": 2715} {"train_loss": -6.633778095245361, "global_step": 114042, "epoch": 2715} {"train_loss": -6.429440021514893, "global_step": 114043, "epoch": 2715} {"train_loss": -6.40537166595459, "global_step": 114044, "epoch": 2715} {"train_loss": -6.522937297821045, "global_step": 114045, "epoch": 2715} {"train_loss": -6.604681968688965, "global_step": 114046, "epoch": 2715} {"train_loss": -6.505191802978516, "global_step": 114047, "epoch": 2715} {"train_loss": -6.650023460388184, "global_step": 114048, "epoch": 2715} {"train_loss": -6.573121070861816, "global_step": 114049, "epoch": 2715} {"train_loss": -6.530261039733887, "global_step": 114050, "epoch": 2715} {"train_loss": -6.537080764770508, "global_step": 114051, "epoch": 2715} {"train_loss": -6.479194641113281, "global_step": 114052, "epoch": 2715} {"train_loss": -6.598748207092285, "global_step": 114053, "epoch": 2715} {"train_loss": -6.5481367111206055, "global_step": 114054, "epoch": 2715} {"train_loss": -6.605212211608887, "global_step": 114055, "epoch": 2715} {"train_loss": -6.589694976806641, "global_step": 114056, "epoch": 2715} {"train_loss": -6.543422698974609, "global_step": 114057, "epoch": 2715} {"train_loss": -6.575850009918213, "global_step": 114058, "epoch": 2715} {"train_loss": -6.567046165466309, "global_step": 114059, "epoch": 2715} {"train_loss": -6.541141510009766, "global_step": 114060, "epoch": 2715} {"train_loss": -6.458796501159668, "global_step": 114061, "epoch": 2715} {"train_loss": -6.541835784912109, "global_step": 114062, "epoch": 2715} {"train_loss": -6.536855220794678, "global_step": 114063, "epoch": 2715} {"train_loss": -6.529001235961914, "global_step": 114064, "epoch": 2715} {"train_loss": -6.442483425140381, "global_step": 114065, "epoch": 2715} {"train_loss": -6.451545715332031, "global_step": 114066, "epoch": 2715} {"train_loss": -6.463698387145996, "global_step": 114067, "epoch": 2715} {"train_loss": -6.4405622482299805, "global_step": 114068, "epoch": 2715} {"train_loss": -6.519659042358398, "global_step": 114069, "epoch": 2715} {"train_loss": -6.579197406768799, "global_step": 114070, "epoch": 2715} {"train_loss": -6.5277711890992665, "global_step": 114071, "epoch": 2715, "val_loss": 65641.828125} {"train_loss": -6.369314193725586, "global_step": 114072, "epoch": 2716} {"train_loss": -6.516029357910156, "global_step": 114073, "epoch": 2716} {"train_loss": -6.556182384490967, "global_step": 114074, "epoch": 2716} {"train_loss": -6.380053520202637, "global_step": 114075, "epoch": 2716} {"train_loss": -6.4667439460754395, "global_step": 114076, "epoch": 2716} {"train_loss": -6.445225715637207, "global_step": 114077, "epoch": 2716} {"train_loss": -6.435647964477539, "global_step": 114078, "epoch": 2716} {"train_loss": -6.480269432067871, "global_step": 114079, "epoch": 2716} {"train_loss": -6.497551918029785, "global_step": 114080, "epoch": 2716} {"train_loss": -6.386192321777344, "global_step": 114081, "epoch": 2716} {"train_loss": -6.432066440582275, "global_step": 114082, "epoch": 2716} {"train_loss": -6.400539875030518, "global_step": 114083, "epoch": 2716} {"train_loss": -6.531414031982422, "global_step": 114084, "epoch": 2716} {"train_loss": -6.518387317657471, "global_step": 114085, "epoch": 2716} {"train_loss": -6.477618217468262, "global_step": 114086, "epoch": 2716} {"train_loss": -6.430981636047363, "global_step": 114087, "epoch": 2716} {"train_loss": -6.471879959106445, "global_step": 114088, "epoch": 2716} {"train_loss": -6.515627861022949, "global_step": 114089, "epoch": 2716} {"train_loss": -6.51788330078125, "global_step": 114090, "epoch": 2716} {"train_loss": -6.51869010925293, "global_step": 114091, "epoch": 2716} {"train_loss": -6.491624355316162, "global_step": 114092, "epoch": 2716} {"train_loss": -6.4072675704956055, "global_step": 114093, "epoch": 2716} {"train_loss": -6.487627983093262, "global_step": 114094, "epoch": 2716} {"train_loss": -6.48430061340332, "global_step": 114095, "epoch": 2716} {"train_loss": -6.509888648986816, "global_step": 114096, "epoch": 2716} {"train_loss": -6.530647277832031, "global_step": 114097, "epoch": 2716} {"train_loss": -6.473693370819092, "global_step": 114098, "epoch": 2716} {"train_loss": -6.536445617675781, "global_step": 114099, "epoch": 2716} {"train_loss": -6.439299583435059, "global_step": 114100, "epoch": 2716} {"train_loss": -6.527562141418457, "global_step": 114101, "epoch": 2716} {"train_loss": -6.654250621795654, "global_step": 114102, "epoch": 2716} {"train_loss": -6.611677169799805, "global_step": 114103, "epoch": 2716} {"train_loss": -6.540231704711914, "global_step": 114104, "epoch": 2716} {"train_loss": -6.583736896514893, "global_step": 114105, "epoch": 2716} {"train_loss": -6.5233259201049805, "global_step": 114106, "epoch": 2716} {"train_loss": -6.521527290344238, "global_step": 114107, "epoch": 2716} {"train_loss": -6.550802707672119, "global_step": 114108, "epoch": 2716} {"train_loss": -6.53859806060791, "global_step": 114109, "epoch": 2716} {"train_loss": -6.52805233001709, "global_step": 114110, "epoch": 2716} {"train_loss": -6.447052478790283, "global_step": 114111, "epoch": 2716} {"train_loss": -6.600938320159912, "global_step": 114112, "epoch": 2716} {"train_loss": -6.49544570559547, "global_step": 114113, "epoch": 2716, "val_loss": 65351.2421875} {"train_loss": -6.582749366760254, "global_step": 114114, "epoch": 2717} {"train_loss": -6.397160530090332, "global_step": 114115, "epoch": 2717} {"train_loss": -6.504426956176758, "global_step": 114116, "epoch": 2717} {"train_loss": -6.669162750244141, "global_step": 114117, "epoch": 2717} {"train_loss": -6.4327778816223145, "global_step": 114118, "epoch": 2717} {"train_loss": -6.626890182495117, "global_step": 114119, "epoch": 2717} {"train_loss": -6.441962242126465, "global_step": 114120, "epoch": 2717} {"train_loss": -6.492986679077148, "global_step": 114121, "epoch": 2717} {"train_loss": -6.506708145141602, "global_step": 114122, "epoch": 2717} {"train_loss": -6.588759899139404, "global_step": 114123, "epoch": 2717} {"train_loss": -6.480789661407471, "global_step": 114124, "epoch": 2717} {"train_loss": -6.590104103088379, "global_step": 114125, "epoch": 2717} {"train_loss": -6.602525234222412, "global_step": 114126, "epoch": 2717} {"train_loss": -6.537142753601074, "global_step": 114127, "epoch": 2717} {"train_loss": -6.590991020202637, "global_step": 114128, "epoch": 2717} {"train_loss": -6.501676082611084, "global_step": 114129, "epoch": 2717} {"train_loss": -6.578193187713623, "global_step": 114130, "epoch": 2717} {"train_loss": -6.613853454589844, "global_step": 114131, "epoch": 2717} {"train_loss": -6.5395002365112305, "global_step": 114132, "epoch": 2717} {"train_loss": -6.514943599700928, "global_step": 114133, "epoch": 2717} {"train_loss": -6.670220375061035, "global_step": 114134, "epoch": 2717} {"train_loss": -6.597838401794434, "global_step": 114135, "epoch": 2717} {"train_loss": -6.544578552246094, "global_step": 114136, "epoch": 2717} {"train_loss": -6.4676618576049805, "global_step": 114137, "epoch": 2717} {"train_loss": -6.531641006469727, "global_step": 114138, "epoch": 2717} {"train_loss": -6.546316146850586, "global_step": 114139, "epoch": 2717} {"train_loss": -6.540253639221191, "global_step": 114140, "epoch": 2717} {"train_loss": -6.6148247718811035, "global_step": 114141, "epoch": 2717} {"train_loss": -6.48689603805542, "global_step": 114142, "epoch": 2717} {"train_loss": -6.44244384765625, "global_step": 114143, "epoch": 2717} {"train_loss": -6.486780643463135, "global_step": 114144, "epoch": 2717} {"train_loss": -6.553685665130615, "global_step": 114145, "epoch": 2717} {"train_loss": -6.563360691070557, "global_step": 114146, "epoch": 2717} {"train_loss": -6.563536643981934, "global_step": 114147, "epoch": 2717} {"train_loss": -6.492664813995361, "global_step": 114148, "epoch": 2717} {"train_loss": -6.518436431884766, "global_step": 114149, "epoch": 2717} {"train_loss": -6.472782135009766, "global_step": 114150, "epoch": 2717} {"train_loss": -6.530717849731445, "global_step": 114151, "epoch": 2717} {"train_loss": -6.497492790222168, "global_step": 114152, "epoch": 2717} {"train_loss": -6.635756492614746, "global_step": 114153, "epoch": 2717} {"train_loss": -6.5481343269348145, "global_step": 114154, "epoch": 2717} {"train_loss": -6.539607638404483, "global_step": 114155, "epoch": 2717, "val_loss": 65203.9375} {"train_loss": -6.461820602416992, "global_step": 114156, "epoch": 2718} {"train_loss": -6.45952033996582, "global_step": 114157, "epoch": 2718} {"train_loss": -6.5186967849731445, "global_step": 114158, "epoch": 2718} {"train_loss": -6.490679740905762, "global_step": 114159, "epoch": 2718} {"train_loss": -6.508649826049805, "global_step": 114160, "epoch": 2718} {"train_loss": -6.542572975158691, "global_step": 114161, "epoch": 2718} {"train_loss": -6.487740516662598, "global_step": 114162, "epoch": 2718} {"train_loss": -6.601265907287598, "global_step": 114163, "epoch": 2718} {"train_loss": -6.540109634399414, "global_step": 114164, "epoch": 2718} {"train_loss": -6.541263103485107, "global_step": 114165, "epoch": 2718} {"train_loss": -6.483301162719727, "global_step": 114166, "epoch": 2718} {"train_loss": -6.53873348236084, "global_step": 114167, "epoch": 2718} {"train_loss": -6.508421897888184, "global_step": 114168, "epoch": 2718} {"train_loss": -6.571679592132568, "global_step": 114169, "epoch": 2718} {"train_loss": -6.504830360412598, "global_step": 114170, "epoch": 2718} {"train_loss": -6.581821441650391, "global_step": 114171, "epoch": 2718} {"train_loss": -6.505157470703125, "global_step": 114172, "epoch": 2718} {"train_loss": -6.454134941101074, "global_step": 114173, "epoch": 2718} {"train_loss": -6.4641218185424805, "global_step": 114174, "epoch": 2718} {"train_loss": -6.604651927947998, "global_step": 114175, "epoch": 2718} {"train_loss": -6.505979061126709, "global_step": 114176, "epoch": 2718} {"train_loss": -6.534100532531738, "global_step": 114177, "epoch": 2718} {"train_loss": -6.627658843994141, "global_step": 114178, "epoch": 2718} {"train_loss": -6.483302593231201, "global_step": 114179, "epoch": 2718} {"train_loss": -6.522809982299805, "global_step": 114180, "epoch": 2718} {"train_loss": -6.560405731201172, "global_step": 114181, "epoch": 2718} {"train_loss": -6.472944259643555, "global_step": 114182, "epoch": 2718} {"train_loss": -6.437509536743164, "global_step": 114183, "epoch": 2718} {"train_loss": -6.705545425415039, "global_step": 114184, "epoch": 2718} {"train_loss": -6.548884391784668, "global_step": 114185, "epoch": 2718} {"train_loss": -6.521145820617676, "global_step": 114186, "epoch": 2718} {"train_loss": -6.517779350280762, "global_step": 114187, "epoch": 2718} {"train_loss": -6.494397163391113, "global_step": 114188, "epoch": 2718} {"train_loss": -6.51402473449707, "global_step": 114189, "epoch": 2718} {"train_loss": -6.406057357788086, "global_step": 114190, "epoch": 2718} {"train_loss": -6.474048137664795, "global_step": 114191, "epoch": 2718} {"train_loss": -6.579941272735596, "global_step": 114192, "epoch": 2718} {"train_loss": -6.459354877471924, "global_step": 114193, "epoch": 2718} {"train_loss": -6.472866058349609, "global_step": 114194, "epoch": 2718} {"train_loss": -6.4894819259643555, "global_step": 114195, "epoch": 2718} {"train_loss": -6.491685390472412, "global_step": 114196, "epoch": 2718} {"train_loss": -6.5143635386512395, "global_step": 114197, "epoch": 2718, "val_loss": 65325.75390625} {"train_loss": -6.540485858917236, "global_step": 114198, "epoch": 2719} {"train_loss": -6.441163063049316, "global_step": 114199, "epoch": 2719} {"train_loss": -6.367844581604004, "global_step": 114200, "epoch": 2719} {"train_loss": -6.380171775817871, "global_step": 114201, "epoch": 2719} {"train_loss": -6.591609954833984, "global_step": 114202, "epoch": 2719} {"train_loss": -6.591855049133301, "global_step": 114203, "epoch": 2719} {"train_loss": -6.4202561378479, "global_step": 114204, "epoch": 2719} {"train_loss": -6.419707298278809, "global_step": 114205, "epoch": 2719} {"train_loss": -6.635994911193848, "global_step": 114206, "epoch": 2719} {"train_loss": -6.49818754196167, "global_step": 114207, "epoch": 2719} {"train_loss": -6.517232894897461, "global_step": 114208, "epoch": 2719} {"train_loss": -6.665127277374268, "global_step": 114209, "epoch": 2719} {"train_loss": -6.60243034362793, "global_step": 114210, "epoch": 2719} {"train_loss": -6.464909553527832, "global_step": 114211, "epoch": 2719} {"train_loss": -6.481665134429932, "global_step": 114212, "epoch": 2719} {"train_loss": -6.585984230041504, "global_step": 114213, "epoch": 2719} {"train_loss": -6.452052593231201, "global_step": 114214, "epoch": 2719} {"train_loss": -6.511598587036133, "global_step": 114215, "epoch": 2719} {"train_loss": -6.444671630859375, "global_step": 114216, "epoch": 2719} {"train_loss": -6.387767791748047, "global_step": 114217, "epoch": 2719} {"train_loss": -6.640942573547363, "global_step": 114218, "epoch": 2719} {"train_loss": -6.525002956390381, "global_step": 114219, "epoch": 2719} {"train_loss": -6.464705944061279, "global_step": 114220, "epoch": 2719} {"train_loss": -6.46127986907959, "global_step": 114221, "epoch": 2719} {"train_loss": -6.516873359680176, "global_step": 114222, "epoch": 2719} {"train_loss": -6.501220703125, "global_step": 114223, "epoch": 2719} {"train_loss": -6.6187028884887695, "global_step": 114224, "epoch": 2719} {"train_loss": -6.603100776672363, "global_step": 114225, "epoch": 2719} {"train_loss": -6.492554187774658, "global_step": 114226, "epoch": 2719} {"train_loss": -6.478758811950684, "global_step": 114227, "epoch": 2719} {"train_loss": -6.619434356689453, "global_step": 114228, "epoch": 2719} {"train_loss": -6.468017578125, "global_step": 114229, "epoch": 2719} {"train_loss": -6.505155563354492, "global_step": 114230, "epoch": 2719} {"train_loss": -6.566291809082031, "global_step": 114231, "epoch": 2719} {"train_loss": -6.476616859436035, "global_step": 114232, "epoch": 2719} {"train_loss": -6.546557903289795, "global_step": 114233, "epoch": 2719} {"train_loss": -6.593297958374023, "global_step": 114234, "epoch": 2719} {"train_loss": -6.594961166381836, "global_step": 114235, "epoch": 2719} {"train_loss": -6.647911071777344, "global_step": 114236, "epoch": 2719} {"train_loss": -6.554382801055908, "global_step": 114237, "epoch": 2719} {"train_loss": -6.580015182495117, "global_step": 114238, "epoch": 2719} {"train_loss": -6.523673171088809, "global_step": 114239, "epoch": 2719, "val_loss": 65232.8828125} {"train_loss": -6.57485294342041, "global_step": 114240, "epoch": 2720} {"train_loss": -6.528390884399414, "global_step": 114241, "epoch": 2720} {"train_loss": -6.508319854736328, "global_step": 114242, "epoch": 2720} {"train_loss": -6.541930198669434, "global_step": 114243, "epoch": 2720} {"train_loss": -6.428272247314453, "global_step": 114244, "epoch": 2720} {"train_loss": -6.428684234619141, "global_step": 114245, "epoch": 2720} {"train_loss": -6.610771179199219, "global_step": 114246, "epoch": 2720} {"train_loss": -6.5895094871521, "global_step": 114247, "epoch": 2720} {"train_loss": -6.3898491859436035, "global_step": 114248, "epoch": 2720} {"train_loss": -6.572549819946289, "global_step": 114249, "epoch": 2720} {"train_loss": -6.478156089782715, "global_step": 114250, "epoch": 2720} {"train_loss": -6.432730674743652, "global_step": 114251, "epoch": 2720} {"train_loss": -6.58534049987793, "global_step": 114252, "epoch": 2720} {"train_loss": -6.564150333404541, "global_step": 114253, "epoch": 2720} {"train_loss": -6.602890968322754, "global_step": 114254, "epoch": 2720} {"train_loss": -6.604070663452148, "global_step": 114255, "epoch": 2720} {"train_loss": -6.52236795425415, "global_step": 114256, "epoch": 2720} {"train_loss": -6.48403263092041, "global_step": 114257, "epoch": 2720} {"train_loss": -6.483887672424316, "global_step": 114258, "epoch": 2720} {"train_loss": -6.535233497619629, "global_step": 114259, "epoch": 2720} {"train_loss": -6.519431114196777, "global_step": 114260, "epoch": 2720} {"train_loss": -6.462730407714844, "global_step": 114261, "epoch": 2720} {"train_loss": -6.485498428344727, "global_step": 114262, "epoch": 2720} {"train_loss": -6.6407928466796875, "global_step": 114263, "epoch": 2720} {"train_loss": -6.469630718231201, "global_step": 114264, "epoch": 2720} {"train_loss": -6.482627868652344, "global_step": 114265, "epoch": 2720} {"train_loss": -6.486050605773926, "global_step": 114266, "epoch": 2720} {"train_loss": -6.5059051513671875, "global_step": 114267, "epoch": 2720} {"train_loss": -6.4722089767456055, "global_step": 114268, "epoch": 2720} {"train_loss": -6.5244140625, "global_step": 114269, "epoch": 2720} {"train_loss": -6.473036289215088, "global_step": 114270, "epoch": 2720} {"train_loss": -6.501405715942383, "global_step": 114271, "epoch": 2720} {"train_loss": -6.445074558258057, "global_step": 114272, "epoch": 2720} {"train_loss": -6.559701919555664, "global_step": 114273, "epoch": 2720} {"train_loss": -6.437605857849121, "global_step": 114274, "epoch": 2720} {"train_loss": -6.634504318237305, "global_step": 114275, "epoch": 2720} {"train_loss": -6.559201240539551, "global_step": 114276, "epoch": 2720} {"train_loss": -6.537845611572266, "global_step": 114277, "epoch": 2720} {"train_loss": -6.520040988922119, "global_step": 114278, "epoch": 2720} {"train_loss": -6.532681941986084, "global_step": 114279, "epoch": 2720} {"train_loss": -6.555118560791016, "global_step": 114280, "epoch": 2720} {"train_loss": -6.520339511689686, "global_step": 114281, "epoch": 2720, "val_loss": 65288.9921875} {"train_loss": -6.615278244018555, "global_step": 114282, "epoch": 2721} {"train_loss": -6.599440097808838, "global_step": 114283, "epoch": 2721} {"train_loss": -6.5615129470825195, "global_step": 114284, "epoch": 2721} {"train_loss": -6.486824989318848, "global_step": 114285, "epoch": 2721} {"train_loss": -6.550006866455078, "global_step": 114286, "epoch": 2721} {"train_loss": -6.516667366027832, "global_step": 114287, "epoch": 2721} {"train_loss": -6.536035537719727, "global_step": 114288, "epoch": 2721} {"train_loss": -6.527438163757324, "global_step": 114289, "epoch": 2721} {"train_loss": -6.584003925323486, "global_step": 114290, "epoch": 2721} {"train_loss": -6.51589298248291, "global_step": 114291, "epoch": 2721} {"train_loss": -6.442156791687012, "global_step": 114292, "epoch": 2721} {"train_loss": -6.587684631347656, "global_step": 114293, "epoch": 2721} {"train_loss": -6.560127258300781, "global_step": 114294, "epoch": 2721} {"train_loss": -6.637678146362305, "global_step": 114295, "epoch": 2721} {"train_loss": -6.594369411468506, "global_step": 114296, "epoch": 2721} {"train_loss": -6.470464706420898, "global_step": 114297, "epoch": 2721} {"train_loss": -6.549931526184082, "global_step": 114298, "epoch": 2721} {"train_loss": -6.551339149475098, "global_step": 114299, "epoch": 2721} {"train_loss": -6.578949451446533, "global_step": 114300, "epoch": 2721} {"train_loss": -6.595754623413086, "global_step": 114301, "epoch": 2721} {"train_loss": -6.6715617179870605, "global_step": 114302, "epoch": 2721} {"train_loss": -6.640093803405762, "global_step": 114303, "epoch": 2721} {"train_loss": -6.514849662780762, "global_step": 114304, "epoch": 2721} {"train_loss": -6.570613384246826, "global_step": 114305, "epoch": 2721} {"train_loss": -6.555883884429932, "global_step": 114306, "epoch": 2721} {"train_loss": -6.501667022705078, "global_step": 114307, "epoch": 2721} {"train_loss": -6.563349723815918, "global_step": 114308, "epoch": 2721} {"train_loss": -6.530177593231201, "global_step": 114309, "epoch": 2721} {"train_loss": -6.510781764984131, "global_step": 114310, "epoch": 2721} {"train_loss": -6.466590404510498, "global_step": 114311, "epoch": 2721} {"train_loss": -6.521688938140869, "global_step": 114312, "epoch": 2721} {"train_loss": -6.598942756652832, "global_step": 114313, "epoch": 2721} {"train_loss": -6.428701400756836, "global_step": 114314, "epoch": 2721} {"train_loss": -6.579065322875977, "global_step": 114315, "epoch": 2721} {"train_loss": -6.615816593170166, "global_step": 114316, "epoch": 2721} {"train_loss": -6.49416446685791, "global_step": 114317, "epoch": 2721} {"train_loss": -6.608473777770996, "global_step": 114318, "epoch": 2721} {"train_loss": -6.599275588989258, "global_step": 114319, "epoch": 2721} {"train_loss": -6.571681022644043, "global_step": 114320, "epoch": 2721} {"train_loss": -6.501417636871338, "global_step": 114321, "epoch": 2721} {"train_loss": -6.545534133911133, "global_step": 114322, "epoch": 2721} {"train_loss": -6.552799678984142, "global_step": 114323, "epoch": 2721, "val_loss": 65270.12890625} {"train_loss": -6.613105297088623, "global_step": 114324, "epoch": 2722} {"train_loss": -6.5285468101501465, "global_step": 114325, "epoch": 2722} {"train_loss": -6.604224681854248, "global_step": 114326, "epoch": 2722} {"train_loss": -6.533602237701416, "global_step": 114327, "epoch": 2722} {"train_loss": -6.4642205238342285, "global_step": 114328, "epoch": 2722} {"train_loss": -6.598465919494629, "global_step": 114329, "epoch": 2722} {"train_loss": -6.4836015701293945, "global_step": 114330, "epoch": 2722} {"train_loss": -6.458493232727051, "global_step": 114331, "epoch": 2722} {"train_loss": -6.44965934753418, "global_step": 114332, "epoch": 2722} {"train_loss": -6.617631912231445, "global_step": 114333, "epoch": 2722} {"train_loss": -6.577822685241699, "global_step": 114334, "epoch": 2722} {"train_loss": -6.543567180633545, "global_step": 114335, "epoch": 2722} {"train_loss": -6.545754909515381, "global_step": 114336, "epoch": 2722} {"train_loss": -6.613306999206543, "global_step": 114337, "epoch": 2722} {"train_loss": -6.528559684753418, "global_step": 114338, "epoch": 2722} {"train_loss": -6.355628967285156, "global_step": 114339, "epoch": 2722} {"train_loss": -6.5294575691223145, "global_step": 114340, "epoch": 2722} {"train_loss": -6.47846794128418, "global_step": 114341, "epoch": 2722} {"train_loss": -6.412935733795166, "global_step": 114342, "epoch": 2722} {"train_loss": -6.562560081481934, "global_step": 114343, "epoch": 2722} {"train_loss": -6.539216995239258, "global_step": 114344, "epoch": 2722} {"train_loss": -6.485255718231201, "global_step": 114345, "epoch": 2722} {"train_loss": -6.530388832092285, "global_step": 114346, "epoch": 2722} {"train_loss": -6.441251754760742, "global_step": 114347, "epoch": 2722} {"train_loss": -6.559670448303223, "global_step": 114348, "epoch": 2722} {"train_loss": -6.533232688903809, "global_step": 114349, "epoch": 2722} {"train_loss": -6.4760966300964355, "global_step": 114350, "epoch": 2722} {"train_loss": -6.373022556304932, "global_step": 114351, "epoch": 2722} {"train_loss": -6.505218982696533, "global_step": 114352, "epoch": 2722} {"train_loss": -6.546271324157715, "global_step": 114353, "epoch": 2722} {"train_loss": -6.444469451904297, "global_step": 114354, "epoch": 2722} {"train_loss": -6.550006866455078, "global_step": 114355, "epoch": 2722} {"train_loss": -6.509352684020996, "global_step": 114356, "epoch": 2722} {"train_loss": -6.544015884399414, "global_step": 114357, "epoch": 2722} {"train_loss": -6.450591087341309, "global_step": 114358, "epoch": 2722} {"train_loss": -6.498292922973633, "global_step": 114359, "epoch": 2722} {"train_loss": -6.5928955078125, "global_step": 114360, "epoch": 2722} {"train_loss": -6.400209903717041, "global_step": 114361, "epoch": 2722} {"train_loss": -6.530345916748047, "global_step": 114362, "epoch": 2722} {"train_loss": -6.556589603424072, "global_step": 114363, "epoch": 2722} {"train_loss": -6.561014175415039, "global_step": 114364, "epoch": 2722} {"train_loss": -6.515951031730289, "global_step": 114365, "epoch": 2722, "val_loss": 65484.28125} {"train_loss": -6.566647529602051, "global_step": 114366, "epoch": 2723} {"train_loss": -6.471019744873047, "global_step": 114367, "epoch": 2723} {"train_loss": -6.52605676651001, "global_step": 114368, "epoch": 2723} {"train_loss": -6.563083648681641, "global_step": 114369, "epoch": 2723} {"train_loss": -6.462174892425537, "global_step": 114370, "epoch": 2723} {"train_loss": -6.4989914894104, "global_step": 114371, "epoch": 2723} {"train_loss": -6.583280563354492, "global_step": 114372, "epoch": 2723} {"train_loss": -6.551137447357178, "global_step": 114373, "epoch": 2723} {"train_loss": -6.488559722900391, "global_step": 114374, "epoch": 2723} {"train_loss": -6.533836364746094, "global_step": 114375, "epoch": 2723} {"train_loss": -6.535623550415039, "global_step": 114376, "epoch": 2723} {"train_loss": -6.491278648376465, "global_step": 114377, "epoch": 2723} {"train_loss": -6.53585958480835, "global_step": 114378, "epoch": 2723} {"train_loss": -6.579002857208252, "global_step": 114379, "epoch": 2723} {"train_loss": -6.548266410827637, "global_step": 114380, "epoch": 2723} {"train_loss": -6.52510404586792, "global_step": 114381, "epoch": 2723} {"train_loss": -6.574383735656738, "global_step": 114382, "epoch": 2723} {"train_loss": -6.529200553894043, "global_step": 114383, "epoch": 2723} {"train_loss": -6.479374885559082, "global_step": 114384, "epoch": 2723} {"train_loss": -6.522594928741455, "global_step": 114385, "epoch": 2723} {"train_loss": -6.464937210083008, "global_step": 114386, "epoch": 2723} {"train_loss": -6.4889326095581055, "global_step": 114387, "epoch": 2723} {"train_loss": -6.5478515625, "global_step": 114388, "epoch": 2723} {"train_loss": -6.535266876220703, "global_step": 114389, "epoch": 2723} {"train_loss": -6.511478424072266, "global_step": 114390, "epoch": 2723} {"train_loss": -6.572900295257568, "global_step": 114391, "epoch": 2723} {"train_loss": -6.578299522399902, "global_step": 114392, "epoch": 2723} {"train_loss": -6.458522796630859, "global_step": 114393, "epoch": 2723} {"train_loss": -6.457546710968018, "global_step": 114394, "epoch": 2723} {"train_loss": -6.50473690032959, "global_step": 114395, "epoch": 2723} {"train_loss": -6.491048336029053, "global_step": 114396, "epoch": 2723} {"train_loss": -6.553389072418213, "global_step": 114397, "epoch": 2723} {"train_loss": -6.465276718139648, "global_step": 114398, "epoch": 2723} {"train_loss": -6.521162986755371, "global_step": 114399, "epoch": 2723} {"train_loss": -6.484119415283203, "global_step": 114400, "epoch": 2723} {"train_loss": -6.4265899658203125, "global_step": 114401, "epoch": 2723} {"train_loss": -6.5448126792907715, "global_step": 114402, "epoch": 2723} {"train_loss": -6.546348571777344, "global_step": 114403, "epoch": 2723} {"train_loss": -6.502571105957031, "global_step": 114404, "epoch": 2723} {"train_loss": -6.541011810302734, "global_step": 114405, "epoch": 2723} {"train_loss": -6.523460388183594, "global_step": 114406, "epoch": 2723} {"train_loss": -6.5200514793396, "global_step": 114407, "epoch": 2723, "val_loss": 65458.86328125} {"train_loss": -6.490231037139893, "global_step": 114408, "epoch": 2724} {"train_loss": -6.64449405670166, "global_step": 114409, "epoch": 2724} {"train_loss": -6.46873664855957, "global_step": 114410, "epoch": 2724} {"train_loss": -6.394407749176025, "global_step": 114411, "epoch": 2724} {"train_loss": -6.581559181213379, "global_step": 114412, "epoch": 2724} {"train_loss": -6.417843341827393, "global_step": 114413, "epoch": 2724} {"train_loss": -6.399263381958008, "global_step": 114414, "epoch": 2724} {"train_loss": -6.476004600524902, "global_step": 114415, "epoch": 2724} {"train_loss": -6.368012428283691, "global_step": 114416, "epoch": 2724} {"train_loss": -6.271105766296387, "global_step": 114417, "epoch": 2724} {"train_loss": -6.482325553894043, "global_step": 114418, "epoch": 2724} {"train_loss": -6.392911434173584, "global_step": 114419, "epoch": 2724} {"train_loss": -6.533293724060059, "global_step": 114420, "epoch": 2724} {"train_loss": -6.433742523193359, "global_step": 114421, "epoch": 2724} {"train_loss": -6.489982604980469, "global_step": 114422, "epoch": 2724} {"train_loss": -6.4799089431762695, "global_step": 114423, "epoch": 2724} {"train_loss": -6.319494247436523, "global_step": 114424, "epoch": 2724} {"train_loss": -6.530778884887695, "global_step": 114425, "epoch": 2724} {"train_loss": -6.380727767944336, "global_step": 114426, "epoch": 2724} {"train_loss": -6.484775066375732, "global_step": 114427, "epoch": 2724} {"train_loss": -6.507271766662598, "global_step": 114428, "epoch": 2724} {"train_loss": -6.501303195953369, "global_step": 114429, "epoch": 2724} {"train_loss": -6.528666973114014, "global_step": 114430, "epoch": 2724} {"train_loss": -6.553555965423584, "global_step": 114431, "epoch": 2724} {"train_loss": -6.431249618530273, "global_step": 114432, "epoch": 2724} {"train_loss": -6.335070610046387, "global_step": 114433, "epoch": 2724} {"train_loss": -6.430970191955566, "global_step": 114434, "epoch": 2724} {"train_loss": -6.42816162109375, "global_step": 114435, "epoch": 2724} {"train_loss": -6.523041725158691, "global_step": 114436, "epoch": 2724} {"train_loss": -6.329642295837402, "global_step": 114437, "epoch": 2724} {"train_loss": -6.498911380767822, "global_step": 114438, "epoch": 2724} {"train_loss": -6.326364994049072, "global_step": 114439, "epoch": 2724} {"train_loss": -6.398807048797607, "global_step": 114440, "epoch": 2724} {"train_loss": -6.462973117828369, "global_step": 114441, "epoch": 2724} {"train_loss": -6.369275093078613, "global_step": 114442, "epoch": 2724} {"train_loss": -6.473925590515137, "global_step": 114443, "epoch": 2724} {"train_loss": -6.3327155113220215, "global_step": 114444, "epoch": 2724} {"train_loss": -6.528345108032227, "global_step": 114445, "epoch": 2724} {"train_loss": -6.450905799865723, "global_step": 114446, "epoch": 2724} {"train_loss": -6.491298675537109, "global_step": 114447, "epoch": 2724} {"train_loss": -6.551025390625, "global_step": 114448, "epoch": 2724} {"train_loss": -6.452578919274466, "global_step": 114449, "epoch": 2724, "val_loss": 65468.5} {"train_loss": -6.465789318084717, "global_step": 114450, "epoch": 2725} {"train_loss": -6.432934284210205, "global_step": 114451, "epoch": 2725} {"train_loss": -6.582843780517578, "global_step": 114452, "epoch": 2725} {"train_loss": -6.4732666015625, "global_step": 114453, "epoch": 2725} {"train_loss": -6.519304275512695, "global_step": 114454, "epoch": 2725} {"train_loss": -6.577699661254883, "global_step": 114455, "epoch": 2725} {"train_loss": -6.461315155029297, "global_step": 114456, "epoch": 2725} {"train_loss": -6.570469856262207, "global_step": 114457, "epoch": 2725} {"train_loss": -6.679019451141357, "global_step": 114458, "epoch": 2725} {"train_loss": -6.534578800201416, "global_step": 114459, "epoch": 2725} {"train_loss": -6.542603492736816, "global_step": 114460, "epoch": 2725} {"train_loss": -6.416102886199951, "global_step": 114461, "epoch": 2725} {"train_loss": -6.560905456542969, "global_step": 114462, "epoch": 2725} {"train_loss": -6.451364040374756, "global_step": 114463, "epoch": 2725} {"train_loss": -6.505191802978516, "global_step": 114464, "epoch": 2725} {"train_loss": -6.520804405212402, "global_step": 114465, "epoch": 2725} {"train_loss": -6.445613861083984, "global_step": 114466, "epoch": 2725} {"train_loss": -6.502285003662109, "global_step": 114467, "epoch": 2725} {"train_loss": -6.499467849731445, "global_step": 114468, "epoch": 2725} {"train_loss": -6.408231735229492, "global_step": 114469, "epoch": 2725} {"train_loss": -6.489631652832031, "global_step": 114470, "epoch": 2725} {"train_loss": -6.516544342041016, "global_step": 114471, "epoch": 2725} {"train_loss": -6.457901954650879, "global_step": 114472, "epoch": 2725} {"train_loss": -6.512375831604004, "global_step": 114473, "epoch": 2725} {"train_loss": -6.4640350341796875, "global_step": 114474, "epoch": 2725} {"train_loss": -6.405081748962402, "global_step": 114475, "epoch": 2725} {"train_loss": -6.563723564147949, "global_step": 114476, "epoch": 2725} {"train_loss": -6.399360656738281, "global_step": 114477, "epoch": 2725} {"train_loss": -6.517214298248291, "global_step": 114478, "epoch": 2725} {"train_loss": -6.448423385620117, "global_step": 114479, "epoch": 2725} {"train_loss": -6.332991123199463, "global_step": 114480, "epoch": 2725} {"train_loss": -6.48050594329834, "global_step": 114481, "epoch": 2725} {"train_loss": -6.519052028656006, "global_step": 114482, "epoch": 2725} {"train_loss": -6.485264301300049, "global_step": 114483, "epoch": 2725} {"train_loss": -6.574294090270996, "global_step": 114484, "epoch": 2725} {"train_loss": -6.481423377990723, "global_step": 114485, "epoch": 2725} {"train_loss": -6.535503387451172, "global_step": 114486, "epoch": 2725} {"train_loss": -6.5641045570373535, "global_step": 114487, "epoch": 2725} {"train_loss": -6.549161434173584, "global_step": 114488, "epoch": 2725} {"train_loss": -6.5739240646362305, "global_step": 114489, "epoch": 2725} {"train_loss": -6.616756916046143, "global_step": 114490, "epoch": 2725} {"train_loss": -6.502619516281855, "global_step": 114491, "epoch": 2725, "val_loss": 65436.7734375} {"train_loss": -6.57755184173584, "global_step": 114492, "epoch": 2726} {"train_loss": -6.562033176422119, "global_step": 114493, "epoch": 2726} {"train_loss": -6.586435317993164, "global_step": 114494, "epoch": 2726} {"train_loss": -6.518346309661865, "global_step": 114495, "epoch": 2726} {"train_loss": -6.608414649963379, "global_step": 114496, "epoch": 2726} {"train_loss": -6.515753269195557, "global_step": 114497, "epoch": 2726} {"train_loss": -6.620683670043945, "global_step": 114498, "epoch": 2726} {"train_loss": -6.645794868469238, "global_step": 114499, "epoch": 2726} {"train_loss": -6.567574977874756, "global_step": 114500, "epoch": 2726} {"train_loss": -6.577065467834473, "global_step": 114501, "epoch": 2726} {"train_loss": -6.478972434997559, "global_step": 114502, "epoch": 2726} {"train_loss": -6.54384708404541, "global_step": 114503, "epoch": 2726} {"train_loss": -6.556715965270996, "global_step": 114504, "epoch": 2726} {"train_loss": -6.371058464050293, "global_step": 114505, "epoch": 2726} {"train_loss": -6.461680889129639, "global_step": 114506, "epoch": 2726} {"train_loss": -6.416290283203125, "global_step": 114507, "epoch": 2726} {"train_loss": -6.529669761657715, "global_step": 114508, "epoch": 2726} {"train_loss": -6.436334609985352, "global_step": 114509, "epoch": 2726} {"train_loss": -6.6050262451171875, "global_step": 114510, "epoch": 2726} {"train_loss": -6.362084865570068, "global_step": 114511, "epoch": 2726} {"train_loss": -6.562559604644775, "global_step": 114512, "epoch": 2726} {"train_loss": -6.560250282287598, "global_step": 114513, "epoch": 2726} {"train_loss": -6.360251426696777, "global_step": 114514, "epoch": 2726} {"train_loss": -6.417807102203369, "global_step": 114515, "epoch": 2726} {"train_loss": -6.412912368774414, "global_step": 114516, "epoch": 2726} {"train_loss": -6.514665603637695, "global_step": 114517, "epoch": 2726} {"train_loss": -6.517643928527832, "global_step": 114518, "epoch": 2726} {"train_loss": -6.446195125579834, "global_step": 114519, "epoch": 2726} {"train_loss": -6.506831169128418, "global_step": 114520, "epoch": 2726} {"train_loss": -6.552556991577148, "global_step": 114521, "epoch": 2726} {"train_loss": -6.42740535736084, "global_step": 114522, "epoch": 2726} {"train_loss": -6.54983377456665, "global_step": 114523, "epoch": 2726} {"train_loss": -6.505081653594971, "global_step": 114524, "epoch": 2726} {"train_loss": -6.5019683837890625, "global_step": 114525, "epoch": 2726} {"train_loss": -6.488060474395752, "global_step": 114526, "epoch": 2726} {"train_loss": -6.549100875854492, "global_step": 114527, "epoch": 2726} {"train_loss": -6.5024590492248535, "global_step": 114528, "epoch": 2726} {"train_loss": -6.51507043838501, "global_step": 114529, "epoch": 2726} {"train_loss": -6.540721893310547, "global_step": 114530, "epoch": 2726} {"train_loss": -6.591547012329102, "global_step": 114531, "epoch": 2726} {"train_loss": -6.589921951293945, "global_step": 114532, "epoch": 2726} {"train_loss": -6.515416304270427, "global_step": 114533, "epoch": 2726, "val_loss": 65367.1953125} {"train_loss": -6.600208759307861, "global_step": 114534, "epoch": 2727} {"train_loss": -6.548595428466797, "global_step": 114535, "epoch": 2727} {"train_loss": -6.509006500244141, "global_step": 114536, "epoch": 2727} {"train_loss": -6.512703895568848, "global_step": 114537, "epoch": 2727} {"train_loss": -6.465800762176514, "global_step": 114538, "epoch": 2727} {"train_loss": -6.451575756072998, "global_step": 114539, "epoch": 2727} {"train_loss": -6.503661155700684, "global_step": 114540, "epoch": 2727} {"train_loss": -6.558152675628662, "global_step": 114541, "epoch": 2727} {"train_loss": -6.448431968688965, "global_step": 114542, "epoch": 2727} {"train_loss": -6.556271553039551, "global_step": 114543, "epoch": 2727} {"train_loss": -6.612602233886719, "global_step": 114544, "epoch": 2727} {"train_loss": -6.528286933898926, "global_step": 114545, "epoch": 2727} {"train_loss": -6.444521427154541, "global_step": 114546, "epoch": 2727} {"train_loss": -6.591313362121582, "global_step": 114547, "epoch": 2727} {"train_loss": -6.488847732543945, "global_step": 114548, "epoch": 2727} {"train_loss": -6.493865013122559, "global_step": 114549, "epoch": 2727} {"train_loss": -6.519138336181641, "global_step": 114550, "epoch": 2727} {"train_loss": -6.47520637512207, "global_step": 114551, "epoch": 2727} {"train_loss": -6.463007926940918, "global_step": 114552, "epoch": 2727} {"train_loss": -6.48476505279541, "global_step": 114553, "epoch": 2727} {"train_loss": -6.526156425476074, "global_step": 114554, "epoch": 2727} {"train_loss": -6.479698181152344, "global_step": 114555, "epoch": 2727} {"train_loss": -6.399844169616699, "global_step": 114556, "epoch": 2727} {"train_loss": -6.517858028411865, "global_step": 114557, "epoch": 2727} {"train_loss": -6.457690238952637, "global_step": 114558, "epoch": 2727} {"train_loss": -6.3848466873168945, "global_step": 114559, "epoch": 2727} {"train_loss": -6.445774078369141, "global_step": 114560, "epoch": 2727} {"train_loss": -6.396162509918213, "global_step": 114561, "epoch": 2727} {"train_loss": -6.514233589172363, "global_step": 114562, "epoch": 2727} {"train_loss": -6.407963752746582, "global_step": 114563, "epoch": 2727} {"train_loss": -6.377665042877197, "global_step": 114564, "epoch": 2727} {"train_loss": -6.530775547027588, "global_step": 114565, "epoch": 2727} {"train_loss": -6.360134124755859, "global_step": 114566, "epoch": 2727} {"train_loss": -6.432669639587402, "global_step": 114567, "epoch": 2727} {"train_loss": -6.488389015197754, "global_step": 114568, "epoch": 2727} {"train_loss": -6.42059326171875, "global_step": 114569, "epoch": 2727} {"train_loss": -6.535006523132324, "global_step": 114570, "epoch": 2727} {"train_loss": -6.401378631591797, "global_step": 114571, "epoch": 2727} {"train_loss": -6.486832141876221, "global_step": 114572, "epoch": 2727} {"train_loss": -6.460253715515137, "global_step": 114573, "epoch": 2727} {"train_loss": -6.538491249084473, "global_step": 114574, "epoch": 2727} {"train_loss": -6.477635315486363, "global_step": 114575, "epoch": 2727, "val_loss": 65214.5234375} {"train_loss": -6.464208126068115, "global_step": 114576, "epoch": 2728} {"train_loss": -6.405615329742432, "global_step": 114577, "epoch": 2728} {"train_loss": -6.557766914367676, "global_step": 114578, "epoch": 2728} {"train_loss": -6.483607769012451, "global_step": 114579, "epoch": 2728} {"train_loss": -6.520228385925293, "global_step": 114580, "epoch": 2728} {"train_loss": -6.503712177276611, "global_step": 114581, "epoch": 2728} {"train_loss": -6.50064754486084, "global_step": 114582, "epoch": 2728} {"train_loss": -6.448296070098877, "global_step": 114583, "epoch": 2728} {"train_loss": -6.523846626281738, "global_step": 114584, "epoch": 2728} {"train_loss": -6.605526924133301, "global_step": 114585, "epoch": 2728} {"train_loss": -6.4910430908203125, "global_step": 114586, "epoch": 2728} {"train_loss": -6.5335893630981445, "global_step": 114587, "epoch": 2728} {"train_loss": -6.386662483215332, "global_step": 114588, "epoch": 2728} {"train_loss": -6.592451095581055, "global_step": 114589, "epoch": 2728} {"train_loss": -6.573742389678955, "global_step": 114590, "epoch": 2728} {"train_loss": -6.567287921905518, "global_step": 114591, "epoch": 2728} {"train_loss": -6.5192461013793945, "global_step": 114592, "epoch": 2728} {"train_loss": -6.674040794372559, "global_step": 114593, "epoch": 2728} {"train_loss": -6.51918888092041, "global_step": 114594, "epoch": 2728} {"train_loss": -6.525817394256592, "global_step": 114595, "epoch": 2728} {"train_loss": -6.50071907043457, "global_step": 114596, "epoch": 2728} {"train_loss": -6.613753318786621, "global_step": 114597, "epoch": 2728} {"train_loss": -6.492805480957031, "global_step": 114598, "epoch": 2728} {"train_loss": -6.462123870849609, "global_step": 114599, "epoch": 2728} {"train_loss": -6.453200817108154, "global_step": 114600, "epoch": 2728} {"train_loss": -6.566071510314941, "global_step": 114601, "epoch": 2728} {"train_loss": -6.503201961517334, "global_step": 114602, "epoch": 2728} {"train_loss": -6.516815185546875, "global_step": 114603, "epoch": 2728} {"train_loss": -6.550051212310791, "global_step": 114604, "epoch": 2728} {"train_loss": -6.516094207763672, "global_step": 114605, "epoch": 2728} {"train_loss": -6.4556169509887695, "global_step": 114606, "epoch": 2728} {"train_loss": -6.541049003601074, "global_step": 114607, "epoch": 2728} {"train_loss": -6.596636772155762, "global_step": 114608, "epoch": 2728} {"train_loss": -6.528465270996094, "global_step": 114609, "epoch": 2728} {"train_loss": -6.477079391479492, "global_step": 114610, "epoch": 2728} {"train_loss": -6.552680015563965, "global_step": 114611, "epoch": 2728} {"train_loss": -6.45781946182251, "global_step": 114612, "epoch": 2728} {"train_loss": -6.582777500152588, "global_step": 114613, "epoch": 2728} {"train_loss": -6.614144802093506, "global_step": 114614, "epoch": 2728} {"train_loss": -6.581602573394775, "global_step": 114615, "epoch": 2728} {"train_loss": -6.520404815673828, "global_step": 114616, "epoch": 2728} {"train_loss": -6.524516684668405, "global_step": 114617, "epoch": 2728, "val_loss": 65299.2265625} {"train_loss": -6.521519660949707, "global_step": 114618, "epoch": 2729} {"train_loss": -6.722830772399902, "global_step": 114619, "epoch": 2729} {"train_loss": -6.472534656524658, "global_step": 114620, "epoch": 2729} {"train_loss": -6.450156211853027, "global_step": 114621, "epoch": 2729} {"train_loss": -6.649064064025879, "global_step": 114622, "epoch": 2729} {"train_loss": -6.6434197425842285, "global_step": 114623, "epoch": 2729} {"train_loss": -6.556039810180664, "global_step": 114624, "epoch": 2729} {"train_loss": -6.571106910705566, "global_step": 114625, "epoch": 2729} {"train_loss": -6.604899883270264, "global_step": 114626, "epoch": 2729} {"train_loss": -6.523771286010742, "global_step": 114627, "epoch": 2729} {"train_loss": -6.5477190017700195, "global_step": 114628, "epoch": 2729} {"train_loss": -6.520862579345703, "global_step": 114629, "epoch": 2729} {"train_loss": -6.490796089172363, "global_step": 114630, "epoch": 2729} {"train_loss": -6.538224220275879, "global_step": 114631, "epoch": 2729} {"train_loss": -6.498512268066406, "global_step": 114632, "epoch": 2729} {"train_loss": -6.603493690490723, "global_step": 114633, "epoch": 2729} {"train_loss": -6.560057640075684, "global_step": 114634, "epoch": 2729} {"train_loss": -6.503066062927246, "global_step": 114635, "epoch": 2729} {"train_loss": -6.5423173904418945, "global_step": 114636, "epoch": 2729} {"train_loss": -6.491603851318359, "global_step": 114637, "epoch": 2729} {"train_loss": -6.530467510223389, "global_step": 114638, "epoch": 2729} {"train_loss": -6.549656867980957, "global_step": 114639, "epoch": 2729} {"train_loss": -6.621272087097168, "global_step": 114640, "epoch": 2729} {"train_loss": -6.526218891143799, "global_step": 114641, "epoch": 2729} {"train_loss": -6.461905479431152, "global_step": 114642, "epoch": 2729} {"train_loss": -6.679105281829834, "global_step": 114643, "epoch": 2729} {"train_loss": -6.63214111328125, "global_step": 114644, "epoch": 2729} {"train_loss": -6.512532711029053, "global_step": 114645, "epoch": 2729} {"train_loss": -6.530643939971924, "global_step": 114646, "epoch": 2729} {"train_loss": -6.320878982543945, "global_step": 114647, "epoch": 2729} {"train_loss": -6.5428972244262695, "global_step": 114648, "epoch": 2729} {"train_loss": -6.532034873962402, "global_step": 114649, "epoch": 2729} {"train_loss": -6.617441177368164, "global_step": 114650, "epoch": 2729} {"train_loss": -6.541922569274902, "global_step": 114651, "epoch": 2729} {"train_loss": -6.554989814758301, "global_step": 114652, "epoch": 2729} {"train_loss": -6.544300556182861, "global_step": 114653, "epoch": 2729} {"train_loss": -6.4863386154174805, "global_step": 114654, "epoch": 2729} {"train_loss": -6.564303398132324, "global_step": 114655, "epoch": 2729} {"train_loss": -6.573002338409424, "global_step": 114656, "epoch": 2729} {"train_loss": -6.57908821105957, "global_step": 114657, "epoch": 2729} {"train_loss": -6.550168037414551, "global_step": 114658, "epoch": 2729} {"train_loss": -6.548194556009202, "global_step": 114659, "epoch": 2729, "val_loss": 65131.296875} {"train_loss": -6.559007167816162, "global_step": 114660, "epoch": 2730} {"train_loss": -6.558067321777344, "global_step": 114661, "epoch": 2730} {"train_loss": -6.521661758422852, "global_step": 114662, "epoch": 2730} {"train_loss": -6.604153633117676, "global_step": 114663, "epoch": 2730} {"train_loss": -6.452476501464844, "global_step": 114664, "epoch": 2730} {"train_loss": -6.619163513183594, "global_step": 114665, "epoch": 2730} {"train_loss": -6.452425956726074, "global_step": 114666, "epoch": 2730} {"train_loss": -6.4749436378479, "global_step": 114667, "epoch": 2730} {"train_loss": -6.586798191070557, "global_step": 114668, "epoch": 2730} {"train_loss": -6.36293888092041, "global_step": 114669, "epoch": 2730} {"train_loss": -6.473923683166504, "global_step": 114670, "epoch": 2730} {"train_loss": -6.435683250427246, "global_step": 114671, "epoch": 2730} {"train_loss": -6.471127510070801, "global_step": 114672, "epoch": 2730} {"train_loss": -6.48349666595459, "global_step": 114673, "epoch": 2730} {"train_loss": -6.510844707489014, "global_step": 114674, "epoch": 2730} {"train_loss": -6.639822959899902, "global_step": 114675, "epoch": 2730} {"train_loss": -6.692636966705322, "global_step": 114676, "epoch": 2730} {"train_loss": -6.488078594207764, "global_step": 114677, "epoch": 2730} {"train_loss": -6.704463958740234, "global_step": 114678, "epoch": 2730} {"train_loss": -6.5992889404296875, "global_step": 114679, "epoch": 2730} {"train_loss": -6.684200286865234, "global_step": 114680, "epoch": 2730} {"train_loss": -6.528285026550293, "global_step": 114681, "epoch": 2730} {"train_loss": -6.561331748962402, "global_step": 114682, "epoch": 2730} {"train_loss": -6.416337013244629, "global_step": 114683, "epoch": 2730} {"train_loss": -6.436461925506592, "global_step": 114684, "epoch": 2730} {"train_loss": -6.545727252960205, "global_step": 114685, "epoch": 2730} {"train_loss": -6.569778919219971, "global_step": 114686, "epoch": 2730} {"train_loss": -6.6032185554504395, "global_step": 114687, "epoch": 2730} {"train_loss": -6.633990287780762, "global_step": 114688, "epoch": 2730} {"train_loss": -6.686229705810547, "global_step": 114689, "epoch": 2730} {"train_loss": -6.555517196655273, "global_step": 114690, "epoch": 2730} {"train_loss": -6.580196380615234, "global_step": 114691, "epoch": 2730} {"train_loss": -6.538402557373047, "global_step": 114692, "epoch": 2730} {"train_loss": -6.593699932098389, "global_step": 114693, "epoch": 2730} {"train_loss": -6.480915069580078, "global_step": 114694, "epoch": 2730} {"train_loss": -6.517251014709473, "global_step": 114695, "epoch": 2730} {"train_loss": -6.55275821685791, "global_step": 114696, "epoch": 2730} {"train_loss": -6.510558128356934, "global_step": 114697, "epoch": 2730} {"train_loss": -6.506343841552734, "global_step": 114698, "epoch": 2730} {"train_loss": -6.504262924194336, "global_step": 114699, "epoch": 2730} {"train_loss": -6.5675554275512695, "global_step": 114700, "epoch": 2730} {"train_loss": -6.543369122913906, "global_step": 114701, "epoch": 2730, "val_loss": 65136.8828125} {"train_loss": -6.569663047790527, "global_step": 114702, "epoch": 2731} {"train_loss": -6.527952194213867, "global_step": 114703, "epoch": 2731} {"train_loss": -6.542161464691162, "global_step": 114704, "epoch": 2731} {"train_loss": -6.441493034362793, "global_step": 114705, "epoch": 2731} {"train_loss": -6.478395462036133, "global_step": 114706, "epoch": 2731} {"train_loss": -6.576138973236084, "global_step": 114707, "epoch": 2731} {"train_loss": -6.413912296295166, "global_step": 114708, "epoch": 2731} {"train_loss": -6.503658294677734, "global_step": 114709, "epoch": 2731} {"train_loss": -6.581052303314209, "global_step": 114710, "epoch": 2731} {"train_loss": -6.468439102172852, "global_step": 114711, "epoch": 2731} {"train_loss": -6.432821273803711, "global_step": 114712, "epoch": 2731} {"train_loss": -6.451672554016113, "global_step": 114713, "epoch": 2731} {"train_loss": -6.59307861328125, "global_step": 114714, "epoch": 2731} {"train_loss": -6.5638837814331055, "global_step": 114715, "epoch": 2731} {"train_loss": -6.598834991455078, "global_step": 114716, "epoch": 2731} {"train_loss": -6.708759307861328, "global_step": 114717, "epoch": 2731} {"train_loss": -6.701959133148193, "global_step": 114718, "epoch": 2731} {"train_loss": -6.664662837982178, "global_step": 114719, "epoch": 2731} {"train_loss": -6.592876434326172, "global_step": 114720, "epoch": 2731} {"train_loss": -6.525307655334473, "global_step": 114721, "epoch": 2731} {"train_loss": -6.474801063537598, "global_step": 114722, "epoch": 2731} {"train_loss": -6.605494976043701, "global_step": 114723, "epoch": 2731} {"train_loss": -6.659815788269043, "global_step": 114724, "epoch": 2731} {"train_loss": -6.602104663848877, "global_step": 114725, "epoch": 2731} {"train_loss": -6.4870219230651855, "global_step": 114726, "epoch": 2731} {"train_loss": -6.666655540466309, "global_step": 114727, "epoch": 2731} {"train_loss": -6.512996673583984, "global_step": 114728, "epoch": 2731} {"train_loss": -6.6248626708984375, "global_step": 114729, "epoch": 2731} {"train_loss": -6.554135322570801, "global_step": 114730, "epoch": 2731} {"train_loss": -6.572754859924316, "global_step": 114731, "epoch": 2731} {"train_loss": -6.344525337219238, "global_step": 114732, "epoch": 2731} {"train_loss": -6.468240737915039, "global_step": 114733, "epoch": 2731} {"train_loss": -6.461032867431641, "global_step": 114734, "epoch": 2731} {"train_loss": -6.4409308433532715, "global_step": 114735, "epoch": 2731} {"train_loss": -6.362898826599121, "global_step": 114736, "epoch": 2731} {"train_loss": -6.537633895874023, "global_step": 114737, "epoch": 2731} {"train_loss": -6.552911758422852, "global_step": 114738, "epoch": 2731} {"train_loss": -6.521780014038086, "global_step": 114739, "epoch": 2731} {"train_loss": -6.520803928375244, "global_step": 114740, "epoch": 2731} {"train_loss": -6.425838470458984, "global_step": 114741, "epoch": 2731} {"train_loss": -6.421355247497559, "global_step": 114742, "epoch": 2731} {"train_loss": -6.533166317712693, "global_step": 114743, "epoch": 2731, "val_loss": 65042.34765625} {"train_loss": -6.495206356048584, "global_step": 114744, "epoch": 2732} {"train_loss": -6.545967102050781, "global_step": 114745, "epoch": 2732} {"train_loss": -6.4298996925354, "global_step": 114746, "epoch": 2732} {"train_loss": -6.461152076721191, "global_step": 114747, "epoch": 2732} {"train_loss": -6.346399784088135, "global_step": 114748, "epoch": 2732} {"train_loss": -6.46278190612793, "global_step": 114749, "epoch": 2732} {"train_loss": -6.439079284667969, "global_step": 114750, "epoch": 2732} {"train_loss": -6.321514129638672, "global_step": 114751, "epoch": 2732} {"train_loss": -6.578150749206543, "global_step": 114752, "epoch": 2732} {"train_loss": -6.378548622131348, "global_step": 114753, "epoch": 2732} {"train_loss": -6.407834529876709, "global_step": 114754, "epoch": 2732} {"train_loss": -6.369449138641357, "global_step": 114755, "epoch": 2732} {"train_loss": -6.4077959060668945, "global_step": 114756, "epoch": 2732} {"train_loss": -6.399624347686768, "global_step": 114757, "epoch": 2732} {"train_loss": -6.339137077331543, "global_step": 114758, "epoch": 2732} {"train_loss": -6.400797367095947, "global_step": 114759, "epoch": 2732} {"train_loss": -6.2974138259887695, "global_step": 114760, "epoch": 2732} {"train_loss": -6.47678279876709, "global_step": 114761, "epoch": 2732} {"train_loss": -6.261880397796631, "global_step": 114762, "epoch": 2732} {"train_loss": -6.498232841491699, "global_step": 114763, "epoch": 2732} {"train_loss": -6.312258720397949, "global_step": 114764, "epoch": 2732} {"train_loss": -6.419676780700684, "global_step": 114765, "epoch": 2732} {"train_loss": -6.469042778015137, "global_step": 114766, "epoch": 2732} {"train_loss": -6.430089473724365, "global_step": 114767, "epoch": 2732} {"train_loss": -6.498168468475342, "global_step": 114768, "epoch": 2732} {"train_loss": -6.452042579650879, "global_step": 114769, "epoch": 2732} {"train_loss": -6.518091201782227, "global_step": 114770, "epoch": 2732} {"train_loss": -6.554555892944336, "global_step": 114771, "epoch": 2732} {"train_loss": -6.4079084396362305, "global_step": 114772, "epoch": 2732} {"train_loss": -6.463857650756836, "global_step": 114773, "epoch": 2732} {"train_loss": -6.514379501342773, "global_step": 114774, "epoch": 2732} {"train_loss": -6.38063907623291, "global_step": 114775, "epoch": 2732} {"train_loss": -6.454856872558594, "global_step": 114776, "epoch": 2732} {"train_loss": -6.480161190032959, "global_step": 114777, "epoch": 2732} {"train_loss": -6.4379472732543945, "global_step": 114778, "epoch": 2732} {"train_loss": -6.535701751708984, "global_step": 114779, "epoch": 2732} {"train_loss": -6.569403648376465, "global_step": 114780, "epoch": 2732} {"train_loss": -6.624819278717041, "global_step": 114781, "epoch": 2732} {"train_loss": -6.4796013832092285, "global_step": 114782, "epoch": 2732} {"train_loss": -6.395175933837891, "global_step": 114783, "epoch": 2732} {"train_loss": -6.4980363845825195, "global_step": 114784, "epoch": 2732} {"train_loss": -6.4458930151803155, "global_step": 114785, "epoch": 2732, "val_loss": 65145.3359375} {"train_loss": -6.5870256423950195, "global_step": 114786, "epoch": 2733} {"train_loss": -6.505748748779297, "global_step": 114787, "epoch": 2733} {"train_loss": -6.496526718139648, "global_step": 114788, "epoch": 2733} {"train_loss": -6.43598747253418, "global_step": 114789, "epoch": 2733} {"train_loss": -6.454395294189453, "global_step": 114790, "epoch": 2733} {"train_loss": -6.589145660400391, "global_step": 114791, "epoch": 2733} {"train_loss": -6.651296138763428, "global_step": 114792, "epoch": 2733} {"train_loss": -6.527775764465332, "global_step": 114793, "epoch": 2733} {"train_loss": -6.534273147583008, "global_step": 114794, "epoch": 2733} {"train_loss": -6.452587127685547, "global_step": 114795, "epoch": 2733} {"train_loss": -6.534703731536865, "global_step": 114796, "epoch": 2733} {"train_loss": -6.614650249481201, "global_step": 114797, "epoch": 2733} {"train_loss": -6.507267951965332, "global_step": 114798, "epoch": 2733} {"train_loss": -6.546568870544434, "global_step": 114799, "epoch": 2733} {"train_loss": -6.57679557800293, "global_step": 114800, "epoch": 2733} {"train_loss": -6.507137298583984, "global_step": 114801, "epoch": 2733} {"train_loss": -6.510468006134033, "global_step": 114802, "epoch": 2733} {"train_loss": -6.524076461791992, "global_step": 114803, "epoch": 2733} {"train_loss": -6.440803527832031, "global_step": 114804, "epoch": 2733} {"train_loss": -6.555541038513184, "global_step": 114805, "epoch": 2733} {"train_loss": -6.415789604187012, "global_step": 114806, "epoch": 2733} {"train_loss": -6.643746376037598, "global_step": 114807, "epoch": 2733} {"train_loss": -6.540570259094238, "global_step": 114808, "epoch": 2733} {"train_loss": -6.472492218017578, "global_step": 114809, "epoch": 2733} {"train_loss": -6.503883361816406, "global_step": 114810, "epoch": 2733} {"train_loss": -6.536723613739014, "global_step": 114811, "epoch": 2733} {"train_loss": -6.563599109649658, "global_step": 114812, "epoch": 2733} {"train_loss": -6.579485893249512, "global_step": 114813, "epoch": 2733} {"train_loss": -6.496593475341797, "global_step": 114814, "epoch": 2733} {"train_loss": -6.520867347717285, "global_step": 114815, "epoch": 2733} {"train_loss": -6.556933403015137, "global_step": 114816, "epoch": 2733} {"train_loss": -6.407104969024658, "global_step": 114817, "epoch": 2733} {"train_loss": -6.558145523071289, "global_step": 114818, "epoch": 2733} {"train_loss": -6.432636260986328, "global_step": 114819, "epoch": 2733} {"train_loss": -6.517683982849121, "global_step": 114820, "epoch": 2733} {"train_loss": -6.494262218475342, "global_step": 114821, "epoch": 2733} {"train_loss": -6.556293487548828, "global_step": 114822, "epoch": 2733} {"train_loss": -6.568943500518799, "global_step": 114823, "epoch": 2733} {"train_loss": -6.371779918670654, "global_step": 114824, "epoch": 2733} {"train_loss": -6.647878646850586, "global_step": 114825, "epoch": 2733} {"train_loss": -6.437851428985596, "global_step": 114826, "epoch": 2733} {"train_loss": -6.5191060815538675, "global_step": 114827, "epoch": 2733, "val_loss": 65090.109375} {"train_loss": -6.634325981140137, "global_step": 114828, "epoch": 2734} {"train_loss": -6.508066177368164, "global_step": 114829, "epoch": 2734} {"train_loss": -6.5680317878723145, "global_step": 114830, "epoch": 2734} {"train_loss": -6.457152366638184, "global_step": 114831, "epoch": 2734} {"train_loss": -6.354158401489258, "global_step": 114832, "epoch": 2734} {"train_loss": -6.432805061340332, "global_step": 114833, "epoch": 2734} {"train_loss": -6.600992202758789, "global_step": 114834, "epoch": 2734} {"train_loss": -6.388068199157715, "global_step": 114835, "epoch": 2734} {"train_loss": -6.537718772888184, "global_step": 114836, "epoch": 2734} {"train_loss": -6.615116119384766, "global_step": 114837, "epoch": 2734} {"train_loss": -6.451325416564941, "global_step": 114838, "epoch": 2734} {"train_loss": -6.580820560455322, "global_step": 114839, "epoch": 2734} {"train_loss": -6.493054389953613, "global_step": 114840, "epoch": 2734} {"train_loss": -6.451538562774658, "global_step": 114841, "epoch": 2734} {"train_loss": -6.48849630355835, "global_step": 114842, "epoch": 2734} {"train_loss": -6.4502153396606445, "global_step": 114843, "epoch": 2734} {"train_loss": -6.428134441375732, "global_step": 114844, "epoch": 2734} {"train_loss": -6.4359846115112305, "global_step": 114845, "epoch": 2734} {"train_loss": -6.580575942993164, "global_step": 114846, "epoch": 2734} {"train_loss": -6.396821975708008, "global_step": 114847, "epoch": 2734} {"train_loss": -6.4078826904296875, "global_step": 114848, "epoch": 2734} {"train_loss": -6.5061726570129395, "global_step": 114849, "epoch": 2734} {"train_loss": -6.410320281982422, "global_step": 114850, "epoch": 2734} {"train_loss": -6.5041117668151855, "global_step": 114851, "epoch": 2734} {"train_loss": -6.493930339813232, "global_step": 114852, "epoch": 2734} {"train_loss": -6.478494644165039, "global_step": 114853, "epoch": 2734} {"train_loss": -6.504669189453125, "global_step": 114854, "epoch": 2734} {"train_loss": -6.4717512130737305, "global_step": 114855, "epoch": 2734} {"train_loss": -6.467846393585205, "global_step": 114856, "epoch": 2734} {"train_loss": -6.618869781494141, "global_step": 114857, "epoch": 2734} {"train_loss": -6.581197738647461, "global_step": 114858, "epoch": 2734} {"train_loss": -6.452944755554199, "global_step": 114859, "epoch": 2734} {"train_loss": -6.572841167449951, "global_step": 114860, "epoch": 2734} {"train_loss": -6.469296455383301, "global_step": 114861, "epoch": 2734} {"train_loss": -6.485263347625732, "global_step": 114862, "epoch": 2734} {"train_loss": -6.503247261047363, "global_step": 114863, "epoch": 2734} {"train_loss": -6.481865882873535, "global_step": 114864, "epoch": 2734} {"train_loss": -6.486565589904785, "global_step": 114865, "epoch": 2734} {"train_loss": -6.478650093078613, "global_step": 114866, "epoch": 2734} {"train_loss": -6.494932651519775, "global_step": 114867, "epoch": 2734} {"train_loss": -6.563666343688965, "global_step": 114868, "epoch": 2734} {"train_loss": -6.49734167825608, "global_step": 114869, "epoch": 2734, "val_loss": 65531.58203125} {"train_loss": -6.505366802215576, "global_step": 114870, "epoch": 2735} {"train_loss": -6.478273868560791, "global_step": 114871, "epoch": 2735} {"train_loss": -6.51167631149292, "global_step": 114872, "epoch": 2735} {"train_loss": -6.487915992736816, "global_step": 114873, "epoch": 2735} {"train_loss": -6.500635623931885, "global_step": 114874, "epoch": 2735} {"train_loss": -6.544692516326904, "global_step": 114875, "epoch": 2735} {"train_loss": -6.485569953918457, "global_step": 114876, "epoch": 2735} {"train_loss": -6.58797550201416, "global_step": 114877, "epoch": 2735} {"train_loss": -6.454080581665039, "global_step": 114878, "epoch": 2735} {"train_loss": -6.600961208343506, "global_step": 114879, "epoch": 2735} {"train_loss": -6.476629257202148, "global_step": 114880, "epoch": 2735} {"train_loss": -6.47742223739624, "global_step": 114881, "epoch": 2735} {"train_loss": -6.546464920043945, "global_step": 114882, "epoch": 2735} {"train_loss": -6.464415550231934, "global_step": 114883, "epoch": 2735} {"train_loss": -6.54660177230835, "global_step": 114884, "epoch": 2735} {"train_loss": -6.537552833557129, "global_step": 114885, "epoch": 2735} {"train_loss": -6.479964733123779, "global_step": 114886, "epoch": 2735} {"train_loss": -6.354981899261475, "global_step": 114887, "epoch": 2735} {"train_loss": -6.476278781890869, "global_step": 114888, "epoch": 2735} {"train_loss": -6.400271892547607, "global_step": 114889, "epoch": 2735} {"train_loss": -6.4262590408325195, "global_step": 114890, "epoch": 2735} {"train_loss": -6.458347320556641, "global_step": 114891, "epoch": 2735} {"train_loss": -6.467355728149414, "global_step": 114892, "epoch": 2735} {"train_loss": -6.392827033996582, "global_step": 114893, "epoch": 2735} {"train_loss": -6.517420768737793, "global_step": 114894, "epoch": 2735} {"train_loss": -6.356534004211426, "global_step": 114895, "epoch": 2735} {"train_loss": -6.504022598266602, "global_step": 114896, "epoch": 2735} {"train_loss": -6.476884841918945, "global_step": 114897, "epoch": 2735} {"train_loss": -6.552107334136963, "global_step": 114898, "epoch": 2735} {"train_loss": -6.476086139678955, "global_step": 114899, "epoch": 2735} {"train_loss": -6.540183067321777, "global_step": 114900, "epoch": 2735} {"train_loss": -6.490387916564941, "global_step": 114901, "epoch": 2735} {"train_loss": -6.474430084228516, "global_step": 114902, "epoch": 2735} {"train_loss": -6.436405658721924, "global_step": 114903, "epoch": 2735} {"train_loss": -6.449062347412109, "global_step": 114904, "epoch": 2735} {"train_loss": -6.53751277923584, "global_step": 114905, "epoch": 2735} {"train_loss": -6.494228363037109, "global_step": 114906, "epoch": 2735} {"train_loss": -6.6337456703186035, "global_step": 114907, "epoch": 2735} {"train_loss": -6.520576477050781, "global_step": 114908, "epoch": 2735} {"train_loss": -6.519514083862305, "global_step": 114909, "epoch": 2735} {"train_loss": -6.585186958312988, "global_step": 114910, "epoch": 2735} {"train_loss": -6.494001990272885, "global_step": 114911, "epoch": 2735, "val_loss": 65431.77734375} {"train_loss": -6.4823384284973145, "global_step": 114912, "epoch": 2736} {"train_loss": -6.5952653884887695, "global_step": 114913, "epoch": 2736} {"train_loss": -6.5907135009765625, "global_step": 114914, "epoch": 2736} {"train_loss": -6.522909641265869, "global_step": 114915, "epoch": 2736} {"train_loss": -6.612677097320557, "global_step": 114916, "epoch": 2736} {"train_loss": -6.514819145202637, "global_step": 114917, "epoch": 2736} {"train_loss": -6.519718647003174, "global_step": 114918, "epoch": 2736} {"train_loss": -6.589016914367676, "global_step": 114919, "epoch": 2736} {"train_loss": -6.477513313293457, "global_step": 114920, "epoch": 2736} {"train_loss": -6.489199638366699, "global_step": 114921, "epoch": 2736} {"train_loss": -6.580489158630371, "global_step": 114922, "epoch": 2736} {"train_loss": -6.635173797607422, "global_step": 114923, "epoch": 2736} {"train_loss": -6.532931327819824, "global_step": 114924, "epoch": 2736} {"train_loss": -6.526089668273926, "global_step": 114925, "epoch": 2736} {"train_loss": -6.457417964935303, "global_step": 114926, "epoch": 2736} {"train_loss": -6.5456647872924805, "global_step": 114927, "epoch": 2736} {"train_loss": -6.429555892944336, "global_step": 114928, "epoch": 2736} {"train_loss": -6.4144287109375, "global_step": 114929, "epoch": 2736} {"train_loss": -6.5806169509887695, "global_step": 114930, "epoch": 2736} {"train_loss": -6.392889022827148, "global_step": 114931, "epoch": 2736} {"train_loss": -6.540740013122559, "global_step": 114932, "epoch": 2736} {"train_loss": -6.490196228027344, "global_step": 114933, "epoch": 2736} {"train_loss": -6.463292598724365, "global_step": 114934, "epoch": 2736} {"train_loss": -6.515420913696289, "global_step": 114935, "epoch": 2736} {"train_loss": -6.561964988708496, "global_step": 114936, "epoch": 2736} {"train_loss": -6.3289265632629395, "global_step": 114937, "epoch": 2736} {"train_loss": -6.5064311027526855, "global_step": 114938, "epoch": 2736} {"train_loss": -6.524594306945801, "global_step": 114939, "epoch": 2736} {"train_loss": -6.501344203948975, "global_step": 114940, "epoch": 2736} {"train_loss": -6.533383846282959, "global_step": 114941, "epoch": 2736} {"train_loss": -6.520819664001465, "global_step": 114942, "epoch": 2736} {"train_loss": -6.636930465698242, "global_step": 114943, "epoch": 2736} {"train_loss": -6.553607940673828, "global_step": 114944, "epoch": 2736} {"train_loss": -6.587502479553223, "global_step": 114945, "epoch": 2736} {"train_loss": -6.461233139038086, "global_step": 114946, "epoch": 2736} {"train_loss": -6.404640197753906, "global_step": 114947, "epoch": 2736} {"train_loss": -6.498908996582031, "global_step": 114948, "epoch": 2736} {"train_loss": -6.575898170471191, "global_step": 114949, "epoch": 2736} {"train_loss": -6.422272682189941, "global_step": 114950, "epoch": 2736} {"train_loss": -6.465295791625977, "global_step": 114951, "epoch": 2736} {"train_loss": -6.463707447052002, "global_step": 114952, "epoch": 2736} {"train_loss": -6.512441374006725, "global_step": 114953, "epoch": 2736, "val_loss": 65315.15625} {"train_loss": -6.466841697692871, "global_step": 114954, "epoch": 2737} {"train_loss": -6.519566535949707, "global_step": 114955, "epoch": 2737} {"train_loss": -6.543511390686035, "global_step": 114956, "epoch": 2737} {"train_loss": -6.464919090270996, "global_step": 114957, "epoch": 2737} {"train_loss": -6.542038917541504, "global_step": 114958, "epoch": 2737} {"train_loss": -6.410351753234863, "global_step": 114959, "epoch": 2737} {"train_loss": -6.572483539581299, "global_step": 114960, "epoch": 2737} {"train_loss": -6.512131690979004, "global_step": 114961, "epoch": 2737} {"train_loss": -6.449815273284912, "global_step": 114962, "epoch": 2737} {"train_loss": -6.506143093109131, "global_step": 114963, "epoch": 2737} {"train_loss": -6.433096408843994, "global_step": 114964, "epoch": 2737} {"train_loss": -6.583633899688721, "global_step": 114965, "epoch": 2737} {"train_loss": -6.532172203063965, "global_step": 114966, "epoch": 2737} {"train_loss": -6.324911117553711, "global_step": 114967, "epoch": 2737} {"train_loss": -6.544206142425537, "global_step": 114968, "epoch": 2737} {"train_loss": -6.424842834472656, "global_step": 114969, "epoch": 2737} {"train_loss": -6.412532806396484, "global_step": 114970, "epoch": 2737} {"train_loss": -6.441489219665527, "global_step": 114971, "epoch": 2737} {"train_loss": -6.364911079406738, "global_step": 114972, "epoch": 2737} {"train_loss": -6.5230889320373535, "global_step": 114973, "epoch": 2737} {"train_loss": -6.493378639221191, "global_step": 114974, "epoch": 2737} {"train_loss": -6.5350341796875, "global_step": 114975, "epoch": 2737} {"train_loss": -6.575756072998047, "global_step": 114976, "epoch": 2737} {"train_loss": -6.545522689819336, "global_step": 114977, "epoch": 2737} {"train_loss": -6.632145881652832, "global_step": 114978, "epoch": 2737} {"train_loss": -6.493494987487793, "global_step": 114979, "epoch": 2737} {"train_loss": -6.45258903503418, "global_step": 114980, "epoch": 2737} {"train_loss": -6.558331489562988, "global_step": 114981, "epoch": 2737} {"train_loss": -6.417530536651611, "global_step": 114982, "epoch": 2737} {"train_loss": -6.590170860290527, "global_step": 114983, "epoch": 2737} {"train_loss": -6.411126136779785, "global_step": 114984, "epoch": 2737} {"train_loss": -6.426337242126465, "global_step": 114985, "epoch": 2737} {"train_loss": -6.527289867401123, "global_step": 114986, "epoch": 2737} {"train_loss": -6.663212776184082, "global_step": 114987, "epoch": 2737} {"train_loss": -6.559430122375488, "global_step": 114988, "epoch": 2737} {"train_loss": -6.446191310882568, "global_step": 114989, "epoch": 2737} {"train_loss": -6.449164867401123, "global_step": 114990, "epoch": 2737} {"train_loss": -6.5574049949646, "global_step": 114991, "epoch": 2737} {"train_loss": -6.415907859802246, "global_step": 114992, "epoch": 2737} {"train_loss": -6.459216594696045, "global_step": 114993, "epoch": 2737} {"train_loss": -6.58090877532959, "global_step": 114994, "epoch": 2737} {"train_loss": -6.499354589553106, "global_step": 114995, "epoch": 2737, "val_loss": 65381.38671875} {"train_loss": -6.466231346130371, "global_step": 114996, "epoch": 2738} {"train_loss": -6.596834659576416, "global_step": 114997, "epoch": 2738} {"train_loss": -6.6011834144592285, "global_step": 114998, "epoch": 2738} {"train_loss": -6.559318542480469, "global_step": 114999, "epoch": 2738} {"train_loss": -6.411721706390381, "global_step": 115000, "epoch": 2738} {"train_loss": -6.55851936340332, "global_step": 115001, "epoch": 2738} {"train_loss": -6.4286394119262695, "global_step": 115002, "epoch": 2738} {"train_loss": -6.482616424560547, "global_step": 115003, "epoch": 2738} {"train_loss": -6.5637311935424805, "global_step": 115004, "epoch": 2738} {"train_loss": -6.512760639190674, "global_step": 115005, "epoch": 2738} {"train_loss": -6.540165901184082, "global_step": 115006, "epoch": 2738} {"train_loss": -6.575716972351074, "global_step": 115007, "epoch": 2738} {"train_loss": -6.47672700881958, "global_step": 115008, "epoch": 2738} {"train_loss": -6.493692398071289, "global_step": 115009, "epoch": 2738} {"train_loss": -6.444999694824219, "global_step": 115010, "epoch": 2738} {"train_loss": -6.62747859954834, "global_step": 115011, "epoch": 2738} {"train_loss": -6.538412570953369, "global_step": 115012, "epoch": 2738} {"train_loss": -6.486191749572754, "global_step": 115013, "epoch": 2738} {"train_loss": -6.531256675720215, "global_step": 115014, "epoch": 2738} {"train_loss": -6.345685005187988, "global_step": 115015, "epoch": 2738} {"train_loss": -6.541306495666504, "global_step": 115016, "epoch": 2738} {"train_loss": -6.627531051635742, "global_step": 115017, "epoch": 2738} {"train_loss": -6.458244800567627, "global_step": 115018, "epoch": 2738} {"train_loss": -6.552742958068848, "global_step": 115019, "epoch": 2738} {"train_loss": -6.493180274963379, "global_step": 115020, "epoch": 2738} {"train_loss": -6.447408676147461, "global_step": 115021, "epoch": 2738} {"train_loss": -6.46129035949707, "global_step": 115022, "epoch": 2738} {"train_loss": -6.467940330505371, "global_step": 115023, "epoch": 2738} {"train_loss": -6.5270466804504395, "global_step": 115024, "epoch": 2738} {"train_loss": -6.518016815185547, "global_step": 115025, "epoch": 2738} {"train_loss": -6.544539451599121, "global_step": 115026, "epoch": 2738} {"train_loss": -6.5738444328308105, "global_step": 115027, "epoch": 2738} {"train_loss": -6.5317559242248535, "global_step": 115028, "epoch": 2738} {"train_loss": -6.541543960571289, "global_step": 115029, "epoch": 2738} {"train_loss": -6.536494731903076, "global_step": 115030, "epoch": 2738} {"train_loss": -6.492203235626221, "global_step": 115031, "epoch": 2738} {"train_loss": -6.489378929138184, "global_step": 115032, "epoch": 2738} {"train_loss": -6.587047576904297, "global_step": 115033, "epoch": 2738} {"train_loss": -6.635831832885742, "global_step": 115034, "epoch": 2738} {"train_loss": -6.643248081207275, "global_step": 115035, "epoch": 2738} {"train_loss": -6.627068519592285, "global_step": 115036, "epoch": 2738} {"train_loss": -6.5255647500356035, "global_step": 115037, "epoch": 2738, "val_loss": 65369.25390625} {"train_loss": -6.505529403686523, "global_step": 115038, "epoch": 2739} {"train_loss": -6.471691131591797, "global_step": 115039, "epoch": 2739} {"train_loss": -6.552175045013428, "global_step": 115040, "epoch": 2739} {"train_loss": -6.649385452270508, "global_step": 115041, "epoch": 2739} {"train_loss": -6.509657859802246, "global_step": 115042, "epoch": 2739} {"train_loss": -6.56378698348999, "global_step": 115043, "epoch": 2739} {"train_loss": -6.55980110168457, "global_step": 115044, "epoch": 2739} {"train_loss": -6.578653812408447, "global_step": 115045, "epoch": 2739} {"train_loss": -6.609988212585449, "global_step": 115046, "epoch": 2739} {"train_loss": -6.440097332000732, "global_step": 115047, "epoch": 2739} {"train_loss": -6.616268157958984, "global_step": 115048, "epoch": 2739} {"train_loss": -6.555237770080566, "global_step": 115049, "epoch": 2739} {"train_loss": -6.507904052734375, "global_step": 115050, "epoch": 2739} {"train_loss": -6.597927093505859, "global_step": 115051, "epoch": 2739} {"train_loss": -6.713163375854492, "global_step": 115052, "epoch": 2739} {"train_loss": -6.596166610717773, "global_step": 115053, "epoch": 2739} {"train_loss": -6.504711151123047, "global_step": 115054, "epoch": 2739} {"train_loss": -6.544157981872559, "global_step": 115055, "epoch": 2739} {"train_loss": -6.519213676452637, "global_step": 115056, "epoch": 2739} {"train_loss": -6.4763875007629395, "global_step": 115057, "epoch": 2739} {"train_loss": -6.372654914855957, "global_step": 115058, "epoch": 2739} {"train_loss": -6.441828727722168, "global_step": 115059, "epoch": 2739} {"train_loss": -6.479889869689941, "global_step": 115060, "epoch": 2739} {"train_loss": -6.439289093017578, "global_step": 115061, "epoch": 2739} {"train_loss": -6.4928083419799805, "global_step": 115062, "epoch": 2739} {"train_loss": -6.419386863708496, "global_step": 115063, "epoch": 2739} {"train_loss": -6.526281356811523, "global_step": 115064, "epoch": 2739} {"train_loss": -6.446499824523926, "global_step": 115065, "epoch": 2739} {"train_loss": -6.493495941162109, "global_step": 115066, "epoch": 2739} {"train_loss": -6.579049110412598, "global_step": 115067, "epoch": 2739} {"train_loss": -6.42929744720459, "global_step": 115068, "epoch": 2739} {"train_loss": -6.516181945800781, "global_step": 115069, "epoch": 2739} {"train_loss": -6.632627010345459, "global_step": 115070, "epoch": 2739} {"train_loss": -6.577814102172852, "global_step": 115071, "epoch": 2739} {"train_loss": -6.5578155517578125, "global_step": 115072, "epoch": 2739} {"train_loss": -6.477816104888916, "global_step": 115073, "epoch": 2739} {"train_loss": -6.357806205749512, "global_step": 115074, "epoch": 2739} {"train_loss": -6.388574123382568, "global_step": 115075, "epoch": 2739} {"train_loss": -6.51368522644043, "global_step": 115076, "epoch": 2739} {"train_loss": -6.452479362487793, "global_step": 115077, "epoch": 2739} {"train_loss": -6.465014457702637, "global_step": 115078, "epoch": 2739} {"train_loss": -6.516089677810669, "global_step": 115079, "epoch": 2739, "val_loss": 65647.8359375} {"train_loss": -6.531983852386475, "global_step": 115080, "epoch": 2740} {"train_loss": -6.4708075523376465, "global_step": 115081, "epoch": 2740} {"train_loss": -6.472263813018799, "global_step": 115082, "epoch": 2740} {"train_loss": -6.47874641418457, "global_step": 115083, "epoch": 2740} {"train_loss": -6.328606605529785, "global_step": 115084, "epoch": 2740} {"train_loss": -6.465051651000977, "global_step": 115085, "epoch": 2740} {"train_loss": -6.470854759216309, "global_step": 115086, "epoch": 2740} {"train_loss": -6.497107028961182, "global_step": 115087, "epoch": 2740} {"train_loss": -6.378591537475586, "global_step": 115088, "epoch": 2740} {"train_loss": -6.325659275054932, "global_step": 115089, "epoch": 2740} {"train_loss": -6.556349277496338, "global_step": 115090, "epoch": 2740} {"train_loss": -6.49600887298584, "global_step": 115091, "epoch": 2740} {"train_loss": -6.519671440124512, "global_step": 115092, "epoch": 2740} {"train_loss": -6.599822044372559, "global_step": 115093, "epoch": 2740} {"train_loss": -6.412925720214844, "global_step": 115094, "epoch": 2740} {"train_loss": -6.5117621421813965, "global_step": 115095, "epoch": 2740} {"train_loss": -6.542905807495117, "global_step": 115096, "epoch": 2740} {"train_loss": -6.506958961486816, "global_step": 115097, "epoch": 2740} {"train_loss": -6.373749256134033, "global_step": 115098, "epoch": 2740} {"train_loss": -6.393241882324219, "global_step": 115099, "epoch": 2740} {"train_loss": -6.540297031402588, "global_step": 115100, "epoch": 2740} {"train_loss": -6.5049729347229, "global_step": 115101, "epoch": 2740} {"train_loss": -6.528058052062988, "global_step": 115102, "epoch": 2740} {"train_loss": -6.561394691467285, "global_step": 115103, "epoch": 2740} {"train_loss": -6.549877166748047, "global_step": 115104, "epoch": 2740} {"train_loss": -6.560482025146484, "global_step": 115105, "epoch": 2740} {"train_loss": -6.450263977050781, "global_step": 115106, "epoch": 2740} {"train_loss": -6.5456318855285645, "global_step": 115107, "epoch": 2740} {"train_loss": -6.548159122467041, "global_step": 115108, "epoch": 2740} {"train_loss": -6.462387561798096, "global_step": 115109, "epoch": 2740} {"train_loss": -6.5317063331604, "global_step": 115110, "epoch": 2740} {"train_loss": -6.429946422576904, "global_step": 115111, "epoch": 2740} {"train_loss": -6.50606632232666, "global_step": 115112, "epoch": 2740} {"train_loss": -6.529211044311523, "global_step": 115113, "epoch": 2740} {"train_loss": -6.561614990234375, "global_step": 115114, "epoch": 2740} {"train_loss": -6.605580806732178, "global_step": 115115, "epoch": 2740} {"train_loss": -6.546788215637207, "global_step": 115116, "epoch": 2740} {"train_loss": -6.543339729309082, "global_step": 115117, "epoch": 2740} {"train_loss": -6.47226619720459, "global_step": 115118, "epoch": 2740} {"train_loss": -6.532752990722656, "global_step": 115119, "epoch": 2740} {"train_loss": -6.5568389892578125, "global_step": 115120, "epoch": 2740} {"train_loss": -6.495288269860404, "global_step": 115121, "epoch": 2740, "val_loss": 65359.5625} {"train_loss": -6.5361762046813965, "global_step": 115122, "epoch": 2741} {"train_loss": -6.5773701667785645, "global_step": 115123, "epoch": 2741} {"train_loss": -6.561631679534912, "global_step": 115124, "epoch": 2741} {"train_loss": -6.504935264587402, "global_step": 115125, "epoch": 2741} {"train_loss": -6.428994178771973, "global_step": 115126, "epoch": 2741} {"train_loss": -6.541346549987793, "global_step": 115127, "epoch": 2741} {"train_loss": -6.529156684875488, "global_step": 115128, "epoch": 2741} {"train_loss": -6.62570333480835, "global_step": 115129, "epoch": 2741} {"train_loss": -6.6610188484191895, "global_step": 115130, "epoch": 2741} {"train_loss": -6.505260467529297, "global_step": 115131, "epoch": 2741} {"train_loss": -6.548112869262695, "global_step": 115132, "epoch": 2741} {"train_loss": -6.528061866760254, "global_step": 115133, "epoch": 2741} {"train_loss": -6.470722198486328, "global_step": 115134, "epoch": 2741} {"train_loss": -6.658312797546387, "global_step": 115135, "epoch": 2741} {"train_loss": -6.515081405639648, "global_step": 115136, "epoch": 2741} {"train_loss": -6.641134262084961, "global_step": 115137, "epoch": 2741} {"train_loss": -6.590809345245361, "global_step": 115138, "epoch": 2741} {"train_loss": -6.584078788757324, "global_step": 115139, "epoch": 2741} {"train_loss": -6.520798206329346, "global_step": 115140, "epoch": 2741} {"train_loss": -6.569340705871582, "global_step": 115141, "epoch": 2741} {"train_loss": -6.625697612762451, "global_step": 115142, "epoch": 2741} {"train_loss": -6.5420122146606445, "global_step": 115143, "epoch": 2741} {"train_loss": -6.632905006408691, "global_step": 115144, "epoch": 2741} {"train_loss": -6.539033889770508, "global_step": 115145, "epoch": 2741} {"train_loss": -6.455793380737305, "global_step": 115146, "epoch": 2741} {"train_loss": -6.559273719787598, "global_step": 115147, "epoch": 2741} {"train_loss": -6.501361846923828, "global_step": 115148, "epoch": 2741} {"train_loss": -6.477441787719727, "global_step": 115149, "epoch": 2741} {"train_loss": -6.504482269287109, "global_step": 115150, "epoch": 2741} {"train_loss": -6.492694854736328, "global_step": 115151, "epoch": 2741} {"train_loss": -6.59805154800415, "global_step": 115152, "epoch": 2741} {"train_loss": -6.511013031005859, "global_step": 115153, "epoch": 2741} {"train_loss": -6.36524772644043, "global_step": 115154, "epoch": 2741} {"train_loss": -6.511404037475586, "global_step": 115155, "epoch": 2741} {"train_loss": -6.5940937995910645, "global_step": 115156, "epoch": 2741} {"train_loss": -6.505516052246094, "global_step": 115157, "epoch": 2741} {"train_loss": -6.504217147827148, "global_step": 115158, "epoch": 2741} {"train_loss": -6.606467247009277, "global_step": 115159, "epoch": 2741} {"train_loss": -6.542278289794922, "global_step": 115160, "epoch": 2741} {"train_loss": -6.446493148803711, "global_step": 115161, "epoch": 2741} {"train_loss": -6.465639591217041, "global_step": 115162, "epoch": 2741} {"train_loss": -6.54003179640997, "global_step": 115163, "epoch": 2741, "val_loss": 65405.56640625} {"train_loss": -6.544711112976074, "global_step": 115164, "epoch": 2742} {"train_loss": -6.57929801940918, "global_step": 115165, "epoch": 2742} {"train_loss": -6.414398193359375, "global_step": 115166, "epoch": 2742} {"train_loss": -6.421783447265625, "global_step": 115167, "epoch": 2742} {"train_loss": -6.491744041442871, "global_step": 115168, "epoch": 2742} {"train_loss": -6.378185749053955, "global_step": 115169, "epoch": 2742} {"train_loss": -6.383451461791992, "global_step": 115170, "epoch": 2742} {"train_loss": -6.489945411682129, "global_step": 115171, "epoch": 2742} {"train_loss": -6.497331619262695, "global_step": 115172, "epoch": 2742} {"train_loss": -6.445619583129883, "global_step": 115173, "epoch": 2742} {"train_loss": -6.500637054443359, "global_step": 115174, "epoch": 2742} {"train_loss": -6.449555397033691, "global_step": 115175, "epoch": 2742} {"train_loss": -6.602417945861816, "global_step": 115176, "epoch": 2742} {"train_loss": -6.387238502502441, "global_step": 115177, "epoch": 2742} {"train_loss": -6.405195713043213, "global_step": 115178, "epoch": 2742} {"train_loss": -6.347046375274658, "global_step": 115179, "epoch": 2742} {"train_loss": -6.436552047729492, "global_step": 115180, "epoch": 2742} {"train_loss": -6.3250837326049805, "global_step": 115181, "epoch": 2742} {"train_loss": -6.480864524841309, "global_step": 115182, "epoch": 2742} {"train_loss": -6.3131208419799805, "global_step": 115183, "epoch": 2742} {"train_loss": -6.43081521987915, "global_step": 115184, "epoch": 2742} {"train_loss": -6.536208629608154, "global_step": 115185, "epoch": 2742} {"train_loss": -6.303397178649902, "global_step": 115186, "epoch": 2742} {"train_loss": -6.564794063568115, "global_step": 115187, "epoch": 2742} {"train_loss": -6.382049560546875, "global_step": 115188, "epoch": 2742} {"train_loss": -6.492884159088135, "global_step": 115189, "epoch": 2742} {"train_loss": -6.487762451171875, "global_step": 115190, "epoch": 2742} {"train_loss": -6.448489189147949, "global_step": 115191, "epoch": 2742} {"train_loss": -6.431873321533203, "global_step": 115192, "epoch": 2742} {"train_loss": -6.495038986206055, "global_step": 115193, "epoch": 2742} {"train_loss": -6.499439239501953, "global_step": 115194, "epoch": 2742} {"train_loss": -6.48051643371582, "global_step": 115195, "epoch": 2742} {"train_loss": -6.588778495788574, "global_step": 115196, "epoch": 2742} {"train_loss": -6.516756057739258, "global_step": 115197, "epoch": 2742} {"train_loss": -6.581942081451416, "global_step": 115198, "epoch": 2742} {"train_loss": -6.554065704345703, "global_step": 115199, "epoch": 2742} {"train_loss": -6.512368202209473, "global_step": 115200, "epoch": 2742} {"train_loss": -6.480422019958496, "global_step": 115201, "epoch": 2742} {"train_loss": -6.4956278800964355, "global_step": 115202, "epoch": 2742} {"train_loss": -6.568810939788818, "global_step": 115203, "epoch": 2742} {"train_loss": -6.608216285705566, "global_step": 115204, "epoch": 2742} {"train_loss": -6.4740243298666815, "global_step": 115205, "epoch": 2742, "val_loss": 65348.15625} {"train_loss": -6.4983954429626465, "global_step": 115206, "epoch": 2743} {"train_loss": -6.46346378326416, "global_step": 115207, "epoch": 2743} {"train_loss": -6.613702774047852, "global_step": 115208, "epoch": 2743} {"train_loss": -6.554274559020996, "global_step": 115209, "epoch": 2743} {"train_loss": -6.621310234069824, "global_step": 115210, "epoch": 2743} {"train_loss": -6.525505065917969, "global_step": 115211, "epoch": 2743} {"train_loss": -6.502033233642578, "global_step": 115212, "epoch": 2743} {"train_loss": -6.459946632385254, "global_step": 115213, "epoch": 2743} {"train_loss": -6.538806915283203, "global_step": 115214, "epoch": 2743} {"train_loss": -6.619324684143066, "global_step": 115215, "epoch": 2743} {"train_loss": -6.608510971069336, "global_step": 115216, "epoch": 2743} {"train_loss": -6.556049823760986, "global_step": 115217, "epoch": 2743} {"train_loss": -6.667113780975342, "global_step": 115218, "epoch": 2743} {"train_loss": -6.522769927978516, "global_step": 115219, "epoch": 2743} {"train_loss": -6.5212812423706055, "global_step": 115220, "epoch": 2743} {"train_loss": -6.446832180023193, "global_step": 115221, "epoch": 2743} {"train_loss": -6.4599609375, "global_step": 115222, "epoch": 2743} {"train_loss": -6.495837688446045, "global_step": 115223, "epoch": 2743} {"train_loss": -6.569906234741211, "global_step": 115224, "epoch": 2743} {"train_loss": -6.486388206481934, "global_step": 115225, "epoch": 2743} {"train_loss": -6.488827228546143, "global_step": 115226, "epoch": 2743} {"train_loss": -6.425065994262695, "global_step": 115227, "epoch": 2743} {"train_loss": -6.564384460449219, "global_step": 115228, "epoch": 2743} {"train_loss": -6.5336103439331055, "global_step": 115229, "epoch": 2743} {"train_loss": -6.5003767013549805, "global_step": 115230, "epoch": 2743} {"train_loss": -6.508585453033447, "global_step": 115231, "epoch": 2743} {"train_loss": -6.5545654296875, "global_step": 115232, "epoch": 2743} {"train_loss": -6.5216217041015625, "global_step": 115233, "epoch": 2743} {"train_loss": -6.401623725891113, "global_step": 115234, "epoch": 2743} {"train_loss": -6.513321876525879, "global_step": 115235, "epoch": 2743} {"train_loss": -6.507814884185791, "global_step": 115236, "epoch": 2743} {"train_loss": -6.592829704284668, "global_step": 115237, "epoch": 2743} {"train_loss": -6.5164594650268555, "global_step": 115238, "epoch": 2743} {"train_loss": -6.475089073181152, "global_step": 115239, "epoch": 2743} {"train_loss": -6.4853410720825195, "global_step": 115240, "epoch": 2743} {"train_loss": -6.398550987243652, "global_step": 115241, "epoch": 2743} {"train_loss": -6.543992042541504, "global_step": 115242, "epoch": 2743} {"train_loss": -6.444825172424316, "global_step": 115243, "epoch": 2743} {"train_loss": -6.5579447746276855, "global_step": 115244, "epoch": 2743} {"train_loss": -6.532876014709473, "global_step": 115245, "epoch": 2743} {"train_loss": -6.427572727203369, "global_step": 115246, "epoch": 2743} {"train_loss": -6.517631860006423, "global_step": 115247, "epoch": 2743, "val_loss": 65370.296875} {"train_loss": -6.547079563140869, "global_step": 115248, "epoch": 2744} {"train_loss": -6.558965682983398, "global_step": 115249, "epoch": 2744} {"train_loss": -6.497050762176514, "global_step": 115250, "epoch": 2744} {"train_loss": -6.5962677001953125, "global_step": 115251, "epoch": 2744} {"train_loss": -6.4454569816589355, "global_step": 115252, "epoch": 2744} {"train_loss": -6.606967926025391, "global_step": 115253, "epoch": 2744} {"train_loss": -6.487752914428711, "global_step": 115254, "epoch": 2744} {"train_loss": -6.603087902069092, "global_step": 115255, "epoch": 2744} {"train_loss": -6.572336196899414, "global_step": 115256, "epoch": 2744} {"train_loss": -6.465211868286133, "global_step": 115257, "epoch": 2744} {"train_loss": -6.529526233673096, "global_step": 115258, "epoch": 2744} {"train_loss": -6.538541793823242, "global_step": 115259, "epoch": 2744} {"train_loss": -6.583571434020996, "global_step": 115260, "epoch": 2744} {"train_loss": -6.56275749206543, "global_step": 115261, "epoch": 2744} {"train_loss": -6.573304176330566, "global_step": 115262, "epoch": 2744} {"train_loss": -6.539611339569092, "global_step": 115263, "epoch": 2744} {"train_loss": -6.558495998382568, "global_step": 115264, "epoch": 2744} {"train_loss": -6.46776819229126, "global_step": 115265, "epoch": 2744} {"train_loss": -6.537301063537598, "global_step": 115266, "epoch": 2744} {"train_loss": -6.460084915161133, "global_step": 115267, "epoch": 2744} {"train_loss": -6.602433204650879, "global_step": 115268, "epoch": 2744} {"train_loss": -6.452269554138184, "global_step": 115269, "epoch": 2744} {"train_loss": -6.504345893859863, "global_step": 115270, "epoch": 2744} {"train_loss": -6.512160778045654, "global_step": 115271, "epoch": 2744} {"train_loss": -6.582581520080566, "global_step": 115272, "epoch": 2744} {"train_loss": -6.505983829498291, "global_step": 115273, "epoch": 2744} {"train_loss": -6.5868072509765625, "global_step": 115274, "epoch": 2744} {"train_loss": -6.487043857574463, "global_step": 115275, "epoch": 2744} {"train_loss": -6.558287620544434, "global_step": 115276, "epoch": 2744} {"train_loss": -6.488654136657715, "global_step": 115277, "epoch": 2744} {"train_loss": -6.577314376831055, "global_step": 115278, "epoch": 2744} {"train_loss": -6.436139106750488, "global_step": 115279, "epoch": 2744} {"train_loss": -6.349875450134277, "global_step": 115280, "epoch": 2744} {"train_loss": -6.53752326965332, "global_step": 115281, "epoch": 2744} {"train_loss": -6.410539150238037, "global_step": 115282, "epoch": 2744} {"train_loss": -6.432379722595215, "global_step": 115283, "epoch": 2744} {"train_loss": -6.449481010437012, "global_step": 115284, "epoch": 2744} {"train_loss": -6.509552478790283, "global_step": 115285, "epoch": 2744} {"train_loss": -6.559864044189453, "global_step": 115286, "epoch": 2744} {"train_loss": -6.362475395202637, "global_step": 115287, "epoch": 2744} {"train_loss": -6.464300632476807, "global_step": 115288, "epoch": 2744} {"train_loss": -6.513238872800555, "global_step": 115289, "epoch": 2744, "val_loss": 65535.4453125} {"train_loss": -6.464422225952148, "global_step": 115290, "epoch": 2745} {"train_loss": -6.519767761230469, "global_step": 115291, "epoch": 2745} {"train_loss": -6.642574787139893, "global_step": 115292, "epoch": 2745} {"train_loss": -6.548923492431641, "global_step": 115293, "epoch": 2745} {"train_loss": -6.4961838722229, "global_step": 115294, "epoch": 2745} {"train_loss": -6.46140718460083, "global_step": 115295, "epoch": 2745} {"train_loss": -6.480230331420898, "global_step": 115296, "epoch": 2745} {"train_loss": -6.537317752838135, "global_step": 115297, "epoch": 2745} {"train_loss": -6.460562705993652, "global_step": 115298, "epoch": 2745} {"train_loss": -6.556426048278809, "global_step": 115299, "epoch": 2745} {"train_loss": -6.505486488342285, "global_step": 115300, "epoch": 2745} {"train_loss": -6.450409889221191, "global_step": 115301, "epoch": 2745} {"train_loss": -6.583193778991699, "global_step": 115302, "epoch": 2745} {"train_loss": -6.626219749450684, "global_step": 115303, "epoch": 2745} {"train_loss": -6.551052093505859, "global_step": 115304, "epoch": 2745} {"train_loss": -6.5284037590026855, "global_step": 115305, "epoch": 2745} {"train_loss": -6.456144332885742, "global_step": 115306, "epoch": 2745} {"train_loss": -6.560702323913574, "global_step": 115307, "epoch": 2745} {"train_loss": -6.559979438781738, "global_step": 115308, "epoch": 2745} {"train_loss": -6.469853401184082, "global_step": 115309, "epoch": 2745} {"train_loss": -6.595129489898682, "global_step": 115310, "epoch": 2745} {"train_loss": -6.572574615478516, "global_step": 115311, "epoch": 2745} {"train_loss": -6.620494365692139, "global_step": 115312, "epoch": 2745} {"train_loss": -6.4771623611450195, "global_step": 115313, "epoch": 2745} {"train_loss": -6.556870460510254, "global_step": 115314, "epoch": 2745} {"train_loss": -6.5770111083984375, "global_step": 115315, "epoch": 2745} {"train_loss": -6.5125861167907715, "global_step": 115316, "epoch": 2745} {"train_loss": -6.495373725891113, "global_step": 115317, "epoch": 2745} {"train_loss": -6.590928077697754, "global_step": 115318, "epoch": 2745} {"train_loss": -6.549132823944092, "global_step": 115319, "epoch": 2745} {"train_loss": -6.517001152038574, "global_step": 115320, "epoch": 2745} {"train_loss": -6.576653957366943, "global_step": 115321, "epoch": 2745} {"train_loss": -6.574991703033447, "global_step": 115322, "epoch": 2745} {"train_loss": -6.544479846954346, "global_step": 115323, "epoch": 2745} {"train_loss": -6.511780738830566, "global_step": 115324, "epoch": 2745} {"train_loss": -6.554973602294922, "global_step": 115325, "epoch": 2745} {"train_loss": -6.561604022979736, "global_step": 115326, "epoch": 2745} {"train_loss": -6.566901683807373, "global_step": 115327, "epoch": 2745} {"train_loss": -6.488702774047852, "global_step": 115328, "epoch": 2745} {"train_loss": -6.549680709838867, "global_step": 115329, "epoch": 2745} {"train_loss": -6.581524848937988, "global_step": 115330, "epoch": 2745} {"train_loss": -6.537682056427002, "global_step": 115331, "epoch": 2745, "val_loss": 65285.9453125} {"train_loss": -6.517843246459961, "global_step": 115332, "epoch": 2746} {"train_loss": -6.588176727294922, "global_step": 115333, "epoch": 2746} {"train_loss": -6.509913444519043, "global_step": 115334, "epoch": 2746} {"train_loss": -6.517479419708252, "global_step": 115335, "epoch": 2746} {"train_loss": -6.596744060516357, "global_step": 115336, "epoch": 2746} {"train_loss": -6.7416486740112305, "global_step": 115337, "epoch": 2746} {"train_loss": -6.569992542266846, "global_step": 115338, "epoch": 2746} {"train_loss": -6.556926250457764, "global_step": 115339, "epoch": 2746} {"train_loss": -6.493069648742676, "global_step": 115340, "epoch": 2746} {"train_loss": -6.611266136169434, "global_step": 115341, "epoch": 2746} {"train_loss": -6.533329963684082, "global_step": 115342, "epoch": 2746} {"train_loss": -6.5834455490112305, "global_step": 115343, "epoch": 2746} {"train_loss": -6.503506660461426, "global_step": 115344, "epoch": 2746} {"train_loss": -6.559818744659424, "global_step": 115345, "epoch": 2746} {"train_loss": -6.5305280685424805, "global_step": 115346, "epoch": 2746} {"train_loss": -6.530976295471191, "global_step": 115347, "epoch": 2746} {"train_loss": -6.61447811126709, "global_step": 115348, "epoch": 2746} {"train_loss": -6.496268272399902, "global_step": 115349, "epoch": 2746} {"train_loss": -6.536986827850342, "global_step": 115350, "epoch": 2746} {"train_loss": -6.4920549392700195, "global_step": 115351, "epoch": 2746} {"train_loss": -6.538098335266113, "global_step": 115352, "epoch": 2746} {"train_loss": -6.658918380737305, "global_step": 115353, "epoch": 2746} {"train_loss": -6.582927227020264, "global_step": 115354, "epoch": 2746} {"train_loss": -6.543435096740723, "global_step": 115355, "epoch": 2746} {"train_loss": -6.501512050628662, "global_step": 115356, "epoch": 2746} {"train_loss": -6.518062591552734, "global_step": 115357, "epoch": 2746} {"train_loss": -6.5818705558776855, "global_step": 115358, "epoch": 2746} {"train_loss": -6.531261444091797, "global_step": 115359, "epoch": 2746} {"train_loss": -6.445783615112305, "global_step": 115360, "epoch": 2746} {"train_loss": -6.466926574707031, "global_step": 115361, "epoch": 2746} {"train_loss": -6.394223213195801, "global_step": 115362, "epoch": 2746} {"train_loss": -6.6344194412231445, "global_step": 115363, "epoch": 2746} {"train_loss": -6.484025478363037, "global_step": 115364, "epoch": 2746} {"train_loss": -6.5442214012146, "global_step": 115365, "epoch": 2746} {"train_loss": -6.514169692993164, "global_step": 115366, "epoch": 2746} {"train_loss": -6.5100626945495605, "global_step": 115367, "epoch": 2746} {"train_loss": -6.5545125007629395, "global_step": 115368, "epoch": 2746} {"train_loss": -6.671802520751953, "global_step": 115369, "epoch": 2746} {"train_loss": -6.4533843994140625, "global_step": 115370, "epoch": 2746} {"train_loss": -6.603671073913574, "global_step": 115371, "epoch": 2746} {"train_loss": -6.571821689605713, "global_step": 115372, "epoch": 2746} {"train_loss": -6.542735440390451, "global_step": 115373, "epoch": 2746, "val_loss": 65448.6953125} {"train_loss": -6.466884613037109, "global_step": 115374, "epoch": 2747} {"train_loss": -6.497282981872559, "global_step": 115375, "epoch": 2747} {"train_loss": -6.477962017059326, "global_step": 115376, "epoch": 2747} {"train_loss": -6.541311740875244, "global_step": 115377, "epoch": 2747} {"train_loss": -6.512271404266357, "global_step": 115378, "epoch": 2747} {"train_loss": -6.593748569488525, "global_step": 115379, "epoch": 2747} {"train_loss": -6.631858825683594, "global_step": 115380, "epoch": 2747} {"train_loss": -6.580418586730957, "global_step": 115381, "epoch": 2747} {"train_loss": -6.507221221923828, "global_step": 115382, "epoch": 2747} {"train_loss": -6.5030035972595215, "global_step": 115383, "epoch": 2747} {"train_loss": -6.503053665161133, "global_step": 115384, "epoch": 2747} {"train_loss": -6.458590507507324, "global_step": 115385, "epoch": 2747} {"train_loss": -6.629605293273926, "global_step": 115386, "epoch": 2747} {"train_loss": -6.594804763793945, "global_step": 115387, "epoch": 2747} {"train_loss": -6.522326469421387, "global_step": 115388, "epoch": 2747} {"train_loss": -6.432560920715332, "global_step": 115389, "epoch": 2747} {"train_loss": -6.568648338317871, "global_step": 115390, "epoch": 2747} {"train_loss": -6.586470603942871, "global_step": 115391, "epoch": 2747} {"train_loss": -6.575024127960205, "global_step": 115392, "epoch": 2747} {"train_loss": -6.693818092346191, "global_step": 115393, "epoch": 2747} {"train_loss": -6.544861793518066, "global_step": 115394, "epoch": 2747} {"train_loss": -6.540677070617676, "global_step": 115395, "epoch": 2747} {"train_loss": -6.536746025085449, "global_step": 115396, "epoch": 2747} {"train_loss": -6.478350639343262, "global_step": 115397, "epoch": 2747} {"train_loss": -6.550259590148926, "global_step": 115398, "epoch": 2747} {"train_loss": -6.575350761413574, "global_step": 115399, "epoch": 2747} {"train_loss": -6.280787467956543, "global_step": 115400, "epoch": 2747} {"train_loss": -6.408368110656738, "global_step": 115401, "epoch": 2747} {"train_loss": -6.516124248504639, "global_step": 115402, "epoch": 2747} {"train_loss": -6.50910758972168, "global_step": 115403, "epoch": 2747} {"train_loss": -6.5154948234558105, "global_step": 115404, "epoch": 2747} {"train_loss": -6.505395889282227, "global_step": 115405, "epoch": 2747} {"train_loss": -6.423128128051758, "global_step": 115406, "epoch": 2747} {"train_loss": -6.449369430541992, "global_step": 115407, "epoch": 2747} {"train_loss": -6.562994956970215, "global_step": 115408, "epoch": 2747} {"train_loss": -6.433950424194336, "global_step": 115409, "epoch": 2747} {"train_loss": -6.516395568847656, "global_step": 115410, "epoch": 2747} {"train_loss": -6.520536422729492, "global_step": 115411, "epoch": 2747} {"train_loss": -6.680512428283691, "global_step": 115412, "epoch": 2747} {"train_loss": -6.410214900970459, "global_step": 115413, "epoch": 2747} {"train_loss": -6.40889835357666, "global_step": 115414, "epoch": 2747} {"train_loss": -6.516974767049153, "global_step": 115415, "epoch": 2747, "val_loss": 65373.046875} {"train_loss": -6.5373125076293945, "global_step": 115416, "epoch": 2748} {"train_loss": -6.549434661865234, "global_step": 115417, "epoch": 2748} {"train_loss": -6.529400825500488, "global_step": 115418, "epoch": 2748} {"train_loss": -6.477964401245117, "global_step": 115419, "epoch": 2748} {"train_loss": -6.4883527755737305, "global_step": 115420, "epoch": 2748} {"train_loss": -6.593127727508545, "global_step": 115421, "epoch": 2748} {"train_loss": -6.598793983459473, "global_step": 115422, "epoch": 2748} {"train_loss": -6.459366798400879, "global_step": 115423, "epoch": 2748} {"train_loss": -6.569100379943848, "global_step": 115424, "epoch": 2748} {"train_loss": -6.4611711502075195, "global_step": 115425, "epoch": 2748} {"train_loss": -6.5392303466796875, "global_step": 115426, "epoch": 2748} {"train_loss": -6.462674140930176, "global_step": 115427, "epoch": 2748} {"train_loss": -6.575918674468994, "global_step": 115428, "epoch": 2748} {"train_loss": -6.5228681564331055, "global_step": 115429, "epoch": 2748} {"train_loss": -6.514374732971191, "global_step": 115430, "epoch": 2748} {"train_loss": -6.591414451599121, "global_step": 115431, "epoch": 2748} {"train_loss": -6.353171348571777, "global_step": 115432, "epoch": 2748} {"train_loss": -6.516848087310791, "global_step": 115433, "epoch": 2748} {"train_loss": -6.486214637756348, "global_step": 115434, "epoch": 2748} {"train_loss": -6.454624176025391, "global_step": 115435, "epoch": 2748} {"train_loss": -6.456793785095215, "global_step": 115436, "epoch": 2748} {"train_loss": -6.416897773742676, "global_step": 115437, "epoch": 2748} {"train_loss": -6.510006427764893, "global_step": 115438, "epoch": 2748} {"train_loss": -6.308767318725586, "global_step": 115439, "epoch": 2748} {"train_loss": -6.482056140899658, "global_step": 115440, "epoch": 2748} {"train_loss": -6.426172733306885, "global_step": 115441, "epoch": 2748} {"train_loss": -6.515988349914551, "global_step": 115442, "epoch": 2748} {"train_loss": -6.3628997802734375, "global_step": 115443, "epoch": 2748} {"train_loss": -6.448259353637695, "global_step": 115444, "epoch": 2748} {"train_loss": -6.453567981719971, "global_step": 115445, "epoch": 2748} {"train_loss": -6.643088340759277, "global_step": 115446, "epoch": 2748} {"train_loss": -6.4325337409973145, "global_step": 115447, "epoch": 2748} {"train_loss": -6.58882474899292, "global_step": 115448, "epoch": 2748} {"train_loss": -6.463681221008301, "global_step": 115449, "epoch": 2748} {"train_loss": -6.525992393493652, "global_step": 115450, "epoch": 2748} {"train_loss": -6.467490196228027, "global_step": 115451, "epoch": 2748} {"train_loss": -6.501404762268066, "global_step": 115452, "epoch": 2748} {"train_loss": -6.537370681762695, "global_step": 115453, "epoch": 2748} {"train_loss": -6.387761116027832, "global_step": 115454, "epoch": 2748} {"train_loss": -6.430456161499023, "global_step": 115455, "epoch": 2748} {"train_loss": -6.404021263122559, "global_step": 115456, "epoch": 2748} {"train_loss": -6.487664268130348, "global_step": 115457, "epoch": 2748, "val_loss": 65190.765625} {"train_loss": -6.6178178787231445, "global_step": 115458, "epoch": 2749} {"train_loss": -6.454306602478027, "global_step": 115459, "epoch": 2749} {"train_loss": -6.493476867675781, "global_step": 115460, "epoch": 2749} {"train_loss": -6.4486613273620605, "global_step": 115461, "epoch": 2749} {"train_loss": -6.475396633148193, "global_step": 115462, "epoch": 2749} {"train_loss": -6.446011543273926, "global_step": 115463, "epoch": 2749} {"train_loss": -6.55828857421875, "global_step": 115464, "epoch": 2749} {"train_loss": -6.404284954071045, "global_step": 115465, "epoch": 2749} {"train_loss": -6.475381851196289, "global_step": 115466, "epoch": 2749} {"train_loss": -6.5254716873168945, "global_step": 115467, "epoch": 2749} {"train_loss": -6.386013984680176, "global_step": 115468, "epoch": 2749} {"train_loss": -6.473949432373047, "global_step": 115469, "epoch": 2749} {"train_loss": -6.4676055908203125, "global_step": 115470, "epoch": 2749} {"train_loss": -6.485100746154785, "global_step": 115471, "epoch": 2749} {"train_loss": -6.611726760864258, "global_step": 115472, "epoch": 2749} {"train_loss": -6.563698768615723, "global_step": 115473, "epoch": 2749} {"train_loss": -6.561269760131836, "global_step": 115474, "epoch": 2749} {"train_loss": -6.454933166503906, "global_step": 115475, "epoch": 2749} {"train_loss": -6.46051549911499, "global_step": 115476, "epoch": 2749} {"train_loss": -6.55407190322876, "global_step": 115477, "epoch": 2749} {"train_loss": -6.57405948638916, "global_step": 115478, "epoch": 2749} {"train_loss": -6.668646812438965, "global_step": 115479, "epoch": 2749} {"train_loss": -6.5439252853393555, "global_step": 115480, "epoch": 2749} {"train_loss": -6.4957475662231445, "global_step": 115481, "epoch": 2749} {"train_loss": -6.552268981933594, "global_step": 115482, "epoch": 2749} {"train_loss": -6.668068885803223, "global_step": 115483, "epoch": 2749} {"train_loss": -6.5722150802612305, "global_step": 115484, "epoch": 2749} {"train_loss": -6.539920806884766, "global_step": 115485, "epoch": 2749} {"train_loss": -6.565583229064941, "global_step": 115486, "epoch": 2749} {"train_loss": -6.495932579040527, "global_step": 115487, "epoch": 2749} {"train_loss": -6.6605095863342285, "global_step": 115488, "epoch": 2749} {"train_loss": -6.628747940063477, "global_step": 115489, "epoch": 2749} {"train_loss": -6.50933313369751, "global_step": 115490, "epoch": 2749} {"train_loss": -6.592654705047607, "global_step": 115491, "epoch": 2749} {"train_loss": -6.529792308807373, "global_step": 115492, "epoch": 2749} {"train_loss": -6.650705337524414, "global_step": 115493, "epoch": 2749} {"train_loss": -6.631451606750488, "global_step": 115494, "epoch": 2749} {"train_loss": -6.460561752319336, "global_step": 115495, "epoch": 2749} {"train_loss": -6.579448699951172, "global_step": 115496, "epoch": 2749} {"train_loss": -6.601370334625244, "global_step": 115497, "epoch": 2749} {"train_loss": -6.604278564453125, "global_step": 115498, "epoch": 2749} {"train_loss": -6.538812739508493, "global_step": 115499, "epoch": 2749, "val_loss": 65252.92578125} {"train_loss": -6.603744983673096, "global_step": 115500, "epoch": 2750} {"train_loss": -6.561663627624512, "global_step": 115501, "epoch": 2750} {"train_loss": -6.60891056060791, "global_step": 115502, "epoch": 2750} {"train_loss": -6.549533367156982, "global_step": 115503, "epoch": 2750} {"train_loss": -6.68101167678833, "global_step": 115504, "epoch": 2750} {"train_loss": -6.604237079620361, "global_step": 115505, "epoch": 2750} {"train_loss": -6.613552093505859, "global_step": 115506, "epoch": 2750} {"train_loss": -6.53467321395874, "global_step": 115507, "epoch": 2750} {"train_loss": -6.507935047149658, "global_step": 115508, "epoch": 2750} {"train_loss": -6.574042797088623, "global_step": 115509, "epoch": 2750} {"train_loss": -6.566859245300293, "global_step": 115510, "epoch": 2750} {"train_loss": -6.5591630935668945, "global_step": 115511, "epoch": 2750} {"train_loss": -6.681969165802002, "global_step": 115512, "epoch": 2750} {"train_loss": -6.540399551391602, "global_step": 115513, "epoch": 2750} {"train_loss": -6.440748691558838, "global_step": 115514, "epoch": 2750} {"train_loss": -6.486708164215088, "global_step": 115515, "epoch": 2750} {"train_loss": -6.432598114013672, "global_step": 115516, "epoch": 2750} {"train_loss": -6.51197624206543, "global_step": 115517, "epoch": 2750} {"train_loss": -6.479063034057617, "global_step": 115518, "epoch": 2750} {"train_loss": -6.557085990905762, "global_step": 115519, "epoch": 2750} {"train_loss": -6.51261568069458, "global_step": 115520, "epoch": 2750} {"train_loss": -6.55088996887207, "global_step": 115521, "epoch": 2750} {"train_loss": -6.582969665527344, "global_step": 115522, "epoch": 2750} {"train_loss": -6.5988545417785645, "global_step": 115523, "epoch": 2750} {"train_loss": -6.436450004577637, "global_step": 115524, "epoch": 2750} {"train_loss": -6.485177040100098, "global_step": 115525, "epoch": 2750} {"train_loss": -6.496133804321289, "global_step": 115526, "epoch": 2750} {"train_loss": -6.515241622924805, "global_step": 115527, "epoch": 2750} {"train_loss": -6.689030647277832, "global_step": 115528, "epoch": 2750} {"train_loss": -6.54364538192749, "global_step": 115529, "epoch": 2750} {"train_loss": -6.544764041900635, "global_step": 115530, "epoch": 2750} {"train_loss": -6.526891708374023, "global_step": 115531, "epoch": 2750} {"train_loss": -6.525092601776123, "global_step": 115532, "epoch": 2750} {"train_loss": -6.568114280700684, "global_step": 115533, "epoch": 2750} {"train_loss": -6.503003120422363, "global_step": 115534, "epoch": 2750} {"train_loss": -6.62930965423584, "global_step": 115535, "epoch": 2750} {"train_loss": -6.480379104614258, "global_step": 115536, "epoch": 2750} {"train_loss": -6.472216606140137, "global_step": 115537, "epoch": 2750} {"train_loss": -6.51745080947876, "global_step": 115538, "epoch": 2750} {"train_loss": -6.5082244873046875, "global_step": 115539, "epoch": 2750} {"train_loss": -6.460803031921387, "global_step": 115540, "epoch": 2750} {"train_loss": -6.542233784993489, "global_step": 115541, "epoch": 2750, "train/sim_max_reward_0": 0.20307980068198833, "train/sim_max_reward_1": 0.9137090919714873, "train/sim_max_reward_2": 0.8607014871760892, "train/sim_max_reward_3": 0.14443414779576338, "train/sim_max_reward_4": 0.9876542810913034, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5685330895100474, "test/sim_max_reward_4300002": 0.9247866328315416, "test/sim_max_reward_4300003": 0.9652811021023286, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.6571302675233761, "test/sim_max_reward_4300006": 0.9813123790918838, "test/sim_max_reward_4300007": 0.358638829126907, "test/sim_max_reward_4300008": 0.7066050224815003, "test/sim_max_reward_4300009": 0.9731975496121347, "test/sim_max_reward_4300010": 0.9370616343467233, "test/sim_max_reward_4300011": 0.3131124571128182, "test/sim_max_reward_4300012": 0.591482410608708, "test/sim_max_reward_4300013": 0.9956179951601455, "test/sim_max_reward_4300014": 0.8937906727349695, "test/sim_max_reward_4300015": 0.9537362910535143, "test/sim_max_reward_4300016": 0.9192762714457842, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.43002411783618294, "test/sim_max_reward_4300019": 0.18593308027924077, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.35532490777947284, "test/sim_max_reward_4300022": 0.8825139239385488, "test/sim_max_reward_4300023": 0.333684065448626, "test/sim_max_reward_4300024": 0.7771789916436855, "test/sim_max_reward_4300025": 0.9991196791940294, "test/sim_max_reward_4300026": 0.05548867765697765, "test/sim_max_reward_4300027": 0.955591109798989, "test/sim_max_reward_4300028": 0.9336282448636548, "test/sim_max_reward_4300029": 0.9018378792649526, "test/sim_max_reward_4300030": 0.0008061954690310072, "test/sim_max_reward_4300031": 0.21294785055102672, "test/sim_max_reward_4300032": 0.9322776797061122, "test/sim_max_reward_4300033": 0.6225516842653185, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.6966685859813607, "test/sim_max_reward_4300036": 0.1996078469082437, "test/sim_max_reward_4300037": 0.8952188161700679, "test/sim_max_reward_4300038": 0.9228255498583934, "test/sim_max_reward_4300039": 0.9025963163175316, "test/sim_max_reward_4300040": 1.0, "test/sim_max_reward_4300041": 0.20588913014854693, "test/sim_max_reward_4300042": 0.6938639695815569, "test/sim_max_reward_4300043": 0.950738647354651, "test/sim_max_reward_4300044": 0.9552535317217299, "test/sim_max_reward_4300045": 0.9521347234568955, "test/sim_max_reward_4300046": 0.8781159902584719, "test/sim_max_reward_4300047": 0.12515613991052416, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.2001480865286498, "train/mean_score": 0.5504272613464698, "test/mean_score": 0.6182504426288828, "val_loss": 65382.6953125} {"train_loss": -6.493430137634277, "global_step": 115542, "epoch": 2751} {"train_loss": -6.566287994384766, "global_step": 115543, "epoch": 2751} {"train_loss": -6.534889221191406, "global_step": 115544, "epoch": 2751} {"train_loss": -6.524689674377441, "global_step": 115545, "epoch": 2751} {"train_loss": -6.577869892120361, "global_step": 115546, "epoch": 2751} {"train_loss": -6.501119613647461, "global_step": 115547, "epoch": 2751} {"train_loss": -6.460816860198975, "global_step": 115548, "epoch": 2751} {"train_loss": -6.432539939880371, "global_step": 115549, "epoch": 2751} {"train_loss": -6.524340629577637, "global_step": 115550, "epoch": 2751} {"train_loss": -6.5679473876953125, "global_step": 115551, "epoch": 2751} {"train_loss": -6.563190460205078, "global_step": 115552, "epoch": 2751} {"train_loss": -6.577349662780762, "global_step": 115553, "epoch": 2751} {"train_loss": -6.441226005554199, "global_step": 115554, "epoch": 2751} {"train_loss": -6.527029991149902, "global_step": 115555, "epoch": 2751} {"train_loss": -6.578956604003906, "global_step": 115556, "epoch": 2751} {"train_loss": -6.491183280944824, "global_step": 115557, "epoch": 2751} {"train_loss": -6.616664886474609, "global_step": 115558, "epoch": 2751} {"train_loss": -6.50177001953125, "global_step": 115559, "epoch": 2751} {"train_loss": -6.512160301208496, "global_step": 115560, "epoch": 2751} {"train_loss": -6.570590019226074, "global_step": 115561, "epoch": 2751} {"train_loss": -6.474091529846191, "global_step": 115562, "epoch": 2751} {"train_loss": -6.617112636566162, "global_step": 115563, "epoch": 2751} {"train_loss": -6.545505046844482, "global_step": 115564, "epoch": 2751} {"train_loss": -6.5881547927856445, "global_step": 115565, "epoch": 2751} {"train_loss": -6.646978855133057, "global_step": 115566, "epoch": 2751} {"train_loss": -6.553040027618408, "global_step": 115567, "epoch": 2751} {"train_loss": -6.560871601104736, "global_step": 115568, "epoch": 2751} {"train_loss": -6.480574607849121, "global_step": 115569, "epoch": 2751} {"train_loss": -6.587311744689941, "global_step": 115570, "epoch": 2751} {"train_loss": -6.582732200622559, "global_step": 115571, "epoch": 2751} {"train_loss": -6.531719207763672, "global_step": 115572, "epoch": 2751} {"train_loss": -6.6138458251953125, "global_step": 115573, "epoch": 2751} {"train_loss": -6.556241989135742, "global_step": 115574, "epoch": 2751} {"train_loss": -6.558189392089844, "global_step": 115575, "epoch": 2751} {"train_loss": -6.522770404815674, "global_step": 115576, "epoch": 2751} {"train_loss": -6.471835136413574, "global_step": 115577, "epoch": 2751} {"train_loss": -6.548601150512695, "global_step": 115578, "epoch": 2751} {"train_loss": -6.596057891845703, "global_step": 115579, "epoch": 2751} {"train_loss": -6.412167072296143, "global_step": 115580, "epoch": 2751} {"train_loss": -6.455966472625732, "global_step": 115581, "epoch": 2751} {"train_loss": -6.606871604919434, "global_step": 115582, "epoch": 2751} {"train_loss": -6.540965716044108, "global_step": 115583, "epoch": 2751, "val_loss": 65536.859375} {"train_loss": -6.480424880981445, "global_step": 115584, "epoch": 2752} {"train_loss": -6.485437393188477, "global_step": 115585, "epoch": 2752} {"train_loss": -6.432405471801758, "global_step": 115586, "epoch": 2752} {"train_loss": -6.565188407897949, "global_step": 115587, "epoch": 2752} {"train_loss": -6.388599872589111, "global_step": 115588, "epoch": 2752} {"train_loss": -6.469578742980957, "global_step": 115589, "epoch": 2752} {"train_loss": -6.631330490112305, "global_step": 115590, "epoch": 2752} {"train_loss": -6.450639724731445, "global_step": 115591, "epoch": 2752} {"train_loss": -6.5898518562316895, "global_step": 115592, "epoch": 2752} {"train_loss": -6.573592185974121, "global_step": 115593, "epoch": 2752} {"train_loss": -6.447168350219727, "global_step": 115594, "epoch": 2752} {"train_loss": -6.4588727951049805, "global_step": 115595, "epoch": 2752} {"train_loss": -6.615066051483154, "global_step": 115596, "epoch": 2752} {"train_loss": -6.5000505447387695, "global_step": 115597, "epoch": 2752} {"train_loss": -6.580205917358398, "global_step": 115598, "epoch": 2752} {"train_loss": -6.536323547363281, "global_step": 115599, "epoch": 2752} {"train_loss": -6.536341190338135, "global_step": 115600, "epoch": 2752} {"train_loss": -6.51630973815918, "global_step": 115601, "epoch": 2752} {"train_loss": -6.585186004638672, "global_step": 115602, "epoch": 2752} {"train_loss": -6.588101387023926, "global_step": 115603, "epoch": 2752} {"train_loss": -6.511114597320557, "global_step": 115604, "epoch": 2752} {"train_loss": -6.580395221710205, "global_step": 115605, "epoch": 2752} {"train_loss": -6.585142135620117, "global_step": 115606, "epoch": 2752} {"train_loss": -6.5288543701171875, "global_step": 115607, "epoch": 2752} {"train_loss": -6.594095706939697, "global_step": 115608, "epoch": 2752} {"train_loss": -6.520236015319824, "global_step": 115609, "epoch": 2752} {"train_loss": -6.428472518920898, "global_step": 115610, "epoch": 2752} {"train_loss": -6.528373718261719, "global_step": 115611, "epoch": 2752} {"train_loss": -6.458837509155273, "global_step": 115612, "epoch": 2752} {"train_loss": -6.504378318786621, "global_step": 115613, "epoch": 2752} {"train_loss": -6.550103187561035, "global_step": 115614, "epoch": 2752} {"train_loss": -6.577332019805908, "global_step": 115615, "epoch": 2752} {"train_loss": -6.565279960632324, "global_step": 115616, "epoch": 2752} {"train_loss": -6.538311004638672, "global_step": 115617, "epoch": 2752} {"train_loss": -6.483543395996094, "global_step": 115618, "epoch": 2752} {"train_loss": -6.5475029945373535, "global_step": 115619, "epoch": 2752} {"train_loss": -6.51231050491333, "global_step": 115620, "epoch": 2752} {"train_loss": -6.5523786544799805, "global_step": 115621, "epoch": 2752} {"train_loss": -6.561184883117676, "global_step": 115622, "epoch": 2752} {"train_loss": -6.480794429779053, "global_step": 115623, "epoch": 2752} {"train_loss": -6.540999889373779, "global_step": 115624, "epoch": 2752} {"train_loss": -6.525654009410313, "global_step": 115625, "epoch": 2752, "val_loss": 65296.5} {"train_loss": -6.564397811889648, "global_step": 115626, "epoch": 2753} {"train_loss": -6.545788764953613, "global_step": 115627, "epoch": 2753} {"train_loss": -6.5693159103393555, "global_step": 115628, "epoch": 2753} {"train_loss": -6.572940826416016, "global_step": 115629, "epoch": 2753} {"train_loss": -6.524039268493652, "global_step": 115630, "epoch": 2753} {"train_loss": -6.519062042236328, "global_step": 115631, "epoch": 2753} {"train_loss": -6.491872787475586, "global_step": 115632, "epoch": 2753} {"train_loss": -6.652979373931885, "global_step": 115633, "epoch": 2753} {"train_loss": -6.645714282989502, "global_step": 115634, "epoch": 2753} {"train_loss": -6.573812007904053, "global_step": 115635, "epoch": 2753} {"train_loss": -6.641751289367676, "global_step": 115636, "epoch": 2753} {"train_loss": -6.573517799377441, "global_step": 115637, "epoch": 2753} {"train_loss": -6.546354293823242, "global_step": 115638, "epoch": 2753} {"train_loss": -6.5324482917785645, "global_step": 115639, "epoch": 2753} {"train_loss": -6.588231086730957, "global_step": 115640, "epoch": 2753} {"train_loss": -6.492158889770508, "global_step": 115641, "epoch": 2753} {"train_loss": -6.438686370849609, "global_step": 115642, "epoch": 2753} {"train_loss": -6.62440824508667, "global_step": 115643, "epoch": 2753} {"train_loss": -6.563715934753418, "global_step": 115644, "epoch": 2753} {"train_loss": -6.560660362243652, "global_step": 115645, "epoch": 2753} {"train_loss": -6.691836357116699, "global_step": 115646, "epoch": 2753} {"train_loss": -6.564018726348877, "global_step": 115647, "epoch": 2753} {"train_loss": -6.518441200256348, "global_step": 115648, "epoch": 2753} {"train_loss": -6.53176212310791, "global_step": 115649, "epoch": 2753} {"train_loss": -6.511910915374756, "global_step": 115650, "epoch": 2753} {"train_loss": -6.499086380004883, "global_step": 115651, "epoch": 2753} {"train_loss": -6.445769309997559, "global_step": 115652, "epoch": 2753} {"train_loss": -6.611554145812988, "global_step": 115653, "epoch": 2753} {"train_loss": -6.446920394897461, "global_step": 115654, "epoch": 2753} {"train_loss": -6.389617443084717, "global_step": 115655, "epoch": 2753} {"train_loss": -6.528850555419922, "global_step": 115656, "epoch": 2753} {"train_loss": -6.491400718688965, "global_step": 115657, "epoch": 2753} {"train_loss": -6.385437965393066, "global_step": 115658, "epoch": 2753} {"train_loss": -6.567626953125, "global_step": 115659, "epoch": 2753} {"train_loss": -6.4876580238342285, "global_step": 115660, "epoch": 2753} {"train_loss": -6.429159164428711, "global_step": 115661, "epoch": 2753} {"train_loss": -6.433246612548828, "global_step": 115662, "epoch": 2753} {"train_loss": -6.448449611663818, "global_step": 115663, "epoch": 2753} {"train_loss": -6.581418991088867, "global_step": 115664, "epoch": 2753} {"train_loss": -6.309536933898926, "global_step": 115665, "epoch": 2753} {"train_loss": -6.476778984069824, "global_step": 115666, "epoch": 2753} {"train_loss": -6.525284358433315, "global_step": 115667, "epoch": 2753, "val_loss": 65330.37109375} {"train_loss": -6.518351078033447, "global_step": 115668, "epoch": 2754} {"train_loss": -6.484745979309082, "global_step": 115669, "epoch": 2754} {"train_loss": -6.479485988616943, "global_step": 115670, "epoch": 2754} {"train_loss": -6.491813659667969, "global_step": 115671, "epoch": 2754} {"train_loss": -6.44378662109375, "global_step": 115672, "epoch": 2754} {"train_loss": -6.519474983215332, "global_step": 115673, "epoch": 2754} {"train_loss": -6.382016658782959, "global_step": 115674, "epoch": 2754} {"train_loss": -6.354313850402832, "global_step": 115675, "epoch": 2754} {"train_loss": -6.492668151855469, "global_step": 115676, "epoch": 2754} {"train_loss": -6.43602991104126, "global_step": 115677, "epoch": 2754} {"train_loss": -6.462536334991455, "global_step": 115678, "epoch": 2754} {"train_loss": -6.462613582611084, "global_step": 115679, "epoch": 2754} {"train_loss": -6.478682518005371, "global_step": 115680, "epoch": 2754} {"train_loss": -6.484431743621826, "global_step": 115681, "epoch": 2754} {"train_loss": -6.330375671386719, "global_step": 115682, "epoch": 2754} {"train_loss": -6.538208961486816, "global_step": 115683, "epoch": 2754} {"train_loss": -6.498639106750488, "global_step": 115684, "epoch": 2754} {"train_loss": -6.447920799255371, "global_step": 115685, "epoch": 2754} {"train_loss": -6.443244934082031, "global_step": 115686, "epoch": 2754} {"train_loss": -6.445213317871094, "global_step": 115687, "epoch": 2754} {"train_loss": -6.54679012298584, "global_step": 115688, "epoch": 2754} {"train_loss": -6.404418468475342, "global_step": 115689, "epoch": 2754} {"train_loss": -6.482486248016357, "global_step": 115690, "epoch": 2754} {"train_loss": -6.452486991882324, "global_step": 115691, "epoch": 2754} {"train_loss": -6.489258766174316, "global_step": 115692, "epoch": 2754} {"train_loss": -6.346768379211426, "global_step": 115693, "epoch": 2754} {"train_loss": -6.529356002807617, "global_step": 115694, "epoch": 2754} {"train_loss": -6.511075496673584, "global_step": 115695, "epoch": 2754} {"train_loss": -6.38677978515625, "global_step": 115696, "epoch": 2754} {"train_loss": -6.5297698974609375, "global_step": 115697, "epoch": 2754} {"train_loss": -6.645848274230957, "global_step": 115698, "epoch": 2754} {"train_loss": -6.3994832038879395, "global_step": 115699, "epoch": 2754} {"train_loss": -6.610190391540527, "global_step": 115700, "epoch": 2754} {"train_loss": -6.38936185836792, "global_step": 115701, "epoch": 2754} {"train_loss": -6.395033836364746, "global_step": 115702, "epoch": 2754} {"train_loss": -6.551843643188477, "global_step": 115703, "epoch": 2754} {"train_loss": -6.356695175170898, "global_step": 115704, "epoch": 2754} {"train_loss": -6.556899070739746, "global_step": 115705, "epoch": 2754} {"train_loss": -6.383888244628906, "global_step": 115706, "epoch": 2754} {"train_loss": -6.472977638244629, "global_step": 115707, "epoch": 2754} {"train_loss": -6.550851821899414, "global_step": 115708, "epoch": 2754} {"train_loss": -6.4673965771993, "global_step": 115709, "epoch": 2754, "val_loss": 65367.75} {"train_loss": -6.57685661315918, "global_step": 115710, "epoch": 2755} {"train_loss": -6.551624774932861, "global_step": 115711, "epoch": 2755} {"train_loss": -6.486644744873047, "global_step": 115712, "epoch": 2755} {"train_loss": -6.573718547821045, "global_step": 115713, "epoch": 2755} {"train_loss": -6.661699295043945, "global_step": 115714, "epoch": 2755} {"train_loss": -6.500248908996582, "global_step": 115715, "epoch": 2755} {"train_loss": -6.588263511657715, "global_step": 115716, "epoch": 2755} {"train_loss": -6.434083938598633, "global_step": 115717, "epoch": 2755} {"train_loss": -6.594538688659668, "global_step": 115718, "epoch": 2755} {"train_loss": -6.485057830810547, "global_step": 115719, "epoch": 2755} {"train_loss": -6.519537925720215, "global_step": 115720, "epoch": 2755} {"train_loss": -6.593642711639404, "global_step": 115721, "epoch": 2755} {"train_loss": -6.473517417907715, "global_step": 115722, "epoch": 2755} {"train_loss": -6.5427446365356445, "global_step": 115723, "epoch": 2755} {"train_loss": -6.5422210693359375, "global_step": 115724, "epoch": 2755} {"train_loss": -6.498830318450928, "global_step": 115725, "epoch": 2755} {"train_loss": -6.5791521072387695, "global_step": 115726, "epoch": 2755} {"train_loss": -6.524783134460449, "global_step": 115727, "epoch": 2755} {"train_loss": -6.559689521789551, "global_step": 115728, "epoch": 2755} {"train_loss": -6.498437881469727, "global_step": 115729, "epoch": 2755} {"train_loss": -6.512127876281738, "global_step": 115730, "epoch": 2755} {"train_loss": -6.594045639038086, "global_step": 115731, "epoch": 2755} {"train_loss": -6.475900173187256, "global_step": 115732, "epoch": 2755} {"train_loss": -6.511016845703125, "global_step": 115733, "epoch": 2755} {"train_loss": -6.4359612464904785, "global_step": 115734, "epoch": 2755} {"train_loss": -6.569536209106445, "global_step": 115735, "epoch": 2755} {"train_loss": -6.530573844909668, "global_step": 115736, "epoch": 2755} {"train_loss": -6.54063606262207, "global_step": 115737, "epoch": 2755} {"train_loss": -6.455463409423828, "global_step": 115738, "epoch": 2755} {"train_loss": -6.473740577697754, "global_step": 115739, "epoch": 2755} {"train_loss": -6.476106643676758, "global_step": 115740, "epoch": 2755} {"train_loss": -6.4332756996154785, "global_step": 115741, "epoch": 2755} {"train_loss": -6.424306869506836, "global_step": 115742, "epoch": 2755} {"train_loss": -6.504739761352539, "global_step": 115743, "epoch": 2755} {"train_loss": -6.504009246826172, "global_step": 115744, "epoch": 2755} {"train_loss": -6.496867656707764, "global_step": 115745, "epoch": 2755} {"train_loss": -6.408041000366211, "global_step": 115746, "epoch": 2755} {"train_loss": -6.5576276779174805, "global_step": 115747, "epoch": 2755} {"train_loss": -6.411095142364502, "global_step": 115748, "epoch": 2755} {"train_loss": -6.483664512634277, "global_step": 115749, "epoch": 2755} {"train_loss": -6.534402847290039, "global_step": 115750, "epoch": 2755} {"train_loss": -6.512315398170834, "global_step": 115751, "epoch": 2755, "val_loss": 65422.15234375} {"train_loss": -6.56577205657959, "global_step": 115752, "epoch": 2756} {"train_loss": -6.508620262145996, "global_step": 115753, "epoch": 2756} {"train_loss": -6.529268264770508, "global_step": 115754, "epoch": 2756} {"train_loss": -6.466727256774902, "global_step": 115755, "epoch": 2756} {"train_loss": -6.596412181854248, "global_step": 115756, "epoch": 2756} {"train_loss": -6.450604438781738, "global_step": 115757, "epoch": 2756} {"train_loss": -6.485986709594727, "global_step": 115758, "epoch": 2756} {"train_loss": -6.546613693237305, "global_step": 115759, "epoch": 2756} {"train_loss": -6.418912410736084, "global_step": 115760, "epoch": 2756} {"train_loss": -6.588316440582275, "global_step": 115761, "epoch": 2756} {"train_loss": -6.433149337768555, "global_step": 115762, "epoch": 2756} {"train_loss": -6.538148880004883, "global_step": 115763, "epoch": 2756} {"train_loss": -6.632507801055908, "global_step": 115764, "epoch": 2756} {"train_loss": -6.559411525726318, "global_step": 115765, "epoch": 2756} {"train_loss": -6.489684104919434, "global_step": 115766, "epoch": 2756} {"train_loss": -6.531900405883789, "global_step": 115767, "epoch": 2756} {"train_loss": -6.471693992614746, "global_step": 115768, "epoch": 2756} {"train_loss": -6.512962341308594, "global_step": 115769, "epoch": 2756} {"train_loss": -6.492299556732178, "global_step": 115770, "epoch": 2756} {"train_loss": -6.458405494689941, "global_step": 115771, "epoch": 2756} {"train_loss": -6.583492755889893, "global_step": 115772, "epoch": 2756} {"train_loss": -6.5838823318481445, "global_step": 115773, "epoch": 2756} {"train_loss": -6.546749114990234, "global_step": 115774, "epoch": 2756} {"train_loss": -6.528684139251709, "global_step": 115775, "epoch": 2756} {"train_loss": -6.476041793823242, "global_step": 115776, "epoch": 2756} {"train_loss": -6.4842119216918945, "global_step": 115777, "epoch": 2756} {"train_loss": -6.541871547698975, "global_step": 115778, "epoch": 2756} {"train_loss": -6.513513565063477, "global_step": 115779, "epoch": 2756} {"train_loss": -6.654268264770508, "global_step": 115780, "epoch": 2756} {"train_loss": -6.556659698486328, "global_step": 115781, "epoch": 2756} {"train_loss": -6.482227325439453, "global_step": 115782, "epoch": 2756} {"train_loss": -6.487480163574219, "global_step": 115783, "epoch": 2756} {"train_loss": -6.527505874633789, "global_step": 115784, "epoch": 2756} {"train_loss": -6.515588760375977, "global_step": 115785, "epoch": 2756} {"train_loss": -6.663758277893066, "global_step": 115786, "epoch": 2756} {"train_loss": -6.441277027130127, "global_step": 115787, "epoch": 2756} {"train_loss": -6.527616024017334, "global_step": 115788, "epoch": 2756} {"train_loss": -6.592620372772217, "global_step": 115789, "epoch": 2756} {"train_loss": -6.492005348205566, "global_step": 115790, "epoch": 2756} {"train_loss": -6.394604682922363, "global_step": 115791, "epoch": 2756} {"train_loss": -6.617698669433594, "global_step": 115792, "epoch": 2756} {"train_loss": -6.526719059262957, "global_step": 115793, "epoch": 2756, "val_loss": 65354.79296875} {"train_loss": -6.482151985168457, "global_step": 115794, "epoch": 2757} {"train_loss": -6.565999984741211, "global_step": 115795, "epoch": 2757} {"train_loss": -6.465053558349609, "global_step": 115796, "epoch": 2757} {"train_loss": -6.548815727233887, "global_step": 115797, "epoch": 2757} {"train_loss": -6.461093425750732, "global_step": 115798, "epoch": 2757} {"train_loss": -6.5258097648620605, "global_step": 115799, "epoch": 2757} {"train_loss": -6.539698123931885, "global_step": 115800, "epoch": 2757} {"train_loss": -6.300044536590576, "global_step": 115801, "epoch": 2757} {"train_loss": -6.477005481719971, "global_step": 115802, "epoch": 2757} {"train_loss": -6.295855522155762, "global_step": 115803, "epoch": 2757} {"train_loss": -6.294477462768555, "global_step": 115804, "epoch": 2757} {"train_loss": -6.5740742683410645, "global_step": 115805, "epoch": 2757} {"train_loss": -6.372175216674805, "global_step": 115806, "epoch": 2757} {"train_loss": -6.432611465454102, "global_step": 115807, "epoch": 2757} {"train_loss": -6.469500541687012, "global_step": 115808, "epoch": 2757} {"train_loss": -6.404197692871094, "global_step": 115809, "epoch": 2757} {"train_loss": -6.5843048095703125, "global_step": 115810, "epoch": 2757} {"train_loss": -6.3920578956604, "global_step": 115811, "epoch": 2757} {"train_loss": -6.552990913391113, "global_step": 115812, "epoch": 2757} {"train_loss": -6.5108513832092285, "global_step": 115813, "epoch": 2757} {"train_loss": -6.520096778869629, "global_step": 115814, "epoch": 2757} {"train_loss": -6.538930416107178, "global_step": 115815, "epoch": 2757} {"train_loss": -6.443018913269043, "global_step": 115816, "epoch": 2757} {"train_loss": -6.618363380432129, "global_step": 115817, "epoch": 2757} {"train_loss": -6.643909454345703, "global_step": 115818, "epoch": 2757} {"train_loss": -6.538163185119629, "global_step": 115819, "epoch": 2757} {"train_loss": -6.575211524963379, "global_step": 115820, "epoch": 2757} {"train_loss": -6.572696685791016, "global_step": 115821, "epoch": 2757} {"train_loss": -6.458849906921387, "global_step": 115822, "epoch": 2757} {"train_loss": -6.526316165924072, "global_step": 115823, "epoch": 2757} {"train_loss": -6.443902969360352, "global_step": 115824, "epoch": 2757} {"train_loss": -6.475666046142578, "global_step": 115825, "epoch": 2757} {"train_loss": -6.611627578735352, "global_step": 115826, "epoch": 2757} {"train_loss": -6.5973286628723145, "global_step": 115827, "epoch": 2757} {"train_loss": -6.629101753234863, "global_step": 115828, "epoch": 2757} {"train_loss": -6.51137638092041, "global_step": 115829, "epoch": 2757} {"train_loss": -6.435022830963135, "global_step": 115830, "epoch": 2757} {"train_loss": -6.443713188171387, "global_step": 115831, "epoch": 2757} {"train_loss": -6.471966743469238, "global_step": 115832, "epoch": 2757} {"train_loss": -6.508977890014648, "global_step": 115833, "epoch": 2757} {"train_loss": -6.519197463989258, "global_step": 115834, "epoch": 2757} {"train_loss": -6.495593411581857, "global_step": 115835, "epoch": 2757, "val_loss": 65351.4453125} {"train_loss": -6.567850589752197, "global_step": 115836, "epoch": 2758} {"train_loss": -6.5418620109558105, "global_step": 115837, "epoch": 2758} {"train_loss": -6.570589065551758, "global_step": 115838, "epoch": 2758} {"train_loss": -6.512725830078125, "global_step": 115839, "epoch": 2758} {"train_loss": -6.469464302062988, "global_step": 115840, "epoch": 2758} {"train_loss": -6.572662353515625, "global_step": 115841, "epoch": 2758} {"train_loss": -6.492183685302734, "global_step": 115842, "epoch": 2758} {"train_loss": -6.60524320602417, "global_step": 115843, "epoch": 2758} {"train_loss": -6.557425498962402, "global_step": 115844, "epoch": 2758} {"train_loss": -6.42212438583374, "global_step": 115845, "epoch": 2758} {"train_loss": -6.616781234741211, "global_step": 115846, "epoch": 2758} {"train_loss": -6.434640407562256, "global_step": 115847, "epoch": 2758} {"train_loss": -6.3914713859558105, "global_step": 115848, "epoch": 2758} {"train_loss": -6.565408706665039, "global_step": 115849, "epoch": 2758} {"train_loss": -6.5711774826049805, "global_step": 115850, "epoch": 2758} {"train_loss": -6.480095863342285, "global_step": 115851, "epoch": 2758} {"train_loss": -6.512378692626953, "global_step": 115852, "epoch": 2758} {"train_loss": -6.4932708740234375, "global_step": 115853, "epoch": 2758} {"train_loss": -6.491669654846191, "global_step": 115854, "epoch": 2758} {"train_loss": -6.420088768005371, "global_step": 115855, "epoch": 2758} {"train_loss": -6.490927219390869, "global_step": 115856, "epoch": 2758} {"train_loss": -6.28647518157959, "global_step": 115857, "epoch": 2758} {"train_loss": -6.54011344909668, "global_step": 115858, "epoch": 2758} {"train_loss": -6.520735740661621, "global_step": 115859, "epoch": 2758} {"train_loss": -6.368027687072754, "global_step": 115860, "epoch": 2758} {"train_loss": -6.624290466308594, "global_step": 115861, "epoch": 2758} {"train_loss": -6.432082653045654, "global_step": 115862, "epoch": 2758} {"train_loss": -6.472682952880859, "global_step": 115863, "epoch": 2758} {"train_loss": -6.615121841430664, "global_step": 115864, "epoch": 2758} {"train_loss": -6.535239219665527, "global_step": 115865, "epoch": 2758} {"train_loss": -6.3909831047058105, "global_step": 115866, "epoch": 2758} {"train_loss": -6.538097858428955, "global_step": 115867, "epoch": 2758} {"train_loss": -6.453609466552734, "global_step": 115868, "epoch": 2758} {"train_loss": -6.462640285491943, "global_step": 115869, "epoch": 2758} {"train_loss": -6.449771881103516, "global_step": 115870, "epoch": 2758} {"train_loss": -6.460300922393799, "global_step": 115871, "epoch": 2758} {"train_loss": -6.5621137619018555, "global_step": 115872, "epoch": 2758} {"train_loss": -6.347817420959473, "global_step": 115873, "epoch": 2758} {"train_loss": -6.567041397094727, "global_step": 115874, "epoch": 2758} {"train_loss": -6.577267169952393, "global_step": 115875, "epoch": 2758} {"train_loss": -6.485771179199219, "global_step": 115876, "epoch": 2758} {"train_loss": -6.500163430259342, "global_step": 115877, "epoch": 2758, "val_loss": 65467.6953125} {"train_loss": -6.527560234069824, "global_step": 115878, "epoch": 2759} {"train_loss": -6.513576030731201, "global_step": 115879, "epoch": 2759} {"train_loss": -6.554760932922363, "global_step": 115880, "epoch": 2759} {"train_loss": -6.523481369018555, "global_step": 115881, "epoch": 2759} {"train_loss": -6.4894280433654785, "global_step": 115882, "epoch": 2759} {"train_loss": -6.547371864318848, "global_step": 115883, "epoch": 2759} {"train_loss": -6.537174701690674, "global_step": 115884, "epoch": 2759} {"train_loss": -6.446673393249512, "global_step": 115885, "epoch": 2759} {"train_loss": -6.537594795227051, "global_step": 115886, "epoch": 2759} {"train_loss": -6.458383083343506, "global_step": 115887, "epoch": 2759} {"train_loss": -6.557772159576416, "global_step": 115888, "epoch": 2759} {"train_loss": -6.509150505065918, "global_step": 115889, "epoch": 2759} {"train_loss": -6.627865791320801, "global_step": 115890, "epoch": 2759} {"train_loss": -6.430983066558838, "global_step": 115891, "epoch": 2759} {"train_loss": -6.41139554977417, "global_step": 115892, "epoch": 2759} {"train_loss": -6.396405220031738, "global_step": 115893, "epoch": 2759} {"train_loss": -6.443861484527588, "global_step": 115894, "epoch": 2759} {"train_loss": -6.431373596191406, "global_step": 115895, "epoch": 2759} {"train_loss": -6.422434329986572, "global_step": 115896, "epoch": 2759} {"train_loss": -6.465409278869629, "global_step": 115897, "epoch": 2759} {"train_loss": -6.469086647033691, "global_step": 115898, "epoch": 2759} {"train_loss": -6.446718215942383, "global_step": 115899, "epoch": 2759} {"train_loss": -6.442922592163086, "global_step": 115900, "epoch": 2759} {"train_loss": -6.446682929992676, "global_step": 115901, "epoch": 2759} {"train_loss": -6.523754119873047, "global_step": 115902, "epoch": 2759} {"train_loss": -6.556371688842773, "global_step": 115903, "epoch": 2759} {"train_loss": -6.420693397521973, "global_step": 115904, "epoch": 2759} {"train_loss": -6.441393852233887, "global_step": 115905, "epoch": 2759} {"train_loss": -6.551455497741699, "global_step": 115906, "epoch": 2759} {"train_loss": -6.497712135314941, "global_step": 115907, "epoch": 2759} {"train_loss": -6.491627216339111, "global_step": 115908, "epoch": 2759} {"train_loss": -6.460475921630859, "global_step": 115909, "epoch": 2759} {"train_loss": -6.420500755310059, "global_step": 115910, "epoch": 2759} {"train_loss": -6.57797908782959, "global_step": 115911, "epoch": 2759} {"train_loss": -6.489201068878174, "global_step": 115912, "epoch": 2759} {"train_loss": -6.408111572265625, "global_step": 115913, "epoch": 2759} {"train_loss": -6.524847984313965, "global_step": 115914, "epoch": 2759} {"train_loss": -6.521587371826172, "global_step": 115915, "epoch": 2759} {"train_loss": -6.4574294090271, "global_step": 115916, "epoch": 2759} {"train_loss": -6.432553291320801, "global_step": 115917, "epoch": 2759} {"train_loss": -6.490045070648193, "global_step": 115918, "epoch": 2759} {"train_loss": -6.487722987220401, "global_step": 115919, "epoch": 2759, "val_loss": 65394.03125} {"train_loss": -6.504182815551758, "global_step": 115920, "epoch": 2760} {"train_loss": -6.467373847961426, "global_step": 115921, "epoch": 2760} {"train_loss": -6.631972789764404, "global_step": 115922, "epoch": 2760} {"train_loss": -6.410329818725586, "global_step": 115923, "epoch": 2760} {"train_loss": -6.494969367980957, "global_step": 115924, "epoch": 2760} {"train_loss": -6.627799987792969, "global_step": 115925, "epoch": 2760} {"train_loss": -6.522945404052734, "global_step": 115926, "epoch": 2760} {"train_loss": -6.568312168121338, "global_step": 115927, "epoch": 2760} {"train_loss": -6.605830192565918, "global_step": 115928, "epoch": 2760} {"train_loss": -6.5530500411987305, "global_step": 115929, "epoch": 2760} {"train_loss": -6.645887851715088, "global_step": 115930, "epoch": 2760} {"train_loss": -6.4657487869262695, "global_step": 115931, "epoch": 2760} {"train_loss": -6.597285270690918, "global_step": 115932, "epoch": 2760} {"train_loss": -6.622262477874756, "global_step": 115933, "epoch": 2760} {"train_loss": -6.5857768058776855, "global_step": 115934, "epoch": 2760} {"train_loss": -6.486618995666504, "global_step": 115935, "epoch": 2760} {"train_loss": -6.625500679016113, "global_step": 115936, "epoch": 2760} {"train_loss": -6.549561977386475, "global_step": 115937, "epoch": 2760} {"train_loss": -6.501237869262695, "global_step": 115938, "epoch": 2760} {"train_loss": -6.489770889282227, "global_step": 115939, "epoch": 2760} {"train_loss": -6.628147125244141, "global_step": 115940, "epoch": 2760} {"train_loss": -6.544943809509277, "global_step": 115941, "epoch": 2760} {"train_loss": -6.580652713775635, "global_step": 115942, "epoch": 2760} {"train_loss": -6.552641868591309, "global_step": 115943, "epoch": 2760} {"train_loss": -6.565155029296875, "global_step": 115944, "epoch": 2760} {"train_loss": -6.580136775970459, "global_step": 115945, "epoch": 2760} {"train_loss": -6.540143966674805, "global_step": 115946, "epoch": 2760} {"train_loss": -6.574427127838135, "global_step": 115947, "epoch": 2760} {"train_loss": -6.541204452514648, "global_step": 115948, "epoch": 2760} {"train_loss": -6.603015899658203, "global_step": 115949, "epoch": 2760} {"train_loss": -6.560309410095215, "global_step": 115950, "epoch": 2760} {"train_loss": -6.53703498840332, "global_step": 115951, "epoch": 2760} {"train_loss": -6.4873456954956055, "global_step": 115952, "epoch": 2760} {"train_loss": -6.494474411010742, "global_step": 115953, "epoch": 2760} {"train_loss": -6.57696533203125, "global_step": 115954, "epoch": 2760} {"train_loss": -6.671816825866699, "global_step": 115955, "epoch": 2760} {"train_loss": -6.585087299346924, "global_step": 115956, "epoch": 2760} {"train_loss": -6.485191345214844, "global_step": 115957, "epoch": 2760} {"train_loss": -6.576653003692627, "global_step": 115958, "epoch": 2760} {"train_loss": -6.513398170471191, "global_step": 115959, "epoch": 2760} {"train_loss": -6.543670177459717, "global_step": 115960, "epoch": 2760} {"train_loss": -6.554566383361816, "global_step": 115961, "epoch": 2760, "val_loss": 65255.83984375} {"train_loss": -6.528413772583008, "global_step": 115962, "epoch": 2761} {"train_loss": -6.546876907348633, "global_step": 115963, "epoch": 2761} {"train_loss": -6.6215925216674805, "global_step": 115964, "epoch": 2761} {"train_loss": -6.61402702331543, "global_step": 115965, "epoch": 2761} {"train_loss": -6.512394428253174, "global_step": 115966, "epoch": 2761} {"train_loss": -6.5402913093566895, "global_step": 115967, "epoch": 2761} {"train_loss": -6.539388179779053, "global_step": 115968, "epoch": 2761} {"train_loss": -6.5022759437561035, "global_step": 115969, "epoch": 2761} {"train_loss": -6.53810453414917, "global_step": 115970, "epoch": 2761} {"train_loss": -6.557343006134033, "global_step": 115971, "epoch": 2761} {"train_loss": -6.607109069824219, "global_step": 115972, "epoch": 2761} {"train_loss": -6.554411888122559, "global_step": 115973, "epoch": 2761} {"train_loss": -6.4499125480651855, "global_step": 115974, "epoch": 2761} {"train_loss": -6.71639347076416, "global_step": 115975, "epoch": 2761} {"train_loss": -6.578855991363525, "global_step": 115976, "epoch": 2761} {"train_loss": -6.57676887512207, "global_step": 115977, "epoch": 2761} {"train_loss": -6.508810043334961, "global_step": 115978, "epoch": 2761} {"train_loss": -6.514832496643066, "global_step": 115979, "epoch": 2761} {"train_loss": -6.564582347869873, "global_step": 115980, "epoch": 2761} {"train_loss": -6.5677170753479, "global_step": 115981, "epoch": 2761} {"train_loss": -6.50158166885376, "global_step": 115982, "epoch": 2761} {"train_loss": -6.5283403396606445, "global_step": 115983, "epoch": 2761} {"train_loss": -6.510971546173096, "global_step": 115984, "epoch": 2761} {"train_loss": -6.667231559753418, "global_step": 115985, "epoch": 2761} {"train_loss": -6.479491710662842, "global_step": 115986, "epoch": 2761} {"train_loss": -6.536637306213379, "global_step": 115987, "epoch": 2761} {"train_loss": -6.525042533874512, "global_step": 115988, "epoch": 2761} {"train_loss": -6.523212432861328, "global_step": 115989, "epoch": 2761} {"train_loss": -6.504159927368164, "global_step": 115990, "epoch": 2761} {"train_loss": -6.517543792724609, "global_step": 115991, "epoch": 2761} {"train_loss": -6.598482131958008, "global_step": 115992, "epoch": 2761} {"train_loss": -6.405734062194824, "global_step": 115993, "epoch": 2761} {"train_loss": -6.5258660316467285, "global_step": 115994, "epoch": 2761} {"train_loss": -6.671115398406982, "global_step": 115995, "epoch": 2761} {"train_loss": -6.511496543884277, "global_step": 115996, "epoch": 2761} {"train_loss": -6.339877128601074, "global_step": 115997, "epoch": 2761} {"train_loss": -6.483681678771973, "global_step": 115998, "epoch": 2761} {"train_loss": -6.6051788330078125, "global_step": 115999, "epoch": 2761} {"train_loss": -6.341483116149902, "global_step": 116000, "epoch": 2761} {"train_loss": -6.511471748352051, "global_step": 116001, "epoch": 2761} {"train_loss": -6.4999494552612305, "global_step": 116002, "epoch": 2761} {"train_loss": -6.534137986955189, "global_step": 116003, "epoch": 2761, "val_loss": 65452.87890625} {"train_loss": -6.576906204223633, "global_step": 116004, "epoch": 2762} {"train_loss": -6.525956630706787, "global_step": 116005, "epoch": 2762} {"train_loss": -6.530786991119385, "global_step": 116006, "epoch": 2762} {"train_loss": -6.523458480834961, "global_step": 116007, "epoch": 2762} {"train_loss": -6.373653888702393, "global_step": 116008, "epoch": 2762} {"train_loss": -6.414793014526367, "global_step": 116009, "epoch": 2762} {"train_loss": -6.496535778045654, "global_step": 116010, "epoch": 2762} {"train_loss": -6.569962501525879, "global_step": 116011, "epoch": 2762} {"train_loss": -6.626384258270264, "global_step": 116012, "epoch": 2762} {"train_loss": -6.404348850250244, "global_step": 116013, "epoch": 2762} {"train_loss": -6.53411865234375, "global_step": 116014, "epoch": 2762} {"train_loss": -6.580890655517578, "global_step": 116015, "epoch": 2762} {"train_loss": -6.481387138366699, "global_step": 116016, "epoch": 2762} {"train_loss": -6.558129787445068, "global_step": 116017, "epoch": 2762} {"train_loss": -6.424781322479248, "global_step": 116018, "epoch": 2762} {"train_loss": -6.541237831115723, "global_step": 116019, "epoch": 2762} {"train_loss": -6.381769180297852, "global_step": 116020, "epoch": 2762} {"train_loss": -6.554686546325684, "global_step": 116021, "epoch": 2762} {"train_loss": -6.482717037200928, "global_step": 116022, "epoch": 2762} {"train_loss": -6.495735168457031, "global_step": 116023, "epoch": 2762} {"train_loss": -6.630708694458008, "global_step": 116024, "epoch": 2762} {"train_loss": -6.37306022644043, "global_step": 116025, "epoch": 2762} {"train_loss": -6.3915839195251465, "global_step": 116026, "epoch": 2762} {"train_loss": -6.562989711761475, "global_step": 116027, "epoch": 2762} {"train_loss": -6.532379150390625, "global_step": 116028, "epoch": 2762} {"train_loss": -6.518216133117676, "global_step": 116029, "epoch": 2762} {"train_loss": -6.544065475463867, "global_step": 116030, "epoch": 2762} {"train_loss": -6.528962135314941, "global_step": 116031, "epoch": 2762} {"train_loss": -6.563510894775391, "global_step": 116032, "epoch": 2762} {"train_loss": -6.535372257232666, "global_step": 116033, "epoch": 2762} {"train_loss": -6.599177360534668, "global_step": 116034, "epoch": 2762} {"train_loss": -6.575808525085449, "global_step": 116035, "epoch": 2762} {"train_loss": -6.6063690185546875, "global_step": 116036, "epoch": 2762} {"train_loss": -6.579883575439453, "global_step": 116037, "epoch": 2762} {"train_loss": -6.487844467163086, "global_step": 116038, "epoch": 2762} {"train_loss": -6.574546813964844, "global_step": 116039, "epoch": 2762} {"train_loss": -6.561907768249512, "global_step": 116040, "epoch": 2762} {"train_loss": -6.5573577880859375, "global_step": 116041, "epoch": 2762} {"train_loss": -6.597329139709473, "global_step": 116042, "epoch": 2762} {"train_loss": -6.495206832885742, "global_step": 116043, "epoch": 2762} {"train_loss": -6.382286548614502, "global_step": 116044, "epoch": 2762} {"train_loss": -6.520181962421963, "global_step": 116045, "epoch": 2762, "val_loss": 65496.6875} {"train_loss": -6.46895694732666, "global_step": 116046, "epoch": 2763} {"train_loss": -6.601253986358643, "global_step": 116047, "epoch": 2763} {"train_loss": -6.410435676574707, "global_step": 116048, "epoch": 2763} {"train_loss": -6.408215522766113, "global_step": 116049, "epoch": 2763} {"train_loss": -6.540828704833984, "global_step": 116050, "epoch": 2763} {"train_loss": -6.3496246337890625, "global_step": 116051, "epoch": 2763} {"train_loss": -6.475667476654053, "global_step": 116052, "epoch": 2763} {"train_loss": -6.4368577003479, "global_step": 116053, "epoch": 2763} {"train_loss": -6.480990409851074, "global_step": 116054, "epoch": 2763} {"train_loss": -6.580833435058594, "global_step": 116055, "epoch": 2763} {"train_loss": -6.446314334869385, "global_step": 116056, "epoch": 2763} {"train_loss": -6.446130275726318, "global_step": 116057, "epoch": 2763} {"train_loss": -6.618236541748047, "global_step": 116058, "epoch": 2763} {"train_loss": -6.5219268798828125, "global_step": 116059, "epoch": 2763} {"train_loss": -6.540549278259277, "global_step": 116060, "epoch": 2763} {"train_loss": -6.476754665374756, "global_step": 116061, "epoch": 2763} {"train_loss": -6.588462829589844, "global_step": 116062, "epoch": 2763} {"train_loss": -6.527446746826172, "global_step": 116063, "epoch": 2763} {"train_loss": -6.515472412109375, "global_step": 116064, "epoch": 2763} {"train_loss": -6.468277931213379, "global_step": 116065, "epoch": 2763} {"train_loss": -6.7207441329956055, "global_step": 116066, "epoch": 2763} {"train_loss": -6.523709297180176, "global_step": 116067, "epoch": 2763} {"train_loss": -6.553465843200684, "global_step": 116068, "epoch": 2763} {"train_loss": -6.645112037658691, "global_step": 116069, "epoch": 2763} {"train_loss": -6.551249980926514, "global_step": 116070, "epoch": 2763} {"train_loss": -6.4845685958862305, "global_step": 116071, "epoch": 2763} {"train_loss": -6.561288356781006, "global_step": 116072, "epoch": 2763} {"train_loss": -6.495668888092041, "global_step": 116073, "epoch": 2763} {"train_loss": -6.521668434143066, "global_step": 116074, "epoch": 2763} {"train_loss": -6.513087272644043, "global_step": 116075, "epoch": 2763} {"train_loss": -6.66210412979126, "global_step": 116076, "epoch": 2763} {"train_loss": -6.542815685272217, "global_step": 116077, "epoch": 2763} {"train_loss": -6.547175407409668, "global_step": 116078, "epoch": 2763} {"train_loss": -6.5149245262146, "global_step": 116079, "epoch": 2763} {"train_loss": -6.414798736572266, "global_step": 116080, "epoch": 2763} {"train_loss": -6.5869879722595215, "global_step": 116081, "epoch": 2763} {"train_loss": -6.552202224731445, "global_step": 116082, "epoch": 2763} {"train_loss": -6.470000743865967, "global_step": 116083, "epoch": 2763} {"train_loss": -6.565815448760986, "global_step": 116084, "epoch": 2763} {"train_loss": -6.6725993156433105, "global_step": 116085, "epoch": 2763} {"train_loss": -6.473336696624756, "global_step": 116086, "epoch": 2763} {"train_loss": -6.522784199033465, "global_step": 116087, "epoch": 2763, "val_loss": 65387.51953125} {"train_loss": -6.511143684387207, "global_step": 116088, "epoch": 2764} {"train_loss": -6.521035671234131, "global_step": 116089, "epoch": 2764} {"train_loss": -6.556868553161621, "global_step": 116090, "epoch": 2764} {"train_loss": -6.556965351104736, "global_step": 116091, "epoch": 2764} {"train_loss": -6.413569450378418, "global_step": 116092, "epoch": 2764} {"train_loss": -6.5493035316467285, "global_step": 116093, "epoch": 2764} {"train_loss": -6.587381362915039, "global_step": 116094, "epoch": 2764} {"train_loss": -6.516615390777588, "global_step": 116095, "epoch": 2764} {"train_loss": -6.4524078369140625, "global_step": 116096, "epoch": 2764} {"train_loss": -6.553751468658447, "global_step": 116097, "epoch": 2764} {"train_loss": -6.463932037353516, "global_step": 116098, "epoch": 2764} {"train_loss": -6.590272426605225, "global_step": 116099, "epoch": 2764} {"train_loss": -6.530839443206787, "global_step": 116100, "epoch": 2764} {"train_loss": -6.575902938842773, "global_step": 116101, "epoch": 2764} {"train_loss": -6.566774845123291, "global_step": 116102, "epoch": 2764} {"train_loss": -6.573811054229736, "global_step": 116103, "epoch": 2764} {"train_loss": -6.534955978393555, "global_step": 116104, "epoch": 2764} {"train_loss": -6.600790023803711, "global_step": 116105, "epoch": 2764} {"train_loss": -6.498607635498047, "global_step": 116106, "epoch": 2764} {"train_loss": -6.480773448944092, "global_step": 116107, "epoch": 2764} {"train_loss": -6.401555061340332, "global_step": 116108, "epoch": 2764} {"train_loss": -6.594118118286133, "global_step": 116109, "epoch": 2764} {"train_loss": -6.602872371673584, "global_step": 116110, "epoch": 2764} {"train_loss": -6.4926371574401855, "global_step": 116111, "epoch": 2764} {"train_loss": -6.386632442474365, "global_step": 116112, "epoch": 2764} {"train_loss": -6.547825813293457, "global_step": 116113, "epoch": 2764} {"train_loss": -6.536738872528076, "global_step": 116114, "epoch": 2764} {"train_loss": -6.554195404052734, "global_step": 116115, "epoch": 2764} {"train_loss": -6.586881637573242, "global_step": 116116, "epoch": 2764} {"train_loss": -6.666207790374756, "global_step": 116117, "epoch": 2764} {"train_loss": -6.464563846588135, "global_step": 116118, "epoch": 2764} {"train_loss": -6.537529945373535, "global_step": 116119, "epoch": 2764} {"train_loss": -6.547578811645508, "global_step": 116120, "epoch": 2764} {"train_loss": -6.559588432312012, "global_step": 116121, "epoch": 2764} {"train_loss": -6.5454511642456055, "global_step": 116122, "epoch": 2764} {"train_loss": -6.613391876220703, "global_step": 116123, "epoch": 2764} {"train_loss": -6.53140926361084, "global_step": 116124, "epoch": 2764} {"train_loss": -6.5073957443237305, "global_step": 116125, "epoch": 2764} {"train_loss": -6.622345924377441, "global_step": 116126, "epoch": 2764} {"train_loss": -6.557064056396484, "global_step": 116127, "epoch": 2764} {"train_loss": -6.523984909057617, "global_step": 116128, "epoch": 2764} {"train_loss": -6.537260816210792, "global_step": 116129, "epoch": 2764, "val_loss": 65284.0} {"train_loss": -6.496644496917725, "global_step": 116130, "epoch": 2765} {"train_loss": -6.667522430419922, "global_step": 116131, "epoch": 2765} {"train_loss": -6.5835041999816895, "global_step": 116132, "epoch": 2765} {"train_loss": -6.521188735961914, "global_step": 116133, "epoch": 2765} {"train_loss": -6.550455093383789, "global_step": 116134, "epoch": 2765} {"train_loss": -6.474304676055908, "global_step": 116135, "epoch": 2765} {"train_loss": -6.550222396850586, "global_step": 116136, "epoch": 2765} {"train_loss": -6.61305046081543, "global_step": 116137, "epoch": 2765} {"train_loss": -6.623899936676025, "global_step": 116138, "epoch": 2765} {"train_loss": -6.650763511657715, "global_step": 116139, "epoch": 2765} {"train_loss": -6.509839057922363, "global_step": 116140, "epoch": 2765} {"train_loss": -6.547703742980957, "global_step": 116141, "epoch": 2765} {"train_loss": -6.600454330444336, "global_step": 116142, "epoch": 2765} {"train_loss": -6.6051177978515625, "global_step": 116143, "epoch": 2765} {"train_loss": -6.5921854972839355, "global_step": 116144, "epoch": 2765} {"train_loss": -6.455067157745361, "global_step": 116145, "epoch": 2765} {"train_loss": -6.45299768447876, "global_step": 116146, "epoch": 2765} {"train_loss": -6.552403450012207, "global_step": 116147, "epoch": 2765} {"train_loss": -6.518257141113281, "global_step": 116148, "epoch": 2765} {"train_loss": -6.529296875, "global_step": 116149, "epoch": 2765} {"train_loss": -6.517947673797607, "global_step": 116150, "epoch": 2765} {"train_loss": -6.606858730316162, "global_step": 116151, "epoch": 2765} {"train_loss": -6.48689079284668, "global_step": 116152, "epoch": 2765} {"train_loss": -6.4378981590271, "global_step": 116153, "epoch": 2765} {"train_loss": -6.474281311035156, "global_step": 116154, "epoch": 2765} {"train_loss": -6.354583740234375, "global_step": 116155, "epoch": 2765} {"train_loss": -6.470531940460205, "global_step": 116156, "epoch": 2765} {"train_loss": -6.505259990692139, "global_step": 116157, "epoch": 2765} {"train_loss": -6.545982360839844, "global_step": 116158, "epoch": 2765} {"train_loss": -6.539044380187988, "global_step": 116159, "epoch": 2765} {"train_loss": -6.443603038787842, "global_step": 116160, "epoch": 2765} {"train_loss": -6.646859169006348, "global_step": 116161, "epoch": 2765} {"train_loss": -6.478000640869141, "global_step": 116162, "epoch": 2765} {"train_loss": -6.600372791290283, "global_step": 116163, "epoch": 2765} {"train_loss": -6.606341361999512, "global_step": 116164, "epoch": 2765} {"train_loss": -6.448589324951172, "global_step": 116165, "epoch": 2765} {"train_loss": -6.585599422454834, "global_step": 116166, "epoch": 2765} {"train_loss": -6.547114372253418, "global_step": 116167, "epoch": 2765} {"train_loss": -6.6534504890441895, "global_step": 116168, "epoch": 2765} {"train_loss": -6.660265922546387, "global_step": 116169, "epoch": 2765} {"train_loss": -6.5219244956970215, "global_step": 116170, "epoch": 2765} {"train_loss": -6.545112553096953, "global_step": 116171, "epoch": 2765, "val_loss": 65466.0625} {"train_loss": -6.538436412811279, "global_step": 116172, "epoch": 2766} {"train_loss": -6.581418991088867, "global_step": 116173, "epoch": 2766} {"train_loss": -6.499691009521484, "global_step": 116174, "epoch": 2766} {"train_loss": -6.479165077209473, "global_step": 116175, "epoch": 2766} {"train_loss": -6.44394588470459, "global_step": 116176, "epoch": 2766} {"train_loss": -6.4499030113220215, "global_step": 116177, "epoch": 2766} {"train_loss": -6.356293678283691, "global_step": 116178, "epoch": 2766} {"train_loss": -6.449822425842285, "global_step": 116179, "epoch": 2766} {"train_loss": -6.495855331420898, "global_step": 116180, "epoch": 2766} {"train_loss": -6.3118085861206055, "global_step": 116181, "epoch": 2766} {"train_loss": -6.507885456085205, "global_step": 116182, "epoch": 2766} {"train_loss": -6.459768295288086, "global_step": 116183, "epoch": 2766} {"train_loss": -6.639891624450684, "global_step": 116184, "epoch": 2766} {"train_loss": -6.417932510375977, "global_step": 116185, "epoch": 2766} {"train_loss": -6.584214210510254, "global_step": 116186, "epoch": 2766} {"train_loss": -6.512729644775391, "global_step": 116187, "epoch": 2766} {"train_loss": -6.4623026847839355, "global_step": 116188, "epoch": 2766} {"train_loss": -6.540629863739014, "global_step": 116189, "epoch": 2766} {"train_loss": -6.489907264709473, "global_step": 116190, "epoch": 2766} {"train_loss": -6.458868026733398, "global_step": 116191, "epoch": 2766} {"train_loss": -6.497129440307617, "global_step": 116192, "epoch": 2766} {"train_loss": -6.616281509399414, "global_step": 116193, "epoch": 2766} {"train_loss": -6.601178169250488, "global_step": 116194, "epoch": 2766} {"train_loss": -6.585211277008057, "global_step": 116195, "epoch": 2766} {"train_loss": -6.497638702392578, "global_step": 116196, "epoch": 2766} {"train_loss": -6.5171685218811035, "global_step": 116197, "epoch": 2766} {"train_loss": -6.416346073150635, "global_step": 116198, "epoch": 2766} {"train_loss": -6.469863414764404, "global_step": 116199, "epoch": 2766} {"train_loss": -6.4814300537109375, "global_step": 116200, "epoch": 2766} {"train_loss": -6.365799427032471, "global_step": 116201, "epoch": 2766} {"train_loss": -6.460140705108643, "global_step": 116202, "epoch": 2766} {"train_loss": -6.4177961349487305, "global_step": 116203, "epoch": 2766} {"train_loss": -6.6036376953125, "global_step": 116204, "epoch": 2766} {"train_loss": -6.488679885864258, "global_step": 116205, "epoch": 2766} {"train_loss": -6.331332206726074, "global_step": 116206, "epoch": 2766} {"train_loss": -6.5772600173950195, "global_step": 116207, "epoch": 2766} {"train_loss": -6.329351425170898, "global_step": 116208, "epoch": 2766} {"train_loss": -6.495352745056152, "global_step": 116209, "epoch": 2766} {"train_loss": -6.517353057861328, "global_step": 116210, "epoch": 2766} {"train_loss": -6.364107131958008, "global_step": 116211, "epoch": 2766} {"train_loss": -6.479462146759033, "global_step": 116212, "epoch": 2766} {"train_loss": -6.482873519261678, "global_step": 116213, "epoch": 2766, "val_loss": 65520.65234375} {"train_loss": -6.501518249511719, "global_step": 116214, "epoch": 2767} {"train_loss": -6.4782867431640625, "global_step": 116215, "epoch": 2767} {"train_loss": -6.5105390548706055, "global_step": 116216, "epoch": 2767} {"train_loss": -6.548764705657959, "global_step": 116217, "epoch": 2767} {"train_loss": -6.521720886230469, "global_step": 116218, "epoch": 2767} {"train_loss": -6.518218040466309, "global_step": 116219, "epoch": 2767} {"train_loss": -6.526873588562012, "global_step": 116220, "epoch": 2767} {"train_loss": -6.4898295402526855, "global_step": 116221, "epoch": 2767} {"train_loss": -6.45198917388916, "global_step": 116222, "epoch": 2767} {"train_loss": -6.433526992797852, "global_step": 116223, "epoch": 2767} {"train_loss": -6.448606967926025, "global_step": 116224, "epoch": 2767} {"train_loss": -6.473620414733887, "global_step": 116225, "epoch": 2767} {"train_loss": -6.652904510498047, "global_step": 116226, "epoch": 2767} {"train_loss": -6.586176872253418, "global_step": 116227, "epoch": 2767} {"train_loss": -6.744229316711426, "global_step": 116228, "epoch": 2767} {"train_loss": -6.567286491394043, "global_step": 116229, "epoch": 2767} {"train_loss": -6.6188859939575195, "global_step": 116230, "epoch": 2767} {"train_loss": -6.5254974365234375, "global_step": 116231, "epoch": 2767} {"train_loss": -6.586324691772461, "global_step": 116232, "epoch": 2767} {"train_loss": -6.6172637939453125, "global_step": 116233, "epoch": 2767} {"train_loss": -6.633408546447754, "global_step": 116234, "epoch": 2767} {"train_loss": -6.572127819061279, "global_step": 116235, "epoch": 2767} {"train_loss": -6.528008460998535, "global_step": 116236, "epoch": 2767} {"train_loss": -6.690705299377441, "global_step": 116237, "epoch": 2767} {"train_loss": -6.492669105529785, "global_step": 116238, "epoch": 2767} {"train_loss": -6.5775885581970215, "global_step": 116239, "epoch": 2767} {"train_loss": -6.602893829345703, "global_step": 116240, "epoch": 2767} {"train_loss": -6.664577484130859, "global_step": 116241, "epoch": 2767} {"train_loss": -6.449324131011963, "global_step": 116242, "epoch": 2767} {"train_loss": -6.515438079833984, "global_step": 116243, "epoch": 2767} {"train_loss": -6.623438835144043, "global_step": 116244, "epoch": 2767} {"train_loss": -6.515584468841553, "global_step": 116245, "epoch": 2767} {"train_loss": -6.55660343170166, "global_step": 116246, "epoch": 2767} {"train_loss": -6.645334243774414, "global_step": 116247, "epoch": 2767} {"train_loss": -6.500662326812744, "global_step": 116248, "epoch": 2767} {"train_loss": -6.448678970336914, "global_step": 116249, "epoch": 2767} {"train_loss": -6.576708793640137, "global_step": 116250, "epoch": 2767} {"train_loss": -6.496793270111084, "global_step": 116251, "epoch": 2767} {"train_loss": -6.528212070465088, "global_step": 116252, "epoch": 2767} {"train_loss": -6.444247245788574, "global_step": 116253, "epoch": 2767} {"train_loss": -6.509588241577148, "global_step": 116254, "epoch": 2767} {"train_loss": -6.547762745902652, "global_step": 116255, "epoch": 2767, "val_loss": 65480.3671875} {"train_loss": -6.5935444831848145, "global_step": 116256, "epoch": 2768} {"train_loss": -6.438920974731445, "global_step": 116257, "epoch": 2768} {"train_loss": -6.556851863861084, "global_step": 116258, "epoch": 2768} {"train_loss": -6.473150253295898, "global_step": 116259, "epoch": 2768} {"train_loss": -6.616522789001465, "global_step": 116260, "epoch": 2768} {"train_loss": -6.509458541870117, "global_step": 116261, "epoch": 2768} {"train_loss": -6.4747209548950195, "global_step": 116262, "epoch": 2768} {"train_loss": -6.537975311279297, "global_step": 116263, "epoch": 2768} {"train_loss": -6.495316982269287, "global_step": 116264, "epoch": 2768} {"train_loss": -6.418006896972656, "global_step": 116265, "epoch": 2768} {"train_loss": -6.477405548095703, "global_step": 116266, "epoch": 2768} {"train_loss": -6.440625190734863, "global_step": 116267, "epoch": 2768} {"train_loss": -6.493479251861572, "global_step": 116268, "epoch": 2768} {"train_loss": -6.579162120819092, "global_step": 116269, "epoch": 2768} {"train_loss": -6.503498554229736, "global_step": 116270, "epoch": 2768} {"train_loss": -6.586753845214844, "global_step": 116271, "epoch": 2768} {"train_loss": -6.610547065734863, "global_step": 116272, "epoch": 2768} {"train_loss": -6.502677917480469, "global_step": 116273, "epoch": 2768} {"train_loss": -6.513010025024414, "global_step": 116274, "epoch": 2768} {"train_loss": -6.564291000366211, "global_step": 116275, "epoch": 2768} {"train_loss": -6.404149532318115, "global_step": 116276, "epoch": 2768} {"train_loss": -6.483529090881348, "global_step": 116277, "epoch": 2768} {"train_loss": -6.487458229064941, "global_step": 116278, "epoch": 2768} {"train_loss": -6.546729564666748, "global_step": 116279, "epoch": 2768} {"train_loss": -6.509787082672119, "global_step": 116280, "epoch": 2768} {"train_loss": -6.5751800537109375, "global_step": 116281, "epoch": 2768} {"train_loss": -6.495422840118408, "global_step": 116282, "epoch": 2768} {"train_loss": -6.462125301361084, "global_step": 116283, "epoch": 2768} {"train_loss": -6.585825443267822, "global_step": 116284, "epoch": 2768} {"train_loss": -6.507963180541992, "global_step": 116285, "epoch": 2768} {"train_loss": -6.569850921630859, "global_step": 116286, "epoch": 2768} {"train_loss": -6.535326957702637, "global_step": 116287, "epoch": 2768} {"train_loss": -6.543413162231445, "global_step": 116288, "epoch": 2768} {"train_loss": -6.576162338256836, "global_step": 116289, "epoch": 2768} {"train_loss": -6.520087718963623, "global_step": 116290, "epoch": 2768} {"train_loss": -6.4323859214782715, "global_step": 116291, "epoch": 2768} {"train_loss": -6.489355564117432, "global_step": 116292, "epoch": 2768} {"train_loss": -6.546092510223389, "global_step": 116293, "epoch": 2768} {"train_loss": -6.369166374206543, "global_step": 116294, "epoch": 2768} {"train_loss": -6.664427757263184, "global_step": 116295, "epoch": 2768} {"train_loss": -6.542839050292969, "global_step": 116296, "epoch": 2768} {"train_loss": -6.516643115452358, "global_step": 116297, "epoch": 2768, "val_loss": 65493.36328125} {"train_loss": -6.521629333496094, "global_step": 116298, "epoch": 2769} {"train_loss": -6.592482566833496, "global_step": 116299, "epoch": 2769} {"train_loss": -6.56256628036499, "global_step": 116300, "epoch": 2769} {"train_loss": -6.59831428527832, "global_step": 116301, "epoch": 2769} {"train_loss": -6.449492454528809, "global_step": 116302, "epoch": 2769} {"train_loss": -6.512377738952637, "global_step": 116303, "epoch": 2769} {"train_loss": -6.597903728485107, "global_step": 116304, "epoch": 2769} {"train_loss": -6.435941696166992, "global_step": 116305, "epoch": 2769} {"train_loss": -6.52418327331543, "global_step": 116306, "epoch": 2769} {"train_loss": -6.43511962890625, "global_step": 116307, "epoch": 2769} {"train_loss": -6.513960838317871, "global_step": 116308, "epoch": 2769} {"train_loss": -6.48227596282959, "global_step": 116309, "epoch": 2769} {"train_loss": -6.678902626037598, "global_step": 116310, "epoch": 2769} {"train_loss": -6.638359546661377, "global_step": 116311, "epoch": 2769} {"train_loss": -6.550963878631592, "global_step": 116312, "epoch": 2769} {"train_loss": -6.545832633972168, "global_step": 116313, "epoch": 2769} {"train_loss": -6.56102180480957, "global_step": 116314, "epoch": 2769} {"train_loss": -6.5508904457092285, "global_step": 116315, "epoch": 2769} {"train_loss": -6.546588897705078, "global_step": 116316, "epoch": 2769} {"train_loss": -6.58482027053833, "global_step": 116317, "epoch": 2769} {"train_loss": -6.559349060058594, "global_step": 116318, "epoch": 2769} {"train_loss": -6.587616920471191, "global_step": 116319, "epoch": 2769} {"train_loss": -6.5269775390625, "global_step": 116320, "epoch": 2769} {"train_loss": -6.594942092895508, "global_step": 116321, "epoch": 2769} {"train_loss": -6.5542192459106445, "global_step": 116322, "epoch": 2769} {"train_loss": -6.563014984130859, "global_step": 116323, "epoch": 2769} {"train_loss": -6.523818492889404, "global_step": 116324, "epoch": 2769} {"train_loss": -6.531935691833496, "global_step": 116325, "epoch": 2769} {"train_loss": -6.578953742980957, "global_step": 116326, "epoch": 2769} {"train_loss": -6.6126556396484375, "global_step": 116327, "epoch": 2769} {"train_loss": -6.635388374328613, "global_step": 116328, "epoch": 2769} {"train_loss": -6.600734710693359, "global_step": 116329, "epoch": 2769} {"train_loss": -6.611092567443848, "global_step": 116330, "epoch": 2769} {"train_loss": -6.593201637268066, "global_step": 116331, "epoch": 2769} {"train_loss": -6.466251373291016, "global_step": 116332, "epoch": 2769} {"train_loss": -6.4883012771606445, "global_step": 116333, "epoch": 2769} {"train_loss": -6.620920181274414, "global_step": 116334, "epoch": 2769} {"train_loss": -6.590715408325195, "global_step": 116335, "epoch": 2769} {"train_loss": -6.526949882507324, "global_step": 116336, "epoch": 2769} {"train_loss": -6.599277496337891, "global_step": 116337, "epoch": 2769} {"train_loss": -6.519674301147461, "global_step": 116338, "epoch": 2769} {"train_loss": -6.554956106912522, "global_step": 116339, "epoch": 2769, "val_loss": 65470.8046875} {"train_loss": -6.502590179443359, "global_step": 116340, "epoch": 2770} {"train_loss": -6.475050926208496, "global_step": 116341, "epoch": 2770} {"train_loss": -6.499384880065918, "global_step": 116342, "epoch": 2770} {"train_loss": -6.6121506690979, "global_step": 116343, "epoch": 2770} {"train_loss": -6.529706954956055, "global_step": 116344, "epoch": 2770} {"train_loss": -6.592507362365723, "global_step": 116345, "epoch": 2770} {"train_loss": -6.489065647125244, "global_step": 116346, "epoch": 2770} {"train_loss": -6.301058769226074, "global_step": 116347, "epoch": 2770} {"train_loss": -6.525485992431641, "global_step": 116348, "epoch": 2770} {"train_loss": -6.283257961273193, "global_step": 116349, "epoch": 2770} {"train_loss": -6.3510847091674805, "global_step": 116350, "epoch": 2770} {"train_loss": -6.3502373695373535, "global_step": 116351, "epoch": 2770} {"train_loss": -6.268158435821533, "global_step": 116352, "epoch": 2770} {"train_loss": -6.567676067352295, "global_step": 116353, "epoch": 2770} {"train_loss": -6.124590873718262, "global_step": 116354, "epoch": 2770} {"train_loss": -6.435070514678955, "global_step": 116355, "epoch": 2770} {"train_loss": -6.306117057800293, "global_step": 116356, "epoch": 2770} {"train_loss": -6.490509986877441, "global_step": 116357, "epoch": 2770} {"train_loss": -6.300737380981445, "global_step": 116358, "epoch": 2770} {"train_loss": -6.46544075012207, "global_step": 116359, "epoch": 2770} {"train_loss": -6.436214923858643, "global_step": 116360, "epoch": 2770} {"train_loss": -6.42172908782959, "global_step": 116361, "epoch": 2770} {"train_loss": -6.41886568069458, "global_step": 116362, "epoch": 2770} {"train_loss": -6.346328258514404, "global_step": 116363, "epoch": 2770} {"train_loss": -6.56412410736084, "global_step": 116364, "epoch": 2770} {"train_loss": -6.317034721374512, "global_step": 116365, "epoch": 2770} {"train_loss": -6.542859077453613, "global_step": 116366, "epoch": 2770} {"train_loss": -6.44875431060791, "global_step": 116367, "epoch": 2770} {"train_loss": -6.457527160644531, "global_step": 116368, "epoch": 2770} {"train_loss": -6.428922653198242, "global_step": 116369, "epoch": 2770} {"train_loss": -6.421145915985107, "global_step": 116370, "epoch": 2770} {"train_loss": -6.497928619384766, "global_step": 116371, "epoch": 2770} {"train_loss": -6.546802520751953, "global_step": 116372, "epoch": 2770} {"train_loss": -6.422860145568848, "global_step": 116373, "epoch": 2770} {"train_loss": -6.530825138092041, "global_step": 116374, "epoch": 2770} {"train_loss": -6.486649513244629, "global_step": 116375, "epoch": 2770} {"train_loss": -6.520767688751221, "global_step": 116376, "epoch": 2770} {"train_loss": -6.598262786865234, "global_step": 116377, "epoch": 2770} {"train_loss": -6.510105133056641, "global_step": 116378, "epoch": 2770} {"train_loss": -6.556768417358398, "global_step": 116379, "epoch": 2770} {"train_loss": -6.4951276779174805, "global_step": 116380, "epoch": 2770} {"train_loss": -6.4538740657624745, "global_step": 116381, "epoch": 2770, "val_loss": 65432.5625} {"train_loss": -6.538839817047119, "global_step": 116382, "epoch": 2771} {"train_loss": -6.672031402587891, "global_step": 116383, "epoch": 2771} {"train_loss": -6.530666828155518, "global_step": 116384, "epoch": 2771} {"train_loss": -6.530264377593994, "global_step": 116385, "epoch": 2771} {"train_loss": -6.508049964904785, "global_step": 116386, "epoch": 2771} {"train_loss": -6.484366416931152, "global_step": 116387, "epoch": 2771} {"train_loss": -6.450090408325195, "global_step": 116388, "epoch": 2771} {"train_loss": -6.68305778503418, "global_step": 116389, "epoch": 2771} {"train_loss": -6.577347755432129, "global_step": 116390, "epoch": 2771} {"train_loss": -6.3711137771606445, "global_step": 116391, "epoch": 2771} {"train_loss": -6.6188507080078125, "global_step": 116392, "epoch": 2771} {"train_loss": -6.69438362121582, "global_step": 116393, "epoch": 2771} {"train_loss": -6.702373027801514, "global_step": 116394, "epoch": 2771} {"train_loss": -6.653368949890137, "global_step": 116395, "epoch": 2771} {"train_loss": -6.503533840179443, "global_step": 116396, "epoch": 2771} {"train_loss": -6.549992084503174, "global_step": 116397, "epoch": 2771} {"train_loss": -6.485943794250488, "global_step": 116398, "epoch": 2771} {"train_loss": -6.638274192810059, "global_step": 116399, "epoch": 2771} {"train_loss": -6.576053619384766, "global_step": 116400, "epoch": 2771} {"train_loss": -6.539022445678711, "global_step": 116401, "epoch": 2771} {"train_loss": -6.635829925537109, "global_step": 116402, "epoch": 2771} {"train_loss": -6.671729564666748, "global_step": 116403, "epoch": 2771} {"train_loss": -6.597357749938965, "global_step": 116404, "epoch": 2771} {"train_loss": -6.610899925231934, "global_step": 116405, "epoch": 2771} {"train_loss": -6.5763702392578125, "global_step": 116406, "epoch": 2771} {"train_loss": -6.783029079437256, "global_step": 116407, "epoch": 2771} {"train_loss": -6.531661033630371, "global_step": 116408, "epoch": 2771} {"train_loss": -6.527053356170654, "global_step": 116409, "epoch": 2771} {"train_loss": -6.565408706665039, "global_step": 116410, "epoch": 2771} {"train_loss": -6.569346904754639, "global_step": 116411, "epoch": 2771} {"train_loss": -6.617220401763916, "global_step": 116412, "epoch": 2771} {"train_loss": -6.423453330993652, "global_step": 116413, "epoch": 2771} {"train_loss": -6.493265151977539, "global_step": 116414, "epoch": 2771} {"train_loss": -6.5354180335998535, "global_step": 116415, "epoch": 2771} {"train_loss": -6.44545841217041, "global_step": 116416, "epoch": 2771} {"train_loss": -6.458070755004883, "global_step": 116417, "epoch": 2771} {"train_loss": -6.394207000732422, "global_step": 116418, "epoch": 2771} {"train_loss": -6.5354719161987305, "global_step": 116419, "epoch": 2771} {"train_loss": -6.551660537719727, "global_step": 116420, "epoch": 2771} {"train_loss": -6.537735462188721, "global_step": 116421, "epoch": 2771} {"train_loss": -6.625509262084961, "global_step": 116422, "epoch": 2771} {"train_loss": -6.564050572259085, "global_step": 116423, "epoch": 2771, "val_loss": 65455.96875} {"train_loss": -6.559584617614746, "global_step": 116424, "epoch": 2772} {"train_loss": -6.584468364715576, "global_step": 116425, "epoch": 2772} {"train_loss": -6.548076629638672, "global_step": 116426, "epoch": 2772} {"train_loss": -6.57102108001709, "global_step": 116427, "epoch": 2772} {"train_loss": -6.727941513061523, "global_step": 116428, "epoch": 2772} {"train_loss": -6.5824127197265625, "global_step": 116429, "epoch": 2772} {"train_loss": -6.542924880981445, "global_step": 116430, "epoch": 2772} {"train_loss": -6.553400039672852, "global_step": 116431, "epoch": 2772} {"train_loss": -6.640263557434082, "global_step": 116432, "epoch": 2772} {"train_loss": -6.552165985107422, "global_step": 116433, "epoch": 2772} {"train_loss": -6.530062675476074, "global_step": 116434, "epoch": 2772} {"train_loss": -6.645627975463867, "global_step": 116435, "epoch": 2772} {"train_loss": -6.541792869567871, "global_step": 116436, "epoch": 2772} {"train_loss": -6.554634094238281, "global_step": 116437, "epoch": 2772} {"train_loss": -6.610383033752441, "global_step": 116438, "epoch": 2772} {"train_loss": -6.661282539367676, "global_step": 116439, "epoch": 2772} {"train_loss": -6.428206920623779, "global_step": 116440, "epoch": 2772} {"train_loss": -6.593667030334473, "global_step": 116441, "epoch": 2772} {"train_loss": -6.528857231140137, "global_step": 116442, "epoch": 2772} {"train_loss": -6.430366039276123, "global_step": 116443, "epoch": 2772} {"train_loss": -6.5205912590026855, "global_step": 116444, "epoch": 2772} {"train_loss": -6.54709005355835, "global_step": 116445, "epoch": 2772} {"train_loss": -6.450649261474609, "global_step": 116446, "epoch": 2772} {"train_loss": -6.583211898803711, "global_step": 116447, "epoch": 2772} {"train_loss": -6.5247392654418945, "global_step": 116448, "epoch": 2772} {"train_loss": -6.453976631164551, "global_step": 116449, "epoch": 2772} {"train_loss": -6.677706718444824, "global_step": 116450, "epoch": 2772} {"train_loss": -6.535174369812012, "global_step": 116451, "epoch": 2772} {"train_loss": -6.448486804962158, "global_step": 116452, "epoch": 2772} {"train_loss": -6.551540851593018, "global_step": 116453, "epoch": 2772} {"train_loss": -6.447656631469727, "global_step": 116454, "epoch": 2772} {"train_loss": -6.611201286315918, "global_step": 116455, "epoch": 2772} {"train_loss": -6.531330108642578, "global_step": 116456, "epoch": 2772} {"train_loss": -6.680641174316406, "global_step": 116457, "epoch": 2772} {"train_loss": -6.4337921142578125, "global_step": 116458, "epoch": 2772} {"train_loss": -6.514630317687988, "global_step": 116459, "epoch": 2772} {"train_loss": -6.5890655517578125, "global_step": 116460, "epoch": 2772} {"train_loss": -6.440922260284424, "global_step": 116461, "epoch": 2772} {"train_loss": -6.500711441040039, "global_step": 116462, "epoch": 2772} {"train_loss": -6.605999946594238, "global_step": 116463, "epoch": 2772} {"train_loss": -6.5753068923950195, "global_step": 116464, "epoch": 2772} {"train_loss": -6.550199701672509, "global_step": 116465, "epoch": 2772, "val_loss": 65514.42578125} {"train_loss": -6.543283462524414, "global_step": 116466, "epoch": 2773} {"train_loss": -6.4711689949035645, "global_step": 116467, "epoch": 2773} {"train_loss": -6.584522724151611, "global_step": 116468, "epoch": 2773} {"train_loss": -6.6605072021484375, "global_step": 116469, "epoch": 2773} {"train_loss": -6.66934061050415, "global_step": 116470, "epoch": 2773} {"train_loss": -6.532251358032227, "global_step": 116471, "epoch": 2773} {"train_loss": -6.616209983825684, "global_step": 116472, "epoch": 2773} {"train_loss": -6.434158802032471, "global_step": 116473, "epoch": 2773} {"train_loss": -6.630162239074707, "global_step": 116474, "epoch": 2773} {"train_loss": -6.619635581970215, "global_step": 116475, "epoch": 2773} {"train_loss": -6.394525527954102, "global_step": 116476, "epoch": 2773} {"train_loss": -6.5668230056762695, "global_step": 116477, "epoch": 2773} {"train_loss": -6.567082405090332, "global_step": 116478, "epoch": 2773} {"train_loss": -6.519701957702637, "global_step": 116479, "epoch": 2773} {"train_loss": -6.483613967895508, "global_step": 116480, "epoch": 2773} {"train_loss": -6.632279872894287, "global_step": 116481, "epoch": 2773} {"train_loss": -6.447394371032715, "global_step": 116482, "epoch": 2773} {"train_loss": -6.512232303619385, "global_step": 116483, "epoch": 2773} {"train_loss": -6.609371185302734, "global_step": 116484, "epoch": 2773} {"train_loss": -6.473396301269531, "global_step": 116485, "epoch": 2773} {"train_loss": -6.533043384552002, "global_step": 116486, "epoch": 2773} {"train_loss": -6.361160755157471, "global_step": 116487, "epoch": 2773} {"train_loss": -6.50970458984375, "global_step": 116488, "epoch": 2773} {"train_loss": -6.531271934509277, "global_step": 116489, "epoch": 2773} {"train_loss": -6.480339050292969, "global_step": 116490, "epoch": 2773} {"train_loss": -6.440910339355469, "global_step": 116491, "epoch": 2773} {"train_loss": -6.483929634094238, "global_step": 116492, "epoch": 2773} {"train_loss": -6.4079484939575195, "global_step": 116493, "epoch": 2773} {"train_loss": -6.499449253082275, "global_step": 116494, "epoch": 2773} {"train_loss": -6.57668399810791, "global_step": 116495, "epoch": 2773} {"train_loss": -6.454235076904297, "global_step": 116496, "epoch": 2773} {"train_loss": -6.458120346069336, "global_step": 116497, "epoch": 2773} {"train_loss": -6.344185829162598, "global_step": 116498, "epoch": 2773} {"train_loss": -6.421735763549805, "global_step": 116499, "epoch": 2773} {"train_loss": -6.438007831573486, "global_step": 116500, "epoch": 2773} {"train_loss": -6.369578838348389, "global_step": 116501, "epoch": 2773} {"train_loss": -6.385535717010498, "global_step": 116502, "epoch": 2773} {"train_loss": -6.3834404945373535, "global_step": 116503, "epoch": 2773} {"train_loss": -6.573035717010498, "global_step": 116504, "epoch": 2773} {"train_loss": -6.4415459632873535, "global_step": 116505, "epoch": 2773} {"train_loss": -6.531868934631348, "global_step": 116506, "epoch": 2773} {"train_loss": -6.502937021709624, "global_step": 116507, "epoch": 2773, "val_loss": 65630.9765625} {"train_loss": -6.457043170928955, "global_step": 116508, "epoch": 2774} {"train_loss": -6.5726494789123535, "global_step": 116509, "epoch": 2774} {"train_loss": -6.459863185882568, "global_step": 116510, "epoch": 2774} {"train_loss": -6.420130252838135, "global_step": 116511, "epoch": 2774} {"train_loss": -6.474957466125488, "global_step": 116512, "epoch": 2774} {"train_loss": -6.506847381591797, "global_step": 116513, "epoch": 2774} {"train_loss": -6.426159858703613, "global_step": 116514, "epoch": 2774} {"train_loss": -6.54332971572876, "global_step": 116515, "epoch": 2774} {"train_loss": -6.496918678283691, "global_step": 116516, "epoch": 2774} {"train_loss": -6.622098445892334, "global_step": 116517, "epoch": 2774} {"train_loss": -6.540111541748047, "global_step": 116518, "epoch": 2774} {"train_loss": -6.572999477386475, "global_step": 116519, "epoch": 2774} {"train_loss": -6.568351745605469, "global_step": 116520, "epoch": 2774} {"train_loss": -6.449888229370117, "global_step": 116521, "epoch": 2774} {"train_loss": -6.484325408935547, "global_step": 116522, "epoch": 2774} {"train_loss": -6.43898868560791, "global_step": 116523, "epoch": 2774} {"train_loss": -6.563432693481445, "global_step": 116524, "epoch": 2774} {"train_loss": -6.574382305145264, "global_step": 116525, "epoch": 2774} {"train_loss": -6.5833539962768555, "global_step": 116526, "epoch": 2774} {"train_loss": -6.519697666168213, "global_step": 116527, "epoch": 2774} {"train_loss": -6.4106831550598145, "global_step": 116528, "epoch": 2774} {"train_loss": -6.568293571472168, "global_step": 116529, "epoch": 2774} {"train_loss": -6.5137457847595215, "global_step": 116530, "epoch": 2774} {"train_loss": -6.536751747131348, "global_step": 116531, "epoch": 2774} {"train_loss": -6.608070373535156, "global_step": 116532, "epoch": 2774} {"train_loss": -6.557211875915527, "global_step": 116533, "epoch": 2774} {"train_loss": -6.542547225952148, "global_step": 116534, "epoch": 2774} {"train_loss": -6.603834629058838, "global_step": 116535, "epoch": 2774} {"train_loss": -6.513070106506348, "global_step": 116536, "epoch": 2774} {"train_loss": -6.567636966705322, "global_step": 116537, "epoch": 2774} {"train_loss": -6.621186256408691, "global_step": 116538, "epoch": 2774} {"train_loss": -6.571897506713867, "global_step": 116539, "epoch": 2774} {"train_loss": -6.528039932250977, "global_step": 116540, "epoch": 2774} {"train_loss": -6.573446750640869, "global_step": 116541, "epoch": 2774} {"train_loss": -6.52589225769043, "global_step": 116542, "epoch": 2774} {"train_loss": -6.518521308898926, "global_step": 116543, "epoch": 2774} {"train_loss": -6.533162593841553, "global_step": 116544, "epoch": 2774} {"train_loss": -6.740998268127441, "global_step": 116545, "epoch": 2774} {"train_loss": -6.552678108215332, "global_step": 116546, "epoch": 2774} {"train_loss": -6.588040351867676, "global_step": 116547, "epoch": 2774} {"train_loss": -6.589817047119141, "global_step": 116548, "epoch": 2774} {"train_loss": -6.538050061180478, "global_step": 116549, "epoch": 2774, "val_loss": 65396.25390625} {"train_loss": -6.502374649047852, "global_step": 116550, "epoch": 2775} {"train_loss": -6.664154052734375, "global_step": 116551, "epoch": 2775} {"train_loss": -6.484282970428467, "global_step": 116552, "epoch": 2775} {"train_loss": -6.731523036956787, "global_step": 116553, "epoch": 2775} {"train_loss": -6.570472717285156, "global_step": 116554, "epoch": 2775} {"train_loss": -6.525010585784912, "global_step": 116555, "epoch": 2775} {"train_loss": -6.617638111114502, "global_step": 116556, "epoch": 2775} {"train_loss": -6.4974365234375, "global_step": 116557, "epoch": 2775} {"train_loss": -6.544801712036133, "global_step": 116558, "epoch": 2775} {"train_loss": -6.532946586608887, "global_step": 116559, "epoch": 2775} {"train_loss": -6.3598952293396, "global_step": 116560, "epoch": 2775} {"train_loss": -6.507279872894287, "global_step": 116561, "epoch": 2775} {"train_loss": -6.339332580566406, "global_step": 116562, "epoch": 2775} {"train_loss": -6.476462364196777, "global_step": 116563, "epoch": 2775} {"train_loss": -6.473484516143799, "global_step": 116564, "epoch": 2775} {"train_loss": -6.462353229522705, "global_step": 116565, "epoch": 2775} {"train_loss": -6.582651138305664, "global_step": 116566, "epoch": 2775} {"train_loss": -6.4642744064331055, "global_step": 116567, "epoch": 2775} {"train_loss": -6.51862096786499, "global_step": 116568, "epoch": 2775} {"train_loss": -6.405346393585205, "global_step": 116569, "epoch": 2775} {"train_loss": -6.229623794555664, "global_step": 116570, "epoch": 2775} {"train_loss": -6.499766826629639, "global_step": 116571, "epoch": 2775} {"train_loss": -6.483922481536865, "global_step": 116572, "epoch": 2775} {"train_loss": -6.54293966293335, "global_step": 116573, "epoch": 2775} {"train_loss": -6.505834579467773, "global_step": 116574, "epoch": 2775} {"train_loss": -6.540670394897461, "global_step": 116575, "epoch": 2775} {"train_loss": -6.586330413818359, "global_step": 116576, "epoch": 2775} {"train_loss": -6.478645324707031, "global_step": 116577, "epoch": 2775} {"train_loss": -6.562531471252441, "global_step": 116578, "epoch": 2775} {"train_loss": -6.6188645362854, "global_step": 116579, "epoch": 2775} {"train_loss": -6.5345330238342285, "global_step": 116580, "epoch": 2775} {"train_loss": -6.531649589538574, "global_step": 116581, "epoch": 2775} {"train_loss": -6.550388336181641, "global_step": 116582, "epoch": 2775} {"train_loss": -6.471609115600586, "global_step": 116583, "epoch": 2775} {"train_loss": -6.489126682281494, "global_step": 116584, "epoch": 2775} {"train_loss": -6.507480621337891, "global_step": 116585, "epoch": 2775} {"train_loss": -6.437128067016602, "global_step": 116586, "epoch": 2775} {"train_loss": -6.393589496612549, "global_step": 116587, "epoch": 2775} {"train_loss": -6.672602653503418, "global_step": 116588, "epoch": 2775} {"train_loss": -6.575460433959961, "global_step": 116589, "epoch": 2775} {"train_loss": -6.469333648681641, "global_step": 116590, "epoch": 2775} {"train_loss": -6.511255037216913, "global_step": 116591, "epoch": 2775, "val_loss": 65450.34765625} {"train_loss": -6.531329154968262, "global_step": 116592, "epoch": 2776} {"train_loss": -6.525969505310059, "global_step": 116593, "epoch": 2776} {"train_loss": -6.621598243713379, "global_step": 116594, "epoch": 2776} {"train_loss": -6.474249839782715, "global_step": 116595, "epoch": 2776} {"train_loss": -6.490958213806152, "global_step": 116596, "epoch": 2776} {"train_loss": -6.503679275512695, "global_step": 116597, "epoch": 2776} {"train_loss": -6.374284267425537, "global_step": 116598, "epoch": 2776} {"train_loss": -6.544761657714844, "global_step": 116599, "epoch": 2776} {"train_loss": -6.389459133148193, "global_step": 116600, "epoch": 2776} {"train_loss": -6.523326396942139, "global_step": 116601, "epoch": 2776} {"train_loss": -6.389657020568848, "global_step": 116602, "epoch": 2776} {"train_loss": -6.408152103424072, "global_step": 116603, "epoch": 2776} {"train_loss": -6.409547328948975, "global_step": 116604, "epoch": 2776} {"train_loss": -6.442824363708496, "global_step": 116605, "epoch": 2776} {"train_loss": -6.549742221832275, "global_step": 116606, "epoch": 2776} {"train_loss": -6.408905029296875, "global_step": 116607, "epoch": 2776} {"train_loss": -6.5439982414245605, "global_step": 116608, "epoch": 2776} {"train_loss": -6.3917036056518555, "global_step": 116609, "epoch": 2776} {"train_loss": -6.492003440856934, "global_step": 116610, "epoch": 2776} {"train_loss": -6.496038436889648, "global_step": 116611, "epoch": 2776} {"train_loss": -6.6217803955078125, "global_step": 116612, "epoch": 2776} {"train_loss": -6.502588272094727, "global_step": 116613, "epoch": 2776} {"train_loss": -6.427790641784668, "global_step": 116614, "epoch": 2776} {"train_loss": -6.463584899902344, "global_step": 116615, "epoch": 2776} {"train_loss": -6.492201805114746, "global_step": 116616, "epoch": 2776} {"train_loss": -6.349490165710449, "global_step": 116617, "epoch": 2776} {"train_loss": -6.467966556549072, "global_step": 116618, "epoch": 2776} {"train_loss": -6.494287967681885, "global_step": 116619, "epoch": 2776} {"train_loss": -6.560170650482178, "global_step": 116620, "epoch": 2776} {"train_loss": -6.433488368988037, "global_step": 116621, "epoch": 2776} {"train_loss": -6.564168453216553, "global_step": 116622, "epoch": 2776} {"train_loss": -6.410954475402832, "global_step": 116623, "epoch": 2776} {"train_loss": -6.572591781616211, "global_step": 116624, "epoch": 2776} {"train_loss": -6.35498571395874, "global_step": 116625, "epoch": 2776} {"train_loss": -6.541106224060059, "global_step": 116626, "epoch": 2776} {"train_loss": -6.532614707946777, "global_step": 116627, "epoch": 2776} {"train_loss": -6.539783000946045, "global_step": 116628, "epoch": 2776} {"train_loss": -6.571191787719727, "global_step": 116629, "epoch": 2776} {"train_loss": -6.413588523864746, "global_step": 116630, "epoch": 2776} {"train_loss": -6.561959266662598, "global_step": 116631, "epoch": 2776} {"train_loss": -6.599625110626221, "global_step": 116632, "epoch": 2776} {"train_loss": -6.491445416495914, "global_step": 116633, "epoch": 2776, "val_loss": 65373.68359375} {"train_loss": -6.5489983558654785, "global_step": 116634, "epoch": 2777} {"train_loss": -6.500777244567871, "global_step": 116635, "epoch": 2777} {"train_loss": -6.591803550720215, "global_step": 116636, "epoch": 2777} {"train_loss": -6.429634094238281, "global_step": 116637, "epoch": 2777} {"train_loss": -6.480654716491699, "global_step": 116638, "epoch": 2777} {"train_loss": -6.57755184173584, "global_step": 116639, "epoch": 2777} {"train_loss": -6.516595840454102, "global_step": 116640, "epoch": 2777} {"train_loss": -6.543243885040283, "global_step": 116641, "epoch": 2777} {"train_loss": -6.5853271484375, "global_step": 116642, "epoch": 2777} {"train_loss": -6.701298236846924, "global_step": 116643, "epoch": 2777} {"train_loss": -6.63692569732666, "global_step": 116644, "epoch": 2777} {"train_loss": -6.568074703216553, "global_step": 116645, "epoch": 2777} {"train_loss": -6.583973407745361, "global_step": 116646, "epoch": 2777} {"train_loss": -6.586689472198486, "global_step": 116647, "epoch": 2777} {"train_loss": -6.464860439300537, "global_step": 116648, "epoch": 2777} {"train_loss": -6.542167663574219, "global_step": 116649, "epoch": 2777} {"train_loss": -6.517067909240723, "global_step": 116650, "epoch": 2777} {"train_loss": -6.459152698516846, "global_step": 116651, "epoch": 2777} {"train_loss": -6.6491804122924805, "global_step": 116652, "epoch": 2777} {"train_loss": -6.552651882171631, "global_step": 116653, "epoch": 2777} {"train_loss": -6.48238468170166, "global_step": 116654, "epoch": 2777} {"train_loss": -6.5124616622924805, "global_step": 116655, "epoch": 2777} {"train_loss": -6.554248809814453, "global_step": 116656, "epoch": 2777} {"train_loss": -6.512231826782227, "global_step": 116657, "epoch": 2777} {"train_loss": -6.476988792419434, "global_step": 116658, "epoch": 2777} {"train_loss": -6.587611198425293, "global_step": 116659, "epoch": 2777} {"train_loss": -6.497690200805664, "global_step": 116660, "epoch": 2777} {"train_loss": -6.390230178833008, "global_step": 116661, "epoch": 2777} {"train_loss": -6.515966415405273, "global_step": 116662, "epoch": 2777} {"train_loss": -6.522623062133789, "global_step": 116663, "epoch": 2777} {"train_loss": -6.489302635192871, "global_step": 116664, "epoch": 2777} {"train_loss": -6.565862655639648, "global_step": 116665, "epoch": 2777} {"train_loss": -6.572174072265625, "global_step": 116666, "epoch": 2777} {"train_loss": -6.482949256896973, "global_step": 116667, "epoch": 2777} {"train_loss": -6.479272842407227, "global_step": 116668, "epoch": 2777} {"train_loss": -6.585353851318359, "global_step": 116669, "epoch": 2777} {"train_loss": -6.516652584075928, "global_step": 116670, "epoch": 2777} {"train_loss": -6.573558807373047, "global_step": 116671, "epoch": 2777} {"train_loss": -6.663761615753174, "global_step": 116672, "epoch": 2777} {"train_loss": -6.614044189453125, "global_step": 116673, "epoch": 2777} {"train_loss": -6.560330390930176, "global_step": 116674, "epoch": 2777} {"train_loss": -6.543320474170503, "global_step": 116675, "epoch": 2777, "val_loss": 65442.62109375} {"train_loss": -6.468557357788086, "global_step": 116676, "epoch": 2778} {"train_loss": -6.591807842254639, "global_step": 116677, "epoch": 2778} {"train_loss": -6.660118103027344, "global_step": 116678, "epoch": 2778} {"train_loss": -6.475162506103516, "global_step": 116679, "epoch": 2778} {"train_loss": -6.528512477874756, "global_step": 116680, "epoch": 2778} {"train_loss": -6.518665313720703, "global_step": 116681, "epoch": 2778} {"train_loss": -6.6363372802734375, "global_step": 116682, "epoch": 2778} {"train_loss": -6.664061546325684, "global_step": 116683, "epoch": 2778} {"train_loss": -6.607942581176758, "global_step": 116684, "epoch": 2778} {"train_loss": -6.678825378417969, "global_step": 116685, "epoch": 2778} {"train_loss": -6.480731010437012, "global_step": 116686, "epoch": 2778} {"train_loss": -6.5043439865112305, "global_step": 116687, "epoch": 2778} {"train_loss": -6.523043632507324, "global_step": 116688, "epoch": 2778} {"train_loss": -6.625359058380127, "global_step": 116689, "epoch": 2778} {"train_loss": -6.5828962326049805, "global_step": 116690, "epoch": 2778} {"train_loss": -6.557058811187744, "global_step": 116691, "epoch": 2778} {"train_loss": -6.581139087677002, "global_step": 116692, "epoch": 2778} {"train_loss": -6.560341835021973, "global_step": 116693, "epoch": 2778} {"train_loss": -6.748929023742676, "global_step": 116694, "epoch": 2778} {"train_loss": -6.59231424331665, "global_step": 116695, "epoch": 2778} {"train_loss": -6.4391303062438965, "global_step": 116696, "epoch": 2778} {"train_loss": -6.721862316131592, "global_step": 116697, "epoch": 2778} {"train_loss": -6.487158298492432, "global_step": 116698, "epoch": 2778} {"train_loss": -6.57332706451416, "global_step": 116699, "epoch": 2778} {"train_loss": -6.597784996032715, "global_step": 116700, "epoch": 2778} {"train_loss": -6.497982978820801, "global_step": 116701, "epoch": 2778} {"train_loss": -6.626576900482178, "global_step": 116702, "epoch": 2778} {"train_loss": -6.551137924194336, "global_step": 116703, "epoch": 2778} {"train_loss": -6.442975997924805, "global_step": 116704, "epoch": 2778} {"train_loss": -6.519494533538818, "global_step": 116705, "epoch": 2778} {"train_loss": -6.508642196655273, "global_step": 116706, "epoch": 2778} {"train_loss": -6.563118934631348, "global_step": 116707, "epoch": 2778} {"train_loss": -6.581445217132568, "global_step": 116708, "epoch": 2778} {"train_loss": -6.548859119415283, "global_step": 116709, "epoch": 2778} {"train_loss": -6.611108779907227, "global_step": 116710, "epoch": 2778} {"train_loss": -6.652285575866699, "global_step": 116711, "epoch": 2778} {"train_loss": -6.611379146575928, "global_step": 116712, "epoch": 2778} {"train_loss": -6.491029262542725, "global_step": 116713, "epoch": 2778} {"train_loss": -6.6362152099609375, "global_step": 116714, "epoch": 2778} {"train_loss": -6.578544616699219, "global_step": 116715, "epoch": 2778} {"train_loss": -6.552145957946777, "global_step": 116716, "epoch": 2778} {"train_loss": -6.571223758515858, "global_step": 116717, "epoch": 2778, "val_loss": 65291.1875} {"train_loss": -6.529885768890381, "global_step": 116718, "epoch": 2779} {"train_loss": -6.553560256958008, "global_step": 116719, "epoch": 2779} {"train_loss": -6.566606521606445, "global_step": 116720, "epoch": 2779} {"train_loss": -6.63023567199707, "global_step": 116721, "epoch": 2779} {"train_loss": -6.5728912353515625, "global_step": 116722, "epoch": 2779} {"train_loss": -6.413055419921875, "global_step": 116723, "epoch": 2779} {"train_loss": -6.667623996734619, "global_step": 116724, "epoch": 2779} {"train_loss": -6.686500549316406, "global_step": 116725, "epoch": 2779} {"train_loss": -6.623581409454346, "global_step": 116726, "epoch": 2779} {"train_loss": -6.536349296569824, "global_step": 116727, "epoch": 2779} {"train_loss": -6.595385551452637, "global_step": 116728, "epoch": 2779} {"train_loss": -6.485960960388184, "global_step": 116729, "epoch": 2779} {"train_loss": -6.5107502937316895, "global_step": 116730, "epoch": 2779} {"train_loss": -6.595792770385742, "global_step": 116731, "epoch": 2779} {"train_loss": -6.550438404083252, "global_step": 116732, "epoch": 2779} {"train_loss": -6.532684326171875, "global_step": 116733, "epoch": 2779} {"train_loss": -6.448952674865723, "global_step": 116734, "epoch": 2779} {"train_loss": -6.515191555023193, "global_step": 116735, "epoch": 2779} {"train_loss": -6.593118190765381, "global_step": 116736, "epoch": 2779} {"train_loss": -6.583616256713867, "global_step": 116737, "epoch": 2779} {"train_loss": -6.505241394042969, "global_step": 116738, "epoch": 2779} {"train_loss": -6.390817642211914, "global_step": 116739, "epoch": 2779} {"train_loss": -6.53895378112793, "global_step": 116740, "epoch": 2779} {"train_loss": -6.589460372924805, "global_step": 116741, "epoch": 2779} {"train_loss": -6.535402774810791, "global_step": 116742, "epoch": 2779} {"train_loss": -6.563452243804932, "global_step": 116743, "epoch": 2779} {"train_loss": -6.494633674621582, "global_step": 116744, "epoch": 2779} {"train_loss": -6.48714542388916, "global_step": 116745, "epoch": 2779} {"train_loss": -6.565732002258301, "global_step": 116746, "epoch": 2779} {"train_loss": -6.614485263824463, "global_step": 116747, "epoch": 2779} {"train_loss": -6.53663444519043, "global_step": 116748, "epoch": 2779} {"train_loss": -6.552967071533203, "global_step": 116749, "epoch": 2779} {"train_loss": -6.56436824798584, "global_step": 116750, "epoch": 2779} {"train_loss": -6.615719795227051, "global_step": 116751, "epoch": 2779} {"train_loss": -6.664860725402832, "global_step": 116752, "epoch": 2779} {"train_loss": -6.703819274902344, "global_step": 116753, "epoch": 2779} {"train_loss": -6.533243656158447, "global_step": 116754, "epoch": 2779} {"train_loss": -6.680139064788818, "global_step": 116755, "epoch": 2779} {"train_loss": -6.491476058959961, "global_step": 116756, "epoch": 2779} {"train_loss": -6.547976493835449, "global_step": 116757, "epoch": 2779} {"train_loss": -6.578207969665527, "global_step": 116758, "epoch": 2779} {"train_loss": -6.559158302488781, "global_step": 116759, "epoch": 2779, "val_loss": 65491.84765625} {"train_loss": -6.470676422119141, "global_step": 116760, "epoch": 2780} {"train_loss": -6.538273811340332, "global_step": 116761, "epoch": 2780} {"train_loss": -6.356793403625488, "global_step": 116762, "epoch": 2780} {"train_loss": -6.569135665893555, "global_step": 116763, "epoch": 2780} {"train_loss": -6.573474884033203, "global_step": 116764, "epoch": 2780} {"train_loss": -6.497371196746826, "global_step": 116765, "epoch": 2780} {"train_loss": -6.612407684326172, "global_step": 116766, "epoch": 2780} {"train_loss": -6.535006046295166, "global_step": 116767, "epoch": 2780} {"train_loss": -6.472758769989014, "global_step": 116768, "epoch": 2780} {"train_loss": -6.444992542266846, "global_step": 116769, "epoch": 2780} {"train_loss": -6.547338485717773, "global_step": 116770, "epoch": 2780} {"train_loss": -6.648399353027344, "global_step": 116771, "epoch": 2780} {"train_loss": -6.455203056335449, "global_step": 116772, "epoch": 2780} {"train_loss": -6.51019811630249, "global_step": 116773, "epoch": 2780} {"train_loss": -6.548064231872559, "global_step": 116774, "epoch": 2780} {"train_loss": -6.447617530822754, "global_step": 116775, "epoch": 2780} {"train_loss": -6.441249847412109, "global_step": 116776, "epoch": 2780} {"train_loss": -6.403421878814697, "global_step": 116777, "epoch": 2780} {"train_loss": -6.428497791290283, "global_step": 116778, "epoch": 2780} {"train_loss": -6.516356468200684, "global_step": 116779, "epoch": 2780} {"train_loss": -6.517983436584473, "global_step": 116780, "epoch": 2780} {"train_loss": -6.478802680969238, "global_step": 116781, "epoch": 2780} {"train_loss": -6.526738166809082, "global_step": 116782, "epoch": 2780} {"train_loss": -6.527126312255859, "global_step": 116783, "epoch": 2780} {"train_loss": -6.580560684204102, "global_step": 116784, "epoch": 2780} {"train_loss": -6.610898494720459, "global_step": 116785, "epoch": 2780} {"train_loss": -6.472931861877441, "global_step": 116786, "epoch": 2780} {"train_loss": -6.546299934387207, "global_step": 116787, "epoch": 2780} {"train_loss": -6.587201118469238, "global_step": 116788, "epoch": 2780} {"train_loss": -6.41738224029541, "global_step": 116789, "epoch": 2780} {"train_loss": -6.534960746765137, "global_step": 116790, "epoch": 2780} {"train_loss": -6.533010959625244, "global_step": 116791, "epoch": 2780} {"train_loss": -6.61725378036499, "global_step": 116792, "epoch": 2780} {"train_loss": -6.554224014282227, "global_step": 116793, "epoch": 2780} {"train_loss": -6.538134574890137, "global_step": 116794, "epoch": 2780} {"train_loss": -6.570202827453613, "global_step": 116795, "epoch": 2780} {"train_loss": -6.418087959289551, "global_step": 116796, "epoch": 2780} {"train_loss": -6.531695365905762, "global_step": 116797, "epoch": 2780} {"train_loss": -6.539579391479492, "global_step": 116798, "epoch": 2780} {"train_loss": -6.546426773071289, "global_step": 116799, "epoch": 2780} {"train_loss": -6.408979415893555, "global_step": 116800, "epoch": 2780} {"train_loss": -6.510552485783895, "global_step": 116801, "epoch": 2780, "val_loss": 65555.6484375} {"train_loss": -6.601844787597656, "global_step": 116802, "epoch": 2781} {"train_loss": -6.504146099090576, "global_step": 116803, "epoch": 2781} {"train_loss": -6.643182277679443, "global_step": 116804, "epoch": 2781} {"train_loss": -6.462817192077637, "global_step": 116805, "epoch": 2781} {"train_loss": -6.55540657043457, "global_step": 116806, "epoch": 2781} {"train_loss": -6.4489545822143555, "global_step": 116807, "epoch": 2781} {"train_loss": -6.49722957611084, "global_step": 116808, "epoch": 2781} {"train_loss": -6.532141208648682, "global_step": 116809, "epoch": 2781} {"train_loss": -6.586592674255371, "global_step": 116810, "epoch": 2781} {"train_loss": -6.52107048034668, "global_step": 116811, "epoch": 2781} {"train_loss": -6.575018405914307, "global_step": 116812, "epoch": 2781} {"train_loss": -6.53560733795166, "global_step": 116813, "epoch": 2781} {"train_loss": -6.499601364135742, "global_step": 116814, "epoch": 2781} {"train_loss": -6.4809112548828125, "global_step": 116815, "epoch": 2781} {"train_loss": -6.618084907531738, "global_step": 116816, "epoch": 2781} {"train_loss": -6.606368064880371, "global_step": 116817, "epoch": 2781} {"train_loss": -6.588982582092285, "global_step": 116818, "epoch": 2781} {"train_loss": -6.671844005584717, "global_step": 116819, "epoch": 2781} {"train_loss": -6.520680904388428, "global_step": 116820, "epoch": 2781} {"train_loss": -6.617922306060791, "global_step": 116821, "epoch": 2781} {"train_loss": -6.540805816650391, "global_step": 116822, "epoch": 2781} {"train_loss": -6.591935157775879, "global_step": 116823, "epoch": 2781} {"train_loss": -6.518793106079102, "global_step": 116824, "epoch": 2781} {"train_loss": -6.4816718101501465, "global_step": 116825, "epoch": 2781} {"train_loss": -6.558327674865723, "global_step": 116826, "epoch": 2781} {"train_loss": -6.414201736450195, "global_step": 116827, "epoch": 2781} {"train_loss": -6.64884614944458, "global_step": 116828, "epoch": 2781} {"train_loss": -6.434602737426758, "global_step": 116829, "epoch": 2781} {"train_loss": -6.475718021392822, "global_step": 116830, "epoch": 2781} {"train_loss": -6.536762237548828, "global_step": 116831, "epoch": 2781} {"train_loss": -6.4119977951049805, "global_step": 116832, "epoch": 2781} {"train_loss": -6.590920925140381, "global_step": 116833, "epoch": 2781} {"train_loss": -6.423305511474609, "global_step": 116834, "epoch": 2781} {"train_loss": -6.496700286865234, "global_step": 116835, "epoch": 2781} {"train_loss": -6.535611152648926, "global_step": 116836, "epoch": 2781} {"train_loss": -6.528406620025635, "global_step": 116837, "epoch": 2781} {"train_loss": -6.558998107910156, "global_step": 116838, "epoch": 2781} {"train_loss": -6.492578983306885, "global_step": 116839, "epoch": 2781} {"train_loss": -6.473817348480225, "global_step": 116840, "epoch": 2781} {"train_loss": -6.349466800689697, "global_step": 116841, "epoch": 2781} {"train_loss": -6.418458461761475, "global_step": 116842, "epoch": 2781} {"train_loss": -6.523501895722889, "global_step": 116843, "epoch": 2781, "val_loss": 65425.98046875} {"train_loss": -6.534137725830078, "global_step": 116844, "epoch": 2782} {"train_loss": -6.5527238845825195, "global_step": 116845, "epoch": 2782} {"train_loss": -6.610782623291016, "global_step": 116846, "epoch": 2782} {"train_loss": -6.469815254211426, "global_step": 116847, "epoch": 2782} {"train_loss": -6.418413162231445, "global_step": 116848, "epoch": 2782} {"train_loss": -6.4944891929626465, "global_step": 116849, "epoch": 2782} {"train_loss": -6.601667404174805, "global_step": 116850, "epoch": 2782} {"train_loss": -6.4960174560546875, "global_step": 116851, "epoch": 2782} {"train_loss": -6.519968032836914, "global_step": 116852, "epoch": 2782} {"train_loss": -6.485988616943359, "global_step": 116853, "epoch": 2782} {"train_loss": -6.413176536560059, "global_step": 116854, "epoch": 2782} {"train_loss": -6.552130699157715, "global_step": 116855, "epoch": 2782} {"train_loss": -6.498409748077393, "global_step": 116856, "epoch": 2782} {"train_loss": -6.5362019538879395, "global_step": 116857, "epoch": 2782} {"train_loss": -6.527168273925781, "global_step": 116858, "epoch": 2782} {"train_loss": -6.501254081726074, "global_step": 116859, "epoch": 2782} {"train_loss": -6.411497592926025, "global_step": 116860, "epoch": 2782} {"train_loss": -6.514636993408203, "global_step": 116861, "epoch": 2782} {"train_loss": -6.476980209350586, "global_step": 116862, "epoch": 2782} {"train_loss": -6.429230690002441, "global_step": 116863, "epoch": 2782} {"train_loss": -6.545512676239014, "global_step": 116864, "epoch": 2782} {"train_loss": -6.522929668426514, "global_step": 116865, "epoch": 2782} {"train_loss": -6.511360168457031, "global_step": 116866, "epoch": 2782} {"train_loss": -6.456528663635254, "global_step": 116867, "epoch": 2782} {"train_loss": -6.527011871337891, "global_step": 116868, "epoch": 2782} {"train_loss": -6.652876853942871, "global_step": 116869, "epoch": 2782} {"train_loss": -6.414987087249756, "global_step": 116870, "epoch": 2782} {"train_loss": -6.585320472717285, "global_step": 116871, "epoch": 2782} {"train_loss": -6.651459693908691, "global_step": 116872, "epoch": 2782} {"train_loss": -6.59609317779541, "global_step": 116873, "epoch": 2782} {"train_loss": -6.559543609619141, "global_step": 116874, "epoch": 2782} {"train_loss": -6.575710296630859, "global_step": 116875, "epoch": 2782} {"train_loss": -6.592222213745117, "global_step": 116876, "epoch": 2782} {"train_loss": -6.453739166259766, "global_step": 116877, "epoch": 2782} {"train_loss": -6.5129289627075195, "global_step": 116878, "epoch": 2782} {"train_loss": -6.528511047363281, "global_step": 116879, "epoch": 2782} {"train_loss": -6.56193208694458, "global_step": 116880, "epoch": 2782} {"train_loss": -6.518939018249512, "global_step": 116881, "epoch": 2782} {"train_loss": -6.494791030883789, "global_step": 116882, "epoch": 2782} {"train_loss": -6.504858493804932, "global_step": 116883, "epoch": 2782} {"train_loss": -6.6246490478515625, "global_step": 116884, "epoch": 2782} {"train_loss": -6.522108305068243, "global_step": 116885, "epoch": 2782, "val_loss": 65604.9921875} {"train_loss": -6.559980869293213, "global_step": 116886, "epoch": 2783} {"train_loss": -6.4718804359436035, "global_step": 116887, "epoch": 2783} {"train_loss": -6.641496181488037, "global_step": 116888, "epoch": 2783} {"train_loss": -6.5572381019592285, "global_step": 116889, "epoch": 2783} {"train_loss": -6.637362003326416, "global_step": 116890, "epoch": 2783} {"train_loss": -6.589079856872559, "global_step": 116891, "epoch": 2783} {"train_loss": -6.479637145996094, "global_step": 116892, "epoch": 2783} {"train_loss": -6.537020683288574, "global_step": 116893, "epoch": 2783} {"train_loss": -6.554411888122559, "global_step": 116894, "epoch": 2783} {"train_loss": -6.518205165863037, "global_step": 116895, "epoch": 2783} {"train_loss": -6.524181842803955, "global_step": 116896, "epoch": 2783} {"train_loss": -6.5132155418396, "global_step": 116897, "epoch": 2783} {"train_loss": -6.605109214782715, "global_step": 116898, "epoch": 2783} {"train_loss": -6.608470916748047, "global_step": 116899, "epoch": 2783} {"train_loss": -6.53741979598999, "global_step": 116900, "epoch": 2783} {"train_loss": -6.553824424743652, "global_step": 116901, "epoch": 2783} {"train_loss": -6.635529518127441, "global_step": 116902, "epoch": 2783} {"train_loss": -6.514398097991943, "global_step": 116903, "epoch": 2783} {"train_loss": -6.380004405975342, "global_step": 116904, "epoch": 2783} {"train_loss": -6.645962715148926, "global_step": 116905, "epoch": 2783} {"train_loss": -6.425290107727051, "global_step": 116906, "epoch": 2783} {"train_loss": -6.431976318359375, "global_step": 116907, "epoch": 2783} {"train_loss": -6.577058792114258, "global_step": 116908, "epoch": 2783} {"train_loss": -6.46807336807251, "global_step": 116909, "epoch": 2783} {"train_loss": -6.430299758911133, "global_step": 116910, "epoch": 2783} {"train_loss": -6.596747398376465, "global_step": 116911, "epoch": 2783} {"train_loss": -6.53490686416626, "global_step": 116912, "epoch": 2783} {"train_loss": -6.496643543243408, "global_step": 116913, "epoch": 2783} {"train_loss": -6.577498435974121, "global_step": 116914, "epoch": 2783} {"train_loss": -6.524711608886719, "global_step": 116915, "epoch": 2783} {"train_loss": -6.608860969543457, "global_step": 116916, "epoch": 2783} {"train_loss": -6.449967384338379, "global_step": 116917, "epoch": 2783} {"train_loss": -6.519052505493164, "global_step": 116918, "epoch": 2783} {"train_loss": -6.673988342285156, "global_step": 116919, "epoch": 2783} {"train_loss": -6.431486129760742, "global_step": 116920, "epoch": 2783} {"train_loss": -6.535674571990967, "global_step": 116921, "epoch": 2783} {"train_loss": -6.511722087860107, "global_step": 116922, "epoch": 2783} {"train_loss": -6.449869155883789, "global_step": 116923, "epoch": 2783} {"train_loss": -6.5315117835998535, "global_step": 116924, "epoch": 2783} {"train_loss": -6.465183258056641, "global_step": 116925, "epoch": 2783} {"train_loss": -6.59658145904541, "global_step": 116926, "epoch": 2783} {"train_loss": -6.533780222847348, "global_step": 116927, "epoch": 2783, "val_loss": 65689.2578125} {"train_loss": -6.5506181716918945, "global_step": 116928, "epoch": 2784} {"train_loss": -6.49479866027832, "global_step": 116929, "epoch": 2784} {"train_loss": -6.4416937828063965, "global_step": 116930, "epoch": 2784} {"train_loss": -6.679925918579102, "global_step": 116931, "epoch": 2784} {"train_loss": -6.483109951019287, "global_step": 116932, "epoch": 2784} {"train_loss": -6.578958511352539, "global_step": 116933, "epoch": 2784} {"train_loss": -6.6822509765625, "global_step": 116934, "epoch": 2784} {"train_loss": -6.566950798034668, "global_step": 116935, "epoch": 2784} {"train_loss": -6.507288932800293, "global_step": 116936, "epoch": 2784} {"train_loss": -6.515742778778076, "global_step": 116937, "epoch": 2784} {"train_loss": -6.561276912689209, "global_step": 116938, "epoch": 2784} {"train_loss": -6.6149067878723145, "global_step": 116939, "epoch": 2784} {"train_loss": -6.488942623138428, "global_step": 116940, "epoch": 2784} {"train_loss": -6.62172794342041, "global_step": 116941, "epoch": 2784} {"train_loss": -6.5721635818481445, "global_step": 116942, "epoch": 2784} {"train_loss": -6.6219353675842285, "global_step": 116943, "epoch": 2784} {"train_loss": -6.545901298522949, "global_step": 116944, "epoch": 2784} {"train_loss": -6.574674606323242, "global_step": 116945, "epoch": 2784} {"train_loss": -6.56752872467041, "global_step": 116946, "epoch": 2784} {"train_loss": -6.495136737823486, "global_step": 116947, "epoch": 2784} {"train_loss": -6.60704231262207, "global_step": 116948, "epoch": 2784} {"train_loss": -6.610015869140625, "global_step": 116949, "epoch": 2784} {"train_loss": -6.559392929077148, "global_step": 116950, "epoch": 2784} {"train_loss": -6.500424861907959, "global_step": 116951, "epoch": 2784} {"train_loss": -6.440366744995117, "global_step": 116952, "epoch": 2784} {"train_loss": -6.492618560791016, "global_step": 116953, "epoch": 2784} {"train_loss": -6.616284370422363, "global_step": 116954, "epoch": 2784} {"train_loss": -6.599120140075684, "global_step": 116955, "epoch": 2784} {"train_loss": -6.583468914031982, "global_step": 116956, "epoch": 2784} {"train_loss": -6.504343032836914, "global_step": 116957, "epoch": 2784} {"train_loss": -6.519007682800293, "global_step": 116958, "epoch": 2784} {"train_loss": -6.464603900909424, "global_step": 116959, "epoch": 2784} {"train_loss": -6.555605888366699, "global_step": 116960, "epoch": 2784} {"train_loss": -6.553960800170898, "global_step": 116961, "epoch": 2784} {"train_loss": -6.5531110763549805, "global_step": 116962, "epoch": 2784} {"train_loss": -6.542825222015381, "global_step": 116963, "epoch": 2784} {"train_loss": -6.51503849029541, "global_step": 116964, "epoch": 2784} {"train_loss": -6.5399885177612305, "global_step": 116965, "epoch": 2784} {"train_loss": -6.559990406036377, "global_step": 116966, "epoch": 2784} {"train_loss": -6.601094722747803, "global_step": 116967, "epoch": 2784} {"train_loss": -6.475603103637695, "global_step": 116968, "epoch": 2784} {"train_loss": -6.5522258168175105, "global_step": 116969, "epoch": 2784, "val_loss": 65364.1328125} {"train_loss": -6.5434722900390625, "global_step": 116970, "epoch": 2785} {"train_loss": -6.481381416320801, "global_step": 116971, "epoch": 2785} {"train_loss": -6.6957268714904785, "global_step": 116972, "epoch": 2785} {"train_loss": -6.486940383911133, "global_step": 116973, "epoch": 2785} {"train_loss": -6.507686614990234, "global_step": 116974, "epoch": 2785} {"train_loss": -6.693509578704834, "global_step": 116975, "epoch": 2785} {"train_loss": -6.645377159118652, "global_step": 116976, "epoch": 2785} {"train_loss": -6.571662902832031, "global_step": 116977, "epoch": 2785} {"train_loss": -6.59533166885376, "global_step": 116978, "epoch": 2785} {"train_loss": -6.497365951538086, "global_step": 116979, "epoch": 2785} {"train_loss": -6.499863624572754, "global_step": 116980, "epoch": 2785} {"train_loss": -6.4526472091674805, "global_step": 116981, "epoch": 2785} {"train_loss": -6.60392427444458, "global_step": 116982, "epoch": 2785} {"train_loss": -6.380486488342285, "global_step": 116983, "epoch": 2785} {"train_loss": -6.3028130531311035, "global_step": 116984, "epoch": 2785} {"train_loss": -6.488776206970215, "global_step": 116985, "epoch": 2785} {"train_loss": -6.348391056060791, "global_step": 116986, "epoch": 2785} {"train_loss": -6.457653999328613, "global_step": 116987, "epoch": 2785} {"train_loss": -6.494132041931152, "global_step": 116988, "epoch": 2785} {"train_loss": -6.50677490234375, "global_step": 116989, "epoch": 2785} {"train_loss": -6.491746425628662, "global_step": 116990, "epoch": 2785} {"train_loss": -6.550858020782471, "global_step": 116991, "epoch": 2785} {"train_loss": -6.524840831756592, "global_step": 116992, "epoch": 2785} {"train_loss": -6.500604629516602, "global_step": 116993, "epoch": 2785} {"train_loss": -6.570339679718018, "global_step": 116994, "epoch": 2785} {"train_loss": -6.434863567352295, "global_step": 116995, "epoch": 2785} {"train_loss": -6.516989707946777, "global_step": 116996, "epoch": 2785} {"train_loss": -6.5159831047058105, "global_step": 116997, "epoch": 2785} {"train_loss": -6.553130149841309, "global_step": 116998, "epoch": 2785} {"train_loss": -6.402083396911621, "global_step": 116999, "epoch": 2785} {"train_loss": -6.510775089263916, "global_step": 117000, "epoch": 2785} {"train_loss": -6.492579936981201, "global_step": 117001, "epoch": 2785} {"train_loss": -6.475408554077148, "global_step": 117002, "epoch": 2785} {"train_loss": -6.622642517089844, "global_step": 117003, "epoch": 2785} {"train_loss": -6.422088623046875, "global_step": 117004, "epoch": 2785} {"train_loss": -6.593562126159668, "global_step": 117005, "epoch": 2785} {"train_loss": -6.562124252319336, "global_step": 117006, "epoch": 2785} {"train_loss": -6.484531402587891, "global_step": 117007, "epoch": 2785} {"train_loss": -6.528903007507324, "global_step": 117008, "epoch": 2785} {"train_loss": -6.585733413696289, "global_step": 117009, "epoch": 2785} {"train_loss": -6.450581073760986, "global_step": 117010, "epoch": 2785} {"train_loss": -6.51365369842166, "global_step": 117011, "epoch": 2785, "val_loss": 65518.93359375} {"train_loss": -6.477499008178711, "global_step": 117012, "epoch": 2786} {"train_loss": -6.625786781311035, "global_step": 117013, "epoch": 2786} {"train_loss": -6.693023681640625, "global_step": 117014, "epoch": 2786} {"train_loss": -6.542872905731201, "global_step": 117015, "epoch": 2786} {"train_loss": -6.586630344390869, "global_step": 117016, "epoch": 2786} {"train_loss": -6.523581504821777, "global_step": 117017, "epoch": 2786} {"train_loss": -6.5455322265625, "global_step": 117018, "epoch": 2786} {"train_loss": -6.619616508483887, "global_step": 117019, "epoch": 2786} {"train_loss": -6.551174163818359, "global_step": 117020, "epoch": 2786} {"train_loss": -6.599358558654785, "global_step": 117021, "epoch": 2786} {"train_loss": -6.587719440460205, "global_step": 117022, "epoch": 2786} {"train_loss": -6.559839248657227, "global_step": 117023, "epoch": 2786} {"train_loss": -6.587777137756348, "global_step": 117024, "epoch": 2786} {"train_loss": -6.568232536315918, "global_step": 117025, "epoch": 2786} {"train_loss": -6.5059661865234375, "global_step": 117026, "epoch": 2786} {"train_loss": -6.577534198760986, "global_step": 117027, "epoch": 2786} {"train_loss": -6.389688968658447, "global_step": 117028, "epoch": 2786} {"train_loss": -6.649285316467285, "global_step": 117029, "epoch": 2786} {"train_loss": -6.571869850158691, "global_step": 117030, "epoch": 2786} {"train_loss": -6.55183219909668, "global_step": 117031, "epoch": 2786} {"train_loss": -6.540624618530273, "global_step": 117032, "epoch": 2786} {"train_loss": -6.618305206298828, "global_step": 117033, "epoch": 2786} {"train_loss": -6.47898006439209, "global_step": 117034, "epoch": 2786} {"train_loss": -6.55338716506958, "global_step": 117035, "epoch": 2786} {"train_loss": -6.528739929199219, "global_step": 117036, "epoch": 2786} {"train_loss": -6.563189506530762, "global_step": 117037, "epoch": 2786} {"train_loss": -6.451303958892822, "global_step": 117038, "epoch": 2786} {"train_loss": -6.554512023925781, "global_step": 117039, "epoch": 2786} {"train_loss": -6.586637496948242, "global_step": 117040, "epoch": 2786} {"train_loss": -6.585397720336914, "global_step": 117041, "epoch": 2786} {"train_loss": -6.54606819152832, "global_step": 117042, "epoch": 2786} {"train_loss": -6.449644088745117, "global_step": 117043, "epoch": 2786} {"train_loss": -6.597251892089844, "global_step": 117044, "epoch": 2786} {"train_loss": -6.576158046722412, "global_step": 117045, "epoch": 2786} {"train_loss": -6.515625, "global_step": 117046, "epoch": 2786} {"train_loss": -6.562910079956055, "global_step": 117047, "epoch": 2786} {"train_loss": -6.537142753601074, "global_step": 117048, "epoch": 2786} {"train_loss": -6.478339195251465, "global_step": 117049, "epoch": 2786} {"train_loss": -6.480391979217529, "global_step": 117050, "epoch": 2786} {"train_loss": -6.583275318145752, "global_step": 117051, "epoch": 2786} {"train_loss": -6.534600734710693, "global_step": 117052, "epoch": 2786} {"train_loss": -6.550522043591454, "global_step": 117053, "epoch": 2786, "val_loss": 65338.62890625} {"train_loss": -6.6232099533081055, "global_step": 117054, "epoch": 2787} {"train_loss": -6.473020076751709, "global_step": 117055, "epoch": 2787} {"train_loss": -6.5405988693237305, "global_step": 117056, "epoch": 2787} {"train_loss": -6.588256359100342, "global_step": 117057, "epoch": 2787} {"train_loss": -6.551230430603027, "global_step": 117058, "epoch": 2787} {"train_loss": -6.480597019195557, "global_step": 117059, "epoch": 2787} {"train_loss": -6.4889984130859375, "global_step": 117060, "epoch": 2787} {"train_loss": -6.552029609680176, "global_step": 117061, "epoch": 2787} {"train_loss": -6.451306343078613, "global_step": 117062, "epoch": 2787} {"train_loss": -6.405831813812256, "global_step": 117063, "epoch": 2787} {"train_loss": -6.370054244995117, "global_step": 117064, "epoch": 2787} {"train_loss": -6.485024452209473, "global_step": 117065, "epoch": 2787} {"train_loss": -6.470231056213379, "global_step": 117066, "epoch": 2787} {"train_loss": -6.415289878845215, "global_step": 117067, "epoch": 2787} {"train_loss": -6.562841892242432, "global_step": 117068, "epoch": 2787} {"train_loss": -6.534956455230713, "global_step": 117069, "epoch": 2787} {"train_loss": -6.505235195159912, "global_step": 117070, "epoch": 2787} {"train_loss": -6.478976249694824, "global_step": 117071, "epoch": 2787} {"train_loss": -6.453601837158203, "global_step": 117072, "epoch": 2787} {"train_loss": -6.380715847015381, "global_step": 117073, "epoch": 2787} {"train_loss": -6.53626823425293, "global_step": 117074, "epoch": 2787} {"train_loss": -6.524524688720703, "global_step": 117075, "epoch": 2787} {"train_loss": -6.574408531188965, "global_step": 117076, "epoch": 2787} {"train_loss": -6.564199447631836, "global_step": 117077, "epoch": 2787} {"train_loss": -6.494043350219727, "global_step": 117078, "epoch": 2787} {"train_loss": -6.508169174194336, "global_step": 117079, "epoch": 2787} {"train_loss": -6.510959625244141, "global_step": 117080, "epoch": 2787} {"train_loss": -6.498341083526611, "global_step": 117081, "epoch": 2787} {"train_loss": -6.523026466369629, "global_step": 117082, "epoch": 2787} {"train_loss": -6.60420036315918, "global_step": 117083, "epoch": 2787} {"train_loss": -6.5016984939575195, "global_step": 117084, "epoch": 2787} {"train_loss": -6.619717597961426, "global_step": 117085, "epoch": 2787} {"train_loss": -6.4368696212768555, "global_step": 117086, "epoch": 2787} {"train_loss": -6.540417671203613, "global_step": 117087, "epoch": 2787} {"train_loss": -6.547771453857422, "global_step": 117088, "epoch": 2787} {"train_loss": -6.589930534362793, "global_step": 117089, "epoch": 2787} {"train_loss": -6.46381950378418, "global_step": 117090, "epoch": 2787} {"train_loss": -6.450259208679199, "global_step": 117091, "epoch": 2787} {"train_loss": -6.556123733520508, "global_step": 117092, "epoch": 2787} {"train_loss": -6.3716511726379395, "global_step": 117093, "epoch": 2787} {"train_loss": -6.392789363861084, "global_step": 117094, "epoch": 2787} {"train_loss": -6.503460032599313, "global_step": 117095, "epoch": 2787, "val_loss": 65604.8515625} {"train_loss": -6.593975067138672, "global_step": 117096, "epoch": 2788} {"train_loss": -6.490307331085205, "global_step": 117097, "epoch": 2788} {"train_loss": -6.413725852966309, "global_step": 117098, "epoch": 2788} {"train_loss": -6.624758720397949, "global_step": 117099, "epoch": 2788} {"train_loss": -6.495540618896484, "global_step": 117100, "epoch": 2788} {"train_loss": -6.5351762771606445, "global_step": 117101, "epoch": 2788} {"train_loss": -6.544459342956543, "global_step": 117102, "epoch": 2788} {"train_loss": -6.490223407745361, "global_step": 117103, "epoch": 2788} {"train_loss": -6.471738338470459, "global_step": 117104, "epoch": 2788} {"train_loss": -6.538574695587158, "global_step": 117105, "epoch": 2788} {"train_loss": -6.549744129180908, "global_step": 117106, "epoch": 2788} {"train_loss": -6.552570343017578, "global_step": 117107, "epoch": 2788} {"train_loss": -6.427327632904053, "global_step": 117108, "epoch": 2788} {"train_loss": -6.574928283691406, "global_step": 117109, "epoch": 2788} {"train_loss": -6.489221572875977, "global_step": 117110, "epoch": 2788} {"train_loss": -6.5305328369140625, "global_step": 117111, "epoch": 2788} {"train_loss": -6.458306789398193, "global_step": 117112, "epoch": 2788} {"train_loss": -6.490167617797852, "global_step": 117113, "epoch": 2788} {"train_loss": -6.563973903656006, "global_step": 117114, "epoch": 2788} {"train_loss": -6.606105804443359, "global_step": 117115, "epoch": 2788} {"train_loss": -6.560457706451416, "global_step": 117116, "epoch": 2788} {"train_loss": -6.426164627075195, "global_step": 117117, "epoch": 2788} {"train_loss": -6.494002342224121, "global_step": 117118, "epoch": 2788} {"train_loss": -6.609438896179199, "global_step": 117119, "epoch": 2788} {"train_loss": -6.542228698730469, "global_step": 117120, "epoch": 2788} {"train_loss": -6.406253337860107, "global_step": 117121, "epoch": 2788} {"train_loss": -6.53184700012207, "global_step": 117122, "epoch": 2788} {"train_loss": -6.513195514678955, "global_step": 117123, "epoch": 2788} {"train_loss": -6.455524444580078, "global_step": 117124, "epoch": 2788} {"train_loss": -6.529684543609619, "global_step": 117125, "epoch": 2788} {"train_loss": -6.546336650848389, "global_step": 117126, "epoch": 2788} {"train_loss": -6.3580827713012695, "global_step": 117127, "epoch": 2788} {"train_loss": -6.487234115600586, "global_step": 117128, "epoch": 2788} {"train_loss": -6.491100788116455, "global_step": 117129, "epoch": 2788} {"train_loss": -6.518933296203613, "global_step": 117130, "epoch": 2788} {"train_loss": -6.648439407348633, "global_step": 117131, "epoch": 2788} {"train_loss": -6.5801167488098145, "global_step": 117132, "epoch": 2788} {"train_loss": -6.495965003967285, "global_step": 117133, "epoch": 2788} {"train_loss": -6.581568241119385, "global_step": 117134, "epoch": 2788} {"train_loss": -6.580343246459961, "global_step": 117135, "epoch": 2788} {"train_loss": -6.618557929992676, "global_step": 117136, "epoch": 2788} {"train_loss": -6.5234860352107455, "global_step": 117137, "epoch": 2788, "val_loss": 65417.8125} {"train_loss": -6.575099468231201, "global_step": 117138, "epoch": 2789} {"train_loss": -6.60587215423584, "global_step": 117139, "epoch": 2789} {"train_loss": -6.574353218078613, "global_step": 117140, "epoch": 2789} {"train_loss": -6.657513618469238, "global_step": 117141, "epoch": 2789} {"train_loss": -6.519598007202148, "global_step": 117142, "epoch": 2789} {"train_loss": -6.531360626220703, "global_step": 117143, "epoch": 2789} {"train_loss": -6.470340728759766, "global_step": 117144, "epoch": 2789} {"train_loss": -6.485789775848389, "global_step": 117145, "epoch": 2789} {"train_loss": -6.57041072845459, "global_step": 117146, "epoch": 2789} {"train_loss": -6.462444305419922, "global_step": 117147, "epoch": 2789} {"train_loss": -6.526523590087891, "global_step": 117148, "epoch": 2789} {"train_loss": -6.6313252449035645, "global_step": 117149, "epoch": 2789} {"train_loss": -6.604349136352539, "global_step": 117150, "epoch": 2789} {"train_loss": -6.6272196769714355, "global_step": 117151, "epoch": 2789} {"train_loss": -6.524499416351318, "global_step": 117152, "epoch": 2789} {"train_loss": -6.591766357421875, "global_step": 117153, "epoch": 2789} {"train_loss": -6.573960304260254, "global_step": 117154, "epoch": 2789} {"train_loss": -6.5762224197387695, "global_step": 117155, "epoch": 2789} {"train_loss": -6.673030853271484, "global_step": 117156, "epoch": 2789} {"train_loss": -6.425729751586914, "global_step": 117157, "epoch": 2789} {"train_loss": -6.605198383331299, "global_step": 117158, "epoch": 2789} {"train_loss": -6.523633003234863, "global_step": 117159, "epoch": 2789} {"train_loss": -6.549917221069336, "global_step": 117160, "epoch": 2789} {"train_loss": -6.480878829956055, "global_step": 117161, "epoch": 2789} {"train_loss": -6.453188896179199, "global_step": 117162, "epoch": 2789} {"train_loss": -6.404722213745117, "global_step": 117163, "epoch": 2789} {"train_loss": -6.562690734863281, "global_step": 117164, "epoch": 2789} {"train_loss": -6.387630462646484, "global_step": 117165, "epoch": 2789} {"train_loss": -6.507589340209961, "global_step": 117166, "epoch": 2789} {"train_loss": -6.48176383972168, "global_step": 117167, "epoch": 2789} {"train_loss": -6.590867519378662, "global_step": 117168, "epoch": 2789} {"train_loss": -6.542263031005859, "global_step": 117169, "epoch": 2789} {"train_loss": -6.493899345397949, "global_step": 117170, "epoch": 2789} {"train_loss": -6.50990104675293, "global_step": 117171, "epoch": 2789} {"train_loss": -6.4422101974487305, "global_step": 117172, "epoch": 2789} {"train_loss": -6.389557838439941, "global_step": 117173, "epoch": 2789} {"train_loss": -6.5263566970825195, "global_step": 117174, "epoch": 2789} {"train_loss": -6.554490089416504, "global_step": 117175, "epoch": 2789} {"train_loss": -6.582960605621338, "global_step": 117176, "epoch": 2789} {"train_loss": -6.5447492599487305, "global_step": 117177, "epoch": 2789} {"train_loss": -6.55250358581543, "global_step": 117178, "epoch": 2789} {"train_loss": -6.536184901282901, "global_step": 117179, "epoch": 2789, "val_loss": 65523.08203125} {"train_loss": -6.494603157043457, "global_step": 117180, "epoch": 2790} {"train_loss": -6.413867473602295, "global_step": 117181, "epoch": 2790} {"train_loss": -6.563023567199707, "global_step": 117182, "epoch": 2790} {"train_loss": -6.548326015472412, "global_step": 117183, "epoch": 2790} {"train_loss": -6.614752769470215, "global_step": 117184, "epoch": 2790} {"train_loss": -6.446630477905273, "global_step": 117185, "epoch": 2790} {"train_loss": -6.482501029968262, "global_step": 117186, "epoch": 2790} {"train_loss": -6.608983516693115, "global_step": 117187, "epoch": 2790} {"train_loss": -6.489388465881348, "global_step": 117188, "epoch": 2790} {"train_loss": -6.568530559539795, "global_step": 117189, "epoch": 2790} {"train_loss": -6.574336051940918, "global_step": 117190, "epoch": 2790} {"train_loss": -6.555689811706543, "global_step": 117191, "epoch": 2790} {"train_loss": -6.594843864440918, "global_step": 117192, "epoch": 2790} {"train_loss": -6.623578071594238, "global_step": 117193, "epoch": 2790} {"train_loss": -6.591466903686523, "global_step": 117194, "epoch": 2790} {"train_loss": -6.420283317565918, "global_step": 117195, "epoch": 2790} {"train_loss": -6.602987289428711, "global_step": 117196, "epoch": 2790} {"train_loss": -6.477071762084961, "global_step": 117197, "epoch": 2790} {"train_loss": -6.6473846435546875, "global_step": 117198, "epoch": 2790} {"train_loss": -6.479134559631348, "global_step": 117199, "epoch": 2790} {"train_loss": -6.619447708129883, "global_step": 117200, "epoch": 2790} {"train_loss": -6.689224720001221, "global_step": 117201, "epoch": 2790} {"train_loss": -6.504694938659668, "global_step": 117202, "epoch": 2790} {"train_loss": -6.534200668334961, "global_step": 117203, "epoch": 2790} {"train_loss": -6.595441818237305, "global_step": 117204, "epoch": 2790} {"train_loss": -6.419872283935547, "global_step": 117205, "epoch": 2790} {"train_loss": -6.5974578857421875, "global_step": 117206, "epoch": 2790} {"train_loss": -6.555400848388672, "global_step": 117207, "epoch": 2790} {"train_loss": -6.538787841796875, "global_step": 117208, "epoch": 2790} {"train_loss": -6.521778106689453, "global_step": 117209, "epoch": 2790} {"train_loss": -6.528820037841797, "global_step": 117210, "epoch": 2790} {"train_loss": -6.535764217376709, "global_step": 117211, "epoch": 2790} {"train_loss": -6.577153205871582, "global_step": 117212, "epoch": 2790} {"train_loss": -6.620905876159668, "global_step": 117213, "epoch": 2790} {"train_loss": -6.603819370269775, "global_step": 117214, "epoch": 2790} {"train_loss": -6.610085487365723, "global_step": 117215, "epoch": 2790} {"train_loss": -6.541017055511475, "global_step": 117216, "epoch": 2790} {"train_loss": -6.623988151550293, "global_step": 117217, "epoch": 2790} {"train_loss": -6.557148456573486, "global_step": 117218, "epoch": 2790} {"train_loss": -6.514895915985107, "global_step": 117219, "epoch": 2790} {"train_loss": -6.511387825012207, "global_step": 117220, "epoch": 2790} {"train_loss": -6.549820343653361, "global_step": 117221, "epoch": 2790, "val_loss": 65398.27734375} {"train_loss": -6.482793807983398, "global_step": 117222, "epoch": 2791} {"train_loss": -6.5786027908325195, "global_step": 117223, "epoch": 2791} {"train_loss": -6.511900424957275, "global_step": 117224, "epoch": 2791} {"train_loss": -6.5662994384765625, "global_step": 117225, "epoch": 2791} {"train_loss": -6.464091777801514, "global_step": 117226, "epoch": 2791} {"train_loss": -6.573661804199219, "global_step": 117227, "epoch": 2791} {"train_loss": -6.558547496795654, "global_step": 117228, "epoch": 2791} {"train_loss": -6.536165237426758, "global_step": 117229, "epoch": 2791} {"train_loss": -6.544294357299805, "global_step": 117230, "epoch": 2791} {"train_loss": -6.623603820800781, "global_step": 117231, "epoch": 2791} {"train_loss": -6.505125045776367, "global_step": 117232, "epoch": 2791} {"train_loss": -6.477025985717773, "global_step": 117233, "epoch": 2791} {"train_loss": -6.6361188888549805, "global_step": 117234, "epoch": 2791} {"train_loss": -6.639026641845703, "global_step": 117235, "epoch": 2791} {"train_loss": -6.45979118347168, "global_step": 117236, "epoch": 2791} {"train_loss": -6.561821937561035, "global_step": 117237, "epoch": 2791} {"train_loss": -6.484707355499268, "global_step": 117238, "epoch": 2791} {"train_loss": -6.529934883117676, "global_step": 117239, "epoch": 2791} {"train_loss": -6.6290459632873535, "global_step": 117240, "epoch": 2791} {"train_loss": -6.391329765319824, "global_step": 117241, "epoch": 2791} {"train_loss": -6.520740509033203, "global_step": 117242, "epoch": 2791} {"train_loss": -6.474111557006836, "global_step": 117243, "epoch": 2791} {"train_loss": -6.511312484741211, "global_step": 117244, "epoch": 2791} {"train_loss": -6.652754783630371, "global_step": 117245, "epoch": 2791} {"train_loss": -6.653027534484863, "global_step": 117246, "epoch": 2791} {"train_loss": -6.559931755065918, "global_step": 117247, "epoch": 2791} {"train_loss": -6.458929538726807, "global_step": 117248, "epoch": 2791} {"train_loss": -6.453173637390137, "global_step": 117249, "epoch": 2791} {"train_loss": -6.547325134277344, "global_step": 117250, "epoch": 2791} {"train_loss": -6.534341335296631, "global_step": 117251, "epoch": 2791} {"train_loss": -6.4975433349609375, "global_step": 117252, "epoch": 2791} {"train_loss": -6.568991184234619, "global_step": 117253, "epoch": 2791} {"train_loss": -6.44897985458374, "global_step": 117254, "epoch": 2791} {"train_loss": -6.538658618927002, "global_step": 117255, "epoch": 2791} {"train_loss": -6.4395952224731445, "global_step": 117256, "epoch": 2791} {"train_loss": -6.564345359802246, "global_step": 117257, "epoch": 2791} {"train_loss": -6.5396013259887695, "global_step": 117258, "epoch": 2791} {"train_loss": -6.55927848815918, "global_step": 117259, "epoch": 2791} {"train_loss": -6.549799919128418, "global_step": 117260, "epoch": 2791} {"train_loss": -6.500184059143066, "global_step": 117261, "epoch": 2791} {"train_loss": -6.574079513549805, "global_step": 117262, "epoch": 2791} {"train_loss": -6.532526038941883, "global_step": 117263, "epoch": 2791, "val_loss": 65460.91015625} {"train_loss": -6.395194053649902, "global_step": 117264, "epoch": 2792} {"train_loss": -6.589803695678711, "global_step": 117265, "epoch": 2792} {"train_loss": -6.5063371658325195, "global_step": 117266, "epoch": 2792} {"train_loss": -6.502397537231445, "global_step": 117267, "epoch": 2792} {"train_loss": -6.688372611999512, "global_step": 117268, "epoch": 2792} {"train_loss": -6.611250877380371, "global_step": 117269, "epoch": 2792} {"train_loss": -6.574126243591309, "global_step": 117270, "epoch": 2792} {"train_loss": -6.422372817993164, "global_step": 117271, "epoch": 2792} {"train_loss": -6.479646682739258, "global_step": 117272, "epoch": 2792} {"train_loss": -6.484227180480957, "global_step": 117273, "epoch": 2792} {"train_loss": -6.457146167755127, "global_step": 117274, "epoch": 2792} {"train_loss": -6.571949005126953, "global_step": 117275, "epoch": 2792} {"train_loss": -6.536614894866943, "global_step": 117276, "epoch": 2792} {"train_loss": -6.5732221603393555, "global_step": 117277, "epoch": 2792} {"train_loss": -6.577767372131348, "global_step": 117278, "epoch": 2792} {"train_loss": -6.555229187011719, "global_step": 117279, "epoch": 2792} {"train_loss": -6.582304000854492, "global_step": 117280, "epoch": 2792} {"train_loss": -6.595646858215332, "global_step": 117281, "epoch": 2792} {"train_loss": -6.5126261711120605, "global_step": 117282, "epoch": 2792} {"train_loss": -6.519758224487305, "global_step": 117283, "epoch": 2792} {"train_loss": -6.532555103302002, "global_step": 117284, "epoch": 2792} {"train_loss": -6.567501068115234, "global_step": 117285, "epoch": 2792} {"train_loss": -6.583198547363281, "global_step": 117286, "epoch": 2792} {"train_loss": -6.585145950317383, "global_step": 117287, "epoch": 2792} {"train_loss": -6.614533424377441, "global_step": 117288, "epoch": 2792} {"train_loss": -6.563356876373291, "global_step": 117289, "epoch": 2792} {"train_loss": -6.4155120849609375, "global_step": 117290, "epoch": 2792} {"train_loss": -6.598188400268555, "global_step": 117291, "epoch": 2792} {"train_loss": -6.669981956481934, "global_step": 117292, "epoch": 2792} {"train_loss": -6.56093168258667, "global_step": 117293, "epoch": 2792} {"train_loss": -6.612518310546875, "global_step": 117294, "epoch": 2792} {"train_loss": -6.703112602233887, "global_step": 117295, "epoch": 2792} {"train_loss": -6.5657429695129395, "global_step": 117296, "epoch": 2792} {"train_loss": -6.588370323181152, "global_step": 117297, "epoch": 2792} {"train_loss": -6.48377799987793, "global_step": 117298, "epoch": 2792} {"train_loss": -6.533059120178223, "global_step": 117299, "epoch": 2792} {"train_loss": -6.624337196350098, "global_step": 117300, "epoch": 2792} {"train_loss": -6.579713344573975, "global_step": 117301, "epoch": 2792} {"train_loss": -6.43277645111084, "global_step": 117302, "epoch": 2792} {"train_loss": -6.563746929168701, "global_step": 117303, "epoch": 2792} {"train_loss": -6.571347236633301, "global_step": 117304, "epoch": 2792} {"train_loss": -6.553113301595052, "global_step": 117305, "epoch": 2792, "val_loss": 65468.3125} {"train_loss": -6.636046886444092, "global_step": 117306, "epoch": 2793} {"train_loss": -6.561176300048828, "global_step": 117307, "epoch": 2793} {"train_loss": -6.576794624328613, "global_step": 117308, "epoch": 2793} {"train_loss": -6.545846939086914, "global_step": 117309, "epoch": 2793} {"train_loss": -6.711099624633789, "global_step": 117310, "epoch": 2793} {"train_loss": -6.524896621704102, "global_step": 117311, "epoch": 2793} {"train_loss": -6.65480375289917, "global_step": 117312, "epoch": 2793} {"train_loss": -6.635048866271973, "global_step": 117313, "epoch": 2793} {"train_loss": -6.568140506744385, "global_step": 117314, "epoch": 2793} {"train_loss": -6.637731552124023, "global_step": 117315, "epoch": 2793} {"train_loss": -6.609747886657715, "global_step": 117316, "epoch": 2793} {"train_loss": -6.545867919921875, "global_step": 117317, "epoch": 2793} {"train_loss": -6.692607879638672, "global_step": 117318, "epoch": 2793} {"train_loss": -6.629390239715576, "global_step": 117319, "epoch": 2793} {"train_loss": -6.693020820617676, "global_step": 117320, "epoch": 2793} {"train_loss": -6.517195224761963, "global_step": 117321, "epoch": 2793} {"train_loss": -6.468542098999023, "global_step": 117322, "epoch": 2793} {"train_loss": -6.6226115226745605, "global_step": 117323, "epoch": 2793} {"train_loss": -6.693750381469727, "global_step": 117324, "epoch": 2793} {"train_loss": -6.528366565704346, "global_step": 117325, "epoch": 2793} {"train_loss": -6.525082111358643, "global_step": 117326, "epoch": 2793} {"train_loss": -6.6480488777160645, "global_step": 117327, "epoch": 2793} {"train_loss": -6.552036285400391, "global_step": 117328, "epoch": 2793} {"train_loss": -6.493218421936035, "global_step": 117329, "epoch": 2793} {"train_loss": -6.5527424812316895, "global_step": 117330, "epoch": 2793} {"train_loss": -6.563464164733887, "global_step": 117331, "epoch": 2793} {"train_loss": -6.532942295074463, "global_step": 117332, "epoch": 2793} {"train_loss": -6.652128219604492, "global_step": 117333, "epoch": 2793} {"train_loss": -6.500059127807617, "global_step": 117334, "epoch": 2793} {"train_loss": -6.445939540863037, "global_step": 117335, "epoch": 2793} {"train_loss": -6.489680290222168, "global_step": 117336, "epoch": 2793} {"train_loss": -6.690625190734863, "global_step": 117337, "epoch": 2793} {"train_loss": -6.4849748611450195, "global_step": 117338, "epoch": 2793} {"train_loss": -6.429438591003418, "global_step": 117339, "epoch": 2793} {"train_loss": -6.538054466247559, "global_step": 117340, "epoch": 2793} {"train_loss": -6.495776653289795, "global_step": 117341, "epoch": 2793} {"train_loss": -6.4617509841918945, "global_step": 117342, "epoch": 2793} {"train_loss": -6.495463848114014, "global_step": 117343, "epoch": 2793} {"train_loss": -6.500831604003906, "global_step": 117344, "epoch": 2793} {"train_loss": -6.492316246032715, "global_step": 117345, "epoch": 2793} {"train_loss": -6.620682239532471, "global_step": 117346, "epoch": 2793} {"train_loss": -6.564661809376308, "global_step": 117347, "epoch": 2793, "val_loss": 65592.140625} {"train_loss": -6.535910606384277, "global_step": 117348, "epoch": 2794} {"train_loss": -6.482964515686035, "global_step": 117349, "epoch": 2794} {"train_loss": -6.587435245513916, "global_step": 117350, "epoch": 2794} {"train_loss": -6.515440464019775, "global_step": 117351, "epoch": 2794} {"train_loss": -6.617347717285156, "global_step": 117352, "epoch": 2794} {"train_loss": -6.517961502075195, "global_step": 117353, "epoch": 2794} {"train_loss": -6.612685203552246, "global_step": 117354, "epoch": 2794} {"train_loss": -6.614058971405029, "global_step": 117355, "epoch": 2794} {"train_loss": -6.5205183029174805, "global_step": 117356, "epoch": 2794} {"train_loss": -6.43354606628418, "global_step": 117357, "epoch": 2794} {"train_loss": -6.6508002281188965, "global_step": 117358, "epoch": 2794} {"train_loss": -6.630746841430664, "global_step": 117359, "epoch": 2794} {"train_loss": -6.584118843078613, "global_step": 117360, "epoch": 2794} {"train_loss": -6.552590370178223, "global_step": 117361, "epoch": 2794} {"train_loss": -6.661982536315918, "global_step": 117362, "epoch": 2794} {"train_loss": -6.607494354248047, "global_step": 117363, "epoch": 2794} {"train_loss": -6.633485794067383, "global_step": 117364, "epoch": 2794} {"train_loss": -6.585195541381836, "global_step": 117365, "epoch": 2794} {"train_loss": -6.471220970153809, "global_step": 117366, "epoch": 2794} {"train_loss": -6.692368030548096, "global_step": 117367, "epoch": 2794} {"train_loss": -6.523629188537598, "global_step": 117368, "epoch": 2794} {"train_loss": -6.6096343994140625, "global_step": 117369, "epoch": 2794} {"train_loss": -6.4116668701171875, "global_step": 117370, "epoch": 2794} {"train_loss": -6.681643486022949, "global_step": 117371, "epoch": 2794} {"train_loss": -6.578088760375977, "global_step": 117372, "epoch": 2794} {"train_loss": -6.508065223693848, "global_step": 117373, "epoch": 2794} {"train_loss": -6.516429901123047, "global_step": 117374, "epoch": 2794} {"train_loss": -6.635538101196289, "global_step": 117375, "epoch": 2794} {"train_loss": -6.507843017578125, "global_step": 117376, "epoch": 2794} {"train_loss": -6.654763221740723, "global_step": 117377, "epoch": 2794} {"train_loss": -6.615299701690674, "global_step": 117378, "epoch": 2794} {"train_loss": -6.471972942352295, "global_step": 117379, "epoch": 2794} {"train_loss": -6.523358345031738, "global_step": 117380, "epoch": 2794} {"train_loss": -6.578737258911133, "global_step": 117381, "epoch": 2794} {"train_loss": -6.57895565032959, "global_step": 117382, "epoch": 2794} {"train_loss": -6.575333595275879, "global_step": 117383, "epoch": 2794} {"train_loss": -6.540517807006836, "global_step": 117384, "epoch": 2794} {"train_loss": -6.603167533874512, "global_step": 117385, "epoch": 2794} {"train_loss": -6.5571746826171875, "global_step": 117386, "epoch": 2794} {"train_loss": -6.602984428405762, "global_step": 117387, "epoch": 2794} {"train_loss": -6.634739875793457, "global_step": 117388, "epoch": 2794} {"train_loss": -6.57059079124814, "global_step": 117389, "epoch": 2794, "val_loss": 65399.99609375} {"train_loss": -6.505950927734375, "global_step": 117390, "epoch": 2795} {"train_loss": -6.521090507507324, "global_step": 117391, "epoch": 2795} {"train_loss": -6.585874080657959, "global_step": 117392, "epoch": 2795} {"train_loss": -6.43202018737793, "global_step": 117393, "epoch": 2795} {"train_loss": -6.538854598999023, "global_step": 117394, "epoch": 2795} {"train_loss": -6.558567047119141, "global_step": 117395, "epoch": 2795} {"train_loss": -6.612791538238525, "global_step": 117396, "epoch": 2795} {"train_loss": -6.4521403312683105, "global_step": 117397, "epoch": 2795} {"train_loss": -6.584772109985352, "global_step": 117398, "epoch": 2795} {"train_loss": -6.496542453765869, "global_step": 117399, "epoch": 2795} {"train_loss": -6.4940996170043945, "global_step": 117400, "epoch": 2795} {"train_loss": -6.456167697906494, "global_step": 117401, "epoch": 2795} {"train_loss": -6.582620143890381, "global_step": 117402, "epoch": 2795} {"train_loss": -6.451605796813965, "global_step": 117403, "epoch": 2795} {"train_loss": -6.5305562019348145, "global_step": 117404, "epoch": 2795} {"train_loss": -6.529123306274414, "global_step": 117405, "epoch": 2795} {"train_loss": -6.512017250061035, "global_step": 117406, "epoch": 2795} {"train_loss": -6.600735187530518, "global_step": 117407, "epoch": 2795} {"train_loss": -6.579576015472412, "global_step": 117408, "epoch": 2795} {"train_loss": -6.630199909210205, "global_step": 117409, "epoch": 2795} {"train_loss": -6.559427261352539, "global_step": 117410, "epoch": 2795} {"train_loss": -6.596631050109863, "global_step": 117411, "epoch": 2795} {"train_loss": -6.510556697845459, "global_step": 117412, "epoch": 2795} {"train_loss": -6.589025497436523, "global_step": 117413, "epoch": 2795} {"train_loss": -6.483144760131836, "global_step": 117414, "epoch": 2795} {"train_loss": -6.440814018249512, "global_step": 117415, "epoch": 2795} {"train_loss": -6.455196857452393, "global_step": 117416, "epoch": 2795} {"train_loss": -6.490519046783447, "global_step": 117417, "epoch": 2795} {"train_loss": -6.5936713218688965, "global_step": 117418, "epoch": 2795} {"train_loss": -6.532798767089844, "global_step": 117419, "epoch": 2795} {"train_loss": -6.604458808898926, "global_step": 117420, "epoch": 2795} {"train_loss": -6.54932975769043, "global_step": 117421, "epoch": 2795} {"train_loss": -6.619693756103516, "global_step": 117422, "epoch": 2795} {"train_loss": -6.634916305541992, "global_step": 117423, "epoch": 2795} {"train_loss": -6.532989501953125, "global_step": 117424, "epoch": 2795} {"train_loss": -6.547868251800537, "global_step": 117425, "epoch": 2795} {"train_loss": -6.565060615539551, "global_step": 117426, "epoch": 2795} {"train_loss": -6.658207893371582, "global_step": 117427, "epoch": 2795} {"train_loss": -6.519829750061035, "global_step": 117428, "epoch": 2795} {"train_loss": -6.558945178985596, "global_step": 117429, "epoch": 2795} {"train_loss": -6.530862808227539, "global_step": 117430, "epoch": 2795} {"train_loss": -6.543930734906878, "global_step": 117431, "epoch": 2795, "val_loss": 65638.765625} {"train_loss": -6.569599151611328, "global_step": 117432, "epoch": 2796} {"train_loss": -6.4792633056640625, "global_step": 117433, "epoch": 2796} {"train_loss": -6.669139862060547, "global_step": 117434, "epoch": 2796} {"train_loss": -6.3578901290893555, "global_step": 117435, "epoch": 2796} {"train_loss": -6.587271690368652, "global_step": 117436, "epoch": 2796} {"train_loss": -6.556258678436279, "global_step": 117437, "epoch": 2796} {"train_loss": -6.481500148773193, "global_step": 117438, "epoch": 2796} {"train_loss": -6.566387176513672, "global_step": 117439, "epoch": 2796} {"train_loss": -6.582720756530762, "global_step": 117440, "epoch": 2796} {"train_loss": -6.512967109680176, "global_step": 117441, "epoch": 2796} {"train_loss": -6.7458038330078125, "global_step": 117442, "epoch": 2796} {"train_loss": -6.57981014251709, "global_step": 117443, "epoch": 2796} {"train_loss": -6.5871901512146, "global_step": 117444, "epoch": 2796} {"train_loss": -6.536367893218994, "global_step": 117445, "epoch": 2796} {"train_loss": -6.633502960205078, "global_step": 117446, "epoch": 2796} {"train_loss": -6.608953475952148, "global_step": 117447, "epoch": 2796} {"train_loss": -6.57838773727417, "global_step": 117448, "epoch": 2796} {"train_loss": -6.579207420349121, "global_step": 117449, "epoch": 2796} {"train_loss": -6.515785217285156, "global_step": 117450, "epoch": 2796} {"train_loss": -6.557687282562256, "global_step": 117451, "epoch": 2796} {"train_loss": -6.4564619064331055, "global_step": 117452, "epoch": 2796} {"train_loss": -6.566106796264648, "global_step": 117453, "epoch": 2796} {"train_loss": -6.541860580444336, "global_step": 117454, "epoch": 2796} {"train_loss": -6.568914413452148, "global_step": 117455, "epoch": 2796} {"train_loss": -6.4766621589660645, "global_step": 117456, "epoch": 2796} {"train_loss": -6.615326404571533, "global_step": 117457, "epoch": 2796} {"train_loss": -6.504166603088379, "global_step": 117458, "epoch": 2796} {"train_loss": -6.4017333984375, "global_step": 117459, "epoch": 2796} {"train_loss": -6.4292473793029785, "global_step": 117460, "epoch": 2796} {"train_loss": -6.5982160568237305, "global_step": 117461, "epoch": 2796} {"train_loss": -6.568416595458984, "global_step": 117462, "epoch": 2796} {"train_loss": -6.494706153869629, "global_step": 117463, "epoch": 2796} {"train_loss": -6.529407978057861, "global_step": 117464, "epoch": 2796} {"train_loss": -6.438665390014648, "global_step": 117465, "epoch": 2796} {"train_loss": -6.538881778717041, "global_step": 117466, "epoch": 2796} {"train_loss": -6.641828536987305, "global_step": 117467, "epoch": 2796} {"train_loss": -6.492417812347412, "global_step": 117468, "epoch": 2796} {"train_loss": -6.466429710388184, "global_step": 117469, "epoch": 2796} {"train_loss": -6.528268814086914, "global_step": 117470, "epoch": 2796} {"train_loss": -6.597278594970703, "global_step": 117471, "epoch": 2796} {"train_loss": -6.577569961547852, "global_step": 117472, "epoch": 2796} {"train_loss": -6.545133522578648, "global_step": 117473, "epoch": 2796, "val_loss": 65472.19921875} {"train_loss": -6.539980888366699, "global_step": 117474, "epoch": 2797} {"train_loss": -6.500115394592285, "global_step": 117475, "epoch": 2797} {"train_loss": -6.529486656188965, "global_step": 117476, "epoch": 2797} {"train_loss": -6.71239709854126, "global_step": 117477, "epoch": 2797} {"train_loss": -6.574172496795654, "global_step": 117478, "epoch": 2797} {"train_loss": -6.566651821136475, "global_step": 117479, "epoch": 2797} {"train_loss": -6.606121063232422, "global_step": 117480, "epoch": 2797} {"train_loss": -6.577713966369629, "global_step": 117481, "epoch": 2797} {"train_loss": -6.660407543182373, "global_step": 117482, "epoch": 2797} {"train_loss": -6.526700019836426, "global_step": 117483, "epoch": 2797} {"train_loss": -6.5186333656311035, "global_step": 117484, "epoch": 2797} {"train_loss": -6.6639790534973145, "global_step": 117485, "epoch": 2797} {"train_loss": -6.554851055145264, "global_step": 117486, "epoch": 2797} {"train_loss": -6.534341812133789, "global_step": 117487, "epoch": 2797} {"train_loss": -6.531606197357178, "global_step": 117488, "epoch": 2797} {"train_loss": -6.491205215454102, "global_step": 117489, "epoch": 2797} {"train_loss": -6.582201957702637, "global_step": 117490, "epoch": 2797} {"train_loss": -6.581648349761963, "global_step": 117491, "epoch": 2797} {"train_loss": -6.6271491050720215, "global_step": 117492, "epoch": 2797} {"train_loss": -6.558428764343262, "global_step": 117493, "epoch": 2797} {"train_loss": -6.528772354125977, "global_step": 117494, "epoch": 2797} {"train_loss": -6.584615707397461, "global_step": 117495, "epoch": 2797} {"train_loss": -6.570239067077637, "global_step": 117496, "epoch": 2797} {"train_loss": -6.605826377868652, "global_step": 117497, "epoch": 2797} {"train_loss": -6.598775863647461, "global_step": 117498, "epoch": 2797} {"train_loss": -6.554420471191406, "global_step": 117499, "epoch": 2797} {"train_loss": -6.5184526443481445, "global_step": 117500, "epoch": 2797} {"train_loss": -6.498055458068848, "global_step": 117501, "epoch": 2797} {"train_loss": -6.434918403625488, "global_step": 117502, "epoch": 2797} {"train_loss": -6.535360336303711, "global_step": 117503, "epoch": 2797} {"train_loss": -6.655729293823242, "global_step": 117504, "epoch": 2797} {"train_loss": -6.491062164306641, "global_step": 117505, "epoch": 2797} {"train_loss": -6.485745429992676, "global_step": 117506, "epoch": 2797} {"train_loss": -6.507081985473633, "global_step": 117507, "epoch": 2797} {"train_loss": -6.588693618774414, "global_step": 117508, "epoch": 2797} {"train_loss": -6.517423152923584, "global_step": 117509, "epoch": 2797} {"train_loss": -6.531333923339844, "global_step": 117510, "epoch": 2797} {"train_loss": -6.592811584472656, "global_step": 117511, "epoch": 2797} {"train_loss": -6.5744428634643555, "global_step": 117512, "epoch": 2797} {"train_loss": -6.435865879058838, "global_step": 117513, "epoch": 2797} {"train_loss": -6.492351531982422, "global_step": 117514, "epoch": 2797} {"train_loss": -6.554055089042301, "global_step": 117515, "epoch": 2797, "val_loss": 65439.7890625} {"train_loss": -6.528617858886719, "global_step": 117516, "epoch": 2798} {"train_loss": -6.628348350524902, "global_step": 117517, "epoch": 2798} {"train_loss": -6.533628940582275, "global_step": 117518, "epoch": 2798} {"train_loss": -6.553062438964844, "global_step": 117519, "epoch": 2798} {"train_loss": -6.446084976196289, "global_step": 117520, "epoch": 2798} {"train_loss": -6.712382793426514, "global_step": 117521, "epoch": 2798} {"train_loss": -6.543840408325195, "global_step": 117522, "epoch": 2798} {"train_loss": -6.566277980804443, "global_step": 117523, "epoch": 2798} {"train_loss": -6.485409259796143, "global_step": 117524, "epoch": 2798} {"train_loss": -6.494542121887207, "global_step": 117525, "epoch": 2798} {"train_loss": -6.5295820236206055, "global_step": 117526, "epoch": 2798} {"train_loss": -6.571419715881348, "global_step": 117527, "epoch": 2798} {"train_loss": -6.541922092437744, "global_step": 117528, "epoch": 2798} {"train_loss": -6.609772682189941, "global_step": 117529, "epoch": 2798} {"train_loss": -6.48182487487793, "global_step": 117530, "epoch": 2798} {"train_loss": -6.558526992797852, "global_step": 117531, "epoch": 2798} {"train_loss": -6.593786716461182, "global_step": 117532, "epoch": 2798} {"train_loss": -6.557178020477295, "global_step": 117533, "epoch": 2798} {"train_loss": -6.60116720199585, "global_step": 117534, "epoch": 2798} {"train_loss": -6.524282455444336, "global_step": 117535, "epoch": 2798} {"train_loss": -6.565285682678223, "global_step": 117536, "epoch": 2798} {"train_loss": -6.585887432098389, "global_step": 117537, "epoch": 2798} {"train_loss": -6.638450622558594, "global_step": 117538, "epoch": 2798} {"train_loss": -6.5616302490234375, "global_step": 117539, "epoch": 2798} {"train_loss": -6.565368175506592, "global_step": 117540, "epoch": 2798} {"train_loss": -6.593588829040527, "global_step": 117541, "epoch": 2798} {"train_loss": -6.508727073669434, "global_step": 117542, "epoch": 2798} {"train_loss": -6.602191925048828, "global_step": 117543, "epoch": 2798} {"train_loss": -6.593557834625244, "global_step": 117544, "epoch": 2798} {"train_loss": -6.52677059173584, "global_step": 117545, "epoch": 2798} {"train_loss": -6.6657819747924805, "global_step": 117546, "epoch": 2798} {"train_loss": -6.541074275970459, "global_step": 117547, "epoch": 2798} {"train_loss": -6.4949846267700195, "global_step": 117548, "epoch": 2798} {"train_loss": -6.497016906738281, "global_step": 117549, "epoch": 2798} {"train_loss": -6.479719161987305, "global_step": 117550, "epoch": 2798} {"train_loss": -6.458066940307617, "global_step": 117551, "epoch": 2798} {"train_loss": -6.578049182891846, "global_step": 117552, "epoch": 2798} {"train_loss": -6.460391998291016, "global_step": 117553, "epoch": 2798} {"train_loss": -6.47428035736084, "global_step": 117554, "epoch": 2798} {"train_loss": -6.564492225646973, "global_step": 117555, "epoch": 2798} {"train_loss": -6.539581298828125, "global_step": 117556, "epoch": 2798} {"train_loss": -6.552628483091082, "global_step": 117557, "epoch": 2798, "val_loss": 65573.6015625} {"train_loss": -6.644524574279785, "global_step": 117558, "epoch": 2799} {"train_loss": -6.416216850280762, "global_step": 117559, "epoch": 2799} {"train_loss": -6.5078511238098145, "global_step": 117560, "epoch": 2799} {"train_loss": -6.539154529571533, "global_step": 117561, "epoch": 2799} {"train_loss": -6.540928840637207, "global_step": 117562, "epoch": 2799} {"train_loss": -6.615509033203125, "global_step": 117563, "epoch": 2799} {"train_loss": -6.515153408050537, "global_step": 117564, "epoch": 2799} {"train_loss": -6.561145782470703, "global_step": 117565, "epoch": 2799} {"train_loss": -6.625434398651123, "global_step": 117566, "epoch": 2799} {"train_loss": -6.54646635055542, "global_step": 117567, "epoch": 2799} {"train_loss": -6.564260482788086, "global_step": 117568, "epoch": 2799} {"train_loss": -6.593315124511719, "global_step": 117569, "epoch": 2799} {"train_loss": -6.597419738769531, "global_step": 117570, "epoch": 2799} {"train_loss": -6.551977157592773, "global_step": 117571, "epoch": 2799} {"train_loss": -6.569393157958984, "global_step": 117572, "epoch": 2799} {"train_loss": -6.583049297332764, "global_step": 117573, "epoch": 2799} {"train_loss": -6.48006534576416, "global_step": 117574, "epoch": 2799} {"train_loss": -6.542164325714111, "global_step": 117575, "epoch": 2799} {"train_loss": -6.46926212310791, "global_step": 117576, "epoch": 2799} {"train_loss": -6.641429901123047, "global_step": 117577, "epoch": 2799} {"train_loss": -6.536564350128174, "global_step": 117578, "epoch": 2799} {"train_loss": -6.577244281768799, "global_step": 117579, "epoch": 2799} {"train_loss": -6.508845806121826, "global_step": 117580, "epoch": 2799} {"train_loss": -6.4684224128723145, "global_step": 117581, "epoch": 2799} {"train_loss": -6.58982515335083, "global_step": 117582, "epoch": 2799} {"train_loss": -6.6333160400390625, "global_step": 117583, "epoch": 2799} {"train_loss": -6.651700496673584, "global_step": 117584, "epoch": 2799} {"train_loss": -6.438776016235352, "global_step": 117585, "epoch": 2799} {"train_loss": -6.515506744384766, "global_step": 117586, "epoch": 2799} {"train_loss": -6.604484558105469, "global_step": 117587, "epoch": 2799} {"train_loss": -6.587698936462402, "global_step": 117588, "epoch": 2799} {"train_loss": -6.57954216003418, "global_step": 117589, "epoch": 2799} {"train_loss": -6.553988933563232, "global_step": 117590, "epoch": 2799} {"train_loss": -6.596078395843506, "global_step": 117591, "epoch": 2799} {"train_loss": -6.578979969024658, "global_step": 117592, "epoch": 2799} {"train_loss": -6.511434078216553, "global_step": 117593, "epoch": 2799} {"train_loss": -6.526978492736816, "global_step": 117594, "epoch": 2799} {"train_loss": -6.593062400817871, "global_step": 117595, "epoch": 2799} {"train_loss": -6.51855993270874, "global_step": 117596, "epoch": 2799} {"train_loss": -6.575667381286621, "global_step": 117597, "epoch": 2799} {"train_loss": -6.575479030609131, "global_step": 117598, "epoch": 2799} {"train_loss": -6.556097859428043, "global_step": 117599, "epoch": 2799, "val_loss": 65361.72265625} {"train_loss": -6.597532272338867, "global_step": 117600, "epoch": 2800} {"train_loss": -6.54976224899292, "global_step": 117601, "epoch": 2800} {"train_loss": -6.585366249084473, "global_step": 117602, "epoch": 2800} {"train_loss": -6.631205081939697, "global_step": 117603, "epoch": 2800} {"train_loss": -6.541432857513428, "global_step": 117604, "epoch": 2800} {"train_loss": -6.686036586761475, "global_step": 117605, "epoch": 2800} {"train_loss": -6.527291297912598, "global_step": 117606, "epoch": 2800} {"train_loss": -6.657033443450928, "global_step": 117607, "epoch": 2800} {"train_loss": -6.6776275634765625, "global_step": 117608, "epoch": 2800} {"train_loss": -6.612947463989258, "global_step": 117609, "epoch": 2800} {"train_loss": -6.561287879943848, "global_step": 117610, "epoch": 2800} {"train_loss": -6.562197685241699, "global_step": 117611, "epoch": 2800} {"train_loss": -6.6520795822143555, "global_step": 117612, "epoch": 2800} {"train_loss": -6.576189994812012, "global_step": 117613, "epoch": 2800} {"train_loss": -6.5782060623168945, "global_step": 117614, "epoch": 2800} {"train_loss": -6.598058700561523, "global_step": 117615, "epoch": 2800} {"train_loss": -6.602476119995117, "global_step": 117616, "epoch": 2800} {"train_loss": -6.547104835510254, "global_step": 117617, "epoch": 2800} {"train_loss": -6.616728782653809, "global_step": 117618, "epoch": 2800} {"train_loss": -6.471789360046387, "global_step": 117619, "epoch": 2800} {"train_loss": -6.617836952209473, "global_step": 117620, "epoch": 2800} {"train_loss": -6.515596866607666, "global_step": 117621, "epoch": 2800} {"train_loss": -6.530606269836426, "global_step": 117622, "epoch": 2800} {"train_loss": -6.55657958984375, "global_step": 117623, "epoch": 2800} {"train_loss": -6.684993743896484, "global_step": 117624, "epoch": 2800} {"train_loss": -6.455488204956055, "global_step": 117625, "epoch": 2800} {"train_loss": -6.622846603393555, "global_step": 117626, "epoch": 2800} {"train_loss": -6.57045841217041, "global_step": 117627, "epoch": 2800} {"train_loss": -6.533368110656738, "global_step": 117628, "epoch": 2800} {"train_loss": -6.423255920410156, "global_step": 117629, "epoch": 2800} {"train_loss": -6.4837236404418945, "global_step": 117630, "epoch": 2800} {"train_loss": -6.535571098327637, "global_step": 117631, "epoch": 2800} {"train_loss": -6.38185977935791, "global_step": 117632, "epoch": 2800} {"train_loss": -6.526420593261719, "global_step": 117633, "epoch": 2800} {"train_loss": -6.389399528503418, "global_step": 117634, "epoch": 2800} {"train_loss": -6.456339359283447, "global_step": 117635, "epoch": 2800} {"train_loss": -6.3785858154296875, "global_step": 117636, "epoch": 2800} {"train_loss": -6.5003814697265625, "global_step": 117637, "epoch": 2800} {"train_loss": -6.490189552307129, "global_step": 117638, "epoch": 2800} {"train_loss": -6.370575904846191, "global_step": 117639, "epoch": 2800} {"train_loss": -6.405854225158691, "global_step": 117640, "epoch": 2800} {"train_loss": -6.542605774743216, "global_step": 117641, "epoch": 2800, "train/sim_max_reward_0": 0.752493489606812, "train/sim_max_reward_1": 0.2881003335448727, "train/sim_max_reward_2": 0.49106584366669886, "train/sim_max_reward_3": 0.9528092711810364, "train/sim_max_reward_4": 0.9870723620536771, "train/sim_max_reward_5": 0.9734806353289625, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.16487174112403088, "test/sim_max_reward_4300002": 0.9143629453097288, "test/sim_max_reward_4300003": 0.9533500556930123, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.7843687084191385, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.5436801859832547, "test/sim_max_reward_4300008": 0.0, "test/sim_max_reward_4300009": 0.9485160883351496, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9773897615918639, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.9916166193409047, "test/sim_max_reward_4300014": 0.9275667597820171, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.9619151668766519, "test/sim_max_reward_4300017": 0.7876896331854081, "test/sim_max_reward_4300018": 0.4073268828811688, "test/sim_max_reward_4300019": 0.18518627266817028, "test/sim_max_reward_4300020": 0.00580425969749447, "test/sim_max_reward_4300021": 0.90979685439692, "test/sim_max_reward_4300022": 0.9540027695946558, "test/sim_max_reward_4300023": 0.33306760160411686, "test/sim_max_reward_4300024": 0.6894465530125962, "test/sim_max_reward_4300025": 0.7922538871854623, "test/sim_max_reward_4300026": 0.1558118331099245, "test/sim_max_reward_4300027": 0.8503664956818179, "test/sim_max_reward_4300028": 0.9163312051441569, "test/sim_max_reward_4300029": 0.8164278140435993, "test/sim_max_reward_4300030": 0.9638024037387883, "test/sim_max_reward_4300031": 0.22053322174964662, "test/sim_max_reward_4300032": 0.7074140132705133, "test/sim_max_reward_4300033": 0.6222284993872252, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.4605048089458702, "test/sim_max_reward_4300036": 0.2004172322411768, "test/sim_max_reward_4300037": 0.8882183542564865, "test/sim_max_reward_4300038": 0.7737040400438802, "test/sim_max_reward_4300039": 0.7537779437875808, "test/sim_max_reward_4300040": 0.8693356055901765, "test/sim_max_reward_4300041": 0.8939331846446714, "test/sim_max_reward_4300042": 1.0, "test/sim_max_reward_4300043": 0.1892038757791064, "test/sim_max_reward_4300044": 0.26159771557285666, "test/sim_max_reward_4300045": 0.21557315853796416, "test/sim_max_reward_4300046": 0.9254861571662992, "test/sim_max_reward_4300047": 0.9765932235843842, "test/sim_max_reward_4300048": 0.01978354435877722, "test/sim_max_reward_4300049": 0.2643917606600433, "train/mean_score": 0.7408369892303432, "test/mean_score": 0.5838696588557195, "val_loss": 65747.8984375} {"train_loss": -6.416813850402832, "global_step": 117642, "epoch": 2801} {"train_loss": -6.58552360534668, "global_step": 117643, "epoch": 2801} {"train_loss": -6.452203750610352, "global_step": 117644, "epoch": 2801} {"train_loss": -6.470846176147461, "global_step": 117645, "epoch": 2801} {"train_loss": -6.458465576171875, "global_step": 117646, "epoch": 2801} {"train_loss": -6.441363334655762, "global_step": 117647, "epoch": 2801} {"train_loss": -6.4199676513671875, "global_step": 117648, "epoch": 2801} {"train_loss": -6.528730392456055, "global_step": 117649, "epoch": 2801} {"train_loss": -6.585927963256836, "global_step": 117650, "epoch": 2801} {"train_loss": -6.493546009063721, "global_step": 117651, "epoch": 2801} {"train_loss": -6.526473045349121, "global_step": 117652, "epoch": 2801} {"train_loss": -6.439182758331299, "global_step": 117653, "epoch": 2801} {"train_loss": -6.435765743255615, "global_step": 117654, "epoch": 2801} {"train_loss": -6.504266262054443, "global_step": 117655, "epoch": 2801} {"train_loss": -6.41528844833374, "global_step": 117656, "epoch": 2801} {"train_loss": -6.524959564208984, "global_step": 117657, "epoch": 2801} {"train_loss": -6.538057804107666, "global_step": 117658, "epoch": 2801} {"train_loss": -6.542423725128174, "global_step": 117659, "epoch": 2801} {"train_loss": -6.4713544845581055, "global_step": 117660, "epoch": 2801} {"train_loss": -6.444472789764404, "global_step": 117661, "epoch": 2801} {"train_loss": -6.54745626449585, "global_step": 117662, "epoch": 2801} {"train_loss": -6.540010452270508, "global_step": 117663, "epoch": 2801} {"train_loss": -6.606139659881592, "global_step": 117664, "epoch": 2801} {"train_loss": -6.512238502502441, "global_step": 117665, "epoch": 2801} {"train_loss": -6.586397647857666, "global_step": 117666, "epoch": 2801} {"train_loss": -6.48639440536499, "global_step": 117667, "epoch": 2801} {"train_loss": -6.6104888916015625, "global_step": 117668, "epoch": 2801} {"train_loss": -6.6428985595703125, "global_step": 117669, "epoch": 2801} {"train_loss": -6.497791290283203, "global_step": 117670, "epoch": 2801} {"train_loss": -6.478026390075684, "global_step": 117671, "epoch": 2801} {"train_loss": -6.547687530517578, "global_step": 117672, "epoch": 2801} {"train_loss": -6.529449462890625, "global_step": 117673, "epoch": 2801} {"train_loss": -6.5093536376953125, "global_step": 117674, "epoch": 2801} {"train_loss": -6.553086280822754, "global_step": 117675, "epoch": 2801} {"train_loss": -6.536770820617676, "global_step": 117676, "epoch": 2801} {"train_loss": -6.551456451416016, "global_step": 117677, "epoch": 2801} {"train_loss": -6.684394836425781, "global_step": 117678, "epoch": 2801} {"train_loss": -6.639070510864258, "global_step": 117679, "epoch": 2801} {"train_loss": -6.463198661804199, "global_step": 117680, "epoch": 2801} {"train_loss": -6.546734809875488, "global_step": 117681, "epoch": 2801} {"train_loss": -6.6637444496154785, "global_step": 117682, "epoch": 2801} {"train_loss": -6.523438851038615, "global_step": 117683, "epoch": 2801, "val_loss": 65427.203125} {"train_loss": -6.546899318695068, "global_step": 117684, "epoch": 2802} {"train_loss": -6.471695899963379, "global_step": 117685, "epoch": 2802} {"train_loss": -6.508579730987549, "global_step": 117686, "epoch": 2802} {"train_loss": -6.41325569152832, "global_step": 117687, "epoch": 2802} {"train_loss": -6.356346130371094, "global_step": 117688, "epoch": 2802} {"train_loss": -6.572531223297119, "global_step": 117689, "epoch": 2802} {"train_loss": -6.437813758850098, "global_step": 117690, "epoch": 2802} {"train_loss": -6.367125511169434, "global_step": 117691, "epoch": 2802} {"train_loss": -6.6083879470825195, "global_step": 117692, "epoch": 2802} {"train_loss": -6.336772918701172, "global_step": 117693, "epoch": 2802} {"train_loss": -6.56574821472168, "global_step": 117694, "epoch": 2802} {"train_loss": -6.38295316696167, "global_step": 117695, "epoch": 2802} {"train_loss": -6.482648849487305, "global_step": 117696, "epoch": 2802} {"train_loss": -6.5139570236206055, "global_step": 117697, "epoch": 2802} {"train_loss": -6.491495132446289, "global_step": 117698, "epoch": 2802} {"train_loss": -6.57325553894043, "global_step": 117699, "epoch": 2802} {"train_loss": -6.526717185974121, "global_step": 117700, "epoch": 2802} {"train_loss": -6.498613357543945, "global_step": 117701, "epoch": 2802} {"train_loss": -6.455045223236084, "global_step": 117702, "epoch": 2802} {"train_loss": -6.655710220336914, "global_step": 117703, "epoch": 2802} {"train_loss": -6.508762359619141, "global_step": 117704, "epoch": 2802} {"train_loss": -6.558165550231934, "global_step": 117705, "epoch": 2802} {"train_loss": -6.393189907073975, "global_step": 117706, "epoch": 2802} {"train_loss": -6.61531925201416, "global_step": 117707, "epoch": 2802} {"train_loss": -6.464958667755127, "global_step": 117708, "epoch": 2802} {"train_loss": -6.412772178649902, "global_step": 117709, "epoch": 2802} {"train_loss": -6.588212966918945, "global_step": 117710, "epoch": 2802} {"train_loss": -6.431562423706055, "global_step": 117711, "epoch": 2802} {"train_loss": -6.506378650665283, "global_step": 117712, "epoch": 2802} {"train_loss": -6.571688652038574, "global_step": 117713, "epoch": 2802} {"train_loss": -6.525798797607422, "global_step": 117714, "epoch": 2802} {"train_loss": -6.52083683013916, "global_step": 117715, "epoch": 2802} {"train_loss": -6.494302749633789, "global_step": 117716, "epoch": 2802} {"train_loss": -6.591874599456787, "global_step": 117717, "epoch": 2802} {"train_loss": -6.591517448425293, "global_step": 117718, "epoch": 2802} {"train_loss": -6.490152359008789, "global_step": 117719, "epoch": 2802} {"train_loss": -6.597155570983887, "global_step": 117720, "epoch": 2802} {"train_loss": -6.552704811096191, "global_step": 117721, "epoch": 2802} {"train_loss": -6.383705139160156, "global_step": 117722, "epoch": 2802} {"train_loss": -6.453624725341797, "global_step": 117723, "epoch": 2802} {"train_loss": -6.482904434204102, "global_step": 117724, "epoch": 2802} {"train_loss": -6.500422738847279, "global_step": 117725, "epoch": 2802, "val_loss": 65438.66015625} {"train_loss": -6.518077850341797, "global_step": 117726, "epoch": 2803} {"train_loss": -6.47062873840332, "global_step": 117727, "epoch": 2803} {"train_loss": -6.634683609008789, "global_step": 117728, "epoch": 2803} {"train_loss": -6.568233013153076, "global_step": 117729, "epoch": 2803} {"train_loss": -6.462015151977539, "global_step": 117730, "epoch": 2803} {"train_loss": -6.538273811340332, "global_step": 117731, "epoch": 2803} {"train_loss": -6.557717800140381, "global_step": 117732, "epoch": 2803} {"train_loss": -6.549169540405273, "global_step": 117733, "epoch": 2803} {"train_loss": -6.541864395141602, "global_step": 117734, "epoch": 2803} {"train_loss": -6.487069606781006, "global_step": 117735, "epoch": 2803} {"train_loss": -6.549365997314453, "global_step": 117736, "epoch": 2803} {"train_loss": -6.552865982055664, "global_step": 117737, "epoch": 2803} {"train_loss": -6.507680892944336, "global_step": 117738, "epoch": 2803} {"train_loss": -6.622468948364258, "global_step": 117739, "epoch": 2803} {"train_loss": -6.472173690795898, "global_step": 117740, "epoch": 2803} {"train_loss": -6.629947662353516, "global_step": 117741, "epoch": 2803} {"train_loss": -6.65708589553833, "global_step": 117742, "epoch": 2803} {"train_loss": -6.5663909912109375, "global_step": 117743, "epoch": 2803} {"train_loss": -6.59529972076416, "global_step": 117744, "epoch": 2803} {"train_loss": -6.535834789276123, "global_step": 117745, "epoch": 2803} {"train_loss": -6.471485137939453, "global_step": 117746, "epoch": 2803} {"train_loss": -6.510679244995117, "global_step": 117747, "epoch": 2803} {"train_loss": -6.590864181518555, "global_step": 117748, "epoch": 2803} {"train_loss": -6.516707420349121, "global_step": 117749, "epoch": 2803} {"train_loss": -6.624120712280273, "global_step": 117750, "epoch": 2803} {"train_loss": -6.611056804656982, "global_step": 117751, "epoch": 2803} {"train_loss": -6.683752536773682, "global_step": 117752, "epoch": 2803} {"train_loss": -6.647542953491211, "global_step": 117753, "epoch": 2803} {"train_loss": -6.611185073852539, "global_step": 117754, "epoch": 2803} {"train_loss": -6.512729644775391, "global_step": 117755, "epoch": 2803} {"train_loss": -6.602068901062012, "global_step": 117756, "epoch": 2803} {"train_loss": -6.490381240844727, "global_step": 117757, "epoch": 2803} {"train_loss": -6.400338172912598, "global_step": 117758, "epoch": 2803} {"train_loss": -6.557989597320557, "global_step": 117759, "epoch": 2803} {"train_loss": -6.511164665222168, "global_step": 117760, "epoch": 2803} {"train_loss": -6.50285530090332, "global_step": 117761, "epoch": 2803} {"train_loss": -6.518105983734131, "global_step": 117762, "epoch": 2803} {"train_loss": -6.62225341796875, "global_step": 117763, "epoch": 2803} {"train_loss": -6.41923713684082, "global_step": 117764, "epoch": 2803} {"train_loss": -6.485514163970947, "global_step": 117765, "epoch": 2803} {"train_loss": -6.550198554992676, "global_step": 117766, "epoch": 2803} {"train_loss": -6.543481565657116, "global_step": 117767, "epoch": 2803, "val_loss": 65503.33984375} {"train_loss": -6.4508233070373535, "global_step": 117768, "epoch": 2804} {"train_loss": -6.338925361633301, "global_step": 117769, "epoch": 2804} {"train_loss": -6.480817794799805, "global_step": 117770, "epoch": 2804} {"train_loss": -6.562341690063477, "global_step": 117771, "epoch": 2804} {"train_loss": -6.494354248046875, "global_step": 117772, "epoch": 2804} {"train_loss": -6.568652629852295, "global_step": 117773, "epoch": 2804} {"train_loss": -6.4264936447143555, "global_step": 117774, "epoch": 2804} {"train_loss": -6.537593841552734, "global_step": 117775, "epoch": 2804} {"train_loss": -6.389883995056152, "global_step": 117776, "epoch": 2804} {"train_loss": -6.555158615112305, "global_step": 117777, "epoch": 2804} {"train_loss": -6.496120929718018, "global_step": 117778, "epoch": 2804} {"train_loss": -6.552290439605713, "global_step": 117779, "epoch": 2804} {"train_loss": -6.5806097984313965, "global_step": 117780, "epoch": 2804} {"train_loss": -6.534820556640625, "global_step": 117781, "epoch": 2804} {"train_loss": -6.496703624725342, "global_step": 117782, "epoch": 2804} {"train_loss": -6.6213178634643555, "global_step": 117783, "epoch": 2804} {"train_loss": -6.585132598876953, "global_step": 117784, "epoch": 2804} {"train_loss": -6.581260681152344, "global_step": 117785, "epoch": 2804} {"train_loss": -6.482138156890869, "global_step": 117786, "epoch": 2804} {"train_loss": -6.616447448730469, "global_step": 117787, "epoch": 2804} {"train_loss": -6.542250633239746, "global_step": 117788, "epoch": 2804} {"train_loss": -6.7536725997924805, "global_step": 117789, "epoch": 2804} {"train_loss": -6.463929176330566, "global_step": 117790, "epoch": 2804} {"train_loss": -6.566047668457031, "global_step": 117791, "epoch": 2804} {"train_loss": -6.589108943939209, "global_step": 117792, "epoch": 2804} {"train_loss": -6.536932945251465, "global_step": 117793, "epoch": 2804} {"train_loss": -6.517436504364014, "global_step": 117794, "epoch": 2804} {"train_loss": -6.571102142333984, "global_step": 117795, "epoch": 2804} {"train_loss": -6.3932600021362305, "global_step": 117796, "epoch": 2804} {"train_loss": -6.473565101623535, "global_step": 117797, "epoch": 2804} {"train_loss": -6.503812313079834, "global_step": 117798, "epoch": 2804} {"train_loss": -6.506198883056641, "global_step": 117799, "epoch": 2804} {"train_loss": -6.571695327758789, "global_step": 117800, "epoch": 2804} {"train_loss": -6.56584358215332, "global_step": 117801, "epoch": 2804} {"train_loss": -6.42867374420166, "global_step": 117802, "epoch": 2804} {"train_loss": -6.487540245056152, "global_step": 117803, "epoch": 2804} {"train_loss": -6.628798961639404, "global_step": 117804, "epoch": 2804} {"train_loss": -6.589010715484619, "global_step": 117805, "epoch": 2804} {"train_loss": -6.538586616516113, "global_step": 117806, "epoch": 2804} {"train_loss": -6.636470317840576, "global_step": 117807, "epoch": 2804} {"train_loss": -6.6903605461120605, "global_step": 117808, "epoch": 2804} {"train_loss": -6.535520712534587, "global_step": 117809, "epoch": 2804, "val_loss": 65480.33203125} {"train_loss": -6.619715213775635, "global_step": 117810, "epoch": 2805} {"train_loss": -6.561501979827881, "global_step": 117811, "epoch": 2805} {"train_loss": -6.542788505554199, "global_step": 117812, "epoch": 2805} {"train_loss": -6.596671104431152, "global_step": 117813, "epoch": 2805} {"train_loss": -6.580437660217285, "global_step": 117814, "epoch": 2805} {"train_loss": -6.572957992553711, "global_step": 117815, "epoch": 2805} {"train_loss": -6.441910743713379, "global_step": 117816, "epoch": 2805} {"train_loss": -6.572756767272949, "global_step": 117817, "epoch": 2805} {"train_loss": -6.623841285705566, "global_step": 117818, "epoch": 2805} {"train_loss": -6.5777788162231445, "global_step": 117819, "epoch": 2805} {"train_loss": -6.692885875701904, "global_step": 117820, "epoch": 2805} {"train_loss": -6.639086723327637, "global_step": 117821, "epoch": 2805} {"train_loss": -6.605295181274414, "global_step": 117822, "epoch": 2805} {"train_loss": -6.568719863891602, "global_step": 117823, "epoch": 2805} {"train_loss": -6.565129280090332, "global_step": 117824, "epoch": 2805} {"train_loss": -6.6350603103637695, "global_step": 117825, "epoch": 2805} {"train_loss": -6.641985893249512, "global_step": 117826, "epoch": 2805} {"train_loss": -6.576995372772217, "global_step": 117827, "epoch": 2805} {"train_loss": -6.666038990020752, "global_step": 117828, "epoch": 2805} {"train_loss": -6.669689655303955, "global_step": 117829, "epoch": 2805} {"train_loss": -6.559358596801758, "global_step": 117830, "epoch": 2805} {"train_loss": -6.535209655761719, "global_step": 117831, "epoch": 2805} {"train_loss": -6.315384387969971, "global_step": 117832, "epoch": 2805} {"train_loss": -6.50496244430542, "global_step": 117833, "epoch": 2805} {"train_loss": -6.541746139526367, "global_step": 117834, "epoch": 2805} {"train_loss": -6.547369956970215, "global_step": 117835, "epoch": 2805} {"train_loss": -6.5273637771606445, "global_step": 117836, "epoch": 2805} {"train_loss": -6.553591728210449, "global_step": 117837, "epoch": 2805} {"train_loss": -6.549504280090332, "global_step": 117838, "epoch": 2805} {"train_loss": -6.520152568817139, "global_step": 117839, "epoch": 2805} {"train_loss": -6.492981910705566, "global_step": 117840, "epoch": 2805} {"train_loss": -6.525968551635742, "global_step": 117841, "epoch": 2805} {"train_loss": -6.456756591796875, "global_step": 117842, "epoch": 2805} {"train_loss": -6.485960006713867, "global_step": 117843, "epoch": 2805} {"train_loss": -6.4761576652526855, "global_step": 117844, "epoch": 2805} {"train_loss": -6.459522247314453, "global_step": 117845, "epoch": 2805} {"train_loss": -6.457222938537598, "global_step": 117846, "epoch": 2805} {"train_loss": -6.525678634643555, "global_step": 117847, "epoch": 2805} {"train_loss": -6.647411823272705, "global_step": 117848, "epoch": 2805} {"train_loss": -6.5690717697143555, "global_step": 117849, "epoch": 2805} {"train_loss": -6.5182037353515625, "global_step": 117850, "epoch": 2805} {"train_loss": -6.553892124266851, "global_step": 117851, "epoch": 2805, "val_loss": 65613.7421875} {"train_loss": -6.386328220367432, "global_step": 117852, "epoch": 2806} {"train_loss": -6.503711700439453, "global_step": 117853, "epoch": 2806} {"train_loss": -6.589441299438477, "global_step": 117854, "epoch": 2806} {"train_loss": -6.432262420654297, "global_step": 117855, "epoch": 2806} {"train_loss": -6.547959327697754, "global_step": 117856, "epoch": 2806} {"train_loss": -6.550670623779297, "global_step": 117857, "epoch": 2806} {"train_loss": -6.402773857116699, "global_step": 117858, "epoch": 2806} {"train_loss": -6.4786481857299805, "global_step": 117859, "epoch": 2806} {"train_loss": -6.545143127441406, "global_step": 117860, "epoch": 2806} {"train_loss": -6.5839972496032715, "global_step": 117861, "epoch": 2806} {"train_loss": -6.563282012939453, "global_step": 117862, "epoch": 2806} {"train_loss": -6.601889133453369, "global_step": 117863, "epoch": 2806} {"train_loss": -6.551087379455566, "global_step": 117864, "epoch": 2806} {"train_loss": -6.6436052322387695, "global_step": 117865, "epoch": 2806} {"train_loss": -6.4500837326049805, "global_step": 117866, "epoch": 2806} {"train_loss": -6.423586368560791, "global_step": 117867, "epoch": 2806} {"train_loss": -6.570010185241699, "global_step": 117868, "epoch": 2806} {"train_loss": -6.648372650146484, "global_step": 117869, "epoch": 2806} {"train_loss": -6.572561264038086, "global_step": 117870, "epoch": 2806} {"train_loss": -6.54022216796875, "global_step": 117871, "epoch": 2806} {"train_loss": -6.512601852416992, "global_step": 117872, "epoch": 2806} {"train_loss": -6.575908660888672, "global_step": 117873, "epoch": 2806} {"train_loss": -6.483636856079102, "global_step": 117874, "epoch": 2806} {"train_loss": -6.655705451965332, "global_step": 117875, "epoch": 2806} {"train_loss": -6.590790748596191, "global_step": 117876, "epoch": 2806} {"train_loss": -6.624922752380371, "global_step": 117877, "epoch": 2806} {"train_loss": -6.61713981628418, "global_step": 117878, "epoch": 2806} {"train_loss": -6.528717994689941, "global_step": 117879, "epoch": 2806} {"train_loss": -6.59568977355957, "global_step": 117880, "epoch": 2806} {"train_loss": -6.525213718414307, "global_step": 117881, "epoch": 2806} {"train_loss": -6.596428871154785, "global_step": 117882, "epoch": 2806} {"train_loss": -6.563973426818848, "global_step": 117883, "epoch": 2806} {"train_loss": -6.626123428344727, "global_step": 117884, "epoch": 2806} {"train_loss": -6.638047218322754, "global_step": 117885, "epoch": 2806} {"train_loss": -6.564765930175781, "global_step": 117886, "epoch": 2806} {"train_loss": -6.491873741149902, "global_step": 117887, "epoch": 2806} {"train_loss": -6.567936420440674, "global_step": 117888, "epoch": 2806} {"train_loss": -6.531026840209961, "global_step": 117889, "epoch": 2806} {"train_loss": -6.51385498046875, "global_step": 117890, "epoch": 2806} {"train_loss": -6.409368991851807, "global_step": 117891, "epoch": 2806} {"train_loss": -6.512801170349121, "global_step": 117892, "epoch": 2806} {"train_loss": -6.544759035110474, "global_step": 117893, "epoch": 2806, "val_loss": 65635.8515625} {"train_loss": -6.5860185623168945, "global_step": 117894, "epoch": 2807} {"train_loss": -6.591728687286377, "global_step": 117895, "epoch": 2807} {"train_loss": -6.538971900939941, "global_step": 117896, "epoch": 2807} {"train_loss": -6.6207427978515625, "global_step": 117897, "epoch": 2807} {"train_loss": -6.583341598510742, "global_step": 117898, "epoch": 2807} {"train_loss": -6.603556156158447, "global_step": 117899, "epoch": 2807} {"train_loss": -6.710787296295166, "global_step": 117900, "epoch": 2807} {"train_loss": -6.4253249168396, "global_step": 117901, "epoch": 2807} {"train_loss": -6.42485237121582, "global_step": 117902, "epoch": 2807} {"train_loss": -6.562660217285156, "global_step": 117903, "epoch": 2807} {"train_loss": -6.478911399841309, "global_step": 117904, "epoch": 2807} {"train_loss": -6.476118087768555, "global_step": 117905, "epoch": 2807} {"train_loss": -6.561687469482422, "global_step": 117906, "epoch": 2807} {"train_loss": -6.569545269012451, "global_step": 117907, "epoch": 2807} {"train_loss": -6.550168991088867, "global_step": 117908, "epoch": 2807} {"train_loss": -6.536157131195068, "global_step": 117909, "epoch": 2807} {"train_loss": -6.462376117706299, "global_step": 117910, "epoch": 2807} {"train_loss": -6.583956241607666, "global_step": 117911, "epoch": 2807} {"train_loss": -6.577780723571777, "global_step": 117912, "epoch": 2807} {"train_loss": -6.502713203430176, "global_step": 117913, "epoch": 2807} {"train_loss": -6.701338768005371, "global_step": 117914, "epoch": 2807} {"train_loss": -6.480340957641602, "global_step": 117915, "epoch": 2807} {"train_loss": -6.553140640258789, "global_step": 117916, "epoch": 2807} {"train_loss": -6.564860820770264, "global_step": 117917, "epoch": 2807} {"train_loss": -6.408750534057617, "global_step": 117918, "epoch": 2807} {"train_loss": -6.4387288093566895, "global_step": 117919, "epoch": 2807} {"train_loss": -6.583547115325928, "global_step": 117920, "epoch": 2807} {"train_loss": -6.4234299659729, "global_step": 117921, "epoch": 2807} {"train_loss": -6.453754425048828, "global_step": 117922, "epoch": 2807} {"train_loss": -6.462665557861328, "global_step": 117923, "epoch": 2807} {"train_loss": -6.505884647369385, "global_step": 117924, "epoch": 2807} {"train_loss": -6.622308731079102, "global_step": 117925, "epoch": 2807} {"train_loss": -6.495521545410156, "global_step": 117926, "epoch": 2807} {"train_loss": -6.573643684387207, "global_step": 117927, "epoch": 2807} {"train_loss": -6.549981594085693, "global_step": 117928, "epoch": 2807} {"train_loss": -6.509429931640625, "global_step": 117929, "epoch": 2807} {"train_loss": -6.472988605499268, "global_step": 117930, "epoch": 2807} {"train_loss": -6.444474697113037, "global_step": 117931, "epoch": 2807} {"train_loss": -6.530935764312744, "global_step": 117932, "epoch": 2807} {"train_loss": -6.612422466278076, "global_step": 117933, "epoch": 2807} {"train_loss": -6.446308612823486, "global_step": 117934, "epoch": 2807} {"train_loss": -6.52944210597447, "global_step": 117935, "epoch": 2807, "val_loss": 65688.4453125} {"train_loss": -6.449291706085205, "global_step": 117936, "epoch": 2808} {"train_loss": -6.478519439697266, "global_step": 117937, "epoch": 2808} {"train_loss": -6.6018171310424805, "global_step": 117938, "epoch": 2808} {"train_loss": -6.564306259155273, "global_step": 117939, "epoch": 2808} {"train_loss": -6.567246913909912, "global_step": 117940, "epoch": 2808} {"train_loss": -6.561633110046387, "global_step": 117941, "epoch": 2808} {"train_loss": -6.478941917419434, "global_step": 117942, "epoch": 2808} {"train_loss": -6.486888885498047, "global_step": 117943, "epoch": 2808} {"train_loss": -6.427577972412109, "global_step": 117944, "epoch": 2808} {"train_loss": -6.537477016448975, "global_step": 117945, "epoch": 2808} {"train_loss": -6.493675231933594, "global_step": 117946, "epoch": 2808} {"train_loss": -6.635489463806152, "global_step": 117947, "epoch": 2808} {"train_loss": -6.509185791015625, "global_step": 117948, "epoch": 2808} {"train_loss": -6.526609420776367, "global_step": 117949, "epoch": 2808} {"train_loss": -6.654789924621582, "global_step": 117950, "epoch": 2808} {"train_loss": -6.583337306976318, "global_step": 117951, "epoch": 2808} {"train_loss": -6.643214225769043, "global_step": 117952, "epoch": 2808} {"train_loss": -6.613694190979004, "global_step": 117953, "epoch": 2808} {"train_loss": -6.540021896362305, "global_step": 117954, "epoch": 2808} {"train_loss": -6.676061630249023, "global_step": 117955, "epoch": 2808} {"train_loss": -6.633842468261719, "global_step": 117956, "epoch": 2808} {"train_loss": -6.667459487915039, "global_step": 117957, "epoch": 2808} {"train_loss": -6.605469703674316, "global_step": 117958, "epoch": 2808} {"train_loss": -6.570103645324707, "global_step": 117959, "epoch": 2808} {"train_loss": -6.552567005157471, "global_step": 117960, "epoch": 2808} {"train_loss": -6.688793182373047, "global_step": 117961, "epoch": 2808} {"train_loss": -6.609561443328857, "global_step": 117962, "epoch": 2808} {"train_loss": -6.514985084533691, "global_step": 117963, "epoch": 2808} {"train_loss": -6.681631565093994, "global_step": 117964, "epoch": 2808} {"train_loss": -6.622725486755371, "global_step": 117965, "epoch": 2808} {"train_loss": -6.5547966957092285, "global_step": 117966, "epoch": 2808} {"train_loss": -6.677714824676514, "global_step": 117967, "epoch": 2808} {"train_loss": -6.463094711303711, "global_step": 117968, "epoch": 2808} {"train_loss": -6.545833587646484, "global_step": 117969, "epoch": 2808} {"train_loss": -6.561941146850586, "global_step": 117970, "epoch": 2808} {"train_loss": -6.410762310028076, "global_step": 117971, "epoch": 2808} {"train_loss": -6.372729778289795, "global_step": 117972, "epoch": 2808} {"train_loss": -6.631031036376953, "global_step": 117973, "epoch": 2808} {"train_loss": -6.551388263702393, "global_step": 117974, "epoch": 2808} {"train_loss": -6.54039192199707, "global_step": 117975, "epoch": 2808} {"train_loss": -6.554015159606934, "global_step": 117976, "epoch": 2808} {"train_loss": -6.560684056509109, "global_step": 117977, "epoch": 2808, "val_loss": 65330.3046875} {"train_loss": -6.557358741760254, "global_step": 117978, "epoch": 2809} {"train_loss": -6.636105537414551, "global_step": 117979, "epoch": 2809} {"train_loss": -6.588735580444336, "global_step": 117980, "epoch": 2809} {"train_loss": -6.591919422149658, "global_step": 117981, "epoch": 2809} {"train_loss": -6.637840270996094, "global_step": 117982, "epoch": 2809} {"train_loss": -6.652898788452148, "global_step": 117983, "epoch": 2809} {"train_loss": -6.665169715881348, "global_step": 117984, "epoch": 2809} {"train_loss": -6.509855270385742, "global_step": 117985, "epoch": 2809} {"train_loss": -6.524290084838867, "global_step": 117986, "epoch": 2809} {"train_loss": -6.404689788818359, "global_step": 117987, "epoch": 2809} {"train_loss": -6.428761005401611, "global_step": 117988, "epoch": 2809} {"train_loss": -6.637592792510986, "global_step": 117989, "epoch": 2809} {"train_loss": -6.434200286865234, "global_step": 117990, "epoch": 2809} {"train_loss": -6.559006690979004, "global_step": 117991, "epoch": 2809} {"train_loss": -6.541436672210693, "global_step": 117992, "epoch": 2809} {"train_loss": -6.56704044342041, "global_step": 117993, "epoch": 2809} {"train_loss": -6.558689594268799, "global_step": 117994, "epoch": 2809} {"train_loss": -6.58260440826416, "global_step": 117995, "epoch": 2809} {"train_loss": -6.481479644775391, "global_step": 117996, "epoch": 2809} {"train_loss": -6.4475178718566895, "global_step": 117997, "epoch": 2809} {"train_loss": -6.474339008331299, "global_step": 117998, "epoch": 2809} {"train_loss": -6.418087959289551, "global_step": 117999, "epoch": 2809} {"train_loss": -6.579684257507324, "global_step": 118000, "epoch": 2809} {"train_loss": -6.358314514160156, "global_step": 118001, "epoch": 2809} {"train_loss": -6.575142860412598, "global_step": 118002, "epoch": 2809} {"train_loss": -6.529611587524414, "global_step": 118003, "epoch": 2809} {"train_loss": -6.490621566772461, "global_step": 118004, "epoch": 2809} {"train_loss": -6.388195037841797, "global_step": 118005, "epoch": 2809} {"train_loss": -6.463624954223633, "global_step": 118006, "epoch": 2809} {"train_loss": -6.517910957336426, "global_step": 118007, "epoch": 2809} {"train_loss": -6.515294075012207, "global_step": 118008, "epoch": 2809} {"train_loss": -6.472538948059082, "global_step": 118009, "epoch": 2809} {"train_loss": -6.556255340576172, "global_step": 118010, "epoch": 2809} {"train_loss": -6.418652057647705, "global_step": 118011, "epoch": 2809} {"train_loss": -6.509755611419678, "global_step": 118012, "epoch": 2809} {"train_loss": -6.424898147583008, "global_step": 118013, "epoch": 2809} {"train_loss": -6.485985279083252, "global_step": 118014, "epoch": 2809} {"train_loss": -6.616569519042969, "global_step": 118015, "epoch": 2809} {"train_loss": -6.536696434020996, "global_step": 118016, "epoch": 2809} {"train_loss": -6.549681663513184, "global_step": 118017, "epoch": 2809} {"train_loss": -6.551297664642334, "global_step": 118018, "epoch": 2809} {"train_loss": -6.5267924808320545, "global_step": 118019, "epoch": 2809, "val_loss": 65393.484375} {"train_loss": -6.517093181610107, "global_step": 118020, "epoch": 2810} {"train_loss": -6.592021465301514, "global_step": 118021, "epoch": 2810} {"train_loss": -6.5595574378967285, "global_step": 118022, "epoch": 2810} {"train_loss": -6.575494766235352, "global_step": 118023, "epoch": 2810} {"train_loss": -6.614260196685791, "global_step": 118024, "epoch": 2810} {"train_loss": -6.502624988555908, "global_step": 118025, "epoch": 2810} {"train_loss": -6.685128211975098, "global_step": 118026, "epoch": 2810} {"train_loss": -6.5324482917785645, "global_step": 118027, "epoch": 2810} {"train_loss": -6.501023292541504, "global_step": 118028, "epoch": 2810} {"train_loss": -6.600787162780762, "global_step": 118029, "epoch": 2810} {"train_loss": -6.587579727172852, "global_step": 118030, "epoch": 2810} {"train_loss": -6.505705833435059, "global_step": 118031, "epoch": 2810} {"train_loss": -6.49119758605957, "global_step": 118032, "epoch": 2810} {"train_loss": -6.691582679748535, "global_step": 118033, "epoch": 2810} {"train_loss": -6.455049514770508, "global_step": 118034, "epoch": 2810} {"train_loss": -6.515613555908203, "global_step": 118035, "epoch": 2810} {"train_loss": -6.593048572540283, "global_step": 118036, "epoch": 2810} {"train_loss": -6.517248630523682, "global_step": 118037, "epoch": 2810} {"train_loss": -6.478823661804199, "global_step": 118038, "epoch": 2810} {"train_loss": -6.457067489624023, "global_step": 118039, "epoch": 2810} {"train_loss": -6.541896343231201, "global_step": 118040, "epoch": 2810} {"train_loss": -6.530517578125, "global_step": 118041, "epoch": 2810} {"train_loss": -6.586264610290527, "global_step": 118042, "epoch": 2810} {"train_loss": -6.544540882110596, "global_step": 118043, "epoch": 2810} {"train_loss": -6.581471920013428, "global_step": 118044, "epoch": 2810} {"train_loss": -6.613223552703857, "global_step": 118045, "epoch": 2810} {"train_loss": -6.655710697174072, "global_step": 118046, "epoch": 2810} {"train_loss": -6.570282459259033, "global_step": 118047, "epoch": 2810} {"train_loss": -6.576959609985352, "global_step": 118048, "epoch": 2810} {"train_loss": -6.5768632888793945, "global_step": 118049, "epoch": 2810} {"train_loss": -6.640466690063477, "global_step": 118050, "epoch": 2810} {"train_loss": -6.467988967895508, "global_step": 118051, "epoch": 2810} {"train_loss": -6.45353889465332, "global_step": 118052, "epoch": 2810} {"train_loss": -6.602283954620361, "global_step": 118053, "epoch": 2810} {"train_loss": -6.486418724060059, "global_step": 118054, "epoch": 2810} {"train_loss": -6.631667613983154, "global_step": 118055, "epoch": 2810} {"train_loss": -6.526586532592773, "global_step": 118056, "epoch": 2810} {"train_loss": -6.4309844970703125, "global_step": 118057, "epoch": 2810} {"train_loss": -6.633112907409668, "global_step": 118058, "epoch": 2810} {"train_loss": -6.594648361206055, "global_step": 118059, "epoch": 2810} {"train_loss": -6.524937629699707, "global_step": 118060, "epoch": 2810} {"train_loss": -6.555468354906354, "global_step": 118061, "epoch": 2810, "val_loss": 65597.8671875} {"train_loss": -6.539048194885254, "global_step": 118062, "epoch": 2811} {"train_loss": -6.4546427726745605, "global_step": 118063, "epoch": 2811} {"train_loss": -6.553731918334961, "global_step": 118064, "epoch": 2811} {"train_loss": -6.500539302825928, "global_step": 118065, "epoch": 2811} {"train_loss": -6.4756364822387695, "global_step": 118066, "epoch": 2811} {"train_loss": -6.546411037445068, "global_step": 118067, "epoch": 2811} {"train_loss": -6.477239608764648, "global_step": 118068, "epoch": 2811} {"train_loss": -6.528163909912109, "global_step": 118069, "epoch": 2811} {"train_loss": -6.6128621101379395, "global_step": 118070, "epoch": 2811} {"train_loss": -6.551918029785156, "global_step": 118071, "epoch": 2811} {"train_loss": -6.581550121307373, "global_step": 118072, "epoch": 2811} {"train_loss": -6.608841419219971, "global_step": 118073, "epoch": 2811} {"train_loss": -6.510491371154785, "global_step": 118074, "epoch": 2811} {"train_loss": -6.5273590087890625, "global_step": 118075, "epoch": 2811} {"train_loss": -6.513985633850098, "global_step": 118076, "epoch": 2811} {"train_loss": -6.611361980438232, "global_step": 118077, "epoch": 2811} {"train_loss": -6.565637111663818, "global_step": 118078, "epoch": 2811} {"train_loss": -6.6771159172058105, "global_step": 118079, "epoch": 2811} {"train_loss": -6.530874252319336, "global_step": 118080, "epoch": 2811} {"train_loss": -6.5809478759765625, "global_step": 118081, "epoch": 2811} {"train_loss": -6.60500431060791, "global_step": 118082, "epoch": 2811} {"train_loss": -6.543546676635742, "global_step": 118083, "epoch": 2811} {"train_loss": -6.482884407043457, "global_step": 118084, "epoch": 2811} {"train_loss": -6.55855655670166, "global_step": 118085, "epoch": 2811} {"train_loss": -6.560029983520508, "global_step": 118086, "epoch": 2811} {"train_loss": -6.534995079040527, "global_step": 118087, "epoch": 2811} {"train_loss": -6.6408514976501465, "global_step": 118088, "epoch": 2811} {"train_loss": -6.602841854095459, "global_step": 118089, "epoch": 2811} {"train_loss": -6.541409015655518, "global_step": 118090, "epoch": 2811} {"train_loss": -6.56805419921875, "global_step": 118091, "epoch": 2811} {"train_loss": -6.593869209289551, "global_step": 118092, "epoch": 2811} {"train_loss": -6.609499931335449, "global_step": 118093, "epoch": 2811} {"train_loss": -6.644876956939697, "global_step": 118094, "epoch": 2811} {"train_loss": -6.638125419616699, "global_step": 118095, "epoch": 2811} {"train_loss": -6.622568130493164, "global_step": 118096, "epoch": 2811} {"train_loss": -6.455460548400879, "global_step": 118097, "epoch": 2811} {"train_loss": -6.653596878051758, "global_step": 118098, "epoch": 2811} {"train_loss": -6.573907375335693, "global_step": 118099, "epoch": 2811} {"train_loss": -6.4974870681762695, "global_step": 118100, "epoch": 2811} {"train_loss": -6.476298809051514, "global_step": 118101, "epoch": 2811} {"train_loss": -6.569594383239746, "global_step": 118102, "epoch": 2811} {"train_loss": -6.560245332263765, "global_step": 118103, "epoch": 2811, "val_loss": 65752.609375} {"train_loss": -6.547560214996338, "global_step": 118104, "epoch": 2812} {"train_loss": -6.603669166564941, "global_step": 118105, "epoch": 2812} {"train_loss": -6.521562099456787, "global_step": 118106, "epoch": 2812} {"train_loss": -6.437009334564209, "global_step": 118107, "epoch": 2812} {"train_loss": -6.553428649902344, "global_step": 118108, "epoch": 2812} {"train_loss": -6.703227996826172, "global_step": 118109, "epoch": 2812} {"train_loss": -6.6040358543396, "global_step": 118110, "epoch": 2812} {"train_loss": -6.696529865264893, "global_step": 118111, "epoch": 2812} {"train_loss": -6.533332824707031, "global_step": 118112, "epoch": 2812} {"train_loss": -6.553638458251953, "global_step": 118113, "epoch": 2812} {"train_loss": -6.644723415374756, "global_step": 118114, "epoch": 2812} {"train_loss": -6.512784004211426, "global_step": 118115, "epoch": 2812} {"train_loss": -6.536568641662598, "global_step": 118116, "epoch": 2812} {"train_loss": -6.542170524597168, "global_step": 118117, "epoch": 2812} {"train_loss": -6.598651885986328, "global_step": 118118, "epoch": 2812} {"train_loss": -6.657982349395752, "global_step": 118119, "epoch": 2812} {"train_loss": -6.673818588256836, "global_step": 118120, "epoch": 2812} {"train_loss": -6.5600266456604, "global_step": 118121, "epoch": 2812} {"train_loss": -6.635354042053223, "global_step": 118122, "epoch": 2812} {"train_loss": -6.491599082946777, "global_step": 118123, "epoch": 2812} {"train_loss": -6.667211055755615, "global_step": 118124, "epoch": 2812} {"train_loss": -6.630509376525879, "global_step": 118125, "epoch": 2812} {"train_loss": -6.51140022277832, "global_step": 118126, "epoch": 2812} {"train_loss": -6.682642936706543, "global_step": 118127, "epoch": 2812} {"train_loss": -6.728436470031738, "global_step": 118128, "epoch": 2812} {"train_loss": -6.579528331756592, "global_step": 118129, "epoch": 2812} {"train_loss": -6.505967617034912, "global_step": 118130, "epoch": 2812} {"train_loss": -6.508889675140381, "global_step": 118131, "epoch": 2812} {"train_loss": -6.434733867645264, "global_step": 118132, "epoch": 2812} {"train_loss": -6.609620094299316, "global_step": 118133, "epoch": 2812} {"train_loss": -6.571629524230957, "global_step": 118134, "epoch": 2812} {"train_loss": -6.660219192504883, "global_step": 118135, "epoch": 2812} {"train_loss": -6.531492233276367, "global_step": 118136, "epoch": 2812} {"train_loss": -6.577671527862549, "global_step": 118137, "epoch": 2812} {"train_loss": -6.582721710205078, "global_step": 118138, "epoch": 2812} {"train_loss": -6.619002342224121, "global_step": 118139, "epoch": 2812} {"train_loss": -6.525085926055908, "global_step": 118140, "epoch": 2812} {"train_loss": -6.548055171966553, "global_step": 118141, "epoch": 2812} {"train_loss": -6.575351715087891, "global_step": 118142, "epoch": 2812} {"train_loss": -6.59517240524292, "global_step": 118143, "epoch": 2812} {"train_loss": -6.573688507080078, "global_step": 118144, "epoch": 2812} {"train_loss": -6.580002603076753, "global_step": 118145, "epoch": 2812, "val_loss": 65673.09375} {"train_loss": -6.644800186157227, "global_step": 118146, "epoch": 2813} {"train_loss": -6.494388580322266, "global_step": 118147, "epoch": 2813} {"train_loss": -6.497597694396973, "global_step": 118148, "epoch": 2813} {"train_loss": -6.540487289428711, "global_step": 118149, "epoch": 2813} {"train_loss": -6.533059120178223, "global_step": 118150, "epoch": 2813} {"train_loss": -6.549648761749268, "global_step": 118151, "epoch": 2813} {"train_loss": -6.487936019897461, "global_step": 118152, "epoch": 2813} {"train_loss": -6.638895511627197, "global_step": 118153, "epoch": 2813} {"train_loss": -6.600883483886719, "global_step": 118154, "epoch": 2813} {"train_loss": -6.664307117462158, "global_step": 118155, "epoch": 2813} {"train_loss": -6.500537872314453, "global_step": 118156, "epoch": 2813} {"train_loss": -6.467870712280273, "global_step": 118157, "epoch": 2813} {"train_loss": -6.44517707824707, "global_step": 118158, "epoch": 2813} {"train_loss": -6.522247314453125, "global_step": 118159, "epoch": 2813} {"train_loss": -6.433437347412109, "global_step": 118160, "epoch": 2813} {"train_loss": -6.596563339233398, "global_step": 118161, "epoch": 2813} {"train_loss": -6.496077060699463, "global_step": 118162, "epoch": 2813} {"train_loss": -6.395575046539307, "global_step": 118163, "epoch": 2813} {"train_loss": -6.42719841003418, "global_step": 118164, "epoch": 2813} {"train_loss": -6.468479156494141, "global_step": 118165, "epoch": 2813} {"train_loss": -6.530544281005859, "global_step": 118166, "epoch": 2813} {"train_loss": -6.598729610443115, "global_step": 118167, "epoch": 2813} {"train_loss": -6.536613941192627, "global_step": 118168, "epoch": 2813} {"train_loss": -6.429544448852539, "global_step": 118169, "epoch": 2813} {"train_loss": -6.545340538024902, "global_step": 118170, "epoch": 2813} {"train_loss": -6.575488567352295, "global_step": 118171, "epoch": 2813} {"train_loss": -6.4909539222717285, "global_step": 118172, "epoch": 2813} {"train_loss": -6.551924228668213, "global_step": 118173, "epoch": 2813} {"train_loss": -6.516222953796387, "global_step": 118174, "epoch": 2813} {"train_loss": -6.334286689758301, "global_step": 118175, "epoch": 2813} {"train_loss": -6.3919525146484375, "global_step": 118176, "epoch": 2813} {"train_loss": -6.448835372924805, "global_step": 118177, "epoch": 2813} {"train_loss": -6.510733604431152, "global_step": 118178, "epoch": 2813} {"train_loss": -6.400158882141113, "global_step": 118179, "epoch": 2813} {"train_loss": -6.482872009277344, "global_step": 118180, "epoch": 2813} {"train_loss": -6.553035736083984, "global_step": 118181, "epoch": 2813} {"train_loss": -6.578868389129639, "global_step": 118182, "epoch": 2813} {"train_loss": -6.52159309387207, "global_step": 118183, "epoch": 2813} {"train_loss": -6.448108196258545, "global_step": 118184, "epoch": 2813} {"train_loss": -6.561913013458252, "global_step": 118185, "epoch": 2813} {"train_loss": -6.381365776062012, "global_step": 118186, "epoch": 2813} {"train_loss": -6.511801617486136, "global_step": 118187, "epoch": 2813, "val_loss": 65690.8515625} {"train_loss": -6.56839656829834, "global_step": 118188, "epoch": 2814} {"train_loss": -6.425471305847168, "global_step": 118189, "epoch": 2814} {"train_loss": -6.608494758605957, "global_step": 118190, "epoch": 2814} {"train_loss": -6.5683417320251465, "global_step": 118191, "epoch": 2814} {"train_loss": -6.548816680908203, "global_step": 118192, "epoch": 2814} {"train_loss": -6.548999309539795, "global_step": 118193, "epoch": 2814} {"train_loss": -6.615303039550781, "global_step": 118194, "epoch": 2814} {"train_loss": -6.41424560546875, "global_step": 118195, "epoch": 2814} {"train_loss": -6.439049243927002, "global_step": 118196, "epoch": 2814} {"train_loss": -6.570399761199951, "global_step": 118197, "epoch": 2814} {"train_loss": -6.5180983543396, "global_step": 118198, "epoch": 2814} {"train_loss": -6.599388599395752, "global_step": 118199, "epoch": 2814} {"train_loss": -6.422280311584473, "global_step": 118200, "epoch": 2814} {"train_loss": -6.454563617706299, "global_step": 118201, "epoch": 2814} {"train_loss": -6.579555511474609, "global_step": 118202, "epoch": 2814} {"train_loss": -6.530032157897949, "global_step": 118203, "epoch": 2814} {"train_loss": -6.423379898071289, "global_step": 118204, "epoch": 2814} {"train_loss": -6.546568393707275, "global_step": 118205, "epoch": 2814} {"train_loss": -6.5014872550964355, "global_step": 118206, "epoch": 2814} {"train_loss": -6.555471420288086, "global_step": 118207, "epoch": 2814} {"train_loss": -6.716136932373047, "global_step": 118208, "epoch": 2814} {"train_loss": -6.5585174560546875, "global_step": 118209, "epoch": 2814} {"train_loss": -6.551238059997559, "global_step": 118210, "epoch": 2814} {"train_loss": -6.587948799133301, "global_step": 118211, "epoch": 2814} {"train_loss": -6.525700569152832, "global_step": 118212, "epoch": 2814} {"train_loss": -6.561703681945801, "global_step": 118213, "epoch": 2814} {"train_loss": -6.448031425476074, "global_step": 118214, "epoch": 2814} {"train_loss": -6.512278079986572, "global_step": 118215, "epoch": 2814} {"train_loss": -6.626235008239746, "global_step": 118216, "epoch": 2814} {"train_loss": -6.4600324630737305, "global_step": 118217, "epoch": 2814} {"train_loss": -6.509471893310547, "global_step": 118218, "epoch": 2814} {"train_loss": -6.486027717590332, "global_step": 118219, "epoch": 2814} {"train_loss": -6.494937896728516, "global_step": 118220, "epoch": 2814} {"train_loss": -6.511394500732422, "global_step": 118221, "epoch": 2814} {"train_loss": -6.461530685424805, "global_step": 118222, "epoch": 2814} {"train_loss": -6.538135528564453, "global_step": 118223, "epoch": 2814} {"train_loss": -6.476932525634766, "global_step": 118224, "epoch": 2814} {"train_loss": -6.324717998504639, "global_step": 118225, "epoch": 2814} {"train_loss": -6.4834747314453125, "global_step": 118226, "epoch": 2814} {"train_loss": -6.388765335083008, "global_step": 118227, "epoch": 2814} {"train_loss": -6.515012741088867, "global_step": 118228, "epoch": 2814} {"train_loss": -6.516239892868769, "global_step": 118229, "epoch": 2814, "val_loss": 65528.91796875} {"train_loss": -6.598675727844238, "global_step": 118230, "epoch": 2815} {"train_loss": -6.5714616775512695, "global_step": 118231, "epoch": 2815} {"train_loss": -6.618727207183838, "global_step": 118232, "epoch": 2815} {"train_loss": -6.517827987670898, "global_step": 118233, "epoch": 2815} {"train_loss": -6.480595588684082, "global_step": 118234, "epoch": 2815} {"train_loss": -6.575531959533691, "global_step": 118235, "epoch": 2815} {"train_loss": -6.614583969116211, "global_step": 118236, "epoch": 2815} {"train_loss": -6.586827754974365, "global_step": 118237, "epoch": 2815} {"train_loss": -6.450462341308594, "global_step": 118238, "epoch": 2815} {"train_loss": -6.554731369018555, "global_step": 118239, "epoch": 2815} {"train_loss": -6.574350357055664, "global_step": 118240, "epoch": 2815} {"train_loss": -6.612666130065918, "global_step": 118241, "epoch": 2815} {"train_loss": -6.556495189666748, "global_step": 118242, "epoch": 2815} {"train_loss": -6.577596664428711, "global_step": 118243, "epoch": 2815} {"train_loss": -6.5854573249816895, "global_step": 118244, "epoch": 2815} {"train_loss": -6.61778450012207, "global_step": 118245, "epoch": 2815} {"train_loss": -6.546514511108398, "global_step": 118246, "epoch": 2815} {"train_loss": -6.495364189147949, "global_step": 118247, "epoch": 2815} {"train_loss": -6.513311862945557, "global_step": 118248, "epoch": 2815} {"train_loss": -6.612457275390625, "global_step": 118249, "epoch": 2815} {"train_loss": -6.420616626739502, "global_step": 118250, "epoch": 2815} {"train_loss": -6.6004767417907715, "global_step": 118251, "epoch": 2815} {"train_loss": -6.476395130157471, "global_step": 118252, "epoch": 2815} {"train_loss": -6.6473588943481445, "global_step": 118253, "epoch": 2815} {"train_loss": -6.575048446655273, "global_step": 118254, "epoch": 2815} {"train_loss": -6.643360137939453, "global_step": 118255, "epoch": 2815} {"train_loss": -6.5290374755859375, "global_step": 118256, "epoch": 2815} {"train_loss": -6.540079593658447, "global_step": 118257, "epoch": 2815} {"train_loss": -6.460670471191406, "global_step": 118258, "epoch": 2815} {"train_loss": -6.596782684326172, "global_step": 118259, "epoch": 2815} {"train_loss": -6.609987735748291, "global_step": 118260, "epoch": 2815} {"train_loss": -6.604423522949219, "global_step": 118261, "epoch": 2815} {"train_loss": -6.544980049133301, "global_step": 118262, "epoch": 2815} {"train_loss": -6.598549842834473, "global_step": 118263, "epoch": 2815} {"train_loss": -6.554092884063721, "global_step": 118264, "epoch": 2815} {"train_loss": -6.501821041107178, "global_step": 118265, "epoch": 2815} {"train_loss": -6.528007984161377, "global_step": 118266, "epoch": 2815} {"train_loss": -6.672238826751709, "global_step": 118267, "epoch": 2815} {"train_loss": -6.621085166931152, "global_step": 118268, "epoch": 2815} {"train_loss": -6.489843845367432, "global_step": 118269, "epoch": 2815} {"train_loss": -6.6203131675720215, "global_step": 118270, "epoch": 2815} {"train_loss": -6.561666761125837, "global_step": 118271, "epoch": 2815, "val_loss": 65470.28125} {"train_loss": -6.559699058532715, "global_step": 118272, "epoch": 2816} {"train_loss": -6.574824810028076, "global_step": 118273, "epoch": 2816} {"train_loss": -6.493612289428711, "global_step": 118274, "epoch": 2816} {"train_loss": -6.607366561889648, "global_step": 118275, "epoch": 2816} {"train_loss": -6.607668876647949, "global_step": 118276, "epoch": 2816} {"train_loss": -6.584687232971191, "global_step": 118277, "epoch": 2816} {"train_loss": -6.665569305419922, "global_step": 118278, "epoch": 2816} {"train_loss": -6.603250026702881, "global_step": 118279, "epoch": 2816} {"train_loss": -6.510462760925293, "global_step": 118280, "epoch": 2816} {"train_loss": -6.532508850097656, "global_step": 118281, "epoch": 2816} {"train_loss": -6.48106575012207, "global_step": 118282, "epoch": 2816} {"train_loss": -6.483769416809082, "global_step": 118283, "epoch": 2816} {"train_loss": -6.532269477844238, "global_step": 118284, "epoch": 2816} {"train_loss": -6.549417972564697, "global_step": 118285, "epoch": 2816} {"train_loss": -6.574930191040039, "global_step": 118286, "epoch": 2816} {"train_loss": -6.68828010559082, "global_step": 118287, "epoch": 2816} {"train_loss": -6.664486408233643, "global_step": 118288, "epoch": 2816} {"train_loss": -6.571646690368652, "global_step": 118289, "epoch": 2816} {"train_loss": -6.434404373168945, "global_step": 118290, "epoch": 2816} {"train_loss": -6.425556182861328, "global_step": 118291, "epoch": 2816} {"train_loss": -6.676335334777832, "global_step": 118292, "epoch": 2816} {"train_loss": -6.634875774383545, "global_step": 118293, "epoch": 2816} {"train_loss": -6.564760208129883, "global_step": 118294, "epoch": 2816} {"train_loss": -6.56981897354126, "global_step": 118295, "epoch": 2816} {"train_loss": -6.605298042297363, "global_step": 118296, "epoch": 2816} {"train_loss": -6.5269775390625, "global_step": 118297, "epoch": 2816} {"train_loss": -6.51483154296875, "global_step": 118298, "epoch": 2816} {"train_loss": -6.5137128829956055, "global_step": 118299, "epoch": 2816} {"train_loss": -6.673426628112793, "global_step": 118300, "epoch": 2816} {"train_loss": -6.586467266082764, "global_step": 118301, "epoch": 2816} {"train_loss": -6.616644859313965, "global_step": 118302, "epoch": 2816} {"train_loss": -6.631655216217041, "global_step": 118303, "epoch": 2816} {"train_loss": -6.59623908996582, "global_step": 118304, "epoch": 2816} {"train_loss": -6.569870471954346, "global_step": 118305, "epoch": 2816} {"train_loss": -6.606769561767578, "global_step": 118306, "epoch": 2816} {"train_loss": -6.546839714050293, "global_step": 118307, "epoch": 2816} {"train_loss": -6.5654706954956055, "global_step": 118308, "epoch": 2816} {"train_loss": -6.562923908233643, "global_step": 118309, "epoch": 2816} {"train_loss": -6.632241725921631, "global_step": 118310, "epoch": 2816} {"train_loss": -6.564803123474121, "global_step": 118311, "epoch": 2816} {"train_loss": -6.575483322143555, "global_step": 118312, "epoch": 2816} {"train_loss": -6.571346805209205, "global_step": 118313, "epoch": 2816, "val_loss": 65679.9140625} {"train_loss": -6.59328556060791, "global_step": 118314, "epoch": 2817} {"train_loss": -6.555604457855225, "global_step": 118315, "epoch": 2817} {"train_loss": -6.561477184295654, "global_step": 118316, "epoch": 2817} {"train_loss": -6.51516056060791, "global_step": 118317, "epoch": 2817} {"train_loss": -6.579036235809326, "global_step": 118318, "epoch": 2817} {"train_loss": -6.718949317932129, "global_step": 118319, "epoch": 2817} {"train_loss": -6.5456719398498535, "global_step": 118320, "epoch": 2817} {"train_loss": -6.615370750427246, "global_step": 118321, "epoch": 2817} {"train_loss": -6.500999927520752, "global_step": 118322, "epoch": 2817} {"train_loss": -6.603252410888672, "global_step": 118323, "epoch": 2817} {"train_loss": -6.605921745300293, "global_step": 118324, "epoch": 2817} {"train_loss": -6.60118293762207, "global_step": 118325, "epoch": 2817} {"train_loss": -6.670079708099365, "global_step": 118326, "epoch": 2817} {"train_loss": -6.557618141174316, "global_step": 118327, "epoch": 2817} {"train_loss": -6.600970268249512, "global_step": 118328, "epoch": 2817} {"train_loss": -6.486307144165039, "global_step": 118329, "epoch": 2817} {"train_loss": -6.656105995178223, "global_step": 118330, "epoch": 2817} {"train_loss": -6.519244194030762, "global_step": 118331, "epoch": 2817} {"train_loss": -6.56984281539917, "global_step": 118332, "epoch": 2817} {"train_loss": -6.516568183898926, "global_step": 118333, "epoch": 2817} {"train_loss": -6.521556377410889, "global_step": 118334, "epoch": 2817} {"train_loss": -6.561382293701172, "global_step": 118335, "epoch": 2817} {"train_loss": -6.440539836883545, "global_step": 118336, "epoch": 2817} {"train_loss": -6.588443756103516, "global_step": 118337, "epoch": 2817} {"train_loss": -6.604066848754883, "global_step": 118338, "epoch": 2817} {"train_loss": -6.533149719238281, "global_step": 118339, "epoch": 2817} {"train_loss": -6.476689338684082, "global_step": 118340, "epoch": 2817} {"train_loss": -6.594554901123047, "global_step": 118341, "epoch": 2817} {"train_loss": -6.653660774230957, "global_step": 118342, "epoch": 2817} {"train_loss": -6.459826469421387, "global_step": 118343, "epoch": 2817} {"train_loss": -6.4843645095825195, "global_step": 118344, "epoch": 2817} {"train_loss": -6.533952713012695, "global_step": 118345, "epoch": 2817} {"train_loss": -6.686773300170898, "global_step": 118346, "epoch": 2817} {"train_loss": -6.479028701782227, "global_step": 118347, "epoch": 2817} {"train_loss": -6.537022113800049, "global_step": 118348, "epoch": 2817} {"train_loss": -6.580894470214844, "global_step": 118349, "epoch": 2817} {"train_loss": -6.519482612609863, "global_step": 118350, "epoch": 2817} {"train_loss": -6.614386558532715, "global_step": 118351, "epoch": 2817} {"train_loss": -6.597229957580566, "global_step": 118352, "epoch": 2817} {"train_loss": -6.505946636199951, "global_step": 118353, "epoch": 2817} {"train_loss": -6.580362319946289, "global_step": 118354, "epoch": 2817} {"train_loss": -6.560638030370076, "global_step": 118355, "epoch": 2817, "val_loss": 65767.625} {"train_loss": -6.461616516113281, "global_step": 118356, "epoch": 2818} {"train_loss": -6.5947675704956055, "global_step": 118357, "epoch": 2818} {"train_loss": -6.392644882202148, "global_step": 118358, "epoch": 2818} {"train_loss": -6.612841606140137, "global_step": 118359, "epoch": 2818} {"train_loss": -6.353193283081055, "global_step": 118360, "epoch": 2818} {"train_loss": -6.3821516036987305, "global_step": 118361, "epoch": 2818} {"train_loss": -6.555451393127441, "global_step": 118362, "epoch": 2818} {"train_loss": -6.530229568481445, "global_step": 118363, "epoch": 2818} {"train_loss": -6.518087863922119, "global_step": 118364, "epoch": 2818} {"train_loss": -6.613492965698242, "global_step": 118365, "epoch": 2818} {"train_loss": -6.392330169677734, "global_step": 118366, "epoch": 2818} {"train_loss": -6.433043003082275, "global_step": 118367, "epoch": 2818} {"train_loss": -6.516651153564453, "global_step": 118368, "epoch": 2818} {"train_loss": -6.6148200035095215, "global_step": 118369, "epoch": 2818} {"train_loss": -6.54896354675293, "global_step": 118370, "epoch": 2818} {"train_loss": -6.427894115447998, "global_step": 118371, "epoch": 2818} {"train_loss": -6.5474629402160645, "global_step": 118372, "epoch": 2818} {"train_loss": -6.251645088195801, "global_step": 118373, "epoch": 2818} {"train_loss": -6.534607887268066, "global_step": 118374, "epoch": 2818} {"train_loss": -6.453490734100342, "global_step": 118375, "epoch": 2818} {"train_loss": -6.5151166915893555, "global_step": 118376, "epoch": 2818} {"train_loss": -6.500520706176758, "global_step": 118377, "epoch": 2818} {"train_loss": -6.409274578094482, "global_step": 118378, "epoch": 2818} {"train_loss": -6.580537796020508, "global_step": 118379, "epoch": 2818} {"train_loss": -6.504940986633301, "global_step": 118380, "epoch": 2818} {"train_loss": -6.5170207023620605, "global_step": 118381, "epoch": 2818} {"train_loss": -6.399725914001465, "global_step": 118382, "epoch": 2818} {"train_loss": -6.507823944091797, "global_step": 118383, "epoch": 2818} {"train_loss": -6.510026454925537, "global_step": 118384, "epoch": 2818} {"train_loss": -6.537774085998535, "global_step": 118385, "epoch": 2818} {"train_loss": -6.512478828430176, "global_step": 118386, "epoch": 2818} {"train_loss": -6.353264808654785, "global_step": 118387, "epoch": 2818} {"train_loss": -6.461982727050781, "global_step": 118388, "epoch": 2818} {"train_loss": -6.535053730010986, "global_step": 118389, "epoch": 2818} {"train_loss": -6.49164342880249, "global_step": 118390, "epoch": 2818} {"train_loss": -6.5793352127075195, "global_step": 118391, "epoch": 2818} {"train_loss": -6.556092262268066, "global_step": 118392, "epoch": 2818} {"train_loss": -6.528748989105225, "global_step": 118393, "epoch": 2818} {"train_loss": -6.620388984680176, "global_step": 118394, "epoch": 2818} {"train_loss": -6.594954013824463, "global_step": 118395, "epoch": 2818} {"train_loss": -6.513881206512451, "global_step": 118396, "epoch": 2818} {"train_loss": -6.50009806950887, "global_step": 118397, "epoch": 2818, "val_loss": 65775.03125} {"train_loss": -6.57258415222168, "global_step": 118398, "epoch": 2819} {"train_loss": -6.523188591003418, "global_step": 118399, "epoch": 2819} {"train_loss": -6.541013717651367, "global_step": 118400, "epoch": 2819} {"train_loss": -6.561162948608398, "global_step": 118401, "epoch": 2819} {"train_loss": -6.597042083740234, "global_step": 118402, "epoch": 2819} {"train_loss": -6.523036956787109, "global_step": 118403, "epoch": 2819} {"train_loss": -6.453085422515869, "global_step": 118404, "epoch": 2819} {"train_loss": -6.541243076324463, "global_step": 118405, "epoch": 2819} {"train_loss": -6.578434944152832, "global_step": 118406, "epoch": 2819} {"train_loss": -6.54654598236084, "global_step": 118407, "epoch": 2819} {"train_loss": -6.4940080642700195, "global_step": 118408, "epoch": 2819} {"train_loss": -6.586819171905518, "global_step": 118409, "epoch": 2819} {"train_loss": -6.569250106811523, "global_step": 118410, "epoch": 2819} {"train_loss": -6.53977632522583, "global_step": 118411, "epoch": 2819} {"train_loss": -6.556743621826172, "global_step": 118412, "epoch": 2819} {"train_loss": -6.526064395904541, "global_step": 118413, "epoch": 2819} {"train_loss": -6.567712783813477, "global_step": 118414, "epoch": 2819} {"train_loss": -6.547563552856445, "global_step": 118415, "epoch": 2819} {"train_loss": -6.579842567443848, "global_step": 118416, "epoch": 2819} {"train_loss": -6.536015033721924, "global_step": 118417, "epoch": 2819} {"train_loss": -6.614689350128174, "global_step": 118418, "epoch": 2819} {"train_loss": -6.614711284637451, "global_step": 118419, "epoch": 2819} {"train_loss": -6.44744348526001, "global_step": 118420, "epoch": 2819} {"train_loss": -6.629106521606445, "global_step": 118421, "epoch": 2819} {"train_loss": -6.422060012817383, "global_step": 118422, "epoch": 2819} {"train_loss": -6.430145263671875, "global_step": 118423, "epoch": 2819} {"train_loss": -6.363002300262451, "global_step": 118424, "epoch": 2819} {"train_loss": -6.498701095581055, "global_step": 118425, "epoch": 2819} {"train_loss": -6.3858747482299805, "global_step": 118426, "epoch": 2819} {"train_loss": -6.461405277252197, "global_step": 118427, "epoch": 2819} {"train_loss": -6.48758602142334, "global_step": 118428, "epoch": 2819} {"train_loss": -6.302949905395508, "global_step": 118429, "epoch": 2819} {"train_loss": -6.6240010261535645, "global_step": 118430, "epoch": 2819} {"train_loss": -6.382330894470215, "global_step": 118431, "epoch": 2819} {"train_loss": -6.363638877868652, "global_step": 118432, "epoch": 2819} {"train_loss": -6.514274597167969, "global_step": 118433, "epoch": 2819} {"train_loss": -6.394465446472168, "global_step": 118434, "epoch": 2819} {"train_loss": -6.3852667808532715, "global_step": 118435, "epoch": 2819} {"train_loss": -6.419498443603516, "global_step": 118436, "epoch": 2819} {"train_loss": -6.411464691162109, "global_step": 118437, "epoch": 2819} {"train_loss": -6.531764030456543, "global_step": 118438, "epoch": 2819} {"train_loss": -6.5023550646645685, "global_step": 118439, "epoch": 2819, "val_loss": 65643.6640625} {"train_loss": -6.5963053703308105, "global_step": 118440, "epoch": 2820} {"train_loss": -6.5468645095825195, "global_step": 118441, "epoch": 2820} {"train_loss": -6.566333770751953, "global_step": 118442, "epoch": 2820} {"train_loss": -6.597799301147461, "global_step": 118443, "epoch": 2820} {"train_loss": -6.508580207824707, "global_step": 118444, "epoch": 2820} {"train_loss": -6.479083061218262, "global_step": 118445, "epoch": 2820} {"train_loss": -6.422027587890625, "global_step": 118446, "epoch": 2820} {"train_loss": -6.4989728927612305, "global_step": 118447, "epoch": 2820} {"train_loss": -6.525493621826172, "global_step": 118448, "epoch": 2820} {"train_loss": -6.564301013946533, "global_step": 118449, "epoch": 2820} {"train_loss": -6.725924015045166, "global_step": 118450, "epoch": 2820} {"train_loss": -6.568985462188721, "global_step": 118451, "epoch": 2820} {"train_loss": -6.574990272521973, "global_step": 118452, "epoch": 2820} {"train_loss": -6.5108642578125, "global_step": 118453, "epoch": 2820} {"train_loss": -6.507213115692139, "global_step": 118454, "epoch": 2820} {"train_loss": -6.643990516662598, "global_step": 118455, "epoch": 2820} {"train_loss": -6.638704776763916, "global_step": 118456, "epoch": 2820} {"train_loss": -6.6457624435424805, "global_step": 118457, "epoch": 2820} {"train_loss": -6.573123931884766, "global_step": 118458, "epoch": 2820} {"train_loss": -6.492855072021484, "global_step": 118459, "epoch": 2820} {"train_loss": -6.530643463134766, "global_step": 118460, "epoch": 2820} {"train_loss": -6.543773651123047, "global_step": 118461, "epoch": 2820} {"train_loss": -6.460851669311523, "global_step": 118462, "epoch": 2820} {"train_loss": -6.536375045776367, "global_step": 118463, "epoch": 2820} {"train_loss": -6.441075325012207, "global_step": 118464, "epoch": 2820} {"train_loss": -6.649698734283447, "global_step": 118465, "epoch": 2820} {"train_loss": -6.537105560302734, "global_step": 118466, "epoch": 2820} {"train_loss": -6.390893936157227, "global_step": 118467, "epoch": 2820} {"train_loss": -6.618596076965332, "global_step": 118468, "epoch": 2820} {"train_loss": -6.507819175720215, "global_step": 118469, "epoch": 2820} {"train_loss": -6.576405048370361, "global_step": 118470, "epoch": 2820} {"train_loss": -6.499109268188477, "global_step": 118471, "epoch": 2820} {"train_loss": -6.530447006225586, "global_step": 118472, "epoch": 2820} {"train_loss": -6.690669536590576, "global_step": 118473, "epoch": 2820} {"train_loss": -6.386661529541016, "global_step": 118474, "epoch": 2820} {"train_loss": -6.605983257293701, "global_step": 118475, "epoch": 2820} {"train_loss": -6.554788589477539, "global_step": 118476, "epoch": 2820} {"train_loss": -6.450445175170898, "global_step": 118477, "epoch": 2820} {"train_loss": -6.522188186645508, "global_step": 118478, "epoch": 2820} {"train_loss": -6.4907546043396, "global_step": 118479, "epoch": 2820} {"train_loss": -6.61817741394043, "global_step": 118480, "epoch": 2820} {"train_loss": -6.540758882250104, "global_step": 118481, "epoch": 2820, "val_loss": 65682.421875} {"train_loss": -6.691915512084961, "global_step": 118482, "epoch": 2821} {"train_loss": -6.7196149826049805, "global_step": 118483, "epoch": 2821} {"train_loss": -6.579464435577393, "global_step": 118484, "epoch": 2821} {"train_loss": -6.600836753845215, "global_step": 118485, "epoch": 2821} {"train_loss": -6.563729286193848, "global_step": 118486, "epoch": 2821} {"train_loss": -6.519443035125732, "global_step": 118487, "epoch": 2821} {"train_loss": -6.561549186706543, "global_step": 118488, "epoch": 2821} {"train_loss": -6.441061019897461, "global_step": 118489, "epoch": 2821} {"train_loss": -6.632333755493164, "global_step": 118490, "epoch": 2821} {"train_loss": -6.508334159851074, "global_step": 118491, "epoch": 2821} {"train_loss": -6.558043479919434, "global_step": 118492, "epoch": 2821} {"train_loss": -6.599945545196533, "global_step": 118493, "epoch": 2821} {"train_loss": -6.592439651489258, "global_step": 118494, "epoch": 2821} {"train_loss": -6.537944316864014, "global_step": 118495, "epoch": 2821} {"train_loss": -6.555832386016846, "global_step": 118496, "epoch": 2821} {"train_loss": -6.527768135070801, "global_step": 118497, "epoch": 2821} {"train_loss": -6.576809883117676, "global_step": 118498, "epoch": 2821} {"train_loss": -6.417477607727051, "global_step": 118499, "epoch": 2821} {"train_loss": -6.457477569580078, "global_step": 118500, "epoch": 2821} {"train_loss": -6.497690200805664, "global_step": 118501, "epoch": 2821} {"train_loss": -6.664793968200684, "global_step": 118502, "epoch": 2821} {"train_loss": -6.500917434692383, "global_step": 118503, "epoch": 2821} {"train_loss": -6.442401885986328, "global_step": 118504, "epoch": 2821} {"train_loss": -6.629433631896973, "global_step": 118505, "epoch": 2821} {"train_loss": -6.479994773864746, "global_step": 118506, "epoch": 2821} {"train_loss": -6.363557815551758, "global_step": 118507, "epoch": 2821} {"train_loss": -6.597293853759766, "global_step": 118508, "epoch": 2821} {"train_loss": -6.600531101226807, "global_step": 118509, "epoch": 2821} {"train_loss": -6.389735698699951, "global_step": 118510, "epoch": 2821} {"train_loss": -6.502894401550293, "global_step": 118511, "epoch": 2821} {"train_loss": -6.628681182861328, "global_step": 118512, "epoch": 2821} {"train_loss": -6.446175575256348, "global_step": 118513, "epoch": 2821} {"train_loss": -6.678035736083984, "global_step": 118514, "epoch": 2821} {"train_loss": -6.5863518714904785, "global_step": 118515, "epoch": 2821} {"train_loss": -6.569176197052002, "global_step": 118516, "epoch": 2821} {"train_loss": -6.570427894592285, "global_step": 118517, "epoch": 2821} {"train_loss": -6.535824775695801, "global_step": 118518, "epoch": 2821} {"train_loss": -6.543188095092773, "global_step": 118519, "epoch": 2821} {"train_loss": -6.56957483291626, "global_step": 118520, "epoch": 2821} {"train_loss": -6.558047294616699, "global_step": 118521, "epoch": 2821} {"train_loss": -6.681008815765381, "global_step": 118522, "epoch": 2821} {"train_loss": -6.553206875210717, "global_step": 118523, "epoch": 2821, "val_loss": 65503.4375} {"train_loss": -6.570304870605469, "global_step": 118524, "epoch": 2822} {"train_loss": -6.6441168785095215, "global_step": 118525, "epoch": 2822} {"train_loss": -6.658759117126465, "global_step": 118526, "epoch": 2822} {"train_loss": -6.6096906661987305, "global_step": 118527, "epoch": 2822} {"train_loss": -6.553216934204102, "global_step": 118528, "epoch": 2822} {"train_loss": -6.529704570770264, "global_step": 118529, "epoch": 2822} {"train_loss": -6.472484588623047, "global_step": 118530, "epoch": 2822} {"train_loss": -6.47948694229126, "global_step": 118531, "epoch": 2822} {"train_loss": -6.649197101593018, "global_step": 118532, "epoch": 2822} {"train_loss": -6.444742202758789, "global_step": 118533, "epoch": 2822} {"train_loss": -6.548600673675537, "global_step": 118534, "epoch": 2822} {"train_loss": -6.61151123046875, "global_step": 118535, "epoch": 2822} {"train_loss": -6.618500709533691, "global_step": 118536, "epoch": 2822} {"train_loss": -6.662617206573486, "global_step": 118537, "epoch": 2822} {"train_loss": -6.445518493652344, "global_step": 118538, "epoch": 2822} {"train_loss": -6.7114481925964355, "global_step": 118539, "epoch": 2822} {"train_loss": -6.52702522277832, "global_step": 118540, "epoch": 2822} {"train_loss": -6.502721309661865, "global_step": 118541, "epoch": 2822} {"train_loss": -6.590348243713379, "global_step": 118542, "epoch": 2822} {"train_loss": -6.386014938354492, "global_step": 118543, "epoch": 2822} {"train_loss": -6.4405517578125, "global_step": 118544, "epoch": 2822} {"train_loss": -6.541030406951904, "global_step": 118545, "epoch": 2822} {"train_loss": -6.412944793701172, "global_step": 118546, "epoch": 2822} {"train_loss": -6.445716857910156, "global_step": 118547, "epoch": 2822} {"train_loss": -6.392539978027344, "global_step": 118548, "epoch": 2822} {"train_loss": -6.561794281005859, "global_step": 118549, "epoch": 2822} {"train_loss": -6.614673614501953, "global_step": 118550, "epoch": 2822} {"train_loss": -6.464142322540283, "global_step": 118551, "epoch": 2822} {"train_loss": -6.5864386558532715, "global_step": 118552, "epoch": 2822} {"train_loss": -6.602875232696533, "global_step": 118553, "epoch": 2822} {"train_loss": -6.441410541534424, "global_step": 118554, "epoch": 2822} {"train_loss": -6.5606889724731445, "global_step": 118555, "epoch": 2822} {"train_loss": -6.529593467712402, "global_step": 118556, "epoch": 2822} {"train_loss": -6.571117877960205, "global_step": 118557, "epoch": 2822} {"train_loss": -6.573729991912842, "global_step": 118558, "epoch": 2822} {"train_loss": -6.489529132843018, "global_step": 118559, "epoch": 2822} {"train_loss": -6.600461959838867, "global_step": 118560, "epoch": 2822} {"train_loss": -6.666739463806152, "global_step": 118561, "epoch": 2822} {"train_loss": -6.480216979980469, "global_step": 118562, "epoch": 2822} {"train_loss": -6.543844223022461, "global_step": 118563, "epoch": 2822} {"train_loss": -6.553004264831543, "global_step": 118564, "epoch": 2822} {"train_loss": -6.543079614639282, "global_step": 118565, "epoch": 2822, "val_loss": 65833.6875} {"train_loss": -6.697305679321289, "global_step": 118566, "epoch": 2823} {"train_loss": -6.5285491943359375, "global_step": 118567, "epoch": 2823} {"train_loss": -6.469322681427002, "global_step": 118568, "epoch": 2823} {"train_loss": -6.639252662658691, "global_step": 118569, "epoch": 2823} {"train_loss": -6.553908348083496, "global_step": 118570, "epoch": 2823} {"train_loss": -6.522073268890381, "global_step": 118571, "epoch": 2823} {"train_loss": -6.458563327789307, "global_step": 118572, "epoch": 2823} {"train_loss": -6.560971260070801, "global_step": 118573, "epoch": 2823} {"train_loss": -6.535035133361816, "global_step": 118574, "epoch": 2823} {"train_loss": -6.371173858642578, "global_step": 118575, "epoch": 2823} {"train_loss": -6.508392810821533, "global_step": 118576, "epoch": 2823} {"train_loss": -6.61592960357666, "global_step": 118577, "epoch": 2823} {"train_loss": -6.56492805480957, "global_step": 118578, "epoch": 2823} {"train_loss": -6.484606742858887, "global_step": 118579, "epoch": 2823} {"train_loss": -6.593635559082031, "global_step": 118580, "epoch": 2823} {"train_loss": -6.566987991333008, "global_step": 118581, "epoch": 2823} {"train_loss": -6.410226821899414, "global_step": 118582, "epoch": 2823} {"train_loss": -6.454403400421143, "global_step": 118583, "epoch": 2823} {"train_loss": -6.524443626403809, "global_step": 118584, "epoch": 2823} {"train_loss": -6.422740459442139, "global_step": 118585, "epoch": 2823} {"train_loss": -6.4967851638793945, "global_step": 118586, "epoch": 2823} {"train_loss": -6.5375657081604, "global_step": 118587, "epoch": 2823} {"train_loss": -6.526125907897949, "global_step": 118588, "epoch": 2823} {"train_loss": -6.547876358032227, "global_step": 118589, "epoch": 2823} {"train_loss": -6.395393371582031, "global_step": 118590, "epoch": 2823} {"train_loss": -6.570812225341797, "global_step": 118591, "epoch": 2823} {"train_loss": -6.48786735534668, "global_step": 118592, "epoch": 2823} {"train_loss": -6.4717254638671875, "global_step": 118593, "epoch": 2823} {"train_loss": -6.493314743041992, "global_step": 118594, "epoch": 2823} {"train_loss": -6.425965785980225, "global_step": 118595, "epoch": 2823} {"train_loss": -6.526543140411377, "global_step": 118596, "epoch": 2823} {"train_loss": -6.431247234344482, "global_step": 118597, "epoch": 2823} {"train_loss": -6.478000640869141, "global_step": 118598, "epoch": 2823} {"train_loss": -6.45051383972168, "global_step": 118599, "epoch": 2823} {"train_loss": -6.514458179473877, "global_step": 118600, "epoch": 2823} {"train_loss": -6.485729694366455, "global_step": 118601, "epoch": 2823} {"train_loss": -6.441906452178955, "global_step": 118602, "epoch": 2823} {"train_loss": -6.498600482940674, "global_step": 118603, "epoch": 2823} {"train_loss": -6.3870391845703125, "global_step": 118604, "epoch": 2823} {"train_loss": -6.534280776977539, "global_step": 118605, "epoch": 2823} {"train_loss": -6.557432174682617, "global_step": 118606, "epoch": 2823} {"train_loss": -6.500563031151181, "global_step": 118607, "epoch": 2823, "val_loss": 65790.421875} {"train_loss": -6.575142860412598, "global_step": 118608, "epoch": 2824} {"train_loss": -6.508584976196289, "global_step": 118609, "epoch": 2824} {"train_loss": -6.442874431610107, "global_step": 118610, "epoch": 2824} {"train_loss": -6.5226593017578125, "global_step": 118611, "epoch": 2824} {"train_loss": -6.560724258422852, "global_step": 118612, "epoch": 2824} {"train_loss": -6.347958087921143, "global_step": 118613, "epoch": 2824} {"train_loss": -6.53129243850708, "global_step": 118614, "epoch": 2824} {"train_loss": -6.485895156860352, "global_step": 118615, "epoch": 2824} {"train_loss": -6.482888221740723, "global_step": 118616, "epoch": 2824} {"train_loss": -6.456525802612305, "global_step": 118617, "epoch": 2824} {"train_loss": -6.628776550292969, "global_step": 118618, "epoch": 2824} {"train_loss": -6.436147212982178, "global_step": 118619, "epoch": 2824} {"train_loss": -6.486453056335449, "global_step": 118620, "epoch": 2824} {"train_loss": -6.482253074645996, "global_step": 118621, "epoch": 2824} {"train_loss": -6.375558853149414, "global_step": 118622, "epoch": 2824} {"train_loss": -6.688055992126465, "global_step": 118623, "epoch": 2824} {"train_loss": -6.495181560516357, "global_step": 118624, "epoch": 2824} {"train_loss": -6.436867713928223, "global_step": 118625, "epoch": 2824} {"train_loss": -6.50369119644165, "global_step": 118626, "epoch": 2824} {"train_loss": -6.55324649810791, "global_step": 118627, "epoch": 2824} {"train_loss": -6.523069381713867, "global_step": 118628, "epoch": 2824} {"train_loss": -6.559330940246582, "global_step": 118629, "epoch": 2824} {"train_loss": -6.549337387084961, "global_step": 118630, "epoch": 2824} {"train_loss": -6.653644561767578, "global_step": 118631, "epoch": 2824} {"train_loss": -6.615696907043457, "global_step": 118632, "epoch": 2824} {"train_loss": -6.587076663970947, "global_step": 118633, "epoch": 2824} {"train_loss": -6.6076250076293945, "global_step": 118634, "epoch": 2824} {"train_loss": -6.4994001388549805, "global_step": 118635, "epoch": 2824} {"train_loss": -6.537614822387695, "global_step": 118636, "epoch": 2824} {"train_loss": -6.539742469787598, "global_step": 118637, "epoch": 2824} {"train_loss": -6.550734519958496, "global_step": 118638, "epoch": 2824} {"train_loss": -6.5743536949157715, "global_step": 118639, "epoch": 2824} {"train_loss": -6.486875534057617, "global_step": 118640, "epoch": 2824} {"train_loss": -6.617193698883057, "global_step": 118641, "epoch": 2824} {"train_loss": -6.599003791809082, "global_step": 118642, "epoch": 2824} {"train_loss": -6.592577934265137, "global_step": 118643, "epoch": 2824} {"train_loss": -6.597609519958496, "global_step": 118644, "epoch": 2824} {"train_loss": -6.52999210357666, "global_step": 118645, "epoch": 2824} {"train_loss": -6.527331352233887, "global_step": 118646, "epoch": 2824} {"train_loss": -6.570063591003418, "global_step": 118647, "epoch": 2824} {"train_loss": -6.553628444671631, "global_step": 118648, "epoch": 2824} {"train_loss": -6.536107801255726, "global_step": 118649, "epoch": 2824, "val_loss": 65547.8046875} {"train_loss": -6.639505386352539, "global_step": 118650, "epoch": 2825} {"train_loss": -6.504953384399414, "global_step": 118651, "epoch": 2825} {"train_loss": -6.602704048156738, "global_step": 118652, "epoch": 2825} {"train_loss": -6.532034873962402, "global_step": 118653, "epoch": 2825} {"train_loss": -6.598793983459473, "global_step": 118654, "epoch": 2825} {"train_loss": -6.4707841873168945, "global_step": 118655, "epoch": 2825} {"train_loss": -6.61249303817749, "global_step": 118656, "epoch": 2825} {"train_loss": -6.622525215148926, "global_step": 118657, "epoch": 2825} {"train_loss": -6.572841644287109, "global_step": 118658, "epoch": 2825} {"train_loss": -6.560421943664551, "global_step": 118659, "epoch": 2825} {"train_loss": -6.675821304321289, "global_step": 118660, "epoch": 2825} {"train_loss": -6.651779651641846, "global_step": 118661, "epoch": 2825} {"train_loss": -6.617580413818359, "global_step": 118662, "epoch": 2825} {"train_loss": -6.529727935791016, "global_step": 118663, "epoch": 2825} {"train_loss": -6.601454734802246, "global_step": 118664, "epoch": 2825} {"train_loss": -6.532974720001221, "global_step": 118665, "epoch": 2825} {"train_loss": -6.600687503814697, "global_step": 118666, "epoch": 2825} {"train_loss": -6.706467628479004, "global_step": 118667, "epoch": 2825} {"train_loss": -6.639376163482666, "global_step": 118668, "epoch": 2825} {"train_loss": -6.711338996887207, "global_step": 118669, "epoch": 2825} {"train_loss": -6.619350433349609, "global_step": 118670, "epoch": 2825} {"train_loss": -6.720200538635254, "global_step": 118671, "epoch": 2825} {"train_loss": -6.630088806152344, "global_step": 118672, "epoch": 2825} {"train_loss": -6.630274295806885, "global_step": 118673, "epoch": 2825} {"train_loss": -6.648365020751953, "global_step": 118674, "epoch": 2825} {"train_loss": -6.6665568351745605, "global_step": 118675, "epoch": 2825} {"train_loss": -6.455813407897949, "global_step": 118676, "epoch": 2825} {"train_loss": -6.692890167236328, "global_step": 118677, "epoch": 2825} {"train_loss": -6.627878189086914, "global_step": 118678, "epoch": 2825} {"train_loss": -6.47133731842041, "global_step": 118679, "epoch": 2825} {"train_loss": -6.530214786529541, "global_step": 118680, "epoch": 2825} {"train_loss": -6.516689300537109, "global_step": 118681, "epoch": 2825} {"train_loss": -6.529015064239502, "global_step": 118682, "epoch": 2825} {"train_loss": -6.577800750732422, "global_step": 118683, "epoch": 2825} {"train_loss": -6.583103179931641, "global_step": 118684, "epoch": 2825} {"train_loss": -6.594949245452881, "global_step": 118685, "epoch": 2825} {"train_loss": -6.590435028076172, "global_step": 118686, "epoch": 2825} {"train_loss": -6.634678840637207, "global_step": 118687, "epoch": 2825} {"train_loss": -6.575663089752197, "global_step": 118688, "epoch": 2825} {"train_loss": -6.677075386047363, "global_step": 118689, "epoch": 2825} {"train_loss": -6.628410339355469, "global_step": 118690, "epoch": 2825} {"train_loss": -6.598005238033476, "global_step": 118691, "epoch": 2825, "val_loss": 65683.0078125} {"train_loss": -6.587452411651611, "global_step": 118692, "epoch": 2826} {"train_loss": -6.584254264831543, "global_step": 118693, "epoch": 2826} {"train_loss": -6.51354455947876, "global_step": 118694, "epoch": 2826} {"train_loss": -6.630801677703857, "global_step": 118695, "epoch": 2826} {"train_loss": -6.5105204582214355, "global_step": 118696, "epoch": 2826} {"train_loss": -6.39980411529541, "global_step": 118697, "epoch": 2826} {"train_loss": -6.558427333831787, "global_step": 118698, "epoch": 2826} {"train_loss": -6.526093006134033, "global_step": 118699, "epoch": 2826} {"train_loss": -6.49757194519043, "global_step": 118700, "epoch": 2826} {"train_loss": -6.573508262634277, "global_step": 118701, "epoch": 2826} {"train_loss": -6.5305681228637695, "global_step": 118702, "epoch": 2826} {"train_loss": -6.530600547790527, "global_step": 118703, "epoch": 2826} {"train_loss": -6.556032180786133, "global_step": 118704, "epoch": 2826} {"train_loss": -6.590307235717773, "global_step": 118705, "epoch": 2826} {"train_loss": -6.404273986816406, "global_step": 118706, "epoch": 2826} {"train_loss": -6.559384822845459, "global_step": 118707, "epoch": 2826} {"train_loss": -6.477941036224365, "global_step": 118708, "epoch": 2826} {"train_loss": -6.607401371002197, "global_step": 118709, "epoch": 2826} {"train_loss": -6.503026962280273, "global_step": 118710, "epoch": 2826} {"train_loss": -6.630882263183594, "global_step": 118711, "epoch": 2826} {"train_loss": -6.554482460021973, "global_step": 118712, "epoch": 2826} {"train_loss": -6.541729927062988, "global_step": 118713, "epoch": 2826} {"train_loss": -6.53409481048584, "global_step": 118714, "epoch": 2826} {"train_loss": -6.615434646606445, "global_step": 118715, "epoch": 2826} {"train_loss": -6.512063026428223, "global_step": 118716, "epoch": 2826} {"train_loss": -6.528890609741211, "global_step": 118717, "epoch": 2826} {"train_loss": -6.5652055740356445, "global_step": 118718, "epoch": 2826} {"train_loss": -6.435788154602051, "global_step": 118719, "epoch": 2826} {"train_loss": -6.565654277801514, "global_step": 118720, "epoch": 2826} {"train_loss": -6.563309669494629, "global_step": 118721, "epoch": 2826} {"train_loss": -6.499741554260254, "global_step": 118722, "epoch": 2826} {"train_loss": -6.389930725097656, "global_step": 118723, "epoch": 2826} {"train_loss": -6.557168006896973, "global_step": 118724, "epoch": 2826} {"train_loss": -6.645570278167725, "global_step": 118725, "epoch": 2826} {"train_loss": -6.582413673400879, "global_step": 118726, "epoch": 2826} {"train_loss": -6.48710823059082, "global_step": 118727, "epoch": 2826} {"train_loss": -6.530065536499023, "global_step": 118728, "epoch": 2826} {"train_loss": -6.538104057312012, "global_step": 118729, "epoch": 2826} {"train_loss": -6.615449905395508, "global_step": 118730, "epoch": 2826} {"train_loss": -6.543449401855469, "global_step": 118731, "epoch": 2826} {"train_loss": -6.562730312347412, "global_step": 118732, "epoch": 2826} {"train_loss": -6.542346545628139, "global_step": 118733, "epoch": 2826, "val_loss": 65751.9453125} {"train_loss": -6.539750576019287, "global_step": 118734, "epoch": 2827} {"train_loss": -6.6011881828308105, "global_step": 118735, "epoch": 2827} {"train_loss": -6.727224349975586, "global_step": 118736, "epoch": 2827} {"train_loss": -6.593134880065918, "global_step": 118737, "epoch": 2827} {"train_loss": -6.559277534484863, "global_step": 118738, "epoch": 2827} {"train_loss": -6.565474987030029, "global_step": 118739, "epoch": 2827} {"train_loss": -6.716358184814453, "global_step": 118740, "epoch": 2827} {"train_loss": -6.556443214416504, "global_step": 118741, "epoch": 2827} {"train_loss": -6.589913368225098, "global_step": 118742, "epoch": 2827} {"train_loss": -6.624399662017822, "global_step": 118743, "epoch": 2827} {"train_loss": -6.625411033630371, "global_step": 118744, "epoch": 2827} {"train_loss": -6.554862022399902, "global_step": 118745, "epoch": 2827} {"train_loss": -6.4524993896484375, "global_step": 118746, "epoch": 2827} {"train_loss": -6.50740909576416, "global_step": 118747, "epoch": 2827} {"train_loss": -6.550946235656738, "global_step": 118748, "epoch": 2827} {"train_loss": -6.54400634765625, "global_step": 118749, "epoch": 2827} {"train_loss": -6.531274795532227, "global_step": 118750, "epoch": 2827} {"train_loss": -6.603542327880859, "global_step": 118751, "epoch": 2827} {"train_loss": -6.544733047485352, "global_step": 118752, "epoch": 2827} {"train_loss": -6.605366230010986, "global_step": 118753, "epoch": 2827} {"train_loss": -6.611705780029297, "global_step": 118754, "epoch": 2827} {"train_loss": -6.564568519592285, "global_step": 118755, "epoch": 2827} {"train_loss": -6.600829124450684, "global_step": 118756, "epoch": 2827} {"train_loss": -6.6406474113464355, "global_step": 118757, "epoch": 2827} {"train_loss": -6.553463935852051, "global_step": 118758, "epoch": 2827} {"train_loss": -6.6869988441467285, "global_step": 118759, "epoch": 2827} {"train_loss": -6.49559211730957, "global_step": 118760, "epoch": 2827} {"train_loss": -6.593402862548828, "global_step": 118761, "epoch": 2827} {"train_loss": -6.592888832092285, "global_step": 118762, "epoch": 2827} {"train_loss": -6.61415433883667, "global_step": 118763, "epoch": 2827} {"train_loss": -6.657552242279053, "global_step": 118764, "epoch": 2827} {"train_loss": -6.513113975524902, "global_step": 118765, "epoch": 2827} {"train_loss": -6.659196853637695, "global_step": 118766, "epoch": 2827} {"train_loss": -6.654557228088379, "global_step": 118767, "epoch": 2827} {"train_loss": -6.507647514343262, "global_step": 118768, "epoch": 2827} {"train_loss": -6.522095680236816, "global_step": 118769, "epoch": 2827} {"train_loss": -6.483673095703125, "global_step": 118770, "epoch": 2827} {"train_loss": -6.431678771972656, "global_step": 118771, "epoch": 2827} {"train_loss": -6.532472610473633, "global_step": 118772, "epoch": 2827} {"train_loss": -6.211460113525391, "global_step": 118773, "epoch": 2827} {"train_loss": -6.278041839599609, "global_step": 118774, "epoch": 2827} {"train_loss": -6.555391084580195, "global_step": 118775, "epoch": 2827, "val_loss": 66266.4609375} {"train_loss": -6.267399311065674, "global_step": 118776, "epoch": 2828} {"train_loss": -6.445743083953857, "global_step": 118777, "epoch": 2828} {"train_loss": -6.33383846282959, "global_step": 118778, "epoch": 2828} {"train_loss": -6.3431806564331055, "global_step": 118779, "epoch": 2828} {"train_loss": -6.340611457824707, "global_step": 118780, "epoch": 2828} {"train_loss": -6.375155448913574, "global_step": 118781, "epoch": 2828} {"train_loss": -6.192412376403809, "global_step": 118782, "epoch": 2828} {"train_loss": -6.444440841674805, "global_step": 118783, "epoch": 2828} {"train_loss": -6.32289457321167, "global_step": 118784, "epoch": 2828} {"train_loss": -6.466169357299805, "global_step": 118785, "epoch": 2828} {"train_loss": -6.36244010925293, "global_step": 118786, "epoch": 2828} {"train_loss": -6.442401885986328, "global_step": 118787, "epoch": 2828} {"train_loss": -6.4851837158203125, "global_step": 118788, "epoch": 2828} {"train_loss": -6.565435886383057, "global_step": 118789, "epoch": 2828} {"train_loss": -6.453938961029053, "global_step": 118790, "epoch": 2828} {"train_loss": -6.557552814483643, "global_step": 118791, "epoch": 2828} {"train_loss": -6.389354705810547, "global_step": 118792, "epoch": 2828} {"train_loss": -6.560215473175049, "global_step": 118793, "epoch": 2828} {"train_loss": -6.354382514953613, "global_step": 118794, "epoch": 2828} {"train_loss": -6.533074855804443, "global_step": 118795, "epoch": 2828} {"train_loss": -6.428220748901367, "global_step": 118796, "epoch": 2828} {"train_loss": -6.549126625061035, "global_step": 118797, "epoch": 2828} {"train_loss": -6.510746002197266, "global_step": 118798, "epoch": 2828} {"train_loss": -6.565160751342773, "global_step": 118799, "epoch": 2828} {"train_loss": -6.469675064086914, "global_step": 118800, "epoch": 2828} {"train_loss": -6.544989585876465, "global_step": 118801, "epoch": 2828} {"train_loss": -6.452756881713867, "global_step": 118802, "epoch": 2828} {"train_loss": -6.566287517547607, "global_step": 118803, "epoch": 2828} {"train_loss": -6.6352057456970215, "global_step": 118804, "epoch": 2828} {"train_loss": -6.5425825119018555, "global_step": 118805, "epoch": 2828} {"train_loss": -6.555027961730957, "global_step": 118806, "epoch": 2828} {"train_loss": -6.596842288970947, "global_step": 118807, "epoch": 2828} {"train_loss": -6.618521690368652, "global_step": 118808, "epoch": 2828} {"train_loss": -6.5667724609375, "global_step": 118809, "epoch": 2828} {"train_loss": -6.34429931640625, "global_step": 118810, "epoch": 2828} {"train_loss": -6.6446027755737305, "global_step": 118811, "epoch": 2828} {"train_loss": -6.6620941162109375, "global_step": 118812, "epoch": 2828} {"train_loss": -6.446610450744629, "global_step": 118813, "epoch": 2828} {"train_loss": -6.582671165466309, "global_step": 118814, "epoch": 2828} {"train_loss": -6.544586181640625, "global_step": 118815, "epoch": 2828} {"train_loss": -6.5790696144104, "global_step": 118816, "epoch": 2828} {"train_loss": -6.477804445085072, "global_step": 118817, "epoch": 2828, "val_loss": 65604.1875} {"train_loss": -6.556697845458984, "global_step": 118818, "epoch": 2829} {"train_loss": -6.655794620513916, "global_step": 118819, "epoch": 2829} {"train_loss": -6.673892021179199, "global_step": 118820, "epoch": 2829} {"train_loss": -6.635533809661865, "global_step": 118821, "epoch": 2829} {"train_loss": -6.591007232666016, "global_step": 118822, "epoch": 2829} {"train_loss": -6.584416389465332, "global_step": 118823, "epoch": 2829} {"train_loss": -6.584471702575684, "global_step": 118824, "epoch": 2829} {"train_loss": -6.587205410003662, "global_step": 118825, "epoch": 2829} {"train_loss": -6.59836483001709, "global_step": 118826, "epoch": 2829} {"train_loss": -6.481542110443115, "global_step": 118827, "epoch": 2829} {"train_loss": -6.636938095092773, "global_step": 118828, "epoch": 2829} {"train_loss": -6.593698501586914, "global_step": 118829, "epoch": 2829} {"train_loss": -6.665648937225342, "global_step": 118830, "epoch": 2829} {"train_loss": -6.638523578643799, "global_step": 118831, "epoch": 2829} {"train_loss": -6.536202430725098, "global_step": 118832, "epoch": 2829} {"train_loss": -6.468246936798096, "global_step": 118833, "epoch": 2829} {"train_loss": -6.530911445617676, "global_step": 118834, "epoch": 2829} {"train_loss": -6.663086891174316, "global_step": 118835, "epoch": 2829} {"train_loss": -6.6623759269714355, "global_step": 118836, "epoch": 2829} {"train_loss": -6.507302761077881, "global_step": 118837, "epoch": 2829} {"train_loss": -6.690119743347168, "global_step": 118838, "epoch": 2829} {"train_loss": -6.503698825836182, "global_step": 118839, "epoch": 2829} {"train_loss": -6.553995132446289, "global_step": 118840, "epoch": 2829} {"train_loss": -6.6153364181518555, "global_step": 118841, "epoch": 2829} {"train_loss": -6.529253959655762, "global_step": 118842, "epoch": 2829} {"train_loss": -6.587662696838379, "global_step": 118843, "epoch": 2829} {"train_loss": -6.456517219543457, "global_step": 118844, "epoch": 2829} {"train_loss": -6.499444961547852, "global_step": 118845, "epoch": 2829} {"train_loss": -6.36873722076416, "global_step": 118846, "epoch": 2829} {"train_loss": -6.600245475769043, "global_step": 118847, "epoch": 2829} {"train_loss": -6.6786627769470215, "global_step": 118848, "epoch": 2829} {"train_loss": -6.533633232116699, "global_step": 118849, "epoch": 2829} {"train_loss": -6.568572998046875, "global_step": 118850, "epoch": 2829} {"train_loss": -6.556396484375, "global_step": 118851, "epoch": 2829} {"train_loss": -6.664327621459961, "global_step": 118852, "epoch": 2829} {"train_loss": -6.417181968688965, "global_step": 118853, "epoch": 2829} {"train_loss": -6.458655834197998, "global_step": 118854, "epoch": 2829} {"train_loss": -6.485611438751221, "global_step": 118855, "epoch": 2829} {"train_loss": -6.538554668426514, "global_step": 118856, "epoch": 2829} {"train_loss": -6.414525985717773, "global_step": 118857, "epoch": 2829} {"train_loss": -6.417483329772949, "global_step": 118858, "epoch": 2829} {"train_loss": -6.5607046740395685, "global_step": 118859, "epoch": 2829, "val_loss": 65564.921875} {"train_loss": -6.505197525024414, "global_step": 118860, "epoch": 2830} {"train_loss": -6.569253921508789, "global_step": 118861, "epoch": 2830} {"train_loss": -6.639289855957031, "global_step": 118862, "epoch": 2830} {"train_loss": -6.489081382751465, "global_step": 118863, "epoch": 2830} {"train_loss": -6.520411491394043, "global_step": 118864, "epoch": 2830} {"train_loss": -6.572451591491699, "global_step": 118865, "epoch": 2830} {"train_loss": -6.641803741455078, "global_step": 118866, "epoch": 2830} {"train_loss": -6.452032566070557, "global_step": 118867, "epoch": 2830} {"train_loss": -6.436891078948975, "global_step": 118868, "epoch": 2830} {"train_loss": -6.572108268737793, "global_step": 118869, "epoch": 2830} {"train_loss": -6.513993263244629, "global_step": 118870, "epoch": 2830} {"train_loss": -6.628537178039551, "global_step": 118871, "epoch": 2830} {"train_loss": -6.561217784881592, "global_step": 118872, "epoch": 2830} {"train_loss": -6.478170871734619, "global_step": 118873, "epoch": 2830} {"train_loss": -6.6349310874938965, "global_step": 118874, "epoch": 2830} {"train_loss": -6.619661808013916, "global_step": 118875, "epoch": 2830} {"train_loss": -6.607614040374756, "global_step": 118876, "epoch": 2830} {"train_loss": -6.49530553817749, "global_step": 118877, "epoch": 2830} {"train_loss": -6.608164310455322, "global_step": 118878, "epoch": 2830} {"train_loss": -6.59694766998291, "global_step": 118879, "epoch": 2830} {"train_loss": -6.641407012939453, "global_step": 118880, "epoch": 2830} {"train_loss": -6.5317864418029785, "global_step": 118881, "epoch": 2830} {"train_loss": -6.488922119140625, "global_step": 118882, "epoch": 2830} {"train_loss": -6.588459014892578, "global_step": 118883, "epoch": 2830} {"train_loss": -6.4839606285095215, "global_step": 118884, "epoch": 2830} {"train_loss": -6.6638898849487305, "global_step": 118885, "epoch": 2830} {"train_loss": -6.5258917808532715, "global_step": 118886, "epoch": 2830} {"train_loss": -6.615297317504883, "global_step": 118887, "epoch": 2830} {"train_loss": -6.612198829650879, "global_step": 118888, "epoch": 2830} {"train_loss": -6.558884620666504, "global_step": 118889, "epoch": 2830} {"train_loss": -6.553329944610596, "global_step": 118890, "epoch": 2830} {"train_loss": -6.621515274047852, "global_step": 118891, "epoch": 2830} {"train_loss": -6.638838768005371, "global_step": 118892, "epoch": 2830} {"train_loss": -6.444929599761963, "global_step": 118893, "epoch": 2830} {"train_loss": -6.500415325164795, "global_step": 118894, "epoch": 2830} {"train_loss": -6.4867377281188965, "global_step": 118895, "epoch": 2830} {"train_loss": -6.557104587554932, "global_step": 118896, "epoch": 2830} {"train_loss": -6.475019454956055, "global_step": 118897, "epoch": 2830} {"train_loss": -6.55747127532959, "global_step": 118898, "epoch": 2830} {"train_loss": -6.489017009735107, "global_step": 118899, "epoch": 2830} {"train_loss": -6.540829658508301, "global_step": 118900, "epoch": 2830} {"train_loss": -6.552811054956345, "global_step": 118901, "epoch": 2830, "val_loss": 65432.140625} {"train_loss": -6.6693315505981445, "global_step": 118902, "epoch": 2831} {"train_loss": -6.599322319030762, "global_step": 118903, "epoch": 2831} {"train_loss": -6.569363594055176, "global_step": 118904, "epoch": 2831} {"train_loss": -6.5904340744018555, "global_step": 118905, "epoch": 2831} {"train_loss": -6.620631217956543, "global_step": 118906, "epoch": 2831} {"train_loss": -6.633446216583252, "global_step": 118907, "epoch": 2831} {"train_loss": -6.569218158721924, "global_step": 118908, "epoch": 2831} {"train_loss": -6.538495063781738, "global_step": 118909, "epoch": 2831} {"train_loss": -6.4788818359375, "global_step": 118910, "epoch": 2831} {"train_loss": -6.667179107666016, "global_step": 118911, "epoch": 2831} {"train_loss": -6.635918140411377, "global_step": 118912, "epoch": 2831} {"train_loss": -6.516663551330566, "global_step": 118913, "epoch": 2831} {"train_loss": -6.601624488830566, "global_step": 118914, "epoch": 2831} {"train_loss": -6.631906509399414, "global_step": 118915, "epoch": 2831} {"train_loss": -6.5137152671813965, "global_step": 118916, "epoch": 2831} {"train_loss": -6.488222122192383, "global_step": 118917, "epoch": 2831} {"train_loss": -6.594407558441162, "global_step": 118918, "epoch": 2831} {"train_loss": -6.537616729736328, "global_step": 118919, "epoch": 2831} {"train_loss": -6.530447006225586, "global_step": 118920, "epoch": 2831} {"train_loss": -6.581952095031738, "global_step": 118921, "epoch": 2831} {"train_loss": -6.535805702209473, "global_step": 118922, "epoch": 2831} {"train_loss": -6.637119293212891, "global_step": 118923, "epoch": 2831} {"train_loss": -6.645380020141602, "global_step": 118924, "epoch": 2831} {"train_loss": -6.4388837814331055, "global_step": 118925, "epoch": 2831} {"train_loss": -6.598401069641113, "global_step": 118926, "epoch": 2831} {"train_loss": -6.454562664031982, "global_step": 118927, "epoch": 2831} {"train_loss": -6.604567527770996, "global_step": 118928, "epoch": 2831} {"train_loss": -6.615135192871094, "global_step": 118929, "epoch": 2831} {"train_loss": -6.5293121337890625, "global_step": 118930, "epoch": 2831} {"train_loss": -6.476046085357666, "global_step": 118931, "epoch": 2831} {"train_loss": -6.589117050170898, "global_step": 118932, "epoch": 2831} {"train_loss": -6.557715892791748, "global_step": 118933, "epoch": 2831} {"train_loss": -6.515646457672119, "global_step": 118934, "epoch": 2831} {"train_loss": -6.542820453643799, "global_step": 118935, "epoch": 2831} {"train_loss": -6.5823974609375, "global_step": 118936, "epoch": 2831} {"train_loss": -6.639449596405029, "global_step": 118937, "epoch": 2831} {"train_loss": -6.516695976257324, "global_step": 118938, "epoch": 2831} {"train_loss": -6.566657066345215, "global_step": 118939, "epoch": 2831} {"train_loss": -6.648311614990234, "global_step": 118940, "epoch": 2831} {"train_loss": -6.568137168884277, "global_step": 118941, "epoch": 2831} {"train_loss": -6.685441017150879, "global_step": 118942, "epoch": 2831} {"train_loss": -6.575677565165928, "global_step": 118943, "epoch": 2831, "val_loss": 65640.015625} {"train_loss": -6.647928237915039, "global_step": 118944, "epoch": 2832} {"train_loss": -6.550374984741211, "global_step": 118945, "epoch": 2832} {"train_loss": -6.489221572875977, "global_step": 118946, "epoch": 2832} {"train_loss": -6.609601020812988, "global_step": 118947, "epoch": 2832} {"train_loss": -6.620671272277832, "global_step": 118948, "epoch": 2832} {"train_loss": -6.439719200134277, "global_step": 118949, "epoch": 2832} {"train_loss": -6.632352352142334, "global_step": 118950, "epoch": 2832} {"train_loss": -6.542218208312988, "global_step": 118951, "epoch": 2832} {"train_loss": -6.579543113708496, "global_step": 118952, "epoch": 2832} {"train_loss": -6.501996994018555, "global_step": 118953, "epoch": 2832} {"train_loss": -6.614914894104004, "global_step": 118954, "epoch": 2832} {"train_loss": -6.596238136291504, "global_step": 118955, "epoch": 2832} {"train_loss": -6.658397674560547, "global_step": 118956, "epoch": 2832} {"train_loss": -6.641357421875, "global_step": 118957, "epoch": 2832} {"train_loss": -6.4955830574035645, "global_step": 118958, "epoch": 2832} {"train_loss": -6.595586776733398, "global_step": 118959, "epoch": 2832} {"train_loss": -6.460914611816406, "global_step": 118960, "epoch": 2832} {"train_loss": -6.49057674407959, "global_step": 118961, "epoch": 2832} {"train_loss": -6.545838356018066, "global_step": 118962, "epoch": 2832} {"train_loss": -6.540088653564453, "global_step": 118963, "epoch": 2832} {"train_loss": -6.521073341369629, "global_step": 118964, "epoch": 2832} {"train_loss": -6.485936641693115, "global_step": 118965, "epoch": 2832} {"train_loss": -6.478989124298096, "global_step": 118966, "epoch": 2832} {"train_loss": -6.480520725250244, "global_step": 118967, "epoch": 2832} {"train_loss": -6.6064958572387695, "global_step": 118968, "epoch": 2832} {"train_loss": -6.515404224395752, "global_step": 118969, "epoch": 2832} {"train_loss": -6.573441505432129, "global_step": 118970, "epoch": 2832} {"train_loss": -6.5584397315979, "global_step": 118971, "epoch": 2832} {"train_loss": -6.4760589599609375, "global_step": 118972, "epoch": 2832} {"train_loss": -6.616924285888672, "global_step": 118973, "epoch": 2832} {"train_loss": -6.581048011779785, "global_step": 118974, "epoch": 2832} {"train_loss": -6.559298515319824, "global_step": 118975, "epoch": 2832} {"train_loss": -6.5804548263549805, "global_step": 118976, "epoch": 2832} {"train_loss": -6.551039695739746, "global_step": 118977, "epoch": 2832} {"train_loss": -6.5789031982421875, "global_step": 118978, "epoch": 2832} {"train_loss": -6.593764305114746, "global_step": 118979, "epoch": 2832} {"train_loss": -6.610649108886719, "global_step": 118980, "epoch": 2832} {"train_loss": -6.501593589782715, "global_step": 118981, "epoch": 2832} {"train_loss": -6.536701202392578, "global_step": 118982, "epoch": 2832} {"train_loss": -6.598111152648926, "global_step": 118983, "epoch": 2832} {"train_loss": -6.562868118286133, "global_step": 118984, "epoch": 2832} {"train_loss": -6.55719146274385, "global_step": 118985, "epoch": 2832, "val_loss": 65712.6875} {"train_loss": -6.663025379180908, "global_step": 118986, "epoch": 2833} {"train_loss": -6.647958755493164, "global_step": 118987, "epoch": 2833} {"train_loss": -6.651027679443359, "global_step": 118988, "epoch": 2833} {"train_loss": -6.622377395629883, "global_step": 118989, "epoch": 2833} {"train_loss": -6.514662742614746, "global_step": 118990, "epoch": 2833} {"train_loss": -6.54912805557251, "global_step": 118991, "epoch": 2833} {"train_loss": -6.564923286437988, "global_step": 118992, "epoch": 2833} {"train_loss": -6.620325088500977, "global_step": 118993, "epoch": 2833} {"train_loss": -6.559226036071777, "global_step": 118994, "epoch": 2833} {"train_loss": -6.54877233505249, "global_step": 118995, "epoch": 2833} {"train_loss": -6.498415470123291, "global_step": 118996, "epoch": 2833} {"train_loss": -6.4433112144470215, "global_step": 118997, "epoch": 2833} {"train_loss": -6.607329845428467, "global_step": 118998, "epoch": 2833} {"train_loss": -6.532858848571777, "global_step": 118999, "epoch": 2833} {"train_loss": -6.577157497406006, "global_step": 119000, "epoch": 2833} {"train_loss": -6.693159103393555, "global_step": 119001, "epoch": 2833} {"train_loss": -6.440129280090332, "global_step": 119002, "epoch": 2833} {"train_loss": -6.537834167480469, "global_step": 119003, "epoch": 2833} {"train_loss": -6.527249336242676, "global_step": 119004, "epoch": 2833} {"train_loss": -6.547174453735352, "global_step": 119005, "epoch": 2833} {"train_loss": -6.629971504211426, "global_step": 119006, "epoch": 2833} {"train_loss": -6.4080047607421875, "global_step": 119007, "epoch": 2833} {"train_loss": -6.623568058013916, "global_step": 119008, "epoch": 2833} {"train_loss": -6.511041641235352, "global_step": 119009, "epoch": 2833} {"train_loss": -6.472737789154053, "global_step": 119010, "epoch": 2833} {"train_loss": -6.644607067108154, "global_step": 119011, "epoch": 2833} {"train_loss": -6.469515323638916, "global_step": 119012, "epoch": 2833} {"train_loss": -6.535750389099121, "global_step": 119013, "epoch": 2833} {"train_loss": -6.551336288452148, "global_step": 119014, "epoch": 2833} {"train_loss": -6.47335147857666, "global_step": 119015, "epoch": 2833} {"train_loss": -6.464350700378418, "global_step": 119016, "epoch": 2833} {"train_loss": -6.52537202835083, "global_step": 119017, "epoch": 2833} {"train_loss": -6.5958476066589355, "global_step": 119018, "epoch": 2833} {"train_loss": -6.580230712890625, "global_step": 119019, "epoch": 2833} {"train_loss": -6.558297157287598, "global_step": 119020, "epoch": 2833} {"train_loss": -6.550107002258301, "global_step": 119021, "epoch": 2833} {"train_loss": -6.369170188903809, "global_step": 119022, "epoch": 2833} {"train_loss": -6.57255744934082, "global_step": 119023, "epoch": 2833} {"train_loss": -6.519783973693848, "global_step": 119024, "epoch": 2833} {"train_loss": -6.530383110046387, "global_step": 119025, "epoch": 2833} {"train_loss": -6.548008918762207, "global_step": 119026, "epoch": 2833} {"train_loss": -6.545809609549386, "global_step": 119027, "epoch": 2833, "val_loss": 65583.609375} {"train_loss": -6.413199424743652, "global_step": 119028, "epoch": 2834} {"train_loss": -6.468662261962891, "global_step": 119029, "epoch": 2834} {"train_loss": -6.533607482910156, "global_step": 119030, "epoch": 2834} {"train_loss": -6.580672264099121, "global_step": 119031, "epoch": 2834} {"train_loss": -6.612297534942627, "global_step": 119032, "epoch": 2834} {"train_loss": -6.559965133666992, "global_step": 119033, "epoch": 2834} {"train_loss": -6.477817058563232, "global_step": 119034, "epoch": 2834} {"train_loss": -6.557135581970215, "global_step": 119035, "epoch": 2834} {"train_loss": -6.551405429840088, "global_step": 119036, "epoch": 2834} {"train_loss": -6.514414310455322, "global_step": 119037, "epoch": 2834} {"train_loss": -6.635232448577881, "global_step": 119038, "epoch": 2834} {"train_loss": -6.5432233810424805, "global_step": 119039, "epoch": 2834} {"train_loss": -6.506030559539795, "global_step": 119040, "epoch": 2834} {"train_loss": -6.564794540405273, "global_step": 119041, "epoch": 2834} {"train_loss": -6.52144193649292, "global_step": 119042, "epoch": 2834} {"train_loss": -6.5950236320495605, "global_step": 119043, "epoch": 2834} {"train_loss": -6.490352153778076, "global_step": 119044, "epoch": 2834} {"train_loss": -6.507597923278809, "global_step": 119045, "epoch": 2834} {"train_loss": -6.573700904846191, "global_step": 119046, "epoch": 2834} {"train_loss": -6.635801315307617, "global_step": 119047, "epoch": 2834} {"train_loss": -6.662173271179199, "global_step": 119048, "epoch": 2834} {"train_loss": -6.599854469299316, "global_step": 119049, "epoch": 2834} {"train_loss": -6.547439098358154, "global_step": 119050, "epoch": 2834} {"train_loss": -6.536043167114258, "global_step": 119051, "epoch": 2834} {"train_loss": -6.614946365356445, "global_step": 119052, "epoch": 2834} {"train_loss": -6.592629432678223, "global_step": 119053, "epoch": 2834} {"train_loss": -6.6120100021362305, "global_step": 119054, "epoch": 2834} {"train_loss": -6.65726900100708, "global_step": 119055, "epoch": 2834} {"train_loss": -6.6201066970825195, "global_step": 119056, "epoch": 2834} {"train_loss": -6.575839042663574, "global_step": 119057, "epoch": 2834} {"train_loss": -6.506892204284668, "global_step": 119058, "epoch": 2834} {"train_loss": -6.614678382873535, "global_step": 119059, "epoch": 2834} {"train_loss": -6.5709028244018555, "global_step": 119060, "epoch": 2834} {"train_loss": -6.472693920135498, "global_step": 119061, "epoch": 2834} {"train_loss": -6.604101657867432, "global_step": 119062, "epoch": 2834} {"train_loss": -6.509380340576172, "global_step": 119063, "epoch": 2834} {"train_loss": -6.596720218658447, "global_step": 119064, "epoch": 2834} {"train_loss": -6.644894123077393, "global_step": 119065, "epoch": 2834} {"train_loss": -6.405849456787109, "global_step": 119066, "epoch": 2834} {"train_loss": -6.591073036193848, "global_step": 119067, "epoch": 2834} {"train_loss": -6.565646171569824, "global_step": 119068, "epoch": 2834} {"train_loss": -6.559525228682018, "global_step": 119069, "epoch": 2834, "val_loss": 65644.3125} {"train_loss": -6.657395362854004, "global_step": 119070, "epoch": 2835} {"train_loss": -6.685495853424072, "global_step": 119071, "epoch": 2835} {"train_loss": -6.511759281158447, "global_step": 119072, "epoch": 2835} {"train_loss": -6.678023338317871, "global_step": 119073, "epoch": 2835} {"train_loss": -6.5893049240112305, "global_step": 119074, "epoch": 2835} {"train_loss": -6.6665544509887695, "global_step": 119075, "epoch": 2835} {"train_loss": -6.58756160736084, "global_step": 119076, "epoch": 2835} {"train_loss": -6.586681842803955, "global_step": 119077, "epoch": 2835} {"train_loss": -6.53364372253418, "global_step": 119078, "epoch": 2835} {"train_loss": -6.543569564819336, "global_step": 119079, "epoch": 2835} {"train_loss": -6.617358207702637, "global_step": 119080, "epoch": 2835} {"train_loss": -6.519132614135742, "global_step": 119081, "epoch": 2835} {"train_loss": -6.691741943359375, "global_step": 119082, "epoch": 2835} {"train_loss": -6.52436637878418, "global_step": 119083, "epoch": 2835} {"train_loss": -6.566826820373535, "global_step": 119084, "epoch": 2835} {"train_loss": -6.630504131317139, "global_step": 119085, "epoch": 2835} {"train_loss": -6.63857364654541, "global_step": 119086, "epoch": 2835} {"train_loss": -6.477309226989746, "global_step": 119087, "epoch": 2835} {"train_loss": -6.687047958374023, "global_step": 119088, "epoch": 2835} {"train_loss": -6.6303558349609375, "global_step": 119089, "epoch": 2835} {"train_loss": -6.666718006134033, "global_step": 119090, "epoch": 2835} {"train_loss": -6.531169891357422, "global_step": 119091, "epoch": 2835} {"train_loss": -6.648859977722168, "global_step": 119092, "epoch": 2835} {"train_loss": -6.491066932678223, "global_step": 119093, "epoch": 2835} {"train_loss": -6.410467147827148, "global_step": 119094, "epoch": 2835} {"train_loss": -6.580865859985352, "global_step": 119095, "epoch": 2835} {"train_loss": -6.5935211181640625, "global_step": 119096, "epoch": 2835} {"train_loss": -6.516326904296875, "global_step": 119097, "epoch": 2835} {"train_loss": -6.494085311889648, "global_step": 119098, "epoch": 2835} {"train_loss": -6.6747236251831055, "global_step": 119099, "epoch": 2835} {"train_loss": -6.5284552574157715, "global_step": 119100, "epoch": 2835} {"train_loss": -6.602595329284668, "global_step": 119101, "epoch": 2835} {"train_loss": -6.680445194244385, "global_step": 119102, "epoch": 2835} {"train_loss": -6.6142730712890625, "global_step": 119103, "epoch": 2835} {"train_loss": -6.579822540283203, "global_step": 119104, "epoch": 2835} {"train_loss": -6.626705169677734, "global_step": 119105, "epoch": 2835} {"train_loss": -6.540591239929199, "global_step": 119106, "epoch": 2835} {"train_loss": -6.570982933044434, "global_step": 119107, "epoch": 2835} {"train_loss": -6.551446914672852, "global_step": 119108, "epoch": 2835} {"train_loss": -6.541674613952637, "global_step": 119109, "epoch": 2835} {"train_loss": -6.563288688659668, "global_step": 119110, "epoch": 2835} {"train_loss": -6.585029738289969, "global_step": 119111, "epoch": 2835, "val_loss": 65674.5546875} {"train_loss": -6.513983726501465, "global_step": 119112, "epoch": 2836} {"train_loss": -6.588687419891357, "global_step": 119113, "epoch": 2836} {"train_loss": -6.59437894821167, "global_step": 119114, "epoch": 2836} {"train_loss": -6.385415554046631, "global_step": 119115, "epoch": 2836} {"train_loss": -6.621157169342041, "global_step": 119116, "epoch": 2836} {"train_loss": -6.352430820465088, "global_step": 119117, "epoch": 2836} {"train_loss": -6.389901161193848, "global_step": 119118, "epoch": 2836} {"train_loss": -6.441266059875488, "global_step": 119119, "epoch": 2836} {"train_loss": -6.31195592880249, "global_step": 119120, "epoch": 2836} {"train_loss": -6.401157379150391, "global_step": 119121, "epoch": 2836} {"train_loss": -6.329485893249512, "global_step": 119122, "epoch": 2836} {"train_loss": -6.488048553466797, "global_step": 119123, "epoch": 2836} {"train_loss": -6.406434059143066, "global_step": 119124, "epoch": 2836} {"train_loss": -6.431124687194824, "global_step": 119125, "epoch": 2836} {"train_loss": -6.511748790740967, "global_step": 119126, "epoch": 2836} {"train_loss": -6.52920389175415, "global_step": 119127, "epoch": 2836} {"train_loss": -6.313162803649902, "global_step": 119128, "epoch": 2836} {"train_loss": -6.53282356262207, "global_step": 119129, "epoch": 2836} {"train_loss": -6.609484672546387, "global_step": 119130, "epoch": 2836} {"train_loss": -6.473628997802734, "global_step": 119131, "epoch": 2836} {"train_loss": -6.5406904220581055, "global_step": 119132, "epoch": 2836} {"train_loss": -6.510581016540527, "global_step": 119133, "epoch": 2836} {"train_loss": -6.499308109283447, "global_step": 119134, "epoch": 2836} {"train_loss": -6.539686679840088, "global_step": 119135, "epoch": 2836} {"train_loss": -6.492227554321289, "global_step": 119136, "epoch": 2836} {"train_loss": -6.3436055183410645, "global_step": 119137, "epoch": 2836} {"train_loss": -6.5802388191223145, "global_step": 119138, "epoch": 2836} {"train_loss": -6.447636127471924, "global_step": 119139, "epoch": 2836} {"train_loss": -6.588516712188721, "global_step": 119140, "epoch": 2836} {"train_loss": -6.526852130889893, "global_step": 119141, "epoch": 2836} {"train_loss": -6.447305679321289, "global_step": 119142, "epoch": 2836} {"train_loss": -6.458681106567383, "global_step": 119143, "epoch": 2836} {"train_loss": -6.572561264038086, "global_step": 119144, "epoch": 2836} {"train_loss": -6.584129333496094, "global_step": 119145, "epoch": 2836} {"train_loss": -6.5249457359313965, "global_step": 119146, "epoch": 2836} {"train_loss": -6.5452165603637695, "global_step": 119147, "epoch": 2836} {"train_loss": -6.606451988220215, "global_step": 119148, "epoch": 2836} {"train_loss": -6.526742458343506, "global_step": 119149, "epoch": 2836} {"train_loss": -6.526061534881592, "global_step": 119150, "epoch": 2836} {"train_loss": -6.640240669250488, "global_step": 119151, "epoch": 2836} {"train_loss": -6.476107597351074, "global_step": 119152, "epoch": 2836} {"train_loss": -6.493917170025053, "global_step": 119153, "epoch": 2836, "val_loss": 65801.9296875} {"train_loss": -6.556949615478516, "global_step": 119154, "epoch": 2837} {"train_loss": -6.5189361572265625, "global_step": 119155, "epoch": 2837} {"train_loss": -6.517378807067871, "global_step": 119156, "epoch": 2837} {"train_loss": -6.547053337097168, "global_step": 119157, "epoch": 2837} {"train_loss": -6.540866851806641, "global_step": 119158, "epoch": 2837} {"train_loss": -6.653769016265869, "global_step": 119159, "epoch": 2837} {"train_loss": -6.578739643096924, "global_step": 119160, "epoch": 2837} {"train_loss": -6.518024444580078, "global_step": 119161, "epoch": 2837} {"train_loss": -6.480093002319336, "global_step": 119162, "epoch": 2837} {"train_loss": -6.5601301193237305, "global_step": 119163, "epoch": 2837} {"train_loss": -6.554352760314941, "global_step": 119164, "epoch": 2837} {"train_loss": -6.651026248931885, "global_step": 119165, "epoch": 2837} {"train_loss": -6.554436683654785, "global_step": 119166, "epoch": 2837} {"train_loss": -6.560739517211914, "global_step": 119167, "epoch": 2837} {"train_loss": -6.572138786315918, "global_step": 119168, "epoch": 2837} {"train_loss": -6.557287693023682, "global_step": 119169, "epoch": 2837} {"train_loss": -6.6548871994018555, "global_step": 119170, "epoch": 2837} {"train_loss": -6.683414936065674, "global_step": 119171, "epoch": 2837} {"train_loss": -6.548072338104248, "global_step": 119172, "epoch": 2837} {"train_loss": -6.635629653930664, "global_step": 119173, "epoch": 2837} {"train_loss": -6.6125383377075195, "global_step": 119174, "epoch": 2837} {"train_loss": -6.509185314178467, "global_step": 119175, "epoch": 2837} {"train_loss": -6.550952911376953, "global_step": 119176, "epoch": 2837} {"train_loss": -6.504693984985352, "global_step": 119177, "epoch": 2837} {"train_loss": -6.605745315551758, "global_step": 119178, "epoch": 2837} {"train_loss": -6.641142845153809, "global_step": 119179, "epoch": 2837} {"train_loss": -6.538619041442871, "global_step": 119180, "epoch": 2837} {"train_loss": -6.710844039916992, "global_step": 119181, "epoch": 2837} {"train_loss": -6.446934223175049, "global_step": 119182, "epoch": 2837} {"train_loss": -6.626936912536621, "global_step": 119183, "epoch": 2837} {"train_loss": -6.640442848205566, "global_step": 119184, "epoch": 2837} {"train_loss": -6.616184234619141, "global_step": 119185, "epoch": 2837} {"train_loss": -6.5645294189453125, "global_step": 119186, "epoch": 2837} {"train_loss": -6.710002422332764, "global_step": 119187, "epoch": 2837} {"train_loss": -6.615382671356201, "global_step": 119188, "epoch": 2837} {"train_loss": -6.560379505157471, "global_step": 119189, "epoch": 2837} {"train_loss": -6.586856842041016, "global_step": 119190, "epoch": 2837} {"train_loss": -6.666919231414795, "global_step": 119191, "epoch": 2837} {"train_loss": -6.626829624176025, "global_step": 119192, "epoch": 2837} {"train_loss": -6.755881309509277, "global_step": 119193, "epoch": 2837} {"train_loss": -6.600606918334961, "global_step": 119194, "epoch": 2837} {"train_loss": -6.590301434199016, "global_step": 119195, "epoch": 2837, "val_loss": 65873.2109375} {"train_loss": -6.519941806793213, "global_step": 119196, "epoch": 2838} {"train_loss": -6.636348247528076, "global_step": 119197, "epoch": 2838} {"train_loss": -6.541436195373535, "global_step": 119198, "epoch": 2838} {"train_loss": -6.636022090911865, "global_step": 119199, "epoch": 2838} {"train_loss": -6.59058952331543, "global_step": 119200, "epoch": 2838} {"train_loss": -6.525286674499512, "global_step": 119201, "epoch": 2838} {"train_loss": -6.648524761199951, "global_step": 119202, "epoch": 2838} {"train_loss": -6.460479736328125, "global_step": 119203, "epoch": 2838} {"train_loss": -6.495479583740234, "global_step": 119204, "epoch": 2838} {"train_loss": -6.351485252380371, "global_step": 119205, "epoch": 2838} {"train_loss": -6.490861892700195, "global_step": 119206, "epoch": 2838} {"train_loss": -6.4438652992248535, "global_step": 119207, "epoch": 2838} {"train_loss": -6.384622573852539, "global_step": 119208, "epoch": 2838} {"train_loss": -6.4242753982543945, "global_step": 119209, "epoch": 2838} {"train_loss": -6.565790176391602, "global_step": 119210, "epoch": 2838} {"train_loss": -6.395524501800537, "global_step": 119211, "epoch": 2838} {"train_loss": -6.502200126647949, "global_step": 119212, "epoch": 2838} {"train_loss": -6.579606056213379, "global_step": 119213, "epoch": 2838} {"train_loss": -6.461962699890137, "global_step": 119214, "epoch": 2838} {"train_loss": -6.533452033996582, "global_step": 119215, "epoch": 2838} {"train_loss": -6.534881591796875, "global_step": 119216, "epoch": 2838} {"train_loss": -6.481870174407959, "global_step": 119217, "epoch": 2838} {"train_loss": -6.532258987426758, "global_step": 119218, "epoch": 2838} {"train_loss": -6.571988582611084, "global_step": 119219, "epoch": 2838} {"train_loss": -6.444876194000244, "global_step": 119220, "epoch": 2838} {"train_loss": -6.480354309082031, "global_step": 119221, "epoch": 2838} {"train_loss": -6.686891078948975, "global_step": 119222, "epoch": 2838} {"train_loss": -6.365516185760498, "global_step": 119223, "epoch": 2838} {"train_loss": -6.62874698638916, "global_step": 119224, "epoch": 2838} {"train_loss": -6.388402938842773, "global_step": 119225, "epoch": 2838} {"train_loss": -6.4749555587768555, "global_step": 119226, "epoch": 2838} {"train_loss": -6.494897842407227, "global_step": 119227, "epoch": 2838} {"train_loss": -6.5013322830200195, "global_step": 119228, "epoch": 2838} {"train_loss": -6.425800800323486, "global_step": 119229, "epoch": 2838} {"train_loss": -6.445463180541992, "global_step": 119230, "epoch": 2838} {"train_loss": -6.490937232971191, "global_step": 119231, "epoch": 2838} {"train_loss": -6.469331741333008, "global_step": 119232, "epoch": 2838} {"train_loss": -6.546095371246338, "global_step": 119233, "epoch": 2838} {"train_loss": -6.521569728851318, "global_step": 119234, "epoch": 2838} {"train_loss": -6.382380485534668, "global_step": 119235, "epoch": 2838} {"train_loss": -6.496525287628174, "global_step": 119236, "epoch": 2838} {"train_loss": -6.502789747147333, "global_step": 119237, "epoch": 2838, "val_loss": 65774.015625} {"train_loss": -6.508543968200684, "global_step": 119238, "epoch": 2839} {"train_loss": -6.584963321685791, "global_step": 119239, "epoch": 2839} {"train_loss": -6.604844093322754, "global_step": 119240, "epoch": 2839} {"train_loss": -6.62047004699707, "global_step": 119241, "epoch": 2839} {"train_loss": -6.661674499511719, "global_step": 119242, "epoch": 2839} {"train_loss": -6.544496059417725, "global_step": 119243, "epoch": 2839} {"train_loss": -6.507638931274414, "global_step": 119244, "epoch": 2839} {"train_loss": -6.6335954666137695, "global_step": 119245, "epoch": 2839} {"train_loss": -6.596564292907715, "global_step": 119246, "epoch": 2839} {"train_loss": -6.450878620147705, "global_step": 119247, "epoch": 2839} {"train_loss": -6.6739888191223145, "global_step": 119248, "epoch": 2839} {"train_loss": -6.426694393157959, "global_step": 119249, "epoch": 2839} {"train_loss": -6.5086350440979, "global_step": 119250, "epoch": 2839} {"train_loss": -6.522590637207031, "global_step": 119251, "epoch": 2839} {"train_loss": -6.376208782196045, "global_step": 119252, "epoch": 2839} {"train_loss": -6.458958625793457, "global_step": 119253, "epoch": 2839} {"train_loss": -6.308056831359863, "global_step": 119254, "epoch": 2839} {"train_loss": -6.5091352462768555, "global_step": 119255, "epoch": 2839} {"train_loss": -6.402712345123291, "global_step": 119256, "epoch": 2839} {"train_loss": -6.41865348815918, "global_step": 119257, "epoch": 2839} {"train_loss": -6.56398344039917, "global_step": 119258, "epoch": 2839} {"train_loss": -6.4510602951049805, "global_step": 119259, "epoch": 2839} {"train_loss": -6.530465126037598, "global_step": 119260, "epoch": 2839} {"train_loss": -6.514010429382324, "global_step": 119261, "epoch": 2839} {"train_loss": -6.578122615814209, "global_step": 119262, "epoch": 2839} {"train_loss": -6.581386566162109, "global_step": 119263, "epoch": 2839} {"train_loss": -6.75535249710083, "global_step": 119264, "epoch": 2839} {"train_loss": -6.668079853057861, "global_step": 119265, "epoch": 2839} {"train_loss": -6.522037506103516, "global_step": 119266, "epoch": 2839} {"train_loss": -6.545125484466553, "global_step": 119267, "epoch": 2839} {"train_loss": -6.548108100891113, "global_step": 119268, "epoch": 2839} {"train_loss": -6.471379280090332, "global_step": 119269, "epoch": 2839} {"train_loss": -6.541776657104492, "global_step": 119270, "epoch": 2839} {"train_loss": -6.605799674987793, "global_step": 119271, "epoch": 2839} {"train_loss": -6.585210800170898, "global_step": 119272, "epoch": 2839} {"train_loss": -6.575138092041016, "global_step": 119273, "epoch": 2839} {"train_loss": -6.4672651290893555, "global_step": 119274, "epoch": 2839} {"train_loss": -6.459019184112549, "global_step": 119275, "epoch": 2839} {"train_loss": -6.640581130981445, "global_step": 119276, "epoch": 2839} {"train_loss": -6.570283889770508, "global_step": 119277, "epoch": 2839} {"train_loss": -6.563124656677246, "global_step": 119278, "epoch": 2839} {"train_loss": -6.536103884379069, "global_step": 119279, "epoch": 2839, "val_loss": 65791.640625} {"train_loss": -6.554758071899414, "global_step": 119280, "epoch": 2840} {"train_loss": -6.5084309577941895, "global_step": 119281, "epoch": 2840} {"train_loss": -6.726039886474609, "global_step": 119282, "epoch": 2840} {"train_loss": -6.548473358154297, "global_step": 119283, "epoch": 2840} {"train_loss": -6.62367057800293, "global_step": 119284, "epoch": 2840} {"train_loss": -6.37370491027832, "global_step": 119285, "epoch": 2840} {"train_loss": -6.439406871795654, "global_step": 119286, "epoch": 2840} {"train_loss": -6.491172790527344, "global_step": 119287, "epoch": 2840} {"train_loss": -6.49491024017334, "global_step": 119288, "epoch": 2840} {"train_loss": -6.541264057159424, "global_step": 119289, "epoch": 2840} {"train_loss": -6.481463432312012, "global_step": 119290, "epoch": 2840} {"train_loss": -6.544086456298828, "global_step": 119291, "epoch": 2840} {"train_loss": -6.501886367797852, "global_step": 119292, "epoch": 2840} {"train_loss": -6.535388946533203, "global_step": 119293, "epoch": 2840} {"train_loss": -6.4455976486206055, "global_step": 119294, "epoch": 2840} {"train_loss": -6.442440986633301, "global_step": 119295, "epoch": 2840} {"train_loss": -6.506408214569092, "global_step": 119296, "epoch": 2840} {"train_loss": -6.47384786605835, "global_step": 119297, "epoch": 2840} {"train_loss": -6.579787731170654, "global_step": 119298, "epoch": 2840} {"train_loss": -6.6223978996276855, "global_step": 119299, "epoch": 2840} {"train_loss": -6.5869340896606445, "global_step": 119300, "epoch": 2840} {"train_loss": -6.451224327087402, "global_step": 119301, "epoch": 2840} {"train_loss": -6.638965606689453, "global_step": 119302, "epoch": 2840} {"train_loss": -6.527202606201172, "global_step": 119303, "epoch": 2840} {"train_loss": -6.650259971618652, "global_step": 119304, "epoch": 2840} {"train_loss": -6.572103500366211, "global_step": 119305, "epoch": 2840} {"train_loss": -6.553138732910156, "global_step": 119306, "epoch": 2840} {"train_loss": -6.543355464935303, "global_step": 119307, "epoch": 2840} {"train_loss": -6.490970611572266, "global_step": 119308, "epoch": 2840} {"train_loss": -6.500706672668457, "global_step": 119309, "epoch": 2840} {"train_loss": -6.582469940185547, "global_step": 119310, "epoch": 2840} {"train_loss": -6.5496296882629395, "global_step": 119311, "epoch": 2840} {"train_loss": -6.618602752685547, "global_step": 119312, "epoch": 2840} {"train_loss": -6.557845592498779, "global_step": 119313, "epoch": 2840} {"train_loss": -6.543817520141602, "global_step": 119314, "epoch": 2840} {"train_loss": -6.591744422912598, "global_step": 119315, "epoch": 2840} {"train_loss": -6.6264801025390625, "global_step": 119316, "epoch": 2840} {"train_loss": -6.571983814239502, "global_step": 119317, "epoch": 2840} {"train_loss": -6.480912208557129, "global_step": 119318, "epoch": 2840} {"train_loss": -6.598073482513428, "global_step": 119319, "epoch": 2840} {"train_loss": -6.509673118591309, "global_step": 119320, "epoch": 2840} {"train_loss": -6.545811709903536, "global_step": 119321, "epoch": 2840, "val_loss": 65599.9609375} {"train_loss": -6.515683650970459, "global_step": 119322, "epoch": 2841} {"train_loss": -6.532997131347656, "global_step": 119323, "epoch": 2841} {"train_loss": -6.62603759765625, "global_step": 119324, "epoch": 2841} {"train_loss": -6.4814276695251465, "global_step": 119325, "epoch": 2841} {"train_loss": -6.617031097412109, "global_step": 119326, "epoch": 2841} {"train_loss": -6.4614715576171875, "global_step": 119327, "epoch": 2841} {"train_loss": -6.547610759735107, "global_step": 119328, "epoch": 2841} {"train_loss": -6.5520477294921875, "global_step": 119329, "epoch": 2841} {"train_loss": -6.631732940673828, "global_step": 119330, "epoch": 2841} {"train_loss": -6.464341163635254, "global_step": 119331, "epoch": 2841} {"train_loss": -6.513233184814453, "global_step": 119332, "epoch": 2841} {"train_loss": -6.577362537384033, "global_step": 119333, "epoch": 2841} {"train_loss": -6.588171005249023, "global_step": 119334, "epoch": 2841} {"train_loss": -6.463498592376709, "global_step": 119335, "epoch": 2841} {"train_loss": -6.592043876647949, "global_step": 119336, "epoch": 2841} {"train_loss": -6.638058185577393, "global_step": 119337, "epoch": 2841} {"train_loss": -6.539283752441406, "global_step": 119338, "epoch": 2841} {"train_loss": -6.663334846496582, "global_step": 119339, "epoch": 2841} {"train_loss": -6.471615791320801, "global_step": 119340, "epoch": 2841} {"train_loss": -6.467327117919922, "global_step": 119341, "epoch": 2841} {"train_loss": -6.584109306335449, "global_step": 119342, "epoch": 2841} {"train_loss": -6.576695919036865, "global_step": 119343, "epoch": 2841} {"train_loss": -6.524073600769043, "global_step": 119344, "epoch": 2841} {"train_loss": -6.423933982849121, "global_step": 119345, "epoch": 2841} {"train_loss": -6.604888439178467, "global_step": 119346, "epoch": 2841} {"train_loss": -6.477046489715576, "global_step": 119347, "epoch": 2841} {"train_loss": -6.504068851470947, "global_step": 119348, "epoch": 2841} {"train_loss": -6.574859619140625, "global_step": 119349, "epoch": 2841} {"train_loss": -6.54090690612793, "global_step": 119350, "epoch": 2841} {"train_loss": -6.498953819274902, "global_step": 119351, "epoch": 2841} {"train_loss": -6.512779712677002, "global_step": 119352, "epoch": 2841} {"train_loss": -6.532912254333496, "global_step": 119353, "epoch": 2841} {"train_loss": -6.540998458862305, "global_step": 119354, "epoch": 2841} {"train_loss": -6.558052062988281, "global_step": 119355, "epoch": 2841} {"train_loss": -6.557198524475098, "global_step": 119356, "epoch": 2841} {"train_loss": -6.674618721008301, "global_step": 119357, "epoch": 2841} {"train_loss": -6.552764892578125, "global_step": 119358, "epoch": 2841} {"train_loss": -6.541244029998779, "global_step": 119359, "epoch": 2841} {"train_loss": -6.43657112121582, "global_step": 119360, "epoch": 2841} {"train_loss": -6.58444881439209, "global_step": 119361, "epoch": 2841} {"train_loss": -6.548737525939941, "global_step": 119362, "epoch": 2841} {"train_loss": -6.5431117330278665, "global_step": 119363, "epoch": 2841, "val_loss": 65679.8515625} {"train_loss": -6.592235565185547, "global_step": 119364, "epoch": 2842} {"train_loss": -6.524251937866211, "global_step": 119365, "epoch": 2842} {"train_loss": -6.594408988952637, "global_step": 119366, "epoch": 2842} {"train_loss": -6.565157890319824, "global_step": 119367, "epoch": 2842} {"train_loss": -6.520022392272949, "global_step": 119368, "epoch": 2842} {"train_loss": -6.594491481781006, "global_step": 119369, "epoch": 2842} {"train_loss": -6.501696586608887, "global_step": 119370, "epoch": 2842} {"train_loss": -6.592394828796387, "global_step": 119371, "epoch": 2842} {"train_loss": -6.562458038330078, "global_step": 119372, "epoch": 2842} {"train_loss": -6.489441871643066, "global_step": 119373, "epoch": 2842} {"train_loss": -6.640645980834961, "global_step": 119374, "epoch": 2842} {"train_loss": -6.564980506896973, "global_step": 119375, "epoch": 2842} {"train_loss": -6.569033622741699, "global_step": 119376, "epoch": 2842} {"train_loss": -6.439526557922363, "global_step": 119377, "epoch": 2842} {"train_loss": -6.601877212524414, "global_step": 119378, "epoch": 2842} {"train_loss": -6.5247955322265625, "global_step": 119379, "epoch": 2842} {"train_loss": -6.505653381347656, "global_step": 119380, "epoch": 2842} {"train_loss": -6.558220863342285, "global_step": 119381, "epoch": 2842} {"train_loss": -6.464937210083008, "global_step": 119382, "epoch": 2842} {"train_loss": -6.627432823181152, "global_step": 119383, "epoch": 2842} {"train_loss": -6.602219581604004, "global_step": 119384, "epoch": 2842} {"train_loss": -6.475299835205078, "global_step": 119385, "epoch": 2842} {"train_loss": -6.582769393920898, "global_step": 119386, "epoch": 2842} {"train_loss": -6.548150062561035, "global_step": 119387, "epoch": 2842} {"train_loss": -6.505066871643066, "global_step": 119388, "epoch": 2842} {"train_loss": -6.683751583099365, "global_step": 119389, "epoch": 2842} {"train_loss": -6.632509231567383, "global_step": 119390, "epoch": 2842} {"train_loss": -6.585167407989502, "global_step": 119391, "epoch": 2842} {"train_loss": -6.696521759033203, "global_step": 119392, "epoch": 2842} {"train_loss": -6.521839141845703, "global_step": 119393, "epoch": 2842} {"train_loss": -6.609152793884277, "global_step": 119394, "epoch": 2842} {"train_loss": -6.620180130004883, "global_step": 119395, "epoch": 2842} {"train_loss": -6.719923496246338, "global_step": 119396, "epoch": 2842} {"train_loss": -6.619410514831543, "global_step": 119397, "epoch": 2842} {"train_loss": -6.556862831115723, "global_step": 119398, "epoch": 2842} {"train_loss": -6.549829483032227, "global_step": 119399, "epoch": 2842} {"train_loss": -6.408683776855469, "global_step": 119400, "epoch": 2842} {"train_loss": -6.4926252365112305, "global_step": 119401, "epoch": 2842} {"train_loss": -6.495143890380859, "global_step": 119402, "epoch": 2842} {"train_loss": -6.451695442199707, "global_step": 119403, "epoch": 2842} {"train_loss": -6.440616130828857, "global_step": 119404, "epoch": 2842} {"train_loss": -6.557004542577834, "global_step": 119405, "epoch": 2842, "val_loss": 65688.9375} {"train_loss": -6.62169075012207, "global_step": 119406, "epoch": 2843} {"train_loss": -6.577937126159668, "global_step": 119407, "epoch": 2843} {"train_loss": -6.634148597717285, "global_step": 119408, "epoch": 2843} {"train_loss": -6.497827529907227, "global_step": 119409, "epoch": 2843} {"train_loss": -6.60513162612915, "global_step": 119410, "epoch": 2843} {"train_loss": -6.602217674255371, "global_step": 119411, "epoch": 2843} {"train_loss": -6.5886125564575195, "global_step": 119412, "epoch": 2843} {"train_loss": -6.5156145095825195, "global_step": 119413, "epoch": 2843} {"train_loss": -6.6150898933410645, "global_step": 119414, "epoch": 2843} {"train_loss": -6.5775909423828125, "global_step": 119415, "epoch": 2843} {"train_loss": -6.591943740844727, "global_step": 119416, "epoch": 2843} {"train_loss": -6.65849494934082, "global_step": 119417, "epoch": 2843} {"train_loss": -6.60890007019043, "global_step": 119418, "epoch": 2843} {"train_loss": -6.666524887084961, "global_step": 119419, "epoch": 2843} {"train_loss": -6.509188652038574, "global_step": 119420, "epoch": 2843} {"train_loss": -6.520725250244141, "global_step": 119421, "epoch": 2843} {"train_loss": -6.516885757446289, "global_step": 119422, "epoch": 2843} {"train_loss": -6.557823181152344, "global_step": 119423, "epoch": 2843} {"train_loss": -6.6270341873168945, "global_step": 119424, "epoch": 2843} {"train_loss": -6.538675308227539, "global_step": 119425, "epoch": 2843} {"train_loss": -6.568126201629639, "global_step": 119426, "epoch": 2843} {"train_loss": -6.7031965255737305, "global_step": 119427, "epoch": 2843} {"train_loss": -6.563007831573486, "global_step": 119428, "epoch": 2843} {"train_loss": -6.692202091217041, "global_step": 119429, "epoch": 2843} {"train_loss": -6.6437764167785645, "global_step": 119430, "epoch": 2843} {"train_loss": -6.5352020263671875, "global_step": 119431, "epoch": 2843} {"train_loss": -6.549520015716553, "global_step": 119432, "epoch": 2843} {"train_loss": -6.579050540924072, "global_step": 119433, "epoch": 2843} {"train_loss": -6.669306755065918, "global_step": 119434, "epoch": 2843} {"train_loss": -6.569444179534912, "global_step": 119435, "epoch": 2843} {"train_loss": -6.5062255859375, "global_step": 119436, "epoch": 2843} {"train_loss": -6.560650825500488, "global_step": 119437, "epoch": 2843} {"train_loss": -6.544623374938965, "global_step": 119438, "epoch": 2843} {"train_loss": -6.4782915115356445, "global_step": 119439, "epoch": 2843} {"train_loss": -6.61456823348999, "global_step": 119440, "epoch": 2843} {"train_loss": -6.578080177307129, "global_step": 119441, "epoch": 2843} {"train_loss": -6.4883928298950195, "global_step": 119442, "epoch": 2843} {"train_loss": -6.508020401000977, "global_step": 119443, "epoch": 2843} {"train_loss": -6.4978179931640625, "global_step": 119444, "epoch": 2843} {"train_loss": -6.475607872009277, "global_step": 119445, "epoch": 2843} {"train_loss": -6.692256450653076, "global_step": 119446, "epoch": 2843} {"train_loss": -6.578777006694248, "global_step": 119447, "epoch": 2843, "val_loss": 65721.6953125} {"train_loss": -6.448448181152344, "global_step": 119448, "epoch": 2844} {"train_loss": -6.560929298400879, "global_step": 119449, "epoch": 2844} {"train_loss": -6.527321815490723, "global_step": 119450, "epoch": 2844} {"train_loss": -6.424561500549316, "global_step": 119451, "epoch": 2844} {"train_loss": -6.651976585388184, "global_step": 119452, "epoch": 2844} {"train_loss": -6.644654750823975, "global_step": 119453, "epoch": 2844} {"train_loss": -6.4766526222229, "global_step": 119454, "epoch": 2844} {"train_loss": -6.412501335144043, "global_step": 119455, "epoch": 2844} {"train_loss": -6.4282732009887695, "global_step": 119456, "epoch": 2844} {"train_loss": -6.572776794433594, "global_step": 119457, "epoch": 2844} {"train_loss": -6.523585319519043, "global_step": 119458, "epoch": 2844} {"train_loss": -6.297101974487305, "global_step": 119459, "epoch": 2844} {"train_loss": -6.542117118835449, "global_step": 119460, "epoch": 2844} {"train_loss": -6.362874984741211, "global_step": 119461, "epoch": 2844} {"train_loss": -6.4092512130737305, "global_step": 119462, "epoch": 2844} {"train_loss": -6.587262153625488, "global_step": 119463, "epoch": 2844} {"train_loss": -6.526800155639648, "global_step": 119464, "epoch": 2844} {"train_loss": -6.437655448913574, "global_step": 119465, "epoch": 2844} {"train_loss": -6.523985385894775, "global_step": 119466, "epoch": 2844} {"train_loss": -6.547658920288086, "global_step": 119467, "epoch": 2844} {"train_loss": -6.4644880294799805, "global_step": 119468, "epoch": 2844} {"train_loss": -6.489086151123047, "global_step": 119469, "epoch": 2844} {"train_loss": -6.545681953430176, "global_step": 119470, "epoch": 2844} {"train_loss": -6.510559558868408, "global_step": 119471, "epoch": 2844} {"train_loss": -6.441278457641602, "global_step": 119472, "epoch": 2844} {"train_loss": -6.4497785568237305, "global_step": 119473, "epoch": 2844} {"train_loss": -6.454537868499756, "global_step": 119474, "epoch": 2844} {"train_loss": -6.572071075439453, "global_step": 119475, "epoch": 2844} {"train_loss": -6.495548248291016, "global_step": 119476, "epoch": 2844} {"train_loss": -6.542886734008789, "global_step": 119477, "epoch": 2844} {"train_loss": -6.423348903656006, "global_step": 119478, "epoch": 2844} {"train_loss": -6.6451616287231445, "global_step": 119479, "epoch": 2844} {"train_loss": -6.631413459777832, "global_step": 119480, "epoch": 2844} {"train_loss": -6.439144134521484, "global_step": 119481, "epoch": 2844} {"train_loss": -6.51954460144043, "global_step": 119482, "epoch": 2844} {"train_loss": -6.5229172706604, "global_step": 119483, "epoch": 2844} {"train_loss": -6.5450334548950195, "global_step": 119484, "epoch": 2844} {"train_loss": -6.562440872192383, "global_step": 119485, "epoch": 2844} {"train_loss": -6.492100715637207, "global_step": 119486, "epoch": 2844} {"train_loss": -6.607511520385742, "global_step": 119487, "epoch": 2844} {"train_loss": -6.6247358322143555, "global_step": 119488, "epoch": 2844} {"train_loss": -6.51041267031715, "global_step": 119489, "epoch": 2844, "val_loss": 65728.0859375} {"train_loss": -6.613054275512695, "global_step": 119490, "epoch": 2845} {"train_loss": -6.4708356857299805, "global_step": 119491, "epoch": 2845} {"train_loss": -6.633354187011719, "global_step": 119492, "epoch": 2845} {"train_loss": -6.512881755828857, "global_step": 119493, "epoch": 2845} {"train_loss": -6.468216896057129, "global_step": 119494, "epoch": 2845} {"train_loss": -6.546785354614258, "global_step": 119495, "epoch": 2845} {"train_loss": -6.636030197143555, "global_step": 119496, "epoch": 2845} {"train_loss": -6.625871658325195, "global_step": 119497, "epoch": 2845} {"train_loss": -6.619340419769287, "global_step": 119498, "epoch": 2845} {"train_loss": -6.517890930175781, "global_step": 119499, "epoch": 2845} {"train_loss": -6.7177734375, "global_step": 119500, "epoch": 2845} {"train_loss": -6.466440200805664, "global_step": 119501, "epoch": 2845} {"train_loss": -6.53901481628418, "global_step": 119502, "epoch": 2845} {"train_loss": -6.468222618103027, "global_step": 119503, "epoch": 2845} {"train_loss": -6.479035377502441, "global_step": 119504, "epoch": 2845} {"train_loss": -6.5037431716918945, "global_step": 119505, "epoch": 2845} {"train_loss": -6.52037239074707, "global_step": 119506, "epoch": 2845} {"train_loss": -6.457743167877197, "global_step": 119507, "epoch": 2845} {"train_loss": -6.515233516693115, "global_step": 119508, "epoch": 2845} {"train_loss": -6.617408752441406, "global_step": 119509, "epoch": 2845} {"train_loss": -6.684659481048584, "global_step": 119510, "epoch": 2845} {"train_loss": -6.592779159545898, "global_step": 119511, "epoch": 2845} {"train_loss": -6.714771270751953, "global_step": 119512, "epoch": 2845} {"train_loss": -6.581328868865967, "global_step": 119513, "epoch": 2845} {"train_loss": -6.696177959442139, "global_step": 119514, "epoch": 2845} {"train_loss": -6.720189571380615, "global_step": 119515, "epoch": 2845} {"train_loss": -6.556596279144287, "global_step": 119516, "epoch": 2845} {"train_loss": -6.582952499389648, "global_step": 119517, "epoch": 2845} {"train_loss": -6.483882904052734, "global_step": 119518, "epoch": 2845} {"train_loss": -6.579122066497803, "global_step": 119519, "epoch": 2845} {"train_loss": -6.545574188232422, "global_step": 119520, "epoch": 2845} {"train_loss": -6.4721479415893555, "global_step": 119521, "epoch": 2845} {"train_loss": -6.581594944000244, "global_step": 119522, "epoch": 2845} {"train_loss": -6.568966388702393, "global_step": 119523, "epoch": 2845} {"train_loss": -6.654093265533447, "global_step": 119524, "epoch": 2845} {"train_loss": -6.591731071472168, "global_step": 119525, "epoch": 2845} {"train_loss": -6.590196132659912, "global_step": 119526, "epoch": 2845} {"train_loss": -6.604004859924316, "global_step": 119527, "epoch": 2845} {"train_loss": -6.4883880615234375, "global_step": 119528, "epoch": 2845} {"train_loss": -6.586844444274902, "global_step": 119529, "epoch": 2845} {"train_loss": -6.5408806800842285, "global_step": 119530, "epoch": 2845} {"train_loss": -6.567515305110386, "global_step": 119531, "epoch": 2845, "val_loss": 65651.84375} {"train_loss": -6.535153388977051, "global_step": 119532, "epoch": 2846} {"train_loss": -6.556288242340088, "global_step": 119533, "epoch": 2846} {"train_loss": -6.60661506652832, "global_step": 119534, "epoch": 2846} {"train_loss": -6.554446697235107, "global_step": 119535, "epoch": 2846} {"train_loss": -6.55851936340332, "global_step": 119536, "epoch": 2846} {"train_loss": -6.609597206115723, "global_step": 119537, "epoch": 2846} {"train_loss": -6.4836907386779785, "global_step": 119538, "epoch": 2846} {"train_loss": -6.665412902832031, "global_step": 119539, "epoch": 2846} {"train_loss": -6.645776748657227, "global_step": 119540, "epoch": 2846} {"train_loss": -6.6227874755859375, "global_step": 119541, "epoch": 2846} {"train_loss": -6.582404613494873, "global_step": 119542, "epoch": 2846} {"train_loss": -6.547114372253418, "global_step": 119543, "epoch": 2846} {"train_loss": -6.6116485595703125, "global_step": 119544, "epoch": 2846} {"train_loss": -6.414608001708984, "global_step": 119545, "epoch": 2846} {"train_loss": -6.614667892456055, "global_step": 119546, "epoch": 2846} {"train_loss": -6.542596817016602, "global_step": 119547, "epoch": 2846} {"train_loss": -6.609312534332275, "global_step": 119548, "epoch": 2846} {"train_loss": -6.528593063354492, "global_step": 119549, "epoch": 2846} {"train_loss": -6.605903148651123, "global_step": 119550, "epoch": 2846} {"train_loss": -6.5734663009643555, "global_step": 119551, "epoch": 2846} {"train_loss": -6.552301406860352, "global_step": 119552, "epoch": 2846} {"train_loss": -6.506542205810547, "global_step": 119553, "epoch": 2846} {"train_loss": -6.612343788146973, "global_step": 119554, "epoch": 2846} {"train_loss": -6.509901523590088, "global_step": 119555, "epoch": 2846} {"train_loss": -6.593855381011963, "global_step": 119556, "epoch": 2846} {"train_loss": -6.548945426940918, "global_step": 119557, "epoch": 2846} {"train_loss": -6.618056297302246, "global_step": 119558, "epoch": 2846} {"train_loss": -6.461244583129883, "global_step": 119559, "epoch": 2846} {"train_loss": -6.508252143859863, "global_step": 119560, "epoch": 2846} {"train_loss": -6.568570137023926, "global_step": 119561, "epoch": 2846} {"train_loss": -6.631782531738281, "global_step": 119562, "epoch": 2846} {"train_loss": -6.688905715942383, "global_step": 119563, "epoch": 2846} {"train_loss": -6.684802055358887, "global_step": 119564, "epoch": 2846} {"train_loss": -6.600812911987305, "global_step": 119565, "epoch": 2846} {"train_loss": -6.54594612121582, "global_step": 119566, "epoch": 2846} {"train_loss": -6.713053226470947, "global_step": 119567, "epoch": 2846} {"train_loss": -6.672517776489258, "global_step": 119568, "epoch": 2846} {"train_loss": -6.589439392089844, "global_step": 119569, "epoch": 2846} {"train_loss": -6.545441627502441, "global_step": 119570, "epoch": 2846} {"train_loss": -6.6690673828125, "global_step": 119571, "epoch": 2846} {"train_loss": -6.60561466217041, "global_step": 119572, "epoch": 2846} {"train_loss": -6.581598577045259, "global_step": 119573, "epoch": 2846, "val_loss": 65635.6875} {"train_loss": -6.6523637771606445, "global_step": 119574, "epoch": 2847} {"train_loss": -6.539502143859863, "global_step": 119575, "epoch": 2847} {"train_loss": -6.603511810302734, "global_step": 119576, "epoch": 2847} {"train_loss": -6.643355369567871, "global_step": 119577, "epoch": 2847} {"train_loss": -6.5666351318359375, "global_step": 119578, "epoch": 2847} {"train_loss": -6.573910713195801, "global_step": 119579, "epoch": 2847} {"train_loss": -6.573577404022217, "global_step": 119580, "epoch": 2847} {"train_loss": -6.645357131958008, "global_step": 119581, "epoch": 2847} {"train_loss": -6.625532150268555, "global_step": 119582, "epoch": 2847} {"train_loss": -6.518528938293457, "global_step": 119583, "epoch": 2847} {"train_loss": -6.541110515594482, "global_step": 119584, "epoch": 2847} {"train_loss": -6.562792778015137, "global_step": 119585, "epoch": 2847} {"train_loss": -6.651020050048828, "global_step": 119586, "epoch": 2847} {"train_loss": -6.482855319976807, "global_step": 119587, "epoch": 2847} {"train_loss": -6.5984206199646, "global_step": 119588, "epoch": 2847} {"train_loss": -6.587649345397949, "global_step": 119589, "epoch": 2847} {"train_loss": -6.553921699523926, "global_step": 119590, "epoch": 2847} {"train_loss": -6.514928817749023, "global_step": 119591, "epoch": 2847} {"train_loss": -6.535594940185547, "global_step": 119592, "epoch": 2847} {"train_loss": -6.540798187255859, "global_step": 119593, "epoch": 2847} {"train_loss": -6.4621076583862305, "global_step": 119594, "epoch": 2847} {"train_loss": -6.590295314788818, "global_step": 119595, "epoch": 2847} {"train_loss": -6.48123836517334, "global_step": 119596, "epoch": 2847} {"train_loss": -6.522992134094238, "global_step": 119597, "epoch": 2847} {"train_loss": -6.499815940856934, "global_step": 119598, "epoch": 2847} {"train_loss": -6.6567158699035645, "global_step": 119599, "epoch": 2847} {"train_loss": -6.55745792388916, "global_step": 119600, "epoch": 2847} {"train_loss": -6.562738418579102, "global_step": 119601, "epoch": 2847} {"train_loss": -6.577078342437744, "global_step": 119602, "epoch": 2847} {"train_loss": -6.5072221755981445, "global_step": 119603, "epoch": 2847} {"train_loss": -6.548019886016846, "global_step": 119604, "epoch": 2847} {"train_loss": -6.461411476135254, "global_step": 119605, "epoch": 2847} {"train_loss": -6.5281524658203125, "global_step": 119606, "epoch": 2847} {"train_loss": -6.437577247619629, "global_step": 119607, "epoch": 2847} {"train_loss": -6.500576019287109, "global_step": 119608, "epoch": 2847} {"train_loss": -6.528066635131836, "global_step": 119609, "epoch": 2847} {"train_loss": -6.500848770141602, "global_step": 119610, "epoch": 2847} {"train_loss": -6.593391418457031, "global_step": 119611, "epoch": 2847} {"train_loss": -6.625736713409424, "global_step": 119612, "epoch": 2847} {"train_loss": -6.631939888000488, "global_step": 119613, "epoch": 2847} {"train_loss": -6.550394058227539, "global_step": 119614, "epoch": 2847} {"train_loss": -6.558994781403315, "global_step": 119615, "epoch": 2847, "val_loss": 65693.8515625} {"train_loss": -6.6214189529418945, "global_step": 119616, "epoch": 2848} {"train_loss": -6.602878570556641, "global_step": 119617, "epoch": 2848} {"train_loss": -6.441173553466797, "global_step": 119618, "epoch": 2848} {"train_loss": -6.519637107849121, "global_step": 119619, "epoch": 2848} {"train_loss": -6.572689056396484, "global_step": 119620, "epoch": 2848} {"train_loss": -6.4806365966796875, "global_step": 119621, "epoch": 2848} {"train_loss": -6.5911664962768555, "global_step": 119622, "epoch": 2848} {"train_loss": -6.64274787902832, "global_step": 119623, "epoch": 2848} {"train_loss": -6.499987602233887, "global_step": 119624, "epoch": 2848} {"train_loss": -6.634251594543457, "global_step": 119625, "epoch": 2848} {"train_loss": -6.608365058898926, "global_step": 119626, "epoch": 2848} {"train_loss": -6.555554389953613, "global_step": 119627, "epoch": 2848} {"train_loss": -6.618585586547852, "global_step": 119628, "epoch": 2848} {"train_loss": -6.448339462280273, "global_step": 119629, "epoch": 2848} {"train_loss": -6.617907524108887, "global_step": 119630, "epoch": 2848} {"train_loss": -6.48420524597168, "global_step": 119631, "epoch": 2848} {"train_loss": -6.720741271972656, "global_step": 119632, "epoch": 2848} {"train_loss": -6.631793975830078, "global_step": 119633, "epoch": 2848} {"train_loss": -6.435060024261475, "global_step": 119634, "epoch": 2848} {"train_loss": -6.4675164222717285, "global_step": 119635, "epoch": 2848} {"train_loss": -6.5412492752075195, "global_step": 119636, "epoch": 2848} {"train_loss": -6.646010875701904, "global_step": 119637, "epoch": 2848} {"train_loss": -6.522221565246582, "global_step": 119638, "epoch": 2848} {"train_loss": -6.589782238006592, "global_step": 119639, "epoch": 2848} {"train_loss": -6.525928020477295, "global_step": 119640, "epoch": 2848} {"train_loss": -6.702919960021973, "global_step": 119641, "epoch": 2848} {"train_loss": -6.640080451965332, "global_step": 119642, "epoch": 2848} {"train_loss": -6.605464458465576, "global_step": 119643, "epoch": 2848} {"train_loss": -6.710490703582764, "global_step": 119644, "epoch": 2848} {"train_loss": -6.638968467712402, "global_step": 119645, "epoch": 2848} {"train_loss": -6.687619686126709, "global_step": 119646, "epoch": 2848} {"train_loss": -6.615429878234863, "global_step": 119647, "epoch": 2848} {"train_loss": -6.506499767303467, "global_step": 119648, "epoch": 2848} {"train_loss": -6.671712875366211, "global_step": 119649, "epoch": 2848} {"train_loss": -6.689520359039307, "global_step": 119650, "epoch": 2848} {"train_loss": -6.598454475402832, "global_step": 119651, "epoch": 2848} {"train_loss": -6.594529628753662, "global_step": 119652, "epoch": 2848} {"train_loss": -6.577880382537842, "global_step": 119653, "epoch": 2848} {"train_loss": -6.649462699890137, "global_step": 119654, "epoch": 2848} {"train_loss": -6.514909744262695, "global_step": 119655, "epoch": 2848} {"train_loss": -6.588410377502441, "global_step": 119656, "epoch": 2848} {"train_loss": -6.586677585329328, "global_step": 119657, "epoch": 2848, "val_loss": 65705.8671875} {"train_loss": -6.58168888092041, "global_step": 119658, "epoch": 2849} {"train_loss": -6.561971664428711, "global_step": 119659, "epoch": 2849} {"train_loss": -6.483092308044434, "global_step": 119660, "epoch": 2849} {"train_loss": -6.547820091247559, "global_step": 119661, "epoch": 2849} {"train_loss": -6.577173233032227, "global_step": 119662, "epoch": 2849} {"train_loss": -6.5355224609375, "global_step": 119663, "epoch": 2849} {"train_loss": -6.525152206420898, "global_step": 119664, "epoch": 2849} {"train_loss": -6.376043796539307, "global_step": 119665, "epoch": 2849} {"train_loss": -6.620240211486816, "global_step": 119666, "epoch": 2849} {"train_loss": -6.494422912597656, "global_step": 119667, "epoch": 2849} {"train_loss": -6.482273578643799, "global_step": 119668, "epoch": 2849} {"train_loss": -6.498195648193359, "global_step": 119669, "epoch": 2849} {"train_loss": -6.505385875701904, "global_step": 119670, "epoch": 2849} {"train_loss": -6.519946098327637, "global_step": 119671, "epoch": 2849} {"train_loss": -6.425477981567383, "global_step": 119672, "epoch": 2849} {"train_loss": -6.382471561431885, "global_step": 119673, "epoch": 2849} {"train_loss": -6.340956687927246, "global_step": 119674, "epoch": 2849} {"train_loss": -6.401548385620117, "global_step": 119675, "epoch": 2849} {"train_loss": -6.528861045837402, "global_step": 119676, "epoch": 2849} {"train_loss": -6.49566650390625, "global_step": 119677, "epoch": 2849} {"train_loss": -6.567476272583008, "global_step": 119678, "epoch": 2849} {"train_loss": -6.525629997253418, "global_step": 119679, "epoch": 2849} {"train_loss": -6.669933319091797, "global_step": 119680, "epoch": 2849} {"train_loss": -6.396731376647949, "global_step": 119681, "epoch": 2849} {"train_loss": -6.523537635803223, "global_step": 119682, "epoch": 2849} {"train_loss": -6.543761253356934, "global_step": 119683, "epoch": 2849} {"train_loss": -6.627963066101074, "global_step": 119684, "epoch": 2849} {"train_loss": -6.505489826202393, "global_step": 119685, "epoch": 2849} {"train_loss": -6.568082332611084, "global_step": 119686, "epoch": 2849} {"train_loss": -6.578826904296875, "global_step": 119687, "epoch": 2849} {"train_loss": -6.57499361038208, "global_step": 119688, "epoch": 2849} {"train_loss": -6.496913909912109, "global_step": 119689, "epoch": 2849} {"train_loss": -6.539829254150391, "global_step": 119690, "epoch": 2849} {"train_loss": -6.562874794006348, "global_step": 119691, "epoch": 2849} {"train_loss": -6.591946125030518, "global_step": 119692, "epoch": 2849} {"train_loss": -6.541203498840332, "global_step": 119693, "epoch": 2849} {"train_loss": -6.613616943359375, "global_step": 119694, "epoch": 2849} {"train_loss": -6.552028179168701, "global_step": 119695, "epoch": 2849} {"train_loss": -6.474203586578369, "global_step": 119696, "epoch": 2849} {"train_loss": -6.61129903793335, "global_step": 119697, "epoch": 2849} {"train_loss": -6.45057487487793, "global_step": 119698, "epoch": 2849} {"train_loss": -6.5211668241591685, "global_step": 119699, "epoch": 2849, "val_loss": 65643.2578125} {"train_loss": -6.491644382476807, "global_step": 119700, "epoch": 2850} {"train_loss": -6.586814880371094, "global_step": 119701, "epoch": 2850} {"train_loss": -6.649724006652832, "global_step": 119702, "epoch": 2850} {"train_loss": -6.583087921142578, "global_step": 119703, "epoch": 2850} {"train_loss": -6.581474304199219, "global_step": 119704, "epoch": 2850} {"train_loss": -6.560422897338867, "global_step": 119705, "epoch": 2850} {"train_loss": -6.677096843719482, "global_step": 119706, "epoch": 2850} {"train_loss": -6.729925632476807, "global_step": 119707, "epoch": 2850} {"train_loss": -6.40977668762207, "global_step": 119708, "epoch": 2850} {"train_loss": -6.681816101074219, "global_step": 119709, "epoch": 2850} {"train_loss": -6.639039993286133, "global_step": 119710, "epoch": 2850} {"train_loss": -6.608799457550049, "global_step": 119711, "epoch": 2850} {"train_loss": -6.646424293518066, "global_step": 119712, "epoch": 2850} {"train_loss": -6.65190315246582, "global_step": 119713, "epoch": 2850} {"train_loss": -6.596026420593262, "global_step": 119714, "epoch": 2850} {"train_loss": -6.55129337310791, "global_step": 119715, "epoch": 2850} {"train_loss": -6.5344343185424805, "global_step": 119716, "epoch": 2850} {"train_loss": -6.5986409187316895, "global_step": 119717, "epoch": 2850} {"train_loss": -6.515080451965332, "global_step": 119718, "epoch": 2850} {"train_loss": -6.664665699005127, "global_step": 119719, "epoch": 2850} {"train_loss": -6.561793804168701, "global_step": 119720, "epoch": 2850} {"train_loss": -6.664891242980957, "global_step": 119721, "epoch": 2850} {"train_loss": -6.591226577758789, "global_step": 119722, "epoch": 2850} {"train_loss": -6.482052803039551, "global_step": 119723, "epoch": 2850} {"train_loss": -6.585019111633301, "global_step": 119724, "epoch": 2850} {"train_loss": -6.647001266479492, "global_step": 119725, "epoch": 2850} {"train_loss": -6.599097728729248, "global_step": 119726, "epoch": 2850} {"train_loss": -6.617993354797363, "global_step": 119727, "epoch": 2850} {"train_loss": -6.564908027648926, "global_step": 119728, "epoch": 2850} {"train_loss": -6.627838134765625, "global_step": 119729, "epoch": 2850} {"train_loss": -6.478084564208984, "global_step": 119730, "epoch": 2850} {"train_loss": -6.483938217163086, "global_step": 119731, "epoch": 2850} {"train_loss": -6.602354049682617, "global_step": 119732, "epoch": 2850} {"train_loss": -6.539088726043701, "global_step": 119733, "epoch": 2850} {"train_loss": -6.47414493560791, "global_step": 119734, "epoch": 2850} {"train_loss": -6.624526023864746, "global_step": 119735, "epoch": 2850} {"train_loss": -6.596962928771973, "global_step": 119736, "epoch": 2850} {"train_loss": -6.591838836669922, "global_step": 119737, "epoch": 2850} {"train_loss": -6.555326461791992, "global_step": 119738, "epoch": 2850} {"train_loss": -6.584689617156982, "global_step": 119739, "epoch": 2850} {"train_loss": -6.4555864334106445, "global_step": 119740, "epoch": 2850} {"train_loss": -6.583115782056536, "global_step": 119741, "epoch": 2850, "train/sim_max_reward_0": 0.39559338037163344, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.8969307926291934, "train/sim_max_reward_3": 0.39156244949984914, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.9503022343399365, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.22664809214176518, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.8968458347216877, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9153404191406952, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.8881664102335817, "test/sim_max_reward_4300008": 0.9097968271375382, "test/sim_max_reward_4300009": 0.9542024358612965, "test/sim_max_reward_4300010": 0.8975437483227116, "test/sim_max_reward_4300011": 0.2948082999015049, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 0.9308485155789646, "test/sim_max_reward_4300015": 0.9161983300801174, "test/sim_max_reward_4300016": 1.0, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.4567439001487067, "test/sim_max_reward_4300019": 0.1835153646485776, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8935465051423781, "test/sim_max_reward_4300022": 0.24637089871324153, "test/sim_max_reward_4300023": 0.4881269747491953, "test/sim_max_reward_4300024": 0.48343571097958643, "test/sim_max_reward_4300025": 0.9553926202509027, "test/sim_max_reward_4300026": 0.6785842662306673, "test/sim_max_reward_4300027": 0.9181575988574376, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.8537841638337734, "test/sim_max_reward_4300030": 0.17890567331079238, "test/sim_max_reward_4300031": 0.349537359488058, "test/sim_max_reward_4300032": 0.972692534723145, "test/sim_max_reward_4300033": 0.7185996848445757, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.769101495973393, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.6202134855945186, "test/sim_max_reward_4300038": 0.9984438153039731, "test/sim_max_reward_4300039": 0.49082027146111007, "test/sim_max_reward_4300040": 0.3223220170834726, "test/sim_max_reward_4300041": 0.8324937006799913, "test/sim_max_reward_4300042": 0.45135892871579825, "test/sim_max_reward_4300043": 0.16267097674709083, "test/sim_max_reward_4300044": 0.7986444708871593, "test/sim_max_reward_4300045": 0.19194525140562027, "test/sim_max_reward_4300046": 0.11141419052592079, "test/sim_max_reward_4300047": 0.1571966505802949, "test/sim_max_reward_4300048": 0.7479367190609213, "test/sim_max_reward_4300049": 0.25126892094998765, "train/mean_score": 0.7723981428067687, "test/mean_score": 0.5665730256876583, "val_loss": 65586.515625} {"train_loss": -6.516437530517578, "global_step": 119742, "epoch": 2851} {"train_loss": -6.597848415374756, "global_step": 119743, "epoch": 2851} {"train_loss": -6.5358381271362305, "global_step": 119744, "epoch": 2851} {"train_loss": -6.567467212677002, "global_step": 119745, "epoch": 2851} {"train_loss": -6.548803329467773, "global_step": 119746, "epoch": 2851} {"train_loss": -6.584397315979004, "global_step": 119747, "epoch": 2851} {"train_loss": -6.603318214416504, "global_step": 119748, "epoch": 2851} {"train_loss": -6.562352180480957, "global_step": 119749, "epoch": 2851} {"train_loss": -6.645977973937988, "global_step": 119750, "epoch": 2851} {"train_loss": -6.550658226013184, "global_step": 119751, "epoch": 2851} {"train_loss": -6.523544788360596, "global_step": 119752, "epoch": 2851} {"train_loss": -6.622830390930176, "global_step": 119753, "epoch": 2851} {"train_loss": -6.532754898071289, "global_step": 119754, "epoch": 2851} {"train_loss": -6.561606407165527, "global_step": 119755, "epoch": 2851} {"train_loss": -6.5925397872924805, "global_step": 119756, "epoch": 2851} {"train_loss": -6.690896034240723, "global_step": 119757, "epoch": 2851} {"train_loss": -6.619912147521973, "global_step": 119758, "epoch": 2851} {"train_loss": -6.69761848449707, "global_step": 119759, "epoch": 2851} {"train_loss": -6.58509635925293, "global_step": 119760, "epoch": 2851} {"train_loss": -6.592530250549316, "global_step": 119761, "epoch": 2851} {"train_loss": -6.571838855743408, "global_step": 119762, "epoch": 2851} {"train_loss": -6.568619728088379, "global_step": 119763, "epoch": 2851} {"train_loss": -6.635746955871582, "global_step": 119764, "epoch": 2851} {"train_loss": -6.561814308166504, "global_step": 119765, "epoch": 2851} {"train_loss": -6.559117317199707, "global_step": 119766, "epoch": 2851} {"train_loss": -6.598238945007324, "global_step": 119767, "epoch": 2851} {"train_loss": -6.568944931030273, "global_step": 119768, "epoch": 2851} {"train_loss": -6.581812858581543, "global_step": 119769, "epoch": 2851} {"train_loss": -6.50227165222168, "global_step": 119770, "epoch": 2851} {"train_loss": -6.622419357299805, "global_step": 119771, "epoch": 2851} {"train_loss": -6.677289009094238, "global_step": 119772, "epoch": 2851} {"train_loss": -6.588413238525391, "global_step": 119773, "epoch": 2851} {"train_loss": -6.573824882507324, "global_step": 119774, "epoch": 2851} {"train_loss": -6.600813865661621, "global_step": 119775, "epoch": 2851} {"train_loss": -6.5555267333984375, "global_step": 119776, "epoch": 2851} {"train_loss": -6.531457424163818, "global_step": 119777, "epoch": 2851} {"train_loss": -6.656044006347656, "global_step": 119778, "epoch": 2851} {"train_loss": -6.432017803192139, "global_step": 119779, "epoch": 2851} {"train_loss": -6.570102691650391, "global_step": 119780, "epoch": 2851} {"train_loss": -6.4326958656311035, "global_step": 119781, "epoch": 2851} {"train_loss": -6.491001129150391, "global_step": 119782, "epoch": 2851} {"train_loss": -6.57574987411499, "global_step": 119783, "epoch": 2851, "val_loss": 65603.703125} {"train_loss": -6.452672481536865, "global_step": 119784, "epoch": 2852} {"train_loss": -6.478668689727783, "global_step": 119785, "epoch": 2852} {"train_loss": -6.542167663574219, "global_step": 119786, "epoch": 2852} {"train_loss": -6.388765335083008, "global_step": 119787, "epoch": 2852} {"train_loss": -6.530973434448242, "global_step": 119788, "epoch": 2852} {"train_loss": -6.448882579803467, "global_step": 119789, "epoch": 2852} {"train_loss": -6.422267913818359, "global_step": 119790, "epoch": 2852} {"train_loss": -6.602917671203613, "global_step": 119791, "epoch": 2852} {"train_loss": -6.4221978187561035, "global_step": 119792, "epoch": 2852} {"train_loss": -6.525464057922363, "global_step": 119793, "epoch": 2852} {"train_loss": -6.537041664123535, "global_step": 119794, "epoch": 2852} {"train_loss": -6.5031538009643555, "global_step": 119795, "epoch": 2852} {"train_loss": -6.537117004394531, "global_step": 119796, "epoch": 2852} {"train_loss": -6.607419013977051, "global_step": 119797, "epoch": 2852} {"train_loss": -6.443525314331055, "global_step": 119798, "epoch": 2852} {"train_loss": -6.433310508728027, "global_step": 119799, "epoch": 2852} {"train_loss": -6.55947208404541, "global_step": 119800, "epoch": 2852} {"train_loss": -6.56431770324707, "global_step": 119801, "epoch": 2852} {"train_loss": -6.672354698181152, "global_step": 119802, "epoch": 2852} {"train_loss": -6.492316722869873, "global_step": 119803, "epoch": 2852} {"train_loss": -6.494631290435791, "global_step": 119804, "epoch": 2852} {"train_loss": -6.622346878051758, "global_step": 119805, "epoch": 2852} {"train_loss": -6.574821472167969, "global_step": 119806, "epoch": 2852} {"train_loss": -6.599749565124512, "global_step": 119807, "epoch": 2852} {"train_loss": -6.594211101531982, "global_step": 119808, "epoch": 2852} {"train_loss": -6.564114093780518, "global_step": 119809, "epoch": 2852} {"train_loss": -6.5546417236328125, "global_step": 119810, "epoch": 2852} {"train_loss": -6.645230770111084, "global_step": 119811, "epoch": 2852} {"train_loss": -6.51005744934082, "global_step": 119812, "epoch": 2852} {"train_loss": -6.604523181915283, "global_step": 119813, "epoch": 2852} {"train_loss": -6.6426472663879395, "global_step": 119814, "epoch": 2852} {"train_loss": -6.526647567749023, "global_step": 119815, "epoch": 2852} {"train_loss": -6.439121246337891, "global_step": 119816, "epoch": 2852} {"train_loss": -6.642606735229492, "global_step": 119817, "epoch": 2852} {"train_loss": -6.527214527130127, "global_step": 119818, "epoch": 2852} {"train_loss": -6.545605182647705, "global_step": 119819, "epoch": 2852} {"train_loss": -6.545402526855469, "global_step": 119820, "epoch": 2852} {"train_loss": -6.5733489990234375, "global_step": 119821, "epoch": 2852} {"train_loss": -6.499382019042969, "global_step": 119822, "epoch": 2852} {"train_loss": -6.620120048522949, "global_step": 119823, "epoch": 2852} {"train_loss": -6.543276786804199, "global_step": 119824, "epoch": 2852} {"train_loss": -6.540236836387997, "global_step": 119825, "epoch": 2852, "val_loss": 65686.5859375} {"train_loss": -6.501270771026611, "global_step": 119826, "epoch": 2853} {"train_loss": -6.635617733001709, "global_step": 119827, "epoch": 2853} {"train_loss": -6.560915470123291, "global_step": 119828, "epoch": 2853} {"train_loss": -6.615637302398682, "global_step": 119829, "epoch": 2853} {"train_loss": -6.61375093460083, "global_step": 119830, "epoch": 2853} {"train_loss": -6.652314186096191, "global_step": 119831, "epoch": 2853} {"train_loss": -6.530170440673828, "global_step": 119832, "epoch": 2853} {"train_loss": -6.461627006530762, "global_step": 119833, "epoch": 2853} {"train_loss": -6.731819152832031, "global_step": 119834, "epoch": 2853} {"train_loss": -6.5610809326171875, "global_step": 119835, "epoch": 2853} {"train_loss": -6.5781145095825195, "global_step": 119836, "epoch": 2853} {"train_loss": -6.535499572753906, "global_step": 119837, "epoch": 2853} {"train_loss": -6.656149387359619, "global_step": 119838, "epoch": 2853} {"train_loss": -6.656377792358398, "global_step": 119839, "epoch": 2853} {"train_loss": -6.44718074798584, "global_step": 119840, "epoch": 2853} {"train_loss": -6.454817771911621, "global_step": 119841, "epoch": 2853} {"train_loss": -6.584741115570068, "global_step": 119842, "epoch": 2853} {"train_loss": -6.524878025054932, "global_step": 119843, "epoch": 2853} {"train_loss": -6.546856880187988, "global_step": 119844, "epoch": 2853} {"train_loss": -6.493319034576416, "global_step": 119845, "epoch": 2853} {"train_loss": -6.609798431396484, "global_step": 119846, "epoch": 2853} {"train_loss": -6.60423469543457, "global_step": 119847, "epoch": 2853} {"train_loss": -6.602482795715332, "global_step": 119848, "epoch": 2853} {"train_loss": -6.5465989112854, "global_step": 119849, "epoch": 2853} {"train_loss": -6.607205390930176, "global_step": 119850, "epoch": 2853} {"train_loss": -6.582942008972168, "global_step": 119851, "epoch": 2853} {"train_loss": -6.489635467529297, "global_step": 119852, "epoch": 2853} {"train_loss": -6.550967216491699, "global_step": 119853, "epoch": 2853} {"train_loss": -6.445527076721191, "global_step": 119854, "epoch": 2853} {"train_loss": -6.548988342285156, "global_step": 119855, "epoch": 2853} {"train_loss": -6.6371355056762695, "global_step": 119856, "epoch": 2853} {"train_loss": -6.641805648803711, "global_step": 119857, "epoch": 2853} {"train_loss": -6.598940849304199, "global_step": 119858, "epoch": 2853} {"train_loss": -6.652584552764893, "global_step": 119859, "epoch": 2853} {"train_loss": -6.491806983947754, "global_step": 119860, "epoch": 2853} {"train_loss": -6.609527111053467, "global_step": 119861, "epoch": 2853} {"train_loss": -6.595189094543457, "global_step": 119862, "epoch": 2853} {"train_loss": -6.5890092849731445, "global_step": 119863, "epoch": 2853} {"train_loss": -6.633612632751465, "global_step": 119864, "epoch": 2853} {"train_loss": -6.66758918762207, "global_step": 119865, "epoch": 2853} {"train_loss": -6.512966156005859, "global_step": 119866, "epoch": 2853} {"train_loss": -6.575361104238601, "global_step": 119867, "epoch": 2853, "val_loss": 65804.2265625} {"train_loss": -6.558560848236084, "global_step": 119868, "epoch": 2854} {"train_loss": -6.599126815795898, "global_step": 119869, "epoch": 2854} {"train_loss": -6.697387218475342, "global_step": 119870, "epoch": 2854} {"train_loss": -6.508221626281738, "global_step": 119871, "epoch": 2854} {"train_loss": -6.5104660987854, "global_step": 119872, "epoch": 2854} {"train_loss": -6.587677955627441, "global_step": 119873, "epoch": 2854} {"train_loss": -6.531917572021484, "global_step": 119874, "epoch": 2854} {"train_loss": -6.598761558532715, "global_step": 119875, "epoch": 2854} {"train_loss": -6.645883560180664, "global_step": 119876, "epoch": 2854} {"train_loss": -6.482019424438477, "global_step": 119877, "epoch": 2854} {"train_loss": -6.635719299316406, "global_step": 119878, "epoch": 2854} {"train_loss": -6.587951183319092, "global_step": 119879, "epoch": 2854} {"train_loss": -6.523830413818359, "global_step": 119880, "epoch": 2854} {"train_loss": -6.626708030700684, "global_step": 119881, "epoch": 2854} {"train_loss": -6.5601983070373535, "global_step": 119882, "epoch": 2854} {"train_loss": -6.515471458435059, "global_step": 119883, "epoch": 2854} {"train_loss": -6.544615268707275, "global_step": 119884, "epoch": 2854} {"train_loss": -6.4566826820373535, "global_step": 119885, "epoch": 2854} {"train_loss": -6.513083457946777, "global_step": 119886, "epoch": 2854} {"train_loss": -6.584979057312012, "global_step": 119887, "epoch": 2854} {"train_loss": -6.481063365936279, "global_step": 119888, "epoch": 2854} {"train_loss": -6.446138381958008, "global_step": 119889, "epoch": 2854} {"train_loss": -6.692879676818848, "global_step": 119890, "epoch": 2854} {"train_loss": -6.566282272338867, "global_step": 119891, "epoch": 2854} {"train_loss": -6.620602130889893, "global_step": 119892, "epoch": 2854} {"train_loss": -6.580904006958008, "global_step": 119893, "epoch": 2854} {"train_loss": -6.481999397277832, "global_step": 119894, "epoch": 2854} {"train_loss": -6.497552871704102, "global_step": 119895, "epoch": 2854} {"train_loss": -6.597016334533691, "global_step": 119896, "epoch": 2854} {"train_loss": -6.599494934082031, "global_step": 119897, "epoch": 2854} {"train_loss": -6.575456619262695, "global_step": 119898, "epoch": 2854} {"train_loss": -6.5445966720581055, "global_step": 119899, "epoch": 2854} {"train_loss": -6.644008636474609, "global_step": 119900, "epoch": 2854} {"train_loss": -6.567587852478027, "global_step": 119901, "epoch": 2854} {"train_loss": -6.5843353271484375, "global_step": 119902, "epoch": 2854} {"train_loss": -6.639703750610352, "global_step": 119903, "epoch": 2854} {"train_loss": -6.619867324829102, "global_step": 119904, "epoch": 2854} {"train_loss": -6.539932727813721, "global_step": 119905, "epoch": 2854} {"train_loss": -6.62285041809082, "global_step": 119906, "epoch": 2854} {"train_loss": -6.71772575378418, "global_step": 119907, "epoch": 2854} {"train_loss": -6.584778785705566, "global_step": 119908, "epoch": 2854} {"train_loss": -6.573079234077817, "global_step": 119909, "epoch": 2854, "val_loss": 65643.609375} {"train_loss": -6.6408891677856445, "global_step": 119910, "epoch": 2855} {"train_loss": -6.619123458862305, "global_step": 119911, "epoch": 2855} {"train_loss": -6.618625640869141, "global_step": 119912, "epoch": 2855} {"train_loss": -6.626281261444092, "global_step": 119913, "epoch": 2855} {"train_loss": -6.582559108734131, "global_step": 119914, "epoch": 2855} {"train_loss": -6.728316783905029, "global_step": 119915, "epoch": 2855} {"train_loss": -6.64974308013916, "global_step": 119916, "epoch": 2855} {"train_loss": -6.461187839508057, "global_step": 119917, "epoch": 2855} {"train_loss": -6.652561187744141, "global_step": 119918, "epoch": 2855} {"train_loss": -6.514752388000488, "global_step": 119919, "epoch": 2855} {"train_loss": -6.415005683898926, "global_step": 119920, "epoch": 2855} {"train_loss": -6.649435043334961, "global_step": 119921, "epoch": 2855} {"train_loss": -6.622910499572754, "global_step": 119922, "epoch": 2855} {"train_loss": -6.439117431640625, "global_step": 119923, "epoch": 2855} {"train_loss": -6.561236381530762, "global_step": 119924, "epoch": 2855} {"train_loss": -6.597805500030518, "global_step": 119925, "epoch": 2855} {"train_loss": -6.5607099533081055, "global_step": 119926, "epoch": 2855} {"train_loss": -6.572580814361572, "global_step": 119927, "epoch": 2855} {"train_loss": -6.423089027404785, "global_step": 119928, "epoch": 2855} {"train_loss": -6.472405910491943, "global_step": 119929, "epoch": 2855} {"train_loss": -6.638655662536621, "global_step": 119930, "epoch": 2855} {"train_loss": -6.562983512878418, "global_step": 119931, "epoch": 2855} {"train_loss": -6.642009258270264, "global_step": 119932, "epoch": 2855} {"train_loss": -6.631572723388672, "global_step": 119933, "epoch": 2855} {"train_loss": -6.568559169769287, "global_step": 119934, "epoch": 2855} {"train_loss": -6.506921768188477, "global_step": 119935, "epoch": 2855} {"train_loss": -6.5114569664001465, "global_step": 119936, "epoch": 2855} {"train_loss": -6.494726181030273, "global_step": 119937, "epoch": 2855} {"train_loss": -6.510049819946289, "global_step": 119938, "epoch": 2855} {"train_loss": -6.509811878204346, "global_step": 119939, "epoch": 2855} {"train_loss": -6.507862091064453, "global_step": 119940, "epoch": 2855} {"train_loss": -6.461093902587891, "global_step": 119941, "epoch": 2855} {"train_loss": -6.4793877601623535, "global_step": 119942, "epoch": 2855} {"train_loss": -6.390993118286133, "global_step": 119943, "epoch": 2855} {"train_loss": -6.436627388000488, "global_step": 119944, "epoch": 2855} {"train_loss": -6.421072006225586, "global_step": 119945, "epoch": 2855} {"train_loss": -6.49807071685791, "global_step": 119946, "epoch": 2855} {"train_loss": -6.527059078216553, "global_step": 119947, "epoch": 2855} {"train_loss": -6.448163986206055, "global_step": 119948, "epoch": 2855} {"train_loss": -6.384967803955078, "global_step": 119949, "epoch": 2855} {"train_loss": -6.483530521392822, "global_step": 119950, "epoch": 2855} {"train_loss": -6.536471855072748, "global_step": 119951, "epoch": 2855, "val_loss": 65626.328125} {"train_loss": -6.482107162475586, "global_step": 119952, "epoch": 2856} {"train_loss": -6.418112754821777, "global_step": 119953, "epoch": 2856} {"train_loss": -6.654880523681641, "global_step": 119954, "epoch": 2856} {"train_loss": -6.4548659324646, "global_step": 119955, "epoch": 2856} {"train_loss": -6.436002254486084, "global_step": 119956, "epoch": 2856} {"train_loss": -6.520105838775635, "global_step": 119957, "epoch": 2856} {"train_loss": -6.573742866516113, "global_step": 119958, "epoch": 2856} {"train_loss": -6.501719951629639, "global_step": 119959, "epoch": 2856} {"train_loss": -6.4533796310424805, "global_step": 119960, "epoch": 2856} {"train_loss": -6.630817890167236, "global_step": 119961, "epoch": 2856} {"train_loss": -6.501861095428467, "global_step": 119962, "epoch": 2856} {"train_loss": -6.52655029296875, "global_step": 119963, "epoch": 2856} {"train_loss": -6.684723854064941, "global_step": 119964, "epoch": 2856} {"train_loss": -6.504538536071777, "global_step": 119965, "epoch": 2856} {"train_loss": -6.512995719909668, "global_step": 119966, "epoch": 2856} {"train_loss": -6.53569221496582, "global_step": 119967, "epoch": 2856} {"train_loss": -6.519427299499512, "global_step": 119968, "epoch": 2856} {"train_loss": -6.643461227416992, "global_step": 119969, "epoch": 2856} {"train_loss": -6.65501594543457, "global_step": 119970, "epoch": 2856} {"train_loss": -6.618585109710693, "global_step": 119971, "epoch": 2856} {"train_loss": -6.573696136474609, "global_step": 119972, "epoch": 2856} {"train_loss": -6.552829742431641, "global_step": 119973, "epoch": 2856} {"train_loss": -6.535629749298096, "global_step": 119974, "epoch": 2856} {"train_loss": -6.48342227935791, "global_step": 119975, "epoch": 2856} {"train_loss": -6.63126277923584, "global_step": 119976, "epoch": 2856} {"train_loss": -6.608447074890137, "global_step": 119977, "epoch": 2856} {"train_loss": -6.463439464569092, "global_step": 119978, "epoch": 2856} {"train_loss": -6.660449028015137, "global_step": 119979, "epoch": 2856} {"train_loss": -6.642299652099609, "global_step": 119980, "epoch": 2856} {"train_loss": -6.620107650756836, "global_step": 119981, "epoch": 2856} {"train_loss": -6.555241584777832, "global_step": 119982, "epoch": 2856} {"train_loss": -6.537012100219727, "global_step": 119983, "epoch": 2856} {"train_loss": -6.411866188049316, "global_step": 119984, "epoch": 2856} {"train_loss": -6.511601448059082, "global_step": 119985, "epoch": 2856} {"train_loss": -6.446139335632324, "global_step": 119986, "epoch": 2856} {"train_loss": -6.527448654174805, "global_step": 119987, "epoch": 2856} {"train_loss": -6.53281307220459, "global_step": 119988, "epoch": 2856} {"train_loss": -6.434670448303223, "global_step": 119989, "epoch": 2856} {"train_loss": -6.5452165603637695, "global_step": 119990, "epoch": 2856} {"train_loss": -6.460524559020996, "global_step": 119991, "epoch": 2856} {"train_loss": -6.518517971038818, "global_step": 119992, "epoch": 2856} {"train_loss": -6.5363370804559615, "global_step": 119993, "epoch": 2856, "val_loss": 65797.21875} {"train_loss": -6.5118255615234375, "global_step": 119994, "epoch": 2857} {"train_loss": -6.587216377258301, "global_step": 119995, "epoch": 2857} {"train_loss": -6.443289756774902, "global_step": 119996, "epoch": 2857} {"train_loss": -6.513289928436279, "global_step": 119997, "epoch": 2857} {"train_loss": -6.610340595245361, "global_step": 119998, "epoch": 2857} {"train_loss": -6.5803680419921875, "global_step": 119999, "epoch": 2857} {"train_loss": -6.553562164306641, "global_step": 120000, "epoch": 2857} {"train_loss": -6.516530513763428, "global_step": 120001, "epoch": 2857} {"train_loss": -6.548157691955566, "global_step": 120002, "epoch": 2857} {"train_loss": -6.545013904571533, "global_step": 120003, "epoch": 2857} {"train_loss": -6.575711250305176, "global_step": 120004, "epoch": 2857} {"train_loss": -6.427051544189453, "global_step": 120005, "epoch": 2857} {"train_loss": -6.483040809631348, "global_step": 120006, "epoch": 2857} {"train_loss": -6.5410051345825195, "global_step": 120007, "epoch": 2857} {"train_loss": -6.441192626953125, "global_step": 120008, "epoch": 2857} {"train_loss": -6.618480205535889, "global_step": 120009, "epoch": 2857} {"train_loss": -6.523222923278809, "global_step": 120010, "epoch": 2857} {"train_loss": -6.5994696617126465, "global_step": 120011, "epoch": 2857} {"train_loss": -6.585296630859375, "global_step": 120012, "epoch": 2857} {"train_loss": -6.5264458656311035, "global_step": 120013, "epoch": 2857} {"train_loss": -6.538782119750977, "global_step": 120014, "epoch": 2857} {"train_loss": -6.5315046310424805, "global_step": 120015, "epoch": 2857} {"train_loss": -6.516352653503418, "global_step": 120016, "epoch": 2857} {"train_loss": -6.548238754272461, "global_step": 120017, "epoch": 2857} {"train_loss": -6.654841899871826, "global_step": 120018, "epoch": 2857} {"train_loss": -6.53754997253418, "global_step": 120019, "epoch": 2857} {"train_loss": -6.557369709014893, "global_step": 120020, "epoch": 2857} {"train_loss": -6.552915573120117, "global_step": 120021, "epoch": 2857} {"train_loss": -6.604621887207031, "global_step": 120022, "epoch": 2857} {"train_loss": -6.538881301879883, "global_step": 120023, "epoch": 2857} {"train_loss": -6.484262943267822, "global_step": 120024, "epoch": 2857} {"train_loss": -6.462137699127197, "global_step": 120025, "epoch": 2857} {"train_loss": -6.49844217300415, "global_step": 120026, "epoch": 2857} {"train_loss": -6.5815300941467285, "global_step": 120027, "epoch": 2857} {"train_loss": -6.5501275062561035, "global_step": 120028, "epoch": 2857} {"train_loss": -6.575286865234375, "global_step": 120029, "epoch": 2857} {"train_loss": -6.502617359161377, "global_step": 120030, "epoch": 2857} {"train_loss": -6.5869340896606445, "global_step": 120031, "epoch": 2857} {"train_loss": -6.482607841491699, "global_step": 120032, "epoch": 2857} {"train_loss": -6.560347080230713, "global_step": 120033, "epoch": 2857} {"train_loss": -6.609951019287109, "global_step": 120034, "epoch": 2857} {"train_loss": -6.540464923495338, "global_step": 120035, "epoch": 2857, "val_loss": 65913.609375} {"train_loss": -6.582324981689453, "global_step": 120036, "epoch": 2858} {"train_loss": -6.538969039916992, "global_step": 120037, "epoch": 2858} {"train_loss": -6.547816276550293, "global_step": 120038, "epoch": 2858} {"train_loss": -6.623699188232422, "global_step": 120039, "epoch": 2858} {"train_loss": -6.430579662322998, "global_step": 120040, "epoch": 2858} {"train_loss": -6.398294448852539, "global_step": 120041, "epoch": 2858} {"train_loss": -6.587385177612305, "global_step": 120042, "epoch": 2858} {"train_loss": -6.544367790222168, "global_step": 120043, "epoch": 2858} {"train_loss": -6.46292781829834, "global_step": 120044, "epoch": 2858} {"train_loss": -6.604563236236572, "global_step": 120045, "epoch": 2858} {"train_loss": -6.677469253540039, "global_step": 120046, "epoch": 2858} {"train_loss": -6.626354217529297, "global_step": 120047, "epoch": 2858} {"train_loss": -6.560457229614258, "global_step": 120048, "epoch": 2858} {"train_loss": -6.581172943115234, "global_step": 120049, "epoch": 2858} {"train_loss": -6.526727676391602, "global_step": 120050, "epoch": 2858} {"train_loss": -6.629298210144043, "global_step": 120051, "epoch": 2858} {"train_loss": -6.610456943511963, "global_step": 120052, "epoch": 2858} {"train_loss": -6.561878681182861, "global_step": 120053, "epoch": 2858} {"train_loss": -6.665249824523926, "global_step": 120054, "epoch": 2858} {"train_loss": -6.630711555480957, "global_step": 120055, "epoch": 2858} {"train_loss": -6.610705375671387, "global_step": 120056, "epoch": 2858} {"train_loss": -6.595898628234863, "global_step": 120057, "epoch": 2858} {"train_loss": -6.679340362548828, "global_step": 120058, "epoch": 2858} {"train_loss": -6.610321044921875, "global_step": 120059, "epoch": 2858} {"train_loss": -6.556108474731445, "global_step": 120060, "epoch": 2858} {"train_loss": -6.6076579093933105, "global_step": 120061, "epoch": 2858} {"train_loss": -6.479219436645508, "global_step": 120062, "epoch": 2858} {"train_loss": -6.578184604644775, "global_step": 120063, "epoch": 2858} {"train_loss": -6.475452423095703, "global_step": 120064, "epoch": 2858} {"train_loss": -6.553210735321045, "global_step": 120065, "epoch": 2858} {"train_loss": -6.627881050109863, "global_step": 120066, "epoch": 2858} {"train_loss": -6.572249412536621, "global_step": 120067, "epoch": 2858} {"train_loss": -6.628808975219727, "global_step": 120068, "epoch": 2858} {"train_loss": -6.664770126342773, "global_step": 120069, "epoch": 2858} {"train_loss": -6.525888442993164, "global_step": 120070, "epoch": 2858} {"train_loss": -6.533323287963867, "global_step": 120071, "epoch": 2858} {"train_loss": -6.6845011711120605, "global_step": 120072, "epoch": 2858} {"train_loss": -6.5941162109375, "global_step": 120073, "epoch": 2858} {"train_loss": -6.5654802322387695, "global_step": 120074, "epoch": 2858} {"train_loss": -6.616831302642822, "global_step": 120075, "epoch": 2858} {"train_loss": -6.543231964111328, "global_step": 120076, "epoch": 2858} {"train_loss": -6.575913735798427, "global_step": 120077, "epoch": 2858, "val_loss": 65663.8359375} {"train_loss": -6.543835639953613, "global_step": 120078, "epoch": 2859} {"train_loss": -6.672930717468262, "global_step": 120079, "epoch": 2859} {"train_loss": -6.626660346984863, "global_step": 120080, "epoch": 2859} {"train_loss": -6.614768981933594, "global_step": 120081, "epoch": 2859} {"train_loss": -6.574637413024902, "global_step": 120082, "epoch": 2859} {"train_loss": -6.596253395080566, "global_step": 120083, "epoch": 2859} {"train_loss": -6.604218482971191, "global_step": 120084, "epoch": 2859} {"train_loss": -6.622272491455078, "global_step": 120085, "epoch": 2859} {"train_loss": -6.537727355957031, "global_step": 120086, "epoch": 2859} {"train_loss": -6.636482238769531, "global_step": 120087, "epoch": 2859} {"train_loss": -6.671852111816406, "global_step": 120088, "epoch": 2859} {"train_loss": -6.578824996948242, "global_step": 120089, "epoch": 2859} {"train_loss": -6.611724853515625, "global_step": 120090, "epoch": 2859} {"train_loss": -6.545878887176514, "global_step": 120091, "epoch": 2859} {"train_loss": -6.633307456970215, "global_step": 120092, "epoch": 2859} {"train_loss": -6.645111083984375, "global_step": 120093, "epoch": 2859} {"train_loss": -6.486686706542969, "global_step": 120094, "epoch": 2859} {"train_loss": -6.691866874694824, "global_step": 120095, "epoch": 2859} {"train_loss": -6.554288864135742, "global_step": 120096, "epoch": 2859} {"train_loss": -6.6884260177612305, "global_step": 120097, "epoch": 2859} {"train_loss": -6.736924171447754, "global_step": 120098, "epoch": 2859} {"train_loss": -6.633534908294678, "global_step": 120099, "epoch": 2859} {"train_loss": -6.544539451599121, "global_step": 120100, "epoch": 2859} {"train_loss": -6.5911359786987305, "global_step": 120101, "epoch": 2859} {"train_loss": -6.616341590881348, "global_step": 120102, "epoch": 2859} {"train_loss": -6.679577827453613, "global_step": 120103, "epoch": 2859} {"train_loss": -6.585235595703125, "global_step": 120104, "epoch": 2859} {"train_loss": -6.502910137176514, "global_step": 120105, "epoch": 2859} {"train_loss": -6.563441753387451, "global_step": 120106, "epoch": 2859} {"train_loss": -6.575847625732422, "global_step": 120107, "epoch": 2859} {"train_loss": -6.5262579917907715, "global_step": 120108, "epoch": 2859} {"train_loss": -6.564497947692871, "global_step": 120109, "epoch": 2859} {"train_loss": -6.562323570251465, "global_step": 120110, "epoch": 2859} {"train_loss": -6.45941162109375, "global_step": 120111, "epoch": 2859} {"train_loss": -6.5517578125, "global_step": 120112, "epoch": 2859} {"train_loss": -6.6164116859436035, "global_step": 120113, "epoch": 2859} {"train_loss": -6.5323357582092285, "global_step": 120114, "epoch": 2859} {"train_loss": -6.5189666748046875, "global_step": 120115, "epoch": 2859} {"train_loss": -6.594467639923096, "global_step": 120116, "epoch": 2859} {"train_loss": -6.605788230895996, "global_step": 120117, "epoch": 2859} {"train_loss": -6.634566307067871, "global_step": 120118, "epoch": 2859} {"train_loss": -6.594281559898739, "global_step": 120119, "epoch": 2859, "val_loss": 65760.40625} {"train_loss": -6.583775520324707, "global_step": 120120, "epoch": 2860} {"train_loss": -6.564361095428467, "global_step": 120121, "epoch": 2860} {"train_loss": -6.591059684753418, "global_step": 120122, "epoch": 2860} {"train_loss": -6.576934337615967, "global_step": 120123, "epoch": 2860} {"train_loss": -6.5425190925598145, "global_step": 120124, "epoch": 2860} {"train_loss": -6.530132293701172, "global_step": 120125, "epoch": 2860} {"train_loss": -6.544288635253906, "global_step": 120126, "epoch": 2860} {"train_loss": -6.493383884429932, "global_step": 120127, "epoch": 2860} {"train_loss": -6.553627967834473, "global_step": 120128, "epoch": 2860} {"train_loss": -6.619636535644531, "global_step": 120129, "epoch": 2860} {"train_loss": -6.616828918457031, "global_step": 120130, "epoch": 2860} {"train_loss": -6.521323204040527, "global_step": 120131, "epoch": 2860} {"train_loss": -6.613364219665527, "global_step": 120132, "epoch": 2860} {"train_loss": -6.767129898071289, "global_step": 120133, "epoch": 2860} {"train_loss": -6.595638275146484, "global_step": 120134, "epoch": 2860} {"train_loss": -6.575255870819092, "global_step": 120135, "epoch": 2860} {"train_loss": -6.621422290802002, "global_step": 120136, "epoch": 2860} {"train_loss": -6.566367149353027, "global_step": 120137, "epoch": 2860} {"train_loss": -6.595698356628418, "global_step": 120138, "epoch": 2860} {"train_loss": -6.571694850921631, "global_step": 120139, "epoch": 2860} {"train_loss": -6.595303535461426, "global_step": 120140, "epoch": 2860} {"train_loss": -6.427257061004639, "global_step": 120141, "epoch": 2860} {"train_loss": -6.505410671234131, "global_step": 120142, "epoch": 2860} {"train_loss": -6.602024555206299, "global_step": 120143, "epoch": 2860} {"train_loss": -6.555182933807373, "global_step": 120144, "epoch": 2860} {"train_loss": -6.642114639282227, "global_step": 120145, "epoch": 2860} {"train_loss": -6.630666732788086, "global_step": 120146, "epoch": 2860} {"train_loss": -6.658010005950928, "global_step": 120147, "epoch": 2860} {"train_loss": -6.56851053237915, "global_step": 120148, "epoch": 2860} {"train_loss": -6.742931842803955, "global_step": 120149, "epoch": 2860} {"train_loss": -6.5055646896362305, "global_step": 120150, "epoch": 2860} {"train_loss": -6.5348405838012695, "global_step": 120151, "epoch": 2860} {"train_loss": -6.445659637451172, "global_step": 120152, "epoch": 2860} {"train_loss": -6.534675598144531, "global_step": 120153, "epoch": 2860} {"train_loss": -6.576708793640137, "global_step": 120154, "epoch": 2860} {"train_loss": -6.487900733947754, "global_step": 120155, "epoch": 2860} {"train_loss": -6.676883697509766, "global_step": 120156, "epoch": 2860} {"train_loss": -6.596863746643066, "global_step": 120157, "epoch": 2860} {"train_loss": -6.585964202880859, "global_step": 120158, "epoch": 2860} {"train_loss": -6.441157341003418, "global_step": 120159, "epoch": 2860} {"train_loss": -6.615609169006348, "global_step": 120160, "epoch": 2860} {"train_loss": -6.572895981016613, "global_step": 120161, "epoch": 2860, "val_loss": 65806.546875} {"train_loss": -6.512475490570068, "global_step": 120162, "epoch": 2861} {"train_loss": -6.613186836242676, "global_step": 120163, "epoch": 2861} {"train_loss": -6.479547500610352, "global_step": 120164, "epoch": 2861} {"train_loss": -6.663599967956543, "global_step": 120165, "epoch": 2861} {"train_loss": -6.582719326019287, "global_step": 120166, "epoch": 2861} {"train_loss": -6.61549186706543, "global_step": 120167, "epoch": 2861} {"train_loss": -6.606892108917236, "global_step": 120168, "epoch": 2861} {"train_loss": -6.6035356521606445, "global_step": 120169, "epoch": 2861} {"train_loss": -6.628591060638428, "global_step": 120170, "epoch": 2861} {"train_loss": -6.528082847595215, "global_step": 120171, "epoch": 2861} {"train_loss": -6.590826988220215, "global_step": 120172, "epoch": 2861} {"train_loss": -6.528648376464844, "global_step": 120173, "epoch": 2861} {"train_loss": -6.633145809173584, "global_step": 120174, "epoch": 2861} {"train_loss": -6.536486625671387, "global_step": 120175, "epoch": 2861} {"train_loss": -6.517766952514648, "global_step": 120176, "epoch": 2861} {"train_loss": -6.575780868530273, "global_step": 120177, "epoch": 2861} {"train_loss": -6.6103363037109375, "global_step": 120178, "epoch": 2861} {"train_loss": -6.536927700042725, "global_step": 120179, "epoch": 2861} {"train_loss": -6.6739115715026855, "global_step": 120180, "epoch": 2861} {"train_loss": -6.63279390335083, "global_step": 120181, "epoch": 2861} {"train_loss": -6.449073314666748, "global_step": 120182, "epoch": 2861} {"train_loss": -6.662263870239258, "global_step": 120183, "epoch": 2861} {"train_loss": -6.529239654541016, "global_step": 120184, "epoch": 2861} {"train_loss": -6.56785774230957, "global_step": 120185, "epoch": 2861} {"train_loss": -6.506185531616211, "global_step": 120186, "epoch": 2861} {"train_loss": -6.475543975830078, "global_step": 120187, "epoch": 2861} {"train_loss": -6.588543891906738, "global_step": 120188, "epoch": 2861} {"train_loss": -6.39306640625, "global_step": 120189, "epoch": 2861} {"train_loss": -6.4410786628723145, "global_step": 120190, "epoch": 2861} {"train_loss": -6.560387134552002, "global_step": 120191, "epoch": 2861} {"train_loss": -6.6088714599609375, "global_step": 120192, "epoch": 2861} {"train_loss": -6.46109676361084, "global_step": 120193, "epoch": 2861} {"train_loss": -6.5358500480651855, "global_step": 120194, "epoch": 2861} {"train_loss": -6.5334672927856445, "global_step": 120195, "epoch": 2861} {"train_loss": -6.464735984802246, "global_step": 120196, "epoch": 2861} {"train_loss": -6.472683906555176, "global_step": 120197, "epoch": 2861} {"train_loss": -6.4988226890563965, "global_step": 120198, "epoch": 2861} {"train_loss": -6.52275276184082, "global_step": 120199, "epoch": 2861} {"train_loss": -6.573465347290039, "global_step": 120200, "epoch": 2861} {"train_loss": -6.49976921081543, "global_step": 120201, "epoch": 2861} {"train_loss": -6.554035186767578, "global_step": 120202, "epoch": 2861} {"train_loss": -6.54952757699149, "global_step": 120203, "epoch": 2861, "val_loss": 65790.1015625} {"train_loss": -6.52772331237793, "global_step": 120204, "epoch": 2862} {"train_loss": -6.54216194152832, "global_step": 120205, "epoch": 2862} {"train_loss": -6.585655212402344, "global_step": 120206, "epoch": 2862} {"train_loss": -6.430093765258789, "global_step": 120207, "epoch": 2862} {"train_loss": -6.638091087341309, "global_step": 120208, "epoch": 2862} {"train_loss": -6.452145576477051, "global_step": 120209, "epoch": 2862} {"train_loss": -6.475220680236816, "global_step": 120210, "epoch": 2862} {"train_loss": -6.465657711029053, "global_step": 120211, "epoch": 2862} {"train_loss": -6.5004987716674805, "global_step": 120212, "epoch": 2862} {"train_loss": -6.553714752197266, "global_step": 120213, "epoch": 2862} {"train_loss": -6.535019874572754, "global_step": 120214, "epoch": 2862} {"train_loss": -6.345935821533203, "global_step": 120215, "epoch": 2862} {"train_loss": -6.609933376312256, "global_step": 120216, "epoch": 2862} {"train_loss": -6.445016860961914, "global_step": 120217, "epoch": 2862} {"train_loss": -6.520164489746094, "global_step": 120218, "epoch": 2862} {"train_loss": -6.595379829406738, "global_step": 120219, "epoch": 2862} {"train_loss": -6.614141464233398, "global_step": 120220, "epoch": 2862} {"train_loss": -6.663704872131348, "global_step": 120221, "epoch": 2862} {"train_loss": -6.465124607086182, "global_step": 120222, "epoch": 2862} {"train_loss": -6.467113971710205, "global_step": 120223, "epoch": 2862} {"train_loss": -6.530898094177246, "global_step": 120224, "epoch": 2862} {"train_loss": -6.405139446258545, "global_step": 120225, "epoch": 2862} {"train_loss": -6.574158668518066, "global_step": 120226, "epoch": 2862} {"train_loss": -6.5263495445251465, "global_step": 120227, "epoch": 2862} {"train_loss": -6.446147441864014, "global_step": 120228, "epoch": 2862} {"train_loss": -6.417667865753174, "global_step": 120229, "epoch": 2862} {"train_loss": -6.5585432052612305, "global_step": 120230, "epoch": 2862} {"train_loss": -6.544839859008789, "global_step": 120231, "epoch": 2862} {"train_loss": -6.542328834533691, "global_step": 120232, "epoch": 2862} {"train_loss": -6.575778007507324, "global_step": 120233, "epoch": 2862} {"train_loss": -6.587132453918457, "global_step": 120234, "epoch": 2862} {"train_loss": -6.538477897644043, "global_step": 120235, "epoch": 2862} {"train_loss": -6.532140254974365, "global_step": 120236, "epoch": 2862} {"train_loss": -6.562587738037109, "global_step": 120237, "epoch": 2862} {"train_loss": -6.586188316345215, "global_step": 120238, "epoch": 2862} {"train_loss": -6.555305004119873, "global_step": 120239, "epoch": 2862} {"train_loss": -6.718360424041748, "global_step": 120240, "epoch": 2862} {"train_loss": -6.565429210662842, "global_step": 120241, "epoch": 2862} {"train_loss": -6.4822235107421875, "global_step": 120242, "epoch": 2862} {"train_loss": -6.527753829956055, "global_step": 120243, "epoch": 2862} {"train_loss": -6.542242050170898, "global_step": 120244, "epoch": 2862} {"train_loss": -6.532444794972737, "global_step": 120245, "epoch": 2862, "val_loss": 65747.3359375} {"train_loss": -6.6329731941223145, "global_step": 120246, "epoch": 2863} {"train_loss": -6.59417200088501, "global_step": 120247, "epoch": 2863} {"train_loss": -6.465794563293457, "global_step": 120248, "epoch": 2863} {"train_loss": -6.531110763549805, "global_step": 120249, "epoch": 2863} {"train_loss": -6.536137580871582, "global_step": 120250, "epoch": 2863} {"train_loss": -6.608321189880371, "global_step": 120251, "epoch": 2863} {"train_loss": -6.541865348815918, "global_step": 120252, "epoch": 2863} {"train_loss": -6.578612327575684, "global_step": 120253, "epoch": 2863} {"train_loss": -6.593296527862549, "global_step": 120254, "epoch": 2863} {"train_loss": -6.53553581237793, "global_step": 120255, "epoch": 2863} {"train_loss": -6.616674900054932, "global_step": 120256, "epoch": 2863} {"train_loss": -6.615274429321289, "global_step": 120257, "epoch": 2863} {"train_loss": -6.57211971282959, "global_step": 120258, "epoch": 2863} {"train_loss": -6.687068939208984, "global_step": 120259, "epoch": 2863} {"train_loss": -6.536926746368408, "global_step": 120260, "epoch": 2863} {"train_loss": -6.570829391479492, "global_step": 120261, "epoch": 2863} {"train_loss": -6.5568013191223145, "global_step": 120262, "epoch": 2863} {"train_loss": -6.657881736755371, "global_step": 120263, "epoch": 2863} {"train_loss": -6.577579975128174, "global_step": 120264, "epoch": 2863} {"train_loss": -6.680112838745117, "global_step": 120265, "epoch": 2863} {"train_loss": -6.644102096557617, "global_step": 120266, "epoch": 2863} {"train_loss": -6.624403953552246, "global_step": 120267, "epoch": 2863} {"train_loss": -6.677064895629883, "global_step": 120268, "epoch": 2863} {"train_loss": -6.6203718185424805, "global_step": 120269, "epoch": 2863} {"train_loss": -6.578556537628174, "global_step": 120270, "epoch": 2863} {"train_loss": -6.643959045410156, "global_step": 120271, "epoch": 2863} {"train_loss": -6.5926289558410645, "global_step": 120272, "epoch": 2863} {"train_loss": -6.574498653411865, "global_step": 120273, "epoch": 2863} {"train_loss": -6.634681701660156, "global_step": 120274, "epoch": 2863} {"train_loss": -6.508085250854492, "global_step": 120275, "epoch": 2863} {"train_loss": -6.643828392028809, "global_step": 120276, "epoch": 2863} {"train_loss": -6.5512518882751465, "global_step": 120277, "epoch": 2863} {"train_loss": -6.483936309814453, "global_step": 120278, "epoch": 2863} {"train_loss": -6.54445743560791, "global_step": 120279, "epoch": 2863} {"train_loss": -6.658975601196289, "global_step": 120280, "epoch": 2863} {"train_loss": -6.518949508666992, "global_step": 120281, "epoch": 2863} {"train_loss": -6.474099159240723, "global_step": 120282, "epoch": 2863} {"train_loss": -6.591434478759766, "global_step": 120283, "epoch": 2863} {"train_loss": -6.49596643447876, "global_step": 120284, "epoch": 2863} {"train_loss": -6.4496965408325195, "global_step": 120285, "epoch": 2863} {"train_loss": -6.549759864807129, "global_step": 120286, "epoch": 2863} {"train_loss": -6.5767863137381415, "global_step": 120287, "epoch": 2863, "val_loss": 65705.328125} {"train_loss": -6.462220191955566, "global_step": 120288, "epoch": 2864} {"train_loss": -6.605680465698242, "global_step": 120289, "epoch": 2864} {"train_loss": -6.532510757446289, "global_step": 120290, "epoch": 2864} {"train_loss": -6.711681842803955, "global_step": 120291, "epoch": 2864} {"train_loss": -6.622174263000488, "global_step": 120292, "epoch": 2864} {"train_loss": -6.55307674407959, "global_step": 120293, "epoch": 2864} {"train_loss": -6.552362442016602, "global_step": 120294, "epoch": 2864} {"train_loss": -6.638601303100586, "global_step": 120295, "epoch": 2864} {"train_loss": -6.606563091278076, "global_step": 120296, "epoch": 2864} {"train_loss": -6.607175827026367, "global_step": 120297, "epoch": 2864} {"train_loss": -6.553275108337402, "global_step": 120298, "epoch": 2864} {"train_loss": -6.44077205657959, "global_step": 120299, "epoch": 2864} {"train_loss": -6.619241714477539, "global_step": 120300, "epoch": 2864} {"train_loss": -6.537935256958008, "global_step": 120301, "epoch": 2864} {"train_loss": -6.615339279174805, "global_step": 120302, "epoch": 2864} {"train_loss": -6.633922576904297, "global_step": 120303, "epoch": 2864} {"train_loss": -6.594742298126221, "global_step": 120304, "epoch": 2864} {"train_loss": -6.666234016418457, "global_step": 120305, "epoch": 2864} {"train_loss": -6.63425350189209, "global_step": 120306, "epoch": 2864} {"train_loss": -6.638574600219727, "global_step": 120307, "epoch": 2864} {"train_loss": -6.633622169494629, "global_step": 120308, "epoch": 2864} {"train_loss": -6.532562732696533, "global_step": 120309, "epoch": 2864} {"train_loss": -6.578773498535156, "global_step": 120310, "epoch": 2864} {"train_loss": -6.6544575691223145, "global_step": 120311, "epoch": 2864} {"train_loss": -6.577321529388428, "global_step": 120312, "epoch": 2864} {"train_loss": -6.674038410186768, "global_step": 120313, "epoch": 2864} {"train_loss": -6.513620376586914, "global_step": 120314, "epoch": 2864} {"train_loss": -6.59138298034668, "global_step": 120315, "epoch": 2864} {"train_loss": -6.57465934753418, "global_step": 120316, "epoch": 2864} {"train_loss": -6.607583522796631, "global_step": 120317, "epoch": 2864} {"train_loss": -6.533504486083984, "global_step": 120318, "epoch": 2864} {"train_loss": -6.569108009338379, "global_step": 120319, "epoch": 2864} {"train_loss": -6.406487464904785, "global_step": 120320, "epoch": 2864} {"train_loss": -6.5725507736206055, "global_step": 120321, "epoch": 2864} {"train_loss": -6.459012031555176, "global_step": 120322, "epoch": 2864} {"train_loss": -6.412191390991211, "global_step": 120323, "epoch": 2864} {"train_loss": -6.467700004577637, "global_step": 120324, "epoch": 2864} {"train_loss": -6.551599502563477, "global_step": 120325, "epoch": 2864} {"train_loss": -6.557164192199707, "global_step": 120326, "epoch": 2864} {"train_loss": -6.525759220123291, "global_step": 120327, "epoch": 2864} {"train_loss": -6.393735408782959, "global_step": 120328, "epoch": 2864} {"train_loss": -6.566820814495995, "global_step": 120329, "epoch": 2864, "val_loss": 66103.34375} {"train_loss": -6.435345649719238, "global_step": 120330, "epoch": 2865} {"train_loss": -6.552060127258301, "global_step": 120331, "epoch": 2865} {"train_loss": -6.553913116455078, "global_step": 120332, "epoch": 2865} {"train_loss": -6.440273761749268, "global_step": 120333, "epoch": 2865} {"train_loss": -6.532652854919434, "global_step": 120334, "epoch": 2865} {"train_loss": -6.361977577209473, "global_step": 120335, "epoch": 2865} {"train_loss": -6.479351997375488, "global_step": 120336, "epoch": 2865} {"train_loss": -6.50361442565918, "global_step": 120337, "epoch": 2865} {"train_loss": -6.610431671142578, "global_step": 120338, "epoch": 2865} {"train_loss": -6.589089393615723, "global_step": 120339, "epoch": 2865} {"train_loss": -6.526244640350342, "global_step": 120340, "epoch": 2865} {"train_loss": -6.509188175201416, "global_step": 120341, "epoch": 2865} {"train_loss": -6.650243759155273, "global_step": 120342, "epoch": 2865} {"train_loss": -6.540384769439697, "global_step": 120343, "epoch": 2865} {"train_loss": -6.658588409423828, "global_step": 120344, "epoch": 2865} {"train_loss": -6.5837297439575195, "global_step": 120345, "epoch": 2865} {"train_loss": -6.574484825134277, "global_step": 120346, "epoch": 2865} {"train_loss": -6.701958179473877, "global_step": 120347, "epoch": 2865} {"train_loss": -6.609265327453613, "global_step": 120348, "epoch": 2865} {"train_loss": -6.563752174377441, "global_step": 120349, "epoch": 2865} {"train_loss": -6.610418796539307, "global_step": 120350, "epoch": 2865} {"train_loss": -6.499674320220947, "global_step": 120351, "epoch": 2865} {"train_loss": -6.5762810707092285, "global_step": 120352, "epoch": 2865} {"train_loss": -6.4865007400512695, "global_step": 120353, "epoch": 2865} {"train_loss": -6.517076015472412, "global_step": 120354, "epoch": 2865} {"train_loss": -6.538112163543701, "global_step": 120355, "epoch": 2865} {"train_loss": -6.651853561401367, "global_step": 120356, "epoch": 2865} {"train_loss": -6.511370658874512, "global_step": 120357, "epoch": 2865} {"train_loss": -6.517439842224121, "global_step": 120358, "epoch": 2865} {"train_loss": -6.650650501251221, "global_step": 120359, "epoch": 2865} {"train_loss": -6.560988426208496, "global_step": 120360, "epoch": 2865} {"train_loss": -6.535094261169434, "global_step": 120361, "epoch": 2865} {"train_loss": -6.6339216232299805, "global_step": 120362, "epoch": 2865} {"train_loss": -6.685784339904785, "global_step": 120363, "epoch": 2865} {"train_loss": -6.563187599182129, "global_step": 120364, "epoch": 2865} {"train_loss": -6.469134330749512, "global_step": 120365, "epoch": 2865} {"train_loss": -6.566949844360352, "global_step": 120366, "epoch": 2865} {"train_loss": -6.5434770584106445, "global_step": 120367, "epoch": 2865} {"train_loss": -6.643304347991943, "global_step": 120368, "epoch": 2865} {"train_loss": -6.589087963104248, "global_step": 120369, "epoch": 2865} {"train_loss": -6.577119827270508, "global_step": 120370, "epoch": 2865} {"train_loss": -6.55985537029448, "global_step": 120371, "epoch": 2865, "val_loss": 65718.7109375} {"train_loss": -6.60249137878418, "global_step": 120372, "epoch": 2866} {"train_loss": -6.6019182205200195, "global_step": 120373, "epoch": 2866} {"train_loss": -6.553514003753662, "global_step": 120374, "epoch": 2866} {"train_loss": -6.508914947509766, "global_step": 120375, "epoch": 2866} {"train_loss": -6.634703636169434, "global_step": 120376, "epoch": 2866} {"train_loss": -6.5837626457214355, "global_step": 120377, "epoch": 2866} {"train_loss": -6.656550407409668, "global_step": 120378, "epoch": 2866} {"train_loss": -6.6682586669921875, "global_step": 120379, "epoch": 2866} {"train_loss": -6.607207298278809, "global_step": 120380, "epoch": 2866} {"train_loss": -6.494205951690674, "global_step": 120381, "epoch": 2866} {"train_loss": -6.618967056274414, "global_step": 120382, "epoch": 2866} {"train_loss": -6.636927604675293, "global_step": 120383, "epoch": 2866} {"train_loss": -6.693533897399902, "global_step": 120384, "epoch": 2866} {"train_loss": -6.608086585998535, "global_step": 120385, "epoch": 2866} {"train_loss": -6.672220706939697, "global_step": 120386, "epoch": 2866} {"train_loss": -6.672869682312012, "global_step": 120387, "epoch": 2866} {"train_loss": -6.666333198547363, "global_step": 120388, "epoch": 2866} {"train_loss": -6.574536323547363, "global_step": 120389, "epoch": 2866} {"train_loss": -6.627653121948242, "global_step": 120390, "epoch": 2866} {"train_loss": -6.693127155303955, "global_step": 120391, "epoch": 2866} {"train_loss": -6.696916580200195, "global_step": 120392, "epoch": 2866} {"train_loss": -6.583918571472168, "global_step": 120393, "epoch": 2866} {"train_loss": -6.688052654266357, "global_step": 120394, "epoch": 2866} {"train_loss": -6.639637470245361, "global_step": 120395, "epoch": 2866} {"train_loss": -6.691474437713623, "global_step": 120396, "epoch": 2866} {"train_loss": -6.592704772949219, "global_step": 120397, "epoch": 2866} {"train_loss": -6.617652893066406, "global_step": 120398, "epoch": 2866} {"train_loss": -6.513293266296387, "global_step": 120399, "epoch": 2866} {"train_loss": -6.594549179077148, "global_step": 120400, "epoch": 2866} {"train_loss": -6.635649681091309, "global_step": 120401, "epoch": 2866} {"train_loss": -6.5066328048706055, "global_step": 120402, "epoch": 2866} {"train_loss": -6.511096000671387, "global_step": 120403, "epoch": 2866} {"train_loss": -6.633415222167969, "global_step": 120404, "epoch": 2866} {"train_loss": -6.647319793701172, "global_step": 120405, "epoch": 2866} {"train_loss": -6.344954490661621, "global_step": 120406, "epoch": 2866} {"train_loss": -6.603578567504883, "global_step": 120407, "epoch": 2866} {"train_loss": -6.5355682373046875, "global_step": 120408, "epoch": 2866} {"train_loss": -6.444159984588623, "global_step": 120409, "epoch": 2866} {"train_loss": -6.568991661071777, "global_step": 120410, "epoch": 2866} {"train_loss": -6.622450351715088, "global_step": 120411, "epoch": 2866} {"train_loss": -6.46713924407959, "global_step": 120412, "epoch": 2866} {"train_loss": -6.5974338962918235, "global_step": 120413, "epoch": 2866, "val_loss": 65935.2421875} {"train_loss": -6.406721115112305, "global_step": 120414, "epoch": 2867} {"train_loss": -6.502988815307617, "global_step": 120415, "epoch": 2867} {"train_loss": -6.516175746917725, "global_step": 120416, "epoch": 2867} {"train_loss": -6.592163562774658, "global_step": 120417, "epoch": 2867} {"train_loss": -6.565686225891113, "global_step": 120418, "epoch": 2867} {"train_loss": -6.467938423156738, "global_step": 120419, "epoch": 2867} {"train_loss": -6.534847259521484, "global_step": 120420, "epoch": 2867} {"train_loss": -6.5568013191223145, "global_step": 120421, "epoch": 2867} {"train_loss": -6.694184303283691, "global_step": 120422, "epoch": 2867} {"train_loss": -6.61489200592041, "global_step": 120423, "epoch": 2867} {"train_loss": -6.631583213806152, "global_step": 120424, "epoch": 2867} {"train_loss": -6.577774524688721, "global_step": 120425, "epoch": 2867} {"train_loss": -6.48018741607666, "global_step": 120426, "epoch": 2867} {"train_loss": -6.561768531799316, "global_step": 120427, "epoch": 2867} {"train_loss": -6.600482940673828, "global_step": 120428, "epoch": 2867} {"train_loss": -6.535904884338379, "global_step": 120429, "epoch": 2867} {"train_loss": -6.503106117248535, "global_step": 120430, "epoch": 2867} {"train_loss": -6.6327385902404785, "global_step": 120431, "epoch": 2867} {"train_loss": -6.5860137939453125, "global_step": 120432, "epoch": 2867} {"train_loss": -6.617162704467773, "global_step": 120433, "epoch": 2867} {"train_loss": -6.562491416931152, "global_step": 120434, "epoch": 2867} {"train_loss": -6.510540962219238, "global_step": 120435, "epoch": 2867} {"train_loss": -6.4757080078125, "global_step": 120436, "epoch": 2867} {"train_loss": -6.534418106079102, "global_step": 120437, "epoch": 2867} {"train_loss": -6.544622421264648, "global_step": 120438, "epoch": 2867} {"train_loss": -6.6411542892456055, "global_step": 120439, "epoch": 2867} {"train_loss": -6.512160301208496, "global_step": 120440, "epoch": 2867} {"train_loss": -6.610817909240723, "global_step": 120441, "epoch": 2867} {"train_loss": -6.547725677490234, "global_step": 120442, "epoch": 2867} {"train_loss": -6.5924153327941895, "global_step": 120443, "epoch": 2867} {"train_loss": -6.491025924682617, "global_step": 120444, "epoch": 2867} {"train_loss": -6.507877349853516, "global_step": 120445, "epoch": 2867} {"train_loss": -6.561678886413574, "global_step": 120446, "epoch": 2867} {"train_loss": -6.493137359619141, "global_step": 120447, "epoch": 2867} {"train_loss": -6.595412254333496, "global_step": 120448, "epoch": 2867} {"train_loss": -6.518062591552734, "global_step": 120449, "epoch": 2867} {"train_loss": -6.430742263793945, "global_step": 120450, "epoch": 2867} {"train_loss": -6.609504699707031, "global_step": 120451, "epoch": 2867} {"train_loss": -6.528748989105225, "global_step": 120452, "epoch": 2867} {"train_loss": -6.5639801025390625, "global_step": 120453, "epoch": 2867} {"train_loss": -6.563767433166504, "global_step": 120454, "epoch": 2867} {"train_loss": -6.549419902619862, "global_step": 120455, "epoch": 2867, "val_loss": 65946.4921875} {"train_loss": -6.486931800842285, "global_step": 120456, "epoch": 2868} {"train_loss": -6.710787773132324, "global_step": 120457, "epoch": 2868} {"train_loss": -6.468061447143555, "global_step": 120458, "epoch": 2868} {"train_loss": -6.527858734130859, "global_step": 120459, "epoch": 2868} {"train_loss": -6.605985641479492, "global_step": 120460, "epoch": 2868} {"train_loss": -6.638492584228516, "global_step": 120461, "epoch": 2868} {"train_loss": -6.627986907958984, "global_step": 120462, "epoch": 2868} {"train_loss": -6.562471389770508, "global_step": 120463, "epoch": 2868} {"train_loss": -6.5636067390441895, "global_step": 120464, "epoch": 2868} {"train_loss": -6.59647274017334, "global_step": 120465, "epoch": 2868} {"train_loss": -6.598904609680176, "global_step": 120466, "epoch": 2868} {"train_loss": -6.698083877563477, "global_step": 120467, "epoch": 2868} {"train_loss": -6.627294063568115, "global_step": 120468, "epoch": 2868} {"train_loss": -6.626348972320557, "global_step": 120469, "epoch": 2868} {"train_loss": -6.715246677398682, "global_step": 120470, "epoch": 2868} {"train_loss": -6.523282527923584, "global_step": 120471, "epoch": 2868} {"train_loss": -6.600860595703125, "global_step": 120472, "epoch": 2868} {"train_loss": -6.713847637176514, "global_step": 120473, "epoch": 2868} {"train_loss": -6.598701000213623, "global_step": 120474, "epoch": 2868} {"train_loss": -6.51523494720459, "global_step": 120475, "epoch": 2868} {"train_loss": -6.6068010330200195, "global_step": 120476, "epoch": 2868} {"train_loss": -6.612560749053955, "global_step": 120477, "epoch": 2868} {"train_loss": -6.445736885070801, "global_step": 120478, "epoch": 2868} {"train_loss": -6.608386039733887, "global_step": 120479, "epoch": 2868} {"train_loss": -6.5876030921936035, "global_step": 120480, "epoch": 2868} {"train_loss": -6.536203384399414, "global_step": 120481, "epoch": 2868} {"train_loss": -6.553905487060547, "global_step": 120482, "epoch": 2868} {"train_loss": -6.610366344451904, "global_step": 120483, "epoch": 2868} {"train_loss": -6.478055000305176, "global_step": 120484, "epoch": 2868} {"train_loss": -6.637718200683594, "global_step": 120485, "epoch": 2868} {"train_loss": -6.633482456207275, "global_step": 120486, "epoch": 2868} {"train_loss": -6.502414226531982, "global_step": 120487, "epoch": 2868} {"train_loss": -6.731204032897949, "global_step": 120488, "epoch": 2868} {"train_loss": -6.614476203918457, "global_step": 120489, "epoch": 2868} {"train_loss": -6.67133903503418, "global_step": 120490, "epoch": 2868} {"train_loss": -6.583768844604492, "global_step": 120491, "epoch": 2868} {"train_loss": -6.54486608505249, "global_step": 120492, "epoch": 2868} {"train_loss": -6.575656890869141, "global_step": 120493, "epoch": 2868} {"train_loss": -6.568675518035889, "global_step": 120494, "epoch": 2868} {"train_loss": -6.494148254394531, "global_step": 120495, "epoch": 2868} {"train_loss": -6.513176918029785, "global_step": 120496, "epoch": 2868} {"train_loss": -6.586348635809762, "global_step": 120497, "epoch": 2868, "val_loss": 65974.203125} {"train_loss": -6.5634284019470215, "global_step": 120498, "epoch": 2869} {"train_loss": -6.494572639465332, "global_step": 120499, "epoch": 2869} {"train_loss": -6.583837509155273, "global_step": 120500, "epoch": 2869} {"train_loss": -6.527823448181152, "global_step": 120501, "epoch": 2869} {"train_loss": -6.675710678100586, "global_step": 120502, "epoch": 2869} {"train_loss": -6.633354187011719, "global_step": 120503, "epoch": 2869} {"train_loss": -6.507983684539795, "global_step": 120504, "epoch": 2869} {"train_loss": -6.535818099975586, "global_step": 120505, "epoch": 2869} {"train_loss": -6.561319351196289, "global_step": 120506, "epoch": 2869} {"train_loss": -6.693725109100342, "global_step": 120507, "epoch": 2869} {"train_loss": -6.554566860198975, "global_step": 120508, "epoch": 2869} {"train_loss": -6.659146308898926, "global_step": 120509, "epoch": 2869} {"train_loss": -6.504788875579834, "global_step": 120510, "epoch": 2869} {"train_loss": -6.536865234375, "global_step": 120511, "epoch": 2869} {"train_loss": -6.529323577880859, "global_step": 120512, "epoch": 2869} {"train_loss": -6.610237121582031, "global_step": 120513, "epoch": 2869} {"train_loss": -6.509990215301514, "global_step": 120514, "epoch": 2869} {"train_loss": -6.613860130310059, "global_step": 120515, "epoch": 2869} {"train_loss": -6.543972969055176, "global_step": 120516, "epoch": 2869} {"train_loss": -6.529860496520996, "global_step": 120517, "epoch": 2869} {"train_loss": -6.6134209632873535, "global_step": 120518, "epoch": 2869} {"train_loss": -6.4457197189331055, "global_step": 120519, "epoch": 2869} {"train_loss": -6.512655258178711, "global_step": 120520, "epoch": 2869} {"train_loss": -6.673740386962891, "global_step": 120521, "epoch": 2869} {"train_loss": -6.4947919845581055, "global_step": 120522, "epoch": 2869} {"train_loss": -6.53653621673584, "global_step": 120523, "epoch": 2869} {"train_loss": -6.679394721984863, "global_step": 120524, "epoch": 2869} {"train_loss": -6.594916820526123, "global_step": 120525, "epoch": 2869} {"train_loss": -6.692386627197266, "global_step": 120526, "epoch": 2869} {"train_loss": -6.601712703704834, "global_step": 120527, "epoch": 2869} {"train_loss": -6.656875133514404, "global_step": 120528, "epoch": 2869} {"train_loss": -6.655768394470215, "global_step": 120529, "epoch": 2869} {"train_loss": -6.674870491027832, "global_step": 120530, "epoch": 2869} {"train_loss": -6.650467872619629, "global_step": 120531, "epoch": 2869} {"train_loss": -6.620757102966309, "global_step": 120532, "epoch": 2869} {"train_loss": -6.5248212814331055, "global_step": 120533, "epoch": 2869} {"train_loss": -6.6733198165893555, "global_step": 120534, "epoch": 2869} {"train_loss": -6.665311813354492, "global_step": 120535, "epoch": 2869} {"train_loss": -6.581251621246338, "global_step": 120536, "epoch": 2869} {"train_loss": -6.552180767059326, "global_step": 120537, "epoch": 2869} {"train_loss": -6.61055850982666, "global_step": 120538, "epoch": 2869} {"train_loss": -6.588198729923794, "global_step": 120539, "epoch": 2869, "val_loss": 65775.2578125} {"train_loss": -6.579610824584961, "global_step": 120540, "epoch": 2870} {"train_loss": -6.643782615661621, "global_step": 120541, "epoch": 2870} {"train_loss": -6.5015106201171875, "global_step": 120542, "epoch": 2870} {"train_loss": -6.438955307006836, "global_step": 120543, "epoch": 2870} {"train_loss": -6.579874515533447, "global_step": 120544, "epoch": 2870} {"train_loss": -6.581881046295166, "global_step": 120545, "epoch": 2870} {"train_loss": -6.418279647827148, "global_step": 120546, "epoch": 2870} {"train_loss": -6.576723098754883, "global_step": 120547, "epoch": 2870} {"train_loss": -6.6332807540893555, "global_step": 120548, "epoch": 2870} {"train_loss": -6.623212814331055, "global_step": 120549, "epoch": 2870} {"train_loss": -6.6701226234436035, "global_step": 120550, "epoch": 2870} {"train_loss": -6.642065048217773, "global_step": 120551, "epoch": 2870} {"train_loss": -6.605452537536621, "global_step": 120552, "epoch": 2870} {"train_loss": -6.5731964111328125, "global_step": 120553, "epoch": 2870} {"train_loss": -6.5995941162109375, "global_step": 120554, "epoch": 2870} {"train_loss": -6.6303510665893555, "global_step": 120555, "epoch": 2870} {"train_loss": -6.550355911254883, "global_step": 120556, "epoch": 2870} {"train_loss": -6.609755516052246, "global_step": 120557, "epoch": 2870} {"train_loss": -6.585681915283203, "global_step": 120558, "epoch": 2870} {"train_loss": -6.611957550048828, "global_step": 120559, "epoch": 2870} {"train_loss": -6.54123067855835, "global_step": 120560, "epoch": 2870} {"train_loss": -6.554232597351074, "global_step": 120561, "epoch": 2870} {"train_loss": -6.590981483459473, "global_step": 120562, "epoch": 2870} {"train_loss": -6.556912422180176, "global_step": 120563, "epoch": 2870} {"train_loss": -6.730505466461182, "global_step": 120564, "epoch": 2870} {"train_loss": -6.55490779876709, "global_step": 120565, "epoch": 2870} {"train_loss": -6.547248840332031, "global_step": 120566, "epoch": 2870} {"train_loss": -6.605253219604492, "global_step": 120567, "epoch": 2870} {"train_loss": -6.583676815032959, "global_step": 120568, "epoch": 2870} {"train_loss": -6.631209373474121, "global_step": 120569, "epoch": 2870} {"train_loss": -6.537946701049805, "global_step": 120570, "epoch": 2870} {"train_loss": -6.6190900802612305, "global_step": 120571, "epoch": 2870} {"train_loss": -6.520687580108643, "global_step": 120572, "epoch": 2870} {"train_loss": -6.60246467590332, "global_step": 120573, "epoch": 2870} {"train_loss": -6.602964878082275, "global_step": 120574, "epoch": 2870} {"train_loss": -6.602574825286865, "global_step": 120575, "epoch": 2870} {"train_loss": -6.629154205322266, "global_step": 120576, "epoch": 2870} {"train_loss": -6.690052032470703, "global_step": 120577, "epoch": 2870} {"train_loss": -6.48286247253418, "global_step": 120578, "epoch": 2870} {"train_loss": -6.586782455444336, "global_step": 120579, "epoch": 2870} {"train_loss": -6.637752056121826, "global_step": 120580, "epoch": 2870} {"train_loss": -6.5892628374553865, "global_step": 120581, "epoch": 2870, "val_loss": 66102.03125} {"train_loss": -6.598635673522949, "global_step": 120582, "epoch": 2871} {"train_loss": -6.59737491607666, "global_step": 120583, "epoch": 2871} {"train_loss": -6.630033493041992, "global_step": 120584, "epoch": 2871} {"train_loss": -6.588156223297119, "global_step": 120585, "epoch": 2871} {"train_loss": -6.595187187194824, "global_step": 120586, "epoch": 2871} {"train_loss": -6.5705695152282715, "global_step": 120587, "epoch": 2871} {"train_loss": -6.517589569091797, "global_step": 120588, "epoch": 2871} {"train_loss": -6.400346755981445, "global_step": 120589, "epoch": 2871} {"train_loss": -6.646273612976074, "global_step": 120590, "epoch": 2871} {"train_loss": -6.46040678024292, "global_step": 120591, "epoch": 2871} {"train_loss": -6.4743876457214355, "global_step": 120592, "epoch": 2871} {"train_loss": -6.59263277053833, "global_step": 120593, "epoch": 2871} {"train_loss": -6.669862747192383, "global_step": 120594, "epoch": 2871} {"train_loss": -6.521358013153076, "global_step": 120595, "epoch": 2871} {"train_loss": -6.650378704071045, "global_step": 120596, "epoch": 2871} {"train_loss": -6.572361946105957, "global_step": 120597, "epoch": 2871} {"train_loss": -6.493925094604492, "global_step": 120598, "epoch": 2871} {"train_loss": -6.5306854248046875, "global_step": 120599, "epoch": 2871} {"train_loss": -6.5125732421875, "global_step": 120600, "epoch": 2871} {"train_loss": -6.3961896896362305, "global_step": 120601, "epoch": 2871} {"train_loss": -6.564208030700684, "global_step": 120602, "epoch": 2871} {"train_loss": -6.4969482421875, "global_step": 120603, "epoch": 2871} {"train_loss": -6.56423807144165, "global_step": 120604, "epoch": 2871} {"train_loss": -6.588469505310059, "global_step": 120605, "epoch": 2871} {"train_loss": -6.520363807678223, "global_step": 120606, "epoch": 2871} {"train_loss": -6.648178577423096, "global_step": 120607, "epoch": 2871} {"train_loss": -6.612336158752441, "global_step": 120608, "epoch": 2871} {"train_loss": -6.6285810470581055, "global_step": 120609, "epoch": 2871} {"train_loss": -6.481534004211426, "global_step": 120610, "epoch": 2871} {"train_loss": -6.3839874267578125, "global_step": 120611, "epoch": 2871} {"train_loss": -6.483922958374023, "global_step": 120612, "epoch": 2871} {"train_loss": -6.419094085693359, "global_step": 120613, "epoch": 2871} {"train_loss": -6.636081218719482, "global_step": 120614, "epoch": 2871} {"train_loss": -6.522561073303223, "global_step": 120615, "epoch": 2871} {"train_loss": -6.419058799743652, "global_step": 120616, "epoch": 2871} {"train_loss": -6.530059337615967, "global_step": 120617, "epoch": 2871} {"train_loss": -6.463021755218506, "global_step": 120618, "epoch": 2871} {"train_loss": -6.48057222366333, "global_step": 120619, "epoch": 2871} {"train_loss": -6.481975555419922, "global_step": 120620, "epoch": 2871} {"train_loss": -6.525680065155029, "global_step": 120621, "epoch": 2871} {"train_loss": -6.6294684410095215, "global_step": 120622, "epoch": 2871} {"train_loss": -6.537207217443557, "global_step": 120623, "epoch": 2871, "val_loss": 65964.7109375} {"train_loss": -6.538785934448242, "global_step": 120624, "epoch": 2872} {"train_loss": -6.537757396697998, "global_step": 120625, "epoch": 2872} {"train_loss": -6.494574069976807, "global_step": 120626, "epoch": 2872} {"train_loss": -6.520336151123047, "global_step": 120627, "epoch": 2872} {"train_loss": -6.5437493324279785, "global_step": 120628, "epoch": 2872} {"train_loss": -6.628507614135742, "global_step": 120629, "epoch": 2872} {"train_loss": -6.541069984436035, "global_step": 120630, "epoch": 2872} {"train_loss": -6.641767501831055, "global_step": 120631, "epoch": 2872} {"train_loss": -6.573184490203857, "global_step": 120632, "epoch": 2872} {"train_loss": -6.585656642913818, "global_step": 120633, "epoch": 2872} {"train_loss": -6.615785598754883, "global_step": 120634, "epoch": 2872} {"train_loss": -6.670406818389893, "global_step": 120635, "epoch": 2872} {"train_loss": -6.662127494812012, "global_step": 120636, "epoch": 2872} {"train_loss": -6.6504621505737305, "global_step": 120637, "epoch": 2872} {"train_loss": -6.657378673553467, "global_step": 120638, "epoch": 2872} {"train_loss": -6.615329742431641, "global_step": 120639, "epoch": 2872} {"train_loss": -6.573330879211426, "global_step": 120640, "epoch": 2872} {"train_loss": -6.656280040740967, "global_step": 120641, "epoch": 2872} {"train_loss": -6.5630574226379395, "global_step": 120642, "epoch": 2872} {"train_loss": -6.671213150024414, "global_step": 120643, "epoch": 2872} {"train_loss": -6.6517791748046875, "global_step": 120644, "epoch": 2872} {"train_loss": -6.616288661956787, "global_step": 120645, "epoch": 2872} {"train_loss": -6.569425582885742, "global_step": 120646, "epoch": 2872} {"train_loss": -6.681853294372559, "global_step": 120647, "epoch": 2872} {"train_loss": -6.662136077880859, "global_step": 120648, "epoch": 2872} {"train_loss": -6.609975337982178, "global_step": 120649, "epoch": 2872} {"train_loss": -6.692825794219971, "global_step": 120650, "epoch": 2872} {"train_loss": -6.452502250671387, "global_step": 120651, "epoch": 2872} {"train_loss": -6.482503890991211, "global_step": 120652, "epoch": 2872} {"train_loss": -6.6104230880737305, "global_step": 120653, "epoch": 2872} {"train_loss": -6.531490802764893, "global_step": 120654, "epoch": 2872} {"train_loss": -6.633616924285889, "global_step": 120655, "epoch": 2872} {"train_loss": -6.768390655517578, "global_step": 120656, "epoch": 2872} {"train_loss": -6.490423679351807, "global_step": 120657, "epoch": 2872} {"train_loss": -6.558134078979492, "global_step": 120658, "epoch": 2872} {"train_loss": -6.519861221313477, "global_step": 120659, "epoch": 2872} {"train_loss": -6.5674543380737305, "global_step": 120660, "epoch": 2872} {"train_loss": -6.635354518890381, "global_step": 120661, "epoch": 2872} {"train_loss": -6.531110763549805, "global_step": 120662, "epoch": 2872} {"train_loss": -6.6072998046875, "global_step": 120663, "epoch": 2872} {"train_loss": -6.52396821975708, "global_step": 120664, "epoch": 2872} {"train_loss": -6.589476891926357, "global_step": 120665, "epoch": 2872, "val_loss": 65770.671875} {"train_loss": -6.535062789916992, "global_step": 120666, "epoch": 2873} {"train_loss": -6.650224685668945, "global_step": 120667, "epoch": 2873} {"train_loss": -6.486901760101318, "global_step": 120668, "epoch": 2873} {"train_loss": -6.6999735832214355, "global_step": 120669, "epoch": 2873} {"train_loss": -6.556901931762695, "global_step": 120670, "epoch": 2873} {"train_loss": -6.474891185760498, "global_step": 120671, "epoch": 2873} {"train_loss": -6.6614227294921875, "global_step": 120672, "epoch": 2873} {"train_loss": -6.579784393310547, "global_step": 120673, "epoch": 2873} {"train_loss": -6.560474395751953, "global_step": 120674, "epoch": 2873} {"train_loss": -6.5683746337890625, "global_step": 120675, "epoch": 2873} {"train_loss": -6.596571922302246, "global_step": 120676, "epoch": 2873} {"train_loss": -6.623054027557373, "global_step": 120677, "epoch": 2873} {"train_loss": -6.569522857666016, "global_step": 120678, "epoch": 2873} {"train_loss": -6.6392364501953125, "global_step": 120679, "epoch": 2873} {"train_loss": -6.609622001647949, "global_step": 120680, "epoch": 2873} {"train_loss": -6.556168556213379, "global_step": 120681, "epoch": 2873} {"train_loss": -6.603309154510498, "global_step": 120682, "epoch": 2873} {"train_loss": -6.471978187561035, "global_step": 120683, "epoch": 2873} {"train_loss": -6.6749677658081055, "global_step": 120684, "epoch": 2873} {"train_loss": -6.566281795501709, "global_step": 120685, "epoch": 2873} {"train_loss": -6.392908573150635, "global_step": 120686, "epoch": 2873} {"train_loss": -6.437575340270996, "global_step": 120687, "epoch": 2873} {"train_loss": -6.493077278137207, "global_step": 120688, "epoch": 2873} {"train_loss": -6.393228054046631, "global_step": 120689, "epoch": 2873} {"train_loss": -6.5715484619140625, "global_step": 120690, "epoch": 2873} {"train_loss": -6.561820983886719, "global_step": 120691, "epoch": 2873} {"train_loss": -6.546667098999023, "global_step": 120692, "epoch": 2873} {"train_loss": -6.457680702209473, "global_step": 120693, "epoch": 2873} {"train_loss": -6.455087184906006, "global_step": 120694, "epoch": 2873} {"train_loss": -6.502703666687012, "global_step": 120695, "epoch": 2873} {"train_loss": -6.537854194641113, "global_step": 120696, "epoch": 2873} {"train_loss": -6.638129234313965, "global_step": 120697, "epoch": 2873} {"train_loss": -6.562858581542969, "global_step": 120698, "epoch": 2873} {"train_loss": -6.571028709411621, "global_step": 120699, "epoch": 2873} {"train_loss": -6.568650722503662, "global_step": 120700, "epoch": 2873} {"train_loss": -6.532378673553467, "global_step": 120701, "epoch": 2873} {"train_loss": -6.509153366088867, "global_step": 120702, "epoch": 2873} {"train_loss": -6.525193691253662, "global_step": 120703, "epoch": 2873} {"train_loss": -6.595843315124512, "global_step": 120704, "epoch": 2873} {"train_loss": -6.4546284675598145, "global_step": 120705, "epoch": 2873} {"train_loss": -6.55565071105957, "global_step": 120706, "epoch": 2873} {"train_loss": -6.54914623215085, "global_step": 120707, "epoch": 2873, "val_loss": 65950.671875} {"train_loss": -6.5152692794799805, "global_step": 120708, "epoch": 2874} {"train_loss": -6.496618270874023, "global_step": 120709, "epoch": 2874} {"train_loss": -6.4053239822387695, "global_step": 120710, "epoch": 2874} {"train_loss": -6.567901611328125, "global_step": 120711, "epoch": 2874} {"train_loss": -6.529224395751953, "global_step": 120712, "epoch": 2874} {"train_loss": -6.47235107421875, "global_step": 120713, "epoch": 2874} {"train_loss": -6.635149002075195, "global_step": 120714, "epoch": 2874} {"train_loss": -6.47724723815918, "global_step": 120715, "epoch": 2874} {"train_loss": -6.5723114013671875, "global_step": 120716, "epoch": 2874} {"train_loss": -6.606389999389648, "global_step": 120717, "epoch": 2874} {"train_loss": -6.603715896606445, "global_step": 120718, "epoch": 2874} {"train_loss": -6.609030723571777, "global_step": 120719, "epoch": 2874} {"train_loss": -6.547781944274902, "global_step": 120720, "epoch": 2874} {"train_loss": -6.58383846282959, "global_step": 120721, "epoch": 2874} {"train_loss": -6.606382369995117, "global_step": 120722, "epoch": 2874} {"train_loss": -6.625694274902344, "global_step": 120723, "epoch": 2874} {"train_loss": -6.515098571777344, "global_step": 120724, "epoch": 2874} {"train_loss": -6.601700305938721, "global_step": 120725, "epoch": 2874} {"train_loss": -6.695833206176758, "global_step": 120726, "epoch": 2874} {"train_loss": -6.594318389892578, "global_step": 120727, "epoch": 2874} {"train_loss": -6.585351467132568, "global_step": 120728, "epoch": 2874} {"train_loss": -6.663990020751953, "global_step": 120729, "epoch": 2874} {"train_loss": -6.602608680725098, "global_step": 120730, "epoch": 2874} {"train_loss": -6.590068817138672, "global_step": 120731, "epoch": 2874} {"train_loss": -6.638662338256836, "global_step": 120732, "epoch": 2874} {"train_loss": -6.757269859313965, "global_step": 120733, "epoch": 2874} {"train_loss": -6.588371753692627, "global_step": 120734, "epoch": 2874} {"train_loss": -6.606302261352539, "global_step": 120735, "epoch": 2874} {"train_loss": -6.696350574493408, "global_step": 120736, "epoch": 2874} {"train_loss": -6.595686912536621, "global_step": 120737, "epoch": 2874} {"train_loss": -6.511691093444824, "global_step": 120738, "epoch": 2874} {"train_loss": -6.632968425750732, "global_step": 120739, "epoch": 2874} {"train_loss": -6.6531982421875, "global_step": 120740, "epoch": 2874} {"train_loss": -6.6342267990112305, "global_step": 120741, "epoch": 2874} {"train_loss": -6.628066062927246, "global_step": 120742, "epoch": 2874} {"train_loss": -6.580481052398682, "global_step": 120743, "epoch": 2874} {"train_loss": -6.56773567199707, "global_step": 120744, "epoch": 2874} {"train_loss": -6.608846664428711, "global_step": 120745, "epoch": 2874} {"train_loss": -6.589489936828613, "global_step": 120746, "epoch": 2874} {"train_loss": -6.701213836669922, "global_step": 120747, "epoch": 2874} {"train_loss": -6.651364326477051, "global_step": 120748, "epoch": 2874} {"train_loss": -6.592671996071225, "global_step": 120749, "epoch": 2874, "val_loss": 65762.046875} {"train_loss": -6.572453498840332, "global_step": 120750, "epoch": 2875} {"train_loss": -6.62270450592041, "global_step": 120751, "epoch": 2875} {"train_loss": -6.513188362121582, "global_step": 120752, "epoch": 2875} {"train_loss": -6.601951599121094, "global_step": 120753, "epoch": 2875} {"train_loss": -6.6395721435546875, "global_step": 120754, "epoch": 2875} {"train_loss": -6.569205284118652, "global_step": 120755, "epoch": 2875} {"train_loss": -6.525543212890625, "global_step": 120756, "epoch": 2875} {"train_loss": -6.620186805725098, "global_step": 120757, "epoch": 2875} {"train_loss": -6.633108139038086, "global_step": 120758, "epoch": 2875} {"train_loss": -6.4931640625, "global_step": 120759, "epoch": 2875} {"train_loss": -6.663158416748047, "global_step": 120760, "epoch": 2875} {"train_loss": -6.474404335021973, "global_step": 120761, "epoch": 2875} {"train_loss": -6.760533332824707, "global_step": 120762, "epoch": 2875} {"train_loss": -6.625532627105713, "global_step": 120763, "epoch": 2875} {"train_loss": -6.6673688888549805, "global_step": 120764, "epoch": 2875} {"train_loss": -6.620253562927246, "global_step": 120765, "epoch": 2875} {"train_loss": -6.500637054443359, "global_step": 120766, "epoch": 2875} {"train_loss": -6.618818283081055, "global_step": 120767, "epoch": 2875} {"train_loss": -6.585935592651367, "global_step": 120768, "epoch": 2875} {"train_loss": -6.637652397155762, "global_step": 120769, "epoch": 2875} {"train_loss": -6.595078468322754, "global_step": 120770, "epoch": 2875} {"train_loss": -6.553092002868652, "global_step": 120771, "epoch": 2875} {"train_loss": -6.63602352142334, "global_step": 120772, "epoch": 2875} {"train_loss": -6.640115261077881, "global_step": 120773, "epoch": 2875} {"train_loss": -6.6276044845581055, "global_step": 120774, "epoch": 2875} {"train_loss": -6.635301113128662, "global_step": 120775, "epoch": 2875} {"train_loss": -6.592569351196289, "global_step": 120776, "epoch": 2875} {"train_loss": -6.6054182052612305, "global_step": 120777, "epoch": 2875} {"train_loss": -6.619475364685059, "global_step": 120778, "epoch": 2875} {"train_loss": -6.646671295166016, "global_step": 120779, "epoch": 2875} {"train_loss": -6.632650852203369, "global_step": 120780, "epoch": 2875} {"train_loss": -6.647014141082764, "global_step": 120781, "epoch": 2875} {"train_loss": -6.672597885131836, "global_step": 120782, "epoch": 2875} {"train_loss": -6.6583781242370605, "global_step": 120783, "epoch": 2875} {"train_loss": -6.671239852905273, "global_step": 120784, "epoch": 2875} {"train_loss": -6.61995792388916, "global_step": 120785, "epoch": 2875} {"train_loss": -6.624241828918457, "global_step": 120786, "epoch": 2875} {"train_loss": -6.458314895629883, "global_step": 120787, "epoch": 2875} {"train_loss": -6.544857501983643, "global_step": 120788, "epoch": 2875} {"train_loss": -6.685708045959473, "global_step": 120789, "epoch": 2875} {"train_loss": -6.544140338897705, "global_step": 120790, "epoch": 2875} {"train_loss": -6.605955316906884, "global_step": 120791, "epoch": 2875, "val_loss": 65806.546875} {"train_loss": -6.629290580749512, "global_step": 120792, "epoch": 2876} {"train_loss": -6.747394561767578, "global_step": 120793, "epoch": 2876} {"train_loss": -6.564274787902832, "global_step": 120794, "epoch": 2876} {"train_loss": -6.528697967529297, "global_step": 120795, "epoch": 2876} {"train_loss": -6.572781562805176, "global_step": 120796, "epoch": 2876} {"train_loss": -6.421457767486572, "global_step": 120797, "epoch": 2876} {"train_loss": -6.641963958740234, "global_step": 120798, "epoch": 2876} {"train_loss": -6.558223247528076, "global_step": 120799, "epoch": 2876} {"train_loss": -6.528708457946777, "global_step": 120800, "epoch": 2876} {"train_loss": -6.602187156677246, "global_step": 120801, "epoch": 2876} {"train_loss": -6.560991287231445, "global_step": 120802, "epoch": 2876} {"train_loss": -6.392306327819824, "global_step": 120803, "epoch": 2876} {"train_loss": -6.343707084655762, "global_step": 120804, "epoch": 2876} {"train_loss": -6.555994987487793, "global_step": 120805, "epoch": 2876} {"train_loss": -6.6651411056518555, "global_step": 120806, "epoch": 2876} {"train_loss": -6.531105995178223, "global_step": 120807, "epoch": 2876} {"train_loss": -6.674068927764893, "global_step": 120808, "epoch": 2876} {"train_loss": -6.613824844360352, "global_step": 120809, "epoch": 2876} {"train_loss": -6.532016754150391, "global_step": 120810, "epoch": 2876} {"train_loss": -6.505809783935547, "global_step": 120811, "epoch": 2876} {"train_loss": -6.504823684692383, "global_step": 120812, "epoch": 2876} {"train_loss": -6.547414779663086, "global_step": 120813, "epoch": 2876} {"train_loss": -6.488698482513428, "global_step": 120814, "epoch": 2876} {"train_loss": -6.566584587097168, "global_step": 120815, "epoch": 2876} {"train_loss": -6.607048034667969, "global_step": 120816, "epoch": 2876} {"train_loss": -6.551011085510254, "global_step": 120817, "epoch": 2876} {"train_loss": -6.553945541381836, "global_step": 120818, "epoch": 2876} {"train_loss": -6.55703067779541, "global_step": 120819, "epoch": 2876} {"train_loss": -6.494905948638916, "global_step": 120820, "epoch": 2876} {"train_loss": -6.495944499969482, "global_step": 120821, "epoch": 2876} {"train_loss": -6.670508861541748, "global_step": 120822, "epoch": 2876} {"train_loss": -6.468489646911621, "global_step": 120823, "epoch": 2876} {"train_loss": -6.576021194458008, "global_step": 120824, "epoch": 2876} {"train_loss": -6.637566089630127, "global_step": 120825, "epoch": 2876} {"train_loss": -6.648700714111328, "global_step": 120826, "epoch": 2876} {"train_loss": -6.522512435913086, "global_step": 120827, "epoch": 2876} {"train_loss": -6.586819648742676, "global_step": 120828, "epoch": 2876} {"train_loss": -6.624112129211426, "global_step": 120829, "epoch": 2876} {"train_loss": -6.628114700317383, "global_step": 120830, "epoch": 2876} {"train_loss": -6.373154640197754, "global_step": 120831, "epoch": 2876} {"train_loss": -6.513655185699463, "global_step": 120832, "epoch": 2876} {"train_loss": -6.556460584912982, "global_step": 120833, "epoch": 2876, "val_loss": 65711.4296875} {"train_loss": -6.460536956787109, "global_step": 120834, "epoch": 2877} {"train_loss": -6.439206123352051, "global_step": 120835, "epoch": 2877} {"train_loss": -6.526978492736816, "global_step": 120836, "epoch": 2877} {"train_loss": -6.358834743499756, "global_step": 120837, "epoch": 2877} {"train_loss": -6.420785903930664, "global_step": 120838, "epoch": 2877} {"train_loss": -6.460392475128174, "global_step": 120839, "epoch": 2877} {"train_loss": -6.552162170410156, "global_step": 120840, "epoch": 2877} {"train_loss": -6.359015464782715, "global_step": 120841, "epoch": 2877} {"train_loss": -6.360475540161133, "global_step": 120842, "epoch": 2877} {"train_loss": -6.3749494552612305, "global_step": 120843, "epoch": 2877} {"train_loss": -6.440692901611328, "global_step": 120844, "epoch": 2877} {"train_loss": -6.365111351013184, "global_step": 120845, "epoch": 2877} {"train_loss": -6.557522296905518, "global_step": 120846, "epoch": 2877} {"train_loss": -6.215044975280762, "global_step": 120847, "epoch": 2877} {"train_loss": -6.479865074157715, "global_step": 120848, "epoch": 2877} {"train_loss": -6.357147216796875, "global_step": 120849, "epoch": 2877} {"train_loss": -6.400526523590088, "global_step": 120850, "epoch": 2877} {"train_loss": -6.4251556396484375, "global_step": 120851, "epoch": 2877} {"train_loss": -6.42258358001709, "global_step": 120852, "epoch": 2877} {"train_loss": -6.426983833312988, "global_step": 120853, "epoch": 2877} {"train_loss": -6.417205810546875, "global_step": 120854, "epoch": 2877} {"train_loss": -6.4416680335998535, "global_step": 120855, "epoch": 2877} {"train_loss": -6.53444766998291, "global_step": 120856, "epoch": 2877} {"train_loss": -6.463724136352539, "global_step": 120857, "epoch": 2877} {"train_loss": -6.408684730529785, "global_step": 120858, "epoch": 2877} {"train_loss": -6.588817596435547, "global_step": 120859, "epoch": 2877} {"train_loss": -6.404303073883057, "global_step": 120860, "epoch": 2877} {"train_loss": -6.554039001464844, "global_step": 120861, "epoch": 2877} {"train_loss": -6.453863620758057, "global_step": 120862, "epoch": 2877} {"train_loss": -6.524075031280518, "global_step": 120863, "epoch": 2877} {"train_loss": -6.486920356750488, "global_step": 120864, "epoch": 2877} {"train_loss": -6.593850135803223, "global_step": 120865, "epoch": 2877} {"train_loss": -6.658812522888184, "global_step": 120866, "epoch": 2877} {"train_loss": -6.541367530822754, "global_step": 120867, "epoch": 2877} {"train_loss": -6.540335178375244, "global_step": 120868, "epoch": 2877} {"train_loss": -6.522477626800537, "global_step": 120869, "epoch": 2877} {"train_loss": -6.637187957763672, "global_step": 120870, "epoch": 2877} {"train_loss": -6.528295516967773, "global_step": 120871, "epoch": 2877} {"train_loss": -6.529648303985596, "global_step": 120872, "epoch": 2877} {"train_loss": -6.5562872886657715, "global_step": 120873, "epoch": 2877} {"train_loss": -6.518733501434326, "global_step": 120874, "epoch": 2877} {"train_loss": -6.477446908042545, "global_step": 120875, "epoch": 2877, "val_loss": 65855.2109375} {"train_loss": -6.537724494934082, "global_step": 120876, "epoch": 2878} {"train_loss": -6.615028381347656, "global_step": 120877, "epoch": 2878} {"train_loss": -6.730715751647949, "global_step": 120878, "epoch": 2878} {"train_loss": -6.62552547454834, "global_step": 120879, "epoch": 2878} {"train_loss": -6.707095146179199, "global_step": 120880, "epoch": 2878} {"train_loss": -6.705848693847656, "global_step": 120881, "epoch": 2878} {"train_loss": -6.537416458129883, "global_step": 120882, "epoch": 2878} {"train_loss": -6.655558109283447, "global_step": 120883, "epoch": 2878} {"train_loss": -6.623104095458984, "global_step": 120884, "epoch": 2878} {"train_loss": -6.576939582824707, "global_step": 120885, "epoch": 2878} {"train_loss": -6.62921142578125, "global_step": 120886, "epoch": 2878} {"train_loss": -6.638816833496094, "global_step": 120887, "epoch": 2878} {"train_loss": -6.579172611236572, "global_step": 120888, "epoch": 2878} {"train_loss": -6.589280605316162, "global_step": 120889, "epoch": 2878} {"train_loss": -6.650513172149658, "global_step": 120890, "epoch": 2878} {"train_loss": -6.724906921386719, "global_step": 120891, "epoch": 2878} {"train_loss": -6.668225288391113, "global_step": 120892, "epoch": 2878} {"train_loss": -6.6528849601745605, "global_step": 120893, "epoch": 2878} {"train_loss": -6.599150657653809, "global_step": 120894, "epoch": 2878} {"train_loss": -6.588242053985596, "global_step": 120895, "epoch": 2878} {"train_loss": -6.5480875968933105, "global_step": 120896, "epoch": 2878} {"train_loss": -6.605724334716797, "global_step": 120897, "epoch": 2878} {"train_loss": -6.697249412536621, "global_step": 120898, "epoch": 2878} {"train_loss": -6.5117506980896, "global_step": 120899, "epoch": 2878} {"train_loss": -6.6210246086120605, "global_step": 120900, "epoch": 2878} {"train_loss": -6.489362716674805, "global_step": 120901, "epoch": 2878} {"train_loss": -6.488044738769531, "global_step": 120902, "epoch": 2878} {"train_loss": -6.5781168937683105, "global_step": 120903, "epoch": 2878} {"train_loss": -6.528193473815918, "global_step": 120904, "epoch": 2878} {"train_loss": -6.643111705780029, "global_step": 120905, "epoch": 2878} {"train_loss": -6.577130317687988, "global_step": 120906, "epoch": 2878} {"train_loss": -6.492366790771484, "global_step": 120907, "epoch": 2878} {"train_loss": -6.572256088256836, "global_step": 120908, "epoch": 2878} {"train_loss": -6.487236022949219, "global_step": 120909, "epoch": 2878} {"train_loss": -6.629560947418213, "global_step": 120910, "epoch": 2878} {"train_loss": -6.545623302459717, "global_step": 120911, "epoch": 2878} {"train_loss": -6.606405258178711, "global_step": 120912, "epoch": 2878} {"train_loss": -6.547897815704346, "global_step": 120913, "epoch": 2878} {"train_loss": -6.482899188995361, "global_step": 120914, "epoch": 2878} {"train_loss": -6.5103912353515625, "global_step": 120915, "epoch": 2878} {"train_loss": -6.423540115356445, "global_step": 120916, "epoch": 2878} {"train_loss": -6.58986040524074, "global_step": 120917, "epoch": 2878, "val_loss": 65868.9140625} {"train_loss": -6.506047248840332, "global_step": 120918, "epoch": 2879} {"train_loss": -6.614133358001709, "global_step": 120919, "epoch": 2879} {"train_loss": -6.47453498840332, "global_step": 120920, "epoch": 2879} {"train_loss": -6.684670448303223, "global_step": 120921, "epoch": 2879} {"train_loss": -6.6490349769592285, "global_step": 120922, "epoch": 2879} {"train_loss": -6.50404167175293, "global_step": 120923, "epoch": 2879} {"train_loss": -6.582808494567871, "global_step": 120924, "epoch": 2879} {"train_loss": -6.603697776794434, "global_step": 120925, "epoch": 2879} {"train_loss": -6.499824047088623, "global_step": 120926, "epoch": 2879} {"train_loss": -6.611127853393555, "global_step": 120927, "epoch": 2879} {"train_loss": -6.659944534301758, "global_step": 120928, "epoch": 2879} {"train_loss": -6.61141300201416, "global_step": 120929, "epoch": 2879} {"train_loss": -6.494353771209717, "global_step": 120930, "epoch": 2879} {"train_loss": -6.523493766784668, "global_step": 120931, "epoch": 2879} {"train_loss": -6.498958587646484, "global_step": 120932, "epoch": 2879} {"train_loss": -6.397800445556641, "global_step": 120933, "epoch": 2879} {"train_loss": -6.603167533874512, "global_step": 120934, "epoch": 2879} {"train_loss": -6.429566383361816, "global_step": 120935, "epoch": 2879} {"train_loss": -6.5393524169921875, "global_step": 120936, "epoch": 2879} {"train_loss": -6.406203746795654, "global_step": 120937, "epoch": 2879} {"train_loss": -6.517581462860107, "global_step": 120938, "epoch": 2879} {"train_loss": -6.624490737915039, "global_step": 120939, "epoch": 2879} {"train_loss": -6.473206520080566, "global_step": 120940, "epoch": 2879} {"train_loss": -6.603719711303711, "global_step": 120941, "epoch": 2879} {"train_loss": -6.497066497802734, "global_step": 120942, "epoch": 2879} {"train_loss": -6.520200729370117, "global_step": 120943, "epoch": 2879} {"train_loss": -6.5375566482543945, "global_step": 120944, "epoch": 2879} {"train_loss": -6.51732063293457, "global_step": 120945, "epoch": 2879} {"train_loss": -6.624517440795898, "global_step": 120946, "epoch": 2879} {"train_loss": -6.399380207061768, "global_step": 120947, "epoch": 2879} {"train_loss": -6.5657958984375, "global_step": 120948, "epoch": 2879} {"train_loss": -6.472320556640625, "global_step": 120949, "epoch": 2879} {"train_loss": -6.59798526763916, "global_step": 120950, "epoch": 2879} {"train_loss": -6.612100124359131, "global_step": 120951, "epoch": 2879} {"train_loss": -6.592118263244629, "global_step": 120952, "epoch": 2879} {"train_loss": -6.5705366134643555, "global_step": 120953, "epoch": 2879} {"train_loss": -6.5389180183410645, "global_step": 120954, "epoch": 2879} {"train_loss": -6.57501220703125, "global_step": 120955, "epoch": 2879} {"train_loss": -6.566518783569336, "global_step": 120956, "epoch": 2879} {"train_loss": -6.51210880279541, "global_step": 120957, "epoch": 2879} {"train_loss": -6.592106819152832, "global_step": 120958, "epoch": 2879} {"train_loss": -6.545178492863973, "global_step": 120959, "epoch": 2879, "val_loss": 65817.9921875} {"train_loss": -6.600020885467529, "global_step": 120960, "epoch": 2880} {"train_loss": -6.606285572052002, "global_step": 120961, "epoch": 2880} {"train_loss": -6.479340553283691, "global_step": 120962, "epoch": 2880} {"train_loss": -6.609518051147461, "global_step": 120963, "epoch": 2880} {"train_loss": -6.615155220031738, "global_step": 120964, "epoch": 2880} {"train_loss": -6.547750473022461, "global_step": 120965, "epoch": 2880} {"train_loss": -6.608201503753662, "global_step": 120966, "epoch": 2880} {"train_loss": -6.538524627685547, "global_step": 120967, "epoch": 2880} {"train_loss": -6.541439056396484, "global_step": 120968, "epoch": 2880} {"train_loss": -6.555538177490234, "global_step": 120969, "epoch": 2880} {"train_loss": -6.489875793457031, "global_step": 120970, "epoch": 2880} {"train_loss": -6.46489953994751, "global_step": 120971, "epoch": 2880} {"train_loss": -6.51912260055542, "global_step": 120972, "epoch": 2880} {"train_loss": -6.46702241897583, "global_step": 120973, "epoch": 2880} {"train_loss": -6.6224212646484375, "global_step": 120974, "epoch": 2880} {"train_loss": -6.541952133178711, "global_step": 120975, "epoch": 2880} {"train_loss": -6.54083251953125, "global_step": 120976, "epoch": 2880} {"train_loss": -6.574499130249023, "global_step": 120977, "epoch": 2880} {"train_loss": -6.606532096862793, "global_step": 120978, "epoch": 2880} {"train_loss": -6.547349452972412, "global_step": 120979, "epoch": 2880} {"train_loss": -6.604315757751465, "global_step": 120980, "epoch": 2880} {"train_loss": -6.533415794372559, "global_step": 120981, "epoch": 2880} {"train_loss": -6.601624488830566, "global_step": 120982, "epoch": 2880} {"train_loss": -6.4821367263793945, "global_step": 120983, "epoch": 2880} {"train_loss": -6.585642337799072, "global_step": 120984, "epoch": 2880} {"train_loss": -6.298846244812012, "global_step": 120985, "epoch": 2880} {"train_loss": -6.518298149108887, "global_step": 120986, "epoch": 2880} {"train_loss": -6.353283882141113, "global_step": 120987, "epoch": 2880} {"train_loss": -6.505555629730225, "global_step": 120988, "epoch": 2880} {"train_loss": -6.575596809387207, "global_step": 120989, "epoch": 2880} {"train_loss": -6.50814151763916, "global_step": 120990, "epoch": 2880} {"train_loss": -6.655041694641113, "global_step": 120991, "epoch": 2880} {"train_loss": -6.42791748046875, "global_step": 120992, "epoch": 2880} {"train_loss": -6.560835361480713, "global_step": 120993, "epoch": 2880} {"train_loss": -6.605343818664551, "global_step": 120994, "epoch": 2880} {"train_loss": -6.374249458312988, "global_step": 120995, "epoch": 2880} {"train_loss": -6.509664535522461, "global_step": 120996, "epoch": 2880} {"train_loss": -6.62844705581665, "global_step": 120997, "epoch": 2880} {"train_loss": -6.481202602386475, "global_step": 120998, "epoch": 2880} {"train_loss": -6.569210052490234, "global_step": 120999, "epoch": 2880} {"train_loss": -6.547603130340576, "global_step": 121000, "epoch": 2880} {"train_loss": -6.5362560749053955, "global_step": 121001, "epoch": 2880, "val_loss": 65774.53125} {"train_loss": -6.736422538757324, "global_step": 121002, "epoch": 2881} {"train_loss": -6.499641418457031, "global_step": 121003, "epoch": 2881} {"train_loss": -6.413429260253906, "global_step": 121004, "epoch": 2881} {"train_loss": -6.604046821594238, "global_step": 121005, "epoch": 2881} {"train_loss": -6.598577499389648, "global_step": 121006, "epoch": 2881} {"train_loss": -6.718276023864746, "global_step": 121007, "epoch": 2881} {"train_loss": -6.65073823928833, "global_step": 121008, "epoch": 2881} {"train_loss": -6.6270928382873535, "global_step": 121009, "epoch": 2881} {"train_loss": -6.64180850982666, "global_step": 121010, "epoch": 2881} {"train_loss": -6.560944080352783, "global_step": 121011, "epoch": 2881} {"train_loss": -6.60975456237793, "global_step": 121012, "epoch": 2881} {"train_loss": -6.467752456665039, "global_step": 121013, "epoch": 2881} {"train_loss": -6.552825450897217, "global_step": 121014, "epoch": 2881} {"train_loss": -6.507408142089844, "global_step": 121015, "epoch": 2881} {"train_loss": -6.540724754333496, "global_step": 121016, "epoch": 2881} {"train_loss": -6.645382881164551, "global_step": 121017, "epoch": 2881} {"train_loss": -6.563694000244141, "global_step": 121018, "epoch": 2881} {"train_loss": -6.596824645996094, "global_step": 121019, "epoch": 2881} {"train_loss": -6.627884387969971, "global_step": 121020, "epoch": 2881} {"train_loss": -6.611482620239258, "global_step": 121021, "epoch": 2881} {"train_loss": -6.624983787536621, "global_step": 121022, "epoch": 2881} {"train_loss": -6.619112014770508, "global_step": 121023, "epoch": 2881} {"train_loss": -6.579104423522949, "global_step": 121024, "epoch": 2881} {"train_loss": -6.692452430725098, "global_step": 121025, "epoch": 2881} {"train_loss": -6.688991546630859, "global_step": 121026, "epoch": 2881} {"train_loss": -6.657965660095215, "global_step": 121027, "epoch": 2881} {"train_loss": -6.701317310333252, "global_step": 121028, "epoch": 2881} {"train_loss": -6.577498912811279, "global_step": 121029, "epoch": 2881} {"train_loss": -6.691961765289307, "global_step": 121030, "epoch": 2881} {"train_loss": -6.631402015686035, "global_step": 121031, "epoch": 2881} {"train_loss": -6.670173645019531, "global_step": 121032, "epoch": 2881} {"train_loss": -6.615050315856934, "global_step": 121033, "epoch": 2881} {"train_loss": -6.601038455963135, "global_step": 121034, "epoch": 2881} {"train_loss": -6.764834403991699, "global_step": 121035, "epoch": 2881} {"train_loss": -6.678961753845215, "global_step": 121036, "epoch": 2881} {"train_loss": -6.568014144897461, "global_step": 121037, "epoch": 2881} {"train_loss": -6.465352535247803, "global_step": 121038, "epoch": 2881} {"train_loss": -6.63906717300415, "global_step": 121039, "epoch": 2881} {"train_loss": -6.496337890625, "global_step": 121040, "epoch": 2881} {"train_loss": -6.700889587402344, "global_step": 121041, "epoch": 2881} {"train_loss": -6.580974578857422, "global_step": 121042, "epoch": 2881} {"train_loss": -6.608489944821312, "global_step": 121043, "epoch": 2881, "val_loss": 65935.828125} {"train_loss": -6.612752914428711, "global_step": 121044, "epoch": 2882} {"train_loss": -6.630966663360596, "global_step": 121045, "epoch": 2882} {"train_loss": -6.657422065734863, "global_step": 121046, "epoch": 2882} {"train_loss": -6.655641555786133, "global_step": 121047, "epoch": 2882} {"train_loss": -6.747337818145752, "global_step": 121048, "epoch": 2882} {"train_loss": -6.650516986846924, "global_step": 121049, "epoch": 2882} {"train_loss": -6.685399055480957, "global_step": 121050, "epoch": 2882} {"train_loss": -6.552587509155273, "global_step": 121051, "epoch": 2882} {"train_loss": -6.6617937088012695, "global_step": 121052, "epoch": 2882} {"train_loss": -6.59497594833374, "global_step": 121053, "epoch": 2882} {"train_loss": -6.687952518463135, "global_step": 121054, "epoch": 2882} {"train_loss": -6.537204742431641, "global_step": 121055, "epoch": 2882} {"train_loss": -6.671280860900879, "global_step": 121056, "epoch": 2882} {"train_loss": -6.723086357116699, "global_step": 121057, "epoch": 2882} {"train_loss": -6.643728256225586, "global_step": 121058, "epoch": 2882} {"train_loss": -6.6076154708862305, "global_step": 121059, "epoch": 2882} {"train_loss": -6.604269027709961, "global_step": 121060, "epoch": 2882} {"train_loss": -6.641752243041992, "global_step": 121061, "epoch": 2882} {"train_loss": -6.605759620666504, "global_step": 121062, "epoch": 2882} {"train_loss": -6.6590576171875, "global_step": 121063, "epoch": 2882} {"train_loss": -6.6159868240356445, "global_step": 121064, "epoch": 2882} {"train_loss": -6.5210676193237305, "global_step": 121065, "epoch": 2882} {"train_loss": -6.54106330871582, "global_step": 121066, "epoch": 2882} {"train_loss": -6.6108903884887695, "global_step": 121067, "epoch": 2882} {"train_loss": -6.539059162139893, "global_step": 121068, "epoch": 2882} {"train_loss": -6.562268257141113, "global_step": 121069, "epoch": 2882} {"train_loss": -6.667208671569824, "global_step": 121070, "epoch": 2882} {"train_loss": -6.54484748840332, "global_step": 121071, "epoch": 2882} {"train_loss": -6.50234842300415, "global_step": 121072, "epoch": 2882} {"train_loss": -6.507102012634277, "global_step": 121073, "epoch": 2882} {"train_loss": -6.529519081115723, "global_step": 121074, "epoch": 2882} {"train_loss": -6.609677791595459, "global_step": 121075, "epoch": 2882} {"train_loss": -6.572040557861328, "global_step": 121076, "epoch": 2882} {"train_loss": -6.5775346755981445, "global_step": 121077, "epoch": 2882} {"train_loss": -6.593461513519287, "global_step": 121078, "epoch": 2882} {"train_loss": -6.512291431427002, "global_step": 121079, "epoch": 2882} {"train_loss": -6.509852409362793, "global_step": 121080, "epoch": 2882} {"train_loss": -6.541311264038086, "global_step": 121081, "epoch": 2882} {"train_loss": -6.4370527267456055, "global_step": 121082, "epoch": 2882} {"train_loss": -6.712306976318359, "global_step": 121083, "epoch": 2882} {"train_loss": -6.538221836090088, "global_step": 121084, "epoch": 2882} {"train_loss": -6.600312142145066, "global_step": 121085, "epoch": 2882, "val_loss": 66096.171875} {"train_loss": -6.565952301025391, "global_step": 121086, "epoch": 2883} {"train_loss": -6.607663154602051, "global_step": 121087, "epoch": 2883} {"train_loss": -6.614128589630127, "global_step": 121088, "epoch": 2883} {"train_loss": -6.557567596435547, "global_step": 121089, "epoch": 2883} {"train_loss": -6.630883693695068, "global_step": 121090, "epoch": 2883} {"train_loss": -6.573803901672363, "global_step": 121091, "epoch": 2883} {"train_loss": -6.549654006958008, "global_step": 121092, "epoch": 2883} {"train_loss": -6.615738868713379, "global_step": 121093, "epoch": 2883} {"train_loss": -6.563699722290039, "global_step": 121094, "epoch": 2883} {"train_loss": -6.6990556716918945, "global_step": 121095, "epoch": 2883} {"train_loss": -6.465782165527344, "global_step": 121096, "epoch": 2883} {"train_loss": -6.6350812911987305, "global_step": 121097, "epoch": 2883} {"train_loss": -6.664835453033447, "global_step": 121098, "epoch": 2883} {"train_loss": -6.668504238128662, "global_step": 121099, "epoch": 2883} {"train_loss": -6.5117316246032715, "global_step": 121100, "epoch": 2883} {"train_loss": -6.540346145629883, "global_step": 121101, "epoch": 2883} {"train_loss": -6.6130051612854, "global_step": 121102, "epoch": 2883} {"train_loss": -6.74161958694458, "global_step": 121103, "epoch": 2883} {"train_loss": -6.458528518676758, "global_step": 121104, "epoch": 2883} {"train_loss": -6.6541337966918945, "global_step": 121105, "epoch": 2883} {"train_loss": -6.447119235992432, "global_step": 121106, "epoch": 2883} {"train_loss": -6.602818489074707, "global_step": 121107, "epoch": 2883} {"train_loss": -6.690143585205078, "global_step": 121108, "epoch": 2883} {"train_loss": -6.670290946960449, "global_step": 121109, "epoch": 2883} {"train_loss": -6.526226997375488, "global_step": 121110, "epoch": 2883} {"train_loss": -6.669682025909424, "global_step": 121111, "epoch": 2883} {"train_loss": -6.573747634887695, "global_step": 121112, "epoch": 2883} {"train_loss": -6.570940017700195, "global_step": 121113, "epoch": 2883} {"train_loss": -6.672110557556152, "global_step": 121114, "epoch": 2883} {"train_loss": -6.650619029998779, "global_step": 121115, "epoch": 2883} {"train_loss": -6.6421613693237305, "global_step": 121116, "epoch": 2883} {"train_loss": -6.627894878387451, "global_step": 121117, "epoch": 2883} {"train_loss": -6.58904504776001, "global_step": 121118, "epoch": 2883} {"train_loss": -6.62200403213501, "global_step": 121119, "epoch": 2883} {"train_loss": -6.705597877502441, "global_step": 121120, "epoch": 2883} {"train_loss": -6.567638874053955, "global_step": 121121, "epoch": 2883} {"train_loss": -6.5492658615112305, "global_step": 121122, "epoch": 2883} {"train_loss": -6.626035690307617, "global_step": 121123, "epoch": 2883} {"train_loss": -6.478135585784912, "global_step": 121124, "epoch": 2883} {"train_loss": -6.507330894470215, "global_step": 121125, "epoch": 2883} {"train_loss": -6.556004524230957, "global_step": 121126, "epoch": 2883} {"train_loss": -6.593641042709351, "global_step": 121127, "epoch": 2883, "val_loss": 65744.3984375} {"train_loss": -6.617004871368408, "global_step": 121128, "epoch": 2884} {"train_loss": -6.547272205352783, "global_step": 121129, "epoch": 2884} {"train_loss": -6.547372817993164, "global_step": 121130, "epoch": 2884} {"train_loss": -6.462377071380615, "global_step": 121131, "epoch": 2884} {"train_loss": -6.6295647621154785, "global_step": 121132, "epoch": 2884} {"train_loss": -6.523088455200195, "global_step": 121133, "epoch": 2884} {"train_loss": -6.520534992218018, "global_step": 121134, "epoch": 2884} {"train_loss": -6.668693542480469, "global_step": 121135, "epoch": 2884} {"train_loss": -6.673036098480225, "global_step": 121136, "epoch": 2884} {"train_loss": -6.603705883026123, "global_step": 121137, "epoch": 2884} {"train_loss": -6.700042247772217, "global_step": 121138, "epoch": 2884} {"train_loss": -6.4768500328063965, "global_step": 121139, "epoch": 2884} {"train_loss": -6.664045333862305, "global_step": 121140, "epoch": 2884} {"train_loss": -6.705193519592285, "global_step": 121141, "epoch": 2884} {"train_loss": -6.655378818511963, "global_step": 121142, "epoch": 2884} {"train_loss": -6.780475616455078, "global_step": 121143, "epoch": 2884} {"train_loss": -6.565984725952148, "global_step": 121144, "epoch": 2884} {"train_loss": -6.492234230041504, "global_step": 121145, "epoch": 2884} {"train_loss": -6.6541032791137695, "global_step": 121146, "epoch": 2884} {"train_loss": -6.640200138092041, "global_step": 121147, "epoch": 2884} {"train_loss": -6.7096052169799805, "global_step": 121148, "epoch": 2884} {"train_loss": -6.554372787475586, "global_step": 121149, "epoch": 2884} {"train_loss": -6.532301902770996, "global_step": 121150, "epoch": 2884} {"train_loss": -6.653437614440918, "global_step": 121151, "epoch": 2884} {"train_loss": -6.629202842712402, "global_step": 121152, "epoch": 2884} {"train_loss": -6.821932792663574, "global_step": 121153, "epoch": 2884} {"train_loss": -6.69819974899292, "global_step": 121154, "epoch": 2884} {"train_loss": -6.558379650115967, "global_step": 121155, "epoch": 2884} {"train_loss": -6.635961532592773, "global_step": 121156, "epoch": 2884} {"train_loss": -6.656304836273193, "global_step": 121157, "epoch": 2884} {"train_loss": -6.695172309875488, "global_step": 121158, "epoch": 2884} {"train_loss": -6.626125812530518, "global_step": 121159, "epoch": 2884} {"train_loss": -6.693264961242676, "global_step": 121160, "epoch": 2884} {"train_loss": -6.680327415466309, "global_step": 121161, "epoch": 2884} {"train_loss": -6.638917922973633, "global_step": 121162, "epoch": 2884} {"train_loss": -6.613322734832764, "global_step": 121163, "epoch": 2884} {"train_loss": -6.532405853271484, "global_step": 121164, "epoch": 2884} {"train_loss": -6.561047077178955, "global_step": 121165, "epoch": 2884} {"train_loss": -6.590867042541504, "global_step": 121166, "epoch": 2884} {"train_loss": -6.632328510284424, "global_step": 121167, "epoch": 2884} {"train_loss": -6.477954864501953, "global_step": 121168, "epoch": 2884} {"train_loss": -6.619265147617885, "global_step": 121169, "epoch": 2884, "val_loss": 65811.53125} {"train_loss": -6.730071544647217, "global_step": 121170, "epoch": 2885} {"train_loss": -6.588433265686035, "global_step": 121171, "epoch": 2885} {"train_loss": -6.712615966796875, "global_step": 121172, "epoch": 2885} {"train_loss": -6.499089241027832, "global_step": 121173, "epoch": 2885} {"train_loss": -6.490045547485352, "global_step": 121174, "epoch": 2885} {"train_loss": -6.660974502563477, "global_step": 121175, "epoch": 2885} {"train_loss": -6.64580774307251, "global_step": 121176, "epoch": 2885} {"train_loss": -6.593273639678955, "global_step": 121177, "epoch": 2885} {"train_loss": -6.6262712478637695, "global_step": 121178, "epoch": 2885} {"train_loss": -6.508609771728516, "global_step": 121179, "epoch": 2885} {"train_loss": -6.591385841369629, "global_step": 121180, "epoch": 2885} {"train_loss": -6.571539878845215, "global_step": 121181, "epoch": 2885} {"train_loss": -6.685243606567383, "global_step": 121182, "epoch": 2885} {"train_loss": -6.562493324279785, "global_step": 121183, "epoch": 2885} {"train_loss": -6.5400285720825195, "global_step": 121184, "epoch": 2885} {"train_loss": -6.791786193847656, "global_step": 121185, "epoch": 2885} {"train_loss": -6.654367446899414, "global_step": 121186, "epoch": 2885} {"train_loss": -6.6092681884765625, "global_step": 121187, "epoch": 2885} {"train_loss": -6.554917812347412, "global_step": 121188, "epoch": 2885} {"train_loss": -6.730006694793701, "global_step": 121189, "epoch": 2885} {"train_loss": -6.632002830505371, "global_step": 121190, "epoch": 2885} {"train_loss": -6.504432678222656, "global_step": 121191, "epoch": 2885} {"train_loss": -6.574782371520996, "global_step": 121192, "epoch": 2885} {"train_loss": -6.586271286010742, "global_step": 121193, "epoch": 2885} {"train_loss": -6.585663795471191, "global_step": 121194, "epoch": 2885} {"train_loss": -6.62886905670166, "global_step": 121195, "epoch": 2885} {"train_loss": -6.647352695465088, "global_step": 121196, "epoch": 2885} {"train_loss": -6.558297157287598, "global_step": 121197, "epoch": 2885} {"train_loss": -6.526641845703125, "global_step": 121198, "epoch": 2885} {"train_loss": -6.515392303466797, "global_step": 121199, "epoch": 2885} {"train_loss": -6.632494926452637, "global_step": 121200, "epoch": 2885} {"train_loss": -6.5676164627075195, "global_step": 121201, "epoch": 2885} {"train_loss": -6.590145111083984, "global_step": 121202, "epoch": 2885} {"train_loss": -6.554884910583496, "global_step": 121203, "epoch": 2885} {"train_loss": -6.592594623565674, "global_step": 121204, "epoch": 2885} {"train_loss": -6.557622909545898, "global_step": 121205, "epoch": 2885} {"train_loss": -6.403552532196045, "global_step": 121206, "epoch": 2885} {"train_loss": -6.575893878936768, "global_step": 121207, "epoch": 2885} {"train_loss": -6.473735809326172, "global_step": 121208, "epoch": 2885} {"train_loss": -6.511564254760742, "global_step": 121209, "epoch": 2885} {"train_loss": -6.604541778564453, "global_step": 121210, "epoch": 2885} {"train_loss": -6.586893308730352, "global_step": 121211, "epoch": 2885, "val_loss": 65957.9921875} {"train_loss": -6.496638298034668, "global_step": 121212, "epoch": 2886} {"train_loss": -6.458862781524658, "global_step": 121213, "epoch": 2886} {"train_loss": -6.437419414520264, "global_step": 121214, "epoch": 2886} {"train_loss": -6.565277099609375, "global_step": 121215, "epoch": 2886} {"train_loss": -6.483510971069336, "global_step": 121216, "epoch": 2886} {"train_loss": -6.538569450378418, "global_step": 121217, "epoch": 2886} {"train_loss": -6.522470474243164, "global_step": 121218, "epoch": 2886} {"train_loss": -6.603132724761963, "global_step": 121219, "epoch": 2886} {"train_loss": -6.56765079498291, "global_step": 121220, "epoch": 2886} {"train_loss": -6.536255836486816, "global_step": 121221, "epoch": 2886} {"train_loss": -6.46850061416626, "global_step": 121222, "epoch": 2886} {"train_loss": -6.657863616943359, "global_step": 121223, "epoch": 2886} {"train_loss": -6.6096391677856445, "global_step": 121224, "epoch": 2886} {"train_loss": -6.534021854400635, "global_step": 121225, "epoch": 2886} {"train_loss": -6.5432820320129395, "global_step": 121226, "epoch": 2886} {"train_loss": -6.422833442687988, "global_step": 121227, "epoch": 2886} {"train_loss": -6.613139629364014, "global_step": 121228, "epoch": 2886} {"train_loss": -6.382619380950928, "global_step": 121229, "epoch": 2886} {"train_loss": -6.499272346496582, "global_step": 121230, "epoch": 2886} {"train_loss": -6.596748352050781, "global_step": 121231, "epoch": 2886} {"train_loss": -6.669716835021973, "global_step": 121232, "epoch": 2886} {"train_loss": -6.568974018096924, "global_step": 121233, "epoch": 2886} {"train_loss": -6.565983772277832, "global_step": 121234, "epoch": 2886} {"train_loss": -6.607361793518066, "global_step": 121235, "epoch": 2886} {"train_loss": -6.531937599182129, "global_step": 121236, "epoch": 2886} {"train_loss": -6.561963081359863, "global_step": 121237, "epoch": 2886} {"train_loss": -6.642500877380371, "global_step": 121238, "epoch": 2886} {"train_loss": -6.613159656524658, "global_step": 121239, "epoch": 2886} {"train_loss": -6.690454483032227, "global_step": 121240, "epoch": 2886} {"train_loss": -6.591639518737793, "global_step": 121241, "epoch": 2886} {"train_loss": -6.679513931274414, "global_step": 121242, "epoch": 2886} {"train_loss": -6.628592491149902, "global_step": 121243, "epoch": 2886} {"train_loss": -6.692238807678223, "global_step": 121244, "epoch": 2886} {"train_loss": -6.670770168304443, "global_step": 121245, "epoch": 2886} {"train_loss": -6.64157772064209, "global_step": 121246, "epoch": 2886} {"train_loss": -6.641608715057373, "global_step": 121247, "epoch": 2886} {"train_loss": -6.593198776245117, "global_step": 121248, "epoch": 2886} {"train_loss": -6.61585807800293, "global_step": 121249, "epoch": 2886} {"train_loss": -6.583743095397949, "global_step": 121250, "epoch": 2886} {"train_loss": -6.539332389831543, "global_step": 121251, "epoch": 2886} {"train_loss": -6.604831695556641, "global_step": 121252, "epoch": 2886} {"train_loss": -6.571639367512295, "global_step": 121253, "epoch": 2886, "val_loss": 65828.6484375} {"train_loss": -6.5814528465271, "global_step": 121254, "epoch": 2887} {"train_loss": -6.587137222290039, "global_step": 121255, "epoch": 2887} {"train_loss": -6.580852508544922, "global_step": 121256, "epoch": 2887} {"train_loss": -6.504167556762695, "global_step": 121257, "epoch": 2887} {"train_loss": -6.444574356079102, "global_step": 121258, "epoch": 2887} {"train_loss": -6.617082595825195, "global_step": 121259, "epoch": 2887} {"train_loss": -6.721244812011719, "global_step": 121260, "epoch": 2887} {"train_loss": -6.473628044128418, "global_step": 121261, "epoch": 2887} {"train_loss": -6.5757598876953125, "global_step": 121262, "epoch": 2887} {"train_loss": -6.6309309005737305, "global_step": 121263, "epoch": 2887} {"train_loss": -6.434728145599365, "global_step": 121264, "epoch": 2887} {"train_loss": -6.665961265563965, "global_step": 121265, "epoch": 2887} {"train_loss": -6.579254627227783, "global_step": 121266, "epoch": 2887} {"train_loss": -6.512674331665039, "global_step": 121267, "epoch": 2887} {"train_loss": -6.627549171447754, "global_step": 121268, "epoch": 2887} {"train_loss": -6.600152015686035, "global_step": 121269, "epoch": 2887} {"train_loss": -6.590368270874023, "global_step": 121270, "epoch": 2887} {"train_loss": -6.565824508666992, "global_step": 121271, "epoch": 2887} {"train_loss": -6.447356224060059, "global_step": 121272, "epoch": 2887} {"train_loss": -6.611625671386719, "global_step": 121273, "epoch": 2887} {"train_loss": -6.659844875335693, "global_step": 121274, "epoch": 2887} {"train_loss": -6.539312362670898, "global_step": 121275, "epoch": 2887} {"train_loss": -6.6437087059021, "global_step": 121276, "epoch": 2887} {"train_loss": -6.594232082366943, "global_step": 121277, "epoch": 2887} {"train_loss": -6.60075569152832, "global_step": 121278, "epoch": 2887} {"train_loss": -6.609785556793213, "global_step": 121279, "epoch": 2887} {"train_loss": -6.709346771240234, "global_step": 121280, "epoch": 2887} {"train_loss": -6.629726886749268, "global_step": 121281, "epoch": 2887} {"train_loss": -6.571835517883301, "global_step": 121282, "epoch": 2887} {"train_loss": -6.670191287994385, "global_step": 121283, "epoch": 2887} {"train_loss": -6.60310697555542, "global_step": 121284, "epoch": 2887} {"train_loss": -6.603357315063477, "global_step": 121285, "epoch": 2887} {"train_loss": -6.692495346069336, "global_step": 121286, "epoch": 2887} {"train_loss": -6.620777130126953, "global_step": 121287, "epoch": 2887} {"train_loss": -6.675251483917236, "global_step": 121288, "epoch": 2887} {"train_loss": -6.625743389129639, "global_step": 121289, "epoch": 2887} {"train_loss": -6.6006059646606445, "global_step": 121290, "epoch": 2887} {"train_loss": -6.539848327636719, "global_step": 121291, "epoch": 2887} {"train_loss": -6.5166215896606445, "global_step": 121292, "epoch": 2887} {"train_loss": -6.656173229217529, "global_step": 121293, "epoch": 2887} {"train_loss": -6.644635200500488, "global_step": 121294, "epoch": 2887} {"train_loss": -6.593073084240868, "global_step": 121295, "epoch": 2887, "val_loss": 66111.3359375} {"train_loss": -6.573210716247559, "global_step": 121296, "epoch": 2888} {"train_loss": -6.5225934982299805, "global_step": 121297, "epoch": 2888} {"train_loss": -6.700519561767578, "global_step": 121298, "epoch": 2888} {"train_loss": -6.517455577850342, "global_step": 121299, "epoch": 2888} {"train_loss": -6.49683952331543, "global_step": 121300, "epoch": 2888} {"train_loss": -6.572558879852295, "global_step": 121301, "epoch": 2888} {"train_loss": -6.513529300689697, "global_step": 121302, "epoch": 2888} {"train_loss": -6.43820333480835, "global_step": 121303, "epoch": 2888} {"train_loss": -6.592104434967041, "global_step": 121304, "epoch": 2888} {"train_loss": -6.561159610748291, "global_step": 121305, "epoch": 2888} {"train_loss": -6.583968162536621, "global_step": 121306, "epoch": 2888} {"train_loss": -6.649356842041016, "global_step": 121307, "epoch": 2888} {"train_loss": -6.628529071807861, "global_step": 121308, "epoch": 2888} {"train_loss": -6.6118316650390625, "global_step": 121309, "epoch": 2888} {"train_loss": -6.601108074188232, "global_step": 121310, "epoch": 2888} {"train_loss": -6.582380771636963, "global_step": 121311, "epoch": 2888} {"train_loss": -6.634743690490723, "global_step": 121312, "epoch": 2888} {"train_loss": -6.579582214355469, "global_step": 121313, "epoch": 2888} {"train_loss": -6.741120338439941, "global_step": 121314, "epoch": 2888} {"train_loss": -6.619085311889648, "global_step": 121315, "epoch": 2888} {"train_loss": -6.709711074829102, "global_step": 121316, "epoch": 2888} {"train_loss": -6.574878215789795, "global_step": 121317, "epoch": 2888} {"train_loss": -6.573217391967773, "global_step": 121318, "epoch": 2888} {"train_loss": -6.696104049682617, "global_step": 121319, "epoch": 2888} {"train_loss": -6.684509754180908, "global_step": 121320, "epoch": 2888} {"train_loss": -6.578822135925293, "global_step": 121321, "epoch": 2888} {"train_loss": -6.6479315757751465, "global_step": 121322, "epoch": 2888} {"train_loss": -6.6186747550964355, "global_step": 121323, "epoch": 2888} {"train_loss": -6.599034309387207, "global_step": 121324, "epoch": 2888} {"train_loss": -6.621633529663086, "global_step": 121325, "epoch": 2888} {"train_loss": -6.598484992980957, "global_step": 121326, "epoch": 2888} {"train_loss": -6.599822044372559, "global_step": 121327, "epoch": 2888} {"train_loss": -6.671593189239502, "global_step": 121328, "epoch": 2888} {"train_loss": -6.642205715179443, "global_step": 121329, "epoch": 2888} {"train_loss": -6.546944618225098, "global_step": 121330, "epoch": 2888} {"train_loss": -6.653088092803955, "global_step": 121331, "epoch": 2888} {"train_loss": -6.595062255859375, "global_step": 121332, "epoch": 2888} {"train_loss": -6.592988967895508, "global_step": 121333, "epoch": 2888} {"train_loss": -6.494372367858887, "global_step": 121334, "epoch": 2888} {"train_loss": -6.616972923278809, "global_step": 121335, "epoch": 2888} {"train_loss": -6.467791557312012, "global_step": 121336, "epoch": 2888} {"train_loss": -6.594322749546596, "global_step": 121337, "epoch": 2888, "val_loss": 66007.7421875} {"train_loss": -6.513556957244873, "global_step": 121338, "epoch": 2889} {"train_loss": -6.436625003814697, "global_step": 121339, "epoch": 2889} {"train_loss": -6.603404521942139, "global_step": 121340, "epoch": 2889} {"train_loss": -6.555373191833496, "global_step": 121341, "epoch": 2889} {"train_loss": -6.531021595001221, "global_step": 121342, "epoch": 2889} {"train_loss": -6.458219528198242, "global_step": 121343, "epoch": 2889} {"train_loss": -6.46024227142334, "global_step": 121344, "epoch": 2889} {"train_loss": -6.580947399139404, "global_step": 121345, "epoch": 2889} {"train_loss": -6.462268829345703, "global_step": 121346, "epoch": 2889} {"train_loss": -6.499945640563965, "global_step": 121347, "epoch": 2889} {"train_loss": -6.532140254974365, "global_step": 121348, "epoch": 2889} {"train_loss": -6.557826042175293, "global_step": 121349, "epoch": 2889} {"train_loss": -6.545432090759277, "global_step": 121350, "epoch": 2889} {"train_loss": -6.598525047302246, "global_step": 121351, "epoch": 2889} {"train_loss": -6.5284342765808105, "global_step": 121352, "epoch": 2889} {"train_loss": -6.450427055358887, "global_step": 121353, "epoch": 2889} {"train_loss": -6.523960590362549, "global_step": 121354, "epoch": 2889} {"train_loss": -6.498112678527832, "global_step": 121355, "epoch": 2889} {"train_loss": -6.546420097351074, "global_step": 121356, "epoch": 2889} {"train_loss": -6.626395225524902, "global_step": 121357, "epoch": 2889} {"train_loss": -6.550329208374023, "global_step": 121358, "epoch": 2889} {"train_loss": -6.538461685180664, "global_step": 121359, "epoch": 2889} {"train_loss": -6.713904857635498, "global_step": 121360, "epoch": 2889} {"train_loss": -6.542400360107422, "global_step": 121361, "epoch": 2889} {"train_loss": -6.5317063331604, "global_step": 121362, "epoch": 2889} {"train_loss": -6.6217851638793945, "global_step": 121363, "epoch": 2889} {"train_loss": -6.631193161010742, "global_step": 121364, "epoch": 2889} {"train_loss": -6.579774379730225, "global_step": 121365, "epoch": 2889} {"train_loss": -6.586546421051025, "global_step": 121366, "epoch": 2889} {"train_loss": -6.529816627502441, "global_step": 121367, "epoch": 2889} {"train_loss": -6.6204681396484375, "global_step": 121368, "epoch": 2889} {"train_loss": -6.549201011657715, "global_step": 121369, "epoch": 2889} {"train_loss": -6.502955436706543, "global_step": 121370, "epoch": 2889} {"train_loss": -6.608253479003906, "global_step": 121371, "epoch": 2889} {"train_loss": -6.455103397369385, "global_step": 121372, "epoch": 2889} {"train_loss": -6.560837745666504, "global_step": 121373, "epoch": 2889} {"train_loss": -6.6087646484375, "global_step": 121374, "epoch": 2889} {"train_loss": -6.43636417388916, "global_step": 121375, "epoch": 2889} {"train_loss": -6.5503058433532715, "global_step": 121376, "epoch": 2889} {"train_loss": -6.600625514984131, "global_step": 121377, "epoch": 2889} {"train_loss": -6.5421342849731445, "global_step": 121378, "epoch": 2889} {"train_loss": -6.546696174712408, "global_step": 121379, "epoch": 2889, "val_loss": 65899.0234375} {"train_loss": -6.550914764404297, "global_step": 121380, "epoch": 2890} {"train_loss": -6.553318977355957, "global_step": 121381, "epoch": 2890} {"train_loss": -6.596185684204102, "global_step": 121382, "epoch": 2890} {"train_loss": -6.620959758758545, "global_step": 121383, "epoch": 2890} {"train_loss": -6.535057067871094, "global_step": 121384, "epoch": 2890} {"train_loss": -6.682406425476074, "global_step": 121385, "epoch": 2890} {"train_loss": -6.538239479064941, "global_step": 121386, "epoch": 2890} {"train_loss": -6.512645244598389, "global_step": 121387, "epoch": 2890} {"train_loss": -6.582004547119141, "global_step": 121388, "epoch": 2890} {"train_loss": -6.588113307952881, "global_step": 121389, "epoch": 2890} {"train_loss": -6.573812961578369, "global_step": 121390, "epoch": 2890} {"train_loss": -6.566131591796875, "global_step": 121391, "epoch": 2890} {"train_loss": -6.46146297454834, "global_step": 121392, "epoch": 2890} {"train_loss": -6.50353479385376, "global_step": 121393, "epoch": 2890} {"train_loss": -6.542304992675781, "global_step": 121394, "epoch": 2890} {"train_loss": -6.545434951782227, "global_step": 121395, "epoch": 2890} {"train_loss": -6.449242115020752, "global_step": 121396, "epoch": 2890} {"train_loss": -6.608715057373047, "global_step": 121397, "epoch": 2890} {"train_loss": -6.613790035247803, "global_step": 121398, "epoch": 2890} {"train_loss": -6.512271881103516, "global_step": 121399, "epoch": 2890} {"train_loss": -6.605607986450195, "global_step": 121400, "epoch": 2890} {"train_loss": -6.5204854011535645, "global_step": 121401, "epoch": 2890} {"train_loss": -6.474769592285156, "global_step": 121402, "epoch": 2890} {"train_loss": -6.522489547729492, "global_step": 121403, "epoch": 2890} {"train_loss": -6.50114631652832, "global_step": 121404, "epoch": 2890} {"train_loss": -6.6347784996032715, "global_step": 121405, "epoch": 2890} {"train_loss": -6.524938583374023, "global_step": 121406, "epoch": 2890} {"train_loss": -6.410093784332275, "global_step": 121407, "epoch": 2890} {"train_loss": -6.660487174987793, "global_step": 121408, "epoch": 2890} {"train_loss": -6.497540473937988, "global_step": 121409, "epoch": 2890} {"train_loss": -6.483162879943848, "global_step": 121410, "epoch": 2890} {"train_loss": -6.503769874572754, "global_step": 121411, "epoch": 2890} {"train_loss": -6.4502387046813965, "global_step": 121412, "epoch": 2890} {"train_loss": -6.607687950134277, "global_step": 121413, "epoch": 2890} {"train_loss": -6.426560401916504, "global_step": 121414, "epoch": 2890} {"train_loss": -6.5234479904174805, "global_step": 121415, "epoch": 2890} {"train_loss": -6.541977882385254, "global_step": 121416, "epoch": 2890} {"train_loss": -6.621124744415283, "global_step": 121417, "epoch": 2890} {"train_loss": -6.587625026702881, "global_step": 121418, "epoch": 2890} {"train_loss": -6.564947128295898, "global_step": 121419, "epoch": 2890} {"train_loss": -6.567204475402832, "global_step": 121420, "epoch": 2890} {"train_loss": -6.544213226863316, "global_step": 121421, "epoch": 2890, "val_loss": 65843.0078125} {"train_loss": -6.459506034851074, "global_step": 121422, "epoch": 2891} {"train_loss": -6.615258693695068, "global_step": 121423, "epoch": 2891} {"train_loss": -6.416141510009766, "global_step": 121424, "epoch": 2891} {"train_loss": -6.582781791687012, "global_step": 121425, "epoch": 2891} {"train_loss": -6.553720474243164, "global_step": 121426, "epoch": 2891} {"train_loss": -6.428849220275879, "global_step": 121427, "epoch": 2891} {"train_loss": -6.576519966125488, "global_step": 121428, "epoch": 2891} {"train_loss": -6.581472396850586, "global_step": 121429, "epoch": 2891} {"train_loss": -6.610574245452881, "global_step": 121430, "epoch": 2891} {"train_loss": -6.458179473876953, "global_step": 121431, "epoch": 2891} {"train_loss": -6.588587760925293, "global_step": 121432, "epoch": 2891} {"train_loss": -6.3878865242004395, "global_step": 121433, "epoch": 2891} {"train_loss": -6.62212610244751, "global_step": 121434, "epoch": 2891} {"train_loss": -6.49501895904541, "global_step": 121435, "epoch": 2891} {"train_loss": -6.469518661499023, "global_step": 121436, "epoch": 2891} {"train_loss": -6.5789947509765625, "global_step": 121437, "epoch": 2891} {"train_loss": -6.423215389251709, "global_step": 121438, "epoch": 2891} {"train_loss": -6.588968753814697, "global_step": 121439, "epoch": 2891} {"train_loss": -6.489445686340332, "global_step": 121440, "epoch": 2891} {"train_loss": -6.497492790222168, "global_step": 121441, "epoch": 2891} {"train_loss": -6.524107933044434, "global_step": 121442, "epoch": 2891} {"train_loss": -6.6047797203063965, "global_step": 121443, "epoch": 2891} {"train_loss": -6.56978702545166, "global_step": 121444, "epoch": 2891} {"train_loss": -6.664985656738281, "global_step": 121445, "epoch": 2891} {"train_loss": -6.533413887023926, "global_step": 121446, "epoch": 2891} {"train_loss": -6.6554765701293945, "global_step": 121447, "epoch": 2891} {"train_loss": -6.535478115081787, "global_step": 121448, "epoch": 2891} {"train_loss": -6.607728004455566, "global_step": 121449, "epoch": 2891} {"train_loss": -6.664434432983398, "global_step": 121450, "epoch": 2891} {"train_loss": -6.516718864440918, "global_step": 121451, "epoch": 2891} {"train_loss": -6.5220794677734375, "global_step": 121452, "epoch": 2891} {"train_loss": -6.534753799438477, "global_step": 121453, "epoch": 2891} {"train_loss": -6.578338623046875, "global_step": 121454, "epoch": 2891} {"train_loss": -6.637777805328369, "global_step": 121455, "epoch": 2891} {"train_loss": -6.636913299560547, "global_step": 121456, "epoch": 2891} {"train_loss": -6.581220626831055, "global_step": 121457, "epoch": 2891} {"train_loss": -6.692250728607178, "global_step": 121458, "epoch": 2891} {"train_loss": -6.550963401794434, "global_step": 121459, "epoch": 2891} {"train_loss": -6.560669898986816, "global_step": 121460, "epoch": 2891} {"train_loss": -6.610204219818115, "global_step": 121461, "epoch": 2891} {"train_loss": -6.603170871734619, "global_step": 121462, "epoch": 2891} {"train_loss": -6.5585354169209795, "global_step": 121463, "epoch": 2891, "val_loss": 65739.5390625} {"train_loss": -6.654315948486328, "global_step": 121464, "epoch": 2892} {"train_loss": -6.7080535888671875, "global_step": 121465, "epoch": 2892} {"train_loss": -6.695398807525635, "global_step": 121466, "epoch": 2892} {"train_loss": -6.624035835266113, "global_step": 121467, "epoch": 2892} {"train_loss": -6.5755085945129395, "global_step": 121468, "epoch": 2892} {"train_loss": -6.630464553833008, "global_step": 121469, "epoch": 2892} {"train_loss": -6.595086097717285, "global_step": 121470, "epoch": 2892} {"train_loss": -6.583582878112793, "global_step": 121471, "epoch": 2892} {"train_loss": -6.6617231369018555, "global_step": 121472, "epoch": 2892} {"train_loss": -6.606788635253906, "global_step": 121473, "epoch": 2892} {"train_loss": -6.5986785888671875, "global_step": 121474, "epoch": 2892} {"train_loss": -6.576613426208496, "global_step": 121475, "epoch": 2892} {"train_loss": -6.577261924743652, "global_step": 121476, "epoch": 2892} {"train_loss": -6.61171817779541, "global_step": 121477, "epoch": 2892} {"train_loss": -6.670236110687256, "global_step": 121478, "epoch": 2892} {"train_loss": -6.654980182647705, "global_step": 121479, "epoch": 2892} {"train_loss": -6.624737739562988, "global_step": 121480, "epoch": 2892} {"train_loss": -6.541074275970459, "global_step": 121481, "epoch": 2892} {"train_loss": -6.56071662902832, "global_step": 121482, "epoch": 2892} {"train_loss": -6.484938621520996, "global_step": 121483, "epoch": 2892} {"train_loss": -6.620961666107178, "global_step": 121484, "epoch": 2892} {"train_loss": -6.515381813049316, "global_step": 121485, "epoch": 2892} {"train_loss": -6.534088134765625, "global_step": 121486, "epoch": 2892} {"train_loss": -6.598416805267334, "global_step": 121487, "epoch": 2892} {"train_loss": -6.570160865783691, "global_step": 121488, "epoch": 2892} {"train_loss": -6.386336326599121, "global_step": 121489, "epoch": 2892} {"train_loss": -6.4437456130981445, "global_step": 121490, "epoch": 2892} {"train_loss": -6.528951168060303, "global_step": 121491, "epoch": 2892} {"train_loss": -6.456857681274414, "global_step": 121492, "epoch": 2892} {"train_loss": -6.5469069480896, "global_step": 121493, "epoch": 2892} {"train_loss": -6.555968284606934, "global_step": 121494, "epoch": 2892} {"train_loss": -6.502495288848877, "global_step": 121495, "epoch": 2892} {"train_loss": -6.544705867767334, "global_step": 121496, "epoch": 2892} {"train_loss": -6.579924583435059, "global_step": 121497, "epoch": 2892} {"train_loss": -6.53706169128418, "global_step": 121498, "epoch": 2892} {"train_loss": -6.502298355102539, "global_step": 121499, "epoch": 2892} {"train_loss": -6.5697174072265625, "global_step": 121500, "epoch": 2892} {"train_loss": -6.534628868103027, "global_step": 121501, "epoch": 2892} {"train_loss": -6.51964807510376, "global_step": 121502, "epoch": 2892} {"train_loss": -6.5762810707092285, "global_step": 121503, "epoch": 2892} {"train_loss": -6.630771636962891, "global_step": 121504, "epoch": 2892} {"train_loss": -6.573990731012254, "global_step": 121505, "epoch": 2892, "val_loss": 65870.3046875} {"train_loss": -6.562869071960449, "global_step": 121506, "epoch": 2893} {"train_loss": -6.609055519104004, "global_step": 121507, "epoch": 2893} {"train_loss": -6.603732109069824, "global_step": 121508, "epoch": 2893} {"train_loss": -6.574633598327637, "global_step": 121509, "epoch": 2893} {"train_loss": -6.634329319000244, "global_step": 121510, "epoch": 2893} {"train_loss": -6.534380912780762, "global_step": 121511, "epoch": 2893} {"train_loss": -6.503094673156738, "global_step": 121512, "epoch": 2893} {"train_loss": -6.534501075744629, "global_step": 121513, "epoch": 2893} {"train_loss": -6.654609680175781, "global_step": 121514, "epoch": 2893} {"train_loss": -6.57214879989624, "global_step": 121515, "epoch": 2893} {"train_loss": -6.599727153778076, "global_step": 121516, "epoch": 2893} {"train_loss": -6.501167297363281, "global_step": 121517, "epoch": 2893} {"train_loss": -6.653281211853027, "global_step": 121518, "epoch": 2893} {"train_loss": -6.6276350021362305, "global_step": 121519, "epoch": 2893} {"train_loss": -6.5390543937683105, "global_step": 121520, "epoch": 2893} {"train_loss": -6.63355827331543, "global_step": 121521, "epoch": 2893} {"train_loss": -6.49231481552124, "global_step": 121522, "epoch": 2893} {"train_loss": -6.694572448730469, "global_step": 121523, "epoch": 2893} {"train_loss": -6.683658599853516, "global_step": 121524, "epoch": 2893} {"train_loss": -6.564373970031738, "global_step": 121525, "epoch": 2893} {"train_loss": -6.72004508972168, "global_step": 121526, "epoch": 2893} {"train_loss": -6.5056657791137695, "global_step": 121527, "epoch": 2893} {"train_loss": -6.575912952423096, "global_step": 121528, "epoch": 2893} {"train_loss": -6.621917724609375, "global_step": 121529, "epoch": 2893} {"train_loss": -6.653511047363281, "global_step": 121530, "epoch": 2893} {"train_loss": -6.70444393157959, "global_step": 121531, "epoch": 2893} {"train_loss": -6.587774753570557, "global_step": 121532, "epoch": 2893} {"train_loss": -6.502906799316406, "global_step": 121533, "epoch": 2893} {"train_loss": -6.649916648864746, "global_step": 121534, "epoch": 2893} {"train_loss": -6.550228595733643, "global_step": 121535, "epoch": 2893} {"train_loss": -6.5106964111328125, "global_step": 121536, "epoch": 2893} {"train_loss": -6.588942050933838, "global_step": 121537, "epoch": 2893} {"train_loss": -6.579867362976074, "global_step": 121538, "epoch": 2893} {"train_loss": -6.51917839050293, "global_step": 121539, "epoch": 2893} {"train_loss": -6.688511848449707, "global_step": 121540, "epoch": 2893} {"train_loss": -6.668524742126465, "global_step": 121541, "epoch": 2893} {"train_loss": -6.599063873291016, "global_step": 121542, "epoch": 2893} {"train_loss": -6.512911319732666, "global_step": 121543, "epoch": 2893} {"train_loss": -6.631141185760498, "global_step": 121544, "epoch": 2893} {"train_loss": -6.531120777130127, "global_step": 121545, "epoch": 2893} {"train_loss": -6.538233757019043, "global_step": 121546, "epoch": 2893} {"train_loss": -6.59357704435076, "global_step": 121547, "epoch": 2893, "val_loss": 66080.6640625} {"train_loss": -6.577169895172119, "global_step": 121548, "epoch": 2894} {"train_loss": -6.435069561004639, "global_step": 121549, "epoch": 2894} {"train_loss": -6.633479118347168, "global_step": 121550, "epoch": 2894} {"train_loss": -6.468562126159668, "global_step": 121551, "epoch": 2894} {"train_loss": -6.664151668548584, "global_step": 121552, "epoch": 2894} {"train_loss": -6.4534430503845215, "global_step": 121553, "epoch": 2894} {"train_loss": -6.589766025543213, "global_step": 121554, "epoch": 2894} {"train_loss": -6.528188705444336, "global_step": 121555, "epoch": 2894} {"train_loss": -6.596138954162598, "global_step": 121556, "epoch": 2894} {"train_loss": -6.633090019226074, "global_step": 121557, "epoch": 2894} {"train_loss": -6.408663749694824, "global_step": 121558, "epoch": 2894} {"train_loss": -6.5359296798706055, "global_step": 121559, "epoch": 2894} {"train_loss": -6.51353645324707, "global_step": 121560, "epoch": 2894} {"train_loss": -6.528847694396973, "global_step": 121561, "epoch": 2894} {"train_loss": -6.534735679626465, "global_step": 121562, "epoch": 2894} {"train_loss": -6.510269641876221, "global_step": 121563, "epoch": 2894} {"train_loss": -6.6905059814453125, "global_step": 121564, "epoch": 2894} {"train_loss": -6.557997226715088, "global_step": 121565, "epoch": 2894} {"train_loss": -6.60743522644043, "global_step": 121566, "epoch": 2894} {"train_loss": -6.512959003448486, "global_step": 121567, "epoch": 2894} {"train_loss": -6.5923614501953125, "global_step": 121568, "epoch": 2894} {"train_loss": -6.603055000305176, "global_step": 121569, "epoch": 2894} {"train_loss": -6.524144172668457, "global_step": 121570, "epoch": 2894} {"train_loss": -6.4769182205200195, "global_step": 121571, "epoch": 2894} {"train_loss": -6.521063804626465, "global_step": 121572, "epoch": 2894} {"train_loss": -6.445641040802002, "global_step": 121573, "epoch": 2894} {"train_loss": -6.530138969421387, "global_step": 121574, "epoch": 2894} {"train_loss": -6.473830223083496, "global_step": 121575, "epoch": 2894} {"train_loss": -6.532961845397949, "global_step": 121576, "epoch": 2894} {"train_loss": -6.686319351196289, "global_step": 121577, "epoch": 2894} {"train_loss": -6.58706521987915, "global_step": 121578, "epoch": 2894} {"train_loss": -6.554081916809082, "global_step": 121579, "epoch": 2894} {"train_loss": -6.595949172973633, "global_step": 121580, "epoch": 2894} {"train_loss": -6.508059501647949, "global_step": 121581, "epoch": 2894} {"train_loss": -6.471774101257324, "global_step": 121582, "epoch": 2894} {"train_loss": -6.5910797119140625, "global_step": 121583, "epoch": 2894} {"train_loss": -6.548303604125977, "global_step": 121584, "epoch": 2894} {"train_loss": -6.6056342124938965, "global_step": 121585, "epoch": 2894} {"train_loss": -6.479798316955566, "global_step": 121586, "epoch": 2894} {"train_loss": -6.565456390380859, "global_step": 121587, "epoch": 2894} {"train_loss": -6.490894317626953, "global_step": 121588, "epoch": 2894} {"train_loss": -6.541714974812099, "global_step": 121589, "epoch": 2894, "val_loss": 66105.234375} {"train_loss": -6.558480262756348, "global_step": 121590, "epoch": 2895} {"train_loss": -6.518335342407227, "global_step": 121591, "epoch": 2895} {"train_loss": -6.621918201446533, "global_step": 121592, "epoch": 2895} {"train_loss": -6.543658256530762, "global_step": 121593, "epoch": 2895} {"train_loss": -6.537901878356934, "global_step": 121594, "epoch": 2895} {"train_loss": -6.592224597930908, "global_step": 121595, "epoch": 2895} {"train_loss": -6.526517868041992, "global_step": 121596, "epoch": 2895} {"train_loss": -6.581600666046143, "global_step": 121597, "epoch": 2895} {"train_loss": -6.596127033233643, "global_step": 121598, "epoch": 2895} {"train_loss": -6.6512346267700195, "global_step": 121599, "epoch": 2895} {"train_loss": -6.5421881675720215, "global_step": 121600, "epoch": 2895} {"train_loss": -6.553211212158203, "global_step": 121601, "epoch": 2895} {"train_loss": -6.609362602233887, "global_step": 121602, "epoch": 2895} {"train_loss": -6.576105117797852, "global_step": 121603, "epoch": 2895} {"train_loss": -6.708378791809082, "global_step": 121604, "epoch": 2895} {"train_loss": -6.458811283111572, "global_step": 121605, "epoch": 2895} {"train_loss": -6.7789201736450195, "global_step": 121606, "epoch": 2895} {"train_loss": -6.636153221130371, "global_step": 121607, "epoch": 2895} {"train_loss": -6.5046000480651855, "global_step": 121608, "epoch": 2895} {"train_loss": -6.703656196594238, "global_step": 121609, "epoch": 2895} {"train_loss": -6.501463413238525, "global_step": 121610, "epoch": 2895} {"train_loss": -6.4009294509887695, "global_step": 121611, "epoch": 2895} {"train_loss": -6.516946792602539, "global_step": 121612, "epoch": 2895} {"train_loss": -6.556873321533203, "global_step": 121613, "epoch": 2895} {"train_loss": -6.471311092376709, "global_step": 121614, "epoch": 2895} {"train_loss": -6.179120063781738, "global_step": 121615, "epoch": 2895} {"train_loss": -6.51266622543335, "global_step": 121616, "epoch": 2895} {"train_loss": -6.4716410636901855, "global_step": 121617, "epoch": 2895} {"train_loss": -6.381988048553467, "global_step": 121618, "epoch": 2895} {"train_loss": -6.543817520141602, "global_step": 121619, "epoch": 2895} {"train_loss": -6.4333295822143555, "global_step": 121620, "epoch": 2895} {"train_loss": -6.4955644607543945, "global_step": 121621, "epoch": 2895} {"train_loss": -6.384090423583984, "global_step": 121622, "epoch": 2895} {"train_loss": -6.595430374145508, "global_step": 121623, "epoch": 2895} {"train_loss": -6.454073905944824, "global_step": 121624, "epoch": 2895} {"train_loss": -6.469120979309082, "global_step": 121625, "epoch": 2895} {"train_loss": -6.557346343994141, "global_step": 121626, "epoch": 2895} {"train_loss": -6.535793304443359, "global_step": 121627, "epoch": 2895} {"train_loss": -6.513602256774902, "global_step": 121628, "epoch": 2895} {"train_loss": -6.690074920654297, "global_step": 121629, "epoch": 2895} {"train_loss": -6.594742774963379, "global_step": 121630, "epoch": 2895} {"train_loss": -6.540374903451829, "global_step": 121631, "epoch": 2895, "val_loss": 65813.3671875} {"train_loss": -6.603025436401367, "global_step": 121632, "epoch": 2896} {"train_loss": -6.616463661193848, "global_step": 121633, "epoch": 2896} {"train_loss": -6.595327854156494, "global_step": 121634, "epoch": 2896} {"train_loss": -6.550016403198242, "global_step": 121635, "epoch": 2896} {"train_loss": -6.47830867767334, "global_step": 121636, "epoch": 2896} {"train_loss": -6.637373447418213, "global_step": 121637, "epoch": 2896} {"train_loss": -6.574568271636963, "global_step": 121638, "epoch": 2896} {"train_loss": -6.527921676635742, "global_step": 121639, "epoch": 2896} {"train_loss": -6.59511661529541, "global_step": 121640, "epoch": 2896} {"train_loss": -6.6626176834106445, "global_step": 121641, "epoch": 2896} {"train_loss": -6.593568801879883, "global_step": 121642, "epoch": 2896} {"train_loss": -6.687026023864746, "global_step": 121643, "epoch": 2896} {"train_loss": -6.5853424072265625, "global_step": 121644, "epoch": 2896} {"train_loss": -6.539268493652344, "global_step": 121645, "epoch": 2896} {"train_loss": -6.630302429199219, "global_step": 121646, "epoch": 2896} {"train_loss": -6.606638431549072, "global_step": 121647, "epoch": 2896} {"train_loss": -6.665348529815674, "global_step": 121648, "epoch": 2896} {"train_loss": -6.494050025939941, "global_step": 121649, "epoch": 2896} {"train_loss": -6.515247344970703, "global_step": 121650, "epoch": 2896} {"train_loss": -6.501816749572754, "global_step": 121651, "epoch": 2896} {"train_loss": -6.497221946716309, "global_step": 121652, "epoch": 2896} {"train_loss": -6.412220001220703, "global_step": 121653, "epoch": 2896} {"train_loss": -6.55246639251709, "global_step": 121654, "epoch": 2896} {"train_loss": -6.5502119064331055, "global_step": 121655, "epoch": 2896} {"train_loss": -6.583769798278809, "global_step": 121656, "epoch": 2896} {"train_loss": -6.674685955047607, "global_step": 121657, "epoch": 2896} {"train_loss": -6.671280860900879, "global_step": 121658, "epoch": 2896} {"train_loss": -6.720938682556152, "global_step": 121659, "epoch": 2896} {"train_loss": -6.601715087890625, "global_step": 121660, "epoch": 2896} {"train_loss": -6.603179931640625, "global_step": 121661, "epoch": 2896} {"train_loss": -6.508904933929443, "global_step": 121662, "epoch": 2896} {"train_loss": -6.654700756072998, "global_step": 121663, "epoch": 2896} {"train_loss": -6.503998756408691, "global_step": 121664, "epoch": 2896} {"train_loss": -6.556161880493164, "global_step": 121665, "epoch": 2896} {"train_loss": -6.535697937011719, "global_step": 121666, "epoch": 2896} {"train_loss": -6.500560760498047, "global_step": 121667, "epoch": 2896} {"train_loss": -6.658951759338379, "global_step": 121668, "epoch": 2896} {"train_loss": -6.518049716949463, "global_step": 121669, "epoch": 2896} {"train_loss": -6.750362396240234, "global_step": 121670, "epoch": 2896} {"train_loss": -6.57023811340332, "global_step": 121671, "epoch": 2896} {"train_loss": -6.636177062988281, "global_step": 121672, "epoch": 2896} {"train_loss": -6.583509819848197, "global_step": 121673, "epoch": 2896, "val_loss": 65752.8984375} {"train_loss": -6.526588439941406, "global_step": 121674, "epoch": 2897} {"train_loss": -6.63790225982666, "global_step": 121675, "epoch": 2897} {"train_loss": -6.521232604980469, "global_step": 121676, "epoch": 2897} {"train_loss": -6.645123481750488, "global_step": 121677, "epoch": 2897} {"train_loss": -6.681027412414551, "global_step": 121678, "epoch": 2897} {"train_loss": -6.64116096496582, "global_step": 121679, "epoch": 2897} {"train_loss": -6.503502368927002, "global_step": 121680, "epoch": 2897} {"train_loss": -6.637506484985352, "global_step": 121681, "epoch": 2897} {"train_loss": -6.59815788269043, "global_step": 121682, "epoch": 2897} {"train_loss": -6.675518035888672, "global_step": 121683, "epoch": 2897} {"train_loss": -6.7196455001831055, "global_step": 121684, "epoch": 2897} {"train_loss": -6.555629730224609, "global_step": 121685, "epoch": 2897} {"train_loss": -6.625067710876465, "global_step": 121686, "epoch": 2897} {"train_loss": -6.555689334869385, "global_step": 121687, "epoch": 2897} {"train_loss": -6.591792106628418, "global_step": 121688, "epoch": 2897} {"train_loss": -6.641231536865234, "global_step": 121689, "epoch": 2897} {"train_loss": -6.626664161682129, "global_step": 121690, "epoch": 2897} {"train_loss": -6.559610843658447, "global_step": 121691, "epoch": 2897} {"train_loss": -6.6881866455078125, "global_step": 121692, "epoch": 2897} {"train_loss": -6.564215660095215, "global_step": 121693, "epoch": 2897} {"train_loss": -6.6505045890808105, "global_step": 121694, "epoch": 2897} {"train_loss": -6.753751754760742, "global_step": 121695, "epoch": 2897} {"train_loss": -6.6241679191589355, "global_step": 121696, "epoch": 2897} {"train_loss": -6.6398725509643555, "global_step": 121697, "epoch": 2897} {"train_loss": -6.50970458984375, "global_step": 121698, "epoch": 2897} {"train_loss": -6.608803749084473, "global_step": 121699, "epoch": 2897} {"train_loss": -6.448289394378662, "global_step": 121700, "epoch": 2897} {"train_loss": -6.577807426452637, "global_step": 121701, "epoch": 2897} {"train_loss": -6.689806938171387, "global_step": 121702, "epoch": 2897} {"train_loss": -6.53395938873291, "global_step": 121703, "epoch": 2897} {"train_loss": -6.539422988891602, "global_step": 121704, "epoch": 2897} {"train_loss": -6.534963607788086, "global_step": 121705, "epoch": 2897} {"train_loss": -6.296899795532227, "global_step": 121706, "epoch": 2897} {"train_loss": -6.567577838897705, "global_step": 121707, "epoch": 2897} {"train_loss": -6.52501106262207, "global_step": 121708, "epoch": 2897} {"train_loss": -6.4284772872924805, "global_step": 121709, "epoch": 2897} {"train_loss": -6.490780353546143, "global_step": 121710, "epoch": 2897} {"train_loss": -6.3426055908203125, "global_step": 121711, "epoch": 2897} {"train_loss": -6.543795585632324, "global_step": 121712, "epoch": 2897} {"train_loss": -6.420169830322266, "global_step": 121713, "epoch": 2897} {"train_loss": -6.440502643585205, "global_step": 121714, "epoch": 2897} {"train_loss": -6.567475455147879, "global_step": 121715, "epoch": 2897, "val_loss": 66036.71875} {"train_loss": -6.521160125732422, "global_step": 121716, "epoch": 2898} {"train_loss": -6.57246208190918, "global_step": 121717, "epoch": 2898} {"train_loss": -6.380342960357666, "global_step": 121718, "epoch": 2898} {"train_loss": -6.5200653076171875, "global_step": 121719, "epoch": 2898} {"train_loss": -6.491568565368652, "global_step": 121720, "epoch": 2898} {"train_loss": -6.582634925842285, "global_step": 121721, "epoch": 2898} {"train_loss": -6.519857406616211, "global_step": 121722, "epoch": 2898} {"train_loss": -6.6347808837890625, "global_step": 121723, "epoch": 2898} {"train_loss": -6.508658409118652, "global_step": 121724, "epoch": 2898} {"train_loss": -6.584630012512207, "global_step": 121725, "epoch": 2898} {"train_loss": -6.504910469055176, "global_step": 121726, "epoch": 2898} {"train_loss": -6.489421844482422, "global_step": 121727, "epoch": 2898} {"train_loss": -6.541595458984375, "global_step": 121728, "epoch": 2898} {"train_loss": -6.52829647064209, "global_step": 121729, "epoch": 2898} {"train_loss": -6.468958854675293, "global_step": 121730, "epoch": 2898} {"train_loss": -6.539834976196289, "global_step": 121731, "epoch": 2898} {"train_loss": -6.575656414031982, "global_step": 121732, "epoch": 2898} {"train_loss": -6.443611145019531, "global_step": 121733, "epoch": 2898} {"train_loss": -6.567836761474609, "global_step": 121734, "epoch": 2898} {"train_loss": -6.461629867553711, "global_step": 121735, "epoch": 2898} {"train_loss": -6.543055534362793, "global_step": 121736, "epoch": 2898} {"train_loss": -6.639379501342773, "global_step": 121737, "epoch": 2898} {"train_loss": -6.362465858459473, "global_step": 121738, "epoch": 2898} {"train_loss": -6.646556377410889, "global_step": 121739, "epoch": 2898} {"train_loss": -6.45161771774292, "global_step": 121740, "epoch": 2898} {"train_loss": -6.4986371994018555, "global_step": 121741, "epoch": 2898} {"train_loss": -6.571887493133545, "global_step": 121742, "epoch": 2898} {"train_loss": -6.470194339752197, "global_step": 121743, "epoch": 2898} {"train_loss": -6.513710021972656, "global_step": 121744, "epoch": 2898} {"train_loss": -6.5171332359313965, "global_step": 121745, "epoch": 2898} {"train_loss": -6.529022693634033, "global_step": 121746, "epoch": 2898} {"train_loss": -6.591002464294434, "global_step": 121747, "epoch": 2898} {"train_loss": -6.5168538093566895, "global_step": 121748, "epoch": 2898} {"train_loss": -6.649774074554443, "global_step": 121749, "epoch": 2898} {"train_loss": -6.483634948730469, "global_step": 121750, "epoch": 2898} {"train_loss": -6.444278717041016, "global_step": 121751, "epoch": 2898} {"train_loss": -6.524923324584961, "global_step": 121752, "epoch": 2898} {"train_loss": -6.540745735168457, "global_step": 121753, "epoch": 2898} {"train_loss": -6.515480995178223, "global_step": 121754, "epoch": 2898} {"train_loss": -6.545495986938477, "global_step": 121755, "epoch": 2898} {"train_loss": -6.578082084655762, "global_step": 121756, "epoch": 2898} {"train_loss": -6.523667653401692, "global_step": 121757, "epoch": 2898, "val_loss": 65901.3359375} {"train_loss": -6.610481262207031, "global_step": 121758, "epoch": 2899} {"train_loss": -6.515635967254639, "global_step": 121759, "epoch": 2899} {"train_loss": -6.51206111907959, "global_step": 121760, "epoch": 2899} {"train_loss": -6.509729385375977, "global_step": 121761, "epoch": 2899} {"train_loss": -6.538135528564453, "global_step": 121762, "epoch": 2899} {"train_loss": -6.496829986572266, "global_step": 121763, "epoch": 2899} {"train_loss": -6.475314617156982, "global_step": 121764, "epoch": 2899} {"train_loss": -6.604379177093506, "global_step": 121765, "epoch": 2899} {"train_loss": -6.555819511413574, "global_step": 121766, "epoch": 2899} {"train_loss": -6.585583209991455, "global_step": 121767, "epoch": 2899} {"train_loss": -6.535696029663086, "global_step": 121768, "epoch": 2899} {"train_loss": -6.618025779724121, "global_step": 121769, "epoch": 2899} {"train_loss": -6.686007499694824, "global_step": 121770, "epoch": 2899} {"train_loss": -6.650468826293945, "global_step": 121771, "epoch": 2899} {"train_loss": -6.529613971710205, "global_step": 121772, "epoch": 2899} {"train_loss": -6.607302665710449, "global_step": 121773, "epoch": 2899} {"train_loss": -6.598318576812744, "global_step": 121774, "epoch": 2899} {"train_loss": -6.719770908355713, "global_step": 121775, "epoch": 2899} {"train_loss": -6.499690055847168, "global_step": 121776, "epoch": 2899} {"train_loss": -6.540945053100586, "global_step": 121777, "epoch": 2899} {"train_loss": -6.5284295082092285, "global_step": 121778, "epoch": 2899} {"train_loss": -6.649442195892334, "global_step": 121779, "epoch": 2899} {"train_loss": -6.577908515930176, "global_step": 121780, "epoch": 2899} {"train_loss": -6.589366912841797, "global_step": 121781, "epoch": 2899} {"train_loss": -6.652457237243652, "global_step": 121782, "epoch": 2899} {"train_loss": -6.718125343322754, "global_step": 121783, "epoch": 2899} {"train_loss": -6.534398078918457, "global_step": 121784, "epoch": 2899} {"train_loss": -6.5281758308410645, "global_step": 121785, "epoch": 2899} {"train_loss": -6.560559272766113, "global_step": 121786, "epoch": 2899} {"train_loss": -6.578522682189941, "global_step": 121787, "epoch": 2899} {"train_loss": -6.544286727905273, "global_step": 121788, "epoch": 2899} {"train_loss": -6.553070545196533, "global_step": 121789, "epoch": 2899} {"train_loss": -6.653206825256348, "global_step": 121790, "epoch": 2899} {"train_loss": -6.648677349090576, "global_step": 121791, "epoch": 2899} {"train_loss": -6.636899948120117, "global_step": 121792, "epoch": 2899} {"train_loss": -6.546293258666992, "global_step": 121793, "epoch": 2899} {"train_loss": -6.737117767333984, "global_step": 121794, "epoch": 2899} {"train_loss": -6.424548149108887, "global_step": 121795, "epoch": 2899} {"train_loss": -6.572405815124512, "global_step": 121796, "epoch": 2899} {"train_loss": -6.683035850524902, "global_step": 121797, "epoch": 2899} {"train_loss": -6.64237117767334, "global_step": 121798, "epoch": 2899} {"train_loss": -6.584693329674857, "global_step": 121799, "epoch": 2899, "val_loss": 65973.765625} {"train_loss": -6.6010050773620605, "global_step": 121800, "epoch": 2900} {"train_loss": -6.540287017822266, "global_step": 121801, "epoch": 2900} {"train_loss": -6.710442543029785, "global_step": 121802, "epoch": 2900} {"train_loss": -6.567695140838623, "global_step": 121803, "epoch": 2900} {"train_loss": -6.5529255867004395, "global_step": 121804, "epoch": 2900} {"train_loss": -6.538432598114014, "global_step": 121805, "epoch": 2900} {"train_loss": -6.579322338104248, "global_step": 121806, "epoch": 2900} {"train_loss": -6.60062313079834, "global_step": 121807, "epoch": 2900} {"train_loss": -6.5704665184021, "global_step": 121808, "epoch": 2900} {"train_loss": -6.644302845001221, "global_step": 121809, "epoch": 2900} {"train_loss": -6.6836256980896, "global_step": 121810, "epoch": 2900} {"train_loss": -6.5992279052734375, "global_step": 121811, "epoch": 2900} {"train_loss": -6.603377342224121, "global_step": 121812, "epoch": 2900} {"train_loss": -6.588135719299316, "global_step": 121813, "epoch": 2900} {"train_loss": -6.623574256896973, "global_step": 121814, "epoch": 2900} {"train_loss": -6.560855388641357, "global_step": 121815, "epoch": 2900} {"train_loss": -6.593997001647949, "global_step": 121816, "epoch": 2900} {"train_loss": -6.611591815948486, "global_step": 121817, "epoch": 2900} {"train_loss": -6.586565017700195, "global_step": 121818, "epoch": 2900} {"train_loss": -6.602005958557129, "global_step": 121819, "epoch": 2900} {"train_loss": -6.580267906188965, "global_step": 121820, "epoch": 2900} {"train_loss": -6.639005661010742, "global_step": 121821, "epoch": 2900} {"train_loss": -6.573514461517334, "global_step": 121822, "epoch": 2900} {"train_loss": -6.5537614822387695, "global_step": 121823, "epoch": 2900} {"train_loss": -6.643765926361084, "global_step": 121824, "epoch": 2900} {"train_loss": -6.6417670249938965, "global_step": 121825, "epoch": 2900} {"train_loss": -6.622906684875488, "global_step": 121826, "epoch": 2900} {"train_loss": -6.506490230560303, "global_step": 121827, "epoch": 2900} {"train_loss": -6.666234493255615, "global_step": 121828, "epoch": 2900} {"train_loss": -6.600244522094727, "global_step": 121829, "epoch": 2900} {"train_loss": -6.621280670166016, "global_step": 121830, "epoch": 2900} {"train_loss": -6.55987548828125, "global_step": 121831, "epoch": 2900} {"train_loss": -6.611205101013184, "global_step": 121832, "epoch": 2900} {"train_loss": -6.495935440063477, "global_step": 121833, "epoch": 2900} {"train_loss": -6.653258800506592, "global_step": 121834, "epoch": 2900} {"train_loss": -6.789655685424805, "global_step": 121835, "epoch": 2900} {"train_loss": -6.634769439697266, "global_step": 121836, "epoch": 2900} {"train_loss": -6.5620269775390625, "global_step": 121837, "epoch": 2900} {"train_loss": -6.5796709060668945, "global_step": 121838, "epoch": 2900} {"train_loss": -6.746379852294922, "global_step": 121839, "epoch": 2900} {"train_loss": -6.552518367767334, "global_step": 121840, "epoch": 2900} {"train_loss": -6.6033387297675725, "global_step": 121841, "epoch": 2900, "train/sim_max_reward_0": 0.3835359219372086, "train/sim_max_reward_1": 0.9409944078640274, "train/sim_max_reward_2": 0.948537559557551, "train/sim_max_reward_3": 0.9098194170325674, "train/sim_max_reward_4": 0.9628709136082021, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.3931024863415075, "test/sim_max_reward_4300002": 0.787564270988923, "test/sim_max_reward_4300003": 0.9813128941424738, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8445551123696283, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.31856788977101047, "test/sim_max_reward_4300008": 0.8971830396881642, "test/sim_max_reward_4300009": 0.9813628016033612, "test/sim_max_reward_4300010": 0.15492326054637423, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.8937720835518838, "test/sim_max_reward_4300013": 0.9856132780614956, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.33992999906222054, "test/sim_max_reward_4300016": 0.8784205904702348, "test/sim_max_reward_4300017": 0.47949322040830206, "test/sim_max_reward_4300018": 0.4575663022264923, "test/sim_max_reward_4300019": 0.18593951600794872, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8884011056094714, "test/sim_max_reward_4300022": 0.2781242125506841, "test/sim_max_reward_4300023": 0.3301337043307974, "test/sim_max_reward_4300024": 0.3316400314450364, "test/sim_max_reward_4300025": 0.1664791928725336, "test/sim_max_reward_4300026": 0.09073288397678038, "test/sim_max_reward_4300027": 0.9451064371492159, "test/sim_max_reward_4300028": 1.0, "test/sim_max_reward_4300029": 0.00662709934444269, "test/sim_max_reward_4300030": 0.934469817291053, "test/sim_max_reward_4300031": 0.20585299844950575, "test/sim_max_reward_4300032": 0.92896621120646, "test/sim_max_reward_4300033": 0.5393484775187978, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.30310417815879914, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.850009851119975, "test/sim_max_reward_4300038": 0.892708934882676, "test/sim_max_reward_4300039": 0.8902908028919743, "test/sim_max_reward_4300040": 0.9249350361643464, "test/sim_max_reward_4300041": 0.974527897793248, "test/sim_max_reward_4300042": 0.717080230785131, "test/sim_max_reward_4300043": 0.16983639676788612, "test/sim_max_reward_4300044": 0.7555586427262948, "test/sim_max_reward_4300045": 0.990101637367929, "test/sim_max_reward_4300046": 0.9987684702435865, "test/sim_max_reward_4300047": 0.9219474832902441, "test/sim_max_reward_4300048": 0.0010062665215058821, "test/sim_max_reward_4300049": 0.12939670869634698, "train/mean_score": 0.7231238298936241, "test/mean_score": 0.5591897934953503, "val_loss": 65833.0546875} {"train_loss": -6.604233741760254, "global_step": 121842, "epoch": 2901} {"train_loss": -6.605199813842773, "global_step": 121843, "epoch": 2901} {"train_loss": -6.538976669311523, "global_step": 121844, "epoch": 2901} {"train_loss": -6.465780258178711, "global_step": 121845, "epoch": 2901} {"train_loss": -6.540126800537109, "global_step": 121846, "epoch": 2901} {"train_loss": -6.59431791305542, "global_step": 121847, "epoch": 2901} {"train_loss": -6.5345869064331055, "global_step": 121848, "epoch": 2901} {"train_loss": -6.566666603088379, "global_step": 121849, "epoch": 2901} {"train_loss": -6.475332260131836, "global_step": 121850, "epoch": 2901} {"train_loss": -6.486873626708984, "global_step": 121851, "epoch": 2901} {"train_loss": -6.582798957824707, "global_step": 121852, "epoch": 2901} {"train_loss": -6.6462860107421875, "global_step": 121853, "epoch": 2901} {"train_loss": -6.506213188171387, "global_step": 121854, "epoch": 2901} {"train_loss": -6.623709678649902, "global_step": 121855, "epoch": 2901} {"train_loss": -6.695396423339844, "global_step": 121856, "epoch": 2901} {"train_loss": -6.561061859130859, "global_step": 121857, "epoch": 2901} {"train_loss": -6.41886568069458, "global_step": 121858, "epoch": 2901} {"train_loss": -6.491722583770752, "global_step": 121859, "epoch": 2901} {"train_loss": -6.276451110839844, "global_step": 121860, "epoch": 2901} {"train_loss": -6.539087772369385, "global_step": 121861, "epoch": 2901} {"train_loss": -6.446659088134766, "global_step": 121862, "epoch": 2901} {"train_loss": -6.455986499786377, "global_step": 121863, "epoch": 2901} {"train_loss": -6.546897888183594, "global_step": 121864, "epoch": 2901} {"train_loss": -6.504606246948242, "global_step": 121865, "epoch": 2901} {"train_loss": -6.593994140625, "global_step": 121866, "epoch": 2901} {"train_loss": -6.437633514404297, "global_step": 121867, "epoch": 2901} {"train_loss": -6.66964054107666, "global_step": 121868, "epoch": 2901} {"train_loss": -6.487211227416992, "global_step": 121869, "epoch": 2901} {"train_loss": -6.464458465576172, "global_step": 121870, "epoch": 2901} {"train_loss": -6.521492958068848, "global_step": 121871, "epoch": 2901} {"train_loss": -6.463940620422363, "global_step": 121872, "epoch": 2901} {"train_loss": -6.640769958496094, "global_step": 121873, "epoch": 2901} {"train_loss": -6.446344375610352, "global_step": 121874, "epoch": 2901} {"train_loss": -6.639528751373291, "global_step": 121875, "epoch": 2901} {"train_loss": -6.558655738830566, "global_step": 121876, "epoch": 2901} {"train_loss": -6.514892578125, "global_step": 121877, "epoch": 2901} {"train_loss": -6.508787631988525, "global_step": 121878, "epoch": 2901} {"train_loss": -6.61722993850708, "global_step": 121879, "epoch": 2901} {"train_loss": -6.610710144042969, "global_step": 121880, "epoch": 2901} {"train_loss": -6.572801113128662, "global_step": 121881, "epoch": 2901} {"train_loss": -6.567322254180908, "global_step": 121882, "epoch": 2901} {"train_loss": -6.537541321345738, "global_step": 121883, "epoch": 2901, "val_loss": 65803.0390625} {"train_loss": -6.622420787811279, "global_step": 121884, "epoch": 2902} {"train_loss": -6.4910430908203125, "global_step": 121885, "epoch": 2902} {"train_loss": -6.5350341796875, "global_step": 121886, "epoch": 2902} {"train_loss": -6.6381144523620605, "global_step": 121887, "epoch": 2902} {"train_loss": -6.4779582023620605, "global_step": 121888, "epoch": 2902} {"train_loss": -6.803243160247803, "global_step": 121889, "epoch": 2902} {"train_loss": -6.738137245178223, "global_step": 121890, "epoch": 2902} {"train_loss": -6.592611312866211, "global_step": 121891, "epoch": 2902} {"train_loss": -6.569009780883789, "global_step": 121892, "epoch": 2902} {"train_loss": -6.5116472244262695, "global_step": 121893, "epoch": 2902} {"train_loss": -6.54679012298584, "global_step": 121894, "epoch": 2902} {"train_loss": -6.625044822692871, "global_step": 121895, "epoch": 2902} {"train_loss": -6.54970645904541, "global_step": 121896, "epoch": 2902} {"train_loss": -6.52347469329834, "global_step": 121897, "epoch": 2902} {"train_loss": -6.583870887756348, "global_step": 121898, "epoch": 2902} {"train_loss": -6.5641069412231445, "global_step": 121899, "epoch": 2902} {"train_loss": -6.556110382080078, "global_step": 121900, "epoch": 2902} {"train_loss": -6.6185197830200195, "global_step": 121901, "epoch": 2902} {"train_loss": -6.472454071044922, "global_step": 121902, "epoch": 2902} {"train_loss": -6.605679512023926, "global_step": 121903, "epoch": 2902} {"train_loss": -6.656345367431641, "global_step": 121904, "epoch": 2902} {"train_loss": -6.493047714233398, "global_step": 121905, "epoch": 2902} {"train_loss": -6.566884994506836, "global_step": 121906, "epoch": 2902} {"train_loss": -6.6680707931518555, "global_step": 121907, "epoch": 2902} {"train_loss": -6.691239356994629, "global_step": 121908, "epoch": 2902} {"train_loss": -6.609389305114746, "global_step": 121909, "epoch": 2902} {"train_loss": -6.5811767578125, "global_step": 121910, "epoch": 2902} {"train_loss": -6.588025093078613, "global_step": 121911, "epoch": 2902} {"train_loss": -6.633953094482422, "global_step": 121912, "epoch": 2902} {"train_loss": -6.674404621124268, "global_step": 121913, "epoch": 2902} {"train_loss": -6.514554977416992, "global_step": 121914, "epoch": 2902} {"train_loss": -6.617637634277344, "global_step": 121915, "epoch": 2902} {"train_loss": -6.6077985763549805, "global_step": 121916, "epoch": 2902} {"train_loss": -6.604938983917236, "global_step": 121917, "epoch": 2902} {"train_loss": -6.660403728485107, "global_step": 121918, "epoch": 2902} {"train_loss": -6.556421756744385, "global_step": 121919, "epoch": 2902} {"train_loss": -6.443765640258789, "global_step": 121920, "epoch": 2902} {"train_loss": -6.559666633605957, "global_step": 121921, "epoch": 2902} {"train_loss": -6.611157417297363, "global_step": 121922, "epoch": 2902} {"train_loss": -6.659423828125, "global_step": 121923, "epoch": 2902} {"train_loss": -6.5037641525268555, "global_step": 121924, "epoch": 2902} {"train_loss": -6.586464041755313, "global_step": 121925, "epoch": 2902, "val_loss": 66015.328125} {"train_loss": -6.559029579162598, "global_step": 121926, "epoch": 2903} {"train_loss": -6.416250705718994, "global_step": 121927, "epoch": 2903} {"train_loss": -6.575596809387207, "global_step": 121928, "epoch": 2903} {"train_loss": -6.474857807159424, "global_step": 121929, "epoch": 2903} {"train_loss": -6.572261810302734, "global_step": 121930, "epoch": 2903} {"train_loss": -6.545955657958984, "global_step": 121931, "epoch": 2903} {"train_loss": -6.571659088134766, "global_step": 121932, "epoch": 2903} {"train_loss": -6.623146057128906, "global_step": 121933, "epoch": 2903} {"train_loss": -6.549359321594238, "global_step": 121934, "epoch": 2903} {"train_loss": -6.5499396324157715, "global_step": 121935, "epoch": 2903} {"train_loss": -6.455262184143066, "global_step": 121936, "epoch": 2903} {"train_loss": -6.576832294464111, "global_step": 121937, "epoch": 2903} {"train_loss": -6.468483924865723, "global_step": 121938, "epoch": 2903} {"train_loss": -6.620084762573242, "global_step": 121939, "epoch": 2903} {"train_loss": -6.495330333709717, "global_step": 121940, "epoch": 2903} {"train_loss": -6.535483360290527, "global_step": 121941, "epoch": 2903} {"train_loss": -6.667367935180664, "global_step": 121942, "epoch": 2903} {"train_loss": -6.533164024353027, "global_step": 121943, "epoch": 2903} {"train_loss": -6.538843154907227, "global_step": 121944, "epoch": 2903} {"train_loss": -6.55230712890625, "global_step": 121945, "epoch": 2903} {"train_loss": -6.654263496398926, "global_step": 121946, "epoch": 2903} {"train_loss": -6.489893436431885, "global_step": 121947, "epoch": 2903} {"train_loss": -6.524587154388428, "global_step": 121948, "epoch": 2903} {"train_loss": -6.492219924926758, "global_step": 121949, "epoch": 2903} {"train_loss": -6.549731254577637, "global_step": 121950, "epoch": 2903} {"train_loss": -6.534459590911865, "global_step": 121951, "epoch": 2903} {"train_loss": -6.442874908447266, "global_step": 121952, "epoch": 2903} {"train_loss": -6.657770156860352, "global_step": 121953, "epoch": 2903} {"train_loss": -6.568643569946289, "global_step": 121954, "epoch": 2903} {"train_loss": -6.533496856689453, "global_step": 121955, "epoch": 2903} {"train_loss": -6.566347122192383, "global_step": 121956, "epoch": 2903} {"train_loss": -6.585270404815674, "global_step": 121957, "epoch": 2903} {"train_loss": -6.546706199645996, "global_step": 121958, "epoch": 2903} {"train_loss": -6.492300987243652, "global_step": 121959, "epoch": 2903} {"train_loss": -6.5807576179504395, "global_step": 121960, "epoch": 2903} {"train_loss": -6.487905502319336, "global_step": 121961, "epoch": 2903} {"train_loss": -6.586104393005371, "global_step": 121962, "epoch": 2903} {"train_loss": -6.622903823852539, "global_step": 121963, "epoch": 2903} {"train_loss": -6.652983665466309, "global_step": 121964, "epoch": 2903} {"train_loss": -6.58253288269043, "global_step": 121965, "epoch": 2903} {"train_loss": -6.547098159790039, "global_step": 121966, "epoch": 2903} {"train_loss": -6.55084152448745, "global_step": 121967, "epoch": 2903, "val_loss": 65747.1328125} {"train_loss": -6.507637977600098, "global_step": 121968, "epoch": 2904} {"train_loss": -6.579880714416504, "global_step": 121969, "epoch": 2904} {"train_loss": -6.566230297088623, "global_step": 121970, "epoch": 2904} {"train_loss": -6.532606601715088, "global_step": 121971, "epoch": 2904} {"train_loss": -6.699536323547363, "global_step": 121972, "epoch": 2904} {"train_loss": -6.532861709594727, "global_step": 121973, "epoch": 2904} {"train_loss": -6.466686248779297, "global_step": 121974, "epoch": 2904} {"train_loss": -6.538698196411133, "global_step": 121975, "epoch": 2904} {"train_loss": -6.515874862670898, "global_step": 121976, "epoch": 2904} {"train_loss": -6.602998733520508, "global_step": 121977, "epoch": 2904} {"train_loss": -6.501398086547852, "global_step": 121978, "epoch": 2904} {"train_loss": -6.534633636474609, "global_step": 121979, "epoch": 2904} {"train_loss": -6.5152788162231445, "global_step": 121980, "epoch": 2904} {"train_loss": -6.5425639152526855, "global_step": 121981, "epoch": 2904} {"train_loss": -6.582583427429199, "global_step": 121982, "epoch": 2904} {"train_loss": -6.634605884552002, "global_step": 121983, "epoch": 2904} {"train_loss": -6.562029838562012, "global_step": 121984, "epoch": 2904} {"train_loss": -6.631549835205078, "global_step": 121985, "epoch": 2904} {"train_loss": -6.6286301612854, "global_step": 121986, "epoch": 2904} {"train_loss": -6.583981513977051, "global_step": 121987, "epoch": 2904} {"train_loss": -6.475775718688965, "global_step": 121988, "epoch": 2904} {"train_loss": -6.655009746551514, "global_step": 121989, "epoch": 2904} {"train_loss": -6.629080295562744, "global_step": 121990, "epoch": 2904} {"train_loss": -6.64202880859375, "global_step": 121991, "epoch": 2904} {"train_loss": -6.654994964599609, "global_step": 121992, "epoch": 2904} {"train_loss": -6.582862854003906, "global_step": 121993, "epoch": 2904} {"train_loss": -6.569047451019287, "global_step": 121994, "epoch": 2904} {"train_loss": -6.577629566192627, "global_step": 121995, "epoch": 2904} {"train_loss": -6.6535491943359375, "global_step": 121996, "epoch": 2904} {"train_loss": -6.642228126525879, "global_step": 121997, "epoch": 2904} {"train_loss": -6.583913326263428, "global_step": 121998, "epoch": 2904} {"train_loss": -6.6978349685668945, "global_step": 121999, "epoch": 2904} {"train_loss": -6.581000328063965, "global_step": 122000, "epoch": 2904} {"train_loss": -6.526312351226807, "global_step": 122001, "epoch": 2904} {"train_loss": -6.620490550994873, "global_step": 122002, "epoch": 2904} {"train_loss": -6.597440719604492, "global_step": 122003, "epoch": 2904} {"train_loss": -6.67932653427124, "global_step": 122004, "epoch": 2904} {"train_loss": -6.582771301269531, "global_step": 122005, "epoch": 2904} {"train_loss": -6.532352447509766, "global_step": 122006, "epoch": 2904} {"train_loss": -6.544836044311523, "global_step": 122007, "epoch": 2904} {"train_loss": -6.640038013458252, "global_step": 122008, "epoch": 2904} {"train_loss": -6.584437983376639, "global_step": 122009, "epoch": 2904, "val_loss": 65849.09375} {"train_loss": -6.58298397064209, "global_step": 122010, "epoch": 2905} {"train_loss": -6.5329999923706055, "global_step": 122011, "epoch": 2905} {"train_loss": -6.635262489318848, "global_step": 122012, "epoch": 2905} {"train_loss": -6.473602294921875, "global_step": 122013, "epoch": 2905} {"train_loss": -6.638039588928223, "global_step": 122014, "epoch": 2905} {"train_loss": -6.653918266296387, "global_step": 122015, "epoch": 2905} {"train_loss": -6.576559066772461, "global_step": 122016, "epoch": 2905} {"train_loss": -6.466991424560547, "global_step": 122017, "epoch": 2905} {"train_loss": -6.518017768859863, "global_step": 122018, "epoch": 2905} {"train_loss": -6.556629180908203, "global_step": 122019, "epoch": 2905} {"train_loss": -6.566406726837158, "global_step": 122020, "epoch": 2905} {"train_loss": -6.7316131591796875, "global_step": 122021, "epoch": 2905} {"train_loss": -6.593681335449219, "global_step": 122022, "epoch": 2905} {"train_loss": -6.630434513092041, "global_step": 122023, "epoch": 2905} {"train_loss": -6.578919887542725, "global_step": 122024, "epoch": 2905} {"train_loss": -6.655829906463623, "global_step": 122025, "epoch": 2905} {"train_loss": -6.568488121032715, "global_step": 122026, "epoch": 2905} {"train_loss": -6.635709285736084, "global_step": 122027, "epoch": 2905} {"train_loss": -6.592034816741943, "global_step": 122028, "epoch": 2905} {"train_loss": -6.507105350494385, "global_step": 122029, "epoch": 2905} {"train_loss": -6.628451824188232, "global_step": 122030, "epoch": 2905} {"train_loss": -6.514660835266113, "global_step": 122031, "epoch": 2905} {"train_loss": -6.604779243469238, "global_step": 122032, "epoch": 2905} {"train_loss": -6.549310207366943, "global_step": 122033, "epoch": 2905} {"train_loss": -6.425020217895508, "global_step": 122034, "epoch": 2905} {"train_loss": -6.608280181884766, "global_step": 122035, "epoch": 2905} {"train_loss": -6.570508003234863, "global_step": 122036, "epoch": 2905} {"train_loss": -6.498398780822754, "global_step": 122037, "epoch": 2905} {"train_loss": -6.627248764038086, "global_step": 122038, "epoch": 2905} {"train_loss": -6.529975891113281, "global_step": 122039, "epoch": 2905} {"train_loss": -6.60988712310791, "global_step": 122040, "epoch": 2905} {"train_loss": -6.6399102210998535, "global_step": 122041, "epoch": 2905} {"train_loss": -6.599972248077393, "global_step": 122042, "epoch": 2905} {"train_loss": -6.52585506439209, "global_step": 122043, "epoch": 2905} {"train_loss": -6.639636993408203, "global_step": 122044, "epoch": 2905} {"train_loss": -6.527824401855469, "global_step": 122045, "epoch": 2905} {"train_loss": -6.48106575012207, "global_step": 122046, "epoch": 2905} {"train_loss": -6.586704254150391, "global_step": 122047, "epoch": 2905} {"train_loss": -6.715635299682617, "global_step": 122048, "epoch": 2905} {"train_loss": -6.457415580749512, "global_step": 122049, "epoch": 2905} {"train_loss": -6.588983535766602, "global_step": 122050, "epoch": 2905} {"train_loss": -6.576374825977144, "global_step": 122051, "epoch": 2905, "val_loss": 65688.6953125} {"train_loss": -6.536169528961182, "global_step": 122052, "epoch": 2906} {"train_loss": -6.556455612182617, "global_step": 122053, "epoch": 2906} {"train_loss": -6.510193824768066, "global_step": 122054, "epoch": 2906} {"train_loss": -6.586308002471924, "global_step": 122055, "epoch": 2906} {"train_loss": -6.549035549163818, "global_step": 122056, "epoch": 2906} {"train_loss": -6.622402191162109, "global_step": 122057, "epoch": 2906} {"train_loss": -6.730733871459961, "global_step": 122058, "epoch": 2906} {"train_loss": -6.568404674530029, "global_step": 122059, "epoch": 2906} {"train_loss": -6.608514785766602, "global_step": 122060, "epoch": 2906} {"train_loss": -6.557723045349121, "global_step": 122061, "epoch": 2906} {"train_loss": -6.605179786682129, "global_step": 122062, "epoch": 2906} {"train_loss": -6.633950710296631, "global_step": 122063, "epoch": 2906} {"train_loss": -6.570321083068848, "global_step": 122064, "epoch": 2906} {"train_loss": -6.683055400848389, "global_step": 122065, "epoch": 2906} {"train_loss": -6.576624393463135, "global_step": 122066, "epoch": 2906} {"train_loss": -6.504429817199707, "global_step": 122067, "epoch": 2906} {"train_loss": -6.645504474639893, "global_step": 122068, "epoch": 2906} {"train_loss": -6.7322468757629395, "global_step": 122069, "epoch": 2906} {"train_loss": -6.603634357452393, "global_step": 122070, "epoch": 2906} {"train_loss": -6.6673197746276855, "global_step": 122071, "epoch": 2906} {"train_loss": -6.547690391540527, "global_step": 122072, "epoch": 2906} {"train_loss": -6.629711627960205, "global_step": 122073, "epoch": 2906} {"train_loss": -6.637115478515625, "global_step": 122074, "epoch": 2906} {"train_loss": -6.672260284423828, "global_step": 122075, "epoch": 2906} {"train_loss": -6.65585994720459, "global_step": 122076, "epoch": 2906} {"train_loss": -6.654003143310547, "global_step": 122077, "epoch": 2906} {"train_loss": -6.616004943847656, "global_step": 122078, "epoch": 2906} {"train_loss": -6.677557945251465, "global_step": 122079, "epoch": 2906} {"train_loss": -6.645357131958008, "global_step": 122080, "epoch": 2906} {"train_loss": -6.528372764587402, "global_step": 122081, "epoch": 2906} {"train_loss": -6.518510341644287, "global_step": 122082, "epoch": 2906} {"train_loss": -6.670714378356934, "global_step": 122083, "epoch": 2906} {"train_loss": -6.419907569885254, "global_step": 122084, "epoch": 2906} {"train_loss": -6.650357246398926, "global_step": 122085, "epoch": 2906} {"train_loss": -6.654516220092773, "global_step": 122086, "epoch": 2906} {"train_loss": -6.525477409362793, "global_step": 122087, "epoch": 2906} {"train_loss": -6.67348575592041, "global_step": 122088, "epoch": 2906} {"train_loss": -6.4273681640625, "global_step": 122089, "epoch": 2906} {"train_loss": -6.680274963378906, "global_step": 122090, "epoch": 2906} {"train_loss": -6.585981369018555, "global_step": 122091, "epoch": 2906} {"train_loss": -6.4695611000061035, "global_step": 122092, "epoch": 2906} {"train_loss": -6.599206663313366, "global_step": 122093, "epoch": 2906, "val_loss": 65925.21875} {"train_loss": -6.587061405181885, "global_step": 122094, "epoch": 2907} {"train_loss": -6.623687744140625, "global_step": 122095, "epoch": 2907} {"train_loss": -6.615162372589111, "global_step": 122096, "epoch": 2907} {"train_loss": -6.652835845947266, "global_step": 122097, "epoch": 2907} {"train_loss": -6.633589744567871, "global_step": 122098, "epoch": 2907} {"train_loss": -6.593889236450195, "global_step": 122099, "epoch": 2907} {"train_loss": -6.559925079345703, "global_step": 122100, "epoch": 2907} {"train_loss": -6.674485683441162, "global_step": 122101, "epoch": 2907} {"train_loss": -6.525110244750977, "global_step": 122102, "epoch": 2907} {"train_loss": -6.479122638702393, "global_step": 122103, "epoch": 2907} {"train_loss": -6.641085624694824, "global_step": 122104, "epoch": 2907} {"train_loss": -6.695727348327637, "global_step": 122105, "epoch": 2907} {"train_loss": -6.705687522888184, "global_step": 122106, "epoch": 2907} {"train_loss": -6.688352584838867, "global_step": 122107, "epoch": 2907} {"train_loss": -6.649912357330322, "global_step": 122108, "epoch": 2907} {"train_loss": -6.550736427307129, "global_step": 122109, "epoch": 2907} {"train_loss": -6.717465877532959, "global_step": 122110, "epoch": 2907} {"train_loss": -6.488458633422852, "global_step": 122111, "epoch": 2907} {"train_loss": -6.639436721801758, "global_step": 122112, "epoch": 2907} {"train_loss": -6.637607574462891, "global_step": 122113, "epoch": 2907} {"train_loss": -6.630599021911621, "global_step": 122114, "epoch": 2907} {"train_loss": -6.723873615264893, "global_step": 122115, "epoch": 2907} {"train_loss": -6.677804470062256, "global_step": 122116, "epoch": 2907} {"train_loss": -6.562049865722656, "global_step": 122117, "epoch": 2907} {"train_loss": -6.529956817626953, "global_step": 122118, "epoch": 2907} {"train_loss": -6.638851165771484, "global_step": 122119, "epoch": 2907} {"train_loss": -6.662713527679443, "global_step": 122120, "epoch": 2907} {"train_loss": -6.441431999206543, "global_step": 122121, "epoch": 2907} {"train_loss": -6.58998966217041, "global_step": 122122, "epoch": 2907} {"train_loss": -6.429007530212402, "global_step": 122123, "epoch": 2907} {"train_loss": -6.5858941078186035, "global_step": 122124, "epoch": 2907} {"train_loss": -6.581202507019043, "global_step": 122125, "epoch": 2907} {"train_loss": -6.46881103515625, "global_step": 122126, "epoch": 2907} {"train_loss": -6.583344459533691, "global_step": 122127, "epoch": 2907} {"train_loss": -6.558370590209961, "global_step": 122128, "epoch": 2907} {"train_loss": -6.535202980041504, "global_step": 122129, "epoch": 2907} {"train_loss": -6.516056060791016, "global_step": 122130, "epoch": 2907} {"train_loss": -6.340948104858398, "global_step": 122131, "epoch": 2907} {"train_loss": -6.620584487915039, "global_step": 122132, "epoch": 2907} {"train_loss": -6.448995590209961, "global_step": 122133, "epoch": 2907} {"train_loss": -6.440839767456055, "global_step": 122134, "epoch": 2907} {"train_loss": -6.584695498148601, "global_step": 122135, "epoch": 2907, "val_loss": 66347.9921875} {"train_loss": -6.40484619140625, "global_step": 122136, "epoch": 2908} {"train_loss": -6.502437114715576, "global_step": 122137, "epoch": 2908} {"train_loss": -6.452791690826416, "global_step": 122138, "epoch": 2908} {"train_loss": -6.412284851074219, "global_step": 122139, "epoch": 2908} {"train_loss": -6.482935905456543, "global_step": 122140, "epoch": 2908} {"train_loss": -6.544615745544434, "global_step": 122141, "epoch": 2908} {"train_loss": -6.607820987701416, "global_step": 122142, "epoch": 2908} {"train_loss": -6.678153991699219, "global_step": 122143, "epoch": 2908} {"train_loss": -6.6769561767578125, "global_step": 122144, "epoch": 2908} {"train_loss": -6.542720794677734, "global_step": 122145, "epoch": 2908} {"train_loss": -6.556349754333496, "global_step": 122146, "epoch": 2908} {"train_loss": -6.590923309326172, "global_step": 122147, "epoch": 2908} {"train_loss": -6.556423664093018, "global_step": 122148, "epoch": 2908} {"train_loss": -6.561102867126465, "global_step": 122149, "epoch": 2908} {"train_loss": -6.764742851257324, "global_step": 122150, "epoch": 2908} {"train_loss": -6.654926300048828, "global_step": 122151, "epoch": 2908} {"train_loss": -6.683810234069824, "global_step": 122152, "epoch": 2908} {"train_loss": -6.600109100341797, "global_step": 122153, "epoch": 2908} {"train_loss": -6.758492469787598, "global_step": 122154, "epoch": 2908} {"train_loss": -6.675755500793457, "global_step": 122155, "epoch": 2908} {"train_loss": -6.68449592590332, "global_step": 122156, "epoch": 2908} {"train_loss": -6.600525856018066, "global_step": 122157, "epoch": 2908} {"train_loss": -6.547929763793945, "global_step": 122158, "epoch": 2908} {"train_loss": -6.647961616516113, "global_step": 122159, "epoch": 2908} {"train_loss": -6.576630592346191, "global_step": 122160, "epoch": 2908} {"train_loss": -6.615809440612793, "global_step": 122161, "epoch": 2908} {"train_loss": -6.606292724609375, "global_step": 122162, "epoch": 2908} {"train_loss": -6.57009220123291, "global_step": 122163, "epoch": 2908} {"train_loss": -6.626712322235107, "global_step": 122164, "epoch": 2908} {"train_loss": -6.679828643798828, "global_step": 122165, "epoch": 2908} {"train_loss": -6.719028472900391, "global_step": 122166, "epoch": 2908} {"train_loss": -6.589186668395996, "global_step": 122167, "epoch": 2908} {"train_loss": -6.5435872077941895, "global_step": 122168, "epoch": 2908} {"train_loss": -6.543713569641113, "global_step": 122169, "epoch": 2908} {"train_loss": -6.661043643951416, "global_step": 122170, "epoch": 2908} {"train_loss": -6.577055931091309, "global_step": 122171, "epoch": 2908} {"train_loss": -6.624838829040527, "global_step": 122172, "epoch": 2908} {"train_loss": -6.475653648376465, "global_step": 122173, "epoch": 2908} {"train_loss": -6.573901176452637, "global_step": 122174, "epoch": 2908} {"train_loss": -6.646904945373535, "global_step": 122175, "epoch": 2908} {"train_loss": -6.616405010223389, "global_step": 122176, "epoch": 2908} {"train_loss": -6.595382486070905, "global_step": 122177, "epoch": 2908, "val_loss": 65913.6953125} {"train_loss": -6.616607189178467, "global_step": 122178, "epoch": 2909} {"train_loss": -6.565701961517334, "global_step": 122179, "epoch": 2909} {"train_loss": -6.537505149841309, "global_step": 122180, "epoch": 2909} {"train_loss": -6.641222953796387, "global_step": 122181, "epoch": 2909} {"train_loss": -6.585237503051758, "global_step": 122182, "epoch": 2909} {"train_loss": -6.635763168334961, "global_step": 122183, "epoch": 2909} {"train_loss": -6.634927749633789, "global_step": 122184, "epoch": 2909} {"train_loss": -6.539793014526367, "global_step": 122185, "epoch": 2909} {"train_loss": -6.700811386108398, "global_step": 122186, "epoch": 2909} {"train_loss": -6.641164779663086, "global_step": 122187, "epoch": 2909} {"train_loss": -6.716466903686523, "global_step": 122188, "epoch": 2909} {"train_loss": -6.7179951667785645, "global_step": 122189, "epoch": 2909} {"train_loss": -6.582079887390137, "global_step": 122190, "epoch": 2909} {"train_loss": -6.592700004577637, "global_step": 122191, "epoch": 2909} {"train_loss": -6.649725914001465, "global_step": 122192, "epoch": 2909} {"train_loss": -6.6471476554870605, "global_step": 122193, "epoch": 2909} {"train_loss": -6.554672718048096, "global_step": 122194, "epoch": 2909} {"train_loss": -6.593436241149902, "global_step": 122195, "epoch": 2909} {"train_loss": -6.63796329498291, "global_step": 122196, "epoch": 2909} {"train_loss": -6.681160926818848, "global_step": 122197, "epoch": 2909} {"train_loss": -6.565305709838867, "global_step": 122198, "epoch": 2909} {"train_loss": -6.639368057250977, "global_step": 122199, "epoch": 2909} {"train_loss": -6.770961761474609, "global_step": 122200, "epoch": 2909} {"train_loss": -6.567358016967773, "global_step": 122201, "epoch": 2909} {"train_loss": -6.562114715576172, "global_step": 122202, "epoch": 2909} {"train_loss": -6.71182107925415, "global_step": 122203, "epoch": 2909} {"train_loss": -6.680863857269287, "global_step": 122204, "epoch": 2909} {"train_loss": -6.628641128540039, "global_step": 122205, "epoch": 2909} {"train_loss": -6.609170913696289, "global_step": 122206, "epoch": 2909} {"train_loss": -6.67293643951416, "global_step": 122207, "epoch": 2909} {"train_loss": -6.560196876525879, "global_step": 122208, "epoch": 2909} {"train_loss": -6.562140464782715, "global_step": 122209, "epoch": 2909} {"train_loss": -6.6839375495910645, "global_step": 122210, "epoch": 2909} {"train_loss": -6.5435709953308105, "global_step": 122211, "epoch": 2909} {"train_loss": -6.651209831237793, "global_step": 122212, "epoch": 2909} {"train_loss": -6.627297401428223, "global_step": 122213, "epoch": 2909} {"train_loss": -6.586230278015137, "global_step": 122214, "epoch": 2909} {"train_loss": -6.634812831878662, "global_step": 122215, "epoch": 2909} {"train_loss": -6.62007999420166, "global_step": 122216, "epoch": 2909} {"train_loss": -6.494446277618408, "global_step": 122217, "epoch": 2909} {"train_loss": -6.541988372802734, "global_step": 122218, "epoch": 2909} {"train_loss": -6.619346845717657, "global_step": 122219, "epoch": 2909, "val_loss": 65971.734375} {"train_loss": -6.594547271728516, "global_step": 122220, "epoch": 2910} {"train_loss": -6.5941314697265625, "global_step": 122221, "epoch": 2910} {"train_loss": -6.633636474609375, "global_step": 122222, "epoch": 2910} {"train_loss": -6.587460517883301, "global_step": 122223, "epoch": 2910} {"train_loss": -6.6797194480896, "global_step": 122224, "epoch": 2910} {"train_loss": -6.5693159103393555, "global_step": 122225, "epoch": 2910} {"train_loss": -6.6908979415893555, "global_step": 122226, "epoch": 2910} {"train_loss": -6.6838226318359375, "global_step": 122227, "epoch": 2910} {"train_loss": -6.668745040893555, "global_step": 122228, "epoch": 2910} {"train_loss": -6.668359279632568, "global_step": 122229, "epoch": 2910} {"train_loss": -6.667925834655762, "global_step": 122230, "epoch": 2910} {"train_loss": -6.6494669914245605, "global_step": 122231, "epoch": 2910} {"train_loss": -6.65976619720459, "global_step": 122232, "epoch": 2910} {"train_loss": -6.491094589233398, "global_step": 122233, "epoch": 2910} {"train_loss": -6.54615592956543, "global_step": 122234, "epoch": 2910} {"train_loss": -6.66004753112793, "global_step": 122235, "epoch": 2910} {"train_loss": -6.485536575317383, "global_step": 122236, "epoch": 2910} {"train_loss": -6.516567230224609, "global_step": 122237, "epoch": 2910} {"train_loss": -6.483222007751465, "global_step": 122238, "epoch": 2910} {"train_loss": -6.487837791442871, "global_step": 122239, "epoch": 2910} {"train_loss": -6.596451282501221, "global_step": 122240, "epoch": 2910} {"train_loss": -6.443123817443848, "global_step": 122241, "epoch": 2910} {"train_loss": -6.572396278381348, "global_step": 122242, "epoch": 2910} {"train_loss": -6.448387145996094, "global_step": 122243, "epoch": 2910} {"train_loss": -6.4490132331848145, "global_step": 122244, "epoch": 2910} {"train_loss": -6.611360549926758, "global_step": 122245, "epoch": 2910} {"train_loss": -6.31033992767334, "global_step": 122246, "epoch": 2910} {"train_loss": -6.640913009643555, "global_step": 122247, "epoch": 2910} {"train_loss": -6.464138984680176, "global_step": 122248, "epoch": 2910} {"train_loss": -6.427337169647217, "global_step": 122249, "epoch": 2910} {"train_loss": -6.475974082946777, "global_step": 122250, "epoch": 2910} {"train_loss": -6.66316032409668, "global_step": 122251, "epoch": 2910} {"train_loss": -6.582751274108887, "global_step": 122252, "epoch": 2910} {"train_loss": -6.579913139343262, "global_step": 122253, "epoch": 2910} {"train_loss": -6.575473785400391, "global_step": 122254, "epoch": 2910} {"train_loss": -6.609223365783691, "global_step": 122255, "epoch": 2910} {"train_loss": -6.574249267578125, "global_step": 122256, "epoch": 2910} {"train_loss": -6.511684417724609, "global_step": 122257, "epoch": 2910} {"train_loss": -6.568966865539551, "global_step": 122258, "epoch": 2910} {"train_loss": -6.524145126342773, "global_step": 122259, "epoch": 2910} {"train_loss": -6.580233573913574, "global_step": 122260, "epoch": 2910} {"train_loss": -6.566082125618344, "global_step": 122261, "epoch": 2910, "val_loss": 65904.0859375} {"train_loss": -6.628871917724609, "global_step": 122262, "epoch": 2911} {"train_loss": -6.641216278076172, "global_step": 122263, "epoch": 2911} {"train_loss": -6.574571132659912, "global_step": 122264, "epoch": 2911} {"train_loss": -6.542240142822266, "global_step": 122265, "epoch": 2911} {"train_loss": -6.587238311767578, "global_step": 122266, "epoch": 2911} {"train_loss": -6.611113548278809, "global_step": 122267, "epoch": 2911} {"train_loss": -6.645529747009277, "global_step": 122268, "epoch": 2911} {"train_loss": -6.54931116104126, "global_step": 122269, "epoch": 2911} {"train_loss": -6.665255546569824, "global_step": 122270, "epoch": 2911} {"train_loss": -6.6319580078125, "global_step": 122271, "epoch": 2911} {"train_loss": -6.644787788391113, "global_step": 122272, "epoch": 2911} {"train_loss": -6.604227542877197, "global_step": 122273, "epoch": 2911} {"train_loss": -6.54308557510376, "global_step": 122274, "epoch": 2911} {"train_loss": -6.580751419067383, "global_step": 122275, "epoch": 2911} {"train_loss": -6.738584518432617, "global_step": 122276, "epoch": 2911} {"train_loss": -6.672582149505615, "global_step": 122277, "epoch": 2911} {"train_loss": -6.573931694030762, "global_step": 122278, "epoch": 2911} {"train_loss": -6.596932411193848, "global_step": 122279, "epoch": 2911} {"train_loss": -6.47077751159668, "global_step": 122280, "epoch": 2911} {"train_loss": -6.679446697235107, "global_step": 122281, "epoch": 2911} {"train_loss": -6.557464599609375, "global_step": 122282, "epoch": 2911} {"train_loss": -6.581276893615723, "global_step": 122283, "epoch": 2911} {"train_loss": -6.605236530303955, "global_step": 122284, "epoch": 2911} {"train_loss": -6.6620330810546875, "global_step": 122285, "epoch": 2911} {"train_loss": -6.565682411193848, "global_step": 122286, "epoch": 2911} {"train_loss": -6.649073123931885, "global_step": 122287, "epoch": 2911} {"train_loss": -6.697809219360352, "global_step": 122288, "epoch": 2911} {"train_loss": -6.633825302124023, "global_step": 122289, "epoch": 2911} {"train_loss": -6.680838584899902, "global_step": 122290, "epoch": 2911} {"train_loss": -6.6721906661987305, "global_step": 122291, "epoch": 2911} {"train_loss": -6.628607749938965, "global_step": 122292, "epoch": 2911} {"train_loss": -6.582121849060059, "global_step": 122293, "epoch": 2911} {"train_loss": -6.548921585083008, "global_step": 122294, "epoch": 2911} {"train_loss": -6.696186542510986, "global_step": 122295, "epoch": 2911} {"train_loss": -6.718896865844727, "global_step": 122296, "epoch": 2911} {"train_loss": -6.564758777618408, "global_step": 122297, "epoch": 2911} {"train_loss": -6.605886459350586, "global_step": 122298, "epoch": 2911} {"train_loss": -6.62669038772583, "global_step": 122299, "epoch": 2911} {"train_loss": -6.592293739318848, "global_step": 122300, "epoch": 2911} {"train_loss": -6.606349468231201, "global_step": 122301, "epoch": 2911} {"train_loss": -6.738259315490723, "global_step": 122302, "epoch": 2911} {"train_loss": -6.620389086859567, "global_step": 122303, "epoch": 2911, "val_loss": 65865.65625} {"train_loss": -6.595359802246094, "global_step": 122304, "epoch": 2912} {"train_loss": -6.598480224609375, "global_step": 122305, "epoch": 2912} {"train_loss": -6.633631229400635, "global_step": 122306, "epoch": 2912} {"train_loss": -6.6573591232299805, "global_step": 122307, "epoch": 2912} {"train_loss": -6.5961151123046875, "global_step": 122308, "epoch": 2912} {"train_loss": -6.456991195678711, "global_step": 122309, "epoch": 2912} {"train_loss": -6.558546543121338, "global_step": 122310, "epoch": 2912} {"train_loss": -6.60805606842041, "global_step": 122311, "epoch": 2912} {"train_loss": -6.72346305847168, "global_step": 122312, "epoch": 2912} {"train_loss": -6.558498382568359, "global_step": 122313, "epoch": 2912} {"train_loss": -6.4929399490356445, "global_step": 122314, "epoch": 2912} {"train_loss": -6.820399284362793, "global_step": 122315, "epoch": 2912} {"train_loss": -6.614025592803955, "global_step": 122316, "epoch": 2912} {"train_loss": -6.50123405456543, "global_step": 122317, "epoch": 2912} {"train_loss": -6.712104320526123, "global_step": 122318, "epoch": 2912} {"train_loss": -6.640336036682129, "global_step": 122319, "epoch": 2912} {"train_loss": -6.550943851470947, "global_step": 122320, "epoch": 2912} {"train_loss": -6.630074501037598, "global_step": 122321, "epoch": 2912} {"train_loss": -6.550445556640625, "global_step": 122322, "epoch": 2912} {"train_loss": -6.492434501647949, "global_step": 122323, "epoch": 2912} {"train_loss": -6.580773830413818, "global_step": 122324, "epoch": 2912} {"train_loss": -6.602587699890137, "global_step": 122325, "epoch": 2912} {"train_loss": -6.532250881195068, "global_step": 122326, "epoch": 2912} {"train_loss": -6.651881694793701, "global_step": 122327, "epoch": 2912} {"train_loss": -6.475218296051025, "global_step": 122328, "epoch": 2912} {"train_loss": -6.680385589599609, "global_step": 122329, "epoch": 2912} {"train_loss": -6.5711517333984375, "global_step": 122330, "epoch": 2912} {"train_loss": -6.585268974304199, "global_step": 122331, "epoch": 2912} {"train_loss": -6.713068008422852, "global_step": 122332, "epoch": 2912} {"train_loss": -6.6234331130981445, "global_step": 122333, "epoch": 2912} {"train_loss": -6.647002220153809, "global_step": 122334, "epoch": 2912} {"train_loss": -6.582479953765869, "global_step": 122335, "epoch": 2912} {"train_loss": -6.664959907531738, "global_step": 122336, "epoch": 2912} {"train_loss": -6.690237998962402, "global_step": 122337, "epoch": 2912} {"train_loss": -6.5308637619018555, "global_step": 122338, "epoch": 2912} {"train_loss": -6.592537879943848, "global_step": 122339, "epoch": 2912} {"train_loss": -6.568641185760498, "global_step": 122340, "epoch": 2912} {"train_loss": -6.719910621643066, "global_step": 122341, "epoch": 2912} {"train_loss": -6.61065673828125, "global_step": 122342, "epoch": 2912} {"train_loss": -6.602278709411621, "global_step": 122343, "epoch": 2912} {"train_loss": -6.541435241699219, "global_step": 122344, "epoch": 2912} {"train_loss": -6.606039081301008, "global_step": 122345, "epoch": 2912, "val_loss": 65911.28125} {"train_loss": -6.609897136688232, "global_step": 122346, "epoch": 2913} {"train_loss": -6.583927631378174, "global_step": 122347, "epoch": 2913} {"train_loss": -6.670581817626953, "global_step": 122348, "epoch": 2913} {"train_loss": -6.767477035522461, "global_step": 122349, "epoch": 2913} {"train_loss": -6.677989959716797, "global_step": 122350, "epoch": 2913} {"train_loss": -6.698228359222412, "global_step": 122351, "epoch": 2913} {"train_loss": -6.624839782714844, "global_step": 122352, "epoch": 2913} {"train_loss": -6.650878429412842, "global_step": 122353, "epoch": 2913} {"train_loss": -6.681461334228516, "global_step": 122354, "epoch": 2913} {"train_loss": -6.625978469848633, "global_step": 122355, "epoch": 2913} {"train_loss": -6.64917516708374, "global_step": 122356, "epoch": 2913} {"train_loss": -6.623746395111084, "global_step": 122357, "epoch": 2913} {"train_loss": -6.682392597198486, "global_step": 122358, "epoch": 2913} {"train_loss": -6.56350040435791, "global_step": 122359, "epoch": 2913} {"train_loss": -6.6075921058654785, "global_step": 122360, "epoch": 2913} {"train_loss": -6.496210098266602, "global_step": 122361, "epoch": 2913} {"train_loss": -6.577262878417969, "global_step": 122362, "epoch": 2913} {"train_loss": -6.511282444000244, "global_step": 122363, "epoch": 2913} {"train_loss": -6.542269706726074, "global_step": 122364, "epoch": 2913} {"train_loss": -6.589035987854004, "global_step": 122365, "epoch": 2913} {"train_loss": -6.554290771484375, "global_step": 122366, "epoch": 2913} {"train_loss": -6.572732925415039, "global_step": 122367, "epoch": 2913} {"train_loss": -6.562427997589111, "global_step": 122368, "epoch": 2913} {"train_loss": -6.6672773361206055, "global_step": 122369, "epoch": 2913} {"train_loss": -6.605621337890625, "global_step": 122370, "epoch": 2913} {"train_loss": -6.592076301574707, "global_step": 122371, "epoch": 2913} {"train_loss": -6.664952278137207, "global_step": 122372, "epoch": 2913} {"train_loss": -6.530327796936035, "global_step": 122373, "epoch": 2913} {"train_loss": -6.566059112548828, "global_step": 122374, "epoch": 2913} {"train_loss": -6.558651447296143, "global_step": 122375, "epoch": 2913} {"train_loss": -6.60329532623291, "global_step": 122376, "epoch": 2913} {"train_loss": -6.628168106079102, "global_step": 122377, "epoch": 2913} {"train_loss": -6.610255718231201, "global_step": 122378, "epoch": 2913} {"train_loss": -6.501236915588379, "global_step": 122379, "epoch": 2913} {"train_loss": -6.596973419189453, "global_step": 122380, "epoch": 2913} {"train_loss": -6.606789588928223, "global_step": 122381, "epoch": 2913} {"train_loss": -6.64570951461792, "global_step": 122382, "epoch": 2913} {"train_loss": -6.613080024719238, "global_step": 122383, "epoch": 2913} {"train_loss": -6.529134750366211, "global_step": 122384, "epoch": 2913} {"train_loss": -6.550712585449219, "global_step": 122385, "epoch": 2913} {"train_loss": -6.566206932067871, "global_step": 122386, "epoch": 2913} {"train_loss": -6.599208718254452, "global_step": 122387, "epoch": 2913, "val_loss": 66027.46875} {"train_loss": -6.660388946533203, "global_step": 122388, "epoch": 2914} {"train_loss": -6.415944576263428, "global_step": 122389, "epoch": 2914} {"train_loss": -6.5621256828308105, "global_step": 122390, "epoch": 2914} {"train_loss": -6.64113712310791, "global_step": 122391, "epoch": 2914} {"train_loss": -6.465509414672852, "global_step": 122392, "epoch": 2914} {"train_loss": -6.674543380737305, "global_step": 122393, "epoch": 2914} {"train_loss": -6.370672225952148, "global_step": 122394, "epoch": 2914} {"train_loss": -6.368490219116211, "global_step": 122395, "epoch": 2914} {"train_loss": -6.512094974517822, "global_step": 122396, "epoch": 2914} {"train_loss": -6.494499206542969, "global_step": 122397, "epoch": 2914} {"train_loss": -6.485274314880371, "global_step": 122398, "epoch": 2914} {"train_loss": -6.489624977111816, "global_step": 122399, "epoch": 2914} {"train_loss": -6.6345930099487305, "global_step": 122400, "epoch": 2914} {"train_loss": -6.519626140594482, "global_step": 122401, "epoch": 2914} {"train_loss": -6.605973243713379, "global_step": 122402, "epoch": 2914} {"train_loss": -6.459383010864258, "global_step": 122403, "epoch": 2914} {"train_loss": -6.577938079833984, "global_step": 122404, "epoch": 2914} {"train_loss": -6.4753923416137695, "global_step": 122405, "epoch": 2914} {"train_loss": -6.641444206237793, "global_step": 122406, "epoch": 2914} {"train_loss": -6.374184608459473, "global_step": 122407, "epoch": 2914} {"train_loss": -6.504667282104492, "global_step": 122408, "epoch": 2914} {"train_loss": -6.42618465423584, "global_step": 122409, "epoch": 2914} {"train_loss": -6.52573299407959, "global_step": 122410, "epoch": 2914} {"train_loss": -6.573554515838623, "global_step": 122411, "epoch": 2914} {"train_loss": -6.5559282302856445, "global_step": 122412, "epoch": 2914} {"train_loss": -6.457542419433594, "global_step": 122413, "epoch": 2914} {"train_loss": -6.616667747497559, "global_step": 122414, "epoch": 2914} {"train_loss": -6.580691814422607, "global_step": 122415, "epoch": 2914} {"train_loss": -6.541353225708008, "global_step": 122416, "epoch": 2914} {"train_loss": -6.502119064331055, "global_step": 122417, "epoch": 2914} {"train_loss": -6.588059425354004, "global_step": 122418, "epoch": 2914} {"train_loss": -6.675496578216553, "global_step": 122419, "epoch": 2914} {"train_loss": -6.529953479766846, "global_step": 122420, "epoch": 2914} {"train_loss": -6.571782112121582, "global_step": 122421, "epoch": 2914} {"train_loss": -6.6194305419921875, "global_step": 122422, "epoch": 2914} {"train_loss": -6.64949893951416, "global_step": 122423, "epoch": 2914} {"train_loss": -6.516010761260986, "global_step": 122424, "epoch": 2914} {"train_loss": -6.615633487701416, "global_step": 122425, "epoch": 2914} {"train_loss": -6.513706207275391, "global_step": 122426, "epoch": 2914} {"train_loss": -6.585492134094238, "global_step": 122427, "epoch": 2914} {"train_loss": -6.6330132484436035, "global_step": 122428, "epoch": 2914} {"train_loss": -6.541670470010667, "global_step": 122429, "epoch": 2914, "val_loss": 65897.6015625} {"train_loss": -6.565730094909668, "global_step": 122430, "epoch": 2915} {"train_loss": -6.6296186447143555, "global_step": 122431, "epoch": 2915} {"train_loss": -6.717832565307617, "global_step": 122432, "epoch": 2915} {"train_loss": -6.626097679138184, "global_step": 122433, "epoch": 2915} {"train_loss": -6.618443489074707, "global_step": 122434, "epoch": 2915} {"train_loss": -6.713174343109131, "global_step": 122435, "epoch": 2915} {"train_loss": -6.692915916442871, "global_step": 122436, "epoch": 2915} {"train_loss": -6.58499813079834, "global_step": 122437, "epoch": 2915} {"train_loss": -6.617170333862305, "global_step": 122438, "epoch": 2915} {"train_loss": -6.719445705413818, "global_step": 122439, "epoch": 2915} {"train_loss": -6.637958526611328, "global_step": 122440, "epoch": 2915} {"train_loss": -6.681036949157715, "global_step": 122441, "epoch": 2915} {"train_loss": -6.574061393737793, "global_step": 122442, "epoch": 2915} {"train_loss": -6.686976909637451, "global_step": 122443, "epoch": 2915} {"train_loss": -6.553784370422363, "global_step": 122444, "epoch": 2915} {"train_loss": -6.594030380249023, "global_step": 122445, "epoch": 2915} {"train_loss": -6.535519599914551, "global_step": 122446, "epoch": 2915} {"train_loss": -6.5600762367248535, "global_step": 122447, "epoch": 2915} {"train_loss": -6.569676399230957, "global_step": 122448, "epoch": 2915} {"train_loss": -6.631301403045654, "global_step": 122449, "epoch": 2915} {"train_loss": -6.641034126281738, "global_step": 122450, "epoch": 2915} {"train_loss": -6.641646385192871, "global_step": 122451, "epoch": 2915} {"train_loss": -6.607662200927734, "global_step": 122452, "epoch": 2915} {"train_loss": -6.705837249755859, "global_step": 122453, "epoch": 2915} {"train_loss": -6.603729724884033, "global_step": 122454, "epoch": 2915} {"train_loss": -6.41548490524292, "global_step": 122455, "epoch": 2915} {"train_loss": -6.7514872550964355, "global_step": 122456, "epoch": 2915} {"train_loss": -6.62145471572876, "global_step": 122457, "epoch": 2915} {"train_loss": -6.801653861999512, "global_step": 122458, "epoch": 2915} {"train_loss": -6.727237701416016, "global_step": 122459, "epoch": 2915} {"train_loss": -6.657046794891357, "global_step": 122460, "epoch": 2915} {"train_loss": -6.575918197631836, "global_step": 122461, "epoch": 2915} {"train_loss": -6.677641868591309, "global_step": 122462, "epoch": 2915} {"train_loss": -6.577243804931641, "global_step": 122463, "epoch": 2915} {"train_loss": -6.586622714996338, "global_step": 122464, "epoch": 2915} {"train_loss": -6.639945030212402, "global_step": 122465, "epoch": 2915} {"train_loss": -6.60680627822876, "global_step": 122466, "epoch": 2915} {"train_loss": -6.646607398986816, "global_step": 122467, "epoch": 2915} {"train_loss": -6.623066425323486, "global_step": 122468, "epoch": 2915} {"train_loss": -6.757303237915039, "global_step": 122469, "epoch": 2915} {"train_loss": -6.5848188400268555, "global_step": 122470, "epoch": 2915} {"train_loss": -6.631102403004964, "global_step": 122471, "epoch": 2915, "val_loss": 65957.765625} {"train_loss": -6.661503791809082, "global_step": 122472, "epoch": 2916} {"train_loss": -6.568967342376709, "global_step": 122473, "epoch": 2916} {"train_loss": -6.587063789367676, "global_step": 122474, "epoch": 2916} {"train_loss": -6.601723670959473, "global_step": 122475, "epoch": 2916} {"train_loss": -6.547469139099121, "global_step": 122476, "epoch": 2916} {"train_loss": -6.577111721038818, "global_step": 122477, "epoch": 2916} {"train_loss": -6.586453914642334, "global_step": 122478, "epoch": 2916} {"train_loss": -6.488339900970459, "global_step": 122479, "epoch": 2916} {"train_loss": -6.567648410797119, "global_step": 122480, "epoch": 2916} {"train_loss": -6.437133312225342, "global_step": 122481, "epoch": 2916} {"train_loss": -6.637660026550293, "global_step": 122482, "epoch": 2916} {"train_loss": -6.648904800415039, "global_step": 122483, "epoch": 2916} {"train_loss": -6.568996429443359, "global_step": 122484, "epoch": 2916} {"train_loss": -6.586421012878418, "global_step": 122485, "epoch": 2916} {"train_loss": -6.587838649749756, "global_step": 122486, "epoch": 2916} {"train_loss": -6.614396095275879, "global_step": 122487, "epoch": 2916} {"train_loss": -6.430349826812744, "global_step": 122488, "epoch": 2916} {"train_loss": -6.465065956115723, "global_step": 122489, "epoch": 2916} {"train_loss": -6.645586013793945, "global_step": 122490, "epoch": 2916} {"train_loss": -6.551138877868652, "global_step": 122491, "epoch": 2916} {"train_loss": -6.512269020080566, "global_step": 122492, "epoch": 2916} {"train_loss": -6.57754373550415, "global_step": 122493, "epoch": 2916} {"train_loss": -6.652809143066406, "global_step": 122494, "epoch": 2916} {"train_loss": -6.645329475402832, "global_step": 122495, "epoch": 2916} {"train_loss": -6.615095138549805, "global_step": 122496, "epoch": 2916} {"train_loss": -6.655405044555664, "global_step": 122497, "epoch": 2916} {"train_loss": -6.667774200439453, "global_step": 122498, "epoch": 2916} {"train_loss": -6.66074275970459, "global_step": 122499, "epoch": 2916} {"train_loss": -6.6526994705200195, "global_step": 122500, "epoch": 2916} {"train_loss": -6.61224365234375, "global_step": 122501, "epoch": 2916} {"train_loss": -6.623997688293457, "global_step": 122502, "epoch": 2916} {"train_loss": -6.624901294708252, "global_step": 122503, "epoch": 2916} {"train_loss": -6.544089317321777, "global_step": 122504, "epoch": 2916} {"train_loss": -6.711164474487305, "global_step": 122505, "epoch": 2916} {"train_loss": -6.423279762268066, "global_step": 122506, "epoch": 2916} {"train_loss": -6.534305572509766, "global_step": 122507, "epoch": 2916} {"train_loss": -6.641977310180664, "global_step": 122508, "epoch": 2916} {"train_loss": -6.463600158691406, "global_step": 122509, "epoch": 2916} {"train_loss": -6.6282830238342285, "global_step": 122510, "epoch": 2916} {"train_loss": -6.416183948516846, "global_step": 122511, "epoch": 2916} {"train_loss": -6.547279357910156, "global_step": 122512, "epoch": 2916} {"train_loss": -6.581051747004191, "global_step": 122513, "epoch": 2916, "val_loss": 65967.453125} {"train_loss": -6.336523056030273, "global_step": 122514, "epoch": 2917} {"train_loss": -6.462763786315918, "global_step": 122515, "epoch": 2917} {"train_loss": -6.505588531494141, "global_step": 122516, "epoch": 2917} {"train_loss": -6.468166351318359, "global_step": 122517, "epoch": 2917} {"train_loss": -6.574960708618164, "global_step": 122518, "epoch": 2917} {"train_loss": -6.513283729553223, "global_step": 122519, "epoch": 2917} {"train_loss": -6.626539707183838, "global_step": 122520, "epoch": 2917} {"train_loss": -6.498419761657715, "global_step": 122521, "epoch": 2917} {"train_loss": -6.5618133544921875, "global_step": 122522, "epoch": 2917} {"train_loss": -6.589744567871094, "global_step": 122523, "epoch": 2917} {"train_loss": -6.626401901245117, "global_step": 122524, "epoch": 2917} {"train_loss": -6.578383922576904, "global_step": 122525, "epoch": 2917} {"train_loss": -6.4723310470581055, "global_step": 122526, "epoch": 2917} {"train_loss": -6.598771095275879, "global_step": 122527, "epoch": 2917} {"train_loss": -6.568941116333008, "global_step": 122528, "epoch": 2917} {"train_loss": -6.543224334716797, "global_step": 122529, "epoch": 2917} {"train_loss": -6.605916976928711, "global_step": 122530, "epoch": 2917} {"train_loss": -6.6479082107543945, "global_step": 122531, "epoch": 2917} {"train_loss": -6.569568634033203, "global_step": 122532, "epoch": 2917} {"train_loss": -6.625601768493652, "global_step": 122533, "epoch": 2917} {"train_loss": -6.597324848175049, "global_step": 122534, "epoch": 2917} {"train_loss": -6.469546318054199, "global_step": 122535, "epoch": 2917} {"train_loss": -6.494570732116699, "global_step": 122536, "epoch": 2917} {"train_loss": -6.553675174713135, "global_step": 122537, "epoch": 2917} {"train_loss": -6.682633399963379, "global_step": 122538, "epoch": 2917} {"train_loss": -6.561976432800293, "global_step": 122539, "epoch": 2917} {"train_loss": -6.6130571365356445, "global_step": 122540, "epoch": 2917} {"train_loss": -6.532639980316162, "global_step": 122541, "epoch": 2917} {"train_loss": -6.578564643859863, "global_step": 122542, "epoch": 2917} {"train_loss": -6.630559921264648, "global_step": 122543, "epoch": 2917} {"train_loss": -6.717131614685059, "global_step": 122544, "epoch": 2917} {"train_loss": -6.6047515869140625, "global_step": 122545, "epoch": 2917} {"train_loss": -6.706903457641602, "global_step": 122546, "epoch": 2917} {"train_loss": -6.678395748138428, "global_step": 122547, "epoch": 2917} {"train_loss": -6.5641021728515625, "global_step": 122548, "epoch": 2917} {"train_loss": -6.598140716552734, "global_step": 122549, "epoch": 2917} {"train_loss": -6.68145227432251, "global_step": 122550, "epoch": 2917} {"train_loss": -6.60832405090332, "global_step": 122551, "epoch": 2917} {"train_loss": -6.547859191894531, "global_step": 122552, "epoch": 2917} {"train_loss": -6.550433158874512, "global_step": 122553, "epoch": 2917} {"train_loss": -6.660397529602051, "global_step": 122554, "epoch": 2917} {"train_loss": -6.576719193231492, "global_step": 122555, "epoch": 2917, "val_loss": 65963.7109375} {"train_loss": -6.66918420791626, "global_step": 122556, "epoch": 2918} {"train_loss": -6.530551910400391, "global_step": 122557, "epoch": 2918} {"train_loss": -6.697075843811035, "global_step": 122558, "epoch": 2918} {"train_loss": -6.566452980041504, "global_step": 122559, "epoch": 2918} {"train_loss": -6.535127639770508, "global_step": 122560, "epoch": 2918} {"train_loss": -6.564471244812012, "global_step": 122561, "epoch": 2918} {"train_loss": -6.635607719421387, "global_step": 122562, "epoch": 2918} {"train_loss": -6.6030168533325195, "global_step": 122563, "epoch": 2918} {"train_loss": -6.584084510803223, "global_step": 122564, "epoch": 2918} {"train_loss": -6.520723342895508, "global_step": 122565, "epoch": 2918} {"train_loss": -6.526986122131348, "global_step": 122566, "epoch": 2918} {"train_loss": -6.6226043701171875, "global_step": 122567, "epoch": 2918} {"train_loss": -6.515737533569336, "global_step": 122568, "epoch": 2918} {"train_loss": -6.621873378753662, "global_step": 122569, "epoch": 2918} {"train_loss": -6.632507801055908, "global_step": 122570, "epoch": 2918} {"train_loss": -6.715207099914551, "global_step": 122571, "epoch": 2918} {"train_loss": -6.653806686401367, "global_step": 122572, "epoch": 2918} {"train_loss": -6.61037540435791, "global_step": 122573, "epoch": 2918} {"train_loss": -6.6666717529296875, "global_step": 122574, "epoch": 2918} {"train_loss": -6.578164100646973, "global_step": 122575, "epoch": 2918} {"train_loss": -6.51447057723999, "global_step": 122576, "epoch": 2918} {"train_loss": -6.569545745849609, "global_step": 122577, "epoch": 2918} {"train_loss": -6.617242813110352, "global_step": 122578, "epoch": 2918} {"train_loss": -6.571079730987549, "global_step": 122579, "epoch": 2918} {"train_loss": -6.6853108406066895, "global_step": 122580, "epoch": 2918} {"train_loss": -6.578007698059082, "global_step": 122581, "epoch": 2918} {"train_loss": -6.509960174560547, "global_step": 122582, "epoch": 2918} {"train_loss": -6.558889389038086, "global_step": 122583, "epoch": 2918} {"train_loss": -6.5199713706970215, "global_step": 122584, "epoch": 2918} {"train_loss": -6.618165969848633, "global_step": 122585, "epoch": 2918} {"train_loss": -6.524131774902344, "global_step": 122586, "epoch": 2918} {"train_loss": -6.385639667510986, "global_step": 122587, "epoch": 2918} {"train_loss": -6.61699104309082, "global_step": 122588, "epoch": 2918} {"train_loss": -6.470396041870117, "global_step": 122589, "epoch": 2918} {"train_loss": -6.568464279174805, "global_step": 122590, "epoch": 2918} {"train_loss": -6.491391658782959, "global_step": 122591, "epoch": 2918} {"train_loss": -6.532867431640625, "global_step": 122592, "epoch": 2918} {"train_loss": -6.590579032897949, "global_step": 122593, "epoch": 2918} {"train_loss": -6.530155658721924, "global_step": 122594, "epoch": 2918} {"train_loss": -6.629585266113281, "global_step": 122595, "epoch": 2918} {"train_loss": -6.531850814819336, "global_step": 122596, "epoch": 2918} {"train_loss": -6.577161868413289, "global_step": 122597, "epoch": 2918, "val_loss": 66057.3046875} {"train_loss": -6.626527309417725, "global_step": 122598, "epoch": 2919} {"train_loss": -6.634661674499512, "global_step": 122599, "epoch": 2919} {"train_loss": -6.599623680114746, "global_step": 122600, "epoch": 2919} {"train_loss": -6.702603816986084, "global_step": 122601, "epoch": 2919} {"train_loss": -6.532649993896484, "global_step": 122602, "epoch": 2919} {"train_loss": -6.503574371337891, "global_step": 122603, "epoch": 2919} {"train_loss": -6.594572067260742, "global_step": 122604, "epoch": 2919} {"train_loss": -6.561648368835449, "global_step": 122605, "epoch": 2919} {"train_loss": -6.685766220092773, "global_step": 122606, "epoch": 2919} {"train_loss": -6.543463230133057, "global_step": 122607, "epoch": 2919} {"train_loss": -6.614137649536133, "global_step": 122608, "epoch": 2919} {"train_loss": -6.67026424407959, "global_step": 122609, "epoch": 2919} {"train_loss": -6.651147842407227, "global_step": 122610, "epoch": 2919} {"train_loss": -6.620390892028809, "global_step": 122611, "epoch": 2919} {"train_loss": -6.625082015991211, "global_step": 122612, "epoch": 2919} {"train_loss": -6.579646110534668, "global_step": 122613, "epoch": 2919} {"train_loss": -6.585941314697266, "global_step": 122614, "epoch": 2919} {"train_loss": -6.657016754150391, "global_step": 122615, "epoch": 2919} {"train_loss": -6.6394124031066895, "global_step": 122616, "epoch": 2919} {"train_loss": -6.6421427726745605, "global_step": 122617, "epoch": 2919} {"train_loss": -6.673403739929199, "global_step": 122618, "epoch": 2919} {"train_loss": -6.641835689544678, "global_step": 122619, "epoch": 2919} {"train_loss": -6.705406188964844, "global_step": 122620, "epoch": 2919} {"train_loss": -6.62639856338501, "global_step": 122621, "epoch": 2919} {"train_loss": -6.705380439758301, "global_step": 122622, "epoch": 2919} {"train_loss": -6.579724311828613, "global_step": 122623, "epoch": 2919} {"train_loss": -6.596674919128418, "global_step": 122624, "epoch": 2919} {"train_loss": -6.554295539855957, "global_step": 122625, "epoch": 2919} {"train_loss": -6.6853413581848145, "global_step": 122626, "epoch": 2919} {"train_loss": -6.633900165557861, "global_step": 122627, "epoch": 2919} {"train_loss": -6.679868698120117, "global_step": 122628, "epoch": 2919} {"train_loss": -6.645280838012695, "global_step": 122629, "epoch": 2919} {"train_loss": -6.662894248962402, "global_step": 122630, "epoch": 2919} {"train_loss": -6.73530387878418, "global_step": 122631, "epoch": 2919} {"train_loss": -6.623416423797607, "global_step": 122632, "epoch": 2919} {"train_loss": -6.680075645446777, "global_step": 122633, "epoch": 2919} {"train_loss": -6.647810935974121, "global_step": 122634, "epoch": 2919} {"train_loss": -6.654173851013184, "global_step": 122635, "epoch": 2919} {"train_loss": -6.568191051483154, "global_step": 122636, "epoch": 2919} {"train_loss": -6.589456081390381, "global_step": 122637, "epoch": 2919} {"train_loss": -6.467377185821533, "global_step": 122638, "epoch": 2919} {"train_loss": -6.620779639198666, "global_step": 122639, "epoch": 2919, "val_loss": 66012.8203125} {"train_loss": -6.517009735107422, "global_step": 122640, "epoch": 2920} {"train_loss": -6.433966636657715, "global_step": 122641, "epoch": 2920} {"train_loss": -6.680789947509766, "global_step": 122642, "epoch": 2920} {"train_loss": -6.4801740646362305, "global_step": 122643, "epoch": 2920} {"train_loss": -6.5822858810424805, "global_step": 122644, "epoch": 2920} {"train_loss": -6.584729194641113, "global_step": 122645, "epoch": 2920} {"train_loss": -6.477372169494629, "global_step": 122646, "epoch": 2920} {"train_loss": -6.635026931762695, "global_step": 122647, "epoch": 2920} {"train_loss": -6.573885917663574, "global_step": 122648, "epoch": 2920} {"train_loss": -6.540128707885742, "global_step": 122649, "epoch": 2920} {"train_loss": -6.556291580200195, "global_step": 122650, "epoch": 2920} {"train_loss": -6.579907417297363, "global_step": 122651, "epoch": 2920} {"train_loss": -6.506651878356934, "global_step": 122652, "epoch": 2920} {"train_loss": -6.617323875427246, "global_step": 122653, "epoch": 2920} {"train_loss": -6.451556205749512, "global_step": 122654, "epoch": 2920} {"train_loss": -6.601016044616699, "global_step": 122655, "epoch": 2920} {"train_loss": -6.632539749145508, "global_step": 122656, "epoch": 2920} {"train_loss": -6.717652320861816, "global_step": 122657, "epoch": 2920} {"train_loss": -6.611753463745117, "global_step": 122658, "epoch": 2920} {"train_loss": -6.532828330993652, "global_step": 122659, "epoch": 2920} {"train_loss": -6.650128364562988, "global_step": 122660, "epoch": 2920} {"train_loss": -6.5773468017578125, "global_step": 122661, "epoch": 2920} {"train_loss": -6.613373279571533, "global_step": 122662, "epoch": 2920} {"train_loss": -6.726072311401367, "global_step": 122663, "epoch": 2920} {"train_loss": -6.617108345031738, "global_step": 122664, "epoch": 2920} {"train_loss": -6.586389541625977, "global_step": 122665, "epoch": 2920} {"train_loss": -6.628029823303223, "global_step": 122666, "epoch": 2920} {"train_loss": -6.679686546325684, "global_step": 122667, "epoch": 2920} {"train_loss": -6.612174987792969, "global_step": 122668, "epoch": 2920} {"train_loss": -6.600404262542725, "global_step": 122669, "epoch": 2920} {"train_loss": -6.630857467651367, "global_step": 122670, "epoch": 2920} {"train_loss": -6.64482307434082, "global_step": 122671, "epoch": 2920} {"train_loss": -6.580903053283691, "global_step": 122672, "epoch": 2920} {"train_loss": -6.687670707702637, "global_step": 122673, "epoch": 2920} {"train_loss": -6.483367919921875, "global_step": 122674, "epoch": 2920} {"train_loss": -6.7647929191589355, "global_step": 122675, "epoch": 2920} {"train_loss": -6.560111999511719, "global_step": 122676, "epoch": 2920} {"train_loss": -6.565586566925049, "global_step": 122677, "epoch": 2920} {"train_loss": -6.574899673461914, "global_step": 122678, "epoch": 2920} {"train_loss": -6.610844612121582, "global_step": 122679, "epoch": 2920} {"train_loss": -6.614803791046143, "global_step": 122680, "epoch": 2920} {"train_loss": -6.596642278489613, "global_step": 122681, "epoch": 2920, "val_loss": 65876.390625} {"train_loss": -6.514254570007324, "global_step": 122682, "epoch": 2921} {"train_loss": -6.6858720779418945, "global_step": 122683, "epoch": 2921} {"train_loss": -6.657339096069336, "global_step": 122684, "epoch": 2921} {"train_loss": -6.663372039794922, "global_step": 122685, "epoch": 2921} {"train_loss": -6.64848518371582, "global_step": 122686, "epoch": 2921} {"train_loss": -6.641958236694336, "global_step": 122687, "epoch": 2921} {"train_loss": -6.66262149810791, "global_step": 122688, "epoch": 2921} {"train_loss": -6.685477256774902, "global_step": 122689, "epoch": 2921} {"train_loss": -6.594142436981201, "global_step": 122690, "epoch": 2921} {"train_loss": -6.626420021057129, "global_step": 122691, "epoch": 2921} {"train_loss": -6.434713840484619, "global_step": 122692, "epoch": 2921} {"train_loss": -6.6586103439331055, "global_step": 122693, "epoch": 2921} {"train_loss": -6.5320963859558105, "global_step": 122694, "epoch": 2921} {"train_loss": -6.587930202484131, "global_step": 122695, "epoch": 2921} {"train_loss": -6.583306312561035, "global_step": 122696, "epoch": 2921} {"train_loss": -6.42219352722168, "global_step": 122697, "epoch": 2921} {"train_loss": -6.561385154724121, "global_step": 122698, "epoch": 2921} {"train_loss": -6.575649261474609, "global_step": 122699, "epoch": 2921} {"train_loss": -6.634780406951904, "global_step": 122700, "epoch": 2921} {"train_loss": -6.579461097717285, "global_step": 122701, "epoch": 2921} {"train_loss": -6.615115642547607, "global_step": 122702, "epoch": 2921} {"train_loss": -6.610469818115234, "global_step": 122703, "epoch": 2921} {"train_loss": -6.5291748046875, "global_step": 122704, "epoch": 2921} {"train_loss": -6.508754253387451, "global_step": 122705, "epoch": 2921} {"train_loss": -6.771770477294922, "global_step": 122706, "epoch": 2921} {"train_loss": -6.557190418243408, "global_step": 122707, "epoch": 2921} {"train_loss": -6.589112281799316, "global_step": 122708, "epoch": 2921} {"train_loss": -6.536283493041992, "global_step": 122709, "epoch": 2921} {"train_loss": -6.413645267486572, "global_step": 122710, "epoch": 2921} {"train_loss": -6.608261585235596, "global_step": 122711, "epoch": 2921} {"train_loss": -6.633655071258545, "global_step": 122712, "epoch": 2921} {"train_loss": -6.546978950500488, "global_step": 122713, "epoch": 2921} {"train_loss": -6.606038570404053, "global_step": 122714, "epoch": 2921} {"train_loss": -6.6163153648376465, "global_step": 122715, "epoch": 2921} {"train_loss": -6.658129692077637, "global_step": 122716, "epoch": 2921} {"train_loss": -6.672801971435547, "global_step": 122717, "epoch": 2921} {"train_loss": -6.582139015197754, "global_step": 122718, "epoch": 2921} {"train_loss": -6.602967262268066, "global_step": 122719, "epoch": 2921} {"train_loss": -6.6878662109375, "global_step": 122720, "epoch": 2921} {"train_loss": -6.567462921142578, "global_step": 122721, "epoch": 2921} {"train_loss": -6.749124050140381, "global_step": 122722, "epoch": 2921} {"train_loss": -6.5992929708390005, "global_step": 122723, "epoch": 2921, "val_loss": 65769.171875} {"train_loss": -6.635788917541504, "global_step": 122724, "epoch": 2922} {"train_loss": -6.615693092346191, "global_step": 122725, "epoch": 2922} {"train_loss": -6.701310157775879, "global_step": 122726, "epoch": 2922} {"train_loss": -6.616036891937256, "global_step": 122727, "epoch": 2922} {"train_loss": -6.698559284210205, "global_step": 122728, "epoch": 2922} {"train_loss": -6.5574750900268555, "global_step": 122729, "epoch": 2922} {"train_loss": -6.603472709655762, "global_step": 122730, "epoch": 2922} {"train_loss": -6.587349891662598, "global_step": 122731, "epoch": 2922} {"train_loss": -6.662032127380371, "global_step": 122732, "epoch": 2922} {"train_loss": -6.669268608093262, "global_step": 122733, "epoch": 2922} {"train_loss": -6.670677185058594, "global_step": 122734, "epoch": 2922} {"train_loss": -6.699212074279785, "global_step": 122735, "epoch": 2922} {"train_loss": -6.673335075378418, "global_step": 122736, "epoch": 2922} {"train_loss": -6.676413536071777, "global_step": 122737, "epoch": 2922} {"train_loss": -6.69785737991333, "global_step": 122738, "epoch": 2922} {"train_loss": -6.64424991607666, "global_step": 122739, "epoch": 2922} {"train_loss": -6.60267448425293, "global_step": 122740, "epoch": 2922} {"train_loss": -6.7148613929748535, "global_step": 122741, "epoch": 2922} {"train_loss": -6.646426200866699, "global_step": 122742, "epoch": 2922} {"train_loss": -6.576785087585449, "global_step": 122743, "epoch": 2922} {"train_loss": -6.571379661560059, "global_step": 122744, "epoch": 2922} {"train_loss": -6.559826850891113, "global_step": 122745, "epoch": 2922} {"train_loss": -6.688823699951172, "global_step": 122746, "epoch": 2922} {"train_loss": -6.678730010986328, "global_step": 122747, "epoch": 2922} {"train_loss": -6.609994888305664, "global_step": 122748, "epoch": 2922} {"train_loss": -6.623318672180176, "global_step": 122749, "epoch": 2922} {"train_loss": -6.658608436584473, "global_step": 122750, "epoch": 2922} {"train_loss": -6.62932014465332, "global_step": 122751, "epoch": 2922} {"train_loss": -6.622621059417725, "global_step": 122752, "epoch": 2922} {"train_loss": -6.657483100891113, "global_step": 122753, "epoch": 2922} {"train_loss": -6.673456192016602, "global_step": 122754, "epoch": 2922} {"train_loss": -6.736808776855469, "global_step": 122755, "epoch": 2922} {"train_loss": -6.5825910568237305, "global_step": 122756, "epoch": 2922} {"train_loss": -6.673253059387207, "global_step": 122757, "epoch": 2922} {"train_loss": -6.615996360778809, "global_step": 122758, "epoch": 2922} {"train_loss": -6.629918098449707, "global_step": 122759, "epoch": 2922} {"train_loss": -6.736611366271973, "global_step": 122760, "epoch": 2922} {"train_loss": -6.577019214630127, "global_step": 122761, "epoch": 2922} {"train_loss": -6.59901762008667, "global_step": 122762, "epoch": 2922} {"train_loss": -6.482785224914551, "global_step": 122763, "epoch": 2922} {"train_loss": -6.532548904418945, "global_step": 122764, "epoch": 2922} {"train_loss": -6.6338730198996405, "global_step": 122765, "epoch": 2922, "val_loss": 65829.828125} {"train_loss": -6.617337226867676, "global_step": 122766, "epoch": 2923} {"train_loss": -6.511305809020996, "global_step": 122767, "epoch": 2923} {"train_loss": -6.577609062194824, "global_step": 122768, "epoch": 2923} {"train_loss": -6.577042579650879, "global_step": 122769, "epoch": 2923} {"train_loss": -6.5624003410339355, "global_step": 122770, "epoch": 2923} {"train_loss": -6.602277755737305, "global_step": 122771, "epoch": 2923} {"train_loss": -6.603022575378418, "global_step": 122772, "epoch": 2923} {"train_loss": -6.602753639221191, "global_step": 122773, "epoch": 2923} {"train_loss": -6.634913444519043, "global_step": 122774, "epoch": 2923} {"train_loss": -6.558598518371582, "global_step": 122775, "epoch": 2923} {"train_loss": -6.630722522735596, "global_step": 122776, "epoch": 2923} {"train_loss": -6.521307468414307, "global_step": 122777, "epoch": 2923} {"train_loss": -6.570059776306152, "global_step": 122778, "epoch": 2923} {"train_loss": -6.710395812988281, "global_step": 122779, "epoch": 2923} {"train_loss": -6.554147720336914, "global_step": 122780, "epoch": 2923} {"train_loss": -6.63881254196167, "global_step": 122781, "epoch": 2923} {"train_loss": -6.589506149291992, "global_step": 122782, "epoch": 2923} {"train_loss": -6.631765365600586, "global_step": 122783, "epoch": 2923} {"train_loss": -6.572271823883057, "global_step": 122784, "epoch": 2923} {"train_loss": -6.629374027252197, "global_step": 122785, "epoch": 2923} {"train_loss": -6.593668460845947, "global_step": 122786, "epoch": 2923} {"train_loss": -6.632669448852539, "global_step": 122787, "epoch": 2923} {"train_loss": -6.613807678222656, "global_step": 122788, "epoch": 2923} {"train_loss": -6.591448783874512, "global_step": 122789, "epoch": 2923} {"train_loss": -6.713510036468506, "global_step": 122790, "epoch": 2923} {"train_loss": -6.582327842712402, "global_step": 122791, "epoch": 2923} {"train_loss": -6.644814491271973, "global_step": 122792, "epoch": 2923} {"train_loss": -6.604917526245117, "global_step": 122793, "epoch": 2923} {"train_loss": -6.478675842285156, "global_step": 122794, "epoch": 2923} {"train_loss": -6.599923133850098, "global_step": 122795, "epoch": 2923} {"train_loss": -6.636167526245117, "global_step": 122796, "epoch": 2923} {"train_loss": -6.419282913208008, "global_step": 122797, "epoch": 2923} {"train_loss": -6.56418514251709, "global_step": 122798, "epoch": 2923} {"train_loss": -6.5744171142578125, "global_step": 122799, "epoch": 2923} {"train_loss": -6.518523216247559, "global_step": 122800, "epoch": 2923} {"train_loss": -6.542882919311523, "global_step": 122801, "epoch": 2923} {"train_loss": -6.614809036254883, "global_step": 122802, "epoch": 2923} {"train_loss": -6.712582111358643, "global_step": 122803, "epoch": 2923} {"train_loss": -6.594078063964844, "global_step": 122804, "epoch": 2923} {"train_loss": -6.673280715942383, "global_step": 122805, "epoch": 2923} {"train_loss": -6.614535331726074, "global_step": 122806, "epoch": 2923} {"train_loss": -6.595836037681217, "global_step": 122807, "epoch": 2923, "val_loss": 66006.1171875} {"train_loss": -6.565985679626465, "global_step": 122808, "epoch": 2924} {"train_loss": -6.568702697753906, "global_step": 122809, "epoch": 2924} {"train_loss": -6.5215349197387695, "global_step": 122810, "epoch": 2924} {"train_loss": -6.571671962738037, "global_step": 122811, "epoch": 2924} {"train_loss": -6.517411231994629, "global_step": 122812, "epoch": 2924} {"train_loss": -6.5486369132995605, "global_step": 122813, "epoch": 2924} {"train_loss": -6.619668483734131, "global_step": 122814, "epoch": 2924} {"train_loss": -6.686285018920898, "global_step": 122815, "epoch": 2924} {"train_loss": -6.608016490936279, "global_step": 122816, "epoch": 2924} {"train_loss": -6.701021671295166, "global_step": 122817, "epoch": 2924} {"train_loss": -6.513504981994629, "global_step": 122818, "epoch": 2924} {"train_loss": -6.575968265533447, "global_step": 122819, "epoch": 2924} {"train_loss": -6.569511413574219, "global_step": 122820, "epoch": 2924} {"train_loss": -6.557245254516602, "global_step": 122821, "epoch": 2924} {"train_loss": -6.619997024536133, "global_step": 122822, "epoch": 2924} {"train_loss": -6.577948570251465, "global_step": 122823, "epoch": 2924} {"train_loss": -6.667778491973877, "global_step": 122824, "epoch": 2924} {"train_loss": -6.568145275115967, "global_step": 122825, "epoch": 2924} {"train_loss": -6.752852916717529, "global_step": 122826, "epoch": 2924} {"train_loss": -6.6382904052734375, "global_step": 122827, "epoch": 2924} {"train_loss": -6.732356548309326, "global_step": 122828, "epoch": 2924} {"train_loss": -6.683391571044922, "global_step": 122829, "epoch": 2924} {"train_loss": -6.641922950744629, "global_step": 122830, "epoch": 2924} {"train_loss": -6.581997871398926, "global_step": 122831, "epoch": 2924} {"train_loss": -6.5621232986450195, "global_step": 122832, "epoch": 2924} {"train_loss": -6.531807899475098, "global_step": 122833, "epoch": 2924} {"train_loss": -6.572019577026367, "global_step": 122834, "epoch": 2924} {"train_loss": -6.587774276733398, "global_step": 122835, "epoch": 2924} {"train_loss": -6.6649169921875, "global_step": 122836, "epoch": 2924} {"train_loss": -6.545072078704834, "global_step": 122837, "epoch": 2924} {"train_loss": -6.6818342208862305, "global_step": 122838, "epoch": 2924} {"train_loss": -6.463696002960205, "global_step": 122839, "epoch": 2924} {"train_loss": -6.496458053588867, "global_step": 122840, "epoch": 2924} {"train_loss": -6.667603492736816, "global_step": 122841, "epoch": 2924} {"train_loss": -6.550549507141113, "global_step": 122842, "epoch": 2924} {"train_loss": -6.566758632659912, "global_step": 122843, "epoch": 2924} {"train_loss": -6.550595760345459, "global_step": 122844, "epoch": 2924} {"train_loss": -6.5056047439575195, "global_step": 122845, "epoch": 2924} {"train_loss": -6.47490119934082, "global_step": 122846, "epoch": 2924} {"train_loss": -6.643148899078369, "global_step": 122847, "epoch": 2924} {"train_loss": -6.490438461303711, "global_step": 122848, "epoch": 2924} {"train_loss": -6.584796394620623, "global_step": 122849, "epoch": 2924, "val_loss": 65785.765625} {"train_loss": -6.580122947692871, "global_step": 122850, "epoch": 2925} {"train_loss": -6.531646251678467, "global_step": 122851, "epoch": 2925} {"train_loss": -6.589709281921387, "global_step": 122852, "epoch": 2925} {"train_loss": -6.58413028717041, "global_step": 122853, "epoch": 2925} {"train_loss": -6.506887435913086, "global_step": 122854, "epoch": 2925} {"train_loss": -6.520264625549316, "global_step": 122855, "epoch": 2925} {"train_loss": -6.543224811553955, "global_step": 122856, "epoch": 2925} {"train_loss": -6.623470306396484, "global_step": 122857, "epoch": 2925} {"train_loss": -6.449394226074219, "global_step": 122858, "epoch": 2925} {"train_loss": -6.651154518127441, "global_step": 122859, "epoch": 2925} {"train_loss": -6.467362880706787, "global_step": 122860, "epoch": 2925} {"train_loss": -6.558000564575195, "global_step": 122861, "epoch": 2925} {"train_loss": -6.618994235992432, "global_step": 122862, "epoch": 2925} {"train_loss": -6.632011413574219, "global_step": 122863, "epoch": 2925} {"train_loss": -6.622430801391602, "global_step": 122864, "epoch": 2925} {"train_loss": -6.591875076293945, "global_step": 122865, "epoch": 2925} {"train_loss": -6.671051979064941, "global_step": 122866, "epoch": 2925} {"train_loss": -6.515056610107422, "global_step": 122867, "epoch": 2925} {"train_loss": -6.698574542999268, "global_step": 122868, "epoch": 2925} {"train_loss": -6.566327095031738, "global_step": 122869, "epoch": 2925} {"train_loss": -6.570291996002197, "global_step": 122870, "epoch": 2925} {"train_loss": -6.699201583862305, "global_step": 122871, "epoch": 2925} {"train_loss": -6.660635471343994, "global_step": 122872, "epoch": 2925} {"train_loss": -6.6223578453063965, "global_step": 122873, "epoch": 2925} {"train_loss": -6.566305160522461, "global_step": 122874, "epoch": 2925} {"train_loss": -6.562166690826416, "global_step": 122875, "epoch": 2925} {"train_loss": -6.581397533416748, "global_step": 122876, "epoch": 2925} {"train_loss": -6.705056190490723, "global_step": 122877, "epoch": 2925} {"train_loss": -6.6188507080078125, "global_step": 122878, "epoch": 2925} {"train_loss": -6.623806953430176, "global_step": 122879, "epoch": 2925} {"train_loss": -6.700614929199219, "global_step": 122880, "epoch": 2925} {"train_loss": -6.57936954498291, "global_step": 122881, "epoch": 2925} {"train_loss": -6.550840377807617, "global_step": 122882, "epoch": 2925} {"train_loss": -6.604314804077148, "global_step": 122883, "epoch": 2925} {"train_loss": -6.72260046005249, "global_step": 122884, "epoch": 2925} {"train_loss": -6.609531402587891, "global_step": 122885, "epoch": 2925} {"train_loss": -6.543858051300049, "global_step": 122886, "epoch": 2925} {"train_loss": -6.654458522796631, "global_step": 122887, "epoch": 2925} {"train_loss": -6.5637383460998535, "global_step": 122888, "epoch": 2925} {"train_loss": -6.672729015350342, "global_step": 122889, "epoch": 2925} {"train_loss": -6.642552375793457, "global_step": 122890, "epoch": 2925} {"train_loss": -6.597693307059152, "global_step": 122891, "epoch": 2925, "val_loss": 65833.0546875} {"train_loss": -6.501097679138184, "global_step": 122892, "epoch": 2926} {"train_loss": -6.559266090393066, "global_step": 122893, "epoch": 2926} {"train_loss": -6.4542012214660645, "global_step": 122894, "epoch": 2926} {"train_loss": -6.508974552154541, "global_step": 122895, "epoch": 2926} {"train_loss": -6.65592098236084, "global_step": 122896, "epoch": 2926} {"train_loss": -6.602980613708496, "global_step": 122897, "epoch": 2926} {"train_loss": -6.567958354949951, "global_step": 122898, "epoch": 2926} {"train_loss": -6.597472190856934, "global_step": 122899, "epoch": 2926} {"train_loss": -6.515651702880859, "global_step": 122900, "epoch": 2926} {"train_loss": -6.616084098815918, "global_step": 122901, "epoch": 2926} {"train_loss": -6.518667221069336, "global_step": 122902, "epoch": 2926} {"train_loss": -6.595097541809082, "global_step": 122903, "epoch": 2926} {"train_loss": -6.686203479766846, "global_step": 122904, "epoch": 2926} {"train_loss": -6.579237461090088, "global_step": 122905, "epoch": 2926} {"train_loss": -6.662498950958252, "global_step": 122906, "epoch": 2926} {"train_loss": -6.736828804016113, "global_step": 122907, "epoch": 2926} {"train_loss": -6.576949119567871, "global_step": 122908, "epoch": 2926} {"train_loss": -6.5961809158325195, "global_step": 122909, "epoch": 2926} {"train_loss": -6.683976650238037, "global_step": 122910, "epoch": 2926} {"train_loss": -6.6912713050842285, "global_step": 122911, "epoch": 2926} {"train_loss": -6.729406833648682, "global_step": 122912, "epoch": 2926} {"train_loss": -6.59678840637207, "global_step": 122913, "epoch": 2926} {"train_loss": -6.5299787521362305, "global_step": 122914, "epoch": 2926} {"train_loss": -6.563882827758789, "global_step": 122915, "epoch": 2926} {"train_loss": -6.573503494262695, "global_step": 122916, "epoch": 2926} {"train_loss": -6.6258649826049805, "global_step": 122917, "epoch": 2926} {"train_loss": -6.546791076660156, "global_step": 122918, "epoch": 2926} {"train_loss": -6.580338478088379, "global_step": 122919, "epoch": 2926} {"train_loss": -6.535579681396484, "global_step": 122920, "epoch": 2926} {"train_loss": -6.643476963043213, "global_step": 122921, "epoch": 2926} {"train_loss": -6.68705940246582, "global_step": 122922, "epoch": 2926} {"train_loss": -6.558282852172852, "global_step": 122923, "epoch": 2926} {"train_loss": -6.641587257385254, "global_step": 122924, "epoch": 2926} {"train_loss": -6.615909576416016, "global_step": 122925, "epoch": 2926} {"train_loss": -6.609349250793457, "global_step": 122926, "epoch": 2926} {"train_loss": -6.5678205490112305, "global_step": 122927, "epoch": 2926} {"train_loss": -6.643989562988281, "global_step": 122928, "epoch": 2926} {"train_loss": -6.632912635803223, "global_step": 122929, "epoch": 2926} {"train_loss": -6.61466121673584, "global_step": 122930, "epoch": 2926} {"train_loss": -6.494560718536377, "global_step": 122931, "epoch": 2926} {"train_loss": -6.623127460479736, "global_step": 122932, "epoch": 2926} {"train_loss": -6.595501911072504, "global_step": 122933, "epoch": 2926, "val_loss": 66106.359375} {"train_loss": -6.407818794250488, "global_step": 122934, "epoch": 2927} {"train_loss": -6.591142654418945, "global_step": 122935, "epoch": 2927} {"train_loss": -6.6013031005859375, "global_step": 122936, "epoch": 2927} {"train_loss": -6.484155178070068, "global_step": 122937, "epoch": 2927} {"train_loss": -6.598554611206055, "global_step": 122938, "epoch": 2927} {"train_loss": -6.688335418701172, "global_step": 122939, "epoch": 2927} {"train_loss": -6.6160736083984375, "global_step": 122940, "epoch": 2927} {"train_loss": -6.621793270111084, "global_step": 122941, "epoch": 2927} {"train_loss": -6.647095680236816, "global_step": 122942, "epoch": 2927} {"train_loss": -6.678572654724121, "global_step": 122943, "epoch": 2927} {"train_loss": -6.613439559936523, "global_step": 122944, "epoch": 2927} {"train_loss": -6.578207969665527, "global_step": 122945, "epoch": 2927} {"train_loss": -6.641691207885742, "global_step": 122946, "epoch": 2927} {"train_loss": -6.667860984802246, "global_step": 122947, "epoch": 2927} {"train_loss": -6.626537322998047, "global_step": 122948, "epoch": 2927} {"train_loss": -6.472029209136963, "global_step": 122949, "epoch": 2927} {"train_loss": -6.6508636474609375, "global_step": 122950, "epoch": 2927} {"train_loss": -6.731175422668457, "global_step": 122951, "epoch": 2927} {"train_loss": -6.477855682373047, "global_step": 122952, "epoch": 2927} {"train_loss": -6.477896213531494, "global_step": 122953, "epoch": 2927} {"train_loss": -6.668225288391113, "global_step": 122954, "epoch": 2927} {"train_loss": -6.562487602233887, "global_step": 122955, "epoch": 2927} {"train_loss": -6.5946855545043945, "global_step": 122956, "epoch": 2927} {"train_loss": -6.638585090637207, "global_step": 122957, "epoch": 2927} {"train_loss": -6.620358467102051, "global_step": 122958, "epoch": 2927} {"train_loss": -6.59954833984375, "global_step": 122959, "epoch": 2927} {"train_loss": -6.582200050354004, "global_step": 122960, "epoch": 2927} {"train_loss": -6.5640363693237305, "global_step": 122961, "epoch": 2927} {"train_loss": -6.498210906982422, "global_step": 122962, "epoch": 2927} {"train_loss": -6.608913421630859, "global_step": 122963, "epoch": 2927} {"train_loss": -6.599020004272461, "global_step": 122964, "epoch": 2927} {"train_loss": -6.597975730895996, "global_step": 122965, "epoch": 2927} {"train_loss": -6.682726860046387, "global_step": 122966, "epoch": 2927} {"train_loss": -6.486716270446777, "global_step": 122967, "epoch": 2927} {"train_loss": -6.596312046051025, "global_step": 122968, "epoch": 2927} {"train_loss": -6.695213317871094, "global_step": 122969, "epoch": 2927} {"train_loss": -6.622654914855957, "global_step": 122970, "epoch": 2927} {"train_loss": -6.571868419647217, "global_step": 122971, "epoch": 2927} {"train_loss": -6.650579452514648, "global_step": 122972, "epoch": 2927} {"train_loss": -6.689054012298584, "global_step": 122973, "epoch": 2927} {"train_loss": -6.6589250564575195, "global_step": 122974, "epoch": 2927} {"train_loss": -6.604276407332647, "global_step": 122975, "epoch": 2927, "val_loss": 65854.859375} {"train_loss": -6.665694236755371, "global_step": 122976, "epoch": 2928} {"train_loss": -6.559532165527344, "global_step": 122977, "epoch": 2928} {"train_loss": -6.79398250579834, "global_step": 122978, "epoch": 2928} {"train_loss": -6.549576282501221, "global_step": 122979, "epoch": 2928} {"train_loss": -6.531294345855713, "global_step": 122980, "epoch": 2928} {"train_loss": -6.695095062255859, "global_step": 122981, "epoch": 2928} {"train_loss": -6.5728960037231445, "global_step": 122982, "epoch": 2928} {"train_loss": -6.624191761016846, "global_step": 122983, "epoch": 2928} {"train_loss": -6.618303298950195, "global_step": 122984, "epoch": 2928} {"train_loss": -6.583102226257324, "global_step": 122985, "epoch": 2928} {"train_loss": -6.710211753845215, "global_step": 122986, "epoch": 2928} {"train_loss": -6.541743755340576, "global_step": 122987, "epoch": 2928} {"train_loss": -6.691537380218506, "global_step": 122988, "epoch": 2928} {"train_loss": -6.81427001953125, "global_step": 122989, "epoch": 2928} {"train_loss": -6.590027809143066, "global_step": 122990, "epoch": 2928} {"train_loss": -6.50724458694458, "global_step": 122991, "epoch": 2928} {"train_loss": -6.678194046020508, "global_step": 122992, "epoch": 2928} {"train_loss": -6.617004871368408, "global_step": 122993, "epoch": 2928} {"train_loss": -6.578612327575684, "global_step": 122994, "epoch": 2928} {"train_loss": -6.623714447021484, "global_step": 122995, "epoch": 2928} {"train_loss": -6.510801315307617, "global_step": 122996, "epoch": 2928} {"train_loss": -6.596370697021484, "global_step": 122997, "epoch": 2928} {"train_loss": -6.7033514976501465, "global_step": 122998, "epoch": 2928} {"train_loss": -6.631393909454346, "global_step": 122999, "epoch": 2928} {"train_loss": -6.563656330108643, "global_step": 123000, "epoch": 2928} {"train_loss": -6.506649017333984, "global_step": 123001, "epoch": 2928} {"train_loss": -6.60156774520874, "global_step": 123002, "epoch": 2928} {"train_loss": -6.420744895935059, "global_step": 123003, "epoch": 2928} {"train_loss": -6.650554180145264, "global_step": 123004, "epoch": 2928} {"train_loss": -6.545574188232422, "global_step": 123005, "epoch": 2928} {"train_loss": -6.627140045166016, "global_step": 123006, "epoch": 2928} {"train_loss": -6.562715530395508, "global_step": 123007, "epoch": 2928} {"train_loss": -6.583540439605713, "global_step": 123008, "epoch": 2928} {"train_loss": -6.641659736633301, "global_step": 123009, "epoch": 2928} {"train_loss": -6.523388385772705, "global_step": 123010, "epoch": 2928} {"train_loss": -6.625695705413818, "global_step": 123011, "epoch": 2928} {"train_loss": -6.468852519989014, "global_step": 123012, "epoch": 2928} {"train_loss": -6.5545148849487305, "global_step": 123013, "epoch": 2928} {"train_loss": -6.590035438537598, "global_step": 123014, "epoch": 2928} {"train_loss": -6.568550109863281, "global_step": 123015, "epoch": 2928} {"train_loss": -6.5286688804626465, "global_step": 123016, "epoch": 2928} {"train_loss": -6.6012836410885765, "global_step": 123017, "epoch": 2928, "val_loss": 65952.5859375} {"train_loss": -6.567336082458496, "global_step": 123018, "epoch": 2929} {"train_loss": -6.5458760261535645, "global_step": 123019, "epoch": 2929} {"train_loss": -6.690694808959961, "global_step": 123020, "epoch": 2929} {"train_loss": -6.596592903137207, "global_step": 123021, "epoch": 2929} {"train_loss": -6.6004180908203125, "global_step": 123022, "epoch": 2929} {"train_loss": -6.64724063873291, "global_step": 123023, "epoch": 2929} {"train_loss": -6.6283979415893555, "global_step": 123024, "epoch": 2929} {"train_loss": -6.603517532348633, "global_step": 123025, "epoch": 2929} {"train_loss": -6.56567907333374, "global_step": 123026, "epoch": 2929} {"train_loss": -6.588362693786621, "global_step": 123027, "epoch": 2929} {"train_loss": -6.572094917297363, "global_step": 123028, "epoch": 2929} {"train_loss": -6.631762981414795, "global_step": 123029, "epoch": 2929} {"train_loss": -6.577052593231201, "global_step": 123030, "epoch": 2929} {"train_loss": -6.637462139129639, "global_step": 123031, "epoch": 2929} {"train_loss": -6.595652103424072, "global_step": 123032, "epoch": 2929} {"train_loss": -6.653162956237793, "global_step": 123033, "epoch": 2929} {"train_loss": -6.649176597595215, "global_step": 123034, "epoch": 2929} {"train_loss": -6.763896465301514, "global_step": 123035, "epoch": 2929} {"train_loss": -6.633219242095947, "global_step": 123036, "epoch": 2929} {"train_loss": -6.651533603668213, "global_step": 123037, "epoch": 2929} {"train_loss": -6.685132026672363, "global_step": 123038, "epoch": 2929} {"train_loss": -6.623207092285156, "global_step": 123039, "epoch": 2929} {"train_loss": -6.536773681640625, "global_step": 123040, "epoch": 2929} {"train_loss": -6.58566951751709, "global_step": 123041, "epoch": 2929} {"train_loss": -6.739544868469238, "global_step": 123042, "epoch": 2929} {"train_loss": -6.597375869750977, "global_step": 123043, "epoch": 2929} {"train_loss": -6.651230812072754, "global_step": 123044, "epoch": 2929} {"train_loss": -6.600398063659668, "global_step": 123045, "epoch": 2929} {"train_loss": -6.648571014404297, "global_step": 123046, "epoch": 2929} {"train_loss": -6.656033039093018, "global_step": 123047, "epoch": 2929} {"train_loss": -6.772977828979492, "global_step": 123048, "epoch": 2929} {"train_loss": -6.471038818359375, "global_step": 123049, "epoch": 2929} {"train_loss": -6.66176700592041, "global_step": 123050, "epoch": 2929} {"train_loss": -6.637502670288086, "global_step": 123051, "epoch": 2929} {"train_loss": -6.598994255065918, "global_step": 123052, "epoch": 2929} {"train_loss": -6.706113815307617, "global_step": 123053, "epoch": 2929} {"train_loss": -6.539618492126465, "global_step": 123054, "epoch": 2929} {"train_loss": -6.474921226501465, "global_step": 123055, "epoch": 2929} {"train_loss": -6.572843551635742, "global_step": 123056, "epoch": 2929} {"train_loss": -6.637076377868652, "global_step": 123057, "epoch": 2929} {"train_loss": -6.533018112182617, "global_step": 123058, "epoch": 2929} {"train_loss": -6.6203882694244385, "global_step": 123059, "epoch": 2929, "val_loss": 65996.4921875} {"train_loss": -6.719728469848633, "global_step": 123060, "epoch": 2930} {"train_loss": -6.649228096008301, "global_step": 123061, "epoch": 2930} {"train_loss": -6.673439979553223, "global_step": 123062, "epoch": 2930} {"train_loss": -6.7499098777771, "global_step": 123063, "epoch": 2930} {"train_loss": -6.5960493087768555, "global_step": 123064, "epoch": 2930} {"train_loss": -6.642917633056641, "global_step": 123065, "epoch": 2930} {"train_loss": -6.537148475646973, "global_step": 123066, "epoch": 2930} {"train_loss": -6.612344264984131, "global_step": 123067, "epoch": 2930} {"train_loss": -6.638671875, "global_step": 123068, "epoch": 2930} {"train_loss": -6.67208194732666, "global_step": 123069, "epoch": 2930} {"train_loss": -6.629377365112305, "global_step": 123070, "epoch": 2930} {"train_loss": -6.655388832092285, "global_step": 123071, "epoch": 2930} {"train_loss": -6.656090259552002, "global_step": 123072, "epoch": 2930} {"train_loss": -6.578135967254639, "global_step": 123073, "epoch": 2930} {"train_loss": -6.767430305480957, "global_step": 123074, "epoch": 2930} {"train_loss": -6.608906269073486, "global_step": 123075, "epoch": 2930} {"train_loss": -6.6445136070251465, "global_step": 123076, "epoch": 2930} {"train_loss": -6.7039923667907715, "global_step": 123077, "epoch": 2930} {"train_loss": -6.441586971282959, "global_step": 123078, "epoch": 2930} {"train_loss": -6.733878135681152, "global_step": 123079, "epoch": 2930} {"train_loss": -6.572915077209473, "global_step": 123080, "epoch": 2930} {"train_loss": -6.503657341003418, "global_step": 123081, "epoch": 2930} {"train_loss": -6.600494384765625, "global_step": 123082, "epoch": 2930} {"train_loss": -6.659050464630127, "global_step": 123083, "epoch": 2930} {"train_loss": -6.724360942840576, "global_step": 123084, "epoch": 2930} {"train_loss": -6.576229572296143, "global_step": 123085, "epoch": 2930} {"train_loss": -6.57974910736084, "global_step": 123086, "epoch": 2930} {"train_loss": -6.588820934295654, "global_step": 123087, "epoch": 2930} {"train_loss": -6.506755352020264, "global_step": 123088, "epoch": 2930} {"train_loss": -6.534931659698486, "global_step": 123089, "epoch": 2930} {"train_loss": -6.625393867492676, "global_step": 123090, "epoch": 2930} {"train_loss": -6.582125663757324, "global_step": 123091, "epoch": 2930} {"train_loss": -6.517478942871094, "global_step": 123092, "epoch": 2930} {"train_loss": -6.626067161560059, "global_step": 123093, "epoch": 2930} {"train_loss": -6.6243085861206055, "global_step": 123094, "epoch": 2930} {"train_loss": -6.595175743103027, "global_step": 123095, "epoch": 2930} {"train_loss": -6.67596435546875, "global_step": 123096, "epoch": 2930} {"train_loss": -6.715084075927734, "global_step": 123097, "epoch": 2930} {"train_loss": -6.504401206970215, "global_step": 123098, "epoch": 2930} {"train_loss": -6.555014133453369, "global_step": 123099, "epoch": 2930} {"train_loss": -6.5302510261535645, "global_step": 123100, "epoch": 2930} {"train_loss": -6.617193948654902, "global_step": 123101, "epoch": 2930, "val_loss": 66113.7265625} {"train_loss": -6.462369918823242, "global_step": 123102, "epoch": 2931} {"train_loss": -6.578036308288574, "global_step": 123103, "epoch": 2931} {"train_loss": -6.647721767425537, "global_step": 123104, "epoch": 2931} {"train_loss": -6.661975860595703, "global_step": 123105, "epoch": 2931} {"train_loss": -6.563261032104492, "global_step": 123106, "epoch": 2931} {"train_loss": -6.630330562591553, "global_step": 123107, "epoch": 2931} {"train_loss": -6.406027793884277, "global_step": 123108, "epoch": 2931} {"train_loss": -6.595039367675781, "global_step": 123109, "epoch": 2931} {"train_loss": -6.613585948944092, "global_step": 123110, "epoch": 2931} {"train_loss": -6.446903228759766, "global_step": 123111, "epoch": 2931} {"train_loss": -6.545310020446777, "global_step": 123112, "epoch": 2931} {"train_loss": -6.653168201446533, "global_step": 123113, "epoch": 2931} {"train_loss": -6.650279521942139, "global_step": 123114, "epoch": 2931} {"train_loss": -6.590575218200684, "global_step": 123115, "epoch": 2931} {"train_loss": -6.637631416320801, "global_step": 123116, "epoch": 2931} {"train_loss": -6.566473960876465, "global_step": 123117, "epoch": 2931} {"train_loss": -6.6068620681762695, "global_step": 123118, "epoch": 2931} {"train_loss": -6.58928108215332, "global_step": 123119, "epoch": 2931} {"train_loss": -6.714890480041504, "global_step": 123120, "epoch": 2931} {"train_loss": -6.5465288162231445, "global_step": 123121, "epoch": 2931} {"train_loss": -6.486347198486328, "global_step": 123122, "epoch": 2931} {"train_loss": -6.570699214935303, "global_step": 123123, "epoch": 2931} {"train_loss": -6.563299655914307, "global_step": 123124, "epoch": 2931} {"train_loss": -6.461187362670898, "global_step": 123125, "epoch": 2931} {"train_loss": -6.5303850173950195, "global_step": 123126, "epoch": 2931} {"train_loss": -6.470335960388184, "global_step": 123127, "epoch": 2931} {"train_loss": -6.559144020080566, "global_step": 123128, "epoch": 2931} {"train_loss": -6.568700790405273, "global_step": 123129, "epoch": 2931} {"train_loss": -6.671708106994629, "global_step": 123130, "epoch": 2931} {"train_loss": -6.470323085784912, "global_step": 123131, "epoch": 2931} {"train_loss": -6.491182327270508, "global_step": 123132, "epoch": 2931} {"train_loss": -6.481448173522949, "global_step": 123133, "epoch": 2931} {"train_loss": -6.508431434631348, "global_step": 123134, "epoch": 2931} {"train_loss": -6.433640956878662, "global_step": 123135, "epoch": 2931} {"train_loss": -6.428836822509766, "global_step": 123136, "epoch": 2931} {"train_loss": -6.4952826499938965, "global_step": 123137, "epoch": 2931} {"train_loss": -6.545366287231445, "global_step": 123138, "epoch": 2931} {"train_loss": -6.602102279663086, "global_step": 123139, "epoch": 2931} {"train_loss": -6.419282913208008, "global_step": 123140, "epoch": 2931} {"train_loss": -6.544557571411133, "global_step": 123141, "epoch": 2931} {"train_loss": -6.554435729980469, "global_step": 123142, "epoch": 2931} {"train_loss": -6.550126075744629, "global_step": 123143, "epoch": 2931, "val_loss": 66220.2109375} {"train_loss": -6.482767105102539, "global_step": 123144, "epoch": 2932} {"train_loss": -6.513893127441406, "global_step": 123145, "epoch": 2932} {"train_loss": -6.5783610343933105, "global_step": 123146, "epoch": 2932} {"train_loss": -6.501772880554199, "global_step": 123147, "epoch": 2932} {"train_loss": -6.565433502197266, "global_step": 123148, "epoch": 2932} {"train_loss": -6.492867469787598, "global_step": 123149, "epoch": 2932} {"train_loss": -6.599935054779053, "global_step": 123150, "epoch": 2932} {"train_loss": -6.473719120025635, "global_step": 123151, "epoch": 2932} {"train_loss": -6.476929664611816, "global_step": 123152, "epoch": 2932} {"train_loss": -6.561577796936035, "global_step": 123153, "epoch": 2932} {"train_loss": -6.611042022705078, "global_step": 123154, "epoch": 2932} {"train_loss": -6.682308197021484, "global_step": 123155, "epoch": 2932} {"train_loss": -6.67434024810791, "global_step": 123156, "epoch": 2932} {"train_loss": -6.651089191436768, "global_step": 123157, "epoch": 2932} {"train_loss": -6.62636137008667, "global_step": 123158, "epoch": 2932} {"train_loss": -6.583798408508301, "global_step": 123159, "epoch": 2932} {"train_loss": -6.605184078216553, "global_step": 123160, "epoch": 2932} {"train_loss": -6.629778861999512, "global_step": 123161, "epoch": 2932} {"train_loss": -6.560133934020996, "global_step": 123162, "epoch": 2932} {"train_loss": -6.5823822021484375, "global_step": 123163, "epoch": 2932} {"train_loss": -6.673530578613281, "global_step": 123164, "epoch": 2932} {"train_loss": -6.541274547576904, "global_step": 123165, "epoch": 2932} {"train_loss": -6.585631370544434, "global_step": 123166, "epoch": 2932} {"train_loss": -6.508812427520752, "global_step": 123167, "epoch": 2932} {"train_loss": -6.586380481719971, "global_step": 123168, "epoch": 2932} {"train_loss": -6.455227851867676, "global_step": 123169, "epoch": 2932} {"train_loss": -6.667773246765137, "global_step": 123170, "epoch": 2932} {"train_loss": -6.666685581207275, "global_step": 123171, "epoch": 2932} {"train_loss": -6.641264915466309, "global_step": 123172, "epoch": 2932} {"train_loss": -6.5239691734313965, "global_step": 123173, "epoch": 2932} {"train_loss": -6.606390476226807, "global_step": 123174, "epoch": 2932} {"train_loss": -6.58552885055542, "global_step": 123175, "epoch": 2932} {"train_loss": -6.608077049255371, "global_step": 123176, "epoch": 2932} {"train_loss": -6.680635452270508, "global_step": 123177, "epoch": 2932} {"train_loss": -6.642275810241699, "global_step": 123178, "epoch": 2932} {"train_loss": -6.578493118286133, "global_step": 123179, "epoch": 2932} {"train_loss": -6.709875106811523, "global_step": 123180, "epoch": 2932} {"train_loss": -6.635834693908691, "global_step": 123181, "epoch": 2932} {"train_loss": -6.6349053382873535, "global_step": 123182, "epoch": 2932} {"train_loss": -6.674910068511963, "global_step": 123183, "epoch": 2932} {"train_loss": -6.568036079406738, "global_step": 123184, "epoch": 2932} {"train_loss": -6.594196614764986, "global_step": 123185, "epoch": 2932, "val_loss": 66016.015625} {"train_loss": -6.612389087677002, "global_step": 123186, "epoch": 2933} {"train_loss": -6.536380767822266, "global_step": 123187, "epoch": 2933} {"train_loss": -6.638641357421875, "global_step": 123188, "epoch": 2933} {"train_loss": -6.600987434387207, "global_step": 123189, "epoch": 2933} {"train_loss": -6.61151123046875, "global_step": 123190, "epoch": 2933} {"train_loss": -6.496381759643555, "global_step": 123191, "epoch": 2933} {"train_loss": -6.574759006500244, "global_step": 123192, "epoch": 2933} {"train_loss": -6.577548980712891, "global_step": 123193, "epoch": 2933} {"train_loss": -6.540619373321533, "global_step": 123194, "epoch": 2933} {"train_loss": -6.375106334686279, "global_step": 123195, "epoch": 2933} {"train_loss": -6.463776588439941, "global_step": 123196, "epoch": 2933} {"train_loss": -6.382689476013184, "global_step": 123197, "epoch": 2933} {"train_loss": -6.381577968597412, "global_step": 123198, "epoch": 2933} {"train_loss": -6.553134918212891, "global_step": 123199, "epoch": 2933} {"train_loss": -6.423857688903809, "global_step": 123200, "epoch": 2933} {"train_loss": -6.558310031890869, "global_step": 123201, "epoch": 2933} {"train_loss": -6.460942268371582, "global_step": 123202, "epoch": 2933} {"train_loss": -6.503983020782471, "global_step": 123203, "epoch": 2933} {"train_loss": -6.5178446769714355, "global_step": 123204, "epoch": 2933} {"train_loss": -6.439082145690918, "global_step": 123205, "epoch": 2933} {"train_loss": -6.543207168579102, "global_step": 123206, "epoch": 2933} {"train_loss": -6.609155654907227, "global_step": 123207, "epoch": 2933} {"train_loss": -6.520925521850586, "global_step": 123208, "epoch": 2933} {"train_loss": -6.496062278747559, "global_step": 123209, "epoch": 2933} {"train_loss": -6.505692005157471, "global_step": 123210, "epoch": 2933} {"train_loss": -6.56301212310791, "global_step": 123211, "epoch": 2933} {"train_loss": -6.595808029174805, "global_step": 123212, "epoch": 2933} {"train_loss": -6.517596244812012, "global_step": 123213, "epoch": 2933} {"train_loss": -6.628787040710449, "global_step": 123214, "epoch": 2933} {"train_loss": -6.471320629119873, "global_step": 123215, "epoch": 2933} {"train_loss": -6.600015163421631, "global_step": 123216, "epoch": 2933} {"train_loss": -6.569622039794922, "global_step": 123217, "epoch": 2933} {"train_loss": -6.578427314758301, "global_step": 123218, "epoch": 2933} {"train_loss": -6.612164497375488, "global_step": 123219, "epoch": 2933} {"train_loss": -6.585709571838379, "global_step": 123220, "epoch": 2933} {"train_loss": -6.594343185424805, "global_step": 123221, "epoch": 2933} {"train_loss": -6.525890350341797, "global_step": 123222, "epoch": 2933} {"train_loss": -6.570122718811035, "global_step": 123223, "epoch": 2933} {"train_loss": -6.607556343078613, "global_step": 123224, "epoch": 2933} {"train_loss": -6.674767017364502, "global_step": 123225, "epoch": 2933} {"train_loss": -6.587564468383789, "global_step": 123226, "epoch": 2933} {"train_loss": -6.542149135044643, "global_step": 123227, "epoch": 2933, "val_loss": 65852.71875} {"train_loss": -6.63645601272583, "global_step": 123228, "epoch": 2934} {"train_loss": -6.619098663330078, "global_step": 123229, "epoch": 2934} {"train_loss": -6.727945327758789, "global_step": 123230, "epoch": 2934} {"train_loss": -6.617636680603027, "global_step": 123231, "epoch": 2934} {"train_loss": -6.568879127502441, "global_step": 123232, "epoch": 2934} {"train_loss": -6.617447853088379, "global_step": 123233, "epoch": 2934} {"train_loss": -6.638199806213379, "global_step": 123234, "epoch": 2934} {"train_loss": -6.600521564483643, "global_step": 123235, "epoch": 2934} {"train_loss": -6.632131099700928, "global_step": 123236, "epoch": 2934} {"train_loss": -6.622820854187012, "global_step": 123237, "epoch": 2934} {"train_loss": -6.703686714172363, "global_step": 123238, "epoch": 2934} {"train_loss": -6.634740829467773, "global_step": 123239, "epoch": 2934} {"train_loss": -6.514824390411377, "global_step": 123240, "epoch": 2934} {"train_loss": -6.627920150756836, "global_step": 123241, "epoch": 2934} {"train_loss": -6.665708541870117, "global_step": 123242, "epoch": 2934} {"train_loss": -6.594478130340576, "global_step": 123243, "epoch": 2934} {"train_loss": -6.596488952636719, "global_step": 123244, "epoch": 2934} {"train_loss": -6.572439193725586, "global_step": 123245, "epoch": 2934} {"train_loss": -6.566962242126465, "global_step": 123246, "epoch": 2934} {"train_loss": -6.6860551834106445, "global_step": 123247, "epoch": 2934} {"train_loss": -6.616037845611572, "global_step": 123248, "epoch": 2934} {"train_loss": -6.508257865905762, "global_step": 123249, "epoch": 2934} {"train_loss": -6.590278625488281, "global_step": 123250, "epoch": 2934} {"train_loss": -6.632479667663574, "global_step": 123251, "epoch": 2934} {"train_loss": -6.70558500289917, "global_step": 123252, "epoch": 2934} {"train_loss": -6.646120548248291, "global_step": 123253, "epoch": 2934} {"train_loss": -6.694846153259277, "global_step": 123254, "epoch": 2934} {"train_loss": -6.6251444816589355, "global_step": 123255, "epoch": 2934} {"train_loss": -6.598197937011719, "global_step": 123256, "epoch": 2934} {"train_loss": -6.672859191894531, "global_step": 123257, "epoch": 2934} {"train_loss": -6.679598808288574, "global_step": 123258, "epoch": 2934} {"train_loss": -6.603031158447266, "global_step": 123259, "epoch": 2934} {"train_loss": -6.544315338134766, "global_step": 123260, "epoch": 2934} {"train_loss": -6.579366683959961, "global_step": 123261, "epoch": 2934} {"train_loss": -6.671601295471191, "global_step": 123262, "epoch": 2934} {"train_loss": -6.660195350646973, "global_step": 123263, "epoch": 2934} {"train_loss": -6.588585376739502, "global_step": 123264, "epoch": 2934} {"train_loss": -6.6468095779418945, "global_step": 123265, "epoch": 2934} {"train_loss": -6.5636725425720215, "global_step": 123266, "epoch": 2934} {"train_loss": -6.680863380432129, "global_step": 123267, "epoch": 2934} {"train_loss": -6.611786365509033, "global_step": 123268, "epoch": 2934} {"train_loss": -6.6216206550598145, "global_step": 123269, "epoch": 2934, "val_loss": 66019.0546875} {"train_loss": -6.509939670562744, "global_step": 123270, "epoch": 2935} {"train_loss": -6.6131744384765625, "global_step": 123271, "epoch": 2935} {"train_loss": -6.5133280754089355, "global_step": 123272, "epoch": 2935} {"train_loss": -6.611943244934082, "global_step": 123273, "epoch": 2935} {"train_loss": -6.728233337402344, "global_step": 123274, "epoch": 2935} {"train_loss": -6.569351673126221, "global_step": 123275, "epoch": 2935} {"train_loss": -6.636952877044678, "global_step": 123276, "epoch": 2935} {"train_loss": -6.60173225402832, "global_step": 123277, "epoch": 2935} {"train_loss": -6.711008548736572, "global_step": 123278, "epoch": 2935} {"train_loss": -6.500892639160156, "global_step": 123279, "epoch": 2935} {"train_loss": -6.6371169090271, "global_step": 123280, "epoch": 2935} {"train_loss": -6.541083335876465, "global_step": 123281, "epoch": 2935} {"train_loss": -6.642242431640625, "global_step": 123282, "epoch": 2935} {"train_loss": -6.627625465393066, "global_step": 123283, "epoch": 2935} {"train_loss": -6.483067989349365, "global_step": 123284, "epoch": 2935} {"train_loss": -6.644948959350586, "global_step": 123285, "epoch": 2935} {"train_loss": -6.6432600021362305, "global_step": 123286, "epoch": 2935} {"train_loss": -6.735020637512207, "global_step": 123287, "epoch": 2935} {"train_loss": -6.602059364318848, "global_step": 123288, "epoch": 2935} {"train_loss": -6.714322090148926, "global_step": 123289, "epoch": 2935} {"train_loss": -6.597346305847168, "global_step": 123290, "epoch": 2935} {"train_loss": -6.6569414138793945, "global_step": 123291, "epoch": 2935} {"train_loss": -6.5934343338012695, "global_step": 123292, "epoch": 2935} {"train_loss": -6.6592512130737305, "global_step": 123293, "epoch": 2935} {"train_loss": -6.695123672485352, "global_step": 123294, "epoch": 2935} {"train_loss": -6.670475006103516, "global_step": 123295, "epoch": 2935} {"train_loss": -6.746679306030273, "global_step": 123296, "epoch": 2935} {"train_loss": -6.777733325958252, "global_step": 123297, "epoch": 2935} {"train_loss": -6.69282341003418, "global_step": 123298, "epoch": 2935} {"train_loss": -6.651928901672363, "global_step": 123299, "epoch": 2935} {"train_loss": -6.566211700439453, "global_step": 123300, "epoch": 2935} {"train_loss": -6.578124046325684, "global_step": 123301, "epoch": 2935} {"train_loss": -6.73908805847168, "global_step": 123302, "epoch": 2935} {"train_loss": -6.5963287353515625, "global_step": 123303, "epoch": 2935} {"train_loss": -6.548410415649414, "global_step": 123304, "epoch": 2935} {"train_loss": -6.60944128036499, "global_step": 123305, "epoch": 2935} {"train_loss": -6.609394550323486, "global_step": 123306, "epoch": 2935} {"train_loss": -6.6095757484436035, "global_step": 123307, "epoch": 2935} {"train_loss": -6.673427581787109, "global_step": 123308, "epoch": 2935} {"train_loss": -6.505380630493164, "global_step": 123309, "epoch": 2935} {"train_loss": -6.585204124450684, "global_step": 123310, "epoch": 2935} {"train_loss": -6.621961650394258, "global_step": 123311, "epoch": 2935, "val_loss": 65904.546875} {"train_loss": -6.655564308166504, "global_step": 123312, "epoch": 2936} {"train_loss": -6.606984615325928, "global_step": 123313, "epoch": 2936} {"train_loss": -6.590360641479492, "global_step": 123314, "epoch": 2936} {"train_loss": -6.653384208679199, "global_step": 123315, "epoch": 2936} {"train_loss": -6.52695369720459, "global_step": 123316, "epoch": 2936} {"train_loss": -6.6210246086120605, "global_step": 123317, "epoch": 2936} {"train_loss": -6.680174827575684, "global_step": 123318, "epoch": 2936} {"train_loss": -6.6718292236328125, "global_step": 123319, "epoch": 2936} {"train_loss": -6.6660990715026855, "global_step": 123320, "epoch": 2936} {"train_loss": -6.558175563812256, "global_step": 123321, "epoch": 2936} {"train_loss": -6.718369960784912, "global_step": 123322, "epoch": 2936} {"train_loss": -6.649722099304199, "global_step": 123323, "epoch": 2936} {"train_loss": -6.67835807800293, "global_step": 123324, "epoch": 2936} {"train_loss": -6.707682132720947, "global_step": 123325, "epoch": 2936} {"train_loss": -6.589205265045166, "global_step": 123326, "epoch": 2936} {"train_loss": -6.620736598968506, "global_step": 123327, "epoch": 2936} {"train_loss": -6.592588901519775, "global_step": 123328, "epoch": 2936} {"train_loss": -6.647099018096924, "global_step": 123329, "epoch": 2936} {"train_loss": -6.72687292098999, "global_step": 123330, "epoch": 2936} {"train_loss": -6.714090347290039, "global_step": 123331, "epoch": 2936} {"train_loss": -6.581060409545898, "global_step": 123332, "epoch": 2936} {"train_loss": -6.567699909210205, "global_step": 123333, "epoch": 2936} {"train_loss": -6.566994667053223, "global_step": 123334, "epoch": 2936} {"train_loss": -6.463604927062988, "global_step": 123335, "epoch": 2936} {"train_loss": -6.4752655029296875, "global_step": 123336, "epoch": 2936} {"train_loss": -6.608203411102295, "global_step": 123337, "epoch": 2936} {"train_loss": -6.554363250732422, "global_step": 123338, "epoch": 2936} {"train_loss": -6.447131633758545, "global_step": 123339, "epoch": 2936} {"train_loss": -6.580321311950684, "global_step": 123340, "epoch": 2936} {"train_loss": -6.4151506423950195, "global_step": 123341, "epoch": 2936} {"train_loss": -6.551812171936035, "global_step": 123342, "epoch": 2936} {"train_loss": -6.452462196350098, "global_step": 123343, "epoch": 2936} {"train_loss": -6.400207042694092, "global_step": 123344, "epoch": 2936} {"train_loss": -6.555652618408203, "global_step": 123345, "epoch": 2936} {"train_loss": -6.39247989654541, "global_step": 123346, "epoch": 2936} {"train_loss": -6.64206600189209, "global_step": 123347, "epoch": 2936} {"train_loss": -6.521946907043457, "global_step": 123348, "epoch": 2936} {"train_loss": -6.531999588012695, "global_step": 123349, "epoch": 2936} {"train_loss": -6.574108123779297, "global_step": 123350, "epoch": 2936} {"train_loss": -6.563815116882324, "global_step": 123351, "epoch": 2936} {"train_loss": -6.639488220214844, "global_step": 123352, "epoch": 2936} {"train_loss": -6.5831959928785055, "global_step": 123353, "epoch": 2936, "val_loss": 66186.890625} {"train_loss": -6.613370418548584, "global_step": 123354, "epoch": 2937} {"train_loss": -6.4935197830200195, "global_step": 123355, "epoch": 2937} {"train_loss": -6.642819404602051, "global_step": 123356, "epoch": 2937} {"train_loss": -6.584791660308838, "global_step": 123357, "epoch": 2937} {"train_loss": -6.534337043762207, "global_step": 123358, "epoch": 2937} {"train_loss": -6.498737335205078, "global_step": 123359, "epoch": 2937} {"train_loss": -6.605421543121338, "global_step": 123360, "epoch": 2937} {"train_loss": -6.57342004776001, "global_step": 123361, "epoch": 2937} {"train_loss": -6.560798645019531, "global_step": 123362, "epoch": 2937} {"train_loss": -6.558318138122559, "global_step": 123363, "epoch": 2937} {"train_loss": -6.549997329711914, "global_step": 123364, "epoch": 2937} {"train_loss": -6.605462551116943, "global_step": 123365, "epoch": 2937} {"train_loss": -6.604761600494385, "global_step": 123366, "epoch": 2937} {"train_loss": -6.649416923522949, "global_step": 123367, "epoch": 2937} {"train_loss": -6.594382286071777, "global_step": 123368, "epoch": 2937} {"train_loss": -6.648207664489746, "global_step": 123369, "epoch": 2937} {"train_loss": -6.6605753898620605, "global_step": 123370, "epoch": 2937} {"train_loss": -6.731973648071289, "global_step": 123371, "epoch": 2937} {"train_loss": -6.681641578674316, "global_step": 123372, "epoch": 2937} {"train_loss": -6.596739768981934, "global_step": 123373, "epoch": 2937} {"train_loss": -6.529843330383301, "global_step": 123374, "epoch": 2937} {"train_loss": -6.502274036407471, "global_step": 123375, "epoch": 2937} {"train_loss": -6.460263252258301, "global_step": 123376, "epoch": 2937} {"train_loss": -6.531009674072266, "global_step": 123377, "epoch": 2937} {"train_loss": -6.522365093231201, "global_step": 123378, "epoch": 2937} {"train_loss": -6.545258045196533, "global_step": 123379, "epoch": 2937} {"train_loss": -6.677855491638184, "global_step": 123380, "epoch": 2937} {"train_loss": -6.556942939758301, "global_step": 123381, "epoch": 2937} {"train_loss": -6.632554054260254, "global_step": 123382, "epoch": 2937} {"train_loss": -6.5776448249816895, "global_step": 123383, "epoch": 2937} {"train_loss": -6.656546592712402, "global_step": 123384, "epoch": 2937} {"train_loss": -6.601432800292969, "global_step": 123385, "epoch": 2937} {"train_loss": -6.641093730926514, "global_step": 123386, "epoch": 2937} {"train_loss": -6.542991638183594, "global_step": 123387, "epoch": 2937} {"train_loss": -6.663914680480957, "global_step": 123388, "epoch": 2937} {"train_loss": -6.584690093994141, "global_step": 123389, "epoch": 2937} {"train_loss": -6.556450843811035, "global_step": 123390, "epoch": 2937} {"train_loss": -6.495212554931641, "global_step": 123391, "epoch": 2937} {"train_loss": -6.587512016296387, "global_step": 123392, "epoch": 2937} {"train_loss": -6.618278503417969, "global_step": 123393, "epoch": 2937} {"train_loss": -6.752130031585693, "global_step": 123394, "epoch": 2937} {"train_loss": -6.591381027584984, "global_step": 123395, "epoch": 2937, "val_loss": 65998.0546875} {"train_loss": -6.639652252197266, "global_step": 123396, "epoch": 2938} {"train_loss": -6.594130039215088, "global_step": 123397, "epoch": 2938} {"train_loss": -6.635035037994385, "global_step": 123398, "epoch": 2938} {"train_loss": -6.675050735473633, "global_step": 123399, "epoch": 2938} {"train_loss": -6.555487632751465, "global_step": 123400, "epoch": 2938} {"train_loss": -6.673980712890625, "global_step": 123401, "epoch": 2938} {"train_loss": -6.594127178192139, "global_step": 123402, "epoch": 2938} {"train_loss": -6.625967979431152, "global_step": 123403, "epoch": 2938} {"train_loss": -6.722217559814453, "global_step": 123404, "epoch": 2938} {"train_loss": -6.671778678894043, "global_step": 123405, "epoch": 2938} {"train_loss": -6.6910600662231445, "global_step": 123406, "epoch": 2938} {"train_loss": -6.641305923461914, "global_step": 123407, "epoch": 2938} {"train_loss": -6.586875915527344, "global_step": 123408, "epoch": 2938} {"train_loss": -6.693634033203125, "global_step": 123409, "epoch": 2938} {"train_loss": -6.583786964416504, "global_step": 123410, "epoch": 2938} {"train_loss": -6.582576751708984, "global_step": 123411, "epoch": 2938} {"train_loss": -6.714775085449219, "global_step": 123412, "epoch": 2938} {"train_loss": -6.719155311584473, "global_step": 123413, "epoch": 2938} {"train_loss": -6.596785545349121, "global_step": 123414, "epoch": 2938} {"train_loss": -6.585597038269043, "global_step": 123415, "epoch": 2938} {"train_loss": -6.629423141479492, "global_step": 123416, "epoch": 2938} {"train_loss": -6.665173530578613, "global_step": 123417, "epoch": 2938} {"train_loss": -6.549116611480713, "global_step": 123418, "epoch": 2938} {"train_loss": -6.642316818237305, "global_step": 123419, "epoch": 2938} {"train_loss": -6.655202388763428, "global_step": 123420, "epoch": 2938} {"train_loss": -6.616660118103027, "global_step": 123421, "epoch": 2938} {"train_loss": -6.661126136779785, "global_step": 123422, "epoch": 2938} {"train_loss": -6.732219219207764, "global_step": 123423, "epoch": 2938} {"train_loss": -6.568917274475098, "global_step": 123424, "epoch": 2938} {"train_loss": -6.670581340789795, "global_step": 123425, "epoch": 2938} {"train_loss": -6.592800140380859, "global_step": 123426, "epoch": 2938} {"train_loss": -6.633665084838867, "global_step": 123427, "epoch": 2938} {"train_loss": -6.6572489738464355, "global_step": 123428, "epoch": 2938} {"train_loss": -6.648209571838379, "global_step": 123429, "epoch": 2938} {"train_loss": -6.587512493133545, "global_step": 123430, "epoch": 2938} {"train_loss": -6.726382255554199, "global_step": 123431, "epoch": 2938} {"train_loss": -6.652498245239258, "global_step": 123432, "epoch": 2938} {"train_loss": -6.6404128074646, "global_step": 123433, "epoch": 2938} {"train_loss": -6.625226020812988, "global_step": 123434, "epoch": 2938} {"train_loss": -6.577191352844238, "global_step": 123435, "epoch": 2938} {"train_loss": -6.702422142028809, "global_step": 123436, "epoch": 2938} {"train_loss": -6.640272969291324, "global_step": 123437, "epoch": 2938, "val_loss": 65939.9765625} {"train_loss": -6.6829609870910645, "global_step": 123438, "epoch": 2939} {"train_loss": -6.615351676940918, "global_step": 123439, "epoch": 2939} {"train_loss": -6.569006443023682, "global_step": 123440, "epoch": 2939} {"train_loss": -6.60755729675293, "global_step": 123441, "epoch": 2939} {"train_loss": -6.517307281494141, "global_step": 123442, "epoch": 2939} {"train_loss": -6.654570579528809, "global_step": 123443, "epoch": 2939} {"train_loss": -6.655635833740234, "global_step": 123444, "epoch": 2939} {"train_loss": -6.640797138214111, "global_step": 123445, "epoch": 2939} {"train_loss": -6.694669723510742, "global_step": 123446, "epoch": 2939} {"train_loss": -6.627655029296875, "global_step": 123447, "epoch": 2939} {"train_loss": -6.616197109222412, "global_step": 123448, "epoch": 2939} {"train_loss": -6.6392388343811035, "global_step": 123449, "epoch": 2939} {"train_loss": -6.676020622253418, "global_step": 123450, "epoch": 2939} {"train_loss": -6.624190330505371, "global_step": 123451, "epoch": 2939} {"train_loss": -6.648259162902832, "global_step": 123452, "epoch": 2939} {"train_loss": -6.7142333984375, "global_step": 123453, "epoch": 2939} {"train_loss": -6.630773544311523, "global_step": 123454, "epoch": 2939} {"train_loss": -6.739306449890137, "global_step": 123455, "epoch": 2939} {"train_loss": -6.710298538208008, "global_step": 123456, "epoch": 2939} {"train_loss": -6.596151351928711, "global_step": 123457, "epoch": 2939} {"train_loss": -6.693352699279785, "global_step": 123458, "epoch": 2939} {"train_loss": -6.695405006408691, "global_step": 123459, "epoch": 2939} {"train_loss": -6.601401329040527, "global_step": 123460, "epoch": 2939} {"train_loss": -6.608006954193115, "global_step": 123461, "epoch": 2939} {"train_loss": -6.6358537673950195, "global_step": 123462, "epoch": 2939} {"train_loss": -6.675171852111816, "global_step": 123463, "epoch": 2939} {"train_loss": -6.501284122467041, "global_step": 123464, "epoch": 2939} {"train_loss": -6.685729026794434, "global_step": 123465, "epoch": 2939} {"train_loss": -6.689939975738525, "global_step": 123466, "epoch": 2939} {"train_loss": -6.651022911071777, "global_step": 123467, "epoch": 2939} {"train_loss": -6.561703681945801, "global_step": 123468, "epoch": 2939} {"train_loss": -6.619687557220459, "global_step": 123469, "epoch": 2939} {"train_loss": -6.597092628479004, "global_step": 123470, "epoch": 2939} {"train_loss": -6.656740665435791, "global_step": 123471, "epoch": 2939} {"train_loss": -6.627050876617432, "global_step": 123472, "epoch": 2939} {"train_loss": -6.613943099975586, "global_step": 123473, "epoch": 2939} {"train_loss": -6.602563858032227, "global_step": 123474, "epoch": 2939} {"train_loss": -6.617733001708984, "global_step": 123475, "epoch": 2939} {"train_loss": -6.630600929260254, "global_step": 123476, "epoch": 2939} {"train_loss": -6.5934157371521, "global_step": 123477, "epoch": 2939} {"train_loss": -6.584139347076416, "global_step": 123478, "epoch": 2939} {"train_loss": -6.635438760121663, "global_step": 123479, "epoch": 2939, "val_loss": 66066.2421875} {"train_loss": -6.625923156738281, "global_step": 123480, "epoch": 2940} {"train_loss": -6.668409824371338, "global_step": 123481, "epoch": 2940} {"train_loss": -6.63154411315918, "global_step": 123482, "epoch": 2940} {"train_loss": -6.668527603149414, "global_step": 123483, "epoch": 2940} {"train_loss": -6.671769142150879, "global_step": 123484, "epoch": 2940} {"train_loss": -6.630443572998047, "global_step": 123485, "epoch": 2940} {"train_loss": -6.619946479797363, "global_step": 123486, "epoch": 2940} {"train_loss": -6.503679275512695, "global_step": 123487, "epoch": 2940} {"train_loss": -6.616334438323975, "global_step": 123488, "epoch": 2940} {"train_loss": -6.609413146972656, "global_step": 123489, "epoch": 2940} {"train_loss": -6.577008247375488, "global_step": 123490, "epoch": 2940} {"train_loss": -6.584997653961182, "global_step": 123491, "epoch": 2940} {"train_loss": -6.515879154205322, "global_step": 123492, "epoch": 2940} {"train_loss": -6.583403587341309, "global_step": 123493, "epoch": 2940} {"train_loss": -6.446404457092285, "global_step": 123494, "epoch": 2940} {"train_loss": -6.439910888671875, "global_step": 123495, "epoch": 2940} {"train_loss": -6.50948429107666, "global_step": 123496, "epoch": 2940} {"train_loss": -6.517416000366211, "global_step": 123497, "epoch": 2940} {"train_loss": -6.280953884124756, "global_step": 123498, "epoch": 2940} {"train_loss": -6.5833001136779785, "global_step": 123499, "epoch": 2940} {"train_loss": -6.490939140319824, "global_step": 123500, "epoch": 2940} {"train_loss": -6.478137969970703, "global_step": 123501, "epoch": 2940} {"train_loss": -6.528887748718262, "global_step": 123502, "epoch": 2940} {"train_loss": -6.339712619781494, "global_step": 123503, "epoch": 2940} {"train_loss": -6.569760322570801, "global_step": 123504, "epoch": 2940} {"train_loss": -6.4276838302612305, "global_step": 123505, "epoch": 2940} {"train_loss": -6.471532821655273, "global_step": 123506, "epoch": 2940} {"train_loss": -6.45142936706543, "global_step": 123507, "epoch": 2940} {"train_loss": -6.486187934875488, "global_step": 123508, "epoch": 2940} {"train_loss": -6.451010227203369, "global_step": 123509, "epoch": 2940} {"train_loss": -6.477984428405762, "global_step": 123510, "epoch": 2940} {"train_loss": -6.548789978027344, "global_step": 123511, "epoch": 2940} {"train_loss": -6.468042373657227, "global_step": 123512, "epoch": 2940} {"train_loss": -6.505193710327148, "global_step": 123513, "epoch": 2940} {"train_loss": -6.547092437744141, "global_step": 123514, "epoch": 2940} {"train_loss": -6.450198173522949, "global_step": 123515, "epoch": 2940} {"train_loss": -6.439279079437256, "global_step": 123516, "epoch": 2940} {"train_loss": -6.504822731018066, "global_step": 123517, "epoch": 2940} {"train_loss": -6.42439079284668, "global_step": 123518, "epoch": 2940} {"train_loss": -6.419693470001221, "global_step": 123519, "epoch": 2940} {"train_loss": -6.61570930480957, "global_step": 123520, "epoch": 2940} {"train_loss": -6.52104157493228, "global_step": 123521, "epoch": 2940, "val_loss": 65874.984375} {"train_loss": -6.5072736740112305, "global_step": 123522, "epoch": 2941} {"train_loss": -6.609051704406738, "global_step": 123523, "epoch": 2941} {"train_loss": -6.564333438873291, "global_step": 123524, "epoch": 2941} {"train_loss": -6.477507591247559, "global_step": 123525, "epoch": 2941} {"train_loss": -6.660709381103516, "global_step": 123526, "epoch": 2941} {"train_loss": -6.50211238861084, "global_step": 123527, "epoch": 2941} {"train_loss": -6.649778366088867, "global_step": 123528, "epoch": 2941} {"train_loss": -6.604475021362305, "global_step": 123529, "epoch": 2941} {"train_loss": -6.627441883087158, "global_step": 123530, "epoch": 2941} {"train_loss": -6.680030822753906, "global_step": 123531, "epoch": 2941} {"train_loss": -6.543850898742676, "global_step": 123532, "epoch": 2941} {"train_loss": -6.676216125488281, "global_step": 123533, "epoch": 2941} {"train_loss": -6.615398406982422, "global_step": 123534, "epoch": 2941} {"train_loss": -6.490826606750488, "global_step": 123535, "epoch": 2941} {"train_loss": -6.579224586486816, "global_step": 123536, "epoch": 2941} {"train_loss": -6.565128326416016, "global_step": 123537, "epoch": 2941} {"train_loss": -6.631147384643555, "global_step": 123538, "epoch": 2941} {"train_loss": -6.619747638702393, "global_step": 123539, "epoch": 2941} {"train_loss": -6.7791428565979, "global_step": 123540, "epoch": 2941} {"train_loss": -6.50337028503418, "global_step": 123541, "epoch": 2941} {"train_loss": -6.613430023193359, "global_step": 123542, "epoch": 2941} {"train_loss": -6.743252277374268, "global_step": 123543, "epoch": 2941} {"train_loss": -6.679635047912598, "global_step": 123544, "epoch": 2941} {"train_loss": -6.519688129425049, "global_step": 123545, "epoch": 2941} {"train_loss": -6.604647636413574, "global_step": 123546, "epoch": 2941} {"train_loss": -6.613520622253418, "global_step": 123547, "epoch": 2941} {"train_loss": -6.541942596435547, "global_step": 123548, "epoch": 2941} {"train_loss": -6.568229675292969, "global_step": 123549, "epoch": 2941} {"train_loss": -6.522402763366699, "global_step": 123550, "epoch": 2941} {"train_loss": -6.6006364822387695, "global_step": 123551, "epoch": 2941} {"train_loss": -6.578880310058594, "global_step": 123552, "epoch": 2941} {"train_loss": -6.59037446975708, "global_step": 123553, "epoch": 2941} {"train_loss": -6.7824506759643555, "global_step": 123554, "epoch": 2941} {"train_loss": -6.627674102783203, "global_step": 123555, "epoch": 2941} {"train_loss": -6.699587345123291, "global_step": 123556, "epoch": 2941} {"train_loss": -6.601211071014404, "global_step": 123557, "epoch": 2941} {"train_loss": -6.683093070983887, "global_step": 123558, "epoch": 2941} {"train_loss": -6.642098903656006, "global_step": 123559, "epoch": 2941} {"train_loss": -6.605134010314941, "global_step": 123560, "epoch": 2941} {"train_loss": -6.728351593017578, "global_step": 123561, "epoch": 2941} {"train_loss": -6.5121750831604, "global_step": 123562, "epoch": 2941} {"train_loss": -6.60737403233846, "global_step": 123563, "epoch": 2941, "val_loss": 66137.3671875} {"train_loss": -6.589901924133301, "global_step": 123564, "epoch": 2942} {"train_loss": -6.621927738189697, "global_step": 123565, "epoch": 2942} {"train_loss": -6.526401519775391, "global_step": 123566, "epoch": 2942} {"train_loss": -6.634410858154297, "global_step": 123567, "epoch": 2942} {"train_loss": -6.605888843536377, "global_step": 123568, "epoch": 2942} {"train_loss": -6.6152567863464355, "global_step": 123569, "epoch": 2942} {"train_loss": -6.620632171630859, "global_step": 123570, "epoch": 2942} {"train_loss": -6.584449291229248, "global_step": 123571, "epoch": 2942} {"train_loss": -6.638436794281006, "global_step": 123572, "epoch": 2942} {"train_loss": -6.612174987792969, "global_step": 123573, "epoch": 2942} {"train_loss": -6.584440231323242, "global_step": 123574, "epoch": 2942} {"train_loss": -6.552445411682129, "global_step": 123575, "epoch": 2942} {"train_loss": -6.513202667236328, "global_step": 123576, "epoch": 2942} {"train_loss": -6.580780029296875, "global_step": 123577, "epoch": 2942} {"train_loss": -6.38430118560791, "global_step": 123578, "epoch": 2942} {"train_loss": -6.530369281768799, "global_step": 123579, "epoch": 2942} {"train_loss": -6.526445388793945, "global_step": 123580, "epoch": 2942} {"train_loss": -6.658050537109375, "global_step": 123581, "epoch": 2942} {"train_loss": -6.630232810974121, "global_step": 123582, "epoch": 2942} {"train_loss": -6.545794486999512, "global_step": 123583, "epoch": 2942} {"train_loss": -6.678760528564453, "global_step": 123584, "epoch": 2942} {"train_loss": -6.570104598999023, "global_step": 123585, "epoch": 2942} {"train_loss": -6.597657203674316, "global_step": 123586, "epoch": 2942} {"train_loss": -6.62604284286499, "global_step": 123587, "epoch": 2942} {"train_loss": -6.6733808517456055, "global_step": 123588, "epoch": 2942} {"train_loss": -6.647909164428711, "global_step": 123589, "epoch": 2942} {"train_loss": -6.592761516571045, "global_step": 123590, "epoch": 2942} {"train_loss": -6.677845478057861, "global_step": 123591, "epoch": 2942} {"train_loss": -6.669493675231934, "global_step": 123592, "epoch": 2942} {"train_loss": -6.572531700134277, "global_step": 123593, "epoch": 2942} {"train_loss": -6.550021648406982, "global_step": 123594, "epoch": 2942} {"train_loss": -6.725701332092285, "global_step": 123595, "epoch": 2942} {"train_loss": -6.613946914672852, "global_step": 123596, "epoch": 2942} {"train_loss": -6.689763069152832, "global_step": 123597, "epoch": 2942} {"train_loss": -6.479710578918457, "global_step": 123598, "epoch": 2942} {"train_loss": -6.588104248046875, "global_step": 123599, "epoch": 2942} {"train_loss": -6.688065528869629, "global_step": 123600, "epoch": 2942} {"train_loss": -6.630070209503174, "global_step": 123601, "epoch": 2942} {"train_loss": -6.642374038696289, "global_step": 123602, "epoch": 2942} {"train_loss": -6.593132019042969, "global_step": 123603, "epoch": 2942} {"train_loss": -6.685605049133301, "global_step": 123604, "epoch": 2942} {"train_loss": -6.606531438373384, "global_step": 123605, "epoch": 2942, "val_loss": 65955.9375} {"train_loss": -6.639169216156006, "global_step": 123606, "epoch": 2943} {"train_loss": -6.707455635070801, "global_step": 123607, "epoch": 2943} {"train_loss": -6.763690948486328, "global_step": 123608, "epoch": 2943} {"train_loss": -6.6886701583862305, "global_step": 123609, "epoch": 2943} {"train_loss": -6.649413108825684, "global_step": 123610, "epoch": 2943} {"train_loss": -6.777074813842773, "global_step": 123611, "epoch": 2943} {"train_loss": -6.5938591957092285, "global_step": 123612, "epoch": 2943} {"train_loss": -6.546055316925049, "global_step": 123613, "epoch": 2943} {"train_loss": -6.760925769805908, "global_step": 123614, "epoch": 2943} {"train_loss": -6.73311710357666, "global_step": 123615, "epoch": 2943} {"train_loss": -6.551951885223389, "global_step": 123616, "epoch": 2943} {"train_loss": -6.495187759399414, "global_step": 123617, "epoch": 2943} {"train_loss": -6.684473514556885, "global_step": 123618, "epoch": 2943} {"train_loss": -6.498905181884766, "global_step": 123619, "epoch": 2943} {"train_loss": -6.590244293212891, "global_step": 123620, "epoch": 2943} {"train_loss": -6.7187886238098145, "global_step": 123621, "epoch": 2943} {"train_loss": -6.639523983001709, "global_step": 123622, "epoch": 2943} {"train_loss": -6.578545093536377, "global_step": 123623, "epoch": 2943} {"train_loss": -6.576422691345215, "global_step": 123624, "epoch": 2943} {"train_loss": -6.477689743041992, "global_step": 123625, "epoch": 2943} {"train_loss": -6.553420543670654, "global_step": 123626, "epoch": 2943} {"train_loss": -6.712498188018799, "global_step": 123627, "epoch": 2943} {"train_loss": -6.575952529907227, "global_step": 123628, "epoch": 2943} {"train_loss": -6.545461177825928, "global_step": 123629, "epoch": 2943} {"train_loss": -6.630706310272217, "global_step": 123630, "epoch": 2943} {"train_loss": -6.486194133758545, "global_step": 123631, "epoch": 2943} {"train_loss": -6.673697471618652, "global_step": 123632, "epoch": 2943} {"train_loss": -6.5225324630737305, "global_step": 123633, "epoch": 2943} {"train_loss": -6.511592388153076, "global_step": 123634, "epoch": 2943} {"train_loss": -6.596214294433594, "global_step": 123635, "epoch": 2943} {"train_loss": -6.569815635681152, "global_step": 123636, "epoch": 2943} {"train_loss": -6.50871467590332, "global_step": 123637, "epoch": 2943} {"train_loss": -6.598254203796387, "global_step": 123638, "epoch": 2943} {"train_loss": -6.55387020111084, "global_step": 123639, "epoch": 2943} {"train_loss": -6.612351417541504, "global_step": 123640, "epoch": 2943} {"train_loss": -6.52729606628418, "global_step": 123641, "epoch": 2943} {"train_loss": -6.458897590637207, "global_step": 123642, "epoch": 2943} {"train_loss": -6.558509349822998, "global_step": 123643, "epoch": 2943} {"train_loss": -6.583714485168457, "global_step": 123644, "epoch": 2943} {"train_loss": -6.652666091918945, "global_step": 123645, "epoch": 2943} {"train_loss": -6.620820045471191, "global_step": 123646, "epoch": 2943} {"train_loss": -6.599397057578678, "global_step": 123647, "epoch": 2943, "val_loss": 66143.2734375} {"train_loss": -6.5097174644470215, "global_step": 123648, "epoch": 2944} {"train_loss": -6.546789646148682, "global_step": 123649, "epoch": 2944} {"train_loss": -6.554141044616699, "global_step": 123650, "epoch": 2944} {"train_loss": -6.604465484619141, "global_step": 123651, "epoch": 2944} {"train_loss": -6.701030731201172, "global_step": 123652, "epoch": 2944} {"train_loss": -6.460362434387207, "global_step": 123653, "epoch": 2944} {"train_loss": -6.596798419952393, "global_step": 123654, "epoch": 2944} {"train_loss": -6.612313270568848, "global_step": 123655, "epoch": 2944} {"train_loss": -6.494930744171143, "global_step": 123656, "epoch": 2944} {"train_loss": -6.562221527099609, "global_step": 123657, "epoch": 2944} {"train_loss": -6.498520374298096, "global_step": 123658, "epoch": 2944} {"train_loss": -6.517299652099609, "global_step": 123659, "epoch": 2944} {"train_loss": -6.552755355834961, "global_step": 123660, "epoch": 2944} {"train_loss": -6.541069030761719, "global_step": 123661, "epoch": 2944} {"train_loss": -6.617180347442627, "global_step": 123662, "epoch": 2944} {"train_loss": -6.580029487609863, "global_step": 123663, "epoch": 2944} {"train_loss": -6.559289932250977, "global_step": 123664, "epoch": 2944} {"train_loss": -6.668423652648926, "global_step": 123665, "epoch": 2944} {"train_loss": -6.6818389892578125, "global_step": 123666, "epoch": 2944} {"train_loss": -6.594213485717773, "global_step": 123667, "epoch": 2944} {"train_loss": -6.660338401794434, "global_step": 123668, "epoch": 2944} {"train_loss": -6.57387638092041, "global_step": 123669, "epoch": 2944} {"train_loss": -6.666645526885986, "global_step": 123670, "epoch": 2944} {"train_loss": -6.737946033477783, "global_step": 123671, "epoch": 2944} {"train_loss": -6.690364837646484, "global_step": 123672, "epoch": 2944} {"train_loss": -6.513747215270996, "global_step": 123673, "epoch": 2944} {"train_loss": -6.580384254455566, "global_step": 123674, "epoch": 2944} {"train_loss": -6.623322486877441, "global_step": 123675, "epoch": 2944} {"train_loss": -6.613519668579102, "global_step": 123676, "epoch": 2944} {"train_loss": -6.5348005294799805, "global_step": 123677, "epoch": 2944} {"train_loss": -6.563844680786133, "global_step": 123678, "epoch": 2944} {"train_loss": -6.701958179473877, "global_step": 123679, "epoch": 2944} {"train_loss": -6.6555399894714355, "global_step": 123680, "epoch": 2944} {"train_loss": -6.511818885803223, "global_step": 123681, "epoch": 2944} {"train_loss": -6.632509708404541, "global_step": 123682, "epoch": 2944} {"train_loss": -6.66413688659668, "global_step": 123683, "epoch": 2944} {"train_loss": -6.5530548095703125, "global_step": 123684, "epoch": 2944} {"train_loss": -6.684648036956787, "global_step": 123685, "epoch": 2944} {"train_loss": -6.682567596435547, "global_step": 123686, "epoch": 2944} {"train_loss": -6.665494918823242, "global_step": 123687, "epoch": 2944} {"train_loss": -6.492001533508301, "global_step": 123688, "epoch": 2944} {"train_loss": -6.599338395254953, "global_step": 123689, "epoch": 2944, "val_loss": 66098.6171875} {"train_loss": -6.551823139190674, "global_step": 123690, "epoch": 2945} {"train_loss": -6.642766952514648, "global_step": 123691, "epoch": 2945} {"train_loss": -6.711158752441406, "global_step": 123692, "epoch": 2945} {"train_loss": -6.411754608154297, "global_step": 123693, "epoch": 2945} {"train_loss": -6.490114212036133, "global_step": 123694, "epoch": 2945} {"train_loss": -6.513490676879883, "global_step": 123695, "epoch": 2945} {"train_loss": -6.443265914916992, "global_step": 123696, "epoch": 2945} {"train_loss": -6.574783802032471, "global_step": 123697, "epoch": 2945} {"train_loss": -6.582176685333252, "global_step": 123698, "epoch": 2945} {"train_loss": -6.583151817321777, "global_step": 123699, "epoch": 2945} {"train_loss": -6.624456405639648, "global_step": 123700, "epoch": 2945} {"train_loss": -6.5927734375, "global_step": 123701, "epoch": 2945} {"train_loss": -6.567887306213379, "global_step": 123702, "epoch": 2945} {"train_loss": -6.677700996398926, "global_step": 123703, "epoch": 2945} {"train_loss": -6.518967628479004, "global_step": 123704, "epoch": 2945} {"train_loss": -6.579164505004883, "global_step": 123705, "epoch": 2945} {"train_loss": -6.618351936340332, "global_step": 123706, "epoch": 2945} {"train_loss": -6.555455207824707, "global_step": 123707, "epoch": 2945} {"train_loss": -6.6602325439453125, "global_step": 123708, "epoch": 2945} {"train_loss": -6.467913627624512, "global_step": 123709, "epoch": 2945} {"train_loss": -6.646027565002441, "global_step": 123710, "epoch": 2945} {"train_loss": -6.607083320617676, "global_step": 123711, "epoch": 2945} {"train_loss": -6.640347480773926, "global_step": 123712, "epoch": 2945} {"train_loss": -6.685309410095215, "global_step": 123713, "epoch": 2945} {"train_loss": -6.7511396408081055, "global_step": 123714, "epoch": 2945} {"train_loss": -6.541459083557129, "global_step": 123715, "epoch": 2945} {"train_loss": -6.530477523803711, "global_step": 123716, "epoch": 2945} {"train_loss": -6.7024078369140625, "global_step": 123717, "epoch": 2945} {"train_loss": -6.6313934326171875, "global_step": 123718, "epoch": 2945} {"train_loss": -6.689317226409912, "global_step": 123719, "epoch": 2945} {"train_loss": -6.626821517944336, "global_step": 123720, "epoch": 2945} {"train_loss": -6.618192672729492, "global_step": 123721, "epoch": 2945} {"train_loss": -6.671777725219727, "global_step": 123722, "epoch": 2945} {"train_loss": -6.599515914916992, "global_step": 123723, "epoch": 2945} {"train_loss": -6.632845878601074, "global_step": 123724, "epoch": 2945} {"train_loss": -6.6396965980529785, "global_step": 123725, "epoch": 2945} {"train_loss": -6.5313520431518555, "global_step": 123726, "epoch": 2945} {"train_loss": -6.668335914611816, "global_step": 123727, "epoch": 2945} {"train_loss": -6.544610023498535, "global_step": 123728, "epoch": 2945} {"train_loss": -6.471316337585449, "global_step": 123729, "epoch": 2945} {"train_loss": -6.559328556060791, "global_step": 123730, "epoch": 2945} {"train_loss": -6.590959605716524, "global_step": 123731, "epoch": 2945, "val_loss": 66163.5} {"train_loss": -6.597090244293213, "global_step": 123732, "epoch": 2946} {"train_loss": -6.501875400543213, "global_step": 123733, "epoch": 2946} {"train_loss": -6.747219085693359, "global_step": 123734, "epoch": 2946} {"train_loss": -6.601809024810791, "global_step": 123735, "epoch": 2946} {"train_loss": -6.598060607910156, "global_step": 123736, "epoch": 2946} {"train_loss": -6.598146438598633, "global_step": 123737, "epoch": 2946} {"train_loss": -6.563917636871338, "global_step": 123738, "epoch": 2946} {"train_loss": -6.51765775680542, "global_step": 123739, "epoch": 2946} {"train_loss": -6.58613920211792, "global_step": 123740, "epoch": 2946} {"train_loss": -6.553565979003906, "global_step": 123741, "epoch": 2946} {"train_loss": -6.5787458419799805, "global_step": 123742, "epoch": 2946} {"train_loss": -6.540895938873291, "global_step": 123743, "epoch": 2946} {"train_loss": -6.54267692565918, "global_step": 123744, "epoch": 2946} {"train_loss": -6.53807258605957, "global_step": 123745, "epoch": 2946} {"train_loss": -6.648161888122559, "global_step": 123746, "epoch": 2946} {"train_loss": -6.755539894104004, "global_step": 123747, "epoch": 2946} {"train_loss": -6.534271240234375, "global_step": 123748, "epoch": 2946} {"train_loss": -6.773571968078613, "global_step": 123749, "epoch": 2946} {"train_loss": -6.576535701751709, "global_step": 123750, "epoch": 2946} {"train_loss": -6.538220405578613, "global_step": 123751, "epoch": 2946} {"train_loss": -6.664319038391113, "global_step": 123752, "epoch": 2946} {"train_loss": -6.639484882354736, "global_step": 123753, "epoch": 2946} {"train_loss": -6.605842590332031, "global_step": 123754, "epoch": 2946} {"train_loss": -6.731743812561035, "global_step": 123755, "epoch": 2946} {"train_loss": -6.646972179412842, "global_step": 123756, "epoch": 2946} {"train_loss": -6.663753032684326, "global_step": 123757, "epoch": 2946} {"train_loss": -6.534289360046387, "global_step": 123758, "epoch": 2946} {"train_loss": -6.634284496307373, "global_step": 123759, "epoch": 2946} {"train_loss": -6.752440929412842, "global_step": 123760, "epoch": 2946} {"train_loss": -6.610717296600342, "global_step": 123761, "epoch": 2946} {"train_loss": -6.549638748168945, "global_step": 123762, "epoch": 2946} {"train_loss": -6.611328125, "global_step": 123763, "epoch": 2946} {"train_loss": -6.621463775634766, "global_step": 123764, "epoch": 2946} {"train_loss": -6.561234474182129, "global_step": 123765, "epoch": 2946} {"train_loss": -6.466742038726807, "global_step": 123766, "epoch": 2946} {"train_loss": -6.459212303161621, "global_step": 123767, "epoch": 2946} {"train_loss": -6.466179370880127, "global_step": 123768, "epoch": 2946} {"train_loss": -6.312063217163086, "global_step": 123769, "epoch": 2946} {"train_loss": -6.611862659454346, "global_step": 123770, "epoch": 2946} {"train_loss": -6.526463508605957, "global_step": 123771, "epoch": 2946} {"train_loss": -6.4752726554870605, "global_step": 123772, "epoch": 2946} {"train_loss": -6.582105000813802, "global_step": 123773, "epoch": 2946, "val_loss": 65915.7109375} {"train_loss": -6.540332317352295, "global_step": 123774, "epoch": 2947} {"train_loss": -6.613029479980469, "global_step": 123775, "epoch": 2947} {"train_loss": -6.650113582611084, "global_step": 123776, "epoch": 2947} {"train_loss": -6.4736104011535645, "global_step": 123777, "epoch": 2947} {"train_loss": -6.523473739624023, "global_step": 123778, "epoch": 2947} {"train_loss": -6.601722717285156, "global_step": 123779, "epoch": 2947} {"train_loss": -6.600327014923096, "global_step": 123780, "epoch": 2947} {"train_loss": -6.649748802185059, "global_step": 123781, "epoch": 2947} {"train_loss": -6.6256866455078125, "global_step": 123782, "epoch": 2947} {"train_loss": -6.604198455810547, "global_step": 123783, "epoch": 2947} {"train_loss": -6.498925685882568, "global_step": 123784, "epoch": 2947} {"train_loss": -6.63722038269043, "global_step": 123785, "epoch": 2947} {"train_loss": -6.528372287750244, "global_step": 123786, "epoch": 2947} {"train_loss": -6.591327667236328, "global_step": 123787, "epoch": 2947} {"train_loss": -6.555170059204102, "global_step": 123788, "epoch": 2947} {"train_loss": -6.713789939880371, "global_step": 123789, "epoch": 2947} {"train_loss": -6.603713512420654, "global_step": 123790, "epoch": 2947} {"train_loss": -6.608097076416016, "global_step": 123791, "epoch": 2947} {"train_loss": -6.566064357757568, "global_step": 123792, "epoch": 2947} {"train_loss": -6.64666748046875, "global_step": 123793, "epoch": 2947} {"train_loss": -6.669009685516357, "global_step": 123794, "epoch": 2947} {"train_loss": -6.526108741760254, "global_step": 123795, "epoch": 2947} {"train_loss": -6.5316009521484375, "global_step": 123796, "epoch": 2947} {"train_loss": -6.6108503341674805, "global_step": 123797, "epoch": 2947} {"train_loss": -6.500912189483643, "global_step": 123798, "epoch": 2947} {"train_loss": -6.496641159057617, "global_step": 123799, "epoch": 2947} {"train_loss": -6.6203413009643555, "global_step": 123800, "epoch": 2947} {"train_loss": -6.441524505615234, "global_step": 123801, "epoch": 2947} {"train_loss": -6.456606864929199, "global_step": 123802, "epoch": 2947} {"train_loss": -6.456691265106201, "global_step": 123803, "epoch": 2947} {"train_loss": -6.475636959075928, "global_step": 123804, "epoch": 2947} {"train_loss": -6.402857780456543, "global_step": 123805, "epoch": 2947} {"train_loss": -6.516304969787598, "global_step": 123806, "epoch": 2947} {"train_loss": -6.477399826049805, "global_step": 123807, "epoch": 2947} {"train_loss": -6.440851211547852, "global_step": 123808, "epoch": 2947} {"train_loss": -6.440946578979492, "global_step": 123809, "epoch": 2947} {"train_loss": -6.454371452331543, "global_step": 123810, "epoch": 2947} {"train_loss": -6.545510768890381, "global_step": 123811, "epoch": 2947} {"train_loss": -6.477715015411377, "global_step": 123812, "epoch": 2947} {"train_loss": -6.503072738647461, "global_step": 123813, "epoch": 2947} {"train_loss": -6.484859466552734, "global_step": 123814, "epoch": 2947} {"train_loss": -6.544558911096482, "global_step": 123815, "epoch": 2947, "val_loss": 65815.125} {"train_loss": -6.518118381500244, "global_step": 123816, "epoch": 2948} {"train_loss": -6.492772579193115, "global_step": 123817, "epoch": 2948} {"train_loss": -6.398231506347656, "global_step": 123818, "epoch": 2948} {"train_loss": -6.648521423339844, "global_step": 123819, "epoch": 2948} {"train_loss": -6.519996643066406, "global_step": 123820, "epoch": 2948} {"train_loss": -6.520798683166504, "global_step": 123821, "epoch": 2948} {"train_loss": -6.484885215759277, "global_step": 123822, "epoch": 2948} {"train_loss": -6.490145683288574, "global_step": 123823, "epoch": 2948} {"train_loss": -6.540372848510742, "global_step": 123824, "epoch": 2948} {"train_loss": -6.540263652801514, "global_step": 123825, "epoch": 2948} {"train_loss": -6.627048015594482, "global_step": 123826, "epoch": 2948} {"train_loss": -6.580267429351807, "global_step": 123827, "epoch": 2948} {"train_loss": -6.6298441886901855, "global_step": 123828, "epoch": 2948} {"train_loss": -6.544745445251465, "global_step": 123829, "epoch": 2948} {"train_loss": -6.511455535888672, "global_step": 123830, "epoch": 2948} {"train_loss": -6.503525733947754, "global_step": 123831, "epoch": 2948} {"train_loss": -6.593526840209961, "global_step": 123832, "epoch": 2948} {"train_loss": -6.625548839569092, "global_step": 123833, "epoch": 2948} {"train_loss": -6.524299621582031, "global_step": 123834, "epoch": 2948} {"train_loss": -6.473021507263184, "global_step": 123835, "epoch": 2948} {"train_loss": -6.5414533615112305, "global_step": 123836, "epoch": 2948} {"train_loss": -6.568938255310059, "global_step": 123837, "epoch": 2948} {"train_loss": -6.659320831298828, "global_step": 123838, "epoch": 2948} {"train_loss": -6.5475969314575195, "global_step": 123839, "epoch": 2948} {"train_loss": -6.497732162475586, "global_step": 123840, "epoch": 2948} {"train_loss": -6.5548095703125, "global_step": 123841, "epoch": 2948} {"train_loss": -6.51093864440918, "global_step": 123842, "epoch": 2948} {"train_loss": -6.58799934387207, "global_step": 123843, "epoch": 2948} {"train_loss": -6.564209461212158, "global_step": 123844, "epoch": 2948} {"train_loss": -6.573285102844238, "global_step": 123845, "epoch": 2948} {"train_loss": -6.588357448577881, "global_step": 123846, "epoch": 2948} {"train_loss": -6.6811065673828125, "global_step": 123847, "epoch": 2948} {"train_loss": -6.423151016235352, "global_step": 123848, "epoch": 2948} {"train_loss": -6.666866302490234, "global_step": 123849, "epoch": 2948} {"train_loss": -6.579229354858398, "global_step": 123850, "epoch": 2948} {"train_loss": -6.583295822143555, "global_step": 123851, "epoch": 2948} {"train_loss": -6.552268028259277, "global_step": 123852, "epoch": 2948} {"train_loss": -6.565756797790527, "global_step": 123853, "epoch": 2948} {"train_loss": -6.464338302612305, "global_step": 123854, "epoch": 2948} {"train_loss": -6.647398471832275, "global_step": 123855, "epoch": 2948} {"train_loss": -6.590539932250977, "global_step": 123856, "epoch": 2948} {"train_loss": -6.555902481079102, "global_step": 123857, "epoch": 2948, "val_loss": 66053.421875} {"train_loss": -6.588354110717773, "global_step": 123858, "epoch": 2949} {"train_loss": -6.653128623962402, "global_step": 123859, "epoch": 2949} {"train_loss": -6.603328704833984, "global_step": 123860, "epoch": 2949} {"train_loss": -6.590512275695801, "global_step": 123861, "epoch": 2949} {"train_loss": -6.6328020095825195, "global_step": 123862, "epoch": 2949} {"train_loss": -6.468294620513916, "global_step": 123863, "epoch": 2949} {"train_loss": -6.555865287780762, "global_step": 123864, "epoch": 2949} {"train_loss": -6.660444259643555, "global_step": 123865, "epoch": 2949} {"train_loss": -6.627034664154053, "global_step": 123866, "epoch": 2949} {"train_loss": -6.656306266784668, "global_step": 123867, "epoch": 2949} {"train_loss": -6.669135093688965, "global_step": 123868, "epoch": 2949} {"train_loss": -6.653916835784912, "global_step": 123869, "epoch": 2949} {"train_loss": -6.675980091094971, "global_step": 123870, "epoch": 2949} {"train_loss": -6.6001362800598145, "global_step": 123871, "epoch": 2949} {"train_loss": -6.583622932434082, "global_step": 123872, "epoch": 2949} {"train_loss": -6.60213565826416, "global_step": 123873, "epoch": 2949} {"train_loss": -6.630585670471191, "global_step": 123874, "epoch": 2949} {"train_loss": -6.650916576385498, "global_step": 123875, "epoch": 2949} {"train_loss": -6.582608222961426, "global_step": 123876, "epoch": 2949} {"train_loss": -6.6518874168396, "global_step": 123877, "epoch": 2949} {"train_loss": -6.460781574249268, "global_step": 123878, "epoch": 2949} {"train_loss": -6.5545854568481445, "global_step": 123879, "epoch": 2949} {"train_loss": -6.618367671966553, "global_step": 123880, "epoch": 2949} {"train_loss": -6.531176567077637, "global_step": 123881, "epoch": 2949} {"train_loss": -6.598872184753418, "global_step": 123882, "epoch": 2949} {"train_loss": -6.6287946701049805, "global_step": 123883, "epoch": 2949} {"train_loss": -6.579713821411133, "global_step": 123884, "epoch": 2949} {"train_loss": -6.673036098480225, "global_step": 123885, "epoch": 2949} {"train_loss": -6.589878082275391, "global_step": 123886, "epoch": 2949} {"train_loss": -6.585630893707275, "global_step": 123887, "epoch": 2949} {"train_loss": -6.640320777893066, "global_step": 123888, "epoch": 2949} {"train_loss": -6.594758987426758, "global_step": 123889, "epoch": 2949} {"train_loss": -6.642906188964844, "global_step": 123890, "epoch": 2949} {"train_loss": -6.737559795379639, "global_step": 123891, "epoch": 2949} {"train_loss": -6.677146911621094, "global_step": 123892, "epoch": 2949} {"train_loss": -6.6189703941345215, "global_step": 123893, "epoch": 2949} {"train_loss": -6.625200271606445, "global_step": 123894, "epoch": 2949} {"train_loss": -6.59827995300293, "global_step": 123895, "epoch": 2949} {"train_loss": -6.694070816040039, "global_step": 123896, "epoch": 2949} {"train_loss": -6.547484397888184, "global_step": 123897, "epoch": 2949} {"train_loss": -6.488138675689697, "global_step": 123898, "epoch": 2949} {"train_loss": -6.610565912155878, "global_step": 123899, "epoch": 2949, "val_loss": 65931.53125} {"train_loss": -6.595061302185059, "global_step": 123900, "epoch": 2950} {"train_loss": -6.655848503112793, "global_step": 123901, "epoch": 2950} {"train_loss": -6.508561611175537, "global_step": 123902, "epoch": 2950} {"train_loss": -6.623995304107666, "global_step": 123903, "epoch": 2950} {"train_loss": -6.631078243255615, "global_step": 123904, "epoch": 2950} {"train_loss": -6.587039947509766, "global_step": 123905, "epoch": 2950} {"train_loss": -6.6286540031433105, "global_step": 123906, "epoch": 2950} {"train_loss": -6.581643104553223, "global_step": 123907, "epoch": 2950} {"train_loss": -6.6530609130859375, "global_step": 123908, "epoch": 2950} {"train_loss": -6.641380310058594, "global_step": 123909, "epoch": 2950} {"train_loss": -6.667168617248535, "global_step": 123910, "epoch": 2950} {"train_loss": -6.580964088439941, "global_step": 123911, "epoch": 2950} {"train_loss": -6.663217544555664, "global_step": 123912, "epoch": 2950} {"train_loss": -6.676042556762695, "global_step": 123913, "epoch": 2950} {"train_loss": -6.629367828369141, "global_step": 123914, "epoch": 2950} {"train_loss": -6.721475601196289, "global_step": 123915, "epoch": 2950} {"train_loss": -6.61524772644043, "global_step": 123916, "epoch": 2950} {"train_loss": -6.656355857849121, "global_step": 123917, "epoch": 2950} {"train_loss": -6.619701385498047, "global_step": 123918, "epoch": 2950} {"train_loss": -6.634828567504883, "global_step": 123919, "epoch": 2950} {"train_loss": -6.710914134979248, "global_step": 123920, "epoch": 2950} {"train_loss": -6.615645408630371, "global_step": 123921, "epoch": 2950} {"train_loss": -6.670844554901123, "global_step": 123922, "epoch": 2950} {"train_loss": -6.616188049316406, "global_step": 123923, "epoch": 2950} {"train_loss": -6.570095539093018, "global_step": 123924, "epoch": 2950} {"train_loss": -6.563103199005127, "global_step": 123925, "epoch": 2950} {"train_loss": -6.623769283294678, "global_step": 123926, "epoch": 2950} {"train_loss": -6.60081672668457, "global_step": 123927, "epoch": 2950} {"train_loss": -6.548310279846191, "global_step": 123928, "epoch": 2950} {"train_loss": -6.695596694946289, "global_step": 123929, "epoch": 2950} {"train_loss": -6.619093418121338, "global_step": 123930, "epoch": 2950} {"train_loss": -6.689310550689697, "global_step": 123931, "epoch": 2950} {"train_loss": -6.5662946701049805, "global_step": 123932, "epoch": 2950} {"train_loss": -6.737959384918213, "global_step": 123933, "epoch": 2950} {"train_loss": -6.580373764038086, "global_step": 123934, "epoch": 2950} {"train_loss": -6.598930358886719, "global_step": 123935, "epoch": 2950} {"train_loss": -6.768083572387695, "global_step": 123936, "epoch": 2950} {"train_loss": -6.692811489105225, "global_step": 123937, "epoch": 2950} {"train_loss": -6.573426246643066, "global_step": 123938, "epoch": 2950} {"train_loss": -6.624512672424316, "global_step": 123939, "epoch": 2950} {"train_loss": -6.638957977294922, "global_step": 123940, "epoch": 2950} {"train_loss": -6.630738269715082, "global_step": 123941, "epoch": 2950, "train/sim_max_reward_0": 0.19295775586476566, "train/sim_max_reward_1": 0.9613710137185697, "train/sim_max_reward_2": 0.925418230647816, "train/sim_max_reward_3": 0.12805080295777024, "train/sim_max_reward_4": 0.8572339580230343, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.23237359467641136, "test/sim_max_reward_4300002": 0.9366274619294395, "test/sim_max_reward_4300003": 0.9169064649406549, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.31906396095190576, "test/sim_max_reward_4300008": 0.5387059538693294, "test/sim_max_reward_4300009": 0.8475954270827445, "test/sim_max_reward_4300010": 0.8895971145078129, "test/sim_max_reward_4300011": 0.9467348893389157, "test/sim_max_reward_4300012": 0.919091979696619, "test/sim_max_reward_4300013": 0.9153792573691694, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9752826750867177, "test/sim_max_reward_4300016": 0.05720085709483749, "test/sim_max_reward_4300017": 0.9553694911210512, "test/sim_max_reward_4300018": 0.5383221220549385, "test/sim_max_reward_4300019": 0.18607668168307737, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.3575040990491371, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.32767907136880337, "test/sim_max_reward_4300024": 0.536243831331901, "test/sim_max_reward_4300025": 0.95219179323036, "test/sim_max_reward_4300026": 0.8566239119936868, "test/sim_max_reward_4300027": 1.0, "test/sim_max_reward_4300028": 3.1320201334312693e-07, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.9976702109182309, "test/sim_max_reward_4300031": 0.24243174458827546, "test/sim_max_reward_4300032": 0.9307144083826331, "test/sim_max_reward_4300033": 0.7050382205478127, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.2440440902598978, "test/sim_max_reward_4300036": 0.22160305104632114, "test/sim_max_reward_4300037": 0.8956001787108723, "test/sim_max_reward_4300038": 0.987668202358066, "test/sim_max_reward_4300039": 0.808076862165582, "test/sim_max_reward_4300040": 0.9823153650751608, "test/sim_max_reward_4300041": 0.938331037903751, "test/sim_max_reward_4300042": 0.7104186617464104, "test/sim_max_reward_4300043": 0.1802345274553809, "test/sim_max_reward_4300044": 0.9877812800485067, "test/sim_max_reward_4300045": 0.18699584055062132, "test/sim_max_reward_4300046": 0.8669750628630531, "test/sim_max_reward_4300047": 1.0, "test/sim_max_reward_4300048": 0.9885104994160325, "test/sim_max_reward_4300049": 0.26721818767419614, "train/mean_score": 0.5430027534290238, "test/mean_score": 0.6072406497619923, "val_loss": 65875.265625} {"train_loss": -6.730792999267578, "global_step": 123942, "epoch": 2951} {"train_loss": -6.599758148193359, "global_step": 123943, "epoch": 2951} {"train_loss": -6.7493062019348145, "global_step": 123944, "epoch": 2951} {"train_loss": -6.702037811279297, "global_step": 123945, "epoch": 2951} {"train_loss": -6.633196830749512, "global_step": 123946, "epoch": 2951} {"train_loss": -6.602866172790527, "global_step": 123947, "epoch": 2951} {"train_loss": -6.615008354187012, "global_step": 123948, "epoch": 2951} {"train_loss": -6.64279842376709, "global_step": 123949, "epoch": 2951} {"train_loss": -6.758541107177734, "global_step": 123950, "epoch": 2951} {"train_loss": -6.599823951721191, "global_step": 123951, "epoch": 2951} {"train_loss": -6.696791648864746, "global_step": 123952, "epoch": 2951} {"train_loss": -6.619470596313477, "global_step": 123953, "epoch": 2951} {"train_loss": -6.667746543884277, "global_step": 123954, "epoch": 2951} {"train_loss": -6.688812732696533, "global_step": 123955, "epoch": 2951} {"train_loss": -6.765326976776123, "global_step": 123956, "epoch": 2951} {"train_loss": -6.617678165435791, "global_step": 123957, "epoch": 2951} {"train_loss": -6.583393573760986, "global_step": 123958, "epoch": 2951} {"train_loss": -6.699678421020508, "global_step": 123959, "epoch": 2951} {"train_loss": -6.632948875427246, "global_step": 123960, "epoch": 2951} {"train_loss": -6.575153350830078, "global_step": 123961, "epoch": 2951} {"train_loss": -6.777896881103516, "global_step": 123962, "epoch": 2951} {"train_loss": -6.567212104797363, "global_step": 123963, "epoch": 2951} {"train_loss": -6.684299468994141, "global_step": 123964, "epoch": 2951} {"train_loss": -6.681031227111816, "global_step": 123965, "epoch": 2951} {"train_loss": -6.660998344421387, "global_step": 123966, "epoch": 2951} {"train_loss": -6.6687774658203125, "global_step": 123967, "epoch": 2951} {"train_loss": -6.688530921936035, "global_step": 123968, "epoch": 2951} {"train_loss": -6.731741905212402, "global_step": 123969, "epoch": 2951} {"train_loss": -6.632783889770508, "global_step": 123970, "epoch": 2951} {"train_loss": -6.626805305480957, "global_step": 123971, "epoch": 2951} {"train_loss": -6.676596164703369, "global_step": 123972, "epoch": 2951} {"train_loss": -6.645726203918457, "global_step": 123973, "epoch": 2951} {"train_loss": -6.691377639770508, "global_step": 123974, "epoch": 2951} {"train_loss": -6.583829879760742, "global_step": 123975, "epoch": 2951} {"train_loss": -6.654300689697266, "global_step": 123976, "epoch": 2951} {"train_loss": -6.639081954956055, "global_step": 123977, "epoch": 2951} {"train_loss": -6.556140899658203, "global_step": 123978, "epoch": 2951} {"train_loss": -6.556293487548828, "global_step": 123979, "epoch": 2951} {"train_loss": -6.640803813934326, "global_step": 123980, "epoch": 2951} {"train_loss": -6.485509872436523, "global_step": 123981, "epoch": 2951} {"train_loss": -6.531597137451172, "global_step": 123982, "epoch": 2951} {"train_loss": -6.6484895433698386, "global_step": 123983, "epoch": 2951, "val_loss": 66019.1015625} {"train_loss": -6.662110328674316, "global_step": 123984, "epoch": 2952} {"train_loss": -6.59275484085083, "global_step": 123985, "epoch": 2952} {"train_loss": -6.68560791015625, "global_step": 123986, "epoch": 2952} {"train_loss": -6.6657257080078125, "global_step": 123987, "epoch": 2952} {"train_loss": -6.734681129455566, "global_step": 123988, "epoch": 2952} {"train_loss": -6.6227707862854, "global_step": 123989, "epoch": 2952} {"train_loss": -6.744535446166992, "global_step": 123990, "epoch": 2952} {"train_loss": -6.6552839279174805, "global_step": 123991, "epoch": 2952} {"train_loss": -6.606597900390625, "global_step": 123992, "epoch": 2952} {"train_loss": -6.606166362762451, "global_step": 123993, "epoch": 2952} {"train_loss": -6.719344139099121, "global_step": 123994, "epoch": 2952} {"train_loss": -6.655220031738281, "global_step": 123995, "epoch": 2952} {"train_loss": -6.566242694854736, "global_step": 123996, "epoch": 2952} {"train_loss": -6.53306770324707, "global_step": 123997, "epoch": 2952} {"train_loss": -6.616754055023193, "global_step": 123998, "epoch": 2952} {"train_loss": -6.597517013549805, "global_step": 123999, "epoch": 2952} {"train_loss": -6.480123519897461, "global_step": 124000, "epoch": 2952} {"train_loss": -6.58880090713501, "global_step": 124001, "epoch": 2952} {"train_loss": -6.596507549285889, "global_step": 124002, "epoch": 2952} {"train_loss": -6.517242431640625, "global_step": 124003, "epoch": 2952} {"train_loss": -6.637082099914551, "global_step": 124004, "epoch": 2952} {"train_loss": -6.69690465927124, "global_step": 124005, "epoch": 2952} {"train_loss": -6.741069316864014, "global_step": 124006, "epoch": 2952} {"train_loss": -6.781137466430664, "global_step": 124007, "epoch": 2952} {"train_loss": -6.718985557556152, "global_step": 124008, "epoch": 2952} {"train_loss": -6.700348854064941, "global_step": 124009, "epoch": 2952} {"train_loss": -6.589450836181641, "global_step": 124010, "epoch": 2952} {"train_loss": -6.660022735595703, "global_step": 124011, "epoch": 2952} {"train_loss": -6.6272687911987305, "global_step": 124012, "epoch": 2952} {"train_loss": -6.63809871673584, "global_step": 124013, "epoch": 2952} {"train_loss": -6.65221643447876, "global_step": 124014, "epoch": 2952} {"train_loss": -6.614773750305176, "global_step": 124015, "epoch": 2952} {"train_loss": -6.626408576965332, "global_step": 124016, "epoch": 2952} {"train_loss": -6.6192474365234375, "global_step": 124017, "epoch": 2952} {"train_loss": -6.502828598022461, "global_step": 124018, "epoch": 2952} {"train_loss": -6.647977828979492, "global_step": 124019, "epoch": 2952} {"train_loss": -6.633285999298096, "global_step": 124020, "epoch": 2952} {"train_loss": -6.445713520050049, "global_step": 124021, "epoch": 2952} {"train_loss": -6.426464080810547, "global_step": 124022, "epoch": 2952} {"train_loss": -6.609111785888672, "global_step": 124023, "epoch": 2952} {"train_loss": -6.456070899963379, "global_step": 124024, "epoch": 2952} {"train_loss": -6.618398155484881, "global_step": 124025, "epoch": 2952, "val_loss": 66050.40625} {"train_loss": -6.650594711303711, "global_step": 124026, "epoch": 2953} {"train_loss": -6.638131141662598, "global_step": 124027, "epoch": 2953} {"train_loss": -6.634952068328857, "global_step": 124028, "epoch": 2953} {"train_loss": -6.508037567138672, "global_step": 124029, "epoch": 2953} {"train_loss": -6.64004373550415, "global_step": 124030, "epoch": 2953} {"train_loss": -6.639918327331543, "global_step": 124031, "epoch": 2953} {"train_loss": -6.711848258972168, "global_step": 124032, "epoch": 2953} {"train_loss": -6.6655049324035645, "global_step": 124033, "epoch": 2953} {"train_loss": -6.678764343261719, "global_step": 124034, "epoch": 2953} {"train_loss": -6.664466381072998, "global_step": 124035, "epoch": 2953} {"train_loss": -6.594293594360352, "global_step": 124036, "epoch": 2953} {"train_loss": -6.6638875007629395, "global_step": 124037, "epoch": 2953} {"train_loss": -6.708259105682373, "global_step": 124038, "epoch": 2953} {"train_loss": -6.68927001953125, "global_step": 124039, "epoch": 2953} {"train_loss": -6.5396647453308105, "global_step": 124040, "epoch": 2953} {"train_loss": -6.609710216522217, "global_step": 124041, "epoch": 2953} {"train_loss": -6.630092620849609, "global_step": 124042, "epoch": 2953} {"train_loss": -6.65293025970459, "global_step": 124043, "epoch": 2953} {"train_loss": -6.626777648925781, "global_step": 124044, "epoch": 2953} {"train_loss": -6.414817810058594, "global_step": 124045, "epoch": 2953} {"train_loss": -6.6249847412109375, "global_step": 124046, "epoch": 2953} {"train_loss": -6.528132438659668, "global_step": 124047, "epoch": 2953} {"train_loss": -6.676738262176514, "global_step": 124048, "epoch": 2953} {"train_loss": -6.535125732421875, "global_step": 124049, "epoch": 2953} {"train_loss": -6.613760948181152, "global_step": 124050, "epoch": 2953} {"train_loss": -6.615391731262207, "global_step": 124051, "epoch": 2953} {"train_loss": -6.493381500244141, "global_step": 124052, "epoch": 2953} {"train_loss": -6.552966117858887, "global_step": 124053, "epoch": 2953} {"train_loss": -6.541018962860107, "global_step": 124054, "epoch": 2953} {"train_loss": -6.527831554412842, "global_step": 124055, "epoch": 2953} {"train_loss": -6.524468421936035, "global_step": 124056, "epoch": 2953} {"train_loss": -6.4959564208984375, "global_step": 124057, "epoch": 2953} {"train_loss": -6.36647891998291, "global_step": 124058, "epoch": 2953} {"train_loss": -6.608419895172119, "global_step": 124059, "epoch": 2953} {"train_loss": -6.573424339294434, "global_step": 124060, "epoch": 2953} {"train_loss": -6.467432975769043, "global_step": 124061, "epoch": 2953} {"train_loss": -6.553275108337402, "global_step": 124062, "epoch": 2953} {"train_loss": -6.416396141052246, "global_step": 124063, "epoch": 2953} {"train_loss": -6.610920429229736, "global_step": 124064, "epoch": 2953} {"train_loss": -6.526498794555664, "global_step": 124065, "epoch": 2953} {"train_loss": -6.5241265296936035, "global_step": 124066, "epoch": 2953} {"train_loss": -6.585881199155535, "global_step": 124067, "epoch": 2953, "val_loss": 65954.1171875} {"train_loss": -6.574013710021973, "global_step": 124068, "epoch": 2954} {"train_loss": -6.605589866638184, "global_step": 124069, "epoch": 2954} {"train_loss": -6.664648056030273, "global_step": 124070, "epoch": 2954} {"train_loss": -6.671953201293945, "global_step": 124071, "epoch": 2954} {"train_loss": -6.628530025482178, "global_step": 124072, "epoch": 2954} {"train_loss": -6.526817798614502, "global_step": 124073, "epoch": 2954} {"train_loss": -6.668240547180176, "global_step": 124074, "epoch": 2954} {"train_loss": -6.626288414001465, "global_step": 124075, "epoch": 2954} {"train_loss": -6.496070861816406, "global_step": 124076, "epoch": 2954} {"train_loss": -6.575831413269043, "global_step": 124077, "epoch": 2954} {"train_loss": -6.670058727264404, "global_step": 124078, "epoch": 2954} {"train_loss": -6.465463638305664, "global_step": 124079, "epoch": 2954} {"train_loss": -6.472580909729004, "global_step": 124080, "epoch": 2954} {"train_loss": -6.584439277648926, "global_step": 124081, "epoch": 2954} {"train_loss": -6.54004430770874, "global_step": 124082, "epoch": 2954} {"train_loss": -6.529779434204102, "global_step": 124083, "epoch": 2954} {"train_loss": -6.597519874572754, "global_step": 124084, "epoch": 2954} {"train_loss": -6.643283843994141, "global_step": 124085, "epoch": 2954} {"train_loss": -6.658841133117676, "global_step": 124086, "epoch": 2954} {"train_loss": -6.5684895515441895, "global_step": 124087, "epoch": 2954} {"train_loss": -6.522428512573242, "global_step": 124088, "epoch": 2954} {"train_loss": -6.652716636657715, "global_step": 124089, "epoch": 2954} {"train_loss": -6.654638767242432, "global_step": 124090, "epoch": 2954} {"train_loss": -6.605924606323242, "global_step": 124091, "epoch": 2954} {"train_loss": -6.634498596191406, "global_step": 124092, "epoch": 2954} {"train_loss": -6.622903823852539, "global_step": 124093, "epoch": 2954} {"train_loss": -6.635156154632568, "global_step": 124094, "epoch": 2954} {"train_loss": -6.664527416229248, "global_step": 124095, "epoch": 2954} {"train_loss": -6.439323902130127, "global_step": 124096, "epoch": 2954} {"train_loss": -6.599491119384766, "global_step": 124097, "epoch": 2954} {"train_loss": -6.519442558288574, "global_step": 124098, "epoch": 2954} {"train_loss": -6.491279602050781, "global_step": 124099, "epoch": 2954} {"train_loss": -6.575436115264893, "global_step": 124100, "epoch": 2954} {"train_loss": -6.563796043395996, "global_step": 124101, "epoch": 2954} {"train_loss": -6.47873067855835, "global_step": 124102, "epoch": 2954} {"train_loss": -6.556914806365967, "global_step": 124103, "epoch": 2954} {"train_loss": -6.623629093170166, "global_step": 124104, "epoch": 2954} {"train_loss": -6.662247657775879, "global_step": 124105, "epoch": 2954} {"train_loss": -6.411098480224609, "global_step": 124106, "epoch": 2954} {"train_loss": -6.583248138427734, "global_step": 124107, "epoch": 2954} {"train_loss": -6.657265663146973, "global_step": 124108, "epoch": 2954} {"train_loss": -6.581663131713867, "global_step": 124109, "epoch": 2954, "val_loss": 65876.375} {"train_loss": -6.599935531616211, "global_step": 124110, "epoch": 2955} {"train_loss": -6.442893028259277, "global_step": 124111, "epoch": 2955} {"train_loss": -6.589751243591309, "global_step": 124112, "epoch": 2955} {"train_loss": -6.471497535705566, "global_step": 124113, "epoch": 2955} {"train_loss": -6.532568454742432, "global_step": 124114, "epoch": 2955} {"train_loss": -6.531947612762451, "global_step": 124115, "epoch": 2955} {"train_loss": -6.6223649978637695, "global_step": 124116, "epoch": 2955} {"train_loss": -6.409953594207764, "global_step": 124117, "epoch": 2955} {"train_loss": -6.6229753494262695, "global_step": 124118, "epoch": 2955} {"train_loss": -6.482044219970703, "global_step": 124119, "epoch": 2955} {"train_loss": -6.598864555358887, "global_step": 124120, "epoch": 2955} {"train_loss": -6.50118350982666, "global_step": 124121, "epoch": 2955} {"train_loss": -6.498574256896973, "global_step": 124122, "epoch": 2955} {"train_loss": -6.554702281951904, "global_step": 124123, "epoch": 2955} {"train_loss": -6.505016803741455, "global_step": 124124, "epoch": 2955} {"train_loss": -6.523529529571533, "global_step": 124125, "epoch": 2955} {"train_loss": -6.410496711730957, "global_step": 124126, "epoch": 2955} {"train_loss": -6.574876308441162, "global_step": 124127, "epoch": 2955} {"train_loss": -6.57359504699707, "global_step": 124128, "epoch": 2955} {"train_loss": -6.585737228393555, "global_step": 124129, "epoch": 2955} {"train_loss": -6.515596866607666, "global_step": 124130, "epoch": 2955} {"train_loss": -6.527395248413086, "global_step": 124131, "epoch": 2955} {"train_loss": -6.541518211364746, "global_step": 124132, "epoch": 2955} {"train_loss": -6.652890205383301, "global_step": 124133, "epoch": 2955} {"train_loss": -6.642961502075195, "global_step": 124134, "epoch": 2955} {"train_loss": -6.581786632537842, "global_step": 124135, "epoch": 2955} {"train_loss": -6.540140151977539, "global_step": 124136, "epoch": 2955} {"train_loss": -6.592872619628906, "global_step": 124137, "epoch": 2955} {"train_loss": -6.649347305297852, "global_step": 124138, "epoch": 2955} {"train_loss": -6.60248327255249, "global_step": 124139, "epoch": 2955} {"train_loss": -6.620926380157471, "global_step": 124140, "epoch": 2955} {"train_loss": -6.566985130310059, "global_step": 124141, "epoch": 2955} {"train_loss": -6.623327255249023, "global_step": 124142, "epoch": 2955} {"train_loss": -6.4722394943237305, "global_step": 124143, "epoch": 2955} {"train_loss": -6.683446884155273, "global_step": 124144, "epoch": 2955} {"train_loss": -6.5891642570495605, "global_step": 124145, "epoch": 2955} {"train_loss": -6.692437171936035, "global_step": 124146, "epoch": 2955} {"train_loss": -6.561872482299805, "global_step": 124147, "epoch": 2955} {"train_loss": -6.600009918212891, "global_step": 124148, "epoch": 2955} {"train_loss": -6.585513114929199, "global_step": 124149, "epoch": 2955} {"train_loss": -6.639861583709717, "global_step": 124150, "epoch": 2955} {"train_loss": -6.565529789243426, "global_step": 124151, "epoch": 2955, "val_loss": 66281.0859375} {"train_loss": -6.583610534667969, "global_step": 124152, "epoch": 2956} {"train_loss": -6.5890655517578125, "global_step": 124153, "epoch": 2956} {"train_loss": -6.649971961975098, "global_step": 124154, "epoch": 2956} {"train_loss": -6.605804443359375, "global_step": 124155, "epoch": 2956} {"train_loss": -6.558326721191406, "global_step": 124156, "epoch": 2956} {"train_loss": -6.646602630615234, "global_step": 124157, "epoch": 2956} {"train_loss": -6.6769914627075195, "global_step": 124158, "epoch": 2956} {"train_loss": -6.665127754211426, "global_step": 124159, "epoch": 2956} {"train_loss": -6.612820148468018, "global_step": 124160, "epoch": 2956} {"train_loss": -6.618792533874512, "global_step": 124161, "epoch": 2956} {"train_loss": -6.71042537689209, "global_step": 124162, "epoch": 2956} {"train_loss": -6.6136369705200195, "global_step": 124163, "epoch": 2956} {"train_loss": -6.538209915161133, "global_step": 124164, "epoch": 2956} {"train_loss": -6.668494701385498, "global_step": 124165, "epoch": 2956} {"train_loss": -6.521540641784668, "global_step": 124166, "epoch": 2956} {"train_loss": -6.684475898742676, "global_step": 124167, "epoch": 2956} {"train_loss": -6.662412643432617, "global_step": 124168, "epoch": 2956} {"train_loss": -6.663714408874512, "global_step": 124169, "epoch": 2956} {"train_loss": -6.625406265258789, "global_step": 124170, "epoch": 2956} {"train_loss": -6.538724422454834, "global_step": 124171, "epoch": 2956} {"train_loss": -6.682318687438965, "global_step": 124172, "epoch": 2956} {"train_loss": -6.586006164550781, "global_step": 124173, "epoch": 2956} {"train_loss": -6.650881767272949, "global_step": 124174, "epoch": 2956} {"train_loss": -6.648411750793457, "global_step": 124175, "epoch": 2956} {"train_loss": -6.607217788696289, "global_step": 124176, "epoch": 2956} {"train_loss": -6.637913703918457, "global_step": 124177, "epoch": 2956} {"train_loss": -6.574061393737793, "global_step": 124178, "epoch": 2956} {"train_loss": -6.609803676605225, "global_step": 124179, "epoch": 2956} {"train_loss": -6.61506462097168, "global_step": 124180, "epoch": 2956} {"train_loss": -6.592617034912109, "global_step": 124181, "epoch": 2956} {"train_loss": -6.591976642608643, "global_step": 124182, "epoch": 2956} {"train_loss": -6.625768184661865, "global_step": 124183, "epoch": 2956} {"train_loss": -6.5886383056640625, "global_step": 124184, "epoch": 2956} {"train_loss": -6.572880268096924, "global_step": 124185, "epoch": 2956} {"train_loss": -6.604241847991943, "global_step": 124186, "epoch": 2956} {"train_loss": -6.5818586349487305, "global_step": 124187, "epoch": 2956} {"train_loss": -6.635822296142578, "global_step": 124188, "epoch": 2956} {"train_loss": -6.625096797943115, "global_step": 124189, "epoch": 2956} {"train_loss": -6.58090877532959, "global_step": 124190, "epoch": 2956} {"train_loss": -6.603930473327637, "global_step": 124191, "epoch": 2956} {"train_loss": -6.638640403747559, "global_step": 124192, "epoch": 2956} {"train_loss": -6.616437196731567, "global_step": 124193, "epoch": 2956, "val_loss": 66369.59375} {"train_loss": -6.558620452880859, "global_step": 124194, "epoch": 2957} {"train_loss": -6.655675411224365, "global_step": 124195, "epoch": 2957} {"train_loss": -6.633786678314209, "global_step": 124196, "epoch": 2957} {"train_loss": -6.53872013092041, "global_step": 124197, "epoch": 2957} {"train_loss": -6.650970458984375, "global_step": 124198, "epoch": 2957} {"train_loss": -6.455862522125244, "global_step": 124199, "epoch": 2957} {"train_loss": -6.546879768371582, "global_step": 124200, "epoch": 2957} {"train_loss": -6.715091228485107, "global_step": 124201, "epoch": 2957} {"train_loss": -6.620924949645996, "global_step": 124202, "epoch": 2957} {"train_loss": -6.601972579956055, "global_step": 124203, "epoch": 2957} {"train_loss": -6.570257186889648, "global_step": 124204, "epoch": 2957} {"train_loss": -6.464896202087402, "global_step": 124205, "epoch": 2957} {"train_loss": -6.633452892303467, "global_step": 124206, "epoch": 2957} {"train_loss": -6.494692802429199, "global_step": 124207, "epoch": 2957} {"train_loss": -6.563495635986328, "global_step": 124208, "epoch": 2957} {"train_loss": -6.570526123046875, "global_step": 124209, "epoch": 2957} {"train_loss": -6.595677375793457, "global_step": 124210, "epoch": 2957} {"train_loss": -6.645539283752441, "global_step": 124211, "epoch": 2957} {"train_loss": -6.626027584075928, "global_step": 124212, "epoch": 2957} {"train_loss": -6.5850396156311035, "global_step": 124213, "epoch": 2957} {"train_loss": -6.5755767822265625, "global_step": 124214, "epoch": 2957} {"train_loss": -6.554161071777344, "global_step": 124215, "epoch": 2957} {"train_loss": -6.648909568786621, "global_step": 124216, "epoch": 2957} {"train_loss": -6.449470520019531, "global_step": 124217, "epoch": 2957} {"train_loss": -6.654303550720215, "global_step": 124218, "epoch": 2957} {"train_loss": -6.571772575378418, "global_step": 124219, "epoch": 2957} {"train_loss": -6.4204912185668945, "global_step": 124220, "epoch": 2957} {"train_loss": -6.737957000732422, "global_step": 124221, "epoch": 2957} {"train_loss": -6.567836761474609, "global_step": 124222, "epoch": 2957} {"train_loss": -6.487808704376221, "global_step": 124223, "epoch": 2957} {"train_loss": -6.607781410217285, "global_step": 124224, "epoch": 2957} {"train_loss": -6.486189365386963, "global_step": 124225, "epoch": 2957} {"train_loss": -6.648735046386719, "global_step": 124226, "epoch": 2957} {"train_loss": -6.590225696563721, "global_step": 124227, "epoch": 2957} {"train_loss": -6.5635881423950195, "global_step": 124228, "epoch": 2957} {"train_loss": -6.65602445602417, "global_step": 124229, "epoch": 2957} {"train_loss": -6.573076248168945, "global_step": 124230, "epoch": 2957} {"train_loss": -6.661161422729492, "global_step": 124231, "epoch": 2957} {"train_loss": -6.5872955322265625, "global_step": 124232, "epoch": 2957} {"train_loss": -6.557161331176758, "global_step": 124233, "epoch": 2957} {"train_loss": -6.614660739898682, "global_step": 124234, "epoch": 2957} {"train_loss": -6.582523345947266, "global_step": 124235, "epoch": 2957, "val_loss": 66012.1171875} {"train_loss": -6.619475841522217, "global_step": 124236, "epoch": 2958} {"train_loss": -6.595534324645996, "global_step": 124237, "epoch": 2958} {"train_loss": -6.696893692016602, "global_step": 124238, "epoch": 2958} {"train_loss": -6.618895530700684, "global_step": 124239, "epoch": 2958} {"train_loss": -6.552938461303711, "global_step": 124240, "epoch": 2958} {"train_loss": -6.621548652648926, "global_step": 124241, "epoch": 2958} {"train_loss": -6.602540969848633, "global_step": 124242, "epoch": 2958} {"train_loss": -6.494017601013184, "global_step": 124243, "epoch": 2958} {"train_loss": -6.566612243652344, "global_step": 124244, "epoch": 2958} {"train_loss": -6.608828544616699, "global_step": 124245, "epoch": 2958} {"train_loss": -6.548225402832031, "global_step": 124246, "epoch": 2958} {"train_loss": -6.553025245666504, "global_step": 124247, "epoch": 2958} {"train_loss": -6.580533027648926, "global_step": 124248, "epoch": 2958} {"train_loss": -6.600283145904541, "global_step": 124249, "epoch": 2958} {"train_loss": -6.620125770568848, "global_step": 124250, "epoch": 2958} {"train_loss": -6.654185771942139, "global_step": 124251, "epoch": 2958} {"train_loss": -6.726015090942383, "global_step": 124252, "epoch": 2958} {"train_loss": -6.5701775550842285, "global_step": 124253, "epoch": 2958} {"train_loss": -6.569292068481445, "global_step": 124254, "epoch": 2958} {"train_loss": -6.498115539550781, "global_step": 124255, "epoch": 2958} {"train_loss": -6.6165361404418945, "global_step": 124256, "epoch": 2958} {"train_loss": -6.593967437744141, "global_step": 124257, "epoch": 2958} {"train_loss": -6.733412742614746, "global_step": 124258, "epoch": 2958} {"train_loss": -6.595346450805664, "global_step": 124259, "epoch": 2958} {"train_loss": -6.620716094970703, "global_step": 124260, "epoch": 2958} {"train_loss": -6.543133735656738, "global_step": 124261, "epoch": 2958} {"train_loss": -6.7727813720703125, "global_step": 124262, "epoch": 2958} {"train_loss": -6.721616744995117, "global_step": 124263, "epoch": 2958} {"train_loss": -6.639971733093262, "global_step": 124264, "epoch": 2958} {"train_loss": -6.651041507720947, "global_step": 124265, "epoch": 2958} {"train_loss": -6.547468185424805, "global_step": 124266, "epoch": 2958} {"train_loss": -6.673795700073242, "global_step": 124267, "epoch": 2958} {"train_loss": -6.529568672180176, "global_step": 124268, "epoch": 2958} {"train_loss": -6.510680198669434, "global_step": 124269, "epoch": 2958} {"train_loss": -6.526147842407227, "global_step": 124270, "epoch": 2958} {"train_loss": -6.645031929016113, "global_step": 124271, "epoch": 2958} {"train_loss": -6.567417144775391, "global_step": 124272, "epoch": 2958} {"train_loss": -6.353826522827148, "global_step": 124273, "epoch": 2958} {"train_loss": -6.741576194763184, "global_step": 124274, "epoch": 2958} {"train_loss": -6.591213226318359, "global_step": 124275, "epoch": 2958} {"train_loss": -6.679760932922363, "global_step": 124276, "epoch": 2958} {"train_loss": -6.6046649387904575, "global_step": 124277, "epoch": 2958, "val_loss": 66130.3359375} {"train_loss": -6.494330406188965, "global_step": 124278, "epoch": 2959} {"train_loss": -6.680660247802734, "global_step": 124279, "epoch": 2959} {"train_loss": -6.590996265411377, "global_step": 124280, "epoch": 2959} {"train_loss": -6.582673072814941, "global_step": 124281, "epoch": 2959} {"train_loss": -6.596508502960205, "global_step": 124282, "epoch": 2959} {"train_loss": -6.664729118347168, "global_step": 124283, "epoch": 2959} {"train_loss": -6.555542945861816, "global_step": 124284, "epoch": 2959} {"train_loss": -6.635876178741455, "global_step": 124285, "epoch": 2959} {"train_loss": -6.738966941833496, "global_step": 124286, "epoch": 2959} {"train_loss": -6.583446979522705, "global_step": 124287, "epoch": 2959} {"train_loss": -6.595537185668945, "global_step": 124288, "epoch": 2959} {"train_loss": -6.56024169921875, "global_step": 124289, "epoch": 2959} {"train_loss": -6.556797981262207, "global_step": 124290, "epoch": 2959} {"train_loss": -6.625312805175781, "global_step": 124291, "epoch": 2959} {"train_loss": -6.4506449699401855, "global_step": 124292, "epoch": 2959} {"train_loss": -6.718790531158447, "global_step": 124293, "epoch": 2959} {"train_loss": -6.6631879806518555, "global_step": 124294, "epoch": 2959} {"train_loss": -6.645648002624512, "global_step": 124295, "epoch": 2959} {"train_loss": -6.695350646972656, "global_step": 124296, "epoch": 2959} {"train_loss": -6.59233283996582, "global_step": 124297, "epoch": 2959} {"train_loss": -6.659449100494385, "global_step": 124298, "epoch": 2959} {"train_loss": -6.585244655609131, "global_step": 124299, "epoch": 2959} {"train_loss": -6.69539213180542, "global_step": 124300, "epoch": 2959} {"train_loss": -6.640765190124512, "global_step": 124301, "epoch": 2959} {"train_loss": -6.497414588928223, "global_step": 124302, "epoch": 2959} {"train_loss": -6.678980350494385, "global_step": 124303, "epoch": 2959} {"train_loss": -6.652000427246094, "global_step": 124304, "epoch": 2959} {"train_loss": -6.749936103820801, "global_step": 124305, "epoch": 2959} {"train_loss": -6.689078330993652, "global_step": 124306, "epoch": 2959} {"train_loss": -6.540494918823242, "global_step": 124307, "epoch": 2959} {"train_loss": -6.730504989624023, "global_step": 124308, "epoch": 2959} {"train_loss": -6.617613792419434, "global_step": 124309, "epoch": 2959} {"train_loss": -6.612058639526367, "global_step": 124310, "epoch": 2959} {"train_loss": -6.546352386474609, "global_step": 124311, "epoch": 2959} {"train_loss": -6.564705848693848, "global_step": 124312, "epoch": 2959} {"train_loss": -6.6374311447143555, "global_step": 124313, "epoch": 2959} {"train_loss": -6.668623924255371, "global_step": 124314, "epoch": 2959} {"train_loss": -6.650054931640625, "global_step": 124315, "epoch": 2959} {"train_loss": -6.6573028564453125, "global_step": 124316, "epoch": 2959} {"train_loss": -6.611324310302734, "global_step": 124317, "epoch": 2959} {"train_loss": -6.6909356117248535, "global_step": 124318, "epoch": 2959} {"train_loss": -6.626881406420753, "global_step": 124319, "epoch": 2959, "val_loss": 66017.1953125} {"train_loss": -6.591464519500732, "global_step": 124320, "epoch": 2960} {"train_loss": -6.685129165649414, "global_step": 124321, "epoch": 2960} {"train_loss": -6.585503101348877, "global_step": 124322, "epoch": 2960} {"train_loss": -6.579402446746826, "global_step": 124323, "epoch": 2960} {"train_loss": -6.547205924987793, "global_step": 124324, "epoch": 2960} {"train_loss": -6.608194351196289, "global_step": 124325, "epoch": 2960} {"train_loss": -6.66096305847168, "global_step": 124326, "epoch": 2960} {"train_loss": -6.6715087890625, "global_step": 124327, "epoch": 2960} {"train_loss": -6.474099159240723, "global_step": 124328, "epoch": 2960} {"train_loss": -6.588908672332764, "global_step": 124329, "epoch": 2960} {"train_loss": -6.671246528625488, "global_step": 124330, "epoch": 2960} {"train_loss": -6.582084655761719, "global_step": 124331, "epoch": 2960} {"train_loss": -6.556511878967285, "global_step": 124332, "epoch": 2960} {"train_loss": -6.746112823486328, "global_step": 124333, "epoch": 2960} {"train_loss": -6.686579704284668, "global_step": 124334, "epoch": 2960} {"train_loss": -6.5633063316345215, "global_step": 124335, "epoch": 2960} {"train_loss": -6.610664367675781, "global_step": 124336, "epoch": 2960} {"train_loss": -6.701298713684082, "global_step": 124337, "epoch": 2960} {"train_loss": -6.6257524490356445, "global_step": 124338, "epoch": 2960} {"train_loss": -6.6323561668396, "global_step": 124339, "epoch": 2960} {"train_loss": -6.64028263092041, "global_step": 124340, "epoch": 2960} {"train_loss": -6.678571701049805, "global_step": 124341, "epoch": 2960} {"train_loss": -6.618391036987305, "global_step": 124342, "epoch": 2960} {"train_loss": -6.583829879760742, "global_step": 124343, "epoch": 2960} {"train_loss": -6.708701133728027, "global_step": 124344, "epoch": 2960} {"train_loss": -6.54145622253418, "global_step": 124345, "epoch": 2960} {"train_loss": -6.545708656311035, "global_step": 124346, "epoch": 2960} {"train_loss": -6.600286483764648, "global_step": 124347, "epoch": 2960} {"train_loss": -6.612348556518555, "global_step": 124348, "epoch": 2960} {"train_loss": -6.4185333251953125, "global_step": 124349, "epoch": 2960} {"train_loss": -6.535451412200928, "global_step": 124350, "epoch": 2960} {"train_loss": -6.367423057556152, "global_step": 124351, "epoch": 2960} {"train_loss": -6.480137825012207, "global_step": 124352, "epoch": 2960} {"train_loss": -6.600167274475098, "global_step": 124353, "epoch": 2960} {"train_loss": -6.453710079193115, "global_step": 124354, "epoch": 2960} {"train_loss": -6.471430778503418, "global_step": 124355, "epoch": 2960} {"train_loss": -6.464017391204834, "global_step": 124356, "epoch": 2960} {"train_loss": -6.473937034606934, "global_step": 124357, "epoch": 2960} {"train_loss": -6.5874342918396, "global_step": 124358, "epoch": 2960} {"train_loss": -6.46749210357666, "global_step": 124359, "epoch": 2960} {"train_loss": -6.50848388671875, "global_step": 124360, "epoch": 2960} {"train_loss": -6.577777533304124, "global_step": 124361, "epoch": 2960, "val_loss": 66231.109375} {"train_loss": -6.618495941162109, "global_step": 124362, "epoch": 2961} {"train_loss": -6.6036224365234375, "global_step": 124363, "epoch": 2961} {"train_loss": -6.458805084228516, "global_step": 124364, "epoch": 2961} {"train_loss": -6.650895118713379, "global_step": 124365, "epoch": 2961} {"train_loss": -6.495622634887695, "global_step": 124366, "epoch": 2961} {"train_loss": -6.57718563079834, "global_step": 124367, "epoch": 2961} {"train_loss": -6.394284248352051, "global_step": 124368, "epoch": 2961} {"train_loss": -6.646637439727783, "global_step": 124369, "epoch": 2961} {"train_loss": -6.431644916534424, "global_step": 124370, "epoch": 2961} {"train_loss": -6.535042762756348, "global_step": 124371, "epoch": 2961} {"train_loss": -6.527678489685059, "global_step": 124372, "epoch": 2961} {"train_loss": -6.56935977935791, "global_step": 124373, "epoch": 2961} {"train_loss": -6.4185285568237305, "global_step": 124374, "epoch": 2961} {"train_loss": -6.606926918029785, "global_step": 124375, "epoch": 2961} {"train_loss": -6.6211113929748535, "global_step": 124376, "epoch": 2961} {"train_loss": -6.587925910949707, "global_step": 124377, "epoch": 2961} {"train_loss": -6.597579002380371, "global_step": 124378, "epoch": 2961} {"train_loss": -6.60500431060791, "global_step": 124379, "epoch": 2961} {"train_loss": -6.7156476974487305, "global_step": 124380, "epoch": 2961} {"train_loss": -6.569824695587158, "global_step": 124381, "epoch": 2961} {"train_loss": -6.597592353820801, "global_step": 124382, "epoch": 2961} {"train_loss": -6.657639503479004, "global_step": 124383, "epoch": 2961} {"train_loss": -6.653268814086914, "global_step": 124384, "epoch": 2961} {"train_loss": -6.663404941558838, "global_step": 124385, "epoch": 2961} {"train_loss": -6.618894100189209, "global_step": 124386, "epoch": 2961} {"train_loss": -6.693830966949463, "global_step": 124387, "epoch": 2961} {"train_loss": -6.5664520263671875, "global_step": 124388, "epoch": 2961} {"train_loss": -6.54312801361084, "global_step": 124389, "epoch": 2961} {"train_loss": -6.742887496948242, "global_step": 124390, "epoch": 2961} {"train_loss": -6.605285167694092, "global_step": 124391, "epoch": 2961} {"train_loss": -6.588659763336182, "global_step": 124392, "epoch": 2961} {"train_loss": -6.6939496994018555, "global_step": 124393, "epoch": 2961} {"train_loss": -6.616501331329346, "global_step": 124394, "epoch": 2961} {"train_loss": -6.750705718994141, "global_step": 124395, "epoch": 2961} {"train_loss": -6.711810111999512, "global_step": 124396, "epoch": 2961} {"train_loss": -6.610504627227783, "global_step": 124397, "epoch": 2961} {"train_loss": -6.608036994934082, "global_step": 124398, "epoch": 2961} {"train_loss": -6.719480037689209, "global_step": 124399, "epoch": 2961} {"train_loss": -6.564809322357178, "global_step": 124400, "epoch": 2961} {"train_loss": -6.595336437225342, "global_step": 124401, "epoch": 2961} {"train_loss": -6.584132194519043, "global_step": 124402, "epoch": 2961} {"train_loss": -6.598714737665086, "global_step": 124403, "epoch": 2961, "val_loss": 66030.9375} {"train_loss": -6.583695888519287, "global_step": 124404, "epoch": 2962} {"train_loss": -6.591477394104004, "global_step": 124405, "epoch": 2962} {"train_loss": -6.631369590759277, "global_step": 124406, "epoch": 2962} {"train_loss": -6.6331610679626465, "global_step": 124407, "epoch": 2962} {"train_loss": -6.5976433753967285, "global_step": 124408, "epoch": 2962} {"train_loss": -6.561775207519531, "global_step": 124409, "epoch": 2962} {"train_loss": -6.549955368041992, "global_step": 124410, "epoch": 2962} {"train_loss": -6.53920841217041, "global_step": 124411, "epoch": 2962} {"train_loss": -6.652132034301758, "global_step": 124412, "epoch": 2962} {"train_loss": -6.671097755432129, "global_step": 124413, "epoch": 2962} {"train_loss": -6.566056728363037, "global_step": 124414, "epoch": 2962} {"train_loss": -6.763830184936523, "global_step": 124415, "epoch": 2962} {"train_loss": -6.656590461730957, "global_step": 124416, "epoch": 2962} {"train_loss": -6.677535057067871, "global_step": 124417, "epoch": 2962} {"train_loss": -6.612469673156738, "global_step": 124418, "epoch": 2962} {"train_loss": -6.737749099731445, "global_step": 124419, "epoch": 2962} {"train_loss": -6.625349044799805, "global_step": 124420, "epoch": 2962} {"train_loss": -6.669124603271484, "global_step": 124421, "epoch": 2962} {"train_loss": -6.662741661071777, "global_step": 124422, "epoch": 2962} {"train_loss": -6.694467067718506, "global_step": 124423, "epoch": 2962} {"train_loss": -6.68421745300293, "global_step": 124424, "epoch": 2962} {"train_loss": -6.652259826660156, "global_step": 124425, "epoch": 2962} {"train_loss": -6.5144944190979, "global_step": 124426, "epoch": 2962} {"train_loss": -6.6517744064331055, "global_step": 124427, "epoch": 2962} {"train_loss": -6.545091152191162, "global_step": 124428, "epoch": 2962} {"train_loss": -6.5797576904296875, "global_step": 124429, "epoch": 2962} {"train_loss": -6.640583038330078, "global_step": 124430, "epoch": 2962} {"train_loss": -6.603650093078613, "global_step": 124431, "epoch": 2962} {"train_loss": -6.584826469421387, "global_step": 124432, "epoch": 2962} {"train_loss": -6.650152206420898, "global_step": 124433, "epoch": 2962} {"train_loss": -6.637836933135986, "global_step": 124434, "epoch": 2962} {"train_loss": -6.693227767944336, "global_step": 124435, "epoch": 2962} {"train_loss": -6.699701309204102, "global_step": 124436, "epoch": 2962} {"train_loss": -6.682244300842285, "global_step": 124437, "epoch": 2962} {"train_loss": -6.709253311157227, "global_step": 124438, "epoch": 2962} {"train_loss": -6.610001087188721, "global_step": 124439, "epoch": 2962} {"train_loss": -6.611215591430664, "global_step": 124440, "epoch": 2962} {"train_loss": -6.585659503936768, "global_step": 124441, "epoch": 2962} {"train_loss": -6.669893741607666, "global_step": 124442, "epoch": 2962} {"train_loss": -6.675413131713867, "global_step": 124443, "epoch": 2962} {"train_loss": -6.557468414306641, "global_step": 124444, "epoch": 2962} {"train_loss": -6.63189993585859, "global_step": 124445, "epoch": 2962, "val_loss": 66013.234375} {"train_loss": -6.640504837036133, "global_step": 124446, "epoch": 2963} {"train_loss": -6.711031436920166, "global_step": 124447, "epoch": 2963} {"train_loss": -6.588794708251953, "global_step": 124448, "epoch": 2963} {"train_loss": -6.681121826171875, "global_step": 124449, "epoch": 2963} {"train_loss": -6.634156227111816, "global_step": 124450, "epoch": 2963} {"train_loss": -6.61827278137207, "global_step": 124451, "epoch": 2963} {"train_loss": -6.603147983551025, "global_step": 124452, "epoch": 2963} {"train_loss": -6.654160499572754, "global_step": 124453, "epoch": 2963} {"train_loss": -6.623747825622559, "global_step": 124454, "epoch": 2963} {"train_loss": -6.523270130157471, "global_step": 124455, "epoch": 2963} {"train_loss": -6.6066575050354, "global_step": 124456, "epoch": 2963} {"train_loss": -6.576992988586426, "global_step": 124457, "epoch": 2963} {"train_loss": -6.540177345275879, "global_step": 124458, "epoch": 2963} {"train_loss": -6.636140823364258, "global_step": 124459, "epoch": 2963} {"train_loss": -6.667029857635498, "global_step": 124460, "epoch": 2963} {"train_loss": -6.521793365478516, "global_step": 124461, "epoch": 2963} {"train_loss": -6.6770782470703125, "global_step": 124462, "epoch": 2963} {"train_loss": -6.4975385665893555, "global_step": 124463, "epoch": 2963} {"train_loss": -6.576498985290527, "global_step": 124464, "epoch": 2963} {"train_loss": -6.617116451263428, "global_step": 124465, "epoch": 2963} {"train_loss": -6.553359508514404, "global_step": 124466, "epoch": 2963} {"train_loss": -6.612029075622559, "global_step": 124467, "epoch": 2963} {"train_loss": -6.438698768615723, "global_step": 124468, "epoch": 2963} {"train_loss": -6.608698844909668, "global_step": 124469, "epoch": 2963} {"train_loss": -6.638563632965088, "global_step": 124470, "epoch": 2963} {"train_loss": -6.5816650390625, "global_step": 124471, "epoch": 2963} {"train_loss": -6.603616714477539, "global_step": 124472, "epoch": 2963} {"train_loss": -6.587936878204346, "global_step": 124473, "epoch": 2963} {"train_loss": -6.61992073059082, "global_step": 124474, "epoch": 2963} {"train_loss": -6.586200714111328, "global_step": 124475, "epoch": 2963} {"train_loss": -6.488702774047852, "global_step": 124476, "epoch": 2963} {"train_loss": -6.600221157073975, "global_step": 124477, "epoch": 2963} {"train_loss": -6.5345306396484375, "global_step": 124478, "epoch": 2963} {"train_loss": -6.495604515075684, "global_step": 124479, "epoch": 2963} {"train_loss": -6.597201347351074, "global_step": 124480, "epoch": 2963} {"train_loss": -6.470569610595703, "global_step": 124481, "epoch": 2963} {"train_loss": -6.589216232299805, "global_step": 124482, "epoch": 2963} {"train_loss": -6.468774318695068, "global_step": 124483, "epoch": 2963} {"train_loss": -6.397477149963379, "global_step": 124484, "epoch": 2963} {"train_loss": -6.436372756958008, "global_step": 124485, "epoch": 2963} {"train_loss": -6.565662384033203, "global_step": 124486, "epoch": 2963} {"train_loss": -6.57485868817284, "global_step": 124487, "epoch": 2963, "val_loss": 66077.0625} {"train_loss": -6.63129997253418, "global_step": 124488, "epoch": 2964} {"train_loss": -6.368279457092285, "global_step": 124489, "epoch": 2964} {"train_loss": -6.48253870010376, "global_step": 124490, "epoch": 2964} {"train_loss": -6.485886573791504, "global_step": 124491, "epoch": 2964} {"train_loss": -6.597048759460449, "global_step": 124492, "epoch": 2964} {"train_loss": -6.462682247161865, "global_step": 124493, "epoch": 2964} {"train_loss": -6.627707481384277, "global_step": 124494, "epoch": 2964} {"train_loss": -6.527196884155273, "global_step": 124495, "epoch": 2964} {"train_loss": -6.629886627197266, "global_step": 124496, "epoch": 2964} {"train_loss": -6.512698173522949, "global_step": 124497, "epoch": 2964} {"train_loss": -6.478976249694824, "global_step": 124498, "epoch": 2964} {"train_loss": -6.671937942504883, "global_step": 124499, "epoch": 2964} {"train_loss": -6.533692359924316, "global_step": 124500, "epoch": 2964} {"train_loss": -6.496644020080566, "global_step": 124501, "epoch": 2964} {"train_loss": -6.54643440246582, "global_step": 124502, "epoch": 2964} {"train_loss": -6.567081928253174, "global_step": 124503, "epoch": 2964} {"train_loss": -6.749269485473633, "global_step": 124504, "epoch": 2964} {"train_loss": -6.609829902648926, "global_step": 124505, "epoch": 2964} {"train_loss": -6.57386589050293, "global_step": 124506, "epoch": 2964} {"train_loss": -6.631964206695557, "global_step": 124507, "epoch": 2964} {"train_loss": -6.567417144775391, "global_step": 124508, "epoch": 2964} {"train_loss": -6.615488529205322, "global_step": 124509, "epoch": 2964} {"train_loss": -6.532415390014648, "global_step": 124510, "epoch": 2964} {"train_loss": -6.659344673156738, "global_step": 124511, "epoch": 2964} {"train_loss": -6.517541408538818, "global_step": 124512, "epoch": 2964} {"train_loss": -6.578317642211914, "global_step": 124513, "epoch": 2964} {"train_loss": -6.61640739440918, "global_step": 124514, "epoch": 2964} {"train_loss": -6.6075286865234375, "global_step": 124515, "epoch": 2964} {"train_loss": -6.716801643371582, "global_step": 124516, "epoch": 2964} {"train_loss": -6.533840179443359, "global_step": 124517, "epoch": 2964} {"train_loss": -6.474073886871338, "global_step": 124518, "epoch": 2964} {"train_loss": -6.479100227355957, "global_step": 124519, "epoch": 2964} {"train_loss": -6.541736602783203, "global_step": 124520, "epoch": 2964} {"train_loss": -6.535773754119873, "global_step": 124521, "epoch": 2964} {"train_loss": -6.458999156951904, "global_step": 124522, "epoch": 2964} {"train_loss": -6.537412643432617, "global_step": 124523, "epoch": 2964} {"train_loss": -6.598212242126465, "global_step": 124524, "epoch": 2964} {"train_loss": -6.637460708618164, "global_step": 124525, "epoch": 2964} {"train_loss": -6.572120666503906, "global_step": 124526, "epoch": 2964} {"train_loss": -6.588225364685059, "global_step": 124527, "epoch": 2964} {"train_loss": -6.702182292938232, "global_step": 124528, "epoch": 2964} {"train_loss": -6.569367238453457, "global_step": 124529, "epoch": 2964, "val_loss": 66230.1015625} {"train_loss": -6.6530375480651855, "global_step": 124530, "epoch": 2965} {"train_loss": -6.615151405334473, "global_step": 124531, "epoch": 2965} {"train_loss": -6.710099220275879, "global_step": 124532, "epoch": 2965} {"train_loss": -6.599170684814453, "global_step": 124533, "epoch": 2965} {"train_loss": -6.698182582855225, "global_step": 124534, "epoch": 2965} {"train_loss": -6.731088638305664, "global_step": 124535, "epoch": 2965} {"train_loss": -6.642264366149902, "global_step": 124536, "epoch": 2965} {"train_loss": -6.533602237701416, "global_step": 124537, "epoch": 2965} {"train_loss": -6.58234977722168, "global_step": 124538, "epoch": 2965} {"train_loss": -6.532948970794678, "global_step": 124539, "epoch": 2965} {"train_loss": -6.664495468139648, "global_step": 124540, "epoch": 2965} {"train_loss": -6.694215774536133, "global_step": 124541, "epoch": 2965} {"train_loss": -6.66302490234375, "global_step": 124542, "epoch": 2965} {"train_loss": -6.498714447021484, "global_step": 124543, "epoch": 2965} {"train_loss": -6.580113887786865, "global_step": 124544, "epoch": 2965} {"train_loss": -6.681522369384766, "global_step": 124545, "epoch": 2965} {"train_loss": -6.550415992736816, "global_step": 124546, "epoch": 2965} {"train_loss": -6.6786789894104, "global_step": 124547, "epoch": 2965} {"train_loss": -6.631793022155762, "global_step": 124548, "epoch": 2965} {"train_loss": -6.724055767059326, "global_step": 124549, "epoch": 2965} {"train_loss": -6.639252662658691, "global_step": 124550, "epoch": 2965} {"train_loss": -6.6635308265686035, "global_step": 124551, "epoch": 2965} {"train_loss": -6.569369792938232, "global_step": 124552, "epoch": 2965} {"train_loss": -6.768594741821289, "global_step": 124553, "epoch": 2965} {"train_loss": -6.669816017150879, "global_step": 124554, "epoch": 2965} {"train_loss": -6.6851396560668945, "global_step": 124555, "epoch": 2965} {"train_loss": -6.563023567199707, "global_step": 124556, "epoch": 2965} {"train_loss": -6.693251609802246, "global_step": 124557, "epoch": 2965} {"train_loss": -6.743953704833984, "global_step": 124558, "epoch": 2965} {"train_loss": -6.62278938293457, "global_step": 124559, "epoch": 2965} {"train_loss": -6.639191627502441, "global_step": 124560, "epoch": 2965} {"train_loss": -6.641688346862793, "global_step": 124561, "epoch": 2965} {"train_loss": -6.585003852844238, "global_step": 124562, "epoch": 2965} {"train_loss": -6.72206974029541, "global_step": 124563, "epoch": 2965} {"train_loss": -6.702081203460693, "global_step": 124564, "epoch": 2965} {"train_loss": -6.7193284034729, "global_step": 124565, "epoch": 2965} {"train_loss": -6.712681770324707, "global_step": 124566, "epoch": 2965} {"train_loss": -6.694660186767578, "global_step": 124567, "epoch": 2965} {"train_loss": -6.697210311889648, "global_step": 124568, "epoch": 2965} {"train_loss": -6.540329933166504, "global_step": 124569, "epoch": 2965} {"train_loss": -6.705203533172607, "global_step": 124570, "epoch": 2965} {"train_loss": -6.651786372775123, "global_step": 124571, "epoch": 2965, "val_loss": 66269.2421875} {"train_loss": -6.772950172424316, "global_step": 124572, "epoch": 2966} {"train_loss": -6.6633405685424805, "global_step": 124573, "epoch": 2966} {"train_loss": -6.738428115844727, "global_step": 124574, "epoch": 2966} {"train_loss": -6.5916829109191895, "global_step": 124575, "epoch": 2966} {"train_loss": -6.686048984527588, "global_step": 124576, "epoch": 2966} {"train_loss": -6.606709003448486, "global_step": 124577, "epoch": 2966} {"train_loss": -6.577907562255859, "global_step": 124578, "epoch": 2966} {"train_loss": -6.67147159576416, "global_step": 124579, "epoch": 2966} {"train_loss": -6.6175642013549805, "global_step": 124580, "epoch": 2966} {"train_loss": -6.628896713256836, "global_step": 124581, "epoch": 2966} {"train_loss": -6.559329032897949, "global_step": 124582, "epoch": 2966} {"train_loss": -6.559475898742676, "global_step": 124583, "epoch": 2966} {"train_loss": -6.647018909454346, "global_step": 124584, "epoch": 2966} {"train_loss": -6.476955413818359, "global_step": 124585, "epoch": 2966} {"train_loss": -6.636551856994629, "global_step": 124586, "epoch": 2966} {"train_loss": -6.5957770347595215, "global_step": 124587, "epoch": 2966} {"train_loss": -6.6487226486206055, "global_step": 124588, "epoch": 2966} {"train_loss": -6.665815353393555, "global_step": 124589, "epoch": 2966} {"train_loss": -6.634997367858887, "global_step": 124590, "epoch": 2966} {"train_loss": -6.600399971008301, "global_step": 124591, "epoch": 2966} {"train_loss": -6.666431427001953, "global_step": 124592, "epoch": 2966} {"train_loss": -6.586177825927734, "global_step": 124593, "epoch": 2966} {"train_loss": -6.681297779083252, "global_step": 124594, "epoch": 2966} {"train_loss": -6.6555891036987305, "global_step": 124595, "epoch": 2966} {"train_loss": -6.629521369934082, "global_step": 124596, "epoch": 2966} {"train_loss": -6.655139923095703, "global_step": 124597, "epoch": 2966} {"train_loss": -6.5753679275512695, "global_step": 124598, "epoch": 2966} {"train_loss": -6.551945686340332, "global_step": 124599, "epoch": 2966} {"train_loss": -6.749527931213379, "global_step": 124600, "epoch": 2966} {"train_loss": -6.6762189865112305, "global_step": 124601, "epoch": 2966} {"train_loss": -6.606199264526367, "global_step": 124602, "epoch": 2966} {"train_loss": -6.610960006713867, "global_step": 124603, "epoch": 2966} {"train_loss": -6.650468826293945, "global_step": 124604, "epoch": 2966} {"train_loss": -6.65635871887207, "global_step": 124605, "epoch": 2966} {"train_loss": -6.659682273864746, "global_step": 124606, "epoch": 2966} {"train_loss": -6.642155647277832, "global_step": 124607, "epoch": 2966} {"train_loss": -6.5678935050964355, "global_step": 124608, "epoch": 2966} {"train_loss": -6.471103668212891, "global_step": 124609, "epoch": 2966} {"train_loss": -6.560890197753906, "global_step": 124610, "epoch": 2966} {"train_loss": -6.546048164367676, "global_step": 124611, "epoch": 2966} {"train_loss": -6.479635238647461, "global_step": 124612, "epoch": 2966} {"train_loss": -6.622031007494245, "global_step": 124613, "epoch": 2966, "val_loss": 66153.3515625} {"train_loss": -6.54286527633667, "global_step": 124614, "epoch": 2967} {"train_loss": -6.615991115570068, "global_step": 124615, "epoch": 2967} {"train_loss": -6.457684516906738, "global_step": 124616, "epoch": 2967} {"train_loss": -6.503013610839844, "global_step": 124617, "epoch": 2967} {"train_loss": -6.48518180847168, "global_step": 124618, "epoch": 2967} {"train_loss": -6.562230110168457, "global_step": 124619, "epoch": 2967} {"train_loss": -6.598548889160156, "global_step": 124620, "epoch": 2967} {"train_loss": -6.392337799072266, "global_step": 124621, "epoch": 2967} {"train_loss": -6.587738990783691, "global_step": 124622, "epoch": 2967} {"train_loss": -6.460219860076904, "global_step": 124623, "epoch": 2967} {"train_loss": -6.528967380523682, "global_step": 124624, "epoch": 2967} {"train_loss": -6.353461265563965, "global_step": 124625, "epoch": 2967} {"train_loss": -6.47655725479126, "global_step": 124626, "epoch": 2967} {"train_loss": -6.513010501861572, "global_step": 124627, "epoch": 2967} {"train_loss": -6.425046443939209, "global_step": 124628, "epoch": 2967} {"train_loss": -6.466063976287842, "global_step": 124629, "epoch": 2967} {"train_loss": -6.592180252075195, "global_step": 124630, "epoch": 2967} {"train_loss": -6.566788673400879, "global_step": 124631, "epoch": 2967} {"train_loss": -6.511821269989014, "global_step": 124632, "epoch": 2967} {"train_loss": -6.578299045562744, "global_step": 124633, "epoch": 2967} {"train_loss": -6.495916366577148, "global_step": 124634, "epoch": 2967} {"train_loss": -6.562067031860352, "global_step": 124635, "epoch": 2967} {"train_loss": -6.598517417907715, "global_step": 124636, "epoch": 2967} {"train_loss": -6.464930534362793, "global_step": 124637, "epoch": 2967} {"train_loss": -6.50897216796875, "global_step": 124638, "epoch": 2967} {"train_loss": -6.533773422241211, "global_step": 124639, "epoch": 2967} {"train_loss": -6.53585147857666, "global_step": 124640, "epoch": 2967} {"train_loss": -6.537227153778076, "global_step": 124641, "epoch": 2967} {"train_loss": -6.633872985839844, "global_step": 124642, "epoch": 2967} {"train_loss": -6.617171287536621, "global_step": 124643, "epoch": 2967} {"train_loss": -6.46989631652832, "global_step": 124644, "epoch": 2967} {"train_loss": -6.685169219970703, "global_step": 124645, "epoch": 2967} {"train_loss": -6.621681213378906, "global_step": 124646, "epoch": 2967} {"train_loss": -6.527096748352051, "global_step": 124647, "epoch": 2967} {"train_loss": -6.631549835205078, "global_step": 124648, "epoch": 2967} {"train_loss": -6.630897521972656, "global_step": 124649, "epoch": 2967} {"train_loss": -6.57792854309082, "global_step": 124650, "epoch": 2967} {"train_loss": -6.68583869934082, "global_step": 124651, "epoch": 2967} {"train_loss": -6.605259418487549, "global_step": 124652, "epoch": 2967} {"train_loss": -6.552502632141113, "global_step": 124653, "epoch": 2967} {"train_loss": -6.685189247131348, "global_step": 124654, "epoch": 2967} {"train_loss": -6.548267239616031, "global_step": 124655, "epoch": 2967, "val_loss": 65910.578125} {"train_loss": -6.6823039054870605, "global_step": 124656, "epoch": 2968} {"train_loss": -6.584250450134277, "global_step": 124657, "epoch": 2968} {"train_loss": -6.569265842437744, "global_step": 124658, "epoch": 2968} {"train_loss": -6.525754451751709, "global_step": 124659, "epoch": 2968} {"train_loss": -6.589252948760986, "global_step": 124660, "epoch": 2968} {"train_loss": -6.5861334800720215, "global_step": 124661, "epoch": 2968} {"train_loss": -6.622800350189209, "global_step": 124662, "epoch": 2968} {"train_loss": -6.632590293884277, "global_step": 124663, "epoch": 2968} {"train_loss": -6.54062032699585, "global_step": 124664, "epoch": 2968} {"train_loss": -6.588373184204102, "global_step": 124665, "epoch": 2968} {"train_loss": -6.612776756286621, "global_step": 124666, "epoch": 2968} {"train_loss": -6.539017677307129, "global_step": 124667, "epoch": 2968} {"train_loss": -6.636224269866943, "global_step": 124668, "epoch": 2968} {"train_loss": -6.601214408874512, "global_step": 124669, "epoch": 2968} {"train_loss": -6.675900936126709, "global_step": 124670, "epoch": 2968} {"train_loss": -6.514971733093262, "global_step": 124671, "epoch": 2968} {"train_loss": -6.584839820861816, "global_step": 124672, "epoch": 2968} {"train_loss": -6.556694030761719, "global_step": 124673, "epoch": 2968} {"train_loss": -6.602629661560059, "global_step": 124674, "epoch": 2968} {"train_loss": -6.614467620849609, "global_step": 124675, "epoch": 2968} {"train_loss": -6.587523937225342, "global_step": 124676, "epoch": 2968} {"train_loss": -6.592931270599365, "global_step": 124677, "epoch": 2968} {"train_loss": -6.554681777954102, "global_step": 124678, "epoch": 2968} {"train_loss": -6.595383644104004, "global_step": 124679, "epoch": 2968} {"train_loss": -6.661098480224609, "global_step": 124680, "epoch": 2968} {"train_loss": -6.6022138595581055, "global_step": 124681, "epoch": 2968} {"train_loss": -6.519697189331055, "global_step": 124682, "epoch": 2968} {"train_loss": -6.62255859375, "global_step": 124683, "epoch": 2968} {"train_loss": -6.5678510665893555, "global_step": 124684, "epoch": 2968} {"train_loss": -6.566646099090576, "global_step": 124685, "epoch": 2968} {"train_loss": -6.51765775680542, "global_step": 124686, "epoch": 2968} {"train_loss": -6.574556827545166, "global_step": 124687, "epoch": 2968} {"train_loss": -6.610644340515137, "global_step": 124688, "epoch": 2968} {"train_loss": -6.497584342956543, "global_step": 124689, "epoch": 2968} {"train_loss": -6.578986167907715, "global_step": 124690, "epoch": 2968} {"train_loss": -6.590900897979736, "global_step": 124691, "epoch": 2968} {"train_loss": -6.45121955871582, "global_step": 124692, "epoch": 2968} {"train_loss": -6.585360527038574, "global_step": 124693, "epoch": 2968} {"train_loss": -6.524565696716309, "global_step": 124694, "epoch": 2968} {"train_loss": -6.646860599517822, "global_step": 124695, "epoch": 2968} {"train_loss": -6.59678840637207, "global_step": 124696, "epoch": 2968} {"train_loss": -6.581876800173805, "global_step": 124697, "epoch": 2968, "val_loss": 66089.5078125} {"train_loss": -6.551143646240234, "global_step": 124698, "epoch": 2969} {"train_loss": -6.57219123840332, "global_step": 124699, "epoch": 2969} {"train_loss": -6.507932662963867, "global_step": 124700, "epoch": 2969} {"train_loss": -6.539140701293945, "global_step": 124701, "epoch": 2969} {"train_loss": -6.567197799682617, "global_step": 124702, "epoch": 2969} {"train_loss": -6.684820652008057, "global_step": 124703, "epoch": 2969} {"train_loss": -6.522271156311035, "global_step": 124704, "epoch": 2969} {"train_loss": -6.6749958992004395, "global_step": 124705, "epoch": 2969} {"train_loss": -6.635591506958008, "global_step": 124706, "epoch": 2969} {"train_loss": -6.594542503356934, "global_step": 124707, "epoch": 2969} {"train_loss": -6.670565605163574, "global_step": 124708, "epoch": 2969} {"train_loss": -6.503208637237549, "global_step": 124709, "epoch": 2969} {"train_loss": -6.606006145477295, "global_step": 124710, "epoch": 2969} {"train_loss": -6.70845365524292, "global_step": 124711, "epoch": 2969} {"train_loss": -6.369603157043457, "global_step": 124712, "epoch": 2969} {"train_loss": -6.560246467590332, "global_step": 124713, "epoch": 2969} {"train_loss": -6.585862159729004, "global_step": 124714, "epoch": 2969} {"train_loss": -6.405417442321777, "global_step": 124715, "epoch": 2969} {"train_loss": -6.569280624389648, "global_step": 124716, "epoch": 2969} {"train_loss": -6.475161075592041, "global_step": 124717, "epoch": 2969} {"train_loss": -6.580293655395508, "global_step": 124718, "epoch": 2969} {"train_loss": -6.504759788513184, "global_step": 124719, "epoch": 2969} {"train_loss": -6.581581115722656, "global_step": 124720, "epoch": 2969} {"train_loss": -6.619730472564697, "global_step": 124721, "epoch": 2969} {"train_loss": -6.477825164794922, "global_step": 124722, "epoch": 2969} {"train_loss": -6.562840938568115, "global_step": 124723, "epoch": 2969} {"train_loss": -6.458285331726074, "global_step": 124724, "epoch": 2969} {"train_loss": -6.678508281707764, "global_step": 124725, "epoch": 2969} {"train_loss": -6.512675762176514, "global_step": 124726, "epoch": 2969} {"train_loss": -6.627139091491699, "global_step": 124727, "epoch": 2969} {"train_loss": -6.583748817443848, "global_step": 124728, "epoch": 2969} {"train_loss": -6.541208267211914, "global_step": 124729, "epoch": 2969} {"train_loss": -6.66733455657959, "global_step": 124730, "epoch": 2969} {"train_loss": -6.597719192504883, "global_step": 124731, "epoch": 2969} {"train_loss": -6.656018257141113, "global_step": 124732, "epoch": 2969} {"train_loss": -6.613241195678711, "global_step": 124733, "epoch": 2969} {"train_loss": -6.7046356201171875, "global_step": 124734, "epoch": 2969} {"train_loss": -6.686204433441162, "global_step": 124735, "epoch": 2969} {"train_loss": -6.56907844543457, "global_step": 124736, "epoch": 2969} {"train_loss": -6.652841567993164, "global_step": 124737, "epoch": 2969} {"train_loss": -6.618318557739258, "global_step": 124738, "epoch": 2969} {"train_loss": -6.582559381212507, "global_step": 124739, "epoch": 2969, "val_loss": 66024.0625} {"train_loss": -6.607802391052246, "global_step": 124740, "epoch": 2970} {"train_loss": -6.683411598205566, "global_step": 124741, "epoch": 2970} {"train_loss": -6.578086853027344, "global_step": 124742, "epoch": 2970} {"train_loss": -6.586503028869629, "global_step": 124743, "epoch": 2970} {"train_loss": -6.675313949584961, "global_step": 124744, "epoch": 2970} {"train_loss": -6.628989219665527, "global_step": 124745, "epoch": 2970} {"train_loss": -6.505783557891846, "global_step": 124746, "epoch": 2970} {"train_loss": -6.648934364318848, "global_step": 124747, "epoch": 2970} {"train_loss": -6.733057498931885, "global_step": 124748, "epoch": 2970} {"train_loss": -6.687976360321045, "global_step": 124749, "epoch": 2970} {"train_loss": -6.685769557952881, "global_step": 124750, "epoch": 2970} {"train_loss": -6.5408854484558105, "global_step": 124751, "epoch": 2970} {"train_loss": -6.510492324829102, "global_step": 124752, "epoch": 2970} {"train_loss": -6.659817695617676, "global_step": 124753, "epoch": 2970} {"train_loss": -6.636371612548828, "global_step": 124754, "epoch": 2970} {"train_loss": -6.6520233154296875, "global_step": 124755, "epoch": 2970} {"train_loss": -6.606305122375488, "global_step": 124756, "epoch": 2970} {"train_loss": -6.584568023681641, "global_step": 124757, "epoch": 2970} {"train_loss": -6.695992469787598, "global_step": 124758, "epoch": 2970} {"train_loss": -6.550599098205566, "global_step": 124759, "epoch": 2970} {"train_loss": -6.63581657409668, "global_step": 124760, "epoch": 2970} {"train_loss": -6.4367780685424805, "global_step": 124761, "epoch": 2970} {"train_loss": -6.675546646118164, "global_step": 124762, "epoch": 2970} {"train_loss": -6.551113128662109, "global_step": 124763, "epoch": 2970} {"train_loss": -6.632201671600342, "global_step": 124764, "epoch": 2970} {"train_loss": -6.5874528884887695, "global_step": 124765, "epoch": 2970} {"train_loss": -6.621278762817383, "global_step": 124766, "epoch": 2970} {"train_loss": -6.5887041091918945, "global_step": 124767, "epoch": 2970} {"train_loss": -6.571788787841797, "global_step": 124768, "epoch": 2970} {"train_loss": -6.543465614318848, "global_step": 124769, "epoch": 2970} {"train_loss": -6.434020042419434, "global_step": 124770, "epoch": 2970} {"train_loss": -6.644186019897461, "global_step": 124771, "epoch": 2970} {"train_loss": -6.622008323669434, "global_step": 124772, "epoch": 2970} {"train_loss": -6.6104044914245605, "global_step": 124773, "epoch": 2970} {"train_loss": -6.622941970825195, "global_step": 124774, "epoch": 2970} {"train_loss": -6.616223335266113, "global_step": 124775, "epoch": 2970} {"train_loss": -6.476863384246826, "global_step": 124776, "epoch": 2970} {"train_loss": -6.591831684112549, "global_step": 124777, "epoch": 2970} {"train_loss": -6.41325569152832, "global_step": 124778, "epoch": 2970} {"train_loss": -6.54168701171875, "global_step": 124779, "epoch": 2970} {"train_loss": -6.45084285736084, "global_step": 124780, "epoch": 2970} {"train_loss": -6.588887157894316, "global_step": 124781, "epoch": 2970, "val_loss": 66277.9609375} {"train_loss": -6.545588493347168, "global_step": 124782, "epoch": 2971} {"train_loss": -6.536393642425537, "global_step": 124783, "epoch": 2971} {"train_loss": -6.535424709320068, "global_step": 124784, "epoch": 2971} {"train_loss": -6.549287796020508, "global_step": 124785, "epoch": 2971} {"train_loss": -6.501877784729004, "global_step": 124786, "epoch": 2971} {"train_loss": -6.472881317138672, "global_step": 124787, "epoch": 2971} {"train_loss": -6.583096504211426, "global_step": 124788, "epoch": 2971} {"train_loss": -6.455554485321045, "global_step": 124789, "epoch": 2971} {"train_loss": -6.611698627471924, "global_step": 124790, "epoch": 2971} {"train_loss": -6.541666030883789, "global_step": 124791, "epoch": 2971} {"train_loss": -6.561903953552246, "global_step": 124792, "epoch": 2971} {"train_loss": -6.543465614318848, "global_step": 124793, "epoch": 2971} {"train_loss": -6.594155311584473, "global_step": 124794, "epoch": 2971} {"train_loss": -6.568636894226074, "global_step": 124795, "epoch": 2971} {"train_loss": -6.58220911026001, "global_step": 124796, "epoch": 2971} {"train_loss": -6.686423301696777, "global_step": 124797, "epoch": 2971} {"train_loss": -6.595017433166504, "global_step": 124798, "epoch": 2971} {"train_loss": -6.632306098937988, "global_step": 124799, "epoch": 2971} {"train_loss": -6.528580665588379, "global_step": 124800, "epoch": 2971} {"train_loss": -6.564691066741943, "global_step": 124801, "epoch": 2971} {"train_loss": -6.592008590698242, "global_step": 124802, "epoch": 2971} {"train_loss": -6.59642219543457, "global_step": 124803, "epoch": 2971} {"train_loss": -6.605775356292725, "global_step": 124804, "epoch": 2971} {"train_loss": -6.572147369384766, "global_step": 124805, "epoch": 2971} {"train_loss": -6.567910671234131, "global_step": 124806, "epoch": 2971} {"train_loss": -6.688867568969727, "global_step": 124807, "epoch": 2971} {"train_loss": -6.595061302185059, "global_step": 124808, "epoch": 2971} {"train_loss": -6.565582275390625, "global_step": 124809, "epoch": 2971} {"train_loss": -6.564899444580078, "global_step": 124810, "epoch": 2971} {"train_loss": -6.604098320007324, "global_step": 124811, "epoch": 2971} {"train_loss": -6.443781852722168, "global_step": 124812, "epoch": 2971} {"train_loss": -6.551815032958984, "global_step": 124813, "epoch": 2971} {"train_loss": -6.717364311218262, "global_step": 124814, "epoch": 2971} {"train_loss": -6.50779914855957, "global_step": 124815, "epoch": 2971} {"train_loss": -6.60856819152832, "global_step": 124816, "epoch": 2971} {"train_loss": -6.632798194885254, "global_step": 124817, "epoch": 2971} {"train_loss": -6.613539695739746, "global_step": 124818, "epoch": 2971} {"train_loss": -6.748848915100098, "global_step": 124819, "epoch": 2971} {"train_loss": -6.5767364501953125, "global_step": 124820, "epoch": 2971} {"train_loss": -6.585704803466797, "global_step": 124821, "epoch": 2971} {"train_loss": -6.673810005187988, "global_step": 124822, "epoch": 2971} {"train_loss": -6.58227581069583, "global_step": 124823, "epoch": 2971, "val_loss": 66086.8046875} {"train_loss": -6.624421119689941, "global_step": 124824, "epoch": 2972} {"train_loss": -6.690919876098633, "global_step": 124825, "epoch": 2972} {"train_loss": -6.643314361572266, "global_step": 124826, "epoch": 2972} {"train_loss": -6.640102863311768, "global_step": 124827, "epoch": 2972} {"train_loss": -6.703845977783203, "global_step": 124828, "epoch": 2972} {"train_loss": -6.6427178382873535, "global_step": 124829, "epoch": 2972} {"train_loss": -6.604247093200684, "global_step": 124830, "epoch": 2972} {"train_loss": -6.685044288635254, "global_step": 124831, "epoch": 2972} {"train_loss": -6.54703426361084, "global_step": 124832, "epoch": 2972} {"train_loss": -6.637093544006348, "global_step": 124833, "epoch": 2972} {"train_loss": -6.636826515197754, "global_step": 124834, "epoch": 2972} {"train_loss": -6.67370080947876, "global_step": 124835, "epoch": 2972} {"train_loss": -6.702528953552246, "global_step": 124836, "epoch": 2972} {"train_loss": -6.602937698364258, "global_step": 124837, "epoch": 2972} {"train_loss": -6.666502952575684, "global_step": 124838, "epoch": 2972} {"train_loss": -6.71352481842041, "global_step": 124839, "epoch": 2972} {"train_loss": -6.687334060668945, "global_step": 124840, "epoch": 2972} {"train_loss": -6.616905212402344, "global_step": 124841, "epoch": 2972} {"train_loss": -6.64951229095459, "global_step": 124842, "epoch": 2972} {"train_loss": -6.620728969573975, "global_step": 124843, "epoch": 2972} {"train_loss": -6.649289131164551, "global_step": 124844, "epoch": 2972} {"train_loss": -6.489492416381836, "global_step": 124845, "epoch": 2972} {"train_loss": -6.598912239074707, "global_step": 124846, "epoch": 2972} {"train_loss": -6.621798515319824, "global_step": 124847, "epoch": 2972} {"train_loss": -6.624279975891113, "global_step": 124848, "epoch": 2972} {"train_loss": -6.709657669067383, "global_step": 124849, "epoch": 2972} {"train_loss": -6.682244777679443, "global_step": 124850, "epoch": 2972} {"train_loss": -6.626382827758789, "global_step": 124851, "epoch": 2972} {"train_loss": -6.622929096221924, "global_step": 124852, "epoch": 2972} {"train_loss": -6.642385482788086, "global_step": 124853, "epoch": 2972} {"train_loss": -6.639959335327148, "global_step": 124854, "epoch": 2972} {"train_loss": -6.5884690284729, "global_step": 124855, "epoch": 2972} {"train_loss": -6.593114376068115, "global_step": 124856, "epoch": 2972} {"train_loss": -6.772221565246582, "global_step": 124857, "epoch": 2972} {"train_loss": -6.621240615844727, "global_step": 124858, "epoch": 2972} {"train_loss": -6.677971839904785, "global_step": 124859, "epoch": 2972} {"train_loss": -6.720688819885254, "global_step": 124860, "epoch": 2972} {"train_loss": -6.638983249664307, "global_step": 124861, "epoch": 2972} {"train_loss": -6.833965301513672, "global_step": 124862, "epoch": 2972} {"train_loss": -6.670144081115723, "global_step": 124863, "epoch": 2972} {"train_loss": -6.699618339538574, "global_step": 124864, "epoch": 2972} {"train_loss": -6.6511203561510355, "global_step": 124865, "epoch": 2972, "val_loss": 65966.890625} {"train_loss": -6.716031551361084, "global_step": 124866, "epoch": 2973} {"train_loss": -6.557069778442383, "global_step": 124867, "epoch": 2973} {"train_loss": -6.617090702056885, "global_step": 124868, "epoch": 2973} {"train_loss": -6.706799030303955, "global_step": 124869, "epoch": 2973} {"train_loss": -6.611903190612793, "global_step": 124870, "epoch": 2973} {"train_loss": -6.724039077758789, "global_step": 124871, "epoch": 2973} {"train_loss": -6.637514114379883, "global_step": 124872, "epoch": 2973} {"train_loss": -6.6377387046813965, "global_step": 124873, "epoch": 2973} {"train_loss": -6.678824424743652, "global_step": 124874, "epoch": 2973} {"train_loss": -6.654653549194336, "global_step": 124875, "epoch": 2973} {"train_loss": -6.601062774658203, "global_step": 124876, "epoch": 2973} {"train_loss": -6.693001747131348, "global_step": 124877, "epoch": 2973} {"train_loss": -6.6924028396606445, "global_step": 124878, "epoch": 2973} {"train_loss": -6.580646991729736, "global_step": 124879, "epoch": 2973} {"train_loss": -6.641895771026611, "global_step": 124880, "epoch": 2973} {"train_loss": -6.711382865905762, "global_step": 124881, "epoch": 2973} {"train_loss": -6.635309219360352, "global_step": 124882, "epoch": 2973} {"train_loss": -6.655393600463867, "global_step": 124883, "epoch": 2973} {"train_loss": -6.629619598388672, "global_step": 124884, "epoch": 2973} {"train_loss": -6.587285995483398, "global_step": 124885, "epoch": 2973} {"train_loss": -6.623319625854492, "global_step": 124886, "epoch": 2973} {"train_loss": -6.509764671325684, "global_step": 124887, "epoch": 2973} {"train_loss": -6.502403736114502, "global_step": 124888, "epoch": 2973} {"train_loss": -6.5927886962890625, "global_step": 124889, "epoch": 2973} {"train_loss": -6.584568977355957, "global_step": 124890, "epoch": 2973} {"train_loss": -6.5980119705200195, "global_step": 124891, "epoch": 2973} {"train_loss": -6.578999996185303, "global_step": 124892, "epoch": 2973} {"train_loss": -6.471346855163574, "global_step": 124893, "epoch": 2973} {"train_loss": -6.603424072265625, "global_step": 124894, "epoch": 2973} {"train_loss": -6.529201507568359, "global_step": 124895, "epoch": 2973} {"train_loss": -6.539262771606445, "global_step": 124896, "epoch": 2973} {"train_loss": -6.5195465087890625, "global_step": 124897, "epoch": 2973} {"train_loss": -6.604391098022461, "global_step": 124898, "epoch": 2973} {"train_loss": -6.585512161254883, "global_step": 124899, "epoch": 2973} {"train_loss": -6.511643409729004, "global_step": 124900, "epoch": 2973} {"train_loss": -6.539233684539795, "global_step": 124901, "epoch": 2973} {"train_loss": -6.514706134796143, "global_step": 124902, "epoch": 2973} {"train_loss": -6.743306636810303, "global_step": 124903, "epoch": 2973} {"train_loss": -6.516658782958984, "global_step": 124904, "epoch": 2973} {"train_loss": -6.564719200134277, "global_step": 124905, "epoch": 2973} {"train_loss": -6.68629264831543, "global_step": 124906, "epoch": 2973} {"train_loss": -6.604498704274495, "global_step": 124907, "epoch": 2973, "val_loss": 66162.3046875} {"train_loss": -6.645540237426758, "global_step": 124908, "epoch": 2974} {"train_loss": -6.63389778137207, "global_step": 124909, "epoch": 2974} {"train_loss": -6.677864074707031, "global_step": 124910, "epoch": 2974} {"train_loss": -6.647778034210205, "global_step": 124911, "epoch": 2974} {"train_loss": -6.622878551483154, "global_step": 124912, "epoch": 2974} {"train_loss": -6.679634094238281, "global_step": 124913, "epoch": 2974} {"train_loss": -6.576695919036865, "global_step": 124914, "epoch": 2974} {"train_loss": -6.607118606567383, "global_step": 124915, "epoch": 2974} {"train_loss": -6.584345817565918, "global_step": 124916, "epoch": 2974} {"train_loss": -6.661226272583008, "global_step": 124917, "epoch": 2974} {"train_loss": -6.67631721496582, "global_step": 124918, "epoch": 2974} {"train_loss": -6.646347999572754, "global_step": 124919, "epoch": 2974} {"train_loss": -6.6102986335754395, "global_step": 124920, "epoch": 2974} {"train_loss": -6.784017086029053, "global_step": 124921, "epoch": 2974} {"train_loss": -6.650295257568359, "global_step": 124922, "epoch": 2974} {"train_loss": -6.710457801818848, "global_step": 124923, "epoch": 2974} {"train_loss": -6.590944766998291, "global_step": 124924, "epoch": 2974} {"train_loss": -6.715150356292725, "global_step": 124925, "epoch": 2974} {"train_loss": -6.600889205932617, "global_step": 124926, "epoch": 2974} {"train_loss": -6.654419898986816, "global_step": 124927, "epoch": 2974} {"train_loss": -6.578300476074219, "global_step": 124928, "epoch": 2974} {"train_loss": -6.676117420196533, "global_step": 124929, "epoch": 2974} {"train_loss": -6.756111145019531, "global_step": 124930, "epoch": 2974} {"train_loss": -6.569685935974121, "global_step": 124931, "epoch": 2974} {"train_loss": -6.491757392883301, "global_step": 124932, "epoch": 2974} {"train_loss": -6.600689888000488, "global_step": 124933, "epoch": 2974} {"train_loss": -6.593841075897217, "global_step": 124934, "epoch": 2974} {"train_loss": -6.754907608032227, "global_step": 124935, "epoch": 2974} {"train_loss": -6.709374904632568, "global_step": 124936, "epoch": 2974} {"train_loss": -6.548865795135498, "global_step": 124937, "epoch": 2974} {"train_loss": -6.572016716003418, "global_step": 124938, "epoch": 2974} {"train_loss": -6.638172149658203, "global_step": 124939, "epoch": 2974} {"train_loss": -6.616456031799316, "global_step": 124940, "epoch": 2974} {"train_loss": -6.699864864349365, "global_step": 124941, "epoch": 2974} {"train_loss": -6.575473785400391, "global_step": 124942, "epoch": 2974} {"train_loss": -6.602715492248535, "global_step": 124943, "epoch": 2974} {"train_loss": -6.720111846923828, "global_step": 124944, "epoch": 2974} {"train_loss": -6.5210418701171875, "global_step": 124945, "epoch": 2974} {"train_loss": -6.640443801879883, "global_step": 124946, "epoch": 2974} {"train_loss": -6.694467544555664, "global_step": 124947, "epoch": 2974} {"train_loss": -6.483699321746826, "global_step": 124948, "epoch": 2974} {"train_loss": -6.633759759721302, "global_step": 124949, "epoch": 2974, "val_loss": 66270.1328125} {"train_loss": -6.386387825012207, "global_step": 124950, "epoch": 2975} {"train_loss": -6.437915802001953, "global_step": 124951, "epoch": 2975} {"train_loss": -6.643970966339111, "global_step": 124952, "epoch": 2975} {"train_loss": -6.327764511108398, "global_step": 124953, "epoch": 2975} {"train_loss": -6.566871643066406, "global_step": 124954, "epoch": 2975} {"train_loss": -6.505504608154297, "global_step": 124955, "epoch": 2975} {"train_loss": -6.676790237426758, "global_step": 124956, "epoch": 2975} {"train_loss": -6.546347618103027, "global_step": 124957, "epoch": 2975} {"train_loss": -6.614006996154785, "global_step": 124958, "epoch": 2975} {"train_loss": -6.691468715667725, "global_step": 124959, "epoch": 2975} {"train_loss": -6.600335121154785, "global_step": 124960, "epoch": 2975} {"train_loss": -6.642580032348633, "global_step": 124961, "epoch": 2975} {"train_loss": -6.603148460388184, "global_step": 124962, "epoch": 2975} {"train_loss": -6.605717658996582, "global_step": 124963, "epoch": 2975} {"train_loss": -6.576749324798584, "global_step": 124964, "epoch": 2975} {"train_loss": -6.625619888305664, "global_step": 124965, "epoch": 2975} {"train_loss": -6.490289211273193, "global_step": 124966, "epoch": 2975} {"train_loss": -6.679548263549805, "global_step": 124967, "epoch": 2975} {"train_loss": -6.563225746154785, "global_step": 124968, "epoch": 2975} {"train_loss": -6.544692039489746, "global_step": 124969, "epoch": 2975} {"train_loss": -6.606528282165527, "global_step": 124970, "epoch": 2975} {"train_loss": -6.580687522888184, "global_step": 124971, "epoch": 2975} {"train_loss": -6.558935165405273, "global_step": 124972, "epoch": 2975} {"train_loss": -6.676105976104736, "global_step": 124973, "epoch": 2975} {"train_loss": -6.551831245422363, "global_step": 124974, "epoch": 2975} {"train_loss": -6.647016525268555, "global_step": 124975, "epoch": 2975} {"train_loss": -6.640653610229492, "global_step": 124976, "epoch": 2975} {"train_loss": -6.621380805969238, "global_step": 124977, "epoch": 2975} {"train_loss": -6.565608024597168, "global_step": 124978, "epoch": 2975} {"train_loss": -6.5768914222717285, "global_step": 124979, "epoch": 2975} {"train_loss": -6.712174415588379, "global_step": 124980, "epoch": 2975} {"train_loss": -6.608040809631348, "global_step": 124981, "epoch": 2975} {"train_loss": -6.573435306549072, "global_step": 124982, "epoch": 2975} {"train_loss": -6.6153154373168945, "global_step": 124983, "epoch": 2975} {"train_loss": -6.610362529754639, "global_step": 124984, "epoch": 2975} {"train_loss": -6.6675825119018555, "global_step": 124985, "epoch": 2975} {"train_loss": -6.536764144897461, "global_step": 124986, "epoch": 2975} {"train_loss": -6.623030662536621, "global_step": 124987, "epoch": 2975} {"train_loss": -6.69702672958374, "global_step": 124988, "epoch": 2975} {"train_loss": -6.605437755584717, "global_step": 124989, "epoch": 2975} {"train_loss": -6.674069881439209, "global_step": 124990, "epoch": 2975} {"train_loss": -6.592814104897635, "global_step": 124991, "epoch": 2975, "val_loss": 66408.875} {"train_loss": -6.695736885070801, "global_step": 124992, "epoch": 2976} {"train_loss": -6.574517726898193, "global_step": 124993, "epoch": 2976} {"train_loss": -6.637657642364502, "global_step": 124994, "epoch": 2976} {"train_loss": -6.652565002441406, "global_step": 124995, "epoch": 2976} {"train_loss": -6.580094337463379, "global_step": 124996, "epoch": 2976} {"train_loss": -6.722897529602051, "global_step": 124997, "epoch": 2976} {"train_loss": -6.759518623352051, "global_step": 124998, "epoch": 2976} {"train_loss": -6.699612617492676, "global_step": 124999, "epoch": 2976} {"train_loss": -6.670825004577637, "global_step": 125000, "epoch": 2976} {"train_loss": -6.691210746765137, "global_step": 125001, "epoch": 2976} {"train_loss": -6.719552993774414, "global_step": 125002, "epoch": 2976} {"train_loss": -6.650063514709473, "global_step": 125003, "epoch": 2976} {"train_loss": -6.6683759689331055, "global_step": 125004, "epoch": 2976} {"train_loss": -6.643904685974121, "global_step": 125005, "epoch": 2976} {"train_loss": -6.633735656738281, "global_step": 125006, "epoch": 2976} {"train_loss": -6.619132995605469, "global_step": 125007, "epoch": 2976} {"train_loss": -6.653182506561279, "global_step": 125008, "epoch": 2976} {"train_loss": -6.611435890197754, "global_step": 125009, "epoch": 2976} {"train_loss": -6.740856647491455, "global_step": 125010, "epoch": 2976} {"train_loss": -6.583377838134766, "global_step": 125011, "epoch": 2976} {"train_loss": -6.75667142868042, "global_step": 125012, "epoch": 2976} {"train_loss": -6.634618759155273, "global_step": 125013, "epoch": 2976} {"train_loss": -6.623802185058594, "global_step": 125014, "epoch": 2976} {"train_loss": -6.674181938171387, "global_step": 125015, "epoch": 2976} {"train_loss": -6.704296112060547, "global_step": 125016, "epoch": 2976} {"train_loss": -6.628916263580322, "global_step": 125017, "epoch": 2976} {"train_loss": -6.560734272003174, "global_step": 125018, "epoch": 2976} {"train_loss": -6.552689552307129, "global_step": 125019, "epoch": 2976} {"train_loss": -6.624274253845215, "global_step": 125020, "epoch": 2976} {"train_loss": -6.445305824279785, "global_step": 125021, "epoch": 2976} {"train_loss": -6.576739311218262, "global_step": 125022, "epoch": 2976} {"train_loss": -6.638818740844727, "global_step": 125023, "epoch": 2976} {"train_loss": -6.6706671714782715, "global_step": 125024, "epoch": 2976} {"train_loss": -6.645552635192871, "global_step": 125025, "epoch": 2976} {"train_loss": -6.681295871734619, "global_step": 125026, "epoch": 2976} {"train_loss": -6.6926703453063965, "global_step": 125027, "epoch": 2976} {"train_loss": -6.531485080718994, "global_step": 125028, "epoch": 2976} {"train_loss": -6.684653282165527, "global_step": 125029, "epoch": 2976} {"train_loss": -6.537920951843262, "global_step": 125030, "epoch": 2976} {"train_loss": -6.514850616455078, "global_step": 125031, "epoch": 2976} {"train_loss": -6.707399368286133, "global_step": 125032, "epoch": 2976} {"train_loss": -6.641373339153471, "global_step": 125033, "epoch": 2976, "val_loss": 66217.1484375} {"train_loss": -6.665341377258301, "global_step": 125034, "epoch": 2977} {"train_loss": -6.707132339477539, "global_step": 125035, "epoch": 2977} {"train_loss": -6.639248847961426, "global_step": 125036, "epoch": 2977} {"train_loss": -6.644086837768555, "global_step": 125037, "epoch": 2977} {"train_loss": -6.635461807250977, "global_step": 125038, "epoch": 2977} {"train_loss": -6.616245746612549, "global_step": 125039, "epoch": 2977} {"train_loss": -6.568818092346191, "global_step": 125040, "epoch": 2977} {"train_loss": -6.598881721496582, "global_step": 125041, "epoch": 2977} {"train_loss": -6.587952613830566, "global_step": 125042, "epoch": 2977} {"train_loss": -6.663839340209961, "global_step": 125043, "epoch": 2977} {"train_loss": -6.487144470214844, "global_step": 125044, "epoch": 2977} {"train_loss": -6.7499799728393555, "global_step": 125045, "epoch": 2977} {"train_loss": -6.6374969482421875, "global_step": 125046, "epoch": 2977} {"train_loss": -6.5842390060424805, "global_step": 125047, "epoch": 2977} {"train_loss": -6.617522239685059, "global_step": 125048, "epoch": 2977} {"train_loss": -6.6249494552612305, "global_step": 125049, "epoch": 2977} {"train_loss": -6.701622009277344, "global_step": 125050, "epoch": 2977} {"train_loss": -6.538394927978516, "global_step": 125051, "epoch": 2977} {"train_loss": -6.686429977416992, "global_step": 125052, "epoch": 2977} {"train_loss": -6.607961654663086, "global_step": 125053, "epoch": 2977} {"train_loss": -6.598901271820068, "global_step": 125054, "epoch": 2977} {"train_loss": -6.729199409484863, "global_step": 125055, "epoch": 2977} {"train_loss": -6.649125099182129, "global_step": 125056, "epoch": 2977} {"train_loss": -6.6596221923828125, "global_step": 125057, "epoch": 2977} {"train_loss": -6.586459159851074, "global_step": 125058, "epoch": 2977} {"train_loss": -6.576335430145264, "global_step": 125059, "epoch": 2977} {"train_loss": -6.6795148849487305, "global_step": 125060, "epoch": 2977} {"train_loss": -6.588418960571289, "global_step": 125061, "epoch": 2977} {"train_loss": -6.599141597747803, "global_step": 125062, "epoch": 2977} {"train_loss": -6.64866828918457, "global_step": 125063, "epoch": 2977} {"train_loss": -6.552789688110352, "global_step": 125064, "epoch": 2977} {"train_loss": -6.669940948486328, "global_step": 125065, "epoch": 2977} {"train_loss": -6.698799133300781, "global_step": 125066, "epoch": 2977} {"train_loss": -6.699170112609863, "global_step": 125067, "epoch": 2977} {"train_loss": -6.651164531707764, "global_step": 125068, "epoch": 2977} {"train_loss": -6.644115447998047, "global_step": 125069, "epoch": 2977} {"train_loss": -6.573972702026367, "global_step": 125070, "epoch": 2977} {"train_loss": -6.592409610748291, "global_step": 125071, "epoch": 2977} {"train_loss": -6.724661827087402, "global_step": 125072, "epoch": 2977} {"train_loss": -6.60955810546875, "global_step": 125073, "epoch": 2977} {"train_loss": -6.483722686767578, "global_step": 125074, "epoch": 2977} {"train_loss": -6.629766543706258, "global_step": 125075, "epoch": 2977, "val_loss": 66120.1796875} {"train_loss": -6.70074987411499, "global_step": 125076, "epoch": 2978} {"train_loss": -6.572446823120117, "global_step": 125077, "epoch": 2978} {"train_loss": -6.575366020202637, "global_step": 125078, "epoch": 2978} {"train_loss": -6.603245735168457, "global_step": 125079, "epoch": 2978} {"train_loss": -6.570969581604004, "global_step": 125080, "epoch": 2978} {"train_loss": -6.629696846008301, "global_step": 125081, "epoch": 2978} {"train_loss": -6.588520050048828, "global_step": 125082, "epoch": 2978} {"train_loss": -6.678502082824707, "global_step": 125083, "epoch": 2978} {"train_loss": -6.646481513977051, "global_step": 125084, "epoch": 2978} {"train_loss": -6.638079643249512, "global_step": 125085, "epoch": 2978} {"train_loss": -6.612425804138184, "global_step": 125086, "epoch": 2978} {"train_loss": -6.625072002410889, "global_step": 125087, "epoch": 2978} {"train_loss": -6.619498252868652, "global_step": 125088, "epoch": 2978} {"train_loss": -6.729585647583008, "global_step": 125089, "epoch": 2978} {"train_loss": -6.641319274902344, "global_step": 125090, "epoch": 2978} {"train_loss": -6.66331672668457, "global_step": 125091, "epoch": 2978} {"train_loss": -6.611289978027344, "global_step": 125092, "epoch": 2978} {"train_loss": -6.521971225738525, "global_step": 125093, "epoch": 2978} {"train_loss": -6.628838539123535, "global_step": 125094, "epoch": 2978} {"train_loss": -6.674822807312012, "global_step": 125095, "epoch": 2978} {"train_loss": -6.713437557220459, "global_step": 125096, "epoch": 2978} {"train_loss": -6.562170505523682, "global_step": 125097, "epoch": 2978} {"train_loss": -6.668990135192871, "global_step": 125098, "epoch": 2978} {"train_loss": -6.612560272216797, "global_step": 125099, "epoch": 2978} {"train_loss": -6.62337589263916, "global_step": 125100, "epoch": 2978} {"train_loss": -6.721963882446289, "global_step": 125101, "epoch": 2978} {"train_loss": -6.593646049499512, "global_step": 125102, "epoch": 2978} {"train_loss": -6.516976356506348, "global_step": 125103, "epoch": 2978} {"train_loss": -6.624633312225342, "global_step": 125104, "epoch": 2978} {"train_loss": -6.6584272384643555, "global_step": 125105, "epoch": 2978} {"train_loss": -6.633234977722168, "global_step": 125106, "epoch": 2978} {"train_loss": -6.615476131439209, "global_step": 125107, "epoch": 2978} {"train_loss": -6.588991165161133, "global_step": 125108, "epoch": 2978} {"train_loss": -6.704226970672607, "global_step": 125109, "epoch": 2978} {"train_loss": -6.751574993133545, "global_step": 125110, "epoch": 2978} {"train_loss": -6.665961742401123, "global_step": 125111, "epoch": 2978} {"train_loss": -6.599447727203369, "global_step": 125112, "epoch": 2978} {"train_loss": -6.635204315185547, "global_step": 125113, "epoch": 2978} {"train_loss": -6.499152183532715, "global_step": 125114, "epoch": 2978} {"train_loss": -6.772129058837891, "global_step": 125115, "epoch": 2978} {"train_loss": -6.721089839935303, "global_step": 125116, "epoch": 2978} {"train_loss": -6.632747502554031, "global_step": 125117, "epoch": 2978, "val_loss": 66131.625} {"train_loss": -6.5775227546691895, "global_step": 125118, "epoch": 2979} {"train_loss": -6.510186195373535, "global_step": 125119, "epoch": 2979} {"train_loss": -6.542757034301758, "global_step": 125120, "epoch": 2979} {"train_loss": -6.57005500793457, "global_step": 125121, "epoch": 2979} {"train_loss": -6.576064109802246, "global_step": 125122, "epoch": 2979} {"train_loss": -6.531977653503418, "global_step": 125123, "epoch": 2979} {"train_loss": -6.708075523376465, "global_step": 125124, "epoch": 2979} {"train_loss": -6.655022621154785, "global_step": 125125, "epoch": 2979} {"train_loss": -6.608035087585449, "global_step": 125126, "epoch": 2979} {"train_loss": -6.625940799713135, "global_step": 125127, "epoch": 2979} {"train_loss": -6.604985237121582, "global_step": 125128, "epoch": 2979} {"train_loss": -6.706033706665039, "global_step": 125129, "epoch": 2979} {"train_loss": -6.599360466003418, "global_step": 125130, "epoch": 2979} {"train_loss": -6.627635478973389, "global_step": 125131, "epoch": 2979} {"train_loss": -6.687234401702881, "global_step": 125132, "epoch": 2979} {"train_loss": -6.5972700119018555, "global_step": 125133, "epoch": 2979} {"train_loss": -6.728207588195801, "global_step": 125134, "epoch": 2979} {"train_loss": -6.725921630859375, "global_step": 125135, "epoch": 2979} {"train_loss": -6.630978584289551, "global_step": 125136, "epoch": 2979} {"train_loss": -6.688999176025391, "global_step": 125137, "epoch": 2979} {"train_loss": -6.650649070739746, "global_step": 125138, "epoch": 2979} {"train_loss": -6.6789422035217285, "global_step": 125139, "epoch": 2979} {"train_loss": -6.716319561004639, "global_step": 125140, "epoch": 2979} {"train_loss": -6.656184673309326, "global_step": 125141, "epoch": 2979} {"train_loss": -6.715142250061035, "global_step": 125142, "epoch": 2979} {"train_loss": -6.6506733894348145, "global_step": 125143, "epoch": 2979} {"train_loss": -6.615012168884277, "global_step": 125144, "epoch": 2979} {"train_loss": -6.715599536895752, "global_step": 125145, "epoch": 2979} {"train_loss": -6.735799312591553, "global_step": 125146, "epoch": 2979} {"train_loss": -6.686707019805908, "global_step": 125147, "epoch": 2979} {"train_loss": -6.666853904724121, "global_step": 125148, "epoch": 2979} {"train_loss": -6.7398681640625, "global_step": 125149, "epoch": 2979} {"train_loss": -6.533411026000977, "global_step": 125150, "epoch": 2979} {"train_loss": -6.692080020904541, "global_step": 125151, "epoch": 2979} {"train_loss": -6.69623327255249, "global_step": 125152, "epoch": 2979} {"train_loss": -6.644059181213379, "global_step": 125153, "epoch": 2979} {"train_loss": -6.544484615325928, "global_step": 125154, "epoch": 2979} {"train_loss": -6.5733232498168945, "global_step": 125155, "epoch": 2979} {"train_loss": -6.65013313293457, "global_step": 125156, "epoch": 2979} {"train_loss": -6.609043121337891, "global_step": 125157, "epoch": 2979} {"train_loss": -6.689557075500488, "global_step": 125158, "epoch": 2979} {"train_loss": -6.6445034231458395, "global_step": 125159, "epoch": 2979, "val_loss": 65812.0078125} {"train_loss": -6.61489725112915, "global_step": 125160, "epoch": 2980} {"train_loss": -6.6100754737854, "global_step": 125161, "epoch": 2980} {"train_loss": -6.576546669006348, "global_step": 125162, "epoch": 2980} {"train_loss": -6.765493392944336, "global_step": 125163, "epoch": 2980} {"train_loss": -6.527469635009766, "global_step": 125164, "epoch": 2980} {"train_loss": -6.634888648986816, "global_step": 125165, "epoch": 2980} {"train_loss": -6.669683456420898, "global_step": 125166, "epoch": 2980} {"train_loss": -6.583563804626465, "global_step": 125167, "epoch": 2980} {"train_loss": -6.628055572509766, "global_step": 125168, "epoch": 2980} {"train_loss": -6.720758438110352, "global_step": 125169, "epoch": 2980} {"train_loss": -6.630064487457275, "global_step": 125170, "epoch": 2980} {"train_loss": -6.567129135131836, "global_step": 125171, "epoch": 2980} {"train_loss": -6.602896690368652, "global_step": 125172, "epoch": 2980} {"train_loss": -6.645716667175293, "global_step": 125173, "epoch": 2980} {"train_loss": -6.575314521789551, "global_step": 125174, "epoch": 2980} {"train_loss": -6.567614555358887, "global_step": 125175, "epoch": 2980} {"train_loss": -6.806341171264648, "global_step": 125176, "epoch": 2980} {"train_loss": -6.642985820770264, "global_step": 125177, "epoch": 2980} {"train_loss": -6.776493072509766, "global_step": 125178, "epoch": 2980} {"train_loss": -6.584423065185547, "global_step": 125179, "epoch": 2980} {"train_loss": -6.7532806396484375, "global_step": 125180, "epoch": 2980} {"train_loss": -6.615024089813232, "global_step": 125181, "epoch": 2980} {"train_loss": -6.652945518493652, "global_step": 125182, "epoch": 2980} {"train_loss": -6.6732258796691895, "global_step": 125183, "epoch": 2980} {"train_loss": -6.609838485717773, "global_step": 125184, "epoch": 2980} {"train_loss": -6.712588310241699, "global_step": 125185, "epoch": 2980} {"train_loss": -6.632802963256836, "global_step": 125186, "epoch": 2980} {"train_loss": -6.6078901290893555, "global_step": 125187, "epoch": 2980} {"train_loss": -6.62926721572876, "global_step": 125188, "epoch": 2980} {"train_loss": -6.573296070098877, "global_step": 125189, "epoch": 2980} {"train_loss": -6.799875259399414, "global_step": 125190, "epoch": 2980} {"train_loss": -6.620739459991455, "global_step": 125191, "epoch": 2980} {"train_loss": -6.570339202880859, "global_step": 125192, "epoch": 2980} {"train_loss": -6.445435523986816, "global_step": 125193, "epoch": 2980} {"train_loss": -6.549272537231445, "global_step": 125194, "epoch": 2980} {"train_loss": -6.671306610107422, "global_step": 125195, "epoch": 2980} {"train_loss": -6.4310808181762695, "global_step": 125196, "epoch": 2980} {"train_loss": -6.505716800689697, "global_step": 125197, "epoch": 2980} {"train_loss": -6.518415451049805, "global_step": 125198, "epoch": 2980} {"train_loss": -6.495713710784912, "global_step": 125199, "epoch": 2980} {"train_loss": -6.543736457824707, "global_step": 125200, "epoch": 2980} {"train_loss": -6.61721244312468, "global_step": 125201, "epoch": 2980, "val_loss": 66094.671875} {"train_loss": -6.533425331115723, "global_step": 125202, "epoch": 2981} {"train_loss": -6.470295429229736, "global_step": 125203, "epoch": 2981} {"train_loss": -6.561800956726074, "global_step": 125204, "epoch": 2981} {"train_loss": -6.665844917297363, "global_step": 125205, "epoch": 2981} {"train_loss": -6.596808910369873, "global_step": 125206, "epoch": 2981} {"train_loss": -6.633192539215088, "global_step": 125207, "epoch": 2981} {"train_loss": -6.50977897644043, "global_step": 125208, "epoch": 2981} {"train_loss": -6.575841426849365, "global_step": 125209, "epoch": 2981} {"train_loss": -6.592703819274902, "global_step": 125210, "epoch": 2981} {"train_loss": -6.504804611206055, "global_step": 125211, "epoch": 2981} {"train_loss": -6.564654350280762, "global_step": 125212, "epoch": 2981} {"train_loss": -6.653602600097656, "global_step": 125213, "epoch": 2981} {"train_loss": -6.565310001373291, "global_step": 125214, "epoch": 2981} {"train_loss": -6.640970230102539, "global_step": 125215, "epoch": 2981} {"train_loss": -6.709886074066162, "global_step": 125216, "epoch": 2981} {"train_loss": -6.545262813568115, "global_step": 125217, "epoch": 2981} {"train_loss": -6.667753219604492, "global_step": 125218, "epoch": 2981} {"train_loss": -6.595957279205322, "global_step": 125219, "epoch": 2981} {"train_loss": -6.565372467041016, "global_step": 125220, "epoch": 2981} {"train_loss": -6.682302951812744, "global_step": 125221, "epoch": 2981} {"train_loss": -6.470301628112793, "global_step": 125222, "epoch": 2981} {"train_loss": -6.508693695068359, "global_step": 125223, "epoch": 2981} {"train_loss": -6.704959869384766, "global_step": 125224, "epoch": 2981} {"train_loss": -6.537106513977051, "global_step": 125225, "epoch": 2981} {"train_loss": -6.607126235961914, "global_step": 125226, "epoch": 2981} {"train_loss": -6.553393363952637, "global_step": 125227, "epoch": 2981} {"train_loss": -6.539400100708008, "global_step": 125228, "epoch": 2981} {"train_loss": -6.694155693054199, "global_step": 125229, "epoch": 2981} {"train_loss": -6.493060111999512, "global_step": 125230, "epoch": 2981} {"train_loss": -6.624915599822998, "global_step": 125231, "epoch": 2981} {"train_loss": -6.701051712036133, "global_step": 125232, "epoch": 2981} {"train_loss": -6.577199459075928, "global_step": 125233, "epoch": 2981} {"train_loss": -6.6438069343566895, "global_step": 125234, "epoch": 2981} {"train_loss": -6.56017541885376, "global_step": 125235, "epoch": 2981} {"train_loss": -6.574980735778809, "global_step": 125236, "epoch": 2981} {"train_loss": -6.645846366882324, "global_step": 125237, "epoch": 2981} {"train_loss": -6.582414150238037, "global_step": 125238, "epoch": 2981} {"train_loss": -6.622905731201172, "global_step": 125239, "epoch": 2981} {"train_loss": -6.685091018676758, "global_step": 125240, "epoch": 2981} {"train_loss": -6.462829113006592, "global_step": 125241, "epoch": 2981} {"train_loss": -6.535746097564697, "global_step": 125242, "epoch": 2981} {"train_loss": -6.589569875172207, "global_step": 125243, "epoch": 2981, "val_loss": 66106.78125} {"train_loss": -6.589767932891846, "global_step": 125244, "epoch": 2982} {"train_loss": -6.560996055603027, "global_step": 125245, "epoch": 2982} {"train_loss": -6.574504852294922, "global_step": 125246, "epoch": 2982} {"train_loss": -6.6864447593688965, "global_step": 125247, "epoch": 2982} {"train_loss": -6.634642124176025, "global_step": 125248, "epoch": 2982} {"train_loss": -6.621181964874268, "global_step": 125249, "epoch": 2982} {"train_loss": -6.757904052734375, "global_step": 125250, "epoch": 2982} {"train_loss": -6.616304397583008, "global_step": 125251, "epoch": 2982} {"train_loss": -6.680080890655518, "global_step": 125252, "epoch": 2982} {"train_loss": -6.667915344238281, "global_step": 125253, "epoch": 2982} {"train_loss": -6.707086086273193, "global_step": 125254, "epoch": 2982} {"train_loss": -6.667437553405762, "global_step": 125255, "epoch": 2982} {"train_loss": -6.537809371948242, "global_step": 125256, "epoch": 2982} {"train_loss": -6.5146026611328125, "global_step": 125257, "epoch": 2982} {"train_loss": -6.524877548217773, "global_step": 125258, "epoch": 2982} {"train_loss": -6.577319145202637, "global_step": 125259, "epoch": 2982} {"train_loss": -6.580072402954102, "global_step": 125260, "epoch": 2982} {"train_loss": -6.596155643463135, "global_step": 125261, "epoch": 2982} {"train_loss": -6.555997371673584, "global_step": 125262, "epoch": 2982} {"train_loss": -6.5771074295043945, "global_step": 125263, "epoch": 2982} {"train_loss": -6.576722145080566, "global_step": 125264, "epoch": 2982} {"train_loss": -6.57250452041626, "global_step": 125265, "epoch": 2982} {"train_loss": -6.6466875076293945, "global_step": 125266, "epoch": 2982} {"train_loss": -6.53199577331543, "global_step": 125267, "epoch": 2982} {"train_loss": -6.663397789001465, "global_step": 125268, "epoch": 2982} {"train_loss": -6.54812479019165, "global_step": 125269, "epoch": 2982} {"train_loss": -6.75742769241333, "global_step": 125270, "epoch": 2982} {"train_loss": -6.642950057983398, "global_step": 125271, "epoch": 2982} {"train_loss": -6.532278060913086, "global_step": 125272, "epoch": 2982} {"train_loss": -6.524035453796387, "global_step": 125273, "epoch": 2982} {"train_loss": -6.6587419509887695, "global_step": 125274, "epoch": 2982} {"train_loss": -6.621942043304443, "global_step": 125275, "epoch": 2982} {"train_loss": -6.681238174438477, "global_step": 125276, "epoch": 2982} {"train_loss": -6.5524749755859375, "global_step": 125277, "epoch": 2982} {"train_loss": -6.608201503753662, "global_step": 125278, "epoch": 2982} {"train_loss": -6.5714850425720215, "global_step": 125279, "epoch": 2982} {"train_loss": -6.61651611328125, "global_step": 125280, "epoch": 2982} {"train_loss": -6.579797744750977, "global_step": 125281, "epoch": 2982} {"train_loss": -6.591829299926758, "global_step": 125282, "epoch": 2982} {"train_loss": -6.519689559936523, "global_step": 125283, "epoch": 2982} {"train_loss": -6.597459316253662, "global_step": 125284, "epoch": 2982} {"train_loss": -6.6076009046463735, "global_step": 125285, "epoch": 2982, "val_loss": 66243.265625} {"train_loss": -6.6492815017700195, "global_step": 125286, "epoch": 2983} {"train_loss": -6.750261306762695, "global_step": 125287, "epoch": 2983} {"train_loss": -6.533083915710449, "global_step": 125288, "epoch": 2983} {"train_loss": -6.688968658447266, "global_step": 125289, "epoch": 2983} {"train_loss": -6.625742435455322, "global_step": 125290, "epoch": 2983} {"train_loss": -6.583200931549072, "global_step": 125291, "epoch": 2983} {"train_loss": -6.609784126281738, "global_step": 125292, "epoch": 2983} {"train_loss": -6.593287467956543, "global_step": 125293, "epoch": 2983} {"train_loss": -6.747705459594727, "global_step": 125294, "epoch": 2983} {"train_loss": -6.6804728507995605, "global_step": 125295, "epoch": 2983} {"train_loss": -6.649304389953613, "global_step": 125296, "epoch": 2983} {"train_loss": -6.619099140167236, "global_step": 125297, "epoch": 2983} {"train_loss": -6.790779113769531, "global_step": 125298, "epoch": 2983} {"train_loss": -6.693404674530029, "global_step": 125299, "epoch": 2983} {"train_loss": -6.634198188781738, "global_step": 125300, "epoch": 2983} {"train_loss": -6.638943195343018, "global_step": 125301, "epoch": 2983} {"train_loss": -6.763197422027588, "global_step": 125302, "epoch": 2983} {"train_loss": -6.644427299499512, "global_step": 125303, "epoch": 2983} {"train_loss": -6.627579689025879, "global_step": 125304, "epoch": 2983} {"train_loss": -6.6614603996276855, "global_step": 125305, "epoch": 2983} {"train_loss": -6.575467109680176, "global_step": 125306, "epoch": 2983} {"train_loss": -6.594733238220215, "global_step": 125307, "epoch": 2983} {"train_loss": -6.592347145080566, "global_step": 125308, "epoch": 2983} {"train_loss": -6.627627372741699, "global_step": 125309, "epoch": 2983} {"train_loss": -6.665617942810059, "global_step": 125310, "epoch": 2983} {"train_loss": -6.700444221496582, "global_step": 125311, "epoch": 2983} {"train_loss": -6.501543998718262, "global_step": 125312, "epoch": 2983} {"train_loss": -6.731040954589844, "global_step": 125313, "epoch": 2983} {"train_loss": -6.661934852600098, "global_step": 125314, "epoch": 2983} {"train_loss": -6.697772026062012, "global_step": 125315, "epoch": 2983} {"train_loss": -6.601578235626221, "global_step": 125316, "epoch": 2983} {"train_loss": -6.5047197341918945, "global_step": 125317, "epoch": 2983} {"train_loss": -6.501572608947754, "global_step": 125318, "epoch": 2983} {"train_loss": -6.6566362380981445, "global_step": 125319, "epoch": 2983} {"train_loss": -6.530796051025391, "global_step": 125320, "epoch": 2983} {"train_loss": -6.623847007751465, "global_step": 125321, "epoch": 2983} {"train_loss": -6.651581764221191, "global_step": 125322, "epoch": 2983} {"train_loss": -6.658411502838135, "global_step": 125323, "epoch": 2983} {"train_loss": -6.633697509765625, "global_step": 125324, "epoch": 2983} {"train_loss": -6.719352722167969, "global_step": 125325, "epoch": 2983} {"train_loss": -6.597411155700684, "global_step": 125326, "epoch": 2983} {"train_loss": -6.640279224940708, "global_step": 125327, "epoch": 2983, "val_loss": 66277.1875} {"train_loss": -6.628866672515869, "global_step": 125328, "epoch": 2984} {"train_loss": -6.5844926834106445, "global_step": 125329, "epoch": 2984} {"train_loss": -6.736611366271973, "global_step": 125330, "epoch": 2984} {"train_loss": -6.610731601715088, "global_step": 125331, "epoch": 2984} {"train_loss": -6.651442050933838, "global_step": 125332, "epoch": 2984} {"train_loss": -6.5895185470581055, "global_step": 125333, "epoch": 2984} {"train_loss": -6.629331588745117, "global_step": 125334, "epoch": 2984} {"train_loss": -6.6494317054748535, "global_step": 125335, "epoch": 2984} {"train_loss": -6.713699817657471, "global_step": 125336, "epoch": 2984} {"train_loss": -6.661952972412109, "global_step": 125337, "epoch": 2984} {"train_loss": -6.566758632659912, "global_step": 125338, "epoch": 2984} {"train_loss": -6.56850004196167, "global_step": 125339, "epoch": 2984} {"train_loss": -6.551643371582031, "global_step": 125340, "epoch": 2984} {"train_loss": -6.58742618560791, "global_step": 125341, "epoch": 2984} {"train_loss": -6.678990364074707, "global_step": 125342, "epoch": 2984} {"train_loss": -6.553811550140381, "global_step": 125343, "epoch": 2984} {"train_loss": -6.640839576721191, "global_step": 125344, "epoch": 2984} {"train_loss": -6.551171779632568, "global_step": 125345, "epoch": 2984} {"train_loss": -6.562198638916016, "global_step": 125346, "epoch": 2984} {"train_loss": -6.640542030334473, "global_step": 125347, "epoch": 2984} {"train_loss": -6.486474990844727, "global_step": 125348, "epoch": 2984} {"train_loss": -6.597324371337891, "global_step": 125349, "epoch": 2984} {"train_loss": -6.567219257354736, "global_step": 125350, "epoch": 2984} {"train_loss": -6.549694061279297, "global_step": 125351, "epoch": 2984} {"train_loss": -6.55957555770874, "global_step": 125352, "epoch": 2984} {"train_loss": -6.6267194747924805, "global_step": 125353, "epoch": 2984} {"train_loss": -6.507424831390381, "global_step": 125354, "epoch": 2984} {"train_loss": -6.597054481506348, "global_step": 125355, "epoch": 2984} {"train_loss": -6.548885822296143, "global_step": 125356, "epoch": 2984} {"train_loss": -6.547847747802734, "global_step": 125357, "epoch": 2984} {"train_loss": -6.6460795402526855, "global_step": 125358, "epoch": 2984} {"train_loss": -6.62479305267334, "global_step": 125359, "epoch": 2984} {"train_loss": -6.509126663208008, "global_step": 125360, "epoch": 2984} {"train_loss": -6.634219169616699, "global_step": 125361, "epoch": 2984} {"train_loss": -6.54937219619751, "global_step": 125362, "epoch": 2984} {"train_loss": -6.629617214202881, "global_step": 125363, "epoch": 2984} {"train_loss": -6.543091773986816, "global_step": 125364, "epoch": 2984} {"train_loss": -6.564389228820801, "global_step": 125365, "epoch": 2984} {"train_loss": -6.59080171585083, "global_step": 125366, "epoch": 2984} {"train_loss": -6.509701251983643, "global_step": 125367, "epoch": 2984} {"train_loss": -6.393141746520996, "global_step": 125368, "epoch": 2984} {"train_loss": -6.5872525828225275, "global_step": 125369, "epoch": 2984, "val_loss": 66176.109375} {"train_loss": -6.471943378448486, "global_step": 125370, "epoch": 2985} {"train_loss": -6.467895984649658, "global_step": 125371, "epoch": 2985} {"train_loss": -6.510364532470703, "global_step": 125372, "epoch": 2985} {"train_loss": -6.4885149002075195, "global_step": 125373, "epoch": 2985} {"train_loss": -6.5511884689331055, "global_step": 125374, "epoch": 2985} {"train_loss": -6.464587211608887, "global_step": 125375, "epoch": 2985} {"train_loss": -6.610430717468262, "global_step": 125376, "epoch": 2985} {"train_loss": -6.489416122436523, "global_step": 125377, "epoch": 2985} {"train_loss": -6.543948173522949, "global_step": 125378, "epoch": 2985} {"train_loss": -6.550925254821777, "global_step": 125379, "epoch": 2985} {"train_loss": -6.563148498535156, "global_step": 125380, "epoch": 2985} {"train_loss": -6.58473014831543, "global_step": 125381, "epoch": 2985} {"train_loss": -6.572866439819336, "global_step": 125382, "epoch": 2985} {"train_loss": -6.54960823059082, "global_step": 125383, "epoch": 2985} {"train_loss": -6.506664276123047, "global_step": 125384, "epoch": 2985} {"train_loss": -6.544612884521484, "global_step": 125385, "epoch": 2985} {"train_loss": -6.516663074493408, "global_step": 125386, "epoch": 2985} {"train_loss": -6.642045974731445, "global_step": 125387, "epoch": 2985} {"train_loss": -6.573851585388184, "global_step": 125388, "epoch": 2985} {"train_loss": -6.503125190734863, "global_step": 125389, "epoch": 2985} {"train_loss": -6.6678619384765625, "global_step": 125390, "epoch": 2985} {"train_loss": -6.492845058441162, "global_step": 125391, "epoch": 2985} {"train_loss": -6.5385894775390625, "global_step": 125392, "epoch": 2985} {"train_loss": -6.679457664489746, "global_step": 125393, "epoch": 2985} {"train_loss": -6.556579113006592, "global_step": 125394, "epoch": 2985} {"train_loss": -6.661996364593506, "global_step": 125395, "epoch": 2985} {"train_loss": -6.594109058380127, "global_step": 125396, "epoch": 2985} {"train_loss": -6.593912124633789, "global_step": 125397, "epoch": 2985} {"train_loss": -6.5738420486450195, "global_step": 125398, "epoch": 2985} {"train_loss": -6.578947067260742, "global_step": 125399, "epoch": 2985} {"train_loss": -6.679475784301758, "global_step": 125400, "epoch": 2985} {"train_loss": -6.637206077575684, "global_step": 125401, "epoch": 2985} {"train_loss": -6.632865905761719, "global_step": 125402, "epoch": 2985} {"train_loss": -6.670697212219238, "global_step": 125403, "epoch": 2985} {"train_loss": -6.6228508949279785, "global_step": 125404, "epoch": 2985} {"train_loss": -6.752903938293457, "global_step": 125405, "epoch": 2985} {"train_loss": -6.665733814239502, "global_step": 125406, "epoch": 2985} {"train_loss": -6.649903297424316, "global_step": 125407, "epoch": 2985} {"train_loss": -6.639159679412842, "global_step": 125408, "epoch": 2985} {"train_loss": -6.724410057067871, "global_step": 125409, "epoch": 2985} {"train_loss": -6.661153793334961, "global_step": 125410, "epoch": 2985} {"train_loss": -6.588560093016851, "global_step": 125411, "epoch": 2985, "val_loss": 66190.140625} {"train_loss": -6.730288505554199, "global_step": 125412, "epoch": 2986} {"train_loss": -6.662201881408691, "global_step": 125413, "epoch": 2986} {"train_loss": -6.658256530761719, "global_step": 125414, "epoch": 2986} {"train_loss": -6.6313700675964355, "global_step": 125415, "epoch": 2986} {"train_loss": -6.733146667480469, "global_step": 125416, "epoch": 2986} {"train_loss": -6.580217361450195, "global_step": 125417, "epoch": 2986} {"train_loss": -6.685696601867676, "global_step": 125418, "epoch": 2986} {"train_loss": -6.633638381958008, "global_step": 125419, "epoch": 2986} {"train_loss": -6.582892417907715, "global_step": 125420, "epoch": 2986} {"train_loss": -6.615382671356201, "global_step": 125421, "epoch": 2986} {"train_loss": -6.594870567321777, "global_step": 125422, "epoch": 2986} {"train_loss": -6.717879772186279, "global_step": 125423, "epoch": 2986} {"train_loss": -6.7227301597595215, "global_step": 125424, "epoch": 2986} {"train_loss": -6.744109153747559, "global_step": 125425, "epoch": 2986} {"train_loss": -6.770026206970215, "global_step": 125426, "epoch": 2986} {"train_loss": -6.693445205688477, "global_step": 125427, "epoch": 2986} {"train_loss": -6.757281303405762, "global_step": 125428, "epoch": 2986} {"train_loss": -6.65296745300293, "global_step": 125429, "epoch": 2986} {"train_loss": -6.63252592086792, "global_step": 125430, "epoch": 2986} {"train_loss": -6.618121147155762, "global_step": 125431, "epoch": 2986} {"train_loss": -6.690526485443115, "global_step": 125432, "epoch": 2986} {"train_loss": -6.694622039794922, "global_step": 125433, "epoch": 2986} {"train_loss": -6.592538356781006, "global_step": 125434, "epoch": 2986} {"train_loss": -6.741251468658447, "global_step": 125435, "epoch": 2986} {"train_loss": -6.626657962799072, "global_step": 125436, "epoch": 2986} {"train_loss": -6.590068817138672, "global_step": 125437, "epoch": 2986} {"train_loss": -6.623226165771484, "global_step": 125438, "epoch": 2986} {"train_loss": -6.700999736785889, "global_step": 125439, "epoch": 2986} {"train_loss": -6.7620930671691895, "global_step": 125440, "epoch": 2986} {"train_loss": -6.640023231506348, "global_step": 125441, "epoch": 2986} {"train_loss": -6.63629150390625, "global_step": 125442, "epoch": 2986} {"train_loss": -6.770379066467285, "global_step": 125443, "epoch": 2986} {"train_loss": -6.748024940490723, "global_step": 125444, "epoch": 2986} {"train_loss": -6.629673480987549, "global_step": 125445, "epoch": 2986} {"train_loss": -6.684823513031006, "global_step": 125446, "epoch": 2986} {"train_loss": -6.7691144943237305, "global_step": 125447, "epoch": 2986} {"train_loss": -6.684004783630371, "global_step": 125448, "epoch": 2986} {"train_loss": -6.648675441741943, "global_step": 125449, "epoch": 2986} {"train_loss": -6.731753826141357, "global_step": 125450, "epoch": 2986} {"train_loss": -6.651184558868408, "global_step": 125451, "epoch": 2986} {"train_loss": -6.697494983673096, "global_step": 125452, "epoch": 2986} {"train_loss": -6.675019775118146, "global_step": 125453, "epoch": 2986, "val_loss": 66020.3359375} {"train_loss": -6.66455078125, "global_step": 125454, "epoch": 2987} {"train_loss": -6.729848384857178, "global_step": 125455, "epoch": 2987} {"train_loss": -6.58143424987793, "global_step": 125456, "epoch": 2987} {"train_loss": -6.6617889404296875, "global_step": 125457, "epoch": 2987} {"train_loss": -6.679649829864502, "global_step": 125458, "epoch": 2987} {"train_loss": -6.685546398162842, "global_step": 125459, "epoch": 2987} {"train_loss": -6.601613998413086, "global_step": 125460, "epoch": 2987} {"train_loss": -6.643087387084961, "global_step": 125461, "epoch": 2987} {"train_loss": -6.707574844360352, "global_step": 125462, "epoch": 2987} {"train_loss": -6.685412883758545, "global_step": 125463, "epoch": 2987} {"train_loss": -6.616040229797363, "global_step": 125464, "epoch": 2987} {"train_loss": -6.6194963455200195, "global_step": 125465, "epoch": 2987} {"train_loss": -6.468091011047363, "global_step": 125466, "epoch": 2987} {"train_loss": -6.625676155090332, "global_step": 125467, "epoch": 2987} {"train_loss": -6.74531364440918, "global_step": 125468, "epoch": 2987} {"train_loss": -6.654756546020508, "global_step": 125469, "epoch": 2987} {"train_loss": -6.493362903594971, "global_step": 125470, "epoch": 2987} {"train_loss": -6.722746849060059, "global_step": 125471, "epoch": 2987} {"train_loss": -6.777925491333008, "global_step": 125472, "epoch": 2987} {"train_loss": -6.569058418273926, "global_step": 125473, "epoch": 2987} {"train_loss": -6.646709442138672, "global_step": 125474, "epoch": 2987} {"train_loss": -6.66071891784668, "global_step": 125475, "epoch": 2987} {"train_loss": -6.74381685256958, "global_step": 125476, "epoch": 2987} {"train_loss": -6.637639045715332, "global_step": 125477, "epoch": 2987} {"train_loss": -6.601491928100586, "global_step": 125478, "epoch": 2987} {"train_loss": -6.68068790435791, "global_step": 125479, "epoch": 2987} {"train_loss": -6.697043418884277, "global_step": 125480, "epoch": 2987} {"train_loss": -6.634542465209961, "global_step": 125481, "epoch": 2987} {"train_loss": -6.652616500854492, "global_step": 125482, "epoch": 2987} {"train_loss": -6.819301605224609, "global_step": 125483, "epoch": 2987} {"train_loss": -6.636319160461426, "global_step": 125484, "epoch": 2987} {"train_loss": -6.567937850952148, "global_step": 125485, "epoch": 2987} {"train_loss": -6.713683128356934, "global_step": 125486, "epoch": 2987} {"train_loss": -6.647778511047363, "global_step": 125487, "epoch": 2987} {"train_loss": -6.635716915130615, "global_step": 125488, "epoch": 2987} {"train_loss": -6.649055480957031, "global_step": 125489, "epoch": 2987} {"train_loss": -6.678637504577637, "global_step": 125490, "epoch": 2987} {"train_loss": -6.555971145629883, "global_step": 125491, "epoch": 2987} {"train_loss": -6.576876640319824, "global_step": 125492, "epoch": 2987} {"train_loss": -6.566153049468994, "global_step": 125493, "epoch": 2987} {"train_loss": -6.592590808868408, "global_step": 125494, "epoch": 2987} {"train_loss": -6.645255032039824, "global_step": 125495, "epoch": 2987, "val_loss": 66475.3984375} {"train_loss": -6.593382835388184, "global_step": 125496, "epoch": 2988} {"train_loss": -6.698183059692383, "global_step": 125497, "epoch": 2988} {"train_loss": -6.602158546447754, "global_step": 125498, "epoch": 2988} {"train_loss": -6.603762626647949, "global_step": 125499, "epoch": 2988} {"train_loss": -6.58011531829834, "global_step": 125500, "epoch": 2988} {"train_loss": -6.525965213775635, "global_step": 125501, "epoch": 2988} {"train_loss": -6.718950271606445, "global_step": 125502, "epoch": 2988} {"train_loss": -6.617532253265381, "global_step": 125503, "epoch": 2988} {"train_loss": -6.607388019561768, "global_step": 125504, "epoch": 2988} {"train_loss": -6.7423810958862305, "global_step": 125505, "epoch": 2988} {"train_loss": -6.625481605529785, "global_step": 125506, "epoch": 2988} {"train_loss": -6.566080570220947, "global_step": 125507, "epoch": 2988} {"train_loss": -6.549399375915527, "global_step": 125508, "epoch": 2988} {"train_loss": -6.604472637176514, "global_step": 125509, "epoch": 2988} {"train_loss": -6.684965133666992, "global_step": 125510, "epoch": 2988} {"train_loss": -6.647805213928223, "global_step": 125511, "epoch": 2988} {"train_loss": -6.669965744018555, "global_step": 125512, "epoch": 2988} {"train_loss": -6.559770107269287, "global_step": 125513, "epoch": 2988} {"train_loss": -6.56658935546875, "global_step": 125514, "epoch": 2988} {"train_loss": -6.604776382446289, "global_step": 125515, "epoch": 2988} {"train_loss": -6.599623680114746, "global_step": 125516, "epoch": 2988} {"train_loss": -6.704715728759766, "global_step": 125517, "epoch": 2988} {"train_loss": -6.641470909118652, "global_step": 125518, "epoch": 2988} {"train_loss": -6.650844573974609, "global_step": 125519, "epoch": 2988} {"train_loss": -6.7594780921936035, "global_step": 125520, "epoch": 2988} {"train_loss": -6.708537578582764, "global_step": 125521, "epoch": 2988} {"train_loss": -6.564491271972656, "global_step": 125522, "epoch": 2988} {"train_loss": -6.632720470428467, "global_step": 125523, "epoch": 2988} {"train_loss": -6.653194427490234, "global_step": 125524, "epoch": 2988} {"train_loss": -6.68099308013916, "global_step": 125525, "epoch": 2988} {"train_loss": -6.701849937438965, "global_step": 125526, "epoch": 2988} {"train_loss": -6.745271682739258, "global_step": 125527, "epoch": 2988} {"train_loss": -6.708730220794678, "global_step": 125528, "epoch": 2988} {"train_loss": -6.615733623504639, "global_step": 125529, "epoch": 2988} {"train_loss": -6.670454978942871, "global_step": 125530, "epoch": 2988} {"train_loss": -6.637956619262695, "global_step": 125531, "epoch": 2988} {"train_loss": -6.714468002319336, "global_step": 125532, "epoch": 2988} {"train_loss": -6.560002326965332, "global_step": 125533, "epoch": 2988} {"train_loss": -6.441900253295898, "global_step": 125534, "epoch": 2988} {"train_loss": -6.636721611022949, "global_step": 125535, "epoch": 2988} {"train_loss": -6.469615459442139, "global_step": 125536, "epoch": 2988} {"train_loss": -6.630814506894066, "global_step": 125537, "epoch": 2988, "val_loss": 66224.1015625} {"train_loss": -6.595416069030762, "global_step": 125538, "epoch": 2989} {"train_loss": -6.434607982635498, "global_step": 125539, "epoch": 2989} {"train_loss": -6.6131415367126465, "global_step": 125540, "epoch": 2989} {"train_loss": -6.539561748504639, "global_step": 125541, "epoch": 2989} {"train_loss": -6.616059303283691, "global_step": 125542, "epoch": 2989} {"train_loss": -6.57780122756958, "global_step": 125543, "epoch": 2989} {"train_loss": -6.6157426834106445, "global_step": 125544, "epoch": 2989} {"train_loss": -6.708181381225586, "global_step": 125545, "epoch": 2989} {"train_loss": -6.5719146728515625, "global_step": 125546, "epoch": 2989} {"train_loss": -6.763612747192383, "global_step": 125547, "epoch": 2989} {"train_loss": -6.745265960693359, "global_step": 125548, "epoch": 2989} {"train_loss": -6.567477226257324, "global_step": 125549, "epoch": 2989} {"train_loss": -6.537851810455322, "global_step": 125550, "epoch": 2989} {"train_loss": -6.432125091552734, "global_step": 125551, "epoch": 2989} {"train_loss": -6.605253219604492, "global_step": 125552, "epoch": 2989} {"train_loss": -6.582408905029297, "global_step": 125553, "epoch": 2989} {"train_loss": -6.562702655792236, "global_step": 125554, "epoch": 2989} {"train_loss": -6.5969977378845215, "global_step": 125555, "epoch": 2989} {"train_loss": -6.71817684173584, "global_step": 125556, "epoch": 2989} {"train_loss": -6.673177719116211, "global_step": 125557, "epoch": 2989} {"train_loss": -6.483631134033203, "global_step": 125558, "epoch": 2989} {"train_loss": -6.6630859375, "global_step": 125559, "epoch": 2989} {"train_loss": -6.549138069152832, "global_step": 125560, "epoch": 2989} {"train_loss": -6.493017673492432, "global_step": 125561, "epoch": 2989} {"train_loss": -6.616994857788086, "global_step": 125562, "epoch": 2989} {"train_loss": -6.611852169036865, "global_step": 125563, "epoch": 2989} {"train_loss": -6.473085880279541, "global_step": 125564, "epoch": 2989} {"train_loss": -6.646264553070068, "global_step": 125565, "epoch": 2989} {"train_loss": -6.419713973999023, "global_step": 125566, "epoch": 2989} {"train_loss": -6.681906700134277, "global_step": 125567, "epoch": 2989} {"train_loss": -6.752469062805176, "global_step": 125568, "epoch": 2989} {"train_loss": -6.414674282073975, "global_step": 125569, "epoch": 2989} {"train_loss": -6.675362586975098, "global_step": 125570, "epoch": 2989} {"train_loss": -6.571521759033203, "global_step": 125571, "epoch": 2989} {"train_loss": -6.629435062408447, "global_step": 125572, "epoch": 2989} {"train_loss": -6.634620666503906, "global_step": 125573, "epoch": 2989} {"train_loss": -6.725964546203613, "global_step": 125574, "epoch": 2989} {"train_loss": -6.510628700256348, "global_step": 125575, "epoch": 2989} {"train_loss": -6.547117710113525, "global_step": 125576, "epoch": 2989} {"train_loss": -6.586739540100098, "global_step": 125577, "epoch": 2989} {"train_loss": -6.625426769256592, "global_step": 125578, "epoch": 2989} {"train_loss": -6.59329282669794, "global_step": 125579, "epoch": 2989, "val_loss": 66204.4453125} {"train_loss": -6.644824028015137, "global_step": 125580, "epoch": 2990} {"train_loss": -6.707898139953613, "global_step": 125581, "epoch": 2990} {"train_loss": -6.747636795043945, "global_step": 125582, "epoch": 2990} {"train_loss": -6.648106575012207, "global_step": 125583, "epoch": 2990} {"train_loss": -6.578263759613037, "global_step": 125584, "epoch": 2990} {"train_loss": -6.575491428375244, "global_step": 125585, "epoch": 2990} {"train_loss": -6.613330841064453, "global_step": 125586, "epoch": 2990} {"train_loss": -6.6529130935668945, "global_step": 125587, "epoch": 2990} {"train_loss": -6.518771171569824, "global_step": 125588, "epoch": 2990} {"train_loss": -6.651053428649902, "global_step": 125589, "epoch": 2990} {"train_loss": -6.693094253540039, "global_step": 125590, "epoch": 2990} {"train_loss": -6.439294815063477, "global_step": 125591, "epoch": 2990} {"train_loss": -6.455110549926758, "global_step": 125592, "epoch": 2990} {"train_loss": -6.580819606781006, "global_step": 125593, "epoch": 2990} {"train_loss": -6.480587005615234, "global_step": 125594, "epoch": 2990} {"train_loss": -6.5710906982421875, "global_step": 125595, "epoch": 2990} {"train_loss": -6.570263862609863, "global_step": 125596, "epoch": 2990} {"train_loss": -6.4936652183532715, "global_step": 125597, "epoch": 2990} {"train_loss": -6.535942077636719, "global_step": 125598, "epoch": 2990} {"train_loss": -6.525965690612793, "global_step": 125599, "epoch": 2990} {"train_loss": -6.628561019897461, "global_step": 125600, "epoch": 2990} {"train_loss": -6.51963472366333, "global_step": 125601, "epoch": 2990} {"train_loss": -6.61280632019043, "global_step": 125602, "epoch": 2990} {"train_loss": -6.6602983474731445, "global_step": 125603, "epoch": 2990} {"train_loss": -6.536022186279297, "global_step": 125604, "epoch": 2990} {"train_loss": -6.577579498291016, "global_step": 125605, "epoch": 2990} {"train_loss": -6.566986083984375, "global_step": 125606, "epoch": 2990} {"train_loss": -6.515751838684082, "global_step": 125607, "epoch": 2990} {"train_loss": -6.666118621826172, "global_step": 125608, "epoch": 2990} {"train_loss": -6.579771518707275, "global_step": 125609, "epoch": 2990} {"train_loss": -6.619791507720947, "global_step": 125610, "epoch": 2990} {"train_loss": -6.58523416519165, "global_step": 125611, "epoch": 2990} {"train_loss": -6.5549211502075195, "global_step": 125612, "epoch": 2990} {"train_loss": -6.580402374267578, "global_step": 125613, "epoch": 2990} {"train_loss": -6.595486640930176, "global_step": 125614, "epoch": 2990} {"train_loss": -6.682607173919678, "global_step": 125615, "epoch": 2990} {"train_loss": -6.684387683868408, "global_step": 125616, "epoch": 2990} {"train_loss": -6.65152645111084, "global_step": 125617, "epoch": 2990} {"train_loss": -6.726325988769531, "global_step": 125618, "epoch": 2990} {"train_loss": -6.616506099700928, "global_step": 125619, "epoch": 2990} {"train_loss": -6.705620765686035, "global_step": 125620, "epoch": 2990} {"train_loss": -6.598723320733933, "global_step": 125621, "epoch": 2990, "val_loss": 66203.3359375} {"train_loss": -6.762424945831299, "global_step": 125622, "epoch": 2991} {"train_loss": -6.657655715942383, "global_step": 125623, "epoch": 2991} {"train_loss": -6.6509904861450195, "global_step": 125624, "epoch": 2991} {"train_loss": -6.740525245666504, "global_step": 125625, "epoch": 2991} {"train_loss": -6.511438369750977, "global_step": 125626, "epoch": 2991} {"train_loss": -6.645485877990723, "global_step": 125627, "epoch": 2991} {"train_loss": -6.64587926864624, "global_step": 125628, "epoch": 2991} {"train_loss": -6.661624908447266, "global_step": 125629, "epoch": 2991} {"train_loss": -6.561590671539307, "global_step": 125630, "epoch": 2991} {"train_loss": -6.618735313415527, "global_step": 125631, "epoch": 2991} {"train_loss": -6.5771965980529785, "global_step": 125632, "epoch": 2991} {"train_loss": -6.609687805175781, "global_step": 125633, "epoch": 2991} {"train_loss": -6.696331024169922, "global_step": 125634, "epoch": 2991} {"train_loss": -6.618717193603516, "global_step": 125635, "epoch": 2991} {"train_loss": -6.587111473083496, "global_step": 125636, "epoch": 2991} {"train_loss": -6.567195415496826, "global_step": 125637, "epoch": 2991} {"train_loss": -6.604006767272949, "global_step": 125638, "epoch": 2991} {"train_loss": -6.622037887573242, "global_step": 125639, "epoch": 2991} {"train_loss": -6.657376766204834, "global_step": 125640, "epoch": 2991} {"train_loss": -6.619597434997559, "global_step": 125641, "epoch": 2991} {"train_loss": -6.6424880027771, "global_step": 125642, "epoch": 2991} {"train_loss": -6.640941143035889, "global_step": 125643, "epoch": 2991} {"train_loss": -6.591411590576172, "global_step": 125644, "epoch": 2991} {"train_loss": -6.5714850425720215, "global_step": 125645, "epoch": 2991} {"train_loss": -6.627480506896973, "global_step": 125646, "epoch": 2991} {"train_loss": -6.603015899658203, "global_step": 125647, "epoch": 2991} {"train_loss": -6.667498588562012, "global_step": 125648, "epoch": 2991} {"train_loss": -6.600139617919922, "global_step": 125649, "epoch": 2991} {"train_loss": -6.694463729858398, "global_step": 125650, "epoch": 2991} {"train_loss": -6.58253812789917, "global_step": 125651, "epoch": 2991} {"train_loss": -6.640192031860352, "global_step": 125652, "epoch": 2991} {"train_loss": -6.742508888244629, "global_step": 125653, "epoch": 2991} {"train_loss": -6.706502914428711, "global_step": 125654, "epoch": 2991} {"train_loss": -6.72721004486084, "global_step": 125655, "epoch": 2991} {"train_loss": -6.573631763458252, "global_step": 125656, "epoch": 2991} {"train_loss": -6.599516868591309, "global_step": 125657, "epoch": 2991} {"train_loss": -6.638012886047363, "global_step": 125658, "epoch": 2991} {"train_loss": -6.628488540649414, "global_step": 125659, "epoch": 2991} {"train_loss": -6.65163516998291, "global_step": 125660, "epoch": 2991} {"train_loss": -6.7080793380737305, "global_step": 125661, "epoch": 2991} {"train_loss": -6.572707176208496, "global_step": 125662, "epoch": 2991} {"train_loss": -6.636200291769845, "global_step": 125663, "epoch": 2991, "val_loss": 66101.984375} {"train_loss": -6.701642036437988, "global_step": 125664, "epoch": 2992} {"train_loss": -6.71450138092041, "global_step": 125665, "epoch": 2992} {"train_loss": -6.554577350616455, "global_step": 125666, "epoch": 2992} {"train_loss": -6.592926025390625, "global_step": 125667, "epoch": 2992} {"train_loss": -6.705503940582275, "global_step": 125668, "epoch": 2992} {"train_loss": -6.650012493133545, "global_step": 125669, "epoch": 2992} {"train_loss": -6.7186360359191895, "global_step": 125670, "epoch": 2992} {"train_loss": -6.586644172668457, "global_step": 125671, "epoch": 2992} {"train_loss": -6.710598468780518, "global_step": 125672, "epoch": 2992} {"train_loss": -6.651511192321777, "global_step": 125673, "epoch": 2992} {"train_loss": -6.586272239685059, "global_step": 125674, "epoch": 2992} {"train_loss": -6.719520568847656, "global_step": 125675, "epoch": 2992} {"train_loss": -6.694155693054199, "global_step": 125676, "epoch": 2992} {"train_loss": -6.636755466461182, "global_step": 125677, "epoch": 2992} {"train_loss": -6.585710525512695, "global_step": 125678, "epoch": 2992} {"train_loss": -6.563976287841797, "global_step": 125679, "epoch": 2992} {"train_loss": -6.733011245727539, "global_step": 125680, "epoch": 2992} {"train_loss": -6.693561553955078, "global_step": 125681, "epoch": 2992} {"train_loss": -6.612929821014404, "global_step": 125682, "epoch": 2992} {"train_loss": -6.664675712585449, "global_step": 125683, "epoch": 2992} {"train_loss": -6.55969762802124, "global_step": 125684, "epoch": 2992} {"train_loss": -6.586533069610596, "global_step": 125685, "epoch": 2992} {"train_loss": -6.669302463531494, "global_step": 125686, "epoch": 2992} {"train_loss": -6.53066349029541, "global_step": 125687, "epoch": 2992} {"train_loss": -6.587483882904053, "global_step": 125688, "epoch": 2992} {"train_loss": -6.49770450592041, "global_step": 125689, "epoch": 2992} {"train_loss": -6.6147894859313965, "global_step": 125690, "epoch": 2992} {"train_loss": -6.707139492034912, "global_step": 125691, "epoch": 2992} {"train_loss": -6.734053611755371, "global_step": 125692, "epoch": 2992} {"train_loss": -6.632633209228516, "global_step": 125693, "epoch": 2992} {"train_loss": -6.754518508911133, "global_step": 125694, "epoch": 2992} {"train_loss": -6.585058689117432, "global_step": 125695, "epoch": 2992} {"train_loss": -6.650964736938477, "global_step": 125696, "epoch": 2992} {"train_loss": -6.659524917602539, "global_step": 125697, "epoch": 2992} {"train_loss": -6.745919227600098, "global_step": 125698, "epoch": 2992} {"train_loss": -6.785118103027344, "global_step": 125699, "epoch": 2992} {"train_loss": -6.666935920715332, "global_step": 125700, "epoch": 2992} {"train_loss": -6.622794151306152, "global_step": 125701, "epoch": 2992} {"train_loss": -6.638761520385742, "global_step": 125702, "epoch": 2992} {"train_loss": -6.660710334777832, "global_step": 125703, "epoch": 2992} {"train_loss": -6.697552680969238, "global_step": 125704, "epoch": 2992} {"train_loss": -6.650285005569458, "global_step": 125705, "epoch": 2992, "val_loss": 66335.40625} {"train_loss": -6.675350666046143, "global_step": 125706, "epoch": 2993} {"train_loss": -6.7431440353393555, "global_step": 125707, "epoch": 2993} {"train_loss": -6.647481918334961, "global_step": 125708, "epoch": 2993} {"train_loss": -6.598257064819336, "global_step": 125709, "epoch": 2993} {"train_loss": -6.762495994567871, "global_step": 125710, "epoch": 2993} {"train_loss": -6.661319732666016, "global_step": 125711, "epoch": 2993} {"train_loss": -6.6959381103515625, "global_step": 125712, "epoch": 2993} {"train_loss": -6.669554710388184, "global_step": 125713, "epoch": 2993} {"train_loss": -6.66482400894165, "global_step": 125714, "epoch": 2993} {"train_loss": -6.634194374084473, "global_step": 125715, "epoch": 2993} {"train_loss": -6.557465553283691, "global_step": 125716, "epoch": 2993} {"train_loss": -6.548346519470215, "global_step": 125717, "epoch": 2993} {"train_loss": -6.577734470367432, "global_step": 125718, "epoch": 2993} {"train_loss": -6.617031574249268, "global_step": 125719, "epoch": 2993} {"train_loss": -6.573361396789551, "global_step": 125720, "epoch": 2993} {"train_loss": -6.672540664672852, "global_step": 125721, "epoch": 2993} {"train_loss": -6.699977874755859, "global_step": 125722, "epoch": 2993} {"train_loss": -6.4186835289001465, "global_step": 125723, "epoch": 2993} {"train_loss": -6.706419944763184, "global_step": 125724, "epoch": 2993} {"train_loss": -6.623746871948242, "global_step": 125725, "epoch": 2993} {"train_loss": -6.575230598449707, "global_step": 125726, "epoch": 2993} {"train_loss": -6.448658466339111, "global_step": 125727, "epoch": 2993} {"train_loss": -6.416511058807373, "global_step": 125728, "epoch": 2993} {"train_loss": -6.597465991973877, "global_step": 125729, "epoch": 2993} {"train_loss": -6.720722198486328, "global_step": 125730, "epoch": 2993} {"train_loss": -6.458059787750244, "global_step": 125731, "epoch": 2993} {"train_loss": -6.5480146408081055, "global_step": 125732, "epoch": 2993} {"train_loss": -6.722871780395508, "global_step": 125733, "epoch": 2993} {"train_loss": -6.697626113891602, "global_step": 125734, "epoch": 2993} {"train_loss": -6.583696365356445, "global_step": 125735, "epoch": 2993} {"train_loss": -6.505755424499512, "global_step": 125736, "epoch": 2993} {"train_loss": -6.484988212585449, "global_step": 125737, "epoch": 2993} {"train_loss": -6.6889753341674805, "global_step": 125738, "epoch": 2993} {"train_loss": -6.579605579376221, "global_step": 125739, "epoch": 2993} {"train_loss": -6.564477920532227, "global_step": 125740, "epoch": 2993} {"train_loss": -6.588317394256592, "global_step": 125741, "epoch": 2993} {"train_loss": -6.662446022033691, "global_step": 125742, "epoch": 2993} {"train_loss": -6.726759910583496, "global_step": 125743, "epoch": 2993} {"train_loss": -6.663193702697754, "global_step": 125744, "epoch": 2993} {"train_loss": -6.5799078941345215, "global_step": 125745, "epoch": 2993} {"train_loss": -6.711129188537598, "global_step": 125746, "epoch": 2993} {"train_loss": -6.621253217969622, "global_step": 125747, "epoch": 2993, "val_loss": 66430.90625} {"train_loss": -6.665042400360107, "global_step": 125748, "epoch": 2994} {"train_loss": -6.627687931060791, "global_step": 125749, "epoch": 2994} {"train_loss": -6.598465919494629, "global_step": 125750, "epoch": 2994} {"train_loss": -6.6194000244140625, "global_step": 125751, "epoch": 2994} {"train_loss": -6.752412796020508, "global_step": 125752, "epoch": 2994} {"train_loss": -6.731348991394043, "global_step": 125753, "epoch": 2994} {"train_loss": -6.646803855895996, "global_step": 125754, "epoch": 2994} {"train_loss": -6.547577857971191, "global_step": 125755, "epoch": 2994} {"train_loss": -6.782981872558594, "global_step": 125756, "epoch": 2994} {"train_loss": -6.713954925537109, "global_step": 125757, "epoch": 2994} {"train_loss": -6.676777362823486, "global_step": 125758, "epoch": 2994} {"train_loss": -6.697434425354004, "global_step": 125759, "epoch": 2994} {"train_loss": -6.650446891784668, "global_step": 125760, "epoch": 2994} {"train_loss": -6.723994255065918, "global_step": 125761, "epoch": 2994} {"train_loss": -6.627963542938232, "global_step": 125762, "epoch": 2994} {"train_loss": -6.597711563110352, "global_step": 125763, "epoch": 2994} {"train_loss": -6.5716142654418945, "global_step": 125764, "epoch": 2994} {"train_loss": -6.534523010253906, "global_step": 125765, "epoch": 2994} {"train_loss": -6.588191032409668, "global_step": 125766, "epoch": 2994} {"train_loss": -6.506847381591797, "global_step": 125767, "epoch": 2994} {"train_loss": -6.65416955947876, "global_step": 125768, "epoch": 2994} {"train_loss": -6.551590919494629, "global_step": 125769, "epoch": 2994} {"train_loss": -6.535582542419434, "global_step": 125770, "epoch": 2994} {"train_loss": -6.560204029083252, "global_step": 125771, "epoch": 2994} {"train_loss": -6.626862049102783, "global_step": 125772, "epoch": 2994} {"train_loss": -6.520124912261963, "global_step": 125773, "epoch": 2994} {"train_loss": -6.564213752746582, "global_step": 125774, "epoch": 2994} {"train_loss": -6.574209690093994, "global_step": 125775, "epoch": 2994} {"train_loss": -6.558672904968262, "global_step": 125776, "epoch": 2994} {"train_loss": -6.557205677032471, "global_step": 125777, "epoch": 2994} {"train_loss": -6.565649509429932, "global_step": 125778, "epoch": 2994} {"train_loss": -6.645409107208252, "global_step": 125779, "epoch": 2994} {"train_loss": -6.585422515869141, "global_step": 125780, "epoch": 2994} {"train_loss": -6.587022304534912, "global_step": 125781, "epoch": 2994} {"train_loss": -6.674315452575684, "global_step": 125782, "epoch": 2994} {"train_loss": -6.605412483215332, "global_step": 125783, "epoch": 2994} {"train_loss": -6.602002143859863, "global_step": 125784, "epoch": 2994} {"train_loss": -6.68375301361084, "global_step": 125785, "epoch": 2994} {"train_loss": -6.665641784667969, "global_step": 125786, "epoch": 2994} {"train_loss": -6.650946140289307, "global_step": 125787, "epoch": 2994} {"train_loss": -6.640211582183838, "global_step": 125788, "epoch": 2994} {"train_loss": -6.619566656294323, "global_step": 125789, "epoch": 2994, "val_loss": 66198.28125} {"train_loss": -6.719789505004883, "global_step": 125790, "epoch": 2995} {"train_loss": -6.64849328994751, "global_step": 125791, "epoch": 2995} {"train_loss": -6.581914901733398, "global_step": 125792, "epoch": 2995} {"train_loss": -6.604269981384277, "global_step": 125793, "epoch": 2995} {"train_loss": -6.763256072998047, "global_step": 125794, "epoch": 2995} {"train_loss": -6.683592796325684, "global_step": 125795, "epoch": 2995} {"train_loss": -6.780954837799072, "global_step": 125796, "epoch": 2995} {"train_loss": -6.7467546463012695, "global_step": 125797, "epoch": 2995} {"train_loss": -6.732769966125488, "global_step": 125798, "epoch": 2995} {"train_loss": -6.701801300048828, "global_step": 125799, "epoch": 2995} {"train_loss": -6.620522975921631, "global_step": 125800, "epoch": 2995} {"train_loss": -6.627614974975586, "global_step": 125801, "epoch": 2995} {"train_loss": -6.6279215812683105, "global_step": 125802, "epoch": 2995} {"train_loss": -6.497947692871094, "global_step": 125803, "epoch": 2995} {"train_loss": -6.564693927764893, "global_step": 125804, "epoch": 2995} {"train_loss": -6.7070512771606445, "global_step": 125805, "epoch": 2995} {"train_loss": -6.574507713317871, "global_step": 125806, "epoch": 2995} {"train_loss": -6.616257667541504, "global_step": 125807, "epoch": 2995} {"train_loss": -6.611042022705078, "global_step": 125808, "epoch": 2995} {"train_loss": -6.527115345001221, "global_step": 125809, "epoch": 2995} {"train_loss": -6.681388854980469, "global_step": 125810, "epoch": 2995} {"train_loss": -6.481837749481201, "global_step": 125811, "epoch": 2995} {"train_loss": -6.583225250244141, "global_step": 125812, "epoch": 2995} {"train_loss": -6.547070503234863, "global_step": 125813, "epoch": 2995} {"train_loss": -6.601256370544434, "global_step": 125814, "epoch": 2995} {"train_loss": -6.693229675292969, "global_step": 125815, "epoch": 2995} {"train_loss": -6.597137451171875, "global_step": 125816, "epoch": 2995} {"train_loss": -6.482781410217285, "global_step": 125817, "epoch": 2995} {"train_loss": -6.636989593505859, "global_step": 125818, "epoch": 2995} {"train_loss": -6.529897689819336, "global_step": 125819, "epoch": 2995} {"train_loss": -6.652939796447754, "global_step": 125820, "epoch": 2995} {"train_loss": -6.579008102416992, "global_step": 125821, "epoch": 2995} {"train_loss": -6.481232643127441, "global_step": 125822, "epoch": 2995} {"train_loss": -6.632820129394531, "global_step": 125823, "epoch": 2995} {"train_loss": -6.559754371643066, "global_step": 125824, "epoch": 2995} {"train_loss": -6.557973861694336, "global_step": 125825, "epoch": 2995} {"train_loss": -6.684776306152344, "global_step": 125826, "epoch": 2995} {"train_loss": -6.4343791007995605, "global_step": 125827, "epoch": 2995} {"train_loss": -6.625628471374512, "global_step": 125828, "epoch": 2995} {"train_loss": -6.609428405761719, "global_step": 125829, "epoch": 2995} {"train_loss": -6.613616943359375, "global_step": 125830, "epoch": 2995} {"train_loss": -6.613556521279471, "global_step": 125831, "epoch": 2995, "val_loss": 66014.0390625} {"train_loss": -6.679788589477539, "global_step": 125832, "epoch": 2996} {"train_loss": -6.639849662780762, "global_step": 125833, "epoch": 2996} {"train_loss": -6.660554885864258, "global_step": 125834, "epoch": 2996} {"train_loss": -6.565978527069092, "global_step": 125835, "epoch": 2996} {"train_loss": -6.572003364562988, "global_step": 125836, "epoch": 2996} {"train_loss": -6.675615310668945, "global_step": 125837, "epoch": 2996} {"train_loss": -6.66374397277832, "global_step": 125838, "epoch": 2996} {"train_loss": -6.641928672790527, "global_step": 125839, "epoch": 2996} {"train_loss": -6.640297889709473, "global_step": 125840, "epoch": 2996} {"train_loss": -6.663487434387207, "global_step": 125841, "epoch": 2996} {"train_loss": -6.704084873199463, "global_step": 125842, "epoch": 2996} {"train_loss": -6.549423694610596, "global_step": 125843, "epoch": 2996} {"train_loss": -6.56374454498291, "global_step": 125844, "epoch": 2996} {"train_loss": -6.631821632385254, "global_step": 125845, "epoch": 2996} {"train_loss": -6.6218109130859375, "global_step": 125846, "epoch": 2996} {"train_loss": -6.725184917449951, "global_step": 125847, "epoch": 2996} {"train_loss": -6.763749122619629, "global_step": 125848, "epoch": 2996} {"train_loss": -6.704629898071289, "global_step": 125849, "epoch": 2996} {"train_loss": -6.654134750366211, "global_step": 125850, "epoch": 2996} {"train_loss": -6.584625244140625, "global_step": 125851, "epoch": 2996} {"train_loss": -6.695977210998535, "global_step": 125852, "epoch": 2996} {"train_loss": -6.736632823944092, "global_step": 125853, "epoch": 2996} {"train_loss": -6.718593597412109, "global_step": 125854, "epoch": 2996} {"train_loss": -6.6917724609375, "global_step": 125855, "epoch": 2996} {"train_loss": -6.662131309509277, "global_step": 125856, "epoch": 2996} {"train_loss": -6.597643852233887, "global_step": 125857, "epoch": 2996} {"train_loss": -6.676241397857666, "global_step": 125858, "epoch": 2996} {"train_loss": -6.480085372924805, "global_step": 125859, "epoch": 2996} {"train_loss": -6.524666786193848, "global_step": 125860, "epoch": 2996} {"train_loss": -6.7203168869018555, "global_step": 125861, "epoch": 2996} {"train_loss": -6.547630310058594, "global_step": 125862, "epoch": 2996} {"train_loss": -6.670915603637695, "global_step": 125863, "epoch": 2996} {"train_loss": -6.541952133178711, "global_step": 125864, "epoch": 2996} {"train_loss": -6.625205993652344, "global_step": 125865, "epoch": 2996} {"train_loss": -6.5188493728637695, "global_step": 125866, "epoch": 2996} {"train_loss": -6.545403480529785, "global_step": 125867, "epoch": 2996} {"train_loss": -6.703275203704834, "global_step": 125868, "epoch": 2996} {"train_loss": -6.317420959472656, "global_step": 125869, "epoch": 2996} {"train_loss": -6.5508575439453125, "global_step": 125870, "epoch": 2996} {"train_loss": -6.468502998352051, "global_step": 125871, "epoch": 2996} {"train_loss": -6.55600643157959, "global_step": 125872, "epoch": 2996} {"train_loss": -6.6209559213547475, "global_step": 125873, "epoch": 2996, "val_loss": 66245.109375} {"train_loss": -6.632092475891113, "global_step": 125874, "epoch": 2997} {"train_loss": -6.669841766357422, "global_step": 125875, "epoch": 2997} {"train_loss": -6.59653377532959, "global_step": 125876, "epoch": 2997} {"train_loss": -6.702708721160889, "global_step": 125877, "epoch": 2997} {"train_loss": -6.511979579925537, "global_step": 125878, "epoch": 2997} {"train_loss": -6.671209335327148, "global_step": 125879, "epoch": 2997} {"train_loss": -6.682103157043457, "global_step": 125880, "epoch": 2997} {"train_loss": -6.577729225158691, "global_step": 125881, "epoch": 2997} {"train_loss": -6.561893939971924, "global_step": 125882, "epoch": 2997} {"train_loss": -6.688906669616699, "global_step": 125883, "epoch": 2997} {"train_loss": -6.613202095031738, "global_step": 125884, "epoch": 2997} {"train_loss": -6.630364894866943, "global_step": 125885, "epoch": 2997} {"train_loss": -6.655290603637695, "global_step": 125886, "epoch": 2997} {"train_loss": -6.624665260314941, "global_step": 125887, "epoch": 2997} {"train_loss": -6.557412147521973, "global_step": 125888, "epoch": 2997} {"train_loss": -6.616211891174316, "global_step": 125889, "epoch": 2997} {"train_loss": -6.566444396972656, "global_step": 125890, "epoch": 2997} {"train_loss": -6.553112983703613, "global_step": 125891, "epoch": 2997} {"train_loss": -6.545872688293457, "global_step": 125892, "epoch": 2997} {"train_loss": -6.632862091064453, "global_step": 125893, "epoch": 2997} {"train_loss": -6.636518955230713, "global_step": 125894, "epoch": 2997} {"train_loss": -6.566806793212891, "global_step": 125895, "epoch": 2997} {"train_loss": -6.599185943603516, "global_step": 125896, "epoch": 2997} {"train_loss": -6.603332996368408, "global_step": 125897, "epoch": 2997} {"train_loss": -6.632987976074219, "global_step": 125898, "epoch": 2997} {"train_loss": -6.551708221435547, "global_step": 125899, "epoch": 2997} {"train_loss": -6.642524719238281, "global_step": 125900, "epoch": 2997} {"train_loss": -6.577094078063965, "global_step": 125901, "epoch": 2997} {"train_loss": -6.616937637329102, "global_step": 125902, "epoch": 2997} {"train_loss": -6.6332173347473145, "global_step": 125903, "epoch": 2997} {"train_loss": -6.573237419128418, "global_step": 125904, "epoch": 2997} {"train_loss": -6.628949165344238, "global_step": 125905, "epoch": 2997} {"train_loss": -6.479747772216797, "global_step": 125906, "epoch": 2997} {"train_loss": -6.6018476486206055, "global_step": 125907, "epoch": 2997} {"train_loss": -6.7247467041015625, "global_step": 125908, "epoch": 2997} {"train_loss": -6.5866851806640625, "global_step": 125909, "epoch": 2997} {"train_loss": -6.52609920501709, "global_step": 125910, "epoch": 2997} {"train_loss": -6.662819862365723, "global_step": 125911, "epoch": 2997} {"train_loss": -6.677755355834961, "global_step": 125912, "epoch": 2997} {"train_loss": -6.7020392417907715, "global_step": 125913, "epoch": 2997} {"train_loss": -6.662768363952637, "global_step": 125914, "epoch": 2997} {"train_loss": -6.613564968109131, "global_step": 125915, "epoch": 2997, "val_loss": 66223.0390625} {"train_loss": -6.671862602233887, "global_step": 125916, "epoch": 2998} {"train_loss": -6.691481590270996, "global_step": 125917, "epoch": 2998} {"train_loss": -6.665073394775391, "global_step": 125918, "epoch": 2998} {"train_loss": -6.570412635803223, "global_step": 125919, "epoch": 2998} {"train_loss": -6.608536720275879, "global_step": 125920, "epoch": 2998} {"train_loss": -6.635990619659424, "global_step": 125921, "epoch": 2998} {"train_loss": -6.677187919616699, "global_step": 125922, "epoch": 2998} {"train_loss": -6.604973793029785, "global_step": 125923, "epoch": 2998} {"train_loss": -6.723883628845215, "global_step": 125924, "epoch": 2998} {"train_loss": -6.740843772888184, "global_step": 125925, "epoch": 2998} {"train_loss": -6.508623123168945, "global_step": 125926, "epoch": 2998} {"train_loss": -6.662336349487305, "global_step": 125927, "epoch": 2998} {"train_loss": -6.677890777587891, "global_step": 125928, "epoch": 2998} {"train_loss": -6.659354209899902, "global_step": 125929, "epoch": 2998} {"train_loss": -6.63705587387085, "global_step": 125930, "epoch": 2998} {"train_loss": -6.719396114349365, "global_step": 125931, "epoch": 2998} {"train_loss": -6.645087242126465, "global_step": 125932, "epoch": 2998} {"train_loss": -6.754386901855469, "global_step": 125933, "epoch": 2998} {"train_loss": -6.670768737792969, "global_step": 125934, "epoch": 2998} {"train_loss": -6.56831169128418, "global_step": 125935, "epoch": 2998} {"train_loss": -6.673841953277588, "global_step": 125936, "epoch": 2998} {"train_loss": -6.639314651489258, "global_step": 125937, "epoch": 2998} {"train_loss": -6.556058406829834, "global_step": 125938, "epoch": 2998} {"train_loss": -6.629465579986572, "global_step": 125939, "epoch": 2998} {"train_loss": -6.679258823394775, "global_step": 125940, "epoch": 2998} {"train_loss": -6.437070369720459, "global_step": 125941, "epoch": 2998} {"train_loss": -6.731072425842285, "global_step": 125942, "epoch": 2998} {"train_loss": -6.505527496337891, "global_step": 125943, "epoch": 2998} {"train_loss": -6.658258438110352, "global_step": 125944, "epoch": 2998} {"train_loss": -6.646206855773926, "global_step": 125945, "epoch": 2998} {"train_loss": -6.500470161437988, "global_step": 125946, "epoch": 2998} {"train_loss": -6.591169357299805, "global_step": 125947, "epoch": 2998} {"train_loss": -6.539299011230469, "global_step": 125948, "epoch": 2998} {"train_loss": -6.563371658325195, "global_step": 125949, "epoch": 2998} {"train_loss": -6.594078063964844, "global_step": 125950, "epoch": 2998} {"train_loss": -6.59291410446167, "global_step": 125951, "epoch": 2998} {"train_loss": -6.590932846069336, "global_step": 125952, "epoch": 2998} {"train_loss": -6.622469902038574, "global_step": 125953, "epoch": 2998} {"train_loss": -6.628232002258301, "global_step": 125954, "epoch": 2998} {"train_loss": -6.517662048339844, "global_step": 125955, "epoch": 2998} {"train_loss": -6.52104377746582, "global_step": 125956, "epoch": 2998} {"train_loss": -6.621186937604632, "global_step": 125957, "epoch": 2998, "val_loss": 66285.9921875} {"train_loss": -6.67353630065918, "global_step": 125958, "epoch": 2999} {"train_loss": -6.657755374908447, "global_step": 125959, "epoch": 2999} {"train_loss": -6.613770484924316, "global_step": 125960, "epoch": 2999} {"train_loss": -6.5607147216796875, "global_step": 125961, "epoch": 2999} {"train_loss": -6.52552604675293, "global_step": 125962, "epoch": 2999} {"train_loss": -6.477869987487793, "global_step": 125963, "epoch": 2999} {"train_loss": -6.608211517333984, "global_step": 125964, "epoch": 2999} {"train_loss": -6.692626953125, "global_step": 125965, "epoch": 2999} {"train_loss": -6.682163238525391, "global_step": 125966, "epoch": 2999} {"train_loss": -6.690013885498047, "global_step": 125967, "epoch": 2999} {"train_loss": -6.608242511749268, "global_step": 125968, "epoch": 2999} {"train_loss": -6.712332725524902, "global_step": 125969, "epoch": 2999} {"train_loss": -6.6499433517456055, "global_step": 125970, "epoch": 2999} {"train_loss": -6.5701189041137695, "global_step": 125971, "epoch": 2999} {"train_loss": -6.62863826751709, "global_step": 125972, "epoch": 2999} {"train_loss": -6.571150779724121, "global_step": 125973, "epoch": 2999} {"train_loss": -6.574394226074219, "global_step": 125974, "epoch": 2999} {"train_loss": -6.621519088745117, "global_step": 125975, "epoch": 2999} {"train_loss": -6.6725568771362305, "global_step": 125976, "epoch": 2999} {"train_loss": -6.604653358459473, "global_step": 125977, "epoch": 2999} {"train_loss": -6.5805344581604, "global_step": 125978, "epoch": 2999} {"train_loss": -6.673260688781738, "global_step": 125979, "epoch": 2999} {"train_loss": -6.648989677429199, "global_step": 125980, "epoch": 2999} {"train_loss": -6.7182722091674805, "global_step": 125981, "epoch": 2999} {"train_loss": -6.5605950355529785, "global_step": 125982, "epoch": 2999} {"train_loss": -6.577300071716309, "global_step": 125983, "epoch": 2999} {"train_loss": -6.677920341491699, "global_step": 125984, "epoch": 2999} {"train_loss": -6.708354949951172, "global_step": 125985, "epoch": 2999} {"train_loss": -6.770235061645508, "global_step": 125986, "epoch": 2999} {"train_loss": -6.628656387329102, "global_step": 125987, "epoch": 2999} {"train_loss": -6.569179534912109, "global_step": 125988, "epoch": 2999} {"train_loss": -6.604767799377441, "global_step": 125989, "epoch": 2999} {"train_loss": -6.575343608856201, "global_step": 125990, "epoch": 2999} {"train_loss": -6.710035800933838, "global_step": 125991, "epoch": 2999} {"train_loss": -6.638701438903809, "global_step": 125992, "epoch": 2999} {"train_loss": -6.641697883605957, "global_step": 125993, "epoch": 2999} {"train_loss": -6.629462242126465, "global_step": 125994, "epoch": 2999} {"train_loss": -6.5609025955200195, "global_step": 125995, "epoch": 2999} {"train_loss": -6.6361799240112305, "global_step": 125996, "epoch": 2999} {"train_loss": -6.640500068664551, "global_step": 125997, "epoch": 2999} {"train_loss": -6.618720054626465, "global_step": 125998, "epoch": 2999} {"train_loss": -6.630322013582502, "global_step": 125999, "epoch": 2999, "val_loss": 66202.3046875} {"train_loss": -6.632443428039551, "global_step": 126000, "epoch": 3000} {"train_loss": -6.591468334197998, "global_step": 126001, "epoch": 3000} {"train_loss": -6.535189628601074, "global_step": 126002, "epoch": 3000} {"train_loss": -6.629136085510254, "global_step": 126003, "epoch": 3000} {"train_loss": -6.638235092163086, "global_step": 126004, "epoch": 3000} {"train_loss": -6.632458686828613, "global_step": 126005, "epoch": 3000} {"train_loss": -6.648205757141113, "global_step": 126006, "epoch": 3000} {"train_loss": -6.569388389587402, "global_step": 126007, "epoch": 3000} {"train_loss": -6.656015396118164, "global_step": 126008, "epoch": 3000} {"train_loss": -6.735321044921875, "global_step": 126009, "epoch": 3000} {"train_loss": -6.70564079284668, "global_step": 126010, "epoch": 3000} {"train_loss": -6.720475196838379, "global_step": 126011, "epoch": 3000} {"train_loss": -6.673393249511719, "global_step": 126012, "epoch": 3000} {"train_loss": -6.692600250244141, "global_step": 126013, "epoch": 3000} {"train_loss": -6.595344543457031, "global_step": 126014, "epoch": 3000} {"train_loss": -6.582745552062988, "global_step": 126015, "epoch": 3000} {"train_loss": -6.5263752937316895, "global_step": 126016, "epoch": 3000} {"train_loss": -6.693739414215088, "global_step": 126017, "epoch": 3000} {"train_loss": -6.550021648406982, "global_step": 126018, "epoch": 3000} {"train_loss": -6.511914253234863, "global_step": 126019, "epoch": 3000} {"train_loss": -6.588711738586426, "global_step": 126020, "epoch": 3000} {"train_loss": -6.521148681640625, "global_step": 126021, "epoch": 3000} {"train_loss": -6.489003658294678, "global_step": 126022, "epoch": 3000} {"train_loss": -6.534667015075684, "global_step": 126023, "epoch": 3000} {"train_loss": -6.568366050720215, "global_step": 126024, "epoch": 3000} {"train_loss": -6.613478660583496, "global_step": 126025, "epoch": 3000} {"train_loss": -6.522463798522949, "global_step": 126026, "epoch": 3000} {"train_loss": -6.6520819664001465, "global_step": 126027, "epoch": 3000} {"train_loss": -6.5620269775390625, "global_step": 126028, "epoch": 3000} {"train_loss": -6.522878170013428, "global_step": 126029, "epoch": 3000} {"train_loss": -6.79937219619751, "global_step": 126030, "epoch": 3000} {"train_loss": -6.616539001464844, "global_step": 126031, "epoch": 3000} {"train_loss": -6.614021301269531, "global_step": 126032, "epoch": 3000} {"train_loss": -6.6215901374816895, "global_step": 126033, "epoch": 3000} {"train_loss": -6.644321441650391, "global_step": 126034, "epoch": 3000} {"train_loss": -6.743363380432129, "global_step": 126035, "epoch": 3000} {"train_loss": -6.635262489318848, "global_step": 126036, "epoch": 3000} {"train_loss": -6.6319732666015625, "global_step": 126037, "epoch": 3000} {"train_loss": -6.658657550811768, "global_step": 126038, "epoch": 3000} {"train_loss": -6.626371383666992, "global_step": 126039, "epoch": 3000} {"train_loss": -6.57058048248291, "global_step": 126040, "epoch": 3000} {"train_loss": -6.618378809520176, "global_step": 126041, "epoch": 3000, "train/sim_max_reward_0": 0.19048323729324512, "train/sim_max_reward_1": 0.8943057860525768, "train/sim_max_reward_2": 0.5277246479143194, "train/sim_max_reward_3": 0.3832762895447125, "train/sim_max_reward_4": 0.9800534273392604, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.3547660078768014, "test/sim_max_reward_4300002": 0.9377596161767648, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9194773235201894, "test/sim_max_reward_4300006": 0.788357240304245, "test/sim_max_reward_4300007": 0.30543411838038403, "test/sim_max_reward_4300008": 0.9587033876036609, "test/sim_max_reward_4300009": 0.9453085286555047, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9969718733683552, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.4146236368425642, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.8024271863835752, "test/sim_max_reward_4300017": 0.9702256912921622, "test/sim_max_reward_4300018": 0.4327519826587827, "test/sim_max_reward_4300019": 0.18584278583926572, "test/sim_max_reward_4300020": 0.2069821860797598, "test/sim_max_reward_4300021": 0.933507799969263, "test/sim_max_reward_4300022": 0.8339767359496608, "test/sim_max_reward_4300023": 0.33044961334054485, "test/sim_max_reward_4300024": 0.9577302230941208, "test/sim_max_reward_4300025": 0.9007801486773553, "test/sim_max_reward_4300026": 0.17552273417611614, "test/sim_max_reward_4300027": 0.04392046964306086, "test/sim_max_reward_4300028": 0.0010120955587905487, "test/sim_max_reward_4300029": 0.5829400702665265, "test/sim_max_reward_4300030": 0.3658218021775495, "test/sim_max_reward_4300031": 0.9388614890497033, "test/sim_max_reward_4300032": 0.9592658225561782, "test/sim_max_reward_4300033": 0.9600017549654232, "test/sim_max_reward_4300034": 0.008202306949464678, "test/sim_max_reward_4300035": 0.5203859162306826, "test/sim_max_reward_4300036": 0.2317370368424552, "test/sim_max_reward_4300037": 0.9009533798627808, "test/sim_max_reward_4300038": 0.9183624029349388, "test/sim_max_reward_4300039": 0.9589938651393412, "test/sim_max_reward_4300040": 1.0, "test/sim_max_reward_4300041": 0.9988186374992983, "test/sim_max_reward_4300042": 0.7236453261762378, "test/sim_max_reward_4300043": 0.1658530374046247, "test/sim_max_reward_4300044": 0.9423865603219651, "test/sim_max_reward_4300045": 0.1774802843285279, "test/sim_max_reward_4300046": 0.9717857702996024, "test/sim_max_reward_4300047": 0.13329300626279775, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.10445955850917457, "train/mean_score": 0.5281380245843835, "test/mean_score": 0.5995122703595497, "val_loss": 66018.1953125} {"train_loss": -6.779152870178223, "global_step": 126042, "epoch": 3001} {"train_loss": -6.697950839996338, "global_step": 126043, "epoch": 3001} {"train_loss": -6.652981758117676, "global_step": 126044, "epoch": 3001} {"train_loss": -6.73091459274292, "global_step": 126045, "epoch": 3001} {"train_loss": -6.7275710105896, "global_step": 126046, "epoch": 3001} {"train_loss": -6.544064521789551, "global_step": 126047, "epoch": 3001} {"train_loss": -6.633874893188477, "global_step": 126048, "epoch": 3001} {"train_loss": -6.678304195404053, "global_step": 126049, "epoch": 3001} {"train_loss": -6.749001979827881, "global_step": 126050, "epoch": 3001} {"train_loss": -6.631089210510254, "global_step": 126051, "epoch": 3001} {"train_loss": -6.604973793029785, "global_step": 126052, "epoch": 3001} {"train_loss": -6.669550895690918, "global_step": 126053, "epoch": 3001} {"train_loss": -6.694008827209473, "global_step": 126054, "epoch": 3001} {"train_loss": -6.7051262855529785, "global_step": 126055, "epoch": 3001} {"train_loss": -6.685904502868652, "global_step": 126056, "epoch": 3001} {"train_loss": -6.762601852416992, "global_step": 126057, "epoch": 3001} {"train_loss": -6.6354217529296875, "global_step": 126058, "epoch": 3001} {"train_loss": -6.63090705871582, "global_step": 126059, "epoch": 3001} {"train_loss": -6.628785133361816, "global_step": 126060, "epoch": 3001} {"train_loss": -6.704722881317139, "global_step": 126061, "epoch": 3001} {"train_loss": -6.664665699005127, "global_step": 126062, "epoch": 3001} {"train_loss": -6.650732517242432, "global_step": 126063, "epoch": 3001} {"train_loss": -6.68525505065918, "global_step": 126064, "epoch": 3001} {"train_loss": -6.6610565185546875, "global_step": 126065, "epoch": 3001} {"train_loss": -6.618697643280029, "global_step": 126066, "epoch": 3001} {"train_loss": -6.65018367767334, "global_step": 126067, "epoch": 3001} {"train_loss": -6.72231912612915, "global_step": 126068, "epoch": 3001} {"train_loss": -6.688079833984375, "global_step": 126069, "epoch": 3001} {"train_loss": -6.641356468200684, "global_step": 126070, "epoch": 3001} {"train_loss": -6.637942790985107, "global_step": 126071, "epoch": 3001} {"train_loss": -6.604678630828857, "global_step": 126072, "epoch": 3001} {"train_loss": -6.649709701538086, "global_step": 126073, "epoch": 3001} {"train_loss": -6.580035209655762, "global_step": 126074, "epoch": 3001} {"train_loss": -6.6470255851745605, "global_step": 126075, "epoch": 3001} {"train_loss": -6.67534065246582, "global_step": 126076, "epoch": 3001} {"train_loss": -6.624209403991699, "global_step": 126077, "epoch": 3001} {"train_loss": -6.525277614593506, "global_step": 126078, "epoch": 3001} {"train_loss": -6.454741954803467, "global_step": 126079, "epoch": 3001} {"train_loss": -6.624399185180664, "global_step": 126080, "epoch": 3001} {"train_loss": -6.6329240798950195, "global_step": 126081, "epoch": 3001} {"train_loss": -6.577693462371826, "global_step": 126082, "epoch": 3001} {"train_loss": -6.648743073145549, "global_step": 126083, "epoch": 3001, "val_loss": 66367.625} {"train_loss": -6.41363000869751, "global_step": 126084, "epoch": 3002} {"train_loss": -6.590150833129883, "global_step": 126085, "epoch": 3002} {"train_loss": -6.517753601074219, "global_step": 126086, "epoch": 3002} {"train_loss": -6.619697570800781, "global_step": 126087, "epoch": 3002} {"train_loss": -6.528164863586426, "global_step": 126088, "epoch": 3002} {"train_loss": -6.488246917724609, "global_step": 126089, "epoch": 3002} {"train_loss": -6.513335227966309, "global_step": 126090, "epoch": 3002} {"train_loss": -6.648983001708984, "global_step": 126091, "epoch": 3002} {"train_loss": -6.622520446777344, "global_step": 126092, "epoch": 3002} {"train_loss": -6.524238586425781, "global_step": 126093, "epoch": 3002} {"train_loss": -6.591516971588135, "global_step": 126094, "epoch": 3002} {"train_loss": -6.521472930908203, "global_step": 126095, "epoch": 3002} {"train_loss": -6.53501558303833, "global_step": 126096, "epoch": 3002} {"train_loss": -6.597694396972656, "global_step": 126097, "epoch": 3002} {"train_loss": -6.546337127685547, "global_step": 126098, "epoch": 3002} {"train_loss": -6.568864345550537, "global_step": 126099, "epoch": 3002} {"train_loss": -6.567033767700195, "global_step": 126100, "epoch": 3002} {"train_loss": -6.620020389556885, "global_step": 126101, "epoch": 3002} {"train_loss": -6.584707260131836, "global_step": 126102, "epoch": 3002} {"train_loss": -6.7520246505737305, "global_step": 126103, "epoch": 3002} {"train_loss": -6.616204261779785, "global_step": 126104, "epoch": 3002} {"train_loss": -6.608922958374023, "global_step": 126105, "epoch": 3002} {"train_loss": -6.569464206695557, "global_step": 126106, "epoch": 3002} {"train_loss": -6.766911506652832, "global_step": 126107, "epoch": 3002} {"train_loss": -6.645936012268066, "global_step": 126108, "epoch": 3002} {"train_loss": -6.769894123077393, "global_step": 126109, "epoch": 3002} {"train_loss": -6.5440473556518555, "global_step": 126110, "epoch": 3002} {"train_loss": -6.755413055419922, "global_step": 126111, "epoch": 3002} {"train_loss": -6.719463348388672, "global_step": 126112, "epoch": 3002} {"train_loss": -6.706967353820801, "global_step": 126113, "epoch": 3002} {"train_loss": -6.677884101867676, "global_step": 126114, "epoch": 3002} {"train_loss": -6.6790971755981445, "global_step": 126115, "epoch": 3002} {"train_loss": -6.669259071350098, "global_step": 126116, "epoch": 3002} {"train_loss": -6.603926181793213, "global_step": 126117, "epoch": 3002} {"train_loss": -6.619582653045654, "global_step": 126118, "epoch": 3002} {"train_loss": -6.616631031036377, "global_step": 126119, "epoch": 3002} {"train_loss": -6.67495059967041, "global_step": 126120, "epoch": 3002} {"train_loss": -6.632413387298584, "global_step": 126121, "epoch": 3002} {"train_loss": -6.584856986999512, "global_step": 126122, "epoch": 3002} {"train_loss": -6.665378570556641, "global_step": 126123, "epoch": 3002} {"train_loss": -6.584794044494629, "global_step": 126124, "epoch": 3002} {"train_loss": -6.612013510295323, "global_step": 126125, "epoch": 3002, "val_loss": 66159.5} {"train_loss": -6.576533317565918, "global_step": 126126, "epoch": 3003} {"train_loss": -6.623788833618164, "global_step": 126127, "epoch": 3003} {"train_loss": -6.64021110534668, "global_step": 126128, "epoch": 3003} {"train_loss": -6.602011203765869, "global_step": 126129, "epoch": 3003} {"train_loss": -6.64893102645874, "global_step": 126130, "epoch": 3003} {"train_loss": -6.687577724456787, "global_step": 126131, "epoch": 3003} {"train_loss": -6.725340843200684, "global_step": 126132, "epoch": 3003} {"train_loss": -6.652385711669922, "global_step": 126133, "epoch": 3003} {"train_loss": -6.675470352172852, "global_step": 126134, "epoch": 3003} {"train_loss": -6.587370872497559, "global_step": 126135, "epoch": 3003} {"train_loss": -6.581652641296387, "global_step": 126136, "epoch": 3003} {"train_loss": -6.6666975021362305, "global_step": 126137, "epoch": 3003} {"train_loss": -6.651052951812744, "global_step": 126138, "epoch": 3003} {"train_loss": -6.640568256378174, "global_step": 126139, "epoch": 3003} {"train_loss": -6.654931545257568, "global_step": 126140, "epoch": 3003} {"train_loss": -6.624568939208984, "global_step": 126141, "epoch": 3003} {"train_loss": -6.631913185119629, "global_step": 126142, "epoch": 3003} {"train_loss": -6.6648101806640625, "global_step": 126143, "epoch": 3003} {"train_loss": -6.659974575042725, "global_step": 126144, "epoch": 3003} {"train_loss": -6.578027725219727, "global_step": 126145, "epoch": 3003} {"train_loss": -6.627253532409668, "global_step": 126146, "epoch": 3003} {"train_loss": -6.682469367980957, "global_step": 126147, "epoch": 3003} {"train_loss": -6.697256088256836, "global_step": 126148, "epoch": 3003} {"train_loss": -6.601187705993652, "global_step": 126149, "epoch": 3003} {"train_loss": -6.624752044677734, "global_step": 126150, "epoch": 3003} {"train_loss": -6.5970659255981445, "global_step": 126151, "epoch": 3003} {"train_loss": -6.570112705230713, "global_step": 126152, "epoch": 3003} {"train_loss": -6.708887577056885, "global_step": 126153, "epoch": 3003} {"train_loss": -6.554720878601074, "global_step": 126154, "epoch": 3003} {"train_loss": -6.657887935638428, "global_step": 126155, "epoch": 3003} {"train_loss": -6.569377899169922, "global_step": 126156, "epoch": 3003} {"train_loss": -6.649857521057129, "global_step": 126157, "epoch": 3003} {"train_loss": -6.621210098266602, "global_step": 126158, "epoch": 3003} {"train_loss": -6.629734992980957, "global_step": 126159, "epoch": 3003} {"train_loss": -6.690085411071777, "global_step": 126160, "epoch": 3003} {"train_loss": -6.750007152557373, "global_step": 126161, "epoch": 3003} {"train_loss": -6.759371280670166, "global_step": 126162, "epoch": 3003} {"train_loss": -6.638493061065674, "global_step": 126163, "epoch": 3003} {"train_loss": -6.653355598449707, "global_step": 126164, "epoch": 3003} {"train_loss": -6.584829330444336, "global_step": 126165, "epoch": 3003} {"train_loss": -6.713201522827148, "global_step": 126166, "epoch": 3003} {"train_loss": -6.645174083255586, "global_step": 126167, "epoch": 3003, "val_loss": 66141.34375} {"train_loss": -6.613155364990234, "global_step": 126168, "epoch": 3004} {"train_loss": -6.633111953735352, "global_step": 126169, "epoch": 3004} {"train_loss": -6.71540641784668, "global_step": 126170, "epoch": 3004} {"train_loss": -6.618712902069092, "global_step": 126171, "epoch": 3004} {"train_loss": -6.624691009521484, "global_step": 126172, "epoch": 3004} {"train_loss": -6.6056294441223145, "global_step": 126173, "epoch": 3004} {"train_loss": -6.715325355529785, "global_step": 126174, "epoch": 3004} {"train_loss": -6.580521106719971, "global_step": 126175, "epoch": 3004} {"train_loss": -6.600379467010498, "global_step": 126176, "epoch": 3004} {"train_loss": -6.577816009521484, "global_step": 126177, "epoch": 3004} {"train_loss": -6.513415336608887, "global_step": 126178, "epoch": 3004} {"train_loss": -6.8370585441589355, "global_step": 126179, "epoch": 3004} {"train_loss": -6.568354606628418, "global_step": 126180, "epoch": 3004} {"train_loss": -6.648681163787842, "global_step": 126181, "epoch": 3004} {"train_loss": -6.6773529052734375, "global_step": 126182, "epoch": 3004} {"train_loss": -6.570565223693848, "global_step": 126183, "epoch": 3004} {"train_loss": -6.60213565826416, "global_step": 126184, "epoch": 3004} {"train_loss": -6.515863418579102, "global_step": 126185, "epoch": 3004} {"train_loss": -6.732670783996582, "global_step": 126186, "epoch": 3004} {"train_loss": -6.6395649909973145, "global_step": 126187, "epoch": 3004} {"train_loss": -6.6024932861328125, "global_step": 126188, "epoch": 3004} {"train_loss": -6.643364906311035, "global_step": 126189, "epoch": 3004} {"train_loss": -6.641767978668213, "global_step": 126190, "epoch": 3004} {"train_loss": -6.620550155639648, "global_step": 126191, "epoch": 3004} {"train_loss": -6.545902252197266, "global_step": 126192, "epoch": 3004} {"train_loss": -6.557341575622559, "global_step": 126193, "epoch": 3004} {"train_loss": -6.440990447998047, "global_step": 126194, "epoch": 3004} {"train_loss": -6.617941856384277, "global_step": 126195, "epoch": 3004} {"train_loss": -6.578437328338623, "global_step": 126196, "epoch": 3004} {"train_loss": -6.4762468338012695, "global_step": 126197, "epoch": 3004} {"train_loss": -6.5580153465271, "global_step": 126198, "epoch": 3004} {"train_loss": -6.589076042175293, "global_step": 126199, "epoch": 3004} {"train_loss": -6.56755256652832, "global_step": 126200, "epoch": 3004} {"train_loss": -6.526390075683594, "global_step": 126201, "epoch": 3004} {"train_loss": -6.519433498382568, "global_step": 126202, "epoch": 3004} {"train_loss": -6.549320220947266, "global_step": 126203, "epoch": 3004} {"train_loss": -6.647813320159912, "global_step": 126204, "epoch": 3004} {"train_loss": -6.5792155265808105, "global_step": 126205, "epoch": 3004} {"train_loss": -6.631528854370117, "global_step": 126206, "epoch": 3004} {"train_loss": -6.548528671264648, "global_step": 126207, "epoch": 3004} {"train_loss": -6.618277072906494, "global_step": 126208, "epoch": 3004} {"train_loss": -6.600636096227737, "global_step": 126209, "epoch": 3004, "val_loss": 66333.171875} {"train_loss": -6.621863842010498, "global_step": 126210, "epoch": 3005} {"train_loss": -6.652996063232422, "global_step": 126211, "epoch": 3005} {"train_loss": -6.644183158874512, "global_step": 126212, "epoch": 3005} {"train_loss": -6.644734859466553, "global_step": 126213, "epoch": 3005} {"train_loss": -6.63355827331543, "global_step": 126214, "epoch": 3005} {"train_loss": -6.613217353820801, "global_step": 126215, "epoch": 3005} {"train_loss": -6.540637016296387, "global_step": 126216, "epoch": 3005} {"train_loss": -6.711026191711426, "global_step": 126217, "epoch": 3005} {"train_loss": -6.679509162902832, "global_step": 126218, "epoch": 3005} {"train_loss": -6.621891021728516, "global_step": 126219, "epoch": 3005} {"train_loss": -6.613951683044434, "global_step": 126220, "epoch": 3005} {"train_loss": -6.741486549377441, "global_step": 126221, "epoch": 3005} {"train_loss": -6.495794773101807, "global_step": 126222, "epoch": 3005} {"train_loss": -6.734769821166992, "global_step": 126223, "epoch": 3005} {"train_loss": -6.56320858001709, "global_step": 126224, "epoch": 3005} {"train_loss": -6.72945499420166, "global_step": 126225, "epoch": 3005} {"train_loss": -6.74108362197876, "global_step": 126226, "epoch": 3005} {"train_loss": -6.623074531555176, "global_step": 126227, "epoch": 3005} {"train_loss": -6.676239490509033, "global_step": 126228, "epoch": 3005} {"train_loss": -6.620923042297363, "global_step": 126229, "epoch": 3005} {"train_loss": -6.704019546508789, "global_step": 126230, "epoch": 3005} {"train_loss": -6.631417274475098, "global_step": 126231, "epoch": 3005} {"train_loss": -6.552449703216553, "global_step": 126232, "epoch": 3005} {"train_loss": -6.690610885620117, "global_step": 126233, "epoch": 3005} {"train_loss": -6.619476795196533, "global_step": 126234, "epoch": 3005} {"train_loss": -6.639114856719971, "global_step": 126235, "epoch": 3005} {"train_loss": -6.592779159545898, "global_step": 126236, "epoch": 3005} {"train_loss": -6.705719947814941, "global_step": 126237, "epoch": 3005} {"train_loss": -6.763920307159424, "global_step": 126238, "epoch": 3005} {"train_loss": -6.553557395935059, "global_step": 126239, "epoch": 3005} {"train_loss": -6.619959831237793, "global_step": 126240, "epoch": 3005} {"train_loss": -6.668474197387695, "global_step": 126241, "epoch": 3005} {"train_loss": -6.723817825317383, "global_step": 126242, "epoch": 3005} {"train_loss": -6.519578456878662, "global_step": 126243, "epoch": 3005} {"train_loss": -6.6345133781433105, "global_step": 126244, "epoch": 3005} {"train_loss": -6.666477203369141, "global_step": 126245, "epoch": 3005} {"train_loss": -6.5726470947265625, "global_step": 126246, "epoch": 3005} {"train_loss": -6.359516143798828, "global_step": 126247, "epoch": 3005} {"train_loss": -6.632750511169434, "global_step": 126248, "epoch": 3005} {"train_loss": -6.541133880615234, "global_step": 126249, "epoch": 3005} {"train_loss": -6.614500045776367, "global_step": 126250, "epoch": 3005} {"train_loss": -6.631403537023635, "global_step": 126251, "epoch": 3005, "val_loss": 66426.3984375} {"train_loss": -6.595444679260254, "global_step": 126252, "epoch": 3006} {"train_loss": -6.5424041748046875, "global_step": 126253, "epoch": 3006} {"train_loss": -6.5783843994140625, "global_step": 126254, "epoch": 3006} {"train_loss": -6.5832133293151855, "global_step": 126255, "epoch": 3006} {"train_loss": -6.57194709777832, "global_step": 126256, "epoch": 3006} {"train_loss": -6.647055625915527, "global_step": 126257, "epoch": 3006} {"train_loss": -6.61194372177124, "global_step": 126258, "epoch": 3006} {"train_loss": -6.410566329956055, "global_step": 126259, "epoch": 3006} {"train_loss": -6.607922077178955, "global_step": 126260, "epoch": 3006} {"train_loss": -6.660979270935059, "global_step": 126261, "epoch": 3006} {"train_loss": -6.527925491333008, "global_step": 126262, "epoch": 3006} {"train_loss": -6.65850830078125, "global_step": 126263, "epoch": 3006} {"train_loss": -6.534925937652588, "global_step": 126264, "epoch": 3006} {"train_loss": -6.627849578857422, "global_step": 126265, "epoch": 3006} {"train_loss": -6.674360752105713, "global_step": 126266, "epoch": 3006} {"train_loss": -6.608421802520752, "global_step": 126267, "epoch": 3006} {"train_loss": -6.638615608215332, "global_step": 126268, "epoch": 3006} {"train_loss": -6.5767822265625, "global_step": 126269, "epoch": 3006} {"train_loss": -6.620635509490967, "global_step": 126270, "epoch": 3006} {"train_loss": -6.442445755004883, "global_step": 126271, "epoch": 3006} {"train_loss": -6.557170867919922, "global_step": 126272, "epoch": 3006} {"train_loss": -6.652028560638428, "global_step": 126273, "epoch": 3006} {"train_loss": -6.556367874145508, "global_step": 126274, "epoch": 3006} {"train_loss": -6.4677734375, "global_step": 126275, "epoch": 3006} {"train_loss": -6.613203525543213, "global_step": 126276, "epoch": 3006} {"train_loss": -6.52829647064209, "global_step": 126277, "epoch": 3006} {"train_loss": -6.514894485473633, "global_step": 126278, "epoch": 3006} {"train_loss": -6.59736442565918, "global_step": 126279, "epoch": 3006} {"train_loss": -6.519434452056885, "global_step": 126280, "epoch": 3006} {"train_loss": -6.527341842651367, "global_step": 126281, "epoch": 3006} {"train_loss": -6.6960368156433105, "global_step": 126282, "epoch": 3006} {"train_loss": -6.492387771606445, "global_step": 126283, "epoch": 3006} {"train_loss": -6.640291213989258, "global_step": 126284, "epoch": 3006} {"train_loss": -6.606117248535156, "global_step": 126285, "epoch": 3006} {"train_loss": -6.587087154388428, "global_step": 126286, "epoch": 3006} {"train_loss": -6.590312480926514, "global_step": 126287, "epoch": 3006} {"train_loss": -6.559963226318359, "global_step": 126288, "epoch": 3006} {"train_loss": -6.623191833496094, "global_step": 126289, "epoch": 3006} {"train_loss": -6.612853527069092, "global_step": 126290, "epoch": 3006} {"train_loss": -6.502616882324219, "global_step": 126291, "epoch": 3006} {"train_loss": -6.505566596984863, "global_step": 126292, "epoch": 3006} {"train_loss": -6.576821043377831, "global_step": 126293, "epoch": 3006, "val_loss": 66162.3125} {"train_loss": -6.5956926345825195, "global_step": 126294, "epoch": 3007} {"train_loss": -6.576654434204102, "global_step": 126295, "epoch": 3007} {"train_loss": -6.540982246398926, "global_step": 126296, "epoch": 3007} {"train_loss": -6.473283767700195, "global_step": 126297, "epoch": 3007} {"train_loss": -6.588967323303223, "global_step": 126298, "epoch": 3007} {"train_loss": -6.679624557495117, "global_step": 126299, "epoch": 3007} {"train_loss": -6.596776008605957, "global_step": 126300, "epoch": 3007} {"train_loss": -6.51552152633667, "global_step": 126301, "epoch": 3007} {"train_loss": -6.611274242401123, "global_step": 126302, "epoch": 3007} {"train_loss": -6.547984600067139, "global_step": 126303, "epoch": 3007} {"train_loss": -6.571994781494141, "global_step": 126304, "epoch": 3007} {"train_loss": -6.523436546325684, "global_step": 126305, "epoch": 3007} {"train_loss": -6.555549621582031, "global_step": 126306, "epoch": 3007} {"train_loss": -6.594778060913086, "global_step": 126307, "epoch": 3007} {"train_loss": -6.50513219833374, "global_step": 126308, "epoch": 3007} {"train_loss": -6.620455265045166, "global_step": 126309, "epoch": 3007} {"train_loss": -6.561840057373047, "global_step": 126310, "epoch": 3007} {"train_loss": -6.50046443939209, "global_step": 126311, "epoch": 3007} {"train_loss": -6.5179290771484375, "global_step": 126312, "epoch": 3007} {"train_loss": -6.553450584411621, "global_step": 126313, "epoch": 3007} {"train_loss": -6.621766090393066, "global_step": 126314, "epoch": 3007} {"train_loss": -6.48956298828125, "global_step": 126315, "epoch": 3007} {"train_loss": -6.665668487548828, "global_step": 126316, "epoch": 3007} {"train_loss": -6.576037406921387, "global_step": 126317, "epoch": 3007} {"train_loss": -6.5518412590026855, "global_step": 126318, "epoch": 3007} {"train_loss": -6.724573612213135, "global_step": 126319, "epoch": 3007} {"train_loss": -6.509498119354248, "global_step": 126320, "epoch": 3007} {"train_loss": -6.629637718200684, "global_step": 126321, "epoch": 3007} {"train_loss": -6.567505836486816, "global_step": 126322, "epoch": 3007} {"train_loss": -6.599228858947754, "global_step": 126323, "epoch": 3007} {"train_loss": -6.609658241271973, "global_step": 126324, "epoch": 3007} {"train_loss": -6.6137776374816895, "global_step": 126325, "epoch": 3007} {"train_loss": -6.597240924835205, "global_step": 126326, "epoch": 3007} {"train_loss": -6.589280128479004, "global_step": 126327, "epoch": 3007} {"train_loss": -6.614779472351074, "global_step": 126328, "epoch": 3007} {"train_loss": -6.608819961547852, "global_step": 126329, "epoch": 3007} {"train_loss": -6.628454208374023, "global_step": 126330, "epoch": 3007} {"train_loss": -6.686515808105469, "global_step": 126331, "epoch": 3007} {"train_loss": -6.627692222595215, "global_step": 126332, "epoch": 3007} {"train_loss": -6.6464948654174805, "global_step": 126333, "epoch": 3007} {"train_loss": -6.714718818664551, "global_step": 126334, "epoch": 3007} {"train_loss": -6.587971982501802, "global_step": 126335, "epoch": 3007, "val_loss": 66308.1484375} {"train_loss": -6.671722412109375, "global_step": 126336, "epoch": 3008} {"train_loss": -6.609217166900635, "global_step": 126337, "epoch": 3008} {"train_loss": -6.603799343109131, "global_step": 126338, "epoch": 3008} {"train_loss": -6.673161506652832, "global_step": 126339, "epoch": 3008} {"train_loss": -6.671907424926758, "global_step": 126340, "epoch": 3008} {"train_loss": -6.643800258636475, "global_step": 126341, "epoch": 3008} {"train_loss": -6.605905532836914, "global_step": 126342, "epoch": 3008} {"train_loss": -6.558565139770508, "global_step": 126343, "epoch": 3008} {"train_loss": -6.738858222961426, "global_step": 126344, "epoch": 3008} {"train_loss": -6.422900199890137, "global_step": 126345, "epoch": 3008} {"train_loss": -6.639129161834717, "global_step": 126346, "epoch": 3008} {"train_loss": -6.573195457458496, "global_step": 126347, "epoch": 3008} {"train_loss": -6.574101448059082, "global_step": 126348, "epoch": 3008} {"train_loss": -6.591938018798828, "global_step": 126349, "epoch": 3008} {"train_loss": -6.697046279907227, "global_step": 126350, "epoch": 3008} {"train_loss": -6.593507289886475, "global_step": 126351, "epoch": 3008} {"train_loss": -6.698569297790527, "global_step": 126352, "epoch": 3008} {"train_loss": -6.6512451171875, "global_step": 126353, "epoch": 3008} {"train_loss": -6.624850273132324, "global_step": 126354, "epoch": 3008} {"train_loss": -6.65730094909668, "global_step": 126355, "epoch": 3008} {"train_loss": -6.62985372543335, "global_step": 126356, "epoch": 3008} {"train_loss": -6.679265975952148, "global_step": 126357, "epoch": 3008} {"train_loss": -6.652496337890625, "global_step": 126358, "epoch": 3008} {"train_loss": -6.56291389465332, "global_step": 126359, "epoch": 3008} {"train_loss": -6.683177947998047, "global_step": 126360, "epoch": 3008} {"train_loss": -6.642897129058838, "global_step": 126361, "epoch": 3008} {"train_loss": -6.592820167541504, "global_step": 126362, "epoch": 3008} {"train_loss": -6.749535083770752, "global_step": 126363, "epoch": 3008} {"train_loss": -6.6035685539245605, "global_step": 126364, "epoch": 3008} {"train_loss": -6.679429054260254, "global_step": 126365, "epoch": 3008} {"train_loss": -6.690069198608398, "global_step": 126366, "epoch": 3008} {"train_loss": -6.664882659912109, "global_step": 126367, "epoch": 3008} {"train_loss": -6.695476531982422, "global_step": 126368, "epoch": 3008} {"train_loss": -6.704118728637695, "global_step": 126369, "epoch": 3008} {"train_loss": -6.693547248840332, "global_step": 126370, "epoch": 3008} {"train_loss": -6.573313236236572, "global_step": 126371, "epoch": 3008} {"train_loss": -6.6248698234558105, "global_step": 126372, "epoch": 3008} {"train_loss": -6.643557548522949, "global_step": 126373, "epoch": 3008} {"train_loss": -6.713143348693848, "global_step": 126374, "epoch": 3008} {"train_loss": -6.646427154541016, "global_step": 126375, "epoch": 3008} {"train_loss": -6.666221618652344, "global_step": 126376, "epoch": 3008} {"train_loss": -6.6434653259459, "global_step": 126377, "epoch": 3008, "val_loss": 66150.1484375} {"train_loss": -6.7232666015625, "global_step": 126378, "epoch": 3009} {"train_loss": -6.78080415725708, "global_step": 126379, "epoch": 3009} {"train_loss": -6.558289527893066, "global_step": 126380, "epoch": 3009} {"train_loss": -6.761847972869873, "global_step": 126381, "epoch": 3009} {"train_loss": -6.718691825866699, "global_step": 126382, "epoch": 3009} {"train_loss": -6.733327865600586, "global_step": 126383, "epoch": 3009} {"train_loss": -6.670716285705566, "global_step": 126384, "epoch": 3009} {"train_loss": -6.587264537811279, "global_step": 126385, "epoch": 3009} {"train_loss": -6.695534706115723, "global_step": 126386, "epoch": 3009} {"train_loss": -6.56871223449707, "global_step": 126387, "epoch": 3009} {"train_loss": -6.652933597564697, "global_step": 126388, "epoch": 3009} {"train_loss": -6.712059020996094, "global_step": 126389, "epoch": 3009} {"train_loss": -6.76298189163208, "global_step": 126390, "epoch": 3009} {"train_loss": -6.627224445343018, "global_step": 126391, "epoch": 3009} {"train_loss": -6.6152215003967285, "global_step": 126392, "epoch": 3009} {"train_loss": -6.730681896209717, "global_step": 126393, "epoch": 3009} {"train_loss": -6.693713188171387, "global_step": 126394, "epoch": 3009} {"train_loss": -6.699357986450195, "global_step": 126395, "epoch": 3009} {"train_loss": -6.660219192504883, "global_step": 126396, "epoch": 3009} {"train_loss": -6.753913879394531, "global_step": 126397, "epoch": 3009} {"train_loss": -6.630434989929199, "global_step": 126398, "epoch": 3009} {"train_loss": -6.591468811035156, "global_step": 126399, "epoch": 3009} {"train_loss": -6.782164573669434, "global_step": 126400, "epoch": 3009} {"train_loss": -6.673666954040527, "global_step": 126401, "epoch": 3009} {"train_loss": -6.656826019287109, "global_step": 126402, "epoch": 3009} {"train_loss": -6.682584762573242, "global_step": 126403, "epoch": 3009} {"train_loss": -6.689695358276367, "global_step": 126404, "epoch": 3009} {"train_loss": -6.748037338256836, "global_step": 126405, "epoch": 3009} {"train_loss": -6.709600448608398, "global_step": 126406, "epoch": 3009} {"train_loss": -6.691692352294922, "global_step": 126407, "epoch": 3009} {"train_loss": -6.698947906494141, "global_step": 126408, "epoch": 3009} {"train_loss": -6.666960716247559, "global_step": 126409, "epoch": 3009} {"train_loss": -6.647792816162109, "global_step": 126410, "epoch": 3009} {"train_loss": -6.682493209838867, "global_step": 126411, "epoch": 3009} {"train_loss": -6.704870223999023, "global_step": 126412, "epoch": 3009} {"train_loss": -6.673058986663818, "global_step": 126413, "epoch": 3009} {"train_loss": -6.632540702819824, "global_step": 126414, "epoch": 3009} {"train_loss": -6.559410095214844, "global_step": 126415, "epoch": 3009} {"train_loss": -6.664104461669922, "global_step": 126416, "epoch": 3009} {"train_loss": -6.7263102531433105, "global_step": 126417, "epoch": 3009} {"train_loss": -6.605260848999023, "global_step": 126418, "epoch": 3009} {"train_loss": -6.676096609660557, "global_step": 126419, "epoch": 3009, "val_loss": 66321.734375} {"train_loss": -6.690372943878174, "global_step": 126420, "epoch": 3010} {"train_loss": -6.686624526977539, "global_step": 126421, "epoch": 3010} {"train_loss": -6.595670700073242, "global_step": 126422, "epoch": 3010} {"train_loss": -6.590569019317627, "global_step": 126423, "epoch": 3010} {"train_loss": -6.59214973449707, "global_step": 126424, "epoch": 3010} {"train_loss": -6.548983097076416, "global_step": 126425, "epoch": 3010} {"train_loss": -6.568190574645996, "global_step": 126426, "epoch": 3010} {"train_loss": -6.619865417480469, "global_step": 126427, "epoch": 3010} {"train_loss": -6.495450019836426, "global_step": 126428, "epoch": 3010} {"train_loss": -6.528467178344727, "global_step": 126429, "epoch": 3010} {"train_loss": -6.517417907714844, "global_step": 126430, "epoch": 3010} {"train_loss": -6.448285102844238, "global_step": 126431, "epoch": 3010} {"train_loss": -6.606086730957031, "global_step": 126432, "epoch": 3010} {"train_loss": -6.5372209548950195, "global_step": 126433, "epoch": 3010} {"train_loss": -6.464056015014648, "global_step": 126434, "epoch": 3010} {"train_loss": -6.619794845581055, "global_step": 126435, "epoch": 3010} {"train_loss": -6.658665180206299, "global_step": 126436, "epoch": 3010} {"train_loss": -6.609609603881836, "global_step": 126437, "epoch": 3010} {"train_loss": -6.588523864746094, "global_step": 126438, "epoch": 3010} {"train_loss": -6.645323753356934, "global_step": 126439, "epoch": 3010} {"train_loss": -6.5504350662231445, "global_step": 126440, "epoch": 3010} {"train_loss": -6.530213832855225, "global_step": 126441, "epoch": 3010} {"train_loss": -6.675012111663818, "global_step": 126442, "epoch": 3010} {"train_loss": -6.738221168518066, "global_step": 126443, "epoch": 3010} {"train_loss": -6.668834686279297, "global_step": 126444, "epoch": 3010} {"train_loss": -6.656177520751953, "global_step": 126445, "epoch": 3010} {"train_loss": -6.679543495178223, "global_step": 126446, "epoch": 3010} {"train_loss": -6.641232490539551, "global_step": 126447, "epoch": 3010} {"train_loss": -6.629661560058594, "global_step": 126448, "epoch": 3010} {"train_loss": -6.68910551071167, "global_step": 126449, "epoch": 3010} {"train_loss": -6.641341209411621, "global_step": 126450, "epoch": 3010} {"train_loss": -6.726802825927734, "global_step": 126451, "epoch": 3010} {"train_loss": -6.745575904846191, "global_step": 126452, "epoch": 3010} {"train_loss": -6.748348236083984, "global_step": 126453, "epoch": 3010} {"train_loss": -6.71597146987915, "global_step": 126454, "epoch": 3010} {"train_loss": -6.715733528137207, "global_step": 126455, "epoch": 3010} {"train_loss": -6.778151988983154, "global_step": 126456, "epoch": 3010} {"train_loss": -6.59925651550293, "global_step": 126457, "epoch": 3010} {"train_loss": -6.5802903175354, "global_step": 126458, "epoch": 3010} {"train_loss": -6.6876068115234375, "global_step": 126459, "epoch": 3010} {"train_loss": -6.750415802001953, "global_step": 126460, "epoch": 3010} {"train_loss": -6.628619636808123, "global_step": 126461, "epoch": 3010, "val_loss": 66042.265625} {"train_loss": -6.6698102951049805, "global_step": 126462, "epoch": 3011} {"train_loss": -6.611324310302734, "global_step": 126463, "epoch": 3011} {"train_loss": -6.680465221405029, "global_step": 126464, "epoch": 3011} {"train_loss": -6.721428871154785, "global_step": 126465, "epoch": 3011} {"train_loss": -6.73719596862793, "global_step": 126466, "epoch": 3011} {"train_loss": -6.593951225280762, "global_step": 126467, "epoch": 3011} {"train_loss": -6.709320068359375, "global_step": 126468, "epoch": 3011} {"train_loss": -6.6218132972717285, "global_step": 126469, "epoch": 3011} {"train_loss": -6.605884552001953, "global_step": 126470, "epoch": 3011} {"train_loss": -6.551881313323975, "global_step": 126471, "epoch": 3011} {"train_loss": -6.664702415466309, "global_step": 126472, "epoch": 3011} {"train_loss": -6.707483291625977, "global_step": 126473, "epoch": 3011} {"train_loss": -6.654548645019531, "global_step": 126474, "epoch": 3011} {"train_loss": -6.696608543395996, "global_step": 126475, "epoch": 3011} {"train_loss": -6.598472595214844, "global_step": 126476, "epoch": 3011} {"train_loss": -6.503773212432861, "global_step": 126477, "epoch": 3011} {"train_loss": -6.567695617675781, "global_step": 126478, "epoch": 3011} {"train_loss": -6.670154094696045, "global_step": 126479, "epoch": 3011} {"train_loss": -6.584747314453125, "global_step": 126480, "epoch": 3011} {"train_loss": -6.700442790985107, "global_step": 126481, "epoch": 3011} {"train_loss": -6.5718255043029785, "global_step": 126482, "epoch": 3011} {"train_loss": -6.565721035003662, "global_step": 126483, "epoch": 3011} {"train_loss": -6.527937889099121, "global_step": 126484, "epoch": 3011} {"train_loss": -6.61860466003418, "global_step": 126485, "epoch": 3011} {"train_loss": -6.5542097091674805, "global_step": 126486, "epoch": 3011} {"train_loss": -6.673620223999023, "global_step": 126487, "epoch": 3011} {"train_loss": -6.633296966552734, "global_step": 126488, "epoch": 3011} {"train_loss": -6.621124744415283, "global_step": 126489, "epoch": 3011} {"train_loss": -6.701545715332031, "global_step": 126490, "epoch": 3011} {"train_loss": -6.514811992645264, "global_step": 126491, "epoch": 3011} {"train_loss": -6.660423755645752, "global_step": 126492, "epoch": 3011} {"train_loss": -6.551732540130615, "global_step": 126493, "epoch": 3011} {"train_loss": -6.659067630767822, "global_step": 126494, "epoch": 3011} {"train_loss": -6.736555099487305, "global_step": 126495, "epoch": 3011} {"train_loss": -6.6048736572265625, "global_step": 126496, "epoch": 3011} {"train_loss": -6.689001560211182, "global_step": 126497, "epoch": 3011} {"train_loss": -6.733118534088135, "global_step": 126498, "epoch": 3011} {"train_loss": -6.545710563659668, "global_step": 126499, "epoch": 3011} {"train_loss": -6.720719337463379, "global_step": 126500, "epoch": 3011} {"train_loss": -6.556553363800049, "global_step": 126501, "epoch": 3011} {"train_loss": -6.546901702880859, "global_step": 126502, "epoch": 3011} {"train_loss": -6.630174954732259, "global_step": 126503, "epoch": 3011, "val_loss": 66508.625} {"train_loss": -6.681541442871094, "global_step": 126504, "epoch": 3012} {"train_loss": -6.660045623779297, "global_step": 126505, "epoch": 3012} {"train_loss": -6.59031343460083, "global_step": 126506, "epoch": 3012} {"train_loss": -6.688695907592773, "global_step": 126507, "epoch": 3012} {"train_loss": -6.5284600257873535, "global_step": 126508, "epoch": 3012} {"train_loss": -6.511120796203613, "global_step": 126509, "epoch": 3012} {"train_loss": -6.645596981048584, "global_step": 126510, "epoch": 3012} {"train_loss": -6.641345500946045, "global_step": 126511, "epoch": 3012} {"train_loss": -6.590193748474121, "global_step": 126512, "epoch": 3012} {"train_loss": -6.643375396728516, "global_step": 126513, "epoch": 3012} {"train_loss": -6.619073390960693, "global_step": 126514, "epoch": 3012} {"train_loss": -6.600847244262695, "global_step": 126515, "epoch": 3012} {"train_loss": -6.662783145904541, "global_step": 126516, "epoch": 3012} {"train_loss": -6.612152576446533, "global_step": 126517, "epoch": 3012} {"train_loss": -6.471166610717773, "global_step": 126518, "epoch": 3012} {"train_loss": -6.580043792724609, "global_step": 126519, "epoch": 3012} {"train_loss": -6.546518802642822, "global_step": 126520, "epoch": 3012} {"train_loss": -6.550106525421143, "global_step": 126521, "epoch": 3012} {"train_loss": -6.628657817840576, "global_step": 126522, "epoch": 3012} {"train_loss": -6.7008819580078125, "global_step": 126523, "epoch": 3012} {"train_loss": -6.583444118499756, "global_step": 126524, "epoch": 3012} {"train_loss": -6.597954750061035, "global_step": 126525, "epoch": 3012} {"train_loss": -6.563864231109619, "global_step": 126526, "epoch": 3012} {"train_loss": -6.538629531860352, "global_step": 126527, "epoch": 3012} {"train_loss": -6.525948524475098, "global_step": 126528, "epoch": 3012} {"train_loss": -6.760416030883789, "global_step": 126529, "epoch": 3012} {"train_loss": -6.716822624206543, "global_step": 126530, "epoch": 3012} {"train_loss": -6.758133411407471, "global_step": 126531, "epoch": 3012} {"train_loss": -6.761107444763184, "global_step": 126532, "epoch": 3012} {"train_loss": -6.641384124755859, "global_step": 126533, "epoch": 3012} {"train_loss": -6.5603179931640625, "global_step": 126534, "epoch": 3012} {"train_loss": -6.627211093902588, "global_step": 126535, "epoch": 3012} {"train_loss": -6.697898864746094, "global_step": 126536, "epoch": 3012} {"train_loss": -6.694430351257324, "global_step": 126537, "epoch": 3012} {"train_loss": -6.669887065887451, "global_step": 126538, "epoch": 3012} {"train_loss": -6.612576961517334, "global_step": 126539, "epoch": 3012} {"train_loss": -6.633084774017334, "global_step": 126540, "epoch": 3012} {"train_loss": -6.7132134437561035, "global_step": 126541, "epoch": 3012} {"train_loss": -6.508356094360352, "global_step": 126542, "epoch": 3012} {"train_loss": -6.715517997741699, "global_step": 126543, "epoch": 3012} {"train_loss": -6.515349864959717, "global_step": 126544, "epoch": 3012} {"train_loss": -6.622490394683111, "global_step": 126545, "epoch": 3012, "val_loss": 66287.171875} {"train_loss": -6.689782619476318, "global_step": 126546, "epoch": 3013} {"train_loss": -6.71879768371582, "global_step": 126547, "epoch": 3013} {"train_loss": -6.648355484008789, "global_step": 126548, "epoch": 3013} {"train_loss": -6.7220869064331055, "global_step": 126549, "epoch": 3013} {"train_loss": -6.668338775634766, "global_step": 126550, "epoch": 3013} {"train_loss": -6.6034650802612305, "global_step": 126551, "epoch": 3013} {"train_loss": -6.6101531982421875, "global_step": 126552, "epoch": 3013} {"train_loss": -6.6861186027526855, "global_step": 126553, "epoch": 3013} {"train_loss": -6.620304107666016, "global_step": 126554, "epoch": 3013} {"train_loss": -6.637414455413818, "global_step": 126555, "epoch": 3013} {"train_loss": -6.632513999938965, "global_step": 126556, "epoch": 3013} {"train_loss": -6.546603202819824, "global_step": 126557, "epoch": 3013} {"train_loss": -6.656632900238037, "global_step": 126558, "epoch": 3013} {"train_loss": -6.631627082824707, "global_step": 126559, "epoch": 3013} {"train_loss": -6.5517964363098145, "global_step": 126560, "epoch": 3013} {"train_loss": -6.603507041931152, "global_step": 126561, "epoch": 3013} {"train_loss": -6.601685523986816, "global_step": 126562, "epoch": 3013} {"train_loss": -6.590188980102539, "global_step": 126563, "epoch": 3013} {"train_loss": -6.598983287811279, "global_step": 126564, "epoch": 3013} {"train_loss": -6.698725700378418, "global_step": 126565, "epoch": 3013} {"train_loss": -6.648700714111328, "global_step": 126566, "epoch": 3013} {"train_loss": -6.550040245056152, "global_step": 126567, "epoch": 3013} {"train_loss": -6.705859184265137, "global_step": 126568, "epoch": 3013} {"train_loss": -6.626432418823242, "global_step": 126569, "epoch": 3013} {"train_loss": -6.5910797119140625, "global_step": 126570, "epoch": 3013} {"train_loss": -6.588533401489258, "global_step": 126571, "epoch": 3013} {"train_loss": -6.606283187866211, "global_step": 126572, "epoch": 3013} {"train_loss": -6.542433738708496, "global_step": 126573, "epoch": 3013} {"train_loss": -6.625616550445557, "global_step": 126574, "epoch": 3013} {"train_loss": -6.730510234832764, "global_step": 126575, "epoch": 3013} {"train_loss": -6.765571594238281, "global_step": 126576, "epoch": 3013} {"train_loss": -6.6697235107421875, "global_step": 126577, "epoch": 3013} {"train_loss": -6.699705123901367, "global_step": 126578, "epoch": 3013} {"train_loss": -6.671738624572754, "global_step": 126579, "epoch": 3013} {"train_loss": -6.602231979370117, "global_step": 126580, "epoch": 3013} {"train_loss": -6.714075088500977, "global_step": 126581, "epoch": 3013} {"train_loss": -6.671062469482422, "global_step": 126582, "epoch": 3013} {"train_loss": -6.715247631072998, "global_step": 126583, "epoch": 3013} {"train_loss": -6.544680118560791, "global_step": 126584, "epoch": 3013} {"train_loss": -6.607942581176758, "global_step": 126585, "epoch": 3013} {"train_loss": -6.533923149108887, "global_step": 126586, "epoch": 3013} {"train_loss": -6.637600728443691, "global_step": 126587, "epoch": 3013, "val_loss": 66033.1953125} {"train_loss": -6.7243804931640625, "global_step": 126588, "epoch": 3014} {"train_loss": -6.641806602478027, "global_step": 126589, "epoch": 3014} {"train_loss": -6.742147445678711, "global_step": 126590, "epoch": 3014} {"train_loss": -6.683067321777344, "global_step": 126591, "epoch": 3014} {"train_loss": -6.671601295471191, "global_step": 126592, "epoch": 3014} {"train_loss": -6.621648788452148, "global_step": 126593, "epoch": 3014} {"train_loss": -6.6902265548706055, "global_step": 126594, "epoch": 3014} {"train_loss": -6.679112434387207, "global_step": 126595, "epoch": 3014} {"train_loss": -6.591330051422119, "global_step": 126596, "epoch": 3014} {"train_loss": -6.561567783355713, "global_step": 126597, "epoch": 3014} {"train_loss": -6.563486099243164, "global_step": 126598, "epoch": 3014} {"train_loss": -6.517167091369629, "global_step": 126599, "epoch": 3014} {"train_loss": -6.51381778717041, "global_step": 126600, "epoch": 3014} {"train_loss": -6.722559928894043, "global_step": 126601, "epoch": 3014} {"train_loss": -6.4650163650512695, "global_step": 126602, "epoch": 3014} {"train_loss": -6.682833194732666, "global_step": 126603, "epoch": 3014} {"train_loss": -6.4253058433532715, "global_step": 126604, "epoch": 3014} {"train_loss": -6.538528919219971, "global_step": 126605, "epoch": 3014} {"train_loss": -6.5653076171875, "global_step": 126606, "epoch": 3014} {"train_loss": -6.529048919677734, "global_step": 126607, "epoch": 3014} {"train_loss": -6.636479377746582, "global_step": 126608, "epoch": 3014} {"train_loss": -6.491593360900879, "global_step": 126609, "epoch": 3014} {"train_loss": -6.607605934143066, "global_step": 126610, "epoch": 3014} {"train_loss": -6.516381740570068, "global_step": 126611, "epoch": 3014} {"train_loss": -6.498271465301514, "global_step": 126612, "epoch": 3014} {"train_loss": -6.4888224601745605, "global_step": 126613, "epoch": 3014} {"train_loss": -6.588476181030273, "global_step": 126614, "epoch": 3014} {"train_loss": -6.635089874267578, "global_step": 126615, "epoch": 3014} {"train_loss": -6.539153099060059, "global_step": 126616, "epoch": 3014} {"train_loss": -6.6430344581604, "global_step": 126617, "epoch": 3014} {"train_loss": -6.589637756347656, "global_step": 126618, "epoch": 3014} {"train_loss": -6.694034576416016, "global_step": 126619, "epoch": 3014} {"train_loss": -6.508156776428223, "global_step": 126620, "epoch": 3014} {"train_loss": -6.653384208679199, "global_step": 126621, "epoch": 3014} {"train_loss": -6.667750358581543, "global_step": 126622, "epoch": 3014} {"train_loss": -6.657809257507324, "global_step": 126623, "epoch": 3014} {"train_loss": -6.7358479499816895, "global_step": 126624, "epoch": 3014} {"train_loss": -6.582066535949707, "global_step": 126625, "epoch": 3014} {"train_loss": -6.526172637939453, "global_step": 126626, "epoch": 3014} {"train_loss": -6.524601459503174, "global_step": 126627, "epoch": 3014} {"train_loss": -6.58024787902832, "global_step": 126628, "epoch": 3014} {"train_loss": -6.598171767734346, "global_step": 126629, "epoch": 3014, "val_loss": 66330.2734375} {"train_loss": -6.544233322143555, "global_step": 126630, "epoch": 3015} {"train_loss": -6.65704870223999, "global_step": 126631, "epoch": 3015} {"train_loss": -6.473369598388672, "global_step": 126632, "epoch": 3015} {"train_loss": -6.566657543182373, "global_step": 126633, "epoch": 3015} {"train_loss": -6.544794082641602, "global_step": 126634, "epoch": 3015} {"train_loss": -6.652000904083252, "global_step": 126635, "epoch": 3015} {"train_loss": -6.561940670013428, "global_step": 126636, "epoch": 3015} {"train_loss": -6.512295246124268, "global_step": 126637, "epoch": 3015} {"train_loss": -6.5389814376831055, "global_step": 126638, "epoch": 3015} {"train_loss": -6.67997932434082, "global_step": 126639, "epoch": 3015} {"train_loss": -6.630564212799072, "global_step": 126640, "epoch": 3015} {"train_loss": -6.649258613586426, "global_step": 126641, "epoch": 3015} {"train_loss": -6.580299377441406, "global_step": 126642, "epoch": 3015} {"train_loss": -6.649017810821533, "global_step": 126643, "epoch": 3015} {"train_loss": -6.696935176849365, "global_step": 126644, "epoch": 3015} {"train_loss": -6.774614334106445, "global_step": 126645, "epoch": 3015} {"train_loss": -6.706070899963379, "global_step": 126646, "epoch": 3015} {"train_loss": -6.678125858306885, "global_step": 126647, "epoch": 3015} {"train_loss": -6.7148566246032715, "global_step": 126648, "epoch": 3015} {"train_loss": -6.679802894592285, "global_step": 126649, "epoch": 3015} {"train_loss": -6.597437858581543, "global_step": 126650, "epoch": 3015} {"train_loss": -6.634897232055664, "global_step": 126651, "epoch": 3015} {"train_loss": -6.699981689453125, "global_step": 126652, "epoch": 3015} {"train_loss": -6.754260063171387, "global_step": 126653, "epoch": 3015} {"train_loss": -6.7170844078063965, "global_step": 126654, "epoch": 3015} {"train_loss": -6.6074604988098145, "global_step": 126655, "epoch": 3015} {"train_loss": -6.754054069519043, "global_step": 126656, "epoch": 3015} {"train_loss": -6.598221302032471, "global_step": 126657, "epoch": 3015} {"train_loss": -6.7027106285095215, "global_step": 126658, "epoch": 3015} {"train_loss": -6.648937225341797, "global_step": 126659, "epoch": 3015} {"train_loss": -6.678011894226074, "global_step": 126660, "epoch": 3015} {"train_loss": -6.692831993103027, "global_step": 126661, "epoch": 3015} {"train_loss": -6.671883583068848, "global_step": 126662, "epoch": 3015} {"train_loss": -6.659616470336914, "global_step": 126663, "epoch": 3015} {"train_loss": -6.691686630249023, "global_step": 126664, "epoch": 3015} {"train_loss": -6.538980007171631, "global_step": 126665, "epoch": 3015} {"train_loss": -6.777846813201904, "global_step": 126666, "epoch": 3015} {"train_loss": -6.730538368225098, "global_step": 126667, "epoch": 3015} {"train_loss": -6.631768226623535, "global_step": 126668, "epoch": 3015} {"train_loss": -6.54159688949585, "global_step": 126669, "epoch": 3015} {"train_loss": -6.607041835784912, "global_step": 126670, "epoch": 3015} {"train_loss": -6.6448422613598055, "global_step": 126671, "epoch": 3015, "val_loss": 66389.7265625} {"train_loss": -6.5923638343811035, "global_step": 126672, "epoch": 3016} {"train_loss": -6.587131977081299, "global_step": 126673, "epoch": 3016} {"train_loss": -6.812845230102539, "global_step": 126674, "epoch": 3016} {"train_loss": -6.780299186706543, "global_step": 126675, "epoch": 3016} {"train_loss": -6.582869052886963, "global_step": 126676, "epoch": 3016} {"train_loss": -6.48786735534668, "global_step": 126677, "epoch": 3016} {"train_loss": -6.653717994689941, "global_step": 126678, "epoch": 3016} {"train_loss": -6.600797653198242, "global_step": 126679, "epoch": 3016} {"train_loss": -6.6168107986450195, "global_step": 126680, "epoch": 3016} {"train_loss": -6.645906925201416, "global_step": 126681, "epoch": 3016} {"train_loss": -6.521702289581299, "global_step": 126682, "epoch": 3016} {"train_loss": -6.6532440185546875, "global_step": 126683, "epoch": 3016} {"train_loss": -6.695158004760742, "global_step": 126684, "epoch": 3016} {"train_loss": -6.661355972290039, "global_step": 126685, "epoch": 3016} {"train_loss": -6.660261154174805, "global_step": 126686, "epoch": 3016} {"train_loss": -6.603216171264648, "global_step": 126687, "epoch": 3016} {"train_loss": -6.570484638214111, "global_step": 126688, "epoch": 3016} {"train_loss": -6.4889116287231445, "global_step": 126689, "epoch": 3016} {"train_loss": -6.5578837394714355, "global_step": 126690, "epoch": 3016} {"train_loss": -6.573721885681152, "global_step": 126691, "epoch": 3016} {"train_loss": -6.406233310699463, "global_step": 126692, "epoch": 3016} {"train_loss": -6.650265693664551, "global_step": 126693, "epoch": 3016} {"train_loss": -6.442452430725098, "global_step": 126694, "epoch": 3016} {"train_loss": -6.614296913146973, "global_step": 126695, "epoch": 3016} {"train_loss": -6.575516700744629, "global_step": 126696, "epoch": 3016} {"train_loss": -6.567025184631348, "global_step": 126697, "epoch": 3016} {"train_loss": -6.533327579498291, "global_step": 126698, "epoch": 3016} {"train_loss": -6.459314346313477, "global_step": 126699, "epoch": 3016} {"train_loss": -6.614465713500977, "global_step": 126700, "epoch": 3016} {"train_loss": -6.397704124450684, "global_step": 126701, "epoch": 3016} {"train_loss": -6.596551895141602, "global_step": 126702, "epoch": 3016} {"train_loss": -6.543534278869629, "global_step": 126703, "epoch": 3016} {"train_loss": -6.692368507385254, "global_step": 126704, "epoch": 3016} {"train_loss": -6.534554958343506, "global_step": 126705, "epoch": 3016} {"train_loss": -6.557713031768799, "global_step": 126706, "epoch": 3016} {"train_loss": -6.574404716491699, "global_step": 126707, "epoch": 3016} {"train_loss": -6.455130577087402, "global_step": 126708, "epoch": 3016} {"train_loss": -6.519802093505859, "global_step": 126709, "epoch": 3016} {"train_loss": -6.5827956199646, "global_step": 126710, "epoch": 3016} {"train_loss": -6.602715015411377, "global_step": 126711, "epoch": 3016} {"train_loss": -6.6435136795043945, "global_step": 126712, "epoch": 3016} {"train_loss": -6.582742713746571, "global_step": 126713, "epoch": 3016, "val_loss": 66306.7421875} {"train_loss": -6.65311336517334, "global_step": 126714, "epoch": 3017} {"train_loss": -6.711228370666504, "global_step": 126715, "epoch": 3017} {"train_loss": -6.60080623626709, "global_step": 126716, "epoch": 3017} {"train_loss": -6.651122093200684, "global_step": 126717, "epoch": 3017} {"train_loss": -6.553154945373535, "global_step": 126718, "epoch": 3017} {"train_loss": -6.604182720184326, "global_step": 126719, "epoch": 3017} {"train_loss": -6.644008159637451, "global_step": 126720, "epoch": 3017} {"train_loss": -6.625314235687256, "global_step": 126721, "epoch": 3017} {"train_loss": -6.624402046203613, "global_step": 126722, "epoch": 3017} {"train_loss": -6.73579740524292, "global_step": 126723, "epoch": 3017} {"train_loss": -6.71157169342041, "global_step": 126724, "epoch": 3017} {"train_loss": -6.704139709472656, "global_step": 126725, "epoch": 3017} {"train_loss": -6.706171989440918, "global_step": 126726, "epoch": 3017} {"train_loss": -6.529264450073242, "global_step": 126727, "epoch": 3017} {"train_loss": -6.689617156982422, "global_step": 126728, "epoch": 3017} {"train_loss": -6.783909797668457, "global_step": 126729, "epoch": 3017} {"train_loss": -6.623638153076172, "global_step": 126730, "epoch": 3017} {"train_loss": -6.7651166915893555, "global_step": 126731, "epoch": 3017} {"train_loss": -6.677396297454834, "global_step": 126732, "epoch": 3017} {"train_loss": -6.649910926818848, "global_step": 126733, "epoch": 3017} {"train_loss": -6.642302513122559, "global_step": 126734, "epoch": 3017} {"train_loss": -6.7038893699646, "global_step": 126735, "epoch": 3017} {"train_loss": -6.543434143066406, "global_step": 126736, "epoch": 3017} {"train_loss": -6.677774429321289, "global_step": 126737, "epoch": 3017} {"train_loss": -6.716787815093994, "global_step": 126738, "epoch": 3017} {"train_loss": -6.64039945602417, "global_step": 126739, "epoch": 3017} {"train_loss": -6.595839977264404, "global_step": 126740, "epoch": 3017} {"train_loss": -6.594964027404785, "global_step": 126741, "epoch": 3017} {"train_loss": -6.559598922729492, "global_step": 126742, "epoch": 3017} {"train_loss": -6.687709808349609, "global_step": 126743, "epoch": 3017} {"train_loss": -6.50429630279541, "global_step": 126744, "epoch": 3017} {"train_loss": -6.520412445068359, "global_step": 126745, "epoch": 3017} {"train_loss": -6.645916938781738, "global_step": 126746, "epoch": 3017} {"train_loss": -6.568650245666504, "global_step": 126747, "epoch": 3017} {"train_loss": -6.5442047119140625, "global_step": 126748, "epoch": 3017} {"train_loss": -6.533034324645996, "global_step": 126749, "epoch": 3017} {"train_loss": -6.525856018066406, "global_step": 126750, "epoch": 3017} {"train_loss": -6.603137016296387, "global_step": 126751, "epoch": 3017} {"train_loss": -6.556095123291016, "global_step": 126752, "epoch": 3017} {"train_loss": -6.573721885681152, "global_step": 126753, "epoch": 3017} {"train_loss": -6.7086381912231445, "global_step": 126754, "epoch": 3017} {"train_loss": -6.625291131791615, "global_step": 126755, "epoch": 3017, "val_loss": 66333.1328125} {"train_loss": -6.540706634521484, "global_step": 126756, "epoch": 3018} {"train_loss": -6.6291351318359375, "global_step": 126757, "epoch": 3018} {"train_loss": -6.522686004638672, "global_step": 126758, "epoch": 3018} {"train_loss": -6.650217056274414, "global_step": 126759, "epoch": 3018} {"train_loss": -6.570394515991211, "global_step": 126760, "epoch": 3018} {"train_loss": -6.561716079711914, "global_step": 126761, "epoch": 3018} {"train_loss": -6.559053897857666, "global_step": 126762, "epoch": 3018} {"train_loss": -6.535076141357422, "global_step": 126763, "epoch": 3018} {"train_loss": -6.564632415771484, "global_step": 126764, "epoch": 3018} {"train_loss": -6.4765238761901855, "global_step": 126765, "epoch": 3018} {"train_loss": -6.629955768585205, "global_step": 126766, "epoch": 3018} {"train_loss": -6.631757736206055, "global_step": 126767, "epoch": 3018} {"train_loss": -6.611863613128662, "global_step": 126768, "epoch": 3018} {"train_loss": -6.583881855010986, "global_step": 126769, "epoch": 3018} {"train_loss": -6.60548210144043, "global_step": 126770, "epoch": 3018} {"train_loss": -6.783498287200928, "global_step": 126771, "epoch": 3018} {"train_loss": -6.675215244293213, "global_step": 126772, "epoch": 3018} {"train_loss": -6.70150899887085, "global_step": 126773, "epoch": 3018} {"train_loss": -6.702903747558594, "global_step": 126774, "epoch": 3018} {"train_loss": -6.681147575378418, "global_step": 126775, "epoch": 3018} {"train_loss": -6.546783447265625, "global_step": 126776, "epoch": 3018} {"train_loss": -6.597098350524902, "global_step": 126777, "epoch": 3018} {"train_loss": -6.722539901733398, "global_step": 126778, "epoch": 3018} {"train_loss": -6.6556267738342285, "global_step": 126779, "epoch": 3018} {"train_loss": -6.688268661499023, "global_step": 126780, "epoch": 3018} {"train_loss": -6.734737396240234, "global_step": 126781, "epoch": 3018} {"train_loss": -6.622743606567383, "global_step": 126782, "epoch": 3018} {"train_loss": -6.722668170928955, "global_step": 126783, "epoch": 3018} {"train_loss": -6.60806941986084, "global_step": 126784, "epoch": 3018} {"train_loss": -6.720501899719238, "global_step": 126785, "epoch": 3018} {"train_loss": -6.698739051818848, "global_step": 126786, "epoch": 3018} {"train_loss": -6.755398750305176, "global_step": 126787, "epoch": 3018} {"train_loss": -6.702238082885742, "global_step": 126788, "epoch": 3018} {"train_loss": -6.659625053405762, "global_step": 126789, "epoch": 3018} {"train_loss": -6.716920852661133, "global_step": 126790, "epoch": 3018} {"train_loss": -6.583250522613525, "global_step": 126791, "epoch": 3018} {"train_loss": -6.6431074142456055, "global_step": 126792, "epoch": 3018} {"train_loss": -6.611464023590088, "global_step": 126793, "epoch": 3018} {"train_loss": -6.639936447143555, "global_step": 126794, "epoch": 3018} {"train_loss": -6.610006332397461, "global_step": 126795, "epoch": 3018} {"train_loss": -6.547928333282471, "global_step": 126796, "epoch": 3018} {"train_loss": -6.631671337854295, "global_step": 126797, "epoch": 3018, "val_loss": 66181.6328125} {"train_loss": -6.63442325592041, "global_step": 126798, "epoch": 3019} {"train_loss": -6.461034297943115, "global_step": 126799, "epoch": 3019} {"train_loss": -6.7021942138671875, "global_step": 126800, "epoch": 3019} {"train_loss": -6.496528625488281, "global_step": 126801, "epoch": 3019} {"train_loss": -6.689370155334473, "global_step": 126802, "epoch": 3019} {"train_loss": -6.641294479370117, "global_step": 126803, "epoch": 3019} {"train_loss": -6.621481895446777, "global_step": 126804, "epoch": 3019} {"train_loss": -6.558754920959473, "global_step": 126805, "epoch": 3019} {"train_loss": -6.55178165435791, "global_step": 126806, "epoch": 3019} {"train_loss": -6.6803693771362305, "global_step": 126807, "epoch": 3019} {"train_loss": -6.504148960113525, "global_step": 126808, "epoch": 3019} {"train_loss": -6.6778106689453125, "global_step": 126809, "epoch": 3019} {"train_loss": -6.629277229309082, "global_step": 126810, "epoch": 3019} {"train_loss": -6.726998329162598, "global_step": 126811, "epoch": 3019} {"train_loss": -6.77476167678833, "global_step": 126812, "epoch": 3019} {"train_loss": -6.659996032714844, "global_step": 126813, "epoch": 3019} {"train_loss": -6.4683613777160645, "global_step": 126814, "epoch": 3019} {"train_loss": -6.732623100280762, "global_step": 126815, "epoch": 3019} {"train_loss": -6.650230407714844, "global_step": 126816, "epoch": 3019} {"train_loss": -6.704700946807861, "global_step": 126817, "epoch": 3019} {"train_loss": -6.639800548553467, "global_step": 126818, "epoch": 3019} {"train_loss": -6.805728912353516, "global_step": 126819, "epoch": 3019} {"train_loss": -6.591641426086426, "global_step": 126820, "epoch": 3019} {"train_loss": -6.769632816314697, "global_step": 126821, "epoch": 3019} {"train_loss": -6.638216972351074, "global_step": 126822, "epoch": 3019} {"train_loss": -6.552859306335449, "global_step": 126823, "epoch": 3019} {"train_loss": -6.664012908935547, "global_step": 126824, "epoch": 3019} {"train_loss": -6.628264427185059, "global_step": 126825, "epoch": 3019} {"train_loss": -6.735562324523926, "global_step": 126826, "epoch": 3019} {"train_loss": -6.662234306335449, "global_step": 126827, "epoch": 3019} {"train_loss": -6.644989967346191, "global_step": 126828, "epoch": 3019} {"train_loss": -6.6045708656311035, "global_step": 126829, "epoch": 3019} {"train_loss": -6.620816230773926, "global_step": 126830, "epoch": 3019} {"train_loss": -6.745901107788086, "global_step": 126831, "epoch": 3019} {"train_loss": -6.683343410491943, "global_step": 126832, "epoch": 3019} {"train_loss": -6.669178009033203, "global_step": 126833, "epoch": 3019} {"train_loss": -6.7319746017456055, "global_step": 126834, "epoch": 3019} {"train_loss": -6.678557872772217, "global_step": 126835, "epoch": 3019} {"train_loss": -6.69205379486084, "global_step": 126836, "epoch": 3019} {"train_loss": -6.630265235900879, "global_step": 126837, "epoch": 3019} {"train_loss": -6.589299201965332, "global_step": 126838, "epoch": 3019} {"train_loss": -6.648604143233526, "global_step": 126839, "epoch": 3019, "val_loss": 66179.875} {"train_loss": -6.541356086730957, "global_step": 126840, "epoch": 3020} {"train_loss": -6.725897312164307, "global_step": 126841, "epoch": 3020} {"train_loss": -6.668954849243164, "global_step": 126842, "epoch": 3020} {"train_loss": -6.736640930175781, "global_step": 126843, "epoch": 3020} {"train_loss": -6.607182502746582, "global_step": 126844, "epoch": 3020} {"train_loss": -6.760151386260986, "global_step": 126845, "epoch": 3020} {"train_loss": -6.683850288391113, "global_step": 126846, "epoch": 3020} {"train_loss": -6.758233070373535, "global_step": 126847, "epoch": 3020} {"train_loss": -6.7772016525268555, "global_step": 126848, "epoch": 3020} {"train_loss": -6.649411678314209, "global_step": 126849, "epoch": 3020} {"train_loss": -6.734463691711426, "global_step": 126850, "epoch": 3020} {"train_loss": -6.73624849319458, "global_step": 126851, "epoch": 3020} {"train_loss": -6.659334182739258, "global_step": 126852, "epoch": 3020} {"train_loss": -6.641252517700195, "global_step": 126853, "epoch": 3020} {"train_loss": -6.640109062194824, "global_step": 126854, "epoch": 3020} {"train_loss": -6.660159111022949, "global_step": 126855, "epoch": 3020} {"train_loss": -6.648616790771484, "global_step": 126856, "epoch": 3020} {"train_loss": -6.638632297515869, "global_step": 126857, "epoch": 3020} {"train_loss": -6.672597885131836, "global_step": 126858, "epoch": 3020} {"train_loss": -6.639951705932617, "global_step": 126859, "epoch": 3020} {"train_loss": -6.663364410400391, "global_step": 126860, "epoch": 3020} {"train_loss": -6.654414176940918, "global_step": 126861, "epoch": 3020} {"train_loss": -6.622005462646484, "global_step": 126862, "epoch": 3020} {"train_loss": -6.557746410369873, "global_step": 126863, "epoch": 3020} {"train_loss": -6.603497505187988, "global_step": 126864, "epoch": 3020} {"train_loss": -6.608376502990723, "global_step": 126865, "epoch": 3020} {"train_loss": -6.74976921081543, "global_step": 126866, "epoch": 3020} {"train_loss": -6.6884026527404785, "global_step": 126867, "epoch": 3020} {"train_loss": -6.635638236999512, "global_step": 126868, "epoch": 3020} {"train_loss": -6.67573881149292, "global_step": 126869, "epoch": 3020} {"train_loss": -6.612927436828613, "global_step": 126870, "epoch": 3020} {"train_loss": -6.6630859375, "global_step": 126871, "epoch": 3020} {"train_loss": -6.555843353271484, "global_step": 126872, "epoch": 3020} {"train_loss": -6.631718635559082, "global_step": 126873, "epoch": 3020} {"train_loss": -6.633851051330566, "global_step": 126874, "epoch": 3020} {"train_loss": -6.757936477661133, "global_step": 126875, "epoch": 3020} {"train_loss": -6.667585372924805, "global_step": 126876, "epoch": 3020} {"train_loss": -6.578127861022949, "global_step": 126877, "epoch": 3020} {"train_loss": -6.5767693519592285, "global_step": 126878, "epoch": 3020} {"train_loss": -6.745950698852539, "global_step": 126879, "epoch": 3020} {"train_loss": -6.575474739074707, "global_step": 126880, "epoch": 3020} {"train_loss": -6.660208270663307, "global_step": 126881, "epoch": 3020, "val_loss": 66407.921875} {"train_loss": -6.599569797515869, "global_step": 126882, "epoch": 3021} {"train_loss": -6.598648548126221, "global_step": 126883, "epoch": 3021} {"train_loss": -6.695430755615234, "global_step": 126884, "epoch": 3021} {"train_loss": -6.572324752807617, "global_step": 126885, "epoch": 3021} {"train_loss": -6.571049213409424, "global_step": 126886, "epoch": 3021} {"train_loss": -6.519676208496094, "global_step": 126887, "epoch": 3021} {"train_loss": -6.594751358032227, "global_step": 126888, "epoch": 3021} {"train_loss": -6.574962139129639, "global_step": 126889, "epoch": 3021} {"train_loss": -6.566838264465332, "global_step": 126890, "epoch": 3021} {"train_loss": -6.556865215301514, "global_step": 126891, "epoch": 3021} {"train_loss": -6.658394813537598, "global_step": 126892, "epoch": 3021} {"train_loss": -6.577210426330566, "global_step": 126893, "epoch": 3021} {"train_loss": -6.677182674407959, "global_step": 126894, "epoch": 3021} {"train_loss": -6.578671932220459, "global_step": 126895, "epoch": 3021} {"train_loss": -6.586432456970215, "global_step": 126896, "epoch": 3021} {"train_loss": -6.602892875671387, "global_step": 126897, "epoch": 3021} {"train_loss": -6.66290283203125, "global_step": 126898, "epoch": 3021} {"train_loss": -6.599626541137695, "global_step": 126899, "epoch": 3021} {"train_loss": -6.4449462890625, "global_step": 126900, "epoch": 3021} {"train_loss": -6.553968906402588, "global_step": 126901, "epoch": 3021} {"train_loss": -6.715298652648926, "global_step": 126902, "epoch": 3021} {"train_loss": -6.626970291137695, "global_step": 126903, "epoch": 3021} {"train_loss": -6.5311174392700195, "global_step": 126904, "epoch": 3021} {"train_loss": -6.638004302978516, "global_step": 126905, "epoch": 3021} {"train_loss": -6.637759208679199, "global_step": 126906, "epoch": 3021} {"train_loss": -6.603193759918213, "global_step": 126907, "epoch": 3021} {"train_loss": -6.688324451446533, "global_step": 126908, "epoch": 3021} {"train_loss": -6.598329544067383, "global_step": 126909, "epoch": 3021} {"train_loss": -6.660719394683838, "global_step": 126910, "epoch": 3021} {"train_loss": -6.658648490905762, "global_step": 126911, "epoch": 3021} {"train_loss": -6.6610212326049805, "global_step": 126912, "epoch": 3021} {"train_loss": -6.565458297729492, "global_step": 126913, "epoch": 3021} {"train_loss": -6.714914798736572, "global_step": 126914, "epoch": 3021} {"train_loss": -6.589001655578613, "global_step": 126915, "epoch": 3021} {"train_loss": -6.573620319366455, "global_step": 126916, "epoch": 3021} {"train_loss": -6.744042873382568, "global_step": 126917, "epoch": 3021} {"train_loss": -6.731175899505615, "global_step": 126918, "epoch": 3021} {"train_loss": -6.742784023284912, "global_step": 126919, "epoch": 3021} {"train_loss": -6.662085056304932, "global_step": 126920, "epoch": 3021} {"train_loss": -6.6434197425842285, "global_step": 126921, "epoch": 3021} {"train_loss": -6.574346542358398, "global_step": 126922, "epoch": 3021} {"train_loss": -6.613917838959467, "global_step": 126923, "epoch": 3021, "val_loss": 66210.0859375} {"train_loss": -6.556582450866699, "global_step": 126924, "epoch": 3022} {"train_loss": -6.706052780151367, "global_step": 126925, "epoch": 3022} {"train_loss": -6.753651142120361, "global_step": 126926, "epoch": 3022} {"train_loss": -6.635030746459961, "global_step": 126927, "epoch": 3022} {"train_loss": -6.696551322937012, "global_step": 126928, "epoch": 3022} {"train_loss": -6.769342422485352, "global_step": 126929, "epoch": 3022} {"train_loss": -6.635753631591797, "global_step": 126930, "epoch": 3022} {"train_loss": -6.721395492553711, "global_step": 126931, "epoch": 3022} {"train_loss": -6.77163553237915, "global_step": 126932, "epoch": 3022} {"train_loss": -6.738059043884277, "global_step": 126933, "epoch": 3022} {"train_loss": -6.658445358276367, "global_step": 126934, "epoch": 3022} {"train_loss": -6.754293441772461, "global_step": 126935, "epoch": 3022} {"train_loss": -6.605287551879883, "global_step": 126936, "epoch": 3022} {"train_loss": -6.6670732498168945, "global_step": 126937, "epoch": 3022} {"train_loss": -6.696502685546875, "global_step": 126938, "epoch": 3022} {"train_loss": -6.661563873291016, "global_step": 126939, "epoch": 3022} {"train_loss": -6.696928977966309, "global_step": 126940, "epoch": 3022} {"train_loss": -6.597116947174072, "global_step": 126941, "epoch": 3022} {"train_loss": -6.728570938110352, "global_step": 126942, "epoch": 3022} {"train_loss": -6.734556198120117, "global_step": 126943, "epoch": 3022} {"train_loss": -6.604959011077881, "global_step": 126944, "epoch": 3022} {"train_loss": -6.649436950683594, "global_step": 126945, "epoch": 3022} {"train_loss": -6.804803371429443, "global_step": 126946, "epoch": 3022} {"train_loss": -6.520749092102051, "global_step": 126947, "epoch": 3022} {"train_loss": -6.596834182739258, "global_step": 126948, "epoch": 3022} {"train_loss": -6.560125350952148, "global_step": 126949, "epoch": 3022} {"train_loss": -6.604130744934082, "global_step": 126950, "epoch": 3022} {"train_loss": -6.563933849334717, "global_step": 126951, "epoch": 3022} {"train_loss": -6.567903995513916, "global_step": 126952, "epoch": 3022} {"train_loss": -6.651515960693359, "global_step": 126953, "epoch": 3022} {"train_loss": -6.703339576721191, "global_step": 126954, "epoch": 3022} {"train_loss": -6.650217056274414, "global_step": 126955, "epoch": 3022} {"train_loss": -6.598042964935303, "global_step": 126956, "epoch": 3022} {"train_loss": -6.645307540893555, "global_step": 126957, "epoch": 3022} {"train_loss": -6.497138977050781, "global_step": 126958, "epoch": 3022} {"train_loss": -6.718469619750977, "global_step": 126959, "epoch": 3022} {"train_loss": -6.632331848144531, "global_step": 126960, "epoch": 3022} {"train_loss": -6.65104866027832, "global_step": 126961, "epoch": 3022} {"train_loss": -6.625868797302246, "global_step": 126962, "epoch": 3022} {"train_loss": -6.639286994934082, "global_step": 126963, "epoch": 3022} {"train_loss": -6.727356910705566, "global_step": 126964, "epoch": 3022} {"train_loss": -6.6582105954488116, "global_step": 126965, "epoch": 3022, "val_loss": 66365.5703125} {"train_loss": -6.573378562927246, "global_step": 126966, "epoch": 3023} {"train_loss": -6.72697114944458, "global_step": 126967, "epoch": 3023} {"train_loss": -6.662055492401123, "global_step": 126968, "epoch": 3023} {"train_loss": -6.668285369873047, "global_step": 126969, "epoch": 3023} {"train_loss": -6.552037239074707, "global_step": 126970, "epoch": 3023} {"train_loss": -6.62908935546875, "global_step": 126971, "epoch": 3023} {"train_loss": -6.647221565246582, "global_step": 126972, "epoch": 3023} {"train_loss": -6.636354446411133, "global_step": 126973, "epoch": 3023} {"train_loss": -6.666008949279785, "global_step": 126974, "epoch": 3023} {"train_loss": -6.74306058883667, "global_step": 126975, "epoch": 3023} {"train_loss": -6.693404674530029, "global_step": 126976, "epoch": 3023} {"train_loss": -6.739452838897705, "global_step": 126977, "epoch": 3023} {"train_loss": -6.6674346923828125, "global_step": 126978, "epoch": 3023} {"train_loss": -6.668892860412598, "global_step": 126979, "epoch": 3023} {"train_loss": -6.642176628112793, "global_step": 126980, "epoch": 3023} {"train_loss": -6.627041339874268, "global_step": 126981, "epoch": 3023} {"train_loss": -6.594642639160156, "global_step": 126982, "epoch": 3023} {"train_loss": -6.572476863861084, "global_step": 126983, "epoch": 3023} {"train_loss": -6.627412796020508, "global_step": 126984, "epoch": 3023} {"train_loss": -6.611798286437988, "global_step": 126985, "epoch": 3023} {"train_loss": -6.609349250793457, "global_step": 126986, "epoch": 3023} {"train_loss": -6.610861778259277, "global_step": 126987, "epoch": 3023} {"train_loss": -6.73171854019165, "global_step": 126988, "epoch": 3023} {"train_loss": -6.6394572257995605, "global_step": 126989, "epoch": 3023} {"train_loss": -6.673639297485352, "global_step": 126990, "epoch": 3023} {"train_loss": -6.548725605010986, "global_step": 126991, "epoch": 3023} {"train_loss": -6.566463470458984, "global_step": 126992, "epoch": 3023} {"train_loss": -6.743373870849609, "global_step": 126993, "epoch": 3023} {"train_loss": -6.5955071449279785, "global_step": 126994, "epoch": 3023} {"train_loss": -6.637748718261719, "global_step": 126995, "epoch": 3023} {"train_loss": -6.713102340698242, "global_step": 126996, "epoch": 3023} {"train_loss": -6.67347526550293, "global_step": 126997, "epoch": 3023} {"train_loss": -6.644975185394287, "global_step": 126998, "epoch": 3023} {"train_loss": -6.487100601196289, "global_step": 126999, "epoch": 3023} {"train_loss": -6.60952091217041, "global_step": 127000, "epoch": 3023} {"train_loss": -6.621662139892578, "global_step": 127001, "epoch": 3023} {"train_loss": -6.653259754180908, "global_step": 127002, "epoch": 3023} {"train_loss": -6.613799095153809, "global_step": 127003, "epoch": 3023} {"train_loss": -6.6205854415893555, "global_step": 127004, "epoch": 3023} {"train_loss": -6.5710673332214355, "global_step": 127005, "epoch": 3023} {"train_loss": -6.576198101043701, "global_step": 127006, "epoch": 3023} {"train_loss": -6.636309226353963, "global_step": 127007, "epoch": 3023, "val_loss": 66147.4140625} {"train_loss": -6.646910667419434, "global_step": 127008, "epoch": 3024} {"train_loss": -6.567843437194824, "global_step": 127009, "epoch": 3024} {"train_loss": -6.638916015625, "global_step": 127010, "epoch": 3024} {"train_loss": -6.64498233795166, "global_step": 127011, "epoch": 3024} {"train_loss": -6.678894996643066, "global_step": 127012, "epoch": 3024} {"train_loss": -6.689092636108398, "global_step": 127013, "epoch": 3024} {"train_loss": -6.637822151184082, "global_step": 127014, "epoch": 3024} {"train_loss": -6.6440019607543945, "global_step": 127015, "epoch": 3024} {"train_loss": -6.733968257904053, "global_step": 127016, "epoch": 3024} {"train_loss": -6.6641154289245605, "global_step": 127017, "epoch": 3024} {"train_loss": -6.6407670974731445, "global_step": 127018, "epoch": 3024} {"train_loss": -6.631013870239258, "global_step": 127019, "epoch": 3024} {"train_loss": -6.666137218475342, "global_step": 127020, "epoch": 3024} {"train_loss": -6.5354204177856445, "global_step": 127021, "epoch": 3024} {"train_loss": -6.6632280349731445, "global_step": 127022, "epoch": 3024} {"train_loss": -6.607053279876709, "global_step": 127023, "epoch": 3024} {"train_loss": -6.739892482757568, "global_step": 127024, "epoch": 3024} {"train_loss": -6.698061943054199, "global_step": 127025, "epoch": 3024} {"train_loss": -6.636580467224121, "global_step": 127026, "epoch": 3024} {"train_loss": -6.6806535720825195, "global_step": 127027, "epoch": 3024} {"train_loss": -6.564444065093994, "global_step": 127028, "epoch": 3024} {"train_loss": -6.616824150085449, "global_step": 127029, "epoch": 3024} {"train_loss": -6.57771635055542, "global_step": 127030, "epoch": 3024} {"train_loss": -6.611517906188965, "global_step": 127031, "epoch": 3024} {"train_loss": -6.680795669555664, "global_step": 127032, "epoch": 3024} {"train_loss": -6.630796432495117, "global_step": 127033, "epoch": 3024} {"train_loss": -6.564915180206299, "global_step": 127034, "epoch": 3024} {"train_loss": -6.553989410400391, "global_step": 127035, "epoch": 3024} {"train_loss": -6.666012763977051, "global_step": 127036, "epoch": 3024} {"train_loss": -6.614501953125, "global_step": 127037, "epoch": 3024} {"train_loss": -6.688955307006836, "global_step": 127038, "epoch": 3024} {"train_loss": -6.637173652648926, "global_step": 127039, "epoch": 3024} {"train_loss": -6.472363471984863, "global_step": 127040, "epoch": 3024} {"train_loss": -6.601926803588867, "global_step": 127041, "epoch": 3024} {"train_loss": -6.522048473358154, "global_step": 127042, "epoch": 3024} {"train_loss": -6.607339382171631, "global_step": 127043, "epoch": 3024} {"train_loss": -6.619056701660156, "global_step": 127044, "epoch": 3024} {"train_loss": -6.613771438598633, "global_step": 127045, "epoch": 3024} {"train_loss": -6.507266998291016, "global_step": 127046, "epoch": 3024} {"train_loss": -6.681077003479004, "global_step": 127047, "epoch": 3024} {"train_loss": -6.426508903503418, "global_step": 127048, "epoch": 3024} {"train_loss": -6.62131515003386, "global_step": 127049, "epoch": 3024, "val_loss": 66265.0625} {"train_loss": -6.578536033630371, "global_step": 127050, "epoch": 3025} {"train_loss": -6.601502418518066, "global_step": 127051, "epoch": 3025} {"train_loss": -6.658149719238281, "global_step": 127052, "epoch": 3025} {"train_loss": -6.659841537475586, "global_step": 127053, "epoch": 3025} {"train_loss": -6.499874114990234, "global_step": 127054, "epoch": 3025} {"train_loss": -6.573420524597168, "global_step": 127055, "epoch": 3025} {"train_loss": -6.693778991699219, "global_step": 127056, "epoch": 3025} {"train_loss": -6.621973514556885, "global_step": 127057, "epoch": 3025} {"train_loss": -6.560542106628418, "global_step": 127058, "epoch": 3025} {"train_loss": -6.570977687835693, "global_step": 127059, "epoch": 3025} {"train_loss": -6.597445487976074, "global_step": 127060, "epoch": 3025} {"train_loss": -6.656048774719238, "global_step": 127061, "epoch": 3025} {"train_loss": -6.633138179779053, "global_step": 127062, "epoch": 3025} {"train_loss": -6.634889602661133, "global_step": 127063, "epoch": 3025} {"train_loss": -6.585991859436035, "global_step": 127064, "epoch": 3025} {"train_loss": -6.628204345703125, "global_step": 127065, "epoch": 3025} {"train_loss": -6.573657035827637, "global_step": 127066, "epoch": 3025} {"train_loss": -6.566987991333008, "global_step": 127067, "epoch": 3025} {"train_loss": -6.538990497589111, "global_step": 127068, "epoch": 3025} {"train_loss": -6.518387317657471, "global_step": 127069, "epoch": 3025} {"train_loss": -6.526251316070557, "global_step": 127070, "epoch": 3025} {"train_loss": -6.753164768218994, "global_step": 127071, "epoch": 3025} {"train_loss": -6.642502784729004, "global_step": 127072, "epoch": 3025} {"train_loss": -6.6582746505737305, "global_step": 127073, "epoch": 3025} {"train_loss": -6.665463447570801, "global_step": 127074, "epoch": 3025} {"train_loss": -6.729365825653076, "global_step": 127075, "epoch": 3025} {"train_loss": -6.732516288757324, "global_step": 127076, "epoch": 3025} {"train_loss": -6.739086151123047, "global_step": 127077, "epoch": 3025} {"train_loss": -6.618765830993652, "global_step": 127078, "epoch": 3025} {"train_loss": -6.619967460632324, "global_step": 127079, "epoch": 3025} {"train_loss": -6.651914596557617, "global_step": 127080, "epoch": 3025} {"train_loss": -6.6378912925720215, "global_step": 127081, "epoch": 3025} {"train_loss": -6.644811630249023, "global_step": 127082, "epoch": 3025} {"train_loss": -6.755877494812012, "global_step": 127083, "epoch": 3025} {"train_loss": -6.660693168640137, "global_step": 127084, "epoch": 3025} {"train_loss": -6.727175712585449, "global_step": 127085, "epoch": 3025} {"train_loss": -6.6821184158325195, "global_step": 127086, "epoch": 3025} {"train_loss": -6.689671039581299, "global_step": 127087, "epoch": 3025} {"train_loss": -6.7118306159973145, "global_step": 127088, "epoch": 3025} {"train_loss": -6.614353179931641, "global_step": 127089, "epoch": 3025} {"train_loss": -6.673276901245117, "global_step": 127090, "epoch": 3025} {"train_loss": -6.637084813345046, "global_step": 127091, "epoch": 3025, "val_loss": 66007.4296875} {"train_loss": -6.581099510192871, "global_step": 127092, "epoch": 3026} {"train_loss": -6.566732883453369, "global_step": 127093, "epoch": 3026} {"train_loss": -6.618131637573242, "global_step": 127094, "epoch": 3026} {"train_loss": -6.509818077087402, "global_step": 127095, "epoch": 3026} {"train_loss": -6.631858825683594, "global_step": 127096, "epoch": 3026} {"train_loss": -6.3561110496521, "global_step": 127097, "epoch": 3026} {"train_loss": -6.514122009277344, "global_step": 127098, "epoch": 3026} {"train_loss": -6.492439270019531, "global_step": 127099, "epoch": 3026} {"train_loss": -6.338929176330566, "global_step": 127100, "epoch": 3026} {"train_loss": -6.644126892089844, "global_step": 127101, "epoch": 3026} {"train_loss": -6.48716926574707, "global_step": 127102, "epoch": 3026} {"train_loss": -6.388146877288818, "global_step": 127103, "epoch": 3026} {"train_loss": -6.60784387588501, "global_step": 127104, "epoch": 3026} {"train_loss": -6.431818962097168, "global_step": 127105, "epoch": 3026} {"train_loss": -6.530016899108887, "global_step": 127106, "epoch": 3026} {"train_loss": -6.569705009460449, "global_step": 127107, "epoch": 3026} {"train_loss": -6.537347316741943, "global_step": 127108, "epoch": 3026} {"train_loss": -6.593028545379639, "global_step": 127109, "epoch": 3026} {"train_loss": -6.503279685974121, "global_step": 127110, "epoch": 3026} {"train_loss": -6.606332778930664, "global_step": 127111, "epoch": 3026} {"train_loss": -6.607080936431885, "global_step": 127112, "epoch": 3026} {"train_loss": -6.631682395935059, "global_step": 127113, "epoch": 3026} {"train_loss": -6.611995697021484, "global_step": 127114, "epoch": 3026} {"train_loss": -6.666563034057617, "global_step": 127115, "epoch": 3026} {"train_loss": -6.642948627471924, "global_step": 127116, "epoch": 3026} {"train_loss": -6.641176700592041, "global_step": 127117, "epoch": 3026} {"train_loss": -6.67606258392334, "global_step": 127118, "epoch": 3026} {"train_loss": -6.6578850746154785, "global_step": 127119, "epoch": 3026} {"train_loss": -6.7326979637146, "global_step": 127120, "epoch": 3026} {"train_loss": -6.570523738861084, "global_step": 127121, "epoch": 3026} {"train_loss": -6.7493391036987305, "global_step": 127122, "epoch": 3026} {"train_loss": -6.611069679260254, "global_step": 127123, "epoch": 3026} {"train_loss": -6.597438812255859, "global_step": 127124, "epoch": 3026} {"train_loss": -6.700045585632324, "global_step": 127125, "epoch": 3026} {"train_loss": -6.587966442108154, "global_step": 127126, "epoch": 3026} {"train_loss": -6.625444412231445, "global_step": 127127, "epoch": 3026} {"train_loss": -6.647963523864746, "global_step": 127128, "epoch": 3026} {"train_loss": -6.550402641296387, "global_step": 127129, "epoch": 3026} {"train_loss": -6.664616107940674, "global_step": 127130, "epoch": 3026} {"train_loss": -6.635409355163574, "global_step": 127131, "epoch": 3026} {"train_loss": -6.70110559463501, "global_step": 127132, "epoch": 3026} {"train_loss": -6.588566064834595, "global_step": 127133, "epoch": 3026, "val_loss": 66131.3984375} {"train_loss": -6.534985542297363, "global_step": 127134, "epoch": 3027} {"train_loss": -6.572734832763672, "global_step": 127135, "epoch": 3027} {"train_loss": -6.74520206451416, "global_step": 127136, "epoch": 3027} {"train_loss": -6.386776924133301, "global_step": 127137, "epoch": 3027} {"train_loss": -6.647546768188477, "global_step": 127138, "epoch": 3027} {"train_loss": -6.587521076202393, "global_step": 127139, "epoch": 3027} {"train_loss": -6.727171897888184, "global_step": 127140, "epoch": 3027} {"train_loss": -6.7173638343811035, "global_step": 127141, "epoch": 3027} {"train_loss": -6.713456153869629, "global_step": 127142, "epoch": 3027} {"train_loss": -6.643248081207275, "global_step": 127143, "epoch": 3027} {"train_loss": -6.560031890869141, "global_step": 127144, "epoch": 3027} {"train_loss": -6.59315824508667, "global_step": 127145, "epoch": 3027} {"train_loss": -6.749475479125977, "global_step": 127146, "epoch": 3027} {"train_loss": -6.668164253234863, "global_step": 127147, "epoch": 3027} {"train_loss": -6.661364555358887, "global_step": 127148, "epoch": 3027} {"train_loss": -6.642950057983398, "global_step": 127149, "epoch": 3027} {"train_loss": -6.628772735595703, "global_step": 127150, "epoch": 3027} {"train_loss": -6.613560676574707, "global_step": 127151, "epoch": 3027} {"train_loss": -6.737026214599609, "global_step": 127152, "epoch": 3027} {"train_loss": -6.51967716217041, "global_step": 127153, "epoch": 3027} {"train_loss": -6.764224052429199, "global_step": 127154, "epoch": 3027} {"train_loss": -6.657043933868408, "global_step": 127155, "epoch": 3027} {"train_loss": -6.636395454406738, "global_step": 127156, "epoch": 3027} {"train_loss": -6.633935928344727, "global_step": 127157, "epoch": 3027} {"train_loss": -6.6363301277160645, "global_step": 127158, "epoch": 3027} {"train_loss": -6.539366722106934, "global_step": 127159, "epoch": 3027} {"train_loss": -6.539680480957031, "global_step": 127160, "epoch": 3027} {"train_loss": -6.637105464935303, "global_step": 127161, "epoch": 3027} {"train_loss": -6.5182576179504395, "global_step": 127162, "epoch": 3027} {"train_loss": -6.715847969055176, "global_step": 127163, "epoch": 3027} {"train_loss": -6.713963031768799, "global_step": 127164, "epoch": 3027} {"train_loss": -6.683508396148682, "global_step": 127165, "epoch": 3027} {"train_loss": -6.655200958251953, "global_step": 127166, "epoch": 3027} {"train_loss": -6.683269500732422, "global_step": 127167, "epoch": 3027} {"train_loss": -6.686577320098877, "global_step": 127168, "epoch": 3027} {"train_loss": -6.704431056976318, "global_step": 127169, "epoch": 3027} {"train_loss": -6.535792350769043, "global_step": 127170, "epoch": 3027} {"train_loss": -6.505714416503906, "global_step": 127171, "epoch": 3027} {"train_loss": -6.681408882141113, "global_step": 127172, "epoch": 3027} {"train_loss": -6.608057022094727, "global_step": 127173, "epoch": 3027} {"train_loss": -6.618472099304199, "global_step": 127174, "epoch": 3027} {"train_loss": -6.634374720709665, "global_step": 127175, "epoch": 3027, "val_loss": 66071.4921875} {"train_loss": -6.546547889709473, "global_step": 127176, "epoch": 3028} {"train_loss": -6.740427017211914, "global_step": 127177, "epoch": 3028} {"train_loss": -6.700979232788086, "global_step": 127178, "epoch": 3028} {"train_loss": -6.72416877746582, "global_step": 127179, "epoch": 3028} {"train_loss": -6.716522216796875, "global_step": 127180, "epoch": 3028} {"train_loss": -6.664958953857422, "global_step": 127181, "epoch": 3028} {"train_loss": -6.688730716705322, "global_step": 127182, "epoch": 3028} {"train_loss": -6.564467430114746, "global_step": 127183, "epoch": 3028} {"train_loss": -6.803187370300293, "global_step": 127184, "epoch": 3028} {"train_loss": -6.699638366699219, "global_step": 127185, "epoch": 3028} {"train_loss": -6.642740249633789, "global_step": 127186, "epoch": 3028} {"train_loss": -6.680091857910156, "global_step": 127187, "epoch": 3028} {"train_loss": -6.718854904174805, "global_step": 127188, "epoch": 3028} {"train_loss": -6.699402809143066, "global_step": 127189, "epoch": 3028} {"train_loss": -6.717554569244385, "global_step": 127190, "epoch": 3028} {"train_loss": -6.61358642578125, "global_step": 127191, "epoch": 3028} {"train_loss": -6.679178237915039, "global_step": 127192, "epoch": 3028} {"train_loss": -6.644515037536621, "global_step": 127193, "epoch": 3028} {"train_loss": -6.593196868896484, "global_step": 127194, "epoch": 3028} {"train_loss": -6.6791815757751465, "global_step": 127195, "epoch": 3028} {"train_loss": -6.57354211807251, "global_step": 127196, "epoch": 3028} {"train_loss": -6.709846019744873, "global_step": 127197, "epoch": 3028} {"train_loss": -6.618756294250488, "global_step": 127198, "epoch": 3028} {"train_loss": -6.640295028686523, "global_step": 127199, "epoch": 3028} {"train_loss": -6.68339729309082, "global_step": 127200, "epoch": 3028} {"train_loss": -6.573744297027588, "global_step": 127201, "epoch": 3028} {"train_loss": -6.650824546813965, "global_step": 127202, "epoch": 3028} {"train_loss": -6.655765533447266, "global_step": 127203, "epoch": 3028} {"train_loss": -6.716586112976074, "global_step": 127204, "epoch": 3028} {"train_loss": -6.649593353271484, "global_step": 127205, "epoch": 3028} {"train_loss": -6.728273868560791, "global_step": 127206, "epoch": 3028} {"train_loss": -6.490004539489746, "global_step": 127207, "epoch": 3028} {"train_loss": -6.641861915588379, "global_step": 127208, "epoch": 3028} {"train_loss": -6.624944686889648, "global_step": 127209, "epoch": 3028} {"train_loss": -6.522136688232422, "global_step": 127210, "epoch": 3028} {"train_loss": -6.7105607986450195, "global_step": 127211, "epoch": 3028} {"train_loss": -6.610831260681152, "global_step": 127212, "epoch": 3028} {"train_loss": -6.583220481872559, "global_step": 127213, "epoch": 3028} {"train_loss": -6.723514080047607, "global_step": 127214, "epoch": 3028} {"train_loss": -6.683906555175781, "global_step": 127215, "epoch": 3028} {"train_loss": -6.662295341491699, "global_step": 127216, "epoch": 3028} {"train_loss": -6.659348101842971, "global_step": 127217, "epoch": 3028, "val_loss": 66301.2421875} {"train_loss": -6.710638999938965, "global_step": 127218, "epoch": 3029} {"train_loss": -6.6120829582214355, "global_step": 127219, "epoch": 3029} {"train_loss": -6.748991012573242, "global_step": 127220, "epoch": 3029} {"train_loss": -6.633305072784424, "global_step": 127221, "epoch": 3029} {"train_loss": -6.572875499725342, "global_step": 127222, "epoch": 3029} {"train_loss": -6.692429542541504, "global_step": 127223, "epoch": 3029} {"train_loss": -6.807195663452148, "global_step": 127224, "epoch": 3029} {"train_loss": -6.646486282348633, "global_step": 127225, "epoch": 3029} {"train_loss": -6.740506172180176, "global_step": 127226, "epoch": 3029} {"train_loss": -6.667827606201172, "global_step": 127227, "epoch": 3029} {"train_loss": -6.635501384735107, "global_step": 127228, "epoch": 3029} {"train_loss": -6.62091588973999, "global_step": 127229, "epoch": 3029} {"train_loss": -6.694674968719482, "global_step": 127230, "epoch": 3029} {"train_loss": -6.626859664916992, "global_step": 127231, "epoch": 3029} {"train_loss": -6.608308792114258, "global_step": 127232, "epoch": 3029} {"train_loss": -6.598711013793945, "global_step": 127233, "epoch": 3029} {"train_loss": -6.721105575561523, "global_step": 127234, "epoch": 3029} {"train_loss": -6.508157253265381, "global_step": 127235, "epoch": 3029} {"train_loss": -6.566701889038086, "global_step": 127236, "epoch": 3029} {"train_loss": -6.562769889831543, "global_step": 127237, "epoch": 3029} {"train_loss": -6.432648658752441, "global_step": 127238, "epoch": 3029} {"train_loss": -6.523317337036133, "global_step": 127239, "epoch": 3029} {"train_loss": -6.5359110832214355, "global_step": 127240, "epoch": 3029} {"train_loss": -6.527178764343262, "global_step": 127241, "epoch": 3029} {"train_loss": -6.631466865539551, "global_step": 127242, "epoch": 3029} {"train_loss": -6.458718299865723, "global_step": 127243, "epoch": 3029} {"train_loss": -6.623058319091797, "global_step": 127244, "epoch": 3029} {"train_loss": -6.429581165313721, "global_step": 127245, "epoch": 3029} {"train_loss": -6.557137489318848, "global_step": 127246, "epoch": 3029} {"train_loss": -6.673678874969482, "global_step": 127247, "epoch": 3029} {"train_loss": -6.504404067993164, "global_step": 127248, "epoch": 3029} {"train_loss": -6.516449928283691, "global_step": 127249, "epoch": 3029} {"train_loss": -6.496368408203125, "global_step": 127250, "epoch": 3029} {"train_loss": -6.589822769165039, "global_step": 127251, "epoch": 3029} {"train_loss": -6.545037746429443, "global_step": 127252, "epoch": 3029} {"train_loss": -6.602370262145996, "global_step": 127253, "epoch": 3029} {"train_loss": -6.632279872894287, "global_step": 127254, "epoch": 3029} {"train_loss": -6.614015579223633, "global_step": 127255, "epoch": 3029} {"train_loss": -6.615649223327637, "global_step": 127256, "epoch": 3029} {"train_loss": -6.664786338806152, "global_step": 127257, "epoch": 3029} {"train_loss": -6.577561378479004, "global_step": 127258, "epoch": 3029} {"train_loss": -6.603062266395206, "global_step": 127259, "epoch": 3029, "val_loss": 66361.796875} {"train_loss": -6.692450523376465, "global_step": 127260, "epoch": 3030} {"train_loss": -6.7274580001831055, "global_step": 127261, "epoch": 3030} {"train_loss": -6.622983455657959, "global_step": 127262, "epoch": 3030} {"train_loss": -6.510102272033691, "global_step": 127263, "epoch": 3030} {"train_loss": -6.67267370223999, "global_step": 127264, "epoch": 3030} {"train_loss": -6.626630783081055, "global_step": 127265, "epoch": 3030} {"train_loss": -6.561715126037598, "global_step": 127266, "epoch": 3030} {"train_loss": -6.648514747619629, "global_step": 127267, "epoch": 3030} {"train_loss": -6.678749084472656, "global_step": 127268, "epoch": 3030} {"train_loss": -6.701642990112305, "global_step": 127269, "epoch": 3030} {"train_loss": -6.5714569091796875, "global_step": 127270, "epoch": 3030} {"train_loss": -6.670907974243164, "global_step": 127271, "epoch": 3030} {"train_loss": -6.592870712280273, "global_step": 127272, "epoch": 3030} {"train_loss": -6.701423645019531, "global_step": 127273, "epoch": 3030} {"train_loss": -6.657768249511719, "global_step": 127274, "epoch": 3030} {"train_loss": -6.708306312561035, "global_step": 127275, "epoch": 3030} {"train_loss": -6.623929977416992, "global_step": 127276, "epoch": 3030} {"train_loss": -6.74971866607666, "global_step": 127277, "epoch": 3030} {"train_loss": -6.633452415466309, "global_step": 127278, "epoch": 3030} {"train_loss": -6.598423004150391, "global_step": 127279, "epoch": 3030} {"train_loss": -6.763121128082275, "global_step": 127280, "epoch": 3030} {"train_loss": -6.5254411697387695, "global_step": 127281, "epoch": 3030} {"train_loss": -6.830019474029541, "global_step": 127282, "epoch": 3030} {"train_loss": -6.773055076599121, "global_step": 127283, "epoch": 3030} {"train_loss": -6.603304386138916, "global_step": 127284, "epoch": 3030} {"train_loss": -6.671967506408691, "global_step": 127285, "epoch": 3030} {"train_loss": -6.555673599243164, "global_step": 127286, "epoch": 3030} {"train_loss": -6.642901420593262, "global_step": 127287, "epoch": 3030} {"train_loss": -6.668948650360107, "global_step": 127288, "epoch": 3030} {"train_loss": -6.6371002197265625, "global_step": 127289, "epoch": 3030} {"train_loss": -6.671923637390137, "global_step": 127290, "epoch": 3030} {"train_loss": -6.730786323547363, "global_step": 127291, "epoch": 3030} {"train_loss": -6.596187114715576, "global_step": 127292, "epoch": 3030} {"train_loss": -6.489973068237305, "global_step": 127293, "epoch": 3030} {"train_loss": -6.692648887634277, "global_step": 127294, "epoch": 3030} {"train_loss": -6.637969970703125, "global_step": 127295, "epoch": 3030} {"train_loss": -6.649975776672363, "global_step": 127296, "epoch": 3030} {"train_loss": -6.566868305206299, "global_step": 127297, "epoch": 3030} {"train_loss": -6.563488006591797, "global_step": 127298, "epoch": 3030} {"train_loss": -6.645208835601807, "global_step": 127299, "epoch": 3030} {"train_loss": -6.663661956787109, "global_step": 127300, "epoch": 3030} {"train_loss": -6.645979540688651, "global_step": 127301, "epoch": 3030, "val_loss": 66165.1875} {"train_loss": -6.551030158996582, "global_step": 127302, "epoch": 3031} {"train_loss": -6.546279430389404, "global_step": 127303, "epoch": 3031} {"train_loss": -6.60198450088501, "global_step": 127304, "epoch": 3031} {"train_loss": -6.617253303527832, "global_step": 127305, "epoch": 3031} {"train_loss": -6.606282711029053, "global_step": 127306, "epoch": 3031} {"train_loss": -6.577430725097656, "global_step": 127307, "epoch": 3031} {"train_loss": -6.575162410736084, "global_step": 127308, "epoch": 3031} {"train_loss": -6.727053165435791, "global_step": 127309, "epoch": 3031} {"train_loss": -6.573716163635254, "global_step": 127310, "epoch": 3031} {"train_loss": -6.66630744934082, "global_step": 127311, "epoch": 3031} {"train_loss": -6.631549835205078, "global_step": 127312, "epoch": 3031} {"train_loss": -6.515225410461426, "global_step": 127313, "epoch": 3031} {"train_loss": -6.625791549682617, "global_step": 127314, "epoch": 3031} {"train_loss": -6.651506423950195, "global_step": 127315, "epoch": 3031} {"train_loss": -6.638587951660156, "global_step": 127316, "epoch": 3031} {"train_loss": -6.5539350509643555, "global_step": 127317, "epoch": 3031} {"train_loss": -6.654726982116699, "global_step": 127318, "epoch": 3031} {"train_loss": -6.707890510559082, "global_step": 127319, "epoch": 3031} {"train_loss": -6.74663782119751, "global_step": 127320, "epoch": 3031} {"train_loss": -6.63367223739624, "global_step": 127321, "epoch": 3031} {"train_loss": -6.623054504394531, "global_step": 127322, "epoch": 3031} {"train_loss": -6.607269287109375, "global_step": 127323, "epoch": 3031} {"train_loss": -6.5850019454956055, "global_step": 127324, "epoch": 3031} {"train_loss": -6.599248886108398, "global_step": 127325, "epoch": 3031} {"train_loss": -6.723642349243164, "global_step": 127326, "epoch": 3031} {"train_loss": -6.569241523742676, "global_step": 127327, "epoch": 3031} {"train_loss": -6.501463890075684, "global_step": 127328, "epoch": 3031} {"train_loss": -6.71411657333374, "global_step": 127329, "epoch": 3031} {"train_loss": -6.521162509918213, "global_step": 127330, "epoch": 3031} {"train_loss": -6.558938026428223, "global_step": 127331, "epoch": 3031} {"train_loss": -6.674315452575684, "global_step": 127332, "epoch": 3031} {"train_loss": -6.511545181274414, "global_step": 127333, "epoch": 3031} {"train_loss": -6.666887283325195, "global_step": 127334, "epoch": 3031} {"train_loss": -6.605181694030762, "global_step": 127335, "epoch": 3031} {"train_loss": -6.684887886047363, "global_step": 127336, "epoch": 3031} {"train_loss": -6.690380573272705, "global_step": 127337, "epoch": 3031} {"train_loss": -6.5941314697265625, "global_step": 127338, "epoch": 3031} {"train_loss": -6.613387107849121, "global_step": 127339, "epoch": 3031} {"train_loss": -6.692489147186279, "global_step": 127340, "epoch": 3031} {"train_loss": -6.667949676513672, "global_step": 127341, "epoch": 3031} {"train_loss": -6.745395660400391, "global_step": 127342, "epoch": 3031} {"train_loss": -6.6242376282101585, "global_step": 127343, "epoch": 3031, "val_loss": 66319.2578125} {"train_loss": -6.698060035705566, "global_step": 127344, "epoch": 3032} {"train_loss": -6.630746841430664, "global_step": 127345, "epoch": 3032} {"train_loss": -6.694911003112793, "global_step": 127346, "epoch": 3032} {"train_loss": -6.530149459838867, "global_step": 127347, "epoch": 3032} {"train_loss": -6.631303787231445, "global_step": 127348, "epoch": 3032} {"train_loss": -6.729816436767578, "global_step": 127349, "epoch": 3032} {"train_loss": -6.601503372192383, "global_step": 127350, "epoch": 3032} {"train_loss": -6.591617584228516, "global_step": 127351, "epoch": 3032} {"train_loss": -6.589211463928223, "global_step": 127352, "epoch": 3032} {"train_loss": -6.640604019165039, "global_step": 127353, "epoch": 3032} {"train_loss": -6.717859745025635, "global_step": 127354, "epoch": 3032} {"train_loss": -6.54302453994751, "global_step": 127355, "epoch": 3032} {"train_loss": -6.584847450256348, "global_step": 127356, "epoch": 3032} {"train_loss": -6.684775352478027, "global_step": 127357, "epoch": 3032} {"train_loss": -6.50911808013916, "global_step": 127358, "epoch": 3032} {"train_loss": -6.550981521606445, "global_step": 127359, "epoch": 3032} {"train_loss": -6.534735679626465, "global_step": 127360, "epoch": 3032} {"train_loss": -6.557791709899902, "global_step": 127361, "epoch": 3032} {"train_loss": -6.601533889770508, "global_step": 127362, "epoch": 3032} {"train_loss": -6.541673183441162, "global_step": 127363, "epoch": 3032} {"train_loss": -6.454943656921387, "global_step": 127364, "epoch": 3032} {"train_loss": -6.584717750549316, "global_step": 127365, "epoch": 3032} {"train_loss": -6.498561859130859, "global_step": 127366, "epoch": 3032} {"train_loss": -6.571506500244141, "global_step": 127367, "epoch": 3032} {"train_loss": -6.500136375427246, "global_step": 127368, "epoch": 3032} {"train_loss": -6.554039478302002, "global_step": 127369, "epoch": 3032} {"train_loss": -6.474448204040527, "global_step": 127370, "epoch": 3032} {"train_loss": -6.530148029327393, "global_step": 127371, "epoch": 3032} {"train_loss": -6.424063682556152, "global_step": 127372, "epoch": 3032} {"train_loss": -6.55449104309082, "global_step": 127373, "epoch": 3032} {"train_loss": -6.5425567626953125, "global_step": 127374, "epoch": 3032} {"train_loss": -6.629400253295898, "global_step": 127375, "epoch": 3032} {"train_loss": -6.548927307128906, "global_step": 127376, "epoch": 3032} {"train_loss": -6.557397365570068, "global_step": 127377, "epoch": 3032} {"train_loss": -6.667880535125732, "global_step": 127378, "epoch": 3032} {"train_loss": -6.625689506530762, "global_step": 127379, "epoch": 3032} {"train_loss": -6.473775386810303, "global_step": 127380, "epoch": 3032} {"train_loss": -6.590575218200684, "global_step": 127381, "epoch": 3032} {"train_loss": -6.516995429992676, "global_step": 127382, "epoch": 3032} {"train_loss": -6.70897102355957, "global_step": 127383, "epoch": 3032} {"train_loss": -6.58671760559082, "global_step": 127384, "epoch": 3032} {"train_loss": -6.582441818146479, "global_step": 127385, "epoch": 3032, "val_loss": 66262.1640625} {"train_loss": -6.587745666503906, "global_step": 127386, "epoch": 3033} {"train_loss": -6.676461696624756, "global_step": 127387, "epoch": 3033} {"train_loss": -6.574764728546143, "global_step": 127388, "epoch": 3033} {"train_loss": -6.470826625823975, "global_step": 127389, "epoch": 3033} {"train_loss": -6.625041961669922, "global_step": 127390, "epoch": 3033} {"train_loss": -6.612665176391602, "global_step": 127391, "epoch": 3033} {"train_loss": -6.409829616546631, "global_step": 127392, "epoch": 3033} {"train_loss": -6.616094589233398, "global_step": 127393, "epoch": 3033} {"train_loss": -6.583038330078125, "global_step": 127394, "epoch": 3033} {"train_loss": -6.663567066192627, "global_step": 127395, "epoch": 3033} {"train_loss": -6.591331958770752, "global_step": 127396, "epoch": 3033} {"train_loss": -6.559961318969727, "global_step": 127397, "epoch": 3033} {"train_loss": -6.6788177490234375, "global_step": 127398, "epoch": 3033} {"train_loss": -6.591296195983887, "global_step": 127399, "epoch": 3033} {"train_loss": -6.618106842041016, "global_step": 127400, "epoch": 3033} {"train_loss": -6.557651519775391, "global_step": 127401, "epoch": 3033} {"train_loss": -6.506870746612549, "global_step": 127402, "epoch": 3033} {"train_loss": -6.646981239318848, "global_step": 127403, "epoch": 3033} {"train_loss": -6.491596698760986, "global_step": 127404, "epoch": 3033} {"train_loss": -6.601264953613281, "global_step": 127405, "epoch": 3033} {"train_loss": -6.4401984214782715, "global_step": 127406, "epoch": 3033} {"train_loss": -6.494131088256836, "global_step": 127407, "epoch": 3033} {"train_loss": -6.528282165527344, "global_step": 127408, "epoch": 3033} {"train_loss": -6.542214393615723, "global_step": 127409, "epoch": 3033} {"train_loss": -6.625357627868652, "global_step": 127410, "epoch": 3033} {"train_loss": -6.521426200866699, "global_step": 127411, "epoch": 3033} {"train_loss": -6.547490119934082, "global_step": 127412, "epoch": 3033} {"train_loss": -6.481168270111084, "global_step": 127413, "epoch": 3033} {"train_loss": -6.539968490600586, "global_step": 127414, "epoch": 3033} {"train_loss": -6.465668678283691, "global_step": 127415, "epoch": 3033} {"train_loss": -6.619497299194336, "global_step": 127416, "epoch": 3033} {"train_loss": -6.578943252563477, "global_step": 127417, "epoch": 3033} {"train_loss": -6.636869430541992, "global_step": 127418, "epoch": 3033} {"train_loss": -6.581547260284424, "global_step": 127419, "epoch": 3033} {"train_loss": -6.60267448425293, "global_step": 127420, "epoch": 3033} {"train_loss": -6.728816032409668, "global_step": 127421, "epoch": 3033} {"train_loss": -6.6186842918396, "global_step": 127422, "epoch": 3033} {"train_loss": -6.502521991729736, "global_step": 127423, "epoch": 3033} {"train_loss": -6.601749897003174, "global_step": 127424, "epoch": 3033} {"train_loss": -6.63314962387085, "global_step": 127425, "epoch": 3033} {"train_loss": -6.764039993286133, "global_step": 127426, "epoch": 3033} {"train_loss": -6.579530534290132, "global_step": 127427, "epoch": 3033, "val_loss": 66195.484375} {"train_loss": -6.73190450668335, "global_step": 127428, "epoch": 3034} {"train_loss": -6.805062294006348, "global_step": 127429, "epoch": 3034} {"train_loss": -6.680404186248779, "global_step": 127430, "epoch": 3034} {"train_loss": -6.650748252868652, "global_step": 127431, "epoch": 3034} {"train_loss": -6.6630682945251465, "global_step": 127432, "epoch": 3034} {"train_loss": -6.794824600219727, "global_step": 127433, "epoch": 3034} {"train_loss": -6.670804977416992, "global_step": 127434, "epoch": 3034} {"train_loss": -6.682228088378906, "global_step": 127435, "epoch": 3034} {"train_loss": -6.489896774291992, "global_step": 127436, "epoch": 3034} {"train_loss": -6.599067687988281, "global_step": 127437, "epoch": 3034} {"train_loss": -6.7082109451293945, "global_step": 127438, "epoch": 3034} {"train_loss": -6.72175407409668, "global_step": 127439, "epoch": 3034} {"train_loss": -6.7068095207214355, "global_step": 127440, "epoch": 3034} {"train_loss": -6.723310470581055, "global_step": 127441, "epoch": 3034} {"train_loss": -6.4140825271606445, "global_step": 127442, "epoch": 3034} {"train_loss": -6.5937957763671875, "global_step": 127443, "epoch": 3034} {"train_loss": -6.754473686218262, "global_step": 127444, "epoch": 3034} {"train_loss": -6.635369300842285, "global_step": 127445, "epoch": 3034} {"train_loss": -6.593909740447998, "global_step": 127446, "epoch": 3034} {"train_loss": -6.679766654968262, "global_step": 127447, "epoch": 3034} {"train_loss": -6.720727443695068, "global_step": 127448, "epoch": 3034} {"train_loss": -6.614819526672363, "global_step": 127449, "epoch": 3034} {"train_loss": -6.667928695678711, "global_step": 127450, "epoch": 3034} {"train_loss": -6.673277378082275, "global_step": 127451, "epoch": 3034} {"train_loss": -6.630934715270996, "global_step": 127452, "epoch": 3034} {"train_loss": -6.803837776184082, "global_step": 127453, "epoch": 3034} {"train_loss": -6.616347312927246, "global_step": 127454, "epoch": 3034} {"train_loss": -6.533865928649902, "global_step": 127455, "epoch": 3034} {"train_loss": -6.711304664611816, "global_step": 127456, "epoch": 3034} {"train_loss": -6.696371555328369, "global_step": 127457, "epoch": 3034} {"train_loss": -6.67508602142334, "global_step": 127458, "epoch": 3034} {"train_loss": -6.623729228973389, "global_step": 127459, "epoch": 3034} {"train_loss": -6.67106294631958, "global_step": 127460, "epoch": 3034} {"train_loss": -6.673724174499512, "global_step": 127461, "epoch": 3034} {"train_loss": -6.760243892669678, "global_step": 127462, "epoch": 3034} {"train_loss": -6.709125518798828, "global_step": 127463, "epoch": 3034} {"train_loss": -6.776914119720459, "global_step": 127464, "epoch": 3034} {"train_loss": -6.674722671508789, "global_step": 127465, "epoch": 3034} {"train_loss": -6.7349534034729, "global_step": 127466, "epoch": 3034} {"train_loss": -6.753843784332275, "global_step": 127467, "epoch": 3034} {"train_loss": -6.733280658721924, "global_step": 127468, "epoch": 3034} {"train_loss": -6.673328286125546, "global_step": 127469, "epoch": 3034, "val_loss": 66167.6875} {"train_loss": -6.647914886474609, "global_step": 127470, "epoch": 3035} {"train_loss": -6.594710350036621, "global_step": 127471, "epoch": 3035} {"train_loss": -6.658522129058838, "global_step": 127472, "epoch": 3035} {"train_loss": -6.714966773986816, "global_step": 127473, "epoch": 3035} {"train_loss": -6.684545516967773, "global_step": 127474, "epoch": 3035} {"train_loss": -6.723972320556641, "global_step": 127475, "epoch": 3035} {"train_loss": -6.730823993682861, "global_step": 127476, "epoch": 3035} {"train_loss": -6.663143634796143, "global_step": 127477, "epoch": 3035} {"train_loss": -6.69856071472168, "global_step": 127478, "epoch": 3035} {"train_loss": -6.638031482696533, "global_step": 127479, "epoch": 3035} {"train_loss": -6.737333297729492, "global_step": 127480, "epoch": 3035} {"train_loss": -6.740005016326904, "global_step": 127481, "epoch": 3035} {"train_loss": -6.790620803833008, "global_step": 127482, "epoch": 3035} {"train_loss": -6.667533874511719, "global_step": 127483, "epoch": 3035} {"train_loss": -6.671010971069336, "global_step": 127484, "epoch": 3035} {"train_loss": -6.666869163513184, "global_step": 127485, "epoch": 3035} {"train_loss": -6.65592098236084, "global_step": 127486, "epoch": 3035} {"train_loss": -6.592448711395264, "global_step": 127487, "epoch": 3035} {"train_loss": -6.690864562988281, "global_step": 127488, "epoch": 3035} {"train_loss": -6.703489303588867, "global_step": 127489, "epoch": 3035} {"train_loss": -6.669614315032959, "global_step": 127490, "epoch": 3035} {"train_loss": -6.639509677886963, "global_step": 127491, "epoch": 3035} {"train_loss": -6.7133097648620605, "global_step": 127492, "epoch": 3035} {"train_loss": -6.652320861816406, "global_step": 127493, "epoch": 3035} {"train_loss": -6.642427444458008, "global_step": 127494, "epoch": 3035} {"train_loss": -6.752350330352783, "global_step": 127495, "epoch": 3035} {"train_loss": -6.64683723449707, "global_step": 127496, "epoch": 3035} {"train_loss": -6.535107612609863, "global_step": 127497, "epoch": 3035} {"train_loss": -6.706522464752197, "global_step": 127498, "epoch": 3035} {"train_loss": -6.614480972290039, "global_step": 127499, "epoch": 3035} {"train_loss": -6.5148515701293945, "global_step": 127500, "epoch": 3035} {"train_loss": -6.676318168640137, "global_step": 127501, "epoch": 3035} {"train_loss": -6.621389865875244, "global_step": 127502, "epoch": 3035} {"train_loss": -6.700760364532471, "global_step": 127503, "epoch": 3035} {"train_loss": -6.56456995010376, "global_step": 127504, "epoch": 3035} {"train_loss": -6.580280303955078, "global_step": 127505, "epoch": 3035} {"train_loss": -6.601529598236084, "global_step": 127506, "epoch": 3035} {"train_loss": -6.504190921783447, "global_step": 127507, "epoch": 3035} {"train_loss": -6.576231956481934, "global_step": 127508, "epoch": 3035} {"train_loss": -6.66392707824707, "global_step": 127509, "epoch": 3035} {"train_loss": -6.622496604919434, "global_step": 127510, "epoch": 3035} {"train_loss": -6.656694446291242, "global_step": 127511, "epoch": 3035, "val_loss": 66319.3359375} {"train_loss": -6.6584367752075195, "global_step": 127512, "epoch": 3036} {"train_loss": -6.532814979553223, "global_step": 127513, "epoch": 3036} {"train_loss": -6.672901153564453, "global_step": 127514, "epoch": 3036} {"train_loss": -6.604917049407959, "global_step": 127515, "epoch": 3036} {"train_loss": -6.698025703430176, "global_step": 127516, "epoch": 3036} {"train_loss": -6.628226280212402, "global_step": 127517, "epoch": 3036} {"train_loss": -6.608919143676758, "global_step": 127518, "epoch": 3036} {"train_loss": -6.705334663391113, "global_step": 127519, "epoch": 3036} {"train_loss": -6.72297477722168, "global_step": 127520, "epoch": 3036} {"train_loss": -6.573434352874756, "global_step": 127521, "epoch": 3036} {"train_loss": -6.669533729553223, "global_step": 127522, "epoch": 3036} {"train_loss": -6.6343817710876465, "global_step": 127523, "epoch": 3036} {"train_loss": -6.726367950439453, "global_step": 127524, "epoch": 3036} {"train_loss": -6.692209243774414, "global_step": 127525, "epoch": 3036} {"train_loss": -6.643545627593994, "global_step": 127526, "epoch": 3036} {"train_loss": -6.712618827819824, "global_step": 127527, "epoch": 3036} {"train_loss": -6.664390563964844, "global_step": 127528, "epoch": 3036} {"train_loss": -6.694404602050781, "global_step": 127529, "epoch": 3036} {"train_loss": -6.68597412109375, "global_step": 127530, "epoch": 3036} {"train_loss": -6.712775230407715, "global_step": 127531, "epoch": 3036} {"train_loss": -6.703042984008789, "global_step": 127532, "epoch": 3036} {"train_loss": -6.710988998413086, "global_step": 127533, "epoch": 3036} {"train_loss": -6.703075408935547, "global_step": 127534, "epoch": 3036} {"train_loss": -6.634364128112793, "global_step": 127535, "epoch": 3036} {"train_loss": -6.632408142089844, "global_step": 127536, "epoch": 3036} {"train_loss": -6.547560691833496, "global_step": 127537, "epoch": 3036} {"train_loss": -6.5818071365356445, "global_step": 127538, "epoch": 3036} {"train_loss": -6.59976863861084, "global_step": 127539, "epoch": 3036} {"train_loss": -6.633306503295898, "global_step": 127540, "epoch": 3036} {"train_loss": -6.6589789390563965, "global_step": 127541, "epoch": 3036} {"train_loss": -6.494388580322266, "global_step": 127542, "epoch": 3036} {"train_loss": -6.614273548126221, "global_step": 127543, "epoch": 3036} {"train_loss": -6.652769088745117, "global_step": 127544, "epoch": 3036} {"train_loss": -6.523036956787109, "global_step": 127545, "epoch": 3036} {"train_loss": -6.573495864868164, "global_step": 127546, "epoch": 3036} {"train_loss": -6.6909260749816895, "global_step": 127547, "epoch": 3036} {"train_loss": -6.642380714416504, "global_step": 127548, "epoch": 3036} {"train_loss": -6.551796913146973, "global_step": 127549, "epoch": 3036} {"train_loss": -6.628247261047363, "global_step": 127550, "epoch": 3036} {"train_loss": -6.572936058044434, "global_step": 127551, "epoch": 3036} {"train_loss": -6.730568885803223, "global_step": 127552, "epoch": 3036} {"train_loss": -6.638112760725475, "global_step": 127553, "epoch": 3036, "val_loss": 66183.4375} {"train_loss": -6.544788360595703, "global_step": 127554, "epoch": 3037} {"train_loss": -6.603682994842529, "global_step": 127555, "epoch": 3037} {"train_loss": -6.60063362121582, "global_step": 127556, "epoch": 3037} {"train_loss": -6.676412582397461, "global_step": 127557, "epoch": 3037} {"train_loss": -6.431773662567139, "global_step": 127558, "epoch": 3037} {"train_loss": -6.559945583343506, "global_step": 127559, "epoch": 3037} {"train_loss": -6.520387649536133, "global_step": 127560, "epoch": 3037} {"train_loss": -6.579380035400391, "global_step": 127561, "epoch": 3037} {"train_loss": -6.603695869445801, "global_step": 127562, "epoch": 3037} {"train_loss": -6.409082412719727, "global_step": 127563, "epoch": 3037} {"train_loss": -6.502363681793213, "global_step": 127564, "epoch": 3037} {"train_loss": -6.404391288757324, "global_step": 127565, "epoch": 3037} {"train_loss": -6.560096740722656, "global_step": 127566, "epoch": 3037} {"train_loss": -6.400691032409668, "global_step": 127567, "epoch": 3037} {"train_loss": -6.557313919067383, "global_step": 127568, "epoch": 3037} {"train_loss": -6.509396553039551, "global_step": 127569, "epoch": 3037} {"train_loss": -6.61114501953125, "global_step": 127570, "epoch": 3037} {"train_loss": -6.496147155761719, "global_step": 127571, "epoch": 3037} {"train_loss": -6.559435844421387, "global_step": 127572, "epoch": 3037} {"train_loss": -6.513042449951172, "global_step": 127573, "epoch": 3037} {"train_loss": -6.545801639556885, "global_step": 127574, "epoch": 3037} {"train_loss": -6.53936767578125, "global_step": 127575, "epoch": 3037} {"train_loss": -6.500124931335449, "global_step": 127576, "epoch": 3037} {"train_loss": -6.621813774108887, "global_step": 127577, "epoch": 3037} {"train_loss": -6.495203971862793, "global_step": 127578, "epoch": 3037} {"train_loss": -6.608112335205078, "global_step": 127579, "epoch": 3037} {"train_loss": -6.550165176391602, "global_step": 127580, "epoch": 3037} {"train_loss": -6.387965202331543, "global_step": 127581, "epoch": 3037} {"train_loss": -6.4656171798706055, "global_step": 127582, "epoch": 3037} {"train_loss": -6.564126014709473, "global_step": 127583, "epoch": 3037} {"train_loss": -6.597288131713867, "global_step": 127584, "epoch": 3037} {"train_loss": -6.586447715759277, "global_step": 127585, "epoch": 3037} {"train_loss": -6.670248985290527, "global_step": 127586, "epoch": 3037} {"train_loss": -6.568835258483887, "global_step": 127587, "epoch": 3037} {"train_loss": -6.577210903167725, "global_step": 127588, "epoch": 3037} {"train_loss": -6.4669389724731445, "global_step": 127589, "epoch": 3037} {"train_loss": -6.732827186584473, "global_step": 127590, "epoch": 3037} {"train_loss": -6.6885833740234375, "global_step": 127591, "epoch": 3037} {"train_loss": -6.684627532958984, "global_step": 127592, "epoch": 3037} {"train_loss": -6.567286491394043, "global_step": 127593, "epoch": 3037} {"train_loss": -6.6796417236328125, "global_step": 127594, "epoch": 3037} {"train_loss": -6.558391321273077, "global_step": 127595, "epoch": 3037, "val_loss": 66363.4453125} {"train_loss": -6.638939380645752, "global_step": 127596, "epoch": 3038} {"train_loss": -6.67905330657959, "global_step": 127597, "epoch": 3038} {"train_loss": -6.610823631286621, "global_step": 127598, "epoch": 3038} {"train_loss": -6.7368035316467285, "global_step": 127599, "epoch": 3038} {"train_loss": -6.5376410484313965, "global_step": 127600, "epoch": 3038} {"train_loss": -6.641514301300049, "global_step": 127601, "epoch": 3038} {"train_loss": -6.668434143066406, "global_step": 127602, "epoch": 3038} {"train_loss": -6.579195976257324, "global_step": 127603, "epoch": 3038} {"train_loss": -6.501255989074707, "global_step": 127604, "epoch": 3038} {"train_loss": -6.745133399963379, "global_step": 127605, "epoch": 3038} {"train_loss": -6.6474175453186035, "global_step": 127606, "epoch": 3038} {"train_loss": -6.446902751922607, "global_step": 127607, "epoch": 3038} {"train_loss": -6.710919380187988, "global_step": 127608, "epoch": 3038} {"train_loss": -6.684841632843018, "global_step": 127609, "epoch": 3038} {"train_loss": -6.597067356109619, "global_step": 127610, "epoch": 3038} {"train_loss": -6.723004341125488, "global_step": 127611, "epoch": 3038} {"train_loss": -6.6038923263549805, "global_step": 127612, "epoch": 3038} {"train_loss": -6.660220146179199, "global_step": 127613, "epoch": 3038} {"train_loss": -6.7002668380737305, "global_step": 127614, "epoch": 3038} {"train_loss": -6.555520534515381, "global_step": 127615, "epoch": 3038} {"train_loss": -6.697778701782227, "global_step": 127616, "epoch": 3038} {"train_loss": -6.621090888977051, "global_step": 127617, "epoch": 3038} {"train_loss": -6.5230393409729, "global_step": 127618, "epoch": 3038} {"train_loss": -6.643584251403809, "global_step": 127619, "epoch": 3038} {"train_loss": -6.643315315246582, "global_step": 127620, "epoch": 3038} {"train_loss": -6.532870292663574, "global_step": 127621, "epoch": 3038} {"train_loss": -6.619426727294922, "global_step": 127622, "epoch": 3038} {"train_loss": -6.636205196380615, "global_step": 127623, "epoch": 3038} {"train_loss": -6.597751140594482, "global_step": 127624, "epoch": 3038} {"train_loss": -6.498752117156982, "global_step": 127625, "epoch": 3038} {"train_loss": -6.588774681091309, "global_step": 127626, "epoch": 3038} {"train_loss": -6.602388381958008, "global_step": 127627, "epoch": 3038} {"train_loss": -6.62348747253418, "global_step": 127628, "epoch": 3038} {"train_loss": -6.697906494140625, "global_step": 127629, "epoch": 3038} {"train_loss": -6.607431411743164, "global_step": 127630, "epoch": 3038} {"train_loss": -6.564004898071289, "global_step": 127631, "epoch": 3038} {"train_loss": -6.643561840057373, "global_step": 127632, "epoch": 3038} {"train_loss": -6.670330047607422, "global_step": 127633, "epoch": 3038} {"train_loss": -6.640737533569336, "global_step": 127634, "epoch": 3038} {"train_loss": -6.639836311340332, "global_step": 127635, "epoch": 3038} {"train_loss": -6.598142623901367, "global_step": 127636, "epoch": 3038} {"train_loss": -6.624398980821882, "global_step": 127637, "epoch": 3038, "val_loss": 66210.9453125} {"train_loss": -6.750723838806152, "global_step": 127638, "epoch": 3039} {"train_loss": -6.6274733543396, "global_step": 127639, "epoch": 3039} {"train_loss": -6.76316499710083, "global_step": 127640, "epoch": 3039} {"train_loss": -6.675261974334717, "global_step": 127641, "epoch": 3039} {"train_loss": -6.654522895812988, "global_step": 127642, "epoch": 3039} {"train_loss": -6.637264251708984, "global_step": 127643, "epoch": 3039} {"train_loss": -6.708605766296387, "global_step": 127644, "epoch": 3039} {"train_loss": -6.714963436126709, "global_step": 127645, "epoch": 3039} {"train_loss": -6.750942230224609, "global_step": 127646, "epoch": 3039} {"train_loss": -6.541079521179199, "global_step": 127647, "epoch": 3039} {"train_loss": -6.727660179138184, "global_step": 127648, "epoch": 3039} {"train_loss": -6.633248805999756, "global_step": 127649, "epoch": 3039} {"train_loss": -6.803693771362305, "global_step": 127650, "epoch": 3039} {"train_loss": -6.758879661560059, "global_step": 127651, "epoch": 3039} {"train_loss": -6.625004291534424, "global_step": 127652, "epoch": 3039} {"train_loss": -6.716671466827393, "global_step": 127653, "epoch": 3039} {"train_loss": -6.68414306640625, "global_step": 127654, "epoch": 3039} {"train_loss": -6.644032001495361, "global_step": 127655, "epoch": 3039} {"train_loss": -6.696588516235352, "global_step": 127656, "epoch": 3039} {"train_loss": -6.66011905670166, "global_step": 127657, "epoch": 3039} {"train_loss": -6.636172771453857, "global_step": 127658, "epoch": 3039} {"train_loss": -6.704653739929199, "global_step": 127659, "epoch": 3039} {"train_loss": -6.808537483215332, "global_step": 127660, "epoch": 3039} {"train_loss": -6.6866655349731445, "global_step": 127661, "epoch": 3039} {"train_loss": -6.554234504699707, "global_step": 127662, "epoch": 3039} {"train_loss": -6.6078338623046875, "global_step": 127663, "epoch": 3039} {"train_loss": -6.687170028686523, "global_step": 127664, "epoch": 3039} {"train_loss": -6.687493324279785, "global_step": 127665, "epoch": 3039} {"train_loss": -6.73922872543335, "global_step": 127666, "epoch": 3039} {"train_loss": -6.673925399780273, "global_step": 127667, "epoch": 3039} {"train_loss": -6.760383605957031, "global_step": 127668, "epoch": 3039} {"train_loss": -6.699803352355957, "global_step": 127669, "epoch": 3039} {"train_loss": -6.678412437438965, "global_step": 127670, "epoch": 3039} {"train_loss": -6.711596488952637, "global_step": 127671, "epoch": 3039} {"train_loss": -6.729776382446289, "global_step": 127672, "epoch": 3039} {"train_loss": -6.684128761291504, "global_step": 127673, "epoch": 3039} {"train_loss": -6.724899768829346, "global_step": 127674, "epoch": 3039} {"train_loss": -6.58111572265625, "global_step": 127675, "epoch": 3039} {"train_loss": -6.5784807205200195, "global_step": 127676, "epoch": 3039} {"train_loss": -6.678668975830078, "global_step": 127677, "epoch": 3039} {"train_loss": -6.545455455780029, "global_step": 127678, "epoch": 3039} {"train_loss": -6.681135552270072, "global_step": 127679, "epoch": 3039, "val_loss": 66550.8515625} {"train_loss": -6.51388692855835, "global_step": 127680, "epoch": 3040} {"train_loss": -6.6492018699646, "global_step": 127681, "epoch": 3040} {"train_loss": -6.7365570068359375, "global_step": 127682, "epoch": 3040} {"train_loss": -6.576859951019287, "global_step": 127683, "epoch": 3040} {"train_loss": -6.609431266784668, "global_step": 127684, "epoch": 3040} {"train_loss": -6.4025163650512695, "global_step": 127685, "epoch": 3040} {"train_loss": -6.588033199310303, "global_step": 127686, "epoch": 3040} {"train_loss": -6.531228065490723, "global_step": 127687, "epoch": 3040} {"train_loss": -6.493146896362305, "global_step": 127688, "epoch": 3040} {"train_loss": -6.663849353790283, "global_step": 127689, "epoch": 3040} {"train_loss": -6.387836456298828, "global_step": 127690, "epoch": 3040} {"train_loss": -6.568835258483887, "global_step": 127691, "epoch": 3040} {"train_loss": -6.440047740936279, "global_step": 127692, "epoch": 3040} {"train_loss": -6.620896339416504, "global_step": 127693, "epoch": 3040} {"train_loss": -6.576735496520996, "global_step": 127694, "epoch": 3040} {"train_loss": -6.487868309020996, "global_step": 127695, "epoch": 3040} {"train_loss": -6.563780784606934, "global_step": 127696, "epoch": 3040} {"train_loss": -6.506231784820557, "global_step": 127697, "epoch": 3040} {"train_loss": -6.551580429077148, "global_step": 127698, "epoch": 3040} {"train_loss": -6.53102445602417, "global_step": 127699, "epoch": 3040} {"train_loss": -6.580881595611572, "global_step": 127700, "epoch": 3040} {"train_loss": -6.511786937713623, "global_step": 127701, "epoch": 3040} {"train_loss": -6.597925186157227, "global_step": 127702, "epoch": 3040} {"train_loss": -6.521234035491943, "global_step": 127703, "epoch": 3040} {"train_loss": -6.655987739562988, "global_step": 127704, "epoch": 3040} {"train_loss": -6.6172051429748535, "global_step": 127705, "epoch": 3040} {"train_loss": -6.697612762451172, "global_step": 127706, "epoch": 3040} {"train_loss": -6.661654472351074, "global_step": 127707, "epoch": 3040} {"train_loss": -6.697309970855713, "global_step": 127708, "epoch": 3040} {"train_loss": -6.739927291870117, "global_step": 127709, "epoch": 3040} {"train_loss": -6.764932632446289, "global_step": 127710, "epoch": 3040} {"train_loss": -6.710994720458984, "global_step": 127711, "epoch": 3040} {"train_loss": -6.797648906707764, "global_step": 127712, "epoch": 3040} {"train_loss": -6.716185569763184, "global_step": 127713, "epoch": 3040} {"train_loss": -6.753445625305176, "global_step": 127714, "epoch": 3040} {"train_loss": -6.782880783081055, "global_step": 127715, "epoch": 3040} {"train_loss": -6.715022087097168, "global_step": 127716, "epoch": 3040} {"train_loss": -6.609496116638184, "global_step": 127717, "epoch": 3040} {"train_loss": -6.715188980102539, "global_step": 127718, "epoch": 3040} {"train_loss": -6.690128803253174, "global_step": 127719, "epoch": 3040} {"train_loss": -6.77830171585083, "global_step": 127720, "epoch": 3040} {"train_loss": -6.618864002681914, "global_step": 127721, "epoch": 3040, "val_loss": 66351.390625} {"train_loss": -6.678190231323242, "global_step": 127722, "epoch": 3041} {"train_loss": -6.719768047332764, "global_step": 127723, "epoch": 3041} {"train_loss": -6.6450090408325195, "global_step": 127724, "epoch": 3041} {"train_loss": -6.673354625701904, "global_step": 127725, "epoch": 3041} {"train_loss": -6.625702381134033, "global_step": 127726, "epoch": 3041} {"train_loss": -6.672340393066406, "global_step": 127727, "epoch": 3041} {"train_loss": -6.722504615783691, "global_step": 127728, "epoch": 3041} {"train_loss": -6.710900783538818, "global_step": 127729, "epoch": 3041} {"train_loss": -6.748156547546387, "global_step": 127730, "epoch": 3041} {"train_loss": -6.661823749542236, "global_step": 127731, "epoch": 3041} {"train_loss": -6.639611721038818, "global_step": 127732, "epoch": 3041} {"train_loss": -6.789786338806152, "global_step": 127733, "epoch": 3041} {"train_loss": -6.709554672241211, "global_step": 127734, "epoch": 3041} {"train_loss": -6.611845016479492, "global_step": 127735, "epoch": 3041} {"train_loss": -6.66269063949585, "global_step": 127736, "epoch": 3041} {"train_loss": -6.57990837097168, "global_step": 127737, "epoch": 3041} {"train_loss": -6.64450216293335, "global_step": 127738, "epoch": 3041} {"train_loss": -6.708033561706543, "global_step": 127739, "epoch": 3041} {"train_loss": -6.665892124176025, "global_step": 127740, "epoch": 3041} {"train_loss": -6.774645805358887, "global_step": 127741, "epoch": 3041} {"train_loss": -6.5745530128479, "global_step": 127742, "epoch": 3041} {"train_loss": -6.630794525146484, "global_step": 127743, "epoch": 3041} {"train_loss": -6.662079811096191, "global_step": 127744, "epoch": 3041} {"train_loss": -6.663936138153076, "global_step": 127745, "epoch": 3041} {"train_loss": -6.700003623962402, "global_step": 127746, "epoch": 3041} {"train_loss": -6.538562774658203, "global_step": 127747, "epoch": 3041} {"train_loss": -6.60531759262085, "global_step": 127748, "epoch": 3041} {"train_loss": -6.671374320983887, "global_step": 127749, "epoch": 3041} {"train_loss": -6.6478376388549805, "global_step": 127750, "epoch": 3041} {"train_loss": -6.5970458984375, "global_step": 127751, "epoch": 3041} {"train_loss": -6.591505527496338, "global_step": 127752, "epoch": 3041} {"train_loss": -6.580780982971191, "global_step": 127753, "epoch": 3041} {"train_loss": -6.574668884277344, "global_step": 127754, "epoch": 3041} {"train_loss": -6.562280654907227, "global_step": 127755, "epoch": 3041} {"train_loss": -6.614406585693359, "global_step": 127756, "epoch": 3041} {"train_loss": -6.609913349151611, "global_step": 127757, "epoch": 3041} {"train_loss": -6.527835845947266, "global_step": 127758, "epoch": 3041} {"train_loss": -6.630501747131348, "global_step": 127759, "epoch": 3041} {"train_loss": -6.644582748413086, "global_step": 127760, "epoch": 3041} {"train_loss": -6.577627182006836, "global_step": 127761, "epoch": 3041} {"train_loss": -6.545631408691406, "global_step": 127762, "epoch": 3041} {"train_loss": -6.641155333746047, "global_step": 127763, "epoch": 3041, "val_loss": 66343.6171875} {"train_loss": -6.476076602935791, "global_step": 127764, "epoch": 3042} {"train_loss": -6.443642616271973, "global_step": 127765, "epoch": 3042} {"train_loss": -6.557549953460693, "global_step": 127766, "epoch": 3042} {"train_loss": -6.347411155700684, "global_step": 127767, "epoch": 3042} {"train_loss": -6.558222770690918, "global_step": 127768, "epoch": 3042} {"train_loss": -6.5043721199035645, "global_step": 127769, "epoch": 3042} {"train_loss": -6.652344703674316, "global_step": 127770, "epoch": 3042} {"train_loss": -6.600496292114258, "global_step": 127771, "epoch": 3042} {"train_loss": -6.585715293884277, "global_step": 127772, "epoch": 3042} {"train_loss": -6.581441402435303, "global_step": 127773, "epoch": 3042} {"train_loss": -6.6490092277526855, "global_step": 127774, "epoch": 3042} {"train_loss": -6.57343864440918, "global_step": 127775, "epoch": 3042} {"train_loss": -6.51492977142334, "global_step": 127776, "epoch": 3042} {"train_loss": -6.657502174377441, "global_step": 127777, "epoch": 3042} {"train_loss": -6.565609931945801, "global_step": 127778, "epoch": 3042} {"train_loss": -6.633018970489502, "global_step": 127779, "epoch": 3042} {"train_loss": -6.6444549560546875, "global_step": 127780, "epoch": 3042} {"train_loss": -6.590669631958008, "global_step": 127781, "epoch": 3042} {"train_loss": -6.7519211769104, "global_step": 127782, "epoch": 3042} {"train_loss": -6.601017951965332, "global_step": 127783, "epoch": 3042} {"train_loss": -6.64619255065918, "global_step": 127784, "epoch": 3042} {"train_loss": -6.637022018432617, "global_step": 127785, "epoch": 3042} {"train_loss": -6.683167934417725, "global_step": 127786, "epoch": 3042} {"train_loss": -6.599912643432617, "global_step": 127787, "epoch": 3042} {"train_loss": -6.661185264587402, "global_step": 127788, "epoch": 3042} {"train_loss": -6.554457187652588, "global_step": 127789, "epoch": 3042} {"train_loss": -6.5447096824646, "global_step": 127790, "epoch": 3042} {"train_loss": -6.663899898529053, "global_step": 127791, "epoch": 3042} {"train_loss": -6.658444404602051, "global_step": 127792, "epoch": 3042} {"train_loss": -6.55802059173584, "global_step": 127793, "epoch": 3042} {"train_loss": -6.695504188537598, "global_step": 127794, "epoch": 3042} {"train_loss": -6.615241050720215, "global_step": 127795, "epoch": 3042} {"train_loss": -6.715143203735352, "global_step": 127796, "epoch": 3042} {"train_loss": -6.618960380554199, "global_step": 127797, "epoch": 3042} {"train_loss": -6.545673370361328, "global_step": 127798, "epoch": 3042} {"train_loss": -6.7118353843688965, "global_step": 127799, "epoch": 3042} {"train_loss": -6.632478713989258, "global_step": 127800, "epoch": 3042} {"train_loss": -6.735283851623535, "global_step": 127801, "epoch": 3042} {"train_loss": -6.7708587646484375, "global_step": 127802, "epoch": 3042} {"train_loss": -6.671515464782715, "global_step": 127803, "epoch": 3042} {"train_loss": -6.655874729156494, "global_step": 127804, "epoch": 3042} {"train_loss": -6.611859753018334, "global_step": 127805, "epoch": 3042, "val_loss": 66343.109375} {"train_loss": -6.5948567390441895, "global_step": 127806, "epoch": 3043} {"train_loss": -6.5678558349609375, "global_step": 127807, "epoch": 3043} {"train_loss": -6.672147750854492, "global_step": 127808, "epoch": 3043} {"train_loss": -6.6298675537109375, "global_step": 127809, "epoch": 3043} {"train_loss": -6.691194534301758, "global_step": 127810, "epoch": 3043} {"train_loss": -6.68218994140625, "global_step": 127811, "epoch": 3043} {"train_loss": -6.700037002563477, "global_step": 127812, "epoch": 3043} {"train_loss": -6.62497615814209, "global_step": 127813, "epoch": 3043} {"train_loss": -6.818120002746582, "global_step": 127814, "epoch": 3043} {"train_loss": -6.615809440612793, "global_step": 127815, "epoch": 3043} {"train_loss": -6.718906402587891, "global_step": 127816, "epoch": 3043} {"train_loss": -6.668447971343994, "global_step": 127817, "epoch": 3043} {"train_loss": -6.747185230255127, "global_step": 127818, "epoch": 3043} {"train_loss": -6.571311950683594, "global_step": 127819, "epoch": 3043} {"train_loss": -6.58284330368042, "global_step": 127820, "epoch": 3043} {"train_loss": -6.695627212524414, "global_step": 127821, "epoch": 3043} {"train_loss": -6.754270553588867, "global_step": 127822, "epoch": 3043} {"train_loss": -6.52939510345459, "global_step": 127823, "epoch": 3043} {"train_loss": -6.736201286315918, "global_step": 127824, "epoch": 3043} {"train_loss": -6.664755821228027, "global_step": 127825, "epoch": 3043} {"train_loss": -6.718641757965088, "global_step": 127826, "epoch": 3043} {"train_loss": -6.707673072814941, "global_step": 127827, "epoch": 3043} {"train_loss": -6.674635887145996, "global_step": 127828, "epoch": 3043} {"train_loss": -6.612370491027832, "global_step": 127829, "epoch": 3043} {"train_loss": -6.598322868347168, "global_step": 127830, "epoch": 3043} {"train_loss": -6.678203105926514, "global_step": 127831, "epoch": 3043} {"train_loss": -6.560294151306152, "global_step": 127832, "epoch": 3043} {"train_loss": -6.7089314460754395, "global_step": 127833, "epoch": 3043} {"train_loss": -6.670172691345215, "global_step": 127834, "epoch": 3043} {"train_loss": -6.654295444488525, "global_step": 127835, "epoch": 3043} {"train_loss": -6.728184700012207, "global_step": 127836, "epoch": 3043} {"train_loss": -6.732365608215332, "global_step": 127837, "epoch": 3043} {"train_loss": -6.67933464050293, "global_step": 127838, "epoch": 3043} {"train_loss": -6.715851783752441, "global_step": 127839, "epoch": 3043} {"train_loss": -6.604440212249756, "global_step": 127840, "epoch": 3043} {"train_loss": -6.673711776733398, "global_step": 127841, "epoch": 3043} {"train_loss": -6.808938503265381, "global_step": 127842, "epoch": 3043} {"train_loss": -6.659037113189697, "global_step": 127843, "epoch": 3043} {"train_loss": -6.701578140258789, "global_step": 127844, "epoch": 3043} {"train_loss": -6.675493240356445, "global_step": 127845, "epoch": 3043} {"train_loss": -6.66002893447876, "global_step": 127846, "epoch": 3043} {"train_loss": -6.671422878901164, "global_step": 127847, "epoch": 3043, "val_loss": 66262.4921875} {"train_loss": -6.715175151824951, "global_step": 127848, "epoch": 3044} {"train_loss": -6.716261386871338, "global_step": 127849, "epoch": 3044} {"train_loss": -6.685586929321289, "global_step": 127850, "epoch": 3044} {"train_loss": -6.680201053619385, "global_step": 127851, "epoch": 3044} {"train_loss": -6.670286178588867, "global_step": 127852, "epoch": 3044} {"train_loss": -6.7176313400268555, "global_step": 127853, "epoch": 3044} {"train_loss": -6.80500602722168, "global_step": 127854, "epoch": 3044} {"train_loss": -6.710501670837402, "global_step": 127855, "epoch": 3044} {"train_loss": -6.586938381195068, "global_step": 127856, "epoch": 3044} {"train_loss": -6.626640319824219, "global_step": 127857, "epoch": 3044} {"train_loss": -6.782215118408203, "global_step": 127858, "epoch": 3044} {"train_loss": -6.692198276519775, "global_step": 127859, "epoch": 3044} {"train_loss": -6.668944358825684, "global_step": 127860, "epoch": 3044} {"train_loss": -6.550462245941162, "global_step": 127861, "epoch": 3044} {"train_loss": -6.598359107971191, "global_step": 127862, "epoch": 3044} {"train_loss": -6.613081932067871, "global_step": 127863, "epoch": 3044} {"train_loss": -6.669060230255127, "global_step": 127864, "epoch": 3044} {"train_loss": -6.583549499511719, "global_step": 127865, "epoch": 3044} {"train_loss": -6.621989727020264, "global_step": 127866, "epoch": 3044} {"train_loss": -6.584044933319092, "global_step": 127867, "epoch": 3044} {"train_loss": -6.539645195007324, "global_step": 127868, "epoch": 3044} {"train_loss": -6.602910995483398, "global_step": 127869, "epoch": 3044} {"train_loss": -6.695145606994629, "global_step": 127870, "epoch": 3044} {"train_loss": -6.569043159484863, "global_step": 127871, "epoch": 3044} {"train_loss": -6.587773323059082, "global_step": 127872, "epoch": 3044} {"train_loss": -6.705196380615234, "global_step": 127873, "epoch": 3044} {"train_loss": -6.561522483825684, "global_step": 127874, "epoch": 3044} {"train_loss": -6.594994068145752, "global_step": 127875, "epoch": 3044} {"train_loss": -6.5627288818359375, "global_step": 127876, "epoch": 3044} {"train_loss": -6.655335426330566, "global_step": 127877, "epoch": 3044} {"train_loss": -6.661049842834473, "global_step": 127878, "epoch": 3044} {"train_loss": -6.643531322479248, "global_step": 127879, "epoch": 3044} {"train_loss": -6.708343982696533, "global_step": 127880, "epoch": 3044} {"train_loss": -6.6430583000183105, "global_step": 127881, "epoch": 3044} {"train_loss": -6.556217193603516, "global_step": 127882, "epoch": 3044} {"train_loss": -6.722526550292969, "global_step": 127883, "epoch": 3044} {"train_loss": -6.729475021362305, "global_step": 127884, "epoch": 3044} {"train_loss": -6.570560455322266, "global_step": 127885, "epoch": 3044} {"train_loss": -6.792717933654785, "global_step": 127886, "epoch": 3044} {"train_loss": -6.690276145935059, "global_step": 127887, "epoch": 3044} {"train_loss": -6.731302261352539, "global_step": 127888, "epoch": 3044} {"train_loss": -6.654187872296288, "global_step": 127889, "epoch": 3044, "val_loss": 66288.8984375} {"train_loss": -6.6758036613464355, "global_step": 127890, "epoch": 3045} {"train_loss": -6.730055809020996, "global_step": 127891, "epoch": 3045} {"train_loss": -6.718842506408691, "global_step": 127892, "epoch": 3045} {"train_loss": -6.652958393096924, "global_step": 127893, "epoch": 3045} {"train_loss": -6.728276252746582, "global_step": 127894, "epoch": 3045} {"train_loss": -6.571527004241943, "global_step": 127895, "epoch": 3045} {"train_loss": -6.646153450012207, "global_step": 127896, "epoch": 3045} {"train_loss": -6.635708332061768, "global_step": 127897, "epoch": 3045} {"train_loss": -6.6865997314453125, "global_step": 127898, "epoch": 3045} {"train_loss": -6.577288627624512, "global_step": 127899, "epoch": 3045} {"train_loss": -6.659038066864014, "global_step": 127900, "epoch": 3045} {"train_loss": -6.6359663009643555, "global_step": 127901, "epoch": 3045} {"train_loss": -6.615817546844482, "global_step": 127902, "epoch": 3045} {"train_loss": -6.697623252868652, "global_step": 127903, "epoch": 3045} {"train_loss": -6.701548099517822, "global_step": 127904, "epoch": 3045} {"train_loss": -6.584809303283691, "global_step": 127905, "epoch": 3045} {"train_loss": -6.679584503173828, "global_step": 127906, "epoch": 3045} {"train_loss": -6.766308784484863, "global_step": 127907, "epoch": 3045} {"train_loss": -6.612774848937988, "global_step": 127908, "epoch": 3045} {"train_loss": -6.597078323364258, "global_step": 127909, "epoch": 3045} {"train_loss": -6.633933067321777, "global_step": 127910, "epoch": 3045} {"train_loss": -6.635594367980957, "global_step": 127911, "epoch": 3045} {"train_loss": -6.558019638061523, "global_step": 127912, "epoch": 3045} {"train_loss": -6.699021339416504, "global_step": 127913, "epoch": 3045} {"train_loss": -6.686147689819336, "global_step": 127914, "epoch": 3045} {"train_loss": -6.655807971954346, "global_step": 127915, "epoch": 3045} {"train_loss": -6.785540580749512, "global_step": 127916, "epoch": 3045} {"train_loss": -6.597301483154297, "global_step": 127917, "epoch": 3045} {"train_loss": -6.6877570152282715, "global_step": 127918, "epoch": 3045} {"train_loss": -6.621302604675293, "global_step": 127919, "epoch": 3045} {"train_loss": -6.6453752517700195, "global_step": 127920, "epoch": 3045} {"train_loss": -6.611684799194336, "global_step": 127921, "epoch": 3045} {"train_loss": -6.679669380187988, "global_step": 127922, "epoch": 3045} {"train_loss": -6.783726692199707, "global_step": 127923, "epoch": 3045} {"train_loss": -6.626811504364014, "global_step": 127924, "epoch": 3045} {"train_loss": -6.600800037384033, "global_step": 127925, "epoch": 3045} {"train_loss": -6.629889488220215, "global_step": 127926, "epoch": 3045} {"train_loss": -6.525458335876465, "global_step": 127927, "epoch": 3045} {"train_loss": -6.60640811920166, "global_step": 127928, "epoch": 3045} {"train_loss": -6.532215118408203, "global_step": 127929, "epoch": 3045} {"train_loss": -6.66953182220459, "global_step": 127930, "epoch": 3045} {"train_loss": -6.650582881200881, "global_step": 127931, "epoch": 3045, "val_loss": 66530.21875} {"train_loss": -6.556869983673096, "global_step": 127932, "epoch": 3046} {"train_loss": -6.661282062530518, "global_step": 127933, "epoch": 3046} {"train_loss": -6.642348289489746, "global_step": 127934, "epoch": 3046} {"train_loss": -6.647071838378906, "global_step": 127935, "epoch": 3046} {"train_loss": -6.545365333557129, "global_step": 127936, "epoch": 3046} {"train_loss": -6.572628974914551, "global_step": 127937, "epoch": 3046} {"train_loss": -6.6444854736328125, "global_step": 127938, "epoch": 3046} {"train_loss": -6.550505638122559, "global_step": 127939, "epoch": 3046} {"train_loss": -6.580413818359375, "global_step": 127940, "epoch": 3046} {"train_loss": -6.628072738647461, "global_step": 127941, "epoch": 3046} {"train_loss": -6.548100471496582, "global_step": 127942, "epoch": 3046} {"train_loss": -6.639317512512207, "global_step": 127943, "epoch": 3046} {"train_loss": -6.5646843910217285, "global_step": 127944, "epoch": 3046} {"train_loss": -6.752524375915527, "global_step": 127945, "epoch": 3046} {"train_loss": -6.642370223999023, "global_step": 127946, "epoch": 3046} {"train_loss": -6.626955032348633, "global_step": 127947, "epoch": 3046} {"train_loss": -6.579833984375, "global_step": 127948, "epoch": 3046} {"train_loss": -6.5951972007751465, "global_step": 127949, "epoch": 3046} {"train_loss": -6.472886085510254, "global_step": 127950, "epoch": 3046} {"train_loss": -6.669516563415527, "global_step": 127951, "epoch": 3046} {"train_loss": -6.498780250549316, "global_step": 127952, "epoch": 3046} {"train_loss": -6.473299026489258, "global_step": 127953, "epoch": 3046} {"train_loss": -6.5973100662231445, "global_step": 127954, "epoch": 3046} {"train_loss": -6.488341331481934, "global_step": 127955, "epoch": 3046} {"train_loss": -6.3926801681518555, "global_step": 127956, "epoch": 3046} {"train_loss": -6.54708194732666, "global_step": 127957, "epoch": 3046} {"train_loss": -6.424040794372559, "global_step": 127958, "epoch": 3046} {"train_loss": -6.65944766998291, "global_step": 127959, "epoch": 3046} {"train_loss": -6.514395713806152, "global_step": 127960, "epoch": 3046} {"train_loss": -6.552437782287598, "global_step": 127961, "epoch": 3046} {"train_loss": -6.578847885131836, "global_step": 127962, "epoch": 3046} {"train_loss": -6.55745792388916, "global_step": 127963, "epoch": 3046} {"train_loss": -6.547654628753662, "global_step": 127964, "epoch": 3046} {"train_loss": -6.665210723876953, "global_step": 127965, "epoch": 3046} {"train_loss": -6.532680034637451, "global_step": 127966, "epoch": 3046} {"train_loss": -6.406545162200928, "global_step": 127967, "epoch": 3046} {"train_loss": -6.640235900878906, "global_step": 127968, "epoch": 3046} {"train_loss": -6.370871543884277, "global_step": 127969, "epoch": 3046} {"train_loss": -6.584644794464111, "global_step": 127970, "epoch": 3046} {"train_loss": -6.634641170501709, "global_step": 127971, "epoch": 3046} {"train_loss": -6.681922912597656, "global_step": 127972, "epoch": 3046} {"train_loss": -6.570116077150617, "global_step": 127973, "epoch": 3046, "val_loss": 66301.125} {"train_loss": -6.642544746398926, "global_step": 127974, "epoch": 3047} {"train_loss": -6.606479644775391, "global_step": 127975, "epoch": 3047} {"train_loss": -6.478706359863281, "global_step": 127976, "epoch": 3047} {"train_loss": -6.700439929962158, "global_step": 127977, "epoch": 3047} {"train_loss": -6.633243083953857, "global_step": 127978, "epoch": 3047} {"train_loss": -6.625672340393066, "global_step": 127979, "epoch": 3047} {"train_loss": -6.70295524597168, "global_step": 127980, "epoch": 3047} {"train_loss": -6.641314506530762, "global_step": 127981, "epoch": 3047} {"train_loss": -6.665712356567383, "global_step": 127982, "epoch": 3047} {"train_loss": -6.5500054359436035, "global_step": 127983, "epoch": 3047} {"train_loss": -6.478109836578369, "global_step": 127984, "epoch": 3047} {"train_loss": -6.676319599151611, "global_step": 127985, "epoch": 3047} {"train_loss": -6.554389953613281, "global_step": 127986, "epoch": 3047} {"train_loss": -6.5250163078308105, "global_step": 127987, "epoch": 3047} {"train_loss": -6.459829807281494, "global_step": 127988, "epoch": 3047} {"train_loss": -6.678965091705322, "global_step": 127989, "epoch": 3047} {"train_loss": -6.733994483947754, "global_step": 127990, "epoch": 3047} {"train_loss": -6.587605953216553, "global_step": 127991, "epoch": 3047} {"train_loss": -6.6183576583862305, "global_step": 127992, "epoch": 3047} {"train_loss": -6.523233890533447, "global_step": 127993, "epoch": 3047} {"train_loss": -6.635854244232178, "global_step": 127994, "epoch": 3047} {"train_loss": -6.669844627380371, "global_step": 127995, "epoch": 3047} {"train_loss": -6.580812454223633, "global_step": 127996, "epoch": 3047} {"train_loss": -6.593423366546631, "global_step": 127997, "epoch": 3047} {"train_loss": -6.565586090087891, "global_step": 127998, "epoch": 3047} {"train_loss": -6.532296180725098, "global_step": 127999, "epoch": 3047} {"train_loss": -6.6671528816223145, "global_step": 128000, "epoch": 3047} {"train_loss": -6.557688236236572, "global_step": 128001, "epoch": 3047} {"train_loss": -6.588827133178711, "global_step": 128002, "epoch": 3047} {"train_loss": -6.564292907714844, "global_step": 128003, "epoch": 3047} {"train_loss": -6.519774913787842, "global_step": 128004, "epoch": 3047} {"train_loss": -6.614166736602783, "global_step": 128005, "epoch": 3047} {"train_loss": -6.530345916748047, "global_step": 128006, "epoch": 3047} {"train_loss": -6.596453666687012, "global_step": 128007, "epoch": 3047} {"train_loss": -6.5944647789001465, "global_step": 128008, "epoch": 3047} {"train_loss": -6.600821495056152, "global_step": 128009, "epoch": 3047} {"train_loss": -6.562010765075684, "global_step": 128010, "epoch": 3047} {"train_loss": -6.4999775886535645, "global_step": 128011, "epoch": 3047} {"train_loss": -6.624969482421875, "global_step": 128012, "epoch": 3047} {"train_loss": -6.726701259613037, "global_step": 128013, "epoch": 3047} {"train_loss": -6.508729934692383, "global_step": 128014, "epoch": 3047} {"train_loss": -6.597115391776676, "global_step": 128015, "epoch": 3047, "val_loss": 66121.265625} {"train_loss": -6.62542724609375, "global_step": 128016, "epoch": 3048} {"train_loss": -6.685863494873047, "global_step": 128017, "epoch": 3048} {"train_loss": -6.657644748687744, "global_step": 128018, "epoch": 3048} {"train_loss": -6.602378845214844, "global_step": 128019, "epoch": 3048} {"train_loss": -6.6342363357543945, "global_step": 128020, "epoch": 3048} {"train_loss": -6.627523422241211, "global_step": 128021, "epoch": 3048} {"train_loss": -6.652736663818359, "global_step": 128022, "epoch": 3048} {"train_loss": -6.663626194000244, "global_step": 128023, "epoch": 3048} {"train_loss": -6.675574779510498, "global_step": 128024, "epoch": 3048} {"train_loss": -6.734101295471191, "global_step": 128025, "epoch": 3048} {"train_loss": -6.585113525390625, "global_step": 128026, "epoch": 3048} {"train_loss": -6.797902584075928, "global_step": 128027, "epoch": 3048} {"train_loss": -6.75576639175415, "global_step": 128028, "epoch": 3048} {"train_loss": -6.701282501220703, "global_step": 128029, "epoch": 3048} {"train_loss": -6.67867374420166, "global_step": 128030, "epoch": 3048} {"train_loss": -6.708589553833008, "global_step": 128031, "epoch": 3048} {"train_loss": -6.628777503967285, "global_step": 128032, "epoch": 3048} {"train_loss": -6.64539098739624, "global_step": 128033, "epoch": 3048} {"train_loss": -6.798932075500488, "global_step": 128034, "epoch": 3048} {"train_loss": -6.703120231628418, "global_step": 128035, "epoch": 3048} {"train_loss": -6.61901330947876, "global_step": 128036, "epoch": 3048} {"train_loss": -6.775061130523682, "global_step": 128037, "epoch": 3048} {"train_loss": -6.5699687004089355, "global_step": 128038, "epoch": 3048} {"train_loss": -6.598762512207031, "global_step": 128039, "epoch": 3048} {"train_loss": -6.704617977142334, "global_step": 128040, "epoch": 3048} {"train_loss": -6.733185768127441, "global_step": 128041, "epoch": 3048} {"train_loss": -6.605051517486572, "global_step": 128042, "epoch": 3048} {"train_loss": -6.838147163391113, "global_step": 128043, "epoch": 3048} {"train_loss": -6.638983249664307, "global_step": 128044, "epoch": 3048} {"train_loss": -6.755884170532227, "global_step": 128045, "epoch": 3048} {"train_loss": -6.714066505432129, "global_step": 128046, "epoch": 3048} {"train_loss": -6.816377639770508, "global_step": 128047, "epoch": 3048} {"train_loss": -6.753399848937988, "global_step": 128048, "epoch": 3048} {"train_loss": -6.733523368835449, "global_step": 128049, "epoch": 3048} {"train_loss": -6.804008960723877, "global_step": 128050, "epoch": 3048} {"train_loss": -6.866903305053711, "global_step": 128051, "epoch": 3048} {"train_loss": -6.770764350891113, "global_step": 128052, "epoch": 3048} {"train_loss": -6.803624153137207, "global_step": 128053, "epoch": 3048} {"train_loss": -6.611041069030762, "global_step": 128054, "epoch": 3048} {"train_loss": -6.690071105957031, "global_step": 128055, "epoch": 3048} {"train_loss": -6.789194107055664, "global_step": 128056, "epoch": 3048} {"train_loss": -6.7005656106131415, "global_step": 128057, "epoch": 3048, "val_loss": 66664.5} {"train_loss": -6.644587993621826, "global_step": 128058, "epoch": 3049} {"train_loss": -6.783416748046875, "global_step": 128059, "epoch": 3049} {"train_loss": -6.677379608154297, "global_step": 128060, "epoch": 3049} {"train_loss": -6.743748664855957, "global_step": 128061, "epoch": 3049} {"train_loss": -6.631590366363525, "global_step": 128062, "epoch": 3049} {"train_loss": -6.543003559112549, "global_step": 128063, "epoch": 3049} {"train_loss": -6.737201690673828, "global_step": 128064, "epoch": 3049} {"train_loss": -6.718550205230713, "global_step": 128065, "epoch": 3049} {"train_loss": -6.706053733825684, "global_step": 128066, "epoch": 3049} {"train_loss": -6.701615333557129, "global_step": 128067, "epoch": 3049} {"train_loss": -6.6329498291015625, "global_step": 128068, "epoch": 3049} {"train_loss": -6.700327396392822, "global_step": 128069, "epoch": 3049} {"train_loss": -6.6403374671936035, "global_step": 128070, "epoch": 3049} {"train_loss": -6.7071709632873535, "global_step": 128071, "epoch": 3049} {"train_loss": -6.638641357421875, "global_step": 128072, "epoch": 3049} {"train_loss": -6.637585639953613, "global_step": 128073, "epoch": 3049} {"train_loss": -6.7841644287109375, "global_step": 128074, "epoch": 3049} {"train_loss": -6.667819499969482, "global_step": 128075, "epoch": 3049} {"train_loss": -6.749725341796875, "global_step": 128076, "epoch": 3049} {"train_loss": -6.769646644592285, "global_step": 128077, "epoch": 3049} {"train_loss": -6.638568878173828, "global_step": 128078, "epoch": 3049} {"train_loss": -6.678630828857422, "global_step": 128079, "epoch": 3049} {"train_loss": -6.759433269500732, "global_step": 128080, "epoch": 3049} {"train_loss": -6.576545715332031, "global_step": 128081, "epoch": 3049} {"train_loss": -6.751751899719238, "global_step": 128082, "epoch": 3049} {"train_loss": -6.71865177154541, "global_step": 128083, "epoch": 3049} {"train_loss": -6.6636834144592285, "global_step": 128084, "epoch": 3049} {"train_loss": -6.76040506362915, "global_step": 128085, "epoch": 3049} {"train_loss": -6.680729866027832, "global_step": 128086, "epoch": 3049} {"train_loss": -6.514134407043457, "global_step": 128087, "epoch": 3049} {"train_loss": -6.6110148429870605, "global_step": 128088, "epoch": 3049} {"train_loss": -6.599224090576172, "global_step": 128089, "epoch": 3049} {"train_loss": -6.680051803588867, "global_step": 128090, "epoch": 3049} {"train_loss": -6.527822971343994, "global_step": 128091, "epoch": 3049} {"train_loss": -6.576912879943848, "global_step": 128092, "epoch": 3049} {"train_loss": -6.61583137512207, "global_step": 128093, "epoch": 3049} {"train_loss": -6.5647149085998535, "global_step": 128094, "epoch": 3049} {"train_loss": -6.657770156860352, "global_step": 128095, "epoch": 3049} {"train_loss": -6.518899917602539, "global_step": 128096, "epoch": 3049} {"train_loss": -6.646629333496094, "global_step": 128097, "epoch": 3049} {"train_loss": -6.602560997009277, "global_step": 128098, "epoch": 3049} {"train_loss": -6.664621126084101, "global_step": 128099, "epoch": 3049, "val_loss": 66482.875} {"train_loss": -6.747683525085449, "global_step": 128100, "epoch": 3050} {"train_loss": -6.702689170837402, "global_step": 128101, "epoch": 3050} {"train_loss": -6.7137274742126465, "global_step": 128102, "epoch": 3050} {"train_loss": -6.532031059265137, "global_step": 128103, "epoch": 3050} {"train_loss": -6.705933570861816, "global_step": 128104, "epoch": 3050} {"train_loss": -6.704748153686523, "global_step": 128105, "epoch": 3050} {"train_loss": -6.566107749938965, "global_step": 128106, "epoch": 3050} {"train_loss": -6.727682113647461, "global_step": 128107, "epoch": 3050} {"train_loss": -6.788523197174072, "global_step": 128108, "epoch": 3050} {"train_loss": -6.694832801818848, "global_step": 128109, "epoch": 3050} {"train_loss": -6.492068290710449, "global_step": 128110, "epoch": 3050} {"train_loss": -6.669891834259033, "global_step": 128111, "epoch": 3050} {"train_loss": -6.60858678817749, "global_step": 128112, "epoch": 3050} {"train_loss": -6.598308563232422, "global_step": 128113, "epoch": 3050} {"train_loss": -6.647920608520508, "global_step": 128114, "epoch": 3050} {"train_loss": -6.6736860275268555, "global_step": 128115, "epoch": 3050} {"train_loss": -6.538435935974121, "global_step": 128116, "epoch": 3050} {"train_loss": -6.683469295501709, "global_step": 128117, "epoch": 3050} {"train_loss": -6.515764236450195, "global_step": 128118, "epoch": 3050} {"train_loss": -6.622799873352051, "global_step": 128119, "epoch": 3050} {"train_loss": -6.600748062133789, "global_step": 128120, "epoch": 3050} {"train_loss": -6.668386936187744, "global_step": 128121, "epoch": 3050} {"train_loss": -6.740108966827393, "global_step": 128122, "epoch": 3050} {"train_loss": -6.723169803619385, "global_step": 128123, "epoch": 3050} {"train_loss": -6.701117038726807, "global_step": 128124, "epoch": 3050} {"train_loss": -6.680704593658447, "global_step": 128125, "epoch": 3050} {"train_loss": -6.712333679199219, "global_step": 128126, "epoch": 3050} {"train_loss": -6.690820217132568, "global_step": 128127, "epoch": 3050} {"train_loss": -6.617170333862305, "global_step": 128128, "epoch": 3050} {"train_loss": -6.690488815307617, "global_step": 128129, "epoch": 3050} {"train_loss": -6.724757194519043, "global_step": 128130, "epoch": 3050} {"train_loss": -6.687345504760742, "global_step": 128131, "epoch": 3050} {"train_loss": -6.581967353820801, "global_step": 128132, "epoch": 3050} {"train_loss": -6.721250057220459, "global_step": 128133, "epoch": 3050} {"train_loss": -6.630120277404785, "global_step": 128134, "epoch": 3050} {"train_loss": -6.610466957092285, "global_step": 128135, "epoch": 3050} {"train_loss": -6.659645080566406, "global_step": 128136, "epoch": 3050} {"train_loss": -6.568861961364746, "global_step": 128137, "epoch": 3050} {"train_loss": -6.744067668914795, "global_step": 128138, "epoch": 3050} {"train_loss": -6.603704452514648, "global_step": 128139, "epoch": 3050} {"train_loss": -6.707528591156006, "global_step": 128140, "epoch": 3050} {"train_loss": -6.6556560425531295, "global_step": 128141, "epoch": 3050, "train/sim_max_reward_0": 0.2006318730369974, "train/sim_max_reward_1": 0.9951865954697314, "train/sim_max_reward_2": 0.558831603890996, "train/sim_max_reward_3": 0.8002471512609249, "train/sim_max_reward_4": 0.9938104665234674, "train/sim_max_reward_5": 0.19568863947736684, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5478504020295046, "test/sim_max_reward_4300002": 0.9467239250533156, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8789894464357082, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.902511918956623, "test/sim_max_reward_4300008": 0.9227820686076481, "test/sim_max_reward_4300009": 0.9748239178700979, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.9326060810951706, "test/sim_max_reward_4300013": 0.8148751197018669, "test/sim_max_reward_4300014": 0.9403330039792991, "test/sim_max_reward_4300015": 0.8489887125341887, "test/sim_max_reward_4300016": 0.020252531004158594, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.6081709148791894, "test/sim_max_reward_4300019": 0.18589658944808343, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9242392014776453, "test/sim_max_reward_4300022": 0.8801711372136972, "test/sim_max_reward_4300023": 0.8460646068296253, "test/sim_max_reward_4300024": 0.9718157381969518, "test/sim_max_reward_4300025": 0.9338605735500982, "test/sim_max_reward_4300026": 0.18219794370404338, "test/sim_max_reward_4300027": 0.9375752967012614, "test/sim_max_reward_4300028": 0.9538320589858414, "test/sim_max_reward_4300029": 0.41018120198436847, "test/sim_max_reward_4300030": 0.876954732189762, "test/sim_max_reward_4300031": 0.20978778831159922, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.6984512557184467, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.6919427774945963, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9114729278352985, "test/sim_max_reward_4300038": 0.5340595885378341, "test/sim_max_reward_4300039": 0.903708482971245, "test/sim_max_reward_4300040": 0.7374159466608472, "test/sim_max_reward_4300041": 0.147160509597931, "test/sim_max_reward_4300042": 0.7180152966893415, "test/sim_max_reward_4300043": 0.13755267315338268, "test/sim_max_reward_4300044": 0.9759486571187876, "test/sim_max_reward_4300045": 0.335340911370024, "test/sim_max_reward_4300046": 0.0, "test/sim_max_reward_4300047": 0.17774138123462224, "test/sim_max_reward_4300048": 0.07834761578908041, "test/sim_max_reward_4300049": 0.3363459863683368, "train/mean_score": 0.6240660549432473, "test/mean_score": 0.5850003428330457, "val_loss": 66270.46875} {"train_loss": -6.750555992126465, "global_step": 128142, "epoch": 3051} {"train_loss": -6.683468818664551, "global_step": 128143, "epoch": 3051} {"train_loss": -6.466151237487793, "global_step": 128144, "epoch": 3051} {"train_loss": -6.643141746520996, "global_step": 128145, "epoch": 3051} {"train_loss": -6.576776504516602, "global_step": 128146, "epoch": 3051} {"train_loss": -6.719583988189697, "global_step": 128147, "epoch": 3051} {"train_loss": -6.632256031036377, "global_step": 128148, "epoch": 3051} {"train_loss": -6.543698787689209, "global_step": 128149, "epoch": 3051} {"train_loss": -6.720293998718262, "global_step": 128150, "epoch": 3051} {"train_loss": -6.679694652557373, "global_step": 128151, "epoch": 3051} {"train_loss": -6.6531524658203125, "global_step": 128152, "epoch": 3051} {"train_loss": -6.637892723083496, "global_step": 128153, "epoch": 3051} {"train_loss": -6.60399866104126, "global_step": 128154, "epoch": 3051} {"train_loss": -6.7010650634765625, "global_step": 128155, "epoch": 3051} {"train_loss": -6.808608531951904, "global_step": 128156, "epoch": 3051} {"train_loss": -6.770842552185059, "global_step": 128157, "epoch": 3051} {"train_loss": -6.7476019859313965, "global_step": 128158, "epoch": 3051} {"train_loss": -6.727033615112305, "global_step": 128159, "epoch": 3051} {"train_loss": -6.586068153381348, "global_step": 128160, "epoch": 3051} {"train_loss": -6.593271255493164, "global_step": 128161, "epoch": 3051} {"train_loss": -6.672048568725586, "global_step": 128162, "epoch": 3051} {"train_loss": -6.70765495300293, "global_step": 128163, "epoch": 3051} {"train_loss": -6.666025161743164, "global_step": 128164, "epoch": 3051} {"train_loss": -6.706411361694336, "global_step": 128165, "epoch": 3051} {"train_loss": -6.62087345123291, "global_step": 128166, "epoch": 3051} {"train_loss": -6.582304954528809, "global_step": 128167, "epoch": 3051} {"train_loss": -6.688455581665039, "global_step": 128168, "epoch": 3051} {"train_loss": -6.629824638366699, "global_step": 128169, "epoch": 3051} {"train_loss": -6.72369384765625, "global_step": 128170, "epoch": 3051} {"train_loss": -6.525803565979004, "global_step": 128171, "epoch": 3051} {"train_loss": -6.532837390899658, "global_step": 128172, "epoch": 3051} {"train_loss": -6.645603179931641, "global_step": 128173, "epoch": 3051} {"train_loss": -6.608590126037598, "global_step": 128174, "epoch": 3051} {"train_loss": -6.6050848960876465, "global_step": 128175, "epoch": 3051} {"train_loss": -6.678560733795166, "global_step": 128176, "epoch": 3051} {"train_loss": -6.623052597045898, "global_step": 128177, "epoch": 3051} {"train_loss": -6.5998759269714355, "global_step": 128178, "epoch": 3051} {"train_loss": -6.655788421630859, "global_step": 128179, "epoch": 3051} {"train_loss": -6.581386566162109, "global_step": 128180, "epoch": 3051} {"train_loss": -6.717310905456543, "global_step": 128181, "epoch": 3051} {"train_loss": -6.686409950256348, "global_step": 128182, "epoch": 3051} {"train_loss": -6.651097785858881, "global_step": 128183, "epoch": 3051, "val_loss": 66368.59375} {"train_loss": -6.731544017791748, "global_step": 128184, "epoch": 3052} {"train_loss": -6.769109725952148, "global_step": 128185, "epoch": 3052} {"train_loss": -6.638165473937988, "global_step": 128186, "epoch": 3052} {"train_loss": -6.536952018737793, "global_step": 128187, "epoch": 3052} {"train_loss": -6.65903377532959, "global_step": 128188, "epoch": 3052} {"train_loss": -6.667364120483398, "global_step": 128189, "epoch": 3052} {"train_loss": -6.629858493804932, "global_step": 128190, "epoch": 3052} {"train_loss": -6.741029739379883, "global_step": 128191, "epoch": 3052} {"train_loss": -6.72448205947876, "global_step": 128192, "epoch": 3052} {"train_loss": -6.76692008972168, "global_step": 128193, "epoch": 3052} {"train_loss": -6.62568998336792, "global_step": 128194, "epoch": 3052} {"train_loss": -6.76591157913208, "global_step": 128195, "epoch": 3052} {"train_loss": -6.6710429191589355, "global_step": 128196, "epoch": 3052} {"train_loss": -6.693727493286133, "global_step": 128197, "epoch": 3052} {"train_loss": -6.648713111877441, "global_step": 128198, "epoch": 3052} {"train_loss": -6.617049217224121, "global_step": 128199, "epoch": 3052} {"train_loss": -6.682683944702148, "global_step": 128200, "epoch": 3052} {"train_loss": -6.728270530700684, "global_step": 128201, "epoch": 3052} {"train_loss": -6.553428649902344, "global_step": 128202, "epoch": 3052} {"train_loss": -6.720736503601074, "global_step": 128203, "epoch": 3052} {"train_loss": -6.708372116088867, "global_step": 128204, "epoch": 3052} {"train_loss": -6.734220504760742, "global_step": 128205, "epoch": 3052} {"train_loss": -6.634921073913574, "global_step": 128206, "epoch": 3052} {"train_loss": -6.621509552001953, "global_step": 128207, "epoch": 3052} {"train_loss": -6.712657451629639, "global_step": 128208, "epoch": 3052} {"train_loss": -6.583670616149902, "global_step": 128209, "epoch": 3052} {"train_loss": -6.555764675140381, "global_step": 128210, "epoch": 3052} {"train_loss": -6.510223388671875, "global_step": 128211, "epoch": 3052} {"train_loss": -6.5923237800598145, "global_step": 128212, "epoch": 3052} {"train_loss": -6.564175605773926, "global_step": 128213, "epoch": 3052} {"train_loss": -6.588309288024902, "global_step": 128214, "epoch": 3052} {"train_loss": -6.621212959289551, "global_step": 128215, "epoch": 3052} {"train_loss": -6.629158020019531, "global_step": 128216, "epoch": 3052} {"train_loss": -6.64419412612915, "global_step": 128217, "epoch": 3052} {"train_loss": -6.5202250480651855, "global_step": 128218, "epoch": 3052} {"train_loss": -6.7384843826293945, "global_step": 128219, "epoch": 3052} {"train_loss": -6.565474987030029, "global_step": 128220, "epoch": 3052} {"train_loss": -6.602818965911865, "global_step": 128221, "epoch": 3052} {"train_loss": -6.659302711486816, "global_step": 128222, "epoch": 3052} {"train_loss": -6.664038181304932, "global_step": 128223, "epoch": 3052} {"train_loss": -6.631659984588623, "global_step": 128224, "epoch": 3052} {"train_loss": -6.648936373846872, "global_step": 128225, "epoch": 3052, "val_loss": 66387.25} {"train_loss": -6.728144645690918, "global_step": 128226, "epoch": 3053} {"train_loss": -6.706799507141113, "global_step": 128227, "epoch": 3053} {"train_loss": -6.646574974060059, "global_step": 128228, "epoch": 3053} {"train_loss": -6.740474700927734, "global_step": 128229, "epoch": 3053} {"train_loss": -6.669443130493164, "global_step": 128230, "epoch": 3053} {"train_loss": -6.661402702331543, "global_step": 128231, "epoch": 3053} {"train_loss": -6.679124355316162, "global_step": 128232, "epoch": 3053} {"train_loss": -6.5424370765686035, "global_step": 128233, "epoch": 3053} {"train_loss": -6.7300004959106445, "global_step": 128234, "epoch": 3053} {"train_loss": -6.653518199920654, "global_step": 128235, "epoch": 3053} {"train_loss": -6.6446123123168945, "global_step": 128236, "epoch": 3053} {"train_loss": -6.726961135864258, "global_step": 128237, "epoch": 3053} {"train_loss": -6.659883499145508, "global_step": 128238, "epoch": 3053} {"train_loss": -6.628079414367676, "global_step": 128239, "epoch": 3053} {"train_loss": -6.71137809753418, "global_step": 128240, "epoch": 3053} {"train_loss": -6.695903301239014, "global_step": 128241, "epoch": 3053} {"train_loss": -6.558028221130371, "global_step": 128242, "epoch": 3053} {"train_loss": -6.577815532684326, "global_step": 128243, "epoch": 3053} {"train_loss": -6.727259635925293, "global_step": 128244, "epoch": 3053} {"train_loss": -6.5980939865112305, "global_step": 128245, "epoch": 3053} {"train_loss": -6.672294616699219, "global_step": 128246, "epoch": 3053} {"train_loss": -6.660368919372559, "global_step": 128247, "epoch": 3053} {"train_loss": -6.704034805297852, "global_step": 128248, "epoch": 3053} {"train_loss": -6.557034492492676, "global_step": 128249, "epoch": 3053} {"train_loss": -6.556244850158691, "global_step": 128250, "epoch": 3053} {"train_loss": -6.6738739013671875, "global_step": 128251, "epoch": 3053} {"train_loss": -6.49152946472168, "global_step": 128252, "epoch": 3053} {"train_loss": -6.678656101226807, "global_step": 128253, "epoch": 3053} {"train_loss": -6.682539939880371, "global_step": 128254, "epoch": 3053} {"train_loss": -6.656826496124268, "global_step": 128255, "epoch": 3053} {"train_loss": -6.658122539520264, "global_step": 128256, "epoch": 3053} {"train_loss": -6.651464939117432, "global_step": 128257, "epoch": 3053} {"train_loss": -6.5775628089904785, "global_step": 128258, "epoch": 3053} {"train_loss": -6.6629767417907715, "global_step": 128259, "epoch": 3053} {"train_loss": -6.684727668762207, "global_step": 128260, "epoch": 3053} {"train_loss": -6.725299835205078, "global_step": 128261, "epoch": 3053} {"train_loss": -6.5822272300720215, "global_step": 128262, "epoch": 3053} {"train_loss": -6.681948661804199, "global_step": 128263, "epoch": 3053} {"train_loss": -6.50844669342041, "global_step": 128264, "epoch": 3053} {"train_loss": -6.713719367980957, "global_step": 128265, "epoch": 3053} {"train_loss": -6.777392387390137, "global_step": 128266, "epoch": 3053} {"train_loss": -6.6521056947254, "global_step": 128267, "epoch": 3053, "val_loss": 66528.2421875} {"train_loss": -6.551905632019043, "global_step": 128268, "epoch": 3054} {"train_loss": -6.6617207527160645, "global_step": 128269, "epoch": 3054} {"train_loss": -6.7382283210754395, "global_step": 128270, "epoch": 3054} {"train_loss": -6.688605785369873, "global_step": 128271, "epoch": 3054} {"train_loss": -6.723201274871826, "global_step": 128272, "epoch": 3054} {"train_loss": -6.727768898010254, "global_step": 128273, "epoch": 3054} {"train_loss": -6.784422874450684, "global_step": 128274, "epoch": 3054} {"train_loss": -6.7101593017578125, "global_step": 128275, "epoch": 3054} {"train_loss": -6.6698384284973145, "global_step": 128276, "epoch": 3054} {"train_loss": -6.773501396179199, "global_step": 128277, "epoch": 3054} {"train_loss": -6.659169673919678, "global_step": 128278, "epoch": 3054} {"train_loss": -6.617795467376709, "global_step": 128279, "epoch": 3054} {"train_loss": -6.688237190246582, "global_step": 128280, "epoch": 3054} {"train_loss": -6.5731282234191895, "global_step": 128281, "epoch": 3054} {"train_loss": -6.659095764160156, "global_step": 128282, "epoch": 3054} {"train_loss": -6.739709854125977, "global_step": 128283, "epoch": 3054} {"train_loss": -6.745833396911621, "global_step": 128284, "epoch": 3054} {"train_loss": -6.727421760559082, "global_step": 128285, "epoch": 3054} {"train_loss": -6.656148910522461, "global_step": 128286, "epoch": 3054} {"train_loss": -6.631387710571289, "global_step": 128287, "epoch": 3054} {"train_loss": -6.662924766540527, "global_step": 128288, "epoch": 3054} {"train_loss": -6.78913688659668, "global_step": 128289, "epoch": 3054} {"train_loss": -6.732029438018799, "global_step": 128290, "epoch": 3054} {"train_loss": -6.577169895172119, "global_step": 128291, "epoch": 3054} {"train_loss": -6.8167572021484375, "global_step": 128292, "epoch": 3054} {"train_loss": -6.679198741912842, "global_step": 128293, "epoch": 3054} {"train_loss": -6.648373603820801, "global_step": 128294, "epoch": 3054} {"train_loss": -6.726763725280762, "global_step": 128295, "epoch": 3054} {"train_loss": -6.591592788696289, "global_step": 128296, "epoch": 3054} {"train_loss": -6.60521125793457, "global_step": 128297, "epoch": 3054} {"train_loss": -6.710516929626465, "global_step": 128298, "epoch": 3054} {"train_loss": -6.652382850646973, "global_step": 128299, "epoch": 3054} {"train_loss": -6.692471981048584, "global_step": 128300, "epoch": 3054} {"train_loss": -6.602242469787598, "global_step": 128301, "epoch": 3054} {"train_loss": -6.6649250984191895, "global_step": 128302, "epoch": 3054} {"train_loss": -6.66790771484375, "global_step": 128303, "epoch": 3054} {"train_loss": -6.656300067901611, "global_step": 128304, "epoch": 3054} {"train_loss": -6.5794172286987305, "global_step": 128305, "epoch": 3054} {"train_loss": -6.578507900238037, "global_step": 128306, "epoch": 3054} {"train_loss": -6.674721717834473, "global_step": 128307, "epoch": 3054} {"train_loss": -6.574522495269775, "global_step": 128308, "epoch": 3054} {"train_loss": -6.672379981903803, "global_step": 128309, "epoch": 3054, "val_loss": 66261.7109375} {"train_loss": -6.732595920562744, "global_step": 128310, "epoch": 3055} {"train_loss": -6.62542724609375, "global_step": 128311, "epoch": 3055} {"train_loss": -6.700709342956543, "global_step": 128312, "epoch": 3055} {"train_loss": -6.533267021179199, "global_step": 128313, "epoch": 3055} {"train_loss": -6.670536994934082, "global_step": 128314, "epoch": 3055} {"train_loss": -6.63508415222168, "global_step": 128315, "epoch": 3055} {"train_loss": -6.63224983215332, "global_step": 128316, "epoch": 3055} {"train_loss": -6.765247344970703, "global_step": 128317, "epoch": 3055} {"train_loss": -6.553140163421631, "global_step": 128318, "epoch": 3055} {"train_loss": -6.64447546005249, "global_step": 128319, "epoch": 3055} {"train_loss": -6.724221229553223, "global_step": 128320, "epoch": 3055} {"train_loss": -6.674607753753662, "global_step": 128321, "epoch": 3055} {"train_loss": -6.641712188720703, "global_step": 128322, "epoch": 3055} {"train_loss": -6.4941558837890625, "global_step": 128323, "epoch": 3055} {"train_loss": -6.510529518127441, "global_step": 128324, "epoch": 3055} {"train_loss": -6.617928981781006, "global_step": 128325, "epoch": 3055} {"train_loss": -6.689373016357422, "global_step": 128326, "epoch": 3055} {"train_loss": -6.486781120300293, "global_step": 128327, "epoch": 3055} {"train_loss": -6.583765029907227, "global_step": 128328, "epoch": 3055} {"train_loss": -6.5534210205078125, "global_step": 128329, "epoch": 3055} {"train_loss": -6.670756816864014, "global_step": 128330, "epoch": 3055} {"train_loss": -6.619200229644775, "global_step": 128331, "epoch": 3055} {"train_loss": -6.674854278564453, "global_step": 128332, "epoch": 3055} {"train_loss": -6.528128623962402, "global_step": 128333, "epoch": 3055} {"train_loss": -6.702688217163086, "global_step": 128334, "epoch": 3055} {"train_loss": -6.60162353515625, "global_step": 128335, "epoch": 3055} {"train_loss": -6.586920261383057, "global_step": 128336, "epoch": 3055} {"train_loss": -6.660326957702637, "global_step": 128337, "epoch": 3055} {"train_loss": -6.6468024253845215, "global_step": 128338, "epoch": 3055} {"train_loss": -6.560729503631592, "global_step": 128339, "epoch": 3055} {"train_loss": -6.641308784484863, "global_step": 128340, "epoch": 3055} {"train_loss": -6.655034065246582, "global_step": 128341, "epoch": 3055} {"train_loss": -6.65726375579834, "global_step": 128342, "epoch": 3055} {"train_loss": -6.756928443908691, "global_step": 128343, "epoch": 3055} {"train_loss": -6.660882949829102, "global_step": 128344, "epoch": 3055} {"train_loss": -6.752845764160156, "global_step": 128345, "epoch": 3055} {"train_loss": -6.750993251800537, "global_step": 128346, "epoch": 3055} {"train_loss": -6.708217620849609, "global_step": 128347, "epoch": 3055} {"train_loss": -6.7534379959106445, "global_step": 128348, "epoch": 3055} {"train_loss": -6.631220817565918, "global_step": 128349, "epoch": 3055} {"train_loss": -6.644164562225342, "global_step": 128350, "epoch": 3055} {"train_loss": -6.642344168254307, "global_step": 128351, "epoch": 3055, "val_loss": 66244.328125} {"train_loss": -6.671165466308594, "global_step": 128352, "epoch": 3056} {"train_loss": -6.584778785705566, "global_step": 128353, "epoch": 3056} {"train_loss": -6.623432159423828, "global_step": 128354, "epoch": 3056} {"train_loss": -6.619574069976807, "global_step": 128355, "epoch": 3056} {"train_loss": -6.64605712890625, "global_step": 128356, "epoch": 3056} {"train_loss": -6.689715385437012, "global_step": 128357, "epoch": 3056} {"train_loss": -6.636465072631836, "global_step": 128358, "epoch": 3056} {"train_loss": -6.675692558288574, "global_step": 128359, "epoch": 3056} {"train_loss": -6.71595573425293, "global_step": 128360, "epoch": 3056} {"train_loss": -6.71129846572876, "global_step": 128361, "epoch": 3056} {"train_loss": -6.719066619873047, "global_step": 128362, "epoch": 3056} {"train_loss": -6.657749652862549, "global_step": 128363, "epoch": 3056} {"train_loss": -6.699030876159668, "global_step": 128364, "epoch": 3056} {"train_loss": -6.66851806640625, "global_step": 128365, "epoch": 3056} {"train_loss": -6.646461009979248, "global_step": 128366, "epoch": 3056} {"train_loss": -6.735580921173096, "global_step": 128367, "epoch": 3056} {"train_loss": -6.744291305541992, "global_step": 128368, "epoch": 3056} {"train_loss": -6.705765247344971, "global_step": 128369, "epoch": 3056} {"train_loss": -6.79410982131958, "global_step": 128370, "epoch": 3056} {"train_loss": -6.607239723205566, "global_step": 128371, "epoch": 3056} {"train_loss": -6.613077163696289, "global_step": 128372, "epoch": 3056} {"train_loss": -6.657065391540527, "global_step": 128373, "epoch": 3056} {"train_loss": -6.644062042236328, "global_step": 128374, "epoch": 3056} {"train_loss": -6.562978744506836, "global_step": 128375, "epoch": 3056} {"train_loss": -6.659087657928467, "global_step": 128376, "epoch": 3056} {"train_loss": -6.669524669647217, "global_step": 128377, "epoch": 3056} {"train_loss": -6.696732521057129, "global_step": 128378, "epoch": 3056} {"train_loss": -6.641341686248779, "global_step": 128379, "epoch": 3056} {"train_loss": -6.605175971984863, "global_step": 128380, "epoch": 3056} {"train_loss": -6.668606758117676, "global_step": 128381, "epoch": 3056} {"train_loss": -6.632004737854004, "global_step": 128382, "epoch": 3056} {"train_loss": -6.59757661819458, "global_step": 128383, "epoch": 3056} {"train_loss": -6.620786666870117, "global_step": 128384, "epoch": 3056} {"train_loss": -6.60228157043457, "global_step": 128385, "epoch": 3056} {"train_loss": -6.5724287033081055, "global_step": 128386, "epoch": 3056} {"train_loss": -6.561901092529297, "global_step": 128387, "epoch": 3056} {"train_loss": -6.592440128326416, "global_step": 128388, "epoch": 3056} {"train_loss": -6.486695289611816, "global_step": 128389, "epoch": 3056} {"train_loss": -6.6281633377075195, "global_step": 128390, "epoch": 3056} {"train_loss": -6.476720809936523, "global_step": 128391, "epoch": 3056} {"train_loss": -6.598172187805176, "global_step": 128392, "epoch": 3056} {"train_loss": -6.6403805414835615, "global_step": 128393, "epoch": 3056, "val_loss": 66445.34375} {"train_loss": -6.432570457458496, "global_step": 128394, "epoch": 3057} {"train_loss": -6.700850009918213, "global_step": 128395, "epoch": 3057} {"train_loss": -6.507349491119385, "global_step": 128396, "epoch": 3057} {"train_loss": -6.642851829528809, "global_step": 128397, "epoch": 3057} {"train_loss": -6.543211460113525, "global_step": 128398, "epoch": 3057} {"train_loss": -6.5308122634887695, "global_step": 128399, "epoch": 3057} {"train_loss": -6.491155624389648, "global_step": 128400, "epoch": 3057} {"train_loss": -6.674535751342773, "global_step": 128401, "epoch": 3057} {"train_loss": -6.495335578918457, "global_step": 128402, "epoch": 3057} {"train_loss": -6.533746242523193, "global_step": 128403, "epoch": 3057} {"train_loss": -6.629979133605957, "global_step": 128404, "epoch": 3057} {"train_loss": -6.507057189941406, "global_step": 128405, "epoch": 3057} {"train_loss": -6.594034194946289, "global_step": 128406, "epoch": 3057} {"train_loss": -6.488514423370361, "global_step": 128407, "epoch": 3057} {"train_loss": -6.475170135498047, "global_step": 128408, "epoch": 3057} {"train_loss": -6.564263343811035, "global_step": 128409, "epoch": 3057} {"train_loss": -6.531233787536621, "global_step": 128410, "epoch": 3057} {"train_loss": -6.6008501052856445, "global_step": 128411, "epoch": 3057} {"train_loss": -6.535489559173584, "global_step": 128412, "epoch": 3057} {"train_loss": -6.589733600616455, "global_step": 128413, "epoch": 3057} {"train_loss": -6.583771228790283, "global_step": 128414, "epoch": 3057} {"train_loss": -6.549887657165527, "global_step": 128415, "epoch": 3057} {"train_loss": -6.661228656768799, "global_step": 128416, "epoch": 3057} {"train_loss": -6.651400566101074, "global_step": 128417, "epoch": 3057} {"train_loss": -6.723139762878418, "global_step": 128418, "epoch": 3057} {"train_loss": -6.595481872558594, "global_step": 128419, "epoch": 3057} {"train_loss": -6.597378253936768, "global_step": 128420, "epoch": 3057} {"train_loss": -6.6121110916137695, "global_step": 128421, "epoch": 3057} {"train_loss": -6.685007095336914, "global_step": 128422, "epoch": 3057} {"train_loss": -6.575821876525879, "global_step": 128423, "epoch": 3057} {"train_loss": -6.5714521408081055, "global_step": 128424, "epoch": 3057} {"train_loss": -6.647883415222168, "global_step": 128425, "epoch": 3057} {"train_loss": -6.644991874694824, "global_step": 128426, "epoch": 3057} {"train_loss": -6.623970985412598, "global_step": 128427, "epoch": 3057} {"train_loss": -6.589970111846924, "global_step": 128428, "epoch": 3057} {"train_loss": -6.644077301025391, "global_step": 128429, "epoch": 3057} {"train_loss": -6.687889575958252, "global_step": 128430, "epoch": 3057} {"train_loss": -6.705501079559326, "global_step": 128431, "epoch": 3057} {"train_loss": -6.700158596038818, "global_step": 128432, "epoch": 3057} {"train_loss": -6.751214027404785, "global_step": 128433, "epoch": 3057} {"train_loss": -6.59727668762207, "global_step": 128434, "epoch": 3057} {"train_loss": -6.596906094324021, "global_step": 128435, "epoch": 3057, "val_loss": 66345.953125} {"train_loss": -6.6381683349609375, "global_step": 128436, "epoch": 3058} {"train_loss": -6.659929275512695, "global_step": 128437, "epoch": 3058} {"train_loss": -6.641386032104492, "global_step": 128438, "epoch": 3058} {"train_loss": -6.524874210357666, "global_step": 128439, "epoch": 3058} {"train_loss": -6.528721809387207, "global_step": 128440, "epoch": 3058} {"train_loss": -6.571847915649414, "global_step": 128441, "epoch": 3058} {"train_loss": -6.502689361572266, "global_step": 128442, "epoch": 3058} {"train_loss": -6.588037490844727, "global_step": 128443, "epoch": 3058} {"train_loss": -6.6280341148376465, "global_step": 128444, "epoch": 3058} {"train_loss": -6.445590972900391, "global_step": 128445, "epoch": 3058} {"train_loss": -6.645051002502441, "global_step": 128446, "epoch": 3058} {"train_loss": -6.426077365875244, "global_step": 128447, "epoch": 3058} {"train_loss": -6.571175575256348, "global_step": 128448, "epoch": 3058} {"train_loss": -6.598735809326172, "global_step": 128449, "epoch": 3058} {"train_loss": -6.568334579467773, "global_step": 128450, "epoch": 3058} {"train_loss": -6.6962432861328125, "global_step": 128451, "epoch": 3058} {"train_loss": -6.626023292541504, "global_step": 128452, "epoch": 3058} {"train_loss": -6.640786170959473, "global_step": 128453, "epoch": 3058} {"train_loss": -6.602373123168945, "global_step": 128454, "epoch": 3058} {"train_loss": -6.64275598526001, "global_step": 128455, "epoch": 3058} {"train_loss": -6.701557159423828, "global_step": 128456, "epoch": 3058} {"train_loss": -6.629938125610352, "global_step": 128457, "epoch": 3058} {"train_loss": -6.622255325317383, "global_step": 128458, "epoch": 3058} {"train_loss": -6.671741485595703, "global_step": 128459, "epoch": 3058} {"train_loss": -6.6710004806518555, "global_step": 128460, "epoch": 3058} {"train_loss": -6.767305374145508, "global_step": 128461, "epoch": 3058} {"train_loss": -6.66008186340332, "global_step": 128462, "epoch": 3058} {"train_loss": -6.531932830810547, "global_step": 128463, "epoch": 3058} {"train_loss": -6.546715259552002, "global_step": 128464, "epoch": 3058} {"train_loss": -6.778554916381836, "global_step": 128465, "epoch": 3058} {"train_loss": -6.646764755249023, "global_step": 128466, "epoch": 3058} {"train_loss": -6.582317352294922, "global_step": 128467, "epoch": 3058} {"train_loss": -6.711634159088135, "global_step": 128468, "epoch": 3058} {"train_loss": -6.649467468261719, "global_step": 128469, "epoch": 3058} {"train_loss": -6.668482780456543, "global_step": 128470, "epoch": 3058} {"train_loss": -6.659741401672363, "global_step": 128471, "epoch": 3058} {"train_loss": -6.624215602874756, "global_step": 128472, "epoch": 3058} {"train_loss": -6.695671081542969, "global_step": 128473, "epoch": 3058} {"train_loss": -6.5280022621154785, "global_step": 128474, "epoch": 3058} {"train_loss": -6.709821701049805, "global_step": 128475, "epoch": 3058} {"train_loss": -6.596497058868408, "global_step": 128476, "epoch": 3058} {"train_loss": -6.619825453985305, "global_step": 128477, "epoch": 3058, "val_loss": 66455.7421875} {"train_loss": -6.675528526306152, "global_step": 128478, "epoch": 3059} {"train_loss": -6.691187858581543, "global_step": 128479, "epoch": 3059} {"train_loss": -6.717350959777832, "global_step": 128480, "epoch": 3059} {"train_loss": -6.6970109939575195, "global_step": 128481, "epoch": 3059} {"train_loss": -6.672114372253418, "global_step": 128482, "epoch": 3059} {"train_loss": -6.781760215759277, "global_step": 128483, "epoch": 3059} {"train_loss": -6.722275733947754, "global_step": 128484, "epoch": 3059} {"train_loss": -6.6910600662231445, "global_step": 128485, "epoch": 3059} {"train_loss": -6.482811450958252, "global_step": 128486, "epoch": 3059} {"train_loss": -6.699930191040039, "global_step": 128487, "epoch": 3059} {"train_loss": -6.71907377243042, "global_step": 128488, "epoch": 3059} {"train_loss": -6.702805042266846, "global_step": 128489, "epoch": 3059} {"train_loss": -6.685818672180176, "global_step": 128490, "epoch": 3059} {"train_loss": -6.6597771644592285, "global_step": 128491, "epoch": 3059} {"train_loss": -6.701391220092773, "global_step": 128492, "epoch": 3059} {"train_loss": -6.694488525390625, "global_step": 128493, "epoch": 3059} {"train_loss": -6.7804975509643555, "global_step": 128494, "epoch": 3059} {"train_loss": -6.81897497177124, "global_step": 128495, "epoch": 3059} {"train_loss": -6.779844760894775, "global_step": 128496, "epoch": 3059} {"train_loss": -6.628884792327881, "global_step": 128497, "epoch": 3059} {"train_loss": -6.670273780822754, "global_step": 128498, "epoch": 3059} {"train_loss": -6.659242630004883, "global_step": 128499, "epoch": 3059} {"train_loss": -6.725526809692383, "global_step": 128500, "epoch": 3059} {"train_loss": -6.675784587860107, "global_step": 128501, "epoch": 3059} {"train_loss": -6.606717109680176, "global_step": 128502, "epoch": 3059} {"train_loss": -6.704350471496582, "global_step": 128503, "epoch": 3059} {"train_loss": -6.710179328918457, "global_step": 128504, "epoch": 3059} {"train_loss": -6.690369606018066, "global_step": 128505, "epoch": 3059} {"train_loss": -6.644333839416504, "global_step": 128506, "epoch": 3059} {"train_loss": -6.691014766693115, "global_step": 128507, "epoch": 3059} {"train_loss": -6.717446327209473, "global_step": 128508, "epoch": 3059} {"train_loss": -6.619658470153809, "global_step": 128509, "epoch": 3059} {"train_loss": -6.645373344421387, "global_step": 128510, "epoch": 3059} {"train_loss": -6.721354961395264, "global_step": 128511, "epoch": 3059} {"train_loss": -6.57283878326416, "global_step": 128512, "epoch": 3059} {"train_loss": -6.501352310180664, "global_step": 128513, "epoch": 3059} {"train_loss": -6.723150730133057, "global_step": 128514, "epoch": 3059} {"train_loss": -6.650826454162598, "global_step": 128515, "epoch": 3059} {"train_loss": -6.564846992492676, "global_step": 128516, "epoch": 3059} {"train_loss": -6.556694984436035, "global_step": 128517, "epoch": 3059} {"train_loss": -6.755283355712891, "global_step": 128518, "epoch": 3059} {"train_loss": -6.676723434811547, "global_step": 128519, "epoch": 3059, "val_loss": 66583.9921875} {"train_loss": -6.622448444366455, "global_step": 128520, "epoch": 3060} {"train_loss": -6.700177192687988, "global_step": 128521, "epoch": 3060} {"train_loss": -6.657289505004883, "global_step": 128522, "epoch": 3060} {"train_loss": -6.623067855834961, "global_step": 128523, "epoch": 3060} {"train_loss": -6.6324849128723145, "global_step": 128524, "epoch": 3060} {"train_loss": -6.708192348480225, "global_step": 128525, "epoch": 3060} {"train_loss": -6.618378639221191, "global_step": 128526, "epoch": 3060} {"train_loss": -6.581598281860352, "global_step": 128527, "epoch": 3060} {"train_loss": -6.621215343475342, "global_step": 128528, "epoch": 3060} {"train_loss": -6.59084415435791, "global_step": 128529, "epoch": 3060} {"train_loss": -6.56186056137085, "global_step": 128530, "epoch": 3060} {"train_loss": -6.6430768966674805, "global_step": 128531, "epoch": 3060} {"train_loss": -6.59446907043457, "global_step": 128532, "epoch": 3060} {"train_loss": -6.675293922424316, "global_step": 128533, "epoch": 3060} {"train_loss": -6.571540832519531, "global_step": 128534, "epoch": 3060} {"train_loss": -6.640806674957275, "global_step": 128535, "epoch": 3060} {"train_loss": -6.654142379760742, "global_step": 128536, "epoch": 3060} {"train_loss": -6.661691665649414, "global_step": 128537, "epoch": 3060} {"train_loss": -6.624708652496338, "global_step": 128538, "epoch": 3060} {"train_loss": -6.73858642578125, "global_step": 128539, "epoch": 3060} {"train_loss": -6.57094669342041, "global_step": 128540, "epoch": 3060} {"train_loss": -6.600926876068115, "global_step": 128541, "epoch": 3060} {"train_loss": -6.44980525970459, "global_step": 128542, "epoch": 3060} {"train_loss": -6.538315773010254, "global_step": 128543, "epoch": 3060} {"train_loss": -6.643977165222168, "global_step": 128544, "epoch": 3060} {"train_loss": -6.568238735198975, "global_step": 128545, "epoch": 3060} {"train_loss": -6.656769752502441, "global_step": 128546, "epoch": 3060} {"train_loss": -6.80184268951416, "global_step": 128547, "epoch": 3060} {"train_loss": -6.623285293579102, "global_step": 128548, "epoch": 3060} {"train_loss": -6.67255163192749, "global_step": 128549, "epoch": 3060} {"train_loss": -6.668840408325195, "global_step": 128550, "epoch": 3060} {"train_loss": -6.594383716583252, "global_step": 128551, "epoch": 3060} {"train_loss": -6.669727325439453, "global_step": 128552, "epoch": 3060} {"train_loss": -6.6577534675598145, "global_step": 128553, "epoch": 3060} {"train_loss": -6.633913993835449, "global_step": 128554, "epoch": 3060} {"train_loss": -6.675206661224365, "global_step": 128555, "epoch": 3060} {"train_loss": -6.568561553955078, "global_step": 128556, "epoch": 3060} {"train_loss": -6.691830635070801, "global_step": 128557, "epoch": 3060} {"train_loss": -6.653567314147949, "global_step": 128558, "epoch": 3060} {"train_loss": -6.560924530029297, "global_step": 128559, "epoch": 3060} {"train_loss": -6.635725021362305, "global_step": 128560, "epoch": 3060} {"train_loss": -6.630521694819133, "global_step": 128561, "epoch": 3060, "val_loss": 66394.8359375} {"train_loss": -6.671628952026367, "global_step": 128562, "epoch": 3061} {"train_loss": -6.674535751342773, "global_step": 128563, "epoch": 3061} {"train_loss": -6.653896331787109, "global_step": 128564, "epoch": 3061} {"train_loss": -6.6961565017700195, "global_step": 128565, "epoch": 3061} {"train_loss": -6.5480194091796875, "global_step": 128566, "epoch": 3061} {"train_loss": -6.672992706298828, "global_step": 128567, "epoch": 3061} {"train_loss": -6.775513172149658, "global_step": 128568, "epoch": 3061} {"train_loss": -6.655785083770752, "global_step": 128569, "epoch": 3061} {"train_loss": -6.743753910064697, "global_step": 128570, "epoch": 3061} {"train_loss": -6.699247360229492, "global_step": 128571, "epoch": 3061} {"train_loss": -6.656005859375, "global_step": 128572, "epoch": 3061} {"train_loss": -6.783457279205322, "global_step": 128573, "epoch": 3061} {"train_loss": -6.652535438537598, "global_step": 128574, "epoch": 3061} {"train_loss": -6.679740905761719, "global_step": 128575, "epoch": 3061} {"train_loss": -6.739767074584961, "global_step": 128576, "epoch": 3061} {"train_loss": -6.733227252960205, "global_step": 128577, "epoch": 3061} {"train_loss": -6.62169075012207, "global_step": 128578, "epoch": 3061} {"train_loss": -6.725945472717285, "global_step": 128579, "epoch": 3061} {"train_loss": -6.679462432861328, "global_step": 128580, "epoch": 3061} {"train_loss": -6.696562767028809, "global_step": 128581, "epoch": 3061} {"train_loss": -6.747078895568848, "global_step": 128582, "epoch": 3061} {"train_loss": -6.604375839233398, "global_step": 128583, "epoch": 3061} {"train_loss": -6.677984237670898, "global_step": 128584, "epoch": 3061} {"train_loss": -6.5709309577941895, "global_step": 128585, "epoch": 3061} {"train_loss": -6.716765403747559, "global_step": 128586, "epoch": 3061} {"train_loss": -6.665777206420898, "global_step": 128587, "epoch": 3061} {"train_loss": -6.514433860778809, "global_step": 128588, "epoch": 3061} {"train_loss": -6.647706985473633, "global_step": 128589, "epoch": 3061} {"train_loss": -6.5396552085876465, "global_step": 128590, "epoch": 3061} {"train_loss": -6.581906318664551, "global_step": 128591, "epoch": 3061} {"train_loss": -6.594801902770996, "global_step": 128592, "epoch": 3061} {"train_loss": -6.673250198364258, "global_step": 128593, "epoch": 3061} {"train_loss": -6.7168474197387695, "global_step": 128594, "epoch": 3061} {"train_loss": -6.5433125495910645, "global_step": 128595, "epoch": 3061} {"train_loss": -6.525571346282959, "global_step": 128596, "epoch": 3061} {"train_loss": -6.591285705566406, "global_step": 128597, "epoch": 3061} {"train_loss": -6.601652145385742, "global_step": 128598, "epoch": 3061} {"train_loss": -6.655780792236328, "global_step": 128599, "epoch": 3061} {"train_loss": -6.685028076171875, "global_step": 128600, "epoch": 3061} {"train_loss": -6.693758964538574, "global_step": 128601, "epoch": 3061} {"train_loss": -6.611475944519043, "global_step": 128602, "epoch": 3061} {"train_loss": -6.656984510875883, "global_step": 128603, "epoch": 3061, "val_loss": 66379.1875} {"train_loss": -6.692584037780762, "global_step": 128604, "epoch": 3062} {"train_loss": -6.695794582366943, "global_step": 128605, "epoch": 3062} {"train_loss": -6.725849151611328, "global_step": 128606, "epoch": 3062} {"train_loss": -6.6693525314331055, "global_step": 128607, "epoch": 3062} {"train_loss": -6.70893669128418, "global_step": 128608, "epoch": 3062} {"train_loss": -6.6276655197143555, "global_step": 128609, "epoch": 3062} {"train_loss": -6.6994476318359375, "global_step": 128610, "epoch": 3062} {"train_loss": -6.60590934753418, "global_step": 128611, "epoch": 3062} {"train_loss": -6.600645065307617, "global_step": 128612, "epoch": 3062} {"train_loss": -6.69966983795166, "global_step": 128613, "epoch": 3062} {"train_loss": -6.772363662719727, "global_step": 128614, "epoch": 3062} {"train_loss": -6.811717987060547, "global_step": 128615, "epoch": 3062} {"train_loss": -6.688201904296875, "global_step": 128616, "epoch": 3062} {"train_loss": -6.781045913696289, "global_step": 128617, "epoch": 3062} {"train_loss": -6.723822593688965, "global_step": 128618, "epoch": 3062} {"train_loss": -6.662558555603027, "global_step": 128619, "epoch": 3062} {"train_loss": -6.824150085449219, "global_step": 128620, "epoch": 3062} {"train_loss": -6.66413688659668, "global_step": 128621, "epoch": 3062} {"train_loss": -6.543813228607178, "global_step": 128622, "epoch": 3062} {"train_loss": -6.681941986083984, "global_step": 128623, "epoch": 3062} {"train_loss": -6.573862075805664, "global_step": 128624, "epoch": 3062} {"train_loss": -6.680813312530518, "global_step": 128625, "epoch": 3062} {"train_loss": -6.61286735534668, "global_step": 128626, "epoch": 3062} {"train_loss": -6.599853515625, "global_step": 128627, "epoch": 3062} {"train_loss": -6.581715106964111, "global_step": 128628, "epoch": 3062} {"train_loss": -6.615514755249023, "global_step": 128629, "epoch": 3062} {"train_loss": -6.629940509796143, "global_step": 128630, "epoch": 3062} {"train_loss": -6.631097793579102, "global_step": 128631, "epoch": 3062} {"train_loss": -6.550159454345703, "global_step": 128632, "epoch": 3062} {"train_loss": -6.582271099090576, "global_step": 128633, "epoch": 3062} {"train_loss": -6.617244720458984, "global_step": 128634, "epoch": 3062} {"train_loss": -6.606698036193848, "global_step": 128635, "epoch": 3062} {"train_loss": -6.595432281494141, "global_step": 128636, "epoch": 3062} {"train_loss": -6.613637924194336, "global_step": 128637, "epoch": 3062} {"train_loss": -6.751286506652832, "global_step": 128638, "epoch": 3062} {"train_loss": -6.6633453369140625, "global_step": 128639, "epoch": 3062} {"train_loss": -6.694519996643066, "global_step": 128640, "epoch": 3062} {"train_loss": -6.704990386962891, "global_step": 128641, "epoch": 3062} {"train_loss": -6.633111000061035, "global_step": 128642, "epoch": 3062} {"train_loss": -6.577217102050781, "global_step": 128643, "epoch": 3062} {"train_loss": -6.657632827758789, "global_step": 128644, "epoch": 3062} {"train_loss": -6.656639610018049, "global_step": 128645, "epoch": 3062, "val_loss": 66358.15625} {"train_loss": -6.523073673248291, "global_step": 128646, "epoch": 3063} {"train_loss": -6.64930534362793, "global_step": 128647, "epoch": 3063} {"train_loss": -6.59790563583374, "global_step": 128648, "epoch": 3063} {"train_loss": -6.624303817749023, "global_step": 128649, "epoch": 3063} {"train_loss": -6.734621524810791, "global_step": 128650, "epoch": 3063} {"train_loss": -6.727903366088867, "global_step": 128651, "epoch": 3063} {"train_loss": -6.532198905944824, "global_step": 128652, "epoch": 3063} {"train_loss": -6.830167770385742, "global_step": 128653, "epoch": 3063} {"train_loss": -6.691134452819824, "global_step": 128654, "epoch": 3063} {"train_loss": -6.6574249267578125, "global_step": 128655, "epoch": 3063} {"train_loss": -6.65895938873291, "global_step": 128656, "epoch": 3063} {"train_loss": -6.634078025817871, "global_step": 128657, "epoch": 3063} {"train_loss": -6.715276718139648, "global_step": 128658, "epoch": 3063} {"train_loss": -6.5667877197265625, "global_step": 128659, "epoch": 3063} {"train_loss": -6.650155067443848, "global_step": 128660, "epoch": 3063} {"train_loss": -6.547973155975342, "global_step": 128661, "epoch": 3063} {"train_loss": -6.732688903808594, "global_step": 128662, "epoch": 3063} {"train_loss": -6.610852241516113, "global_step": 128663, "epoch": 3063} {"train_loss": -6.6761980056762695, "global_step": 128664, "epoch": 3063} {"train_loss": -6.713221549987793, "global_step": 128665, "epoch": 3063} {"train_loss": -6.710792541503906, "global_step": 128666, "epoch": 3063} {"train_loss": -6.666626930236816, "global_step": 128667, "epoch": 3063} {"train_loss": -6.631175994873047, "global_step": 128668, "epoch": 3063} {"train_loss": -6.584342002868652, "global_step": 128669, "epoch": 3063} {"train_loss": -6.740389823913574, "global_step": 128670, "epoch": 3063} {"train_loss": -6.564783096313477, "global_step": 128671, "epoch": 3063} {"train_loss": -6.6310133934021, "global_step": 128672, "epoch": 3063} {"train_loss": -6.687087059020996, "global_step": 128673, "epoch": 3063} {"train_loss": -6.580259799957275, "global_step": 128674, "epoch": 3063} {"train_loss": -6.64555549621582, "global_step": 128675, "epoch": 3063} {"train_loss": -6.681133270263672, "global_step": 128676, "epoch": 3063} {"train_loss": -6.700424671173096, "global_step": 128677, "epoch": 3063} {"train_loss": -6.737668037414551, "global_step": 128678, "epoch": 3063} {"train_loss": -6.682656288146973, "global_step": 128679, "epoch": 3063} {"train_loss": -6.677199840545654, "global_step": 128680, "epoch": 3063} {"train_loss": -6.646248817443848, "global_step": 128681, "epoch": 3063} {"train_loss": -6.608996868133545, "global_step": 128682, "epoch": 3063} {"train_loss": -6.65758752822876, "global_step": 128683, "epoch": 3063} {"train_loss": -6.534339904785156, "global_step": 128684, "epoch": 3063} {"train_loss": -6.708374977111816, "global_step": 128685, "epoch": 3063} {"train_loss": -6.540156841278076, "global_step": 128686, "epoch": 3063} {"train_loss": -6.652494453248524, "global_step": 128687, "epoch": 3063, "val_loss": 66551.6484375} {"train_loss": -6.58150577545166, "global_step": 128688, "epoch": 3064} {"train_loss": -6.552334308624268, "global_step": 128689, "epoch": 3064} {"train_loss": -6.657103538513184, "global_step": 128690, "epoch": 3064} {"train_loss": -6.605425834655762, "global_step": 128691, "epoch": 3064} {"train_loss": -6.565223693847656, "global_step": 128692, "epoch": 3064} {"train_loss": -6.540443420410156, "global_step": 128693, "epoch": 3064} {"train_loss": -6.664932727813721, "global_step": 128694, "epoch": 3064} {"train_loss": -6.583744049072266, "global_step": 128695, "epoch": 3064} {"train_loss": -6.621335029602051, "global_step": 128696, "epoch": 3064} {"train_loss": -6.610037326812744, "global_step": 128697, "epoch": 3064} {"train_loss": -6.606563091278076, "global_step": 128698, "epoch": 3064} {"train_loss": -6.514371395111084, "global_step": 128699, "epoch": 3064} {"train_loss": -6.59724235534668, "global_step": 128700, "epoch": 3064} {"train_loss": -6.658644199371338, "global_step": 128701, "epoch": 3064} {"train_loss": -6.471157550811768, "global_step": 128702, "epoch": 3064} {"train_loss": -6.549912452697754, "global_step": 128703, "epoch": 3064} {"train_loss": -6.613945960998535, "global_step": 128704, "epoch": 3064} {"train_loss": -6.62321662902832, "global_step": 128705, "epoch": 3064} {"train_loss": -6.666205406188965, "global_step": 128706, "epoch": 3064} {"train_loss": -6.506396293640137, "global_step": 128707, "epoch": 3064} {"train_loss": -6.698145866394043, "global_step": 128708, "epoch": 3064} {"train_loss": -6.5754852294921875, "global_step": 128709, "epoch": 3064} {"train_loss": -6.5415730476379395, "global_step": 128710, "epoch": 3064} {"train_loss": -6.730017185211182, "global_step": 128711, "epoch": 3064} {"train_loss": -6.598263740539551, "global_step": 128712, "epoch": 3064} {"train_loss": -6.703493118286133, "global_step": 128713, "epoch": 3064} {"train_loss": -6.727457046508789, "global_step": 128714, "epoch": 3064} {"train_loss": -6.66485595703125, "global_step": 128715, "epoch": 3064} {"train_loss": -6.737222194671631, "global_step": 128716, "epoch": 3064} {"train_loss": -6.6058855056762695, "global_step": 128717, "epoch": 3064} {"train_loss": -6.662716865539551, "global_step": 128718, "epoch": 3064} {"train_loss": -6.767354965209961, "global_step": 128719, "epoch": 3064} {"train_loss": -6.496813774108887, "global_step": 128720, "epoch": 3064} {"train_loss": -6.788096904754639, "global_step": 128721, "epoch": 3064} {"train_loss": -6.604706764221191, "global_step": 128722, "epoch": 3064} {"train_loss": -6.457784652709961, "global_step": 128723, "epoch": 3064} {"train_loss": -6.7095441818237305, "global_step": 128724, "epoch": 3064} {"train_loss": -6.433938980102539, "global_step": 128725, "epoch": 3064} {"train_loss": -6.62307071685791, "global_step": 128726, "epoch": 3064} {"train_loss": -6.697283744812012, "global_step": 128727, "epoch": 3064} {"train_loss": -6.526178359985352, "global_step": 128728, "epoch": 3064} {"train_loss": -6.613133793785458, "global_step": 128729, "epoch": 3064, "val_loss": 66543.4375} {"train_loss": -6.597236633300781, "global_step": 128730, "epoch": 3065} {"train_loss": -6.638894557952881, "global_step": 128731, "epoch": 3065} {"train_loss": -6.666045665740967, "global_step": 128732, "epoch": 3065} {"train_loss": -6.719386100769043, "global_step": 128733, "epoch": 3065} {"train_loss": -6.533125877380371, "global_step": 128734, "epoch": 3065} {"train_loss": -6.6004180908203125, "global_step": 128735, "epoch": 3065} {"train_loss": -6.617177963256836, "global_step": 128736, "epoch": 3065} {"train_loss": -6.555882930755615, "global_step": 128737, "epoch": 3065} {"train_loss": -6.535469055175781, "global_step": 128738, "epoch": 3065} {"train_loss": -6.550140857696533, "global_step": 128739, "epoch": 3065} {"train_loss": -6.563848495483398, "global_step": 128740, "epoch": 3065} {"train_loss": -6.578470230102539, "global_step": 128741, "epoch": 3065} {"train_loss": -6.591122627258301, "global_step": 128742, "epoch": 3065} {"train_loss": -6.582788467407227, "global_step": 128743, "epoch": 3065} {"train_loss": -6.7288818359375, "global_step": 128744, "epoch": 3065} {"train_loss": -6.6322126388549805, "global_step": 128745, "epoch": 3065} {"train_loss": -6.656890869140625, "global_step": 128746, "epoch": 3065} {"train_loss": -6.583189010620117, "global_step": 128747, "epoch": 3065} {"train_loss": -6.638655662536621, "global_step": 128748, "epoch": 3065} {"train_loss": -6.678805351257324, "global_step": 128749, "epoch": 3065} {"train_loss": -6.689089298248291, "global_step": 128750, "epoch": 3065} {"train_loss": -6.609086036682129, "global_step": 128751, "epoch": 3065} {"train_loss": -6.670832633972168, "global_step": 128752, "epoch": 3065} {"train_loss": -6.715689659118652, "global_step": 128753, "epoch": 3065} {"train_loss": -6.605844974517822, "global_step": 128754, "epoch": 3065} {"train_loss": -6.577574729919434, "global_step": 128755, "epoch": 3065} {"train_loss": -6.745034217834473, "global_step": 128756, "epoch": 3065} {"train_loss": -6.643450736999512, "global_step": 128757, "epoch": 3065} {"train_loss": -6.732353210449219, "global_step": 128758, "epoch": 3065} {"train_loss": -6.634060859680176, "global_step": 128759, "epoch": 3065} {"train_loss": -6.7593841552734375, "global_step": 128760, "epoch": 3065} {"train_loss": -6.548187255859375, "global_step": 128761, "epoch": 3065} {"train_loss": -6.681960105895996, "global_step": 128762, "epoch": 3065} {"train_loss": -6.740612983703613, "global_step": 128763, "epoch": 3065} {"train_loss": -6.646921157836914, "global_step": 128764, "epoch": 3065} {"train_loss": -6.711116790771484, "global_step": 128765, "epoch": 3065} {"train_loss": -6.739910125732422, "global_step": 128766, "epoch": 3065} {"train_loss": -6.648842811584473, "global_step": 128767, "epoch": 3065} {"train_loss": -6.575812339782715, "global_step": 128768, "epoch": 3065} {"train_loss": -6.595450401306152, "global_step": 128769, "epoch": 3065} {"train_loss": -6.549437522888184, "global_step": 128770, "epoch": 3065} {"train_loss": -6.635653064364479, "global_step": 128771, "epoch": 3065, "val_loss": 66481.7109375} {"train_loss": -6.461254119873047, "global_step": 128772, "epoch": 3066} {"train_loss": -6.7255659103393555, "global_step": 128773, "epoch": 3066} {"train_loss": -6.721517562866211, "global_step": 128774, "epoch": 3066} {"train_loss": -6.515026569366455, "global_step": 128775, "epoch": 3066} {"train_loss": -6.634453773498535, "global_step": 128776, "epoch": 3066} {"train_loss": -6.65290641784668, "global_step": 128777, "epoch": 3066} {"train_loss": -6.53233528137207, "global_step": 128778, "epoch": 3066} {"train_loss": -6.626343727111816, "global_step": 128779, "epoch": 3066} {"train_loss": -6.754993915557861, "global_step": 128780, "epoch": 3066} {"train_loss": -6.642453670501709, "global_step": 128781, "epoch": 3066} {"train_loss": -6.786025047302246, "global_step": 128782, "epoch": 3066} {"train_loss": -6.621115684509277, "global_step": 128783, "epoch": 3066} {"train_loss": -6.649174690246582, "global_step": 128784, "epoch": 3066} {"train_loss": -6.68046236038208, "global_step": 128785, "epoch": 3066} {"train_loss": -6.65206241607666, "global_step": 128786, "epoch": 3066} {"train_loss": -6.598947525024414, "global_step": 128787, "epoch": 3066} {"train_loss": -6.578108310699463, "global_step": 128788, "epoch": 3066} {"train_loss": -6.59332275390625, "global_step": 128789, "epoch": 3066} {"train_loss": -6.741238117218018, "global_step": 128790, "epoch": 3066} {"train_loss": -6.665156841278076, "global_step": 128791, "epoch": 3066} {"train_loss": -6.770987033843994, "global_step": 128792, "epoch": 3066} {"train_loss": -6.648866176605225, "global_step": 128793, "epoch": 3066} {"train_loss": -6.608506202697754, "global_step": 128794, "epoch": 3066} {"train_loss": -6.732064247131348, "global_step": 128795, "epoch": 3066} {"train_loss": -6.725569725036621, "global_step": 128796, "epoch": 3066} {"train_loss": -6.569836616516113, "global_step": 128797, "epoch": 3066} {"train_loss": -6.789316177368164, "global_step": 128798, "epoch": 3066} {"train_loss": -6.6000213623046875, "global_step": 128799, "epoch": 3066} {"train_loss": -6.709902763366699, "global_step": 128800, "epoch": 3066} {"train_loss": -6.64017391204834, "global_step": 128801, "epoch": 3066} {"train_loss": -6.52997350692749, "global_step": 128802, "epoch": 3066} {"train_loss": -6.692804336547852, "global_step": 128803, "epoch": 3066} {"train_loss": -6.512066841125488, "global_step": 128804, "epoch": 3066} {"train_loss": -6.653811454772949, "global_step": 128805, "epoch": 3066} {"train_loss": -6.61857795715332, "global_step": 128806, "epoch": 3066} {"train_loss": -6.729041576385498, "global_step": 128807, "epoch": 3066} {"train_loss": -6.591617584228516, "global_step": 128808, "epoch": 3066} {"train_loss": -6.716403961181641, "global_step": 128809, "epoch": 3066} {"train_loss": -6.597596168518066, "global_step": 128810, "epoch": 3066} {"train_loss": -6.632633686065674, "global_step": 128811, "epoch": 3066} {"train_loss": -6.67623233795166, "global_step": 128812, "epoch": 3066} {"train_loss": -6.647263356617519, "global_step": 128813, "epoch": 3066, "val_loss": 66316.6953125} {"train_loss": -6.689602851867676, "global_step": 128814, "epoch": 3067} {"train_loss": -6.707282543182373, "global_step": 128815, "epoch": 3067} {"train_loss": -6.719094276428223, "global_step": 128816, "epoch": 3067} {"train_loss": -6.718156814575195, "global_step": 128817, "epoch": 3067} {"train_loss": -6.671493053436279, "global_step": 128818, "epoch": 3067} {"train_loss": -6.572562217712402, "global_step": 128819, "epoch": 3067} {"train_loss": -6.642923355102539, "global_step": 128820, "epoch": 3067} {"train_loss": -6.5993218421936035, "global_step": 128821, "epoch": 3067} {"train_loss": -6.580437660217285, "global_step": 128822, "epoch": 3067} {"train_loss": -6.676766872406006, "global_step": 128823, "epoch": 3067} {"train_loss": -6.508412837982178, "global_step": 128824, "epoch": 3067} {"train_loss": -6.560384273529053, "global_step": 128825, "epoch": 3067} {"train_loss": -6.454039096832275, "global_step": 128826, "epoch": 3067} {"train_loss": -6.67056941986084, "global_step": 128827, "epoch": 3067} {"train_loss": -6.570349216461182, "global_step": 128828, "epoch": 3067} {"train_loss": -6.593067169189453, "global_step": 128829, "epoch": 3067} {"train_loss": -6.622292995452881, "global_step": 128830, "epoch": 3067} {"train_loss": -6.659127712249756, "global_step": 128831, "epoch": 3067} {"train_loss": -6.7593793869018555, "global_step": 128832, "epoch": 3067} {"train_loss": -6.605635643005371, "global_step": 128833, "epoch": 3067} {"train_loss": -6.566028118133545, "global_step": 128834, "epoch": 3067} {"train_loss": -6.697086334228516, "global_step": 128835, "epoch": 3067} {"train_loss": -6.491642951965332, "global_step": 128836, "epoch": 3067} {"train_loss": -6.599016189575195, "global_step": 128837, "epoch": 3067} {"train_loss": -6.614499092102051, "global_step": 128838, "epoch": 3067} {"train_loss": -6.681563377380371, "global_step": 128839, "epoch": 3067} {"train_loss": -6.647568702697754, "global_step": 128840, "epoch": 3067} {"train_loss": -6.507570743560791, "global_step": 128841, "epoch": 3067} {"train_loss": -6.617166519165039, "global_step": 128842, "epoch": 3067} {"train_loss": -6.5428619384765625, "global_step": 128843, "epoch": 3067} {"train_loss": -6.616367816925049, "global_step": 128844, "epoch": 3067} {"train_loss": -6.505428791046143, "global_step": 128845, "epoch": 3067} {"train_loss": -6.532800197601318, "global_step": 128846, "epoch": 3067} {"train_loss": -6.532439231872559, "global_step": 128847, "epoch": 3067} {"train_loss": -6.571685791015625, "global_step": 128848, "epoch": 3067} {"train_loss": -6.609718322753906, "global_step": 128849, "epoch": 3067} {"train_loss": -6.619107246398926, "global_step": 128850, "epoch": 3067} {"train_loss": -6.584645748138428, "global_step": 128851, "epoch": 3067} {"train_loss": -6.625214576721191, "global_step": 128852, "epoch": 3067} {"train_loss": -6.653382301330566, "global_step": 128853, "epoch": 3067} {"train_loss": -6.602238178253174, "global_step": 128854, "epoch": 3067} {"train_loss": -6.608097859791347, "global_step": 128855, "epoch": 3067, "val_loss": 66450.7109375} {"train_loss": -6.612290382385254, "global_step": 128856, "epoch": 3068} {"train_loss": -6.630815029144287, "global_step": 128857, "epoch": 3068} {"train_loss": -6.741613388061523, "global_step": 128858, "epoch": 3068} {"train_loss": -6.600797653198242, "global_step": 128859, "epoch": 3068} {"train_loss": -6.5902323722839355, "global_step": 128860, "epoch": 3068} {"train_loss": -6.753896713256836, "global_step": 128861, "epoch": 3068} {"train_loss": -6.75789213180542, "global_step": 128862, "epoch": 3068} {"train_loss": -6.569447040557861, "global_step": 128863, "epoch": 3068} {"train_loss": -6.656589031219482, "global_step": 128864, "epoch": 3068} {"train_loss": -6.771507263183594, "global_step": 128865, "epoch": 3068} {"train_loss": -6.6066789627075195, "global_step": 128866, "epoch": 3068} {"train_loss": -6.741972923278809, "global_step": 128867, "epoch": 3068} {"train_loss": -6.536309242248535, "global_step": 128868, "epoch": 3068} {"train_loss": -6.679004669189453, "global_step": 128869, "epoch": 3068} {"train_loss": -6.644050598144531, "global_step": 128870, "epoch": 3068} {"train_loss": -6.574131965637207, "global_step": 128871, "epoch": 3068} {"train_loss": -6.758337497711182, "global_step": 128872, "epoch": 3068} {"train_loss": -6.614263534545898, "global_step": 128873, "epoch": 3068} {"train_loss": -6.7018046379089355, "global_step": 128874, "epoch": 3068} {"train_loss": -6.662683963775635, "global_step": 128875, "epoch": 3068} {"train_loss": -6.646455764770508, "global_step": 128876, "epoch": 3068} {"train_loss": -6.670877456665039, "global_step": 128877, "epoch": 3068} {"train_loss": -6.62324857711792, "global_step": 128878, "epoch": 3068} {"train_loss": -6.577605247497559, "global_step": 128879, "epoch": 3068} {"train_loss": -6.622591495513916, "global_step": 128880, "epoch": 3068} {"train_loss": -6.689036846160889, "global_step": 128881, "epoch": 3068} {"train_loss": -6.704938888549805, "global_step": 128882, "epoch": 3068} {"train_loss": -6.562557220458984, "global_step": 128883, "epoch": 3068} {"train_loss": -6.712830543518066, "global_step": 128884, "epoch": 3068} {"train_loss": -6.6381683349609375, "global_step": 128885, "epoch": 3068} {"train_loss": -6.646615028381348, "global_step": 128886, "epoch": 3068} {"train_loss": -6.6785688400268555, "global_step": 128887, "epoch": 3068} {"train_loss": -6.710761070251465, "global_step": 128888, "epoch": 3068} {"train_loss": -6.709983825683594, "global_step": 128889, "epoch": 3068} {"train_loss": -6.6108293533325195, "global_step": 128890, "epoch": 3068} {"train_loss": -6.681365966796875, "global_step": 128891, "epoch": 3068} {"train_loss": -6.65968132019043, "global_step": 128892, "epoch": 3068} {"train_loss": -6.707230567932129, "global_step": 128893, "epoch": 3068} {"train_loss": -6.710506439208984, "global_step": 128894, "epoch": 3068} {"train_loss": -6.705498695373535, "global_step": 128895, "epoch": 3068} {"train_loss": -6.677063941955566, "global_step": 128896, "epoch": 3068} {"train_loss": -6.66060251281375, "global_step": 128897, "epoch": 3068, "val_loss": 66491.0546875} {"train_loss": -6.622513294219971, "global_step": 128898, "epoch": 3069} {"train_loss": -6.667598724365234, "global_step": 128899, "epoch": 3069} {"train_loss": -6.643218994140625, "global_step": 128900, "epoch": 3069} {"train_loss": -6.565847396850586, "global_step": 128901, "epoch": 3069} {"train_loss": -6.647517204284668, "global_step": 128902, "epoch": 3069} {"train_loss": -6.751803398132324, "global_step": 128903, "epoch": 3069} {"train_loss": -6.649363994598389, "global_step": 128904, "epoch": 3069} {"train_loss": -6.523462295532227, "global_step": 128905, "epoch": 3069} {"train_loss": -6.681026458740234, "global_step": 128906, "epoch": 3069} {"train_loss": -6.65964412689209, "global_step": 128907, "epoch": 3069} {"train_loss": -6.672669887542725, "global_step": 128908, "epoch": 3069} {"train_loss": -6.684865474700928, "global_step": 128909, "epoch": 3069} {"train_loss": -6.564589977264404, "global_step": 128910, "epoch": 3069} {"train_loss": -6.6637115478515625, "global_step": 128911, "epoch": 3069} {"train_loss": -6.609943389892578, "global_step": 128912, "epoch": 3069} {"train_loss": -6.535460948944092, "global_step": 128913, "epoch": 3069} {"train_loss": -6.591242790222168, "global_step": 128914, "epoch": 3069} {"train_loss": -6.636518955230713, "global_step": 128915, "epoch": 3069} {"train_loss": -6.766417503356934, "global_step": 128916, "epoch": 3069} {"train_loss": -6.629989147186279, "global_step": 128917, "epoch": 3069} {"train_loss": -6.544291019439697, "global_step": 128918, "epoch": 3069} {"train_loss": -6.714193820953369, "global_step": 128919, "epoch": 3069} {"train_loss": -6.580689430236816, "global_step": 128920, "epoch": 3069} {"train_loss": -6.715334892272949, "global_step": 128921, "epoch": 3069} {"train_loss": -6.621088981628418, "global_step": 128922, "epoch": 3069} {"train_loss": -6.698302268981934, "global_step": 128923, "epoch": 3069} {"train_loss": -6.656759262084961, "global_step": 128924, "epoch": 3069} {"train_loss": -6.6221184730529785, "global_step": 128925, "epoch": 3069} {"train_loss": -6.619765758514404, "global_step": 128926, "epoch": 3069} {"train_loss": -6.553954124450684, "global_step": 128927, "epoch": 3069} {"train_loss": -6.647109031677246, "global_step": 128928, "epoch": 3069} {"train_loss": -6.6180033683776855, "global_step": 128929, "epoch": 3069} {"train_loss": -6.649023532867432, "global_step": 128930, "epoch": 3069} {"train_loss": -6.567203998565674, "global_step": 128931, "epoch": 3069} {"train_loss": -6.744345664978027, "global_step": 128932, "epoch": 3069} {"train_loss": -6.558463096618652, "global_step": 128933, "epoch": 3069} {"train_loss": -6.639537334442139, "global_step": 128934, "epoch": 3069} {"train_loss": -6.730647087097168, "global_step": 128935, "epoch": 3069} {"train_loss": -6.593236923217773, "global_step": 128936, "epoch": 3069} {"train_loss": -6.679207801818848, "global_step": 128937, "epoch": 3069} {"train_loss": -6.661037445068359, "global_step": 128938, "epoch": 3069} {"train_loss": -6.637280884243193, "global_step": 128939, "epoch": 3069, "val_loss": 66405.8984375} {"train_loss": -6.663461685180664, "global_step": 128940, "epoch": 3070} {"train_loss": -6.6472697257995605, "global_step": 128941, "epoch": 3070} {"train_loss": -6.710087299346924, "global_step": 128942, "epoch": 3070} {"train_loss": -6.571619987487793, "global_step": 128943, "epoch": 3070} {"train_loss": -6.686964511871338, "global_step": 128944, "epoch": 3070} {"train_loss": -6.6396484375, "global_step": 128945, "epoch": 3070} {"train_loss": -6.633715629577637, "global_step": 128946, "epoch": 3070} {"train_loss": -6.685454368591309, "global_step": 128947, "epoch": 3070} {"train_loss": -6.7042951583862305, "global_step": 128948, "epoch": 3070} {"train_loss": -6.730915546417236, "global_step": 128949, "epoch": 3070} {"train_loss": -6.6725754737854, "global_step": 128950, "epoch": 3070} {"train_loss": -6.743882656097412, "global_step": 128951, "epoch": 3070} {"train_loss": -6.667156219482422, "global_step": 128952, "epoch": 3070} {"train_loss": -6.668384552001953, "global_step": 128953, "epoch": 3070} {"train_loss": -6.685932159423828, "global_step": 128954, "epoch": 3070} {"train_loss": -6.523748874664307, "global_step": 128955, "epoch": 3070} {"train_loss": -6.653482913970947, "global_step": 128956, "epoch": 3070} {"train_loss": -6.638913154602051, "global_step": 128957, "epoch": 3070} {"train_loss": -6.619187355041504, "global_step": 128958, "epoch": 3070} {"train_loss": -6.725588798522949, "global_step": 128959, "epoch": 3070} {"train_loss": -6.738805294036865, "global_step": 128960, "epoch": 3070} {"train_loss": -6.710916519165039, "global_step": 128961, "epoch": 3070} {"train_loss": -6.74098539352417, "global_step": 128962, "epoch": 3070} {"train_loss": -6.654005527496338, "global_step": 128963, "epoch": 3070} {"train_loss": -6.8006696701049805, "global_step": 128964, "epoch": 3070} {"train_loss": -6.715607643127441, "global_step": 128965, "epoch": 3070} {"train_loss": -6.570945739746094, "global_step": 128966, "epoch": 3070} {"train_loss": -6.65125846862793, "global_step": 128967, "epoch": 3070} {"train_loss": -6.733687877655029, "global_step": 128968, "epoch": 3070} {"train_loss": -6.706605911254883, "global_step": 128969, "epoch": 3070} {"train_loss": -6.752974510192871, "global_step": 128970, "epoch": 3070} {"train_loss": -6.615184783935547, "global_step": 128971, "epoch": 3070} {"train_loss": -6.753177642822266, "global_step": 128972, "epoch": 3070} {"train_loss": -6.785714149475098, "global_step": 128973, "epoch": 3070} {"train_loss": -6.714264392852783, "global_step": 128974, "epoch": 3070} {"train_loss": -6.689797401428223, "global_step": 128975, "epoch": 3070} {"train_loss": -6.670190334320068, "global_step": 128976, "epoch": 3070} {"train_loss": -6.55471134185791, "global_step": 128977, "epoch": 3070} {"train_loss": -6.632126808166504, "global_step": 128978, "epoch": 3070} {"train_loss": -6.519444465637207, "global_step": 128979, "epoch": 3070} {"train_loss": -6.61240291595459, "global_step": 128980, "epoch": 3070} {"train_loss": -6.6729573749360585, "global_step": 128981, "epoch": 3070, "val_loss": 66858.375} {"train_loss": -6.635437488555908, "global_step": 128982, "epoch": 3071} {"train_loss": -6.737393856048584, "global_step": 128983, "epoch": 3071} {"train_loss": -6.550899028778076, "global_step": 128984, "epoch": 3071} {"train_loss": -6.67520809173584, "global_step": 128985, "epoch": 3071} {"train_loss": -6.599468231201172, "global_step": 128986, "epoch": 3071} {"train_loss": -6.804546356201172, "global_step": 128987, "epoch": 3071} {"train_loss": -6.645559787750244, "global_step": 128988, "epoch": 3071} {"train_loss": -6.661539077758789, "global_step": 128989, "epoch": 3071} {"train_loss": -6.709690093994141, "global_step": 128990, "epoch": 3071} {"train_loss": -6.642765045166016, "global_step": 128991, "epoch": 3071} {"train_loss": -6.598868370056152, "global_step": 128992, "epoch": 3071} {"train_loss": -6.670530796051025, "global_step": 128993, "epoch": 3071} {"train_loss": -6.663469314575195, "global_step": 128994, "epoch": 3071} {"train_loss": -6.5770978927612305, "global_step": 128995, "epoch": 3071} {"train_loss": -6.637833118438721, "global_step": 128996, "epoch": 3071} {"train_loss": -6.603130340576172, "global_step": 128997, "epoch": 3071} {"train_loss": -6.6410746574401855, "global_step": 128998, "epoch": 3071} {"train_loss": -6.549726963043213, "global_step": 128999, "epoch": 3071} {"train_loss": -6.58326530456543, "global_step": 129000, "epoch": 3071} {"train_loss": -6.630796909332275, "global_step": 129001, "epoch": 3071} {"train_loss": -6.668551445007324, "global_step": 129002, "epoch": 3071} {"train_loss": -6.5622758865356445, "global_step": 129003, "epoch": 3071} {"train_loss": -6.656742095947266, "global_step": 129004, "epoch": 3071} {"train_loss": -6.610710144042969, "global_step": 129005, "epoch": 3071} {"train_loss": -6.589437484741211, "global_step": 129006, "epoch": 3071} {"train_loss": -6.618729591369629, "global_step": 129007, "epoch": 3071} {"train_loss": -6.513260841369629, "global_step": 129008, "epoch": 3071} {"train_loss": -6.648538589477539, "global_step": 129009, "epoch": 3071} {"train_loss": -6.770744323730469, "global_step": 129010, "epoch": 3071} {"train_loss": -6.628223896026611, "global_step": 129011, "epoch": 3071} {"train_loss": -6.594058036804199, "global_step": 129012, "epoch": 3071} {"train_loss": -6.702606201171875, "global_step": 129013, "epoch": 3071} {"train_loss": -6.653623580932617, "global_step": 129014, "epoch": 3071} {"train_loss": -6.658245086669922, "global_step": 129015, "epoch": 3071} {"train_loss": -6.675950050354004, "global_step": 129016, "epoch": 3071} {"train_loss": -6.5835466384887695, "global_step": 129017, "epoch": 3071} {"train_loss": -6.695805549621582, "global_step": 129018, "epoch": 3071} {"train_loss": -6.5818586349487305, "global_step": 129019, "epoch": 3071} {"train_loss": -6.6604413986206055, "global_step": 129020, "epoch": 3071} {"train_loss": -6.630066871643066, "global_step": 129021, "epoch": 3071} {"train_loss": -6.585531711578369, "global_step": 129022, "epoch": 3071} {"train_loss": -6.636307443891253, "global_step": 129023, "epoch": 3071, "val_loss": 66162.6640625} {"train_loss": -6.642576694488525, "global_step": 129024, "epoch": 3072} {"train_loss": -6.51777982711792, "global_step": 129025, "epoch": 3072} {"train_loss": -6.571627616882324, "global_step": 129026, "epoch": 3072} {"train_loss": -6.593595504760742, "global_step": 129027, "epoch": 3072} {"train_loss": -6.551206111907959, "global_step": 129028, "epoch": 3072} {"train_loss": -6.6663618087768555, "global_step": 129029, "epoch": 3072} {"train_loss": -6.637424468994141, "global_step": 129030, "epoch": 3072} {"train_loss": -6.647267818450928, "global_step": 129031, "epoch": 3072} {"train_loss": -6.694442272186279, "global_step": 129032, "epoch": 3072} {"train_loss": -6.631731033325195, "global_step": 129033, "epoch": 3072} {"train_loss": -6.7414655685424805, "global_step": 129034, "epoch": 3072} {"train_loss": -6.700405597686768, "global_step": 129035, "epoch": 3072} {"train_loss": -6.843073844909668, "global_step": 129036, "epoch": 3072} {"train_loss": -6.579951763153076, "global_step": 129037, "epoch": 3072} {"train_loss": -6.647825241088867, "global_step": 129038, "epoch": 3072} {"train_loss": -6.648141384124756, "global_step": 129039, "epoch": 3072} {"train_loss": -6.727109432220459, "global_step": 129040, "epoch": 3072} {"train_loss": -6.645078659057617, "global_step": 129041, "epoch": 3072} {"train_loss": -6.60659646987915, "global_step": 129042, "epoch": 3072} {"train_loss": -6.738703727722168, "global_step": 129043, "epoch": 3072} {"train_loss": -6.5564985275268555, "global_step": 129044, "epoch": 3072} {"train_loss": -6.6724066734313965, "global_step": 129045, "epoch": 3072} {"train_loss": -6.733047962188721, "global_step": 129046, "epoch": 3072} {"train_loss": -6.480047702789307, "global_step": 129047, "epoch": 3072} {"train_loss": -6.814633369445801, "global_step": 129048, "epoch": 3072} {"train_loss": -6.652066230773926, "global_step": 129049, "epoch": 3072} {"train_loss": -6.623679161071777, "global_step": 129050, "epoch": 3072} {"train_loss": -6.718108177185059, "global_step": 129051, "epoch": 3072} {"train_loss": -6.695259094238281, "global_step": 129052, "epoch": 3072} {"train_loss": -6.693784236907959, "global_step": 129053, "epoch": 3072} {"train_loss": -6.754166603088379, "global_step": 129054, "epoch": 3072} {"train_loss": -6.777866363525391, "global_step": 129055, "epoch": 3072} {"train_loss": -6.667160987854004, "global_step": 129056, "epoch": 3072} {"train_loss": -6.653183460235596, "global_step": 129057, "epoch": 3072} {"train_loss": -6.603385925292969, "global_step": 129058, "epoch": 3072} {"train_loss": -6.720731735229492, "global_step": 129059, "epoch": 3072} {"train_loss": -6.510505676269531, "global_step": 129060, "epoch": 3072} {"train_loss": -6.636202335357666, "global_step": 129061, "epoch": 3072} {"train_loss": -6.617502689361572, "global_step": 129062, "epoch": 3072} {"train_loss": -6.664497375488281, "global_step": 129063, "epoch": 3072} {"train_loss": -6.612910747528076, "global_step": 129064, "epoch": 3072} {"train_loss": -6.654116698673794, "global_step": 129065, "epoch": 3072, "val_loss": 66592.6953125} {"train_loss": -6.58351993560791, "global_step": 129066, "epoch": 3073} {"train_loss": -6.565115928649902, "global_step": 129067, "epoch": 3073} {"train_loss": -6.681332111358643, "global_step": 129068, "epoch": 3073} {"train_loss": -6.61203670501709, "global_step": 129069, "epoch": 3073} {"train_loss": -6.724461078643799, "global_step": 129070, "epoch": 3073} {"train_loss": -6.63067626953125, "global_step": 129071, "epoch": 3073} {"train_loss": -6.724952697753906, "global_step": 129072, "epoch": 3073} {"train_loss": -6.554035186767578, "global_step": 129073, "epoch": 3073} {"train_loss": -6.670890808105469, "global_step": 129074, "epoch": 3073} {"train_loss": -6.7214460372924805, "global_step": 129075, "epoch": 3073} {"train_loss": -6.76143741607666, "global_step": 129076, "epoch": 3073} {"train_loss": -6.721625328063965, "global_step": 129077, "epoch": 3073} {"train_loss": -6.779856204986572, "global_step": 129078, "epoch": 3073} {"train_loss": -6.659999847412109, "global_step": 129079, "epoch": 3073} {"train_loss": -6.597551345825195, "global_step": 129080, "epoch": 3073} {"train_loss": -6.658614635467529, "global_step": 129081, "epoch": 3073} {"train_loss": -6.488928318023682, "global_step": 129082, "epoch": 3073} {"train_loss": -6.385246276855469, "global_step": 129083, "epoch": 3073} {"train_loss": -6.608272552490234, "global_step": 129084, "epoch": 3073} {"train_loss": -6.609127998352051, "global_step": 129085, "epoch": 3073} {"train_loss": -6.521542549133301, "global_step": 129086, "epoch": 3073} {"train_loss": -6.541808128356934, "global_step": 129087, "epoch": 3073} {"train_loss": -6.5435686111450195, "global_step": 129088, "epoch": 3073} {"train_loss": -6.648530006408691, "global_step": 129089, "epoch": 3073} {"train_loss": -6.634265899658203, "global_step": 129090, "epoch": 3073} {"train_loss": -6.668824195861816, "global_step": 129091, "epoch": 3073} {"train_loss": -6.670178413391113, "global_step": 129092, "epoch": 3073} {"train_loss": -6.588173866271973, "global_step": 129093, "epoch": 3073} {"train_loss": -6.5321149826049805, "global_step": 129094, "epoch": 3073} {"train_loss": -6.670910835266113, "global_step": 129095, "epoch": 3073} {"train_loss": -6.704209804534912, "global_step": 129096, "epoch": 3073} {"train_loss": -6.609883785247803, "global_step": 129097, "epoch": 3073} {"train_loss": -6.593762397766113, "global_step": 129098, "epoch": 3073} {"train_loss": -6.685300350189209, "global_step": 129099, "epoch": 3073} {"train_loss": -6.6272430419921875, "global_step": 129100, "epoch": 3073} {"train_loss": -6.664003372192383, "global_step": 129101, "epoch": 3073} {"train_loss": -6.61414909362793, "global_step": 129102, "epoch": 3073} {"train_loss": -6.570127487182617, "global_step": 129103, "epoch": 3073} {"train_loss": -6.703507900238037, "global_step": 129104, "epoch": 3073} {"train_loss": -6.77772331237793, "global_step": 129105, "epoch": 3073} {"train_loss": -6.624929428100586, "global_step": 129106, "epoch": 3073} {"train_loss": -6.634321405774071, "global_step": 129107, "epoch": 3073, "val_loss": 66458.484375} {"train_loss": -6.693389415740967, "global_step": 129108, "epoch": 3074} {"train_loss": -6.731560707092285, "global_step": 129109, "epoch": 3074} {"train_loss": -6.596269607543945, "global_step": 129110, "epoch": 3074} {"train_loss": -6.634082317352295, "global_step": 129111, "epoch": 3074} {"train_loss": -6.730823516845703, "global_step": 129112, "epoch": 3074} {"train_loss": -6.652952194213867, "global_step": 129113, "epoch": 3074} {"train_loss": -6.727594375610352, "global_step": 129114, "epoch": 3074} {"train_loss": -6.6683669090271, "global_step": 129115, "epoch": 3074} {"train_loss": -6.662969589233398, "global_step": 129116, "epoch": 3074} {"train_loss": -6.684901237487793, "global_step": 129117, "epoch": 3074} {"train_loss": -6.653251647949219, "global_step": 129118, "epoch": 3074} {"train_loss": -6.668405532836914, "global_step": 129119, "epoch": 3074} {"train_loss": -6.6682963371276855, "global_step": 129120, "epoch": 3074} {"train_loss": -6.564298152923584, "global_step": 129121, "epoch": 3074} {"train_loss": -6.71955680847168, "global_step": 129122, "epoch": 3074} {"train_loss": -6.720428466796875, "global_step": 129123, "epoch": 3074} {"train_loss": -6.629042625427246, "global_step": 129124, "epoch": 3074} {"train_loss": -6.743324279785156, "global_step": 129125, "epoch": 3074} {"train_loss": -6.641462802886963, "global_step": 129126, "epoch": 3074} {"train_loss": -6.670727729797363, "global_step": 129127, "epoch": 3074} {"train_loss": -6.7517805099487305, "global_step": 129128, "epoch": 3074} {"train_loss": -6.579859256744385, "global_step": 129129, "epoch": 3074} {"train_loss": -6.643184661865234, "global_step": 129130, "epoch": 3074} {"train_loss": -6.723492622375488, "global_step": 129131, "epoch": 3074} {"train_loss": -6.675193786621094, "global_step": 129132, "epoch": 3074} {"train_loss": -6.734272003173828, "global_step": 129133, "epoch": 3074} {"train_loss": -6.646678924560547, "global_step": 129134, "epoch": 3074} {"train_loss": -6.678729057312012, "global_step": 129135, "epoch": 3074} {"train_loss": -6.709514617919922, "global_step": 129136, "epoch": 3074} {"train_loss": -6.584394454956055, "global_step": 129137, "epoch": 3074} {"train_loss": -6.668177127838135, "global_step": 129138, "epoch": 3074} {"train_loss": -6.682656288146973, "global_step": 129139, "epoch": 3074} {"train_loss": -6.639547824859619, "global_step": 129140, "epoch": 3074} {"train_loss": -6.7270708084106445, "global_step": 129141, "epoch": 3074} {"train_loss": -6.619690418243408, "global_step": 129142, "epoch": 3074} {"train_loss": -6.6631245613098145, "global_step": 129143, "epoch": 3074} {"train_loss": -6.678020477294922, "global_step": 129144, "epoch": 3074} {"train_loss": -6.684116840362549, "global_step": 129145, "epoch": 3074} {"train_loss": -6.709367752075195, "global_step": 129146, "epoch": 3074} {"train_loss": -6.616889953613281, "global_step": 129147, "epoch": 3074} {"train_loss": -6.576591491699219, "global_step": 129148, "epoch": 3074} {"train_loss": -6.665062824885051, "global_step": 129149, "epoch": 3074, "val_loss": 66649.671875} {"train_loss": -6.573000431060791, "global_step": 129150, "epoch": 3075} {"train_loss": -6.604747772216797, "global_step": 129151, "epoch": 3075} {"train_loss": -6.504209518432617, "global_step": 129152, "epoch": 3075} {"train_loss": -6.5885162353515625, "global_step": 129153, "epoch": 3075} {"train_loss": -6.624016761779785, "global_step": 129154, "epoch": 3075} {"train_loss": -6.602789878845215, "global_step": 129155, "epoch": 3075} {"train_loss": -6.623220920562744, "global_step": 129156, "epoch": 3075} {"train_loss": -6.618378162384033, "global_step": 129157, "epoch": 3075} {"train_loss": -6.612529754638672, "global_step": 129158, "epoch": 3075} {"train_loss": -6.680560111999512, "global_step": 129159, "epoch": 3075} {"train_loss": -6.714530944824219, "global_step": 129160, "epoch": 3075} {"train_loss": -6.713171482086182, "global_step": 129161, "epoch": 3075} {"train_loss": -6.681760787963867, "global_step": 129162, "epoch": 3075} {"train_loss": -6.6246795654296875, "global_step": 129163, "epoch": 3075} {"train_loss": -6.6960530281066895, "global_step": 129164, "epoch": 3075} {"train_loss": -6.673025131225586, "global_step": 129165, "epoch": 3075} {"train_loss": -6.626889228820801, "global_step": 129166, "epoch": 3075} {"train_loss": -6.787289619445801, "global_step": 129167, "epoch": 3075} {"train_loss": -6.720029830932617, "global_step": 129168, "epoch": 3075} {"train_loss": -6.685340881347656, "global_step": 129169, "epoch": 3075} {"train_loss": -6.623571395874023, "global_step": 129170, "epoch": 3075} {"train_loss": -6.691758155822754, "global_step": 129171, "epoch": 3075} {"train_loss": -6.657135009765625, "global_step": 129172, "epoch": 3075} {"train_loss": -6.752158164978027, "global_step": 129173, "epoch": 3075} {"train_loss": -6.7423505783081055, "global_step": 129174, "epoch": 3075} {"train_loss": -6.661581516265869, "global_step": 129175, "epoch": 3075} {"train_loss": -6.723659515380859, "global_step": 129176, "epoch": 3075} {"train_loss": -6.678365230560303, "global_step": 129177, "epoch": 3075} {"train_loss": -6.697892189025879, "global_step": 129178, "epoch": 3075} {"train_loss": -6.698927879333496, "global_step": 129179, "epoch": 3075} {"train_loss": -6.620113372802734, "global_step": 129180, "epoch": 3075} {"train_loss": -6.717226505279541, "global_step": 129181, "epoch": 3075} {"train_loss": -6.691081523895264, "global_step": 129182, "epoch": 3075} {"train_loss": -6.5872650146484375, "global_step": 129183, "epoch": 3075} {"train_loss": -6.641062259674072, "global_step": 129184, "epoch": 3075} {"train_loss": -6.59023380279541, "global_step": 129185, "epoch": 3075} {"train_loss": -6.641351699829102, "global_step": 129186, "epoch": 3075} {"train_loss": -6.6608686447143555, "global_step": 129187, "epoch": 3075} {"train_loss": -6.745512962341309, "global_step": 129188, "epoch": 3075} {"train_loss": -6.575239658355713, "global_step": 129189, "epoch": 3075} {"train_loss": -6.674792289733887, "global_step": 129190, "epoch": 3075} {"train_loss": -6.660022020339966, "global_step": 129191, "epoch": 3075, "val_loss": 66354.859375} {"train_loss": -6.620050430297852, "global_step": 129192, "epoch": 3076} {"train_loss": -6.649698257446289, "global_step": 129193, "epoch": 3076} {"train_loss": -6.690532684326172, "global_step": 129194, "epoch": 3076} {"train_loss": -6.567210674285889, "global_step": 129195, "epoch": 3076} {"train_loss": -6.587005138397217, "global_step": 129196, "epoch": 3076} {"train_loss": -6.743521690368652, "global_step": 129197, "epoch": 3076} {"train_loss": -6.688632011413574, "global_step": 129198, "epoch": 3076} {"train_loss": -6.463891506195068, "global_step": 129199, "epoch": 3076} {"train_loss": -6.705652236938477, "global_step": 129200, "epoch": 3076} {"train_loss": -6.779951095581055, "global_step": 129201, "epoch": 3076} {"train_loss": -6.649957656860352, "global_step": 129202, "epoch": 3076} {"train_loss": -6.648399353027344, "global_step": 129203, "epoch": 3076} {"train_loss": -6.758731365203857, "global_step": 129204, "epoch": 3076} {"train_loss": -6.510175704956055, "global_step": 129205, "epoch": 3076} {"train_loss": -6.606069564819336, "global_step": 129206, "epoch": 3076} {"train_loss": -6.641810417175293, "global_step": 129207, "epoch": 3076} {"train_loss": -6.628353118896484, "global_step": 129208, "epoch": 3076} {"train_loss": -6.619207859039307, "global_step": 129209, "epoch": 3076} {"train_loss": -6.62717342376709, "global_step": 129210, "epoch": 3076} {"train_loss": -6.486494064331055, "global_step": 129211, "epoch": 3076} {"train_loss": -6.634981155395508, "global_step": 129212, "epoch": 3076} {"train_loss": -6.635910987854004, "global_step": 129213, "epoch": 3076} {"train_loss": -6.579013824462891, "global_step": 129214, "epoch": 3076} {"train_loss": -6.703380107879639, "global_step": 129215, "epoch": 3076} {"train_loss": -6.694554328918457, "global_step": 129216, "epoch": 3076} {"train_loss": -6.747903823852539, "global_step": 129217, "epoch": 3076} {"train_loss": -6.634963035583496, "global_step": 129218, "epoch": 3076} {"train_loss": -6.700321674346924, "global_step": 129219, "epoch": 3076} {"train_loss": -6.493298530578613, "global_step": 129220, "epoch": 3076} {"train_loss": -6.553088188171387, "global_step": 129221, "epoch": 3076} {"train_loss": -6.599690914154053, "global_step": 129222, "epoch": 3076} {"train_loss": -6.5459065437316895, "global_step": 129223, "epoch": 3076} {"train_loss": -6.675505638122559, "global_step": 129224, "epoch": 3076} {"train_loss": -6.567739486694336, "global_step": 129225, "epoch": 3076} {"train_loss": -6.512607574462891, "global_step": 129226, "epoch": 3076} {"train_loss": -6.714171886444092, "global_step": 129227, "epoch": 3076} {"train_loss": -6.411264419555664, "global_step": 129228, "epoch": 3076} {"train_loss": -6.689495086669922, "global_step": 129229, "epoch": 3076} {"train_loss": -6.625249862670898, "global_step": 129230, "epoch": 3076} {"train_loss": -6.570313453674316, "global_step": 129231, "epoch": 3076} {"train_loss": -6.671670913696289, "global_step": 129232, "epoch": 3076} {"train_loss": -6.624584334237235, "global_step": 129233, "epoch": 3076, "val_loss": 66345.828125} {"train_loss": -6.771629333496094, "global_step": 129234, "epoch": 3077} {"train_loss": -6.6785783767700195, "global_step": 129235, "epoch": 3077} {"train_loss": -6.597517967224121, "global_step": 129236, "epoch": 3077} {"train_loss": -6.604658603668213, "global_step": 129237, "epoch": 3077} {"train_loss": -6.6594414710998535, "global_step": 129238, "epoch": 3077} {"train_loss": -6.640496253967285, "global_step": 129239, "epoch": 3077} {"train_loss": -6.785720348358154, "global_step": 129240, "epoch": 3077} {"train_loss": -6.684401035308838, "global_step": 129241, "epoch": 3077} {"train_loss": -6.697723865509033, "global_step": 129242, "epoch": 3077} {"train_loss": -6.568965435028076, "global_step": 129243, "epoch": 3077} {"train_loss": -6.755488395690918, "global_step": 129244, "epoch": 3077} {"train_loss": -6.516702651977539, "global_step": 129245, "epoch": 3077} {"train_loss": -6.752995491027832, "global_step": 129246, "epoch": 3077} {"train_loss": -6.671795845031738, "global_step": 129247, "epoch": 3077} {"train_loss": -6.597780227661133, "global_step": 129248, "epoch": 3077} {"train_loss": -6.70683479309082, "global_step": 129249, "epoch": 3077} {"train_loss": -6.631075859069824, "global_step": 129250, "epoch": 3077} {"train_loss": -6.6459269523620605, "global_step": 129251, "epoch": 3077} {"train_loss": -6.550093173980713, "global_step": 129252, "epoch": 3077} {"train_loss": -6.662178039550781, "global_step": 129253, "epoch": 3077} {"train_loss": -6.623383522033691, "global_step": 129254, "epoch": 3077} {"train_loss": -6.569797992706299, "global_step": 129255, "epoch": 3077} {"train_loss": -6.661523818969727, "global_step": 129256, "epoch": 3077} {"train_loss": -6.661527156829834, "global_step": 129257, "epoch": 3077} {"train_loss": -6.654864311218262, "global_step": 129258, "epoch": 3077} {"train_loss": -6.671016693115234, "global_step": 129259, "epoch": 3077} {"train_loss": -6.727653503417969, "global_step": 129260, "epoch": 3077} {"train_loss": -6.611172199249268, "global_step": 129261, "epoch": 3077} {"train_loss": -6.879912853240967, "global_step": 129262, "epoch": 3077} {"train_loss": -6.72489070892334, "global_step": 129263, "epoch": 3077} {"train_loss": -6.594184398651123, "global_step": 129264, "epoch": 3077} {"train_loss": -6.556229591369629, "global_step": 129265, "epoch": 3077} {"train_loss": -6.524763107299805, "global_step": 129266, "epoch": 3077} {"train_loss": -6.745875835418701, "global_step": 129267, "epoch": 3077} {"train_loss": -6.561503887176514, "global_step": 129268, "epoch": 3077} {"train_loss": -6.627903938293457, "global_step": 129269, "epoch": 3077} {"train_loss": -6.638711452484131, "global_step": 129270, "epoch": 3077} {"train_loss": -6.566964149475098, "global_step": 129271, "epoch": 3077} {"train_loss": -6.509134292602539, "global_step": 129272, "epoch": 3077} {"train_loss": -6.735213279724121, "global_step": 129273, "epoch": 3077} {"train_loss": -6.618244647979736, "global_step": 129274, "epoch": 3077} {"train_loss": -6.650147948946271, "global_step": 129275, "epoch": 3077, "val_loss": 66484.4140625} {"train_loss": -6.471134185791016, "global_step": 129276, "epoch": 3078} {"train_loss": -6.596656322479248, "global_step": 129277, "epoch": 3078} {"train_loss": -6.737521171569824, "global_step": 129278, "epoch": 3078} {"train_loss": -6.6839399337768555, "global_step": 129279, "epoch": 3078} {"train_loss": -6.530149459838867, "global_step": 129280, "epoch": 3078} {"train_loss": -6.664450645446777, "global_step": 129281, "epoch": 3078} {"train_loss": -6.739868640899658, "global_step": 129282, "epoch": 3078} {"train_loss": -6.687445640563965, "global_step": 129283, "epoch": 3078} {"train_loss": -6.662018299102783, "global_step": 129284, "epoch": 3078} {"train_loss": -6.566795349121094, "global_step": 129285, "epoch": 3078} {"train_loss": -6.718289375305176, "global_step": 129286, "epoch": 3078} {"train_loss": -6.597527503967285, "global_step": 129287, "epoch": 3078} {"train_loss": -6.717470645904541, "global_step": 129288, "epoch": 3078} {"train_loss": -6.667058944702148, "global_step": 129289, "epoch": 3078} {"train_loss": -6.8028106689453125, "global_step": 129290, "epoch": 3078} {"train_loss": -6.695697784423828, "global_step": 129291, "epoch": 3078} {"train_loss": -6.689115047454834, "global_step": 129292, "epoch": 3078} {"train_loss": -6.716385841369629, "global_step": 129293, "epoch": 3078} {"train_loss": -6.5947980880737305, "global_step": 129294, "epoch": 3078} {"train_loss": -6.676769256591797, "global_step": 129295, "epoch": 3078} {"train_loss": -6.7256083488464355, "global_step": 129296, "epoch": 3078} {"train_loss": -6.620439529418945, "global_step": 129297, "epoch": 3078} {"train_loss": -6.808693885803223, "global_step": 129298, "epoch": 3078} {"train_loss": -6.655172824859619, "global_step": 129299, "epoch": 3078} {"train_loss": -6.656529426574707, "global_step": 129300, "epoch": 3078} {"train_loss": -6.7082085609436035, "global_step": 129301, "epoch": 3078} {"train_loss": -6.744557857513428, "global_step": 129302, "epoch": 3078} {"train_loss": -6.706377029418945, "global_step": 129303, "epoch": 3078} {"train_loss": -6.665623664855957, "global_step": 129304, "epoch": 3078} {"train_loss": -6.667136192321777, "global_step": 129305, "epoch": 3078} {"train_loss": -6.725705146789551, "global_step": 129306, "epoch": 3078} {"train_loss": -6.598836421966553, "global_step": 129307, "epoch": 3078} {"train_loss": -6.658551216125488, "global_step": 129308, "epoch": 3078} {"train_loss": -6.579460144042969, "global_step": 129309, "epoch": 3078} {"train_loss": -6.696042537689209, "global_step": 129310, "epoch": 3078} {"train_loss": -6.710817337036133, "global_step": 129311, "epoch": 3078} {"train_loss": -6.700588226318359, "global_step": 129312, "epoch": 3078} {"train_loss": -6.676896095275879, "global_step": 129313, "epoch": 3078} {"train_loss": -6.6679368019104, "global_step": 129314, "epoch": 3078} {"train_loss": -6.607377052307129, "global_step": 129315, "epoch": 3078} {"train_loss": -6.579677581787109, "global_step": 129316, "epoch": 3078} {"train_loss": -6.6673898583366755, "global_step": 129317, "epoch": 3078, "val_loss": 66355.25} {"train_loss": -6.645209312438965, "global_step": 129318, "epoch": 3079} {"train_loss": -6.677397727966309, "global_step": 129319, "epoch": 3079} {"train_loss": -6.729613304138184, "global_step": 129320, "epoch": 3079} {"train_loss": -6.700080394744873, "global_step": 129321, "epoch": 3079} {"train_loss": -6.685375213623047, "global_step": 129322, "epoch": 3079} {"train_loss": -6.626641273498535, "global_step": 129323, "epoch": 3079} {"train_loss": -6.6808180809021, "global_step": 129324, "epoch": 3079} {"train_loss": -6.711038112640381, "global_step": 129325, "epoch": 3079} {"train_loss": -6.703834533691406, "global_step": 129326, "epoch": 3079} {"train_loss": -6.728813171386719, "global_step": 129327, "epoch": 3079} {"train_loss": -6.658745765686035, "global_step": 129328, "epoch": 3079} {"train_loss": -6.712275505065918, "global_step": 129329, "epoch": 3079} {"train_loss": -6.650441646575928, "global_step": 129330, "epoch": 3079} {"train_loss": -6.605446815490723, "global_step": 129331, "epoch": 3079} {"train_loss": -6.607986927032471, "global_step": 129332, "epoch": 3079} {"train_loss": -6.5301618576049805, "global_step": 129333, "epoch": 3079} {"train_loss": -6.593551158905029, "global_step": 129334, "epoch": 3079} {"train_loss": -6.507846355438232, "global_step": 129335, "epoch": 3079} {"train_loss": -6.500912666320801, "global_step": 129336, "epoch": 3079} {"train_loss": -6.724902153015137, "global_step": 129337, "epoch": 3079} {"train_loss": -6.419722557067871, "global_step": 129338, "epoch": 3079} {"train_loss": -6.504854202270508, "global_step": 129339, "epoch": 3079} {"train_loss": -6.452741622924805, "global_step": 129340, "epoch": 3079} {"train_loss": -6.545778751373291, "global_step": 129341, "epoch": 3079} {"train_loss": -6.490234375, "global_step": 129342, "epoch": 3079} {"train_loss": -6.56358528137207, "global_step": 129343, "epoch": 3079} {"train_loss": -6.516761779785156, "global_step": 129344, "epoch": 3079} {"train_loss": -6.557755470275879, "global_step": 129345, "epoch": 3079} {"train_loss": -6.613955497741699, "global_step": 129346, "epoch": 3079} {"train_loss": -6.523125648498535, "global_step": 129347, "epoch": 3079} {"train_loss": -6.639277458190918, "global_step": 129348, "epoch": 3079} {"train_loss": -6.517494201660156, "global_step": 129349, "epoch": 3079} {"train_loss": -6.583657264709473, "global_step": 129350, "epoch": 3079} {"train_loss": -6.635324478149414, "global_step": 129351, "epoch": 3079} {"train_loss": -6.639193534851074, "global_step": 129352, "epoch": 3079} {"train_loss": -6.5312910079956055, "global_step": 129353, "epoch": 3079} {"train_loss": -6.5733323097229, "global_step": 129354, "epoch": 3079} {"train_loss": -6.6644134521484375, "global_step": 129355, "epoch": 3079} {"train_loss": -6.4858293533325195, "global_step": 129356, "epoch": 3079} {"train_loss": -6.683581829071045, "global_step": 129357, "epoch": 3079} {"train_loss": -6.5447258949279785, "global_step": 129358, "epoch": 3079} {"train_loss": -6.597649392627535, "global_step": 129359, "epoch": 3079, "val_loss": 66315.1875} {"train_loss": -6.5625104904174805, "global_step": 129360, "epoch": 3080} {"train_loss": -6.546330451965332, "global_step": 129361, "epoch": 3080} {"train_loss": -6.564205646514893, "global_step": 129362, "epoch": 3080} {"train_loss": -6.574192047119141, "global_step": 129363, "epoch": 3080} {"train_loss": -6.494901180267334, "global_step": 129364, "epoch": 3080} {"train_loss": -6.529526710510254, "global_step": 129365, "epoch": 3080} {"train_loss": -6.599757671356201, "global_step": 129366, "epoch": 3080} {"train_loss": -6.523996353149414, "global_step": 129367, "epoch": 3080} {"train_loss": -6.6407976150512695, "global_step": 129368, "epoch": 3080} {"train_loss": -6.563350200653076, "global_step": 129369, "epoch": 3080} {"train_loss": -6.5285773277282715, "global_step": 129370, "epoch": 3080} {"train_loss": -6.705694675445557, "global_step": 129371, "epoch": 3080} {"train_loss": -6.608680725097656, "global_step": 129372, "epoch": 3080} {"train_loss": -6.717596054077148, "global_step": 129373, "epoch": 3080} {"train_loss": -6.655574798583984, "global_step": 129374, "epoch": 3080} {"train_loss": -6.612151622772217, "global_step": 129375, "epoch": 3080} {"train_loss": -6.681532859802246, "global_step": 129376, "epoch": 3080} {"train_loss": -6.62769889831543, "global_step": 129377, "epoch": 3080} {"train_loss": -6.660118579864502, "global_step": 129378, "epoch": 3080} {"train_loss": -6.656209945678711, "global_step": 129379, "epoch": 3080} {"train_loss": -6.622323989868164, "global_step": 129380, "epoch": 3080} {"train_loss": -6.525607109069824, "global_step": 129381, "epoch": 3080} {"train_loss": -6.545581817626953, "global_step": 129382, "epoch": 3080} {"train_loss": -6.62364387512207, "global_step": 129383, "epoch": 3080} {"train_loss": -6.614997863769531, "global_step": 129384, "epoch": 3080} {"train_loss": -6.691924095153809, "global_step": 129385, "epoch": 3080} {"train_loss": -6.749460220336914, "global_step": 129386, "epoch": 3080} {"train_loss": -6.657436370849609, "global_step": 129387, "epoch": 3080} {"train_loss": -6.752577781677246, "global_step": 129388, "epoch": 3080} {"train_loss": -6.683642387390137, "global_step": 129389, "epoch": 3080} {"train_loss": -6.616726398468018, "global_step": 129390, "epoch": 3080} {"train_loss": -6.780877590179443, "global_step": 129391, "epoch": 3080} {"train_loss": -6.677738666534424, "global_step": 129392, "epoch": 3080} {"train_loss": -6.713337421417236, "global_step": 129393, "epoch": 3080} {"train_loss": -6.7419281005859375, "global_step": 129394, "epoch": 3080} {"train_loss": -6.656723976135254, "global_step": 129395, "epoch": 3080} {"train_loss": -6.778439521789551, "global_step": 129396, "epoch": 3080} {"train_loss": -6.672128200531006, "global_step": 129397, "epoch": 3080} {"train_loss": -6.623250484466553, "global_step": 129398, "epoch": 3080} {"train_loss": -6.635600566864014, "global_step": 129399, "epoch": 3080} {"train_loss": -6.581604957580566, "global_step": 129400, "epoch": 3080} {"train_loss": -6.636031003225417, "global_step": 129401, "epoch": 3080, "val_loss": 66504.8984375} {"train_loss": -6.707272529602051, "global_step": 129402, "epoch": 3081} {"train_loss": -6.715304374694824, "global_step": 129403, "epoch": 3081} {"train_loss": -6.777456283569336, "global_step": 129404, "epoch": 3081} {"train_loss": -6.641396999359131, "global_step": 129405, "epoch": 3081} {"train_loss": -6.6668806076049805, "global_step": 129406, "epoch": 3081} {"train_loss": -6.661125183105469, "global_step": 129407, "epoch": 3081} {"train_loss": -6.752593994140625, "global_step": 129408, "epoch": 3081} {"train_loss": -6.721480369567871, "global_step": 129409, "epoch": 3081} {"train_loss": -6.695505619049072, "global_step": 129410, "epoch": 3081} {"train_loss": -6.645243167877197, "global_step": 129411, "epoch": 3081} {"train_loss": -6.721628189086914, "global_step": 129412, "epoch": 3081} {"train_loss": -6.653717994689941, "global_step": 129413, "epoch": 3081} {"train_loss": -6.7330121994018555, "global_step": 129414, "epoch": 3081} {"train_loss": -6.809460639953613, "global_step": 129415, "epoch": 3081} {"train_loss": -6.693026542663574, "global_step": 129416, "epoch": 3081} {"train_loss": -6.63835334777832, "global_step": 129417, "epoch": 3081} {"train_loss": -6.600155830383301, "global_step": 129418, "epoch": 3081} {"train_loss": -6.540988922119141, "global_step": 129419, "epoch": 3081} {"train_loss": -6.56184196472168, "global_step": 129420, "epoch": 3081} {"train_loss": -6.7175774574279785, "global_step": 129421, "epoch": 3081} {"train_loss": -6.587772846221924, "global_step": 129422, "epoch": 3081} {"train_loss": -6.581871509552002, "global_step": 129423, "epoch": 3081} {"train_loss": -6.636515140533447, "global_step": 129424, "epoch": 3081} {"train_loss": -6.676746845245361, "global_step": 129425, "epoch": 3081} {"train_loss": -6.785158157348633, "global_step": 129426, "epoch": 3081} {"train_loss": -6.612326145172119, "global_step": 129427, "epoch": 3081} {"train_loss": -6.7376017570495605, "global_step": 129428, "epoch": 3081} {"train_loss": -6.675865650177002, "global_step": 129429, "epoch": 3081} {"train_loss": -6.744357109069824, "global_step": 129430, "epoch": 3081} {"train_loss": -6.768567085266113, "global_step": 129431, "epoch": 3081} {"train_loss": -6.673196792602539, "global_step": 129432, "epoch": 3081} {"train_loss": -6.780429363250732, "global_step": 129433, "epoch": 3081} {"train_loss": -6.717461585998535, "global_step": 129434, "epoch": 3081} {"train_loss": -6.710738182067871, "global_step": 129435, "epoch": 3081} {"train_loss": -6.658731460571289, "global_step": 129436, "epoch": 3081} {"train_loss": -6.699029922485352, "global_step": 129437, "epoch": 3081} {"train_loss": -6.7312798500061035, "global_step": 129438, "epoch": 3081} {"train_loss": -6.779555320739746, "global_step": 129439, "epoch": 3081} {"train_loss": -6.605367183685303, "global_step": 129440, "epoch": 3081} {"train_loss": -6.672664642333984, "global_step": 129441, "epoch": 3081} {"train_loss": -6.753159999847412, "global_step": 129442, "epoch": 3081} {"train_loss": -6.687776894796462, "global_step": 129443, "epoch": 3081, "val_loss": 66210.4921875} {"train_loss": -6.710869789123535, "global_step": 129444, "epoch": 3082} {"train_loss": -6.7457380294799805, "global_step": 129445, "epoch": 3082} {"train_loss": -6.460057258605957, "global_step": 129446, "epoch": 3082} {"train_loss": -6.532498359680176, "global_step": 129447, "epoch": 3082} {"train_loss": -6.7632598876953125, "global_step": 129448, "epoch": 3082} {"train_loss": -6.619719505310059, "global_step": 129449, "epoch": 3082} {"train_loss": -6.742643356323242, "global_step": 129450, "epoch": 3082} {"train_loss": -6.723976135253906, "global_step": 129451, "epoch": 3082} {"train_loss": -6.648605823516846, "global_step": 129452, "epoch": 3082} {"train_loss": -6.6698503494262695, "global_step": 129453, "epoch": 3082} {"train_loss": -6.712221622467041, "global_step": 129454, "epoch": 3082} {"train_loss": -6.56611442565918, "global_step": 129455, "epoch": 3082} {"train_loss": -6.647204399108887, "global_step": 129456, "epoch": 3082} {"train_loss": -6.702955722808838, "global_step": 129457, "epoch": 3082} {"train_loss": -6.598532199859619, "global_step": 129458, "epoch": 3082} {"train_loss": -6.679243087768555, "global_step": 129459, "epoch": 3082} {"train_loss": -6.625713348388672, "global_step": 129460, "epoch": 3082} {"train_loss": -6.689435958862305, "global_step": 129461, "epoch": 3082} {"train_loss": -6.624685287475586, "global_step": 129462, "epoch": 3082} {"train_loss": -6.613570213317871, "global_step": 129463, "epoch": 3082} {"train_loss": -6.771246433258057, "global_step": 129464, "epoch": 3082} {"train_loss": -6.586980819702148, "global_step": 129465, "epoch": 3082} {"train_loss": -6.6570892333984375, "global_step": 129466, "epoch": 3082} {"train_loss": -6.621316909790039, "global_step": 129467, "epoch": 3082} {"train_loss": -6.600929260253906, "global_step": 129468, "epoch": 3082} {"train_loss": -6.811737537384033, "global_step": 129469, "epoch": 3082} {"train_loss": -6.651474475860596, "global_step": 129470, "epoch": 3082} {"train_loss": -6.770486831665039, "global_step": 129471, "epoch": 3082} {"train_loss": -6.635720252990723, "global_step": 129472, "epoch": 3082} {"train_loss": -6.668553352355957, "global_step": 129473, "epoch": 3082} {"train_loss": -6.671215534210205, "global_step": 129474, "epoch": 3082} {"train_loss": -6.766112327575684, "global_step": 129475, "epoch": 3082} {"train_loss": -6.840703964233398, "global_step": 129476, "epoch": 3082} {"train_loss": -6.76292085647583, "global_step": 129477, "epoch": 3082} {"train_loss": -6.684928894042969, "global_step": 129478, "epoch": 3082} {"train_loss": -6.722851753234863, "global_step": 129479, "epoch": 3082} {"train_loss": -6.679727077484131, "global_step": 129480, "epoch": 3082} {"train_loss": -6.710796356201172, "global_step": 129481, "epoch": 3082} {"train_loss": -6.7408905029296875, "global_step": 129482, "epoch": 3082} {"train_loss": -6.70388650894165, "global_step": 129483, "epoch": 3082} {"train_loss": -6.6731343269348145, "global_step": 129484, "epoch": 3082} {"train_loss": -6.677934941791353, "global_step": 129485, "epoch": 3082, "val_loss": 66484.2578125} {"train_loss": -6.679426193237305, "global_step": 129486, "epoch": 3083} {"train_loss": -6.760550498962402, "global_step": 129487, "epoch": 3083} {"train_loss": -6.741457939147949, "global_step": 129488, "epoch": 3083} {"train_loss": -6.640899181365967, "global_step": 129489, "epoch": 3083} {"train_loss": -6.668066501617432, "global_step": 129490, "epoch": 3083} {"train_loss": -6.648062705993652, "global_step": 129491, "epoch": 3083} {"train_loss": -6.705018043518066, "global_step": 129492, "epoch": 3083} {"train_loss": -6.684727668762207, "global_step": 129493, "epoch": 3083} {"train_loss": -6.7323527336120605, "global_step": 129494, "epoch": 3083} {"train_loss": -6.824334144592285, "global_step": 129495, "epoch": 3083} {"train_loss": -6.686888217926025, "global_step": 129496, "epoch": 3083} {"train_loss": -6.724471569061279, "global_step": 129497, "epoch": 3083} {"train_loss": -6.660830497741699, "global_step": 129498, "epoch": 3083} {"train_loss": -6.757051467895508, "global_step": 129499, "epoch": 3083} {"train_loss": -6.595738410949707, "global_step": 129500, "epoch": 3083} {"train_loss": -6.658344745635986, "global_step": 129501, "epoch": 3083} {"train_loss": -6.664707183837891, "global_step": 129502, "epoch": 3083} {"train_loss": -6.731393814086914, "global_step": 129503, "epoch": 3083} {"train_loss": -6.575839042663574, "global_step": 129504, "epoch": 3083} {"train_loss": -6.68553352355957, "global_step": 129505, "epoch": 3083} {"train_loss": -6.620085716247559, "global_step": 129506, "epoch": 3083} {"train_loss": -6.649852275848389, "global_step": 129507, "epoch": 3083} {"train_loss": -6.644339084625244, "global_step": 129508, "epoch": 3083} {"train_loss": -6.6194610595703125, "global_step": 129509, "epoch": 3083} {"train_loss": -6.679943084716797, "global_step": 129510, "epoch": 3083} {"train_loss": -6.67938232421875, "global_step": 129511, "epoch": 3083} {"train_loss": -6.703604698181152, "global_step": 129512, "epoch": 3083} {"train_loss": -6.753057479858398, "global_step": 129513, "epoch": 3083} {"train_loss": -6.622299671173096, "global_step": 129514, "epoch": 3083} {"train_loss": -6.627887725830078, "global_step": 129515, "epoch": 3083} {"train_loss": -6.562238693237305, "global_step": 129516, "epoch": 3083} {"train_loss": -6.66774845123291, "global_step": 129517, "epoch": 3083} {"train_loss": -6.73876953125, "global_step": 129518, "epoch": 3083} {"train_loss": -6.587396621704102, "global_step": 129519, "epoch": 3083} {"train_loss": -6.681298732757568, "global_step": 129520, "epoch": 3083} {"train_loss": -6.585487365722656, "global_step": 129521, "epoch": 3083} {"train_loss": -6.662381172180176, "global_step": 129522, "epoch": 3083} {"train_loss": -6.621910095214844, "global_step": 129523, "epoch": 3083} {"train_loss": -6.474552154541016, "global_step": 129524, "epoch": 3083} {"train_loss": -6.62495756149292, "global_step": 129525, "epoch": 3083} {"train_loss": -6.623528480529785, "global_step": 129526, "epoch": 3083} {"train_loss": -6.661767460051037, "global_step": 129527, "epoch": 3083, "val_loss": 66294.4375} {"train_loss": -6.751735210418701, "global_step": 129528, "epoch": 3084} {"train_loss": -6.52877140045166, "global_step": 129529, "epoch": 3084} {"train_loss": -6.65843391418457, "global_step": 129530, "epoch": 3084} {"train_loss": -6.5979766845703125, "global_step": 129531, "epoch": 3084} {"train_loss": -6.560312747955322, "global_step": 129532, "epoch": 3084} {"train_loss": -6.7062530517578125, "global_step": 129533, "epoch": 3084} {"train_loss": -6.4071364402771, "global_step": 129534, "epoch": 3084} {"train_loss": -6.558910846710205, "global_step": 129535, "epoch": 3084} {"train_loss": -6.542390823364258, "global_step": 129536, "epoch": 3084} {"train_loss": -6.34432315826416, "global_step": 129537, "epoch": 3084} {"train_loss": -6.449999809265137, "global_step": 129538, "epoch": 3084} {"train_loss": -6.499577522277832, "global_step": 129539, "epoch": 3084} {"train_loss": -6.6137518882751465, "global_step": 129540, "epoch": 3084} {"train_loss": -6.487313270568848, "global_step": 129541, "epoch": 3084} {"train_loss": -6.5256195068359375, "global_step": 129542, "epoch": 3084} {"train_loss": -6.447970867156982, "global_step": 129543, "epoch": 3084} {"train_loss": -6.5222930908203125, "global_step": 129544, "epoch": 3084} {"train_loss": -6.50803279876709, "global_step": 129545, "epoch": 3084} {"train_loss": -6.5711894035339355, "global_step": 129546, "epoch": 3084} {"train_loss": -6.535655975341797, "global_step": 129547, "epoch": 3084} {"train_loss": -6.510350227355957, "global_step": 129548, "epoch": 3084} {"train_loss": -6.520770072937012, "global_step": 129549, "epoch": 3084} {"train_loss": -6.668675422668457, "global_step": 129550, "epoch": 3084} {"train_loss": -6.4678955078125, "global_step": 129551, "epoch": 3084} {"train_loss": -6.5937652587890625, "global_step": 129552, "epoch": 3084} {"train_loss": -6.465196132659912, "global_step": 129553, "epoch": 3084} {"train_loss": -6.671477317810059, "global_step": 129554, "epoch": 3084} {"train_loss": -6.470982551574707, "global_step": 129555, "epoch": 3084} {"train_loss": -6.701617240905762, "global_step": 129556, "epoch": 3084} {"train_loss": -6.683526515960693, "global_step": 129557, "epoch": 3084} {"train_loss": -6.646510601043701, "global_step": 129558, "epoch": 3084} {"train_loss": -6.7512030601501465, "global_step": 129559, "epoch": 3084} {"train_loss": -6.5602006912231445, "global_step": 129560, "epoch": 3084} {"train_loss": -6.73386287689209, "global_step": 129561, "epoch": 3084} {"train_loss": -6.580745697021484, "global_step": 129562, "epoch": 3084} {"train_loss": -6.672370910644531, "global_step": 129563, "epoch": 3084} {"train_loss": -6.620020866394043, "global_step": 129564, "epoch": 3084} {"train_loss": -6.68526554107666, "global_step": 129565, "epoch": 3084} {"train_loss": -6.561445236206055, "global_step": 129566, "epoch": 3084} {"train_loss": -6.5294389724731445, "global_step": 129567, "epoch": 3084} {"train_loss": -6.651362895965576, "global_step": 129568, "epoch": 3084} {"train_loss": -6.5722434520721436, "global_step": 129569, "epoch": 3084, "val_loss": 66401.390625} {"train_loss": -6.677397727966309, "global_step": 129570, "epoch": 3085} {"train_loss": -6.684882164001465, "global_step": 129571, "epoch": 3085} {"train_loss": -6.503339767456055, "global_step": 129572, "epoch": 3085} {"train_loss": -6.693908214569092, "global_step": 129573, "epoch": 3085} {"train_loss": -6.6702094078063965, "global_step": 129574, "epoch": 3085} {"train_loss": -6.687108993530273, "global_step": 129575, "epoch": 3085} {"train_loss": -6.619198799133301, "global_step": 129576, "epoch": 3085} {"train_loss": -6.646857738494873, "global_step": 129577, "epoch": 3085} {"train_loss": -6.538991928100586, "global_step": 129578, "epoch": 3085} {"train_loss": -6.5852203369140625, "global_step": 129579, "epoch": 3085} {"train_loss": -6.724778175354004, "global_step": 129580, "epoch": 3085} {"train_loss": -6.61998176574707, "global_step": 129581, "epoch": 3085} {"train_loss": -6.708106994628906, "global_step": 129582, "epoch": 3085} {"train_loss": -6.593062400817871, "global_step": 129583, "epoch": 3085} {"train_loss": -6.591975688934326, "global_step": 129584, "epoch": 3085} {"train_loss": -6.695499420166016, "global_step": 129585, "epoch": 3085} {"train_loss": -6.655692100524902, "global_step": 129586, "epoch": 3085} {"train_loss": -6.546605110168457, "global_step": 129587, "epoch": 3085} {"train_loss": -6.718884468078613, "global_step": 129588, "epoch": 3085} {"train_loss": -6.644165992736816, "global_step": 129589, "epoch": 3085} {"train_loss": -6.763116836547852, "global_step": 129590, "epoch": 3085} {"train_loss": -6.7293314933776855, "global_step": 129591, "epoch": 3085} {"train_loss": -6.640408039093018, "global_step": 129592, "epoch": 3085} {"train_loss": -6.601546287536621, "global_step": 129593, "epoch": 3085} {"train_loss": -6.711209297180176, "global_step": 129594, "epoch": 3085} {"train_loss": -6.674237251281738, "global_step": 129595, "epoch": 3085} {"train_loss": -6.65983772277832, "global_step": 129596, "epoch": 3085} {"train_loss": -6.717580795288086, "global_step": 129597, "epoch": 3085} {"train_loss": -6.625013828277588, "global_step": 129598, "epoch": 3085} {"train_loss": -6.704685688018799, "global_step": 129599, "epoch": 3085} {"train_loss": -6.786550045013428, "global_step": 129600, "epoch": 3085} {"train_loss": -6.58786678314209, "global_step": 129601, "epoch": 3085} {"train_loss": -6.679804801940918, "global_step": 129602, "epoch": 3085} {"train_loss": -6.69366455078125, "global_step": 129603, "epoch": 3085} {"train_loss": -6.718533515930176, "global_step": 129604, "epoch": 3085} {"train_loss": -6.732568740844727, "global_step": 129605, "epoch": 3085} {"train_loss": -6.7080912590026855, "global_step": 129606, "epoch": 3085} {"train_loss": -6.760658264160156, "global_step": 129607, "epoch": 3085} {"train_loss": -6.681878089904785, "global_step": 129608, "epoch": 3085} {"train_loss": -6.7209792137146, "global_step": 129609, "epoch": 3085} {"train_loss": -6.673366546630859, "global_step": 129610, "epoch": 3085} {"train_loss": -6.666715973899478, "global_step": 129611, "epoch": 3085, "val_loss": 66360.1796875} {"train_loss": -6.802783012390137, "global_step": 129612, "epoch": 3086} {"train_loss": -6.774471282958984, "global_step": 129613, "epoch": 3086} {"train_loss": -6.8282151222229, "global_step": 129614, "epoch": 3086} {"train_loss": -6.792666912078857, "global_step": 129615, "epoch": 3086} {"train_loss": -6.581734657287598, "global_step": 129616, "epoch": 3086} {"train_loss": -6.671931266784668, "global_step": 129617, "epoch": 3086} {"train_loss": -6.790339469909668, "global_step": 129618, "epoch": 3086} {"train_loss": -6.733333587646484, "global_step": 129619, "epoch": 3086} {"train_loss": -6.767528057098389, "global_step": 129620, "epoch": 3086} {"train_loss": -6.8090105056762695, "global_step": 129621, "epoch": 3086} {"train_loss": -6.7772135734558105, "global_step": 129622, "epoch": 3086} {"train_loss": -6.648950576782227, "global_step": 129623, "epoch": 3086} {"train_loss": -6.649004936218262, "global_step": 129624, "epoch": 3086} {"train_loss": -6.669715404510498, "global_step": 129625, "epoch": 3086} {"train_loss": -6.670557975769043, "global_step": 129626, "epoch": 3086} {"train_loss": -6.59049129486084, "global_step": 129627, "epoch": 3086} {"train_loss": -6.601293563842773, "global_step": 129628, "epoch": 3086} {"train_loss": -6.630318641662598, "global_step": 129629, "epoch": 3086} {"train_loss": -6.572876453399658, "global_step": 129630, "epoch": 3086} {"train_loss": -6.53315544128418, "global_step": 129631, "epoch": 3086} {"train_loss": -6.594444751739502, "global_step": 129632, "epoch": 3086} {"train_loss": -6.634037971496582, "global_step": 129633, "epoch": 3086} {"train_loss": -6.620893955230713, "global_step": 129634, "epoch": 3086} {"train_loss": -6.731222629547119, "global_step": 129635, "epoch": 3086} {"train_loss": -6.532517433166504, "global_step": 129636, "epoch": 3086} {"train_loss": -6.605013370513916, "global_step": 129637, "epoch": 3086} {"train_loss": -6.660647869110107, "global_step": 129638, "epoch": 3086} {"train_loss": -6.730838775634766, "global_step": 129639, "epoch": 3086} {"train_loss": -6.7244181632995605, "global_step": 129640, "epoch": 3086} {"train_loss": -6.530184268951416, "global_step": 129641, "epoch": 3086} {"train_loss": -6.5428290367126465, "global_step": 129642, "epoch": 3086} {"train_loss": -6.501585006713867, "global_step": 129643, "epoch": 3086} {"train_loss": -6.647441387176514, "global_step": 129644, "epoch": 3086} {"train_loss": -6.583865165710449, "global_step": 129645, "epoch": 3086} {"train_loss": -6.6887946128845215, "global_step": 129646, "epoch": 3086} {"train_loss": -6.613077163696289, "global_step": 129647, "epoch": 3086} {"train_loss": -6.608597755432129, "global_step": 129648, "epoch": 3086} {"train_loss": -6.602957725524902, "global_step": 129649, "epoch": 3086} {"train_loss": -6.63552188873291, "global_step": 129650, "epoch": 3086} {"train_loss": -6.658000469207764, "global_step": 129651, "epoch": 3086} {"train_loss": -6.581570148468018, "global_step": 129652, "epoch": 3086} {"train_loss": -6.6564679599943615, "global_step": 129653, "epoch": 3086, "val_loss": 66423.7109375} {"train_loss": -6.686572074890137, "global_step": 129654, "epoch": 3087} {"train_loss": -6.66987419128418, "global_step": 129655, "epoch": 3087} {"train_loss": -6.6001787185668945, "global_step": 129656, "epoch": 3087} {"train_loss": -6.620131492614746, "global_step": 129657, "epoch": 3087} {"train_loss": -6.636713027954102, "global_step": 129658, "epoch": 3087} {"train_loss": -6.547574043273926, "global_step": 129659, "epoch": 3087} {"train_loss": -6.601840019226074, "global_step": 129660, "epoch": 3087} {"train_loss": -6.643309593200684, "global_step": 129661, "epoch": 3087} {"train_loss": -6.594327926635742, "global_step": 129662, "epoch": 3087} {"train_loss": -6.618714332580566, "global_step": 129663, "epoch": 3087} {"train_loss": -6.61570930480957, "global_step": 129664, "epoch": 3087} {"train_loss": -6.771749973297119, "global_step": 129665, "epoch": 3087} {"train_loss": -6.532624244689941, "global_step": 129666, "epoch": 3087} {"train_loss": -6.617647171020508, "global_step": 129667, "epoch": 3087} {"train_loss": -6.656002998352051, "global_step": 129668, "epoch": 3087} {"train_loss": -6.594282150268555, "global_step": 129669, "epoch": 3087} {"train_loss": -6.718653678894043, "global_step": 129670, "epoch": 3087} {"train_loss": -6.708011150360107, "global_step": 129671, "epoch": 3087} {"train_loss": -6.632888317108154, "global_step": 129672, "epoch": 3087} {"train_loss": -6.663158416748047, "global_step": 129673, "epoch": 3087} {"train_loss": -6.73006010055542, "global_step": 129674, "epoch": 3087} {"train_loss": -6.621478080749512, "global_step": 129675, "epoch": 3087} {"train_loss": -6.615036964416504, "global_step": 129676, "epoch": 3087} {"train_loss": -6.79584264755249, "global_step": 129677, "epoch": 3087} {"train_loss": -6.702949523925781, "global_step": 129678, "epoch": 3087} {"train_loss": -6.735218048095703, "global_step": 129679, "epoch": 3087} {"train_loss": -6.554874420166016, "global_step": 129680, "epoch": 3087} {"train_loss": -6.712404251098633, "global_step": 129681, "epoch": 3087} {"train_loss": -6.653711318969727, "global_step": 129682, "epoch": 3087} {"train_loss": -6.625114440917969, "global_step": 129683, "epoch": 3087} {"train_loss": -6.651982307434082, "global_step": 129684, "epoch": 3087} {"train_loss": -6.630101203918457, "global_step": 129685, "epoch": 3087} {"train_loss": -6.603492736816406, "global_step": 129686, "epoch": 3087} {"train_loss": -6.7072553634643555, "global_step": 129687, "epoch": 3087} {"train_loss": -6.675973892211914, "global_step": 129688, "epoch": 3087} {"train_loss": -6.65431022644043, "global_step": 129689, "epoch": 3087} {"train_loss": -6.666683673858643, "global_step": 129690, "epoch": 3087} {"train_loss": -6.751578330993652, "global_step": 129691, "epoch": 3087} {"train_loss": -6.7706379890441895, "global_step": 129692, "epoch": 3087} {"train_loss": -6.7493696212768555, "global_step": 129693, "epoch": 3087} {"train_loss": -6.726984024047852, "global_step": 129694, "epoch": 3087} {"train_loss": -6.6613566761925105, "global_step": 129695, "epoch": 3087, "val_loss": 66452.671875} {"train_loss": -6.703275680541992, "global_step": 129696, "epoch": 3088} {"train_loss": -6.6741461753845215, "global_step": 129697, "epoch": 3088} {"train_loss": -6.822762489318848, "global_step": 129698, "epoch": 3088} {"train_loss": -6.7506256103515625, "global_step": 129699, "epoch": 3088} {"train_loss": -6.65599250793457, "global_step": 129700, "epoch": 3088} {"train_loss": -6.747555255889893, "global_step": 129701, "epoch": 3088} {"train_loss": -6.587323188781738, "global_step": 129702, "epoch": 3088} {"train_loss": -6.5949249267578125, "global_step": 129703, "epoch": 3088} {"train_loss": -6.52414608001709, "global_step": 129704, "epoch": 3088} {"train_loss": -6.663739204406738, "global_step": 129705, "epoch": 3088} {"train_loss": -6.749784469604492, "global_step": 129706, "epoch": 3088} {"train_loss": -6.64344596862793, "global_step": 129707, "epoch": 3088} {"train_loss": -6.677885055541992, "global_step": 129708, "epoch": 3088} {"train_loss": -6.601975440979004, "global_step": 129709, "epoch": 3088} {"train_loss": -6.574235439300537, "global_step": 129710, "epoch": 3088} {"train_loss": -6.657114028930664, "global_step": 129711, "epoch": 3088} {"train_loss": -6.724636554718018, "global_step": 129712, "epoch": 3088} {"train_loss": -6.722721576690674, "global_step": 129713, "epoch": 3088} {"train_loss": -6.681919574737549, "global_step": 129714, "epoch": 3088} {"train_loss": -6.573251724243164, "global_step": 129715, "epoch": 3088} {"train_loss": -6.61922550201416, "global_step": 129716, "epoch": 3088} {"train_loss": -6.461631774902344, "global_step": 129717, "epoch": 3088} {"train_loss": -6.7897725105285645, "global_step": 129718, "epoch": 3088} {"train_loss": -6.457306861877441, "global_step": 129719, "epoch": 3088} {"train_loss": -6.5412068367004395, "global_step": 129720, "epoch": 3088} {"train_loss": -6.670765399932861, "global_step": 129721, "epoch": 3088} {"train_loss": -6.5646772384643555, "global_step": 129722, "epoch": 3088} {"train_loss": -6.572570323944092, "global_step": 129723, "epoch": 3088} {"train_loss": -6.573333740234375, "global_step": 129724, "epoch": 3088} {"train_loss": -6.520092010498047, "global_step": 129725, "epoch": 3088} {"train_loss": -6.664443016052246, "global_step": 129726, "epoch": 3088} {"train_loss": -6.546236991882324, "global_step": 129727, "epoch": 3088} {"train_loss": -6.556459903717041, "global_step": 129728, "epoch": 3088} {"train_loss": -6.425134181976318, "global_step": 129729, "epoch": 3088} {"train_loss": -6.740333557128906, "global_step": 129730, "epoch": 3088} {"train_loss": -6.493192672729492, "global_step": 129731, "epoch": 3088} {"train_loss": -6.613348484039307, "global_step": 129732, "epoch": 3088} {"train_loss": -6.549644470214844, "global_step": 129733, "epoch": 3088} {"train_loss": -6.675996780395508, "global_step": 129734, "epoch": 3088} {"train_loss": -6.625985145568848, "global_step": 129735, "epoch": 3088} {"train_loss": -6.565479755401611, "global_step": 129736, "epoch": 3088} {"train_loss": -6.624062470027378, "global_step": 129737, "epoch": 3088, "val_loss": 66335.7421875} {"train_loss": -6.6114115715026855, "global_step": 129738, "epoch": 3089} {"train_loss": -6.594361305236816, "global_step": 129739, "epoch": 3089} {"train_loss": -6.635522842407227, "global_step": 129740, "epoch": 3089} {"train_loss": -6.699019908905029, "global_step": 129741, "epoch": 3089} {"train_loss": -6.662424564361572, "global_step": 129742, "epoch": 3089} {"train_loss": -6.715609550476074, "global_step": 129743, "epoch": 3089} {"train_loss": -6.687079906463623, "global_step": 129744, "epoch": 3089} {"train_loss": -6.695797920227051, "global_step": 129745, "epoch": 3089} {"train_loss": -6.66605806350708, "global_step": 129746, "epoch": 3089} {"train_loss": -6.648506164550781, "global_step": 129747, "epoch": 3089} {"train_loss": -6.742824554443359, "global_step": 129748, "epoch": 3089} {"train_loss": -6.653257846832275, "global_step": 129749, "epoch": 3089} {"train_loss": -6.589590072631836, "global_step": 129750, "epoch": 3089} {"train_loss": -6.696976661682129, "global_step": 129751, "epoch": 3089} {"train_loss": -6.606155872344971, "global_step": 129752, "epoch": 3089} {"train_loss": -6.651247024536133, "global_step": 129753, "epoch": 3089} {"train_loss": -6.4789886474609375, "global_step": 129754, "epoch": 3089} {"train_loss": -6.6588263511657715, "global_step": 129755, "epoch": 3089} {"train_loss": -6.527050971984863, "global_step": 129756, "epoch": 3089} {"train_loss": -6.644550800323486, "global_step": 129757, "epoch": 3089} {"train_loss": -6.624683380126953, "global_step": 129758, "epoch": 3089} {"train_loss": -6.52943754196167, "global_step": 129759, "epoch": 3089} {"train_loss": -6.608038902282715, "global_step": 129760, "epoch": 3089} {"train_loss": -6.575718879699707, "global_step": 129761, "epoch": 3089} {"train_loss": -6.625038146972656, "global_step": 129762, "epoch": 3089} {"train_loss": -6.604157447814941, "global_step": 129763, "epoch": 3089} {"train_loss": -6.66822624206543, "global_step": 129764, "epoch": 3089} {"train_loss": -6.708461761474609, "global_step": 129765, "epoch": 3089} {"train_loss": -6.640080451965332, "global_step": 129766, "epoch": 3089} {"train_loss": -6.621434211730957, "global_step": 129767, "epoch": 3089} {"train_loss": -6.60373592376709, "global_step": 129768, "epoch": 3089} {"train_loss": -6.718690395355225, "global_step": 129769, "epoch": 3089} {"train_loss": -6.608323097229004, "global_step": 129770, "epoch": 3089} {"train_loss": -6.679642677307129, "global_step": 129771, "epoch": 3089} {"train_loss": -6.739056587219238, "global_step": 129772, "epoch": 3089} {"train_loss": -6.726006031036377, "global_step": 129773, "epoch": 3089} {"train_loss": -6.669912338256836, "global_step": 129774, "epoch": 3089} {"train_loss": -6.597165107727051, "global_step": 129775, "epoch": 3089} {"train_loss": -6.571083068847656, "global_step": 129776, "epoch": 3089} {"train_loss": -6.602617263793945, "global_step": 129777, "epoch": 3089} {"train_loss": -6.591564178466797, "global_step": 129778, "epoch": 3089} {"train_loss": -6.637335890815372, "global_step": 129779, "epoch": 3089, "val_loss": 66578.6484375} {"train_loss": -6.592067241668701, "global_step": 129780, "epoch": 3090} {"train_loss": -6.652502059936523, "global_step": 129781, "epoch": 3090} {"train_loss": -6.616967678070068, "global_step": 129782, "epoch": 3090} {"train_loss": -6.567089080810547, "global_step": 129783, "epoch": 3090} {"train_loss": -6.713428974151611, "global_step": 129784, "epoch": 3090} {"train_loss": -6.6081342697143555, "global_step": 129785, "epoch": 3090} {"train_loss": -6.606318473815918, "global_step": 129786, "epoch": 3090} {"train_loss": -6.542466640472412, "global_step": 129787, "epoch": 3090} {"train_loss": -6.577822685241699, "global_step": 129788, "epoch": 3090} {"train_loss": -6.62613582611084, "global_step": 129789, "epoch": 3090} {"train_loss": -6.617722034454346, "global_step": 129790, "epoch": 3090} {"train_loss": -6.623069763183594, "global_step": 129791, "epoch": 3090} {"train_loss": -6.632072448730469, "global_step": 129792, "epoch": 3090} {"train_loss": -6.676567077636719, "global_step": 129793, "epoch": 3090} {"train_loss": -6.719855308532715, "global_step": 129794, "epoch": 3090} {"train_loss": -6.61721134185791, "global_step": 129795, "epoch": 3090} {"train_loss": -6.681483268737793, "global_step": 129796, "epoch": 3090} {"train_loss": -6.781189918518066, "global_step": 129797, "epoch": 3090} {"train_loss": -6.654093265533447, "global_step": 129798, "epoch": 3090} {"train_loss": -6.623246192932129, "global_step": 129799, "epoch": 3090} {"train_loss": -6.68167781829834, "global_step": 129800, "epoch": 3090} {"train_loss": -6.641842365264893, "global_step": 129801, "epoch": 3090} {"train_loss": -6.642495155334473, "global_step": 129802, "epoch": 3090} {"train_loss": -6.7389349937438965, "global_step": 129803, "epoch": 3090} {"train_loss": -6.699987888336182, "global_step": 129804, "epoch": 3090} {"train_loss": -6.734927177429199, "global_step": 129805, "epoch": 3090} {"train_loss": -6.647500514984131, "global_step": 129806, "epoch": 3090} {"train_loss": -6.660226821899414, "global_step": 129807, "epoch": 3090} {"train_loss": -6.693907260894775, "global_step": 129808, "epoch": 3090} {"train_loss": -6.715048313140869, "global_step": 129809, "epoch": 3090} {"train_loss": -6.593155860900879, "global_step": 129810, "epoch": 3090} {"train_loss": -6.716650009155273, "global_step": 129811, "epoch": 3090} {"train_loss": -6.754876136779785, "global_step": 129812, "epoch": 3090} {"train_loss": -6.735248565673828, "global_step": 129813, "epoch": 3090} {"train_loss": -6.673861980438232, "global_step": 129814, "epoch": 3090} {"train_loss": -6.801388263702393, "global_step": 129815, "epoch": 3090} {"train_loss": -6.744359970092773, "global_step": 129816, "epoch": 3090} {"train_loss": -6.657859802246094, "global_step": 129817, "epoch": 3090} {"train_loss": -6.772356033325195, "global_step": 129818, "epoch": 3090} {"train_loss": -6.648531913757324, "global_step": 129819, "epoch": 3090} {"train_loss": -6.733162879943848, "global_step": 129820, "epoch": 3090} {"train_loss": -6.67006668590364, "global_step": 129821, "epoch": 3090, "val_loss": 66489.078125} {"train_loss": -6.718678951263428, "global_step": 129822, "epoch": 3091} {"train_loss": -6.690258026123047, "global_step": 129823, "epoch": 3091} {"train_loss": -6.761746406555176, "global_step": 129824, "epoch": 3091} {"train_loss": -6.675772666931152, "global_step": 129825, "epoch": 3091} {"train_loss": -6.681124687194824, "global_step": 129826, "epoch": 3091} {"train_loss": -6.769440650939941, "global_step": 129827, "epoch": 3091} {"train_loss": -6.738247871398926, "global_step": 129828, "epoch": 3091} {"train_loss": -6.792413711547852, "global_step": 129829, "epoch": 3091} {"train_loss": -6.7326531410217285, "global_step": 129830, "epoch": 3091} {"train_loss": -6.692734718322754, "global_step": 129831, "epoch": 3091} {"train_loss": -6.679387092590332, "global_step": 129832, "epoch": 3091} {"train_loss": -6.685016632080078, "global_step": 129833, "epoch": 3091} {"train_loss": -6.685087203979492, "global_step": 129834, "epoch": 3091} {"train_loss": -6.743915557861328, "global_step": 129835, "epoch": 3091} {"train_loss": -6.647558212280273, "global_step": 129836, "epoch": 3091} {"train_loss": -6.645416259765625, "global_step": 129837, "epoch": 3091} {"train_loss": -6.789942741394043, "global_step": 129838, "epoch": 3091} {"train_loss": -6.677887439727783, "global_step": 129839, "epoch": 3091} {"train_loss": -6.546612739562988, "global_step": 129840, "epoch": 3091} {"train_loss": -6.727888107299805, "global_step": 129841, "epoch": 3091} {"train_loss": -6.759537220001221, "global_step": 129842, "epoch": 3091} {"train_loss": -6.4822235107421875, "global_step": 129843, "epoch": 3091} {"train_loss": -6.572068691253662, "global_step": 129844, "epoch": 3091} {"train_loss": -6.647026538848877, "global_step": 129845, "epoch": 3091} {"train_loss": -6.628877639770508, "global_step": 129846, "epoch": 3091} {"train_loss": -6.57619047164917, "global_step": 129847, "epoch": 3091} {"train_loss": -6.599673748016357, "global_step": 129848, "epoch": 3091} {"train_loss": -6.6464104652404785, "global_step": 129849, "epoch": 3091} {"train_loss": -6.570121765136719, "global_step": 129850, "epoch": 3091} {"train_loss": -6.4966301918029785, "global_step": 129851, "epoch": 3091} {"train_loss": -6.645570755004883, "global_step": 129852, "epoch": 3091} {"train_loss": -6.6302642822265625, "global_step": 129853, "epoch": 3091} {"train_loss": -6.564425468444824, "global_step": 129854, "epoch": 3091} {"train_loss": -6.551989555358887, "global_step": 129855, "epoch": 3091} {"train_loss": -6.504824638366699, "global_step": 129856, "epoch": 3091} {"train_loss": -6.589199066162109, "global_step": 129857, "epoch": 3091} {"train_loss": -6.548799514770508, "global_step": 129858, "epoch": 3091} {"train_loss": -6.5239362716674805, "global_step": 129859, "epoch": 3091} {"train_loss": -6.4975738525390625, "global_step": 129860, "epoch": 3091} {"train_loss": -6.692153453826904, "global_step": 129861, "epoch": 3091} {"train_loss": -6.508830547332764, "global_step": 129862, "epoch": 3091} {"train_loss": -6.643491165978568, "global_step": 129863, "epoch": 3091, "val_loss": 66631.46875} {"train_loss": -6.575287342071533, "global_step": 129864, "epoch": 3092} {"train_loss": -6.5419230461120605, "global_step": 129865, "epoch": 3092} {"train_loss": -6.602499008178711, "global_step": 129866, "epoch": 3092} {"train_loss": -6.518876075744629, "global_step": 129867, "epoch": 3092} {"train_loss": -6.662256240844727, "global_step": 129868, "epoch": 3092} {"train_loss": -6.620345592498779, "global_step": 129869, "epoch": 3092} {"train_loss": -6.671518802642822, "global_step": 129870, "epoch": 3092} {"train_loss": -6.650909423828125, "global_step": 129871, "epoch": 3092} {"train_loss": -6.643322944641113, "global_step": 129872, "epoch": 3092} {"train_loss": -6.595738887786865, "global_step": 129873, "epoch": 3092} {"train_loss": -6.6057844161987305, "global_step": 129874, "epoch": 3092} {"train_loss": -6.656856536865234, "global_step": 129875, "epoch": 3092} {"train_loss": -6.700681686401367, "global_step": 129876, "epoch": 3092} {"train_loss": -6.7735748291015625, "global_step": 129877, "epoch": 3092} {"train_loss": -6.6766252517700195, "global_step": 129878, "epoch": 3092} {"train_loss": -6.706892490386963, "global_step": 129879, "epoch": 3092} {"train_loss": -6.733892917633057, "global_step": 129880, "epoch": 3092} {"train_loss": -6.6332573890686035, "global_step": 129881, "epoch": 3092} {"train_loss": -6.745689868927002, "global_step": 129882, "epoch": 3092} {"train_loss": -6.704100608825684, "global_step": 129883, "epoch": 3092} {"train_loss": -6.552608966827393, "global_step": 129884, "epoch": 3092} {"train_loss": -6.715923309326172, "global_step": 129885, "epoch": 3092} {"train_loss": -6.7462263107299805, "global_step": 129886, "epoch": 3092} {"train_loss": -6.69326639175415, "global_step": 129887, "epoch": 3092} {"train_loss": -6.835402965545654, "global_step": 129888, "epoch": 3092} {"train_loss": -6.745497703552246, "global_step": 129889, "epoch": 3092} {"train_loss": -6.7876386642456055, "global_step": 129890, "epoch": 3092} {"train_loss": -6.665406227111816, "global_step": 129891, "epoch": 3092} {"train_loss": -6.775857925415039, "global_step": 129892, "epoch": 3092} {"train_loss": -6.656911849975586, "global_step": 129893, "epoch": 3092} {"train_loss": -6.839094161987305, "global_step": 129894, "epoch": 3092} {"train_loss": -6.766952991485596, "global_step": 129895, "epoch": 3092} {"train_loss": -6.701512813568115, "global_step": 129896, "epoch": 3092} {"train_loss": -6.627223491668701, "global_step": 129897, "epoch": 3092} {"train_loss": -6.703885555267334, "global_step": 129898, "epoch": 3092} {"train_loss": -6.772546768188477, "global_step": 129899, "epoch": 3092} {"train_loss": -6.750230312347412, "global_step": 129900, "epoch": 3092} {"train_loss": -6.620560646057129, "global_step": 129901, "epoch": 3092} {"train_loss": -6.735188007354736, "global_step": 129902, "epoch": 3092} {"train_loss": -6.657598972320557, "global_step": 129903, "epoch": 3092} {"train_loss": -6.671261310577393, "global_step": 129904, "epoch": 3092} {"train_loss": -6.682630028043475, "global_step": 129905, "epoch": 3092, "val_loss": 66222.5546875} {"train_loss": -6.713405609130859, "global_step": 129906, "epoch": 3093} {"train_loss": -6.649319648742676, "global_step": 129907, "epoch": 3093} {"train_loss": -6.790111064910889, "global_step": 129908, "epoch": 3093} {"train_loss": -6.836885452270508, "global_step": 129909, "epoch": 3093} {"train_loss": -6.697926998138428, "global_step": 129910, "epoch": 3093} {"train_loss": -6.614570140838623, "global_step": 129911, "epoch": 3093} {"train_loss": -6.672996520996094, "global_step": 129912, "epoch": 3093} {"train_loss": -6.761573791503906, "global_step": 129913, "epoch": 3093} {"train_loss": -6.701281547546387, "global_step": 129914, "epoch": 3093} {"train_loss": -6.800527572631836, "global_step": 129915, "epoch": 3093} {"train_loss": -6.743845462799072, "global_step": 129916, "epoch": 3093} {"train_loss": -6.676932334899902, "global_step": 129917, "epoch": 3093} {"train_loss": -6.818082332611084, "global_step": 129918, "epoch": 3093} {"train_loss": -6.776234149932861, "global_step": 129919, "epoch": 3093} {"train_loss": -6.688485145568848, "global_step": 129920, "epoch": 3093} {"train_loss": -6.879947662353516, "global_step": 129921, "epoch": 3093} {"train_loss": -6.680048942565918, "global_step": 129922, "epoch": 3093} {"train_loss": -6.7005791664123535, "global_step": 129923, "epoch": 3093} {"train_loss": -6.686850070953369, "global_step": 129924, "epoch": 3093} {"train_loss": -6.708683967590332, "global_step": 129925, "epoch": 3093} {"train_loss": -6.688618183135986, "global_step": 129926, "epoch": 3093} {"train_loss": -6.546666145324707, "global_step": 129927, "epoch": 3093} {"train_loss": -6.6390700340271, "global_step": 129928, "epoch": 3093} {"train_loss": -6.616732597351074, "global_step": 129929, "epoch": 3093} {"train_loss": -6.568873405456543, "global_step": 129930, "epoch": 3093} {"train_loss": -6.603813171386719, "global_step": 129931, "epoch": 3093} {"train_loss": -6.583627700805664, "global_step": 129932, "epoch": 3093} {"train_loss": -6.689462661743164, "global_step": 129933, "epoch": 3093} {"train_loss": -6.672970294952393, "global_step": 129934, "epoch": 3093} {"train_loss": -6.7901930809021, "global_step": 129935, "epoch": 3093} {"train_loss": -6.650162220001221, "global_step": 129936, "epoch": 3093} {"train_loss": -6.755499839782715, "global_step": 129937, "epoch": 3093} {"train_loss": -6.681471347808838, "global_step": 129938, "epoch": 3093} {"train_loss": -6.707450866699219, "global_step": 129939, "epoch": 3093} {"train_loss": -6.738324165344238, "global_step": 129940, "epoch": 3093} {"train_loss": -6.657320022583008, "global_step": 129941, "epoch": 3093} {"train_loss": -6.547967910766602, "global_step": 129942, "epoch": 3093} {"train_loss": -6.615300178527832, "global_step": 129943, "epoch": 3093} {"train_loss": -6.53788423538208, "global_step": 129944, "epoch": 3093} {"train_loss": -6.663745880126953, "global_step": 129945, "epoch": 3093} {"train_loss": -6.709388732910156, "global_step": 129946, "epoch": 3093} {"train_loss": -6.686806519826253, "global_step": 129947, "epoch": 3093, "val_loss": 66420.7578125} {"train_loss": -6.609645843505859, "global_step": 129948, "epoch": 3094} {"train_loss": -6.6885247230529785, "global_step": 129949, "epoch": 3094} {"train_loss": -6.576711177825928, "global_step": 129950, "epoch": 3094} {"train_loss": -6.70237398147583, "global_step": 129951, "epoch": 3094} {"train_loss": -6.632615089416504, "global_step": 129952, "epoch": 3094} {"train_loss": -6.750705718994141, "global_step": 129953, "epoch": 3094} {"train_loss": -6.615338325500488, "global_step": 129954, "epoch": 3094} {"train_loss": -6.635741233825684, "global_step": 129955, "epoch": 3094} {"train_loss": -6.767346382141113, "global_step": 129956, "epoch": 3094} {"train_loss": -6.79076623916626, "global_step": 129957, "epoch": 3094} {"train_loss": -6.689654350280762, "global_step": 129958, "epoch": 3094} {"train_loss": -6.8050689697265625, "global_step": 129959, "epoch": 3094} {"train_loss": -6.794286727905273, "global_step": 129960, "epoch": 3094} {"train_loss": -6.722151756286621, "global_step": 129961, "epoch": 3094} {"train_loss": -6.646561622619629, "global_step": 129962, "epoch": 3094} {"train_loss": -6.674705505371094, "global_step": 129963, "epoch": 3094} {"train_loss": -6.634173393249512, "global_step": 129964, "epoch": 3094} {"train_loss": -6.712428092956543, "global_step": 129965, "epoch": 3094} {"train_loss": -6.671507835388184, "global_step": 129966, "epoch": 3094} {"train_loss": -6.6278557777404785, "global_step": 129967, "epoch": 3094} {"train_loss": -6.780970096588135, "global_step": 129968, "epoch": 3094} {"train_loss": -6.734273910522461, "global_step": 129969, "epoch": 3094} {"train_loss": -6.656731128692627, "global_step": 129970, "epoch": 3094} {"train_loss": -6.724504470825195, "global_step": 129971, "epoch": 3094} {"train_loss": -6.798824310302734, "global_step": 129972, "epoch": 3094} {"train_loss": -6.743068218231201, "global_step": 129973, "epoch": 3094} {"train_loss": -6.773521423339844, "global_step": 129974, "epoch": 3094} {"train_loss": -6.582673072814941, "global_step": 129975, "epoch": 3094} {"train_loss": -6.659173011779785, "global_step": 129976, "epoch": 3094} {"train_loss": -6.687628746032715, "global_step": 129977, "epoch": 3094} {"train_loss": -6.5760369300842285, "global_step": 129978, "epoch": 3094} {"train_loss": -6.584146976470947, "global_step": 129979, "epoch": 3094} {"train_loss": -6.731996536254883, "global_step": 129980, "epoch": 3094} {"train_loss": -6.590666770935059, "global_step": 129981, "epoch": 3094} {"train_loss": -6.630654335021973, "global_step": 129982, "epoch": 3094} {"train_loss": -6.676732063293457, "global_step": 129983, "epoch": 3094} {"train_loss": -6.611722946166992, "global_step": 129984, "epoch": 3094} {"train_loss": -6.536464691162109, "global_step": 129985, "epoch": 3094} {"train_loss": -6.74884033203125, "global_step": 129986, "epoch": 3094} {"train_loss": -6.617826461791992, "global_step": 129987, "epoch": 3094} {"train_loss": -6.6890411376953125, "global_step": 129988, "epoch": 3094} {"train_loss": -6.680868625640869, "global_step": 129989, "epoch": 3094, "val_loss": 66489.9921875} {"train_loss": -6.589197158813477, "global_step": 129990, "epoch": 3095} {"train_loss": -6.647475242614746, "global_step": 129991, "epoch": 3095} {"train_loss": -6.689416885375977, "global_step": 129992, "epoch": 3095} {"train_loss": -6.745853900909424, "global_step": 129993, "epoch": 3095} {"train_loss": -6.61570930480957, "global_step": 129994, "epoch": 3095} {"train_loss": -6.6830949783325195, "global_step": 129995, "epoch": 3095} {"train_loss": -6.7034220695495605, "global_step": 129996, "epoch": 3095} {"train_loss": -6.554881572723389, "global_step": 129997, "epoch": 3095} {"train_loss": -6.6862101554870605, "global_step": 129998, "epoch": 3095} {"train_loss": -6.593901634216309, "global_step": 129999, "epoch": 3095} {"train_loss": -6.64741849899292, "global_step": 130000, "epoch": 3095} {"train_loss": -6.624026775360107, "global_step": 130001, "epoch": 3095} {"train_loss": -6.592256546020508, "global_step": 130002, "epoch": 3095} {"train_loss": -6.713761329650879, "global_step": 130003, "epoch": 3095} {"train_loss": -6.7493696212768555, "global_step": 130004, "epoch": 3095} {"train_loss": -6.68032169342041, "global_step": 130005, "epoch": 3095} {"train_loss": -6.650653839111328, "global_step": 130006, "epoch": 3095} {"train_loss": -6.490224838256836, "global_step": 130007, "epoch": 3095} {"train_loss": -6.560873031616211, "global_step": 130008, "epoch": 3095} {"train_loss": -6.6122894287109375, "global_step": 130009, "epoch": 3095} {"train_loss": -6.6369733810424805, "global_step": 130010, "epoch": 3095} {"train_loss": -6.477224826812744, "global_step": 130011, "epoch": 3095} {"train_loss": -6.64046573638916, "global_step": 130012, "epoch": 3095} {"train_loss": -6.6828999519348145, "global_step": 130013, "epoch": 3095} {"train_loss": -6.6046037673950195, "global_step": 130014, "epoch": 3095} {"train_loss": -6.631721496582031, "global_step": 130015, "epoch": 3095} {"train_loss": -6.696425437927246, "global_step": 130016, "epoch": 3095} {"train_loss": -6.652266502380371, "global_step": 130017, "epoch": 3095} {"train_loss": -6.707376480102539, "global_step": 130018, "epoch": 3095} {"train_loss": -6.640501499176025, "global_step": 130019, "epoch": 3095} {"train_loss": -6.615047931671143, "global_step": 130020, "epoch": 3095} {"train_loss": -6.547355651855469, "global_step": 130021, "epoch": 3095} {"train_loss": -6.583559989929199, "global_step": 130022, "epoch": 3095} {"train_loss": -6.68984317779541, "global_step": 130023, "epoch": 3095} {"train_loss": -6.619746208190918, "global_step": 130024, "epoch": 3095} {"train_loss": -6.523869037628174, "global_step": 130025, "epoch": 3095} {"train_loss": -6.713675022125244, "global_step": 130026, "epoch": 3095} {"train_loss": -6.604837894439697, "global_step": 130027, "epoch": 3095} {"train_loss": -6.57733154296875, "global_step": 130028, "epoch": 3095} {"train_loss": -6.701428413391113, "global_step": 130029, "epoch": 3095} {"train_loss": -6.626983165740967, "global_step": 130030, "epoch": 3095} {"train_loss": -6.63532364936102, "global_step": 130031, "epoch": 3095, "val_loss": 66562.9765625} {"train_loss": -6.783822059631348, "global_step": 130032, "epoch": 3096} {"train_loss": -6.713911056518555, "global_step": 130033, "epoch": 3096} {"train_loss": -6.6058197021484375, "global_step": 130034, "epoch": 3096} {"train_loss": -6.572849273681641, "global_step": 130035, "epoch": 3096} {"train_loss": -6.615777015686035, "global_step": 130036, "epoch": 3096} {"train_loss": -6.638604164123535, "global_step": 130037, "epoch": 3096} {"train_loss": -6.677242755889893, "global_step": 130038, "epoch": 3096} {"train_loss": -6.571319103240967, "global_step": 130039, "epoch": 3096} {"train_loss": -6.6360931396484375, "global_step": 130040, "epoch": 3096} {"train_loss": -6.701799392700195, "global_step": 130041, "epoch": 3096} {"train_loss": -6.68005895614624, "global_step": 130042, "epoch": 3096} {"train_loss": -6.555651664733887, "global_step": 130043, "epoch": 3096} {"train_loss": -6.6810526847839355, "global_step": 130044, "epoch": 3096} {"train_loss": -6.61981201171875, "global_step": 130045, "epoch": 3096} {"train_loss": -6.716108798980713, "global_step": 130046, "epoch": 3096} {"train_loss": -6.717308521270752, "global_step": 130047, "epoch": 3096} {"train_loss": -6.596861839294434, "global_step": 130048, "epoch": 3096} {"train_loss": -6.6770501136779785, "global_step": 130049, "epoch": 3096} {"train_loss": -6.701727867126465, "global_step": 130050, "epoch": 3096} {"train_loss": -6.763988971710205, "global_step": 130051, "epoch": 3096} {"train_loss": -6.576606750488281, "global_step": 130052, "epoch": 3096} {"train_loss": -6.73569393157959, "global_step": 130053, "epoch": 3096} {"train_loss": -6.703475475311279, "global_step": 130054, "epoch": 3096} {"train_loss": -6.713258743286133, "global_step": 130055, "epoch": 3096} {"train_loss": -6.6577630043029785, "global_step": 130056, "epoch": 3096} {"train_loss": -6.6729230880737305, "global_step": 130057, "epoch": 3096} {"train_loss": -6.762523651123047, "global_step": 130058, "epoch": 3096} {"train_loss": -6.647590637207031, "global_step": 130059, "epoch": 3096} {"train_loss": -6.649795055389404, "global_step": 130060, "epoch": 3096} {"train_loss": -6.776932716369629, "global_step": 130061, "epoch": 3096} {"train_loss": -6.612394332885742, "global_step": 130062, "epoch": 3096} {"train_loss": -6.65013313293457, "global_step": 130063, "epoch": 3096} {"train_loss": -6.622087478637695, "global_step": 130064, "epoch": 3096} {"train_loss": -6.745367050170898, "global_step": 130065, "epoch": 3096} {"train_loss": -6.694944381713867, "global_step": 130066, "epoch": 3096} {"train_loss": -6.695112228393555, "global_step": 130067, "epoch": 3096} {"train_loss": -6.710551738739014, "global_step": 130068, "epoch": 3096} {"train_loss": -6.629344463348389, "global_step": 130069, "epoch": 3096} {"train_loss": -6.72387170791626, "global_step": 130070, "epoch": 3096} {"train_loss": -6.628899574279785, "global_step": 130071, "epoch": 3096} {"train_loss": -6.807855129241943, "global_step": 130072, "epoch": 3096} {"train_loss": -6.675630455925351, "global_step": 130073, "epoch": 3096, "val_loss": 66430.5078125} {"train_loss": -6.777862071990967, "global_step": 130074, "epoch": 3097} {"train_loss": -6.708948612213135, "global_step": 130075, "epoch": 3097} {"train_loss": -6.646345138549805, "global_step": 130076, "epoch": 3097} {"train_loss": -6.719424247741699, "global_step": 130077, "epoch": 3097} {"train_loss": -6.706543922424316, "global_step": 130078, "epoch": 3097} {"train_loss": -6.747129917144775, "global_step": 130079, "epoch": 3097} {"train_loss": -6.647287845611572, "global_step": 130080, "epoch": 3097} {"train_loss": -6.739470481872559, "global_step": 130081, "epoch": 3097} {"train_loss": -6.724069595336914, "global_step": 130082, "epoch": 3097} {"train_loss": -6.726874351501465, "global_step": 130083, "epoch": 3097} {"train_loss": -6.803675174713135, "global_step": 130084, "epoch": 3097} {"train_loss": -6.741235733032227, "global_step": 130085, "epoch": 3097} {"train_loss": -6.705266952514648, "global_step": 130086, "epoch": 3097} {"train_loss": -6.708521842956543, "global_step": 130087, "epoch": 3097} {"train_loss": -6.696260452270508, "global_step": 130088, "epoch": 3097} {"train_loss": -6.867749214172363, "global_step": 130089, "epoch": 3097} {"train_loss": -6.613289833068848, "global_step": 130090, "epoch": 3097} {"train_loss": -6.684365272521973, "global_step": 130091, "epoch": 3097} {"train_loss": -6.676344394683838, "global_step": 130092, "epoch": 3097} {"train_loss": -6.605542182922363, "global_step": 130093, "epoch": 3097} {"train_loss": -6.587343215942383, "global_step": 130094, "epoch": 3097} {"train_loss": -6.669430255889893, "global_step": 130095, "epoch": 3097} {"train_loss": -6.6232757568359375, "global_step": 130096, "epoch": 3097} {"train_loss": -6.548160552978516, "global_step": 130097, "epoch": 3097} {"train_loss": -6.66234016418457, "global_step": 130098, "epoch": 3097} {"train_loss": -6.69774866104126, "global_step": 130099, "epoch": 3097} {"train_loss": -6.724002838134766, "global_step": 130100, "epoch": 3097} {"train_loss": -6.721012115478516, "global_step": 130101, "epoch": 3097} {"train_loss": -6.740499973297119, "global_step": 130102, "epoch": 3097} {"train_loss": -6.699750900268555, "global_step": 130103, "epoch": 3097} {"train_loss": -6.658992767333984, "global_step": 130104, "epoch": 3097} {"train_loss": -6.708014011383057, "global_step": 130105, "epoch": 3097} {"train_loss": -6.66696834564209, "global_step": 130106, "epoch": 3097} {"train_loss": -6.8039469718933105, "global_step": 130107, "epoch": 3097} {"train_loss": -6.808079242706299, "global_step": 130108, "epoch": 3097} {"train_loss": -6.581315040588379, "global_step": 130109, "epoch": 3097} {"train_loss": -6.725016117095947, "global_step": 130110, "epoch": 3097} {"train_loss": -6.588652610778809, "global_step": 130111, "epoch": 3097} {"train_loss": -6.6307549476623535, "global_step": 130112, "epoch": 3097} {"train_loss": -6.499579429626465, "global_step": 130113, "epoch": 3097} {"train_loss": -6.603132247924805, "global_step": 130114, "epoch": 3097} {"train_loss": -6.686482736042568, "global_step": 130115, "epoch": 3097, "val_loss": 66498.28125} {"train_loss": -6.617895603179932, "global_step": 130116, "epoch": 3098} {"train_loss": -6.667043685913086, "global_step": 130117, "epoch": 3098} {"train_loss": -6.704462051391602, "global_step": 130118, "epoch": 3098} {"train_loss": -6.649745464324951, "global_step": 130119, "epoch": 3098} {"train_loss": -6.646328449249268, "global_step": 130120, "epoch": 3098} {"train_loss": -6.6599249839782715, "global_step": 130121, "epoch": 3098} {"train_loss": -6.579615116119385, "global_step": 130122, "epoch": 3098} {"train_loss": -6.631385803222656, "global_step": 130123, "epoch": 3098} {"train_loss": -6.557241439819336, "global_step": 130124, "epoch": 3098} {"train_loss": -6.656585693359375, "global_step": 130125, "epoch": 3098} {"train_loss": -6.668733596801758, "global_step": 130126, "epoch": 3098} {"train_loss": -6.687429428100586, "global_step": 130127, "epoch": 3098} {"train_loss": -6.646144390106201, "global_step": 130128, "epoch": 3098} {"train_loss": -6.605658531188965, "global_step": 130129, "epoch": 3098} {"train_loss": -6.676128387451172, "global_step": 130130, "epoch": 3098} {"train_loss": -6.732141494750977, "global_step": 130131, "epoch": 3098} {"train_loss": -6.622928619384766, "global_step": 130132, "epoch": 3098} {"train_loss": -6.611278057098389, "global_step": 130133, "epoch": 3098} {"train_loss": -6.635388374328613, "global_step": 130134, "epoch": 3098} {"train_loss": -6.574066638946533, "global_step": 130135, "epoch": 3098} {"train_loss": -6.6786394119262695, "global_step": 130136, "epoch": 3098} {"train_loss": -6.689477443695068, "global_step": 130137, "epoch": 3098} {"train_loss": -6.711176872253418, "global_step": 130138, "epoch": 3098} {"train_loss": -6.657094955444336, "global_step": 130139, "epoch": 3098} {"train_loss": -6.6405744552612305, "global_step": 130140, "epoch": 3098} {"train_loss": -6.804594039916992, "global_step": 130141, "epoch": 3098} {"train_loss": -6.763576030731201, "global_step": 130142, "epoch": 3098} {"train_loss": -6.63426399230957, "global_step": 130143, "epoch": 3098} {"train_loss": -6.744382381439209, "global_step": 130144, "epoch": 3098} {"train_loss": -6.466939926147461, "global_step": 130145, "epoch": 3098} {"train_loss": -6.7697343826293945, "global_step": 130146, "epoch": 3098} {"train_loss": -6.669334411621094, "global_step": 130147, "epoch": 3098} {"train_loss": -6.604026794433594, "global_step": 130148, "epoch": 3098} {"train_loss": -6.806471347808838, "global_step": 130149, "epoch": 3098} {"train_loss": -6.783758163452148, "global_step": 130150, "epoch": 3098} {"train_loss": -6.66424560546875, "global_step": 130151, "epoch": 3098} {"train_loss": -6.603811740875244, "global_step": 130152, "epoch": 3098} {"train_loss": -6.6405463218688965, "global_step": 130153, "epoch": 3098} {"train_loss": -6.671992301940918, "global_step": 130154, "epoch": 3098} {"train_loss": -6.467012405395508, "global_step": 130155, "epoch": 3098} {"train_loss": -6.652703285217285, "global_step": 130156, "epoch": 3098} {"train_loss": -6.656082925342378, "global_step": 130157, "epoch": 3098, "val_loss": 66566.8046875} {"train_loss": -6.645746231079102, "global_step": 130158, "epoch": 3099} {"train_loss": -6.70380973815918, "global_step": 130159, "epoch": 3099} {"train_loss": -6.750094413757324, "global_step": 130160, "epoch": 3099} {"train_loss": -6.802165985107422, "global_step": 130161, "epoch": 3099} {"train_loss": -6.7642927169799805, "global_step": 130162, "epoch": 3099} {"train_loss": -6.649608135223389, "global_step": 130163, "epoch": 3099} {"train_loss": -6.741060256958008, "global_step": 130164, "epoch": 3099} {"train_loss": -6.691823959350586, "global_step": 130165, "epoch": 3099} {"train_loss": -6.529129981994629, "global_step": 130166, "epoch": 3099} {"train_loss": -6.712664604187012, "global_step": 130167, "epoch": 3099} {"train_loss": -6.746394157409668, "global_step": 130168, "epoch": 3099} {"train_loss": -6.536501407623291, "global_step": 130169, "epoch": 3099} {"train_loss": -6.737573623657227, "global_step": 130170, "epoch": 3099} {"train_loss": -6.579104423522949, "global_step": 130171, "epoch": 3099} {"train_loss": -6.609185218811035, "global_step": 130172, "epoch": 3099} {"train_loss": -6.701102256774902, "global_step": 130173, "epoch": 3099} {"train_loss": -6.6889214515686035, "global_step": 130174, "epoch": 3099} {"train_loss": -6.726429462432861, "global_step": 130175, "epoch": 3099} {"train_loss": -6.723628520965576, "global_step": 130176, "epoch": 3099} {"train_loss": -6.691631317138672, "global_step": 130177, "epoch": 3099} {"train_loss": -6.614516258239746, "global_step": 130178, "epoch": 3099} {"train_loss": -6.611456871032715, "global_step": 130179, "epoch": 3099} {"train_loss": -6.669492721557617, "global_step": 130180, "epoch": 3099} {"train_loss": -6.644558906555176, "global_step": 130181, "epoch": 3099} {"train_loss": -6.687313556671143, "global_step": 130182, "epoch": 3099} {"train_loss": -6.721704483032227, "global_step": 130183, "epoch": 3099} {"train_loss": -6.639640808105469, "global_step": 130184, "epoch": 3099} {"train_loss": -6.691702842712402, "global_step": 130185, "epoch": 3099} {"train_loss": -6.569583892822266, "global_step": 130186, "epoch": 3099} {"train_loss": -6.642692565917969, "global_step": 130187, "epoch": 3099} {"train_loss": -6.6680378913879395, "global_step": 130188, "epoch": 3099} {"train_loss": -6.53242301940918, "global_step": 130189, "epoch": 3099} {"train_loss": -6.636273384094238, "global_step": 130190, "epoch": 3099} {"train_loss": -6.590207099914551, "global_step": 130191, "epoch": 3099} {"train_loss": -6.6436309814453125, "global_step": 130192, "epoch": 3099} {"train_loss": -6.707810401916504, "global_step": 130193, "epoch": 3099} {"train_loss": -6.633058547973633, "global_step": 130194, "epoch": 3099} {"train_loss": -6.628938674926758, "global_step": 130195, "epoch": 3099} {"train_loss": -6.734683990478516, "global_step": 130196, "epoch": 3099} {"train_loss": -6.742031097412109, "global_step": 130197, "epoch": 3099} {"train_loss": -6.804978370666504, "global_step": 130198, "epoch": 3099} {"train_loss": -6.672343288149152, "global_step": 130199, "epoch": 3099, "val_loss": 66374.3984375} {"train_loss": -6.713737964630127, "global_step": 130200, "epoch": 3100} {"train_loss": -6.747186660766602, "global_step": 130201, "epoch": 3100} {"train_loss": -6.685398578643799, "global_step": 130202, "epoch": 3100} {"train_loss": -6.735668182373047, "global_step": 130203, "epoch": 3100} {"train_loss": -6.600147247314453, "global_step": 130204, "epoch": 3100} {"train_loss": -6.753337860107422, "global_step": 130205, "epoch": 3100} {"train_loss": -6.748156547546387, "global_step": 130206, "epoch": 3100} {"train_loss": -6.679980754852295, "global_step": 130207, "epoch": 3100} {"train_loss": -6.882643699645996, "global_step": 130208, "epoch": 3100} {"train_loss": -6.663419723510742, "global_step": 130209, "epoch": 3100} {"train_loss": -6.624585151672363, "global_step": 130210, "epoch": 3100} {"train_loss": -6.659438610076904, "global_step": 130211, "epoch": 3100} {"train_loss": -6.634082794189453, "global_step": 130212, "epoch": 3100} {"train_loss": -6.696807861328125, "global_step": 130213, "epoch": 3100} {"train_loss": -6.6039910316467285, "global_step": 130214, "epoch": 3100} {"train_loss": -6.675037384033203, "global_step": 130215, "epoch": 3100} {"train_loss": -6.820206642150879, "global_step": 130216, "epoch": 3100} {"train_loss": -6.770966529846191, "global_step": 130217, "epoch": 3100} {"train_loss": -6.749567985534668, "global_step": 130218, "epoch": 3100} {"train_loss": -6.6908159255981445, "global_step": 130219, "epoch": 3100} {"train_loss": -6.696860313415527, "global_step": 130220, "epoch": 3100} {"train_loss": -6.665910720825195, "global_step": 130221, "epoch": 3100} {"train_loss": -6.7328925132751465, "global_step": 130222, "epoch": 3100} {"train_loss": -6.743832111358643, "global_step": 130223, "epoch": 3100} {"train_loss": -6.724620342254639, "global_step": 130224, "epoch": 3100} {"train_loss": -6.728551387786865, "global_step": 130225, "epoch": 3100} {"train_loss": -6.709261894226074, "global_step": 130226, "epoch": 3100} {"train_loss": -6.729672431945801, "global_step": 130227, "epoch": 3100} {"train_loss": -6.728871822357178, "global_step": 130228, "epoch": 3100} {"train_loss": -6.750240325927734, "global_step": 130229, "epoch": 3100} {"train_loss": -6.7423200607299805, "global_step": 130230, "epoch": 3100} {"train_loss": -6.770471572875977, "global_step": 130231, "epoch": 3100} {"train_loss": -6.712350845336914, "global_step": 130232, "epoch": 3100} {"train_loss": -6.686530113220215, "global_step": 130233, "epoch": 3100} {"train_loss": -6.815470218658447, "global_step": 130234, "epoch": 3100} {"train_loss": -6.636999607086182, "global_step": 130235, "epoch": 3100} {"train_loss": -6.653312683105469, "global_step": 130236, "epoch": 3100} {"train_loss": -6.733014106750488, "global_step": 130237, "epoch": 3100} {"train_loss": -6.648959159851074, "global_step": 130238, "epoch": 3100} {"train_loss": -6.694785118103027, "global_step": 130239, "epoch": 3100} {"train_loss": -6.65277099609375, "global_step": 130240, "epoch": 3100} {"train_loss": -6.7064573764801025, "global_step": 130241, "epoch": 3100, "train/sim_max_reward_0": 0.19406019058517215, "train/sim_max_reward_1": 0.9400593489212458, "train/sim_max_reward_2": 0.9633928028745351, "train/sim_max_reward_3": 0.9311581187843938, "train/sim_max_reward_4": 0.9030468870533827, "train/sim_max_reward_5": 0.8907138327215044, "test/sim_max_reward_4300000": 0.9492866489885781, "test/sim_max_reward_4300001": 0.6979357892684188, "test/sim_max_reward_4300002": 0.9446027709403105, "test/sim_max_reward_4300003": 0.9248468121593828, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.864508960510853, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.33806621466679393, "test/sim_max_reward_4300008": 0.9279693344349779, "test/sim_max_reward_4300009": 0.9227039679220592, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9433322094233297, "test/sim_max_reward_4300012": 0.8965692483627611, "test/sim_max_reward_4300013": 0.41046238366609794, "test/sim_max_reward_4300014": 0.9623954699035154, "test/sim_max_reward_4300015": 0.9807638652702235, "test/sim_max_reward_4300016": 0.9018513071155989, "test/sim_max_reward_4300017": 0.985984962120851, "test/sim_max_reward_4300018": 0.43583611933385097, "test/sim_max_reward_4300019": 0.18334244095728758, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.3607543843785625, "test/sim_max_reward_4300022": 0.41082703560360206, "test/sim_max_reward_4300023": 1.0, "test/sim_max_reward_4300024": 0.8859959734401779, "test/sim_max_reward_4300025": 0.8769906516060387, "test/sim_max_reward_4300026": 0.13043642759784865, "test/sim_max_reward_4300027": 0.8091167381821637, "test/sim_max_reward_4300028": 0.0019247655848127405, "test/sim_max_reward_4300029": 0.8134606229066718, "test/sim_max_reward_4300030": 0.0, "test/sim_max_reward_4300031": 0.8082015882799678, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.8149484240038882, "test/sim_max_reward_4300034": 0.2842563186840405, "test/sim_max_reward_4300035": 0.5226582146762214, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8505857607059925, "test/sim_max_reward_4300038": 0.5827216489156923, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.8451410763156253, "test/sim_max_reward_4300041": 0.4272596038714626, "test/sim_max_reward_4300042": 0.8854648877012007, "test/sim_max_reward_4300043": 0.16354654546352843, "test/sim_max_reward_4300044": 0.8242535027806076, "test/sim_max_reward_4300045": 0.18390535537481617, "test/sim_max_reward_4300046": 0.8089564281873212, "test/sim_max_reward_4300047": 0.20219069941559803, "test/sim_max_reward_4300048": 0.9247381092796213, "test/sim_max_reward_4300049": 0.10509723548911719, "train/mean_score": 0.8037385301567056, "test/mean_score": 0.6001783744772446, "val_loss": 66473.0859375} {"train_loss": -6.695392608642578, "global_step": 130242, "epoch": 3101} {"train_loss": -6.710936546325684, "global_step": 130243, "epoch": 3101} {"train_loss": -6.689987659454346, "global_step": 130244, "epoch": 3101} {"train_loss": -6.649049758911133, "global_step": 130245, "epoch": 3101} {"train_loss": -6.623773574829102, "global_step": 130246, "epoch": 3101} {"train_loss": -6.618495464324951, "global_step": 130247, "epoch": 3101} {"train_loss": -6.586500644683838, "global_step": 130248, "epoch": 3101} {"train_loss": -6.689731597900391, "global_step": 130249, "epoch": 3101} {"train_loss": -6.627936363220215, "global_step": 130250, "epoch": 3101} {"train_loss": -6.653283596038818, "global_step": 130251, "epoch": 3101} {"train_loss": -6.658518314361572, "global_step": 130252, "epoch": 3101} {"train_loss": -6.569670677185059, "global_step": 130253, "epoch": 3101} {"train_loss": -6.568823337554932, "global_step": 130254, "epoch": 3101} {"train_loss": -6.50730037689209, "global_step": 130255, "epoch": 3101} {"train_loss": -6.54062557220459, "global_step": 130256, "epoch": 3101} {"train_loss": -6.4646477699279785, "global_step": 130257, "epoch": 3101} {"train_loss": -6.6768293380737305, "global_step": 130258, "epoch": 3101} {"train_loss": -6.542014122009277, "global_step": 130259, "epoch": 3101} {"train_loss": -6.599108695983887, "global_step": 130260, "epoch": 3101} {"train_loss": -6.557195663452148, "global_step": 130261, "epoch": 3101} {"train_loss": -6.643027305603027, "global_step": 130262, "epoch": 3101} {"train_loss": -6.659261703491211, "global_step": 130263, "epoch": 3101} {"train_loss": -6.46821928024292, "global_step": 130264, "epoch": 3101} {"train_loss": -6.648385524749756, "global_step": 130265, "epoch": 3101} {"train_loss": -6.617341995239258, "global_step": 130266, "epoch": 3101} {"train_loss": -6.6525349617004395, "global_step": 130267, "epoch": 3101} {"train_loss": -6.5705342292785645, "global_step": 130268, "epoch": 3101} {"train_loss": -6.499689102172852, "global_step": 130269, "epoch": 3101} {"train_loss": -6.552061557769775, "global_step": 130270, "epoch": 3101} {"train_loss": -6.653611183166504, "global_step": 130271, "epoch": 3101} {"train_loss": -6.683501720428467, "global_step": 130272, "epoch": 3101} {"train_loss": -6.6861724853515625, "global_step": 130273, "epoch": 3101} {"train_loss": -6.597867012023926, "global_step": 130274, "epoch": 3101} {"train_loss": -6.740346908569336, "global_step": 130275, "epoch": 3101} {"train_loss": -6.613492965698242, "global_step": 130276, "epoch": 3101} {"train_loss": -6.5128936767578125, "global_step": 130277, "epoch": 3101} {"train_loss": -6.6710710525512695, "global_step": 130278, "epoch": 3101} {"train_loss": -6.712752342224121, "global_step": 130279, "epoch": 3101} {"train_loss": -6.557805061340332, "global_step": 130280, "epoch": 3101} {"train_loss": -6.596385955810547, "global_step": 130281, "epoch": 3101} {"train_loss": -6.635488986968994, "global_step": 130282, "epoch": 3101} {"train_loss": -6.612104018529256, "global_step": 130283, "epoch": 3101, "val_loss": 66514.125} {"train_loss": -6.750241279602051, "global_step": 130284, "epoch": 3102} {"train_loss": -6.695635795593262, "global_step": 130285, "epoch": 3102} {"train_loss": -6.608602046966553, "global_step": 130286, "epoch": 3102} {"train_loss": -6.561257362365723, "global_step": 130287, "epoch": 3102} {"train_loss": -6.609991073608398, "global_step": 130288, "epoch": 3102} {"train_loss": -6.5175018310546875, "global_step": 130289, "epoch": 3102} {"train_loss": -6.643911361694336, "global_step": 130290, "epoch": 3102} {"train_loss": -6.613156318664551, "global_step": 130291, "epoch": 3102} {"train_loss": -6.4426069259643555, "global_step": 130292, "epoch": 3102} {"train_loss": -6.605649948120117, "global_step": 130293, "epoch": 3102} {"train_loss": -6.548801898956299, "global_step": 130294, "epoch": 3102} {"train_loss": -6.682125091552734, "global_step": 130295, "epoch": 3102} {"train_loss": -6.55385684967041, "global_step": 130296, "epoch": 3102} {"train_loss": -6.427879810333252, "global_step": 130297, "epoch": 3102} {"train_loss": -6.564579963684082, "global_step": 130298, "epoch": 3102} {"train_loss": -6.529092311859131, "global_step": 130299, "epoch": 3102} {"train_loss": -6.618569850921631, "global_step": 130300, "epoch": 3102} {"train_loss": -6.4479146003723145, "global_step": 130301, "epoch": 3102} {"train_loss": -6.575345039367676, "global_step": 130302, "epoch": 3102} {"train_loss": -6.49802827835083, "global_step": 130303, "epoch": 3102} {"train_loss": -6.549392223358154, "global_step": 130304, "epoch": 3102} {"train_loss": -6.557150840759277, "global_step": 130305, "epoch": 3102} {"train_loss": -6.481812000274658, "global_step": 130306, "epoch": 3102} {"train_loss": -6.555768966674805, "global_step": 130307, "epoch": 3102} {"train_loss": -6.54312801361084, "global_step": 130308, "epoch": 3102} {"train_loss": -6.558319091796875, "global_step": 130309, "epoch": 3102} {"train_loss": -6.725450038909912, "global_step": 130310, "epoch": 3102} {"train_loss": -6.447941780090332, "global_step": 130311, "epoch": 3102} {"train_loss": -6.602145671844482, "global_step": 130312, "epoch": 3102} {"train_loss": -6.551215171813965, "global_step": 130313, "epoch": 3102} {"train_loss": -6.550564765930176, "global_step": 130314, "epoch": 3102} {"train_loss": -6.572145462036133, "global_step": 130315, "epoch": 3102} {"train_loss": -6.611248970031738, "global_step": 130316, "epoch": 3102} {"train_loss": -6.625222206115723, "global_step": 130317, "epoch": 3102} {"train_loss": -6.631258010864258, "global_step": 130318, "epoch": 3102} {"train_loss": -6.621550559997559, "global_step": 130319, "epoch": 3102} {"train_loss": -6.748266220092773, "global_step": 130320, "epoch": 3102} {"train_loss": -6.708817481994629, "global_step": 130321, "epoch": 3102} {"train_loss": -6.644591808319092, "global_step": 130322, "epoch": 3102} {"train_loss": -6.534414291381836, "global_step": 130323, "epoch": 3102} {"train_loss": -6.697100639343262, "global_step": 130324, "epoch": 3102} {"train_loss": -6.588613192240397, "global_step": 130325, "epoch": 3102, "val_loss": 66481.171875} {"train_loss": -6.722743988037109, "global_step": 130326, "epoch": 3103} {"train_loss": -6.535926342010498, "global_step": 130327, "epoch": 3103} {"train_loss": -6.641691207885742, "global_step": 130328, "epoch": 3103} {"train_loss": -6.71823263168335, "global_step": 130329, "epoch": 3103} {"train_loss": -6.681394100189209, "global_step": 130330, "epoch": 3103} {"train_loss": -6.716188907623291, "global_step": 130331, "epoch": 3103} {"train_loss": -6.7292680740356445, "global_step": 130332, "epoch": 3103} {"train_loss": -6.611649513244629, "global_step": 130333, "epoch": 3103} {"train_loss": -6.664950370788574, "global_step": 130334, "epoch": 3103} {"train_loss": -6.6824750900268555, "global_step": 130335, "epoch": 3103} {"train_loss": -6.7907819747924805, "global_step": 130336, "epoch": 3103} {"train_loss": -6.756141662597656, "global_step": 130337, "epoch": 3103} {"train_loss": -6.691832542419434, "global_step": 130338, "epoch": 3103} {"train_loss": -6.7825517654418945, "global_step": 130339, "epoch": 3103} {"train_loss": -6.786716938018799, "global_step": 130340, "epoch": 3103} {"train_loss": -6.7240681648254395, "global_step": 130341, "epoch": 3103} {"train_loss": -6.625911712646484, "global_step": 130342, "epoch": 3103} {"train_loss": -6.739648818969727, "global_step": 130343, "epoch": 3103} {"train_loss": -6.780831336975098, "global_step": 130344, "epoch": 3103} {"train_loss": -6.752431869506836, "global_step": 130345, "epoch": 3103} {"train_loss": -6.734963417053223, "global_step": 130346, "epoch": 3103} {"train_loss": -6.639896392822266, "global_step": 130347, "epoch": 3103} {"train_loss": -6.770118713378906, "global_step": 130348, "epoch": 3103} {"train_loss": -6.749087810516357, "global_step": 130349, "epoch": 3103} {"train_loss": -6.692238807678223, "global_step": 130350, "epoch": 3103} {"train_loss": -6.642253875732422, "global_step": 130351, "epoch": 3103} {"train_loss": -6.615556716918945, "global_step": 130352, "epoch": 3103} {"train_loss": -6.734150409698486, "global_step": 130353, "epoch": 3103} {"train_loss": -6.760461807250977, "global_step": 130354, "epoch": 3103} {"train_loss": -6.73996639251709, "global_step": 130355, "epoch": 3103} {"train_loss": -6.7126569747924805, "global_step": 130356, "epoch": 3103} {"train_loss": -6.645140171051025, "global_step": 130357, "epoch": 3103} {"train_loss": -6.841203212738037, "global_step": 130358, "epoch": 3103} {"train_loss": -6.666300296783447, "global_step": 130359, "epoch": 3103} {"train_loss": -6.7185540199279785, "global_step": 130360, "epoch": 3103} {"train_loss": -6.85213565826416, "global_step": 130361, "epoch": 3103} {"train_loss": -6.702960968017578, "global_step": 130362, "epoch": 3103} {"train_loss": -6.776515483856201, "global_step": 130363, "epoch": 3103} {"train_loss": -6.651945114135742, "global_step": 130364, "epoch": 3103} {"train_loss": -6.739335536956787, "global_step": 130365, "epoch": 3103} {"train_loss": -6.692089080810547, "global_step": 130366, "epoch": 3103} {"train_loss": -6.713393336250668, "global_step": 130367, "epoch": 3103, "val_loss": 66331.7890625} {"train_loss": -6.7088518142700195, "global_step": 130368, "epoch": 3104} {"train_loss": -6.626614570617676, "global_step": 130369, "epoch": 3104} {"train_loss": -6.585021018981934, "global_step": 130370, "epoch": 3104} {"train_loss": -6.67588996887207, "global_step": 130371, "epoch": 3104} {"train_loss": -6.661686897277832, "global_step": 130372, "epoch": 3104} {"train_loss": -6.6968793869018555, "global_step": 130373, "epoch": 3104} {"train_loss": -6.756553649902344, "global_step": 130374, "epoch": 3104} {"train_loss": -6.7741522789001465, "global_step": 130375, "epoch": 3104} {"train_loss": -6.709280967712402, "global_step": 130376, "epoch": 3104} {"train_loss": -6.702771186828613, "global_step": 130377, "epoch": 3104} {"train_loss": -6.611848831176758, "global_step": 130378, "epoch": 3104} {"train_loss": -6.626401424407959, "global_step": 130379, "epoch": 3104} {"train_loss": -6.669905662536621, "global_step": 130380, "epoch": 3104} {"train_loss": -6.752985000610352, "global_step": 130381, "epoch": 3104} {"train_loss": -6.642038345336914, "global_step": 130382, "epoch": 3104} {"train_loss": -6.716235637664795, "global_step": 130383, "epoch": 3104} {"train_loss": -6.690949440002441, "global_step": 130384, "epoch": 3104} {"train_loss": -6.595671653747559, "global_step": 130385, "epoch": 3104} {"train_loss": -6.684874534606934, "global_step": 130386, "epoch": 3104} {"train_loss": -6.590429306030273, "global_step": 130387, "epoch": 3104} {"train_loss": -6.555780410766602, "global_step": 130388, "epoch": 3104} {"train_loss": -6.6993303298950195, "global_step": 130389, "epoch": 3104} {"train_loss": -6.553019046783447, "global_step": 130390, "epoch": 3104} {"train_loss": -6.556926250457764, "global_step": 130391, "epoch": 3104} {"train_loss": -6.754290580749512, "global_step": 130392, "epoch": 3104} {"train_loss": -6.568391799926758, "global_step": 130393, "epoch": 3104} {"train_loss": -6.66536283493042, "global_step": 130394, "epoch": 3104} {"train_loss": -6.629739284515381, "global_step": 130395, "epoch": 3104} {"train_loss": -6.594175338745117, "global_step": 130396, "epoch": 3104} {"train_loss": -6.589067459106445, "global_step": 130397, "epoch": 3104} {"train_loss": -6.694106101989746, "global_step": 130398, "epoch": 3104} {"train_loss": -6.6460957527160645, "global_step": 130399, "epoch": 3104} {"train_loss": -6.669854164123535, "global_step": 130400, "epoch": 3104} {"train_loss": -6.717879295349121, "global_step": 130401, "epoch": 3104} {"train_loss": -6.495944023132324, "global_step": 130402, "epoch": 3104} {"train_loss": -6.638312339782715, "global_step": 130403, "epoch": 3104} {"train_loss": -6.651704788208008, "global_step": 130404, "epoch": 3104} {"train_loss": -6.616976261138916, "global_step": 130405, "epoch": 3104} {"train_loss": -6.616123199462891, "global_step": 130406, "epoch": 3104} {"train_loss": -6.634471893310547, "global_step": 130407, "epoch": 3104} {"train_loss": -6.712895393371582, "global_step": 130408, "epoch": 3104} {"train_loss": -6.650841429120018, "global_step": 130409, "epoch": 3104, "val_loss": 66907.0078125} {"train_loss": -6.579094886779785, "global_step": 130410, "epoch": 3105} {"train_loss": -6.631039619445801, "global_step": 130411, "epoch": 3105} {"train_loss": -6.587445259094238, "global_step": 130412, "epoch": 3105} {"train_loss": -6.49979829788208, "global_step": 130413, "epoch": 3105} {"train_loss": -6.703132629394531, "global_step": 130414, "epoch": 3105} {"train_loss": -6.495223045349121, "global_step": 130415, "epoch": 3105} {"train_loss": -6.734541893005371, "global_step": 130416, "epoch": 3105} {"train_loss": -6.653566360473633, "global_step": 130417, "epoch": 3105} {"train_loss": -6.620454788208008, "global_step": 130418, "epoch": 3105} {"train_loss": -6.659530162811279, "global_step": 130419, "epoch": 3105} {"train_loss": -6.6424479484558105, "global_step": 130420, "epoch": 3105} {"train_loss": -6.633347511291504, "global_step": 130421, "epoch": 3105} {"train_loss": -6.701788902282715, "global_step": 130422, "epoch": 3105} {"train_loss": -6.599266052246094, "global_step": 130423, "epoch": 3105} {"train_loss": -6.660472393035889, "global_step": 130424, "epoch": 3105} {"train_loss": -6.769791126251221, "global_step": 130425, "epoch": 3105} {"train_loss": -6.784799575805664, "global_step": 130426, "epoch": 3105} {"train_loss": -6.684024333953857, "global_step": 130427, "epoch": 3105} {"train_loss": -6.685413360595703, "global_step": 130428, "epoch": 3105} {"train_loss": -6.7352094650268555, "global_step": 130429, "epoch": 3105} {"train_loss": -6.6739726066589355, "global_step": 130430, "epoch": 3105} {"train_loss": -6.703200340270996, "global_step": 130431, "epoch": 3105} {"train_loss": -6.687981128692627, "global_step": 130432, "epoch": 3105} {"train_loss": -6.68793249130249, "global_step": 130433, "epoch": 3105} {"train_loss": -6.767852783203125, "global_step": 130434, "epoch": 3105} {"train_loss": -6.643182277679443, "global_step": 130435, "epoch": 3105} {"train_loss": -6.773385047912598, "global_step": 130436, "epoch": 3105} {"train_loss": -6.6955790519714355, "global_step": 130437, "epoch": 3105} {"train_loss": -6.757638931274414, "global_step": 130438, "epoch": 3105} {"train_loss": -6.7353973388671875, "global_step": 130439, "epoch": 3105} {"train_loss": -6.716923713684082, "global_step": 130440, "epoch": 3105} {"train_loss": -6.878942012786865, "global_step": 130441, "epoch": 3105} {"train_loss": -6.710624694824219, "global_step": 130442, "epoch": 3105} {"train_loss": -6.73820686340332, "global_step": 130443, "epoch": 3105} {"train_loss": -6.737595558166504, "global_step": 130444, "epoch": 3105} {"train_loss": -6.814166069030762, "global_step": 130445, "epoch": 3105} {"train_loss": -6.723457336425781, "global_step": 130446, "epoch": 3105} {"train_loss": -6.761023998260498, "global_step": 130447, "epoch": 3105} {"train_loss": -6.593055248260498, "global_step": 130448, "epoch": 3105} {"train_loss": -6.686951160430908, "global_step": 130449, "epoch": 3105} {"train_loss": -6.66901969909668, "global_step": 130450, "epoch": 3105} {"train_loss": -6.6898919968377974, "global_step": 130451, "epoch": 3105, "val_loss": 66593.546875} {"train_loss": -6.720859050750732, "global_step": 130452, "epoch": 3106} {"train_loss": -6.7137675285339355, "global_step": 130453, "epoch": 3106} {"train_loss": -6.612800598144531, "global_step": 130454, "epoch": 3106} {"train_loss": -6.652708053588867, "global_step": 130455, "epoch": 3106} {"train_loss": -6.622849464416504, "global_step": 130456, "epoch": 3106} {"train_loss": -6.716651439666748, "global_step": 130457, "epoch": 3106} {"train_loss": -6.693605422973633, "global_step": 130458, "epoch": 3106} {"train_loss": -6.783576488494873, "global_step": 130459, "epoch": 3106} {"train_loss": -6.710709571838379, "global_step": 130460, "epoch": 3106} {"train_loss": -6.666168212890625, "global_step": 130461, "epoch": 3106} {"train_loss": -6.645437240600586, "global_step": 130462, "epoch": 3106} {"train_loss": -6.786367416381836, "global_step": 130463, "epoch": 3106} {"train_loss": -6.693125247955322, "global_step": 130464, "epoch": 3106} {"train_loss": -6.655239105224609, "global_step": 130465, "epoch": 3106} {"train_loss": -6.624569892883301, "global_step": 130466, "epoch": 3106} {"train_loss": -6.612695693969727, "global_step": 130467, "epoch": 3106} {"train_loss": -6.614510536193848, "global_step": 130468, "epoch": 3106} {"train_loss": -6.678625583648682, "global_step": 130469, "epoch": 3106} {"train_loss": -6.717698097229004, "global_step": 130470, "epoch": 3106} {"train_loss": -6.538552284240723, "global_step": 130471, "epoch": 3106} {"train_loss": -6.507856369018555, "global_step": 130472, "epoch": 3106} {"train_loss": -6.616931438446045, "global_step": 130473, "epoch": 3106} {"train_loss": -6.587319850921631, "global_step": 130474, "epoch": 3106} {"train_loss": -6.615597724914551, "global_step": 130475, "epoch": 3106} {"train_loss": -6.69957160949707, "global_step": 130476, "epoch": 3106} {"train_loss": -6.623805522918701, "global_step": 130477, "epoch": 3106} {"train_loss": -6.617500305175781, "global_step": 130478, "epoch": 3106} {"train_loss": -6.651609420776367, "global_step": 130479, "epoch": 3106} {"train_loss": -6.578886032104492, "global_step": 130480, "epoch": 3106} {"train_loss": -6.636380195617676, "global_step": 130481, "epoch": 3106} {"train_loss": -6.680432319641113, "global_step": 130482, "epoch": 3106} {"train_loss": -6.611529350280762, "global_step": 130483, "epoch": 3106} {"train_loss": -6.696744441986084, "global_step": 130484, "epoch": 3106} {"train_loss": -6.510309219360352, "global_step": 130485, "epoch": 3106} {"train_loss": -6.6481451988220215, "global_step": 130486, "epoch": 3106} {"train_loss": -6.6454315185546875, "global_step": 130487, "epoch": 3106} {"train_loss": -6.652825355529785, "global_step": 130488, "epoch": 3106} {"train_loss": -6.695522308349609, "global_step": 130489, "epoch": 3106} {"train_loss": -6.69488525390625, "global_step": 130490, "epoch": 3106} {"train_loss": -6.630867958068848, "global_step": 130491, "epoch": 3106} {"train_loss": -6.6051344871521, "global_step": 130492, "epoch": 3106} {"train_loss": -6.650103500911167, "global_step": 130493, "epoch": 3106, "val_loss": 66571.28125} {"train_loss": -6.48075008392334, "global_step": 130494, "epoch": 3107} {"train_loss": -6.686415672302246, "global_step": 130495, "epoch": 3107} {"train_loss": -6.57372522354126, "global_step": 130496, "epoch": 3107} {"train_loss": -6.825037956237793, "global_step": 130497, "epoch": 3107} {"train_loss": -6.682151794433594, "global_step": 130498, "epoch": 3107} {"train_loss": -6.759558200836182, "global_step": 130499, "epoch": 3107} {"train_loss": -6.686525821685791, "global_step": 130500, "epoch": 3107} {"train_loss": -6.69132137298584, "global_step": 130501, "epoch": 3107} {"train_loss": -6.623933792114258, "global_step": 130502, "epoch": 3107} {"train_loss": -6.643377304077148, "global_step": 130503, "epoch": 3107} {"train_loss": -6.668674945831299, "global_step": 130504, "epoch": 3107} {"train_loss": -6.591200351715088, "global_step": 130505, "epoch": 3107} {"train_loss": -6.611235618591309, "global_step": 130506, "epoch": 3107} {"train_loss": -6.67398738861084, "global_step": 130507, "epoch": 3107} {"train_loss": -6.692173957824707, "global_step": 130508, "epoch": 3107} {"train_loss": -6.7648773193359375, "global_step": 130509, "epoch": 3107} {"train_loss": -6.773181915283203, "global_step": 130510, "epoch": 3107} {"train_loss": -6.58381462097168, "global_step": 130511, "epoch": 3107} {"train_loss": -6.620018482208252, "global_step": 130512, "epoch": 3107} {"train_loss": -6.628846645355225, "global_step": 130513, "epoch": 3107} {"train_loss": -6.649267196655273, "global_step": 130514, "epoch": 3107} {"train_loss": -6.665641784667969, "global_step": 130515, "epoch": 3107} {"train_loss": -6.728658199310303, "global_step": 130516, "epoch": 3107} {"train_loss": -6.669652938842773, "global_step": 130517, "epoch": 3107} {"train_loss": -6.739419937133789, "global_step": 130518, "epoch": 3107} {"train_loss": -6.629205703735352, "global_step": 130519, "epoch": 3107} {"train_loss": -6.7030181884765625, "global_step": 130520, "epoch": 3107} {"train_loss": -6.741645812988281, "global_step": 130521, "epoch": 3107} {"train_loss": -6.745924949645996, "global_step": 130522, "epoch": 3107} {"train_loss": -6.7253947257995605, "global_step": 130523, "epoch": 3107} {"train_loss": -6.634029388427734, "global_step": 130524, "epoch": 3107} {"train_loss": -6.732515335083008, "global_step": 130525, "epoch": 3107} {"train_loss": -6.696714401245117, "global_step": 130526, "epoch": 3107} {"train_loss": -6.661377906799316, "global_step": 130527, "epoch": 3107} {"train_loss": -6.561995029449463, "global_step": 130528, "epoch": 3107} {"train_loss": -6.746634006500244, "global_step": 130529, "epoch": 3107} {"train_loss": -6.727376937866211, "global_step": 130530, "epoch": 3107} {"train_loss": -6.698944091796875, "global_step": 130531, "epoch": 3107} {"train_loss": -6.646392822265625, "global_step": 130532, "epoch": 3107} {"train_loss": -6.6999711990356445, "global_step": 130533, "epoch": 3107} {"train_loss": -6.748538494110107, "global_step": 130534, "epoch": 3107} {"train_loss": -6.682842652002971, "global_step": 130535, "epoch": 3107, "val_loss": 66655.265625} {"train_loss": -6.711368083953857, "global_step": 130536, "epoch": 3108} {"train_loss": -6.723771095275879, "global_step": 130537, "epoch": 3108} {"train_loss": -6.679889678955078, "global_step": 130538, "epoch": 3108} {"train_loss": -6.8192291259765625, "global_step": 130539, "epoch": 3108} {"train_loss": -6.579089164733887, "global_step": 130540, "epoch": 3108} {"train_loss": -6.712930679321289, "global_step": 130541, "epoch": 3108} {"train_loss": -6.628842353820801, "global_step": 130542, "epoch": 3108} {"train_loss": -6.728363037109375, "global_step": 130543, "epoch": 3108} {"train_loss": -6.687717437744141, "global_step": 130544, "epoch": 3108} {"train_loss": -6.669303894042969, "global_step": 130545, "epoch": 3108} {"train_loss": -6.6982269287109375, "global_step": 130546, "epoch": 3108} {"train_loss": -6.570567607879639, "global_step": 130547, "epoch": 3108} {"train_loss": -6.688097953796387, "global_step": 130548, "epoch": 3108} {"train_loss": -6.799065589904785, "global_step": 130549, "epoch": 3108} {"train_loss": -6.729825496673584, "global_step": 130550, "epoch": 3108} {"train_loss": -6.613124847412109, "global_step": 130551, "epoch": 3108} {"train_loss": -6.741270065307617, "global_step": 130552, "epoch": 3108} {"train_loss": -6.723872184753418, "global_step": 130553, "epoch": 3108} {"train_loss": -6.768141746520996, "global_step": 130554, "epoch": 3108} {"train_loss": -6.702785491943359, "global_step": 130555, "epoch": 3108} {"train_loss": -6.7270636558532715, "global_step": 130556, "epoch": 3108} {"train_loss": -6.805510997772217, "global_step": 130557, "epoch": 3108} {"train_loss": -6.641356468200684, "global_step": 130558, "epoch": 3108} {"train_loss": -6.76572847366333, "global_step": 130559, "epoch": 3108} {"train_loss": -6.729454040527344, "global_step": 130560, "epoch": 3108} {"train_loss": -6.766818046569824, "global_step": 130561, "epoch": 3108} {"train_loss": -6.6424407958984375, "global_step": 130562, "epoch": 3108} {"train_loss": -6.654106616973877, "global_step": 130563, "epoch": 3108} {"train_loss": -6.585765838623047, "global_step": 130564, "epoch": 3108} {"train_loss": -6.628801345825195, "global_step": 130565, "epoch": 3108} {"train_loss": -6.704683780670166, "global_step": 130566, "epoch": 3108} {"train_loss": -6.748976707458496, "global_step": 130567, "epoch": 3108} {"train_loss": -6.704800605773926, "global_step": 130568, "epoch": 3108} {"train_loss": -6.603960990905762, "global_step": 130569, "epoch": 3108} {"train_loss": -6.793727874755859, "global_step": 130570, "epoch": 3108} {"train_loss": -6.7021918296813965, "global_step": 130571, "epoch": 3108} {"train_loss": -6.722307205200195, "global_step": 130572, "epoch": 3108} {"train_loss": -6.714855670928955, "global_step": 130573, "epoch": 3108} {"train_loss": -6.693288803100586, "global_step": 130574, "epoch": 3108} {"train_loss": -6.757560729980469, "global_step": 130575, "epoch": 3108} {"train_loss": -6.663452625274658, "global_step": 130576, "epoch": 3108} {"train_loss": -6.698683670588902, "global_step": 130577, "epoch": 3108, "val_loss": 66691.171875} {"train_loss": -6.719671726226807, "global_step": 130578, "epoch": 3109} {"train_loss": -6.69167423248291, "global_step": 130579, "epoch": 3109} {"train_loss": -6.744150161743164, "global_step": 130580, "epoch": 3109} {"train_loss": -6.666171073913574, "global_step": 130581, "epoch": 3109} {"train_loss": -6.810034275054932, "global_step": 130582, "epoch": 3109} {"train_loss": -6.845070838928223, "global_step": 130583, "epoch": 3109} {"train_loss": -6.786005020141602, "global_step": 130584, "epoch": 3109} {"train_loss": -6.76249885559082, "global_step": 130585, "epoch": 3109} {"train_loss": -6.67461633682251, "global_step": 130586, "epoch": 3109} {"train_loss": -6.722488880157471, "global_step": 130587, "epoch": 3109} {"train_loss": -6.700545310974121, "global_step": 130588, "epoch": 3109} {"train_loss": -6.71431827545166, "global_step": 130589, "epoch": 3109} {"train_loss": -6.749686241149902, "global_step": 130590, "epoch": 3109} {"train_loss": -6.7388505935668945, "global_step": 130591, "epoch": 3109} {"train_loss": -6.788565635681152, "global_step": 130592, "epoch": 3109} {"train_loss": -6.736082553863525, "global_step": 130593, "epoch": 3109} {"train_loss": -6.60142183303833, "global_step": 130594, "epoch": 3109} {"train_loss": -6.713729381561279, "global_step": 130595, "epoch": 3109} {"train_loss": -6.685614585876465, "global_step": 130596, "epoch": 3109} {"train_loss": -6.646875381469727, "global_step": 130597, "epoch": 3109} {"train_loss": -6.697009563446045, "global_step": 130598, "epoch": 3109} {"train_loss": -6.554818153381348, "global_step": 130599, "epoch": 3109} {"train_loss": -6.674408912658691, "global_step": 130600, "epoch": 3109} {"train_loss": -6.670060157775879, "global_step": 130601, "epoch": 3109} {"train_loss": -6.657595157623291, "global_step": 130602, "epoch": 3109} {"train_loss": -6.7550950050354, "global_step": 130603, "epoch": 3109} {"train_loss": -6.728776931762695, "global_step": 130604, "epoch": 3109} {"train_loss": -6.656670093536377, "global_step": 130605, "epoch": 3109} {"train_loss": -6.721549034118652, "global_step": 130606, "epoch": 3109} {"train_loss": -6.542259216308594, "global_step": 130607, "epoch": 3109} {"train_loss": -6.674604415893555, "global_step": 130608, "epoch": 3109} {"train_loss": -6.645394325256348, "global_step": 130609, "epoch": 3109} {"train_loss": -6.71260404586792, "global_step": 130610, "epoch": 3109} {"train_loss": -6.533970832824707, "global_step": 130611, "epoch": 3109} {"train_loss": -6.743034362792969, "global_step": 130612, "epoch": 3109} {"train_loss": -6.628859519958496, "global_step": 130613, "epoch": 3109} {"train_loss": -6.6042070388793945, "global_step": 130614, "epoch": 3109} {"train_loss": -6.678245544433594, "global_step": 130615, "epoch": 3109} {"train_loss": -6.611599922180176, "global_step": 130616, "epoch": 3109} {"train_loss": -6.612123012542725, "global_step": 130617, "epoch": 3109} {"train_loss": -6.652416229248047, "global_step": 130618, "epoch": 3109} {"train_loss": -6.689114423025222, "global_step": 130619, "epoch": 3109, "val_loss": 66590.515625} {"train_loss": -6.657023906707764, "global_step": 130620, "epoch": 3110} {"train_loss": -6.581167221069336, "global_step": 130621, "epoch": 3110} {"train_loss": -6.729940891265869, "global_step": 130622, "epoch": 3110} {"train_loss": -6.664705753326416, "global_step": 130623, "epoch": 3110} {"train_loss": -6.533267974853516, "global_step": 130624, "epoch": 3110} {"train_loss": -6.68247652053833, "global_step": 130625, "epoch": 3110} {"train_loss": -6.69114875793457, "global_step": 130626, "epoch": 3110} {"train_loss": -6.60244607925415, "global_step": 130627, "epoch": 3110} {"train_loss": -6.697747230529785, "global_step": 130628, "epoch": 3110} {"train_loss": -6.570956707000732, "global_step": 130629, "epoch": 3110} {"train_loss": -6.578600883483887, "global_step": 130630, "epoch": 3110} {"train_loss": -6.751786231994629, "global_step": 130631, "epoch": 3110} {"train_loss": -6.665789604187012, "global_step": 130632, "epoch": 3110} {"train_loss": -6.582286834716797, "global_step": 130633, "epoch": 3110} {"train_loss": -6.654952049255371, "global_step": 130634, "epoch": 3110} {"train_loss": -6.651309013366699, "global_step": 130635, "epoch": 3110} {"train_loss": -6.638832092285156, "global_step": 130636, "epoch": 3110} {"train_loss": -6.5873870849609375, "global_step": 130637, "epoch": 3110} {"train_loss": -6.484813213348389, "global_step": 130638, "epoch": 3110} {"train_loss": -6.635962009429932, "global_step": 130639, "epoch": 3110} {"train_loss": -6.594951152801514, "global_step": 130640, "epoch": 3110} {"train_loss": -6.747092247009277, "global_step": 130641, "epoch": 3110} {"train_loss": -6.588117599487305, "global_step": 130642, "epoch": 3110} {"train_loss": -6.6207170486450195, "global_step": 130643, "epoch": 3110} {"train_loss": -6.5503716468811035, "global_step": 130644, "epoch": 3110} {"train_loss": -6.544881343841553, "global_step": 130645, "epoch": 3110} {"train_loss": -6.568393707275391, "global_step": 130646, "epoch": 3110} {"train_loss": -6.533561706542969, "global_step": 130647, "epoch": 3110} {"train_loss": -6.587538242340088, "global_step": 130648, "epoch": 3110} {"train_loss": -6.7317609786987305, "global_step": 130649, "epoch": 3110} {"train_loss": -6.666147232055664, "global_step": 130650, "epoch": 3110} {"train_loss": -6.6860833168029785, "global_step": 130651, "epoch": 3110} {"train_loss": -6.617990970611572, "global_step": 130652, "epoch": 3110} {"train_loss": -6.6298747062683105, "global_step": 130653, "epoch": 3110} {"train_loss": -6.655601978302002, "global_step": 130654, "epoch": 3110} {"train_loss": -6.701088905334473, "global_step": 130655, "epoch": 3110} {"train_loss": -6.799402236938477, "global_step": 130656, "epoch": 3110} {"train_loss": -6.76222562789917, "global_step": 130657, "epoch": 3110} {"train_loss": -6.580991744995117, "global_step": 130658, "epoch": 3110} {"train_loss": -6.633753776550293, "global_step": 130659, "epoch": 3110} {"train_loss": -6.694119453430176, "global_step": 130660, "epoch": 3110} {"train_loss": -6.634203468050275, "global_step": 130661, "epoch": 3110, "val_loss": 66466.3046875} {"train_loss": -6.713850021362305, "global_step": 130662, "epoch": 3111} {"train_loss": -6.842047691345215, "global_step": 130663, "epoch": 3111} {"train_loss": -6.759396553039551, "global_step": 130664, "epoch": 3111} {"train_loss": -6.697928428649902, "global_step": 130665, "epoch": 3111} {"train_loss": -6.72830057144165, "global_step": 130666, "epoch": 3111} {"train_loss": -6.7542524337768555, "global_step": 130667, "epoch": 3111} {"train_loss": -6.7089996337890625, "global_step": 130668, "epoch": 3111} {"train_loss": -6.677037715911865, "global_step": 130669, "epoch": 3111} {"train_loss": -6.748805999755859, "global_step": 130670, "epoch": 3111} {"train_loss": -6.662252426147461, "global_step": 130671, "epoch": 3111} {"train_loss": -6.594447135925293, "global_step": 130672, "epoch": 3111} {"train_loss": -6.766336441040039, "global_step": 130673, "epoch": 3111} {"train_loss": -6.581721782684326, "global_step": 130674, "epoch": 3111} {"train_loss": -6.708556175231934, "global_step": 130675, "epoch": 3111} {"train_loss": -6.660408020019531, "global_step": 130676, "epoch": 3111} {"train_loss": -6.490699768066406, "global_step": 130677, "epoch": 3111} {"train_loss": -6.624599456787109, "global_step": 130678, "epoch": 3111} {"train_loss": -6.686095237731934, "global_step": 130679, "epoch": 3111} {"train_loss": -6.5475006103515625, "global_step": 130680, "epoch": 3111} {"train_loss": -6.765841484069824, "global_step": 130681, "epoch": 3111} {"train_loss": -6.707942962646484, "global_step": 130682, "epoch": 3111} {"train_loss": -6.550717353820801, "global_step": 130683, "epoch": 3111} {"train_loss": -6.737871170043945, "global_step": 130684, "epoch": 3111} {"train_loss": -6.57158899307251, "global_step": 130685, "epoch": 3111} {"train_loss": -6.655506610870361, "global_step": 130686, "epoch": 3111} {"train_loss": -6.660739898681641, "global_step": 130687, "epoch": 3111} {"train_loss": -6.642468452453613, "global_step": 130688, "epoch": 3111} {"train_loss": -6.691816806793213, "global_step": 130689, "epoch": 3111} {"train_loss": -6.64772891998291, "global_step": 130690, "epoch": 3111} {"train_loss": -6.718392372131348, "global_step": 130691, "epoch": 3111} {"train_loss": -6.671635627746582, "global_step": 130692, "epoch": 3111} {"train_loss": -6.745269298553467, "global_step": 130693, "epoch": 3111} {"train_loss": -6.73358154296875, "global_step": 130694, "epoch": 3111} {"train_loss": -6.562628746032715, "global_step": 130695, "epoch": 3111} {"train_loss": -6.611652374267578, "global_step": 130696, "epoch": 3111} {"train_loss": -6.7669267654418945, "global_step": 130697, "epoch": 3111} {"train_loss": -6.774781227111816, "global_step": 130698, "epoch": 3111} {"train_loss": -6.733864784240723, "global_step": 130699, "epoch": 3111} {"train_loss": -6.550251007080078, "global_step": 130700, "epoch": 3111} {"train_loss": -6.729829788208008, "global_step": 130701, "epoch": 3111} {"train_loss": -6.732091903686523, "global_step": 130702, "epoch": 3111} {"train_loss": -6.67791535740807, "global_step": 130703, "epoch": 3111, "val_loss": 66745.53125} {"train_loss": -6.587841033935547, "global_step": 130704, "epoch": 3112} {"train_loss": -6.575063705444336, "global_step": 130705, "epoch": 3112} {"train_loss": -6.536100387573242, "global_step": 130706, "epoch": 3112} {"train_loss": -6.6290154457092285, "global_step": 130707, "epoch": 3112} {"train_loss": -6.552838325500488, "global_step": 130708, "epoch": 3112} {"train_loss": -6.726752281188965, "global_step": 130709, "epoch": 3112} {"train_loss": -6.52470588684082, "global_step": 130710, "epoch": 3112} {"train_loss": -6.655550003051758, "global_step": 130711, "epoch": 3112} {"train_loss": -6.680721282958984, "global_step": 130712, "epoch": 3112} {"train_loss": -6.545706272125244, "global_step": 130713, "epoch": 3112} {"train_loss": -6.678555488586426, "global_step": 130714, "epoch": 3112} {"train_loss": -6.6691508293151855, "global_step": 130715, "epoch": 3112} {"train_loss": -6.604454517364502, "global_step": 130716, "epoch": 3112} {"train_loss": -6.657530784606934, "global_step": 130717, "epoch": 3112} {"train_loss": -6.671004772186279, "global_step": 130718, "epoch": 3112} {"train_loss": -6.7058868408203125, "global_step": 130719, "epoch": 3112} {"train_loss": -6.622066974639893, "global_step": 130720, "epoch": 3112} {"train_loss": -6.60518741607666, "global_step": 130721, "epoch": 3112} {"train_loss": -6.642992973327637, "global_step": 130722, "epoch": 3112} {"train_loss": -6.602114677429199, "global_step": 130723, "epoch": 3112} {"train_loss": -6.681591033935547, "global_step": 130724, "epoch": 3112} {"train_loss": -6.6271257400512695, "global_step": 130725, "epoch": 3112} {"train_loss": -6.552195072174072, "global_step": 130726, "epoch": 3112} {"train_loss": -6.5863356590271, "global_step": 130727, "epoch": 3112} {"train_loss": -6.642386436462402, "global_step": 130728, "epoch": 3112} {"train_loss": -6.583432197570801, "global_step": 130729, "epoch": 3112} {"train_loss": -6.668291091918945, "global_step": 130730, "epoch": 3112} {"train_loss": -6.687797546386719, "global_step": 130731, "epoch": 3112} {"train_loss": -6.683905124664307, "global_step": 130732, "epoch": 3112} {"train_loss": -6.700498580932617, "global_step": 130733, "epoch": 3112} {"train_loss": -6.67131233215332, "global_step": 130734, "epoch": 3112} {"train_loss": -6.772696495056152, "global_step": 130735, "epoch": 3112} {"train_loss": -6.730446815490723, "global_step": 130736, "epoch": 3112} {"train_loss": -6.784375190734863, "global_step": 130737, "epoch": 3112} {"train_loss": -6.624828815460205, "global_step": 130738, "epoch": 3112} {"train_loss": -6.684639930725098, "global_step": 130739, "epoch": 3112} {"train_loss": -6.719071865081787, "global_step": 130740, "epoch": 3112} {"train_loss": -6.547730445861816, "global_step": 130741, "epoch": 3112} {"train_loss": -6.736823081970215, "global_step": 130742, "epoch": 3112} {"train_loss": -6.542552947998047, "global_step": 130743, "epoch": 3112} {"train_loss": -6.570858001708984, "global_step": 130744, "epoch": 3112} {"train_loss": -6.642721800577073, "global_step": 130745, "epoch": 3112, "val_loss": 66425.2109375} {"train_loss": -6.543663024902344, "global_step": 130746, "epoch": 3113} {"train_loss": -6.698861122131348, "global_step": 130747, "epoch": 3113} {"train_loss": -6.553057670593262, "global_step": 130748, "epoch": 3113} {"train_loss": -6.615954875946045, "global_step": 130749, "epoch": 3113} {"train_loss": -6.5375590324401855, "global_step": 130750, "epoch": 3113} {"train_loss": -6.708711624145508, "global_step": 130751, "epoch": 3113} {"train_loss": -6.677773952484131, "global_step": 130752, "epoch": 3113} {"train_loss": -6.619793891906738, "global_step": 130753, "epoch": 3113} {"train_loss": -6.658339500427246, "global_step": 130754, "epoch": 3113} {"train_loss": -6.431703567504883, "global_step": 130755, "epoch": 3113} {"train_loss": -6.5866193771362305, "global_step": 130756, "epoch": 3113} {"train_loss": -6.63780403137207, "global_step": 130757, "epoch": 3113} {"train_loss": -6.634022235870361, "global_step": 130758, "epoch": 3113} {"train_loss": -6.6856465339660645, "global_step": 130759, "epoch": 3113} {"train_loss": -6.588769912719727, "global_step": 130760, "epoch": 3113} {"train_loss": -6.551495552062988, "global_step": 130761, "epoch": 3113} {"train_loss": -6.487675189971924, "global_step": 130762, "epoch": 3113} {"train_loss": -6.640054225921631, "global_step": 130763, "epoch": 3113} {"train_loss": -6.425711631774902, "global_step": 130764, "epoch": 3113} {"train_loss": -6.521732330322266, "global_step": 130765, "epoch": 3113} {"train_loss": -6.719405174255371, "global_step": 130766, "epoch": 3113} {"train_loss": -6.512004852294922, "global_step": 130767, "epoch": 3113} {"train_loss": -6.726345539093018, "global_step": 130768, "epoch": 3113} {"train_loss": -6.631248950958252, "global_step": 130769, "epoch": 3113} {"train_loss": -6.648441314697266, "global_step": 130770, "epoch": 3113} {"train_loss": -6.712982177734375, "global_step": 130771, "epoch": 3113} {"train_loss": -6.564883232116699, "global_step": 130772, "epoch": 3113} {"train_loss": -6.596426010131836, "global_step": 130773, "epoch": 3113} {"train_loss": -6.6827239990234375, "global_step": 130774, "epoch": 3113} {"train_loss": -6.753133773803711, "global_step": 130775, "epoch": 3113} {"train_loss": -6.489155292510986, "global_step": 130776, "epoch": 3113} {"train_loss": -6.717986106872559, "global_step": 130777, "epoch": 3113} {"train_loss": -6.537269592285156, "global_step": 130778, "epoch": 3113} {"train_loss": -6.695395469665527, "global_step": 130779, "epoch": 3113} {"train_loss": -6.74245548248291, "global_step": 130780, "epoch": 3113} {"train_loss": -6.6951584815979, "global_step": 130781, "epoch": 3113} {"train_loss": -6.511632442474365, "global_step": 130782, "epoch": 3113} {"train_loss": -6.619113445281982, "global_step": 130783, "epoch": 3113} {"train_loss": -6.6558637619018555, "global_step": 130784, "epoch": 3113} {"train_loss": -6.508267879486084, "global_step": 130785, "epoch": 3113} {"train_loss": -6.678553104400635, "global_step": 130786, "epoch": 3113} {"train_loss": -6.615632488614037, "global_step": 130787, "epoch": 3113, "val_loss": 66648.6953125} {"train_loss": -6.588349342346191, "global_step": 130788, "epoch": 3114} {"train_loss": -6.617412090301514, "global_step": 130789, "epoch": 3114} {"train_loss": -6.72255802154541, "global_step": 130790, "epoch": 3114} {"train_loss": -6.617096900939941, "global_step": 130791, "epoch": 3114} {"train_loss": -6.723467826843262, "global_step": 130792, "epoch": 3114} {"train_loss": -6.599648475646973, "global_step": 130793, "epoch": 3114} {"train_loss": -6.6061601638793945, "global_step": 130794, "epoch": 3114} {"train_loss": -6.709394931793213, "global_step": 130795, "epoch": 3114} {"train_loss": -6.606544494628906, "global_step": 130796, "epoch": 3114} {"train_loss": -6.669033050537109, "global_step": 130797, "epoch": 3114} {"train_loss": -6.725977897644043, "global_step": 130798, "epoch": 3114} {"train_loss": -6.622252941131592, "global_step": 130799, "epoch": 3114} {"train_loss": -6.665946006774902, "global_step": 130800, "epoch": 3114} {"train_loss": -6.629338264465332, "global_step": 130801, "epoch": 3114} {"train_loss": -6.643457889556885, "global_step": 130802, "epoch": 3114} {"train_loss": -6.677342414855957, "global_step": 130803, "epoch": 3114} {"train_loss": -6.596714496612549, "global_step": 130804, "epoch": 3114} {"train_loss": -6.6762495040893555, "global_step": 130805, "epoch": 3114} {"train_loss": -6.681762218475342, "global_step": 130806, "epoch": 3114} {"train_loss": -6.655757427215576, "global_step": 130807, "epoch": 3114} {"train_loss": -6.766493797302246, "global_step": 130808, "epoch": 3114} {"train_loss": -6.681614875793457, "global_step": 130809, "epoch": 3114} {"train_loss": -6.685720443725586, "global_step": 130810, "epoch": 3114} {"train_loss": -6.730276584625244, "global_step": 130811, "epoch": 3114} {"train_loss": -6.6978983879089355, "global_step": 130812, "epoch": 3114} {"train_loss": -6.607276916503906, "global_step": 130813, "epoch": 3114} {"train_loss": -6.726852893829346, "global_step": 130814, "epoch": 3114} {"train_loss": -6.67208194732666, "global_step": 130815, "epoch": 3114} {"train_loss": -6.646058082580566, "global_step": 130816, "epoch": 3114} {"train_loss": -6.701603889465332, "global_step": 130817, "epoch": 3114} {"train_loss": -6.740727424621582, "global_step": 130818, "epoch": 3114} {"train_loss": -6.613675117492676, "global_step": 130819, "epoch": 3114} {"train_loss": -6.760549068450928, "global_step": 130820, "epoch": 3114} {"train_loss": -6.626232147216797, "global_step": 130821, "epoch": 3114} {"train_loss": -6.648225784301758, "global_step": 130822, "epoch": 3114} {"train_loss": -6.677848815917969, "global_step": 130823, "epoch": 3114} {"train_loss": -6.513075828552246, "global_step": 130824, "epoch": 3114} {"train_loss": -6.668213844299316, "global_step": 130825, "epoch": 3114} {"train_loss": -6.714657783508301, "global_step": 130826, "epoch": 3114} {"train_loss": -6.69215726852417, "global_step": 130827, "epoch": 3114} {"train_loss": -6.755283832550049, "global_step": 130828, "epoch": 3114} {"train_loss": -6.667239938463483, "global_step": 130829, "epoch": 3114, "val_loss": 66571.3046875} {"train_loss": -6.686334133148193, "global_step": 130830, "epoch": 3115} {"train_loss": -6.536655426025391, "global_step": 130831, "epoch": 3115} {"train_loss": -6.632184982299805, "global_step": 130832, "epoch": 3115} {"train_loss": -6.711235046386719, "global_step": 130833, "epoch": 3115} {"train_loss": -6.630620002746582, "global_step": 130834, "epoch": 3115} {"train_loss": -6.727353096008301, "global_step": 130835, "epoch": 3115} {"train_loss": -6.709551811218262, "global_step": 130836, "epoch": 3115} {"train_loss": -6.722268104553223, "global_step": 130837, "epoch": 3115} {"train_loss": -6.740747451782227, "global_step": 130838, "epoch": 3115} {"train_loss": -6.727485656738281, "global_step": 130839, "epoch": 3115} {"train_loss": -6.722340106964111, "global_step": 130840, "epoch": 3115} {"train_loss": -6.6042799949646, "global_step": 130841, "epoch": 3115} {"train_loss": -6.707355976104736, "global_step": 130842, "epoch": 3115} {"train_loss": -6.749607086181641, "global_step": 130843, "epoch": 3115} {"train_loss": -6.656188011169434, "global_step": 130844, "epoch": 3115} {"train_loss": -6.829419136047363, "global_step": 130845, "epoch": 3115} {"train_loss": -6.6901140213012695, "global_step": 130846, "epoch": 3115} {"train_loss": -6.651528358459473, "global_step": 130847, "epoch": 3115} {"train_loss": -6.7989397048950195, "global_step": 130848, "epoch": 3115} {"train_loss": -6.678068161010742, "global_step": 130849, "epoch": 3115} {"train_loss": -6.679742813110352, "global_step": 130850, "epoch": 3115} {"train_loss": -6.745976448059082, "global_step": 130851, "epoch": 3115} {"train_loss": -6.5834736824035645, "global_step": 130852, "epoch": 3115} {"train_loss": -6.7585015296936035, "global_step": 130853, "epoch": 3115} {"train_loss": -6.654211521148682, "global_step": 130854, "epoch": 3115} {"train_loss": -6.653173923492432, "global_step": 130855, "epoch": 3115} {"train_loss": -6.620141983032227, "global_step": 130856, "epoch": 3115} {"train_loss": -6.586197376251221, "global_step": 130857, "epoch": 3115} {"train_loss": -6.731719970703125, "global_step": 130858, "epoch": 3115} {"train_loss": -6.746589660644531, "global_step": 130859, "epoch": 3115} {"train_loss": -6.698390007019043, "global_step": 130860, "epoch": 3115} {"train_loss": -6.645644187927246, "global_step": 130861, "epoch": 3115} {"train_loss": -6.739036560058594, "global_step": 130862, "epoch": 3115} {"train_loss": -6.670783996582031, "global_step": 130863, "epoch": 3115} {"train_loss": -6.624965667724609, "global_step": 130864, "epoch": 3115} {"train_loss": -6.691845893859863, "global_step": 130865, "epoch": 3115} {"train_loss": -6.705447196960449, "global_step": 130866, "epoch": 3115} {"train_loss": -6.823251724243164, "global_step": 130867, "epoch": 3115} {"train_loss": -6.679231643676758, "global_step": 130868, "epoch": 3115} {"train_loss": -6.674185752868652, "global_step": 130869, "epoch": 3115} {"train_loss": -6.710604667663574, "global_step": 130870, "epoch": 3115} {"train_loss": -6.68948092914763, "global_step": 130871, "epoch": 3115, "val_loss": 66556.0859375} {"train_loss": -6.67228364944458, "global_step": 130872, "epoch": 3116} {"train_loss": -6.692978858947754, "global_step": 130873, "epoch": 3116} {"train_loss": -6.606820106506348, "global_step": 130874, "epoch": 3116} {"train_loss": -6.649078369140625, "global_step": 130875, "epoch": 3116} {"train_loss": -6.672366142272949, "global_step": 130876, "epoch": 3116} {"train_loss": -6.687360763549805, "global_step": 130877, "epoch": 3116} {"train_loss": -6.597659587860107, "global_step": 130878, "epoch": 3116} {"train_loss": -6.645167827606201, "global_step": 130879, "epoch": 3116} {"train_loss": -6.715259552001953, "global_step": 130880, "epoch": 3116} {"train_loss": -6.616177558898926, "global_step": 130881, "epoch": 3116} {"train_loss": -6.627497673034668, "global_step": 130882, "epoch": 3116} {"train_loss": -6.710984706878662, "global_step": 130883, "epoch": 3116} {"train_loss": -6.59628963470459, "global_step": 130884, "epoch": 3116} {"train_loss": -6.5862932205200195, "global_step": 130885, "epoch": 3116} {"train_loss": -6.558731555938721, "global_step": 130886, "epoch": 3116} {"train_loss": -6.748789310455322, "global_step": 130887, "epoch": 3116} {"train_loss": -6.73381233215332, "global_step": 130888, "epoch": 3116} {"train_loss": -6.53803825378418, "global_step": 130889, "epoch": 3116} {"train_loss": -6.688063621520996, "global_step": 130890, "epoch": 3116} {"train_loss": -6.662471771240234, "global_step": 130891, "epoch": 3116} {"train_loss": -6.72929048538208, "global_step": 130892, "epoch": 3116} {"train_loss": -6.644308090209961, "global_step": 130893, "epoch": 3116} {"train_loss": -6.7150373458862305, "global_step": 130894, "epoch": 3116} {"train_loss": -6.644346237182617, "global_step": 130895, "epoch": 3116} {"train_loss": -6.6884965896606445, "global_step": 130896, "epoch": 3116} {"train_loss": -6.707996368408203, "global_step": 130897, "epoch": 3116} {"train_loss": -6.807435989379883, "global_step": 130898, "epoch": 3116} {"train_loss": -6.622798919677734, "global_step": 130899, "epoch": 3116} {"train_loss": -6.700184345245361, "global_step": 130900, "epoch": 3116} {"train_loss": -6.708067893981934, "global_step": 130901, "epoch": 3116} {"train_loss": -6.731776237487793, "global_step": 130902, "epoch": 3116} {"train_loss": -6.680593013763428, "global_step": 130903, "epoch": 3116} {"train_loss": -6.66507625579834, "global_step": 130904, "epoch": 3116} {"train_loss": -6.73719596862793, "global_step": 130905, "epoch": 3116} {"train_loss": -6.593918800354004, "global_step": 130906, "epoch": 3116} {"train_loss": -6.695417404174805, "global_step": 130907, "epoch": 3116} {"train_loss": -6.748778343200684, "global_step": 130908, "epoch": 3116} {"train_loss": -6.695250988006592, "global_step": 130909, "epoch": 3116} {"train_loss": -6.57794189453125, "global_step": 130910, "epoch": 3116} {"train_loss": -6.617709159851074, "global_step": 130911, "epoch": 3116} {"train_loss": -6.787929058074951, "global_step": 130912, "epoch": 3116} {"train_loss": -6.6707288310641335, "global_step": 130913, "epoch": 3116, "val_loss": 66593.8046875} {"train_loss": -6.776851654052734, "global_step": 130914, "epoch": 3117} {"train_loss": -6.6520586013793945, "global_step": 130915, "epoch": 3117} {"train_loss": -6.717105388641357, "global_step": 130916, "epoch": 3117} {"train_loss": -6.58413553237915, "global_step": 130917, "epoch": 3117} {"train_loss": -6.722049236297607, "global_step": 130918, "epoch": 3117} {"train_loss": -6.548768997192383, "global_step": 130919, "epoch": 3117} {"train_loss": -6.702516078948975, "global_step": 130920, "epoch": 3117} {"train_loss": -6.697457313537598, "global_step": 130921, "epoch": 3117} {"train_loss": -6.5949506759643555, "global_step": 130922, "epoch": 3117} {"train_loss": -6.677096366882324, "global_step": 130923, "epoch": 3117} {"train_loss": -6.681850433349609, "global_step": 130924, "epoch": 3117} {"train_loss": -6.821501731872559, "global_step": 130925, "epoch": 3117} {"train_loss": -6.621575355529785, "global_step": 130926, "epoch": 3117} {"train_loss": -6.77840518951416, "global_step": 130927, "epoch": 3117} {"train_loss": -6.686978340148926, "global_step": 130928, "epoch": 3117} {"train_loss": -6.725037574768066, "global_step": 130929, "epoch": 3117} {"train_loss": -6.662533283233643, "global_step": 130930, "epoch": 3117} {"train_loss": -6.763075828552246, "global_step": 130931, "epoch": 3117} {"train_loss": -6.728508949279785, "global_step": 130932, "epoch": 3117} {"train_loss": -6.686385154724121, "global_step": 130933, "epoch": 3117} {"train_loss": -6.64025354385376, "global_step": 130934, "epoch": 3117} {"train_loss": -6.643148422241211, "global_step": 130935, "epoch": 3117} {"train_loss": -6.620364189147949, "global_step": 130936, "epoch": 3117} {"train_loss": -6.6706342697143555, "global_step": 130937, "epoch": 3117} {"train_loss": -6.820372581481934, "global_step": 130938, "epoch": 3117} {"train_loss": -6.529400825500488, "global_step": 130939, "epoch": 3117} {"train_loss": -6.753582000732422, "global_step": 130940, "epoch": 3117} {"train_loss": -6.798358917236328, "global_step": 130941, "epoch": 3117} {"train_loss": -6.728453159332275, "global_step": 130942, "epoch": 3117} {"train_loss": -6.5956010818481445, "global_step": 130943, "epoch": 3117} {"train_loss": -6.710874557495117, "global_step": 130944, "epoch": 3117} {"train_loss": -6.706899642944336, "global_step": 130945, "epoch": 3117} {"train_loss": -6.711277008056641, "global_step": 130946, "epoch": 3117} {"train_loss": -6.69305944442749, "global_step": 130947, "epoch": 3117} {"train_loss": -6.811075210571289, "global_step": 130948, "epoch": 3117} {"train_loss": -6.760626792907715, "global_step": 130949, "epoch": 3117} {"train_loss": -6.716139793395996, "global_step": 130950, "epoch": 3117} {"train_loss": -6.561519145965576, "global_step": 130951, "epoch": 3117} {"train_loss": -6.752157211303711, "global_step": 130952, "epoch": 3117} {"train_loss": -6.6856913566589355, "global_step": 130953, "epoch": 3117} {"train_loss": -6.656870365142822, "global_step": 130954, "epoch": 3117} {"train_loss": -6.693831750324795, "global_step": 130955, "epoch": 3117, "val_loss": 66416.046875} {"train_loss": -6.641590118408203, "global_step": 130956, "epoch": 3118} {"train_loss": -6.77278995513916, "global_step": 130957, "epoch": 3118} {"train_loss": -6.707083225250244, "global_step": 130958, "epoch": 3118} {"train_loss": -6.573000907897949, "global_step": 130959, "epoch": 3118} {"train_loss": -6.753927230834961, "global_step": 130960, "epoch": 3118} {"train_loss": -6.701671600341797, "global_step": 130961, "epoch": 3118} {"train_loss": -6.633164882659912, "global_step": 130962, "epoch": 3118} {"train_loss": -6.640780448913574, "global_step": 130963, "epoch": 3118} {"train_loss": -6.678447723388672, "global_step": 130964, "epoch": 3118} {"train_loss": -6.753208160400391, "global_step": 130965, "epoch": 3118} {"train_loss": -6.747559547424316, "global_step": 130966, "epoch": 3118} {"train_loss": -6.761481285095215, "global_step": 130967, "epoch": 3118} {"train_loss": -6.725847244262695, "global_step": 130968, "epoch": 3118} {"train_loss": -6.735196113586426, "global_step": 130969, "epoch": 3118} {"train_loss": -6.647176265716553, "global_step": 130970, "epoch": 3118} {"train_loss": -6.714052200317383, "global_step": 130971, "epoch": 3118} {"train_loss": -6.644221305847168, "global_step": 130972, "epoch": 3118} {"train_loss": -6.738341331481934, "global_step": 130973, "epoch": 3118} {"train_loss": -6.643886566162109, "global_step": 130974, "epoch": 3118} {"train_loss": -6.683722019195557, "global_step": 130975, "epoch": 3118} {"train_loss": -6.646687030792236, "global_step": 130976, "epoch": 3118} {"train_loss": -6.66221809387207, "global_step": 130977, "epoch": 3118} {"train_loss": -6.7292633056640625, "global_step": 130978, "epoch": 3118} {"train_loss": -6.678699970245361, "global_step": 130979, "epoch": 3118} {"train_loss": -6.763909816741943, "global_step": 130980, "epoch": 3118} {"train_loss": -6.6482977867126465, "global_step": 130981, "epoch": 3118} {"train_loss": -6.720332145690918, "global_step": 130982, "epoch": 3118} {"train_loss": -6.701748847961426, "global_step": 130983, "epoch": 3118} {"train_loss": -6.705671310424805, "global_step": 130984, "epoch": 3118} {"train_loss": -6.791855812072754, "global_step": 130985, "epoch": 3118} {"train_loss": -6.704485893249512, "global_step": 130986, "epoch": 3118} {"train_loss": -6.687912940979004, "global_step": 130987, "epoch": 3118} {"train_loss": -6.632216930389404, "global_step": 130988, "epoch": 3118} {"train_loss": -6.688932418823242, "global_step": 130989, "epoch": 3118} {"train_loss": -6.7221527099609375, "global_step": 130990, "epoch": 3118} {"train_loss": -6.652854919433594, "global_step": 130991, "epoch": 3118} {"train_loss": -6.717491626739502, "global_step": 130992, "epoch": 3118} {"train_loss": -6.8413519859313965, "global_step": 130993, "epoch": 3118} {"train_loss": -6.660171031951904, "global_step": 130994, "epoch": 3118} {"train_loss": -6.690397262573242, "global_step": 130995, "epoch": 3118} {"train_loss": -6.696655750274658, "global_step": 130996, "epoch": 3118} {"train_loss": -6.7008411430177235, "global_step": 130997, "epoch": 3118, "val_loss": 66518.4921875} {"train_loss": -6.675384521484375, "global_step": 130998, "epoch": 3119} {"train_loss": -6.708205223083496, "global_step": 130999, "epoch": 3119} {"train_loss": -6.779593467712402, "global_step": 131000, "epoch": 3119} {"train_loss": -6.805191993713379, "global_step": 131001, "epoch": 3119} {"train_loss": -6.70999813079834, "global_step": 131002, "epoch": 3119} {"train_loss": -6.674914360046387, "global_step": 131003, "epoch": 3119} {"train_loss": -6.726598739624023, "global_step": 131004, "epoch": 3119} {"train_loss": -6.747122287750244, "global_step": 131005, "epoch": 3119} {"train_loss": -6.65250301361084, "global_step": 131006, "epoch": 3119} {"train_loss": -6.760658264160156, "global_step": 131007, "epoch": 3119} {"train_loss": -6.607362747192383, "global_step": 131008, "epoch": 3119} {"train_loss": -6.630759239196777, "global_step": 131009, "epoch": 3119} {"train_loss": -6.667308807373047, "global_step": 131010, "epoch": 3119} {"train_loss": -6.64091682434082, "global_step": 131011, "epoch": 3119} {"train_loss": -6.7340312004089355, "global_step": 131012, "epoch": 3119} {"train_loss": -6.616635322570801, "global_step": 131013, "epoch": 3119} {"train_loss": -6.796030044555664, "global_step": 131014, "epoch": 3119} {"train_loss": -6.700662136077881, "global_step": 131015, "epoch": 3119} {"train_loss": -6.735383987426758, "global_step": 131016, "epoch": 3119} {"train_loss": -6.704921245574951, "global_step": 131017, "epoch": 3119} {"train_loss": -6.666714668273926, "global_step": 131018, "epoch": 3119} {"train_loss": -6.506861686706543, "global_step": 131019, "epoch": 3119} {"train_loss": -6.670732498168945, "global_step": 131020, "epoch": 3119} {"train_loss": -6.80301570892334, "global_step": 131021, "epoch": 3119} {"train_loss": -6.7579450607299805, "global_step": 131022, "epoch": 3119} {"train_loss": -6.706554889678955, "global_step": 131023, "epoch": 3119} {"train_loss": -6.702097415924072, "global_step": 131024, "epoch": 3119} {"train_loss": -6.764482498168945, "global_step": 131025, "epoch": 3119} {"train_loss": -6.76206111907959, "global_step": 131026, "epoch": 3119} {"train_loss": -6.72587776184082, "global_step": 131027, "epoch": 3119} {"train_loss": -6.635564804077148, "global_step": 131028, "epoch": 3119} {"train_loss": -6.781082630157471, "global_step": 131029, "epoch": 3119} {"train_loss": -6.676115989685059, "global_step": 131030, "epoch": 3119} {"train_loss": -6.688535690307617, "global_step": 131031, "epoch": 3119} {"train_loss": -6.699301719665527, "global_step": 131032, "epoch": 3119} {"train_loss": -6.590764045715332, "global_step": 131033, "epoch": 3119} {"train_loss": -6.602842330932617, "global_step": 131034, "epoch": 3119} {"train_loss": -6.812078475952148, "global_step": 131035, "epoch": 3119} {"train_loss": -6.626016139984131, "global_step": 131036, "epoch": 3119} {"train_loss": -6.737146377563477, "global_step": 131037, "epoch": 3119} {"train_loss": -6.643241882324219, "global_step": 131038, "epoch": 3119} {"train_loss": -6.697379203069778, "global_step": 131039, "epoch": 3119, "val_loss": 66691.2734375} {"train_loss": -6.577426910400391, "global_step": 131040, "epoch": 3120} {"train_loss": -6.7261881828308105, "global_step": 131041, "epoch": 3120} {"train_loss": -6.745941162109375, "global_step": 131042, "epoch": 3120} {"train_loss": -6.5977277755737305, "global_step": 131043, "epoch": 3120} {"train_loss": -6.75225830078125, "global_step": 131044, "epoch": 3120} {"train_loss": -6.826035499572754, "global_step": 131045, "epoch": 3120} {"train_loss": -6.702836990356445, "global_step": 131046, "epoch": 3120} {"train_loss": -6.705197334289551, "global_step": 131047, "epoch": 3120} {"train_loss": -6.692000865936279, "global_step": 131048, "epoch": 3120} {"train_loss": -6.61509895324707, "global_step": 131049, "epoch": 3120} {"train_loss": -6.627490997314453, "global_step": 131050, "epoch": 3120} {"train_loss": -6.582207679748535, "global_step": 131051, "epoch": 3120} {"train_loss": -6.58550500869751, "global_step": 131052, "epoch": 3120} {"train_loss": -6.757498264312744, "global_step": 131053, "epoch": 3120} {"train_loss": -6.634255409240723, "global_step": 131054, "epoch": 3120} {"train_loss": -6.6656107902526855, "global_step": 131055, "epoch": 3120} {"train_loss": -6.647192478179932, "global_step": 131056, "epoch": 3120} {"train_loss": -6.45515775680542, "global_step": 131057, "epoch": 3120} {"train_loss": -6.648557662963867, "global_step": 131058, "epoch": 3120} {"train_loss": -6.559343338012695, "global_step": 131059, "epoch": 3120} {"train_loss": -6.657329559326172, "global_step": 131060, "epoch": 3120} {"train_loss": -6.744802474975586, "global_step": 131061, "epoch": 3120} {"train_loss": -6.559088706970215, "global_step": 131062, "epoch": 3120} {"train_loss": -6.760343551635742, "global_step": 131063, "epoch": 3120} {"train_loss": -6.583604335784912, "global_step": 131064, "epoch": 3120} {"train_loss": -6.65233039855957, "global_step": 131065, "epoch": 3120} {"train_loss": -6.75154972076416, "global_step": 131066, "epoch": 3120} {"train_loss": -6.570226669311523, "global_step": 131067, "epoch": 3120} {"train_loss": -6.670549392700195, "global_step": 131068, "epoch": 3120} {"train_loss": -6.66343879699707, "global_step": 131069, "epoch": 3120} {"train_loss": -6.708510398864746, "global_step": 131070, "epoch": 3120} {"train_loss": -6.679002285003662, "global_step": 131071, "epoch": 3120} {"train_loss": -6.605808258056641, "global_step": 131072, "epoch": 3120} {"train_loss": -6.654812812805176, "global_step": 131073, "epoch": 3120} {"train_loss": -6.628008842468262, "global_step": 131074, "epoch": 3120} {"train_loss": -6.746501922607422, "global_step": 131075, "epoch": 3120} {"train_loss": -6.707339286804199, "global_step": 131076, "epoch": 3120} {"train_loss": -6.534128665924072, "global_step": 131077, "epoch": 3120} {"train_loss": -6.686835289001465, "global_step": 131078, "epoch": 3120} {"train_loss": -6.7139482498168945, "global_step": 131079, "epoch": 3120} {"train_loss": -6.728924751281738, "global_step": 131080, "epoch": 3120} {"train_loss": -6.661013285319011, "global_step": 131081, "epoch": 3120, "val_loss": 66521.9921875} {"train_loss": -6.674959182739258, "global_step": 131082, "epoch": 3121} {"train_loss": -6.692389965057373, "global_step": 131083, "epoch": 3121} {"train_loss": -6.568633079528809, "global_step": 131084, "epoch": 3121} {"train_loss": -6.714947700500488, "global_step": 131085, "epoch": 3121} {"train_loss": -6.712194442749023, "global_step": 131086, "epoch": 3121} {"train_loss": -6.722187519073486, "global_step": 131087, "epoch": 3121} {"train_loss": -6.553254127502441, "global_step": 131088, "epoch": 3121} {"train_loss": -6.6475300788879395, "global_step": 131089, "epoch": 3121} {"train_loss": -6.784048080444336, "global_step": 131090, "epoch": 3121} {"train_loss": -6.699112892150879, "global_step": 131091, "epoch": 3121} {"train_loss": -6.691706657409668, "global_step": 131092, "epoch": 3121} {"train_loss": -6.48130989074707, "global_step": 131093, "epoch": 3121} {"train_loss": -6.492669105529785, "global_step": 131094, "epoch": 3121} {"train_loss": -6.7116851806640625, "global_step": 131095, "epoch": 3121} {"train_loss": -6.633121490478516, "global_step": 131096, "epoch": 3121} {"train_loss": -6.661347389221191, "global_step": 131097, "epoch": 3121} {"train_loss": -6.676192283630371, "global_step": 131098, "epoch": 3121} {"train_loss": -6.633840560913086, "global_step": 131099, "epoch": 3121} {"train_loss": -6.661217212677002, "global_step": 131100, "epoch": 3121} {"train_loss": -6.765410423278809, "global_step": 131101, "epoch": 3121} {"train_loss": -6.75199031829834, "global_step": 131102, "epoch": 3121} {"train_loss": -6.729615688323975, "global_step": 131103, "epoch": 3121} {"train_loss": -6.774012565612793, "global_step": 131104, "epoch": 3121} {"train_loss": -6.692166328430176, "global_step": 131105, "epoch": 3121} {"train_loss": -6.667459487915039, "global_step": 131106, "epoch": 3121} {"train_loss": -6.607483386993408, "global_step": 131107, "epoch": 3121} {"train_loss": -6.706119537353516, "global_step": 131108, "epoch": 3121} {"train_loss": -6.692543029785156, "global_step": 131109, "epoch": 3121} {"train_loss": -6.701716899871826, "global_step": 131110, "epoch": 3121} {"train_loss": -6.71226692199707, "global_step": 131111, "epoch": 3121} {"train_loss": -6.652692794799805, "global_step": 131112, "epoch": 3121} {"train_loss": -6.659659385681152, "global_step": 131113, "epoch": 3121} {"train_loss": -6.765483379364014, "global_step": 131114, "epoch": 3121} {"train_loss": -6.767986297607422, "global_step": 131115, "epoch": 3121} {"train_loss": -6.683720588684082, "global_step": 131116, "epoch": 3121} {"train_loss": -6.6802544593811035, "global_step": 131117, "epoch": 3121} {"train_loss": -6.7011871337890625, "global_step": 131118, "epoch": 3121} {"train_loss": -6.732987403869629, "global_step": 131119, "epoch": 3121} {"train_loss": -6.615062713623047, "global_step": 131120, "epoch": 3121} {"train_loss": -6.696114540100098, "global_step": 131121, "epoch": 3121} {"train_loss": -6.78233528137207, "global_step": 131122, "epoch": 3121} {"train_loss": -6.683281535194034, "global_step": 131123, "epoch": 3121, "val_loss": 66730.984375} {"train_loss": -6.731886863708496, "global_step": 131124, "epoch": 3122} {"train_loss": -6.698314189910889, "global_step": 131125, "epoch": 3122} {"train_loss": -6.693073749542236, "global_step": 131126, "epoch": 3122} {"train_loss": -6.723505020141602, "global_step": 131127, "epoch": 3122} {"train_loss": -6.651702404022217, "global_step": 131128, "epoch": 3122} {"train_loss": -6.756368637084961, "global_step": 131129, "epoch": 3122} {"train_loss": -6.521535873413086, "global_step": 131130, "epoch": 3122} {"train_loss": -6.667971611022949, "global_step": 131131, "epoch": 3122} {"train_loss": -6.715794563293457, "global_step": 131132, "epoch": 3122} {"train_loss": -6.657263278961182, "global_step": 131133, "epoch": 3122} {"train_loss": -6.624125957489014, "global_step": 131134, "epoch": 3122} {"train_loss": -6.6558637619018555, "global_step": 131135, "epoch": 3122} {"train_loss": -6.688317775726318, "global_step": 131136, "epoch": 3122} {"train_loss": -6.64814567565918, "global_step": 131137, "epoch": 3122} {"train_loss": -6.654542922973633, "global_step": 131138, "epoch": 3122} {"train_loss": -6.7048540115356445, "global_step": 131139, "epoch": 3122} {"train_loss": -6.744460105895996, "global_step": 131140, "epoch": 3122} {"train_loss": -6.639576435089111, "global_step": 131141, "epoch": 3122} {"train_loss": -6.639913558959961, "global_step": 131142, "epoch": 3122} {"train_loss": -6.790455341339111, "global_step": 131143, "epoch": 3122} {"train_loss": -6.7766008377075195, "global_step": 131144, "epoch": 3122} {"train_loss": -6.822051048278809, "global_step": 131145, "epoch": 3122} {"train_loss": -6.607913017272949, "global_step": 131146, "epoch": 3122} {"train_loss": -6.736979961395264, "global_step": 131147, "epoch": 3122} {"train_loss": -6.697054862976074, "global_step": 131148, "epoch": 3122} {"train_loss": -6.790409088134766, "global_step": 131149, "epoch": 3122} {"train_loss": -6.614372253417969, "global_step": 131150, "epoch": 3122} {"train_loss": -6.69527530670166, "global_step": 131151, "epoch": 3122} {"train_loss": -6.718856334686279, "global_step": 131152, "epoch": 3122} {"train_loss": -6.661727428436279, "global_step": 131153, "epoch": 3122} {"train_loss": -6.698578357696533, "global_step": 131154, "epoch": 3122} {"train_loss": -6.582919597625732, "global_step": 131155, "epoch": 3122} {"train_loss": -6.730861663818359, "global_step": 131156, "epoch": 3122} {"train_loss": -6.507161617279053, "global_step": 131157, "epoch": 3122} {"train_loss": -6.694410800933838, "global_step": 131158, "epoch": 3122} {"train_loss": -6.58081579208374, "global_step": 131159, "epoch": 3122} {"train_loss": -6.406325817108154, "global_step": 131160, "epoch": 3122} {"train_loss": -6.647587776184082, "global_step": 131161, "epoch": 3122} {"train_loss": -6.623568534851074, "global_step": 131162, "epoch": 3122} {"train_loss": -6.460548400878906, "global_step": 131163, "epoch": 3122} {"train_loss": -6.564286231994629, "global_step": 131164, "epoch": 3122} {"train_loss": -6.664866844813029, "global_step": 131165, "epoch": 3122, "val_loss": 66760.28125} {"train_loss": -6.608828544616699, "global_step": 131166, "epoch": 3123} {"train_loss": -6.664666175842285, "global_step": 131167, "epoch": 3123} {"train_loss": -6.58946418762207, "global_step": 131168, "epoch": 3123} {"train_loss": -6.649629592895508, "global_step": 131169, "epoch": 3123} {"train_loss": -6.490640640258789, "global_step": 131170, "epoch": 3123} {"train_loss": -6.724325180053711, "global_step": 131171, "epoch": 3123} {"train_loss": -6.615119934082031, "global_step": 131172, "epoch": 3123} {"train_loss": -6.667588233947754, "global_step": 131173, "epoch": 3123} {"train_loss": -6.6885480880737305, "global_step": 131174, "epoch": 3123} {"train_loss": -6.6315789222717285, "global_step": 131175, "epoch": 3123} {"train_loss": -6.612603187561035, "global_step": 131176, "epoch": 3123} {"train_loss": -6.639346122741699, "global_step": 131177, "epoch": 3123} {"train_loss": -6.610694885253906, "global_step": 131178, "epoch": 3123} {"train_loss": -6.541045188903809, "global_step": 131179, "epoch": 3123} {"train_loss": -6.606781959533691, "global_step": 131180, "epoch": 3123} {"train_loss": -6.604709625244141, "global_step": 131181, "epoch": 3123} {"train_loss": -6.4530029296875, "global_step": 131182, "epoch": 3123} {"train_loss": -6.629768371582031, "global_step": 131183, "epoch": 3123} {"train_loss": -6.527940273284912, "global_step": 131184, "epoch": 3123} {"train_loss": -6.599783897399902, "global_step": 131185, "epoch": 3123} {"train_loss": -6.49152946472168, "global_step": 131186, "epoch": 3123} {"train_loss": -6.5357441902160645, "global_step": 131187, "epoch": 3123} {"train_loss": -6.582779884338379, "global_step": 131188, "epoch": 3123} {"train_loss": -6.646581649780273, "global_step": 131189, "epoch": 3123} {"train_loss": -6.548572540283203, "global_step": 131190, "epoch": 3123} {"train_loss": -6.676021099090576, "global_step": 131191, "epoch": 3123} {"train_loss": -6.488502502441406, "global_step": 131192, "epoch": 3123} {"train_loss": -6.625273704528809, "global_step": 131193, "epoch": 3123} {"train_loss": -6.56449031829834, "global_step": 131194, "epoch": 3123} {"train_loss": -6.653079032897949, "global_step": 131195, "epoch": 3123} {"train_loss": -6.5447282791137695, "global_step": 131196, "epoch": 3123} {"train_loss": -6.6419878005981445, "global_step": 131197, "epoch": 3123} {"train_loss": -6.65532112121582, "global_step": 131198, "epoch": 3123} {"train_loss": -6.671067714691162, "global_step": 131199, "epoch": 3123} {"train_loss": -6.684499263763428, "global_step": 131200, "epoch": 3123} {"train_loss": -6.67024040222168, "global_step": 131201, "epoch": 3123} {"train_loss": -6.648562431335449, "global_step": 131202, "epoch": 3123} {"train_loss": -6.617859840393066, "global_step": 131203, "epoch": 3123} {"train_loss": -6.667862892150879, "global_step": 131204, "epoch": 3123} {"train_loss": -6.67633056640625, "global_step": 131205, "epoch": 3123} {"train_loss": -6.587861061096191, "global_step": 131206, "epoch": 3123} {"train_loss": -6.6118987287793844, "global_step": 131207, "epoch": 3123, "val_loss": 66542.0625} {"train_loss": -6.71660852432251, "global_step": 131208, "epoch": 3124} {"train_loss": -6.696186065673828, "global_step": 131209, "epoch": 3124} {"train_loss": -6.503689765930176, "global_step": 131210, "epoch": 3124} {"train_loss": -6.74444055557251, "global_step": 131211, "epoch": 3124} {"train_loss": -6.73161506652832, "global_step": 131212, "epoch": 3124} {"train_loss": -6.673612117767334, "global_step": 131213, "epoch": 3124} {"train_loss": -6.6952056884765625, "global_step": 131214, "epoch": 3124} {"train_loss": -6.652721881866455, "global_step": 131215, "epoch": 3124} {"train_loss": -6.696829319000244, "global_step": 131216, "epoch": 3124} {"train_loss": -6.706841468811035, "global_step": 131217, "epoch": 3124} {"train_loss": -6.62997579574585, "global_step": 131218, "epoch": 3124} {"train_loss": -6.6493024826049805, "global_step": 131219, "epoch": 3124} {"train_loss": -6.629217147827148, "global_step": 131220, "epoch": 3124} {"train_loss": -6.747690677642822, "global_step": 131221, "epoch": 3124} {"train_loss": -6.732170104980469, "global_step": 131222, "epoch": 3124} {"train_loss": -6.648342132568359, "global_step": 131223, "epoch": 3124} {"train_loss": -6.629548072814941, "global_step": 131224, "epoch": 3124} {"train_loss": -6.671783447265625, "global_step": 131225, "epoch": 3124} {"train_loss": -6.561467170715332, "global_step": 131226, "epoch": 3124} {"train_loss": -6.761860370635986, "global_step": 131227, "epoch": 3124} {"train_loss": -6.7087812423706055, "global_step": 131228, "epoch": 3124} {"train_loss": -6.707467079162598, "global_step": 131229, "epoch": 3124} {"train_loss": -6.6423845291137695, "global_step": 131230, "epoch": 3124} {"train_loss": -6.584516525268555, "global_step": 131231, "epoch": 3124} {"train_loss": -6.593071937561035, "global_step": 131232, "epoch": 3124} {"train_loss": -6.759613990783691, "global_step": 131233, "epoch": 3124} {"train_loss": -6.550811767578125, "global_step": 131234, "epoch": 3124} {"train_loss": -6.716732025146484, "global_step": 131235, "epoch": 3124} {"train_loss": -6.697501182556152, "global_step": 131236, "epoch": 3124} {"train_loss": -6.6772565841674805, "global_step": 131237, "epoch": 3124} {"train_loss": -6.687877655029297, "global_step": 131238, "epoch": 3124} {"train_loss": -6.720751762390137, "global_step": 131239, "epoch": 3124} {"train_loss": -6.649069786071777, "global_step": 131240, "epoch": 3124} {"train_loss": -6.726190567016602, "global_step": 131241, "epoch": 3124} {"train_loss": -6.697978973388672, "global_step": 131242, "epoch": 3124} {"train_loss": -6.755701065063477, "global_step": 131243, "epoch": 3124} {"train_loss": -6.787346839904785, "global_step": 131244, "epoch": 3124} {"train_loss": -6.77503776550293, "global_step": 131245, "epoch": 3124} {"train_loss": -6.684110641479492, "global_step": 131246, "epoch": 3124} {"train_loss": -6.663214683532715, "global_step": 131247, "epoch": 3124} {"train_loss": -6.699172019958496, "global_step": 131248, "epoch": 3124} {"train_loss": -6.686138164429438, "global_step": 131249, "epoch": 3124, "val_loss": 66502.984375} {"train_loss": -6.772144317626953, "global_step": 131250, "epoch": 3125} {"train_loss": -6.784963607788086, "global_step": 131251, "epoch": 3125} {"train_loss": -6.677156925201416, "global_step": 131252, "epoch": 3125} {"train_loss": -6.662167549133301, "global_step": 131253, "epoch": 3125} {"train_loss": -6.734011650085449, "global_step": 131254, "epoch": 3125} {"train_loss": -6.7003278732299805, "global_step": 131255, "epoch": 3125} {"train_loss": -6.723977088928223, "global_step": 131256, "epoch": 3125} {"train_loss": -6.715046405792236, "global_step": 131257, "epoch": 3125} {"train_loss": -6.777039527893066, "global_step": 131258, "epoch": 3125} {"train_loss": -6.695592403411865, "global_step": 131259, "epoch": 3125} {"train_loss": -6.564190864562988, "global_step": 131260, "epoch": 3125} {"train_loss": -6.734306335449219, "global_step": 131261, "epoch": 3125} {"train_loss": -6.731508255004883, "global_step": 131262, "epoch": 3125} {"train_loss": -6.651918888092041, "global_step": 131263, "epoch": 3125} {"train_loss": -6.50525426864624, "global_step": 131264, "epoch": 3125} {"train_loss": -6.720906734466553, "global_step": 131265, "epoch": 3125} {"train_loss": -6.715503692626953, "global_step": 131266, "epoch": 3125} {"train_loss": -6.7464985847473145, "global_step": 131267, "epoch": 3125} {"train_loss": -6.820659160614014, "global_step": 131268, "epoch": 3125} {"train_loss": -6.623021125793457, "global_step": 131269, "epoch": 3125} {"train_loss": -6.760650634765625, "global_step": 131270, "epoch": 3125} {"train_loss": -6.6486358642578125, "global_step": 131271, "epoch": 3125} {"train_loss": -6.638489723205566, "global_step": 131272, "epoch": 3125} {"train_loss": -6.6942596435546875, "global_step": 131273, "epoch": 3125} {"train_loss": -6.7657928466796875, "global_step": 131274, "epoch": 3125} {"train_loss": -6.645940780639648, "global_step": 131275, "epoch": 3125} {"train_loss": -6.716722011566162, "global_step": 131276, "epoch": 3125} {"train_loss": -6.724747657775879, "global_step": 131277, "epoch": 3125} {"train_loss": -6.70152473449707, "global_step": 131278, "epoch": 3125} {"train_loss": -6.6970930099487305, "global_step": 131279, "epoch": 3125} {"train_loss": -6.769129753112793, "global_step": 131280, "epoch": 3125} {"train_loss": -6.697612762451172, "global_step": 131281, "epoch": 3125} {"train_loss": -6.779400825500488, "global_step": 131282, "epoch": 3125} {"train_loss": -6.79577112197876, "global_step": 131283, "epoch": 3125} {"train_loss": -6.696342468261719, "global_step": 131284, "epoch": 3125} {"train_loss": -6.587741374969482, "global_step": 131285, "epoch": 3125} {"train_loss": -6.666670799255371, "global_step": 131286, "epoch": 3125} {"train_loss": -6.6185784339904785, "global_step": 131287, "epoch": 3125} {"train_loss": -6.531756401062012, "global_step": 131288, "epoch": 3125} {"train_loss": -6.613930702209473, "global_step": 131289, "epoch": 3125} {"train_loss": -6.7387895584106445, "global_step": 131290, "epoch": 3125} {"train_loss": -6.693766548520043, "global_step": 131291, "epoch": 3125, "val_loss": 66592.28125} {"train_loss": -6.5574564933776855, "global_step": 131292, "epoch": 3126} {"train_loss": -6.655729293823242, "global_step": 131293, "epoch": 3126} {"train_loss": -6.727717399597168, "global_step": 131294, "epoch": 3126} {"train_loss": -6.5787811279296875, "global_step": 131295, "epoch": 3126} {"train_loss": -6.6907830238342285, "global_step": 131296, "epoch": 3126} {"train_loss": -6.619701385498047, "global_step": 131297, "epoch": 3126} {"train_loss": -6.7529144287109375, "global_step": 131298, "epoch": 3126} {"train_loss": -6.70065975189209, "global_step": 131299, "epoch": 3126} {"train_loss": -6.6865034103393555, "global_step": 131300, "epoch": 3126} {"train_loss": -6.733846664428711, "global_step": 131301, "epoch": 3126} {"train_loss": -6.709210395812988, "global_step": 131302, "epoch": 3126} {"train_loss": -6.711903095245361, "global_step": 131303, "epoch": 3126} {"train_loss": -6.690632343292236, "global_step": 131304, "epoch": 3126} {"train_loss": -6.666833877563477, "global_step": 131305, "epoch": 3126} {"train_loss": -6.694540500640869, "global_step": 131306, "epoch": 3126} {"train_loss": -6.663812637329102, "global_step": 131307, "epoch": 3126} {"train_loss": -6.721817493438721, "global_step": 131308, "epoch": 3126} {"train_loss": -6.688015937805176, "global_step": 131309, "epoch": 3126} {"train_loss": -6.5070695877075195, "global_step": 131310, "epoch": 3126} {"train_loss": -6.54170560836792, "global_step": 131311, "epoch": 3126} {"train_loss": -6.524102210998535, "global_step": 131312, "epoch": 3126} {"train_loss": -6.587004661560059, "global_step": 131313, "epoch": 3126} {"train_loss": -6.607085227966309, "global_step": 131314, "epoch": 3126} {"train_loss": -6.571687698364258, "global_step": 131315, "epoch": 3126} {"train_loss": -6.719351768493652, "global_step": 131316, "epoch": 3126} {"train_loss": -6.637877464294434, "global_step": 131317, "epoch": 3126} {"train_loss": -6.670106887817383, "global_step": 131318, "epoch": 3126} {"train_loss": -6.6418681144714355, "global_step": 131319, "epoch": 3126} {"train_loss": -6.474255561828613, "global_step": 131320, "epoch": 3126} {"train_loss": -6.732073783874512, "global_step": 131321, "epoch": 3126} {"train_loss": -6.53317928314209, "global_step": 131322, "epoch": 3126} {"train_loss": -6.644132614135742, "global_step": 131323, "epoch": 3126} {"train_loss": -6.608245372772217, "global_step": 131324, "epoch": 3126} {"train_loss": -6.481954574584961, "global_step": 131325, "epoch": 3126} {"train_loss": -6.55302619934082, "global_step": 131326, "epoch": 3126} {"train_loss": -6.785074710845947, "global_step": 131327, "epoch": 3126} {"train_loss": -6.558873176574707, "global_step": 131328, "epoch": 3126} {"train_loss": -6.736948490142822, "global_step": 131329, "epoch": 3126} {"train_loss": -6.748787879943848, "global_step": 131330, "epoch": 3126} {"train_loss": -6.732935905456543, "global_step": 131331, "epoch": 3126} {"train_loss": -6.713377952575684, "global_step": 131332, "epoch": 3126} {"train_loss": -6.646517276763916, "global_step": 131333, "epoch": 3126, "val_loss": 66611.484375} {"train_loss": -6.564997673034668, "global_step": 131334, "epoch": 3127} {"train_loss": -6.543389320373535, "global_step": 131335, "epoch": 3127} {"train_loss": -6.677097797393799, "global_step": 131336, "epoch": 3127} {"train_loss": -6.565581321716309, "global_step": 131337, "epoch": 3127} {"train_loss": -6.5980072021484375, "global_step": 131338, "epoch": 3127} {"train_loss": -6.739042282104492, "global_step": 131339, "epoch": 3127} {"train_loss": -6.660342216491699, "global_step": 131340, "epoch": 3127} {"train_loss": -6.594338417053223, "global_step": 131341, "epoch": 3127} {"train_loss": -6.66500997543335, "global_step": 131342, "epoch": 3127} {"train_loss": -6.584639549255371, "global_step": 131343, "epoch": 3127} {"train_loss": -6.640229225158691, "global_step": 131344, "epoch": 3127} {"train_loss": -6.652001857757568, "global_step": 131345, "epoch": 3127} {"train_loss": -6.5657501220703125, "global_step": 131346, "epoch": 3127} {"train_loss": -6.746730804443359, "global_step": 131347, "epoch": 3127} {"train_loss": -6.6453142166137695, "global_step": 131348, "epoch": 3127} {"train_loss": -6.707080841064453, "global_step": 131349, "epoch": 3127} {"train_loss": -6.66588020324707, "global_step": 131350, "epoch": 3127} {"train_loss": -6.598798751831055, "global_step": 131351, "epoch": 3127} {"train_loss": -6.7096405029296875, "global_step": 131352, "epoch": 3127} {"train_loss": -6.682177543640137, "global_step": 131353, "epoch": 3127} {"train_loss": -6.738182067871094, "global_step": 131354, "epoch": 3127} {"train_loss": -6.715029716491699, "global_step": 131355, "epoch": 3127} {"train_loss": -6.555941581726074, "global_step": 131356, "epoch": 3127} {"train_loss": -6.692127227783203, "global_step": 131357, "epoch": 3127} {"train_loss": -6.684617042541504, "global_step": 131358, "epoch": 3127} {"train_loss": -6.6819915771484375, "global_step": 131359, "epoch": 3127} {"train_loss": -6.662055969238281, "global_step": 131360, "epoch": 3127} {"train_loss": -6.51078462600708, "global_step": 131361, "epoch": 3127} {"train_loss": -6.654458522796631, "global_step": 131362, "epoch": 3127} {"train_loss": -6.645123481750488, "global_step": 131363, "epoch": 3127} {"train_loss": -6.627590656280518, "global_step": 131364, "epoch": 3127} {"train_loss": -6.694319725036621, "global_step": 131365, "epoch": 3127} {"train_loss": -6.700159072875977, "global_step": 131366, "epoch": 3127} {"train_loss": -6.604545593261719, "global_step": 131367, "epoch": 3127} {"train_loss": -6.637534141540527, "global_step": 131368, "epoch": 3127} {"train_loss": -6.686184883117676, "global_step": 131369, "epoch": 3127} {"train_loss": -6.769870758056641, "global_step": 131370, "epoch": 3127} {"train_loss": -6.611669540405273, "global_step": 131371, "epoch": 3127} {"train_loss": -6.681273460388184, "global_step": 131372, "epoch": 3127} {"train_loss": -6.703749656677246, "global_step": 131373, "epoch": 3127} {"train_loss": -6.5875959396362305, "global_step": 131374, "epoch": 3127} {"train_loss": -6.65147834732419, "global_step": 131375, "epoch": 3127, "val_loss": 66723.734375} {"train_loss": -6.63212776184082, "global_step": 131376, "epoch": 3128} {"train_loss": -6.483461380004883, "global_step": 131377, "epoch": 3128} {"train_loss": -6.6531291007995605, "global_step": 131378, "epoch": 3128} {"train_loss": -6.797782897949219, "global_step": 131379, "epoch": 3128} {"train_loss": -6.5111188888549805, "global_step": 131380, "epoch": 3128} {"train_loss": -6.599201202392578, "global_step": 131381, "epoch": 3128} {"train_loss": -6.63306999206543, "global_step": 131382, "epoch": 3128} {"train_loss": -6.622462272644043, "global_step": 131383, "epoch": 3128} {"train_loss": -6.580739974975586, "global_step": 131384, "epoch": 3128} {"train_loss": -6.416974067687988, "global_step": 131385, "epoch": 3128} {"train_loss": -6.523305892944336, "global_step": 131386, "epoch": 3128} {"train_loss": -6.690303802490234, "global_step": 131387, "epoch": 3128} {"train_loss": -6.614300727844238, "global_step": 131388, "epoch": 3128} {"train_loss": -6.698594093322754, "global_step": 131389, "epoch": 3128} {"train_loss": -6.688777446746826, "global_step": 131390, "epoch": 3128} {"train_loss": -6.6333231925964355, "global_step": 131391, "epoch": 3128} {"train_loss": -6.715338706970215, "global_step": 131392, "epoch": 3128} {"train_loss": -6.6444501876831055, "global_step": 131393, "epoch": 3128} {"train_loss": -6.650946140289307, "global_step": 131394, "epoch": 3128} {"train_loss": -6.693530559539795, "global_step": 131395, "epoch": 3128} {"train_loss": -6.662119388580322, "global_step": 131396, "epoch": 3128} {"train_loss": -6.755610466003418, "global_step": 131397, "epoch": 3128} {"train_loss": -6.721899032592773, "global_step": 131398, "epoch": 3128} {"train_loss": -6.606006622314453, "global_step": 131399, "epoch": 3128} {"train_loss": -6.700369834899902, "global_step": 131400, "epoch": 3128} {"train_loss": -6.727457046508789, "global_step": 131401, "epoch": 3128} {"train_loss": -6.677240371704102, "global_step": 131402, "epoch": 3128} {"train_loss": -6.737555980682373, "global_step": 131403, "epoch": 3128} {"train_loss": -6.731392860412598, "global_step": 131404, "epoch": 3128} {"train_loss": -6.652993202209473, "global_step": 131405, "epoch": 3128} {"train_loss": -6.5879621505737305, "global_step": 131406, "epoch": 3128} {"train_loss": -6.686040878295898, "global_step": 131407, "epoch": 3128} {"train_loss": -6.677265167236328, "global_step": 131408, "epoch": 3128} {"train_loss": -6.752080917358398, "global_step": 131409, "epoch": 3128} {"train_loss": -6.623237609863281, "global_step": 131410, "epoch": 3128} {"train_loss": -6.574162483215332, "global_step": 131411, "epoch": 3128} {"train_loss": -6.778567314147949, "global_step": 131412, "epoch": 3128} {"train_loss": -6.661250114440918, "global_step": 131413, "epoch": 3128} {"train_loss": -6.753271102905273, "global_step": 131414, "epoch": 3128} {"train_loss": -6.694208145141602, "global_step": 131415, "epoch": 3128} {"train_loss": -6.675844192504883, "global_step": 131416, "epoch": 3128} {"train_loss": -6.656726439793904, "global_step": 131417, "epoch": 3128, "val_loss": 66477.8125} {"train_loss": -6.703865051269531, "global_step": 131418, "epoch": 3129} {"train_loss": -6.705606937408447, "global_step": 131419, "epoch": 3129} {"train_loss": -6.672446250915527, "global_step": 131420, "epoch": 3129} {"train_loss": -6.670138359069824, "global_step": 131421, "epoch": 3129} {"train_loss": -6.4453606605529785, "global_step": 131422, "epoch": 3129} {"train_loss": -6.803576946258545, "global_step": 131423, "epoch": 3129} {"train_loss": -6.680160045623779, "global_step": 131424, "epoch": 3129} {"train_loss": -6.517413139343262, "global_step": 131425, "epoch": 3129} {"train_loss": -6.714758396148682, "global_step": 131426, "epoch": 3129} {"train_loss": -6.534372329711914, "global_step": 131427, "epoch": 3129} {"train_loss": -6.646714210510254, "global_step": 131428, "epoch": 3129} {"train_loss": -6.728632926940918, "global_step": 131429, "epoch": 3129} {"train_loss": -6.583024978637695, "global_step": 131430, "epoch": 3129} {"train_loss": -6.6634650230407715, "global_step": 131431, "epoch": 3129} {"train_loss": -6.648514747619629, "global_step": 131432, "epoch": 3129} {"train_loss": -6.7571187019348145, "global_step": 131433, "epoch": 3129} {"train_loss": -6.63638973236084, "global_step": 131434, "epoch": 3129} {"train_loss": -6.66961669921875, "global_step": 131435, "epoch": 3129} {"train_loss": -6.638154029846191, "global_step": 131436, "epoch": 3129} {"train_loss": -6.634086608886719, "global_step": 131437, "epoch": 3129} {"train_loss": -6.655634880065918, "global_step": 131438, "epoch": 3129} {"train_loss": -6.625580787658691, "global_step": 131439, "epoch": 3129} {"train_loss": -6.687577724456787, "global_step": 131440, "epoch": 3129} {"train_loss": -6.606472015380859, "global_step": 131441, "epoch": 3129} {"train_loss": -6.463495254516602, "global_step": 131442, "epoch": 3129} {"train_loss": -6.552163600921631, "global_step": 131443, "epoch": 3129} {"train_loss": -6.721407413482666, "global_step": 131444, "epoch": 3129} {"train_loss": -6.532486915588379, "global_step": 131445, "epoch": 3129} {"train_loss": -6.782071113586426, "global_step": 131446, "epoch": 3129} {"train_loss": -6.644218444824219, "global_step": 131447, "epoch": 3129} {"train_loss": -6.644552230834961, "global_step": 131448, "epoch": 3129} {"train_loss": -6.669367790222168, "global_step": 131449, "epoch": 3129} {"train_loss": -6.640885353088379, "global_step": 131450, "epoch": 3129} {"train_loss": -6.615512371063232, "global_step": 131451, "epoch": 3129} {"train_loss": -6.660057067871094, "global_step": 131452, "epoch": 3129} {"train_loss": -6.54951286315918, "global_step": 131453, "epoch": 3129} {"train_loss": -6.612347602844238, "global_step": 131454, "epoch": 3129} {"train_loss": -6.649158477783203, "global_step": 131455, "epoch": 3129} {"train_loss": -6.557075500488281, "global_step": 131456, "epoch": 3129} {"train_loss": -6.501810073852539, "global_step": 131457, "epoch": 3129} {"train_loss": -6.596485137939453, "global_step": 131458, "epoch": 3129} {"train_loss": -6.6326959019615535, "global_step": 131459, "epoch": 3129, "val_loss": 66498.3671875} {"train_loss": -6.667910099029541, "global_step": 131460, "epoch": 3130} {"train_loss": -6.675786972045898, "global_step": 131461, "epoch": 3130} {"train_loss": -6.628158092498779, "global_step": 131462, "epoch": 3130} {"train_loss": -6.647337913513184, "global_step": 131463, "epoch": 3130} {"train_loss": -6.633664131164551, "global_step": 131464, "epoch": 3130} {"train_loss": -6.663419246673584, "global_step": 131465, "epoch": 3130} {"train_loss": -6.6174468994140625, "global_step": 131466, "epoch": 3130} {"train_loss": -6.781554222106934, "global_step": 131467, "epoch": 3130} {"train_loss": -6.580964088439941, "global_step": 131468, "epoch": 3130} {"train_loss": -6.617308139801025, "global_step": 131469, "epoch": 3130} {"train_loss": -6.638859748840332, "global_step": 131470, "epoch": 3130} {"train_loss": -6.585187911987305, "global_step": 131471, "epoch": 3130} {"train_loss": -6.620415687561035, "global_step": 131472, "epoch": 3130} {"train_loss": -6.577271461486816, "global_step": 131473, "epoch": 3130} {"train_loss": -6.672010898590088, "global_step": 131474, "epoch": 3130} {"train_loss": -6.734407424926758, "global_step": 131475, "epoch": 3130} {"train_loss": -6.721706867218018, "global_step": 131476, "epoch": 3130} {"train_loss": -6.632496356964111, "global_step": 131477, "epoch": 3130} {"train_loss": -6.723146915435791, "global_step": 131478, "epoch": 3130} {"train_loss": -6.6861491203308105, "global_step": 131479, "epoch": 3130} {"train_loss": -6.6995086669921875, "global_step": 131480, "epoch": 3130} {"train_loss": -6.728498458862305, "global_step": 131481, "epoch": 3130} {"train_loss": -6.594475746154785, "global_step": 131482, "epoch": 3130} {"train_loss": -6.657307147979736, "global_step": 131483, "epoch": 3130} {"train_loss": -6.6773905754089355, "global_step": 131484, "epoch": 3130} {"train_loss": -6.724081993103027, "global_step": 131485, "epoch": 3130} {"train_loss": -6.66928243637085, "global_step": 131486, "epoch": 3130} {"train_loss": -6.725943088531494, "global_step": 131487, "epoch": 3130} {"train_loss": -6.7026872634887695, "global_step": 131488, "epoch": 3130} {"train_loss": -6.67779541015625, "global_step": 131489, "epoch": 3130} {"train_loss": -6.718674659729004, "global_step": 131490, "epoch": 3130} {"train_loss": -6.631895542144775, "global_step": 131491, "epoch": 3130} {"train_loss": -6.615886211395264, "global_step": 131492, "epoch": 3130} {"train_loss": -6.736645698547363, "global_step": 131493, "epoch": 3130} {"train_loss": -6.629424095153809, "global_step": 131494, "epoch": 3130} {"train_loss": -6.737817764282227, "global_step": 131495, "epoch": 3130} {"train_loss": -6.748199462890625, "global_step": 131496, "epoch": 3130} {"train_loss": -6.729743957519531, "global_step": 131497, "epoch": 3130} {"train_loss": -6.679500579833984, "global_step": 131498, "epoch": 3130} {"train_loss": -6.796124458312988, "global_step": 131499, "epoch": 3130} {"train_loss": -6.8310394287109375, "global_step": 131500, "epoch": 3130} {"train_loss": -6.67997449920291, "global_step": 131501, "epoch": 3130, "val_loss": 66418.46875} {"train_loss": -6.693350791931152, "global_step": 131502, "epoch": 3131} {"train_loss": -6.81796932220459, "global_step": 131503, "epoch": 3131} {"train_loss": -6.821756839752197, "global_step": 131504, "epoch": 3131} {"train_loss": -6.828326225280762, "global_step": 131505, "epoch": 3131} {"train_loss": -6.706814765930176, "global_step": 131506, "epoch": 3131} {"train_loss": -6.792444229125977, "global_step": 131507, "epoch": 3131} {"train_loss": -6.703217506408691, "global_step": 131508, "epoch": 3131} {"train_loss": -6.826777935028076, "global_step": 131509, "epoch": 3131} {"train_loss": -6.74095344543457, "global_step": 131510, "epoch": 3131} {"train_loss": -6.797542572021484, "global_step": 131511, "epoch": 3131} {"train_loss": -6.7170915603637695, "global_step": 131512, "epoch": 3131} {"train_loss": -6.648942470550537, "global_step": 131513, "epoch": 3131} {"train_loss": -6.850200653076172, "global_step": 131514, "epoch": 3131} {"train_loss": -6.638714790344238, "global_step": 131515, "epoch": 3131} {"train_loss": -6.7605180740356445, "global_step": 131516, "epoch": 3131} {"train_loss": -6.6678571701049805, "global_step": 131517, "epoch": 3131} {"train_loss": -6.649155139923096, "global_step": 131518, "epoch": 3131} {"train_loss": -6.726469039916992, "global_step": 131519, "epoch": 3131} {"train_loss": -6.743923664093018, "global_step": 131520, "epoch": 3131} {"train_loss": -6.7248854637146, "global_step": 131521, "epoch": 3131} {"train_loss": -6.771711826324463, "global_step": 131522, "epoch": 3131} {"train_loss": -6.835997581481934, "global_step": 131523, "epoch": 3131} {"train_loss": -6.837268829345703, "global_step": 131524, "epoch": 3131} {"train_loss": -6.6942901611328125, "global_step": 131525, "epoch": 3131} {"train_loss": -6.731400966644287, "global_step": 131526, "epoch": 3131} {"train_loss": -6.770320892333984, "global_step": 131527, "epoch": 3131} {"train_loss": -6.777649879455566, "global_step": 131528, "epoch": 3131} {"train_loss": -6.761124610900879, "global_step": 131529, "epoch": 3131} {"train_loss": -6.598459720611572, "global_step": 131530, "epoch": 3131} {"train_loss": -6.68093204498291, "global_step": 131531, "epoch": 3131} {"train_loss": -6.762907981872559, "global_step": 131532, "epoch": 3131} {"train_loss": -6.637063026428223, "global_step": 131533, "epoch": 3131} {"train_loss": -6.6537017822265625, "global_step": 131534, "epoch": 3131} {"train_loss": -6.6353020668029785, "global_step": 131535, "epoch": 3131} {"train_loss": -6.633345603942871, "global_step": 131536, "epoch": 3131} {"train_loss": -6.622943878173828, "global_step": 131537, "epoch": 3131} {"train_loss": -6.634224891662598, "global_step": 131538, "epoch": 3131} {"train_loss": -6.735985279083252, "global_step": 131539, "epoch": 3131} {"train_loss": -6.649773597717285, "global_step": 131540, "epoch": 3131} {"train_loss": -6.660885810852051, "global_step": 131541, "epoch": 3131} {"train_loss": -6.65286922454834, "global_step": 131542, "epoch": 3131} {"train_loss": -6.722453594207764, "global_step": 131543, "epoch": 3131, "val_loss": 66615.0078125} {"train_loss": -6.752019882202148, "global_step": 131544, "epoch": 3132} {"train_loss": -6.7280378341674805, "global_step": 131545, "epoch": 3132} {"train_loss": -6.717776775360107, "global_step": 131546, "epoch": 3132} {"train_loss": -6.828648567199707, "global_step": 131547, "epoch": 3132} {"train_loss": -6.760097503662109, "global_step": 131548, "epoch": 3132} {"train_loss": -6.830761909484863, "global_step": 131549, "epoch": 3132} {"train_loss": -6.662690162658691, "global_step": 131550, "epoch": 3132} {"train_loss": -6.642620086669922, "global_step": 131551, "epoch": 3132} {"train_loss": -6.761173248291016, "global_step": 131552, "epoch": 3132} {"train_loss": -6.694683074951172, "global_step": 131553, "epoch": 3132} {"train_loss": -6.673332214355469, "global_step": 131554, "epoch": 3132} {"train_loss": -6.666942596435547, "global_step": 131555, "epoch": 3132} {"train_loss": -6.802389621734619, "global_step": 131556, "epoch": 3132} {"train_loss": -6.752326011657715, "global_step": 131557, "epoch": 3132} {"train_loss": -6.740868091583252, "global_step": 131558, "epoch": 3132} {"train_loss": -6.673638343811035, "global_step": 131559, "epoch": 3132} {"train_loss": -6.7601823806762695, "global_step": 131560, "epoch": 3132} {"train_loss": -6.684131622314453, "global_step": 131561, "epoch": 3132} {"train_loss": -6.710015773773193, "global_step": 131562, "epoch": 3132} {"train_loss": -6.789521217346191, "global_step": 131563, "epoch": 3132} {"train_loss": -6.5859456062316895, "global_step": 131564, "epoch": 3132} {"train_loss": -6.703474044799805, "global_step": 131565, "epoch": 3132} {"train_loss": -6.7057952880859375, "global_step": 131566, "epoch": 3132} {"train_loss": -6.755101203918457, "global_step": 131567, "epoch": 3132} {"train_loss": -6.648126602172852, "global_step": 131568, "epoch": 3132} {"train_loss": -6.749895095825195, "global_step": 131569, "epoch": 3132} {"train_loss": -6.677544593811035, "global_step": 131570, "epoch": 3132} {"train_loss": -6.733879089355469, "global_step": 131571, "epoch": 3132} {"train_loss": -6.628748893737793, "global_step": 131572, "epoch": 3132} {"train_loss": -6.705655097961426, "global_step": 131573, "epoch": 3132} {"train_loss": -6.695339679718018, "global_step": 131574, "epoch": 3132} {"train_loss": -6.725098133087158, "global_step": 131575, "epoch": 3132} {"train_loss": -6.744852066040039, "global_step": 131576, "epoch": 3132} {"train_loss": -6.723465442657471, "global_step": 131577, "epoch": 3132} {"train_loss": -6.720278739929199, "global_step": 131578, "epoch": 3132} {"train_loss": -6.709477424621582, "global_step": 131579, "epoch": 3132} {"train_loss": -6.767226219177246, "global_step": 131580, "epoch": 3132} {"train_loss": -6.656695365905762, "global_step": 131581, "epoch": 3132} {"train_loss": -6.705399513244629, "global_step": 131582, "epoch": 3132} {"train_loss": -6.679084777832031, "global_step": 131583, "epoch": 3132} {"train_loss": -6.705126762390137, "global_step": 131584, "epoch": 3132} {"train_loss": -6.716996919541132, "global_step": 131585, "epoch": 3132, "val_loss": 66745.78125} {"train_loss": -6.622641563415527, "global_step": 131586, "epoch": 3133} {"train_loss": -6.739977836608887, "global_step": 131587, "epoch": 3133} {"train_loss": -6.664693832397461, "global_step": 131588, "epoch": 3133} {"train_loss": -6.789341449737549, "global_step": 131589, "epoch": 3133} {"train_loss": -6.635873794555664, "global_step": 131590, "epoch": 3133} {"train_loss": -6.802495956420898, "global_step": 131591, "epoch": 3133} {"train_loss": -6.608371734619141, "global_step": 131592, "epoch": 3133} {"train_loss": -6.654938220977783, "global_step": 131593, "epoch": 3133} {"train_loss": -6.844322204589844, "global_step": 131594, "epoch": 3133} {"train_loss": -6.720570087432861, "global_step": 131595, "epoch": 3133} {"train_loss": -6.547799110412598, "global_step": 131596, "epoch": 3133} {"train_loss": -6.707647800445557, "global_step": 131597, "epoch": 3133} {"train_loss": -6.640067100524902, "global_step": 131598, "epoch": 3133} {"train_loss": -6.697454929351807, "global_step": 131599, "epoch": 3133} {"train_loss": -6.675018787384033, "global_step": 131600, "epoch": 3133} {"train_loss": -6.571097373962402, "global_step": 131601, "epoch": 3133} {"train_loss": -6.67545223236084, "global_step": 131602, "epoch": 3133} {"train_loss": -6.699043273925781, "global_step": 131603, "epoch": 3133} {"train_loss": -6.641472816467285, "global_step": 131604, "epoch": 3133} {"train_loss": -6.621374607086182, "global_step": 131605, "epoch": 3133} {"train_loss": -6.6791253089904785, "global_step": 131606, "epoch": 3133} {"train_loss": -6.724509239196777, "global_step": 131607, "epoch": 3133} {"train_loss": -6.591578483581543, "global_step": 131608, "epoch": 3133} {"train_loss": -6.567905426025391, "global_step": 131609, "epoch": 3133} {"train_loss": -6.54786491394043, "global_step": 131610, "epoch": 3133} {"train_loss": -6.593367576599121, "global_step": 131611, "epoch": 3133} {"train_loss": -6.518547534942627, "global_step": 131612, "epoch": 3133} {"train_loss": -6.67622709274292, "global_step": 131613, "epoch": 3133} {"train_loss": -6.497729778289795, "global_step": 131614, "epoch": 3133} {"train_loss": -6.7394561767578125, "global_step": 131615, "epoch": 3133} {"train_loss": -6.613399505615234, "global_step": 131616, "epoch": 3133} {"train_loss": -6.588650703430176, "global_step": 131617, "epoch": 3133} {"train_loss": -6.7176713943481445, "global_step": 131618, "epoch": 3133} {"train_loss": -6.528210639953613, "global_step": 131619, "epoch": 3133} {"train_loss": -6.671046733856201, "global_step": 131620, "epoch": 3133} {"train_loss": -6.635416030883789, "global_step": 131621, "epoch": 3133} {"train_loss": -6.620310306549072, "global_step": 131622, "epoch": 3133} {"train_loss": -6.53904914855957, "global_step": 131623, "epoch": 3133} {"train_loss": -6.532860279083252, "global_step": 131624, "epoch": 3133} {"train_loss": -6.603482246398926, "global_step": 131625, "epoch": 3133} {"train_loss": -6.71422004699707, "global_step": 131626, "epoch": 3133} {"train_loss": -6.644217411677043, "global_step": 131627, "epoch": 3133, "val_loss": 66859.3984375} {"train_loss": -6.740258693695068, "global_step": 131628, "epoch": 3134} {"train_loss": -6.664798736572266, "global_step": 131629, "epoch": 3134} {"train_loss": -6.615736484527588, "global_step": 131630, "epoch": 3134} {"train_loss": -6.552738189697266, "global_step": 131631, "epoch": 3134} {"train_loss": -6.675798416137695, "global_step": 131632, "epoch": 3134} {"train_loss": -6.682682991027832, "global_step": 131633, "epoch": 3134} {"train_loss": -6.622690200805664, "global_step": 131634, "epoch": 3134} {"train_loss": -6.641391754150391, "global_step": 131635, "epoch": 3134} {"train_loss": -6.664238929748535, "global_step": 131636, "epoch": 3134} {"train_loss": -6.560072898864746, "global_step": 131637, "epoch": 3134} {"train_loss": -6.449345588684082, "global_step": 131638, "epoch": 3134} {"train_loss": -6.708174228668213, "global_step": 131639, "epoch": 3134} {"train_loss": -6.707979202270508, "global_step": 131640, "epoch": 3134} {"train_loss": -6.590616226196289, "global_step": 131641, "epoch": 3134} {"train_loss": -6.516298294067383, "global_step": 131642, "epoch": 3134} {"train_loss": -6.695738315582275, "global_step": 131643, "epoch": 3134} {"train_loss": -6.553625106811523, "global_step": 131644, "epoch": 3134} {"train_loss": -6.553280830383301, "global_step": 131645, "epoch": 3134} {"train_loss": -6.618782043457031, "global_step": 131646, "epoch": 3134} {"train_loss": -6.5615339279174805, "global_step": 131647, "epoch": 3134} {"train_loss": -6.5996809005737305, "global_step": 131648, "epoch": 3134} {"train_loss": -6.5586090087890625, "global_step": 131649, "epoch": 3134} {"train_loss": -6.695248126983643, "global_step": 131650, "epoch": 3134} {"train_loss": -6.591738224029541, "global_step": 131651, "epoch": 3134} {"train_loss": -6.673548698425293, "global_step": 131652, "epoch": 3134} {"train_loss": -6.646918773651123, "global_step": 131653, "epoch": 3134} {"train_loss": -6.621561050415039, "global_step": 131654, "epoch": 3134} {"train_loss": -6.68851900100708, "global_step": 131655, "epoch": 3134} {"train_loss": -6.591906547546387, "global_step": 131656, "epoch": 3134} {"train_loss": -6.66038703918457, "global_step": 131657, "epoch": 3134} {"train_loss": -6.621220588684082, "global_step": 131658, "epoch": 3134} {"train_loss": -6.6268630027771, "global_step": 131659, "epoch": 3134} {"train_loss": -6.612861633300781, "global_step": 131660, "epoch": 3134} {"train_loss": -6.732494354248047, "global_step": 131661, "epoch": 3134} {"train_loss": -6.591062545776367, "global_step": 131662, "epoch": 3134} {"train_loss": -6.695862293243408, "global_step": 131663, "epoch": 3134} {"train_loss": -6.617020606994629, "global_step": 131664, "epoch": 3134} {"train_loss": -6.611536026000977, "global_step": 131665, "epoch": 3134} {"train_loss": -6.660205364227295, "global_step": 131666, "epoch": 3134} {"train_loss": -6.549544811248779, "global_step": 131667, "epoch": 3134} {"train_loss": -6.760319709777832, "global_step": 131668, "epoch": 3134} {"train_loss": -6.632489635830834, "global_step": 131669, "epoch": 3134, "val_loss": 66785.1171875} {"train_loss": -6.6842193603515625, "global_step": 131670, "epoch": 3135} {"train_loss": -6.764706134796143, "global_step": 131671, "epoch": 3135} {"train_loss": -6.59910249710083, "global_step": 131672, "epoch": 3135} {"train_loss": -6.712015151977539, "global_step": 131673, "epoch": 3135} {"train_loss": -6.635961532592773, "global_step": 131674, "epoch": 3135} {"train_loss": -6.795419692993164, "global_step": 131675, "epoch": 3135} {"train_loss": -6.714828014373779, "global_step": 131676, "epoch": 3135} {"train_loss": -6.6427154541015625, "global_step": 131677, "epoch": 3135} {"train_loss": -6.664344310760498, "global_step": 131678, "epoch": 3135} {"train_loss": -6.689389705657959, "global_step": 131679, "epoch": 3135} {"train_loss": -6.591160774230957, "global_step": 131680, "epoch": 3135} {"train_loss": -6.704645156860352, "global_step": 131681, "epoch": 3135} {"train_loss": -6.687270641326904, "global_step": 131682, "epoch": 3135} {"train_loss": -6.780144691467285, "global_step": 131683, "epoch": 3135} {"train_loss": -6.54150915145874, "global_step": 131684, "epoch": 3135} {"train_loss": -6.714580535888672, "global_step": 131685, "epoch": 3135} {"train_loss": -6.73063850402832, "global_step": 131686, "epoch": 3135} {"train_loss": -6.690610885620117, "global_step": 131687, "epoch": 3135} {"train_loss": -6.745046138763428, "global_step": 131688, "epoch": 3135} {"train_loss": -6.631860256195068, "global_step": 131689, "epoch": 3135} {"train_loss": -6.786381721496582, "global_step": 131690, "epoch": 3135} {"train_loss": -6.717755317687988, "global_step": 131691, "epoch": 3135} {"train_loss": -6.70139217376709, "global_step": 131692, "epoch": 3135} {"train_loss": -6.672258377075195, "global_step": 131693, "epoch": 3135} {"train_loss": -6.7513298988342285, "global_step": 131694, "epoch": 3135} {"train_loss": -6.678684234619141, "global_step": 131695, "epoch": 3135} {"train_loss": -6.662596702575684, "global_step": 131696, "epoch": 3135} {"train_loss": -6.656328201293945, "global_step": 131697, "epoch": 3135} {"train_loss": -6.724730014801025, "global_step": 131698, "epoch": 3135} {"train_loss": -6.723385810852051, "global_step": 131699, "epoch": 3135} {"train_loss": -6.715361595153809, "global_step": 131700, "epoch": 3135} {"train_loss": -6.6160101890563965, "global_step": 131701, "epoch": 3135} {"train_loss": -6.708169937133789, "global_step": 131702, "epoch": 3135} {"train_loss": -6.67779541015625, "global_step": 131703, "epoch": 3135} {"train_loss": -6.622460842132568, "global_step": 131704, "epoch": 3135} {"train_loss": -6.507987976074219, "global_step": 131705, "epoch": 3135} {"train_loss": -6.636013031005859, "global_step": 131706, "epoch": 3135} {"train_loss": -6.646919250488281, "global_step": 131707, "epoch": 3135} {"train_loss": -6.612792015075684, "global_step": 131708, "epoch": 3135} {"train_loss": -6.5585784912109375, "global_step": 131709, "epoch": 3135} {"train_loss": -6.667372226715088, "global_step": 131710, "epoch": 3135} {"train_loss": -6.677312726066226, "global_step": 131711, "epoch": 3135, "val_loss": 66616.6953125} {"train_loss": -6.682131290435791, "global_step": 131712, "epoch": 3136} {"train_loss": -6.654011249542236, "global_step": 131713, "epoch": 3136} {"train_loss": -6.733768939971924, "global_step": 131714, "epoch": 3136} {"train_loss": -6.790886402130127, "global_step": 131715, "epoch": 3136} {"train_loss": -6.5965657234191895, "global_step": 131716, "epoch": 3136} {"train_loss": -6.8297014236450195, "global_step": 131717, "epoch": 3136} {"train_loss": -6.632338523864746, "global_step": 131718, "epoch": 3136} {"train_loss": -6.620944976806641, "global_step": 131719, "epoch": 3136} {"train_loss": -6.679689407348633, "global_step": 131720, "epoch": 3136} {"train_loss": -6.6337361335754395, "global_step": 131721, "epoch": 3136} {"train_loss": -6.643773078918457, "global_step": 131722, "epoch": 3136} {"train_loss": -6.608624458312988, "global_step": 131723, "epoch": 3136} {"train_loss": -6.736567497253418, "global_step": 131724, "epoch": 3136} {"train_loss": -6.724721908569336, "global_step": 131725, "epoch": 3136} {"train_loss": -6.549675464630127, "global_step": 131726, "epoch": 3136} {"train_loss": -6.667836666107178, "global_step": 131727, "epoch": 3136} {"train_loss": -6.671283721923828, "global_step": 131728, "epoch": 3136} {"train_loss": -6.598836898803711, "global_step": 131729, "epoch": 3136} {"train_loss": -6.657422065734863, "global_step": 131730, "epoch": 3136} {"train_loss": -6.583902835845947, "global_step": 131731, "epoch": 3136} {"train_loss": -6.635053634643555, "global_step": 131732, "epoch": 3136} {"train_loss": -6.5717573165893555, "global_step": 131733, "epoch": 3136} {"train_loss": -6.701043605804443, "global_step": 131734, "epoch": 3136} {"train_loss": -6.612991809844971, "global_step": 131735, "epoch": 3136} {"train_loss": -6.7707109451293945, "global_step": 131736, "epoch": 3136} {"train_loss": -6.708550453186035, "global_step": 131737, "epoch": 3136} {"train_loss": -6.688918113708496, "global_step": 131738, "epoch": 3136} {"train_loss": -6.78282356262207, "global_step": 131739, "epoch": 3136} {"train_loss": -6.643832206726074, "global_step": 131740, "epoch": 3136} {"train_loss": -6.692705154418945, "global_step": 131741, "epoch": 3136} {"train_loss": -6.6891584396362305, "global_step": 131742, "epoch": 3136} {"train_loss": -6.655285835266113, "global_step": 131743, "epoch": 3136} {"train_loss": -6.5122599601745605, "global_step": 131744, "epoch": 3136} {"train_loss": -6.683780193328857, "global_step": 131745, "epoch": 3136} {"train_loss": -6.775051116943359, "global_step": 131746, "epoch": 3136} {"train_loss": -6.740194320678711, "global_step": 131747, "epoch": 3136} {"train_loss": -6.706218719482422, "global_step": 131748, "epoch": 3136} {"train_loss": -6.748821258544922, "global_step": 131749, "epoch": 3136} {"train_loss": -6.542329788208008, "global_step": 131750, "epoch": 3136} {"train_loss": -6.658304691314697, "global_step": 131751, "epoch": 3136} {"train_loss": -6.755456447601318, "global_step": 131752, "epoch": 3136} {"train_loss": -6.67602937562125, "global_step": 131753, "epoch": 3136, "val_loss": 66810.1953125} {"train_loss": -6.747285842895508, "global_step": 131754, "epoch": 3137} {"train_loss": -6.77853536605835, "global_step": 131755, "epoch": 3137} {"train_loss": -6.6923651695251465, "global_step": 131756, "epoch": 3137} {"train_loss": -6.642519950866699, "global_step": 131757, "epoch": 3137} {"train_loss": -6.732909202575684, "global_step": 131758, "epoch": 3137} {"train_loss": -6.79281759262085, "global_step": 131759, "epoch": 3137} {"train_loss": -6.749773025512695, "global_step": 131760, "epoch": 3137} {"train_loss": -6.6834330558776855, "global_step": 131761, "epoch": 3137} {"train_loss": -6.780697822570801, "global_step": 131762, "epoch": 3137} {"train_loss": -6.705909729003906, "global_step": 131763, "epoch": 3137} {"train_loss": -6.647166728973389, "global_step": 131764, "epoch": 3137} {"train_loss": -6.6875104904174805, "global_step": 131765, "epoch": 3137} {"train_loss": -6.693905830383301, "global_step": 131766, "epoch": 3137} {"train_loss": -6.7631988525390625, "global_step": 131767, "epoch": 3137} {"train_loss": -6.534566879272461, "global_step": 131768, "epoch": 3137} {"train_loss": -6.765087127685547, "global_step": 131769, "epoch": 3137} {"train_loss": -6.683823108673096, "global_step": 131770, "epoch": 3137} {"train_loss": -6.630149841308594, "global_step": 131771, "epoch": 3137} {"train_loss": -6.744773864746094, "global_step": 131772, "epoch": 3137} {"train_loss": -6.694993019104004, "global_step": 131773, "epoch": 3137} {"train_loss": -6.6979217529296875, "global_step": 131774, "epoch": 3137} {"train_loss": -6.619666576385498, "global_step": 131775, "epoch": 3137} {"train_loss": -6.654757499694824, "global_step": 131776, "epoch": 3137} {"train_loss": -6.6442060470581055, "global_step": 131777, "epoch": 3137} {"train_loss": -6.624245643615723, "global_step": 131778, "epoch": 3137} {"train_loss": -6.618102073669434, "global_step": 131779, "epoch": 3137} {"train_loss": -6.720005989074707, "global_step": 131780, "epoch": 3137} {"train_loss": -6.613015174865723, "global_step": 131781, "epoch": 3137} {"train_loss": -6.621699333190918, "global_step": 131782, "epoch": 3137} {"train_loss": -6.644959449768066, "global_step": 131783, "epoch": 3137} {"train_loss": -6.706813335418701, "global_step": 131784, "epoch": 3137} {"train_loss": -6.624485015869141, "global_step": 131785, "epoch": 3137} {"train_loss": -6.621636867523193, "global_step": 131786, "epoch": 3137} {"train_loss": -6.57181453704834, "global_step": 131787, "epoch": 3137} {"train_loss": -6.703769683837891, "global_step": 131788, "epoch": 3137} {"train_loss": -6.665589809417725, "global_step": 131789, "epoch": 3137} {"train_loss": -6.701333999633789, "global_step": 131790, "epoch": 3137} {"train_loss": -6.667579650878906, "global_step": 131791, "epoch": 3137} {"train_loss": -6.562540054321289, "global_step": 131792, "epoch": 3137} {"train_loss": -6.577843189239502, "global_step": 131793, "epoch": 3137} {"train_loss": -6.735964298248291, "global_step": 131794, "epoch": 3137} {"train_loss": -6.67602649189177, "global_step": 131795, "epoch": 3137, "val_loss": 66766.2421875} {"train_loss": -6.767184257507324, "global_step": 131796, "epoch": 3138} {"train_loss": -6.624602317810059, "global_step": 131797, "epoch": 3138} {"train_loss": -6.690339088439941, "global_step": 131798, "epoch": 3138} {"train_loss": -6.73576021194458, "global_step": 131799, "epoch": 3138} {"train_loss": -6.699475288391113, "global_step": 131800, "epoch": 3138} {"train_loss": -6.783339977264404, "global_step": 131801, "epoch": 3138} {"train_loss": -6.716699600219727, "global_step": 131802, "epoch": 3138} {"train_loss": -6.664600372314453, "global_step": 131803, "epoch": 3138} {"train_loss": -6.711480140686035, "global_step": 131804, "epoch": 3138} {"train_loss": -6.633653163909912, "global_step": 131805, "epoch": 3138} {"train_loss": -6.750887870788574, "global_step": 131806, "epoch": 3138} {"train_loss": -6.668630123138428, "global_step": 131807, "epoch": 3138} {"train_loss": -6.605106353759766, "global_step": 131808, "epoch": 3138} {"train_loss": -6.659092426300049, "global_step": 131809, "epoch": 3138} {"train_loss": -6.718442916870117, "global_step": 131810, "epoch": 3138} {"train_loss": -6.874190330505371, "global_step": 131811, "epoch": 3138} {"train_loss": -6.69029426574707, "global_step": 131812, "epoch": 3138} {"train_loss": -6.714117050170898, "global_step": 131813, "epoch": 3138} {"train_loss": -6.65414571762085, "global_step": 131814, "epoch": 3138} {"train_loss": -6.62565803527832, "global_step": 131815, "epoch": 3138} {"train_loss": -6.792551040649414, "global_step": 131816, "epoch": 3138} {"train_loss": -6.69016170501709, "global_step": 131817, "epoch": 3138} {"train_loss": -6.663919448852539, "global_step": 131818, "epoch": 3138} {"train_loss": -6.695213794708252, "global_step": 131819, "epoch": 3138} {"train_loss": -6.671703338623047, "global_step": 131820, "epoch": 3138} {"train_loss": -6.683189392089844, "global_step": 131821, "epoch": 3138} {"train_loss": -6.672243118286133, "global_step": 131822, "epoch": 3138} {"train_loss": -6.662142753601074, "global_step": 131823, "epoch": 3138} {"train_loss": -6.779235363006592, "global_step": 131824, "epoch": 3138} {"train_loss": -6.639293670654297, "global_step": 131825, "epoch": 3138} {"train_loss": -6.625772953033447, "global_step": 131826, "epoch": 3138} {"train_loss": -6.763877868652344, "global_step": 131827, "epoch": 3138} {"train_loss": -6.6602678298950195, "global_step": 131828, "epoch": 3138} {"train_loss": -6.638739109039307, "global_step": 131829, "epoch": 3138} {"train_loss": -6.7114763259887695, "global_step": 131830, "epoch": 3138} {"train_loss": -6.6017374992370605, "global_step": 131831, "epoch": 3138} {"train_loss": -6.66648530960083, "global_step": 131832, "epoch": 3138} {"train_loss": -6.724976062774658, "global_step": 131833, "epoch": 3138} {"train_loss": -6.724311828613281, "global_step": 131834, "epoch": 3138} {"train_loss": -6.568537712097168, "global_step": 131835, "epoch": 3138} {"train_loss": -6.6741814613342285, "global_step": 131836, "epoch": 3138} {"train_loss": -6.6880955923171275, "global_step": 131837, "epoch": 3138, "val_loss": 66923.7421875} {"train_loss": -6.768609523773193, "global_step": 131838, "epoch": 3139} {"train_loss": -6.624579906463623, "global_step": 131839, "epoch": 3139} {"train_loss": -6.6159210205078125, "global_step": 131840, "epoch": 3139} {"train_loss": -6.637917518615723, "global_step": 131841, "epoch": 3139} {"train_loss": -6.595829010009766, "global_step": 131842, "epoch": 3139} {"train_loss": -6.676970958709717, "global_step": 131843, "epoch": 3139} {"train_loss": -6.440370559692383, "global_step": 131844, "epoch": 3139} {"train_loss": -6.744274139404297, "global_step": 131845, "epoch": 3139} {"train_loss": -6.453575134277344, "global_step": 131846, "epoch": 3139} {"train_loss": -6.538280963897705, "global_step": 131847, "epoch": 3139} {"train_loss": -6.615085601806641, "global_step": 131848, "epoch": 3139} {"train_loss": -6.610081672668457, "global_step": 131849, "epoch": 3139} {"train_loss": -6.639125347137451, "global_step": 131850, "epoch": 3139} {"train_loss": -6.643482208251953, "global_step": 131851, "epoch": 3139} {"train_loss": -6.601995944976807, "global_step": 131852, "epoch": 3139} {"train_loss": -6.687865257263184, "global_step": 131853, "epoch": 3139} {"train_loss": -6.599429130554199, "global_step": 131854, "epoch": 3139} {"train_loss": -6.739899635314941, "global_step": 131855, "epoch": 3139} {"train_loss": -6.6928300857543945, "global_step": 131856, "epoch": 3139} {"train_loss": -6.694970607757568, "global_step": 131857, "epoch": 3139} {"train_loss": -6.611428260803223, "global_step": 131858, "epoch": 3139} {"train_loss": -6.746996879577637, "global_step": 131859, "epoch": 3139} {"train_loss": -6.617831707000732, "global_step": 131860, "epoch": 3139} {"train_loss": -6.699108123779297, "global_step": 131861, "epoch": 3139} {"train_loss": -6.780849456787109, "global_step": 131862, "epoch": 3139} {"train_loss": -6.641597747802734, "global_step": 131863, "epoch": 3139} {"train_loss": -6.729391574859619, "global_step": 131864, "epoch": 3139} {"train_loss": -6.6810503005981445, "global_step": 131865, "epoch": 3139} {"train_loss": -6.7715301513671875, "global_step": 131866, "epoch": 3139} {"train_loss": -6.581874847412109, "global_step": 131867, "epoch": 3139} {"train_loss": -6.676688194274902, "global_step": 131868, "epoch": 3139} {"train_loss": -6.5788655281066895, "global_step": 131869, "epoch": 3139} {"train_loss": -6.587631702423096, "global_step": 131870, "epoch": 3139} {"train_loss": -6.708662033081055, "global_step": 131871, "epoch": 3139} {"train_loss": -6.610561370849609, "global_step": 131872, "epoch": 3139} {"train_loss": -6.745981216430664, "global_step": 131873, "epoch": 3139} {"train_loss": -6.6983819007873535, "global_step": 131874, "epoch": 3139} {"train_loss": -6.707051753997803, "global_step": 131875, "epoch": 3139} {"train_loss": -6.653916358947754, "global_step": 131876, "epoch": 3139} {"train_loss": -6.7044219970703125, "global_step": 131877, "epoch": 3139} {"train_loss": -6.687969207763672, "global_step": 131878, "epoch": 3139} {"train_loss": -6.657206955410185, "global_step": 131879, "epoch": 3139, "val_loss": 66588.125} {"train_loss": -6.757449150085449, "global_step": 131880, "epoch": 3140} {"train_loss": -6.8146491050720215, "global_step": 131881, "epoch": 3140} {"train_loss": -6.675112724304199, "global_step": 131882, "epoch": 3140} {"train_loss": -6.730775833129883, "global_step": 131883, "epoch": 3140} {"train_loss": -6.666492938995361, "global_step": 131884, "epoch": 3140} {"train_loss": -6.824119567871094, "global_step": 131885, "epoch": 3140} {"train_loss": -6.792391777038574, "global_step": 131886, "epoch": 3140} {"train_loss": -6.753458023071289, "global_step": 131887, "epoch": 3140} {"train_loss": -6.679587364196777, "global_step": 131888, "epoch": 3140} {"train_loss": -6.88451623916626, "global_step": 131889, "epoch": 3140} {"train_loss": -6.6730804443359375, "global_step": 131890, "epoch": 3140} {"train_loss": -6.817174911499023, "global_step": 131891, "epoch": 3140} {"train_loss": -6.631590843200684, "global_step": 131892, "epoch": 3140} {"train_loss": -6.757143974304199, "global_step": 131893, "epoch": 3140} {"train_loss": -6.72072696685791, "global_step": 131894, "epoch": 3140} {"train_loss": -6.531782150268555, "global_step": 131895, "epoch": 3140} {"train_loss": -6.634442329406738, "global_step": 131896, "epoch": 3140} {"train_loss": -6.448513984680176, "global_step": 131897, "epoch": 3140} {"train_loss": -6.631846904754639, "global_step": 131898, "epoch": 3140} {"train_loss": -6.633246421813965, "global_step": 131899, "epoch": 3140} {"train_loss": -6.5113043785095215, "global_step": 131900, "epoch": 3140} {"train_loss": -6.7881269454956055, "global_step": 131901, "epoch": 3140} {"train_loss": -6.7605791091918945, "global_step": 131902, "epoch": 3140} {"train_loss": -6.46131706237793, "global_step": 131903, "epoch": 3140} {"train_loss": -6.640394687652588, "global_step": 131904, "epoch": 3140} {"train_loss": -6.6444807052612305, "global_step": 131905, "epoch": 3140} {"train_loss": -6.508355140686035, "global_step": 131906, "epoch": 3140} {"train_loss": -6.660808563232422, "global_step": 131907, "epoch": 3140} {"train_loss": -6.573450088500977, "global_step": 131908, "epoch": 3140} {"train_loss": -6.638089179992676, "global_step": 131909, "epoch": 3140} {"train_loss": -6.725419998168945, "global_step": 131910, "epoch": 3140} {"train_loss": -6.607195854187012, "global_step": 131911, "epoch": 3140} {"train_loss": -6.606130123138428, "global_step": 131912, "epoch": 3140} {"train_loss": -6.630058288574219, "global_step": 131913, "epoch": 3140} {"train_loss": -6.678675651550293, "global_step": 131914, "epoch": 3140} {"train_loss": -6.633514404296875, "global_step": 131915, "epoch": 3140} {"train_loss": -6.6776862144470215, "global_step": 131916, "epoch": 3140} {"train_loss": -6.676521301269531, "global_step": 131917, "epoch": 3140} {"train_loss": -6.7031331062316895, "global_step": 131918, "epoch": 3140} {"train_loss": -6.693302154541016, "global_step": 131919, "epoch": 3140} {"train_loss": -6.643481731414795, "global_step": 131920, "epoch": 3140} {"train_loss": -6.670624732971191, "global_step": 131921, "epoch": 3140, "val_loss": 66698.703125} {"train_loss": -6.587530612945557, "global_step": 131922, "epoch": 3141} {"train_loss": -6.671572208404541, "global_step": 131923, "epoch": 3141} {"train_loss": -6.682812690734863, "global_step": 131924, "epoch": 3141} {"train_loss": -6.7084059715271, "global_step": 131925, "epoch": 3141} {"train_loss": -6.671213150024414, "global_step": 131926, "epoch": 3141} {"train_loss": -6.633832931518555, "global_step": 131927, "epoch": 3141} {"train_loss": -6.680505752563477, "global_step": 131928, "epoch": 3141} {"train_loss": -6.75263786315918, "global_step": 131929, "epoch": 3141} {"train_loss": -6.773210525512695, "global_step": 131930, "epoch": 3141} {"train_loss": -6.67746639251709, "global_step": 131931, "epoch": 3141} {"train_loss": -6.779301643371582, "global_step": 131932, "epoch": 3141} {"train_loss": -6.7415595054626465, "global_step": 131933, "epoch": 3141} {"train_loss": -6.709765911102295, "global_step": 131934, "epoch": 3141} {"train_loss": -6.610875129699707, "global_step": 131935, "epoch": 3141} {"train_loss": -6.759953022003174, "global_step": 131936, "epoch": 3141} {"train_loss": -6.69215202331543, "global_step": 131937, "epoch": 3141} {"train_loss": -6.685778617858887, "global_step": 131938, "epoch": 3141} {"train_loss": -6.767022132873535, "global_step": 131939, "epoch": 3141} {"train_loss": -6.662703990936279, "global_step": 131940, "epoch": 3141} {"train_loss": -6.795915126800537, "global_step": 131941, "epoch": 3141} {"train_loss": -6.793868064880371, "global_step": 131942, "epoch": 3141} {"train_loss": -6.567971229553223, "global_step": 131943, "epoch": 3141} {"train_loss": -6.749381065368652, "global_step": 131944, "epoch": 3141} {"train_loss": -6.755902290344238, "global_step": 131945, "epoch": 3141} {"train_loss": -6.641615867614746, "global_step": 131946, "epoch": 3141} {"train_loss": -6.695837020874023, "global_step": 131947, "epoch": 3141} {"train_loss": -6.673023223876953, "global_step": 131948, "epoch": 3141} {"train_loss": -6.76576042175293, "global_step": 131949, "epoch": 3141} {"train_loss": -6.760809898376465, "global_step": 131950, "epoch": 3141} {"train_loss": -6.605992317199707, "global_step": 131951, "epoch": 3141} {"train_loss": -6.6955695152282715, "global_step": 131952, "epoch": 3141} {"train_loss": -6.78269100189209, "global_step": 131953, "epoch": 3141} {"train_loss": -6.660620212554932, "global_step": 131954, "epoch": 3141} {"train_loss": -6.581416606903076, "global_step": 131955, "epoch": 3141} {"train_loss": -6.564188480377197, "global_step": 131956, "epoch": 3141} {"train_loss": -6.535651683807373, "global_step": 131957, "epoch": 3141} {"train_loss": -6.7784013748168945, "global_step": 131958, "epoch": 3141} {"train_loss": -6.626517295837402, "global_step": 131959, "epoch": 3141} {"train_loss": -6.6218366622924805, "global_step": 131960, "epoch": 3141} {"train_loss": -6.649413108825684, "global_step": 131961, "epoch": 3141} {"train_loss": -6.707670211791992, "global_step": 131962, "epoch": 3141} {"train_loss": -6.690733137584868, "global_step": 131963, "epoch": 3141, "val_loss": 66726.890625} {"train_loss": -6.641020774841309, "global_step": 131964, "epoch": 3142} {"train_loss": -6.689621925354004, "global_step": 131965, "epoch": 3142} {"train_loss": -6.673407077789307, "global_step": 131966, "epoch": 3142} {"train_loss": -6.744471549987793, "global_step": 131967, "epoch": 3142} {"train_loss": -6.6862874031066895, "global_step": 131968, "epoch": 3142} {"train_loss": -6.656576156616211, "global_step": 131969, "epoch": 3142} {"train_loss": -6.7229132652282715, "global_step": 131970, "epoch": 3142} {"train_loss": -6.77048397064209, "global_step": 131971, "epoch": 3142} {"train_loss": -6.782556533813477, "global_step": 131972, "epoch": 3142} {"train_loss": -6.648131370544434, "global_step": 131973, "epoch": 3142} {"train_loss": -6.785726547241211, "global_step": 131974, "epoch": 3142} {"train_loss": -6.675120830535889, "global_step": 131975, "epoch": 3142} {"train_loss": -6.586380481719971, "global_step": 131976, "epoch": 3142} {"train_loss": -6.717771530151367, "global_step": 131977, "epoch": 3142} {"train_loss": -6.836126327514648, "global_step": 131978, "epoch": 3142} {"train_loss": -6.651068687438965, "global_step": 131979, "epoch": 3142} {"train_loss": -6.86450719833374, "global_step": 131980, "epoch": 3142} {"train_loss": -6.732166290283203, "global_step": 131981, "epoch": 3142} {"train_loss": -6.707541465759277, "global_step": 131982, "epoch": 3142} {"train_loss": -6.746868133544922, "global_step": 131983, "epoch": 3142} {"train_loss": -6.729311943054199, "global_step": 131984, "epoch": 3142} {"train_loss": -6.706763744354248, "global_step": 131985, "epoch": 3142} {"train_loss": -6.721875190734863, "global_step": 131986, "epoch": 3142} {"train_loss": -6.716763973236084, "global_step": 131987, "epoch": 3142} {"train_loss": -6.8630475997924805, "global_step": 131988, "epoch": 3142} {"train_loss": -6.688774108886719, "global_step": 131989, "epoch": 3142} {"train_loss": -6.60500431060791, "global_step": 131990, "epoch": 3142} {"train_loss": -6.73028564453125, "global_step": 131991, "epoch": 3142} {"train_loss": -6.737679958343506, "global_step": 131992, "epoch": 3142} {"train_loss": -6.609025955200195, "global_step": 131993, "epoch": 3142} {"train_loss": -6.755630970001221, "global_step": 131994, "epoch": 3142} {"train_loss": -6.711954593658447, "global_step": 131995, "epoch": 3142} {"train_loss": -6.752939701080322, "global_step": 131996, "epoch": 3142} {"train_loss": -6.6742730140686035, "global_step": 131997, "epoch": 3142} {"train_loss": -6.631685256958008, "global_step": 131998, "epoch": 3142} {"train_loss": -6.74693489074707, "global_step": 131999, "epoch": 3142} {"train_loss": -6.5695295333862305, "global_step": 132000, "epoch": 3142} {"train_loss": -6.786101341247559, "global_step": 132001, "epoch": 3142} {"train_loss": -6.711139678955078, "global_step": 132002, "epoch": 3142} {"train_loss": -6.760002136230469, "global_step": 132003, "epoch": 3142} {"train_loss": -6.630590438842773, "global_step": 132004, "epoch": 3142} {"train_loss": -6.71112280800229, "global_step": 132005, "epoch": 3142, "val_loss": 66574.6015625} {"train_loss": -6.703636169433594, "global_step": 132006, "epoch": 3143} {"train_loss": -6.733152389526367, "global_step": 132007, "epoch": 3143} {"train_loss": -6.686617851257324, "global_step": 132008, "epoch": 3143} {"train_loss": -6.654177665710449, "global_step": 132009, "epoch": 3143} {"train_loss": -6.536028861999512, "global_step": 132010, "epoch": 3143} {"train_loss": -6.675426959991455, "global_step": 132011, "epoch": 3143} {"train_loss": -6.685301780700684, "global_step": 132012, "epoch": 3143} {"train_loss": -6.736560821533203, "global_step": 132013, "epoch": 3143} {"train_loss": -6.773022651672363, "global_step": 132014, "epoch": 3143} {"train_loss": -6.793890953063965, "global_step": 132015, "epoch": 3143} {"train_loss": -6.789758682250977, "global_step": 132016, "epoch": 3143} {"train_loss": -6.753807544708252, "global_step": 132017, "epoch": 3143} {"train_loss": -6.618033409118652, "global_step": 132018, "epoch": 3143} {"train_loss": -6.725152492523193, "global_step": 132019, "epoch": 3143} {"train_loss": -6.797810077667236, "global_step": 132020, "epoch": 3143} {"train_loss": -6.705420017242432, "global_step": 132021, "epoch": 3143} {"train_loss": -6.7526373863220215, "global_step": 132022, "epoch": 3143} {"train_loss": -6.705763816833496, "global_step": 132023, "epoch": 3143} {"train_loss": -6.7011213302612305, "global_step": 132024, "epoch": 3143} {"train_loss": -6.7121992111206055, "global_step": 132025, "epoch": 3143} {"train_loss": -6.759866714477539, "global_step": 132026, "epoch": 3143} {"train_loss": -6.700305938720703, "global_step": 132027, "epoch": 3143} {"train_loss": -6.646694183349609, "global_step": 132028, "epoch": 3143} {"train_loss": -6.6677565574646, "global_step": 132029, "epoch": 3143} {"train_loss": -6.629343032836914, "global_step": 132030, "epoch": 3143} {"train_loss": -6.593036651611328, "global_step": 132031, "epoch": 3143} {"train_loss": -6.624774932861328, "global_step": 132032, "epoch": 3143} {"train_loss": -6.741485595703125, "global_step": 132033, "epoch": 3143} {"train_loss": -6.725075721740723, "global_step": 132034, "epoch": 3143} {"train_loss": -6.562848091125488, "global_step": 132035, "epoch": 3143} {"train_loss": -6.680051326751709, "global_step": 132036, "epoch": 3143} {"train_loss": -6.581638336181641, "global_step": 132037, "epoch": 3143} {"train_loss": -6.660811424255371, "global_step": 132038, "epoch": 3143} {"train_loss": -6.732314586639404, "global_step": 132039, "epoch": 3143} {"train_loss": -6.712810516357422, "global_step": 132040, "epoch": 3143} {"train_loss": -6.667578220367432, "global_step": 132041, "epoch": 3143} {"train_loss": -6.696459770202637, "global_step": 132042, "epoch": 3143} {"train_loss": -6.72078275680542, "global_step": 132043, "epoch": 3143} {"train_loss": -6.774660110473633, "global_step": 132044, "epoch": 3143} {"train_loss": -6.816367149353027, "global_step": 132045, "epoch": 3143} {"train_loss": -6.672124862670898, "global_step": 132046, "epoch": 3143} {"train_loss": -6.69929457846142, "global_step": 132047, "epoch": 3143, "val_loss": 66813.4375} {"train_loss": -6.731400489807129, "global_step": 132048, "epoch": 3144} {"train_loss": -6.8109025955200195, "global_step": 132049, "epoch": 3144} {"train_loss": -6.797523498535156, "global_step": 132050, "epoch": 3144} {"train_loss": -6.734811782836914, "global_step": 132051, "epoch": 3144} {"train_loss": -6.777373790740967, "global_step": 132052, "epoch": 3144} {"train_loss": -6.70017147064209, "global_step": 132053, "epoch": 3144} {"train_loss": -6.745767116546631, "global_step": 132054, "epoch": 3144} {"train_loss": -6.709197044372559, "global_step": 132055, "epoch": 3144} {"train_loss": -6.755285739898682, "global_step": 132056, "epoch": 3144} {"train_loss": -6.677243232727051, "global_step": 132057, "epoch": 3144} {"train_loss": -6.737687110900879, "global_step": 132058, "epoch": 3144} {"train_loss": -6.636140823364258, "global_step": 132059, "epoch": 3144} {"train_loss": -6.604282379150391, "global_step": 132060, "epoch": 3144} {"train_loss": -6.703968048095703, "global_step": 132061, "epoch": 3144} {"train_loss": -6.647942066192627, "global_step": 132062, "epoch": 3144} {"train_loss": -6.6753435134887695, "global_step": 132063, "epoch": 3144} {"train_loss": -6.675771236419678, "global_step": 132064, "epoch": 3144} {"train_loss": -6.782262325286865, "global_step": 132065, "epoch": 3144} {"train_loss": -6.744248390197754, "global_step": 132066, "epoch": 3144} {"train_loss": -6.716197490692139, "global_step": 132067, "epoch": 3144} {"train_loss": -6.6114912033081055, "global_step": 132068, "epoch": 3144} {"train_loss": -6.731757640838623, "global_step": 132069, "epoch": 3144} {"train_loss": -6.699027061462402, "global_step": 132070, "epoch": 3144} {"train_loss": -6.665676116943359, "global_step": 132071, "epoch": 3144} {"train_loss": -6.7338104248046875, "global_step": 132072, "epoch": 3144} {"train_loss": -6.6360392570495605, "global_step": 132073, "epoch": 3144} {"train_loss": -6.632055282592773, "global_step": 132074, "epoch": 3144} {"train_loss": -6.649807929992676, "global_step": 132075, "epoch": 3144} {"train_loss": -6.626579761505127, "global_step": 132076, "epoch": 3144} {"train_loss": -6.6592183113098145, "global_step": 132077, "epoch": 3144} {"train_loss": -6.740123748779297, "global_step": 132078, "epoch": 3144} {"train_loss": -6.667257308959961, "global_step": 132079, "epoch": 3144} {"train_loss": -6.659981727600098, "global_step": 132080, "epoch": 3144} {"train_loss": -6.790032386779785, "global_step": 132081, "epoch": 3144} {"train_loss": -6.63309383392334, "global_step": 132082, "epoch": 3144} {"train_loss": -6.652403354644775, "global_step": 132083, "epoch": 3144} {"train_loss": -6.696407794952393, "global_step": 132084, "epoch": 3144} {"train_loss": -6.677398681640625, "global_step": 132085, "epoch": 3144} {"train_loss": -6.776022911071777, "global_step": 132086, "epoch": 3144} {"train_loss": -6.765530586242676, "global_step": 132087, "epoch": 3144} {"train_loss": -6.5528459548950195, "global_step": 132088, "epoch": 3144} {"train_loss": -6.6980777354467484, "global_step": 132089, "epoch": 3144, "val_loss": 66777.921875} {"train_loss": -6.875921726226807, "global_step": 132090, "epoch": 3145} {"train_loss": -6.648029804229736, "global_step": 132091, "epoch": 3145} {"train_loss": -6.63558292388916, "global_step": 132092, "epoch": 3145} {"train_loss": -6.610828399658203, "global_step": 132093, "epoch": 3145} {"train_loss": -6.576995849609375, "global_step": 132094, "epoch": 3145} {"train_loss": -6.75355863571167, "global_step": 132095, "epoch": 3145} {"train_loss": -6.687044620513916, "global_step": 132096, "epoch": 3145} {"train_loss": -6.480252265930176, "global_step": 132097, "epoch": 3145} {"train_loss": -6.726382255554199, "global_step": 132098, "epoch": 3145} {"train_loss": -6.662789344787598, "global_step": 132099, "epoch": 3145} {"train_loss": -6.721522808074951, "global_step": 132100, "epoch": 3145} {"train_loss": -6.680362224578857, "global_step": 132101, "epoch": 3145} {"train_loss": -6.740812301635742, "global_step": 132102, "epoch": 3145} {"train_loss": -6.740383148193359, "global_step": 132103, "epoch": 3145} {"train_loss": -6.698782920837402, "global_step": 132104, "epoch": 3145} {"train_loss": -6.666524410247803, "global_step": 132105, "epoch": 3145} {"train_loss": -6.6972270011901855, "global_step": 132106, "epoch": 3145} {"train_loss": -6.626410484313965, "global_step": 132107, "epoch": 3145} {"train_loss": -6.645195007324219, "global_step": 132108, "epoch": 3145} {"train_loss": -6.615604877471924, "global_step": 132109, "epoch": 3145} {"train_loss": -6.518587112426758, "global_step": 132110, "epoch": 3145} {"train_loss": -6.549345016479492, "global_step": 132111, "epoch": 3145} {"train_loss": -6.588674068450928, "global_step": 132112, "epoch": 3145} {"train_loss": -6.692874908447266, "global_step": 132113, "epoch": 3145} {"train_loss": -6.576896667480469, "global_step": 132114, "epoch": 3145} {"train_loss": -6.5935187339782715, "global_step": 132115, "epoch": 3145} {"train_loss": -6.641269207000732, "global_step": 132116, "epoch": 3145} {"train_loss": -6.490583896636963, "global_step": 132117, "epoch": 3145} {"train_loss": -6.707217216491699, "global_step": 132118, "epoch": 3145} {"train_loss": -6.532126426696777, "global_step": 132119, "epoch": 3145} {"train_loss": -6.591667175292969, "global_step": 132120, "epoch": 3145} {"train_loss": -6.580955505371094, "global_step": 132121, "epoch": 3145} {"train_loss": -6.653668403625488, "global_step": 132122, "epoch": 3145} {"train_loss": -6.731936454772949, "global_step": 132123, "epoch": 3145} {"train_loss": -6.592521667480469, "global_step": 132124, "epoch": 3145} {"train_loss": -6.510258197784424, "global_step": 132125, "epoch": 3145} {"train_loss": -6.6810126304626465, "global_step": 132126, "epoch": 3145} {"train_loss": -6.477047443389893, "global_step": 132127, "epoch": 3145} {"train_loss": -6.701627731323242, "global_step": 132128, "epoch": 3145} {"train_loss": -6.607449531555176, "global_step": 132129, "epoch": 3145} {"train_loss": -6.623166561126709, "global_step": 132130, "epoch": 3145} {"train_loss": -6.637654327210926, "global_step": 132131, "epoch": 3145, "val_loss": 66821.3515625} {"train_loss": -6.566253662109375, "global_step": 132132, "epoch": 3146} {"train_loss": -6.649542808532715, "global_step": 132133, "epoch": 3146} {"train_loss": -6.683371067047119, "global_step": 132134, "epoch": 3146} {"train_loss": -6.672357082366943, "global_step": 132135, "epoch": 3146} {"train_loss": -6.653075218200684, "global_step": 132136, "epoch": 3146} {"train_loss": -6.527474880218506, "global_step": 132137, "epoch": 3146} {"train_loss": -6.707218170166016, "global_step": 132138, "epoch": 3146} {"train_loss": -6.682280540466309, "global_step": 132139, "epoch": 3146} {"train_loss": -6.627643585205078, "global_step": 132140, "epoch": 3146} {"train_loss": -6.639314651489258, "global_step": 132141, "epoch": 3146} {"train_loss": -6.693868637084961, "global_step": 132142, "epoch": 3146} {"train_loss": -6.6304426193237305, "global_step": 132143, "epoch": 3146} {"train_loss": -6.6383819580078125, "global_step": 132144, "epoch": 3146} {"train_loss": -6.699240207672119, "global_step": 132145, "epoch": 3146} {"train_loss": -6.752158164978027, "global_step": 132146, "epoch": 3146} {"train_loss": -6.70603609085083, "global_step": 132147, "epoch": 3146} {"train_loss": -6.6798295974731445, "global_step": 132148, "epoch": 3146} {"train_loss": -6.689723491668701, "global_step": 132149, "epoch": 3146} {"train_loss": -6.661937713623047, "global_step": 132150, "epoch": 3146} {"train_loss": -6.590601444244385, "global_step": 132151, "epoch": 3146} {"train_loss": -6.686313152313232, "global_step": 132152, "epoch": 3146} {"train_loss": -6.771491050720215, "global_step": 132153, "epoch": 3146} {"train_loss": -6.684118270874023, "global_step": 132154, "epoch": 3146} {"train_loss": -6.650274753570557, "global_step": 132155, "epoch": 3146} {"train_loss": -6.697756767272949, "global_step": 132156, "epoch": 3146} {"train_loss": -6.8462114334106445, "global_step": 132157, "epoch": 3146} {"train_loss": -6.736734390258789, "global_step": 132158, "epoch": 3146} {"train_loss": -6.753386497497559, "global_step": 132159, "epoch": 3146} {"train_loss": -6.6957855224609375, "global_step": 132160, "epoch": 3146} {"train_loss": -6.860230922698975, "global_step": 132161, "epoch": 3146} {"train_loss": -6.677588939666748, "global_step": 132162, "epoch": 3146} {"train_loss": -6.729255676269531, "global_step": 132163, "epoch": 3146} {"train_loss": -6.812300682067871, "global_step": 132164, "epoch": 3146} {"train_loss": -6.796607494354248, "global_step": 132165, "epoch": 3146} {"train_loss": -6.783992767333984, "global_step": 132166, "epoch": 3146} {"train_loss": -6.741053581237793, "global_step": 132167, "epoch": 3146} {"train_loss": -6.675204753875732, "global_step": 132168, "epoch": 3146} {"train_loss": -6.717781066894531, "global_step": 132169, "epoch": 3146} {"train_loss": -6.765190601348877, "global_step": 132170, "epoch": 3146} {"train_loss": -6.6581010818481445, "global_step": 132171, "epoch": 3146} {"train_loss": -6.595970153808594, "global_step": 132172, "epoch": 3146} {"train_loss": -6.692757947104318, "global_step": 132173, "epoch": 3146, "val_loss": 66657.8203125} {"train_loss": -6.705402851104736, "global_step": 132174, "epoch": 3147} {"train_loss": -6.908451080322266, "global_step": 132175, "epoch": 3147} {"train_loss": -6.653074264526367, "global_step": 132176, "epoch": 3147} {"train_loss": -6.813551902770996, "global_step": 132177, "epoch": 3147} {"train_loss": -6.671530723571777, "global_step": 132178, "epoch": 3147} {"train_loss": -6.717545986175537, "global_step": 132179, "epoch": 3147} {"train_loss": -6.548852920532227, "global_step": 132180, "epoch": 3147} {"train_loss": -6.63477897644043, "global_step": 132181, "epoch": 3147} {"train_loss": -6.628789901733398, "global_step": 132182, "epoch": 3147} {"train_loss": -6.5257568359375, "global_step": 132183, "epoch": 3147} {"train_loss": -6.5814971923828125, "global_step": 132184, "epoch": 3147} {"train_loss": -6.711021423339844, "global_step": 132185, "epoch": 3147} {"train_loss": -6.393016338348389, "global_step": 132186, "epoch": 3147} {"train_loss": -6.594352722167969, "global_step": 132187, "epoch": 3147} {"train_loss": -6.630031108856201, "global_step": 132188, "epoch": 3147} {"train_loss": -6.465815544128418, "global_step": 132189, "epoch": 3147} {"train_loss": -6.661672592163086, "global_step": 132190, "epoch": 3147} {"train_loss": -6.337156772613525, "global_step": 132191, "epoch": 3147} {"train_loss": -6.564601898193359, "global_step": 132192, "epoch": 3147} {"train_loss": -6.625755786895752, "global_step": 132193, "epoch": 3147} {"train_loss": -6.465754508972168, "global_step": 132194, "epoch": 3147} {"train_loss": -6.7067108154296875, "global_step": 132195, "epoch": 3147} {"train_loss": -6.633930683135986, "global_step": 132196, "epoch": 3147} {"train_loss": -6.735755443572998, "global_step": 132197, "epoch": 3147} {"train_loss": -6.60394811630249, "global_step": 132198, "epoch": 3147} {"train_loss": -6.706143379211426, "global_step": 132199, "epoch": 3147} {"train_loss": -6.74432897567749, "global_step": 132200, "epoch": 3147} {"train_loss": -6.596522331237793, "global_step": 132201, "epoch": 3147} {"train_loss": -6.710474491119385, "global_step": 132202, "epoch": 3147} {"train_loss": -6.698643207550049, "global_step": 132203, "epoch": 3147} {"train_loss": -6.698680877685547, "global_step": 132204, "epoch": 3147} {"train_loss": -6.7755327224731445, "global_step": 132205, "epoch": 3147} {"train_loss": -6.660732269287109, "global_step": 132206, "epoch": 3147} {"train_loss": -6.647078514099121, "global_step": 132207, "epoch": 3147} {"train_loss": -6.602022171020508, "global_step": 132208, "epoch": 3147} {"train_loss": -6.76041316986084, "global_step": 132209, "epoch": 3147} {"train_loss": -6.892116546630859, "global_step": 132210, "epoch": 3147} {"train_loss": -6.758270263671875, "global_step": 132211, "epoch": 3147} {"train_loss": -6.626546382904053, "global_step": 132212, "epoch": 3147} {"train_loss": -6.820761680603027, "global_step": 132213, "epoch": 3147} {"train_loss": -6.629083156585693, "global_step": 132214, "epoch": 3147} {"train_loss": -6.655888761792864, "global_step": 132215, "epoch": 3147, "val_loss": 66782.71875} {"train_loss": -6.6294426918029785, "global_step": 132216, "epoch": 3148} {"train_loss": -6.634235858917236, "global_step": 132217, "epoch": 3148} {"train_loss": -6.712691307067871, "global_step": 132218, "epoch": 3148} {"train_loss": -6.655605316162109, "global_step": 132219, "epoch": 3148} {"train_loss": -6.666181564331055, "global_step": 132220, "epoch": 3148} {"train_loss": -6.724395275115967, "global_step": 132221, "epoch": 3148} {"train_loss": -6.677487373352051, "global_step": 132222, "epoch": 3148} {"train_loss": -6.684385776519775, "global_step": 132223, "epoch": 3148} {"train_loss": -6.763393402099609, "global_step": 132224, "epoch": 3148} {"train_loss": -6.710369110107422, "global_step": 132225, "epoch": 3148} {"train_loss": -6.826849937438965, "global_step": 132226, "epoch": 3148} {"train_loss": -6.697582721710205, "global_step": 132227, "epoch": 3148} {"train_loss": -6.806883811950684, "global_step": 132228, "epoch": 3148} {"train_loss": -6.65942907333374, "global_step": 132229, "epoch": 3148} {"train_loss": -6.80704927444458, "global_step": 132230, "epoch": 3148} {"train_loss": -6.698897361755371, "global_step": 132231, "epoch": 3148} {"train_loss": -6.742854118347168, "global_step": 132232, "epoch": 3148} {"train_loss": -6.626946926116943, "global_step": 132233, "epoch": 3148} {"train_loss": -6.693276405334473, "global_step": 132234, "epoch": 3148} {"train_loss": -6.6700334548950195, "global_step": 132235, "epoch": 3148} {"train_loss": -6.761477470397949, "global_step": 132236, "epoch": 3148} {"train_loss": -6.585220813751221, "global_step": 132237, "epoch": 3148} {"train_loss": -6.678811073303223, "global_step": 132238, "epoch": 3148} {"train_loss": -6.716925621032715, "global_step": 132239, "epoch": 3148} {"train_loss": -6.777377605438232, "global_step": 132240, "epoch": 3148} {"train_loss": -6.7070417404174805, "global_step": 132241, "epoch": 3148} {"train_loss": -6.712433815002441, "global_step": 132242, "epoch": 3148} {"train_loss": -6.746725559234619, "global_step": 132243, "epoch": 3148} {"train_loss": -6.616607666015625, "global_step": 132244, "epoch": 3148} {"train_loss": -6.667656898498535, "global_step": 132245, "epoch": 3148} {"train_loss": -6.740927696228027, "global_step": 132246, "epoch": 3148} {"train_loss": -6.762809753417969, "global_step": 132247, "epoch": 3148} {"train_loss": -6.777581214904785, "global_step": 132248, "epoch": 3148} {"train_loss": -6.758267402648926, "global_step": 132249, "epoch": 3148} {"train_loss": -6.730685710906982, "global_step": 132250, "epoch": 3148} {"train_loss": -6.726415157318115, "global_step": 132251, "epoch": 3148} {"train_loss": -6.774477005004883, "global_step": 132252, "epoch": 3148} {"train_loss": -6.750107765197754, "global_step": 132253, "epoch": 3148} {"train_loss": -6.736153602600098, "global_step": 132254, "epoch": 3148} {"train_loss": -6.826413154602051, "global_step": 132255, "epoch": 3148} {"train_loss": -6.705615997314453, "global_step": 132256, "epoch": 3148} {"train_loss": -6.714352971031552, "global_step": 132257, "epoch": 3148, "val_loss": 66796.078125} {"train_loss": -6.79387903213501, "global_step": 132258, "epoch": 3149} {"train_loss": -6.665157318115234, "global_step": 132259, "epoch": 3149} {"train_loss": -6.693783760070801, "global_step": 132260, "epoch": 3149} {"train_loss": -6.651006698608398, "global_step": 132261, "epoch": 3149} {"train_loss": -6.70084810256958, "global_step": 132262, "epoch": 3149} {"train_loss": -6.713618755340576, "global_step": 132263, "epoch": 3149} {"train_loss": -6.68277645111084, "global_step": 132264, "epoch": 3149} {"train_loss": -6.71340274810791, "global_step": 132265, "epoch": 3149} {"train_loss": -6.798802375793457, "global_step": 132266, "epoch": 3149} {"train_loss": -6.761872291564941, "global_step": 132267, "epoch": 3149} {"train_loss": -6.712275505065918, "global_step": 132268, "epoch": 3149} {"train_loss": -6.75252628326416, "global_step": 132269, "epoch": 3149} {"train_loss": -6.612434387207031, "global_step": 132270, "epoch": 3149} {"train_loss": -6.54954195022583, "global_step": 132271, "epoch": 3149} {"train_loss": -6.637111663818359, "global_step": 132272, "epoch": 3149} {"train_loss": -6.6265716552734375, "global_step": 132273, "epoch": 3149} {"train_loss": -6.567129611968994, "global_step": 132274, "epoch": 3149} {"train_loss": -6.575844764709473, "global_step": 132275, "epoch": 3149} {"train_loss": -6.68314266204834, "global_step": 132276, "epoch": 3149} {"train_loss": -6.582759857177734, "global_step": 132277, "epoch": 3149} {"train_loss": -6.603339195251465, "global_step": 132278, "epoch": 3149} {"train_loss": -6.563966751098633, "global_step": 132279, "epoch": 3149} {"train_loss": -6.65133810043335, "global_step": 132280, "epoch": 3149} {"train_loss": -6.5716962814331055, "global_step": 132281, "epoch": 3149} {"train_loss": -6.674983978271484, "global_step": 132282, "epoch": 3149} {"train_loss": -6.476999759674072, "global_step": 132283, "epoch": 3149} {"train_loss": -6.563081741333008, "global_step": 132284, "epoch": 3149} {"train_loss": -6.698556900024414, "global_step": 132285, "epoch": 3149} {"train_loss": -6.601101398468018, "global_step": 132286, "epoch": 3149} {"train_loss": -6.767463684082031, "global_step": 132287, "epoch": 3149} {"train_loss": -6.562559604644775, "global_step": 132288, "epoch": 3149} {"train_loss": -6.74871826171875, "global_step": 132289, "epoch": 3149} {"train_loss": -6.744710922241211, "global_step": 132290, "epoch": 3149} {"train_loss": -6.684747695922852, "global_step": 132291, "epoch": 3149} {"train_loss": -6.60119104385376, "global_step": 132292, "epoch": 3149} {"train_loss": -6.648501873016357, "global_step": 132293, "epoch": 3149} {"train_loss": -6.6542744636535645, "global_step": 132294, "epoch": 3149} {"train_loss": -6.622784614562988, "global_step": 132295, "epoch": 3149} {"train_loss": -6.7276225090026855, "global_step": 132296, "epoch": 3149} {"train_loss": -6.684305667877197, "global_step": 132297, "epoch": 3149} {"train_loss": -6.476629257202148, "global_step": 132298, "epoch": 3149} {"train_loss": -6.654437167303903, "global_step": 132299, "epoch": 3149, "val_loss": 66812.625} {"train_loss": -6.665431022644043, "global_step": 132300, "epoch": 3150} {"train_loss": -6.587302207946777, "global_step": 132301, "epoch": 3150} {"train_loss": -6.728928089141846, "global_step": 132302, "epoch": 3150} {"train_loss": -6.595682144165039, "global_step": 132303, "epoch": 3150} {"train_loss": -6.592347145080566, "global_step": 132304, "epoch": 3150} {"train_loss": -6.687216281890869, "global_step": 132305, "epoch": 3150} {"train_loss": -6.614904880523682, "global_step": 132306, "epoch": 3150} {"train_loss": -6.636611461639404, "global_step": 132307, "epoch": 3150} {"train_loss": -6.66182804107666, "global_step": 132308, "epoch": 3150} {"train_loss": -6.668673038482666, "global_step": 132309, "epoch": 3150} {"train_loss": -6.739908218383789, "global_step": 132310, "epoch": 3150} {"train_loss": -6.60306453704834, "global_step": 132311, "epoch": 3150} {"train_loss": -6.673761367797852, "global_step": 132312, "epoch": 3150} {"train_loss": -6.711697578430176, "global_step": 132313, "epoch": 3150} {"train_loss": -6.614944934844971, "global_step": 132314, "epoch": 3150} {"train_loss": -6.646568775177002, "global_step": 132315, "epoch": 3150} {"train_loss": -6.605792045593262, "global_step": 132316, "epoch": 3150} {"train_loss": -6.757107734680176, "global_step": 132317, "epoch": 3150} {"train_loss": -6.740352630615234, "global_step": 132318, "epoch": 3150} {"train_loss": -6.832513332366943, "global_step": 132319, "epoch": 3150} {"train_loss": -6.713172912597656, "global_step": 132320, "epoch": 3150} {"train_loss": -6.646393775939941, "global_step": 132321, "epoch": 3150} {"train_loss": -6.759371280670166, "global_step": 132322, "epoch": 3150} {"train_loss": -6.745953559875488, "global_step": 132323, "epoch": 3150} {"train_loss": -6.6818528175354, "global_step": 132324, "epoch": 3150} {"train_loss": -6.748909950256348, "global_step": 132325, "epoch": 3150} {"train_loss": -6.701570510864258, "global_step": 132326, "epoch": 3150} {"train_loss": -6.6953887939453125, "global_step": 132327, "epoch": 3150} {"train_loss": -6.6787261962890625, "global_step": 132328, "epoch": 3150} {"train_loss": -6.780927658081055, "global_step": 132329, "epoch": 3150} {"train_loss": -6.613059043884277, "global_step": 132330, "epoch": 3150} {"train_loss": -6.65289831161499, "global_step": 132331, "epoch": 3150} {"train_loss": -6.7489237785339355, "global_step": 132332, "epoch": 3150} {"train_loss": -6.628874778747559, "global_step": 132333, "epoch": 3150} {"train_loss": -6.737313747406006, "global_step": 132334, "epoch": 3150} {"train_loss": -6.760991096496582, "global_step": 132335, "epoch": 3150} {"train_loss": -6.625046730041504, "global_step": 132336, "epoch": 3150} {"train_loss": -6.637761116027832, "global_step": 132337, "epoch": 3150} {"train_loss": -6.619829177856445, "global_step": 132338, "epoch": 3150} {"train_loss": -6.6794586181640625, "global_step": 132339, "epoch": 3150} {"train_loss": -6.563070297241211, "global_step": 132340, "epoch": 3150} {"train_loss": -6.676765714372907, "global_step": 132341, "epoch": 3150, "train/sim_max_reward_0": 0.42543094948607585, "train/sim_max_reward_1": 0.8765500122530275, "train/sim_max_reward_2": 0.5655487398775056, "train/sim_max_reward_3": 0.3790534725025768, "train/sim_max_reward_4": 0.8805038301021463, "train/sim_max_reward_5": 0.868915179822667, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.5067542215173687, "test/sim_max_reward_4300002": 0.9445950761892348, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.5828771918861073, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.5023304668117781, "test/sim_max_reward_4300008": 0.8500822255371318, "test/sim_max_reward_4300009": 0.9482507242141853, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.32487261684830643, "test/sim_max_reward_4300012": 0.9820129953448471, "test/sim_max_reward_4300013": 0.9675336214222323, "test/sim_max_reward_4300014": 0.9412687772573202, "test/sim_max_reward_4300015": 0.9953610552698475, "test/sim_max_reward_4300016": 0.7491643494109183, "test/sim_max_reward_4300017": 0.876386468317861, "test/sim_max_reward_4300018": 0.4193944042850079, "test/sim_max_reward_4300019": 0.18351770792156633, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9223304308690937, "test/sim_max_reward_4300022": 0.6942958264646816, "test/sim_max_reward_4300023": 0.3277677208005477, "test/sim_max_reward_4300024": 0.9713252391871663, "test/sim_max_reward_4300025": 0.9063697657431963, "test/sim_max_reward_4300026": 0.17811050720091717, "test/sim_max_reward_4300027": 0.941637397589475, "test/sim_max_reward_4300028": 0.920672108778972, "test/sim_max_reward_4300029": 0.23418001578374528, "test/sim_max_reward_4300030": 0.31396781657641826, "test/sim_max_reward_4300031": 0.9392289131789149, "test/sim_max_reward_4300032": 0.9922974228744239, "test/sim_max_reward_4300033": 0.8306996957392292, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.47252213455637676, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.7800911407715271, "test/sim_max_reward_4300038": 0.4616760416238953, "test/sim_max_reward_4300039": 0.8889148686718963, "test/sim_max_reward_4300040": 0.9162057531350654, "test/sim_max_reward_4300041": 0.924842643551562, "test/sim_max_reward_4300042": 0.7172580669829246, "test/sim_max_reward_4300043": 0.14061393507685802, "test/sim_max_reward_4300044": 0.9113368604625978, "test/sim_max_reward_4300045": 0.17193361996896347, "test/sim_max_reward_4300046": 0.9147360085735852, "test/sim_max_reward_4300047": 0.9639264113512476, "test/sim_max_reward_4300048": 0.005228187117160089, "test/sim_max_reward_4300049": 0.23876581064183905, "train/mean_score": 0.6660003640073332, "test/mean_score": 0.5934072893175751, "val_loss": 66809.3515625} {"train_loss": -6.541713237762451, "global_step": 132342, "epoch": 3151} {"train_loss": -6.659422874450684, "global_step": 132343, "epoch": 3151} {"train_loss": -6.674053192138672, "global_step": 132344, "epoch": 3151} {"train_loss": -6.48574161529541, "global_step": 132345, "epoch": 3151} {"train_loss": -6.796643257141113, "global_step": 132346, "epoch": 3151} {"train_loss": -6.70969295501709, "global_step": 132347, "epoch": 3151} {"train_loss": -6.638096809387207, "global_step": 132348, "epoch": 3151} {"train_loss": -6.615984916687012, "global_step": 132349, "epoch": 3151} {"train_loss": -6.628735542297363, "global_step": 132350, "epoch": 3151} {"train_loss": -6.6767778396606445, "global_step": 132351, "epoch": 3151} {"train_loss": -6.640522003173828, "global_step": 132352, "epoch": 3151} {"train_loss": -6.706286430358887, "global_step": 132353, "epoch": 3151} {"train_loss": -6.8171820640563965, "global_step": 132354, "epoch": 3151} {"train_loss": -6.64765739440918, "global_step": 132355, "epoch": 3151} {"train_loss": -6.670793533325195, "global_step": 132356, "epoch": 3151} {"train_loss": -6.674044609069824, "global_step": 132357, "epoch": 3151} {"train_loss": -6.7384490966796875, "global_step": 132358, "epoch": 3151} {"train_loss": -6.677263259887695, "global_step": 132359, "epoch": 3151} {"train_loss": -6.558359146118164, "global_step": 132360, "epoch": 3151} {"train_loss": -6.724660873413086, "global_step": 132361, "epoch": 3151} {"train_loss": -6.688698768615723, "global_step": 132362, "epoch": 3151} {"train_loss": -6.63500452041626, "global_step": 132363, "epoch": 3151} {"train_loss": -6.746315002441406, "global_step": 132364, "epoch": 3151} {"train_loss": -6.698883056640625, "global_step": 132365, "epoch": 3151} {"train_loss": -6.679117679595947, "global_step": 132366, "epoch": 3151} {"train_loss": -6.610116958618164, "global_step": 132367, "epoch": 3151} {"train_loss": -6.670801162719727, "global_step": 132368, "epoch": 3151} {"train_loss": -6.616247177124023, "global_step": 132369, "epoch": 3151} {"train_loss": -6.553829193115234, "global_step": 132370, "epoch": 3151} {"train_loss": -6.620553970336914, "global_step": 132371, "epoch": 3151} {"train_loss": -6.723278999328613, "global_step": 132372, "epoch": 3151} {"train_loss": -6.5100908279418945, "global_step": 132373, "epoch": 3151} {"train_loss": -6.509397506713867, "global_step": 132374, "epoch": 3151} {"train_loss": -6.504613399505615, "global_step": 132375, "epoch": 3151} {"train_loss": -6.5981011390686035, "global_step": 132376, "epoch": 3151} {"train_loss": -6.612667083740234, "global_step": 132377, "epoch": 3151} {"train_loss": -6.546309471130371, "global_step": 132378, "epoch": 3151} {"train_loss": -6.708919048309326, "global_step": 132379, "epoch": 3151} {"train_loss": -6.644975662231445, "global_step": 132380, "epoch": 3151} {"train_loss": -6.55104923248291, "global_step": 132381, "epoch": 3151} {"train_loss": -6.577620029449463, "global_step": 132382, "epoch": 3151} {"train_loss": -6.638588723682222, "global_step": 132383, "epoch": 3151, "val_loss": 66608.7578125} {"train_loss": -6.702817916870117, "global_step": 132384, "epoch": 3152} {"train_loss": -6.687016487121582, "global_step": 132385, "epoch": 3152} {"train_loss": -6.7250518798828125, "global_step": 132386, "epoch": 3152} {"train_loss": -6.6890869140625, "global_step": 132387, "epoch": 3152} {"train_loss": -6.664202690124512, "global_step": 132388, "epoch": 3152} {"train_loss": -6.735576152801514, "global_step": 132389, "epoch": 3152} {"train_loss": -6.776602745056152, "global_step": 132390, "epoch": 3152} {"train_loss": -6.672399520874023, "global_step": 132391, "epoch": 3152} {"train_loss": -6.7055745124816895, "global_step": 132392, "epoch": 3152} {"train_loss": -6.6356706619262695, "global_step": 132393, "epoch": 3152} {"train_loss": -6.747750282287598, "global_step": 132394, "epoch": 3152} {"train_loss": -6.681454658508301, "global_step": 132395, "epoch": 3152} {"train_loss": -6.645346641540527, "global_step": 132396, "epoch": 3152} {"train_loss": -6.659812927246094, "global_step": 132397, "epoch": 3152} {"train_loss": -6.72712516784668, "global_step": 132398, "epoch": 3152} {"train_loss": -6.599773406982422, "global_step": 132399, "epoch": 3152} {"train_loss": -6.580289840698242, "global_step": 132400, "epoch": 3152} {"train_loss": -6.594711780548096, "global_step": 132401, "epoch": 3152} {"train_loss": -6.600682258605957, "global_step": 132402, "epoch": 3152} {"train_loss": -6.609850883483887, "global_step": 132403, "epoch": 3152} {"train_loss": -6.523444175720215, "global_step": 132404, "epoch": 3152} {"train_loss": -6.6241254806518555, "global_step": 132405, "epoch": 3152} {"train_loss": -6.543161392211914, "global_step": 132406, "epoch": 3152} {"train_loss": -6.601271629333496, "global_step": 132407, "epoch": 3152} {"train_loss": -6.7147088050842285, "global_step": 132408, "epoch": 3152} {"train_loss": -6.537734031677246, "global_step": 132409, "epoch": 3152} {"train_loss": -6.575526237487793, "global_step": 132410, "epoch": 3152} {"train_loss": -6.589788436889648, "global_step": 132411, "epoch": 3152} {"train_loss": -6.521170139312744, "global_step": 132412, "epoch": 3152} {"train_loss": -6.780264854431152, "global_step": 132413, "epoch": 3152} {"train_loss": -6.5544023513793945, "global_step": 132414, "epoch": 3152} {"train_loss": -6.607622146606445, "global_step": 132415, "epoch": 3152} {"train_loss": -6.586971282958984, "global_step": 132416, "epoch": 3152} {"train_loss": -6.589244842529297, "global_step": 132417, "epoch": 3152} {"train_loss": -6.553695201873779, "global_step": 132418, "epoch": 3152} {"train_loss": -6.683579444885254, "global_step": 132419, "epoch": 3152} {"train_loss": -6.574341773986816, "global_step": 132420, "epoch": 3152} {"train_loss": -6.5391693115234375, "global_step": 132421, "epoch": 3152} {"train_loss": -6.576362609863281, "global_step": 132422, "epoch": 3152} {"train_loss": -6.586775779724121, "global_step": 132423, "epoch": 3152} {"train_loss": -6.573642730712891, "global_step": 132424, "epoch": 3152} {"train_loss": -6.628739811125255, "global_step": 132425, "epoch": 3152, "val_loss": 66832.53125} {"train_loss": -6.657474517822266, "global_step": 132426, "epoch": 3153} {"train_loss": -6.595304489135742, "global_step": 132427, "epoch": 3153} {"train_loss": -6.723426818847656, "global_step": 132428, "epoch": 3153} {"train_loss": -6.593653678894043, "global_step": 132429, "epoch": 3153} {"train_loss": -6.7078094482421875, "global_step": 132430, "epoch": 3153} {"train_loss": -6.687243461608887, "global_step": 132431, "epoch": 3153} {"train_loss": -6.662105083465576, "global_step": 132432, "epoch": 3153} {"train_loss": -6.704841613769531, "global_step": 132433, "epoch": 3153} {"train_loss": -6.6776442527771, "global_step": 132434, "epoch": 3153} {"train_loss": -6.675095081329346, "global_step": 132435, "epoch": 3153} {"train_loss": -6.7116241455078125, "global_step": 132436, "epoch": 3153} {"train_loss": -6.6067399978637695, "global_step": 132437, "epoch": 3153} {"train_loss": -6.644287109375, "global_step": 132438, "epoch": 3153} {"train_loss": -6.639097213745117, "global_step": 132439, "epoch": 3153} {"train_loss": -6.645541191101074, "global_step": 132440, "epoch": 3153} {"train_loss": -6.550625801086426, "global_step": 132441, "epoch": 3153} {"train_loss": -6.758600234985352, "global_step": 132442, "epoch": 3153} {"train_loss": -6.707436561584473, "global_step": 132443, "epoch": 3153} {"train_loss": -6.734241485595703, "global_step": 132444, "epoch": 3153} {"train_loss": -6.776119232177734, "global_step": 132445, "epoch": 3153} {"train_loss": -6.574742317199707, "global_step": 132446, "epoch": 3153} {"train_loss": -6.805766582489014, "global_step": 132447, "epoch": 3153} {"train_loss": -6.57974100112915, "global_step": 132448, "epoch": 3153} {"train_loss": -6.759213447570801, "global_step": 132449, "epoch": 3153} {"train_loss": -6.654562473297119, "global_step": 132450, "epoch": 3153} {"train_loss": -6.622224807739258, "global_step": 132451, "epoch": 3153} {"train_loss": -6.720068454742432, "global_step": 132452, "epoch": 3153} {"train_loss": -6.644999027252197, "global_step": 132453, "epoch": 3153} {"train_loss": -6.710987091064453, "global_step": 132454, "epoch": 3153} {"train_loss": -6.716453552246094, "global_step": 132455, "epoch": 3153} {"train_loss": -6.7183122634887695, "global_step": 132456, "epoch": 3153} {"train_loss": -6.655991554260254, "global_step": 132457, "epoch": 3153} {"train_loss": -6.821233749389648, "global_step": 132458, "epoch": 3153} {"train_loss": -6.686447620391846, "global_step": 132459, "epoch": 3153} {"train_loss": -6.555965423583984, "global_step": 132460, "epoch": 3153} {"train_loss": -6.772979736328125, "global_step": 132461, "epoch": 3153} {"train_loss": -6.729626655578613, "global_step": 132462, "epoch": 3153} {"train_loss": -6.656944274902344, "global_step": 132463, "epoch": 3153} {"train_loss": -6.657422065734863, "global_step": 132464, "epoch": 3153} {"train_loss": -6.7667436599731445, "global_step": 132465, "epoch": 3153} {"train_loss": -6.721522331237793, "global_step": 132466, "epoch": 3153} {"train_loss": -6.682236330849784, "global_step": 132467, "epoch": 3153, "val_loss": 66811.8046875} {"train_loss": -6.7184247970581055, "global_step": 132468, "epoch": 3154} {"train_loss": -6.838071823120117, "global_step": 132469, "epoch": 3154} {"train_loss": -6.754135608673096, "global_step": 132470, "epoch": 3154} {"train_loss": -6.764410972595215, "global_step": 132471, "epoch": 3154} {"train_loss": -6.724486351013184, "global_step": 132472, "epoch": 3154} {"train_loss": -6.743623733520508, "global_step": 132473, "epoch": 3154} {"train_loss": -6.702147483825684, "global_step": 132474, "epoch": 3154} {"train_loss": -6.634140491485596, "global_step": 132475, "epoch": 3154} {"train_loss": -6.73870849609375, "global_step": 132476, "epoch": 3154} {"train_loss": -6.636882781982422, "global_step": 132477, "epoch": 3154} {"train_loss": -6.7563018798828125, "global_step": 132478, "epoch": 3154} {"train_loss": -6.597733020782471, "global_step": 132479, "epoch": 3154} {"train_loss": -6.687488079071045, "global_step": 132480, "epoch": 3154} {"train_loss": -6.684782981872559, "global_step": 132481, "epoch": 3154} {"train_loss": -6.680704116821289, "global_step": 132482, "epoch": 3154} {"train_loss": -6.720342636108398, "global_step": 132483, "epoch": 3154} {"train_loss": -6.769576549530029, "global_step": 132484, "epoch": 3154} {"train_loss": -6.892657279968262, "global_step": 132485, "epoch": 3154} {"train_loss": -6.597012519836426, "global_step": 132486, "epoch": 3154} {"train_loss": -6.806210517883301, "global_step": 132487, "epoch": 3154} {"train_loss": -6.722261428833008, "global_step": 132488, "epoch": 3154} {"train_loss": -6.762749671936035, "global_step": 132489, "epoch": 3154} {"train_loss": -6.759537696838379, "global_step": 132490, "epoch": 3154} {"train_loss": -6.733445644378662, "global_step": 132491, "epoch": 3154} {"train_loss": -6.662498474121094, "global_step": 132492, "epoch": 3154} {"train_loss": -6.613153457641602, "global_step": 132493, "epoch": 3154} {"train_loss": -6.634655952453613, "global_step": 132494, "epoch": 3154} {"train_loss": -6.752772808074951, "global_step": 132495, "epoch": 3154} {"train_loss": -6.786184310913086, "global_step": 132496, "epoch": 3154} {"train_loss": -6.814373970031738, "global_step": 132497, "epoch": 3154} {"train_loss": -6.778581142425537, "global_step": 132498, "epoch": 3154} {"train_loss": -6.701339244842529, "global_step": 132499, "epoch": 3154} {"train_loss": -6.722261428833008, "global_step": 132500, "epoch": 3154} {"train_loss": -6.755334377288818, "global_step": 132501, "epoch": 3154} {"train_loss": -6.644311904907227, "global_step": 132502, "epoch": 3154} {"train_loss": -6.731503486633301, "global_step": 132503, "epoch": 3154} {"train_loss": -6.7111101150512695, "global_step": 132504, "epoch": 3154} {"train_loss": -6.742363452911377, "global_step": 132505, "epoch": 3154} {"train_loss": -6.6684184074401855, "global_step": 132506, "epoch": 3154} {"train_loss": -6.797667503356934, "global_step": 132507, "epoch": 3154} {"train_loss": -6.769644737243652, "global_step": 132508, "epoch": 3154} {"train_loss": -6.726112944739206, "global_step": 132509, "epoch": 3154, "val_loss": 66613.2890625} {"train_loss": -6.731339454650879, "global_step": 132510, "epoch": 3155} {"train_loss": -6.745612621307373, "global_step": 132511, "epoch": 3155} {"train_loss": -6.78727912902832, "global_step": 132512, "epoch": 3155} {"train_loss": -6.7089738845825195, "global_step": 132513, "epoch": 3155} {"train_loss": -6.695977210998535, "global_step": 132514, "epoch": 3155} {"train_loss": -6.735619068145752, "global_step": 132515, "epoch": 3155} {"train_loss": -6.655916213989258, "global_step": 132516, "epoch": 3155} {"train_loss": -6.695584774017334, "global_step": 132517, "epoch": 3155} {"train_loss": -6.747725963592529, "global_step": 132518, "epoch": 3155} {"train_loss": -6.826846122741699, "global_step": 132519, "epoch": 3155} {"train_loss": -6.655623435974121, "global_step": 132520, "epoch": 3155} {"train_loss": -6.622259140014648, "global_step": 132521, "epoch": 3155} {"train_loss": -6.713598728179932, "global_step": 132522, "epoch": 3155} {"train_loss": -6.580133438110352, "global_step": 132523, "epoch": 3155} {"train_loss": -6.692027568817139, "global_step": 132524, "epoch": 3155} {"train_loss": -6.604378700256348, "global_step": 132525, "epoch": 3155} {"train_loss": -6.48716926574707, "global_step": 132526, "epoch": 3155} {"train_loss": -6.728471755981445, "global_step": 132527, "epoch": 3155} {"train_loss": -6.631561756134033, "global_step": 132528, "epoch": 3155} {"train_loss": -6.679689407348633, "global_step": 132529, "epoch": 3155} {"train_loss": -6.707900524139404, "global_step": 132530, "epoch": 3155} {"train_loss": -6.7658796310424805, "global_step": 132531, "epoch": 3155} {"train_loss": -6.625487327575684, "global_step": 132532, "epoch": 3155} {"train_loss": -6.642498016357422, "global_step": 132533, "epoch": 3155} {"train_loss": -6.723673343658447, "global_step": 132534, "epoch": 3155} {"train_loss": -6.696784019470215, "global_step": 132535, "epoch": 3155} {"train_loss": -6.630345344543457, "global_step": 132536, "epoch": 3155} {"train_loss": -6.652245998382568, "global_step": 132537, "epoch": 3155} {"train_loss": -6.642105579376221, "global_step": 132538, "epoch": 3155} {"train_loss": -6.72568416595459, "global_step": 132539, "epoch": 3155} {"train_loss": -6.734367370605469, "global_step": 132540, "epoch": 3155} {"train_loss": -6.613796234130859, "global_step": 132541, "epoch": 3155} {"train_loss": -6.733755111694336, "global_step": 132542, "epoch": 3155} {"train_loss": -6.563232421875, "global_step": 132543, "epoch": 3155} {"train_loss": -6.7032084465026855, "global_step": 132544, "epoch": 3155} {"train_loss": -6.812221050262451, "global_step": 132545, "epoch": 3155} {"train_loss": -6.758183479309082, "global_step": 132546, "epoch": 3155} {"train_loss": -6.700948715209961, "global_step": 132547, "epoch": 3155} {"train_loss": -6.621189594268799, "global_step": 132548, "epoch": 3155} {"train_loss": -6.7003679275512695, "global_step": 132549, "epoch": 3155} {"train_loss": -6.8493523597717285, "global_step": 132550, "epoch": 3155} {"train_loss": -6.691096339906965, "global_step": 132551, "epoch": 3155, "val_loss": 66630.203125} {"train_loss": -6.709239959716797, "global_step": 132552, "epoch": 3156} {"train_loss": -6.643640518188477, "global_step": 132553, "epoch": 3156} {"train_loss": -6.6554975509643555, "global_step": 132554, "epoch": 3156} {"train_loss": -6.633413314819336, "global_step": 132555, "epoch": 3156} {"train_loss": -6.746835708618164, "global_step": 132556, "epoch": 3156} {"train_loss": -6.709884166717529, "global_step": 132557, "epoch": 3156} {"train_loss": -6.683879852294922, "global_step": 132558, "epoch": 3156} {"train_loss": -6.7191596031188965, "global_step": 132559, "epoch": 3156} {"train_loss": -6.670409202575684, "global_step": 132560, "epoch": 3156} {"train_loss": -6.656463146209717, "global_step": 132561, "epoch": 3156} {"train_loss": -6.677422046661377, "global_step": 132562, "epoch": 3156} {"train_loss": -6.690532684326172, "global_step": 132563, "epoch": 3156} {"train_loss": -6.6072282791137695, "global_step": 132564, "epoch": 3156} {"train_loss": -6.596560955047607, "global_step": 132565, "epoch": 3156} {"train_loss": -6.676862716674805, "global_step": 132566, "epoch": 3156} {"train_loss": -6.665077209472656, "global_step": 132567, "epoch": 3156} {"train_loss": -6.701026439666748, "global_step": 132568, "epoch": 3156} {"train_loss": -6.665071964263916, "global_step": 132569, "epoch": 3156} {"train_loss": -6.693065166473389, "global_step": 132570, "epoch": 3156} {"train_loss": -6.725940704345703, "global_step": 132571, "epoch": 3156} {"train_loss": -6.6980390548706055, "global_step": 132572, "epoch": 3156} {"train_loss": -6.785429954528809, "global_step": 132573, "epoch": 3156} {"train_loss": -6.693099498748779, "global_step": 132574, "epoch": 3156} {"train_loss": -6.7750749588012695, "global_step": 132575, "epoch": 3156} {"train_loss": -6.737238883972168, "global_step": 132576, "epoch": 3156} {"train_loss": -6.690859794616699, "global_step": 132577, "epoch": 3156} {"train_loss": -6.71113395690918, "global_step": 132578, "epoch": 3156} {"train_loss": -6.68452262878418, "global_step": 132579, "epoch": 3156} {"train_loss": -6.679331302642822, "global_step": 132580, "epoch": 3156} {"train_loss": -6.668333530426025, "global_step": 132581, "epoch": 3156} {"train_loss": -6.8248748779296875, "global_step": 132582, "epoch": 3156} {"train_loss": -6.886346817016602, "global_step": 132583, "epoch": 3156} {"train_loss": -6.615350723266602, "global_step": 132584, "epoch": 3156} {"train_loss": -6.703518867492676, "global_step": 132585, "epoch": 3156} {"train_loss": -6.799554347991943, "global_step": 132586, "epoch": 3156} {"train_loss": -6.828721046447754, "global_step": 132587, "epoch": 3156} {"train_loss": -6.674038887023926, "global_step": 132588, "epoch": 3156} {"train_loss": -6.6942338943481445, "global_step": 132589, "epoch": 3156} {"train_loss": -6.801319599151611, "global_step": 132590, "epoch": 3156} {"train_loss": -6.660135269165039, "global_step": 132591, "epoch": 3156} {"train_loss": -6.665810585021973, "global_step": 132592, "epoch": 3156} {"train_loss": -6.702196711585636, "global_step": 132593, "epoch": 3156, "val_loss": 66737.1796875} {"train_loss": -6.782679080963135, "global_step": 132594, "epoch": 3157} {"train_loss": -6.761302947998047, "global_step": 132595, "epoch": 3157} {"train_loss": -6.694973945617676, "global_step": 132596, "epoch": 3157} {"train_loss": -6.75665807723999, "global_step": 132597, "epoch": 3157} {"train_loss": -6.649930000305176, "global_step": 132598, "epoch": 3157} {"train_loss": -6.656084060668945, "global_step": 132599, "epoch": 3157} {"train_loss": -6.833035945892334, "global_step": 132600, "epoch": 3157} {"train_loss": -6.736793518066406, "global_step": 132601, "epoch": 3157} {"train_loss": -6.7675580978393555, "global_step": 132602, "epoch": 3157} {"train_loss": -6.772716999053955, "global_step": 132603, "epoch": 3157} {"train_loss": -6.741628646850586, "global_step": 132604, "epoch": 3157} {"train_loss": -6.741035461425781, "global_step": 132605, "epoch": 3157} {"train_loss": -6.656426429748535, "global_step": 132606, "epoch": 3157} {"train_loss": -6.757340431213379, "global_step": 132607, "epoch": 3157} {"train_loss": -6.754993438720703, "global_step": 132608, "epoch": 3157} {"train_loss": -6.825361251831055, "global_step": 132609, "epoch": 3157} {"train_loss": -6.663003444671631, "global_step": 132610, "epoch": 3157} {"train_loss": -6.669710636138916, "global_step": 132611, "epoch": 3157} {"train_loss": -6.7171630859375, "global_step": 132612, "epoch": 3157} {"train_loss": -6.7683515548706055, "global_step": 132613, "epoch": 3157} {"train_loss": -6.70180082321167, "global_step": 132614, "epoch": 3157} {"train_loss": -6.788910388946533, "global_step": 132615, "epoch": 3157} {"train_loss": -6.686368942260742, "global_step": 132616, "epoch": 3157} {"train_loss": -6.712088584899902, "global_step": 132617, "epoch": 3157} {"train_loss": -6.72114372253418, "global_step": 132618, "epoch": 3157} {"train_loss": -6.772983551025391, "global_step": 132619, "epoch": 3157} {"train_loss": -6.650887966156006, "global_step": 132620, "epoch": 3157} {"train_loss": -6.641993999481201, "global_step": 132621, "epoch": 3157} {"train_loss": -6.686380386352539, "global_step": 132622, "epoch": 3157} {"train_loss": -6.6729888916015625, "global_step": 132623, "epoch": 3157} {"train_loss": -6.578508377075195, "global_step": 132624, "epoch": 3157} {"train_loss": -6.619361877441406, "global_step": 132625, "epoch": 3157} {"train_loss": -6.709904670715332, "global_step": 132626, "epoch": 3157} {"train_loss": -6.6324262619018555, "global_step": 132627, "epoch": 3157} {"train_loss": -6.725189208984375, "global_step": 132628, "epoch": 3157} {"train_loss": -6.621728420257568, "global_step": 132629, "epoch": 3157} {"train_loss": -6.803256511688232, "global_step": 132630, "epoch": 3157} {"train_loss": -6.63884162902832, "global_step": 132631, "epoch": 3157} {"train_loss": -6.659079551696777, "global_step": 132632, "epoch": 3157} {"train_loss": -6.688048839569092, "global_step": 132633, "epoch": 3157} {"train_loss": -6.594694137573242, "global_step": 132634, "epoch": 3157} {"train_loss": -6.704615854081654, "global_step": 132635, "epoch": 3157, "val_loss": 66791.6015625} {"train_loss": -6.666603088378906, "global_step": 132636, "epoch": 3158} {"train_loss": -6.785143852233887, "global_step": 132637, "epoch": 3158} {"train_loss": -6.629708290100098, "global_step": 132638, "epoch": 3158} {"train_loss": -6.744435787200928, "global_step": 132639, "epoch": 3158} {"train_loss": -6.769410610198975, "global_step": 132640, "epoch": 3158} {"train_loss": -6.595145225524902, "global_step": 132641, "epoch": 3158} {"train_loss": -6.776912212371826, "global_step": 132642, "epoch": 3158} {"train_loss": -6.692564487457275, "global_step": 132643, "epoch": 3158} {"train_loss": -6.673582553863525, "global_step": 132644, "epoch": 3158} {"train_loss": -6.664497375488281, "global_step": 132645, "epoch": 3158} {"train_loss": -6.636569023132324, "global_step": 132646, "epoch": 3158} {"train_loss": -6.611342430114746, "global_step": 132647, "epoch": 3158} {"train_loss": -6.657582759857178, "global_step": 132648, "epoch": 3158} {"train_loss": -6.664138317108154, "global_step": 132649, "epoch": 3158} {"train_loss": -6.542912483215332, "global_step": 132650, "epoch": 3158} {"train_loss": -6.804813861846924, "global_step": 132651, "epoch": 3158} {"train_loss": -6.734703063964844, "global_step": 132652, "epoch": 3158} {"train_loss": -6.597151756286621, "global_step": 132653, "epoch": 3158} {"train_loss": -6.581547737121582, "global_step": 132654, "epoch": 3158} {"train_loss": -6.751655578613281, "global_step": 132655, "epoch": 3158} {"train_loss": -6.5063557624816895, "global_step": 132656, "epoch": 3158} {"train_loss": -6.697402477264404, "global_step": 132657, "epoch": 3158} {"train_loss": -6.741396903991699, "global_step": 132658, "epoch": 3158} {"train_loss": -6.67811393737793, "global_step": 132659, "epoch": 3158} {"train_loss": -6.641508102416992, "global_step": 132660, "epoch": 3158} {"train_loss": -6.737266540527344, "global_step": 132661, "epoch": 3158} {"train_loss": -6.671605110168457, "global_step": 132662, "epoch": 3158} {"train_loss": -6.717426776885986, "global_step": 132663, "epoch": 3158} {"train_loss": -6.66124153137207, "global_step": 132664, "epoch": 3158} {"train_loss": -6.690656661987305, "global_step": 132665, "epoch": 3158} {"train_loss": -6.620502471923828, "global_step": 132666, "epoch": 3158} {"train_loss": -6.781385898590088, "global_step": 132667, "epoch": 3158} {"train_loss": -6.693994522094727, "global_step": 132668, "epoch": 3158} {"train_loss": -6.686802387237549, "global_step": 132669, "epoch": 3158} {"train_loss": -6.75694465637207, "global_step": 132670, "epoch": 3158} {"train_loss": -6.675867557525635, "global_step": 132671, "epoch": 3158} {"train_loss": -6.7315263748168945, "global_step": 132672, "epoch": 3158} {"train_loss": -6.701851844787598, "global_step": 132673, "epoch": 3158} {"train_loss": -6.676252841949463, "global_step": 132674, "epoch": 3158} {"train_loss": -6.744177341461182, "global_step": 132675, "epoch": 3158} {"train_loss": -6.764195442199707, "global_step": 132676, "epoch": 3158} {"train_loss": -6.689188696089245, "global_step": 132677, "epoch": 3158, "val_loss": 66623.5390625} {"train_loss": -6.745895862579346, "global_step": 132678, "epoch": 3159} {"train_loss": -6.618498802185059, "global_step": 132679, "epoch": 3159} {"train_loss": -6.722437858581543, "global_step": 132680, "epoch": 3159} {"train_loss": -6.609883785247803, "global_step": 132681, "epoch": 3159} {"train_loss": -6.711804389953613, "global_step": 132682, "epoch": 3159} {"train_loss": -6.662409782409668, "global_step": 132683, "epoch": 3159} {"train_loss": -6.708617210388184, "global_step": 132684, "epoch": 3159} {"train_loss": -6.48099422454834, "global_step": 132685, "epoch": 3159} {"train_loss": -6.588137149810791, "global_step": 132686, "epoch": 3159} {"train_loss": -6.526450157165527, "global_step": 132687, "epoch": 3159} {"train_loss": -6.493768215179443, "global_step": 132688, "epoch": 3159} {"train_loss": -6.587125778198242, "global_step": 132689, "epoch": 3159} {"train_loss": -6.608147144317627, "global_step": 132690, "epoch": 3159} {"train_loss": -6.6563262939453125, "global_step": 132691, "epoch": 3159} {"train_loss": -6.460322856903076, "global_step": 132692, "epoch": 3159} {"train_loss": -6.655224800109863, "global_step": 132693, "epoch": 3159} {"train_loss": -6.639631271362305, "global_step": 132694, "epoch": 3159} {"train_loss": -6.577280044555664, "global_step": 132695, "epoch": 3159} {"train_loss": -6.521721839904785, "global_step": 132696, "epoch": 3159} {"train_loss": -6.6127800941467285, "global_step": 132697, "epoch": 3159} {"train_loss": -6.638166427612305, "global_step": 132698, "epoch": 3159} {"train_loss": -6.53231143951416, "global_step": 132699, "epoch": 3159} {"train_loss": -6.659411430358887, "global_step": 132700, "epoch": 3159} {"train_loss": -6.551204204559326, "global_step": 132701, "epoch": 3159} {"train_loss": -6.645626544952393, "global_step": 132702, "epoch": 3159} {"train_loss": -6.671083927154541, "global_step": 132703, "epoch": 3159} {"train_loss": -6.668025970458984, "global_step": 132704, "epoch": 3159} {"train_loss": -6.698943138122559, "global_step": 132705, "epoch": 3159} {"train_loss": -6.677818775177002, "global_step": 132706, "epoch": 3159} {"train_loss": -6.590096473693848, "global_step": 132707, "epoch": 3159} {"train_loss": -6.7605133056640625, "global_step": 132708, "epoch": 3159} {"train_loss": -6.630881309509277, "global_step": 132709, "epoch": 3159} {"train_loss": -6.808646202087402, "global_step": 132710, "epoch": 3159} {"train_loss": -6.705496311187744, "global_step": 132711, "epoch": 3159} {"train_loss": -6.595585823059082, "global_step": 132712, "epoch": 3159} {"train_loss": -6.630341529846191, "global_step": 132713, "epoch": 3159} {"train_loss": -6.718790054321289, "global_step": 132714, "epoch": 3159} {"train_loss": -6.660734176635742, "global_step": 132715, "epoch": 3159} {"train_loss": -6.717220306396484, "global_step": 132716, "epoch": 3159} {"train_loss": -6.670135498046875, "global_step": 132717, "epoch": 3159} {"train_loss": -6.707162380218506, "global_step": 132718, "epoch": 3159} {"train_loss": -6.638165394465129, "global_step": 132719, "epoch": 3159, "val_loss": 66903.9140625} {"train_loss": -6.684033393859863, "global_step": 132720, "epoch": 3160} {"train_loss": -6.618044376373291, "global_step": 132721, "epoch": 3160} {"train_loss": -6.6718549728393555, "global_step": 132722, "epoch": 3160} {"train_loss": -6.72528600692749, "global_step": 132723, "epoch": 3160} {"train_loss": -6.711605072021484, "global_step": 132724, "epoch": 3160} {"train_loss": -6.768795013427734, "global_step": 132725, "epoch": 3160} {"train_loss": -6.632193565368652, "global_step": 132726, "epoch": 3160} {"train_loss": -6.755108833312988, "global_step": 132727, "epoch": 3160} {"train_loss": -6.6747145652771, "global_step": 132728, "epoch": 3160} {"train_loss": -6.658940315246582, "global_step": 132729, "epoch": 3160} {"train_loss": -6.773709297180176, "global_step": 132730, "epoch": 3160} {"train_loss": -6.681055545806885, "global_step": 132731, "epoch": 3160} {"train_loss": -6.543988227844238, "global_step": 132732, "epoch": 3160} {"train_loss": -6.641931533813477, "global_step": 132733, "epoch": 3160} {"train_loss": -6.642739295959473, "global_step": 132734, "epoch": 3160} {"train_loss": -6.67254638671875, "global_step": 132735, "epoch": 3160} {"train_loss": -6.663922309875488, "global_step": 132736, "epoch": 3160} {"train_loss": -6.696442127227783, "global_step": 132737, "epoch": 3160} {"train_loss": -6.625839710235596, "global_step": 132738, "epoch": 3160} {"train_loss": -6.664582252502441, "global_step": 132739, "epoch": 3160} {"train_loss": -6.591789245605469, "global_step": 132740, "epoch": 3160} {"train_loss": -6.596634864807129, "global_step": 132741, "epoch": 3160} {"train_loss": -6.693208694458008, "global_step": 132742, "epoch": 3160} {"train_loss": -6.6085004806518555, "global_step": 132743, "epoch": 3160} {"train_loss": -6.603890419006348, "global_step": 132744, "epoch": 3160} {"train_loss": -6.6169586181640625, "global_step": 132745, "epoch": 3160} {"train_loss": -6.659157752990723, "global_step": 132746, "epoch": 3160} {"train_loss": -6.619122505187988, "global_step": 132747, "epoch": 3160} {"train_loss": -6.701241493225098, "global_step": 132748, "epoch": 3160} {"train_loss": -6.79782772064209, "global_step": 132749, "epoch": 3160} {"train_loss": -6.604934215545654, "global_step": 132750, "epoch": 3160} {"train_loss": -6.628103256225586, "global_step": 132751, "epoch": 3160} {"train_loss": -6.674674987792969, "global_step": 132752, "epoch": 3160} {"train_loss": -6.686818599700928, "global_step": 132753, "epoch": 3160} {"train_loss": -6.720096588134766, "global_step": 132754, "epoch": 3160} {"train_loss": -6.687510013580322, "global_step": 132755, "epoch": 3160} {"train_loss": -6.701191425323486, "global_step": 132756, "epoch": 3160} {"train_loss": -6.66313362121582, "global_step": 132757, "epoch": 3160} {"train_loss": -6.661639213562012, "global_step": 132758, "epoch": 3160} {"train_loss": -6.681517601013184, "global_step": 132759, "epoch": 3160} {"train_loss": -6.66480016708374, "global_step": 132760, "epoch": 3160} {"train_loss": -6.666740156355358, "global_step": 132761, "epoch": 3160, "val_loss": 66667.9375} {"train_loss": -6.766474723815918, "global_step": 132762, "epoch": 3161} {"train_loss": -6.719902992248535, "global_step": 132763, "epoch": 3161} {"train_loss": -6.674468040466309, "global_step": 132764, "epoch": 3161} {"train_loss": -6.7712225914001465, "global_step": 132765, "epoch": 3161} {"train_loss": -6.634272575378418, "global_step": 132766, "epoch": 3161} {"train_loss": -6.681766033172607, "global_step": 132767, "epoch": 3161} {"train_loss": -6.674299716949463, "global_step": 132768, "epoch": 3161} {"train_loss": -6.698420524597168, "global_step": 132769, "epoch": 3161} {"train_loss": -6.590826511383057, "global_step": 132770, "epoch": 3161} {"train_loss": -6.753314971923828, "global_step": 132771, "epoch": 3161} {"train_loss": -6.611606597900391, "global_step": 132772, "epoch": 3161} {"train_loss": -6.48972225189209, "global_step": 132773, "epoch": 3161} {"train_loss": -6.691580772399902, "global_step": 132774, "epoch": 3161} {"train_loss": -6.572145462036133, "global_step": 132775, "epoch": 3161} {"train_loss": -6.680172443389893, "global_step": 132776, "epoch": 3161} {"train_loss": -6.617807865142822, "global_step": 132777, "epoch": 3161} {"train_loss": -6.659992694854736, "global_step": 132778, "epoch": 3161} {"train_loss": -6.724362373352051, "global_step": 132779, "epoch": 3161} {"train_loss": -6.698313236236572, "global_step": 132780, "epoch": 3161} {"train_loss": -6.6441497802734375, "global_step": 132781, "epoch": 3161} {"train_loss": -6.774908065795898, "global_step": 132782, "epoch": 3161} {"train_loss": -6.64781379699707, "global_step": 132783, "epoch": 3161} {"train_loss": -6.694272041320801, "global_step": 132784, "epoch": 3161} {"train_loss": -6.7843017578125, "global_step": 132785, "epoch": 3161} {"train_loss": -6.707275390625, "global_step": 132786, "epoch": 3161} {"train_loss": -6.7445831298828125, "global_step": 132787, "epoch": 3161} {"train_loss": -6.7045392990112305, "global_step": 132788, "epoch": 3161} {"train_loss": -6.700268745422363, "global_step": 132789, "epoch": 3161} {"train_loss": -6.796377182006836, "global_step": 132790, "epoch": 3161} {"train_loss": -6.693950653076172, "global_step": 132791, "epoch": 3161} {"train_loss": -6.778253078460693, "global_step": 132792, "epoch": 3161} {"train_loss": -6.710991859436035, "global_step": 132793, "epoch": 3161} {"train_loss": -6.637548446655273, "global_step": 132794, "epoch": 3161} {"train_loss": -6.666050910949707, "global_step": 132795, "epoch": 3161} {"train_loss": -6.6738691329956055, "global_step": 132796, "epoch": 3161} {"train_loss": -6.693789482116699, "global_step": 132797, "epoch": 3161} {"train_loss": -6.644620895385742, "global_step": 132798, "epoch": 3161} {"train_loss": -6.783465385437012, "global_step": 132799, "epoch": 3161} {"train_loss": -6.731327056884766, "global_step": 132800, "epoch": 3161} {"train_loss": -6.69647216796875, "global_step": 132801, "epoch": 3161} {"train_loss": -6.755489349365234, "global_step": 132802, "epoch": 3161} {"train_loss": -6.694025493803478, "global_step": 132803, "epoch": 3161, "val_loss": 66633.109375} {"train_loss": -6.673521041870117, "global_step": 132804, "epoch": 3162} {"train_loss": -6.680936813354492, "global_step": 132805, "epoch": 3162} {"train_loss": -6.691884994506836, "global_step": 132806, "epoch": 3162} {"train_loss": -6.7874956130981445, "global_step": 132807, "epoch": 3162} {"train_loss": -6.847548484802246, "global_step": 132808, "epoch": 3162} {"train_loss": -6.684822082519531, "global_step": 132809, "epoch": 3162} {"train_loss": -6.7891364097595215, "global_step": 132810, "epoch": 3162} {"train_loss": -6.765787124633789, "global_step": 132811, "epoch": 3162} {"train_loss": -6.607346534729004, "global_step": 132812, "epoch": 3162} {"train_loss": -6.7650299072265625, "global_step": 132813, "epoch": 3162} {"train_loss": -6.84644079208374, "global_step": 132814, "epoch": 3162} {"train_loss": -6.746716022491455, "global_step": 132815, "epoch": 3162} {"train_loss": -6.639928817749023, "global_step": 132816, "epoch": 3162} {"train_loss": -6.6595458984375, "global_step": 132817, "epoch": 3162} {"train_loss": -6.7448883056640625, "global_step": 132818, "epoch": 3162} {"train_loss": -6.625151634216309, "global_step": 132819, "epoch": 3162} {"train_loss": -6.713156223297119, "global_step": 132820, "epoch": 3162} {"train_loss": -6.690969467163086, "global_step": 132821, "epoch": 3162} {"train_loss": -6.6155571937561035, "global_step": 132822, "epoch": 3162} {"train_loss": -6.759150505065918, "global_step": 132823, "epoch": 3162} {"train_loss": -6.586517810821533, "global_step": 132824, "epoch": 3162} {"train_loss": -6.731581687927246, "global_step": 132825, "epoch": 3162} {"train_loss": -6.703427314758301, "global_step": 132826, "epoch": 3162} {"train_loss": -6.687458038330078, "global_step": 132827, "epoch": 3162} {"train_loss": -6.655499458312988, "global_step": 132828, "epoch": 3162} {"train_loss": -6.850175857543945, "global_step": 132829, "epoch": 3162} {"train_loss": -6.736051559448242, "global_step": 132830, "epoch": 3162} {"train_loss": -6.688342094421387, "global_step": 132831, "epoch": 3162} {"train_loss": -6.622525215148926, "global_step": 132832, "epoch": 3162} {"train_loss": -6.598227024078369, "global_step": 132833, "epoch": 3162} {"train_loss": -6.748248100280762, "global_step": 132834, "epoch": 3162} {"train_loss": -6.712912559509277, "global_step": 132835, "epoch": 3162} {"train_loss": -6.675591945648193, "global_step": 132836, "epoch": 3162} {"train_loss": -6.652123928070068, "global_step": 132837, "epoch": 3162} {"train_loss": -6.665182113647461, "global_step": 132838, "epoch": 3162} {"train_loss": -6.639519691467285, "global_step": 132839, "epoch": 3162} {"train_loss": -6.777657985687256, "global_step": 132840, "epoch": 3162} {"train_loss": -6.770687580108643, "global_step": 132841, "epoch": 3162} {"train_loss": -6.593594074249268, "global_step": 132842, "epoch": 3162} {"train_loss": -6.698627948760986, "global_step": 132843, "epoch": 3162} {"train_loss": -6.798837184906006, "global_step": 132844, "epoch": 3162} {"train_loss": -6.707866066978092, "global_step": 132845, "epoch": 3162, "val_loss": 66594.265625} {"train_loss": -6.707821369171143, "global_step": 132846, "epoch": 3163} {"train_loss": -6.713417053222656, "global_step": 132847, "epoch": 3163} {"train_loss": -6.715734004974365, "global_step": 132848, "epoch": 3163} {"train_loss": -6.775888442993164, "global_step": 132849, "epoch": 3163} {"train_loss": -6.7019805908203125, "global_step": 132850, "epoch": 3163} {"train_loss": -6.726100921630859, "global_step": 132851, "epoch": 3163} {"train_loss": -6.836966514587402, "global_step": 132852, "epoch": 3163} {"train_loss": -6.674022674560547, "global_step": 132853, "epoch": 3163} {"train_loss": -6.737392425537109, "global_step": 132854, "epoch": 3163} {"train_loss": -6.67633056640625, "global_step": 132855, "epoch": 3163} {"train_loss": -6.624595642089844, "global_step": 132856, "epoch": 3163} {"train_loss": -6.602957725524902, "global_step": 132857, "epoch": 3163} {"train_loss": -6.666455268859863, "global_step": 132858, "epoch": 3163} {"train_loss": -6.670450210571289, "global_step": 132859, "epoch": 3163} {"train_loss": -6.60938835144043, "global_step": 132860, "epoch": 3163} {"train_loss": -6.771598815917969, "global_step": 132861, "epoch": 3163} {"train_loss": -6.6844162940979, "global_step": 132862, "epoch": 3163} {"train_loss": -6.630403518676758, "global_step": 132863, "epoch": 3163} {"train_loss": -6.724420547485352, "global_step": 132864, "epoch": 3163} {"train_loss": -6.450423717498779, "global_step": 132865, "epoch": 3163} {"train_loss": -6.583803176879883, "global_step": 132866, "epoch": 3163} {"train_loss": -6.627884864807129, "global_step": 132867, "epoch": 3163} {"train_loss": -6.507843971252441, "global_step": 132868, "epoch": 3163} {"train_loss": -6.68733024597168, "global_step": 132869, "epoch": 3163} {"train_loss": -6.620269775390625, "global_step": 132870, "epoch": 3163} {"train_loss": -6.597492694854736, "global_step": 132871, "epoch": 3163} {"train_loss": -6.65048360824585, "global_step": 132872, "epoch": 3163} {"train_loss": -6.526829719543457, "global_step": 132873, "epoch": 3163} {"train_loss": -6.65151834487915, "global_step": 132874, "epoch": 3163} {"train_loss": -6.635721206665039, "global_step": 132875, "epoch": 3163} {"train_loss": -6.702600955963135, "global_step": 132876, "epoch": 3163} {"train_loss": -6.655214786529541, "global_step": 132877, "epoch": 3163} {"train_loss": -6.681605815887451, "global_step": 132878, "epoch": 3163} {"train_loss": -6.652857780456543, "global_step": 132879, "epoch": 3163} {"train_loss": -6.727609634399414, "global_step": 132880, "epoch": 3163} {"train_loss": -6.759706974029541, "global_step": 132881, "epoch": 3163} {"train_loss": -6.716022968292236, "global_step": 132882, "epoch": 3163} {"train_loss": -6.684144496917725, "global_step": 132883, "epoch": 3163} {"train_loss": -6.7286057472229, "global_step": 132884, "epoch": 3163} {"train_loss": -6.838441848754883, "global_step": 132885, "epoch": 3163} {"train_loss": -6.697656631469727, "global_step": 132886, "epoch": 3163} {"train_loss": -6.673855202538626, "global_step": 132887, "epoch": 3163, "val_loss": 66528.2109375} {"train_loss": -6.754422664642334, "global_step": 132888, "epoch": 3164} {"train_loss": -6.726419925689697, "global_step": 132889, "epoch": 3164} {"train_loss": -6.659072399139404, "global_step": 132890, "epoch": 3164} {"train_loss": -6.834197044372559, "global_step": 132891, "epoch": 3164} {"train_loss": -6.647448539733887, "global_step": 132892, "epoch": 3164} {"train_loss": -6.744653701782227, "global_step": 132893, "epoch": 3164} {"train_loss": -6.777431488037109, "global_step": 132894, "epoch": 3164} {"train_loss": -6.630780220031738, "global_step": 132895, "epoch": 3164} {"train_loss": -6.7221879959106445, "global_step": 132896, "epoch": 3164} {"train_loss": -6.730381011962891, "global_step": 132897, "epoch": 3164} {"train_loss": -6.765896797180176, "global_step": 132898, "epoch": 3164} {"train_loss": -6.771332740783691, "global_step": 132899, "epoch": 3164} {"train_loss": -6.739980697631836, "global_step": 132900, "epoch": 3164} {"train_loss": -6.736939907073975, "global_step": 132901, "epoch": 3164} {"train_loss": -6.710824012756348, "global_step": 132902, "epoch": 3164} {"train_loss": -6.841706275939941, "global_step": 132903, "epoch": 3164} {"train_loss": -6.590032577514648, "global_step": 132904, "epoch": 3164} {"train_loss": -6.667912483215332, "global_step": 132905, "epoch": 3164} {"train_loss": -6.697887420654297, "global_step": 132906, "epoch": 3164} {"train_loss": -6.7890706062316895, "global_step": 132907, "epoch": 3164} {"train_loss": -6.71586799621582, "global_step": 132908, "epoch": 3164} {"train_loss": -6.743372917175293, "global_step": 132909, "epoch": 3164} {"train_loss": -6.659615516662598, "global_step": 132910, "epoch": 3164} {"train_loss": -6.52582311630249, "global_step": 132911, "epoch": 3164} {"train_loss": -6.644065856933594, "global_step": 132912, "epoch": 3164} {"train_loss": -6.6263837814331055, "global_step": 132913, "epoch": 3164} {"train_loss": -6.704878330230713, "global_step": 132914, "epoch": 3164} {"train_loss": -6.700953483581543, "global_step": 132915, "epoch": 3164} {"train_loss": -6.598295211791992, "global_step": 132916, "epoch": 3164} {"train_loss": -6.641557693481445, "global_step": 132917, "epoch": 3164} {"train_loss": -6.721161842346191, "global_step": 132918, "epoch": 3164} {"train_loss": -6.673172950744629, "global_step": 132919, "epoch": 3164} {"train_loss": -6.510834693908691, "global_step": 132920, "epoch": 3164} {"train_loss": -6.6996307373046875, "global_step": 132921, "epoch": 3164} {"train_loss": -6.630057334899902, "global_step": 132922, "epoch": 3164} {"train_loss": -6.626744747161865, "global_step": 132923, "epoch": 3164} {"train_loss": -6.6644792556762695, "global_step": 132924, "epoch": 3164} {"train_loss": -6.7012224197387695, "global_step": 132925, "epoch": 3164} {"train_loss": -6.761534214019775, "global_step": 132926, "epoch": 3164} {"train_loss": -6.670900344848633, "global_step": 132927, "epoch": 3164} {"train_loss": -6.585134506225586, "global_step": 132928, "epoch": 3164} {"train_loss": -6.692835875919887, "global_step": 132929, "epoch": 3164, "val_loss": 67073.0078125} {"train_loss": -6.6367411613464355, "global_step": 132930, "epoch": 3165} {"train_loss": -6.640594005584717, "global_step": 132931, "epoch": 3165} {"train_loss": -6.697148323059082, "global_step": 132932, "epoch": 3165} {"train_loss": -6.615844249725342, "global_step": 132933, "epoch": 3165} {"train_loss": -6.689659118652344, "global_step": 132934, "epoch": 3165} {"train_loss": -6.7195844650268555, "global_step": 132935, "epoch": 3165} {"train_loss": -6.753487586975098, "global_step": 132936, "epoch": 3165} {"train_loss": -6.713944435119629, "global_step": 132937, "epoch": 3165} {"train_loss": -6.649377346038818, "global_step": 132938, "epoch": 3165} {"train_loss": -6.78568696975708, "global_step": 132939, "epoch": 3165} {"train_loss": -6.654033660888672, "global_step": 132940, "epoch": 3165} {"train_loss": -6.741455078125, "global_step": 132941, "epoch": 3165} {"train_loss": -6.677876949310303, "global_step": 132942, "epoch": 3165} {"train_loss": -6.659502029418945, "global_step": 132943, "epoch": 3165} {"train_loss": -6.769500732421875, "global_step": 132944, "epoch": 3165} {"train_loss": -6.812005043029785, "global_step": 132945, "epoch": 3165} {"train_loss": -6.780389785766602, "global_step": 132946, "epoch": 3165} {"train_loss": -6.753342151641846, "global_step": 132947, "epoch": 3165} {"train_loss": -6.662385940551758, "global_step": 132948, "epoch": 3165} {"train_loss": -6.761935234069824, "global_step": 132949, "epoch": 3165} {"train_loss": -6.682461261749268, "global_step": 132950, "epoch": 3165} {"train_loss": -6.689833641052246, "global_step": 132951, "epoch": 3165} {"train_loss": -6.726073265075684, "global_step": 132952, "epoch": 3165} {"train_loss": -6.701866149902344, "global_step": 132953, "epoch": 3165} {"train_loss": -6.734982490539551, "global_step": 132954, "epoch": 3165} {"train_loss": -6.77119255065918, "global_step": 132955, "epoch": 3165} {"train_loss": -6.581071853637695, "global_step": 132956, "epoch": 3165} {"train_loss": -6.61228609085083, "global_step": 132957, "epoch": 3165} {"train_loss": -6.6715779304504395, "global_step": 132958, "epoch": 3165} {"train_loss": -6.460312843322754, "global_step": 132959, "epoch": 3165} {"train_loss": -6.785747528076172, "global_step": 132960, "epoch": 3165} {"train_loss": -6.6920084953308105, "global_step": 132961, "epoch": 3165} {"train_loss": -6.634904861450195, "global_step": 132962, "epoch": 3165} {"train_loss": -6.716317653656006, "global_step": 132963, "epoch": 3165} {"train_loss": -6.648862361907959, "global_step": 132964, "epoch": 3165} {"train_loss": -6.616683006286621, "global_step": 132965, "epoch": 3165} {"train_loss": -6.705155372619629, "global_step": 132966, "epoch": 3165} {"train_loss": -6.672604560852051, "global_step": 132967, "epoch": 3165} {"train_loss": -6.572127342224121, "global_step": 132968, "epoch": 3165} {"train_loss": -6.706643104553223, "global_step": 132969, "epoch": 3165} {"train_loss": -6.522619247436523, "global_step": 132970, "epoch": 3165} {"train_loss": -6.68275507291158, "global_step": 132971, "epoch": 3165, "val_loss": 66629.015625} {"train_loss": -6.671756267547607, "global_step": 132972, "epoch": 3166} {"train_loss": -6.565435409545898, "global_step": 132973, "epoch": 3166} {"train_loss": -6.614752769470215, "global_step": 132974, "epoch": 3166} {"train_loss": -6.704367160797119, "global_step": 132975, "epoch": 3166} {"train_loss": -6.674644470214844, "global_step": 132976, "epoch": 3166} {"train_loss": -6.737577438354492, "global_step": 132977, "epoch": 3166} {"train_loss": -6.531929016113281, "global_step": 132978, "epoch": 3166} {"train_loss": -6.612937927246094, "global_step": 132979, "epoch": 3166} {"train_loss": -6.674323081970215, "global_step": 132980, "epoch": 3166} {"train_loss": -6.723849296569824, "global_step": 132981, "epoch": 3166} {"train_loss": -6.642550468444824, "global_step": 132982, "epoch": 3166} {"train_loss": -6.669081211090088, "global_step": 132983, "epoch": 3166} {"train_loss": -6.668061256408691, "global_step": 132984, "epoch": 3166} {"train_loss": -6.677334308624268, "global_step": 132985, "epoch": 3166} {"train_loss": -6.624048233032227, "global_step": 132986, "epoch": 3166} {"train_loss": -6.724514007568359, "global_step": 132987, "epoch": 3166} {"train_loss": -6.637372016906738, "global_step": 132988, "epoch": 3166} {"train_loss": -6.696294784545898, "global_step": 132989, "epoch": 3166} {"train_loss": -6.748385429382324, "global_step": 132990, "epoch": 3166} {"train_loss": -6.668314456939697, "global_step": 132991, "epoch": 3166} {"train_loss": -6.68891716003418, "global_step": 132992, "epoch": 3166} {"train_loss": -6.7782135009765625, "global_step": 132993, "epoch": 3166} {"train_loss": -6.643768787384033, "global_step": 132994, "epoch": 3166} {"train_loss": -6.644223690032959, "global_step": 132995, "epoch": 3166} {"train_loss": -6.67038631439209, "global_step": 132996, "epoch": 3166} {"train_loss": -6.4991326332092285, "global_step": 132997, "epoch": 3166} {"train_loss": -6.842963218688965, "global_step": 132998, "epoch": 3166} {"train_loss": -6.708361625671387, "global_step": 132999, "epoch": 3166} {"train_loss": -6.535769462585449, "global_step": 133000, "epoch": 3166} {"train_loss": -6.60656213760376, "global_step": 133001, "epoch": 3166} {"train_loss": -6.574202537536621, "global_step": 133002, "epoch": 3166} {"train_loss": -6.526551723480225, "global_step": 133003, "epoch": 3166} {"train_loss": -6.62165641784668, "global_step": 133004, "epoch": 3166} {"train_loss": -6.567718505859375, "global_step": 133005, "epoch": 3166} {"train_loss": -6.610958576202393, "global_step": 133006, "epoch": 3166} {"train_loss": -6.483341693878174, "global_step": 133007, "epoch": 3166} {"train_loss": -6.632425308227539, "global_step": 133008, "epoch": 3166} {"train_loss": -6.592114448547363, "global_step": 133009, "epoch": 3166} {"train_loss": -6.699566841125488, "global_step": 133010, "epoch": 3166} {"train_loss": -6.765345573425293, "global_step": 133011, "epoch": 3166} {"train_loss": -6.6746392250061035, "global_step": 133012, "epoch": 3166} {"train_loss": -6.648232039951143, "global_step": 133013, "epoch": 3166, "val_loss": 66883.0625} {"train_loss": -6.683682441711426, "global_step": 133014, "epoch": 3167} {"train_loss": -6.713878154754639, "global_step": 133015, "epoch": 3167} {"train_loss": -6.585391998291016, "global_step": 133016, "epoch": 3167} {"train_loss": -6.629204750061035, "global_step": 133017, "epoch": 3167} {"train_loss": -6.6728010177612305, "global_step": 133018, "epoch": 3167} {"train_loss": -6.658330917358398, "global_step": 133019, "epoch": 3167} {"train_loss": -6.644471168518066, "global_step": 133020, "epoch": 3167} {"train_loss": -6.630769729614258, "global_step": 133021, "epoch": 3167} {"train_loss": -6.656113147735596, "global_step": 133022, "epoch": 3167} {"train_loss": -6.65972900390625, "global_step": 133023, "epoch": 3167} {"train_loss": -6.648888111114502, "global_step": 133024, "epoch": 3167} {"train_loss": -6.556488990783691, "global_step": 133025, "epoch": 3167} {"train_loss": -6.702548503875732, "global_step": 133026, "epoch": 3167} {"train_loss": -6.55778694152832, "global_step": 133027, "epoch": 3167} {"train_loss": -6.737881660461426, "global_step": 133028, "epoch": 3167} {"train_loss": -6.588397979736328, "global_step": 133029, "epoch": 3167} {"train_loss": -6.651482582092285, "global_step": 133030, "epoch": 3167} {"train_loss": -6.700280666351318, "global_step": 133031, "epoch": 3167} {"train_loss": -6.772727012634277, "global_step": 133032, "epoch": 3167} {"train_loss": -6.711187362670898, "global_step": 133033, "epoch": 3167} {"train_loss": -6.682730674743652, "global_step": 133034, "epoch": 3167} {"train_loss": -6.755249977111816, "global_step": 133035, "epoch": 3167} {"train_loss": -6.62294864654541, "global_step": 133036, "epoch": 3167} {"train_loss": -6.732351303100586, "global_step": 133037, "epoch": 3167} {"train_loss": -6.652565956115723, "global_step": 133038, "epoch": 3167} {"train_loss": -6.7833781242370605, "global_step": 133039, "epoch": 3167} {"train_loss": -6.789880275726318, "global_step": 133040, "epoch": 3167} {"train_loss": -6.756017684936523, "global_step": 133041, "epoch": 3167} {"train_loss": -6.7515339851379395, "global_step": 133042, "epoch": 3167} {"train_loss": -6.801322937011719, "global_step": 133043, "epoch": 3167} {"train_loss": -6.708927631378174, "global_step": 133044, "epoch": 3167} {"train_loss": -6.703069686889648, "global_step": 133045, "epoch": 3167} {"train_loss": -6.721832752227783, "global_step": 133046, "epoch": 3167} {"train_loss": -6.769673824310303, "global_step": 133047, "epoch": 3167} {"train_loss": -6.8101887702941895, "global_step": 133048, "epoch": 3167} {"train_loss": -6.8024187088012695, "global_step": 133049, "epoch": 3167} {"train_loss": -6.670555591583252, "global_step": 133050, "epoch": 3167} {"train_loss": -6.817255973815918, "global_step": 133051, "epoch": 3167} {"train_loss": -6.681310176849365, "global_step": 133052, "epoch": 3167} {"train_loss": -6.788349151611328, "global_step": 133053, "epoch": 3167} {"train_loss": -6.79820442199707, "global_step": 133054, "epoch": 3167} {"train_loss": -6.702579623176938, "global_step": 133055, "epoch": 3167, "val_loss": 66672.359375} {"train_loss": -6.772112846374512, "global_step": 133056, "epoch": 3168} {"train_loss": -6.864797592163086, "global_step": 133057, "epoch": 3168} {"train_loss": -6.691905498504639, "global_step": 133058, "epoch": 3168} {"train_loss": -6.708513259887695, "global_step": 133059, "epoch": 3168} {"train_loss": -6.719046592712402, "global_step": 133060, "epoch": 3168} {"train_loss": -6.647089004516602, "global_step": 133061, "epoch": 3168} {"train_loss": -6.792986869812012, "global_step": 133062, "epoch": 3168} {"train_loss": -6.825153827667236, "global_step": 133063, "epoch": 3168} {"train_loss": -6.737422943115234, "global_step": 133064, "epoch": 3168} {"train_loss": -6.758662700653076, "global_step": 133065, "epoch": 3168} {"train_loss": -6.690532684326172, "global_step": 133066, "epoch": 3168} {"train_loss": -6.703121185302734, "global_step": 133067, "epoch": 3168} {"train_loss": -6.789609909057617, "global_step": 133068, "epoch": 3168} {"train_loss": -6.7134504318237305, "global_step": 133069, "epoch": 3168} {"train_loss": -6.805796146392822, "global_step": 133070, "epoch": 3168} {"train_loss": -6.770771026611328, "global_step": 133071, "epoch": 3168} {"train_loss": -6.768518447875977, "global_step": 133072, "epoch": 3168} {"train_loss": -6.735936164855957, "global_step": 133073, "epoch": 3168} {"train_loss": -6.718545913696289, "global_step": 133074, "epoch": 3168} {"train_loss": -6.728704452514648, "global_step": 133075, "epoch": 3168} {"train_loss": -6.831890106201172, "global_step": 133076, "epoch": 3168} {"train_loss": -6.6432390213012695, "global_step": 133077, "epoch": 3168} {"train_loss": -6.7082977294921875, "global_step": 133078, "epoch": 3168} {"train_loss": -6.693285942077637, "global_step": 133079, "epoch": 3168} {"train_loss": -6.675939559936523, "global_step": 133080, "epoch": 3168} {"train_loss": -6.670577049255371, "global_step": 133081, "epoch": 3168} {"train_loss": -6.674132823944092, "global_step": 133082, "epoch": 3168} {"train_loss": -6.764664649963379, "global_step": 133083, "epoch": 3168} {"train_loss": -6.593871116638184, "global_step": 133084, "epoch": 3168} {"train_loss": -6.700726509094238, "global_step": 133085, "epoch": 3168} {"train_loss": -6.541838645935059, "global_step": 133086, "epoch": 3168} {"train_loss": -6.661229133605957, "global_step": 133087, "epoch": 3168} {"train_loss": -6.806888580322266, "global_step": 133088, "epoch": 3168} {"train_loss": -6.705807685852051, "global_step": 133089, "epoch": 3168} {"train_loss": -6.710072994232178, "global_step": 133090, "epoch": 3168} {"train_loss": -6.7234086990356445, "global_step": 133091, "epoch": 3168} {"train_loss": -6.701761245727539, "global_step": 133092, "epoch": 3168} {"train_loss": -6.670176982879639, "global_step": 133093, "epoch": 3168} {"train_loss": -6.645327568054199, "global_step": 133094, "epoch": 3168} {"train_loss": -6.6245832443237305, "global_step": 133095, "epoch": 3168} {"train_loss": -6.599097728729248, "global_step": 133096, "epoch": 3168} {"train_loss": -6.714893749782017, "global_step": 133097, "epoch": 3168, "val_loss": 66669.8984375} {"train_loss": -6.71012544631958, "global_step": 133098, "epoch": 3169} {"train_loss": -6.609376907348633, "global_step": 133099, "epoch": 3169} {"train_loss": -6.7337493896484375, "global_step": 133100, "epoch": 3169} {"train_loss": -6.711658477783203, "global_step": 133101, "epoch": 3169} {"train_loss": -6.630086421966553, "global_step": 133102, "epoch": 3169} {"train_loss": -6.706662178039551, "global_step": 133103, "epoch": 3169} {"train_loss": -6.692511558532715, "global_step": 133104, "epoch": 3169} {"train_loss": -6.625720977783203, "global_step": 133105, "epoch": 3169} {"train_loss": -6.541332244873047, "global_step": 133106, "epoch": 3169} {"train_loss": -6.617244243621826, "global_step": 133107, "epoch": 3169} {"train_loss": -6.5940141677856445, "global_step": 133108, "epoch": 3169} {"train_loss": -6.490397930145264, "global_step": 133109, "epoch": 3169} {"train_loss": -6.616900444030762, "global_step": 133110, "epoch": 3169} {"train_loss": -6.508366107940674, "global_step": 133111, "epoch": 3169} {"train_loss": -6.64176082611084, "global_step": 133112, "epoch": 3169} {"train_loss": -6.607694149017334, "global_step": 133113, "epoch": 3169} {"train_loss": -6.626760482788086, "global_step": 133114, "epoch": 3169} {"train_loss": -6.569965839385986, "global_step": 133115, "epoch": 3169} {"train_loss": -6.660353183746338, "global_step": 133116, "epoch": 3169} {"train_loss": -6.590899467468262, "global_step": 133117, "epoch": 3169} {"train_loss": -6.737900257110596, "global_step": 133118, "epoch": 3169} {"train_loss": -6.711226463317871, "global_step": 133119, "epoch": 3169} {"train_loss": -6.6538286209106445, "global_step": 133120, "epoch": 3169} {"train_loss": -6.591789245605469, "global_step": 133121, "epoch": 3169} {"train_loss": -6.617580413818359, "global_step": 133122, "epoch": 3169} {"train_loss": -6.767552375793457, "global_step": 133123, "epoch": 3169} {"train_loss": -6.702709197998047, "global_step": 133124, "epoch": 3169} {"train_loss": -6.703420162200928, "global_step": 133125, "epoch": 3169} {"train_loss": -6.791830062866211, "global_step": 133126, "epoch": 3169} {"train_loss": -6.625317096710205, "global_step": 133127, "epoch": 3169} {"train_loss": -6.564797878265381, "global_step": 133128, "epoch": 3169} {"train_loss": -6.723388671875, "global_step": 133129, "epoch": 3169} {"train_loss": -6.816978454589844, "global_step": 133130, "epoch": 3169} {"train_loss": -6.585750102996826, "global_step": 133131, "epoch": 3169} {"train_loss": -6.730572700500488, "global_step": 133132, "epoch": 3169} {"train_loss": -6.7417216300964355, "global_step": 133133, "epoch": 3169} {"train_loss": -6.55376672744751, "global_step": 133134, "epoch": 3169} {"train_loss": -6.7158203125, "global_step": 133135, "epoch": 3169} {"train_loss": -6.748544692993164, "global_step": 133136, "epoch": 3169} {"train_loss": -6.605266571044922, "global_step": 133137, "epoch": 3169} {"train_loss": -6.839753150939941, "global_step": 133138, "epoch": 3169} {"train_loss": -6.661265384583246, "global_step": 133139, "epoch": 3169, "val_loss": 66731.5625} {"train_loss": -6.8071794509887695, "global_step": 133140, "epoch": 3170} {"train_loss": -6.668813705444336, "global_step": 133141, "epoch": 3170} {"train_loss": -6.791132926940918, "global_step": 133142, "epoch": 3170} {"train_loss": -6.660553455352783, "global_step": 133143, "epoch": 3170} {"train_loss": -6.67954158782959, "global_step": 133144, "epoch": 3170} {"train_loss": -6.659672260284424, "global_step": 133145, "epoch": 3170} {"train_loss": -6.767867088317871, "global_step": 133146, "epoch": 3170} {"train_loss": -6.674674987792969, "global_step": 133147, "epoch": 3170} {"train_loss": -6.6696648597717285, "global_step": 133148, "epoch": 3170} {"train_loss": -6.783968925476074, "global_step": 133149, "epoch": 3170} {"train_loss": -6.67191219329834, "global_step": 133150, "epoch": 3170} {"train_loss": -6.708829879760742, "global_step": 133151, "epoch": 3170} {"train_loss": -6.740878105163574, "global_step": 133152, "epoch": 3170} {"train_loss": -6.772780418395996, "global_step": 133153, "epoch": 3170} {"train_loss": -6.672841548919678, "global_step": 133154, "epoch": 3170} {"train_loss": -6.623819351196289, "global_step": 133155, "epoch": 3170} {"train_loss": -6.688599586486816, "global_step": 133156, "epoch": 3170} {"train_loss": -6.676509380340576, "global_step": 133157, "epoch": 3170} {"train_loss": -6.763962745666504, "global_step": 133158, "epoch": 3170} {"train_loss": -6.807533264160156, "global_step": 133159, "epoch": 3170} {"train_loss": -6.73799991607666, "global_step": 133160, "epoch": 3170} {"train_loss": -6.746466636657715, "global_step": 133161, "epoch": 3170} {"train_loss": -6.678799629211426, "global_step": 133162, "epoch": 3170} {"train_loss": -6.716163635253906, "global_step": 133163, "epoch": 3170} {"train_loss": -6.745249271392822, "global_step": 133164, "epoch": 3170} {"train_loss": -6.764101028442383, "global_step": 133165, "epoch": 3170} {"train_loss": -6.591379165649414, "global_step": 133166, "epoch": 3170} {"train_loss": -6.670205593109131, "global_step": 133167, "epoch": 3170} {"train_loss": -6.701292991638184, "global_step": 133168, "epoch": 3170} {"train_loss": -6.565749168395996, "global_step": 133169, "epoch": 3170} {"train_loss": -6.6466064453125, "global_step": 133170, "epoch": 3170} {"train_loss": -6.771441459655762, "global_step": 133171, "epoch": 3170} {"train_loss": -6.6936845779418945, "global_step": 133172, "epoch": 3170} {"train_loss": -6.770442008972168, "global_step": 133173, "epoch": 3170} {"train_loss": -6.713535308837891, "global_step": 133174, "epoch": 3170} {"train_loss": -6.72048282623291, "global_step": 133175, "epoch": 3170} {"train_loss": -6.578394889831543, "global_step": 133176, "epoch": 3170} {"train_loss": -6.7292962074279785, "global_step": 133177, "epoch": 3170} {"train_loss": -6.690728664398193, "global_step": 133178, "epoch": 3170} {"train_loss": -6.655209541320801, "global_step": 133179, "epoch": 3170} {"train_loss": -6.7171783447265625, "global_step": 133180, "epoch": 3170} {"train_loss": -6.701625710441952, "global_step": 133181, "epoch": 3170, "val_loss": 66868.6640625} {"train_loss": -6.780076026916504, "global_step": 133182, "epoch": 3171} {"train_loss": -6.741336822509766, "global_step": 133183, "epoch": 3171} {"train_loss": -6.656408309936523, "global_step": 133184, "epoch": 3171} {"train_loss": -6.710452079772949, "global_step": 133185, "epoch": 3171} {"train_loss": -6.807188510894775, "global_step": 133186, "epoch": 3171} {"train_loss": -6.687922954559326, "global_step": 133187, "epoch": 3171} {"train_loss": -6.742936134338379, "global_step": 133188, "epoch": 3171} {"train_loss": -6.789816379547119, "global_step": 133189, "epoch": 3171} {"train_loss": -6.734344005584717, "global_step": 133190, "epoch": 3171} {"train_loss": -6.777881622314453, "global_step": 133191, "epoch": 3171} {"train_loss": -6.737454414367676, "global_step": 133192, "epoch": 3171} {"train_loss": -6.662442207336426, "global_step": 133193, "epoch": 3171} {"train_loss": -6.66220760345459, "global_step": 133194, "epoch": 3171} {"train_loss": -6.817977428436279, "global_step": 133195, "epoch": 3171} {"train_loss": -6.641407489776611, "global_step": 133196, "epoch": 3171} {"train_loss": -6.557108402252197, "global_step": 133197, "epoch": 3171} {"train_loss": -6.76674747467041, "global_step": 133198, "epoch": 3171} {"train_loss": -6.649430751800537, "global_step": 133199, "epoch": 3171} {"train_loss": -6.6652069091796875, "global_step": 133200, "epoch": 3171} {"train_loss": -6.673046588897705, "global_step": 133201, "epoch": 3171} {"train_loss": -6.718542575836182, "global_step": 133202, "epoch": 3171} {"train_loss": -6.671281814575195, "global_step": 133203, "epoch": 3171} {"train_loss": -6.69573974609375, "global_step": 133204, "epoch": 3171} {"train_loss": -6.592837333679199, "global_step": 133205, "epoch": 3171} {"train_loss": -6.708352088928223, "global_step": 133206, "epoch": 3171} {"train_loss": -6.7449421882629395, "global_step": 133207, "epoch": 3171} {"train_loss": -6.65803861618042, "global_step": 133208, "epoch": 3171} {"train_loss": -6.565756320953369, "global_step": 133209, "epoch": 3171} {"train_loss": -6.616859436035156, "global_step": 133210, "epoch": 3171} {"train_loss": -6.771226406097412, "global_step": 133211, "epoch": 3171} {"train_loss": -6.532870292663574, "global_step": 133212, "epoch": 3171} {"train_loss": -6.574012756347656, "global_step": 133213, "epoch": 3171} {"train_loss": -6.691103935241699, "global_step": 133214, "epoch": 3171} {"train_loss": -6.556496620178223, "global_step": 133215, "epoch": 3171} {"train_loss": -6.614052772521973, "global_step": 133216, "epoch": 3171} {"train_loss": -6.657184600830078, "global_step": 133217, "epoch": 3171} {"train_loss": -6.495059967041016, "global_step": 133218, "epoch": 3171} {"train_loss": -6.608638763427734, "global_step": 133219, "epoch": 3171} {"train_loss": -6.541877746582031, "global_step": 133220, "epoch": 3171} {"train_loss": -6.741199493408203, "global_step": 133221, "epoch": 3171} {"train_loss": -6.52566385269165, "global_step": 133222, "epoch": 3171} {"train_loss": -6.671974851971581, "global_step": 133223, "epoch": 3171, "val_loss": 66714.015625} {"train_loss": -6.618218421936035, "global_step": 133224, "epoch": 3172} {"train_loss": -6.648061275482178, "global_step": 133225, "epoch": 3172} {"train_loss": -6.760690212249756, "global_step": 133226, "epoch": 3172} {"train_loss": -6.670671463012695, "global_step": 133227, "epoch": 3172} {"train_loss": -6.768372535705566, "global_step": 133228, "epoch": 3172} {"train_loss": -6.807618618011475, "global_step": 133229, "epoch": 3172} {"train_loss": -6.755731105804443, "global_step": 133230, "epoch": 3172} {"train_loss": -6.657497406005859, "global_step": 133231, "epoch": 3172} {"train_loss": -6.676225662231445, "global_step": 133232, "epoch": 3172} {"train_loss": -6.7066545486450195, "global_step": 133233, "epoch": 3172} {"train_loss": -6.74705696105957, "global_step": 133234, "epoch": 3172} {"train_loss": -6.676229953765869, "global_step": 133235, "epoch": 3172} {"train_loss": -6.72111701965332, "global_step": 133236, "epoch": 3172} {"train_loss": -6.6866254806518555, "global_step": 133237, "epoch": 3172} {"train_loss": -6.7192277908325195, "global_step": 133238, "epoch": 3172} {"train_loss": -6.707218170166016, "global_step": 133239, "epoch": 3172} {"train_loss": -6.622485637664795, "global_step": 133240, "epoch": 3172} {"train_loss": -6.6688947677612305, "global_step": 133241, "epoch": 3172} {"train_loss": -6.616117477416992, "global_step": 133242, "epoch": 3172} {"train_loss": -6.775174140930176, "global_step": 133243, "epoch": 3172} {"train_loss": -6.752372741699219, "global_step": 133244, "epoch": 3172} {"train_loss": -6.6750898361206055, "global_step": 133245, "epoch": 3172} {"train_loss": -6.7213029861450195, "global_step": 133246, "epoch": 3172} {"train_loss": -6.780507564544678, "global_step": 133247, "epoch": 3172} {"train_loss": -6.680183410644531, "global_step": 133248, "epoch": 3172} {"train_loss": -6.827056884765625, "global_step": 133249, "epoch": 3172} {"train_loss": -6.682070732116699, "global_step": 133250, "epoch": 3172} {"train_loss": -6.696030139923096, "global_step": 133251, "epoch": 3172} {"train_loss": -6.566342830657959, "global_step": 133252, "epoch": 3172} {"train_loss": -6.6422119140625, "global_step": 133253, "epoch": 3172} {"train_loss": -6.70351505279541, "global_step": 133254, "epoch": 3172} {"train_loss": -6.755633354187012, "global_step": 133255, "epoch": 3172} {"train_loss": -6.622705459594727, "global_step": 133256, "epoch": 3172} {"train_loss": -6.70802116394043, "global_step": 133257, "epoch": 3172} {"train_loss": -6.611485958099365, "global_step": 133258, "epoch": 3172} {"train_loss": -6.731182098388672, "global_step": 133259, "epoch": 3172} {"train_loss": -6.769062042236328, "global_step": 133260, "epoch": 3172} {"train_loss": -6.74273157119751, "global_step": 133261, "epoch": 3172} {"train_loss": -6.643339157104492, "global_step": 133262, "epoch": 3172} {"train_loss": -6.749475479125977, "global_step": 133263, "epoch": 3172} {"train_loss": -6.713420867919922, "global_step": 133264, "epoch": 3172} {"train_loss": -6.704648120062692, "global_step": 133265, "epoch": 3172, "val_loss": 66646.3828125} {"train_loss": -6.704646110534668, "global_step": 133266, "epoch": 3173} {"train_loss": -6.6588969230651855, "global_step": 133267, "epoch": 3173} {"train_loss": -6.742620468139648, "global_step": 133268, "epoch": 3173} {"train_loss": -6.745668411254883, "global_step": 133269, "epoch": 3173} {"train_loss": -6.6470746994018555, "global_step": 133270, "epoch": 3173} {"train_loss": -6.677227973937988, "global_step": 133271, "epoch": 3173} {"train_loss": -6.81438684463501, "global_step": 133272, "epoch": 3173} {"train_loss": -6.670990467071533, "global_step": 133273, "epoch": 3173} {"train_loss": -6.777523517608643, "global_step": 133274, "epoch": 3173} {"train_loss": -6.678953170776367, "global_step": 133275, "epoch": 3173} {"train_loss": -6.6166791915893555, "global_step": 133276, "epoch": 3173} {"train_loss": -6.707636833190918, "global_step": 133277, "epoch": 3173} {"train_loss": -6.713074207305908, "global_step": 133278, "epoch": 3173} {"train_loss": -6.771353721618652, "global_step": 133279, "epoch": 3173} {"train_loss": -6.768240451812744, "global_step": 133280, "epoch": 3173} {"train_loss": -6.738092422485352, "global_step": 133281, "epoch": 3173} {"train_loss": -6.753726959228516, "global_step": 133282, "epoch": 3173} {"train_loss": -6.651430130004883, "global_step": 133283, "epoch": 3173} {"train_loss": -6.664821624755859, "global_step": 133284, "epoch": 3173} {"train_loss": -6.589357376098633, "global_step": 133285, "epoch": 3173} {"train_loss": -6.741387367248535, "global_step": 133286, "epoch": 3173} {"train_loss": -6.711550712585449, "global_step": 133287, "epoch": 3173} {"train_loss": -6.690250396728516, "global_step": 133288, "epoch": 3173} {"train_loss": -6.791949272155762, "global_step": 133289, "epoch": 3173} {"train_loss": -6.658266067504883, "global_step": 133290, "epoch": 3173} {"train_loss": -6.703498363494873, "global_step": 133291, "epoch": 3173} {"train_loss": -6.705348014831543, "global_step": 133292, "epoch": 3173} {"train_loss": -6.554704666137695, "global_step": 133293, "epoch": 3173} {"train_loss": -6.608852386474609, "global_step": 133294, "epoch": 3173} {"train_loss": -6.804370880126953, "global_step": 133295, "epoch": 3173} {"train_loss": -6.64699649810791, "global_step": 133296, "epoch": 3173} {"train_loss": -6.710785865783691, "global_step": 133297, "epoch": 3173} {"train_loss": -6.66552209854126, "global_step": 133298, "epoch": 3173} {"train_loss": -6.743124008178711, "global_step": 133299, "epoch": 3173} {"train_loss": -6.681644439697266, "global_step": 133300, "epoch": 3173} {"train_loss": -6.652559280395508, "global_step": 133301, "epoch": 3173} {"train_loss": -6.587129592895508, "global_step": 133302, "epoch": 3173} {"train_loss": -6.718831539154053, "global_step": 133303, "epoch": 3173} {"train_loss": -6.658390045166016, "global_step": 133304, "epoch": 3173} {"train_loss": -6.715835094451904, "global_step": 133305, "epoch": 3173} {"train_loss": -6.68479061126709, "global_step": 133306, "epoch": 3173} {"train_loss": -6.693934667678106, "global_step": 133307, "epoch": 3173, "val_loss": 67085.484375} {"train_loss": -6.727510929107666, "global_step": 133308, "epoch": 3174} {"train_loss": -6.686816692352295, "global_step": 133309, "epoch": 3174} {"train_loss": -6.812783241271973, "global_step": 133310, "epoch": 3174} {"train_loss": -6.649602890014648, "global_step": 133311, "epoch": 3174} {"train_loss": -6.662079811096191, "global_step": 133312, "epoch": 3174} {"train_loss": -6.6834516525268555, "global_step": 133313, "epoch": 3174} {"train_loss": -6.653823375701904, "global_step": 133314, "epoch": 3174} {"train_loss": -6.663033962249756, "global_step": 133315, "epoch": 3174} {"train_loss": -6.714044570922852, "global_step": 133316, "epoch": 3174} {"train_loss": -6.716651916503906, "global_step": 133317, "epoch": 3174} {"train_loss": -6.569232940673828, "global_step": 133318, "epoch": 3174} {"train_loss": -6.73805046081543, "global_step": 133319, "epoch": 3174} {"train_loss": -6.5939717292785645, "global_step": 133320, "epoch": 3174} {"train_loss": -6.524742603302002, "global_step": 133321, "epoch": 3174} {"train_loss": -6.630134105682373, "global_step": 133322, "epoch": 3174} {"train_loss": -6.662088394165039, "global_step": 133323, "epoch": 3174} {"train_loss": -6.644113540649414, "global_step": 133324, "epoch": 3174} {"train_loss": -6.499072551727295, "global_step": 133325, "epoch": 3174} {"train_loss": -6.62802791595459, "global_step": 133326, "epoch": 3174} {"train_loss": -6.690618515014648, "global_step": 133327, "epoch": 3174} {"train_loss": -6.568917751312256, "global_step": 133328, "epoch": 3174} {"train_loss": -6.472294330596924, "global_step": 133329, "epoch": 3174} {"train_loss": -6.5820207595825195, "global_step": 133330, "epoch": 3174} {"train_loss": -6.681972980499268, "global_step": 133331, "epoch": 3174} {"train_loss": -6.656191825866699, "global_step": 133332, "epoch": 3174} {"train_loss": -6.516506671905518, "global_step": 133333, "epoch": 3174} {"train_loss": -6.668105125427246, "global_step": 133334, "epoch": 3174} {"train_loss": -6.668092727661133, "global_step": 133335, "epoch": 3174} {"train_loss": -6.661507606506348, "global_step": 133336, "epoch": 3174} {"train_loss": -6.751788139343262, "global_step": 133337, "epoch": 3174} {"train_loss": -6.700172424316406, "global_step": 133338, "epoch": 3174} {"train_loss": -6.61202335357666, "global_step": 133339, "epoch": 3174} {"train_loss": -6.764263153076172, "global_step": 133340, "epoch": 3174} {"train_loss": -6.628832817077637, "global_step": 133341, "epoch": 3174} {"train_loss": -6.681439399719238, "global_step": 133342, "epoch": 3174} {"train_loss": -6.709733009338379, "global_step": 133343, "epoch": 3174} {"train_loss": -6.641685485839844, "global_step": 133344, "epoch": 3174} {"train_loss": -6.727179527282715, "global_step": 133345, "epoch": 3174} {"train_loss": -6.761582374572754, "global_step": 133346, "epoch": 3174} {"train_loss": -6.602241516113281, "global_step": 133347, "epoch": 3174} {"train_loss": -6.898448944091797, "global_step": 133348, "epoch": 3174} {"train_loss": -6.66217413402739, "global_step": 133349, "epoch": 3174, "val_loss": 66749.1953125} {"train_loss": -6.735956192016602, "global_step": 133350, "epoch": 3175} {"train_loss": -6.622316360473633, "global_step": 133351, "epoch": 3175} {"train_loss": -6.659546852111816, "global_step": 133352, "epoch": 3175} {"train_loss": -6.623703956604004, "global_step": 133353, "epoch": 3175} {"train_loss": -6.775019645690918, "global_step": 133354, "epoch": 3175} {"train_loss": -6.6687822341918945, "global_step": 133355, "epoch": 3175} {"train_loss": -6.619332313537598, "global_step": 133356, "epoch": 3175} {"train_loss": -6.686732292175293, "global_step": 133357, "epoch": 3175} {"train_loss": -6.6382951736450195, "global_step": 133358, "epoch": 3175} {"train_loss": -6.679522514343262, "global_step": 133359, "epoch": 3175} {"train_loss": -6.636651039123535, "global_step": 133360, "epoch": 3175} {"train_loss": -6.699533462524414, "global_step": 133361, "epoch": 3175} {"train_loss": -6.676638603210449, "global_step": 133362, "epoch": 3175} {"train_loss": -6.5978922843933105, "global_step": 133363, "epoch": 3175} {"train_loss": -6.673028945922852, "global_step": 133364, "epoch": 3175} {"train_loss": -6.621650695800781, "global_step": 133365, "epoch": 3175} {"train_loss": -6.61777400970459, "global_step": 133366, "epoch": 3175} {"train_loss": -6.670816421508789, "global_step": 133367, "epoch": 3175} {"train_loss": -6.593745231628418, "global_step": 133368, "epoch": 3175} {"train_loss": -6.634064197540283, "global_step": 133369, "epoch": 3175} {"train_loss": -6.608087539672852, "global_step": 133370, "epoch": 3175} {"train_loss": -6.618259429931641, "global_step": 133371, "epoch": 3175} {"train_loss": -6.5693511962890625, "global_step": 133372, "epoch": 3175} {"train_loss": -6.682946681976318, "global_step": 133373, "epoch": 3175} {"train_loss": -6.695852756500244, "global_step": 133374, "epoch": 3175} {"train_loss": -6.703704833984375, "global_step": 133375, "epoch": 3175} {"train_loss": -6.749168395996094, "global_step": 133376, "epoch": 3175} {"train_loss": -6.742711067199707, "global_step": 133377, "epoch": 3175} {"train_loss": -6.7479400634765625, "global_step": 133378, "epoch": 3175} {"train_loss": -6.783145904541016, "global_step": 133379, "epoch": 3175} {"train_loss": -6.683564186096191, "global_step": 133380, "epoch": 3175} {"train_loss": -6.61457633972168, "global_step": 133381, "epoch": 3175} {"train_loss": -6.764440536499023, "global_step": 133382, "epoch": 3175} {"train_loss": -6.655187606811523, "global_step": 133383, "epoch": 3175} {"train_loss": -6.756416320800781, "global_step": 133384, "epoch": 3175} {"train_loss": -6.7369279861450195, "global_step": 133385, "epoch": 3175} {"train_loss": -6.798956871032715, "global_step": 133386, "epoch": 3175} {"train_loss": -6.683162689208984, "global_step": 133387, "epoch": 3175} {"train_loss": -6.787057399749756, "global_step": 133388, "epoch": 3175} {"train_loss": -6.6923723220825195, "global_step": 133389, "epoch": 3175} {"train_loss": -6.653491973876953, "global_step": 133390, "epoch": 3175} {"train_loss": -6.680094866525559, "global_step": 133391, "epoch": 3175, "val_loss": 66671.484375} {"train_loss": -6.727529048919678, "global_step": 133392, "epoch": 3176} {"train_loss": -6.692291259765625, "global_step": 133393, "epoch": 3176} {"train_loss": -6.694207668304443, "global_step": 133394, "epoch": 3176} {"train_loss": -6.686008453369141, "global_step": 133395, "epoch": 3176} {"train_loss": -6.670543193817139, "global_step": 133396, "epoch": 3176} {"train_loss": -6.5781354904174805, "global_step": 133397, "epoch": 3176} {"train_loss": -6.843985080718994, "global_step": 133398, "epoch": 3176} {"train_loss": -6.729435920715332, "global_step": 133399, "epoch": 3176} {"train_loss": -6.80998420715332, "global_step": 133400, "epoch": 3176} {"train_loss": -6.811850070953369, "global_step": 133401, "epoch": 3176} {"train_loss": -6.693728446960449, "global_step": 133402, "epoch": 3176} {"train_loss": -6.769423484802246, "global_step": 133403, "epoch": 3176} {"train_loss": -6.690174102783203, "global_step": 133404, "epoch": 3176} {"train_loss": -6.6659345626831055, "global_step": 133405, "epoch": 3176} {"train_loss": -6.8262481689453125, "global_step": 133406, "epoch": 3176} {"train_loss": -6.6939520835876465, "global_step": 133407, "epoch": 3176} {"train_loss": -6.644173622131348, "global_step": 133408, "epoch": 3176} {"train_loss": -6.7005696296691895, "global_step": 133409, "epoch": 3176} {"train_loss": -6.663431644439697, "global_step": 133410, "epoch": 3176} {"train_loss": -6.765403747558594, "global_step": 133411, "epoch": 3176} {"train_loss": -6.7256669998168945, "global_step": 133412, "epoch": 3176} {"train_loss": -6.777009963989258, "global_step": 133413, "epoch": 3176} {"train_loss": -6.755792617797852, "global_step": 133414, "epoch": 3176} {"train_loss": -6.747747421264648, "global_step": 133415, "epoch": 3176} {"train_loss": -6.684309959411621, "global_step": 133416, "epoch": 3176} {"train_loss": -6.802769184112549, "global_step": 133417, "epoch": 3176} {"train_loss": -6.624035835266113, "global_step": 133418, "epoch": 3176} {"train_loss": -6.68735933303833, "global_step": 133419, "epoch": 3176} {"train_loss": -6.7963175773620605, "global_step": 133420, "epoch": 3176} {"train_loss": -6.765084266662598, "global_step": 133421, "epoch": 3176} {"train_loss": -6.7079010009765625, "global_step": 133422, "epoch": 3176} {"train_loss": -6.584985733032227, "global_step": 133423, "epoch": 3176} {"train_loss": -6.682043075561523, "global_step": 133424, "epoch": 3176} {"train_loss": -6.760241508483887, "global_step": 133425, "epoch": 3176} {"train_loss": -6.729649066925049, "global_step": 133426, "epoch": 3176} {"train_loss": -6.636861324310303, "global_step": 133427, "epoch": 3176} {"train_loss": -6.705930233001709, "global_step": 133428, "epoch": 3176} {"train_loss": -6.5643768310546875, "global_step": 133429, "epoch": 3176} {"train_loss": -6.676934242248535, "global_step": 133430, "epoch": 3176} {"train_loss": -6.700248718261719, "global_step": 133431, "epoch": 3176} {"train_loss": -6.679718017578125, "global_step": 133432, "epoch": 3176} {"train_loss": -6.7090552761441185, "global_step": 133433, "epoch": 3176, "val_loss": 67157.625} {"train_loss": -6.703296661376953, "global_step": 133434, "epoch": 3177} {"train_loss": -6.660613536834717, "global_step": 133435, "epoch": 3177} {"train_loss": -6.6859869956970215, "global_step": 133436, "epoch": 3177} {"train_loss": -6.659037113189697, "global_step": 133437, "epoch": 3177} {"train_loss": -6.71482515335083, "global_step": 133438, "epoch": 3177} {"train_loss": -6.717212677001953, "global_step": 133439, "epoch": 3177} {"train_loss": -6.674856662750244, "global_step": 133440, "epoch": 3177} {"train_loss": -6.751182556152344, "global_step": 133441, "epoch": 3177} {"train_loss": -6.791092872619629, "global_step": 133442, "epoch": 3177} {"train_loss": -6.777179718017578, "global_step": 133443, "epoch": 3177} {"train_loss": -6.732948303222656, "global_step": 133444, "epoch": 3177} {"train_loss": -6.758918285369873, "global_step": 133445, "epoch": 3177} {"train_loss": -6.6978325843811035, "global_step": 133446, "epoch": 3177} {"train_loss": -6.713466644287109, "global_step": 133447, "epoch": 3177} {"train_loss": -6.709628105163574, "global_step": 133448, "epoch": 3177} {"train_loss": -6.782936096191406, "global_step": 133449, "epoch": 3177} {"train_loss": -6.747025012969971, "global_step": 133450, "epoch": 3177} {"train_loss": -6.649493217468262, "global_step": 133451, "epoch": 3177} {"train_loss": -6.735876083374023, "global_step": 133452, "epoch": 3177} {"train_loss": -6.798986434936523, "global_step": 133453, "epoch": 3177} {"train_loss": -6.613837242126465, "global_step": 133454, "epoch": 3177} {"train_loss": -6.786497116088867, "global_step": 133455, "epoch": 3177} {"train_loss": -6.623504638671875, "global_step": 133456, "epoch": 3177} {"train_loss": -6.670085430145264, "global_step": 133457, "epoch": 3177} {"train_loss": -6.710499286651611, "global_step": 133458, "epoch": 3177} {"train_loss": -6.675018310546875, "global_step": 133459, "epoch": 3177} {"train_loss": -6.697364330291748, "global_step": 133460, "epoch": 3177} {"train_loss": -6.738552093505859, "global_step": 133461, "epoch": 3177} {"train_loss": -6.795954704284668, "global_step": 133462, "epoch": 3177} {"train_loss": -6.784292221069336, "global_step": 133463, "epoch": 3177} {"train_loss": -6.743744850158691, "global_step": 133464, "epoch": 3177} {"train_loss": -6.726706504821777, "global_step": 133465, "epoch": 3177} {"train_loss": -6.789325714111328, "global_step": 133466, "epoch": 3177} {"train_loss": -6.775465965270996, "global_step": 133467, "epoch": 3177} {"train_loss": -6.732420444488525, "global_step": 133468, "epoch": 3177} {"train_loss": -6.699041366577148, "global_step": 133469, "epoch": 3177} {"train_loss": -6.81000280380249, "global_step": 133470, "epoch": 3177} {"train_loss": -6.791521072387695, "global_step": 133471, "epoch": 3177} {"train_loss": -6.746919631958008, "global_step": 133472, "epoch": 3177} {"train_loss": -6.720943450927734, "global_step": 133473, "epoch": 3177} {"train_loss": -6.691661834716797, "global_step": 133474, "epoch": 3177} {"train_loss": -6.723041682016282, "global_step": 133475, "epoch": 3177, "val_loss": 66780.8046875} {"train_loss": -6.785318374633789, "global_step": 133476, "epoch": 3178} {"train_loss": -6.666389465332031, "global_step": 133477, "epoch": 3178} {"train_loss": -6.823972225189209, "global_step": 133478, "epoch": 3178} {"train_loss": -6.817227363586426, "global_step": 133479, "epoch": 3178} {"train_loss": -6.758537769317627, "global_step": 133480, "epoch": 3178} {"train_loss": -6.664956569671631, "global_step": 133481, "epoch": 3178} {"train_loss": -6.775454044342041, "global_step": 133482, "epoch": 3178} {"train_loss": -6.772230625152588, "global_step": 133483, "epoch": 3178} {"train_loss": -6.675315856933594, "global_step": 133484, "epoch": 3178} {"train_loss": -6.744388580322266, "global_step": 133485, "epoch": 3178} {"train_loss": -6.731929779052734, "global_step": 133486, "epoch": 3178} {"train_loss": -6.842878341674805, "global_step": 133487, "epoch": 3178} {"train_loss": -6.708560466766357, "global_step": 133488, "epoch": 3178} {"train_loss": -6.6782989501953125, "global_step": 133489, "epoch": 3178} {"train_loss": -6.7631988525390625, "global_step": 133490, "epoch": 3178} {"train_loss": -6.696146011352539, "global_step": 133491, "epoch": 3178} {"train_loss": -6.7748870849609375, "global_step": 133492, "epoch": 3178} {"train_loss": -6.781564712524414, "global_step": 133493, "epoch": 3178} {"train_loss": -6.792751312255859, "global_step": 133494, "epoch": 3178} {"train_loss": -6.697504043579102, "global_step": 133495, "epoch": 3178} {"train_loss": -6.630007743835449, "global_step": 133496, "epoch": 3178} {"train_loss": -6.735467910766602, "global_step": 133497, "epoch": 3178} {"train_loss": -6.591721534729004, "global_step": 133498, "epoch": 3178} {"train_loss": -6.709657669067383, "global_step": 133499, "epoch": 3178} {"train_loss": -6.75167989730835, "global_step": 133500, "epoch": 3178} {"train_loss": -6.697371482849121, "global_step": 133501, "epoch": 3178} {"train_loss": -6.7356858253479, "global_step": 133502, "epoch": 3178} {"train_loss": -6.743547439575195, "global_step": 133503, "epoch": 3178} {"train_loss": -6.6771392822265625, "global_step": 133504, "epoch": 3178} {"train_loss": -6.7381134033203125, "global_step": 133505, "epoch": 3178} {"train_loss": -6.6800079345703125, "global_step": 133506, "epoch": 3178} {"train_loss": -6.514256954193115, "global_step": 133507, "epoch": 3178} {"train_loss": -6.63037633895874, "global_step": 133508, "epoch": 3178} {"train_loss": -6.635025978088379, "global_step": 133509, "epoch": 3178} {"train_loss": -6.502223968505859, "global_step": 133510, "epoch": 3178} {"train_loss": -6.657212257385254, "global_step": 133511, "epoch": 3178} {"train_loss": -6.683504104614258, "global_step": 133512, "epoch": 3178} {"train_loss": -6.612802505493164, "global_step": 133513, "epoch": 3178} {"train_loss": -6.543252944946289, "global_step": 133514, "epoch": 3178} {"train_loss": -6.570194244384766, "global_step": 133515, "epoch": 3178} {"train_loss": -6.598405361175537, "global_step": 133516, "epoch": 3178} {"train_loss": -6.693459283737909, "global_step": 133517, "epoch": 3178, "val_loss": 66877.4453125} {"train_loss": -6.671028137207031, "global_step": 133518, "epoch": 3179} {"train_loss": -6.450456142425537, "global_step": 133519, "epoch": 3179} {"train_loss": -6.704180717468262, "global_step": 133520, "epoch": 3179} {"train_loss": -6.5078229904174805, "global_step": 133521, "epoch": 3179} {"train_loss": -6.578998565673828, "global_step": 133522, "epoch": 3179} {"train_loss": -6.613349914550781, "global_step": 133523, "epoch": 3179} {"train_loss": -6.583446502685547, "global_step": 133524, "epoch": 3179} {"train_loss": -6.641550064086914, "global_step": 133525, "epoch": 3179} {"train_loss": -6.540575981140137, "global_step": 133526, "epoch": 3179} {"train_loss": -6.622066974639893, "global_step": 133527, "epoch": 3179} {"train_loss": -6.63029146194458, "global_step": 133528, "epoch": 3179} {"train_loss": -6.642102241516113, "global_step": 133529, "epoch": 3179} {"train_loss": -6.665320873260498, "global_step": 133530, "epoch": 3179} {"train_loss": -6.5417656898498535, "global_step": 133531, "epoch": 3179} {"train_loss": -6.725411891937256, "global_step": 133532, "epoch": 3179} {"train_loss": -6.736882209777832, "global_step": 133533, "epoch": 3179} {"train_loss": -6.55495548248291, "global_step": 133534, "epoch": 3179} {"train_loss": -6.713665962219238, "global_step": 133535, "epoch": 3179} {"train_loss": -6.717281341552734, "global_step": 133536, "epoch": 3179} {"train_loss": -6.724688529968262, "global_step": 133537, "epoch": 3179} {"train_loss": -6.665585994720459, "global_step": 133538, "epoch": 3179} {"train_loss": -6.709714412689209, "global_step": 133539, "epoch": 3179} {"train_loss": -6.632046699523926, "global_step": 133540, "epoch": 3179} {"train_loss": -6.571390628814697, "global_step": 133541, "epoch": 3179} {"train_loss": -6.725106239318848, "global_step": 133542, "epoch": 3179} {"train_loss": -6.634030342102051, "global_step": 133543, "epoch": 3179} {"train_loss": -6.6818156242370605, "global_step": 133544, "epoch": 3179} {"train_loss": -6.639186382293701, "global_step": 133545, "epoch": 3179} {"train_loss": -6.703427791595459, "global_step": 133546, "epoch": 3179} {"train_loss": -6.658891677856445, "global_step": 133547, "epoch": 3179} {"train_loss": -6.6181535720825195, "global_step": 133548, "epoch": 3179} {"train_loss": -6.7527360916137695, "global_step": 133549, "epoch": 3179} {"train_loss": -6.792026519775391, "global_step": 133550, "epoch": 3179} {"train_loss": -6.771872520446777, "global_step": 133551, "epoch": 3179} {"train_loss": -6.557141304016113, "global_step": 133552, "epoch": 3179} {"train_loss": -6.654850482940674, "global_step": 133553, "epoch": 3179} {"train_loss": -6.682790279388428, "global_step": 133554, "epoch": 3179} {"train_loss": -6.757589817047119, "global_step": 133555, "epoch": 3179} {"train_loss": -6.509672164916992, "global_step": 133556, "epoch": 3179} {"train_loss": -6.78014612197876, "global_step": 133557, "epoch": 3179} {"train_loss": -6.677007675170898, "global_step": 133558, "epoch": 3179} {"train_loss": -6.65343595686413, "global_step": 133559, "epoch": 3179, "val_loss": 66867.0} {"train_loss": -6.723234176635742, "global_step": 133560, "epoch": 3180} {"train_loss": -6.606496810913086, "global_step": 133561, "epoch": 3180} {"train_loss": -6.651589393615723, "global_step": 133562, "epoch": 3180} {"train_loss": -6.770876884460449, "global_step": 133563, "epoch": 3180} {"train_loss": -6.655013084411621, "global_step": 133564, "epoch": 3180} {"train_loss": -6.805713653564453, "global_step": 133565, "epoch": 3180} {"train_loss": -6.692773342132568, "global_step": 133566, "epoch": 3180} {"train_loss": -6.679473876953125, "global_step": 133567, "epoch": 3180} {"train_loss": -6.784303188323975, "global_step": 133568, "epoch": 3180} {"train_loss": -6.641623497009277, "global_step": 133569, "epoch": 3180} {"train_loss": -6.720329284667969, "global_step": 133570, "epoch": 3180} {"train_loss": -6.757841110229492, "global_step": 133571, "epoch": 3180} {"train_loss": -6.63386344909668, "global_step": 133572, "epoch": 3180} {"train_loss": -6.633993148803711, "global_step": 133573, "epoch": 3180} {"train_loss": -6.6848955154418945, "global_step": 133574, "epoch": 3180} {"train_loss": -6.686002731323242, "global_step": 133575, "epoch": 3180} {"train_loss": -6.693210601806641, "global_step": 133576, "epoch": 3180} {"train_loss": -6.6834025382995605, "global_step": 133577, "epoch": 3180} {"train_loss": -6.719948768615723, "global_step": 133578, "epoch": 3180} {"train_loss": -6.656914710998535, "global_step": 133579, "epoch": 3180} {"train_loss": -6.650404930114746, "global_step": 133580, "epoch": 3180} {"train_loss": -6.631461143493652, "global_step": 133581, "epoch": 3180} {"train_loss": -6.754172325134277, "global_step": 133582, "epoch": 3180} {"train_loss": -6.571809768676758, "global_step": 133583, "epoch": 3180} {"train_loss": -6.656628131866455, "global_step": 133584, "epoch": 3180} {"train_loss": -6.651447296142578, "global_step": 133585, "epoch": 3180} {"train_loss": -6.576661586761475, "global_step": 133586, "epoch": 3180} {"train_loss": -6.5496721267700195, "global_step": 133587, "epoch": 3180} {"train_loss": -6.718642234802246, "global_step": 133588, "epoch": 3180} {"train_loss": -6.645695209503174, "global_step": 133589, "epoch": 3180} {"train_loss": -6.580684661865234, "global_step": 133590, "epoch": 3180} {"train_loss": -6.715883731842041, "global_step": 133591, "epoch": 3180} {"train_loss": -6.728710174560547, "global_step": 133592, "epoch": 3180} {"train_loss": -6.720058917999268, "global_step": 133593, "epoch": 3180} {"train_loss": -6.693978309631348, "global_step": 133594, "epoch": 3180} {"train_loss": -6.654609680175781, "global_step": 133595, "epoch": 3180} {"train_loss": -6.726097106933594, "global_step": 133596, "epoch": 3180} {"train_loss": -6.686959743499756, "global_step": 133597, "epoch": 3180} {"train_loss": -6.749824523925781, "global_step": 133598, "epoch": 3180} {"train_loss": -6.835447788238525, "global_step": 133599, "epoch": 3180} {"train_loss": -6.692462921142578, "global_step": 133600, "epoch": 3180} {"train_loss": -6.687545254116967, "global_step": 133601, "epoch": 3180, "val_loss": 66897.5703125} {"train_loss": -6.695058822631836, "global_step": 133602, "epoch": 3181} {"train_loss": -6.699633598327637, "global_step": 133603, "epoch": 3181} {"train_loss": -6.774260520935059, "global_step": 133604, "epoch": 3181} {"train_loss": -6.725945472717285, "global_step": 133605, "epoch": 3181} {"train_loss": -6.663398742675781, "global_step": 133606, "epoch": 3181} {"train_loss": -6.597249507904053, "global_step": 133607, "epoch": 3181} {"train_loss": -6.707395553588867, "global_step": 133608, "epoch": 3181} {"train_loss": -6.815704345703125, "global_step": 133609, "epoch": 3181} {"train_loss": -6.715064525604248, "global_step": 133610, "epoch": 3181} {"train_loss": -6.663911819458008, "global_step": 133611, "epoch": 3181} {"train_loss": -6.672762870788574, "global_step": 133612, "epoch": 3181} {"train_loss": -6.770358085632324, "global_step": 133613, "epoch": 3181} {"train_loss": -6.55921745300293, "global_step": 133614, "epoch": 3181} {"train_loss": -6.699302673339844, "global_step": 133615, "epoch": 3181} {"train_loss": -6.681410312652588, "global_step": 133616, "epoch": 3181} {"train_loss": -6.730812072753906, "global_step": 133617, "epoch": 3181} {"train_loss": -6.680141448974609, "global_step": 133618, "epoch": 3181} {"train_loss": -6.672418117523193, "global_step": 133619, "epoch": 3181} {"train_loss": -6.835007190704346, "global_step": 133620, "epoch": 3181} {"train_loss": -6.684460639953613, "global_step": 133621, "epoch": 3181} {"train_loss": -6.776499271392822, "global_step": 133622, "epoch": 3181} {"train_loss": -6.685398101806641, "global_step": 133623, "epoch": 3181} {"train_loss": -6.739878177642822, "global_step": 133624, "epoch": 3181} {"train_loss": -6.680459022521973, "global_step": 133625, "epoch": 3181} {"train_loss": -6.690372467041016, "global_step": 133626, "epoch": 3181} {"train_loss": -6.65355110168457, "global_step": 133627, "epoch": 3181} {"train_loss": -6.82633113861084, "global_step": 133628, "epoch": 3181} {"train_loss": -6.806960105895996, "global_step": 133629, "epoch": 3181} {"train_loss": -6.659241676330566, "global_step": 133630, "epoch": 3181} {"train_loss": -6.850088119506836, "global_step": 133631, "epoch": 3181} {"train_loss": -6.714392185211182, "global_step": 133632, "epoch": 3181} {"train_loss": -6.636904239654541, "global_step": 133633, "epoch": 3181} {"train_loss": -6.776035785675049, "global_step": 133634, "epoch": 3181} {"train_loss": -6.694827556610107, "global_step": 133635, "epoch": 3181} {"train_loss": -6.719125747680664, "global_step": 133636, "epoch": 3181} {"train_loss": -6.708300590515137, "global_step": 133637, "epoch": 3181} {"train_loss": -6.733828544616699, "global_step": 133638, "epoch": 3181} {"train_loss": -6.804202079772949, "global_step": 133639, "epoch": 3181} {"train_loss": -6.726687431335449, "global_step": 133640, "epoch": 3181} {"train_loss": -6.666127681732178, "global_step": 133641, "epoch": 3181} {"train_loss": -6.722917556762695, "global_step": 133642, "epoch": 3181} {"train_loss": -6.712988444737026, "global_step": 133643, "epoch": 3181, "val_loss": 66954.4453125} {"train_loss": -6.726490497589111, "global_step": 133644, "epoch": 3182} {"train_loss": -6.693470001220703, "global_step": 133645, "epoch": 3182} {"train_loss": -6.716762542724609, "global_step": 133646, "epoch": 3182} {"train_loss": -6.8023576736450195, "global_step": 133647, "epoch": 3182} {"train_loss": -6.720881938934326, "global_step": 133648, "epoch": 3182} {"train_loss": -6.601443290710449, "global_step": 133649, "epoch": 3182} {"train_loss": -6.631528854370117, "global_step": 133650, "epoch": 3182} {"train_loss": -6.640881061553955, "global_step": 133651, "epoch": 3182} {"train_loss": -6.636960029602051, "global_step": 133652, "epoch": 3182} {"train_loss": -6.736569881439209, "global_step": 133653, "epoch": 3182} {"train_loss": -6.6304931640625, "global_step": 133654, "epoch": 3182} {"train_loss": -6.756248474121094, "global_step": 133655, "epoch": 3182} {"train_loss": -6.790192604064941, "global_step": 133656, "epoch": 3182} {"train_loss": -6.6756134033203125, "global_step": 133657, "epoch": 3182} {"train_loss": -6.719156742095947, "global_step": 133658, "epoch": 3182} {"train_loss": -6.70319938659668, "global_step": 133659, "epoch": 3182} {"train_loss": -6.742663383483887, "global_step": 133660, "epoch": 3182} {"train_loss": -6.829614162445068, "global_step": 133661, "epoch": 3182} {"train_loss": -6.746825218200684, "global_step": 133662, "epoch": 3182} {"train_loss": -6.6242828369140625, "global_step": 133663, "epoch": 3182} {"train_loss": -6.786033630371094, "global_step": 133664, "epoch": 3182} {"train_loss": -6.741782188415527, "global_step": 133665, "epoch": 3182} {"train_loss": -6.689299583435059, "global_step": 133666, "epoch": 3182} {"train_loss": -6.713903903961182, "global_step": 133667, "epoch": 3182} {"train_loss": -6.751267433166504, "global_step": 133668, "epoch": 3182} {"train_loss": -6.7054948806762695, "global_step": 133669, "epoch": 3182} {"train_loss": -6.677618980407715, "global_step": 133670, "epoch": 3182} {"train_loss": -6.803718566894531, "global_step": 133671, "epoch": 3182} {"train_loss": -6.760444641113281, "global_step": 133672, "epoch": 3182} {"train_loss": -6.695042133331299, "global_step": 133673, "epoch": 3182} {"train_loss": -6.809762001037598, "global_step": 133674, "epoch": 3182} {"train_loss": -6.804224491119385, "global_step": 133675, "epoch": 3182} {"train_loss": -6.7047529220581055, "global_step": 133676, "epoch": 3182} {"train_loss": -6.570991516113281, "global_step": 133677, "epoch": 3182} {"train_loss": -6.602222442626953, "global_step": 133678, "epoch": 3182} {"train_loss": -6.725884914398193, "global_step": 133679, "epoch": 3182} {"train_loss": -6.564547538757324, "global_step": 133680, "epoch": 3182} {"train_loss": -6.818014144897461, "global_step": 133681, "epoch": 3182} {"train_loss": -6.636562347412109, "global_step": 133682, "epoch": 3182} {"train_loss": -6.475914001464844, "global_step": 133683, "epoch": 3182} {"train_loss": -6.759628772735596, "global_step": 133684, "epoch": 3182} {"train_loss": -6.700044575191679, "global_step": 133685, "epoch": 3182, "val_loss": 66600.4609375} {"train_loss": -6.71462345123291, "global_step": 133686, "epoch": 3183} {"train_loss": -6.822261333465576, "global_step": 133687, "epoch": 3183} {"train_loss": -6.735771179199219, "global_step": 133688, "epoch": 3183} {"train_loss": -6.662263870239258, "global_step": 133689, "epoch": 3183} {"train_loss": -6.672725677490234, "global_step": 133690, "epoch": 3183} {"train_loss": -6.542140960693359, "global_step": 133691, "epoch": 3183} {"train_loss": -6.672786712646484, "global_step": 133692, "epoch": 3183} {"train_loss": -6.59687614440918, "global_step": 133693, "epoch": 3183} {"train_loss": -6.749844074249268, "global_step": 133694, "epoch": 3183} {"train_loss": -6.707746505737305, "global_step": 133695, "epoch": 3183} {"train_loss": -6.707047462463379, "global_step": 133696, "epoch": 3183} {"train_loss": -6.740566730499268, "global_step": 133697, "epoch": 3183} {"train_loss": -6.684018135070801, "global_step": 133698, "epoch": 3183} {"train_loss": -6.647479057312012, "global_step": 133699, "epoch": 3183} {"train_loss": -6.728955268859863, "global_step": 133700, "epoch": 3183} {"train_loss": -6.67574405670166, "global_step": 133701, "epoch": 3183} {"train_loss": -6.721752166748047, "global_step": 133702, "epoch": 3183} {"train_loss": -6.678583145141602, "global_step": 133703, "epoch": 3183} {"train_loss": -6.717169761657715, "global_step": 133704, "epoch": 3183} {"train_loss": -6.710060119628906, "global_step": 133705, "epoch": 3183} {"train_loss": -6.739965915679932, "global_step": 133706, "epoch": 3183} {"train_loss": -6.640561103820801, "global_step": 133707, "epoch": 3183} {"train_loss": -6.7354631423950195, "global_step": 133708, "epoch": 3183} {"train_loss": -6.638808250427246, "global_step": 133709, "epoch": 3183} {"train_loss": -6.628607273101807, "global_step": 133710, "epoch": 3183} {"train_loss": -6.647979736328125, "global_step": 133711, "epoch": 3183} {"train_loss": -6.547938346862793, "global_step": 133712, "epoch": 3183} {"train_loss": -6.658477306365967, "global_step": 133713, "epoch": 3183} {"train_loss": -6.716835021972656, "global_step": 133714, "epoch": 3183} {"train_loss": -6.613458156585693, "global_step": 133715, "epoch": 3183} {"train_loss": -6.740662097930908, "global_step": 133716, "epoch": 3183} {"train_loss": -6.688887596130371, "global_step": 133717, "epoch": 3183} {"train_loss": -6.5604352951049805, "global_step": 133718, "epoch": 3183} {"train_loss": -6.640905380249023, "global_step": 133719, "epoch": 3183} {"train_loss": -6.561163902282715, "global_step": 133720, "epoch": 3183} {"train_loss": -6.369659900665283, "global_step": 133721, "epoch": 3183} {"train_loss": -6.639765739440918, "global_step": 133722, "epoch": 3183} {"train_loss": -6.668391227722168, "global_step": 133723, "epoch": 3183} {"train_loss": -6.6314496994018555, "global_step": 133724, "epoch": 3183} {"train_loss": -6.513583183288574, "global_step": 133725, "epoch": 3183} {"train_loss": -6.639382362365723, "global_step": 133726, "epoch": 3183} {"train_loss": -6.658870674314953, "global_step": 133727, "epoch": 3183, "val_loss": 66692.8515625} {"train_loss": -6.574858665466309, "global_step": 133728, "epoch": 3184} {"train_loss": -6.771749496459961, "global_step": 133729, "epoch": 3184} {"train_loss": -6.688882827758789, "global_step": 133730, "epoch": 3184} {"train_loss": -6.637759208679199, "global_step": 133731, "epoch": 3184} {"train_loss": -6.7525763511657715, "global_step": 133732, "epoch": 3184} {"train_loss": -6.728361129760742, "global_step": 133733, "epoch": 3184} {"train_loss": -6.746347904205322, "global_step": 133734, "epoch": 3184} {"train_loss": -6.735069274902344, "global_step": 133735, "epoch": 3184} {"train_loss": -6.619179725646973, "global_step": 133736, "epoch": 3184} {"train_loss": -6.6836419105529785, "global_step": 133737, "epoch": 3184} {"train_loss": -6.710637092590332, "global_step": 133738, "epoch": 3184} {"train_loss": -6.845592498779297, "global_step": 133739, "epoch": 3184} {"train_loss": -6.669828414916992, "global_step": 133740, "epoch": 3184} {"train_loss": -6.627386093139648, "global_step": 133741, "epoch": 3184} {"train_loss": -6.695587158203125, "global_step": 133742, "epoch": 3184} {"train_loss": -6.663096904754639, "global_step": 133743, "epoch": 3184} {"train_loss": -6.735861778259277, "global_step": 133744, "epoch": 3184} {"train_loss": -6.586069107055664, "global_step": 133745, "epoch": 3184} {"train_loss": -6.780340671539307, "global_step": 133746, "epoch": 3184} {"train_loss": -6.778021812438965, "global_step": 133747, "epoch": 3184} {"train_loss": -6.5700531005859375, "global_step": 133748, "epoch": 3184} {"train_loss": -6.62615442276001, "global_step": 133749, "epoch": 3184} {"train_loss": -6.632074356079102, "global_step": 133750, "epoch": 3184} {"train_loss": -6.662346363067627, "global_step": 133751, "epoch": 3184} {"train_loss": -6.7954792976379395, "global_step": 133752, "epoch": 3184} {"train_loss": -6.849555492401123, "global_step": 133753, "epoch": 3184} {"train_loss": -6.695959091186523, "global_step": 133754, "epoch": 3184} {"train_loss": -6.794795989990234, "global_step": 133755, "epoch": 3184} {"train_loss": -6.725153923034668, "global_step": 133756, "epoch": 3184} {"train_loss": -6.654217720031738, "global_step": 133757, "epoch": 3184} {"train_loss": -6.637714862823486, "global_step": 133758, "epoch": 3184} {"train_loss": -6.780091285705566, "global_step": 133759, "epoch": 3184} {"train_loss": -6.618678092956543, "global_step": 133760, "epoch": 3184} {"train_loss": -6.711550235748291, "global_step": 133761, "epoch": 3184} {"train_loss": -6.6288957595825195, "global_step": 133762, "epoch": 3184} {"train_loss": -6.863259792327881, "global_step": 133763, "epoch": 3184} {"train_loss": -6.693251609802246, "global_step": 133764, "epoch": 3184} {"train_loss": -6.654804229736328, "global_step": 133765, "epoch": 3184} {"train_loss": -6.773348808288574, "global_step": 133766, "epoch": 3184} {"train_loss": -6.651059150695801, "global_step": 133767, "epoch": 3184} {"train_loss": -6.752018928527832, "global_step": 133768, "epoch": 3184} {"train_loss": -6.702077082225254, "global_step": 133769, "epoch": 3184, "val_loss": 66751.2890625} {"train_loss": -6.770954608917236, "global_step": 133770, "epoch": 3185} {"train_loss": -6.792675018310547, "global_step": 133771, "epoch": 3185} {"train_loss": -6.842179775238037, "global_step": 133772, "epoch": 3185} {"train_loss": -6.715171813964844, "global_step": 133773, "epoch": 3185} {"train_loss": -6.758658409118652, "global_step": 133774, "epoch": 3185} {"train_loss": -6.689217567443848, "global_step": 133775, "epoch": 3185} {"train_loss": -6.774009704589844, "global_step": 133776, "epoch": 3185} {"train_loss": -6.718897819519043, "global_step": 133777, "epoch": 3185} {"train_loss": -6.724231719970703, "global_step": 133778, "epoch": 3185} {"train_loss": -6.7767744064331055, "global_step": 133779, "epoch": 3185} {"train_loss": -6.732214450836182, "global_step": 133780, "epoch": 3185} {"train_loss": -6.612945556640625, "global_step": 133781, "epoch": 3185} {"train_loss": -6.704028606414795, "global_step": 133782, "epoch": 3185} {"train_loss": -6.604776859283447, "global_step": 133783, "epoch": 3185} {"train_loss": -6.542460918426514, "global_step": 133784, "epoch": 3185} {"train_loss": -6.575948715209961, "global_step": 133785, "epoch": 3185} {"train_loss": -6.580373764038086, "global_step": 133786, "epoch": 3185} {"train_loss": -6.732705593109131, "global_step": 133787, "epoch": 3185} {"train_loss": -6.683651924133301, "global_step": 133788, "epoch": 3185} {"train_loss": -6.649634838104248, "global_step": 133789, "epoch": 3185} {"train_loss": -6.625579833984375, "global_step": 133790, "epoch": 3185} {"train_loss": -6.651628017425537, "global_step": 133791, "epoch": 3185} {"train_loss": -6.6251726150512695, "global_step": 133792, "epoch": 3185} {"train_loss": -6.777109146118164, "global_step": 133793, "epoch": 3185} {"train_loss": -6.66707181930542, "global_step": 133794, "epoch": 3185} {"train_loss": -6.745736122131348, "global_step": 133795, "epoch": 3185} {"train_loss": -6.7094526290893555, "global_step": 133796, "epoch": 3185} {"train_loss": -6.705843448638916, "global_step": 133797, "epoch": 3185} {"train_loss": -6.641348838806152, "global_step": 133798, "epoch": 3185} {"train_loss": -6.652891159057617, "global_step": 133799, "epoch": 3185} {"train_loss": -6.715904235839844, "global_step": 133800, "epoch": 3185} {"train_loss": -6.651034355163574, "global_step": 133801, "epoch": 3185} {"train_loss": -6.614107608795166, "global_step": 133802, "epoch": 3185} {"train_loss": -6.658526420593262, "global_step": 133803, "epoch": 3185} {"train_loss": -6.546542167663574, "global_step": 133804, "epoch": 3185} {"train_loss": -6.609336853027344, "global_step": 133805, "epoch": 3185} {"train_loss": -6.637104034423828, "global_step": 133806, "epoch": 3185} {"train_loss": -6.575972080230713, "global_step": 133807, "epoch": 3185} {"train_loss": -6.699960708618164, "global_step": 133808, "epoch": 3185} {"train_loss": -6.555460453033447, "global_step": 133809, "epoch": 3185} {"train_loss": -6.75344181060791, "global_step": 133810, "epoch": 3185} {"train_loss": -6.6790287381126765, "global_step": 133811, "epoch": 3185, "val_loss": 66963.140625} {"train_loss": -6.594849109649658, "global_step": 133812, "epoch": 3186} {"train_loss": -6.7212677001953125, "global_step": 133813, "epoch": 3186} {"train_loss": -6.64070463180542, "global_step": 133814, "epoch": 3186} {"train_loss": -6.809549331665039, "global_step": 133815, "epoch": 3186} {"train_loss": -6.653382301330566, "global_step": 133816, "epoch": 3186} {"train_loss": -6.686357498168945, "global_step": 133817, "epoch": 3186} {"train_loss": -6.716766357421875, "global_step": 133818, "epoch": 3186} {"train_loss": -6.719478607177734, "global_step": 133819, "epoch": 3186} {"train_loss": -6.747489929199219, "global_step": 133820, "epoch": 3186} {"train_loss": -6.677000045776367, "global_step": 133821, "epoch": 3186} {"train_loss": -6.799456596374512, "global_step": 133822, "epoch": 3186} {"train_loss": -6.770977020263672, "global_step": 133823, "epoch": 3186} {"train_loss": -6.620816230773926, "global_step": 133824, "epoch": 3186} {"train_loss": -6.748224258422852, "global_step": 133825, "epoch": 3186} {"train_loss": -6.768248558044434, "global_step": 133826, "epoch": 3186} {"train_loss": -6.75637149810791, "global_step": 133827, "epoch": 3186} {"train_loss": -6.6962480545043945, "global_step": 133828, "epoch": 3186} {"train_loss": -6.657130241394043, "global_step": 133829, "epoch": 3186} {"train_loss": -6.72026252746582, "global_step": 133830, "epoch": 3186} {"train_loss": -6.56917667388916, "global_step": 133831, "epoch": 3186} {"train_loss": -6.707124710083008, "global_step": 133832, "epoch": 3186} {"train_loss": -6.729060173034668, "global_step": 133833, "epoch": 3186} {"train_loss": -6.687903881072998, "global_step": 133834, "epoch": 3186} {"train_loss": -6.695391654968262, "global_step": 133835, "epoch": 3186} {"train_loss": -6.782586097717285, "global_step": 133836, "epoch": 3186} {"train_loss": -6.654585838317871, "global_step": 133837, "epoch": 3186} {"train_loss": -6.6365275382995605, "global_step": 133838, "epoch": 3186} {"train_loss": -6.641120910644531, "global_step": 133839, "epoch": 3186} {"train_loss": -6.852502822875977, "global_step": 133840, "epoch": 3186} {"train_loss": -6.700410842895508, "global_step": 133841, "epoch": 3186} {"train_loss": -6.618832588195801, "global_step": 133842, "epoch": 3186} {"train_loss": -6.661477088928223, "global_step": 133843, "epoch": 3186} {"train_loss": -6.737642288208008, "global_step": 133844, "epoch": 3186} {"train_loss": -6.661869525909424, "global_step": 133845, "epoch": 3186} {"train_loss": -6.635655403137207, "global_step": 133846, "epoch": 3186} {"train_loss": -6.652669906616211, "global_step": 133847, "epoch": 3186} {"train_loss": -6.65140962600708, "global_step": 133848, "epoch": 3186} {"train_loss": -6.772574424743652, "global_step": 133849, "epoch": 3186} {"train_loss": -6.505617618560791, "global_step": 133850, "epoch": 3186} {"train_loss": -6.589692115783691, "global_step": 133851, "epoch": 3186} {"train_loss": -6.679238319396973, "global_step": 133852, "epoch": 3186} {"train_loss": -6.688170478457496, "global_step": 133853, "epoch": 3186, "val_loss": 66682.421875} {"train_loss": -6.720884323120117, "global_step": 133854, "epoch": 3187} {"train_loss": -6.620349884033203, "global_step": 133855, "epoch": 3187} {"train_loss": -6.700876235961914, "global_step": 133856, "epoch": 3187} {"train_loss": -6.675589084625244, "global_step": 133857, "epoch": 3187} {"train_loss": -6.790515899658203, "global_step": 133858, "epoch": 3187} {"train_loss": -6.675764083862305, "global_step": 133859, "epoch": 3187} {"train_loss": -6.652164936065674, "global_step": 133860, "epoch": 3187} {"train_loss": -6.700416564941406, "global_step": 133861, "epoch": 3187} {"train_loss": -6.704623699188232, "global_step": 133862, "epoch": 3187} {"train_loss": -6.638772964477539, "global_step": 133863, "epoch": 3187} {"train_loss": -6.634443283081055, "global_step": 133864, "epoch": 3187} {"train_loss": -6.635964393615723, "global_step": 133865, "epoch": 3187} {"train_loss": -6.679720878601074, "global_step": 133866, "epoch": 3187} {"train_loss": -6.602298259735107, "global_step": 133867, "epoch": 3187} {"train_loss": -6.667936325073242, "global_step": 133868, "epoch": 3187} {"train_loss": -6.627424716949463, "global_step": 133869, "epoch": 3187} {"train_loss": -6.588171005249023, "global_step": 133870, "epoch": 3187} {"train_loss": -6.749383926391602, "global_step": 133871, "epoch": 3187} {"train_loss": -6.696351051330566, "global_step": 133872, "epoch": 3187} {"train_loss": -6.672976016998291, "global_step": 133873, "epoch": 3187} {"train_loss": -6.631312847137451, "global_step": 133874, "epoch": 3187} {"train_loss": -6.702598571777344, "global_step": 133875, "epoch": 3187} {"train_loss": -6.703545570373535, "global_step": 133876, "epoch": 3187} {"train_loss": -6.709449768066406, "global_step": 133877, "epoch": 3187} {"train_loss": -6.860219478607178, "global_step": 133878, "epoch": 3187} {"train_loss": -6.667410373687744, "global_step": 133879, "epoch": 3187} {"train_loss": -6.611623287200928, "global_step": 133880, "epoch": 3187} {"train_loss": -6.661160469055176, "global_step": 133881, "epoch": 3187} {"train_loss": -6.697114944458008, "global_step": 133882, "epoch": 3187} {"train_loss": -6.785254001617432, "global_step": 133883, "epoch": 3187} {"train_loss": -6.891603946685791, "global_step": 133884, "epoch": 3187} {"train_loss": -6.7451982498168945, "global_step": 133885, "epoch": 3187} {"train_loss": -6.736532211303711, "global_step": 133886, "epoch": 3187} {"train_loss": -6.704207420349121, "global_step": 133887, "epoch": 3187} {"train_loss": -6.780834197998047, "global_step": 133888, "epoch": 3187} {"train_loss": -6.737924575805664, "global_step": 133889, "epoch": 3187} {"train_loss": -6.695878982543945, "global_step": 133890, "epoch": 3187} {"train_loss": -6.7010498046875, "global_step": 133891, "epoch": 3187} {"train_loss": -6.58514404296875, "global_step": 133892, "epoch": 3187} {"train_loss": -6.79854679107666, "global_step": 133893, "epoch": 3187} {"train_loss": -6.7601823806762695, "global_step": 133894, "epoch": 3187} {"train_loss": -6.697908276603336, "global_step": 133895, "epoch": 3187, "val_loss": 66968.0078125} {"train_loss": -6.760120868682861, "global_step": 133896, "epoch": 3188} {"train_loss": -6.605008125305176, "global_step": 133897, "epoch": 3188} {"train_loss": -6.572361469268799, "global_step": 133898, "epoch": 3188} {"train_loss": -6.572393894195557, "global_step": 133899, "epoch": 3188} {"train_loss": -6.714224338531494, "global_step": 133900, "epoch": 3188} {"train_loss": -6.677125453948975, "global_step": 133901, "epoch": 3188} {"train_loss": -6.678837299346924, "global_step": 133902, "epoch": 3188} {"train_loss": -6.688813209533691, "global_step": 133903, "epoch": 3188} {"train_loss": -6.729598045349121, "global_step": 133904, "epoch": 3188} {"train_loss": -6.7162556648254395, "global_step": 133905, "epoch": 3188} {"train_loss": -6.690598487854004, "global_step": 133906, "epoch": 3188} {"train_loss": -6.713487148284912, "global_step": 133907, "epoch": 3188} {"train_loss": -6.658967018127441, "global_step": 133908, "epoch": 3188} {"train_loss": -6.619830131530762, "global_step": 133909, "epoch": 3188} {"train_loss": -6.746349334716797, "global_step": 133910, "epoch": 3188} {"train_loss": -6.679533958435059, "global_step": 133911, "epoch": 3188} {"train_loss": -6.69086217880249, "global_step": 133912, "epoch": 3188} {"train_loss": -6.681401252746582, "global_step": 133913, "epoch": 3188} {"train_loss": -6.638650417327881, "global_step": 133914, "epoch": 3188} {"train_loss": -6.676296234130859, "global_step": 133915, "epoch": 3188} {"train_loss": -6.718097686767578, "global_step": 133916, "epoch": 3188} {"train_loss": -6.637509346008301, "global_step": 133917, "epoch": 3188} {"train_loss": -6.8128461837768555, "global_step": 133918, "epoch": 3188} {"train_loss": -6.751090049743652, "global_step": 133919, "epoch": 3188} {"train_loss": -6.660397529602051, "global_step": 133920, "epoch": 3188} {"train_loss": -6.742168426513672, "global_step": 133921, "epoch": 3188} {"train_loss": -6.689752578735352, "global_step": 133922, "epoch": 3188} {"train_loss": -6.768240928649902, "global_step": 133923, "epoch": 3188} {"train_loss": -6.624268531799316, "global_step": 133924, "epoch": 3188} {"train_loss": -6.782949447631836, "global_step": 133925, "epoch": 3188} {"train_loss": -6.781071662902832, "global_step": 133926, "epoch": 3188} {"train_loss": -6.625611305236816, "global_step": 133927, "epoch": 3188} {"train_loss": -6.801963806152344, "global_step": 133928, "epoch": 3188} {"train_loss": -6.70818567276001, "global_step": 133929, "epoch": 3188} {"train_loss": -6.722939491271973, "global_step": 133930, "epoch": 3188} {"train_loss": -6.6491289138793945, "global_step": 133931, "epoch": 3188} {"train_loss": -6.744009971618652, "global_step": 133932, "epoch": 3188} {"train_loss": -6.697096347808838, "global_step": 133933, "epoch": 3188} {"train_loss": -6.724472522735596, "global_step": 133934, "epoch": 3188} {"train_loss": -6.7354865074157715, "global_step": 133935, "epoch": 3188} {"train_loss": -6.830874443054199, "global_step": 133936, "epoch": 3188} {"train_loss": -6.697941064834595, "global_step": 133937, "epoch": 3188, "val_loss": 66918.5234375} {"train_loss": -6.828465461730957, "global_step": 133938, "epoch": 3189} {"train_loss": -6.848101615905762, "global_step": 133939, "epoch": 3189} {"train_loss": -6.636415481567383, "global_step": 133940, "epoch": 3189} {"train_loss": -6.687918663024902, "global_step": 133941, "epoch": 3189} {"train_loss": -6.769149303436279, "global_step": 133942, "epoch": 3189} {"train_loss": -6.767585754394531, "global_step": 133943, "epoch": 3189} {"train_loss": -6.706273078918457, "global_step": 133944, "epoch": 3189} {"train_loss": -6.790290832519531, "global_step": 133945, "epoch": 3189} {"train_loss": -6.728212356567383, "global_step": 133946, "epoch": 3189} {"train_loss": -6.79974365234375, "global_step": 133947, "epoch": 3189} {"train_loss": -6.70603609085083, "global_step": 133948, "epoch": 3189} {"train_loss": -6.726618766784668, "global_step": 133949, "epoch": 3189} {"train_loss": -6.6925578117370605, "global_step": 133950, "epoch": 3189} {"train_loss": -6.783506393432617, "global_step": 133951, "epoch": 3189} {"train_loss": -6.689939498901367, "global_step": 133952, "epoch": 3189} {"train_loss": -6.792296409606934, "global_step": 133953, "epoch": 3189} {"train_loss": -6.686018466949463, "global_step": 133954, "epoch": 3189} {"train_loss": -6.732221603393555, "global_step": 133955, "epoch": 3189} {"train_loss": -6.773408889770508, "global_step": 133956, "epoch": 3189} {"train_loss": -6.720041275024414, "global_step": 133957, "epoch": 3189} {"train_loss": -6.736391067504883, "global_step": 133958, "epoch": 3189} {"train_loss": -6.6820549964904785, "global_step": 133959, "epoch": 3189} {"train_loss": -6.868980407714844, "global_step": 133960, "epoch": 3189} {"train_loss": -6.7420430183410645, "global_step": 133961, "epoch": 3189} {"train_loss": -6.741460800170898, "global_step": 133962, "epoch": 3189} {"train_loss": -6.773205757141113, "global_step": 133963, "epoch": 3189} {"train_loss": -6.823380470275879, "global_step": 133964, "epoch": 3189} {"train_loss": -6.715259075164795, "global_step": 133965, "epoch": 3189} {"train_loss": -6.736784934997559, "global_step": 133966, "epoch": 3189} {"train_loss": -6.716485977172852, "global_step": 133967, "epoch": 3189} {"train_loss": -6.74603271484375, "global_step": 133968, "epoch": 3189} {"train_loss": -6.780757904052734, "global_step": 133969, "epoch": 3189} {"train_loss": -6.630873680114746, "global_step": 133970, "epoch": 3189} {"train_loss": -6.688433647155762, "global_step": 133971, "epoch": 3189} {"train_loss": -6.659743785858154, "global_step": 133972, "epoch": 3189} {"train_loss": -6.717948913574219, "global_step": 133973, "epoch": 3189} {"train_loss": -6.717466354370117, "global_step": 133974, "epoch": 3189} {"train_loss": -6.776294231414795, "global_step": 133975, "epoch": 3189} {"train_loss": -6.871397495269775, "global_step": 133976, "epoch": 3189} {"train_loss": -6.65167760848999, "global_step": 133977, "epoch": 3189} {"train_loss": -6.690649509429932, "global_step": 133978, "epoch": 3189} {"train_loss": -6.738665909994216, "global_step": 133979, "epoch": 3189, "val_loss": 66862.171875} {"train_loss": -6.753681182861328, "global_step": 133980, "epoch": 3190} {"train_loss": -6.655879497528076, "global_step": 133981, "epoch": 3190} {"train_loss": -6.749688148498535, "global_step": 133982, "epoch": 3190} {"train_loss": -6.591453552246094, "global_step": 133983, "epoch": 3190} {"train_loss": -6.65206241607666, "global_step": 133984, "epoch": 3190} {"train_loss": -6.688712120056152, "global_step": 133985, "epoch": 3190} {"train_loss": -6.726184844970703, "global_step": 133986, "epoch": 3190} {"train_loss": -6.535754680633545, "global_step": 133987, "epoch": 3190} {"train_loss": -6.758911609649658, "global_step": 133988, "epoch": 3190} {"train_loss": -6.755642414093018, "global_step": 133989, "epoch": 3190} {"train_loss": -6.737764358520508, "global_step": 133990, "epoch": 3190} {"train_loss": -6.691679000854492, "global_step": 133991, "epoch": 3190} {"train_loss": -6.600744247436523, "global_step": 133992, "epoch": 3190} {"train_loss": -6.713253498077393, "global_step": 133993, "epoch": 3190} {"train_loss": -6.815052509307861, "global_step": 133994, "epoch": 3190} {"train_loss": -6.627753257751465, "global_step": 133995, "epoch": 3190} {"train_loss": -6.690483570098877, "global_step": 133996, "epoch": 3190} {"train_loss": -6.6706647872924805, "global_step": 133997, "epoch": 3190} {"train_loss": -6.678725242614746, "global_step": 133998, "epoch": 3190} {"train_loss": -6.703051567077637, "global_step": 133999, "epoch": 3190} {"train_loss": -6.812105178833008, "global_step": 134000, "epoch": 3190} {"train_loss": -6.753213405609131, "global_step": 134001, "epoch": 3190} {"train_loss": -6.783690452575684, "global_step": 134002, "epoch": 3190} {"train_loss": -6.598889350891113, "global_step": 134003, "epoch": 3190} {"train_loss": -6.617280960083008, "global_step": 134004, "epoch": 3190} {"train_loss": -6.7151899337768555, "global_step": 134005, "epoch": 3190} {"train_loss": -6.6975507736206055, "global_step": 134006, "epoch": 3190} {"train_loss": -6.655142784118652, "global_step": 134007, "epoch": 3190} {"train_loss": -6.773752212524414, "global_step": 134008, "epoch": 3190} {"train_loss": -6.76476526260376, "global_step": 134009, "epoch": 3190} {"train_loss": -6.719437599182129, "global_step": 134010, "epoch": 3190} {"train_loss": -6.641122817993164, "global_step": 134011, "epoch": 3190} {"train_loss": -6.728164196014404, "global_step": 134012, "epoch": 3190} {"train_loss": -6.732723712921143, "global_step": 134013, "epoch": 3190} {"train_loss": -6.658494472503662, "global_step": 134014, "epoch": 3190} {"train_loss": -6.815324783325195, "global_step": 134015, "epoch": 3190} {"train_loss": -6.683941841125488, "global_step": 134016, "epoch": 3190} {"train_loss": -6.679717540740967, "global_step": 134017, "epoch": 3190} {"train_loss": -6.709657669067383, "global_step": 134018, "epoch": 3190} {"train_loss": -6.727588653564453, "global_step": 134019, "epoch": 3190} {"train_loss": -6.714119911193848, "global_step": 134020, "epoch": 3190} {"train_loss": -6.7039848282223655, "global_step": 134021, "epoch": 3190, "val_loss": 66827.3359375} {"train_loss": -6.680245399475098, "global_step": 134022, "epoch": 3191} {"train_loss": -6.6465983390808105, "global_step": 134023, "epoch": 3191} {"train_loss": -6.832005023956299, "global_step": 134024, "epoch": 3191} {"train_loss": -6.71452522277832, "global_step": 134025, "epoch": 3191} {"train_loss": -6.601322650909424, "global_step": 134026, "epoch": 3191} {"train_loss": -6.748474597930908, "global_step": 134027, "epoch": 3191} {"train_loss": -6.652591705322266, "global_step": 134028, "epoch": 3191} {"train_loss": -6.641862869262695, "global_step": 134029, "epoch": 3191} {"train_loss": -6.616987705230713, "global_step": 134030, "epoch": 3191} {"train_loss": -6.730855941772461, "global_step": 134031, "epoch": 3191} {"train_loss": -6.624481201171875, "global_step": 134032, "epoch": 3191} {"train_loss": -6.546059608459473, "global_step": 134033, "epoch": 3191} {"train_loss": -6.665050506591797, "global_step": 134034, "epoch": 3191} {"train_loss": -6.682401657104492, "global_step": 134035, "epoch": 3191} {"train_loss": -6.577210426330566, "global_step": 134036, "epoch": 3191} {"train_loss": -6.777493000030518, "global_step": 134037, "epoch": 3191} {"train_loss": -6.737941741943359, "global_step": 134038, "epoch": 3191} {"train_loss": -6.686607837677002, "global_step": 134039, "epoch": 3191} {"train_loss": -6.67698860168457, "global_step": 134040, "epoch": 3191} {"train_loss": -6.682255744934082, "global_step": 134041, "epoch": 3191} {"train_loss": -6.749290466308594, "global_step": 134042, "epoch": 3191} {"train_loss": -6.705618858337402, "global_step": 134043, "epoch": 3191} {"train_loss": -6.809991836547852, "global_step": 134044, "epoch": 3191} {"train_loss": -6.808436393737793, "global_step": 134045, "epoch": 3191} {"train_loss": -6.710549354553223, "global_step": 134046, "epoch": 3191} {"train_loss": -6.7828216552734375, "global_step": 134047, "epoch": 3191} {"train_loss": -6.68999719619751, "global_step": 134048, "epoch": 3191} {"train_loss": -6.703787803649902, "global_step": 134049, "epoch": 3191} {"train_loss": -6.720241069793701, "global_step": 134050, "epoch": 3191} {"train_loss": -6.609739303588867, "global_step": 134051, "epoch": 3191} {"train_loss": -6.610213279724121, "global_step": 134052, "epoch": 3191} {"train_loss": -6.63840389251709, "global_step": 134053, "epoch": 3191} {"train_loss": -6.780177593231201, "global_step": 134054, "epoch": 3191} {"train_loss": -6.7610859870910645, "global_step": 134055, "epoch": 3191} {"train_loss": -6.591904163360596, "global_step": 134056, "epoch": 3191} {"train_loss": -6.7448015213012695, "global_step": 134057, "epoch": 3191} {"train_loss": -6.639056205749512, "global_step": 134058, "epoch": 3191} {"train_loss": -6.560211658477783, "global_step": 134059, "epoch": 3191} {"train_loss": -6.687962532043457, "global_step": 134060, "epoch": 3191} {"train_loss": -6.583454132080078, "global_step": 134061, "epoch": 3191} {"train_loss": -6.719565391540527, "global_step": 134062, "epoch": 3191} {"train_loss": -6.6868325982775, "global_step": 134063, "epoch": 3191, "val_loss": 66734.0859375} {"train_loss": -6.6323676109313965, "global_step": 134064, "epoch": 3192} {"train_loss": -6.6690778732299805, "global_step": 134065, "epoch": 3192} {"train_loss": -6.581311225891113, "global_step": 134066, "epoch": 3192} {"train_loss": -6.6398162841796875, "global_step": 134067, "epoch": 3192} {"train_loss": -6.675773620605469, "global_step": 134068, "epoch": 3192} {"train_loss": -6.752721786499023, "global_step": 134069, "epoch": 3192} {"train_loss": -6.607118129730225, "global_step": 134070, "epoch": 3192} {"train_loss": -6.728240013122559, "global_step": 134071, "epoch": 3192} {"train_loss": -6.7784037590026855, "global_step": 134072, "epoch": 3192} {"train_loss": -6.652736663818359, "global_step": 134073, "epoch": 3192} {"train_loss": -6.7238616943359375, "global_step": 134074, "epoch": 3192} {"train_loss": -6.6657328605651855, "global_step": 134075, "epoch": 3192} {"train_loss": -6.775477409362793, "global_step": 134076, "epoch": 3192} {"train_loss": -6.837886333465576, "global_step": 134077, "epoch": 3192} {"train_loss": -6.813928604125977, "global_step": 134078, "epoch": 3192} {"train_loss": -6.7450127601623535, "global_step": 134079, "epoch": 3192} {"train_loss": -6.798274040222168, "global_step": 134080, "epoch": 3192} {"train_loss": -6.745373725891113, "global_step": 134081, "epoch": 3192} {"train_loss": -6.769962310791016, "global_step": 134082, "epoch": 3192} {"train_loss": -6.602957248687744, "global_step": 134083, "epoch": 3192} {"train_loss": -6.858051300048828, "global_step": 134084, "epoch": 3192} {"train_loss": -6.635546684265137, "global_step": 134085, "epoch": 3192} {"train_loss": -6.693305015563965, "global_step": 134086, "epoch": 3192} {"train_loss": -6.791274070739746, "global_step": 134087, "epoch": 3192} {"train_loss": -6.72905158996582, "global_step": 134088, "epoch": 3192} {"train_loss": -6.886484622955322, "global_step": 134089, "epoch": 3192} {"train_loss": -6.7977752685546875, "global_step": 134090, "epoch": 3192} {"train_loss": -6.70680046081543, "global_step": 134091, "epoch": 3192} {"train_loss": -6.729150772094727, "global_step": 134092, "epoch": 3192} {"train_loss": -6.736715793609619, "global_step": 134093, "epoch": 3192} {"train_loss": -6.824547290802002, "global_step": 134094, "epoch": 3192} {"train_loss": -6.610051155090332, "global_step": 134095, "epoch": 3192} {"train_loss": -6.8419575691223145, "global_step": 134096, "epoch": 3192} {"train_loss": -6.631563663482666, "global_step": 134097, "epoch": 3192} {"train_loss": -6.732200622558594, "global_step": 134098, "epoch": 3192} {"train_loss": -6.644190311431885, "global_step": 134099, "epoch": 3192} {"train_loss": -6.5843119621276855, "global_step": 134100, "epoch": 3192} {"train_loss": -6.688236236572266, "global_step": 134101, "epoch": 3192} {"train_loss": -6.670209884643555, "global_step": 134102, "epoch": 3192} {"train_loss": -6.557048797607422, "global_step": 134103, "epoch": 3192} {"train_loss": -6.630007743835449, "global_step": 134104, "epoch": 3192} {"train_loss": -6.708336092176891, "global_step": 134105, "epoch": 3192, "val_loss": 66829.234375} {"train_loss": -6.6337151527404785, "global_step": 134106, "epoch": 3193} {"train_loss": -6.846078395843506, "global_step": 134107, "epoch": 3193} {"train_loss": -6.518714904785156, "global_step": 134108, "epoch": 3193} {"train_loss": -6.670715808868408, "global_step": 134109, "epoch": 3193} {"train_loss": -6.537768363952637, "global_step": 134110, "epoch": 3193} {"train_loss": -6.590132713317871, "global_step": 134111, "epoch": 3193} {"train_loss": -6.616975784301758, "global_step": 134112, "epoch": 3193} {"train_loss": -6.6743245124816895, "global_step": 134113, "epoch": 3193} {"train_loss": -6.758047103881836, "global_step": 134114, "epoch": 3193} {"train_loss": -6.694698810577393, "global_step": 134115, "epoch": 3193} {"train_loss": -6.6360321044921875, "global_step": 134116, "epoch": 3193} {"train_loss": -6.684812545776367, "global_step": 134117, "epoch": 3193} {"train_loss": -6.647762298583984, "global_step": 134118, "epoch": 3193} {"train_loss": -6.779731750488281, "global_step": 134119, "epoch": 3193} {"train_loss": -6.713910102844238, "global_step": 134120, "epoch": 3193} {"train_loss": -6.727617263793945, "global_step": 134121, "epoch": 3193} {"train_loss": -6.637449264526367, "global_step": 134122, "epoch": 3193} {"train_loss": -6.62800407409668, "global_step": 134123, "epoch": 3193} {"train_loss": -6.631527423858643, "global_step": 134124, "epoch": 3193} {"train_loss": -6.680629730224609, "global_step": 134125, "epoch": 3193} {"train_loss": -6.678460597991943, "global_step": 134126, "epoch": 3193} {"train_loss": -6.753708839416504, "global_step": 134127, "epoch": 3193} {"train_loss": -6.708823204040527, "global_step": 134128, "epoch": 3193} {"train_loss": -6.763383865356445, "global_step": 134129, "epoch": 3193} {"train_loss": -6.71830940246582, "global_step": 134130, "epoch": 3193} {"train_loss": -6.725387096405029, "global_step": 134131, "epoch": 3193} {"train_loss": -6.7364912033081055, "global_step": 134132, "epoch": 3193} {"train_loss": -6.604705810546875, "global_step": 134133, "epoch": 3193} {"train_loss": -6.674551963806152, "global_step": 134134, "epoch": 3193} {"train_loss": -6.737087249755859, "global_step": 134135, "epoch": 3193} {"train_loss": -6.632054328918457, "global_step": 134136, "epoch": 3193} {"train_loss": -6.711210250854492, "global_step": 134137, "epoch": 3193} {"train_loss": -6.789543628692627, "global_step": 134138, "epoch": 3193} {"train_loss": -6.770435333251953, "global_step": 134139, "epoch": 3193} {"train_loss": -6.660972595214844, "global_step": 134140, "epoch": 3193} {"train_loss": -6.66261625289917, "global_step": 134141, "epoch": 3193} {"train_loss": -6.7408881187438965, "global_step": 134142, "epoch": 3193} {"train_loss": -6.556007385253906, "global_step": 134143, "epoch": 3193} {"train_loss": -6.749519348144531, "global_step": 134144, "epoch": 3193} {"train_loss": -6.659200191497803, "global_step": 134145, "epoch": 3193} {"train_loss": -6.701603412628174, "global_step": 134146, "epoch": 3193} {"train_loss": -6.685938755671184, "global_step": 134147, "epoch": 3193, "val_loss": 67034.53125} {"train_loss": -6.70357608795166, "global_step": 134148, "epoch": 3194} {"train_loss": -6.749398231506348, "global_step": 134149, "epoch": 3194} {"train_loss": -6.746772766113281, "global_step": 134150, "epoch": 3194} {"train_loss": -6.632373809814453, "global_step": 134151, "epoch": 3194} {"train_loss": -6.700924873352051, "global_step": 134152, "epoch": 3194} {"train_loss": -6.846066474914551, "global_step": 134153, "epoch": 3194} {"train_loss": -6.594647407531738, "global_step": 134154, "epoch": 3194} {"train_loss": -6.67239236831665, "global_step": 134155, "epoch": 3194} {"train_loss": -6.809700965881348, "global_step": 134156, "epoch": 3194} {"train_loss": -6.796531677246094, "global_step": 134157, "epoch": 3194} {"train_loss": -6.713555812835693, "global_step": 134158, "epoch": 3194} {"train_loss": -6.725621223449707, "global_step": 134159, "epoch": 3194} {"train_loss": -6.7505621910095215, "global_step": 134160, "epoch": 3194} {"train_loss": -6.6353678703308105, "global_step": 134161, "epoch": 3194} {"train_loss": -6.694024085998535, "global_step": 134162, "epoch": 3194} {"train_loss": -6.6271281242370605, "global_step": 134163, "epoch": 3194} {"train_loss": -6.692324638366699, "global_step": 134164, "epoch": 3194} {"train_loss": -6.507680892944336, "global_step": 134165, "epoch": 3194} {"train_loss": -6.383631706237793, "global_step": 134166, "epoch": 3194} {"train_loss": -6.837486267089844, "global_step": 134167, "epoch": 3194} {"train_loss": -6.60178279876709, "global_step": 134168, "epoch": 3194} {"train_loss": -6.665600299835205, "global_step": 134169, "epoch": 3194} {"train_loss": -6.681887626647949, "global_step": 134170, "epoch": 3194} {"train_loss": -6.6127777099609375, "global_step": 134171, "epoch": 3194} {"train_loss": -6.650249004364014, "global_step": 134172, "epoch": 3194} {"train_loss": -6.7258195877075195, "global_step": 134173, "epoch": 3194} {"train_loss": -6.621062278747559, "global_step": 134174, "epoch": 3194} {"train_loss": -6.768442153930664, "global_step": 134175, "epoch": 3194} {"train_loss": -6.5487565994262695, "global_step": 134176, "epoch": 3194} {"train_loss": -6.690858364105225, "global_step": 134177, "epoch": 3194} {"train_loss": -6.675018310546875, "global_step": 134178, "epoch": 3194} {"train_loss": -6.779209613800049, "global_step": 134179, "epoch": 3194} {"train_loss": -6.759335041046143, "global_step": 134180, "epoch": 3194} {"train_loss": -6.6569671630859375, "global_step": 134181, "epoch": 3194} {"train_loss": -6.725924015045166, "global_step": 134182, "epoch": 3194} {"train_loss": -6.6374006271362305, "global_step": 134183, "epoch": 3194} {"train_loss": -6.663018226623535, "global_step": 134184, "epoch": 3194} {"train_loss": -6.783089637756348, "global_step": 134185, "epoch": 3194} {"train_loss": -6.751500129699707, "global_step": 134186, "epoch": 3194} {"train_loss": -6.554542541503906, "global_step": 134187, "epoch": 3194} {"train_loss": -6.802949905395508, "global_step": 134188, "epoch": 3194} {"train_loss": -6.687510479064215, "global_step": 134189, "epoch": 3194, "val_loss": 66917.390625} {"train_loss": -6.610696315765381, "global_step": 134190, "epoch": 3195} {"train_loss": -6.598171234130859, "global_step": 134191, "epoch": 3195} {"train_loss": -6.636953353881836, "global_step": 134192, "epoch": 3195} {"train_loss": -6.694068908691406, "global_step": 134193, "epoch": 3195} {"train_loss": -6.748019695281982, "global_step": 134194, "epoch": 3195} {"train_loss": -6.565591812133789, "global_step": 134195, "epoch": 3195} {"train_loss": -6.636517524719238, "global_step": 134196, "epoch": 3195} {"train_loss": -6.684987545013428, "global_step": 134197, "epoch": 3195} {"train_loss": -6.6595940589904785, "global_step": 134198, "epoch": 3195} {"train_loss": -6.653460502624512, "global_step": 134199, "epoch": 3195} {"train_loss": -6.604135036468506, "global_step": 134200, "epoch": 3195} {"train_loss": -6.481339454650879, "global_step": 134201, "epoch": 3195} {"train_loss": -6.625406265258789, "global_step": 134202, "epoch": 3195} {"train_loss": -6.774304389953613, "global_step": 134203, "epoch": 3195} {"train_loss": -6.625936508178711, "global_step": 134204, "epoch": 3195} {"train_loss": -6.734575271606445, "global_step": 134205, "epoch": 3195} {"train_loss": -6.64335823059082, "global_step": 134206, "epoch": 3195} {"train_loss": -6.636530876159668, "global_step": 134207, "epoch": 3195} {"train_loss": -6.740119934082031, "global_step": 134208, "epoch": 3195} {"train_loss": -6.590000152587891, "global_step": 134209, "epoch": 3195} {"train_loss": -6.719145774841309, "global_step": 134210, "epoch": 3195} {"train_loss": -6.6683807373046875, "global_step": 134211, "epoch": 3195} {"train_loss": -6.644697189331055, "global_step": 134212, "epoch": 3195} {"train_loss": -6.6460418701171875, "global_step": 134213, "epoch": 3195} {"train_loss": -6.784535884857178, "global_step": 134214, "epoch": 3195} {"train_loss": -6.661175727844238, "global_step": 134215, "epoch": 3195} {"train_loss": -6.749532699584961, "global_step": 134216, "epoch": 3195} {"train_loss": -6.69067907333374, "global_step": 134217, "epoch": 3195} {"train_loss": -6.6729326248168945, "global_step": 134218, "epoch": 3195} {"train_loss": -6.735598564147949, "global_step": 134219, "epoch": 3195} {"train_loss": -6.6732282638549805, "global_step": 134220, "epoch": 3195} {"train_loss": -6.737671852111816, "global_step": 134221, "epoch": 3195} {"train_loss": -6.706768035888672, "global_step": 134222, "epoch": 3195} {"train_loss": -6.746984481811523, "global_step": 134223, "epoch": 3195} {"train_loss": -6.788994789123535, "global_step": 134224, "epoch": 3195} {"train_loss": -6.6343889236450195, "global_step": 134225, "epoch": 3195} {"train_loss": -6.743732452392578, "global_step": 134226, "epoch": 3195} {"train_loss": -6.724314212799072, "global_step": 134227, "epoch": 3195} {"train_loss": -6.770087718963623, "global_step": 134228, "epoch": 3195} {"train_loss": -6.584969520568848, "global_step": 134229, "epoch": 3195} {"train_loss": -6.576218605041504, "global_step": 134230, "epoch": 3195} {"train_loss": -6.675834780647641, "global_step": 134231, "epoch": 3195, "val_loss": 66740.1640625} {"train_loss": -6.577712535858154, "global_step": 134232, "epoch": 3196} {"train_loss": -6.68091344833374, "global_step": 134233, "epoch": 3196} {"train_loss": -6.697751045227051, "global_step": 134234, "epoch": 3196} {"train_loss": -6.623559951782227, "global_step": 134235, "epoch": 3196} {"train_loss": -6.7498931884765625, "global_step": 134236, "epoch": 3196} {"train_loss": -6.661861419677734, "global_step": 134237, "epoch": 3196} {"train_loss": -6.695343017578125, "global_step": 134238, "epoch": 3196} {"train_loss": -6.751733779907227, "global_step": 134239, "epoch": 3196} {"train_loss": -6.747072219848633, "global_step": 134240, "epoch": 3196} {"train_loss": -6.731796741485596, "global_step": 134241, "epoch": 3196} {"train_loss": -6.655673503875732, "global_step": 134242, "epoch": 3196} {"train_loss": -6.841322898864746, "global_step": 134243, "epoch": 3196} {"train_loss": -6.573387145996094, "global_step": 134244, "epoch": 3196} {"train_loss": -6.66043758392334, "global_step": 134245, "epoch": 3196} {"train_loss": -6.680164813995361, "global_step": 134246, "epoch": 3196} {"train_loss": -6.6440911293029785, "global_step": 134247, "epoch": 3196} {"train_loss": -6.613025665283203, "global_step": 134248, "epoch": 3196} {"train_loss": -6.702417850494385, "global_step": 134249, "epoch": 3196} {"train_loss": -6.583890914916992, "global_step": 134250, "epoch": 3196} {"train_loss": -6.546271324157715, "global_step": 134251, "epoch": 3196} {"train_loss": -6.791537761688232, "global_step": 134252, "epoch": 3196} {"train_loss": -6.670439720153809, "global_step": 134253, "epoch": 3196} {"train_loss": -6.5641961097717285, "global_step": 134254, "epoch": 3196} {"train_loss": -6.689270496368408, "global_step": 134255, "epoch": 3196} {"train_loss": -6.636227130889893, "global_step": 134256, "epoch": 3196} {"train_loss": -6.624335289001465, "global_step": 134257, "epoch": 3196} {"train_loss": -6.568323135375977, "global_step": 134258, "epoch": 3196} {"train_loss": -6.590867519378662, "global_step": 134259, "epoch": 3196} {"train_loss": -6.538059234619141, "global_step": 134260, "epoch": 3196} {"train_loss": -6.6216583251953125, "global_step": 134261, "epoch": 3196} {"train_loss": -6.542376518249512, "global_step": 134262, "epoch": 3196} {"train_loss": -6.666860580444336, "global_step": 134263, "epoch": 3196} {"train_loss": -6.669349193572998, "global_step": 134264, "epoch": 3196} {"train_loss": -6.636958599090576, "global_step": 134265, "epoch": 3196} {"train_loss": -6.573452472686768, "global_step": 134266, "epoch": 3196} {"train_loss": -6.589779853820801, "global_step": 134267, "epoch": 3196} {"train_loss": -6.63665246963501, "global_step": 134268, "epoch": 3196} {"train_loss": -6.61440372467041, "global_step": 134269, "epoch": 3196} {"train_loss": -6.638514041900635, "global_step": 134270, "epoch": 3196} {"train_loss": -6.629448890686035, "global_step": 134271, "epoch": 3196} {"train_loss": -6.6274309158325195, "global_step": 134272, "epoch": 3196} {"train_loss": -6.647622358231318, "global_step": 134273, "epoch": 3196, "val_loss": 67298.390625} {"train_loss": -6.638360977172852, "global_step": 134274, "epoch": 3197} {"train_loss": -6.716599941253662, "global_step": 134275, "epoch": 3197} {"train_loss": -6.725286483764648, "global_step": 134276, "epoch": 3197} {"train_loss": -6.674493312835693, "global_step": 134277, "epoch": 3197} {"train_loss": -6.7790069580078125, "global_step": 134278, "epoch": 3197} {"train_loss": -6.739805221557617, "global_step": 134279, "epoch": 3197} {"train_loss": -6.746705055236816, "global_step": 134280, "epoch": 3197} {"train_loss": -6.792725086212158, "global_step": 134281, "epoch": 3197} {"train_loss": -6.697283744812012, "global_step": 134282, "epoch": 3197} {"train_loss": -6.763319492340088, "global_step": 134283, "epoch": 3197} {"train_loss": -6.78998327255249, "global_step": 134284, "epoch": 3197} {"train_loss": -6.729334831237793, "global_step": 134285, "epoch": 3197} {"train_loss": -6.714461326599121, "global_step": 134286, "epoch": 3197} {"train_loss": -6.715880393981934, "global_step": 134287, "epoch": 3197} {"train_loss": -6.759718894958496, "global_step": 134288, "epoch": 3197} {"train_loss": -6.774831771850586, "global_step": 134289, "epoch": 3197} {"train_loss": -6.783475399017334, "global_step": 134290, "epoch": 3197} {"train_loss": -6.761529922485352, "global_step": 134291, "epoch": 3197} {"train_loss": -6.735361099243164, "global_step": 134292, "epoch": 3197} {"train_loss": -6.6251983642578125, "global_step": 134293, "epoch": 3197} {"train_loss": -6.782829284667969, "global_step": 134294, "epoch": 3197} {"train_loss": -6.662933826446533, "global_step": 134295, "epoch": 3197} {"train_loss": -6.695047378540039, "global_step": 134296, "epoch": 3197} {"train_loss": -6.745904445648193, "global_step": 134297, "epoch": 3197} {"train_loss": -6.751607894897461, "global_step": 134298, "epoch": 3197} {"train_loss": -6.618894577026367, "global_step": 134299, "epoch": 3197} {"train_loss": -6.766050338745117, "global_step": 134300, "epoch": 3197} {"train_loss": -6.7353010177612305, "global_step": 134301, "epoch": 3197} {"train_loss": -6.709612846374512, "global_step": 134302, "epoch": 3197} {"train_loss": -6.681334495544434, "global_step": 134303, "epoch": 3197} {"train_loss": -6.760909080505371, "global_step": 134304, "epoch": 3197} {"train_loss": -6.658870697021484, "global_step": 134305, "epoch": 3197} {"train_loss": -6.683072090148926, "global_step": 134306, "epoch": 3197} {"train_loss": -6.695295333862305, "global_step": 134307, "epoch": 3197} {"train_loss": -6.750500679016113, "global_step": 134308, "epoch": 3197} {"train_loss": -6.732289791107178, "global_step": 134309, "epoch": 3197} {"train_loss": -6.738692283630371, "global_step": 134310, "epoch": 3197} {"train_loss": -6.72901725769043, "global_step": 134311, "epoch": 3197} {"train_loss": -6.65893030166626, "global_step": 134312, "epoch": 3197} {"train_loss": -6.69624137878418, "global_step": 134313, "epoch": 3197} {"train_loss": -6.776522636413574, "global_step": 134314, "epoch": 3197} {"train_loss": -6.7250562735966275, "global_step": 134315, "epoch": 3197, "val_loss": 66887.5703125} {"train_loss": -6.747564315795898, "global_step": 134316, "epoch": 3198} {"train_loss": -6.709074974060059, "global_step": 134317, "epoch": 3198} {"train_loss": -6.734628200531006, "global_step": 134318, "epoch": 3198} {"train_loss": -6.742499351501465, "global_step": 134319, "epoch": 3198} {"train_loss": -6.804780960083008, "global_step": 134320, "epoch": 3198} {"train_loss": -6.673957824707031, "global_step": 134321, "epoch": 3198} {"train_loss": -6.50039005279541, "global_step": 134322, "epoch": 3198} {"train_loss": -6.668694496154785, "global_step": 134323, "epoch": 3198} {"train_loss": -6.889711856842041, "global_step": 134324, "epoch": 3198} {"train_loss": -6.720732688903809, "global_step": 134325, "epoch": 3198} {"train_loss": -6.55767297744751, "global_step": 134326, "epoch": 3198} {"train_loss": -6.67172908782959, "global_step": 134327, "epoch": 3198} {"train_loss": -6.644930362701416, "global_step": 134328, "epoch": 3198} {"train_loss": -6.5748291015625, "global_step": 134329, "epoch": 3198} {"train_loss": -6.756475448608398, "global_step": 134330, "epoch": 3198} {"train_loss": -6.7161126136779785, "global_step": 134331, "epoch": 3198} {"train_loss": -6.756163597106934, "global_step": 134332, "epoch": 3198} {"train_loss": -6.688021659851074, "global_step": 134333, "epoch": 3198} {"train_loss": -6.646820068359375, "global_step": 134334, "epoch": 3198} {"train_loss": -6.752508163452148, "global_step": 134335, "epoch": 3198} {"train_loss": -6.620622158050537, "global_step": 134336, "epoch": 3198} {"train_loss": -6.724944591522217, "global_step": 134337, "epoch": 3198} {"train_loss": -6.736021995544434, "global_step": 134338, "epoch": 3198} {"train_loss": -6.6252641677856445, "global_step": 134339, "epoch": 3198} {"train_loss": -6.616390228271484, "global_step": 134340, "epoch": 3198} {"train_loss": -6.693652629852295, "global_step": 134341, "epoch": 3198} {"train_loss": -6.710822105407715, "global_step": 134342, "epoch": 3198} {"train_loss": -6.753860950469971, "global_step": 134343, "epoch": 3198} {"train_loss": -6.759652137756348, "global_step": 134344, "epoch": 3198} {"train_loss": -6.577958106994629, "global_step": 134345, "epoch": 3198} {"train_loss": -6.584137439727783, "global_step": 134346, "epoch": 3198} {"train_loss": -6.690629959106445, "global_step": 134347, "epoch": 3198} {"train_loss": -6.594324588775635, "global_step": 134348, "epoch": 3198} {"train_loss": -6.623588562011719, "global_step": 134349, "epoch": 3198} {"train_loss": -6.539276123046875, "global_step": 134350, "epoch": 3198} {"train_loss": -6.642269611358643, "global_step": 134351, "epoch": 3198} {"train_loss": -6.57398796081543, "global_step": 134352, "epoch": 3198} {"train_loss": -6.610177993774414, "global_step": 134353, "epoch": 3198} {"train_loss": -6.622249126434326, "global_step": 134354, "epoch": 3198} {"train_loss": -6.613768577575684, "global_step": 134355, "epoch": 3198} {"train_loss": -6.611605644226074, "global_step": 134356, "epoch": 3198} {"train_loss": -6.669402837753296, "global_step": 134357, "epoch": 3198, "val_loss": 67022.6953125} {"train_loss": -6.695216655731201, "global_step": 134358, "epoch": 3199} {"train_loss": -6.607301712036133, "global_step": 134359, "epoch": 3199} {"train_loss": -6.766541481018066, "global_step": 134360, "epoch": 3199} {"train_loss": -6.610462188720703, "global_step": 134361, "epoch": 3199} {"train_loss": -6.665244102478027, "global_step": 134362, "epoch": 3199} {"train_loss": -6.614589691162109, "global_step": 134363, "epoch": 3199} {"train_loss": -6.677600860595703, "global_step": 134364, "epoch": 3199} {"train_loss": -6.676913261413574, "global_step": 134365, "epoch": 3199} {"train_loss": -6.635187149047852, "global_step": 134366, "epoch": 3199} {"train_loss": -6.728960990905762, "global_step": 134367, "epoch": 3199} {"train_loss": -6.63931131362915, "global_step": 134368, "epoch": 3199} {"train_loss": -6.767711639404297, "global_step": 134369, "epoch": 3199} {"train_loss": -6.6695356369018555, "global_step": 134370, "epoch": 3199} {"train_loss": -6.759864330291748, "global_step": 134371, "epoch": 3199} {"train_loss": -6.633232116699219, "global_step": 134372, "epoch": 3199} {"train_loss": -6.592086315155029, "global_step": 134373, "epoch": 3199} {"train_loss": -6.755076885223389, "global_step": 134374, "epoch": 3199} {"train_loss": -6.761153697967529, "global_step": 134375, "epoch": 3199} {"train_loss": -6.73148250579834, "global_step": 134376, "epoch": 3199} {"train_loss": -6.494205474853516, "global_step": 134377, "epoch": 3199} {"train_loss": -6.702964782714844, "global_step": 134378, "epoch": 3199} {"train_loss": -6.725086688995361, "global_step": 134379, "epoch": 3199} {"train_loss": -6.696388244628906, "global_step": 134380, "epoch": 3199} {"train_loss": -6.710379600524902, "global_step": 134381, "epoch": 3199} {"train_loss": -6.59553337097168, "global_step": 134382, "epoch": 3199} {"train_loss": -6.62505578994751, "global_step": 134383, "epoch": 3199} {"train_loss": -6.7154316902160645, "global_step": 134384, "epoch": 3199} {"train_loss": -6.626805305480957, "global_step": 134385, "epoch": 3199} {"train_loss": -6.740355968475342, "global_step": 134386, "epoch": 3199} {"train_loss": -6.697843551635742, "global_step": 134387, "epoch": 3199} {"train_loss": -6.64393424987793, "global_step": 134388, "epoch": 3199} {"train_loss": -6.694411754608154, "global_step": 134389, "epoch": 3199} {"train_loss": -6.801672458648682, "global_step": 134390, "epoch": 3199} {"train_loss": -6.639019966125488, "global_step": 134391, "epoch": 3199} {"train_loss": -6.560063362121582, "global_step": 134392, "epoch": 3199} {"train_loss": -6.83198356628418, "global_step": 134393, "epoch": 3199} {"train_loss": -6.659465789794922, "global_step": 134394, "epoch": 3199} {"train_loss": -6.703732013702393, "global_step": 134395, "epoch": 3199} {"train_loss": -6.6424689292907715, "global_step": 134396, "epoch": 3199} {"train_loss": -6.644306659698486, "global_step": 134397, "epoch": 3199} {"train_loss": -6.83454704284668, "global_step": 134398, "epoch": 3199} {"train_loss": -6.682843957628522, "global_step": 134399, "epoch": 3199, "val_loss": 66962.59375} {"train_loss": -6.849787712097168, "global_step": 134400, "epoch": 3200} {"train_loss": -6.769815444946289, "global_step": 134401, "epoch": 3200} {"train_loss": -6.798708438873291, "global_step": 134402, "epoch": 3200} {"train_loss": -6.667636871337891, "global_step": 134403, "epoch": 3200} {"train_loss": -6.824265956878662, "global_step": 134404, "epoch": 3200} {"train_loss": -6.729403495788574, "global_step": 134405, "epoch": 3200} {"train_loss": -6.764084815979004, "global_step": 134406, "epoch": 3200} {"train_loss": -6.76593017578125, "global_step": 134407, "epoch": 3200} {"train_loss": -6.732634544372559, "global_step": 134408, "epoch": 3200} {"train_loss": -6.796088218688965, "global_step": 134409, "epoch": 3200} {"train_loss": -6.752958297729492, "global_step": 134410, "epoch": 3200} {"train_loss": -6.933024883270264, "global_step": 134411, "epoch": 3200} {"train_loss": -6.812089920043945, "global_step": 134412, "epoch": 3200} {"train_loss": -6.754786014556885, "global_step": 134413, "epoch": 3200} {"train_loss": -6.772914886474609, "global_step": 134414, "epoch": 3200} {"train_loss": -6.728552341461182, "global_step": 134415, "epoch": 3200} {"train_loss": -6.679242134094238, "global_step": 134416, "epoch": 3200} {"train_loss": -6.703770160675049, "global_step": 134417, "epoch": 3200} {"train_loss": -6.798284530639648, "global_step": 134418, "epoch": 3200} {"train_loss": -6.73655891418457, "global_step": 134419, "epoch": 3200} {"train_loss": -6.692747116088867, "global_step": 134420, "epoch": 3200} {"train_loss": -6.763891696929932, "global_step": 134421, "epoch": 3200} {"train_loss": -6.709728240966797, "global_step": 134422, "epoch": 3200} {"train_loss": -6.755845546722412, "global_step": 134423, "epoch": 3200} {"train_loss": -6.726629257202148, "global_step": 134424, "epoch": 3200} {"train_loss": -6.7021331787109375, "global_step": 134425, "epoch": 3200} {"train_loss": -6.8157639503479, "global_step": 134426, "epoch": 3200} {"train_loss": -6.750836372375488, "global_step": 134427, "epoch": 3200} {"train_loss": -6.631030082702637, "global_step": 134428, "epoch": 3200} {"train_loss": -6.633450031280518, "global_step": 134429, "epoch": 3200} {"train_loss": -6.7137532234191895, "global_step": 134430, "epoch": 3200} {"train_loss": -6.602256774902344, "global_step": 134431, "epoch": 3200} {"train_loss": -6.7337846755981445, "global_step": 134432, "epoch": 3200} {"train_loss": -6.638966083526611, "global_step": 134433, "epoch": 3200} {"train_loss": -6.70644474029541, "global_step": 134434, "epoch": 3200} {"train_loss": -6.725169658660889, "global_step": 134435, "epoch": 3200} {"train_loss": -6.6309356689453125, "global_step": 134436, "epoch": 3200} {"train_loss": -6.715897083282471, "global_step": 134437, "epoch": 3200} {"train_loss": -6.773822784423828, "global_step": 134438, "epoch": 3200} {"train_loss": -6.686514854431152, "global_step": 134439, "epoch": 3200} {"train_loss": -6.7864274978637695, "global_step": 134440, "epoch": 3200} {"train_loss": -6.7407881532396585, "global_step": 134441, "epoch": 3200, "train/sim_max_reward_0": 0.1916537094074233, "train/sim_max_reward_1": 0.9528465414173161, "train/sim_max_reward_2": 0.5426264185301973, "train/sim_max_reward_3": 0.3962790520443081, "train/sim_max_reward_4": 0.8339422812753852, "train/sim_max_reward_5": 0.2890376066073436, "test/sim_max_reward_4300000": 0.013628093070725225, "test/sim_max_reward_4300001": 0.3927801915239976, "test/sim_max_reward_4300002": 0.9805958263317613, "test/sim_max_reward_4300003": 0.9068910875928478, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9573599957793473, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.37704612500558016, "test/sim_max_reward_4300008": 0.9354793248393359, "test/sim_max_reward_4300009": 0.9875357461578694, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.9811601803983206, "test/sim_max_reward_4300013": 0.9975869032629789, "test/sim_max_reward_4300014": 0.9951421294107328, "test/sim_max_reward_4300015": 0.9860942920666511, "test/sim_max_reward_4300016": 0.9574669859418005, "test/sim_max_reward_4300017": 0.9368828054749294, "test/sim_max_reward_4300018": 0.41576818547713534, "test/sim_max_reward_4300019": 0.18347356671596415, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8386991448919531, "test/sim_max_reward_4300022": 0.9469071570344633, "test/sim_max_reward_4300023": 0.32661783674075584, "test/sim_max_reward_4300024": 0.9352924129969873, "test/sim_max_reward_4300025": 0.9680531144397106, "test/sim_max_reward_4300026": 0.2551564706117039, "test/sim_max_reward_4300027": 0.9612650833132147, "test/sim_max_reward_4300028": 0.9700186806113235, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.9512157363379053, "test/sim_max_reward_4300031": 0.21082477221822327, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.7237478994718297, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.7803818556632167, "test/sim_max_reward_4300036": 0.20253834933855278, "test/sim_max_reward_4300037": 0.9796586568760729, "test/sim_max_reward_4300038": 0.9649920406119776, "test/sim_max_reward_4300039": 0.3905710778575516, "test/sim_max_reward_4300040": 0.4877399367516338, "test/sim_max_reward_4300041": 0.952498398470196, "test/sim_max_reward_4300042": 0.879893484842585, "test/sim_max_reward_4300043": 0.1675610955910604, "test/sim_max_reward_4300044": 0.8069852361043296, "test/sim_max_reward_4300045": 0.9495596282979342, "test/sim_max_reward_4300046": 0.0, "test/sim_max_reward_4300047": 0.11020298222603099, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.2361014303124659, "train/mean_score": 0.5343976015469956, "test/mean_score": 0.6003441605094189, "val_loss": 66743.0078125} {"train_loss": -6.794766426086426, "global_step": 134442, "epoch": 3201} {"train_loss": -6.806793212890625, "global_step": 134443, "epoch": 3201} {"train_loss": -6.741006851196289, "global_step": 134444, "epoch": 3201} {"train_loss": -6.799915313720703, "global_step": 134445, "epoch": 3201} {"train_loss": -6.746238708496094, "global_step": 134446, "epoch": 3201} {"train_loss": -6.645853519439697, "global_step": 134447, "epoch": 3201} {"train_loss": -6.732125282287598, "global_step": 134448, "epoch": 3201} {"train_loss": -6.808144569396973, "global_step": 134449, "epoch": 3201} {"train_loss": -6.865765571594238, "global_step": 134450, "epoch": 3201} {"train_loss": -6.762068748474121, "global_step": 134451, "epoch": 3201} {"train_loss": -6.83869743347168, "global_step": 134452, "epoch": 3201} {"train_loss": -6.749324798583984, "global_step": 134453, "epoch": 3201} {"train_loss": -6.833732604980469, "global_step": 134454, "epoch": 3201} {"train_loss": -6.800278663635254, "global_step": 134455, "epoch": 3201} {"train_loss": -6.722965240478516, "global_step": 134456, "epoch": 3201} {"train_loss": -6.783595085144043, "global_step": 134457, "epoch": 3201} {"train_loss": -6.716835021972656, "global_step": 134458, "epoch": 3201} {"train_loss": -6.665081977844238, "global_step": 134459, "epoch": 3201} {"train_loss": -6.752091884613037, "global_step": 134460, "epoch": 3201} {"train_loss": -6.71572732925415, "global_step": 134461, "epoch": 3201} {"train_loss": -6.610691547393799, "global_step": 134462, "epoch": 3201} {"train_loss": -6.691180229187012, "global_step": 134463, "epoch": 3201} {"train_loss": -6.667140007019043, "global_step": 134464, "epoch": 3201} {"train_loss": -6.664668083190918, "global_step": 134465, "epoch": 3201} {"train_loss": -6.716647624969482, "global_step": 134466, "epoch": 3201} {"train_loss": -6.730992317199707, "global_step": 134467, "epoch": 3201} {"train_loss": -6.800049781799316, "global_step": 134468, "epoch": 3201} {"train_loss": -6.723774433135986, "global_step": 134469, "epoch": 3201} {"train_loss": -6.617400646209717, "global_step": 134470, "epoch": 3201} {"train_loss": -6.718780994415283, "global_step": 134471, "epoch": 3201} {"train_loss": -6.819316864013672, "global_step": 134472, "epoch": 3201} {"train_loss": -6.63395881652832, "global_step": 134473, "epoch": 3201} {"train_loss": -6.708391189575195, "global_step": 134474, "epoch": 3201} {"train_loss": -6.68760871887207, "global_step": 134475, "epoch": 3201} {"train_loss": -6.633601188659668, "global_step": 134476, "epoch": 3201} {"train_loss": -6.672183990478516, "global_step": 134477, "epoch": 3201} {"train_loss": -6.692383766174316, "global_step": 134478, "epoch": 3201} {"train_loss": -6.65380334854126, "global_step": 134479, "epoch": 3201} {"train_loss": -6.610252857208252, "global_step": 134480, "epoch": 3201} {"train_loss": -6.752331733703613, "global_step": 134481, "epoch": 3201} {"train_loss": -6.598820209503174, "global_step": 134482, "epoch": 3201} {"train_loss": -6.725197996412005, "global_step": 134483, "epoch": 3201, "val_loss": 66836.8984375} {"train_loss": -6.7362236976623535, "global_step": 134484, "epoch": 3202} {"train_loss": -6.715816497802734, "global_step": 134485, "epoch": 3202} {"train_loss": -6.765167236328125, "global_step": 134486, "epoch": 3202} {"train_loss": -6.7987165451049805, "global_step": 134487, "epoch": 3202} {"train_loss": -6.731427192687988, "global_step": 134488, "epoch": 3202} {"train_loss": -6.76624870300293, "global_step": 134489, "epoch": 3202} {"train_loss": -6.707305908203125, "global_step": 134490, "epoch": 3202} {"train_loss": -6.7035369873046875, "global_step": 134491, "epoch": 3202} {"train_loss": -6.596994876861572, "global_step": 134492, "epoch": 3202} {"train_loss": -6.5424065589904785, "global_step": 134493, "epoch": 3202} {"train_loss": -6.763144493103027, "global_step": 134494, "epoch": 3202} {"train_loss": -6.679582595825195, "global_step": 134495, "epoch": 3202} {"train_loss": -6.596382141113281, "global_step": 134496, "epoch": 3202} {"train_loss": -6.707093238830566, "global_step": 134497, "epoch": 3202} {"train_loss": -6.608155250549316, "global_step": 134498, "epoch": 3202} {"train_loss": -6.689455032348633, "global_step": 134499, "epoch": 3202} {"train_loss": -6.65180778503418, "global_step": 134500, "epoch": 3202} {"train_loss": -6.677104473114014, "global_step": 134501, "epoch": 3202} {"train_loss": -6.698033332824707, "global_step": 134502, "epoch": 3202} {"train_loss": -6.712676048278809, "global_step": 134503, "epoch": 3202} {"train_loss": -6.710394859313965, "global_step": 134504, "epoch": 3202} {"train_loss": -6.756735801696777, "global_step": 134505, "epoch": 3202} {"train_loss": -6.736433982849121, "global_step": 134506, "epoch": 3202} {"train_loss": -6.693330764770508, "global_step": 134507, "epoch": 3202} {"train_loss": -6.716352462768555, "global_step": 134508, "epoch": 3202} {"train_loss": -6.70344352722168, "global_step": 134509, "epoch": 3202} {"train_loss": -6.8164262771606445, "global_step": 134510, "epoch": 3202} {"train_loss": -6.644808292388916, "global_step": 134511, "epoch": 3202} {"train_loss": -6.767330646514893, "global_step": 134512, "epoch": 3202} {"train_loss": -6.749993324279785, "global_step": 134513, "epoch": 3202} {"train_loss": -6.641956329345703, "global_step": 134514, "epoch": 3202} {"train_loss": -6.608700752258301, "global_step": 134515, "epoch": 3202} {"train_loss": -6.748961448669434, "global_step": 134516, "epoch": 3202} {"train_loss": -6.542449951171875, "global_step": 134517, "epoch": 3202} {"train_loss": -6.61159610748291, "global_step": 134518, "epoch": 3202} {"train_loss": -6.687327861785889, "global_step": 134519, "epoch": 3202} {"train_loss": -6.580516815185547, "global_step": 134520, "epoch": 3202} {"train_loss": -6.607345104217529, "global_step": 134521, "epoch": 3202} {"train_loss": -6.710116863250732, "global_step": 134522, "epoch": 3202} {"train_loss": -6.643737316131592, "global_step": 134523, "epoch": 3202} {"train_loss": -6.626051425933838, "global_step": 134524, "epoch": 3202} {"train_loss": -6.689194747379848, "global_step": 134525, "epoch": 3202, "val_loss": 66917.7890625} {"train_loss": -6.710566520690918, "global_step": 134526, "epoch": 3203} {"train_loss": -6.760614395141602, "global_step": 134527, "epoch": 3203} {"train_loss": -6.649385929107666, "global_step": 134528, "epoch": 3203} {"train_loss": -6.707770347595215, "global_step": 134529, "epoch": 3203} {"train_loss": -6.769467353820801, "global_step": 134530, "epoch": 3203} {"train_loss": -6.703374862670898, "global_step": 134531, "epoch": 3203} {"train_loss": -6.715666770935059, "global_step": 134532, "epoch": 3203} {"train_loss": -6.719625473022461, "global_step": 134533, "epoch": 3203} {"train_loss": -6.781001091003418, "global_step": 134534, "epoch": 3203} {"train_loss": -6.775225639343262, "global_step": 134535, "epoch": 3203} {"train_loss": -6.748595237731934, "global_step": 134536, "epoch": 3203} {"train_loss": -6.705565929412842, "global_step": 134537, "epoch": 3203} {"train_loss": -6.793747901916504, "global_step": 134538, "epoch": 3203} {"train_loss": -6.77851676940918, "global_step": 134539, "epoch": 3203} {"train_loss": -6.675433158874512, "global_step": 134540, "epoch": 3203} {"train_loss": -6.730760097503662, "global_step": 134541, "epoch": 3203} {"train_loss": -6.798479080200195, "global_step": 134542, "epoch": 3203} {"train_loss": -6.747577667236328, "global_step": 134543, "epoch": 3203} {"train_loss": -6.830357074737549, "global_step": 134544, "epoch": 3203} {"train_loss": -6.7447919845581055, "global_step": 134545, "epoch": 3203} {"train_loss": -6.690383434295654, "global_step": 134546, "epoch": 3203} {"train_loss": -6.884157657623291, "global_step": 134547, "epoch": 3203} {"train_loss": -6.7015485763549805, "global_step": 134548, "epoch": 3203} {"train_loss": -6.7160444259643555, "global_step": 134549, "epoch": 3203} {"train_loss": -6.82581901550293, "global_step": 134550, "epoch": 3203} {"train_loss": -6.723552703857422, "global_step": 134551, "epoch": 3203} {"train_loss": -6.7675371170043945, "global_step": 134552, "epoch": 3203} {"train_loss": -6.754217147827148, "global_step": 134553, "epoch": 3203} {"train_loss": -6.717825889587402, "global_step": 134554, "epoch": 3203} {"train_loss": -6.749946117401123, "global_step": 134555, "epoch": 3203} {"train_loss": -6.735176086425781, "global_step": 134556, "epoch": 3203} {"train_loss": -6.647968292236328, "global_step": 134557, "epoch": 3203} {"train_loss": -6.689964294433594, "global_step": 134558, "epoch": 3203} {"train_loss": -6.6292901039123535, "global_step": 134559, "epoch": 3203} {"train_loss": -6.734676361083984, "global_step": 134560, "epoch": 3203} {"train_loss": -6.530618667602539, "global_step": 134561, "epoch": 3203} {"train_loss": -6.528100967407227, "global_step": 134562, "epoch": 3203} {"train_loss": -6.693795680999756, "global_step": 134563, "epoch": 3203} {"train_loss": -6.538472652435303, "global_step": 134564, "epoch": 3203} {"train_loss": -6.517452239990234, "global_step": 134565, "epoch": 3203} {"train_loss": -6.716438293457031, "global_step": 134566, "epoch": 3203} {"train_loss": -6.715754406792777, "global_step": 134567, "epoch": 3203, "val_loss": 66931.0546875} {"train_loss": -6.689531326293945, "global_step": 134568, "epoch": 3204} {"train_loss": -6.584546089172363, "global_step": 134569, "epoch": 3204} {"train_loss": -6.527296543121338, "global_step": 134570, "epoch": 3204} {"train_loss": -6.608760833740234, "global_step": 134571, "epoch": 3204} {"train_loss": -6.584074974060059, "global_step": 134572, "epoch": 3204} {"train_loss": -6.686371803283691, "global_step": 134573, "epoch": 3204} {"train_loss": -6.541291236877441, "global_step": 134574, "epoch": 3204} {"train_loss": -6.674342632293701, "global_step": 134575, "epoch": 3204} {"train_loss": -6.727974891662598, "global_step": 134576, "epoch": 3204} {"train_loss": -6.6113667488098145, "global_step": 134577, "epoch": 3204} {"train_loss": -6.575631618499756, "global_step": 134578, "epoch": 3204} {"train_loss": -6.705377101898193, "global_step": 134579, "epoch": 3204} {"train_loss": -6.606302261352539, "global_step": 134580, "epoch": 3204} {"train_loss": -6.616660118103027, "global_step": 134581, "epoch": 3204} {"train_loss": -6.726999759674072, "global_step": 134582, "epoch": 3204} {"train_loss": -6.619093894958496, "global_step": 134583, "epoch": 3204} {"train_loss": -6.639033317565918, "global_step": 134584, "epoch": 3204} {"train_loss": -6.643152713775635, "global_step": 134585, "epoch": 3204} {"train_loss": -6.699105262756348, "global_step": 134586, "epoch": 3204} {"train_loss": -6.649149417877197, "global_step": 134587, "epoch": 3204} {"train_loss": -6.733118057250977, "global_step": 134588, "epoch": 3204} {"train_loss": -6.6808061599731445, "global_step": 134589, "epoch": 3204} {"train_loss": -6.595209121704102, "global_step": 134590, "epoch": 3204} {"train_loss": -6.773975849151611, "global_step": 134591, "epoch": 3204} {"train_loss": -6.6743574142456055, "global_step": 134592, "epoch": 3204} {"train_loss": -6.646063804626465, "global_step": 134593, "epoch": 3204} {"train_loss": -6.826983451843262, "global_step": 134594, "epoch": 3204} {"train_loss": -6.730721950531006, "global_step": 134595, "epoch": 3204} {"train_loss": -6.838520050048828, "global_step": 134596, "epoch": 3204} {"train_loss": -6.76128625869751, "global_step": 134597, "epoch": 3204} {"train_loss": -6.859714508056641, "global_step": 134598, "epoch": 3204} {"train_loss": -6.767864227294922, "global_step": 134599, "epoch": 3204} {"train_loss": -6.758210182189941, "global_step": 134600, "epoch": 3204} {"train_loss": -6.685833930969238, "global_step": 134601, "epoch": 3204} {"train_loss": -6.768677711486816, "global_step": 134602, "epoch": 3204} {"train_loss": -6.84061861038208, "global_step": 134603, "epoch": 3204} {"train_loss": -6.680892467498779, "global_step": 134604, "epoch": 3204} {"train_loss": -6.703485012054443, "global_step": 134605, "epoch": 3204} {"train_loss": -6.7118940353393555, "global_step": 134606, "epoch": 3204} {"train_loss": -6.697059631347656, "global_step": 134607, "epoch": 3204} {"train_loss": -6.768085479736328, "global_step": 134608, "epoch": 3204} {"train_loss": -6.689660185859317, "global_step": 134609, "epoch": 3204, "val_loss": 66851.1796875} {"train_loss": -6.834701061248779, "global_step": 134610, "epoch": 3205} {"train_loss": -6.73967170715332, "global_step": 134611, "epoch": 3205} {"train_loss": -6.85478401184082, "global_step": 134612, "epoch": 3205} {"train_loss": -6.674644470214844, "global_step": 134613, "epoch": 3205} {"train_loss": -6.845460891723633, "global_step": 134614, "epoch": 3205} {"train_loss": -6.726173400878906, "global_step": 134615, "epoch": 3205} {"train_loss": -6.862720489501953, "global_step": 134616, "epoch": 3205} {"train_loss": -6.806858062744141, "global_step": 134617, "epoch": 3205} {"train_loss": -6.752079010009766, "global_step": 134618, "epoch": 3205} {"train_loss": -6.680323600769043, "global_step": 134619, "epoch": 3205} {"train_loss": -6.807526588439941, "global_step": 134620, "epoch": 3205} {"train_loss": -6.81290340423584, "global_step": 134621, "epoch": 3205} {"train_loss": -6.738049030303955, "global_step": 134622, "epoch": 3205} {"train_loss": -6.681189060211182, "global_step": 134623, "epoch": 3205} {"train_loss": -6.697947978973389, "global_step": 134624, "epoch": 3205} {"train_loss": -6.847592353820801, "global_step": 134625, "epoch": 3205} {"train_loss": -6.791864395141602, "global_step": 134626, "epoch": 3205} {"train_loss": -6.749636650085449, "global_step": 134627, "epoch": 3205} {"train_loss": -6.704625129699707, "global_step": 134628, "epoch": 3205} {"train_loss": -6.68575382232666, "global_step": 134629, "epoch": 3205} {"train_loss": -6.717015743255615, "global_step": 134630, "epoch": 3205} {"train_loss": -6.717681884765625, "global_step": 134631, "epoch": 3205} {"train_loss": -6.806378364562988, "global_step": 134632, "epoch": 3205} {"train_loss": -6.6142988204956055, "global_step": 134633, "epoch": 3205} {"train_loss": -6.717256546020508, "global_step": 134634, "epoch": 3205} {"train_loss": -6.736749649047852, "global_step": 134635, "epoch": 3205} {"train_loss": -6.711475849151611, "global_step": 134636, "epoch": 3205} {"train_loss": -6.623350620269775, "global_step": 134637, "epoch": 3205} {"train_loss": -6.487894058227539, "global_step": 134638, "epoch": 3205} {"train_loss": -6.631583213806152, "global_step": 134639, "epoch": 3205} {"train_loss": -6.755691051483154, "global_step": 134640, "epoch": 3205} {"train_loss": -6.651079177856445, "global_step": 134641, "epoch": 3205} {"train_loss": -6.564127445220947, "global_step": 134642, "epoch": 3205} {"train_loss": -6.614378929138184, "global_step": 134643, "epoch": 3205} {"train_loss": -6.662302017211914, "global_step": 134644, "epoch": 3205} {"train_loss": -6.667806625366211, "global_step": 134645, "epoch": 3205} {"train_loss": -6.679107666015625, "global_step": 134646, "epoch": 3205} {"train_loss": -6.795653343200684, "global_step": 134647, "epoch": 3205} {"train_loss": -6.629619121551514, "global_step": 134648, "epoch": 3205} {"train_loss": -6.701602935791016, "global_step": 134649, "epoch": 3205} {"train_loss": -6.7249603271484375, "global_step": 134650, "epoch": 3205} {"train_loss": -6.719323510215396, "global_step": 134651, "epoch": 3205, "val_loss": 66796.6640625} {"train_loss": -6.694524765014648, "global_step": 134652, "epoch": 3206} {"train_loss": -6.763304710388184, "global_step": 134653, "epoch": 3206} {"train_loss": -6.68979549407959, "global_step": 134654, "epoch": 3206} {"train_loss": -6.754100799560547, "global_step": 134655, "epoch": 3206} {"train_loss": -6.658510208129883, "global_step": 134656, "epoch": 3206} {"train_loss": -6.8105692863464355, "global_step": 134657, "epoch": 3206} {"train_loss": -6.641609191894531, "global_step": 134658, "epoch": 3206} {"train_loss": -6.592313766479492, "global_step": 134659, "epoch": 3206} {"train_loss": -6.543538570404053, "global_step": 134660, "epoch": 3206} {"train_loss": -6.77131462097168, "global_step": 134661, "epoch": 3206} {"train_loss": -6.613924980163574, "global_step": 134662, "epoch": 3206} {"train_loss": -6.7151570320129395, "global_step": 134663, "epoch": 3206} {"train_loss": -6.653356075286865, "global_step": 134664, "epoch": 3206} {"train_loss": -6.756691932678223, "global_step": 134665, "epoch": 3206} {"train_loss": -6.659630298614502, "global_step": 134666, "epoch": 3206} {"train_loss": -6.644907474517822, "global_step": 134667, "epoch": 3206} {"train_loss": -6.68988037109375, "global_step": 134668, "epoch": 3206} {"train_loss": -6.699143409729004, "global_step": 134669, "epoch": 3206} {"train_loss": -6.801103115081787, "global_step": 134670, "epoch": 3206} {"train_loss": -6.690041542053223, "global_step": 134671, "epoch": 3206} {"train_loss": -6.710641860961914, "global_step": 134672, "epoch": 3206} {"train_loss": -6.603013515472412, "global_step": 134673, "epoch": 3206} {"train_loss": -6.510018348693848, "global_step": 134674, "epoch": 3206} {"train_loss": -6.638420104980469, "global_step": 134675, "epoch": 3206} {"train_loss": -6.55983829498291, "global_step": 134676, "epoch": 3206} {"train_loss": -6.662644386291504, "global_step": 134677, "epoch": 3206} {"train_loss": -6.60489559173584, "global_step": 134678, "epoch": 3206} {"train_loss": -6.740047931671143, "global_step": 134679, "epoch": 3206} {"train_loss": -6.603135585784912, "global_step": 134680, "epoch": 3206} {"train_loss": -6.772905349731445, "global_step": 134681, "epoch": 3206} {"train_loss": -6.718593597412109, "global_step": 134682, "epoch": 3206} {"train_loss": -6.616565227508545, "global_step": 134683, "epoch": 3206} {"train_loss": -6.706645965576172, "global_step": 134684, "epoch": 3206} {"train_loss": -6.554576396942139, "global_step": 134685, "epoch": 3206} {"train_loss": -6.648832321166992, "global_step": 134686, "epoch": 3206} {"train_loss": -6.6082000732421875, "global_step": 134687, "epoch": 3206} {"train_loss": -6.6935319900512695, "global_step": 134688, "epoch": 3206} {"train_loss": -6.618904113769531, "global_step": 134689, "epoch": 3206} {"train_loss": -6.658412933349609, "global_step": 134690, "epoch": 3206} {"train_loss": -6.604809761047363, "global_step": 134691, "epoch": 3206} {"train_loss": -6.581204891204834, "global_step": 134692, "epoch": 3206} {"train_loss": -6.661614202317738, "global_step": 134693, "epoch": 3206, "val_loss": 66973.1953125} {"train_loss": -6.712593078613281, "global_step": 134694, "epoch": 3207} {"train_loss": -6.691471099853516, "global_step": 134695, "epoch": 3207} {"train_loss": -6.512073516845703, "global_step": 134696, "epoch": 3207} {"train_loss": -6.668668746948242, "global_step": 134697, "epoch": 3207} {"train_loss": -6.763679504394531, "global_step": 134698, "epoch": 3207} {"train_loss": -6.701157569885254, "global_step": 134699, "epoch": 3207} {"train_loss": -6.722979545593262, "global_step": 134700, "epoch": 3207} {"train_loss": -6.75423526763916, "global_step": 134701, "epoch": 3207} {"train_loss": -6.592168807983398, "global_step": 134702, "epoch": 3207} {"train_loss": -6.761194229125977, "global_step": 134703, "epoch": 3207} {"train_loss": -6.735350608825684, "global_step": 134704, "epoch": 3207} {"train_loss": -6.714018821716309, "global_step": 134705, "epoch": 3207} {"train_loss": -6.726818084716797, "global_step": 134706, "epoch": 3207} {"train_loss": -6.688112258911133, "global_step": 134707, "epoch": 3207} {"train_loss": -6.695788383483887, "global_step": 134708, "epoch": 3207} {"train_loss": -6.724920749664307, "global_step": 134709, "epoch": 3207} {"train_loss": -6.821056842803955, "global_step": 134710, "epoch": 3207} {"train_loss": -6.836529731750488, "global_step": 134711, "epoch": 3207} {"train_loss": -6.747217178344727, "global_step": 134712, "epoch": 3207} {"train_loss": -6.72535514831543, "global_step": 134713, "epoch": 3207} {"train_loss": -6.768529891967773, "global_step": 134714, "epoch": 3207} {"train_loss": -6.812893867492676, "global_step": 134715, "epoch": 3207} {"train_loss": -6.796358585357666, "global_step": 134716, "epoch": 3207} {"train_loss": -6.775542259216309, "global_step": 134717, "epoch": 3207} {"train_loss": -6.651302337646484, "global_step": 134718, "epoch": 3207} {"train_loss": -6.710114479064941, "global_step": 134719, "epoch": 3207} {"train_loss": -6.775883674621582, "global_step": 134720, "epoch": 3207} {"train_loss": -6.777512073516846, "global_step": 134721, "epoch": 3207} {"train_loss": -6.795454025268555, "global_step": 134722, "epoch": 3207} {"train_loss": -6.745025634765625, "global_step": 134723, "epoch": 3207} {"train_loss": -6.766107559204102, "global_step": 134724, "epoch": 3207} {"train_loss": -6.683811187744141, "global_step": 134725, "epoch": 3207} {"train_loss": -6.734194755554199, "global_step": 134726, "epoch": 3207} {"train_loss": -6.694644451141357, "global_step": 134727, "epoch": 3207} {"train_loss": -6.715263843536377, "global_step": 134728, "epoch": 3207} {"train_loss": -6.637574195861816, "global_step": 134729, "epoch": 3207} {"train_loss": -6.65812873840332, "global_step": 134730, "epoch": 3207} {"train_loss": -6.661407470703125, "global_step": 134731, "epoch": 3207} {"train_loss": -6.754355430603027, "global_step": 134732, "epoch": 3207} {"train_loss": -6.6642303466796875, "global_step": 134733, "epoch": 3207} {"train_loss": -6.69488525390625, "global_step": 134734, "epoch": 3207} {"train_loss": -6.7206088815416605, "global_step": 134735, "epoch": 3207, "val_loss": 66918.6015625} {"train_loss": -6.7934465408325195, "global_step": 134736, "epoch": 3208} {"train_loss": -6.566279411315918, "global_step": 134737, "epoch": 3208} {"train_loss": -6.820892333984375, "global_step": 134738, "epoch": 3208} {"train_loss": -6.778207302093506, "global_step": 134739, "epoch": 3208} {"train_loss": -6.706486701965332, "global_step": 134740, "epoch": 3208} {"train_loss": -6.72186279296875, "global_step": 134741, "epoch": 3208} {"train_loss": -6.70018196105957, "global_step": 134742, "epoch": 3208} {"train_loss": -6.6434550285339355, "global_step": 134743, "epoch": 3208} {"train_loss": -6.754161357879639, "global_step": 134744, "epoch": 3208} {"train_loss": -6.730374813079834, "global_step": 134745, "epoch": 3208} {"train_loss": -6.607249736785889, "global_step": 134746, "epoch": 3208} {"train_loss": -6.785325527191162, "global_step": 134747, "epoch": 3208} {"train_loss": -6.786868572235107, "global_step": 134748, "epoch": 3208} {"train_loss": -6.771426200866699, "global_step": 134749, "epoch": 3208} {"train_loss": -6.767012596130371, "global_step": 134750, "epoch": 3208} {"train_loss": -6.665304660797119, "global_step": 134751, "epoch": 3208} {"train_loss": -6.734993934631348, "global_step": 134752, "epoch": 3208} {"train_loss": -6.675759315490723, "global_step": 134753, "epoch": 3208} {"train_loss": -6.6887030601501465, "global_step": 134754, "epoch": 3208} {"train_loss": -6.629019737243652, "global_step": 134755, "epoch": 3208} {"train_loss": -6.751442909240723, "global_step": 134756, "epoch": 3208} {"train_loss": -6.652219772338867, "global_step": 134757, "epoch": 3208} {"train_loss": -6.673601150512695, "global_step": 134758, "epoch": 3208} {"train_loss": -6.6619391441345215, "global_step": 134759, "epoch": 3208} {"train_loss": -6.700809478759766, "global_step": 134760, "epoch": 3208} {"train_loss": -6.79636812210083, "global_step": 134761, "epoch": 3208} {"train_loss": -6.693482398986816, "global_step": 134762, "epoch": 3208} {"train_loss": -6.745962142944336, "global_step": 134763, "epoch": 3208} {"train_loss": -6.843776702880859, "global_step": 134764, "epoch": 3208} {"train_loss": -6.724724292755127, "global_step": 134765, "epoch": 3208} {"train_loss": -6.815810203552246, "global_step": 134766, "epoch": 3208} {"train_loss": -6.709733486175537, "global_step": 134767, "epoch": 3208} {"train_loss": -6.745038986206055, "global_step": 134768, "epoch": 3208} {"train_loss": -6.731925964355469, "global_step": 134769, "epoch": 3208} {"train_loss": -6.670827865600586, "global_step": 134770, "epoch": 3208} {"train_loss": -6.653557777404785, "global_step": 134771, "epoch": 3208} {"train_loss": -6.670368671417236, "global_step": 134772, "epoch": 3208} {"train_loss": -6.640649795532227, "global_step": 134773, "epoch": 3208} {"train_loss": -6.737112522125244, "global_step": 134774, "epoch": 3208} {"train_loss": -6.659592628479004, "global_step": 134775, "epoch": 3208} {"train_loss": -6.782480716705322, "global_step": 134776, "epoch": 3208} {"train_loss": -6.716895580291748, "global_step": 134777, "epoch": 3208, "val_loss": 66859.0234375} {"train_loss": -6.731744766235352, "global_step": 134778, "epoch": 3209} {"train_loss": -6.741238117218018, "global_step": 134779, "epoch": 3209} {"train_loss": -6.687767505645752, "global_step": 134780, "epoch": 3209} {"train_loss": -6.783751487731934, "global_step": 134781, "epoch": 3209} {"train_loss": -6.768093585968018, "global_step": 134782, "epoch": 3209} {"train_loss": -6.774564743041992, "global_step": 134783, "epoch": 3209} {"train_loss": -6.791326522827148, "global_step": 134784, "epoch": 3209} {"train_loss": -6.830504417419434, "global_step": 134785, "epoch": 3209} {"train_loss": -6.727109909057617, "global_step": 134786, "epoch": 3209} {"train_loss": -6.734649181365967, "global_step": 134787, "epoch": 3209} {"train_loss": -6.799041748046875, "global_step": 134788, "epoch": 3209} {"train_loss": -6.686705589294434, "global_step": 134789, "epoch": 3209} {"train_loss": -6.690239906311035, "global_step": 134790, "epoch": 3209} {"train_loss": -6.821244716644287, "global_step": 134791, "epoch": 3209} {"train_loss": -6.620588302612305, "global_step": 134792, "epoch": 3209} {"train_loss": -6.643959045410156, "global_step": 134793, "epoch": 3209} {"train_loss": -6.744391441345215, "global_step": 134794, "epoch": 3209} {"train_loss": -6.579091548919678, "global_step": 134795, "epoch": 3209} {"train_loss": -6.586973667144775, "global_step": 134796, "epoch": 3209} {"train_loss": -6.630220413208008, "global_step": 134797, "epoch": 3209} {"train_loss": -6.6303558349609375, "global_step": 134798, "epoch": 3209} {"train_loss": -6.6832122802734375, "global_step": 134799, "epoch": 3209} {"train_loss": -6.601845741271973, "global_step": 134800, "epoch": 3209} {"train_loss": -6.776531219482422, "global_step": 134801, "epoch": 3209} {"train_loss": -6.574158668518066, "global_step": 134802, "epoch": 3209} {"train_loss": -6.567776679992676, "global_step": 134803, "epoch": 3209} {"train_loss": -6.509030818939209, "global_step": 134804, "epoch": 3209} {"train_loss": -6.601456642150879, "global_step": 134805, "epoch": 3209} {"train_loss": -6.501441478729248, "global_step": 134806, "epoch": 3209} {"train_loss": -6.595543384552002, "global_step": 134807, "epoch": 3209} {"train_loss": -6.650969982147217, "global_step": 134808, "epoch": 3209} {"train_loss": -6.474818229675293, "global_step": 134809, "epoch": 3209} {"train_loss": -6.659749984741211, "global_step": 134810, "epoch": 3209} {"train_loss": -6.55963134765625, "global_step": 134811, "epoch": 3209} {"train_loss": -6.634212017059326, "global_step": 134812, "epoch": 3209} {"train_loss": -6.724985122680664, "global_step": 134813, "epoch": 3209} {"train_loss": -6.600526332855225, "global_step": 134814, "epoch": 3209} {"train_loss": -6.460474014282227, "global_step": 134815, "epoch": 3209} {"train_loss": -6.5085272789001465, "global_step": 134816, "epoch": 3209} {"train_loss": -6.611484527587891, "global_step": 134817, "epoch": 3209} {"train_loss": -6.490856170654297, "global_step": 134818, "epoch": 3209} {"train_loss": -6.652859029315767, "global_step": 134819, "epoch": 3209, "val_loss": 66944.4296875} {"train_loss": -6.778386116027832, "global_step": 134820, "epoch": 3210} {"train_loss": -6.677828788757324, "global_step": 134821, "epoch": 3210} {"train_loss": -6.685598373413086, "global_step": 134822, "epoch": 3210} {"train_loss": -6.770699501037598, "global_step": 134823, "epoch": 3210} {"train_loss": -6.659921169281006, "global_step": 134824, "epoch": 3210} {"train_loss": -6.773623943328857, "global_step": 134825, "epoch": 3210} {"train_loss": -6.82996129989624, "global_step": 134826, "epoch": 3210} {"train_loss": -6.602643966674805, "global_step": 134827, "epoch": 3210} {"train_loss": -6.836738109588623, "global_step": 134828, "epoch": 3210} {"train_loss": -6.658748626708984, "global_step": 134829, "epoch": 3210} {"train_loss": -6.728735446929932, "global_step": 134830, "epoch": 3210} {"train_loss": -6.728863716125488, "global_step": 134831, "epoch": 3210} {"train_loss": -6.66633415222168, "global_step": 134832, "epoch": 3210} {"train_loss": -6.726850509643555, "global_step": 134833, "epoch": 3210} {"train_loss": -6.72331428527832, "global_step": 134834, "epoch": 3210} {"train_loss": -6.716376304626465, "global_step": 134835, "epoch": 3210} {"train_loss": -6.691781520843506, "global_step": 134836, "epoch": 3210} {"train_loss": -6.690481185913086, "global_step": 134837, "epoch": 3210} {"train_loss": -6.686664581298828, "global_step": 134838, "epoch": 3210} {"train_loss": -6.680878162384033, "global_step": 134839, "epoch": 3210} {"train_loss": -6.7154154777526855, "global_step": 134840, "epoch": 3210} {"train_loss": -6.768013954162598, "global_step": 134841, "epoch": 3210} {"train_loss": -6.838099479675293, "global_step": 134842, "epoch": 3210} {"train_loss": -6.768402099609375, "global_step": 134843, "epoch": 3210} {"train_loss": -6.658060550689697, "global_step": 134844, "epoch": 3210} {"train_loss": -6.662286758422852, "global_step": 134845, "epoch": 3210} {"train_loss": -6.729172706604004, "global_step": 134846, "epoch": 3210} {"train_loss": -6.70088529586792, "global_step": 134847, "epoch": 3210} {"train_loss": -6.804441452026367, "global_step": 134848, "epoch": 3210} {"train_loss": -6.69221305847168, "global_step": 134849, "epoch": 3210} {"train_loss": -6.708283424377441, "global_step": 134850, "epoch": 3210} {"train_loss": -6.769392013549805, "global_step": 134851, "epoch": 3210} {"train_loss": -6.794232368469238, "global_step": 134852, "epoch": 3210} {"train_loss": -6.694338798522949, "global_step": 134853, "epoch": 3210} {"train_loss": -6.691966533660889, "global_step": 134854, "epoch": 3210} {"train_loss": -6.691677093505859, "global_step": 134855, "epoch": 3210} {"train_loss": -6.53370475769043, "global_step": 134856, "epoch": 3210} {"train_loss": -6.628868579864502, "global_step": 134857, "epoch": 3210} {"train_loss": -6.602304935455322, "global_step": 134858, "epoch": 3210} {"train_loss": -6.703891754150391, "global_step": 134859, "epoch": 3210} {"train_loss": -6.790749549865723, "global_step": 134860, "epoch": 3210} {"train_loss": -6.7103135358719594, "global_step": 134861, "epoch": 3210, "val_loss": 67053.3125} {"train_loss": -6.742673873901367, "global_step": 134862, "epoch": 3211} {"train_loss": -6.727874755859375, "global_step": 134863, "epoch": 3211} {"train_loss": -6.783433437347412, "global_step": 134864, "epoch": 3211} {"train_loss": -6.745670318603516, "global_step": 134865, "epoch": 3211} {"train_loss": -6.672711372375488, "global_step": 134866, "epoch": 3211} {"train_loss": -6.721316337585449, "global_step": 134867, "epoch": 3211} {"train_loss": -6.776705741882324, "global_step": 134868, "epoch": 3211} {"train_loss": -6.696788787841797, "global_step": 134869, "epoch": 3211} {"train_loss": -6.776098251342773, "global_step": 134870, "epoch": 3211} {"train_loss": -6.712069988250732, "global_step": 134871, "epoch": 3211} {"train_loss": -6.737027168273926, "global_step": 134872, "epoch": 3211} {"train_loss": -6.773329734802246, "global_step": 134873, "epoch": 3211} {"train_loss": -6.706315994262695, "global_step": 134874, "epoch": 3211} {"train_loss": -6.647213935852051, "global_step": 134875, "epoch": 3211} {"train_loss": -6.645172119140625, "global_step": 134876, "epoch": 3211} {"train_loss": -6.6863837242126465, "global_step": 134877, "epoch": 3211} {"train_loss": -6.7167510986328125, "global_step": 134878, "epoch": 3211} {"train_loss": -6.651216506958008, "global_step": 134879, "epoch": 3211} {"train_loss": -6.783005237579346, "global_step": 134880, "epoch": 3211} {"train_loss": -6.523240089416504, "global_step": 134881, "epoch": 3211} {"train_loss": -6.608980178833008, "global_step": 134882, "epoch": 3211} {"train_loss": -6.4663190841674805, "global_step": 134883, "epoch": 3211} {"train_loss": -6.507802963256836, "global_step": 134884, "epoch": 3211} {"train_loss": -6.7237935066223145, "global_step": 134885, "epoch": 3211} {"train_loss": -6.48187255859375, "global_step": 134886, "epoch": 3211} {"train_loss": -6.723141193389893, "global_step": 134887, "epoch": 3211} {"train_loss": -6.637857437133789, "global_step": 134888, "epoch": 3211} {"train_loss": -6.696722984313965, "global_step": 134889, "epoch": 3211} {"train_loss": -6.646293640136719, "global_step": 134890, "epoch": 3211} {"train_loss": -6.792282581329346, "global_step": 134891, "epoch": 3211} {"train_loss": -6.685125350952148, "global_step": 134892, "epoch": 3211} {"train_loss": -6.777795791625977, "global_step": 134893, "epoch": 3211} {"train_loss": -6.6692657470703125, "global_step": 134894, "epoch": 3211} {"train_loss": -6.647922515869141, "global_step": 134895, "epoch": 3211} {"train_loss": -6.737776756286621, "global_step": 134896, "epoch": 3211} {"train_loss": -6.539078712463379, "global_step": 134897, "epoch": 3211} {"train_loss": -6.620870590209961, "global_step": 134898, "epoch": 3211} {"train_loss": -6.567846775054932, "global_step": 134899, "epoch": 3211} {"train_loss": -6.813536643981934, "global_step": 134900, "epoch": 3211} {"train_loss": -6.7082085609436035, "global_step": 134901, "epoch": 3211} {"train_loss": -6.697563648223877, "global_step": 134902, "epoch": 3211} {"train_loss": -6.686544077736991, "global_step": 134903, "epoch": 3211, "val_loss": 66848.734375} {"train_loss": -6.769804000854492, "global_step": 134904, "epoch": 3212} {"train_loss": -6.717106819152832, "global_step": 134905, "epoch": 3212} {"train_loss": -6.699692726135254, "global_step": 134906, "epoch": 3212} {"train_loss": -6.792115211486816, "global_step": 134907, "epoch": 3212} {"train_loss": -6.791924476623535, "global_step": 134908, "epoch": 3212} {"train_loss": -6.6908159255981445, "global_step": 134909, "epoch": 3212} {"train_loss": -6.614985942840576, "global_step": 134910, "epoch": 3212} {"train_loss": -6.841116428375244, "global_step": 134911, "epoch": 3212} {"train_loss": -6.701164245605469, "global_step": 134912, "epoch": 3212} {"train_loss": -6.819154262542725, "global_step": 134913, "epoch": 3212} {"train_loss": -6.794776439666748, "global_step": 134914, "epoch": 3212} {"train_loss": -6.634956359863281, "global_step": 134915, "epoch": 3212} {"train_loss": -6.630714416503906, "global_step": 134916, "epoch": 3212} {"train_loss": -6.628614902496338, "global_step": 134917, "epoch": 3212} {"train_loss": -6.724018096923828, "global_step": 134918, "epoch": 3212} {"train_loss": -6.705305099487305, "global_step": 134919, "epoch": 3212} {"train_loss": -6.644808292388916, "global_step": 134920, "epoch": 3212} {"train_loss": -6.6454176902771, "global_step": 134921, "epoch": 3212} {"train_loss": -6.741057395935059, "global_step": 134922, "epoch": 3212} {"train_loss": -6.639236927032471, "global_step": 134923, "epoch": 3212} {"train_loss": -6.788818359375, "global_step": 134924, "epoch": 3212} {"train_loss": -6.628850936889648, "global_step": 134925, "epoch": 3212} {"train_loss": -6.689047813415527, "global_step": 134926, "epoch": 3212} {"train_loss": -6.7645111083984375, "global_step": 134927, "epoch": 3212} {"train_loss": -6.724844455718994, "global_step": 134928, "epoch": 3212} {"train_loss": -6.694662570953369, "global_step": 134929, "epoch": 3212} {"train_loss": -6.743685722351074, "global_step": 134930, "epoch": 3212} {"train_loss": -6.636879920959473, "global_step": 134931, "epoch": 3212} {"train_loss": -6.803196907043457, "global_step": 134932, "epoch": 3212} {"train_loss": -6.652873992919922, "global_step": 134933, "epoch": 3212} {"train_loss": -6.661225318908691, "global_step": 134934, "epoch": 3212} {"train_loss": -6.6828460693359375, "global_step": 134935, "epoch": 3212} {"train_loss": -6.772121906280518, "global_step": 134936, "epoch": 3212} {"train_loss": -6.74961519241333, "global_step": 134937, "epoch": 3212} {"train_loss": -6.759706497192383, "global_step": 134938, "epoch": 3212} {"train_loss": -6.761626243591309, "global_step": 134939, "epoch": 3212} {"train_loss": -6.683493614196777, "global_step": 134940, "epoch": 3212} {"train_loss": -6.7544169425964355, "global_step": 134941, "epoch": 3212} {"train_loss": -6.711284160614014, "global_step": 134942, "epoch": 3212} {"train_loss": -6.785015106201172, "global_step": 134943, "epoch": 3212} {"train_loss": -6.719457149505615, "global_step": 134944, "epoch": 3212} {"train_loss": -6.717316797801426, "global_step": 134945, "epoch": 3212, "val_loss": 66895.7734375} {"train_loss": -6.820204734802246, "global_step": 134946, "epoch": 3213} {"train_loss": -6.748795986175537, "global_step": 134947, "epoch": 3213} {"train_loss": -6.722261428833008, "global_step": 134948, "epoch": 3213} {"train_loss": -6.819549560546875, "global_step": 134949, "epoch": 3213} {"train_loss": -6.78547477722168, "global_step": 134950, "epoch": 3213} {"train_loss": -6.735410213470459, "global_step": 134951, "epoch": 3213} {"train_loss": -6.777525424957275, "global_step": 134952, "epoch": 3213} {"train_loss": -6.7881622314453125, "global_step": 134953, "epoch": 3213} {"train_loss": -6.73879337310791, "global_step": 134954, "epoch": 3213} {"train_loss": -6.767395496368408, "global_step": 134955, "epoch": 3213} {"train_loss": -6.867572784423828, "global_step": 134956, "epoch": 3213} {"train_loss": -6.716519832611084, "global_step": 134957, "epoch": 3213} {"train_loss": -6.814207077026367, "global_step": 134958, "epoch": 3213} {"train_loss": -6.797672271728516, "global_step": 134959, "epoch": 3213} {"train_loss": -6.749729156494141, "global_step": 134960, "epoch": 3213} {"train_loss": -6.733027458190918, "global_step": 134961, "epoch": 3213} {"train_loss": -6.674492835998535, "global_step": 134962, "epoch": 3213} {"train_loss": -6.583531379699707, "global_step": 134963, "epoch": 3213} {"train_loss": -6.79263973236084, "global_step": 134964, "epoch": 3213} {"train_loss": -6.754395484924316, "global_step": 134965, "epoch": 3213} {"train_loss": -6.686766624450684, "global_step": 134966, "epoch": 3213} {"train_loss": -6.7215776443481445, "global_step": 134967, "epoch": 3213} {"train_loss": -6.631094932556152, "global_step": 134968, "epoch": 3213} {"train_loss": -6.674011707305908, "global_step": 134969, "epoch": 3213} {"train_loss": -6.790778636932373, "global_step": 134970, "epoch": 3213} {"train_loss": -6.720458507537842, "global_step": 134971, "epoch": 3213} {"train_loss": -6.789431571960449, "global_step": 134972, "epoch": 3213} {"train_loss": -6.840693473815918, "global_step": 134973, "epoch": 3213} {"train_loss": -6.660058498382568, "global_step": 134974, "epoch": 3213} {"train_loss": -6.777535438537598, "global_step": 134975, "epoch": 3213} {"train_loss": -6.680253028869629, "global_step": 134976, "epoch": 3213} {"train_loss": -6.757962226867676, "global_step": 134977, "epoch": 3213} {"train_loss": -6.702897071838379, "global_step": 134978, "epoch": 3213} {"train_loss": -6.602160930633545, "global_step": 134979, "epoch": 3213} {"train_loss": -6.807441711425781, "global_step": 134980, "epoch": 3213} {"train_loss": -6.613563537597656, "global_step": 134981, "epoch": 3213} {"train_loss": -6.7120866775512695, "global_step": 134982, "epoch": 3213} {"train_loss": -6.754452705383301, "global_step": 134983, "epoch": 3213} {"train_loss": -6.7060651779174805, "global_step": 134984, "epoch": 3213} {"train_loss": -6.722360610961914, "global_step": 134985, "epoch": 3213} {"train_loss": -6.703268051147461, "global_step": 134986, "epoch": 3213} {"train_loss": -6.734677008220127, "global_step": 134987, "epoch": 3213, "val_loss": 66965.2421875} {"train_loss": -6.720907211303711, "global_step": 134988, "epoch": 3214} {"train_loss": -6.707280158996582, "global_step": 134989, "epoch": 3214} {"train_loss": -6.621251106262207, "global_step": 134990, "epoch": 3214} {"train_loss": -6.753244400024414, "global_step": 134991, "epoch": 3214} {"train_loss": -6.807452201843262, "global_step": 134992, "epoch": 3214} {"train_loss": -6.817428112030029, "global_step": 134993, "epoch": 3214} {"train_loss": -6.713702201843262, "global_step": 134994, "epoch": 3214} {"train_loss": -6.7101030349731445, "global_step": 134995, "epoch": 3214} {"train_loss": -6.648491382598877, "global_step": 134996, "epoch": 3214} {"train_loss": -6.813246726989746, "global_step": 134997, "epoch": 3214} {"train_loss": -6.647212505340576, "global_step": 134998, "epoch": 3214} {"train_loss": -6.730057716369629, "global_step": 134999, "epoch": 3214} {"train_loss": -6.726839542388916, "global_step": 135000, "epoch": 3214} {"train_loss": -6.707976341247559, "global_step": 135001, "epoch": 3214} {"train_loss": -6.710726737976074, "global_step": 135002, "epoch": 3214} {"train_loss": -6.660600662231445, "global_step": 135003, "epoch": 3214} {"train_loss": -6.666537284851074, "global_step": 135004, "epoch": 3214} {"train_loss": -6.752245903015137, "global_step": 135005, "epoch": 3214} {"train_loss": -6.734891414642334, "global_step": 135006, "epoch": 3214} {"train_loss": -6.750860214233398, "global_step": 135007, "epoch": 3214} {"train_loss": -6.7892746925354, "global_step": 135008, "epoch": 3214} {"train_loss": -6.703126907348633, "global_step": 135009, "epoch": 3214} {"train_loss": -6.7113752365112305, "global_step": 135010, "epoch": 3214} {"train_loss": -6.6934404373168945, "global_step": 135011, "epoch": 3214} {"train_loss": -6.674942970275879, "global_step": 135012, "epoch": 3214} {"train_loss": -6.793169021606445, "global_step": 135013, "epoch": 3214} {"train_loss": -6.702930927276611, "global_step": 135014, "epoch": 3214} {"train_loss": -6.710964202880859, "global_step": 135015, "epoch": 3214} {"train_loss": -6.742541313171387, "global_step": 135016, "epoch": 3214} {"train_loss": -6.614118576049805, "global_step": 135017, "epoch": 3214} {"train_loss": -6.730579376220703, "global_step": 135018, "epoch": 3214} {"train_loss": -6.606399059295654, "global_step": 135019, "epoch": 3214} {"train_loss": -6.635405540466309, "global_step": 135020, "epoch": 3214} {"train_loss": -6.695640563964844, "global_step": 135021, "epoch": 3214} {"train_loss": -6.6481170654296875, "global_step": 135022, "epoch": 3214} {"train_loss": -6.536312103271484, "global_step": 135023, "epoch": 3214} {"train_loss": -6.616515159606934, "global_step": 135024, "epoch": 3214} {"train_loss": -6.666226387023926, "global_step": 135025, "epoch": 3214} {"train_loss": -6.565618991851807, "global_step": 135026, "epoch": 3214} {"train_loss": -6.663977146148682, "global_step": 135027, "epoch": 3214} {"train_loss": -6.581929683685303, "global_step": 135028, "epoch": 3214} {"train_loss": -6.693056810469854, "global_step": 135029, "epoch": 3214, "val_loss": 66942.5546875} {"train_loss": -6.595256805419922, "global_step": 135030, "epoch": 3215} {"train_loss": -6.587343215942383, "global_step": 135031, "epoch": 3215} {"train_loss": -6.6583333015441895, "global_step": 135032, "epoch": 3215} {"train_loss": -6.71134090423584, "global_step": 135033, "epoch": 3215} {"train_loss": -6.651074409484863, "global_step": 135034, "epoch": 3215} {"train_loss": -6.708957672119141, "global_step": 135035, "epoch": 3215} {"train_loss": -6.669881820678711, "global_step": 135036, "epoch": 3215} {"train_loss": -6.713841438293457, "global_step": 135037, "epoch": 3215} {"train_loss": -6.6803202629089355, "global_step": 135038, "epoch": 3215} {"train_loss": -6.641191482543945, "global_step": 135039, "epoch": 3215} {"train_loss": -6.813826084136963, "global_step": 135040, "epoch": 3215} {"train_loss": -6.647784233093262, "global_step": 135041, "epoch": 3215} {"train_loss": -6.714712142944336, "global_step": 135042, "epoch": 3215} {"train_loss": -6.695298671722412, "global_step": 135043, "epoch": 3215} {"train_loss": -6.683346271514893, "global_step": 135044, "epoch": 3215} {"train_loss": -6.762796401977539, "global_step": 135045, "epoch": 3215} {"train_loss": -6.767219066619873, "global_step": 135046, "epoch": 3215} {"train_loss": -6.619708061218262, "global_step": 135047, "epoch": 3215} {"train_loss": -6.624835014343262, "global_step": 135048, "epoch": 3215} {"train_loss": -6.744150638580322, "global_step": 135049, "epoch": 3215} {"train_loss": -6.533652305603027, "global_step": 135050, "epoch": 3215} {"train_loss": -6.652777671813965, "global_step": 135051, "epoch": 3215} {"train_loss": -6.7412109375, "global_step": 135052, "epoch": 3215} {"train_loss": -6.703693389892578, "global_step": 135053, "epoch": 3215} {"train_loss": -6.707901477813721, "global_step": 135054, "epoch": 3215} {"train_loss": -6.702703475952148, "global_step": 135055, "epoch": 3215} {"train_loss": -6.778929710388184, "global_step": 135056, "epoch": 3215} {"train_loss": -6.581443786621094, "global_step": 135057, "epoch": 3215} {"train_loss": -6.816711902618408, "global_step": 135058, "epoch": 3215} {"train_loss": -6.736868858337402, "global_step": 135059, "epoch": 3215} {"train_loss": -6.552213191986084, "global_step": 135060, "epoch": 3215} {"train_loss": -6.616629600524902, "global_step": 135061, "epoch": 3215} {"train_loss": -6.63587760925293, "global_step": 135062, "epoch": 3215} {"train_loss": -6.49440860748291, "global_step": 135063, "epoch": 3215} {"train_loss": -6.741662502288818, "global_step": 135064, "epoch": 3215} {"train_loss": -6.467989444732666, "global_step": 135065, "epoch": 3215} {"train_loss": -6.679619789123535, "global_step": 135066, "epoch": 3215} {"train_loss": -6.737004280090332, "global_step": 135067, "epoch": 3215} {"train_loss": -6.615818977355957, "global_step": 135068, "epoch": 3215} {"train_loss": -6.777057647705078, "global_step": 135069, "epoch": 3215} {"train_loss": -6.705296993255615, "global_step": 135070, "epoch": 3215} {"train_loss": -6.674641416186378, "global_step": 135071, "epoch": 3215, "val_loss": 67020.5} {"train_loss": -6.6197099685668945, "global_step": 135072, "epoch": 3216} {"train_loss": -6.754834175109863, "global_step": 135073, "epoch": 3216} {"train_loss": -6.671060562133789, "global_step": 135074, "epoch": 3216} {"train_loss": -6.729874610900879, "global_step": 135075, "epoch": 3216} {"train_loss": -6.6936936378479, "global_step": 135076, "epoch": 3216} {"train_loss": -6.696898937225342, "global_step": 135077, "epoch": 3216} {"train_loss": -6.796765327453613, "global_step": 135078, "epoch": 3216} {"train_loss": -6.652564525604248, "global_step": 135079, "epoch": 3216} {"train_loss": -6.699540615081787, "global_step": 135080, "epoch": 3216} {"train_loss": -6.524031639099121, "global_step": 135081, "epoch": 3216} {"train_loss": -6.574598789215088, "global_step": 135082, "epoch": 3216} {"train_loss": -6.6382527351379395, "global_step": 135083, "epoch": 3216} {"train_loss": -6.538517475128174, "global_step": 135084, "epoch": 3216} {"train_loss": -6.705927848815918, "global_step": 135085, "epoch": 3216} {"train_loss": -6.463106155395508, "global_step": 135086, "epoch": 3216} {"train_loss": -6.651730537414551, "global_step": 135087, "epoch": 3216} {"train_loss": -6.631950378417969, "global_step": 135088, "epoch": 3216} {"train_loss": -6.599582672119141, "global_step": 135089, "epoch": 3216} {"train_loss": -6.700059413909912, "global_step": 135090, "epoch": 3216} {"train_loss": -6.571634292602539, "global_step": 135091, "epoch": 3216} {"train_loss": -6.7581281661987305, "global_step": 135092, "epoch": 3216} {"train_loss": -6.642518043518066, "global_step": 135093, "epoch": 3216} {"train_loss": -6.773555278778076, "global_step": 135094, "epoch": 3216} {"train_loss": -6.650218486785889, "global_step": 135095, "epoch": 3216} {"train_loss": -6.640596389770508, "global_step": 135096, "epoch": 3216} {"train_loss": -6.646997451782227, "global_step": 135097, "epoch": 3216} {"train_loss": -6.72517728805542, "global_step": 135098, "epoch": 3216} {"train_loss": -6.66651725769043, "global_step": 135099, "epoch": 3216} {"train_loss": -6.640248775482178, "global_step": 135100, "epoch": 3216} {"train_loss": -6.695765495300293, "global_step": 135101, "epoch": 3216} {"train_loss": -6.615081310272217, "global_step": 135102, "epoch": 3216} {"train_loss": -6.700508117675781, "global_step": 135103, "epoch": 3216} {"train_loss": -6.640896797180176, "global_step": 135104, "epoch": 3216} {"train_loss": -6.4679155349731445, "global_step": 135105, "epoch": 3216} {"train_loss": -6.790600299835205, "global_step": 135106, "epoch": 3216} {"train_loss": -6.753416538238525, "global_step": 135107, "epoch": 3216} {"train_loss": -6.832210540771484, "global_step": 135108, "epoch": 3216} {"train_loss": -6.672882080078125, "global_step": 135109, "epoch": 3216} {"train_loss": -6.694901466369629, "global_step": 135110, "epoch": 3216} {"train_loss": -6.654702186584473, "global_step": 135111, "epoch": 3216} {"train_loss": -6.7404375076293945, "global_step": 135112, "epoch": 3216} {"train_loss": -6.66867843128386, "global_step": 135113, "epoch": 3216, "val_loss": 67115.25} {"train_loss": -6.719363212585449, "global_step": 135114, "epoch": 3217} {"train_loss": -6.74794864654541, "global_step": 135115, "epoch": 3217} {"train_loss": -6.733860969543457, "global_step": 135116, "epoch": 3217} {"train_loss": -6.644725799560547, "global_step": 135117, "epoch": 3217} {"train_loss": -6.815781593322754, "global_step": 135118, "epoch": 3217} {"train_loss": -6.756213188171387, "global_step": 135119, "epoch": 3217} {"train_loss": -6.799527645111084, "global_step": 135120, "epoch": 3217} {"train_loss": -6.76334285736084, "global_step": 135121, "epoch": 3217} {"train_loss": -6.737181663513184, "global_step": 135122, "epoch": 3217} {"train_loss": -6.7472944259643555, "global_step": 135123, "epoch": 3217} {"train_loss": -6.735772132873535, "global_step": 135124, "epoch": 3217} {"train_loss": -6.84868049621582, "global_step": 135125, "epoch": 3217} {"train_loss": -6.815483570098877, "global_step": 135126, "epoch": 3217} {"train_loss": -6.784235954284668, "global_step": 135127, "epoch": 3217} {"train_loss": -6.712331771850586, "global_step": 135128, "epoch": 3217} {"train_loss": -6.792094707489014, "global_step": 135129, "epoch": 3217} {"train_loss": -6.769810676574707, "global_step": 135130, "epoch": 3217} {"train_loss": -6.620765209197998, "global_step": 135131, "epoch": 3217} {"train_loss": -6.675075531005859, "global_step": 135132, "epoch": 3217} {"train_loss": -6.666871070861816, "global_step": 135133, "epoch": 3217} {"train_loss": -6.723925590515137, "global_step": 135134, "epoch": 3217} {"train_loss": -6.670444488525391, "global_step": 135135, "epoch": 3217} {"train_loss": -6.681654930114746, "global_step": 135136, "epoch": 3217} {"train_loss": -6.7792816162109375, "global_step": 135137, "epoch": 3217} {"train_loss": -6.758391380310059, "global_step": 135138, "epoch": 3217} {"train_loss": -6.6752610206604, "global_step": 135139, "epoch": 3217} {"train_loss": -6.805431842803955, "global_step": 135140, "epoch": 3217} {"train_loss": -6.715396404266357, "global_step": 135141, "epoch": 3217} {"train_loss": -6.811583518981934, "global_step": 135142, "epoch": 3217} {"train_loss": -6.800875663757324, "global_step": 135143, "epoch": 3217} {"train_loss": -6.704228401184082, "global_step": 135144, "epoch": 3217} {"train_loss": -6.8474626541137695, "global_step": 135145, "epoch": 3217} {"train_loss": -6.834188461303711, "global_step": 135146, "epoch": 3217} {"train_loss": -6.70741605758667, "global_step": 135147, "epoch": 3217} {"train_loss": -6.810070514678955, "global_step": 135148, "epoch": 3217} {"train_loss": -6.630508899688721, "global_step": 135149, "epoch": 3217} {"train_loss": -6.6336669921875, "global_step": 135150, "epoch": 3217} {"train_loss": -6.694248199462891, "global_step": 135151, "epoch": 3217} {"train_loss": -6.575553894042969, "global_step": 135152, "epoch": 3217} {"train_loss": -6.697395324707031, "global_step": 135153, "epoch": 3217} {"train_loss": -6.603640079498291, "global_step": 135154, "epoch": 3217} {"train_loss": -6.728704225449335, "global_step": 135155, "epoch": 3217, "val_loss": 67067.0546875} {"train_loss": -6.724241256713867, "global_step": 135156, "epoch": 3218} {"train_loss": -6.5895562171936035, "global_step": 135157, "epoch": 3218} {"train_loss": -6.597912788391113, "global_step": 135158, "epoch": 3218} {"train_loss": -6.670148849487305, "global_step": 135159, "epoch": 3218} {"train_loss": -6.614832878112793, "global_step": 135160, "epoch": 3218} {"train_loss": -6.67710542678833, "global_step": 135161, "epoch": 3218} {"train_loss": -6.740742206573486, "global_step": 135162, "epoch": 3218} {"train_loss": -6.6722917556762695, "global_step": 135163, "epoch": 3218} {"train_loss": -6.640165328979492, "global_step": 135164, "epoch": 3218} {"train_loss": -6.774245262145996, "global_step": 135165, "epoch": 3218} {"train_loss": -6.724510192871094, "global_step": 135166, "epoch": 3218} {"train_loss": -6.653513431549072, "global_step": 135167, "epoch": 3218} {"train_loss": -6.780632972717285, "global_step": 135168, "epoch": 3218} {"train_loss": -6.73561954498291, "global_step": 135169, "epoch": 3218} {"train_loss": -6.755188941955566, "global_step": 135170, "epoch": 3218} {"train_loss": -6.753195762634277, "global_step": 135171, "epoch": 3218} {"train_loss": -6.787915229797363, "global_step": 135172, "epoch": 3218} {"train_loss": -6.8075432777404785, "global_step": 135173, "epoch": 3218} {"train_loss": -6.697125434875488, "global_step": 135174, "epoch": 3218} {"train_loss": -6.757875919342041, "global_step": 135175, "epoch": 3218} {"train_loss": -6.620678901672363, "global_step": 135176, "epoch": 3218} {"train_loss": -6.700077056884766, "global_step": 135177, "epoch": 3218} {"train_loss": -6.835458755493164, "global_step": 135178, "epoch": 3218} {"train_loss": -6.798336029052734, "global_step": 135179, "epoch": 3218} {"train_loss": -6.854831695556641, "global_step": 135180, "epoch": 3218} {"train_loss": -6.665551662445068, "global_step": 135181, "epoch": 3218} {"train_loss": -6.547432899475098, "global_step": 135182, "epoch": 3218} {"train_loss": -6.7635111808776855, "global_step": 135183, "epoch": 3218} {"train_loss": -6.690283298492432, "global_step": 135184, "epoch": 3218} {"train_loss": -6.731219291687012, "global_step": 135185, "epoch": 3218} {"train_loss": -6.78317928314209, "global_step": 135186, "epoch": 3218} {"train_loss": -6.771429061889648, "global_step": 135187, "epoch": 3218} {"train_loss": -6.656951904296875, "global_step": 135188, "epoch": 3218} {"train_loss": -6.771002769470215, "global_step": 135189, "epoch": 3218} {"train_loss": -6.685894012451172, "global_step": 135190, "epoch": 3218} {"train_loss": -6.681299209594727, "global_step": 135191, "epoch": 3218} {"train_loss": -6.750825881958008, "global_step": 135192, "epoch": 3218} {"train_loss": -6.717959880828857, "global_step": 135193, "epoch": 3218} {"train_loss": -6.76971960067749, "global_step": 135194, "epoch": 3218} {"train_loss": -6.772902488708496, "global_step": 135195, "epoch": 3218} {"train_loss": -6.561568260192871, "global_step": 135196, "epoch": 3218} {"train_loss": -6.7126024677639915, "global_step": 135197, "epoch": 3218, "val_loss": 66932.25} {"train_loss": -6.691436767578125, "global_step": 135198, "epoch": 3219} {"train_loss": -6.741326332092285, "global_step": 135199, "epoch": 3219} {"train_loss": -6.668365478515625, "global_step": 135200, "epoch": 3219} {"train_loss": -6.678895950317383, "global_step": 135201, "epoch": 3219} {"train_loss": -6.671891689300537, "global_step": 135202, "epoch": 3219} {"train_loss": -6.678337574005127, "global_step": 135203, "epoch": 3219} {"train_loss": -6.59391450881958, "global_step": 135204, "epoch": 3219} {"train_loss": -6.738456726074219, "global_step": 135205, "epoch": 3219} {"train_loss": -6.569855213165283, "global_step": 135206, "epoch": 3219} {"train_loss": -6.624678611755371, "global_step": 135207, "epoch": 3219} {"train_loss": -6.650120735168457, "global_step": 135208, "epoch": 3219} {"train_loss": -6.555424690246582, "global_step": 135209, "epoch": 3219} {"train_loss": -6.763593673706055, "global_step": 135210, "epoch": 3219} {"train_loss": -6.637233734130859, "global_step": 135211, "epoch": 3219} {"train_loss": -6.673183441162109, "global_step": 135212, "epoch": 3219} {"train_loss": -6.594305038452148, "global_step": 135213, "epoch": 3219} {"train_loss": -6.6890788078308105, "global_step": 135214, "epoch": 3219} {"train_loss": -6.649474143981934, "global_step": 135215, "epoch": 3219} {"train_loss": -6.5818352699279785, "global_step": 135216, "epoch": 3219} {"train_loss": -6.711215019226074, "global_step": 135217, "epoch": 3219} {"train_loss": -6.612829685211182, "global_step": 135218, "epoch": 3219} {"train_loss": -6.565996170043945, "global_step": 135219, "epoch": 3219} {"train_loss": -6.682157516479492, "global_step": 135220, "epoch": 3219} {"train_loss": -6.538601398468018, "global_step": 135221, "epoch": 3219} {"train_loss": -6.734078407287598, "global_step": 135222, "epoch": 3219} {"train_loss": -6.7711029052734375, "global_step": 135223, "epoch": 3219} {"train_loss": -6.61644172668457, "global_step": 135224, "epoch": 3219} {"train_loss": -6.665225028991699, "global_step": 135225, "epoch": 3219} {"train_loss": -6.758084297180176, "global_step": 135226, "epoch": 3219} {"train_loss": -6.6172685623168945, "global_step": 135227, "epoch": 3219} {"train_loss": -6.699621200561523, "global_step": 135228, "epoch": 3219} {"train_loss": -6.744253158569336, "global_step": 135229, "epoch": 3219} {"train_loss": -6.698474884033203, "global_step": 135230, "epoch": 3219} {"train_loss": -6.680117607116699, "global_step": 135231, "epoch": 3219} {"train_loss": -6.677998065948486, "global_step": 135232, "epoch": 3219} {"train_loss": -6.7456254959106445, "global_step": 135233, "epoch": 3219} {"train_loss": -6.675778865814209, "global_step": 135234, "epoch": 3219} {"train_loss": -6.645227909088135, "global_step": 135235, "epoch": 3219} {"train_loss": -6.759660720825195, "global_step": 135236, "epoch": 3219} {"train_loss": -6.759821891784668, "global_step": 135237, "epoch": 3219} {"train_loss": -6.716195583343506, "global_step": 135238, "epoch": 3219} {"train_loss": -6.672951686949957, "global_step": 135239, "epoch": 3219, "val_loss": 66949.890625} {"train_loss": -6.685945510864258, "global_step": 135240, "epoch": 3220} {"train_loss": -6.748505592346191, "global_step": 135241, "epoch": 3220} {"train_loss": -6.782453536987305, "global_step": 135242, "epoch": 3220} {"train_loss": -6.703835964202881, "global_step": 135243, "epoch": 3220} {"train_loss": -6.669589996337891, "global_step": 135244, "epoch": 3220} {"train_loss": -6.8003387451171875, "global_step": 135245, "epoch": 3220} {"train_loss": -6.707502365112305, "global_step": 135246, "epoch": 3220} {"train_loss": -6.615272521972656, "global_step": 135247, "epoch": 3220} {"train_loss": -6.689148426055908, "global_step": 135248, "epoch": 3220} {"train_loss": -6.732632637023926, "global_step": 135249, "epoch": 3220} {"train_loss": -6.74798059463501, "global_step": 135250, "epoch": 3220} {"train_loss": -6.660938739776611, "global_step": 135251, "epoch": 3220} {"train_loss": -6.711440086364746, "global_step": 135252, "epoch": 3220} {"train_loss": -6.758630752563477, "global_step": 135253, "epoch": 3220} {"train_loss": -6.669454574584961, "global_step": 135254, "epoch": 3220} {"train_loss": -6.857967853546143, "global_step": 135255, "epoch": 3220} {"train_loss": -6.812687397003174, "global_step": 135256, "epoch": 3220} {"train_loss": -6.653276443481445, "global_step": 135257, "epoch": 3220} {"train_loss": -6.7477827072143555, "global_step": 135258, "epoch": 3220} {"train_loss": -6.618896484375, "global_step": 135259, "epoch": 3220} {"train_loss": -6.745264053344727, "global_step": 135260, "epoch": 3220} {"train_loss": -6.819841384887695, "global_step": 135261, "epoch": 3220} {"train_loss": -6.809867858886719, "global_step": 135262, "epoch": 3220} {"train_loss": -6.546600341796875, "global_step": 135263, "epoch": 3220} {"train_loss": -6.665498733520508, "global_step": 135264, "epoch": 3220} {"train_loss": -6.746910572052002, "global_step": 135265, "epoch": 3220} {"train_loss": -6.703068733215332, "global_step": 135266, "epoch": 3220} {"train_loss": -6.657317638397217, "global_step": 135267, "epoch": 3220} {"train_loss": -6.703616142272949, "global_step": 135268, "epoch": 3220} {"train_loss": -6.6831512451171875, "global_step": 135269, "epoch": 3220} {"train_loss": -6.711651802062988, "global_step": 135270, "epoch": 3220} {"train_loss": -6.741642951965332, "global_step": 135271, "epoch": 3220} {"train_loss": -6.608078479766846, "global_step": 135272, "epoch": 3220} {"train_loss": -6.674893856048584, "global_step": 135273, "epoch": 3220} {"train_loss": -6.650689601898193, "global_step": 135274, "epoch": 3220} {"train_loss": -6.751548767089844, "global_step": 135275, "epoch": 3220} {"train_loss": -6.739687919616699, "global_step": 135276, "epoch": 3220} {"train_loss": -6.775822639465332, "global_step": 135277, "epoch": 3220} {"train_loss": -6.691047668457031, "global_step": 135278, "epoch": 3220} {"train_loss": -6.768810272216797, "global_step": 135279, "epoch": 3220} {"train_loss": -6.7046027183532715, "global_step": 135280, "epoch": 3220} {"train_loss": -6.713625646772838, "global_step": 135281, "epoch": 3220, "val_loss": 66874.1640625} {"train_loss": -6.713252067565918, "global_step": 135282, "epoch": 3221} {"train_loss": -6.732041358947754, "global_step": 135283, "epoch": 3221} {"train_loss": -6.863417625427246, "global_step": 135284, "epoch": 3221} {"train_loss": -6.7847161293029785, "global_step": 135285, "epoch": 3221} {"train_loss": -6.845841407775879, "global_step": 135286, "epoch": 3221} {"train_loss": -6.791868209838867, "global_step": 135287, "epoch": 3221} {"train_loss": -6.772919178009033, "global_step": 135288, "epoch": 3221} {"train_loss": -6.844078540802002, "global_step": 135289, "epoch": 3221} {"train_loss": -6.827611923217773, "global_step": 135290, "epoch": 3221} {"train_loss": -6.779703140258789, "global_step": 135291, "epoch": 3221} {"train_loss": -6.820957183837891, "global_step": 135292, "epoch": 3221} {"train_loss": -6.758443832397461, "global_step": 135293, "epoch": 3221} {"train_loss": -6.662586212158203, "global_step": 135294, "epoch": 3221} {"train_loss": -6.684760093688965, "global_step": 135295, "epoch": 3221} {"train_loss": -6.777409553527832, "global_step": 135296, "epoch": 3221} {"train_loss": -6.842513084411621, "global_step": 135297, "epoch": 3221} {"train_loss": -6.709278583526611, "global_step": 135298, "epoch": 3221} {"train_loss": -6.7851996421813965, "global_step": 135299, "epoch": 3221} {"train_loss": -6.892784118652344, "global_step": 135300, "epoch": 3221} {"train_loss": -6.794307708740234, "global_step": 135301, "epoch": 3221} {"train_loss": -6.749456405639648, "global_step": 135302, "epoch": 3221} {"train_loss": -6.771790504455566, "global_step": 135303, "epoch": 3221} {"train_loss": -6.749876022338867, "global_step": 135304, "epoch": 3221} {"train_loss": -6.798962116241455, "global_step": 135305, "epoch": 3221} {"train_loss": -6.705682754516602, "global_step": 135306, "epoch": 3221} {"train_loss": -6.893320083618164, "global_step": 135307, "epoch": 3221} {"train_loss": -6.800340175628662, "global_step": 135308, "epoch": 3221} {"train_loss": -6.7045793533325195, "global_step": 135309, "epoch": 3221} {"train_loss": -6.864118576049805, "global_step": 135310, "epoch": 3221} {"train_loss": -6.627309799194336, "global_step": 135311, "epoch": 3221} {"train_loss": -6.680042743682861, "global_step": 135312, "epoch": 3221} {"train_loss": -6.742081642150879, "global_step": 135313, "epoch": 3221} {"train_loss": -6.754739761352539, "global_step": 135314, "epoch": 3221} {"train_loss": -6.8240814208984375, "global_step": 135315, "epoch": 3221} {"train_loss": -6.667176723480225, "global_step": 135316, "epoch": 3221} {"train_loss": -6.716553688049316, "global_step": 135317, "epoch": 3221} {"train_loss": -6.8576555252075195, "global_step": 135318, "epoch": 3221} {"train_loss": -6.586742877960205, "global_step": 135319, "epoch": 3221} {"train_loss": -6.772592544555664, "global_step": 135320, "epoch": 3221} {"train_loss": -6.6761579513549805, "global_step": 135321, "epoch": 3221} {"train_loss": -6.649355411529541, "global_step": 135322, "epoch": 3221} {"train_loss": -6.7622701327006025, "global_step": 135323, "epoch": 3221, "val_loss": 66963.375} {"train_loss": -6.66873836517334, "global_step": 135324, "epoch": 3222} {"train_loss": -6.774569511413574, "global_step": 135325, "epoch": 3222} {"train_loss": -6.682777404785156, "global_step": 135326, "epoch": 3222} {"train_loss": -6.732918739318848, "global_step": 135327, "epoch": 3222} {"train_loss": -6.637531757354736, "global_step": 135328, "epoch": 3222} {"train_loss": -6.793627738952637, "global_step": 135329, "epoch": 3222} {"train_loss": -6.7352294921875, "global_step": 135330, "epoch": 3222} {"train_loss": -6.797242164611816, "global_step": 135331, "epoch": 3222} {"train_loss": -6.724003791809082, "global_step": 135332, "epoch": 3222} {"train_loss": -6.8870720863342285, "global_step": 135333, "epoch": 3222} {"train_loss": -6.796553134918213, "global_step": 135334, "epoch": 3222} {"train_loss": -6.755513668060303, "global_step": 135335, "epoch": 3222} {"train_loss": -6.818011283874512, "global_step": 135336, "epoch": 3222} {"train_loss": -6.752660274505615, "global_step": 135337, "epoch": 3222} {"train_loss": -6.715941905975342, "global_step": 135338, "epoch": 3222} {"train_loss": -6.776594161987305, "global_step": 135339, "epoch": 3222} {"train_loss": -6.720268249511719, "global_step": 135340, "epoch": 3222} {"train_loss": -6.740809440612793, "global_step": 135341, "epoch": 3222} {"train_loss": -6.695761203765869, "global_step": 135342, "epoch": 3222} {"train_loss": -6.788172245025635, "global_step": 135343, "epoch": 3222} {"train_loss": -6.793585300445557, "global_step": 135344, "epoch": 3222} {"train_loss": -6.721315383911133, "global_step": 135345, "epoch": 3222} {"train_loss": -6.74913215637207, "global_step": 135346, "epoch": 3222} {"train_loss": -6.827771186828613, "global_step": 135347, "epoch": 3222} {"train_loss": -6.527467727661133, "global_step": 135348, "epoch": 3222} {"train_loss": -6.715134620666504, "global_step": 135349, "epoch": 3222} {"train_loss": -6.817414283752441, "global_step": 135350, "epoch": 3222} {"train_loss": -6.752896308898926, "global_step": 135351, "epoch": 3222} {"train_loss": -6.6308794021606445, "global_step": 135352, "epoch": 3222} {"train_loss": -6.7388129234313965, "global_step": 135353, "epoch": 3222} {"train_loss": -6.7019572257995605, "global_step": 135354, "epoch": 3222} {"train_loss": -6.766757965087891, "global_step": 135355, "epoch": 3222} {"train_loss": -6.68889045715332, "global_step": 135356, "epoch": 3222} {"train_loss": -6.639097690582275, "global_step": 135357, "epoch": 3222} {"train_loss": -6.6694231033325195, "global_step": 135358, "epoch": 3222} {"train_loss": -6.674383163452148, "global_step": 135359, "epoch": 3222} {"train_loss": -6.854500770568848, "global_step": 135360, "epoch": 3222} {"train_loss": -6.639251232147217, "global_step": 135361, "epoch": 3222} {"train_loss": -6.737297534942627, "global_step": 135362, "epoch": 3222} {"train_loss": -6.726114273071289, "global_step": 135363, "epoch": 3222} {"train_loss": -6.662317276000977, "global_step": 135364, "epoch": 3222} {"train_loss": -6.730593056905837, "global_step": 135365, "epoch": 3222, "val_loss": 67077.0859375} {"train_loss": -6.713891983032227, "global_step": 135366, "epoch": 3223} {"train_loss": -6.698659896850586, "global_step": 135367, "epoch": 3223} {"train_loss": -6.713379383087158, "global_step": 135368, "epoch": 3223} {"train_loss": -6.737494468688965, "global_step": 135369, "epoch": 3223} {"train_loss": -6.645617485046387, "global_step": 135370, "epoch": 3223} {"train_loss": -6.698584079742432, "global_step": 135371, "epoch": 3223} {"train_loss": -6.687778949737549, "global_step": 135372, "epoch": 3223} {"train_loss": -6.660028457641602, "global_step": 135373, "epoch": 3223} {"train_loss": -6.804902076721191, "global_step": 135374, "epoch": 3223} {"train_loss": -6.670474529266357, "global_step": 135375, "epoch": 3223} {"train_loss": -6.7332987785339355, "global_step": 135376, "epoch": 3223} {"train_loss": -6.807641506195068, "global_step": 135377, "epoch": 3223} {"train_loss": -6.796060562133789, "global_step": 135378, "epoch": 3223} {"train_loss": -6.583008766174316, "global_step": 135379, "epoch": 3223} {"train_loss": -6.656929016113281, "global_step": 135380, "epoch": 3223} {"train_loss": -6.5747575759887695, "global_step": 135381, "epoch": 3223} {"train_loss": -6.734222412109375, "global_step": 135382, "epoch": 3223} {"train_loss": -6.839073181152344, "global_step": 135383, "epoch": 3223} {"train_loss": -6.761869430541992, "global_step": 135384, "epoch": 3223} {"train_loss": -6.730121612548828, "global_step": 135385, "epoch": 3223} {"train_loss": -6.768610954284668, "global_step": 135386, "epoch": 3223} {"train_loss": -6.839016437530518, "global_step": 135387, "epoch": 3223} {"train_loss": -6.785778045654297, "global_step": 135388, "epoch": 3223} {"train_loss": -6.635331630706787, "global_step": 135389, "epoch": 3223} {"train_loss": -6.696529388427734, "global_step": 135390, "epoch": 3223} {"train_loss": -6.623711109161377, "global_step": 135391, "epoch": 3223} {"train_loss": -6.611420631408691, "global_step": 135392, "epoch": 3223} {"train_loss": -6.6758246421813965, "global_step": 135393, "epoch": 3223} {"train_loss": -6.666879177093506, "global_step": 135394, "epoch": 3223} {"train_loss": -6.75465202331543, "global_step": 135395, "epoch": 3223} {"train_loss": -6.6197052001953125, "global_step": 135396, "epoch": 3223} {"train_loss": -6.748373985290527, "global_step": 135397, "epoch": 3223} {"train_loss": -6.662776947021484, "global_step": 135398, "epoch": 3223} {"train_loss": -6.785123825073242, "global_step": 135399, "epoch": 3223} {"train_loss": -6.763952255249023, "global_step": 135400, "epoch": 3223} {"train_loss": -6.707795143127441, "global_step": 135401, "epoch": 3223} {"train_loss": -6.746408462524414, "global_step": 135402, "epoch": 3223} {"train_loss": -6.722538948059082, "global_step": 135403, "epoch": 3223} {"train_loss": -6.680302143096924, "global_step": 135404, "epoch": 3223} {"train_loss": -6.651572227478027, "global_step": 135405, "epoch": 3223} {"train_loss": -6.708813190460205, "global_step": 135406, "epoch": 3223} {"train_loss": -6.7098100412459605, "global_step": 135407, "epoch": 3223, "val_loss": 66984.0546875} {"train_loss": -6.64777946472168, "global_step": 135408, "epoch": 3224} {"train_loss": -6.794113636016846, "global_step": 135409, "epoch": 3224} {"train_loss": -6.806614875793457, "global_step": 135410, "epoch": 3224} {"train_loss": -6.609433174133301, "global_step": 135411, "epoch": 3224} {"train_loss": -6.663233757019043, "global_step": 135412, "epoch": 3224} {"train_loss": -6.855251312255859, "global_step": 135413, "epoch": 3224} {"train_loss": -6.695296287536621, "global_step": 135414, "epoch": 3224} {"train_loss": -6.819889068603516, "global_step": 135415, "epoch": 3224} {"train_loss": -6.776656150817871, "global_step": 135416, "epoch": 3224} {"train_loss": -6.642126560211182, "global_step": 135417, "epoch": 3224} {"train_loss": -6.633342266082764, "global_step": 135418, "epoch": 3224} {"train_loss": -6.741372108459473, "global_step": 135419, "epoch": 3224} {"train_loss": -6.722783088684082, "global_step": 135420, "epoch": 3224} {"train_loss": -6.745571136474609, "global_step": 135421, "epoch": 3224} {"train_loss": -6.675752639770508, "global_step": 135422, "epoch": 3224} {"train_loss": -6.8186235427856445, "global_step": 135423, "epoch": 3224} {"train_loss": -6.596790313720703, "global_step": 135424, "epoch": 3224} {"train_loss": -6.721468448638916, "global_step": 135425, "epoch": 3224} {"train_loss": -6.738434791564941, "global_step": 135426, "epoch": 3224} {"train_loss": -6.736240386962891, "global_step": 135427, "epoch": 3224} {"train_loss": -6.667646884918213, "global_step": 135428, "epoch": 3224} {"train_loss": -6.655695915222168, "global_step": 135429, "epoch": 3224} {"train_loss": -6.770138263702393, "global_step": 135430, "epoch": 3224} {"train_loss": -6.705992698669434, "global_step": 135431, "epoch": 3224} {"train_loss": -6.691579818725586, "global_step": 135432, "epoch": 3224} {"train_loss": -6.578560829162598, "global_step": 135433, "epoch": 3224} {"train_loss": -6.647692680358887, "global_step": 135434, "epoch": 3224} {"train_loss": -6.551912307739258, "global_step": 135435, "epoch": 3224} {"train_loss": -6.719722747802734, "global_step": 135436, "epoch": 3224} {"train_loss": -6.677254676818848, "global_step": 135437, "epoch": 3224} {"train_loss": -6.705630302429199, "global_step": 135438, "epoch": 3224} {"train_loss": -6.711138725280762, "global_step": 135439, "epoch": 3224} {"train_loss": -6.504878044128418, "global_step": 135440, "epoch": 3224} {"train_loss": -6.558995246887207, "global_step": 135441, "epoch": 3224} {"train_loss": -6.609850883483887, "global_step": 135442, "epoch": 3224} {"train_loss": -6.7509965896606445, "global_step": 135443, "epoch": 3224} {"train_loss": -6.500505447387695, "global_step": 135444, "epoch": 3224} {"train_loss": -6.745876312255859, "global_step": 135445, "epoch": 3224} {"train_loss": -6.662797927856445, "global_step": 135446, "epoch": 3224} {"train_loss": -6.762192249298096, "global_step": 135447, "epoch": 3224} {"train_loss": -6.715909004211426, "global_step": 135448, "epoch": 3224} {"train_loss": -6.688291663215274, "global_step": 135449, "epoch": 3224, "val_loss": 67023.8984375} {"train_loss": -6.665821075439453, "global_step": 135450, "epoch": 3225} {"train_loss": -6.65131950378418, "global_step": 135451, "epoch": 3225} {"train_loss": -6.555135726928711, "global_step": 135452, "epoch": 3225} {"train_loss": -6.727868556976318, "global_step": 135453, "epoch": 3225} {"train_loss": -6.800505638122559, "global_step": 135454, "epoch": 3225} {"train_loss": -6.756498336791992, "global_step": 135455, "epoch": 3225} {"train_loss": -6.656922817230225, "global_step": 135456, "epoch": 3225} {"train_loss": -6.634953498840332, "global_step": 135457, "epoch": 3225} {"train_loss": -6.689578056335449, "global_step": 135458, "epoch": 3225} {"train_loss": -6.6721510887146, "global_step": 135459, "epoch": 3225} {"train_loss": -6.697239398956299, "global_step": 135460, "epoch": 3225} {"train_loss": -6.722463607788086, "global_step": 135461, "epoch": 3225} {"train_loss": -6.711585998535156, "global_step": 135462, "epoch": 3225} {"train_loss": -6.796286106109619, "global_step": 135463, "epoch": 3225} {"train_loss": -6.739388465881348, "global_step": 135464, "epoch": 3225} {"train_loss": -6.714573383331299, "global_step": 135465, "epoch": 3225} {"train_loss": -6.808101654052734, "global_step": 135466, "epoch": 3225} {"train_loss": -6.720624923706055, "global_step": 135467, "epoch": 3225} {"train_loss": -6.798844337463379, "global_step": 135468, "epoch": 3225} {"train_loss": -6.705408096313477, "global_step": 135469, "epoch": 3225} {"train_loss": -6.771604061126709, "global_step": 135470, "epoch": 3225} {"train_loss": -6.708559036254883, "global_step": 135471, "epoch": 3225} {"train_loss": -6.694772243499756, "global_step": 135472, "epoch": 3225} {"train_loss": -6.714913845062256, "global_step": 135473, "epoch": 3225} {"train_loss": -6.797669410705566, "global_step": 135474, "epoch": 3225} {"train_loss": -6.774675369262695, "global_step": 135475, "epoch": 3225} {"train_loss": -6.630401611328125, "global_step": 135476, "epoch": 3225} {"train_loss": -6.681207656860352, "global_step": 135477, "epoch": 3225} {"train_loss": -6.725032329559326, "global_step": 135478, "epoch": 3225} {"train_loss": -6.790768146514893, "global_step": 135479, "epoch": 3225} {"train_loss": -6.647544860839844, "global_step": 135480, "epoch": 3225} {"train_loss": -6.691937446594238, "global_step": 135481, "epoch": 3225} {"train_loss": -6.728782653808594, "global_step": 135482, "epoch": 3225} {"train_loss": -6.744240760803223, "global_step": 135483, "epoch": 3225} {"train_loss": -6.8137712478637695, "global_step": 135484, "epoch": 3225} {"train_loss": -6.71033239364624, "global_step": 135485, "epoch": 3225} {"train_loss": -6.740822792053223, "global_step": 135486, "epoch": 3225} {"train_loss": -6.8162431716918945, "global_step": 135487, "epoch": 3225} {"train_loss": -6.684900283813477, "global_step": 135488, "epoch": 3225} {"train_loss": -6.782668113708496, "global_step": 135489, "epoch": 3225} {"train_loss": -6.754108428955078, "global_step": 135490, "epoch": 3225} {"train_loss": -6.723985547111148, "global_step": 135491, "epoch": 3225, "val_loss": 66893.6875} {"train_loss": -6.788649559020996, "global_step": 135492, "epoch": 3226} {"train_loss": -6.782721042633057, "global_step": 135493, "epoch": 3226} {"train_loss": -6.743755340576172, "global_step": 135494, "epoch": 3226} {"train_loss": -6.771568298339844, "global_step": 135495, "epoch": 3226} {"train_loss": -6.74542236328125, "global_step": 135496, "epoch": 3226} {"train_loss": -6.654373645782471, "global_step": 135497, "epoch": 3226} {"train_loss": -6.7950439453125, "global_step": 135498, "epoch": 3226} {"train_loss": -6.773847579956055, "global_step": 135499, "epoch": 3226} {"train_loss": -6.629183769226074, "global_step": 135500, "epoch": 3226} {"train_loss": -6.740948677062988, "global_step": 135501, "epoch": 3226} {"train_loss": -6.740854263305664, "global_step": 135502, "epoch": 3226} {"train_loss": -6.794342041015625, "global_step": 135503, "epoch": 3226} {"train_loss": -6.7849016189575195, "global_step": 135504, "epoch": 3226} {"train_loss": -6.848241806030273, "global_step": 135505, "epoch": 3226} {"train_loss": -6.743869781494141, "global_step": 135506, "epoch": 3226} {"train_loss": -6.739676475524902, "global_step": 135507, "epoch": 3226} {"train_loss": -6.600184917449951, "global_step": 135508, "epoch": 3226} {"train_loss": -6.739317893981934, "global_step": 135509, "epoch": 3226} {"train_loss": -6.784470081329346, "global_step": 135510, "epoch": 3226} {"train_loss": -6.8231096267700195, "global_step": 135511, "epoch": 3226} {"train_loss": -6.718569278717041, "global_step": 135512, "epoch": 3226} {"train_loss": -6.6809983253479, "global_step": 135513, "epoch": 3226} {"train_loss": -6.77238655090332, "global_step": 135514, "epoch": 3226} {"train_loss": -6.688846588134766, "global_step": 135515, "epoch": 3226} {"train_loss": -6.716370105743408, "global_step": 135516, "epoch": 3226} {"train_loss": -6.751317977905273, "global_step": 135517, "epoch": 3226} {"train_loss": -6.711587905883789, "global_step": 135518, "epoch": 3226} {"train_loss": -6.755007266998291, "global_step": 135519, "epoch": 3226} {"train_loss": -6.647734642028809, "global_step": 135520, "epoch": 3226} {"train_loss": -6.788542747497559, "global_step": 135521, "epoch": 3226} {"train_loss": -6.73872184753418, "global_step": 135522, "epoch": 3226} {"train_loss": -6.735830307006836, "global_step": 135523, "epoch": 3226} {"train_loss": -6.582208633422852, "global_step": 135524, "epoch": 3226} {"train_loss": -6.741755485534668, "global_step": 135525, "epoch": 3226} {"train_loss": -6.715002536773682, "global_step": 135526, "epoch": 3226} {"train_loss": -6.767258644104004, "global_step": 135527, "epoch": 3226} {"train_loss": -6.8105669021606445, "global_step": 135528, "epoch": 3226} {"train_loss": -6.641074180603027, "global_step": 135529, "epoch": 3226} {"train_loss": -6.772991180419922, "global_step": 135530, "epoch": 3226} {"train_loss": -6.647302627563477, "global_step": 135531, "epoch": 3226} {"train_loss": -6.794368267059326, "global_step": 135532, "epoch": 3226} {"train_loss": -6.735674710500808, "global_step": 135533, "epoch": 3226, "val_loss": 67083.1015625} {"train_loss": -6.736030578613281, "global_step": 135534, "epoch": 3227} {"train_loss": -6.731783390045166, "global_step": 135535, "epoch": 3227} {"train_loss": -6.65877628326416, "global_step": 135536, "epoch": 3227} {"train_loss": -6.67418098449707, "global_step": 135537, "epoch": 3227} {"train_loss": -6.662225723266602, "global_step": 135538, "epoch": 3227} {"train_loss": -6.720786094665527, "global_step": 135539, "epoch": 3227} {"train_loss": -6.703502178192139, "global_step": 135540, "epoch": 3227} {"train_loss": -6.834132194519043, "global_step": 135541, "epoch": 3227} {"train_loss": -6.731888294219971, "global_step": 135542, "epoch": 3227} {"train_loss": -6.661443710327148, "global_step": 135543, "epoch": 3227} {"train_loss": -6.691159248352051, "global_step": 135544, "epoch": 3227} {"train_loss": -6.849709510803223, "global_step": 135545, "epoch": 3227} {"train_loss": -6.736439228057861, "global_step": 135546, "epoch": 3227} {"train_loss": -6.726690769195557, "global_step": 135547, "epoch": 3227} {"train_loss": -6.719714641571045, "global_step": 135548, "epoch": 3227} {"train_loss": -6.783318519592285, "global_step": 135549, "epoch": 3227} {"train_loss": -6.726550579071045, "global_step": 135550, "epoch": 3227} {"train_loss": -6.699365615844727, "global_step": 135551, "epoch": 3227} {"train_loss": -6.8250579833984375, "global_step": 135552, "epoch": 3227} {"train_loss": -6.638519287109375, "global_step": 135553, "epoch": 3227} {"train_loss": -6.8256754875183105, "global_step": 135554, "epoch": 3227} {"train_loss": -6.780545711517334, "global_step": 135555, "epoch": 3227} {"train_loss": -6.693600654602051, "global_step": 135556, "epoch": 3227} {"train_loss": -6.63858699798584, "global_step": 135557, "epoch": 3227} {"train_loss": -6.757199287414551, "global_step": 135558, "epoch": 3227} {"train_loss": -6.75944185256958, "global_step": 135559, "epoch": 3227} {"train_loss": -6.724883079528809, "global_step": 135560, "epoch": 3227} {"train_loss": -6.731612205505371, "global_step": 135561, "epoch": 3227} {"train_loss": -6.645224571228027, "global_step": 135562, "epoch": 3227} {"train_loss": -6.703697204589844, "global_step": 135563, "epoch": 3227} {"train_loss": -6.6248779296875, "global_step": 135564, "epoch": 3227} {"train_loss": -6.694117069244385, "global_step": 135565, "epoch": 3227} {"train_loss": -6.723280906677246, "global_step": 135566, "epoch": 3227} {"train_loss": -6.658262729644775, "global_step": 135567, "epoch": 3227} {"train_loss": -6.623623847961426, "global_step": 135568, "epoch": 3227} {"train_loss": -6.59104585647583, "global_step": 135569, "epoch": 3227} {"train_loss": -6.664648056030273, "global_step": 135570, "epoch": 3227} {"train_loss": -6.721043109893799, "global_step": 135571, "epoch": 3227} {"train_loss": -6.773711681365967, "global_step": 135572, "epoch": 3227} {"train_loss": -6.67636251449585, "global_step": 135573, "epoch": 3227} {"train_loss": -6.707704544067383, "global_step": 135574, "epoch": 3227} {"train_loss": -6.712206692922683, "global_step": 135575, "epoch": 3227, "val_loss": 67065.421875} {"train_loss": -6.635685443878174, "global_step": 135576, "epoch": 3228} {"train_loss": -6.616971969604492, "global_step": 135577, "epoch": 3228} {"train_loss": -6.691218376159668, "global_step": 135578, "epoch": 3228} {"train_loss": -6.665098190307617, "global_step": 135579, "epoch": 3228} {"train_loss": -6.707955360412598, "global_step": 135580, "epoch": 3228} {"train_loss": -6.690832614898682, "global_step": 135581, "epoch": 3228} {"train_loss": -6.693665504455566, "global_step": 135582, "epoch": 3228} {"train_loss": -6.664088249206543, "global_step": 135583, "epoch": 3228} {"train_loss": -6.676783561706543, "global_step": 135584, "epoch": 3228} {"train_loss": -6.8052520751953125, "global_step": 135585, "epoch": 3228} {"train_loss": -6.79434871673584, "global_step": 135586, "epoch": 3228} {"train_loss": -6.687441349029541, "global_step": 135587, "epoch": 3228} {"train_loss": -6.748897552490234, "global_step": 135588, "epoch": 3228} {"train_loss": -6.7461652755737305, "global_step": 135589, "epoch": 3228} {"train_loss": -6.768497467041016, "global_step": 135590, "epoch": 3228} {"train_loss": -6.798354148864746, "global_step": 135591, "epoch": 3228} {"train_loss": -6.658026695251465, "global_step": 135592, "epoch": 3228} {"train_loss": -6.7692131996154785, "global_step": 135593, "epoch": 3228} {"train_loss": -6.710174083709717, "global_step": 135594, "epoch": 3228} {"train_loss": -6.769412517547607, "global_step": 135595, "epoch": 3228} {"train_loss": -6.768759250640869, "global_step": 135596, "epoch": 3228} {"train_loss": -6.750088691711426, "global_step": 135597, "epoch": 3228} {"train_loss": -6.583126544952393, "global_step": 135598, "epoch": 3228} {"train_loss": -6.662783145904541, "global_step": 135599, "epoch": 3228} {"train_loss": -6.749839782714844, "global_step": 135600, "epoch": 3228} {"train_loss": -6.684737682342529, "global_step": 135601, "epoch": 3228} {"train_loss": -6.704176902770996, "global_step": 135602, "epoch": 3228} {"train_loss": -6.561339378356934, "global_step": 135603, "epoch": 3228} {"train_loss": -6.799186706542969, "global_step": 135604, "epoch": 3228} {"train_loss": -6.626538276672363, "global_step": 135605, "epoch": 3228} {"train_loss": -6.6602888107299805, "global_step": 135606, "epoch": 3228} {"train_loss": -6.787137031555176, "global_step": 135607, "epoch": 3228} {"train_loss": -6.743216037750244, "global_step": 135608, "epoch": 3228} {"train_loss": -6.843897819519043, "global_step": 135609, "epoch": 3228} {"train_loss": -6.74378776550293, "global_step": 135610, "epoch": 3228} {"train_loss": -6.819666385650635, "global_step": 135611, "epoch": 3228} {"train_loss": -6.701328277587891, "global_step": 135612, "epoch": 3228} {"train_loss": -6.73387336730957, "global_step": 135613, "epoch": 3228} {"train_loss": -6.695663928985596, "global_step": 135614, "epoch": 3228} {"train_loss": -6.65908145904541, "global_step": 135615, "epoch": 3228} {"train_loss": -6.697048187255859, "global_step": 135616, "epoch": 3228} {"train_loss": -6.71510436421349, "global_step": 135617, "epoch": 3228, "val_loss": 66942.359375} {"train_loss": -6.761148452758789, "global_step": 135618, "epoch": 3229} {"train_loss": -6.807221412658691, "global_step": 135619, "epoch": 3229} {"train_loss": -6.8055620193481445, "global_step": 135620, "epoch": 3229} {"train_loss": -6.573557376861572, "global_step": 135621, "epoch": 3229} {"train_loss": -6.859302997589111, "global_step": 135622, "epoch": 3229} {"train_loss": -6.745702743530273, "global_step": 135623, "epoch": 3229} {"train_loss": -6.747926235198975, "global_step": 135624, "epoch": 3229} {"train_loss": -6.7270188331604, "global_step": 135625, "epoch": 3229} {"train_loss": -6.688327789306641, "global_step": 135626, "epoch": 3229} {"train_loss": -6.662997245788574, "global_step": 135627, "epoch": 3229} {"train_loss": -6.808855056762695, "global_step": 135628, "epoch": 3229} {"train_loss": -6.686352729797363, "global_step": 135629, "epoch": 3229} {"train_loss": -6.824350833892822, "global_step": 135630, "epoch": 3229} {"train_loss": -6.669368743896484, "global_step": 135631, "epoch": 3229} {"train_loss": -6.834981918334961, "global_step": 135632, "epoch": 3229} {"train_loss": -6.7575273513793945, "global_step": 135633, "epoch": 3229} {"train_loss": -6.75068473815918, "global_step": 135634, "epoch": 3229} {"train_loss": -6.666419506072998, "global_step": 135635, "epoch": 3229} {"train_loss": -6.728638648986816, "global_step": 135636, "epoch": 3229} {"train_loss": -6.754645347595215, "global_step": 135637, "epoch": 3229} {"train_loss": -6.671099662780762, "global_step": 135638, "epoch": 3229} {"train_loss": -6.690330982208252, "global_step": 135639, "epoch": 3229} {"train_loss": -6.738649368286133, "global_step": 135640, "epoch": 3229} {"train_loss": -6.648092269897461, "global_step": 135641, "epoch": 3229} {"train_loss": -6.660812854766846, "global_step": 135642, "epoch": 3229} {"train_loss": -6.612733364105225, "global_step": 135643, "epoch": 3229} {"train_loss": -6.769597053527832, "global_step": 135644, "epoch": 3229} {"train_loss": -6.668034553527832, "global_step": 135645, "epoch": 3229} {"train_loss": -6.753425121307373, "global_step": 135646, "epoch": 3229} {"train_loss": -6.721389293670654, "global_step": 135647, "epoch": 3229} {"train_loss": -6.695878028869629, "global_step": 135648, "epoch": 3229} {"train_loss": -6.6500420570373535, "global_step": 135649, "epoch": 3229} {"train_loss": -6.636107444763184, "global_step": 135650, "epoch": 3229} {"train_loss": -6.7322773933410645, "global_step": 135651, "epoch": 3229} {"train_loss": -6.747812271118164, "global_step": 135652, "epoch": 3229} {"train_loss": -6.6133551597595215, "global_step": 135653, "epoch": 3229} {"train_loss": -6.855345726013184, "global_step": 135654, "epoch": 3229} {"train_loss": -6.755206108093262, "global_step": 135655, "epoch": 3229} {"train_loss": -6.607627868652344, "global_step": 135656, "epoch": 3229} {"train_loss": -6.655888557434082, "global_step": 135657, "epoch": 3229} {"train_loss": -6.718379974365234, "global_step": 135658, "epoch": 3229} {"train_loss": -6.715968835921514, "global_step": 135659, "epoch": 3229, "val_loss": 67265.109375} {"train_loss": -6.71599006652832, "global_step": 135660, "epoch": 3230} {"train_loss": -6.673594951629639, "global_step": 135661, "epoch": 3230} {"train_loss": -6.536540985107422, "global_step": 135662, "epoch": 3230} {"train_loss": -6.596080780029297, "global_step": 135663, "epoch": 3230} {"train_loss": -6.769186973571777, "global_step": 135664, "epoch": 3230} {"train_loss": -6.67772102355957, "global_step": 135665, "epoch": 3230} {"train_loss": -6.641739845275879, "global_step": 135666, "epoch": 3230} {"train_loss": -6.662750244140625, "global_step": 135667, "epoch": 3230} {"train_loss": -6.6405768394470215, "global_step": 135668, "epoch": 3230} {"train_loss": -6.668968200683594, "global_step": 135669, "epoch": 3230} {"train_loss": -6.701169967651367, "global_step": 135670, "epoch": 3230} {"train_loss": -6.699392318725586, "global_step": 135671, "epoch": 3230} {"train_loss": -6.76619815826416, "global_step": 135672, "epoch": 3230} {"train_loss": -6.561179161071777, "global_step": 135673, "epoch": 3230} {"train_loss": -6.691786766052246, "global_step": 135674, "epoch": 3230} {"train_loss": -6.639312744140625, "global_step": 135675, "epoch": 3230} {"train_loss": -6.6161065101623535, "global_step": 135676, "epoch": 3230} {"train_loss": -6.721318244934082, "global_step": 135677, "epoch": 3230} {"train_loss": -6.684417247772217, "global_step": 135678, "epoch": 3230} {"train_loss": -6.639432907104492, "global_step": 135679, "epoch": 3230} {"train_loss": -6.718181133270264, "global_step": 135680, "epoch": 3230} {"train_loss": -6.772823333740234, "global_step": 135681, "epoch": 3230} {"train_loss": -6.67434024810791, "global_step": 135682, "epoch": 3230} {"train_loss": -6.746006965637207, "global_step": 135683, "epoch": 3230} {"train_loss": -6.705560684204102, "global_step": 135684, "epoch": 3230} {"train_loss": -6.791866302490234, "global_step": 135685, "epoch": 3230} {"train_loss": -6.706581115722656, "global_step": 135686, "epoch": 3230} {"train_loss": -6.6757354736328125, "global_step": 135687, "epoch": 3230} {"train_loss": -6.871669769287109, "global_step": 135688, "epoch": 3230} {"train_loss": -6.767014503479004, "global_step": 135689, "epoch": 3230} {"train_loss": -6.677037239074707, "global_step": 135690, "epoch": 3230} {"train_loss": -6.685903072357178, "global_step": 135691, "epoch": 3230} {"train_loss": -6.6854400634765625, "global_step": 135692, "epoch": 3230} {"train_loss": -6.719588279724121, "global_step": 135693, "epoch": 3230} {"train_loss": -6.7393670082092285, "global_step": 135694, "epoch": 3230} {"train_loss": -6.722814559936523, "global_step": 135695, "epoch": 3230} {"train_loss": -6.757554054260254, "global_step": 135696, "epoch": 3230} {"train_loss": -6.704921722412109, "global_step": 135697, "epoch": 3230} {"train_loss": -6.731755256652832, "global_step": 135698, "epoch": 3230} {"train_loss": -6.723219871520996, "global_step": 135699, "epoch": 3230} {"train_loss": -6.667232036590576, "global_step": 135700, "epoch": 3230} {"train_loss": -6.697140307653518, "global_step": 135701, "epoch": 3230, "val_loss": 66832.3515625} {"train_loss": -6.8507490158081055, "global_step": 135702, "epoch": 3231} {"train_loss": -6.750587463378906, "global_step": 135703, "epoch": 3231} {"train_loss": -6.77980899810791, "global_step": 135704, "epoch": 3231} {"train_loss": -6.750304222106934, "global_step": 135705, "epoch": 3231} {"train_loss": -6.784652233123779, "global_step": 135706, "epoch": 3231} {"train_loss": -6.7657880783081055, "global_step": 135707, "epoch": 3231} {"train_loss": -6.707030296325684, "global_step": 135708, "epoch": 3231} {"train_loss": -6.6991400718688965, "global_step": 135709, "epoch": 3231} {"train_loss": -6.839412689208984, "global_step": 135710, "epoch": 3231} {"train_loss": -6.669284820556641, "global_step": 135711, "epoch": 3231} {"train_loss": -6.689911365509033, "global_step": 135712, "epoch": 3231} {"train_loss": -6.787586212158203, "global_step": 135713, "epoch": 3231} {"train_loss": -6.663594722747803, "global_step": 135714, "epoch": 3231} {"train_loss": -6.830939769744873, "global_step": 135715, "epoch": 3231} {"train_loss": -6.644016742706299, "global_step": 135716, "epoch": 3231} {"train_loss": -6.7259907722473145, "global_step": 135717, "epoch": 3231} {"train_loss": -6.761375427246094, "global_step": 135718, "epoch": 3231} {"train_loss": -6.567625045776367, "global_step": 135719, "epoch": 3231} {"train_loss": -6.718873023986816, "global_step": 135720, "epoch": 3231} {"train_loss": -6.822405815124512, "global_step": 135721, "epoch": 3231} {"train_loss": -6.579793453216553, "global_step": 135722, "epoch": 3231} {"train_loss": -6.61410665512085, "global_step": 135723, "epoch": 3231} {"train_loss": -6.675549030303955, "global_step": 135724, "epoch": 3231} {"train_loss": -6.689170837402344, "global_step": 135725, "epoch": 3231} {"train_loss": -6.733493328094482, "global_step": 135726, "epoch": 3231} {"train_loss": -6.622668743133545, "global_step": 135727, "epoch": 3231} {"train_loss": -6.699583053588867, "global_step": 135728, "epoch": 3231} {"train_loss": -6.623664855957031, "global_step": 135729, "epoch": 3231} {"train_loss": -6.583412170410156, "global_step": 135730, "epoch": 3231} {"train_loss": -6.703861236572266, "global_step": 135731, "epoch": 3231} {"train_loss": -6.616217613220215, "global_step": 135732, "epoch": 3231} {"train_loss": -6.591833114624023, "global_step": 135733, "epoch": 3231} {"train_loss": -6.669610977172852, "global_step": 135734, "epoch": 3231} {"train_loss": -6.665642738342285, "global_step": 135735, "epoch": 3231} {"train_loss": -6.718715190887451, "global_step": 135736, "epoch": 3231} {"train_loss": -6.613239288330078, "global_step": 135737, "epoch": 3231} {"train_loss": -6.699951171875, "global_step": 135738, "epoch": 3231} {"train_loss": -6.737844467163086, "global_step": 135739, "epoch": 3231} {"train_loss": -6.580286502838135, "global_step": 135740, "epoch": 3231} {"train_loss": -6.689380645751953, "global_step": 135741, "epoch": 3231} {"train_loss": -6.683788299560547, "global_step": 135742, "epoch": 3231} {"train_loss": -6.697903939655849, "global_step": 135743, "epoch": 3231, "val_loss": 66928.8515625} {"train_loss": -6.71631383895874, "global_step": 135744, "epoch": 3232} {"train_loss": -6.657042503356934, "global_step": 135745, "epoch": 3232} {"train_loss": -6.692933082580566, "global_step": 135746, "epoch": 3232} {"train_loss": -6.658100128173828, "global_step": 135747, "epoch": 3232} {"train_loss": -6.690572738647461, "global_step": 135748, "epoch": 3232} {"train_loss": -6.8025712966918945, "global_step": 135749, "epoch": 3232} {"train_loss": -6.592860221862793, "global_step": 135750, "epoch": 3232} {"train_loss": -6.824831962585449, "global_step": 135751, "epoch": 3232} {"train_loss": -6.697012901306152, "global_step": 135752, "epoch": 3232} {"train_loss": -6.703556060791016, "global_step": 135753, "epoch": 3232} {"train_loss": -6.782771587371826, "global_step": 135754, "epoch": 3232} {"train_loss": -6.647843360900879, "global_step": 135755, "epoch": 3232} {"train_loss": -6.820433616638184, "global_step": 135756, "epoch": 3232} {"train_loss": -6.668494701385498, "global_step": 135757, "epoch": 3232} {"train_loss": -6.709665298461914, "global_step": 135758, "epoch": 3232} {"train_loss": -6.734361171722412, "global_step": 135759, "epoch": 3232} {"train_loss": -6.6681318283081055, "global_step": 135760, "epoch": 3232} {"train_loss": -6.815967559814453, "global_step": 135761, "epoch": 3232} {"train_loss": -6.7410783767700195, "global_step": 135762, "epoch": 3232} {"train_loss": -6.725959300994873, "global_step": 135763, "epoch": 3232} {"train_loss": -6.729700088500977, "global_step": 135764, "epoch": 3232} {"train_loss": -6.718725681304932, "global_step": 135765, "epoch": 3232} {"train_loss": -6.607605934143066, "global_step": 135766, "epoch": 3232} {"train_loss": -6.663944244384766, "global_step": 135767, "epoch": 3232} {"train_loss": -6.628419876098633, "global_step": 135768, "epoch": 3232} {"train_loss": -6.60590934753418, "global_step": 135769, "epoch": 3232} {"train_loss": -6.719448089599609, "global_step": 135770, "epoch": 3232} {"train_loss": -6.682576656341553, "global_step": 135771, "epoch": 3232} {"train_loss": -6.700144290924072, "global_step": 135772, "epoch": 3232} {"train_loss": -6.770082473754883, "global_step": 135773, "epoch": 3232} {"train_loss": -6.6557817459106445, "global_step": 135774, "epoch": 3232} {"train_loss": -6.757218360900879, "global_step": 135775, "epoch": 3232} {"train_loss": -6.62615966796875, "global_step": 135776, "epoch": 3232} {"train_loss": -6.597105026245117, "global_step": 135777, "epoch": 3232} {"train_loss": -6.658807754516602, "global_step": 135778, "epoch": 3232} {"train_loss": -6.619508743286133, "global_step": 135779, "epoch": 3232} {"train_loss": -6.716423988342285, "global_step": 135780, "epoch": 3232} {"train_loss": -6.7784528732299805, "global_step": 135781, "epoch": 3232} {"train_loss": -6.652986526489258, "global_step": 135782, "epoch": 3232} {"train_loss": -6.709601402282715, "global_step": 135783, "epoch": 3232} {"train_loss": -6.722071170806885, "global_step": 135784, "epoch": 3232} {"train_loss": -6.699094692866008, "global_step": 135785, "epoch": 3232, "val_loss": 66941.21875} {"train_loss": -6.676552772521973, "global_step": 135786, "epoch": 3233} {"train_loss": -6.6742753982543945, "global_step": 135787, "epoch": 3233} {"train_loss": -6.751821041107178, "global_step": 135788, "epoch": 3233} {"train_loss": -6.61783504486084, "global_step": 135789, "epoch": 3233} {"train_loss": -6.751111030578613, "global_step": 135790, "epoch": 3233} {"train_loss": -6.656079292297363, "global_step": 135791, "epoch": 3233} {"train_loss": -6.707756519317627, "global_step": 135792, "epoch": 3233} {"train_loss": -6.72853422164917, "global_step": 135793, "epoch": 3233} {"train_loss": -6.63401460647583, "global_step": 135794, "epoch": 3233} {"train_loss": -6.730088233947754, "global_step": 135795, "epoch": 3233} {"train_loss": -6.753299713134766, "global_step": 135796, "epoch": 3233} {"train_loss": -6.667539119720459, "global_step": 135797, "epoch": 3233} {"train_loss": -6.734188556671143, "global_step": 135798, "epoch": 3233} {"train_loss": -6.744726657867432, "global_step": 135799, "epoch": 3233} {"train_loss": -6.680734634399414, "global_step": 135800, "epoch": 3233} {"train_loss": -6.7649126052856445, "global_step": 135801, "epoch": 3233} {"train_loss": -6.759506702423096, "global_step": 135802, "epoch": 3233} {"train_loss": -6.715235710144043, "global_step": 135803, "epoch": 3233} {"train_loss": -6.656468868255615, "global_step": 135804, "epoch": 3233} {"train_loss": -6.722374439239502, "global_step": 135805, "epoch": 3233} {"train_loss": -6.772991180419922, "global_step": 135806, "epoch": 3233} {"train_loss": -6.715782165527344, "global_step": 135807, "epoch": 3233} {"train_loss": -6.862584114074707, "global_step": 135808, "epoch": 3233} {"train_loss": -6.748456001281738, "global_step": 135809, "epoch": 3233} {"train_loss": -6.730396270751953, "global_step": 135810, "epoch": 3233} {"train_loss": -6.8160786628723145, "global_step": 135811, "epoch": 3233} {"train_loss": -6.8724365234375, "global_step": 135812, "epoch": 3233} {"train_loss": -6.939958095550537, "global_step": 135813, "epoch": 3233} {"train_loss": -6.662931442260742, "global_step": 135814, "epoch": 3233} {"train_loss": -6.659700393676758, "global_step": 135815, "epoch": 3233} {"train_loss": -6.905416488647461, "global_step": 135816, "epoch": 3233} {"train_loss": -6.759772300720215, "global_step": 135817, "epoch": 3233} {"train_loss": -6.805418014526367, "global_step": 135818, "epoch": 3233} {"train_loss": -6.781723976135254, "global_step": 135819, "epoch": 3233} {"train_loss": -6.805070877075195, "global_step": 135820, "epoch": 3233} {"train_loss": -6.662581443786621, "global_step": 135821, "epoch": 3233} {"train_loss": -6.808284282684326, "global_step": 135822, "epoch": 3233} {"train_loss": -6.760486602783203, "global_step": 135823, "epoch": 3233} {"train_loss": -6.613205909729004, "global_step": 135824, "epoch": 3233} {"train_loss": -6.623358726501465, "global_step": 135825, "epoch": 3233} {"train_loss": -6.678561210632324, "global_step": 135826, "epoch": 3233} {"train_loss": -6.736168271019345, "global_step": 135827, "epoch": 3233, "val_loss": 66897.3125} {"train_loss": -6.810401439666748, "global_step": 135828, "epoch": 3234} {"train_loss": -6.792252063751221, "global_step": 135829, "epoch": 3234} {"train_loss": -6.867985248565674, "global_step": 135830, "epoch": 3234} {"train_loss": -6.884462356567383, "global_step": 135831, "epoch": 3234} {"train_loss": -6.652184963226318, "global_step": 135832, "epoch": 3234} {"train_loss": -6.872737884521484, "global_step": 135833, "epoch": 3234} {"train_loss": -6.806756019592285, "global_step": 135834, "epoch": 3234} {"train_loss": -6.819357395172119, "global_step": 135835, "epoch": 3234} {"train_loss": -6.801560401916504, "global_step": 135836, "epoch": 3234} {"train_loss": -6.854613304138184, "global_step": 135837, "epoch": 3234} {"train_loss": -6.637526988983154, "global_step": 135838, "epoch": 3234} {"train_loss": -6.769372463226318, "global_step": 135839, "epoch": 3234} {"train_loss": -6.718670845031738, "global_step": 135840, "epoch": 3234} {"train_loss": -6.809857368469238, "global_step": 135841, "epoch": 3234} {"train_loss": -6.77745246887207, "global_step": 135842, "epoch": 3234} {"train_loss": -6.784749507904053, "global_step": 135843, "epoch": 3234} {"train_loss": -6.764003753662109, "global_step": 135844, "epoch": 3234} {"train_loss": -6.776000499725342, "global_step": 135845, "epoch": 3234} {"train_loss": -6.607067108154297, "global_step": 135846, "epoch": 3234} {"train_loss": -6.740973472595215, "global_step": 135847, "epoch": 3234} {"train_loss": -6.741460800170898, "global_step": 135848, "epoch": 3234} {"train_loss": -6.737363815307617, "global_step": 135849, "epoch": 3234} {"train_loss": -6.722504615783691, "global_step": 135850, "epoch": 3234} {"train_loss": -6.766101837158203, "global_step": 135851, "epoch": 3234} {"train_loss": -6.697025299072266, "global_step": 135852, "epoch": 3234} {"train_loss": -6.64627742767334, "global_step": 135853, "epoch": 3234} {"train_loss": -6.863604545593262, "global_step": 135854, "epoch": 3234} {"train_loss": -6.77666711807251, "global_step": 135855, "epoch": 3234} {"train_loss": -6.651381492614746, "global_step": 135856, "epoch": 3234} {"train_loss": -6.763824462890625, "global_step": 135857, "epoch": 3234} {"train_loss": -6.7403669357299805, "global_step": 135858, "epoch": 3234} {"train_loss": -6.712635517120361, "global_step": 135859, "epoch": 3234} {"train_loss": -6.717120170593262, "global_step": 135860, "epoch": 3234} {"train_loss": -6.794995307922363, "global_step": 135861, "epoch": 3234} {"train_loss": -6.686539649963379, "global_step": 135862, "epoch": 3234} {"train_loss": -6.637823581695557, "global_step": 135863, "epoch": 3234} {"train_loss": -6.730077743530273, "global_step": 135864, "epoch": 3234} {"train_loss": -6.726203918457031, "global_step": 135865, "epoch": 3234} {"train_loss": -6.663555145263672, "global_step": 135866, "epoch": 3234} {"train_loss": -6.731646537780762, "global_step": 135867, "epoch": 3234} {"train_loss": -6.621351718902588, "global_step": 135868, "epoch": 3234} {"train_loss": -6.7473572208767845, "global_step": 135869, "epoch": 3234, "val_loss": 66979.765625} {"train_loss": -6.903704643249512, "global_step": 135870, "epoch": 3235} {"train_loss": -6.658538818359375, "global_step": 135871, "epoch": 3235} {"train_loss": -6.684614181518555, "global_step": 135872, "epoch": 3235} {"train_loss": -6.803889274597168, "global_step": 135873, "epoch": 3235} {"train_loss": -6.805762767791748, "global_step": 135874, "epoch": 3235} {"train_loss": -6.70439338684082, "global_step": 135875, "epoch": 3235} {"train_loss": -6.7913665771484375, "global_step": 135876, "epoch": 3235} {"train_loss": -6.836888313293457, "global_step": 135877, "epoch": 3235} {"train_loss": -6.663535118103027, "global_step": 135878, "epoch": 3235} {"train_loss": -6.774975776672363, "global_step": 135879, "epoch": 3235} {"train_loss": -6.7665815353393555, "global_step": 135880, "epoch": 3235} {"train_loss": -6.695614814758301, "global_step": 135881, "epoch": 3235} {"train_loss": -6.781328201293945, "global_step": 135882, "epoch": 3235} {"train_loss": -6.769111156463623, "global_step": 135883, "epoch": 3235} {"train_loss": -6.742530345916748, "global_step": 135884, "epoch": 3235} {"train_loss": -6.771873474121094, "global_step": 135885, "epoch": 3235} {"train_loss": -6.701382637023926, "global_step": 135886, "epoch": 3235} {"train_loss": -6.709448337554932, "global_step": 135887, "epoch": 3235} {"train_loss": -6.634788513183594, "global_step": 135888, "epoch": 3235} {"train_loss": -6.767756938934326, "global_step": 135889, "epoch": 3235} {"train_loss": -6.689789772033691, "global_step": 135890, "epoch": 3235} {"train_loss": -6.585451126098633, "global_step": 135891, "epoch": 3235} {"train_loss": -6.691549777984619, "global_step": 135892, "epoch": 3235} {"train_loss": -6.70670747756958, "global_step": 135893, "epoch": 3235} {"train_loss": -6.712961673736572, "global_step": 135894, "epoch": 3235} {"train_loss": -6.5990142822265625, "global_step": 135895, "epoch": 3235} {"train_loss": -6.830746650695801, "global_step": 135896, "epoch": 3235} {"train_loss": -6.66526985168457, "global_step": 135897, "epoch": 3235} {"train_loss": -6.571187973022461, "global_step": 135898, "epoch": 3235} {"train_loss": -6.777892112731934, "global_step": 135899, "epoch": 3235} {"train_loss": -6.668646812438965, "global_step": 135900, "epoch": 3235} {"train_loss": -6.642735481262207, "global_step": 135901, "epoch": 3235} {"train_loss": -6.6559271812438965, "global_step": 135902, "epoch": 3235} {"train_loss": -6.740614891052246, "global_step": 135903, "epoch": 3235} {"train_loss": -6.798121452331543, "global_step": 135904, "epoch": 3235} {"train_loss": -6.782001495361328, "global_step": 135905, "epoch": 3235} {"train_loss": -6.714559078216553, "global_step": 135906, "epoch": 3235} {"train_loss": -6.757211685180664, "global_step": 135907, "epoch": 3235} {"train_loss": -6.761312484741211, "global_step": 135908, "epoch": 3235} {"train_loss": -6.703178405761719, "global_step": 135909, "epoch": 3235} {"train_loss": -6.7420196533203125, "global_step": 135910, "epoch": 3235} {"train_loss": -6.7265794050125844, "global_step": 135911, "epoch": 3235, "val_loss": 67049.3046875} {"train_loss": -6.650951385498047, "global_step": 135912, "epoch": 3236} {"train_loss": -6.675267219543457, "global_step": 135913, "epoch": 3236} {"train_loss": -6.624823570251465, "global_step": 135914, "epoch": 3236} {"train_loss": -6.700515270233154, "global_step": 135915, "epoch": 3236} {"train_loss": -6.630775451660156, "global_step": 135916, "epoch": 3236} {"train_loss": -6.795350551605225, "global_step": 135917, "epoch": 3236} {"train_loss": -6.830161094665527, "global_step": 135918, "epoch": 3236} {"train_loss": -6.77154541015625, "global_step": 135919, "epoch": 3236} {"train_loss": -6.665741920471191, "global_step": 135920, "epoch": 3236} {"train_loss": -6.756363391876221, "global_step": 135921, "epoch": 3236} {"train_loss": -6.807782173156738, "global_step": 135922, "epoch": 3236} {"train_loss": -6.813486099243164, "global_step": 135923, "epoch": 3236} {"train_loss": -6.671463966369629, "global_step": 135924, "epoch": 3236} {"train_loss": -6.716461181640625, "global_step": 135925, "epoch": 3236} {"train_loss": -6.640568733215332, "global_step": 135926, "epoch": 3236} {"train_loss": -6.711301803588867, "global_step": 135927, "epoch": 3236} {"train_loss": -6.8001389503479, "global_step": 135928, "epoch": 3236} {"train_loss": -6.746157169342041, "global_step": 135929, "epoch": 3236} {"train_loss": -6.73345947265625, "global_step": 135930, "epoch": 3236} {"train_loss": -6.76578950881958, "global_step": 135931, "epoch": 3236} {"train_loss": -6.695174217224121, "global_step": 135932, "epoch": 3236} {"train_loss": -6.676907062530518, "global_step": 135933, "epoch": 3236} {"train_loss": -6.6217041015625, "global_step": 135934, "epoch": 3236} {"train_loss": -6.671056270599365, "global_step": 135935, "epoch": 3236} {"train_loss": -6.819851875305176, "global_step": 135936, "epoch": 3236} {"train_loss": -6.7410783767700195, "global_step": 135937, "epoch": 3236} {"train_loss": -6.65772008895874, "global_step": 135938, "epoch": 3236} {"train_loss": -6.761183261871338, "global_step": 135939, "epoch": 3236} {"train_loss": -6.687497138977051, "global_step": 135940, "epoch": 3236} {"train_loss": -6.5437703132629395, "global_step": 135941, "epoch": 3236} {"train_loss": -6.767703533172607, "global_step": 135942, "epoch": 3236} {"train_loss": -6.567019939422607, "global_step": 135943, "epoch": 3236} {"train_loss": -6.620800495147705, "global_step": 135944, "epoch": 3236} {"train_loss": -6.791134834289551, "global_step": 135945, "epoch": 3236} {"train_loss": -6.682612419128418, "global_step": 135946, "epoch": 3236} {"train_loss": -6.633315086364746, "global_step": 135947, "epoch": 3236} {"train_loss": -6.7253193855285645, "global_step": 135948, "epoch": 3236} {"train_loss": -6.7209930419921875, "global_step": 135949, "epoch": 3236} {"train_loss": -6.717659950256348, "global_step": 135950, "epoch": 3236} {"train_loss": -6.618285655975342, "global_step": 135951, "epoch": 3236} {"train_loss": -6.834957122802734, "global_step": 135952, "epoch": 3236} {"train_loss": -6.708856060391381, "global_step": 135953, "epoch": 3236, "val_loss": 66850.671875} {"train_loss": -6.610346794128418, "global_step": 135954, "epoch": 3237} {"train_loss": -6.730080604553223, "global_step": 135955, "epoch": 3237} {"train_loss": -6.741680145263672, "global_step": 135956, "epoch": 3237} {"train_loss": -6.790729522705078, "global_step": 135957, "epoch": 3237} {"train_loss": -6.7648515701293945, "global_step": 135958, "epoch": 3237} {"train_loss": -6.648780822753906, "global_step": 135959, "epoch": 3237} {"train_loss": -6.712573051452637, "global_step": 135960, "epoch": 3237} {"train_loss": -6.723374843597412, "global_step": 135961, "epoch": 3237} {"train_loss": -6.649789810180664, "global_step": 135962, "epoch": 3237} {"train_loss": -6.802246570587158, "global_step": 135963, "epoch": 3237} {"train_loss": -6.661956787109375, "global_step": 135964, "epoch": 3237} {"train_loss": -6.723440647125244, "global_step": 135965, "epoch": 3237} {"train_loss": -6.720388412475586, "global_step": 135966, "epoch": 3237} {"train_loss": -6.766059875488281, "global_step": 135967, "epoch": 3237} {"train_loss": -6.7138190269470215, "global_step": 135968, "epoch": 3237} {"train_loss": -6.756019115447998, "global_step": 135969, "epoch": 3237} {"train_loss": -6.65749979019165, "global_step": 135970, "epoch": 3237} {"train_loss": -6.728870391845703, "global_step": 135971, "epoch": 3237} {"train_loss": -6.737242698669434, "global_step": 135972, "epoch": 3237} {"train_loss": -6.508928298950195, "global_step": 135973, "epoch": 3237} {"train_loss": -6.7705583572387695, "global_step": 135974, "epoch": 3237} {"train_loss": -6.740632057189941, "global_step": 135975, "epoch": 3237} {"train_loss": -6.760082244873047, "global_step": 135976, "epoch": 3237} {"train_loss": -6.783041954040527, "global_step": 135977, "epoch": 3237} {"train_loss": -6.726987838745117, "global_step": 135978, "epoch": 3237} {"train_loss": -6.6648149490356445, "global_step": 135979, "epoch": 3237} {"train_loss": -6.783935546875, "global_step": 135980, "epoch": 3237} {"train_loss": -6.871608734130859, "global_step": 135981, "epoch": 3237} {"train_loss": -6.674746036529541, "global_step": 135982, "epoch": 3237} {"train_loss": -6.723827838897705, "global_step": 135983, "epoch": 3237} {"train_loss": -6.6882171630859375, "global_step": 135984, "epoch": 3237} {"train_loss": -6.624297142028809, "global_step": 135985, "epoch": 3237} {"train_loss": -6.769276142120361, "global_step": 135986, "epoch": 3237} {"train_loss": -6.813485622406006, "global_step": 135987, "epoch": 3237} {"train_loss": -6.698582649230957, "global_step": 135988, "epoch": 3237} {"train_loss": -6.75369930267334, "global_step": 135989, "epoch": 3237} {"train_loss": -6.697827339172363, "global_step": 135990, "epoch": 3237} {"train_loss": -6.722927570343018, "global_step": 135991, "epoch": 3237} {"train_loss": -6.820111274719238, "global_step": 135992, "epoch": 3237} {"train_loss": -6.805634021759033, "global_step": 135993, "epoch": 3237} {"train_loss": -6.615455627441406, "global_step": 135994, "epoch": 3237} {"train_loss": -6.727042890730358, "global_step": 135995, "epoch": 3237, "val_loss": 66922.765625} {"train_loss": -6.708826541900635, "global_step": 135996, "epoch": 3238} {"train_loss": -6.85500431060791, "global_step": 135997, "epoch": 3238} {"train_loss": -6.688969135284424, "global_step": 135998, "epoch": 3238} {"train_loss": -6.7950568199157715, "global_step": 135999, "epoch": 3238} {"train_loss": -6.6572136878967285, "global_step": 136000, "epoch": 3238} {"train_loss": -6.760097980499268, "global_step": 136001, "epoch": 3238} {"train_loss": -6.717165946960449, "global_step": 136002, "epoch": 3238} {"train_loss": -6.668410301208496, "global_step": 136003, "epoch": 3238} {"train_loss": -6.840999603271484, "global_step": 136004, "epoch": 3238} {"train_loss": -6.736635208129883, "global_step": 136005, "epoch": 3238} {"train_loss": -6.6827497482299805, "global_step": 136006, "epoch": 3238} {"train_loss": -6.786375999450684, "global_step": 136007, "epoch": 3238} {"train_loss": -6.754334449768066, "global_step": 136008, "epoch": 3238} {"train_loss": -6.741239070892334, "global_step": 136009, "epoch": 3238} {"train_loss": -6.802740573883057, "global_step": 136010, "epoch": 3238} {"train_loss": -6.728336334228516, "global_step": 136011, "epoch": 3238} {"train_loss": -6.741969585418701, "global_step": 136012, "epoch": 3238} {"train_loss": -6.779111385345459, "global_step": 136013, "epoch": 3238} {"train_loss": -6.692686557769775, "global_step": 136014, "epoch": 3238} {"train_loss": -6.579600811004639, "global_step": 136015, "epoch": 3238} {"train_loss": -6.753811836242676, "global_step": 136016, "epoch": 3238} {"train_loss": -6.821950912475586, "global_step": 136017, "epoch": 3238} {"train_loss": -6.726881504058838, "global_step": 136018, "epoch": 3238} {"train_loss": -6.7700066566467285, "global_step": 136019, "epoch": 3238} {"train_loss": -6.69064998626709, "global_step": 136020, "epoch": 3238} {"train_loss": -6.822273254394531, "global_step": 136021, "epoch": 3238} {"train_loss": -6.780487537384033, "global_step": 136022, "epoch": 3238} {"train_loss": -6.738663673400879, "global_step": 136023, "epoch": 3238} {"train_loss": -6.7135748863220215, "global_step": 136024, "epoch": 3238} {"train_loss": -6.616119384765625, "global_step": 136025, "epoch": 3238} {"train_loss": -6.603399276733398, "global_step": 136026, "epoch": 3238} {"train_loss": -6.645578384399414, "global_step": 136027, "epoch": 3238} {"train_loss": -6.778929710388184, "global_step": 136028, "epoch": 3238} {"train_loss": -6.642862319946289, "global_step": 136029, "epoch": 3238} {"train_loss": -6.797058582305908, "global_step": 136030, "epoch": 3238} {"train_loss": -6.716917991638184, "global_step": 136031, "epoch": 3238} {"train_loss": -6.734488487243652, "global_step": 136032, "epoch": 3238} {"train_loss": -6.777914047241211, "global_step": 136033, "epoch": 3238} {"train_loss": -6.70421838760376, "global_step": 136034, "epoch": 3238} {"train_loss": -6.76666259765625, "global_step": 136035, "epoch": 3238} {"train_loss": -6.712648391723633, "global_step": 136036, "epoch": 3238} {"train_loss": -6.730756873176212, "global_step": 136037, "epoch": 3238, "val_loss": 67087.3125} {"train_loss": -6.559370994567871, "global_step": 136038, "epoch": 3239} {"train_loss": -6.659895896911621, "global_step": 136039, "epoch": 3239} {"train_loss": -6.659769535064697, "global_step": 136040, "epoch": 3239} {"train_loss": -6.655519485473633, "global_step": 136041, "epoch": 3239} {"train_loss": -6.760052680969238, "global_step": 136042, "epoch": 3239} {"train_loss": -6.6563262939453125, "global_step": 136043, "epoch": 3239} {"train_loss": -6.8176774978637695, "global_step": 136044, "epoch": 3239} {"train_loss": -6.678277015686035, "global_step": 136045, "epoch": 3239} {"train_loss": -6.784147262573242, "global_step": 136046, "epoch": 3239} {"train_loss": -6.652673244476318, "global_step": 136047, "epoch": 3239} {"train_loss": -6.724428653717041, "global_step": 136048, "epoch": 3239} {"train_loss": -6.755252838134766, "global_step": 136049, "epoch": 3239} {"train_loss": -6.54836368560791, "global_step": 136050, "epoch": 3239} {"train_loss": -6.645266532897949, "global_step": 136051, "epoch": 3239} {"train_loss": -6.708240509033203, "global_step": 136052, "epoch": 3239} {"train_loss": -6.607089042663574, "global_step": 136053, "epoch": 3239} {"train_loss": -6.7342939376831055, "global_step": 136054, "epoch": 3239} {"train_loss": -6.786008834838867, "global_step": 136055, "epoch": 3239} {"train_loss": -6.7248640060424805, "global_step": 136056, "epoch": 3239} {"train_loss": -6.62216854095459, "global_step": 136057, "epoch": 3239} {"train_loss": -6.66666316986084, "global_step": 136058, "epoch": 3239} {"train_loss": -6.669528484344482, "global_step": 136059, "epoch": 3239} {"train_loss": -6.505781650543213, "global_step": 136060, "epoch": 3239} {"train_loss": -6.75526237487793, "global_step": 136061, "epoch": 3239} {"train_loss": -6.515848159790039, "global_step": 136062, "epoch": 3239} {"train_loss": -6.608412742614746, "global_step": 136063, "epoch": 3239} {"train_loss": -6.734313488006592, "global_step": 136064, "epoch": 3239} {"train_loss": -6.579667568206787, "global_step": 136065, "epoch": 3239} {"train_loss": -6.774411201477051, "global_step": 136066, "epoch": 3239} {"train_loss": -6.570293426513672, "global_step": 136067, "epoch": 3239} {"train_loss": -6.607938766479492, "global_step": 136068, "epoch": 3239} {"train_loss": -6.830872535705566, "global_step": 136069, "epoch": 3239} {"train_loss": -6.794313430786133, "global_step": 136070, "epoch": 3239} {"train_loss": -6.701467514038086, "global_step": 136071, "epoch": 3239} {"train_loss": -6.722895622253418, "global_step": 136072, "epoch": 3239} {"train_loss": -6.700429916381836, "global_step": 136073, "epoch": 3239} {"train_loss": -6.612492084503174, "global_step": 136074, "epoch": 3239} {"train_loss": -6.748898029327393, "global_step": 136075, "epoch": 3239} {"train_loss": -6.623532295227051, "global_step": 136076, "epoch": 3239} {"train_loss": -6.689326763153076, "global_step": 136077, "epoch": 3239} {"train_loss": -6.698227882385254, "global_step": 136078, "epoch": 3239} {"train_loss": -6.679326341265724, "global_step": 136079, "epoch": 3239, "val_loss": 66841.140625} {"train_loss": -6.659731864929199, "global_step": 136080, "epoch": 3240} {"train_loss": -6.716081619262695, "global_step": 136081, "epoch": 3240} {"train_loss": -6.714102745056152, "global_step": 136082, "epoch": 3240} {"train_loss": -6.744400978088379, "global_step": 136083, "epoch": 3240} {"train_loss": -6.743717193603516, "global_step": 136084, "epoch": 3240} {"train_loss": -6.6539225578308105, "global_step": 136085, "epoch": 3240} {"train_loss": -6.746042728424072, "global_step": 136086, "epoch": 3240} {"train_loss": -6.625436782836914, "global_step": 136087, "epoch": 3240} {"train_loss": -6.706308364868164, "global_step": 136088, "epoch": 3240} {"train_loss": -6.640284538269043, "global_step": 136089, "epoch": 3240} {"train_loss": -6.667339324951172, "global_step": 136090, "epoch": 3240} {"train_loss": -6.606205940246582, "global_step": 136091, "epoch": 3240} {"train_loss": -6.610519886016846, "global_step": 136092, "epoch": 3240} {"train_loss": -6.757152557373047, "global_step": 136093, "epoch": 3240} {"train_loss": -6.745843887329102, "global_step": 136094, "epoch": 3240} {"train_loss": -6.806787490844727, "global_step": 136095, "epoch": 3240} {"train_loss": -6.63670015335083, "global_step": 136096, "epoch": 3240} {"train_loss": -6.723670482635498, "global_step": 136097, "epoch": 3240} {"train_loss": -6.750704288482666, "global_step": 136098, "epoch": 3240} {"train_loss": -6.8695526123046875, "global_step": 136099, "epoch": 3240} {"train_loss": -6.81074333190918, "global_step": 136100, "epoch": 3240} {"train_loss": -6.781759262084961, "global_step": 136101, "epoch": 3240} {"train_loss": -6.760868072509766, "global_step": 136102, "epoch": 3240} {"train_loss": -6.733593940734863, "global_step": 136103, "epoch": 3240} {"train_loss": -6.809721946716309, "global_step": 136104, "epoch": 3240} {"train_loss": -6.796298980712891, "global_step": 136105, "epoch": 3240} {"train_loss": -6.78316593170166, "global_step": 136106, "epoch": 3240} {"train_loss": -6.731450080871582, "global_step": 136107, "epoch": 3240} {"train_loss": -6.743457794189453, "global_step": 136108, "epoch": 3240} {"train_loss": -6.838738918304443, "global_step": 136109, "epoch": 3240} {"train_loss": -6.77532434463501, "global_step": 136110, "epoch": 3240} {"train_loss": -6.662103652954102, "global_step": 136111, "epoch": 3240} {"train_loss": -6.837832927703857, "global_step": 136112, "epoch": 3240} {"train_loss": -6.7817702293396, "global_step": 136113, "epoch": 3240} {"train_loss": -6.696718215942383, "global_step": 136114, "epoch": 3240} {"train_loss": -6.747315406799316, "global_step": 136115, "epoch": 3240} {"train_loss": -6.760541915893555, "global_step": 136116, "epoch": 3240} {"train_loss": -6.762510776519775, "global_step": 136117, "epoch": 3240} {"train_loss": -6.662761688232422, "global_step": 136118, "epoch": 3240} {"train_loss": -6.758193492889404, "global_step": 136119, "epoch": 3240} {"train_loss": -6.675315856933594, "global_step": 136120, "epoch": 3240} {"train_loss": -6.734019177300589, "global_step": 136121, "epoch": 3240, "val_loss": 67012.1640625} {"train_loss": -6.623658180236816, "global_step": 136122, "epoch": 3241} {"train_loss": -6.648974418640137, "global_step": 136123, "epoch": 3241} {"train_loss": -6.727652072906494, "global_step": 136124, "epoch": 3241} {"train_loss": -6.596526145935059, "global_step": 136125, "epoch": 3241} {"train_loss": -6.692538738250732, "global_step": 136126, "epoch": 3241} {"train_loss": -6.759232521057129, "global_step": 136127, "epoch": 3241} {"train_loss": -6.708235740661621, "global_step": 136128, "epoch": 3241} {"train_loss": -6.707120895385742, "global_step": 136129, "epoch": 3241} {"train_loss": -6.692523002624512, "global_step": 136130, "epoch": 3241} {"train_loss": -6.73780632019043, "global_step": 136131, "epoch": 3241} {"train_loss": -6.81518030166626, "global_step": 136132, "epoch": 3241} {"train_loss": -6.770744800567627, "global_step": 136133, "epoch": 3241} {"train_loss": -6.778298854827881, "global_step": 136134, "epoch": 3241} {"train_loss": -6.697478771209717, "global_step": 136135, "epoch": 3241} {"train_loss": -6.6366167068481445, "global_step": 136136, "epoch": 3241} {"train_loss": -6.778166770935059, "global_step": 136137, "epoch": 3241} {"train_loss": -6.660533905029297, "global_step": 136138, "epoch": 3241} {"train_loss": -6.859951496124268, "global_step": 136139, "epoch": 3241} {"train_loss": -6.717356204986572, "global_step": 136140, "epoch": 3241} {"train_loss": -6.815503120422363, "global_step": 136141, "epoch": 3241} {"train_loss": -6.764157295227051, "global_step": 136142, "epoch": 3241} {"train_loss": -6.8121538162231445, "global_step": 136143, "epoch": 3241} {"train_loss": -6.773268699645996, "global_step": 136144, "epoch": 3241} {"train_loss": -6.65608024597168, "global_step": 136145, "epoch": 3241} {"train_loss": -6.748047828674316, "global_step": 136146, "epoch": 3241} {"train_loss": -6.684947490692139, "global_step": 136147, "epoch": 3241} {"train_loss": -6.762679576873779, "global_step": 136148, "epoch": 3241} {"train_loss": -6.7587690353393555, "global_step": 136149, "epoch": 3241} {"train_loss": -6.7662553787231445, "global_step": 136150, "epoch": 3241} {"train_loss": -6.729957580566406, "global_step": 136151, "epoch": 3241} {"train_loss": -6.883796691894531, "global_step": 136152, "epoch": 3241} {"train_loss": -6.819001197814941, "global_step": 136153, "epoch": 3241} {"train_loss": -6.678622245788574, "global_step": 136154, "epoch": 3241} {"train_loss": -6.565247058868408, "global_step": 136155, "epoch": 3241} {"train_loss": -6.720789432525635, "global_step": 136156, "epoch": 3241} {"train_loss": -6.692688941955566, "global_step": 136157, "epoch": 3241} {"train_loss": -6.8023457527160645, "global_step": 136158, "epoch": 3241} {"train_loss": -6.795295715332031, "global_step": 136159, "epoch": 3241} {"train_loss": -6.759644985198975, "global_step": 136160, "epoch": 3241} {"train_loss": -6.796163558959961, "global_step": 136161, "epoch": 3241} {"train_loss": -6.630146026611328, "global_step": 136162, "epoch": 3241} {"train_loss": -6.732225474857149, "global_step": 136163, "epoch": 3241, "val_loss": 66864.21875} {"train_loss": -6.89255952835083, "global_step": 136164, "epoch": 3242} {"train_loss": -6.659017562866211, "global_step": 136165, "epoch": 3242} {"train_loss": -6.721161365509033, "global_step": 136166, "epoch": 3242} {"train_loss": -6.769426345825195, "global_step": 136167, "epoch": 3242} {"train_loss": -6.69630241394043, "global_step": 136168, "epoch": 3242} {"train_loss": -6.621973037719727, "global_step": 136169, "epoch": 3242} {"train_loss": -6.790005207061768, "global_step": 136170, "epoch": 3242} {"train_loss": -6.659664154052734, "global_step": 136171, "epoch": 3242} {"train_loss": -6.870766639709473, "global_step": 136172, "epoch": 3242} {"train_loss": -6.686201095581055, "global_step": 136173, "epoch": 3242} {"train_loss": -6.6728010177612305, "global_step": 136174, "epoch": 3242} {"train_loss": -6.711698532104492, "global_step": 136175, "epoch": 3242} {"train_loss": -6.740160942077637, "global_step": 136176, "epoch": 3242} {"train_loss": -6.794821739196777, "global_step": 136177, "epoch": 3242} {"train_loss": -6.663296699523926, "global_step": 136178, "epoch": 3242} {"train_loss": -6.632682800292969, "global_step": 136179, "epoch": 3242} {"train_loss": -6.659984588623047, "global_step": 136180, "epoch": 3242} {"train_loss": -6.583449840545654, "global_step": 136181, "epoch": 3242} {"train_loss": -6.7007832527160645, "global_step": 136182, "epoch": 3242} {"train_loss": -6.632003307342529, "global_step": 136183, "epoch": 3242} {"train_loss": -6.560179710388184, "global_step": 136184, "epoch": 3242} {"train_loss": -6.610182762145996, "global_step": 136185, "epoch": 3242} {"train_loss": -6.656505584716797, "global_step": 136186, "epoch": 3242} {"train_loss": -6.644214630126953, "global_step": 136187, "epoch": 3242} {"train_loss": -6.737461090087891, "global_step": 136188, "epoch": 3242} {"train_loss": -6.578788757324219, "global_step": 136189, "epoch": 3242} {"train_loss": -6.610605239868164, "global_step": 136190, "epoch": 3242} {"train_loss": -6.599206924438477, "global_step": 136191, "epoch": 3242} {"train_loss": -6.588171482086182, "global_step": 136192, "epoch": 3242} {"train_loss": -6.629949569702148, "global_step": 136193, "epoch": 3242} {"train_loss": -6.591015815734863, "global_step": 136194, "epoch": 3242} {"train_loss": -6.705962657928467, "global_step": 136195, "epoch": 3242} {"train_loss": -6.502955436706543, "global_step": 136196, "epoch": 3242} {"train_loss": -6.70259952545166, "global_step": 136197, "epoch": 3242} {"train_loss": -6.630618095397949, "global_step": 136198, "epoch": 3242} {"train_loss": -6.5057783126831055, "global_step": 136199, "epoch": 3242} {"train_loss": -6.613658905029297, "global_step": 136200, "epoch": 3242} {"train_loss": -6.695504665374756, "global_step": 136201, "epoch": 3242} {"train_loss": -6.731535911560059, "global_step": 136202, "epoch": 3242} {"train_loss": -6.74414587020874, "global_step": 136203, "epoch": 3242} {"train_loss": -6.758924961090088, "global_step": 136204, "epoch": 3242} {"train_loss": -6.67515290351141, "global_step": 136205, "epoch": 3242, "val_loss": 66930.0390625} {"train_loss": -6.685697555541992, "global_step": 136206, "epoch": 3243} {"train_loss": -6.765488147735596, "global_step": 136207, "epoch": 3243} {"train_loss": -6.850297927856445, "global_step": 136208, "epoch": 3243} {"train_loss": -6.759747505187988, "global_step": 136209, "epoch": 3243} {"train_loss": -6.817586898803711, "global_step": 136210, "epoch": 3243} {"train_loss": -6.669220924377441, "global_step": 136211, "epoch": 3243} {"train_loss": -6.739025115966797, "global_step": 136212, "epoch": 3243} {"train_loss": -6.734623908996582, "global_step": 136213, "epoch": 3243} {"train_loss": -6.694378852844238, "global_step": 136214, "epoch": 3243} {"train_loss": -6.75580358505249, "global_step": 136215, "epoch": 3243} {"train_loss": -6.750329971313477, "global_step": 136216, "epoch": 3243} {"train_loss": -6.748072624206543, "global_step": 136217, "epoch": 3243} {"train_loss": -6.789246082305908, "global_step": 136218, "epoch": 3243} {"train_loss": -6.733884811401367, "global_step": 136219, "epoch": 3243} {"train_loss": -6.614827632904053, "global_step": 136220, "epoch": 3243} {"train_loss": -6.805116653442383, "global_step": 136221, "epoch": 3243} {"train_loss": -6.588287830352783, "global_step": 136222, "epoch": 3243} {"train_loss": -6.706483840942383, "global_step": 136223, "epoch": 3243} {"train_loss": -6.648238182067871, "global_step": 136224, "epoch": 3243} {"train_loss": -6.700488090515137, "global_step": 136225, "epoch": 3243} {"train_loss": -6.69720458984375, "global_step": 136226, "epoch": 3243} {"train_loss": -6.795702934265137, "global_step": 136227, "epoch": 3243} {"train_loss": -6.766206741333008, "global_step": 136228, "epoch": 3243} {"train_loss": -6.7475690841674805, "global_step": 136229, "epoch": 3243} {"train_loss": -6.554531097412109, "global_step": 136230, "epoch": 3243} {"train_loss": -6.740401268005371, "global_step": 136231, "epoch": 3243} {"train_loss": -6.752090930938721, "global_step": 136232, "epoch": 3243} {"train_loss": -6.633367538452148, "global_step": 136233, "epoch": 3243} {"train_loss": -6.763792037963867, "global_step": 136234, "epoch": 3243} {"train_loss": -6.677541255950928, "global_step": 136235, "epoch": 3243} {"train_loss": -6.73701810836792, "global_step": 136236, "epoch": 3243} {"train_loss": -6.546298980712891, "global_step": 136237, "epoch": 3243} {"train_loss": -6.725414276123047, "global_step": 136238, "epoch": 3243} {"train_loss": -6.720751762390137, "global_step": 136239, "epoch": 3243} {"train_loss": -6.645242214202881, "global_step": 136240, "epoch": 3243} {"train_loss": -6.685670852661133, "global_step": 136241, "epoch": 3243} {"train_loss": -6.63460636138916, "global_step": 136242, "epoch": 3243} {"train_loss": -6.733036994934082, "global_step": 136243, "epoch": 3243} {"train_loss": -6.484179496765137, "global_step": 136244, "epoch": 3243} {"train_loss": -6.748353958129883, "global_step": 136245, "epoch": 3243} {"train_loss": -6.753870010375977, "global_step": 136246, "epoch": 3243} {"train_loss": -6.708002113160633, "global_step": 136247, "epoch": 3243, "val_loss": 66789.140625} {"train_loss": -6.8231940269470215, "global_step": 136248, "epoch": 3244} {"train_loss": -6.601757049560547, "global_step": 136249, "epoch": 3244} {"train_loss": -6.722481727600098, "global_step": 136250, "epoch": 3244} {"train_loss": -6.733939170837402, "global_step": 136251, "epoch": 3244} {"train_loss": -6.525882720947266, "global_step": 136252, "epoch": 3244} {"train_loss": -6.7010087966918945, "global_step": 136253, "epoch": 3244} {"train_loss": -6.654952049255371, "global_step": 136254, "epoch": 3244} {"train_loss": -6.656720161437988, "global_step": 136255, "epoch": 3244} {"train_loss": -6.778560638427734, "global_step": 136256, "epoch": 3244} {"train_loss": -6.8130693435668945, "global_step": 136257, "epoch": 3244} {"train_loss": -6.714216709136963, "global_step": 136258, "epoch": 3244} {"train_loss": -6.7550835609436035, "global_step": 136259, "epoch": 3244} {"train_loss": -6.614136695861816, "global_step": 136260, "epoch": 3244} {"train_loss": -6.799063205718994, "global_step": 136261, "epoch": 3244} {"train_loss": -6.692863464355469, "global_step": 136262, "epoch": 3244} {"train_loss": -6.748612403869629, "global_step": 136263, "epoch": 3244} {"train_loss": -6.690314292907715, "global_step": 136264, "epoch": 3244} {"train_loss": -6.580848693847656, "global_step": 136265, "epoch": 3244} {"train_loss": -6.773906707763672, "global_step": 136266, "epoch": 3244} {"train_loss": -6.761713027954102, "global_step": 136267, "epoch": 3244} {"train_loss": -6.674622058868408, "global_step": 136268, "epoch": 3244} {"train_loss": -6.871555328369141, "global_step": 136269, "epoch": 3244} {"train_loss": -6.841965198516846, "global_step": 136270, "epoch": 3244} {"train_loss": -6.751333236694336, "global_step": 136271, "epoch": 3244} {"train_loss": -6.702200412750244, "global_step": 136272, "epoch": 3244} {"train_loss": -6.758261680603027, "global_step": 136273, "epoch": 3244} {"train_loss": -6.797640323638916, "global_step": 136274, "epoch": 3244} {"train_loss": -6.705803871154785, "global_step": 136275, "epoch": 3244} {"train_loss": -6.823836326599121, "global_step": 136276, "epoch": 3244} {"train_loss": -6.833736896514893, "global_step": 136277, "epoch": 3244} {"train_loss": -6.862739562988281, "global_step": 136278, "epoch": 3244} {"train_loss": -6.813182830810547, "global_step": 136279, "epoch": 3244} {"train_loss": -6.7118377685546875, "global_step": 136280, "epoch": 3244} {"train_loss": -6.709170341491699, "global_step": 136281, "epoch": 3244} {"train_loss": -6.804955005645752, "global_step": 136282, "epoch": 3244} {"train_loss": -6.698367118835449, "global_step": 136283, "epoch": 3244} {"train_loss": -6.71412992477417, "global_step": 136284, "epoch": 3244} {"train_loss": -6.727136611938477, "global_step": 136285, "epoch": 3244} {"train_loss": -6.7370710372924805, "global_step": 136286, "epoch": 3244} {"train_loss": -6.84348201751709, "global_step": 136287, "epoch": 3244} {"train_loss": -6.803936958312988, "global_step": 136288, "epoch": 3244} {"train_loss": -6.739936601547968, "global_step": 136289, "epoch": 3244, "val_loss": 66968.984375} {"train_loss": -6.857665061950684, "global_step": 136290, "epoch": 3245} {"train_loss": -6.782135009765625, "global_step": 136291, "epoch": 3245} {"train_loss": -6.774391174316406, "global_step": 136292, "epoch": 3245} {"train_loss": -6.730640888214111, "global_step": 136293, "epoch": 3245} {"train_loss": -6.75604248046875, "global_step": 136294, "epoch": 3245} {"train_loss": -6.851862907409668, "global_step": 136295, "epoch": 3245} {"train_loss": -6.802900314331055, "global_step": 136296, "epoch": 3245} {"train_loss": -6.925407409667969, "global_step": 136297, "epoch": 3245} {"train_loss": -6.841922760009766, "global_step": 136298, "epoch": 3245} {"train_loss": -6.785185813903809, "global_step": 136299, "epoch": 3245} {"train_loss": -6.682450294494629, "global_step": 136300, "epoch": 3245} {"train_loss": -6.829654693603516, "global_step": 136301, "epoch": 3245} {"train_loss": -6.754441738128662, "global_step": 136302, "epoch": 3245} {"train_loss": -6.752784252166748, "global_step": 136303, "epoch": 3245} {"train_loss": -6.832348346710205, "global_step": 136304, "epoch": 3245} {"train_loss": -6.7197585105896, "global_step": 136305, "epoch": 3245} {"train_loss": -6.735586166381836, "global_step": 136306, "epoch": 3245} {"train_loss": -6.72996711730957, "global_step": 136307, "epoch": 3245} {"train_loss": -6.750814914703369, "global_step": 136308, "epoch": 3245} {"train_loss": -6.639391899108887, "global_step": 136309, "epoch": 3245} {"train_loss": -6.724762439727783, "global_step": 136310, "epoch": 3245} {"train_loss": -6.802489280700684, "global_step": 136311, "epoch": 3245} {"train_loss": -6.619490623474121, "global_step": 136312, "epoch": 3245} {"train_loss": -6.75689697265625, "global_step": 136313, "epoch": 3245} {"train_loss": -6.713882923126221, "global_step": 136314, "epoch": 3245} {"train_loss": -6.696948528289795, "global_step": 136315, "epoch": 3245} {"train_loss": -6.710498809814453, "global_step": 136316, "epoch": 3245} {"train_loss": -6.780313491821289, "global_step": 136317, "epoch": 3245} {"train_loss": -6.735808372497559, "global_step": 136318, "epoch": 3245} {"train_loss": -6.693402290344238, "global_step": 136319, "epoch": 3245} {"train_loss": -6.619208335876465, "global_step": 136320, "epoch": 3245} {"train_loss": -6.680145263671875, "global_step": 136321, "epoch": 3245} {"train_loss": -6.700333595275879, "global_step": 136322, "epoch": 3245} {"train_loss": -6.60024881362915, "global_step": 136323, "epoch": 3245} {"train_loss": -6.668396949768066, "global_step": 136324, "epoch": 3245} {"train_loss": -6.668470859527588, "global_step": 136325, "epoch": 3245} {"train_loss": -6.785733222961426, "global_step": 136326, "epoch": 3245} {"train_loss": -6.737231254577637, "global_step": 136327, "epoch": 3245} {"train_loss": -6.75379753112793, "global_step": 136328, "epoch": 3245} {"train_loss": -6.72787618637085, "global_step": 136329, "epoch": 3245} {"train_loss": -6.722576141357422, "global_step": 136330, "epoch": 3245} {"train_loss": -6.744195926757086, "global_step": 136331, "epoch": 3245, "val_loss": 66920.390625} {"train_loss": -6.761462211608887, "global_step": 136332, "epoch": 3246} {"train_loss": -6.798396110534668, "global_step": 136333, "epoch": 3246} {"train_loss": -6.712327003479004, "global_step": 136334, "epoch": 3246} {"train_loss": -6.727132320404053, "global_step": 136335, "epoch": 3246} {"train_loss": -6.656059265136719, "global_step": 136336, "epoch": 3246} {"train_loss": -6.791511535644531, "global_step": 136337, "epoch": 3246} {"train_loss": -6.721590042114258, "global_step": 136338, "epoch": 3246} {"train_loss": -6.696173191070557, "global_step": 136339, "epoch": 3246} {"train_loss": -6.78329610824585, "global_step": 136340, "epoch": 3246} {"train_loss": -6.656055927276611, "global_step": 136341, "epoch": 3246} {"train_loss": -6.755161285400391, "global_step": 136342, "epoch": 3246} {"train_loss": -6.690178394317627, "global_step": 136343, "epoch": 3246} {"train_loss": -6.691139221191406, "global_step": 136344, "epoch": 3246} {"train_loss": -6.731961250305176, "global_step": 136345, "epoch": 3246} {"train_loss": -6.593466758728027, "global_step": 136346, "epoch": 3246} {"train_loss": -6.751151084899902, "global_step": 136347, "epoch": 3246} {"train_loss": -6.7701616287231445, "global_step": 136348, "epoch": 3246} {"train_loss": -6.69616174697876, "global_step": 136349, "epoch": 3246} {"train_loss": -6.878235340118408, "global_step": 136350, "epoch": 3246} {"train_loss": -6.675558090209961, "global_step": 136351, "epoch": 3246} {"train_loss": -6.771407127380371, "global_step": 136352, "epoch": 3246} {"train_loss": -6.803045272827148, "global_step": 136353, "epoch": 3246} {"train_loss": -6.820600509643555, "global_step": 136354, "epoch": 3246} {"train_loss": -6.7664361000061035, "global_step": 136355, "epoch": 3246} {"train_loss": -6.77974796295166, "global_step": 136356, "epoch": 3246} {"train_loss": -6.685171127319336, "global_step": 136357, "epoch": 3246} {"train_loss": -6.783376693725586, "global_step": 136358, "epoch": 3246} {"train_loss": -6.755786895751953, "global_step": 136359, "epoch": 3246} {"train_loss": -6.783278465270996, "global_step": 136360, "epoch": 3246} {"train_loss": -6.809920787811279, "global_step": 136361, "epoch": 3246} {"train_loss": -6.71142053604126, "global_step": 136362, "epoch": 3246} {"train_loss": -6.730101585388184, "global_step": 136363, "epoch": 3246} {"train_loss": -6.859541893005371, "global_step": 136364, "epoch": 3246} {"train_loss": -6.754288673400879, "global_step": 136365, "epoch": 3246} {"train_loss": -6.822263240814209, "global_step": 136366, "epoch": 3246} {"train_loss": -6.9417524337768555, "global_step": 136367, "epoch": 3246} {"train_loss": -6.771495819091797, "global_step": 136368, "epoch": 3246} {"train_loss": -6.581742286682129, "global_step": 136369, "epoch": 3246} {"train_loss": -6.77603006362915, "global_step": 136370, "epoch": 3246} {"train_loss": -6.822456359863281, "global_step": 136371, "epoch": 3246} {"train_loss": -6.690276145935059, "global_step": 136372, "epoch": 3246} {"train_loss": -6.749860718136742, "global_step": 136373, "epoch": 3246, "val_loss": 67089.78125} {"train_loss": -6.835269927978516, "global_step": 136374, "epoch": 3247} {"train_loss": -6.66682243347168, "global_step": 136375, "epoch": 3247} {"train_loss": -6.621469497680664, "global_step": 136376, "epoch": 3247} {"train_loss": -6.7588605880737305, "global_step": 136377, "epoch": 3247} {"train_loss": -6.83149528503418, "global_step": 136378, "epoch": 3247} {"train_loss": -6.6818952560424805, "global_step": 136379, "epoch": 3247} {"train_loss": -6.673391819000244, "global_step": 136380, "epoch": 3247} {"train_loss": -6.680965900421143, "global_step": 136381, "epoch": 3247} {"train_loss": -6.748711109161377, "global_step": 136382, "epoch": 3247} {"train_loss": -6.70849084854126, "global_step": 136383, "epoch": 3247} {"train_loss": -6.627842903137207, "global_step": 136384, "epoch": 3247} {"train_loss": -6.823241233825684, "global_step": 136385, "epoch": 3247} {"train_loss": -6.671856880187988, "global_step": 136386, "epoch": 3247} {"train_loss": -6.7548370361328125, "global_step": 136387, "epoch": 3247} {"train_loss": -6.726878643035889, "global_step": 136388, "epoch": 3247} {"train_loss": -6.707263946533203, "global_step": 136389, "epoch": 3247} {"train_loss": -6.808543682098389, "global_step": 136390, "epoch": 3247} {"train_loss": -6.786545753479004, "global_step": 136391, "epoch": 3247} {"train_loss": -6.842795372009277, "global_step": 136392, "epoch": 3247} {"train_loss": -6.823957443237305, "global_step": 136393, "epoch": 3247} {"train_loss": -6.727416038513184, "global_step": 136394, "epoch": 3247} {"train_loss": -6.719011306762695, "global_step": 136395, "epoch": 3247} {"train_loss": -6.68565559387207, "global_step": 136396, "epoch": 3247} {"train_loss": -6.773989677429199, "global_step": 136397, "epoch": 3247} {"train_loss": -6.714251518249512, "global_step": 136398, "epoch": 3247} {"train_loss": -6.833043098449707, "global_step": 136399, "epoch": 3247} {"train_loss": -6.836174964904785, "global_step": 136400, "epoch": 3247} {"train_loss": -6.775125980377197, "global_step": 136401, "epoch": 3247} {"train_loss": -6.71843147277832, "global_step": 136402, "epoch": 3247} {"train_loss": -6.7775068283081055, "global_step": 136403, "epoch": 3247} {"train_loss": -6.757457733154297, "global_step": 136404, "epoch": 3247} {"train_loss": -6.730808734893799, "global_step": 136405, "epoch": 3247} {"train_loss": -6.724699020385742, "global_step": 136406, "epoch": 3247} {"train_loss": -6.783769607543945, "global_step": 136407, "epoch": 3247} {"train_loss": -6.782565116882324, "global_step": 136408, "epoch": 3247} {"train_loss": -6.703367710113525, "global_step": 136409, "epoch": 3247} {"train_loss": -6.641730308532715, "global_step": 136410, "epoch": 3247} {"train_loss": -6.729538917541504, "global_step": 136411, "epoch": 3247} {"train_loss": -6.657835960388184, "global_step": 136412, "epoch": 3247} {"train_loss": -6.539888381958008, "global_step": 136413, "epoch": 3247} {"train_loss": -6.734126567840576, "global_step": 136414, "epoch": 3247} {"train_loss": -6.733807211830502, "global_step": 136415, "epoch": 3247, "val_loss": 67038.375} {"train_loss": -6.705140113830566, "global_step": 136416, "epoch": 3248} {"train_loss": -6.839232921600342, "global_step": 136417, "epoch": 3248} {"train_loss": -6.462687969207764, "global_step": 136418, "epoch": 3248} {"train_loss": -6.6323113441467285, "global_step": 136419, "epoch": 3248} {"train_loss": -6.67951774597168, "global_step": 136420, "epoch": 3248} {"train_loss": -6.594506740570068, "global_step": 136421, "epoch": 3248} {"train_loss": -6.739304542541504, "global_step": 136422, "epoch": 3248} {"train_loss": -6.723997116088867, "global_step": 136423, "epoch": 3248} {"train_loss": -6.65059232711792, "global_step": 136424, "epoch": 3248} {"train_loss": -6.699033260345459, "global_step": 136425, "epoch": 3248} {"train_loss": -6.5308685302734375, "global_step": 136426, "epoch": 3248} {"train_loss": -6.787205696105957, "global_step": 136427, "epoch": 3248} {"train_loss": -6.69173002243042, "global_step": 136428, "epoch": 3248} {"train_loss": -6.717435836791992, "global_step": 136429, "epoch": 3248} {"train_loss": -6.709595203399658, "global_step": 136430, "epoch": 3248} {"train_loss": -6.718360900878906, "global_step": 136431, "epoch": 3248} {"train_loss": -6.729345321655273, "global_step": 136432, "epoch": 3248} {"train_loss": -6.681493759155273, "global_step": 136433, "epoch": 3248} {"train_loss": -6.579034328460693, "global_step": 136434, "epoch": 3248} {"train_loss": -6.842320919036865, "global_step": 136435, "epoch": 3248} {"train_loss": -6.595469951629639, "global_step": 136436, "epoch": 3248} {"train_loss": -6.656663417816162, "global_step": 136437, "epoch": 3248} {"train_loss": -6.715706825256348, "global_step": 136438, "epoch": 3248} {"train_loss": -6.763181686401367, "global_step": 136439, "epoch": 3248} {"train_loss": -6.752013206481934, "global_step": 136440, "epoch": 3248} {"train_loss": -6.699974060058594, "global_step": 136441, "epoch": 3248} {"train_loss": -6.643421173095703, "global_step": 136442, "epoch": 3248} {"train_loss": -6.681418418884277, "global_step": 136443, "epoch": 3248} {"train_loss": -6.813410758972168, "global_step": 136444, "epoch": 3248} {"train_loss": -6.745212554931641, "global_step": 136445, "epoch": 3248} {"train_loss": -6.651320457458496, "global_step": 136446, "epoch": 3248} {"train_loss": -6.715060234069824, "global_step": 136447, "epoch": 3248} {"train_loss": -6.634974002838135, "global_step": 136448, "epoch": 3248} {"train_loss": -6.446498870849609, "global_step": 136449, "epoch": 3248} {"train_loss": -6.5968475341796875, "global_step": 136450, "epoch": 3248} {"train_loss": -6.466460227966309, "global_step": 136451, "epoch": 3248} {"train_loss": -6.581569671630859, "global_step": 136452, "epoch": 3248} {"train_loss": -6.75662088394165, "global_step": 136453, "epoch": 3248} {"train_loss": -6.534255504608154, "global_step": 136454, "epoch": 3248} {"train_loss": -6.639023303985596, "global_step": 136455, "epoch": 3248} {"train_loss": -6.644245624542236, "global_step": 136456, "epoch": 3248} {"train_loss": -6.670841410046532, "global_step": 136457, "epoch": 3248, "val_loss": 67042.9609375} {"train_loss": -6.706148147583008, "global_step": 136458, "epoch": 3249} {"train_loss": -6.523717403411865, "global_step": 136459, "epoch": 3249} {"train_loss": -6.611806869506836, "global_step": 136460, "epoch": 3249} {"train_loss": -6.701424598693848, "global_step": 136461, "epoch": 3249} {"train_loss": -6.694104194641113, "global_step": 136462, "epoch": 3249} {"train_loss": -6.656045913696289, "global_step": 136463, "epoch": 3249} {"train_loss": -6.597867965698242, "global_step": 136464, "epoch": 3249} {"train_loss": -6.64077091217041, "global_step": 136465, "epoch": 3249} {"train_loss": -6.733035564422607, "global_step": 136466, "epoch": 3249} {"train_loss": -6.745113372802734, "global_step": 136467, "epoch": 3249} {"train_loss": -6.688284397125244, "global_step": 136468, "epoch": 3249} {"train_loss": -6.7953901290893555, "global_step": 136469, "epoch": 3249} {"train_loss": -6.6976518630981445, "global_step": 136470, "epoch": 3249} {"train_loss": -6.878284454345703, "global_step": 136471, "epoch": 3249} {"train_loss": -6.607011318206787, "global_step": 136472, "epoch": 3249} {"train_loss": -6.697551727294922, "global_step": 136473, "epoch": 3249} {"train_loss": -6.754349708557129, "global_step": 136474, "epoch": 3249} {"train_loss": -6.628286361694336, "global_step": 136475, "epoch": 3249} {"train_loss": -6.614419937133789, "global_step": 136476, "epoch": 3249} {"train_loss": -6.816990375518799, "global_step": 136477, "epoch": 3249} {"train_loss": -6.78111457824707, "global_step": 136478, "epoch": 3249} {"train_loss": -6.709383964538574, "global_step": 136479, "epoch": 3249} {"train_loss": -6.5884318351745605, "global_step": 136480, "epoch": 3249} {"train_loss": -6.615436553955078, "global_step": 136481, "epoch": 3249} {"train_loss": -6.716740131378174, "global_step": 136482, "epoch": 3249} {"train_loss": -6.778338432312012, "global_step": 136483, "epoch": 3249} {"train_loss": -6.6883087158203125, "global_step": 136484, "epoch": 3249} {"train_loss": -6.810441493988037, "global_step": 136485, "epoch": 3249} {"train_loss": -6.68715238571167, "global_step": 136486, "epoch": 3249} {"train_loss": -6.746063232421875, "global_step": 136487, "epoch": 3249} {"train_loss": -6.774523735046387, "global_step": 136488, "epoch": 3249} {"train_loss": -6.896322250366211, "global_step": 136489, "epoch": 3249} {"train_loss": -6.719242095947266, "global_step": 136490, "epoch": 3249} {"train_loss": -6.82059383392334, "global_step": 136491, "epoch": 3249} {"train_loss": -6.786287307739258, "global_step": 136492, "epoch": 3249} {"train_loss": -6.780492782592773, "global_step": 136493, "epoch": 3249} {"train_loss": -6.671350479125977, "global_step": 136494, "epoch": 3249} {"train_loss": -6.785869598388672, "global_step": 136495, "epoch": 3249} {"train_loss": -6.8163957595825195, "global_step": 136496, "epoch": 3249} {"train_loss": -6.859643936157227, "global_step": 136497, "epoch": 3249} {"train_loss": -6.71652889251709, "global_step": 136498, "epoch": 3249} {"train_loss": -6.721220584142776, "global_step": 136499, "epoch": 3249, "val_loss": 66877.7734375} {"train_loss": -6.739606857299805, "global_step": 136500, "epoch": 3250} {"train_loss": -6.759246826171875, "global_step": 136501, "epoch": 3250} {"train_loss": -6.764177322387695, "global_step": 136502, "epoch": 3250} {"train_loss": -6.749582290649414, "global_step": 136503, "epoch": 3250} {"train_loss": -6.702070236206055, "global_step": 136504, "epoch": 3250} {"train_loss": -6.673337459564209, "global_step": 136505, "epoch": 3250} {"train_loss": -6.646421432495117, "global_step": 136506, "epoch": 3250} {"train_loss": -6.613128185272217, "global_step": 136507, "epoch": 3250} {"train_loss": -6.703894138336182, "global_step": 136508, "epoch": 3250} {"train_loss": -6.737842559814453, "global_step": 136509, "epoch": 3250} {"train_loss": -6.663081645965576, "global_step": 136510, "epoch": 3250} {"train_loss": -6.751904010772705, "global_step": 136511, "epoch": 3250} {"train_loss": -6.735426902770996, "global_step": 136512, "epoch": 3250} {"train_loss": -6.738919734954834, "global_step": 136513, "epoch": 3250} {"train_loss": -6.689727783203125, "global_step": 136514, "epoch": 3250} {"train_loss": -6.641848087310791, "global_step": 136515, "epoch": 3250} {"train_loss": -6.697883129119873, "global_step": 136516, "epoch": 3250} {"train_loss": -6.70658016204834, "global_step": 136517, "epoch": 3250} {"train_loss": -6.866591453552246, "global_step": 136518, "epoch": 3250} {"train_loss": -6.634411334991455, "global_step": 136519, "epoch": 3250} {"train_loss": -6.8426055908203125, "global_step": 136520, "epoch": 3250} {"train_loss": -6.559059143066406, "global_step": 136521, "epoch": 3250} {"train_loss": -6.629779815673828, "global_step": 136522, "epoch": 3250} {"train_loss": -6.66319465637207, "global_step": 136523, "epoch": 3250} {"train_loss": -6.602892875671387, "global_step": 136524, "epoch": 3250} {"train_loss": -6.691554069519043, "global_step": 136525, "epoch": 3250} {"train_loss": -6.641282081604004, "global_step": 136526, "epoch": 3250} {"train_loss": -6.56287956237793, "global_step": 136527, "epoch": 3250} {"train_loss": -6.677277565002441, "global_step": 136528, "epoch": 3250} {"train_loss": -6.692568302154541, "global_step": 136529, "epoch": 3250} {"train_loss": -6.803727149963379, "global_step": 136530, "epoch": 3250} {"train_loss": -6.719616889953613, "global_step": 136531, "epoch": 3250} {"train_loss": -6.659320831298828, "global_step": 136532, "epoch": 3250} {"train_loss": -6.78754186630249, "global_step": 136533, "epoch": 3250} {"train_loss": -6.7475905418396, "global_step": 136534, "epoch": 3250} {"train_loss": -6.747359275817871, "global_step": 136535, "epoch": 3250} {"train_loss": -6.673863887786865, "global_step": 136536, "epoch": 3250} {"train_loss": -6.749444007873535, "global_step": 136537, "epoch": 3250} {"train_loss": -6.8282856941223145, "global_step": 136538, "epoch": 3250} {"train_loss": -6.799904823303223, "global_step": 136539, "epoch": 3250} {"train_loss": -6.667682647705078, "global_step": 136540, "epoch": 3250} {"train_loss": -6.7056342760721845, "global_step": 136541, "epoch": 3250, "train/sim_max_reward_0": 0.830490001195079, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.5493380410796648, "train/sim_max_reward_3": 0.8483430333756825, "train/sim_max_reward_4": 0.9436503964077378, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.22126029558674334, "test/sim_max_reward_4300001": 0.44263196917317676, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.9017636613158299, "test/sim_max_reward_4300004": 0.4221734148372167, "test/sim_max_reward_4300005": 0.9079289142496724, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.7568856135682511, "test/sim_max_reward_4300008": 0.9353261922563771, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.8404343035141439, "test/sim_max_reward_4300011": 0.47716066027437914, "test/sim_max_reward_4300012": 0.9831436166707681, "test/sim_max_reward_4300013": 0.8464588489758655, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.3222171885901337, "test/sim_max_reward_4300016": 0.9573488769994254, "test/sim_max_reward_4300017": 0.6262960704917931, "test/sim_max_reward_4300018": 0.9038874900130676, "test/sim_max_reward_4300019": 0.18549925869993386, "test/sim_max_reward_4300020": 0.03839764501076659, "test/sim_max_reward_4300021": 0.9294601801918263, "test/sim_max_reward_4300022": 0.8591739829947789, "test/sim_max_reward_4300023": 1.0, "test/sim_max_reward_4300024": 1.0, "test/sim_max_reward_4300025": 0.7301711927263627, "test/sim_max_reward_4300026": 0.18989727659030137, "test/sim_max_reward_4300027": 0.7001451122882064, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.0625755428052659, "test/sim_max_reward_4300031": 0.20733208888720597, "test/sim_max_reward_4300032": 0.7843941641141762, "test/sim_max_reward_4300033": 0.7132210002546857, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.9296201033412806, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.906515713863613, "test/sim_max_reward_4300038": 0.9861795641470182, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.9741770869592967, "test/sim_max_reward_4300041": 0.900151274863542, "test/sim_max_reward_4300042": 0.6340780922895151, "test/sim_max_reward_4300043": 0.1721736038948956, "test/sim_max_reward_4300044": 0.6280618312011131, "test/sim_max_reward_4300045": 0.9009935454356702, "test/sim_max_reward_4300046": 0.49760854768708745, "test/sim_max_reward_4300047": 0.18347504229899186, "test/sim_max_reward_4300048": 0.9124188891570708, "test/sim_max_reward_4300049": 0.208602222945192, "train/mean_score": 0.7274677052367252, "test/mean_score": 0.6195686838945623, "val_loss": 67145.734375} {"train_loss": -6.716561317443848, "global_step": 136542, "epoch": 3251} {"train_loss": -6.730825424194336, "global_step": 136543, "epoch": 3251} {"train_loss": -6.676807403564453, "global_step": 136544, "epoch": 3251} {"train_loss": -6.697763919830322, "global_step": 136545, "epoch": 3251} {"train_loss": -6.700277328491211, "global_step": 136546, "epoch": 3251} {"train_loss": -6.670392036437988, "global_step": 136547, "epoch": 3251} {"train_loss": -6.71202278137207, "global_step": 136548, "epoch": 3251} {"train_loss": -6.709480285644531, "global_step": 136549, "epoch": 3251} {"train_loss": -6.691723823547363, "global_step": 136550, "epoch": 3251} {"train_loss": -6.705756664276123, "global_step": 136551, "epoch": 3251} {"train_loss": -6.614027976989746, "global_step": 136552, "epoch": 3251} {"train_loss": -6.734036445617676, "global_step": 136553, "epoch": 3251} {"train_loss": -6.669671058654785, "global_step": 136554, "epoch": 3251} {"train_loss": -6.631773948669434, "global_step": 136555, "epoch": 3251} {"train_loss": -6.698423385620117, "global_step": 136556, "epoch": 3251} {"train_loss": -6.58358097076416, "global_step": 136557, "epoch": 3251} {"train_loss": -6.865557670593262, "global_step": 136558, "epoch": 3251} {"train_loss": -6.690218448638916, "global_step": 136559, "epoch": 3251} {"train_loss": -6.6824235916137695, "global_step": 136560, "epoch": 3251} {"train_loss": -6.608250141143799, "global_step": 136561, "epoch": 3251} {"train_loss": -6.718828201293945, "global_step": 136562, "epoch": 3251} {"train_loss": -6.758610725402832, "global_step": 136563, "epoch": 3251} {"train_loss": -6.808615684509277, "global_step": 136564, "epoch": 3251} {"train_loss": -6.806331634521484, "global_step": 136565, "epoch": 3251} {"train_loss": -6.670034408569336, "global_step": 136566, "epoch": 3251} {"train_loss": -6.779010772705078, "global_step": 136567, "epoch": 3251} {"train_loss": -6.730484962463379, "global_step": 136568, "epoch": 3251} {"train_loss": -6.5647172927856445, "global_step": 136569, "epoch": 3251} {"train_loss": -6.817016124725342, "global_step": 136570, "epoch": 3251} {"train_loss": -6.798972129821777, "global_step": 136571, "epoch": 3251} {"train_loss": -6.783135414123535, "global_step": 136572, "epoch": 3251} {"train_loss": -6.806778907775879, "global_step": 136573, "epoch": 3251} {"train_loss": -6.724766254425049, "global_step": 136574, "epoch": 3251} {"train_loss": -6.760300636291504, "global_step": 136575, "epoch": 3251} {"train_loss": -6.660069465637207, "global_step": 136576, "epoch": 3251} {"train_loss": -6.6929755210876465, "global_step": 136577, "epoch": 3251} {"train_loss": -6.5843963623046875, "global_step": 136578, "epoch": 3251} {"train_loss": -6.464712142944336, "global_step": 136579, "epoch": 3251} {"train_loss": -6.741544723510742, "global_step": 136580, "epoch": 3251} {"train_loss": -6.555567741394043, "global_step": 136581, "epoch": 3251} {"train_loss": -6.6968770027160645, "global_step": 136582, "epoch": 3251} {"train_loss": -6.69825275739034, "global_step": 136583, "epoch": 3251, "val_loss": 67330.921875} {"train_loss": -6.493622779846191, "global_step": 136584, "epoch": 3252} {"train_loss": -6.688494682312012, "global_step": 136585, "epoch": 3252} {"train_loss": -6.554224967956543, "global_step": 136586, "epoch": 3252} {"train_loss": -6.661708831787109, "global_step": 136587, "epoch": 3252} {"train_loss": -6.586404800415039, "global_step": 136588, "epoch": 3252} {"train_loss": -6.597802639007568, "global_step": 136589, "epoch": 3252} {"train_loss": -6.606645584106445, "global_step": 136590, "epoch": 3252} {"train_loss": -6.733016014099121, "global_step": 136591, "epoch": 3252} {"train_loss": -6.719900131225586, "global_step": 136592, "epoch": 3252} {"train_loss": -6.657746315002441, "global_step": 136593, "epoch": 3252} {"train_loss": -6.708834648132324, "global_step": 136594, "epoch": 3252} {"train_loss": -6.627134323120117, "global_step": 136595, "epoch": 3252} {"train_loss": -6.674066543579102, "global_step": 136596, "epoch": 3252} {"train_loss": -6.610983848571777, "global_step": 136597, "epoch": 3252} {"train_loss": -6.750555992126465, "global_step": 136598, "epoch": 3252} {"train_loss": -6.638722896575928, "global_step": 136599, "epoch": 3252} {"train_loss": -6.716618537902832, "global_step": 136600, "epoch": 3252} {"train_loss": -6.525419235229492, "global_step": 136601, "epoch": 3252} {"train_loss": -6.691503047943115, "global_step": 136602, "epoch": 3252} {"train_loss": -6.589204788208008, "global_step": 136603, "epoch": 3252} {"train_loss": -6.7268218994140625, "global_step": 136604, "epoch": 3252} {"train_loss": -6.614686012268066, "global_step": 136605, "epoch": 3252} {"train_loss": -6.695265769958496, "global_step": 136606, "epoch": 3252} {"train_loss": -6.716555595397949, "global_step": 136607, "epoch": 3252} {"train_loss": -6.6915483474731445, "global_step": 136608, "epoch": 3252} {"train_loss": -6.7022833824157715, "global_step": 136609, "epoch": 3252} {"train_loss": -6.672264099121094, "global_step": 136610, "epoch": 3252} {"train_loss": -6.7209038734436035, "global_step": 136611, "epoch": 3252} {"train_loss": -6.620900630950928, "global_step": 136612, "epoch": 3252} {"train_loss": -6.671848297119141, "global_step": 136613, "epoch": 3252} {"train_loss": -6.677427291870117, "global_step": 136614, "epoch": 3252} {"train_loss": -6.611669063568115, "global_step": 136615, "epoch": 3252} {"train_loss": -6.723328590393066, "global_step": 136616, "epoch": 3252} {"train_loss": -6.679240703582764, "global_step": 136617, "epoch": 3252} {"train_loss": -6.677078723907471, "global_step": 136618, "epoch": 3252} {"train_loss": -6.734898567199707, "global_step": 136619, "epoch": 3252} {"train_loss": -6.708719730377197, "global_step": 136620, "epoch": 3252} {"train_loss": -6.727303504943848, "global_step": 136621, "epoch": 3252} {"train_loss": -6.654008388519287, "global_step": 136622, "epoch": 3252} {"train_loss": -6.656913757324219, "global_step": 136623, "epoch": 3252} {"train_loss": -6.632800579071045, "global_step": 136624, "epoch": 3252} {"train_loss": -6.663887546176002, "global_step": 136625, "epoch": 3252, "val_loss": 66979.546875} {"train_loss": -6.652299880981445, "global_step": 136626, "epoch": 3253} {"train_loss": -6.755526065826416, "global_step": 136627, "epoch": 3253} {"train_loss": -6.674182891845703, "global_step": 136628, "epoch": 3253} {"train_loss": -6.732934951782227, "global_step": 136629, "epoch": 3253} {"train_loss": -6.711231708526611, "global_step": 136630, "epoch": 3253} {"train_loss": -6.740489959716797, "global_step": 136631, "epoch": 3253} {"train_loss": -6.6691083908081055, "global_step": 136632, "epoch": 3253} {"train_loss": -6.642611980438232, "global_step": 136633, "epoch": 3253} {"train_loss": -6.810759544372559, "global_step": 136634, "epoch": 3253} {"train_loss": -6.629088878631592, "global_step": 136635, "epoch": 3253} {"train_loss": -6.75609827041626, "global_step": 136636, "epoch": 3253} {"train_loss": -6.651938438415527, "global_step": 136637, "epoch": 3253} {"train_loss": -6.556686878204346, "global_step": 136638, "epoch": 3253} {"train_loss": -6.6891326904296875, "global_step": 136639, "epoch": 3253} {"train_loss": -6.7012763023376465, "global_step": 136640, "epoch": 3253} {"train_loss": -6.689269065856934, "global_step": 136641, "epoch": 3253} {"train_loss": -6.655549049377441, "global_step": 136642, "epoch": 3253} {"train_loss": -6.686790466308594, "global_step": 136643, "epoch": 3253} {"train_loss": -6.668377876281738, "global_step": 136644, "epoch": 3253} {"train_loss": -6.816577434539795, "global_step": 136645, "epoch": 3253} {"train_loss": -6.66990327835083, "global_step": 136646, "epoch": 3253} {"train_loss": -6.744847774505615, "global_step": 136647, "epoch": 3253} {"train_loss": -6.729099273681641, "global_step": 136648, "epoch": 3253} {"train_loss": -6.78868293762207, "global_step": 136649, "epoch": 3253} {"train_loss": -6.750586032867432, "global_step": 136650, "epoch": 3253} {"train_loss": -6.788416862487793, "global_step": 136651, "epoch": 3253} {"train_loss": -6.7926177978515625, "global_step": 136652, "epoch": 3253} {"train_loss": -6.749418258666992, "global_step": 136653, "epoch": 3253} {"train_loss": -6.668251991271973, "global_step": 136654, "epoch": 3253} {"train_loss": -6.709810256958008, "global_step": 136655, "epoch": 3253} {"train_loss": -6.715679168701172, "global_step": 136656, "epoch": 3253} {"train_loss": -6.716977119445801, "global_step": 136657, "epoch": 3253} {"train_loss": -6.694692611694336, "global_step": 136658, "epoch": 3253} {"train_loss": -6.783633232116699, "global_step": 136659, "epoch": 3253} {"train_loss": -6.827921390533447, "global_step": 136660, "epoch": 3253} {"train_loss": -6.835414886474609, "global_step": 136661, "epoch": 3253} {"train_loss": -6.754901885986328, "global_step": 136662, "epoch": 3253} {"train_loss": -6.695628643035889, "global_step": 136663, "epoch": 3253} {"train_loss": -6.800104141235352, "global_step": 136664, "epoch": 3253} {"train_loss": -6.782433032989502, "global_step": 136665, "epoch": 3253} {"train_loss": -6.743781089782715, "global_step": 136666, "epoch": 3253} {"train_loss": -6.7247203304654075, "global_step": 136667, "epoch": 3253, "val_loss": 67135.5390625} {"train_loss": -6.680325508117676, "global_step": 136668, "epoch": 3254} {"train_loss": -6.718261241912842, "global_step": 136669, "epoch": 3254} {"train_loss": -6.801610946655273, "global_step": 136670, "epoch": 3254} {"train_loss": -6.6781535148620605, "global_step": 136671, "epoch": 3254} {"train_loss": -6.718660354614258, "global_step": 136672, "epoch": 3254} {"train_loss": -6.721526622772217, "global_step": 136673, "epoch": 3254} {"train_loss": -6.731444835662842, "global_step": 136674, "epoch": 3254} {"train_loss": -6.799330711364746, "global_step": 136675, "epoch": 3254} {"train_loss": -6.771551132202148, "global_step": 136676, "epoch": 3254} {"train_loss": -6.817741394042969, "global_step": 136677, "epoch": 3254} {"train_loss": -6.702298641204834, "global_step": 136678, "epoch": 3254} {"train_loss": -6.677943706512451, "global_step": 136679, "epoch": 3254} {"train_loss": -6.836379051208496, "global_step": 136680, "epoch": 3254} {"train_loss": -6.824979305267334, "global_step": 136681, "epoch": 3254} {"train_loss": -6.735282897949219, "global_step": 136682, "epoch": 3254} {"train_loss": -6.698545455932617, "global_step": 136683, "epoch": 3254} {"train_loss": -6.859910488128662, "global_step": 136684, "epoch": 3254} {"train_loss": -6.684699058532715, "global_step": 136685, "epoch": 3254} {"train_loss": -6.690180778503418, "global_step": 136686, "epoch": 3254} {"train_loss": -6.718752861022949, "global_step": 136687, "epoch": 3254} {"train_loss": -6.688298225402832, "global_step": 136688, "epoch": 3254} {"train_loss": -6.782107353210449, "global_step": 136689, "epoch": 3254} {"train_loss": -6.802062034606934, "global_step": 136690, "epoch": 3254} {"train_loss": -6.760687828063965, "global_step": 136691, "epoch": 3254} {"train_loss": -6.765166759490967, "global_step": 136692, "epoch": 3254} {"train_loss": -6.833931922912598, "global_step": 136693, "epoch": 3254} {"train_loss": -6.748342514038086, "global_step": 136694, "epoch": 3254} {"train_loss": -6.748254776000977, "global_step": 136695, "epoch": 3254} {"train_loss": -6.790676116943359, "global_step": 136696, "epoch": 3254} {"train_loss": -6.880908012390137, "global_step": 136697, "epoch": 3254} {"train_loss": -6.619655132293701, "global_step": 136698, "epoch": 3254} {"train_loss": -6.696911811828613, "global_step": 136699, "epoch": 3254} {"train_loss": -6.75946569442749, "global_step": 136700, "epoch": 3254} {"train_loss": -6.7021026611328125, "global_step": 136701, "epoch": 3254} {"train_loss": -6.691537380218506, "global_step": 136702, "epoch": 3254} {"train_loss": -6.727184772491455, "global_step": 136703, "epoch": 3254} {"train_loss": -6.882303237915039, "global_step": 136704, "epoch": 3254} {"train_loss": -6.7871551513671875, "global_step": 136705, "epoch": 3254} {"train_loss": -6.764590740203857, "global_step": 136706, "epoch": 3254} {"train_loss": -6.722076416015625, "global_step": 136707, "epoch": 3254} {"train_loss": -6.735874176025391, "global_step": 136708, "epoch": 3254} {"train_loss": -6.750671920322237, "global_step": 136709, "epoch": 3254, "val_loss": 67383.078125} {"train_loss": -6.686677932739258, "global_step": 136710, "epoch": 3255} {"train_loss": -6.754304885864258, "global_step": 136711, "epoch": 3255} {"train_loss": -6.832662582397461, "global_step": 136712, "epoch": 3255} {"train_loss": -6.756246566772461, "global_step": 136713, "epoch": 3255} {"train_loss": -6.793724060058594, "global_step": 136714, "epoch": 3255} {"train_loss": -6.754460334777832, "global_step": 136715, "epoch": 3255} {"train_loss": -6.623967170715332, "global_step": 136716, "epoch": 3255} {"train_loss": -6.783849716186523, "global_step": 136717, "epoch": 3255} {"train_loss": -6.645600318908691, "global_step": 136718, "epoch": 3255} {"train_loss": -6.745659828186035, "global_step": 136719, "epoch": 3255} {"train_loss": -6.740571022033691, "global_step": 136720, "epoch": 3255} {"train_loss": -6.635952949523926, "global_step": 136721, "epoch": 3255} {"train_loss": -6.7835187911987305, "global_step": 136722, "epoch": 3255} {"train_loss": -6.565789222717285, "global_step": 136723, "epoch": 3255} {"train_loss": -6.693014144897461, "global_step": 136724, "epoch": 3255} {"train_loss": -6.766879081726074, "global_step": 136725, "epoch": 3255} {"train_loss": -6.618271827697754, "global_step": 136726, "epoch": 3255} {"train_loss": -6.94151496887207, "global_step": 136727, "epoch": 3255} {"train_loss": -6.585299491882324, "global_step": 136728, "epoch": 3255} {"train_loss": -6.692392349243164, "global_step": 136729, "epoch": 3255} {"train_loss": -6.74941349029541, "global_step": 136730, "epoch": 3255} {"train_loss": -6.549799919128418, "global_step": 136731, "epoch": 3255} {"train_loss": -6.8555498123168945, "global_step": 136732, "epoch": 3255} {"train_loss": -6.646431922912598, "global_step": 136733, "epoch": 3255} {"train_loss": -6.752908706665039, "global_step": 136734, "epoch": 3255} {"train_loss": -6.7425432205200195, "global_step": 136735, "epoch": 3255} {"train_loss": -6.612621784210205, "global_step": 136736, "epoch": 3255} {"train_loss": -6.709267616271973, "global_step": 136737, "epoch": 3255} {"train_loss": -6.599257469177246, "global_step": 136738, "epoch": 3255} {"train_loss": -6.643313884735107, "global_step": 136739, "epoch": 3255} {"train_loss": -6.62812614440918, "global_step": 136740, "epoch": 3255} {"train_loss": -6.704054832458496, "global_step": 136741, "epoch": 3255} {"train_loss": -6.7047014236450195, "global_step": 136742, "epoch": 3255} {"train_loss": -6.561374664306641, "global_step": 136743, "epoch": 3255} {"train_loss": -6.641910076141357, "global_step": 136744, "epoch": 3255} {"train_loss": -6.568396091461182, "global_step": 136745, "epoch": 3255} {"train_loss": -6.718130111694336, "global_step": 136746, "epoch": 3255} {"train_loss": -6.574016094207764, "global_step": 136747, "epoch": 3255} {"train_loss": -6.700475215911865, "global_step": 136748, "epoch": 3255} {"train_loss": -6.452444076538086, "global_step": 136749, "epoch": 3255} {"train_loss": -6.6148176193237305, "global_step": 136750, "epoch": 3255} {"train_loss": -6.683741013209025, "global_step": 136751, "epoch": 3255, "val_loss": 67047.328125} {"train_loss": -6.748620986938477, "global_step": 136752, "epoch": 3256} {"train_loss": -6.6634368896484375, "global_step": 136753, "epoch": 3256} {"train_loss": -6.661215782165527, "global_step": 136754, "epoch": 3256} {"train_loss": -6.761407852172852, "global_step": 136755, "epoch": 3256} {"train_loss": -6.6508636474609375, "global_step": 136756, "epoch": 3256} {"train_loss": -6.713224411010742, "global_step": 136757, "epoch": 3256} {"train_loss": -6.611135482788086, "global_step": 136758, "epoch": 3256} {"train_loss": -6.816893577575684, "global_step": 136759, "epoch": 3256} {"train_loss": -6.697551727294922, "global_step": 136760, "epoch": 3256} {"train_loss": -6.78862190246582, "global_step": 136761, "epoch": 3256} {"train_loss": -6.616329669952393, "global_step": 136762, "epoch": 3256} {"train_loss": -6.711487770080566, "global_step": 136763, "epoch": 3256} {"train_loss": -6.809547424316406, "global_step": 136764, "epoch": 3256} {"train_loss": -6.785852909088135, "global_step": 136765, "epoch": 3256} {"train_loss": -6.796450614929199, "global_step": 136766, "epoch": 3256} {"train_loss": -6.8058180809021, "global_step": 136767, "epoch": 3256} {"train_loss": -6.7998857498168945, "global_step": 136768, "epoch": 3256} {"train_loss": -6.766299247741699, "global_step": 136769, "epoch": 3256} {"train_loss": -6.735623836517334, "global_step": 136770, "epoch": 3256} {"train_loss": -6.825251579284668, "global_step": 136771, "epoch": 3256} {"train_loss": -6.763042449951172, "global_step": 136772, "epoch": 3256} {"train_loss": -6.646944999694824, "global_step": 136773, "epoch": 3256} {"train_loss": -6.680210590362549, "global_step": 136774, "epoch": 3256} {"train_loss": -6.768457889556885, "global_step": 136775, "epoch": 3256} {"train_loss": -6.823341369628906, "global_step": 136776, "epoch": 3256} {"train_loss": -6.716318130493164, "global_step": 136777, "epoch": 3256} {"train_loss": -6.824163436889648, "global_step": 136778, "epoch": 3256} {"train_loss": -6.758257865905762, "global_step": 136779, "epoch": 3256} {"train_loss": -6.702581405639648, "global_step": 136780, "epoch": 3256} {"train_loss": -6.690123558044434, "global_step": 136781, "epoch": 3256} {"train_loss": -6.727488040924072, "global_step": 136782, "epoch": 3256} {"train_loss": -6.774432182312012, "global_step": 136783, "epoch": 3256} {"train_loss": -6.674925327301025, "global_step": 136784, "epoch": 3256} {"train_loss": -6.757490158081055, "global_step": 136785, "epoch": 3256} {"train_loss": -6.777388572692871, "global_step": 136786, "epoch": 3256} {"train_loss": -6.741301536560059, "global_step": 136787, "epoch": 3256} {"train_loss": -6.594781875610352, "global_step": 136788, "epoch": 3256} {"train_loss": -6.576779365539551, "global_step": 136789, "epoch": 3256} {"train_loss": -6.730465888977051, "global_step": 136790, "epoch": 3256} {"train_loss": -6.642325401306152, "global_step": 136791, "epoch": 3256} {"train_loss": -6.838597297668457, "global_step": 136792, "epoch": 3256} {"train_loss": -6.726086026146298, "global_step": 136793, "epoch": 3256, "val_loss": 66887.4921875} {"train_loss": -6.608367919921875, "global_step": 136794, "epoch": 3257} {"train_loss": -6.746062278747559, "global_step": 136795, "epoch": 3257} {"train_loss": -6.6192731857299805, "global_step": 136796, "epoch": 3257} {"train_loss": -6.892941474914551, "global_step": 136797, "epoch": 3257} {"train_loss": -6.74116325378418, "global_step": 136798, "epoch": 3257} {"train_loss": -6.829617500305176, "global_step": 136799, "epoch": 3257} {"train_loss": -6.796346664428711, "global_step": 136800, "epoch": 3257} {"train_loss": -6.70096492767334, "global_step": 136801, "epoch": 3257} {"train_loss": -6.869029998779297, "global_step": 136802, "epoch": 3257} {"train_loss": -6.637558460235596, "global_step": 136803, "epoch": 3257} {"train_loss": -6.834018707275391, "global_step": 136804, "epoch": 3257} {"train_loss": -6.84058141708374, "global_step": 136805, "epoch": 3257} {"train_loss": -6.784564971923828, "global_step": 136806, "epoch": 3257} {"train_loss": -6.714686393737793, "global_step": 136807, "epoch": 3257} {"train_loss": -6.757131576538086, "global_step": 136808, "epoch": 3257} {"train_loss": -6.738019943237305, "global_step": 136809, "epoch": 3257} {"train_loss": -6.707785606384277, "global_step": 136810, "epoch": 3257} {"train_loss": -6.860759735107422, "global_step": 136811, "epoch": 3257} {"train_loss": -6.805994987487793, "global_step": 136812, "epoch": 3257} {"train_loss": -6.743261814117432, "global_step": 136813, "epoch": 3257} {"train_loss": -6.770508289337158, "global_step": 136814, "epoch": 3257} {"train_loss": -6.688418865203857, "global_step": 136815, "epoch": 3257} {"train_loss": -6.6519927978515625, "global_step": 136816, "epoch": 3257} {"train_loss": -6.568343162536621, "global_step": 136817, "epoch": 3257} {"train_loss": -6.686263084411621, "global_step": 136818, "epoch": 3257} {"train_loss": -6.719293594360352, "global_step": 136819, "epoch": 3257} {"train_loss": -6.775445938110352, "global_step": 136820, "epoch": 3257} {"train_loss": -6.7380499839782715, "global_step": 136821, "epoch": 3257} {"train_loss": -6.721185207366943, "global_step": 136822, "epoch": 3257} {"train_loss": -6.668120384216309, "global_step": 136823, "epoch": 3257} {"train_loss": -6.815607070922852, "global_step": 136824, "epoch": 3257} {"train_loss": -6.69529914855957, "global_step": 136825, "epoch": 3257} {"train_loss": -6.864010810852051, "global_step": 136826, "epoch": 3257} {"train_loss": -6.876028060913086, "global_step": 136827, "epoch": 3257} {"train_loss": -6.736687183380127, "global_step": 136828, "epoch": 3257} {"train_loss": -6.7240681648254395, "global_step": 136829, "epoch": 3257} {"train_loss": -6.752461910247803, "global_step": 136830, "epoch": 3257} {"train_loss": -6.781256675720215, "global_step": 136831, "epoch": 3257} {"train_loss": -6.825404644012451, "global_step": 136832, "epoch": 3257} {"train_loss": -6.756633281707764, "global_step": 136833, "epoch": 3257} {"train_loss": -6.809698104858398, "global_step": 136834, "epoch": 3257} {"train_loss": -6.750880968003046, "global_step": 136835, "epoch": 3257, "val_loss": 67081.203125} {"train_loss": -6.682964324951172, "global_step": 136836, "epoch": 3258} {"train_loss": -6.765185356140137, "global_step": 136837, "epoch": 3258} {"train_loss": -6.559166431427002, "global_step": 136838, "epoch": 3258} {"train_loss": -6.776887893676758, "global_step": 136839, "epoch": 3258} {"train_loss": -6.620729446411133, "global_step": 136840, "epoch": 3258} {"train_loss": -6.64259147644043, "global_step": 136841, "epoch": 3258} {"train_loss": -6.742399215698242, "global_step": 136842, "epoch": 3258} {"train_loss": -6.602232933044434, "global_step": 136843, "epoch": 3258} {"train_loss": -6.589862823486328, "global_step": 136844, "epoch": 3258} {"train_loss": -6.572275161743164, "global_step": 136845, "epoch": 3258} {"train_loss": -6.655043601989746, "global_step": 136846, "epoch": 3258} {"train_loss": -6.77781867980957, "global_step": 136847, "epoch": 3258} {"train_loss": -6.56585693359375, "global_step": 136848, "epoch": 3258} {"train_loss": -6.675268173217773, "global_step": 136849, "epoch": 3258} {"train_loss": -6.716960430145264, "global_step": 136850, "epoch": 3258} {"train_loss": -6.65315580368042, "global_step": 136851, "epoch": 3258} {"train_loss": -6.677797317504883, "global_step": 136852, "epoch": 3258} {"train_loss": -6.540268421173096, "global_step": 136853, "epoch": 3258} {"train_loss": -6.636501789093018, "global_step": 136854, "epoch": 3258} {"train_loss": -6.716288089752197, "global_step": 136855, "epoch": 3258} {"train_loss": -6.6260833740234375, "global_step": 136856, "epoch": 3258} {"train_loss": -6.573322772979736, "global_step": 136857, "epoch": 3258} {"train_loss": -6.753767967224121, "global_step": 136858, "epoch": 3258} {"train_loss": -6.695955753326416, "global_step": 136859, "epoch": 3258} {"train_loss": -6.663895606994629, "global_step": 136860, "epoch": 3258} {"train_loss": -6.653515338897705, "global_step": 136861, "epoch": 3258} {"train_loss": -6.638727188110352, "global_step": 136862, "epoch": 3258} {"train_loss": -6.733612060546875, "global_step": 136863, "epoch": 3258} {"train_loss": -6.6284613609313965, "global_step": 136864, "epoch": 3258} {"train_loss": -6.706352233886719, "global_step": 136865, "epoch": 3258} {"train_loss": -6.6867828369140625, "global_step": 136866, "epoch": 3258} {"train_loss": -6.811973571777344, "global_step": 136867, "epoch": 3258} {"train_loss": -6.7159423828125, "global_step": 136868, "epoch": 3258} {"train_loss": -6.688173294067383, "global_step": 136869, "epoch": 3258} {"train_loss": -6.7628631591796875, "global_step": 136870, "epoch": 3258} {"train_loss": -6.701940536499023, "global_step": 136871, "epoch": 3258} {"train_loss": -6.607264995574951, "global_step": 136872, "epoch": 3258} {"train_loss": -6.7837042808532715, "global_step": 136873, "epoch": 3258} {"train_loss": -6.609185218811035, "global_step": 136874, "epoch": 3258} {"train_loss": -6.7512617111206055, "global_step": 136875, "epoch": 3258} {"train_loss": -6.646905899047852, "global_step": 136876, "epoch": 3258} {"train_loss": -6.676307712282453, "global_step": 136877, "epoch": 3258, "val_loss": 67083.5390625} {"train_loss": -6.690850257873535, "global_step": 136878, "epoch": 3259} {"train_loss": -6.751166343688965, "global_step": 136879, "epoch": 3259} {"train_loss": -6.7555670738220215, "global_step": 136880, "epoch": 3259} {"train_loss": -6.779723167419434, "global_step": 136881, "epoch": 3259} {"train_loss": -6.72493839263916, "global_step": 136882, "epoch": 3259} {"train_loss": -6.769469738006592, "global_step": 136883, "epoch": 3259} {"train_loss": -6.692388534545898, "global_step": 136884, "epoch": 3259} {"train_loss": -6.735900402069092, "global_step": 136885, "epoch": 3259} {"train_loss": -6.755684852600098, "global_step": 136886, "epoch": 3259} {"train_loss": -6.800751209259033, "global_step": 136887, "epoch": 3259} {"train_loss": -6.830766201019287, "global_step": 136888, "epoch": 3259} {"train_loss": -6.7358856201171875, "global_step": 136889, "epoch": 3259} {"train_loss": -6.72980260848999, "global_step": 136890, "epoch": 3259} {"train_loss": -6.750688076019287, "global_step": 136891, "epoch": 3259} {"train_loss": -6.763440132141113, "global_step": 136892, "epoch": 3259} {"train_loss": -6.7339582443237305, "global_step": 136893, "epoch": 3259} {"train_loss": -6.667804718017578, "global_step": 136894, "epoch": 3259} {"train_loss": -6.737565040588379, "global_step": 136895, "epoch": 3259} {"train_loss": -6.744211196899414, "global_step": 136896, "epoch": 3259} {"train_loss": -6.728644371032715, "global_step": 136897, "epoch": 3259} {"train_loss": -6.629931449890137, "global_step": 136898, "epoch": 3259} {"train_loss": -6.820258140563965, "global_step": 136899, "epoch": 3259} {"train_loss": -6.774843215942383, "global_step": 136900, "epoch": 3259} {"train_loss": -6.825567245483398, "global_step": 136901, "epoch": 3259} {"train_loss": -6.72186279296875, "global_step": 136902, "epoch": 3259} {"train_loss": -6.637204170227051, "global_step": 136903, "epoch": 3259} {"train_loss": -6.696758270263672, "global_step": 136904, "epoch": 3259} {"train_loss": -6.803049087524414, "global_step": 136905, "epoch": 3259} {"train_loss": -6.6598100662231445, "global_step": 136906, "epoch": 3259} {"train_loss": -6.712011337280273, "global_step": 136907, "epoch": 3259} {"train_loss": -6.834473133087158, "global_step": 136908, "epoch": 3259} {"train_loss": -6.750761032104492, "global_step": 136909, "epoch": 3259} {"train_loss": -6.643054962158203, "global_step": 136910, "epoch": 3259} {"train_loss": -6.749338150024414, "global_step": 136911, "epoch": 3259} {"train_loss": -6.784086227416992, "global_step": 136912, "epoch": 3259} {"train_loss": -6.635928153991699, "global_step": 136913, "epoch": 3259} {"train_loss": -6.6106181144714355, "global_step": 136914, "epoch": 3259} {"train_loss": -6.6324262619018555, "global_step": 136915, "epoch": 3259} {"train_loss": -6.475612640380859, "global_step": 136916, "epoch": 3259} {"train_loss": -6.708117961883545, "global_step": 136917, "epoch": 3259} {"train_loss": -6.599973678588867, "global_step": 136918, "epoch": 3259} {"train_loss": -6.717715206600371, "global_step": 136919, "epoch": 3259, "val_loss": 67439.1875} {"train_loss": -6.611516952514648, "global_step": 136920, "epoch": 3260} {"train_loss": -6.663045883178711, "global_step": 136921, "epoch": 3260} {"train_loss": -6.694005489349365, "global_step": 136922, "epoch": 3260} {"train_loss": -6.565864086151123, "global_step": 136923, "epoch": 3260} {"train_loss": -6.482659339904785, "global_step": 136924, "epoch": 3260} {"train_loss": -6.563899993896484, "global_step": 136925, "epoch": 3260} {"train_loss": -6.6851677894592285, "global_step": 136926, "epoch": 3260} {"train_loss": -6.4328179359436035, "global_step": 136927, "epoch": 3260} {"train_loss": -6.672107219696045, "global_step": 136928, "epoch": 3260} {"train_loss": -6.569509506225586, "global_step": 136929, "epoch": 3260} {"train_loss": -6.669568061828613, "global_step": 136930, "epoch": 3260} {"train_loss": -6.599302291870117, "global_step": 136931, "epoch": 3260} {"train_loss": -6.66679573059082, "global_step": 136932, "epoch": 3260} {"train_loss": -6.663688659667969, "global_step": 136933, "epoch": 3260} {"train_loss": -6.6539130210876465, "global_step": 136934, "epoch": 3260} {"train_loss": -6.727604866027832, "global_step": 136935, "epoch": 3260} {"train_loss": -6.715451717376709, "global_step": 136936, "epoch": 3260} {"train_loss": -6.782580375671387, "global_step": 136937, "epoch": 3260} {"train_loss": -6.765467643737793, "global_step": 136938, "epoch": 3260} {"train_loss": -6.78141450881958, "global_step": 136939, "epoch": 3260} {"train_loss": -6.76081657409668, "global_step": 136940, "epoch": 3260} {"train_loss": -6.746914863586426, "global_step": 136941, "epoch": 3260} {"train_loss": -6.619683265686035, "global_step": 136942, "epoch": 3260} {"train_loss": -6.702568054199219, "global_step": 136943, "epoch": 3260} {"train_loss": -6.8354387283325195, "global_step": 136944, "epoch": 3260} {"train_loss": -6.797698497772217, "global_step": 136945, "epoch": 3260} {"train_loss": -6.849608421325684, "global_step": 136946, "epoch": 3260} {"train_loss": -6.810524940490723, "global_step": 136947, "epoch": 3260} {"train_loss": -6.686479568481445, "global_step": 136948, "epoch": 3260} {"train_loss": -6.687289714813232, "global_step": 136949, "epoch": 3260} {"train_loss": -6.667325019836426, "global_step": 136950, "epoch": 3260} {"train_loss": -6.75868558883667, "global_step": 136951, "epoch": 3260} {"train_loss": -6.808455467224121, "global_step": 136952, "epoch": 3260} {"train_loss": -6.664244651794434, "global_step": 136953, "epoch": 3260} {"train_loss": -6.893681526184082, "global_step": 136954, "epoch": 3260} {"train_loss": -6.777435302734375, "global_step": 136955, "epoch": 3260} {"train_loss": -6.86247444152832, "global_step": 136956, "epoch": 3260} {"train_loss": -6.837596893310547, "global_step": 136957, "epoch": 3260} {"train_loss": -6.808093547821045, "global_step": 136958, "epoch": 3260} {"train_loss": -6.8093719482421875, "global_step": 136959, "epoch": 3260} {"train_loss": -6.861794948577881, "global_step": 136960, "epoch": 3260} {"train_loss": -6.716004144577753, "global_step": 136961, "epoch": 3260, "val_loss": 67043.4375} {"train_loss": -6.835406303405762, "global_step": 136962, "epoch": 3261} {"train_loss": -6.771609306335449, "global_step": 136963, "epoch": 3261} {"train_loss": -6.826138496398926, "global_step": 136964, "epoch": 3261} {"train_loss": -6.727933406829834, "global_step": 136965, "epoch": 3261} {"train_loss": -6.761075973510742, "global_step": 136966, "epoch": 3261} {"train_loss": -6.847548961639404, "global_step": 136967, "epoch": 3261} {"train_loss": -6.740488052368164, "global_step": 136968, "epoch": 3261} {"train_loss": -6.7562994956970215, "global_step": 136969, "epoch": 3261} {"train_loss": -6.699562072753906, "global_step": 136970, "epoch": 3261} {"train_loss": -6.766823768615723, "global_step": 136971, "epoch": 3261} {"train_loss": -6.775675296783447, "global_step": 136972, "epoch": 3261} {"train_loss": -6.711846351623535, "global_step": 136973, "epoch": 3261} {"train_loss": -6.667819976806641, "global_step": 136974, "epoch": 3261} {"train_loss": -6.825959205627441, "global_step": 136975, "epoch": 3261} {"train_loss": -6.821624755859375, "global_step": 136976, "epoch": 3261} {"train_loss": -6.595111846923828, "global_step": 136977, "epoch": 3261} {"train_loss": -6.722135066986084, "global_step": 136978, "epoch": 3261} {"train_loss": -6.692786693572998, "global_step": 136979, "epoch": 3261} {"train_loss": -6.6831207275390625, "global_step": 136980, "epoch": 3261} {"train_loss": -6.663150787353516, "global_step": 136981, "epoch": 3261} {"train_loss": -6.702425956726074, "global_step": 136982, "epoch": 3261} {"train_loss": -6.721617698669434, "global_step": 136983, "epoch": 3261} {"train_loss": -6.701048851013184, "global_step": 136984, "epoch": 3261} {"train_loss": -6.691407680511475, "global_step": 136985, "epoch": 3261} {"train_loss": -6.715115070343018, "global_step": 136986, "epoch": 3261} {"train_loss": -6.743461608886719, "global_step": 136987, "epoch": 3261} {"train_loss": -6.686857223510742, "global_step": 136988, "epoch": 3261} {"train_loss": -6.618451118469238, "global_step": 136989, "epoch": 3261} {"train_loss": -6.637200355529785, "global_step": 136990, "epoch": 3261} {"train_loss": -6.64192533493042, "global_step": 136991, "epoch": 3261} {"train_loss": -6.63956356048584, "global_step": 136992, "epoch": 3261} {"train_loss": -6.747442245483398, "global_step": 136993, "epoch": 3261} {"train_loss": -6.608475685119629, "global_step": 136994, "epoch": 3261} {"train_loss": -6.64547061920166, "global_step": 136995, "epoch": 3261} {"train_loss": -6.707470893859863, "global_step": 136996, "epoch": 3261} {"train_loss": -6.70485782623291, "global_step": 136997, "epoch": 3261} {"train_loss": -6.641192436218262, "global_step": 136998, "epoch": 3261} {"train_loss": -6.682776927947998, "global_step": 136999, "epoch": 3261} {"train_loss": -6.747592449188232, "global_step": 137000, "epoch": 3261} {"train_loss": -6.632959365844727, "global_step": 137001, "epoch": 3261} {"train_loss": -6.674404144287109, "global_step": 137002, "epoch": 3261} {"train_loss": -6.7117477258046465, "global_step": 137003, "epoch": 3261, "val_loss": 67086.8359375} {"train_loss": -6.772934913635254, "global_step": 137004, "epoch": 3262} {"train_loss": -6.716658592224121, "global_step": 137005, "epoch": 3262} {"train_loss": -6.578826904296875, "global_step": 137006, "epoch": 3262} {"train_loss": -6.709831237792969, "global_step": 137007, "epoch": 3262} {"train_loss": -6.702826499938965, "global_step": 137008, "epoch": 3262} {"train_loss": -6.691454887390137, "global_step": 137009, "epoch": 3262} {"train_loss": -6.705979347229004, "global_step": 137010, "epoch": 3262} {"train_loss": -6.706872940063477, "global_step": 137011, "epoch": 3262} {"train_loss": -6.581277847290039, "global_step": 137012, "epoch": 3262} {"train_loss": -6.660818099975586, "global_step": 137013, "epoch": 3262} {"train_loss": -6.696419715881348, "global_step": 137014, "epoch": 3262} {"train_loss": -6.8446431159973145, "global_step": 137015, "epoch": 3262} {"train_loss": -6.689558029174805, "global_step": 137016, "epoch": 3262} {"train_loss": -6.624054431915283, "global_step": 137017, "epoch": 3262} {"train_loss": -6.647194862365723, "global_step": 137018, "epoch": 3262} {"train_loss": -6.694064140319824, "global_step": 137019, "epoch": 3262} {"train_loss": -6.839181900024414, "global_step": 137020, "epoch": 3262} {"train_loss": -6.65954065322876, "global_step": 137021, "epoch": 3262} {"train_loss": -6.856128692626953, "global_step": 137022, "epoch": 3262} {"train_loss": -6.695772171020508, "global_step": 137023, "epoch": 3262} {"train_loss": -6.788278579711914, "global_step": 137024, "epoch": 3262} {"train_loss": -6.793116569519043, "global_step": 137025, "epoch": 3262} {"train_loss": -6.803075790405273, "global_step": 137026, "epoch": 3262} {"train_loss": -6.620021820068359, "global_step": 137027, "epoch": 3262} {"train_loss": -6.768446445465088, "global_step": 137028, "epoch": 3262} {"train_loss": -6.776782989501953, "global_step": 137029, "epoch": 3262} {"train_loss": -6.683954238891602, "global_step": 137030, "epoch": 3262} {"train_loss": -6.82341194152832, "global_step": 137031, "epoch": 3262} {"train_loss": -6.825902938842773, "global_step": 137032, "epoch": 3262} {"train_loss": -6.72047758102417, "global_step": 137033, "epoch": 3262} {"train_loss": -6.759302139282227, "global_step": 137034, "epoch": 3262} {"train_loss": -6.770298480987549, "global_step": 137035, "epoch": 3262} {"train_loss": -6.722810745239258, "global_step": 137036, "epoch": 3262} {"train_loss": -6.64743185043335, "global_step": 137037, "epoch": 3262} {"train_loss": -6.648421287536621, "global_step": 137038, "epoch": 3262} {"train_loss": -6.750425338745117, "global_step": 137039, "epoch": 3262} {"train_loss": -6.78572940826416, "global_step": 137040, "epoch": 3262} {"train_loss": -6.752429485321045, "global_step": 137041, "epoch": 3262} {"train_loss": -6.768346786499023, "global_step": 137042, "epoch": 3262} {"train_loss": -6.691093444824219, "global_step": 137043, "epoch": 3262} {"train_loss": -6.708367824554443, "global_step": 137044, "epoch": 3262} {"train_loss": -6.724827755065191, "global_step": 137045, "epoch": 3262, "val_loss": 67115.2734375} {"train_loss": -6.660350799560547, "global_step": 137046, "epoch": 3263} {"train_loss": -6.768733978271484, "global_step": 137047, "epoch": 3263} {"train_loss": -6.59004020690918, "global_step": 137048, "epoch": 3263} {"train_loss": -6.70665168762207, "global_step": 137049, "epoch": 3263} {"train_loss": -6.723548889160156, "global_step": 137050, "epoch": 3263} {"train_loss": -6.829468727111816, "global_step": 137051, "epoch": 3263} {"train_loss": -6.704110145568848, "global_step": 137052, "epoch": 3263} {"train_loss": -6.851559162139893, "global_step": 137053, "epoch": 3263} {"train_loss": -6.779732704162598, "global_step": 137054, "epoch": 3263} {"train_loss": -6.728808403015137, "global_step": 137055, "epoch": 3263} {"train_loss": -6.764975547790527, "global_step": 137056, "epoch": 3263} {"train_loss": -6.773322582244873, "global_step": 137057, "epoch": 3263} {"train_loss": -6.622421741485596, "global_step": 137058, "epoch": 3263} {"train_loss": -6.705387115478516, "global_step": 137059, "epoch": 3263} {"train_loss": -6.647031784057617, "global_step": 137060, "epoch": 3263} {"train_loss": -6.732613563537598, "global_step": 137061, "epoch": 3263} {"train_loss": -6.855386734008789, "global_step": 137062, "epoch": 3263} {"train_loss": -6.848747253417969, "global_step": 137063, "epoch": 3263} {"train_loss": -6.786561965942383, "global_step": 137064, "epoch": 3263} {"train_loss": -6.694779396057129, "global_step": 137065, "epoch": 3263} {"train_loss": -6.791650772094727, "global_step": 137066, "epoch": 3263} {"train_loss": -6.851633071899414, "global_step": 137067, "epoch": 3263} {"train_loss": -6.759149074554443, "global_step": 137068, "epoch": 3263} {"train_loss": -6.800281524658203, "global_step": 137069, "epoch": 3263} {"train_loss": -6.792781829833984, "global_step": 137070, "epoch": 3263} {"train_loss": -6.770013809204102, "global_step": 137071, "epoch": 3263} {"train_loss": -6.808121681213379, "global_step": 137072, "epoch": 3263} {"train_loss": -6.755402565002441, "global_step": 137073, "epoch": 3263} {"train_loss": -6.798648357391357, "global_step": 137074, "epoch": 3263} {"train_loss": -6.781397342681885, "global_step": 137075, "epoch": 3263} {"train_loss": -6.8063554763793945, "global_step": 137076, "epoch": 3263} {"train_loss": -6.640571117401123, "global_step": 137077, "epoch": 3263} {"train_loss": -6.896746635437012, "global_step": 137078, "epoch": 3263} {"train_loss": -6.734075546264648, "global_step": 137079, "epoch": 3263} {"train_loss": -6.775891304016113, "global_step": 137080, "epoch": 3263} {"train_loss": -6.697772026062012, "global_step": 137081, "epoch": 3263} {"train_loss": -6.72893762588501, "global_step": 137082, "epoch": 3263} {"train_loss": -6.7601776123046875, "global_step": 137083, "epoch": 3263} {"train_loss": -6.5840044021606445, "global_step": 137084, "epoch": 3263} {"train_loss": -6.77620792388916, "global_step": 137085, "epoch": 3263} {"train_loss": -6.601836204528809, "global_step": 137086, "epoch": 3263} {"train_loss": -6.748642047246297, "global_step": 137087, "epoch": 3263, "val_loss": 67159.46875} {"train_loss": -6.723276615142822, "global_step": 137088, "epoch": 3264} {"train_loss": -6.6788740158081055, "global_step": 137089, "epoch": 3264} {"train_loss": -6.678531646728516, "global_step": 137090, "epoch": 3264} {"train_loss": -6.733635902404785, "global_step": 137091, "epoch": 3264} {"train_loss": -6.711111068725586, "global_step": 137092, "epoch": 3264} {"train_loss": -6.710997581481934, "global_step": 137093, "epoch": 3264} {"train_loss": -6.687811851501465, "global_step": 137094, "epoch": 3264} {"train_loss": -6.686786651611328, "global_step": 137095, "epoch": 3264} {"train_loss": -6.753294467926025, "global_step": 137096, "epoch": 3264} {"train_loss": -6.854131698608398, "global_step": 137097, "epoch": 3264} {"train_loss": -6.604606628417969, "global_step": 137098, "epoch": 3264} {"train_loss": -6.788496017456055, "global_step": 137099, "epoch": 3264} {"train_loss": -6.783326148986816, "global_step": 137100, "epoch": 3264} {"train_loss": -6.690217971801758, "global_step": 137101, "epoch": 3264} {"train_loss": -6.765719890594482, "global_step": 137102, "epoch": 3264} {"train_loss": -6.687140464782715, "global_step": 137103, "epoch": 3264} {"train_loss": -6.712092876434326, "global_step": 137104, "epoch": 3264} {"train_loss": -6.748501777648926, "global_step": 137105, "epoch": 3264} {"train_loss": -6.674782752990723, "global_step": 137106, "epoch": 3264} {"train_loss": -6.688576698303223, "global_step": 137107, "epoch": 3264} {"train_loss": -6.71549129486084, "global_step": 137108, "epoch": 3264} {"train_loss": -6.633721351623535, "global_step": 137109, "epoch": 3264} {"train_loss": -6.725677490234375, "global_step": 137110, "epoch": 3264} {"train_loss": -6.714404106140137, "global_step": 137111, "epoch": 3264} {"train_loss": -6.685842990875244, "global_step": 137112, "epoch": 3264} {"train_loss": -6.6692705154418945, "global_step": 137113, "epoch": 3264} {"train_loss": -6.832202911376953, "global_step": 137114, "epoch": 3264} {"train_loss": -6.643612384796143, "global_step": 137115, "epoch": 3264} {"train_loss": -6.650171279907227, "global_step": 137116, "epoch": 3264} {"train_loss": -6.801712989807129, "global_step": 137117, "epoch": 3264} {"train_loss": -6.693469047546387, "global_step": 137118, "epoch": 3264} {"train_loss": -6.741235733032227, "global_step": 137119, "epoch": 3264} {"train_loss": -6.74818229675293, "global_step": 137120, "epoch": 3264} {"train_loss": -6.719517707824707, "global_step": 137121, "epoch": 3264} {"train_loss": -6.803629398345947, "global_step": 137122, "epoch": 3264} {"train_loss": -6.729742050170898, "global_step": 137123, "epoch": 3264} {"train_loss": -6.805270671844482, "global_step": 137124, "epoch": 3264} {"train_loss": -6.739985466003418, "global_step": 137125, "epoch": 3264} {"train_loss": -6.669579029083252, "global_step": 137126, "epoch": 3264} {"train_loss": -6.79025936126709, "global_step": 137127, "epoch": 3264} {"train_loss": -6.672863960266113, "global_step": 137128, "epoch": 3264} {"train_loss": -6.720838274274554, "global_step": 137129, "epoch": 3264, "val_loss": 67084.5859375} {"train_loss": -6.748737335205078, "global_step": 137130, "epoch": 3265} {"train_loss": -6.704809665679932, "global_step": 137131, "epoch": 3265} {"train_loss": -6.705306053161621, "global_step": 137132, "epoch": 3265} {"train_loss": -6.5457444190979, "global_step": 137133, "epoch": 3265} {"train_loss": -6.763324737548828, "global_step": 137134, "epoch": 3265} {"train_loss": -6.813000679016113, "global_step": 137135, "epoch": 3265} {"train_loss": -6.675093650817871, "global_step": 137136, "epoch": 3265} {"train_loss": -6.780723571777344, "global_step": 137137, "epoch": 3265} {"train_loss": -6.771158218383789, "global_step": 137138, "epoch": 3265} {"train_loss": -6.713678359985352, "global_step": 137139, "epoch": 3265} {"train_loss": -6.79701566696167, "global_step": 137140, "epoch": 3265} {"train_loss": -6.7254838943481445, "global_step": 137141, "epoch": 3265} {"train_loss": -6.738112449645996, "global_step": 137142, "epoch": 3265} {"train_loss": -6.688683986663818, "global_step": 137143, "epoch": 3265} {"train_loss": -6.7021989822387695, "global_step": 137144, "epoch": 3265} {"train_loss": -6.7231831550598145, "global_step": 137145, "epoch": 3265} {"train_loss": -6.782980442047119, "global_step": 137146, "epoch": 3265} {"train_loss": -6.721681594848633, "global_step": 137147, "epoch": 3265} {"train_loss": -6.792510509490967, "global_step": 137148, "epoch": 3265} {"train_loss": -6.809065818786621, "global_step": 137149, "epoch": 3265} {"train_loss": -6.787849426269531, "global_step": 137150, "epoch": 3265} {"train_loss": -6.703873157501221, "global_step": 137151, "epoch": 3265} {"train_loss": -6.674833297729492, "global_step": 137152, "epoch": 3265} {"train_loss": -6.648724555969238, "global_step": 137153, "epoch": 3265} {"train_loss": -6.7277421951293945, "global_step": 137154, "epoch": 3265} {"train_loss": -6.715140342712402, "global_step": 137155, "epoch": 3265} {"train_loss": -6.61012077331543, "global_step": 137156, "epoch": 3265} {"train_loss": -6.742649555206299, "global_step": 137157, "epoch": 3265} {"train_loss": -6.698242664337158, "global_step": 137158, "epoch": 3265} {"train_loss": -6.646026134490967, "global_step": 137159, "epoch": 3265} {"train_loss": -6.686041355133057, "global_step": 137160, "epoch": 3265} {"train_loss": -6.618574619293213, "global_step": 137161, "epoch": 3265} {"train_loss": -6.856874465942383, "global_step": 137162, "epoch": 3265} {"train_loss": -6.684298038482666, "global_step": 137163, "epoch": 3265} {"train_loss": -6.63051700592041, "global_step": 137164, "epoch": 3265} {"train_loss": -6.719679832458496, "global_step": 137165, "epoch": 3265} {"train_loss": -6.878909111022949, "global_step": 137166, "epoch": 3265} {"train_loss": -6.787568092346191, "global_step": 137167, "epoch": 3265} {"train_loss": -6.754761695861816, "global_step": 137168, "epoch": 3265} {"train_loss": -6.669290542602539, "global_step": 137169, "epoch": 3265} {"train_loss": -6.813499450683594, "global_step": 137170, "epoch": 3265} {"train_loss": -6.728144906816029, "global_step": 137171, "epoch": 3265, "val_loss": 67194.7578125} {"train_loss": -6.713719367980957, "global_step": 137172, "epoch": 3266} {"train_loss": -6.743396282196045, "global_step": 137173, "epoch": 3266} {"train_loss": -6.756390571594238, "global_step": 137174, "epoch": 3266} {"train_loss": -6.662661552429199, "global_step": 137175, "epoch": 3266} {"train_loss": -6.89685583114624, "global_step": 137176, "epoch": 3266} {"train_loss": -6.789572715759277, "global_step": 137177, "epoch": 3266} {"train_loss": -6.816003799438477, "global_step": 137178, "epoch": 3266} {"train_loss": -6.753607273101807, "global_step": 137179, "epoch": 3266} {"train_loss": -6.674434661865234, "global_step": 137180, "epoch": 3266} {"train_loss": -6.886502265930176, "global_step": 137181, "epoch": 3266} {"train_loss": -6.721670627593994, "global_step": 137182, "epoch": 3266} {"train_loss": -6.824125289916992, "global_step": 137183, "epoch": 3266} {"train_loss": -6.70071268081665, "global_step": 137184, "epoch": 3266} {"train_loss": -6.698696136474609, "global_step": 137185, "epoch": 3266} {"train_loss": -6.740653991699219, "global_step": 137186, "epoch": 3266} {"train_loss": -6.651523590087891, "global_step": 137187, "epoch": 3266} {"train_loss": -6.729565620422363, "global_step": 137188, "epoch": 3266} {"train_loss": -6.760117053985596, "global_step": 137189, "epoch": 3266} {"train_loss": -6.663313865661621, "global_step": 137190, "epoch": 3266} {"train_loss": -6.69923734664917, "global_step": 137191, "epoch": 3266} {"train_loss": -6.552252769470215, "global_step": 137192, "epoch": 3266} {"train_loss": -6.617760181427002, "global_step": 137193, "epoch": 3266} {"train_loss": -6.760421276092529, "global_step": 137194, "epoch": 3266} {"train_loss": -6.710301399230957, "global_step": 137195, "epoch": 3266} {"train_loss": -6.773642539978027, "global_step": 137196, "epoch": 3266} {"train_loss": -6.629570960998535, "global_step": 137197, "epoch": 3266} {"train_loss": -6.6762542724609375, "global_step": 137198, "epoch": 3266} {"train_loss": -6.69620418548584, "global_step": 137199, "epoch": 3266} {"train_loss": -6.663153171539307, "global_step": 137200, "epoch": 3266} {"train_loss": -6.673199653625488, "global_step": 137201, "epoch": 3266} {"train_loss": -6.680070400238037, "global_step": 137202, "epoch": 3266} {"train_loss": -6.6124138832092285, "global_step": 137203, "epoch": 3266} {"train_loss": -6.666811466217041, "global_step": 137204, "epoch": 3266} {"train_loss": -6.646780014038086, "global_step": 137205, "epoch": 3266} {"train_loss": -6.769847869873047, "global_step": 137206, "epoch": 3266} {"train_loss": -6.663208961486816, "global_step": 137207, "epoch": 3266} {"train_loss": -6.7807393074035645, "global_step": 137208, "epoch": 3266} {"train_loss": -6.663518905639648, "global_step": 137209, "epoch": 3266} {"train_loss": -6.766964912414551, "global_step": 137210, "epoch": 3266} {"train_loss": -6.789255142211914, "global_step": 137211, "epoch": 3266} {"train_loss": -6.726032733917236, "global_step": 137212, "epoch": 3266} {"train_loss": -6.718706244514102, "global_step": 137213, "epoch": 3266, "val_loss": 66935.421875} {"train_loss": -6.757955551147461, "global_step": 137214, "epoch": 3267} {"train_loss": -6.69072961807251, "global_step": 137215, "epoch": 3267} {"train_loss": -6.707930564880371, "global_step": 137216, "epoch": 3267} {"train_loss": -6.713934898376465, "global_step": 137217, "epoch": 3267} {"train_loss": -6.802368640899658, "global_step": 137218, "epoch": 3267} {"train_loss": -6.76693058013916, "global_step": 137219, "epoch": 3267} {"train_loss": -6.784493446350098, "global_step": 137220, "epoch": 3267} {"train_loss": -6.727166175842285, "global_step": 137221, "epoch": 3267} {"train_loss": -6.8508830070495605, "global_step": 137222, "epoch": 3267} {"train_loss": -6.7312164306640625, "global_step": 137223, "epoch": 3267} {"train_loss": -6.774237632751465, "global_step": 137224, "epoch": 3267} {"train_loss": -6.754011154174805, "global_step": 137225, "epoch": 3267} {"train_loss": -6.682406425476074, "global_step": 137226, "epoch": 3267} {"train_loss": -6.851065158843994, "global_step": 137227, "epoch": 3267} {"train_loss": -6.813061237335205, "global_step": 137228, "epoch": 3267} {"train_loss": -6.774301052093506, "global_step": 137229, "epoch": 3267} {"train_loss": -6.827585220336914, "global_step": 137230, "epoch": 3267} {"train_loss": -6.813230514526367, "global_step": 137231, "epoch": 3267} {"train_loss": -6.696356773376465, "global_step": 137232, "epoch": 3267} {"train_loss": -6.789079666137695, "global_step": 137233, "epoch": 3267} {"train_loss": -6.840723991394043, "global_step": 137234, "epoch": 3267} {"train_loss": -6.886063575744629, "global_step": 137235, "epoch": 3267} {"train_loss": -6.720922470092773, "global_step": 137236, "epoch": 3267} {"train_loss": -6.873831748962402, "global_step": 137237, "epoch": 3267} {"train_loss": -6.656105995178223, "global_step": 137238, "epoch": 3267} {"train_loss": -6.808899879455566, "global_step": 137239, "epoch": 3267} {"train_loss": -6.759268760681152, "global_step": 137240, "epoch": 3267} {"train_loss": -6.83182430267334, "global_step": 137241, "epoch": 3267} {"train_loss": -6.831099987030029, "global_step": 137242, "epoch": 3267} {"train_loss": -6.816371917724609, "global_step": 137243, "epoch": 3267} {"train_loss": -6.779354095458984, "global_step": 137244, "epoch": 3267} {"train_loss": -6.851696014404297, "global_step": 137245, "epoch": 3267} {"train_loss": -6.7327985763549805, "global_step": 137246, "epoch": 3267} {"train_loss": -6.781740665435791, "global_step": 137247, "epoch": 3267} {"train_loss": -6.774387359619141, "global_step": 137248, "epoch": 3267} {"train_loss": -6.816765308380127, "global_step": 137249, "epoch": 3267} {"train_loss": -6.792386054992676, "global_step": 137250, "epoch": 3267} {"train_loss": -6.807751655578613, "global_step": 137251, "epoch": 3267} {"train_loss": -6.794517517089844, "global_step": 137252, "epoch": 3267} {"train_loss": -6.77599573135376, "global_step": 137253, "epoch": 3267} {"train_loss": -6.8023223876953125, "global_step": 137254, "epoch": 3267} {"train_loss": -6.781707786378407, "global_step": 137255, "epoch": 3267, "val_loss": 67076.5625} {"train_loss": -6.81141471862793, "global_step": 137256, "epoch": 3268} {"train_loss": -6.767451286315918, "global_step": 137257, "epoch": 3268} {"train_loss": -6.757938385009766, "global_step": 137258, "epoch": 3268} {"train_loss": -6.731245994567871, "global_step": 137259, "epoch": 3268} {"train_loss": -6.7006516456604, "global_step": 137260, "epoch": 3268} {"train_loss": -6.750990867614746, "global_step": 137261, "epoch": 3268} {"train_loss": -6.874156951904297, "global_step": 137262, "epoch": 3268} {"train_loss": -6.684584617614746, "global_step": 137263, "epoch": 3268} {"train_loss": -6.790210247039795, "global_step": 137264, "epoch": 3268} {"train_loss": -6.851592063903809, "global_step": 137265, "epoch": 3268} {"train_loss": -6.749898433685303, "global_step": 137266, "epoch": 3268} {"train_loss": -6.7706708908081055, "global_step": 137267, "epoch": 3268} {"train_loss": -6.621347427368164, "global_step": 137268, "epoch": 3268} {"train_loss": -6.860326766967773, "global_step": 137269, "epoch": 3268} {"train_loss": -6.7698283195495605, "global_step": 137270, "epoch": 3268} {"train_loss": -6.646989822387695, "global_step": 137271, "epoch": 3268} {"train_loss": -6.675233840942383, "global_step": 137272, "epoch": 3268} {"train_loss": -6.630260944366455, "global_step": 137273, "epoch": 3268} {"train_loss": -6.846609115600586, "global_step": 137274, "epoch": 3268} {"train_loss": -6.623897552490234, "global_step": 137275, "epoch": 3268} {"train_loss": -6.684342384338379, "global_step": 137276, "epoch": 3268} {"train_loss": -6.804622650146484, "global_step": 137277, "epoch": 3268} {"train_loss": -6.78311824798584, "global_step": 137278, "epoch": 3268} {"train_loss": -6.82967472076416, "global_step": 137279, "epoch": 3268} {"train_loss": -6.768255710601807, "global_step": 137280, "epoch": 3268} {"train_loss": -6.655959606170654, "global_step": 137281, "epoch": 3268} {"train_loss": -6.804759979248047, "global_step": 137282, "epoch": 3268} {"train_loss": -6.746739864349365, "global_step": 137283, "epoch": 3268} {"train_loss": -6.790324687957764, "global_step": 137284, "epoch": 3268} {"train_loss": -6.725743770599365, "global_step": 137285, "epoch": 3268} {"train_loss": -6.7099456787109375, "global_step": 137286, "epoch": 3268} {"train_loss": -6.758573532104492, "global_step": 137287, "epoch": 3268} {"train_loss": -6.6895318031311035, "global_step": 137288, "epoch": 3268} {"train_loss": -6.714592933654785, "global_step": 137289, "epoch": 3268} {"train_loss": -6.867030620574951, "global_step": 137290, "epoch": 3268} {"train_loss": -6.6846513748168945, "global_step": 137291, "epoch": 3268} {"train_loss": -6.631841659545898, "global_step": 137292, "epoch": 3268} {"train_loss": -6.711077690124512, "global_step": 137293, "epoch": 3268} {"train_loss": -6.745862007141113, "global_step": 137294, "epoch": 3268} {"train_loss": -6.756702423095703, "global_step": 137295, "epoch": 3268} {"train_loss": -6.622211456298828, "global_step": 137296, "epoch": 3268} {"train_loss": -6.738953613099598, "global_step": 137297, "epoch": 3268, "val_loss": 67075.1640625} {"train_loss": -6.736642837524414, "global_step": 137298, "epoch": 3269} {"train_loss": -6.8530168533325195, "global_step": 137299, "epoch": 3269} {"train_loss": -6.752819538116455, "global_step": 137300, "epoch": 3269} {"train_loss": -6.657618999481201, "global_step": 137301, "epoch": 3269} {"train_loss": -6.763176441192627, "global_step": 137302, "epoch": 3269} {"train_loss": -6.652873992919922, "global_step": 137303, "epoch": 3269} {"train_loss": -6.666354656219482, "global_step": 137304, "epoch": 3269} {"train_loss": -6.746508598327637, "global_step": 137305, "epoch": 3269} {"train_loss": -6.616874694824219, "global_step": 137306, "epoch": 3269} {"train_loss": -6.6170148849487305, "global_step": 137307, "epoch": 3269} {"train_loss": -6.592026710510254, "global_step": 137308, "epoch": 3269} {"train_loss": -6.584771156311035, "global_step": 137309, "epoch": 3269} {"train_loss": -6.4907121658325195, "global_step": 137310, "epoch": 3269} {"train_loss": -6.733130931854248, "global_step": 137311, "epoch": 3269} {"train_loss": -6.766691207885742, "global_step": 137312, "epoch": 3269} {"train_loss": -6.6617302894592285, "global_step": 137313, "epoch": 3269} {"train_loss": -6.595494747161865, "global_step": 137314, "epoch": 3269} {"train_loss": -6.702059268951416, "global_step": 137315, "epoch": 3269} {"train_loss": -6.722256660461426, "global_step": 137316, "epoch": 3269} {"train_loss": -6.716250896453857, "global_step": 137317, "epoch": 3269} {"train_loss": -6.782856464385986, "global_step": 137318, "epoch": 3269} {"train_loss": -6.576722145080566, "global_step": 137319, "epoch": 3269} {"train_loss": -6.778759956359863, "global_step": 137320, "epoch": 3269} {"train_loss": -6.723296165466309, "global_step": 137321, "epoch": 3269} {"train_loss": -6.815242767333984, "global_step": 137322, "epoch": 3269} {"train_loss": -6.759310722351074, "global_step": 137323, "epoch": 3269} {"train_loss": -6.693942546844482, "global_step": 137324, "epoch": 3269} {"train_loss": -6.7279558181762695, "global_step": 137325, "epoch": 3269} {"train_loss": -6.814639091491699, "global_step": 137326, "epoch": 3269} {"train_loss": -6.729275703430176, "global_step": 137327, "epoch": 3269} {"train_loss": -6.703422546386719, "global_step": 137328, "epoch": 3269} {"train_loss": -6.791248798370361, "global_step": 137329, "epoch": 3269} {"train_loss": -6.860198974609375, "global_step": 137330, "epoch": 3269} {"train_loss": -6.7010698318481445, "global_step": 137331, "epoch": 3269} {"train_loss": -6.757625579833984, "global_step": 137332, "epoch": 3269} {"train_loss": -6.820180892944336, "global_step": 137333, "epoch": 3269} {"train_loss": -6.66252326965332, "global_step": 137334, "epoch": 3269} {"train_loss": -6.734061241149902, "global_step": 137335, "epoch": 3269} {"train_loss": -6.806453704833984, "global_step": 137336, "epoch": 3269} {"train_loss": -6.7063374519348145, "global_step": 137337, "epoch": 3269} {"train_loss": -6.813116073608398, "global_step": 137338, "epoch": 3269} {"train_loss": -6.718330928257534, "global_step": 137339, "epoch": 3269, "val_loss": 67016.6015625} {"train_loss": -6.797158718109131, "global_step": 137340, "epoch": 3270} {"train_loss": -6.660771369934082, "global_step": 137341, "epoch": 3270} {"train_loss": -6.71319580078125, "global_step": 137342, "epoch": 3270} {"train_loss": -6.654183387756348, "global_step": 137343, "epoch": 3270} {"train_loss": -6.755217552185059, "global_step": 137344, "epoch": 3270} {"train_loss": -6.662210941314697, "global_step": 137345, "epoch": 3270} {"train_loss": -6.819003105163574, "global_step": 137346, "epoch": 3270} {"train_loss": -6.706067085266113, "global_step": 137347, "epoch": 3270} {"train_loss": -6.752715110778809, "global_step": 137348, "epoch": 3270} {"train_loss": -6.701277256011963, "global_step": 137349, "epoch": 3270} {"train_loss": -6.718698978424072, "global_step": 137350, "epoch": 3270} {"train_loss": -6.7650861740112305, "global_step": 137351, "epoch": 3270} {"train_loss": -6.713891983032227, "global_step": 137352, "epoch": 3270} {"train_loss": -6.618869781494141, "global_step": 137353, "epoch": 3270} {"train_loss": -6.769660472869873, "global_step": 137354, "epoch": 3270} {"train_loss": -6.722109317779541, "global_step": 137355, "epoch": 3270} {"train_loss": -6.637874603271484, "global_step": 137356, "epoch": 3270} {"train_loss": -6.733260154724121, "global_step": 137357, "epoch": 3270} {"train_loss": -6.763152122497559, "global_step": 137358, "epoch": 3270} {"train_loss": -6.737179279327393, "global_step": 137359, "epoch": 3270} {"train_loss": -6.742893218994141, "global_step": 137360, "epoch": 3270} {"train_loss": -6.737317085266113, "global_step": 137361, "epoch": 3270} {"train_loss": -6.82730770111084, "global_step": 137362, "epoch": 3270} {"train_loss": -6.633230209350586, "global_step": 137363, "epoch": 3270} {"train_loss": -6.7891998291015625, "global_step": 137364, "epoch": 3270} {"train_loss": -6.714978218078613, "global_step": 137365, "epoch": 3270} {"train_loss": -6.661059379577637, "global_step": 137366, "epoch": 3270} {"train_loss": -6.71037483215332, "global_step": 137367, "epoch": 3270} {"train_loss": -6.776268005371094, "global_step": 137368, "epoch": 3270} {"train_loss": -6.753171443939209, "global_step": 137369, "epoch": 3270} {"train_loss": -6.862723350524902, "global_step": 137370, "epoch": 3270} {"train_loss": -6.7558794021606445, "global_step": 137371, "epoch": 3270} {"train_loss": -6.80619478225708, "global_step": 137372, "epoch": 3270} {"train_loss": -6.683281421661377, "global_step": 137373, "epoch": 3270} {"train_loss": -6.687404632568359, "global_step": 137374, "epoch": 3270} {"train_loss": -6.771343231201172, "global_step": 137375, "epoch": 3270} {"train_loss": -6.725523948669434, "global_step": 137376, "epoch": 3270} {"train_loss": -6.713088512420654, "global_step": 137377, "epoch": 3270} {"train_loss": -6.7195844650268555, "global_step": 137378, "epoch": 3270} {"train_loss": -6.734755516052246, "global_step": 137379, "epoch": 3270} {"train_loss": -6.861930847167969, "global_step": 137380, "epoch": 3270} {"train_loss": -6.732025135131109, "global_step": 137381, "epoch": 3270, "val_loss": 67131.9921875} {"train_loss": -6.824225425720215, "global_step": 137382, "epoch": 3271} {"train_loss": -6.691629409790039, "global_step": 137383, "epoch": 3271} {"train_loss": -6.6582536697387695, "global_step": 137384, "epoch": 3271} {"train_loss": -6.748953819274902, "global_step": 137385, "epoch": 3271} {"train_loss": -6.613945007324219, "global_step": 137386, "epoch": 3271} {"train_loss": -6.7721099853515625, "global_step": 137387, "epoch": 3271} {"train_loss": -6.766043663024902, "global_step": 137388, "epoch": 3271} {"train_loss": -6.666696548461914, "global_step": 137389, "epoch": 3271} {"train_loss": -6.667864799499512, "global_step": 137390, "epoch": 3271} {"train_loss": -6.622073173522949, "global_step": 137391, "epoch": 3271} {"train_loss": -6.7276458740234375, "global_step": 137392, "epoch": 3271} {"train_loss": -6.716758728027344, "global_step": 137393, "epoch": 3271} {"train_loss": -6.638806343078613, "global_step": 137394, "epoch": 3271} {"train_loss": -6.696440696716309, "global_step": 137395, "epoch": 3271} {"train_loss": -6.573017120361328, "global_step": 137396, "epoch": 3271} {"train_loss": -6.6803388595581055, "global_step": 137397, "epoch": 3271} {"train_loss": -6.751269817352295, "global_step": 137398, "epoch": 3271} {"train_loss": -6.728615760803223, "global_step": 137399, "epoch": 3271} {"train_loss": -6.613638877868652, "global_step": 137400, "epoch": 3271} {"train_loss": -6.668705940246582, "global_step": 137401, "epoch": 3271} {"train_loss": -6.692915916442871, "global_step": 137402, "epoch": 3271} {"train_loss": -6.65478515625, "global_step": 137403, "epoch": 3271} {"train_loss": -6.642924785614014, "global_step": 137404, "epoch": 3271} {"train_loss": -6.656414985656738, "global_step": 137405, "epoch": 3271} {"train_loss": -6.746106147766113, "global_step": 137406, "epoch": 3271} {"train_loss": -6.774879455566406, "global_step": 137407, "epoch": 3271} {"train_loss": -6.842121601104736, "global_step": 137408, "epoch": 3271} {"train_loss": -6.759074687957764, "global_step": 137409, "epoch": 3271} {"train_loss": -6.764179229736328, "global_step": 137410, "epoch": 3271} {"train_loss": -6.853726387023926, "global_step": 137411, "epoch": 3271} {"train_loss": -6.750857830047607, "global_step": 137412, "epoch": 3271} {"train_loss": -6.70487642288208, "global_step": 137413, "epoch": 3271} {"train_loss": -6.692275524139404, "global_step": 137414, "epoch": 3271} {"train_loss": -6.6799821853637695, "global_step": 137415, "epoch": 3271} {"train_loss": -6.70509672164917, "global_step": 137416, "epoch": 3271} {"train_loss": -6.794741153717041, "global_step": 137417, "epoch": 3271} {"train_loss": -6.736886024475098, "global_step": 137418, "epoch": 3271} {"train_loss": -6.924699783325195, "global_step": 137419, "epoch": 3271} {"train_loss": -7.013612270355225, "global_step": 137420, "epoch": 3271} {"train_loss": -6.762429237365723, "global_step": 137421, "epoch": 3271} {"train_loss": -6.722490310668945, "global_step": 137422, "epoch": 3271} {"train_loss": -6.726027772540138, "global_step": 137423, "epoch": 3271, "val_loss": 66952.2109375} {"train_loss": -6.787332057952881, "global_step": 137424, "epoch": 3272} {"train_loss": -6.766872406005859, "global_step": 137425, "epoch": 3272} {"train_loss": -6.703897476196289, "global_step": 137426, "epoch": 3272} {"train_loss": -6.799042224884033, "global_step": 137427, "epoch": 3272} {"train_loss": -6.755675792694092, "global_step": 137428, "epoch": 3272} {"train_loss": -6.895816326141357, "global_step": 137429, "epoch": 3272} {"train_loss": -6.894412517547607, "global_step": 137430, "epoch": 3272} {"train_loss": -6.842657089233398, "global_step": 137431, "epoch": 3272} {"train_loss": -6.839156150817871, "global_step": 137432, "epoch": 3272} {"train_loss": -6.8423871994018555, "global_step": 137433, "epoch": 3272} {"train_loss": -6.826722621917725, "global_step": 137434, "epoch": 3272} {"train_loss": -6.752287864685059, "global_step": 137435, "epoch": 3272} {"train_loss": -6.794381141662598, "global_step": 137436, "epoch": 3272} {"train_loss": -6.757167816162109, "global_step": 137437, "epoch": 3272} {"train_loss": -6.833905220031738, "global_step": 137438, "epoch": 3272} {"train_loss": -6.811255931854248, "global_step": 137439, "epoch": 3272} {"train_loss": -6.86114501953125, "global_step": 137440, "epoch": 3272} {"train_loss": -6.740018844604492, "global_step": 137441, "epoch": 3272} {"train_loss": -6.750746250152588, "global_step": 137442, "epoch": 3272} {"train_loss": -6.861608028411865, "global_step": 137443, "epoch": 3272} {"train_loss": -6.715761184692383, "global_step": 137444, "epoch": 3272} {"train_loss": -6.740131855010986, "global_step": 137445, "epoch": 3272} {"train_loss": -6.751638412475586, "global_step": 137446, "epoch": 3272} {"train_loss": -6.817805290222168, "global_step": 137447, "epoch": 3272} {"train_loss": -6.669468402862549, "global_step": 137448, "epoch": 3272} {"train_loss": -6.683366298675537, "global_step": 137449, "epoch": 3272} {"train_loss": -6.738290786743164, "global_step": 137450, "epoch": 3272} {"train_loss": -6.820794582366943, "global_step": 137451, "epoch": 3272} {"train_loss": -6.664789199829102, "global_step": 137452, "epoch": 3272} {"train_loss": -6.75441837310791, "global_step": 137453, "epoch": 3272} {"train_loss": -6.647371292114258, "global_step": 137454, "epoch": 3272} {"train_loss": -6.635747909545898, "global_step": 137455, "epoch": 3272} {"train_loss": -6.873809814453125, "global_step": 137456, "epoch": 3272} {"train_loss": -6.785192966461182, "global_step": 137457, "epoch": 3272} {"train_loss": -6.749967098236084, "global_step": 137458, "epoch": 3272} {"train_loss": -6.724808692932129, "global_step": 137459, "epoch": 3272} {"train_loss": -6.673584461212158, "global_step": 137460, "epoch": 3272} {"train_loss": -6.74293327331543, "global_step": 137461, "epoch": 3272} {"train_loss": -6.677262783050537, "global_step": 137462, "epoch": 3272} {"train_loss": -6.681506633758545, "global_step": 137463, "epoch": 3272} {"train_loss": -6.60164737701416, "global_step": 137464, "epoch": 3272} {"train_loss": -6.757447742280506, "global_step": 137465, "epoch": 3272, "val_loss": 67143.5390625} {"train_loss": -6.6696367263793945, "global_step": 137466, "epoch": 3273} {"train_loss": -6.760161876678467, "global_step": 137467, "epoch": 3273} {"train_loss": -6.743261337280273, "global_step": 137468, "epoch": 3273} {"train_loss": -6.8547282218933105, "global_step": 137469, "epoch": 3273} {"train_loss": -6.613588809967041, "global_step": 137470, "epoch": 3273} {"train_loss": -6.671542167663574, "global_step": 137471, "epoch": 3273} {"train_loss": -6.631683349609375, "global_step": 137472, "epoch": 3273} {"train_loss": -6.605888843536377, "global_step": 137473, "epoch": 3273} {"train_loss": -6.643872261047363, "global_step": 137474, "epoch": 3273} {"train_loss": -6.678489685058594, "global_step": 137475, "epoch": 3273} {"train_loss": -6.560183525085449, "global_step": 137476, "epoch": 3273} {"train_loss": -6.7427778244018555, "global_step": 137477, "epoch": 3273} {"train_loss": -6.708209037780762, "global_step": 137478, "epoch": 3273} {"train_loss": -6.776214122772217, "global_step": 137479, "epoch": 3273} {"train_loss": -6.823065280914307, "global_step": 137480, "epoch": 3273} {"train_loss": -6.707648754119873, "global_step": 137481, "epoch": 3273} {"train_loss": -6.773502349853516, "global_step": 137482, "epoch": 3273} {"train_loss": -6.733843803405762, "global_step": 137483, "epoch": 3273} {"train_loss": -6.725602626800537, "global_step": 137484, "epoch": 3273} {"train_loss": -6.811034679412842, "global_step": 137485, "epoch": 3273} {"train_loss": -6.737332344055176, "global_step": 137486, "epoch": 3273} {"train_loss": -6.6800031661987305, "global_step": 137487, "epoch": 3273} {"train_loss": -6.677256107330322, "global_step": 137488, "epoch": 3273} {"train_loss": -6.744091033935547, "global_step": 137489, "epoch": 3273} {"train_loss": -6.815382480621338, "global_step": 137490, "epoch": 3273} {"train_loss": -6.677342414855957, "global_step": 137491, "epoch": 3273} {"train_loss": -6.773207187652588, "global_step": 137492, "epoch": 3273} {"train_loss": -6.697586536407471, "global_step": 137493, "epoch": 3273} {"train_loss": -6.805616855621338, "global_step": 137494, "epoch": 3273} {"train_loss": -6.706018924713135, "global_step": 137495, "epoch": 3273} {"train_loss": -6.696101188659668, "global_step": 137496, "epoch": 3273} {"train_loss": -6.810838222503662, "global_step": 137497, "epoch": 3273} {"train_loss": -6.7674150466918945, "global_step": 137498, "epoch": 3273} {"train_loss": -6.805213928222656, "global_step": 137499, "epoch": 3273} {"train_loss": -6.821239948272705, "global_step": 137500, "epoch": 3273} {"train_loss": -6.753297805786133, "global_step": 137501, "epoch": 3273} {"train_loss": -6.824298858642578, "global_step": 137502, "epoch": 3273} {"train_loss": -6.79020881652832, "global_step": 137503, "epoch": 3273} {"train_loss": -6.743485450744629, "global_step": 137504, "epoch": 3273} {"train_loss": -6.78985595703125, "global_step": 137505, "epoch": 3273} {"train_loss": -6.770483493804932, "global_step": 137506, "epoch": 3273} {"train_loss": -6.731503373100644, "global_step": 137507, "epoch": 3273, "val_loss": 66962.3203125} {"train_loss": -6.7786359786987305, "global_step": 137508, "epoch": 3274} {"train_loss": -6.568262577056885, "global_step": 137509, "epoch": 3274} {"train_loss": -6.788315296173096, "global_step": 137510, "epoch": 3274} {"train_loss": -6.661628723144531, "global_step": 137511, "epoch": 3274} {"train_loss": -6.682036399841309, "global_step": 137512, "epoch": 3274} {"train_loss": -6.7264084815979, "global_step": 137513, "epoch": 3274} {"train_loss": -6.486462116241455, "global_step": 137514, "epoch": 3274} {"train_loss": -6.868032455444336, "global_step": 137515, "epoch": 3274} {"train_loss": -6.596061706542969, "global_step": 137516, "epoch": 3274} {"train_loss": -6.476696491241455, "global_step": 137517, "epoch": 3274} {"train_loss": -6.790390968322754, "global_step": 137518, "epoch": 3274} {"train_loss": -6.599157333374023, "global_step": 137519, "epoch": 3274} {"train_loss": -6.70120906829834, "global_step": 137520, "epoch": 3274} {"train_loss": -6.541699409484863, "global_step": 137521, "epoch": 3274} {"train_loss": -6.59989070892334, "global_step": 137522, "epoch": 3274} {"train_loss": -6.699210166931152, "global_step": 137523, "epoch": 3274} {"train_loss": -6.78010368347168, "global_step": 137524, "epoch": 3274} {"train_loss": -6.748595237731934, "global_step": 137525, "epoch": 3274} {"train_loss": -6.7248077392578125, "global_step": 137526, "epoch": 3274} {"train_loss": -6.800085067749023, "global_step": 137527, "epoch": 3274} {"train_loss": -6.6905646324157715, "global_step": 137528, "epoch": 3274} {"train_loss": -6.6548171043396, "global_step": 137529, "epoch": 3274} {"train_loss": -6.621153831481934, "global_step": 137530, "epoch": 3274} {"train_loss": -6.655506134033203, "global_step": 137531, "epoch": 3274} {"train_loss": -6.816411972045898, "global_step": 137532, "epoch": 3274} {"train_loss": -6.68382453918457, "global_step": 137533, "epoch": 3274} {"train_loss": -6.744131088256836, "global_step": 137534, "epoch": 3274} {"train_loss": -6.641262054443359, "global_step": 137535, "epoch": 3274} {"train_loss": -6.722621440887451, "global_step": 137536, "epoch": 3274} {"train_loss": -6.873757362365723, "global_step": 137537, "epoch": 3274} {"train_loss": -6.636224746704102, "global_step": 137538, "epoch": 3274} {"train_loss": -6.694862365722656, "global_step": 137539, "epoch": 3274} {"train_loss": -6.61336612701416, "global_step": 137540, "epoch": 3274} {"train_loss": -6.807372570037842, "global_step": 137541, "epoch": 3274} {"train_loss": -6.761534690856934, "global_step": 137542, "epoch": 3274} {"train_loss": -6.709868431091309, "global_step": 137543, "epoch": 3274} {"train_loss": -6.745014190673828, "global_step": 137544, "epoch": 3274} {"train_loss": -6.672999858856201, "global_step": 137545, "epoch": 3274} {"train_loss": -6.742607593536377, "global_step": 137546, "epoch": 3274} {"train_loss": -6.755274772644043, "global_step": 137547, "epoch": 3274} {"train_loss": -6.654693126678467, "global_step": 137548, "epoch": 3274} {"train_loss": -6.692808389663696, "global_step": 137549, "epoch": 3274, "val_loss": 66987.640625} {"train_loss": -6.707709312438965, "global_step": 137550, "epoch": 3275} {"train_loss": -6.683681964874268, "global_step": 137551, "epoch": 3275} {"train_loss": -6.647119522094727, "global_step": 137552, "epoch": 3275} {"train_loss": -6.807890892028809, "global_step": 137553, "epoch": 3275} {"train_loss": -6.7688398361206055, "global_step": 137554, "epoch": 3275} {"train_loss": -6.699784755706787, "global_step": 137555, "epoch": 3275} {"train_loss": -6.683664798736572, "global_step": 137556, "epoch": 3275} {"train_loss": -6.645709037780762, "global_step": 137557, "epoch": 3275} {"train_loss": -6.785691261291504, "global_step": 137558, "epoch": 3275} {"train_loss": -6.601060390472412, "global_step": 137559, "epoch": 3275} {"train_loss": -6.70057487487793, "global_step": 137560, "epoch": 3275} {"train_loss": -6.650485992431641, "global_step": 137561, "epoch": 3275} {"train_loss": -6.694954872131348, "global_step": 137562, "epoch": 3275} {"train_loss": -6.734305381774902, "global_step": 137563, "epoch": 3275} {"train_loss": -6.7400665283203125, "global_step": 137564, "epoch": 3275} {"train_loss": -6.778524398803711, "global_step": 137565, "epoch": 3275} {"train_loss": -6.630720138549805, "global_step": 137566, "epoch": 3275} {"train_loss": -6.648283004760742, "global_step": 137567, "epoch": 3275} {"train_loss": -6.608440399169922, "global_step": 137568, "epoch": 3275} {"train_loss": -6.7563676834106445, "global_step": 137569, "epoch": 3275} {"train_loss": -6.756926536560059, "global_step": 137570, "epoch": 3275} {"train_loss": -6.634382247924805, "global_step": 137571, "epoch": 3275} {"train_loss": -6.734477996826172, "global_step": 137572, "epoch": 3275} {"train_loss": -6.708745956420898, "global_step": 137573, "epoch": 3275} {"train_loss": -6.655344009399414, "global_step": 137574, "epoch": 3275} {"train_loss": -6.702688217163086, "global_step": 137575, "epoch": 3275} {"train_loss": -6.608316421508789, "global_step": 137576, "epoch": 3275} {"train_loss": -6.7297868728637695, "global_step": 137577, "epoch": 3275} {"train_loss": -6.721796989440918, "global_step": 137578, "epoch": 3275} {"train_loss": -6.748536586761475, "global_step": 137579, "epoch": 3275} {"train_loss": -6.699409008026123, "global_step": 137580, "epoch": 3275} {"train_loss": -6.557771682739258, "global_step": 137581, "epoch": 3275} {"train_loss": -6.725555419921875, "global_step": 137582, "epoch": 3275} {"train_loss": -6.7997026443481445, "global_step": 137583, "epoch": 3275} {"train_loss": -6.87345027923584, "global_step": 137584, "epoch": 3275} {"train_loss": -6.765774726867676, "global_step": 137585, "epoch": 3275} {"train_loss": -6.781146049499512, "global_step": 137586, "epoch": 3275} {"train_loss": -6.770062446594238, "global_step": 137587, "epoch": 3275} {"train_loss": -6.732064723968506, "global_step": 137588, "epoch": 3275} {"train_loss": -6.620670318603516, "global_step": 137589, "epoch": 3275} {"train_loss": -6.651466369628906, "global_step": 137590, "epoch": 3275} {"train_loss": -6.707059610457647, "global_step": 137591, "epoch": 3275, "val_loss": 66865.3671875} {"train_loss": -6.832847595214844, "global_step": 137592, "epoch": 3276} {"train_loss": -6.673550605773926, "global_step": 137593, "epoch": 3276} {"train_loss": -6.708640098571777, "global_step": 137594, "epoch": 3276} {"train_loss": -6.834359169006348, "global_step": 137595, "epoch": 3276} {"train_loss": -6.7329607009887695, "global_step": 137596, "epoch": 3276} {"train_loss": -6.8098978996276855, "global_step": 137597, "epoch": 3276} {"train_loss": -6.666252136230469, "global_step": 137598, "epoch": 3276} {"train_loss": -6.833449363708496, "global_step": 137599, "epoch": 3276} {"train_loss": -6.725732803344727, "global_step": 137600, "epoch": 3276} {"train_loss": -6.699654579162598, "global_step": 137601, "epoch": 3276} {"train_loss": -6.772870063781738, "global_step": 137602, "epoch": 3276} {"train_loss": -6.743773460388184, "global_step": 137603, "epoch": 3276} {"train_loss": -6.67783260345459, "global_step": 137604, "epoch": 3276} {"train_loss": -6.74663782119751, "global_step": 137605, "epoch": 3276} {"train_loss": -6.819104194641113, "global_step": 137606, "epoch": 3276} {"train_loss": -6.750361919403076, "global_step": 137607, "epoch": 3276} {"train_loss": -6.697600364685059, "global_step": 137608, "epoch": 3276} {"train_loss": -6.754024028778076, "global_step": 137609, "epoch": 3276} {"train_loss": -6.767331123352051, "global_step": 137610, "epoch": 3276} {"train_loss": -6.710332870483398, "global_step": 137611, "epoch": 3276} {"train_loss": -6.903131484985352, "global_step": 137612, "epoch": 3276} {"train_loss": -6.704188346862793, "global_step": 137613, "epoch": 3276} {"train_loss": -6.8687591552734375, "global_step": 137614, "epoch": 3276} {"train_loss": -6.718173027038574, "global_step": 137615, "epoch": 3276} {"train_loss": -6.636626720428467, "global_step": 137616, "epoch": 3276} {"train_loss": -6.8155107498168945, "global_step": 137617, "epoch": 3276} {"train_loss": -6.7368364334106445, "global_step": 137618, "epoch": 3276} {"train_loss": -6.668495178222656, "global_step": 137619, "epoch": 3276} {"train_loss": -6.773238182067871, "global_step": 137620, "epoch": 3276} {"train_loss": -6.857834339141846, "global_step": 137621, "epoch": 3276} {"train_loss": -6.930306434631348, "global_step": 137622, "epoch": 3276} {"train_loss": -6.780430793762207, "global_step": 137623, "epoch": 3276} {"train_loss": -6.74637508392334, "global_step": 137624, "epoch": 3276} {"train_loss": -6.733765125274658, "global_step": 137625, "epoch": 3276} {"train_loss": -6.776330947875977, "global_step": 137626, "epoch": 3276} {"train_loss": -6.701706409454346, "global_step": 137627, "epoch": 3276} {"train_loss": -6.794034004211426, "global_step": 137628, "epoch": 3276} {"train_loss": -6.773246765136719, "global_step": 137629, "epoch": 3276} {"train_loss": -6.708568572998047, "global_step": 137630, "epoch": 3276} {"train_loss": -6.740731239318848, "global_step": 137631, "epoch": 3276} {"train_loss": -6.727940559387207, "global_step": 137632, "epoch": 3276} {"train_loss": -6.754601910000756, "global_step": 137633, "epoch": 3276, "val_loss": 67136.6875} {"train_loss": -6.777189254760742, "global_step": 137634, "epoch": 3277} {"train_loss": -6.72851037979126, "global_step": 137635, "epoch": 3277} {"train_loss": -6.649233341217041, "global_step": 137636, "epoch": 3277} {"train_loss": -6.836791515350342, "global_step": 137637, "epoch": 3277} {"train_loss": -6.656760215759277, "global_step": 137638, "epoch": 3277} {"train_loss": -6.82311487197876, "global_step": 137639, "epoch": 3277} {"train_loss": -6.610140323638916, "global_step": 137640, "epoch": 3277} {"train_loss": -6.723119735717773, "global_step": 137641, "epoch": 3277} {"train_loss": -6.80930233001709, "global_step": 137642, "epoch": 3277} {"train_loss": -6.692409992218018, "global_step": 137643, "epoch": 3277} {"train_loss": -6.837369441986084, "global_step": 137644, "epoch": 3277} {"train_loss": -6.651790142059326, "global_step": 137645, "epoch": 3277} {"train_loss": -6.536827087402344, "global_step": 137646, "epoch": 3277} {"train_loss": -6.810689449310303, "global_step": 137647, "epoch": 3277} {"train_loss": -6.785731792449951, "global_step": 137648, "epoch": 3277} {"train_loss": -6.598764419555664, "global_step": 137649, "epoch": 3277} {"train_loss": -6.860608100891113, "global_step": 137650, "epoch": 3277} {"train_loss": -6.675705909729004, "global_step": 137651, "epoch": 3277} {"train_loss": -6.629652976989746, "global_step": 137652, "epoch": 3277} {"train_loss": -6.831546783447266, "global_step": 137653, "epoch": 3277} {"train_loss": -6.759235382080078, "global_step": 137654, "epoch": 3277} {"train_loss": -6.798010349273682, "global_step": 137655, "epoch": 3277} {"train_loss": -6.762551784515381, "global_step": 137656, "epoch": 3277} {"train_loss": -6.683479309082031, "global_step": 137657, "epoch": 3277} {"train_loss": -6.829799652099609, "global_step": 137658, "epoch": 3277} {"train_loss": -6.710468292236328, "global_step": 137659, "epoch": 3277} {"train_loss": -6.740427017211914, "global_step": 137660, "epoch": 3277} {"train_loss": -6.707414627075195, "global_step": 137661, "epoch": 3277} {"train_loss": -6.624369144439697, "global_step": 137662, "epoch": 3277} {"train_loss": -6.722625732421875, "global_step": 137663, "epoch": 3277} {"train_loss": -6.861706733703613, "global_step": 137664, "epoch": 3277} {"train_loss": -6.769639015197754, "global_step": 137665, "epoch": 3277} {"train_loss": -6.659755706787109, "global_step": 137666, "epoch": 3277} {"train_loss": -6.668859481811523, "global_step": 137667, "epoch": 3277} {"train_loss": -6.73838472366333, "global_step": 137668, "epoch": 3277} {"train_loss": -6.75694465637207, "global_step": 137669, "epoch": 3277} {"train_loss": -6.7144389152526855, "global_step": 137670, "epoch": 3277} {"train_loss": -6.75294303894043, "global_step": 137671, "epoch": 3277} {"train_loss": -6.7565388679504395, "global_step": 137672, "epoch": 3277} {"train_loss": -6.6845784187316895, "global_step": 137673, "epoch": 3277} {"train_loss": -6.882648468017578, "global_step": 137674, "epoch": 3277} {"train_loss": -6.732066461018154, "global_step": 137675, "epoch": 3277, "val_loss": 67084.203125} {"train_loss": -6.862773895263672, "global_step": 137676, "epoch": 3278} {"train_loss": -6.638089656829834, "global_step": 137677, "epoch": 3278} {"train_loss": -6.7851057052612305, "global_step": 137678, "epoch": 3278} {"train_loss": -6.74246883392334, "global_step": 137679, "epoch": 3278} {"train_loss": -6.753345012664795, "global_step": 137680, "epoch": 3278} {"train_loss": -6.788916110992432, "global_step": 137681, "epoch": 3278} {"train_loss": -6.809988975524902, "global_step": 137682, "epoch": 3278} {"train_loss": -6.622593879699707, "global_step": 137683, "epoch": 3278} {"train_loss": -6.7653584480285645, "global_step": 137684, "epoch": 3278} {"train_loss": -6.798220157623291, "global_step": 137685, "epoch": 3278} {"train_loss": -6.734758377075195, "global_step": 137686, "epoch": 3278} {"train_loss": -6.77294921875, "global_step": 137687, "epoch": 3278} {"train_loss": -6.7824907302856445, "global_step": 137688, "epoch": 3278} {"train_loss": -6.891721248626709, "global_step": 137689, "epoch": 3278} {"train_loss": -6.700393199920654, "global_step": 137690, "epoch": 3278} {"train_loss": -6.759926795959473, "global_step": 137691, "epoch": 3278} {"train_loss": -6.813227653503418, "global_step": 137692, "epoch": 3278} {"train_loss": -6.746002197265625, "global_step": 137693, "epoch": 3278} {"train_loss": -6.782322883605957, "global_step": 137694, "epoch": 3278} {"train_loss": -6.78929328918457, "global_step": 137695, "epoch": 3278} {"train_loss": -6.794007301330566, "global_step": 137696, "epoch": 3278} {"train_loss": -6.843346118927002, "global_step": 137697, "epoch": 3278} {"train_loss": -6.736339569091797, "global_step": 137698, "epoch": 3278} {"train_loss": -6.858839988708496, "global_step": 137699, "epoch": 3278} {"train_loss": -6.772792339324951, "global_step": 137700, "epoch": 3278} {"train_loss": -6.820265293121338, "global_step": 137701, "epoch": 3278} {"train_loss": -6.834988594055176, "global_step": 137702, "epoch": 3278} {"train_loss": -6.729509353637695, "global_step": 137703, "epoch": 3278} {"train_loss": -6.842935562133789, "global_step": 137704, "epoch": 3278} {"train_loss": -6.689751625061035, "global_step": 137705, "epoch": 3278} {"train_loss": -6.750452995300293, "global_step": 137706, "epoch": 3278} {"train_loss": -6.69528865814209, "global_step": 137707, "epoch": 3278} {"train_loss": -6.807319164276123, "global_step": 137708, "epoch": 3278} {"train_loss": -6.723898887634277, "global_step": 137709, "epoch": 3278} {"train_loss": -6.952406883239746, "global_step": 137710, "epoch": 3278} {"train_loss": -6.579647064208984, "global_step": 137711, "epoch": 3278} {"train_loss": -6.683470249176025, "global_step": 137712, "epoch": 3278} {"train_loss": -6.8353753089904785, "global_step": 137713, "epoch": 3278} {"train_loss": -6.687891960144043, "global_step": 137714, "epoch": 3278} {"train_loss": -6.607085704803467, "global_step": 137715, "epoch": 3278} {"train_loss": -6.811979293823242, "global_step": 137716, "epoch": 3278} {"train_loss": -6.763460147948492, "global_step": 137717, "epoch": 3278, "val_loss": 66990.5} {"train_loss": -6.744013786315918, "global_step": 137718, "epoch": 3279} {"train_loss": -6.746676921844482, "global_step": 137719, "epoch": 3279} {"train_loss": -6.8554511070251465, "global_step": 137720, "epoch": 3279} {"train_loss": -6.676136016845703, "global_step": 137721, "epoch": 3279} {"train_loss": -6.780707359313965, "global_step": 137722, "epoch": 3279} {"train_loss": -6.842489719390869, "global_step": 137723, "epoch": 3279} {"train_loss": -6.775814056396484, "global_step": 137724, "epoch": 3279} {"train_loss": -6.80378532409668, "global_step": 137725, "epoch": 3279} {"train_loss": -6.718504905700684, "global_step": 137726, "epoch": 3279} {"train_loss": -6.749133110046387, "global_step": 137727, "epoch": 3279} {"train_loss": -6.7103471755981445, "global_step": 137728, "epoch": 3279} {"train_loss": -6.735100269317627, "global_step": 137729, "epoch": 3279} {"train_loss": -6.703792572021484, "global_step": 137730, "epoch": 3279} {"train_loss": -6.714250564575195, "global_step": 137731, "epoch": 3279} {"train_loss": -6.821192741394043, "global_step": 137732, "epoch": 3279} {"train_loss": -6.603713035583496, "global_step": 137733, "epoch": 3279} {"train_loss": -6.747145652770996, "global_step": 137734, "epoch": 3279} {"train_loss": -6.648723602294922, "global_step": 137735, "epoch": 3279} {"train_loss": -6.638957977294922, "global_step": 137736, "epoch": 3279} {"train_loss": -6.77802038192749, "global_step": 137737, "epoch": 3279} {"train_loss": -6.516820907592773, "global_step": 137738, "epoch": 3279} {"train_loss": -6.591021537780762, "global_step": 137739, "epoch": 3279} {"train_loss": -6.763606071472168, "global_step": 137740, "epoch": 3279} {"train_loss": -6.552003860473633, "global_step": 137741, "epoch": 3279} {"train_loss": -6.697678565979004, "global_step": 137742, "epoch": 3279} {"train_loss": -6.753819465637207, "global_step": 137743, "epoch": 3279} {"train_loss": -6.63327693939209, "global_step": 137744, "epoch": 3279} {"train_loss": -6.79885721206665, "global_step": 137745, "epoch": 3279} {"train_loss": -6.661597728729248, "global_step": 137746, "epoch": 3279} {"train_loss": -6.777022361755371, "global_step": 137747, "epoch": 3279} {"train_loss": -6.823235034942627, "global_step": 137748, "epoch": 3279} {"train_loss": -6.7228193283081055, "global_step": 137749, "epoch": 3279} {"train_loss": -6.73091983795166, "global_step": 137750, "epoch": 3279} {"train_loss": -6.732394695281982, "global_step": 137751, "epoch": 3279} {"train_loss": -6.633188724517822, "global_step": 137752, "epoch": 3279} {"train_loss": -6.753531455993652, "global_step": 137753, "epoch": 3279} {"train_loss": -6.761187553405762, "global_step": 137754, "epoch": 3279} {"train_loss": -6.754434585571289, "global_step": 137755, "epoch": 3279} {"train_loss": -6.787514686584473, "global_step": 137756, "epoch": 3279} {"train_loss": -6.719737529754639, "global_step": 137757, "epoch": 3279} {"train_loss": -6.81917667388916, "global_step": 137758, "epoch": 3279} {"train_loss": -6.726157563073294, "global_step": 137759, "epoch": 3279, "val_loss": 67079.9453125} {"train_loss": -6.616687774658203, "global_step": 137760, "epoch": 3280} {"train_loss": -6.797064304351807, "global_step": 137761, "epoch": 3280} {"train_loss": -6.632439613342285, "global_step": 137762, "epoch": 3280} {"train_loss": -6.837968826293945, "global_step": 137763, "epoch": 3280} {"train_loss": -6.690617561340332, "global_step": 137764, "epoch": 3280} {"train_loss": -6.722111701965332, "global_step": 137765, "epoch": 3280} {"train_loss": -6.809559345245361, "global_step": 137766, "epoch": 3280} {"train_loss": -6.768087387084961, "global_step": 137767, "epoch": 3280} {"train_loss": -6.726302623748779, "global_step": 137768, "epoch": 3280} {"train_loss": -6.680148124694824, "global_step": 137769, "epoch": 3280} {"train_loss": -6.848958492279053, "global_step": 137770, "epoch": 3280} {"train_loss": -6.60996150970459, "global_step": 137771, "epoch": 3280} {"train_loss": -6.73729944229126, "global_step": 137772, "epoch": 3280} {"train_loss": -6.664000988006592, "global_step": 137773, "epoch": 3280} {"train_loss": -6.735535621643066, "global_step": 137774, "epoch": 3280} {"train_loss": -6.72610330581665, "global_step": 137775, "epoch": 3280} {"train_loss": -6.728023529052734, "global_step": 137776, "epoch": 3280} {"train_loss": -6.683140754699707, "global_step": 137777, "epoch": 3280} {"train_loss": -6.8080291748046875, "global_step": 137778, "epoch": 3280} {"train_loss": -6.744667053222656, "global_step": 137779, "epoch": 3280} {"train_loss": -6.6908674240112305, "global_step": 137780, "epoch": 3280} {"train_loss": -6.731901168823242, "global_step": 137781, "epoch": 3280} {"train_loss": -6.729373455047607, "global_step": 137782, "epoch": 3280} {"train_loss": -6.814319610595703, "global_step": 137783, "epoch": 3280} {"train_loss": -6.709038734436035, "global_step": 137784, "epoch": 3280} {"train_loss": -6.692593097686768, "global_step": 137785, "epoch": 3280} {"train_loss": -6.732571601867676, "global_step": 137786, "epoch": 3280} {"train_loss": -6.763354301452637, "global_step": 137787, "epoch": 3280} {"train_loss": -6.769769668579102, "global_step": 137788, "epoch": 3280} {"train_loss": -6.735579490661621, "global_step": 137789, "epoch": 3280} {"train_loss": -6.658901214599609, "global_step": 137790, "epoch": 3280} {"train_loss": -6.760432243347168, "global_step": 137791, "epoch": 3280} {"train_loss": -6.782515525817871, "global_step": 137792, "epoch": 3280} {"train_loss": -6.772383689880371, "global_step": 137793, "epoch": 3280} {"train_loss": -6.812353134155273, "global_step": 137794, "epoch": 3280} {"train_loss": -6.844358444213867, "global_step": 137795, "epoch": 3280} {"train_loss": -6.81888484954834, "global_step": 137796, "epoch": 3280} {"train_loss": -6.727255821228027, "global_step": 137797, "epoch": 3280} {"train_loss": -6.804725646972656, "global_step": 137798, "epoch": 3280} {"train_loss": -6.89634895324707, "global_step": 137799, "epoch": 3280} {"train_loss": -6.747989654541016, "global_step": 137800, "epoch": 3280} {"train_loss": -6.745530298777989, "global_step": 137801, "epoch": 3280, "val_loss": 67196.1796875} {"train_loss": -6.793269634246826, "global_step": 137802, "epoch": 3281} {"train_loss": -6.751477241516113, "global_step": 137803, "epoch": 3281} {"train_loss": -6.6464033126831055, "global_step": 137804, "epoch": 3281} {"train_loss": -6.778909683227539, "global_step": 137805, "epoch": 3281} {"train_loss": -6.803251266479492, "global_step": 137806, "epoch": 3281} {"train_loss": -6.741055965423584, "global_step": 137807, "epoch": 3281} {"train_loss": -6.742191314697266, "global_step": 137808, "epoch": 3281} {"train_loss": -6.769786834716797, "global_step": 137809, "epoch": 3281} {"train_loss": -6.7671895027160645, "global_step": 137810, "epoch": 3281} {"train_loss": -6.702451705932617, "global_step": 137811, "epoch": 3281} {"train_loss": -6.663592338562012, "global_step": 137812, "epoch": 3281} {"train_loss": -6.775948524475098, "global_step": 137813, "epoch": 3281} {"train_loss": -6.654726028442383, "global_step": 137814, "epoch": 3281} {"train_loss": -6.797658443450928, "global_step": 137815, "epoch": 3281} {"train_loss": -6.755163669586182, "global_step": 137816, "epoch": 3281} {"train_loss": -6.673870086669922, "global_step": 137817, "epoch": 3281} {"train_loss": -6.700006008148193, "global_step": 137818, "epoch": 3281} {"train_loss": -6.623333930969238, "global_step": 137819, "epoch": 3281} {"train_loss": -6.683128356933594, "global_step": 137820, "epoch": 3281} {"train_loss": -6.644308567047119, "global_step": 137821, "epoch": 3281} {"train_loss": -6.659691333770752, "global_step": 137822, "epoch": 3281} {"train_loss": -6.7505998611450195, "global_step": 137823, "epoch": 3281} {"train_loss": -6.785158157348633, "global_step": 137824, "epoch": 3281} {"train_loss": -6.631591320037842, "global_step": 137825, "epoch": 3281} {"train_loss": -6.697558403015137, "global_step": 137826, "epoch": 3281} {"train_loss": -6.641577243804932, "global_step": 137827, "epoch": 3281} {"train_loss": -6.713274955749512, "global_step": 137828, "epoch": 3281} {"train_loss": -6.763576507568359, "global_step": 137829, "epoch": 3281} {"train_loss": -6.573458194732666, "global_step": 137830, "epoch": 3281} {"train_loss": -6.693384647369385, "global_step": 137831, "epoch": 3281} {"train_loss": -6.673686504364014, "global_step": 137832, "epoch": 3281} {"train_loss": -6.712533473968506, "global_step": 137833, "epoch": 3281} {"train_loss": -6.79941987991333, "global_step": 137834, "epoch": 3281} {"train_loss": -6.709475994110107, "global_step": 137835, "epoch": 3281} {"train_loss": -6.891964912414551, "global_step": 137836, "epoch": 3281} {"train_loss": -6.912708759307861, "global_step": 137837, "epoch": 3281} {"train_loss": -6.717824935913086, "global_step": 137838, "epoch": 3281} {"train_loss": -6.757964611053467, "global_step": 137839, "epoch": 3281} {"train_loss": -6.767523765563965, "global_step": 137840, "epoch": 3281} {"train_loss": -6.799074172973633, "global_step": 137841, "epoch": 3281} {"train_loss": -6.743831634521484, "global_step": 137842, "epoch": 3281} {"train_loss": -6.731726896195185, "global_step": 137843, "epoch": 3281, "val_loss": 66959.3984375} {"train_loss": -6.806347846984863, "global_step": 137844, "epoch": 3282} {"train_loss": -6.8202009201049805, "global_step": 137845, "epoch": 3282} {"train_loss": -6.799337387084961, "global_step": 137846, "epoch": 3282} {"train_loss": -6.718116760253906, "global_step": 137847, "epoch": 3282} {"train_loss": -6.787333011627197, "global_step": 137848, "epoch": 3282} {"train_loss": -6.906914710998535, "global_step": 137849, "epoch": 3282} {"train_loss": -6.7234883308410645, "global_step": 137850, "epoch": 3282} {"train_loss": -6.718051910400391, "global_step": 137851, "epoch": 3282} {"train_loss": -6.731673240661621, "global_step": 137852, "epoch": 3282} {"train_loss": -6.737124443054199, "global_step": 137853, "epoch": 3282} {"train_loss": -6.7839460372924805, "global_step": 137854, "epoch": 3282} {"train_loss": -6.794460296630859, "global_step": 137855, "epoch": 3282} {"train_loss": -6.806251049041748, "global_step": 137856, "epoch": 3282} {"train_loss": -6.761589050292969, "global_step": 137857, "epoch": 3282} {"train_loss": -6.660629749298096, "global_step": 137858, "epoch": 3282} {"train_loss": -6.738492965698242, "global_step": 137859, "epoch": 3282} {"train_loss": -6.854736804962158, "global_step": 137860, "epoch": 3282} {"train_loss": -6.737329006195068, "global_step": 137861, "epoch": 3282} {"train_loss": -6.77182674407959, "global_step": 137862, "epoch": 3282} {"train_loss": -6.717815399169922, "global_step": 137863, "epoch": 3282} {"train_loss": -6.779363632202148, "global_step": 137864, "epoch": 3282} {"train_loss": -6.785644054412842, "global_step": 137865, "epoch": 3282} {"train_loss": -6.741189002990723, "global_step": 137866, "epoch": 3282} {"train_loss": -6.746092796325684, "global_step": 137867, "epoch": 3282} {"train_loss": -6.720297813415527, "global_step": 137868, "epoch": 3282} {"train_loss": -6.823741912841797, "global_step": 137869, "epoch": 3282} {"train_loss": -6.701188564300537, "global_step": 137870, "epoch": 3282} {"train_loss": -6.728325843811035, "global_step": 137871, "epoch": 3282} {"train_loss": -6.754024505615234, "global_step": 137872, "epoch": 3282} {"train_loss": -6.686753273010254, "global_step": 137873, "epoch": 3282} {"train_loss": -6.704543113708496, "global_step": 137874, "epoch": 3282} {"train_loss": -6.572193145751953, "global_step": 137875, "epoch": 3282} {"train_loss": -6.813878059387207, "global_step": 137876, "epoch": 3282} {"train_loss": -6.699525356292725, "global_step": 137877, "epoch": 3282} {"train_loss": -6.735642910003662, "global_step": 137878, "epoch": 3282} {"train_loss": -6.666637420654297, "global_step": 137879, "epoch": 3282} {"train_loss": -6.671696186065674, "global_step": 137880, "epoch": 3282} {"train_loss": -6.736788749694824, "global_step": 137881, "epoch": 3282} {"train_loss": -6.691368579864502, "global_step": 137882, "epoch": 3282} {"train_loss": -6.79958963394165, "global_step": 137883, "epoch": 3282} {"train_loss": -6.575523376464844, "global_step": 137884, "epoch": 3282} {"train_loss": -6.746186052049909, "global_step": 137885, "epoch": 3282, "val_loss": 67075.109375} {"train_loss": -6.73222541809082, "global_step": 137886, "epoch": 3283} {"train_loss": -6.787195205688477, "global_step": 137887, "epoch": 3283} {"train_loss": -6.815459251403809, "global_step": 137888, "epoch": 3283} {"train_loss": -6.630928993225098, "global_step": 137889, "epoch": 3283} {"train_loss": -6.6927642822265625, "global_step": 137890, "epoch": 3283} {"train_loss": -6.698177337646484, "global_step": 137891, "epoch": 3283} {"train_loss": -6.851595878601074, "global_step": 137892, "epoch": 3283} {"train_loss": -6.70116662979126, "global_step": 137893, "epoch": 3283} {"train_loss": -6.658178329467773, "global_step": 137894, "epoch": 3283} {"train_loss": -6.708289623260498, "global_step": 137895, "epoch": 3283} {"train_loss": -6.6420440673828125, "global_step": 137896, "epoch": 3283} {"train_loss": -6.650468826293945, "global_step": 137897, "epoch": 3283} {"train_loss": -6.667537689208984, "global_step": 137898, "epoch": 3283} {"train_loss": -6.726313591003418, "global_step": 137899, "epoch": 3283} {"train_loss": -6.765974998474121, "global_step": 137900, "epoch": 3283} {"train_loss": -6.745299816131592, "global_step": 137901, "epoch": 3283} {"train_loss": -6.7545599937438965, "global_step": 137902, "epoch": 3283} {"train_loss": -6.705690383911133, "global_step": 137903, "epoch": 3283} {"train_loss": -6.734992027282715, "global_step": 137904, "epoch": 3283} {"train_loss": -6.685494422912598, "global_step": 137905, "epoch": 3283} {"train_loss": -6.855719566345215, "global_step": 137906, "epoch": 3283} {"train_loss": -6.790632724761963, "global_step": 137907, "epoch": 3283} {"train_loss": -6.72390079498291, "global_step": 137908, "epoch": 3283} {"train_loss": -6.638920783996582, "global_step": 137909, "epoch": 3283} {"train_loss": -6.808889389038086, "global_step": 137910, "epoch": 3283} {"train_loss": -6.6369547843933105, "global_step": 137911, "epoch": 3283} {"train_loss": -6.7835516929626465, "global_step": 137912, "epoch": 3283} {"train_loss": -6.793871879577637, "global_step": 137913, "epoch": 3283} {"train_loss": -6.741429328918457, "global_step": 137914, "epoch": 3283} {"train_loss": -6.74661922454834, "global_step": 137915, "epoch": 3283} {"train_loss": -6.745793342590332, "global_step": 137916, "epoch": 3283} {"train_loss": -6.760582447052002, "global_step": 137917, "epoch": 3283} {"train_loss": -6.609400749206543, "global_step": 137918, "epoch": 3283} {"train_loss": -6.690886497497559, "global_step": 137919, "epoch": 3283} {"train_loss": -6.755643844604492, "global_step": 137920, "epoch": 3283} {"train_loss": -6.403477668762207, "global_step": 137921, "epoch": 3283} {"train_loss": -6.702390193939209, "global_step": 137922, "epoch": 3283} {"train_loss": -6.667567253112793, "global_step": 137923, "epoch": 3283} {"train_loss": -6.542401313781738, "global_step": 137924, "epoch": 3283} {"train_loss": -6.716220855712891, "global_step": 137925, "epoch": 3283} {"train_loss": -6.612361907958984, "global_step": 137926, "epoch": 3283} {"train_loss": -6.706718671889532, "global_step": 137927, "epoch": 3283, "val_loss": 67182.328125} {"train_loss": -6.678686141967773, "global_step": 137928, "epoch": 3284} {"train_loss": -6.584072589874268, "global_step": 137929, "epoch": 3284} {"train_loss": -6.589188575744629, "global_step": 137930, "epoch": 3284} {"train_loss": -6.639424800872803, "global_step": 137931, "epoch": 3284} {"train_loss": -6.76992130279541, "global_step": 137932, "epoch": 3284} {"train_loss": -6.646726131439209, "global_step": 137933, "epoch": 3284} {"train_loss": -6.629039287567139, "global_step": 137934, "epoch": 3284} {"train_loss": -6.5783514976501465, "global_step": 137935, "epoch": 3284} {"train_loss": -6.707383632659912, "global_step": 137936, "epoch": 3284} {"train_loss": -6.618677139282227, "global_step": 137937, "epoch": 3284} {"train_loss": -6.810373306274414, "global_step": 137938, "epoch": 3284} {"train_loss": -6.6237287521362305, "global_step": 137939, "epoch": 3284} {"train_loss": -6.758955478668213, "global_step": 137940, "epoch": 3284} {"train_loss": -6.751225471496582, "global_step": 137941, "epoch": 3284} {"train_loss": -6.742868423461914, "global_step": 137942, "epoch": 3284} {"train_loss": -6.644552230834961, "global_step": 137943, "epoch": 3284} {"train_loss": -6.588283538818359, "global_step": 137944, "epoch": 3284} {"train_loss": -6.717845916748047, "global_step": 137945, "epoch": 3284} {"train_loss": -6.670402526855469, "global_step": 137946, "epoch": 3284} {"train_loss": -6.7881903648376465, "global_step": 137947, "epoch": 3284} {"train_loss": -6.674007892608643, "global_step": 137948, "epoch": 3284} {"train_loss": -6.7252912521362305, "global_step": 137949, "epoch": 3284} {"train_loss": -6.5252366065979, "global_step": 137950, "epoch": 3284} {"train_loss": -6.859482765197754, "global_step": 137951, "epoch": 3284} {"train_loss": -6.6911773681640625, "global_step": 137952, "epoch": 3284} {"train_loss": -6.6858134269714355, "global_step": 137953, "epoch": 3284} {"train_loss": -6.658778667449951, "global_step": 137954, "epoch": 3284} {"train_loss": -6.707773208618164, "global_step": 137955, "epoch": 3284} {"train_loss": -6.732690811157227, "global_step": 137956, "epoch": 3284} {"train_loss": -6.70904541015625, "global_step": 137957, "epoch": 3284} {"train_loss": -6.634545803070068, "global_step": 137958, "epoch": 3284} {"train_loss": -6.7133684158325195, "global_step": 137959, "epoch": 3284} {"train_loss": -6.6690263748168945, "global_step": 137960, "epoch": 3284} {"train_loss": -6.870561599731445, "global_step": 137961, "epoch": 3284} {"train_loss": -6.758199214935303, "global_step": 137962, "epoch": 3284} {"train_loss": -6.756809234619141, "global_step": 137963, "epoch": 3284} {"train_loss": -6.781571388244629, "global_step": 137964, "epoch": 3284} {"train_loss": -6.795868873596191, "global_step": 137965, "epoch": 3284} {"train_loss": -6.730995178222656, "global_step": 137966, "epoch": 3284} {"train_loss": -6.59638786315918, "global_step": 137967, "epoch": 3284} {"train_loss": -6.716612815856934, "global_step": 137968, "epoch": 3284} {"train_loss": -6.696263801483881, "global_step": 137969, "epoch": 3284, "val_loss": 67350.78125} {"train_loss": -6.657361030578613, "global_step": 137970, "epoch": 3285} {"train_loss": -6.856017589569092, "global_step": 137971, "epoch": 3285} {"train_loss": -6.623908519744873, "global_step": 137972, "epoch": 3285} {"train_loss": -6.688421249389648, "global_step": 137973, "epoch": 3285} {"train_loss": -6.786724090576172, "global_step": 137974, "epoch": 3285} {"train_loss": -6.6032843589782715, "global_step": 137975, "epoch": 3285} {"train_loss": -6.724708080291748, "global_step": 137976, "epoch": 3285} {"train_loss": -6.733750343322754, "global_step": 137977, "epoch": 3285} {"train_loss": -6.679998397827148, "global_step": 137978, "epoch": 3285} {"train_loss": -6.7476677894592285, "global_step": 137979, "epoch": 3285} {"train_loss": -6.770788192749023, "global_step": 137980, "epoch": 3285} {"train_loss": -6.85188102722168, "global_step": 137981, "epoch": 3285} {"train_loss": -6.696485996246338, "global_step": 137982, "epoch": 3285} {"train_loss": -6.8238444328308105, "global_step": 137983, "epoch": 3285} {"train_loss": -6.7914934158325195, "global_step": 137984, "epoch": 3285} {"train_loss": -6.756601333618164, "global_step": 137985, "epoch": 3285} {"train_loss": -6.725521564483643, "global_step": 137986, "epoch": 3285} {"train_loss": -6.601626396179199, "global_step": 137987, "epoch": 3285} {"train_loss": -6.750558853149414, "global_step": 137988, "epoch": 3285} {"train_loss": -6.670486927032471, "global_step": 137989, "epoch": 3285} {"train_loss": -6.681502342224121, "global_step": 137990, "epoch": 3285} {"train_loss": -6.674576282501221, "global_step": 137991, "epoch": 3285} {"train_loss": -6.797179698944092, "global_step": 137992, "epoch": 3285} {"train_loss": -6.7997212409973145, "global_step": 137993, "epoch": 3285} {"train_loss": -6.788951873779297, "global_step": 137994, "epoch": 3285} {"train_loss": -6.72711181640625, "global_step": 137995, "epoch": 3285} {"train_loss": -6.8181328773498535, "global_step": 137996, "epoch": 3285} {"train_loss": -6.616950511932373, "global_step": 137997, "epoch": 3285} {"train_loss": -6.806919574737549, "global_step": 137998, "epoch": 3285} {"train_loss": -6.739934921264648, "global_step": 137999, "epoch": 3285} {"train_loss": -6.77707576751709, "global_step": 138000, "epoch": 3285} {"train_loss": -6.752307891845703, "global_step": 138001, "epoch": 3285} {"train_loss": -6.739822864532471, "global_step": 138002, "epoch": 3285} {"train_loss": -6.673308372497559, "global_step": 138003, "epoch": 3285} {"train_loss": -6.6490678787231445, "global_step": 138004, "epoch": 3285} {"train_loss": -6.5353922843933105, "global_step": 138005, "epoch": 3285} {"train_loss": -6.692879676818848, "global_step": 138006, "epoch": 3285} {"train_loss": -6.699939727783203, "global_step": 138007, "epoch": 3285} {"train_loss": -6.590940952301025, "global_step": 138008, "epoch": 3285} {"train_loss": -6.760468482971191, "global_step": 138009, "epoch": 3285} {"train_loss": -6.677042007446289, "global_step": 138010, "epoch": 3285} {"train_loss": -6.721863042740595, "global_step": 138011, "epoch": 3285, "val_loss": 67144.890625} {"train_loss": -6.782219886779785, "global_step": 138012, "epoch": 3286} {"train_loss": -6.813808441162109, "global_step": 138013, "epoch": 3286} {"train_loss": -6.635280609130859, "global_step": 138014, "epoch": 3286} {"train_loss": -6.689862251281738, "global_step": 138015, "epoch": 3286} {"train_loss": -6.7612409591674805, "global_step": 138016, "epoch": 3286} {"train_loss": -6.641254901885986, "global_step": 138017, "epoch": 3286} {"train_loss": -6.7378644943237305, "global_step": 138018, "epoch": 3286} {"train_loss": -6.635848045349121, "global_step": 138019, "epoch": 3286} {"train_loss": -6.734799385070801, "global_step": 138020, "epoch": 3286} {"train_loss": -6.677486419677734, "global_step": 138021, "epoch": 3286} {"train_loss": -6.742094993591309, "global_step": 138022, "epoch": 3286} {"train_loss": -6.743193626403809, "global_step": 138023, "epoch": 3286} {"train_loss": -6.650123596191406, "global_step": 138024, "epoch": 3286} {"train_loss": -6.696011066436768, "global_step": 138025, "epoch": 3286} {"train_loss": -6.7602949142456055, "global_step": 138026, "epoch": 3286} {"train_loss": -6.7512712478637695, "global_step": 138027, "epoch": 3286} {"train_loss": -6.731310844421387, "global_step": 138028, "epoch": 3286} {"train_loss": -6.846055030822754, "global_step": 138029, "epoch": 3286} {"train_loss": -6.8313093185424805, "global_step": 138030, "epoch": 3286} {"train_loss": -6.776540756225586, "global_step": 138031, "epoch": 3286} {"train_loss": -6.756486892700195, "global_step": 138032, "epoch": 3286} {"train_loss": -6.723969459533691, "global_step": 138033, "epoch": 3286} {"train_loss": -6.784246444702148, "global_step": 138034, "epoch": 3286} {"train_loss": -6.7913336753845215, "global_step": 138035, "epoch": 3286} {"train_loss": -6.788078308105469, "global_step": 138036, "epoch": 3286} {"train_loss": -6.864753723144531, "global_step": 138037, "epoch": 3286} {"train_loss": -6.855563163757324, "global_step": 138038, "epoch": 3286} {"train_loss": -6.761161804199219, "global_step": 138039, "epoch": 3286} {"train_loss": -6.832975387573242, "global_step": 138040, "epoch": 3286} {"train_loss": -6.6350998878479, "global_step": 138041, "epoch": 3286} {"train_loss": -6.875676155090332, "global_step": 138042, "epoch": 3286} {"train_loss": -6.7743072509765625, "global_step": 138043, "epoch": 3286} {"train_loss": -6.841978073120117, "global_step": 138044, "epoch": 3286} {"train_loss": -6.76593017578125, "global_step": 138045, "epoch": 3286} {"train_loss": -6.803027629852295, "global_step": 138046, "epoch": 3286} {"train_loss": -6.736052513122559, "global_step": 138047, "epoch": 3286} {"train_loss": -6.683999538421631, "global_step": 138048, "epoch": 3286} {"train_loss": -6.748407363891602, "global_step": 138049, "epoch": 3286} {"train_loss": -6.693733215332031, "global_step": 138050, "epoch": 3286} {"train_loss": -6.709188461303711, "global_step": 138051, "epoch": 3286} {"train_loss": -6.7718658447265625, "global_step": 138052, "epoch": 3286} {"train_loss": -6.753627561387562, "global_step": 138053, "epoch": 3286, "val_loss": 67248.015625} {"train_loss": -6.831063270568848, "global_step": 138054, "epoch": 3287} {"train_loss": -6.785120964050293, "global_step": 138055, "epoch": 3287} {"train_loss": -6.682345390319824, "global_step": 138056, "epoch": 3287} {"train_loss": -6.709652900695801, "global_step": 138057, "epoch": 3287} {"train_loss": -6.817293167114258, "global_step": 138058, "epoch": 3287} {"train_loss": -6.778914451599121, "global_step": 138059, "epoch": 3287} {"train_loss": -6.673482894897461, "global_step": 138060, "epoch": 3287} {"train_loss": -6.854790210723877, "global_step": 138061, "epoch": 3287} {"train_loss": -6.755929946899414, "global_step": 138062, "epoch": 3287} {"train_loss": -6.767649173736572, "global_step": 138063, "epoch": 3287} {"train_loss": -6.712377071380615, "global_step": 138064, "epoch": 3287} {"train_loss": -6.789679527282715, "global_step": 138065, "epoch": 3287} {"train_loss": -6.722970962524414, "global_step": 138066, "epoch": 3287} {"train_loss": -6.751105785369873, "global_step": 138067, "epoch": 3287} {"train_loss": -6.605445861816406, "global_step": 138068, "epoch": 3287} {"train_loss": -6.764767646789551, "global_step": 138069, "epoch": 3287} {"train_loss": -6.658117771148682, "global_step": 138070, "epoch": 3287} {"train_loss": -6.749501705169678, "global_step": 138071, "epoch": 3287} {"train_loss": -6.667934417724609, "global_step": 138072, "epoch": 3287} {"train_loss": -6.725374698638916, "global_step": 138073, "epoch": 3287} {"train_loss": -6.726807117462158, "global_step": 138074, "epoch": 3287} {"train_loss": -6.670964241027832, "global_step": 138075, "epoch": 3287} {"train_loss": -6.636319160461426, "global_step": 138076, "epoch": 3287} {"train_loss": -6.6645121574401855, "global_step": 138077, "epoch": 3287} {"train_loss": -6.720457077026367, "global_step": 138078, "epoch": 3287} {"train_loss": -6.742112159729004, "global_step": 138079, "epoch": 3287} {"train_loss": -6.6852521896362305, "global_step": 138080, "epoch": 3287} {"train_loss": -6.705718994140625, "global_step": 138081, "epoch": 3287} {"train_loss": -6.6138410568237305, "global_step": 138082, "epoch": 3287} {"train_loss": -6.664158821105957, "global_step": 138083, "epoch": 3287} {"train_loss": -6.602128982543945, "global_step": 138084, "epoch": 3287} {"train_loss": -6.71812629699707, "global_step": 138085, "epoch": 3287} {"train_loss": -6.796958923339844, "global_step": 138086, "epoch": 3287} {"train_loss": -6.69382381439209, "global_step": 138087, "epoch": 3287} {"train_loss": -6.629393577575684, "global_step": 138088, "epoch": 3287} {"train_loss": -6.790410041809082, "global_step": 138089, "epoch": 3287} {"train_loss": -6.693109035491943, "global_step": 138090, "epoch": 3287} {"train_loss": -6.681094169616699, "global_step": 138091, "epoch": 3287} {"train_loss": -6.654056549072266, "global_step": 138092, "epoch": 3287} {"train_loss": -6.65767765045166, "global_step": 138093, "epoch": 3287} {"train_loss": -6.869813919067383, "global_step": 138094, "epoch": 3287} {"train_loss": -6.7212114334106445, "global_step": 138095, "epoch": 3287, "val_loss": 67076.4140625} {"train_loss": -6.669127464294434, "global_step": 138096, "epoch": 3288} {"train_loss": -6.7341413497924805, "global_step": 138097, "epoch": 3288} {"train_loss": -6.761809825897217, "global_step": 138098, "epoch": 3288} {"train_loss": -6.777154922485352, "global_step": 138099, "epoch": 3288} {"train_loss": -6.689547538757324, "global_step": 138100, "epoch": 3288} {"train_loss": -6.6853437423706055, "global_step": 138101, "epoch": 3288} {"train_loss": -6.732150554656982, "global_step": 138102, "epoch": 3288} {"train_loss": -6.713991165161133, "global_step": 138103, "epoch": 3288} {"train_loss": -6.684591770172119, "global_step": 138104, "epoch": 3288} {"train_loss": -6.750098705291748, "global_step": 138105, "epoch": 3288} {"train_loss": -6.77651834487915, "global_step": 138106, "epoch": 3288} {"train_loss": -6.780196666717529, "global_step": 138107, "epoch": 3288} {"train_loss": -6.7017927169799805, "global_step": 138108, "epoch": 3288} {"train_loss": -6.811670780181885, "global_step": 138109, "epoch": 3288} {"train_loss": -6.688471794128418, "global_step": 138110, "epoch": 3288} {"train_loss": -6.739841938018799, "global_step": 138111, "epoch": 3288} {"train_loss": -6.652574062347412, "global_step": 138112, "epoch": 3288} {"train_loss": -6.7180891036987305, "global_step": 138113, "epoch": 3288} {"train_loss": -6.756461143493652, "global_step": 138114, "epoch": 3288} {"train_loss": -6.666201591491699, "global_step": 138115, "epoch": 3288} {"train_loss": -6.69090461730957, "global_step": 138116, "epoch": 3288} {"train_loss": -6.764766216278076, "global_step": 138117, "epoch": 3288} {"train_loss": -6.651297569274902, "global_step": 138118, "epoch": 3288} {"train_loss": -6.721518039703369, "global_step": 138119, "epoch": 3288} {"train_loss": -6.799736022949219, "global_step": 138120, "epoch": 3288} {"train_loss": -6.777065277099609, "global_step": 138121, "epoch": 3288} {"train_loss": -6.678256988525391, "global_step": 138122, "epoch": 3288} {"train_loss": -6.769060134887695, "global_step": 138123, "epoch": 3288} {"train_loss": -6.728275775909424, "global_step": 138124, "epoch": 3288} {"train_loss": -6.734931945800781, "global_step": 138125, "epoch": 3288} {"train_loss": -6.775396347045898, "global_step": 138126, "epoch": 3288} {"train_loss": -6.749053955078125, "global_step": 138127, "epoch": 3288} {"train_loss": -6.675710678100586, "global_step": 138128, "epoch": 3288} {"train_loss": -6.717824935913086, "global_step": 138129, "epoch": 3288} {"train_loss": -6.759737968444824, "global_step": 138130, "epoch": 3288} {"train_loss": -6.72423791885376, "global_step": 138131, "epoch": 3288} {"train_loss": -6.752312660217285, "global_step": 138132, "epoch": 3288} {"train_loss": -6.8245415687561035, "global_step": 138133, "epoch": 3288} {"train_loss": -6.7941131591796875, "global_step": 138134, "epoch": 3288} {"train_loss": -6.698843002319336, "global_step": 138135, "epoch": 3288} {"train_loss": -6.843603134155273, "global_step": 138136, "epoch": 3288} {"train_loss": -6.733763637996855, "global_step": 138137, "epoch": 3288, "val_loss": 67170.375} {"train_loss": -6.816700458526611, "global_step": 138138, "epoch": 3289} {"train_loss": -6.780165672302246, "global_step": 138139, "epoch": 3289} {"train_loss": -6.8044023513793945, "global_step": 138140, "epoch": 3289} {"train_loss": -6.791444778442383, "global_step": 138141, "epoch": 3289} {"train_loss": -6.708662986755371, "global_step": 138142, "epoch": 3289} {"train_loss": -6.719751358032227, "global_step": 138143, "epoch": 3289} {"train_loss": -6.774934768676758, "global_step": 138144, "epoch": 3289} {"train_loss": -6.712573528289795, "global_step": 138145, "epoch": 3289} {"train_loss": -6.795797824859619, "global_step": 138146, "epoch": 3289} {"train_loss": -6.862298965454102, "global_step": 138147, "epoch": 3289} {"train_loss": -6.659503936767578, "global_step": 138148, "epoch": 3289} {"train_loss": -6.778329849243164, "global_step": 138149, "epoch": 3289} {"train_loss": -6.837919235229492, "global_step": 138150, "epoch": 3289} {"train_loss": -6.727395057678223, "global_step": 138151, "epoch": 3289} {"train_loss": -6.630258083343506, "global_step": 138152, "epoch": 3289} {"train_loss": -6.716629981994629, "global_step": 138153, "epoch": 3289} {"train_loss": -6.771651744842529, "global_step": 138154, "epoch": 3289} {"train_loss": -6.655542373657227, "global_step": 138155, "epoch": 3289} {"train_loss": -6.68243932723999, "global_step": 138156, "epoch": 3289} {"train_loss": -6.774632930755615, "global_step": 138157, "epoch": 3289} {"train_loss": -6.591684341430664, "global_step": 138158, "epoch": 3289} {"train_loss": -6.719732761383057, "global_step": 138159, "epoch": 3289} {"train_loss": -6.697113513946533, "global_step": 138160, "epoch": 3289} {"train_loss": -6.800137519836426, "global_step": 138161, "epoch": 3289} {"train_loss": -6.699804306030273, "global_step": 138162, "epoch": 3289} {"train_loss": -6.732470512390137, "global_step": 138163, "epoch": 3289} {"train_loss": -6.797768592834473, "global_step": 138164, "epoch": 3289} {"train_loss": -6.7127461433410645, "global_step": 138165, "epoch": 3289} {"train_loss": -6.760444641113281, "global_step": 138166, "epoch": 3289} {"train_loss": -6.753658294677734, "global_step": 138167, "epoch": 3289} {"train_loss": -6.735689163208008, "global_step": 138168, "epoch": 3289} {"train_loss": -6.613286018371582, "global_step": 138169, "epoch": 3289} {"train_loss": -6.7432355880737305, "global_step": 138170, "epoch": 3289} {"train_loss": -6.785329818725586, "global_step": 138171, "epoch": 3289} {"train_loss": -6.7097063064575195, "global_step": 138172, "epoch": 3289} {"train_loss": -6.782256603240967, "global_step": 138173, "epoch": 3289} {"train_loss": -6.889425754547119, "global_step": 138174, "epoch": 3289} {"train_loss": -6.658876419067383, "global_step": 138175, "epoch": 3289} {"train_loss": -6.6105804443359375, "global_step": 138176, "epoch": 3289} {"train_loss": -6.762885093688965, "global_step": 138177, "epoch": 3289} {"train_loss": -6.707074165344238, "global_step": 138178, "epoch": 3289} {"train_loss": -6.737496126265753, "global_step": 138179, "epoch": 3289, "val_loss": 67142.09375} {"train_loss": -6.769670486450195, "global_step": 138180, "epoch": 3290} {"train_loss": -6.62641716003418, "global_step": 138181, "epoch": 3290} {"train_loss": -6.620827674865723, "global_step": 138182, "epoch": 3290} {"train_loss": -6.664972305297852, "global_step": 138183, "epoch": 3290} {"train_loss": -6.725154876708984, "global_step": 138184, "epoch": 3290} {"train_loss": -6.685131072998047, "global_step": 138185, "epoch": 3290} {"train_loss": -6.569148063659668, "global_step": 138186, "epoch": 3290} {"train_loss": -6.678321838378906, "global_step": 138187, "epoch": 3290} {"train_loss": -6.633885860443115, "global_step": 138188, "epoch": 3290} {"train_loss": -6.659135818481445, "global_step": 138189, "epoch": 3290} {"train_loss": -6.707553863525391, "global_step": 138190, "epoch": 3290} {"train_loss": -6.6959028244018555, "global_step": 138191, "epoch": 3290} {"train_loss": -6.768360137939453, "global_step": 138192, "epoch": 3290} {"train_loss": -6.8228020668029785, "global_step": 138193, "epoch": 3290} {"train_loss": -6.763354778289795, "global_step": 138194, "epoch": 3290} {"train_loss": -6.721584796905518, "global_step": 138195, "epoch": 3290} {"train_loss": -6.704374313354492, "global_step": 138196, "epoch": 3290} {"train_loss": -6.645698547363281, "global_step": 138197, "epoch": 3290} {"train_loss": -6.711202621459961, "global_step": 138198, "epoch": 3290} {"train_loss": -6.599268913269043, "global_step": 138199, "epoch": 3290} {"train_loss": -6.686591148376465, "global_step": 138200, "epoch": 3290} {"train_loss": -6.562370300292969, "global_step": 138201, "epoch": 3290} {"train_loss": -6.788642406463623, "global_step": 138202, "epoch": 3290} {"train_loss": -6.796677589416504, "global_step": 138203, "epoch": 3290} {"train_loss": -6.715188026428223, "global_step": 138204, "epoch": 3290} {"train_loss": -6.725013732910156, "global_step": 138205, "epoch": 3290} {"train_loss": -6.771579265594482, "global_step": 138206, "epoch": 3290} {"train_loss": -6.768772125244141, "global_step": 138207, "epoch": 3290} {"train_loss": -6.706837177276611, "global_step": 138208, "epoch": 3290} {"train_loss": -6.821240425109863, "global_step": 138209, "epoch": 3290} {"train_loss": -6.740320682525635, "global_step": 138210, "epoch": 3290} {"train_loss": -6.769466400146484, "global_step": 138211, "epoch": 3290} {"train_loss": -6.766293048858643, "global_step": 138212, "epoch": 3290} {"train_loss": -6.689427852630615, "global_step": 138213, "epoch": 3290} {"train_loss": -6.765499114990234, "global_step": 138214, "epoch": 3290} {"train_loss": -6.778332710266113, "global_step": 138215, "epoch": 3290} {"train_loss": -6.795477390289307, "global_step": 138216, "epoch": 3290} {"train_loss": -6.789252281188965, "global_step": 138217, "epoch": 3290} {"train_loss": -6.684492111206055, "global_step": 138218, "epoch": 3290} {"train_loss": -6.854336738586426, "global_step": 138219, "epoch": 3290} {"train_loss": -6.676828384399414, "global_step": 138220, "epoch": 3290} {"train_loss": -6.719617128372192, "global_step": 138221, "epoch": 3290, "val_loss": 67091.8203125} {"train_loss": -6.720952033996582, "global_step": 138222, "epoch": 3291} {"train_loss": -6.7093892097473145, "global_step": 138223, "epoch": 3291} {"train_loss": -6.693027496337891, "global_step": 138224, "epoch": 3291} {"train_loss": -6.691683769226074, "global_step": 138225, "epoch": 3291} {"train_loss": -6.780897617340088, "global_step": 138226, "epoch": 3291} {"train_loss": -6.758237838745117, "global_step": 138227, "epoch": 3291} {"train_loss": -6.776777267456055, "global_step": 138228, "epoch": 3291} {"train_loss": -6.981292247772217, "global_step": 138229, "epoch": 3291} {"train_loss": -6.76634407043457, "global_step": 138230, "epoch": 3291} {"train_loss": -6.6227617263793945, "global_step": 138231, "epoch": 3291} {"train_loss": -6.738778591156006, "global_step": 138232, "epoch": 3291} {"train_loss": -6.7679290771484375, "global_step": 138233, "epoch": 3291} {"train_loss": -6.715422630310059, "global_step": 138234, "epoch": 3291} {"train_loss": -6.662548065185547, "global_step": 138235, "epoch": 3291} {"train_loss": -6.56843376159668, "global_step": 138236, "epoch": 3291} {"train_loss": -6.769417762756348, "global_step": 138237, "epoch": 3291} {"train_loss": -6.794830799102783, "global_step": 138238, "epoch": 3291} {"train_loss": -6.819213390350342, "global_step": 138239, "epoch": 3291} {"train_loss": -6.620073318481445, "global_step": 138240, "epoch": 3291} {"train_loss": -6.843340873718262, "global_step": 138241, "epoch": 3291} {"train_loss": -6.7624053955078125, "global_step": 138242, "epoch": 3291} {"train_loss": -6.773225784301758, "global_step": 138243, "epoch": 3291} {"train_loss": -6.716892242431641, "global_step": 138244, "epoch": 3291} {"train_loss": -6.569792747497559, "global_step": 138245, "epoch": 3291} {"train_loss": -6.756094455718994, "global_step": 138246, "epoch": 3291} {"train_loss": -6.790765762329102, "global_step": 138247, "epoch": 3291} {"train_loss": -6.728340148925781, "global_step": 138248, "epoch": 3291} {"train_loss": -6.714598178863525, "global_step": 138249, "epoch": 3291} {"train_loss": -6.774344444274902, "global_step": 138250, "epoch": 3291} {"train_loss": -6.690942287445068, "global_step": 138251, "epoch": 3291} {"train_loss": -6.803187370300293, "global_step": 138252, "epoch": 3291} {"train_loss": -6.778276443481445, "global_step": 138253, "epoch": 3291} {"train_loss": -6.895357608795166, "global_step": 138254, "epoch": 3291} {"train_loss": -6.692865371704102, "global_step": 138255, "epoch": 3291} {"train_loss": -6.770987510681152, "global_step": 138256, "epoch": 3291} {"train_loss": -6.670681476593018, "global_step": 138257, "epoch": 3291} {"train_loss": -6.641271591186523, "global_step": 138258, "epoch": 3291} {"train_loss": -6.739099502563477, "global_step": 138259, "epoch": 3291} {"train_loss": -6.601067066192627, "global_step": 138260, "epoch": 3291} {"train_loss": -6.7496161460876465, "global_step": 138261, "epoch": 3291} {"train_loss": -6.804539680480957, "global_step": 138262, "epoch": 3291} {"train_loss": -6.73819789432344, "global_step": 138263, "epoch": 3291, "val_loss": 67245.359375} {"train_loss": -6.784714698791504, "global_step": 138264, "epoch": 3292} {"train_loss": -6.641216278076172, "global_step": 138265, "epoch": 3292} {"train_loss": -6.665897369384766, "global_step": 138266, "epoch": 3292} {"train_loss": -6.736008644104004, "global_step": 138267, "epoch": 3292} {"train_loss": -6.648029327392578, "global_step": 138268, "epoch": 3292} {"train_loss": -6.744224548339844, "global_step": 138269, "epoch": 3292} {"train_loss": -6.729478359222412, "global_step": 138270, "epoch": 3292} {"train_loss": -6.672823905944824, "global_step": 138271, "epoch": 3292} {"train_loss": -6.685054302215576, "global_step": 138272, "epoch": 3292} {"train_loss": -6.7524309158325195, "global_step": 138273, "epoch": 3292} {"train_loss": -6.771452903747559, "global_step": 138274, "epoch": 3292} {"train_loss": -6.714820861816406, "global_step": 138275, "epoch": 3292} {"train_loss": -6.76866340637207, "global_step": 138276, "epoch": 3292} {"train_loss": -6.566571235656738, "global_step": 138277, "epoch": 3292} {"train_loss": -6.773149490356445, "global_step": 138278, "epoch": 3292} {"train_loss": -6.698906421661377, "global_step": 138279, "epoch": 3292} {"train_loss": -6.692616939544678, "global_step": 138280, "epoch": 3292} {"train_loss": -6.729608058929443, "global_step": 138281, "epoch": 3292} {"train_loss": -6.663717269897461, "global_step": 138282, "epoch": 3292} {"train_loss": -6.724831581115723, "global_step": 138283, "epoch": 3292} {"train_loss": -6.72524356842041, "global_step": 138284, "epoch": 3292} {"train_loss": -6.669368743896484, "global_step": 138285, "epoch": 3292} {"train_loss": -6.744621276855469, "global_step": 138286, "epoch": 3292} {"train_loss": -6.712460994720459, "global_step": 138287, "epoch": 3292} {"train_loss": -6.9005584716796875, "global_step": 138288, "epoch": 3292} {"train_loss": -6.825436592102051, "global_step": 138289, "epoch": 3292} {"train_loss": -6.699549674987793, "global_step": 138290, "epoch": 3292} {"train_loss": -6.785782814025879, "global_step": 138291, "epoch": 3292} {"train_loss": -6.718626976013184, "global_step": 138292, "epoch": 3292} {"train_loss": -6.652748107910156, "global_step": 138293, "epoch": 3292} {"train_loss": -6.68964958190918, "global_step": 138294, "epoch": 3292} {"train_loss": -6.801628112792969, "global_step": 138295, "epoch": 3292} {"train_loss": -6.777135372161865, "global_step": 138296, "epoch": 3292} {"train_loss": -6.770243167877197, "global_step": 138297, "epoch": 3292} {"train_loss": -6.835737228393555, "global_step": 138298, "epoch": 3292} {"train_loss": -6.870935440063477, "global_step": 138299, "epoch": 3292} {"train_loss": -6.729386329650879, "global_step": 138300, "epoch": 3292} {"train_loss": -6.788015365600586, "global_step": 138301, "epoch": 3292} {"train_loss": -6.87202787399292, "global_step": 138302, "epoch": 3292} {"train_loss": -6.779401779174805, "global_step": 138303, "epoch": 3292} {"train_loss": -6.776636123657227, "global_step": 138304, "epoch": 3292} {"train_loss": -6.738431272052583, "global_step": 138305, "epoch": 3292, "val_loss": 67241.0} {"train_loss": -6.755403995513916, "global_step": 138306, "epoch": 3293} {"train_loss": -6.878471374511719, "global_step": 138307, "epoch": 3293} {"train_loss": -6.776234149932861, "global_step": 138308, "epoch": 3293} {"train_loss": -6.832952976226807, "global_step": 138309, "epoch": 3293} {"train_loss": -6.730252265930176, "global_step": 138310, "epoch": 3293} {"train_loss": -6.770282745361328, "global_step": 138311, "epoch": 3293} {"train_loss": -6.83039665222168, "global_step": 138312, "epoch": 3293} {"train_loss": -6.83510160446167, "global_step": 138313, "epoch": 3293} {"train_loss": -6.813084602355957, "global_step": 138314, "epoch": 3293} {"train_loss": -6.838571548461914, "global_step": 138315, "epoch": 3293} {"train_loss": -6.772315979003906, "global_step": 138316, "epoch": 3293} {"train_loss": -6.740203857421875, "global_step": 138317, "epoch": 3293} {"train_loss": -6.720361709594727, "global_step": 138318, "epoch": 3293} {"train_loss": -6.7336344718933105, "global_step": 138319, "epoch": 3293} {"train_loss": -6.766865253448486, "global_step": 138320, "epoch": 3293} {"train_loss": -6.746649742126465, "global_step": 138321, "epoch": 3293} {"train_loss": -6.802314758300781, "global_step": 138322, "epoch": 3293} {"train_loss": -6.7884087562561035, "global_step": 138323, "epoch": 3293} {"train_loss": -6.906827926635742, "global_step": 138324, "epoch": 3293} {"train_loss": -6.832489013671875, "global_step": 138325, "epoch": 3293} {"train_loss": -6.8086771965026855, "global_step": 138326, "epoch": 3293} {"train_loss": -6.790792465209961, "global_step": 138327, "epoch": 3293} {"train_loss": -6.797613143920898, "global_step": 138328, "epoch": 3293} {"train_loss": -6.773210525512695, "global_step": 138329, "epoch": 3293} {"train_loss": -6.782090187072754, "global_step": 138330, "epoch": 3293} {"train_loss": -6.668905258178711, "global_step": 138331, "epoch": 3293} {"train_loss": -6.861083507537842, "global_step": 138332, "epoch": 3293} {"train_loss": -6.721747875213623, "global_step": 138333, "epoch": 3293} {"train_loss": -6.792026042938232, "global_step": 138334, "epoch": 3293} {"train_loss": -6.613544464111328, "global_step": 138335, "epoch": 3293} {"train_loss": -6.774248123168945, "global_step": 138336, "epoch": 3293} {"train_loss": -6.815232276916504, "global_step": 138337, "epoch": 3293} {"train_loss": -6.587267875671387, "global_step": 138338, "epoch": 3293} {"train_loss": -6.752063751220703, "global_step": 138339, "epoch": 3293} {"train_loss": -6.854556083679199, "global_step": 138340, "epoch": 3293} {"train_loss": -6.674800872802734, "global_step": 138341, "epoch": 3293} {"train_loss": -6.840056896209717, "global_step": 138342, "epoch": 3293} {"train_loss": -6.639429092407227, "global_step": 138343, "epoch": 3293} {"train_loss": -6.630565643310547, "global_step": 138344, "epoch": 3293} {"train_loss": -6.702195167541504, "global_step": 138345, "epoch": 3293} {"train_loss": -6.696089744567871, "global_step": 138346, "epoch": 3293} {"train_loss": -6.768610227675665, "global_step": 138347, "epoch": 3293, "val_loss": 67142.7890625} {"train_loss": -6.81694221496582, "global_step": 138348, "epoch": 3294} {"train_loss": -6.750023365020752, "global_step": 138349, "epoch": 3294} {"train_loss": -6.636452674865723, "global_step": 138350, "epoch": 3294} {"train_loss": -6.727403163909912, "global_step": 138351, "epoch": 3294} {"train_loss": -6.745990753173828, "global_step": 138352, "epoch": 3294} {"train_loss": -6.675841331481934, "global_step": 138353, "epoch": 3294} {"train_loss": -6.838804244995117, "global_step": 138354, "epoch": 3294} {"train_loss": -6.771975994110107, "global_step": 138355, "epoch": 3294} {"train_loss": -6.623989105224609, "global_step": 138356, "epoch": 3294} {"train_loss": -6.771012306213379, "global_step": 138357, "epoch": 3294} {"train_loss": -6.674151420593262, "global_step": 138358, "epoch": 3294} {"train_loss": -6.757446765899658, "global_step": 138359, "epoch": 3294} {"train_loss": -6.754505634307861, "global_step": 138360, "epoch": 3294} {"train_loss": -6.688951015472412, "global_step": 138361, "epoch": 3294} {"train_loss": -6.724822044372559, "global_step": 138362, "epoch": 3294} {"train_loss": -6.692134857177734, "global_step": 138363, "epoch": 3294} {"train_loss": -6.806626796722412, "global_step": 138364, "epoch": 3294} {"train_loss": -6.7232537269592285, "global_step": 138365, "epoch": 3294} {"train_loss": -6.794482707977295, "global_step": 138366, "epoch": 3294} {"train_loss": -6.746979713439941, "global_step": 138367, "epoch": 3294} {"train_loss": -6.775012969970703, "global_step": 138368, "epoch": 3294} {"train_loss": -6.825457572937012, "global_step": 138369, "epoch": 3294} {"train_loss": -6.760228157043457, "global_step": 138370, "epoch": 3294} {"train_loss": -6.664176940917969, "global_step": 138371, "epoch": 3294} {"train_loss": -6.720564842224121, "global_step": 138372, "epoch": 3294} {"train_loss": -6.777933597564697, "global_step": 138373, "epoch": 3294} {"train_loss": -6.797296524047852, "global_step": 138374, "epoch": 3294} {"train_loss": -6.733780384063721, "global_step": 138375, "epoch": 3294} {"train_loss": -6.775674819946289, "global_step": 138376, "epoch": 3294} {"train_loss": -6.823686599731445, "global_step": 138377, "epoch": 3294} {"train_loss": -6.823616981506348, "global_step": 138378, "epoch": 3294} {"train_loss": -6.753375053405762, "global_step": 138379, "epoch": 3294} {"train_loss": -6.693488121032715, "global_step": 138380, "epoch": 3294} {"train_loss": -6.764819145202637, "global_step": 138381, "epoch": 3294} {"train_loss": -6.673464775085449, "global_step": 138382, "epoch": 3294} {"train_loss": -6.671550750732422, "global_step": 138383, "epoch": 3294} {"train_loss": -6.744930744171143, "global_step": 138384, "epoch": 3294} {"train_loss": -6.60389518737793, "global_step": 138385, "epoch": 3294} {"train_loss": -6.694879531860352, "global_step": 138386, "epoch": 3294} {"train_loss": -6.591712951660156, "global_step": 138387, "epoch": 3294} {"train_loss": -6.682791233062744, "global_step": 138388, "epoch": 3294} {"train_loss": -6.731507221857707, "global_step": 138389, "epoch": 3294, "val_loss": 67066.7734375} {"train_loss": -6.639753341674805, "global_step": 138390, "epoch": 3295} {"train_loss": -6.656819820404053, "global_step": 138391, "epoch": 3295} {"train_loss": -6.777006149291992, "global_step": 138392, "epoch": 3295} {"train_loss": -6.588620185852051, "global_step": 138393, "epoch": 3295} {"train_loss": -6.5753254890441895, "global_step": 138394, "epoch": 3295} {"train_loss": -6.631322383880615, "global_step": 138395, "epoch": 3295} {"train_loss": -6.689396858215332, "global_step": 138396, "epoch": 3295} {"train_loss": -6.618956565856934, "global_step": 138397, "epoch": 3295} {"train_loss": -6.644969940185547, "global_step": 138398, "epoch": 3295} {"train_loss": -6.7002973556518555, "global_step": 138399, "epoch": 3295} {"train_loss": -6.63284158706665, "global_step": 138400, "epoch": 3295} {"train_loss": -6.77541446685791, "global_step": 138401, "epoch": 3295} {"train_loss": -6.480564117431641, "global_step": 138402, "epoch": 3295} {"train_loss": -6.732872486114502, "global_step": 138403, "epoch": 3295} {"train_loss": -6.669837951660156, "global_step": 138404, "epoch": 3295} {"train_loss": -6.734744548797607, "global_step": 138405, "epoch": 3295} {"train_loss": -6.662289619445801, "global_step": 138406, "epoch": 3295} {"train_loss": -6.747541904449463, "global_step": 138407, "epoch": 3295} {"train_loss": -6.657651424407959, "global_step": 138408, "epoch": 3295} {"train_loss": -6.651388168334961, "global_step": 138409, "epoch": 3295} {"train_loss": -6.782471179962158, "global_step": 138410, "epoch": 3295} {"train_loss": -6.719925880432129, "global_step": 138411, "epoch": 3295} {"train_loss": -6.653827667236328, "global_step": 138412, "epoch": 3295} {"train_loss": -6.828865051269531, "global_step": 138413, "epoch": 3295} {"train_loss": -6.695279121398926, "global_step": 138414, "epoch": 3295} {"train_loss": -6.689863204956055, "global_step": 138415, "epoch": 3295} {"train_loss": -6.619589805603027, "global_step": 138416, "epoch": 3295} {"train_loss": -6.732534408569336, "global_step": 138417, "epoch": 3295} {"train_loss": -6.683897972106934, "global_step": 138418, "epoch": 3295} {"train_loss": -6.728909492492676, "global_step": 138419, "epoch": 3295} {"train_loss": -6.80139684677124, "global_step": 138420, "epoch": 3295} {"train_loss": -6.747808456420898, "global_step": 138421, "epoch": 3295} {"train_loss": -6.727788925170898, "global_step": 138422, "epoch": 3295} {"train_loss": -6.841988563537598, "global_step": 138423, "epoch": 3295} {"train_loss": -6.834199905395508, "global_step": 138424, "epoch": 3295} {"train_loss": -6.865781784057617, "global_step": 138425, "epoch": 3295} {"train_loss": -6.807624816894531, "global_step": 138426, "epoch": 3295} {"train_loss": -6.746567726135254, "global_step": 138427, "epoch": 3295} {"train_loss": -6.824767112731934, "global_step": 138428, "epoch": 3295} {"train_loss": -6.903202056884766, "global_step": 138429, "epoch": 3295} {"train_loss": -6.821622848510742, "global_step": 138430, "epoch": 3295} {"train_loss": -6.718628792535691, "global_step": 138431, "epoch": 3295, "val_loss": 67115.1875} {"train_loss": -6.817132949829102, "global_step": 138432, "epoch": 3296} {"train_loss": -6.768194198608398, "global_step": 138433, "epoch": 3296} {"train_loss": -6.749786376953125, "global_step": 138434, "epoch": 3296} {"train_loss": -6.772270202636719, "global_step": 138435, "epoch": 3296} {"train_loss": -6.7291107177734375, "global_step": 138436, "epoch": 3296} {"train_loss": -6.769785404205322, "global_step": 138437, "epoch": 3296} {"train_loss": -6.785521507263184, "global_step": 138438, "epoch": 3296} {"train_loss": -6.751515865325928, "global_step": 138439, "epoch": 3296} {"train_loss": -6.708807945251465, "global_step": 138440, "epoch": 3296} {"train_loss": -6.740518569946289, "global_step": 138441, "epoch": 3296} {"train_loss": -6.63712739944458, "global_step": 138442, "epoch": 3296} {"train_loss": -6.866765975952148, "global_step": 138443, "epoch": 3296} {"train_loss": -6.634655952453613, "global_step": 138444, "epoch": 3296} {"train_loss": -6.717763900756836, "global_step": 138445, "epoch": 3296} {"train_loss": -6.862316608428955, "global_step": 138446, "epoch": 3296} {"train_loss": -6.689373016357422, "global_step": 138447, "epoch": 3296} {"train_loss": -6.759016036987305, "global_step": 138448, "epoch": 3296} {"train_loss": -6.715385437011719, "global_step": 138449, "epoch": 3296} {"train_loss": -6.74734354019165, "global_step": 138450, "epoch": 3296} {"train_loss": -6.751195907592773, "global_step": 138451, "epoch": 3296} {"train_loss": -6.612126350402832, "global_step": 138452, "epoch": 3296} {"train_loss": -6.774115562438965, "global_step": 138453, "epoch": 3296} {"train_loss": -6.681794166564941, "global_step": 138454, "epoch": 3296} {"train_loss": -6.641223907470703, "global_step": 138455, "epoch": 3296} {"train_loss": -6.757154941558838, "global_step": 138456, "epoch": 3296} {"train_loss": -6.74969482421875, "global_step": 138457, "epoch": 3296} {"train_loss": -6.694342613220215, "global_step": 138458, "epoch": 3296} {"train_loss": -6.687575340270996, "global_step": 138459, "epoch": 3296} {"train_loss": -6.799818992614746, "global_step": 138460, "epoch": 3296} {"train_loss": -6.796000003814697, "global_step": 138461, "epoch": 3296} {"train_loss": -6.910053730010986, "global_step": 138462, "epoch": 3296} {"train_loss": -6.715526103973389, "global_step": 138463, "epoch": 3296} {"train_loss": -6.769162654876709, "global_step": 138464, "epoch": 3296} {"train_loss": -6.701812744140625, "global_step": 138465, "epoch": 3296} {"train_loss": -6.711252212524414, "global_step": 138466, "epoch": 3296} {"train_loss": -6.667019844055176, "global_step": 138467, "epoch": 3296} {"train_loss": -6.764195442199707, "global_step": 138468, "epoch": 3296} {"train_loss": -6.735445022583008, "global_step": 138469, "epoch": 3296} {"train_loss": -6.655569553375244, "global_step": 138470, "epoch": 3296} {"train_loss": -6.814436912536621, "global_step": 138471, "epoch": 3296} {"train_loss": -6.681876182556152, "global_step": 138472, "epoch": 3296} {"train_loss": -6.741897594361078, "global_step": 138473, "epoch": 3296, "val_loss": 67153.0546875} {"train_loss": -6.7973785400390625, "global_step": 138474, "epoch": 3297} {"train_loss": -6.692656517028809, "global_step": 138475, "epoch": 3297} {"train_loss": -6.746018409729004, "global_step": 138476, "epoch": 3297} {"train_loss": -6.745099067687988, "global_step": 138477, "epoch": 3297} {"train_loss": -6.720916748046875, "global_step": 138478, "epoch": 3297} {"train_loss": -6.724412441253662, "global_step": 138479, "epoch": 3297} {"train_loss": -6.723772048950195, "global_step": 138480, "epoch": 3297} {"train_loss": -6.748752117156982, "global_step": 138481, "epoch": 3297} {"train_loss": -6.699122905731201, "global_step": 138482, "epoch": 3297} {"train_loss": -6.734988212585449, "global_step": 138483, "epoch": 3297} {"train_loss": -6.735725402832031, "global_step": 138484, "epoch": 3297} {"train_loss": -6.667595863342285, "global_step": 138485, "epoch": 3297} {"train_loss": -6.628791809082031, "global_step": 138486, "epoch": 3297} {"train_loss": -6.758040428161621, "global_step": 138487, "epoch": 3297} {"train_loss": -6.629460334777832, "global_step": 138488, "epoch": 3297} {"train_loss": -6.608270168304443, "global_step": 138489, "epoch": 3297} {"train_loss": -6.733663558959961, "global_step": 138490, "epoch": 3297} {"train_loss": -6.568901062011719, "global_step": 138491, "epoch": 3297} {"train_loss": -6.675622940063477, "global_step": 138492, "epoch": 3297} {"train_loss": -6.791542053222656, "global_step": 138493, "epoch": 3297} {"train_loss": -6.531549453735352, "global_step": 138494, "epoch": 3297} {"train_loss": -6.581406593322754, "global_step": 138495, "epoch": 3297} {"train_loss": -6.712039470672607, "global_step": 138496, "epoch": 3297} {"train_loss": -6.476247310638428, "global_step": 138497, "epoch": 3297} {"train_loss": -6.663210868835449, "global_step": 138498, "epoch": 3297} {"train_loss": -6.786779880523682, "global_step": 138499, "epoch": 3297} {"train_loss": -6.614109039306641, "global_step": 138500, "epoch": 3297} {"train_loss": -6.774015426635742, "global_step": 138501, "epoch": 3297} {"train_loss": -6.683823585510254, "global_step": 138502, "epoch": 3297} {"train_loss": -6.676694869995117, "global_step": 138503, "epoch": 3297} {"train_loss": -6.800923824310303, "global_step": 138504, "epoch": 3297} {"train_loss": -6.677536964416504, "global_step": 138505, "epoch": 3297} {"train_loss": -6.705557346343994, "global_step": 138506, "epoch": 3297} {"train_loss": -6.736210346221924, "global_step": 138507, "epoch": 3297} {"train_loss": -6.631610870361328, "global_step": 138508, "epoch": 3297} {"train_loss": -6.857098579406738, "global_step": 138509, "epoch": 3297} {"train_loss": -6.806570053100586, "global_step": 138510, "epoch": 3297} {"train_loss": -6.650282859802246, "global_step": 138511, "epoch": 3297} {"train_loss": -6.620695114135742, "global_step": 138512, "epoch": 3297} {"train_loss": -6.754270553588867, "global_step": 138513, "epoch": 3297} {"train_loss": -6.787830352783203, "global_step": 138514, "epoch": 3297} {"train_loss": -6.699652694520497, "global_step": 138515, "epoch": 3297, "val_loss": 67007.359375} {"train_loss": -6.767943382263184, "global_step": 138516, "epoch": 3298} {"train_loss": -6.751399993896484, "global_step": 138517, "epoch": 3298} {"train_loss": -6.7529616355896, "global_step": 138518, "epoch": 3298} {"train_loss": -6.756363868713379, "global_step": 138519, "epoch": 3298} {"train_loss": -6.807807445526123, "global_step": 138520, "epoch": 3298} {"train_loss": -6.746647834777832, "global_step": 138521, "epoch": 3298} {"train_loss": -6.803561210632324, "global_step": 138522, "epoch": 3298} {"train_loss": -6.80052375793457, "global_step": 138523, "epoch": 3298} {"train_loss": -6.763333320617676, "global_step": 138524, "epoch": 3298} {"train_loss": -6.835807800292969, "global_step": 138525, "epoch": 3298} {"train_loss": -6.7243146896362305, "global_step": 138526, "epoch": 3298} {"train_loss": -6.7282233238220215, "global_step": 138527, "epoch": 3298} {"train_loss": -6.845407009124756, "global_step": 138528, "epoch": 3298} {"train_loss": -6.787002086639404, "global_step": 138529, "epoch": 3298} {"train_loss": -6.729341506958008, "global_step": 138530, "epoch": 3298} {"train_loss": -6.783236503601074, "global_step": 138531, "epoch": 3298} {"train_loss": -6.696855068206787, "global_step": 138532, "epoch": 3298} {"train_loss": -6.830255508422852, "global_step": 138533, "epoch": 3298} {"train_loss": -6.776083469390869, "global_step": 138534, "epoch": 3298} {"train_loss": -6.770168304443359, "global_step": 138535, "epoch": 3298} {"train_loss": -6.759443283081055, "global_step": 138536, "epoch": 3298} {"train_loss": -6.829543113708496, "global_step": 138537, "epoch": 3298} {"train_loss": -6.752993106842041, "global_step": 138538, "epoch": 3298} {"train_loss": -6.858277320861816, "global_step": 138539, "epoch": 3298} {"train_loss": -6.842220783233643, "global_step": 138540, "epoch": 3298} {"train_loss": -6.768699645996094, "global_step": 138541, "epoch": 3298} {"train_loss": -6.746760368347168, "global_step": 138542, "epoch": 3298} {"train_loss": -6.799523830413818, "global_step": 138543, "epoch": 3298} {"train_loss": -6.7739386558532715, "global_step": 138544, "epoch": 3298} {"train_loss": -6.807257652282715, "global_step": 138545, "epoch": 3298} {"train_loss": -6.822059631347656, "global_step": 138546, "epoch": 3298} {"train_loss": -6.754982948303223, "global_step": 138547, "epoch": 3298} {"train_loss": -6.747013092041016, "global_step": 138548, "epoch": 3298} {"train_loss": -6.702558517456055, "global_step": 138549, "epoch": 3298} {"train_loss": -6.767041206359863, "global_step": 138550, "epoch": 3298} {"train_loss": -6.855498313903809, "global_step": 138551, "epoch": 3298} {"train_loss": -6.802639484405518, "global_step": 138552, "epoch": 3298} {"train_loss": -6.733555793762207, "global_step": 138553, "epoch": 3298} {"train_loss": -6.738064765930176, "global_step": 138554, "epoch": 3298} {"train_loss": -6.844504356384277, "global_step": 138555, "epoch": 3298} {"train_loss": -6.877044200897217, "global_step": 138556, "epoch": 3298} {"train_loss": -6.780445700600033, "global_step": 138557, "epoch": 3298, "val_loss": 67139.390625} {"train_loss": -6.813781261444092, "global_step": 138558, "epoch": 3299} {"train_loss": -6.858875274658203, "global_step": 138559, "epoch": 3299} {"train_loss": -6.799226760864258, "global_step": 138560, "epoch": 3299} {"train_loss": -6.657670021057129, "global_step": 138561, "epoch": 3299} {"train_loss": -6.617665767669678, "global_step": 138562, "epoch": 3299} {"train_loss": -6.732935905456543, "global_step": 138563, "epoch": 3299} {"train_loss": -6.775896072387695, "global_step": 138564, "epoch": 3299} {"train_loss": -6.634774684906006, "global_step": 138565, "epoch": 3299} {"train_loss": -6.730036735534668, "global_step": 138566, "epoch": 3299} {"train_loss": -6.776318550109863, "global_step": 138567, "epoch": 3299} {"train_loss": -6.605736255645752, "global_step": 138568, "epoch": 3299} {"train_loss": -6.67012882232666, "global_step": 138569, "epoch": 3299} {"train_loss": -6.633540153503418, "global_step": 138570, "epoch": 3299} {"train_loss": -6.634781837463379, "global_step": 138571, "epoch": 3299} {"train_loss": -6.6645050048828125, "global_step": 138572, "epoch": 3299} {"train_loss": -6.666975021362305, "global_step": 138573, "epoch": 3299} {"train_loss": -6.7449259757995605, "global_step": 138574, "epoch": 3299} {"train_loss": -6.584994316101074, "global_step": 138575, "epoch": 3299} {"train_loss": -6.719415664672852, "global_step": 138576, "epoch": 3299} {"train_loss": -6.618755340576172, "global_step": 138577, "epoch": 3299} {"train_loss": -6.718610763549805, "global_step": 138578, "epoch": 3299} {"train_loss": -6.595054626464844, "global_step": 138579, "epoch": 3299} {"train_loss": -6.620026111602783, "global_step": 138580, "epoch": 3299} {"train_loss": -6.64012336730957, "global_step": 138581, "epoch": 3299} {"train_loss": -6.539100646972656, "global_step": 138582, "epoch": 3299} {"train_loss": -6.679296016693115, "global_step": 138583, "epoch": 3299} {"train_loss": -6.635465621948242, "global_step": 138584, "epoch": 3299} {"train_loss": -6.56838846206665, "global_step": 138585, "epoch": 3299} {"train_loss": -6.593804359436035, "global_step": 138586, "epoch": 3299} {"train_loss": -6.598547458648682, "global_step": 138587, "epoch": 3299} {"train_loss": -6.64040470123291, "global_step": 138588, "epoch": 3299} {"train_loss": -6.697310447692871, "global_step": 138589, "epoch": 3299} {"train_loss": -6.598263740539551, "global_step": 138590, "epoch": 3299} {"train_loss": -6.517437934875488, "global_step": 138591, "epoch": 3299} {"train_loss": -6.604409217834473, "global_step": 138592, "epoch": 3299} {"train_loss": -6.640233993530273, "global_step": 138593, "epoch": 3299} {"train_loss": -6.522706031799316, "global_step": 138594, "epoch": 3299} {"train_loss": -6.643405914306641, "global_step": 138595, "epoch": 3299} {"train_loss": -6.454085350036621, "global_step": 138596, "epoch": 3299} {"train_loss": -6.617692947387695, "global_step": 138597, "epoch": 3299} {"train_loss": -6.680917263031006, "global_step": 138598, "epoch": 3299} {"train_loss": -6.653323162169683, "global_step": 138599, "epoch": 3299, "val_loss": 67016.984375} {"train_loss": -6.650443077087402, "global_step": 138600, "epoch": 3300} {"train_loss": -6.760701656341553, "global_step": 138601, "epoch": 3300} {"train_loss": -6.674715995788574, "global_step": 138602, "epoch": 3300} {"train_loss": -6.652928829193115, "global_step": 138603, "epoch": 3300} {"train_loss": -6.742622375488281, "global_step": 138604, "epoch": 3300} {"train_loss": -6.7728776931762695, "global_step": 138605, "epoch": 3300} {"train_loss": -6.696147441864014, "global_step": 138606, "epoch": 3300} {"train_loss": -6.680905342102051, "global_step": 138607, "epoch": 3300} {"train_loss": -6.644336700439453, "global_step": 138608, "epoch": 3300} {"train_loss": -6.650972843170166, "global_step": 138609, "epoch": 3300} {"train_loss": -6.727175712585449, "global_step": 138610, "epoch": 3300} {"train_loss": -6.720181465148926, "global_step": 138611, "epoch": 3300} {"train_loss": -6.710129737854004, "global_step": 138612, "epoch": 3300} {"train_loss": -6.775977611541748, "global_step": 138613, "epoch": 3300} {"train_loss": -6.7532548904418945, "global_step": 138614, "epoch": 3300} {"train_loss": -6.678927421569824, "global_step": 138615, "epoch": 3300} {"train_loss": -6.84759521484375, "global_step": 138616, "epoch": 3300} {"train_loss": -6.824239730834961, "global_step": 138617, "epoch": 3300} {"train_loss": -6.786332130432129, "global_step": 138618, "epoch": 3300} {"train_loss": -6.7819743156433105, "global_step": 138619, "epoch": 3300} {"train_loss": -6.737921237945557, "global_step": 138620, "epoch": 3300} {"train_loss": -6.844882965087891, "global_step": 138621, "epoch": 3300} {"train_loss": -6.775567054748535, "global_step": 138622, "epoch": 3300} {"train_loss": -6.8586506843566895, "global_step": 138623, "epoch": 3300} {"train_loss": -6.744316101074219, "global_step": 138624, "epoch": 3300} {"train_loss": -6.810628414154053, "global_step": 138625, "epoch": 3300} {"train_loss": -6.853736400604248, "global_step": 138626, "epoch": 3300} {"train_loss": -6.7889509201049805, "global_step": 138627, "epoch": 3300} {"train_loss": -6.61568021774292, "global_step": 138628, "epoch": 3300} {"train_loss": -6.801909446716309, "global_step": 138629, "epoch": 3300} {"train_loss": -6.643756866455078, "global_step": 138630, "epoch": 3300} {"train_loss": -6.830574035644531, "global_step": 138631, "epoch": 3300} {"train_loss": -6.772854804992676, "global_step": 138632, "epoch": 3300} {"train_loss": -6.723211288452148, "global_step": 138633, "epoch": 3300} {"train_loss": -6.777284622192383, "global_step": 138634, "epoch": 3300} {"train_loss": -6.75639009475708, "global_step": 138635, "epoch": 3300} {"train_loss": -6.740636825561523, "global_step": 138636, "epoch": 3300} {"train_loss": -6.788372993469238, "global_step": 138637, "epoch": 3300} {"train_loss": -6.828864574432373, "global_step": 138638, "epoch": 3300} {"train_loss": -6.754382133483887, "global_step": 138639, "epoch": 3300} {"train_loss": -6.804479122161865, "global_step": 138640, "epoch": 3300} {"train_loss": -6.754548367999849, "global_step": 138641, "epoch": 3300, "train/sim_max_reward_0": 0.7150331838158351, "train/sim_max_reward_1": 0.9037541364483317, "train/sim_max_reward_2": 0.47730115747178453, "train/sim_max_reward_3": 0.9449496276492557, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.2102727760792111, "test/sim_max_reward_4300000": 0.7799425386593478, "test/sim_max_reward_4300001": 0.31390884506551875, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.7290092297743608, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9031873853624954, "test/sim_max_reward_4300006": 0.9780333383100862, "test/sim_max_reward_4300007": 0.9723350551884303, "test/sim_max_reward_4300008": 0.9852401713446375, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.2986648343680922, "test/sim_max_reward_4300012": 0.8754710904687717, "test/sim_max_reward_4300013": 0.9870671526432369, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.984368603639988, "test/sim_max_reward_4300016": 0.9288536858446107, "test/sim_max_reward_4300017": 0.5488291665682704, "test/sim_max_reward_4300018": 0.4476998229506382, "test/sim_max_reward_4300019": 0.18586680222112928, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9818785255678983, "test/sim_max_reward_4300022": 0.35161515066120097, "test/sim_max_reward_4300023": 0.3282625408963851, "test/sim_max_reward_4300024": 0.9775268404887012, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.18662748758402145, "test/sim_max_reward_4300027": 0.8133221090243148, "test/sim_max_reward_4300028": 1.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.2053124868802306, "test/sim_max_reward_4300031": 0.2618455066542292, "test/sim_max_reward_4300032": 0.9611445480146551, "test/sim_max_reward_4300033": 0.624793208969552, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.8227822140734182, "test/sim_max_reward_4300036": 0.2128540191624104, "test/sim_max_reward_4300037": 0.9240945822030099, "test/sim_max_reward_4300038": 0.6562364462302672, "test/sim_max_reward_4300039": 0.8896225946573331, "test/sim_max_reward_4300040": 0.9091800921612313, "test/sim_max_reward_4300041": 0.9604511298782118, "test/sim_max_reward_4300042": 0.720638079225257, "test/sim_max_reward_4300043": 0.01912165197990456, "test/sim_max_reward_4300044": 0.9698318950188048, "test/sim_max_reward_4300045": 0.19738431528883826, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.15239711213625334, "test/sim_max_reward_4300048": 0.222616099728707, "test/sim_max_reward_4300049": 0.30424597693618866, "train/mean_score": 0.7085518135774032, "test/mean_score": 0.6117619288127986, "val_loss": 67153.421875} {"train_loss": -6.783685684204102, "global_step": 138642, "epoch": 3301} {"train_loss": -6.791229724884033, "global_step": 138643, "epoch": 3301} {"train_loss": -6.897058963775635, "global_step": 138644, "epoch": 3301} {"train_loss": -6.783502578735352, "global_step": 138645, "epoch": 3301} {"train_loss": -6.830875396728516, "global_step": 138646, "epoch": 3301} {"train_loss": -6.747939109802246, "global_step": 138647, "epoch": 3301} {"train_loss": -6.7635698318481445, "global_step": 138648, "epoch": 3301} {"train_loss": -6.7697553634643555, "global_step": 138649, "epoch": 3301} {"train_loss": -6.783620834350586, "global_step": 138650, "epoch": 3301} {"train_loss": -6.841119289398193, "global_step": 138651, "epoch": 3301} {"train_loss": -6.722908973693848, "global_step": 138652, "epoch": 3301} {"train_loss": -6.726293563842773, "global_step": 138653, "epoch": 3301} {"train_loss": -6.71037483215332, "global_step": 138654, "epoch": 3301} {"train_loss": -6.780807971954346, "global_step": 138655, "epoch": 3301} {"train_loss": -6.834012985229492, "global_step": 138656, "epoch": 3301} {"train_loss": -6.747729301452637, "global_step": 138657, "epoch": 3301} {"train_loss": -6.903323173522949, "global_step": 138658, "epoch": 3301} {"train_loss": -6.759259223937988, "global_step": 138659, "epoch": 3301} {"train_loss": -6.731499671936035, "global_step": 138660, "epoch": 3301} {"train_loss": -6.651192665100098, "global_step": 138661, "epoch": 3301} {"train_loss": -6.7043585777282715, "global_step": 138662, "epoch": 3301} {"train_loss": -6.711728572845459, "global_step": 138663, "epoch": 3301} {"train_loss": -6.797961711883545, "global_step": 138664, "epoch": 3301} {"train_loss": -6.708211898803711, "global_step": 138665, "epoch": 3301} {"train_loss": -6.788738250732422, "global_step": 138666, "epoch": 3301} {"train_loss": -6.882224082946777, "global_step": 138667, "epoch": 3301} {"train_loss": -6.736835479736328, "global_step": 138668, "epoch": 3301} {"train_loss": -6.7905120849609375, "global_step": 138669, "epoch": 3301} {"train_loss": -6.722434043884277, "global_step": 138670, "epoch": 3301} {"train_loss": -6.727206230163574, "global_step": 138671, "epoch": 3301} {"train_loss": -6.859048843383789, "global_step": 138672, "epoch": 3301} {"train_loss": -6.7288055419921875, "global_step": 138673, "epoch": 3301} {"train_loss": -6.899030685424805, "global_step": 138674, "epoch": 3301} {"train_loss": -6.850559711456299, "global_step": 138675, "epoch": 3301} {"train_loss": -6.716883659362793, "global_step": 138676, "epoch": 3301} {"train_loss": -6.8198699951171875, "global_step": 138677, "epoch": 3301} {"train_loss": -6.790455341339111, "global_step": 138678, "epoch": 3301} {"train_loss": -6.8393096923828125, "global_step": 138679, "epoch": 3301} {"train_loss": -6.847334861755371, "global_step": 138680, "epoch": 3301} {"train_loss": -6.723482608795166, "global_step": 138681, "epoch": 3301} {"train_loss": -6.810606002807617, "global_step": 138682, "epoch": 3301} {"train_loss": -6.781733297166371, "global_step": 138683, "epoch": 3301, "val_loss": 67091.484375} {"train_loss": -6.735395431518555, "global_step": 138684, "epoch": 3302} {"train_loss": -6.764223098754883, "global_step": 138685, "epoch": 3302} {"train_loss": -6.83067512512207, "global_step": 138686, "epoch": 3302} {"train_loss": -6.7315874099731445, "global_step": 138687, "epoch": 3302} {"train_loss": -6.805379867553711, "global_step": 138688, "epoch": 3302} {"train_loss": -6.849570274353027, "global_step": 138689, "epoch": 3302} {"train_loss": -6.893774032592773, "global_step": 138690, "epoch": 3302} {"train_loss": -6.644920825958252, "global_step": 138691, "epoch": 3302} {"train_loss": -6.804143905639648, "global_step": 138692, "epoch": 3302} {"train_loss": -6.7737956047058105, "global_step": 138693, "epoch": 3302} {"train_loss": -6.73915958404541, "global_step": 138694, "epoch": 3302} {"train_loss": -6.780706405639648, "global_step": 138695, "epoch": 3302} {"train_loss": -6.8808088302612305, "global_step": 138696, "epoch": 3302} {"train_loss": -6.765063285827637, "global_step": 138697, "epoch": 3302} {"train_loss": -6.880948066711426, "global_step": 138698, "epoch": 3302} {"train_loss": -6.817808151245117, "global_step": 138699, "epoch": 3302} {"train_loss": -6.750405311584473, "global_step": 138700, "epoch": 3302} {"train_loss": -6.663115501403809, "global_step": 138701, "epoch": 3302} {"train_loss": -6.758268356323242, "global_step": 138702, "epoch": 3302} {"train_loss": -6.711993217468262, "global_step": 138703, "epoch": 3302} {"train_loss": -6.751519203186035, "global_step": 138704, "epoch": 3302} {"train_loss": -6.738242149353027, "global_step": 138705, "epoch": 3302} {"train_loss": -6.791003704071045, "global_step": 138706, "epoch": 3302} {"train_loss": -6.708586692810059, "global_step": 138707, "epoch": 3302} {"train_loss": -6.848466873168945, "global_step": 138708, "epoch": 3302} {"train_loss": -6.693369388580322, "global_step": 138709, "epoch": 3302} {"train_loss": -6.840175628662109, "global_step": 138710, "epoch": 3302} {"train_loss": -6.750964164733887, "global_step": 138711, "epoch": 3302} {"train_loss": -6.734155654907227, "global_step": 138712, "epoch": 3302} {"train_loss": -6.621431827545166, "global_step": 138713, "epoch": 3302} {"train_loss": -6.697790145874023, "global_step": 138714, "epoch": 3302} {"train_loss": -6.68647575378418, "global_step": 138715, "epoch": 3302} {"train_loss": -6.645956993103027, "global_step": 138716, "epoch": 3302} {"train_loss": -6.735272407531738, "global_step": 138717, "epoch": 3302} {"train_loss": -6.807592391967773, "global_step": 138718, "epoch": 3302} {"train_loss": -6.689948558807373, "global_step": 138719, "epoch": 3302} {"train_loss": -6.72025203704834, "global_step": 138720, "epoch": 3302} {"train_loss": -6.826135635375977, "global_step": 138721, "epoch": 3302} {"train_loss": -6.757571220397949, "global_step": 138722, "epoch": 3302} {"train_loss": -6.791985511779785, "global_step": 138723, "epoch": 3302} {"train_loss": -6.747626781463623, "global_step": 138724, "epoch": 3302} {"train_loss": -6.759576138995943, "global_step": 138725, "epoch": 3302, "val_loss": 67377.3828125} {"train_loss": -6.675841331481934, "global_step": 138726, "epoch": 3303} {"train_loss": -6.735923767089844, "global_step": 138727, "epoch": 3303} {"train_loss": -6.705843925476074, "global_step": 138728, "epoch": 3303} {"train_loss": -6.722319602966309, "global_step": 138729, "epoch": 3303} {"train_loss": -6.759577751159668, "global_step": 138730, "epoch": 3303} {"train_loss": -6.8512163162231445, "global_step": 138731, "epoch": 3303} {"train_loss": -6.7434563636779785, "global_step": 138732, "epoch": 3303} {"train_loss": -6.60935115814209, "global_step": 138733, "epoch": 3303} {"train_loss": -6.74359130859375, "global_step": 138734, "epoch": 3303} {"train_loss": -6.73922061920166, "global_step": 138735, "epoch": 3303} {"train_loss": -6.743842124938965, "global_step": 138736, "epoch": 3303} {"train_loss": -6.759212970733643, "global_step": 138737, "epoch": 3303} {"train_loss": -6.766178607940674, "global_step": 138738, "epoch": 3303} {"train_loss": -6.7980499267578125, "global_step": 138739, "epoch": 3303} {"train_loss": -6.802643775939941, "global_step": 138740, "epoch": 3303} {"train_loss": -6.729970932006836, "global_step": 138741, "epoch": 3303} {"train_loss": -6.674922943115234, "global_step": 138742, "epoch": 3303} {"train_loss": -6.718357086181641, "global_step": 138743, "epoch": 3303} {"train_loss": -6.568197250366211, "global_step": 138744, "epoch": 3303} {"train_loss": -6.777676105499268, "global_step": 138745, "epoch": 3303} {"train_loss": -6.6753644943237305, "global_step": 138746, "epoch": 3303} {"train_loss": -6.6782379150390625, "global_step": 138747, "epoch": 3303} {"train_loss": -6.660552024841309, "global_step": 138748, "epoch": 3303} {"train_loss": -6.685965538024902, "global_step": 138749, "epoch": 3303} {"train_loss": -6.696544647216797, "global_step": 138750, "epoch": 3303} {"train_loss": -6.605940818786621, "global_step": 138751, "epoch": 3303} {"train_loss": -6.722249507904053, "global_step": 138752, "epoch": 3303} {"train_loss": -6.685980796813965, "global_step": 138753, "epoch": 3303} {"train_loss": -6.696854591369629, "global_step": 138754, "epoch": 3303} {"train_loss": -6.67558479309082, "global_step": 138755, "epoch": 3303} {"train_loss": -6.628653526306152, "global_step": 138756, "epoch": 3303} {"train_loss": -6.7003278732299805, "global_step": 138757, "epoch": 3303} {"train_loss": -6.566031455993652, "global_step": 138758, "epoch": 3303} {"train_loss": -6.711817741394043, "global_step": 138759, "epoch": 3303} {"train_loss": -6.737788200378418, "global_step": 138760, "epoch": 3303} {"train_loss": -6.794706344604492, "global_step": 138761, "epoch": 3303} {"train_loss": -6.721739768981934, "global_step": 138762, "epoch": 3303} {"train_loss": -6.745963096618652, "global_step": 138763, "epoch": 3303} {"train_loss": -6.650668144226074, "global_step": 138764, "epoch": 3303} {"train_loss": -6.6040496826171875, "global_step": 138765, "epoch": 3303} {"train_loss": -6.823787689208984, "global_step": 138766, "epoch": 3303} {"train_loss": -6.708441802433559, "global_step": 138767, "epoch": 3303, "val_loss": 67462.359375} {"train_loss": -6.769721508026123, "global_step": 138768, "epoch": 3304} {"train_loss": -6.662148952484131, "global_step": 138769, "epoch": 3304} {"train_loss": -6.796435356140137, "global_step": 138770, "epoch": 3304} {"train_loss": -6.7708635330200195, "global_step": 138771, "epoch": 3304} {"train_loss": -6.719635009765625, "global_step": 138772, "epoch": 3304} {"train_loss": -6.708248138427734, "global_step": 138773, "epoch": 3304} {"train_loss": -6.79261589050293, "global_step": 138774, "epoch": 3304} {"train_loss": -6.809013843536377, "global_step": 138775, "epoch": 3304} {"train_loss": -6.9061384201049805, "global_step": 138776, "epoch": 3304} {"train_loss": -6.8368940353393555, "global_step": 138777, "epoch": 3304} {"train_loss": -6.8477373123168945, "global_step": 138778, "epoch": 3304} {"train_loss": -6.77454948425293, "global_step": 138779, "epoch": 3304} {"train_loss": -6.818060874938965, "global_step": 138780, "epoch": 3304} {"train_loss": -6.594643592834473, "global_step": 138781, "epoch": 3304} {"train_loss": -6.807722091674805, "global_step": 138782, "epoch": 3304} {"train_loss": -6.68699836730957, "global_step": 138783, "epoch": 3304} {"train_loss": -6.825673580169678, "global_step": 138784, "epoch": 3304} {"train_loss": -6.745213508605957, "global_step": 138785, "epoch": 3304} {"train_loss": -6.800393104553223, "global_step": 138786, "epoch": 3304} {"train_loss": -6.819319725036621, "global_step": 138787, "epoch": 3304} {"train_loss": -6.763869285583496, "global_step": 138788, "epoch": 3304} {"train_loss": -6.886465549468994, "global_step": 138789, "epoch": 3304} {"train_loss": -6.730409622192383, "global_step": 138790, "epoch": 3304} {"train_loss": -6.654209136962891, "global_step": 138791, "epoch": 3304} {"train_loss": -6.725948333740234, "global_step": 138792, "epoch": 3304} {"train_loss": -6.721956253051758, "global_step": 138793, "epoch": 3304} {"train_loss": -6.893715858459473, "global_step": 138794, "epoch": 3304} {"train_loss": -6.778943061828613, "global_step": 138795, "epoch": 3304} {"train_loss": -6.7860565185546875, "global_step": 138796, "epoch": 3304} {"train_loss": -6.876858711242676, "global_step": 138797, "epoch": 3304} {"train_loss": -6.844707489013672, "global_step": 138798, "epoch": 3304} {"train_loss": -6.876987934112549, "global_step": 138799, "epoch": 3304} {"train_loss": -6.757086753845215, "global_step": 138800, "epoch": 3304} {"train_loss": -6.750845909118652, "global_step": 138801, "epoch": 3304} {"train_loss": -6.723752975463867, "global_step": 138802, "epoch": 3304} {"train_loss": -6.672626972198486, "global_step": 138803, "epoch": 3304} {"train_loss": -6.795139312744141, "global_step": 138804, "epoch": 3304} {"train_loss": -6.838501453399658, "global_step": 138805, "epoch": 3304} {"train_loss": -6.76558780670166, "global_step": 138806, "epoch": 3304} {"train_loss": -6.7708845138549805, "global_step": 138807, "epoch": 3304} {"train_loss": -6.796236991882324, "global_step": 138808, "epoch": 3304} {"train_loss": -6.776848804383051, "global_step": 138809, "epoch": 3304, "val_loss": 67030.5546875} {"train_loss": -6.810482025146484, "global_step": 138810, "epoch": 3305} {"train_loss": -6.794648170471191, "global_step": 138811, "epoch": 3305} {"train_loss": -6.828056335449219, "global_step": 138812, "epoch": 3305} {"train_loss": -6.730891704559326, "global_step": 138813, "epoch": 3305} {"train_loss": -6.813779830932617, "global_step": 138814, "epoch": 3305} {"train_loss": -6.840124130249023, "global_step": 138815, "epoch": 3305} {"train_loss": -6.939530372619629, "global_step": 138816, "epoch": 3305} {"train_loss": -6.875773906707764, "global_step": 138817, "epoch": 3305} {"train_loss": -6.778512477874756, "global_step": 138818, "epoch": 3305} {"train_loss": -6.869165420532227, "global_step": 138819, "epoch": 3305} {"train_loss": -6.781095027923584, "global_step": 138820, "epoch": 3305} {"train_loss": -6.810538291931152, "global_step": 138821, "epoch": 3305} {"train_loss": -6.904045104980469, "global_step": 138822, "epoch": 3305} {"train_loss": -6.755692481994629, "global_step": 138823, "epoch": 3305} {"train_loss": -6.728393077850342, "global_step": 138824, "epoch": 3305} {"train_loss": -6.736197471618652, "global_step": 138825, "epoch": 3305} {"train_loss": -6.790135383605957, "global_step": 138826, "epoch": 3305} {"train_loss": -6.688694953918457, "global_step": 138827, "epoch": 3305} {"train_loss": -6.821847915649414, "global_step": 138828, "epoch": 3305} {"train_loss": -6.600428104400635, "global_step": 138829, "epoch": 3305} {"train_loss": -6.714277267456055, "global_step": 138830, "epoch": 3305} {"train_loss": -6.771679878234863, "global_step": 138831, "epoch": 3305} {"train_loss": -6.5746355056762695, "global_step": 138832, "epoch": 3305} {"train_loss": -6.7565717697143555, "global_step": 138833, "epoch": 3305} {"train_loss": -6.754526138305664, "global_step": 138834, "epoch": 3305} {"train_loss": -6.72776985168457, "global_step": 138835, "epoch": 3305} {"train_loss": -6.90073299407959, "global_step": 138836, "epoch": 3305} {"train_loss": -6.788896083831787, "global_step": 138837, "epoch": 3305} {"train_loss": -6.6532673835754395, "global_step": 138838, "epoch": 3305} {"train_loss": -6.804279327392578, "global_step": 138839, "epoch": 3305} {"train_loss": -6.743558883666992, "global_step": 138840, "epoch": 3305} {"train_loss": -6.73973274230957, "global_step": 138841, "epoch": 3305} {"train_loss": -6.861985206604004, "global_step": 138842, "epoch": 3305} {"train_loss": -6.735705375671387, "global_step": 138843, "epoch": 3305} {"train_loss": -6.783685684204102, "global_step": 138844, "epoch": 3305} {"train_loss": -6.781764030456543, "global_step": 138845, "epoch": 3305} {"train_loss": -6.731627941131592, "global_step": 138846, "epoch": 3305} {"train_loss": -6.579050064086914, "global_step": 138847, "epoch": 3305} {"train_loss": -6.754003524780273, "global_step": 138848, "epoch": 3305} {"train_loss": -6.709153175354004, "global_step": 138849, "epoch": 3305} {"train_loss": -6.662762641906738, "global_step": 138850, "epoch": 3305} {"train_loss": -6.767265876134236, "global_step": 138851, "epoch": 3305, "val_loss": 67299.9375} {"train_loss": -6.683651924133301, "global_step": 138852, "epoch": 3306} {"train_loss": -6.691330432891846, "global_step": 138853, "epoch": 3306} {"train_loss": -6.662996768951416, "global_step": 138854, "epoch": 3306} {"train_loss": -6.720461368560791, "global_step": 138855, "epoch": 3306} {"train_loss": -6.802509307861328, "global_step": 138856, "epoch": 3306} {"train_loss": -6.706598281860352, "global_step": 138857, "epoch": 3306} {"train_loss": -6.704946517944336, "global_step": 138858, "epoch": 3306} {"train_loss": -6.7035136222839355, "global_step": 138859, "epoch": 3306} {"train_loss": -6.672609806060791, "global_step": 138860, "epoch": 3306} {"train_loss": -6.7488555908203125, "global_step": 138861, "epoch": 3306} {"train_loss": -6.64423942565918, "global_step": 138862, "epoch": 3306} {"train_loss": -6.670986175537109, "global_step": 138863, "epoch": 3306} {"train_loss": -6.656428813934326, "global_step": 138864, "epoch": 3306} {"train_loss": -6.685533046722412, "global_step": 138865, "epoch": 3306} {"train_loss": -6.630250930786133, "global_step": 138866, "epoch": 3306} {"train_loss": -6.706089496612549, "global_step": 138867, "epoch": 3306} {"train_loss": -6.588741779327393, "global_step": 138868, "epoch": 3306} {"train_loss": -6.678029537200928, "global_step": 138869, "epoch": 3306} {"train_loss": -6.625248432159424, "global_step": 138870, "epoch": 3306} {"train_loss": -6.739272594451904, "global_step": 138871, "epoch": 3306} {"train_loss": -6.720090866088867, "global_step": 138872, "epoch": 3306} {"train_loss": -6.733353614807129, "global_step": 138873, "epoch": 3306} {"train_loss": -6.7840352058410645, "global_step": 138874, "epoch": 3306} {"train_loss": -6.641603946685791, "global_step": 138875, "epoch": 3306} {"train_loss": -6.795212745666504, "global_step": 138876, "epoch": 3306} {"train_loss": -6.705273628234863, "global_step": 138877, "epoch": 3306} {"train_loss": -6.7760725021362305, "global_step": 138878, "epoch": 3306} {"train_loss": -6.745269775390625, "global_step": 138879, "epoch": 3306} {"train_loss": -6.719949722290039, "global_step": 138880, "epoch": 3306} {"train_loss": -6.683510780334473, "global_step": 138881, "epoch": 3306} {"train_loss": -6.674215316772461, "global_step": 138882, "epoch": 3306} {"train_loss": -6.738551616668701, "global_step": 138883, "epoch": 3306} {"train_loss": -6.771432876586914, "global_step": 138884, "epoch": 3306} {"train_loss": -6.626355171203613, "global_step": 138885, "epoch": 3306} {"train_loss": -6.682713985443115, "global_step": 138886, "epoch": 3306} {"train_loss": -6.860952377319336, "global_step": 138887, "epoch": 3306} {"train_loss": -6.794855117797852, "global_step": 138888, "epoch": 3306} {"train_loss": -6.713544845581055, "global_step": 138889, "epoch": 3306} {"train_loss": -6.763279438018799, "global_step": 138890, "epoch": 3306} {"train_loss": -6.7570414543151855, "global_step": 138891, "epoch": 3306} {"train_loss": -6.745626449584961, "global_step": 138892, "epoch": 3306} {"train_loss": -6.709928330920992, "global_step": 138893, "epoch": 3306, "val_loss": 67108.7421875} {"train_loss": -6.706093788146973, "global_step": 138894, "epoch": 3307} {"train_loss": -6.742910385131836, "global_step": 138895, "epoch": 3307} {"train_loss": -6.671483993530273, "global_step": 138896, "epoch": 3307} {"train_loss": -6.817173480987549, "global_step": 138897, "epoch": 3307} {"train_loss": -6.820793151855469, "global_step": 138898, "epoch": 3307} {"train_loss": -6.651148796081543, "global_step": 138899, "epoch": 3307} {"train_loss": -6.742473125457764, "global_step": 138900, "epoch": 3307} {"train_loss": -6.737540245056152, "global_step": 138901, "epoch": 3307} {"train_loss": -6.657018184661865, "global_step": 138902, "epoch": 3307} {"train_loss": -6.750604629516602, "global_step": 138903, "epoch": 3307} {"train_loss": -6.821585655212402, "global_step": 138904, "epoch": 3307} {"train_loss": -6.781294822692871, "global_step": 138905, "epoch": 3307} {"train_loss": -6.834754467010498, "global_step": 138906, "epoch": 3307} {"train_loss": -6.787397384643555, "global_step": 138907, "epoch": 3307} {"train_loss": -6.755159854888916, "global_step": 138908, "epoch": 3307} {"train_loss": -6.797313213348389, "global_step": 138909, "epoch": 3307} {"train_loss": -6.7600836753845215, "global_step": 138910, "epoch": 3307} {"train_loss": -6.7668609619140625, "global_step": 138911, "epoch": 3307} {"train_loss": -6.859234809875488, "global_step": 138912, "epoch": 3307} {"train_loss": -6.804544448852539, "global_step": 138913, "epoch": 3307} {"train_loss": -6.853055953979492, "global_step": 138914, "epoch": 3307} {"train_loss": -6.773795127868652, "global_step": 138915, "epoch": 3307} {"train_loss": -6.773116111755371, "global_step": 138916, "epoch": 3307} {"train_loss": -6.674397945404053, "global_step": 138917, "epoch": 3307} {"train_loss": -6.790197372436523, "global_step": 138918, "epoch": 3307} {"train_loss": -6.735631942749023, "global_step": 138919, "epoch": 3307} {"train_loss": -6.8683552742004395, "global_step": 138920, "epoch": 3307} {"train_loss": -6.849203109741211, "global_step": 138921, "epoch": 3307} {"train_loss": -6.652759552001953, "global_step": 138922, "epoch": 3307} {"train_loss": -6.882791042327881, "global_step": 138923, "epoch": 3307} {"train_loss": -6.901972770690918, "global_step": 138924, "epoch": 3307} {"train_loss": -6.79131555557251, "global_step": 138925, "epoch": 3307} {"train_loss": -6.805067539215088, "global_step": 138926, "epoch": 3307} {"train_loss": -6.927980899810791, "global_step": 138927, "epoch": 3307} {"train_loss": -6.803582191467285, "global_step": 138928, "epoch": 3307} {"train_loss": -6.673348426818848, "global_step": 138929, "epoch": 3307} {"train_loss": -6.766176223754883, "global_step": 138930, "epoch": 3307} {"train_loss": -6.809812068939209, "global_step": 138931, "epoch": 3307} {"train_loss": -6.732098579406738, "global_step": 138932, "epoch": 3307} {"train_loss": -6.723564147949219, "global_step": 138933, "epoch": 3307} {"train_loss": -6.658758163452148, "global_step": 138934, "epoch": 3307} {"train_loss": -6.774469375610352, "global_step": 138935, "epoch": 3307, "val_loss": 67065.6015625} {"train_loss": -6.850746154785156, "global_step": 138936, "epoch": 3308} {"train_loss": -6.693234443664551, "global_step": 138937, "epoch": 3308} {"train_loss": -6.840208053588867, "global_step": 138938, "epoch": 3308} {"train_loss": -6.827384948730469, "global_step": 138939, "epoch": 3308} {"train_loss": -6.676826477050781, "global_step": 138940, "epoch": 3308} {"train_loss": -6.853062629699707, "global_step": 138941, "epoch": 3308} {"train_loss": -6.790186882019043, "global_step": 138942, "epoch": 3308} {"train_loss": -6.846858978271484, "global_step": 138943, "epoch": 3308} {"train_loss": -6.848021507263184, "global_step": 138944, "epoch": 3308} {"train_loss": -6.719768047332764, "global_step": 138945, "epoch": 3308} {"train_loss": -6.756742477416992, "global_step": 138946, "epoch": 3308} {"train_loss": -6.70859432220459, "global_step": 138947, "epoch": 3308} {"train_loss": -6.752866744995117, "global_step": 138948, "epoch": 3308} {"train_loss": -6.7073655128479, "global_step": 138949, "epoch": 3308} {"train_loss": -6.81705379486084, "global_step": 138950, "epoch": 3308} {"train_loss": -6.760191917419434, "global_step": 138951, "epoch": 3308} {"train_loss": -6.733187675476074, "global_step": 138952, "epoch": 3308} {"train_loss": -6.826375961303711, "global_step": 138953, "epoch": 3308} {"train_loss": -6.690586090087891, "global_step": 138954, "epoch": 3308} {"train_loss": -6.818662643432617, "global_step": 138955, "epoch": 3308} {"train_loss": -6.767602920532227, "global_step": 138956, "epoch": 3308} {"train_loss": -6.850052356719971, "global_step": 138957, "epoch": 3308} {"train_loss": -6.660788536071777, "global_step": 138958, "epoch": 3308} {"train_loss": -6.586677551269531, "global_step": 138959, "epoch": 3308} {"train_loss": -6.797633171081543, "global_step": 138960, "epoch": 3308} {"train_loss": -6.689942836761475, "global_step": 138961, "epoch": 3308} {"train_loss": -6.822513103485107, "global_step": 138962, "epoch": 3308} {"train_loss": -6.7641520500183105, "global_step": 138963, "epoch": 3308} {"train_loss": -6.804166316986084, "global_step": 138964, "epoch": 3308} {"train_loss": -6.780084609985352, "global_step": 138965, "epoch": 3308} {"train_loss": -6.833727836608887, "global_step": 138966, "epoch": 3308} {"train_loss": -6.670747756958008, "global_step": 138967, "epoch": 3308} {"train_loss": -6.681089401245117, "global_step": 138968, "epoch": 3308} {"train_loss": -6.806135654449463, "global_step": 138969, "epoch": 3308} {"train_loss": -6.7079362869262695, "global_step": 138970, "epoch": 3308} {"train_loss": -6.7484588623046875, "global_step": 138971, "epoch": 3308} {"train_loss": -6.6392011642456055, "global_step": 138972, "epoch": 3308} {"train_loss": -6.733128070831299, "global_step": 138973, "epoch": 3308} {"train_loss": -6.721037864685059, "global_step": 138974, "epoch": 3308} {"train_loss": -6.784388542175293, "global_step": 138975, "epoch": 3308} {"train_loss": -6.744618892669678, "global_step": 138976, "epoch": 3308} {"train_loss": -6.758235079901559, "global_step": 138977, "epoch": 3308, "val_loss": 67268.234375} {"train_loss": -6.582729339599609, "global_step": 138978, "epoch": 3309} {"train_loss": -6.819889068603516, "global_step": 138979, "epoch": 3309} {"train_loss": -6.895299434661865, "global_step": 138980, "epoch": 3309} {"train_loss": -6.691104412078857, "global_step": 138981, "epoch": 3309} {"train_loss": -6.738097667694092, "global_step": 138982, "epoch": 3309} {"train_loss": -6.902626991271973, "global_step": 138983, "epoch": 3309} {"train_loss": -6.835155487060547, "global_step": 138984, "epoch": 3309} {"train_loss": -6.675533294677734, "global_step": 138985, "epoch": 3309} {"train_loss": -6.86870002746582, "global_step": 138986, "epoch": 3309} {"train_loss": -6.843984603881836, "global_step": 138987, "epoch": 3309} {"train_loss": -6.707626819610596, "global_step": 138988, "epoch": 3309} {"train_loss": -6.688565731048584, "global_step": 138989, "epoch": 3309} {"train_loss": -6.676991939544678, "global_step": 138990, "epoch": 3309} {"train_loss": -6.851670265197754, "global_step": 138991, "epoch": 3309} {"train_loss": -6.676856994628906, "global_step": 138992, "epoch": 3309} {"train_loss": -6.738814353942871, "global_step": 138993, "epoch": 3309} {"train_loss": -6.766417026519775, "global_step": 138994, "epoch": 3309} {"train_loss": -6.787644386291504, "global_step": 138995, "epoch": 3309} {"train_loss": -6.899821758270264, "global_step": 138996, "epoch": 3309} {"train_loss": -6.882842540740967, "global_step": 138997, "epoch": 3309} {"train_loss": -6.840344429016113, "global_step": 138998, "epoch": 3309} {"train_loss": -6.718238353729248, "global_step": 138999, "epoch": 3309} {"train_loss": -6.783477783203125, "global_step": 139000, "epoch": 3309} {"train_loss": -6.846417427062988, "global_step": 139001, "epoch": 3309} {"train_loss": -6.731935501098633, "global_step": 139002, "epoch": 3309} {"train_loss": -6.807399749755859, "global_step": 139003, "epoch": 3309} {"train_loss": -6.785363674163818, "global_step": 139004, "epoch": 3309} {"train_loss": -6.722947120666504, "global_step": 139005, "epoch": 3309} {"train_loss": -6.863421440124512, "global_step": 139006, "epoch": 3309} {"train_loss": -6.809150695800781, "global_step": 139007, "epoch": 3309} {"train_loss": -6.764286518096924, "global_step": 139008, "epoch": 3309} {"train_loss": -6.830455780029297, "global_step": 139009, "epoch": 3309} {"train_loss": -6.864129066467285, "global_step": 139010, "epoch": 3309} {"train_loss": -6.887128829956055, "global_step": 139011, "epoch": 3309} {"train_loss": -6.752974510192871, "global_step": 139012, "epoch": 3309} {"train_loss": -6.7434163093566895, "global_step": 139013, "epoch": 3309} {"train_loss": -6.803624153137207, "global_step": 139014, "epoch": 3309} {"train_loss": -6.585168838500977, "global_step": 139015, "epoch": 3309} {"train_loss": -6.59214973449707, "global_step": 139016, "epoch": 3309} {"train_loss": -6.840708255767822, "global_step": 139017, "epoch": 3309} {"train_loss": -6.678466320037842, "global_step": 139018, "epoch": 3309} {"train_loss": -6.773333708445231, "global_step": 139019, "epoch": 3309, "val_loss": 67406.2578125} {"train_loss": -6.685372352600098, "global_step": 139020, "epoch": 3310} {"train_loss": -6.5777082443237305, "global_step": 139021, "epoch": 3310} {"train_loss": -6.695132255554199, "global_step": 139022, "epoch": 3310} {"train_loss": -6.728865146636963, "global_step": 139023, "epoch": 3310} {"train_loss": -6.6331658363342285, "global_step": 139024, "epoch": 3310} {"train_loss": -6.736161708831787, "global_step": 139025, "epoch": 3310} {"train_loss": -6.860849857330322, "global_step": 139026, "epoch": 3310} {"train_loss": -6.7678608894348145, "global_step": 139027, "epoch": 3310} {"train_loss": -6.697136878967285, "global_step": 139028, "epoch": 3310} {"train_loss": -6.738710403442383, "global_step": 139029, "epoch": 3310} {"train_loss": -6.7570695877075195, "global_step": 139030, "epoch": 3310} {"train_loss": -6.773429870605469, "global_step": 139031, "epoch": 3310} {"train_loss": -6.76043701171875, "global_step": 139032, "epoch": 3310} {"train_loss": -6.773815631866455, "global_step": 139033, "epoch": 3310} {"train_loss": -6.730279445648193, "global_step": 139034, "epoch": 3310} {"train_loss": -6.646521091461182, "global_step": 139035, "epoch": 3310} {"train_loss": -6.731287956237793, "global_step": 139036, "epoch": 3310} {"train_loss": -6.700187683105469, "global_step": 139037, "epoch": 3310} {"train_loss": -6.722322463989258, "global_step": 139038, "epoch": 3310} {"train_loss": -6.713623046875, "global_step": 139039, "epoch": 3310} {"train_loss": -6.8113627433776855, "global_step": 139040, "epoch": 3310} {"train_loss": -6.772243976593018, "global_step": 139041, "epoch": 3310} {"train_loss": -6.729830265045166, "global_step": 139042, "epoch": 3310} {"train_loss": -6.6352739334106445, "global_step": 139043, "epoch": 3310} {"train_loss": -6.844527244567871, "global_step": 139044, "epoch": 3310} {"train_loss": -6.7788591384887695, "global_step": 139045, "epoch": 3310} {"train_loss": -6.809365272521973, "global_step": 139046, "epoch": 3310} {"train_loss": -6.7633056640625, "global_step": 139047, "epoch": 3310} {"train_loss": -6.764232635498047, "global_step": 139048, "epoch": 3310} {"train_loss": -6.692851543426514, "global_step": 139049, "epoch": 3310} {"train_loss": -6.680132865905762, "global_step": 139050, "epoch": 3310} {"train_loss": -6.707267761230469, "global_step": 139051, "epoch": 3310} {"train_loss": -6.783583641052246, "global_step": 139052, "epoch": 3310} {"train_loss": -6.644644737243652, "global_step": 139053, "epoch": 3310} {"train_loss": -6.613842964172363, "global_step": 139054, "epoch": 3310} {"train_loss": -6.810734272003174, "global_step": 139055, "epoch": 3310} {"train_loss": -6.596316337585449, "global_step": 139056, "epoch": 3310} {"train_loss": -6.767738342285156, "global_step": 139057, "epoch": 3310} {"train_loss": -6.619366645812988, "global_step": 139058, "epoch": 3310} {"train_loss": -6.680307388305664, "global_step": 139059, "epoch": 3310} {"train_loss": -6.629905700683594, "global_step": 139060, "epoch": 3310} {"train_loss": -6.719414336340768, "global_step": 139061, "epoch": 3310, "val_loss": 67351.9453125} {"train_loss": -6.66478157043457, "global_step": 139062, "epoch": 3311} {"train_loss": -6.719735145568848, "global_step": 139063, "epoch": 3311} {"train_loss": -6.667971611022949, "global_step": 139064, "epoch": 3311} {"train_loss": -6.568335056304932, "global_step": 139065, "epoch": 3311} {"train_loss": -6.666418075561523, "global_step": 139066, "epoch": 3311} {"train_loss": -6.657332420349121, "global_step": 139067, "epoch": 3311} {"train_loss": -6.606881141662598, "global_step": 139068, "epoch": 3311} {"train_loss": -6.594966411590576, "global_step": 139069, "epoch": 3311} {"train_loss": -6.718419551849365, "global_step": 139070, "epoch": 3311} {"train_loss": -6.696227073669434, "global_step": 139071, "epoch": 3311} {"train_loss": -6.674171447753906, "global_step": 139072, "epoch": 3311} {"train_loss": -6.808424949645996, "global_step": 139073, "epoch": 3311} {"train_loss": -6.6717400550842285, "global_step": 139074, "epoch": 3311} {"train_loss": -6.806233882904053, "global_step": 139075, "epoch": 3311} {"train_loss": -6.671018600463867, "global_step": 139076, "epoch": 3311} {"train_loss": -6.688749313354492, "global_step": 139077, "epoch": 3311} {"train_loss": -6.64369535446167, "global_step": 139078, "epoch": 3311} {"train_loss": -6.681633949279785, "global_step": 139079, "epoch": 3311} {"train_loss": -6.739771842956543, "global_step": 139080, "epoch": 3311} {"train_loss": -6.817288398742676, "global_step": 139081, "epoch": 3311} {"train_loss": -6.775951385498047, "global_step": 139082, "epoch": 3311} {"train_loss": -6.749227523803711, "global_step": 139083, "epoch": 3311} {"train_loss": -6.78337287902832, "global_step": 139084, "epoch": 3311} {"train_loss": -6.826282978057861, "global_step": 139085, "epoch": 3311} {"train_loss": -6.661255836486816, "global_step": 139086, "epoch": 3311} {"train_loss": -6.775218486785889, "global_step": 139087, "epoch": 3311} {"train_loss": -6.863922119140625, "global_step": 139088, "epoch": 3311} {"train_loss": -6.667600631713867, "global_step": 139089, "epoch": 3311} {"train_loss": -6.8098978996276855, "global_step": 139090, "epoch": 3311} {"train_loss": -6.669680118560791, "global_step": 139091, "epoch": 3311} {"train_loss": -6.720668315887451, "global_step": 139092, "epoch": 3311} {"train_loss": -6.708372592926025, "global_step": 139093, "epoch": 3311} {"train_loss": -6.7199835777282715, "global_step": 139094, "epoch": 3311} {"train_loss": -6.711374282836914, "global_step": 139095, "epoch": 3311} {"train_loss": -6.792308807373047, "global_step": 139096, "epoch": 3311} {"train_loss": -6.6681671142578125, "global_step": 139097, "epoch": 3311} {"train_loss": -6.787548065185547, "global_step": 139098, "epoch": 3311} {"train_loss": -6.7716875076293945, "global_step": 139099, "epoch": 3311} {"train_loss": -6.761800765991211, "global_step": 139100, "epoch": 3311} {"train_loss": -6.8050031661987305, "global_step": 139101, "epoch": 3311} {"train_loss": -6.667433738708496, "global_step": 139102, "epoch": 3311} {"train_loss": -6.71973348799206, "global_step": 139103, "epoch": 3311, "val_loss": 67177.734375} {"train_loss": -6.766510009765625, "global_step": 139104, "epoch": 3312} {"train_loss": -6.683058738708496, "global_step": 139105, "epoch": 3312} {"train_loss": -6.740006446838379, "global_step": 139106, "epoch": 3312} {"train_loss": -6.775214195251465, "global_step": 139107, "epoch": 3312} {"train_loss": -6.800884246826172, "global_step": 139108, "epoch": 3312} {"train_loss": -6.896448135375977, "global_step": 139109, "epoch": 3312} {"train_loss": -6.767139911651611, "global_step": 139110, "epoch": 3312} {"train_loss": -6.796781063079834, "global_step": 139111, "epoch": 3312} {"train_loss": -6.775714874267578, "global_step": 139112, "epoch": 3312} {"train_loss": -6.740945816040039, "global_step": 139113, "epoch": 3312} {"train_loss": -6.8196187019348145, "global_step": 139114, "epoch": 3312} {"train_loss": -6.791522979736328, "global_step": 139115, "epoch": 3312} {"train_loss": -6.703653335571289, "global_step": 139116, "epoch": 3312} {"train_loss": -6.649971961975098, "global_step": 139117, "epoch": 3312} {"train_loss": -6.725954055786133, "global_step": 139118, "epoch": 3312} {"train_loss": -6.780117988586426, "global_step": 139119, "epoch": 3312} {"train_loss": -6.75229024887085, "global_step": 139120, "epoch": 3312} {"train_loss": -6.784642219543457, "global_step": 139121, "epoch": 3312} {"train_loss": -6.657139778137207, "global_step": 139122, "epoch": 3312} {"train_loss": -6.715595245361328, "global_step": 139123, "epoch": 3312} {"train_loss": -6.6877641677856445, "global_step": 139124, "epoch": 3312} {"train_loss": -6.7669219970703125, "global_step": 139125, "epoch": 3312} {"train_loss": -6.759942054748535, "global_step": 139126, "epoch": 3312} {"train_loss": -6.830044746398926, "global_step": 139127, "epoch": 3312} {"train_loss": -6.778295516967773, "global_step": 139128, "epoch": 3312} {"train_loss": -6.872152328491211, "global_step": 139129, "epoch": 3312} {"train_loss": -6.727933883666992, "global_step": 139130, "epoch": 3312} {"train_loss": -6.7159624099731445, "global_step": 139131, "epoch": 3312} {"train_loss": -6.9244585037231445, "global_step": 139132, "epoch": 3312} {"train_loss": -6.849956512451172, "global_step": 139133, "epoch": 3312} {"train_loss": -6.708513259887695, "global_step": 139134, "epoch": 3312} {"train_loss": -6.721563339233398, "global_step": 139135, "epoch": 3312} {"train_loss": -6.792355537414551, "global_step": 139136, "epoch": 3312} {"train_loss": -6.7363691329956055, "global_step": 139137, "epoch": 3312} {"train_loss": -6.749951362609863, "global_step": 139138, "epoch": 3312} {"train_loss": -6.812884330749512, "global_step": 139139, "epoch": 3312} {"train_loss": -6.746050834655762, "global_step": 139140, "epoch": 3312} {"train_loss": -6.732421875, "global_step": 139141, "epoch": 3312} {"train_loss": -6.677776336669922, "global_step": 139142, "epoch": 3312} {"train_loss": -6.780613899230957, "global_step": 139143, "epoch": 3312} {"train_loss": -6.726353645324707, "global_step": 139144, "epoch": 3312} {"train_loss": -6.765149388994489, "global_step": 139145, "epoch": 3312, "val_loss": 67096.1640625} {"train_loss": -6.6731181144714355, "global_step": 139146, "epoch": 3313} {"train_loss": -6.781341075897217, "global_step": 139147, "epoch": 3313} {"train_loss": -6.7873077392578125, "global_step": 139148, "epoch": 3313} {"train_loss": -6.759359359741211, "global_step": 139149, "epoch": 3313} {"train_loss": -6.787301540374756, "global_step": 139150, "epoch": 3313} {"train_loss": -6.727095603942871, "global_step": 139151, "epoch": 3313} {"train_loss": -6.7158708572387695, "global_step": 139152, "epoch": 3313} {"train_loss": -6.665806770324707, "global_step": 139153, "epoch": 3313} {"train_loss": -6.631913185119629, "global_step": 139154, "epoch": 3313} {"train_loss": -6.891360282897949, "global_step": 139155, "epoch": 3313} {"train_loss": -6.672682762145996, "global_step": 139156, "epoch": 3313} {"train_loss": -6.67429256439209, "global_step": 139157, "epoch": 3313} {"train_loss": -6.812559127807617, "global_step": 139158, "epoch": 3313} {"train_loss": -6.645327568054199, "global_step": 139159, "epoch": 3313} {"train_loss": -6.605686664581299, "global_step": 139160, "epoch": 3313} {"train_loss": -6.7706685066223145, "global_step": 139161, "epoch": 3313} {"train_loss": -6.704679012298584, "global_step": 139162, "epoch": 3313} {"train_loss": -6.609047889709473, "global_step": 139163, "epoch": 3313} {"train_loss": -6.753105163574219, "global_step": 139164, "epoch": 3313} {"train_loss": -6.513515472412109, "global_step": 139165, "epoch": 3313} {"train_loss": -6.747783660888672, "global_step": 139166, "epoch": 3313} {"train_loss": -6.684711456298828, "global_step": 139167, "epoch": 3313} {"train_loss": -6.747310161590576, "global_step": 139168, "epoch": 3313} {"train_loss": -6.790874481201172, "global_step": 139169, "epoch": 3313} {"train_loss": -6.6042799949646, "global_step": 139170, "epoch": 3313} {"train_loss": -6.720882415771484, "global_step": 139171, "epoch": 3313} {"train_loss": -6.617928504943848, "global_step": 139172, "epoch": 3313} {"train_loss": -6.654789924621582, "global_step": 139173, "epoch": 3313} {"train_loss": -6.765523433685303, "global_step": 139174, "epoch": 3313} {"train_loss": -6.713522911071777, "global_step": 139175, "epoch": 3313} {"train_loss": -6.58204460144043, "global_step": 139176, "epoch": 3313} {"train_loss": -6.802119255065918, "global_step": 139177, "epoch": 3313} {"train_loss": -6.66405725479126, "global_step": 139178, "epoch": 3313} {"train_loss": -6.7870097160339355, "global_step": 139179, "epoch": 3313} {"train_loss": -6.776476860046387, "global_step": 139180, "epoch": 3313} {"train_loss": -6.7566962242126465, "global_step": 139181, "epoch": 3313} {"train_loss": -6.7207465171813965, "global_step": 139182, "epoch": 3313} {"train_loss": -6.804570198059082, "global_step": 139183, "epoch": 3313} {"train_loss": -6.67713737487793, "global_step": 139184, "epoch": 3313} {"train_loss": -6.716721057891846, "global_step": 139185, "epoch": 3313} {"train_loss": -6.806318283081055, "global_step": 139186, "epoch": 3313} {"train_loss": -6.716674816040766, "global_step": 139187, "epoch": 3313, "val_loss": 67022.25} {"train_loss": -6.762134075164795, "global_step": 139188, "epoch": 3314} {"train_loss": -6.7532501220703125, "global_step": 139189, "epoch": 3314} {"train_loss": -6.710752010345459, "global_step": 139190, "epoch": 3314} {"train_loss": -6.780261039733887, "global_step": 139191, "epoch": 3314} {"train_loss": -6.714138031005859, "global_step": 139192, "epoch": 3314} {"train_loss": -6.8103532791137695, "global_step": 139193, "epoch": 3314} {"train_loss": -6.738348960876465, "global_step": 139194, "epoch": 3314} {"train_loss": -6.75075626373291, "global_step": 139195, "epoch": 3314} {"train_loss": -6.712654113769531, "global_step": 139196, "epoch": 3314} {"train_loss": -6.815093517303467, "global_step": 139197, "epoch": 3314} {"train_loss": -6.764155387878418, "global_step": 139198, "epoch": 3314} {"train_loss": -6.728072166442871, "global_step": 139199, "epoch": 3314} {"train_loss": -6.734813690185547, "global_step": 139200, "epoch": 3314} {"train_loss": -6.659630298614502, "global_step": 139201, "epoch": 3314} {"train_loss": -6.689632415771484, "global_step": 139202, "epoch": 3314} {"train_loss": -6.841533660888672, "global_step": 139203, "epoch": 3314} {"train_loss": -6.668397426605225, "global_step": 139204, "epoch": 3314} {"train_loss": -6.736358642578125, "global_step": 139205, "epoch": 3314} {"train_loss": -6.662079811096191, "global_step": 139206, "epoch": 3314} {"train_loss": -6.724613189697266, "global_step": 139207, "epoch": 3314} {"train_loss": -6.701316833496094, "global_step": 139208, "epoch": 3314} {"train_loss": -6.808072090148926, "global_step": 139209, "epoch": 3314} {"train_loss": -6.717116355895996, "global_step": 139210, "epoch": 3314} {"train_loss": -6.68839693069458, "global_step": 139211, "epoch": 3314} {"train_loss": -6.772478103637695, "global_step": 139212, "epoch": 3314} {"train_loss": -6.756742477416992, "global_step": 139213, "epoch": 3314} {"train_loss": -6.781560897827148, "global_step": 139214, "epoch": 3314} {"train_loss": -6.777712821960449, "global_step": 139215, "epoch": 3314} {"train_loss": -6.684377193450928, "global_step": 139216, "epoch": 3314} {"train_loss": -6.849729537963867, "global_step": 139217, "epoch": 3314} {"train_loss": -6.713507652282715, "global_step": 139218, "epoch": 3314} {"train_loss": -6.885656833648682, "global_step": 139219, "epoch": 3314} {"train_loss": -6.790949821472168, "global_step": 139220, "epoch": 3314} {"train_loss": -6.850109100341797, "global_step": 139221, "epoch": 3314} {"train_loss": -6.794586181640625, "global_step": 139222, "epoch": 3314} {"train_loss": -6.85084342956543, "global_step": 139223, "epoch": 3314} {"train_loss": -6.820961952209473, "global_step": 139224, "epoch": 3314} {"train_loss": -6.781252861022949, "global_step": 139225, "epoch": 3314} {"train_loss": -6.737239360809326, "global_step": 139226, "epoch": 3314} {"train_loss": -6.700203895568848, "global_step": 139227, "epoch": 3314} {"train_loss": -6.635059833526611, "global_step": 139228, "epoch": 3314} {"train_loss": -6.7531958648136685, "global_step": 139229, "epoch": 3314, "val_loss": 67362.8046875} {"train_loss": -6.797874450683594, "global_step": 139230, "epoch": 3315} {"train_loss": -6.729245185852051, "global_step": 139231, "epoch": 3315} {"train_loss": -6.6394243240356445, "global_step": 139232, "epoch": 3315} {"train_loss": -6.685102462768555, "global_step": 139233, "epoch": 3315} {"train_loss": -6.70008659362793, "global_step": 139234, "epoch": 3315} {"train_loss": -6.698103904724121, "global_step": 139235, "epoch": 3315} {"train_loss": -6.808011531829834, "global_step": 139236, "epoch": 3315} {"train_loss": -6.672462463378906, "global_step": 139237, "epoch": 3315} {"train_loss": -6.66108512878418, "global_step": 139238, "epoch": 3315} {"train_loss": -6.736105918884277, "global_step": 139239, "epoch": 3315} {"train_loss": -6.675118446350098, "global_step": 139240, "epoch": 3315} {"train_loss": -6.699109077453613, "global_step": 139241, "epoch": 3315} {"train_loss": -6.814217567443848, "global_step": 139242, "epoch": 3315} {"train_loss": -6.65008020401001, "global_step": 139243, "epoch": 3315} {"train_loss": -6.50526237487793, "global_step": 139244, "epoch": 3315} {"train_loss": -6.685281753540039, "global_step": 139245, "epoch": 3315} {"train_loss": -6.693821907043457, "global_step": 139246, "epoch": 3315} {"train_loss": -6.632870674133301, "global_step": 139247, "epoch": 3315} {"train_loss": -6.703595161437988, "global_step": 139248, "epoch": 3315} {"train_loss": -6.698247909545898, "global_step": 139249, "epoch": 3315} {"train_loss": -6.861220359802246, "global_step": 139250, "epoch": 3315} {"train_loss": -6.831596851348877, "global_step": 139251, "epoch": 3315} {"train_loss": -6.83519983291626, "global_step": 139252, "epoch": 3315} {"train_loss": -6.7244367599487305, "global_step": 139253, "epoch": 3315} {"train_loss": -6.714609146118164, "global_step": 139254, "epoch": 3315} {"train_loss": -6.787816524505615, "global_step": 139255, "epoch": 3315} {"train_loss": -6.802778244018555, "global_step": 139256, "epoch": 3315} {"train_loss": -6.871336936950684, "global_step": 139257, "epoch": 3315} {"train_loss": -6.778406143188477, "global_step": 139258, "epoch": 3315} {"train_loss": -6.7783284187316895, "global_step": 139259, "epoch": 3315} {"train_loss": -6.8293914794921875, "global_step": 139260, "epoch": 3315} {"train_loss": -6.7310662269592285, "global_step": 139261, "epoch": 3315} {"train_loss": -6.743823051452637, "global_step": 139262, "epoch": 3315} {"train_loss": -6.85210657119751, "global_step": 139263, "epoch": 3315} {"train_loss": -6.7681474685668945, "global_step": 139264, "epoch": 3315} {"train_loss": -6.697544574737549, "global_step": 139265, "epoch": 3315} {"train_loss": -6.698768615722656, "global_step": 139266, "epoch": 3315} {"train_loss": -6.684349060058594, "global_step": 139267, "epoch": 3315} {"train_loss": -6.776195049285889, "global_step": 139268, "epoch": 3315} {"train_loss": -6.700593948364258, "global_step": 139269, "epoch": 3315} {"train_loss": -6.706448554992676, "global_step": 139270, "epoch": 3315} {"train_loss": -6.733375072479248, "global_step": 139271, "epoch": 3315, "val_loss": 67461.8125} {"train_loss": -6.749994277954102, "global_step": 139272, "epoch": 3316} {"train_loss": -6.777563095092773, "global_step": 139273, "epoch": 3316} {"train_loss": -6.692252159118652, "global_step": 139274, "epoch": 3316} {"train_loss": -6.6443891525268555, "global_step": 139275, "epoch": 3316} {"train_loss": -6.693380355834961, "global_step": 139276, "epoch": 3316} {"train_loss": -6.680902481079102, "global_step": 139277, "epoch": 3316} {"train_loss": -6.788165092468262, "global_step": 139278, "epoch": 3316} {"train_loss": -6.771801471710205, "global_step": 139279, "epoch": 3316} {"train_loss": -6.604574203491211, "global_step": 139280, "epoch": 3316} {"train_loss": -6.777891635894775, "global_step": 139281, "epoch": 3316} {"train_loss": -6.795791149139404, "global_step": 139282, "epoch": 3316} {"train_loss": -6.792671203613281, "global_step": 139283, "epoch": 3316} {"train_loss": -6.830235004425049, "global_step": 139284, "epoch": 3316} {"train_loss": -6.75098991394043, "global_step": 139285, "epoch": 3316} {"train_loss": -6.7975053787231445, "global_step": 139286, "epoch": 3316} {"train_loss": -6.831446647644043, "global_step": 139287, "epoch": 3316} {"train_loss": -6.777890682220459, "global_step": 139288, "epoch": 3316} {"train_loss": -6.740805149078369, "global_step": 139289, "epoch": 3316} {"train_loss": -6.700756072998047, "global_step": 139290, "epoch": 3316} {"train_loss": -6.572542190551758, "global_step": 139291, "epoch": 3316} {"train_loss": -6.8533101081848145, "global_step": 139292, "epoch": 3316} {"train_loss": -6.749335289001465, "global_step": 139293, "epoch": 3316} {"train_loss": -6.753190040588379, "global_step": 139294, "epoch": 3316} {"train_loss": -6.80100154876709, "global_step": 139295, "epoch": 3316} {"train_loss": -6.777541160583496, "global_step": 139296, "epoch": 3316} {"train_loss": -6.765359878540039, "global_step": 139297, "epoch": 3316} {"train_loss": -6.643064022064209, "global_step": 139298, "epoch": 3316} {"train_loss": -6.783954620361328, "global_step": 139299, "epoch": 3316} {"train_loss": -6.7220377922058105, "global_step": 139300, "epoch": 3316} {"train_loss": -6.628760814666748, "global_step": 139301, "epoch": 3316} {"train_loss": -6.740421772003174, "global_step": 139302, "epoch": 3316} {"train_loss": -6.742287635803223, "global_step": 139303, "epoch": 3316} {"train_loss": -6.677956581115723, "global_step": 139304, "epoch": 3316} {"train_loss": -6.813093185424805, "global_step": 139305, "epoch": 3316} {"train_loss": -6.794404983520508, "global_step": 139306, "epoch": 3316} {"train_loss": -6.668468475341797, "global_step": 139307, "epoch": 3316} {"train_loss": -6.773478031158447, "global_step": 139308, "epoch": 3316} {"train_loss": -6.893235683441162, "global_step": 139309, "epoch": 3316} {"train_loss": -6.830574989318848, "global_step": 139310, "epoch": 3316} {"train_loss": -6.738252639770508, "global_step": 139311, "epoch": 3316} {"train_loss": -6.6997528076171875, "global_step": 139312, "epoch": 3316} {"train_loss": -6.743015607198079, "global_step": 139313, "epoch": 3316, "val_loss": 67312.1796875} {"train_loss": -6.782705783843994, "global_step": 139314, "epoch": 3317} {"train_loss": -6.722667217254639, "global_step": 139315, "epoch": 3317} {"train_loss": -6.707808017730713, "global_step": 139316, "epoch": 3317} {"train_loss": -6.862083911895752, "global_step": 139317, "epoch": 3317} {"train_loss": -6.638524532318115, "global_step": 139318, "epoch": 3317} {"train_loss": -6.723814010620117, "global_step": 139319, "epoch": 3317} {"train_loss": -6.753386497497559, "global_step": 139320, "epoch": 3317} {"train_loss": -6.765196323394775, "global_step": 139321, "epoch": 3317} {"train_loss": -6.688955783843994, "global_step": 139322, "epoch": 3317} {"train_loss": -6.8029022216796875, "global_step": 139323, "epoch": 3317} {"train_loss": -6.754021644592285, "global_step": 139324, "epoch": 3317} {"train_loss": -6.777514934539795, "global_step": 139325, "epoch": 3317} {"train_loss": -6.838627338409424, "global_step": 139326, "epoch": 3317} {"train_loss": -6.786056041717529, "global_step": 139327, "epoch": 3317} {"train_loss": -6.796815872192383, "global_step": 139328, "epoch": 3317} {"train_loss": -6.80550479888916, "global_step": 139329, "epoch": 3317} {"train_loss": -6.821129322052002, "global_step": 139330, "epoch": 3317} {"train_loss": -6.739552021026611, "global_step": 139331, "epoch": 3317} {"train_loss": -6.754445552825928, "global_step": 139332, "epoch": 3317} {"train_loss": -6.765608787536621, "global_step": 139333, "epoch": 3317} {"train_loss": -6.7252116203308105, "global_step": 139334, "epoch": 3317} {"train_loss": -6.785914421081543, "global_step": 139335, "epoch": 3317} {"train_loss": -6.758156776428223, "global_step": 139336, "epoch": 3317} {"train_loss": -6.710577964782715, "global_step": 139337, "epoch": 3317} {"train_loss": -6.7421770095825195, "global_step": 139338, "epoch": 3317} {"train_loss": -6.741808891296387, "global_step": 139339, "epoch": 3317} {"train_loss": -6.6866350173950195, "global_step": 139340, "epoch": 3317} {"train_loss": -6.887757778167725, "global_step": 139341, "epoch": 3317} {"train_loss": -6.790951728820801, "global_step": 139342, "epoch": 3317} {"train_loss": -6.645575523376465, "global_step": 139343, "epoch": 3317} {"train_loss": -6.780840873718262, "global_step": 139344, "epoch": 3317} {"train_loss": -6.680920600891113, "global_step": 139345, "epoch": 3317} {"train_loss": -6.765401363372803, "global_step": 139346, "epoch": 3317} {"train_loss": -6.777989864349365, "global_step": 139347, "epoch": 3317} {"train_loss": -6.676628112792969, "global_step": 139348, "epoch": 3317} {"train_loss": -6.720268726348877, "global_step": 139349, "epoch": 3317} {"train_loss": -6.700457572937012, "global_step": 139350, "epoch": 3317} {"train_loss": -6.733746528625488, "global_step": 139351, "epoch": 3317} {"train_loss": -6.740857124328613, "global_step": 139352, "epoch": 3317} {"train_loss": -6.5955328941345215, "global_step": 139353, "epoch": 3317} {"train_loss": -6.755465507507324, "global_step": 139354, "epoch": 3317} {"train_loss": -6.749014241354806, "global_step": 139355, "epoch": 3317, "val_loss": 67413.9609375} {"train_loss": -6.700832843780518, "global_step": 139356, "epoch": 3318} {"train_loss": -6.799618721008301, "global_step": 139357, "epoch": 3318} {"train_loss": -6.755006790161133, "global_step": 139358, "epoch": 3318} {"train_loss": -6.775683879852295, "global_step": 139359, "epoch": 3318} {"train_loss": -6.719781875610352, "global_step": 139360, "epoch": 3318} {"train_loss": -6.681338310241699, "global_step": 139361, "epoch": 3318} {"train_loss": -6.611393928527832, "global_step": 139362, "epoch": 3318} {"train_loss": -6.6710662841796875, "global_step": 139363, "epoch": 3318} {"train_loss": -6.657625675201416, "global_step": 139364, "epoch": 3318} {"train_loss": -6.739383697509766, "global_step": 139365, "epoch": 3318} {"train_loss": -6.79358434677124, "global_step": 139366, "epoch": 3318} {"train_loss": -6.604876518249512, "global_step": 139367, "epoch": 3318} {"train_loss": -6.855694770812988, "global_step": 139368, "epoch": 3318} {"train_loss": -6.715965270996094, "global_step": 139369, "epoch": 3318} {"train_loss": -6.760970115661621, "global_step": 139370, "epoch": 3318} {"train_loss": -6.677155494689941, "global_step": 139371, "epoch": 3318} {"train_loss": -6.712868690490723, "global_step": 139372, "epoch": 3318} {"train_loss": -6.713181018829346, "global_step": 139373, "epoch": 3318} {"train_loss": -6.643153190612793, "global_step": 139374, "epoch": 3318} {"train_loss": -6.6722564697265625, "global_step": 139375, "epoch": 3318} {"train_loss": -6.573108673095703, "global_step": 139376, "epoch": 3318} {"train_loss": -6.626989364624023, "global_step": 139377, "epoch": 3318} {"train_loss": -6.674411773681641, "global_step": 139378, "epoch": 3318} {"train_loss": -6.685518264770508, "global_step": 139379, "epoch": 3318} {"train_loss": -6.696171283721924, "global_step": 139380, "epoch": 3318} {"train_loss": -6.716702461242676, "global_step": 139381, "epoch": 3318} {"train_loss": -6.655290126800537, "global_step": 139382, "epoch": 3318} {"train_loss": -6.813162803649902, "global_step": 139383, "epoch": 3318} {"train_loss": -6.705744743347168, "global_step": 139384, "epoch": 3318} {"train_loss": -6.621146202087402, "global_step": 139385, "epoch": 3318} {"train_loss": -6.740169525146484, "global_step": 139386, "epoch": 3318} {"train_loss": -6.663649559020996, "global_step": 139387, "epoch": 3318} {"train_loss": -6.733577251434326, "global_step": 139388, "epoch": 3318} {"train_loss": -6.619244575500488, "global_step": 139389, "epoch": 3318} {"train_loss": -6.706942558288574, "global_step": 139390, "epoch": 3318} {"train_loss": -6.786890029907227, "global_step": 139391, "epoch": 3318} {"train_loss": -6.624020099639893, "global_step": 139392, "epoch": 3318} {"train_loss": -6.739013671875, "global_step": 139393, "epoch": 3318} {"train_loss": -6.608074188232422, "global_step": 139394, "epoch": 3318} {"train_loss": -6.715235710144043, "global_step": 139395, "epoch": 3318} {"train_loss": -6.687337875366211, "global_step": 139396, "epoch": 3318} {"train_loss": -6.7019189312344505, "global_step": 139397, "epoch": 3318, "val_loss": 67348.7109375} {"train_loss": -6.760750770568848, "global_step": 139398, "epoch": 3319} {"train_loss": -6.753482341766357, "global_step": 139399, "epoch": 3319} {"train_loss": -6.663336753845215, "global_step": 139400, "epoch": 3319} {"train_loss": -6.642559051513672, "global_step": 139401, "epoch": 3319} {"train_loss": -6.705024242401123, "global_step": 139402, "epoch": 3319} {"train_loss": -6.787126064300537, "global_step": 139403, "epoch": 3319} {"train_loss": -6.669003963470459, "global_step": 139404, "epoch": 3319} {"train_loss": -6.541391849517822, "global_step": 139405, "epoch": 3319} {"train_loss": -6.69944429397583, "global_step": 139406, "epoch": 3319} {"train_loss": -6.766561031341553, "global_step": 139407, "epoch": 3319} {"train_loss": -6.778052806854248, "global_step": 139408, "epoch": 3319} {"train_loss": -6.64996337890625, "global_step": 139409, "epoch": 3319} {"train_loss": -6.797532558441162, "global_step": 139410, "epoch": 3319} {"train_loss": -6.652957916259766, "global_step": 139411, "epoch": 3319} {"train_loss": -6.764680862426758, "global_step": 139412, "epoch": 3319} {"train_loss": -6.743250846862793, "global_step": 139413, "epoch": 3319} {"train_loss": -6.642935752868652, "global_step": 139414, "epoch": 3319} {"train_loss": -6.756122589111328, "global_step": 139415, "epoch": 3319} {"train_loss": -6.772488594055176, "global_step": 139416, "epoch": 3319} {"train_loss": -6.763915061950684, "global_step": 139417, "epoch": 3319} {"train_loss": -6.834799289703369, "global_step": 139418, "epoch": 3319} {"train_loss": -6.7623796463012695, "global_step": 139419, "epoch": 3319} {"train_loss": -6.749852180480957, "global_step": 139420, "epoch": 3319} {"train_loss": -6.744412899017334, "global_step": 139421, "epoch": 3319} {"train_loss": -6.867925643920898, "global_step": 139422, "epoch": 3319} {"train_loss": -6.71368408203125, "global_step": 139423, "epoch": 3319} {"train_loss": -6.7131805419921875, "global_step": 139424, "epoch": 3319} {"train_loss": -6.831546783447266, "global_step": 139425, "epoch": 3319} {"train_loss": -6.727082252502441, "global_step": 139426, "epoch": 3319} {"train_loss": -6.750011920928955, "global_step": 139427, "epoch": 3319} {"train_loss": -6.839890956878662, "global_step": 139428, "epoch": 3319} {"train_loss": -6.813060760498047, "global_step": 139429, "epoch": 3319} {"train_loss": -6.702204704284668, "global_step": 139430, "epoch": 3319} {"train_loss": -6.7599334716796875, "global_step": 139431, "epoch": 3319} {"train_loss": -6.696296215057373, "global_step": 139432, "epoch": 3319} {"train_loss": -6.695432186126709, "global_step": 139433, "epoch": 3319} {"train_loss": -6.7134904861450195, "global_step": 139434, "epoch": 3319} {"train_loss": -6.814095497131348, "global_step": 139435, "epoch": 3319} {"train_loss": -6.807680130004883, "global_step": 139436, "epoch": 3319} {"train_loss": -6.771344184875488, "global_step": 139437, "epoch": 3319} {"train_loss": -6.816042900085449, "global_step": 139438, "epoch": 3319} {"train_loss": -6.742702268418812, "global_step": 139439, "epoch": 3319, "val_loss": 67178.53125} {"train_loss": -6.847400665283203, "global_step": 139440, "epoch": 3320} {"train_loss": -6.837153434753418, "global_step": 139441, "epoch": 3320} {"train_loss": -6.741216659545898, "global_step": 139442, "epoch": 3320} {"train_loss": -6.930136203765869, "global_step": 139443, "epoch": 3320} {"train_loss": -6.931595802307129, "global_step": 139444, "epoch": 3320} {"train_loss": -6.7582879066467285, "global_step": 139445, "epoch": 3320} {"train_loss": -6.855708122253418, "global_step": 139446, "epoch": 3320} {"train_loss": -6.73961877822876, "global_step": 139447, "epoch": 3320} {"train_loss": -6.712676048278809, "global_step": 139448, "epoch": 3320} {"train_loss": -6.798246383666992, "global_step": 139449, "epoch": 3320} {"train_loss": -6.783343315124512, "global_step": 139450, "epoch": 3320} {"train_loss": -6.710755348205566, "global_step": 139451, "epoch": 3320} {"train_loss": -6.7308030128479, "global_step": 139452, "epoch": 3320} {"train_loss": -6.849539756774902, "global_step": 139453, "epoch": 3320} {"train_loss": -6.6290788650512695, "global_step": 139454, "epoch": 3320} {"train_loss": -6.7685866355896, "global_step": 139455, "epoch": 3320} {"train_loss": -6.717529296875, "global_step": 139456, "epoch": 3320} {"train_loss": -6.7351484298706055, "global_step": 139457, "epoch": 3320} {"train_loss": -6.830277919769287, "global_step": 139458, "epoch": 3320} {"train_loss": -6.732362747192383, "global_step": 139459, "epoch": 3320} {"train_loss": -6.793664932250977, "global_step": 139460, "epoch": 3320} {"train_loss": -6.697748184204102, "global_step": 139461, "epoch": 3320} {"train_loss": -6.72553825378418, "global_step": 139462, "epoch": 3320} {"train_loss": -6.669738292694092, "global_step": 139463, "epoch": 3320} {"train_loss": -6.659994125366211, "global_step": 139464, "epoch": 3320} {"train_loss": -6.691608428955078, "global_step": 139465, "epoch": 3320} {"train_loss": -6.825211524963379, "global_step": 139466, "epoch": 3320} {"train_loss": -6.738672256469727, "global_step": 139467, "epoch": 3320} {"train_loss": -6.749477386474609, "global_step": 139468, "epoch": 3320} {"train_loss": -6.721022605895996, "global_step": 139469, "epoch": 3320} {"train_loss": -6.7035932540893555, "global_step": 139470, "epoch": 3320} {"train_loss": -6.751593589782715, "global_step": 139471, "epoch": 3320} {"train_loss": -6.722588062286377, "global_step": 139472, "epoch": 3320} {"train_loss": -6.803037643432617, "global_step": 139473, "epoch": 3320} {"train_loss": -6.728427410125732, "global_step": 139474, "epoch": 3320} {"train_loss": -6.59915018081665, "global_step": 139475, "epoch": 3320} {"train_loss": -6.654881477355957, "global_step": 139476, "epoch": 3320} {"train_loss": -6.734405517578125, "global_step": 139477, "epoch": 3320} {"train_loss": -6.778558254241943, "global_step": 139478, "epoch": 3320} {"train_loss": -6.756504058837891, "global_step": 139479, "epoch": 3320} {"train_loss": -6.8340373039245605, "global_step": 139480, "epoch": 3320} {"train_loss": -6.755824827012562, "global_step": 139481, "epoch": 3320, "val_loss": 67256.7734375} {"train_loss": -6.844715595245361, "global_step": 139482, "epoch": 3321} {"train_loss": -6.752256393432617, "global_step": 139483, "epoch": 3321} {"train_loss": -6.824872970581055, "global_step": 139484, "epoch": 3321} {"train_loss": -6.858034133911133, "global_step": 139485, "epoch": 3321} {"train_loss": -6.801051139831543, "global_step": 139486, "epoch": 3321} {"train_loss": -6.795819282531738, "global_step": 139487, "epoch": 3321} {"train_loss": -6.874013423919678, "global_step": 139488, "epoch": 3321} {"train_loss": -6.854741096496582, "global_step": 139489, "epoch": 3321} {"train_loss": -6.795192718505859, "global_step": 139490, "epoch": 3321} {"train_loss": -6.810813903808594, "global_step": 139491, "epoch": 3321} {"train_loss": -6.712831497192383, "global_step": 139492, "epoch": 3321} {"train_loss": -6.812294960021973, "global_step": 139493, "epoch": 3321} {"train_loss": -6.799184799194336, "global_step": 139494, "epoch": 3321} {"train_loss": -6.776569843292236, "global_step": 139495, "epoch": 3321} {"train_loss": -6.803542137145996, "global_step": 139496, "epoch": 3321} {"train_loss": -6.897357940673828, "global_step": 139497, "epoch": 3321} {"train_loss": -6.810655117034912, "global_step": 139498, "epoch": 3321} {"train_loss": -6.834111213684082, "global_step": 139499, "epoch": 3321} {"train_loss": -6.607571601867676, "global_step": 139500, "epoch": 3321} {"train_loss": -6.6516265869140625, "global_step": 139501, "epoch": 3321} {"train_loss": -6.7977423667907715, "global_step": 139502, "epoch": 3321} {"train_loss": -6.846883773803711, "global_step": 139503, "epoch": 3321} {"train_loss": -6.780674934387207, "global_step": 139504, "epoch": 3321} {"train_loss": -6.782109260559082, "global_step": 139505, "epoch": 3321} {"train_loss": -6.788142204284668, "global_step": 139506, "epoch": 3321} {"train_loss": -6.859676837921143, "global_step": 139507, "epoch": 3321} {"train_loss": -6.808126449584961, "global_step": 139508, "epoch": 3321} {"train_loss": -6.810723304748535, "global_step": 139509, "epoch": 3321} {"train_loss": -6.841283798217773, "global_step": 139510, "epoch": 3321} {"train_loss": -6.79157829284668, "global_step": 139511, "epoch": 3321} {"train_loss": -6.799422264099121, "global_step": 139512, "epoch": 3321} {"train_loss": -6.862504482269287, "global_step": 139513, "epoch": 3321} {"train_loss": -6.737136363983154, "global_step": 139514, "epoch": 3321} {"train_loss": -6.825311183929443, "global_step": 139515, "epoch": 3321} {"train_loss": -6.697904586791992, "global_step": 139516, "epoch": 3321} {"train_loss": -6.7521748542785645, "global_step": 139517, "epoch": 3321} {"train_loss": -6.826836585998535, "global_step": 139518, "epoch": 3321} {"train_loss": -6.832223892211914, "global_step": 139519, "epoch": 3321} {"train_loss": -6.812304973602295, "global_step": 139520, "epoch": 3321} {"train_loss": -6.824892520904541, "global_step": 139521, "epoch": 3321} {"train_loss": -6.684128761291504, "global_step": 139522, "epoch": 3321} {"train_loss": -6.79595931371053, "global_step": 139523, "epoch": 3321, "val_loss": 67149.46875} {"train_loss": -6.796054840087891, "global_step": 139524, "epoch": 3322} {"train_loss": -6.720622539520264, "global_step": 139525, "epoch": 3322} {"train_loss": -6.811001777648926, "global_step": 139526, "epoch": 3322} {"train_loss": -6.722723007202148, "global_step": 139527, "epoch": 3322} {"train_loss": -6.704132556915283, "global_step": 139528, "epoch": 3322} {"train_loss": -6.745370864868164, "global_step": 139529, "epoch": 3322} {"train_loss": -6.774937629699707, "global_step": 139530, "epoch": 3322} {"train_loss": -6.834408760070801, "global_step": 139531, "epoch": 3322} {"train_loss": -6.808404922485352, "global_step": 139532, "epoch": 3322} {"train_loss": -6.838005065917969, "global_step": 139533, "epoch": 3322} {"train_loss": -6.855005741119385, "global_step": 139534, "epoch": 3322} {"train_loss": -6.7834014892578125, "global_step": 139535, "epoch": 3322} {"train_loss": -6.833809852600098, "global_step": 139536, "epoch": 3322} {"train_loss": -6.706745147705078, "global_step": 139537, "epoch": 3322} {"train_loss": -6.7766804695129395, "global_step": 139538, "epoch": 3322} {"train_loss": -6.771907806396484, "global_step": 139539, "epoch": 3322} {"train_loss": -6.817095756530762, "global_step": 139540, "epoch": 3322} {"train_loss": -6.769593238830566, "global_step": 139541, "epoch": 3322} {"train_loss": -6.781126499176025, "global_step": 139542, "epoch": 3322} {"train_loss": -6.755815505981445, "global_step": 139543, "epoch": 3322} {"train_loss": -6.844264984130859, "global_step": 139544, "epoch": 3322} {"train_loss": -6.86759090423584, "global_step": 139545, "epoch": 3322} {"train_loss": -6.7933268547058105, "global_step": 139546, "epoch": 3322} {"train_loss": -6.618619918823242, "global_step": 139547, "epoch": 3322} {"train_loss": -6.777351379394531, "global_step": 139548, "epoch": 3322} {"train_loss": -6.678933620452881, "global_step": 139549, "epoch": 3322} {"train_loss": -6.71090030670166, "global_step": 139550, "epoch": 3322} {"train_loss": -6.763915061950684, "global_step": 139551, "epoch": 3322} {"train_loss": -6.738870620727539, "global_step": 139552, "epoch": 3322} {"train_loss": -6.8216552734375, "global_step": 139553, "epoch": 3322} {"train_loss": -6.688416004180908, "global_step": 139554, "epoch": 3322} {"train_loss": -6.7377824783325195, "global_step": 139555, "epoch": 3322} {"train_loss": -6.656094551086426, "global_step": 139556, "epoch": 3322} {"train_loss": -6.693951606750488, "global_step": 139557, "epoch": 3322} {"train_loss": -6.648317337036133, "global_step": 139558, "epoch": 3322} {"train_loss": -6.649637222290039, "global_step": 139559, "epoch": 3322} {"train_loss": -6.717647552490234, "global_step": 139560, "epoch": 3322} {"train_loss": -6.682538032531738, "global_step": 139561, "epoch": 3322} {"train_loss": -6.816667079925537, "global_step": 139562, "epoch": 3322} {"train_loss": -6.642492294311523, "global_step": 139563, "epoch": 3322} {"train_loss": -6.734060287475586, "global_step": 139564, "epoch": 3322} {"train_loss": -6.754698685237339, "global_step": 139565, "epoch": 3322, "val_loss": 67386.71875} {"train_loss": -6.746774673461914, "global_step": 139566, "epoch": 3323} {"train_loss": -6.747632026672363, "global_step": 139567, "epoch": 3323} {"train_loss": -6.803461074829102, "global_step": 139568, "epoch": 3323} {"train_loss": -6.788459777832031, "global_step": 139569, "epoch": 3323} {"train_loss": -6.841675758361816, "global_step": 139570, "epoch": 3323} {"train_loss": -6.807269096374512, "global_step": 139571, "epoch": 3323} {"train_loss": -6.777100086212158, "global_step": 139572, "epoch": 3323} {"train_loss": -6.899590492248535, "global_step": 139573, "epoch": 3323} {"train_loss": -6.754793643951416, "global_step": 139574, "epoch": 3323} {"train_loss": -6.74896240234375, "global_step": 139575, "epoch": 3323} {"train_loss": -6.750117778778076, "global_step": 139576, "epoch": 3323} {"train_loss": -6.814908027648926, "global_step": 139577, "epoch": 3323} {"train_loss": -6.834868431091309, "global_step": 139578, "epoch": 3323} {"train_loss": -6.745084285736084, "global_step": 139579, "epoch": 3323} {"train_loss": -6.73148250579834, "global_step": 139580, "epoch": 3323} {"train_loss": -6.719877243041992, "global_step": 139581, "epoch": 3323} {"train_loss": -6.878592491149902, "global_step": 139582, "epoch": 3323} {"train_loss": -6.81187629699707, "global_step": 139583, "epoch": 3323} {"train_loss": -6.751880645751953, "global_step": 139584, "epoch": 3323} {"train_loss": -6.741619110107422, "global_step": 139585, "epoch": 3323} {"train_loss": -6.8173627853393555, "global_step": 139586, "epoch": 3323} {"train_loss": -6.826264381408691, "global_step": 139587, "epoch": 3323} {"train_loss": -6.703888416290283, "global_step": 139588, "epoch": 3323} {"train_loss": -6.870415687561035, "global_step": 139589, "epoch": 3323} {"train_loss": -6.718781471252441, "global_step": 139590, "epoch": 3323} {"train_loss": -6.865215301513672, "global_step": 139591, "epoch": 3323} {"train_loss": -6.844066619873047, "global_step": 139592, "epoch": 3323} {"train_loss": -6.714714050292969, "global_step": 139593, "epoch": 3323} {"train_loss": -6.807608127593994, "global_step": 139594, "epoch": 3323} {"train_loss": -6.777114391326904, "global_step": 139595, "epoch": 3323} {"train_loss": -6.764202117919922, "global_step": 139596, "epoch": 3323} {"train_loss": -6.843362331390381, "global_step": 139597, "epoch": 3323} {"train_loss": -6.805556297302246, "global_step": 139598, "epoch": 3323} {"train_loss": -6.761381149291992, "global_step": 139599, "epoch": 3323} {"train_loss": -6.8444719314575195, "global_step": 139600, "epoch": 3323} {"train_loss": -6.714056968688965, "global_step": 139601, "epoch": 3323} {"train_loss": -6.811338424682617, "global_step": 139602, "epoch": 3323} {"train_loss": -6.9095964431762695, "global_step": 139603, "epoch": 3323} {"train_loss": -6.848649024963379, "global_step": 139604, "epoch": 3323} {"train_loss": -6.819380760192871, "global_step": 139605, "epoch": 3323} {"train_loss": -6.783095359802246, "global_step": 139606, "epoch": 3323} {"train_loss": -6.794519356318882, "global_step": 139607, "epoch": 3323, "val_loss": 67261.96875} {"train_loss": -6.761144638061523, "global_step": 139608, "epoch": 3324} {"train_loss": -6.844760894775391, "global_step": 139609, "epoch": 3324} {"train_loss": -6.94345760345459, "global_step": 139610, "epoch": 3324} {"train_loss": -6.84431266784668, "global_step": 139611, "epoch": 3324} {"train_loss": -6.687824249267578, "global_step": 139612, "epoch": 3324} {"train_loss": -6.816554546356201, "global_step": 139613, "epoch": 3324} {"train_loss": -6.9111433029174805, "global_step": 139614, "epoch": 3324} {"train_loss": -6.851690292358398, "global_step": 139615, "epoch": 3324} {"train_loss": -6.749378204345703, "global_step": 139616, "epoch": 3324} {"train_loss": -6.87049674987793, "global_step": 139617, "epoch": 3324} {"train_loss": -6.867313861846924, "global_step": 139618, "epoch": 3324} {"train_loss": -6.89016056060791, "global_step": 139619, "epoch": 3324} {"train_loss": -6.827485084533691, "global_step": 139620, "epoch": 3324} {"train_loss": -6.739495277404785, "global_step": 139621, "epoch": 3324} {"train_loss": -6.690243721008301, "global_step": 139622, "epoch": 3324} {"train_loss": -6.6757612228393555, "global_step": 139623, "epoch": 3324} {"train_loss": -6.730410575866699, "global_step": 139624, "epoch": 3324} {"train_loss": -6.734804630279541, "global_step": 139625, "epoch": 3324} {"train_loss": -6.679704666137695, "global_step": 139626, "epoch": 3324} {"train_loss": -6.756804466247559, "global_step": 139627, "epoch": 3324} {"train_loss": -6.739757537841797, "global_step": 139628, "epoch": 3324} {"train_loss": -6.689372539520264, "global_step": 139629, "epoch": 3324} {"train_loss": -6.726002216339111, "global_step": 139630, "epoch": 3324} {"train_loss": -6.716830730438232, "global_step": 139631, "epoch": 3324} {"train_loss": -6.681023597717285, "global_step": 139632, "epoch": 3324} {"train_loss": -6.824759483337402, "global_step": 139633, "epoch": 3324} {"train_loss": -6.738308906555176, "global_step": 139634, "epoch": 3324} {"train_loss": -6.590915679931641, "global_step": 139635, "epoch": 3324} {"train_loss": -6.684438705444336, "global_step": 139636, "epoch": 3324} {"train_loss": -6.746547698974609, "global_step": 139637, "epoch": 3324} {"train_loss": -6.771660804748535, "global_step": 139638, "epoch": 3324} {"train_loss": -6.752972602844238, "global_step": 139639, "epoch": 3324} {"train_loss": -6.830441474914551, "global_step": 139640, "epoch": 3324} {"train_loss": -6.789065837860107, "global_step": 139641, "epoch": 3324} {"train_loss": -6.822391510009766, "global_step": 139642, "epoch": 3324} {"train_loss": -6.7350006103515625, "global_step": 139643, "epoch": 3324} {"train_loss": -6.796268463134766, "global_step": 139644, "epoch": 3324} {"train_loss": -6.7629804611206055, "global_step": 139645, "epoch": 3324} {"train_loss": -6.730325698852539, "global_step": 139646, "epoch": 3324} {"train_loss": -6.902374267578125, "global_step": 139647, "epoch": 3324} {"train_loss": -6.7686309814453125, "global_step": 139648, "epoch": 3324} {"train_loss": -6.77106625693185, "global_step": 139649, "epoch": 3324, "val_loss": 67195.7109375} {"train_loss": -6.697482585906982, "global_step": 139650, "epoch": 3325} {"train_loss": -6.800354480743408, "global_step": 139651, "epoch": 3325} {"train_loss": -6.798667907714844, "global_step": 139652, "epoch": 3325} {"train_loss": -6.663064956665039, "global_step": 139653, "epoch": 3325} {"train_loss": -6.678971290588379, "global_step": 139654, "epoch": 3325} {"train_loss": -6.564810276031494, "global_step": 139655, "epoch": 3325} {"train_loss": -6.7476959228515625, "global_step": 139656, "epoch": 3325} {"train_loss": -6.641852855682373, "global_step": 139657, "epoch": 3325} {"train_loss": -6.7306013107299805, "global_step": 139658, "epoch": 3325} {"train_loss": -6.714187145233154, "global_step": 139659, "epoch": 3325} {"train_loss": -6.709348201751709, "global_step": 139660, "epoch": 3325} {"train_loss": -6.664361000061035, "global_step": 139661, "epoch": 3325} {"train_loss": -6.581124305725098, "global_step": 139662, "epoch": 3325} {"train_loss": -6.722036361694336, "global_step": 139663, "epoch": 3325} {"train_loss": -6.689878463745117, "global_step": 139664, "epoch": 3325} {"train_loss": -6.764379501342773, "global_step": 139665, "epoch": 3325} {"train_loss": -6.7836456298828125, "global_step": 139666, "epoch": 3325} {"train_loss": -6.685212135314941, "global_step": 139667, "epoch": 3325} {"train_loss": -6.652524948120117, "global_step": 139668, "epoch": 3325} {"train_loss": -6.704070568084717, "global_step": 139669, "epoch": 3325} {"train_loss": -6.735343933105469, "global_step": 139670, "epoch": 3325} {"train_loss": -6.736896991729736, "global_step": 139671, "epoch": 3325} {"train_loss": -6.868776321411133, "global_step": 139672, "epoch": 3325} {"train_loss": -6.727328300476074, "global_step": 139673, "epoch": 3325} {"train_loss": -6.775957107543945, "global_step": 139674, "epoch": 3325} {"train_loss": -6.772747993469238, "global_step": 139675, "epoch": 3325} {"train_loss": -6.822829723358154, "global_step": 139676, "epoch": 3325} {"train_loss": -6.740142345428467, "global_step": 139677, "epoch": 3325} {"train_loss": -6.88092041015625, "global_step": 139678, "epoch": 3325} {"train_loss": -6.735791206359863, "global_step": 139679, "epoch": 3325} {"train_loss": -6.812901496887207, "global_step": 139680, "epoch": 3325} {"train_loss": -6.787805557250977, "global_step": 139681, "epoch": 3325} {"train_loss": -6.809479713439941, "global_step": 139682, "epoch": 3325} {"train_loss": -6.830336570739746, "global_step": 139683, "epoch": 3325} {"train_loss": -6.757585048675537, "global_step": 139684, "epoch": 3325} {"train_loss": -6.641054153442383, "global_step": 139685, "epoch": 3325} {"train_loss": -6.705166816711426, "global_step": 139686, "epoch": 3325} {"train_loss": -6.818380355834961, "global_step": 139687, "epoch": 3325} {"train_loss": -6.6903181076049805, "global_step": 139688, "epoch": 3325} {"train_loss": -6.615485668182373, "global_step": 139689, "epoch": 3325} {"train_loss": -6.7538628578186035, "global_step": 139690, "epoch": 3325} {"train_loss": -6.729617561612811, "global_step": 139691, "epoch": 3325, "val_loss": 67326.4375} {"train_loss": -6.755433559417725, "global_step": 139692, "epoch": 3326} {"train_loss": -6.75881290435791, "global_step": 139693, "epoch": 3326} {"train_loss": -6.725287914276123, "global_step": 139694, "epoch": 3326} {"train_loss": -6.78986930847168, "global_step": 139695, "epoch": 3326} {"train_loss": -6.768895149230957, "global_step": 139696, "epoch": 3326} {"train_loss": -6.711545944213867, "global_step": 139697, "epoch": 3326} {"train_loss": -6.737152099609375, "global_step": 139698, "epoch": 3326} {"train_loss": -6.681265830993652, "global_step": 139699, "epoch": 3326} {"train_loss": -6.827211380004883, "global_step": 139700, "epoch": 3326} {"train_loss": -6.761490821838379, "global_step": 139701, "epoch": 3326} {"train_loss": -6.747079849243164, "global_step": 139702, "epoch": 3326} {"train_loss": -6.793999671936035, "global_step": 139703, "epoch": 3326} {"train_loss": -6.784631729125977, "global_step": 139704, "epoch": 3326} {"train_loss": -6.959684371948242, "global_step": 139705, "epoch": 3326} {"train_loss": -6.832255840301514, "global_step": 139706, "epoch": 3326} {"train_loss": -6.716400146484375, "global_step": 139707, "epoch": 3326} {"train_loss": -6.7923197746276855, "global_step": 139708, "epoch": 3326} {"train_loss": -6.86106014251709, "global_step": 139709, "epoch": 3326} {"train_loss": -6.623380184173584, "global_step": 139710, "epoch": 3326} {"train_loss": -6.843712329864502, "global_step": 139711, "epoch": 3326} {"train_loss": -6.789780616760254, "global_step": 139712, "epoch": 3326} {"train_loss": -6.777008533477783, "global_step": 139713, "epoch": 3326} {"train_loss": -6.769748210906982, "global_step": 139714, "epoch": 3326} {"train_loss": -6.778839111328125, "global_step": 139715, "epoch": 3326} {"train_loss": -6.831272125244141, "global_step": 139716, "epoch": 3326} {"train_loss": -6.774867057800293, "global_step": 139717, "epoch": 3326} {"train_loss": -6.721797943115234, "global_step": 139718, "epoch": 3326} {"train_loss": -6.7744903564453125, "global_step": 139719, "epoch": 3326} {"train_loss": -6.762112617492676, "global_step": 139720, "epoch": 3326} {"train_loss": -6.755173683166504, "global_step": 139721, "epoch": 3326} {"train_loss": -6.804744720458984, "global_step": 139722, "epoch": 3326} {"train_loss": -6.868132591247559, "global_step": 139723, "epoch": 3326} {"train_loss": -6.777376651763916, "global_step": 139724, "epoch": 3326} {"train_loss": -6.789394378662109, "global_step": 139725, "epoch": 3326} {"train_loss": -6.811615467071533, "global_step": 139726, "epoch": 3326} {"train_loss": -6.765578269958496, "global_step": 139727, "epoch": 3326} {"train_loss": -6.800846099853516, "global_step": 139728, "epoch": 3326} {"train_loss": -6.834112644195557, "global_step": 139729, "epoch": 3326} {"train_loss": -6.769536018371582, "global_step": 139730, "epoch": 3326} {"train_loss": -6.786409854888916, "global_step": 139731, "epoch": 3326} {"train_loss": -6.790101051330566, "global_step": 139732, "epoch": 3326} {"train_loss": -6.7790952410016745, "global_step": 139733, "epoch": 3326, "val_loss": 67251.5703125} {"train_loss": -6.796181678771973, "global_step": 139734, "epoch": 3327} {"train_loss": -6.6755170822143555, "global_step": 139735, "epoch": 3327} {"train_loss": -6.763306617736816, "global_step": 139736, "epoch": 3327} {"train_loss": -6.795902252197266, "global_step": 139737, "epoch": 3327} {"train_loss": -6.914815425872803, "global_step": 139738, "epoch": 3327} {"train_loss": -6.803743362426758, "global_step": 139739, "epoch": 3327} {"train_loss": -6.723414897918701, "global_step": 139740, "epoch": 3327} {"train_loss": -6.624728202819824, "global_step": 139741, "epoch": 3327} {"train_loss": -6.897701740264893, "global_step": 139742, "epoch": 3327} {"train_loss": -6.779507160186768, "global_step": 139743, "epoch": 3327} {"train_loss": -6.713910102844238, "global_step": 139744, "epoch": 3327} {"train_loss": -6.7306060791015625, "global_step": 139745, "epoch": 3327} {"train_loss": -6.79990291595459, "global_step": 139746, "epoch": 3327} {"train_loss": -6.708510398864746, "global_step": 139747, "epoch": 3327} {"train_loss": -6.69879150390625, "global_step": 139748, "epoch": 3327} {"train_loss": -6.668498992919922, "global_step": 139749, "epoch": 3327} {"train_loss": -6.38594388961792, "global_step": 139750, "epoch": 3327} {"train_loss": -6.740993976593018, "global_step": 139751, "epoch": 3327} {"train_loss": -6.640705108642578, "global_step": 139752, "epoch": 3327} {"train_loss": -6.7353692054748535, "global_step": 139753, "epoch": 3327} {"train_loss": -6.793102741241455, "global_step": 139754, "epoch": 3327} {"train_loss": -6.722944259643555, "global_step": 139755, "epoch": 3327} {"train_loss": -6.59792423248291, "global_step": 139756, "epoch": 3327} {"train_loss": -6.600470542907715, "global_step": 139757, "epoch": 3327} {"train_loss": -6.664134979248047, "global_step": 139758, "epoch": 3327} {"train_loss": -6.719307899475098, "global_step": 139759, "epoch": 3327} {"train_loss": -6.694225788116455, "global_step": 139760, "epoch": 3327} {"train_loss": -6.759509086608887, "global_step": 139761, "epoch": 3327} {"train_loss": -6.6478800773620605, "global_step": 139762, "epoch": 3327} {"train_loss": -6.757114410400391, "global_step": 139763, "epoch": 3327} {"train_loss": -6.575685501098633, "global_step": 139764, "epoch": 3327} {"train_loss": -6.715203285217285, "global_step": 139765, "epoch": 3327} {"train_loss": -6.597586154937744, "global_step": 139766, "epoch": 3327} {"train_loss": -6.700885772705078, "global_step": 139767, "epoch": 3327} {"train_loss": -6.658735275268555, "global_step": 139768, "epoch": 3327} {"train_loss": -6.494985103607178, "global_step": 139769, "epoch": 3327} {"train_loss": -6.768518447875977, "global_step": 139770, "epoch": 3327} {"train_loss": -6.531835556030273, "global_step": 139771, "epoch": 3327} {"train_loss": -6.554261684417725, "global_step": 139772, "epoch": 3327} {"train_loss": -6.595681190490723, "global_step": 139773, "epoch": 3327} {"train_loss": -6.67430305480957, "global_step": 139774, "epoch": 3327} {"train_loss": -6.689893336523147, "global_step": 139775, "epoch": 3327, "val_loss": 67210.171875} {"train_loss": -6.677361011505127, "global_step": 139776, "epoch": 3328} {"train_loss": -6.568325519561768, "global_step": 139777, "epoch": 3328} {"train_loss": -6.700441360473633, "global_step": 139778, "epoch": 3328} {"train_loss": -6.636704444885254, "global_step": 139779, "epoch": 3328} {"train_loss": -6.806075572967529, "global_step": 139780, "epoch": 3328} {"train_loss": -6.777978420257568, "global_step": 139781, "epoch": 3328} {"train_loss": -6.640743255615234, "global_step": 139782, "epoch": 3328} {"train_loss": -6.728580474853516, "global_step": 139783, "epoch": 3328} {"train_loss": -6.692648887634277, "global_step": 139784, "epoch": 3328} {"train_loss": -6.764307975769043, "global_step": 139785, "epoch": 3328} {"train_loss": -6.649775981903076, "global_step": 139786, "epoch": 3328} {"train_loss": -6.8518385887146, "global_step": 139787, "epoch": 3328} {"train_loss": -6.748130798339844, "global_step": 139788, "epoch": 3328} {"train_loss": -6.780705451965332, "global_step": 139789, "epoch": 3328} {"train_loss": -6.603844165802002, "global_step": 139790, "epoch": 3328} {"train_loss": -6.7446184158325195, "global_step": 139791, "epoch": 3328} {"train_loss": -6.663295745849609, "global_step": 139792, "epoch": 3328} {"train_loss": -6.7513628005981445, "global_step": 139793, "epoch": 3328} {"train_loss": -6.811110973358154, "global_step": 139794, "epoch": 3328} {"train_loss": -6.656105041503906, "global_step": 139795, "epoch": 3328} {"train_loss": -6.6817545890808105, "global_step": 139796, "epoch": 3328} {"train_loss": -6.722556114196777, "global_step": 139797, "epoch": 3328} {"train_loss": -6.7386980056762695, "global_step": 139798, "epoch": 3328} {"train_loss": -6.812384605407715, "global_step": 139799, "epoch": 3328} {"train_loss": -6.708362579345703, "global_step": 139800, "epoch": 3328} {"train_loss": -6.867825984954834, "global_step": 139801, "epoch": 3328} {"train_loss": -6.7129082679748535, "global_step": 139802, "epoch": 3328} {"train_loss": -6.850757122039795, "global_step": 139803, "epoch": 3328} {"train_loss": -6.729850769042969, "global_step": 139804, "epoch": 3328} {"train_loss": -6.722256660461426, "global_step": 139805, "epoch": 3328} {"train_loss": -6.773505210876465, "global_step": 139806, "epoch": 3328} {"train_loss": -6.746970176696777, "global_step": 139807, "epoch": 3328} {"train_loss": -6.794734001159668, "global_step": 139808, "epoch": 3328} {"train_loss": -6.762848854064941, "global_step": 139809, "epoch": 3328} {"train_loss": -6.691675662994385, "global_step": 139810, "epoch": 3328} {"train_loss": -6.8128228187561035, "global_step": 139811, "epoch": 3328} {"train_loss": -6.726314067840576, "global_step": 139812, "epoch": 3328} {"train_loss": -6.6973419189453125, "global_step": 139813, "epoch": 3328} {"train_loss": -6.698138236999512, "global_step": 139814, "epoch": 3328} {"train_loss": -6.775384902954102, "global_step": 139815, "epoch": 3328} {"train_loss": -6.8142852783203125, "global_step": 139816, "epoch": 3328} {"train_loss": -6.7343036106654575, "global_step": 139817, "epoch": 3328, "val_loss": 67152.0078125} {"train_loss": -6.813525199890137, "global_step": 139818, "epoch": 3329} {"train_loss": -6.894381523132324, "global_step": 139819, "epoch": 3329} {"train_loss": -6.74279260635376, "global_step": 139820, "epoch": 3329} {"train_loss": -6.778496265411377, "global_step": 139821, "epoch": 3329} {"train_loss": -6.8241682052612305, "global_step": 139822, "epoch": 3329} {"train_loss": -6.761168956756592, "global_step": 139823, "epoch": 3329} {"train_loss": -6.876529216766357, "global_step": 139824, "epoch": 3329} {"train_loss": -6.7739105224609375, "global_step": 139825, "epoch": 3329} {"train_loss": -6.829707622528076, "global_step": 139826, "epoch": 3329} {"train_loss": -6.870199203491211, "global_step": 139827, "epoch": 3329} {"train_loss": -6.7093400955200195, "global_step": 139828, "epoch": 3329} {"train_loss": -6.918623447418213, "global_step": 139829, "epoch": 3329} {"train_loss": -6.871843338012695, "global_step": 139830, "epoch": 3329} {"train_loss": -6.8316569328308105, "global_step": 139831, "epoch": 3329} {"train_loss": -6.839733123779297, "global_step": 139832, "epoch": 3329} {"train_loss": -6.858313083648682, "global_step": 139833, "epoch": 3329} {"train_loss": -6.8882527351379395, "global_step": 139834, "epoch": 3329} {"train_loss": -6.727713584899902, "global_step": 139835, "epoch": 3329} {"train_loss": -6.673997402191162, "global_step": 139836, "epoch": 3329} {"train_loss": -6.707808971405029, "global_step": 139837, "epoch": 3329} {"train_loss": -6.760169506072998, "global_step": 139838, "epoch": 3329} {"train_loss": -6.763403415679932, "global_step": 139839, "epoch": 3329} {"train_loss": -6.8019585609436035, "global_step": 139840, "epoch": 3329} {"train_loss": -6.739670753479004, "global_step": 139841, "epoch": 3329} {"train_loss": -6.7059736251831055, "global_step": 139842, "epoch": 3329} {"train_loss": -6.759459018707275, "global_step": 139843, "epoch": 3329} {"train_loss": -6.94895076751709, "global_step": 139844, "epoch": 3329} {"train_loss": -6.808299541473389, "global_step": 139845, "epoch": 3329} {"train_loss": -6.917885780334473, "global_step": 139846, "epoch": 3329} {"train_loss": -6.7517242431640625, "global_step": 139847, "epoch": 3329} {"train_loss": -6.876941680908203, "global_step": 139848, "epoch": 3329} {"train_loss": -6.687230110168457, "global_step": 139849, "epoch": 3329} {"train_loss": -6.829140663146973, "global_step": 139850, "epoch": 3329} {"train_loss": -6.751784324645996, "global_step": 139851, "epoch": 3329} {"train_loss": -6.778759956359863, "global_step": 139852, "epoch": 3329} {"train_loss": -6.736445426940918, "global_step": 139853, "epoch": 3329} {"train_loss": -6.886624336242676, "global_step": 139854, "epoch": 3329} {"train_loss": -6.8564629554748535, "global_step": 139855, "epoch": 3329} {"train_loss": -6.783155918121338, "global_step": 139856, "epoch": 3329} {"train_loss": -6.721383094787598, "global_step": 139857, "epoch": 3329} {"train_loss": -6.754018783569336, "global_step": 139858, "epoch": 3329} {"train_loss": -6.799140964235578, "global_step": 139859, "epoch": 3329, "val_loss": 67372.234375} {"train_loss": -6.694108009338379, "global_step": 139860, "epoch": 3330} {"train_loss": -6.8393449783325195, "global_step": 139861, "epoch": 3330} {"train_loss": -6.779960632324219, "global_step": 139862, "epoch": 3330} {"train_loss": -6.812002182006836, "global_step": 139863, "epoch": 3330} {"train_loss": -6.751766204833984, "global_step": 139864, "epoch": 3330} {"train_loss": -6.851234436035156, "global_step": 139865, "epoch": 3330} {"train_loss": -6.777575492858887, "global_step": 139866, "epoch": 3330} {"train_loss": -6.812058448791504, "global_step": 139867, "epoch": 3330} {"train_loss": -6.7558512687683105, "global_step": 139868, "epoch": 3330} {"train_loss": -6.722276210784912, "global_step": 139869, "epoch": 3330} {"train_loss": -6.802013874053955, "global_step": 139870, "epoch": 3330} {"train_loss": -6.71900749206543, "global_step": 139871, "epoch": 3330} {"train_loss": -6.778229713439941, "global_step": 139872, "epoch": 3330} {"train_loss": -6.825908660888672, "global_step": 139873, "epoch": 3330} {"train_loss": -6.7886762619018555, "global_step": 139874, "epoch": 3330} {"train_loss": -6.828488349914551, "global_step": 139875, "epoch": 3330} {"train_loss": -6.781686782836914, "global_step": 139876, "epoch": 3330} {"train_loss": -6.881941318511963, "global_step": 139877, "epoch": 3330} {"train_loss": -6.841896057128906, "global_step": 139878, "epoch": 3330} {"train_loss": -6.843852519989014, "global_step": 139879, "epoch": 3330} {"train_loss": -6.73944091796875, "global_step": 139880, "epoch": 3330} {"train_loss": -6.8449859619140625, "global_step": 139881, "epoch": 3330} {"train_loss": -6.737414360046387, "global_step": 139882, "epoch": 3330} {"train_loss": -6.775938034057617, "global_step": 139883, "epoch": 3330} {"train_loss": -6.8493242263793945, "global_step": 139884, "epoch": 3330} {"train_loss": -6.758805274963379, "global_step": 139885, "epoch": 3330} {"train_loss": -6.788190841674805, "global_step": 139886, "epoch": 3330} {"train_loss": -6.812796592712402, "global_step": 139887, "epoch": 3330} {"train_loss": -6.737643718719482, "global_step": 139888, "epoch": 3330} {"train_loss": -6.670124053955078, "global_step": 139889, "epoch": 3330} {"train_loss": -6.803065299987793, "global_step": 139890, "epoch": 3330} {"train_loss": -6.785134315490723, "global_step": 139891, "epoch": 3330} {"train_loss": -6.646129608154297, "global_step": 139892, "epoch": 3330} {"train_loss": -6.806222915649414, "global_step": 139893, "epoch": 3330} {"train_loss": -6.766874313354492, "global_step": 139894, "epoch": 3330} {"train_loss": -6.694445610046387, "global_step": 139895, "epoch": 3330} {"train_loss": -6.714106559753418, "global_step": 139896, "epoch": 3330} {"train_loss": -6.665359020233154, "global_step": 139897, "epoch": 3330} {"train_loss": -6.82659387588501, "global_step": 139898, "epoch": 3330} {"train_loss": -6.719215393066406, "global_step": 139899, "epoch": 3330} {"train_loss": -6.694392204284668, "global_step": 139900, "epoch": 3330} {"train_loss": -6.773405336198353, "global_step": 139901, "epoch": 3330, "val_loss": 67553.4609375} {"train_loss": -6.779549598693848, "global_step": 139902, "epoch": 3331} {"train_loss": -6.84107780456543, "global_step": 139903, "epoch": 3331} {"train_loss": -6.777410984039307, "global_step": 139904, "epoch": 3331} {"train_loss": -6.6376800537109375, "global_step": 139905, "epoch": 3331} {"train_loss": -6.797839164733887, "global_step": 139906, "epoch": 3331} {"train_loss": -6.75914192199707, "global_step": 139907, "epoch": 3331} {"train_loss": -6.616697311401367, "global_step": 139908, "epoch": 3331} {"train_loss": -6.665834903717041, "global_step": 139909, "epoch": 3331} {"train_loss": -6.607329368591309, "global_step": 139910, "epoch": 3331} {"train_loss": -6.743964195251465, "global_step": 139911, "epoch": 3331} {"train_loss": -6.686766624450684, "global_step": 139912, "epoch": 3331} {"train_loss": -6.643273830413818, "global_step": 139913, "epoch": 3331} {"train_loss": -6.823281288146973, "global_step": 139914, "epoch": 3331} {"train_loss": -6.754749774932861, "global_step": 139915, "epoch": 3331} {"train_loss": -6.7760114669799805, "global_step": 139916, "epoch": 3331} {"train_loss": -6.733042240142822, "global_step": 139917, "epoch": 3331} {"train_loss": -6.688321113586426, "global_step": 139918, "epoch": 3331} {"train_loss": -6.618346214294434, "global_step": 139919, "epoch": 3331} {"train_loss": -6.780302047729492, "global_step": 139920, "epoch": 3331} {"train_loss": -6.537267684936523, "global_step": 139921, "epoch": 3331} {"train_loss": -6.777462959289551, "global_step": 139922, "epoch": 3331} {"train_loss": -6.688032150268555, "global_step": 139923, "epoch": 3331} {"train_loss": -6.656492710113525, "global_step": 139924, "epoch": 3331} {"train_loss": -6.754034996032715, "global_step": 139925, "epoch": 3331} {"train_loss": -6.663928985595703, "global_step": 139926, "epoch": 3331} {"train_loss": -6.7089056968688965, "global_step": 139927, "epoch": 3331} {"train_loss": -6.7311692237854, "global_step": 139928, "epoch": 3331} {"train_loss": -6.6607160568237305, "global_step": 139929, "epoch": 3331} {"train_loss": -6.7706708908081055, "global_step": 139930, "epoch": 3331} {"train_loss": -6.798953533172607, "global_step": 139931, "epoch": 3331} {"train_loss": -6.702826499938965, "global_step": 139932, "epoch": 3331} {"train_loss": -6.697826385498047, "global_step": 139933, "epoch": 3331} {"train_loss": -6.709395408630371, "global_step": 139934, "epoch": 3331} {"train_loss": -6.5918121337890625, "global_step": 139935, "epoch": 3331} {"train_loss": -6.758155822753906, "global_step": 139936, "epoch": 3331} {"train_loss": -6.658478736877441, "global_step": 139937, "epoch": 3331} {"train_loss": -6.737894535064697, "global_step": 139938, "epoch": 3331} {"train_loss": -6.6486921310424805, "global_step": 139939, "epoch": 3331} {"train_loss": -6.625235557556152, "global_step": 139940, "epoch": 3331} {"train_loss": -6.747576713562012, "global_step": 139941, "epoch": 3331} {"train_loss": -6.748329162597656, "global_step": 139942, "epoch": 3331} {"train_loss": -6.711405084246681, "global_step": 139943, "epoch": 3331, "val_loss": 67375.78125} {"train_loss": -6.696928977966309, "global_step": 139944, "epoch": 3332} {"train_loss": -6.764087677001953, "global_step": 139945, "epoch": 3332} {"train_loss": -6.715054512023926, "global_step": 139946, "epoch": 3332} {"train_loss": -6.7220306396484375, "global_step": 139947, "epoch": 3332} {"train_loss": -6.779947280883789, "global_step": 139948, "epoch": 3332} {"train_loss": -6.806130409240723, "global_step": 139949, "epoch": 3332} {"train_loss": -6.766772270202637, "global_step": 139950, "epoch": 3332} {"train_loss": -6.800889492034912, "global_step": 139951, "epoch": 3332} {"train_loss": -6.812654495239258, "global_step": 139952, "epoch": 3332} {"train_loss": -6.822705268859863, "global_step": 139953, "epoch": 3332} {"train_loss": -6.798437595367432, "global_step": 139954, "epoch": 3332} {"train_loss": -6.811686992645264, "global_step": 139955, "epoch": 3332} {"train_loss": -6.844446659088135, "global_step": 139956, "epoch": 3332} {"train_loss": -6.873636245727539, "global_step": 139957, "epoch": 3332} {"train_loss": -6.763597011566162, "global_step": 139958, "epoch": 3332} {"train_loss": -6.783782958984375, "global_step": 139959, "epoch": 3332} {"train_loss": -6.66426420211792, "global_step": 139960, "epoch": 3332} {"train_loss": -6.7482008934021, "global_step": 139961, "epoch": 3332} {"train_loss": -6.679452896118164, "global_step": 139962, "epoch": 3332} {"train_loss": -6.761183738708496, "global_step": 139963, "epoch": 3332} {"train_loss": -6.704424858093262, "global_step": 139964, "epoch": 3332} {"train_loss": -6.844832420349121, "global_step": 139965, "epoch": 3332} {"train_loss": -6.827973365783691, "global_step": 139966, "epoch": 3332} {"train_loss": -6.737903118133545, "global_step": 139967, "epoch": 3332} {"train_loss": -6.876248359680176, "global_step": 139968, "epoch": 3332} {"train_loss": -6.852117538452148, "global_step": 139969, "epoch": 3332} {"train_loss": -6.882714748382568, "global_step": 139970, "epoch": 3332} {"train_loss": -6.814953804016113, "global_step": 139971, "epoch": 3332} {"train_loss": -6.7492194175720215, "global_step": 139972, "epoch": 3332} {"train_loss": -6.708253860473633, "global_step": 139973, "epoch": 3332} {"train_loss": -6.830035209655762, "global_step": 139974, "epoch": 3332} {"train_loss": -6.761507987976074, "global_step": 139975, "epoch": 3332} {"train_loss": -6.786927223205566, "global_step": 139976, "epoch": 3332} {"train_loss": -6.866838455200195, "global_step": 139977, "epoch": 3332} {"train_loss": -6.831855773925781, "global_step": 139978, "epoch": 3332} {"train_loss": -6.743738174438477, "global_step": 139979, "epoch": 3332} {"train_loss": -6.797100067138672, "global_step": 139980, "epoch": 3332} {"train_loss": -6.772111892700195, "global_step": 139981, "epoch": 3332} {"train_loss": -6.810147762298584, "global_step": 139982, "epoch": 3332} {"train_loss": -6.757319450378418, "global_step": 139983, "epoch": 3332} {"train_loss": -6.734284400939941, "global_step": 139984, "epoch": 3332} {"train_loss": -6.779533113752093, "global_step": 139985, "epoch": 3332, "val_loss": 67309.828125} {"train_loss": -6.807782173156738, "global_step": 139986, "epoch": 3333} {"train_loss": -6.662259101867676, "global_step": 139987, "epoch": 3333} {"train_loss": -6.691805839538574, "global_step": 139988, "epoch": 3333} {"train_loss": -6.890100002288818, "global_step": 139989, "epoch": 3333} {"train_loss": -6.703856468200684, "global_step": 139990, "epoch": 3333} {"train_loss": -6.7681097984313965, "global_step": 139991, "epoch": 3333} {"train_loss": -6.74399471282959, "global_step": 139992, "epoch": 3333} {"train_loss": -6.579419136047363, "global_step": 139993, "epoch": 3333} {"train_loss": -6.643130302429199, "global_step": 139994, "epoch": 3333} {"train_loss": -6.639603614807129, "global_step": 139995, "epoch": 3333} {"train_loss": -6.615184783935547, "global_step": 139996, "epoch": 3333} {"train_loss": -6.885665416717529, "global_step": 139997, "epoch": 3333} {"train_loss": -6.684569358825684, "global_step": 139998, "epoch": 3333} {"train_loss": -6.738886833190918, "global_step": 139999, "epoch": 3333} {"train_loss": -6.732660293579102, "global_step": 140000, "epoch": 3333} {"train_loss": -6.738499641418457, "global_step": 140001, "epoch": 3333} {"train_loss": -6.7472429275512695, "global_step": 140002, "epoch": 3333} {"train_loss": -6.775540828704834, "global_step": 140003, "epoch": 3333} {"train_loss": -6.788373947143555, "global_step": 140004, "epoch": 3333} {"train_loss": -6.657854080200195, "global_step": 140005, "epoch": 3333} {"train_loss": -6.727870464324951, "global_step": 140006, "epoch": 3333} {"train_loss": -6.771319389343262, "global_step": 140007, "epoch": 3333} {"train_loss": -6.805880546569824, "global_step": 140008, "epoch": 3333} {"train_loss": -6.814385414123535, "global_step": 140009, "epoch": 3333} {"train_loss": -6.779052257537842, "global_step": 140010, "epoch": 3333} {"train_loss": -6.672537803649902, "global_step": 140011, "epoch": 3333} {"train_loss": -6.713464260101318, "global_step": 140012, "epoch": 3333} {"train_loss": -6.782114505767822, "global_step": 140013, "epoch": 3333} {"train_loss": -6.814755916595459, "global_step": 140014, "epoch": 3333} {"train_loss": -6.812450885772705, "global_step": 140015, "epoch": 3333} {"train_loss": -6.750635147094727, "global_step": 140016, "epoch": 3333} {"train_loss": -6.858285427093506, "global_step": 140017, "epoch": 3333} {"train_loss": -6.725998878479004, "global_step": 140018, "epoch": 3333} {"train_loss": -6.875448703765869, "global_step": 140019, "epoch": 3333} {"train_loss": -6.764672756195068, "global_step": 140020, "epoch": 3333} {"train_loss": -6.793674468994141, "global_step": 140021, "epoch": 3333} {"train_loss": -6.8306884765625, "global_step": 140022, "epoch": 3333} {"train_loss": -6.74668025970459, "global_step": 140023, "epoch": 3333} {"train_loss": -6.697732448577881, "global_step": 140024, "epoch": 3333} {"train_loss": -6.7034735679626465, "global_step": 140025, "epoch": 3333} {"train_loss": -6.775882720947266, "global_step": 140026, "epoch": 3333} {"train_loss": -6.748316265287853, "global_step": 140027, "epoch": 3333, "val_loss": 67540.5859375} {"train_loss": -6.656302452087402, "global_step": 140028, "epoch": 3334} {"train_loss": -6.778567314147949, "global_step": 140029, "epoch": 3334} {"train_loss": -6.692113876342773, "global_step": 140030, "epoch": 3334} {"train_loss": -6.7142486572265625, "global_step": 140031, "epoch": 3334} {"train_loss": -6.862645626068115, "global_step": 140032, "epoch": 3334} {"train_loss": -6.676215648651123, "global_step": 140033, "epoch": 3334} {"train_loss": -6.797918796539307, "global_step": 140034, "epoch": 3334} {"train_loss": -6.77406120300293, "global_step": 140035, "epoch": 3334} {"train_loss": -6.7480573654174805, "global_step": 140036, "epoch": 3334} {"train_loss": -6.871912002563477, "global_step": 140037, "epoch": 3334} {"train_loss": -6.829265594482422, "global_step": 140038, "epoch": 3334} {"train_loss": -6.855517864227295, "global_step": 140039, "epoch": 3334} {"train_loss": -6.700555801391602, "global_step": 140040, "epoch": 3334} {"train_loss": -6.80695915222168, "global_step": 140041, "epoch": 3334} {"train_loss": -6.821233749389648, "global_step": 140042, "epoch": 3334} {"train_loss": -6.7226762771606445, "global_step": 140043, "epoch": 3334} {"train_loss": -6.792574882507324, "global_step": 140044, "epoch": 3334} {"train_loss": -6.810669898986816, "global_step": 140045, "epoch": 3334} {"train_loss": -6.781129360198975, "global_step": 140046, "epoch": 3334} {"train_loss": -6.757871627807617, "global_step": 140047, "epoch": 3334} {"train_loss": -6.826851844787598, "global_step": 140048, "epoch": 3334} {"train_loss": -6.7090559005737305, "global_step": 140049, "epoch": 3334} {"train_loss": -6.781852722167969, "global_step": 140050, "epoch": 3334} {"train_loss": -6.592877388000488, "global_step": 140051, "epoch": 3334} {"train_loss": -6.849937915802002, "global_step": 140052, "epoch": 3334} {"train_loss": -6.7696852684021, "global_step": 140053, "epoch": 3334} {"train_loss": -6.7548041343688965, "global_step": 140054, "epoch": 3334} {"train_loss": -6.90512752532959, "global_step": 140055, "epoch": 3334} {"train_loss": -6.818772315979004, "global_step": 140056, "epoch": 3334} {"train_loss": -6.842389106750488, "global_step": 140057, "epoch": 3334} {"train_loss": -6.816737174987793, "global_step": 140058, "epoch": 3334} {"train_loss": -6.7037577629089355, "global_step": 140059, "epoch": 3334} {"train_loss": -6.714447021484375, "global_step": 140060, "epoch": 3334} {"train_loss": -6.642089366912842, "global_step": 140061, "epoch": 3334} {"train_loss": -6.792152404785156, "global_step": 140062, "epoch": 3334} {"train_loss": -6.898434638977051, "global_step": 140063, "epoch": 3334} {"train_loss": -6.682497024536133, "global_step": 140064, "epoch": 3334} {"train_loss": -6.696354866027832, "global_step": 140065, "epoch": 3334} {"train_loss": -6.6893181800842285, "global_step": 140066, "epoch": 3334} {"train_loss": -6.792390823364258, "global_step": 140067, "epoch": 3334} {"train_loss": -6.726731300354004, "global_step": 140068, "epoch": 3334} {"train_loss": -6.767303512209938, "global_step": 140069, "epoch": 3334, "val_loss": 67340.265625} {"train_loss": -6.784992218017578, "global_step": 140070, "epoch": 3335} {"train_loss": -6.815892219543457, "global_step": 140071, "epoch": 3335} {"train_loss": -6.738805770874023, "global_step": 140072, "epoch": 3335} {"train_loss": -6.809544563293457, "global_step": 140073, "epoch": 3335} {"train_loss": -6.679734706878662, "global_step": 140074, "epoch": 3335} {"train_loss": -6.912757873535156, "global_step": 140075, "epoch": 3335} {"train_loss": -6.81104040145874, "global_step": 140076, "epoch": 3335} {"train_loss": -6.798308849334717, "global_step": 140077, "epoch": 3335} {"train_loss": -6.801292896270752, "global_step": 140078, "epoch": 3335} {"train_loss": -6.855284690856934, "global_step": 140079, "epoch": 3335} {"train_loss": -6.769320964813232, "global_step": 140080, "epoch": 3335} {"train_loss": -6.789022445678711, "global_step": 140081, "epoch": 3335} {"train_loss": -6.782219409942627, "global_step": 140082, "epoch": 3335} {"train_loss": -6.64189338684082, "global_step": 140083, "epoch": 3335} {"train_loss": -6.82624626159668, "global_step": 140084, "epoch": 3335} {"train_loss": -6.787835121154785, "global_step": 140085, "epoch": 3335} {"train_loss": -6.8444504737854, "global_step": 140086, "epoch": 3335} {"train_loss": -6.740813255310059, "global_step": 140087, "epoch": 3335} {"train_loss": -6.944448471069336, "global_step": 140088, "epoch": 3335} {"train_loss": -6.878720283508301, "global_step": 140089, "epoch": 3335} {"train_loss": -6.874960899353027, "global_step": 140090, "epoch": 3335} {"train_loss": -6.825369834899902, "global_step": 140091, "epoch": 3335} {"train_loss": -6.710611343383789, "global_step": 140092, "epoch": 3335} {"train_loss": -6.80294132232666, "global_step": 140093, "epoch": 3335} {"train_loss": -6.684534549713135, "global_step": 140094, "epoch": 3335} {"train_loss": -6.794958114624023, "global_step": 140095, "epoch": 3335} {"train_loss": -6.7899394035339355, "global_step": 140096, "epoch": 3335} {"train_loss": -6.749130725860596, "global_step": 140097, "epoch": 3335} {"train_loss": -6.880109786987305, "global_step": 140098, "epoch": 3335} {"train_loss": -6.877813816070557, "global_step": 140099, "epoch": 3335} {"train_loss": -6.844778060913086, "global_step": 140100, "epoch": 3335} {"train_loss": -6.770213603973389, "global_step": 140101, "epoch": 3335} {"train_loss": -6.758806228637695, "global_step": 140102, "epoch": 3335} {"train_loss": -6.851380348205566, "global_step": 140103, "epoch": 3335} {"train_loss": -6.762712001800537, "global_step": 140104, "epoch": 3335} {"train_loss": -6.759574890136719, "global_step": 140105, "epoch": 3335} {"train_loss": -6.735847473144531, "global_step": 140106, "epoch": 3335} {"train_loss": -6.559731960296631, "global_step": 140107, "epoch": 3335} {"train_loss": -6.835788726806641, "global_step": 140108, "epoch": 3335} {"train_loss": -6.827432632446289, "global_step": 140109, "epoch": 3335} {"train_loss": -6.769495964050293, "global_step": 140110, "epoch": 3335} {"train_loss": -6.794100625174386, "global_step": 140111, "epoch": 3335, "val_loss": 67251.796875} {"train_loss": -6.782585144042969, "global_step": 140112, "epoch": 3336} {"train_loss": -6.787841796875, "global_step": 140113, "epoch": 3336} {"train_loss": -6.762412071228027, "global_step": 140114, "epoch": 3336} {"train_loss": -6.7580718994140625, "global_step": 140115, "epoch": 3336} {"train_loss": -6.763512134552002, "global_step": 140116, "epoch": 3336} {"train_loss": -6.767023086547852, "global_step": 140117, "epoch": 3336} {"train_loss": -6.759548187255859, "global_step": 140118, "epoch": 3336} {"train_loss": -6.837485313415527, "global_step": 140119, "epoch": 3336} {"train_loss": -6.661635398864746, "global_step": 140120, "epoch": 3336} {"train_loss": -6.579387664794922, "global_step": 140121, "epoch": 3336} {"train_loss": -6.819632530212402, "global_step": 140122, "epoch": 3336} {"train_loss": -6.734247207641602, "global_step": 140123, "epoch": 3336} {"train_loss": -6.827157497406006, "global_step": 140124, "epoch": 3336} {"train_loss": -6.833835601806641, "global_step": 140125, "epoch": 3336} {"train_loss": -6.6725592613220215, "global_step": 140126, "epoch": 3336} {"train_loss": -6.650611877441406, "global_step": 140127, "epoch": 3336} {"train_loss": -6.6186370849609375, "global_step": 140128, "epoch": 3336} {"train_loss": -6.670477867126465, "global_step": 140129, "epoch": 3336} {"train_loss": -6.781259059906006, "global_step": 140130, "epoch": 3336} {"train_loss": -6.5727691650390625, "global_step": 140131, "epoch": 3336} {"train_loss": -6.613980293273926, "global_step": 140132, "epoch": 3336} {"train_loss": -6.619360446929932, "global_step": 140133, "epoch": 3336} {"train_loss": -6.702755928039551, "global_step": 140134, "epoch": 3336} {"train_loss": -6.637523651123047, "global_step": 140135, "epoch": 3336} {"train_loss": -6.573171615600586, "global_step": 140136, "epoch": 3336} {"train_loss": -6.597220420837402, "global_step": 140137, "epoch": 3336} {"train_loss": -6.673839092254639, "global_step": 140138, "epoch": 3336} {"train_loss": -6.703320026397705, "global_step": 140139, "epoch": 3336} {"train_loss": -6.6168036460876465, "global_step": 140140, "epoch": 3336} {"train_loss": -6.730805397033691, "global_step": 140141, "epoch": 3336} {"train_loss": -6.757937908172607, "global_step": 140142, "epoch": 3336} {"train_loss": -6.725683689117432, "global_step": 140143, "epoch": 3336} {"train_loss": -6.743281364440918, "global_step": 140144, "epoch": 3336} {"train_loss": -6.737914562225342, "global_step": 140145, "epoch": 3336} {"train_loss": -6.790266513824463, "global_step": 140146, "epoch": 3336} {"train_loss": -6.700868606567383, "global_step": 140147, "epoch": 3336} {"train_loss": -6.726070404052734, "global_step": 140148, "epoch": 3336} {"train_loss": -6.690351963043213, "global_step": 140149, "epoch": 3336} {"train_loss": -6.778199195861816, "global_step": 140150, "epoch": 3336} {"train_loss": -6.640722274780273, "global_step": 140151, "epoch": 3336} {"train_loss": -6.745241165161133, "global_step": 140152, "epoch": 3336} {"train_loss": -6.709745577403477, "global_step": 140153, "epoch": 3336, "val_loss": 67235.015625} {"train_loss": -6.6805572509765625, "global_step": 140154, "epoch": 3337} {"train_loss": -6.764324188232422, "global_step": 140155, "epoch": 3337} {"train_loss": -6.680644989013672, "global_step": 140156, "epoch": 3337} {"train_loss": -6.753994941711426, "global_step": 140157, "epoch": 3337} {"train_loss": -6.618808269500732, "global_step": 140158, "epoch": 3337} {"train_loss": -6.631494998931885, "global_step": 140159, "epoch": 3337} {"train_loss": -6.775969505310059, "global_step": 140160, "epoch": 3337} {"train_loss": -6.7271528244018555, "global_step": 140161, "epoch": 3337} {"train_loss": -6.8791093826293945, "global_step": 140162, "epoch": 3337} {"train_loss": -6.646922588348389, "global_step": 140163, "epoch": 3337} {"train_loss": -6.669676780700684, "global_step": 140164, "epoch": 3337} {"train_loss": -6.7597150802612305, "global_step": 140165, "epoch": 3337} {"train_loss": -6.765081405639648, "global_step": 140166, "epoch": 3337} {"train_loss": -6.797732353210449, "global_step": 140167, "epoch": 3337} {"train_loss": -6.7726850509643555, "global_step": 140168, "epoch": 3337} {"train_loss": -6.7086310386657715, "global_step": 140169, "epoch": 3337} {"train_loss": -6.683905601501465, "global_step": 140170, "epoch": 3337} {"train_loss": -6.666450500488281, "global_step": 140171, "epoch": 3337} {"train_loss": -6.673708915710449, "global_step": 140172, "epoch": 3337} {"train_loss": -6.749527931213379, "global_step": 140173, "epoch": 3337} {"train_loss": -6.707973957061768, "global_step": 140174, "epoch": 3337} {"train_loss": -6.709524631500244, "global_step": 140175, "epoch": 3337} {"train_loss": -6.896286964416504, "global_step": 140176, "epoch": 3337} {"train_loss": -6.721520900726318, "global_step": 140177, "epoch": 3337} {"train_loss": -6.74015474319458, "global_step": 140178, "epoch": 3337} {"train_loss": -6.76900053024292, "global_step": 140179, "epoch": 3337} {"train_loss": -6.818304538726807, "global_step": 140180, "epoch": 3337} {"train_loss": -6.870181083679199, "global_step": 140181, "epoch": 3337} {"train_loss": -6.82682991027832, "global_step": 140182, "epoch": 3337} {"train_loss": -6.797746658325195, "global_step": 140183, "epoch": 3337} {"train_loss": -6.8844523429870605, "global_step": 140184, "epoch": 3337} {"train_loss": -6.768462181091309, "global_step": 140185, "epoch": 3337} {"train_loss": -6.728292465209961, "global_step": 140186, "epoch": 3337} {"train_loss": -6.816986083984375, "global_step": 140187, "epoch": 3337} {"train_loss": -6.8422675132751465, "global_step": 140188, "epoch": 3337} {"train_loss": -6.8567633628845215, "global_step": 140189, "epoch": 3337} {"train_loss": -6.763696670532227, "global_step": 140190, "epoch": 3337} {"train_loss": -6.791622161865234, "global_step": 140191, "epoch": 3337} {"train_loss": -6.865054130554199, "global_step": 140192, "epoch": 3337} {"train_loss": -6.694330215454102, "global_step": 140193, "epoch": 3337} {"train_loss": -6.814702033996582, "global_step": 140194, "epoch": 3337} {"train_loss": -6.759428035645258, "global_step": 140195, "epoch": 3337, "val_loss": 67406.1015625} {"train_loss": -6.699066638946533, "global_step": 140196, "epoch": 3338} {"train_loss": -6.668122291564941, "global_step": 140197, "epoch": 3338} {"train_loss": -6.780181407928467, "global_step": 140198, "epoch": 3338} {"train_loss": -6.701848030090332, "global_step": 140199, "epoch": 3338} {"train_loss": -6.8069748878479, "global_step": 140200, "epoch": 3338} {"train_loss": -6.885595321655273, "global_step": 140201, "epoch": 3338} {"train_loss": -6.730246067047119, "global_step": 140202, "epoch": 3338} {"train_loss": -6.77432918548584, "global_step": 140203, "epoch": 3338} {"train_loss": -6.77953577041626, "global_step": 140204, "epoch": 3338} {"train_loss": -6.869806289672852, "global_step": 140205, "epoch": 3338} {"train_loss": -6.796606540679932, "global_step": 140206, "epoch": 3338} {"train_loss": -6.697000026702881, "global_step": 140207, "epoch": 3338} {"train_loss": -6.777029037475586, "global_step": 140208, "epoch": 3338} {"train_loss": -6.784064769744873, "global_step": 140209, "epoch": 3338} {"train_loss": -6.742941379547119, "global_step": 140210, "epoch": 3338} {"train_loss": -6.771998882293701, "global_step": 140211, "epoch": 3338} {"train_loss": -6.911275863647461, "global_step": 140212, "epoch": 3338} {"train_loss": -6.811113357543945, "global_step": 140213, "epoch": 3338} {"train_loss": -6.683805465698242, "global_step": 140214, "epoch": 3338} {"train_loss": -6.6860270500183105, "global_step": 140215, "epoch": 3338} {"train_loss": -6.7105536460876465, "global_step": 140216, "epoch": 3338} {"train_loss": -6.699711799621582, "global_step": 140217, "epoch": 3338} {"train_loss": -6.76528263092041, "global_step": 140218, "epoch": 3338} {"train_loss": -6.9249396324157715, "global_step": 140219, "epoch": 3338} {"train_loss": -6.787161350250244, "global_step": 140220, "epoch": 3338} {"train_loss": -6.727670192718506, "global_step": 140221, "epoch": 3338} {"train_loss": -6.81889009475708, "global_step": 140222, "epoch": 3338} {"train_loss": -6.760402679443359, "global_step": 140223, "epoch": 3338} {"train_loss": -6.785453796386719, "global_step": 140224, "epoch": 3338} {"train_loss": -6.855682373046875, "global_step": 140225, "epoch": 3338} {"train_loss": -6.817602157592773, "global_step": 140226, "epoch": 3338} {"train_loss": -6.767569541931152, "global_step": 140227, "epoch": 3338} {"train_loss": -6.802596092224121, "global_step": 140228, "epoch": 3338} {"train_loss": -6.847397327423096, "global_step": 140229, "epoch": 3338} {"train_loss": -6.7445831298828125, "global_step": 140230, "epoch": 3338} {"train_loss": -6.76451301574707, "global_step": 140231, "epoch": 3338} {"train_loss": -6.80830717086792, "global_step": 140232, "epoch": 3338} {"train_loss": -6.6406426429748535, "global_step": 140233, "epoch": 3338} {"train_loss": -6.810428619384766, "global_step": 140234, "epoch": 3338} {"train_loss": -6.807485580444336, "global_step": 140235, "epoch": 3338} {"train_loss": -6.749312400817871, "global_step": 140236, "epoch": 3338} {"train_loss": -6.771475178854806, "global_step": 140237, "epoch": 3338, "val_loss": 67247.8125} {"train_loss": -6.740851879119873, "global_step": 140238, "epoch": 3339} {"train_loss": -6.819457054138184, "global_step": 140239, "epoch": 3339} {"train_loss": -6.85726261138916, "global_step": 140240, "epoch": 3339} {"train_loss": -6.80092716217041, "global_step": 140241, "epoch": 3339} {"train_loss": -6.755141735076904, "global_step": 140242, "epoch": 3339} {"train_loss": -6.833226203918457, "global_step": 140243, "epoch": 3339} {"train_loss": -6.700283050537109, "global_step": 140244, "epoch": 3339} {"train_loss": -6.844604015350342, "global_step": 140245, "epoch": 3339} {"train_loss": -6.859271049499512, "global_step": 140246, "epoch": 3339} {"train_loss": -6.7160749435424805, "global_step": 140247, "epoch": 3339} {"train_loss": -6.721959590911865, "global_step": 140248, "epoch": 3339} {"train_loss": -6.790406227111816, "global_step": 140249, "epoch": 3339} {"train_loss": -6.770922660827637, "global_step": 140250, "epoch": 3339} {"train_loss": -6.727616310119629, "global_step": 140251, "epoch": 3339} {"train_loss": -6.72733736038208, "global_step": 140252, "epoch": 3339} {"train_loss": -6.839285850524902, "global_step": 140253, "epoch": 3339} {"train_loss": -6.558518409729004, "global_step": 140254, "epoch": 3339} {"train_loss": -6.691310882568359, "global_step": 140255, "epoch": 3339} {"train_loss": -6.851951599121094, "global_step": 140256, "epoch": 3339} {"train_loss": -6.776948928833008, "global_step": 140257, "epoch": 3339} {"train_loss": -6.712683200836182, "global_step": 140258, "epoch": 3339} {"train_loss": -6.6743669509887695, "global_step": 140259, "epoch": 3339} {"train_loss": -6.607568264007568, "global_step": 140260, "epoch": 3339} {"train_loss": -6.667421817779541, "global_step": 140261, "epoch": 3339} {"train_loss": -6.51275634765625, "global_step": 140262, "epoch": 3339} {"train_loss": -6.6999311447143555, "global_step": 140263, "epoch": 3339} {"train_loss": -6.740823745727539, "global_step": 140264, "epoch": 3339} {"train_loss": -6.583897590637207, "global_step": 140265, "epoch": 3339} {"train_loss": -6.6919965744018555, "global_step": 140266, "epoch": 3339} {"train_loss": -6.67720890045166, "global_step": 140267, "epoch": 3339} {"train_loss": -6.746209621429443, "global_step": 140268, "epoch": 3339} {"train_loss": -6.697325229644775, "global_step": 140269, "epoch": 3339} {"train_loss": -6.684859752655029, "global_step": 140270, "epoch": 3339} {"train_loss": -6.695738792419434, "global_step": 140271, "epoch": 3339} {"train_loss": -6.737018585205078, "global_step": 140272, "epoch": 3339} {"train_loss": -6.707376003265381, "global_step": 140273, "epoch": 3339} {"train_loss": -6.767767429351807, "global_step": 140274, "epoch": 3339} {"train_loss": -6.848337650299072, "global_step": 140275, "epoch": 3339} {"train_loss": -6.70294189453125, "global_step": 140276, "epoch": 3339} {"train_loss": -6.766219139099121, "global_step": 140277, "epoch": 3339} {"train_loss": -6.784239768981934, "global_step": 140278, "epoch": 3339} {"train_loss": -6.736305475234985, "global_step": 140279, "epoch": 3339, "val_loss": 67481.2421875} {"train_loss": -6.776663780212402, "global_step": 140280, "epoch": 3340} {"train_loss": -6.77321720123291, "global_step": 140281, "epoch": 3340} {"train_loss": -6.717912673950195, "global_step": 140282, "epoch": 3340} {"train_loss": -6.842116355895996, "global_step": 140283, "epoch": 3340} {"train_loss": -6.810883045196533, "global_step": 140284, "epoch": 3340} {"train_loss": -6.82650899887085, "global_step": 140285, "epoch": 3340} {"train_loss": -6.83087158203125, "global_step": 140286, "epoch": 3340} {"train_loss": -6.873790740966797, "global_step": 140287, "epoch": 3340} {"train_loss": -6.7804107666015625, "global_step": 140288, "epoch": 3340} {"train_loss": -6.807984352111816, "global_step": 140289, "epoch": 3340} {"train_loss": -6.876318454742432, "global_step": 140290, "epoch": 3340} {"train_loss": -6.746509552001953, "global_step": 140291, "epoch": 3340} {"train_loss": -6.796173572540283, "global_step": 140292, "epoch": 3340} {"train_loss": -6.81859827041626, "global_step": 140293, "epoch": 3340} {"train_loss": -6.888914585113525, "global_step": 140294, "epoch": 3340} {"train_loss": -6.958336353302002, "global_step": 140295, "epoch": 3340} {"train_loss": -6.8544392585754395, "global_step": 140296, "epoch": 3340} {"train_loss": -6.859040260314941, "global_step": 140297, "epoch": 3340} {"train_loss": -6.747479438781738, "global_step": 140298, "epoch": 3340} {"train_loss": -6.823573112487793, "global_step": 140299, "epoch": 3340} {"train_loss": -6.795681953430176, "global_step": 140300, "epoch": 3340} {"train_loss": -6.808513641357422, "global_step": 140301, "epoch": 3340} {"train_loss": -6.822795867919922, "global_step": 140302, "epoch": 3340} {"train_loss": -6.768507957458496, "global_step": 140303, "epoch": 3340} {"train_loss": -6.776677131652832, "global_step": 140304, "epoch": 3340} {"train_loss": -6.8802900314331055, "global_step": 140305, "epoch": 3340} {"train_loss": -6.758213043212891, "global_step": 140306, "epoch": 3340} {"train_loss": -6.812898635864258, "global_step": 140307, "epoch": 3340} {"train_loss": -6.831868648529053, "global_step": 140308, "epoch": 3340} {"train_loss": -6.708575248718262, "global_step": 140309, "epoch": 3340} {"train_loss": -6.745560646057129, "global_step": 140310, "epoch": 3340} {"train_loss": -6.706191062927246, "global_step": 140311, "epoch": 3340} {"train_loss": -6.782618522644043, "global_step": 140312, "epoch": 3340} {"train_loss": -6.8445281982421875, "global_step": 140313, "epoch": 3340} {"train_loss": -6.758256912231445, "global_step": 140314, "epoch": 3340} {"train_loss": -6.782861709594727, "global_step": 140315, "epoch": 3340} {"train_loss": -6.715022087097168, "global_step": 140316, "epoch": 3340} {"train_loss": -6.541590690612793, "global_step": 140317, "epoch": 3340} {"train_loss": -6.668045520782471, "global_step": 140318, "epoch": 3340} {"train_loss": -6.804157257080078, "global_step": 140319, "epoch": 3340} {"train_loss": -6.651247978210449, "global_step": 140320, "epoch": 3340} {"train_loss": -6.7895415510450094, "global_step": 140321, "epoch": 3340, "val_loss": 67758.125} {"train_loss": -6.68980073928833, "global_step": 140322, "epoch": 3341} {"train_loss": -6.699884414672852, "global_step": 140323, "epoch": 3341} {"train_loss": -6.725025177001953, "global_step": 140324, "epoch": 3341} {"train_loss": -6.8318681716918945, "global_step": 140325, "epoch": 3341} {"train_loss": -6.803447246551514, "global_step": 140326, "epoch": 3341} {"train_loss": -6.666711807250977, "global_step": 140327, "epoch": 3341} {"train_loss": -6.694331169128418, "global_step": 140328, "epoch": 3341} {"train_loss": -6.763580322265625, "global_step": 140329, "epoch": 3341} {"train_loss": -6.809894561767578, "global_step": 140330, "epoch": 3341} {"train_loss": -6.682096481323242, "global_step": 140331, "epoch": 3341} {"train_loss": -6.695754051208496, "global_step": 140332, "epoch": 3341} {"train_loss": -6.886616230010986, "global_step": 140333, "epoch": 3341} {"train_loss": -6.67500114440918, "global_step": 140334, "epoch": 3341} {"train_loss": -6.591914176940918, "global_step": 140335, "epoch": 3341} {"train_loss": -6.763708591461182, "global_step": 140336, "epoch": 3341} {"train_loss": -6.665094375610352, "global_step": 140337, "epoch": 3341} {"train_loss": -6.687131404876709, "global_step": 140338, "epoch": 3341} {"train_loss": -6.731884002685547, "global_step": 140339, "epoch": 3341} {"train_loss": -6.722037315368652, "global_step": 140340, "epoch": 3341} {"train_loss": -6.668845176696777, "global_step": 140341, "epoch": 3341} {"train_loss": -6.9032368659973145, "global_step": 140342, "epoch": 3341} {"train_loss": -6.574481010437012, "global_step": 140343, "epoch": 3341} {"train_loss": -6.627835750579834, "global_step": 140344, "epoch": 3341} {"train_loss": -6.69455099105835, "global_step": 140345, "epoch": 3341} {"train_loss": -6.6706976890563965, "global_step": 140346, "epoch": 3341} {"train_loss": -6.798463344573975, "global_step": 140347, "epoch": 3341} {"train_loss": -6.755214214324951, "global_step": 140348, "epoch": 3341} {"train_loss": -6.774001121520996, "global_step": 140349, "epoch": 3341} {"train_loss": -6.7246222496032715, "global_step": 140350, "epoch": 3341} {"train_loss": -6.807629585266113, "global_step": 140351, "epoch": 3341} {"train_loss": -6.776667594909668, "global_step": 140352, "epoch": 3341} {"train_loss": -6.732329368591309, "global_step": 140353, "epoch": 3341} {"train_loss": -6.886833190917969, "global_step": 140354, "epoch": 3341} {"train_loss": -6.738376617431641, "global_step": 140355, "epoch": 3341} {"train_loss": -6.6848907470703125, "global_step": 140356, "epoch": 3341} {"train_loss": -6.775982856750488, "global_step": 140357, "epoch": 3341} {"train_loss": -6.755335807800293, "global_step": 140358, "epoch": 3341} {"train_loss": -6.697451591491699, "global_step": 140359, "epoch": 3341} {"train_loss": -6.737756252288818, "global_step": 140360, "epoch": 3341} {"train_loss": -6.730184078216553, "global_step": 140361, "epoch": 3341} {"train_loss": -6.7194623947143555, "global_step": 140362, "epoch": 3341} {"train_loss": -6.731114194506691, "global_step": 140363, "epoch": 3341, "val_loss": 67478.90625} {"train_loss": -6.654135704040527, "global_step": 140364, "epoch": 3342} {"train_loss": -6.7548322677612305, "global_step": 140365, "epoch": 3342} {"train_loss": -6.705843925476074, "global_step": 140366, "epoch": 3342} {"train_loss": -6.736204147338867, "global_step": 140367, "epoch": 3342} {"train_loss": -6.694087982177734, "global_step": 140368, "epoch": 3342} {"train_loss": -6.870928764343262, "global_step": 140369, "epoch": 3342} {"train_loss": -6.792266845703125, "global_step": 140370, "epoch": 3342} {"train_loss": -6.785923004150391, "global_step": 140371, "epoch": 3342} {"train_loss": -6.658398628234863, "global_step": 140372, "epoch": 3342} {"train_loss": -6.795014381408691, "global_step": 140373, "epoch": 3342} {"train_loss": -6.715847015380859, "global_step": 140374, "epoch": 3342} {"train_loss": -6.742246627807617, "global_step": 140375, "epoch": 3342} {"train_loss": -6.733843803405762, "global_step": 140376, "epoch": 3342} {"train_loss": -6.719106674194336, "global_step": 140377, "epoch": 3342} {"train_loss": -6.764348983764648, "global_step": 140378, "epoch": 3342} {"train_loss": -6.624344348907471, "global_step": 140379, "epoch": 3342} {"train_loss": -6.743918418884277, "global_step": 140380, "epoch": 3342} {"train_loss": -6.883661270141602, "global_step": 140381, "epoch": 3342} {"train_loss": -6.791676998138428, "global_step": 140382, "epoch": 3342} {"train_loss": -6.86427640914917, "global_step": 140383, "epoch": 3342} {"train_loss": -6.831764221191406, "global_step": 140384, "epoch": 3342} {"train_loss": -6.859226703643799, "global_step": 140385, "epoch": 3342} {"train_loss": -6.844193458557129, "global_step": 140386, "epoch": 3342} {"train_loss": -6.876049041748047, "global_step": 140387, "epoch": 3342} {"train_loss": -6.833617210388184, "global_step": 140388, "epoch": 3342} {"train_loss": -6.755334854125977, "global_step": 140389, "epoch": 3342} {"train_loss": -6.835184097290039, "global_step": 140390, "epoch": 3342} {"train_loss": -6.803072929382324, "global_step": 140391, "epoch": 3342} {"train_loss": -6.895485877990723, "global_step": 140392, "epoch": 3342} {"train_loss": -6.785964012145996, "global_step": 140393, "epoch": 3342} {"train_loss": -6.80635929107666, "global_step": 140394, "epoch": 3342} {"train_loss": -6.909064769744873, "global_step": 140395, "epoch": 3342} {"train_loss": -6.811814308166504, "global_step": 140396, "epoch": 3342} {"train_loss": -6.795058250427246, "global_step": 140397, "epoch": 3342} {"train_loss": -6.82399320602417, "global_step": 140398, "epoch": 3342} {"train_loss": -6.7832417488098145, "global_step": 140399, "epoch": 3342} {"train_loss": -6.733199119567871, "global_step": 140400, "epoch": 3342} {"train_loss": -6.732970237731934, "global_step": 140401, "epoch": 3342} {"train_loss": -6.806790351867676, "global_step": 140402, "epoch": 3342} {"train_loss": -6.717593193054199, "global_step": 140403, "epoch": 3342} {"train_loss": -6.63456392288208, "global_step": 140404, "epoch": 3342} {"train_loss": -6.780396677198864, "global_step": 140405, "epoch": 3342, "val_loss": 67399.7421875} {"train_loss": -6.81938362121582, "global_step": 140406, "epoch": 3343} {"train_loss": -6.809287071228027, "global_step": 140407, "epoch": 3343} {"train_loss": -6.732598781585693, "global_step": 140408, "epoch": 3343} {"train_loss": -6.832434177398682, "global_step": 140409, "epoch": 3343} {"train_loss": -6.754858016967773, "global_step": 140410, "epoch": 3343} {"train_loss": -6.669597625732422, "global_step": 140411, "epoch": 3343} {"train_loss": -6.672557830810547, "global_step": 140412, "epoch": 3343} {"train_loss": -6.761748790740967, "global_step": 140413, "epoch": 3343} {"train_loss": -6.866750717163086, "global_step": 140414, "epoch": 3343} {"train_loss": -6.861800193786621, "global_step": 140415, "epoch": 3343} {"train_loss": -6.7252960205078125, "global_step": 140416, "epoch": 3343} {"train_loss": -6.830872535705566, "global_step": 140417, "epoch": 3343} {"train_loss": -6.795381546020508, "global_step": 140418, "epoch": 3343} {"train_loss": -6.773409366607666, "global_step": 140419, "epoch": 3343} {"train_loss": -6.853417873382568, "global_step": 140420, "epoch": 3343} {"train_loss": -6.727983474731445, "global_step": 140421, "epoch": 3343} {"train_loss": -6.712447643280029, "global_step": 140422, "epoch": 3343} {"train_loss": -6.793648719787598, "global_step": 140423, "epoch": 3343} {"train_loss": -6.735195636749268, "global_step": 140424, "epoch": 3343} {"train_loss": -6.801609992980957, "global_step": 140425, "epoch": 3343} {"train_loss": -6.8254313468933105, "global_step": 140426, "epoch": 3343} {"train_loss": -6.82012414932251, "global_step": 140427, "epoch": 3343} {"train_loss": -6.8293070793151855, "global_step": 140428, "epoch": 3343} {"train_loss": -6.842433929443359, "global_step": 140429, "epoch": 3343} {"train_loss": -6.710675239562988, "global_step": 140430, "epoch": 3343} {"train_loss": -6.8510589599609375, "global_step": 140431, "epoch": 3343} {"train_loss": -6.708935737609863, "global_step": 140432, "epoch": 3343} {"train_loss": -6.786253929138184, "global_step": 140433, "epoch": 3343} {"train_loss": -6.808417320251465, "global_step": 140434, "epoch": 3343} {"train_loss": -6.672176361083984, "global_step": 140435, "epoch": 3343} {"train_loss": -6.692378044128418, "global_step": 140436, "epoch": 3343} {"train_loss": -6.7486796379089355, "global_step": 140437, "epoch": 3343} {"train_loss": -6.9027018547058105, "global_step": 140438, "epoch": 3343} {"train_loss": -6.839818477630615, "global_step": 140439, "epoch": 3343} {"train_loss": -6.739017486572266, "global_step": 140440, "epoch": 3343} {"train_loss": -6.7884626388549805, "global_step": 140441, "epoch": 3343} {"train_loss": -6.860238075256348, "global_step": 140442, "epoch": 3343} {"train_loss": -6.794323921203613, "global_step": 140443, "epoch": 3343} {"train_loss": -6.8727288246154785, "global_step": 140444, "epoch": 3343} {"train_loss": -6.899505615234375, "global_step": 140445, "epoch": 3343} {"train_loss": -6.823293685913086, "global_step": 140446, "epoch": 3343} {"train_loss": -6.789116042000907, "global_step": 140447, "epoch": 3343, "val_loss": 67247.8515625} {"train_loss": -6.752425670623779, "global_step": 140448, "epoch": 3344} {"train_loss": -6.720799446105957, "global_step": 140449, "epoch": 3344} {"train_loss": -6.712093353271484, "global_step": 140450, "epoch": 3344} {"train_loss": -6.741235733032227, "global_step": 140451, "epoch": 3344} {"train_loss": -6.727710247039795, "global_step": 140452, "epoch": 3344} {"train_loss": -6.776208877563477, "global_step": 140453, "epoch": 3344} {"train_loss": -6.712672233581543, "global_step": 140454, "epoch": 3344} {"train_loss": -6.820075988769531, "global_step": 140455, "epoch": 3344} {"train_loss": -6.708370208740234, "global_step": 140456, "epoch": 3344} {"train_loss": -6.627773761749268, "global_step": 140457, "epoch": 3344} {"train_loss": -6.777364730834961, "global_step": 140458, "epoch": 3344} {"train_loss": -6.80008602142334, "global_step": 140459, "epoch": 3344} {"train_loss": -6.780457496643066, "global_step": 140460, "epoch": 3344} {"train_loss": -6.736703872680664, "global_step": 140461, "epoch": 3344} {"train_loss": -6.7246599197387695, "global_step": 140462, "epoch": 3344} {"train_loss": -6.910238265991211, "global_step": 140463, "epoch": 3344} {"train_loss": -6.596414566040039, "global_step": 140464, "epoch": 3344} {"train_loss": -6.778421878814697, "global_step": 140465, "epoch": 3344} {"train_loss": -6.805502414703369, "global_step": 140466, "epoch": 3344} {"train_loss": -6.575050354003906, "global_step": 140467, "epoch": 3344} {"train_loss": -6.6875410079956055, "global_step": 140468, "epoch": 3344} {"train_loss": -6.683809757232666, "global_step": 140469, "epoch": 3344} {"train_loss": -6.724520683288574, "global_step": 140470, "epoch": 3344} {"train_loss": -6.664817810058594, "global_step": 140471, "epoch": 3344} {"train_loss": -6.801116943359375, "global_step": 140472, "epoch": 3344} {"train_loss": -6.758189678192139, "global_step": 140473, "epoch": 3344} {"train_loss": -6.818464279174805, "global_step": 140474, "epoch": 3344} {"train_loss": -6.735950469970703, "global_step": 140475, "epoch": 3344} {"train_loss": -6.724289894104004, "global_step": 140476, "epoch": 3344} {"train_loss": -6.759798049926758, "global_step": 140477, "epoch": 3344} {"train_loss": -6.835012435913086, "global_step": 140478, "epoch": 3344} {"train_loss": -6.761186599731445, "global_step": 140479, "epoch": 3344} {"train_loss": -6.890897750854492, "global_step": 140480, "epoch": 3344} {"train_loss": -6.752209663391113, "global_step": 140481, "epoch": 3344} {"train_loss": -6.701523303985596, "global_step": 140482, "epoch": 3344} {"train_loss": -6.72665548324585, "global_step": 140483, "epoch": 3344} {"train_loss": -6.644139766693115, "global_step": 140484, "epoch": 3344} {"train_loss": -6.71661901473999, "global_step": 140485, "epoch": 3344} {"train_loss": -6.742392539978027, "global_step": 140486, "epoch": 3344} {"train_loss": -6.766925811767578, "global_step": 140487, "epoch": 3344} {"train_loss": -6.564624786376953, "global_step": 140488, "epoch": 3344} {"train_loss": -6.735946189789545, "global_step": 140489, "epoch": 3344, "val_loss": 67390.4140625} {"train_loss": -6.653507709503174, "global_step": 140490, "epoch": 3345} {"train_loss": -6.819576263427734, "global_step": 140491, "epoch": 3345} {"train_loss": -6.734963417053223, "global_step": 140492, "epoch": 3345} {"train_loss": -6.742903709411621, "global_step": 140493, "epoch": 3345} {"train_loss": -6.731592178344727, "global_step": 140494, "epoch": 3345} {"train_loss": -6.895412921905518, "global_step": 140495, "epoch": 3345} {"train_loss": -6.830519676208496, "global_step": 140496, "epoch": 3345} {"train_loss": -6.7913384437561035, "global_step": 140497, "epoch": 3345} {"train_loss": -6.665833950042725, "global_step": 140498, "epoch": 3345} {"train_loss": -6.731539726257324, "global_step": 140499, "epoch": 3345} {"train_loss": -6.699887275695801, "global_step": 140500, "epoch": 3345} {"train_loss": -6.697254180908203, "global_step": 140501, "epoch": 3345} {"train_loss": -6.783123016357422, "global_step": 140502, "epoch": 3345} {"train_loss": -6.7468743324279785, "global_step": 140503, "epoch": 3345} {"train_loss": -6.847063064575195, "global_step": 140504, "epoch": 3345} {"train_loss": -6.725238800048828, "global_step": 140505, "epoch": 3345} {"train_loss": -6.835658550262451, "global_step": 140506, "epoch": 3345} {"train_loss": -6.632491111755371, "global_step": 140507, "epoch": 3345} {"train_loss": -6.725775718688965, "global_step": 140508, "epoch": 3345} {"train_loss": -6.77039098739624, "global_step": 140509, "epoch": 3345} {"train_loss": -6.713919639587402, "global_step": 140510, "epoch": 3345} {"train_loss": -6.656716346740723, "global_step": 140511, "epoch": 3345} {"train_loss": -6.842678070068359, "global_step": 140512, "epoch": 3345} {"train_loss": -6.637293815612793, "global_step": 140513, "epoch": 3345} {"train_loss": -6.810144424438477, "global_step": 140514, "epoch": 3345} {"train_loss": -6.831589698791504, "global_step": 140515, "epoch": 3345} {"train_loss": -6.726483345031738, "global_step": 140516, "epoch": 3345} {"train_loss": -6.793264865875244, "global_step": 140517, "epoch": 3345} {"train_loss": -6.90790319442749, "global_step": 140518, "epoch": 3345} {"train_loss": -6.68421745300293, "global_step": 140519, "epoch": 3345} {"train_loss": -6.866206169128418, "global_step": 140520, "epoch": 3345} {"train_loss": -6.81710958480835, "global_step": 140521, "epoch": 3345} {"train_loss": -6.855738162994385, "global_step": 140522, "epoch": 3345} {"train_loss": -6.671319484710693, "global_step": 140523, "epoch": 3345} {"train_loss": -6.7021636962890625, "global_step": 140524, "epoch": 3345} {"train_loss": -6.693851470947266, "global_step": 140525, "epoch": 3345} {"train_loss": -6.761382579803467, "global_step": 140526, "epoch": 3345} {"train_loss": -6.696242332458496, "global_step": 140527, "epoch": 3345} {"train_loss": -6.808018684387207, "global_step": 140528, "epoch": 3345} {"train_loss": -6.751251697540283, "global_step": 140529, "epoch": 3345} {"train_loss": -6.779818534851074, "global_step": 140530, "epoch": 3345} {"train_loss": -6.756320578711374, "global_step": 140531, "epoch": 3345, "val_loss": 67271.328125} {"train_loss": -6.752399921417236, "global_step": 140532, "epoch": 3346} {"train_loss": -6.781997203826904, "global_step": 140533, "epoch": 3346} {"train_loss": -6.7032470703125, "global_step": 140534, "epoch": 3346} {"train_loss": -6.795248031616211, "global_step": 140535, "epoch": 3346} {"train_loss": -6.783190727233887, "global_step": 140536, "epoch": 3346} {"train_loss": -6.717116355895996, "global_step": 140537, "epoch": 3346} {"train_loss": -6.756290435791016, "global_step": 140538, "epoch": 3346} {"train_loss": -6.7469482421875, "global_step": 140539, "epoch": 3346} {"train_loss": -6.742097854614258, "global_step": 140540, "epoch": 3346} {"train_loss": -6.855851173400879, "global_step": 140541, "epoch": 3346} {"train_loss": -6.742709159851074, "global_step": 140542, "epoch": 3346} {"train_loss": -6.794528007507324, "global_step": 140543, "epoch": 3346} {"train_loss": -6.812028884887695, "global_step": 140544, "epoch": 3346} {"train_loss": -6.789562225341797, "global_step": 140545, "epoch": 3346} {"train_loss": -6.7510552406311035, "global_step": 140546, "epoch": 3346} {"train_loss": -6.7747039794921875, "global_step": 140547, "epoch": 3346} {"train_loss": -6.724575042724609, "global_step": 140548, "epoch": 3346} {"train_loss": -6.758989334106445, "global_step": 140549, "epoch": 3346} {"train_loss": -6.687009811401367, "global_step": 140550, "epoch": 3346} {"train_loss": -6.871288299560547, "global_step": 140551, "epoch": 3346} {"train_loss": -6.824959754943848, "global_step": 140552, "epoch": 3346} {"train_loss": -6.816319942474365, "global_step": 140553, "epoch": 3346} {"train_loss": -6.781006336212158, "global_step": 140554, "epoch": 3346} {"train_loss": -6.630749702453613, "global_step": 140555, "epoch": 3346} {"train_loss": -6.786055088043213, "global_step": 140556, "epoch": 3346} {"train_loss": -6.813571929931641, "global_step": 140557, "epoch": 3346} {"train_loss": -6.8656792640686035, "global_step": 140558, "epoch": 3346} {"train_loss": -6.729226112365723, "global_step": 140559, "epoch": 3346} {"train_loss": -6.805013656616211, "global_step": 140560, "epoch": 3346} {"train_loss": -6.815700531005859, "global_step": 140561, "epoch": 3346} {"train_loss": -6.828094482421875, "global_step": 140562, "epoch": 3346} {"train_loss": -6.773473739624023, "global_step": 140563, "epoch": 3346} {"train_loss": -6.799278259277344, "global_step": 140564, "epoch": 3346} {"train_loss": -6.782675743103027, "global_step": 140565, "epoch": 3346} {"train_loss": -6.689153671264648, "global_step": 140566, "epoch": 3346} {"train_loss": -6.723443508148193, "global_step": 140567, "epoch": 3346} {"train_loss": -6.6973981857299805, "global_step": 140568, "epoch": 3346} {"train_loss": -6.616384983062744, "global_step": 140569, "epoch": 3346} {"train_loss": -6.704212188720703, "global_step": 140570, "epoch": 3346} {"train_loss": -6.860450267791748, "global_step": 140571, "epoch": 3346} {"train_loss": -6.538473129272461, "global_step": 140572, "epoch": 3346} {"train_loss": -6.760732934588478, "global_step": 140573, "epoch": 3346, "val_loss": 67299.625} {"train_loss": -6.7243733406066895, "global_step": 140574, "epoch": 3347} {"train_loss": -6.735265254974365, "global_step": 140575, "epoch": 3347} {"train_loss": -6.718868255615234, "global_step": 140576, "epoch": 3347} {"train_loss": -6.675271511077881, "global_step": 140577, "epoch": 3347} {"train_loss": -6.710588455200195, "global_step": 140578, "epoch": 3347} {"train_loss": -6.697343826293945, "global_step": 140579, "epoch": 3347} {"train_loss": -6.812921524047852, "global_step": 140580, "epoch": 3347} {"train_loss": -6.805266380310059, "global_step": 140581, "epoch": 3347} {"train_loss": -6.8297576904296875, "global_step": 140582, "epoch": 3347} {"train_loss": -6.644858360290527, "global_step": 140583, "epoch": 3347} {"train_loss": -6.784976005554199, "global_step": 140584, "epoch": 3347} {"train_loss": -6.783175468444824, "global_step": 140585, "epoch": 3347} {"train_loss": -6.775153160095215, "global_step": 140586, "epoch": 3347} {"train_loss": -6.923323631286621, "global_step": 140587, "epoch": 3347} {"train_loss": -6.910632133483887, "global_step": 140588, "epoch": 3347} {"train_loss": -6.837160587310791, "global_step": 140589, "epoch": 3347} {"train_loss": -6.867921352386475, "global_step": 140590, "epoch": 3347} {"train_loss": -6.779515743255615, "global_step": 140591, "epoch": 3347} {"train_loss": -6.834583282470703, "global_step": 140592, "epoch": 3347} {"train_loss": -6.766779899597168, "global_step": 140593, "epoch": 3347} {"train_loss": -6.768130779266357, "global_step": 140594, "epoch": 3347} {"train_loss": -6.761236667633057, "global_step": 140595, "epoch": 3347} {"train_loss": -6.811366081237793, "global_step": 140596, "epoch": 3347} {"train_loss": -6.789844989776611, "global_step": 140597, "epoch": 3347} {"train_loss": -6.766684532165527, "global_step": 140598, "epoch": 3347} {"train_loss": -6.735387802124023, "global_step": 140599, "epoch": 3347} {"train_loss": -6.68794059753418, "global_step": 140600, "epoch": 3347} {"train_loss": -6.794787406921387, "global_step": 140601, "epoch": 3347} {"train_loss": -6.885970115661621, "global_step": 140602, "epoch": 3347} {"train_loss": -6.780539512634277, "global_step": 140603, "epoch": 3347} {"train_loss": -6.83500337600708, "global_step": 140604, "epoch": 3347} {"train_loss": -6.696253776550293, "global_step": 140605, "epoch": 3347} {"train_loss": -6.866979598999023, "global_step": 140606, "epoch": 3347} {"train_loss": -6.855960845947266, "global_step": 140607, "epoch": 3347} {"train_loss": -6.830044746398926, "global_step": 140608, "epoch": 3347} {"train_loss": -6.820954322814941, "global_step": 140609, "epoch": 3347} {"train_loss": -6.755866527557373, "global_step": 140610, "epoch": 3347} {"train_loss": -6.641321182250977, "global_step": 140611, "epoch": 3347} {"train_loss": -6.700441360473633, "global_step": 140612, "epoch": 3347} {"train_loss": -6.615778923034668, "global_step": 140613, "epoch": 3347} {"train_loss": -6.662714004516602, "global_step": 140614, "epoch": 3347} {"train_loss": -6.769404150190807, "global_step": 140615, "epoch": 3347, "val_loss": 67401.4140625} {"train_loss": -6.646492958068848, "global_step": 140616, "epoch": 3348} {"train_loss": -6.723947525024414, "global_step": 140617, "epoch": 3348} {"train_loss": -6.63021993637085, "global_step": 140618, "epoch": 3348} {"train_loss": -6.681738376617432, "global_step": 140619, "epoch": 3348} {"train_loss": -6.555872917175293, "global_step": 140620, "epoch": 3348} {"train_loss": -6.643467903137207, "global_step": 140621, "epoch": 3348} {"train_loss": -6.897274017333984, "global_step": 140622, "epoch": 3348} {"train_loss": -6.64299201965332, "global_step": 140623, "epoch": 3348} {"train_loss": -6.698644161224365, "global_step": 140624, "epoch": 3348} {"train_loss": -6.681460380554199, "global_step": 140625, "epoch": 3348} {"train_loss": -6.6578521728515625, "global_step": 140626, "epoch": 3348} {"train_loss": -6.805937767028809, "global_step": 140627, "epoch": 3348} {"train_loss": -6.6437482833862305, "global_step": 140628, "epoch": 3348} {"train_loss": -6.632962226867676, "global_step": 140629, "epoch": 3348} {"train_loss": -6.680540084838867, "global_step": 140630, "epoch": 3348} {"train_loss": -6.760101795196533, "global_step": 140631, "epoch": 3348} {"train_loss": -6.677790641784668, "global_step": 140632, "epoch": 3348} {"train_loss": -6.756011009216309, "global_step": 140633, "epoch": 3348} {"train_loss": -6.758914947509766, "global_step": 140634, "epoch": 3348} {"train_loss": -6.697146892547607, "global_step": 140635, "epoch": 3348} {"train_loss": -6.752650260925293, "global_step": 140636, "epoch": 3348} {"train_loss": -6.719217300415039, "global_step": 140637, "epoch": 3348} {"train_loss": -6.800032615661621, "global_step": 140638, "epoch": 3348} {"train_loss": -6.7259063720703125, "global_step": 140639, "epoch": 3348} {"train_loss": -6.708196640014648, "global_step": 140640, "epoch": 3348} {"train_loss": -6.845614433288574, "global_step": 140641, "epoch": 3348} {"train_loss": -6.741127967834473, "global_step": 140642, "epoch": 3348} {"train_loss": -6.79500150680542, "global_step": 140643, "epoch": 3348} {"train_loss": -6.858830451965332, "global_step": 140644, "epoch": 3348} {"train_loss": -6.807631015777588, "global_step": 140645, "epoch": 3348} {"train_loss": -6.8326215744018555, "global_step": 140646, "epoch": 3348} {"train_loss": -6.8188347816467285, "global_step": 140647, "epoch": 3348} {"train_loss": -6.696457862854004, "global_step": 140648, "epoch": 3348} {"train_loss": -6.8244853019714355, "global_step": 140649, "epoch": 3348} {"train_loss": -6.764575958251953, "global_step": 140650, "epoch": 3348} {"train_loss": -6.898171901702881, "global_step": 140651, "epoch": 3348} {"train_loss": -6.817609786987305, "global_step": 140652, "epoch": 3348} {"train_loss": -6.725747108459473, "global_step": 140653, "epoch": 3348} {"train_loss": -6.753905773162842, "global_step": 140654, "epoch": 3348} {"train_loss": -6.893017292022705, "global_step": 140655, "epoch": 3348} {"train_loss": -6.8145952224731445, "global_step": 140656, "epoch": 3348} {"train_loss": -6.7452855337233775, "global_step": 140657, "epoch": 3348, "val_loss": 67426.6953125} {"train_loss": -6.7514190673828125, "global_step": 140658, "epoch": 3349} {"train_loss": -6.737552642822266, "global_step": 140659, "epoch": 3349} {"train_loss": -6.813741683959961, "global_step": 140660, "epoch": 3349} {"train_loss": -6.812023639678955, "global_step": 140661, "epoch": 3349} {"train_loss": -6.7763671875, "global_step": 140662, "epoch": 3349} {"train_loss": -6.817286968231201, "global_step": 140663, "epoch": 3349} {"train_loss": -6.742795944213867, "global_step": 140664, "epoch": 3349} {"train_loss": -6.768887042999268, "global_step": 140665, "epoch": 3349} {"train_loss": -6.893943786621094, "global_step": 140666, "epoch": 3349} {"train_loss": -6.791075229644775, "global_step": 140667, "epoch": 3349} {"train_loss": -6.846210479736328, "global_step": 140668, "epoch": 3349} {"train_loss": -6.77541446685791, "global_step": 140669, "epoch": 3349} {"train_loss": -6.778042793273926, "global_step": 140670, "epoch": 3349} {"train_loss": -6.801340103149414, "global_step": 140671, "epoch": 3349} {"train_loss": -6.804379940032959, "global_step": 140672, "epoch": 3349} {"train_loss": -6.828701496124268, "global_step": 140673, "epoch": 3349} {"train_loss": -6.867589473724365, "global_step": 140674, "epoch": 3349} {"train_loss": -6.740156173706055, "global_step": 140675, "epoch": 3349} {"train_loss": -6.911582946777344, "global_step": 140676, "epoch": 3349} {"train_loss": -6.801658630371094, "global_step": 140677, "epoch": 3349} {"train_loss": -6.745486259460449, "global_step": 140678, "epoch": 3349} {"train_loss": -6.86677360534668, "global_step": 140679, "epoch": 3349} {"train_loss": -6.92634916305542, "global_step": 140680, "epoch": 3349} {"train_loss": -6.9273529052734375, "global_step": 140681, "epoch": 3349} {"train_loss": -6.857877254486084, "global_step": 140682, "epoch": 3349} {"train_loss": -6.769142150878906, "global_step": 140683, "epoch": 3349} {"train_loss": -6.928813457489014, "global_step": 140684, "epoch": 3349} {"train_loss": -6.801692962646484, "global_step": 140685, "epoch": 3349} {"train_loss": -6.815916061401367, "global_step": 140686, "epoch": 3349} {"train_loss": -6.736452579498291, "global_step": 140687, "epoch": 3349} {"train_loss": -6.703711032867432, "global_step": 140688, "epoch": 3349} {"train_loss": -6.840420722961426, "global_step": 140689, "epoch": 3349} {"train_loss": -6.698737621307373, "global_step": 140690, "epoch": 3349} {"train_loss": -6.625744819641113, "global_step": 140691, "epoch": 3349} {"train_loss": -6.6836981773376465, "global_step": 140692, "epoch": 3349} {"train_loss": -6.748169898986816, "global_step": 140693, "epoch": 3349} {"train_loss": -6.780285835266113, "global_step": 140694, "epoch": 3349} {"train_loss": -6.719006538391113, "global_step": 140695, "epoch": 3349} {"train_loss": -6.736039161682129, "global_step": 140696, "epoch": 3349} {"train_loss": -6.8103179931640625, "global_step": 140697, "epoch": 3349} {"train_loss": -6.7190093994140625, "global_step": 140698, "epoch": 3349} {"train_loss": -6.7923661186581565, "global_step": 140699, "epoch": 3349, "val_loss": 67359.4140625} {"train_loss": -6.695189476013184, "global_step": 140700, "epoch": 3350} {"train_loss": -6.788205146789551, "global_step": 140701, "epoch": 3350} {"train_loss": -6.851710796356201, "global_step": 140702, "epoch": 3350} {"train_loss": -6.8681488037109375, "global_step": 140703, "epoch": 3350} {"train_loss": -6.782955169677734, "global_step": 140704, "epoch": 3350} {"train_loss": -6.744692325592041, "global_step": 140705, "epoch": 3350} {"train_loss": -6.896206855773926, "global_step": 140706, "epoch": 3350} {"train_loss": -6.729633331298828, "global_step": 140707, "epoch": 3350} {"train_loss": -6.909322738647461, "global_step": 140708, "epoch": 3350} {"train_loss": -6.867176055908203, "global_step": 140709, "epoch": 3350} {"train_loss": -6.834812164306641, "global_step": 140710, "epoch": 3350} {"train_loss": -6.872644424438477, "global_step": 140711, "epoch": 3350} {"train_loss": -6.690545082092285, "global_step": 140712, "epoch": 3350} {"train_loss": -6.826363563537598, "global_step": 140713, "epoch": 3350} {"train_loss": -6.748030185699463, "global_step": 140714, "epoch": 3350} {"train_loss": -6.844213485717773, "global_step": 140715, "epoch": 3350} {"train_loss": -6.861789703369141, "global_step": 140716, "epoch": 3350} {"train_loss": -6.720767498016357, "global_step": 140717, "epoch": 3350} {"train_loss": -6.788302421569824, "global_step": 140718, "epoch": 3350} {"train_loss": -6.8010149002075195, "global_step": 140719, "epoch": 3350} {"train_loss": -6.763855934143066, "global_step": 140720, "epoch": 3350} {"train_loss": -6.818737030029297, "global_step": 140721, "epoch": 3350} {"train_loss": -6.875019073486328, "global_step": 140722, "epoch": 3350} {"train_loss": -6.798925399780273, "global_step": 140723, "epoch": 3350} {"train_loss": -6.884003639221191, "global_step": 140724, "epoch": 3350} {"train_loss": -6.894340515136719, "global_step": 140725, "epoch": 3350} {"train_loss": -6.735428810119629, "global_step": 140726, "epoch": 3350} {"train_loss": -6.718865394592285, "global_step": 140727, "epoch": 3350} {"train_loss": -6.913317680358887, "global_step": 140728, "epoch": 3350} {"train_loss": -6.76565408706665, "global_step": 140729, "epoch": 3350} {"train_loss": -6.847975730895996, "global_step": 140730, "epoch": 3350} {"train_loss": -6.726902961730957, "global_step": 140731, "epoch": 3350} {"train_loss": -6.807353973388672, "global_step": 140732, "epoch": 3350} {"train_loss": -6.800197601318359, "global_step": 140733, "epoch": 3350} {"train_loss": -6.868878364562988, "global_step": 140734, "epoch": 3350} {"train_loss": -6.740108013153076, "global_step": 140735, "epoch": 3350} {"train_loss": -6.810473442077637, "global_step": 140736, "epoch": 3350} {"train_loss": -6.676829814910889, "global_step": 140737, "epoch": 3350} {"train_loss": -6.776525020599365, "global_step": 140738, "epoch": 3350} {"train_loss": -6.7107930183410645, "global_step": 140739, "epoch": 3350} {"train_loss": -6.586513042449951, "global_step": 140740, "epoch": 3350} {"train_loss": -6.793685334069388, "global_step": 140741, "epoch": 3350, "train/sim_max_reward_0": 0.19653104271964006, "train/sim_max_reward_1": 0.9027575255292791, "train/sim_max_reward_2": 0.5538884873393792, "train/sim_max_reward_3": 0.9169206138204002, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8809363426965899, "test/sim_max_reward_4300001": 0.5388399466060297, "test/sim_max_reward_4300002": 0.9616192046991322, "test/sim_max_reward_4300003": 0.9551491660975736, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.945451092823847, "test/sim_max_reward_4300006": 0.18398269656782815, "test/sim_max_reward_4300007": 0.6333588726685976, "test/sim_max_reward_4300008": 0.907021352484582, "test/sim_max_reward_4300009": 0.9363581378147795, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.8452444406226174, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.4131923796587315, "test/sim_max_reward_4300014": 0.9708196250696512, "test/sim_max_reward_4300015": 0.9036800616012829, "test/sim_max_reward_4300016": 0.9883353719004324, "test/sim_max_reward_4300017": 0.8404259654103003, "test/sim_max_reward_4300018": 0.4410148345547883, "test/sim_max_reward_4300019": 0.1859217859750007, "test/sim_max_reward_4300020": 0.009067358971496738, "test/sim_max_reward_4300021": 0.8533106785743426, "test/sim_max_reward_4300022": 0.9756066454352871, "test/sim_max_reward_4300023": 0.32745282633984646, "test/sim_max_reward_4300024": 0.9538769255218821, "test/sim_max_reward_4300025": 0.8748377717865636, "test/sim_max_reward_4300026": 0.20913913314089674, "test/sim_max_reward_4300027": 0.8722088087326479, "test/sim_max_reward_4300028": 0.6459705545855001, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.8539840600340878, "test/sim_max_reward_4300031": 1.0, "test/sim_max_reward_4300032": 0.783627036421766, "test/sim_max_reward_4300033": 0.7203177850556349, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.7148924048734582, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8849021316322879, "test/sim_max_reward_4300038": 0.902611495699259, "test/sim_max_reward_4300039": 0.4008248691551327, "test/sim_max_reward_4300040": 0.8890828966009795, "test/sim_max_reward_4300041": 0.7255107764253155, "test/sim_max_reward_4300042": 0.7149524329057179, "test/sim_max_reward_4300043": 0.1451573386979742, "test/sim_max_reward_4300044": 0.7830852709490127, "test/sim_max_reward_4300045": 0.8336769497519908, "test/sim_max_reward_4300046": 0.9996285052443262, "test/sim_max_reward_4300047": 0.23030084221322353, "test/sim_max_reward_4300048": 0.789362022951391, "test/sim_max_reward_4300049": 0.2072747403541274, "train/mean_score": 0.6271804047951477, "test/mean_score": 0.6409408351935736, "val_loss": 67348.796875} {"train_loss": -6.706568717956543, "global_step": 140742, "epoch": 3351} {"train_loss": -6.791255950927734, "global_step": 140743, "epoch": 3351} {"train_loss": -6.780754089355469, "global_step": 140744, "epoch": 3351} {"train_loss": -6.7085771560668945, "global_step": 140745, "epoch": 3351} {"train_loss": -6.649416923522949, "global_step": 140746, "epoch": 3351} {"train_loss": -6.703261375427246, "global_step": 140747, "epoch": 3351} {"train_loss": -6.850379943847656, "global_step": 140748, "epoch": 3351} {"train_loss": -6.56467342376709, "global_step": 140749, "epoch": 3351} {"train_loss": -6.679109573364258, "global_step": 140750, "epoch": 3351} {"train_loss": -6.7090654373168945, "global_step": 140751, "epoch": 3351} {"train_loss": -6.669190406799316, "global_step": 140752, "epoch": 3351} {"train_loss": -6.751011848449707, "global_step": 140753, "epoch": 3351} {"train_loss": -6.637998104095459, "global_step": 140754, "epoch": 3351} {"train_loss": -6.724763870239258, "global_step": 140755, "epoch": 3351} {"train_loss": -6.739803791046143, "global_step": 140756, "epoch": 3351} {"train_loss": -6.799256324768066, "global_step": 140757, "epoch": 3351} {"train_loss": -6.733307361602783, "global_step": 140758, "epoch": 3351} {"train_loss": -6.645570278167725, "global_step": 140759, "epoch": 3351} {"train_loss": -6.684450149536133, "global_step": 140760, "epoch": 3351} {"train_loss": -6.706973075866699, "global_step": 140761, "epoch": 3351} {"train_loss": -6.731782913208008, "global_step": 140762, "epoch": 3351} {"train_loss": -6.821217060089111, "global_step": 140763, "epoch": 3351} {"train_loss": -6.791276931762695, "global_step": 140764, "epoch": 3351} {"train_loss": -6.755429744720459, "global_step": 140765, "epoch": 3351} {"train_loss": -6.746654987335205, "global_step": 140766, "epoch": 3351} {"train_loss": -6.75211763381958, "global_step": 140767, "epoch": 3351} {"train_loss": -6.822470664978027, "global_step": 140768, "epoch": 3351} {"train_loss": -6.812286376953125, "global_step": 140769, "epoch": 3351} {"train_loss": -6.887814521789551, "global_step": 140770, "epoch": 3351} {"train_loss": -6.795505046844482, "global_step": 140771, "epoch": 3351} {"train_loss": -6.8144450187683105, "global_step": 140772, "epoch": 3351} {"train_loss": -6.692683219909668, "global_step": 140773, "epoch": 3351} {"train_loss": -6.846296310424805, "global_step": 140774, "epoch": 3351} {"train_loss": -6.813050270080566, "global_step": 140775, "epoch": 3351} {"train_loss": -6.800960540771484, "global_step": 140776, "epoch": 3351} {"train_loss": -6.779654502868652, "global_step": 140777, "epoch": 3351} {"train_loss": -6.720247745513916, "global_step": 140778, "epoch": 3351} {"train_loss": -6.785191535949707, "global_step": 140779, "epoch": 3351} {"train_loss": -6.730818748474121, "global_step": 140780, "epoch": 3351} {"train_loss": -6.791197776794434, "global_step": 140781, "epoch": 3351} {"train_loss": -6.804836273193359, "global_step": 140782, "epoch": 3351} {"train_loss": -6.746825615564982, "global_step": 140783, "epoch": 3351, "val_loss": 67299.5859375} {"train_loss": -6.777286529541016, "global_step": 140784, "epoch": 3352} {"train_loss": -6.857687950134277, "global_step": 140785, "epoch": 3352} {"train_loss": -6.620600700378418, "global_step": 140786, "epoch": 3352} {"train_loss": -6.723894119262695, "global_step": 140787, "epoch": 3352} {"train_loss": -6.77957820892334, "global_step": 140788, "epoch": 3352} {"train_loss": -6.678689002990723, "global_step": 140789, "epoch": 3352} {"train_loss": -6.759159088134766, "global_step": 140790, "epoch": 3352} {"train_loss": -6.82777214050293, "global_step": 140791, "epoch": 3352} {"train_loss": -6.713596343994141, "global_step": 140792, "epoch": 3352} {"train_loss": -6.741482734680176, "global_step": 140793, "epoch": 3352} {"train_loss": -6.730072975158691, "global_step": 140794, "epoch": 3352} {"train_loss": -6.843634605407715, "global_step": 140795, "epoch": 3352} {"train_loss": -6.798254013061523, "global_step": 140796, "epoch": 3352} {"train_loss": -6.866191864013672, "global_step": 140797, "epoch": 3352} {"train_loss": -6.675090312957764, "global_step": 140798, "epoch": 3352} {"train_loss": -6.7965497970581055, "global_step": 140799, "epoch": 3352} {"train_loss": -6.78951358795166, "global_step": 140800, "epoch": 3352} {"train_loss": -6.722513198852539, "global_step": 140801, "epoch": 3352} {"train_loss": -6.689568519592285, "global_step": 140802, "epoch": 3352} {"train_loss": -6.783116340637207, "global_step": 140803, "epoch": 3352} {"train_loss": -6.7545976638793945, "global_step": 140804, "epoch": 3352} {"train_loss": -6.812309741973877, "global_step": 140805, "epoch": 3352} {"train_loss": -6.77411413192749, "global_step": 140806, "epoch": 3352} {"train_loss": -6.752243995666504, "global_step": 140807, "epoch": 3352} {"train_loss": -6.807514190673828, "global_step": 140808, "epoch": 3352} {"train_loss": -6.675559997558594, "global_step": 140809, "epoch": 3352} {"train_loss": -6.763182640075684, "global_step": 140810, "epoch": 3352} {"train_loss": -6.68575382232666, "global_step": 140811, "epoch": 3352} {"train_loss": -6.929866790771484, "global_step": 140812, "epoch": 3352} {"train_loss": -6.781254768371582, "global_step": 140813, "epoch": 3352} {"train_loss": -6.764123916625977, "global_step": 140814, "epoch": 3352} {"train_loss": -6.7770843505859375, "global_step": 140815, "epoch": 3352} {"train_loss": -6.815265655517578, "global_step": 140816, "epoch": 3352} {"train_loss": -6.781181335449219, "global_step": 140817, "epoch": 3352} {"train_loss": -6.754624843597412, "global_step": 140818, "epoch": 3352} {"train_loss": -6.758073329925537, "global_step": 140819, "epoch": 3352} {"train_loss": -6.866290092468262, "global_step": 140820, "epoch": 3352} {"train_loss": -6.824220180511475, "global_step": 140821, "epoch": 3352} {"train_loss": -6.637592315673828, "global_step": 140822, "epoch": 3352} {"train_loss": -6.8887529373168945, "global_step": 140823, "epoch": 3352} {"train_loss": -6.75340461730957, "global_step": 140824, "epoch": 3352} {"train_loss": -6.7669616880871, "global_step": 140825, "epoch": 3352, "val_loss": 67461.9609375} {"train_loss": -6.649990081787109, "global_step": 140826, "epoch": 3353} {"train_loss": -6.816414833068848, "global_step": 140827, "epoch": 3353} {"train_loss": -6.637887477874756, "global_step": 140828, "epoch": 3353} {"train_loss": -6.731595516204834, "global_step": 140829, "epoch": 3353} {"train_loss": -6.818902015686035, "global_step": 140830, "epoch": 3353} {"train_loss": -6.804644584655762, "global_step": 140831, "epoch": 3353} {"train_loss": -6.866621971130371, "global_step": 140832, "epoch": 3353} {"train_loss": -6.782371520996094, "global_step": 140833, "epoch": 3353} {"train_loss": -6.855740547180176, "global_step": 140834, "epoch": 3353} {"train_loss": -6.883073806762695, "global_step": 140835, "epoch": 3353} {"train_loss": -6.683223247528076, "global_step": 140836, "epoch": 3353} {"train_loss": -6.798498630523682, "global_step": 140837, "epoch": 3353} {"train_loss": -6.806044578552246, "global_step": 140838, "epoch": 3353} {"train_loss": -6.66780948638916, "global_step": 140839, "epoch": 3353} {"train_loss": -6.733297348022461, "global_step": 140840, "epoch": 3353} {"train_loss": -6.794460773468018, "global_step": 140841, "epoch": 3353} {"train_loss": -6.813138008117676, "global_step": 140842, "epoch": 3353} {"train_loss": -6.82766056060791, "global_step": 140843, "epoch": 3353} {"train_loss": -6.795835494995117, "global_step": 140844, "epoch": 3353} {"train_loss": -6.789961338043213, "global_step": 140845, "epoch": 3353} {"train_loss": -6.729262828826904, "global_step": 140846, "epoch": 3353} {"train_loss": -6.764636516571045, "global_step": 140847, "epoch": 3353} {"train_loss": -6.757547855377197, "global_step": 140848, "epoch": 3353} {"train_loss": -6.839731693267822, "global_step": 140849, "epoch": 3353} {"train_loss": -6.634031772613525, "global_step": 140850, "epoch": 3353} {"train_loss": -6.730123043060303, "global_step": 140851, "epoch": 3353} {"train_loss": -6.805758953094482, "global_step": 140852, "epoch": 3353} {"train_loss": -6.7858991622924805, "global_step": 140853, "epoch": 3353} {"train_loss": -6.769287586212158, "global_step": 140854, "epoch": 3353} {"train_loss": -6.8519721031188965, "global_step": 140855, "epoch": 3353} {"train_loss": -6.721025466918945, "global_step": 140856, "epoch": 3353} {"train_loss": -6.729165554046631, "global_step": 140857, "epoch": 3353} {"train_loss": -6.703547954559326, "global_step": 140858, "epoch": 3353} {"train_loss": -6.754613399505615, "global_step": 140859, "epoch": 3353} {"train_loss": -6.780600547790527, "global_step": 140860, "epoch": 3353} {"train_loss": -6.725168704986572, "global_step": 140861, "epoch": 3353} {"train_loss": -6.6668596267700195, "global_step": 140862, "epoch": 3353} {"train_loss": -6.792478084564209, "global_step": 140863, "epoch": 3353} {"train_loss": -6.698611259460449, "global_step": 140864, "epoch": 3353} {"train_loss": -6.72076940536499, "global_step": 140865, "epoch": 3353} {"train_loss": -6.808162689208984, "global_step": 140866, "epoch": 3353} {"train_loss": -6.762747968946185, "global_step": 140867, "epoch": 3353, "val_loss": 67389.1796875} {"train_loss": -6.781148910522461, "global_step": 140868, "epoch": 3354} {"train_loss": -6.704258441925049, "global_step": 140869, "epoch": 3354} {"train_loss": -6.676324844360352, "global_step": 140870, "epoch": 3354} {"train_loss": -6.714875221252441, "global_step": 140871, "epoch": 3354} {"train_loss": -6.633199691772461, "global_step": 140872, "epoch": 3354} {"train_loss": -6.616103172302246, "global_step": 140873, "epoch": 3354} {"train_loss": -6.790741920471191, "global_step": 140874, "epoch": 3354} {"train_loss": -6.58328914642334, "global_step": 140875, "epoch": 3354} {"train_loss": -6.768245697021484, "global_step": 140876, "epoch": 3354} {"train_loss": -6.637372970581055, "global_step": 140877, "epoch": 3354} {"train_loss": -6.764622688293457, "global_step": 140878, "epoch": 3354} {"train_loss": -6.592663764953613, "global_step": 140879, "epoch": 3354} {"train_loss": -6.634034633636475, "global_step": 140880, "epoch": 3354} {"train_loss": -6.694886207580566, "global_step": 140881, "epoch": 3354} {"train_loss": -6.739986419677734, "global_step": 140882, "epoch": 3354} {"train_loss": -6.606524467468262, "global_step": 140883, "epoch": 3354} {"train_loss": -6.715109348297119, "global_step": 140884, "epoch": 3354} {"train_loss": -6.7797722816467285, "global_step": 140885, "epoch": 3354} {"train_loss": -6.560661315917969, "global_step": 140886, "epoch": 3354} {"train_loss": -6.706696510314941, "global_step": 140887, "epoch": 3354} {"train_loss": -6.718165397644043, "global_step": 140888, "epoch": 3354} {"train_loss": -6.652067184448242, "global_step": 140889, "epoch": 3354} {"train_loss": -6.741201400756836, "global_step": 140890, "epoch": 3354} {"train_loss": -6.697169780731201, "global_step": 140891, "epoch": 3354} {"train_loss": -6.719534873962402, "global_step": 140892, "epoch": 3354} {"train_loss": -6.669924736022949, "global_step": 140893, "epoch": 3354} {"train_loss": -6.7608537673950195, "global_step": 140894, "epoch": 3354} {"train_loss": -6.888009071350098, "global_step": 140895, "epoch": 3354} {"train_loss": -6.875436782836914, "global_step": 140896, "epoch": 3354} {"train_loss": -6.71265983581543, "global_step": 140897, "epoch": 3354} {"train_loss": -6.766167163848877, "global_step": 140898, "epoch": 3354} {"train_loss": -6.76725435256958, "global_step": 140899, "epoch": 3354} {"train_loss": -6.717288494110107, "global_step": 140900, "epoch": 3354} {"train_loss": -6.813790321350098, "global_step": 140901, "epoch": 3354} {"train_loss": -6.845233917236328, "global_step": 140902, "epoch": 3354} {"train_loss": -6.8134613037109375, "global_step": 140903, "epoch": 3354} {"train_loss": -6.742806434631348, "global_step": 140904, "epoch": 3354} {"train_loss": -6.746070861816406, "global_step": 140905, "epoch": 3354} {"train_loss": -6.811643600463867, "global_step": 140906, "epoch": 3354} {"train_loss": -6.812159061431885, "global_step": 140907, "epoch": 3354} {"train_loss": -6.778105735778809, "global_step": 140908, "epoch": 3354} {"train_loss": -6.72763188680013, "global_step": 140909, "epoch": 3354, "val_loss": 67295.3671875} {"train_loss": -6.856250762939453, "global_step": 140910, "epoch": 3355} {"train_loss": -6.804279327392578, "global_step": 140911, "epoch": 3355} {"train_loss": -6.852664947509766, "global_step": 140912, "epoch": 3355} {"train_loss": -6.817116737365723, "global_step": 140913, "epoch": 3355} {"train_loss": -6.8427534103393555, "global_step": 140914, "epoch": 3355} {"train_loss": -6.822123050689697, "global_step": 140915, "epoch": 3355} {"train_loss": -6.800727844238281, "global_step": 140916, "epoch": 3355} {"train_loss": -6.8043670654296875, "global_step": 140917, "epoch": 3355} {"train_loss": -6.925342559814453, "global_step": 140918, "epoch": 3355} {"train_loss": -6.9044599533081055, "global_step": 140919, "epoch": 3355} {"train_loss": -6.821314811706543, "global_step": 140920, "epoch": 3355} {"train_loss": -6.878310203552246, "global_step": 140921, "epoch": 3355} {"train_loss": -6.802435874938965, "global_step": 140922, "epoch": 3355} {"train_loss": -6.796109676361084, "global_step": 140923, "epoch": 3355} {"train_loss": -6.836401462554932, "global_step": 140924, "epoch": 3355} {"train_loss": -6.8281168937683105, "global_step": 140925, "epoch": 3355} {"train_loss": -6.822861671447754, "global_step": 140926, "epoch": 3355} {"train_loss": -6.780350685119629, "global_step": 140927, "epoch": 3355} {"train_loss": -6.841408729553223, "global_step": 140928, "epoch": 3355} {"train_loss": -6.757790565490723, "global_step": 140929, "epoch": 3355} {"train_loss": -6.7856669425964355, "global_step": 140930, "epoch": 3355} {"train_loss": -6.780552864074707, "global_step": 140931, "epoch": 3355} {"train_loss": -6.887759208679199, "global_step": 140932, "epoch": 3355} {"train_loss": -6.733151435852051, "global_step": 140933, "epoch": 3355} {"train_loss": -6.725101470947266, "global_step": 140934, "epoch": 3355} {"train_loss": -6.844560146331787, "global_step": 140935, "epoch": 3355} {"train_loss": -6.706602096557617, "global_step": 140936, "epoch": 3355} {"train_loss": -6.7739481925964355, "global_step": 140937, "epoch": 3355} {"train_loss": -6.763786792755127, "global_step": 140938, "epoch": 3355} {"train_loss": -6.7657880783081055, "global_step": 140939, "epoch": 3355} {"train_loss": -6.846732139587402, "global_step": 140940, "epoch": 3355} {"train_loss": -6.927130699157715, "global_step": 140941, "epoch": 3355} {"train_loss": -6.815394401550293, "global_step": 140942, "epoch": 3355} {"train_loss": -6.73250675201416, "global_step": 140943, "epoch": 3355} {"train_loss": -6.863264083862305, "global_step": 140944, "epoch": 3355} {"train_loss": -6.875972747802734, "global_step": 140945, "epoch": 3355} {"train_loss": -6.787461280822754, "global_step": 140946, "epoch": 3355} {"train_loss": -6.767967224121094, "global_step": 140947, "epoch": 3355} {"train_loss": -6.806446075439453, "global_step": 140948, "epoch": 3355} {"train_loss": -6.76116418838501, "global_step": 140949, "epoch": 3355} {"train_loss": -6.777753829956055, "global_step": 140950, "epoch": 3355} {"train_loss": -6.813031628018334, "global_step": 140951, "epoch": 3355, "val_loss": 67293.1484375} {"train_loss": -6.839208126068115, "global_step": 140952, "epoch": 3356} {"train_loss": -6.716089248657227, "global_step": 140953, "epoch": 3356} {"train_loss": -6.7030792236328125, "global_step": 140954, "epoch": 3356} {"train_loss": -6.734111309051514, "global_step": 140955, "epoch": 3356} {"train_loss": -6.93440055847168, "global_step": 140956, "epoch": 3356} {"train_loss": -6.694695472717285, "global_step": 140957, "epoch": 3356} {"train_loss": -6.836492538452148, "global_step": 140958, "epoch": 3356} {"train_loss": -6.787750244140625, "global_step": 140959, "epoch": 3356} {"train_loss": -6.606966972351074, "global_step": 140960, "epoch": 3356} {"train_loss": -6.7725911140441895, "global_step": 140961, "epoch": 3356} {"train_loss": -6.611878395080566, "global_step": 140962, "epoch": 3356} {"train_loss": -6.777809143066406, "global_step": 140963, "epoch": 3356} {"train_loss": -6.781999588012695, "global_step": 140964, "epoch": 3356} {"train_loss": -6.724438190460205, "global_step": 140965, "epoch": 3356} {"train_loss": -6.912294864654541, "global_step": 140966, "epoch": 3356} {"train_loss": -6.664506435394287, "global_step": 140967, "epoch": 3356} {"train_loss": -6.660826683044434, "global_step": 140968, "epoch": 3356} {"train_loss": -6.690182685852051, "global_step": 140969, "epoch": 3356} {"train_loss": -6.834352016448975, "global_step": 140970, "epoch": 3356} {"train_loss": -6.710017204284668, "global_step": 140971, "epoch": 3356} {"train_loss": -6.701167583465576, "global_step": 140972, "epoch": 3356} {"train_loss": -6.7910003662109375, "global_step": 140973, "epoch": 3356} {"train_loss": -6.807275772094727, "global_step": 140974, "epoch": 3356} {"train_loss": -6.735564231872559, "global_step": 140975, "epoch": 3356} {"train_loss": -6.699861526489258, "global_step": 140976, "epoch": 3356} {"train_loss": -6.699663162231445, "global_step": 140977, "epoch": 3356} {"train_loss": -6.7557878494262695, "global_step": 140978, "epoch": 3356} {"train_loss": -6.700387477874756, "global_step": 140979, "epoch": 3356} {"train_loss": -6.7496232986450195, "global_step": 140980, "epoch": 3356} {"train_loss": -6.692987442016602, "global_step": 140981, "epoch": 3356} {"train_loss": -6.729155540466309, "global_step": 140982, "epoch": 3356} {"train_loss": -6.791269302368164, "global_step": 140983, "epoch": 3356} {"train_loss": -6.688464164733887, "global_step": 140984, "epoch": 3356} {"train_loss": -6.784511566162109, "global_step": 140985, "epoch": 3356} {"train_loss": -6.850421905517578, "global_step": 140986, "epoch": 3356} {"train_loss": -6.63712215423584, "global_step": 140987, "epoch": 3356} {"train_loss": -6.709752559661865, "global_step": 140988, "epoch": 3356} {"train_loss": -6.790925979614258, "global_step": 140989, "epoch": 3356} {"train_loss": -6.627664566040039, "global_step": 140990, "epoch": 3356} {"train_loss": -6.782347679138184, "global_step": 140991, "epoch": 3356} {"train_loss": -6.679025650024414, "global_step": 140992, "epoch": 3356} {"train_loss": -6.739277113051641, "global_step": 140993, "epoch": 3356, "val_loss": 67633.6875} {"train_loss": -6.651630878448486, "global_step": 140994, "epoch": 3357} {"train_loss": -6.6612067222595215, "global_step": 140995, "epoch": 3357} {"train_loss": -6.844338417053223, "global_step": 140996, "epoch": 3357} {"train_loss": -6.785946369171143, "global_step": 140997, "epoch": 3357} {"train_loss": -6.693663597106934, "global_step": 140998, "epoch": 3357} {"train_loss": -6.838584899902344, "global_step": 140999, "epoch": 3357} {"train_loss": -6.820652484893799, "global_step": 141000, "epoch": 3357} {"train_loss": -6.768692493438721, "global_step": 141001, "epoch": 3357} {"train_loss": -6.7245306968688965, "global_step": 141002, "epoch": 3357} {"train_loss": -6.878273010253906, "global_step": 141003, "epoch": 3357} {"train_loss": -6.794690132141113, "global_step": 141004, "epoch": 3357} {"train_loss": -6.797603607177734, "global_step": 141005, "epoch": 3357} {"train_loss": -6.714365005493164, "global_step": 141006, "epoch": 3357} {"train_loss": -6.870698928833008, "global_step": 141007, "epoch": 3357} {"train_loss": -6.769401550292969, "global_step": 141008, "epoch": 3357} {"train_loss": -6.782456398010254, "global_step": 141009, "epoch": 3357} {"train_loss": -6.873049736022949, "global_step": 141010, "epoch": 3357} {"train_loss": -6.65919828414917, "global_step": 141011, "epoch": 3357} {"train_loss": -6.86918306350708, "global_step": 141012, "epoch": 3357} {"train_loss": -6.727109909057617, "global_step": 141013, "epoch": 3357} {"train_loss": -6.745821475982666, "global_step": 141014, "epoch": 3357} {"train_loss": -6.696462631225586, "global_step": 141015, "epoch": 3357} {"train_loss": -6.800322532653809, "global_step": 141016, "epoch": 3357} {"train_loss": -6.725939750671387, "global_step": 141017, "epoch": 3357} {"train_loss": -6.899396896362305, "global_step": 141018, "epoch": 3357} {"train_loss": -6.814819812774658, "global_step": 141019, "epoch": 3357} {"train_loss": -6.729214191436768, "global_step": 141020, "epoch": 3357} {"train_loss": -6.767209053039551, "global_step": 141021, "epoch": 3357} {"train_loss": -6.7908782958984375, "global_step": 141022, "epoch": 3357} {"train_loss": -6.78315544128418, "global_step": 141023, "epoch": 3357} {"train_loss": -6.75803279876709, "global_step": 141024, "epoch": 3357} {"train_loss": -6.7474188804626465, "global_step": 141025, "epoch": 3357} {"train_loss": -6.849466800689697, "global_step": 141026, "epoch": 3357} {"train_loss": -6.757366180419922, "global_step": 141027, "epoch": 3357} {"train_loss": -6.786574840545654, "global_step": 141028, "epoch": 3357} {"train_loss": -6.753381729125977, "global_step": 141029, "epoch": 3357} {"train_loss": -6.721077919006348, "global_step": 141030, "epoch": 3357} {"train_loss": -6.69395637512207, "global_step": 141031, "epoch": 3357} {"train_loss": -6.817806243896484, "global_step": 141032, "epoch": 3357} {"train_loss": -6.774759292602539, "global_step": 141033, "epoch": 3357} {"train_loss": -6.89875602722168, "global_step": 141034, "epoch": 3357} {"train_loss": -6.774772155852545, "global_step": 141035, "epoch": 3357, "val_loss": 67516.4140625} {"train_loss": -6.763574123382568, "global_step": 141036, "epoch": 3358} {"train_loss": -6.892407417297363, "global_step": 141037, "epoch": 3358} {"train_loss": -6.814861297607422, "global_step": 141038, "epoch": 3358} {"train_loss": -6.848243713378906, "global_step": 141039, "epoch": 3358} {"train_loss": -6.863486289978027, "global_step": 141040, "epoch": 3358} {"train_loss": -6.808477878570557, "global_step": 141041, "epoch": 3358} {"train_loss": -6.791782855987549, "global_step": 141042, "epoch": 3358} {"train_loss": -6.746820449829102, "global_step": 141043, "epoch": 3358} {"train_loss": -6.69783878326416, "global_step": 141044, "epoch": 3358} {"train_loss": -6.789616107940674, "global_step": 141045, "epoch": 3358} {"train_loss": -6.7353925704956055, "global_step": 141046, "epoch": 3358} {"train_loss": -6.632711410522461, "global_step": 141047, "epoch": 3358} {"train_loss": -6.699191570281982, "global_step": 141048, "epoch": 3358} {"train_loss": -6.792823314666748, "global_step": 141049, "epoch": 3358} {"train_loss": -6.720175743103027, "global_step": 141050, "epoch": 3358} {"train_loss": -6.7231574058532715, "global_step": 141051, "epoch": 3358} {"train_loss": -6.908825874328613, "global_step": 141052, "epoch": 3358} {"train_loss": -6.677495002746582, "global_step": 141053, "epoch": 3358} {"train_loss": -6.812507152557373, "global_step": 141054, "epoch": 3358} {"train_loss": -6.757742881774902, "global_step": 141055, "epoch": 3358} {"train_loss": -6.879594326019287, "global_step": 141056, "epoch": 3358} {"train_loss": -6.771341323852539, "global_step": 141057, "epoch": 3358} {"train_loss": -6.711389541625977, "global_step": 141058, "epoch": 3358} {"train_loss": -6.7105183601379395, "global_step": 141059, "epoch": 3358} {"train_loss": -6.862266540527344, "global_step": 141060, "epoch": 3358} {"train_loss": -6.760317802429199, "global_step": 141061, "epoch": 3358} {"train_loss": -6.80264139175415, "global_step": 141062, "epoch": 3358} {"train_loss": -6.768953323364258, "global_step": 141063, "epoch": 3358} {"train_loss": -6.737250328063965, "global_step": 141064, "epoch": 3358} {"train_loss": -6.776117324829102, "global_step": 141065, "epoch": 3358} {"train_loss": -6.684686660766602, "global_step": 141066, "epoch": 3358} {"train_loss": -6.806303024291992, "global_step": 141067, "epoch": 3358} {"train_loss": -6.661324501037598, "global_step": 141068, "epoch": 3358} {"train_loss": -6.794093608856201, "global_step": 141069, "epoch": 3358} {"train_loss": -6.666042327880859, "global_step": 141070, "epoch": 3358} {"train_loss": -6.744760036468506, "global_step": 141071, "epoch": 3358} {"train_loss": -6.772976875305176, "global_step": 141072, "epoch": 3358} {"train_loss": -6.660310745239258, "global_step": 141073, "epoch": 3358} {"train_loss": -6.672781944274902, "global_step": 141074, "epoch": 3358} {"train_loss": -6.70744514465332, "global_step": 141075, "epoch": 3358} {"train_loss": -6.791871070861816, "global_step": 141076, "epoch": 3358} {"train_loss": -6.762949625651042, "global_step": 141077, "epoch": 3358, "val_loss": 67297.5546875} {"train_loss": -6.735837459564209, "global_step": 141078, "epoch": 3359} {"train_loss": -6.806399345397949, "global_step": 141079, "epoch": 3359} {"train_loss": -6.7344231605529785, "global_step": 141080, "epoch": 3359} {"train_loss": -6.808897972106934, "global_step": 141081, "epoch": 3359} {"train_loss": -6.817987442016602, "global_step": 141082, "epoch": 3359} {"train_loss": -6.77927303314209, "global_step": 141083, "epoch": 3359} {"train_loss": -6.720044136047363, "global_step": 141084, "epoch": 3359} {"train_loss": -6.771414756774902, "global_step": 141085, "epoch": 3359} {"train_loss": -6.89421272277832, "global_step": 141086, "epoch": 3359} {"train_loss": -6.8178486824035645, "global_step": 141087, "epoch": 3359} {"train_loss": -6.6667160987854, "global_step": 141088, "epoch": 3359} {"train_loss": -6.690544128417969, "global_step": 141089, "epoch": 3359} {"train_loss": -6.657405853271484, "global_step": 141090, "epoch": 3359} {"train_loss": -6.778558731079102, "global_step": 141091, "epoch": 3359} {"train_loss": -6.73870849609375, "global_step": 141092, "epoch": 3359} {"train_loss": -6.818660259246826, "global_step": 141093, "epoch": 3359} {"train_loss": -6.864307403564453, "global_step": 141094, "epoch": 3359} {"train_loss": -6.809347152709961, "global_step": 141095, "epoch": 3359} {"train_loss": -6.779007434844971, "global_step": 141096, "epoch": 3359} {"train_loss": -6.843626022338867, "global_step": 141097, "epoch": 3359} {"train_loss": -6.840728759765625, "global_step": 141098, "epoch": 3359} {"train_loss": -6.905412673950195, "global_step": 141099, "epoch": 3359} {"train_loss": -6.7723870277404785, "global_step": 141100, "epoch": 3359} {"train_loss": -6.844782829284668, "global_step": 141101, "epoch": 3359} {"train_loss": -6.767810821533203, "global_step": 141102, "epoch": 3359} {"train_loss": -6.891395568847656, "global_step": 141103, "epoch": 3359} {"train_loss": -6.792200088500977, "global_step": 141104, "epoch": 3359} {"train_loss": -6.589724540710449, "global_step": 141105, "epoch": 3359} {"train_loss": -6.6811370849609375, "global_step": 141106, "epoch": 3359} {"train_loss": -6.691078186035156, "global_step": 141107, "epoch": 3359} {"train_loss": -6.598739147186279, "global_step": 141108, "epoch": 3359} {"train_loss": -6.682840347290039, "global_step": 141109, "epoch": 3359} {"train_loss": -6.679534912109375, "global_step": 141110, "epoch": 3359} {"train_loss": -6.742244243621826, "global_step": 141111, "epoch": 3359} {"train_loss": -6.586172103881836, "global_step": 141112, "epoch": 3359} {"train_loss": -6.767234802246094, "global_step": 141113, "epoch": 3359} {"train_loss": -6.857619285583496, "global_step": 141114, "epoch": 3359} {"train_loss": -6.698276519775391, "global_step": 141115, "epoch": 3359} {"train_loss": -6.713490962982178, "global_step": 141116, "epoch": 3359} {"train_loss": -6.8486785888671875, "global_step": 141117, "epoch": 3359} {"train_loss": -6.71406888961792, "global_step": 141118, "epoch": 3359} {"train_loss": -6.761600017547607, "global_step": 141119, "epoch": 3359, "val_loss": 67439.484375} {"train_loss": -6.728003978729248, "global_step": 141120, "epoch": 3360} {"train_loss": -6.777944564819336, "global_step": 141121, "epoch": 3360} {"train_loss": -6.78385591506958, "global_step": 141122, "epoch": 3360} {"train_loss": -6.791788101196289, "global_step": 141123, "epoch": 3360} {"train_loss": -6.854510307312012, "global_step": 141124, "epoch": 3360} {"train_loss": -6.761673927307129, "global_step": 141125, "epoch": 3360} {"train_loss": -6.763300895690918, "global_step": 141126, "epoch": 3360} {"train_loss": -7.0030903816223145, "global_step": 141127, "epoch": 3360} {"train_loss": -6.797672271728516, "global_step": 141128, "epoch": 3360} {"train_loss": -6.785600662231445, "global_step": 141129, "epoch": 3360} {"train_loss": -6.718092918395996, "global_step": 141130, "epoch": 3360} {"train_loss": -6.778156757354736, "global_step": 141131, "epoch": 3360} {"train_loss": -6.827836513519287, "global_step": 141132, "epoch": 3360} {"train_loss": -6.791449546813965, "global_step": 141133, "epoch": 3360} {"train_loss": -6.703681468963623, "global_step": 141134, "epoch": 3360} {"train_loss": -6.782790184020996, "global_step": 141135, "epoch": 3360} {"train_loss": -6.812747001647949, "global_step": 141136, "epoch": 3360} {"train_loss": -6.750092506408691, "global_step": 141137, "epoch": 3360} {"train_loss": -6.730190753936768, "global_step": 141138, "epoch": 3360} {"train_loss": -6.871460914611816, "global_step": 141139, "epoch": 3360} {"train_loss": -6.684866428375244, "global_step": 141140, "epoch": 3360} {"train_loss": -6.6761674880981445, "global_step": 141141, "epoch": 3360} {"train_loss": -6.7144775390625, "global_step": 141142, "epoch": 3360} {"train_loss": -6.721748352050781, "global_step": 141143, "epoch": 3360} {"train_loss": -6.809678554534912, "global_step": 141144, "epoch": 3360} {"train_loss": -6.824768543243408, "global_step": 141145, "epoch": 3360} {"train_loss": -6.757082939147949, "global_step": 141146, "epoch": 3360} {"train_loss": -6.745845794677734, "global_step": 141147, "epoch": 3360} {"train_loss": -6.771196365356445, "global_step": 141148, "epoch": 3360} {"train_loss": -6.714198112487793, "global_step": 141149, "epoch": 3360} {"train_loss": -6.681502342224121, "global_step": 141150, "epoch": 3360} {"train_loss": -6.708883285522461, "global_step": 141151, "epoch": 3360} {"train_loss": -6.751468658447266, "global_step": 141152, "epoch": 3360} {"train_loss": -6.744791030883789, "global_step": 141153, "epoch": 3360} {"train_loss": -6.794942855834961, "global_step": 141154, "epoch": 3360} {"train_loss": -6.816376686096191, "global_step": 141155, "epoch": 3360} {"train_loss": -6.589669704437256, "global_step": 141156, "epoch": 3360} {"train_loss": -6.658112049102783, "global_step": 141157, "epoch": 3360} {"train_loss": -6.6486968994140625, "global_step": 141158, "epoch": 3360} {"train_loss": -6.759554862976074, "global_step": 141159, "epoch": 3360} {"train_loss": -6.674908638000488, "global_step": 141160, "epoch": 3360} {"train_loss": -6.752776622772217, "global_step": 141161, "epoch": 3360, "val_loss": 67643.0546875} {"train_loss": -6.751181602478027, "global_step": 141162, "epoch": 3361} {"train_loss": -6.717718601226807, "global_step": 141163, "epoch": 3361} {"train_loss": -6.618408203125, "global_step": 141164, "epoch": 3361} {"train_loss": -6.7503342628479, "global_step": 141165, "epoch": 3361} {"train_loss": -6.695284843444824, "global_step": 141166, "epoch": 3361} {"train_loss": -6.6634745597839355, "global_step": 141167, "epoch": 3361} {"train_loss": -6.7258219718933105, "global_step": 141168, "epoch": 3361} {"train_loss": -6.69003963470459, "global_step": 141169, "epoch": 3361} {"train_loss": -6.6628546714782715, "global_step": 141170, "epoch": 3361} {"train_loss": -6.667708396911621, "global_step": 141171, "epoch": 3361} {"train_loss": -6.746891498565674, "global_step": 141172, "epoch": 3361} {"train_loss": -6.905645370483398, "global_step": 141173, "epoch": 3361} {"train_loss": -6.735847473144531, "global_step": 141174, "epoch": 3361} {"train_loss": -6.727227687835693, "global_step": 141175, "epoch": 3361} {"train_loss": -6.804509162902832, "global_step": 141176, "epoch": 3361} {"train_loss": -6.882260799407959, "global_step": 141177, "epoch": 3361} {"train_loss": -6.740434169769287, "global_step": 141178, "epoch": 3361} {"train_loss": -6.815421104431152, "global_step": 141179, "epoch": 3361} {"train_loss": -6.713274955749512, "global_step": 141180, "epoch": 3361} {"train_loss": -6.794942378997803, "global_step": 141181, "epoch": 3361} {"train_loss": -6.690831184387207, "global_step": 141182, "epoch": 3361} {"train_loss": -6.773285388946533, "global_step": 141183, "epoch": 3361} {"train_loss": -6.836088180541992, "global_step": 141184, "epoch": 3361} {"train_loss": -6.882841110229492, "global_step": 141185, "epoch": 3361} {"train_loss": -6.748737335205078, "global_step": 141186, "epoch": 3361} {"train_loss": -6.7621355056762695, "global_step": 141187, "epoch": 3361} {"train_loss": -6.847301959991455, "global_step": 141188, "epoch": 3361} {"train_loss": -6.754420757293701, "global_step": 141189, "epoch": 3361} {"train_loss": -6.829944610595703, "global_step": 141190, "epoch": 3361} {"train_loss": -6.824893951416016, "global_step": 141191, "epoch": 3361} {"train_loss": -6.613592624664307, "global_step": 141192, "epoch": 3361} {"train_loss": -6.731689453125, "global_step": 141193, "epoch": 3361} {"train_loss": -6.836122035980225, "global_step": 141194, "epoch": 3361} {"train_loss": -6.708861351013184, "global_step": 141195, "epoch": 3361} {"train_loss": -6.799954414367676, "global_step": 141196, "epoch": 3361} {"train_loss": -6.767195701599121, "global_step": 141197, "epoch": 3361} {"train_loss": -6.7558088302612305, "global_step": 141198, "epoch": 3361} {"train_loss": -6.763515472412109, "global_step": 141199, "epoch": 3361} {"train_loss": -6.753487586975098, "global_step": 141200, "epoch": 3361} {"train_loss": -6.8527021408081055, "global_step": 141201, "epoch": 3361} {"train_loss": -6.80617618560791, "global_step": 141202, "epoch": 3361} {"train_loss": -6.759228195462908, "global_step": 141203, "epoch": 3361, "val_loss": 67384.78125} {"train_loss": -6.663580894470215, "global_step": 141204, "epoch": 3362} {"train_loss": -6.7202534675598145, "global_step": 141205, "epoch": 3362} {"train_loss": -6.741973876953125, "global_step": 141206, "epoch": 3362} {"train_loss": -6.7888875007629395, "global_step": 141207, "epoch": 3362} {"train_loss": -6.741654396057129, "global_step": 141208, "epoch": 3362} {"train_loss": -6.719510555267334, "global_step": 141209, "epoch": 3362} {"train_loss": -6.771414756774902, "global_step": 141210, "epoch": 3362} {"train_loss": -6.685736656188965, "global_step": 141211, "epoch": 3362} {"train_loss": -6.816493511199951, "global_step": 141212, "epoch": 3362} {"train_loss": -6.729821681976318, "global_step": 141213, "epoch": 3362} {"train_loss": -6.744775772094727, "global_step": 141214, "epoch": 3362} {"train_loss": -6.827689170837402, "global_step": 141215, "epoch": 3362} {"train_loss": -6.80179500579834, "global_step": 141216, "epoch": 3362} {"train_loss": -6.877126216888428, "global_step": 141217, "epoch": 3362} {"train_loss": -6.738070487976074, "global_step": 141218, "epoch": 3362} {"train_loss": -6.8652567863464355, "global_step": 141219, "epoch": 3362} {"train_loss": -6.8380889892578125, "global_step": 141220, "epoch": 3362} {"train_loss": -6.737720966339111, "global_step": 141221, "epoch": 3362} {"train_loss": -6.723941326141357, "global_step": 141222, "epoch": 3362} {"train_loss": -6.7913665771484375, "global_step": 141223, "epoch": 3362} {"train_loss": -6.731420040130615, "global_step": 141224, "epoch": 3362} {"train_loss": -6.879456996917725, "global_step": 141225, "epoch": 3362} {"train_loss": -6.72315788269043, "global_step": 141226, "epoch": 3362} {"train_loss": -6.798274040222168, "global_step": 141227, "epoch": 3362} {"train_loss": -6.798218727111816, "global_step": 141228, "epoch": 3362} {"train_loss": -6.80001974105835, "global_step": 141229, "epoch": 3362} {"train_loss": -6.8542375564575195, "global_step": 141230, "epoch": 3362} {"train_loss": -6.840710163116455, "global_step": 141231, "epoch": 3362} {"train_loss": -6.833254337310791, "global_step": 141232, "epoch": 3362} {"train_loss": -6.96681022644043, "global_step": 141233, "epoch": 3362} {"train_loss": -6.762733459472656, "global_step": 141234, "epoch": 3362} {"train_loss": -6.741988658905029, "global_step": 141235, "epoch": 3362} {"train_loss": -6.86591100692749, "global_step": 141236, "epoch": 3362} {"train_loss": -6.812024116516113, "global_step": 141237, "epoch": 3362} {"train_loss": -6.836062431335449, "global_step": 141238, "epoch": 3362} {"train_loss": -6.848969459533691, "global_step": 141239, "epoch": 3362} {"train_loss": -6.790172576904297, "global_step": 141240, "epoch": 3362} {"train_loss": -6.8192033767700195, "global_step": 141241, "epoch": 3362} {"train_loss": -6.721158981323242, "global_step": 141242, "epoch": 3362} {"train_loss": -6.70515775680542, "global_step": 141243, "epoch": 3362} {"train_loss": -6.736103057861328, "global_step": 141244, "epoch": 3362} {"train_loss": -6.782654137838454, "global_step": 141245, "epoch": 3362, "val_loss": 67555.015625} {"train_loss": -6.809329986572266, "global_step": 141246, "epoch": 3363} {"train_loss": -6.748093128204346, "global_step": 141247, "epoch": 3363} {"train_loss": -6.776525497436523, "global_step": 141248, "epoch": 3363} {"train_loss": -6.8375139236450195, "global_step": 141249, "epoch": 3363} {"train_loss": -6.6996378898620605, "global_step": 141250, "epoch": 3363} {"train_loss": -6.836177825927734, "global_step": 141251, "epoch": 3363} {"train_loss": -6.769296646118164, "global_step": 141252, "epoch": 3363} {"train_loss": -6.663622856140137, "global_step": 141253, "epoch": 3363} {"train_loss": -6.758732795715332, "global_step": 141254, "epoch": 3363} {"train_loss": -6.7819013595581055, "global_step": 141255, "epoch": 3363} {"train_loss": -6.706221103668213, "global_step": 141256, "epoch": 3363} {"train_loss": -6.802602767944336, "global_step": 141257, "epoch": 3363} {"train_loss": -6.75456428527832, "global_step": 141258, "epoch": 3363} {"train_loss": -6.783677577972412, "global_step": 141259, "epoch": 3363} {"train_loss": -6.867755889892578, "global_step": 141260, "epoch": 3363} {"train_loss": -6.802929878234863, "global_step": 141261, "epoch": 3363} {"train_loss": -6.8618268966674805, "global_step": 141262, "epoch": 3363} {"train_loss": -6.83003568649292, "global_step": 141263, "epoch": 3363} {"train_loss": -6.869330406188965, "global_step": 141264, "epoch": 3363} {"train_loss": -6.879514217376709, "global_step": 141265, "epoch": 3363} {"train_loss": -6.813981056213379, "global_step": 141266, "epoch": 3363} {"train_loss": -6.8422393798828125, "global_step": 141267, "epoch": 3363} {"train_loss": -6.931315898895264, "global_step": 141268, "epoch": 3363} {"train_loss": -6.848213195800781, "global_step": 141269, "epoch": 3363} {"train_loss": -6.977025032043457, "global_step": 141270, "epoch": 3363} {"train_loss": -6.887373924255371, "global_step": 141271, "epoch": 3363} {"train_loss": -6.8244524002075195, "global_step": 141272, "epoch": 3363} {"train_loss": -6.812557220458984, "global_step": 141273, "epoch": 3363} {"train_loss": -6.713886260986328, "global_step": 141274, "epoch": 3363} {"train_loss": -6.744623184204102, "global_step": 141275, "epoch": 3363} {"train_loss": -6.822332859039307, "global_step": 141276, "epoch": 3363} {"train_loss": -6.783622741699219, "global_step": 141277, "epoch": 3363} {"train_loss": -6.736557483673096, "global_step": 141278, "epoch": 3363} {"train_loss": -6.723272323608398, "global_step": 141279, "epoch": 3363} {"train_loss": -6.827035427093506, "global_step": 141280, "epoch": 3363} {"train_loss": -6.729780197143555, "global_step": 141281, "epoch": 3363} {"train_loss": -6.779367923736572, "global_step": 141282, "epoch": 3363} {"train_loss": -6.810851573944092, "global_step": 141283, "epoch": 3363} {"train_loss": -6.6908111572265625, "global_step": 141284, "epoch": 3363} {"train_loss": -6.804006576538086, "global_step": 141285, "epoch": 3363} {"train_loss": -6.765297889709473, "global_step": 141286, "epoch": 3363} {"train_loss": -6.7919175284249445, "global_step": 141287, "epoch": 3363, "val_loss": 67322.609375} {"train_loss": -6.834901809692383, "global_step": 141288, "epoch": 3364} {"train_loss": -6.645864486694336, "global_step": 141289, "epoch": 3364} {"train_loss": -6.501728534698486, "global_step": 141290, "epoch": 3364} {"train_loss": -6.748276710510254, "global_step": 141291, "epoch": 3364} {"train_loss": -6.6952128410339355, "global_step": 141292, "epoch": 3364} {"train_loss": -6.669289588928223, "global_step": 141293, "epoch": 3364} {"train_loss": -6.7537736892700195, "global_step": 141294, "epoch": 3364} {"train_loss": -6.669826507568359, "global_step": 141295, "epoch": 3364} {"train_loss": -6.663022041320801, "global_step": 141296, "epoch": 3364} {"train_loss": -6.741964340209961, "global_step": 141297, "epoch": 3364} {"train_loss": -6.677075386047363, "global_step": 141298, "epoch": 3364} {"train_loss": -6.788058280944824, "global_step": 141299, "epoch": 3364} {"train_loss": -6.692805290222168, "global_step": 141300, "epoch": 3364} {"train_loss": -6.731799125671387, "global_step": 141301, "epoch": 3364} {"train_loss": -6.681602478027344, "global_step": 141302, "epoch": 3364} {"train_loss": -6.729796409606934, "global_step": 141303, "epoch": 3364} {"train_loss": -6.7980804443359375, "global_step": 141304, "epoch": 3364} {"train_loss": -6.7495832443237305, "global_step": 141305, "epoch": 3364} {"train_loss": -6.867650985717773, "global_step": 141306, "epoch": 3364} {"train_loss": -6.675464630126953, "global_step": 141307, "epoch": 3364} {"train_loss": -6.707467079162598, "global_step": 141308, "epoch": 3364} {"train_loss": -6.790610313415527, "global_step": 141309, "epoch": 3364} {"train_loss": -6.680150985717773, "global_step": 141310, "epoch": 3364} {"train_loss": -6.776110649108887, "global_step": 141311, "epoch": 3364} {"train_loss": -6.708563327789307, "global_step": 141312, "epoch": 3364} {"train_loss": -6.7628984451293945, "global_step": 141313, "epoch": 3364} {"train_loss": -6.788487911224365, "global_step": 141314, "epoch": 3364} {"train_loss": -6.708189487457275, "global_step": 141315, "epoch": 3364} {"train_loss": -6.772885322570801, "global_step": 141316, "epoch": 3364} {"train_loss": -6.7052202224731445, "global_step": 141317, "epoch": 3364} {"train_loss": -6.8261213302612305, "global_step": 141318, "epoch": 3364} {"train_loss": -6.81558895111084, "global_step": 141319, "epoch": 3364} {"train_loss": -6.657629013061523, "global_step": 141320, "epoch": 3364} {"train_loss": -6.768876075744629, "global_step": 141321, "epoch": 3364} {"train_loss": -6.772199630737305, "global_step": 141322, "epoch": 3364} {"train_loss": -6.763443946838379, "global_step": 141323, "epoch": 3364} {"train_loss": -6.750583648681641, "global_step": 141324, "epoch": 3364} {"train_loss": -6.754303932189941, "global_step": 141325, "epoch": 3364} {"train_loss": -6.6755781173706055, "global_step": 141326, "epoch": 3364} {"train_loss": -6.877933502197266, "global_step": 141327, "epoch": 3364} {"train_loss": -6.699922561645508, "global_step": 141328, "epoch": 3364} {"train_loss": -6.7339980488731745, "global_step": 141329, "epoch": 3364, "val_loss": 67313.6015625} {"train_loss": -6.851276874542236, "global_step": 141330, "epoch": 3365} {"train_loss": -6.688148498535156, "global_step": 141331, "epoch": 3365} {"train_loss": -6.862126350402832, "global_step": 141332, "epoch": 3365} {"train_loss": -6.760081768035889, "global_step": 141333, "epoch": 3365} {"train_loss": -6.839902877807617, "global_step": 141334, "epoch": 3365} {"train_loss": -6.697369575500488, "global_step": 141335, "epoch": 3365} {"train_loss": -6.75225305557251, "global_step": 141336, "epoch": 3365} {"train_loss": -6.770411491394043, "global_step": 141337, "epoch": 3365} {"train_loss": -6.687237739562988, "global_step": 141338, "epoch": 3365} {"train_loss": -6.755212783813477, "global_step": 141339, "epoch": 3365} {"train_loss": -6.835495948791504, "global_step": 141340, "epoch": 3365} {"train_loss": -6.863730430603027, "global_step": 141341, "epoch": 3365} {"train_loss": -6.860208511352539, "global_step": 141342, "epoch": 3365} {"train_loss": -6.79036808013916, "global_step": 141343, "epoch": 3365} {"train_loss": -6.775327205657959, "global_step": 141344, "epoch": 3365} {"train_loss": -6.701810836791992, "global_step": 141345, "epoch": 3365} {"train_loss": -6.855663299560547, "global_step": 141346, "epoch": 3365} {"train_loss": -6.758092403411865, "global_step": 141347, "epoch": 3365} {"train_loss": -6.783141136169434, "global_step": 141348, "epoch": 3365} {"train_loss": -6.902584075927734, "global_step": 141349, "epoch": 3365} {"train_loss": -6.722878456115723, "global_step": 141350, "epoch": 3365} {"train_loss": -6.699995994567871, "global_step": 141351, "epoch": 3365} {"train_loss": -6.785459518432617, "global_step": 141352, "epoch": 3365} {"train_loss": -6.708512306213379, "global_step": 141353, "epoch": 3365} {"train_loss": -6.562752723693848, "global_step": 141354, "epoch": 3365} {"train_loss": -6.836727619171143, "global_step": 141355, "epoch": 3365} {"train_loss": -6.781123161315918, "global_step": 141356, "epoch": 3365} {"train_loss": -6.756531715393066, "global_step": 141357, "epoch": 3365} {"train_loss": -6.73313045501709, "global_step": 141358, "epoch": 3365} {"train_loss": -6.807977676391602, "global_step": 141359, "epoch": 3365} {"train_loss": -6.8737993240356445, "global_step": 141360, "epoch": 3365} {"train_loss": -6.707767486572266, "global_step": 141361, "epoch": 3365} {"train_loss": -6.78388786315918, "global_step": 141362, "epoch": 3365} {"train_loss": -6.835715293884277, "global_step": 141363, "epoch": 3365} {"train_loss": -6.71064567565918, "global_step": 141364, "epoch": 3365} {"train_loss": -6.764810562133789, "global_step": 141365, "epoch": 3365} {"train_loss": -6.763525009155273, "global_step": 141366, "epoch": 3365} {"train_loss": -6.696401596069336, "global_step": 141367, "epoch": 3365} {"train_loss": -6.675719261169434, "global_step": 141368, "epoch": 3365} {"train_loss": -6.648961544036865, "global_step": 141369, "epoch": 3365} {"train_loss": -6.824953079223633, "global_step": 141370, "epoch": 3365} {"train_loss": -6.764982075918288, "global_step": 141371, "epoch": 3365, "val_loss": 67446.4375} {"train_loss": -6.772910118103027, "global_step": 141372, "epoch": 3366} {"train_loss": -6.713657379150391, "global_step": 141373, "epoch": 3366} {"train_loss": -6.780677795410156, "global_step": 141374, "epoch": 3366} {"train_loss": -6.819418430328369, "global_step": 141375, "epoch": 3366} {"train_loss": -6.596013069152832, "global_step": 141376, "epoch": 3366} {"train_loss": -6.788816928863525, "global_step": 141377, "epoch": 3366} {"train_loss": -6.737717628479004, "global_step": 141378, "epoch": 3366} {"train_loss": -6.686086654663086, "global_step": 141379, "epoch": 3366} {"train_loss": -6.730348587036133, "global_step": 141380, "epoch": 3366} {"train_loss": -6.74511194229126, "global_step": 141381, "epoch": 3366} {"train_loss": -6.631841659545898, "global_step": 141382, "epoch": 3366} {"train_loss": -6.742514133453369, "global_step": 141383, "epoch": 3366} {"train_loss": -6.690706253051758, "global_step": 141384, "epoch": 3366} {"train_loss": -6.793437957763672, "global_step": 141385, "epoch": 3366} {"train_loss": -6.7534074783325195, "global_step": 141386, "epoch": 3366} {"train_loss": -6.730762481689453, "global_step": 141387, "epoch": 3366} {"train_loss": -6.765619277954102, "global_step": 141388, "epoch": 3366} {"train_loss": -6.7377166748046875, "global_step": 141389, "epoch": 3366} {"train_loss": -6.807872772216797, "global_step": 141390, "epoch": 3366} {"train_loss": -6.802908420562744, "global_step": 141391, "epoch": 3366} {"train_loss": -6.787090301513672, "global_step": 141392, "epoch": 3366} {"train_loss": -6.760856628417969, "global_step": 141393, "epoch": 3366} {"train_loss": -6.754558563232422, "global_step": 141394, "epoch": 3366} {"train_loss": -6.661730766296387, "global_step": 141395, "epoch": 3366} {"train_loss": -6.82473611831665, "global_step": 141396, "epoch": 3366} {"train_loss": -6.6587677001953125, "global_step": 141397, "epoch": 3366} {"train_loss": -6.706827163696289, "global_step": 141398, "epoch": 3366} {"train_loss": -6.710803031921387, "global_step": 141399, "epoch": 3366} {"train_loss": -6.704961776733398, "global_step": 141400, "epoch": 3366} {"train_loss": -6.788506984710693, "global_step": 141401, "epoch": 3366} {"train_loss": -6.792204856872559, "global_step": 141402, "epoch": 3366} {"train_loss": -6.727827072143555, "global_step": 141403, "epoch": 3366} {"train_loss": -6.683006286621094, "global_step": 141404, "epoch": 3366} {"train_loss": -6.811442852020264, "global_step": 141405, "epoch": 3366} {"train_loss": -6.669872760772705, "global_step": 141406, "epoch": 3366} {"train_loss": -6.6917266845703125, "global_step": 141407, "epoch": 3366} {"train_loss": -6.767166614532471, "global_step": 141408, "epoch": 3366} {"train_loss": -6.81379508972168, "global_step": 141409, "epoch": 3366} {"train_loss": -6.7815985679626465, "global_step": 141410, "epoch": 3366} {"train_loss": -6.759101867675781, "global_step": 141411, "epoch": 3366} {"train_loss": -6.724829196929932, "global_step": 141412, "epoch": 3366} {"train_loss": -6.744164341971988, "global_step": 141413, "epoch": 3366, "val_loss": 67349.7265625} {"train_loss": -6.73042106628418, "global_step": 141414, "epoch": 3367} {"train_loss": -6.710826873779297, "global_step": 141415, "epoch": 3367} {"train_loss": -6.795468330383301, "global_step": 141416, "epoch": 3367} {"train_loss": -6.758804798126221, "global_step": 141417, "epoch": 3367} {"train_loss": -6.831728935241699, "global_step": 141418, "epoch": 3367} {"train_loss": -6.789951324462891, "global_step": 141419, "epoch": 3367} {"train_loss": -6.842665672302246, "global_step": 141420, "epoch": 3367} {"train_loss": -6.869537353515625, "global_step": 141421, "epoch": 3367} {"train_loss": -6.890965938568115, "global_step": 141422, "epoch": 3367} {"train_loss": -6.817483425140381, "global_step": 141423, "epoch": 3367} {"train_loss": -6.824905872344971, "global_step": 141424, "epoch": 3367} {"train_loss": -6.762639045715332, "global_step": 141425, "epoch": 3367} {"train_loss": -6.871664047241211, "global_step": 141426, "epoch": 3367} {"train_loss": -6.8535003662109375, "global_step": 141427, "epoch": 3367} {"train_loss": -6.754672050476074, "global_step": 141428, "epoch": 3367} {"train_loss": -6.7614970207214355, "global_step": 141429, "epoch": 3367} {"train_loss": -6.872987747192383, "global_step": 141430, "epoch": 3367} {"train_loss": -6.807493686676025, "global_step": 141431, "epoch": 3367} {"train_loss": -6.881820201873779, "global_step": 141432, "epoch": 3367} {"train_loss": -6.838168621063232, "global_step": 141433, "epoch": 3367} {"train_loss": -6.751970291137695, "global_step": 141434, "epoch": 3367} {"train_loss": -6.658190727233887, "global_step": 141435, "epoch": 3367} {"train_loss": -6.831495761871338, "global_step": 141436, "epoch": 3367} {"train_loss": -6.874790191650391, "global_step": 141437, "epoch": 3367} {"train_loss": -6.678361892700195, "global_step": 141438, "epoch": 3367} {"train_loss": -6.8929362297058105, "global_step": 141439, "epoch": 3367} {"train_loss": -6.920661449432373, "global_step": 141440, "epoch": 3367} {"train_loss": -6.920771598815918, "global_step": 141441, "epoch": 3367} {"train_loss": -6.856624603271484, "global_step": 141442, "epoch": 3367} {"train_loss": -6.838839530944824, "global_step": 141443, "epoch": 3367} {"train_loss": -6.828258514404297, "global_step": 141444, "epoch": 3367} {"train_loss": -6.650955677032471, "global_step": 141445, "epoch": 3367} {"train_loss": -6.914042949676514, "global_step": 141446, "epoch": 3367} {"train_loss": -6.837970733642578, "global_step": 141447, "epoch": 3367} {"train_loss": -6.814948081970215, "global_step": 141448, "epoch": 3367} {"train_loss": -6.753549575805664, "global_step": 141449, "epoch": 3367} {"train_loss": -6.834059715270996, "global_step": 141450, "epoch": 3367} {"train_loss": -6.714504718780518, "global_step": 141451, "epoch": 3367} {"train_loss": -6.73976993560791, "global_step": 141452, "epoch": 3367} {"train_loss": -6.804836750030518, "global_step": 141453, "epoch": 3367} {"train_loss": -6.613651275634766, "global_step": 141454, "epoch": 3367} {"train_loss": -6.8016142163957864, "global_step": 141455, "epoch": 3367, "val_loss": 67425.1796875} {"train_loss": -6.702939987182617, "global_step": 141456, "epoch": 3368} {"train_loss": -6.668279647827148, "global_step": 141457, "epoch": 3368} {"train_loss": -6.535458087921143, "global_step": 141458, "epoch": 3368} {"train_loss": -6.6632890701293945, "global_step": 141459, "epoch": 3368} {"train_loss": -6.753299713134766, "global_step": 141460, "epoch": 3368} {"train_loss": -6.464305400848389, "global_step": 141461, "epoch": 3368} {"train_loss": -6.803783416748047, "global_step": 141462, "epoch": 3368} {"train_loss": -6.583727836608887, "global_step": 141463, "epoch": 3368} {"train_loss": -6.555582046508789, "global_step": 141464, "epoch": 3368} {"train_loss": -6.746637344360352, "global_step": 141465, "epoch": 3368} {"train_loss": -6.5516486167907715, "global_step": 141466, "epoch": 3368} {"train_loss": -6.620199203491211, "global_step": 141467, "epoch": 3368} {"train_loss": -6.610164642333984, "global_step": 141468, "epoch": 3368} {"train_loss": -6.690618991851807, "global_step": 141469, "epoch": 3368} {"train_loss": -6.568218231201172, "global_step": 141470, "epoch": 3368} {"train_loss": -6.621862411499023, "global_step": 141471, "epoch": 3368} {"train_loss": -6.660759925842285, "global_step": 141472, "epoch": 3368} {"train_loss": -6.587375164031982, "global_step": 141473, "epoch": 3368} {"train_loss": -6.790980815887451, "global_step": 141474, "epoch": 3368} {"train_loss": -6.690362453460693, "global_step": 141475, "epoch": 3368} {"train_loss": -6.736739158630371, "global_step": 141476, "epoch": 3368} {"train_loss": -6.688569068908691, "global_step": 141477, "epoch": 3368} {"train_loss": -6.752191066741943, "global_step": 141478, "epoch": 3368} {"train_loss": -6.808209419250488, "global_step": 141479, "epoch": 3368} {"train_loss": -6.8046064376831055, "global_step": 141480, "epoch": 3368} {"train_loss": -6.785098075866699, "global_step": 141481, "epoch": 3368} {"train_loss": -6.772030830383301, "global_step": 141482, "epoch": 3368} {"train_loss": -6.836395740509033, "global_step": 141483, "epoch": 3368} {"train_loss": -6.808981895446777, "global_step": 141484, "epoch": 3368} {"train_loss": -6.849273204803467, "global_step": 141485, "epoch": 3368} {"train_loss": -6.731694221496582, "global_step": 141486, "epoch": 3368} {"train_loss": -6.800004005432129, "global_step": 141487, "epoch": 3368} {"train_loss": -6.777353763580322, "global_step": 141488, "epoch": 3368} {"train_loss": -6.76237154006958, "global_step": 141489, "epoch": 3368} {"train_loss": -6.811399459838867, "global_step": 141490, "epoch": 3368} {"train_loss": -6.701290607452393, "global_step": 141491, "epoch": 3368} {"train_loss": -6.761104583740234, "global_step": 141492, "epoch": 3368} {"train_loss": -6.707183837890625, "global_step": 141493, "epoch": 3368} {"train_loss": -6.746499538421631, "global_step": 141494, "epoch": 3368} {"train_loss": -6.730313301086426, "global_step": 141495, "epoch": 3368} {"train_loss": -6.733919143676758, "global_step": 141496, "epoch": 3368} {"train_loss": -6.709185112090338, "global_step": 141497, "epoch": 3368, "val_loss": 67535.6953125} {"train_loss": -6.81157112121582, "global_step": 141498, "epoch": 3369} {"train_loss": -6.808928966522217, "global_step": 141499, "epoch": 3369} {"train_loss": -6.7017107009887695, "global_step": 141500, "epoch": 3369} {"train_loss": -6.827163219451904, "global_step": 141501, "epoch": 3369} {"train_loss": -6.829817771911621, "global_step": 141502, "epoch": 3369} {"train_loss": -6.765207290649414, "global_step": 141503, "epoch": 3369} {"train_loss": -6.809412479400635, "global_step": 141504, "epoch": 3369} {"train_loss": -6.825692176818848, "global_step": 141505, "epoch": 3369} {"train_loss": -6.774381160736084, "global_step": 141506, "epoch": 3369} {"train_loss": -6.797668933868408, "global_step": 141507, "epoch": 3369} {"train_loss": -6.810483932495117, "global_step": 141508, "epoch": 3369} {"train_loss": -6.842571258544922, "global_step": 141509, "epoch": 3369} {"train_loss": -6.734226226806641, "global_step": 141510, "epoch": 3369} {"train_loss": -6.8039045333862305, "global_step": 141511, "epoch": 3369} {"train_loss": -6.657929420471191, "global_step": 141512, "epoch": 3369} {"train_loss": -6.758026123046875, "global_step": 141513, "epoch": 3369} {"train_loss": -6.787723541259766, "global_step": 141514, "epoch": 3369} {"train_loss": -6.740615367889404, "global_step": 141515, "epoch": 3369} {"train_loss": -6.805228233337402, "global_step": 141516, "epoch": 3369} {"train_loss": -6.820551872253418, "global_step": 141517, "epoch": 3369} {"train_loss": -6.671474456787109, "global_step": 141518, "epoch": 3369} {"train_loss": -6.882920742034912, "global_step": 141519, "epoch": 3369} {"train_loss": -6.575690269470215, "global_step": 141520, "epoch": 3369} {"train_loss": -6.851966381072998, "global_step": 141521, "epoch": 3369} {"train_loss": -6.666223526000977, "global_step": 141522, "epoch": 3369} {"train_loss": -6.726619720458984, "global_step": 141523, "epoch": 3369} {"train_loss": -6.75785493850708, "global_step": 141524, "epoch": 3369} {"train_loss": -6.84323263168335, "global_step": 141525, "epoch": 3369} {"train_loss": -6.7725629806518555, "global_step": 141526, "epoch": 3369} {"train_loss": -6.811526298522949, "global_step": 141527, "epoch": 3369} {"train_loss": -6.820446491241455, "global_step": 141528, "epoch": 3369} {"train_loss": -6.873296737670898, "global_step": 141529, "epoch": 3369} {"train_loss": -6.799020290374756, "global_step": 141530, "epoch": 3369} {"train_loss": -6.780891418457031, "global_step": 141531, "epoch": 3369} {"train_loss": -6.713087558746338, "global_step": 141532, "epoch": 3369} {"train_loss": -6.78520393371582, "global_step": 141533, "epoch": 3369} {"train_loss": -6.855164051055908, "global_step": 141534, "epoch": 3369} {"train_loss": -6.801067352294922, "global_step": 141535, "epoch": 3369} {"train_loss": -6.745232582092285, "global_step": 141536, "epoch": 3369} {"train_loss": -6.8947014808654785, "global_step": 141537, "epoch": 3369} {"train_loss": -6.870219707489014, "global_step": 141538, "epoch": 3369} {"train_loss": -6.783967301959083, "global_step": 141539, "epoch": 3369, "val_loss": 67423.0546875} {"train_loss": -6.82215690612793, "global_step": 141540, "epoch": 3370} {"train_loss": -6.763469696044922, "global_step": 141541, "epoch": 3370} {"train_loss": -6.7154974937438965, "global_step": 141542, "epoch": 3370} {"train_loss": -6.703022003173828, "global_step": 141543, "epoch": 3370} {"train_loss": -6.687620162963867, "global_step": 141544, "epoch": 3370} {"train_loss": -6.7965850830078125, "global_step": 141545, "epoch": 3370} {"train_loss": -6.859260559082031, "global_step": 141546, "epoch": 3370} {"train_loss": -6.711912155151367, "global_step": 141547, "epoch": 3370} {"train_loss": -6.863635540008545, "global_step": 141548, "epoch": 3370} {"train_loss": -6.631629943847656, "global_step": 141549, "epoch": 3370} {"train_loss": -6.758981704711914, "global_step": 141550, "epoch": 3370} {"train_loss": -6.787883281707764, "global_step": 141551, "epoch": 3370} {"train_loss": -6.779669761657715, "global_step": 141552, "epoch": 3370} {"train_loss": -6.756202697753906, "global_step": 141553, "epoch": 3370} {"train_loss": -6.664619445800781, "global_step": 141554, "epoch": 3370} {"train_loss": -6.8183112144470215, "global_step": 141555, "epoch": 3370} {"train_loss": -6.7419281005859375, "global_step": 141556, "epoch": 3370} {"train_loss": -6.727878570556641, "global_step": 141557, "epoch": 3370} {"train_loss": -6.838701248168945, "global_step": 141558, "epoch": 3370} {"train_loss": -6.825878620147705, "global_step": 141559, "epoch": 3370} {"train_loss": -6.72022819519043, "global_step": 141560, "epoch": 3370} {"train_loss": -6.747506141662598, "global_step": 141561, "epoch": 3370} {"train_loss": -6.815653324127197, "global_step": 141562, "epoch": 3370} {"train_loss": -6.715636253356934, "global_step": 141563, "epoch": 3370} {"train_loss": -6.800437927246094, "global_step": 141564, "epoch": 3370} {"train_loss": -6.747841835021973, "global_step": 141565, "epoch": 3370} {"train_loss": -6.74018669128418, "global_step": 141566, "epoch": 3370} {"train_loss": -6.9387311935424805, "global_step": 141567, "epoch": 3370} {"train_loss": -6.716115474700928, "global_step": 141568, "epoch": 3370} {"train_loss": -6.755099296569824, "global_step": 141569, "epoch": 3370} {"train_loss": -6.806427955627441, "global_step": 141570, "epoch": 3370} {"train_loss": -6.604312896728516, "global_step": 141571, "epoch": 3370} {"train_loss": -6.698159217834473, "global_step": 141572, "epoch": 3370} {"train_loss": -6.902551651000977, "global_step": 141573, "epoch": 3370} {"train_loss": -6.6776275634765625, "global_step": 141574, "epoch": 3370} {"train_loss": -6.750285625457764, "global_step": 141575, "epoch": 3370} {"train_loss": -6.80909538269043, "global_step": 141576, "epoch": 3370} {"train_loss": -6.677310943603516, "global_step": 141577, "epoch": 3370} {"train_loss": -6.744580268859863, "global_step": 141578, "epoch": 3370} {"train_loss": -6.793234825134277, "global_step": 141579, "epoch": 3370} {"train_loss": -6.76611328125, "global_step": 141580, "epoch": 3370} {"train_loss": -6.761423485619681, "global_step": 141581, "epoch": 3370, "val_loss": 67471.09375} {"train_loss": -6.799523830413818, "global_step": 141582, "epoch": 3371} {"train_loss": -6.733753204345703, "global_step": 141583, "epoch": 3371} {"train_loss": -6.85765266418457, "global_step": 141584, "epoch": 3371} {"train_loss": -6.6089911460876465, "global_step": 141585, "epoch": 3371} {"train_loss": -6.78959846496582, "global_step": 141586, "epoch": 3371} {"train_loss": -6.802468299865723, "global_step": 141587, "epoch": 3371} {"train_loss": -6.744537830352783, "global_step": 141588, "epoch": 3371} {"train_loss": -6.7171430587768555, "global_step": 141589, "epoch": 3371} {"train_loss": -6.761802673339844, "global_step": 141590, "epoch": 3371} {"train_loss": -6.525906562805176, "global_step": 141591, "epoch": 3371} {"train_loss": -6.678908348083496, "global_step": 141592, "epoch": 3371} {"train_loss": -6.7127251625061035, "global_step": 141593, "epoch": 3371} {"train_loss": -6.59650993347168, "global_step": 141594, "epoch": 3371} {"train_loss": -6.786645889282227, "global_step": 141595, "epoch": 3371} {"train_loss": -6.69393253326416, "global_step": 141596, "epoch": 3371} {"train_loss": -6.690943241119385, "global_step": 141597, "epoch": 3371} {"train_loss": -6.670400619506836, "global_step": 141598, "epoch": 3371} {"train_loss": -6.783960819244385, "global_step": 141599, "epoch": 3371} {"train_loss": -6.716403961181641, "global_step": 141600, "epoch": 3371} {"train_loss": -6.683094024658203, "global_step": 141601, "epoch": 3371} {"train_loss": -6.849620819091797, "global_step": 141602, "epoch": 3371} {"train_loss": -6.7056498527526855, "global_step": 141603, "epoch": 3371} {"train_loss": -6.788609504699707, "global_step": 141604, "epoch": 3371} {"train_loss": -6.8680596351623535, "global_step": 141605, "epoch": 3371} {"train_loss": -6.89853572845459, "global_step": 141606, "epoch": 3371} {"train_loss": -6.797059059143066, "global_step": 141607, "epoch": 3371} {"train_loss": -6.821548938751221, "global_step": 141608, "epoch": 3371} {"train_loss": -6.675324440002441, "global_step": 141609, "epoch": 3371} {"train_loss": -6.816248893737793, "global_step": 141610, "epoch": 3371} {"train_loss": -6.7890472412109375, "global_step": 141611, "epoch": 3371} {"train_loss": -6.827779769897461, "global_step": 141612, "epoch": 3371} {"train_loss": -6.843288421630859, "global_step": 141613, "epoch": 3371} {"train_loss": -6.856135845184326, "global_step": 141614, "epoch": 3371} {"train_loss": -6.890632152557373, "global_step": 141615, "epoch": 3371} {"train_loss": -6.865721702575684, "global_step": 141616, "epoch": 3371} {"train_loss": -6.713452339172363, "global_step": 141617, "epoch": 3371} {"train_loss": -6.8324666023254395, "global_step": 141618, "epoch": 3371} {"train_loss": -6.898085117340088, "global_step": 141619, "epoch": 3371} {"train_loss": -6.9080095291137695, "global_step": 141620, "epoch": 3371} {"train_loss": -6.676979064941406, "global_step": 141621, "epoch": 3371} {"train_loss": -6.84181022644043, "global_step": 141622, "epoch": 3371} {"train_loss": -6.771199578330631, "global_step": 141623, "epoch": 3371, "val_loss": 67504.2890625} {"train_loss": -6.794846534729004, "global_step": 141624, "epoch": 3372} {"train_loss": -6.8831610679626465, "global_step": 141625, "epoch": 3372} {"train_loss": -6.92337703704834, "global_step": 141626, "epoch": 3372} {"train_loss": -6.860240936279297, "global_step": 141627, "epoch": 3372} {"train_loss": -6.853652000427246, "global_step": 141628, "epoch": 3372} {"train_loss": -6.788796424865723, "global_step": 141629, "epoch": 3372} {"train_loss": -6.806208610534668, "global_step": 141630, "epoch": 3372} {"train_loss": -6.724156379699707, "global_step": 141631, "epoch": 3372} {"train_loss": -6.780779838562012, "global_step": 141632, "epoch": 3372} {"train_loss": -6.788151741027832, "global_step": 141633, "epoch": 3372} {"train_loss": -6.71923828125, "global_step": 141634, "epoch": 3372} {"train_loss": -6.656816482543945, "global_step": 141635, "epoch": 3372} {"train_loss": -6.778194427490234, "global_step": 141636, "epoch": 3372} {"train_loss": -6.830918312072754, "global_step": 141637, "epoch": 3372} {"train_loss": -6.764673233032227, "global_step": 141638, "epoch": 3372} {"train_loss": -6.781263828277588, "global_step": 141639, "epoch": 3372} {"train_loss": -6.662293434143066, "global_step": 141640, "epoch": 3372} {"train_loss": -6.799877166748047, "global_step": 141641, "epoch": 3372} {"train_loss": -6.894981384277344, "global_step": 141642, "epoch": 3372} {"train_loss": -6.747443675994873, "global_step": 141643, "epoch": 3372} {"train_loss": -6.852136611938477, "global_step": 141644, "epoch": 3372} {"train_loss": -6.848348617553711, "global_step": 141645, "epoch": 3372} {"train_loss": -6.803777694702148, "global_step": 141646, "epoch": 3372} {"train_loss": -6.748242378234863, "global_step": 141647, "epoch": 3372} {"train_loss": -6.807165622711182, "global_step": 141648, "epoch": 3372} {"train_loss": -6.712343215942383, "global_step": 141649, "epoch": 3372} {"train_loss": -6.717219829559326, "global_step": 141650, "epoch": 3372} {"train_loss": -6.838505744934082, "global_step": 141651, "epoch": 3372} {"train_loss": -6.782702445983887, "global_step": 141652, "epoch": 3372} {"train_loss": -6.802454948425293, "global_step": 141653, "epoch": 3372} {"train_loss": -6.853930950164795, "global_step": 141654, "epoch": 3372} {"train_loss": -6.773609161376953, "global_step": 141655, "epoch": 3372} {"train_loss": -6.748643398284912, "global_step": 141656, "epoch": 3372} {"train_loss": -6.893165588378906, "global_step": 141657, "epoch": 3372} {"train_loss": -6.763619899749756, "global_step": 141658, "epoch": 3372} {"train_loss": -6.827725410461426, "global_step": 141659, "epoch": 3372} {"train_loss": -6.904732704162598, "global_step": 141660, "epoch": 3372} {"train_loss": -6.873172760009766, "global_step": 141661, "epoch": 3372} {"train_loss": -6.753620147705078, "global_step": 141662, "epoch": 3372} {"train_loss": -6.825523376464844, "global_step": 141663, "epoch": 3372} {"train_loss": -6.856531143188477, "global_step": 141664, "epoch": 3372} {"train_loss": -6.8031565461839945, "global_step": 141665, "epoch": 3372, "val_loss": 67435.515625} {"train_loss": -6.877509117126465, "global_step": 141666, "epoch": 3373} {"train_loss": -6.768767833709717, "global_step": 141667, "epoch": 3373} {"train_loss": -6.750115394592285, "global_step": 141668, "epoch": 3373} {"train_loss": -6.867088317871094, "global_step": 141669, "epoch": 3373} {"train_loss": -6.839734077453613, "global_step": 141670, "epoch": 3373} {"train_loss": -6.839481353759766, "global_step": 141671, "epoch": 3373} {"train_loss": -6.725593090057373, "global_step": 141672, "epoch": 3373} {"train_loss": -6.816469669342041, "global_step": 141673, "epoch": 3373} {"train_loss": -6.7669548988342285, "global_step": 141674, "epoch": 3373} {"train_loss": -6.675229072570801, "global_step": 141675, "epoch": 3373} {"train_loss": -6.709935188293457, "global_step": 141676, "epoch": 3373} {"train_loss": -6.812772750854492, "global_step": 141677, "epoch": 3373} {"train_loss": -6.722639560699463, "global_step": 141678, "epoch": 3373} {"train_loss": -6.714040756225586, "global_step": 141679, "epoch": 3373} {"train_loss": -6.668442726135254, "global_step": 141680, "epoch": 3373} {"train_loss": -6.791933059692383, "global_step": 141681, "epoch": 3373} {"train_loss": -6.8061017990112305, "global_step": 141682, "epoch": 3373} {"train_loss": -6.763786315917969, "global_step": 141683, "epoch": 3373} {"train_loss": -6.646553993225098, "global_step": 141684, "epoch": 3373} {"train_loss": -6.635841369628906, "global_step": 141685, "epoch": 3373} {"train_loss": -6.759500503540039, "global_step": 141686, "epoch": 3373} {"train_loss": -6.670710563659668, "global_step": 141687, "epoch": 3373} {"train_loss": -6.586150646209717, "global_step": 141688, "epoch": 3373} {"train_loss": -6.7871174812316895, "global_step": 141689, "epoch": 3373} {"train_loss": -6.733595848083496, "global_step": 141690, "epoch": 3373} {"train_loss": -6.910189628601074, "global_step": 141691, "epoch": 3373} {"train_loss": -6.746416091918945, "global_step": 141692, "epoch": 3373} {"train_loss": -6.682373046875, "global_step": 141693, "epoch": 3373} {"train_loss": -6.74921989440918, "global_step": 141694, "epoch": 3373} {"train_loss": -6.693578243255615, "global_step": 141695, "epoch": 3373} {"train_loss": -6.75412654876709, "global_step": 141696, "epoch": 3373} {"train_loss": -6.695073127746582, "global_step": 141697, "epoch": 3373} {"train_loss": -6.625578880310059, "global_step": 141698, "epoch": 3373} {"train_loss": -6.813141822814941, "global_step": 141699, "epoch": 3373} {"train_loss": -6.524880409240723, "global_step": 141700, "epoch": 3373} {"train_loss": -6.742130279541016, "global_step": 141701, "epoch": 3373} {"train_loss": -6.63093376159668, "global_step": 141702, "epoch": 3373} {"train_loss": -6.75368070602417, "global_step": 141703, "epoch": 3373} {"train_loss": -6.780842304229736, "global_step": 141704, "epoch": 3373} {"train_loss": -6.698409080505371, "global_step": 141705, "epoch": 3373} {"train_loss": -6.767136573791504, "global_step": 141706, "epoch": 3373} {"train_loss": -6.7389465400150845, "global_step": 141707, "epoch": 3373, "val_loss": 67555.9140625} {"train_loss": -6.840993881225586, "global_step": 141708, "epoch": 3374} {"train_loss": -6.787325382232666, "global_step": 141709, "epoch": 3374} {"train_loss": -6.858373641967773, "global_step": 141710, "epoch": 3374} {"train_loss": -6.741459846496582, "global_step": 141711, "epoch": 3374} {"train_loss": -6.709470272064209, "global_step": 141712, "epoch": 3374} {"train_loss": -6.744817733764648, "global_step": 141713, "epoch": 3374} {"train_loss": -6.688385009765625, "global_step": 141714, "epoch": 3374} {"train_loss": -6.874607563018799, "global_step": 141715, "epoch": 3374} {"train_loss": -6.875296592712402, "global_step": 141716, "epoch": 3374} {"train_loss": -6.782886505126953, "global_step": 141717, "epoch": 3374} {"train_loss": -6.84211540222168, "global_step": 141718, "epoch": 3374} {"train_loss": -6.822497367858887, "global_step": 141719, "epoch": 3374} {"train_loss": -6.772148132324219, "global_step": 141720, "epoch": 3374} {"train_loss": -6.729121685028076, "global_step": 141721, "epoch": 3374} {"train_loss": -6.7139668464660645, "global_step": 141722, "epoch": 3374} {"train_loss": -6.725865364074707, "global_step": 141723, "epoch": 3374} {"train_loss": -6.742815017700195, "global_step": 141724, "epoch": 3374} {"train_loss": -6.714385509490967, "global_step": 141725, "epoch": 3374} {"train_loss": -6.787796974182129, "global_step": 141726, "epoch": 3374} {"train_loss": -6.649661540985107, "global_step": 141727, "epoch": 3374} {"train_loss": -6.745815277099609, "global_step": 141728, "epoch": 3374} {"train_loss": -6.682380676269531, "global_step": 141729, "epoch": 3374} {"train_loss": -6.827361106872559, "global_step": 141730, "epoch": 3374} {"train_loss": -6.65517520904541, "global_step": 141731, "epoch": 3374} {"train_loss": -6.880284786224365, "global_step": 141732, "epoch": 3374} {"train_loss": -6.657966613769531, "global_step": 141733, "epoch": 3374} {"train_loss": -6.759742736816406, "global_step": 141734, "epoch": 3374} {"train_loss": -6.750324249267578, "global_step": 141735, "epoch": 3374} {"train_loss": -6.655440330505371, "global_step": 141736, "epoch": 3374} {"train_loss": -6.773226737976074, "global_step": 141737, "epoch": 3374} {"train_loss": -6.641443252563477, "global_step": 141738, "epoch": 3374} {"train_loss": -6.733150482177734, "global_step": 141739, "epoch": 3374} {"train_loss": -6.79859733581543, "global_step": 141740, "epoch": 3374} {"train_loss": -6.794619560241699, "global_step": 141741, "epoch": 3374} {"train_loss": -6.633556365966797, "global_step": 141742, "epoch": 3374} {"train_loss": -6.689724922180176, "global_step": 141743, "epoch": 3374} {"train_loss": -6.787458419799805, "global_step": 141744, "epoch": 3374} {"train_loss": -6.772451877593994, "global_step": 141745, "epoch": 3374} {"train_loss": -6.692305564880371, "global_step": 141746, "epoch": 3374} {"train_loss": -6.784355640411377, "global_step": 141747, "epoch": 3374} {"train_loss": -6.764089107513428, "global_step": 141748, "epoch": 3374} {"train_loss": -6.750676121030535, "global_step": 141749, "epoch": 3374, "val_loss": 67533.7890625} {"train_loss": -6.799407482147217, "global_step": 141750, "epoch": 3375} {"train_loss": -6.633732795715332, "global_step": 141751, "epoch": 3375} {"train_loss": -6.830653190612793, "global_step": 141752, "epoch": 3375} {"train_loss": -6.699244499206543, "global_step": 141753, "epoch": 3375} {"train_loss": -6.673708915710449, "global_step": 141754, "epoch": 3375} {"train_loss": -6.89084005355835, "global_step": 141755, "epoch": 3375} {"train_loss": -6.774950981140137, "global_step": 141756, "epoch": 3375} {"train_loss": -6.655303955078125, "global_step": 141757, "epoch": 3375} {"train_loss": -6.746046543121338, "global_step": 141758, "epoch": 3375} {"train_loss": -6.761631011962891, "global_step": 141759, "epoch": 3375} {"train_loss": -6.9631147384643555, "global_step": 141760, "epoch": 3375} {"train_loss": -6.85523796081543, "global_step": 141761, "epoch": 3375} {"train_loss": -6.748904228210449, "global_step": 141762, "epoch": 3375} {"train_loss": -6.66147518157959, "global_step": 141763, "epoch": 3375} {"train_loss": -6.7734375, "global_step": 141764, "epoch": 3375} {"train_loss": -6.6861066818237305, "global_step": 141765, "epoch": 3375} {"train_loss": -6.855500221252441, "global_step": 141766, "epoch": 3375} {"train_loss": -6.800237655639648, "global_step": 141767, "epoch": 3375} {"train_loss": -6.772739410400391, "global_step": 141768, "epoch": 3375} {"train_loss": -6.799518585205078, "global_step": 141769, "epoch": 3375} {"train_loss": -6.905435562133789, "global_step": 141770, "epoch": 3375} {"train_loss": -6.806232452392578, "global_step": 141771, "epoch": 3375} {"train_loss": -6.779513359069824, "global_step": 141772, "epoch": 3375} {"train_loss": -6.781893730163574, "global_step": 141773, "epoch": 3375} {"train_loss": -6.860969543457031, "global_step": 141774, "epoch": 3375} {"train_loss": -6.82460880279541, "global_step": 141775, "epoch": 3375} {"train_loss": -6.823604106903076, "global_step": 141776, "epoch": 3375} {"train_loss": -6.8845062255859375, "global_step": 141777, "epoch": 3375} {"train_loss": -6.734691143035889, "global_step": 141778, "epoch": 3375} {"train_loss": -6.804033279418945, "global_step": 141779, "epoch": 3375} {"train_loss": -6.680659294128418, "global_step": 141780, "epoch": 3375} {"train_loss": -6.768481254577637, "global_step": 141781, "epoch": 3375} {"train_loss": -6.757784366607666, "global_step": 141782, "epoch": 3375} {"train_loss": -6.874454975128174, "global_step": 141783, "epoch": 3375} {"train_loss": -6.754868507385254, "global_step": 141784, "epoch": 3375} {"train_loss": -6.79882287979126, "global_step": 141785, "epoch": 3375} {"train_loss": -6.665620803833008, "global_step": 141786, "epoch": 3375} {"train_loss": -6.859325408935547, "global_step": 141787, "epoch": 3375} {"train_loss": -6.751187324523926, "global_step": 141788, "epoch": 3375} {"train_loss": -6.670455455780029, "global_step": 141789, "epoch": 3375} {"train_loss": -6.847105026245117, "global_step": 141790, "epoch": 3375} {"train_loss": -6.779904331479754, "global_step": 141791, "epoch": 3375, "val_loss": 67381.6640625} {"train_loss": -6.711772441864014, "global_step": 141792, "epoch": 3376} {"train_loss": -6.8291401863098145, "global_step": 141793, "epoch": 3376} {"train_loss": -6.6875128746032715, "global_step": 141794, "epoch": 3376} {"train_loss": -6.780900001525879, "global_step": 141795, "epoch": 3376} {"train_loss": -6.8292107582092285, "global_step": 141796, "epoch": 3376} {"train_loss": -6.770867347717285, "global_step": 141797, "epoch": 3376} {"train_loss": -6.772566318511963, "global_step": 141798, "epoch": 3376} {"train_loss": -6.7334675788879395, "global_step": 141799, "epoch": 3376} {"train_loss": -6.7143144607543945, "global_step": 141800, "epoch": 3376} {"train_loss": -6.834362030029297, "global_step": 141801, "epoch": 3376} {"train_loss": -6.745328903198242, "global_step": 141802, "epoch": 3376} {"train_loss": -6.780045509338379, "global_step": 141803, "epoch": 3376} {"train_loss": -6.832283020019531, "global_step": 141804, "epoch": 3376} {"train_loss": -6.744411468505859, "global_step": 141805, "epoch": 3376} {"train_loss": -6.817386627197266, "global_step": 141806, "epoch": 3376} {"train_loss": -6.8228912353515625, "global_step": 141807, "epoch": 3376} {"train_loss": -6.73164176940918, "global_step": 141808, "epoch": 3376} {"train_loss": -6.861997604370117, "global_step": 141809, "epoch": 3376} {"train_loss": -6.730658054351807, "global_step": 141810, "epoch": 3376} {"train_loss": -6.699487686157227, "global_step": 141811, "epoch": 3376} {"train_loss": -6.755375385284424, "global_step": 141812, "epoch": 3376} {"train_loss": -6.799571514129639, "global_step": 141813, "epoch": 3376} {"train_loss": -6.766246318817139, "global_step": 141814, "epoch": 3376} {"train_loss": -6.903878211975098, "global_step": 141815, "epoch": 3376} {"train_loss": -6.7816619873046875, "global_step": 141816, "epoch": 3376} {"train_loss": -6.756341934204102, "global_step": 141817, "epoch": 3376} {"train_loss": -6.771744251251221, "global_step": 141818, "epoch": 3376} {"train_loss": -6.674274444580078, "global_step": 141819, "epoch": 3376} {"train_loss": -6.728416919708252, "global_step": 141820, "epoch": 3376} {"train_loss": -6.832169532775879, "global_step": 141821, "epoch": 3376} {"train_loss": -6.6865553855896, "global_step": 141822, "epoch": 3376} {"train_loss": -6.758408546447754, "global_step": 141823, "epoch": 3376} {"train_loss": -6.589676380157471, "global_step": 141824, "epoch": 3376} {"train_loss": -6.882232666015625, "global_step": 141825, "epoch": 3376} {"train_loss": -6.75172758102417, "global_step": 141826, "epoch": 3376} {"train_loss": -6.649450302124023, "global_step": 141827, "epoch": 3376} {"train_loss": -6.847799301147461, "global_step": 141828, "epoch": 3376} {"train_loss": -6.756160736083984, "global_step": 141829, "epoch": 3376} {"train_loss": -6.714993476867676, "global_step": 141830, "epoch": 3376} {"train_loss": -6.795352935791016, "global_step": 141831, "epoch": 3376} {"train_loss": -6.833377838134766, "global_step": 141832, "epoch": 3376} {"train_loss": -6.766623553775606, "global_step": 141833, "epoch": 3376, "val_loss": 67559.375} {"train_loss": -6.799715518951416, "global_step": 141834, "epoch": 3377} {"train_loss": -6.902437210083008, "global_step": 141835, "epoch": 3377} {"train_loss": -6.634734153747559, "global_step": 141836, "epoch": 3377} {"train_loss": -6.8056640625, "global_step": 141837, "epoch": 3377} {"train_loss": -6.572391510009766, "global_step": 141838, "epoch": 3377} {"train_loss": -6.788043022155762, "global_step": 141839, "epoch": 3377} {"train_loss": -6.8571248054504395, "global_step": 141840, "epoch": 3377} {"train_loss": -6.668065071105957, "global_step": 141841, "epoch": 3377} {"train_loss": -6.822100639343262, "global_step": 141842, "epoch": 3377} {"train_loss": -6.799386024475098, "global_step": 141843, "epoch": 3377} {"train_loss": -6.764811038970947, "global_step": 141844, "epoch": 3377} {"train_loss": -6.717746734619141, "global_step": 141845, "epoch": 3377} {"train_loss": -6.824490547180176, "global_step": 141846, "epoch": 3377} {"train_loss": -6.692986488342285, "global_step": 141847, "epoch": 3377} {"train_loss": -6.62591028213501, "global_step": 141848, "epoch": 3377} {"train_loss": -6.6997833251953125, "global_step": 141849, "epoch": 3377} {"train_loss": -6.5703043937683105, "global_step": 141850, "epoch": 3377} {"train_loss": -6.721061706542969, "global_step": 141851, "epoch": 3377} {"train_loss": -6.549289703369141, "global_step": 141852, "epoch": 3377} {"train_loss": -6.74652099609375, "global_step": 141853, "epoch": 3377} {"train_loss": -6.686130523681641, "global_step": 141854, "epoch": 3377} {"train_loss": -6.828348636627197, "global_step": 141855, "epoch": 3377} {"train_loss": -6.657135009765625, "global_step": 141856, "epoch": 3377} {"train_loss": -6.65479850769043, "global_step": 141857, "epoch": 3377} {"train_loss": -6.705023765563965, "global_step": 141858, "epoch": 3377} {"train_loss": -6.683402061462402, "global_step": 141859, "epoch": 3377} {"train_loss": -6.827332496643066, "global_step": 141860, "epoch": 3377} {"train_loss": -6.695003509521484, "global_step": 141861, "epoch": 3377} {"train_loss": -6.818160533905029, "global_step": 141862, "epoch": 3377} {"train_loss": -6.561396598815918, "global_step": 141863, "epoch": 3377} {"train_loss": -6.7026262283325195, "global_step": 141864, "epoch": 3377} {"train_loss": -6.770357131958008, "global_step": 141865, "epoch": 3377} {"train_loss": -6.722015380859375, "global_step": 141866, "epoch": 3377} {"train_loss": -6.652342796325684, "global_step": 141867, "epoch": 3377} {"train_loss": -6.694070816040039, "global_step": 141868, "epoch": 3377} {"train_loss": -6.69036865234375, "global_step": 141869, "epoch": 3377} {"train_loss": -6.685534477233887, "global_step": 141870, "epoch": 3377} {"train_loss": -6.839845657348633, "global_step": 141871, "epoch": 3377} {"train_loss": -6.794223785400391, "global_step": 141872, "epoch": 3377} {"train_loss": -6.881426811218262, "global_step": 141873, "epoch": 3377} {"train_loss": -6.750340938568115, "global_step": 141874, "epoch": 3377} {"train_loss": -6.729973770323253, "global_step": 141875, "epoch": 3377, "val_loss": 67454.53125} {"train_loss": -6.804616928100586, "global_step": 141876, "epoch": 3378} {"train_loss": -6.703729629516602, "global_step": 141877, "epoch": 3378} {"train_loss": -6.6332292556762695, "global_step": 141878, "epoch": 3378} {"train_loss": -6.822208404541016, "global_step": 141879, "epoch": 3378} {"train_loss": -6.68138313293457, "global_step": 141880, "epoch": 3378} {"train_loss": -6.742177963256836, "global_step": 141881, "epoch": 3378} {"train_loss": -6.822775363922119, "global_step": 141882, "epoch": 3378} {"train_loss": -6.8224897384643555, "global_step": 141883, "epoch": 3378} {"train_loss": -6.776660919189453, "global_step": 141884, "epoch": 3378} {"train_loss": -6.7265777587890625, "global_step": 141885, "epoch": 3378} {"train_loss": -6.799037933349609, "global_step": 141886, "epoch": 3378} {"train_loss": -6.859070777893066, "global_step": 141887, "epoch": 3378} {"train_loss": -6.796237945556641, "global_step": 141888, "epoch": 3378} {"train_loss": -6.791753768920898, "global_step": 141889, "epoch": 3378} {"train_loss": -6.757542133331299, "global_step": 141890, "epoch": 3378} {"train_loss": -6.792911529541016, "global_step": 141891, "epoch": 3378} {"train_loss": -6.868856906890869, "global_step": 141892, "epoch": 3378} {"train_loss": -6.823031425476074, "global_step": 141893, "epoch": 3378} {"train_loss": -6.731893062591553, "global_step": 141894, "epoch": 3378} {"train_loss": -6.817965507507324, "global_step": 141895, "epoch": 3378} {"train_loss": -6.897006988525391, "global_step": 141896, "epoch": 3378} {"train_loss": -6.713030815124512, "global_step": 141897, "epoch": 3378} {"train_loss": -6.8360466957092285, "global_step": 141898, "epoch": 3378} {"train_loss": -6.6940202713012695, "global_step": 141899, "epoch": 3378} {"train_loss": -6.815767288208008, "global_step": 141900, "epoch": 3378} {"train_loss": -6.802557945251465, "global_step": 141901, "epoch": 3378} {"train_loss": -6.636134147644043, "global_step": 141902, "epoch": 3378} {"train_loss": -6.767238616943359, "global_step": 141903, "epoch": 3378} {"train_loss": -6.6840105056762695, "global_step": 141904, "epoch": 3378} {"train_loss": -6.556506156921387, "global_step": 141905, "epoch": 3378} {"train_loss": -6.738953590393066, "global_step": 141906, "epoch": 3378} {"train_loss": -6.766798973083496, "global_step": 141907, "epoch": 3378} {"train_loss": -6.539194583892822, "global_step": 141908, "epoch": 3378} {"train_loss": -6.742685317993164, "global_step": 141909, "epoch": 3378} {"train_loss": -6.643762588500977, "global_step": 141910, "epoch": 3378} {"train_loss": -6.702785015106201, "global_step": 141911, "epoch": 3378} {"train_loss": -6.695131301879883, "global_step": 141912, "epoch": 3378} {"train_loss": -6.605557441711426, "global_step": 141913, "epoch": 3378} {"train_loss": -6.6517462730407715, "global_step": 141914, "epoch": 3378} {"train_loss": -6.575922966003418, "global_step": 141915, "epoch": 3378} {"train_loss": -6.822017669677734, "global_step": 141916, "epoch": 3378} {"train_loss": -6.739742324465797, "global_step": 141917, "epoch": 3378, "val_loss": 67213.5625} {"train_loss": -6.778571128845215, "global_step": 141918, "epoch": 3379} {"train_loss": -6.683403015136719, "global_step": 141919, "epoch": 3379} {"train_loss": -6.788256645202637, "global_step": 141920, "epoch": 3379} {"train_loss": -6.8488311767578125, "global_step": 141921, "epoch": 3379} {"train_loss": -6.751884937286377, "global_step": 141922, "epoch": 3379} {"train_loss": -6.791755199432373, "global_step": 141923, "epoch": 3379} {"train_loss": -6.800519943237305, "global_step": 141924, "epoch": 3379} {"train_loss": -6.712198257446289, "global_step": 141925, "epoch": 3379} {"train_loss": -6.767468452453613, "global_step": 141926, "epoch": 3379} {"train_loss": -6.715309143066406, "global_step": 141927, "epoch": 3379} {"train_loss": -6.788447380065918, "global_step": 141928, "epoch": 3379} {"train_loss": -6.833674430847168, "global_step": 141929, "epoch": 3379} {"train_loss": -6.823053359985352, "global_step": 141930, "epoch": 3379} {"train_loss": -6.748103141784668, "global_step": 141931, "epoch": 3379} {"train_loss": -6.614288330078125, "global_step": 141932, "epoch": 3379} {"train_loss": -6.703313827514648, "global_step": 141933, "epoch": 3379} {"train_loss": -6.737688064575195, "global_step": 141934, "epoch": 3379} {"train_loss": -6.669393062591553, "global_step": 141935, "epoch": 3379} {"train_loss": -6.828014850616455, "global_step": 141936, "epoch": 3379} {"train_loss": -6.8028435707092285, "global_step": 141937, "epoch": 3379} {"train_loss": -6.8447346687316895, "global_step": 141938, "epoch": 3379} {"train_loss": -6.707139015197754, "global_step": 141939, "epoch": 3379} {"train_loss": -6.715026378631592, "global_step": 141940, "epoch": 3379} {"train_loss": -6.913203239440918, "global_step": 141941, "epoch": 3379} {"train_loss": -6.806169509887695, "global_step": 141942, "epoch": 3379} {"train_loss": -6.759669303894043, "global_step": 141943, "epoch": 3379} {"train_loss": -6.726213455200195, "global_step": 141944, "epoch": 3379} {"train_loss": -6.741423606872559, "global_step": 141945, "epoch": 3379} {"train_loss": -6.787785053253174, "global_step": 141946, "epoch": 3379} {"train_loss": -6.908509731292725, "global_step": 141947, "epoch": 3379} {"train_loss": -6.80507755279541, "global_step": 141948, "epoch": 3379} {"train_loss": -6.810119152069092, "global_step": 141949, "epoch": 3379} {"train_loss": -6.796525001525879, "global_step": 141950, "epoch": 3379} {"train_loss": -6.718667984008789, "global_step": 141951, "epoch": 3379} {"train_loss": -6.793253421783447, "global_step": 141952, "epoch": 3379} {"train_loss": -6.728093147277832, "global_step": 141953, "epoch": 3379} {"train_loss": -6.810019493103027, "global_step": 141954, "epoch": 3379} {"train_loss": -6.831722736358643, "global_step": 141955, "epoch": 3379} {"train_loss": -6.696230888366699, "global_step": 141956, "epoch": 3379} {"train_loss": -6.786739349365234, "global_step": 141957, "epoch": 3379} {"train_loss": -6.755117893218994, "global_step": 141958, "epoch": 3379} {"train_loss": -6.772085893721807, "global_step": 141959, "epoch": 3379, "val_loss": 67486.1640625} {"train_loss": -6.803201675415039, "global_step": 141960, "epoch": 3380} {"train_loss": -6.829895496368408, "global_step": 141961, "epoch": 3380} {"train_loss": -6.751279830932617, "global_step": 141962, "epoch": 3380} {"train_loss": -6.80040979385376, "global_step": 141963, "epoch": 3380} {"train_loss": -6.804498195648193, "global_step": 141964, "epoch": 3380} {"train_loss": -6.97809362411499, "global_step": 141965, "epoch": 3380} {"train_loss": -6.782208442687988, "global_step": 141966, "epoch": 3380} {"train_loss": -6.856774806976318, "global_step": 141967, "epoch": 3380} {"train_loss": -6.7634172439575195, "global_step": 141968, "epoch": 3380} {"train_loss": -6.849889755249023, "global_step": 141969, "epoch": 3380} {"train_loss": -6.807704925537109, "global_step": 141970, "epoch": 3380} {"train_loss": -6.891075611114502, "global_step": 141971, "epoch": 3380} {"train_loss": -6.872204780578613, "global_step": 141972, "epoch": 3380} {"train_loss": -6.841221809387207, "global_step": 141973, "epoch": 3380} {"train_loss": -6.852520942687988, "global_step": 141974, "epoch": 3380} {"train_loss": -6.831125736236572, "global_step": 141975, "epoch": 3380} {"train_loss": -6.882621765136719, "global_step": 141976, "epoch": 3380} {"train_loss": -6.827546119689941, "global_step": 141977, "epoch": 3380} {"train_loss": -6.809035301208496, "global_step": 141978, "epoch": 3380} {"train_loss": -6.755020618438721, "global_step": 141979, "epoch": 3380} {"train_loss": -6.763149261474609, "global_step": 141980, "epoch": 3380} {"train_loss": -6.813724994659424, "global_step": 141981, "epoch": 3380} {"train_loss": -6.802647113800049, "global_step": 141982, "epoch": 3380} {"train_loss": -6.865668296813965, "global_step": 141983, "epoch": 3380} {"train_loss": -6.850461959838867, "global_step": 141984, "epoch": 3380} {"train_loss": -6.76705265045166, "global_step": 141985, "epoch": 3380} {"train_loss": -6.780857563018799, "global_step": 141986, "epoch": 3380} {"train_loss": -6.734853744506836, "global_step": 141987, "epoch": 3380} {"train_loss": -6.819085121154785, "global_step": 141988, "epoch": 3380} {"train_loss": -6.7936506271362305, "global_step": 141989, "epoch": 3380} {"train_loss": -6.90023136138916, "global_step": 141990, "epoch": 3380} {"train_loss": -6.8451409339904785, "global_step": 141991, "epoch": 3380} {"train_loss": -6.8003973960876465, "global_step": 141992, "epoch": 3380} {"train_loss": -6.904106616973877, "global_step": 141993, "epoch": 3380} {"train_loss": -6.7406229972839355, "global_step": 141994, "epoch": 3380} {"train_loss": -6.8476762771606445, "global_step": 141995, "epoch": 3380} {"train_loss": -6.773845672607422, "global_step": 141996, "epoch": 3380} {"train_loss": -6.777640342712402, "global_step": 141997, "epoch": 3380} {"train_loss": -6.870452404022217, "global_step": 141998, "epoch": 3380} {"train_loss": -6.773155689239502, "global_step": 141999, "epoch": 3380} {"train_loss": -6.771261215209961, "global_step": 142000, "epoch": 3380} {"train_loss": -6.818130004973638, "global_step": 142001, "epoch": 3380, "val_loss": 67379.484375} {"train_loss": -6.7950968742370605, "global_step": 142002, "epoch": 3381} {"train_loss": -6.851927757263184, "global_step": 142003, "epoch": 3381} {"train_loss": -6.88917350769043, "global_step": 142004, "epoch": 3381} {"train_loss": -6.74593448638916, "global_step": 142005, "epoch": 3381} {"train_loss": -6.82755184173584, "global_step": 142006, "epoch": 3381} {"train_loss": -6.698325157165527, "global_step": 142007, "epoch": 3381} {"train_loss": -6.786785125732422, "global_step": 142008, "epoch": 3381} {"train_loss": -6.831625938415527, "global_step": 142009, "epoch": 3381} {"train_loss": -6.813526153564453, "global_step": 142010, "epoch": 3381} {"train_loss": -6.808864593505859, "global_step": 142011, "epoch": 3381} {"train_loss": -6.844184398651123, "global_step": 142012, "epoch": 3381} {"train_loss": -6.778345108032227, "global_step": 142013, "epoch": 3381} {"train_loss": -6.781445026397705, "global_step": 142014, "epoch": 3381} {"train_loss": -6.847793102264404, "global_step": 142015, "epoch": 3381} {"train_loss": -6.868791580200195, "global_step": 142016, "epoch": 3381} {"train_loss": -6.8160481452941895, "global_step": 142017, "epoch": 3381} {"train_loss": -6.801850318908691, "global_step": 142018, "epoch": 3381} {"train_loss": -6.852935314178467, "global_step": 142019, "epoch": 3381} {"train_loss": -6.7696003913879395, "global_step": 142020, "epoch": 3381} {"train_loss": -6.8182573318481445, "global_step": 142021, "epoch": 3381} {"train_loss": -6.696828842163086, "global_step": 142022, "epoch": 3381} {"train_loss": -6.853583335876465, "global_step": 142023, "epoch": 3381} {"train_loss": -6.954652786254883, "global_step": 142024, "epoch": 3381} {"train_loss": -6.786348342895508, "global_step": 142025, "epoch": 3381} {"train_loss": -6.659455299377441, "global_step": 142026, "epoch": 3381} {"train_loss": -6.768207550048828, "global_step": 142027, "epoch": 3381} {"train_loss": -6.74851655960083, "global_step": 142028, "epoch": 3381} {"train_loss": -6.852116584777832, "global_step": 142029, "epoch": 3381} {"train_loss": -6.793807029724121, "global_step": 142030, "epoch": 3381} {"train_loss": -6.754510879516602, "global_step": 142031, "epoch": 3381} {"train_loss": -6.88942289352417, "global_step": 142032, "epoch": 3381} {"train_loss": -6.759110450744629, "global_step": 142033, "epoch": 3381} {"train_loss": -6.7480268478393555, "global_step": 142034, "epoch": 3381} {"train_loss": -6.786391735076904, "global_step": 142035, "epoch": 3381} {"train_loss": -6.840289115905762, "global_step": 142036, "epoch": 3381} {"train_loss": -6.808115005493164, "global_step": 142037, "epoch": 3381} {"train_loss": -6.8451666831970215, "global_step": 142038, "epoch": 3381} {"train_loss": -6.801894187927246, "global_step": 142039, "epoch": 3381} {"train_loss": -6.789412498474121, "global_step": 142040, "epoch": 3381} {"train_loss": -6.8242034912109375, "global_step": 142041, "epoch": 3381} {"train_loss": -6.829936504364014, "global_step": 142042, "epoch": 3381} {"train_loss": -6.803979930423555, "global_step": 142043, "epoch": 3381, "val_loss": 67444.2890625} {"train_loss": -6.7108988761901855, "global_step": 142044, "epoch": 3382} {"train_loss": -6.900056838989258, "global_step": 142045, "epoch": 3382} {"train_loss": -6.781140327453613, "global_step": 142046, "epoch": 3382} {"train_loss": -6.798645496368408, "global_step": 142047, "epoch": 3382} {"train_loss": -6.872517108917236, "global_step": 142048, "epoch": 3382} {"train_loss": -6.846933364868164, "global_step": 142049, "epoch": 3382} {"train_loss": -6.843530178070068, "global_step": 142050, "epoch": 3382} {"train_loss": -6.851263046264648, "global_step": 142051, "epoch": 3382} {"train_loss": -6.715230941772461, "global_step": 142052, "epoch": 3382} {"train_loss": -6.721127033233643, "global_step": 142053, "epoch": 3382} {"train_loss": -6.827200889587402, "global_step": 142054, "epoch": 3382} {"train_loss": -6.641100883483887, "global_step": 142055, "epoch": 3382} {"train_loss": -6.728967666625977, "global_step": 142056, "epoch": 3382} {"train_loss": -6.737120628356934, "global_step": 142057, "epoch": 3382} {"train_loss": -6.625975608825684, "global_step": 142058, "epoch": 3382} {"train_loss": -6.6543731689453125, "global_step": 142059, "epoch": 3382} {"train_loss": -6.7007975578308105, "global_step": 142060, "epoch": 3382} {"train_loss": -6.650973796844482, "global_step": 142061, "epoch": 3382} {"train_loss": -6.834211349487305, "global_step": 142062, "epoch": 3382} {"train_loss": -6.790825843811035, "global_step": 142063, "epoch": 3382} {"train_loss": -6.656824111938477, "global_step": 142064, "epoch": 3382} {"train_loss": -6.872247219085693, "global_step": 142065, "epoch": 3382} {"train_loss": -6.74777889251709, "global_step": 142066, "epoch": 3382} {"train_loss": -6.612015724182129, "global_step": 142067, "epoch": 3382} {"train_loss": -6.728288173675537, "global_step": 142068, "epoch": 3382} {"train_loss": -6.804078102111816, "global_step": 142069, "epoch": 3382} {"train_loss": -6.72613000869751, "global_step": 142070, "epoch": 3382} {"train_loss": -6.804333686828613, "global_step": 142071, "epoch": 3382} {"train_loss": -6.817720413208008, "global_step": 142072, "epoch": 3382} {"train_loss": -6.770988464355469, "global_step": 142073, "epoch": 3382} {"train_loss": -6.800478935241699, "global_step": 142074, "epoch": 3382} {"train_loss": -6.74318790435791, "global_step": 142075, "epoch": 3382} {"train_loss": -6.670352458953857, "global_step": 142076, "epoch": 3382} {"train_loss": -6.802597999572754, "global_step": 142077, "epoch": 3382} {"train_loss": -6.803409099578857, "global_step": 142078, "epoch": 3382} {"train_loss": -6.841562271118164, "global_step": 142079, "epoch": 3382} {"train_loss": -6.75840950012207, "global_step": 142080, "epoch": 3382} {"train_loss": -6.779412269592285, "global_step": 142081, "epoch": 3382} {"train_loss": -6.740533351898193, "global_step": 142082, "epoch": 3382} {"train_loss": -6.774508476257324, "global_step": 142083, "epoch": 3382} {"train_loss": -6.849890232086182, "global_step": 142084, "epoch": 3382} {"train_loss": -6.763903776804606, "global_step": 142085, "epoch": 3382, "val_loss": 67256.6875} {"train_loss": -6.846561431884766, "global_step": 142086, "epoch": 3383} {"train_loss": -6.8124566078186035, "global_step": 142087, "epoch": 3383} {"train_loss": -6.736417770385742, "global_step": 142088, "epoch": 3383} {"train_loss": -6.822856903076172, "global_step": 142089, "epoch": 3383} {"train_loss": -6.903059482574463, "global_step": 142090, "epoch": 3383} {"train_loss": -6.88810396194458, "global_step": 142091, "epoch": 3383} {"train_loss": -6.842216968536377, "global_step": 142092, "epoch": 3383} {"train_loss": -6.8705854415893555, "global_step": 142093, "epoch": 3383} {"train_loss": -6.862621307373047, "global_step": 142094, "epoch": 3383} {"train_loss": -6.818639755249023, "global_step": 142095, "epoch": 3383} {"train_loss": -6.811611175537109, "global_step": 142096, "epoch": 3383} {"train_loss": -6.861692905426025, "global_step": 142097, "epoch": 3383} {"train_loss": -6.702234268188477, "global_step": 142098, "epoch": 3383} {"train_loss": -6.692980766296387, "global_step": 142099, "epoch": 3383} {"train_loss": -6.948855400085449, "global_step": 142100, "epoch": 3383} {"train_loss": -6.836442947387695, "global_step": 142101, "epoch": 3383} {"train_loss": -6.836906909942627, "global_step": 142102, "epoch": 3383} {"train_loss": -6.946207046508789, "global_step": 142103, "epoch": 3383} {"train_loss": -6.773247241973877, "global_step": 142104, "epoch": 3383} {"train_loss": -6.831496715545654, "global_step": 142105, "epoch": 3383} {"train_loss": -6.74455451965332, "global_step": 142106, "epoch": 3383} {"train_loss": -6.751991271972656, "global_step": 142107, "epoch": 3383} {"train_loss": -6.780085563659668, "global_step": 142108, "epoch": 3383} {"train_loss": -6.9052252769470215, "global_step": 142109, "epoch": 3383} {"train_loss": -6.910329818725586, "global_step": 142110, "epoch": 3383} {"train_loss": -6.770583629608154, "global_step": 142111, "epoch": 3383} {"train_loss": -6.71852445602417, "global_step": 142112, "epoch": 3383} {"train_loss": -6.791507720947266, "global_step": 142113, "epoch": 3383} {"train_loss": -6.793771743774414, "global_step": 142114, "epoch": 3383} {"train_loss": -6.851464748382568, "global_step": 142115, "epoch": 3383} {"train_loss": -6.995862007141113, "global_step": 142116, "epoch": 3383} {"train_loss": -6.697098731994629, "global_step": 142117, "epoch": 3383} {"train_loss": -6.860372543334961, "global_step": 142118, "epoch": 3383} {"train_loss": -6.715175628662109, "global_step": 142119, "epoch": 3383} {"train_loss": -6.810549259185791, "global_step": 142120, "epoch": 3383} {"train_loss": -6.870453834533691, "global_step": 142121, "epoch": 3383} {"train_loss": -6.876190662384033, "global_step": 142122, "epoch": 3383} {"train_loss": -6.875433444976807, "global_step": 142123, "epoch": 3383} {"train_loss": -6.7842254638671875, "global_step": 142124, "epoch": 3383} {"train_loss": -6.860729217529297, "global_step": 142125, "epoch": 3383} {"train_loss": -6.702865123748779, "global_step": 142126, "epoch": 3383} {"train_loss": -6.818523985998971, "global_step": 142127, "epoch": 3383, "val_loss": 67435.203125} {"train_loss": -6.924654960632324, "global_step": 142128, "epoch": 3384} {"train_loss": -6.748842239379883, "global_step": 142129, "epoch": 3384} {"train_loss": -6.698149681091309, "global_step": 142130, "epoch": 3384} {"train_loss": -6.795628547668457, "global_step": 142131, "epoch": 3384} {"train_loss": -6.785408973693848, "global_step": 142132, "epoch": 3384} {"train_loss": -6.736817359924316, "global_step": 142133, "epoch": 3384} {"train_loss": -6.805627822875977, "global_step": 142134, "epoch": 3384} {"train_loss": -6.593908309936523, "global_step": 142135, "epoch": 3384} {"train_loss": -6.752545356750488, "global_step": 142136, "epoch": 3384} {"train_loss": -6.754176139831543, "global_step": 142137, "epoch": 3384} {"train_loss": -6.781623840332031, "global_step": 142138, "epoch": 3384} {"train_loss": -6.782163143157959, "global_step": 142139, "epoch": 3384} {"train_loss": -6.713603973388672, "global_step": 142140, "epoch": 3384} {"train_loss": -6.782021999359131, "global_step": 142141, "epoch": 3384} {"train_loss": -6.810379981994629, "global_step": 142142, "epoch": 3384} {"train_loss": -6.762969970703125, "global_step": 142143, "epoch": 3384} {"train_loss": -6.8672776222229, "global_step": 142144, "epoch": 3384} {"train_loss": -6.725796699523926, "global_step": 142145, "epoch": 3384} {"train_loss": -6.775251388549805, "global_step": 142146, "epoch": 3384} {"train_loss": -6.774314880371094, "global_step": 142147, "epoch": 3384} {"train_loss": -6.781336784362793, "global_step": 142148, "epoch": 3384} {"train_loss": -6.563329696655273, "global_step": 142149, "epoch": 3384} {"train_loss": -6.781796455383301, "global_step": 142150, "epoch": 3384} {"train_loss": -6.832965850830078, "global_step": 142151, "epoch": 3384} {"train_loss": -6.645330429077148, "global_step": 142152, "epoch": 3384} {"train_loss": -6.8018693923950195, "global_step": 142153, "epoch": 3384} {"train_loss": -6.824879169464111, "global_step": 142154, "epoch": 3384} {"train_loss": -6.759485244750977, "global_step": 142155, "epoch": 3384} {"train_loss": -6.8073344230651855, "global_step": 142156, "epoch": 3384} {"train_loss": -6.747398853302002, "global_step": 142157, "epoch": 3384} {"train_loss": -6.736933708190918, "global_step": 142158, "epoch": 3384} {"train_loss": -6.72076416015625, "global_step": 142159, "epoch": 3384} {"train_loss": -6.800168991088867, "global_step": 142160, "epoch": 3384} {"train_loss": -6.888863563537598, "global_step": 142161, "epoch": 3384} {"train_loss": -6.8154401779174805, "global_step": 142162, "epoch": 3384} {"train_loss": -6.669134616851807, "global_step": 142163, "epoch": 3384} {"train_loss": -6.777212142944336, "global_step": 142164, "epoch": 3384} {"train_loss": -6.7267632484436035, "global_step": 142165, "epoch": 3384} {"train_loss": -6.8114519119262695, "global_step": 142166, "epoch": 3384} {"train_loss": -6.87980318069458, "global_step": 142167, "epoch": 3384} {"train_loss": -6.8495283126831055, "global_step": 142168, "epoch": 3384} {"train_loss": -6.772396212532406, "global_step": 142169, "epoch": 3384, "val_loss": 67514.875} {"train_loss": -6.949578285217285, "global_step": 142170, "epoch": 3385} {"train_loss": -6.8927154541015625, "global_step": 142171, "epoch": 3385} {"train_loss": -6.971402168273926, "global_step": 142172, "epoch": 3385} {"train_loss": -6.797737121582031, "global_step": 142173, "epoch": 3385} {"train_loss": -6.807605743408203, "global_step": 142174, "epoch": 3385} {"train_loss": -6.802575588226318, "global_step": 142175, "epoch": 3385} {"train_loss": -6.732224464416504, "global_step": 142176, "epoch": 3385} {"train_loss": -6.859360694885254, "global_step": 142177, "epoch": 3385} {"train_loss": -6.803881645202637, "global_step": 142178, "epoch": 3385} {"train_loss": -6.7813825607299805, "global_step": 142179, "epoch": 3385} {"train_loss": -6.924526691436768, "global_step": 142180, "epoch": 3385} {"train_loss": -6.901312828063965, "global_step": 142181, "epoch": 3385} {"train_loss": -6.868017196655273, "global_step": 142182, "epoch": 3385} {"train_loss": -6.850613594055176, "global_step": 142183, "epoch": 3385} {"train_loss": -6.810376167297363, "global_step": 142184, "epoch": 3385} {"train_loss": -6.766408920288086, "global_step": 142185, "epoch": 3385} {"train_loss": -6.854295253753662, "global_step": 142186, "epoch": 3385} {"train_loss": -6.824708461761475, "global_step": 142187, "epoch": 3385} {"train_loss": -6.755212306976318, "global_step": 142188, "epoch": 3385} {"train_loss": -6.78352165222168, "global_step": 142189, "epoch": 3385} {"train_loss": -6.756677150726318, "global_step": 142190, "epoch": 3385} {"train_loss": -6.794901371002197, "global_step": 142191, "epoch": 3385} {"train_loss": -6.799972057342529, "global_step": 142192, "epoch": 3385} {"train_loss": -6.821933746337891, "global_step": 142193, "epoch": 3385} {"train_loss": -6.733250617980957, "global_step": 142194, "epoch": 3385} {"train_loss": -6.675492763519287, "global_step": 142195, "epoch": 3385} {"train_loss": -6.747284889221191, "global_step": 142196, "epoch": 3385} {"train_loss": -6.7628583908081055, "global_step": 142197, "epoch": 3385} {"train_loss": -6.784829139709473, "global_step": 142198, "epoch": 3385} {"train_loss": -6.806514739990234, "global_step": 142199, "epoch": 3385} {"train_loss": -6.792484283447266, "global_step": 142200, "epoch": 3385} {"train_loss": -6.818765640258789, "global_step": 142201, "epoch": 3385} {"train_loss": -6.835073471069336, "global_step": 142202, "epoch": 3385} {"train_loss": -6.788599014282227, "global_step": 142203, "epoch": 3385} {"train_loss": -6.809944152832031, "global_step": 142204, "epoch": 3385} {"train_loss": -6.757458686828613, "global_step": 142205, "epoch": 3385} {"train_loss": -6.722646236419678, "global_step": 142206, "epoch": 3385} {"train_loss": -6.745477199554443, "global_step": 142207, "epoch": 3385} {"train_loss": -6.80745792388916, "global_step": 142208, "epoch": 3385} {"train_loss": -6.862429141998291, "global_step": 142209, "epoch": 3385} {"train_loss": -6.830143451690674, "global_step": 142210, "epoch": 3385} {"train_loss": -6.81144650777181, "global_step": 142211, "epoch": 3385, "val_loss": 67406.7578125} {"train_loss": -6.940279006958008, "global_step": 142212, "epoch": 3386} {"train_loss": -6.6679253578186035, "global_step": 142213, "epoch": 3386} {"train_loss": -6.779265403747559, "global_step": 142214, "epoch": 3386} {"train_loss": -6.7566237449646, "global_step": 142215, "epoch": 3386} {"train_loss": -6.834016799926758, "global_step": 142216, "epoch": 3386} {"train_loss": -6.716768741607666, "global_step": 142217, "epoch": 3386} {"train_loss": -6.851222038269043, "global_step": 142218, "epoch": 3386} {"train_loss": -6.8048014640808105, "global_step": 142219, "epoch": 3386} {"train_loss": -6.668432712554932, "global_step": 142220, "epoch": 3386} {"train_loss": -6.738300323486328, "global_step": 142221, "epoch": 3386} {"train_loss": -6.823813438415527, "global_step": 142222, "epoch": 3386} {"train_loss": -6.801794528961182, "global_step": 142223, "epoch": 3386} {"train_loss": -6.623648643493652, "global_step": 142224, "epoch": 3386} {"train_loss": -6.777882099151611, "global_step": 142225, "epoch": 3386} {"train_loss": -6.8055267333984375, "global_step": 142226, "epoch": 3386} {"train_loss": -6.72352409362793, "global_step": 142227, "epoch": 3386} {"train_loss": -6.840648651123047, "global_step": 142228, "epoch": 3386} {"train_loss": -6.622694492340088, "global_step": 142229, "epoch": 3386} {"train_loss": -6.861018657684326, "global_step": 142230, "epoch": 3386} {"train_loss": -6.723097801208496, "global_step": 142231, "epoch": 3386} {"train_loss": -6.830294609069824, "global_step": 142232, "epoch": 3386} {"train_loss": -6.902387619018555, "global_step": 142233, "epoch": 3386} {"train_loss": -6.758625507354736, "global_step": 142234, "epoch": 3386} {"train_loss": -6.717349052429199, "global_step": 142235, "epoch": 3386} {"train_loss": -6.765377044677734, "global_step": 142236, "epoch": 3386} {"train_loss": -6.818666458129883, "global_step": 142237, "epoch": 3386} {"train_loss": -6.784741401672363, "global_step": 142238, "epoch": 3386} {"train_loss": -6.844125270843506, "global_step": 142239, "epoch": 3386} {"train_loss": -6.71259880065918, "global_step": 142240, "epoch": 3386} {"train_loss": -6.8382062911987305, "global_step": 142241, "epoch": 3386} {"train_loss": -6.825546741485596, "global_step": 142242, "epoch": 3386} {"train_loss": -6.818317413330078, "global_step": 142243, "epoch": 3386} {"train_loss": -6.763937473297119, "global_step": 142244, "epoch": 3386} {"train_loss": -6.807730197906494, "global_step": 142245, "epoch": 3386} {"train_loss": -6.869060039520264, "global_step": 142246, "epoch": 3386} {"train_loss": -6.849742889404297, "global_step": 142247, "epoch": 3386} {"train_loss": -6.812496185302734, "global_step": 142248, "epoch": 3386} {"train_loss": -6.86978816986084, "global_step": 142249, "epoch": 3386} {"train_loss": -6.839656352996826, "global_step": 142250, "epoch": 3386} {"train_loss": -6.844306468963623, "global_step": 142251, "epoch": 3386} {"train_loss": -6.754047870635986, "global_step": 142252, "epoch": 3386} {"train_loss": -6.789050147646949, "global_step": 142253, "epoch": 3386, "val_loss": 67385.3984375} {"train_loss": -6.8341875076293945, "global_step": 142254, "epoch": 3387} {"train_loss": -6.855045318603516, "global_step": 142255, "epoch": 3387} {"train_loss": -6.832760810852051, "global_step": 142256, "epoch": 3387} {"train_loss": -6.734105587005615, "global_step": 142257, "epoch": 3387} {"train_loss": -6.790740966796875, "global_step": 142258, "epoch": 3387} {"train_loss": -6.817005157470703, "global_step": 142259, "epoch": 3387} {"train_loss": -6.764251708984375, "global_step": 142260, "epoch": 3387} {"train_loss": -6.712719440460205, "global_step": 142261, "epoch": 3387} {"train_loss": -6.706157684326172, "global_step": 142262, "epoch": 3387} {"train_loss": -6.725494384765625, "global_step": 142263, "epoch": 3387} {"train_loss": -6.778611183166504, "global_step": 142264, "epoch": 3387} {"train_loss": -6.622772693634033, "global_step": 142265, "epoch": 3387} {"train_loss": -6.728675842285156, "global_step": 142266, "epoch": 3387} {"train_loss": -6.657819747924805, "global_step": 142267, "epoch": 3387} {"train_loss": -6.711338043212891, "global_step": 142268, "epoch": 3387} {"train_loss": -6.677700042724609, "global_step": 142269, "epoch": 3387} {"train_loss": -6.804056167602539, "global_step": 142270, "epoch": 3387} {"train_loss": -6.724071025848389, "global_step": 142271, "epoch": 3387} {"train_loss": -6.71641731262207, "global_step": 142272, "epoch": 3387} {"train_loss": -6.713681697845459, "global_step": 142273, "epoch": 3387} {"train_loss": -6.805161952972412, "global_step": 142274, "epoch": 3387} {"train_loss": -6.728585243225098, "global_step": 142275, "epoch": 3387} {"train_loss": -6.644903182983398, "global_step": 142276, "epoch": 3387} {"train_loss": -6.677263259887695, "global_step": 142277, "epoch": 3387} {"train_loss": -6.713089466094971, "global_step": 142278, "epoch": 3387} {"train_loss": -6.846040725708008, "global_step": 142279, "epoch": 3387} {"train_loss": -6.719013690948486, "global_step": 142280, "epoch": 3387} {"train_loss": -6.791871070861816, "global_step": 142281, "epoch": 3387} {"train_loss": -6.776278495788574, "global_step": 142282, "epoch": 3387} {"train_loss": -6.813150405883789, "global_step": 142283, "epoch": 3387} {"train_loss": -6.854262351989746, "global_step": 142284, "epoch": 3387} {"train_loss": -6.705081939697266, "global_step": 142285, "epoch": 3387} {"train_loss": -6.78078556060791, "global_step": 142286, "epoch": 3387} {"train_loss": -6.70530366897583, "global_step": 142287, "epoch": 3387} {"train_loss": -6.732378959655762, "global_step": 142288, "epoch": 3387} {"train_loss": -6.834009170532227, "global_step": 142289, "epoch": 3387} {"train_loss": -6.856366157531738, "global_step": 142290, "epoch": 3387} {"train_loss": -6.809551239013672, "global_step": 142291, "epoch": 3387} {"train_loss": -6.678986549377441, "global_step": 142292, "epoch": 3387} {"train_loss": -6.639668941497803, "global_step": 142293, "epoch": 3387} {"train_loss": -6.736569404602051, "global_step": 142294, "epoch": 3387} {"train_loss": -6.750636066709246, "global_step": 142295, "epoch": 3387, "val_loss": 67361.671875} {"train_loss": -6.706499099731445, "global_step": 142296, "epoch": 3388} {"train_loss": -6.769165992736816, "global_step": 142297, "epoch": 3388} {"train_loss": -6.796728610992432, "global_step": 142298, "epoch": 3388} {"train_loss": -6.651620864868164, "global_step": 142299, "epoch": 3388} {"train_loss": -6.7662787437438965, "global_step": 142300, "epoch": 3388} {"train_loss": -6.67599630355835, "global_step": 142301, "epoch": 3388} {"train_loss": -6.723200798034668, "global_step": 142302, "epoch": 3388} {"train_loss": -6.753879070281982, "global_step": 142303, "epoch": 3388} {"train_loss": -6.759650230407715, "global_step": 142304, "epoch": 3388} {"train_loss": -6.626291751861572, "global_step": 142305, "epoch": 3388} {"train_loss": -6.715672016143799, "global_step": 142306, "epoch": 3388} {"train_loss": -6.709150314331055, "global_step": 142307, "epoch": 3388} {"train_loss": -6.589897632598877, "global_step": 142308, "epoch": 3388} {"train_loss": -6.769417762756348, "global_step": 142309, "epoch": 3388} {"train_loss": -6.685546875, "global_step": 142310, "epoch": 3388} {"train_loss": -6.651512145996094, "global_step": 142311, "epoch": 3388} {"train_loss": -6.716215133666992, "global_step": 142312, "epoch": 3388} {"train_loss": -6.701977729797363, "global_step": 142313, "epoch": 3388} {"train_loss": -6.799294471740723, "global_step": 142314, "epoch": 3388} {"train_loss": -6.724786281585693, "global_step": 142315, "epoch": 3388} {"train_loss": -6.905000686645508, "global_step": 142316, "epoch": 3388} {"train_loss": -6.772653579711914, "global_step": 142317, "epoch": 3388} {"train_loss": -6.758673667907715, "global_step": 142318, "epoch": 3388} {"train_loss": -6.854157447814941, "global_step": 142319, "epoch": 3388} {"train_loss": -6.8075761795043945, "global_step": 142320, "epoch": 3388} {"train_loss": -6.727969169616699, "global_step": 142321, "epoch": 3388} {"train_loss": -6.841777324676514, "global_step": 142322, "epoch": 3388} {"train_loss": -6.990525245666504, "global_step": 142323, "epoch": 3388} {"train_loss": -6.681781768798828, "global_step": 142324, "epoch": 3388} {"train_loss": -6.9013237953186035, "global_step": 142325, "epoch": 3388} {"train_loss": -6.741752624511719, "global_step": 142326, "epoch": 3388} {"train_loss": -6.882887363433838, "global_step": 142327, "epoch": 3388} {"train_loss": -6.848883152008057, "global_step": 142328, "epoch": 3388} {"train_loss": -6.852390289306641, "global_step": 142329, "epoch": 3388} {"train_loss": -6.780508041381836, "global_step": 142330, "epoch": 3388} {"train_loss": -6.81787633895874, "global_step": 142331, "epoch": 3388} {"train_loss": -6.793935298919678, "global_step": 142332, "epoch": 3388} {"train_loss": -6.924231052398682, "global_step": 142333, "epoch": 3388} {"train_loss": -6.836310386657715, "global_step": 142334, "epoch": 3388} {"train_loss": -6.762365818023682, "global_step": 142335, "epoch": 3388} {"train_loss": -6.726043701171875, "global_step": 142336, "epoch": 3388} {"train_loss": -6.769936368578956, "global_step": 142337, "epoch": 3388, "val_loss": 67342.953125} {"train_loss": -6.75047492980957, "global_step": 142338, "epoch": 3389} {"train_loss": -6.7011942863464355, "global_step": 142339, "epoch": 3389} {"train_loss": -6.809384822845459, "global_step": 142340, "epoch": 3389} {"train_loss": -6.7286882400512695, "global_step": 142341, "epoch": 3389} {"train_loss": -6.815773010253906, "global_step": 142342, "epoch": 3389} {"train_loss": -6.8456854820251465, "global_step": 142343, "epoch": 3389} {"train_loss": -6.80775260925293, "global_step": 142344, "epoch": 3389} {"train_loss": -6.660113334655762, "global_step": 142345, "epoch": 3389} {"train_loss": -6.797576904296875, "global_step": 142346, "epoch": 3389} {"train_loss": -6.653739929199219, "global_step": 142347, "epoch": 3389} {"train_loss": -6.7210869789123535, "global_step": 142348, "epoch": 3389} {"train_loss": -6.754144668579102, "global_step": 142349, "epoch": 3389} {"train_loss": -6.671812057495117, "global_step": 142350, "epoch": 3389} {"train_loss": -6.7411298751831055, "global_step": 142351, "epoch": 3389} {"train_loss": -6.753194332122803, "global_step": 142352, "epoch": 3389} {"train_loss": -6.756299018859863, "global_step": 142353, "epoch": 3389} {"train_loss": -6.728925704956055, "global_step": 142354, "epoch": 3389} {"train_loss": -6.757349014282227, "global_step": 142355, "epoch": 3389} {"train_loss": -6.686100959777832, "global_step": 142356, "epoch": 3389} {"train_loss": -6.793303489685059, "global_step": 142357, "epoch": 3389} {"train_loss": -6.897825241088867, "global_step": 142358, "epoch": 3389} {"train_loss": -6.834103584289551, "global_step": 142359, "epoch": 3389} {"train_loss": -6.740315914154053, "global_step": 142360, "epoch": 3389} {"train_loss": -6.826442718505859, "global_step": 142361, "epoch": 3389} {"train_loss": -6.658121109008789, "global_step": 142362, "epoch": 3389} {"train_loss": -6.7168498039245605, "global_step": 142363, "epoch": 3389} {"train_loss": -6.79008150100708, "global_step": 142364, "epoch": 3389} {"train_loss": -6.716346740722656, "global_step": 142365, "epoch": 3389} {"train_loss": -6.828286647796631, "global_step": 142366, "epoch": 3389} {"train_loss": -6.773934364318848, "global_step": 142367, "epoch": 3389} {"train_loss": -6.742805480957031, "global_step": 142368, "epoch": 3389} {"train_loss": -6.770892143249512, "global_step": 142369, "epoch": 3389} {"train_loss": -6.707076072692871, "global_step": 142370, "epoch": 3389} {"train_loss": -6.769355773925781, "global_step": 142371, "epoch": 3389} {"train_loss": -6.775829315185547, "global_step": 142372, "epoch": 3389} {"train_loss": -6.715970039367676, "global_step": 142373, "epoch": 3389} {"train_loss": -6.773445129394531, "global_step": 142374, "epoch": 3389} {"train_loss": -6.805600166320801, "global_step": 142375, "epoch": 3389} {"train_loss": -6.782176971435547, "global_step": 142376, "epoch": 3389} {"train_loss": -6.743353843688965, "global_step": 142377, "epoch": 3389} {"train_loss": -6.832550525665283, "global_step": 142378, "epoch": 3389} {"train_loss": -6.759301162901378, "global_step": 142379, "epoch": 3389, "val_loss": 67552.9296875} {"train_loss": -6.787812232971191, "global_step": 142380, "epoch": 3390} {"train_loss": -6.7462310791015625, "global_step": 142381, "epoch": 3390} {"train_loss": -6.755095481872559, "global_step": 142382, "epoch": 3390} {"train_loss": -6.702695369720459, "global_step": 142383, "epoch": 3390} {"train_loss": -6.700606822967529, "global_step": 142384, "epoch": 3390} {"train_loss": -6.777848243713379, "global_step": 142385, "epoch": 3390} {"train_loss": -6.7335524559021, "global_step": 142386, "epoch": 3390} {"train_loss": -6.8688483238220215, "global_step": 142387, "epoch": 3390} {"train_loss": -6.780629634857178, "global_step": 142388, "epoch": 3390} {"train_loss": -6.695333480834961, "global_step": 142389, "epoch": 3390} {"train_loss": -6.875611305236816, "global_step": 142390, "epoch": 3390} {"train_loss": -6.714348793029785, "global_step": 142391, "epoch": 3390} {"train_loss": -6.743840217590332, "global_step": 142392, "epoch": 3390} {"train_loss": -6.817824363708496, "global_step": 142393, "epoch": 3390} {"train_loss": -6.7367024421691895, "global_step": 142394, "epoch": 3390} {"train_loss": -6.746162414550781, "global_step": 142395, "epoch": 3390} {"train_loss": -6.832581520080566, "global_step": 142396, "epoch": 3390} {"train_loss": -6.6995697021484375, "global_step": 142397, "epoch": 3390} {"train_loss": -6.874068737030029, "global_step": 142398, "epoch": 3390} {"train_loss": -6.664571762084961, "global_step": 142399, "epoch": 3390} {"train_loss": -6.779628753662109, "global_step": 142400, "epoch": 3390} {"train_loss": -6.757734298706055, "global_step": 142401, "epoch": 3390} {"train_loss": -6.7008280754089355, "global_step": 142402, "epoch": 3390} {"train_loss": -6.843739986419678, "global_step": 142403, "epoch": 3390} {"train_loss": -6.756147384643555, "global_step": 142404, "epoch": 3390} {"train_loss": -6.770876884460449, "global_step": 142405, "epoch": 3390} {"train_loss": -6.927484512329102, "global_step": 142406, "epoch": 3390} {"train_loss": -6.822613716125488, "global_step": 142407, "epoch": 3390} {"train_loss": -6.833992004394531, "global_step": 142408, "epoch": 3390} {"train_loss": -6.816293239593506, "global_step": 142409, "epoch": 3390} {"train_loss": -6.796636581420898, "global_step": 142410, "epoch": 3390} {"train_loss": -6.796092987060547, "global_step": 142411, "epoch": 3390} {"train_loss": -6.731961250305176, "global_step": 142412, "epoch": 3390} {"train_loss": -6.863347053527832, "global_step": 142413, "epoch": 3390} {"train_loss": -6.69603157043457, "global_step": 142414, "epoch": 3390} {"train_loss": -6.83439826965332, "global_step": 142415, "epoch": 3390} {"train_loss": -6.8322882652282715, "global_step": 142416, "epoch": 3390} {"train_loss": -6.7716546058654785, "global_step": 142417, "epoch": 3390} {"train_loss": -6.783844470977783, "global_step": 142418, "epoch": 3390} {"train_loss": -6.8512773513793945, "global_step": 142419, "epoch": 3390} {"train_loss": -6.725070953369141, "global_step": 142420, "epoch": 3390} {"train_loss": -6.778978608903431, "global_step": 142421, "epoch": 3390, "val_loss": 67490.484375} {"train_loss": -6.698142051696777, "global_step": 142422, "epoch": 3391} {"train_loss": -6.685737609863281, "global_step": 142423, "epoch": 3391} {"train_loss": -6.655425071716309, "global_step": 142424, "epoch": 3391} {"train_loss": -6.764327049255371, "global_step": 142425, "epoch": 3391} {"train_loss": -6.891358375549316, "global_step": 142426, "epoch": 3391} {"train_loss": -6.680991172790527, "global_step": 142427, "epoch": 3391} {"train_loss": -6.665773391723633, "global_step": 142428, "epoch": 3391} {"train_loss": -6.721475601196289, "global_step": 142429, "epoch": 3391} {"train_loss": -6.7310471534729, "global_step": 142430, "epoch": 3391} {"train_loss": -6.794088363647461, "global_step": 142431, "epoch": 3391} {"train_loss": -6.730866432189941, "global_step": 142432, "epoch": 3391} {"train_loss": -6.75133752822876, "global_step": 142433, "epoch": 3391} {"train_loss": -6.670882701873779, "global_step": 142434, "epoch": 3391} {"train_loss": -6.75239372253418, "global_step": 142435, "epoch": 3391} {"train_loss": -6.737698078155518, "global_step": 142436, "epoch": 3391} {"train_loss": -6.693889617919922, "global_step": 142437, "epoch": 3391} {"train_loss": -6.772438049316406, "global_step": 142438, "epoch": 3391} {"train_loss": -6.6690673828125, "global_step": 142439, "epoch": 3391} {"train_loss": -6.755675792694092, "global_step": 142440, "epoch": 3391} {"train_loss": -6.746401309967041, "global_step": 142441, "epoch": 3391} {"train_loss": -6.6847124099731445, "global_step": 142442, "epoch": 3391} {"train_loss": -6.766993522644043, "global_step": 142443, "epoch": 3391} {"train_loss": -6.742727756500244, "global_step": 142444, "epoch": 3391} {"train_loss": -6.881392478942871, "global_step": 142445, "epoch": 3391} {"train_loss": -6.767489433288574, "global_step": 142446, "epoch": 3391} {"train_loss": -6.867740631103516, "global_step": 142447, "epoch": 3391} {"train_loss": -6.729463577270508, "global_step": 142448, "epoch": 3391} {"train_loss": -6.74745512008667, "global_step": 142449, "epoch": 3391} {"train_loss": -6.717855930328369, "global_step": 142450, "epoch": 3391} {"train_loss": -6.6866044998168945, "global_step": 142451, "epoch": 3391} {"train_loss": -6.825977325439453, "global_step": 142452, "epoch": 3391} {"train_loss": -6.64727783203125, "global_step": 142453, "epoch": 3391} {"train_loss": -6.696414947509766, "global_step": 142454, "epoch": 3391} {"train_loss": -6.777763366699219, "global_step": 142455, "epoch": 3391} {"train_loss": -6.734626770019531, "global_step": 142456, "epoch": 3391} {"train_loss": -6.805065155029297, "global_step": 142457, "epoch": 3391} {"train_loss": -6.814925670623779, "global_step": 142458, "epoch": 3391} {"train_loss": -6.872001647949219, "global_step": 142459, "epoch": 3391} {"train_loss": -6.787095069885254, "global_step": 142460, "epoch": 3391} {"train_loss": -6.686318397521973, "global_step": 142461, "epoch": 3391} {"train_loss": -6.728672027587891, "global_step": 142462, "epoch": 3391} {"train_loss": -6.746214321681431, "global_step": 142463, "epoch": 3391, "val_loss": 67639.5625} {"train_loss": -6.786803245544434, "global_step": 142464, "epoch": 3392} {"train_loss": -6.804207801818848, "global_step": 142465, "epoch": 3392} {"train_loss": -6.788494110107422, "global_step": 142466, "epoch": 3392} {"train_loss": -6.730055809020996, "global_step": 142467, "epoch": 3392} {"train_loss": -6.745879173278809, "global_step": 142468, "epoch": 3392} {"train_loss": -6.759476184844971, "global_step": 142469, "epoch": 3392} {"train_loss": -6.962261199951172, "global_step": 142470, "epoch": 3392} {"train_loss": -6.839654922485352, "global_step": 142471, "epoch": 3392} {"train_loss": -6.753257751464844, "global_step": 142472, "epoch": 3392} {"train_loss": -6.7619218826293945, "global_step": 142473, "epoch": 3392} {"train_loss": -6.868636608123779, "global_step": 142474, "epoch": 3392} {"train_loss": -6.890623092651367, "global_step": 142475, "epoch": 3392} {"train_loss": -6.899483680725098, "global_step": 142476, "epoch": 3392} {"train_loss": -6.801808834075928, "global_step": 142477, "epoch": 3392} {"train_loss": -6.795923233032227, "global_step": 142478, "epoch": 3392} {"train_loss": -6.948925495147705, "global_step": 142479, "epoch": 3392} {"train_loss": -6.855867385864258, "global_step": 142480, "epoch": 3392} {"train_loss": -6.785449028015137, "global_step": 142481, "epoch": 3392} {"train_loss": -6.873500823974609, "global_step": 142482, "epoch": 3392} {"train_loss": -6.807360649108887, "global_step": 142483, "epoch": 3392} {"train_loss": -6.826529502868652, "global_step": 142484, "epoch": 3392} {"train_loss": -6.78593635559082, "global_step": 142485, "epoch": 3392} {"train_loss": -6.867768287658691, "global_step": 142486, "epoch": 3392} {"train_loss": -6.79129695892334, "global_step": 142487, "epoch": 3392} {"train_loss": -6.862884521484375, "global_step": 142488, "epoch": 3392} {"train_loss": -6.863093852996826, "global_step": 142489, "epoch": 3392} {"train_loss": -6.821810722351074, "global_step": 142490, "epoch": 3392} {"train_loss": -6.872561454772949, "global_step": 142491, "epoch": 3392} {"train_loss": -6.794937610626221, "global_step": 142492, "epoch": 3392} {"train_loss": -6.975407600402832, "global_step": 142493, "epoch": 3392} {"train_loss": -6.807061195373535, "global_step": 142494, "epoch": 3392} {"train_loss": -6.768885612487793, "global_step": 142495, "epoch": 3392} {"train_loss": -6.769334316253662, "global_step": 142496, "epoch": 3392} {"train_loss": -6.73255729675293, "global_step": 142497, "epoch": 3392} {"train_loss": -6.792781829833984, "global_step": 142498, "epoch": 3392} {"train_loss": -6.822035789489746, "global_step": 142499, "epoch": 3392} {"train_loss": -6.802204608917236, "global_step": 142500, "epoch": 3392} {"train_loss": -6.767158508300781, "global_step": 142501, "epoch": 3392} {"train_loss": -6.719116687774658, "global_step": 142502, "epoch": 3392} {"train_loss": -6.632976531982422, "global_step": 142503, "epoch": 3392} {"train_loss": -6.682855606079102, "global_step": 142504, "epoch": 3392} {"train_loss": -6.804031315303984, "global_step": 142505, "epoch": 3392, "val_loss": 67595.515625} {"train_loss": -6.771222114562988, "global_step": 142506, "epoch": 3393} {"train_loss": -6.7706756591796875, "global_step": 142507, "epoch": 3393} {"train_loss": -6.7457427978515625, "global_step": 142508, "epoch": 3393} {"train_loss": -6.868514060974121, "global_step": 142509, "epoch": 3393} {"train_loss": -6.792798042297363, "global_step": 142510, "epoch": 3393} {"train_loss": -6.688193321228027, "global_step": 142511, "epoch": 3393} {"train_loss": -6.935067176818848, "global_step": 142512, "epoch": 3393} {"train_loss": -6.725091934204102, "global_step": 142513, "epoch": 3393} {"train_loss": -6.823907852172852, "global_step": 142514, "epoch": 3393} {"train_loss": -6.829709053039551, "global_step": 142515, "epoch": 3393} {"train_loss": -6.810083389282227, "global_step": 142516, "epoch": 3393} {"train_loss": -6.622313499450684, "global_step": 142517, "epoch": 3393} {"train_loss": -6.809133529663086, "global_step": 142518, "epoch": 3393} {"train_loss": -6.899393081665039, "global_step": 142519, "epoch": 3393} {"train_loss": -6.804300308227539, "global_step": 142520, "epoch": 3393} {"train_loss": -6.729813575744629, "global_step": 142521, "epoch": 3393} {"train_loss": -6.778793811798096, "global_step": 142522, "epoch": 3393} {"train_loss": -6.692576885223389, "global_step": 142523, "epoch": 3393} {"train_loss": -6.778038501739502, "global_step": 142524, "epoch": 3393} {"train_loss": -6.726000785827637, "global_step": 142525, "epoch": 3393} {"train_loss": -6.812098503112793, "global_step": 142526, "epoch": 3393} {"train_loss": -6.680349349975586, "global_step": 142527, "epoch": 3393} {"train_loss": -6.7411789894104, "global_step": 142528, "epoch": 3393} {"train_loss": -6.817073822021484, "global_step": 142529, "epoch": 3393} {"train_loss": -6.83339262008667, "global_step": 142530, "epoch": 3393} {"train_loss": -6.840051651000977, "global_step": 142531, "epoch": 3393} {"train_loss": -6.741374969482422, "global_step": 142532, "epoch": 3393} {"train_loss": -6.797253608703613, "global_step": 142533, "epoch": 3393} {"train_loss": -6.713374137878418, "global_step": 142534, "epoch": 3393} {"train_loss": -6.743022918701172, "global_step": 142535, "epoch": 3393} {"train_loss": -6.755886077880859, "global_step": 142536, "epoch": 3393} {"train_loss": -6.716302871704102, "global_step": 142537, "epoch": 3393} {"train_loss": -6.775604248046875, "global_step": 142538, "epoch": 3393} {"train_loss": -6.812506675720215, "global_step": 142539, "epoch": 3393} {"train_loss": -6.65305757522583, "global_step": 142540, "epoch": 3393} {"train_loss": -6.681279182434082, "global_step": 142541, "epoch": 3393} {"train_loss": -6.806160926818848, "global_step": 142542, "epoch": 3393} {"train_loss": -6.694797515869141, "global_step": 142543, "epoch": 3393} {"train_loss": -6.766976356506348, "global_step": 142544, "epoch": 3393} {"train_loss": -6.82722282409668, "global_step": 142545, "epoch": 3393} {"train_loss": -6.720269203186035, "global_step": 142546, "epoch": 3393} {"train_loss": -6.770068520591373, "global_step": 142547, "epoch": 3393, "val_loss": 67589.40625} {"train_loss": -6.832607269287109, "global_step": 142548, "epoch": 3394} {"train_loss": -6.660457611083984, "global_step": 142549, "epoch": 3394} {"train_loss": -6.760194778442383, "global_step": 142550, "epoch": 3394} {"train_loss": -6.779322624206543, "global_step": 142551, "epoch": 3394} {"train_loss": -6.754373073577881, "global_step": 142552, "epoch": 3394} {"train_loss": -6.737506866455078, "global_step": 142553, "epoch": 3394} {"train_loss": -6.715352535247803, "global_step": 142554, "epoch": 3394} {"train_loss": -6.817249298095703, "global_step": 142555, "epoch": 3394} {"train_loss": -6.792878150939941, "global_step": 142556, "epoch": 3394} {"train_loss": -6.753793716430664, "global_step": 142557, "epoch": 3394} {"train_loss": -6.810511112213135, "global_step": 142558, "epoch": 3394} {"train_loss": -6.8506951332092285, "global_step": 142559, "epoch": 3394} {"train_loss": -6.782927989959717, "global_step": 142560, "epoch": 3394} {"train_loss": -6.855432510375977, "global_step": 142561, "epoch": 3394} {"train_loss": -6.781023979187012, "global_step": 142562, "epoch": 3394} {"train_loss": -6.714667320251465, "global_step": 142563, "epoch": 3394} {"train_loss": -6.811707496643066, "global_step": 142564, "epoch": 3394} {"train_loss": -6.732232093811035, "global_step": 142565, "epoch": 3394} {"train_loss": -6.926168441772461, "global_step": 142566, "epoch": 3394} {"train_loss": -6.837831497192383, "global_step": 142567, "epoch": 3394} {"train_loss": -6.782805919647217, "global_step": 142568, "epoch": 3394} {"train_loss": -6.789206504821777, "global_step": 142569, "epoch": 3394} {"train_loss": -6.775355339050293, "global_step": 142570, "epoch": 3394} {"train_loss": -6.688738822937012, "global_step": 142571, "epoch": 3394} {"train_loss": -6.755664825439453, "global_step": 142572, "epoch": 3394} {"train_loss": -6.8616943359375, "global_step": 142573, "epoch": 3394} {"train_loss": -6.813457489013672, "global_step": 142574, "epoch": 3394} {"train_loss": -6.843470573425293, "global_step": 142575, "epoch": 3394} {"train_loss": -6.7893218994140625, "global_step": 142576, "epoch": 3394} {"train_loss": -6.691681385040283, "global_step": 142577, "epoch": 3394} {"train_loss": -6.748867034912109, "global_step": 142578, "epoch": 3394} {"train_loss": -6.886174201965332, "global_step": 142579, "epoch": 3394} {"train_loss": -6.599085330963135, "global_step": 142580, "epoch": 3394} {"train_loss": -6.737543106079102, "global_step": 142581, "epoch": 3394} {"train_loss": -6.801931381225586, "global_step": 142582, "epoch": 3394} {"train_loss": -6.670445919036865, "global_step": 142583, "epoch": 3394} {"train_loss": -6.552570343017578, "global_step": 142584, "epoch": 3394} {"train_loss": -6.668084621429443, "global_step": 142585, "epoch": 3394} {"train_loss": -6.553079605102539, "global_step": 142586, "epoch": 3394} {"train_loss": -6.541745662689209, "global_step": 142587, "epoch": 3394} {"train_loss": -6.793954849243164, "global_step": 142588, "epoch": 3394} {"train_loss": -6.755721217110043, "global_step": 142589, "epoch": 3394, "val_loss": 67878.4375} {"train_loss": -6.711333751678467, "global_step": 142590, "epoch": 3395} {"train_loss": -6.773435115814209, "global_step": 142591, "epoch": 3395} {"train_loss": -6.6377458572387695, "global_step": 142592, "epoch": 3395} {"train_loss": -6.746613502502441, "global_step": 142593, "epoch": 3395} {"train_loss": -6.702546119689941, "global_step": 142594, "epoch": 3395} {"train_loss": -6.718437194824219, "global_step": 142595, "epoch": 3395} {"train_loss": -6.7025299072265625, "global_step": 142596, "epoch": 3395} {"train_loss": -6.818183422088623, "global_step": 142597, "epoch": 3395} {"train_loss": -6.842313289642334, "global_step": 142598, "epoch": 3395} {"train_loss": -6.706566333770752, "global_step": 142599, "epoch": 3395} {"train_loss": -6.723908424377441, "global_step": 142600, "epoch": 3395} {"train_loss": -6.82525634765625, "global_step": 142601, "epoch": 3395} {"train_loss": -6.825189113616943, "global_step": 142602, "epoch": 3395} {"train_loss": -6.742204666137695, "global_step": 142603, "epoch": 3395} {"train_loss": -6.641652584075928, "global_step": 142604, "epoch": 3395} {"train_loss": -6.737726211547852, "global_step": 142605, "epoch": 3395} {"train_loss": -6.751391887664795, "global_step": 142606, "epoch": 3395} {"train_loss": -6.728167533874512, "global_step": 142607, "epoch": 3395} {"train_loss": -6.824140548706055, "global_step": 142608, "epoch": 3395} {"train_loss": -6.742531776428223, "global_step": 142609, "epoch": 3395} {"train_loss": -6.757867813110352, "global_step": 142610, "epoch": 3395} {"train_loss": -6.835210800170898, "global_step": 142611, "epoch": 3395} {"train_loss": -6.722262382507324, "global_step": 142612, "epoch": 3395} {"train_loss": -6.715968132019043, "global_step": 142613, "epoch": 3395} {"train_loss": -6.827541351318359, "global_step": 142614, "epoch": 3395} {"train_loss": -6.794468879699707, "global_step": 142615, "epoch": 3395} {"train_loss": -6.756963729858398, "global_step": 142616, "epoch": 3395} {"train_loss": -6.81410026550293, "global_step": 142617, "epoch": 3395} {"train_loss": -6.799172401428223, "global_step": 142618, "epoch": 3395} {"train_loss": -6.8916497230529785, "global_step": 142619, "epoch": 3395} {"train_loss": -6.701046943664551, "global_step": 142620, "epoch": 3395} {"train_loss": -6.8951416015625, "global_step": 142621, "epoch": 3395} {"train_loss": -6.675314903259277, "global_step": 142622, "epoch": 3395} {"train_loss": -6.738059997558594, "global_step": 142623, "epoch": 3395} {"train_loss": -6.799127101898193, "global_step": 142624, "epoch": 3395} {"train_loss": -6.8686628341674805, "global_step": 142625, "epoch": 3395} {"train_loss": -6.963709354400635, "global_step": 142626, "epoch": 3395} {"train_loss": -6.890751838684082, "global_step": 142627, "epoch": 3395} {"train_loss": -6.830474853515625, "global_step": 142628, "epoch": 3395} {"train_loss": -6.817890644073486, "global_step": 142629, "epoch": 3395} {"train_loss": -6.815374374389648, "global_step": 142630, "epoch": 3395} {"train_loss": -6.777580772127424, "global_step": 142631, "epoch": 3395, "val_loss": 67387.7890625} {"train_loss": -6.940255641937256, "global_step": 142632, "epoch": 3396} {"train_loss": -6.98954963684082, "global_step": 142633, "epoch": 3396} {"train_loss": -6.763689994812012, "global_step": 142634, "epoch": 3396} {"train_loss": -6.71648645401001, "global_step": 142635, "epoch": 3396} {"train_loss": -6.8949785232543945, "global_step": 142636, "epoch": 3396} {"train_loss": -6.736947536468506, "global_step": 142637, "epoch": 3396} {"train_loss": -6.752992630004883, "global_step": 142638, "epoch": 3396} {"train_loss": -6.726970672607422, "global_step": 142639, "epoch": 3396} {"train_loss": -6.777811050415039, "global_step": 142640, "epoch": 3396} {"train_loss": -6.793057918548584, "global_step": 142641, "epoch": 3396} {"train_loss": -6.7996721267700195, "global_step": 142642, "epoch": 3396} {"train_loss": -6.922725677490234, "global_step": 142643, "epoch": 3396} {"train_loss": -6.751967430114746, "global_step": 142644, "epoch": 3396} {"train_loss": -6.767708778381348, "global_step": 142645, "epoch": 3396} {"train_loss": -6.729715347290039, "global_step": 142646, "epoch": 3396} {"train_loss": -6.747063636779785, "global_step": 142647, "epoch": 3396} {"train_loss": -6.7751569747924805, "global_step": 142648, "epoch": 3396} {"train_loss": -6.855866432189941, "global_step": 142649, "epoch": 3396} {"train_loss": -6.664342880249023, "global_step": 142650, "epoch": 3396} {"train_loss": -6.726508617401123, "global_step": 142651, "epoch": 3396} {"train_loss": -6.81380558013916, "global_step": 142652, "epoch": 3396} {"train_loss": -6.681321620941162, "global_step": 142653, "epoch": 3396} {"train_loss": -6.74318790435791, "global_step": 142654, "epoch": 3396} {"train_loss": -6.787581443786621, "global_step": 142655, "epoch": 3396} {"train_loss": -6.775620937347412, "global_step": 142656, "epoch": 3396} {"train_loss": -6.734175682067871, "global_step": 142657, "epoch": 3396} {"train_loss": -6.671473026275635, "global_step": 142658, "epoch": 3396} {"train_loss": -6.7216997146606445, "global_step": 142659, "epoch": 3396} {"train_loss": -6.658763885498047, "global_step": 142660, "epoch": 3396} {"train_loss": -6.800457954406738, "global_step": 142661, "epoch": 3396} {"train_loss": -6.535157680511475, "global_step": 142662, "epoch": 3396} {"train_loss": -6.647111892700195, "global_step": 142663, "epoch": 3396} {"train_loss": -6.87027645111084, "global_step": 142664, "epoch": 3396} {"train_loss": -6.660146713256836, "global_step": 142665, "epoch": 3396} {"train_loss": -6.797384262084961, "global_step": 142666, "epoch": 3396} {"train_loss": -6.710692882537842, "global_step": 142667, "epoch": 3396} {"train_loss": -6.654697418212891, "global_step": 142668, "epoch": 3396} {"train_loss": -6.692803382873535, "global_step": 142669, "epoch": 3396} {"train_loss": -6.731605529785156, "global_step": 142670, "epoch": 3396} {"train_loss": -6.723269462585449, "global_step": 142671, "epoch": 3396} {"train_loss": -6.832280158996582, "global_step": 142672, "epoch": 3396} {"train_loss": -6.75539003099714, "global_step": 142673, "epoch": 3396, "val_loss": 67401.8125} {"train_loss": -6.782380104064941, "global_step": 142674, "epoch": 3397} {"train_loss": -6.737030029296875, "global_step": 142675, "epoch": 3397} {"train_loss": -6.8087873458862305, "global_step": 142676, "epoch": 3397} {"train_loss": -6.794869422912598, "global_step": 142677, "epoch": 3397} {"train_loss": -6.631934642791748, "global_step": 142678, "epoch": 3397} {"train_loss": -6.748862266540527, "global_step": 142679, "epoch": 3397} {"train_loss": -6.8171281814575195, "global_step": 142680, "epoch": 3397} {"train_loss": -6.705245018005371, "global_step": 142681, "epoch": 3397} {"train_loss": -6.747143745422363, "global_step": 142682, "epoch": 3397} {"train_loss": -6.774862289428711, "global_step": 142683, "epoch": 3397} {"train_loss": -6.799914360046387, "global_step": 142684, "epoch": 3397} {"train_loss": -6.802430152893066, "global_step": 142685, "epoch": 3397} {"train_loss": -6.832275867462158, "global_step": 142686, "epoch": 3397} {"train_loss": -6.891646862030029, "global_step": 142687, "epoch": 3397} {"train_loss": -6.80523681640625, "global_step": 142688, "epoch": 3397} {"train_loss": -6.842348098754883, "global_step": 142689, "epoch": 3397} {"train_loss": -6.789004325866699, "global_step": 142690, "epoch": 3397} {"train_loss": -6.779500961303711, "global_step": 142691, "epoch": 3397} {"train_loss": -6.859807014465332, "global_step": 142692, "epoch": 3397} {"train_loss": -6.880965232849121, "global_step": 142693, "epoch": 3397} {"train_loss": -6.838390350341797, "global_step": 142694, "epoch": 3397} {"train_loss": -6.903808116912842, "global_step": 142695, "epoch": 3397} {"train_loss": -6.873043060302734, "global_step": 142696, "epoch": 3397} {"train_loss": -6.680466175079346, "global_step": 142697, "epoch": 3397} {"train_loss": -6.866645812988281, "global_step": 142698, "epoch": 3397} {"train_loss": -6.8546247482299805, "global_step": 142699, "epoch": 3397} {"train_loss": -6.949953079223633, "global_step": 142700, "epoch": 3397} {"train_loss": -6.771780967712402, "global_step": 142701, "epoch": 3397} {"train_loss": -6.671695709228516, "global_step": 142702, "epoch": 3397} {"train_loss": -6.866936683654785, "global_step": 142703, "epoch": 3397} {"train_loss": -6.923529624938965, "global_step": 142704, "epoch": 3397} {"train_loss": -6.887497901916504, "global_step": 142705, "epoch": 3397} {"train_loss": -6.913125038146973, "global_step": 142706, "epoch": 3397} {"train_loss": -6.8399128913879395, "global_step": 142707, "epoch": 3397} {"train_loss": -6.864057540893555, "global_step": 142708, "epoch": 3397} {"train_loss": -6.820737361907959, "global_step": 142709, "epoch": 3397} {"train_loss": -6.896080493927002, "global_step": 142710, "epoch": 3397} {"train_loss": -6.786805152893066, "global_step": 142711, "epoch": 3397} {"train_loss": -6.740468978881836, "global_step": 142712, "epoch": 3397} {"train_loss": -6.9220991134643555, "global_step": 142713, "epoch": 3397} {"train_loss": -6.8480329513549805, "global_step": 142714, "epoch": 3397} {"train_loss": -6.817771559669858, "global_step": 142715, "epoch": 3397, "val_loss": 67566.5703125} {"train_loss": -6.859926223754883, "global_step": 142716, "epoch": 3398} {"train_loss": -6.8648905754089355, "global_step": 142717, "epoch": 3398} {"train_loss": -6.830679893493652, "global_step": 142718, "epoch": 3398} {"train_loss": -6.912065029144287, "global_step": 142719, "epoch": 3398} {"train_loss": -6.8939313888549805, "global_step": 142720, "epoch": 3398} {"train_loss": -6.829937934875488, "global_step": 142721, "epoch": 3398} {"train_loss": -6.810065269470215, "global_step": 142722, "epoch": 3398} {"train_loss": -6.776803970336914, "global_step": 142723, "epoch": 3398} {"train_loss": -6.866535186767578, "global_step": 142724, "epoch": 3398} {"train_loss": -6.790729522705078, "global_step": 142725, "epoch": 3398} {"train_loss": -6.76168155670166, "global_step": 142726, "epoch": 3398} {"train_loss": -6.836062908172607, "global_step": 142727, "epoch": 3398} {"train_loss": -6.819697380065918, "global_step": 142728, "epoch": 3398} {"train_loss": -6.743310928344727, "global_step": 142729, "epoch": 3398} {"train_loss": -6.810217380523682, "global_step": 142730, "epoch": 3398} {"train_loss": -6.83668327331543, "global_step": 142731, "epoch": 3398} {"train_loss": -6.897166728973389, "global_step": 142732, "epoch": 3398} {"train_loss": -6.800084590911865, "global_step": 142733, "epoch": 3398} {"train_loss": -6.72047233581543, "global_step": 142734, "epoch": 3398} {"train_loss": -6.774098873138428, "global_step": 142735, "epoch": 3398} {"train_loss": -6.8022918701171875, "global_step": 142736, "epoch": 3398} {"train_loss": -6.843589782714844, "global_step": 142737, "epoch": 3398} {"train_loss": -6.793832778930664, "global_step": 142738, "epoch": 3398} {"train_loss": -6.778069496154785, "global_step": 142739, "epoch": 3398} {"train_loss": -6.864384651184082, "global_step": 142740, "epoch": 3398} {"train_loss": -6.802443027496338, "global_step": 142741, "epoch": 3398} {"train_loss": -6.814375877380371, "global_step": 142742, "epoch": 3398} {"train_loss": -6.817606449127197, "global_step": 142743, "epoch": 3398} {"train_loss": -6.9510602951049805, "global_step": 142744, "epoch": 3398} {"train_loss": -6.801107883453369, "global_step": 142745, "epoch": 3398} {"train_loss": -6.678780555725098, "global_step": 142746, "epoch": 3398} {"train_loss": -6.711026191711426, "global_step": 142747, "epoch": 3398} {"train_loss": -6.786377906799316, "global_step": 142748, "epoch": 3398} {"train_loss": -6.767920017242432, "global_step": 142749, "epoch": 3398} {"train_loss": -6.812638759613037, "global_step": 142750, "epoch": 3398} {"train_loss": -6.835268974304199, "global_step": 142751, "epoch": 3398} {"train_loss": -6.664585113525391, "global_step": 142752, "epoch": 3398} {"train_loss": -6.798633575439453, "global_step": 142753, "epoch": 3398} {"train_loss": -6.85836935043335, "global_step": 142754, "epoch": 3398} {"train_loss": -6.783487319946289, "global_step": 142755, "epoch": 3398} {"train_loss": -6.804247856140137, "global_step": 142756, "epoch": 3398} {"train_loss": -6.8090708028702505, "global_step": 142757, "epoch": 3398, "val_loss": 67714.7421875} {"train_loss": -6.733263969421387, "global_step": 142758, "epoch": 3399} {"train_loss": -6.773881435394287, "global_step": 142759, "epoch": 3399} {"train_loss": -6.790642738342285, "global_step": 142760, "epoch": 3399} {"train_loss": -6.692154407501221, "global_step": 142761, "epoch": 3399} {"train_loss": -6.733584403991699, "global_step": 142762, "epoch": 3399} {"train_loss": -6.857560157775879, "global_step": 142763, "epoch": 3399} {"train_loss": -6.743636131286621, "global_step": 142764, "epoch": 3399} {"train_loss": -6.791356086730957, "global_step": 142765, "epoch": 3399} {"train_loss": -6.824533939361572, "global_step": 142766, "epoch": 3399} {"train_loss": -6.677295684814453, "global_step": 142767, "epoch": 3399} {"train_loss": -6.77755880355835, "global_step": 142768, "epoch": 3399} {"train_loss": -6.833744525909424, "global_step": 142769, "epoch": 3399} {"train_loss": -6.700534820556641, "global_step": 142770, "epoch": 3399} {"train_loss": -6.753329277038574, "global_step": 142771, "epoch": 3399} {"train_loss": -6.844479560852051, "global_step": 142772, "epoch": 3399} {"train_loss": -6.815084457397461, "global_step": 142773, "epoch": 3399} {"train_loss": -6.6738996505737305, "global_step": 142774, "epoch": 3399} {"train_loss": -6.809935569763184, "global_step": 142775, "epoch": 3399} {"train_loss": -6.727632522583008, "global_step": 142776, "epoch": 3399} {"train_loss": -6.7408552169799805, "global_step": 142777, "epoch": 3399} {"train_loss": -6.818171501159668, "global_step": 142778, "epoch": 3399} {"train_loss": -6.80241584777832, "global_step": 142779, "epoch": 3399} {"train_loss": -6.831045627593994, "global_step": 142780, "epoch": 3399} {"train_loss": -6.741698265075684, "global_step": 142781, "epoch": 3399} {"train_loss": -6.771148204803467, "global_step": 142782, "epoch": 3399} {"train_loss": -6.6877336502075195, "global_step": 142783, "epoch": 3399} {"train_loss": -6.747567176818848, "global_step": 142784, "epoch": 3399} {"train_loss": -6.642547607421875, "global_step": 142785, "epoch": 3399} {"train_loss": -6.736391067504883, "global_step": 142786, "epoch": 3399} {"train_loss": -6.654538631439209, "global_step": 142787, "epoch": 3399} {"train_loss": -6.741106033325195, "global_step": 142788, "epoch": 3399} {"train_loss": -6.781844139099121, "global_step": 142789, "epoch": 3399} {"train_loss": -6.772068977355957, "global_step": 142790, "epoch": 3399} {"train_loss": -6.850749969482422, "global_step": 142791, "epoch": 3399} {"train_loss": -6.6916303634643555, "global_step": 142792, "epoch": 3399} {"train_loss": -6.649080753326416, "global_step": 142793, "epoch": 3399} {"train_loss": -6.755343437194824, "global_step": 142794, "epoch": 3399} {"train_loss": -6.742353916168213, "global_step": 142795, "epoch": 3399} {"train_loss": -6.813239097595215, "global_step": 142796, "epoch": 3399} {"train_loss": -6.788686752319336, "global_step": 142797, "epoch": 3399} {"train_loss": -6.824997901916504, "global_step": 142798, "epoch": 3399} {"train_loss": -6.760702326184227, "global_step": 142799, "epoch": 3399, "val_loss": 67358.1328125} {"train_loss": -6.76619815826416, "global_step": 142800, "epoch": 3400} {"train_loss": -6.636554718017578, "global_step": 142801, "epoch": 3400} {"train_loss": -6.78378963470459, "global_step": 142802, "epoch": 3400} {"train_loss": -6.848998069763184, "global_step": 142803, "epoch": 3400} {"train_loss": -6.749300956726074, "global_step": 142804, "epoch": 3400} {"train_loss": -6.827915191650391, "global_step": 142805, "epoch": 3400} {"train_loss": -6.784844398498535, "global_step": 142806, "epoch": 3400} {"train_loss": -6.791563987731934, "global_step": 142807, "epoch": 3400} {"train_loss": -6.734981536865234, "global_step": 142808, "epoch": 3400} {"train_loss": -6.899531364440918, "global_step": 142809, "epoch": 3400} {"train_loss": -6.660993576049805, "global_step": 142810, "epoch": 3400} {"train_loss": -6.84519100189209, "global_step": 142811, "epoch": 3400} {"train_loss": -6.808036804199219, "global_step": 142812, "epoch": 3400} {"train_loss": -6.770469665527344, "global_step": 142813, "epoch": 3400} {"train_loss": -6.775973320007324, "global_step": 142814, "epoch": 3400} {"train_loss": -6.778074264526367, "global_step": 142815, "epoch": 3400} {"train_loss": -6.782854080200195, "global_step": 142816, "epoch": 3400} {"train_loss": -6.831123352050781, "global_step": 142817, "epoch": 3400} {"train_loss": -6.717288494110107, "global_step": 142818, "epoch": 3400} {"train_loss": -6.813621520996094, "global_step": 142819, "epoch": 3400} {"train_loss": -6.864020824432373, "global_step": 142820, "epoch": 3400} {"train_loss": -6.753229141235352, "global_step": 142821, "epoch": 3400} {"train_loss": -6.812727928161621, "global_step": 142822, "epoch": 3400} {"train_loss": -6.915404319763184, "global_step": 142823, "epoch": 3400} {"train_loss": -6.825305461883545, "global_step": 142824, "epoch": 3400} {"train_loss": -6.70784854888916, "global_step": 142825, "epoch": 3400} {"train_loss": -6.7811598777771, "global_step": 142826, "epoch": 3400} {"train_loss": -6.8093414306640625, "global_step": 142827, "epoch": 3400} {"train_loss": -6.785647869110107, "global_step": 142828, "epoch": 3400} {"train_loss": -6.722789764404297, "global_step": 142829, "epoch": 3400} {"train_loss": -6.7899065017700195, "global_step": 142830, "epoch": 3400} {"train_loss": -6.916225433349609, "global_step": 142831, "epoch": 3400} {"train_loss": -6.90781307220459, "global_step": 142832, "epoch": 3400} {"train_loss": -6.7487921714782715, "global_step": 142833, "epoch": 3400} {"train_loss": -6.790280342102051, "global_step": 142834, "epoch": 3400} {"train_loss": -6.875558853149414, "global_step": 142835, "epoch": 3400} {"train_loss": -6.81148624420166, "global_step": 142836, "epoch": 3400} {"train_loss": -6.747653007507324, "global_step": 142837, "epoch": 3400} {"train_loss": -6.796297073364258, "global_step": 142838, "epoch": 3400} {"train_loss": -6.842995643615723, "global_step": 142839, "epoch": 3400} {"train_loss": -6.805712699890137, "global_step": 142840, "epoch": 3400} {"train_loss": -6.795521452313378, "global_step": 142841, "epoch": 3400, "train/sim_max_reward_0": 0.7766888856632813, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.5271925739568686, "train/sim_max_reward_3": 0.9749226150658895, "train/sim_max_reward_4": 0.9775347923931724, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.839136262230221, "test/sim_max_reward_4300002": 0.9226264257642023, "test/sim_max_reward_4300003": 0.9771939218466276, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8975135335555954, "test/sim_max_reward_4300006": 0.7300682771036687, "test/sim_max_reward_4300007": 0.3029384445354333, "test/sim_max_reward_4300008": 0.8682477766672482, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.9705089966720919, "test/sim_max_reward_4300011": 0.3064672643783003, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.4186601059508682, "test/sim_max_reward_4300014": 0.9396631019913313, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.9241977942146672, "test/sim_max_reward_4300017": 0.358691334726353, "test/sim_max_reward_4300018": 0.363438321178302, "test/sim_max_reward_4300019": 0.18629129169531047, "test/sim_max_reward_4300020": 0.8804252030174624, "test/sim_max_reward_4300021": 0.9775683661318728, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.5304201355613428, "test/sim_max_reward_4300024": 0.48968439631313604, "test/sim_max_reward_4300025": 0.9579324763885356, "test/sim_max_reward_4300026": 0.17744957625918958, "test/sim_max_reward_4300027": 0.9838263423135883, "test/sim_max_reward_4300028": 0.98359873864741, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.1344561018865356, "test/sim_max_reward_4300031": 0.4058750484817619, "test/sim_max_reward_4300032": 0.9474234131175447, "test/sim_max_reward_4300033": 0.9922209852737603, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.4537935695650684, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9903215139468257, "test/sim_max_reward_4300038": 0.9132632881482535, "test/sim_max_reward_4300039": 0.8794212350302718, "test/sim_max_reward_4300040": 0.8653208205322084, "test/sim_max_reward_4300041": 0.980903203929079, "test/sim_max_reward_4300042": 0.9528980269927888, "test/sim_max_reward_4300043": 0.14420100087349724, "test/sim_max_reward_4300044": 0.9097910971224833, "test/sim_max_reward_4300045": 0.1977940804244879, "test/sim_max_reward_4300046": 0.0, "test/sim_max_reward_4300047": 0.18499337681543945, "test/sim_max_reward_4300048": 0.00446542987220213, "test/sim_max_reward_4300049": 0.9808021903620666, "train/mean_score": 0.7415539377402333, "test/mean_score": 0.622790413797796, "val_loss": 67523.515625} {"train_loss": -6.8120341300964355, "global_step": 142842, "epoch": 3401} {"train_loss": -6.773616790771484, "global_step": 142843, "epoch": 3401} {"train_loss": -6.899458885192871, "global_step": 142844, "epoch": 3401} {"train_loss": -6.729537010192871, "global_step": 142845, "epoch": 3401} {"train_loss": -6.695655345916748, "global_step": 142846, "epoch": 3401} {"train_loss": -6.820535182952881, "global_step": 142847, "epoch": 3401} {"train_loss": -6.86635684967041, "global_step": 142848, "epoch": 3401} {"train_loss": -6.758110046386719, "global_step": 142849, "epoch": 3401} {"train_loss": -6.75081729888916, "global_step": 142850, "epoch": 3401} {"train_loss": -6.777409553527832, "global_step": 142851, "epoch": 3401} {"train_loss": -6.742513656616211, "global_step": 142852, "epoch": 3401} {"train_loss": -6.900829792022705, "global_step": 142853, "epoch": 3401} {"train_loss": -6.865874290466309, "global_step": 142854, "epoch": 3401} {"train_loss": -6.758112907409668, "global_step": 142855, "epoch": 3401} {"train_loss": -6.944063186645508, "global_step": 142856, "epoch": 3401} {"train_loss": -6.890448570251465, "global_step": 142857, "epoch": 3401} {"train_loss": -6.750023365020752, "global_step": 142858, "epoch": 3401} {"train_loss": -6.966599464416504, "global_step": 142859, "epoch": 3401} {"train_loss": -6.79554557800293, "global_step": 142860, "epoch": 3401} {"train_loss": -6.677370071411133, "global_step": 142861, "epoch": 3401} {"train_loss": -6.831507682800293, "global_step": 142862, "epoch": 3401} {"train_loss": -6.769941329956055, "global_step": 142863, "epoch": 3401} {"train_loss": -6.782652854919434, "global_step": 142864, "epoch": 3401} {"train_loss": -6.698699951171875, "global_step": 142865, "epoch": 3401} {"train_loss": -6.89932107925415, "global_step": 142866, "epoch": 3401} {"train_loss": -6.818610668182373, "global_step": 142867, "epoch": 3401} {"train_loss": -6.84503173828125, "global_step": 142868, "epoch": 3401} {"train_loss": -6.886264324188232, "global_step": 142869, "epoch": 3401} {"train_loss": -6.777796745300293, "global_step": 142870, "epoch": 3401} {"train_loss": -6.856448650360107, "global_step": 142871, "epoch": 3401} {"train_loss": -6.797094821929932, "global_step": 142872, "epoch": 3401} {"train_loss": -6.686975479125977, "global_step": 142873, "epoch": 3401} {"train_loss": -6.714664459228516, "global_step": 142874, "epoch": 3401} {"train_loss": -6.963726043701172, "global_step": 142875, "epoch": 3401} {"train_loss": -6.862823486328125, "global_step": 142876, "epoch": 3401} {"train_loss": -6.844995498657227, "global_step": 142877, "epoch": 3401} {"train_loss": -6.828570365905762, "global_step": 142878, "epoch": 3401} {"train_loss": -6.81392765045166, "global_step": 142879, "epoch": 3401} {"train_loss": -6.855865478515625, "global_step": 142880, "epoch": 3401} {"train_loss": -6.780326843261719, "global_step": 142881, "epoch": 3401} {"train_loss": -6.885807037353516, "global_step": 142882, "epoch": 3401} {"train_loss": -6.814060256594703, "global_step": 142883, "epoch": 3401, "val_loss": 67561.7265625} {"train_loss": -6.8880767822265625, "global_step": 142884, "epoch": 3402} {"train_loss": -6.801083564758301, "global_step": 142885, "epoch": 3402} {"train_loss": -6.7616658210754395, "global_step": 142886, "epoch": 3402} {"train_loss": -6.876112937927246, "global_step": 142887, "epoch": 3402} {"train_loss": -6.735740661621094, "global_step": 142888, "epoch": 3402} {"train_loss": -6.7962236404418945, "global_step": 142889, "epoch": 3402} {"train_loss": -6.923698425292969, "global_step": 142890, "epoch": 3402} {"train_loss": -6.7491984367370605, "global_step": 142891, "epoch": 3402} {"train_loss": -6.83629846572876, "global_step": 142892, "epoch": 3402} {"train_loss": -6.859454154968262, "global_step": 142893, "epoch": 3402} {"train_loss": -6.828845500946045, "global_step": 142894, "epoch": 3402} {"train_loss": -6.764347076416016, "global_step": 142895, "epoch": 3402} {"train_loss": -6.862430095672607, "global_step": 142896, "epoch": 3402} {"train_loss": -6.760047435760498, "global_step": 142897, "epoch": 3402} {"train_loss": -6.787932395935059, "global_step": 142898, "epoch": 3402} {"train_loss": -6.792296409606934, "global_step": 142899, "epoch": 3402} {"train_loss": -6.841873645782471, "global_step": 142900, "epoch": 3402} {"train_loss": -6.818354606628418, "global_step": 142901, "epoch": 3402} {"train_loss": -6.725510120391846, "global_step": 142902, "epoch": 3402} {"train_loss": -6.9029645919799805, "global_step": 142903, "epoch": 3402} {"train_loss": -6.711291313171387, "global_step": 142904, "epoch": 3402} {"train_loss": -6.788186073303223, "global_step": 142905, "epoch": 3402} {"train_loss": -6.840197563171387, "global_step": 142906, "epoch": 3402} {"train_loss": -6.851670265197754, "global_step": 142907, "epoch": 3402} {"train_loss": -6.667963027954102, "global_step": 142908, "epoch": 3402} {"train_loss": -6.716377258300781, "global_step": 142909, "epoch": 3402} {"train_loss": -6.709352493286133, "global_step": 142910, "epoch": 3402} {"train_loss": -6.772526741027832, "global_step": 142911, "epoch": 3402} {"train_loss": -6.804407596588135, "global_step": 142912, "epoch": 3402} {"train_loss": -6.7545647621154785, "global_step": 142913, "epoch": 3402} {"train_loss": -6.798698425292969, "global_step": 142914, "epoch": 3402} {"train_loss": -6.842743873596191, "global_step": 142915, "epoch": 3402} {"train_loss": -6.771633148193359, "global_step": 142916, "epoch": 3402} {"train_loss": -6.6882171630859375, "global_step": 142917, "epoch": 3402} {"train_loss": -6.866650581359863, "global_step": 142918, "epoch": 3402} {"train_loss": -6.886173248291016, "global_step": 142919, "epoch": 3402} {"train_loss": -6.723535537719727, "global_step": 142920, "epoch": 3402} {"train_loss": -6.8498382568359375, "global_step": 142921, "epoch": 3402} {"train_loss": -6.888078689575195, "global_step": 142922, "epoch": 3402} {"train_loss": -6.852982521057129, "global_step": 142923, "epoch": 3402} {"train_loss": -6.827774524688721, "global_step": 142924, "epoch": 3402} {"train_loss": -6.80375709987822, "global_step": 142925, "epoch": 3402, "val_loss": 67428.15625} {"train_loss": -6.857151031494141, "global_step": 142926, "epoch": 3403} {"train_loss": -6.744165420532227, "global_step": 142927, "epoch": 3403} {"train_loss": -6.907670021057129, "global_step": 142928, "epoch": 3403} {"train_loss": -6.864228248596191, "global_step": 142929, "epoch": 3403} {"train_loss": -6.902303695678711, "global_step": 142930, "epoch": 3403} {"train_loss": -6.787594795227051, "global_step": 142931, "epoch": 3403} {"train_loss": -6.763504505157471, "global_step": 142932, "epoch": 3403} {"train_loss": -6.8029913902282715, "global_step": 142933, "epoch": 3403} {"train_loss": -6.851217269897461, "global_step": 142934, "epoch": 3403} {"train_loss": -6.841441631317139, "global_step": 142935, "epoch": 3403} {"train_loss": -6.666062831878662, "global_step": 142936, "epoch": 3403} {"train_loss": -6.767687797546387, "global_step": 142937, "epoch": 3403} {"train_loss": -6.825644016265869, "global_step": 142938, "epoch": 3403} {"train_loss": -6.805784225463867, "global_step": 142939, "epoch": 3403} {"train_loss": -6.770911693572998, "global_step": 142940, "epoch": 3403} {"train_loss": -6.726109504699707, "global_step": 142941, "epoch": 3403} {"train_loss": -6.8350443840026855, "global_step": 142942, "epoch": 3403} {"train_loss": -6.567601680755615, "global_step": 142943, "epoch": 3403} {"train_loss": -6.794686317443848, "global_step": 142944, "epoch": 3403} {"train_loss": -6.746476650238037, "global_step": 142945, "epoch": 3403} {"train_loss": -6.7956647872924805, "global_step": 142946, "epoch": 3403} {"train_loss": -6.702455520629883, "global_step": 142947, "epoch": 3403} {"train_loss": -6.65461540222168, "global_step": 142948, "epoch": 3403} {"train_loss": -6.818880081176758, "global_step": 142949, "epoch": 3403} {"train_loss": -6.602619171142578, "global_step": 142950, "epoch": 3403} {"train_loss": -6.782180309295654, "global_step": 142951, "epoch": 3403} {"train_loss": -6.661108016967773, "global_step": 142952, "epoch": 3403} {"train_loss": -6.773495674133301, "global_step": 142953, "epoch": 3403} {"train_loss": -6.769041538238525, "global_step": 142954, "epoch": 3403} {"train_loss": -6.718955993652344, "global_step": 142955, "epoch": 3403} {"train_loss": -6.758423328399658, "global_step": 142956, "epoch": 3403} {"train_loss": -6.8129167556762695, "global_step": 142957, "epoch": 3403} {"train_loss": -6.666267395019531, "global_step": 142958, "epoch": 3403} {"train_loss": -6.805739879608154, "global_step": 142959, "epoch": 3403} {"train_loss": -6.859355926513672, "global_step": 142960, "epoch": 3403} {"train_loss": -6.7255706787109375, "global_step": 142961, "epoch": 3403} {"train_loss": -6.739435195922852, "global_step": 142962, "epoch": 3403} {"train_loss": -6.847950458526611, "global_step": 142963, "epoch": 3403} {"train_loss": -6.738587379455566, "global_step": 142964, "epoch": 3403} {"train_loss": -6.79123592376709, "global_step": 142965, "epoch": 3403} {"train_loss": -6.800682067871094, "global_step": 142966, "epoch": 3403} {"train_loss": -6.76921474365961, "global_step": 142967, "epoch": 3403, "val_loss": 67722.21875} {"train_loss": -6.686515808105469, "global_step": 142968, "epoch": 3404} {"train_loss": -6.827232360839844, "global_step": 142969, "epoch": 3404} {"train_loss": -6.683409214019775, "global_step": 142970, "epoch": 3404} {"train_loss": -6.718395709991455, "global_step": 142971, "epoch": 3404} {"train_loss": -6.695633888244629, "global_step": 142972, "epoch": 3404} {"train_loss": -6.732994556427002, "global_step": 142973, "epoch": 3404} {"train_loss": -6.705113410949707, "global_step": 142974, "epoch": 3404} {"train_loss": -6.854626655578613, "global_step": 142975, "epoch": 3404} {"train_loss": -6.6614603996276855, "global_step": 142976, "epoch": 3404} {"train_loss": -6.77976131439209, "global_step": 142977, "epoch": 3404} {"train_loss": -6.841329574584961, "global_step": 142978, "epoch": 3404} {"train_loss": -6.8379316329956055, "global_step": 142979, "epoch": 3404} {"train_loss": -6.854884147644043, "global_step": 142980, "epoch": 3404} {"train_loss": -6.863783836364746, "global_step": 142981, "epoch": 3404} {"train_loss": -6.91139030456543, "global_step": 142982, "epoch": 3404} {"train_loss": -6.89109468460083, "global_step": 142983, "epoch": 3404} {"train_loss": -6.870633602142334, "global_step": 142984, "epoch": 3404} {"train_loss": -6.844998836517334, "global_step": 142985, "epoch": 3404} {"train_loss": -6.731300354003906, "global_step": 142986, "epoch": 3404} {"train_loss": -6.8819050788879395, "global_step": 142987, "epoch": 3404} {"train_loss": -6.932101249694824, "global_step": 142988, "epoch": 3404} {"train_loss": -6.703217506408691, "global_step": 142989, "epoch": 3404} {"train_loss": -6.8224101066589355, "global_step": 142990, "epoch": 3404} {"train_loss": -6.861683368682861, "global_step": 142991, "epoch": 3404} {"train_loss": -6.702750205993652, "global_step": 142992, "epoch": 3404} {"train_loss": -6.904295921325684, "global_step": 142993, "epoch": 3404} {"train_loss": -6.9801225662231445, "global_step": 142994, "epoch": 3404} {"train_loss": -6.821558952331543, "global_step": 142995, "epoch": 3404} {"train_loss": -6.860527038574219, "global_step": 142996, "epoch": 3404} {"train_loss": -6.792818069458008, "global_step": 142997, "epoch": 3404} {"train_loss": -6.862962245941162, "global_step": 142998, "epoch": 3404} {"train_loss": -6.81584358215332, "global_step": 142999, "epoch": 3404} {"train_loss": -6.6830244064331055, "global_step": 143000, "epoch": 3404} {"train_loss": -6.7423858642578125, "global_step": 143001, "epoch": 3404} {"train_loss": -6.7669572830200195, "global_step": 143002, "epoch": 3404} {"train_loss": -6.765763282775879, "global_step": 143003, "epoch": 3404} {"train_loss": -6.740452766418457, "global_step": 143004, "epoch": 3404} {"train_loss": -6.788388729095459, "global_step": 143005, "epoch": 3404} {"train_loss": -6.887636661529541, "global_step": 143006, "epoch": 3404} {"train_loss": -6.8362274169921875, "global_step": 143007, "epoch": 3404} {"train_loss": -6.814457893371582, "global_step": 143008, "epoch": 3404} {"train_loss": -6.80008830342974, "global_step": 143009, "epoch": 3404, "val_loss": 67479.1015625} {"train_loss": -6.919661045074463, "global_step": 143010, "epoch": 3405} {"train_loss": -6.813385963439941, "global_step": 143011, "epoch": 3405} {"train_loss": -6.823734760284424, "global_step": 143012, "epoch": 3405} {"train_loss": -6.828317642211914, "global_step": 143013, "epoch": 3405} {"train_loss": -6.665074348449707, "global_step": 143014, "epoch": 3405} {"train_loss": -6.771921157836914, "global_step": 143015, "epoch": 3405} {"train_loss": -6.699258804321289, "global_step": 143016, "epoch": 3405} {"train_loss": -6.753696441650391, "global_step": 143017, "epoch": 3405} {"train_loss": -6.72794771194458, "global_step": 143018, "epoch": 3405} {"train_loss": -6.678264617919922, "global_step": 143019, "epoch": 3405} {"train_loss": -6.758141994476318, "global_step": 143020, "epoch": 3405} {"train_loss": -6.76192569732666, "global_step": 143021, "epoch": 3405} {"train_loss": -6.755002975463867, "global_step": 143022, "epoch": 3405} {"train_loss": -6.767173767089844, "global_step": 143023, "epoch": 3405} {"train_loss": -6.6966047286987305, "global_step": 143024, "epoch": 3405} {"train_loss": -6.851813793182373, "global_step": 143025, "epoch": 3405} {"train_loss": -6.634025573730469, "global_step": 143026, "epoch": 3405} {"train_loss": -6.841750144958496, "global_step": 143027, "epoch": 3405} {"train_loss": -6.862518787384033, "global_step": 143028, "epoch": 3405} {"train_loss": -6.727357864379883, "global_step": 143029, "epoch": 3405} {"train_loss": -6.767394065856934, "global_step": 143030, "epoch": 3405} {"train_loss": -6.871918201446533, "global_step": 143031, "epoch": 3405} {"train_loss": -6.761923789978027, "global_step": 143032, "epoch": 3405} {"train_loss": -6.724069118499756, "global_step": 143033, "epoch": 3405} {"train_loss": -6.778662204742432, "global_step": 143034, "epoch": 3405} {"train_loss": -6.66713809967041, "global_step": 143035, "epoch": 3405} {"train_loss": -6.765138626098633, "global_step": 143036, "epoch": 3405} {"train_loss": -6.683897972106934, "global_step": 143037, "epoch": 3405} {"train_loss": -6.69549036026001, "global_step": 143038, "epoch": 3405} {"train_loss": -6.770589351654053, "global_step": 143039, "epoch": 3405} {"train_loss": -6.711309432983398, "global_step": 143040, "epoch": 3405} {"train_loss": -6.785243034362793, "global_step": 143041, "epoch": 3405} {"train_loss": -6.706884860992432, "global_step": 143042, "epoch": 3405} {"train_loss": -6.721832275390625, "global_step": 143043, "epoch": 3405} {"train_loss": -6.710040092468262, "global_step": 143044, "epoch": 3405} {"train_loss": -6.646323204040527, "global_step": 143045, "epoch": 3405} {"train_loss": -6.803743362426758, "global_step": 143046, "epoch": 3405} {"train_loss": -6.734590530395508, "global_step": 143047, "epoch": 3405} {"train_loss": -6.787600994110107, "global_step": 143048, "epoch": 3405} {"train_loss": -6.84173583984375, "global_step": 143049, "epoch": 3405} {"train_loss": -6.7115678787231445, "global_step": 143050, "epoch": 3405} {"train_loss": -6.756828115099952, "global_step": 143051, "epoch": 3405, "val_loss": 67405.2109375} {"train_loss": -6.843428134918213, "global_step": 143052, "epoch": 3406} {"train_loss": -6.786733150482178, "global_step": 143053, "epoch": 3406} {"train_loss": -6.671372890472412, "global_step": 143054, "epoch": 3406} {"train_loss": -6.770663261413574, "global_step": 143055, "epoch": 3406} {"train_loss": -6.700885772705078, "global_step": 143056, "epoch": 3406} {"train_loss": -6.682007789611816, "global_step": 143057, "epoch": 3406} {"train_loss": -6.7136969566345215, "global_step": 143058, "epoch": 3406} {"train_loss": -6.763941764831543, "global_step": 143059, "epoch": 3406} {"train_loss": -6.782355308532715, "global_step": 143060, "epoch": 3406} {"train_loss": -6.888695240020752, "global_step": 143061, "epoch": 3406} {"train_loss": -6.771458148956299, "global_step": 143062, "epoch": 3406} {"train_loss": -6.925911903381348, "global_step": 143063, "epoch": 3406} {"train_loss": -6.754980087280273, "global_step": 143064, "epoch": 3406} {"train_loss": -6.738584518432617, "global_step": 143065, "epoch": 3406} {"train_loss": -6.7201738357543945, "global_step": 143066, "epoch": 3406} {"train_loss": -6.807747840881348, "global_step": 143067, "epoch": 3406} {"train_loss": -6.7638654708862305, "global_step": 143068, "epoch": 3406} {"train_loss": -6.853189468383789, "global_step": 143069, "epoch": 3406} {"train_loss": -6.829809188842773, "global_step": 143070, "epoch": 3406} {"train_loss": -6.790902614593506, "global_step": 143071, "epoch": 3406} {"train_loss": -6.634554862976074, "global_step": 143072, "epoch": 3406} {"train_loss": -6.816539764404297, "global_step": 143073, "epoch": 3406} {"train_loss": -6.773998260498047, "global_step": 143074, "epoch": 3406} {"train_loss": -6.6538543701171875, "global_step": 143075, "epoch": 3406} {"train_loss": -6.897001266479492, "global_step": 143076, "epoch": 3406} {"train_loss": -6.787252426147461, "global_step": 143077, "epoch": 3406} {"train_loss": -6.804062843322754, "global_step": 143078, "epoch": 3406} {"train_loss": -6.875504970550537, "global_step": 143079, "epoch": 3406} {"train_loss": -6.785572052001953, "global_step": 143080, "epoch": 3406} {"train_loss": -6.946780204772949, "global_step": 143081, "epoch": 3406} {"train_loss": -6.727780818939209, "global_step": 143082, "epoch": 3406} {"train_loss": -6.837765693664551, "global_step": 143083, "epoch": 3406} {"train_loss": -6.8345794677734375, "global_step": 143084, "epoch": 3406} {"train_loss": -6.842196464538574, "global_step": 143085, "epoch": 3406} {"train_loss": -6.893122673034668, "global_step": 143086, "epoch": 3406} {"train_loss": -6.796889781951904, "global_step": 143087, "epoch": 3406} {"train_loss": -6.804230213165283, "global_step": 143088, "epoch": 3406} {"train_loss": -6.872926712036133, "global_step": 143089, "epoch": 3406} {"train_loss": -6.859560012817383, "global_step": 143090, "epoch": 3406} {"train_loss": -6.925775051116943, "global_step": 143091, "epoch": 3406} {"train_loss": -6.737706661224365, "global_step": 143092, "epoch": 3406} {"train_loss": -6.79849902788798, "global_step": 143093, "epoch": 3406, "val_loss": 67491.921875} {"train_loss": -6.742084503173828, "global_step": 143094, "epoch": 3407} {"train_loss": -6.886675834655762, "global_step": 143095, "epoch": 3407} {"train_loss": -6.81326961517334, "global_step": 143096, "epoch": 3407} {"train_loss": -6.871004104614258, "global_step": 143097, "epoch": 3407} {"train_loss": -6.932661533355713, "global_step": 143098, "epoch": 3407} {"train_loss": -6.814699172973633, "global_step": 143099, "epoch": 3407} {"train_loss": -6.863895893096924, "global_step": 143100, "epoch": 3407} {"train_loss": -6.817141532897949, "global_step": 143101, "epoch": 3407} {"train_loss": -6.830628395080566, "global_step": 143102, "epoch": 3407} {"train_loss": -6.8240647315979, "global_step": 143103, "epoch": 3407} {"train_loss": -6.874713897705078, "global_step": 143104, "epoch": 3407} {"train_loss": -6.808778762817383, "global_step": 143105, "epoch": 3407} {"train_loss": -6.90089225769043, "global_step": 143106, "epoch": 3407} {"train_loss": -6.8082475662231445, "global_step": 143107, "epoch": 3407} {"train_loss": -6.7988080978393555, "global_step": 143108, "epoch": 3407} {"train_loss": -6.774290561676025, "global_step": 143109, "epoch": 3407} {"train_loss": -6.847657203674316, "global_step": 143110, "epoch": 3407} {"train_loss": -6.822023391723633, "global_step": 143111, "epoch": 3407} {"train_loss": -6.953022480010986, "global_step": 143112, "epoch": 3407} {"train_loss": -6.801344394683838, "global_step": 143113, "epoch": 3407} {"train_loss": -6.763300895690918, "global_step": 143114, "epoch": 3407} {"train_loss": -6.8041768074035645, "global_step": 143115, "epoch": 3407} {"train_loss": -6.761852264404297, "global_step": 143116, "epoch": 3407} {"train_loss": -6.706027984619141, "global_step": 143117, "epoch": 3407} {"train_loss": -6.774836540222168, "global_step": 143118, "epoch": 3407} {"train_loss": -6.76259183883667, "global_step": 143119, "epoch": 3407} {"train_loss": -6.702288627624512, "global_step": 143120, "epoch": 3407} {"train_loss": -6.747107982635498, "global_step": 143121, "epoch": 3407} {"train_loss": -6.7829742431640625, "global_step": 143122, "epoch": 3407} {"train_loss": -6.556794166564941, "global_step": 143123, "epoch": 3407} {"train_loss": -6.765194892883301, "global_step": 143124, "epoch": 3407} {"train_loss": -6.83464241027832, "global_step": 143125, "epoch": 3407} {"train_loss": -6.6929030418396, "global_step": 143126, "epoch": 3407} {"train_loss": -6.770918369293213, "global_step": 143127, "epoch": 3407} {"train_loss": -6.676322937011719, "global_step": 143128, "epoch": 3407} {"train_loss": -6.7660722732543945, "global_step": 143129, "epoch": 3407} {"train_loss": -6.796961307525635, "global_step": 143130, "epoch": 3407} {"train_loss": -6.8388824462890625, "global_step": 143131, "epoch": 3407} {"train_loss": -6.76832914352417, "global_step": 143132, "epoch": 3407} {"train_loss": -6.717674255371094, "global_step": 143133, "epoch": 3407} {"train_loss": -6.647874355316162, "global_step": 143134, "epoch": 3407} {"train_loss": -6.790206420989263, "global_step": 143135, "epoch": 3407, "val_loss": 67654.1640625} {"train_loss": -6.77739143371582, "global_step": 143136, "epoch": 3408} {"train_loss": -6.782031059265137, "global_step": 143137, "epoch": 3408} {"train_loss": -6.805600166320801, "global_step": 143138, "epoch": 3408} {"train_loss": -6.774924278259277, "global_step": 143139, "epoch": 3408} {"train_loss": -6.789156913757324, "global_step": 143140, "epoch": 3408} {"train_loss": -6.663402557373047, "global_step": 143141, "epoch": 3408} {"train_loss": -6.910264015197754, "global_step": 143142, "epoch": 3408} {"train_loss": -6.860465049743652, "global_step": 143143, "epoch": 3408} {"train_loss": -6.733250141143799, "global_step": 143144, "epoch": 3408} {"train_loss": -6.677206516265869, "global_step": 143145, "epoch": 3408} {"train_loss": -6.781833648681641, "global_step": 143146, "epoch": 3408} {"train_loss": -6.708032608032227, "global_step": 143147, "epoch": 3408} {"train_loss": -6.82627534866333, "global_step": 143148, "epoch": 3408} {"train_loss": -6.70426082611084, "global_step": 143149, "epoch": 3408} {"train_loss": -6.8022847175598145, "global_step": 143150, "epoch": 3408} {"train_loss": -6.756200790405273, "global_step": 143151, "epoch": 3408} {"train_loss": -6.7775373458862305, "global_step": 143152, "epoch": 3408} {"train_loss": -6.764383316040039, "global_step": 143153, "epoch": 3408} {"train_loss": -6.8816609382629395, "global_step": 143154, "epoch": 3408} {"train_loss": -6.749938488006592, "global_step": 143155, "epoch": 3408} {"train_loss": -6.764581680297852, "global_step": 143156, "epoch": 3408} {"train_loss": -6.71425199508667, "global_step": 143157, "epoch": 3408} {"train_loss": -6.671501159667969, "global_step": 143158, "epoch": 3408} {"train_loss": -6.693899154663086, "global_step": 143159, "epoch": 3408} {"train_loss": -6.892290115356445, "global_step": 143160, "epoch": 3408} {"train_loss": -6.715021133422852, "global_step": 143161, "epoch": 3408} {"train_loss": -6.619505882263184, "global_step": 143162, "epoch": 3408} {"train_loss": -6.691536903381348, "global_step": 143163, "epoch": 3408} {"train_loss": -6.718547821044922, "global_step": 143164, "epoch": 3408} {"train_loss": -6.609550476074219, "global_step": 143165, "epoch": 3408} {"train_loss": -6.815739154815674, "global_step": 143166, "epoch": 3408} {"train_loss": -6.5406904220581055, "global_step": 143167, "epoch": 3408} {"train_loss": -6.760085105895996, "global_step": 143168, "epoch": 3408} {"train_loss": -6.713934421539307, "global_step": 143169, "epoch": 3408} {"train_loss": -6.743240833282471, "global_step": 143170, "epoch": 3408} {"train_loss": -6.748117446899414, "global_step": 143171, "epoch": 3408} {"train_loss": -6.7490339279174805, "global_step": 143172, "epoch": 3408} {"train_loss": -6.726104259490967, "global_step": 143173, "epoch": 3408} {"train_loss": -6.688594818115234, "global_step": 143174, "epoch": 3408} {"train_loss": -6.791399002075195, "global_step": 143175, "epoch": 3408} {"train_loss": -6.591324806213379, "global_step": 143176, "epoch": 3408} {"train_loss": -6.745412451880319, "global_step": 143177, "epoch": 3408, "val_loss": 67682.90625} {"train_loss": -6.760339736938477, "global_step": 143178, "epoch": 3409} {"train_loss": -6.729477882385254, "global_step": 143179, "epoch": 3409} {"train_loss": -6.729578018188477, "global_step": 143180, "epoch": 3409} {"train_loss": -6.814511299133301, "global_step": 143181, "epoch": 3409} {"train_loss": -6.779007911682129, "global_step": 143182, "epoch": 3409} {"train_loss": -6.817342758178711, "global_step": 143183, "epoch": 3409} {"train_loss": -6.756995677947998, "global_step": 143184, "epoch": 3409} {"train_loss": -6.759625434875488, "global_step": 143185, "epoch": 3409} {"train_loss": -6.804888725280762, "global_step": 143186, "epoch": 3409} {"train_loss": -6.750141143798828, "global_step": 143187, "epoch": 3409} {"train_loss": -6.722736835479736, "global_step": 143188, "epoch": 3409} {"train_loss": -6.870813369750977, "global_step": 143189, "epoch": 3409} {"train_loss": -6.801695823669434, "global_step": 143190, "epoch": 3409} {"train_loss": -6.8143415451049805, "global_step": 143191, "epoch": 3409} {"train_loss": -6.877362251281738, "global_step": 143192, "epoch": 3409} {"train_loss": -6.826101303100586, "global_step": 143193, "epoch": 3409} {"train_loss": -6.827596664428711, "global_step": 143194, "epoch": 3409} {"train_loss": -6.767339706420898, "global_step": 143195, "epoch": 3409} {"train_loss": -6.791491508483887, "global_step": 143196, "epoch": 3409} {"train_loss": -6.806884288787842, "global_step": 143197, "epoch": 3409} {"train_loss": -6.790564060211182, "global_step": 143198, "epoch": 3409} {"train_loss": -6.764960289001465, "global_step": 143199, "epoch": 3409} {"train_loss": -6.812287330627441, "global_step": 143200, "epoch": 3409} {"train_loss": -6.812565326690674, "global_step": 143201, "epoch": 3409} {"train_loss": -6.779597282409668, "global_step": 143202, "epoch": 3409} {"train_loss": -6.728370666503906, "global_step": 143203, "epoch": 3409} {"train_loss": -6.871623992919922, "global_step": 143204, "epoch": 3409} {"train_loss": -6.771300315856934, "global_step": 143205, "epoch": 3409} {"train_loss": -6.674525260925293, "global_step": 143206, "epoch": 3409} {"train_loss": -6.789467811584473, "global_step": 143207, "epoch": 3409} {"train_loss": -6.793300151824951, "global_step": 143208, "epoch": 3409} {"train_loss": -6.795137405395508, "global_step": 143209, "epoch": 3409} {"train_loss": -6.813860893249512, "global_step": 143210, "epoch": 3409} {"train_loss": -6.833014488220215, "global_step": 143211, "epoch": 3409} {"train_loss": -6.733338832855225, "global_step": 143212, "epoch": 3409} {"train_loss": -6.69742488861084, "global_step": 143213, "epoch": 3409} {"train_loss": -6.775390148162842, "global_step": 143214, "epoch": 3409} {"train_loss": -6.7968597412109375, "global_step": 143215, "epoch": 3409} {"train_loss": -6.706528663635254, "global_step": 143216, "epoch": 3409} {"train_loss": -6.7456889152526855, "global_step": 143217, "epoch": 3409} {"train_loss": -6.705164432525635, "global_step": 143218, "epoch": 3409} {"train_loss": -6.779266584487188, "global_step": 143219, "epoch": 3409, "val_loss": 67389.4140625} {"train_loss": -6.807583332061768, "global_step": 143220, "epoch": 3410} {"train_loss": -6.8441314697265625, "global_step": 143221, "epoch": 3410} {"train_loss": -6.867605209350586, "global_step": 143222, "epoch": 3410} {"train_loss": -6.756462574005127, "global_step": 143223, "epoch": 3410} {"train_loss": -6.755979537963867, "global_step": 143224, "epoch": 3410} {"train_loss": -6.785711288452148, "global_step": 143225, "epoch": 3410} {"train_loss": -6.632016181945801, "global_step": 143226, "epoch": 3410} {"train_loss": -6.907865524291992, "global_step": 143227, "epoch": 3410} {"train_loss": -6.731554985046387, "global_step": 143228, "epoch": 3410} {"train_loss": -6.817862510681152, "global_step": 143229, "epoch": 3410} {"train_loss": -6.717495918273926, "global_step": 143230, "epoch": 3410} {"train_loss": -6.715936660766602, "global_step": 143231, "epoch": 3410} {"train_loss": -6.842018127441406, "global_step": 143232, "epoch": 3410} {"train_loss": -6.909485816955566, "global_step": 143233, "epoch": 3410} {"train_loss": -6.621150493621826, "global_step": 143234, "epoch": 3410} {"train_loss": -6.845762729644775, "global_step": 143235, "epoch": 3410} {"train_loss": -6.812111854553223, "global_step": 143236, "epoch": 3410} {"train_loss": -6.80984354019165, "global_step": 143237, "epoch": 3410} {"train_loss": -6.808756351470947, "global_step": 143238, "epoch": 3410} {"train_loss": -6.846680641174316, "global_step": 143239, "epoch": 3410} {"train_loss": -6.836549282073975, "global_step": 143240, "epoch": 3410} {"train_loss": -6.922677040100098, "global_step": 143241, "epoch": 3410} {"train_loss": -6.926043510437012, "global_step": 143242, "epoch": 3410} {"train_loss": -6.809739112854004, "global_step": 143243, "epoch": 3410} {"train_loss": -6.783975601196289, "global_step": 143244, "epoch": 3410} {"train_loss": -6.94954776763916, "global_step": 143245, "epoch": 3410} {"train_loss": -6.763116836547852, "global_step": 143246, "epoch": 3410} {"train_loss": -6.73528528213501, "global_step": 143247, "epoch": 3410} {"train_loss": -6.773882865905762, "global_step": 143248, "epoch": 3410} {"train_loss": -6.844661712646484, "global_step": 143249, "epoch": 3410} {"train_loss": -6.740362644195557, "global_step": 143250, "epoch": 3410} {"train_loss": -6.8403472900390625, "global_step": 143251, "epoch": 3410} {"train_loss": -6.829533100128174, "global_step": 143252, "epoch": 3410} {"train_loss": -6.808683395385742, "global_step": 143253, "epoch": 3410} {"train_loss": -6.847269058227539, "global_step": 143254, "epoch": 3410} {"train_loss": -6.908576965332031, "global_step": 143255, "epoch": 3410} {"train_loss": -6.809632301330566, "global_step": 143256, "epoch": 3410} {"train_loss": -6.796457290649414, "global_step": 143257, "epoch": 3410} {"train_loss": -6.787484169006348, "global_step": 143258, "epoch": 3410} {"train_loss": -6.84559440612793, "global_step": 143259, "epoch": 3410} {"train_loss": -6.844559192657471, "global_step": 143260, "epoch": 3410} {"train_loss": -6.810371557871501, "global_step": 143261, "epoch": 3410, "val_loss": 67628.7890625} {"train_loss": -6.85246467590332, "global_step": 143262, "epoch": 3411} {"train_loss": -6.8451313972473145, "global_step": 143263, "epoch": 3411} {"train_loss": -6.864226341247559, "global_step": 143264, "epoch": 3411} {"train_loss": -6.8372392654418945, "global_step": 143265, "epoch": 3411} {"train_loss": -6.849309921264648, "global_step": 143266, "epoch": 3411} {"train_loss": -6.744278907775879, "global_step": 143267, "epoch": 3411} {"train_loss": -6.7820844650268555, "global_step": 143268, "epoch": 3411} {"train_loss": -6.76906681060791, "global_step": 143269, "epoch": 3411} {"train_loss": -6.807257652282715, "global_step": 143270, "epoch": 3411} {"train_loss": -6.723088264465332, "global_step": 143271, "epoch": 3411} {"train_loss": -6.7111663818359375, "global_step": 143272, "epoch": 3411} {"train_loss": -6.817860126495361, "global_step": 143273, "epoch": 3411} {"train_loss": -6.708865165710449, "global_step": 143274, "epoch": 3411} {"train_loss": -6.711977958679199, "global_step": 143275, "epoch": 3411} {"train_loss": -6.71812105178833, "global_step": 143276, "epoch": 3411} {"train_loss": -6.74630069732666, "global_step": 143277, "epoch": 3411} {"train_loss": -6.680523872375488, "global_step": 143278, "epoch": 3411} {"train_loss": -6.568227767944336, "global_step": 143279, "epoch": 3411} {"train_loss": -6.818479537963867, "global_step": 143280, "epoch": 3411} {"train_loss": -6.623808860778809, "global_step": 143281, "epoch": 3411} {"train_loss": -6.783785820007324, "global_step": 143282, "epoch": 3411} {"train_loss": -6.789341449737549, "global_step": 143283, "epoch": 3411} {"train_loss": -6.778478145599365, "global_step": 143284, "epoch": 3411} {"train_loss": -6.815290927886963, "global_step": 143285, "epoch": 3411} {"train_loss": -6.70113468170166, "global_step": 143286, "epoch": 3411} {"train_loss": -6.80687141418457, "global_step": 143287, "epoch": 3411} {"train_loss": -6.678842544555664, "global_step": 143288, "epoch": 3411} {"train_loss": -6.766041278839111, "global_step": 143289, "epoch": 3411} {"train_loss": -6.873445510864258, "global_step": 143290, "epoch": 3411} {"train_loss": -6.6970109939575195, "global_step": 143291, "epoch": 3411} {"train_loss": -6.69080114364624, "global_step": 143292, "epoch": 3411} {"train_loss": -6.784942150115967, "global_step": 143293, "epoch": 3411} {"train_loss": -6.745970726013184, "global_step": 143294, "epoch": 3411} {"train_loss": -6.814000129699707, "global_step": 143295, "epoch": 3411} {"train_loss": -6.8475236892700195, "global_step": 143296, "epoch": 3411} {"train_loss": -6.780216693878174, "global_step": 143297, "epoch": 3411} {"train_loss": -6.921778678894043, "global_step": 143298, "epoch": 3411} {"train_loss": -6.782787799835205, "global_step": 143299, "epoch": 3411} {"train_loss": -6.770968437194824, "global_step": 143300, "epoch": 3411} {"train_loss": -6.7699689865112305, "global_step": 143301, "epoch": 3411} {"train_loss": -6.751866340637207, "global_step": 143302, "epoch": 3411} {"train_loss": -6.769953319004604, "global_step": 143303, "epoch": 3411, "val_loss": 67347.9453125} {"train_loss": -6.982498645782471, "global_step": 143304, "epoch": 3412} {"train_loss": -6.860012054443359, "global_step": 143305, "epoch": 3412} {"train_loss": -6.691134452819824, "global_step": 143306, "epoch": 3412} {"train_loss": -6.830295085906982, "global_step": 143307, "epoch": 3412} {"train_loss": -6.756994247436523, "global_step": 143308, "epoch": 3412} {"train_loss": -6.717578411102295, "global_step": 143309, "epoch": 3412} {"train_loss": -6.863922119140625, "global_step": 143310, "epoch": 3412} {"train_loss": -6.870199203491211, "global_step": 143311, "epoch": 3412} {"train_loss": -6.645607948303223, "global_step": 143312, "epoch": 3412} {"train_loss": -6.886996269226074, "global_step": 143313, "epoch": 3412} {"train_loss": -6.826614856719971, "global_step": 143314, "epoch": 3412} {"train_loss": -6.779836654663086, "global_step": 143315, "epoch": 3412} {"train_loss": -6.757826328277588, "global_step": 143316, "epoch": 3412} {"train_loss": -6.707017421722412, "global_step": 143317, "epoch": 3412} {"train_loss": -6.769413471221924, "global_step": 143318, "epoch": 3412} {"train_loss": -6.734446048736572, "global_step": 143319, "epoch": 3412} {"train_loss": -6.811498641967773, "global_step": 143320, "epoch": 3412} {"train_loss": -6.813825607299805, "global_step": 143321, "epoch": 3412} {"train_loss": -6.795016288757324, "global_step": 143322, "epoch": 3412} {"train_loss": -6.723551273345947, "global_step": 143323, "epoch": 3412} {"train_loss": -6.890264511108398, "global_step": 143324, "epoch": 3412} {"train_loss": -6.890098571777344, "global_step": 143325, "epoch": 3412} {"train_loss": -6.784518241882324, "global_step": 143326, "epoch": 3412} {"train_loss": -6.78961181640625, "global_step": 143327, "epoch": 3412} {"train_loss": -6.778846263885498, "global_step": 143328, "epoch": 3412} {"train_loss": -6.786373138427734, "global_step": 143329, "epoch": 3412} {"train_loss": -6.771759033203125, "global_step": 143330, "epoch": 3412} {"train_loss": -6.806155204772949, "global_step": 143331, "epoch": 3412} {"train_loss": -6.736937046051025, "global_step": 143332, "epoch": 3412} {"train_loss": -6.685349464416504, "global_step": 143333, "epoch": 3412} {"train_loss": -6.711299896240234, "global_step": 143334, "epoch": 3412} {"train_loss": -6.879960060119629, "global_step": 143335, "epoch": 3412} {"train_loss": -6.8429975509643555, "global_step": 143336, "epoch": 3412} {"train_loss": -6.648674011230469, "global_step": 143337, "epoch": 3412} {"train_loss": -6.76483154296875, "global_step": 143338, "epoch": 3412} {"train_loss": -6.799135208129883, "global_step": 143339, "epoch": 3412} {"train_loss": -6.738471031188965, "global_step": 143340, "epoch": 3412} {"train_loss": -6.770690441131592, "global_step": 143341, "epoch": 3412} {"train_loss": -6.788522720336914, "global_step": 143342, "epoch": 3412} {"train_loss": -6.717643737792969, "global_step": 143343, "epoch": 3412} {"train_loss": -6.868007659912109, "global_step": 143344, "epoch": 3412} {"train_loss": -6.783681551615397, "global_step": 143345, "epoch": 3412, "val_loss": 67614.4921875} {"train_loss": -6.756326675415039, "global_step": 143346, "epoch": 3413} {"train_loss": -6.744863510131836, "global_step": 143347, "epoch": 3413} {"train_loss": -6.833531379699707, "global_step": 143348, "epoch": 3413} {"train_loss": -6.795139312744141, "global_step": 143349, "epoch": 3413} {"train_loss": -6.829292297363281, "global_step": 143350, "epoch": 3413} {"train_loss": -6.767358779907227, "global_step": 143351, "epoch": 3413} {"train_loss": -6.752062797546387, "global_step": 143352, "epoch": 3413} {"train_loss": -6.707748889923096, "global_step": 143353, "epoch": 3413} {"train_loss": -6.742796897888184, "global_step": 143354, "epoch": 3413} {"train_loss": -6.773947238922119, "global_step": 143355, "epoch": 3413} {"train_loss": -6.743551731109619, "global_step": 143356, "epoch": 3413} {"train_loss": -6.773669242858887, "global_step": 143357, "epoch": 3413} {"train_loss": -6.811619758605957, "global_step": 143358, "epoch": 3413} {"train_loss": -6.718454837799072, "global_step": 143359, "epoch": 3413} {"train_loss": -6.748668670654297, "global_step": 143360, "epoch": 3413} {"train_loss": -6.717713832855225, "global_step": 143361, "epoch": 3413} {"train_loss": -6.907675743103027, "global_step": 143362, "epoch": 3413} {"train_loss": -6.742037773132324, "global_step": 143363, "epoch": 3413} {"train_loss": -6.818879127502441, "global_step": 143364, "epoch": 3413} {"train_loss": -6.899867534637451, "global_step": 143365, "epoch": 3413} {"train_loss": -6.714751243591309, "global_step": 143366, "epoch": 3413} {"train_loss": -6.6917548179626465, "global_step": 143367, "epoch": 3413} {"train_loss": -6.7769904136657715, "global_step": 143368, "epoch": 3413} {"train_loss": -6.811184406280518, "global_step": 143369, "epoch": 3413} {"train_loss": -6.641875267028809, "global_step": 143370, "epoch": 3413} {"train_loss": -6.756608009338379, "global_step": 143371, "epoch": 3413} {"train_loss": -6.83148193359375, "global_step": 143372, "epoch": 3413} {"train_loss": -6.826844692230225, "global_step": 143373, "epoch": 3413} {"train_loss": -6.700355052947998, "global_step": 143374, "epoch": 3413} {"train_loss": -6.892692565917969, "global_step": 143375, "epoch": 3413} {"train_loss": -6.781322956085205, "global_step": 143376, "epoch": 3413} {"train_loss": -6.832820892333984, "global_step": 143377, "epoch": 3413} {"train_loss": -6.744673252105713, "global_step": 143378, "epoch": 3413} {"train_loss": -6.798236846923828, "global_step": 143379, "epoch": 3413} {"train_loss": -6.8485002517700195, "global_step": 143380, "epoch": 3413} {"train_loss": -6.758612632751465, "global_step": 143381, "epoch": 3413} {"train_loss": -6.851273536682129, "global_step": 143382, "epoch": 3413} {"train_loss": -6.868124961853027, "global_step": 143383, "epoch": 3413} {"train_loss": -6.8564372062683105, "global_step": 143384, "epoch": 3413} {"train_loss": -6.756275653839111, "global_step": 143385, "epoch": 3413} {"train_loss": -6.729090690612793, "global_step": 143386, "epoch": 3413} {"train_loss": -6.783800511133103, "global_step": 143387, "epoch": 3413, "val_loss": 67383.5546875} {"train_loss": -6.840327739715576, "global_step": 143388, "epoch": 3414} {"train_loss": -6.846048355102539, "global_step": 143389, "epoch": 3414} {"train_loss": -6.857596397399902, "global_step": 143390, "epoch": 3414} {"train_loss": -6.896382808685303, "global_step": 143391, "epoch": 3414} {"train_loss": -6.791860580444336, "global_step": 143392, "epoch": 3414} {"train_loss": -6.766768455505371, "global_step": 143393, "epoch": 3414} {"train_loss": -6.752899169921875, "global_step": 143394, "epoch": 3414} {"train_loss": -6.768425941467285, "global_step": 143395, "epoch": 3414} {"train_loss": -6.948660373687744, "global_step": 143396, "epoch": 3414} {"train_loss": -6.835480690002441, "global_step": 143397, "epoch": 3414} {"train_loss": -6.9287004470825195, "global_step": 143398, "epoch": 3414} {"train_loss": -6.710050582885742, "global_step": 143399, "epoch": 3414} {"train_loss": -6.827496528625488, "global_step": 143400, "epoch": 3414} {"train_loss": -6.961578369140625, "global_step": 143401, "epoch": 3414} {"train_loss": -6.806497573852539, "global_step": 143402, "epoch": 3414} {"train_loss": -6.797118663787842, "global_step": 143403, "epoch": 3414} {"train_loss": -6.8398308753967285, "global_step": 143404, "epoch": 3414} {"train_loss": -6.820232391357422, "global_step": 143405, "epoch": 3414} {"train_loss": -6.758936882019043, "global_step": 143406, "epoch": 3414} {"train_loss": -6.8386149406433105, "global_step": 143407, "epoch": 3414} {"train_loss": -6.83798360824585, "global_step": 143408, "epoch": 3414} {"train_loss": -6.822412490844727, "global_step": 143409, "epoch": 3414} {"train_loss": -6.916426658630371, "global_step": 143410, "epoch": 3414} {"train_loss": -6.754942417144775, "global_step": 143411, "epoch": 3414} {"train_loss": -6.921656608581543, "global_step": 143412, "epoch": 3414} {"train_loss": -6.796326160430908, "global_step": 143413, "epoch": 3414} {"train_loss": -6.895092487335205, "global_step": 143414, "epoch": 3414} {"train_loss": -6.801517486572266, "global_step": 143415, "epoch": 3414} {"train_loss": -6.738852500915527, "global_step": 143416, "epoch": 3414} {"train_loss": -6.778984546661377, "global_step": 143417, "epoch": 3414} {"train_loss": -6.718335151672363, "global_step": 143418, "epoch": 3414} {"train_loss": -6.750955581665039, "global_step": 143419, "epoch": 3414} {"train_loss": -6.80734920501709, "global_step": 143420, "epoch": 3414} {"train_loss": -6.681675434112549, "global_step": 143421, "epoch": 3414} {"train_loss": -6.847757339477539, "global_step": 143422, "epoch": 3414} {"train_loss": -6.833856105804443, "global_step": 143423, "epoch": 3414} {"train_loss": -6.904311180114746, "global_step": 143424, "epoch": 3414} {"train_loss": -6.806229114532471, "global_step": 143425, "epoch": 3414} {"train_loss": -6.914849281311035, "global_step": 143426, "epoch": 3414} {"train_loss": -6.876925468444824, "global_step": 143427, "epoch": 3414} {"train_loss": -6.896705627441406, "global_step": 143428, "epoch": 3414} {"train_loss": -6.825164749508812, "global_step": 143429, "epoch": 3414, "val_loss": 67585.171875} {"train_loss": -6.810805320739746, "global_step": 143430, "epoch": 3415} {"train_loss": -6.8092474937438965, "global_step": 143431, "epoch": 3415} {"train_loss": -6.840468883514404, "global_step": 143432, "epoch": 3415} {"train_loss": -6.830738067626953, "global_step": 143433, "epoch": 3415} {"train_loss": -6.88581657409668, "global_step": 143434, "epoch": 3415} {"train_loss": -6.867240905761719, "global_step": 143435, "epoch": 3415} {"train_loss": -6.835552215576172, "global_step": 143436, "epoch": 3415} {"train_loss": -6.903346538543701, "global_step": 143437, "epoch": 3415} {"train_loss": -6.733098030090332, "global_step": 143438, "epoch": 3415} {"train_loss": -6.880645275115967, "global_step": 143439, "epoch": 3415} {"train_loss": -6.717066287994385, "global_step": 143440, "epoch": 3415} {"train_loss": -6.885020732879639, "global_step": 143441, "epoch": 3415} {"train_loss": -6.768520355224609, "global_step": 143442, "epoch": 3415} {"train_loss": -6.596583366394043, "global_step": 143443, "epoch": 3415} {"train_loss": -6.800504207611084, "global_step": 143444, "epoch": 3415} {"train_loss": -6.815646171569824, "global_step": 143445, "epoch": 3415} {"train_loss": -7.0143561363220215, "global_step": 143446, "epoch": 3415} {"train_loss": -6.865384101867676, "global_step": 143447, "epoch": 3415} {"train_loss": -6.848114490509033, "global_step": 143448, "epoch": 3415} {"train_loss": -6.85055685043335, "global_step": 143449, "epoch": 3415} {"train_loss": -6.841466903686523, "global_step": 143450, "epoch": 3415} {"train_loss": -6.833855628967285, "global_step": 143451, "epoch": 3415} {"train_loss": -6.749062538146973, "global_step": 143452, "epoch": 3415} {"train_loss": -6.700320243835449, "global_step": 143453, "epoch": 3415} {"train_loss": -6.9177327156066895, "global_step": 143454, "epoch": 3415} {"train_loss": -6.7260894775390625, "global_step": 143455, "epoch": 3415} {"train_loss": -6.826733112335205, "global_step": 143456, "epoch": 3415} {"train_loss": -6.847100257873535, "global_step": 143457, "epoch": 3415} {"train_loss": -6.746078968048096, "global_step": 143458, "epoch": 3415} {"train_loss": -6.731899261474609, "global_step": 143459, "epoch": 3415} {"train_loss": -6.68720817565918, "global_step": 143460, "epoch": 3415} {"train_loss": -6.808220863342285, "global_step": 143461, "epoch": 3415} {"train_loss": -6.815796375274658, "global_step": 143462, "epoch": 3415} {"train_loss": -6.783979415893555, "global_step": 143463, "epoch": 3415} {"train_loss": -6.727550983428955, "global_step": 143464, "epoch": 3415} {"train_loss": -6.793952941894531, "global_step": 143465, "epoch": 3415} {"train_loss": -6.817739486694336, "global_step": 143466, "epoch": 3415} {"train_loss": -6.8919878005981445, "global_step": 143467, "epoch": 3415} {"train_loss": -6.826665878295898, "global_step": 143468, "epoch": 3415} {"train_loss": -6.728470802307129, "global_step": 143469, "epoch": 3415} {"train_loss": -6.745041847229004, "global_step": 143470, "epoch": 3415} {"train_loss": -6.804249979200817, "global_step": 143471, "epoch": 3415, "val_loss": 67454.046875} {"train_loss": -6.713984489440918, "global_step": 143472, "epoch": 3416} {"train_loss": -6.78652286529541, "global_step": 143473, "epoch": 3416} {"train_loss": -6.677279472351074, "global_step": 143474, "epoch": 3416} {"train_loss": -6.749846458435059, "global_step": 143475, "epoch": 3416} {"train_loss": -6.773117542266846, "global_step": 143476, "epoch": 3416} {"train_loss": -6.678763389587402, "global_step": 143477, "epoch": 3416} {"train_loss": -6.725486755371094, "global_step": 143478, "epoch": 3416} {"train_loss": -6.770848751068115, "global_step": 143479, "epoch": 3416} {"train_loss": -6.744100570678711, "global_step": 143480, "epoch": 3416} {"train_loss": -6.851326942443848, "global_step": 143481, "epoch": 3416} {"train_loss": -6.889620780944824, "global_step": 143482, "epoch": 3416} {"train_loss": -6.789668560028076, "global_step": 143483, "epoch": 3416} {"train_loss": -6.720327377319336, "global_step": 143484, "epoch": 3416} {"train_loss": -6.878298282623291, "global_step": 143485, "epoch": 3416} {"train_loss": -6.759443283081055, "global_step": 143486, "epoch": 3416} {"train_loss": -6.740354537963867, "global_step": 143487, "epoch": 3416} {"train_loss": -6.859222412109375, "global_step": 143488, "epoch": 3416} {"train_loss": -6.7977705001831055, "global_step": 143489, "epoch": 3416} {"train_loss": -6.763259410858154, "global_step": 143490, "epoch": 3416} {"train_loss": -6.766324043273926, "global_step": 143491, "epoch": 3416} {"train_loss": -6.802331924438477, "global_step": 143492, "epoch": 3416} {"train_loss": -6.627073764801025, "global_step": 143493, "epoch": 3416} {"train_loss": -6.836034774780273, "global_step": 143494, "epoch": 3416} {"train_loss": -6.607807159423828, "global_step": 143495, "epoch": 3416} {"train_loss": -6.733970642089844, "global_step": 143496, "epoch": 3416} {"train_loss": -6.723304748535156, "global_step": 143497, "epoch": 3416} {"train_loss": -6.602915287017822, "global_step": 143498, "epoch": 3416} {"train_loss": -6.723756790161133, "global_step": 143499, "epoch": 3416} {"train_loss": -6.4147491455078125, "global_step": 143500, "epoch": 3416} {"train_loss": -6.595955848693848, "global_step": 143501, "epoch": 3416} {"train_loss": -6.592250823974609, "global_step": 143502, "epoch": 3416} {"train_loss": -6.676092147827148, "global_step": 143503, "epoch": 3416} {"train_loss": -6.593590259552002, "global_step": 143504, "epoch": 3416} {"train_loss": -6.646455764770508, "global_step": 143505, "epoch": 3416} {"train_loss": -6.569240570068359, "global_step": 143506, "epoch": 3416} {"train_loss": -6.569048881530762, "global_step": 143507, "epoch": 3416} {"train_loss": -6.695456027984619, "global_step": 143508, "epoch": 3416} {"train_loss": -6.5524582862854, "global_step": 143509, "epoch": 3416} {"train_loss": -6.745593547821045, "global_step": 143510, "epoch": 3416} {"train_loss": -6.703127861022949, "global_step": 143511, "epoch": 3416} {"train_loss": -6.6420488357543945, "global_step": 143512, "epoch": 3416} {"train_loss": -6.708329779761178, "global_step": 143513, "epoch": 3416, "val_loss": 67748.953125} {"train_loss": -6.695699691772461, "global_step": 143514, "epoch": 3417} {"train_loss": -6.707812309265137, "global_step": 143515, "epoch": 3417} {"train_loss": -6.654699325561523, "global_step": 143516, "epoch": 3417} {"train_loss": -6.7702436447143555, "global_step": 143517, "epoch": 3417} {"train_loss": -6.711249351501465, "global_step": 143518, "epoch": 3417} {"train_loss": -6.633627891540527, "global_step": 143519, "epoch": 3417} {"train_loss": -6.671136379241943, "global_step": 143520, "epoch": 3417} {"train_loss": -6.743411064147949, "global_step": 143521, "epoch": 3417} {"train_loss": -6.782792568206787, "global_step": 143522, "epoch": 3417} {"train_loss": -6.731423377990723, "global_step": 143523, "epoch": 3417} {"train_loss": -6.7150750160217285, "global_step": 143524, "epoch": 3417} {"train_loss": -6.776233673095703, "global_step": 143525, "epoch": 3417} {"train_loss": -6.669358253479004, "global_step": 143526, "epoch": 3417} {"train_loss": -6.676159858703613, "global_step": 143527, "epoch": 3417} {"train_loss": -6.756868362426758, "global_step": 143528, "epoch": 3417} {"train_loss": -6.762233734130859, "global_step": 143529, "epoch": 3417} {"train_loss": -6.666927337646484, "global_step": 143530, "epoch": 3417} {"train_loss": -6.68094539642334, "global_step": 143531, "epoch": 3417} {"train_loss": -6.780916213989258, "global_step": 143532, "epoch": 3417} {"train_loss": -6.857251167297363, "global_step": 143533, "epoch": 3417} {"train_loss": -6.738349437713623, "global_step": 143534, "epoch": 3417} {"train_loss": -6.815813064575195, "global_step": 143535, "epoch": 3417} {"train_loss": -6.852203369140625, "global_step": 143536, "epoch": 3417} {"train_loss": -6.821256637573242, "global_step": 143537, "epoch": 3417} {"train_loss": -6.748226165771484, "global_step": 143538, "epoch": 3417} {"train_loss": -6.791441917419434, "global_step": 143539, "epoch": 3417} {"train_loss": -6.859217643737793, "global_step": 143540, "epoch": 3417} {"train_loss": -6.852435111999512, "global_step": 143541, "epoch": 3417} {"train_loss": -6.751012802124023, "global_step": 143542, "epoch": 3417} {"train_loss": -6.799314022064209, "global_step": 143543, "epoch": 3417} {"train_loss": -6.883188247680664, "global_step": 143544, "epoch": 3417} {"train_loss": -6.8920135498046875, "global_step": 143545, "epoch": 3417} {"train_loss": -6.853634834289551, "global_step": 143546, "epoch": 3417} {"train_loss": -6.8201704025268555, "global_step": 143547, "epoch": 3417} {"train_loss": -6.828762054443359, "global_step": 143548, "epoch": 3417} {"train_loss": -6.899816513061523, "global_step": 143549, "epoch": 3417} {"train_loss": -6.879816055297852, "global_step": 143550, "epoch": 3417} {"train_loss": -6.940989971160889, "global_step": 143551, "epoch": 3417} {"train_loss": -6.9152631759643555, "global_step": 143552, "epoch": 3417} {"train_loss": -6.904781341552734, "global_step": 143553, "epoch": 3417} {"train_loss": -6.913116455078125, "global_step": 143554, "epoch": 3417} {"train_loss": -6.787724846885318, "global_step": 143555, "epoch": 3417, "val_loss": 67480.875} {"train_loss": -6.950499057769775, "global_step": 143556, "epoch": 3418} {"train_loss": -6.905617713928223, "global_step": 143557, "epoch": 3418} {"train_loss": -6.851536273956299, "global_step": 143558, "epoch": 3418} {"train_loss": -6.907047748565674, "global_step": 143559, "epoch": 3418} {"train_loss": -6.899449825286865, "global_step": 143560, "epoch": 3418} {"train_loss": -6.8407392501831055, "global_step": 143561, "epoch": 3418} {"train_loss": -6.922237873077393, "global_step": 143562, "epoch": 3418} {"train_loss": -6.759840965270996, "global_step": 143563, "epoch": 3418} {"train_loss": -6.8767266273498535, "global_step": 143564, "epoch": 3418} {"train_loss": -6.888639450073242, "global_step": 143565, "epoch": 3418} {"train_loss": -6.795339584350586, "global_step": 143566, "epoch": 3418} {"train_loss": -6.998443603515625, "global_step": 143567, "epoch": 3418} {"train_loss": -6.8650407791137695, "global_step": 143568, "epoch": 3418} {"train_loss": -6.909776210784912, "global_step": 143569, "epoch": 3418} {"train_loss": -6.849521636962891, "global_step": 143570, "epoch": 3418} {"train_loss": -6.91666316986084, "global_step": 143571, "epoch": 3418} {"train_loss": -6.793165683746338, "global_step": 143572, "epoch": 3418} {"train_loss": -6.829076766967773, "global_step": 143573, "epoch": 3418} {"train_loss": -6.9092206954956055, "global_step": 143574, "epoch": 3418} {"train_loss": -6.780076026916504, "global_step": 143575, "epoch": 3418} {"train_loss": -6.784821510314941, "global_step": 143576, "epoch": 3418} {"train_loss": -6.68547248840332, "global_step": 143577, "epoch": 3418} {"train_loss": -6.7242326736450195, "global_step": 143578, "epoch": 3418} {"train_loss": -6.829746246337891, "global_step": 143579, "epoch": 3418} {"train_loss": -6.782078742980957, "global_step": 143580, "epoch": 3418} {"train_loss": -6.748585224151611, "global_step": 143581, "epoch": 3418} {"train_loss": -6.722888946533203, "global_step": 143582, "epoch": 3418} {"train_loss": -6.736480712890625, "global_step": 143583, "epoch": 3418} {"train_loss": -6.779330730438232, "global_step": 143584, "epoch": 3418} {"train_loss": -6.680174827575684, "global_step": 143585, "epoch": 3418} {"train_loss": -6.845192909240723, "global_step": 143586, "epoch": 3418} {"train_loss": -6.763365268707275, "global_step": 143587, "epoch": 3418} {"train_loss": -6.805046081542969, "global_step": 143588, "epoch": 3418} {"train_loss": -6.737982749938965, "global_step": 143589, "epoch": 3418} {"train_loss": -6.770549774169922, "global_step": 143590, "epoch": 3418} {"train_loss": -6.749821662902832, "global_step": 143591, "epoch": 3418} {"train_loss": -6.845028400421143, "global_step": 143592, "epoch": 3418} {"train_loss": -6.804882049560547, "global_step": 143593, "epoch": 3418} {"train_loss": -6.735753059387207, "global_step": 143594, "epoch": 3418} {"train_loss": -6.757509708404541, "global_step": 143595, "epoch": 3418} {"train_loss": -6.818865776062012, "global_step": 143596, "epoch": 3418} {"train_loss": -6.8199575287955145, "global_step": 143597, "epoch": 3418, "val_loss": 67418.75} {"train_loss": -6.68942928314209, "global_step": 143598, "epoch": 3419} {"train_loss": -6.776307106018066, "global_step": 143599, "epoch": 3419} {"train_loss": -6.767169952392578, "global_step": 143600, "epoch": 3419} {"train_loss": -6.819096565246582, "global_step": 143601, "epoch": 3419} {"train_loss": -6.768782615661621, "global_step": 143602, "epoch": 3419} {"train_loss": -6.799076080322266, "global_step": 143603, "epoch": 3419} {"train_loss": -6.815773010253906, "global_step": 143604, "epoch": 3419} {"train_loss": -6.669017314910889, "global_step": 143605, "epoch": 3419} {"train_loss": -6.7861785888671875, "global_step": 143606, "epoch": 3419} {"train_loss": -6.888051986694336, "global_step": 143607, "epoch": 3419} {"train_loss": -6.824726581573486, "global_step": 143608, "epoch": 3419} {"train_loss": -6.803502559661865, "global_step": 143609, "epoch": 3419} {"train_loss": -6.792644023895264, "global_step": 143610, "epoch": 3419} {"train_loss": -6.8093581199646, "global_step": 143611, "epoch": 3419} {"train_loss": -6.845080375671387, "global_step": 143612, "epoch": 3419} {"train_loss": -6.724364280700684, "global_step": 143613, "epoch": 3419} {"train_loss": -6.841427803039551, "global_step": 143614, "epoch": 3419} {"train_loss": -6.808223724365234, "global_step": 143615, "epoch": 3419} {"train_loss": -6.902199745178223, "global_step": 143616, "epoch": 3419} {"train_loss": -6.794510841369629, "global_step": 143617, "epoch": 3419} {"train_loss": -6.833755016326904, "global_step": 143618, "epoch": 3419} {"train_loss": -6.904271125793457, "global_step": 143619, "epoch": 3419} {"train_loss": -6.745576858520508, "global_step": 143620, "epoch": 3419} {"train_loss": -6.8539557456970215, "global_step": 143621, "epoch": 3419} {"train_loss": -6.797889709472656, "global_step": 143622, "epoch": 3419} {"train_loss": -6.7259907722473145, "global_step": 143623, "epoch": 3419} {"train_loss": -6.87282657623291, "global_step": 143624, "epoch": 3419} {"train_loss": -6.827620983123779, "global_step": 143625, "epoch": 3419} {"train_loss": -6.837175369262695, "global_step": 143626, "epoch": 3419} {"train_loss": -6.6922078132629395, "global_step": 143627, "epoch": 3419} {"train_loss": -6.816816806793213, "global_step": 143628, "epoch": 3419} {"train_loss": -6.882524490356445, "global_step": 143629, "epoch": 3419} {"train_loss": -6.79884672164917, "global_step": 143630, "epoch": 3419} {"train_loss": -6.815367698669434, "global_step": 143631, "epoch": 3419} {"train_loss": -6.882323265075684, "global_step": 143632, "epoch": 3419} {"train_loss": -6.836401462554932, "global_step": 143633, "epoch": 3419} {"train_loss": -6.759111404418945, "global_step": 143634, "epoch": 3419} {"train_loss": -6.808710098266602, "global_step": 143635, "epoch": 3419} {"train_loss": -6.79263162612915, "global_step": 143636, "epoch": 3419} {"train_loss": -6.833080291748047, "global_step": 143637, "epoch": 3419} {"train_loss": -6.785706043243408, "global_step": 143638, "epoch": 3419} {"train_loss": -6.805987914403279, "global_step": 143639, "epoch": 3419, "val_loss": 67700.734375} {"train_loss": -6.792121887207031, "global_step": 143640, "epoch": 3420} {"train_loss": -6.801905632019043, "global_step": 143641, "epoch": 3420} {"train_loss": -6.786195755004883, "global_step": 143642, "epoch": 3420} {"train_loss": -6.805941581726074, "global_step": 143643, "epoch": 3420} {"train_loss": -6.669052600860596, "global_step": 143644, "epoch": 3420} {"train_loss": -6.780754089355469, "global_step": 143645, "epoch": 3420} {"train_loss": -6.759361267089844, "global_step": 143646, "epoch": 3420} {"train_loss": -6.800657272338867, "global_step": 143647, "epoch": 3420} {"train_loss": -6.808833599090576, "global_step": 143648, "epoch": 3420} {"train_loss": -6.887884140014648, "global_step": 143649, "epoch": 3420} {"train_loss": -6.850746154785156, "global_step": 143650, "epoch": 3420} {"train_loss": -6.678532600402832, "global_step": 143651, "epoch": 3420} {"train_loss": -6.8018670082092285, "global_step": 143652, "epoch": 3420} {"train_loss": -6.7549238204956055, "global_step": 143653, "epoch": 3420} {"train_loss": -6.693961143493652, "global_step": 143654, "epoch": 3420} {"train_loss": -6.787754535675049, "global_step": 143655, "epoch": 3420} {"train_loss": -6.68785285949707, "global_step": 143656, "epoch": 3420} {"train_loss": -6.624142646789551, "global_step": 143657, "epoch": 3420} {"train_loss": -6.725095748901367, "global_step": 143658, "epoch": 3420} {"train_loss": -6.796940803527832, "global_step": 143659, "epoch": 3420} {"train_loss": -6.722665786743164, "global_step": 143660, "epoch": 3420} {"train_loss": -6.644065856933594, "global_step": 143661, "epoch": 3420} {"train_loss": -6.64882755279541, "global_step": 143662, "epoch": 3420} {"train_loss": -6.750936508178711, "global_step": 143663, "epoch": 3420} {"train_loss": -6.71980094909668, "global_step": 143664, "epoch": 3420} {"train_loss": -6.663741111755371, "global_step": 143665, "epoch": 3420} {"train_loss": -6.683229446411133, "global_step": 143666, "epoch": 3420} {"train_loss": -6.781655311584473, "global_step": 143667, "epoch": 3420} {"train_loss": -6.704554080963135, "global_step": 143668, "epoch": 3420} {"train_loss": -6.823980331420898, "global_step": 143669, "epoch": 3420} {"train_loss": -6.680513381958008, "global_step": 143670, "epoch": 3420} {"train_loss": -6.842738151550293, "global_step": 143671, "epoch": 3420} {"train_loss": -6.667189598083496, "global_step": 143672, "epoch": 3420} {"train_loss": -6.780665397644043, "global_step": 143673, "epoch": 3420} {"train_loss": -6.644435882568359, "global_step": 143674, "epoch": 3420} {"train_loss": -6.752831935882568, "global_step": 143675, "epoch": 3420} {"train_loss": -6.740070343017578, "global_step": 143676, "epoch": 3420} {"train_loss": -6.740087509155273, "global_step": 143677, "epoch": 3420} {"train_loss": -6.702486515045166, "global_step": 143678, "epoch": 3420} {"train_loss": -6.719147682189941, "global_step": 143679, "epoch": 3420} {"train_loss": -6.66182804107666, "global_step": 143680, "epoch": 3420} {"train_loss": -6.740832419622512, "global_step": 143681, "epoch": 3420, "val_loss": 67633.9140625} {"train_loss": -6.874092102050781, "global_step": 143682, "epoch": 3421} {"train_loss": -6.777173042297363, "global_step": 143683, "epoch": 3421} {"train_loss": -6.858705997467041, "global_step": 143684, "epoch": 3421} {"train_loss": -6.714750289916992, "global_step": 143685, "epoch": 3421} {"train_loss": -6.827478408813477, "global_step": 143686, "epoch": 3421} {"train_loss": -6.842212677001953, "global_step": 143687, "epoch": 3421} {"train_loss": -6.801228046417236, "global_step": 143688, "epoch": 3421} {"train_loss": -6.763387680053711, "global_step": 143689, "epoch": 3421} {"train_loss": -6.7929840087890625, "global_step": 143690, "epoch": 3421} {"train_loss": -6.882275104522705, "global_step": 143691, "epoch": 3421} {"train_loss": -6.861966133117676, "global_step": 143692, "epoch": 3421} {"train_loss": -6.764911651611328, "global_step": 143693, "epoch": 3421} {"train_loss": -6.738768100738525, "global_step": 143694, "epoch": 3421} {"train_loss": -6.829606056213379, "global_step": 143695, "epoch": 3421} {"train_loss": -6.803706169128418, "global_step": 143696, "epoch": 3421} {"train_loss": -6.819138050079346, "global_step": 143697, "epoch": 3421} {"train_loss": -6.739236831665039, "global_step": 143698, "epoch": 3421} {"train_loss": -6.7220306396484375, "global_step": 143699, "epoch": 3421} {"train_loss": -6.732338905334473, "global_step": 143700, "epoch": 3421} {"train_loss": -6.90424919128418, "global_step": 143701, "epoch": 3421} {"train_loss": -6.880524635314941, "global_step": 143702, "epoch": 3421} {"train_loss": -6.798954963684082, "global_step": 143703, "epoch": 3421} {"train_loss": -6.879303932189941, "global_step": 143704, "epoch": 3421} {"train_loss": -6.774770736694336, "global_step": 143705, "epoch": 3421} {"train_loss": -6.78102970123291, "global_step": 143706, "epoch": 3421} {"train_loss": -6.921146392822266, "global_step": 143707, "epoch": 3421} {"train_loss": -6.753940582275391, "global_step": 143708, "epoch": 3421} {"train_loss": -6.819360256195068, "global_step": 143709, "epoch": 3421} {"train_loss": -6.769710540771484, "global_step": 143710, "epoch": 3421} {"train_loss": -6.8544392585754395, "global_step": 143711, "epoch": 3421} {"train_loss": -6.745275974273682, "global_step": 143712, "epoch": 3421} {"train_loss": -6.849450588226318, "global_step": 143713, "epoch": 3421} {"train_loss": -6.7263922691345215, "global_step": 143714, "epoch": 3421} {"train_loss": -6.5947699546813965, "global_step": 143715, "epoch": 3421} {"train_loss": -6.768316745758057, "global_step": 143716, "epoch": 3421} {"train_loss": -6.794350624084473, "global_step": 143717, "epoch": 3421} {"train_loss": -6.769947528839111, "global_step": 143718, "epoch": 3421} {"train_loss": -6.92751932144165, "global_step": 143719, "epoch": 3421} {"train_loss": -6.743152141571045, "global_step": 143720, "epoch": 3421} {"train_loss": -6.9162797927856445, "global_step": 143721, "epoch": 3421} {"train_loss": -6.743831157684326, "global_step": 143722, "epoch": 3421} {"train_loss": -6.7984565780276345, "global_step": 143723, "epoch": 3421, "val_loss": 67547.3046875} {"train_loss": -6.747883319854736, "global_step": 143724, "epoch": 3422} {"train_loss": -6.765369892120361, "global_step": 143725, "epoch": 3422} {"train_loss": -6.741092681884766, "global_step": 143726, "epoch": 3422} {"train_loss": -6.876070976257324, "global_step": 143727, "epoch": 3422} {"train_loss": -6.778800964355469, "global_step": 143728, "epoch": 3422} {"train_loss": -6.774112701416016, "global_step": 143729, "epoch": 3422} {"train_loss": -6.7222900390625, "global_step": 143730, "epoch": 3422} {"train_loss": -6.8947978019714355, "global_step": 143731, "epoch": 3422} {"train_loss": -6.780326843261719, "global_step": 143732, "epoch": 3422} {"train_loss": -6.721280097961426, "global_step": 143733, "epoch": 3422} {"train_loss": -6.728477478027344, "global_step": 143734, "epoch": 3422} {"train_loss": -6.842568397521973, "global_step": 143735, "epoch": 3422} {"train_loss": -6.777918338775635, "global_step": 143736, "epoch": 3422} {"train_loss": -6.717674255371094, "global_step": 143737, "epoch": 3422} {"train_loss": -6.746715545654297, "global_step": 143738, "epoch": 3422} {"train_loss": -6.903059005737305, "global_step": 143739, "epoch": 3422} {"train_loss": -6.895303249359131, "global_step": 143740, "epoch": 3422} {"train_loss": -6.770143985748291, "global_step": 143741, "epoch": 3422} {"train_loss": -6.71759033203125, "global_step": 143742, "epoch": 3422} {"train_loss": -6.876513957977295, "global_step": 143743, "epoch": 3422} {"train_loss": -6.797405242919922, "global_step": 143744, "epoch": 3422} {"train_loss": -6.822199821472168, "global_step": 143745, "epoch": 3422} {"train_loss": -6.792512893676758, "global_step": 143746, "epoch": 3422} {"train_loss": -6.732296943664551, "global_step": 143747, "epoch": 3422} {"train_loss": -6.7637810707092285, "global_step": 143748, "epoch": 3422} {"train_loss": -6.787024021148682, "global_step": 143749, "epoch": 3422} {"train_loss": -6.812963485717773, "global_step": 143750, "epoch": 3422} {"train_loss": -6.751673698425293, "global_step": 143751, "epoch": 3422} {"train_loss": -6.80924129486084, "global_step": 143752, "epoch": 3422} {"train_loss": -6.783730506896973, "global_step": 143753, "epoch": 3422} {"train_loss": -6.80314826965332, "global_step": 143754, "epoch": 3422} {"train_loss": -6.656508445739746, "global_step": 143755, "epoch": 3422} {"train_loss": -6.733468055725098, "global_step": 143756, "epoch": 3422} {"train_loss": -6.715401649475098, "global_step": 143757, "epoch": 3422} {"train_loss": -6.679422378540039, "global_step": 143758, "epoch": 3422} {"train_loss": -6.835244178771973, "global_step": 143759, "epoch": 3422} {"train_loss": -6.740374565124512, "global_step": 143760, "epoch": 3422} {"train_loss": -6.793684005737305, "global_step": 143761, "epoch": 3422} {"train_loss": -6.758474349975586, "global_step": 143762, "epoch": 3422} {"train_loss": -6.733892440795898, "global_step": 143763, "epoch": 3422} {"train_loss": -6.7708282470703125, "global_step": 143764, "epoch": 3422} {"train_loss": -6.777316751934233, "global_step": 143765, "epoch": 3422, "val_loss": 67540.875} {"train_loss": -6.80366849899292, "global_step": 143766, "epoch": 3423} {"train_loss": -6.730231285095215, "global_step": 143767, "epoch": 3423} {"train_loss": -6.906442642211914, "global_step": 143768, "epoch": 3423} {"train_loss": -6.800088405609131, "global_step": 143769, "epoch": 3423} {"train_loss": -6.801298141479492, "global_step": 143770, "epoch": 3423} {"train_loss": -6.866896152496338, "global_step": 143771, "epoch": 3423} {"train_loss": -6.860233783721924, "global_step": 143772, "epoch": 3423} {"train_loss": -6.710814476013184, "global_step": 143773, "epoch": 3423} {"train_loss": -6.848319053649902, "global_step": 143774, "epoch": 3423} {"train_loss": -6.937520503997803, "global_step": 143775, "epoch": 3423} {"train_loss": -6.683459281921387, "global_step": 143776, "epoch": 3423} {"train_loss": -6.773663520812988, "global_step": 143777, "epoch": 3423} {"train_loss": -6.832000732421875, "global_step": 143778, "epoch": 3423} {"train_loss": -6.740962028503418, "global_step": 143779, "epoch": 3423} {"train_loss": -6.537448883056641, "global_step": 143780, "epoch": 3423} {"train_loss": -6.7158098220825195, "global_step": 143781, "epoch": 3423} {"train_loss": -6.758220672607422, "global_step": 143782, "epoch": 3423} {"train_loss": -6.611331939697266, "global_step": 143783, "epoch": 3423} {"train_loss": -6.7382612228393555, "global_step": 143784, "epoch": 3423} {"train_loss": -6.649811744689941, "global_step": 143785, "epoch": 3423} {"train_loss": -6.408677101135254, "global_step": 143786, "epoch": 3423} {"train_loss": -6.7514262199401855, "global_step": 143787, "epoch": 3423} {"train_loss": -6.565286636352539, "global_step": 143788, "epoch": 3423} {"train_loss": -6.741945743560791, "global_step": 143789, "epoch": 3423} {"train_loss": -6.577493190765381, "global_step": 143790, "epoch": 3423} {"train_loss": -6.715757369995117, "global_step": 143791, "epoch": 3423} {"train_loss": -6.602757453918457, "global_step": 143792, "epoch": 3423} {"train_loss": -6.729976654052734, "global_step": 143793, "epoch": 3423} {"train_loss": -6.704993724822998, "global_step": 143794, "epoch": 3423} {"train_loss": -6.816666603088379, "global_step": 143795, "epoch": 3423} {"train_loss": -6.6846723556518555, "global_step": 143796, "epoch": 3423} {"train_loss": -6.822235107421875, "global_step": 143797, "epoch": 3423} {"train_loss": -6.739907264709473, "global_step": 143798, "epoch": 3423} {"train_loss": -6.689591407775879, "global_step": 143799, "epoch": 3423} {"train_loss": -6.760973930358887, "global_step": 143800, "epoch": 3423} {"train_loss": -6.691404342651367, "global_step": 143801, "epoch": 3423} {"train_loss": -6.781793594360352, "global_step": 143802, "epoch": 3423} {"train_loss": -6.769527435302734, "global_step": 143803, "epoch": 3423} {"train_loss": -6.807581901550293, "global_step": 143804, "epoch": 3423} {"train_loss": -6.796375274658203, "global_step": 143805, "epoch": 3423} {"train_loss": -6.801959991455078, "global_step": 143806, "epoch": 3423} {"train_loss": -6.738296224957421, "global_step": 143807, "epoch": 3423, "val_loss": 67535.7265625} {"train_loss": -6.9318366050720215, "global_step": 143808, "epoch": 3424} {"train_loss": -6.851336479187012, "global_step": 143809, "epoch": 3424} {"train_loss": -6.821895122528076, "global_step": 143810, "epoch": 3424} {"train_loss": -6.875668048858643, "global_step": 143811, "epoch": 3424} {"train_loss": -6.804106712341309, "global_step": 143812, "epoch": 3424} {"train_loss": -6.913761138916016, "global_step": 143813, "epoch": 3424} {"train_loss": -6.883098602294922, "global_step": 143814, "epoch": 3424} {"train_loss": -6.881509780883789, "global_step": 143815, "epoch": 3424} {"train_loss": -6.938020706176758, "global_step": 143816, "epoch": 3424} {"train_loss": -6.834584712982178, "global_step": 143817, "epoch": 3424} {"train_loss": -6.777080535888672, "global_step": 143818, "epoch": 3424} {"train_loss": -6.837546348571777, "global_step": 143819, "epoch": 3424} {"train_loss": -6.783865928649902, "global_step": 143820, "epoch": 3424} {"train_loss": -6.836019039154053, "global_step": 143821, "epoch": 3424} {"train_loss": -6.814367294311523, "global_step": 143822, "epoch": 3424} {"train_loss": -6.914306640625, "global_step": 143823, "epoch": 3424} {"train_loss": -6.96291446685791, "global_step": 143824, "epoch": 3424} {"train_loss": -6.868521690368652, "global_step": 143825, "epoch": 3424} {"train_loss": -6.847747802734375, "global_step": 143826, "epoch": 3424} {"train_loss": -6.858227729797363, "global_step": 143827, "epoch": 3424} {"train_loss": -6.803890228271484, "global_step": 143828, "epoch": 3424} {"train_loss": -6.8064446449279785, "global_step": 143829, "epoch": 3424} {"train_loss": -6.897466659545898, "global_step": 143830, "epoch": 3424} {"train_loss": -6.7922563552856445, "global_step": 143831, "epoch": 3424} {"train_loss": -6.835202693939209, "global_step": 143832, "epoch": 3424} {"train_loss": -6.891181468963623, "global_step": 143833, "epoch": 3424} {"train_loss": -6.847928524017334, "global_step": 143834, "epoch": 3424} {"train_loss": -6.8974504470825195, "global_step": 143835, "epoch": 3424} {"train_loss": -6.877710342407227, "global_step": 143836, "epoch": 3424} {"train_loss": -6.842416763305664, "global_step": 143837, "epoch": 3424} {"train_loss": -6.832086563110352, "global_step": 143838, "epoch": 3424} {"train_loss": -6.802133560180664, "global_step": 143839, "epoch": 3424} {"train_loss": -6.965570449829102, "global_step": 143840, "epoch": 3424} {"train_loss": -6.976958274841309, "global_step": 143841, "epoch": 3424} {"train_loss": -6.82658576965332, "global_step": 143842, "epoch": 3424} {"train_loss": -6.7840657234191895, "global_step": 143843, "epoch": 3424} {"train_loss": -6.84793758392334, "global_step": 143844, "epoch": 3424} {"train_loss": -6.81837272644043, "global_step": 143845, "epoch": 3424} {"train_loss": -6.827836990356445, "global_step": 143846, "epoch": 3424} {"train_loss": -6.8562469482421875, "global_step": 143847, "epoch": 3424} {"train_loss": -6.896405220031738, "global_step": 143848, "epoch": 3424} {"train_loss": -6.856845163163685, "global_step": 143849, "epoch": 3424, "val_loss": 67692.9140625} {"train_loss": -6.897239685058594, "global_step": 143850, "epoch": 3425} {"train_loss": -6.948818206787109, "global_step": 143851, "epoch": 3425} {"train_loss": -6.842284202575684, "global_step": 143852, "epoch": 3425} {"train_loss": -6.809110164642334, "global_step": 143853, "epoch": 3425} {"train_loss": -6.82359504699707, "global_step": 143854, "epoch": 3425} {"train_loss": -6.790128707885742, "global_step": 143855, "epoch": 3425} {"train_loss": -6.933435440063477, "global_step": 143856, "epoch": 3425} {"train_loss": -6.899208068847656, "global_step": 143857, "epoch": 3425} {"train_loss": -6.81900691986084, "global_step": 143858, "epoch": 3425} {"train_loss": -6.746289253234863, "global_step": 143859, "epoch": 3425} {"train_loss": -6.865753173828125, "global_step": 143860, "epoch": 3425} {"train_loss": -6.777505874633789, "global_step": 143861, "epoch": 3425} {"train_loss": -6.746706962585449, "global_step": 143862, "epoch": 3425} {"train_loss": -6.77726936340332, "global_step": 143863, "epoch": 3425} {"train_loss": -6.708564758300781, "global_step": 143864, "epoch": 3425} {"train_loss": -6.828365325927734, "global_step": 143865, "epoch": 3425} {"train_loss": -6.863643169403076, "global_step": 143866, "epoch": 3425} {"train_loss": -6.89931058883667, "global_step": 143867, "epoch": 3425} {"train_loss": -6.789533615112305, "global_step": 143868, "epoch": 3425} {"train_loss": -6.824744701385498, "global_step": 143869, "epoch": 3425} {"train_loss": -6.6847429275512695, "global_step": 143870, "epoch": 3425} {"train_loss": -6.747779369354248, "global_step": 143871, "epoch": 3425} {"train_loss": -6.824502944946289, "global_step": 143872, "epoch": 3425} {"train_loss": -6.794607639312744, "global_step": 143873, "epoch": 3425} {"train_loss": -6.788485050201416, "global_step": 143874, "epoch": 3425} {"train_loss": -6.8014020919799805, "global_step": 143875, "epoch": 3425} {"train_loss": -6.7952880859375, "global_step": 143876, "epoch": 3425} {"train_loss": -6.7928147315979, "global_step": 143877, "epoch": 3425} {"train_loss": -6.781289100646973, "global_step": 143878, "epoch": 3425} {"train_loss": -6.674785614013672, "global_step": 143879, "epoch": 3425} {"train_loss": -6.842087745666504, "global_step": 143880, "epoch": 3425} {"train_loss": -6.843752384185791, "global_step": 143881, "epoch": 3425} {"train_loss": -6.974241256713867, "global_step": 143882, "epoch": 3425} {"train_loss": -6.778630256652832, "global_step": 143883, "epoch": 3425} {"train_loss": -6.699435710906982, "global_step": 143884, "epoch": 3425} {"train_loss": -6.842226982116699, "global_step": 143885, "epoch": 3425} {"train_loss": -6.803020000457764, "global_step": 143886, "epoch": 3425} {"train_loss": -6.9256134033203125, "global_step": 143887, "epoch": 3425} {"train_loss": -6.682079315185547, "global_step": 143888, "epoch": 3425} {"train_loss": -6.805320739746094, "global_step": 143889, "epoch": 3425} {"train_loss": -6.685482025146484, "global_step": 143890, "epoch": 3425} {"train_loss": -6.809555780319941, "global_step": 143891, "epoch": 3425, "val_loss": 67792.171875} {"train_loss": -6.783226013183594, "global_step": 143892, "epoch": 3426} {"train_loss": -6.795454978942871, "global_step": 143893, "epoch": 3426} {"train_loss": -6.8576507568359375, "global_step": 143894, "epoch": 3426} {"train_loss": -6.768801689147949, "global_step": 143895, "epoch": 3426} {"train_loss": -6.771914482116699, "global_step": 143896, "epoch": 3426} {"train_loss": -6.808672904968262, "global_step": 143897, "epoch": 3426} {"train_loss": -6.871920108795166, "global_step": 143898, "epoch": 3426} {"train_loss": -6.874235153198242, "global_step": 143899, "epoch": 3426} {"train_loss": -6.813826560974121, "global_step": 143900, "epoch": 3426} {"train_loss": -6.744083881378174, "global_step": 143901, "epoch": 3426} {"train_loss": -6.927957534790039, "global_step": 143902, "epoch": 3426} {"train_loss": -6.775493621826172, "global_step": 143903, "epoch": 3426} {"train_loss": -6.764463424682617, "global_step": 143904, "epoch": 3426} {"train_loss": -6.794666290283203, "global_step": 143905, "epoch": 3426} {"train_loss": -6.832555294036865, "global_step": 143906, "epoch": 3426} {"train_loss": -6.830063343048096, "global_step": 143907, "epoch": 3426} {"train_loss": -6.911428451538086, "global_step": 143908, "epoch": 3426} {"train_loss": -6.799271583557129, "global_step": 143909, "epoch": 3426} {"train_loss": -6.78887939453125, "global_step": 143910, "epoch": 3426} {"train_loss": -6.941643238067627, "global_step": 143911, "epoch": 3426} {"train_loss": -6.9584879875183105, "global_step": 143912, "epoch": 3426} {"train_loss": -6.8380937576293945, "global_step": 143913, "epoch": 3426} {"train_loss": -6.729854583740234, "global_step": 143914, "epoch": 3426} {"train_loss": -6.800380706787109, "global_step": 143915, "epoch": 3426} {"train_loss": -6.981398582458496, "global_step": 143916, "epoch": 3426} {"train_loss": -6.781571388244629, "global_step": 143917, "epoch": 3426} {"train_loss": -6.778029441833496, "global_step": 143918, "epoch": 3426} {"train_loss": -6.841178894042969, "global_step": 143919, "epoch": 3426} {"train_loss": -6.815401077270508, "global_step": 143920, "epoch": 3426} {"train_loss": -6.741186141967773, "global_step": 143921, "epoch": 3426} {"train_loss": -6.773303985595703, "global_step": 143922, "epoch": 3426} {"train_loss": -6.783390045166016, "global_step": 143923, "epoch": 3426} {"train_loss": -6.876850605010986, "global_step": 143924, "epoch": 3426} {"train_loss": -6.8546552658081055, "global_step": 143925, "epoch": 3426} {"train_loss": -6.893624305725098, "global_step": 143926, "epoch": 3426} {"train_loss": -6.7559332847595215, "global_step": 143927, "epoch": 3426} {"train_loss": -6.805716037750244, "global_step": 143928, "epoch": 3426} {"train_loss": -6.763796329498291, "global_step": 143929, "epoch": 3426} {"train_loss": -6.804986476898193, "global_step": 143930, "epoch": 3426} {"train_loss": -6.794869422912598, "global_step": 143931, "epoch": 3426} {"train_loss": -6.792229652404785, "global_step": 143932, "epoch": 3426} {"train_loss": -6.820021890458607, "global_step": 143933, "epoch": 3426, "val_loss": 67438.0625} {"train_loss": -6.855257511138916, "global_step": 143934, "epoch": 3427} {"train_loss": -6.842257022857666, "global_step": 143935, "epoch": 3427} {"train_loss": -6.942740440368652, "global_step": 143936, "epoch": 3427} {"train_loss": -6.834875583648682, "global_step": 143937, "epoch": 3427} {"train_loss": -6.8664374351501465, "global_step": 143938, "epoch": 3427} {"train_loss": -6.890669345855713, "global_step": 143939, "epoch": 3427} {"train_loss": -6.987060546875, "global_step": 143940, "epoch": 3427} {"train_loss": -6.865439414978027, "global_step": 143941, "epoch": 3427} {"train_loss": -7.015302658081055, "global_step": 143942, "epoch": 3427} {"train_loss": -6.839848518371582, "global_step": 143943, "epoch": 3427} {"train_loss": -6.882494926452637, "global_step": 143944, "epoch": 3427} {"train_loss": -6.9331254959106445, "global_step": 143945, "epoch": 3427} {"train_loss": -6.930602073669434, "global_step": 143946, "epoch": 3427} {"train_loss": -6.801700592041016, "global_step": 143947, "epoch": 3427} {"train_loss": -6.866467475891113, "global_step": 143948, "epoch": 3427} {"train_loss": -6.838785171508789, "global_step": 143949, "epoch": 3427} {"train_loss": -6.882109642028809, "global_step": 143950, "epoch": 3427} {"train_loss": -6.859550476074219, "global_step": 143951, "epoch": 3427} {"train_loss": -6.853481292724609, "global_step": 143952, "epoch": 3427} {"train_loss": -6.918379306793213, "global_step": 143953, "epoch": 3427} {"train_loss": -6.89631462097168, "global_step": 143954, "epoch": 3427} {"train_loss": -6.783547401428223, "global_step": 143955, "epoch": 3427} {"train_loss": -6.8595871925354, "global_step": 143956, "epoch": 3427} {"train_loss": -6.803234577178955, "global_step": 143957, "epoch": 3427} {"train_loss": -6.843190670013428, "global_step": 143958, "epoch": 3427} {"train_loss": -6.863282203674316, "global_step": 143959, "epoch": 3427} {"train_loss": -6.71879243850708, "global_step": 143960, "epoch": 3427} {"train_loss": -6.795814514160156, "global_step": 143961, "epoch": 3427} {"train_loss": -6.782807350158691, "global_step": 143962, "epoch": 3427} {"train_loss": -6.835484504699707, "global_step": 143963, "epoch": 3427} {"train_loss": -6.761809349060059, "global_step": 143964, "epoch": 3427} {"train_loss": -6.887253761291504, "global_step": 143965, "epoch": 3427} {"train_loss": -6.795383930206299, "global_step": 143966, "epoch": 3427} {"train_loss": -6.799498081207275, "global_step": 143967, "epoch": 3427} {"train_loss": -6.755446910858154, "global_step": 143968, "epoch": 3427} {"train_loss": -6.811802864074707, "global_step": 143969, "epoch": 3427} {"train_loss": -6.877199649810791, "global_step": 143970, "epoch": 3427} {"train_loss": -6.843477249145508, "global_step": 143971, "epoch": 3427} {"train_loss": -6.714752197265625, "global_step": 143972, "epoch": 3427} {"train_loss": -6.789592742919922, "global_step": 143973, "epoch": 3427} {"train_loss": -6.770949363708496, "global_step": 143974, "epoch": 3427} {"train_loss": -6.846838179088774, "global_step": 143975, "epoch": 3427, "val_loss": 67660.265625} {"train_loss": -6.765366554260254, "global_step": 143976, "epoch": 3428} {"train_loss": -6.775332927703857, "global_step": 143977, "epoch": 3428} {"train_loss": -6.8200178146362305, "global_step": 143978, "epoch": 3428} {"train_loss": -6.774942874908447, "global_step": 143979, "epoch": 3428} {"train_loss": -6.753658294677734, "global_step": 143980, "epoch": 3428} {"train_loss": -6.846224308013916, "global_step": 143981, "epoch": 3428} {"train_loss": -6.77720832824707, "global_step": 143982, "epoch": 3428} {"train_loss": -6.629541873931885, "global_step": 143983, "epoch": 3428} {"train_loss": -6.748632907867432, "global_step": 143984, "epoch": 3428} {"train_loss": -6.689211845397949, "global_step": 143985, "epoch": 3428} {"train_loss": -6.684021472930908, "global_step": 143986, "epoch": 3428} {"train_loss": -6.697031021118164, "global_step": 143987, "epoch": 3428} {"train_loss": -6.764745235443115, "global_step": 143988, "epoch": 3428} {"train_loss": -6.89177131652832, "global_step": 143989, "epoch": 3428} {"train_loss": -6.7111992835998535, "global_step": 143990, "epoch": 3428} {"train_loss": -6.905973434448242, "global_step": 143991, "epoch": 3428} {"train_loss": -6.7490129470825195, "global_step": 143992, "epoch": 3428} {"train_loss": -6.89906120300293, "global_step": 143993, "epoch": 3428} {"train_loss": -6.789775848388672, "global_step": 143994, "epoch": 3428} {"train_loss": -6.8097944259643555, "global_step": 143995, "epoch": 3428} {"train_loss": -6.83542013168335, "global_step": 143996, "epoch": 3428} {"train_loss": -6.737807273864746, "global_step": 143997, "epoch": 3428} {"train_loss": -6.782681465148926, "global_step": 143998, "epoch": 3428} {"train_loss": -6.895169258117676, "global_step": 143999, "epoch": 3428} {"train_loss": -6.9677886962890625, "global_step": 144000, "epoch": 3428} {"train_loss": -6.89143180847168, "global_step": 144001, "epoch": 3428} {"train_loss": -6.805606842041016, "global_step": 144002, "epoch": 3428} {"train_loss": -6.956556797027588, "global_step": 144003, "epoch": 3428} {"train_loss": -6.664751052856445, "global_step": 144004, "epoch": 3428} {"train_loss": -6.895902633666992, "global_step": 144005, "epoch": 3428} {"train_loss": -6.761269569396973, "global_step": 144006, "epoch": 3428} {"train_loss": -6.808107376098633, "global_step": 144007, "epoch": 3428} {"train_loss": -6.688567638397217, "global_step": 144008, "epoch": 3428} {"train_loss": -6.782907962799072, "global_step": 144009, "epoch": 3428} {"train_loss": -6.702853679656982, "global_step": 144010, "epoch": 3428} {"train_loss": -6.65281343460083, "global_step": 144011, "epoch": 3428} {"train_loss": -6.788898468017578, "global_step": 144012, "epoch": 3428} {"train_loss": -6.796257972717285, "global_step": 144013, "epoch": 3428} {"train_loss": -6.662405014038086, "global_step": 144014, "epoch": 3428} {"train_loss": -6.812922954559326, "global_step": 144015, "epoch": 3428} {"train_loss": -6.739772796630859, "global_step": 144016, "epoch": 3428} {"train_loss": -6.775502261661348, "global_step": 144017, "epoch": 3428, "val_loss": 67634.5625} {"train_loss": -6.71384334564209, "global_step": 144018, "epoch": 3429} {"train_loss": -6.7729997634887695, "global_step": 144019, "epoch": 3429} {"train_loss": -6.74424934387207, "global_step": 144020, "epoch": 3429} {"train_loss": -6.72025203704834, "global_step": 144021, "epoch": 3429} {"train_loss": -6.77495002746582, "global_step": 144022, "epoch": 3429} {"train_loss": -6.825329780578613, "global_step": 144023, "epoch": 3429} {"train_loss": -6.82255744934082, "global_step": 144024, "epoch": 3429} {"train_loss": -6.737146377563477, "global_step": 144025, "epoch": 3429} {"train_loss": -6.6796064376831055, "global_step": 144026, "epoch": 3429} {"train_loss": -6.826493263244629, "global_step": 144027, "epoch": 3429} {"train_loss": -6.724912643432617, "global_step": 144028, "epoch": 3429} {"train_loss": -6.781102657318115, "global_step": 144029, "epoch": 3429} {"train_loss": -6.817398548126221, "global_step": 144030, "epoch": 3429} {"train_loss": -6.791706085205078, "global_step": 144031, "epoch": 3429} {"train_loss": -6.785750865936279, "global_step": 144032, "epoch": 3429} {"train_loss": -6.94127082824707, "global_step": 144033, "epoch": 3429} {"train_loss": -6.792629241943359, "global_step": 144034, "epoch": 3429} {"train_loss": -6.92790412902832, "global_step": 144035, "epoch": 3429} {"train_loss": -6.786342620849609, "global_step": 144036, "epoch": 3429} {"train_loss": -6.713237762451172, "global_step": 144037, "epoch": 3429} {"train_loss": -6.8480072021484375, "global_step": 144038, "epoch": 3429} {"train_loss": -6.763472080230713, "global_step": 144039, "epoch": 3429} {"train_loss": -6.778957366943359, "global_step": 144040, "epoch": 3429} {"train_loss": -6.80946159362793, "global_step": 144041, "epoch": 3429} {"train_loss": -6.718477725982666, "global_step": 144042, "epoch": 3429} {"train_loss": -6.792651176452637, "global_step": 144043, "epoch": 3429} {"train_loss": -6.929872512817383, "global_step": 144044, "epoch": 3429} {"train_loss": -6.77571964263916, "global_step": 144045, "epoch": 3429} {"train_loss": -6.907135009765625, "global_step": 144046, "epoch": 3429} {"train_loss": -6.849461555480957, "global_step": 144047, "epoch": 3429} {"train_loss": -6.739655494689941, "global_step": 144048, "epoch": 3429} {"train_loss": -6.759047508239746, "global_step": 144049, "epoch": 3429} {"train_loss": -6.797463893890381, "global_step": 144050, "epoch": 3429} {"train_loss": -6.7023396492004395, "global_step": 144051, "epoch": 3429} {"train_loss": -6.710223197937012, "global_step": 144052, "epoch": 3429} {"train_loss": -6.47364616394043, "global_step": 144053, "epoch": 3429} {"train_loss": -6.667267799377441, "global_step": 144054, "epoch": 3429} {"train_loss": -6.745025157928467, "global_step": 144055, "epoch": 3429} {"train_loss": -6.72357177734375, "global_step": 144056, "epoch": 3429} {"train_loss": -6.745007514953613, "global_step": 144057, "epoch": 3429} {"train_loss": -6.54646110534668, "global_step": 144058, "epoch": 3429} {"train_loss": -6.765543767384121, "global_step": 144059, "epoch": 3429, "val_loss": 67661.234375} {"train_loss": -6.7250823974609375, "global_step": 144060, "epoch": 3430} {"train_loss": -6.766792297363281, "global_step": 144061, "epoch": 3430} {"train_loss": -6.695502281188965, "global_step": 144062, "epoch": 3430} {"train_loss": -6.495327472686768, "global_step": 144063, "epoch": 3430} {"train_loss": -6.795550346374512, "global_step": 144064, "epoch": 3430} {"train_loss": -6.627002716064453, "global_step": 144065, "epoch": 3430} {"train_loss": -6.735506057739258, "global_step": 144066, "epoch": 3430} {"train_loss": -6.745408535003662, "global_step": 144067, "epoch": 3430} {"train_loss": -6.728847503662109, "global_step": 144068, "epoch": 3430} {"train_loss": -6.745475769042969, "global_step": 144069, "epoch": 3430} {"train_loss": -6.661663055419922, "global_step": 144070, "epoch": 3430} {"train_loss": -6.852176666259766, "global_step": 144071, "epoch": 3430} {"train_loss": -6.827297210693359, "global_step": 144072, "epoch": 3430} {"train_loss": -6.710912704467773, "global_step": 144073, "epoch": 3430} {"train_loss": -6.7293291091918945, "global_step": 144074, "epoch": 3430} {"train_loss": -6.8031110763549805, "global_step": 144075, "epoch": 3430} {"train_loss": -6.672018051147461, "global_step": 144076, "epoch": 3430} {"train_loss": -6.790932655334473, "global_step": 144077, "epoch": 3430} {"train_loss": -6.7903852462768555, "global_step": 144078, "epoch": 3430} {"train_loss": -6.721905708312988, "global_step": 144079, "epoch": 3430} {"train_loss": -6.6998395919799805, "global_step": 144080, "epoch": 3430} {"train_loss": -6.728598594665527, "global_step": 144081, "epoch": 3430} {"train_loss": -6.800527095794678, "global_step": 144082, "epoch": 3430} {"train_loss": -6.656989097595215, "global_step": 144083, "epoch": 3430} {"train_loss": -6.655603408813477, "global_step": 144084, "epoch": 3430} {"train_loss": -6.772908687591553, "global_step": 144085, "epoch": 3430} {"train_loss": -6.7205047607421875, "global_step": 144086, "epoch": 3430} {"train_loss": -6.754054069519043, "global_step": 144087, "epoch": 3430} {"train_loss": -6.578394889831543, "global_step": 144088, "epoch": 3430} {"train_loss": -6.849587440490723, "global_step": 144089, "epoch": 3430} {"train_loss": -6.750374794006348, "global_step": 144090, "epoch": 3430} {"train_loss": -6.787052631378174, "global_step": 144091, "epoch": 3430} {"train_loss": -6.784335136413574, "global_step": 144092, "epoch": 3430} {"train_loss": -6.83684778213501, "global_step": 144093, "epoch": 3430} {"train_loss": -6.773165702819824, "global_step": 144094, "epoch": 3430} {"train_loss": -6.896849632263184, "global_step": 144095, "epoch": 3430} {"train_loss": -6.885079383850098, "global_step": 144096, "epoch": 3430} {"train_loss": -6.688595771789551, "global_step": 144097, "epoch": 3430} {"train_loss": -6.7978715896606445, "global_step": 144098, "epoch": 3430} {"train_loss": -6.717528343200684, "global_step": 144099, "epoch": 3430} {"train_loss": -6.823206901550293, "global_step": 144100, "epoch": 3430} {"train_loss": -6.745513053167434, "global_step": 144101, "epoch": 3430, "val_loss": 67582.1875} {"train_loss": -6.721235275268555, "global_step": 144102, "epoch": 3431} {"train_loss": -6.836305618286133, "global_step": 144103, "epoch": 3431} {"train_loss": -6.6213531494140625, "global_step": 144104, "epoch": 3431} {"train_loss": -6.9371466636657715, "global_step": 144105, "epoch": 3431} {"train_loss": -6.813053607940674, "global_step": 144106, "epoch": 3431} {"train_loss": -6.803463935852051, "global_step": 144107, "epoch": 3431} {"train_loss": -6.815341472625732, "global_step": 144108, "epoch": 3431} {"train_loss": -6.789386749267578, "global_step": 144109, "epoch": 3431} {"train_loss": -6.730844020843506, "global_step": 144110, "epoch": 3431} {"train_loss": -6.839041233062744, "global_step": 144111, "epoch": 3431} {"train_loss": -6.646636962890625, "global_step": 144112, "epoch": 3431} {"train_loss": -6.837701320648193, "global_step": 144113, "epoch": 3431} {"train_loss": -6.815907955169678, "global_step": 144114, "epoch": 3431} {"train_loss": -6.752287864685059, "global_step": 144115, "epoch": 3431} {"train_loss": -6.725675582885742, "global_step": 144116, "epoch": 3431} {"train_loss": -6.795566558837891, "global_step": 144117, "epoch": 3431} {"train_loss": -6.850950717926025, "global_step": 144118, "epoch": 3431} {"train_loss": -6.643851280212402, "global_step": 144119, "epoch": 3431} {"train_loss": -6.801890850067139, "global_step": 144120, "epoch": 3431} {"train_loss": -6.8146772384643555, "global_step": 144121, "epoch": 3431} {"train_loss": -6.780536651611328, "global_step": 144122, "epoch": 3431} {"train_loss": -6.739621162414551, "global_step": 144123, "epoch": 3431} {"train_loss": -6.812437534332275, "global_step": 144124, "epoch": 3431} {"train_loss": -6.772996425628662, "global_step": 144125, "epoch": 3431} {"train_loss": -6.7782793045043945, "global_step": 144126, "epoch": 3431} {"train_loss": -6.883561134338379, "global_step": 144127, "epoch": 3431} {"train_loss": -6.838546276092529, "global_step": 144128, "epoch": 3431} {"train_loss": -6.881138801574707, "global_step": 144129, "epoch": 3431} {"train_loss": -6.871207237243652, "global_step": 144130, "epoch": 3431} {"train_loss": -6.863663196563721, "global_step": 144131, "epoch": 3431} {"train_loss": -6.801234722137451, "global_step": 144132, "epoch": 3431} {"train_loss": -6.831148147583008, "global_step": 144133, "epoch": 3431} {"train_loss": -6.779489517211914, "global_step": 144134, "epoch": 3431} {"train_loss": -6.922761917114258, "global_step": 144135, "epoch": 3431} {"train_loss": -6.89622163772583, "global_step": 144136, "epoch": 3431} {"train_loss": -6.847899913787842, "global_step": 144137, "epoch": 3431} {"train_loss": -6.887063026428223, "global_step": 144138, "epoch": 3431} {"train_loss": -6.889103889465332, "global_step": 144139, "epoch": 3431} {"train_loss": -6.807873725891113, "global_step": 144140, "epoch": 3431} {"train_loss": -6.933589458465576, "global_step": 144141, "epoch": 3431} {"train_loss": -6.876097679138184, "global_step": 144142, "epoch": 3431} {"train_loss": -6.813195296696255, "global_step": 144143, "epoch": 3431, "val_loss": 67618.4921875} {"train_loss": -6.829990386962891, "global_step": 144144, "epoch": 3432} {"train_loss": -6.841815948486328, "global_step": 144145, "epoch": 3432} {"train_loss": -6.918020248413086, "global_step": 144146, "epoch": 3432} {"train_loss": -6.91452693939209, "global_step": 144147, "epoch": 3432} {"train_loss": -6.800288677215576, "global_step": 144148, "epoch": 3432} {"train_loss": -6.787528038024902, "global_step": 144149, "epoch": 3432} {"train_loss": -6.861028671264648, "global_step": 144150, "epoch": 3432} {"train_loss": -6.888299465179443, "global_step": 144151, "epoch": 3432} {"train_loss": -6.854933261871338, "global_step": 144152, "epoch": 3432} {"train_loss": -6.862048149108887, "global_step": 144153, "epoch": 3432} {"train_loss": -6.803269863128662, "global_step": 144154, "epoch": 3432} {"train_loss": -6.861853122711182, "global_step": 144155, "epoch": 3432} {"train_loss": -6.734185695648193, "global_step": 144156, "epoch": 3432} {"train_loss": -6.857548713684082, "global_step": 144157, "epoch": 3432} {"train_loss": -6.743494033813477, "global_step": 144158, "epoch": 3432} {"train_loss": -6.766050815582275, "global_step": 144159, "epoch": 3432} {"train_loss": -6.888427734375, "global_step": 144160, "epoch": 3432} {"train_loss": -6.744937896728516, "global_step": 144161, "epoch": 3432} {"train_loss": -6.848115921020508, "global_step": 144162, "epoch": 3432} {"train_loss": -6.785064697265625, "global_step": 144163, "epoch": 3432} {"train_loss": -6.7916789054870605, "global_step": 144164, "epoch": 3432} {"train_loss": -6.7791242599487305, "global_step": 144165, "epoch": 3432} {"train_loss": -6.765962600708008, "global_step": 144166, "epoch": 3432} {"train_loss": -6.793635845184326, "global_step": 144167, "epoch": 3432} {"train_loss": -6.8605804443359375, "global_step": 144168, "epoch": 3432} {"train_loss": -6.736265659332275, "global_step": 144169, "epoch": 3432} {"train_loss": -6.774422645568848, "global_step": 144170, "epoch": 3432} {"train_loss": -6.834466934204102, "global_step": 144171, "epoch": 3432} {"train_loss": -6.7974853515625, "global_step": 144172, "epoch": 3432} {"train_loss": -6.794351100921631, "global_step": 144173, "epoch": 3432} {"train_loss": -6.771585464477539, "global_step": 144174, "epoch": 3432} {"train_loss": -6.887823104858398, "global_step": 144175, "epoch": 3432} {"train_loss": -6.764225959777832, "global_step": 144176, "epoch": 3432} {"train_loss": -6.809762001037598, "global_step": 144177, "epoch": 3432} {"train_loss": -6.897620677947998, "global_step": 144178, "epoch": 3432} {"train_loss": -6.870589256286621, "global_step": 144179, "epoch": 3432} {"train_loss": -6.771280288696289, "global_step": 144180, "epoch": 3432} {"train_loss": -6.823537349700928, "global_step": 144181, "epoch": 3432} {"train_loss": -6.88763427734375, "global_step": 144182, "epoch": 3432} {"train_loss": -6.8416876792907715, "global_step": 144183, "epoch": 3432} {"train_loss": -6.906033039093018, "global_step": 144184, "epoch": 3432} {"train_loss": -6.823073500678653, "global_step": 144185, "epoch": 3432, "val_loss": 67700.4375} {"train_loss": -6.857775688171387, "global_step": 144186, "epoch": 3433} {"train_loss": -6.702704429626465, "global_step": 144187, "epoch": 3433} {"train_loss": -6.869028091430664, "global_step": 144188, "epoch": 3433} {"train_loss": -6.856554985046387, "global_step": 144189, "epoch": 3433} {"train_loss": -6.804016590118408, "global_step": 144190, "epoch": 3433} {"train_loss": -6.803606033325195, "global_step": 144191, "epoch": 3433} {"train_loss": -6.845314979553223, "global_step": 144192, "epoch": 3433} {"train_loss": -6.936628818511963, "global_step": 144193, "epoch": 3433} {"train_loss": -6.791845798492432, "global_step": 144194, "epoch": 3433} {"train_loss": -6.710582733154297, "global_step": 144195, "epoch": 3433} {"train_loss": -6.795111656188965, "global_step": 144196, "epoch": 3433} {"train_loss": -6.80307674407959, "global_step": 144197, "epoch": 3433} {"train_loss": -6.749034881591797, "global_step": 144198, "epoch": 3433} {"train_loss": -6.714028358459473, "global_step": 144199, "epoch": 3433} {"train_loss": -6.665907859802246, "global_step": 144200, "epoch": 3433} {"train_loss": -6.694679260253906, "global_step": 144201, "epoch": 3433} {"train_loss": -6.795238971710205, "global_step": 144202, "epoch": 3433} {"train_loss": -6.688104629516602, "global_step": 144203, "epoch": 3433} {"train_loss": -6.761019229888916, "global_step": 144204, "epoch": 3433} {"train_loss": -6.838898181915283, "global_step": 144205, "epoch": 3433} {"train_loss": -6.669933319091797, "global_step": 144206, "epoch": 3433} {"train_loss": -6.761049270629883, "global_step": 144207, "epoch": 3433} {"train_loss": -6.614562034606934, "global_step": 144208, "epoch": 3433} {"train_loss": -6.801200866699219, "global_step": 144209, "epoch": 3433} {"train_loss": -6.668139457702637, "global_step": 144210, "epoch": 3433} {"train_loss": -6.791201591491699, "global_step": 144211, "epoch": 3433} {"train_loss": -6.675237655639648, "global_step": 144212, "epoch": 3433} {"train_loss": -6.6859941482543945, "global_step": 144213, "epoch": 3433} {"train_loss": -6.699448585510254, "global_step": 144214, "epoch": 3433} {"train_loss": -6.685980796813965, "global_step": 144215, "epoch": 3433} {"train_loss": -6.701928615570068, "global_step": 144216, "epoch": 3433} {"train_loss": -6.701096534729004, "global_step": 144217, "epoch": 3433} {"train_loss": -6.743712425231934, "global_step": 144218, "epoch": 3433} {"train_loss": -6.769817352294922, "global_step": 144219, "epoch": 3433} {"train_loss": -6.775533676147461, "global_step": 144220, "epoch": 3433} {"train_loss": -6.731751918792725, "global_step": 144221, "epoch": 3433} {"train_loss": -6.8545427322387695, "global_step": 144222, "epoch": 3433} {"train_loss": -6.7810869216918945, "global_step": 144223, "epoch": 3433} {"train_loss": -6.792970657348633, "global_step": 144224, "epoch": 3433} {"train_loss": -6.797034740447998, "global_step": 144225, "epoch": 3433} {"train_loss": -6.847598552703857, "global_step": 144226, "epoch": 3433} {"train_loss": -6.765644073486328, "global_step": 144227, "epoch": 3433, "val_loss": 67582.015625} {"train_loss": -6.893268585205078, "global_step": 144228, "epoch": 3434} {"train_loss": -6.804682731628418, "global_step": 144229, "epoch": 3434} {"train_loss": -6.783030986785889, "global_step": 144230, "epoch": 3434} {"train_loss": -6.806215286254883, "global_step": 144231, "epoch": 3434} {"train_loss": -6.91747522354126, "global_step": 144232, "epoch": 3434} {"train_loss": -6.93376350402832, "global_step": 144233, "epoch": 3434} {"train_loss": -6.787835121154785, "global_step": 144234, "epoch": 3434} {"train_loss": -6.867448329925537, "global_step": 144235, "epoch": 3434} {"train_loss": -6.801987648010254, "global_step": 144236, "epoch": 3434} {"train_loss": -6.851206302642822, "global_step": 144237, "epoch": 3434} {"train_loss": -6.813932418823242, "global_step": 144238, "epoch": 3434} {"train_loss": -6.78513240814209, "global_step": 144239, "epoch": 3434} {"train_loss": -6.83585786819458, "global_step": 144240, "epoch": 3434} {"train_loss": -6.827614784240723, "global_step": 144241, "epoch": 3434} {"train_loss": -6.809968948364258, "global_step": 144242, "epoch": 3434} {"train_loss": -6.872718811035156, "global_step": 144243, "epoch": 3434} {"train_loss": -6.741629600524902, "global_step": 144244, "epoch": 3434} {"train_loss": -6.899944305419922, "global_step": 144245, "epoch": 3434} {"train_loss": -6.76912260055542, "global_step": 144246, "epoch": 3434} {"train_loss": -6.733220100402832, "global_step": 144247, "epoch": 3434} {"train_loss": -6.866991996765137, "global_step": 144248, "epoch": 3434} {"train_loss": -6.756219863891602, "global_step": 144249, "epoch": 3434} {"train_loss": -6.78036642074585, "global_step": 144250, "epoch": 3434} {"train_loss": -6.811496734619141, "global_step": 144251, "epoch": 3434} {"train_loss": -6.764883041381836, "global_step": 144252, "epoch": 3434} {"train_loss": -6.794063091278076, "global_step": 144253, "epoch": 3434} {"train_loss": -6.908376693725586, "global_step": 144254, "epoch": 3434} {"train_loss": -6.81964635848999, "global_step": 144255, "epoch": 3434} {"train_loss": -6.802072525024414, "global_step": 144256, "epoch": 3434} {"train_loss": -6.860471725463867, "global_step": 144257, "epoch": 3434} {"train_loss": -6.830735206604004, "global_step": 144258, "epoch": 3434} {"train_loss": -6.82028865814209, "global_step": 144259, "epoch": 3434} {"train_loss": -6.907849311828613, "global_step": 144260, "epoch": 3434} {"train_loss": -6.838263511657715, "global_step": 144261, "epoch": 3434} {"train_loss": -6.817163467407227, "global_step": 144262, "epoch": 3434} {"train_loss": -6.896791934967041, "global_step": 144263, "epoch": 3434} {"train_loss": -6.907060623168945, "global_step": 144264, "epoch": 3434} {"train_loss": -6.826786994934082, "global_step": 144265, "epoch": 3434} {"train_loss": -6.873368263244629, "global_step": 144266, "epoch": 3434} {"train_loss": -6.899239540100098, "global_step": 144267, "epoch": 3434} {"train_loss": -6.929358959197998, "global_step": 144268, "epoch": 3434} {"train_loss": -6.835908526466007, "global_step": 144269, "epoch": 3434, "val_loss": 67608.3671875} {"train_loss": -6.757694721221924, "global_step": 144270, "epoch": 3435} {"train_loss": -6.667214870452881, "global_step": 144271, "epoch": 3435} {"train_loss": -6.863692283630371, "global_step": 144272, "epoch": 3435} {"train_loss": -6.7756757736206055, "global_step": 144273, "epoch": 3435} {"train_loss": -6.775774955749512, "global_step": 144274, "epoch": 3435} {"train_loss": -6.81828498840332, "global_step": 144275, "epoch": 3435} {"train_loss": -6.84981632232666, "global_step": 144276, "epoch": 3435} {"train_loss": -6.749382019042969, "global_step": 144277, "epoch": 3435} {"train_loss": -6.676600456237793, "global_step": 144278, "epoch": 3435} {"train_loss": -6.900318145751953, "global_step": 144279, "epoch": 3435} {"train_loss": -6.8043084144592285, "global_step": 144280, "epoch": 3435} {"train_loss": -6.650561809539795, "global_step": 144281, "epoch": 3435} {"train_loss": -6.8163557052612305, "global_step": 144282, "epoch": 3435} {"train_loss": -6.8408308029174805, "global_step": 144283, "epoch": 3435} {"train_loss": -6.760687828063965, "global_step": 144284, "epoch": 3435} {"train_loss": -6.705475807189941, "global_step": 144285, "epoch": 3435} {"train_loss": -6.803750038146973, "global_step": 144286, "epoch": 3435} {"train_loss": -6.75800085067749, "global_step": 144287, "epoch": 3435} {"train_loss": -6.866122245788574, "global_step": 144288, "epoch": 3435} {"train_loss": -6.82462739944458, "global_step": 144289, "epoch": 3435} {"train_loss": -6.793891906738281, "global_step": 144290, "epoch": 3435} {"train_loss": -6.814682960510254, "global_step": 144291, "epoch": 3435} {"train_loss": -6.813514232635498, "global_step": 144292, "epoch": 3435} {"train_loss": -6.792820930480957, "global_step": 144293, "epoch": 3435} {"train_loss": -6.879156112670898, "global_step": 144294, "epoch": 3435} {"train_loss": -6.881888389587402, "global_step": 144295, "epoch": 3435} {"train_loss": -6.880390644073486, "global_step": 144296, "epoch": 3435} {"train_loss": -6.838458061218262, "global_step": 144297, "epoch": 3435} {"train_loss": -6.796506404876709, "global_step": 144298, "epoch": 3435} {"train_loss": -6.766138076782227, "global_step": 144299, "epoch": 3435} {"train_loss": -6.850949287414551, "global_step": 144300, "epoch": 3435} {"train_loss": -6.7612690925598145, "global_step": 144301, "epoch": 3435} {"train_loss": -6.796622276306152, "global_step": 144302, "epoch": 3435} {"train_loss": -6.776252746582031, "global_step": 144303, "epoch": 3435} {"train_loss": -6.794624328613281, "global_step": 144304, "epoch": 3435} {"train_loss": -6.73200798034668, "global_step": 144305, "epoch": 3435} {"train_loss": -6.670762062072754, "global_step": 144306, "epoch": 3435} {"train_loss": -6.767158508300781, "global_step": 144307, "epoch": 3435} {"train_loss": -6.766158103942871, "global_step": 144308, "epoch": 3435} {"train_loss": -6.79583740234375, "global_step": 144309, "epoch": 3435} {"train_loss": -6.773480415344238, "global_step": 144310, "epoch": 3435} {"train_loss": -6.7902514934539795, "global_step": 144311, "epoch": 3435, "val_loss": 67679.4453125} {"train_loss": -6.7719597816467285, "global_step": 144312, "epoch": 3436} {"train_loss": -6.681385040283203, "global_step": 144313, "epoch": 3436} {"train_loss": -6.724862575531006, "global_step": 144314, "epoch": 3436} {"train_loss": -6.754560470581055, "global_step": 144315, "epoch": 3436} {"train_loss": -6.748276233673096, "global_step": 144316, "epoch": 3436} {"train_loss": -6.649781703948975, "global_step": 144317, "epoch": 3436} {"train_loss": -6.768239974975586, "global_step": 144318, "epoch": 3436} {"train_loss": -6.635141849517822, "global_step": 144319, "epoch": 3436} {"train_loss": -6.665716648101807, "global_step": 144320, "epoch": 3436} {"train_loss": -6.852045059204102, "global_step": 144321, "epoch": 3436} {"train_loss": -6.608323097229004, "global_step": 144322, "epoch": 3436} {"train_loss": -6.693412780761719, "global_step": 144323, "epoch": 3436} {"train_loss": -6.674893856048584, "global_step": 144324, "epoch": 3436} {"train_loss": -6.7568769454956055, "global_step": 144325, "epoch": 3436} {"train_loss": -6.723132610321045, "global_step": 144326, "epoch": 3436} {"train_loss": -6.756211280822754, "global_step": 144327, "epoch": 3436} {"train_loss": -6.851322650909424, "global_step": 144328, "epoch": 3436} {"train_loss": -6.639516353607178, "global_step": 144329, "epoch": 3436} {"train_loss": -6.797971725463867, "global_step": 144330, "epoch": 3436} {"train_loss": -6.7303690910339355, "global_step": 144331, "epoch": 3436} {"train_loss": -6.714081764221191, "global_step": 144332, "epoch": 3436} {"train_loss": -6.796375751495361, "global_step": 144333, "epoch": 3436} {"train_loss": -6.715405464172363, "global_step": 144334, "epoch": 3436} {"train_loss": -6.701015472412109, "global_step": 144335, "epoch": 3436} {"train_loss": -6.760138511657715, "global_step": 144336, "epoch": 3436} {"train_loss": -6.6591796875, "global_step": 144337, "epoch": 3436} {"train_loss": -6.828413963317871, "global_step": 144338, "epoch": 3436} {"train_loss": -6.829161643981934, "global_step": 144339, "epoch": 3436} {"train_loss": -6.828100681304932, "global_step": 144340, "epoch": 3436} {"train_loss": -6.7588090896606445, "global_step": 144341, "epoch": 3436} {"train_loss": -6.679542541503906, "global_step": 144342, "epoch": 3436} {"train_loss": -6.802262306213379, "global_step": 144343, "epoch": 3436} {"train_loss": -6.747556686401367, "global_step": 144344, "epoch": 3436} {"train_loss": -6.7606892585754395, "global_step": 144345, "epoch": 3436} {"train_loss": -6.805994987487793, "global_step": 144346, "epoch": 3436} {"train_loss": -6.743838787078857, "global_step": 144347, "epoch": 3436} {"train_loss": -6.777127742767334, "global_step": 144348, "epoch": 3436} {"train_loss": -6.809281349182129, "global_step": 144349, "epoch": 3436} {"train_loss": -6.854625225067139, "global_step": 144350, "epoch": 3436} {"train_loss": -6.873390197753906, "global_step": 144351, "epoch": 3436} {"train_loss": -6.677550792694092, "global_step": 144352, "epoch": 3436} {"train_loss": -6.747529563449678, "global_step": 144353, "epoch": 3436, "val_loss": 67445.4609375} {"train_loss": -6.860367774963379, "global_step": 144354, "epoch": 3437} {"train_loss": -6.725855827331543, "global_step": 144355, "epoch": 3437} {"train_loss": -6.70916748046875, "global_step": 144356, "epoch": 3437} {"train_loss": -6.802165985107422, "global_step": 144357, "epoch": 3437} {"train_loss": -6.68956184387207, "global_step": 144358, "epoch": 3437} {"train_loss": -6.719393730163574, "global_step": 144359, "epoch": 3437} {"train_loss": -6.922577857971191, "global_step": 144360, "epoch": 3437} {"train_loss": -6.725663185119629, "global_step": 144361, "epoch": 3437} {"train_loss": -6.90624475479126, "global_step": 144362, "epoch": 3437} {"train_loss": -6.795102119445801, "global_step": 144363, "epoch": 3437} {"train_loss": -6.718994617462158, "global_step": 144364, "epoch": 3437} {"train_loss": -6.710282802581787, "global_step": 144365, "epoch": 3437} {"train_loss": -6.844202518463135, "global_step": 144366, "epoch": 3437} {"train_loss": -6.747118949890137, "global_step": 144367, "epoch": 3437} {"train_loss": -6.859696388244629, "global_step": 144368, "epoch": 3437} {"train_loss": -6.904796600341797, "global_step": 144369, "epoch": 3437} {"train_loss": -6.717362403869629, "global_step": 144370, "epoch": 3437} {"train_loss": -6.829993724822998, "global_step": 144371, "epoch": 3437} {"train_loss": -6.837135314941406, "global_step": 144372, "epoch": 3437} {"train_loss": -6.774946689605713, "global_step": 144373, "epoch": 3437} {"train_loss": -6.685079574584961, "global_step": 144374, "epoch": 3437} {"train_loss": -6.800983428955078, "global_step": 144375, "epoch": 3437} {"train_loss": -6.858723163604736, "global_step": 144376, "epoch": 3437} {"train_loss": -6.857485771179199, "global_step": 144377, "epoch": 3437} {"train_loss": -6.7011613845825195, "global_step": 144378, "epoch": 3437} {"train_loss": -6.789313793182373, "global_step": 144379, "epoch": 3437} {"train_loss": -6.822357177734375, "global_step": 144380, "epoch": 3437} {"train_loss": -6.8143768310546875, "global_step": 144381, "epoch": 3437} {"train_loss": -6.791382789611816, "global_step": 144382, "epoch": 3437} {"train_loss": -6.899405002593994, "global_step": 144383, "epoch": 3437} {"train_loss": -6.803085803985596, "global_step": 144384, "epoch": 3437} {"train_loss": -6.900895118713379, "global_step": 144385, "epoch": 3437} {"train_loss": -6.760673999786377, "global_step": 144386, "epoch": 3437} {"train_loss": -6.792232513427734, "global_step": 144387, "epoch": 3437} {"train_loss": -6.876083850860596, "global_step": 144388, "epoch": 3437} {"train_loss": -6.833589553833008, "global_step": 144389, "epoch": 3437} {"train_loss": -6.775820732116699, "global_step": 144390, "epoch": 3437} {"train_loss": -6.884054183959961, "global_step": 144391, "epoch": 3437} {"train_loss": -6.851187705993652, "global_step": 144392, "epoch": 3437} {"train_loss": -6.851674556732178, "global_step": 144393, "epoch": 3437} {"train_loss": -6.723170280456543, "global_step": 144394, "epoch": 3437} {"train_loss": -6.801528453826904, "global_step": 144395, "epoch": 3437, "val_loss": 67732.0390625} {"train_loss": -6.810493469238281, "global_step": 144396, "epoch": 3438} {"train_loss": -6.8585205078125, "global_step": 144397, "epoch": 3438} {"train_loss": -6.727611064910889, "global_step": 144398, "epoch": 3438} {"train_loss": -6.782207489013672, "global_step": 144399, "epoch": 3438} {"train_loss": -6.749363899230957, "global_step": 144400, "epoch": 3438} {"train_loss": -6.737575531005859, "global_step": 144401, "epoch": 3438} {"train_loss": -6.818565368652344, "global_step": 144402, "epoch": 3438} {"train_loss": -6.863360404968262, "global_step": 144403, "epoch": 3438} {"train_loss": -6.837709426879883, "global_step": 144404, "epoch": 3438} {"train_loss": -6.720911979675293, "global_step": 144405, "epoch": 3438} {"train_loss": -6.79328727722168, "global_step": 144406, "epoch": 3438} {"train_loss": -6.786517143249512, "global_step": 144407, "epoch": 3438} {"train_loss": -6.853918075561523, "global_step": 144408, "epoch": 3438} {"train_loss": -6.835915565490723, "global_step": 144409, "epoch": 3438} {"train_loss": -6.736855983734131, "global_step": 144410, "epoch": 3438} {"train_loss": -6.856723785400391, "global_step": 144411, "epoch": 3438} {"train_loss": -6.787464141845703, "global_step": 144412, "epoch": 3438} {"train_loss": -6.8925275802612305, "global_step": 144413, "epoch": 3438} {"train_loss": -6.815789222717285, "global_step": 144414, "epoch": 3438} {"train_loss": -6.740719318389893, "global_step": 144415, "epoch": 3438} {"train_loss": -6.721168518066406, "global_step": 144416, "epoch": 3438} {"train_loss": -6.505953311920166, "global_step": 144417, "epoch": 3438} {"train_loss": -6.679218292236328, "global_step": 144418, "epoch": 3438} {"train_loss": -6.6967902183532715, "global_step": 144419, "epoch": 3438} {"train_loss": -6.76950216293335, "global_step": 144420, "epoch": 3438} {"train_loss": -6.763516426086426, "global_step": 144421, "epoch": 3438} {"train_loss": -6.736825466156006, "global_step": 144422, "epoch": 3438} {"train_loss": -6.875837326049805, "global_step": 144423, "epoch": 3438} {"train_loss": -6.825586318969727, "global_step": 144424, "epoch": 3438} {"train_loss": -6.825170993804932, "global_step": 144425, "epoch": 3438} {"train_loss": -6.788547515869141, "global_step": 144426, "epoch": 3438} {"train_loss": -6.803665637969971, "global_step": 144427, "epoch": 3438} {"train_loss": -6.854950428009033, "global_step": 144428, "epoch": 3438} {"train_loss": -6.837197303771973, "global_step": 144429, "epoch": 3438} {"train_loss": -6.702419281005859, "global_step": 144430, "epoch": 3438} {"train_loss": -6.815333366394043, "global_step": 144431, "epoch": 3438} {"train_loss": -6.79384708404541, "global_step": 144432, "epoch": 3438} {"train_loss": -6.694689750671387, "global_step": 144433, "epoch": 3438} {"train_loss": -6.75578498840332, "global_step": 144434, "epoch": 3438} {"train_loss": -6.733470439910889, "global_step": 144435, "epoch": 3438} {"train_loss": -6.727816581726074, "global_step": 144436, "epoch": 3438} {"train_loss": -6.779800823756626, "global_step": 144437, "epoch": 3438, "val_loss": 68084.3984375} {"train_loss": -6.744627952575684, "global_step": 144438, "epoch": 3439} {"train_loss": -6.545466423034668, "global_step": 144439, "epoch": 3439} {"train_loss": -6.558648586273193, "global_step": 144440, "epoch": 3439} {"train_loss": -6.876225471496582, "global_step": 144441, "epoch": 3439} {"train_loss": -6.552181243896484, "global_step": 144442, "epoch": 3439} {"train_loss": -6.739392280578613, "global_step": 144443, "epoch": 3439} {"train_loss": -6.657252311706543, "global_step": 144444, "epoch": 3439} {"train_loss": -6.623795986175537, "global_step": 144445, "epoch": 3439} {"train_loss": -6.704418659210205, "global_step": 144446, "epoch": 3439} {"train_loss": -6.703001976013184, "global_step": 144447, "epoch": 3439} {"train_loss": -6.779211044311523, "global_step": 144448, "epoch": 3439} {"train_loss": -6.773587226867676, "global_step": 144449, "epoch": 3439} {"train_loss": -6.73297119140625, "global_step": 144450, "epoch": 3439} {"train_loss": -6.744543552398682, "global_step": 144451, "epoch": 3439} {"train_loss": -6.830752372741699, "global_step": 144452, "epoch": 3439} {"train_loss": -6.803475379943848, "global_step": 144453, "epoch": 3439} {"train_loss": -6.7170023918151855, "global_step": 144454, "epoch": 3439} {"train_loss": -6.842047691345215, "global_step": 144455, "epoch": 3439} {"train_loss": -6.701094627380371, "global_step": 144456, "epoch": 3439} {"train_loss": -6.949160575866699, "global_step": 144457, "epoch": 3439} {"train_loss": -6.656890869140625, "global_step": 144458, "epoch": 3439} {"train_loss": -6.712737083435059, "global_step": 144459, "epoch": 3439} {"train_loss": -6.8135786056518555, "global_step": 144460, "epoch": 3439} {"train_loss": -6.704170227050781, "global_step": 144461, "epoch": 3439} {"train_loss": -6.852092742919922, "global_step": 144462, "epoch": 3439} {"train_loss": -6.867303848266602, "global_step": 144463, "epoch": 3439} {"train_loss": -6.83582878112793, "global_step": 144464, "epoch": 3439} {"train_loss": -6.598433494567871, "global_step": 144465, "epoch": 3439} {"train_loss": -6.861939430236816, "global_step": 144466, "epoch": 3439} {"train_loss": -6.870173454284668, "global_step": 144467, "epoch": 3439} {"train_loss": -6.910545349121094, "global_step": 144468, "epoch": 3439} {"train_loss": -6.887639999389648, "global_step": 144469, "epoch": 3439} {"train_loss": -6.8565673828125, "global_step": 144470, "epoch": 3439} {"train_loss": -6.838013648986816, "global_step": 144471, "epoch": 3439} {"train_loss": -6.775442123413086, "global_step": 144472, "epoch": 3439} {"train_loss": -6.884760856628418, "global_step": 144473, "epoch": 3439} {"train_loss": -6.815532684326172, "global_step": 144474, "epoch": 3439} {"train_loss": -6.78336238861084, "global_step": 144475, "epoch": 3439} {"train_loss": -6.8290300369262695, "global_step": 144476, "epoch": 3439} {"train_loss": -6.8676323890686035, "global_step": 144477, "epoch": 3439} {"train_loss": -6.770171642303467, "global_step": 144478, "epoch": 3439} {"train_loss": -6.770932118097941, "global_step": 144479, "epoch": 3439, "val_loss": 67516.765625} {"train_loss": -6.833477020263672, "global_step": 144480, "epoch": 3440} {"train_loss": -6.724170684814453, "global_step": 144481, "epoch": 3440} {"train_loss": -6.821467399597168, "global_step": 144482, "epoch": 3440} {"train_loss": -6.69534158706665, "global_step": 144483, "epoch": 3440} {"train_loss": -6.656469345092773, "global_step": 144484, "epoch": 3440} {"train_loss": -6.847506523132324, "global_step": 144485, "epoch": 3440} {"train_loss": -6.764218330383301, "global_step": 144486, "epoch": 3440} {"train_loss": -6.853728771209717, "global_step": 144487, "epoch": 3440} {"train_loss": -6.806964874267578, "global_step": 144488, "epoch": 3440} {"train_loss": -6.644634246826172, "global_step": 144489, "epoch": 3440} {"train_loss": -6.860939025878906, "global_step": 144490, "epoch": 3440} {"train_loss": -6.787125587463379, "global_step": 144491, "epoch": 3440} {"train_loss": -6.763339042663574, "global_step": 144492, "epoch": 3440} {"train_loss": -6.869626045227051, "global_step": 144493, "epoch": 3440} {"train_loss": -6.832624435424805, "global_step": 144494, "epoch": 3440} {"train_loss": -6.8668532371521, "global_step": 144495, "epoch": 3440} {"train_loss": -6.726850509643555, "global_step": 144496, "epoch": 3440} {"train_loss": -6.758427619934082, "global_step": 144497, "epoch": 3440} {"train_loss": -6.810952663421631, "global_step": 144498, "epoch": 3440} {"train_loss": -6.7702412605285645, "global_step": 144499, "epoch": 3440} {"train_loss": -6.862124443054199, "global_step": 144500, "epoch": 3440} {"train_loss": -6.676568984985352, "global_step": 144501, "epoch": 3440} {"train_loss": -6.746340751647949, "global_step": 144502, "epoch": 3440} {"train_loss": -6.772408485412598, "global_step": 144503, "epoch": 3440} {"train_loss": -6.778740882873535, "global_step": 144504, "epoch": 3440} {"train_loss": -6.736114025115967, "global_step": 144505, "epoch": 3440} {"train_loss": -6.808396816253662, "global_step": 144506, "epoch": 3440} {"train_loss": -6.696571350097656, "global_step": 144507, "epoch": 3440} {"train_loss": -6.836104393005371, "global_step": 144508, "epoch": 3440} {"train_loss": -6.610424041748047, "global_step": 144509, "epoch": 3440} {"train_loss": -6.632925033569336, "global_step": 144510, "epoch": 3440} {"train_loss": -6.766262054443359, "global_step": 144511, "epoch": 3440} {"train_loss": -6.613451957702637, "global_step": 144512, "epoch": 3440} {"train_loss": -6.675835609436035, "global_step": 144513, "epoch": 3440} {"train_loss": -6.930951118469238, "global_step": 144514, "epoch": 3440} {"train_loss": -6.8268280029296875, "global_step": 144515, "epoch": 3440} {"train_loss": -6.775767803192139, "global_step": 144516, "epoch": 3440} {"train_loss": -6.829750061035156, "global_step": 144517, "epoch": 3440} {"train_loss": -6.722959041595459, "global_step": 144518, "epoch": 3440} {"train_loss": -6.718204021453857, "global_step": 144519, "epoch": 3440} {"train_loss": -6.804880142211914, "global_step": 144520, "epoch": 3440} {"train_loss": -6.768467903137207, "global_step": 144521, "epoch": 3440, "val_loss": 67672.3046875} {"train_loss": -6.87232780456543, "global_step": 144522, "epoch": 3441} {"train_loss": -6.826791763305664, "global_step": 144523, "epoch": 3441} {"train_loss": -6.776083946228027, "global_step": 144524, "epoch": 3441} {"train_loss": -6.776147842407227, "global_step": 144525, "epoch": 3441} {"train_loss": -6.853876113891602, "global_step": 144526, "epoch": 3441} {"train_loss": -6.870388984680176, "global_step": 144527, "epoch": 3441} {"train_loss": -6.824284076690674, "global_step": 144528, "epoch": 3441} {"train_loss": -6.827592372894287, "global_step": 144529, "epoch": 3441} {"train_loss": -7.000703811645508, "global_step": 144530, "epoch": 3441} {"train_loss": -6.824726104736328, "global_step": 144531, "epoch": 3441} {"train_loss": -6.941615104675293, "global_step": 144532, "epoch": 3441} {"train_loss": -6.78367805480957, "global_step": 144533, "epoch": 3441} {"train_loss": -6.948136329650879, "global_step": 144534, "epoch": 3441} {"train_loss": -6.869414806365967, "global_step": 144535, "epoch": 3441} {"train_loss": -6.76171875, "global_step": 144536, "epoch": 3441} {"train_loss": -6.847206115722656, "global_step": 144537, "epoch": 3441} {"train_loss": -6.9496049880981445, "global_step": 144538, "epoch": 3441} {"train_loss": -6.7615580558776855, "global_step": 144539, "epoch": 3441} {"train_loss": -6.718354225158691, "global_step": 144540, "epoch": 3441} {"train_loss": -6.776738166809082, "global_step": 144541, "epoch": 3441} {"train_loss": -6.775643825531006, "global_step": 144542, "epoch": 3441} {"train_loss": -6.712292671203613, "global_step": 144543, "epoch": 3441} {"train_loss": -6.8492889404296875, "global_step": 144544, "epoch": 3441} {"train_loss": -6.735223770141602, "global_step": 144545, "epoch": 3441} {"train_loss": -6.8488054275512695, "global_step": 144546, "epoch": 3441} {"train_loss": -6.716462135314941, "global_step": 144547, "epoch": 3441} {"train_loss": -6.7390546798706055, "global_step": 144548, "epoch": 3441} {"train_loss": -6.716350078582764, "global_step": 144549, "epoch": 3441} {"train_loss": -6.8229875564575195, "global_step": 144550, "epoch": 3441} {"train_loss": -6.842002868652344, "global_step": 144551, "epoch": 3441} {"train_loss": -6.787289142608643, "global_step": 144552, "epoch": 3441} {"train_loss": -6.774303436279297, "global_step": 144553, "epoch": 3441} {"train_loss": -6.9548821449279785, "global_step": 144554, "epoch": 3441} {"train_loss": -6.783497333526611, "global_step": 144555, "epoch": 3441} {"train_loss": -6.818563461303711, "global_step": 144556, "epoch": 3441} {"train_loss": -6.833032131195068, "global_step": 144557, "epoch": 3441} {"train_loss": -6.7899169921875, "global_step": 144558, "epoch": 3441} {"train_loss": -6.841684818267822, "global_step": 144559, "epoch": 3441} {"train_loss": -6.81675910949707, "global_step": 144560, "epoch": 3441} {"train_loss": -6.734009742736816, "global_step": 144561, "epoch": 3441} {"train_loss": -6.851820945739746, "global_step": 144562, "epoch": 3441} {"train_loss": -6.819371098563785, "global_step": 144563, "epoch": 3441, "val_loss": 67606.1171875} {"train_loss": -6.801053047180176, "global_step": 144564, "epoch": 3442} {"train_loss": -6.900016784667969, "global_step": 144565, "epoch": 3442} {"train_loss": -6.776601791381836, "global_step": 144566, "epoch": 3442} {"train_loss": -6.8017449378967285, "global_step": 144567, "epoch": 3442} {"train_loss": -6.811649322509766, "global_step": 144568, "epoch": 3442} {"train_loss": -6.898032188415527, "global_step": 144569, "epoch": 3442} {"train_loss": -6.80370569229126, "global_step": 144570, "epoch": 3442} {"train_loss": -6.829713821411133, "global_step": 144571, "epoch": 3442} {"train_loss": -6.822577953338623, "global_step": 144572, "epoch": 3442} {"train_loss": -6.8103766441345215, "global_step": 144573, "epoch": 3442} {"train_loss": -6.765894889831543, "global_step": 144574, "epoch": 3442} {"train_loss": -6.686381816864014, "global_step": 144575, "epoch": 3442} {"train_loss": -6.712123870849609, "global_step": 144576, "epoch": 3442} {"train_loss": -6.738712310791016, "global_step": 144577, "epoch": 3442} {"train_loss": -6.824174404144287, "global_step": 144578, "epoch": 3442} {"train_loss": -6.77703857421875, "global_step": 144579, "epoch": 3442} {"train_loss": -6.9049882888793945, "global_step": 144580, "epoch": 3442} {"train_loss": -6.841775417327881, "global_step": 144581, "epoch": 3442} {"train_loss": -6.798452854156494, "global_step": 144582, "epoch": 3442} {"train_loss": -6.804025173187256, "global_step": 144583, "epoch": 3442} {"train_loss": -6.696452617645264, "global_step": 144584, "epoch": 3442} {"train_loss": -6.898990154266357, "global_step": 144585, "epoch": 3442} {"train_loss": -6.826531410217285, "global_step": 144586, "epoch": 3442} {"train_loss": -6.79293155670166, "global_step": 144587, "epoch": 3442} {"train_loss": -6.859475135803223, "global_step": 144588, "epoch": 3442} {"train_loss": -6.829071521759033, "global_step": 144589, "epoch": 3442} {"train_loss": -6.757206916809082, "global_step": 144590, "epoch": 3442} {"train_loss": -6.9383392333984375, "global_step": 144591, "epoch": 3442} {"train_loss": -6.740294933319092, "global_step": 144592, "epoch": 3442} {"train_loss": -6.792703628540039, "global_step": 144593, "epoch": 3442} {"train_loss": -6.824030876159668, "global_step": 144594, "epoch": 3442} {"train_loss": -6.817399978637695, "global_step": 144595, "epoch": 3442} {"train_loss": -6.832844257354736, "global_step": 144596, "epoch": 3442} {"train_loss": -6.965728759765625, "global_step": 144597, "epoch": 3442} {"train_loss": -6.880402565002441, "global_step": 144598, "epoch": 3442} {"train_loss": -6.82601261138916, "global_step": 144599, "epoch": 3442} {"train_loss": -6.771288871765137, "global_step": 144600, "epoch": 3442} {"train_loss": -6.973221778869629, "global_step": 144601, "epoch": 3442} {"train_loss": -6.815073013305664, "global_step": 144602, "epoch": 3442} {"train_loss": -6.949704170227051, "global_step": 144603, "epoch": 3442} {"train_loss": -6.813441276550293, "global_step": 144604, "epoch": 3442} {"train_loss": -6.824555408386957, "global_step": 144605, "epoch": 3442, "val_loss": 67548.1015625} {"train_loss": -6.789540767669678, "global_step": 144606, "epoch": 3443} {"train_loss": -6.956677436828613, "global_step": 144607, "epoch": 3443} {"train_loss": -6.907398223876953, "global_step": 144608, "epoch": 3443} {"train_loss": -6.841856956481934, "global_step": 144609, "epoch": 3443} {"train_loss": -6.801334381103516, "global_step": 144610, "epoch": 3443} {"train_loss": -6.828277587890625, "global_step": 144611, "epoch": 3443} {"train_loss": -6.8995208740234375, "global_step": 144612, "epoch": 3443} {"train_loss": -6.921270370483398, "global_step": 144613, "epoch": 3443} {"train_loss": -6.812814712524414, "global_step": 144614, "epoch": 3443} {"train_loss": -6.8302836418151855, "global_step": 144615, "epoch": 3443} {"train_loss": -6.869781494140625, "global_step": 144616, "epoch": 3443} {"train_loss": -6.837586402893066, "global_step": 144617, "epoch": 3443} {"train_loss": -6.940141677856445, "global_step": 144618, "epoch": 3443} {"train_loss": -6.956812858581543, "global_step": 144619, "epoch": 3443} {"train_loss": -6.855842113494873, "global_step": 144620, "epoch": 3443} {"train_loss": -6.737722396850586, "global_step": 144621, "epoch": 3443} {"train_loss": -6.913873195648193, "global_step": 144622, "epoch": 3443} {"train_loss": -6.871421813964844, "global_step": 144623, "epoch": 3443} {"train_loss": -6.850183486938477, "global_step": 144624, "epoch": 3443} {"train_loss": -6.88833475112915, "global_step": 144625, "epoch": 3443} {"train_loss": -6.876614570617676, "global_step": 144626, "epoch": 3443} {"train_loss": -6.6662092208862305, "global_step": 144627, "epoch": 3443} {"train_loss": -6.912343978881836, "global_step": 144628, "epoch": 3443} {"train_loss": -6.733230113983154, "global_step": 144629, "epoch": 3443} {"train_loss": -6.709527015686035, "global_step": 144630, "epoch": 3443} {"train_loss": -6.806014060974121, "global_step": 144631, "epoch": 3443} {"train_loss": -6.6252264976501465, "global_step": 144632, "epoch": 3443} {"train_loss": -6.753666877746582, "global_step": 144633, "epoch": 3443} {"train_loss": -6.94134521484375, "global_step": 144634, "epoch": 3443} {"train_loss": -6.780818462371826, "global_step": 144635, "epoch": 3443} {"train_loss": -6.727069854736328, "global_step": 144636, "epoch": 3443} {"train_loss": -6.764404296875, "global_step": 144637, "epoch": 3443} {"train_loss": -6.732458114624023, "global_step": 144638, "epoch": 3443} {"train_loss": -6.785035133361816, "global_step": 144639, "epoch": 3443} {"train_loss": -6.826780319213867, "global_step": 144640, "epoch": 3443} {"train_loss": -6.772457122802734, "global_step": 144641, "epoch": 3443} {"train_loss": -6.8807220458984375, "global_step": 144642, "epoch": 3443} {"train_loss": -6.7988386154174805, "global_step": 144643, "epoch": 3443} {"train_loss": -6.784046173095703, "global_step": 144644, "epoch": 3443} {"train_loss": -6.793664455413818, "global_step": 144645, "epoch": 3443} {"train_loss": -6.823660850524902, "global_step": 144646, "epoch": 3443} {"train_loss": -6.8255653267815, "global_step": 144647, "epoch": 3443, "val_loss": 67798.59375} {"train_loss": -6.721240997314453, "global_step": 144648, "epoch": 3444} {"train_loss": -6.708766937255859, "global_step": 144649, "epoch": 3444} {"train_loss": -6.716732501983643, "global_step": 144650, "epoch": 3444} {"train_loss": -6.7771711349487305, "global_step": 144651, "epoch": 3444} {"train_loss": -6.7756195068359375, "global_step": 144652, "epoch": 3444} {"train_loss": -6.822085857391357, "global_step": 144653, "epoch": 3444} {"train_loss": -6.67749547958374, "global_step": 144654, "epoch": 3444} {"train_loss": -6.707977294921875, "global_step": 144655, "epoch": 3444} {"train_loss": -6.828827381134033, "global_step": 144656, "epoch": 3444} {"train_loss": -6.735933780670166, "global_step": 144657, "epoch": 3444} {"train_loss": -6.793422698974609, "global_step": 144658, "epoch": 3444} {"train_loss": -6.765207290649414, "global_step": 144659, "epoch": 3444} {"train_loss": -6.6933207511901855, "global_step": 144660, "epoch": 3444} {"train_loss": -6.71299934387207, "global_step": 144661, "epoch": 3444} {"train_loss": -6.821368217468262, "global_step": 144662, "epoch": 3444} {"train_loss": -6.740911960601807, "global_step": 144663, "epoch": 3444} {"train_loss": -6.857938766479492, "global_step": 144664, "epoch": 3444} {"train_loss": -6.8426713943481445, "global_step": 144665, "epoch": 3444} {"train_loss": -6.668626308441162, "global_step": 144666, "epoch": 3444} {"train_loss": -6.827722072601318, "global_step": 144667, "epoch": 3444} {"train_loss": -6.801048278808594, "global_step": 144668, "epoch": 3444} {"train_loss": -6.793667793273926, "global_step": 144669, "epoch": 3444} {"train_loss": -6.818452835083008, "global_step": 144670, "epoch": 3444} {"train_loss": -6.79972505569458, "global_step": 144671, "epoch": 3444} {"train_loss": -6.742423057556152, "global_step": 144672, "epoch": 3444} {"train_loss": -6.778301239013672, "global_step": 144673, "epoch": 3444} {"train_loss": -6.947864532470703, "global_step": 144674, "epoch": 3444} {"train_loss": -6.705358505249023, "global_step": 144675, "epoch": 3444} {"train_loss": -6.8597412109375, "global_step": 144676, "epoch": 3444} {"train_loss": -6.751822471618652, "global_step": 144677, "epoch": 3444} {"train_loss": -6.625086784362793, "global_step": 144678, "epoch": 3444} {"train_loss": -6.849725723266602, "global_step": 144679, "epoch": 3444} {"train_loss": -6.648122310638428, "global_step": 144680, "epoch": 3444} {"train_loss": -6.781257629394531, "global_step": 144681, "epoch": 3444} {"train_loss": -6.777405738830566, "global_step": 144682, "epoch": 3444} {"train_loss": -6.837301731109619, "global_step": 144683, "epoch": 3444} {"train_loss": -6.889692306518555, "global_step": 144684, "epoch": 3444} {"train_loss": -6.78408670425415, "global_step": 144685, "epoch": 3444} {"train_loss": -6.7624006271362305, "global_step": 144686, "epoch": 3444} {"train_loss": -6.872592926025391, "global_step": 144687, "epoch": 3444} {"train_loss": -6.7461748123168945, "global_step": 144688, "epoch": 3444} {"train_loss": -6.7755098683493475, "global_step": 144689, "epoch": 3444, "val_loss": 67586.2109375} {"train_loss": -6.72838020324707, "global_step": 144690, "epoch": 3445} {"train_loss": -6.83847188949585, "global_step": 144691, "epoch": 3445} {"train_loss": -6.798694610595703, "global_step": 144692, "epoch": 3445} {"train_loss": -6.859189987182617, "global_step": 144693, "epoch": 3445} {"train_loss": -6.745271682739258, "global_step": 144694, "epoch": 3445} {"train_loss": -6.82668399810791, "global_step": 144695, "epoch": 3445} {"train_loss": -6.862798690795898, "global_step": 144696, "epoch": 3445} {"train_loss": -6.886839866638184, "global_step": 144697, "epoch": 3445} {"train_loss": -6.761641502380371, "global_step": 144698, "epoch": 3445} {"train_loss": -6.842869758605957, "global_step": 144699, "epoch": 3445} {"train_loss": -6.899717330932617, "global_step": 144700, "epoch": 3445} {"train_loss": -6.947556018829346, "global_step": 144701, "epoch": 3445} {"train_loss": -6.835413455963135, "global_step": 144702, "epoch": 3445} {"train_loss": -6.833778381347656, "global_step": 144703, "epoch": 3445} {"train_loss": -6.880336761474609, "global_step": 144704, "epoch": 3445} {"train_loss": -6.865666389465332, "global_step": 144705, "epoch": 3445} {"train_loss": -6.850823402404785, "global_step": 144706, "epoch": 3445} {"train_loss": -6.917211532592773, "global_step": 144707, "epoch": 3445} {"train_loss": -6.7879719734191895, "global_step": 144708, "epoch": 3445} {"train_loss": -6.879281044006348, "global_step": 144709, "epoch": 3445} {"train_loss": -6.817559242248535, "global_step": 144710, "epoch": 3445} {"train_loss": -6.771114826202393, "global_step": 144711, "epoch": 3445} {"train_loss": -6.946456432342529, "global_step": 144712, "epoch": 3445} {"train_loss": -6.790474891662598, "global_step": 144713, "epoch": 3445} {"train_loss": -6.763382911682129, "global_step": 144714, "epoch": 3445} {"train_loss": -6.870981216430664, "global_step": 144715, "epoch": 3445} {"train_loss": -6.823668479919434, "global_step": 144716, "epoch": 3445} {"train_loss": -6.691095352172852, "global_step": 144717, "epoch": 3445} {"train_loss": -6.745328903198242, "global_step": 144718, "epoch": 3445} {"train_loss": -6.716111183166504, "global_step": 144719, "epoch": 3445} {"train_loss": -6.921389579772949, "global_step": 144720, "epoch": 3445} {"train_loss": -6.801911354064941, "global_step": 144721, "epoch": 3445} {"train_loss": -6.763744831085205, "global_step": 144722, "epoch": 3445} {"train_loss": -6.868753433227539, "global_step": 144723, "epoch": 3445} {"train_loss": -6.675360679626465, "global_step": 144724, "epoch": 3445} {"train_loss": -6.795494556427002, "global_step": 144725, "epoch": 3445} {"train_loss": -6.795269966125488, "global_step": 144726, "epoch": 3445} {"train_loss": -6.84326696395874, "global_step": 144727, "epoch": 3445} {"train_loss": -6.823858261108398, "global_step": 144728, "epoch": 3445} {"train_loss": -6.772029876708984, "global_step": 144729, "epoch": 3445} {"train_loss": -6.791543006896973, "global_step": 144730, "epoch": 3445} {"train_loss": -6.818102053233555, "global_step": 144731, "epoch": 3445, "val_loss": 67757.8359375} {"train_loss": -6.813104629516602, "global_step": 144732, "epoch": 3446} {"train_loss": -6.6488471031188965, "global_step": 144733, "epoch": 3446} {"train_loss": -6.720907211303711, "global_step": 144734, "epoch": 3446} {"train_loss": -6.786540985107422, "global_step": 144735, "epoch": 3446} {"train_loss": -6.743506908416748, "global_step": 144736, "epoch": 3446} {"train_loss": -6.824661731719971, "global_step": 144737, "epoch": 3446} {"train_loss": -6.858595848083496, "global_step": 144738, "epoch": 3446} {"train_loss": -6.82039737701416, "global_step": 144739, "epoch": 3446} {"train_loss": -6.7961578369140625, "global_step": 144740, "epoch": 3446} {"train_loss": -6.887875080108643, "global_step": 144741, "epoch": 3446} {"train_loss": -6.8000946044921875, "global_step": 144742, "epoch": 3446} {"train_loss": -6.7895660400390625, "global_step": 144743, "epoch": 3446} {"train_loss": -6.923604965209961, "global_step": 144744, "epoch": 3446} {"train_loss": -6.678112030029297, "global_step": 144745, "epoch": 3446} {"train_loss": -6.767708778381348, "global_step": 144746, "epoch": 3446} {"train_loss": -6.692572593688965, "global_step": 144747, "epoch": 3446} {"train_loss": -6.775525093078613, "global_step": 144748, "epoch": 3446} {"train_loss": -6.725757598876953, "global_step": 144749, "epoch": 3446} {"train_loss": -6.93851900100708, "global_step": 144750, "epoch": 3446} {"train_loss": -6.831585884094238, "global_step": 144751, "epoch": 3446} {"train_loss": -6.698602199554443, "global_step": 144752, "epoch": 3446} {"train_loss": -6.897648334503174, "global_step": 144753, "epoch": 3446} {"train_loss": -6.992217540740967, "global_step": 144754, "epoch": 3446} {"train_loss": -6.8186421394348145, "global_step": 144755, "epoch": 3446} {"train_loss": -6.808253765106201, "global_step": 144756, "epoch": 3446} {"train_loss": -6.890389919281006, "global_step": 144757, "epoch": 3446} {"train_loss": -6.754121780395508, "global_step": 144758, "epoch": 3446} {"train_loss": -6.766828536987305, "global_step": 144759, "epoch": 3446} {"train_loss": -6.925074100494385, "global_step": 144760, "epoch": 3446} {"train_loss": -6.786079406738281, "global_step": 144761, "epoch": 3446} {"train_loss": -6.793849945068359, "global_step": 144762, "epoch": 3446} {"train_loss": -6.805881500244141, "global_step": 144763, "epoch": 3446} {"train_loss": -6.884822845458984, "global_step": 144764, "epoch": 3446} {"train_loss": -6.838100433349609, "global_step": 144765, "epoch": 3446} {"train_loss": -6.808282852172852, "global_step": 144766, "epoch": 3446} {"train_loss": -6.902756214141846, "global_step": 144767, "epoch": 3446} {"train_loss": -6.842474460601807, "global_step": 144768, "epoch": 3446} {"train_loss": -6.730650901794434, "global_step": 144769, "epoch": 3446} {"train_loss": -6.756440162658691, "global_step": 144770, "epoch": 3446} {"train_loss": -6.872480392456055, "global_step": 144771, "epoch": 3446} {"train_loss": -6.751187801361084, "global_step": 144772, "epoch": 3446} {"train_loss": -6.804565225328718, "global_step": 144773, "epoch": 3446, "val_loss": 67730.0078125} {"train_loss": -6.701986312866211, "global_step": 144774, "epoch": 3447} {"train_loss": -6.78127908706665, "global_step": 144775, "epoch": 3447} {"train_loss": -6.790164947509766, "global_step": 144776, "epoch": 3447} {"train_loss": -6.7879157066345215, "global_step": 144777, "epoch": 3447} {"train_loss": -6.744381904602051, "global_step": 144778, "epoch": 3447} {"train_loss": -6.753119468688965, "global_step": 144779, "epoch": 3447} {"train_loss": -6.729860305786133, "global_step": 144780, "epoch": 3447} {"train_loss": -6.746504783630371, "global_step": 144781, "epoch": 3447} {"train_loss": -6.836538314819336, "global_step": 144782, "epoch": 3447} {"train_loss": -6.626755714416504, "global_step": 144783, "epoch": 3447} {"train_loss": -6.721808433532715, "global_step": 144784, "epoch": 3447} {"train_loss": -6.848491191864014, "global_step": 144785, "epoch": 3447} {"train_loss": -6.733645439147949, "global_step": 144786, "epoch": 3447} {"train_loss": -6.766180992126465, "global_step": 144787, "epoch": 3447} {"train_loss": -6.756259441375732, "global_step": 144788, "epoch": 3447} {"train_loss": -6.7371907234191895, "global_step": 144789, "epoch": 3447} {"train_loss": -6.74985408782959, "global_step": 144790, "epoch": 3447} {"train_loss": -6.7890167236328125, "global_step": 144791, "epoch": 3447} {"train_loss": -6.758082389831543, "global_step": 144792, "epoch": 3447} {"train_loss": -6.806257247924805, "global_step": 144793, "epoch": 3447} {"train_loss": -6.8353590965271, "global_step": 144794, "epoch": 3447} {"train_loss": -6.8444905281066895, "global_step": 144795, "epoch": 3447} {"train_loss": -6.712335586547852, "global_step": 144796, "epoch": 3447} {"train_loss": -6.675870895385742, "global_step": 144797, "epoch": 3447} {"train_loss": -6.677674293518066, "global_step": 144798, "epoch": 3447} {"train_loss": -6.723726272583008, "global_step": 144799, "epoch": 3447} {"train_loss": -6.835036277770996, "global_step": 144800, "epoch": 3447} {"train_loss": -6.639691352844238, "global_step": 144801, "epoch": 3447} {"train_loss": -6.710110664367676, "global_step": 144802, "epoch": 3447} {"train_loss": -6.74512243270874, "global_step": 144803, "epoch": 3447} {"train_loss": -6.720489978790283, "global_step": 144804, "epoch": 3447} {"train_loss": -6.762055397033691, "global_step": 144805, "epoch": 3447} {"train_loss": -6.699315547943115, "global_step": 144806, "epoch": 3447} {"train_loss": -6.543124198913574, "global_step": 144807, "epoch": 3447} {"train_loss": -6.765826225280762, "global_step": 144808, "epoch": 3447} {"train_loss": -6.608020782470703, "global_step": 144809, "epoch": 3447} {"train_loss": -6.516480445861816, "global_step": 144810, "epoch": 3447} {"train_loss": -6.770915985107422, "global_step": 144811, "epoch": 3447} {"train_loss": -6.619967460632324, "global_step": 144812, "epoch": 3447} {"train_loss": -6.71364164352417, "global_step": 144813, "epoch": 3447} {"train_loss": -6.648590087890625, "global_step": 144814, "epoch": 3447} {"train_loss": -6.728932857513428, "global_step": 144815, "epoch": 3447, "val_loss": 67544.1171875} {"train_loss": -6.716419696807861, "global_step": 144816, "epoch": 3448} {"train_loss": -6.565678119659424, "global_step": 144817, "epoch": 3448} {"train_loss": -6.783197402954102, "global_step": 144818, "epoch": 3448} {"train_loss": -6.628998279571533, "global_step": 144819, "epoch": 3448} {"train_loss": -6.705243110656738, "global_step": 144820, "epoch": 3448} {"train_loss": -6.525002479553223, "global_step": 144821, "epoch": 3448} {"train_loss": -6.759110450744629, "global_step": 144822, "epoch": 3448} {"train_loss": -6.664043426513672, "global_step": 144823, "epoch": 3448} {"train_loss": -6.7013325691223145, "global_step": 144824, "epoch": 3448} {"train_loss": -6.486428737640381, "global_step": 144825, "epoch": 3448} {"train_loss": -6.60721492767334, "global_step": 144826, "epoch": 3448} {"train_loss": -6.822941780090332, "global_step": 144827, "epoch": 3448} {"train_loss": -6.706424713134766, "global_step": 144828, "epoch": 3448} {"train_loss": -6.740057945251465, "global_step": 144829, "epoch": 3448} {"train_loss": -6.7512969970703125, "global_step": 144830, "epoch": 3448} {"train_loss": -6.838913440704346, "global_step": 144831, "epoch": 3448} {"train_loss": -6.790106773376465, "global_step": 144832, "epoch": 3448} {"train_loss": -6.771488666534424, "global_step": 144833, "epoch": 3448} {"train_loss": -6.6962890625, "global_step": 144834, "epoch": 3448} {"train_loss": -6.905073642730713, "global_step": 144835, "epoch": 3448} {"train_loss": -6.821772575378418, "global_step": 144836, "epoch": 3448} {"train_loss": -6.812831878662109, "global_step": 144837, "epoch": 3448} {"train_loss": -6.646324157714844, "global_step": 144838, "epoch": 3448} {"train_loss": -6.767450332641602, "global_step": 144839, "epoch": 3448} {"train_loss": -6.777332782745361, "global_step": 144840, "epoch": 3448} {"train_loss": -6.830757141113281, "global_step": 144841, "epoch": 3448} {"train_loss": -6.7714457511901855, "global_step": 144842, "epoch": 3448} {"train_loss": -6.768523216247559, "global_step": 144843, "epoch": 3448} {"train_loss": -6.951535224914551, "global_step": 144844, "epoch": 3448} {"train_loss": -6.83340311050415, "global_step": 144845, "epoch": 3448} {"train_loss": -6.765137672424316, "global_step": 144846, "epoch": 3448} {"train_loss": -6.772479057312012, "global_step": 144847, "epoch": 3448} {"train_loss": -6.883130073547363, "global_step": 144848, "epoch": 3448} {"train_loss": -6.740726470947266, "global_step": 144849, "epoch": 3448} {"train_loss": -6.897380828857422, "global_step": 144850, "epoch": 3448} {"train_loss": -6.7776079177856445, "global_step": 144851, "epoch": 3448} {"train_loss": -6.8509521484375, "global_step": 144852, "epoch": 3448} {"train_loss": -6.850359916687012, "global_step": 144853, "epoch": 3448} {"train_loss": -6.973802089691162, "global_step": 144854, "epoch": 3448} {"train_loss": -6.813570976257324, "global_step": 144855, "epoch": 3448} {"train_loss": -6.8119120597839355, "global_step": 144856, "epoch": 3448} {"train_loss": -6.763443674360003, "global_step": 144857, "epoch": 3448, "val_loss": 67452.0078125} {"train_loss": -6.714106559753418, "global_step": 144858, "epoch": 3449} {"train_loss": -6.86530876159668, "global_step": 144859, "epoch": 3449} {"train_loss": -6.838838577270508, "global_step": 144860, "epoch": 3449} {"train_loss": -6.813176155090332, "global_step": 144861, "epoch": 3449} {"train_loss": -6.89171838760376, "global_step": 144862, "epoch": 3449} {"train_loss": -6.917666912078857, "global_step": 144863, "epoch": 3449} {"train_loss": -6.840811729431152, "global_step": 144864, "epoch": 3449} {"train_loss": -6.864127159118652, "global_step": 144865, "epoch": 3449} {"train_loss": -6.723515510559082, "global_step": 144866, "epoch": 3449} {"train_loss": -6.73677396774292, "global_step": 144867, "epoch": 3449} {"train_loss": -6.830517768859863, "global_step": 144868, "epoch": 3449} {"train_loss": -6.904732704162598, "global_step": 144869, "epoch": 3449} {"train_loss": -6.727460861206055, "global_step": 144870, "epoch": 3449} {"train_loss": -6.773885726928711, "global_step": 144871, "epoch": 3449} {"train_loss": -6.7310590744018555, "global_step": 144872, "epoch": 3449} {"train_loss": -6.777159214019775, "global_step": 144873, "epoch": 3449} {"train_loss": -6.766376495361328, "global_step": 144874, "epoch": 3449} {"train_loss": -6.720202922821045, "global_step": 144875, "epoch": 3449} {"train_loss": -6.833173751831055, "global_step": 144876, "epoch": 3449} {"train_loss": -6.810783386230469, "global_step": 144877, "epoch": 3449} {"train_loss": -6.784309387207031, "global_step": 144878, "epoch": 3449} {"train_loss": -6.869657516479492, "global_step": 144879, "epoch": 3449} {"train_loss": -6.846818447113037, "global_step": 144880, "epoch": 3449} {"train_loss": -6.762330532073975, "global_step": 144881, "epoch": 3449} {"train_loss": -6.802148818969727, "global_step": 144882, "epoch": 3449} {"train_loss": -6.825102806091309, "global_step": 144883, "epoch": 3449} {"train_loss": -6.938577651977539, "global_step": 144884, "epoch": 3449} {"train_loss": -6.682652473449707, "global_step": 144885, "epoch": 3449} {"train_loss": -6.933618545532227, "global_step": 144886, "epoch": 3449} {"train_loss": -6.795134544372559, "global_step": 144887, "epoch": 3449} {"train_loss": -6.787934303283691, "global_step": 144888, "epoch": 3449} {"train_loss": -6.786478519439697, "global_step": 144889, "epoch": 3449} {"train_loss": -6.762410640716553, "global_step": 144890, "epoch": 3449} {"train_loss": -6.842320442199707, "global_step": 144891, "epoch": 3449} {"train_loss": -6.8932085037231445, "global_step": 144892, "epoch": 3449} {"train_loss": -6.841787338256836, "global_step": 144893, "epoch": 3449} {"train_loss": -6.855853080749512, "global_step": 144894, "epoch": 3449} {"train_loss": -6.871012210845947, "global_step": 144895, "epoch": 3449} {"train_loss": -6.859129905700684, "global_step": 144896, "epoch": 3449} {"train_loss": -6.853802680969238, "global_step": 144897, "epoch": 3449} {"train_loss": -6.791486740112305, "global_step": 144898, "epoch": 3449} {"train_loss": -6.816187381744385, "global_step": 144899, "epoch": 3449, "val_loss": 67756.6171875} {"train_loss": -6.881017208099365, "global_step": 144900, "epoch": 3450} {"train_loss": -6.850751876831055, "global_step": 144901, "epoch": 3450} {"train_loss": -6.860052585601807, "global_step": 144902, "epoch": 3450} {"train_loss": -6.745652198791504, "global_step": 144903, "epoch": 3450} {"train_loss": -6.766007423400879, "global_step": 144904, "epoch": 3450} {"train_loss": -6.824593544006348, "global_step": 144905, "epoch": 3450} {"train_loss": -6.704939365386963, "global_step": 144906, "epoch": 3450} {"train_loss": -6.749024391174316, "global_step": 144907, "epoch": 3450} {"train_loss": -6.919774055480957, "global_step": 144908, "epoch": 3450} {"train_loss": -6.707725524902344, "global_step": 144909, "epoch": 3450} {"train_loss": -6.781140327453613, "global_step": 144910, "epoch": 3450} {"train_loss": -6.731315612792969, "global_step": 144911, "epoch": 3450} {"train_loss": -6.714993000030518, "global_step": 144912, "epoch": 3450} {"train_loss": -6.840438365936279, "global_step": 144913, "epoch": 3450} {"train_loss": -6.818384647369385, "global_step": 144914, "epoch": 3450} {"train_loss": -6.891690254211426, "global_step": 144915, "epoch": 3450} {"train_loss": -6.8438801765441895, "global_step": 144916, "epoch": 3450} {"train_loss": -6.853067398071289, "global_step": 144917, "epoch": 3450} {"train_loss": -6.868487358093262, "global_step": 144918, "epoch": 3450} {"train_loss": -6.866200923919678, "global_step": 144919, "epoch": 3450} {"train_loss": -6.842747688293457, "global_step": 144920, "epoch": 3450} {"train_loss": -6.739757061004639, "global_step": 144921, "epoch": 3450} {"train_loss": -6.842422008514404, "global_step": 144922, "epoch": 3450} {"train_loss": -6.874068260192871, "global_step": 144923, "epoch": 3450} {"train_loss": -6.802552223205566, "global_step": 144924, "epoch": 3450} {"train_loss": -6.846177577972412, "global_step": 144925, "epoch": 3450} {"train_loss": -6.915591239929199, "global_step": 144926, "epoch": 3450} {"train_loss": -6.884385108947754, "global_step": 144927, "epoch": 3450} {"train_loss": -6.804653644561768, "global_step": 144928, "epoch": 3450} {"train_loss": -6.797815799713135, "global_step": 144929, "epoch": 3450} {"train_loss": -6.8361077308654785, "global_step": 144930, "epoch": 3450} {"train_loss": -6.757513046264648, "global_step": 144931, "epoch": 3450} {"train_loss": -6.8191423416137695, "global_step": 144932, "epoch": 3450} {"train_loss": -6.805974006652832, "global_step": 144933, "epoch": 3450} {"train_loss": -6.857943058013916, "global_step": 144934, "epoch": 3450} {"train_loss": -6.8148064613342285, "global_step": 144935, "epoch": 3450} {"train_loss": -6.907264232635498, "global_step": 144936, "epoch": 3450} {"train_loss": -6.843823432922363, "global_step": 144937, "epoch": 3450} {"train_loss": -6.786736488342285, "global_step": 144938, "epoch": 3450} {"train_loss": -6.790358543395996, "global_step": 144939, "epoch": 3450} {"train_loss": -6.82214879989624, "global_step": 144940, "epoch": 3450} {"train_loss": -6.820939540863037, "global_step": 144941, "epoch": 3450, "train/sim_max_reward_0": 0.99446898187612, "train/sim_max_reward_1": 0.9234812110198359, "train/sim_max_reward_2": 0.5679218719995099, "train/sim_max_reward_3": 0.12982979007650902, "train/sim_max_reward_4": 0.9593297574044275, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.31338336932201943, "test/sim_max_reward_4300002": 0.8680778814508102, "test/sim_max_reward_4300003": 0.9044162030727152, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9951477633989784, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.7292664526189102, "test/sim_max_reward_4300008": 0.928931704957285, "test/sim_max_reward_4300009": 0.9750818763067416, "test/sim_max_reward_4300010": 0.9700336249579753, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.9655946274205782, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9858966812143483, "test/sim_max_reward_4300016": 0.08532895057640497, "test/sim_max_reward_4300017": 0.9486510457715812, "test/sim_max_reward_4300018": 0.4225944748183627, "test/sim_max_reward_4300019": 0.18602317801476068, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8970983374581238, "test/sim_max_reward_4300022": 0.9766283502631977, "test/sim_max_reward_4300023": 0.3333790185827825, "test/sim_max_reward_4300024": 0.9565248997301213, "test/sim_max_reward_4300025": 0.9850406953609979, "test/sim_max_reward_4300026": 0.21293795295678733, "test/sim_max_reward_4300027": 0.9229513552173847, "test/sim_max_reward_4300028": 0.9512864156692163, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.24615419473110844, "test/sim_max_reward_4300031": 0.2121820533004124, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.661856892393805, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.36609325688295863, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.5527122599440878, "test/sim_max_reward_4300038": 0.8097488585187633, "test/sim_max_reward_4300039": 0.9067779309200106, "test/sim_max_reward_4300040": 0.8476673207970555, "test/sim_max_reward_4300041": 0.9404686348250103, "test/sim_max_reward_4300042": 0.726580018685874, "test/sim_max_reward_4300043": 0.1477090529298247, "test/sim_max_reward_4300044": 0.889471043466562, "test/sim_max_reward_4300045": 0.2020816945278569, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.1251617045421806, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.26718524335066096, "train/mean_score": 0.6280027286230984, "test/mean_score": 0.5926230647865803, "val_loss": 67508.0625} {"train_loss": -6.814578056335449, "global_step": 144942, "epoch": 3451} {"train_loss": -6.925437927246094, "global_step": 144943, "epoch": 3451} {"train_loss": -6.953171253204346, "global_step": 144944, "epoch": 3451} {"train_loss": -6.877508163452148, "global_step": 144945, "epoch": 3451} {"train_loss": -6.848453044891357, "global_step": 144946, "epoch": 3451} {"train_loss": -6.867916584014893, "global_step": 144947, "epoch": 3451} {"train_loss": -6.855806350708008, "global_step": 144948, "epoch": 3451} {"train_loss": -6.925762176513672, "global_step": 144949, "epoch": 3451} {"train_loss": -6.965312957763672, "global_step": 144950, "epoch": 3451} {"train_loss": -6.846681594848633, "global_step": 144951, "epoch": 3451} {"train_loss": -6.781196594238281, "global_step": 144952, "epoch": 3451} {"train_loss": -6.958713531494141, "global_step": 144953, "epoch": 3451} {"train_loss": -6.774155616760254, "global_step": 144954, "epoch": 3451} {"train_loss": -6.664552688598633, "global_step": 144955, "epoch": 3451} {"train_loss": -6.898709297180176, "global_step": 144956, "epoch": 3451} {"train_loss": -6.793691635131836, "global_step": 144957, "epoch": 3451} {"train_loss": -6.7236008644104, "global_step": 144958, "epoch": 3451} {"train_loss": -6.892299652099609, "global_step": 144959, "epoch": 3451} {"train_loss": -6.708133697509766, "global_step": 144960, "epoch": 3451} {"train_loss": -6.831727027893066, "global_step": 144961, "epoch": 3451} {"train_loss": -6.750577926635742, "global_step": 144962, "epoch": 3451} {"train_loss": -6.765542030334473, "global_step": 144963, "epoch": 3451} {"train_loss": -6.970641136169434, "global_step": 144964, "epoch": 3451} {"train_loss": -6.754673957824707, "global_step": 144965, "epoch": 3451} {"train_loss": -6.668035507202148, "global_step": 144966, "epoch": 3451} {"train_loss": -6.7173357009887695, "global_step": 144967, "epoch": 3451} {"train_loss": -6.7605881690979, "global_step": 144968, "epoch": 3451} {"train_loss": -6.808943748474121, "global_step": 144969, "epoch": 3451} {"train_loss": -6.704802989959717, "global_step": 144970, "epoch": 3451} {"train_loss": -6.824796199798584, "global_step": 144971, "epoch": 3451} {"train_loss": -6.737130641937256, "global_step": 144972, "epoch": 3451} {"train_loss": -6.716884613037109, "global_step": 144973, "epoch": 3451} {"train_loss": -6.778409481048584, "global_step": 144974, "epoch": 3451} {"train_loss": -6.825902938842773, "global_step": 144975, "epoch": 3451} {"train_loss": -6.671268939971924, "global_step": 144976, "epoch": 3451} {"train_loss": -6.7758564949035645, "global_step": 144977, "epoch": 3451} {"train_loss": -6.741447448730469, "global_step": 144978, "epoch": 3451} {"train_loss": -6.7677001953125, "global_step": 144979, "epoch": 3451} {"train_loss": -6.840660572052002, "global_step": 144980, "epoch": 3451} {"train_loss": -6.833785057067871, "global_step": 144981, "epoch": 3451} {"train_loss": -6.725493431091309, "global_step": 144982, "epoch": 3451} {"train_loss": -6.805371704555693, "global_step": 144983, "epoch": 3451, "val_loss": 67585.171875} {"train_loss": -6.808494567871094, "global_step": 144984, "epoch": 3452} {"train_loss": -6.733315467834473, "global_step": 144985, "epoch": 3452} {"train_loss": -6.6790876388549805, "global_step": 144986, "epoch": 3452} {"train_loss": -6.847614765167236, "global_step": 144987, "epoch": 3452} {"train_loss": -6.808919906616211, "global_step": 144988, "epoch": 3452} {"train_loss": -6.734443664550781, "global_step": 144989, "epoch": 3452} {"train_loss": -6.766920566558838, "global_step": 144990, "epoch": 3452} {"train_loss": -6.831687927246094, "global_step": 144991, "epoch": 3452} {"train_loss": -6.766200542449951, "global_step": 144992, "epoch": 3452} {"train_loss": -6.745952129364014, "global_step": 144993, "epoch": 3452} {"train_loss": -6.78279447555542, "global_step": 144994, "epoch": 3452} {"train_loss": -6.73079776763916, "global_step": 144995, "epoch": 3452} {"train_loss": -6.786730766296387, "global_step": 144996, "epoch": 3452} {"train_loss": -6.706031322479248, "global_step": 144997, "epoch": 3452} {"train_loss": -6.620104789733887, "global_step": 144998, "epoch": 3452} {"train_loss": -6.816150665283203, "global_step": 144999, "epoch": 3452} {"train_loss": -6.753936767578125, "global_step": 145000, "epoch": 3452} {"train_loss": -6.708232402801514, "global_step": 145001, "epoch": 3452} {"train_loss": -6.669455051422119, "global_step": 145002, "epoch": 3452} {"train_loss": -6.811379432678223, "global_step": 145003, "epoch": 3452} {"train_loss": -6.878479957580566, "global_step": 145004, "epoch": 3452} {"train_loss": -6.743567943572998, "global_step": 145005, "epoch": 3452} {"train_loss": -6.768524169921875, "global_step": 145006, "epoch": 3452} {"train_loss": -6.7160773277282715, "global_step": 145007, "epoch": 3452} {"train_loss": -6.772275924682617, "global_step": 145008, "epoch": 3452} {"train_loss": -6.834845542907715, "global_step": 145009, "epoch": 3452} {"train_loss": -6.815651893615723, "global_step": 145010, "epoch": 3452} {"train_loss": -6.915111064910889, "global_step": 145011, "epoch": 3452} {"train_loss": -6.840817451477051, "global_step": 145012, "epoch": 3452} {"train_loss": -6.9046735763549805, "global_step": 145013, "epoch": 3452} {"train_loss": -6.7806596755981445, "global_step": 145014, "epoch": 3452} {"train_loss": -6.790075302124023, "global_step": 145015, "epoch": 3452} {"train_loss": -6.8232269287109375, "global_step": 145016, "epoch": 3452} {"train_loss": -6.8079400062561035, "global_step": 145017, "epoch": 3452} {"train_loss": -6.76635217666626, "global_step": 145018, "epoch": 3452} {"train_loss": -6.785739421844482, "global_step": 145019, "epoch": 3452} {"train_loss": -6.807407379150391, "global_step": 145020, "epoch": 3452} {"train_loss": -6.810028076171875, "global_step": 145021, "epoch": 3452} {"train_loss": -6.839719772338867, "global_step": 145022, "epoch": 3452} {"train_loss": -6.8482537269592285, "global_step": 145023, "epoch": 3452} {"train_loss": -6.876513481140137, "global_step": 145024, "epoch": 3452} {"train_loss": -6.785176231747582, "global_step": 145025, "epoch": 3452, "val_loss": 67631.7890625} {"train_loss": -6.822752952575684, "global_step": 145026, "epoch": 3453} {"train_loss": -6.863845348358154, "global_step": 145027, "epoch": 3453} {"train_loss": -6.747916221618652, "global_step": 145028, "epoch": 3453} {"train_loss": -6.82009220123291, "global_step": 145029, "epoch": 3453} {"train_loss": -6.931844711303711, "global_step": 145030, "epoch": 3453} {"train_loss": -6.882645606994629, "global_step": 145031, "epoch": 3453} {"train_loss": -6.881311416625977, "global_step": 145032, "epoch": 3453} {"train_loss": -6.755718231201172, "global_step": 145033, "epoch": 3453} {"train_loss": -6.908786773681641, "global_step": 145034, "epoch": 3453} {"train_loss": -6.838975429534912, "global_step": 145035, "epoch": 3453} {"train_loss": -6.833505153656006, "global_step": 145036, "epoch": 3453} {"train_loss": -6.870553970336914, "global_step": 145037, "epoch": 3453} {"train_loss": -6.899960517883301, "global_step": 145038, "epoch": 3453} {"train_loss": -6.812041282653809, "global_step": 145039, "epoch": 3453} {"train_loss": -6.828771591186523, "global_step": 145040, "epoch": 3453} {"train_loss": -6.885515213012695, "global_step": 145041, "epoch": 3453} {"train_loss": -6.820558547973633, "global_step": 145042, "epoch": 3453} {"train_loss": -6.805420398712158, "global_step": 145043, "epoch": 3453} {"train_loss": -6.915524482727051, "global_step": 145044, "epoch": 3453} {"train_loss": -6.821324825286865, "global_step": 145045, "epoch": 3453} {"train_loss": -6.859151840209961, "global_step": 145046, "epoch": 3453} {"train_loss": -6.83099365234375, "global_step": 145047, "epoch": 3453} {"train_loss": -6.836136817932129, "global_step": 145048, "epoch": 3453} {"train_loss": -6.85120964050293, "global_step": 145049, "epoch": 3453} {"train_loss": -6.767953872680664, "global_step": 145050, "epoch": 3453} {"train_loss": -6.8591156005859375, "global_step": 145051, "epoch": 3453} {"train_loss": -6.8272833824157715, "global_step": 145052, "epoch": 3453} {"train_loss": -6.814506530761719, "global_step": 145053, "epoch": 3453} {"train_loss": -6.686138153076172, "global_step": 145054, "epoch": 3453} {"train_loss": -6.782904624938965, "global_step": 145055, "epoch": 3453} {"train_loss": -6.698227882385254, "global_step": 145056, "epoch": 3453} {"train_loss": -6.840843200683594, "global_step": 145057, "epoch": 3453} {"train_loss": -6.679937839508057, "global_step": 145058, "epoch": 3453} {"train_loss": -6.740606307983398, "global_step": 145059, "epoch": 3453} {"train_loss": -6.811034202575684, "global_step": 145060, "epoch": 3453} {"train_loss": -6.873848915100098, "global_step": 145061, "epoch": 3453} {"train_loss": -6.7652435302734375, "global_step": 145062, "epoch": 3453} {"train_loss": -6.734487056732178, "global_step": 145063, "epoch": 3453} {"train_loss": -6.832624435424805, "global_step": 145064, "epoch": 3453} {"train_loss": -6.737844467163086, "global_step": 145065, "epoch": 3453} {"train_loss": -6.800597190856934, "global_step": 145066, "epoch": 3453} {"train_loss": -6.818511701765514, "global_step": 145067, "epoch": 3453, "val_loss": 67676.0859375} {"train_loss": -6.790643215179443, "global_step": 145068, "epoch": 3454} {"train_loss": -6.837980270385742, "global_step": 145069, "epoch": 3454} {"train_loss": -6.78257417678833, "global_step": 145070, "epoch": 3454} {"train_loss": -6.782149791717529, "global_step": 145071, "epoch": 3454} {"train_loss": -6.755378723144531, "global_step": 145072, "epoch": 3454} {"train_loss": -6.630774021148682, "global_step": 145073, "epoch": 3454} {"train_loss": -6.7571120262146, "global_step": 145074, "epoch": 3454} {"train_loss": -6.734072685241699, "global_step": 145075, "epoch": 3454} {"train_loss": -6.749871253967285, "global_step": 145076, "epoch": 3454} {"train_loss": -6.879822254180908, "global_step": 145077, "epoch": 3454} {"train_loss": -6.66424560546875, "global_step": 145078, "epoch": 3454} {"train_loss": -6.86822509765625, "global_step": 145079, "epoch": 3454} {"train_loss": -6.835288047790527, "global_step": 145080, "epoch": 3454} {"train_loss": -6.8052544593811035, "global_step": 145081, "epoch": 3454} {"train_loss": -6.752171993255615, "global_step": 145082, "epoch": 3454} {"train_loss": -6.8559465408325195, "global_step": 145083, "epoch": 3454} {"train_loss": -6.936730861663818, "global_step": 145084, "epoch": 3454} {"train_loss": -6.89854621887207, "global_step": 145085, "epoch": 3454} {"train_loss": -6.9260759353637695, "global_step": 145086, "epoch": 3454} {"train_loss": -6.833098411560059, "global_step": 145087, "epoch": 3454} {"train_loss": -6.868873119354248, "global_step": 145088, "epoch": 3454} {"train_loss": -6.8278961181640625, "global_step": 145089, "epoch": 3454} {"train_loss": -6.865564346313477, "global_step": 145090, "epoch": 3454} {"train_loss": -6.921300411224365, "global_step": 145091, "epoch": 3454} {"train_loss": -6.752435684204102, "global_step": 145092, "epoch": 3454} {"train_loss": -6.723453044891357, "global_step": 145093, "epoch": 3454} {"train_loss": -6.856266021728516, "global_step": 145094, "epoch": 3454} {"train_loss": -6.868112564086914, "global_step": 145095, "epoch": 3454} {"train_loss": -6.816689491271973, "global_step": 145096, "epoch": 3454} {"train_loss": -6.89797306060791, "global_step": 145097, "epoch": 3454} {"train_loss": -6.79384708404541, "global_step": 145098, "epoch": 3454} {"train_loss": -6.908719062805176, "global_step": 145099, "epoch": 3454} {"train_loss": -6.786304950714111, "global_step": 145100, "epoch": 3454} {"train_loss": -6.786843299865723, "global_step": 145101, "epoch": 3454} {"train_loss": -6.846611499786377, "global_step": 145102, "epoch": 3454} {"train_loss": -6.768840789794922, "global_step": 145103, "epoch": 3454} {"train_loss": -6.881302833557129, "global_step": 145104, "epoch": 3454} {"train_loss": -6.756133079528809, "global_step": 145105, "epoch": 3454} {"train_loss": -6.831080913543701, "global_step": 145106, "epoch": 3454} {"train_loss": -6.810855865478516, "global_step": 145107, "epoch": 3454} {"train_loss": -6.710999488830566, "global_step": 145108, "epoch": 3454} {"train_loss": -6.812658809480213, "global_step": 145109, "epoch": 3454, "val_loss": 67649.0703125} {"train_loss": -6.7927565574646, "global_step": 145110, "epoch": 3455} {"train_loss": -6.739663600921631, "global_step": 145111, "epoch": 3455} {"train_loss": -6.81895112991333, "global_step": 145112, "epoch": 3455} {"train_loss": -6.79097843170166, "global_step": 145113, "epoch": 3455} {"train_loss": -6.822835922241211, "global_step": 145114, "epoch": 3455} {"train_loss": -6.899796485900879, "global_step": 145115, "epoch": 3455} {"train_loss": -6.841546058654785, "global_step": 145116, "epoch": 3455} {"train_loss": -6.826524257659912, "global_step": 145117, "epoch": 3455} {"train_loss": -6.896677017211914, "global_step": 145118, "epoch": 3455} {"train_loss": -6.87973690032959, "global_step": 145119, "epoch": 3455} {"train_loss": -6.868361473083496, "global_step": 145120, "epoch": 3455} {"train_loss": -6.7808918952941895, "global_step": 145121, "epoch": 3455} {"train_loss": -6.833104133605957, "global_step": 145122, "epoch": 3455} {"train_loss": -6.831363677978516, "global_step": 145123, "epoch": 3455} {"train_loss": -6.849782943725586, "global_step": 145124, "epoch": 3455} {"train_loss": -6.871667861938477, "global_step": 145125, "epoch": 3455} {"train_loss": -6.8086700439453125, "global_step": 145126, "epoch": 3455} {"train_loss": -6.890533447265625, "global_step": 145127, "epoch": 3455} {"train_loss": -6.80695104598999, "global_step": 145128, "epoch": 3455} {"train_loss": -6.741176128387451, "global_step": 145129, "epoch": 3455} {"train_loss": -6.941657066345215, "global_step": 145130, "epoch": 3455} {"train_loss": -6.884133338928223, "global_step": 145131, "epoch": 3455} {"train_loss": -7.012197017669678, "global_step": 145132, "epoch": 3455} {"train_loss": -6.836884021759033, "global_step": 145133, "epoch": 3455} {"train_loss": -6.918510437011719, "global_step": 145134, "epoch": 3455} {"train_loss": -6.890567779541016, "global_step": 145135, "epoch": 3455} {"train_loss": -6.881522178649902, "global_step": 145136, "epoch": 3455} {"train_loss": -6.8546833992004395, "global_step": 145137, "epoch": 3455} {"train_loss": -6.866415023803711, "global_step": 145138, "epoch": 3455} {"train_loss": -6.770247936248779, "global_step": 145139, "epoch": 3455} {"train_loss": -6.744403839111328, "global_step": 145140, "epoch": 3455} {"train_loss": -6.780816555023193, "global_step": 145141, "epoch": 3455} {"train_loss": -6.7461347579956055, "global_step": 145142, "epoch": 3455} {"train_loss": -6.917683124542236, "global_step": 145143, "epoch": 3455} {"train_loss": -6.580389022827148, "global_step": 145144, "epoch": 3455} {"train_loss": -6.862037658691406, "global_step": 145145, "epoch": 3455} {"train_loss": -6.781223297119141, "global_step": 145146, "epoch": 3455} {"train_loss": -6.606454849243164, "global_step": 145147, "epoch": 3455} {"train_loss": -6.831238746643066, "global_step": 145148, "epoch": 3455} {"train_loss": -6.710942268371582, "global_step": 145149, "epoch": 3455} {"train_loss": -6.6507568359375, "global_step": 145150, "epoch": 3455} {"train_loss": -6.8215872673761275, "global_step": 145151, "epoch": 3455, "val_loss": 67889.015625} {"train_loss": -6.743082523345947, "global_step": 145152, "epoch": 3456} {"train_loss": -6.803642272949219, "global_step": 145153, "epoch": 3456} {"train_loss": -6.8272929191589355, "global_step": 145154, "epoch": 3456} {"train_loss": -6.79261589050293, "global_step": 145155, "epoch": 3456} {"train_loss": -6.739686965942383, "global_step": 145156, "epoch": 3456} {"train_loss": -6.752999782562256, "global_step": 145157, "epoch": 3456} {"train_loss": -6.819035530090332, "global_step": 145158, "epoch": 3456} {"train_loss": -6.732481002807617, "global_step": 145159, "epoch": 3456} {"train_loss": -6.780755996704102, "global_step": 145160, "epoch": 3456} {"train_loss": -6.875546455383301, "global_step": 145161, "epoch": 3456} {"train_loss": -6.714422225952148, "global_step": 145162, "epoch": 3456} {"train_loss": -6.760587692260742, "global_step": 145163, "epoch": 3456} {"train_loss": -6.71534538269043, "global_step": 145164, "epoch": 3456} {"train_loss": -6.78680419921875, "global_step": 145165, "epoch": 3456} {"train_loss": -6.716714382171631, "global_step": 145166, "epoch": 3456} {"train_loss": -6.767142295837402, "global_step": 145167, "epoch": 3456} {"train_loss": -6.698653697967529, "global_step": 145168, "epoch": 3456} {"train_loss": -6.730766773223877, "global_step": 145169, "epoch": 3456} {"train_loss": -6.737078666687012, "global_step": 145170, "epoch": 3456} {"train_loss": -6.809877872467041, "global_step": 145171, "epoch": 3456} {"train_loss": -6.837106704711914, "global_step": 145172, "epoch": 3456} {"train_loss": -6.827008247375488, "global_step": 145173, "epoch": 3456} {"train_loss": -6.821625709533691, "global_step": 145174, "epoch": 3456} {"train_loss": -6.71687126159668, "global_step": 145175, "epoch": 3456} {"train_loss": -6.743862628936768, "global_step": 145176, "epoch": 3456} {"train_loss": -6.755866050720215, "global_step": 145177, "epoch": 3456} {"train_loss": -6.808727264404297, "global_step": 145178, "epoch": 3456} {"train_loss": -6.688692092895508, "global_step": 145179, "epoch": 3456} {"train_loss": -6.84085750579834, "global_step": 145180, "epoch": 3456} {"train_loss": -6.798616409301758, "global_step": 145181, "epoch": 3456} {"train_loss": -6.690485000610352, "global_step": 145182, "epoch": 3456} {"train_loss": -6.803680419921875, "global_step": 145183, "epoch": 3456} {"train_loss": -6.900321006774902, "global_step": 145184, "epoch": 3456} {"train_loss": -6.74819803237915, "global_step": 145185, "epoch": 3456} {"train_loss": -6.853890419006348, "global_step": 145186, "epoch": 3456} {"train_loss": -6.755167007446289, "global_step": 145187, "epoch": 3456} {"train_loss": -6.853474140167236, "global_step": 145188, "epoch": 3456} {"train_loss": -6.836169242858887, "global_step": 145189, "epoch": 3456} {"train_loss": -6.852651596069336, "global_step": 145190, "epoch": 3456} {"train_loss": -6.774340629577637, "global_step": 145191, "epoch": 3456} {"train_loss": -6.890122413635254, "global_step": 145192, "epoch": 3456} {"train_loss": -6.782639594305129, "global_step": 145193, "epoch": 3456, "val_loss": 67598.6484375} {"train_loss": -6.770909309387207, "global_step": 145194, "epoch": 3457} {"train_loss": -6.780252456665039, "global_step": 145195, "epoch": 3457} {"train_loss": -6.810174942016602, "global_step": 145196, "epoch": 3457} {"train_loss": -6.968530654907227, "global_step": 145197, "epoch": 3457} {"train_loss": -6.869874954223633, "global_step": 145198, "epoch": 3457} {"train_loss": -6.79883337020874, "global_step": 145199, "epoch": 3457} {"train_loss": -6.833774566650391, "global_step": 145200, "epoch": 3457} {"train_loss": -6.934237480163574, "global_step": 145201, "epoch": 3457} {"train_loss": -6.907835483551025, "global_step": 145202, "epoch": 3457} {"train_loss": -6.7782087326049805, "global_step": 145203, "epoch": 3457} {"train_loss": -6.785168647766113, "global_step": 145204, "epoch": 3457} {"train_loss": -6.846803665161133, "global_step": 145205, "epoch": 3457} {"train_loss": -6.776071548461914, "global_step": 145206, "epoch": 3457} {"train_loss": -6.766661167144775, "global_step": 145207, "epoch": 3457} {"train_loss": -6.841930389404297, "global_step": 145208, "epoch": 3457} {"train_loss": -6.882297515869141, "global_step": 145209, "epoch": 3457} {"train_loss": -6.78358793258667, "global_step": 145210, "epoch": 3457} {"train_loss": -6.934840202331543, "global_step": 145211, "epoch": 3457} {"train_loss": -6.711431503295898, "global_step": 145212, "epoch": 3457} {"train_loss": -6.801828384399414, "global_step": 145213, "epoch": 3457} {"train_loss": -6.866184711456299, "global_step": 145214, "epoch": 3457} {"train_loss": -6.771025657653809, "global_step": 145215, "epoch": 3457} {"train_loss": -6.650187969207764, "global_step": 145216, "epoch": 3457} {"train_loss": -6.715271472930908, "global_step": 145217, "epoch": 3457} {"train_loss": -6.783807754516602, "global_step": 145218, "epoch": 3457} {"train_loss": -6.651498317718506, "global_step": 145219, "epoch": 3457} {"train_loss": -6.821037292480469, "global_step": 145220, "epoch": 3457} {"train_loss": -6.712942600250244, "global_step": 145221, "epoch": 3457} {"train_loss": -6.863514423370361, "global_step": 145222, "epoch": 3457} {"train_loss": -6.8274126052856445, "global_step": 145223, "epoch": 3457} {"train_loss": -6.759587287902832, "global_step": 145224, "epoch": 3457} {"train_loss": -6.903546333312988, "global_step": 145225, "epoch": 3457} {"train_loss": -6.797003746032715, "global_step": 145226, "epoch": 3457} {"train_loss": -6.933698654174805, "global_step": 145227, "epoch": 3457} {"train_loss": -6.808079719543457, "global_step": 145228, "epoch": 3457} {"train_loss": -6.789114952087402, "global_step": 145229, "epoch": 3457} {"train_loss": -6.8236236572265625, "global_step": 145230, "epoch": 3457} {"train_loss": -6.841694355010986, "global_step": 145231, "epoch": 3457} {"train_loss": -6.916839122772217, "global_step": 145232, "epoch": 3457} {"train_loss": -6.87363338470459, "global_step": 145233, "epoch": 3457} {"train_loss": -6.791882514953613, "global_step": 145234, "epoch": 3457} {"train_loss": -6.814985082263038, "global_step": 145235, "epoch": 3457, "val_loss": 67521.078125} {"train_loss": -6.906473159790039, "global_step": 145236, "epoch": 3458} {"train_loss": -6.856330871582031, "global_step": 145237, "epoch": 3458} {"train_loss": -6.830765724182129, "global_step": 145238, "epoch": 3458} {"train_loss": -6.891297340393066, "global_step": 145239, "epoch": 3458} {"train_loss": -6.802845001220703, "global_step": 145240, "epoch": 3458} {"train_loss": -6.7781171798706055, "global_step": 145241, "epoch": 3458} {"train_loss": -6.85223913192749, "global_step": 145242, "epoch": 3458} {"train_loss": -6.802407264709473, "global_step": 145243, "epoch": 3458} {"train_loss": -6.870984077453613, "global_step": 145244, "epoch": 3458} {"train_loss": -6.7939043045043945, "global_step": 145245, "epoch": 3458} {"train_loss": -6.941736221313477, "global_step": 145246, "epoch": 3458} {"train_loss": -6.882446765899658, "global_step": 145247, "epoch": 3458} {"train_loss": -6.772089958190918, "global_step": 145248, "epoch": 3458} {"train_loss": -6.869144439697266, "global_step": 145249, "epoch": 3458} {"train_loss": -6.717247009277344, "global_step": 145250, "epoch": 3458} {"train_loss": -6.615994453430176, "global_step": 145251, "epoch": 3458} {"train_loss": -6.772932052612305, "global_step": 145252, "epoch": 3458} {"train_loss": -6.786183834075928, "global_step": 145253, "epoch": 3458} {"train_loss": -6.616840362548828, "global_step": 145254, "epoch": 3458} {"train_loss": -6.812305450439453, "global_step": 145255, "epoch": 3458} {"train_loss": -6.734121322631836, "global_step": 145256, "epoch": 3458} {"train_loss": -6.655339241027832, "global_step": 145257, "epoch": 3458} {"train_loss": -6.71236515045166, "global_step": 145258, "epoch": 3458} {"train_loss": -6.671667098999023, "global_step": 145259, "epoch": 3458} {"train_loss": -6.725747108459473, "global_step": 145260, "epoch": 3458} {"train_loss": -6.6904497146606445, "global_step": 145261, "epoch": 3458} {"train_loss": -6.621367931365967, "global_step": 145262, "epoch": 3458} {"train_loss": -6.629393100738525, "global_step": 145263, "epoch": 3458} {"train_loss": -6.744618892669678, "global_step": 145264, "epoch": 3458} {"train_loss": -6.7795867919921875, "global_step": 145265, "epoch": 3458} {"train_loss": -6.750887870788574, "global_step": 145266, "epoch": 3458} {"train_loss": -6.867970943450928, "global_step": 145267, "epoch": 3458} {"train_loss": -6.7867112159729, "global_step": 145268, "epoch": 3458} {"train_loss": -6.767652988433838, "global_step": 145269, "epoch": 3458} {"train_loss": -6.798929214477539, "global_step": 145270, "epoch": 3458} {"train_loss": -6.776762008666992, "global_step": 145271, "epoch": 3458} {"train_loss": -6.782249450683594, "global_step": 145272, "epoch": 3458} {"train_loss": -6.71314001083374, "global_step": 145273, "epoch": 3458} {"train_loss": -6.786749839782715, "global_step": 145274, "epoch": 3458} {"train_loss": -6.771160125732422, "global_step": 145275, "epoch": 3458} {"train_loss": -6.792734146118164, "global_step": 145276, "epoch": 3458} {"train_loss": -6.774615492139544, "global_step": 145277, "epoch": 3458, "val_loss": 67440.578125} {"train_loss": -6.7343339920043945, "global_step": 145278, "epoch": 3459} {"train_loss": -6.783266544342041, "global_step": 145279, "epoch": 3459} {"train_loss": -6.6974992752075195, "global_step": 145280, "epoch": 3459} {"train_loss": -6.66077995300293, "global_step": 145281, "epoch": 3459} {"train_loss": -6.830501079559326, "global_step": 145282, "epoch": 3459} {"train_loss": -6.574961185455322, "global_step": 145283, "epoch": 3459} {"train_loss": -6.532410621643066, "global_step": 145284, "epoch": 3459} {"train_loss": -6.907830238342285, "global_step": 145285, "epoch": 3459} {"train_loss": -6.463936805725098, "global_step": 145286, "epoch": 3459} {"train_loss": -6.66859769821167, "global_step": 145287, "epoch": 3459} {"train_loss": -6.7001237869262695, "global_step": 145288, "epoch": 3459} {"train_loss": -6.8025665283203125, "global_step": 145289, "epoch": 3459} {"train_loss": -6.714371681213379, "global_step": 145290, "epoch": 3459} {"train_loss": -6.815442085266113, "global_step": 145291, "epoch": 3459} {"train_loss": -6.669313907623291, "global_step": 145292, "epoch": 3459} {"train_loss": -6.769840240478516, "global_step": 145293, "epoch": 3459} {"train_loss": -6.743583679199219, "global_step": 145294, "epoch": 3459} {"train_loss": -6.7397141456604, "global_step": 145295, "epoch": 3459} {"train_loss": -6.787678241729736, "global_step": 145296, "epoch": 3459} {"train_loss": -6.762866020202637, "global_step": 145297, "epoch": 3459} {"train_loss": -6.798268795013428, "global_step": 145298, "epoch": 3459} {"train_loss": -6.757302284240723, "global_step": 145299, "epoch": 3459} {"train_loss": -6.813694953918457, "global_step": 145300, "epoch": 3459} {"train_loss": -6.815445899963379, "global_step": 145301, "epoch": 3459} {"train_loss": -6.646923065185547, "global_step": 145302, "epoch": 3459} {"train_loss": -6.8331499099731445, "global_step": 145303, "epoch": 3459} {"train_loss": -6.8926191329956055, "global_step": 145304, "epoch": 3459} {"train_loss": -6.734710693359375, "global_step": 145305, "epoch": 3459} {"train_loss": -6.783596038818359, "global_step": 145306, "epoch": 3459} {"train_loss": -6.815074920654297, "global_step": 145307, "epoch": 3459} {"train_loss": -6.824262619018555, "global_step": 145308, "epoch": 3459} {"train_loss": -6.879793167114258, "global_step": 145309, "epoch": 3459} {"train_loss": -6.810072898864746, "global_step": 145310, "epoch": 3459} {"train_loss": -6.832625389099121, "global_step": 145311, "epoch": 3459} {"train_loss": -6.773244857788086, "global_step": 145312, "epoch": 3459} {"train_loss": -6.781991958618164, "global_step": 145313, "epoch": 3459} {"train_loss": -6.789772033691406, "global_step": 145314, "epoch": 3459} {"train_loss": -6.681580543518066, "global_step": 145315, "epoch": 3459} {"train_loss": -6.8325629234313965, "global_step": 145316, "epoch": 3459} {"train_loss": -6.819768905639648, "global_step": 145317, "epoch": 3459} {"train_loss": -6.819173336029053, "global_step": 145318, "epoch": 3459} {"train_loss": -6.760196015948341, "global_step": 145319, "epoch": 3459, "val_loss": 67488.734375} {"train_loss": -6.84811544418335, "global_step": 145320, "epoch": 3460} {"train_loss": -6.782503128051758, "global_step": 145321, "epoch": 3460} {"train_loss": -6.8738603591918945, "global_step": 145322, "epoch": 3460} {"train_loss": -6.841948509216309, "global_step": 145323, "epoch": 3460} {"train_loss": -6.78053617477417, "global_step": 145324, "epoch": 3460} {"train_loss": -6.764074802398682, "global_step": 145325, "epoch": 3460} {"train_loss": -6.848236083984375, "global_step": 145326, "epoch": 3460} {"train_loss": -6.76933479309082, "global_step": 145327, "epoch": 3460} {"train_loss": -6.774202346801758, "global_step": 145328, "epoch": 3460} {"train_loss": -6.826943397521973, "global_step": 145329, "epoch": 3460} {"train_loss": -6.83284330368042, "global_step": 145330, "epoch": 3460} {"train_loss": -6.683662414550781, "global_step": 145331, "epoch": 3460} {"train_loss": -6.974403381347656, "global_step": 145332, "epoch": 3460} {"train_loss": -6.8202972412109375, "global_step": 145333, "epoch": 3460} {"train_loss": -6.856823921203613, "global_step": 145334, "epoch": 3460} {"train_loss": -6.833410739898682, "global_step": 145335, "epoch": 3460} {"train_loss": -6.697892189025879, "global_step": 145336, "epoch": 3460} {"train_loss": -6.9333600997924805, "global_step": 145337, "epoch": 3460} {"train_loss": -6.752185821533203, "global_step": 145338, "epoch": 3460} {"train_loss": -6.811988353729248, "global_step": 145339, "epoch": 3460} {"train_loss": -6.857726573944092, "global_step": 145340, "epoch": 3460} {"train_loss": -6.836695671081543, "global_step": 145341, "epoch": 3460} {"train_loss": -6.7675089836120605, "global_step": 145342, "epoch": 3460} {"train_loss": -6.758791923522949, "global_step": 145343, "epoch": 3460} {"train_loss": -6.839648723602295, "global_step": 145344, "epoch": 3460} {"train_loss": -6.8463592529296875, "global_step": 145345, "epoch": 3460} {"train_loss": -6.836766242980957, "global_step": 145346, "epoch": 3460} {"train_loss": -6.8667755126953125, "global_step": 145347, "epoch": 3460} {"train_loss": -6.8623247146606445, "global_step": 145348, "epoch": 3460} {"train_loss": -6.737098693847656, "global_step": 145349, "epoch": 3460} {"train_loss": -6.882962226867676, "global_step": 145350, "epoch": 3460} {"train_loss": -6.881037712097168, "global_step": 145351, "epoch": 3460} {"train_loss": -6.913455009460449, "global_step": 145352, "epoch": 3460} {"train_loss": -6.906027793884277, "global_step": 145353, "epoch": 3460} {"train_loss": -6.9464111328125, "global_step": 145354, "epoch": 3460} {"train_loss": -6.881627559661865, "global_step": 145355, "epoch": 3460} {"train_loss": -6.861365795135498, "global_step": 145356, "epoch": 3460} {"train_loss": -6.801059722900391, "global_step": 145357, "epoch": 3460} {"train_loss": -6.990606307983398, "global_step": 145358, "epoch": 3460} {"train_loss": -6.883070945739746, "global_step": 145359, "epoch": 3460} {"train_loss": -6.873836517333984, "global_step": 145360, "epoch": 3460} {"train_loss": -6.835005374181838, "global_step": 145361, "epoch": 3460, "val_loss": 67591.140625} {"train_loss": -6.776387691497803, "global_step": 145362, "epoch": 3461} {"train_loss": -6.909445762634277, "global_step": 145363, "epoch": 3461} {"train_loss": -6.729497909545898, "global_step": 145364, "epoch": 3461} {"train_loss": -6.8128557205200195, "global_step": 145365, "epoch": 3461} {"train_loss": -6.831226348876953, "global_step": 145366, "epoch": 3461} {"train_loss": -6.911106109619141, "global_step": 145367, "epoch": 3461} {"train_loss": -6.859530448913574, "global_step": 145368, "epoch": 3461} {"train_loss": -6.910559177398682, "global_step": 145369, "epoch": 3461} {"train_loss": -6.82406759262085, "global_step": 145370, "epoch": 3461} {"train_loss": -6.8250837326049805, "global_step": 145371, "epoch": 3461} {"train_loss": -6.753429412841797, "global_step": 145372, "epoch": 3461} {"train_loss": -6.913269996643066, "global_step": 145373, "epoch": 3461} {"train_loss": -6.872179985046387, "global_step": 145374, "epoch": 3461} {"train_loss": -6.892298698425293, "global_step": 145375, "epoch": 3461} {"train_loss": -6.92882776260376, "global_step": 145376, "epoch": 3461} {"train_loss": -6.796551704406738, "global_step": 145377, "epoch": 3461} {"train_loss": -6.850351810455322, "global_step": 145378, "epoch": 3461} {"train_loss": -6.783612251281738, "global_step": 145379, "epoch": 3461} {"train_loss": -6.877426624298096, "global_step": 145380, "epoch": 3461} {"train_loss": -6.814797401428223, "global_step": 145381, "epoch": 3461} {"train_loss": -6.8434295654296875, "global_step": 145382, "epoch": 3461} {"train_loss": -6.833526611328125, "global_step": 145383, "epoch": 3461} {"train_loss": -6.798680305480957, "global_step": 145384, "epoch": 3461} {"train_loss": -6.858175277709961, "global_step": 145385, "epoch": 3461} {"train_loss": -6.850863933563232, "global_step": 145386, "epoch": 3461} {"train_loss": -6.814699649810791, "global_step": 145387, "epoch": 3461} {"train_loss": -6.790082931518555, "global_step": 145388, "epoch": 3461} {"train_loss": -6.869165420532227, "global_step": 145389, "epoch": 3461} {"train_loss": -6.8116374015808105, "global_step": 145390, "epoch": 3461} {"train_loss": -6.943323135375977, "global_step": 145391, "epoch": 3461} {"train_loss": -6.910167694091797, "global_step": 145392, "epoch": 3461} {"train_loss": -6.757198333740234, "global_step": 145393, "epoch": 3461} {"train_loss": -6.869978904724121, "global_step": 145394, "epoch": 3461} {"train_loss": -6.933193683624268, "global_step": 145395, "epoch": 3461} {"train_loss": -6.790053367614746, "global_step": 145396, "epoch": 3461} {"train_loss": -6.910687446594238, "global_step": 145397, "epoch": 3461} {"train_loss": -6.926072120666504, "global_step": 145398, "epoch": 3461} {"train_loss": -6.8690690994262695, "global_step": 145399, "epoch": 3461} {"train_loss": -6.838484764099121, "global_step": 145400, "epoch": 3461} {"train_loss": -6.783811569213867, "global_step": 145401, "epoch": 3461} {"train_loss": -6.827883720397949, "global_step": 145402, "epoch": 3461} {"train_loss": -6.848330032257807, "global_step": 145403, "epoch": 3461, "val_loss": 67587.421875} {"train_loss": -6.895521640777588, "global_step": 145404, "epoch": 3462} {"train_loss": -6.838092803955078, "global_step": 145405, "epoch": 3462} {"train_loss": -6.910623550415039, "global_step": 145406, "epoch": 3462} {"train_loss": -6.853252410888672, "global_step": 145407, "epoch": 3462} {"train_loss": -6.827320098876953, "global_step": 145408, "epoch": 3462} {"train_loss": -6.921232223510742, "global_step": 145409, "epoch": 3462} {"train_loss": -6.839205741882324, "global_step": 145410, "epoch": 3462} {"train_loss": -6.797398567199707, "global_step": 145411, "epoch": 3462} {"train_loss": -6.755805015563965, "global_step": 145412, "epoch": 3462} {"train_loss": -6.868027687072754, "global_step": 145413, "epoch": 3462} {"train_loss": -6.785928726196289, "global_step": 145414, "epoch": 3462} {"train_loss": -6.717404842376709, "global_step": 145415, "epoch": 3462} {"train_loss": -6.859612464904785, "global_step": 145416, "epoch": 3462} {"train_loss": -6.976966857910156, "global_step": 145417, "epoch": 3462} {"train_loss": -6.636489391326904, "global_step": 145418, "epoch": 3462} {"train_loss": -6.751659393310547, "global_step": 145419, "epoch": 3462} {"train_loss": -6.703726291656494, "global_step": 145420, "epoch": 3462} {"train_loss": -6.773517608642578, "global_step": 145421, "epoch": 3462} {"train_loss": -6.801707744598389, "global_step": 145422, "epoch": 3462} {"train_loss": -6.886478424072266, "global_step": 145423, "epoch": 3462} {"train_loss": -6.885025501251221, "global_step": 145424, "epoch": 3462} {"train_loss": -6.811042785644531, "global_step": 145425, "epoch": 3462} {"train_loss": -6.7081756591796875, "global_step": 145426, "epoch": 3462} {"train_loss": -6.769533157348633, "global_step": 145427, "epoch": 3462} {"train_loss": -6.633522033691406, "global_step": 145428, "epoch": 3462} {"train_loss": -6.846380233764648, "global_step": 145429, "epoch": 3462} {"train_loss": -6.819263458251953, "global_step": 145430, "epoch": 3462} {"train_loss": -6.877505302429199, "global_step": 145431, "epoch": 3462} {"train_loss": -6.802505970001221, "global_step": 145432, "epoch": 3462} {"train_loss": -6.7299089431762695, "global_step": 145433, "epoch": 3462} {"train_loss": -6.857238292694092, "global_step": 145434, "epoch": 3462} {"train_loss": -6.800083160400391, "global_step": 145435, "epoch": 3462} {"train_loss": -6.755397319793701, "global_step": 145436, "epoch": 3462} {"train_loss": -6.856459140777588, "global_step": 145437, "epoch": 3462} {"train_loss": -6.713133335113525, "global_step": 145438, "epoch": 3462} {"train_loss": -6.831393241882324, "global_step": 145439, "epoch": 3462} {"train_loss": -6.882387161254883, "global_step": 145440, "epoch": 3462} {"train_loss": -6.816976547241211, "global_step": 145441, "epoch": 3462} {"train_loss": -6.896736145019531, "global_step": 145442, "epoch": 3462} {"train_loss": -6.9286699295043945, "global_step": 145443, "epoch": 3462} {"train_loss": -6.813107013702393, "global_step": 145444, "epoch": 3462} {"train_loss": -6.815551644279843, "global_step": 145445, "epoch": 3462, "val_loss": 67592.8125} {"train_loss": -6.870469570159912, "global_step": 145446, "epoch": 3463} {"train_loss": -6.846458435058594, "global_step": 145447, "epoch": 3463} {"train_loss": -6.827900409698486, "global_step": 145448, "epoch": 3463} {"train_loss": -6.868852615356445, "global_step": 145449, "epoch": 3463} {"train_loss": -6.7856526374816895, "global_step": 145450, "epoch": 3463} {"train_loss": -6.837284088134766, "global_step": 145451, "epoch": 3463} {"train_loss": -6.889405250549316, "global_step": 145452, "epoch": 3463} {"train_loss": -6.821975231170654, "global_step": 145453, "epoch": 3463} {"train_loss": -6.913460731506348, "global_step": 145454, "epoch": 3463} {"train_loss": -6.872134208679199, "global_step": 145455, "epoch": 3463} {"train_loss": -6.804062366485596, "global_step": 145456, "epoch": 3463} {"train_loss": -6.9328837394714355, "global_step": 145457, "epoch": 3463} {"train_loss": -6.842254638671875, "global_step": 145458, "epoch": 3463} {"train_loss": -6.783615589141846, "global_step": 145459, "epoch": 3463} {"train_loss": -6.803312301635742, "global_step": 145460, "epoch": 3463} {"train_loss": -6.722165107727051, "global_step": 145461, "epoch": 3463} {"train_loss": -6.813832759857178, "global_step": 145462, "epoch": 3463} {"train_loss": -6.769333839416504, "global_step": 145463, "epoch": 3463} {"train_loss": -6.754644393920898, "global_step": 145464, "epoch": 3463} {"train_loss": -6.736866474151611, "global_step": 145465, "epoch": 3463} {"train_loss": -6.712002754211426, "global_step": 145466, "epoch": 3463} {"train_loss": -6.894916534423828, "global_step": 145467, "epoch": 3463} {"train_loss": -6.750153541564941, "global_step": 145468, "epoch": 3463} {"train_loss": -6.769064903259277, "global_step": 145469, "epoch": 3463} {"train_loss": -6.716568946838379, "global_step": 145470, "epoch": 3463} {"train_loss": -6.672461986541748, "global_step": 145471, "epoch": 3463} {"train_loss": -6.893538475036621, "global_step": 145472, "epoch": 3463} {"train_loss": -6.858071804046631, "global_step": 145473, "epoch": 3463} {"train_loss": -6.66548490524292, "global_step": 145474, "epoch": 3463} {"train_loss": -6.818431854248047, "global_step": 145475, "epoch": 3463} {"train_loss": -6.71286678314209, "global_step": 145476, "epoch": 3463} {"train_loss": -6.742846488952637, "global_step": 145477, "epoch": 3463} {"train_loss": -6.881819725036621, "global_step": 145478, "epoch": 3463} {"train_loss": -6.847394943237305, "global_step": 145479, "epoch": 3463} {"train_loss": -6.799249172210693, "global_step": 145480, "epoch": 3463} {"train_loss": -6.767960071563721, "global_step": 145481, "epoch": 3463} {"train_loss": -6.8206634521484375, "global_step": 145482, "epoch": 3463} {"train_loss": -6.8440728187561035, "global_step": 145483, "epoch": 3463} {"train_loss": -6.656579494476318, "global_step": 145484, "epoch": 3463} {"train_loss": -6.788967132568359, "global_step": 145485, "epoch": 3463} {"train_loss": -6.835020542144775, "global_step": 145486, "epoch": 3463} {"train_loss": -6.798508859816051, "global_step": 145487, "epoch": 3463, "val_loss": 67680.625} {"train_loss": -6.802095413208008, "global_step": 145488, "epoch": 3464} {"train_loss": -6.670212268829346, "global_step": 145489, "epoch": 3464} {"train_loss": -6.784793376922607, "global_step": 145490, "epoch": 3464} {"train_loss": -6.8129191398620605, "global_step": 145491, "epoch": 3464} {"train_loss": -6.773907661437988, "global_step": 145492, "epoch": 3464} {"train_loss": -6.886364459991455, "global_step": 145493, "epoch": 3464} {"train_loss": -6.684027671813965, "global_step": 145494, "epoch": 3464} {"train_loss": -6.664860725402832, "global_step": 145495, "epoch": 3464} {"train_loss": -6.8571014404296875, "global_step": 145496, "epoch": 3464} {"train_loss": -6.754790306091309, "global_step": 145497, "epoch": 3464} {"train_loss": -6.821298599243164, "global_step": 145498, "epoch": 3464} {"train_loss": -6.785563945770264, "global_step": 145499, "epoch": 3464} {"train_loss": -6.876121520996094, "global_step": 145500, "epoch": 3464} {"train_loss": -6.893301963806152, "global_step": 145501, "epoch": 3464} {"train_loss": -6.817177772521973, "global_step": 145502, "epoch": 3464} {"train_loss": -6.7784576416015625, "global_step": 145503, "epoch": 3464} {"train_loss": -6.706431865692139, "global_step": 145504, "epoch": 3464} {"train_loss": -6.7906293869018555, "global_step": 145505, "epoch": 3464} {"train_loss": -6.853667736053467, "global_step": 145506, "epoch": 3464} {"train_loss": -6.785419464111328, "global_step": 145507, "epoch": 3464} {"train_loss": -6.677738666534424, "global_step": 145508, "epoch": 3464} {"train_loss": -6.75482177734375, "global_step": 145509, "epoch": 3464} {"train_loss": -6.791134357452393, "global_step": 145510, "epoch": 3464} {"train_loss": -6.7666401863098145, "global_step": 145511, "epoch": 3464} {"train_loss": -6.7205705642700195, "global_step": 145512, "epoch": 3464} {"train_loss": -6.697504043579102, "global_step": 145513, "epoch": 3464} {"train_loss": -6.7522478103637695, "global_step": 145514, "epoch": 3464} {"train_loss": -6.765687942504883, "global_step": 145515, "epoch": 3464} {"train_loss": -6.809607028961182, "global_step": 145516, "epoch": 3464} {"train_loss": -6.788007736206055, "global_step": 145517, "epoch": 3464} {"train_loss": -6.797511577606201, "global_step": 145518, "epoch": 3464} {"train_loss": -6.825684547424316, "global_step": 145519, "epoch": 3464} {"train_loss": -6.845616340637207, "global_step": 145520, "epoch": 3464} {"train_loss": -6.821125030517578, "global_step": 145521, "epoch": 3464} {"train_loss": -6.778307914733887, "global_step": 145522, "epoch": 3464} {"train_loss": -6.7442216873168945, "global_step": 145523, "epoch": 3464} {"train_loss": -6.889472961425781, "global_step": 145524, "epoch": 3464} {"train_loss": -6.728569030761719, "global_step": 145525, "epoch": 3464} {"train_loss": -6.841508388519287, "global_step": 145526, "epoch": 3464} {"train_loss": -6.835904121398926, "global_step": 145527, "epoch": 3464} {"train_loss": -6.925260543823242, "global_step": 145528, "epoch": 3464} {"train_loss": -6.791249854224069, "global_step": 145529, "epoch": 3464, "val_loss": 67760.2578125} {"train_loss": -6.836366653442383, "global_step": 145530, "epoch": 3465} {"train_loss": -6.840939521789551, "global_step": 145531, "epoch": 3465} {"train_loss": -6.853164196014404, "global_step": 145532, "epoch": 3465} {"train_loss": -6.858112335205078, "global_step": 145533, "epoch": 3465} {"train_loss": -6.7995219230651855, "global_step": 145534, "epoch": 3465} {"train_loss": -6.924838066101074, "global_step": 145535, "epoch": 3465} {"train_loss": -6.885823726654053, "global_step": 145536, "epoch": 3465} {"train_loss": -6.886768341064453, "global_step": 145537, "epoch": 3465} {"train_loss": -6.864869117736816, "global_step": 145538, "epoch": 3465} {"train_loss": -7.000200271606445, "global_step": 145539, "epoch": 3465} {"train_loss": -6.8371663093566895, "global_step": 145540, "epoch": 3465} {"train_loss": -6.8600544929504395, "global_step": 145541, "epoch": 3465} {"train_loss": -6.8247575759887695, "global_step": 145542, "epoch": 3465} {"train_loss": -6.87216854095459, "global_step": 145543, "epoch": 3465} {"train_loss": -6.9056243896484375, "global_step": 145544, "epoch": 3465} {"train_loss": -6.864105224609375, "global_step": 145545, "epoch": 3465} {"train_loss": -6.866759300231934, "global_step": 145546, "epoch": 3465} {"train_loss": -6.847882270812988, "global_step": 145547, "epoch": 3465} {"train_loss": -6.774112701416016, "global_step": 145548, "epoch": 3465} {"train_loss": -6.85318660736084, "global_step": 145549, "epoch": 3465} {"train_loss": -6.834216117858887, "global_step": 145550, "epoch": 3465} {"train_loss": -6.909085273742676, "global_step": 145551, "epoch": 3465} {"train_loss": -6.785421848297119, "global_step": 145552, "epoch": 3465} {"train_loss": -6.917808532714844, "global_step": 145553, "epoch": 3465} {"train_loss": -6.769526481628418, "global_step": 145554, "epoch": 3465} {"train_loss": -6.819669723510742, "global_step": 145555, "epoch": 3465} {"train_loss": -6.758408069610596, "global_step": 145556, "epoch": 3465} {"train_loss": -6.889865875244141, "global_step": 145557, "epoch": 3465} {"train_loss": -6.89603328704834, "global_step": 145558, "epoch": 3465} {"train_loss": -6.7208380699157715, "global_step": 145559, "epoch": 3465} {"train_loss": -6.786880016326904, "global_step": 145560, "epoch": 3465} {"train_loss": -6.822030067443848, "global_step": 145561, "epoch": 3465} {"train_loss": -6.676326751708984, "global_step": 145562, "epoch": 3465} {"train_loss": -6.73280143737793, "global_step": 145563, "epoch": 3465} {"train_loss": -6.779231071472168, "global_step": 145564, "epoch": 3465} {"train_loss": -6.7230224609375, "global_step": 145565, "epoch": 3465} {"train_loss": -6.786587715148926, "global_step": 145566, "epoch": 3465} {"train_loss": -6.851275444030762, "global_step": 145567, "epoch": 3465} {"train_loss": -6.695150375366211, "global_step": 145568, "epoch": 3465} {"train_loss": -6.819891929626465, "global_step": 145569, "epoch": 3465} {"train_loss": -6.680534362792969, "global_step": 145570, "epoch": 3465} {"train_loss": -6.824877432414463, "global_step": 145571, "epoch": 3465, "val_loss": 67769.1875} {"train_loss": -6.800748825073242, "global_step": 145572, "epoch": 3466} {"train_loss": -6.677364349365234, "global_step": 145573, "epoch": 3466} {"train_loss": -6.780204772949219, "global_step": 145574, "epoch": 3466} {"train_loss": -6.86332368850708, "global_step": 145575, "epoch": 3466} {"train_loss": -6.753936767578125, "global_step": 145576, "epoch": 3466} {"train_loss": -6.780516624450684, "global_step": 145577, "epoch": 3466} {"train_loss": -6.633101463317871, "global_step": 145578, "epoch": 3466} {"train_loss": -6.640692710876465, "global_step": 145579, "epoch": 3466} {"train_loss": -6.686282634735107, "global_step": 145580, "epoch": 3466} {"train_loss": -6.672940254211426, "global_step": 145581, "epoch": 3466} {"train_loss": -6.688131332397461, "global_step": 145582, "epoch": 3466} {"train_loss": -6.671445846557617, "global_step": 145583, "epoch": 3466} {"train_loss": -6.72624397277832, "global_step": 145584, "epoch": 3466} {"train_loss": -6.811333656311035, "global_step": 145585, "epoch": 3466} {"train_loss": -6.5867815017700195, "global_step": 145586, "epoch": 3466} {"train_loss": -6.763367652893066, "global_step": 145587, "epoch": 3466} {"train_loss": -6.74441385269165, "global_step": 145588, "epoch": 3466} {"train_loss": -6.757640838623047, "global_step": 145589, "epoch": 3466} {"train_loss": -6.712800979614258, "global_step": 145590, "epoch": 3466} {"train_loss": -6.758874893188477, "global_step": 145591, "epoch": 3466} {"train_loss": -6.705101013183594, "global_step": 145592, "epoch": 3466} {"train_loss": -6.677659034729004, "global_step": 145593, "epoch": 3466} {"train_loss": -6.807497978210449, "global_step": 145594, "epoch": 3466} {"train_loss": -6.791460037231445, "global_step": 145595, "epoch": 3466} {"train_loss": -6.665920257568359, "global_step": 145596, "epoch": 3466} {"train_loss": -6.851016044616699, "global_step": 145597, "epoch": 3466} {"train_loss": -6.601032257080078, "global_step": 145598, "epoch": 3466} {"train_loss": -6.858319282531738, "global_step": 145599, "epoch": 3466} {"train_loss": -6.6639084815979, "global_step": 145600, "epoch": 3466} {"train_loss": -6.9176483154296875, "global_step": 145601, "epoch": 3466} {"train_loss": -6.745347023010254, "global_step": 145602, "epoch": 3466} {"train_loss": -6.796607971191406, "global_step": 145603, "epoch": 3466} {"train_loss": -6.776048183441162, "global_step": 145604, "epoch": 3466} {"train_loss": -6.788694381713867, "global_step": 145605, "epoch": 3466} {"train_loss": -6.724575042724609, "global_step": 145606, "epoch": 3466} {"train_loss": -6.718255043029785, "global_step": 145607, "epoch": 3466} {"train_loss": -6.897856712341309, "global_step": 145608, "epoch": 3466} {"train_loss": -6.670716762542725, "global_step": 145609, "epoch": 3466} {"train_loss": -6.823361873626709, "global_step": 145610, "epoch": 3466} {"train_loss": -6.757684707641602, "global_step": 145611, "epoch": 3466} {"train_loss": -6.778407096862793, "global_step": 145612, "epoch": 3466} {"train_loss": -6.74721113840739, "global_step": 145613, "epoch": 3466, "val_loss": 67722.1015625} {"train_loss": -6.849062919616699, "global_step": 145614, "epoch": 3467} {"train_loss": -6.983271598815918, "global_step": 145615, "epoch": 3467} {"train_loss": -6.856816291809082, "global_step": 145616, "epoch": 3467} {"train_loss": -6.880954265594482, "global_step": 145617, "epoch": 3467} {"train_loss": -6.875197887420654, "global_step": 145618, "epoch": 3467} {"train_loss": -6.833127975463867, "global_step": 145619, "epoch": 3467} {"train_loss": -6.942793846130371, "global_step": 145620, "epoch": 3467} {"train_loss": -6.775783538818359, "global_step": 145621, "epoch": 3467} {"train_loss": -6.761741638183594, "global_step": 145622, "epoch": 3467} {"train_loss": -6.767337322235107, "global_step": 145623, "epoch": 3467} {"train_loss": -6.831148147583008, "global_step": 145624, "epoch": 3467} {"train_loss": -6.861392498016357, "global_step": 145625, "epoch": 3467} {"train_loss": -6.856926918029785, "global_step": 145626, "epoch": 3467} {"train_loss": -6.6995415687561035, "global_step": 145627, "epoch": 3467} {"train_loss": -6.706567764282227, "global_step": 145628, "epoch": 3467} {"train_loss": -6.726099014282227, "global_step": 145629, "epoch": 3467} {"train_loss": -6.835454940795898, "global_step": 145630, "epoch": 3467} {"train_loss": -6.7780656814575195, "global_step": 145631, "epoch": 3467} {"train_loss": -6.83888578414917, "global_step": 145632, "epoch": 3467} {"train_loss": -6.809347629547119, "global_step": 145633, "epoch": 3467} {"train_loss": -6.822751045227051, "global_step": 145634, "epoch": 3467} {"train_loss": -6.777730941772461, "global_step": 145635, "epoch": 3467} {"train_loss": -6.757656097412109, "global_step": 145636, "epoch": 3467} {"train_loss": -6.772232532501221, "global_step": 145637, "epoch": 3467} {"train_loss": -6.837624549865723, "global_step": 145638, "epoch": 3467} {"train_loss": -6.841104507446289, "global_step": 145639, "epoch": 3467} {"train_loss": -6.774470329284668, "global_step": 145640, "epoch": 3467} {"train_loss": -6.76370906829834, "global_step": 145641, "epoch": 3467} {"train_loss": -6.801041126251221, "global_step": 145642, "epoch": 3467} {"train_loss": -6.666426658630371, "global_step": 145643, "epoch": 3467} {"train_loss": -6.762270927429199, "global_step": 145644, "epoch": 3467} {"train_loss": -6.713230133056641, "global_step": 145645, "epoch": 3467} {"train_loss": -6.7745561599731445, "global_step": 145646, "epoch": 3467} {"train_loss": -6.730965614318848, "global_step": 145647, "epoch": 3467} {"train_loss": -6.778201580047607, "global_step": 145648, "epoch": 3467} {"train_loss": -6.815016746520996, "global_step": 145649, "epoch": 3467} {"train_loss": -6.714015960693359, "global_step": 145650, "epoch": 3467} {"train_loss": -6.752099990844727, "global_step": 145651, "epoch": 3467} {"train_loss": -6.8288164138793945, "global_step": 145652, "epoch": 3467} {"train_loss": -6.773746013641357, "global_step": 145653, "epoch": 3467} {"train_loss": -6.774304389953613, "global_step": 145654, "epoch": 3467} {"train_loss": -6.795676742281232, "global_step": 145655, "epoch": 3467, "val_loss": 67872.4140625} {"train_loss": -6.8201494216918945, "global_step": 145656, "epoch": 3468} {"train_loss": -6.74966287612915, "global_step": 145657, "epoch": 3468} {"train_loss": -6.742733955383301, "global_step": 145658, "epoch": 3468} {"train_loss": -6.7397236824035645, "global_step": 145659, "epoch": 3468} {"train_loss": -6.781931400299072, "global_step": 145660, "epoch": 3468} {"train_loss": -6.7466535568237305, "global_step": 145661, "epoch": 3468} {"train_loss": -6.763570785522461, "global_step": 145662, "epoch": 3468} {"train_loss": -6.8395256996154785, "global_step": 145663, "epoch": 3468} {"train_loss": -6.719735145568848, "global_step": 145664, "epoch": 3468} {"train_loss": -6.673828125, "global_step": 145665, "epoch": 3468} {"train_loss": -6.672499656677246, "global_step": 145666, "epoch": 3468} {"train_loss": -6.764054298400879, "global_step": 145667, "epoch": 3468} {"train_loss": -6.705190181732178, "global_step": 145668, "epoch": 3468} {"train_loss": -6.847041606903076, "global_step": 145669, "epoch": 3468} {"train_loss": -6.793455600738525, "global_step": 145670, "epoch": 3468} {"train_loss": -6.70097017288208, "global_step": 145671, "epoch": 3468} {"train_loss": -6.865886688232422, "global_step": 145672, "epoch": 3468} {"train_loss": -6.6980695724487305, "global_step": 145673, "epoch": 3468} {"train_loss": -6.746245861053467, "global_step": 145674, "epoch": 3468} {"train_loss": -6.840667247772217, "global_step": 145675, "epoch": 3468} {"train_loss": -6.8556904792785645, "global_step": 145676, "epoch": 3468} {"train_loss": -6.816596984863281, "global_step": 145677, "epoch": 3468} {"train_loss": -6.801148414611816, "global_step": 145678, "epoch": 3468} {"train_loss": -6.793036460876465, "global_step": 145679, "epoch": 3468} {"train_loss": -6.735882759094238, "global_step": 145680, "epoch": 3468} {"train_loss": -6.901036262512207, "global_step": 145681, "epoch": 3468} {"train_loss": -6.811622619628906, "global_step": 145682, "epoch": 3468} {"train_loss": -6.873648643493652, "global_step": 145683, "epoch": 3468} {"train_loss": -6.862973213195801, "global_step": 145684, "epoch": 3468} {"train_loss": -6.710139274597168, "global_step": 145685, "epoch": 3468} {"train_loss": -6.827818393707275, "global_step": 145686, "epoch": 3468} {"train_loss": -6.713709354400635, "global_step": 145687, "epoch": 3468} {"train_loss": -6.766002655029297, "global_step": 145688, "epoch": 3468} {"train_loss": -6.795714378356934, "global_step": 145689, "epoch": 3468} {"train_loss": -6.722146987915039, "global_step": 145690, "epoch": 3468} {"train_loss": -6.778206825256348, "global_step": 145691, "epoch": 3468} {"train_loss": -6.702561855316162, "global_step": 145692, "epoch": 3468} {"train_loss": -6.827630043029785, "global_step": 145693, "epoch": 3468} {"train_loss": -6.817196846008301, "global_step": 145694, "epoch": 3468} {"train_loss": -6.84998893737793, "global_step": 145695, "epoch": 3468} {"train_loss": -6.788220405578613, "global_step": 145696, "epoch": 3468} {"train_loss": -6.78251778511774, "global_step": 145697, "epoch": 3468, "val_loss": 67593.5546875} {"train_loss": -6.939166069030762, "global_step": 145698, "epoch": 3469} {"train_loss": -6.828640937805176, "global_step": 145699, "epoch": 3469} {"train_loss": -6.781135559082031, "global_step": 145700, "epoch": 3469} {"train_loss": -6.884171962738037, "global_step": 145701, "epoch": 3469} {"train_loss": -6.823733329772949, "global_step": 145702, "epoch": 3469} {"train_loss": -6.912379741668701, "global_step": 145703, "epoch": 3469} {"train_loss": -6.907611846923828, "global_step": 145704, "epoch": 3469} {"train_loss": -6.874729633331299, "global_step": 145705, "epoch": 3469} {"train_loss": -6.869243144989014, "global_step": 145706, "epoch": 3469} {"train_loss": -6.816595554351807, "global_step": 145707, "epoch": 3469} {"train_loss": -6.844715118408203, "global_step": 145708, "epoch": 3469} {"train_loss": -6.945368766784668, "global_step": 145709, "epoch": 3469} {"train_loss": -6.80845832824707, "global_step": 145710, "epoch": 3469} {"train_loss": -6.799929618835449, "global_step": 145711, "epoch": 3469} {"train_loss": -6.781585216522217, "global_step": 145712, "epoch": 3469} {"train_loss": -6.9332275390625, "global_step": 145713, "epoch": 3469} {"train_loss": -6.790106773376465, "global_step": 145714, "epoch": 3469} {"train_loss": -6.926141262054443, "global_step": 145715, "epoch": 3469} {"train_loss": -6.839897155761719, "global_step": 145716, "epoch": 3469} {"train_loss": -6.761301040649414, "global_step": 145717, "epoch": 3469} {"train_loss": -6.8188066482543945, "global_step": 145718, "epoch": 3469} {"train_loss": -6.782932281494141, "global_step": 145719, "epoch": 3469} {"train_loss": -6.934665679931641, "global_step": 145720, "epoch": 3469} {"train_loss": -6.855016231536865, "global_step": 145721, "epoch": 3469} {"train_loss": -6.880875587463379, "global_step": 145722, "epoch": 3469} {"train_loss": -6.644777297973633, "global_step": 145723, "epoch": 3469} {"train_loss": -6.8194193840026855, "global_step": 145724, "epoch": 3469} {"train_loss": -6.844362258911133, "global_step": 145725, "epoch": 3469} {"train_loss": -6.797630310058594, "global_step": 145726, "epoch": 3469} {"train_loss": -6.763127326965332, "global_step": 145727, "epoch": 3469} {"train_loss": -6.771275520324707, "global_step": 145728, "epoch": 3469} {"train_loss": -6.826104640960693, "global_step": 145729, "epoch": 3469} {"train_loss": -6.781238555908203, "global_step": 145730, "epoch": 3469} {"train_loss": -6.939818382263184, "global_step": 145731, "epoch": 3469} {"train_loss": -6.738101959228516, "global_step": 145732, "epoch": 3469} {"train_loss": -6.7635040283203125, "global_step": 145733, "epoch": 3469} {"train_loss": -6.805139541625977, "global_step": 145734, "epoch": 3469} {"train_loss": -6.8027849197387695, "global_step": 145735, "epoch": 3469} {"train_loss": -6.790048599243164, "global_step": 145736, "epoch": 3469} {"train_loss": -6.677824974060059, "global_step": 145737, "epoch": 3469} {"train_loss": -6.741519927978516, "global_step": 145738, "epoch": 3469} {"train_loss": -6.824487163907006, "global_step": 145739, "epoch": 3469, "val_loss": 67764.796875} {"train_loss": -6.848618507385254, "global_step": 145740, "epoch": 3470} {"train_loss": -6.766354560852051, "global_step": 145741, "epoch": 3470} {"train_loss": -6.841445446014404, "global_step": 145742, "epoch": 3470} {"train_loss": -6.854081630706787, "global_step": 145743, "epoch": 3470} {"train_loss": -6.763437747955322, "global_step": 145744, "epoch": 3470} {"train_loss": -6.9436821937561035, "global_step": 145745, "epoch": 3470} {"train_loss": -6.755500793457031, "global_step": 145746, "epoch": 3470} {"train_loss": -6.764554023742676, "global_step": 145747, "epoch": 3470} {"train_loss": -6.822582244873047, "global_step": 145748, "epoch": 3470} {"train_loss": -6.833268165588379, "global_step": 145749, "epoch": 3470} {"train_loss": -6.78498649597168, "global_step": 145750, "epoch": 3470} {"train_loss": -6.803473472595215, "global_step": 145751, "epoch": 3470} {"train_loss": -6.792533874511719, "global_step": 145752, "epoch": 3470} {"train_loss": -6.834165573120117, "global_step": 145753, "epoch": 3470} {"train_loss": -6.6358642578125, "global_step": 145754, "epoch": 3470} {"train_loss": -6.812406539916992, "global_step": 145755, "epoch": 3470} {"train_loss": -6.775871753692627, "global_step": 145756, "epoch": 3470} {"train_loss": -6.6768903732299805, "global_step": 145757, "epoch": 3470} {"train_loss": -6.707708358764648, "global_step": 145758, "epoch": 3470} {"train_loss": -6.751962661743164, "global_step": 145759, "epoch": 3470} {"train_loss": -6.7976555824279785, "global_step": 145760, "epoch": 3470} {"train_loss": -6.873288154602051, "global_step": 145761, "epoch": 3470} {"train_loss": -6.711596965789795, "global_step": 145762, "epoch": 3470} {"train_loss": -6.770630836486816, "global_step": 145763, "epoch": 3470} {"train_loss": -6.647514343261719, "global_step": 145764, "epoch": 3470} {"train_loss": -6.686136722564697, "global_step": 145765, "epoch": 3470} {"train_loss": -6.8150835037231445, "global_step": 145766, "epoch": 3470} {"train_loss": -6.808558464050293, "global_step": 145767, "epoch": 3470} {"train_loss": -6.810149192810059, "global_step": 145768, "epoch": 3470} {"train_loss": -6.8311543464660645, "global_step": 145769, "epoch": 3470} {"train_loss": -6.708245277404785, "global_step": 145770, "epoch": 3470} {"train_loss": -6.731060028076172, "global_step": 145771, "epoch": 3470} {"train_loss": -6.745100021362305, "global_step": 145772, "epoch": 3470} {"train_loss": -6.908564567565918, "global_step": 145773, "epoch": 3470} {"train_loss": -6.856323719024658, "global_step": 145774, "epoch": 3470} {"train_loss": -6.8149213790893555, "global_step": 145775, "epoch": 3470} {"train_loss": -6.746748924255371, "global_step": 145776, "epoch": 3470} {"train_loss": -6.792182922363281, "global_step": 145777, "epoch": 3470} {"train_loss": -6.837222099304199, "global_step": 145778, "epoch": 3470} {"train_loss": -6.7634382247924805, "global_step": 145779, "epoch": 3470} {"train_loss": -6.811190605163574, "global_step": 145780, "epoch": 3470} {"train_loss": -6.783697809491839, "global_step": 145781, "epoch": 3470, "val_loss": 67658.375} {"train_loss": -6.755293846130371, "global_step": 145782, "epoch": 3471} {"train_loss": -6.885633945465088, "global_step": 145783, "epoch": 3471} {"train_loss": -6.830738067626953, "global_step": 145784, "epoch": 3471} {"train_loss": -6.875654697418213, "global_step": 145785, "epoch": 3471} {"train_loss": -6.759784698486328, "global_step": 145786, "epoch": 3471} {"train_loss": -6.758035182952881, "global_step": 145787, "epoch": 3471} {"train_loss": -6.8953118324279785, "global_step": 145788, "epoch": 3471} {"train_loss": -6.860583782196045, "global_step": 145789, "epoch": 3471} {"train_loss": -6.82564640045166, "global_step": 145790, "epoch": 3471} {"train_loss": -6.956393718719482, "global_step": 145791, "epoch": 3471} {"train_loss": -6.837275981903076, "global_step": 145792, "epoch": 3471} {"train_loss": -6.821008205413818, "global_step": 145793, "epoch": 3471} {"train_loss": -6.878744602203369, "global_step": 145794, "epoch": 3471} {"train_loss": -6.857086181640625, "global_step": 145795, "epoch": 3471} {"train_loss": -6.878026962280273, "global_step": 145796, "epoch": 3471} {"train_loss": -6.757264614105225, "global_step": 145797, "epoch": 3471} {"train_loss": -6.68389892578125, "global_step": 145798, "epoch": 3471} {"train_loss": -6.644330978393555, "global_step": 145799, "epoch": 3471} {"train_loss": -6.781782150268555, "global_step": 145800, "epoch": 3471} {"train_loss": -6.6645917892456055, "global_step": 145801, "epoch": 3471} {"train_loss": -6.753035068511963, "global_step": 145802, "epoch": 3471} {"train_loss": -6.680999279022217, "global_step": 145803, "epoch": 3471} {"train_loss": -6.701127529144287, "global_step": 145804, "epoch": 3471} {"train_loss": -6.771449089050293, "global_step": 145805, "epoch": 3471} {"train_loss": -6.7505202293396, "global_step": 145806, "epoch": 3471} {"train_loss": -6.743338584899902, "global_step": 145807, "epoch": 3471} {"train_loss": -6.6654462814331055, "global_step": 145808, "epoch": 3471} {"train_loss": -6.804408073425293, "global_step": 145809, "epoch": 3471} {"train_loss": -6.813614845275879, "global_step": 145810, "epoch": 3471} {"train_loss": -6.869988918304443, "global_step": 145811, "epoch": 3471} {"train_loss": -6.731305122375488, "global_step": 145812, "epoch": 3471} {"train_loss": -6.934891700744629, "global_step": 145813, "epoch": 3471} {"train_loss": -6.85618782043457, "global_step": 145814, "epoch": 3471} {"train_loss": -6.771852016448975, "global_step": 145815, "epoch": 3471} {"train_loss": -6.70802116394043, "global_step": 145816, "epoch": 3471} {"train_loss": -6.842408180236816, "global_step": 145817, "epoch": 3471} {"train_loss": -6.821113586425781, "global_step": 145818, "epoch": 3471} {"train_loss": -6.74683952331543, "global_step": 145819, "epoch": 3471} {"train_loss": -6.931601524353027, "global_step": 145820, "epoch": 3471} {"train_loss": -6.607034683227539, "global_step": 145821, "epoch": 3471} {"train_loss": -6.631627082824707, "global_step": 145822, "epoch": 3471} {"train_loss": -6.788711252666655, "global_step": 145823, "epoch": 3471, "val_loss": 67613.546875} {"train_loss": -6.715963840484619, "global_step": 145824, "epoch": 3472} {"train_loss": -6.7801361083984375, "global_step": 145825, "epoch": 3472} {"train_loss": -6.8821210861206055, "global_step": 145826, "epoch": 3472} {"train_loss": -6.951618194580078, "global_step": 145827, "epoch": 3472} {"train_loss": -6.850489616394043, "global_step": 145828, "epoch": 3472} {"train_loss": -6.845716953277588, "global_step": 145829, "epoch": 3472} {"train_loss": -6.823974609375, "global_step": 145830, "epoch": 3472} {"train_loss": -6.828566551208496, "global_step": 145831, "epoch": 3472} {"train_loss": -6.850213050842285, "global_step": 145832, "epoch": 3472} {"train_loss": -6.767723560333252, "global_step": 145833, "epoch": 3472} {"train_loss": -6.839998722076416, "global_step": 145834, "epoch": 3472} {"train_loss": -6.907750129699707, "global_step": 145835, "epoch": 3472} {"train_loss": -6.6717071533203125, "global_step": 145836, "epoch": 3472} {"train_loss": -6.787904739379883, "global_step": 145837, "epoch": 3472} {"train_loss": -6.858407974243164, "global_step": 145838, "epoch": 3472} {"train_loss": -6.741419792175293, "global_step": 145839, "epoch": 3472} {"train_loss": -6.741798400878906, "global_step": 145840, "epoch": 3472} {"train_loss": -6.798321723937988, "global_step": 145841, "epoch": 3472} {"train_loss": -6.756142616271973, "global_step": 145842, "epoch": 3472} {"train_loss": -6.880871772766113, "global_step": 145843, "epoch": 3472} {"train_loss": -6.892696380615234, "global_step": 145844, "epoch": 3472} {"train_loss": -6.779577255249023, "global_step": 145845, "epoch": 3472} {"train_loss": -6.895031929016113, "global_step": 145846, "epoch": 3472} {"train_loss": -6.879268169403076, "global_step": 145847, "epoch": 3472} {"train_loss": -6.887326240539551, "global_step": 145848, "epoch": 3472} {"train_loss": -6.858633041381836, "global_step": 145849, "epoch": 3472} {"train_loss": -6.918157577514648, "global_step": 145850, "epoch": 3472} {"train_loss": -6.952867031097412, "global_step": 145851, "epoch": 3472} {"train_loss": -6.938112258911133, "global_step": 145852, "epoch": 3472} {"train_loss": -6.845796585083008, "global_step": 145853, "epoch": 3472} {"train_loss": -6.7264533042907715, "global_step": 145854, "epoch": 3472} {"train_loss": -6.828674793243408, "global_step": 145855, "epoch": 3472} {"train_loss": -6.880271911621094, "global_step": 145856, "epoch": 3472} {"train_loss": -6.800809860229492, "global_step": 145857, "epoch": 3472} {"train_loss": -6.817975997924805, "global_step": 145858, "epoch": 3472} {"train_loss": -6.886508464813232, "global_step": 145859, "epoch": 3472} {"train_loss": -6.740819931030273, "global_step": 145860, "epoch": 3472} {"train_loss": -6.80665922164917, "global_step": 145861, "epoch": 3472} {"train_loss": -6.70123291015625, "global_step": 145862, "epoch": 3472} {"train_loss": -6.590345859527588, "global_step": 145863, "epoch": 3472} {"train_loss": -6.750571250915527, "global_step": 145864, "epoch": 3472} {"train_loss": -6.818758703413463, "global_step": 145865, "epoch": 3472, "val_loss": 67989.6796875} {"train_loss": -6.702470779418945, "global_step": 145866, "epoch": 3473} {"train_loss": -6.768429756164551, "global_step": 145867, "epoch": 3473} {"train_loss": -6.586012840270996, "global_step": 145868, "epoch": 3473} {"train_loss": -6.728246688842773, "global_step": 145869, "epoch": 3473} {"train_loss": -6.744528293609619, "global_step": 145870, "epoch": 3473} {"train_loss": -6.736692428588867, "global_step": 145871, "epoch": 3473} {"train_loss": -6.734409809112549, "global_step": 145872, "epoch": 3473} {"train_loss": -6.702746868133545, "global_step": 145873, "epoch": 3473} {"train_loss": -6.826930999755859, "global_step": 145874, "epoch": 3473} {"train_loss": -6.708355903625488, "global_step": 145875, "epoch": 3473} {"train_loss": -6.709299087524414, "global_step": 145876, "epoch": 3473} {"train_loss": -6.734949111938477, "global_step": 145877, "epoch": 3473} {"train_loss": -6.7096076011657715, "global_step": 145878, "epoch": 3473} {"train_loss": -6.869168281555176, "global_step": 145879, "epoch": 3473} {"train_loss": -6.852165222167969, "global_step": 145880, "epoch": 3473} {"train_loss": -6.847903251647949, "global_step": 145881, "epoch": 3473} {"train_loss": -6.809815406799316, "global_step": 145882, "epoch": 3473} {"train_loss": -6.790194034576416, "global_step": 145883, "epoch": 3473} {"train_loss": -6.7679572105407715, "global_step": 145884, "epoch": 3473} {"train_loss": -6.715106010437012, "global_step": 145885, "epoch": 3473} {"train_loss": -6.748583793640137, "global_step": 145886, "epoch": 3473} {"train_loss": -6.848353385925293, "global_step": 145887, "epoch": 3473} {"train_loss": -6.880336284637451, "global_step": 145888, "epoch": 3473} {"train_loss": -6.786017417907715, "global_step": 145889, "epoch": 3473} {"train_loss": -6.89354133605957, "global_step": 145890, "epoch": 3473} {"train_loss": -6.804697036743164, "global_step": 145891, "epoch": 3473} {"train_loss": -6.898780345916748, "global_step": 145892, "epoch": 3473} {"train_loss": -6.92824649810791, "global_step": 145893, "epoch": 3473} {"train_loss": -6.814145088195801, "global_step": 145894, "epoch": 3473} {"train_loss": -6.833015441894531, "global_step": 145895, "epoch": 3473} {"train_loss": -6.96193790435791, "global_step": 145896, "epoch": 3473} {"train_loss": -6.949568271636963, "global_step": 145897, "epoch": 3473} {"train_loss": -6.835087776184082, "global_step": 145898, "epoch": 3473} {"train_loss": -6.88249397277832, "global_step": 145899, "epoch": 3473} {"train_loss": -6.898087024688721, "global_step": 145900, "epoch": 3473} {"train_loss": -6.717523574829102, "global_step": 145901, "epoch": 3473} {"train_loss": -6.815258026123047, "global_step": 145902, "epoch": 3473} {"train_loss": -6.795009136199951, "global_step": 145903, "epoch": 3473} {"train_loss": -6.816394329071045, "global_step": 145904, "epoch": 3473} {"train_loss": -6.935301303863525, "global_step": 145905, "epoch": 3473} {"train_loss": -6.8184123039245605, "global_step": 145906, "epoch": 3473} {"train_loss": -6.804436626888457, "global_step": 145907, "epoch": 3473, "val_loss": 67806.515625} {"train_loss": -6.879581451416016, "global_step": 145908, "epoch": 3474} {"train_loss": -6.865368843078613, "global_step": 145909, "epoch": 3474} {"train_loss": -6.796964168548584, "global_step": 145910, "epoch": 3474} {"train_loss": -6.8745574951171875, "global_step": 145911, "epoch": 3474} {"train_loss": -6.795065879821777, "global_step": 145912, "epoch": 3474} {"train_loss": -6.919869422912598, "global_step": 145913, "epoch": 3474} {"train_loss": -6.869341850280762, "global_step": 145914, "epoch": 3474} {"train_loss": -6.82785701751709, "global_step": 145915, "epoch": 3474} {"train_loss": -6.772103786468506, "global_step": 145916, "epoch": 3474} {"train_loss": -6.867687225341797, "global_step": 145917, "epoch": 3474} {"train_loss": -6.821433067321777, "global_step": 145918, "epoch": 3474} {"train_loss": -6.734708786010742, "global_step": 145919, "epoch": 3474} {"train_loss": -6.806485176086426, "global_step": 145920, "epoch": 3474} {"train_loss": -6.909415245056152, "global_step": 145921, "epoch": 3474} {"train_loss": -6.693691730499268, "global_step": 145922, "epoch": 3474} {"train_loss": -6.754703521728516, "global_step": 145923, "epoch": 3474} {"train_loss": -6.79119348526001, "global_step": 145924, "epoch": 3474} {"train_loss": -6.740328788757324, "global_step": 145925, "epoch": 3474} {"train_loss": -6.841790676116943, "global_step": 145926, "epoch": 3474} {"train_loss": -6.783388614654541, "global_step": 145927, "epoch": 3474} {"train_loss": -6.896439552307129, "global_step": 145928, "epoch": 3474} {"train_loss": -6.724704742431641, "global_step": 145929, "epoch": 3474} {"train_loss": -6.7563157081604, "global_step": 145930, "epoch": 3474} {"train_loss": -6.856003284454346, "global_step": 145931, "epoch": 3474} {"train_loss": -6.856494426727295, "global_step": 145932, "epoch": 3474} {"train_loss": -6.7569732666015625, "global_step": 145933, "epoch": 3474} {"train_loss": -6.825869083404541, "global_step": 145934, "epoch": 3474} {"train_loss": -6.847933769226074, "global_step": 145935, "epoch": 3474} {"train_loss": -6.873297214508057, "global_step": 145936, "epoch": 3474} {"train_loss": -6.838888168334961, "global_step": 145937, "epoch": 3474} {"train_loss": -6.919271469116211, "global_step": 145938, "epoch": 3474} {"train_loss": -6.76590633392334, "global_step": 145939, "epoch": 3474} {"train_loss": -6.6782097816467285, "global_step": 145940, "epoch": 3474} {"train_loss": -6.948734760284424, "global_step": 145941, "epoch": 3474} {"train_loss": -6.962277412414551, "global_step": 145942, "epoch": 3474} {"train_loss": -6.8955841064453125, "global_step": 145943, "epoch": 3474} {"train_loss": -6.888268947601318, "global_step": 145944, "epoch": 3474} {"train_loss": -6.868180274963379, "global_step": 145945, "epoch": 3474} {"train_loss": -6.940232753753662, "global_step": 145946, "epoch": 3474} {"train_loss": -6.888790130615234, "global_step": 145947, "epoch": 3474} {"train_loss": -6.982329368591309, "global_step": 145948, "epoch": 3474} {"train_loss": -6.837354069664364, "global_step": 145949, "epoch": 3474, "val_loss": 67689.3203125} {"train_loss": -6.822441101074219, "global_step": 145950, "epoch": 3475} {"train_loss": -6.853972911834717, "global_step": 145951, "epoch": 3475} {"train_loss": -6.804049491882324, "global_step": 145952, "epoch": 3475} {"train_loss": -6.930644989013672, "global_step": 145953, "epoch": 3475} {"train_loss": -6.827609539031982, "global_step": 145954, "epoch": 3475} {"train_loss": -6.830379009246826, "global_step": 145955, "epoch": 3475} {"train_loss": -6.898072242736816, "global_step": 145956, "epoch": 3475} {"train_loss": -6.8714494705200195, "global_step": 145957, "epoch": 3475} {"train_loss": -6.950433731079102, "global_step": 145958, "epoch": 3475} {"train_loss": -6.818193435668945, "global_step": 145959, "epoch": 3475} {"train_loss": -6.851890563964844, "global_step": 145960, "epoch": 3475} {"train_loss": -6.903787612915039, "global_step": 145961, "epoch": 3475} {"train_loss": -6.822115898132324, "global_step": 145962, "epoch": 3475} {"train_loss": -6.976243019104004, "global_step": 145963, "epoch": 3475} {"train_loss": -6.857977390289307, "global_step": 145964, "epoch": 3475} {"train_loss": -6.837811470031738, "global_step": 145965, "epoch": 3475} {"train_loss": -6.882230281829834, "global_step": 145966, "epoch": 3475} {"train_loss": -6.774446487426758, "global_step": 145967, "epoch": 3475} {"train_loss": -6.8062520027160645, "global_step": 145968, "epoch": 3475} {"train_loss": -6.816169738769531, "global_step": 145969, "epoch": 3475} {"train_loss": -6.831567764282227, "global_step": 145970, "epoch": 3475} {"train_loss": -6.813730239868164, "global_step": 145971, "epoch": 3475} {"train_loss": -6.955778121948242, "global_step": 145972, "epoch": 3475} {"train_loss": -6.87758731842041, "global_step": 145973, "epoch": 3475} {"train_loss": -6.738691806793213, "global_step": 145974, "epoch": 3475} {"train_loss": -6.808965682983398, "global_step": 145975, "epoch": 3475} {"train_loss": -6.8501105308532715, "global_step": 145976, "epoch": 3475} {"train_loss": -6.904331207275391, "global_step": 145977, "epoch": 3475} {"train_loss": -6.984213829040527, "global_step": 145978, "epoch": 3475} {"train_loss": -6.813982963562012, "global_step": 145979, "epoch": 3475} {"train_loss": -6.899480819702148, "global_step": 145980, "epoch": 3475} {"train_loss": -6.809357643127441, "global_step": 145981, "epoch": 3475} {"train_loss": -6.878068923950195, "global_step": 145982, "epoch": 3475} {"train_loss": -6.849567413330078, "global_step": 145983, "epoch": 3475} {"train_loss": -6.827526092529297, "global_step": 145984, "epoch": 3475} {"train_loss": -6.793283462524414, "global_step": 145985, "epoch": 3475} {"train_loss": -6.825413227081299, "global_step": 145986, "epoch": 3475} {"train_loss": -6.878179550170898, "global_step": 145987, "epoch": 3475} {"train_loss": -6.869486331939697, "global_step": 145988, "epoch": 3475} {"train_loss": -6.671628952026367, "global_step": 145989, "epoch": 3475} {"train_loss": -6.750704765319824, "global_step": 145990, "epoch": 3475} {"train_loss": -6.846509763172695, "global_step": 145991, "epoch": 3475, "val_loss": 67841.46875} {"train_loss": -6.833026885986328, "global_step": 145992, "epoch": 3476} {"train_loss": -6.821159362792969, "global_step": 145993, "epoch": 3476} {"train_loss": -6.949375152587891, "global_step": 145994, "epoch": 3476} {"train_loss": -6.9002227783203125, "global_step": 145995, "epoch": 3476} {"train_loss": -6.831816673278809, "global_step": 145996, "epoch": 3476} {"train_loss": -6.784788131713867, "global_step": 145997, "epoch": 3476} {"train_loss": -6.901209831237793, "global_step": 145998, "epoch": 3476} {"train_loss": -6.7926740646362305, "global_step": 145999, "epoch": 3476} {"train_loss": -6.801997661590576, "global_step": 146000, "epoch": 3476} {"train_loss": -6.76519775390625, "global_step": 146001, "epoch": 3476} {"train_loss": -6.746804237365723, "global_step": 146002, "epoch": 3476} {"train_loss": -6.828432083129883, "global_step": 146003, "epoch": 3476} {"train_loss": -6.802417755126953, "global_step": 146004, "epoch": 3476} {"train_loss": -6.713862419128418, "global_step": 146005, "epoch": 3476} {"train_loss": -6.84559440612793, "global_step": 146006, "epoch": 3476} {"train_loss": -6.698131561279297, "global_step": 146007, "epoch": 3476} {"train_loss": -6.717119216918945, "global_step": 146008, "epoch": 3476} {"train_loss": -6.778066158294678, "global_step": 146009, "epoch": 3476} {"train_loss": -6.661808967590332, "global_step": 146010, "epoch": 3476} {"train_loss": -6.786447525024414, "global_step": 146011, "epoch": 3476} {"train_loss": -6.780276298522949, "global_step": 146012, "epoch": 3476} {"train_loss": -6.7826056480407715, "global_step": 146013, "epoch": 3476} {"train_loss": -6.723593711853027, "global_step": 146014, "epoch": 3476} {"train_loss": -6.806009292602539, "global_step": 146015, "epoch": 3476} {"train_loss": -6.80184268951416, "global_step": 146016, "epoch": 3476} {"train_loss": -6.656876564025879, "global_step": 146017, "epoch": 3476} {"train_loss": -6.712549686431885, "global_step": 146018, "epoch": 3476} {"train_loss": -6.912247180938721, "global_step": 146019, "epoch": 3476} {"train_loss": -6.779563903808594, "global_step": 146020, "epoch": 3476} {"train_loss": -6.736831188201904, "global_step": 146021, "epoch": 3476} {"train_loss": -6.788147926330566, "global_step": 146022, "epoch": 3476} {"train_loss": -6.819565773010254, "global_step": 146023, "epoch": 3476} {"train_loss": -6.825118064880371, "global_step": 146024, "epoch": 3476} {"train_loss": -6.75115966796875, "global_step": 146025, "epoch": 3476} {"train_loss": -6.814878463745117, "global_step": 146026, "epoch": 3476} {"train_loss": -6.794870853424072, "global_step": 146027, "epoch": 3476} {"train_loss": -6.833001613616943, "global_step": 146028, "epoch": 3476} {"train_loss": -6.89666223526001, "global_step": 146029, "epoch": 3476} {"train_loss": -6.757973670959473, "global_step": 146030, "epoch": 3476} {"train_loss": -6.907756328582764, "global_step": 146031, "epoch": 3476} {"train_loss": -6.921151161193848, "global_step": 146032, "epoch": 3476} {"train_loss": -6.801219009217762, "global_step": 146033, "epoch": 3476, "val_loss": 67770.1640625} {"train_loss": -6.818571090698242, "global_step": 146034, "epoch": 3477} {"train_loss": -6.986642837524414, "global_step": 146035, "epoch": 3477} {"train_loss": -6.927287578582764, "global_step": 146036, "epoch": 3477} {"train_loss": -6.881481647491455, "global_step": 146037, "epoch": 3477} {"train_loss": -6.789604187011719, "global_step": 146038, "epoch": 3477} {"train_loss": -6.86058235168457, "global_step": 146039, "epoch": 3477} {"train_loss": -6.863725662231445, "global_step": 146040, "epoch": 3477} {"train_loss": -6.844272136688232, "global_step": 146041, "epoch": 3477} {"train_loss": -6.896468162536621, "global_step": 146042, "epoch": 3477} {"train_loss": -6.7895612716674805, "global_step": 146043, "epoch": 3477} {"train_loss": -6.800515651702881, "global_step": 146044, "epoch": 3477} {"train_loss": -6.8617377281188965, "global_step": 146045, "epoch": 3477} {"train_loss": -6.86885929107666, "global_step": 146046, "epoch": 3477} {"train_loss": -6.769488334655762, "global_step": 146047, "epoch": 3477} {"train_loss": -6.865991592407227, "global_step": 146048, "epoch": 3477} {"train_loss": -6.849592208862305, "global_step": 146049, "epoch": 3477} {"train_loss": -6.81783390045166, "global_step": 146050, "epoch": 3477} {"train_loss": -6.734981536865234, "global_step": 146051, "epoch": 3477} {"train_loss": -6.805946350097656, "global_step": 146052, "epoch": 3477} {"train_loss": -6.778846740722656, "global_step": 146053, "epoch": 3477} {"train_loss": -6.738362789154053, "global_step": 146054, "epoch": 3477} {"train_loss": -6.734018325805664, "global_step": 146055, "epoch": 3477} {"train_loss": -6.699454307556152, "global_step": 146056, "epoch": 3477} {"train_loss": -6.67487907409668, "global_step": 146057, "epoch": 3477} {"train_loss": -6.867939472198486, "global_step": 146058, "epoch": 3477} {"train_loss": -6.918756484985352, "global_step": 146059, "epoch": 3477} {"train_loss": -6.764272689819336, "global_step": 146060, "epoch": 3477} {"train_loss": -6.882754802703857, "global_step": 146061, "epoch": 3477} {"train_loss": -6.681487083435059, "global_step": 146062, "epoch": 3477} {"train_loss": -6.8274335861206055, "global_step": 146063, "epoch": 3477} {"train_loss": -6.7453155517578125, "global_step": 146064, "epoch": 3477} {"train_loss": -6.769124984741211, "global_step": 146065, "epoch": 3477} {"train_loss": -6.812668800354004, "global_step": 146066, "epoch": 3477} {"train_loss": -6.851696968078613, "global_step": 146067, "epoch": 3477} {"train_loss": -6.832980632781982, "global_step": 146068, "epoch": 3477} {"train_loss": -6.817173004150391, "global_step": 146069, "epoch": 3477} {"train_loss": -6.726845741271973, "global_step": 146070, "epoch": 3477} {"train_loss": -6.748656749725342, "global_step": 146071, "epoch": 3477} {"train_loss": -6.778146743774414, "global_step": 146072, "epoch": 3477} {"train_loss": -6.839770317077637, "global_step": 146073, "epoch": 3477} {"train_loss": -6.836292743682861, "global_step": 146074, "epoch": 3477} {"train_loss": -6.811675139835903, "global_step": 146075, "epoch": 3477, "val_loss": 67726.1953125} {"train_loss": -6.833903789520264, "global_step": 146076, "epoch": 3478} {"train_loss": -6.868431091308594, "global_step": 146077, "epoch": 3478} {"train_loss": -6.79132080078125, "global_step": 146078, "epoch": 3478} {"train_loss": -6.924041748046875, "global_step": 146079, "epoch": 3478} {"train_loss": -6.829500675201416, "global_step": 146080, "epoch": 3478} {"train_loss": -6.808863639831543, "global_step": 146081, "epoch": 3478} {"train_loss": -6.907639026641846, "global_step": 146082, "epoch": 3478} {"train_loss": -6.813946723937988, "global_step": 146083, "epoch": 3478} {"train_loss": -6.871617317199707, "global_step": 146084, "epoch": 3478} {"train_loss": -6.873806953430176, "global_step": 146085, "epoch": 3478} {"train_loss": -6.89296817779541, "global_step": 146086, "epoch": 3478} {"train_loss": -6.890750885009766, "global_step": 146087, "epoch": 3478} {"train_loss": -6.725484371185303, "global_step": 146088, "epoch": 3478} {"train_loss": -6.682869911193848, "global_step": 146089, "epoch": 3478} {"train_loss": -6.844330310821533, "global_step": 146090, "epoch": 3478} {"train_loss": -6.722288608551025, "global_step": 146091, "epoch": 3478} {"train_loss": -6.898246765136719, "global_step": 146092, "epoch": 3478} {"train_loss": -6.856105804443359, "global_step": 146093, "epoch": 3478} {"train_loss": -6.8692097663879395, "global_step": 146094, "epoch": 3478} {"train_loss": -6.762918472290039, "global_step": 146095, "epoch": 3478} {"train_loss": -6.798511505126953, "global_step": 146096, "epoch": 3478} {"train_loss": -6.792446613311768, "global_step": 146097, "epoch": 3478} {"train_loss": -6.882963180541992, "global_step": 146098, "epoch": 3478} {"train_loss": -6.837494850158691, "global_step": 146099, "epoch": 3478} {"train_loss": -6.815640449523926, "global_step": 146100, "epoch": 3478} {"train_loss": -6.849257469177246, "global_step": 146101, "epoch": 3478} {"train_loss": -6.815725326538086, "global_step": 146102, "epoch": 3478} {"train_loss": -6.846406936645508, "global_step": 146103, "epoch": 3478} {"train_loss": -6.938180923461914, "global_step": 146104, "epoch": 3478} {"train_loss": -6.8575639724731445, "global_step": 146105, "epoch": 3478} {"train_loss": -6.825990676879883, "global_step": 146106, "epoch": 3478} {"train_loss": -6.941753387451172, "global_step": 146107, "epoch": 3478} {"train_loss": -6.778995513916016, "global_step": 146108, "epoch": 3478} {"train_loss": -6.6917548179626465, "global_step": 146109, "epoch": 3478} {"train_loss": -6.809647560119629, "global_step": 146110, "epoch": 3478} {"train_loss": -6.888768196105957, "global_step": 146111, "epoch": 3478} {"train_loss": -6.901760101318359, "global_step": 146112, "epoch": 3478} {"train_loss": -6.869825839996338, "global_step": 146113, "epoch": 3478} {"train_loss": -6.939164161682129, "global_step": 146114, "epoch": 3478} {"train_loss": -6.925830841064453, "global_step": 146115, "epoch": 3478} {"train_loss": -6.766273498535156, "global_step": 146116, "epoch": 3478} {"train_loss": -6.843164171491351, "global_step": 146117, "epoch": 3478, "val_loss": 67764.21875} {"train_loss": -6.841834545135498, "global_step": 146118, "epoch": 3479} {"train_loss": -6.830826282501221, "global_step": 146119, "epoch": 3479} {"train_loss": -6.805360794067383, "global_step": 146120, "epoch": 3479} {"train_loss": -6.796176910400391, "global_step": 146121, "epoch": 3479} {"train_loss": -6.967065334320068, "global_step": 146122, "epoch": 3479} {"train_loss": -6.94830846786499, "global_step": 146123, "epoch": 3479} {"train_loss": -6.837364196777344, "global_step": 146124, "epoch": 3479} {"train_loss": -6.8544111251831055, "global_step": 146125, "epoch": 3479} {"train_loss": -6.927289009094238, "global_step": 146126, "epoch": 3479} {"train_loss": -6.872420787811279, "global_step": 146127, "epoch": 3479} {"train_loss": -6.833759307861328, "global_step": 146128, "epoch": 3479} {"train_loss": -6.769504547119141, "global_step": 146129, "epoch": 3479} {"train_loss": -6.819287300109863, "global_step": 146130, "epoch": 3479} {"train_loss": -6.826741695404053, "global_step": 146131, "epoch": 3479} {"train_loss": -6.8407392501831055, "global_step": 146132, "epoch": 3479} {"train_loss": -6.7876434326171875, "global_step": 146133, "epoch": 3479} {"train_loss": -6.881671905517578, "global_step": 146134, "epoch": 3479} {"train_loss": -6.854494571685791, "global_step": 146135, "epoch": 3479} {"train_loss": -6.800756931304932, "global_step": 146136, "epoch": 3479} {"train_loss": -6.821805000305176, "global_step": 146137, "epoch": 3479} {"train_loss": -6.900698184967041, "global_step": 146138, "epoch": 3479} {"train_loss": -6.9111247062683105, "global_step": 146139, "epoch": 3479} {"train_loss": -6.823691368103027, "global_step": 146140, "epoch": 3479} {"train_loss": -6.903809070587158, "global_step": 146141, "epoch": 3479} {"train_loss": -6.832545757293701, "global_step": 146142, "epoch": 3479} {"train_loss": -6.859202861785889, "global_step": 146143, "epoch": 3479} {"train_loss": -6.944344997406006, "global_step": 146144, "epoch": 3479} {"train_loss": -6.903874397277832, "global_step": 146145, "epoch": 3479} {"train_loss": -6.838609218597412, "global_step": 146146, "epoch": 3479} {"train_loss": -6.827791213989258, "global_step": 146147, "epoch": 3479} {"train_loss": -6.821674346923828, "global_step": 146148, "epoch": 3479} {"train_loss": -6.834478378295898, "global_step": 146149, "epoch": 3479} {"train_loss": -6.805087566375732, "global_step": 146150, "epoch": 3479} {"train_loss": -6.863853454589844, "global_step": 146151, "epoch": 3479} {"train_loss": -6.862902641296387, "global_step": 146152, "epoch": 3479} {"train_loss": -6.831496238708496, "global_step": 146153, "epoch": 3479} {"train_loss": -6.895450592041016, "global_step": 146154, "epoch": 3479} {"train_loss": -6.821965217590332, "global_step": 146155, "epoch": 3479} {"train_loss": -6.853357315063477, "global_step": 146156, "epoch": 3479} {"train_loss": -6.792749881744385, "global_step": 146157, "epoch": 3479} {"train_loss": -6.881527900695801, "global_step": 146158, "epoch": 3479} {"train_loss": -6.853906835828509, "global_step": 146159, "epoch": 3479, "val_loss": 67714.9140625} {"train_loss": -6.930661201477051, "global_step": 146160, "epoch": 3480} {"train_loss": -6.773466110229492, "global_step": 146161, "epoch": 3480} {"train_loss": -6.87530517578125, "global_step": 146162, "epoch": 3480} {"train_loss": -6.881820201873779, "global_step": 146163, "epoch": 3480} {"train_loss": -6.82865571975708, "global_step": 146164, "epoch": 3480} {"train_loss": -6.98291015625, "global_step": 146165, "epoch": 3480} {"train_loss": -6.859704971313477, "global_step": 146166, "epoch": 3480} {"train_loss": -6.716390609741211, "global_step": 146167, "epoch": 3480} {"train_loss": -6.768529415130615, "global_step": 146168, "epoch": 3480} {"train_loss": -6.824864387512207, "global_step": 146169, "epoch": 3480} {"train_loss": -6.643577575683594, "global_step": 146170, "epoch": 3480} {"train_loss": -6.789431571960449, "global_step": 146171, "epoch": 3480} {"train_loss": -6.790299415588379, "global_step": 146172, "epoch": 3480} {"train_loss": -6.876528739929199, "global_step": 146173, "epoch": 3480} {"train_loss": -6.860291481018066, "global_step": 146174, "epoch": 3480} {"train_loss": -6.84835147857666, "global_step": 146175, "epoch": 3480} {"train_loss": -6.845659255981445, "global_step": 146176, "epoch": 3480} {"train_loss": -6.950730323791504, "global_step": 146177, "epoch": 3480} {"train_loss": -6.770679950714111, "global_step": 146178, "epoch": 3480} {"train_loss": -6.81846284866333, "global_step": 146179, "epoch": 3480} {"train_loss": -6.993562698364258, "global_step": 146180, "epoch": 3480} {"train_loss": -6.9350690841674805, "global_step": 146181, "epoch": 3480} {"train_loss": -6.8399505615234375, "global_step": 146182, "epoch": 3480} {"train_loss": -6.6759185791015625, "global_step": 146183, "epoch": 3480} {"train_loss": -6.7397356033325195, "global_step": 146184, "epoch": 3480} {"train_loss": -6.797501564025879, "global_step": 146185, "epoch": 3480} {"train_loss": -6.927173614501953, "global_step": 146186, "epoch": 3480} {"train_loss": -6.855772018432617, "global_step": 146187, "epoch": 3480} {"train_loss": -6.871723175048828, "global_step": 146188, "epoch": 3480} {"train_loss": -6.84938907623291, "global_step": 146189, "epoch": 3480} {"train_loss": -6.840028285980225, "global_step": 146190, "epoch": 3480} {"train_loss": -6.895221710205078, "global_step": 146191, "epoch": 3480} {"train_loss": -6.935152530670166, "global_step": 146192, "epoch": 3480} {"train_loss": -6.796354293823242, "global_step": 146193, "epoch": 3480} {"train_loss": -6.805145740509033, "global_step": 146194, "epoch": 3480} {"train_loss": -6.943852424621582, "global_step": 146195, "epoch": 3480} {"train_loss": -6.847511291503906, "global_step": 146196, "epoch": 3480} {"train_loss": -6.754413604736328, "global_step": 146197, "epoch": 3480} {"train_loss": -6.788908958435059, "global_step": 146198, "epoch": 3480} {"train_loss": -6.795658111572266, "global_step": 146199, "epoch": 3480} {"train_loss": -6.875118255615234, "global_step": 146200, "epoch": 3480} {"train_loss": -6.838988349551246, "global_step": 146201, "epoch": 3480, "val_loss": 67996.8125} {"train_loss": -6.840473175048828, "global_step": 146202, "epoch": 3481} {"train_loss": -6.7929368019104, "global_step": 146203, "epoch": 3481} {"train_loss": -6.904121398925781, "global_step": 146204, "epoch": 3481} {"train_loss": -6.88103723526001, "global_step": 146205, "epoch": 3481} {"train_loss": -6.915063858032227, "global_step": 146206, "epoch": 3481} {"train_loss": -6.814464569091797, "global_step": 146207, "epoch": 3481} {"train_loss": -6.92314338684082, "global_step": 146208, "epoch": 3481} {"train_loss": -6.9080071449279785, "global_step": 146209, "epoch": 3481} {"train_loss": -6.858668804168701, "global_step": 146210, "epoch": 3481} {"train_loss": -6.9115891456604, "global_step": 146211, "epoch": 3481} {"train_loss": -6.874975204467773, "global_step": 146212, "epoch": 3481} {"train_loss": -6.807912826538086, "global_step": 146213, "epoch": 3481} {"train_loss": -6.776683807373047, "global_step": 146214, "epoch": 3481} {"train_loss": -6.951375484466553, "global_step": 146215, "epoch": 3481} {"train_loss": -6.774269104003906, "global_step": 146216, "epoch": 3481} {"train_loss": -6.8100690841674805, "global_step": 146217, "epoch": 3481} {"train_loss": -6.847901344299316, "global_step": 146218, "epoch": 3481} {"train_loss": -6.6712470054626465, "global_step": 146219, "epoch": 3481} {"train_loss": -6.747644901275635, "global_step": 146220, "epoch": 3481} {"train_loss": -6.733950614929199, "global_step": 146221, "epoch": 3481} {"train_loss": -6.834521770477295, "global_step": 146222, "epoch": 3481} {"train_loss": -6.80773401260376, "global_step": 146223, "epoch": 3481} {"train_loss": -6.922917366027832, "global_step": 146224, "epoch": 3481} {"train_loss": -6.830719947814941, "global_step": 146225, "epoch": 3481} {"train_loss": -6.789490222930908, "global_step": 146226, "epoch": 3481} {"train_loss": -6.8413896560668945, "global_step": 146227, "epoch": 3481} {"train_loss": -6.807339191436768, "global_step": 146228, "epoch": 3481} {"train_loss": -6.7643256187438965, "global_step": 146229, "epoch": 3481} {"train_loss": -6.830430030822754, "global_step": 146230, "epoch": 3481} {"train_loss": -6.690052032470703, "global_step": 146231, "epoch": 3481} {"train_loss": -6.7161664962768555, "global_step": 146232, "epoch": 3481} {"train_loss": -6.8462934494018555, "global_step": 146233, "epoch": 3481} {"train_loss": -6.877387046813965, "global_step": 146234, "epoch": 3481} {"train_loss": -6.800217151641846, "global_step": 146235, "epoch": 3481} {"train_loss": -6.848235130310059, "global_step": 146236, "epoch": 3481} {"train_loss": -6.795601844787598, "global_step": 146237, "epoch": 3481} {"train_loss": -6.751871109008789, "global_step": 146238, "epoch": 3481} {"train_loss": -6.807315826416016, "global_step": 146239, "epoch": 3481} {"train_loss": -6.831287384033203, "global_step": 146240, "epoch": 3481} {"train_loss": -6.7717180252075195, "global_step": 146241, "epoch": 3481} {"train_loss": -6.747279167175293, "global_step": 146242, "epoch": 3481} {"train_loss": -6.822430531183879, "global_step": 146243, "epoch": 3481, "val_loss": 67891.4453125} {"train_loss": -6.770083427429199, "global_step": 146244, "epoch": 3482} {"train_loss": -6.635329246520996, "global_step": 146245, "epoch": 3482} {"train_loss": -6.792015075683594, "global_step": 146246, "epoch": 3482} {"train_loss": -6.666095733642578, "global_step": 146247, "epoch": 3482} {"train_loss": -6.696529388427734, "global_step": 146248, "epoch": 3482} {"train_loss": -6.693480014801025, "global_step": 146249, "epoch": 3482} {"train_loss": -6.618910312652588, "global_step": 146250, "epoch": 3482} {"train_loss": -6.761419773101807, "global_step": 146251, "epoch": 3482} {"train_loss": -6.815183162689209, "global_step": 146252, "epoch": 3482} {"train_loss": -6.828854560852051, "global_step": 146253, "epoch": 3482} {"train_loss": -6.8004279136657715, "global_step": 146254, "epoch": 3482} {"train_loss": -6.767765998840332, "global_step": 146255, "epoch": 3482} {"train_loss": -6.955711364746094, "global_step": 146256, "epoch": 3482} {"train_loss": -6.749847412109375, "global_step": 146257, "epoch": 3482} {"train_loss": -6.758728981018066, "global_step": 146258, "epoch": 3482} {"train_loss": -6.785063743591309, "global_step": 146259, "epoch": 3482} {"train_loss": -6.666891098022461, "global_step": 146260, "epoch": 3482} {"train_loss": -6.827602386474609, "global_step": 146261, "epoch": 3482} {"train_loss": -6.767312049865723, "global_step": 146262, "epoch": 3482} {"train_loss": -6.782547950744629, "global_step": 146263, "epoch": 3482} {"train_loss": -6.805931091308594, "global_step": 146264, "epoch": 3482} {"train_loss": -6.732023239135742, "global_step": 146265, "epoch": 3482} {"train_loss": -6.920368194580078, "global_step": 146266, "epoch": 3482} {"train_loss": -6.801970481872559, "global_step": 146267, "epoch": 3482} {"train_loss": -6.88306999206543, "global_step": 146268, "epoch": 3482} {"train_loss": -6.895179748535156, "global_step": 146269, "epoch": 3482} {"train_loss": -6.706030368804932, "global_step": 146270, "epoch": 3482} {"train_loss": -6.9379401206970215, "global_step": 146271, "epoch": 3482} {"train_loss": -6.773615837097168, "global_step": 146272, "epoch": 3482} {"train_loss": -6.903531551361084, "global_step": 146273, "epoch": 3482} {"train_loss": -6.653181076049805, "global_step": 146274, "epoch": 3482} {"train_loss": -6.865004062652588, "global_step": 146275, "epoch": 3482} {"train_loss": -6.88230037689209, "global_step": 146276, "epoch": 3482} {"train_loss": -6.775604724884033, "global_step": 146277, "epoch": 3482} {"train_loss": -6.8030877113342285, "global_step": 146278, "epoch": 3482} {"train_loss": -6.779829025268555, "global_step": 146279, "epoch": 3482} {"train_loss": -6.705933094024658, "global_step": 146280, "epoch": 3482} {"train_loss": -6.788319110870361, "global_step": 146281, "epoch": 3482} {"train_loss": -6.754267692565918, "global_step": 146282, "epoch": 3482} {"train_loss": -6.7739667892456055, "global_step": 146283, "epoch": 3482} {"train_loss": -6.779293060302734, "global_step": 146284, "epoch": 3482} {"train_loss": -6.78429981640407, "global_step": 146285, "epoch": 3482, "val_loss": 67866.96875} {"train_loss": -6.74340295791626, "global_step": 146286, "epoch": 3483} {"train_loss": -6.776939392089844, "global_step": 146287, "epoch": 3483} {"train_loss": -6.765316963195801, "global_step": 146288, "epoch": 3483} {"train_loss": -6.830499172210693, "global_step": 146289, "epoch": 3483} {"train_loss": -6.900911331176758, "global_step": 146290, "epoch": 3483} {"train_loss": -6.756792068481445, "global_step": 146291, "epoch": 3483} {"train_loss": -6.811824798583984, "global_step": 146292, "epoch": 3483} {"train_loss": -6.817778587341309, "global_step": 146293, "epoch": 3483} {"train_loss": -6.736098766326904, "global_step": 146294, "epoch": 3483} {"train_loss": -6.807300567626953, "global_step": 146295, "epoch": 3483} {"train_loss": -6.644380569458008, "global_step": 146296, "epoch": 3483} {"train_loss": -6.845905780792236, "global_step": 146297, "epoch": 3483} {"train_loss": -6.867148399353027, "global_step": 146298, "epoch": 3483} {"train_loss": -6.7383551597595215, "global_step": 146299, "epoch": 3483} {"train_loss": -6.796771049499512, "global_step": 146300, "epoch": 3483} {"train_loss": -6.660273551940918, "global_step": 146301, "epoch": 3483} {"train_loss": -6.8424859046936035, "global_step": 146302, "epoch": 3483} {"train_loss": -6.8076863288879395, "global_step": 146303, "epoch": 3483} {"train_loss": -6.749027729034424, "global_step": 146304, "epoch": 3483} {"train_loss": -6.764745712280273, "global_step": 146305, "epoch": 3483} {"train_loss": -6.876285552978516, "global_step": 146306, "epoch": 3483} {"train_loss": -6.836705207824707, "global_step": 146307, "epoch": 3483} {"train_loss": -6.936141014099121, "global_step": 146308, "epoch": 3483} {"train_loss": -6.841744422912598, "global_step": 146309, "epoch": 3483} {"train_loss": -6.896420955657959, "global_step": 146310, "epoch": 3483} {"train_loss": -6.829545021057129, "global_step": 146311, "epoch": 3483} {"train_loss": -6.799178123474121, "global_step": 146312, "epoch": 3483} {"train_loss": -6.894017696380615, "global_step": 146313, "epoch": 3483} {"train_loss": -6.8769330978393555, "global_step": 146314, "epoch": 3483} {"train_loss": -6.8607964515686035, "global_step": 146315, "epoch": 3483} {"train_loss": -6.821588516235352, "global_step": 146316, "epoch": 3483} {"train_loss": -6.808673858642578, "global_step": 146317, "epoch": 3483} {"train_loss": -6.894706726074219, "global_step": 146318, "epoch": 3483} {"train_loss": -6.834303855895996, "global_step": 146319, "epoch": 3483} {"train_loss": -6.694031715393066, "global_step": 146320, "epoch": 3483} {"train_loss": -6.850497245788574, "global_step": 146321, "epoch": 3483} {"train_loss": -6.767019271850586, "global_step": 146322, "epoch": 3483} {"train_loss": -6.846477508544922, "global_step": 146323, "epoch": 3483} {"train_loss": -6.821375846862793, "global_step": 146324, "epoch": 3483} {"train_loss": -6.703813076019287, "global_step": 146325, "epoch": 3483} {"train_loss": -6.798734188079834, "global_step": 146326, "epoch": 3483} {"train_loss": -6.808543613978794, "global_step": 146327, "epoch": 3483, "val_loss": 67791.140625} {"train_loss": -6.859452247619629, "global_step": 146328, "epoch": 3484} {"train_loss": -6.768475532531738, "global_step": 146329, "epoch": 3484} {"train_loss": -6.813763618469238, "global_step": 146330, "epoch": 3484} {"train_loss": -6.7993011474609375, "global_step": 146331, "epoch": 3484} {"train_loss": -6.762346267700195, "global_step": 146332, "epoch": 3484} {"train_loss": -6.8393049240112305, "global_step": 146333, "epoch": 3484} {"train_loss": -6.9023518562316895, "global_step": 146334, "epoch": 3484} {"train_loss": -6.932803153991699, "global_step": 146335, "epoch": 3484} {"train_loss": -6.8437910079956055, "global_step": 146336, "epoch": 3484} {"train_loss": -6.875144958496094, "global_step": 146337, "epoch": 3484} {"train_loss": -6.896425247192383, "global_step": 146338, "epoch": 3484} {"train_loss": -6.806663513183594, "global_step": 146339, "epoch": 3484} {"train_loss": -6.850917816162109, "global_step": 146340, "epoch": 3484} {"train_loss": -6.869933605194092, "global_step": 146341, "epoch": 3484} {"train_loss": -6.921952247619629, "global_step": 146342, "epoch": 3484} {"train_loss": -6.872587203979492, "global_step": 146343, "epoch": 3484} {"train_loss": -6.818478584289551, "global_step": 146344, "epoch": 3484} {"train_loss": -6.783205509185791, "global_step": 146345, "epoch": 3484} {"train_loss": -6.890138626098633, "global_step": 146346, "epoch": 3484} {"train_loss": -6.86368989944458, "global_step": 146347, "epoch": 3484} {"train_loss": -6.797781944274902, "global_step": 146348, "epoch": 3484} {"train_loss": -6.870235443115234, "global_step": 146349, "epoch": 3484} {"train_loss": -6.840217113494873, "global_step": 146350, "epoch": 3484} {"train_loss": -6.852935314178467, "global_step": 146351, "epoch": 3484} {"train_loss": -6.851696968078613, "global_step": 146352, "epoch": 3484} {"train_loss": -6.7743024826049805, "global_step": 146353, "epoch": 3484} {"train_loss": -6.810370445251465, "global_step": 146354, "epoch": 3484} {"train_loss": -6.805422306060791, "global_step": 146355, "epoch": 3484} {"train_loss": -6.8451128005981445, "global_step": 146356, "epoch": 3484} {"train_loss": -6.875070571899414, "global_step": 146357, "epoch": 3484} {"train_loss": -6.886904716491699, "global_step": 146358, "epoch": 3484} {"train_loss": -6.857821464538574, "global_step": 146359, "epoch": 3484} {"train_loss": -6.815087795257568, "global_step": 146360, "epoch": 3484} {"train_loss": -6.8588409423828125, "global_step": 146361, "epoch": 3484} {"train_loss": -6.799490451812744, "global_step": 146362, "epoch": 3484} {"train_loss": -6.853862762451172, "global_step": 146363, "epoch": 3484} {"train_loss": -6.928777694702148, "global_step": 146364, "epoch": 3484} {"train_loss": -6.868288516998291, "global_step": 146365, "epoch": 3484} {"train_loss": -6.765798568725586, "global_step": 146366, "epoch": 3484} {"train_loss": -6.881438732147217, "global_step": 146367, "epoch": 3484} {"train_loss": -6.789905548095703, "global_step": 146368, "epoch": 3484} {"train_loss": -6.842552548363095, "global_step": 146369, "epoch": 3484, "val_loss": 67944.390625} {"train_loss": -6.739164352416992, "global_step": 146370, "epoch": 3485} {"train_loss": -6.900470733642578, "global_step": 146371, "epoch": 3485} {"train_loss": -6.748293876647949, "global_step": 146372, "epoch": 3485} {"train_loss": -6.821091651916504, "global_step": 146373, "epoch": 3485} {"train_loss": -6.980464935302734, "global_step": 146374, "epoch": 3485} {"train_loss": -6.790506362915039, "global_step": 146375, "epoch": 3485} {"train_loss": -6.865417003631592, "global_step": 146376, "epoch": 3485} {"train_loss": -6.834407329559326, "global_step": 146377, "epoch": 3485} {"train_loss": -6.74066162109375, "global_step": 146378, "epoch": 3485} {"train_loss": -6.803977966308594, "global_step": 146379, "epoch": 3485} {"train_loss": -6.793941974639893, "global_step": 146380, "epoch": 3485} {"train_loss": -6.771029949188232, "global_step": 146381, "epoch": 3485} {"train_loss": -6.807391166687012, "global_step": 146382, "epoch": 3485} {"train_loss": -6.841041564941406, "global_step": 146383, "epoch": 3485} {"train_loss": -6.782956600189209, "global_step": 146384, "epoch": 3485} {"train_loss": -6.787178993225098, "global_step": 146385, "epoch": 3485} {"train_loss": -6.796092987060547, "global_step": 146386, "epoch": 3485} {"train_loss": -6.833197116851807, "global_step": 146387, "epoch": 3485} {"train_loss": -6.700138568878174, "global_step": 146388, "epoch": 3485} {"train_loss": -6.823093414306641, "global_step": 146389, "epoch": 3485} {"train_loss": -6.792031288146973, "global_step": 146390, "epoch": 3485} {"train_loss": -6.785864353179932, "global_step": 146391, "epoch": 3485} {"train_loss": -6.7446088790893555, "global_step": 146392, "epoch": 3485} {"train_loss": -6.767437934875488, "global_step": 146393, "epoch": 3485} {"train_loss": -6.798373699188232, "global_step": 146394, "epoch": 3485} {"train_loss": -6.707470893859863, "global_step": 146395, "epoch": 3485} {"train_loss": -6.867780685424805, "global_step": 146396, "epoch": 3485} {"train_loss": -6.746334075927734, "global_step": 146397, "epoch": 3485} {"train_loss": -6.7061872482299805, "global_step": 146398, "epoch": 3485} {"train_loss": -6.803072929382324, "global_step": 146399, "epoch": 3485} {"train_loss": -6.763250350952148, "global_step": 146400, "epoch": 3485} {"train_loss": -6.653445243835449, "global_step": 146401, "epoch": 3485} {"train_loss": -6.767021179199219, "global_step": 146402, "epoch": 3485} {"train_loss": -6.8527398109436035, "global_step": 146403, "epoch": 3485} {"train_loss": -6.764613151550293, "global_step": 146404, "epoch": 3485} {"train_loss": -6.832881450653076, "global_step": 146405, "epoch": 3485} {"train_loss": -6.8799333572387695, "global_step": 146406, "epoch": 3485} {"train_loss": -6.829770088195801, "global_step": 146407, "epoch": 3485} {"train_loss": -6.8699493408203125, "global_step": 146408, "epoch": 3485} {"train_loss": -6.806868553161621, "global_step": 146409, "epoch": 3485} {"train_loss": -6.76076602935791, "global_step": 146410, "epoch": 3485} {"train_loss": -6.797133377620152, "global_step": 146411, "epoch": 3485, "val_loss": 67983.328125} {"train_loss": -6.876413345336914, "global_step": 146412, "epoch": 3486} {"train_loss": -6.839533805847168, "global_step": 146413, "epoch": 3486} {"train_loss": -6.802120208740234, "global_step": 146414, "epoch": 3486} {"train_loss": -6.839542865753174, "global_step": 146415, "epoch": 3486} {"train_loss": -6.768757343292236, "global_step": 146416, "epoch": 3486} {"train_loss": -6.788962364196777, "global_step": 146417, "epoch": 3486} {"train_loss": -6.992977142333984, "global_step": 146418, "epoch": 3486} {"train_loss": -6.9022216796875, "global_step": 146419, "epoch": 3486} {"train_loss": -6.839305400848389, "global_step": 146420, "epoch": 3486} {"train_loss": -6.819616317749023, "global_step": 146421, "epoch": 3486} {"train_loss": -6.838489532470703, "global_step": 146422, "epoch": 3486} {"train_loss": -6.7872443199157715, "global_step": 146423, "epoch": 3486} {"train_loss": -6.829440593719482, "global_step": 146424, "epoch": 3486} {"train_loss": -6.893893241882324, "global_step": 146425, "epoch": 3486} {"train_loss": -6.652226448059082, "global_step": 146426, "epoch": 3486} {"train_loss": -6.704996109008789, "global_step": 146427, "epoch": 3486} {"train_loss": -6.905414581298828, "global_step": 146428, "epoch": 3486} {"train_loss": -6.871769428253174, "global_step": 146429, "epoch": 3486} {"train_loss": -6.713513374328613, "global_step": 146430, "epoch": 3486} {"train_loss": -6.646663665771484, "global_step": 146431, "epoch": 3486} {"train_loss": -6.766201972961426, "global_step": 146432, "epoch": 3486} {"train_loss": -6.6921796798706055, "global_step": 146433, "epoch": 3486} {"train_loss": -6.8839874267578125, "global_step": 146434, "epoch": 3486} {"train_loss": -6.542296409606934, "global_step": 146435, "epoch": 3486} {"train_loss": -6.577869415283203, "global_step": 146436, "epoch": 3486} {"train_loss": -6.756563186645508, "global_step": 146437, "epoch": 3486} {"train_loss": -6.503713607788086, "global_step": 146438, "epoch": 3486} {"train_loss": -6.630115032196045, "global_step": 146439, "epoch": 3486} {"train_loss": -6.79359245300293, "global_step": 146440, "epoch": 3486} {"train_loss": -6.444384574890137, "global_step": 146441, "epoch": 3486} {"train_loss": -6.72016716003418, "global_step": 146442, "epoch": 3486} {"train_loss": -6.551053047180176, "global_step": 146443, "epoch": 3486} {"train_loss": -6.6683549880981445, "global_step": 146444, "epoch": 3486} {"train_loss": -6.681196212768555, "global_step": 146445, "epoch": 3486} {"train_loss": -6.738359451293945, "global_step": 146446, "epoch": 3486} {"train_loss": -6.642633438110352, "global_step": 146447, "epoch": 3486} {"train_loss": -6.609696388244629, "global_step": 146448, "epoch": 3486} {"train_loss": -6.702117919921875, "global_step": 146449, "epoch": 3486} {"train_loss": -6.499701499938965, "global_step": 146450, "epoch": 3486} {"train_loss": -6.665858745574951, "global_step": 146451, "epoch": 3486} {"train_loss": -6.685354232788086, "global_step": 146452, "epoch": 3486} {"train_loss": -6.73744341305324, "global_step": 146453, "epoch": 3486, "val_loss": 67799.5546875} {"train_loss": -6.644712924957275, "global_step": 146454, "epoch": 3487} {"train_loss": -6.7420654296875, "global_step": 146455, "epoch": 3487} {"train_loss": -6.6983561515808105, "global_step": 146456, "epoch": 3487} {"train_loss": -6.779818534851074, "global_step": 146457, "epoch": 3487} {"train_loss": -6.680049896240234, "global_step": 146458, "epoch": 3487} {"train_loss": -6.687636375427246, "global_step": 146459, "epoch": 3487} {"train_loss": -6.6887922286987305, "global_step": 146460, "epoch": 3487} {"train_loss": -6.827976703643799, "global_step": 146461, "epoch": 3487} {"train_loss": -6.7602338790893555, "global_step": 146462, "epoch": 3487} {"train_loss": -6.800712585449219, "global_step": 146463, "epoch": 3487} {"train_loss": -6.7823896408081055, "global_step": 146464, "epoch": 3487} {"train_loss": -6.785944938659668, "global_step": 146465, "epoch": 3487} {"train_loss": -6.803062438964844, "global_step": 146466, "epoch": 3487} {"train_loss": -6.8227691650390625, "global_step": 146467, "epoch": 3487} {"train_loss": -6.842240333557129, "global_step": 146468, "epoch": 3487} {"train_loss": -6.884920120239258, "global_step": 146469, "epoch": 3487} {"train_loss": -6.8376007080078125, "global_step": 146470, "epoch": 3487} {"train_loss": -6.732114315032959, "global_step": 146471, "epoch": 3487} {"train_loss": -6.814370155334473, "global_step": 146472, "epoch": 3487} {"train_loss": -6.902798175811768, "global_step": 146473, "epoch": 3487} {"train_loss": -6.808620929718018, "global_step": 146474, "epoch": 3487} {"train_loss": -6.8028788566589355, "global_step": 146475, "epoch": 3487} {"train_loss": -6.709694862365723, "global_step": 146476, "epoch": 3487} {"train_loss": -6.901167869567871, "global_step": 146477, "epoch": 3487} {"train_loss": -6.854662895202637, "global_step": 146478, "epoch": 3487} {"train_loss": -6.702291488647461, "global_step": 146479, "epoch": 3487} {"train_loss": -6.83534049987793, "global_step": 146480, "epoch": 3487} {"train_loss": -6.794292449951172, "global_step": 146481, "epoch": 3487} {"train_loss": -6.784116744995117, "global_step": 146482, "epoch": 3487} {"train_loss": -6.875338554382324, "global_step": 146483, "epoch": 3487} {"train_loss": -6.805163383483887, "global_step": 146484, "epoch": 3487} {"train_loss": -6.943748474121094, "global_step": 146485, "epoch": 3487} {"train_loss": -6.961110591888428, "global_step": 146486, "epoch": 3487} {"train_loss": -6.817604064941406, "global_step": 146487, "epoch": 3487} {"train_loss": -6.86207389831543, "global_step": 146488, "epoch": 3487} {"train_loss": -6.804180145263672, "global_step": 146489, "epoch": 3487} {"train_loss": -6.935251235961914, "global_step": 146490, "epoch": 3487} {"train_loss": -6.99295711517334, "global_step": 146491, "epoch": 3487} {"train_loss": -6.850915908813477, "global_step": 146492, "epoch": 3487} {"train_loss": -6.849725723266602, "global_step": 146493, "epoch": 3487} {"train_loss": -6.82229471206665, "global_step": 146494, "epoch": 3487} {"train_loss": -6.80904483795166, "global_step": 146495, "epoch": 3487, "val_loss": 67712.421875} {"train_loss": -6.83826208114624, "global_step": 146496, "epoch": 3488} {"train_loss": -6.86841344833374, "global_step": 146497, "epoch": 3488} {"train_loss": -6.8361005783081055, "global_step": 146498, "epoch": 3488} {"train_loss": -6.733990669250488, "global_step": 146499, "epoch": 3488} {"train_loss": -6.940835952758789, "global_step": 146500, "epoch": 3488} {"train_loss": -6.898016452789307, "global_step": 146501, "epoch": 3488} {"train_loss": -6.874059200286865, "global_step": 146502, "epoch": 3488} {"train_loss": -6.7294721603393555, "global_step": 146503, "epoch": 3488} {"train_loss": -6.8225297927856445, "global_step": 146504, "epoch": 3488} {"train_loss": -6.897408485412598, "global_step": 146505, "epoch": 3488} {"train_loss": -6.815763473510742, "global_step": 146506, "epoch": 3488} {"train_loss": -6.864729881286621, "global_step": 146507, "epoch": 3488} {"train_loss": -6.837882041931152, "global_step": 146508, "epoch": 3488} {"train_loss": -6.809527397155762, "global_step": 146509, "epoch": 3488} {"train_loss": -6.782027244567871, "global_step": 146510, "epoch": 3488} {"train_loss": -6.771703720092773, "global_step": 146511, "epoch": 3488} {"train_loss": -6.903162479400635, "global_step": 146512, "epoch": 3488} {"train_loss": -6.839550018310547, "global_step": 146513, "epoch": 3488} {"train_loss": -6.868396759033203, "global_step": 146514, "epoch": 3488} {"train_loss": -6.741610527038574, "global_step": 146515, "epoch": 3488} {"train_loss": -6.868928909301758, "global_step": 146516, "epoch": 3488} {"train_loss": -6.862421035766602, "global_step": 146517, "epoch": 3488} {"train_loss": -6.780097007751465, "global_step": 146518, "epoch": 3488} {"train_loss": -6.987053871154785, "global_step": 146519, "epoch": 3488} {"train_loss": -6.808163642883301, "global_step": 146520, "epoch": 3488} {"train_loss": -6.8198137283325195, "global_step": 146521, "epoch": 3488} {"train_loss": -6.795289993286133, "global_step": 146522, "epoch": 3488} {"train_loss": -6.828117847442627, "global_step": 146523, "epoch": 3488} {"train_loss": -6.7234697341918945, "global_step": 146524, "epoch": 3488} {"train_loss": -6.828046798706055, "global_step": 146525, "epoch": 3488} {"train_loss": -6.815215110778809, "global_step": 146526, "epoch": 3488} {"train_loss": -6.857571125030518, "global_step": 146527, "epoch": 3488} {"train_loss": -6.61934757232666, "global_step": 146528, "epoch": 3488} {"train_loss": -6.715114116668701, "global_step": 146529, "epoch": 3488} {"train_loss": -6.653192520141602, "global_step": 146530, "epoch": 3488} {"train_loss": -6.85490608215332, "global_step": 146531, "epoch": 3488} {"train_loss": -6.837352275848389, "global_step": 146532, "epoch": 3488} {"train_loss": -6.827760219573975, "global_step": 146533, "epoch": 3488} {"train_loss": -6.7141523361206055, "global_step": 146534, "epoch": 3488} {"train_loss": -6.725388526916504, "global_step": 146535, "epoch": 3488} {"train_loss": -6.816636085510254, "global_step": 146536, "epoch": 3488} {"train_loss": -6.812713520867484, "global_step": 146537, "epoch": 3488, "val_loss": 67751.734375} {"train_loss": -6.71867561340332, "global_step": 146538, "epoch": 3489} {"train_loss": -6.676894187927246, "global_step": 146539, "epoch": 3489} {"train_loss": -6.8125996589660645, "global_step": 146540, "epoch": 3489} {"train_loss": -6.79652214050293, "global_step": 146541, "epoch": 3489} {"train_loss": -6.789129257202148, "global_step": 146542, "epoch": 3489} {"train_loss": -6.82659912109375, "global_step": 146543, "epoch": 3489} {"train_loss": -6.883530616760254, "global_step": 146544, "epoch": 3489} {"train_loss": -6.710731506347656, "global_step": 146545, "epoch": 3489} {"train_loss": -6.774374485015869, "global_step": 146546, "epoch": 3489} {"train_loss": -6.77351188659668, "global_step": 146547, "epoch": 3489} {"train_loss": -6.764881610870361, "global_step": 146548, "epoch": 3489} {"train_loss": -6.909756660461426, "global_step": 146549, "epoch": 3489} {"train_loss": -6.836372375488281, "global_step": 146550, "epoch": 3489} {"train_loss": -6.76228141784668, "global_step": 146551, "epoch": 3489} {"train_loss": -6.755048751831055, "global_step": 146552, "epoch": 3489} {"train_loss": -6.683928489685059, "global_step": 146553, "epoch": 3489} {"train_loss": -6.902061462402344, "global_step": 146554, "epoch": 3489} {"train_loss": -6.842803001403809, "global_step": 146555, "epoch": 3489} {"train_loss": -6.894747734069824, "global_step": 146556, "epoch": 3489} {"train_loss": -6.858208656311035, "global_step": 146557, "epoch": 3489} {"train_loss": -6.6791205406188965, "global_step": 146558, "epoch": 3489} {"train_loss": -6.927799701690674, "global_step": 146559, "epoch": 3489} {"train_loss": -6.744358062744141, "global_step": 146560, "epoch": 3489} {"train_loss": -6.793200969696045, "global_step": 146561, "epoch": 3489} {"train_loss": -6.945888519287109, "global_step": 146562, "epoch": 3489} {"train_loss": -6.678175926208496, "global_step": 146563, "epoch": 3489} {"train_loss": -6.835263252258301, "global_step": 146564, "epoch": 3489} {"train_loss": -6.854179382324219, "global_step": 146565, "epoch": 3489} {"train_loss": -6.848952293395996, "global_step": 146566, "epoch": 3489} {"train_loss": -6.905026435852051, "global_step": 146567, "epoch": 3489} {"train_loss": -6.8547821044921875, "global_step": 146568, "epoch": 3489} {"train_loss": -6.856081962585449, "global_step": 146569, "epoch": 3489} {"train_loss": -6.758640289306641, "global_step": 146570, "epoch": 3489} {"train_loss": -6.803648948669434, "global_step": 146571, "epoch": 3489} {"train_loss": -6.724475860595703, "global_step": 146572, "epoch": 3489} {"train_loss": -6.831991195678711, "global_step": 146573, "epoch": 3489} {"train_loss": -6.907559394836426, "global_step": 146574, "epoch": 3489} {"train_loss": -6.786426544189453, "global_step": 146575, "epoch": 3489} {"train_loss": -6.81224250793457, "global_step": 146576, "epoch": 3489} {"train_loss": -6.823716163635254, "global_step": 146577, "epoch": 3489} {"train_loss": -6.876710414886475, "global_step": 146578, "epoch": 3489} {"train_loss": -6.811737457911174, "global_step": 146579, "epoch": 3489, "val_loss": 67820.921875} {"train_loss": -6.730974197387695, "global_step": 146580, "epoch": 3490} {"train_loss": -6.88368034362793, "global_step": 146581, "epoch": 3490} {"train_loss": -6.74800443649292, "global_step": 146582, "epoch": 3490} {"train_loss": -6.630832672119141, "global_step": 146583, "epoch": 3490} {"train_loss": -6.832674026489258, "global_step": 146584, "epoch": 3490} {"train_loss": -6.661532402038574, "global_step": 146585, "epoch": 3490} {"train_loss": -6.614104270935059, "global_step": 146586, "epoch": 3490} {"train_loss": -6.6988725662231445, "global_step": 146587, "epoch": 3490} {"train_loss": -6.567492485046387, "global_step": 146588, "epoch": 3490} {"train_loss": -6.753997802734375, "global_step": 146589, "epoch": 3490} {"train_loss": -6.815650939941406, "global_step": 146590, "epoch": 3490} {"train_loss": -6.762622356414795, "global_step": 146591, "epoch": 3490} {"train_loss": -6.769104480743408, "global_step": 146592, "epoch": 3490} {"train_loss": -6.6800312995910645, "global_step": 146593, "epoch": 3490} {"train_loss": -6.681734561920166, "global_step": 146594, "epoch": 3490} {"train_loss": -6.854127883911133, "global_step": 146595, "epoch": 3490} {"train_loss": -6.796097278594971, "global_step": 146596, "epoch": 3490} {"train_loss": -6.774251937866211, "global_step": 146597, "epoch": 3490} {"train_loss": -6.833314895629883, "global_step": 146598, "epoch": 3490} {"train_loss": -6.882908821105957, "global_step": 146599, "epoch": 3490} {"train_loss": -6.800570487976074, "global_step": 146600, "epoch": 3490} {"train_loss": -6.885592460632324, "global_step": 146601, "epoch": 3490} {"train_loss": -6.794926643371582, "global_step": 146602, "epoch": 3490} {"train_loss": -6.919227600097656, "global_step": 146603, "epoch": 3490} {"train_loss": -6.76883602142334, "global_step": 146604, "epoch": 3490} {"train_loss": -6.833029747009277, "global_step": 146605, "epoch": 3490} {"train_loss": -6.8121232986450195, "global_step": 146606, "epoch": 3490} {"train_loss": -6.923351287841797, "global_step": 146607, "epoch": 3490} {"train_loss": -6.8552117347717285, "global_step": 146608, "epoch": 3490} {"train_loss": -6.720010280609131, "global_step": 146609, "epoch": 3490} {"train_loss": -6.841543197631836, "global_step": 146610, "epoch": 3490} {"train_loss": -6.7609124183654785, "global_step": 146611, "epoch": 3490} {"train_loss": -6.837405204772949, "global_step": 146612, "epoch": 3490} {"train_loss": -6.766388893127441, "global_step": 146613, "epoch": 3490} {"train_loss": -6.765155792236328, "global_step": 146614, "epoch": 3490} {"train_loss": -6.772207260131836, "global_step": 146615, "epoch": 3490} {"train_loss": -6.865488529205322, "global_step": 146616, "epoch": 3490} {"train_loss": -6.752492904663086, "global_step": 146617, "epoch": 3490} {"train_loss": -6.901451110839844, "global_step": 146618, "epoch": 3490} {"train_loss": -6.833421230316162, "global_step": 146619, "epoch": 3490} {"train_loss": -6.7137532234191895, "global_step": 146620, "epoch": 3490} {"train_loss": -6.7832333246866865, "global_step": 146621, "epoch": 3490, "val_loss": 67820.6796875} {"train_loss": -6.789923191070557, "global_step": 146622, "epoch": 3491} {"train_loss": -6.787010192871094, "global_step": 146623, "epoch": 3491} {"train_loss": -6.770035266876221, "global_step": 146624, "epoch": 3491} {"train_loss": -6.808862209320068, "global_step": 146625, "epoch": 3491} {"train_loss": -6.723008155822754, "global_step": 146626, "epoch": 3491} {"train_loss": -6.90993595123291, "global_step": 146627, "epoch": 3491} {"train_loss": -6.674704551696777, "global_step": 146628, "epoch": 3491} {"train_loss": -6.7477874755859375, "global_step": 146629, "epoch": 3491} {"train_loss": -6.787294387817383, "global_step": 146630, "epoch": 3491} {"train_loss": -6.715813636779785, "global_step": 146631, "epoch": 3491} {"train_loss": -6.812730312347412, "global_step": 146632, "epoch": 3491} {"train_loss": -6.86909818649292, "global_step": 146633, "epoch": 3491} {"train_loss": -6.818396091461182, "global_step": 146634, "epoch": 3491} {"train_loss": -6.828397750854492, "global_step": 146635, "epoch": 3491} {"train_loss": -6.619583606719971, "global_step": 146636, "epoch": 3491} {"train_loss": -6.833184242248535, "global_step": 146637, "epoch": 3491} {"train_loss": -6.833900451660156, "global_step": 146638, "epoch": 3491} {"train_loss": -6.7780866622924805, "global_step": 146639, "epoch": 3491} {"train_loss": -6.85787296295166, "global_step": 146640, "epoch": 3491} {"train_loss": -6.859455585479736, "global_step": 146641, "epoch": 3491} {"train_loss": -6.813197135925293, "global_step": 146642, "epoch": 3491} {"train_loss": -6.824557781219482, "global_step": 146643, "epoch": 3491} {"train_loss": -6.710659027099609, "global_step": 146644, "epoch": 3491} {"train_loss": -6.863835334777832, "global_step": 146645, "epoch": 3491} {"train_loss": -6.773947715759277, "global_step": 146646, "epoch": 3491} {"train_loss": -6.850017547607422, "global_step": 146647, "epoch": 3491} {"train_loss": -6.778018951416016, "global_step": 146648, "epoch": 3491} {"train_loss": -6.852078437805176, "global_step": 146649, "epoch": 3491} {"train_loss": -6.755937576293945, "global_step": 146650, "epoch": 3491} {"train_loss": -6.7793731689453125, "global_step": 146651, "epoch": 3491} {"train_loss": -6.893365383148193, "global_step": 146652, "epoch": 3491} {"train_loss": -6.795727729797363, "global_step": 146653, "epoch": 3491} {"train_loss": -6.764843940734863, "global_step": 146654, "epoch": 3491} {"train_loss": -6.915984630584717, "global_step": 146655, "epoch": 3491} {"train_loss": -6.7250776290893555, "global_step": 146656, "epoch": 3491} {"train_loss": -6.8044328689575195, "global_step": 146657, "epoch": 3491} {"train_loss": -6.8778581619262695, "global_step": 146658, "epoch": 3491} {"train_loss": -6.746893882751465, "global_step": 146659, "epoch": 3491} {"train_loss": -6.822456359863281, "global_step": 146660, "epoch": 3491} {"train_loss": -6.830765724182129, "global_step": 146661, "epoch": 3491} {"train_loss": -6.919589996337891, "global_step": 146662, "epoch": 3491} {"train_loss": -6.80301106543768, "global_step": 146663, "epoch": 3491, "val_loss": 67859.21875} {"train_loss": -6.862343788146973, "global_step": 146664, "epoch": 3492} {"train_loss": -6.758413314819336, "global_step": 146665, "epoch": 3492} {"train_loss": -6.8108601570129395, "global_step": 146666, "epoch": 3492} {"train_loss": -6.846270561218262, "global_step": 146667, "epoch": 3492} {"train_loss": -6.762901782989502, "global_step": 146668, "epoch": 3492} {"train_loss": -6.583956718444824, "global_step": 146669, "epoch": 3492} {"train_loss": -6.671054363250732, "global_step": 146670, "epoch": 3492} {"train_loss": -6.783783912658691, "global_step": 146671, "epoch": 3492} {"train_loss": -6.534154891967773, "global_step": 146672, "epoch": 3492} {"train_loss": -6.820695400238037, "global_step": 146673, "epoch": 3492} {"train_loss": -6.66827392578125, "global_step": 146674, "epoch": 3492} {"train_loss": -6.6737260818481445, "global_step": 146675, "epoch": 3492} {"train_loss": -6.70602560043335, "global_step": 146676, "epoch": 3492} {"train_loss": -6.636534690856934, "global_step": 146677, "epoch": 3492} {"train_loss": -6.730524063110352, "global_step": 146678, "epoch": 3492} {"train_loss": -6.7383623123168945, "global_step": 146679, "epoch": 3492} {"train_loss": -6.809547424316406, "global_step": 146680, "epoch": 3492} {"train_loss": -6.86988639831543, "global_step": 146681, "epoch": 3492} {"train_loss": -6.756389617919922, "global_step": 146682, "epoch": 3492} {"train_loss": -6.752936840057373, "global_step": 146683, "epoch": 3492} {"train_loss": -6.90740442276001, "global_step": 146684, "epoch": 3492} {"train_loss": -6.773811340332031, "global_step": 146685, "epoch": 3492} {"train_loss": -6.834317207336426, "global_step": 146686, "epoch": 3492} {"train_loss": -6.862020492553711, "global_step": 146687, "epoch": 3492} {"train_loss": -6.739961624145508, "global_step": 146688, "epoch": 3492} {"train_loss": -6.792932987213135, "global_step": 146689, "epoch": 3492} {"train_loss": -6.8697686195373535, "global_step": 146690, "epoch": 3492} {"train_loss": -6.9148359298706055, "global_step": 146691, "epoch": 3492} {"train_loss": -6.930194854736328, "global_step": 146692, "epoch": 3492} {"train_loss": -6.826995849609375, "global_step": 146693, "epoch": 3492} {"train_loss": -6.762759208679199, "global_step": 146694, "epoch": 3492} {"train_loss": -6.813426971435547, "global_step": 146695, "epoch": 3492} {"train_loss": -6.807401657104492, "global_step": 146696, "epoch": 3492} {"train_loss": -6.870517730712891, "global_step": 146697, "epoch": 3492} {"train_loss": -6.85588264465332, "global_step": 146698, "epoch": 3492} {"train_loss": -6.786690711975098, "global_step": 146699, "epoch": 3492} {"train_loss": -6.768256187438965, "global_step": 146700, "epoch": 3492} {"train_loss": -6.918354511260986, "global_step": 146701, "epoch": 3492} {"train_loss": -6.859471797943115, "global_step": 146702, "epoch": 3492} {"train_loss": -6.748664855957031, "global_step": 146703, "epoch": 3492} {"train_loss": -6.904738426208496, "global_step": 146704, "epoch": 3492} {"train_loss": -6.791650068192255, "global_step": 146705, "epoch": 3492, "val_loss": 67634.5234375} {"train_loss": -6.943917751312256, "global_step": 146706, "epoch": 3493} {"train_loss": -6.835204124450684, "global_step": 146707, "epoch": 3493} {"train_loss": -6.855373382568359, "global_step": 146708, "epoch": 3493} {"train_loss": -6.855251312255859, "global_step": 146709, "epoch": 3493} {"train_loss": -6.838870048522949, "global_step": 146710, "epoch": 3493} {"train_loss": -6.879427433013916, "global_step": 146711, "epoch": 3493} {"train_loss": -6.788700103759766, "global_step": 146712, "epoch": 3493} {"train_loss": -6.784049034118652, "global_step": 146713, "epoch": 3493} {"train_loss": -6.873587608337402, "global_step": 146714, "epoch": 3493} {"train_loss": -6.81353235244751, "global_step": 146715, "epoch": 3493} {"train_loss": -6.673039436340332, "global_step": 146716, "epoch": 3493} {"train_loss": -6.737323760986328, "global_step": 146717, "epoch": 3493} {"train_loss": -6.8928022384643555, "global_step": 146718, "epoch": 3493} {"train_loss": -6.87005090713501, "global_step": 146719, "epoch": 3493} {"train_loss": -6.790012359619141, "global_step": 146720, "epoch": 3493} {"train_loss": -6.839534759521484, "global_step": 146721, "epoch": 3493} {"train_loss": -6.8709797859191895, "global_step": 146722, "epoch": 3493} {"train_loss": -6.761089324951172, "global_step": 146723, "epoch": 3493} {"train_loss": -6.791963577270508, "global_step": 146724, "epoch": 3493} {"train_loss": -6.96535062789917, "global_step": 146725, "epoch": 3493} {"train_loss": -6.787448883056641, "global_step": 146726, "epoch": 3493} {"train_loss": -6.913775444030762, "global_step": 146727, "epoch": 3493} {"train_loss": -6.894301414489746, "global_step": 146728, "epoch": 3493} {"train_loss": -6.719083786010742, "global_step": 146729, "epoch": 3493} {"train_loss": -6.81729793548584, "global_step": 146730, "epoch": 3493} {"train_loss": -6.865931510925293, "global_step": 146731, "epoch": 3493} {"train_loss": -6.755692005157471, "global_step": 146732, "epoch": 3493} {"train_loss": -6.741396903991699, "global_step": 146733, "epoch": 3493} {"train_loss": -6.8260111808776855, "global_step": 146734, "epoch": 3493} {"train_loss": -6.806440353393555, "global_step": 146735, "epoch": 3493} {"train_loss": -6.766623020172119, "global_step": 146736, "epoch": 3493} {"train_loss": -6.842494964599609, "global_step": 146737, "epoch": 3493} {"train_loss": -6.786584377288818, "global_step": 146738, "epoch": 3493} {"train_loss": -6.847812652587891, "global_step": 146739, "epoch": 3493} {"train_loss": -6.6548919677734375, "global_step": 146740, "epoch": 3493} {"train_loss": -6.747808456420898, "global_step": 146741, "epoch": 3493} {"train_loss": -6.791141510009766, "global_step": 146742, "epoch": 3493} {"train_loss": -6.74056339263916, "global_step": 146743, "epoch": 3493} {"train_loss": -6.817834854125977, "global_step": 146744, "epoch": 3493} {"train_loss": -6.725057125091553, "global_step": 146745, "epoch": 3493} {"train_loss": -6.845205783843994, "global_step": 146746, "epoch": 3493} {"train_loss": -6.812129894892375, "global_step": 146747, "epoch": 3493, "val_loss": 68019.625} {"train_loss": -6.7871246337890625, "global_step": 146748, "epoch": 3494} {"train_loss": -6.676041603088379, "global_step": 146749, "epoch": 3494} {"train_loss": -6.662502288818359, "global_step": 146750, "epoch": 3494} {"train_loss": -6.835475921630859, "global_step": 146751, "epoch": 3494} {"train_loss": -6.793493747711182, "global_step": 146752, "epoch": 3494} {"train_loss": -6.792694568634033, "global_step": 146753, "epoch": 3494} {"train_loss": -6.772609710693359, "global_step": 146754, "epoch": 3494} {"train_loss": -6.6841721534729, "global_step": 146755, "epoch": 3494} {"train_loss": -6.811141014099121, "global_step": 146756, "epoch": 3494} {"train_loss": -6.764089584350586, "global_step": 146757, "epoch": 3494} {"train_loss": -6.678598880767822, "global_step": 146758, "epoch": 3494} {"train_loss": -6.784626007080078, "global_step": 146759, "epoch": 3494} {"train_loss": -6.830324649810791, "global_step": 146760, "epoch": 3494} {"train_loss": -6.768955230712891, "global_step": 146761, "epoch": 3494} {"train_loss": -6.773908615112305, "global_step": 146762, "epoch": 3494} {"train_loss": -6.8299336433410645, "global_step": 146763, "epoch": 3494} {"train_loss": -6.684343338012695, "global_step": 146764, "epoch": 3494} {"train_loss": -6.79157829284668, "global_step": 146765, "epoch": 3494} {"train_loss": -6.813094615936279, "global_step": 146766, "epoch": 3494} {"train_loss": -6.854124069213867, "global_step": 146767, "epoch": 3494} {"train_loss": -6.856525897979736, "global_step": 146768, "epoch": 3494} {"train_loss": -6.830361366271973, "global_step": 146769, "epoch": 3494} {"train_loss": -6.742459297180176, "global_step": 146770, "epoch": 3494} {"train_loss": -6.825811386108398, "global_step": 146771, "epoch": 3494} {"train_loss": -6.889263153076172, "global_step": 146772, "epoch": 3494} {"train_loss": -6.859608173370361, "global_step": 146773, "epoch": 3494} {"train_loss": -6.79921293258667, "global_step": 146774, "epoch": 3494} {"train_loss": -6.940757751464844, "global_step": 146775, "epoch": 3494} {"train_loss": -6.893466949462891, "global_step": 146776, "epoch": 3494} {"train_loss": -6.697478294372559, "global_step": 146777, "epoch": 3494} {"train_loss": -6.803616523742676, "global_step": 146778, "epoch": 3494} {"train_loss": -6.817020893096924, "global_step": 146779, "epoch": 3494} {"train_loss": -6.775021553039551, "global_step": 146780, "epoch": 3494} {"train_loss": -6.860495090484619, "global_step": 146781, "epoch": 3494} {"train_loss": -6.858765602111816, "global_step": 146782, "epoch": 3494} {"train_loss": -6.819741249084473, "global_step": 146783, "epoch": 3494} {"train_loss": -6.707459449768066, "global_step": 146784, "epoch": 3494} {"train_loss": -6.86357307434082, "global_step": 146785, "epoch": 3494} {"train_loss": -6.954540252685547, "global_step": 146786, "epoch": 3494} {"train_loss": -6.864030838012695, "global_step": 146787, "epoch": 3494} {"train_loss": -6.81673526763916, "global_step": 146788, "epoch": 3494} {"train_loss": -6.802502904619489, "global_step": 146789, "epoch": 3494, "val_loss": 67777.890625} {"train_loss": -6.819293022155762, "global_step": 146790, "epoch": 3495} {"train_loss": -6.809280872344971, "global_step": 146791, "epoch": 3495} {"train_loss": -6.778597831726074, "global_step": 146792, "epoch": 3495} {"train_loss": -6.875323295593262, "global_step": 146793, "epoch": 3495} {"train_loss": -6.76704216003418, "global_step": 146794, "epoch": 3495} {"train_loss": -6.867000102996826, "global_step": 146795, "epoch": 3495} {"train_loss": -6.791252613067627, "global_step": 146796, "epoch": 3495} {"train_loss": -6.784188747406006, "global_step": 146797, "epoch": 3495} {"train_loss": -6.963937759399414, "global_step": 146798, "epoch": 3495} {"train_loss": -6.832030773162842, "global_step": 146799, "epoch": 3495} {"train_loss": -6.951568603515625, "global_step": 146800, "epoch": 3495} {"train_loss": -6.928226947784424, "global_step": 146801, "epoch": 3495} {"train_loss": -6.897253036499023, "global_step": 146802, "epoch": 3495} {"train_loss": -6.823732376098633, "global_step": 146803, "epoch": 3495} {"train_loss": -6.929311752319336, "global_step": 146804, "epoch": 3495} {"train_loss": -6.869913101196289, "global_step": 146805, "epoch": 3495} {"train_loss": -6.863637924194336, "global_step": 146806, "epoch": 3495} {"train_loss": -6.9390411376953125, "global_step": 146807, "epoch": 3495} {"train_loss": -6.837075233459473, "global_step": 146808, "epoch": 3495} {"train_loss": -6.835494518280029, "global_step": 146809, "epoch": 3495} {"train_loss": -6.819780349731445, "global_step": 146810, "epoch": 3495} {"train_loss": -6.857958793640137, "global_step": 146811, "epoch": 3495} {"train_loss": -6.900201320648193, "global_step": 146812, "epoch": 3495} {"train_loss": -6.765626907348633, "global_step": 146813, "epoch": 3495} {"train_loss": -6.925146579742432, "global_step": 146814, "epoch": 3495} {"train_loss": -6.802552223205566, "global_step": 146815, "epoch": 3495} {"train_loss": -6.902480125427246, "global_step": 146816, "epoch": 3495} {"train_loss": -6.845371246337891, "global_step": 146817, "epoch": 3495} {"train_loss": -6.830641746520996, "global_step": 146818, "epoch": 3495} {"train_loss": -6.700745105743408, "global_step": 146819, "epoch": 3495} {"train_loss": -6.736775875091553, "global_step": 146820, "epoch": 3495} {"train_loss": -6.741720199584961, "global_step": 146821, "epoch": 3495} {"train_loss": -6.727303981781006, "global_step": 146822, "epoch": 3495} {"train_loss": -6.676521301269531, "global_step": 146823, "epoch": 3495} {"train_loss": -6.781582355499268, "global_step": 146824, "epoch": 3495} {"train_loss": -6.800281524658203, "global_step": 146825, "epoch": 3495} {"train_loss": -6.835122585296631, "global_step": 146826, "epoch": 3495} {"train_loss": -6.819066524505615, "global_step": 146827, "epoch": 3495} {"train_loss": -6.754287242889404, "global_step": 146828, "epoch": 3495} {"train_loss": -6.865320205688477, "global_step": 146829, "epoch": 3495} {"train_loss": -6.7903900146484375, "global_step": 146830, "epoch": 3495} {"train_loss": -6.8267986206781295, "global_step": 146831, "epoch": 3495, "val_loss": 68007.390625} {"train_loss": -6.873359680175781, "global_step": 146832, "epoch": 3496} {"train_loss": -6.73000431060791, "global_step": 146833, "epoch": 3496} {"train_loss": -6.885658264160156, "global_step": 146834, "epoch": 3496} {"train_loss": -6.8264617919921875, "global_step": 146835, "epoch": 3496} {"train_loss": -6.795914649963379, "global_step": 146836, "epoch": 3496} {"train_loss": -6.681155204772949, "global_step": 146837, "epoch": 3496} {"train_loss": -6.829745292663574, "global_step": 146838, "epoch": 3496} {"train_loss": -6.6724162101745605, "global_step": 146839, "epoch": 3496} {"train_loss": -6.713744163513184, "global_step": 146840, "epoch": 3496} {"train_loss": -6.8030290603637695, "global_step": 146841, "epoch": 3496} {"train_loss": -6.71420955657959, "global_step": 146842, "epoch": 3496} {"train_loss": -6.692216873168945, "global_step": 146843, "epoch": 3496} {"train_loss": -6.894369125366211, "global_step": 146844, "epoch": 3496} {"train_loss": -6.784235000610352, "global_step": 146845, "epoch": 3496} {"train_loss": -6.769125938415527, "global_step": 146846, "epoch": 3496} {"train_loss": -6.801900386810303, "global_step": 146847, "epoch": 3496} {"train_loss": -6.7928361892700195, "global_step": 146848, "epoch": 3496} {"train_loss": -6.927560329437256, "global_step": 146849, "epoch": 3496} {"train_loss": -6.9191741943359375, "global_step": 146850, "epoch": 3496} {"train_loss": -6.788476467132568, "global_step": 146851, "epoch": 3496} {"train_loss": -6.850790977478027, "global_step": 146852, "epoch": 3496} {"train_loss": -6.927945137023926, "global_step": 146853, "epoch": 3496} {"train_loss": -6.849048614501953, "global_step": 146854, "epoch": 3496} {"train_loss": -6.894473552703857, "global_step": 146855, "epoch": 3496} {"train_loss": -6.929511547088623, "global_step": 146856, "epoch": 3496} {"train_loss": -6.793652057647705, "global_step": 146857, "epoch": 3496} {"train_loss": -6.830708026885986, "global_step": 146858, "epoch": 3496} {"train_loss": -6.9278645515441895, "global_step": 146859, "epoch": 3496} {"train_loss": -6.851603031158447, "global_step": 146860, "epoch": 3496} {"train_loss": -6.924996376037598, "global_step": 146861, "epoch": 3496} {"train_loss": -6.835211753845215, "global_step": 146862, "epoch": 3496} {"train_loss": -6.82181453704834, "global_step": 146863, "epoch": 3496} {"train_loss": -6.9554219245910645, "global_step": 146864, "epoch": 3496} {"train_loss": -6.78725528717041, "global_step": 146865, "epoch": 3496} {"train_loss": -6.816943168640137, "global_step": 146866, "epoch": 3496} {"train_loss": -6.8897857666015625, "global_step": 146867, "epoch": 3496} {"train_loss": -6.834747314453125, "global_step": 146868, "epoch": 3496} {"train_loss": -6.846423149108887, "global_step": 146869, "epoch": 3496} {"train_loss": -6.884087085723877, "global_step": 146870, "epoch": 3496} {"train_loss": -6.659891605377197, "global_step": 146871, "epoch": 3496} {"train_loss": -6.8852033615112305, "global_step": 146872, "epoch": 3496} {"train_loss": -6.828281652359736, "global_step": 146873, "epoch": 3496, "val_loss": 67694.015625} {"train_loss": -6.781067371368408, "global_step": 146874, "epoch": 3497} {"train_loss": -6.903823375701904, "global_step": 146875, "epoch": 3497} {"train_loss": -6.8219499588012695, "global_step": 146876, "epoch": 3497} {"train_loss": -6.858485221862793, "global_step": 146877, "epoch": 3497} {"train_loss": -6.899909019470215, "global_step": 146878, "epoch": 3497} {"train_loss": -6.931877613067627, "global_step": 146879, "epoch": 3497} {"train_loss": -6.8705291748046875, "global_step": 146880, "epoch": 3497} {"train_loss": -6.786561012268066, "global_step": 146881, "epoch": 3497} {"train_loss": -6.8958868980407715, "global_step": 146882, "epoch": 3497} {"train_loss": -6.925117015838623, "global_step": 146883, "epoch": 3497} {"train_loss": -6.7422027587890625, "global_step": 146884, "epoch": 3497} {"train_loss": -6.810351371765137, "global_step": 146885, "epoch": 3497} {"train_loss": -6.842902183532715, "global_step": 146886, "epoch": 3497} {"train_loss": -6.5156965255737305, "global_step": 146887, "epoch": 3497} {"train_loss": -6.759268283843994, "global_step": 146888, "epoch": 3497} {"train_loss": -6.912744998931885, "global_step": 146889, "epoch": 3497} {"train_loss": -6.600780487060547, "global_step": 146890, "epoch": 3497} {"train_loss": -6.65483283996582, "global_step": 146891, "epoch": 3497} {"train_loss": -6.8038482666015625, "global_step": 146892, "epoch": 3497} {"train_loss": -6.7976298332214355, "global_step": 146893, "epoch": 3497} {"train_loss": -6.766021728515625, "global_step": 146894, "epoch": 3497} {"train_loss": -6.655243873596191, "global_step": 146895, "epoch": 3497} {"train_loss": -6.772571563720703, "global_step": 146896, "epoch": 3497} {"train_loss": -6.830134391784668, "global_step": 146897, "epoch": 3497} {"train_loss": -6.76242733001709, "global_step": 146898, "epoch": 3497} {"train_loss": -6.8566484451293945, "global_step": 146899, "epoch": 3497} {"train_loss": -6.778875827789307, "global_step": 146900, "epoch": 3497} {"train_loss": -6.818364143371582, "global_step": 146901, "epoch": 3497} {"train_loss": -6.880772113800049, "global_step": 146902, "epoch": 3497} {"train_loss": -6.794307231903076, "global_step": 146903, "epoch": 3497} {"train_loss": -6.757930278778076, "global_step": 146904, "epoch": 3497} {"train_loss": -6.769805908203125, "global_step": 146905, "epoch": 3497} {"train_loss": -6.74102258682251, "global_step": 146906, "epoch": 3497} {"train_loss": -6.826389312744141, "global_step": 146907, "epoch": 3497} {"train_loss": -6.797940254211426, "global_step": 146908, "epoch": 3497} {"train_loss": -6.750932693481445, "global_step": 146909, "epoch": 3497} {"train_loss": -6.959885597229004, "global_step": 146910, "epoch": 3497} {"train_loss": -6.927044868469238, "global_step": 146911, "epoch": 3497} {"train_loss": -6.830236434936523, "global_step": 146912, "epoch": 3497} {"train_loss": -6.901036262512207, "global_step": 146913, "epoch": 3497} {"train_loss": -6.781031608581543, "global_step": 146914, "epoch": 3497} {"train_loss": -6.805780592418852, "global_step": 146915, "epoch": 3497, "val_loss": 67644.578125} {"train_loss": -6.939237594604492, "global_step": 146916, "epoch": 3498} {"train_loss": -6.823975086212158, "global_step": 146917, "epoch": 3498} {"train_loss": -6.910675048828125, "global_step": 146918, "epoch": 3498} {"train_loss": -6.937717914581299, "global_step": 146919, "epoch": 3498} {"train_loss": -6.826740264892578, "global_step": 146920, "epoch": 3498} {"train_loss": -6.915162563323975, "global_step": 146921, "epoch": 3498} {"train_loss": -6.772649765014648, "global_step": 146922, "epoch": 3498} {"train_loss": -6.841785430908203, "global_step": 146923, "epoch": 3498} {"train_loss": -6.707810878753662, "global_step": 146924, "epoch": 3498} {"train_loss": -6.736716270446777, "global_step": 146925, "epoch": 3498} {"train_loss": -6.762143135070801, "global_step": 146926, "epoch": 3498} {"train_loss": -6.733341693878174, "global_step": 146927, "epoch": 3498} {"train_loss": -6.688595771789551, "global_step": 146928, "epoch": 3498} {"train_loss": -6.641641616821289, "global_step": 146929, "epoch": 3498} {"train_loss": -6.735452651977539, "global_step": 146930, "epoch": 3498} {"train_loss": -6.782980918884277, "global_step": 146931, "epoch": 3498} {"train_loss": -6.67160701751709, "global_step": 146932, "epoch": 3498} {"train_loss": -6.806090354919434, "global_step": 146933, "epoch": 3498} {"train_loss": -6.722788333892822, "global_step": 146934, "epoch": 3498} {"train_loss": -6.654311656951904, "global_step": 146935, "epoch": 3498} {"train_loss": -6.710353374481201, "global_step": 146936, "epoch": 3498} {"train_loss": -6.728979587554932, "global_step": 146937, "epoch": 3498} {"train_loss": -6.736291408538818, "global_step": 146938, "epoch": 3498} {"train_loss": -6.76264762878418, "global_step": 146939, "epoch": 3498} {"train_loss": -6.746881484985352, "global_step": 146940, "epoch": 3498} {"train_loss": -6.758329391479492, "global_step": 146941, "epoch": 3498} {"train_loss": -6.737181663513184, "global_step": 146942, "epoch": 3498} {"train_loss": -6.7823567390441895, "global_step": 146943, "epoch": 3498} {"train_loss": -6.759336471557617, "global_step": 146944, "epoch": 3498} {"train_loss": -6.790327072143555, "global_step": 146945, "epoch": 3498} {"train_loss": -6.817265510559082, "global_step": 146946, "epoch": 3498} {"train_loss": -6.734905242919922, "global_step": 146947, "epoch": 3498} {"train_loss": -6.790729522705078, "global_step": 146948, "epoch": 3498} {"train_loss": -6.9225263595581055, "global_step": 146949, "epoch": 3498} {"train_loss": -6.801535606384277, "global_step": 146950, "epoch": 3498} {"train_loss": -6.7797088623046875, "global_step": 146951, "epoch": 3498} {"train_loss": -6.8314666748046875, "global_step": 146952, "epoch": 3498} {"train_loss": -6.881239414215088, "global_step": 146953, "epoch": 3498} {"train_loss": -6.824945449829102, "global_step": 146954, "epoch": 3498} {"train_loss": -6.868464469909668, "global_step": 146955, "epoch": 3498} {"train_loss": -6.9707841873168945, "global_step": 146956, "epoch": 3498} {"train_loss": -6.787094127564203, "global_step": 146957, "epoch": 3498, "val_loss": 67559.578125} {"train_loss": -6.899665832519531, "global_step": 146958, "epoch": 3499} {"train_loss": -6.67996883392334, "global_step": 146959, "epoch": 3499} {"train_loss": -6.902231216430664, "global_step": 146960, "epoch": 3499} {"train_loss": -6.809810638427734, "global_step": 146961, "epoch": 3499} {"train_loss": -6.709427833557129, "global_step": 146962, "epoch": 3499} {"train_loss": -6.793887138366699, "global_step": 146963, "epoch": 3499} {"train_loss": -6.7923407554626465, "global_step": 146964, "epoch": 3499} {"train_loss": -6.752890586853027, "global_step": 146965, "epoch": 3499} {"train_loss": -6.8704328536987305, "global_step": 146966, "epoch": 3499} {"train_loss": -6.905735015869141, "global_step": 146967, "epoch": 3499} {"train_loss": -6.852241039276123, "global_step": 146968, "epoch": 3499} {"train_loss": -6.922720909118652, "global_step": 146969, "epoch": 3499} {"train_loss": -6.781850814819336, "global_step": 146970, "epoch": 3499} {"train_loss": -6.875764846801758, "global_step": 146971, "epoch": 3499} {"train_loss": -6.807348251342773, "global_step": 146972, "epoch": 3499} {"train_loss": -6.7745361328125, "global_step": 146973, "epoch": 3499} {"train_loss": -6.920830726623535, "global_step": 146974, "epoch": 3499} {"train_loss": -6.8140668869018555, "global_step": 146975, "epoch": 3499} {"train_loss": -6.812345504760742, "global_step": 146976, "epoch": 3499} {"train_loss": -6.820131301879883, "global_step": 146977, "epoch": 3499} {"train_loss": -6.8096089363098145, "global_step": 146978, "epoch": 3499} {"train_loss": -6.916094779968262, "global_step": 146979, "epoch": 3499} {"train_loss": -6.785052299499512, "global_step": 146980, "epoch": 3499} {"train_loss": -6.802594184875488, "global_step": 146981, "epoch": 3499} {"train_loss": -6.880939483642578, "global_step": 146982, "epoch": 3499} {"train_loss": -6.858180999755859, "global_step": 146983, "epoch": 3499} {"train_loss": -6.826846122741699, "global_step": 146984, "epoch": 3499} {"train_loss": -6.809089660644531, "global_step": 146985, "epoch": 3499} {"train_loss": -6.819113254547119, "global_step": 146986, "epoch": 3499} {"train_loss": -6.891373634338379, "global_step": 146987, "epoch": 3499} {"train_loss": -6.758685111999512, "global_step": 146988, "epoch": 3499} {"train_loss": -6.723708152770996, "global_step": 146989, "epoch": 3499} {"train_loss": -6.897940158843994, "global_step": 146990, "epoch": 3499} {"train_loss": -6.820797920227051, "global_step": 146991, "epoch": 3499} {"train_loss": -6.967108726501465, "global_step": 146992, "epoch": 3499} {"train_loss": -6.855952262878418, "global_step": 146993, "epoch": 3499} {"train_loss": -6.774164199829102, "global_step": 146994, "epoch": 3499} {"train_loss": -6.897871971130371, "global_step": 146995, "epoch": 3499} {"train_loss": -6.890616416931152, "global_step": 146996, "epoch": 3499} {"train_loss": -6.824648380279541, "global_step": 146997, "epoch": 3499} {"train_loss": -6.829004764556885, "global_step": 146998, "epoch": 3499} {"train_loss": -6.8334067321959, "global_step": 146999, "epoch": 3499, "val_loss": 67850.4375} {"train_loss": -6.871427536010742, "global_step": 147000, "epoch": 3500} {"train_loss": -6.922959327697754, "global_step": 147001, "epoch": 3500} {"train_loss": -6.806752681732178, "global_step": 147002, "epoch": 3500} {"train_loss": -6.7424468994140625, "global_step": 147003, "epoch": 3500} {"train_loss": -6.8792924880981445, "global_step": 147004, "epoch": 3500} {"train_loss": -6.832828998565674, "global_step": 147005, "epoch": 3500} {"train_loss": -6.772159099578857, "global_step": 147006, "epoch": 3500} {"train_loss": -6.9532012939453125, "global_step": 147007, "epoch": 3500} {"train_loss": -6.825742721557617, "global_step": 147008, "epoch": 3500} {"train_loss": -6.775624752044678, "global_step": 147009, "epoch": 3500} {"train_loss": -6.8190460205078125, "global_step": 147010, "epoch": 3500} {"train_loss": -6.897556304931641, "global_step": 147011, "epoch": 3500} {"train_loss": -6.765538215637207, "global_step": 147012, "epoch": 3500} {"train_loss": -7.054098129272461, "global_step": 147013, "epoch": 3500} {"train_loss": -6.818195343017578, "global_step": 147014, "epoch": 3500} {"train_loss": -6.858095169067383, "global_step": 147015, "epoch": 3500} {"train_loss": -6.771203994750977, "global_step": 147016, "epoch": 3500} {"train_loss": -6.752094745635986, "global_step": 147017, "epoch": 3500} {"train_loss": -6.867659568786621, "global_step": 147018, "epoch": 3500} {"train_loss": -6.799707889556885, "global_step": 147019, "epoch": 3500} {"train_loss": -6.8430328369140625, "global_step": 147020, "epoch": 3500} {"train_loss": -6.881197452545166, "global_step": 147021, "epoch": 3500} {"train_loss": -6.797368049621582, "global_step": 147022, "epoch": 3500} {"train_loss": -6.902400016784668, "global_step": 147023, "epoch": 3500} {"train_loss": -6.762010097503662, "global_step": 147024, "epoch": 3500} {"train_loss": -6.8762407302856445, "global_step": 147025, "epoch": 3500} {"train_loss": -6.739536762237549, "global_step": 147026, "epoch": 3500} {"train_loss": -6.807456970214844, "global_step": 147027, "epoch": 3500} {"train_loss": -6.884167671203613, "global_step": 147028, "epoch": 3500} {"train_loss": -6.693329334259033, "global_step": 147029, "epoch": 3500} {"train_loss": -6.949785232543945, "global_step": 147030, "epoch": 3500} {"train_loss": -6.795502662658691, "global_step": 147031, "epoch": 3500} {"train_loss": -6.785280227661133, "global_step": 147032, "epoch": 3500} {"train_loss": -6.803163528442383, "global_step": 147033, "epoch": 3500} {"train_loss": -6.823738098144531, "global_step": 147034, "epoch": 3500} {"train_loss": -6.917768955230713, "global_step": 147035, "epoch": 3500} {"train_loss": -6.823009967803955, "global_step": 147036, "epoch": 3500} {"train_loss": -6.829711437225342, "global_step": 147037, "epoch": 3500} {"train_loss": -6.833761215209961, "global_step": 147038, "epoch": 3500} {"train_loss": -6.81959342956543, "global_step": 147039, "epoch": 3500} {"train_loss": -6.6400651931762695, "global_step": 147040, "epoch": 3500} {"train_loss": -6.829185712905157, "global_step": 147041, "epoch": 3500, "train/sim_max_reward_0": 0.19314740038255593, "train/sim_max_reward_1": 0.7838860786838302, "train/sim_max_reward_2": 0.47865123817706334, "train/sim_max_reward_3": 0.4098688920653756, "train/sim_max_reward_4": 0.9582612995022498, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.33271405884490723, "test/sim_max_reward_4300001": 0.4090298661614353, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.9576351272406228, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8196504550028353, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.34178786191791394, "test/sim_max_reward_4300008": 0.7102994987957265, "test/sim_max_reward_4300009": 0.9942937196339452, "test/sim_max_reward_4300010": 0.8198452856282415, "test/sim_max_reward_4300011": 0.7136818047512897, "test/sim_max_reward_4300012": 0.9961125422235348, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9836315462813898, "test/sim_max_reward_4300016": 0.9618467992284329, "test/sim_max_reward_4300017": 0.9812191728727968, "test/sim_max_reward_4300018": 0.43958063486184196, "test/sim_max_reward_4300019": 0.18601141238224275, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9716462963868994, "test/sim_max_reward_4300022": 0.9636483983656402, "test/sim_max_reward_4300023": 0.3266833948451827, "test/sim_max_reward_4300024": 0.9264622072878903, "test/sim_max_reward_4300025": 0.8956496650115622, "test/sim_max_reward_4300026": 0.16068445142405385, "test/sim_max_reward_4300027": 0.9434092329549199, "test/sim_max_reward_4300028": 0.9565770545082587, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.1245486552610598, "test/sim_max_reward_4300031": 0.2165713982937467, "test/sim_max_reward_4300032": 0.938550330018922, "test/sim_max_reward_4300033": 0.9263999783383047, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8550147142129794, "test/sim_max_reward_4300038": 0.585216708219342, "test/sim_max_reward_4300039": 0.8754539067969282, "test/sim_max_reward_4300040": 0.9186382117675168, "test/sim_max_reward_4300041": 0.3130008485338155, "test/sim_max_reward_4300042": 0.7222997699692806, "test/sim_max_reward_4300043": 0.15662055303581485, "test/sim_max_reward_4300044": 0.9481686903030089, "test/sim_max_reward_4300045": 0.18862407790920466, "test/sim_max_reward_4300046": 0.9172715517446771, "test/sim_max_reward_4300047": 0.12088128354891643, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.1375235895109698, "train/mean_score": 0.5027999446955437, "test/mean_score": 0.5790382594889764, "val_loss": 67762.53125} {"train_loss": -6.944314956665039, "global_step": 147042, "epoch": 3501} {"train_loss": -6.767307281494141, "global_step": 147043, "epoch": 3501} {"train_loss": -6.805999755859375, "global_step": 147044, "epoch": 3501} {"train_loss": -6.930686950683594, "global_step": 147045, "epoch": 3501} {"train_loss": -6.724047660827637, "global_step": 147046, "epoch": 3501} {"train_loss": -6.9162163734436035, "global_step": 147047, "epoch": 3501} {"train_loss": -6.661177158355713, "global_step": 147048, "epoch": 3501} {"train_loss": -6.7540283203125, "global_step": 147049, "epoch": 3501} {"train_loss": -6.839654922485352, "global_step": 147050, "epoch": 3501} {"train_loss": -6.741755485534668, "global_step": 147051, "epoch": 3501} {"train_loss": -6.755602836608887, "global_step": 147052, "epoch": 3501} {"train_loss": -6.6736273765563965, "global_step": 147053, "epoch": 3501} {"train_loss": -6.626018047332764, "global_step": 147054, "epoch": 3501} {"train_loss": -6.749966621398926, "global_step": 147055, "epoch": 3501} {"train_loss": -6.665091037750244, "global_step": 147056, "epoch": 3501} {"train_loss": -6.906210422515869, "global_step": 147057, "epoch": 3501} {"train_loss": -6.753422737121582, "global_step": 147058, "epoch": 3501} {"train_loss": -6.750476837158203, "global_step": 147059, "epoch": 3501} {"train_loss": -6.7318267822265625, "global_step": 147060, "epoch": 3501} {"train_loss": -6.605223655700684, "global_step": 147061, "epoch": 3501} {"train_loss": -6.779853820800781, "global_step": 147062, "epoch": 3501} {"train_loss": -6.812559127807617, "global_step": 147063, "epoch": 3501} {"train_loss": -6.776876449584961, "global_step": 147064, "epoch": 3501} {"train_loss": -6.853911399841309, "global_step": 147065, "epoch": 3501} {"train_loss": -6.839041709899902, "global_step": 147066, "epoch": 3501} {"train_loss": -6.7345991134643555, "global_step": 147067, "epoch": 3501} {"train_loss": -6.90709114074707, "global_step": 147068, "epoch": 3501} {"train_loss": -6.875518798828125, "global_step": 147069, "epoch": 3501} {"train_loss": -6.81585693359375, "global_step": 147070, "epoch": 3501} {"train_loss": -6.993834018707275, "global_step": 147071, "epoch": 3501} {"train_loss": -6.806110858917236, "global_step": 147072, "epoch": 3501} {"train_loss": -6.676321029663086, "global_step": 147073, "epoch": 3501} {"train_loss": -6.826539516448975, "global_step": 147074, "epoch": 3501} {"train_loss": -6.923371315002441, "global_step": 147075, "epoch": 3501} {"train_loss": -6.750721454620361, "global_step": 147076, "epoch": 3501} {"train_loss": -6.947949409484863, "global_step": 147077, "epoch": 3501} {"train_loss": -6.762426853179932, "global_step": 147078, "epoch": 3501} {"train_loss": -6.79648494720459, "global_step": 147079, "epoch": 3501} {"train_loss": -6.902022361755371, "global_step": 147080, "epoch": 3501} {"train_loss": -6.985937595367432, "global_step": 147081, "epoch": 3501} {"train_loss": -6.704746246337891, "global_step": 147082, "epoch": 3501} {"train_loss": -6.80378270149231, "global_step": 147083, "epoch": 3501, "val_loss": 67708.3125} {"train_loss": -6.842623710632324, "global_step": 147084, "epoch": 3502} {"train_loss": -6.870023727416992, "global_step": 147085, "epoch": 3502} {"train_loss": -6.840147018432617, "global_step": 147086, "epoch": 3502} {"train_loss": -6.842535972595215, "global_step": 147087, "epoch": 3502} {"train_loss": -6.8252739906311035, "global_step": 147088, "epoch": 3502} {"train_loss": -6.932999610900879, "global_step": 147089, "epoch": 3502} {"train_loss": -6.867800712585449, "global_step": 147090, "epoch": 3502} {"train_loss": -6.890993118286133, "global_step": 147091, "epoch": 3502} {"train_loss": -6.7546234130859375, "global_step": 147092, "epoch": 3502} {"train_loss": -6.886488437652588, "global_step": 147093, "epoch": 3502} {"train_loss": -6.805313587188721, "global_step": 147094, "epoch": 3502} {"train_loss": -6.77781867980957, "global_step": 147095, "epoch": 3502} {"train_loss": -6.7036261558532715, "global_step": 147096, "epoch": 3502} {"train_loss": -6.765432357788086, "global_step": 147097, "epoch": 3502} {"train_loss": -6.869447231292725, "global_step": 147098, "epoch": 3502} {"train_loss": -6.691682815551758, "global_step": 147099, "epoch": 3502} {"train_loss": -6.830989837646484, "global_step": 147100, "epoch": 3502} {"train_loss": -6.8094024658203125, "global_step": 147101, "epoch": 3502} {"train_loss": -6.904788494110107, "global_step": 147102, "epoch": 3502} {"train_loss": -6.797765731811523, "global_step": 147103, "epoch": 3502} {"train_loss": -6.801634788513184, "global_step": 147104, "epoch": 3502} {"train_loss": -6.849816799163818, "global_step": 147105, "epoch": 3502} {"train_loss": -6.805322170257568, "global_step": 147106, "epoch": 3502} {"train_loss": -6.754642486572266, "global_step": 147107, "epoch": 3502} {"train_loss": -6.769588947296143, "global_step": 147108, "epoch": 3502} {"train_loss": -6.7979230880737305, "global_step": 147109, "epoch": 3502} {"train_loss": -6.808238983154297, "global_step": 147110, "epoch": 3502} {"train_loss": -6.78675651550293, "global_step": 147111, "epoch": 3502} {"train_loss": -6.696122169494629, "global_step": 147112, "epoch": 3502} {"train_loss": -6.8940300941467285, "global_step": 147113, "epoch": 3502} {"train_loss": -6.917747497558594, "global_step": 147114, "epoch": 3502} {"train_loss": -6.849626541137695, "global_step": 147115, "epoch": 3502} {"train_loss": -6.909583568572998, "global_step": 147116, "epoch": 3502} {"train_loss": -6.795845031738281, "global_step": 147117, "epoch": 3502} {"train_loss": -6.727317810058594, "global_step": 147118, "epoch": 3502} {"train_loss": -6.90437126159668, "global_step": 147119, "epoch": 3502} {"train_loss": -6.848456382751465, "global_step": 147120, "epoch": 3502} {"train_loss": -6.889943599700928, "global_step": 147121, "epoch": 3502} {"train_loss": -6.791357040405273, "global_step": 147122, "epoch": 3502} {"train_loss": -6.91337776184082, "global_step": 147123, "epoch": 3502} {"train_loss": -6.756497383117676, "global_step": 147124, "epoch": 3502} {"train_loss": -6.82750517981393, "global_step": 147125, "epoch": 3502, "val_loss": 67899.953125} {"train_loss": -6.892030715942383, "global_step": 147126, "epoch": 3503} {"train_loss": -6.816381454467773, "global_step": 147127, "epoch": 3503} {"train_loss": -6.80466890335083, "global_step": 147128, "epoch": 3503} {"train_loss": -6.936840057373047, "global_step": 147129, "epoch": 3503} {"train_loss": -6.825126647949219, "global_step": 147130, "epoch": 3503} {"train_loss": -6.881143569946289, "global_step": 147131, "epoch": 3503} {"train_loss": -6.923309326171875, "global_step": 147132, "epoch": 3503} {"train_loss": -6.876350402832031, "global_step": 147133, "epoch": 3503} {"train_loss": -6.911603927612305, "global_step": 147134, "epoch": 3503} {"train_loss": -6.900053977966309, "global_step": 147135, "epoch": 3503} {"train_loss": -6.860451698303223, "global_step": 147136, "epoch": 3503} {"train_loss": -6.863216400146484, "global_step": 147137, "epoch": 3503} {"train_loss": -6.837759971618652, "global_step": 147138, "epoch": 3503} {"train_loss": -6.944608211517334, "global_step": 147139, "epoch": 3503} {"train_loss": -6.896970748901367, "global_step": 147140, "epoch": 3503} {"train_loss": -6.901881217956543, "global_step": 147141, "epoch": 3503} {"train_loss": -6.906367301940918, "global_step": 147142, "epoch": 3503} {"train_loss": -6.930707931518555, "global_step": 147143, "epoch": 3503} {"train_loss": -6.775731563568115, "global_step": 147144, "epoch": 3503} {"train_loss": -6.842435836791992, "global_step": 147145, "epoch": 3503} {"train_loss": -6.779443264007568, "global_step": 147146, "epoch": 3503} {"train_loss": -6.840619087219238, "global_step": 147147, "epoch": 3503} {"train_loss": -6.685002326965332, "global_step": 147148, "epoch": 3503} {"train_loss": -6.859443664550781, "global_step": 147149, "epoch": 3503} {"train_loss": -6.871547698974609, "global_step": 147150, "epoch": 3503} {"train_loss": -6.845516204833984, "global_step": 147151, "epoch": 3503} {"train_loss": -6.861665725708008, "global_step": 147152, "epoch": 3503} {"train_loss": -6.752992153167725, "global_step": 147153, "epoch": 3503} {"train_loss": -6.809038162231445, "global_step": 147154, "epoch": 3503} {"train_loss": -6.880675315856934, "global_step": 147155, "epoch": 3503} {"train_loss": -6.832018852233887, "global_step": 147156, "epoch": 3503} {"train_loss": -6.875644207000732, "global_step": 147157, "epoch": 3503} {"train_loss": -6.866616249084473, "global_step": 147158, "epoch": 3503} {"train_loss": -6.930386066436768, "global_step": 147159, "epoch": 3503} {"train_loss": -6.846721649169922, "global_step": 147160, "epoch": 3503} {"train_loss": -6.714561462402344, "global_step": 147161, "epoch": 3503} {"train_loss": -6.831717491149902, "global_step": 147162, "epoch": 3503} {"train_loss": -6.702024936676025, "global_step": 147163, "epoch": 3503} {"train_loss": -6.755095958709717, "global_step": 147164, "epoch": 3503} {"train_loss": -6.806117534637451, "global_step": 147165, "epoch": 3503} {"train_loss": -6.646944999694824, "global_step": 147166, "epoch": 3503} {"train_loss": -6.842755045209612, "global_step": 147167, "epoch": 3503, "val_loss": 67864.3046875} {"train_loss": -6.656144142150879, "global_step": 147168, "epoch": 3504} {"train_loss": -6.841931343078613, "global_step": 147169, "epoch": 3504} {"train_loss": -6.672182083129883, "global_step": 147170, "epoch": 3504} {"train_loss": -6.735252857208252, "global_step": 147171, "epoch": 3504} {"train_loss": -6.75545597076416, "global_step": 147172, "epoch": 3504} {"train_loss": -6.858880043029785, "global_step": 147173, "epoch": 3504} {"train_loss": -6.733622074127197, "global_step": 147174, "epoch": 3504} {"train_loss": -6.706816673278809, "global_step": 147175, "epoch": 3504} {"train_loss": -6.788242340087891, "global_step": 147176, "epoch": 3504} {"train_loss": -6.7454094886779785, "global_step": 147177, "epoch": 3504} {"train_loss": -6.61366605758667, "global_step": 147178, "epoch": 3504} {"train_loss": -6.897098541259766, "global_step": 147179, "epoch": 3504} {"train_loss": -6.805307865142822, "global_step": 147180, "epoch": 3504} {"train_loss": -6.800654411315918, "global_step": 147181, "epoch": 3504} {"train_loss": -6.920731544494629, "global_step": 147182, "epoch": 3504} {"train_loss": -6.813108444213867, "global_step": 147183, "epoch": 3504} {"train_loss": -6.952742576599121, "global_step": 147184, "epoch": 3504} {"train_loss": -6.7550048828125, "global_step": 147185, "epoch": 3504} {"train_loss": -6.7581787109375, "global_step": 147186, "epoch": 3504} {"train_loss": -6.783719062805176, "global_step": 147187, "epoch": 3504} {"train_loss": -6.751217842102051, "global_step": 147188, "epoch": 3504} {"train_loss": -6.843376159667969, "global_step": 147189, "epoch": 3504} {"train_loss": -6.891090393066406, "global_step": 147190, "epoch": 3504} {"train_loss": -6.722970008850098, "global_step": 147191, "epoch": 3504} {"train_loss": -6.816104888916016, "global_step": 147192, "epoch": 3504} {"train_loss": -6.820326805114746, "global_step": 147193, "epoch": 3504} {"train_loss": -6.7827348709106445, "global_step": 147194, "epoch": 3504} {"train_loss": -6.7183918952941895, "global_step": 147195, "epoch": 3504} {"train_loss": -6.753366470336914, "global_step": 147196, "epoch": 3504} {"train_loss": -6.838494300842285, "global_step": 147197, "epoch": 3504} {"train_loss": -6.889904022216797, "global_step": 147198, "epoch": 3504} {"train_loss": -6.75604248046875, "global_step": 147199, "epoch": 3504} {"train_loss": -6.894453048706055, "global_step": 147200, "epoch": 3504} {"train_loss": -6.797098159790039, "global_step": 147201, "epoch": 3504} {"train_loss": -6.884258270263672, "global_step": 147202, "epoch": 3504} {"train_loss": -6.736487865447998, "global_step": 147203, "epoch": 3504} {"train_loss": -6.784521102905273, "global_step": 147204, "epoch": 3504} {"train_loss": -6.898150444030762, "global_step": 147205, "epoch": 3504} {"train_loss": -6.856644153594971, "global_step": 147206, "epoch": 3504} {"train_loss": -6.885008811950684, "global_step": 147207, "epoch": 3504} {"train_loss": -6.829972267150879, "global_step": 147208, "epoch": 3504} {"train_loss": -6.800111293792725, "global_step": 147209, "epoch": 3504, "val_loss": 67790.1015625} {"train_loss": -6.707082748413086, "global_step": 147210, "epoch": 3505} {"train_loss": -6.8846917152404785, "global_step": 147211, "epoch": 3505} {"train_loss": -6.807971000671387, "global_step": 147212, "epoch": 3505} {"train_loss": -6.883391380310059, "global_step": 147213, "epoch": 3505} {"train_loss": -6.915782451629639, "global_step": 147214, "epoch": 3505} {"train_loss": -6.766663551330566, "global_step": 147215, "epoch": 3505} {"train_loss": -6.812551498413086, "global_step": 147216, "epoch": 3505} {"train_loss": -6.782990455627441, "global_step": 147217, "epoch": 3505} {"train_loss": -6.894634246826172, "global_step": 147218, "epoch": 3505} {"train_loss": -6.878837585449219, "global_step": 147219, "epoch": 3505} {"train_loss": -6.845220565795898, "global_step": 147220, "epoch": 3505} {"train_loss": -6.880450248718262, "global_step": 147221, "epoch": 3505} {"train_loss": -6.79367733001709, "global_step": 147222, "epoch": 3505} {"train_loss": -6.925967693328857, "global_step": 147223, "epoch": 3505} {"train_loss": -6.7819294929504395, "global_step": 147224, "epoch": 3505} {"train_loss": -6.804211616516113, "global_step": 147225, "epoch": 3505} {"train_loss": -6.818051338195801, "global_step": 147226, "epoch": 3505} {"train_loss": -6.812339782714844, "global_step": 147227, "epoch": 3505} {"train_loss": -6.961676597595215, "global_step": 147228, "epoch": 3505} {"train_loss": -6.8155717849731445, "global_step": 147229, "epoch": 3505} {"train_loss": -6.724878787994385, "global_step": 147230, "epoch": 3505} {"train_loss": -6.841724872589111, "global_step": 147231, "epoch": 3505} {"train_loss": -6.802301406860352, "global_step": 147232, "epoch": 3505} {"train_loss": -6.755623817443848, "global_step": 147233, "epoch": 3505} {"train_loss": -6.805405616760254, "global_step": 147234, "epoch": 3505} {"train_loss": -6.852290153503418, "global_step": 147235, "epoch": 3505} {"train_loss": -6.852052211761475, "global_step": 147236, "epoch": 3505} {"train_loss": -6.806958198547363, "global_step": 147237, "epoch": 3505} {"train_loss": -6.841700553894043, "global_step": 147238, "epoch": 3505} {"train_loss": -6.820666313171387, "global_step": 147239, "epoch": 3505} {"train_loss": -6.7246809005737305, "global_step": 147240, "epoch": 3505} {"train_loss": -6.80018424987793, "global_step": 147241, "epoch": 3505} {"train_loss": -6.777250289916992, "global_step": 147242, "epoch": 3505} {"train_loss": -6.894335746765137, "global_step": 147243, "epoch": 3505} {"train_loss": -6.68231201171875, "global_step": 147244, "epoch": 3505} {"train_loss": -6.678979873657227, "global_step": 147245, "epoch": 3505} {"train_loss": -6.763993263244629, "global_step": 147246, "epoch": 3505} {"train_loss": -6.722499847412109, "global_step": 147247, "epoch": 3505} {"train_loss": -6.7335286140441895, "global_step": 147248, "epoch": 3505} {"train_loss": -6.861678123474121, "global_step": 147249, "epoch": 3505} {"train_loss": -6.769451141357422, "global_step": 147250, "epoch": 3505} {"train_loss": -6.812573512395223, "global_step": 147251, "epoch": 3505, "val_loss": 67835.703125} {"train_loss": -6.8032660484313965, "global_step": 147252, "epoch": 3506} {"train_loss": -6.885473251342773, "global_step": 147253, "epoch": 3506} {"train_loss": -6.898895263671875, "global_step": 147254, "epoch": 3506} {"train_loss": -6.831169128417969, "global_step": 147255, "epoch": 3506} {"train_loss": -6.768989086151123, "global_step": 147256, "epoch": 3506} {"train_loss": -6.879583835601807, "global_step": 147257, "epoch": 3506} {"train_loss": -6.932201385498047, "global_step": 147258, "epoch": 3506} {"train_loss": -6.804330348968506, "global_step": 147259, "epoch": 3506} {"train_loss": -6.805548667907715, "global_step": 147260, "epoch": 3506} {"train_loss": -6.77224063873291, "global_step": 147261, "epoch": 3506} {"train_loss": -6.736697673797607, "global_step": 147262, "epoch": 3506} {"train_loss": -6.783173561096191, "global_step": 147263, "epoch": 3506} {"train_loss": -6.832138538360596, "global_step": 147264, "epoch": 3506} {"train_loss": -6.8339524269104, "global_step": 147265, "epoch": 3506} {"train_loss": -6.8306379318237305, "global_step": 147266, "epoch": 3506} {"train_loss": -6.811507701873779, "global_step": 147267, "epoch": 3506} {"train_loss": -6.815452575683594, "global_step": 147268, "epoch": 3506} {"train_loss": -6.835161209106445, "global_step": 147269, "epoch": 3506} {"train_loss": -6.7382402420043945, "global_step": 147270, "epoch": 3506} {"train_loss": -6.779506683349609, "global_step": 147271, "epoch": 3506} {"train_loss": -6.738882064819336, "global_step": 147272, "epoch": 3506} {"train_loss": -6.765354156494141, "global_step": 147273, "epoch": 3506} {"train_loss": -6.805373191833496, "global_step": 147274, "epoch": 3506} {"train_loss": -6.785236358642578, "global_step": 147275, "epoch": 3506} {"train_loss": -6.851595878601074, "global_step": 147276, "epoch": 3506} {"train_loss": -6.814665794372559, "global_step": 147277, "epoch": 3506} {"train_loss": -6.702736854553223, "global_step": 147278, "epoch": 3506} {"train_loss": -6.821931838989258, "global_step": 147279, "epoch": 3506} {"train_loss": -6.677336692810059, "global_step": 147280, "epoch": 3506} {"train_loss": -6.761441230773926, "global_step": 147281, "epoch": 3506} {"train_loss": -6.793780326843262, "global_step": 147282, "epoch": 3506} {"train_loss": -6.869168281555176, "global_step": 147283, "epoch": 3506} {"train_loss": -6.682251930236816, "global_step": 147284, "epoch": 3506} {"train_loss": -6.4860968589782715, "global_step": 147285, "epoch": 3506} {"train_loss": -6.7322306632995605, "global_step": 147286, "epoch": 3506} {"train_loss": -6.575206756591797, "global_step": 147287, "epoch": 3506} {"train_loss": -6.708663463592529, "global_step": 147288, "epoch": 3506} {"train_loss": -6.634843349456787, "global_step": 147289, "epoch": 3506} {"train_loss": -6.756028175354004, "global_step": 147290, "epoch": 3506} {"train_loss": -6.590374946594238, "global_step": 147291, "epoch": 3506} {"train_loss": -6.522026062011719, "global_step": 147292, "epoch": 3506} {"train_loss": -6.766511179151989, "global_step": 147293, "epoch": 3506, "val_loss": 68086.578125} {"train_loss": -6.737300872802734, "global_step": 147294, "epoch": 3507} {"train_loss": -6.691534996032715, "global_step": 147295, "epoch": 3507} {"train_loss": -6.7252912521362305, "global_step": 147296, "epoch": 3507} {"train_loss": -6.76019287109375, "global_step": 147297, "epoch": 3507} {"train_loss": -6.737115859985352, "global_step": 147298, "epoch": 3507} {"train_loss": -6.780259609222412, "global_step": 147299, "epoch": 3507} {"train_loss": -6.741365432739258, "global_step": 147300, "epoch": 3507} {"train_loss": -6.775984287261963, "global_step": 147301, "epoch": 3507} {"train_loss": -6.868993759155273, "global_step": 147302, "epoch": 3507} {"train_loss": -6.878391265869141, "global_step": 147303, "epoch": 3507} {"train_loss": -6.781095504760742, "global_step": 147304, "epoch": 3507} {"train_loss": -6.894039630889893, "global_step": 147305, "epoch": 3507} {"train_loss": -6.7993059158325195, "global_step": 147306, "epoch": 3507} {"train_loss": -6.891922473907471, "global_step": 147307, "epoch": 3507} {"train_loss": -6.852205276489258, "global_step": 147308, "epoch": 3507} {"train_loss": -6.78072452545166, "global_step": 147309, "epoch": 3507} {"train_loss": -6.79872989654541, "global_step": 147310, "epoch": 3507} {"train_loss": -6.733741283416748, "global_step": 147311, "epoch": 3507} {"train_loss": -6.789360046386719, "global_step": 147312, "epoch": 3507} {"train_loss": -6.951780319213867, "global_step": 147313, "epoch": 3507} {"train_loss": -6.715336322784424, "global_step": 147314, "epoch": 3507} {"train_loss": -6.818236351013184, "global_step": 147315, "epoch": 3507} {"train_loss": -6.895468711853027, "global_step": 147316, "epoch": 3507} {"train_loss": -6.718858242034912, "global_step": 147317, "epoch": 3507} {"train_loss": -6.774619102478027, "global_step": 147318, "epoch": 3507} {"train_loss": -6.787238121032715, "global_step": 147319, "epoch": 3507} {"train_loss": -6.8153791427612305, "global_step": 147320, "epoch": 3507} {"train_loss": -6.78619384765625, "global_step": 147321, "epoch": 3507} {"train_loss": -6.83586311340332, "global_step": 147322, "epoch": 3507} {"train_loss": -6.797524452209473, "global_step": 147323, "epoch": 3507} {"train_loss": -6.891779899597168, "global_step": 147324, "epoch": 3507} {"train_loss": -6.611125946044922, "global_step": 147325, "epoch": 3507} {"train_loss": -6.814685821533203, "global_step": 147326, "epoch": 3507} {"train_loss": -6.84555721282959, "global_step": 147327, "epoch": 3507} {"train_loss": -6.832915306091309, "global_step": 147328, "epoch": 3507} {"train_loss": -6.857553958892822, "global_step": 147329, "epoch": 3507} {"train_loss": -6.878780841827393, "global_step": 147330, "epoch": 3507} {"train_loss": -6.694506645202637, "global_step": 147331, "epoch": 3507} {"train_loss": -6.796640872955322, "global_step": 147332, "epoch": 3507} {"train_loss": -6.841475009918213, "global_step": 147333, "epoch": 3507} {"train_loss": -6.782905101776123, "global_step": 147334, "epoch": 3507} {"train_loss": -6.7983207021440775, "global_step": 147335, "epoch": 3507, "val_loss": 67656.65625} {"train_loss": -6.752854347229004, "global_step": 147336, "epoch": 3508} {"train_loss": -6.878114700317383, "global_step": 147337, "epoch": 3508} {"train_loss": -6.78068208694458, "global_step": 147338, "epoch": 3508} {"train_loss": -6.789882659912109, "global_step": 147339, "epoch": 3508} {"train_loss": -6.759485244750977, "global_step": 147340, "epoch": 3508} {"train_loss": -6.899728775024414, "global_step": 147341, "epoch": 3508} {"train_loss": -6.84041690826416, "global_step": 147342, "epoch": 3508} {"train_loss": -6.684532165527344, "global_step": 147343, "epoch": 3508} {"train_loss": -6.8086395263671875, "global_step": 147344, "epoch": 3508} {"train_loss": -6.806918144226074, "global_step": 147345, "epoch": 3508} {"train_loss": -6.914502143859863, "global_step": 147346, "epoch": 3508} {"train_loss": -6.843148231506348, "global_step": 147347, "epoch": 3508} {"train_loss": -6.838844299316406, "global_step": 147348, "epoch": 3508} {"train_loss": -6.950960636138916, "global_step": 147349, "epoch": 3508} {"train_loss": -6.890501976013184, "global_step": 147350, "epoch": 3508} {"train_loss": -6.892321586608887, "global_step": 147351, "epoch": 3508} {"train_loss": -6.849251747131348, "global_step": 147352, "epoch": 3508} {"train_loss": -6.853354454040527, "global_step": 147353, "epoch": 3508} {"train_loss": -6.879875183105469, "global_step": 147354, "epoch": 3508} {"train_loss": -6.643176078796387, "global_step": 147355, "epoch": 3508} {"train_loss": -6.78550910949707, "global_step": 147356, "epoch": 3508} {"train_loss": -6.892661094665527, "global_step": 147357, "epoch": 3508} {"train_loss": -6.7825117111206055, "global_step": 147358, "epoch": 3508} {"train_loss": -6.659200668334961, "global_step": 147359, "epoch": 3508} {"train_loss": -6.8500895500183105, "global_step": 147360, "epoch": 3508} {"train_loss": -6.744822025299072, "global_step": 147361, "epoch": 3508} {"train_loss": -6.748181343078613, "global_step": 147362, "epoch": 3508} {"train_loss": -6.773220539093018, "global_step": 147363, "epoch": 3508} {"train_loss": -6.791122913360596, "global_step": 147364, "epoch": 3508} {"train_loss": -6.835135459899902, "global_step": 147365, "epoch": 3508} {"train_loss": -6.856656551361084, "global_step": 147366, "epoch": 3508} {"train_loss": -6.741602897644043, "global_step": 147367, "epoch": 3508} {"train_loss": -6.7615437507629395, "global_step": 147368, "epoch": 3508} {"train_loss": -6.876691818237305, "global_step": 147369, "epoch": 3508} {"train_loss": -6.786150932312012, "global_step": 147370, "epoch": 3508} {"train_loss": -6.882392406463623, "global_step": 147371, "epoch": 3508} {"train_loss": -6.893670558929443, "global_step": 147372, "epoch": 3508} {"train_loss": -6.888931751251221, "global_step": 147373, "epoch": 3508} {"train_loss": -6.7004008293151855, "global_step": 147374, "epoch": 3508} {"train_loss": -6.810235977172852, "global_step": 147375, "epoch": 3508} {"train_loss": -6.8195905685424805, "global_step": 147376, "epoch": 3508} {"train_loss": -6.818410964239211, "global_step": 147377, "epoch": 3508, "val_loss": 67914.171875} {"train_loss": -6.843057632446289, "global_step": 147378, "epoch": 3509} {"train_loss": -6.809625625610352, "global_step": 147379, "epoch": 3509} {"train_loss": -6.873128890991211, "global_step": 147380, "epoch": 3509} {"train_loss": -6.720301628112793, "global_step": 147381, "epoch": 3509} {"train_loss": -6.735816955566406, "global_step": 147382, "epoch": 3509} {"train_loss": -6.8199567794799805, "global_step": 147383, "epoch": 3509} {"train_loss": -6.75446081161499, "global_step": 147384, "epoch": 3509} {"train_loss": -6.793975830078125, "global_step": 147385, "epoch": 3509} {"train_loss": -6.889986038208008, "global_step": 147386, "epoch": 3509} {"train_loss": -6.698513984680176, "global_step": 147387, "epoch": 3509} {"train_loss": -6.910346031188965, "global_step": 147388, "epoch": 3509} {"train_loss": -6.784753322601318, "global_step": 147389, "epoch": 3509} {"train_loss": -6.791083812713623, "global_step": 147390, "epoch": 3509} {"train_loss": -6.908252716064453, "global_step": 147391, "epoch": 3509} {"train_loss": -6.798224925994873, "global_step": 147392, "epoch": 3509} {"train_loss": -6.790826797485352, "global_step": 147393, "epoch": 3509} {"train_loss": -6.789504051208496, "global_step": 147394, "epoch": 3509} {"train_loss": -6.79974365234375, "global_step": 147395, "epoch": 3509} {"train_loss": -6.750754356384277, "global_step": 147396, "epoch": 3509} {"train_loss": -6.9207329750061035, "global_step": 147397, "epoch": 3509} {"train_loss": -6.872593879699707, "global_step": 147398, "epoch": 3509} {"train_loss": -6.795855522155762, "global_step": 147399, "epoch": 3509} {"train_loss": -6.826330184936523, "global_step": 147400, "epoch": 3509} {"train_loss": -6.864377021789551, "global_step": 147401, "epoch": 3509} {"train_loss": -6.83894157409668, "global_step": 147402, "epoch": 3509} {"train_loss": -6.9951629638671875, "global_step": 147403, "epoch": 3509} {"train_loss": -6.775381088256836, "global_step": 147404, "epoch": 3509} {"train_loss": -6.821694850921631, "global_step": 147405, "epoch": 3509} {"train_loss": -6.722990989685059, "global_step": 147406, "epoch": 3509} {"train_loss": -6.865379333496094, "global_step": 147407, "epoch": 3509} {"train_loss": -6.874482154846191, "global_step": 147408, "epoch": 3509} {"train_loss": -6.76426887512207, "global_step": 147409, "epoch": 3509} {"train_loss": -6.919329643249512, "global_step": 147410, "epoch": 3509} {"train_loss": -6.804838180541992, "global_step": 147411, "epoch": 3509} {"train_loss": -6.756738662719727, "global_step": 147412, "epoch": 3509} {"train_loss": -6.814037322998047, "global_step": 147413, "epoch": 3509} {"train_loss": -6.793212890625, "global_step": 147414, "epoch": 3509} {"train_loss": -6.818185806274414, "global_step": 147415, "epoch": 3509} {"train_loss": -6.805349349975586, "global_step": 147416, "epoch": 3509} {"train_loss": -6.811008453369141, "global_step": 147417, "epoch": 3509} {"train_loss": -6.886669158935547, "global_step": 147418, "epoch": 3509} {"train_loss": -6.821725243613834, "global_step": 147419, "epoch": 3509, "val_loss": 68044.375} {"train_loss": -6.742952346801758, "global_step": 147420, "epoch": 3510} {"train_loss": -6.771612644195557, "global_step": 147421, "epoch": 3510} {"train_loss": -6.812819004058838, "global_step": 147422, "epoch": 3510} {"train_loss": -6.809350967407227, "global_step": 147423, "epoch": 3510} {"train_loss": -6.823087692260742, "global_step": 147424, "epoch": 3510} {"train_loss": -6.763627052307129, "global_step": 147425, "epoch": 3510} {"train_loss": -6.818294525146484, "global_step": 147426, "epoch": 3510} {"train_loss": -6.836025238037109, "global_step": 147427, "epoch": 3510} {"train_loss": -6.817685604095459, "global_step": 147428, "epoch": 3510} {"train_loss": -6.944971084594727, "global_step": 147429, "epoch": 3510} {"train_loss": -6.774209976196289, "global_step": 147430, "epoch": 3510} {"train_loss": -6.834113597869873, "global_step": 147431, "epoch": 3510} {"train_loss": -6.929279804229736, "global_step": 147432, "epoch": 3510} {"train_loss": -6.875831604003906, "global_step": 147433, "epoch": 3510} {"train_loss": -6.9053192138671875, "global_step": 147434, "epoch": 3510} {"train_loss": -6.827188968658447, "global_step": 147435, "epoch": 3510} {"train_loss": -6.806155681610107, "global_step": 147436, "epoch": 3510} {"train_loss": -6.838200569152832, "global_step": 147437, "epoch": 3510} {"train_loss": -6.897989749908447, "global_step": 147438, "epoch": 3510} {"train_loss": -6.863656997680664, "global_step": 147439, "epoch": 3510} {"train_loss": -6.74713134765625, "global_step": 147440, "epoch": 3510} {"train_loss": -6.880430221557617, "global_step": 147441, "epoch": 3510} {"train_loss": -6.8916239738464355, "global_step": 147442, "epoch": 3510} {"train_loss": -6.895319938659668, "global_step": 147443, "epoch": 3510} {"train_loss": -6.71565055847168, "global_step": 147444, "epoch": 3510} {"train_loss": -6.83912992477417, "global_step": 147445, "epoch": 3510} {"train_loss": -6.807794570922852, "global_step": 147446, "epoch": 3510} {"train_loss": -6.7833123207092285, "global_step": 147447, "epoch": 3510} {"train_loss": -6.932500839233398, "global_step": 147448, "epoch": 3510} {"train_loss": -6.868512153625488, "global_step": 147449, "epoch": 3510} {"train_loss": -6.9449262619018555, "global_step": 147450, "epoch": 3510} {"train_loss": -6.980020046234131, "global_step": 147451, "epoch": 3510} {"train_loss": -6.789327621459961, "global_step": 147452, "epoch": 3510} {"train_loss": -6.907879829406738, "global_step": 147453, "epoch": 3510} {"train_loss": -6.806800365447998, "global_step": 147454, "epoch": 3510} {"train_loss": -6.877199649810791, "global_step": 147455, "epoch": 3510} {"train_loss": -6.883399486541748, "global_step": 147456, "epoch": 3510} {"train_loss": -6.890439987182617, "global_step": 147457, "epoch": 3510} {"train_loss": -6.824491500854492, "global_step": 147458, "epoch": 3510} {"train_loss": -6.763476371765137, "global_step": 147459, "epoch": 3510} {"train_loss": -6.89046573638916, "global_step": 147460, "epoch": 3510} {"train_loss": -6.846691460836501, "global_step": 147461, "epoch": 3510, "val_loss": 67839.71875} {"train_loss": -6.959848403930664, "global_step": 147462, "epoch": 3511} {"train_loss": -6.942966938018799, "global_step": 147463, "epoch": 3511} {"train_loss": -6.99627685546875, "global_step": 147464, "epoch": 3511} {"train_loss": -6.826174736022949, "global_step": 147465, "epoch": 3511} {"train_loss": -6.850854873657227, "global_step": 147466, "epoch": 3511} {"train_loss": -6.801012992858887, "global_step": 147467, "epoch": 3511} {"train_loss": -6.8938822746276855, "global_step": 147468, "epoch": 3511} {"train_loss": -6.814664840698242, "global_step": 147469, "epoch": 3511} {"train_loss": -6.749975204467773, "global_step": 147470, "epoch": 3511} {"train_loss": -6.805771827697754, "global_step": 147471, "epoch": 3511} {"train_loss": -6.885138034820557, "global_step": 147472, "epoch": 3511} {"train_loss": -6.8470258712768555, "global_step": 147473, "epoch": 3511} {"train_loss": -6.836840629577637, "global_step": 147474, "epoch": 3511} {"train_loss": -6.720593452453613, "global_step": 147475, "epoch": 3511} {"train_loss": -6.746297836303711, "global_step": 147476, "epoch": 3511} {"train_loss": -6.738771438598633, "global_step": 147477, "epoch": 3511} {"train_loss": -6.808420181274414, "global_step": 147478, "epoch": 3511} {"train_loss": -6.8488264083862305, "global_step": 147479, "epoch": 3511} {"train_loss": -6.727362155914307, "global_step": 147480, "epoch": 3511} {"train_loss": -6.7215375900268555, "global_step": 147481, "epoch": 3511} {"train_loss": -6.710198402404785, "global_step": 147482, "epoch": 3511} {"train_loss": -6.826129913330078, "global_step": 147483, "epoch": 3511} {"train_loss": -6.782489776611328, "global_step": 147484, "epoch": 3511} {"train_loss": -6.763652801513672, "global_step": 147485, "epoch": 3511} {"train_loss": -6.750865936279297, "global_step": 147486, "epoch": 3511} {"train_loss": -6.812870025634766, "global_step": 147487, "epoch": 3511} {"train_loss": -6.735315322875977, "global_step": 147488, "epoch": 3511} {"train_loss": -6.899094104766846, "global_step": 147489, "epoch": 3511} {"train_loss": -6.6252617835998535, "global_step": 147490, "epoch": 3511} {"train_loss": -6.664023399353027, "global_step": 147491, "epoch": 3511} {"train_loss": -6.822561264038086, "global_step": 147492, "epoch": 3511} {"train_loss": -6.599159240722656, "global_step": 147493, "epoch": 3511} {"train_loss": -6.894608497619629, "global_step": 147494, "epoch": 3511} {"train_loss": -6.647192001342773, "global_step": 147495, "epoch": 3511} {"train_loss": -6.843035697937012, "global_step": 147496, "epoch": 3511} {"train_loss": -6.8201446533203125, "global_step": 147497, "epoch": 3511} {"train_loss": -6.723178386688232, "global_step": 147498, "epoch": 3511} {"train_loss": -6.795720100402832, "global_step": 147499, "epoch": 3511} {"train_loss": -6.780481338500977, "global_step": 147500, "epoch": 3511} {"train_loss": -6.851966857910156, "global_step": 147501, "epoch": 3511} {"train_loss": -6.624778747558594, "global_step": 147502, "epoch": 3511} {"train_loss": -6.790331919987996, "global_step": 147503, "epoch": 3511, "val_loss": 67713.5546875} {"train_loss": -6.648608207702637, "global_step": 147504, "epoch": 3512} {"train_loss": -6.840663433074951, "global_step": 147505, "epoch": 3512} {"train_loss": -6.71219539642334, "global_step": 147506, "epoch": 3512} {"train_loss": -6.827908992767334, "global_step": 147507, "epoch": 3512} {"train_loss": -6.654481887817383, "global_step": 147508, "epoch": 3512} {"train_loss": -6.728848934173584, "global_step": 147509, "epoch": 3512} {"train_loss": -6.637228012084961, "global_step": 147510, "epoch": 3512} {"train_loss": -6.792366027832031, "global_step": 147511, "epoch": 3512} {"train_loss": -6.755393981933594, "global_step": 147512, "epoch": 3512} {"train_loss": -6.732283592224121, "global_step": 147513, "epoch": 3512} {"train_loss": -6.733911514282227, "global_step": 147514, "epoch": 3512} {"train_loss": -6.802675247192383, "global_step": 147515, "epoch": 3512} {"train_loss": -6.857709884643555, "global_step": 147516, "epoch": 3512} {"train_loss": -6.631292343139648, "global_step": 147517, "epoch": 3512} {"train_loss": -6.7570085525512695, "global_step": 147518, "epoch": 3512} {"train_loss": -6.845554351806641, "global_step": 147519, "epoch": 3512} {"train_loss": -6.845822334289551, "global_step": 147520, "epoch": 3512} {"train_loss": -6.633105278015137, "global_step": 147521, "epoch": 3512} {"train_loss": -6.860650062561035, "global_step": 147522, "epoch": 3512} {"train_loss": -6.8393659591674805, "global_step": 147523, "epoch": 3512} {"train_loss": -6.749441623687744, "global_step": 147524, "epoch": 3512} {"train_loss": -6.843822479248047, "global_step": 147525, "epoch": 3512} {"train_loss": -6.670469284057617, "global_step": 147526, "epoch": 3512} {"train_loss": -6.941192626953125, "global_step": 147527, "epoch": 3512} {"train_loss": -6.8107147216796875, "global_step": 147528, "epoch": 3512} {"train_loss": -6.845490455627441, "global_step": 147529, "epoch": 3512} {"train_loss": -6.838870048522949, "global_step": 147530, "epoch": 3512} {"train_loss": -6.899703025817871, "global_step": 147531, "epoch": 3512} {"train_loss": -6.842826843261719, "global_step": 147532, "epoch": 3512} {"train_loss": -6.720236778259277, "global_step": 147533, "epoch": 3512} {"train_loss": -6.907376289367676, "global_step": 147534, "epoch": 3512} {"train_loss": -6.7731170654296875, "global_step": 147535, "epoch": 3512} {"train_loss": -6.928494930267334, "global_step": 147536, "epoch": 3512} {"train_loss": -6.88848876953125, "global_step": 147537, "epoch": 3512} {"train_loss": -6.823526382446289, "global_step": 147538, "epoch": 3512} {"train_loss": -6.891695499420166, "global_step": 147539, "epoch": 3512} {"train_loss": -6.8514862060546875, "global_step": 147540, "epoch": 3512} {"train_loss": -6.896326065063477, "global_step": 147541, "epoch": 3512} {"train_loss": -6.964199066162109, "global_step": 147542, "epoch": 3512} {"train_loss": -6.901288032531738, "global_step": 147543, "epoch": 3512} {"train_loss": -6.9754486083984375, "global_step": 147544, "epoch": 3512} {"train_loss": -6.8107826482682, "global_step": 147545, "epoch": 3512, "val_loss": 67673.4765625} {"train_loss": -6.944721221923828, "global_step": 147546, "epoch": 3513} {"train_loss": -6.899813175201416, "global_step": 147547, "epoch": 3513} {"train_loss": -6.779581069946289, "global_step": 147548, "epoch": 3513} {"train_loss": -6.84556245803833, "global_step": 147549, "epoch": 3513} {"train_loss": -6.8655195236206055, "global_step": 147550, "epoch": 3513} {"train_loss": -6.9612507820129395, "global_step": 147551, "epoch": 3513} {"train_loss": -6.94015645980835, "global_step": 147552, "epoch": 3513} {"train_loss": -6.813369274139404, "global_step": 147553, "epoch": 3513} {"train_loss": -6.86873197555542, "global_step": 147554, "epoch": 3513} {"train_loss": -6.890174388885498, "global_step": 147555, "epoch": 3513} {"train_loss": -6.8057475090026855, "global_step": 147556, "epoch": 3513} {"train_loss": -6.846931457519531, "global_step": 147557, "epoch": 3513} {"train_loss": -6.977065563201904, "global_step": 147558, "epoch": 3513} {"train_loss": -6.877511024475098, "global_step": 147559, "epoch": 3513} {"train_loss": -6.871129989624023, "global_step": 147560, "epoch": 3513} {"train_loss": -6.80003023147583, "global_step": 147561, "epoch": 3513} {"train_loss": -6.877614498138428, "global_step": 147562, "epoch": 3513} {"train_loss": -6.8720808029174805, "global_step": 147563, "epoch": 3513} {"train_loss": -6.8891754150390625, "global_step": 147564, "epoch": 3513} {"train_loss": -6.888601779937744, "global_step": 147565, "epoch": 3513} {"train_loss": -6.864091873168945, "global_step": 147566, "epoch": 3513} {"train_loss": -6.902720928192139, "global_step": 147567, "epoch": 3513} {"train_loss": -6.842046737670898, "global_step": 147568, "epoch": 3513} {"train_loss": -6.8492207527160645, "global_step": 147569, "epoch": 3513} {"train_loss": -6.831052780151367, "global_step": 147570, "epoch": 3513} {"train_loss": -6.919068336486816, "global_step": 147571, "epoch": 3513} {"train_loss": -6.863083839416504, "global_step": 147572, "epoch": 3513} {"train_loss": -6.909241676330566, "global_step": 147573, "epoch": 3513} {"train_loss": -6.798608303070068, "global_step": 147574, "epoch": 3513} {"train_loss": -6.805390357971191, "global_step": 147575, "epoch": 3513} {"train_loss": -6.883910179138184, "global_step": 147576, "epoch": 3513} {"train_loss": -6.81782341003418, "global_step": 147577, "epoch": 3513} {"train_loss": -6.798274517059326, "global_step": 147578, "epoch": 3513} {"train_loss": -6.810426235198975, "global_step": 147579, "epoch": 3513} {"train_loss": -6.871999740600586, "global_step": 147580, "epoch": 3513} {"train_loss": -6.722951889038086, "global_step": 147581, "epoch": 3513} {"train_loss": -6.931199073791504, "global_step": 147582, "epoch": 3513} {"train_loss": -6.804781913757324, "global_step": 147583, "epoch": 3513} {"train_loss": -6.785599231719971, "global_step": 147584, "epoch": 3513} {"train_loss": -6.838500022888184, "global_step": 147585, "epoch": 3513} {"train_loss": -6.770028591156006, "global_step": 147586, "epoch": 3513} {"train_loss": -6.85625095594497, "global_step": 147587, "epoch": 3513, "val_loss": 67775.2265625} {"train_loss": -6.751211166381836, "global_step": 147588, "epoch": 3514} {"train_loss": -6.888941764831543, "global_step": 147589, "epoch": 3514} {"train_loss": -6.874597072601318, "global_step": 147590, "epoch": 3514} {"train_loss": -6.826110363006592, "global_step": 147591, "epoch": 3514} {"train_loss": -6.8687920570373535, "global_step": 147592, "epoch": 3514} {"train_loss": -6.848328590393066, "global_step": 147593, "epoch": 3514} {"train_loss": -6.813505172729492, "global_step": 147594, "epoch": 3514} {"train_loss": -6.864893436431885, "global_step": 147595, "epoch": 3514} {"train_loss": -6.7603302001953125, "global_step": 147596, "epoch": 3514} {"train_loss": -6.793070316314697, "global_step": 147597, "epoch": 3514} {"train_loss": -6.884122848510742, "global_step": 147598, "epoch": 3514} {"train_loss": -6.717615127563477, "global_step": 147599, "epoch": 3514} {"train_loss": -6.8270368576049805, "global_step": 147600, "epoch": 3514} {"train_loss": -6.8879804611206055, "global_step": 147601, "epoch": 3514} {"train_loss": -6.702864646911621, "global_step": 147602, "epoch": 3514} {"train_loss": -6.8004913330078125, "global_step": 147603, "epoch": 3514} {"train_loss": -6.876477241516113, "global_step": 147604, "epoch": 3514} {"train_loss": -6.803065299987793, "global_step": 147605, "epoch": 3514} {"train_loss": -6.923081874847412, "global_step": 147606, "epoch": 3514} {"train_loss": -6.799551010131836, "global_step": 147607, "epoch": 3514} {"train_loss": -6.9621429443359375, "global_step": 147608, "epoch": 3514} {"train_loss": -6.828286170959473, "global_step": 147609, "epoch": 3514} {"train_loss": -6.794020652770996, "global_step": 147610, "epoch": 3514} {"train_loss": -6.9083123207092285, "global_step": 147611, "epoch": 3514} {"train_loss": -6.90962028503418, "global_step": 147612, "epoch": 3514} {"train_loss": -6.959517955780029, "global_step": 147613, "epoch": 3514} {"train_loss": -6.951067924499512, "global_step": 147614, "epoch": 3514} {"train_loss": -6.826498031616211, "global_step": 147615, "epoch": 3514} {"train_loss": -6.783617973327637, "global_step": 147616, "epoch": 3514} {"train_loss": -6.906499862670898, "global_step": 147617, "epoch": 3514} {"train_loss": -6.722407341003418, "global_step": 147618, "epoch": 3514} {"train_loss": -6.867050647735596, "global_step": 147619, "epoch": 3514} {"train_loss": -6.8501996994018555, "global_step": 147620, "epoch": 3514} {"train_loss": -6.726231575012207, "global_step": 147621, "epoch": 3514} {"train_loss": -6.850958824157715, "global_step": 147622, "epoch": 3514} {"train_loss": -6.680997848510742, "global_step": 147623, "epoch": 3514} {"train_loss": -6.785466194152832, "global_step": 147624, "epoch": 3514} {"train_loss": -6.951685905456543, "global_step": 147625, "epoch": 3514} {"train_loss": -6.5211687088012695, "global_step": 147626, "epoch": 3514} {"train_loss": -6.7367143630981445, "global_step": 147627, "epoch": 3514} {"train_loss": -6.666325569152832, "global_step": 147628, "epoch": 3514} {"train_loss": -6.819948253177461, "global_step": 147629, "epoch": 3514, "val_loss": 67917.921875} {"train_loss": -6.927362442016602, "global_step": 147630, "epoch": 3515} {"train_loss": -6.732932090759277, "global_step": 147631, "epoch": 3515} {"train_loss": -6.775202751159668, "global_step": 147632, "epoch": 3515} {"train_loss": -6.826916694641113, "global_step": 147633, "epoch": 3515} {"train_loss": -6.848112106323242, "global_step": 147634, "epoch": 3515} {"train_loss": -6.695520401000977, "global_step": 147635, "epoch": 3515} {"train_loss": -6.879631042480469, "global_step": 147636, "epoch": 3515} {"train_loss": -6.840328216552734, "global_step": 147637, "epoch": 3515} {"train_loss": -6.837228775024414, "global_step": 147638, "epoch": 3515} {"train_loss": -6.888247489929199, "global_step": 147639, "epoch": 3515} {"train_loss": -6.763422966003418, "global_step": 147640, "epoch": 3515} {"train_loss": -6.929315567016602, "global_step": 147641, "epoch": 3515} {"train_loss": -6.793865203857422, "global_step": 147642, "epoch": 3515} {"train_loss": -6.713565826416016, "global_step": 147643, "epoch": 3515} {"train_loss": -6.850494861602783, "global_step": 147644, "epoch": 3515} {"train_loss": -6.772792816162109, "global_step": 147645, "epoch": 3515} {"train_loss": -6.738748550415039, "global_step": 147646, "epoch": 3515} {"train_loss": -6.7906107902526855, "global_step": 147647, "epoch": 3515} {"train_loss": -6.768942832946777, "global_step": 147648, "epoch": 3515} {"train_loss": -6.778193950653076, "global_step": 147649, "epoch": 3515} {"train_loss": -6.795424461364746, "global_step": 147650, "epoch": 3515} {"train_loss": -6.811490058898926, "global_step": 147651, "epoch": 3515} {"train_loss": -6.754406929016113, "global_step": 147652, "epoch": 3515} {"train_loss": -6.908806324005127, "global_step": 147653, "epoch": 3515} {"train_loss": -6.745993137359619, "global_step": 147654, "epoch": 3515} {"train_loss": -6.800475120544434, "global_step": 147655, "epoch": 3515} {"train_loss": -6.899868965148926, "global_step": 147656, "epoch": 3515} {"train_loss": -6.96790075302124, "global_step": 147657, "epoch": 3515} {"train_loss": -6.7580742835998535, "global_step": 147658, "epoch": 3515} {"train_loss": -6.944890975952148, "global_step": 147659, "epoch": 3515} {"train_loss": -6.905204772949219, "global_step": 147660, "epoch": 3515} {"train_loss": -6.884047508239746, "global_step": 147661, "epoch": 3515} {"train_loss": -6.807024002075195, "global_step": 147662, "epoch": 3515} {"train_loss": -6.876255035400391, "global_step": 147663, "epoch": 3515} {"train_loss": -6.7625932693481445, "global_step": 147664, "epoch": 3515} {"train_loss": -6.904980659484863, "global_step": 147665, "epoch": 3515} {"train_loss": -6.845094203948975, "global_step": 147666, "epoch": 3515} {"train_loss": -6.780735015869141, "global_step": 147667, "epoch": 3515} {"train_loss": -6.884808540344238, "global_step": 147668, "epoch": 3515} {"train_loss": -6.8398590087890625, "global_step": 147669, "epoch": 3515} {"train_loss": -6.898262977600098, "global_step": 147670, "epoch": 3515} {"train_loss": -6.826688618887038, "global_step": 147671, "epoch": 3515, "val_loss": 67768.546875} {"train_loss": -6.879484176635742, "global_step": 147672, "epoch": 3516} {"train_loss": -6.837994575500488, "global_step": 147673, "epoch": 3516} {"train_loss": -6.720446586608887, "global_step": 147674, "epoch": 3516} {"train_loss": -6.899410724639893, "global_step": 147675, "epoch": 3516} {"train_loss": -6.800207138061523, "global_step": 147676, "epoch": 3516} {"train_loss": -6.79519510269165, "global_step": 147677, "epoch": 3516} {"train_loss": -6.9164276123046875, "global_step": 147678, "epoch": 3516} {"train_loss": -6.682337760925293, "global_step": 147679, "epoch": 3516} {"train_loss": -6.769986152648926, "global_step": 147680, "epoch": 3516} {"train_loss": -6.765281677246094, "global_step": 147681, "epoch": 3516} {"train_loss": -6.799921989440918, "global_step": 147682, "epoch": 3516} {"train_loss": -6.802835464477539, "global_step": 147683, "epoch": 3516} {"train_loss": -6.822930335998535, "global_step": 147684, "epoch": 3516} {"train_loss": -6.864989280700684, "global_step": 147685, "epoch": 3516} {"train_loss": -6.74771785736084, "global_step": 147686, "epoch": 3516} {"train_loss": -6.781740665435791, "global_step": 147687, "epoch": 3516} {"train_loss": -6.8672614097595215, "global_step": 147688, "epoch": 3516} {"train_loss": -6.819928169250488, "global_step": 147689, "epoch": 3516} {"train_loss": -6.818493366241455, "global_step": 147690, "epoch": 3516} {"train_loss": -6.828790664672852, "global_step": 147691, "epoch": 3516} {"train_loss": -6.985178470611572, "global_step": 147692, "epoch": 3516} {"train_loss": -6.846251010894775, "global_step": 147693, "epoch": 3516} {"train_loss": -6.904128551483154, "global_step": 147694, "epoch": 3516} {"train_loss": -6.79833984375, "global_step": 147695, "epoch": 3516} {"train_loss": -6.749034881591797, "global_step": 147696, "epoch": 3516} {"train_loss": -6.699206829071045, "global_step": 147697, "epoch": 3516} {"train_loss": -6.789613246917725, "global_step": 147698, "epoch": 3516} {"train_loss": -6.819086074829102, "global_step": 147699, "epoch": 3516} {"train_loss": -6.807416915893555, "global_step": 147700, "epoch": 3516} {"train_loss": -6.816834926605225, "global_step": 147701, "epoch": 3516} {"train_loss": -6.771661758422852, "global_step": 147702, "epoch": 3516} {"train_loss": -6.767983436584473, "global_step": 147703, "epoch": 3516} {"train_loss": -6.840774059295654, "global_step": 147704, "epoch": 3516} {"train_loss": -6.847437858581543, "global_step": 147705, "epoch": 3516} {"train_loss": -6.817868232727051, "global_step": 147706, "epoch": 3516} {"train_loss": -6.918482780456543, "global_step": 147707, "epoch": 3516} {"train_loss": -6.798853874206543, "global_step": 147708, "epoch": 3516} {"train_loss": -6.7781596183776855, "global_step": 147709, "epoch": 3516} {"train_loss": -6.858207702636719, "global_step": 147710, "epoch": 3516} {"train_loss": -6.914516448974609, "global_step": 147711, "epoch": 3516} {"train_loss": -6.842652320861816, "global_step": 147712, "epoch": 3516} {"train_loss": -6.821051722481137, "global_step": 147713, "epoch": 3516, "val_loss": 67969.1796875} {"train_loss": -6.959561347961426, "global_step": 147714, "epoch": 3517} {"train_loss": -6.794207572937012, "global_step": 147715, "epoch": 3517} {"train_loss": -6.794040679931641, "global_step": 147716, "epoch": 3517} {"train_loss": -6.855966567993164, "global_step": 147717, "epoch": 3517} {"train_loss": -6.8183183670043945, "global_step": 147718, "epoch": 3517} {"train_loss": -6.780522346496582, "global_step": 147719, "epoch": 3517} {"train_loss": -6.722198009490967, "global_step": 147720, "epoch": 3517} {"train_loss": -6.952796459197998, "global_step": 147721, "epoch": 3517} {"train_loss": -6.948537826538086, "global_step": 147722, "epoch": 3517} {"train_loss": -6.830145359039307, "global_step": 147723, "epoch": 3517} {"train_loss": -6.924856662750244, "global_step": 147724, "epoch": 3517} {"train_loss": -6.719643592834473, "global_step": 147725, "epoch": 3517} {"train_loss": -7.0068583488464355, "global_step": 147726, "epoch": 3517} {"train_loss": -6.970332145690918, "global_step": 147727, "epoch": 3517} {"train_loss": -6.791593551635742, "global_step": 147728, "epoch": 3517} {"train_loss": -6.759714126586914, "global_step": 147729, "epoch": 3517} {"train_loss": -6.921682357788086, "global_step": 147730, "epoch": 3517} {"train_loss": -6.877598762512207, "global_step": 147731, "epoch": 3517} {"train_loss": -6.693107604980469, "global_step": 147732, "epoch": 3517} {"train_loss": -6.806100845336914, "global_step": 147733, "epoch": 3517} {"train_loss": -6.785999298095703, "global_step": 147734, "epoch": 3517} {"train_loss": -6.740142822265625, "global_step": 147735, "epoch": 3517} {"train_loss": -6.856629371643066, "global_step": 147736, "epoch": 3517} {"train_loss": -6.746268272399902, "global_step": 147737, "epoch": 3517} {"train_loss": -6.803007125854492, "global_step": 147738, "epoch": 3517} {"train_loss": -6.795154571533203, "global_step": 147739, "epoch": 3517} {"train_loss": -6.7945966720581055, "global_step": 147740, "epoch": 3517} {"train_loss": -6.77943229675293, "global_step": 147741, "epoch": 3517} {"train_loss": -6.8573503494262695, "global_step": 147742, "epoch": 3517} {"train_loss": -6.779759407043457, "global_step": 147743, "epoch": 3517} {"train_loss": -6.720466613769531, "global_step": 147744, "epoch": 3517} {"train_loss": -6.813140869140625, "global_step": 147745, "epoch": 3517} {"train_loss": -6.806630611419678, "global_step": 147746, "epoch": 3517} {"train_loss": -6.8415207862854, "global_step": 147747, "epoch": 3517} {"train_loss": -6.883376121520996, "global_step": 147748, "epoch": 3517} {"train_loss": -6.678820610046387, "global_step": 147749, "epoch": 3517} {"train_loss": -6.761064052581787, "global_step": 147750, "epoch": 3517} {"train_loss": -6.873953819274902, "global_step": 147751, "epoch": 3517} {"train_loss": -6.781411170959473, "global_step": 147752, "epoch": 3517} {"train_loss": -6.808805465698242, "global_step": 147753, "epoch": 3517} {"train_loss": -6.806934356689453, "global_step": 147754, "epoch": 3517} {"train_loss": -6.819596597126552, "global_step": 147755, "epoch": 3517, "val_loss": 67710.4296875} {"train_loss": -6.85038423538208, "global_step": 147756, "epoch": 3518} {"train_loss": -6.951388835906982, "global_step": 147757, "epoch": 3518} {"train_loss": -6.753090858459473, "global_step": 147758, "epoch": 3518} {"train_loss": -6.681086540222168, "global_step": 147759, "epoch": 3518} {"train_loss": -6.801772117614746, "global_step": 147760, "epoch": 3518} {"train_loss": -6.863260269165039, "global_step": 147761, "epoch": 3518} {"train_loss": -6.825908184051514, "global_step": 147762, "epoch": 3518} {"train_loss": -6.843475341796875, "global_step": 147763, "epoch": 3518} {"train_loss": -6.81024694442749, "global_step": 147764, "epoch": 3518} {"train_loss": -6.913913726806641, "global_step": 147765, "epoch": 3518} {"train_loss": -6.946819305419922, "global_step": 147766, "epoch": 3518} {"train_loss": -6.814929008483887, "global_step": 147767, "epoch": 3518} {"train_loss": -6.860548973083496, "global_step": 147768, "epoch": 3518} {"train_loss": -6.808755874633789, "global_step": 147769, "epoch": 3518} {"train_loss": -6.886244297027588, "global_step": 147770, "epoch": 3518} {"train_loss": -6.900647163391113, "global_step": 147771, "epoch": 3518} {"train_loss": -6.967573165893555, "global_step": 147772, "epoch": 3518} {"train_loss": -6.815712928771973, "global_step": 147773, "epoch": 3518} {"train_loss": -6.869274139404297, "global_step": 147774, "epoch": 3518} {"train_loss": -6.931428909301758, "global_step": 147775, "epoch": 3518} {"train_loss": -6.815282821655273, "global_step": 147776, "epoch": 3518} {"train_loss": -6.94126033782959, "global_step": 147777, "epoch": 3518} {"train_loss": -6.926942825317383, "global_step": 147778, "epoch": 3518} {"train_loss": -6.9630584716796875, "global_step": 147779, "epoch": 3518} {"train_loss": -6.911427021026611, "global_step": 147780, "epoch": 3518} {"train_loss": -6.909343719482422, "global_step": 147781, "epoch": 3518} {"train_loss": -6.932297229766846, "global_step": 147782, "epoch": 3518} {"train_loss": -6.9376726150512695, "global_step": 147783, "epoch": 3518} {"train_loss": -6.956308364868164, "global_step": 147784, "epoch": 3518} {"train_loss": -6.921342849731445, "global_step": 147785, "epoch": 3518} {"train_loss": -6.842686653137207, "global_step": 147786, "epoch": 3518} {"train_loss": -6.93220329284668, "global_step": 147787, "epoch": 3518} {"train_loss": -6.903267860412598, "global_step": 147788, "epoch": 3518} {"train_loss": -6.928509712219238, "global_step": 147789, "epoch": 3518} {"train_loss": -6.986556053161621, "global_step": 147790, "epoch": 3518} {"train_loss": -6.880122184753418, "global_step": 147791, "epoch": 3518} {"train_loss": -6.951380729675293, "global_step": 147792, "epoch": 3518} {"train_loss": -6.9498209953308105, "global_step": 147793, "epoch": 3518} {"train_loss": -6.855566024780273, "global_step": 147794, "epoch": 3518} {"train_loss": -6.867245674133301, "global_step": 147795, "epoch": 3518} {"train_loss": -6.932819843292236, "global_step": 147796, "epoch": 3518} {"train_loss": -6.886336792083013, "global_step": 147797, "epoch": 3518, "val_loss": 67792.140625} {"train_loss": -6.961169719696045, "global_step": 147798, "epoch": 3519} {"train_loss": -6.88901424407959, "global_step": 147799, "epoch": 3519} {"train_loss": -6.901364326477051, "global_step": 147800, "epoch": 3519} {"train_loss": -6.981410026550293, "global_step": 147801, "epoch": 3519} {"train_loss": -6.850264072418213, "global_step": 147802, "epoch": 3519} {"train_loss": -6.90369987487793, "global_step": 147803, "epoch": 3519} {"train_loss": -6.918124198913574, "global_step": 147804, "epoch": 3519} {"train_loss": -6.767833232879639, "global_step": 147805, "epoch": 3519} {"train_loss": -6.880712509155273, "global_step": 147806, "epoch": 3519} {"train_loss": -6.9024434089660645, "global_step": 147807, "epoch": 3519} {"train_loss": -6.89320707321167, "global_step": 147808, "epoch": 3519} {"train_loss": -6.822059631347656, "global_step": 147809, "epoch": 3519} {"train_loss": -6.862326145172119, "global_step": 147810, "epoch": 3519} {"train_loss": -6.814685821533203, "global_step": 147811, "epoch": 3519} {"train_loss": -6.880061149597168, "global_step": 147812, "epoch": 3519} {"train_loss": -6.8339009284973145, "global_step": 147813, "epoch": 3519} {"train_loss": -6.847199440002441, "global_step": 147814, "epoch": 3519} {"train_loss": -6.9131059646606445, "global_step": 147815, "epoch": 3519} {"train_loss": -6.931199073791504, "global_step": 147816, "epoch": 3519} {"train_loss": -6.900909423828125, "global_step": 147817, "epoch": 3519} {"train_loss": -6.904697418212891, "global_step": 147818, "epoch": 3519} {"train_loss": -6.782980918884277, "global_step": 147819, "epoch": 3519} {"train_loss": -6.784242153167725, "global_step": 147820, "epoch": 3519} {"train_loss": -6.844846725463867, "global_step": 147821, "epoch": 3519} {"train_loss": -6.921979904174805, "global_step": 147822, "epoch": 3519} {"train_loss": -6.7833170890808105, "global_step": 147823, "epoch": 3519} {"train_loss": -6.786780834197998, "global_step": 147824, "epoch": 3519} {"train_loss": -6.870504379272461, "global_step": 147825, "epoch": 3519} {"train_loss": -6.868953704833984, "global_step": 147826, "epoch": 3519} {"train_loss": -6.878424644470215, "global_step": 147827, "epoch": 3519} {"train_loss": -6.833674907684326, "global_step": 147828, "epoch": 3519} {"train_loss": -6.980989456176758, "global_step": 147829, "epoch": 3519} {"train_loss": -6.907991886138916, "global_step": 147830, "epoch": 3519} {"train_loss": -6.8051910400390625, "global_step": 147831, "epoch": 3519} {"train_loss": -6.87812614440918, "global_step": 147832, "epoch": 3519} {"train_loss": -6.757987022399902, "global_step": 147833, "epoch": 3519} {"train_loss": -6.773097038269043, "global_step": 147834, "epoch": 3519} {"train_loss": -6.876413345336914, "global_step": 147835, "epoch": 3519} {"train_loss": -6.847923755645752, "global_step": 147836, "epoch": 3519} {"train_loss": -6.792454719543457, "global_step": 147837, "epoch": 3519} {"train_loss": -6.788630485534668, "global_step": 147838, "epoch": 3519} {"train_loss": -6.857566765376499, "global_step": 147839, "epoch": 3519, "val_loss": 67985.125} {"train_loss": -6.740719795227051, "global_step": 147840, "epoch": 3520} {"train_loss": -6.757852077484131, "global_step": 147841, "epoch": 3520} {"train_loss": -6.740327835083008, "global_step": 147842, "epoch": 3520} {"train_loss": -6.743386745452881, "global_step": 147843, "epoch": 3520} {"train_loss": -6.823378562927246, "global_step": 147844, "epoch": 3520} {"train_loss": -6.910457134246826, "global_step": 147845, "epoch": 3520} {"train_loss": -6.721551895141602, "global_step": 147846, "epoch": 3520} {"train_loss": -6.823851108551025, "global_step": 147847, "epoch": 3520} {"train_loss": -6.795838832855225, "global_step": 147848, "epoch": 3520} {"train_loss": -6.825920581817627, "global_step": 147849, "epoch": 3520} {"train_loss": -6.807299613952637, "global_step": 147850, "epoch": 3520} {"train_loss": -6.873195648193359, "global_step": 147851, "epoch": 3520} {"train_loss": -6.691957473754883, "global_step": 147852, "epoch": 3520} {"train_loss": -6.86625862121582, "global_step": 147853, "epoch": 3520} {"train_loss": -6.820045471191406, "global_step": 147854, "epoch": 3520} {"train_loss": -6.744902610778809, "global_step": 147855, "epoch": 3520} {"train_loss": -6.722357749938965, "global_step": 147856, "epoch": 3520} {"train_loss": -6.783546447753906, "global_step": 147857, "epoch": 3520} {"train_loss": -6.856893539428711, "global_step": 147858, "epoch": 3520} {"train_loss": -6.776331901550293, "global_step": 147859, "epoch": 3520} {"train_loss": -6.836813449859619, "global_step": 147860, "epoch": 3520} {"train_loss": -6.760772705078125, "global_step": 147861, "epoch": 3520} {"train_loss": -6.8152337074279785, "global_step": 147862, "epoch": 3520} {"train_loss": -6.808005332946777, "global_step": 147863, "epoch": 3520} {"train_loss": -6.810480117797852, "global_step": 147864, "epoch": 3520} {"train_loss": -6.738889694213867, "global_step": 147865, "epoch": 3520} {"train_loss": -6.787186622619629, "global_step": 147866, "epoch": 3520} {"train_loss": -6.777193546295166, "global_step": 147867, "epoch": 3520} {"train_loss": -6.89816427230835, "global_step": 147868, "epoch": 3520} {"train_loss": -6.737692832946777, "global_step": 147869, "epoch": 3520} {"train_loss": -6.819460868835449, "global_step": 147870, "epoch": 3520} {"train_loss": -6.927764892578125, "global_step": 147871, "epoch": 3520} {"train_loss": -6.858311653137207, "global_step": 147872, "epoch": 3520} {"train_loss": -6.791824817657471, "global_step": 147873, "epoch": 3520} {"train_loss": -6.789257049560547, "global_step": 147874, "epoch": 3520} {"train_loss": -6.801738262176514, "global_step": 147875, "epoch": 3520} {"train_loss": -6.862655162811279, "global_step": 147876, "epoch": 3520} {"train_loss": -6.800612449645996, "global_step": 147877, "epoch": 3520} {"train_loss": -6.819635391235352, "global_step": 147878, "epoch": 3520} {"train_loss": -6.78540563583374, "global_step": 147879, "epoch": 3520} {"train_loss": -6.821101665496826, "global_step": 147880, "epoch": 3520} {"train_loss": -6.80282347542899, "global_step": 147881, "epoch": 3520, "val_loss": 67823.25} {"train_loss": -6.807585716247559, "global_step": 147882, "epoch": 3521} {"train_loss": -6.86753511428833, "global_step": 147883, "epoch": 3521} {"train_loss": -6.879411697387695, "global_step": 147884, "epoch": 3521} {"train_loss": -6.816774368286133, "global_step": 147885, "epoch": 3521} {"train_loss": -6.716855049133301, "global_step": 147886, "epoch": 3521} {"train_loss": -6.952142715454102, "global_step": 147887, "epoch": 3521} {"train_loss": -6.868907928466797, "global_step": 147888, "epoch": 3521} {"train_loss": -6.798981666564941, "global_step": 147889, "epoch": 3521} {"train_loss": -6.829617500305176, "global_step": 147890, "epoch": 3521} {"train_loss": -6.8835954666137695, "global_step": 147891, "epoch": 3521} {"train_loss": -6.914997100830078, "global_step": 147892, "epoch": 3521} {"train_loss": -6.850154399871826, "global_step": 147893, "epoch": 3521} {"train_loss": -6.768654823303223, "global_step": 147894, "epoch": 3521} {"train_loss": -6.750273704528809, "global_step": 147895, "epoch": 3521} {"train_loss": -6.797060966491699, "global_step": 147896, "epoch": 3521} {"train_loss": -6.807126522064209, "global_step": 147897, "epoch": 3521} {"train_loss": -6.885644912719727, "global_step": 147898, "epoch": 3521} {"train_loss": -6.741393089294434, "global_step": 147899, "epoch": 3521} {"train_loss": -6.743674278259277, "global_step": 147900, "epoch": 3521} {"train_loss": -6.7688212394714355, "global_step": 147901, "epoch": 3521} {"train_loss": -6.755838871002197, "global_step": 147902, "epoch": 3521} {"train_loss": -6.9005351066589355, "global_step": 147903, "epoch": 3521} {"train_loss": -6.825135231018066, "global_step": 147904, "epoch": 3521} {"train_loss": -6.807895183563232, "global_step": 147905, "epoch": 3521} {"train_loss": -6.840229034423828, "global_step": 147906, "epoch": 3521} {"train_loss": -6.801464080810547, "global_step": 147907, "epoch": 3521} {"train_loss": -6.898537635803223, "global_step": 147908, "epoch": 3521} {"train_loss": -6.863539695739746, "global_step": 147909, "epoch": 3521} {"train_loss": -6.843530654907227, "global_step": 147910, "epoch": 3521} {"train_loss": -6.79393196105957, "global_step": 147911, "epoch": 3521} {"train_loss": -6.835694313049316, "global_step": 147912, "epoch": 3521} {"train_loss": -6.810847282409668, "global_step": 147913, "epoch": 3521} {"train_loss": -6.722148895263672, "global_step": 147914, "epoch": 3521} {"train_loss": -6.811317443847656, "global_step": 147915, "epoch": 3521} {"train_loss": -6.926401138305664, "global_step": 147916, "epoch": 3521} {"train_loss": -6.8840837478637695, "global_step": 147917, "epoch": 3521} {"train_loss": -6.855961799621582, "global_step": 147918, "epoch": 3521} {"train_loss": -6.879853248596191, "global_step": 147919, "epoch": 3521} {"train_loss": -6.838615417480469, "global_step": 147920, "epoch": 3521} {"train_loss": -6.897157192230225, "global_step": 147921, "epoch": 3521} {"train_loss": -6.940988540649414, "global_step": 147922, "epoch": 3521} {"train_loss": -6.833825906117757, "global_step": 147923, "epoch": 3521, "val_loss": 67961.640625} {"train_loss": -6.7700324058532715, "global_step": 147924, "epoch": 3522} {"train_loss": -6.801774501800537, "global_step": 147925, "epoch": 3522} {"train_loss": -6.882216930389404, "global_step": 147926, "epoch": 3522} {"train_loss": -6.865428924560547, "global_step": 147927, "epoch": 3522} {"train_loss": -6.800365447998047, "global_step": 147928, "epoch": 3522} {"train_loss": -6.894230842590332, "global_step": 147929, "epoch": 3522} {"train_loss": -6.861940860748291, "global_step": 147930, "epoch": 3522} {"train_loss": -6.9114990234375, "global_step": 147931, "epoch": 3522} {"train_loss": -6.834774017333984, "global_step": 147932, "epoch": 3522} {"train_loss": -6.810513496398926, "global_step": 147933, "epoch": 3522} {"train_loss": -6.702927589416504, "global_step": 147934, "epoch": 3522} {"train_loss": -6.760737895965576, "global_step": 147935, "epoch": 3522} {"train_loss": -6.918804168701172, "global_step": 147936, "epoch": 3522} {"train_loss": -6.8046793937683105, "global_step": 147937, "epoch": 3522} {"train_loss": -6.927015781402588, "global_step": 147938, "epoch": 3522} {"train_loss": -6.9178080558776855, "global_step": 147939, "epoch": 3522} {"train_loss": -6.715970039367676, "global_step": 147940, "epoch": 3522} {"train_loss": -6.82955265045166, "global_step": 147941, "epoch": 3522} {"train_loss": -6.867729187011719, "global_step": 147942, "epoch": 3522} {"train_loss": -6.811690330505371, "global_step": 147943, "epoch": 3522} {"train_loss": -6.795738697052002, "global_step": 147944, "epoch": 3522} {"train_loss": -6.871737957000732, "global_step": 147945, "epoch": 3522} {"train_loss": -6.804134368896484, "global_step": 147946, "epoch": 3522} {"train_loss": -6.66722297668457, "global_step": 147947, "epoch": 3522} {"train_loss": -6.808166980743408, "global_step": 147948, "epoch": 3522} {"train_loss": -6.852982521057129, "global_step": 147949, "epoch": 3522} {"train_loss": -6.725481986999512, "global_step": 147950, "epoch": 3522} {"train_loss": -6.769934177398682, "global_step": 147951, "epoch": 3522} {"train_loss": -6.709176063537598, "global_step": 147952, "epoch": 3522} {"train_loss": -6.700004577636719, "global_step": 147953, "epoch": 3522} {"train_loss": -6.8068718910217285, "global_step": 147954, "epoch": 3522} {"train_loss": -6.802195072174072, "global_step": 147955, "epoch": 3522} {"train_loss": -6.802027225494385, "global_step": 147956, "epoch": 3522} {"train_loss": -6.765079498291016, "global_step": 147957, "epoch": 3522} {"train_loss": -6.81857442855835, "global_step": 147958, "epoch": 3522} {"train_loss": -6.853394985198975, "global_step": 147959, "epoch": 3522} {"train_loss": -6.811306476593018, "global_step": 147960, "epoch": 3522} {"train_loss": -6.848155975341797, "global_step": 147961, "epoch": 3522} {"train_loss": -6.803672790527344, "global_step": 147962, "epoch": 3522} {"train_loss": -6.825685501098633, "global_step": 147963, "epoch": 3522} {"train_loss": -6.827802658081055, "global_step": 147964, "epoch": 3522} {"train_loss": -6.8137853145599365, "global_step": 147965, "epoch": 3522, "val_loss": 67907.3984375} {"train_loss": -6.884037017822266, "global_step": 147966, "epoch": 3523} {"train_loss": -6.917785167694092, "global_step": 147967, "epoch": 3523} {"train_loss": -6.811005115509033, "global_step": 147968, "epoch": 3523} {"train_loss": -6.911397457122803, "global_step": 147969, "epoch": 3523} {"train_loss": -6.89143180847168, "global_step": 147970, "epoch": 3523} {"train_loss": -6.86484956741333, "global_step": 147971, "epoch": 3523} {"train_loss": -6.816659927368164, "global_step": 147972, "epoch": 3523} {"train_loss": -6.850162506103516, "global_step": 147973, "epoch": 3523} {"train_loss": -6.80784797668457, "global_step": 147974, "epoch": 3523} {"train_loss": -6.892607688903809, "global_step": 147975, "epoch": 3523} {"train_loss": -6.874378204345703, "global_step": 147976, "epoch": 3523} {"train_loss": -6.88170862197876, "global_step": 147977, "epoch": 3523} {"train_loss": -7.033653736114502, "global_step": 147978, "epoch": 3523} {"train_loss": -6.880204200744629, "global_step": 147979, "epoch": 3523} {"train_loss": -6.8858795166015625, "global_step": 147980, "epoch": 3523} {"train_loss": -6.866135120391846, "global_step": 147981, "epoch": 3523} {"train_loss": -6.914408206939697, "global_step": 147982, "epoch": 3523} {"train_loss": -6.855693817138672, "global_step": 147983, "epoch": 3523} {"train_loss": -6.9480462074279785, "global_step": 147984, "epoch": 3523} {"train_loss": -6.961307525634766, "global_step": 147985, "epoch": 3523} {"train_loss": -6.858423233032227, "global_step": 147986, "epoch": 3523} {"train_loss": -6.852643966674805, "global_step": 147987, "epoch": 3523} {"train_loss": -6.820154666900635, "global_step": 147988, "epoch": 3523} {"train_loss": -6.915569305419922, "global_step": 147989, "epoch": 3523} {"train_loss": -6.6286940574646, "global_step": 147990, "epoch": 3523} {"train_loss": -6.8000359535217285, "global_step": 147991, "epoch": 3523} {"train_loss": -6.804080009460449, "global_step": 147992, "epoch": 3523} {"train_loss": -6.653660774230957, "global_step": 147993, "epoch": 3523} {"train_loss": -6.838006973266602, "global_step": 147994, "epoch": 3523} {"train_loss": -6.863068580627441, "global_step": 147995, "epoch": 3523} {"train_loss": -6.973773002624512, "global_step": 147996, "epoch": 3523} {"train_loss": -6.802241325378418, "global_step": 147997, "epoch": 3523} {"train_loss": -6.759631633758545, "global_step": 147998, "epoch": 3523} {"train_loss": -6.955234050750732, "global_step": 147999, "epoch": 3523} {"train_loss": -6.7774457931518555, "global_step": 148000, "epoch": 3523} {"train_loss": -6.755443572998047, "global_step": 148001, "epoch": 3523} {"train_loss": -6.813298225402832, "global_step": 148002, "epoch": 3523} {"train_loss": -6.83555269241333, "global_step": 148003, "epoch": 3523} {"train_loss": -6.817474842071533, "global_step": 148004, "epoch": 3523} {"train_loss": -6.8231425285339355, "global_step": 148005, "epoch": 3523} {"train_loss": -6.830372333526611, "global_step": 148006, "epoch": 3523} {"train_loss": -6.845277479716709, "global_step": 148007, "epoch": 3523, "val_loss": 67863.3203125} {"train_loss": -6.863245964050293, "global_step": 148008, "epoch": 3524} {"train_loss": -6.718227386474609, "global_step": 148009, "epoch": 3524} {"train_loss": -6.829776763916016, "global_step": 148010, "epoch": 3524} {"train_loss": -6.828071594238281, "global_step": 148011, "epoch": 3524} {"train_loss": -6.762996673583984, "global_step": 148012, "epoch": 3524} {"train_loss": -6.750567436218262, "global_step": 148013, "epoch": 3524} {"train_loss": -6.797974586486816, "global_step": 148014, "epoch": 3524} {"train_loss": -6.8506293296813965, "global_step": 148015, "epoch": 3524} {"train_loss": -6.8888983726501465, "global_step": 148016, "epoch": 3524} {"train_loss": -6.762637138366699, "global_step": 148017, "epoch": 3524} {"train_loss": -6.787531852722168, "global_step": 148018, "epoch": 3524} {"train_loss": -6.818473815917969, "global_step": 148019, "epoch": 3524} {"train_loss": -6.8133111000061035, "global_step": 148020, "epoch": 3524} {"train_loss": -6.805751800537109, "global_step": 148021, "epoch": 3524} {"train_loss": -6.890272617340088, "global_step": 148022, "epoch": 3524} {"train_loss": -6.904057502746582, "global_step": 148023, "epoch": 3524} {"train_loss": -6.795284748077393, "global_step": 148024, "epoch": 3524} {"train_loss": -6.8689866065979, "global_step": 148025, "epoch": 3524} {"train_loss": -6.839268207550049, "global_step": 148026, "epoch": 3524} {"train_loss": -6.810556888580322, "global_step": 148027, "epoch": 3524} {"train_loss": -6.936275005340576, "global_step": 148028, "epoch": 3524} {"train_loss": -6.941567420959473, "global_step": 148029, "epoch": 3524} {"train_loss": -6.663005352020264, "global_step": 148030, "epoch": 3524} {"train_loss": -6.870817184448242, "global_step": 148031, "epoch": 3524} {"train_loss": -6.870784759521484, "global_step": 148032, "epoch": 3524} {"train_loss": -6.799111843109131, "global_step": 148033, "epoch": 3524} {"train_loss": -6.857298851013184, "global_step": 148034, "epoch": 3524} {"train_loss": -6.851931571960449, "global_step": 148035, "epoch": 3524} {"train_loss": -6.7878737449646, "global_step": 148036, "epoch": 3524} {"train_loss": -6.833950996398926, "global_step": 148037, "epoch": 3524} {"train_loss": -6.790760040283203, "global_step": 148038, "epoch": 3524} {"train_loss": -6.900147438049316, "global_step": 148039, "epoch": 3524} {"train_loss": -6.770216464996338, "global_step": 148040, "epoch": 3524} {"train_loss": -6.729377746582031, "global_step": 148041, "epoch": 3524} {"train_loss": -6.862452507019043, "global_step": 148042, "epoch": 3524} {"train_loss": -6.806907653808594, "global_step": 148043, "epoch": 3524} {"train_loss": -6.737299919128418, "global_step": 148044, "epoch": 3524} {"train_loss": -6.832821846008301, "global_step": 148045, "epoch": 3524} {"train_loss": -6.772741317749023, "global_step": 148046, "epoch": 3524} {"train_loss": -6.690244674682617, "global_step": 148047, "epoch": 3524} {"train_loss": -6.872458457946777, "global_step": 148048, "epoch": 3524} {"train_loss": -6.818045037133353, "global_step": 148049, "epoch": 3524, "val_loss": 67810.8984375} {"train_loss": -6.878355979919434, "global_step": 148050, "epoch": 3525} {"train_loss": -6.9082489013671875, "global_step": 148051, "epoch": 3525} {"train_loss": -6.839932441711426, "global_step": 148052, "epoch": 3525} {"train_loss": -6.9440155029296875, "global_step": 148053, "epoch": 3525} {"train_loss": -6.839582443237305, "global_step": 148054, "epoch": 3525} {"train_loss": -6.840887069702148, "global_step": 148055, "epoch": 3525} {"train_loss": -6.804163455963135, "global_step": 148056, "epoch": 3525} {"train_loss": -6.937066078186035, "global_step": 148057, "epoch": 3525} {"train_loss": -6.921710968017578, "global_step": 148058, "epoch": 3525} {"train_loss": -6.761025428771973, "global_step": 148059, "epoch": 3525} {"train_loss": -6.818428039550781, "global_step": 148060, "epoch": 3525} {"train_loss": -6.78507137298584, "global_step": 148061, "epoch": 3525} {"train_loss": -6.926443099975586, "global_step": 148062, "epoch": 3525} {"train_loss": -6.817032337188721, "global_step": 148063, "epoch": 3525} {"train_loss": -6.829967021942139, "global_step": 148064, "epoch": 3525} {"train_loss": -6.956917762756348, "global_step": 148065, "epoch": 3525} {"train_loss": -6.850687026977539, "global_step": 148066, "epoch": 3525} {"train_loss": -6.841885566711426, "global_step": 148067, "epoch": 3525} {"train_loss": -6.89124059677124, "global_step": 148068, "epoch": 3525} {"train_loss": -6.914920330047607, "global_step": 148069, "epoch": 3525} {"train_loss": -6.864535331726074, "global_step": 148070, "epoch": 3525} {"train_loss": -6.935832977294922, "global_step": 148071, "epoch": 3525} {"train_loss": -6.907731056213379, "global_step": 148072, "epoch": 3525} {"train_loss": -6.804937839508057, "global_step": 148073, "epoch": 3525} {"train_loss": -6.828768253326416, "global_step": 148074, "epoch": 3525} {"train_loss": -6.830309867858887, "global_step": 148075, "epoch": 3525} {"train_loss": -6.812402725219727, "global_step": 148076, "epoch": 3525} {"train_loss": -6.917325019836426, "global_step": 148077, "epoch": 3525} {"train_loss": -6.955543041229248, "global_step": 148078, "epoch": 3525} {"train_loss": -6.8114213943481445, "global_step": 148079, "epoch": 3525} {"train_loss": -6.951611042022705, "global_step": 148080, "epoch": 3525} {"train_loss": -6.846035480499268, "global_step": 148081, "epoch": 3525} {"train_loss": -6.736889839172363, "global_step": 148082, "epoch": 3525} {"train_loss": -6.8663129806518555, "global_step": 148083, "epoch": 3525} {"train_loss": -6.832912921905518, "global_step": 148084, "epoch": 3525} {"train_loss": -6.786317825317383, "global_step": 148085, "epoch": 3525} {"train_loss": -6.888190269470215, "global_step": 148086, "epoch": 3525} {"train_loss": -6.727399826049805, "global_step": 148087, "epoch": 3525} {"train_loss": -6.781167030334473, "global_step": 148088, "epoch": 3525} {"train_loss": -6.909697532653809, "global_step": 148089, "epoch": 3525} {"train_loss": -6.958237648010254, "global_step": 148090, "epoch": 3525} {"train_loss": -6.8609354723067515, "global_step": 148091, "epoch": 3525, "val_loss": 67928.0859375} {"train_loss": -6.999013900756836, "global_step": 148092, "epoch": 3526} {"train_loss": -6.691183567047119, "global_step": 148093, "epoch": 3526} {"train_loss": -6.780339241027832, "global_step": 148094, "epoch": 3526} {"train_loss": -6.762999534606934, "global_step": 148095, "epoch": 3526} {"train_loss": -6.792204856872559, "global_step": 148096, "epoch": 3526} {"train_loss": -6.89619255065918, "global_step": 148097, "epoch": 3526} {"train_loss": -6.900334358215332, "global_step": 148098, "epoch": 3526} {"train_loss": -6.756903648376465, "global_step": 148099, "epoch": 3526} {"train_loss": -6.8621320724487305, "global_step": 148100, "epoch": 3526} {"train_loss": -6.733792304992676, "global_step": 148101, "epoch": 3526} {"train_loss": -6.774463653564453, "global_step": 148102, "epoch": 3526} {"train_loss": -6.744574546813965, "global_step": 148103, "epoch": 3526} {"train_loss": -6.861083030700684, "global_step": 148104, "epoch": 3526} {"train_loss": -6.8672895431518555, "global_step": 148105, "epoch": 3526} {"train_loss": -6.700860023498535, "global_step": 148106, "epoch": 3526} {"train_loss": -6.846085548400879, "global_step": 148107, "epoch": 3526} {"train_loss": -6.9008684158325195, "global_step": 148108, "epoch": 3526} {"train_loss": -6.733932018280029, "global_step": 148109, "epoch": 3526} {"train_loss": -6.809983253479004, "global_step": 148110, "epoch": 3526} {"train_loss": -6.750452995300293, "global_step": 148111, "epoch": 3526} {"train_loss": -6.735728740692139, "global_step": 148112, "epoch": 3526} {"train_loss": -6.791636943817139, "global_step": 148113, "epoch": 3526} {"train_loss": -6.8488874435424805, "global_step": 148114, "epoch": 3526} {"train_loss": -6.828336715698242, "global_step": 148115, "epoch": 3526} {"train_loss": -6.8152995109558105, "global_step": 148116, "epoch": 3526} {"train_loss": -6.781741619110107, "global_step": 148117, "epoch": 3526} {"train_loss": -6.7344207763671875, "global_step": 148118, "epoch": 3526} {"train_loss": -6.802030086517334, "global_step": 148119, "epoch": 3526} {"train_loss": -6.9278130531311035, "global_step": 148120, "epoch": 3526} {"train_loss": -6.805018424987793, "global_step": 148121, "epoch": 3526} {"train_loss": -6.747537136077881, "global_step": 148122, "epoch": 3526} {"train_loss": -6.7495245933532715, "global_step": 148123, "epoch": 3526} {"train_loss": -6.935098648071289, "global_step": 148124, "epoch": 3526} {"train_loss": -6.912515163421631, "global_step": 148125, "epoch": 3526} {"train_loss": -6.86185359954834, "global_step": 148126, "epoch": 3526} {"train_loss": -6.741032123565674, "global_step": 148127, "epoch": 3526} {"train_loss": -6.86066198348999, "global_step": 148128, "epoch": 3526} {"train_loss": -6.884332180023193, "global_step": 148129, "epoch": 3526} {"train_loss": -6.854701042175293, "global_step": 148130, "epoch": 3526} {"train_loss": -6.79954195022583, "global_step": 148131, "epoch": 3526} {"train_loss": -6.808408737182617, "global_step": 148132, "epoch": 3526} {"train_loss": -6.813567785989671, "global_step": 148133, "epoch": 3526, "val_loss": 67974.578125} {"train_loss": -6.838679313659668, "global_step": 148134, "epoch": 3527} {"train_loss": -6.771809101104736, "global_step": 148135, "epoch": 3527} {"train_loss": -6.708420753479004, "global_step": 148136, "epoch": 3527} {"train_loss": -6.713923454284668, "global_step": 148137, "epoch": 3527} {"train_loss": -6.808485984802246, "global_step": 148138, "epoch": 3527} {"train_loss": -6.729679107666016, "global_step": 148139, "epoch": 3527} {"train_loss": -6.8329362869262695, "global_step": 148140, "epoch": 3527} {"train_loss": -6.804008483886719, "global_step": 148141, "epoch": 3527} {"train_loss": -6.749834060668945, "global_step": 148142, "epoch": 3527} {"train_loss": -6.7576398849487305, "global_step": 148143, "epoch": 3527} {"train_loss": -6.792351722717285, "global_step": 148144, "epoch": 3527} {"train_loss": -6.879593849182129, "global_step": 148145, "epoch": 3527} {"train_loss": -6.838639736175537, "global_step": 148146, "epoch": 3527} {"train_loss": -6.862785339355469, "global_step": 148147, "epoch": 3527} {"train_loss": -6.895036697387695, "global_step": 148148, "epoch": 3527} {"train_loss": -6.7830810546875, "global_step": 148149, "epoch": 3527} {"train_loss": -6.842100620269775, "global_step": 148150, "epoch": 3527} {"train_loss": -6.91685676574707, "global_step": 148151, "epoch": 3527} {"train_loss": -6.806174278259277, "global_step": 148152, "epoch": 3527} {"train_loss": -6.873786926269531, "global_step": 148153, "epoch": 3527} {"train_loss": -6.840811729431152, "global_step": 148154, "epoch": 3527} {"train_loss": -6.714807033538818, "global_step": 148155, "epoch": 3527} {"train_loss": -6.8092498779296875, "global_step": 148156, "epoch": 3527} {"train_loss": -6.761342525482178, "global_step": 148157, "epoch": 3527} {"train_loss": -6.89129638671875, "global_step": 148158, "epoch": 3527} {"train_loss": -6.916181564331055, "global_step": 148159, "epoch": 3527} {"train_loss": -6.766060829162598, "global_step": 148160, "epoch": 3527} {"train_loss": -6.881242752075195, "global_step": 148161, "epoch": 3527} {"train_loss": -6.957012176513672, "global_step": 148162, "epoch": 3527} {"train_loss": -6.702462196350098, "global_step": 148163, "epoch": 3527} {"train_loss": -6.945045471191406, "global_step": 148164, "epoch": 3527} {"train_loss": -6.708268165588379, "global_step": 148165, "epoch": 3527} {"train_loss": -6.8001556396484375, "global_step": 148166, "epoch": 3527} {"train_loss": -6.807760238647461, "global_step": 148167, "epoch": 3527} {"train_loss": -6.793074131011963, "global_step": 148168, "epoch": 3527} {"train_loss": -6.788239002227783, "global_step": 148169, "epoch": 3527} {"train_loss": -6.794174671173096, "global_step": 148170, "epoch": 3527} {"train_loss": -6.784083366394043, "global_step": 148171, "epoch": 3527} {"train_loss": -6.801916122436523, "global_step": 148172, "epoch": 3527} {"train_loss": -6.710254669189453, "global_step": 148173, "epoch": 3527} {"train_loss": -6.901557445526123, "global_step": 148174, "epoch": 3527} {"train_loss": -6.813013769331432, "global_step": 148175, "epoch": 3527, "val_loss": 67741.2578125} {"train_loss": -6.976468563079834, "global_step": 148176, "epoch": 3528} {"train_loss": -6.800277233123779, "global_step": 148177, "epoch": 3528} {"train_loss": -6.8306427001953125, "global_step": 148178, "epoch": 3528} {"train_loss": -6.708149433135986, "global_step": 148179, "epoch": 3528} {"train_loss": -6.765010356903076, "global_step": 148180, "epoch": 3528} {"train_loss": -6.803350925445557, "global_step": 148181, "epoch": 3528} {"train_loss": -6.864958763122559, "global_step": 148182, "epoch": 3528} {"train_loss": -6.746420383453369, "global_step": 148183, "epoch": 3528} {"train_loss": -6.799561977386475, "global_step": 148184, "epoch": 3528} {"train_loss": -6.8702778816223145, "global_step": 148185, "epoch": 3528} {"train_loss": -6.854634761810303, "global_step": 148186, "epoch": 3528} {"train_loss": -6.80613899230957, "global_step": 148187, "epoch": 3528} {"train_loss": -6.886466026306152, "global_step": 148188, "epoch": 3528} {"train_loss": -6.6945319175720215, "global_step": 148189, "epoch": 3528} {"train_loss": -6.6789116859436035, "global_step": 148190, "epoch": 3528} {"train_loss": -6.7540283203125, "global_step": 148191, "epoch": 3528} {"train_loss": -6.728374481201172, "global_step": 148192, "epoch": 3528} {"train_loss": -6.810152530670166, "global_step": 148193, "epoch": 3528} {"train_loss": -6.753681182861328, "global_step": 148194, "epoch": 3528} {"train_loss": -6.864251136779785, "global_step": 148195, "epoch": 3528} {"train_loss": -6.7315473556518555, "global_step": 148196, "epoch": 3528} {"train_loss": -6.898417949676514, "global_step": 148197, "epoch": 3528} {"train_loss": -6.84352970123291, "global_step": 148198, "epoch": 3528} {"train_loss": -6.932323932647705, "global_step": 148199, "epoch": 3528} {"train_loss": -6.798952579498291, "global_step": 148200, "epoch": 3528} {"train_loss": -6.828718185424805, "global_step": 148201, "epoch": 3528} {"train_loss": -6.773839950561523, "global_step": 148202, "epoch": 3528} {"train_loss": -6.710131645202637, "global_step": 148203, "epoch": 3528} {"train_loss": -6.835131645202637, "global_step": 148204, "epoch": 3528} {"train_loss": -6.911916255950928, "global_step": 148205, "epoch": 3528} {"train_loss": -6.63033390045166, "global_step": 148206, "epoch": 3528} {"train_loss": -6.821002006530762, "global_step": 148207, "epoch": 3528} {"train_loss": -6.889633655548096, "global_step": 148208, "epoch": 3528} {"train_loss": -6.723482131958008, "global_step": 148209, "epoch": 3528} {"train_loss": -6.81121826171875, "global_step": 148210, "epoch": 3528} {"train_loss": -6.772385597229004, "global_step": 148211, "epoch": 3528} {"train_loss": -6.739838123321533, "global_step": 148212, "epoch": 3528} {"train_loss": -6.871972560882568, "global_step": 148213, "epoch": 3528} {"train_loss": -6.711281776428223, "global_step": 148214, "epoch": 3528} {"train_loss": -6.817103862762451, "global_step": 148215, "epoch": 3528} {"train_loss": -6.755901336669922, "global_step": 148216, "epoch": 3528} {"train_loss": -6.796972229367211, "global_step": 148217, "epoch": 3528, "val_loss": 67748.6640625} {"train_loss": -6.828024864196777, "global_step": 148218, "epoch": 3529} {"train_loss": -6.7972917556762695, "global_step": 148219, "epoch": 3529} {"train_loss": -6.7701616287231445, "global_step": 148220, "epoch": 3529} {"train_loss": -6.86845588684082, "global_step": 148221, "epoch": 3529} {"train_loss": -6.795449256896973, "global_step": 148222, "epoch": 3529} {"train_loss": -6.835989952087402, "global_step": 148223, "epoch": 3529} {"train_loss": -6.783977031707764, "global_step": 148224, "epoch": 3529} {"train_loss": -6.827096939086914, "global_step": 148225, "epoch": 3529} {"train_loss": -6.792459487915039, "global_step": 148226, "epoch": 3529} {"train_loss": -6.872079372406006, "global_step": 148227, "epoch": 3529} {"train_loss": -6.895708084106445, "global_step": 148228, "epoch": 3529} {"train_loss": -6.911778926849365, "global_step": 148229, "epoch": 3529} {"train_loss": -6.928118705749512, "global_step": 148230, "epoch": 3529} {"train_loss": -6.902048110961914, "global_step": 148231, "epoch": 3529} {"train_loss": -6.809316635131836, "global_step": 148232, "epoch": 3529} {"train_loss": -6.931394577026367, "global_step": 148233, "epoch": 3529} {"train_loss": -6.8501667976379395, "global_step": 148234, "epoch": 3529} {"train_loss": -6.896985054016113, "global_step": 148235, "epoch": 3529} {"train_loss": -6.7384819984436035, "global_step": 148236, "epoch": 3529} {"train_loss": -6.954214096069336, "global_step": 148237, "epoch": 3529} {"train_loss": -6.827990531921387, "global_step": 148238, "epoch": 3529} {"train_loss": -6.818246841430664, "global_step": 148239, "epoch": 3529} {"train_loss": -6.885046482086182, "global_step": 148240, "epoch": 3529} {"train_loss": -6.777712821960449, "global_step": 148241, "epoch": 3529} {"train_loss": -6.708423137664795, "global_step": 148242, "epoch": 3529} {"train_loss": -6.813900947570801, "global_step": 148243, "epoch": 3529} {"train_loss": -6.778334617614746, "global_step": 148244, "epoch": 3529} {"train_loss": -6.762166976928711, "global_step": 148245, "epoch": 3529} {"train_loss": -6.870316505432129, "global_step": 148246, "epoch": 3529} {"train_loss": -6.905622482299805, "global_step": 148247, "epoch": 3529} {"train_loss": -6.740547180175781, "global_step": 148248, "epoch": 3529} {"train_loss": -6.875642776489258, "global_step": 148249, "epoch": 3529} {"train_loss": -6.836849212646484, "global_step": 148250, "epoch": 3529} {"train_loss": -6.768506050109863, "global_step": 148251, "epoch": 3529} {"train_loss": -6.801007270812988, "global_step": 148252, "epoch": 3529} {"train_loss": -6.923430919647217, "global_step": 148253, "epoch": 3529} {"train_loss": -6.852618217468262, "global_step": 148254, "epoch": 3529} {"train_loss": -6.6983747482299805, "global_step": 148255, "epoch": 3529} {"train_loss": -6.952539443969727, "global_step": 148256, "epoch": 3529} {"train_loss": -6.83095121383667, "global_step": 148257, "epoch": 3529} {"train_loss": -6.748412132263184, "global_step": 148258, "epoch": 3529} {"train_loss": -6.83391353062221, "global_step": 148259, "epoch": 3529, "val_loss": 67821.234375} {"train_loss": -6.814632892608643, "global_step": 148260, "epoch": 3530} {"train_loss": -6.842070579528809, "global_step": 148261, "epoch": 3530} {"train_loss": -6.731533527374268, "global_step": 148262, "epoch": 3530} {"train_loss": -6.813119888305664, "global_step": 148263, "epoch": 3530} {"train_loss": -6.838273048400879, "global_step": 148264, "epoch": 3530} {"train_loss": -6.71544885635376, "global_step": 148265, "epoch": 3530} {"train_loss": -6.798015594482422, "global_step": 148266, "epoch": 3530} {"train_loss": -6.7427568435668945, "global_step": 148267, "epoch": 3530} {"train_loss": -6.788808822631836, "global_step": 148268, "epoch": 3530} {"train_loss": -6.780032157897949, "global_step": 148269, "epoch": 3530} {"train_loss": -6.844128608703613, "global_step": 148270, "epoch": 3530} {"train_loss": -6.847927093505859, "global_step": 148271, "epoch": 3530} {"train_loss": -6.767921447753906, "global_step": 148272, "epoch": 3530} {"train_loss": -6.888416290283203, "global_step": 148273, "epoch": 3530} {"train_loss": -6.7892913818359375, "global_step": 148274, "epoch": 3530} {"train_loss": -6.725987911224365, "global_step": 148275, "epoch": 3530} {"train_loss": -6.83258581161499, "global_step": 148276, "epoch": 3530} {"train_loss": -6.889488220214844, "global_step": 148277, "epoch": 3530} {"train_loss": -6.780226707458496, "global_step": 148278, "epoch": 3530} {"train_loss": -6.845236301422119, "global_step": 148279, "epoch": 3530} {"train_loss": -6.844259738922119, "global_step": 148280, "epoch": 3530} {"train_loss": -6.639749050140381, "global_step": 148281, "epoch": 3530} {"train_loss": -6.799078941345215, "global_step": 148282, "epoch": 3530} {"train_loss": -6.663837432861328, "global_step": 148283, "epoch": 3530} {"train_loss": -6.800530433654785, "global_step": 148284, "epoch": 3530} {"train_loss": -6.831380844116211, "global_step": 148285, "epoch": 3530} {"train_loss": -6.663477897644043, "global_step": 148286, "epoch": 3530} {"train_loss": -6.838115692138672, "global_step": 148287, "epoch": 3530} {"train_loss": -6.7380781173706055, "global_step": 148288, "epoch": 3530} {"train_loss": -6.808786869049072, "global_step": 148289, "epoch": 3530} {"train_loss": -6.791319847106934, "global_step": 148290, "epoch": 3530} {"train_loss": -6.778747081756592, "global_step": 148291, "epoch": 3530} {"train_loss": -6.877412796020508, "global_step": 148292, "epoch": 3530} {"train_loss": -6.759126663208008, "global_step": 148293, "epoch": 3530} {"train_loss": -6.7974419593811035, "global_step": 148294, "epoch": 3530} {"train_loss": -6.823853492736816, "global_step": 148295, "epoch": 3530} {"train_loss": -6.79239559173584, "global_step": 148296, "epoch": 3530} {"train_loss": -6.911507606506348, "global_step": 148297, "epoch": 3530} {"train_loss": -6.772043704986572, "global_step": 148298, "epoch": 3530} {"train_loss": -6.893821716308594, "global_step": 148299, "epoch": 3530} {"train_loss": -6.86379337310791, "global_step": 148300, "epoch": 3530} {"train_loss": -6.802018790017991, "global_step": 148301, "epoch": 3530, "val_loss": 68009.6015625} {"train_loss": -6.792309761047363, "global_step": 148302, "epoch": 3531} {"train_loss": -6.708189964294434, "global_step": 148303, "epoch": 3531} {"train_loss": -6.869921684265137, "global_step": 148304, "epoch": 3531} {"train_loss": -6.840147972106934, "global_step": 148305, "epoch": 3531} {"train_loss": -6.896400451660156, "global_step": 148306, "epoch": 3531} {"train_loss": -6.766690254211426, "global_step": 148307, "epoch": 3531} {"train_loss": -6.76500129699707, "global_step": 148308, "epoch": 3531} {"train_loss": -6.832481384277344, "global_step": 148309, "epoch": 3531} {"train_loss": -6.842974662780762, "global_step": 148310, "epoch": 3531} {"train_loss": -6.80662727355957, "global_step": 148311, "epoch": 3531} {"train_loss": -6.858633041381836, "global_step": 148312, "epoch": 3531} {"train_loss": -6.749122619628906, "global_step": 148313, "epoch": 3531} {"train_loss": -6.886685848236084, "global_step": 148314, "epoch": 3531} {"train_loss": -6.931632995605469, "global_step": 148315, "epoch": 3531} {"train_loss": -6.829737186431885, "global_step": 148316, "epoch": 3531} {"train_loss": -6.929288864135742, "global_step": 148317, "epoch": 3531} {"train_loss": -6.872265815734863, "global_step": 148318, "epoch": 3531} {"train_loss": -6.8384294509887695, "global_step": 148319, "epoch": 3531} {"train_loss": -6.720094680786133, "global_step": 148320, "epoch": 3531} {"train_loss": -6.878188133239746, "global_step": 148321, "epoch": 3531} {"train_loss": -6.886258125305176, "global_step": 148322, "epoch": 3531} {"train_loss": -6.63275146484375, "global_step": 148323, "epoch": 3531} {"train_loss": -6.905987739562988, "global_step": 148324, "epoch": 3531} {"train_loss": -6.750638961791992, "global_step": 148325, "epoch": 3531} {"train_loss": -6.68790340423584, "global_step": 148326, "epoch": 3531} {"train_loss": -6.794380187988281, "global_step": 148327, "epoch": 3531} {"train_loss": -6.939670085906982, "global_step": 148328, "epoch": 3531} {"train_loss": -6.803982734680176, "global_step": 148329, "epoch": 3531} {"train_loss": -6.888175010681152, "global_step": 148330, "epoch": 3531} {"train_loss": -6.755476951599121, "global_step": 148331, "epoch": 3531} {"train_loss": -6.895352840423584, "global_step": 148332, "epoch": 3531} {"train_loss": -6.892272472381592, "global_step": 148333, "epoch": 3531} {"train_loss": -6.7579803466796875, "global_step": 148334, "epoch": 3531} {"train_loss": -6.792324066162109, "global_step": 148335, "epoch": 3531} {"train_loss": -6.777101039886475, "global_step": 148336, "epoch": 3531} {"train_loss": -6.836092948913574, "global_step": 148337, "epoch": 3531} {"train_loss": -6.812610149383545, "global_step": 148338, "epoch": 3531} {"train_loss": -6.865646839141846, "global_step": 148339, "epoch": 3531} {"train_loss": -6.728436470031738, "global_step": 148340, "epoch": 3531} {"train_loss": -6.881829261779785, "global_step": 148341, "epoch": 3531} {"train_loss": -6.898597717285156, "global_step": 148342, "epoch": 3531} {"train_loss": -6.825035299573626, "global_step": 148343, "epoch": 3531, "val_loss": 67984.59375} {"train_loss": -6.799869060516357, "global_step": 148344, "epoch": 3532} {"train_loss": -6.8059892654418945, "global_step": 148345, "epoch": 3532} {"train_loss": -6.846229553222656, "global_step": 148346, "epoch": 3532} {"train_loss": -6.851222991943359, "global_step": 148347, "epoch": 3532} {"train_loss": -6.825428009033203, "global_step": 148348, "epoch": 3532} {"train_loss": -6.799010276794434, "global_step": 148349, "epoch": 3532} {"train_loss": -6.844569206237793, "global_step": 148350, "epoch": 3532} {"train_loss": -6.880245208740234, "global_step": 148351, "epoch": 3532} {"train_loss": -6.803014755249023, "global_step": 148352, "epoch": 3532} {"train_loss": -6.934615612030029, "global_step": 148353, "epoch": 3532} {"train_loss": -6.841193199157715, "global_step": 148354, "epoch": 3532} {"train_loss": -6.739130020141602, "global_step": 148355, "epoch": 3532} {"train_loss": -6.876745223999023, "global_step": 148356, "epoch": 3532} {"train_loss": -6.855527877807617, "global_step": 148357, "epoch": 3532} {"train_loss": -6.843597412109375, "global_step": 148358, "epoch": 3532} {"train_loss": -6.957730293273926, "global_step": 148359, "epoch": 3532} {"train_loss": -6.808869361877441, "global_step": 148360, "epoch": 3532} {"train_loss": -6.982789993286133, "global_step": 148361, "epoch": 3532} {"train_loss": -6.781094551086426, "global_step": 148362, "epoch": 3532} {"train_loss": -6.79369592666626, "global_step": 148363, "epoch": 3532} {"train_loss": -6.8280463218688965, "global_step": 148364, "epoch": 3532} {"train_loss": -6.8345441818237305, "global_step": 148365, "epoch": 3532} {"train_loss": -6.893157958984375, "global_step": 148366, "epoch": 3532} {"train_loss": -6.894898414611816, "global_step": 148367, "epoch": 3532} {"train_loss": -6.840380668640137, "global_step": 148368, "epoch": 3532} {"train_loss": -6.8189544677734375, "global_step": 148369, "epoch": 3532} {"train_loss": -6.803532600402832, "global_step": 148370, "epoch": 3532} {"train_loss": -6.838794708251953, "global_step": 148371, "epoch": 3532} {"train_loss": -6.758034706115723, "global_step": 148372, "epoch": 3532} {"train_loss": -6.85244083404541, "global_step": 148373, "epoch": 3532} {"train_loss": -6.914700031280518, "global_step": 148374, "epoch": 3532} {"train_loss": -6.8097429275512695, "global_step": 148375, "epoch": 3532} {"train_loss": -6.93781852722168, "global_step": 148376, "epoch": 3532} {"train_loss": -6.8712968826293945, "global_step": 148377, "epoch": 3532} {"train_loss": -6.76392936706543, "global_step": 148378, "epoch": 3532} {"train_loss": -6.803602695465088, "global_step": 148379, "epoch": 3532} {"train_loss": -6.829179763793945, "global_step": 148380, "epoch": 3532} {"train_loss": -6.876327991485596, "global_step": 148381, "epoch": 3532} {"train_loss": -6.914913177490234, "global_step": 148382, "epoch": 3532} {"train_loss": -6.905603885650635, "global_step": 148383, "epoch": 3532} {"train_loss": -6.911031723022461, "global_step": 148384, "epoch": 3532} {"train_loss": -6.849234013330369, "global_step": 148385, "epoch": 3532, "val_loss": 68172.78125} {"train_loss": -6.942647933959961, "global_step": 148386, "epoch": 3533} {"train_loss": -6.78639030456543, "global_step": 148387, "epoch": 3533} {"train_loss": -6.890974998474121, "global_step": 148388, "epoch": 3533} {"train_loss": -6.956616401672363, "global_step": 148389, "epoch": 3533} {"train_loss": -6.835089683532715, "global_step": 148390, "epoch": 3533} {"train_loss": -6.855862617492676, "global_step": 148391, "epoch": 3533} {"train_loss": -6.742835521697998, "global_step": 148392, "epoch": 3533} {"train_loss": -6.820901870727539, "global_step": 148393, "epoch": 3533} {"train_loss": -6.812426567077637, "global_step": 148394, "epoch": 3533} {"train_loss": -6.7297163009643555, "global_step": 148395, "epoch": 3533} {"train_loss": -6.78549861907959, "global_step": 148396, "epoch": 3533} {"train_loss": -6.988888740539551, "global_step": 148397, "epoch": 3533} {"train_loss": -6.761625289916992, "global_step": 148398, "epoch": 3533} {"train_loss": -6.865756511688232, "global_step": 148399, "epoch": 3533} {"train_loss": -6.788121223449707, "global_step": 148400, "epoch": 3533} {"train_loss": -6.76865291595459, "global_step": 148401, "epoch": 3533} {"train_loss": -6.818234920501709, "global_step": 148402, "epoch": 3533} {"train_loss": -6.835090637207031, "global_step": 148403, "epoch": 3533} {"train_loss": -6.848607063293457, "global_step": 148404, "epoch": 3533} {"train_loss": -6.828941345214844, "global_step": 148405, "epoch": 3533} {"train_loss": -6.927725791931152, "global_step": 148406, "epoch": 3533} {"train_loss": -6.888071537017822, "global_step": 148407, "epoch": 3533} {"train_loss": -6.790279388427734, "global_step": 148408, "epoch": 3533} {"train_loss": -6.923480033874512, "global_step": 148409, "epoch": 3533} {"train_loss": -6.821585655212402, "global_step": 148410, "epoch": 3533} {"train_loss": -6.849477767944336, "global_step": 148411, "epoch": 3533} {"train_loss": -6.919399261474609, "global_step": 148412, "epoch": 3533} {"train_loss": -6.784846305847168, "global_step": 148413, "epoch": 3533} {"train_loss": -6.730620384216309, "global_step": 148414, "epoch": 3533} {"train_loss": -6.84889030456543, "global_step": 148415, "epoch": 3533} {"train_loss": -6.760997295379639, "global_step": 148416, "epoch": 3533} {"train_loss": -6.912449836730957, "global_step": 148417, "epoch": 3533} {"train_loss": -6.743710994720459, "global_step": 148418, "epoch": 3533} {"train_loss": -6.9319610595703125, "global_step": 148419, "epoch": 3533} {"train_loss": -6.704241752624512, "global_step": 148420, "epoch": 3533} {"train_loss": -6.833499908447266, "global_step": 148421, "epoch": 3533} {"train_loss": -6.762783050537109, "global_step": 148422, "epoch": 3533} {"train_loss": -6.849959373474121, "global_step": 148423, "epoch": 3533} {"train_loss": -6.857709884643555, "global_step": 148424, "epoch": 3533} {"train_loss": -6.793144226074219, "global_step": 148425, "epoch": 3533} {"train_loss": -6.847297668457031, "global_step": 148426, "epoch": 3533} {"train_loss": -6.829694793337867, "global_step": 148427, "epoch": 3533, "val_loss": 67940.4609375} {"train_loss": -6.741857528686523, "global_step": 148428, "epoch": 3534} {"train_loss": -6.774123668670654, "global_step": 148429, "epoch": 3534} {"train_loss": -6.936501502990723, "global_step": 148430, "epoch": 3534} {"train_loss": -6.786124229431152, "global_step": 148431, "epoch": 3534} {"train_loss": -6.921152114868164, "global_step": 148432, "epoch": 3534} {"train_loss": -6.841829299926758, "global_step": 148433, "epoch": 3534} {"train_loss": -6.858788967132568, "global_step": 148434, "epoch": 3534} {"train_loss": -6.88394021987915, "global_step": 148435, "epoch": 3534} {"train_loss": -6.759698390960693, "global_step": 148436, "epoch": 3534} {"train_loss": -6.765631675720215, "global_step": 148437, "epoch": 3534} {"train_loss": -6.887424945831299, "global_step": 148438, "epoch": 3534} {"train_loss": -6.707102298736572, "global_step": 148439, "epoch": 3534} {"train_loss": -6.848154067993164, "global_step": 148440, "epoch": 3534} {"train_loss": -6.8314924240112305, "global_step": 148441, "epoch": 3534} {"train_loss": -6.714295387268066, "global_step": 148442, "epoch": 3534} {"train_loss": -6.80256462097168, "global_step": 148443, "epoch": 3534} {"train_loss": -6.796440124511719, "global_step": 148444, "epoch": 3534} {"train_loss": -6.743639945983887, "global_step": 148445, "epoch": 3534} {"train_loss": -6.867932319641113, "global_step": 148446, "epoch": 3534} {"train_loss": -6.84890079498291, "global_step": 148447, "epoch": 3534} {"train_loss": -6.827139854431152, "global_step": 148448, "epoch": 3534} {"train_loss": -6.926294326782227, "global_step": 148449, "epoch": 3534} {"train_loss": -6.808234214782715, "global_step": 148450, "epoch": 3534} {"train_loss": -6.853095531463623, "global_step": 148451, "epoch": 3534} {"train_loss": -6.898914813995361, "global_step": 148452, "epoch": 3534} {"train_loss": -6.827763557434082, "global_step": 148453, "epoch": 3534} {"train_loss": -6.734753608703613, "global_step": 148454, "epoch": 3534} {"train_loss": -6.802468776702881, "global_step": 148455, "epoch": 3534} {"train_loss": -6.8027801513671875, "global_step": 148456, "epoch": 3534} {"train_loss": -6.837278366088867, "global_step": 148457, "epoch": 3534} {"train_loss": -6.892146110534668, "global_step": 148458, "epoch": 3534} {"train_loss": -6.726693153381348, "global_step": 148459, "epoch": 3534} {"train_loss": -6.864503860473633, "global_step": 148460, "epoch": 3534} {"train_loss": -6.853853702545166, "global_step": 148461, "epoch": 3534} {"train_loss": -6.75436544418335, "global_step": 148462, "epoch": 3534} {"train_loss": -6.894311428070068, "global_step": 148463, "epoch": 3534} {"train_loss": -6.756705284118652, "global_step": 148464, "epoch": 3534} {"train_loss": -6.804755210876465, "global_step": 148465, "epoch": 3534} {"train_loss": -6.897555351257324, "global_step": 148466, "epoch": 3534} {"train_loss": -6.954802989959717, "global_step": 148467, "epoch": 3534} {"train_loss": -6.901345729827881, "global_step": 148468, "epoch": 3534} {"train_loss": -6.826484078452701, "global_step": 148469, "epoch": 3534, "val_loss": 67837.265625} {"train_loss": -6.832136154174805, "global_step": 148470, "epoch": 3535} {"train_loss": -6.895729064941406, "global_step": 148471, "epoch": 3535} {"train_loss": -6.807352542877197, "global_step": 148472, "epoch": 3535} {"train_loss": -6.754179000854492, "global_step": 148473, "epoch": 3535} {"train_loss": -6.925112247467041, "global_step": 148474, "epoch": 3535} {"train_loss": -6.8346734046936035, "global_step": 148475, "epoch": 3535} {"train_loss": -6.801426887512207, "global_step": 148476, "epoch": 3535} {"train_loss": -6.964582920074463, "global_step": 148477, "epoch": 3535} {"train_loss": -6.8853559494018555, "global_step": 148478, "epoch": 3535} {"train_loss": -6.84836483001709, "global_step": 148479, "epoch": 3535} {"train_loss": -6.770336151123047, "global_step": 148480, "epoch": 3535} {"train_loss": -6.775856971740723, "global_step": 148481, "epoch": 3535} {"train_loss": -6.781063079833984, "global_step": 148482, "epoch": 3535} {"train_loss": -6.673676013946533, "global_step": 148483, "epoch": 3535} {"train_loss": -6.784165859222412, "global_step": 148484, "epoch": 3535} {"train_loss": -6.767842769622803, "global_step": 148485, "epoch": 3535} {"train_loss": -6.746126174926758, "global_step": 148486, "epoch": 3535} {"train_loss": -6.928937911987305, "global_step": 148487, "epoch": 3535} {"train_loss": -6.8756022453308105, "global_step": 148488, "epoch": 3535} {"train_loss": -6.800948143005371, "global_step": 148489, "epoch": 3535} {"train_loss": -6.856790542602539, "global_step": 148490, "epoch": 3535} {"train_loss": -6.8631134033203125, "global_step": 148491, "epoch": 3535} {"train_loss": -6.943799018859863, "global_step": 148492, "epoch": 3535} {"train_loss": -6.928502559661865, "global_step": 148493, "epoch": 3535} {"train_loss": -6.83805513381958, "global_step": 148494, "epoch": 3535} {"train_loss": -6.827679634094238, "global_step": 148495, "epoch": 3535} {"train_loss": -6.880317687988281, "global_step": 148496, "epoch": 3535} {"train_loss": -6.880951404571533, "global_step": 148497, "epoch": 3535} {"train_loss": -6.777828693389893, "global_step": 148498, "epoch": 3535} {"train_loss": -6.825124740600586, "global_step": 148499, "epoch": 3535} {"train_loss": -6.798660755157471, "global_step": 148500, "epoch": 3535} {"train_loss": -6.896958351135254, "global_step": 148501, "epoch": 3535} {"train_loss": -6.762779235839844, "global_step": 148502, "epoch": 3535} {"train_loss": -6.860041618347168, "global_step": 148503, "epoch": 3535} {"train_loss": -6.8187127113342285, "global_step": 148504, "epoch": 3535} {"train_loss": -6.9215168952941895, "global_step": 148505, "epoch": 3535} {"train_loss": -6.798672199249268, "global_step": 148506, "epoch": 3535} {"train_loss": -6.893049240112305, "global_step": 148507, "epoch": 3535} {"train_loss": -6.853275775909424, "global_step": 148508, "epoch": 3535} {"train_loss": -6.741072654724121, "global_step": 148509, "epoch": 3535} {"train_loss": -6.790019989013672, "global_step": 148510, "epoch": 3535} {"train_loss": -6.834331012907482, "global_step": 148511, "epoch": 3535, "val_loss": 67831.75} {"train_loss": -6.826234817504883, "global_step": 148512, "epoch": 3536} {"train_loss": -6.907106399536133, "global_step": 148513, "epoch": 3536} {"train_loss": -6.8354034423828125, "global_step": 148514, "epoch": 3536} {"train_loss": -6.859951496124268, "global_step": 148515, "epoch": 3536} {"train_loss": -6.796988487243652, "global_step": 148516, "epoch": 3536} {"train_loss": -6.86433219909668, "global_step": 148517, "epoch": 3536} {"train_loss": -6.919130325317383, "global_step": 148518, "epoch": 3536} {"train_loss": -6.904799461364746, "global_step": 148519, "epoch": 3536} {"train_loss": -6.85406494140625, "global_step": 148520, "epoch": 3536} {"train_loss": -6.879351615905762, "global_step": 148521, "epoch": 3536} {"train_loss": -6.815456867218018, "global_step": 148522, "epoch": 3536} {"train_loss": -6.772933483123779, "global_step": 148523, "epoch": 3536} {"train_loss": -6.9034576416015625, "global_step": 148524, "epoch": 3536} {"train_loss": -6.865631103515625, "global_step": 148525, "epoch": 3536} {"train_loss": -6.680420398712158, "global_step": 148526, "epoch": 3536} {"train_loss": -6.843740940093994, "global_step": 148527, "epoch": 3536} {"train_loss": -6.953916072845459, "global_step": 148528, "epoch": 3536} {"train_loss": -6.879660606384277, "global_step": 148529, "epoch": 3536} {"train_loss": -6.75327205657959, "global_step": 148530, "epoch": 3536} {"train_loss": -6.901564598083496, "global_step": 148531, "epoch": 3536} {"train_loss": -6.796586036682129, "global_step": 148532, "epoch": 3536} {"train_loss": -6.900639057159424, "global_step": 148533, "epoch": 3536} {"train_loss": -6.789515972137451, "global_step": 148534, "epoch": 3536} {"train_loss": -6.8988542556762695, "global_step": 148535, "epoch": 3536} {"train_loss": -6.771965980529785, "global_step": 148536, "epoch": 3536} {"train_loss": -6.848838806152344, "global_step": 148537, "epoch": 3536} {"train_loss": -6.872653484344482, "global_step": 148538, "epoch": 3536} {"train_loss": -6.867802143096924, "global_step": 148539, "epoch": 3536} {"train_loss": -6.839874267578125, "global_step": 148540, "epoch": 3536} {"train_loss": -6.835763931274414, "global_step": 148541, "epoch": 3536} {"train_loss": -6.883561134338379, "global_step": 148542, "epoch": 3536} {"train_loss": -6.9448018074035645, "global_step": 148543, "epoch": 3536} {"train_loss": -6.766502380371094, "global_step": 148544, "epoch": 3536} {"train_loss": -6.764006614685059, "global_step": 148545, "epoch": 3536} {"train_loss": -6.9256391525268555, "global_step": 148546, "epoch": 3536} {"train_loss": -6.931635856628418, "global_step": 148547, "epoch": 3536} {"train_loss": -6.816246032714844, "global_step": 148548, "epoch": 3536} {"train_loss": -6.798105239868164, "global_step": 148549, "epoch": 3536} {"train_loss": -6.800655841827393, "global_step": 148550, "epoch": 3536} {"train_loss": -6.867217540740967, "global_step": 148551, "epoch": 3536} {"train_loss": -6.78304386138916, "global_step": 148552, "epoch": 3536} {"train_loss": -6.845250992547898, "global_step": 148553, "epoch": 3536, "val_loss": 67971.4765625} {"train_loss": -6.744633674621582, "global_step": 148554, "epoch": 3537} {"train_loss": -6.795536994934082, "global_step": 148555, "epoch": 3537} {"train_loss": -6.940807819366455, "global_step": 148556, "epoch": 3537} {"train_loss": -6.821785926818848, "global_step": 148557, "epoch": 3537} {"train_loss": -6.871755599975586, "global_step": 148558, "epoch": 3537} {"train_loss": -6.768838405609131, "global_step": 148559, "epoch": 3537} {"train_loss": -6.773479461669922, "global_step": 148560, "epoch": 3537} {"train_loss": -6.828663349151611, "global_step": 148561, "epoch": 3537} {"train_loss": -6.86142635345459, "global_step": 148562, "epoch": 3537} {"train_loss": -6.85308837890625, "global_step": 148563, "epoch": 3537} {"train_loss": -6.81456184387207, "global_step": 148564, "epoch": 3537} {"train_loss": -6.906320571899414, "global_step": 148565, "epoch": 3537} {"train_loss": -6.810788154602051, "global_step": 148566, "epoch": 3537} {"train_loss": -6.822925567626953, "global_step": 148567, "epoch": 3537} {"train_loss": -6.912045955657959, "global_step": 148568, "epoch": 3537} {"train_loss": -6.973847389221191, "global_step": 148569, "epoch": 3537} {"train_loss": -6.774811267852783, "global_step": 148570, "epoch": 3537} {"train_loss": -6.968686103820801, "global_step": 148571, "epoch": 3537} {"train_loss": -6.985866546630859, "global_step": 148572, "epoch": 3537} {"train_loss": -6.894274711608887, "global_step": 148573, "epoch": 3537} {"train_loss": -6.9885969161987305, "global_step": 148574, "epoch": 3537} {"train_loss": -6.961357593536377, "global_step": 148575, "epoch": 3537} {"train_loss": -7.0038743019104, "global_step": 148576, "epoch": 3537} {"train_loss": -6.860562801361084, "global_step": 148577, "epoch": 3537} {"train_loss": -6.889312267303467, "global_step": 148578, "epoch": 3537} {"train_loss": -6.885933876037598, "global_step": 148579, "epoch": 3537} {"train_loss": -6.890491485595703, "global_step": 148580, "epoch": 3537} {"train_loss": -6.906978607177734, "global_step": 148581, "epoch": 3537} {"train_loss": -6.904611110687256, "global_step": 148582, "epoch": 3537} {"train_loss": -6.899771213531494, "global_step": 148583, "epoch": 3537} {"train_loss": -6.85705041885376, "global_step": 148584, "epoch": 3537} {"train_loss": -6.957147598266602, "global_step": 148585, "epoch": 3537} {"train_loss": -6.855563163757324, "global_step": 148586, "epoch": 3537} {"train_loss": -6.837138652801514, "global_step": 148587, "epoch": 3537} {"train_loss": -7.02149772644043, "global_step": 148588, "epoch": 3537} {"train_loss": -6.9265522956848145, "global_step": 148589, "epoch": 3537} {"train_loss": -6.904256343841553, "global_step": 148590, "epoch": 3537} {"train_loss": -6.8442182540893555, "global_step": 148591, "epoch": 3537} {"train_loss": -6.848875045776367, "global_step": 148592, "epoch": 3537} {"train_loss": -6.938541412353516, "global_step": 148593, "epoch": 3537} {"train_loss": -6.933704376220703, "global_step": 148594, "epoch": 3537} {"train_loss": -6.883827504657564, "global_step": 148595, "epoch": 3537, "val_loss": 67750.625} {"train_loss": -6.954725742340088, "global_step": 148596, "epoch": 3538} {"train_loss": -6.785519123077393, "global_step": 148597, "epoch": 3538} {"train_loss": -6.805765151977539, "global_step": 148598, "epoch": 3538} {"train_loss": -6.879499435424805, "global_step": 148599, "epoch": 3538} {"train_loss": -6.972927093505859, "global_step": 148600, "epoch": 3538} {"train_loss": -6.831366062164307, "global_step": 148601, "epoch": 3538} {"train_loss": -6.771818161010742, "global_step": 148602, "epoch": 3538} {"train_loss": -6.833044052124023, "global_step": 148603, "epoch": 3538} {"train_loss": -6.888645648956299, "global_step": 148604, "epoch": 3538} {"train_loss": -6.858058929443359, "global_step": 148605, "epoch": 3538} {"train_loss": -6.838558197021484, "global_step": 148606, "epoch": 3538} {"train_loss": -6.882434844970703, "global_step": 148607, "epoch": 3538} {"train_loss": -6.864182949066162, "global_step": 148608, "epoch": 3538} {"train_loss": -6.871955871582031, "global_step": 148609, "epoch": 3538} {"train_loss": -6.842292785644531, "global_step": 148610, "epoch": 3538} {"train_loss": -6.850352764129639, "global_step": 148611, "epoch": 3538} {"train_loss": -6.823877334594727, "global_step": 148612, "epoch": 3538} {"train_loss": -6.755467414855957, "global_step": 148613, "epoch": 3538} {"train_loss": -6.77482795715332, "global_step": 148614, "epoch": 3538} {"train_loss": -6.826645851135254, "global_step": 148615, "epoch": 3538} {"train_loss": -6.69693660736084, "global_step": 148616, "epoch": 3538} {"train_loss": -6.791833877563477, "global_step": 148617, "epoch": 3538} {"train_loss": -6.644928932189941, "global_step": 148618, "epoch": 3538} {"train_loss": -6.877663612365723, "global_step": 148619, "epoch": 3538} {"train_loss": -6.891840934753418, "global_step": 148620, "epoch": 3538} {"train_loss": -6.805473804473877, "global_step": 148621, "epoch": 3538} {"train_loss": -6.858867168426514, "global_step": 148622, "epoch": 3538} {"train_loss": -6.869519233703613, "global_step": 148623, "epoch": 3538} {"train_loss": -6.768543243408203, "global_step": 148624, "epoch": 3538} {"train_loss": -6.954836368560791, "global_step": 148625, "epoch": 3538} {"train_loss": -6.795888423919678, "global_step": 148626, "epoch": 3538} {"train_loss": -6.857804775238037, "global_step": 148627, "epoch": 3538} {"train_loss": -6.885988712310791, "global_step": 148628, "epoch": 3538} {"train_loss": -6.8345184326171875, "global_step": 148629, "epoch": 3538} {"train_loss": -6.814087867736816, "global_step": 148630, "epoch": 3538} {"train_loss": -6.944296836853027, "global_step": 148631, "epoch": 3538} {"train_loss": -6.8842973709106445, "global_step": 148632, "epoch": 3538} {"train_loss": -6.817220687866211, "global_step": 148633, "epoch": 3538} {"train_loss": -6.861911773681641, "global_step": 148634, "epoch": 3538} {"train_loss": -6.909476280212402, "global_step": 148635, "epoch": 3538} {"train_loss": -6.834595680236816, "global_step": 148636, "epoch": 3538} {"train_loss": -6.842740285964239, "global_step": 148637, "epoch": 3538, "val_loss": 67694.1484375} {"train_loss": -6.800779819488525, "global_step": 148638, "epoch": 3539} {"train_loss": -6.833629131317139, "global_step": 148639, "epoch": 3539} {"train_loss": -6.897383689880371, "global_step": 148640, "epoch": 3539} {"train_loss": -6.820036888122559, "global_step": 148641, "epoch": 3539} {"train_loss": -6.820699691772461, "global_step": 148642, "epoch": 3539} {"train_loss": -6.745502471923828, "global_step": 148643, "epoch": 3539} {"train_loss": -6.920072555541992, "global_step": 148644, "epoch": 3539} {"train_loss": -6.836320877075195, "global_step": 148645, "epoch": 3539} {"train_loss": -6.862524509429932, "global_step": 148646, "epoch": 3539} {"train_loss": -6.829415321350098, "global_step": 148647, "epoch": 3539} {"train_loss": -6.703893184661865, "global_step": 148648, "epoch": 3539} {"train_loss": -6.892348766326904, "global_step": 148649, "epoch": 3539} {"train_loss": -6.807609558105469, "global_step": 148650, "epoch": 3539} {"train_loss": -6.711119651794434, "global_step": 148651, "epoch": 3539} {"train_loss": -6.861583709716797, "global_step": 148652, "epoch": 3539} {"train_loss": -6.776430130004883, "global_step": 148653, "epoch": 3539} {"train_loss": -6.5003581047058105, "global_step": 148654, "epoch": 3539} {"train_loss": -6.8006911277771, "global_step": 148655, "epoch": 3539} {"train_loss": -6.749673843383789, "global_step": 148656, "epoch": 3539} {"train_loss": -6.525058746337891, "global_step": 148657, "epoch": 3539} {"train_loss": -6.804359436035156, "global_step": 148658, "epoch": 3539} {"train_loss": -6.660696983337402, "global_step": 148659, "epoch": 3539} {"train_loss": -6.801609039306641, "global_step": 148660, "epoch": 3539} {"train_loss": -6.65835428237915, "global_step": 148661, "epoch": 3539} {"train_loss": -6.787005424499512, "global_step": 148662, "epoch": 3539} {"train_loss": -6.782000541687012, "global_step": 148663, "epoch": 3539} {"train_loss": -6.64259672164917, "global_step": 148664, "epoch": 3539} {"train_loss": -6.704512596130371, "global_step": 148665, "epoch": 3539} {"train_loss": -6.791740417480469, "global_step": 148666, "epoch": 3539} {"train_loss": -6.741972923278809, "global_step": 148667, "epoch": 3539} {"train_loss": -6.648863792419434, "global_step": 148668, "epoch": 3539} {"train_loss": -6.611288070678711, "global_step": 148669, "epoch": 3539} {"train_loss": -6.719686508178711, "global_step": 148670, "epoch": 3539} {"train_loss": -6.740865707397461, "global_step": 148671, "epoch": 3539} {"train_loss": -6.751651763916016, "global_step": 148672, "epoch": 3539} {"train_loss": -6.853455543518066, "global_step": 148673, "epoch": 3539} {"train_loss": -6.688940048217773, "global_step": 148674, "epoch": 3539} {"train_loss": -6.787711143493652, "global_step": 148675, "epoch": 3539} {"train_loss": -6.70510196685791, "global_step": 148676, "epoch": 3539} {"train_loss": -6.907240867614746, "global_step": 148677, "epoch": 3539} {"train_loss": -6.812405109405518, "global_step": 148678, "epoch": 3539} {"train_loss": -6.7638318084535145, "global_step": 148679, "epoch": 3539, "val_loss": 67905.953125} {"train_loss": -6.904819488525391, "global_step": 148680, "epoch": 3540} {"train_loss": -6.775218963623047, "global_step": 148681, "epoch": 3540} {"train_loss": -6.884540557861328, "global_step": 148682, "epoch": 3540} {"train_loss": -6.655204772949219, "global_step": 148683, "epoch": 3540} {"train_loss": -6.867855072021484, "global_step": 148684, "epoch": 3540} {"train_loss": -6.761779308319092, "global_step": 148685, "epoch": 3540} {"train_loss": -6.85618782043457, "global_step": 148686, "epoch": 3540} {"train_loss": -6.782973289489746, "global_step": 148687, "epoch": 3540} {"train_loss": -6.796113014221191, "global_step": 148688, "epoch": 3540} {"train_loss": -6.96917724609375, "global_step": 148689, "epoch": 3540} {"train_loss": -6.8692851066589355, "global_step": 148690, "epoch": 3540} {"train_loss": -6.860137939453125, "global_step": 148691, "epoch": 3540} {"train_loss": -6.923857688903809, "global_step": 148692, "epoch": 3540} {"train_loss": -6.897551536560059, "global_step": 148693, "epoch": 3540} {"train_loss": -6.964643955230713, "global_step": 148694, "epoch": 3540} {"train_loss": -6.904726982116699, "global_step": 148695, "epoch": 3540} {"train_loss": -6.930722713470459, "global_step": 148696, "epoch": 3540} {"train_loss": -6.9060516357421875, "global_step": 148697, "epoch": 3540} {"train_loss": -6.922240257263184, "global_step": 148698, "epoch": 3540} {"train_loss": -6.888394355773926, "global_step": 148699, "epoch": 3540} {"train_loss": -6.8936567306518555, "global_step": 148700, "epoch": 3540} {"train_loss": -6.928399085998535, "global_step": 148701, "epoch": 3540} {"train_loss": -6.810900688171387, "global_step": 148702, "epoch": 3540} {"train_loss": -6.7909111976623535, "global_step": 148703, "epoch": 3540} {"train_loss": -6.8445539474487305, "global_step": 148704, "epoch": 3540} {"train_loss": -6.885869979858398, "global_step": 148705, "epoch": 3540} {"train_loss": -6.864516258239746, "global_step": 148706, "epoch": 3540} {"train_loss": -6.924527168273926, "global_step": 148707, "epoch": 3540} {"train_loss": -6.88590145111084, "global_step": 148708, "epoch": 3540} {"train_loss": -6.924779891967773, "global_step": 148709, "epoch": 3540} {"train_loss": -6.891396522521973, "global_step": 148710, "epoch": 3540} {"train_loss": -6.847935676574707, "global_step": 148711, "epoch": 3540} {"train_loss": -6.921855926513672, "global_step": 148712, "epoch": 3540} {"train_loss": -6.81256103515625, "global_step": 148713, "epoch": 3540} {"train_loss": -6.957368850708008, "global_step": 148714, "epoch": 3540} {"train_loss": -6.918098449707031, "global_step": 148715, "epoch": 3540} {"train_loss": -6.815862655639648, "global_step": 148716, "epoch": 3540} {"train_loss": -6.8076324462890625, "global_step": 148717, "epoch": 3540} {"train_loss": -6.858797073364258, "global_step": 148718, "epoch": 3540} {"train_loss": -6.8714752197265625, "global_step": 148719, "epoch": 3540} {"train_loss": -6.916492462158203, "global_step": 148720, "epoch": 3540} {"train_loss": -6.872040271759033, "global_step": 148721, "epoch": 3540, "val_loss": 67888.8828125} {"train_loss": -6.824977397918701, "global_step": 148722, "epoch": 3541} {"train_loss": -6.9362053871154785, "global_step": 148723, "epoch": 3541} {"train_loss": -6.950664043426514, "global_step": 148724, "epoch": 3541} {"train_loss": -6.920296669006348, "global_step": 148725, "epoch": 3541} {"train_loss": -6.826102256774902, "global_step": 148726, "epoch": 3541} {"train_loss": -6.90658712387085, "global_step": 148727, "epoch": 3541} {"train_loss": -6.938373565673828, "global_step": 148728, "epoch": 3541} {"train_loss": -6.831512928009033, "global_step": 148729, "epoch": 3541} {"train_loss": -6.823554039001465, "global_step": 148730, "epoch": 3541} {"train_loss": -6.8854827880859375, "global_step": 148731, "epoch": 3541} {"train_loss": -6.938328742980957, "global_step": 148732, "epoch": 3541} {"train_loss": -6.813689231872559, "global_step": 148733, "epoch": 3541} {"train_loss": -6.833370208740234, "global_step": 148734, "epoch": 3541} {"train_loss": -6.805661201477051, "global_step": 148735, "epoch": 3541} {"train_loss": -6.8697710037231445, "global_step": 148736, "epoch": 3541} {"train_loss": -6.920893669128418, "global_step": 148737, "epoch": 3541} {"train_loss": -6.875877380371094, "global_step": 148738, "epoch": 3541} {"train_loss": -6.872920989990234, "global_step": 148739, "epoch": 3541} {"train_loss": -6.861765384674072, "global_step": 148740, "epoch": 3541} {"train_loss": -6.815077781677246, "global_step": 148741, "epoch": 3541} {"train_loss": -6.797627925872803, "global_step": 148742, "epoch": 3541} {"train_loss": -6.849279880523682, "global_step": 148743, "epoch": 3541} {"train_loss": -6.7746381759643555, "global_step": 148744, "epoch": 3541} {"train_loss": -6.8333001136779785, "global_step": 148745, "epoch": 3541} {"train_loss": -6.829549789428711, "global_step": 148746, "epoch": 3541} {"train_loss": -6.766239166259766, "global_step": 148747, "epoch": 3541} {"train_loss": -6.790108680725098, "global_step": 148748, "epoch": 3541} {"train_loss": -6.80897331237793, "global_step": 148749, "epoch": 3541} {"train_loss": -6.880681037902832, "global_step": 148750, "epoch": 3541} {"train_loss": -6.984979152679443, "global_step": 148751, "epoch": 3541} {"train_loss": -6.925506591796875, "global_step": 148752, "epoch": 3541} {"train_loss": -6.9154582023620605, "global_step": 148753, "epoch": 3541} {"train_loss": -6.906164169311523, "global_step": 148754, "epoch": 3541} {"train_loss": -6.9664201736450195, "global_step": 148755, "epoch": 3541} {"train_loss": -6.911844730377197, "global_step": 148756, "epoch": 3541} {"train_loss": -6.748048782348633, "global_step": 148757, "epoch": 3541} {"train_loss": -6.7963786125183105, "global_step": 148758, "epoch": 3541} {"train_loss": -6.968136310577393, "global_step": 148759, "epoch": 3541} {"train_loss": -6.9039812088012695, "global_step": 148760, "epoch": 3541} {"train_loss": -6.8581366539001465, "global_step": 148761, "epoch": 3541} {"train_loss": -6.827872276306152, "global_step": 148762, "epoch": 3541} {"train_loss": -6.866576115290324, "global_step": 148763, "epoch": 3541, "val_loss": 67985.5546875} {"train_loss": -6.848996162414551, "global_step": 148764, "epoch": 3542} {"train_loss": -6.813452243804932, "global_step": 148765, "epoch": 3542} {"train_loss": -6.8381781578063965, "global_step": 148766, "epoch": 3542} {"train_loss": -6.963218688964844, "global_step": 148767, "epoch": 3542} {"train_loss": -6.869256973266602, "global_step": 148768, "epoch": 3542} {"train_loss": -6.978204727172852, "global_step": 148769, "epoch": 3542} {"train_loss": -6.984914302825928, "global_step": 148770, "epoch": 3542} {"train_loss": -6.642913818359375, "global_step": 148771, "epoch": 3542} {"train_loss": -6.841678142547607, "global_step": 148772, "epoch": 3542} {"train_loss": -6.854274749755859, "global_step": 148773, "epoch": 3542} {"train_loss": -6.972341060638428, "global_step": 148774, "epoch": 3542} {"train_loss": -6.836258411407471, "global_step": 148775, "epoch": 3542} {"train_loss": -6.682656764984131, "global_step": 148776, "epoch": 3542} {"train_loss": -6.742806434631348, "global_step": 148777, "epoch": 3542} {"train_loss": -6.647341251373291, "global_step": 148778, "epoch": 3542} {"train_loss": -6.732426166534424, "global_step": 148779, "epoch": 3542} {"train_loss": -6.783209800720215, "global_step": 148780, "epoch": 3542} {"train_loss": -6.938776016235352, "global_step": 148781, "epoch": 3542} {"train_loss": -6.7899370193481445, "global_step": 148782, "epoch": 3542} {"train_loss": -6.84993314743042, "global_step": 148783, "epoch": 3542} {"train_loss": -6.869335174560547, "global_step": 148784, "epoch": 3542} {"train_loss": -6.766241550445557, "global_step": 148785, "epoch": 3542} {"train_loss": -6.728313446044922, "global_step": 148786, "epoch": 3542} {"train_loss": -6.594011306762695, "global_step": 148787, "epoch": 3542} {"train_loss": -6.7119550704956055, "global_step": 148788, "epoch": 3542} {"train_loss": -6.749368667602539, "global_step": 148789, "epoch": 3542} {"train_loss": -6.740318298339844, "global_step": 148790, "epoch": 3542} {"train_loss": -6.827868461608887, "global_step": 148791, "epoch": 3542} {"train_loss": -6.675065994262695, "global_step": 148792, "epoch": 3542} {"train_loss": -6.731635570526123, "global_step": 148793, "epoch": 3542} {"train_loss": -6.804722309112549, "global_step": 148794, "epoch": 3542} {"train_loss": -6.821789741516113, "global_step": 148795, "epoch": 3542} {"train_loss": -6.804841041564941, "global_step": 148796, "epoch": 3542} {"train_loss": -6.781651496887207, "global_step": 148797, "epoch": 3542} {"train_loss": -6.860496520996094, "global_step": 148798, "epoch": 3542} {"train_loss": -6.823680877685547, "global_step": 148799, "epoch": 3542} {"train_loss": -6.7521233558654785, "global_step": 148800, "epoch": 3542} {"train_loss": -6.769991397857666, "global_step": 148801, "epoch": 3542} {"train_loss": -6.855871200561523, "global_step": 148802, "epoch": 3542} {"train_loss": -6.835355281829834, "global_step": 148803, "epoch": 3542} {"train_loss": -6.785070896148682, "global_step": 148804, "epoch": 3542} {"train_loss": -6.804815712429228, "global_step": 148805, "epoch": 3542, "val_loss": 67921.5625} {"train_loss": -6.849701881408691, "global_step": 148806, "epoch": 3543} {"train_loss": -6.919466018676758, "global_step": 148807, "epoch": 3543} {"train_loss": -6.933740615844727, "global_step": 148808, "epoch": 3543} {"train_loss": -6.8394880294799805, "global_step": 148809, "epoch": 3543} {"train_loss": -6.86277961730957, "global_step": 148810, "epoch": 3543} {"train_loss": -6.814516067504883, "global_step": 148811, "epoch": 3543} {"train_loss": -6.885323524475098, "global_step": 148812, "epoch": 3543} {"train_loss": -6.808281898498535, "global_step": 148813, "epoch": 3543} {"train_loss": -6.831352233886719, "global_step": 148814, "epoch": 3543} {"train_loss": -6.7744598388671875, "global_step": 148815, "epoch": 3543} {"train_loss": -6.7339348793029785, "global_step": 148816, "epoch": 3543} {"train_loss": -6.878063201904297, "global_step": 148817, "epoch": 3543} {"train_loss": -6.692473888397217, "global_step": 148818, "epoch": 3543} {"train_loss": -6.852816104888916, "global_step": 148819, "epoch": 3543} {"train_loss": -6.794910430908203, "global_step": 148820, "epoch": 3543} {"train_loss": -6.891992568969727, "global_step": 148821, "epoch": 3543} {"train_loss": -6.856306076049805, "global_step": 148822, "epoch": 3543} {"train_loss": -6.874416351318359, "global_step": 148823, "epoch": 3543} {"train_loss": -6.846763610839844, "global_step": 148824, "epoch": 3543} {"train_loss": -6.956914901733398, "global_step": 148825, "epoch": 3543} {"train_loss": -6.823875427246094, "global_step": 148826, "epoch": 3543} {"train_loss": -6.891331195831299, "global_step": 148827, "epoch": 3543} {"train_loss": -6.970710754394531, "global_step": 148828, "epoch": 3543} {"train_loss": -6.899782657623291, "global_step": 148829, "epoch": 3543} {"train_loss": -6.907918930053711, "global_step": 148830, "epoch": 3543} {"train_loss": -6.738584518432617, "global_step": 148831, "epoch": 3543} {"train_loss": -6.874605178833008, "global_step": 148832, "epoch": 3543} {"train_loss": -6.782854080200195, "global_step": 148833, "epoch": 3543} {"train_loss": -6.870792388916016, "global_step": 148834, "epoch": 3543} {"train_loss": -6.742245197296143, "global_step": 148835, "epoch": 3543} {"train_loss": -6.83553409576416, "global_step": 148836, "epoch": 3543} {"train_loss": -6.898003101348877, "global_step": 148837, "epoch": 3543} {"train_loss": -6.851462364196777, "global_step": 148838, "epoch": 3543} {"train_loss": -6.830537796020508, "global_step": 148839, "epoch": 3543} {"train_loss": -6.874480247497559, "global_step": 148840, "epoch": 3543} {"train_loss": -6.970697402954102, "global_step": 148841, "epoch": 3543} {"train_loss": -6.821674346923828, "global_step": 148842, "epoch": 3543} {"train_loss": -6.892378330230713, "global_step": 148843, "epoch": 3543} {"train_loss": -6.958219528198242, "global_step": 148844, "epoch": 3543} {"train_loss": -6.8564534187316895, "global_step": 148845, "epoch": 3543} {"train_loss": -6.785446643829346, "global_step": 148846, "epoch": 3543} {"train_loss": -6.853408518291655, "global_step": 148847, "epoch": 3543, "val_loss": 67935.3984375} {"train_loss": -6.849123477935791, "global_step": 148848, "epoch": 3544} {"train_loss": -6.888822555541992, "global_step": 148849, "epoch": 3544} {"train_loss": -6.715329647064209, "global_step": 148850, "epoch": 3544} {"train_loss": -6.844442367553711, "global_step": 148851, "epoch": 3544} {"train_loss": -6.9780120849609375, "global_step": 148852, "epoch": 3544} {"train_loss": -6.89858865737915, "global_step": 148853, "epoch": 3544} {"train_loss": -6.838762283325195, "global_step": 148854, "epoch": 3544} {"train_loss": -6.900301933288574, "global_step": 148855, "epoch": 3544} {"train_loss": -6.849921226501465, "global_step": 148856, "epoch": 3544} {"train_loss": -6.862120628356934, "global_step": 148857, "epoch": 3544} {"train_loss": -6.843642234802246, "global_step": 148858, "epoch": 3544} {"train_loss": -6.808544158935547, "global_step": 148859, "epoch": 3544} {"train_loss": -6.804028034210205, "global_step": 148860, "epoch": 3544} {"train_loss": -6.833739280700684, "global_step": 148861, "epoch": 3544} {"train_loss": -6.805997848510742, "global_step": 148862, "epoch": 3544} {"train_loss": -6.866097450256348, "global_step": 148863, "epoch": 3544} {"train_loss": -6.804431438446045, "global_step": 148864, "epoch": 3544} {"train_loss": -6.922077178955078, "global_step": 148865, "epoch": 3544} {"train_loss": -6.814082145690918, "global_step": 148866, "epoch": 3544} {"train_loss": -6.860936164855957, "global_step": 148867, "epoch": 3544} {"train_loss": -6.763097763061523, "global_step": 148868, "epoch": 3544} {"train_loss": -6.76201057434082, "global_step": 148869, "epoch": 3544} {"train_loss": -6.789978504180908, "global_step": 148870, "epoch": 3544} {"train_loss": -6.801695823669434, "global_step": 148871, "epoch": 3544} {"train_loss": -6.7516069412231445, "global_step": 148872, "epoch": 3544} {"train_loss": -6.778688430786133, "global_step": 148873, "epoch": 3544} {"train_loss": -6.651954650878906, "global_step": 148874, "epoch": 3544} {"train_loss": -6.735997200012207, "global_step": 148875, "epoch": 3544} {"train_loss": -6.721083641052246, "global_step": 148876, "epoch": 3544} {"train_loss": -6.686850547790527, "global_step": 148877, "epoch": 3544} {"train_loss": -6.722789764404297, "global_step": 148878, "epoch": 3544} {"train_loss": -6.731603622436523, "global_step": 148879, "epoch": 3544} {"train_loss": -6.714560508728027, "global_step": 148880, "epoch": 3544} {"train_loss": -6.730956077575684, "global_step": 148881, "epoch": 3544} {"train_loss": -6.723230361938477, "global_step": 148882, "epoch": 3544} {"train_loss": -6.8373212814331055, "global_step": 148883, "epoch": 3544} {"train_loss": -6.655844688415527, "global_step": 148884, "epoch": 3544} {"train_loss": -6.746687889099121, "global_step": 148885, "epoch": 3544} {"train_loss": -6.721631050109863, "global_step": 148886, "epoch": 3544} {"train_loss": -6.695944309234619, "global_step": 148887, "epoch": 3544} {"train_loss": -6.737844467163086, "global_step": 148888, "epoch": 3544} {"train_loss": -6.789340257644653, "global_step": 148889, "epoch": 3544, "val_loss": 67962.28125} {"train_loss": -6.820559501647949, "global_step": 148890, "epoch": 3545} {"train_loss": -6.86965274810791, "global_step": 148891, "epoch": 3545} {"train_loss": -6.7542219161987305, "global_step": 148892, "epoch": 3545} {"train_loss": -6.804685592651367, "global_step": 148893, "epoch": 3545} {"train_loss": -6.677299499511719, "global_step": 148894, "epoch": 3545} {"train_loss": -6.70877742767334, "global_step": 148895, "epoch": 3545} {"train_loss": -6.718026161193848, "global_step": 148896, "epoch": 3545} {"train_loss": -6.771947860717773, "global_step": 148897, "epoch": 3545} {"train_loss": -6.7794342041015625, "global_step": 148898, "epoch": 3545} {"train_loss": -6.774666786193848, "global_step": 148899, "epoch": 3545} {"train_loss": -6.791130065917969, "global_step": 148900, "epoch": 3545} {"train_loss": -6.925915718078613, "global_step": 148901, "epoch": 3545} {"train_loss": -6.821187973022461, "global_step": 148902, "epoch": 3545} {"train_loss": -6.843629360198975, "global_step": 148903, "epoch": 3545} {"train_loss": -6.913431167602539, "global_step": 148904, "epoch": 3545} {"train_loss": -6.820932388305664, "global_step": 148905, "epoch": 3545} {"train_loss": -6.887811183929443, "global_step": 148906, "epoch": 3545} {"train_loss": -6.849839687347412, "global_step": 148907, "epoch": 3545} {"train_loss": -6.882635593414307, "global_step": 148908, "epoch": 3545} {"train_loss": -6.839598655700684, "global_step": 148909, "epoch": 3545} {"train_loss": -6.703579902648926, "global_step": 148910, "epoch": 3545} {"train_loss": -6.766908645629883, "global_step": 148911, "epoch": 3545} {"train_loss": -6.817108154296875, "global_step": 148912, "epoch": 3545} {"train_loss": -6.8690900802612305, "global_step": 148913, "epoch": 3545} {"train_loss": -6.78659725189209, "global_step": 148914, "epoch": 3545} {"train_loss": -6.867457389831543, "global_step": 148915, "epoch": 3545} {"train_loss": -6.7975921630859375, "global_step": 148916, "epoch": 3545} {"train_loss": -6.817768096923828, "global_step": 148917, "epoch": 3545} {"train_loss": -6.92098331451416, "global_step": 148918, "epoch": 3545} {"train_loss": -6.739189147949219, "global_step": 148919, "epoch": 3545} {"train_loss": -6.722978591918945, "global_step": 148920, "epoch": 3545} {"train_loss": -6.82377815246582, "global_step": 148921, "epoch": 3545} {"train_loss": -6.7822651863098145, "global_step": 148922, "epoch": 3545} {"train_loss": -6.801549911499023, "global_step": 148923, "epoch": 3545} {"train_loss": -6.717874050140381, "global_step": 148924, "epoch": 3545} {"train_loss": -6.840402126312256, "global_step": 148925, "epoch": 3545} {"train_loss": -6.905573844909668, "global_step": 148926, "epoch": 3545} {"train_loss": -6.762502670288086, "global_step": 148927, "epoch": 3545} {"train_loss": -6.727264881134033, "global_step": 148928, "epoch": 3545} {"train_loss": -6.780711650848389, "global_step": 148929, "epoch": 3545} {"train_loss": -6.752885818481445, "global_step": 148930, "epoch": 3545} {"train_loss": -6.805444422222319, "global_step": 148931, "epoch": 3545, "val_loss": 67961.2734375} {"train_loss": -6.673995018005371, "global_step": 148932, "epoch": 3546} {"train_loss": -6.8033552169799805, "global_step": 148933, "epoch": 3546} {"train_loss": -6.86000394821167, "global_step": 148934, "epoch": 3546} {"train_loss": -6.746549129486084, "global_step": 148935, "epoch": 3546} {"train_loss": -6.692667484283447, "global_step": 148936, "epoch": 3546} {"train_loss": -6.920501708984375, "global_step": 148937, "epoch": 3546} {"train_loss": -6.767271041870117, "global_step": 148938, "epoch": 3546} {"train_loss": -6.8563995361328125, "global_step": 148939, "epoch": 3546} {"train_loss": -6.70259428024292, "global_step": 148940, "epoch": 3546} {"train_loss": -6.890928745269775, "global_step": 148941, "epoch": 3546} {"train_loss": -6.823432922363281, "global_step": 148942, "epoch": 3546} {"train_loss": -6.802068710327148, "global_step": 148943, "epoch": 3546} {"train_loss": -6.7846479415893555, "global_step": 148944, "epoch": 3546} {"train_loss": -6.952098369598389, "global_step": 148945, "epoch": 3546} {"train_loss": -6.923758506774902, "global_step": 148946, "epoch": 3546} {"train_loss": -6.903376579284668, "global_step": 148947, "epoch": 3546} {"train_loss": -6.825618743896484, "global_step": 148948, "epoch": 3546} {"train_loss": -6.801413536071777, "global_step": 148949, "epoch": 3546} {"train_loss": -6.821987152099609, "global_step": 148950, "epoch": 3546} {"train_loss": -6.830081939697266, "global_step": 148951, "epoch": 3546} {"train_loss": -6.914615631103516, "global_step": 148952, "epoch": 3546} {"train_loss": -6.821979522705078, "global_step": 148953, "epoch": 3546} {"train_loss": -6.77027702331543, "global_step": 148954, "epoch": 3546} {"train_loss": -6.867773056030273, "global_step": 148955, "epoch": 3546} {"train_loss": -6.916577339172363, "global_step": 148956, "epoch": 3546} {"train_loss": -6.8031158447265625, "global_step": 148957, "epoch": 3546} {"train_loss": -6.92662239074707, "global_step": 148958, "epoch": 3546} {"train_loss": -6.8541154861450195, "global_step": 148959, "epoch": 3546} {"train_loss": -6.887313365936279, "global_step": 148960, "epoch": 3546} {"train_loss": -6.804290771484375, "global_step": 148961, "epoch": 3546} {"train_loss": -6.7437286376953125, "global_step": 148962, "epoch": 3546} {"train_loss": -6.775856018066406, "global_step": 148963, "epoch": 3546} {"train_loss": -6.930808067321777, "global_step": 148964, "epoch": 3546} {"train_loss": -6.814255237579346, "global_step": 148965, "epoch": 3546} {"train_loss": -6.9205522537231445, "global_step": 148966, "epoch": 3546} {"train_loss": -6.8752241134643555, "global_step": 148967, "epoch": 3546} {"train_loss": -6.875214099884033, "global_step": 148968, "epoch": 3546} {"train_loss": -6.864901065826416, "global_step": 148969, "epoch": 3546} {"train_loss": -6.795523643493652, "global_step": 148970, "epoch": 3546} {"train_loss": -6.891782283782959, "global_step": 148971, "epoch": 3546} {"train_loss": -6.958736896514893, "global_step": 148972, "epoch": 3546} {"train_loss": -6.840391976492746, "global_step": 148973, "epoch": 3546, "val_loss": 67931.65625} {"train_loss": -6.90338134765625, "global_step": 148974, "epoch": 3547} {"train_loss": -6.865191459655762, "global_step": 148975, "epoch": 3547} {"train_loss": -6.800359725952148, "global_step": 148976, "epoch": 3547} {"train_loss": -6.897555351257324, "global_step": 148977, "epoch": 3547} {"train_loss": -6.948111534118652, "global_step": 148978, "epoch": 3547} {"train_loss": -6.9068803787231445, "global_step": 148979, "epoch": 3547} {"train_loss": -6.989141464233398, "global_step": 148980, "epoch": 3547} {"train_loss": -6.956521034240723, "global_step": 148981, "epoch": 3547} {"train_loss": -6.936362266540527, "global_step": 148982, "epoch": 3547} {"train_loss": -6.854719638824463, "global_step": 148983, "epoch": 3547} {"train_loss": -6.860803604125977, "global_step": 148984, "epoch": 3547} {"train_loss": -6.934772968292236, "global_step": 148985, "epoch": 3547} {"train_loss": -6.899399280548096, "global_step": 148986, "epoch": 3547} {"train_loss": -6.886448860168457, "global_step": 148987, "epoch": 3547} {"train_loss": -6.891895294189453, "global_step": 148988, "epoch": 3547} {"train_loss": -6.811067581176758, "global_step": 148989, "epoch": 3547} {"train_loss": -6.798729419708252, "global_step": 148990, "epoch": 3547} {"train_loss": -6.9325971603393555, "global_step": 148991, "epoch": 3547} {"train_loss": -6.86462926864624, "global_step": 148992, "epoch": 3547} {"train_loss": -6.972543716430664, "global_step": 148993, "epoch": 3547} {"train_loss": -6.806166172027588, "global_step": 148994, "epoch": 3547} {"train_loss": -6.932093620300293, "global_step": 148995, "epoch": 3547} {"train_loss": -6.860499382019043, "global_step": 148996, "epoch": 3547} {"train_loss": -6.833035469055176, "global_step": 148997, "epoch": 3547} {"train_loss": -6.845392227172852, "global_step": 148998, "epoch": 3547} {"train_loss": -6.938442230224609, "global_step": 148999, "epoch": 3547} {"train_loss": -7.04393196105957, "global_step": 149000, "epoch": 3547} {"train_loss": -6.847162246704102, "global_step": 149001, "epoch": 3547} {"train_loss": -6.916769027709961, "global_step": 149002, "epoch": 3547} {"train_loss": -6.927792549133301, "global_step": 149003, "epoch": 3547} {"train_loss": -6.889218330383301, "global_step": 149004, "epoch": 3547} {"train_loss": -6.813133239746094, "global_step": 149005, "epoch": 3547} {"train_loss": -6.747452259063721, "global_step": 149006, "epoch": 3547} {"train_loss": -6.99160099029541, "global_step": 149007, "epoch": 3547} {"train_loss": -6.88088846206665, "global_step": 149008, "epoch": 3547} {"train_loss": -6.838438510894775, "global_step": 149009, "epoch": 3547} {"train_loss": -6.890284538269043, "global_step": 149010, "epoch": 3547} {"train_loss": -6.861243724822998, "global_step": 149011, "epoch": 3547} {"train_loss": -6.855267524719238, "global_step": 149012, "epoch": 3547} {"train_loss": -6.953263282775879, "global_step": 149013, "epoch": 3547} {"train_loss": -7.003693103790283, "global_step": 149014, "epoch": 3547} {"train_loss": -6.8892334415799095, "global_step": 149015, "epoch": 3547, "val_loss": 68004.4609375} {"train_loss": -6.914125919342041, "global_step": 149016, "epoch": 3548} {"train_loss": -6.922855377197266, "global_step": 149017, "epoch": 3548} {"train_loss": -6.9095778465271, "global_step": 149018, "epoch": 3548} {"train_loss": -6.913165092468262, "global_step": 149019, "epoch": 3548} {"train_loss": -6.903263092041016, "global_step": 149020, "epoch": 3548} {"train_loss": -7.000636100769043, "global_step": 149021, "epoch": 3548} {"train_loss": -6.966715335845947, "global_step": 149022, "epoch": 3548} {"train_loss": -7.061795234680176, "global_step": 149023, "epoch": 3548} {"train_loss": -6.826478958129883, "global_step": 149024, "epoch": 3548} {"train_loss": -6.853140830993652, "global_step": 149025, "epoch": 3548} {"train_loss": -6.905623435974121, "global_step": 149026, "epoch": 3548} {"train_loss": -6.766040802001953, "global_step": 149027, "epoch": 3548} {"train_loss": -6.785341739654541, "global_step": 149028, "epoch": 3548} {"train_loss": -6.791656494140625, "global_step": 149029, "epoch": 3548} {"train_loss": -6.867151737213135, "global_step": 149030, "epoch": 3548} {"train_loss": -6.829473972320557, "global_step": 149031, "epoch": 3548} {"train_loss": -6.712215900421143, "global_step": 149032, "epoch": 3548} {"train_loss": -6.856940746307373, "global_step": 149033, "epoch": 3548} {"train_loss": -6.906612396240234, "global_step": 149034, "epoch": 3548} {"train_loss": -6.884930610656738, "global_step": 149035, "epoch": 3548} {"train_loss": -6.87679386138916, "global_step": 149036, "epoch": 3548} {"train_loss": -6.828400611877441, "global_step": 149037, "epoch": 3548} {"train_loss": -6.914463043212891, "global_step": 149038, "epoch": 3548} {"train_loss": -6.817844390869141, "global_step": 149039, "epoch": 3548} {"train_loss": -6.838561058044434, "global_step": 149040, "epoch": 3548} {"train_loss": -6.843264102935791, "global_step": 149041, "epoch": 3548} {"train_loss": -6.788735389709473, "global_step": 149042, "epoch": 3548} {"train_loss": -6.967998504638672, "global_step": 149043, "epoch": 3548} {"train_loss": -6.830739974975586, "global_step": 149044, "epoch": 3548} {"train_loss": -6.716634750366211, "global_step": 149045, "epoch": 3548} {"train_loss": -6.895374298095703, "global_step": 149046, "epoch": 3548} {"train_loss": -6.906593322753906, "global_step": 149047, "epoch": 3548} {"train_loss": -6.960009574890137, "global_step": 149048, "epoch": 3548} {"train_loss": -6.905595779418945, "global_step": 149049, "epoch": 3548} {"train_loss": -6.929264545440674, "global_step": 149050, "epoch": 3548} {"train_loss": -6.982943534851074, "global_step": 149051, "epoch": 3548} {"train_loss": -6.903163909912109, "global_step": 149052, "epoch": 3548} {"train_loss": -6.876877307891846, "global_step": 149053, "epoch": 3548} {"train_loss": -6.882916450500488, "global_step": 149054, "epoch": 3548} {"train_loss": -6.895334243774414, "global_step": 149055, "epoch": 3548} {"train_loss": -6.884153842926025, "global_step": 149056, "epoch": 3548} {"train_loss": -6.879061505908058, "global_step": 149057, "epoch": 3548, "val_loss": 67868.3203125} {"train_loss": -6.952260494232178, "global_step": 149058, "epoch": 3549} {"train_loss": -6.896105766296387, "global_step": 149059, "epoch": 3549} {"train_loss": -6.81846809387207, "global_step": 149060, "epoch": 3549} {"train_loss": -6.898098945617676, "global_step": 149061, "epoch": 3549} {"train_loss": -6.757309913635254, "global_step": 149062, "epoch": 3549} {"train_loss": -6.847530841827393, "global_step": 149063, "epoch": 3549} {"train_loss": -6.8749566078186035, "global_step": 149064, "epoch": 3549} {"train_loss": -6.940363883972168, "global_step": 149065, "epoch": 3549} {"train_loss": -6.840879440307617, "global_step": 149066, "epoch": 3549} {"train_loss": -6.774499893188477, "global_step": 149067, "epoch": 3549} {"train_loss": -6.777257442474365, "global_step": 149068, "epoch": 3549} {"train_loss": -6.790702819824219, "global_step": 149069, "epoch": 3549} {"train_loss": -6.848130702972412, "global_step": 149070, "epoch": 3549} {"train_loss": -6.8500823974609375, "global_step": 149071, "epoch": 3549} {"train_loss": -6.696083068847656, "global_step": 149072, "epoch": 3549} {"train_loss": -6.856997966766357, "global_step": 149073, "epoch": 3549} {"train_loss": -6.86263370513916, "global_step": 149074, "epoch": 3549} {"train_loss": -6.789020538330078, "global_step": 149075, "epoch": 3549} {"train_loss": -6.711154937744141, "global_step": 149076, "epoch": 3549} {"train_loss": -6.734703063964844, "global_step": 149077, "epoch": 3549} {"train_loss": -6.851950168609619, "global_step": 149078, "epoch": 3549} {"train_loss": -6.783812046051025, "global_step": 149079, "epoch": 3549} {"train_loss": -6.770448207855225, "global_step": 149080, "epoch": 3549} {"train_loss": -6.6987080574035645, "global_step": 149081, "epoch": 3549} {"train_loss": -6.806013107299805, "global_step": 149082, "epoch": 3549} {"train_loss": -6.656561374664307, "global_step": 149083, "epoch": 3549} {"train_loss": -6.798643112182617, "global_step": 149084, "epoch": 3549} {"train_loss": -6.7428741455078125, "global_step": 149085, "epoch": 3549} {"train_loss": -6.689754486083984, "global_step": 149086, "epoch": 3549} {"train_loss": -6.863298416137695, "global_step": 149087, "epoch": 3549} {"train_loss": -6.813600063323975, "global_step": 149088, "epoch": 3549} {"train_loss": -6.80359411239624, "global_step": 149089, "epoch": 3549} {"train_loss": -6.831899642944336, "global_step": 149090, "epoch": 3549} {"train_loss": -6.8298773765563965, "global_step": 149091, "epoch": 3549} {"train_loss": -6.843287467956543, "global_step": 149092, "epoch": 3549} {"train_loss": -6.755437850952148, "global_step": 149093, "epoch": 3549} {"train_loss": -6.9180707931518555, "global_step": 149094, "epoch": 3549} {"train_loss": -6.933114051818848, "global_step": 149095, "epoch": 3549} {"train_loss": -6.833246231079102, "global_step": 149096, "epoch": 3549} {"train_loss": -6.839313507080078, "global_step": 149097, "epoch": 3549} {"train_loss": -6.792001247406006, "global_step": 149098, "epoch": 3549} {"train_loss": -6.814665658133371, "global_step": 149099, "epoch": 3549, "val_loss": 67945.34375} {"train_loss": -6.855273246765137, "global_step": 149100, "epoch": 3550} {"train_loss": -6.844888210296631, "global_step": 149101, "epoch": 3550} {"train_loss": -6.926875591278076, "global_step": 149102, "epoch": 3550} {"train_loss": -6.599003791809082, "global_step": 149103, "epoch": 3550} {"train_loss": -6.702447414398193, "global_step": 149104, "epoch": 3550} {"train_loss": -6.837416648864746, "global_step": 149105, "epoch": 3550} {"train_loss": -6.792853832244873, "global_step": 149106, "epoch": 3550} {"train_loss": -6.875323295593262, "global_step": 149107, "epoch": 3550} {"train_loss": -6.841166019439697, "global_step": 149108, "epoch": 3550} {"train_loss": -6.960215091705322, "global_step": 149109, "epoch": 3550} {"train_loss": -6.816871643066406, "global_step": 149110, "epoch": 3550} {"train_loss": -6.895539283752441, "global_step": 149111, "epoch": 3550} {"train_loss": -6.838155269622803, "global_step": 149112, "epoch": 3550} {"train_loss": -6.846303939819336, "global_step": 149113, "epoch": 3550} {"train_loss": -6.833820343017578, "global_step": 149114, "epoch": 3550} {"train_loss": -6.847777366638184, "global_step": 149115, "epoch": 3550} {"train_loss": -6.867513656616211, "global_step": 149116, "epoch": 3550} {"train_loss": -6.857377052307129, "global_step": 149117, "epoch": 3550} {"train_loss": -6.80023717880249, "global_step": 149118, "epoch": 3550} {"train_loss": -6.705451965332031, "global_step": 149119, "epoch": 3550} {"train_loss": -6.8734588623046875, "global_step": 149120, "epoch": 3550} {"train_loss": -6.862828254699707, "global_step": 149121, "epoch": 3550} {"train_loss": -6.7179765701293945, "global_step": 149122, "epoch": 3550} {"train_loss": -6.851273536682129, "global_step": 149123, "epoch": 3550} {"train_loss": -6.805280685424805, "global_step": 149124, "epoch": 3550} {"train_loss": -6.8433122634887695, "global_step": 149125, "epoch": 3550} {"train_loss": -6.882018566131592, "global_step": 149126, "epoch": 3550} {"train_loss": -6.8501973152160645, "global_step": 149127, "epoch": 3550} {"train_loss": -6.807911396026611, "global_step": 149128, "epoch": 3550} {"train_loss": -6.7224040031433105, "global_step": 149129, "epoch": 3550} {"train_loss": -6.800045013427734, "global_step": 149130, "epoch": 3550} {"train_loss": -6.886375427246094, "global_step": 149131, "epoch": 3550} {"train_loss": -6.723029136657715, "global_step": 149132, "epoch": 3550} {"train_loss": -6.915694236755371, "global_step": 149133, "epoch": 3550} {"train_loss": -6.774990081787109, "global_step": 149134, "epoch": 3550} {"train_loss": -6.8059210777282715, "global_step": 149135, "epoch": 3550} {"train_loss": -6.85378360748291, "global_step": 149136, "epoch": 3550} {"train_loss": -6.8495259284973145, "global_step": 149137, "epoch": 3550} {"train_loss": -6.8870463371276855, "global_step": 149138, "epoch": 3550} {"train_loss": -6.684755325317383, "global_step": 149139, "epoch": 3550} {"train_loss": -6.709748268127441, "global_step": 149140, "epoch": 3550} {"train_loss": -6.819283587591989, "global_step": 149141, "epoch": 3550, "train/sim_max_reward_0": 0.38737783053283215, "train/sim_max_reward_1": 0.7224887303454595, "train/sim_max_reward_2": 0.5082756578166987, "train/sim_max_reward_3": 0.4423253788580129, "train/sim_max_reward_4": 0.9516459478940332, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.4395374766149034, "test/sim_max_reward_4300001": 0.5783054365780389, "test/sim_max_reward_4300002": 0.9583176948188018, "test/sim_max_reward_4300003": 0.9777318565806624, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.41024330423580446, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.2916702947850431, "test/sim_max_reward_4300008": 0.8896123617516202, "test/sim_max_reward_4300009": 0.8518987031924753, "test/sim_max_reward_4300010": 0.3974670129756916, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.9960768868765699, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.43115761678796455, "test/sim_max_reward_4300018": 0.4211279394562431, "test/sim_max_reward_4300019": 0.1857398015724349, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8846548967385977, "test/sim_max_reward_4300022": 0.8425189805810163, "test/sim_max_reward_4300023": 0.9407604812746831, "test/sim_max_reward_4300024": 0.3587329357377938, "test/sim_max_reward_4300025": 0.8839538153588243, "test/sim_max_reward_4300026": 0.0902086059551989, "test/sim_max_reward_4300027": 0.5930616886999186, "test/sim_max_reward_4300028": 1.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.35199971906205907, "test/sim_max_reward_4300031": 0.2787555181925213, "test/sim_max_reward_4300032": 0.8655460696937433, "test/sim_max_reward_4300033": 0.6975021422576535, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.1292175803135594, "test/sim_max_reward_4300036": 0.258523614768265, "test/sim_max_reward_4300037": 0.8701449378778152, "test/sim_max_reward_4300038": 0.39880679018862053, "test/sim_max_reward_4300039": 0.5574418057468082, "test/sim_max_reward_4300040": 0.8493409088641812, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.42858450420959515, "test/sim_max_reward_4300043": 0.12438638117217919, "test/sim_max_reward_4300044": 0.8628790158115318, "test/sim_max_reward_4300045": 0.8813896627614258, "test/sim_max_reward_4300046": 0.4478183695325426, "test/sim_max_reward_4300047": 0.1550593437941251, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.26727709508114494, "train/mean_score": 0.5341830508015373, "test/mean_score": 0.5172657070941868, "val_loss": 67712.0390625} {"train_loss": -6.681891918182373, "global_step": 149142, "epoch": 3551} {"train_loss": -6.766949653625488, "global_step": 149143, "epoch": 3551} {"train_loss": -6.654873847961426, "global_step": 149144, "epoch": 3551} {"train_loss": -6.642673015594482, "global_step": 149145, "epoch": 3551} {"train_loss": -6.600773811340332, "global_step": 149146, "epoch": 3551} {"train_loss": -6.578761577606201, "global_step": 149147, "epoch": 3551} {"train_loss": -6.685764312744141, "global_step": 149148, "epoch": 3551} {"train_loss": -6.635315418243408, "global_step": 149149, "epoch": 3551} {"train_loss": -6.666515350341797, "global_step": 149150, "epoch": 3551} {"train_loss": -6.665801048278809, "global_step": 149151, "epoch": 3551} {"train_loss": -6.8034987449646, "global_step": 149152, "epoch": 3551} {"train_loss": -6.7845458984375, "global_step": 149153, "epoch": 3551} {"train_loss": -6.589120388031006, "global_step": 149154, "epoch": 3551} {"train_loss": -6.914644241333008, "global_step": 149155, "epoch": 3551} {"train_loss": -6.704207897186279, "global_step": 149156, "epoch": 3551} {"train_loss": -6.746788501739502, "global_step": 149157, "epoch": 3551} {"train_loss": -6.7053632736206055, "global_step": 149158, "epoch": 3551} {"train_loss": -6.70412540435791, "global_step": 149159, "epoch": 3551} {"train_loss": -6.7224202156066895, "global_step": 149160, "epoch": 3551} {"train_loss": -6.833354473114014, "global_step": 149161, "epoch": 3551} {"train_loss": -6.785571098327637, "global_step": 149162, "epoch": 3551} {"train_loss": -6.829408168792725, "global_step": 149163, "epoch": 3551} {"train_loss": -6.774720191955566, "global_step": 149164, "epoch": 3551} {"train_loss": -6.7573137283325195, "global_step": 149165, "epoch": 3551} {"train_loss": -6.772967338562012, "global_step": 149166, "epoch": 3551} {"train_loss": -6.841300010681152, "global_step": 149167, "epoch": 3551} {"train_loss": -6.818252086639404, "global_step": 149168, "epoch": 3551} {"train_loss": -6.803062438964844, "global_step": 149169, "epoch": 3551} {"train_loss": -6.7564239501953125, "global_step": 149170, "epoch": 3551} {"train_loss": -6.871384620666504, "global_step": 149171, "epoch": 3551} {"train_loss": -6.774333477020264, "global_step": 149172, "epoch": 3551} {"train_loss": -6.899121284484863, "global_step": 149173, "epoch": 3551} {"train_loss": -6.826504707336426, "global_step": 149174, "epoch": 3551} {"train_loss": -6.827089309692383, "global_step": 149175, "epoch": 3551} {"train_loss": -6.822147846221924, "global_step": 149176, "epoch": 3551} {"train_loss": -6.755005359649658, "global_step": 149177, "epoch": 3551} {"train_loss": -6.909236907958984, "global_step": 149178, "epoch": 3551} {"train_loss": -6.846889972686768, "global_step": 149179, "epoch": 3551} {"train_loss": -6.89036750793457, "global_step": 149180, "epoch": 3551} {"train_loss": -6.755072593688965, "global_step": 149181, "epoch": 3551} {"train_loss": -6.806939601898193, "global_step": 149182, "epoch": 3551} {"train_loss": -6.764592170715332, "global_step": 149183, "epoch": 3551, "val_loss": 68024.1640625} {"train_loss": -6.732481002807617, "global_step": 149184, "epoch": 3552} {"train_loss": -6.816583156585693, "global_step": 149185, "epoch": 3552} {"train_loss": -6.828507423400879, "global_step": 149186, "epoch": 3552} {"train_loss": -6.6910200119018555, "global_step": 149187, "epoch": 3552} {"train_loss": -6.775274753570557, "global_step": 149188, "epoch": 3552} {"train_loss": -6.6750898361206055, "global_step": 149189, "epoch": 3552} {"train_loss": -6.853734970092773, "global_step": 149190, "epoch": 3552} {"train_loss": -6.671034812927246, "global_step": 149191, "epoch": 3552} {"train_loss": -6.722975730895996, "global_step": 149192, "epoch": 3552} {"train_loss": -6.699673652648926, "global_step": 149193, "epoch": 3552} {"train_loss": -6.552623748779297, "global_step": 149194, "epoch": 3552} {"train_loss": -6.766205787658691, "global_step": 149195, "epoch": 3552} {"train_loss": -6.654160499572754, "global_step": 149196, "epoch": 3552} {"train_loss": -6.867207050323486, "global_step": 149197, "epoch": 3552} {"train_loss": -6.730172157287598, "global_step": 149198, "epoch": 3552} {"train_loss": -6.7145514488220215, "global_step": 149199, "epoch": 3552} {"train_loss": -6.759490966796875, "global_step": 149200, "epoch": 3552} {"train_loss": -6.7681684494018555, "global_step": 149201, "epoch": 3552} {"train_loss": -6.659674644470215, "global_step": 149202, "epoch": 3552} {"train_loss": -6.790347576141357, "global_step": 149203, "epoch": 3552} {"train_loss": -6.757637977600098, "global_step": 149204, "epoch": 3552} {"train_loss": -6.774656295776367, "global_step": 149205, "epoch": 3552} {"train_loss": -6.812370777130127, "global_step": 149206, "epoch": 3552} {"train_loss": -6.6199493408203125, "global_step": 149207, "epoch": 3552} {"train_loss": -6.758174896240234, "global_step": 149208, "epoch": 3552} {"train_loss": -6.733527660369873, "global_step": 149209, "epoch": 3552} {"train_loss": -6.779167175292969, "global_step": 149210, "epoch": 3552} {"train_loss": -6.725543975830078, "global_step": 149211, "epoch": 3552} {"train_loss": -6.8367204666137695, "global_step": 149212, "epoch": 3552} {"train_loss": -6.788167953491211, "global_step": 149213, "epoch": 3552} {"train_loss": -6.724910736083984, "global_step": 149214, "epoch": 3552} {"train_loss": -6.837973594665527, "global_step": 149215, "epoch": 3552} {"train_loss": -6.833894729614258, "global_step": 149216, "epoch": 3552} {"train_loss": -6.7423577308654785, "global_step": 149217, "epoch": 3552} {"train_loss": -6.737189292907715, "global_step": 149218, "epoch": 3552} {"train_loss": -6.772467613220215, "global_step": 149219, "epoch": 3552} {"train_loss": -6.854770183563232, "global_step": 149220, "epoch": 3552} {"train_loss": -6.934940814971924, "global_step": 149221, "epoch": 3552} {"train_loss": -6.743377208709717, "global_step": 149222, "epoch": 3552} {"train_loss": -6.819155216217041, "global_step": 149223, "epoch": 3552} {"train_loss": -6.783613681793213, "global_step": 149224, "epoch": 3552} {"train_loss": -6.760822659447079, "global_step": 149225, "epoch": 3552, "val_loss": 68107.1171875} {"train_loss": -6.764263153076172, "global_step": 149226, "epoch": 3553} {"train_loss": -6.828732490539551, "global_step": 149227, "epoch": 3553} {"train_loss": -6.819866180419922, "global_step": 149228, "epoch": 3553} {"train_loss": -6.86422061920166, "global_step": 149229, "epoch": 3553} {"train_loss": -6.939449310302734, "global_step": 149230, "epoch": 3553} {"train_loss": -6.833195686340332, "global_step": 149231, "epoch": 3553} {"train_loss": -6.8986921310424805, "global_step": 149232, "epoch": 3553} {"train_loss": -6.742761611938477, "global_step": 149233, "epoch": 3553} {"train_loss": -6.859724998474121, "global_step": 149234, "epoch": 3553} {"train_loss": -6.855062961578369, "global_step": 149235, "epoch": 3553} {"train_loss": -6.781546592712402, "global_step": 149236, "epoch": 3553} {"train_loss": -6.889754295349121, "global_step": 149237, "epoch": 3553} {"train_loss": -6.766582012176514, "global_step": 149238, "epoch": 3553} {"train_loss": -6.767575740814209, "global_step": 149239, "epoch": 3553} {"train_loss": -6.863171577453613, "global_step": 149240, "epoch": 3553} {"train_loss": -6.793523788452148, "global_step": 149241, "epoch": 3553} {"train_loss": -6.834450721740723, "global_step": 149242, "epoch": 3553} {"train_loss": -6.797598361968994, "global_step": 149243, "epoch": 3553} {"train_loss": -6.827706336975098, "global_step": 149244, "epoch": 3553} {"train_loss": -6.794068336486816, "global_step": 149245, "epoch": 3553} {"train_loss": -6.947200775146484, "global_step": 149246, "epoch": 3553} {"train_loss": -6.792092323303223, "global_step": 149247, "epoch": 3553} {"train_loss": -6.8406782150268555, "global_step": 149248, "epoch": 3553} {"train_loss": -6.872861862182617, "global_step": 149249, "epoch": 3553} {"train_loss": -6.855744361877441, "global_step": 149250, "epoch": 3553} {"train_loss": -6.811922073364258, "global_step": 149251, "epoch": 3553} {"train_loss": -6.932936668395996, "global_step": 149252, "epoch": 3553} {"train_loss": -6.739369869232178, "global_step": 149253, "epoch": 3553} {"train_loss": -6.778890609741211, "global_step": 149254, "epoch": 3553} {"train_loss": -6.765473365783691, "global_step": 149255, "epoch": 3553} {"train_loss": -6.829206466674805, "global_step": 149256, "epoch": 3553} {"train_loss": -6.762185096740723, "global_step": 149257, "epoch": 3553} {"train_loss": -6.664496421813965, "global_step": 149258, "epoch": 3553} {"train_loss": -6.786306381225586, "global_step": 149259, "epoch": 3553} {"train_loss": -6.879626750946045, "global_step": 149260, "epoch": 3553} {"train_loss": -6.814932823181152, "global_step": 149261, "epoch": 3553} {"train_loss": -6.756848335266113, "global_step": 149262, "epoch": 3553} {"train_loss": -6.86539363861084, "global_step": 149263, "epoch": 3553} {"train_loss": -6.815844535827637, "global_step": 149264, "epoch": 3553} {"train_loss": -6.9082207679748535, "global_step": 149265, "epoch": 3553} {"train_loss": -6.934477806091309, "global_step": 149266, "epoch": 3553} {"train_loss": -6.828039748328073, "global_step": 149267, "epoch": 3553, "val_loss": 68000.359375} {"train_loss": -6.793558120727539, "global_step": 149268, "epoch": 3554} {"train_loss": -6.911687850952148, "global_step": 149269, "epoch": 3554} {"train_loss": -6.858750343322754, "global_step": 149270, "epoch": 3554} {"train_loss": -6.958945274353027, "global_step": 149271, "epoch": 3554} {"train_loss": -6.821800231933594, "global_step": 149272, "epoch": 3554} {"train_loss": -6.918076515197754, "global_step": 149273, "epoch": 3554} {"train_loss": -6.8907270431518555, "global_step": 149274, "epoch": 3554} {"train_loss": -6.830592632293701, "global_step": 149275, "epoch": 3554} {"train_loss": -6.711655616760254, "global_step": 149276, "epoch": 3554} {"train_loss": -6.789939880371094, "global_step": 149277, "epoch": 3554} {"train_loss": -6.8001604080200195, "global_step": 149278, "epoch": 3554} {"train_loss": -6.750194549560547, "global_step": 149279, "epoch": 3554} {"train_loss": -6.828030109405518, "global_step": 149280, "epoch": 3554} {"train_loss": -6.924226760864258, "global_step": 149281, "epoch": 3554} {"train_loss": -6.754602432250977, "global_step": 149282, "epoch": 3554} {"train_loss": -6.874852180480957, "global_step": 149283, "epoch": 3554} {"train_loss": -6.836533546447754, "global_step": 149284, "epoch": 3554} {"train_loss": -6.811753273010254, "global_step": 149285, "epoch": 3554} {"train_loss": -6.843934059143066, "global_step": 149286, "epoch": 3554} {"train_loss": -6.852261066436768, "global_step": 149287, "epoch": 3554} {"train_loss": -6.802055835723877, "global_step": 149288, "epoch": 3554} {"train_loss": -6.747980117797852, "global_step": 149289, "epoch": 3554} {"train_loss": -6.804516792297363, "global_step": 149290, "epoch": 3554} {"train_loss": -6.908393859863281, "global_step": 149291, "epoch": 3554} {"train_loss": -6.7763848304748535, "global_step": 149292, "epoch": 3554} {"train_loss": -6.923208713531494, "global_step": 149293, "epoch": 3554} {"train_loss": -6.890153408050537, "global_step": 149294, "epoch": 3554} {"train_loss": -6.8508453369140625, "global_step": 149295, "epoch": 3554} {"train_loss": -6.917166709899902, "global_step": 149296, "epoch": 3554} {"train_loss": -6.808223724365234, "global_step": 149297, "epoch": 3554} {"train_loss": -6.886801719665527, "global_step": 149298, "epoch": 3554} {"train_loss": -6.910909652709961, "global_step": 149299, "epoch": 3554} {"train_loss": -6.981082439422607, "global_step": 149300, "epoch": 3554} {"train_loss": -6.954981803894043, "global_step": 149301, "epoch": 3554} {"train_loss": -6.88676643371582, "global_step": 149302, "epoch": 3554} {"train_loss": -6.949851989746094, "global_step": 149303, "epoch": 3554} {"train_loss": -6.947601318359375, "global_step": 149304, "epoch": 3554} {"train_loss": -6.970266342163086, "global_step": 149305, "epoch": 3554} {"train_loss": -6.866178512573242, "global_step": 149306, "epoch": 3554} {"train_loss": -6.999355316162109, "global_step": 149307, "epoch": 3554} {"train_loss": -6.888657569885254, "global_step": 149308, "epoch": 3554} {"train_loss": -6.864469130833943, "global_step": 149309, "epoch": 3554, "val_loss": 67772.1640625} {"train_loss": -6.9304938316345215, "global_step": 149310, "epoch": 3555} {"train_loss": -6.900480270385742, "global_step": 149311, "epoch": 3555} {"train_loss": -6.868248462677002, "global_step": 149312, "epoch": 3555} {"train_loss": -6.971458911895752, "global_step": 149313, "epoch": 3555} {"train_loss": -6.817477226257324, "global_step": 149314, "epoch": 3555} {"train_loss": -6.803780555725098, "global_step": 149315, "epoch": 3555} {"train_loss": -6.901342868804932, "global_step": 149316, "epoch": 3555} {"train_loss": -6.837512016296387, "global_step": 149317, "epoch": 3555} {"train_loss": -6.840581893920898, "global_step": 149318, "epoch": 3555} {"train_loss": -6.875733852386475, "global_step": 149319, "epoch": 3555} {"train_loss": -7.03179407119751, "global_step": 149320, "epoch": 3555} {"train_loss": -6.849428653717041, "global_step": 149321, "epoch": 3555} {"train_loss": -6.867022514343262, "global_step": 149322, "epoch": 3555} {"train_loss": -6.879112243652344, "global_step": 149323, "epoch": 3555} {"train_loss": -6.733758449554443, "global_step": 149324, "epoch": 3555} {"train_loss": -6.974771499633789, "global_step": 149325, "epoch": 3555} {"train_loss": -6.92592716217041, "global_step": 149326, "epoch": 3555} {"train_loss": -6.908817291259766, "global_step": 149327, "epoch": 3555} {"train_loss": -6.8803887367248535, "global_step": 149328, "epoch": 3555} {"train_loss": -6.918590545654297, "global_step": 149329, "epoch": 3555} {"train_loss": -6.908341407775879, "global_step": 149330, "epoch": 3555} {"train_loss": -6.964855194091797, "global_step": 149331, "epoch": 3555} {"train_loss": -6.772279739379883, "global_step": 149332, "epoch": 3555} {"train_loss": -6.920214653015137, "global_step": 149333, "epoch": 3555} {"train_loss": -6.778576374053955, "global_step": 149334, "epoch": 3555} {"train_loss": -6.73934268951416, "global_step": 149335, "epoch": 3555} {"train_loss": -6.760885238647461, "global_step": 149336, "epoch": 3555} {"train_loss": -6.899300575256348, "global_step": 149337, "epoch": 3555} {"train_loss": -6.744420051574707, "global_step": 149338, "epoch": 3555} {"train_loss": -6.847827911376953, "global_step": 149339, "epoch": 3555} {"train_loss": -6.803112983703613, "global_step": 149340, "epoch": 3555} {"train_loss": -6.874943256378174, "global_step": 149341, "epoch": 3555} {"train_loss": -6.777749061584473, "global_step": 149342, "epoch": 3555} {"train_loss": -6.859050273895264, "global_step": 149343, "epoch": 3555} {"train_loss": -6.9322662353515625, "global_step": 149344, "epoch": 3555} {"train_loss": -6.916677474975586, "global_step": 149345, "epoch": 3555} {"train_loss": -6.922183036804199, "global_step": 149346, "epoch": 3555} {"train_loss": -6.850445747375488, "global_step": 149347, "epoch": 3555} {"train_loss": -6.990569114685059, "global_step": 149348, "epoch": 3555} {"train_loss": -6.991396903991699, "global_step": 149349, "epoch": 3555} {"train_loss": -6.827078819274902, "global_step": 149350, "epoch": 3555} {"train_loss": -6.872856276375907, "global_step": 149351, "epoch": 3555, "val_loss": 67953.953125} {"train_loss": -6.890247344970703, "global_step": 149352, "epoch": 3556} {"train_loss": -6.9376325607299805, "global_step": 149353, "epoch": 3556} {"train_loss": -6.877623558044434, "global_step": 149354, "epoch": 3556} {"train_loss": -6.929243087768555, "global_step": 149355, "epoch": 3556} {"train_loss": -6.837230682373047, "global_step": 149356, "epoch": 3556} {"train_loss": -6.945407867431641, "global_step": 149357, "epoch": 3556} {"train_loss": -6.958210468292236, "global_step": 149358, "epoch": 3556} {"train_loss": -6.834882736206055, "global_step": 149359, "epoch": 3556} {"train_loss": -6.87457799911499, "global_step": 149360, "epoch": 3556} {"train_loss": -6.8164448738098145, "global_step": 149361, "epoch": 3556} {"train_loss": -6.8867597579956055, "global_step": 149362, "epoch": 3556} {"train_loss": -6.785180568695068, "global_step": 149363, "epoch": 3556} {"train_loss": -6.832690715789795, "global_step": 149364, "epoch": 3556} {"train_loss": -6.873390197753906, "global_step": 149365, "epoch": 3556} {"train_loss": -6.695256233215332, "global_step": 149366, "epoch": 3556} {"train_loss": -6.894582271575928, "global_step": 149367, "epoch": 3556} {"train_loss": -6.861700057983398, "global_step": 149368, "epoch": 3556} {"train_loss": -6.886125564575195, "global_step": 149369, "epoch": 3556} {"train_loss": -6.9266839027404785, "global_step": 149370, "epoch": 3556} {"train_loss": -6.813483238220215, "global_step": 149371, "epoch": 3556} {"train_loss": -6.936973571777344, "global_step": 149372, "epoch": 3556} {"train_loss": -6.99791145324707, "global_step": 149373, "epoch": 3556} {"train_loss": -6.803458213806152, "global_step": 149374, "epoch": 3556} {"train_loss": -6.789918422698975, "global_step": 149375, "epoch": 3556} {"train_loss": -6.923493385314941, "global_step": 149376, "epoch": 3556} {"train_loss": -6.762939453125, "global_step": 149377, "epoch": 3556} {"train_loss": -6.847647666931152, "global_step": 149378, "epoch": 3556} {"train_loss": -6.913025856018066, "global_step": 149379, "epoch": 3556} {"train_loss": -6.82041072845459, "global_step": 149380, "epoch": 3556} {"train_loss": -6.814512729644775, "global_step": 149381, "epoch": 3556} {"train_loss": -6.865413665771484, "global_step": 149382, "epoch": 3556} {"train_loss": -6.888424873352051, "global_step": 149383, "epoch": 3556} {"train_loss": -6.828518867492676, "global_step": 149384, "epoch": 3556} {"train_loss": -6.9220075607299805, "global_step": 149385, "epoch": 3556} {"train_loss": -6.691969394683838, "global_step": 149386, "epoch": 3556} {"train_loss": -6.876842498779297, "global_step": 149387, "epoch": 3556} {"train_loss": -6.815077304840088, "global_step": 149388, "epoch": 3556} {"train_loss": -6.944252967834473, "global_step": 149389, "epoch": 3556} {"train_loss": -6.8630266189575195, "global_step": 149390, "epoch": 3556} {"train_loss": -6.906878471374512, "global_step": 149391, "epoch": 3556} {"train_loss": -6.868746280670166, "global_step": 149392, "epoch": 3556} {"train_loss": -6.861510821751186, "global_step": 149393, "epoch": 3556, "val_loss": 68224.0859375} {"train_loss": -6.813508987426758, "global_step": 149394, "epoch": 3557} {"train_loss": -6.877542972564697, "global_step": 149395, "epoch": 3557} {"train_loss": -6.652904033660889, "global_step": 149396, "epoch": 3557} {"train_loss": -6.803556442260742, "global_step": 149397, "epoch": 3557} {"train_loss": -6.87220573425293, "global_step": 149398, "epoch": 3557} {"train_loss": -6.677067756652832, "global_step": 149399, "epoch": 3557} {"train_loss": -6.881128311157227, "global_step": 149400, "epoch": 3557} {"train_loss": -6.8491363525390625, "global_step": 149401, "epoch": 3557} {"train_loss": -6.798207759857178, "global_step": 149402, "epoch": 3557} {"train_loss": -6.7722063064575195, "global_step": 149403, "epoch": 3557} {"train_loss": -6.831948280334473, "global_step": 149404, "epoch": 3557} {"train_loss": -6.838386535644531, "global_step": 149405, "epoch": 3557} {"train_loss": -6.905135154724121, "global_step": 149406, "epoch": 3557} {"train_loss": -6.742343902587891, "global_step": 149407, "epoch": 3557} {"train_loss": -6.854913711547852, "global_step": 149408, "epoch": 3557} {"train_loss": -6.8502516746521, "global_step": 149409, "epoch": 3557} {"train_loss": -6.841804027557373, "global_step": 149410, "epoch": 3557} {"train_loss": -6.895763397216797, "global_step": 149411, "epoch": 3557} {"train_loss": -6.865183353424072, "global_step": 149412, "epoch": 3557} {"train_loss": -6.94523811340332, "global_step": 149413, "epoch": 3557} {"train_loss": -6.763110160827637, "global_step": 149414, "epoch": 3557} {"train_loss": -6.886754035949707, "global_step": 149415, "epoch": 3557} {"train_loss": -6.9028639793396, "global_step": 149416, "epoch": 3557} {"train_loss": -6.876280307769775, "global_step": 149417, "epoch": 3557} {"train_loss": -6.770741939544678, "global_step": 149418, "epoch": 3557} {"train_loss": -6.825428485870361, "global_step": 149419, "epoch": 3557} {"train_loss": -6.883006572723389, "global_step": 149420, "epoch": 3557} {"train_loss": -6.874631881713867, "global_step": 149421, "epoch": 3557} {"train_loss": -6.7823076248168945, "global_step": 149422, "epoch": 3557} {"train_loss": -6.914541244506836, "global_step": 149423, "epoch": 3557} {"train_loss": -6.741548538208008, "global_step": 149424, "epoch": 3557} {"train_loss": -6.846683025360107, "global_step": 149425, "epoch": 3557} {"train_loss": -6.92048454284668, "global_step": 149426, "epoch": 3557} {"train_loss": -6.848946571350098, "global_step": 149427, "epoch": 3557} {"train_loss": -6.816319465637207, "global_step": 149428, "epoch": 3557} {"train_loss": -6.9218244552612305, "global_step": 149429, "epoch": 3557} {"train_loss": -6.84766149520874, "global_step": 149430, "epoch": 3557} {"train_loss": -6.853089332580566, "global_step": 149431, "epoch": 3557} {"train_loss": -6.72170877456665, "global_step": 149432, "epoch": 3557} {"train_loss": -6.867123603820801, "global_step": 149433, "epoch": 3557} {"train_loss": -6.921283721923828, "global_step": 149434, "epoch": 3557} {"train_loss": -6.840274470193045, "global_step": 149435, "epoch": 3557, "val_loss": 67938.2109375} {"train_loss": -6.753945827484131, "global_step": 149436, "epoch": 3558} {"train_loss": -6.823808670043945, "global_step": 149437, "epoch": 3558} {"train_loss": -6.859911918640137, "global_step": 149438, "epoch": 3558} {"train_loss": -6.86580753326416, "global_step": 149439, "epoch": 3558} {"train_loss": -6.9308881759643555, "global_step": 149440, "epoch": 3558} {"train_loss": -6.97654914855957, "global_step": 149441, "epoch": 3558} {"train_loss": -6.870326995849609, "global_step": 149442, "epoch": 3558} {"train_loss": -6.877026081085205, "global_step": 149443, "epoch": 3558} {"train_loss": -6.939593315124512, "global_step": 149444, "epoch": 3558} {"train_loss": -6.857091903686523, "global_step": 149445, "epoch": 3558} {"train_loss": -6.888057708740234, "global_step": 149446, "epoch": 3558} {"train_loss": -6.912983417510986, "global_step": 149447, "epoch": 3558} {"train_loss": -6.871146202087402, "global_step": 149448, "epoch": 3558} {"train_loss": -6.884853363037109, "global_step": 149449, "epoch": 3558} {"train_loss": -6.943240642547607, "global_step": 149450, "epoch": 3558} {"train_loss": -7.007694244384766, "global_step": 149451, "epoch": 3558} {"train_loss": -6.925166606903076, "global_step": 149452, "epoch": 3558} {"train_loss": -6.8543195724487305, "global_step": 149453, "epoch": 3558} {"train_loss": -6.939458847045898, "global_step": 149454, "epoch": 3558} {"train_loss": -6.920295715332031, "global_step": 149455, "epoch": 3558} {"train_loss": -6.864493370056152, "global_step": 149456, "epoch": 3558} {"train_loss": -6.906010627746582, "global_step": 149457, "epoch": 3558} {"train_loss": -6.808716773986816, "global_step": 149458, "epoch": 3558} {"train_loss": -6.956141471862793, "global_step": 149459, "epoch": 3558} {"train_loss": -6.854532241821289, "global_step": 149460, "epoch": 3558} {"train_loss": -6.867641448974609, "global_step": 149461, "epoch": 3558} {"train_loss": -6.823880195617676, "global_step": 149462, "epoch": 3558} {"train_loss": -6.847744941711426, "global_step": 149463, "epoch": 3558} {"train_loss": -6.775753974914551, "global_step": 149464, "epoch": 3558} {"train_loss": -6.873497009277344, "global_step": 149465, "epoch": 3558} {"train_loss": -6.8291802406311035, "global_step": 149466, "epoch": 3558} {"train_loss": -6.859408378601074, "global_step": 149467, "epoch": 3558} {"train_loss": -6.920029640197754, "global_step": 149468, "epoch": 3558} {"train_loss": -6.8234333992004395, "global_step": 149469, "epoch": 3558} {"train_loss": -6.88746452331543, "global_step": 149470, "epoch": 3558} {"train_loss": -6.834049224853516, "global_step": 149471, "epoch": 3558} {"train_loss": -6.933374404907227, "global_step": 149472, "epoch": 3558} {"train_loss": -6.874400615692139, "global_step": 149473, "epoch": 3558} {"train_loss": -6.769752502441406, "global_step": 149474, "epoch": 3558} {"train_loss": -6.950707912445068, "global_step": 149475, "epoch": 3558} {"train_loss": -6.92875337600708, "global_step": 149476, "epoch": 3558} {"train_loss": -6.8800627163478305, "global_step": 149477, "epoch": 3558, "val_loss": 67906.0859375} {"train_loss": -6.86959171295166, "global_step": 149478, "epoch": 3559} {"train_loss": -6.981708526611328, "global_step": 149479, "epoch": 3559} {"train_loss": -6.8518195152282715, "global_step": 149480, "epoch": 3559} {"train_loss": -6.974013805389404, "global_step": 149481, "epoch": 3559} {"train_loss": -7.053995132446289, "global_step": 149482, "epoch": 3559} {"train_loss": -6.8572163581848145, "global_step": 149483, "epoch": 3559} {"train_loss": -6.961605072021484, "global_step": 149484, "epoch": 3559} {"train_loss": -6.885613441467285, "global_step": 149485, "epoch": 3559} {"train_loss": -6.889284133911133, "global_step": 149486, "epoch": 3559} {"train_loss": -6.8570756912231445, "global_step": 149487, "epoch": 3559} {"train_loss": -6.907423496246338, "global_step": 149488, "epoch": 3559} {"train_loss": -6.9660539627075195, "global_step": 149489, "epoch": 3559} {"train_loss": -6.905927658081055, "global_step": 149490, "epoch": 3559} {"train_loss": -6.951471328735352, "global_step": 149491, "epoch": 3559} {"train_loss": -6.810558795928955, "global_step": 149492, "epoch": 3559} {"train_loss": -6.8379387855529785, "global_step": 149493, "epoch": 3559} {"train_loss": -6.7302141189575195, "global_step": 149494, "epoch": 3559} {"train_loss": -6.8345746994018555, "global_step": 149495, "epoch": 3559} {"train_loss": -6.837313175201416, "global_step": 149496, "epoch": 3559} {"train_loss": -6.897259712219238, "global_step": 149497, "epoch": 3559} {"train_loss": -6.676101207733154, "global_step": 149498, "epoch": 3559} {"train_loss": -6.884114742279053, "global_step": 149499, "epoch": 3559} {"train_loss": -6.825873374938965, "global_step": 149500, "epoch": 3559} {"train_loss": -6.68502140045166, "global_step": 149501, "epoch": 3559} {"train_loss": -6.70967435836792, "global_step": 149502, "epoch": 3559} {"train_loss": -6.806257247924805, "global_step": 149503, "epoch": 3559} {"train_loss": -6.775318145751953, "global_step": 149504, "epoch": 3559} {"train_loss": -6.72947359085083, "global_step": 149505, "epoch": 3559} {"train_loss": -6.833075523376465, "global_step": 149506, "epoch": 3559} {"train_loss": -6.898541450500488, "global_step": 149507, "epoch": 3559} {"train_loss": -6.844649314880371, "global_step": 149508, "epoch": 3559} {"train_loss": -6.898868083953857, "global_step": 149509, "epoch": 3559} {"train_loss": -6.9026408195495605, "global_step": 149510, "epoch": 3559} {"train_loss": -6.868818759918213, "global_step": 149511, "epoch": 3559} {"train_loss": -6.836596965789795, "global_step": 149512, "epoch": 3559} {"train_loss": -6.837812423706055, "global_step": 149513, "epoch": 3559} {"train_loss": -6.798515319824219, "global_step": 149514, "epoch": 3559} {"train_loss": -6.864490985870361, "global_step": 149515, "epoch": 3559} {"train_loss": -6.883812427520752, "global_step": 149516, "epoch": 3559} {"train_loss": -6.824649333953857, "global_step": 149517, "epoch": 3559} {"train_loss": -6.856444358825684, "global_step": 149518, "epoch": 3559} {"train_loss": -6.853586798622494, "global_step": 149519, "epoch": 3559, "val_loss": 67967.84375} {"train_loss": -6.721090316772461, "global_step": 149520, "epoch": 3560} {"train_loss": -6.776112079620361, "global_step": 149521, "epoch": 3560} {"train_loss": -6.810314178466797, "global_step": 149522, "epoch": 3560} {"train_loss": -6.71865177154541, "global_step": 149523, "epoch": 3560} {"train_loss": -6.957512855529785, "global_step": 149524, "epoch": 3560} {"train_loss": -6.8345136642456055, "global_step": 149525, "epoch": 3560} {"train_loss": -6.866842269897461, "global_step": 149526, "epoch": 3560} {"train_loss": -6.926015853881836, "global_step": 149527, "epoch": 3560} {"train_loss": -6.833764553070068, "global_step": 149528, "epoch": 3560} {"train_loss": -6.845668315887451, "global_step": 149529, "epoch": 3560} {"train_loss": -6.860363006591797, "global_step": 149530, "epoch": 3560} {"train_loss": -6.890156269073486, "global_step": 149531, "epoch": 3560} {"train_loss": -6.85697078704834, "global_step": 149532, "epoch": 3560} {"train_loss": -6.983823299407959, "global_step": 149533, "epoch": 3560} {"train_loss": -6.844254970550537, "global_step": 149534, "epoch": 3560} {"train_loss": -6.7359209060668945, "global_step": 149535, "epoch": 3560} {"train_loss": -6.808114051818848, "global_step": 149536, "epoch": 3560} {"train_loss": -6.837399482727051, "global_step": 149537, "epoch": 3560} {"train_loss": -6.761571884155273, "global_step": 149538, "epoch": 3560} {"train_loss": -6.848151206970215, "global_step": 149539, "epoch": 3560} {"train_loss": -6.885321617126465, "global_step": 149540, "epoch": 3560} {"train_loss": -6.817835330963135, "global_step": 149541, "epoch": 3560} {"train_loss": -6.791812896728516, "global_step": 149542, "epoch": 3560} {"train_loss": -6.963438987731934, "global_step": 149543, "epoch": 3560} {"train_loss": -6.737931251525879, "global_step": 149544, "epoch": 3560} {"train_loss": -6.643372058868408, "global_step": 149545, "epoch": 3560} {"train_loss": -6.770932197570801, "global_step": 149546, "epoch": 3560} {"train_loss": -6.82466983795166, "global_step": 149547, "epoch": 3560} {"train_loss": -6.732205390930176, "global_step": 149548, "epoch": 3560} {"train_loss": -6.817527770996094, "global_step": 149549, "epoch": 3560} {"train_loss": -6.898276329040527, "global_step": 149550, "epoch": 3560} {"train_loss": -6.649057388305664, "global_step": 149551, "epoch": 3560} {"train_loss": -6.870523452758789, "global_step": 149552, "epoch": 3560} {"train_loss": -6.782550811767578, "global_step": 149553, "epoch": 3560} {"train_loss": -6.807018280029297, "global_step": 149554, "epoch": 3560} {"train_loss": -6.869544982910156, "global_step": 149555, "epoch": 3560} {"train_loss": -6.878103733062744, "global_step": 149556, "epoch": 3560} {"train_loss": -6.773242950439453, "global_step": 149557, "epoch": 3560} {"train_loss": -6.8009033203125, "global_step": 149558, "epoch": 3560} {"train_loss": -6.878617286682129, "global_step": 149559, "epoch": 3560} {"train_loss": -6.838232040405273, "global_step": 149560, "epoch": 3560} {"train_loss": -6.821244591758365, "global_step": 149561, "epoch": 3560, "val_loss": 67843.0859375} {"train_loss": -6.829962253570557, "global_step": 149562, "epoch": 3561} {"train_loss": -6.821634292602539, "global_step": 149563, "epoch": 3561} {"train_loss": -6.804807662963867, "global_step": 149564, "epoch": 3561} {"train_loss": -6.963170528411865, "global_step": 149565, "epoch": 3561} {"train_loss": -6.794661521911621, "global_step": 149566, "epoch": 3561} {"train_loss": -6.7803754806518555, "global_step": 149567, "epoch": 3561} {"train_loss": -6.8724260330200195, "global_step": 149568, "epoch": 3561} {"train_loss": -6.824393272399902, "global_step": 149569, "epoch": 3561} {"train_loss": -6.922000885009766, "global_step": 149570, "epoch": 3561} {"train_loss": -6.966002464294434, "global_step": 149571, "epoch": 3561} {"train_loss": -6.927689552307129, "global_step": 149572, "epoch": 3561} {"train_loss": -6.953855991363525, "global_step": 149573, "epoch": 3561} {"train_loss": -6.84840726852417, "global_step": 149574, "epoch": 3561} {"train_loss": -6.925680160522461, "global_step": 149575, "epoch": 3561} {"train_loss": -6.912824630737305, "global_step": 149576, "epoch": 3561} {"train_loss": -6.936209678649902, "global_step": 149577, "epoch": 3561} {"train_loss": -6.961442947387695, "global_step": 149578, "epoch": 3561} {"train_loss": -6.86448860168457, "global_step": 149579, "epoch": 3561} {"train_loss": -6.953829765319824, "global_step": 149580, "epoch": 3561} {"train_loss": -6.8551812171936035, "global_step": 149581, "epoch": 3561} {"train_loss": -6.952799320220947, "global_step": 149582, "epoch": 3561} {"train_loss": -6.9313764572143555, "global_step": 149583, "epoch": 3561} {"train_loss": -6.946925640106201, "global_step": 149584, "epoch": 3561} {"train_loss": -6.895205497741699, "global_step": 149585, "epoch": 3561} {"train_loss": -6.891120433807373, "global_step": 149586, "epoch": 3561} {"train_loss": -6.916234970092773, "global_step": 149587, "epoch": 3561} {"train_loss": -7.0099358558654785, "global_step": 149588, "epoch": 3561} {"train_loss": -6.932044982910156, "global_step": 149589, "epoch": 3561} {"train_loss": -6.971707344055176, "global_step": 149590, "epoch": 3561} {"train_loss": -6.885842323303223, "global_step": 149591, "epoch": 3561} {"train_loss": -6.896010398864746, "global_step": 149592, "epoch": 3561} {"train_loss": -6.960336685180664, "global_step": 149593, "epoch": 3561} {"train_loss": -6.934416770935059, "global_step": 149594, "epoch": 3561} {"train_loss": -6.9018707275390625, "global_step": 149595, "epoch": 3561} {"train_loss": -6.865246772766113, "global_step": 149596, "epoch": 3561} {"train_loss": -6.795650005340576, "global_step": 149597, "epoch": 3561} {"train_loss": -6.822058200836182, "global_step": 149598, "epoch": 3561} {"train_loss": -6.851077556610107, "global_step": 149599, "epoch": 3561} {"train_loss": -6.717785835266113, "global_step": 149600, "epoch": 3561} {"train_loss": -6.782341957092285, "global_step": 149601, "epoch": 3561} {"train_loss": -6.808438777923584, "global_step": 149602, "epoch": 3561} {"train_loss": -6.8836483387720016, "global_step": 149603, "epoch": 3561, "val_loss": 68039.328125} {"train_loss": -6.835689544677734, "global_step": 149604, "epoch": 3562} {"train_loss": -6.759439945220947, "global_step": 149605, "epoch": 3562} {"train_loss": -6.965624809265137, "global_step": 149606, "epoch": 3562} {"train_loss": -6.904268264770508, "global_step": 149607, "epoch": 3562} {"train_loss": -6.764404773712158, "global_step": 149608, "epoch": 3562} {"train_loss": -6.820970058441162, "global_step": 149609, "epoch": 3562} {"train_loss": -6.814887046813965, "global_step": 149610, "epoch": 3562} {"train_loss": -6.892790794372559, "global_step": 149611, "epoch": 3562} {"train_loss": -6.986470699310303, "global_step": 149612, "epoch": 3562} {"train_loss": -6.917627334594727, "global_step": 149613, "epoch": 3562} {"train_loss": -6.853802680969238, "global_step": 149614, "epoch": 3562} {"train_loss": -6.915119171142578, "global_step": 149615, "epoch": 3562} {"train_loss": -6.824150085449219, "global_step": 149616, "epoch": 3562} {"train_loss": -6.8783698081970215, "global_step": 149617, "epoch": 3562} {"train_loss": -6.80912446975708, "global_step": 149618, "epoch": 3562} {"train_loss": -6.7873358726501465, "global_step": 149619, "epoch": 3562} {"train_loss": -6.826821327209473, "global_step": 149620, "epoch": 3562} {"train_loss": -6.925743103027344, "global_step": 149621, "epoch": 3562} {"train_loss": -6.671572208404541, "global_step": 149622, "epoch": 3562} {"train_loss": -6.83400297164917, "global_step": 149623, "epoch": 3562} {"train_loss": -6.940637588500977, "global_step": 149624, "epoch": 3562} {"train_loss": -6.867351531982422, "global_step": 149625, "epoch": 3562} {"train_loss": -6.789241790771484, "global_step": 149626, "epoch": 3562} {"train_loss": -6.821301460266113, "global_step": 149627, "epoch": 3562} {"train_loss": -6.801545143127441, "global_step": 149628, "epoch": 3562} {"train_loss": -6.823625564575195, "global_step": 149629, "epoch": 3562} {"train_loss": -6.877728462219238, "global_step": 149630, "epoch": 3562} {"train_loss": -6.800874710083008, "global_step": 149631, "epoch": 3562} {"train_loss": -6.750940322875977, "global_step": 149632, "epoch": 3562} {"train_loss": -6.831542491912842, "global_step": 149633, "epoch": 3562} {"train_loss": -6.78396463394165, "global_step": 149634, "epoch": 3562} {"train_loss": -6.730842590332031, "global_step": 149635, "epoch": 3562} {"train_loss": -6.829256057739258, "global_step": 149636, "epoch": 3562} {"train_loss": -6.787137031555176, "global_step": 149637, "epoch": 3562} {"train_loss": -6.632353782653809, "global_step": 149638, "epoch": 3562} {"train_loss": -6.8458662033081055, "global_step": 149639, "epoch": 3562} {"train_loss": -6.762425422668457, "global_step": 149640, "epoch": 3562} {"train_loss": -6.750639915466309, "global_step": 149641, "epoch": 3562} {"train_loss": -6.804752349853516, "global_step": 149642, "epoch": 3562} {"train_loss": -6.674162864685059, "global_step": 149643, "epoch": 3562} {"train_loss": -6.857204437255859, "global_step": 149644, "epoch": 3562} {"train_loss": -6.820315735680716, "global_step": 149645, "epoch": 3562, "val_loss": 68057.40625} {"train_loss": -6.810023784637451, "global_step": 149646, "epoch": 3563} {"train_loss": -6.829431533813477, "global_step": 149647, "epoch": 3563} {"train_loss": -6.844173908233643, "global_step": 149648, "epoch": 3563} {"train_loss": -6.859637260437012, "global_step": 149649, "epoch": 3563} {"train_loss": -6.8358283042907715, "global_step": 149650, "epoch": 3563} {"train_loss": -6.84709358215332, "global_step": 149651, "epoch": 3563} {"train_loss": -6.7504191398620605, "global_step": 149652, "epoch": 3563} {"train_loss": -6.733720779418945, "global_step": 149653, "epoch": 3563} {"train_loss": -6.759431838989258, "global_step": 149654, "epoch": 3563} {"train_loss": -6.841121196746826, "global_step": 149655, "epoch": 3563} {"train_loss": -6.752060890197754, "global_step": 149656, "epoch": 3563} {"train_loss": -6.7776079177856445, "global_step": 149657, "epoch": 3563} {"train_loss": -6.740047931671143, "global_step": 149658, "epoch": 3563} {"train_loss": -6.7645368576049805, "global_step": 149659, "epoch": 3563} {"train_loss": -6.927198886871338, "global_step": 149660, "epoch": 3563} {"train_loss": -6.906803607940674, "global_step": 149661, "epoch": 3563} {"train_loss": -6.894778728485107, "global_step": 149662, "epoch": 3563} {"train_loss": -6.912336349487305, "global_step": 149663, "epoch": 3563} {"train_loss": -6.740487098693848, "global_step": 149664, "epoch": 3563} {"train_loss": -6.937226295471191, "global_step": 149665, "epoch": 3563} {"train_loss": -6.641077995300293, "global_step": 149666, "epoch": 3563} {"train_loss": -6.758627891540527, "global_step": 149667, "epoch": 3563} {"train_loss": -6.846928596496582, "global_step": 149668, "epoch": 3563} {"train_loss": -6.741260051727295, "global_step": 149669, "epoch": 3563} {"train_loss": -6.859846115112305, "global_step": 149670, "epoch": 3563} {"train_loss": -6.740726947784424, "global_step": 149671, "epoch": 3563} {"train_loss": -6.924840927124023, "global_step": 149672, "epoch": 3563} {"train_loss": -6.6632914543151855, "global_step": 149673, "epoch": 3563} {"train_loss": -6.807718753814697, "global_step": 149674, "epoch": 3563} {"train_loss": -6.803403854370117, "global_step": 149675, "epoch": 3563} {"train_loss": -6.779398441314697, "global_step": 149676, "epoch": 3563} {"train_loss": -6.637262344360352, "global_step": 149677, "epoch": 3563} {"train_loss": -6.657465934753418, "global_step": 149678, "epoch": 3563} {"train_loss": -6.800227165222168, "global_step": 149679, "epoch": 3563} {"train_loss": -6.745317459106445, "global_step": 149680, "epoch": 3563} {"train_loss": -6.747309684753418, "global_step": 149681, "epoch": 3563} {"train_loss": -6.795228004455566, "global_step": 149682, "epoch": 3563} {"train_loss": -6.753902435302734, "global_step": 149683, "epoch": 3563} {"train_loss": -6.836935997009277, "global_step": 149684, "epoch": 3563} {"train_loss": -6.713983535766602, "global_step": 149685, "epoch": 3563} {"train_loss": -6.777642726898193, "global_step": 149686, "epoch": 3563} {"train_loss": -6.792479957853045, "global_step": 149687, "epoch": 3563, "val_loss": 68124.1796875} {"train_loss": -6.89097261428833, "global_step": 149688, "epoch": 3564} {"train_loss": -6.770017623901367, "global_step": 149689, "epoch": 3564} {"train_loss": -6.748652458190918, "global_step": 149690, "epoch": 3564} {"train_loss": -6.8423919677734375, "global_step": 149691, "epoch": 3564} {"train_loss": -6.773680686950684, "global_step": 149692, "epoch": 3564} {"train_loss": -6.789291858673096, "global_step": 149693, "epoch": 3564} {"train_loss": -6.829690933227539, "global_step": 149694, "epoch": 3564} {"train_loss": -6.87477445602417, "global_step": 149695, "epoch": 3564} {"train_loss": -6.809245586395264, "global_step": 149696, "epoch": 3564} {"train_loss": -6.8162617683410645, "global_step": 149697, "epoch": 3564} {"train_loss": -6.830280303955078, "global_step": 149698, "epoch": 3564} {"train_loss": -6.819640636444092, "global_step": 149699, "epoch": 3564} {"train_loss": -6.857909202575684, "global_step": 149700, "epoch": 3564} {"train_loss": -6.848732948303223, "global_step": 149701, "epoch": 3564} {"train_loss": -6.743910789489746, "global_step": 149702, "epoch": 3564} {"train_loss": -6.877728462219238, "global_step": 149703, "epoch": 3564} {"train_loss": -6.974338531494141, "global_step": 149704, "epoch": 3564} {"train_loss": -6.895759105682373, "global_step": 149705, "epoch": 3564} {"train_loss": -6.948784351348877, "global_step": 149706, "epoch": 3564} {"train_loss": -6.939120292663574, "global_step": 149707, "epoch": 3564} {"train_loss": -6.821829795837402, "global_step": 149708, "epoch": 3564} {"train_loss": -6.887626647949219, "global_step": 149709, "epoch": 3564} {"train_loss": -6.785978317260742, "global_step": 149710, "epoch": 3564} {"train_loss": -6.938574314117432, "global_step": 149711, "epoch": 3564} {"train_loss": -6.910373687744141, "global_step": 149712, "epoch": 3564} {"train_loss": -6.896673202514648, "global_step": 149713, "epoch": 3564} {"train_loss": -6.731785774230957, "global_step": 149714, "epoch": 3564} {"train_loss": -6.860074996948242, "global_step": 149715, "epoch": 3564} {"train_loss": -6.860358715057373, "global_step": 149716, "epoch": 3564} {"train_loss": -6.76327657699585, "global_step": 149717, "epoch": 3564} {"train_loss": -6.841468334197998, "global_step": 149718, "epoch": 3564} {"train_loss": -6.648349285125732, "global_step": 149719, "epoch": 3564} {"train_loss": -6.80696964263916, "global_step": 149720, "epoch": 3564} {"train_loss": -6.831435680389404, "global_step": 149721, "epoch": 3564} {"train_loss": -6.688547611236572, "global_step": 149722, "epoch": 3564} {"train_loss": -7.01031494140625, "global_step": 149723, "epoch": 3564} {"train_loss": -6.813554763793945, "global_step": 149724, "epoch": 3564} {"train_loss": -6.746764183044434, "global_step": 149725, "epoch": 3564} {"train_loss": -6.925020694732666, "global_step": 149726, "epoch": 3564} {"train_loss": -6.760120868682861, "global_step": 149727, "epoch": 3564} {"train_loss": -6.892751693725586, "global_step": 149728, "epoch": 3564} {"train_loss": -6.835497640428089, "global_step": 149729, "epoch": 3564, "val_loss": 68139.75} {"train_loss": -6.8211774826049805, "global_step": 149730, "epoch": 3565} {"train_loss": -6.928765296936035, "global_step": 149731, "epoch": 3565} {"train_loss": -6.822596549987793, "global_step": 149732, "epoch": 3565} {"train_loss": -6.795010566711426, "global_step": 149733, "epoch": 3565} {"train_loss": -6.864300727844238, "global_step": 149734, "epoch": 3565} {"train_loss": -6.910526275634766, "global_step": 149735, "epoch": 3565} {"train_loss": -6.909431457519531, "global_step": 149736, "epoch": 3565} {"train_loss": -6.875398635864258, "global_step": 149737, "epoch": 3565} {"train_loss": -6.974923133850098, "global_step": 149738, "epoch": 3565} {"train_loss": -6.80334997177124, "global_step": 149739, "epoch": 3565} {"train_loss": -6.864663124084473, "global_step": 149740, "epoch": 3565} {"train_loss": -6.848232269287109, "global_step": 149741, "epoch": 3565} {"train_loss": -6.8647141456604, "global_step": 149742, "epoch": 3565} {"train_loss": -6.980502605438232, "global_step": 149743, "epoch": 3565} {"train_loss": -6.847697734832764, "global_step": 149744, "epoch": 3565} {"train_loss": -6.863755226135254, "global_step": 149745, "epoch": 3565} {"train_loss": -7.021639823913574, "global_step": 149746, "epoch": 3565} {"train_loss": -6.932599067687988, "global_step": 149747, "epoch": 3565} {"train_loss": -6.862551212310791, "global_step": 149748, "epoch": 3565} {"train_loss": -6.8966474533081055, "global_step": 149749, "epoch": 3565} {"train_loss": -6.9209699630737305, "global_step": 149750, "epoch": 3565} {"train_loss": -6.851193428039551, "global_step": 149751, "epoch": 3565} {"train_loss": -6.9062018394470215, "global_step": 149752, "epoch": 3565} {"train_loss": -6.850136756896973, "global_step": 149753, "epoch": 3565} {"train_loss": -6.804137229919434, "global_step": 149754, "epoch": 3565} {"train_loss": -6.883523464202881, "global_step": 149755, "epoch": 3565} {"train_loss": -6.825016021728516, "global_step": 149756, "epoch": 3565} {"train_loss": -6.902859210968018, "global_step": 149757, "epoch": 3565} {"train_loss": -6.832283020019531, "global_step": 149758, "epoch": 3565} {"train_loss": -6.881491184234619, "global_step": 149759, "epoch": 3565} {"train_loss": -6.734925746917725, "global_step": 149760, "epoch": 3565} {"train_loss": -6.867499351501465, "global_step": 149761, "epoch": 3565} {"train_loss": -6.962010383605957, "global_step": 149762, "epoch": 3565} {"train_loss": -6.823053359985352, "global_step": 149763, "epoch": 3565} {"train_loss": -6.924843788146973, "global_step": 149764, "epoch": 3565} {"train_loss": -6.833505153656006, "global_step": 149765, "epoch": 3565} {"train_loss": -6.6921281814575195, "global_step": 149766, "epoch": 3565} {"train_loss": -6.853785514831543, "global_step": 149767, "epoch": 3565} {"train_loss": -6.845402717590332, "global_step": 149768, "epoch": 3565} {"train_loss": -6.8895392417907715, "global_step": 149769, "epoch": 3565} {"train_loss": -6.852874755859375, "global_step": 149770, "epoch": 3565} {"train_loss": -6.867518776939029, "global_step": 149771, "epoch": 3565, "val_loss": 67933.5078125} {"train_loss": -6.848658561706543, "global_step": 149772, "epoch": 3566} {"train_loss": -6.907031059265137, "global_step": 149773, "epoch": 3566} {"train_loss": -6.916955947875977, "global_step": 149774, "epoch": 3566} {"train_loss": -6.7687458992004395, "global_step": 149775, "epoch": 3566} {"train_loss": -6.864141464233398, "global_step": 149776, "epoch": 3566} {"train_loss": -6.779987812042236, "global_step": 149777, "epoch": 3566} {"train_loss": -6.920112609863281, "global_step": 149778, "epoch": 3566} {"train_loss": -6.836114883422852, "global_step": 149779, "epoch": 3566} {"train_loss": -6.824030876159668, "global_step": 149780, "epoch": 3566} {"train_loss": -6.890110492706299, "global_step": 149781, "epoch": 3566} {"train_loss": -6.8541340827941895, "global_step": 149782, "epoch": 3566} {"train_loss": -6.93056583404541, "global_step": 149783, "epoch": 3566} {"train_loss": -6.774410724639893, "global_step": 149784, "epoch": 3566} {"train_loss": -6.7933831214904785, "global_step": 149785, "epoch": 3566} {"train_loss": -6.876054763793945, "global_step": 149786, "epoch": 3566} {"train_loss": -6.825977325439453, "global_step": 149787, "epoch": 3566} {"train_loss": -6.759979724884033, "global_step": 149788, "epoch": 3566} {"train_loss": -6.839327812194824, "global_step": 149789, "epoch": 3566} {"train_loss": -6.97590970993042, "global_step": 149790, "epoch": 3566} {"train_loss": -6.834629535675049, "global_step": 149791, "epoch": 3566} {"train_loss": -6.949711799621582, "global_step": 149792, "epoch": 3566} {"train_loss": -6.801109313964844, "global_step": 149793, "epoch": 3566} {"train_loss": -6.7745819091796875, "global_step": 149794, "epoch": 3566} {"train_loss": -6.861363410949707, "global_step": 149795, "epoch": 3566} {"train_loss": -6.778385162353516, "global_step": 149796, "epoch": 3566} {"train_loss": -6.855476379394531, "global_step": 149797, "epoch": 3566} {"train_loss": -6.738485336303711, "global_step": 149798, "epoch": 3566} {"train_loss": -6.738672256469727, "global_step": 149799, "epoch": 3566} {"train_loss": -6.832265853881836, "global_step": 149800, "epoch": 3566} {"train_loss": -6.897934913635254, "global_step": 149801, "epoch": 3566} {"train_loss": -6.84184455871582, "global_step": 149802, "epoch": 3566} {"train_loss": -6.835846900939941, "global_step": 149803, "epoch": 3566} {"train_loss": -6.877036094665527, "global_step": 149804, "epoch": 3566} {"train_loss": -6.798422813415527, "global_step": 149805, "epoch": 3566} {"train_loss": -6.8496246337890625, "global_step": 149806, "epoch": 3566} {"train_loss": -6.851761817932129, "global_step": 149807, "epoch": 3566} {"train_loss": -6.837765216827393, "global_step": 149808, "epoch": 3566} {"train_loss": -6.839548587799072, "global_step": 149809, "epoch": 3566} {"train_loss": -6.879756927490234, "global_step": 149810, "epoch": 3566} {"train_loss": -6.861693382263184, "global_step": 149811, "epoch": 3566} {"train_loss": -6.9720683097839355, "global_step": 149812, "epoch": 3566} {"train_loss": -6.848820470628285, "global_step": 149813, "epoch": 3566, "val_loss": 67813.0625} {"train_loss": -6.929729461669922, "global_step": 149814, "epoch": 3567} {"train_loss": -6.902379512786865, "global_step": 149815, "epoch": 3567} {"train_loss": -6.910188674926758, "global_step": 149816, "epoch": 3567} {"train_loss": -6.926578044891357, "global_step": 149817, "epoch": 3567} {"train_loss": -6.977817535400391, "global_step": 149818, "epoch": 3567} {"train_loss": -6.901970386505127, "global_step": 149819, "epoch": 3567} {"train_loss": -6.984846115112305, "global_step": 149820, "epoch": 3567} {"train_loss": -6.800441741943359, "global_step": 149821, "epoch": 3567} {"train_loss": -6.8435468673706055, "global_step": 149822, "epoch": 3567} {"train_loss": -6.813409328460693, "global_step": 149823, "epoch": 3567} {"train_loss": -6.849991798400879, "global_step": 149824, "epoch": 3567} {"train_loss": -6.968334197998047, "global_step": 149825, "epoch": 3567} {"train_loss": -6.85845947265625, "global_step": 149826, "epoch": 3567} {"train_loss": -6.796767234802246, "global_step": 149827, "epoch": 3567} {"train_loss": -6.813586235046387, "global_step": 149828, "epoch": 3567} {"train_loss": -6.947494983673096, "global_step": 149829, "epoch": 3567} {"train_loss": -6.828391075134277, "global_step": 149830, "epoch": 3567} {"train_loss": -6.8778510093688965, "global_step": 149831, "epoch": 3567} {"train_loss": -6.778970718383789, "global_step": 149832, "epoch": 3567} {"train_loss": -6.912422180175781, "global_step": 149833, "epoch": 3567} {"train_loss": -6.6751790046691895, "global_step": 149834, "epoch": 3567} {"train_loss": -6.84511137008667, "global_step": 149835, "epoch": 3567} {"train_loss": -6.908729553222656, "global_step": 149836, "epoch": 3567} {"train_loss": -6.730504035949707, "global_step": 149837, "epoch": 3567} {"train_loss": -6.885625839233398, "global_step": 149838, "epoch": 3567} {"train_loss": -7.010846138000488, "global_step": 149839, "epoch": 3567} {"train_loss": -6.804052352905273, "global_step": 149840, "epoch": 3567} {"train_loss": -6.712200164794922, "global_step": 149841, "epoch": 3567} {"train_loss": -6.9109063148498535, "global_step": 149842, "epoch": 3567} {"train_loss": -6.849508285522461, "global_step": 149843, "epoch": 3567} {"train_loss": -6.87291145324707, "global_step": 149844, "epoch": 3567} {"train_loss": -6.866530895233154, "global_step": 149845, "epoch": 3567} {"train_loss": -6.767454624176025, "global_step": 149846, "epoch": 3567} {"train_loss": -6.891223907470703, "global_step": 149847, "epoch": 3567} {"train_loss": -6.8350372314453125, "global_step": 149848, "epoch": 3567} {"train_loss": -6.798488616943359, "global_step": 149849, "epoch": 3567} {"train_loss": -6.727755546569824, "global_step": 149850, "epoch": 3567} {"train_loss": -6.816872596740723, "global_step": 149851, "epoch": 3567} {"train_loss": -6.842825889587402, "global_step": 149852, "epoch": 3567} {"train_loss": -6.805830955505371, "global_step": 149853, "epoch": 3567} {"train_loss": -6.902281284332275, "global_step": 149854, "epoch": 3567} {"train_loss": -6.8551111334846135, "global_step": 149855, "epoch": 3567, "val_loss": 67860.6484375} {"train_loss": -6.6879425048828125, "global_step": 149856, "epoch": 3568} {"train_loss": -6.770096778869629, "global_step": 149857, "epoch": 3568} {"train_loss": -6.840241432189941, "global_step": 149858, "epoch": 3568} {"train_loss": -6.6885986328125, "global_step": 149859, "epoch": 3568} {"train_loss": -6.715526580810547, "global_step": 149860, "epoch": 3568} {"train_loss": -6.808917999267578, "global_step": 149861, "epoch": 3568} {"train_loss": -6.693805694580078, "global_step": 149862, "epoch": 3568} {"train_loss": -6.802480697631836, "global_step": 149863, "epoch": 3568} {"train_loss": -6.771811485290527, "global_step": 149864, "epoch": 3568} {"train_loss": -6.8493428230285645, "global_step": 149865, "epoch": 3568} {"train_loss": -6.778342247009277, "global_step": 149866, "epoch": 3568} {"train_loss": -6.79034423828125, "global_step": 149867, "epoch": 3568} {"train_loss": -6.865819454193115, "global_step": 149868, "epoch": 3568} {"train_loss": -6.744191646575928, "global_step": 149869, "epoch": 3568} {"train_loss": -6.852219104766846, "global_step": 149870, "epoch": 3568} {"train_loss": -6.833914756774902, "global_step": 149871, "epoch": 3568} {"train_loss": -6.911766052246094, "global_step": 149872, "epoch": 3568} {"train_loss": -6.833188056945801, "global_step": 149873, "epoch": 3568} {"train_loss": -6.86810302734375, "global_step": 149874, "epoch": 3568} {"train_loss": -6.880059242248535, "global_step": 149875, "epoch": 3568} {"train_loss": -6.900656700134277, "global_step": 149876, "epoch": 3568} {"train_loss": -6.816567420959473, "global_step": 149877, "epoch": 3568} {"train_loss": -6.8441267013549805, "global_step": 149878, "epoch": 3568} {"train_loss": -6.929235458374023, "global_step": 149879, "epoch": 3568} {"train_loss": -6.730240821838379, "global_step": 149880, "epoch": 3568} {"train_loss": -6.800976753234863, "global_step": 149881, "epoch": 3568} {"train_loss": -6.880481719970703, "global_step": 149882, "epoch": 3568} {"train_loss": -6.799354553222656, "global_step": 149883, "epoch": 3568} {"train_loss": -6.901166915893555, "global_step": 149884, "epoch": 3568} {"train_loss": -6.777956008911133, "global_step": 149885, "epoch": 3568} {"train_loss": -6.923064231872559, "global_step": 149886, "epoch": 3568} {"train_loss": -6.712008476257324, "global_step": 149887, "epoch": 3568} {"train_loss": -6.878766059875488, "global_step": 149888, "epoch": 3568} {"train_loss": -6.879531383514404, "global_step": 149889, "epoch": 3568} {"train_loss": -6.83254337310791, "global_step": 149890, "epoch": 3568} {"train_loss": -6.87064790725708, "global_step": 149891, "epoch": 3568} {"train_loss": -6.842889785766602, "global_step": 149892, "epoch": 3568} {"train_loss": -6.798514366149902, "global_step": 149893, "epoch": 3568} {"train_loss": -6.784557342529297, "global_step": 149894, "epoch": 3568} {"train_loss": -6.781655311584473, "global_step": 149895, "epoch": 3568} {"train_loss": -6.922534942626953, "global_step": 149896, "epoch": 3568} {"train_loss": -6.820542812347412, "global_step": 149897, "epoch": 3568, "val_loss": 67969.96875} {"train_loss": -6.821469783782959, "global_step": 149898, "epoch": 3569} {"train_loss": -6.733280181884766, "global_step": 149899, "epoch": 3569} {"train_loss": -6.792492389678955, "global_step": 149900, "epoch": 3569} {"train_loss": -6.844334602355957, "global_step": 149901, "epoch": 3569} {"train_loss": -6.882425308227539, "global_step": 149902, "epoch": 3569} {"train_loss": -6.986328125, "global_step": 149903, "epoch": 3569} {"train_loss": -6.906928062438965, "global_step": 149904, "epoch": 3569} {"train_loss": -6.739252090454102, "global_step": 149905, "epoch": 3569} {"train_loss": -6.818809509277344, "global_step": 149906, "epoch": 3569} {"train_loss": -6.85440731048584, "global_step": 149907, "epoch": 3569} {"train_loss": -6.742791652679443, "global_step": 149908, "epoch": 3569} {"train_loss": -6.716153144836426, "global_step": 149909, "epoch": 3569} {"train_loss": -6.80535888671875, "global_step": 149910, "epoch": 3569} {"train_loss": -6.735803604125977, "global_step": 149911, "epoch": 3569} {"train_loss": -6.852395057678223, "global_step": 149912, "epoch": 3569} {"train_loss": -6.788710117340088, "global_step": 149913, "epoch": 3569} {"train_loss": -6.78013277053833, "global_step": 149914, "epoch": 3569} {"train_loss": -6.850166320800781, "global_step": 149915, "epoch": 3569} {"train_loss": -6.797755241394043, "global_step": 149916, "epoch": 3569} {"train_loss": -6.766576766967773, "global_step": 149917, "epoch": 3569} {"train_loss": -6.810354232788086, "global_step": 149918, "epoch": 3569} {"train_loss": -6.7952728271484375, "global_step": 149919, "epoch": 3569} {"train_loss": -6.777270793914795, "global_step": 149920, "epoch": 3569} {"train_loss": -6.913647651672363, "global_step": 149921, "epoch": 3569} {"train_loss": -6.817313194274902, "global_step": 149922, "epoch": 3569} {"train_loss": -6.947415828704834, "global_step": 149923, "epoch": 3569} {"train_loss": -6.820446014404297, "global_step": 149924, "epoch": 3569} {"train_loss": -6.853659152984619, "global_step": 149925, "epoch": 3569} {"train_loss": -6.804006099700928, "global_step": 149926, "epoch": 3569} {"train_loss": -6.800728797912598, "global_step": 149927, "epoch": 3569} {"train_loss": -6.903009414672852, "global_step": 149928, "epoch": 3569} {"train_loss": -6.709774494171143, "global_step": 149929, "epoch": 3569} {"train_loss": -6.770046234130859, "global_step": 149930, "epoch": 3569} {"train_loss": -6.909363269805908, "global_step": 149931, "epoch": 3569} {"train_loss": -6.856157302856445, "global_step": 149932, "epoch": 3569} {"train_loss": -6.962800979614258, "global_step": 149933, "epoch": 3569} {"train_loss": -6.909564018249512, "global_step": 149934, "epoch": 3569} {"train_loss": -6.927703380584717, "global_step": 149935, "epoch": 3569} {"train_loss": -6.884368896484375, "global_step": 149936, "epoch": 3569} {"train_loss": -6.73777437210083, "global_step": 149937, "epoch": 3569} {"train_loss": -6.88760232925415, "global_step": 149938, "epoch": 3569} {"train_loss": -6.827277251652309, "global_step": 149939, "epoch": 3569, "val_loss": 67732.21875} {"train_loss": -6.889537811279297, "global_step": 149940, "epoch": 3570} {"train_loss": -6.827020168304443, "global_step": 149941, "epoch": 3570} {"train_loss": -6.844906806945801, "global_step": 149942, "epoch": 3570} {"train_loss": -6.858391761779785, "global_step": 149943, "epoch": 3570} {"train_loss": -6.831229209899902, "global_step": 149944, "epoch": 3570} {"train_loss": -6.901352882385254, "global_step": 149945, "epoch": 3570} {"train_loss": -6.920783996582031, "global_step": 149946, "epoch": 3570} {"train_loss": -6.794003486633301, "global_step": 149947, "epoch": 3570} {"train_loss": -6.832279205322266, "global_step": 149948, "epoch": 3570} {"train_loss": -6.720245361328125, "global_step": 149949, "epoch": 3570} {"train_loss": -6.804518699645996, "global_step": 149950, "epoch": 3570} {"train_loss": -6.847417831420898, "global_step": 149951, "epoch": 3570} {"train_loss": -6.863019943237305, "global_step": 149952, "epoch": 3570} {"train_loss": -6.835206985473633, "global_step": 149953, "epoch": 3570} {"train_loss": -6.929544448852539, "global_step": 149954, "epoch": 3570} {"train_loss": -6.841394424438477, "global_step": 149955, "epoch": 3570} {"train_loss": -6.881031036376953, "global_step": 149956, "epoch": 3570} {"train_loss": -6.943137168884277, "global_step": 149957, "epoch": 3570} {"train_loss": -6.824315547943115, "global_step": 149958, "epoch": 3570} {"train_loss": -6.997950553894043, "global_step": 149959, "epoch": 3570} {"train_loss": -6.840737342834473, "global_step": 149960, "epoch": 3570} {"train_loss": -6.731585502624512, "global_step": 149961, "epoch": 3570} {"train_loss": -6.851334095001221, "global_step": 149962, "epoch": 3570} {"train_loss": -6.778533935546875, "global_step": 149963, "epoch": 3570} {"train_loss": -6.885402679443359, "global_step": 149964, "epoch": 3570} {"train_loss": -6.906699180603027, "global_step": 149965, "epoch": 3570} {"train_loss": -6.864532947540283, "global_step": 149966, "epoch": 3570} {"train_loss": -6.961350917816162, "global_step": 149967, "epoch": 3570} {"train_loss": -6.907588958740234, "global_step": 149968, "epoch": 3570} {"train_loss": -6.835240840911865, "global_step": 149969, "epoch": 3570} {"train_loss": -6.812032222747803, "global_step": 149970, "epoch": 3570} {"train_loss": -6.807647705078125, "global_step": 149971, "epoch": 3570} {"train_loss": -6.837090492248535, "global_step": 149972, "epoch": 3570} {"train_loss": -6.87740421295166, "global_step": 149973, "epoch": 3570} {"train_loss": -6.983177185058594, "global_step": 149974, "epoch": 3570} {"train_loss": -6.864197731018066, "global_step": 149975, "epoch": 3570} {"train_loss": -6.768797397613525, "global_step": 149976, "epoch": 3570} {"train_loss": -6.847353458404541, "global_step": 149977, "epoch": 3570} {"train_loss": -6.765714645385742, "global_step": 149978, "epoch": 3570} {"train_loss": -6.8536248207092285, "global_step": 149979, "epoch": 3570} {"train_loss": -6.841568470001221, "global_step": 149980, "epoch": 3570} {"train_loss": -6.852001042593093, "global_step": 149981, "epoch": 3570, "val_loss": 68018.4140625} {"train_loss": -6.95041561126709, "global_step": 149982, "epoch": 3571} {"train_loss": -6.865511894226074, "global_step": 149983, "epoch": 3571} {"train_loss": -6.812685012817383, "global_step": 149984, "epoch": 3571} {"train_loss": -6.837538719177246, "global_step": 149985, "epoch": 3571} {"train_loss": -6.8083176612854, "global_step": 149986, "epoch": 3571} {"train_loss": -6.944512367248535, "global_step": 149987, "epoch": 3571} {"train_loss": -6.9115424156188965, "global_step": 149988, "epoch": 3571} {"train_loss": -6.846782207489014, "global_step": 149989, "epoch": 3571} {"train_loss": -6.823103427886963, "global_step": 149990, "epoch": 3571} {"train_loss": -6.74885892868042, "global_step": 149991, "epoch": 3571} {"train_loss": -6.919805526733398, "global_step": 149992, "epoch": 3571} {"train_loss": -6.984346866607666, "global_step": 149993, "epoch": 3571} {"train_loss": -6.921994209289551, "global_step": 149994, "epoch": 3571} {"train_loss": -6.880119323730469, "global_step": 149995, "epoch": 3571} {"train_loss": -6.912813186645508, "global_step": 149996, "epoch": 3571} {"train_loss": -6.848759651184082, "global_step": 149997, "epoch": 3571} {"train_loss": -6.724847316741943, "global_step": 149998, "epoch": 3571} {"train_loss": -6.7259840965271, "global_step": 149999, "epoch": 3571} {"train_loss": -6.7062506675720215, "global_step": 150000, "epoch": 3571} {"train_loss": -6.733487606048584, "global_step": 150001, "epoch": 3571} {"train_loss": -6.801703453063965, "global_step": 150002, "epoch": 3571} {"train_loss": -6.784027099609375, "global_step": 150003, "epoch": 3571} {"train_loss": -6.788890361785889, "global_step": 150004, "epoch": 3571} {"train_loss": -6.755635738372803, "global_step": 150005, "epoch": 3571} {"train_loss": -6.813483238220215, "global_step": 150006, "epoch": 3571} {"train_loss": -6.861234188079834, "global_step": 150007, "epoch": 3571} {"train_loss": -6.8152337074279785, "global_step": 150008, "epoch": 3571} {"train_loss": -6.811553955078125, "global_step": 150009, "epoch": 3571} {"train_loss": -6.8852314949035645, "global_step": 150010, "epoch": 3571} {"train_loss": -6.854179382324219, "global_step": 150011, "epoch": 3571} {"train_loss": -6.837067127227783, "global_step": 150012, "epoch": 3571} {"train_loss": -6.876665115356445, "global_step": 150013, "epoch": 3571} {"train_loss": -6.856673240661621, "global_step": 150014, "epoch": 3571} {"train_loss": -6.922245502471924, "global_step": 150015, "epoch": 3571} {"train_loss": -6.79437780380249, "global_step": 150016, "epoch": 3571} {"train_loss": -6.889601707458496, "global_step": 150017, "epoch": 3571} {"train_loss": -6.854154586791992, "global_step": 150018, "epoch": 3571} {"train_loss": -6.889896392822266, "global_step": 150019, "epoch": 3571} {"train_loss": -6.788857460021973, "global_step": 150020, "epoch": 3571} {"train_loss": -6.6259026527404785, "global_step": 150021, "epoch": 3571} {"train_loss": -6.779783248901367, "global_step": 150022, "epoch": 3571} {"train_loss": -6.829041015534174, "global_step": 150023, "epoch": 3571, "val_loss": 68047.890625} {"train_loss": -6.691835403442383, "global_step": 150024, "epoch": 3572} {"train_loss": -6.910885810852051, "global_step": 150025, "epoch": 3572} {"train_loss": -6.627458572387695, "global_step": 150026, "epoch": 3572} {"train_loss": -6.7189435958862305, "global_step": 150027, "epoch": 3572} {"train_loss": -6.882826805114746, "global_step": 150028, "epoch": 3572} {"train_loss": -6.700276851654053, "global_step": 150029, "epoch": 3572} {"train_loss": -6.895524024963379, "global_step": 150030, "epoch": 3572} {"train_loss": -6.891817092895508, "global_step": 150031, "epoch": 3572} {"train_loss": -6.783083915710449, "global_step": 150032, "epoch": 3572} {"train_loss": -6.832484245300293, "global_step": 150033, "epoch": 3572} {"train_loss": -6.7021660804748535, "global_step": 150034, "epoch": 3572} {"train_loss": -6.718459606170654, "global_step": 150035, "epoch": 3572} {"train_loss": -6.868536949157715, "global_step": 150036, "epoch": 3572} {"train_loss": -6.769062042236328, "global_step": 150037, "epoch": 3572} {"train_loss": -6.842398166656494, "global_step": 150038, "epoch": 3572} {"train_loss": -6.940796852111816, "global_step": 150039, "epoch": 3572} {"train_loss": -6.757772922515869, "global_step": 150040, "epoch": 3572} {"train_loss": -6.920564651489258, "global_step": 150041, "epoch": 3572} {"train_loss": -6.685730934143066, "global_step": 150042, "epoch": 3572} {"train_loss": -6.62109375, "global_step": 150043, "epoch": 3572} {"train_loss": -6.919338226318359, "global_step": 150044, "epoch": 3572} {"train_loss": -6.61965799331665, "global_step": 150045, "epoch": 3572} {"train_loss": -6.776413917541504, "global_step": 150046, "epoch": 3572} {"train_loss": -6.781283378601074, "global_step": 150047, "epoch": 3572} {"train_loss": -6.748608589172363, "global_step": 150048, "epoch": 3572} {"train_loss": -6.846577167510986, "global_step": 150049, "epoch": 3572} {"train_loss": -6.630529403686523, "global_step": 150050, "epoch": 3572} {"train_loss": -7.0198259353637695, "global_step": 150051, "epoch": 3572} {"train_loss": -6.715093612670898, "global_step": 150052, "epoch": 3572} {"train_loss": -6.776092529296875, "global_step": 150053, "epoch": 3572} {"train_loss": -6.871513366699219, "global_step": 150054, "epoch": 3572} {"train_loss": -6.801566123962402, "global_step": 150055, "epoch": 3572} {"train_loss": -6.898926734924316, "global_step": 150056, "epoch": 3572} {"train_loss": -6.802048683166504, "global_step": 150057, "epoch": 3572} {"train_loss": -6.929353713989258, "global_step": 150058, "epoch": 3572} {"train_loss": -6.74964714050293, "global_step": 150059, "epoch": 3572} {"train_loss": -6.7879180908203125, "global_step": 150060, "epoch": 3572} {"train_loss": -6.822026252746582, "global_step": 150061, "epoch": 3572} {"train_loss": -6.879063129425049, "global_step": 150062, "epoch": 3572} {"train_loss": -6.8282670974731445, "global_step": 150063, "epoch": 3572} {"train_loss": -6.869873046875, "global_step": 150064, "epoch": 3572} {"train_loss": -6.802511306036086, "global_step": 150065, "epoch": 3572, "val_loss": 67798.7890625} {"train_loss": -6.918527603149414, "global_step": 150066, "epoch": 3573} {"train_loss": -6.9114813804626465, "global_step": 150067, "epoch": 3573} {"train_loss": -6.886750221252441, "global_step": 150068, "epoch": 3573} {"train_loss": -6.908155918121338, "global_step": 150069, "epoch": 3573} {"train_loss": -6.691892623901367, "global_step": 150070, "epoch": 3573} {"train_loss": -6.722618103027344, "global_step": 150071, "epoch": 3573} {"train_loss": -6.784671783447266, "global_step": 150072, "epoch": 3573} {"train_loss": -6.939476013183594, "global_step": 150073, "epoch": 3573} {"train_loss": -6.809714317321777, "global_step": 150074, "epoch": 3573} {"train_loss": -6.671521186828613, "global_step": 150075, "epoch": 3573} {"train_loss": -6.704797744750977, "global_step": 150076, "epoch": 3573} {"train_loss": -6.896444797515869, "global_step": 150077, "epoch": 3573} {"train_loss": -6.682003974914551, "global_step": 150078, "epoch": 3573} {"train_loss": -6.74704647064209, "global_step": 150079, "epoch": 3573} {"train_loss": -6.809004306793213, "global_step": 150080, "epoch": 3573} {"train_loss": -6.822773456573486, "global_step": 150081, "epoch": 3573} {"train_loss": -6.86281681060791, "global_step": 150082, "epoch": 3573} {"train_loss": -6.849615573883057, "global_step": 150083, "epoch": 3573} {"train_loss": -6.891658782958984, "global_step": 150084, "epoch": 3573} {"train_loss": -6.791810035705566, "global_step": 150085, "epoch": 3573} {"train_loss": -6.793680191040039, "global_step": 150086, "epoch": 3573} {"train_loss": -6.84199333190918, "global_step": 150087, "epoch": 3573} {"train_loss": -6.836278915405273, "global_step": 150088, "epoch": 3573} {"train_loss": -6.855960845947266, "global_step": 150089, "epoch": 3573} {"train_loss": -6.8206787109375, "global_step": 150090, "epoch": 3573} {"train_loss": -6.763361930847168, "global_step": 150091, "epoch": 3573} {"train_loss": -6.878871917724609, "global_step": 150092, "epoch": 3573} {"train_loss": -6.855564117431641, "global_step": 150093, "epoch": 3573} {"train_loss": -6.866681098937988, "global_step": 150094, "epoch": 3573} {"train_loss": -6.839277267456055, "global_step": 150095, "epoch": 3573} {"train_loss": -6.974397659301758, "global_step": 150096, "epoch": 3573} {"train_loss": -6.712913513183594, "global_step": 150097, "epoch": 3573} {"train_loss": -6.916203498840332, "global_step": 150098, "epoch": 3573} {"train_loss": -6.807446002960205, "global_step": 150099, "epoch": 3573} {"train_loss": -6.896653175354004, "global_step": 150100, "epoch": 3573} {"train_loss": -6.777050971984863, "global_step": 150101, "epoch": 3573} {"train_loss": -6.980738639831543, "global_step": 150102, "epoch": 3573} {"train_loss": -6.892806529998779, "global_step": 150103, "epoch": 3573} {"train_loss": -6.891150951385498, "global_step": 150104, "epoch": 3573} {"train_loss": -6.800024032592773, "global_step": 150105, "epoch": 3573} {"train_loss": -6.7882914543151855, "global_step": 150106, "epoch": 3573} {"train_loss": -6.830643483570644, "global_step": 150107, "epoch": 3573, "val_loss": 67995.71875} {"train_loss": -6.75982666015625, "global_step": 150108, "epoch": 3574} {"train_loss": -6.895961761474609, "global_step": 150109, "epoch": 3574} {"train_loss": -6.786667823791504, "global_step": 150110, "epoch": 3574} {"train_loss": -6.808218955993652, "global_step": 150111, "epoch": 3574} {"train_loss": -6.812681674957275, "global_step": 150112, "epoch": 3574} {"train_loss": -6.609827041625977, "global_step": 150113, "epoch": 3574} {"train_loss": -6.81150484085083, "global_step": 150114, "epoch": 3574} {"train_loss": -6.715046405792236, "global_step": 150115, "epoch": 3574} {"train_loss": -6.66598653793335, "global_step": 150116, "epoch": 3574} {"train_loss": -6.769192218780518, "global_step": 150117, "epoch": 3574} {"train_loss": -6.798114776611328, "global_step": 150118, "epoch": 3574} {"train_loss": -6.775618076324463, "global_step": 150119, "epoch": 3574} {"train_loss": -6.867061614990234, "global_step": 150120, "epoch": 3574} {"train_loss": -6.672979354858398, "global_step": 150121, "epoch": 3574} {"train_loss": -6.716784477233887, "global_step": 150122, "epoch": 3574} {"train_loss": -6.72182559967041, "global_step": 150123, "epoch": 3574} {"train_loss": -6.681410312652588, "global_step": 150124, "epoch": 3574} {"train_loss": -6.774003028869629, "global_step": 150125, "epoch": 3574} {"train_loss": -6.802805423736572, "global_step": 150126, "epoch": 3574} {"train_loss": -6.721172332763672, "global_step": 150127, "epoch": 3574} {"train_loss": -6.794193744659424, "global_step": 150128, "epoch": 3574} {"train_loss": -6.9464850425720215, "global_step": 150129, "epoch": 3574} {"train_loss": -6.904440879821777, "global_step": 150130, "epoch": 3574} {"train_loss": -6.83588981628418, "global_step": 150131, "epoch": 3574} {"train_loss": -6.846771240234375, "global_step": 150132, "epoch": 3574} {"train_loss": -6.820239067077637, "global_step": 150133, "epoch": 3574} {"train_loss": -6.777912139892578, "global_step": 150134, "epoch": 3574} {"train_loss": -6.866813659667969, "global_step": 150135, "epoch": 3574} {"train_loss": -6.897809028625488, "global_step": 150136, "epoch": 3574} {"train_loss": -6.837240695953369, "global_step": 150137, "epoch": 3574} {"train_loss": -6.78066349029541, "global_step": 150138, "epoch": 3574} {"train_loss": -6.825128555297852, "global_step": 150139, "epoch": 3574} {"train_loss": -6.963351726531982, "global_step": 150140, "epoch": 3574} {"train_loss": -6.891831874847412, "global_step": 150141, "epoch": 3574} {"train_loss": -6.800899505615234, "global_step": 150142, "epoch": 3574} {"train_loss": -6.894692420959473, "global_step": 150143, "epoch": 3574} {"train_loss": -6.752562522888184, "global_step": 150144, "epoch": 3574} {"train_loss": -6.8661699295043945, "global_step": 150145, "epoch": 3574} {"train_loss": -6.958338737487793, "global_step": 150146, "epoch": 3574} {"train_loss": -6.913641929626465, "global_step": 150147, "epoch": 3574} {"train_loss": -6.877717971801758, "global_step": 150148, "epoch": 3574} {"train_loss": -6.809627487545922, "global_step": 150149, "epoch": 3574, "val_loss": 68099.765625} {"train_loss": -6.879138946533203, "global_step": 150150, "epoch": 3575} {"train_loss": -6.922425746917725, "global_step": 150151, "epoch": 3575} {"train_loss": -6.918264865875244, "global_step": 150152, "epoch": 3575} {"train_loss": -6.77874755859375, "global_step": 150153, "epoch": 3575} {"train_loss": -6.955527305603027, "global_step": 150154, "epoch": 3575} {"train_loss": -6.731718063354492, "global_step": 150155, "epoch": 3575} {"train_loss": -6.813819408416748, "global_step": 150156, "epoch": 3575} {"train_loss": -6.851526737213135, "global_step": 150157, "epoch": 3575} {"train_loss": -6.888739585876465, "global_step": 150158, "epoch": 3575} {"train_loss": -6.811890125274658, "global_step": 150159, "epoch": 3575} {"train_loss": -6.818937301635742, "global_step": 150160, "epoch": 3575} {"train_loss": -6.869351387023926, "global_step": 150161, "epoch": 3575} {"train_loss": -6.99983549118042, "global_step": 150162, "epoch": 3575} {"train_loss": -6.9075775146484375, "global_step": 150163, "epoch": 3575} {"train_loss": -6.884393215179443, "global_step": 150164, "epoch": 3575} {"train_loss": -6.902900218963623, "global_step": 150165, "epoch": 3575} {"train_loss": -6.929013252258301, "global_step": 150166, "epoch": 3575} {"train_loss": -6.82392692565918, "global_step": 150167, "epoch": 3575} {"train_loss": -6.848085880279541, "global_step": 150168, "epoch": 3575} {"train_loss": -6.936192512512207, "global_step": 150169, "epoch": 3575} {"train_loss": -6.969393253326416, "global_step": 150170, "epoch": 3575} {"train_loss": -6.8608551025390625, "global_step": 150171, "epoch": 3575} {"train_loss": -6.933516502380371, "global_step": 150172, "epoch": 3575} {"train_loss": -6.8849382400512695, "global_step": 150173, "epoch": 3575} {"train_loss": -6.75692081451416, "global_step": 150174, "epoch": 3575} {"train_loss": -6.877498626708984, "global_step": 150175, "epoch": 3575} {"train_loss": -6.910867691040039, "global_step": 150176, "epoch": 3575} {"train_loss": -6.785677909851074, "global_step": 150177, "epoch": 3575} {"train_loss": -6.938992500305176, "global_step": 150178, "epoch": 3575} {"train_loss": -6.913693904876709, "global_step": 150179, "epoch": 3575} {"train_loss": -6.694980621337891, "global_step": 150180, "epoch": 3575} {"train_loss": -6.732544898986816, "global_step": 150181, "epoch": 3575} {"train_loss": -6.858419418334961, "global_step": 150182, "epoch": 3575} {"train_loss": -6.770569801330566, "global_step": 150183, "epoch": 3575} {"train_loss": -6.746057033538818, "global_step": 150184, "epoch": 3575} {"train_loss": -6.781864166259766, "global_step": 150185, "epoch": 3575} {"train_loss": -6.845316410064697, "global_step": 150186, "epoch": 3575} {"train_loss": -6.784119606018066, "global_step": 150187, "epoch": 3575} {"train_loss": -6.789865970611572, "global_step": 150188, "epoch": 3575} {"train_loss": -6.7924652099609375, "global_step": 150189, "epoch": 3575} {"train_loss": -6.771416187286377, "global_step": 150190, "epoch": 3575} {"train_loss": -6.850487595512753, "global_step": 150191, "epoch": 3575, "val_loss": 68053.5625} {"train_loss": -6.778850555419922, "global_step": 150192, "epoch": 3576} {"train_loss": -6.812189102172852, "global_step": 150193, "epoch": 3576} {"train_loss": -6.9242448806762695, "global_step": 150194, "epoch": 3576} {"train_loss": -6.782966613769531, "global_step": 150195, "epoch": 3576} {"train_loss": -6.944303035736084, "global_step": 150196, "epoch": 3576} {"train_loss": -6.856195449829102, "global_step": 150197, "epoch": 3576} {"train_loss": -6.935800075531006, "global_step": 150198, "epoch": 3576} {"train_loss": -6.796525955200195, "global_step": 150199, "epoch": 3576} {"train_loss": -6.73384428024292, "global_step": 150200, "epoch": 3576} {"train_loss": -6.909292221069336, "global_step": 150201, "epoch": 3576} {"train_loss": -6.766600608825684, "global_step": 150202, "epoch": 3576} {"train_loss": -6.960086345672607, "global_step": 150203, "epoch": 3576} {"train_loss": -6.858331680297852, "global_step": 150204, "epoch": 3576} {"train_loss": -6.832737445831299, "global_step": 150205, "epoch": 3576} {"train_loss": -6.924476146697998, "global_step": 150206, "epoch": 3576} {"train_loss": -6.801104545593262, "global_step": 150207, "epoch": 3576} {"train_loss": -6.830529689788818, "global_step": 150208, "epoch": 3576} {"train_loss": -6.76818323135376, "global_step": 150209, "epoch": 3576} {"train_loss": -6.841081619262695, "global_step": 150210, "epoch": 3576} {"train_loss": -6.8393874168396, "global_step": 150211, "epoch": 3576} {"train_loss": -6.810070991516113, "global_step": 150212, "epoch": 3576} {"train_loss": -6.799419403076172, "global_step": 150213, "epoch": 3576} {"train_loss": -6.821692943572998, "global_step": 150214, "epoch": 3576} {"train_loss": -6.710394382476807, "global_step": 150215, "epoch": 3576} {"train_loss": -6.761717796325684, "global_step": 150216, "epoch": 3576} {"train_loss": -6.802882194519043, "global_step": 150217, "epoch": 3576} {"train_loss": -6.819887638092041, "global_step": 150218, "epoch": 3576} {"train_loss": -6.889286994934082, "global_step": 150219, "epoch": 3576} {"train_loss": -6.7993927001953125, "global_step": 150220, "epoch": 3576} {"train_loss": -6.810799598693848, "global_step": 150221, "epoch": 3576} {"train_loss": -6.8191304206848145, "global_step": 150222, "epoch": 3576} {"train_loss": -6.774738311767578, "global_step": 150223, "epoch": 3576} {"train_loss": -6.875924110412598, "global_step": 150224, "epoch": 3576} {"train_loss": -6.805007457733154, "global_step": 150225, "epoch": 3576} {"train_loss": -6.913888931274414, "global_step": 150226, "epoch": 3576} {"train_loss": -6.705223560333252, "global_step": 150227, "epoch": 3576} {"train_loss": -6.832879543304443, "global_step": 150228, "epoch": 3576} {"train_loss": -6.858058452606201, "global_step": 150229, "epoch": 3576} {"train_loss": -6.840937614440918, "global_step": 150230, "epoch": 3576} {"train_loss": -6.779266834259033, "global_step": 150231, "epoch": 3576} {"train_loss": -6.866832733154297, "global_step": 150232, "epoch": 3576} {"train_loss": -6.828359138397944, "global_step": 150233, "epoch": 3576, "val_loss": 67955.7734375} {"train_loss": -6.862000942230225, "global_step": 150234, "epoch": 3577} {"train_loss": -6.954285144805908, "global_step": 150235, "epoch": 3577} {"train_loss": -6.93343448638916, "global_step": 150236, "epoch": 3577} {"train_loss": -6.936349868774414, "global_step": 150237, "epoch": 3577} {"train_loss": -6.926043510437012, "global_step": 150238, "epoch": 3577} {"train_loss": -6.916192054748535, "global_step": 150239, "epoch": 3577} {"train_loss": -6.8699140548706055, "global_step": 150240, "epoch": 3577} {"train_loss": -6.771090030670166, "global_step": 150241, "epoch": 3577} {"train_loss": -6.887138843536377, "global_step": 150242, "epoch": 3577} {"train_loss": -6.828924179077148, "global_step": 150243, "epoch": 3577} {"train_loss": -6.85429573059082, "global_step": 150244, "epoch": 3577} {"train_loss": -7.052512168884277, "global_step": 150245, "epoch": 3577} {"train_loss": -6.809177398681641, "global_step": 150246, "epoch": 3577} {"train_loss": -6.868668556213379, "global_step": 150247, "epoch": 3577} {"train_loss": -6.834821701049805, "global_step": 150248, "epoch": 3577} {"train_loss": -6.895434379577637, "global_step": 150249, "epoch": 3577} {"train_loss": -6.8378729820251465, "global_step": 150250, "epoch": 3577} {"train_loss": -6.892609119415283, "global_step": 150251, "epoch": 3577} {"train_loss": -6.919788360595703, "global_step": 150252, "epoch": 3577} {"train_loss": -6.766026496887207, "global_step": 150253, "epoch": 3577} {"train_loss": -6.885135650634766, "global_step": 150254, "epoch": 3577} {"train_loss": -6.834630012512207, "global_step": 150255, "epoch": 3577} {"train_loss": -6.7772979736328125, "global_step": 150256, "epoch": 3577} {"train_loss": -6.884002685546875, "global_step": 150257, "epoch": 3577} {"train_loss": -6.670467376708984, "global_step": 150258, "epoch": 3577} {"train_loss": -6.761975288391113, "global_step": 150259, "epoch": 3577} {"train_loss": -6.8395094871521, "global_step": 150260, "epoch": 3577} {"train_loss": -6.579840660095215, "global_step": 150261, "epoch": 3577} {"train_loss": -6.856327056884766, "global_step": 150262, "epoch": 3577} {"train_loss": -6.738354682922363, "global_step": 150263, "epoch": 3577} {"train_loss": -6.856199264526367, "global_step": 150264, "epoch": 3577} {"train_loss": -6.7899556159973145, "global_step": 150265, "epoch": 3577} {"train_loss": -6.748497486114502, "global_step": 150266, "epoch": 3577} {"train_loss": -6.7485032081604, "global_step": 150267, "epoch": 3577} {"train_loss": -6.6067376136779785, "global_step": 150268, "epoch": 3577} {"train_loss": -6.890240669250488, "global_step": 150269, "epoch": 3577} {"train_loss": -6.8007612228393555, "global_step": 150270, "epoch": 3577} {"train_loss": -6.8070478439331055, "global_step": 150271, "epoch": 3577} {"train_loss": -6.875612258911133, "global_step": 150272, "epoch": 3577} {"train_loss": -6.780681610107422, "global_step": 150273, "epoch": 3577} {"train_loss": -6.9000654220581055, "global_step": 150274, "epoch": 3577} {"train_loss": -6.835107553572882, "global_step": 150275, "epoch": 3577, "val_loss": 67972.3984375} {"train_loss": -6.911216735839844, "global_step": 150276, "epoch": 3578} {"train_loss": -6.723204612731934, "global_step": 150277, "epoch": 3578} {"train_loss": -6.728045463562012, "global_step": 150278, "epoch": 3578} {"train_loss": -6.846640586853027, "global_step": 150279, "epoch": 3578} {"train_loss": -6.714821815490723, "global_step": 150280, "epoch": 3578} {"train_loss": -6.775518417358398, "global_step": 150281, "epoch": 3578} {"train_loss": -6.918440341949463, "global_step": 150282, "epoch": 3578} {"train_loss": -6.804443359375, "global_step": 150283, "epoch": 3578} {"train_loss": -6.8449201583862305, "global_step": 150284, "epoch": 3578} {"train_loss": -6.817130088806152, "global_step": 150285, "epoch": 3578} {"train_loss": -6.843319892883301, "global_step": 150286, "epoch": 3578} {"train_loss": -6.862443447113037, "global_step": 150287, "epoch": 3578} {"train_loss": -6.784359455108643, "global_step": 150288, "epoch": 3578} {"train_loss": -6.842493057250977, "global_step": 150289, "epoch": 3578} {"train_loss": -6.850989818572998, "global_step": 150290, "epoch": 3578} {"train_loss": -6.872304439544678, "global_step": 150291, "epoch": 3578} {"train_loss": -6.962250709533691, "global_step": 150292, "epoch": 3578} {"train_loss": -6.928108215332031, "global_step": 150293, "epoch": 3578} {"train_loss": -6.8460283279418945, "global_step": 150294, "epoch": 3578} {"train_loss": -6.774355888366699, "global_step": 150295, "epoch": 3578} {"train_loss": -7.04750919342041, "global_step": 150296, "epoch": 3578} {"train_loss": -6.8844380378723145, "global_step": 150297, "epoch": 3578} {"train_loss": -6.838465690612793, "global_step": 150298, "epoch": 3578} {"train_loss": -6.971190452575684, "global_step": 150299, "epoch": 3578} {"train_loss": -6.851820945739746, "global_step": 150300, "epoch": 3578} {"train_loss": -6.758991718292236, "global_step": 150301, "epoch": 3578} {"train_loss": -6.916861534118652, "global_step": 150302, "epoch": 3578} {"train_loss": -6.946893215179443, "global_step": 150303, "epoch": 3578} {"train_loss": -6.838829517364502, "global_step": 150304, "epoch": 3578} {"train_loss": -6.941859245300293, "global_step": 150305, "epoch": 3578} {"train_loss": -6.928665637969971, "global_step": 150306, "epoch": 3578} {"train_loss": -6.9249725341796875, "global_step": 150307, "epoch": 3578} {"train_loss": -6.927179336547852, "global_step": 150308, "epoch": 3578} {"train_loss": -6.942084312438965, "global_step": 150309, "epoch": 3578} {"train_loss": -6.816761016845703, "global_step": 150310, "epoch": 3578} {"train_loss": -6.879706382751465, "global_step": 150311, "epoch": 3578} {"train_loss": -6.965273380279541, "global_step": 150312, "epoch": 3578} {"train_loss": -6.795077323913574, "global_step": 150313, "epoch": 3578} {"train_loss": -6.877622604370117, "global_step": 150314, "epoch": 3578} {"train_loss": -6.914579391479492, "global_step": 150315, "epoch": 3578} {"train_loss": -6.796474456787109, "global_step": 150316, "epoch": 3578} {"train_loss": -6.8629475094023205, "global_step": 150317, "epoch": 3578, "val_loss": 67672.46875} {"train_loss": -6.901180267333984, "global_step": 150318, "epoch": 3579} {"train_loss": -7.0457940101623535, "global_step": 150319, "epoch": 3579} {"train_loss": -7.075733661651611, "global_step": 150320, "epoch": 3579} {"train_loss": -6.804083347320557, "global_step": 150321, "epoch": 3579} {"train_loss": -6.951858997344971, "global_step": 150322, "epoch": 3579} {"train_loss": -6.990447044372559, "global_step": 150323, "epoch": 3579} {"train_loss": -6.865236759185791, "global_step": 150324, "epoch": 3579} {"train_loss": -6.934925079345703, "global_step": 150325, "epoch": 3579} {"train_loss": -6.801436424255371, "global_step": 150326, "epoch": 3579} {"train_loss": -6.921961307525635, "global_step": 150327, "epoch": 3579} {"train_loss": -6.96101188659668, "global_step": 150328, "epoch": 3579} {"train_loss": -6.838092803955078, "global_step": 150329, "epoch": 3579} {"train_loss": -6.959934234619141, "global_step": 150330, "epoch": 3579} {"train_loss": -6.863609313964844, "global_step": 150331, "epoch": 3579} {"train_loss": -6.932600021362305, "global_step": 150332, "epoch": 3579} {"train_loss": -6.847281455993652, "global_step": 150333, "epoch": 3579} {"train_loss": -6.88543176651001, "global_step": 150334, "epoch": 3579} {"train_loss": -6.859503746032715, "global_step": 150335, "epoch": 3579} {"train_loss": -6.879728317260742, "global_step": 150336, "epoch": 3579} {"train_loss": -6.7967119216918945, "global_step": 150337, "epoch": 3579} {"train_loss": -6.785898208618164, "global_step": 150338, "epoch": 3579} {"train_loss": -6.840428352355957, "global_step": 150339, "epoch": 3579} {"train_loss": -6.85767936706543, "global_step": 150340, "epoch": 3579} {"train_loss": -6.874623775482178, "global_step": 150341, "epoch": 3579} {"train_loss": -6.6755523681640625, "global_step": 150342, "epoch": 3579} {"train_loss": -6.813304901123047, "global_step": 150343, "epoch": 3579} {"train_loss": -6.740070819854736, "global_step": 150344, "epoch": 3579} {"train_loss": -6.803988933563232, "global_step": 150345, "epoch": 3579} {"train_loss": -6.862183570861816, "global_step": 150346, "epoch": 3579} {"train_loss": -6.657607555389404, "global_step": 150347, "epoch": 3579} {"train_loss": -6.77195930480957, "global_step": 150348, "epoch": 3579} {"train_loss": -6.847314834594727, "global_step": 150349, "epoch": 3579} {"train_loss": -6.845785140991211, "global_step": 150350, "epoch": 3579} {"train_loss": -6.781925201416016, "global_step": 150351, "epoch": 3579} {"train_loss": -6.773366451263428, "global_step": 150352, "epoch": 3579} {"train_loss": -6.874558925628662, "global_step": 150353, "epoch": 3579} {"train_loss": -6.829089164733887, "global_step": 150354, "epoch": 3579} {"train_loss": -6.897500991821289, "global_step": 150355, "epoch": 3579} {"train_loss": -6.916359901428223, "global_step": 150356, "epoch": 3579} {"train_loss": -6.91218900680542, "global_step": 150357, "epoch": 3579} {"train_loss": -6.830798625946045, "global_step": 150358, "epoch": 3579} {"train_loss": -6.862235126041231, "global_step": 150359, "epoch": 3579, "val_loss": 67945.921875} {"train_loss": -6.88412618637085, "global_step": 150360, "epoch": 3580} {"train_loss": -6.920760154724121, "global_step": 150361, "epoch": 3580} {"train_loss": -6.838561058044434, "global_step": 150362, "epoch": 3580} {"train_loss": -6.7189483642578125, "global_step": 150363, "epoch": 3580} {"train_loss": -6.910983085632324, "global_step": 150364, "epoch": 3580} {"train_loss": -6.929132461547852, "global_step": 150365, "epoch": 3580} {"train_loss": -6.65696907043457, "global_step": 150366, "epoch": 3580} {"train_loss": -6.8866424560546875, "global_step": 150367, "epoch": 3580} {"train_loss": -6.746370792388916, "global_step": 150368, "epoch": 3580} {"train_loss": -6.7829203605651855, "global_step": 150369, "epoch": 3580} {"train_loss": -6.849094867706299, "global_step": 150370, "epoch": 3580} {"train_loss": -6.68547248840332, "global_step": 150371, "epoch": 3580} {"train_loss": -6.725630760192871, "global_step": 150372, "epoch": 3580} {"train_loss": -6.955822944641113, "global_step": 150373, "epoch": 3580} {"train_loss": -6.78404426574707, "global_step": 150374, "epoch": 3580} {"train_loss": -6.864311218261719, "global_step": 150375, "epoch": 3580} {"train_loss": -6.797198295593262, "global_step": 150376, "epoch": 3580} {"train_loss": -6.7904052734375, "global_step": 150377, "epoch": 3580} {"train_loss": -6.867302417755127, "global_step": 150378, "epoch": 3580} {"train_loss": -6.764009475708008, "global_step": 150379, "epoch": 3580} {"train_loss": -6.851287364959717, "global_step": 150380, "epoch": 3580} {"train_loss": -6.74866247177124, "global_step": 150381, "epoch": 3580} {"train_loss": -6.83369255065918, "global_step": 150382, "epoch": 3580} {"train_loss": -6.885928153991699, "global_step": 150383, "epoch": 3580} {"train_loss": -6.847581386566162, "global_step": 150384, "epoch": 3580} {"train_loss": -6.820021152496338, "global_step": 150385, "epoch": 3580} {"train_loss": -6.91567325592041, "global_step": 150386, "epoch": 3580} {"train_loss": -6.899382591247559, "global_step": 150387, "epoch": 3580} {"train_loss": -6.76991081237793, "global_step": 150388, "epoch": 3580} {"train_loss": -6.847051620483398, "global_step": 150389, "epoch": 3580} {"train_loss": -6.872692108154297, "global_step": 150390, "epoch": 3580} {"train_loss": -6.852240085601807, "global_step": 150391, "epoch": 3580} {"train_loss": -6.84981107711792, "global_step": 150392, "epoch": 3580} {"train_loss": -6.8046417236328125, "global_step": 150393, "epoch": 3580} {"train_loss": -6.686408519744873, "global_step": 150394, "epoch": 3580} {"train_loss": -6.9072771072387695, "global_step": 150395, "epoch": 3580} {"train_loss": -6.8657331466674805, "global_step": 150396, "epoch": 3580} {"train_loss": -6.830573558807373, "global_step": 150397, "epoch": 3580} {"train_loss": -6.845013618469238, "global_step": 150398, "epoch": 3580} {"train_loss": -6.896243095397949, "global_step": 150399, "epoch": 3580} {"train_loss": -6.941688060760498, "global_step": 150400, "epoch": 3580} {"train_loss": -6.83079389163426, "global_step": 150401, "epoch": 3580, "val_loss": 68055.96875} {"train_loss": -6.705982208251953, "global_step": 150402, "epoch": 3581} {"train_loss": -6.840979099273682, "global_step": 150403, "epoch": 3581} {"train_loss": -6.9143571853637695, "global_step": 150404, "epoch": 3581} {"train_loss": -6.940796852111816, "global_step": 150405, "epoch": 3581} {"train_loss": -6.911066055297852, "global_step": 150406, "epoch": 3581} {"train_loss": -6.955918312072754, "global_step": 150407, "epoch": 3581} {"train_loss": -6.853823184967041, "global_step": 150408, "epoch": 3581} {"train_loss": -6.897252082824707, "global_step": 150409, "epoch": 3581} {"train_loss": -6.806094169616699, "global_step": 150410, "epoch": 3581} {"train_loss": -6.971491813659668, "global_step": 150411, "epoch": 3581} {"train_loss": -6.8854265213012695, "global_step": 150412, "epoch": 3581} {"train_loss": -6.896656036376953, "global_step": 150413, "epoch": 3581} {"train_loss": -6.881961822509766, "global_step": 150414, "epoch": 3581} {"train_loss": -6.940759658813477, "global_step": 150415, "epoch": 3581} {"train_loss": -6.904126167297363, "global_step": 150416, "epoch": 3581} {"train_loss": -6.84567403793335, "global_step": 150417, "epoch": 3581} {"train_loss": -6.913841247558594, "global_step": 150418, "epoch": 3581} {"train_loss": -6.917996883392334, "global_step": 150419, "epoch": 3581} {"train_loss": -6.845335006713867, "global_step": 150420, "epoch": 3581} {"train_loss": -6.859459400177002, "global_step": 150421, "epoch": 3581} {"train_loss": -6.913362503051758, "global_step": 150422, "epoch": 3581} {"train_loss": -6.922187805175781, "global_step": 150423, "epoch": 3581} {"train_loss": -6.979802131652832, "global_step": 150424, "epoch": 3581} {"train_loss": -6.897668361663818, "global_step": 150425, "epoch": 3581} {"train_loss": -6.870741844177246, "global_step": 150426, "epoch": 3581} {"train_loss": -6.894522190093994, "global_step": 150427, "epoch": 3581} {"train_loss": -6.984860420227051, "global_step": 150428, "epoch": 3581} {"train_loss": -6.727720260620117, "global_step": 150429, "epoch": 3581} {"train_loss": -6.878442287445068, "global_step": 150430, "epoch": 3581} {"train_loss": -6.791710376739502, "global_step": 150431, "epoch": 3581} {"train_loss": -6.821403503417969, "global_step": 150432, "epoch": 3581} {"train_loss": -6.840524673461914, "global_step": 150433, "epoch": 3581} {"train_loss": -6.9261369705200195, "global_step": 150434, "epoch": 3581} {"train_loss": -6.814815044403076, "global_step": 150435, "epoch": 3581} {"train_loss": -6.709208011627197, "global_step": 150436, "epoch": 3581} {"train_loss": -6.827262878417969, "global_step": 150437, "epoch": 3581} {"train_loss": -6.862645149230957, "global_step": 150438, "epoch": 3581} {"train_loss": -6.818079948425293, "global_step": 150439, "epoch": 3581} {"train_loss": -6.834516525268555, "global_step": 150440, "epoch": 3581} {"train_loss": -6.878089427947998, "global_step": 150441, "epoch": 3581} {"train_loss": -6.796751022338867, "global_step": 150442, "epoch": 3581} {"train_loss": -6.871175130208333, "global_step": 150443, "epoch": 3581, "val_loss": 67827.625} {"train_loss": -6.895379066467285, "global_step": 150444, "epoch": 3582} {"train_loss": -6.809250354766846, "global_step": 150445, "epoch": 3582} {"train_loss": -6.813509464263916, "global_step": 150446, "epoch": 3582} {"train_loss": -6.785469055175781, "global_step": 150447, "epoch": 3582} {"train_loss": -6.917047500610352, "global_step": 150448, "epoch": 3582} {"train_loss": -6.825469493865967, "global_step": 150449, "epoch": 3582} {"train_loss": -6.841241359710693, "global_step": 150450, "epoch": 3582} {"train_loss": -6.923232078552246, "global_step": 150451, "epoch": 3582} {"train_loss": -6.846846103668213, "global_step": 150452, "epoch": 3582} {"train_loss": -6.925397872924805, "global_step": 150453, "epoch": 3582} {"train_loss": -6.883106231689453, "global_step": 150454, "epoch": 3582} {"train_loss": -6.8753662109375, "global_step": 150455, "epoch": 3582} {"train_loss": -6.859901428222656, "global_step": 150456, "epoch": 3582} {"train_loss": -6.8126325607299805, "global_step": 150457, "epoch": 3582} {"train_loss": -6.868436336517334, "global_step": 150458, "epoch": 3582} {"train_loss": -6.915133953094482, "global_step": 150459, "epoch": 3582} {"train_loss": -6.816744804382324, "global_step": 150460, "epoch": 3582} {"train_loss": -6.827330112457275, "global_step": 150461, "epoch": 3582} {"train_loss": -6.853226184844971, "global_step": 150462, "epoch": 3582} {"train_loss": -6.927535533905029, "global_step": 150463, "epoch": 3582} {"train_loss": -6.909305095672607, "global_step": 150464, "epoch": 3582} {"train_loss": -6.681849002838135, "global_step": 150465, "epoch": 3582} {"train_loss": -6.851394176483154, "global_step": 150466, "epoch": 3582} {"train_loss": -6.832388401031494, "global_step": 150467, "epoch": 3582} {"train_loss": -6.778480052947998, "global_step": 150468, "epoch": 3582} {"train_loss": -6.922553062438965, "global_step": 150469, "epoch": 3582} {"train_loss": -6.822123050689697, "global_step": 150470, "epoch": 3582} {"train_loss": -6.928873062133789, "global_step": 150471, "epoch": 3582} {"train_loss": -6.865389823913574, "global_step": 150472, "epoch": 3582} {"train_loss": -6.816385269165039, "global_step": 150473, "epoch": 3582} {"train_loss": -6.950897216796875, "global_step": 150474, "epoch": 3582} {"train_loss": -6.860979080200195, "global_step": 150475, "epoch": 3582} {"train_loss": -6.82845401763916, "global_step": 150476, "epoch": 3582} {"train_loss": -6.829617500305176, "global_step": 150477, "epoch": 3582} {"train_loss": -6.81144905090332, "global_step": 150478, "epoch": 3582} {"train_loss": -6.905750274658203, "global_step": 150479, "epoch": 3582} {"train_loss": -6.904664039611816, "global_step": 150480, "epoch": 3582} {"train_loss": -6.821402549743652, "global_step": 150481, "epoch": 3582} {"train_loss": -6.91109561920166, "global_step": 150482, "epoch": 3582} {"train_loss": -6.744991302490234, "global_step": 150483, "epoch": 3582} {"train_loss": -6.757284164428711, "global_step": 150484, "epoch": 3582} {"train_loss": -6.854835124242873, "global_step": 150485, "epoch": 3582, "val_loss": 68143.25} {"train_loss": -6.80714750289917, "global_step": 150486, "epoch": 3583} {"train_loss": -6.799243927001953, "global_step": 150487, "epoch": 3583} {"train_loss": -6.895338535308838, "global_step": 150488, "epoch": 3583} {"train_loss": -6.7167816162109375, "global_step": 150489, "epoch": 3583} {"train_loss": -6.872870445251465, "global_step": 150490, "epoch": 3583} {"train_loss": -6.906062602996826, "global_step": 150491, "epoch": 3583} {"train_loss": -6.915552139282227, "global_step": 150492, "epoch": 3583} {"train_loss": -6.972908973693848, "global_step": 150493, "epoch": 3583} {"train_loss": -6.983292579650879, "global_step": 150494, "epoch": 3583} {"train_loss": -6.906428337097168, "global_step": 150495, "epoch": 3583} {"train_loss": -6.845224380493164, "global_step": 150496, "epoch": 3583} {"train_loss": -6.850324630737305, "global_step": 150497, "epoch": 3583} {"train_loss": -6.893364906311035, "global_step": 150498, "epoch": 3583} {"train_loss": -6.9021406173706055, "global_step": 150499, "epoch": 3583} {"train_loss": -6.921013832092285, "global_step": 150500, "epoch": 3583} {"train_loss": -6.914243698120117, "global_step": 150501, "epoch": 3583} {"train_loss": -6.827378273010254, "global_step": 150502, "epoch": 3583} {"train_loss": -6.841823577880859, "global_step": 150503, "epoch": 3583} {"train_loss": -6.929948329925537, "global_step": 150504, "epoch": 3583} {"train_loss": -6.914823055267334, "global_step": 150505, "epoch": 3583} {"train_loss": -6.8795905113220215, "global_step": 150506, "epoch": 3583} {"train_loss": -6.986525535583496, "global_step": 150507, "epoch": 3583} {"train_loss": -6.864044189453125, "global_step": 150508, "epoch": 3583} {"train_loss": -6.766837120056152, "global_step": 150509, "epoch": 3583} {"train_loss": -6.928139686584473, "global_step": 150510, "epoch": 3583} {"train_loss": -6.903514862060547, "global_step": 150511, "epoch": 3583} {"train_loss": -6.886676788330078, "global_step": 150512, "epoch": 3583} {"train_loss": -6.942162036895752, "global_step": 150513, "epoch": 3583} {"train_loss": -6.989002227783203, "global_step": 150514, "epoch": 3583} {"train_loss": -6.990569114685059, "global_step": 150515, "epoch": 3583} {"train_loss": -6.889741897583008, "global_step": 150516, "epoch": 3583} {"train_loss": -6.8558197021484375, "global_step": 150517, "epoch": 3583} {"train_loss": -6.80663537979126, "global_step": 150518, "epoch": 3583} {"train_loss": -6.736725807189941, "global_step": 150519, "epoch": 3583} {"train_loss": -6.968383312225342, "global_step": 150520, "epoch": 3583} {"train_loss": -6.908660888671875, "global_step": 150521, "epoch": 3583} {"train_loss": -6.728537559509277, "global_step": 150522, "epoch": 3583} {"train_loss": -6.886003494262695, "global_step": 150523, "epoch": 3583} {"train_loss": -6.7957305908203125, "global_step": 150524, "epoch": 3583} {"train_loss": -6.854373455047607, "global_step": 150525, "epoch": 3583} {"train_loss": -6.809369087219238, "global_step": 150526, "epoch": 3583} {"train_loss": -6.8782677082788375, "global_step": 150527, "epoch": 3583, "val_loss": 68045.6953125} {"train_loss": -6.917510986328125, "global_step": 150528, "epoch": 3584} {"train_loss": -6.905782699584961, "global_step": 150529, "epoch": 3584} {"train_loss": -6.87789249420166, "global_step": 150530, "epoch": 3584} {"train_loss": -6.883782863616943, "global_step": 150531, "epoch": 3584} {"train_loss": -6.85272741317749, "global_step": 150532, "epoch": 3584} {"train_loss": -6.859025001525879, "global_step": 150533, "epoch": 3584} {"train_loss": -6.977119445800781, "global_step": 150534, "epoch": 3584} {"train_loss": -6.901656627655029, "global_step": 150535, "epoch": 3584} {"train_loss": -6.79561710357666, "global_step": 150536, "epoch": 3584} {"train_loss": -6.932280540466309, "global_step": 150537, "epoch": 3584} {"train_loss": -6.935892105102539, "global_step": 150538, "epoch": 3584} {"train_loss": -6.796277046203613, "global_step": 150539, "epoch": 3584} {"train_loss": -6.932162284851074, "global_step": 150540, "epoch": 3584} {"train_loss": -6.847858428955078, "global_step": 150541, "epoch": 3584} {"train_loss": -6.886314868927002, "global_step": 150542, "epoch": 3584} {"train_loss": -6.834670066833496, "global_step": 150543, "epoch": 3584} {"train_loss": -7.01885986328125, "global_step": 150544, "epoch": 3584} {"train_loss": -6.904356002807617, "global_step": 150545, "epoch": 3584} {"train_loss": -6.957918167114258, "global_step": 150546, "epoch": 3584} {"train_loss": -6.829941749572754, "global_step": 150547, "epoch": 3584} {"train_loss": -6.8644914627075195, "global_step": 150548, "epoch": 3584} {"train_loss": -6.894857883453369, "global_step": 150549, "epoch": 3584} {"train_loss": -6.996850967407227, "global_step": 150550, "epoch": 3584} {"train_loss": -6.948296070098877, "global_step": 150551, "epoch": 3584} {"train_loss": -6.962199687957764, "global_step": 150552, "epoch": 3584} {"train_loss": -6.904118537902832, "global_step": 150553, "epoch": 3584} {"train_loss": -6.924648284912109, "global_step": 150554, "epoch": 3584} {"train_loss": -7.00076150894165, "global_step": 150555, "epoch": 3584} {"train_loss": -7.077637672424316, "global_step": 150556, "epoch": 3584} {"train_loss": -6.840386867523193, "global_step": 150557, "epoch": 3584} {"train_loss": -6.883918762207031, "global_step": 150558, "epoch": 3584} {"train_loss": -6.919848442077637, "global_step": 150559, "epoch": 3584} {"train_loss": -6.893124580383301, "global_step": 150560, "epoch": 3584} {"train_loss": -7.025173187255859, "global_step": 150561, "epoch": 3584} {"train_loss": -6.821998596191406, "global_step": 150562, "epoch": 3584} {"train_loss": -6.919808387756348, "global_step": 150563, "epoch": 3584} {"train_loss": -6.9137372970581055, "global_step": 150564, "epoch": 3584} {"train_loss": -6.9076385498046875, "global_step": 150565, "epoch": 3584} {"train_loss": -6.836997985839844, "global_step": 150566, "epoch": 3584} {"train_loss": -6.892107009887695, "global_step": 150567, "epoch": 3584} {"train_loss": -6.793698310852051, "global_step": 150568, "epoch": 3584} {"train_loss": -6.902886402039301, "global_step": 150569, "epoch": 3584, "val_loss": 68031.9921875} {"train_loss": -6.9454193115234375, "global_step": 150570, "epoch": 3585} {"train_loss": -6.918503761291504, "global_step": 150571, "epoch": 3585} {"train_loss": -6.827221870422363, "global_step": 150572, "epoch": 3585} {"train_loss": -6.87248420715332, "global_step": 150573, "epoch": 3585} {"train_loss": -6.861568450927734, "global_step": 150574, "epoch": 3585} {"train_loss": -6.91427755355835, "global_step": 150575, "epoch": 3585} {"train_loss": -6.902703762054443, "global_step": 150576, "epoch": 3585} {"train_loss": -6.873039722442627, "global_step": 150577, "epoch": 3585} {"train_loss": -6.800708293914795, "global_step": 150578, "epoch": 3585} {"train_loss": -6.812358856201172, "global_step": 150579, "epoch": 3585} {"train_loss": -6.9137043952941895, "global_step": 150580, "epoch": 3585} {"train_loss": -6.801192283630371, "global_step": 150581, "epoch": 3585} {"train_loss": -6.794180870056152, "global_step": 150582, "epoch": 3585} {"train_loss": -6.886656761169434, "global_step": 150583, "epoch": 3585} {"train_loss": -6.862391471862793, "global_step": 150584, "epoch": 3585} {"train_loss": -6.767993927001953, "global_step": 150585, "epoch": 3585} {"train_loss": -6.732010841369629, "global_step": 150586, "epoch": 3585} {"train_loss": -6.746868133544922, "global_step": 150587, "epoch": 3585} {"train_loss": -6.911328315734863, "global_step": 150588, "epoch": 3585} {"train_loss": -6.802875518798828, "global_step": 150589, "epoch": 3585} {"train_loss": -6.914936065673828, "global_step": 150590, "epoch": 3585} {"train_loss": -6.762606143951416, "global_step": 150591, "epoch": 3585} {"train_loss": -6.7183637619018555, "global_step": 150592, "epoch": 3585} {"train_loss": -6.896783351898193, "global_step": 150593, "epoch": 3585} {"train_loss": -6.739850044250488, "global_step": 150594, "epoch": 3585} {"train_loss": -6.803321838378906, "global_step": 150595, "epoch": 3585} {"train_loss": -6.800617218017578, "global_step": 150596, "epoch": 3585} {"train_loss": -6.756187438964844, "global_step": 150597, "epoch": 3585} {"train_loss": -6.949008464813232, "global_step": 150598, "epoch": 3585} {"train_loss": -6.881226539611816, "global_step": 150599, "epoch": 3585} {"train_loss": -6.76662540435791, "global_step": 150600, "epoch": 3585} {"train_loss": -6.867549896240234, "global_step": 150601, "epoch": 3585} {"train_loss": -6.841126441955566, "global_step": 150602, "epoch": 3585} {"train_loss": -6.7083845138549805, "global_step": 150603, "epoch": 3585} {"train_loss": -6.834449291229248, "global_step": 150604, "epoch": 3585} {"train_loss": -6.815870761871338, "global_step": 150605, "epoch": 3585} {"train_loss": -6.818948268890381, "global_step": 150606, "epoch": 3585} {"train_loss": -6.795550346374512, "global_step": 150607, "epoch": 3585} {"train_loss": -6.81100606918335, "global_step": 150608, "epoch": 3585} {"train_loss": -6.841102600097656, "global_step": 150609, "epoch": 3585} {"train_loss": -6.859052658081055, "global_step": 150610, "epoch": 3585} {"train_loss": -6.834280127570743, "global_step": 150611, "epoch": 3585, "val_loss": 68179.3984375} {"train_loss": -6.857480049133301, "global_step": 150612, "epoch": 3586} {"train_loss": -6.822745323181152, "global_step": 150613, "epoch": 3586} {"train_loss": -6.919702053070068, "global_step": 150614, "epoch": 3586} {"train_loss": -6.987236022949219, "global_step": 150615, "epoch": 3586} {"train_loss": -6.90338134765625, "global_step": 150616, "epoch": 3586} {"train_loss": -6.727289199829102, "global_step": 150617, "epoch": 3586} {"train_loss": -6.9432597160339355, "global_step": 150618, "epoch": 3586} {"train_loss": -6.850786209106445, "global_step": 150619, "epoch": 3586} {"train_loss": -6.667396545410156, "global_step": 150620, "epoch": 3586} {"train_loss": -6.858209609985352, "global_step": 150621, "epoch": 3586} {"train_loss": -6.82695198059082, "global_step": 150622, "epoch": 3586} {"train_loss": -6.82668399810791, "global_step": 150623, "epoch": 3586} {"train_loss": -6.864728927612305, "global_step": 150624, "epoch": 3586} {"train_loss": -6.891608238220215, "global_step": 150625, "epoch": 3586} {"train_loss": -6.816608428955078, "global_step": 150626, "epoch": 3586} {"train_loss": -6.91188383102417, "global_step": 150627, "epoch": 3586} {"train_loss": -6.89837646484375, "global_step": 150628, "epoch": 3586} {"train_loss": -6.789308071136475, "global_step": 150629, "epoch": 3586} {"train_loss": -6.840329170227051, "global_step": 150630, "epoch": 3586} {"train_loss": -6.947396278381348, "global_step": 150631, "epoch": 3586} {"train_loss": -6.841647148132324, "global_step": 150632, "epoch": 3586} {"train_loss": -6.828664779663086, "global_step": 150633, "epoch": 3586} {"train_loss": -6.876908779144287, "global_step": 150634, "epoch": 3586} {"train_loss": -6.9380879402160645, "global_step": 150635, "epoch": 3586} {"train_loss": -6.863640785217285, "global_step": 150636, "epoch": 3586} {"train_loss": -6.927885055541992, "global_step": 150637, "epoch": 3586} {"train_loss": -6.889348983764648, "global_step": 150638, "epoch": 3586} {"train_loss": -6.892229080200195, "global_step": 150639, "epoch": 3586} {"train_loss": -6.857847213745117, "global_step": 150640, "epoch": 3586} {"train_loss": -6.839751720428467, "global_step": 150641, "epoch": 3586} {"train_loss": -6.78453254699707, "global_step": 150642, "epoch": 3586} {"train_loss": -6.8809051513671875, "global_step": 150643, "epoch": 3586} {"train_loss": -6.811511516571045, "global_step": 150644, "epoch": 3586} {"train_loss": -6.94868278503418, "global_step": 150645, "epoch": 3586} {"train_loss": -6.894104480743408, "global_step": 150646, "epoch": 3586} {"train_loss": -6.725282192230225, "global_step": 150647, "epoch": 3586} {"train_loss": -6.838715553283691, "global_step": 150648, "epoch": 3586} {"train_loss": -6.890473365783691, "global_step": 150649, "epoch": 3586} {"train_loss": -6.768457889556885, "global_step": 150650, "epoch": 3586} {"train_loss": -6.840327262878418, "global_step": 150651, "epoch": 3586} {"train_loss": -6.810658931732178, "global_step": 150652, "epoch": 3586} {"train_loss": -6.856589294615246, "global_step": 150653, "epoch": 3586, "val_loss": 67803.6015625} {"train_loss": -6.853141784667969, "global_step": 150654, "epoch": 3587} {"train_loss": -6.868173122406006, "global_step": 150655, "epoch": 3587} {"train_loss": -6.94992733001709, "global_step": 150656, "epoch": 3587} {"train_loss": -6.921980381011963, "global_step": 150657, "epoch": 3587} {"train_loss": -6.885836124420166, "global_step": 150658, "epoch": 3587} {"train_loss": -6.926627159118652, "global_step": 150659, "epoch": 3587} {"train_loss": -6.959499835968018, "global_step": 150660, "epoch": 3587} {"train_loss": -6.794922828674316, "global_step": 150661, "epoch": 3587} {"train_loss": -7.047308921813965, "global_step": 150662, "epoch": 3587} {"train_loss": -6.841912746429443, "global_step": 150663, "epoch": 3587} {"train_loss": -6.859713554382324, "global_step": 150664, "epoch": 3587} {"train_loss": -6.852675437927246, "global_step": 150665, "epoch": 3587} {"train_loss": -6.918764114379883, "global_step": 150666, "epoch": 3587} {"train_loss": -6.858422756195068, "global_step": 150667, "epoch": 3587} {"train_loss": -6.845494270324707, "global_step": 150668, "epoch": 3587} {"train_loss": -6.841733932495117, "global_step": 150669, "epoch": 3587} {"train_loss": -6.833066940307617, "global_step": 150670, "epoch": 3587} {"train_loss": -6.893877029418945, "global_step": 150671, "epoch": 3587} {"train_loss": -6.918798446655273, "global_step": 150672, "epoch": 3587} {"train_loss": -6.719285011291504, "global_step": 150673, "epoch": 3587} {"train_loss": -6.987992286682129, "global_step": 150674, "epoch": 3587} {"train_loss": -6.759191513061523, "global_step": 150675, "epoch": 3587} {"train_loss": -6.912363052368164, "global_step": 150676, "epoch": 3587} {"train_loss": -6.833023548126221, "global_step": 150677, "epoch": 3587} {"train_loss": -6.800784111022949, "global_step": 150678, "epoch": 3587} {"train_loss": -6.8317060470581055, "global_step": 150679, "epoch": 3587} {"train_loss": -6.8272705078125, "global_step": 150680, "epoch": 3587} {"train_loss": -6.875121116638184, "global_step": 150681, "epoch": 3587} {"train_loss": -6.914175033569336, "global_step": 150682, "epoch": 3587} {"train_loss": -6.855546951293945, "global_step": 150683, "epoch": 3587} {"train_loss": -6.803297996520996, "global_step": 150684, "epoch": 3587} {"train_loss": -6.805840015411377, "global_step": 150685, "epoch": 3587} {"train_loss": -6.934626579284668, "global_step": 150686, "epoch": 3587} {"train_loss": -6.952742099761963, "global_step": 150687, "epoch": 3587} {"train_loss": -6.709135055541992, "global_step": 150688, "epoch": 3587} {"train_loss": -6.81887149810791, "global_step": 150689, "epoch": 3587} {"train_loss": -6.838561058044434, "global_step": 150690, "epoch": 3587} {"train_loss": -6.898262977600098, "global_step": 150691, "epoch": 3587} {"train_loss": -6.879359245300293, "global_step": 150692, "epoch": 3587} {"train_loss": -6.807431221008301, "global_step": 150693, "epoch": 3587} {"train_loss": -6.765526294708252, "global_step": 150694, "epoch": 3587} {"train_loss": -6.862575542359125, "global_step": 150695, "epoch": 3587, "val_loss": 68086.3984375} {"train_loss": -6.854896545410156, "global_step": 150696, "epoch": 3588} {"train_loss": -6.8064374923706055, "global_step": 150697, "epoch": 3588} {"train_loss": -6.743339538574219, "global_step": 150698, "epoch": 3588} {"train_loss": -6.779571533203125, "global_step": 150699, "epoch": 3588} {"train_loss": -6.865303039550781, "global_step": 150700, "epoch": 3588} {"train_loss": -6.907025337219238, "global_step": 150701, "epoch": 3588} {"train_loss": -6.7884745597839355, "global_step": 150702, "epoch": 3588} {"train_loss": -6.878019332885742, "global_step": 150703, "epoch": 3588} {"train_loss": -6.764222145080566, "global_step": 150704, "epoch": 3588} {"train_loss": -6.837709426879883, "global_step": 150705, "epoch": 3588} {"train_loss": -6.865121841430664, "global_step": 150706, "epoch": 3588} {"train_loss": -6.885469436645508, "global_step": 150707, "epoch": 3588} {"train_loss": -6.797043800354004, "global_step": 150708, "epoch": 3588} {"train_loss": -6.902622222900391, "global_step": 150709, "epoch": 3588} {"train_loss": -6.697451114654541, "global_step": 150710, "epoch": 3588} {"train_loss": -6.767527103424072, "global_step": 150711, "epoch": 3588} {"train_loss": -6.820221900939941, "global_step": 150712, "epoch": 3588} {"train_loss": -6.666520118713379, "global_step": 150713, "epoch": 3588} {"train_loss": -6.7440571784973145, "global_step": 150714, "epoch": 3588} {"train_loss": -6.782209873199463, "global_step": 150715, "epoch": 3588} {"train_loss": -6.763415813446045, "global_step": 150716, "epoch": 3588} {"train_loss": -6.82662296295166, "global_step": 150717, "epoch": 3588} {"train_loss": -6.67171573638916, "global_step": 150718, "epoch": 3588} {"train_loss": -6.807773590087891, "global_step": 150719, "epoch": 3588} {"train_loss": -6.761161804199219, "global_step": 150720, "epoch": 3588} {"train_loss": -6.796115875244141, "global_step": 150721, "epoch": 3588} {"train_loss": -6.732280731201172, "global_step": 150722, "epoch": 3588} {"train_loss": -6.786830902099609, "global_step": 150723, "epoch": 3588} {"train_loss": -6.7607221603393555, "global_step": 150724, "epoch": 3588} {"train_loss": -6.841179847717285, "global_step": 150725, "epoch": 3588} {"train_loss": -6.813018321990967, "global_step": 150726, "epoch": 3588} {"train_loss": -6.7152605056762695, "global_step": 150727, "epoch": 3588} {"train_loss": -6.748108863830566, "global_step": 150728, "epoch": 3588} {"train_loss": -6.745025634765625, "global_step": 150729, "epoch": 3588} {"train_loss": -6.7875518798828125, "global_step": 150730, "epoch": 3588} {"train_loss": -6.730316162109375, "global_step": 150731, "epoch": 3588} {"train_loss": -6.754538536071777, "global_step": 150732, "epoch": 3588} {"train_loss": -6.719422817230225, "global_step": 150733, "epoch": 3588} {"train_loss": -6.691875457763672, "global_step": 150734, "epoch": 3588} {"train_loss": -6.874777793884277, "global_step": 150735, "epoch": 3588} {"train_loss": -6.840640068054199, "global_step": 150736, "epoch": 3588} {"train_loss": -6.785962263743083, "global_step": 150737, "epoch": 3588, "val_loss": 68050.890625} {"train_loss": -6.751014709472656, "global_step": 150738, "epoch": 3589} {"train_loss": -6.880744457244873, "global_step": 150739, "epoch": 3589} {"train_loss": -6.97819185256958, "global_step": 150740, "epoch": 3589} {"train_loss": -6.819097518920898, "global_step": 150741, "epoch": 3589} {"train_loss": -6.844850063323975, "global_step": 150742, "epoch": 3589} {"train_loss": -6.901628494262695, "global_step": 150743, "epoch": 3589} {"train_loss": -6.717818260192871, "global_step": 150744, "epoch": 3589} {"train_loss": -6.796698570251465, "global_step": 150745, "epoch": 3589} {"train_loss": -6.837204933166504, "global_step": 150746, "epoch": 3589} {"train_loss": -6.933140754699707, "global_step": 150747, "epoch": 3589} {"train_loss": -6.828061103820801, "global_step": 150748, "epoch": 3589} {"train_loss": -6.7746124267578125, "global_step": 150749, "epoch": 3589} {"train_loss": -6.7502336502075195, "global_step": 150750, "epoch": 3589} {"train_loss": -6.851378440856934, "global_step": 150751, "epoch": 3589} {"train_loss": -6.800929546356201, "global_step": 150752, "epoch": 3589} {"train_loss": -6.882678985595703, "global_step": 150753, "epoch": 3589} {"train_loss": -6.828541278839111, "global_step": 150754, "epoch": 3589} {"train_loss": -6.802982330322266, "global_step": 150755, "epoch": 3589} {"train_loss": -6.889202117919922, "global_step": 150756, "epoch": 3589} {"train_loss": -6.845969200134277, "global_step": 150757, "epoch": 3589} {"train_loss": -6.915207862854004, "global_step": 150758, "epoch": 3589} {"train_loss": -6.804379463195801, "global_step": 150759, "epoch": 3589} {"train_loss": -6.76716947555542, "global_step": 150760, "epoch": 3589} {"train_loss": -6.904352188110352, "global_step": 150761, "epoch": 3589} {"train_loss": -6.718435287475586, "global_step": 150762, "epoch": 3589} {"train_loss": -6.889498710632324, "global_step": 150763, "epoch": 3589} {"train_loss": -6.77484130859375, "global_step": 150764, "epoch": 3589} {"train_loss": -6.760561466217041, "global_step": 150765, "epoch": 3589} {"train_loss": -7.006350517272949, "global_step": 150766, "epoch": 3589} {"train_loss": -6.713174819946289, "global_step": 150767, "epoch": 3589} {"train_loss": -6.8305864334106445, "global_step": 150768, "epoch": 3589} {"train_loss": -6.895417213439941, "global_step": 150769, "epoch": 3589} {"train_loss": -6.926918029785156, "global_step": 150770, "epoch": 3589} {"train_loss": -6.878000259399414, "global_step": 150771, "epoch": 3589} {"train_loss": -6.865874290466309, "global_step": 150772, "epoch": 3589} {"train_loss": -7.00090217590332, "global_step": 150773, "epoch": 3589} {"train_loss": -6.782506942749023, "global_step": 150774, "epoch": 3589} {"train_loss": -6.922342300415039, "global_step": 150775, "epoch": 3589} {"train_loss": -6.794719696044922, "global_step": 150776, "epoch": 3589} {"train_loss": -6.843608856201172, "global_step": 150777, "epoch": 3589} {"train_loss": -6.890305519104004, "global_step": 150778, "epoch": 3589} {"train_loss": -6.8434320858546664, "global_step": 150779, "epoch": 3589, "val_loss": 68031.734375} {"train_loss": -6.844723701477051, "global_step": 150780, "epoch": 3590} {"train_loss": -6.789521217346191, "global_step": 150781, "epoch": 3590} {"train_loss": -6.8936967849731445, "global_step": 150782, "epoch": 3590} {"train_loss": -6.910767078399658, "global_step": 150783, "epoch": 3590} {"train_loss": -6.866863250732422, "global_step": 150784, "epoch": 3590} {"train_loss": -6.994415283203125, "global_step": 150785, "epoch": 3590} {"train_loss": -6.883029937744141, "global_step": 150786, "epoch": 3590} {"train_loss": -6.859169006347656, "global_step": 150787, "epoch": 3590} {"train_loss": -7.0113372802734375, "global_step": 150788, "epoch": 3590} {"train_loss": -6.9868597984313965, "global_step": 150789, "epoch": 3590} {"train_loss": -6.9291672706604, "global_step": 150790, "epoch": 3590} {"train_loss": -6.865965843200684, "global_step": 150791, "epoch": 3590} {"train_loss": -6.800712585449219, "global_step": 150792, "epoch": 3590} {"train_loss": -6.831512451171875, "global_step": 150793, "epoch": 3590} {"train_loss": -6.764790058135986, "global_step": 150794, "epoch": 3590} {"train_loss": -6.961095809936523, "global_step": 150795, "epoch": 3590} {"train_loss": -6.874905586242676, "global_step": 150796, "epoch": 3590} {"train_loss": -6.78091287612915, "global_step": 150797, "epoch": 3590} {"train_loss": -7.000555515289307, "global_step": 150798, "epoch": 3590} {"train_loss": -6.8064799308776855, "global_step": 150799, "epoch": 3590} {"train_loss": -6.844856262207031, "global_step": 150800, "epoch": 3590} {"train_loss": -6.813525199890137, "global_step": 150801, "epoch": 3590} {"train_loss": -6.913457870483398, "global_step": 150802, "epoch": 3590} {"train_loss": -6.884730339050293, "global_step": 150803, "epoch": 3590} {"train_loss": -6.802829742431641, "global_step": 150804, "epoch": 3590} {"train_loss": -6.887801647186279, "global_step": 150805, "epoch": 3590} {"train_loss": -6.810891151428223, "global_step": 150806, "epoch": 3590} {"train_loss": -6.942157745361328, "global_step": 150807, "epoch": 3590} {"train_loss": -6.85310173034668, "global_step": 150808, "epoch": 3590} {"train_loss": -6.877571105957031, "global_step": 150809, "epoch": 3590} {"train_loss": -6.879061698913574, "global_step": 150810, "epoch": 3590} {"train_loss": -6.801741123199463, "global_step": 150811, "epoch": 3590} {"train_loss": -6.808709144592285, "global_step": 150812, "epoch": 3590} {"train_loss": -6.827657699584961, "global_step": 150813, "epoch": 3590} {"train_loss": -6.859670162200928, "global_step": 150814, "epoch": 3590} {"train_loss": -6.819870948791504, "global_step": 150815, "epoch": 3590} {"train_loss": -6.795816421508789, "global_step": 150816, "epoch": 3590} {"train_loss": -6.881954669952393, "global_step": 150817, "epoch": 3590} {"train_loss": -6.930221080780029, "global_step": 150818, "epoch": 3590} {"train_loss": -6.839939117431641, "global_step": 150819, "epoch": 3590} {"train_loss": -6.874106407165527, "global_step": 150820, "epoch": 3590} {"train_loss": -6.86881312869844, "global_step": 150821, "epoch": 3590, "val_loss": 67986.5546875} {"train_loss": -6.973392486572266, "global_step": 150822, "epoch": 3591} {"train_loss": -6.886663913726807, "global_step": 150823, "epoch": 3591} {"train_loss": -6.877896308898926, "global_step": 150824, "epoch": 3591} {"train_loss": -6.815142631530762, "global_step": 150825, "epoch": 3591} {"train_loss": -6.80207633972168, "global_step": 150826, "epoch": 3591} {"train_loss": -6.878624439239502, "global_step": 150827, "epoch": 3591} {"train_loss": -6.89902400970459, "global_step": 150828, "epoch": 3591} {"train_loss": -6.862034797668457, "global_step": 150829, "epoch": 3591} {"train_loss": -6.905672073364258, "global_step": 150830, "epoch": 3591} {"train_loss": -6.947100639343262, "global_step": 150831, "epoch": 3591} {"train_loss": -6.792675018310547, "global_step": 150832, "epoch": 3591} {"train_loss": -6.763498783111572, "global_step": 150833, "epoch": 3591} {"train_loss": -6.845658302307129, "global_step": 150834, "epoch": 3591} {"train_loss": -6.935598373413086, "global_step": 150835, "epoch": 3591} {"train_loss": -6.825648307800293, "global_step": 150836, "epoch": 3591} {"train_loss": -6.921516418457031, "global_step": 150837, "epoch": 3591} {"train_loss": -6.858062744140625, "global_step": 150838, "epoch": 3591} {"train_loss": -6.937299728393555, "global_step": 150839, "epoch": 3591} {"train_loss": -6.843791961669922, "global_step": 150840, "epoch": 3591} {"train_loss": -6.881733417510986, "global_step": 150841, "epoch": 3591} {"train_loss": -6.913280963897705, "global_step": 150842, "epoch": 3591} {"train_loss": -6.860726356506348, "global_step": 150843, "epoch": 3591} {"train_loss": -6.844358444213867, "global_step": 150844, "epoch": 3591} {"train_loss": -6.859264850616455, "global_step": 150845, "epoch": 3591} {"train_loss": -6.749195098876953, "global_step": 150846, "epoch": 3591} {"train_loss": -6.893551826477051, "global_step": 150847, "epoch": 3591} {"train_loss": -6.91124153137207, "global_step": 150848, "epoch": 3591} {"train_loss": -6.892642974853516, "global_step": 150849, "epoch": 3591} {"train_loss": -6.922186374664307, "global_step": 150850, "epoch": 3591} {"train_loss": -6.844578266143799, "global_step": 150851, "epoch": 3591} {"train_loss": -6.812436103820801, "global_step": 150852, "epoch": 3591} {"train_loss": -6.967741966247559, "global_step": 150853, "epoch": 3591} {"train_loss": -7.0383429527282715, "global_step": 150854, "epoch": 3591} {"train_loss": -6.95109224319458, "global_step": 150855, "epoch": 3591} {"train_loss": -7.018886566162109, "global_step": 150856, "epoch": 3591} {"train_loss": -6.9303789138793945, "global_step": 150857, "epoch": 3591} {"train_loss": -6.887843608856201, "global_step": 150858, "epoch": 3591} {"train_loss": -6.981672763824463, "global_step": 150859, "epoch": 3591} {"train_loss": -6.916626930236816, "global_step": 150860, "epoch": 3591} {"train_loss": -6.977128028869629, "global_step": 150861, "epoch": 3591} {"train_loss": -6.91552209854126, "global_step": 150862, "epoch": 3591} {"train_loss": -6.892525775091989, "global_step": 150863, "epoch": 3591, "val_loss": 67927.7109375} {"train_loss": -7.003486633300781, "global_step": 150864, "epoch": 3592} {"train_loss": -6.884369850158691, "global_step": 150865, "epoch": 3592} {"train_loss": -7.051909923553467, "global_step": 150866, "epoch": 3592} {"train_loss": -6.9640116691589355, "global_step": 150867, "epoch": 3592} {"train_loss": -6.987698078155518, "global_step": 150868, "epoch": 3592} {"train_loss": -6.943826198577881, "global_step": 150869, "epoch": 3592} {"train_loss": -6.868241310119629, "global_step": 150870, "epoch": 3592} {"train_loss": -6.891989231109619, "global_step": 150871, "epoch": 3592} {"train_loss": -6.80893611907959, "global_step": 150872, "epoch": 3592} {"train_loss": -6.893026351928711, "global_step": 150873, "epoch": 3592} {"train_loss": -6.905097961425781, "global_step": 150874, "epoch": 3592} {"train_loss": -6.856166362762451, "global_step": 150875, "epoch": 3592} {"train_loss": -6.800074577331543, "global_step": 150876, "epoch": 3592} {"train_loss": -6.948102951049805, "global_step": 150877, "epoch": 3592} {"train_loss": -6.830447196960449, "global_step": 150878, "epoch": 3592} {"train_loss": -6.9101948738098145, "global_step": 150879, "epoch": 3592} {"train_loss": -6.846548080444336, "global_step": 150880, "epoch": 3592} {"train_loss": -6.904997825622559, "global_step": 150881, "epoch": 3592} {"train_loss": -6.837357521057129, "global_step": 150882, "epoch": 3592} {"train_loss": -6.7118120193481445, "global_step": 150883, "epoch": 3592} {"train_loss": -6.8971381187438965, "global_step": 150884, "epoch": 3592} {"train_loss": -6.797946929931641, "global_step": 150885, "epoch": 3592} {"train_loss": -6.828269004821777, "global_step": 150886, "epoch": 3592} {"train_loss": -6.883255958557129, "global_step": 150887, "epoch": 3592} {"train_loss": -6.781533718109131, "global_step": 150888, "epoch": 3592} {"train_loss": -6.874805450439453, "global_step": 150889, "epoch": 3592} {"train_loss": -6.652742385864258, "global_step": 150890, "epoch": 3592} {"train_loss": -6.834290981292725, "global_step": 150891, "epoch": 3592} {"train_loss": -6.902257919311523, "global_step": 150892, "epoch": 3592} {"train_loss": -6.653547763824463, "global_step": 150893, "epoch": 3592} {"train_loss": -6.902580261230469, "global_step": 150894, "epoch": 3592} {"train_loss": -6.896724224090576, "global_step": 150895, "epoch": 3592} {"train_loss": -6.912718772888184, "global_step": 150896, "epoch": 3592} {"train_loss": -6.814111709594727, "global_step": 150897, "epoch": 3592} {"train_loss": -6.739147186279297, "global_step": 150898, "epoch": 3592} {"train_loss": -6.896478652954102, "global_step": 150899, "epoch": 3592} {"train_loss": -6.698360919952393, "global_step": 150900, "epoch": 3592} {"train_loss": -6.859678268432617, "global_step": 150901, "epoch": 3592} {"train_loss": -6.856572151184082, "global_step": 150902, "epoch": 3592} {"train_loss": -6.878596305847168, "global_step": 150903, "epoch": 3592} {"train_loss": -6.8604583740234375, "global_step": 150904, "epoch": 3592} {"train_loss": -6.860784916650681, "global_step": 150905, "epoch": 3592, "val_loss": 68243.3125} {"train_loss": -6.8424224853515625, "global_step": 150906, "epoch": 3593} {"train_loss": -6.850311279296875, "global_step": 150907, "epoch": 3593} {"train_loss": -6.704702854156494, "global_step": 150908, "epoch": 3593} {"train_loss": -6.842031955718994, "global_step": 150909, "epoch": 3593} {"train_loss": -6.870916843414307, "global_step": 150910, "epoch": 3593} {"train_loss": -6.792004585266113, "global_step": 150911, "epoch": 3593} {"train_loss": -6.75120735168457, "global_step": 150912, "epoch": 3593} {"train_loss": -6.819781303405762, "global_step": 150913, "epoch": 3593} {"train_loss": -6.874810218811035, "global_step": 150914, "epoch": 3593} {"train_loss": -6.8476128578186035, "global_step": 150915, "epoch": 3593} {"train_loss": -6.853662490844727, "global_step": 150916, "epoch": 3593} {"train_loss": -6.889769554138184, "global_step": 150917, "epoch": 3593} {"train_loss": -6.8474507331848145, "global_step": 150918, "epoch": 3593} {"train_loss": -6.763737201690674, "global_step": 150919, "epoch": 3593} {"train_loss": -6.834143161773682, "global_step": 150920, "epoch": 3593} {"train_loss": -6.889543533325195, "global_step": 150921, "epoch": 3593} {"train_loss": -6.778361797332764, "global_step": 150922, "epoch": 3593} {"train_loss": -6.729503631591797, "global_step": 150923, "epoch": 3593} {"train_loss": -6.840386867523193, "global_step": 150924, "epoch": 3593} {"train_loss": -6.871135711669922, "global_step": 150925, "epoch": 3593} {"train_loss": -6.826330184936523, "global_step": 150926, "epoch": 3593} {"train_loss": -6.741267681121826, "global_step": 150927, "epoch": 3593} {"train_loss": -6.6891045570373535, "global_step": 150928, "epoch": 3593} {"train_loss": -6.8554534912109375, "global_step": 150929, "epoch": 3593} {"train_loss": -6.822742462158203, "global_step": 150930, "epoch": 3593} {"train_loss": -6.875261306762695, "global_step": 150931, "epoch": 3593} {"train_loss": -6.875136375427246, "global_step": 150932, "epoch": 3593} {"train_loss": -6.7234344482421875, "global_step": 150933, "epoch": 3593} {"train_loss": -6.852867603302002, "global_step": 150934, "epoch": 3593} {"train_loss": -6.860952854156494, "global_step": 150935, "epoch": 3593} {"train_loss": -6.851095199584961, "global_step": 150936, "epoch": 3593} {"train_loss": -6.802762985229492, "global_step": 150937, "epoch": 3593} {"train_loss": -6.7952046394348145, "global_step": 150938, "epoch": 3593} {"train_loss": -6.792925834655762, "global_step": 150939, "epoch": 3593} {"train_loss": -6.844855308532715, "global_step": 150940, "epoch": 3593} {"train_loss": -6.865948677062988, "global_step": 150941, "epoch": 3593} {"train_loss": -6.819649696350098, "global_step": 150942, "epoch": 3593} {"train_loss": -6.843044281005859, "global_step": 150943, "epoch": 3593} {"train_loss": -6.844718933105469, "global_step": 150944, "epoch": 3593} {"train_loss": -6.83787727355957, "global_step": 150945, "epoch": 3593} {"train_loss": -6.777144432067871, "global_step": 150946, "epoch": 3593} {"train_loss": -6.8227878865741545, "global_step": 150947, "epoch": 3593, "val_loss": 67962.890625} {"train_loss": -6.931804656982422, "global_step": 150948, "epoch": 3594} {"train_loss": -6.775111198425293, "global_step": 150949, "epoch": 3594} {"train_loss": -6.91350793838501, "global_step": 150950, "epoch": 3594} {"train_loss": -6.724221229553223, "global_step": 150951, "epoch": 3594} {"train_loss": -6.853515625, "global_step": 150952, "epoch": 3594} {"train_loss": -6.822142124176025, "global_step": 150953, "epoch": 3594} {"train_loss": -6.815694808959961, "global_step": 150954, "epoch": 3594} {"train_loss": -6.895790100097656, "global_step": 150955, "epoch": 3594} {"train_loss": -6.8769941329956055, "global_step": 150956, "epoch": 3594} {"train_loss": -6.881508827209473, "global_step": 150957, "epoch": 3594} {"train_loss": -6.867787837982178, "global_step": 150958, "epoch": 3594} {"train_loss": -6.844151496887207, "global_step": 150959, "epoch": 3594} {"train_loss": -6.8836445808410645, "global_step": 150960, "epoch": 3594} {"train_loss": -6.90134334564209, "global_step": 150961, "epoch": 3594} {"train_loss": -6.825702667236328, "global_step": 150962, "epoch": 3594} {"train_loss": -6.880539894104004, "global_step": 150963, "epoch": 3594} {"train_loss": -6.81854772567749, "global_step": 150964, "epoch": 3594} {"train_loss": -6.856560230255127, "global_step": 150965, "epoch": 3594} {"train_loss": -6.741908550262451, "global_step": 150966, "epoch": 3594} {"train_loss": -6.943160533905029, "global_step": 150967, "epoch": 3594} {"train_loss": -6.858058452606201, "global_step": 150968, "epoch": 3594} {"train_loss": -6.819110870361328, "global_step": 150969, "epoch": 3594} {"train_loss": -6.845938682556152, "global_step": 150970, "epoch": 3594} {"train_loss": -6.8914079666137695, "global_step": 150971, "epoch": 3594} {"train_loss": -6.9382171630859375, "global_step": 150972, "epoch": 3594} {"train_loss": -6.881622314453125, "global_step": 150973, "epoch": 3594} {"train_loss": -6.811697959899902, "global_step": 150974, "epoch": 3594} {"train_loss": -6.897457122802734, "global_step": 150975, "epoch": 3594} {"train_loss": -6.875659465789795, "global_step": 150976, "epoch": 3594} {"train_loss": -6.81505012512207, "global_step": 150977, "epoch": 3594} {"train_loss": -6.722102165222168, "global_step": 150978, "epoch": 3594} {"train_loss": -6.813674449920654, "global_step": 150979, "epoch": 3594} {"train_loss": -6.752927780151367, "global_step": 150980, "epoch": 3594} {"train_loss": -6.764364719390869, "global_step": 150981, "epoch": 3594} {"train_loss": -6.717897415161133, "global_step": 150982, "epoch": 3594} {"train_loss": -6.742318153381348, "global_step": 150983, "epoch": 3594} {"train_loss": -6.908315181732178, "global_step": 150984, "epoch": 3594} {"train_loss": -6.766136169433594, "global_step": 150985, "epoch": 3594} {"train_loss": -6.803192138671875, "global_step": 150986, "epoch": 3594} {"train_loss": -6.68228816986084, "global_step": 150987, "epoch": 3594} {"train_loss": -6.7134690284729, "global_step": 150988, "epoch": 3594} {"train_loss": -6.8280008633931475, "global_step": 150989, "epoch": 3594, "val_loss": 68180.5859375} {"train_loss": -6.754619598388672, "global_step": 150990, "epoch": 3595} {"train_loss": -6.78024959564209, "global_step": 150991, "epoch": 3595} {"train_loss": -6.772460460662842, "global_step": 150992, "epoch": 3595} {"train_loss": -6.848153114318848, "global_step": 150993, "epoch": 3595} {"train_loss": -6.69151496887207, "global_step": 150994, "epoch": 3595} {"train_loss": -6.689718723297119, "global_step": 150995, "epoch": 3595} {"train_loss": -6.775436878204346, "global_step": 150996, "epoch": 3595} {"train_loss": -6.745837211608887, "global_step": 150997, "epoch": 3595} {"train_loss": -6.7786173820495605, "global_step": 150998, "epoch": 3595} {"train_loss": -6.886453151702881, "global_step": 150999, "epoch": 3595} {"train_loss": -6.756760597229004, "global_step": 151000, "epoch": 3595} {"train_loss": -6.660982131958008, "global_step": 151001, "epoch": 3595} {"train_loss": -6.749982833862305, "global_step": 151002, "epoch": 3595} {"train_loss": -6.73819637298584, "global_step": 151003, "epoch": 3595} {"train_loss": -6.870334625244141, "global_step": 151004, "epoch": 3595} {"train_loss": -6.812191963195801, "global_step": 151005, "epoch": 3595} {"train_loss": -6.749392509460449, "global_step": 151006, "epoch": 3595} {"train_loss": -6.861073017120361, "global_step": 151007, "epoch": 3595} {"train_loss": -6.786446571350098, "global_step": 151008, "epoch": 3595} {"train_loss": -6.593815326690674, "global_step": 151009, "epoch": 3595} {"train_loss": -6.785585403442383, "global_step": 151010, "epoch": 3595} {"train_loss": -6.786515712738037, "global_step": 151011, "epoch": 3595} {"train_loss": -6.807730197906494, "global_step": 151012, "epoch": 3595} {"train_loss": -6.783696174621582, "global_step": 151013, "epoch": 3595} {"train_loss": -6.85176944732666, "global_step": 151014, "epoch": 3595} {"train_loss": -6.6623005867004395, "global_step": 151015, "epoch": 3595} {"train_loss": -6.822715759277344, "global_step": 151016, "epoch": 3595} {"train_loss": -6.734802722930908, "global_step": 151017, "epoch": 3595} {"train_loss": -6.80239200592041, "global_step": 151018, "epoch": 3595} {"train_loss": -6.8387322425842285, "global_step": 151019, "epoch": 3595} {"train_loss": -6.867388725280762, "global_step": 151020, "epoch": 3595} {"train_loss": -6.78349494934082, "global_step": 151021, "epoch": 3595} {"train_loss": -6.911590099334717, "global_step": 151022, "epoch": 3595} {"train_loss": -6.718646049499512, "global_step": 151023, "epoch": 3595} {"train_loss": -6.757952690124512, "global_step": 151024, "epoch": 3595} {"train_loss": -6.982537269592285, "global_step": 151025, "epoch": 3595} {"train_loss": -6.734349250793457, "global_step": 151026, "epoch": 3595} {"train_loss": -6.8649396896362305, "global_step": 151027, "epoch": 3595} {"train_loss": -6.770308494567871, "global_step": 151028, "epoch": 3595} {"train_loss": -6.795658111572266, "global_step": 151029, "epoch": 3595} {"train_loss": -6.804788589477539, "global_step": 151030, "epoch": 3595} {"train_loss": -6.784752584639049, "global_step": 151031, "epoch": 3595, "val_loss": 68064.0078125} {"train_loss": -6.754235744476318, "global_step": 151032, "epoch": 3596} {"train_loss": -6.849114894866943, "global_step": 151033, "epoch": 3596} {"train_loss": -6.871746063232422, "global_step": 151034, "epoch": 3596} {"train_loss": -6.870138168334961, "global_step": 151035, "epoch": 3596} {"train_loss": -6.86549186706543, "global_step": 151036, "epoch": 3596} {"train_loss": -6.924893379211426, "global_step": 151037, "epoch": 3596} {"train_loss": -6.844205379486084, "global_step": 151038, "epoch": 3596} {"train_loss": -6.8724188804626465, "global_step": 151039, "epoch": 3596} {"train_loss": -6.850311279296875, "global_step": 151040, "epoch": 3596} {"train_loss": -6.893322944641113, "global_step": 151041, "epoch": 3596} {"train_loss": -6.752224922180176, "global_step": 151042, "epoch": 3596} {"train_loss": -6.87049674987793, "global_step": 151043, "epoch": 3596} {"train_loss": -6.763319969177246, "global_step": 151044, "epoch": 3596} {"train_loss": -7.0024566650390625, "global_step": 151045, "epoch": 3596} {"train_loss": -6.823783874511719, "global_step": 151046, "epoch": 3596} {"train_loss": -6.895859718322754, "global_step": 151047, "epoch": 3596} {"train_loss": -6.949898719787598, "global_step": 151048, "epoch": 3596} {"train_loss": -6.893180847167969, "global_step": 151049, "epoch": 3596} {"train_loss": -6.909180641174316, "global_step": 151050, "epoch": 3596} {"train_loss": -6.846218109130859, "global_step": 151051, "epoch": 3596} {"train_loss": -6.894330978393555, "global_step": 151052, "epoch": 3596} {"train_loss": -6.848903656005859, "global_step": 151053, "epoch": 3596} {"train_loss": -6.801568984985352, "global_step": 151054, "epoch": 3596} {"train_loss": -6.997093200683594, "global_step": 151055, "epoch": 3596} {"train_loss": -6.856560707092285, "global_step": 151056, "epoch": 3596} {"train_loss": -6.846532821655273, "global_step": 151057, "epoch": 3596} {"train_loss": -6.899194717407227, "global_step": 151058, "epoch": 3596} {"train_loss": -6.909554481506348, "global_step": 151059, "epoch": 3596} {"train_loss": -6.939542770385742, "global_step": 151060, "epoch": 3596} {"train_loss": -6.8592424392700195, "global_step": 151061, "epoch": 3596} {"train_loss": -6.801183223724365, "global_step": 151062, "epoch": 3596} {"train_loss": -6.975305557250977, "global_step": 151063, "epoch": 3596} {"train_loss": -6.792129993438721, "global_step": 151064, "epoch": 3596} {"train_loss": -6.937469482421875, "global_step": 151065, "epoch": 3596} {"train_loss": -6.853584289550781, "global_step": 151066, "epoch": 3596} {"train_loss": -6.891389846801758, "global_step": 151067, "epoch": 3596} {"train_loss": -6.8548479080200195, "global_step": 151068, "epoch": 3596} {"train_loss": -6.9154052734375, "global_step": 151069, "epoch": 3596} {"train_loss": -7.003515243530273, "global_step": 151070, "epoch": 3596} {"train_loss": -6.849551200866699, "global_step": 151071, "epoch": 3596} {"train_loss": -6.797735214233398, "global_step": 151072, "epoch": 3596} {"train_loss": -6.873670191991897, "global_step": 151073, "epoch": 3596, "val_loss": 68036.5625} {"train_loss": -6.969977855682373, "global_step": 151074, "epoch": 3597} {"train_loss": -6.952937126159668, "global_step": 151075, "epoch": 3597} {"train_loss": -6.897335052490234, "global_step": 151076, "epoch": 3597} {"train_loss": -6.909738063812256, "global_step": 151077, "epoch": 3597} {"train_loss": -6.990519046783447, "global_step": 151078, "epoch": 3597} {"train_loss": -6.856002330780029, "global_step": 151079, "epoch": 3597} {"train_loss": -6.837698459625244, "global_step": 151080, "epoch": 3597} {"train_loss": -6.962064743041992, "global_step": 151081, "epoch": 3597} {"train_loss": -6.8668718338012695, "global_step": 151082, "epoch": 3597} {"train_loss": -6.686391353607178, "global_step": 151083, "epoch": 3597} {"train_loss": -6.942454814910889, "global_step": 151084, "epoch": 3597} {"train_loss": -6.9239501953125, "global_step": 151085, "epoch": 3597} {"train_loss": -6.906079292297363, "global_step": 151086, "epoch": 3597} {"train_loss": -6.90580940246582, "global_step": 151087, "epoch": 3597} {"train_loss": -6.840283393859863, "global_step": 151088, "epoch": 3597} {"train_loss": -6.927077293395996, "global_step": 151089, "epoch": 3597} {"train_loss": -6.882191181182861, "global_step": 151090, "epoch": 3597} {"train_loss": -6.753605842590332, "global_step": 151091, "epoch": 3597} {"train_loss": -6.96083927154541, "global_step": 151092, "epoch": 3597} {"train_loss": -7.01165771484375, "global_step": 151093, "epoch": 3597} {"train_loss": -6.854328155517578, "global_step": 151094, "epoch": 3597} {"train_loss": -6.835524559020996, "global_step": 151095, "epoch": 3597} {"train_loss": -6.936857223510742, "global_step": 151096, "epoch": 3597} {"train_loss": -6.885037422180176, "global_step": 151097, "epoch": 3597} {"train_loss": -6.843430995941162, "global_step": 151098, "epoch": 3597} {"train_loss": -6.93864631652832, "global_step": 151099, "epoch": 3597} {"train_loss": -6.74237585067749, "global_step": 151100, "epoch": 3597} {"train_loss": -6.778748989105225, "global_step": 151101, "epoch": 3597} {"train_loss": -6.951742172241211, "global_step": 151102, "epoch": 3597} {"train_loss": -6.784285068511963, "global_step": 151103, "epoch": 3597} {"train_loss": -6.8615288734436035, "global_step": 151104, "epoch": 3597} {"train_loss": -6.91233491897583, "global_step": 151105, "epoch": 3597} {"train_loss": -6.747011661529541, "global_step": 151106, "epoch": 3597} {"train_loss": -6.781036376953125, "global_step": 151107, "epoch": 3597} {"train_loss": -6.898505210876465, "global_step": 151108, "epoch": 3597} {"train_loss": -6.880290508270264, "global_step": 151109, "epoch": 3597} {"train_loss": -6.916842460632324, "global_step": 151110, "epoch": 3597} {"train_loss": -6.798234939575195, "global_step": 151111, "epoch": 3597} {"train_loss": -6.9214253425598145, "global_step": 151112, "epoch": 3597} {"train_loss": -6.9276533126831055, "global_step": 151113, "epoch": 3597} {"train_loss": -6.887238502502441, "global_step": 151114, "epoch": 3597} {"train_loss": -6.881520055589222, "global_step": 151115, "epoch": 3597, "val_loss": 68051.296875} {"train_loss": -7.013645172119141, "global_step": 151116, "epoch": 3598} {"train_loss": -6.959362983703613, "global_step": 151117, "epoch": 3598} {"train_loss": -6.860027313232422, "global_step": 151118, "epoch": 3598} {"train_loss": -7.0008344650268555, "global_step": 151119, "epoch": 3598} {"train_loss": -6.923933029174805, "global_step": 151120, "epoch": 3598} {"train_loss": -6.930126190185547, "global_step": 151121, "epoch": 3598} {"train_loss": -6.887228488922119, "global_step": 151122, "epoch": 3598} {"train_loss": -6.945344924926758, "global_step": 151123, "epoch": 3598} {"train_loss": -6.9008469581604, "global_step": 151124, "epoch": 3598} {"train_loss": -6.818284034729004, "global_step": 151125, "epoch": 3598} {"train_loss": -6.858807563781738, "global_step": 151126, "epoch": 3598} {"train_loss": -6.9386396408081055, "global_step": 151127, "epoch": 3598} {"train_loss": -6.8527913093566895, "global_step": 151128, "epoch": 3598} {"train_loss": -6.877199649810791, "global_step": 151129, "epoch": 3598} {"train_loss": -6.848913669586182, "global_step": 151130, "epoch": 3598} {"train_loss": -6.966391563415527, "global_step": 151131, "epoch": 3598} {"train_loss": -6.917799949645996, "global_step": 151132, "epoch": 3598} {"train_loss": -6.99168062210083, "global_step": 151133, "epoch": 3598} {"train_loss": -6.979371070861816, "global_step": 151134, "epoch": 3598} {"train_loss": -6.82496976852417, "global_step": 151135, "epoch": 3598} {"train_loss": -6.814140319824219, "global_step": 151136, "epoch": 3598} {"train_loss": -6.903306007385254, "global_step": 151137, "epoch": 3598} {"train_loss": -6.817739009857178, "global_step": 151138, "epoch": 3598} {"train_loss": -6.7621541023254395, "global_step": 151139, "epoch": 3598} {"train_loss": -6.89986515045166, "global_step": 151140, "epoch": 3598} {"train_loss": -6.866665840148926, "global_step": 151141, "epoch": 3598} {"train_loss": -6.828052520751953, "global_step": 151142, "epoch": 3598} {"train_loss": -6.813250541687012, "global_step": 151143, "epoch": 3598} {"train_loss": -6.928866386413574, "global_step": 151144, "epoch": 3598} {"train_loss": -6.7628302574157715, "global_step": 151145, "epoch": 3598} {"train_loss": -6.924966812133789, "global_step": 151146, "epoch": 3598} {"train_loss": -6.673849582672119, "global_step": 151147, "epoch": 3598} {"train_loss": -6.7562408447265625, "global_step": 151148, "epoch": 3598} {"train_loss": -6.83863639831543, "global_step": 151149, "epoch": 3598} {"train_loss": -6.779871463775635, "global_step": 151150, "epoch": 3598} {"train_loss": -6.721390724182129, "global_step": 151151, "epoch": 3598} {"train_loss": -6.837855815887451, "global_step": 151152, "epoch": 3598} {"train_loss": -6.728979587554932, "global_step": 151153, "epoch": 3598} {"train_loss": -6.743869781494141, "global_step": 151154, "epoch": 3598} {"train_loss": -6.745935440063477, "global_step": 151155, "epoch": 3598} {"train_loss": -6.818520545959473, "global_step": 151156, "epoch": 3598} {"train_loss": -6.8569190956297374, "global_step": 151157, "epoch": 3598, "val_loss": 68069.0859375} {"train_loss": -6.8527936935424805, "global_step": 151158, "epoch": 3599} {"train_loss": -6.803378105163574, "global_step": 151159, "epoch": 3599} {"train_loss": -6.80620002746582, "global_step": 151160, "epoch": 3599} {"train_loss": -6.700880527496338, "global_step": 151161, "epoch": 3599} {"train_loss": -6.640361785888672, "global_step": 151162, "epoch": 3599} {"train_loss": -6.824243068695068, "global_step": 151163, "epoch": 3599} {"train_loss": -6.68479061126709, "global_step": 151164, "epoch": 3599} {"train_loss": -6.717261791229248, "global_step": 151165, "epoch": 3599} {"train_loss": -6.875359535217285, "global_step": 151166, "epoch": 3599} {"train_loss": -6.805179119110107, "global_step": 151167, "epoch": 3599} {"train_loss": -6.773885726928711, "global_step": 151168, "epoch": 3599} {"train_loss": -6.8690595626831055, "global_step": 151169, "epoch": 3599} {"train_loss": -6.762348175048828, "global_step": 151170, "epoch": 3599} {"train_loss": -6.909514904022217, "global_step": 151171, "epoch": 3599} {"train_loss": -6.886260986328125, "global_step": 151172, "epoch": 3599} {"train_loss": -6.858964920043945, "global_step": 151173, "epoch": 3599} {"train_loss": -6.813749313354492, "global_step": 151174, "epoch": 3599} {"train_loss": -6.816007614135742, "global_step": 151175, "epoch": 3599} {"train_loss": -6.884206771850586, "global_step": 151176, "epoch": 3599} {"train_loss": -6.826169013977051, "global_step": 151177, "epoch": 3599} {"train_loss": -6.820863246917725, "global_step": 151178, "epoch": 3599} {"train_loss": -6.880153656005859, "global_step": 151179, "epoch": 3599} {"train_loss": -6.8111982345581055, "global_step": 151180, "epoch": 3599} {"train_loss": -6.927909851074219, "global_step": 151181, "epoch": 3599} {"train_loss": -6.873668670654297, "global_step": 151182, "epoch": 3599} {"train_loss": -6.810445785522461, "global_step": 151183, "epoch": 3599} {"train_loss": -6.908153533935547, "global_step": 151184, "epoch": 3599} {"train_loss": -6.964734077453613, "global_step": 151185, "epoch": 3599} {"train_loss": -6.9813690185546875, "global_step": 151186, "epoch": 3599} {"train_loss": -6.861978530883789, "global_step": 151187, "epoch": 3599} {"train_loss": -6.822779655456543, "global_step": 151188, "epoch": 3599} {"train_loss": -7.028961181640625, "global_step": 151189, "epoch": 3599} {"train_loss": -6.9120025634765625, "global_step": 151190, "epoch": 3599} {"train_loss": -6.829633712768555, "global_step": 151191, "epoch": 3599} {"train_loss": -6.868979454040527, "global_step": 151192, "epoch": 3599} {"train_loss": -6.799766540527344, "global_step": 151193, "epoch": 3599} {"train_loss": -6.780315399169922, "global_step": 151194, "epoch": 3599} {"train_loss": -6.843649864196777, "global_step": 151195, "epoch": 3599} {"train_loss": -6.678847312927246, "global_step": 151196, "epoch": 3599} {"train_loss": -6.8762664794921875, "global_step": 151197, "epoch": 3599} {"train_loss": -6.84155797958374, "global_step": 151198, "epoch": 3599} {"train_loss": -6.8353274549756735, "global_step": 151199, "epoch": 3599, "val_loss": 68079.2734375} {"train_loss": -6.789499282836914, "global_step": 151200, "epoch": 3600} {"train_loss": -6.775652885437012, "global_step": 151201, "epoch": 3600} {"train_loss": -6.911518096923828, "global_step": 151202, "epoch": 3600} {"train_loss": -6.904870986938477, "global_step": 151203, "epoch": 3600} {"train_loss": -6.850391387939453, "global_step": 151204, "epoch": 3600} {"train_loss": -6.914441108703613, "global_step": 151205, "epoch": 3600} {"train_loss": -6.844271659851074, "global_step": 151206, "epoch": 3600} {"train_loss": -6.843146324157715, "global_step": 151207, "epoch": 3600} {"train_loss": -6.912936210632324, "global_step": 151208, "epoch": 3600} {"train_loss": -6.947080612182617, "global_step": 151209, "epoch": 3600} {"train_loss": -6.822861671447754, "global_step": 151210, "epoch": 3600} {"train_loss": -6.798746585845947, "global_step": 151211, "epoch": 3600} {"train_loss": -6.825035095214844, "global_step": 151212, "epoch": 3600} {"train_loss": -6.903313636779785, "global_step": 151213, "epoch": 3600} {"train_loss": -6.824260711669922, "global_step": 151214, "epoch": 3600} {"train_loss": -6.832936763763428, "global_step": 151215, "epoch": 3600} {"train_loss": -6.849470138549805, "global_step": 151216, "epoch": 3600} {"train_loss": -6.833350658416748, "global_step": 151217, "epoch": 3600} {"train_loss": -6.873640537261963, "global_step": 151218, "epoch": 3600} {"train_loss": -6.900354862213135, "global_step": 151219, "epoch": 3600} {"train_loss": -6.927217483520508, "global_step": 151220, "epoch": 3600} {"train_loss": -7.000873565673828, "global_step": 151221, "epoch": 3600} {"train_loss": -6.864652633666992, "global_step": 151222, "epoch": 3600} {"train_loss": -6.885513782501221, "global_step": 151223, "epoch": 3600} {"train_loss": -6.816586017608643, "global_step": 151224, "epoch": 3600} {"train_loss": -6.806458950042725, "global_step": 151225, "epoch": 3600} {"train_loss": -6.871610641479492, "global_step": 151226, "epoch": 3600} {"train_loss": -6.866495132446289, "global_step": 151227, "epoch": 3600} {"train_loss": -6.888789176940918, "global_step": 151228, "epoch": 3600} {"train_loss": -7.009401321411133, "global_step": 151229, "epoch": 3600} {"train_loss": -6.854619026184082, "global_step": 151230, "epoch": 3600} {"train_loss": -6.915203094482422, "global_step": 151231, "epoch": 3600} {"train_loss": -6.882424354553223, "global_step": 151232, "epoch": 3600} {"train_loss": -6.927027225494385, "global_step": 151233, "epoch": 3600} {"train_loss": -6.9615278244018555, "global_step": 151234, "epoch": 3600} {"train_loss": -6.844602108001709, "global_step": 151235, "epoch": 3600} {"train_loss": -6.877666473388672, "global_step": 151236, "epoch": 3600} {"train_loss": -6.849055767059326, "global_step": 151237, "epoch": 3600} {"train_loss": -6.768590927124023, "global_step": 151238, "epoch": 3600} {"train_loss": -6.856438636779785, "global_step": 151239, "epoch": 3600} {"train_loss": -6.770891189575195, "global_step": 151240, "epoch": 3600} {"train_loss": -6.864022947493053, "global_step": 151241, "epoch": 3600, "train/sim_max_reward_0": 0.9094572242609533, "train/sim_max_reward_1": 0.3147579337812027, "train/sim_max_reward_2": 0.881752928282457, "train/sim_max_reward_3": 0.1802776786542253, "train/sim_max_reward_4": 0.9468054013434629, "train/sim_max_reward_5": 0.5172610191381948, "test/sim_max_reward_4300000": 0.23952134587310203, "test/sim_max_reward_4300001": 0.19756854278039745, "test/sim_max_reward_4300002": 0.9660779344230829, "test/sim_max_reward_4300003": 0.9896054304623918, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9903409210840753, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9491431831311906, "test/sim_max_reward_4300008": 0.8781449632972573, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.9087693046001882, "test/sim_max_reward_4300011": 0.9920788683433931, "test/sim_max_reward_4300012": 0.8000505116362201, "test/sim_max_reward_4300013": 0.9492228156025981, "test/sim_max_reward_4300014": 0.9794486200767467, "test/sim_max_reward_4300015": 0.910799165286599, "test/sim_max_reward_4300016": 1.0, "test/sim_max_reward_4300017": 0.9506822569708623, "test/sim_max_reward_4300018": 0.9902035739747107, "test/sim_max_reward_4300019": 0.18601009622428719, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8959362446512684, "test/sim_max_reward_4300022": 0.8552953249032818, "test/sim_max_reward_4300023": 0.36544695700968477, "test/sim_max_reward_4300024": 0.9143223908124295, "test/sim_max_reward_4300025": 0.9442709478781665, "test/sim_max_reward_4300026": 0.17718759817385016, "test/sim_max_reward_4300027": 0.8874982795382796, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.26297487655926727, "test/sim_max_reward_4300031": 0.42536616574160574, "test/sim_max_reward_4300032": 0.9548491611464638, "test/sim_max_reward_4300033": 0.9045439359760303, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9915092717197334, "test/sim_max_reward_4300038": 0.934272419361432, "test/sim_max_reward_4300039": 0.8101631763573514, "test/sim_max_reward_4300040": 0.9148570196947388, "test/sim_max_reward_4300041": 0.8793113900433074, "test/sim_max_reward_4300042": 0.4582201969224223, "test/sim_max_reward_4300043": 0.13050790300363327, "test/sim_max_reward_4300044": 0.870885475002855, "test/sim_max_reward_4300045": 1.0, "test/sim_max_reward_4300046": 0.2122446163593964, "test/sim_max_reward_4300047": 0.2204064562284453, "test/sim_max_reward_4300048": 0.9053442558888115, "test/sim_max_reward_4300049": 0.21454454254419125, "train/mean_score": 0.6250520309100827, "test/mean_score": 0.6244530871931303, "val_loss": 68267.265625} {"train_loss": -6.869269371032715, "global_step": 151242, "epoch": 3601} {"train_loss": -6.566032409667969, "global_step": 151243, "epoch": 3601} {"train_loss": -6.869338035583496, "global_step": 151244, "epoch": 3601} {"train_loss": -6.7725830078125, "global_step": 151245, "epoch": 3601} {"train_loss": -6.740002632141113, "global_step": 151246, "epoch": 3601} {"train_loss": -6.468364715576172, "global_step": 151247, "epoch": 3601} {"train_loss": -6.679429054260254, "global_step": 151248, "epoch": 3601} {"train_loss": -6.53299617767334, "global_step": 151249, "epoch": 3601} {"train_loss": -6.794796943664551, "global_step": 151250, "epoch": 3601} {"train_loss": -6.650965690612793, "global_step": 151251, "epoch": 3601} {"train_loss": -6.609080791473389, "global_step": 151252, "epoch": 3601} {"train_loss": -6.708345413208008, "global_step": 151253, "epoch": 3601} {"train_loss": -6.606791019439697, "global_step": 151254, "epoch": 3601} {"train_loss": -6.676602840423584, "global_step": 151255, "epoch": 3601} {"train_loss": -6.760098457336426, "global_step": 151256, "epoch": 3601} {"train_loss": -6.701479911804199, "global_step": 151257, "epoch": 3601} {"train_loss": -6.675459384918213, "global_step": 151258, "epoch": 3601} {"train_loss": -6.842714786529541, "global_step": 151259, "epoch": 3601} {"train_loss": -6.801849365234375, "global_step": 151260, "epoch": 3601} {"train_loss": -6.744012355804443, "global_step": 151261, "epoch": 3601} {"train_loss": -6.777632236480713, "global_step": 151262, "epoch": 3601} {"train_loss": -6.847688674926758, "global_step": 151263, "epoch": 3601} {"train_loss": -6.694900989532471, "global_step": 151264, "epoch": 3601} {"train_loss": -6.816893100738525, "global_step": 151265, "epoch": 3601} {"train_loss": -6.749734878540039, "global_step": 151266, "epoch": 3601} {"train_loss": -6.807995796203613, "global_step": 151267, "epoch": 3601} {"train_loss": -6.75203275680542, "global_step": 151268, "epoch": 3601} {"train_loss": -6.788804054260254, "global_step": 151269, "epoch": 3601} {"train_loss": -6.807363986968994, "global_step": 151270, "epoch": 3601} {"train_loss": -6.9548258781433105, "global_step": 151271, "epoch": 3601} {"train_loss": -6.902392387390137, "global_step": 151272, "epoch": 3601} {"train_loss": -6.829213619232178, "global_step": 151273, "epoch": 3601} {"train_loss": -6.78388786315918, "global_step": 151274, "epoch": 3601} {"train_loss": -6.793614864349365, "global_step": 151275, "epoch": 3601} {"train_loss": -6.787036895751953, "global_step": 151276, "epoch": 3601} {"train_loss": -6.773313522338867, "global_step": 151277, "epoch": 3601} {"train_loss": -6.91874885559082, "global_step": 151278, "epoch": 3601} {"train_loss": -6.783900260925293, "global_step": 151279, "epoch": 3601} {"train_loss": -6.824231147766113, "global_step": 151280, "epoch": 3601} {"train_loss": -6.712518692016602, "global_step": 151281, "epoch": 3601} {"train_loss": -6.881643295288086, "global_step": 151282, "epoch": 3601} {"train_loss": -6.755097218922207, "global_step": 151283, "epoch": 3601, "val_loss": 67932.828125} {"train_loss": -6.844836711883545, "global_step": 151284, "epoch": 3602} {"train_loss": -6.620728015899658, "global_step": 151285, "epoch": 3602} {"train_loss": -6.933432579040527, "global_step": 151286, "epoch": 3602} {"train_loss": -6.734467506408691, "global_step": 151287, "epoch": 3602} {"train_loss": -6.972916126251221, "global_step": 151288, "epoch": 3602} {"train_loss": -6.7691497802734375, "global_step": 151289, "epoch": 3602} {"train_loss": -6.7617034912109375, "global_step": 151290, "epoch": 3602} {"train_loss": -6.613385200500488, "global_step": 151291, "epoch": 3602} {"train_loss": -6.868200302124023, "global_step": 151292, "epoch": 3602} {"train_loss": -6.709197998046875, "global_step": 151293, "epoch": 3602} {"train_loss": -6.849206447601318, "global_step": 151294, "epoch": 3602} {"train_loss": -6.624304294586182, "global_step": 151295, "epoch": 3602} {"train_loss": -6.811358451843262, "global_step": 151296, "epoch": 3602} {"train_loss": -6.768611907958984, "global_step": 151297, "epoch": 3602} {"train_loss": -6.801210403442383, "global_step": 151298, "epoch": 3602} {"train_loss": -6.766283988952637, "global_step": 151299, "epoch": 3602} {"train_loss": -6.909290313720703, "global_step": 151300, "epoch": 3602} {"train_loss": -6.653716087341309, "global_step": 151301, "epoch": 3602} {"train_loss": -6.900152683258057, "global_step": 151302, "epoch": 3602} {"train_loss": -6.61251163482666, "global_step": 151303, "epoch": 3602} {"train_loss": -6.833077430725098, "global_step": 151304, "epoch": 3602} {"train_loss": -6.793808937072754, "global_step": 151305, "epoch": 3602} {"train_loss": -6.840299606323242, "global_step": 151306, "epoch": 3602} {"train_loss": -6.76912784576416, "global_step": 151307, "epoch": 3602} {"train_loss": -6.8450608253479, "global_step": 151308, "epoch": 3602} {"train_loss": -6.73964262008667, "global_step": 151309, "epoch": 3602} {"train_loss": -6.761105537414551, "global_step": 151310, "epoch": 3602} {"train_loss": -6.83327579498291, "global_step": 151311, "epoch": 3602} {"train_loss": -6.8467230796813965, "global_step": 151312, "epoch": 3602} {"train_loss": -6.741129398345947, "global_step": 151313, "epoch": 3602} {"train_loss": -6.952207565307617, "global_step": 151314, "epoch": 3602} {"train_loss": -6.810118675231934, "global_step": 151315, "epoch": 3602} {"train_loss": -6.928945064544678, "global_step": 151316, "epoch": 3602} {"train_loss": -6.784904956817627, "global_step": 151317, "epoch": 3602} {"train_loss": -6.811389446258545, "global_step": 151318, "epoch": 3602} {"train_loss": -6.917933940887451, "global_step": 151319, "epoch": 3602} {"train_loss": -6.898299694061279, "global_step": 151320, "epoch": 3602} {"train_loss": -6.888519287109375, "global_step": 151321, "epoch": 3602} {"train_loss": -6.8282470703125, "global_step": 151322, "epoch": 3602} {"train_loss": -6.869827747344971, "global_step": 151323, "epoch": 3602} {"train_loss": -6.845175743103027, "global_step": 151324, "epoch": 3602} {"train_loss": -6.80648272378104, "global_step": 151325, "epoch": 3602, "val_loss": 67919.265625} {"train_loss": -6.783784866333008, "global_step": 151326, "epoch": 3603} {"train_loss": -6.893932342529297, "global_step": 151327, "epoch": 3603} {"train_loss": -6.973701477050781, "global_step": 151328, "epoch": 3603} {"train_loss": -6.918878555297852, "global_step": 151329, "epoch": 3603} {"train_loss": -6.878046035766602, "global_step": 151330, "epoch": 3603} {"train_loss": -6.855983257293701, "global_step": 151331, "epoch": 3603} {"train_loss": -6.864508628845215, "global_step": 151332, "epoch": 3603} {"train_loss": -6.83017635345459, "global_step": 151333, "epoch": 3603} {"train_loss": -6.820876598358154, "global_step": 151334, "epoch": 3603} {"train_loss": -6.9971771240234375, "global_step": 151335, "epoch": 3603} {"train_loss": -6.99655818939209, "global_step": 151336, "epoch": 3603} {"train_loss": -6.919666290283203, "global_step": 151337, "epoch": 3603} {"train_loss": -6.870790004730225, "global_step": 151338, "epoch": 3603} {"train_loss": -6.916542053222656, "global_step": 151339, "epoch": 3603} {"train_loss": -6.8935627937316895, "global_step": 151340, "epoch": 3603} {"train_loss": -6.787055969238281, "global_step": 151341, "epoch": 3603} {"train_loss": -6.7912797927856445, "global_step": 151342, "epoch": 3603} {"train_loss": -6.863481521606445, "global_step": 151343, "epoch": 3603} {"train_loss": -6.856779098510742, "global_step": 151344, "epoch": 3603} {"train_loss": -6.777097702026367, "global_step": 151345, "epoch": 3603} {"train_loss": -6.8742523193359375, "global_step": 151346, "epoch": 3603} {"train_loss": -6.799692630767822, "global_step": 151347, "epoch": 3603} {"train_loss": -6.881907939910889, "global_step": 151348, "epoch": 3603} {"train_loss": -6.860597610473633, "global_step": 151349, "epoch": 3603} {"train_loss": -6.931497573852539, "global_step": 151350, "epoch": 3603} {"train_loss": -6.871735572814941, "global_step": 151351, "epoch": 3603} {"train_loss": -6.849508285522461, "global_step": 151352, "epoch": 3603} {"train_loss": -6.933928489685059, "global_step": 151353, "epoch": 3603} {"train_loss": -6.8807759284973145, "global_step": 151354, "epoch": 3603} {"train_loss": -6.967746734619141, "global_step": 151355, "epoch": 3603} {"train_loss": -6.839444160461426, "global_step": 151356, "epoch": 3603} {"train_loss": -6.9352898597717285, "global_step": 151357, "epoch": 3603} {"train_loss": -6.917292594909668, "global_step": 151358, "epoch": 3603} {"train_loss": -6.8671417236328125, "global_step": 151359, "epoch": 3603} {"train_loss": -6.757869720458984, "global_step": 151360, "epoch": 3603} {"train_loss": -6.895116329193115, "global_step": 151361, "epoch": 3603} {"train_loss": -6.804129600524902, "global_step": 151362, "epoch": 3603} {"train_loss": -6.872450828552246, "global_step": 151363, "epoch": 3603} {"train_loss": -6.902074813842773, "global_step": 151364, "epoch": 3603} {"train_loss": -6.682822227478027, "global_step": 151365, "epoch": 3603} {"train_loss": -6.880516052246094, "global_step": 151366, "epoch": 3603} {"train_loss": -6.871413060597011, "global_step": 151367, "epoch": 3603, "val_loss": 67993.375} {"train_loss": -6.787592887878418, "global_step": 151368, "epoch": 3604} {"train_loss": -6.919729232788086, "global_step": 151369, "epoch": 3604} {"train_loss": -6.931899070739746, "global_step": 151370, "epoch": 3604} {"train_loss": -6.887659072875977, "global_step": 151371, "epoch": 3604} {"train_loss": -6.812648773193359, "global_step": 151372, "epoch": 3604} {"train_loss": -6.841756820678711, "global_step": 151373, "epoch": 3604} {"train_loss": -6.945479869842529, "global_step": 151374, "epoch": 3604} {"train_loss": -6.960415840148926, "global_step": 151375, "epoch": 3604} {"train_loss": -6.860693454742432, "global_step": 151376, "epoch": 3604} {"train_loss": -6.863901138305664, "global_step": 151377, "epoch": 3604} {"train_loss": -6.946414947509766, "global_step": 151378, "epoch": 3604} {"train_loss": -6.890030384063721, "global_step": 151379, "epoch": 3604} {"train_loss": -6.914119243621826, "global_step": 151380, "epoch": 3604} {"train_loss": -6.971274375915527, "global_step": 151381, "epoch": 3604} {"train_loss": -6.819043159484863, "global_step": 151382, "epoch": 3604} {"train_loss": -6.672516822814941, "global_step": 151383, "epoch": 3604} {"train_loss": -6.9013566970825195, "global_step": 151384, "epoch": 3604} {"train_loss": -6.769432067871094, "global_step": 151385, "epoch": 3604} {"train_loss": -6.706060409545898, "global_step": 151386, "epoch": 3604} {"train_loss": -6.901027679443359, "global_step": 151387, "epoch": 3604} {"train_loss": -6.687353134155273, "global_step": 151388, "epoch": 3604} {"train_loss": -6.812328815460205, "global_step": 151389, "epoch": 3604} {"train_loss": -6.808038711547852, "global_step": 151390, "epoch": 3604} {"train_loss": -6.848156929016113, "global_step": 151391, "epoch": 3604} {"train_loss": -6.901699542999268, "global_step": 151392, "epoch": 3604} {"train_loss": -6.815394401550293, "global_step": 151393, "epoch": 3604} {"train_loss": -6.8848066329956055, "global_step": 151394, "epoch": 3604} {"train_loss": -6.979290962219238, "global_step": 151395, "epoch": 3604} {"train_loss": -6.924114227294922, "global_step": 151396, "epoch": 3604} {"train_loss": -6.914324760437012, "global_step": 151397, "epoch": 3604} {"train_loss": -6.810927391052246, "global_step": 151398, "epoch": 3604} {"train_loss": -6.877129554748535, "global_step": 151399, "epoch": 3604} {"train_loss": -6.968830108642578, "global_step": 151400, "epoch": 3604} {"train_loss": -6.847043037414551, "global_step": 151401, "epoch": 3604} {"train_loss": -6.891983985900879, "global_step": 151402, "epoch": 3604} {"train_loss": -6.783990383148193, "global_step": 151403, "epoch": 3604} {"train_loss": -6.799727439880371, "global_step": 151404, "epoch": 3604} {"train_loss": -6.826767921447754, "global_step": 151405, "epoch": 3604} {"train_loss": -6.826180458068848, "global_step": 151406, "epoch": 3604} {"train_loss": -6.878262519836426, "global_step": 151407, "epoch": 3604} {"train_loss": -6.92952823638916, "global_step": 151408, "epoch": 3604} {"train_loss": -6.857248976117089, "global_step": 151409, "epoch": 3604, "val_loss": 68023.5625} {"train_loss": -6.9369049072265625, "global_step": 151410, "epoch": 3605} {"train_loss": -6.918415069580078, "global_step": 151411, "epoch": 3605} {"train_loss": -6.889273643493652, "global_step": 151412, "epoch": 3605} {"train_loss": -6.845760822296143, "global_step": 151413, "epoch": 3605} {"train_loss": -6.8812255859375, "global_step": 151414, "epoch": 3605} {"train_loss": -6.883610725402832, "global_step": 151415, "epoch": 3605} {"train_loss": -6.803257465362549, "global_step": 151416, "epoch": 3605} {"train_loss": -6.910243034362793, "global_step": 151417, "epoch": 3605} {"train_loss": -6.880234718322754, "global_step": 151418, "epoch": 3605} {"train_loss": -6.913537979125977, "global_step": 151419, "epoch": 3605} {"train_loss": -6.935019016265869, "global_step": 151420, "epoch": 3605} {"train_loss": -6.882584571838379, "global_step": 151421, "epoch": 3605} {"train_loss": -6.9312744140625, "global_step": 151422, "epoch": 3605} {"train_loss": -6.881126880645752, "global_step": 151423, "epoch": 3605} {"train_loss": -6.798715591430664, "global_step": 151424, "epoch": 3605} {"train_loss": -6.838738441467285, "global_step": 151425, "epoch": 3605} {"train_loss": -6.75655460357666, "global_step": 151426, "epoch": 3605} {"train_loss": -6.81002140045166, "global_step": 151427, "epoch": 3605} {"train_loss": -6.911932468414307, "global_step": 151428, "epoch": 3605} {"train_loss": -6.820615291595459, "global_step": 151429, "epoch": 3605} {"train_loss": -6.867398262023926, "global_step": 151430, "epoch": 3605} {"train_loss": -6.831735134124756, "global_step": 151431, "epoch": 3605} {"train_loss": -6.78798246383667, "global_step": 151432, "epoch": 3605} {"train_loss": -6.7796783447265625, "global_step": 151433, "epoch": 3605} {"train_loss": -6.8604888916015625, "global_step": 151434, "epoch": 3605} {"train_loss": -6.7815351486206055, "global_step": 151435, "epoch": 3605} {"train_loss": -6.918154716491699, "global_step": 151436, "epoch": 3605} {"train_loss": -6.84758186340332, "global_step": 151437, "epoch": 3605} {"train_loss": -6.816123008728027, "global_step": 151438, "epoch": 3605} {"train_loss": -6.8719048500061035, "global_step": 151439, "epoch": 3605} {"train_loss": -6.975100994110107, "global_step": 151440, "epoch": 3605} {"train_loss": -6.8699235916137695, "global_step": 151441, "epoch": 3605} {"train_loss": -6.889665603637695, "global_step": 151442, "epoch": 3605} {"train_loss": -6.981430530548096, "global_step": 151443, "epoch": 3605} {"train_loss": -6.898015975952148, "global_step": 151444, "epoch": 3605} {"train_loss": -6.9867143630981445, "global_step": 151445, "epoch": 3605} {"train_loss": -6.852602958679199, "global_step": 151446, "epoch": 3605} {"train_loss": -6.927712440490723, "global_step": 151447, "epoch": 3605} {"train_loss": -6.945835113525391, "global_step": 151448, "epoch": 3605} {"train_loss": -6.9118757247924805, "global_step": 151449, "epoch": 3605} {"train_loss": -6.8333234786987305, "global_step": 151450, "epoch": 3605} {"train_loss": -6.875172967002506, "global_step": 151451, "epoch": 3605, "val_loss": 68031.5390625} {"train_loss": -6.88455867767334, "global_step": 151452, "epoch": 3606} {"train_loss": -6.877466201782227, "global_step": 151453, "epoch": 3606} {"train_loss": -6.928462982177734, "global_step": 151454, "epoch": 3606} {"train_loss": -6.699862957000732, "global_step": 151455, "epoch": 3606} {"train_loss": -6.811552047729492, "global_step": 151456, "epoch": 3606} {"train_loss": -6.82242488861084, "global_step": 151457, "epoch": 3606} {"train_loss": -6.6897873878479, "global_step": 151458, "epoch": 3606} {"train_loss": -6.90228271484375, "global_step": 151459, "epoch": 3606} {"train_loss": -6.783745288848877, "global_step": 151460, "epoch": 3606} {"train_loss": -6.607399940490723, "global_step": 151461, "epoch": 3606} {"train_loss": -6.785104751586914, "global_step": 151462, "epoch": 3606} {"train_loss": -6.5990309715271, "global_step": 151463, "epoch": 3606} {"train_loss": -6.697793006896973, "global_step": 151464, "epoch": 3606} {"train_loss": -6.782395362854004, "global_step": 151465, "epoch": 3606} {"train_loss": -6.627305030822754, "global_step": 151466, "epoch": 3606} {"train_loss": -6.770016193389893, "global_step": 151467, "epoch": 3606} {"train_loss": -6.765539646148682, "global_step": 151468, "epoch": 3606} {"train_loss": -6.807766437530518, "global_step": 151469, "epoch": 3606} {"train_loss": -6.770880699157715, "global_step": 151470, "epoch": 3606} {"train_loss": -6.9366912841796875, "global_step": 151471, "epoch": 3606} {"train_loss": -6.739144802093506, "global_step": 151472, "epoch": 3606} {"train_loss": -6.875126838684082, "global_step": 151473, "epoch": 3606} {"train_loss": -6.73654842376709, "global_step": 151474, "epoch": 3606} {"train_loss": -6.838961601257324, "global_step": 151475, "epoch": 3606} {"train_loss": -6.7915191650390625, "global_step": 151476, "epoch": 3606} {"train_loss": -6.885566711425781, "global_step": 151477, "epoch": 3606} {"train_loss": -6.822257995605469, "global_step": 151478, "epoch": 3606} {"train_loss": -7.014091491699219, "global_step": 151479, "epoch": 3606} {"train_loss": -6.823594570159912, "global_step": 151480, "epoch": 3606} {"train_loss": -6.830904006958008, "global_step": 151481, "epoch": 3606} {"train_loss": -6.879420280456543, "global_step": 151482, "epoch": 3606} {"train_loss": -6.8815460205078125, "global_step": 151483, "epoch": 3606} {"train_loss": -6.897497177124023, "global_step": 151484, "epoch": 3606} {"train_loss": -6.829153060913086, "global_step": 151485, "epoch": 3606} {"train_loss": -6.825557708740234, "global_step": 151486, "epoch": 3606} {"train_loss": -6.736681938171387, "global_step": 151487, "epoch": 3606} {"train_loss": -6.742785453796387, "global_step": 151488, "epoch": 3606} {"train_loss": -6.868125915527344, "global_step": 151489, "epoch": 3606} {"train_loss": -6.795463562011719, "global_step": 151490, "epoch": 3606} {"train_loss": -6.695209503173828, "global_step": 151491, "epoch": 3606} {"train_loss": -6.904056072235107, "global_step": 151492, "epoch": 3606} {"train_loss": -6.805416356949579, "global_step": 151493, "epoch": 3606, "val_loss": 67992.984375} {"train_loss": -6.80922794342041, "global_step": 151494, "epoch": 3607} {"train_loss": -6.856839656829834, "global_step": 151495, "epoch": 3607} {"train_loss": -6.8603715896606445, "global_step": 151496, "epoch": 3607} {"train_loss": -6.9185309410095215, "global_step": 151497, "epoch": 3607} {"train_loss": -6.885743141174316, "global_step": 151498, "epoch": 3607} {"train_loss": -6.795999050140381, "global_step": 151499, "epoch": 3607} {"train_loss": -6.868978023529053, "global_step": 151500, "epoch": 3607} {"train_loss": -6.914736747741699, "global_step": 151501, "epoch": 3607} {"train_loss": -6.767693519592285, "global_step": 151502, "epoch": 3607} {"train_loss": -6.7315673828125, "global_step": 151503, "epoch": 3607} {"train_loss": -6.836760997772217, "global_step": 151504, "epoch": 3607} {"train_loss": -6.835046768188477, "global_step": 151505, "epoch": 3607} {"train_loss": -6.775019645690918, "global_step": 151506, "epoch": 3607} {"train_loss": -6.997888088226318, "global_step": 151507, "epoch": 3607} {"train_loss": -6.676177501678467, "global_step": 151508, "epoch": 3607} {"train_loss": -6.957498550415039, "global_step": 151509, "epoch": 3607} {"train_loss": -6.768527984619141, "global_step": 151510, "epoch": 3607} {"train_loss": -6.758908748626709, "global_step": 151511, "epoch": 3607} {"train_loss": -6.837456226348877, "global_step": 151512, "epoch": 3607} {"train_loss": -6.897083282470703, "global_step": 151513, "epoch": 3607} {"train_loss": -6.961719036102295, "global_step": 151514, "epoch": 3607} {"train_loss": -6.889557838439941, "global_step": 151515, "epoch": 3607} {"train_loss": -6.788168907165527, "global_step": 151516, "epoch": 3607} {"train_loss": -6.902020454406738, "global_step": 151517, "epoch": 3607} {"train_loss": -6.894946098327637, "global_step": 151518, "epoch": 3607} {"train_loss": -6.930130958557129, "global_step": 151519, "epoch": 3607} {"train_loss": -6.93477201461792, "global_step": 151520, "epoch": 3607} {"train_loss": -6.874670028686523, "global_step": 151521, "epoch": 3607} {"train_loss": -6.871729850769043, "global_step": 151522, "epoch": 3607} {"train_loss": -6.8759307861328125, "global_step": 151523, "epoch": 3607} {"train_loss": -6.976939678192139, "global_step": 151524, "epoch": 3607} {"train_loss": -6.939544200897217, "global_step": 151525, "epoch": 3607} {"train_loss": -6.875061988830566, "global_step": 151526, "epoch": 3607} {"train_loss": -6.924836158752441, "global_step": 151527, "epoch": 3607} {"train_loss": -6.915628910064697, "global_step": 151528, "epoch": 3607} {"train_loss": -6.864877700805664, "global_step": 151529, "epoch": 3607} {"train_loss": -6.868644714355469, "global_step": 151530, "epoch": 3607} {"train_loss": -6.982490539550781, "global_step": 151531, "epoch": 3607} {"train_loss": -6.904393672943115, "global_step": 151532, "epoch": 3607} {"train_loss": -6.894830703735352, "global_step": 151533, "epoch": 3607} {"train_loss": -7.117510795593262, "global_step": 151534, "epoch": 3607} {"train_loss": -6.874815259660993, "global_step": 151535, "epoch": 3607, "val_loss": 67947.3984375} {"train_loss": -6.944725513458252, "global_step": 151536, "epoch": 3608} {"train_loss": -6.923774719238281, "global_step": 151537, "epoch": 3608} {"train_loss": -6.932791709899902, "global_step": 151538, "epoch": 3608} {"train_loss": -6.9377288818359375, "global_step": 151539, "epoch": 3608} {"train_loss": -6.9418840408325195, "global_step": 151540, "epoch": 3608} {"train_loss": -6.950444221496582, "global_step": 151541, "epoch": 3608} {"train_loss": -6.884339332580566, "global_step": 151542, "epoch": 3608} {"train_loss": -6.870791912078857, "global_step": 151543, "epoch": 3608} {"train_loss": -6.939176082611084, "global_step": 151544, "epoch": 3608} {"train_loss": -6.852181434631348, "global_step": 151545, "epoch": 3608} {"train_loss": -6.883394718170166, "global_step": 151546, "epoch": 3608} {"train_loss": -6.950777053833008, "global_step": 151547, "epoch": 3608} {"train_loss": -6.830963134765625, "global_step": 151548, "epoch": 3608} {"train_loss": -6.859416961669922, "global_step": 151549, "epoch": 3608} {"train_loss": -6.933021545410156, "global_step": 151550, "epoch": 3608} {"train_loss": -7.04697322845459, "global_step": 151551, "epoch": 3608} {"train_loss": -6.860265254974365, "global_step": 151552, "epoch": 3608} {"train_loss": -6.904274940490723, "global_step": 151553, "epoch": 3608} {"train_loss": -6.950512409210205, "global_step": 151554, "epoch": 3608} {"train_loss": -6.903693199157715, "global_step": 151555, "epoch": 3608} {"train_loss": -6.950346946716309, "global_step": 151556, "epoch": 3608} {"train_loss": -6.924873352050781, "global_step": 151557, "epoch": 3608} {"train_loss": -6.994655132293701, "global_step": 151558, "epoch": 3608} {"train_loss": -6.8991289138793945, "global_step": 151559, "epoch": 3608} {"train_loss": -6.93483304977417, "global_step": 151560, "epoch": 3608} {"train_loss": -6.943138122558594, "global_step": 151561, "epoch": 3608} {"train_loss": -6.804695129394531, "global_step": 151562, "epoch": 3608} {"train_loss": -7.012678623199463, "global_step": 151563, "epoch": 3608} {"train_loss": -6.9803571701049805, "global_step": 151564, "epoch": 3608} {"train_loss": -6.973552703857422, "global_step": 151565, "epoch": 3608} {"train_loss": -6.8929572105407715, "global_step": 151566, "epoch": 3608} {"train_loss": -6.813323974609375, "global_step": 151567, "epoch": 3608} {"train_loss": -6.8718414306640625, "global_step": 151568, "epoch": 3608} {"train_loss": -6.934811592102051, "global_step": 151569, "epoch": 3608} {"train_loss": -6.8943562507629395, "global_step": 151570, "epoch": 3608} {"train_loss": -6.861252307891846, "global_step": 151571, "epoch": 3608} {"train_loss": -7.0087199211120605, "global_step": 151572, "epoch": 3608} {"train_loss": -6.696985244750977, "global_step": 151573, "epoch": 3608} {"train_loss": -6.6661272048950195, "global_step": 151574, "epoch": 3608} {"train_loss": -6.881158351898193, "global_step": 151575, "epoch": 3608} {"train_loss": -6.713225364685059, "global_step": 151576, "epoch": 3608} {"train_loss": -6.900844108490717, "global_step": 151577, "epoch": 3608, "val_loss": 68136.28125} {"train_loss": -6.842597484588623, "global_step": 151578, "epoch": 3609} {"train_loss": -6.810019493103027, "global_step": 151579, "epoch": 3609} {"train_loss": -6.891735076904297, "global_step": 151580, "epoch": 3609} {"train_loss": -6.998174667358398, "global_step": 151581, "epoch": 3609} {"train_loss": -6.914083480834961, "global_step": 151582, "epoch": 3609} {"train_loss": -6.885275840759277, "global_step": 151583, "epoch": 3609} {"train_loss": -6.7951459884643555, "global_step": 151584, "epoch": 3609} {"train_loss": -6.764225482940674, "global_step": 151585, "epoch": 3609} {"train_loss": -6.944639205932617, "global_step": 151586, "epoch": 3609} {"train_loss": -6.829015731811523, "global_step": 151587, "epoch": 3609} {"train_loss": -6.746445178985596, "global_step": 151588, "epoch": 3609} {"train_loss": -6.912787437438965, "global_step": 151589, "epoch": 3609} {"train_loss": -6.911102294921875, "global_step": 151590, "epoch": 3609} {"train_loss": -6.852049350738525, "global_step": 151591, "epoch": 3609} {"train_loss": -6.92252254486084, "global_step": 151592, "epoch": 3609} {"train_loss": -6.9139204025268555, "global_step": 151593, "epoch": 3609} {"train_loss": -6.988274574279785, "global_step": 151594, "epoch": 3609} {"train_loss": -6.882686614990234, "global_step": 151595, "epoch": 3609} {"train_loss": -6.844801902770996, "global_step": 151596, "epoch": 3609} {"train_loss": -6.87581729888916, "global_step": 151597, "epoch": 3609} {"train_loss": -6.784058094024658, "global_step": 151598, "epoch": 3609} {"train_loss": -6.867898464202881, "global_step": 151599, "epoch": 3609} {"train_loss": -6.8605451583862305, "global_step": 151600, "epoch": 3609} {"train_loss": -6.880186080932617, "global_step": 151601, "epoch": 3609} {"train_loss": -6.7090911865234375, "global_step": 151602, "epoch": 3609} {"train_loss": -6.925126552581787, "global_step": 151603, "epoch": 3609} {"train_loss": -6.835857391357422, "global_step": 151604, "epoch": 3609} {"train_loss": -6.825891494750977, "global_step": 151605, "epoch": 3609} {"train_loss": -6.860043048858643, "global_step": 151606, "epoch": 3609} {"train_loss": -6.8453521728515625, "global_step": 151607, "epoch": 3609} {"train_loss": -6.767940521240234, "global_step": 151608, "epoch": 3609} {"train_loss": -6.820662498474121, "global_step": 151609, "epoch": 3609} {"train_loss": -6.798464775085449, "global_step": 151610, "epoch": 3609} {"train_loss": -6.7213592529296875, "global_step": 151611, "epoch": 3609} {"train_loss": -6.823971271514893, "global_step": 151612, "epoch": 3609} {"train_loss": -6.960222244262695, "global_step": 151613, "epoch": 3609} {"train_loss": -6.870770454406738, "global_step": 151614, "epoch": 3609} {"train_loss": -6.892541885375977, "global_step": 151615, "epoch": 3609} {"train_loss": -6.9427947998046875, "global_step": 151616, "epoch": 3609} {"train_loss": -6.854818820953369, "global_step": 151617, "epoch": 3609} {"train_loss": -6.8532633781433105, "global_step": 151618, "epoch": 3609} {"train_loss": -6.859929731913975, "global_step": 151619, "epoch": 3609, "val_loss": 68265.0390625} {"train_loss": -6.841967582702637, "global_step": 151620, "epoch": 3610} {"train_loss": -6.877686977386475, "global_step": 151621, "epoch": 3610} {"train_loss": -6.801165580749512, "global_step": 151622, "epoch": 3610} {"train_loss": -6.916540145874023, "global_step": 151623, "epoch": 3610} {"train_loss": -6.841917514801025, "global_step": 151624, "epoch": 3610} {"train_loss": -6.821321487426758, "global_step": 151625, "epoch": 3610} {"train_loss": -6.897069454193115, "global_step": 151626, "epoch": 3610} {"train_loss": -6.873113632202148, "global_step": 151627, "epoch": 3610} {"train_loss": -6.955079555511475, "global_step": 151628, "epoch": 3610} {"train_loss": -6.891489028930664, "global_step": 151629, "epoch": 3610} {"train_loss": -6.8568525314331055, "global_step": 151630, "epoch": 3610} {"train_loss": -6.927818298339844, "global_step": 151631, "epoch": 3610} {"train_loss": -6.955479621887207, "global_step": 151632, "epoch": 3610} {"train_loss": -7.049872398376465, "global_step": 151633, "epoch": 3610} {"train_loss": -6.856319904327393, "global_step": 151634, "epoch": 3610} {"train_loss": -6.921143531799316, "global_step": 151635, "epoch": 3610} {"train_loss": -6.88238525390625, "global_step": 151636, "epoch": 3610} {"train_loss": -6.923901557922363, "global_step": 151637, "epoch": 3610} {"train_loss": -6.866072654724121, "global_step": 151638, "epoch": 3610} {"train_loss": -6.808090686798096, "global_step": 151639, "epoch": 3610} {"train_loss": -7.040584564208984, "global_step": 151640, "epoch": 3610} {"train_loss": -6.800987720489502, "global_step": 151641, "epoch": 3610} {"train_loss": -7.025200843811035, "global_step": 151642, "epoch": 3610} {"train_loss": -6.852197647094727, "global_step": 151643, "epoch": 3610} {"train_loss": -6.915889739990234, "global_step": 151644, "epoch": 3610} {"train_loss": -6.9481425285339355, "global_step": 151645, "epoch": 3610} {"train_loss": -6.911184310913086, "global_step": 151646, "epoch": 3610} {"train_loss": -6.918209552764893, "global_step": 151647, "epoch": 3610} {"train_loss": -6.966281890869141, "global_step": 151648, "epoch": 3610} {"train_loss": -6.926793575286865, "global_step": 151649, "epoch": 3610} {"train_loss": -6.726968765258789, "global_step": 151650, "epoch": 3610} {"train_loss": -6.917547225952148, "global_step": 151651, "epoch": 3610} {"train_loss": -6.809186935424805, "global_step": 151652, "epoch": 3610} {"train_loss": -6.762485980987549, "global_step": 151653, "epoch": 3610} {"train_loss": -6.786959171295166, "global_step": 151654, "epoch": 3610} {"train_loss": -6.84230375289917, "global_step": 151655, "epoch": 3610} {"train_loss": -6.826642990112305, "global_step": 151656, "epoch": 3610} {"train_loss": -6.790039539337158, "global_step": 151657, "epoch": 3610} {"train_loss": -6.823017120361328, "global_step": 151658, "epoch": 3610} {"train_loss": -6.772601127624512, "global_step": 151659, "epoch": 3610} {"train_loss": -6.825713157653809, "global_step": 151660, "epoch": 3610} {"train_loss": -6.878506887526739, "global_step": 151661, "epoch": 3610, "val_loss": 67931.7109375} {"train_loss": -6.872440814971924, "global_step": 151662, "epoch": 3611} {"train_loss": -6.848620891571045, "global_step": 151663, "epoch": 3611} {"train_loss": -6.924868583679199, "global_step": 151664, "epoch": 3611} {"train_loss": -6.836360931396484, "global_step": 151665, "epoch": 3611} {"train_loss": -6.798399925231934, "global_step": 151666, "epoch": 3611} {"train_loss": -6.731325149536133, "global_step": 151667, "epoch": 3611} {"train_loss": -6.872544288635254, "global_step": 151668, "epoch": 3611} {"train_loss": -6.854620933532715, "global_step": 151669, "epoch": 3611} {"train_loss": -6.892784595489502, "global_step": 151670, "epoch": 3611} {"train_loss": -6.780437469482422, "global_step": 151671, "epoch": 3611} {"train_loss": -6.784028053283691, "global_step": 151672, "epoch": 3611} {"train_loss": -6.89946174621582, "global_step": 151673, "epoch": 3611} {"train_loss": -6.911048889160156, "global_step": 151674, "epoch": 3611} {"train_loss": -6.833606719970703, "global_step": 151675, "epoch": 3611} {"train_loss": -6.7818498611450195, "global_step": 151676, "epoch": 3611} {"train_loss": -6.963968276977539, "global_step": 151677, "epoch": 3611} {"train_loss": -6.985156536102295, "global_step": 151678, "epoch": 3611} {"train_loss": -6.755936622619629, "global_step": 151679, "epoch": 3611} {"train_loss": -6.913551330566406, "global_step": 151680, "epoch": 3611} {"train_loss": -6.802651882171631, "global_step": 151681, "epoch": 3611} {"train_loss": -6.865123748779297, "global_step": 151682, "epoch": 3611} {"train_loss": -6.931145191192627, "global_step": 151683, "epoch": 3611} {"train_loss": -6.964400291442871, "global_step": 151684, "epoch": 3611} {"train_loss": -6.855721473693848, "global_step": 151685, "epoch": 3611} {"train_loss": -6.875267028808594, "global_step": 151686, "epoch": 3611} {"train_loss": -6.835606098175049, "global_step": 151687, "epoch": 3611} {"train_loss": -6.963954925537109, "global_step": 151688, "epoch": 3611} {"train_loss": -6.8169660568237305, "global_step": 151689, "epoch": 3611} {"train_loss": -6.944123268127441, "global_step": 151690, "epoch": 3611} {"train_loss": -6.917734146118164, "global_step": 151691, "epoch": 3611} {"train_loss": -7.036908149719238, "global_step": 151692, "epoch": 3611} {"train_loss": -6.894351482391357, "global_step": 151693, "epoch": 3611} {"train_loss": -6.9354376792907715, "global_step": 151694, "epoch": 3611} {"train_loss": -6.9468674659729, "global_step": 151695, "epoch": 3611} {"train_loss": -6.912153244018555, "global_step": 151696, "epoch": 3611} {"train_loss": -6.813755989074707, "global_step": 151697, "epoch": 3611} {"train_loss": -6.827966690063477, "global_step": 151698, "epoch": 3611} {"train_loss": -6.835631370544434, "global_step": 151699, "epoch": 3611} {"train_loss": -6.87977409362793, "global_step": 151700, "epoch": 3611} {"train_loss": -6.870009422302246, "global_step": 151701, "epoch": 3611} {"train_loss": -6.92281436920166, "global_step": 151702, "epoch": 3611} {"train_loss": -6.877423831394741, "global_step": 151703, "epoch": 3611, "val_loss": 67868.3515625} {"train_loss": -6.92924690246582, "global_step": 151704, "epoch": 3612} {"train_loss": -6.785398006439209, "global_step": 151705, "epoch": 3612} {"train_loss": -6.926036834716797, "global_step": 151706, "epoch": 3612} {"train_loss": -6.910639762878418, "global_step": 151707, "epoch": 3612} {"train_loss": -6.813867568969727, "global_step": 151708, "epoch": 3612} {"train_loss": -6.844906806945801, "global_step": 151709, "epoch": 3612} {"train_loss": -6.6757636070251465, "global_step": 151710, "epoch": 3612} {"train_loss": -6.815391540527344, "global_step": 151711, "epoch": 3612} {"train_loss": -6.872461318969727, "global_step": 151712, "epoch": 3612} {"train_loss": -6.805912971496582, "global_step": 151713, "epoch": 3612} {"train_loss": -6.87272834777832, "global_step": 151714, "epoch": 3612} {"train_loss": -6.932919979095459, "global_step": 151715, "epoch": 3612} {"train_loss": -6.792941093444824, "global_step": 151716, "epoch": 3612} {"train_loss": -6.8860063552856445, "global_step": 151717, "epoch": 3612} {"train_loss": -6.857097625732422, "global_step": 151718, "epoch": 3612} {"train_loss": -6.796357154846191, "global_step": 151719, "epoch": 3612} {"train_loss": -6.965538501739502, "global_step": 151720, "epoch": 3612} {"train_loss": -6.955830097198486, "global_step": 151721, "epoch": 3612} {"train_loss": -6.901758670806885, "global_step": 151722, "epoch": 3612} {"train_loss": -6.9177961349487305, "global_step": 151723, "epoch": 3612} {"train_loss": -6.726078033447266, "global_step": 151724, "epoch": 3612} {"train_loss": -6.86832332611084, "global_step": 151725, "epoch": 3612} {"train_loss": -6.900234222412109, "global_step": 151726, "epoch": 3612} {"train_loss": -6.853664875030518, "global_step": 151727, "epoch": 3612} {"train_loss": -6.843191146850586, "global_step": 151728, "epoch": 3612} {"train_loss": -6.775357246398926, "global_step": 151729, "epoch": 3612} {"train_loss": -6.679445266723633, "global_step": 151730, "epoch": 3612} {"train_loss": -6.829318046569824, "global_step": 151731, "epoch": 3612} {"train_loss": -6.818214416503906, "global_step": 151732, "epoch": 3612} {"train_loss": -6.8474202156066895, "global_step": 151733, "epoch": 3612} {"train_loss": -6.809775352478027, "global_step": 151734, "epoch": 3612} {"train_loss": -6.770845890045166, "global_step": 151735, "epoch": 3612} {"train_loss": -6.701963424682617, "global_step": 151736, "epoch": 3612} {"train_loss": -6.702083587646484, "global_step": 151737, "epoch": 3612} {"train_loss": -6.851600646972656, "global_step": 151738, "epoch": 3612} {"train_loss": -6.739290237426758, "global_step": 151739, "epoch": 3612} {"train_loss": -6.8517656326293945, "global_step": 151740, "epoch": 3612} {"train_loss": -6.864531517028809, "global_step": 151741, "epoch": 3612} {"train_loss": -6.871652126312256, "global_step": 151742, "epoch": 3612} {"train_loss": -6.82435417175293, "global_step": 151743, "epoch": 3612} {"train_loss": -6.859416484832764, "global_step": 151744, "epoch": 3612} {"train_loss": -6.833513078235445, "global_step": 151745, "epoch": 3612, "val_loss": 68154.6328125} {"train_loss": -6.907885551452637, "global_step": 151746, "epoch": 3613} {"train_loss": -7.024958610534668, "global_step": 151747, "epoch": 3613} {"train_loss": -6.87347412109375, "global_step": 151748, "epoch": 3613} {"train_loss": -6.833890438079834, "global_step": 151749, "epoch": 3613} {"train_loss": -6.73041296005249, "global_step": 151750, "epoch": 3613} {"train_loss": -6.811491966247559, "global_step": 151751, "epoch": 3613} {"train_loss": -6.8432230949401855, "global_step": 151752, "epoch": 3613} {"train_loss": -6.863674163818359, "global_step": 151753, "epoch": 3613} {"train_loss": -6.863463401794434, "global_step": 151754, "epoch": 3613} {"train_loss": -6.93393611907959, "global_step": 151755, "epoch": 3613} {"train_loss": -6.900184631347656, "global_step": 151756, "epoch": 3613} {"train_loss": -6.940947532653809, "global_step": 151757, "epoch": 3613} {"train_loss": -6.904576301574707, "global_step": 151758, "epoch": 3613} {"train_loss": -6.801658630371094, "global_step": 151759, "epoch": 3613} {"train_loss": -6.840314865112305, "global_step": 151760, "epoch": 3613} {"train_loss": -6.789939880371094, "global_step": 151761, "epoch": 3613} {"train_loss": -6.892069339752197, "global_step": 151762, "epoch": 3613} {"train_loss": -6.840664863586426, "global_step": 151763, "epoch": 3613} {"train_loss": -6.797981262207031, "global_step": 151764, "epoch": 3613} {"train_loss": -6.967865467071533, "global_step": 151765, "epoch": 3613} {"train_loss": -6.800236701965332, "global_step": 151766, "epoch": 3613} {"train_loss": -6.889743804931641, "global_step": 151767, "epoch": 3613} {"train_loss": -6.863055229187012, "global_step": 151768, "epoch": 3613} {"train_loss": -6.892270088195801, "global_step": 151769, "epoch": 3613} {"train_loss": -6.763965606689453, "global_step": 151770, "epoch": 3613} {"train_loss": -6.912842750549316, "global_step": 151771, "epoch": 3613} {"train_loss": -6.840098857879639, "global_step": 151772, "epoch": 3613} {"train_loss": -6.879091262817383, "global_step": 151773, "epoch": 3613} {"train_loss": -6.865561485290527, "global_step": 151774, "epoch": 3613} {"train_loss": -6.691876411437988, "global_step": 151775, "epoch": 3613} {"train_loss": -6.740389823913574, "global_step": 151776, "epoch": 3613} {"train_loss": -6.7570343017578125, "global_step": 151777, "epoch": 3613} {"train_loss": -6.702657699584961, "global_step": 151778, "epoch": 3613} {"train_loss": -6.838745594024658, "global_step": 151779, "epoch": 3613} {"train_loss": -6.529620170593262, "global_step": 151780, "epoch": 3613} {"train_loss": -6.7376556396484375, "global_step": 151781, "epoch": 3613} {"train_loss": -6.607020378112793, "global_step": 151782, "epoch": 3613} {"train_loss": -6.738348484039307, "global_step": 151783, "epoch": 3613} {"train_loss": -6.640774726867676, "global_step": 151784, "epoch": 3613} {"train_loss": -6.713902950286865, "global_step": 151785, "epoch": 3613} {"train_loss": -6.844655990600586, "global_step": 151786, "epoch": 3613} {"train_loss": -6.816683678399949, "global_step": 151787, "epoch": 3613, "val_loss": 68022.609375} {"train_loss": -6.801325798034668, "global_step": 151788, "epoch": 3614} {"train_loss": -6.608240127563477, "global_step": 151789, "epoch": 3614} {"train_loss": -6.869867324829102, "global_step": 151790, "epoch": 3614} {"train_loss": -6.758148193359375, "global_step": 151791, "epoch": 3614} {"train_loss": -6.778378963470459, "global_step": 151792, "epoch": 3614} {"train_loss": -6.778580665588379, "global_step": 151793, "epoch": 3614} {"train_loss": -6.87409782409668, "global_step": 151794, "epoch": 3614} {"train_loss": -6.79846715927124, "global_step": 151795, "epoch": 3614} {"train_loss": -6.835488319396973, "global_step": 151796, "epoch": 3614} {"train_loss": -6.845766067504883, "global_step": 151797, "epoch": 3614} {"train_loss": -6.715005874633789, "global_step": 151798, "epoch": 3614} {"train_loss": -6.772267818450928, "global_step": 151799, "epoch": 3614} {"train_loss": -6.811321258544922, "global_step": 151800, "epoch": 3614} {"train_loss": -6.889406681060791, "global_step": 151801, "epoch": 3614} {"train_loss": -6.836499214172363, "global_step": 151802, "epoch": 3614} {"train_loss": -6.82821798324585, "global_step": 151803, "epoch": 3614} {"train_loss": -6.805751800537109, "global_step": 151804, "epoch": 3614} {"train_loss": -6.934880256652832, "global_step": 151805, "epoch": 3614} {"train_loss": -6.62322998046875, "global_step": 151806, "epoch": 3614} {"train_loss": -6.8423357009887695, "global_step": 151807, "epoch": 3614} {"train_loss": -6.718557357788086, "global_step": 151808, "epoch": 3614} {"train_loss": -6.786113262176514, "global_step": 151809, "epoch": 3614} {"train_loss": -6.7714104652404785, "global_step": 151810, "epoch": 3614} {"train_loss": -6.722646713256836, "global_step": 151811, "epoch": 3614} {"train_loss": -6.8191938400268555, "global_step": 151812, "epoch": 3614} {"train_loss": -6.712363243103027, "global_step": 151813, "epoch": 3614} {"train_loss": -6.904212951660156, "global_step": 151814, "epoch": 3614} {"train_loss": -6.781524658203125, "global_step": 151815, "epoch": 3614} {"train_loss": -6.889647960662842, "global_step": 151816, "epoch": 3614} {"train_loss": -6.7790093421936035, "global_step": 151817, "epoch": 3614} {"train_loss": -6.791238307952881, "global_step": 151818, "epoch": 3614} {"train_loss": -6.842026233673096, "global_step": 151819, "epoch": 3614} {"train_loss": -6.878443241119385, "global_step": 151820, "epoch": 3614} {"train_loss": -6.858789443969727, "global_step": 151821, "epoch": 3614} {"train_loss": -6.864126205444336, "global_step": 151822, "epoch": 3614} {"train_loss": -6.950016021728516, "global_step": 151823, "epoch": 3614} {"train_loss": -6.912320137023926, "global_step": 151824, "epoch": 3614} {"train_loss": -6.920342922210693, "global_step": 151825, "epoch": 3614} {"train_loss": -6.902444839477539, "global_step": 151826, "epoch": 3614} {"train_loss": -6.937911510467529, "global_step": 151827, "epoch": 3614} {"train_loss": -6.929093360900879, "global_step": 151828, "epoch": 3614} {"train_loss": -6.822091920035226, "global_step": 151829, "epoch": 3614, "val_loss": 68039.734375} {"train_loss": -6.893716812133789, "global_step": 151830, "epoch": 3615} {"train_loss": -6.8773369789123535, "global_step": 151831, "epoch": 3615} {"train_loss": -6.8741655349731445, "global_step": 151832, "epoch": 3615} {"train_loss": -6.726008415222168, "global_step": 151833, "epoch": 3615} {"train_loss": -6.888139724731445, "global_step": 151834, "epoch": 3615} {"train_loss": -6.949552059173584, "global_step": 151835, "epoch": 3615} {"train_loss": -6.917645454406738, "global_step": 151836, "epoch": 3615} {"train_loss": -6.903688430786133, "global_step": 151837, "epoch": 3615} {"train_loss": -6.885822772979736, "global_step": 151838, "epoch": 3615} {"train_loss": -7.000452041625977, "global_step": 151839, "epoch": 3615} {"train_loss": -6.8159499168396, "global_step": 151840, "epoch": 3615} {"train_loss": -6.756397247314453, "global_step": 151841, "epoch": 3615} {"train_loss": -6.960151195526123, "global_step": 151842, "epoch": 3615} {"train_loss": -6.923453330993652, "global_step": 151843, "epoch": 3615} {"train_loss": -6.76644229888916, "global_step": 151844, "epoch": 3615} {"train_loss": -6.825470447540283, "global_step": 151845, "epoch": 3615} {"train_loss": -6.7212934494018555, "global_step": 151846, "epoch": 3615} {"train_loss": -6.868777275085449, "global_step": 151847, "epoch": 3615} {"train_loss": -6.8438310623168945, "global_step": 151848, "epoch": 3615} {"train_loss": -6.849477767944336, "global_step": 151849, "epoch": 3615} {"train_loss": -6.885777473449707, "global_step": 151850, "epoch": 3615} {"train_loss": -6.870884418487549, "global_step": 151851, "epoch": 3615} {"train_loss": -6.853079319000244, "global_step": 151852, "epoch": 3615} {"train_loss": -6.791878700256348, "global_step": 151853, "epoch": 3615} {"train_loss": -6.888932228088379, "global_step": 151854, "epoch": 3615} {"train_loss": -6.842164516448975, "global_step": 151855, "epoch": 3615} {"train_loss": -6.882124900817871, "global_step": 151856, "epoch": 3615} {"train_loss": -6.90292501449585, "global_step": 151857, "epoch": 3615} {"train_loss": -6.919739723205566, "global_step": 151858, "epoch": 3615} {"train_loss": -6.811227798461914, "global_step": 151859, "epoch": 3615} {"train_loss": -6.98095703125, "global_step": 151860, "epoch": 3615} {"train_loss": -6.866373538970947, "global_step": 151861, "epoch": 3615} {"train_loss": -6.768496990203857, "global_step": 151862, "epoch": 3615} {"train_loss": -6.745434761047363, "global_step": 151863, "epoch": 3615} {"train_loss": -6.766173362731934, "global_step": 151864, "epoch": 3615} {"train_loss": -6.84282112121582, "global_step": 151865, "epoch": 3615} {"train_loss": -6.890995502471924, "global_step": 151866, "epoch": 3615} {"train_loss": -6.892443656921387, "global_step": 151867, "epoch": 3615} {"train_loss": -6.832825183868408, "global_step": 151868, "epoch": 3615} {"train_loss": -6.964438438415527, "global_step": 151869, "epoch": 3615} {"train_loss": -6.815213680267334, "global_step": 151870, "epoch": 3615} {"train_loss": -6.857193413234892, "global_step": 151871, "epoch": 3615, "val_loss": 68263.5} {"train_loss": -6.901065826416016, "global_step": 151872, "epoch": 3616} {"train_loss": -6.714394569396973, "global_step": 151873, "epoch": 3616} {"train_loss": -6.867159843444824, "global_step": 151874, "epoch": 3616} {"train_loss": -6.950899124145508, "global_step": 151875, "epoch": 3616} {"train_loss": -6.831743240356445, "global_step": 151876, "epoch": 3616} {"train_loss": -6.928821086883545, "global_step": 151877, "epoch": 3616} {"train_loss": -6.87969970703125, "global_step": 151878, "epoch": 3616} {"train_loss": -6.902285575866699, "global_step": 151879, "epoch": 3616} {"train_loss": -6.855375289916992, "global_step": 151880, "epoch": 3616} {"train_loss": -6.943010330200195, "global_step": 151881, "epoch": 3616} {"train_loss": -6.973604202270508, "global_step": 151882, "epoch": 3616} {"train_loss": -6.961788177490234, "global_step": 151883, "epoch": 3616} {"train_loss": -6.888428688049316, "global_step": 151884, "epoch": 3616} {"train_loss": -6.876192569732666, "global_step": 151885, "epoch": 3616} {"train_loss": -6.877151012420654, "global_step": 151886, "epoch": 3616} {"train_loss": -6.857522964477539, "global_step": 151887, "epoch": 3616} {"train_loss": -6.950768947601318, "global_step": 151888, "epoch": 3616} {"train_loss": -6.872638702392578, "global_step": 151889, "epoch": 3616} {"train_loss": -6.790187358856201, "global_step": 151890, "epoch": 3616} {"train_loss": -6.873295307159424, "global_step": 151891, "epoch": 3616} {"train_loss": -6.892359733581543, "global_step": 151892, "epoch": 3616} {"train_loss": -6.843593597412109, "global_step": 151893, "epoch": 3616} {"train_loss": -6.842500686645508, "global_step": 151894, "epoch": 3616} {"train_loss": -6.821083068847656, "global_step": 151895, "epoch": 3616} {"train_loss": -6.832363128662109, "global_step": 151896, "epoch": 3616} {"train_loss": -6.865729331970215, "global_step": 151897, "epoch": 3616} {"train_loss": -6.815521717071533, "global_step": 151898, "epoch": 3616} {"train_loss": -6.8795976638793945, "global_step": 151899, "epoch": 3616} {"train_loss": -6.777902603149414, "global_step": 151900, "epoch": 3616} {"train_loss": -6.79034423828125, "global_step": 151901, "epoch": 3616} {"train_loss": -6.8442702293396, "global_step": 151902, "epoch": 3616} {"train_loss": -6.729917526245117, "global_step": 151903, "epoch": 3616} {"train_loss": -6.745539665222168, "global_step": 151904, "epoch": 3616} {"train_loss": -6.676063537597656, "global_step": 151905, "epoch": 3616} {"train_loss": -6.883185386657715, "global_step": 151906, "epoch": 3616} {"train_loss": -6.859348297119141, "global_step": 151907, "epoch": 3616} {"train_loss": -6.860320091247559, "global_step": 151908, "epoch": 3616} {"train_loss": -6.810258865356445, "global_step": 151909, "epoch": 3616} {"train_loss": -6.828227996826172, "global_step": 151910, "epoch": 3616} {"train_loss": -6.888423442840576, "global_step": 151911, "epoch": 3616} {"train_loss": -6.846675872802734, "global_step": 151912, "epoch": 3616} {"train_loss": -6.850657690139044, "global_step": 151913, "epoch": 3616, "val_loss": 67854.765625} {"train_loss": -6.741649150848389, "global_step": 151914, "epoch": 3617} {"train_loss": -6.8778181076049805, "global_step": 151915, "epoch": 3617} {"train_loss": -6.771788120269775, "global_step": 151916, "epoch": 3617} {"train_loss": -6.886523723602295, "global_step": 151917, "epoch": 3617} {"train_loss": -6.747219085693359, "global_step": 151918, "epoch": 3617} {"train_loss": -6.88844108581543, "global_step": 151919, "epoch": 3617} {"train_loss": -6.890620231628418, "global_step": 151920, "epoch": 3617} {"train_loss": -6.902173042297363, "global_step": 151921, "epoch": 3617} {"train_loss": -6.739779949188232, "global_step": 151922, "epoch": 3617} {"train_loss": -6.724239826202393, "global_step": 151923, "epoch": 3617} {"train_loss": -6.863840103149414, "global_step": 151924, "epoch": 3617} {"train_loss": -6.845252990722656, "global_step": 151925, "epoch": 3617} {"train_loss": -6.726853370666504, "global_step": 151926, "epoch": 3617} {"train_loss": -6.760235786437988, "global_step": 151927, "epoch": 3617} {"train_loss": -6.817903518676758, "global_step": 151928, "epoch": 3617} {"train_loss": -6.86116886138916, "global_step": 151929, "epoch": 3617} {"train_loss": -6.834991455078125, "global_step": 151930, "epoch": 3617} {"train_loss": -6.859086036682129, "global_step": 151931, "epoch": 3617} {"train_loss": -6.861748695373535, "global_step": 151932, "epoch": 3617} {"train_loss": -6.766820907592773, "global_step": 151933, "epoch": 3617} {"train_loss": -6.8640336990356445, "global_step": 151934, "epoch": 3617} {"train_loss": -6.81418514251709, "global_step": 151935, "epoch": 3617} {"train_loss": -6.962959289550781, "global_step": 151936, "epoch": 3617} {"train_loss": -6.82640266418457, "global_step": 151937, "epoch": 3617} {"train_loss": -6.914120674133301, "global_step": 151938, "epoch": 3617} {"train_loss": -6.915005683898926, "global_step": 151939, "epoch": 3617} {"train_loss": -6.901427268981934, "global_step": 151940, "epoch": 3617} {"train_loss": -6.970359802246094, "global_step": 151941, "epoch": 3617} {"train_loss": -6.796903133392334, "global_step": 151942, "epoch": 3617} {"train_loss": -6.879363059997559, "global_step": 151943, "epoch": 3617} {"train_loss": -7.046913146972656, "global_step": 151944, "epoch": 3617} {"train_loss": -6.743549346923828, "global_step": 151945, "epoch": 3617} {"train_loss": -6.965521335601807, "global_step": 151946, "epoch": 3617} {"train_loss": -6.863847732543945, "global_step": 151947, "epoch": 3617} {"train_loss": -6.940024375915527, "global_step": 151948, "epoch": 3617} {"train_loss": -6.815901279449463, "global_step": 151949, "epoch": 3617} {"train_loss": -7.043176651000977, "global_step": 151950, "epoch": 3617} {"train_loss": -6.961330413818359, "global_step": 151951, "epoch": 3617} {"train_loss": -6.964273452758789, "global_step": 151952, "epoch": 3617} {"train_loss": -6.967092037200928, "global_step": 151953, "epoch": 3617} {"train_loss": -6.9440226554870605, "global_step": 151954, "epoch": 3617} {"train_loss": -6.866653045018514, "global_step": 151955, "epoch": 3617, "val_loss": 68048.1640625} {"train_loss": -6.852936267852783, "global_step": 151956, "epoch": 3618} {"train_loss": -6.9358439445495605, "global_step": 151957, "epoch": 3618} {"train_loss": -6.9661431312561035, "global_step": 151958, "epoch": 3618} {"train_loss": -6.81678581237793, "global_step": 151959, "epoch": 3618} {"train_loss": -6.899145603179932, "global_step": 151960, "epoch": 3618} {"train_loss": -6.942224025726318, "global_step": 151961, "epoch": 3618} {"train_loss": -6.876972198486328, "global_step": 151962, "epoch": 3618} {"train_loss": -6.86734676361084, "global_step": 151963, "epoch": 3618} {"train_loss": -6.768499851226807, "global_step": 151964, "epoch": 3618} {"train_loss": -6.856603622436523, "global_step": 151965, "epoch": 3618} {"train_loss": -6.990352630615234, "global_step": 151966, "epoch": 3618} {"train_loss": -6.852149486541748, "global_step": 151967, "epoch": 3618} {"train_loss": -6.927585601806641, "global_step": 151968, "epoch": 3618} {"train_loss": -6.873841285705566, "global_step": 151969, "epoch": 3618} {"train_loss": -6.873647689819336, "global_step": 151970, "epoch": 3618} {"train_loss": -6.961219787597656, "global_step": 151971, "epoch": 3618} {"train_loss": -6.843844890594482, "global_step": 151972, "epoch": 3618} {"train_loss": -7.008574485778809, "global_step": 151973, "epoch": 3618} {"train_loss": -6.941493034362793, "global_step": 151974, "epoch": 3618} {"train_loss": -6.975506782531738, "global_step": 151975, "epoch": 3618} {"train_loss": -6.964735984802246, "global_step": 151976, "epoch": 3618} {"train_loss": -6.920070648193359, "global_step": 151977, "epoch": 3618} {"train_loss": -6.9838361740112305, "global_step": 151978, "epoch": 3618} {"train_loss": -6.95483922958374, "global_step": 151979, "epoch": 3618} {"train_loss": -7.054043769836426, "global_step": 151980, "epoch": 3618} {"train_loss": -6.9427900314331055, "global_step": 151981, "epoch": 3618} {"train_loss": -6.9132490158081055, "global_step": 151982, "epoch": 3618} {"train_loss": -6.814844131469727, "global_step": 151983, "epoch": 3618} {"train_loss": -6.9336838722229, "global_step": 151984, "epoch": 3618} {"train_loss": -6.953394889831543, "global_step": 151985, "epoch": 3618} {"train_loss": -6.967550277709961, "global_step": 151986, "epoch": 3618} {"train_loss": -6.981683731079102, "global_step": 151987, "epoch": 3618} {"train_loss": -6.869822978973389, "global_step": 151988, "epoch": 3618} {"train_loss": -6.807793617248535, "global_step": 151989, "epoch": 3618} {"train_loss": -6.878585338592529, "global_step": 151990, "epoch": 3618} {"train_loss": -6.905143737792969, "global_step": 151991, "epoch": 3618} {"train_loss": -6.830704212188721, "global_step": 151992, "epoch": 3618} {"train_loss": -6.776553153991699, "global_step": 151993, "epoch": 3618} {"train_loss": -6.917943000793457, "global_step": 151994, "epoch": 3618} {"train_loss": -6.957992076873779, "global_step": 151995, "epoch": 3618} {"train_loss": -6.9146928787231445, "global_step": 151996, "epoch": 3618} {"train_loss": -6.904504174277896, "global_step": 151997, "epoch": 3618, "val_loss": 68077.0390625} {"train_loss": -6.770751953125, "global_step": 151998, "epoch": 3619} {"train_loss": -6.958213806152344, "global_step": 151999, "epoch": 3619} {"train_loss": -6.82196044921875, "global_step": 152000, "epoch": 3619} {"train_loss": -6.851361274719238, "global_step": 152001, "epoch": 3619} {"train_loss": -6.820644378662109, "global_step": 152002, "epoch": 3619} {"train_loss": -7.023022174835205, "global_step": 152003, "epoch": 3619} {"train_loss": -6.699522972106934, "global_step": 152004, "epoch": 3619} {"train_loss": -6.895228862762451, "global_step": 152005, "epoch": 3619} {"train_loss": -6.905588626861572, "global_step": 152006, "epoch": 3619} {"train_loss": -6.888094902038574, "global_step": 152007, "epoch": 3619} {"train_loss": -6.983858108520508, "global_step": 152008, "epoch": 3619} {"train_loss": -6.8256025314331055, "global_step": 152009, "epoch": 3619} {"train_loss": -6.878260612487793, "global_step": 152010, "epoch": 3619} {"train_loss": -6.934478759765625, "global_step": 152011, "epoch": 3619} {"train_loss": -6.811971664428711, "global_step": 152012, "epoch": 3619} {"train_loss": -6.950730323791504, "global_step": 152013, "epoch": 3619} {"train_loss": -6.872519016265869, "global_step": 152014, "epoch": 3619} {"train_loss": -6.826910972595215, "global_step": 152015, "epoch": 3619} {"train_loss": -6.803737163543701, "global_step": 152016, "epoch": 3619} {"train_loss": -6.846621036529541, "global_step": 152017, "epoch": 3619} {"train_loss": -6.963339805603027, "global_step": 152018, "epoch": 3619} {"train_loss": -6.932021141052246, "global_step": 152019, "epoch": 3619} {"train_loss": -6.9108734130859375, "global_step": 152020, "epoch": 3619} {"train_loss": -6.814087867736816, "global_step": 152021, "epoch": 3619} {"train_loss": -6.95120906829834, "global_step": 152022, "epoch": 3619} {"train_loss": -6.972860336303711, "global_step": 152023, "epoch": 3619} {"train_loss": -6.9810333251953125, "global_step": 152024, "epoch": 3619} {"train_loss": -6.937198638916016, "global_step": 152025, "epoch": 3619} {"train_loss": -6.961373329162598, "global_step": 152026, "epoch": 3619} {"train_loss": -6.905791282653809, "global_step": 152027, "epoch": 3619} {"train_loss": -6.9434967041015625, "global_step": 152028, "epoch": 3619} {"train_loss": -6.922675132751465, "global_step": 152029, "epoch": 3619} {"train_loss": -6.949622631072998, "global_step": 152030, "epoch": 3619} {"train_loss": -6.986003875732422, "global_step": 152031, "epoch": 3619} {"train_loss": -7.035128593444824, "global_step": 152032, "epoch": 3619} {"train_loss": -6.8389105796813965, "global_step": 152033, "epoch": 3619} {"train_loss": -6.819095134735107, "global_step": 152034, "epoch": 3619} {"train_loss": -6.937686443328857, "global_step": 152035, "epoch": 3619} {"train_loss": -6.858078956604004, "global_step": 152036, "epoch": 3619} {"train_loss": -6.854184150695801, "global_step": 152037, "epoch": 3619} {"train_loss": -6.8815836906433105, "global_step": 152038, "epoch": 3619} {"train_loss": -6.897538196472895, "global_step": 152039, "epoch": 3619, "val_loss": 67990.984375} {"train_loss": -6.9579010009765625, "global_step": 152040, "epoch": 3620} {"train_loss": -6.9919328689575195, "global_step": 152041, "epoch": 3620} {"train_loss": -6.886713027954102, "global_step": 152042, "epoch": 3620} {"train_loss": -7.006251811981201, "global_step": 152043, "epoch": 3620} {"train_loss": -6.981678009033203, "global_step": 152044, "epoch": 3620} {"train_loss": -7.030869007110596, "global_step": 152045, "epoch": 3620} {"train_loss": -6.918880462646484, "global_step": 152046, "epoch": 3620} {"train_loss": -6.92226505279541, "global_step": 152047, "epoch": 3620} {"train_loss": -7.031722068786621, "global_step": 152048, "epoch": 3620} {"train_loss": -6.92816162109375, "global_step": 152049, "epoch": 3620} {"train_loss": -6.968705177307129, "global_step": 152050, "epoch": 3620} {"train_loss": -6.863661766052246, "global_step": 152051, "epoch": 3620} {"train_loss": -6.8201727867126465, "global_step": 152052, "epoch": 3620} {"train_loss": -6.775073051452637, "global_step": 152053, "epoch": 3620} {"train_loss": -6.846343517303467, "global_step": 152054, "epoch": 3620} {"train_loss": -6.879305839538574, "global_step": 152055, "epoch": 3620} {"train_loss": -6.791625022888184, "global_step": 152056, "epoch": 3620} {"train_loss": -6.843831539154053, "global_step": 152057, "epoch": 3620} {"train_loss": -6.697539329528809, "global_step": 152058, "epoch": 3620} {"train_loss": -6.627793788909912, "global_step": 152059, "epoch": 3620} {"train_loss": -6.741138458251953, "global_step": 152060, "epoch": 3620} {"train_loss": -6.790505409240723, "global_step": 152061, "epoch": 3620} {"train_loss": -6.787883758544922, "global_step": 152062, "epoch": 3620} {"train_loss": -6.813739776611328, "global_step": 152063, "epoch": 3620} {"train_loss": -6.800172805786133, "global_step": 152064, "epoch": 3620} {"train_loss": -6.848259449005127, "global_step": 152065, "epoch": 3620} {"train_loss": -6.842657089233398, "global_step": 152066, "epoch": 3620} {"train_loss": -6.76197624206543, "global_step": 152067, "epoch": 3620} {"train_loss": -6.571413040161133, "global_step": 152068, "epoch": 3620} {"train_loss": -6.737170219421387, "global_step": 152069, "epoch": 3620} {"train_loss": -6.871853351593018, "global_step": 152070, "epoch": 3620} {"train_loss": -6.81353235244751, "global_step": 152071, "epoch": 3620} {"train_loss": -6.835969924926758, "global_step": 152072, "epoch": 3620} {"train_loss": -6.852987766265869, "global_step": 152073, "epoch": 3620} {"train_loss": -6.873928070068359, "global_step": 152074, "epoch": 3620} {"train_loss": -6.825949668884277, "global_step": 152075, "epoch": 3620} {"train_loss": -6.811714172363281, "global_step": 152076, "epoch": 3620} {"train_loss": -6.830259323120117, "global_step": 152077, "epoch": 3620} {"train_loss": -6.872359275817871, "global_step": 152078, "epoch": 3620} {"train_loss": -6.825957298278809, "global_step": 152079, "epoch": 3620} {"train_loss": -6.921759605407715, "global_step": 152080, "epoch": 3620} {"train_loss": -6.848771969477336, "global_step": 152081, "epoch": 3620, "val_loss": 68169.7265625} {"train_loss": -6.938101291656494, "global_step": 152082, "epoch": 3621} {"train_loss": -6.865550518035889, "global_step": 152083, "epoch": 3621} {"train_loss": -6.895978927612305, "global_step": 152084, "epoch": 3621} {"train_loss": -6.8683671951293945, "global_step": 152085, "epoch": 3621} {"train_loss": -6.862177848815918, "global_step": 152086, "epoch": 3621} {"train_loss": -7.0189104080200195, "global_step": 152087, "epoch": 3621} {"train_loss": -6.904969215393066, "global_step": 152088, "epoch": 3621} {"train_loss": -6.91342830657959, "global_step": 152089, "epoch": 3621} {"train_loss": -6.919589042663574, "global_step": 152090, "epoch": 3621} {"train_loss": -6.795406341552734, "global_step": 152091, "epoch": 3621} {"train_loss": -6.844522953033447, "global_step": 152092, "epoch": 3621} {"train_loss": -6.787712097167969, "global_step": 152093, "epoch": 3621} {"train_loss": -6.865515232086182, "global_step": 152094, "epoch": 3621} {"train_loss": -6.945606231689453, "global_step": 152095, "epoch": 3621} {"train_loss": -6.727606773376465, "global_step": 152096, "epoch": 3621} {"train_loss": -6.841765880584717, "global_step": 152097, "epoch": 3621} {"train_loss": -6.838852405548096, "global_step": 152098, "epoch": 3621} {"train_loss": -6.817787170410156, "global_step": 152099, "epoch": 3621} {"train_loss": -6.85090970993042, "global_step": 152100, "epoch": 3621} {"train_loss": -6.8005571365356445, "global_step": 152101, "epoch": 3621} {"train_loss": -6.898258686065674, "global_step": 152102, "epoch": 3621} {"train_loss": -6.810081481933594, "global_step": 152103, "epoch": 3621} {"train_loss": -6.86593770980835, "global_step": 152104, "epoch": 3621} {"train_loss": -6.913077354431152, "global_step": 152105, "epoch": 3621} {"train_loss": -6.927983283996582, "global_step": 152106, "epoch": 3621} {"train_loss": -6.893597602844238, "global_step": 152107, "epoch": 3621} {"train_loss": -6.989899635314941, "global_step": 152108, "epoch": 3621} {"train_loss": -7.003321647644043, "global_step": 152109, "epoch": 3621} {"train_loss": -6.918140888214111, "global_step": 152110, "epoch": 3621} {"train_loss": -6.989638328552246, "global_step": 152111, "epoch": 3621} {"train_loss": -6.859262466430664, "global_step": 152112, "epoch": 3621} {"train_loss": -6.914020538330078, "global_step": 152113, "epoch": 3621} {"train_loss": -6.861900806427002, "global_step": 152114, "epoch": 3621} {"train_loss": -6.836177825927734, "global_step": 152115, "epoch": 3621} {"train_loss": -6.892302513122559, "global_step": 152116, "epoch": 3621} {"train_loss": -6.927691459655762, "global_step": 152117, "epoch": 3621} {"train_loss": -6.916548728942871, "global_step": 152118, "epoch": 3621} {"train_loss": -6.983188629150391, "global_step": 152119, "epoch": 3621} {"train_loss": -7.035322189331055, "global_step": 152120, "epoch": 3621} {"train_loss": -6.95401668548584, "global_step": 152121, "epoch": 3621} {"train_loss": -6.9760870933532715, "global_step": 152122, "epoch": 3621} {"train_loss": -6.89545016061692, "global_step": 152123, "epoch": 3621, "val_loss": 68083.765625} {"train_loss": -6.8286333084106445, "global_step": 152124, "epoch": 3622} {"train_loss": -7.027137756347656, "global_step": 152125, "epoch": 3622} {"train_loss": -6.910248756408691, "global_step": 152126, "epoch": 3622} {"train_loss": -6.86504602432251, "global_step": 152127, "epoch": 3622} {"train_loss": -6.8865275382995605, "global_step": 152128, "epoch": 3622} {"train_loss": -6.979472637176514, "global_step": 152129, "epoch": 3622} {"train_loss": -6.908348083496094, "global_step": 152130, "epoch": 3622} {"train_loss": -6.968533515930176, "global_step": 152131, "epoch": 3622} {"train_loss": -7.0216217041015625, "global_step": 152132, "epoch": 3622} {"train_loss": -6.904610633850098, "global_step": 152133, "epoch": 3622} {"train_loss": -6.895786285400391, "global_step": 152134, "epoch": 3622} {"train_loss": -7.027355194091797, "global_step": 152135, "epoch": 3622} {"train_loss": -6.862387180328369, "global_step": 152136, "epoch": 3622} {"train_loss": -6.920183181762695, "global_step": 152137, "epoch": 3622} {"train_loss": -6.8968048095703125, "global_step": 152138, "epoch": 3622} {"train_loss": -6.9687604904174805, "global_step": 152139, "epoch": 3622} {"train_loss": -6.920327186584473, "global_step": 152140, "epoch": 3622} {"train_loss": -6.958704948425293, "global_step": 152141, "epoch": 3622} {"train_loss": -6.925810813903809, "global_step": 152142, "epoch": 3622} {"train_loss": -6.895356178283691, "global_step": 152143, "epoch": 3622} {"train_loss": -6.843475818634033, "global_step": 152144, "epoch": 3622} {"train_loss": -6.814149856567383, "global_step": 152145, "epoch": 3622} {"train_loss": -6.969231605529785, "global_step": 152146, "epoch": 3622} {"train_loss": -6.924777030944824, "global_step": 152147, "epoch": 3622} {"train_loss": -6.954497337341309, "global_step": 152148, "epoch": 3622} {"train_loss": -6.931778907775879, "global_step": 152149, "epoch": 3622} {"train_loss": -6.859356880187988, "global_step": 152150, "epoch": 3622} {"train_loss": -6.895606517791748, "global_step": 152151, "epoch": 3622} {"train_loss": -6.960964202880859, "global_step": 152152, "epoch": 3622} {"train_loss": -6.8295674324035645, "global_step": 152153, "epoch": 3622} {"train_loss": -6.864014625549316, "global_step": 152154, "epoch": 3622} {"train_loss": -6.926017761230469, "global_step": 152155, "epoch": 3622} {"train_loss": -6.854833126068115, "global_step": 152156, "epoch": 3622} {"train_loss": -6.86750602722168, "global_step": 152157, "epoch": 3622} {"train_loss": -6.771083831787109, "global_step": 152158, "epoch": 3622} {"train_loss": -6.945567607879639, "global_step": 152159, "epoch": 3622} {"train_loss": -6.831363201141357, "global_step": 152160, "epoch": 3622} {"train_loss": -6.851142406463623, "global_step": 152161, "epoch": 3622} {"train_loss": -6.868251800537109, "global_step": 152162, "epoch": 3622} {"train_loss": -6.952960014343262, "global_step": 152163, "epoch": 3622} {"train_loss": -6.786343097686768, "global_step": 152164, "epoch": 3622} {"train_loss": -6.902660744530814, "global_step": 152165, "epoch": 3622, "val_loss": 68246.5703125} {"train_loss": -6.721377849578857, "global_step": 152166, "epoch": 3623} {"train_loss": -6.9340620040893555, "global_step": 152167, "epoch": 3623} {"train_loss": -6.860481262207031, "global_step": 152168, "epoch": 3623} {"train_loss": -6.8804192543029785, "global_step": 152169, "epoch": 3623} {"train_loss": -6.883994102478027, "global_step": 152170, "epoch": 3623} {"train_loss": -6.830437660217285, "global_step": 152171, "epoch": 3623} {"train_loss": -6.909205436706543, "global_step": 152172, "epoch": 3623} {"train_loss": -6.844846248626709, "global_step": 152173, "epoch": 3623} {"train_loss": -6.889259338378906, "global_step": 152174, "epoch": 3623} {"train_loss": -6.9035868644714355, "global_step": 152175, "epoch": 3623} {"train_loss": -6.821891784667969, "global_step": 152176, "epoch": 3623} {"train_loss": -6.797644138336182, "global_step": 152177, "epoch": 3623} {"train_loss": -6.834535121917725, "global_step": 152178, "epoch": 3623} {"train_loss": -6.9755377769470215, "global_step": 152179, "epoch": 3623} {"train_loss": -6.899171829223633, "global_step": 152180, "epoch": 3623} {"train_loss": -6.8660383224487305, "global_step": 152181, "epoch": 3623} {"train_loss": -6.955972671508789, "global_step": 152182, "epoch": 3623} {"train_loss": -6.959789276123047, "global_step": 152183, "epoch": 3623} {"train_loss": -6.850976943969727, "global_step": 152184, "epoch": 3623} {"train_loss": -6.933784484863281, "global_step": 152185, "epoch": 3623} {"train_loss": -6.873556613922119, "global_step": 152186, "epoch": 3623} {"train_loss": -6.969305992126465, "global_step": 152187, "epoch": 3623} {"train_loss": -6.916003227233887, "global_step": 152188, "epoch": 3623} {"train_loss": -6.8321943283081055, "global_step": 152189, "epoch": 3623} {"train_loss": -6.893786907196045, "global_step": 152190, "epoch": 3623} {"train_loss": -6.91750431060791, "global_step": 152191, "epoch": 3623} {"train_loss": -6.8932881355285645, "global_step": 152192, "epoch": 3623} {"train_loss": -6.850027561187744, "global_step": 152193, "epoch": 3623} {"train_loss": -6.967043399810791, "global_step": 152194, "epoch": 3623} {"train_loss": -6.981658935546875, "global_step": 152195, "epoch": 3623} {"train_loss": -6.982417106628418, "global_step": 152196, "epoch": 3623} {"train_loss": -6.921892166137695, "global_step": 152197, "epoch": 3623} {"train_loss": -6.83317756652832, "global_step": 152198, "epoch": 3623} {"train_loss": -6.812063217163086, "global_step": 152199, "epoch": 3623} {"train_loss": -6.710567951202393, "global_step": 152200, "epoch": 3623} {"train_loss": -6.820762634277344, "global_step": 152201, "epoch": 3623} {"train_loss": -6.750284194946289, "global_step": 152202, "epoch": 3623} {"train_loss": -6.7995991706848145, "global_step": 152203, "epoch": 3623} {"train_loss": -6.965336799621582, "global_step": 152204, "epoch": 3623} {"train_loss": -6.682779312133789, "global_step": 152205, "epoch": 3623} {"train_loss": -6.8559370040893555, "global_step": 152206, "epoch": 3623} {"train_loss": -6.87149783543178, "global_step": 152207, "epoch": 3623, "val_loss": 67983.40625} {"train_loss": -6.734163284301758, "global_step": 152208, "epoch": 3624} {"train_loss": -6.801092147827148, "global_step": 152209, "epoch": 3624} {"train_loss": -6.888188362121582, "global_step": 152210, "epoch": 3624} {"train_loss": -6.788963317871094, "global_step": 152211, "epoch": 3624} {"train_loss": -6.886713027954102, "global_step": 152212, "epoch": 3624} {"train_loss": -6.774423599243164, "global_step": 152213, "epoch": 3624} {"train_loss": -6.858963966369629, "global_step": 152214, "epoch": 3624} {"train_loss": -6.7977094650268555, "global_step": 152215, "epoch": 3624} {"train_loss": -6.9839348793029785, "global_step": 152216, "epoch": 3624} {"train_loss": -6.838419437408447, "global_step": 152217, "epoch": 3624} {"train_loss": -6.9223504066467285, "global_step": 152218, "epoch": 3624} {"train_loss": -6.869749069213867, "global_step": 152219, "epoch": 3624} {"train_loss": -6.833234786987305, "global_step": 152220, "epoch": 3624} {"train_loss": -6.904167175292969, "global_step": 152221, "epoch": 3624} {"train_loss": -7.0307817459106445, "global_step": 152222, "epoch": 3624} {"train_loss": -6.920306205749512, "global_step": 152223, "epoch": 3624} {"train_loss": -6.846311092376709, "global_step": 152224, "epoch": 3624} {"train_loss": -6.938252925872803, "global_step": 152225, "epoch": 3624} {"train_loss": -7.045559883117676, "global_step": 152226, "epoch": 3624} {"train_loss": -6.964036464691162, "global_step": 152227, "epoch": 3624} {"train_loss": -6.950313568115234, "global_step": 152228, "epoch": 3624} {"train_loss": -6.946277618408203, "global_step": 152229, "epoch": 3624} {"train_loss": -6.905205249786377, "global_step": 152230, "epoch": 3624} {"train_loss": -6.7792158126831055, "global_step": 152231, "epoch": 3624} {"train_loss": -6.896502494812012, "global_step": 152232, "epoch": 3624} {"train_loss": -6.828954219818115, "global_step": 152233, "epoch": 3624} {"train_loss": -6.905905723571777, "global_step": 152234, "epoch": 3624} {"train_loss": -6.970057964324951, "global_step": 152235, "epoch": 3624} {"train_loss": -6.860935211181641, "global_step": 152236, "epoch": 3624} {"train_loss": -6.857427597045898, "global_step": 152237, "epoch": 3624} {"train_loss": -6.995759963989258, "global_step": 152238, "epoch": 3624} {"train_loss": -6.980634689331055, "global_step": 152239, "epoch": 3624} {"train_loss": -6.883657455444336, "global_step": 152240, "epoch": 3624} {"train_loss": -6.899792194366455, "global_step": 152241, "epoch": 3624} {"train_loss": -6.8566155433654785, "global_step": 152242, "epoch": 3624} {"train_loss": -6.85058069229126, "global_step": 152243, "epoch": 3624} {"train_loss": -6.982799530029297, "global_step": 152244, "epoch": 3624} {"train_loss": -6.858162879943848, "global_step": 152245, "epoch": 3624} {"train_loss": -6.8211565017700195, "global_step": 152246, "epoch": 3624} {"train_loss": -6.832563400268555, "global_step": 152247, "epoch": 3624} {"train_loss": -7.004926681518555, "global_step": 152248, "epoch": 3624} {"train_loss": -6.893445979981196, "global_step": 152249, "epoch": 3624, "val_loss": 68256.2109375} {"train_loss": -6.95035457611084, "global_step": 152250, "epoch": 3625} {"train_loss": -6.856910228729248, "global_step": 152251, "epoch": 3625} {"train_loss": -6.881608009338379, "global_step": 152252, "epoch": 3625} {"train_loss": -6.859906196594238, "global_step": 152253, "epoch": 3625} {"train_loss": -6.952200889587402, "global_step": 152254, "epoch": 3625} {"train_loss": -6.967266082763672, "global_step": 152255, "epoch": 3625} {"train_loss": -6.855523109436035, "global_step": 152256, "epoch": 3625} {"train_loss": -6.935840606689453, "global_step": 152257, "epoch": 3625} {"train_loss": -6.799245834350586, "global_step": 152258, "epoch": 3625} {"train_loss": -6.90494966506958, "global_step": 152259, "epoch": 3625} {"train_loss": -6.859681606292725, "global_step": 152260, "epoch": 3625} {"train_loss": -6.764662742614746, "global_step": 152261, "epoch": 3625} {"train_loss": -6.880209922790527, "global_step": 152262, "epoch": 3625} {"train_loss": -6.945539474487305, "global_step": 152263, "epoch": 3625} {"train_loss": -6.849583625793457, "global_step": 152264, "epoch": 3625} {"train_loss": -6.933853626251221, "global_step": 152265, "epoch": 3625} {"train_loss": -6.939214706420898, "global_step": 152266, "epoch": 3625} {"train_loss": -6.9485673904418945, "global_step": 152267, "epoch": 3625} {"train_loss": -6.879505157470703, "global_step": 152268, "epoch": 3625} {"train_loss": -6.923959255218506, "global_step": 152269, "epoch": 3625} {"train_loss": -6.8744707107543945, "global_step": 152270, "epoch": 3625} {"train_loss": -7.0079827308654785, "global_step": 152271, "epoch": 3625} {"train_loss": -6.909813404083252, "global_step": 152272, "epoch": 3625} {"train_loss": -6.941478252410889, "global_step": 152273, "epoch": 3625} {"train_loss": -6.889082908630371, "global_step": 152274, "epoch": 3625} {"train_loss": -6.868892192840576, "global_step": 152275, "epoch": 3625} {"train_loss": -7.0089616775512695, "global_step": 152276, "epoch": 3625} {"train_loss": -6.839019775390625, "global_step": 152277, "epoch": 3625} {"train_loss": -6.867048263549805, "global_step": 152278, "epoch": 3625} {"train_loss": -6.928705215454102, "global_step": 152279, "epoch": 3625} {"train_loss": -6.861811637878418, "global_step": 152280, "epoch": 3625} {"train_loss": -6.854549884796143, "global_step": 152281, "epoch": 3625} {"train_loss": -6.856647491455078, "global_step": 152282, "epoch": 3625} {"train_loss": -6.948178291320801, "global_step": 152283, "epoch": 3625} {"train_loss": -6.972427845001221, "global_step": 152284, "epoch": 3625} {"train_loss": -6.8039679527282715, "global_step": 152285, "epoch": 3625} {"train_loss": -6.891127109527588, "global_step": 152286, "epoch": 3625} {"train_loss": -6.864991188049316, "global_step": 152287, "epoch": 3625} {"train_loss": -6.897024631500244, "global_step": 152288, "epoch": 3625} {"train_loss": -6.824620246887207, "global_step": 152289, "epoch": 3625} {"train_loss": -6.960135459899902, "global_step": 152290, "epoch": 3625} {"train_loss": -6.897244850794475, "global_step": 152291, "epoch": 3625, "val_loss": 68072.59375} {"train_loss": -6.863046169281006, "global_step": 152292, "epoch": 3626} {"train_loss": -6.901614189147949, "global_step": 152293, "epoch": 3626} {"train_loss": -6.901058197021484, "global_step": 152294, "epoch": 3626} {"train_loss": -6.893706321716309, "global_step": 152295, "epoch": 3626} {"train_loss": -6.9407782554626465, "global_step": 152296, "epoch": 3626} {"train_loss": -6.954345703125, "global_step": 152297, "epoch": 3626} {"train_loss": -6.8587188720703125, "global_step": 152298, "epoch": 3626} {"train_loss": -6.840483665466309, "global_step": 152299, "epoch": 3626} {"train_loss": -6.843569755554199, "global_step": 152300, "epoch": 3626} {"train_loss": -6.8123297691345215, "global_step": 152301, "epoch": 3626} {"train_loss": -6.942012310028076, "global_step": 152302, "epoch": 3626} {"train_loss": -6.916787147521973, "global_step": 152303, "epoch": 3626} {"train_loss": -6.944925308227539, "global_step": 152304, "epoch": 3626} {"train_loss": -6.8223161697387695, "global_step": 152305, "epoch": 3626} {"train_loss": -6.734645366668701, "global_step": 152306, "epoch": 3626} {"train_loss": -7.055224418640137, "global_step": 152307, "epoch": 3626} {"train_loss": -6.871297359466553, "global_step": 152308, "epoch": 3626} {"train_loss": -6.708130836486816, "global_step": 152309, "epoch": 3626} {"train_loss": -6.907836437225342, "global_step": 152310, "epoch": 3626} {"train_loss": -6.72902774810791, "global_step": 152311, "epoch": 3626} {"train_loss": -6.844236373901367, "global_step": 152312, "epoch": 3626} {"train_loss": -6.838796615600586, "global_step": 152313, "epoch": 3626} {"train_loss": -6.821256160736084, "global_step": 152314, "epoch": 3626} {"train_loss": -6.7693610191345215, "global_step": 152315, "epoch": 3626} {"train_loss": -6.807237148284912, "global_step": 152316, "epoch": 3626} {"train_loss": -6.880152702331543, "global_step": 152317, "epoch": 3626} {"train_loss": -6.9596638679504395, "global_step": 152318, "epoch": 3626} {"train_loss": -6.847372531890869, "global_step": 152319, "epoch": 3626} {"train_loss": -6.7686991691589355, "global_step": 152320, "epoch": 3626} {"train_loss": -6.867982387542725, "global_step": 152321, "epoch": 3626} {"train_loss": -6.824418067932129, "global_step": 152322, "epoch": 3626} {"train_loss": -6.913914203643799, "global_step": 152323, "epoch": 3626} {"train_loss": -6.786377906799316, "global_step": 152324, "epoch": 3626} {"train_loss": -6.898481845855713, "global_step": 152325, "epoch": 3626} {"train_loss": -6.75198221206665, "global_step": 152326, "epoch": 3626} {"train_loss": -6.7492828369140625, "global_step": 152327, "epoch": 3626} {"train_loss": -6.984792709350586, "global_step": 152328, "epoch": 3626} {"train_loss": -6.937077522277832, "global_step": 152329, "epoch": 3626} {"train_loss": -6.890449047088623, "global_step": 152330, "epoch": 3626} {"train_loss": -6.909884452819824, "global_step": 152331, "epoch": 3626} {"train_loss": -6.750914096832275, "global_step": 152332, "epoch": 3626} {"train_loss": -6.857976913452148, "global_step": 152333, "epoch": 3626, "val_loss": 68238.640625} {"train_loss": -6.915550231933594, "global_step": 152334, "epoch": 3627} {"train_loss": -6.76282262802124, "global_step": 152335, "epoch": 3627} {"train_loss": -6.804027557373047, "global_step": 152336, "epoch": 3627} {"train_loss": -6.701847553253174, "global_step": 152337, "epoch": 3627} {"train_loss": -6.964038848876953, "global_step": 152338, "epoch": 3627} {"train_loss": -6.815932750701904, "global_step": 152339, "epoch": 3627} {"train_loss": -6.756480693817139, "global_step": 152340, "epoch": 3627} {"train_loss": -6.743921279907227, "global_step": 152341, "epoch": 3627} {"train_loss": -6.736796855926514, "global_step": 152342, "epoch": 3627} {"train_loss": -6.655705451965332, "global_step": 152343, "epoch": 3627} {"train_loss": -6.875191688537598, "global_step": 152344, "epoch": 3627} {"train_loss": -6.770566463470459, "global_step": 152345, "epoch": 3627} {"train_loss": -6.91653299331665, "global_step": 152346, "epoch": 3627} {"train_loss": -6.657068252563477, "global_step": 152347, "epoch": 3627} {"train_loss": -6.877819061279297, "global_step": 152348, "epoch": 3627} {"train_loss": -6.7327399253845215, "global_step": 152349, "epoch": 3627} {"train_loss": -6.823871612548828, "global_step": 152350, "epoch": 3627} {"train_loss": -6.798431396484375, "global_step": 152351, "epoch": 3627} {"train_loss": -6.943821430206299, "global_step": 152352, "epoch": 3627} {"train_loss": -6.873556613922119, "global_step": 152353, "epoch": 3627} {"train_loss": -6.815570831298828, "global_step": 152354, "epoch": 3627} {"train_loss": -6.758280277252197, "global_step": 152355, "epoch": 3627} {"train_loss": -6.787957191467285, "global_step": 152356, "epoch": 3627} {"train_loss": -6.901340007781982, "global_step": 152357, "epoch": 3627} {"train_loss": -6.728196144104004, "global_step": 152358, "epoch": 3627} {"train_loss": -6.837899208068848, "global_step": 152359, "epoch": 3627} {"train_loss": -6.809628963470459, "global_step": 152360, "epoch": 3627} {"train_loss": -6.710681438446045, "global_step": 152361, "epoch": 3627} {"train_loss": -6.692268371582031, "global_step": 152362, "epoch": 3627} {"train_loss": -6.867609977722168, "global_step": 152363, "epoch": 3627} {"train_loss": -6.8506269454956055, "global_step": 152364, "epoch": 3627} {"train_loss": -6.836862564086914, "global_step": 152365, "epoch": 3627} {"train_loss": -6.916721820831299, "global_step": 152366, "epoch": 3627} {"train_loss": -6.763337135314941, "global_step": 152367, "epoch": 3627} {"train_loss": -6.849187850952148, "global_step": 152368, "epoch": 3627} {"train_loss": -6.930312633514404, "global_step": 152369, "epoch": 3627} {"train_loss": -6.872058868408203, "global_step": 152370, "epoch": 3627} {"train_loss": -6.865686893463135, "global_step": 152371, "epoch": 3627} {"train_loss": -6.831097602844238, "global_step": 152372, "epoch": 3627} {"train_loss": -6.886727809906006, "global_step": 152373, "epoch": 3627} {"train_loss": -6.967713832855225, "global_step": 152374, "epoch": 3627} {"train_loss": -6.819576774324689, "global_step": 152375, "epoch": 3627, "val_loss": 68195.953125} {"train_loss": -6.901943206787109, "global_step": 152376, "epoch": 3628} {"train_loss": -6.941788196563721, "global_step": 152377, "epoch": 3628} {"train_loss": -6.906726360321045, "global_step": 152378, "epoch": 3628} {"train_loss": -6.897998809814453, "global_step": 152379, "epoch": 3628} {"train_loss": -6.963817596435547, "global_step": 152380, "epoch": 3628} {"train_loss": -7.0027852058410645, "global_step": 152381, "epoch": 3628} {"train_loss": -6.859415054321289, "global_step": 152382, "epoch": 3628} {"train_loss": -6.970516204833984, "global_step": 152383, "epoch": 3628} {"train_loss": -6.9356560707092285, "global_step": 152384, "epoch": 3628} {"train_loss": -6.9044952392578125, "global_step": 152385, "epoch": 3628} {"train_loss": -6.966526031494141, "global_step": 152386, "epoch": 3628} {"train_loss": -6.984582901000977, "global_step": 152387, "epoch": 3628} {"train_loss": -6.799091815948486, "global_step": 152388, "epoch": 3628} {"train_loss": -6.887445449829102, "global_step": 152389, "epoch": 3628} {"train_loss": -6.8831329345703125, "global_step": 152390, "epoch": 3628} {"train_loss": -6.8680243492126465, "global_step": 152391, "epoch": 3628} {"train_loss": -6.910247802734375, "global_step": 152392, "epoch": 3628} {"train_loss": -6.95859432220459, "global_step": 152393, "epoch": 3628} {"train_loss": -6.827788352966309, "global_step": 152394, "epoch": 3628} {"train_loss": -6.912812232971191, "global_step": 152395, "epoch": 3628} {"train_loss": -6.980123519897461, "global_step": 152396, "epoch": 3628} {"train_loss": -6.989232540130615, "global_step": 152397, "epoch": 3628} {"train_loss": -7.046849250793457, "global_step": 152398, "epoch": 3628} {"train_loss": -6.974370002746582, "global_step": 152399, "epoch": 3628} {"train_loss": -6.884576320648193, "global_step": 152400, "epoch": 3628} {"train_loss": -6.836942672729492, "global_step": 152401, "epoch": 3628} {"train_loss": -6.932195663452148, "global_step": 152402, "epoch": 3628} {"train_loss": -6.932466983795166, "global_step": 152403, "epoch": 3628} {"train_loss": -6.93881368637085, "global_step": 152404, "epoch": 3628} {"train_loss": -6.92191219329834, "global_step": 152405, "epoch": 3628} {"train_loss": -6.908376216888428, "global_step": 152406, "epoch": 3628} {"train_loss": -6.8932695388793945, "global_step": 152407, "epoch": 3628} {"train_loss": -6.773886203765869, "global_step": 152408, "epoch": 3628} {"train_loss": -6.844552993774414, "global_step": 152409, "epoch": 3628} {"train_loss": -6.830399513244629, "global_step": 152410, "epoch": 3628} {"train_loss": -6.874838352203369, "global_step": 152411, "epoch": 3628} {"train_loss": -6.83399772644043, "global_step": 152412, "epoch": 3628} {"train_loss": -6.845750331878662, "global_step": 152413, "epoch": 3628} {"train_loss": -6.835648536682129, "global_step": 152414, "epoch": 3628} {"train_loss": -6.79267692565918, "global_step": 152415, "epoch": 3628} {"train_loss": -6.7827653884887695, "global_step": 152416, "epoch": 3628} {"train_loss": -6.9026708489372615, "global_step": 152417, "epoch": 3628, "val_loss": 68359.9453125} {"train_loss": -6.8784260749816895, "global_step": 152418, "epoch": 3629} {"train_loss": -6.95751953125, "global_step": 152419, "epoch": 3629} {"train_loss": -6.816441535949707, "global_step": 152420, "epoch": 3629} {"train_loss": -6.889694690704346, "global_step": 152421, "epoch": 3629} {"train_loss": -6.936999320983887, "global_step": 152422, "epoch": 3629} {"train_loss": -6.978800296783447, "global_step": 152423, "epoch": 3629} {"train_loss": -6.884559154510498, "global_step": 152424, "epoch": 3629} {"train_loss": -6.853445529937744, "global_step": 152425, "epoch": 3629} {"train_loss": -6.891419887542725, "global_step": 152426, "epoch": 3629} {"train_loss": -6.9204936027526855, "global_step": 152427, "epoch": 3629} {"train_loss": -6.897075653076172, "global_step": 152428, "epoch": 3629} {"train_loss": -6.8294501304626465, "global_step": 152429, "epoch": 3629} {"train_loss": -6.96870231628418, "global_step": 152430, "epoch": 3629} {"train_loss": -6.907674312591553, "global_step": 152431, "epoch": 3629} {"train_loss": -6.854215145111084, "global_step": 152432, "epoch": 3629} {"train_loss": -6.777935981750488, "global_step": 152433, "epoch": 3629} {"train_loss": -6.743316650390625, "global_step": 152434, "epoch": 3629} {"train_loss": -6.707450866699219, "global_step": 152435, "epoch": 3629} {"train_loss": -6.87154483795166, "global_step": 152436, "epoch": 3629} {"train_loss": -6.878955841064453, "global_step": 152437, "epoch": 3629} {"train_loss": -6.826035976409912, "global_step": 152438, "epoch": 3629} {"train_loss": -6.887388229370117, "global_step": 152439, "epoch": 3629} {"train_loss": -6.846155166625977, "global_step": 152440, "epoch": 3629} {"train_loss": -6.782491683959961, "global_step": 152441, "epoch": 3629} {"train_loss": -6.765257835388184, "global_step": 152442, "epoch": 3629} {"train_loss": -6.881198883056641, "global_step": 152443, "epoch": 3629} {"train_loss": -6.561363697052002, "global_step": 152444, "epoch": 3629} {"train_loss": -6.856706619262695, "global_step": 152445, "epoch": 3629} {"train_loss": -6.840002059936523, "global_step": 152446, "epoch": 3629} {"train_loss": -6.6902618408203125, "global_step": 152447, "epoch": 3629} {"train_loss": -6.903639793395996, "global_step": 152448, "epoch": 3629} {"train_loss": -6.716065406799316, "global_step": 152449, "epoch": 3629} {"train_loss": -6.6877851486206055, "global_step": 152450, "epoch": 3629} {"train_loss": -6.772515296936035, "global_step": 152451, "epoch": 3629} {"train_loss": -6.810528755187988, "global_step": 152452, "epoch": 3629} {"train_loss": -6.779974460601807, "global_step": 152453, "epoch": 3629} {"train_loss": -6.839786529541016, "global_step": 152454, "epoch": 3629} {"train_loss": -6.874269008636475, "global_step": 152455, "epoch": 3629} {"train_loss": -6.820578575134277, "global_step": 152456, "epoch": 3629} {"train_loss": -6.850255966186523, "global_step": 152457, "epoch": 3629} {"train_loss": -6.852470397949219, "global_step": 152458, "epoch": 3629} {"train_loss": -6.836233014152164, "global_step": 152459, "epoch": 3629, "val_loss": 68016.546875} {"train_loss": -6.931320667266846, "global_step": 152460, "epoch": 3630} {"train_loss": -6.864902019500732, "global_step": 152461, "epoch": 3630} {"train_loss": -6.828427791595459, "global_step": 152462, "epoch": 3630} {"train_loss": -6.8760600090026855, "global_step": 152463, "epoch": 3630} {"train_loss": -6.880784034729004, "global_step": 152464, "epoch": 3630} {"train_loss": -6.968257904052734, "global_step": 152465, "epoch": 3630} {"train_loss": -6.78257942199707, "global_step": 152466, "epoch": 3630} {"train_loss": -6.842443466186523, "global_step": 152467, "epoch": 3630} {"train_loss": -6.883541107177734, "global_step": 152468, "epoch": 3630} {"train_loss": -6.806968688964844, "global_step": 152469, "epoch": 3630} {"train_loss": -7.027459144592285, "global_step": 152470, "epoch": 3630} {"train_loss": -6.84639310836792, "global_step": 152471, "epoch": 3630} {"train_loss": -6.723128318786621, "global_step": 152472, "epoch": 3630} {"train_loss": -6.925525665283203, "global_step": 152473, "epoch": 3630} {"train_loss": -6.825978755950928, "global_step": 152474, "epoch": 3630} {"train_loss": -6.772975921630859, "global_step": 152475, "epoch": 3630} {"train_loss": -6.795077323913574, "global_step": 152476, "epoch": 3630} {"train_loss": -6.820856094360352, "global_step": 152477, "epoch": 3630} {"train_loss": -6.967216491699219, "global_step": 152478, "epoch": 3630} {"train_loss": -6.92877197265625, "global_step": 152479, "epoch": 3630} {"train_loss": -6.937544345855713, "global_step": 152480, "epoch": 3630} {"train_loss": -6.881391525268555, "global_step": 152481, "epoch": 3630} {"train_loss": -6.822722434997559, "global_step": 152482, "epoch": 3630} {"train_loss": -6.935431003570557, "global_step": 152483, "epoch": 3630} {"train_loss": -6.921196937561035, "global_step": 152484, "epoch": 3630} {"train_loss": -6.851358890533447, "global_step": 152485, "epoch": 3630} {"train_loss": -6.862070083618164, "global_step": 152486, "epoch": 3630} {"train_loss": -6.856677532196045, "global_step": 152487, "epoch": 3630} {"train_loss": -6.9190874099731445, "global_step": 152488, "epoch": 3630} {"train_loss": -6.80696964263916, "global_step": 152489, "epoch": 3630} {"train_loss": -6.908818244934082, "global_step": 152490, "epoch": 3630} {"train_loss": -6.872161865234375, "global_step": 152491, "epoch": 3630} {"train_loss": -6.904641151428223, "global_step": 152492, "epoch": 3630} {"train_loss": -6.846843719482422, "global_step": 152493, "epoch": 3630} {"train_loss": -6.880903244018555, "global_step": 152494, "epoch": 3630} {"train_loss": -6.958028793334961, "global_step": 152495, "epoch": 3630} {"train_loss": -6.8432698249816895, "global_step": 152496, "epoch": 3630} {"train_loss": -6.981632232666016, "global_step": 152497, "epoch": 3630} {"train_loss": -6.971332550048828, "global_step": 152498, "epoch": 3630} {"train_loss": -6.920121192932129, "global_step": 152499, "epoch": 3630} {"train_loss": -6.906096458435059, "global_step": 152500, "epoch": 3630} {"train_loss": -6.88045689037868, "global_step": 152501, "epoch": 3630, "val_loss": 68047.6875} {"train_loss": -6.945824146270752, "global_step": 152502, "epoch": 3631} {"train_loss": -6.98591423034668, "global_step": 152503, "epoch": 3631} {"train_loss": -6.8918986320495605, "global_step": 152504, "epoch": 3631} {"train_loss": -6.834383010864258, "global_step": 152505, "epoch": 3631} {"train_loss": -6.856321334838867, "global_step": 152506, "epoch": 3631} {"train_loss": -6.963196754455566, "global_step": 152507, "epoch": 3631} {"train_loss": -6.725395202636719, "global_step": 152508, "epoch": 3631} {"train_loss": -6.846227645874023, "global_step": 152509, "epoch": 3631} {"train_loss": -6.8260698318481445, "global_step": 152510, "epoch": 3631} {"train_loss": -6.856090545654297, "global_step": 152511, "epoch": 3631} {"train_loss": -6.87296199798584, "global_step": 152512, "epoch": 3631} {"train_loss": -6.7652740478515625, "global_step": 152513, "epoch": 3631} {"train_loss": -6.7671709060668945, "global_step": 152514, "epoch": 3631} {"train_loss": -6.921809196472168, "global_step": 152515, "epoch": 3631} {"train_loss": -6.8429365158081055, "global_step": 152516, "epoch": 3631} {"train_loss": -6.805423736572266, "global_step": 152517, "epoch": 3631} {"train_loss": -6.810280799865723, "global_step": 152518, "epoch": 3631} {"train_loss": -6.856937408447266, "global_step": 152519, "epoch": 3631} {"train_loss": -6.838553428649902, "global_step": 152520, "epoch": 3631} {"train_loss": -6.802907466888428, "global_step": 152521, "epoch": 3631} {"train_loss": -6.8756914138793945, "global_step": 152522, "epoch": 3631} {"train_loss": -6.848148822784424, "global_step": 152523, "epoch": 3631} {"train_loss": -6.790865421295166, "global_step": 152524, "epoch": 3631} {"train_loss": -6.752387523651123, "global_step": 152525, "epoch": 3631} {"train_loss": -6.772035598754883, "global_step": 152526, "epoch": 3631} {"train_loss": -6.84792423248291, "global_step": 152527, "epoch": 3631} {"train_loss": -6.870697021484375, "global_step": 152528, "epoch": 3631} {"train_loss": -6.862856388092041, "global_step": 152529, "epoch": 3631} {"train_loss": -6.740967750549316, "global_step": 152530, "epoch": 3631} {"train_loss": -6.840519428253174, "global_step": 152531, "epoch": 3631} {"train_loss": -6.858933448791504, "global_step": 152532, "epoch": 3631} {"train_loss": -6.713349342346191, "global_step": 152533, "epoch": 3631} {"train_loss": -6.789142608642578, "global_step": 152534, "epoch": 3631} {"train_loss": -6.856957912445068, "global_step": 152535, "epoch": 3631} {"train_loss": -6.8492584228515625, "global_step": 152536, "epoch": 3631} {"train_loss": -6.821945667266846, "global_step": 152537, "epoch": 3631} {"train_loss": -6.816026210784912, "global_step": 152538, "epoch": 3631} {"train_loss": -6.892891883850098, "global_step": 152539, "epoch": 3631} {"train_loss": -6.890101432800293, "global_step": 152540, "epoch": 3631} {"train_loss": -6.856525421142578, "global_step": 152541, "epoch": 3631} {"train_loss": -6.803596496582031, "global_step": 152542, "epoch": 3631} {"train_loss": -6.839525211425054, "global_step": 152543, "epoch": 3631, "val_loss": 68187.8359375} {"train_loss": -6.789405822753906, "global_step": 152544, "epoch": 3632} {"train_loss": -6.944372177124023, "global_step": 152545, "epoch": 3632} {"train_loss": -7.004701614379883, "global_step": 152546, "epoch": 3632} {"train_loss": -6.779640197753906, "global_step": 152547, "epoch": 3632} {"train_loss": -6.855005741119385, "global_step": 152548, "epoch": 3632} {"train_loss": -6.7588958740234375, "global_step": 152549, "epoch": 3632} {"train_loss": -6.85038423538208, "global_step": 152550, "epoch": 3632} {"train_loss": -6.962711334228516, "global_step": 152551, "epoch": 3632} {"train_loss": -6.719245910644531, "global_step": 152552, "epoch": 3632} {"train_loss": -6.820782661437988, "global_step": 152553, "epoch": 3632} {"train_loss": -6.965386390686035, "global_step": 152554, "epoch": 3632} {"train_loss": -6.778615951538086, "global_step": 152555, "epoch": 3632} {"train_loss": -6.80202579498291, "global_step": 152556, "epoch": 3632} {"train_loss": -6.767292022705078, "global_step": 152557, "epoch": 3632} {"train_loss": -6.821933746337891, "global_step": 152558, "epoch": 3632} {"train_loss": -6.949408531188965, "global_step": 152559, "epoch": 3632} {"train_loss": -6.773924827575684, "global_step": 152560, "epoch": 3632} {"train_loss": -6.800816535949707, "global_step": 152561, "epoch": 3632} {"train_loss": -6.902185916900635, "global_step": 152562, "epoch": 3632} {"train_loss": -6.823464393615723, "global_step": 152563, "epoch": 3632} {"train_loss": -6.874067783355713, "global_step": 152564, "epoch": 3632} {"train_loss": -6.824746608734131, "global_step": 152565, "epoch": 3632} {"train_loss": -6.798066139221191, "global_step": 152566, "epoch": 3632} {"train_loss": -6.811582088470459, "global_step": 152567, "epoch": 3632} {"train_loss": -6.912627220153809, "global_step": 152568, "epoch": 3632} {"train_loss": -6.806580543518066, "global_step": 152569, "epoch": 3632} {"train_loss": -6.708176612854004, "global_step": 152570, "epoch": 3632} {"train_loss": -6.874760627746582, "global_step": 152571, "epoch": 3632} {"train_loss": -6.848894119262695, "global_step": 152572, "epoch": 3632} {"train_loss": -6.748577117919922, "global_step": 152573, "epoch": 3632} {"train_loss": -6.869365215301514, "global_step": 152574, "epoch": 3632} {"train_loss": -6.810774803161621, "global_step": 152575, "epoch": 3632} {"train_loss": -6.8400163650512695, "global_step": 152576, "epoch": 3632} {"train_loss": -6.818278789520264, "global_step": 152577, "epoch": 3632} {"train_loss": -6.8382673263549805, "global_step": 152578, "epoch": 3632} {"train_loss": -6.8109002113342285, "global_step": 152579, "epoch": 3632} {"train_loss": -6.849226951599121, "global_step": 152580, "epoch": 3632} {"train_loss": -6.918294906616211, "global_step": 152581, "epoch": 3632} {"train_loss": -6.862223148345947, "global_step": 152582, "epoch": 3632} {"train_loss": -6.793429374694824, "global_step": 152583, "epoch": 3632} {"train_loss": -6.8768229484558105, "global_step": 152584, "epoch": 3632} {"train_loss": -6.838430404663086, "global_step": 152585, "epoch": 3632, "val_loss": 68186.2265625} {"train_loss": -6.85233736038208, "global_step": 152586, "epoch": 3633} {"train_loss": -6.833818435668945, "global_step": 152587, "epoch": 3633} {"train_loss": -6.942692279815674, "global_step": 152588, "epoch": 3633} {"train_loss": -6.862637996673584, "global_step": 152589, "epoch": 3633} {"train_loss": -6.752408981323242, "global_step": 152590, "epoch": 3633} {"train_loss": -6.8901166915893555, "global_step": 152591, "epoch": 3633} {"train_loss": -6.8713459968566895, "global_step": 152592, "epoch": 3633} {"train_loss": -6.811640739440918, "global_step": 152593, "epoch": 3633} {"train_loss": -6.826124668121338, "global_step": 152594, "epoch": 3633} {"train_loss": -6.856686115264893, "global_step": 152595, "epoch": 3633} {"train_loss": -6.729033470153809, "global_step": 152596, "epoch": 3633} {"train_loss": -6.908627033233643, "global_step": 152597, "epoch": 3633} {"train_loss": -6.941838264465332, "global_step": 152598, "epoch": 3633} {"train_loss": -6.90596866607666, "global_step": 152599, "epoch": 3633} {"train_loss": -6.9203901290893555, "global_step": 152600, "epoch": 3633} {"train_loss": -6.831784248352051, "global_step": 152601, "epoch": 3633} {"train_loss": -6.797481536865234, "global_step": 152602, "epoch": 3633} {"train_loss": -6.879486560821533, "global_step": 152603, "epoch": 3633} {"train_loss": -6.933624267578125, "global_step": 152604, "epoch": 3633} {"train_loss": -6.849323272705078, "global_step": 152605, "epoch": 3633} {"train_loss": -6.97866153717041, "global_step": 152606, "epoch": 3633} {"train_loss": -6.94211483001709, "global_step": 152607, "epoch": 3633} {"train_loss": -6.847653388977051, "global_step": 152608, "epoch": 3633} {"train_loss": -6.857911109924316, "global_step": 152609, "epoch": 3633} {"train_loss": -6.961681365966797, "global_step": 152610, "epoch": 3633} {"train_loss": -6.919025421142578, "global_step": 152611, "epoch": 3633} {"train_loss": -6.917030334472656, "global_step": 152612, "epoch": 3633} {"train_loss": -6.913150787353516, "global_step": 152613, "epoch": 3633} {"train_loss": -6.873873710632324, "global_step": 152614, "epoch": 3633} {"train_loss": -6.945746421813965, "global_step": 152615, "epoch": 3633} {"train_loss": -6.805454254150391, "global_step": 152616, "epoch": 3633} {"train_loss": -6.82069206237793, "global_step": 152617, "epoch": 3633} {"train_loss": -6.858384132385254, "global_step": 152618, "epoch": 3633} {"train_loss": -6.833920478820801, "global_step": 152619, "epoch": 3633} {"train_loss": -6.915707588195801, "global_step": 152620, "epoch": 3633} {"train_loss": -6.804503440856934, "global_step": 152621, "epoch": 3633} {"train_loss": -6.869980812072754, "global_step": 152622, "epoch": 3633} {"train_loss": -6.724336624145508, "global_step": 152623, "epoch": 3633} {"train_loss": -6.932278156280518, "global_step": 152624, "epoch": 3633} {"train_loss": -6.823138236999512, "global_step": 152625, "epoch": 3633} {"train_loss": -6.780084609985352, "global_step": 152626, "epoch": 3633} {"train_loss": -6.86516379174732, "global_step": 152627, "epoch": 3633, "val_loss": 68085.78125} {"train_loss": -6.786452293395996, "global_step": 152628, "epoch": 3634} {"train_loss": -6.847586631774902, "global_step": 152629, "epoch": 3634} {"train_loss": -6.873529434204102, "global_step": 152630, "epoch": 3634} {"train_loss": -6.882534980773926, "global_step": 152631, "epoch": 3634} {"train_loss": -6.817945957183838, "global_step": 152632, "epoch": 3634} {"train_loss": -6.751798629760742, "global_step": 152633, "epoch": 3634} {"train_loss": -6.914885520935059, "global_step": 152634, "epoch": 3634} {"train_loss": -6.852704048156738, "global_step": 152635, "epoch": 3634} {"train_loss": -6.847397804260254, "global_step": 152636, "epoch": 3634} {"train_loss": -6.881080627441406, "global_step": 152637, "epoch": 3634} {"train_loss": -6.817196369171143, "global_step": 152638, "epoch": 3634} {"train_loss": -6.887080192565918, "global_step": 152639, "epoch": 3634} {"train_loss": -6.995367527008057, "global_step": 152640, "epoch": 3634} {"train_loss": -6.910944938659668, "global_step": 152641, "epoch": 3634} {"train_loss": -6.810911178588867, "global_step": 152642, "epoch": 3634} {"train_loss": -6.933204174041748, "global_step": 152643, "epoch": 3634} {"train_loss": -6.87274694442749, "global_step": 152644, "epoch": 3634} {"train_loss": -7.000965118408203, "global_step": 152645, "epoch": 3634} {"train_loss": -6.8717427253723145, "global_step": 152646, "epoch": 3634} {"train_loss": -6.879374980926514, "global_step": 152647, "epoch": 3634} {"train_loss": -6.835351943969727, "global_step": 152648, "epoch": 3634} {"train_loss": -6.993092060089111, "global_step": 152649, "epoch": 3634} {"train_loss": -7.004208564758301, "global_step": 152650, "epoch": 3634} {"train_loss": -6.910470008850098, "global_step": 152651, "epoch": 3634} {"train_loss": -6.8371429443359375, "global_step": 152652, "epoch": 3634} {"train_loss": -6.959524154663086, "global_step": 152653, "epoch": 3634} {"train_loss": -6.851851940155029, "global_step": 152654, "epoch": 3634} {"train_loss": -6.835963249206543, "global_step": 152655, "epoch": 3634} {"train_loss": -6.828788757324219, "global_step": 152656, "epoch": 3634} {"train_loss": -6.840799331665039, "global_step": 152657, "epoch": 3634} {"train_loss": -6.853849411010742, "global_step": 152658, "epoch": 3634} {"train_loss": -6.877681732177734, "global_step": 152659, "epoch": 3634} {"train_loss": -6.8949384689331055, "global_step": 152660, "epoch": 3634} {"train_loss": -6.764392375946045, "global_step": 152661, "epoch": 3634} {"train_loss": -6.898550510406494, "global_step": 152662, "epoch": 3634} {"train_loss": -6.795119285583496, "global_step": 152663, "epoch": 3634} {"train_loss": -6.75868034362793, "global_step": 152664, "epoch": 3634} {"train_loss": -6.8024420738220215, "global_step": 152665, "epoch": 3634} {"train_loss": -6.774313449859619, "global_step": 152666, "epoch": 3634} {"train_loss": -6.797994613647461, "global_step": 152667, "epoch": 3634} {"train_loss": -6.789614200592041, "global_step": 152668, "epoch": 3634} {"train_loss": -6.8610756397247314, "global_step": 152669, "epoch": 3634, "val_loss": 68048.265625} {"train_loss": -6.842044830322266, "global_step": 152670, "epoch": 3635} {"train_loss": -6.97798490524292, "global_step": 152671, "epoch": 3635} {"train_loss": -6.807051658630371, "global_step": 152672, "epoch": 3635} {"train_loss": -6.844820499420166, "global_step": 152673, "epoch": 3635} {"train_loss": -6.939815044403076, "global_step": 152674, "epoch": 3635} {"train_loss": -6.823234558105469, "global_step": 152675, "epoch": 3635} {"train_loss": -6.832724571228027, "global_step": 152676, "epoch": 3635} {"train_loss": -6.768375396728516, "global_step": 152677, "epoch": 3635} {"train_loss": -6.951667785644531, "global_step": 152678, "epoch": 3635} {"train_loss": -6.783090591430664, "global_step": 152679, "epoch": 3635} {"train_loss": -6.836972236633301, "global_step": 152680, "epoch": 3635} {"train_loss": -6.921617031097412, "global_step": 152681, "epoch": 3635} {"train_loss": -6.7972822189331055, "global_step": 152682, "epoch": 3635} {"train_loss": -6.937649250030518, "global_step": 152683, "epoch": 3635} {"train_loss": -6.878971099853516, "global_step": 152684, "epoch": 3635} {"train_loss": -6.849407196044922, "global_step": 152685, "epoch": 3635} {"train_loss": -6.888598918914795, "global_step": 152686, "epoch": 3635} {"train_loss": -6.866846084594727, "global_step": 152687, "epoch": 3635} {"train_loss": -6.889461517333984, "global_step": 152688, "epoch": 3635} {"train_loss": -6.957851409912109, "global_step": 152689, "epoch": 3635} {"train_loss": -6.884904861450195, "global_step": 152690, "epoch": 3635} {"train_loss": -6.889139175415039, "global_step": 152691, "epoch": 3635} {"train_loss": -6.901071071624756, "global_step": 152692, "epoch": 3635} {"train_loss": -6.884692192077637, "global_step": 152693, "epoch": 3635} {"train_loss": -6.876784801483154, "global_step": 152694, "epoch": 3635} {"train_loss": -6.962061882019043, "global_step": 152695, "epoch": 3635} {"train_loss": -6.773482322692871, "global_step": 152696, "epoch": 3635} {"train_loss": -6.743663311004639, "global_step": 152697, "epoch": 3635} {"train_loss": -6.939255714416504, "global_step": 152698, "epoch": 3635} {"train_loss": -6.894883632659912, "global_step": 152699, "epoch": 3635} {"train_loss": -6.864418029785156, "global_step": 152700, "epoch": 3635} {"train_loss": -6.976879119873047, "global_step": 152701, "epoch": 3635} {"train_loss": -6.85969352722168, "global_step": 152702, "epoch": 3635} {"train_loss": -6.905925750732422, "global_step": 152703, "epoch": 3635} {"train_loss": -6.901920318603516, "global_step": 152704, "epoch": 3635} {"train_loss": -6.939631462097168, "global_step": 152705, "epoch": 3635} {"train_loss": -6.771657466888428, "global_step": 152706, "epoch": 3635} {"train_loss": -6.909001350402832, "global_step": 152707, "epoch": 3635} {"train_loss": -6.826029300689697, "global_step": 152708, "epoch": 3635} {"train_loss": -6.86887264251709, "global_step": 152709, "epoch": 3635} {"train_loss": -6.954815864562988, "global_step": 152710, "epoch": 3635} {"train_loss": -6.876844542367118, "global_step": 152711, "epoch": 3635, "val_loss": 68034.7890625} {"train_loss": -6.920005798339844, "global_step": 152712, "epoch": 3636} {"train_loss": -7.039349555969238, "global_step": 152713, "epoch": 3636} {"train_loss": -6.869245529174805, "global_step": 152714, "epoch": 3636} {"train_loss": -6.749344348907471, "global_step": 152715, "epoch": 3636} {"train_loss": -6.8727922439575195, "global_step": 152716, "epoch": 3636} {"train_loss": -6.9201178550720215, "global_step": 152717, "epoch": 3636} {"train_loss": -6.877366542816162, "global_step": 152718, "epoch": 3636} {"train_loss": -6.827510833740234, "global_step": 152719, "epoch": 3636} {"train_loss": -7.004062652587891, "global_step": 152720, "epoch": 3636} {"train_loss": -6.845458984375, "global_step": 152721, "epoch": 3636} {"train_loss": -6.956947326660156, "global_step": 152722, "epoch": 3636} {"train_loss": -6.942180156707764, "global_step": 152723, "epoch": 3636} {"train_loss": -6.982496738433838, "global_step": 152724, "epoch": 3636} {"train_loss": -6.808149337768555, "global_step": 152725, "epoch": 3636} {"train_loss": -6.758365631103516, "global_step": 152726, "epoch": 3636} {"train_loss": -7.050847053527832, "global_step": 152727, "epoch": 3636} {"train_loss": -6.833287239074707, "global_step": 152728, "epoch": 3636} {"train_loss": -6.787712097167969, "global_step": 152729, "epoch": 3636} {"train_loss": -6.87431001663208, "global_step": 152730, "epoch": 3636} {"train_loss": -6.9080305099487305, "global_step": 152731, "epoch": 3636} {"train_loss": -6.874886989593506, "global_step": 152732, "epoch": 3636} {"train_loss": -6.950149059295654, "global_step": 152733, "epoch": 3636} {"train_loss": -6.819273948669434, "global_step": 152734, "epoch": 3636} {"train_loss": -6.93657112121582, "global_step": 152735, "epoch": 3636} {"train_loss": -6.985720634460449, "global_step": 152736, "epoch": 3636} {"train_loss": -6.86653995513916, "global_step": 152737, "epoch": 3636} {"train_loss": -7.012599468231201, "global_step": 152738, "epoch": 3636} {"train_loss": -6.862500190734863, "global_step": 152739, "epoch": 3636} {"train_loss": -6.995845317840576, "global_step": 152740, "epoch": 3636} {"train_loss": -6.874162673950195, "global_step": 152741, "epoch": 3636} {"train_loss": -7.0438361167907715, "global_step": 152742, "epoch": 3636} {"train_loss": -7.068577289581299, "global_step": 152743, "epoch": 3636} {"train_loss": -6.919316291809082, "global_step": 152744, "epoch": 3636} {"train_loss": -6.964813232421875, "global_step": 152745, "epoch": 3636} {"train_loss": -6.945734977722168, "global_step": 152746, "epoch": 3636} {"train_loss": -6.8387041091918945, "global_step": 152747, "epoch": 3636} {"train_loss": -6.803487777709961, "global_step": 152748, "epoch": 3636} {"train_loss": -6.935948371887207, "global_step": 152749, "epoch": 3636} {"train_loss": -6.992160797119141, "global_step": 152750, "epoch": 3636} {"train_loss": -6.9371232986450195, "global_step": 152751, "epoch": 3636} {"train_loss": -7.058238506317139, "global_step": 152752, "epoch": 3636} {"train_loss": -6.914891935530163, "global_step": 152753, "epoch": 3636, "val_loss": 68021.390625} {"train_loss": -6.862869739532471, "global_step": 152754, "epoch": 3637} {"train_loss": -6.975251197814941, "global_step": 152755, "epoch": 3637} {"train_loss": -7.045069694519043, "global_step": 152756, "epoch": 3637} {"train_loss": -6.901345252990723, "global_step": 152757, "epoch": 3637} {"train_loss": -6.975379943847656, "global_step": 152758, "epoch": 3637} {"train_loss": -7.010695457458496, "global_step": 152759, "epoch": 3637} {"train_loss": -6.851335525512695, "global_step": 152760, "epoch": 3637} {"train_loss": -6.96649694442749, "global_step": 152761, "epoch": 3637} {"train_loss": -6.96807336807251, "global_step": 152762, "epoch": 3637} {"train_loss": -6.928491115570068, "global_step": 152763, "epoch": 3637} {"train_loss": -6.963998317718506, "global_step": 152764, "epoch": 3637} {"train_loss": -6.887990474700928, "global_step": 152765, "epoch": 3637} {"train_loss": -6.884064197540283, "global_step": 152766, "epoch": 3637} {"train_loss": -6.957437515258789, "global_step": 152767, "epoch": 3637} {"train_loss": -6.938222408294678, "global_step": 152768, "epoch": 3637} {"train_loss": -6.892483711242676, "global_step": 152769, "epoch": 3637} {"train_loss": -6.955748558044434, "global_step": 152770, "epoch": 3637} {"train_loss": -6.825621604919434, "global_step": 152771, "epoch": 3637} {"train_loss": -6.917978286743164, "global_step": 152772, "epoch": 3637} {"train_loss": -6.7282867431640625, "global_step": 152773, "epoch": 3637} {"train_loss": -6.8814005851745605, "global_step": 152774, "epoch": 3637} {"train_loss": -7.031003952026367, "global_step": 152775, "epoch": 3637} {"train_loss": -6.981111526489258, "global_step": 152776, "epoch": 3637} {"train_loss": -6.916007995605469, "global_step": 152777, "epoch": 3637} {"train_loss": -6.910834312438965, "global_step": 152778, "epoch": 3637} {"train_loss": -6.748640060424805, "global_step": 152779, "epoch": 3637} {"train_loss": -6.841404438018799, "global_step": 152780, "epoch": 3637} {"train_loss": -6.964325428009033, "global_step": 152781, "epoch": 3637} {"train_loss": -6.8895721435546875, "global_step": 152782, "epoch": 3637} {"train_loss": -6.794132709503174, "global_step": 152783, "epoch": 3637} {"train_loss": -6.820497035980225, "global_step": 152784, "epoch": 3637} {"train_loss": -6.86161994934082, "global_step": 152785, "epoch": 3637} {"train_loss": -6.798188209533691, "global_step": 152786, "epoch": 3637} {"train_loss": -6.93084192276001, "global_step": 152787, "epoch": 3637} {"train_loss": -6.85147762298584, "global_step": 152788, "epoch": 3637} {"train_loss": -6.841612815856934, "global_step": 152789, "epoch": 3637} {"train_loss": -6.8551154136657715, "global_step": 152790, "epoch": 3637} {"train_loss": -6.98763370513916, "global_step": 152791, "epoch": 3637} {"train_loss": -6.791368007659912, "global_step": 152792, "epoch": 3637} {"train_loss": -6.836348533630371, "global_step": 152793, "epoch": 3637} {"train_loss": -6.93137264251709, "global_step": 152794, "epoch": 3637} {"train_loss": -6.897163459232876, "global_step": 152795, "epoch": 3637, "val_loss": 68287.9921875} {"train_loss": -6.9474592208862305, "global_step": 152796, "epoch": 3638} {"train_loss": -6.846164703369141, "global_step": 152797, "epoch": 3638} {"train_loss": -6.901121139526367, "global_step": 152798, "epoch": 3638} {"train_loss": -6.866604804992676, "global_step": 152799, "epoch": 3638} {"train_loss": -6.7806172370910645, "global_step": 152800, "epoch": 3638} {"train_loss": -6.926836967468262, "global_step": 152801, "epoch": 3638} {"train_loss": -6.802225112915039, "global_step": 152802, "epoch": 3638} {"train_loss": -6.886610984802246, "global_step": 152803, "epoch": 3638} {"train_loss": -6.824775695800781, "global_step": 152804, "epoch": 3638} {"train_loss": -6.698805809020996, "global_step": 152805, "epoch": 3638} {"train_loss": -6.818596839904785, "global_step": 152806, "epoch": 3638} {"train_loss": -6.759716033935547, "global_step": 152807, "epoch": 3638} {"train_loss": -6.827635765075684, "global_step": 152808, "epoch": 3638} {"train_loss": -6.650740623474121, "global_step": 152809, "epoch": 3638} {"train_loss": -6.833625793457031, "global_step": 152810, "epoch": 3638} {"train_loss": -6.653687477111816, "global_step": 152811, "epoch": 3638} {"train_loss": -6.794731616973877, "global_step": 152812, "epoch": 3638} {"train_loss": -6.902582168579102, "global_step": 152813, "epoch": 3638} {"train_loss": -6.7587456703186035, "global_step": 152814, "epoch": 3638} {"train_loss": -6.905304908752441, "global_step": 152815, "epoch": 3638} {"train_loss": -6.83704948425293, "global_step": 152816, "epoch": 3638} {"train_loss": -6.871185779571533, "global_step": 152817, "epoch": 3638} {"train_loss": -6.79909610748291, "global_step": 152818, "epoch": 3638} {"train_loss": -6.820080757141113, "global_step": 152819, "epoch": 3638} {"train_loss": -6.805630683898926, "global_step": 152820, "epoch": 3638} {"train_loss": -6.832862377166748, "global_step": 152821, "epoch": 3638} {"train_loss": -6.905884265899658, "global_step": 152822, "epoch": 3638} {"train_loss": -6.769113063812256, "global_step": 152823, "epoch": 3638} {"train_loss": -6.7302470207214355, "global_step": 152824, "epoch": 3638} {"train_loss": -6.8814849853515625, "global_step": 152825, "epoch": 3638} {"train_loss": -6.877213954925537, "global_step": 152826, "epoch": 3638} {"train_loss": -6.713827133178711, "global_step": 152827, "epoch": 3638} {"train_loss": -6.775880813598633, "global_step": 152828, "epoch": 3638} {"train_loss": -6.794064521789551, "global_step": 152829, "epoch": 3638} {"train_loss": -6.839260578155518, "global_step": 152830, "epoch": 3638} {"train_loss": -6.825990676879883, "global_step": 152831, "epoch": 3638} {"train_loss": -6.698345184326172, "global_step": 152832, "epoch": 3638} {"train_loss": -6.9628705978393555, "global_step": 152833, "epoch": 3638} {"train_loss": -6.700291156768799, "global_step": 152834, "epoch": 3638} {"train_loss": -6.714609146118164, "global_step": 152835, "epoch": 3638} {"train_loss": -6.7951860427856445, "global_step": 152836, "epoch": 3638} {"train_loss": -6.808363051641555, "global_step": 152837, "epoch": 3638, "val_loss": 68294.8125} {"train_loss": -6.8863606452941895, "global_step": 152838, "epoch": 3639} {"train_loss": -6.61807918548584, "global_step": 152839, "epoch": 3639} {"train_loss": -6.813614845275879, "global_step": 152840, "epoch": 3639} {"train_loss": -6.765135765075684, "global_step": 152841, "epoch": 3639} {"train_loss": -6.835578918457031, "global_step": 152842, "epoch": 3639} {"train_loss": -6.8593902587890625, "global_step": 152843, "epoch": 3639} {"train_loss": -6.776923656463623, "global_step": 152844, "epoch": 3639} {"train_loss": -6.799285411834717, "global_step": 152845, "epoch": 3639} {"train_loss": -6.782155990600586, "global_step": 152846, "epoch": 3639} {"train_loss": -6.835909843444824, "global_step": 152847, "epoch": 3639} {"train_loss": -6.896791458129883, "global_step": 152848, "epoch": 3639} {"train_loss": -6.854876518249512, "global_step": 152849, "epoch": 3639} {"train_loss": -6.882421016693115, "global_step": 152850, "epoch": 3639} {"train_loss": -6.799416542053223, "global_step": 152851, "epoch": 3639} {"train_loss": -6.8345441818237305, "global_step": 152852, "epoch": 3639} {"train_loss": -6.787871360778809, "global_step": 152853, "epoch": 3639} {"train_loss": -6.934876441955566, "global_step": 152854, "epoch": 3639} {"train_loss": -6.883918285369873, "global_step": 152855, "epoch": 3639} {"train_loss": -6.82381534576416, "global_step": 152856, "epoch": 3639} {"train_loss": -6.838273048400879, "global_step": 152857, "epoch": 3639} {"train_loss": -6.815114974975586, "global_step": 152858, "epoch": 3639} {"train_loss": -6.9224162101745605, "global_step": 152859, "epoch": 3639} {"train_loss": -6.872503280639648, "global_step": 152860, "epoch": 3639} {"train_loss": -6.827573776245117, "global_step": 152861, "epoch": 3639} {"train_loss": -6.957160949707031, "global_step": 152862, "epoch": 3639} {"train_loss": -6.779379367828369, "global_step": 152863, "epoch": 3639} {"train_loss": -6.901648044586182, "global_step": 152864, "epoch": 3639} {"train_loss": -6.908961296081543, "global_step": 152865, "epoch": 3639} {"train_loss": -6.90901517868042, "global_step": 152866, "epoch": 3639} {"train_loss": -6.823907375335693, "global_step": 152867, "epoch": 3639} {"train_loss": -6.821603775024414, "global_step": 152868, "epoch": 3639} {"train_loss": -6.859302520751953, "global_step": 152869, "epoch": 3639} {"train_loss": -6.748725891113281, "global_step": 152870, "epoch": 3639} {"train_loss": -6.900540351867676, "global_step": 152871, "epoch": 3639} {"train_loss": -6.8840742111206055, "global_step": 152872, "epoch": 3639} {"train_loss": -6.759507179260254, "global_step": 152873, "epoch": 3639} {"train_loss": -6.730133056640625, "global_step": 152874, "epoch": 3639} {"train_loss": -6.911688804626465, "global_step": 152875, "epoch": 3639} {"train_loss": -6.769329071044922, "global_step": 152876, "epoch": 3639} {"train_loss": -6.801163673400879, "global_step": 152877, "epoch": 3639} {"train_loss": -6.889991760253906, "global_step": 152878, "epoch": 3639} {"train_loss": -6.836936587379093, "global_step": 152879, "epoch": 3639, "val_loss": 68094.140625} {"train_loss": -6.8744330406188965, "global_step": 152880, "epoch": 3640} {"train_loss": -6.80627965927124, "global_step": 152881, "epoch": 3640} {"train_loss": -6.809889316558838, "global_step": 152882, "epoch": 3640} {"train_loss": -6.840441703796387, "global_step": 152883, "epoch": 3640} {"train_loss": -6.9183454513549805, "global_step": 152884, "epoch": 3640} {"train_loss": -6.772767066955566, "global_step": 152885, "epoch": 3640} {"train_loss": -6.8597331047058105, "global_step": 152886, "epoch": 3640} {"train_loss": -6.891907691955566, "global_step": 152887, "epoch": 3640} {"train_loss": -6.862478256225586, "global_step": 152888, "epoch": 3640} {"train_loss": -6.880463123321533, "global_step": 152889, "epoch": 3640} {"train_loss": -6.789267539978027, "global_step": 152890, "epoch": 3640} {"train_loss": -6.8030548095703125, "global_step": 152891, "epoch": 3640} {"train_loss": -6.964717864990234, "global_step": 152892, "epoch": 3640} {"train_loss": -6.910238265991211, "global_step": 152893, "epoch": 3640} {"train_loss": -6.913787364959717, "global_step": 152894, "epoch": 3640} {"train_loss": -6.769915580749512, "global_step": 152895, "epoch": 3640} {"train_loss": -6.959115028381348, "global_step": 152896, "epoch": 3640} {"train_loss": -6.777373313903809, "global_step": 152897, "epoch": 3640} {"train_loss": -6.968587875366211, "global_step": 152898, "epoch": 3640} {"train_loss": -6.966555118560791, "global_step": 152899, "epoch": 3640} {"train_loss": -6.918459415435791, "global_step": 152900, "epoch": 3640} {"train_loss": -6.945951461791992, "global_step": 152901, "epoch": 3640} {"train_loss": -6.953490734100342, "global_step": 152902, "epoch": 3640} {"train_loss": -6.975039482116699, "global_step": 152903, "epoch": 3640} {"train_loss": -6.960921764373779, "global_step": 152904, "epoch": 3640} {"train_loss": -6.999062538146973, "global_step": 152905, "epoch": 3640} {"train_loss": -6.979337215423584, "global_step": 152906, "epoch": 3640} {"train_loss": -6.863309860229492, "global_step": 152907, "epoch": 3640} {"train_loss": -6.815122604370117, "global_step": 152908, "epoch": 3640} {"train_loss": -6.850666046142578, "global_step": 152909, "epoch": 3640} {"train_loss": -6.921174049377441, "global_step": 152910, "epoch": 3640} {"train_loss": -6.99063777923584, "global_step": 152911, "epoch": 3640} {"train_loss": -6.781650543212891, "global_step": 152912, "epoch": 3640} {"train_loss": -6.902717113494873, "global_step": 152913, "epoch": 3640} {"train_loss": -6.9639482498168945, "global_step": 152914, "epoch": 3640} {"train_loss": -6.865629196166992, "global_step": 152915, "epoch": 3640} {"train_loss": -6.975528717041016, "global_step": 152916, "epoch": 3640} {"train_loss": -6.953392028808594, "global_step": 152917, "epoch": 3640} {"train_loss": -6.884275436401367, "global_step": 152918, "epoch": 3640} {"train_loss": -6.727476119995117, "global_step": 152919, "epoch": 3640} {"train_loss": -6.854610919952393, "global_step": 152920, "epoch": 3640} {"train_loss": -6.888722783043271, "global_step": 152921, "epoch": 3640, "val_loss": 68141.5859375} {"train_loss": -6.835493087768555, "global_step": 152922, "epoch": 3641} {"train_loss": -6.944616317749023, "global_step": 152923, "epoch": 3641} {"train_loss": -7.007975101470947, "global_step": 152924, "epoch": 3641} {"train_loss": -6.837762832641602, "global_step": 152925, "epoch": 3641} {"train_loss": -6.954608917236328, "global_step": 152926, "epoch": 3641} {"train_loss": -6.902712345123291, "global_step": 152927, "epoch": 3641} {"train_loss": -6.9103899002075195, "global_step": 152928, "epoch": 3641} {"train_loss": -6.834994792938232, "global_step": 152929, "epoch": 3641} {"train_loss": -6.802305221557617, "global_step": 152930, "epoch": 3641} {"train_loss": -6.9149322509765625, "global_step": 152931, "epoch": 3641} {"train_loss": -6.824793338775635, "global_step": 152932, "epoch": 3641} {"train_loss": -6.835545539855957, "global_step": 152933, "epoch": 3641} {"train_loss": -6.8464813232421875, "global_step": 152934, "epoch": 3641} {"train_loss": -6.841568946838379, "global_step": 152935, "epoch": 3641} {"train_loss": -7.001421928405762, "global_step": 152936, "epoch": 3641} {"train_loss": -6.869802474975586, "global_step": 152937, "epoch": 3641} {"train_loss": -6.919353485107422, "global_step": 152938, "epoch": 3641} {"train_loss": -6.9475860595703125, "global_step": 152939, "epoch": 3641} {"train_loss": -6.907519340515137, "global_step": 152940, "epoch": 3641} {"train_loss": -6.821881294250488, "global_step": 152941, "epoch": 3641} {"train_loss": -6.933959007263184, "global_step": 152942, "epoch": 3641} {"train_loss": -6.91876220703125, "global_step": 152943, "epoch": 3641} {"train_loss": -6.898166656494141, "global_step": 152944, "epoch": 3641} {"train_loss": -6.863139629364014, "global_step": 152945, "epoch": 3641} {"train_loss": -6.860073566436768, "global_step": 152946, "epoch": 3641} {"train_loss": -6.868083477020264, "global_step": 152947, "epoch": 3641} {"train_loss": -6.901797294616699, "global_step": 152948, "epoch": 3641} {"train_loss": -6.858310699462891, "global_step": 152949, "epoch": 3641} {"train_loss": -6.910962104797363, "global_step": 152950, "epoch": 3641} {"train_loss": -6.893348693847656, "global_step": 152951, "epoch": 3641} {"train_loss": -6.881594181060791, "global_step": 152952, "epoch": 3641} {"train_loss": -6.8424882888793945, "global_step": 152953, "epoch": 3641} {"train_loss": -6.92488956451416, "global_step": 152954, "epoch": 3641} {"train_loss": -6.984165191650391, "global_step": 152955, "epoch": 3641} {"train_loss": -6.833182334899902, "global_step": 152956, "epoch": 3641} {"train_loss": -6.918011665344238, "global_step": 152957, "epoch": 3641} {"train_loss": -6.95158052444458, "global_step": 152958, "epoch": 3641} {"train_loss": -6.888176918029785, "global_step": 152959, "epoch": 3641} {"train_loss": -6.9539031982421875, "global_step": 152960, "epoch": 3641} {"train_loss": -6.835684299468994, "global_step": 152961, "epoch": 3641} {"train_loss": -6.876719951629639, "global_step": 152962, "epoch": 3641} {"train_loss": -6.892415466762724, "global_step": 152963, "epoch": 3641, "val_loss": 68109.578125} {"train_loss": -6.884880542755127, "global_step": 152964, "epoch": 3642} {"train_loss": -6.9919047355651855, "global_step": 152965, "epoch": 3642} {"train_loss": -6.907989501953125, "global_step": 152966, "epoch": 3642} {"train_loss": -6.888989448547363, "global_step": 152967, "epoch": 3642} {"train_loss": -6.940528869628906, "global_step": 152968, "epoch": 3642} {"train_loss": -6.924522399902344, "global_step": 152969, "epoch": 3642} {"train_loss": -6.8639631271362305, "global_step": 152970, "epoch": 3642} {"train_loss": -6.994755744934082, "global_step": 152971, "epoch": 3642} {"train_loss": -6.937077522277832, "global_step": 152972, "epoch": 3642} {"train_loss": -6.9093732833862305, "global_step": 152973, "epoch": 3642} {"train_loss": -6.900477409362793, "global_step": 152974, "epoch": 3642} {"train_loss": -6.909743785858154, "global_step": 152975, "epoch": 3642} {"train_loss": -6.879656791687012, "global_step": 152976, "epoch": 3642} {"train_loss": -6.85860013961792, "global_step": 152977, "epoch": 3642} {"train_loss": -6.970780372619629, "global_step": 152978, "epoch": 3642} {"train_loss": -6.714137554168701, "global_step": 152979, "epoch": 3642} {"train_loss": -6.732260704040527, "global_step": 152980, "epoch": 3642} {"train_loss": -6.827117919921875, "global_step": 152981, "epoch": 3642} {"train_loss": -6.879213333129883, "global_step": 152982, "epoch": 3642} {"train_loss": -6.659337997436523, "global_step": 152983, "epoch": 3642} {"train_loss": -6.7301154136657715, "global_step": 152984, "epoch": 3642} {"train_loss": -6.916195869445801, "global_step": 152985, "epoch": 3642} {"train_loss": -6.778843879699707, "global_step": 152986, "epoch": 3642} {"train_loss": -6.888583660125732, "global_step": 152987, "epoch": 3642} {"train_loss": -6.808771133422852, "global_step": 152988, "epoch": 3642} {"train_loss": -6.889670372009277, "global_step": 152989, "epoch": 3642} {"train_loss": -6.774537563323975, "global_step": 152990, "epoch": 3642} {"train_loss": -6.75540828704834, "global_step": 152991, "epoch": 3642} {"train_loss": -6.723138809204102, "global_step": 152992, "epoch": 3642} {"train_loss": -6.857444763183594, "global_step": 152993, "epoch": 3642} {"train_loss": -6.743320941925049, "global_step": 152994, "epoch": 3642} {"train_loss": -6.767085075378418, "global_step": 152995, "epoch": 3642} {"train_loss": -6.816286087036133, "global_step": 152996, "epoch": 3642} {"train_loss": -6.8624444007873535, "global_step": 152997, "epoch": 3642} {"train_loss": -6.84902286529541, "global_step": 152998, "epoch": 3642} {"train_loss": -6.842832565307617, "global_step": 152999, "epoch": 3642} {"train_loss": -6.886560440063477, "global_step": 153000, "epoch": 3642} {"train_loss": -6.8013739585876465, "global_step": 153001, "epoch": 3642} {"train_loss": -6.869693756103516, "global_step": 153002, "epoch": 3642} {"train_loss": -6.918262958526611, "global_step": 153003, "epoch": 3642} {"train_loss": -6.925235271453857, "global_step": 153004, "epoch": 3642} {"train_loss": -6.852024736858549, "global_step": 153005, "epoch": 3642, "val_loss": 68105.71875} {"train_loss": -6.905473232269287, "global_step": 153006, "epoch": 3643} {"train_loss": -6.781267166137695, "global_step": 153007, "epoch": 3643} {"train_loss": -6.88802433013916, "global_step": 153008, "epoch": 3643} {"train_loss": -6.800427436828613, "global_step": 153009, "epoch": 3643} {"train_loss": -6.866448879241943, "global_step": 153010, "epoch": 3643} {"train_loss": -6.934762954711914, "global_step": 153011, "epoch": 3643} {"train_loss": -6.836939811706543, "global_step": 153012, "epoch": 3643} {"train_loss": -6.902126312255859, "global_step": 153013, "epoch": 3643} {"train_loss": -6.922413349151611, "global_step": 153014, "epoch": 3643} {"train_loss": -6.900843620300293, "global_step": 153015, "epoch": 3643} {"train_loss": -6.9193315505981445, "global_step": 153016, "epoch": 3643} {"train_loss": -6.968779563903809, "global_step": 153017, "epoch": 3643} {"train_loss": -6.891167640686035, "global_step": 153018, "epoch": 3643} {"train_loss": -6.863124847412109, "global_step": 153019, "epoch": 3643} {"train_loss": -6.750827789306641, "global_step": 153020, "epoch": 3643} {"train_loss": -6.899303436279297, "global_step": 153021, "epoch": 3643} {"train_loss": -6.8546342849731445, "global_step": 153022, "epoch": 3643} {"train_loss": -6.933620452880859, "global_step": 153023, "epoch": 3643} {"train_loss": -6.858413219451904, "global_step": 153024, "epoch": 3643} {"train_loss": -6.902400016784668, "global_step": 153025, "epoch": 3643} {"train_loss": -7.012688636779785, "global_step": 153026, "epoch": 3643} {"train_loss": -6.905102729797363, "global_step": 153027, "epoch": 3643} {"train_loss": -6.925947666168213, "global_step": 153028, "epoch": 3643} {"train_loss": -6.830138206481934, "global_step": 153029, "epoch": 3643} {"train_loss": -6.85357666015625, "global_step": 153030, "epoch": 3643} {"train_loss": -6.881552696228027, "global_step": 153031, "epoch": 3643} {"train_loss": -6.866231918334961, "global_step": 153032, "epoch": 3643} {"train_loss": -6.88062858581543, "global_step": 153033, "epoch": 3643} {"train_loss": -6.819267272949219, "global_step": 153034, "epoch": 3643} {"train_loss": -7.008451461791992, "global_step": 153035, "epoch": 3643} {"train_loss": -6.929015159606934, "global_step": 153036, "epoch": 3643} {"train_loss": -6.861142158508301, "global_step": 153037, "epoch": 3643} {"train_loss": -6.948218822479248, "global_step": 153038, "epoch": 3643} {"train_loss": -6.752485752105713, "global_step": 153039, "epoch": 3643} {"train_loss": -6.853100776672363, "global_step": 153040, "epoch": 3643} {"train_loss": -6.864409923553467, "global_step": 153041, "epoch": 3643} {"train_loss": -6.919314861297607, "global_step": 153042, "epoch": 3643} {"train_loss": -6.9372663497924805, "global_step": 153043, "epoch": 3643} {"train_loss": -6.949604034423828, "global_step": 153044, "epoch": 3643} {"train_loss": -6.934957504272461, "global_step": 153045, "epoch": 3643} {"train_loss": -6.925271987915039, "global_step": 153046, "epoch": 3643} {"train_loss": -6.887847060248966, "global_step": 153047, "epoch": 3643, "val_loss": 68215.46875} {"train_loss": -6.826080799102783, "global_step": 153048, "epoch": 3644} {"train_loss": -6.795128345489502, "global_step": 153049, "epoch": 3644} {"train_loss": -6.974560737609863, "global_step": 153050, "epoch": 3644} {"train_loss": -6.80735969543457, "global_step": 153051, "epoch": 3644} {"train_loss": -6.764557838439941, "global_step": 153052, "epoch": 3644} {"train_loss": -6.879561424255371, "global_step": 153053, "epoch": 3644} {"train_loss": -6.894583702087402, "global_step": 153054, "epoch": 3644} {"train_loss": -6.807079315185547, "global_step": 153055, "epoch": 3644} {"train_loss": -6.808993339538574, "global_step": 153056, "epoch": 3644} {"train_loss": -6.933480262756348, "global_step": 153057, "epoch": 3644} {"train_loss": -6.896116733551025, "global_step": 153058, "epoch": 3644} {"train_loss": -6.777963638305664, "global_step": 153059, "epoch": 3644} {"train_loss": -6.790763854980469, "global_step": 153060, "epoch": 3644} {"train_loss": -6.846982955932617, "global_step": 153061, "epoch": 3644} {"train_loss": -6.921959400177002, "global_step": 153062, "epoch": 3644} {"train_loss": -6.867128849029541, "global_step": 153063, "epoch": 3644} {"train_loss": -6.880756378173828, "global_step": 153064, "epoch": 3644} {"train_loss": -6.885221481323242, "global_step": 153065, "epoch": 3644} {"train_loss": -6.959563732147217, "global_step": 153066, "epoch": 3644} {"train_loss": -6.955825328826904, "global_step": 153067, "epoch": 3644} {"train_loss": -6.918404579162598, "global_step": 153068, "epoch": 3644} {"train_loss": -6.851320266723633, "global_step": 153069, "epoch": 3644} {"train_loss": -6.844944000244141, "global_step": 153070, "epoch": 3644} {"train_loss": -6.914173126220703, "global_step": 153071, "epoch": 3644} {"train_loss": -6.930931568145752, "global_step": 153072, "epoch": 3644} {"train_loss": -6.7871294021606445, "global_step": 153073, "epoch": 3644} {"train_loss": -6.819892883300781, "global_step": 153074, "epoch": 3644} {"train_loss": -6.955507278442383, "global_step": 153075, "epoch": 3644} {"train_loss": -6.91407585144043, "global_step": 153076, "epoch": 3644} {"train_loss": -6.942756175994873, "global_step": 153077, "epoch": 3644} {"train_loss": -6.909352779388428, "global_step": 153078, "epoch": 3644} {"train_loss": -6.786677360534668, "global_step": 153079, "epoch": 3644} {"train_loss": -6.884222984313965, "global_step": 153080, "epoch": 3644} {"train_loss": -6.968605041503906, "global_step": 153081, "epoch": 3644} {"train_loss": -6.924332141876221, "global_step": 153082, "epoch": 3644} {"train_loss": -6.871511459350586, "global_step": 153083, "epoch": 3644} {"train_loss": -6.931316375732422, "global_step": 153084, "epoch": 3644} {"train_loss": -6.863592147827148, "global_step": 153085, "epoch": 3644} {"train_loss": -6.86031436920166, "global_step": 153086, "epoch": 3644} {"train_loss": -6.939800262451172, "global_step": 153087, "epoch": 3644} {"train_loss": -6.900261878967285, "global_step": 153088, "epoch": 3644} {"train_loss": -6.8815628460475375, "global_step": 153089, "epoch": 3644, "val_loss": 68210.015625} {"train_loss": -6.945058822631836, "global_step": 153090, "epoch": 3645} {"train_loss": -6.931275367736816, "global_step": 153091, "epoch": 3645} {"train_loss": -6.896442413330078, "global_step": 153092, "epoch": 3645} {"train_loss": -6.998116493225098, "global_step": 153093, "epoch": 3645} {"train_loss": -6.966658115386963, "global_step": 153094, "epoch": 3645} {"train_loss": -6.88480806350708, "global_step": 153095, "epoch": 3645} {"train_loss": -6.9108781814575195, "global_step": 153096, "epoch": 3645} {"train_loss": -6.890277862548828, "global_step": 153097, "epoch": 3645} {"train_loss": -6.891197204589844, "global_step": 153098, "epoch": 3645} {"train_loss": -6.867507457733154, "global_step": 153099, "epoch": 3645} {"train_loss": -6.888517379760742, "global_step": 153100, "epoch": 3645} {"train_loss": -6.8316450119018555, "global_step": 153101, "epoch": 3645} {"train_loss": -6.831607341766357, "global_step": 153102, "epoch": 3645} {"train_loss": -6.968936920166016, "global_step": 153103, "epoch": 3645} {"train_loss": -6.933984279632568, "global_step": 153104, "epoch": 3645} {"train_loss": -6.989370346069336, "global_step": 153105, "epoch": 3645} {"train_loss": -6.915282249450684, "global_step": 153106, "epoch": 3645} {"train_loss": -6.87178373336792, "global_step": 153107, "epoch": 3645} {"train_loss": -6.887292861938477, "global_step": 153108, "epoch": 3645} {"train_loss": -6.90439510345459, "global_step": 153109, "epoch": 3645} {"train_loss": -6.895759582519531, "global_step": 153110, "epoch": 3645} {"train_loss": -6.973636150360107, "global_step": 153111, "epoch": 3645} {"train_loss": -6.937320232391357, "global_step": 153112, "epoch": 3645} {"train_loss": -6.892359256744385, "global_step": 153113, "epoch": 3645} {"train_loss": -6.867071628570557, "global_step": 153114, "epoch": 3645} {"train_loss": -7.052267551422119, "global_step": 153115, "epoch": 3645} {"train_loss": -6.969296932220459, "global_step": 153116, "epoch": 3645} {"train_loss": -7.014151573181152, "global_step": 153117, "epoch": 3645} {"train_loss": -6.848767280578613, "global_step": 153118, "epoch": 3645} {"train_loss": -6.799830436706543, "global_step": 153119, "epoch": 3645} {"train_loss": -6.920449733734131, "global_step": 153120, "epoch": 3645} {"train_loss": -6.926538944244385, "global_step": 153121, "epoch": 3645} {"train_loss": -6.849421501159668, "global_step": 153122, "epoch": 3645} {"train_loss": -6.860284805297852, "global_step": 153123, "epoch": 3645} {"train_loss": -6.848390102386475, "global_step": 153124, "epoch": 3645} {"train_loss": -6.871954441070557, "global_step": 153125, "epoch": 3645} {"train_loss": -6.880366325378418, "global_step": 153126, "epoch": 3645} {"train_loss": -6.850371360778809, "global_step": 153127, "epoch": 3645} {"train_loss": -6.990772247314453, "global_step": 153128, "epoch": 3645} {"train_loss": -6.887032508850098, "global_step": 153129, "epoch": 3645} {"train_loss": -6.862090110778809, "global_step": 153130, "epoch": 3645} {"train_loss": -6.90925247328622, "global_step": 153131, "epoch": 3645, "val_loss": 68240.3984375} {"train_loss": -6.863366603851318, "global_step": 153132, "epoch": 3646} {"train_loss": -6.893696308135986, "global_step": 153133, "epoch": 3646} {"train_loss": -6.836047649383545, "global_step": 153134, "epoch": 3646} {"train_loss": -6.858816623687744, "global_step": 153135, "epoch": 3646} {"train_loss": -6.875181198120117, "global_step": 153136, "epoch": 3646} {"train_loss": -6.8579182624816895, "global_step": 153137, "epoch": 3646} {"train_loss": -6.982595443725586, "global_step": 153138, "epoch": 3646} {"train_loss": -6.932008743286133, "global_step": 153139, "epoch": 3646} {"train_loss": -6.90639591217041, "global_step": 153140, "epoch": 3646} {"train_loss": -6.905629634857178, "global_step": 153141, "epoch": 3646} {"train_loss": -7.008700847625732, "global_step": 153142, "epoch": 3646} {"train_loss": -6.853676795959473, "global_step": 153143, "epoch": 3646} {"train_loss": -6.954751968383789, "global_step": 153144, "epoch": 3646} {"train_loss": -6.9154052734375, "global_step": 153145, "epoch": 3646} {"train_loss": -6.809195518493652, "global_step": 153146, "epoch": 3646} {"train_loss": -6.8514909744262695, "global_step": 153147, "epoch": 3646} {"train_loss": -6.944178104400635, "global_step": 153148, "epoch": 3646} {"train_loss": -7.010863304138184, "global_step": 153149, "epoch": 3646} {"train_loss": -7.010196685791016, "global_step": 153150, "epoch": 3646} {"train_loss": -6.889981269836426, "global_step": 153151, "epoch": 3646} {"train_loss": -6.901721477508545, "global_step": 153152, "epoch": 3646} {"train_loss": -7.015007972717285, "global_step": 153153, "epoch": 3646} {"train_loss": -6.988161563873291, "global_step": 153154, "epoch": 3646} {"train_loss": -7.016294479370117, "global_step": 153155, "epoch": 3646} {"train_loss": -7.008033752441406, "global_step": 153156, "epoch": 3646} {"train_loss": -6.969399452209473, "global_step": 153157, "epoch": 3646} {"train_loss": -6.9421257972717285, "global_step": 153158, "epoch": 3646} {"train_loss": -6.852390289306641, "global_step": 153159, "epoch": 3646} {"train_loss": -6.922008991241455, "global_step": 153160, "epoch": 3646} {"train_loss": -6.9690141677856445, "global_step": 153161, "epoch": 3646} {"train_loss": -6.994058609008789, "global_step": 153162, "epoch": 3646} {"train_loss": -7.012151718139648, "global_step": 153163, "epoch": 3646} {"train_loss": -6.946380615234375, "global_step": 153164, "epoch": 3646} {"train_loss": -6.911013603210449, "global_step": 153165, "epoch": 3646} {"train_loss": -6.90606689453125, "global_step": 153166, "epoch": 3646} {"train_loss": -6.996127128601074, "global_step": 153167, "epoch": 3646} {"train_loss": -6.968546390533447, "global_step": 153168, "epoch": 3646} {"train_loss": -6.837122917175293, "global_step": 153169, "epoch": 3646} {"train_loss": -6.922728061676025, "global_step": 153170, "epoch": 3646} {"train_loss": -6.826115608215332, "global_step": 153171, "epoch": 3646} {"train_loss": -6.890190601348877, "global_step": 153172, "epoch": 3646} {"train_loss": -6.926359358287993, "global_step": 153173, "epoch": 3646, "val_loss": 68322.1953125} {"train_loss": -6.889163017272949, "global_step": 153174, "epoch": 3647} {"train_loss": -6.846295356750488, "global_step": 153175, "epoch": 3647} {"train_loss": -6.878181457519531, "global_step": 153176, "epoch": 3647} {"train_loss": -6.884820461273193, "global_step": 153177, "epoch": 3647} {"train_loss": -6.906508445739746, "global_step": 153178, "epoch": 3647} {"train_loss": -6.818308353424072, "global_step": 153179, "epoch": 3647} {"train_loss": -6.9441328048706055, "global_step": 153180, "epoch": 3647} {"train_loss": -6.858782768249512, "global_step": 153181, "epoch": 3647} {"train_loss": -6.602931976318359, "global_step": 153182, "epoch": 3647} {"train_loss": -6.8968095779418945, "global_step": 153183, "epoch": 3647} {"train_loss": -6.814361095428467, "global_step": 153184, "epoch": 3647} {"train_loss": -6.843576431274414, "global_step": 153185, "epoch": 3647} {"train_loss": -6.932036399841309, "global_step": 153186, "epoch": 3647} {"train_loss": -6.942248344421387, "global_step": 153187, "epoch": 3647} {"train_loss": -6.778124809265137, "global_step": 153188, "epoch": 3647} {"train_loss": -6.764497756958008, "global_step": 153189, "epoch": 3647} {"train_loss": -6.796914100646973, "global_step": 153190, "epoch": 3647} {"train_loss": -6.733491897583008, "global_step": 153191, "epoch": 3647} {"train_loss": -6.801995277404785, "global_step": 153192, "epoch": 3647} {"train_loss": -6.916896820068359, "global_step": 153193, "epoch": 3647} {"train_loss": -6.816037178039551, "global_step": 153194, "epoch": 3647} {"train_loss": -6.726534843444824, "global_step": 153195, "epoch": 3647} {"train_loss": -6.698001861572266, "global_step": 153196, "epoch": 3647} {"train_loss": -6.685997009277344, "global_step": 153197, "epoch": 3647} {"train_loss": -6.832009315490723, "global_step": 153198, "epoch": 3647} {"train_loss": -6.704795837402344, "global_step": 153199, "epoch": 3647} {"train_loss": -6.914889335632324, "global_step": 153200, "epoch": 3647} {"train_loss": -6.738584995269775, "global_step": 153201, "epoch": 3647} {"train_loss": -6.719692230224609, "global_step": 153202, "epoch": 3647} {"train_loss": -6.85714054107666, "global_step": 153203, "epoch": 3647} {"train_loss": -6.6871113777160645, "global_step": 153204, "epoch": 3647} {"train_loss": -6.736433982849121, "global_step": 153205, "epoch": 3647} {"train_loss": -6.91718864440918, "global_step": 153206, "epoch": 3647} {"train_loss": -6.811209678649902, "global_step": 153207, "epoch": 3647} {"train_loss": -6.798439979553223, "global_step": 153208, "epoch": 3647} {"train_loss": -6.807227611541748, "global_step": 153209, "epoch": 3647} {"train_loss": -6.84995174407959, "global_step": 153210, "epoch": 3647} {"train_loss": -6.781865119934082, "global_step": 153211, "epoch": 3647} {"train_loss": -6.789256572723389, "global_step": 153212, "epoch": 3647} {"train_loss": -6.859199523925781, "global_step": 153213, "epoch": 3647} {"train_loss": -6.916817665100098, "global_step": 153214, "epoch": 3647} {"train_loss": -6.819250538235619, "global_step": 153215, "epoch": 3647, "val_loss": 68233.8984375} {"train_loss": -6.904067039489746, "global_step": 153216, "epoch": 3648} {"train_loss": -6.815124034881592, "global_step": 153217, "epoch": 3648} {"train_loss": -6.805197715759277, "global_step": 153218, "epoch": 3648} {"train_loss": -6.913008213043213, "global_step": 153219, "epoch": 3648} {"train_loss": -6.871953010559082, "global_step": 153220, "epoch": 3648} {"train_loss": -6.866838455200195, "global_step": 153221, "epoch": 3648} {"train_loss": -6.754683494567871, "global_step": 153222, "epoch": 3648} {"train_loss": -6.791380882263184, "global_step": 153223, "epoch": 3648} {"train_loss": -6.911988258361816, "global_step": 153224, "epoch": 3648} {"train_loss": -6.690080642700195, "global_step": 153225, "epoch": 3648} {"train_loss": -6.8353166580200195, "global_step": 153226, "epoch": 3648} {"train_loss": -6.806249618530273, "global_step": 153227, "epoch": 3648} {"train_loss": -6.871226787567139, "global_step": 153228, "epoch": 3648} {"train_loss": -6.818731307983398, "global_step": 153229, "epoch": 3648} {"train_loss": -6.840244770050049, "global_step": 153230, "epoch": 3648} {"train_loss": -6.8948798179626465, "global_step": 153231, "epoch": 3648} {"train_loss": -6.986660003662109, "global_step": 153232, "epoch": 3648} {"train_loss": -6.882742881774902, "global_step": 153233, "epoch": 3648} {"train_loss": -6.891413688659668, "global_step": 153234, "epoch": 3648} {"train_loss": -6.8999786376953125, "global_step": 153235, "epoch": 3648} {"train_loss": -6.819803237915039, "global_step": 153236, "epoch": 3648} {"train_loss": -6.9688639640808105, "global_step": 153237, "epoch": 3648} {"train_loss": -6.893178939819336, "global_step": 153238, "epoch": 3648} {"train_loss": -6.850366592407227, "global_step": 153239, "epoch": 3648} {"train_loss": -6.824183464050293, "global_step": 153240, "epoch": 3648} {"train_loss": -6.830931663513184, "global_step": 153241, "epoch": 3648} {"train_loss": -6.7478179931640625, "global_step": 153242, "epoch": 3648} {"train_loss": -6.9133710861206055, "global_step": 153243, "epoch": 3648} {"train_loss": -7.017777442932129, "global_step": 153244, "epoch": 3648} {"train_loss": -6.73093318939209, "global_step": 153245, "epoch": 3648} {"train_loss": -6.885751724243164, "global_step": 153246, "epoch": 3648} {"train_loss": -6.879899978637695, "global_step": 153247, "epoch": 3648} {"train_loss": -6.909402370452881, "global_step": 153248, "epoch": 3648} {"train_loss": -6.919026851654053, "global_step": 153249, "epoch": 3648} {"train_loss": -6.838747024536133, "global_step": 153250, "epoch": 3648} {"train_loss": -6.854757785797119, "global_step": 153251, "epoch": 3648} {"train_loss": -6.82982063293457, "global_step": 153252, "epoch": 3648} {"train_loss": -6.822181701660156, "global_step": 153253, "epoch": 3648} {"train_loss": -6.872894287109375, "global_step": 153254, "epoch": 3648} {"train_loss": -6.801681995391846, "global_step": 153255, "epoch": 3648} {"train_loss": -6.879703044891357, "global_step": 153256, "epoch": 3648} {"train_loss": -6.859437329428537, "global_step": 153257, "epoch": 3648, "val_loss": 68223.609375} {"train_loss": -6.9007744789123535, "global_step": 153258, "epoch": 3649} {"train_loss": -6.9665374755859375, "global_step": 153259, "epoch": 3649} {"train_loss": -6.907151222229004, "global_step": 153260, "epoch": 3649} {"train_loss": -6.822453022003174, "global_step": 153261, "epoch": 3649} {"train_loss": -6.807931423187256, "global_step": 153262, "epoch": 3649} {"train_loss": -6.860949993133545, "global_step": 153263, "epoch": 3649} {"train_loss": -6.908100605010986, "global_step": 153264, "epoch": 3649} {"train_loss": -6.826836109161377, "global_step": 153265, "epoch": 3649} {"train_loss": -6.888452053070068, "global_step": 153266, "epoch": 3649} {"train_loss": -6.943638324737549, "global_step": 153267, "epoch": 3649} {"train_loss": -6.855733871459961, "global_step": 153268, "epoch": 3649} {"train_loss": -6.8528151512146, "global_step": 153269, "epoch": 3649} {"train_loss": -6.778554916381836, "global_step": 153270, "epoch": 3649} {"train_loss": -6.910261154174805, "global_step": 153271, "epoch": 3649} {"train_loss": -6.906889915466309, "global_step": 153272, "epoch": 3649} {"train_loss": -6.88075590133667, "global_step": 153273, "epoch": 3649} {"train_loss": -6.865495681762695, "global_step": 153274, "epoch": 3649} {"train_loss": -6.923300266265869, "global_step": 153275, "epoch": 3649} {"train_loss": -6.910483360290527, "global_step": 153276, "epoch": 3649} {"train_loss": -6.951521873474121, "global_step": 153277, "epoch": 3649} {"train_loss": -6.876059532165527, "global_step": 153278, "epoch": 3649} {"train_loss": -7.025757789611816, "global_step": 153279, "epoch": 3649} {"train_loss": -6.902477264404297, "global_step": 153280, "epoch": 3649} {"train_loss": -6.891745567321777, "global_step": 153281, "epoch": 3649} {"train_loss": -6.910712242126465, "global_step": 153282, "epoch": 3649} {"train_loss": -6.9855546951293945, "global_step": 153283, "epoch": 3649} {"train_loss": -6.884661674499512, "global_step": 153284, "epoch": 3649} {"train_loss": -6.81111478805542, "global_step": 153285, "epoch": 3649} {"train_loss": -6.9251604080200195, "global_step": 153286, "epoch": 3649} {"train_loss": -6.882942199707031, "global_step": 153287, "epoch": 3649} {"train_loss": -6.917228698730469, "global_step": 153288, "epoch": 3649} {"train_loss": -6.958037376403809, "global_step": 153289, "epoch": 3649} {"train_loss": -6.922473907470703, "global_step": 153290, "epoch": 3649} {"train_loss": -6.882793426513672, "global_step": 153291, "epoch": 3649} {"train_loss": -6.980887413024902, "global_step": 153292, "epoch": 3649} {"train_loss": -6.936730861663818, "global_step": 153293, "epoch": 3649} {"train_loss": -7.007291316986084, "global_step": 153294, "epoch": 3649} {"train_loss": -6.841678619384766, "global_step": 153295, "epoch": 3649} {"train_loss": -6.948577404022217, "global_step": 153296, "epoch": 3649} {"train_loss": -6.9494147300720215, "global_step": 153297, "epoch": 3649} {"train_loss": -6.967829704284668, "global_step": 153298, "epoch": 3649} {"train_loss": -6.902489083153861, "global_step": 153299, "epoch": 3649, "val_loss": 68282.4609375} {"train_loss": -6.644092559814453, "global_step": 153300, "epoch": 3650} {"train_loss": -6.794539451599121, "global_step": 153301, "epoch": 3650} {"train_loss": -6.877917289733887, "global_step": 153302, "epoch": 3650} {"train_loss": -6.690445899963379, "global_step": 153303, "epoch": 3650} {"train_loss": -6.796910285949707, "global_step": 153304, "epoch": 3650} {"train_loss": -6.8119096755981445, "global_step": 153305, "epoch": 3650} {"train_loss": -6.707236289978027, "global_step": 153306, "epoch": 3650} {"train_loss": -6.962303161621094, "global_step": 153307, "epoch": 3650} {"train_loss": -6.8951921463012695, "global_step": 153308, "epoch": 3650} {"train_loss": -6.830650329589844, "global_step": 153309, "epoch": 3650} {"train_loss": -6.9481730461120605, "global_step": 153310, "epoch": 3650} {"train_loss": -6.826103210449219, "global_step": 153311, "epoch": 3650} {"train_loss": -6.887557029724121, "global_step": 153312, "epoch": 3650} {"train_loss": -6.734256267547607, "global_step": 153313, "epoch": 3650} {"train_loss": -6.76040506362915, "global_step": 153314, "epoch": 3650} {"train_loss": -6.89970064163208, "global_step": 153315, "epoch": 3650} {"train_loss": -6.835447311401367, "global_step": 153316, "epoch": 3650} {"train_loss": -6.877015113830566, "global_step": 153317, "epoch": 3650} {"train_loss": -6.770386219024658, "global_step": 153318, "epoch": 3650} {"train_loss": -6.773068428039551, "global_step": 153319, "epoch": 3650} {"train_loss": -6.799549102783203, "global_step": 153320, "epoch": 3650} {"train_loss": -6.800512790679932, "global_step": 153321, "epoch": 3650} {"train_loss": -6.820198059082031, "global_step": 153322, "epoch": 3650} {"train_loss": -6.9712677001953125, "global_step": 153323, "epoch": 3650} {"train_loss": -6.858458995819092, "global_step": 153324, "epoch": 3650} {"train_loss": -6.894205570220947, "global_step": 153325, "epoch": 3650} {"train_loss": -6.941840648651123, "global_step": 153326, "epoch": 3650} {"train_loss": -6.846906661987305, "global_step": 153327, "epoch": 3650} {"train_loss": -6.918022632598877, "global_step": 153328, "epoch": 3650} {"train_loss": -7.002810955047607, "global_step": 153329, "epoch": 3650} {"train_loss": -6.974514961242676, "global_step": 153330, "epoch": 3650} {"train_loss": -6.854779243469238, "global_step": 153331, "epoch": 3650} {"train_loss": -6.761105060577393, "global_step": 153332, "epoch": 3650} {"train_loss": -6.839056015014648, "global_step": 153333, "epoch": 3650} {"train_loss": -6.895977973937988, "global_step": 153334, "epoch": 3650} {"train_loss": -6.8572235107421875, "global_step": 153335, "epoch": 3650} {"train_loss": -6.81497859954834, "global_step": 153336, "epoch": 3650} {"train_loss": -6.946277618408203, "global_step": 153337, "epoch": 3650} {"train_loss": -6.861860275268555, "global_step": 153338, "epoch": 3650} {"train_loss": -6.8374552726745605, "global_step": 153339, "epoch": 3650} {"train_loss": -6.876665115356445, "global_step": 153340, "epoch": 3650} {"train_loss": -6.845609233492897, "global_step": 153341, "epoch": 3650, "train/sim_max_reward_0": 0.19832112577466782, "train/sim_max_reward_1": 0.9010132920570793, "train/sim_max_reward_2": 0.4414674250942236, "train/sim_max_reward_3": 0.49803920456858974, "train/sim_max_reward_4": 0.9417250231323707, "train/sim_max_reward_5": 0.8386604251372556, "test/sim_max_reward_4300000": 0.4753309226137109, "test/sim_max_reward_4300001": 0.3441702793819972, "test/sim_max_reward_4300002": 0.9266775456668669, "test/sim_max_reward_4300003": 0.9823477562814945, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9497357401213375, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.33543119063353033, "test/sim_max_reward_4300008": 0.7450125791834766, "test/sim_max_reward_4300009": 0.983241669121237, "test/sim_max_reward_4300010": 0.9842280496878529, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.8784988113871336, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9677814915444606, "test/sim_max_reward_4300016": 0.0012996660752393934, "test/sim_max_reward_4300017": 0.9687181909709245, "test/sim_max_reward_4300018": 0.41622516779290664, "test/sim_max_reward_4300019": 0.1859143041541571, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 1.0, "test/sim_max_reward_4300022": 0.9561987308838672, "test/sim_max_reward_4300023": 0.9318286093684279, "test/sim_max_reward_4300024": 0.7831029548087837, "test/sim_max_reward_4300025": 0.8137036423954949, "test/sim_max_reward_4300026": 0.1724618751718285, "test/sim_max_reward_4300027": 0.8469293720586861, "test/sim_max_reward_4300028": 0.8491753680806607, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.28285383110897916, "test/sim_max_reward_4300031": 0.25587831627863517, "test/sim_max_reward_4300032": 0.8628859071018821, "test/sim_max_reward_4300033": 0.8367962008982852, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.16557106182515566, "test/sim_max_reward_4300036": 0.20172527542279503, "test/sim_max_reward_4300037": 0.6444815320994476, "test/sim_max_reward_4300038": 0.8891482175323522, "test/sim_max_reward_4300039": 0.8939373873093789, "test/sim_max_reward_4300040": 0.9331806422576717, "test/sim_max_reward_4300041": 1.0, "test/sim_max_reward_4300042": 0.603647718794272, "test/sim_max_reward_4300043": 0.16190032506463695, "test/sim_max_reward_4300044": 0.8815971221761914, "test/sim_max_reward_4300045": 0.9648127043474894, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.1657472658721484, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.2081349103546688, "train/mean_score": 0.6365377492940311, "test/mean_score": 0.609322928812747, "val_loss": 68302.9375} {"train_loss": -6.776793479919434, "global_step": 153342, "epoch": 3651} {"train_loss": -6.795663833618164, "global_step": 153343, "epoch": 3651} {"train_loss": -6.734007358551025, "global_step": 153344, "epoch": 3651} {"train_loss": -6.905731678009033, "global_step": 153345, "epoch": 3651} {"train_loss": -6.765569686889648, "global_step": 153346, "epoch": 3651} {"train_loss": -6.827404022216797, "global_step": 153347, "epoch": 3651} {"train_loss": -6.925350189208984, "global_step": 153348, "epoch": 3651} {"train_loss": -6.80535888671875, "global_step": 153349, "epoch": 3651} {"train_loss": -6.768057823181152, "global_step": 153350, "epoch": 3651} {"train_loss": -6.838723182678223, "global_step": 153351, "epoch": 3651} {"train_loss": -6.925693511962891, "global_step": 153352, "epoch": 3651} {"train_loss": -6.879243850708008, "global_step": 153353, "epoch": 3651} {"train_loss": -6.862240791320801, "global_step": 153354, "epoch": 3651} {"train_loss": -6.90541934967041, "global_step": 153355, "epoch": 3651} {"train_loss": -6.768694877624512, "global_step": 153356, "epoch": 3651} {"train_loss": -6.879601001739502, "global_step": 153357, "epoch": 3651} {"train_loss": -6.946839332580566, "global_step": 153358, "epoch": 3651} {"train_loss": -6.866878986358643, "global_step": 153359, "epoch": 3651} {"train_loss": -6.908124923706055, "global_step": 153360, "epoch": 3651} {"train_loss": -6.809098243713379, "global_step": 153361, "epoch": 3651} {"train_loss": -6.896503925323486, "global_step": 153362, "epoch": 3651} {"train_loss": -6.854018211364746, "global_step": 153363, "epoch": 3651} {"train_loss": -6.884610176086426, "global_step": 153364, "epoch": 3651} {"train_loss": -6.687128067016602, "global_step": 153365, "epoch": 3651} {"train_loss": -6.818284034729004, "global_step": 153366, "epoch": 3651} {"train_loss": -6.8901495933532715, "global_step": 153367, "epoch": 3651} {"train_loss": -6.758684158325195, "global_step": 153368, "epoch": 3651} {"train_loss": -6.829637050628662, "global_step": 153369, "epoch": 3651} {"train_loss": -6.6663618087768555, "global_step": 153370, "epoch": 3651} {"train_loss": -6.978117942810059, "global_step": 153371, "epoch": 3651} {"train_loss": -6.848936080932617, "global_step": 153372, "epoch": 3651} {"train_loss": -6.751191139221191, "global_step": 153373, "epoch": 3651} {"train_loss": -6.976686477661133, "global_step": 153374, "epoch": 3651} {"train_loss": -6.778839111328125, "global_step": 153375, "epoch": 3651} {"train_loss": -6.723687648773193, "global_step": 153376, "epoch": 3651} {"train_loss": -6.77109432220459, "global_step": 153377, "epoch": 3651} {"train_loss": -6.845133304595947, "global_step": 153378, "epoch": 3651} {"train_loss": -6.790022850036621, "global_step": 153379, "epoch": 3651} {"train_loss": -6.989875793457031, "global_step": 153380, "epoch": 3651} {"train_loss": -6.809292316436768, "global_step": 153381, "epoch": 3651} {"train_loss": -6.78422212600708, "global_step": 153382, "epoch": 3651} {"train_loss": -6.836339076360066, "global_step": 153383, "epoch": 3651, "val_loss": 68333.1015625} {"train_loss": -6.766721725463867, "global_step": 153384, "epoch": 3652} {"train_loss": -6.890671253204346, "global_step": 153385, "epoch": 3652} {"train_loss": -6.925225257873535, "global_step": 153386, "epoch": 3652} {"train_loss": -6.914693355560303, "global_step": 153387, "epoch": 3652} {"train_loss": -6.965344429016113, "global_step": 153388, "epoch": 3652} {"train_loss": -6.943300247192383, "global_step": 153389, "epoch": 3652} {"train_loss": -6.937973976135254, "global_step": 153390, "epoch": 3652} {"train_loss": -6.895670413970947, "global_step": 153391, "epoch": 3652} {"train_loss": -6.8934407234191895, "global_step": 153392, "epoch": 3652} {"train_loss": -6.91464900970459, "global_step": 153393, "epoch": 3652} {"train_loss": -6.867804050445557, "global_step": 153394, "epoch": 3652} {"train_loss": -6.756702899932861, "global_step": 153395, "epoch": 3652} {"train_loss": -6.916990280151367, "global_step": 153396, "epoch": 3652} {"train_loss": -6.888021469116211, "global_step": 153397, "epoch": 3652} {"train_loss": -6.858771324157715, "global_step": 153398, "epoch": 3652} {"train_loss": -6.967128753662109, "global_step": 153399, "epoch": 3652} {"train_loss": -6.8825225830078125, "global_step": 153400, "epoch": 3652} {"train_loss": -6.898481845855713, "global_step": 153401, "epoch": 3652} {"train_loss": -6.822550296783447, "global_step": 153402, "epoch": 3652} {"train_loss": -6.9284257888793945, "global_step": 153403, "epoch": 3652} {"train_loss": -6.925110816955566, "global_step": 153404, "epoch": 3652} {"train_loss": -6.896910667419434, "global_step": 153405, "epoch": 3652} {"train_loss": -6.984491348266602, "global_step": 153406, "epoch": 3652} {"train_loss": -7.018012046813965, "global_step": 153407, "epoch": 3652} {"train_loss": -6.860055923461914, "global_step": 153408, "epoch": 3652} {"train_loss": -6.937884330749512, "global_step": 153409, "epoch": 3652} {"train_loss": -6.896956443786621, "global_step": 153410, "epoch": 3652} {"train_loss": -6.76375675201416, "global_step": 153411, "epoch": 3652} {"train_loss": -6.933197021484375, "global_step": 153412, "epoch": 3652} {"train_loss": -6.945639610290527, "global_step": 153413, "epoch": 3652} {"train_loss": -6.877091407775879, "global_step": 153414, "epoch": 3652} {"train_loss": -6.796686172485352, "global_step": 153415, "epoch": 3652} {"train_loss": -6.714086532592773, "global_step": 153416, "epoch": 3652} {"train_loss": -6.613231658935547, "global_step": 153417, "epoch": 3652} {"train_loss": -6.815564155578613, "global_step": 153418, "epoch": 3652} {"train_loss": -6.949873924255371, "global_step": 153419, "epoch": 3652} {"train_loss": -6.835661888122559, "global_step": 153420, "epoch": 3652} {"train_loss": -6.917716026306152, "global_step": 153421, "epoch": 3652} {"train_loss": -6.927706718444824, "global_step": 153422, "epoch": 3652} {"train_loss": -6.890012741088867, "global_step": 153423, "epoch": 3652} {"train_loss": -6.877007484436035, "global_step": 153424, "epoch": 3652} {"train_loss": -6.882301217033749, "global_step": 153425, "epoch": 3652, "val_loss": 68048.78125} {"train_loss": -6.877310752868652, "global_step": 153426, "epoch": 3653} {"train_loss": -6.789982795715332, "global_step": 153427, "epoch": 3653} {"train_loss": -7.012200832366943, "global_step": 153428, "epoch": 3653} {"train_loss": -6.931481838226318, "global_step": 153429, "epoch": 3653} {"train_loss": -6.810737609863281, "global_step": 153430, "epoch": 3653} {"train_loss": -6.914820671081543, "global_step": 153431, "epoch": 3653} {"train_loss": -6.811871528625488, "global_step": 153432, "epoch": 3653} {"train_loss": -6.895049095153809, "global_step": 153433, "epoch": 3653} {"train_loss": -7.00009822845459, "global_step": 153434, "epoch": 3653} {"train_loss": -7.030543327331543, "global_step": 153435, "epoch": 3653} {"train_loss": -7.019906997680664, "global_step": 153436, "epoch": 3653} {"train_loss": -6.8695831298828125, "global_step": 153437, "epoch": 3653} {"train_loss": -6.902495384216309, "global_step": 153438, "epoch": 3653} {"train_loss": -6.903792381286621, "global_step": 153439, "epoch": 3653} {"train_loss": -6.848618030548096, "global_step": 153440, "epoch": 3653} {"train_loss": -6.926902770996094, "global_step": 153441, "epoch": 3653} {"train_loss": -7.072175979614258, "global_step": 153442, "epoch": 3653} {"train_loss": -6.9751129150390625, "global_step": 153443, "epoch": 3653} {"train_loss": -7.0009026527404785, "global_step": 153444, "epoch": 3653} {"train_loss": -6.89493465423584, "global_step": 153445, "epoch": 3653} {"train_loss": -6.929359436035156, "global_step": 153446, "epoch": 3653} {"train_loss": -6.955998420715332, "global_step": 153447, "epoch": 3653} {"train_loss": -6.78859806060791, "global_step": 153448, "epoch": 3653} {"train_loss": -6.981595993041992, "global_step": 153449, "epoch": 3653} {"train_loss": -6.886139869689941, "global_step": 153450, "epoch": 3653} {"train_loss": -6.981411933898926, "global_step": 153451, "epoch": 3653} {"train_loss": -6.940061092376709, "global_step": 153452, "epoch": 3653} {"train_loss": -6.951783180236816, "global_step": 153453, "epoch": 3653} {"train_loss": -6.893548488616943, "global_step": 153454, "epoch": 3653} {"train_loss": -6.998078346252441, "global_step": 153455, "epoch": 3653} {"train_loss": -6.895071983337402, "global_step": 153456, "epoch": 3653} {"train_loss": -6.764726638793945, "global_step": 153457, "epoch": 3653} {"train_loss": -6.820261478424072, "global_step": 153458, "epoch": 3653} {"train_loss": -6.896512985229492, "global_step": 153459, "epoch": 3653} {"train_loss": -7.006547927856445, "global_step": 153460, "epoch": 3653} {"train_loss": -6.876119613647461, "global_step": 153461, "epoch": 3653} {"train_loss": -6.869811058044434, "global_step": 153462, "epoch": 3653} {"train_loss": -6.998439788818359, "global_step": 153463, "epoch": 3653} {"train_loss": -6.654768943786621, "global_step": 153464, "epoch": 3653} {"train_loss": -6.810647964477539, "global_step": 153465, "epoch": 3653} {"train_loss": -6.8870015144348145, "global_step": 153466, "epoch": 3653} {"train_loss": -6.905504135858445, "global_step": 153467, "epoch": 3653, "val_loss": 68190.671875} {"train_loss": -6.784526824951172, "global_step": 153468, "epoch": 3654} {"train_loss": -6.886704444885254, "global_step": 153469, "epoch": 3654} {"train_loss": -6.817146301269531, "global_step": 153470, "epoch": 3654} {"train_loss": -6.733709335327148, "global_step": 153471, "epoch": 3654} {"train_loss": -6.878574371337891, "global_step": 153472, "epoch": 3654} {"train_loss": -6.7028889656066895, "global_step": 153473, "epoch": 3654} {"train_loss": -6.89749002456665, "global_step": 153474, "epoch": 3654} {"train_loss": -6.772067070007324, "global_step": 153475, "epoch": 3654} {"train_loss": -6.774473190307617, "global_step": 153476, "epoch": 3654} {"train_loss": -6.928296089172363, "global_step": 153477, "epoch": 3654} {"train_loss": -6.829050064086914, "global_step": 153478, "epoch": 3654} {"train_loss": -6.858421325683594, "global_step": 153479, "epoch": 3654} {"train_loss": -6.88801908493042, "global_step": 153480, "epoch": 3654} {"train_loss": -6.900217056274414, "global_step": 153481, "epoch": 3654} {"train_loss": -6.843161582946777, "global_step": 153482, "epoch": 3654} {"train_loss": -6.96513557434082, "global_step": 153483, "epoch": 3654} {"train_loss": -6.8296003341674805, "global_step": 153484, "epoch": 3654} {"train_loss": -6.981174468994141, "global_step": 153485, "epoch": 3654} {"train_loss": -6.878786563873291, "global_step": 153486, "epoch": 3654} {"train_loss": -6.83077335357666, "global_step": 153487, "epoch": 3654} {"train_loss": -6.828502655029297, "global_step": 153488, "epoch": 3654} {"train_loss": -6.880640983581543, "global_step": 153489, "epoch": 3654} {"train_loss": -6.888503551483154, "global_step": 153490, "epoch": 3654} {"train_loss": -6.909632205963135, "global_step": 153491, "epoch": 3654} {"train_loss": -6.886317253112793, "global_step": 153492, "epoch": 3654} {"train_loss": -6.954583644866943, "global_step": 153493, "epoch": 3654} {"train_loss": -6.860067367553711, "global_step": 153494, "epoch": 3654} {"train_loss": -6.9264912605285645, "global_step": 153495, "epoch": 3654} {"train_loss": -6.838482856750488, "global_step": 153496, "epoch": 3654} {"train_loss": -6.941218376159668, "global_step": 153497, "epoch": 3654} {"train_loss": -6.806257724761963, "global_step": 153498, "epoch": 3654} {"train_loss": -6.867888927459717, "global_step": 153499, "epoch": 3654} {"train_loss": -6.9459381103515625, "global_step": 153500, "epoch": 3654} {"train_loss": -6.96024227142334, "global_step": 153501, "epoch": 3654} {"train_loss": -7.023588180541992, "global_step": 153502, "epoch": 3654} {"train_loss": -6.954482078552246, "global_step": 153503, "epoch": 3654} {"train_loss": -6.88136100769043, "global_step": 153504, "epoch": 3654} {"train_loss": -6.867162704467773, "global_step": 153505, "epoch": 3654} {"train_loss": -6.882646560668945, "global_step": 153506, "epoch": 3654} {"train_loss": -6.869903564453125, "global_step": 153507, "epoch": 3654} {"train_loss": -6.847424030303955, "global_step": 153508, "epoch": 3654} {"train_loss": -6.875301111312139, "global_step": 153509, "epoch": 3654, "val_loss": 68277.1875} {"train_loss": -6.846408843994141, "global_step": 153510, "epoch": 3655} {"train_loss": -6.811022758483887, "global_step": 153511, "epoch": 3655} {"train_loss": -6.866894245147705, "global_step": 153512, "epoch": 3655} {"train_loss": -6.900089263916016, "global_step": 153513, "epoch": 3655} {"train_loss": -6.849180698394775, "global_step": 153514, "epoch": 3655} {"train_loss": -6.832108020782471, "global_step": 153515, "epoch": 3655} {"train_loss": -6.928322792053223, "global_step": 153516, "epoch": 3655} {"train_loss": -6.878910541534424, "global_step": 153517, "epoch": 3655} {"train_loss": -6.932553291320801, "global_step": 153518, "epoch": 3655} {"train_loss": -7.025868892669678, "global_step": 153519, "epoch": 3655} {"train_loss": -6.894037246704102, "global_step": 153520, "epoch": 3655} {"train_loss": -6.942913055419922, "global_step": 153521, "epoch": 3655} {"train_loss": -6.97645902633667, "global_step": 153522, "epoch": 3655} {"train_loss": -6.857637882232666, "global_step": 153523, "epoch": 3655} {"train_loss": -6.940412521362305, "global_step": 153524, "epoch": 3655} {"train_loss": -6.913464546203613, "global_step": 153525, "epoch": 3655} {"train_loss": -6.939589500427246, "global_step": 153526, "epoch": 3655} {"train_loss": -6.899188041687012, "global_step": 153527, "epoch": 3655} {"train_loss": -7.034167289733887, "global_step": 153528, "epoch": 3655} {"train_loss": -6.832927703857422, "global_step": 153529, "epoch": 3655} {"train_loss": -6.835762977600098, "global_step": 153530, "epoch": 3655} {"train_loss": -6.862334251403809, "global_step": 153531, "epoch": 3655} {"train_loss": -6.899045944213867, "global_step": 153532, "epoch": 3655} {"train_loss": -6.924554824829102, "global_step": 153533, "epoch": 3655} {"train_loss": -7.04293966293335, "global_step": 153534, "epoch": 3655} {"train_loss": -6.836392402648926, "global_step": 153535, "epoch": 3655} {"train_loss": -6.816944122314453, "global_step": 153536, "epoch": 3655} {"train_loss": -6.924822807312012, "global_step": 153537, "epoch": 3655} {"train_loss": -6.915366172790527, "global_step": 153538, "epoch": 3655} {"train_loss": -6.827409744262695, "global_step": 153539, "epoch": 3655} {"train_loss": -6.938745498657227, "global_step": 153540, "epoch": 3655} {"train_loss": -6.74874210357666, "global_step": 153541, "epoch": 3655} {"train_loss": -6.816196441650391, "global_step": 153542, "epoch": 3655} {"train_loss": -6.88454532623291, "global_step": 153543, "epoch": 3655} {"train_loss": -6.8228373527526855, "global_step": 153544, "epoch": 3655} {"train_loss": -6.814990043640137, "global_step": 153545, "epoch": 3655} {"train_loss": -6.92368745803833, "global_step": 153546, "epoch": 3655} {"train_loss": -6.90315580368042, "global_step": 153547, "epoch": 3655} {"train_loss": -6.985410213470459, "global_step": 153548, "epoch": 3655} {"train_loss": -6.847023010253906, "global_step": 153549, "epoch": 3655} {"train_loss": -6.872375965118408, "global_step": 153550, "epoch": 3655} {"train_loss": -6.894037076405117, "global_step": 153551, "epoch": 3655, "val_loss": 68058.53125} {"train_loss": -6.8369903564453125, "global_step": 153552, "epoch": 3656} {"train_loss": -6.934526443481445, "global_step": 153553, "epoch": 3656} {"train_loss": -6.916101455688477, "global_step": 153554, "epoch": 3656} {"train_loss": -6.965801239013672, "global_step": 153555, "epoch": 3656} {"train_loss": -6.812882423400879, "global_step": 153556, "epoch": 3656} {"train_loss": -6.872710227966309, "global_step": 153557, "epoch": 3656} {"train_loss": -6.906360626220703, "global_step": 153558, "epoch": 3656} {"train_loss": -6.863985538482666, "global_step": 153559, "epoch": 3656} {"train_loss": -6.869248867034912, "global_step": 153560, "epoch": 3656} {"train_loss": -6.795647621154785, "global_step": 153561, "epoch": 3656} {"train_loss": -6.76777982711792, "global_step": 153562, "epoch": 3656} {"train_loss": -6.87800407409668, "global_step": 153563, "epoch": 3656} {"train_loss": -6.848067760467529, "global_step": 153564, "epoch": 3656} {"train_loss": -6.9301042556762695, "global_step": 153565, "epoch": 3656} {"train_loss": -6.903261184692383, "global_step": 153566, "epoch": 3656} {"train_loss": -6.757201194763184, "global_step": 153567, "epoch": 3656} {"train_loss": -6.907427787780762, "global_step": 153568, "epoch": 3656} {"train_loss": -6.829498291015625, "global_step": 153569, "epoch": 3656} {"train_loss": -6.908580780029297, "global_step": 153570, "epoch": 3656} {"train_loss": -6.79437255859375, "global_step": 153571, "epoch": 3656} {"train_loss": -6.89848518371582, "global_step": 153572, "epoch": 3656} {"train_loss": -6.907293796539307, "global_step": 153573, "epoch": 3656} {"train_loss": -6.874131679534912, "global_step": 153574, "epoch": 3656} {"train_loss": -6.9742350578308105, "global_step": 153575, "epoch": 3656} {"train_loss": -6.876770496368408, "global_step": 153576, "epoch": 3656} {"train_loss": -6.853409767150879, "global_step": 153577, "epoch": 3656} {"train_loss": -6.874933242797852, "global_step": 153578, "epoch": 3656} {"train_loss": -6.898332595825195, "global_step": 153579, "epoch": 3656} {"train_loss": -6.8356475830078125, "global_step": 153580, "epoch": 3656} {"train_loss": -6.814725875854492, "global_step": 153581, "epoch": 3656} {"train_loss": -6.926424503326416, "global_step": 153582, "epoch": 3656} {"train_loss": -6.791226863861084, "global_step": 153583, "epoch": 3656} {"train_loss": -6.868976593017578, "global_step": 153584, "epoch": 3656} {"train_loss": -6.91799259185791, "global_step": 153585, "epoch": 3656} {"train_loss": -6.846932411193848, "global_step": 153586, "epoch": 3656} {"train_loss": -6.781774520874023, "global_step": 153587, "epoch": 3656} {"train_loss": -6.8151326179504395, "global_step": 153588, "epoch": 3656} {"train_loss": -6.89364767074585, "global_step": 153589, "epoch": 3656} {"train_loss": -6.917007923126221, "global_step": 153590, "epoch": 3656} {"train_loss": -6.930501461029053, "global_step": 153591, "epoch": 3656} {"train_loss": -6.9167375564575195, "global_step": 153592, "epoch": 3656} {"train_loss": -6.87024940763201, "global_step": 153593, "epoch": 3656, "val_loss": 68106.90625} {"train_loss": -6.947326183319092, "global_step": 153594, "epoch": 3657} {"train_loss": -6.893509864807129, "global_step": 153595, "epoch": 3657} {"train_loss": -6.8547682762146, "global_step": 153596, "epoch": 3657} {"train_loss": -6.894024848937988, "global_step": 153597, "epoch": 3657} {"train_loss": -6.877254009246826, "global_step": 153598, "epoch": 3657} {"train_loss": -6.989843845367432, "global_step": 153599, "epoch": 3657} {"train_loss": -6.828742980957031, "global_step": 153600, "epoch": 3657} {"train_loss": -6.849590301513672, "global_step": 153601, "epoch": 3657} {"train_loss": -6.803169250488281, "global_step": 153602, "epoch": 3657} {"train_loss": -6.864673137664795, "global_step": 153603, "epoch": 3657} {"train_loss": -6.757195949554443, "global_step": 153604, "epoch": 3657} {"train_loss": -6.826141357421875, "global_step": 153605, "epoch": 3657} {"train_loss": -6.90641975402832, "global_step": 153606, "epoch": 3657} {"train_loss": -6.780048847198486, "global_step": 153607, "epoch": 3657} {"train_loss": -6.874604225158691, "global_step": 153608, "epoch": 3657} {"train_loss": -6.95390510559082, "global_step": 153609, "epoch": 3657} {"train_loss": -6.758364677429199, "global_step": 153610, "epoch": 3657} {"train_loss": -6.93881893157959, "global_step": 153611, "epoch": 3657} {"train_loss": -6.851739406585693, "global_step": 153612, "epoch": 3657} {"train_loss": -6.844669342041016, "global_step": 153613, "epoch": 3657} {"train_loss": -6.915032863616943, "global_step": 153614, "epoch": 3657} {"train_loss": -6.77995491027832, "global_step": 153615, "epoch": 3657} {"train_loss": -6.781288146972656, "global_step": 153616, "epoch": 3657} {"train_loss": -6.991301536560059, "global_step": 153617, "epoch": 3657} {"train_loss": -6.864635467529297, "global_step": 153618, "epoch": 3657} {"train_loss": -6.982549667358398, "global_step": 153619, "epoch": 3657} {"train_loss": -6.888644695281982, "global_step": 153620, "epoch": 3657} {"train_loss": -6.825194358825684, "global_step": 153621, "epoch": 3657} {"train_loss": -6.876034259796143, "global_step": 153622, "epoch": 3657} {"train_loss": -6.833683013916016, "global_step": 153623, "epoch": 3657} {"train_loss": -6.883918762207031, "global_step": 153624, "epoch": 3657} {"train_loss": -6.877139091491699, "global_step": 153625, "epoch": 3657} {"train_loss": -6.945894718170166, "global_step": 153626, "epoch": 3657} {"train_loss": -6.965758800506592, "global_step": 153627, "epoch": 3657} {"train_loss": -6.859461307525635, "global_step": 153628, "epoch": 3657} {"train_loss": -6.919760704040527, "global_step": 153629, "epoch": 3657} {"train_loss": -6.977364540100098, "global_step": 153630, "epoch": 3657} {"train_loss": -6.889391899108887, "global_step": 153631, "epoch": 3657} {"train_loss": -6.969325542449951, "global_step": 153632, "epoch": 3657} {"train_loss": -6.930144309997559, "global_step": 153633, "epoch": 3657} {"train_loss": -6.918542861938477, "global_step": 153634, "epoch": 3657} {"train_loss": -6.883301031021845, "global_step": 153635, "epoch": 3657, "val_loss": 68071.7578125} {"train_loss": -6.906809329986572, "global_step": 153636, "epoch": 3658} {"train_loss": -6.877396583557129, "global_step": 153637, "epoch": 3658} {"train_loss": -6.775800704956055, "global_step": 153638, "epoch": 3658} {"train_loss": -6.886551856994629, "global_step": 153639, "epoch": 3658} {"train_loss": -7.000006675720215, "global_step": 153640, "epoch": 3658} {"train_loss": -6.979074478149414, "global_step": 153641, "epoch": 3658} {"train_loss": -6.908205986022949, "global_step": 153642, "epoch": 3658} {"train_loss": -6.854620933532715, "global_step": 153643, "epoch": 3658} {"train_loss": -6.904181480407715, "global_step": 153644, "epoch": 3658} {"train_loss": -7.06068229675293, "global_step": 153645, "epoch": 3658} {"train_loss": -6.876483917236328, "global_step": 153646, "epoch": 3658} {"train_loss": -6.832294464111328, "global_step": 153647, "epoch": 3658} {"train_loss": -6.948011875152588, "global_step": 153648, "epoch": 3658} {"train_loss": -6.8680267333984375, "global_step": 153649, "epoch": 3658} {"train_loss": -6.899585723876953, "global_step": 153650, "epoch": 3658} {"train_loss": -6.928073406219482, "global_step": 153651, "epoch": 3658} {"train_loss": -6.9045000076293945, "global_step": 153652, "epoch": 3658} {"train_loss": -7.009913921356201, "global_step": 153653, "epoch": 3658} {"train_loss": -6.91748046875, "global_step": 153654, "epoch": 3658} {"train_loss": -6.981069564819336, "global_step": 153655, "epoch": 3658} {"train_loss": -6.882076263427734, "global_step": 153656, "epoch": 3658} {"train_loss": -6.959371566772461, "global_step": 153657, "epoch": 3658} {"train_loss": -7.026416778564453, "global_step": 153658, "epoch": 3658} {"train_loss": -6.890142440795898, "global_step": 153659, "epoch": 3658} {"train_loss": -6.900603294372559, "global_step": 153660, "epoch": 3658} {"train_loss": -6.896650791168213, "global_step": 153661, "epoch": 3658} {"train_loss": -6.969127655029297, "global_step": 153662, "epoch": 3658} {"train_loss": -6.779852867126465, "global_step": 153663, "epoch": 3658} {"train_loss": -6.99925422668457, "global_step": 153664, "epoch": 3658} {"train_loss": -6.840142250061035, "global_step": 153665, "epoch": 3658} {"train_loss": -6.727816581726074, "global_step": 153666, "epoch": 3658} {"train_loss": -6.9668474197387695, "global_step": 153667, "epoch": 3658} {"train_loss": -6.901122093200684, "global_step": 153668, "epoch": 3658} {"train_loss": -6.815408229827881, "global_step": 153669, "epoch": 3658} {"train_loss": -6.92960262298584, "global_step": 153670, "epoch": 3658} {"train_loss": -6.823844909667969, "global_step": 153671, "epoch": 3658} {"train_loss": -6.742026329040527, "global_step": 153672, "epoch": 3658} {"train_loss": -6.891769886016846, "global_step": 153673, "epoch": 3658} {"train_loss": -6.687907695770264, "global_step": 153674, "epoch": 3658} {"train_loss": -6.588639259338379, "global_step": 153675, "epoch": 3658} {"train_loss": -6.780254364013672, "global_step": 153676, "epoch": 3658} {"train_loss": -6.878413972400484, "global_step": 153677, "epoch": 3658, "val_loss": 68383.5703125} {"train_loss": -6.860766410827637, "global_step": 153678, "epoch": 3659} {"train_loss": -6.861537456512451, "global_step": 153679, "epoch": 3659} {"train_loss": -6.760730266571045, "global_step": 153680, "epoch": 3659} {"train_loss": -6.813207626342773, "global_step": 153681, "epoch": 3659} {"train_loss": -6.705883026123047, "global_step": 153682, "epoch": 3659} {"train_loss": -6.88491153717041, "global_step": 153683, "epoch": 3659} {"train_loss": -6.657817840576172, "global_step": 153684, "epoch": 3659} {"train_loss": -6.711606025695801, "global_step": 153685, "epoch": 3659} {"train_loss": -6.752678871154785, "global_step": 153686, "epoch": 3659} {"train_loss": -6.778613567352295, "global_step": 153687, "epoch": 3659} {"train_loss": -6.87681245803833, "global_step": 153688, "epoch": 3659} {"train_loss": -6.766118049621582, "global_step": 153689, "epoch": 3659} {"train_loss": -6.769538879394531, "global_step": 153690, "epoch": 3659} {"train_loss": -6.903540134429932, "global_step": 153691, "epoch": 3659} {"train_loss": -6.805671215057373, "global_step": 153692, "epoch": 3659} {"train_loss": -6.877469539642334, "global_step": 153693, "epoch": 3659} {"train_loss": -6.751028060913086, "global_step": 153694, "epoch": 3659} {"train_loss": -6.835224628448486, "global_step": 153695, "epoch": 3659} {"train_loss": -6.677244186401367, "global_step": 153696, "epoch": 3659} {"train_loss": -6.866501331329346, "global_step": 153697, "epoch": 3659} {"train_loss": -6.845643997192383, "global_step": 153698, "epoch": 3659} {"train_loss": -6.996552467346191, "global_step": 153699, "epoch": 3659} {"train_loss": -6.857580661773682, "global_step": 153700, "epoch": 3659} {"train_loss": -6.769883155822754, "global_step": 153701, "epoch": 3659} {"train_loss": -6.904791831970215, "global_step": 153702, "epoch": 3659} {"train_loss": -6.841459274291992, "global_step": 153703, "epoch": 3659} {"train_loss": -6.793186187744141, "global_step": 153704, "epoch": 3659} {"train_loss": -6.817008972167969, "global_step": 153705, "epoch": 3659} {"train_loss": -6.915678977966309, "global_step": 153706, "epoch": 3659} {"train_loss": -6.947393417358398, "global_step": 153707, "epoch": 3659} {"train_loss": -6.84242057800293, "global_step": 153708, "epoch": 3659} {"train_loss": -6.803772449493408, "global_step": 153709, "epoch": 3659} {"train_loss": -6.857783794403076, "global_step": 153710, "epoch": 3659} {"train_loss": -6.9184160232543945, "global_step": 153711, "epoch": 3659} {"train_loss": -6.890679359436035, "global_step": 153712, "epoch": 3659} {"train_loss": -6.865275859832764, "global_step": 153713, "epoch": 3659} {"train_loss": -6.969795227050781, "global_step": 153714, "epoch": 3659} {"train_loss": -6.963093280792236, "global_step": 153715, "epoch": 3659} {"train_loss": -6.822638034820557, "global_step": 153716, "epoch": 3659} {"train_loss": -6.93231201171875, "global_step": 153717, "epoch": 3659} {"train_loss": -6.883801460266113, "global_step": 153718, "epoch": 3659} {"train_loss": -6.841450713929676, "global_step": 153719, "epoch": 3659, "val_loss": 68120.09375} {"train_loss": -6.904295921325684, "global_step": 153720, "epoch": 3660} {"train_loss": -6.956871032714844, "global_step": 153721, "epoch": 3660} {"train_loss": -6.910792350769043, "global_step": 153722, "epoch": 3660} {"train_loss": -6.834023952484131, "global_step": 153723, "epoch": 3660} {"train_loss": -6.9123334884643555, "global_step": 153724, "epoch": 3660} {"train_loss": -6.890780448913574, "global_step": 153725, "epoch": 3660} {"train_loss": -6.952489852905273, "global_step": 153726, "epoch": 3660} {"train_loss": -7.022444248199463, "global_step": 153727, "epoch": 3660} {"train_loss": -6.863613128662109, "global_step": 153728, "epoch": 3660} {"train_loss": -6.959430694580078, "global_step": 153729, "epoch": 3660} {"train_loss": -6.7912139892578125, "global_step": 153730, "epoch": 3660} {"train_loss": -6.958612442016602, "global_step": 153731, "epoch": 3660} {"train_loss": -6.889941215515137, "global_step": 153732, "epoch": 3660} {"train_loss": -6.956418037414551, "global_step": 153733, "epoch": 3660} {"train_loss": -6.9370198249816895, "global_step": 153734, "epoch": 3660} {"train_loss": -6.898570537567139, "global_step": 153735, "epoch": 3660} {"train_loss": -6.807923316955566, "global_step": 153736, "epoch": 3660} {"train_loss": -6.783060073852539, "global_step": 153737, "epoch": 3660} {"train_loss": -7.047502517700195, "global_step": 153738, "epoch": 3660} {"train_loss": -6.769047737121582, "global_step": 153739, "epoch": 3660} {"train_loss": -7.040815353393555, "global_step": 153740, "epoch": 3660} {"train_loss": -6.925395488739014, "global_step": 153741, "epoch": 3660} {"train_loss": -6.813892364501953, "global_step": 153742, "epoch": 3660} {"train_loss": -6.892803192138672, "global_step": 153743, "epoch": 3660} {"train_loss": -6.892242908477783, "global_step": 153744, "epoch": 3660} {"train_loss": -6.929116249084473, "global_step": 153745, "epoch": 3660} {"train_loss": -6.922677040100098, "global_step": 153746, "epoch": 3660} {"train_loss": -6.964331150054932, "global_step": 153747, "epoch": 3660} {"train_loss": -6.964094638824463, "global_step": 153748, "epoch": 3660} {"train_loss": -7.000477313995361, "global_step": 153749, "epoch": 3660} {"train_loss": -6.910097122192383, "global_step": 153750, "epoch": 3660} {"train_loss": -6.900388717651367, "global_step": 153751, "epoch": 3660} {"train_loss": -6.88170862197876, "global_step": 153752, "epoch": 3660} {"train_loss": -6.916757583618164, "global_step": 153753, "epoch": 3660} {"train_loss": -7.045138359069824, "global_step": 153754, "epoch": 3660} {"train_loss": -6.915098190307617, "global_step": 153755, "epoch": 3660} {"train_loss": -6.8484697341918945, "global_step": 153756, "epoch": 3660} {"train_loss": -7.037277698516846, "global_step": 153757, "epoch": 3660} {"train_loss": -6.763518333435059, "global_step": 153758, "epoch": 3660} {"train_loss": -6.87154483795166, "global_step": 153759, "epoch": 3660} {"train_loss": -7.005317211151123, "global_step": 153760, "epoch": 3660} {"train_loss": -6.91692194484529, "global_step": 153761, "epoch": 3660, "val_loss": 68353.1015625} {"train_loss": -6.899791717529297, "global_step": 153762, "epoch": 3661} {"train_loss": -6.8701653480529785, "global_step": 153763, "epoch": 3661} {"train_loss": -6.9524688720703125, "global_step": 153764, "epoch": 3661} {"train_loss": -6.925562858581543, "global_step": 153765, "epoch": 3661} {"train_loss": -6.896439552307129, "global_step": 153766, "epoch": 3661} {"train_loss": -6.989569664001465, "global_step": 153767, "epoch": 3661} {"train_loss": -6.947469711303711, "global_step": 153768, "epoch": 3661} {"train_loss": -6.946800708770752, "global_step": 153769, "epoch": 3661} {"train_loss": -7.024079322814941, "global_step": 153770, "epoch": 3661} {"train_loss": -6.984524250030518, "global_step": 153771, "epoch": 3661} {"train_loss": -6.950743198394775, "global_step": 153772, "epoch": 3661} {"train_loss": -6.994658470153809, "global_step": 153773, "epoch": 3661} {"train_loss": -6.811962127685547, "global_step": 153774, "epoch": 3661} {"train_loss": -6.843264579772949, "global_step": 153775, "epoch": 3661} {"train_loss": -6.847555160522461, "global_step": 153776, "epoch": 3661} {"train_loss": -6.809682846069336, "global_step": 153777, "epoch": 3661} {"train_loss": -6.88533878326416, "global_step": 153778, "epoch": 3661} {"train_loss": -6.717594146728516, "global_step": 153779, "epoch": 3661} {"train_loss": -6.911020278930664, "global_step": 153780, "epoch": 3661} {"train_loss": -6.735257148742676, "global_step": 153781, "epoch": 3661} {"train_loss": -6.909996032714844, "global_step": 153782, "epoch": 3661} {"train_loss": -6.863290309906006, "global_step": 153783, "epoch": 3661} {"train_loss": -6.756036281585693, "global_step": 153784, "epoch": 3661} {"train_loss": -6.843506813049316, "global_step": 153785, "epoch": 3661} {"train_loss": -6.818226337432861, "global_step": 153786, "epoch": 3661} {"train_loss": -6.862181663513184, "global_step": 153787, "epoch": 3661} {"train_loss": -6.7246599197387695, "global_step": 153788, "epoch": 3661} {"train_loss": -6.915521144866943, "global_step": 153789, "epoch": 3661} {"train_loss": -6.832359790802002, "global_step": 153790, "epoch": 3661} {"train_loss": -6.825981140136719, "global_step": 153791, "epoch": 3661} {"train_loss": -6.903318405151367, "global_step": 153792, "epoch": 3661} {"train_loss": -6.8694610595703125, "global_step": 153793, "epoch": 3661} {"train_loss": -6.789937973022461, "global_step": 153794, "epoch": 3661} {"train_loss": -6.668886184692383, "global_step": 153795, "epoch": 3661} {"train_loss": -6.827489376068115, "global_step": 153796, "epoch": 3661} {"train_loss": -6.858663558959961, "global_step": 153797, "epoch": 3661} {"train_loss": -6.902586936950684, "global_step": 153798, "epoch": 3661} {"train_loss": -6.857590675354004, "global_step": 153799, "epoch": 3661} {"train_loss": -6.947373867034912, "global_step": 153800, "epoch": 3661} {"train_loss": -6.931924343109131, "global_step": 153801, "epoch": 3661} {"train_loss": -6.902516841888428, "global_step": 153802, "epoch": 3661} {"train_loss": -6.8719182922726585, "global_step": 153803, "epoch": 3661, "val_loss": 68291.9375} {"train_loss": -6.870270729064941, "global_step": 153804, "epoch": 3662} {"train_loss": -6.852240562438965, "global_step": 153805, "epoch": 3662} {"train_loss": -6.90904426574707, "global_step": 153806, "epoch": 3662} {"train_loss": -6.907839775085449, "global_step": 153807, "epoch": 3662} {"train_loss": -6.937747001647949, "global_step": 153808, "epoch": 3662} {"train_loss": -6.9254279136657715, "global_step": 153809, "epoch": 3662} {"train_loss": -6.79853630065918, "global_step": 153810, "epoch": 3662} {"train_loss": -6.914121627807617, "global_step": 153811, "epoch": 3662} {"train_loss": -6.894290447235107, "global_step": 153812, "epoch": 3662} {"train_loss": -6.869712829589844, "global_step": 153813, "epoch": 3662} {"train_loss": -6.90162467956543, "global_step": 153814, "epoch": 3662} {"train_loss": -6.942712306976318, "global_step": 153815, "epoch": 3662} {"train_loss": -6.8695759773254395, "global_step": 153816, "epoch": 3662} {"train_loss": -6.962006568908691, "global_step": 153817, "epoch": 3662} {"train_loss": -6.861634254455566, "global_step": 153818, "epoch": 3662} {"train_loss": -6.891515254974365, "global_step": 153819, "epoch": 3662} {"train_loss": -6.960636138916016, "global_step": 153820, "epoch": 3662} {"train_loss": -6.809714317321777, "global_step": 153821, "epoch": 3662} {"train_loss": -6.831683158874512, "global_step": 153822, "epoch": 3662} {"train_loss": -6.925165176391602, "global_step": 153823, "epoch": 3662} {"train_loss": -6.891942024230957, "global_step": 153824, "epoch": 3662} {"train_loss": -6.878900527954102, "global_step": 153825, "epoch": 3662} {"train_loss": -6.880283832550049, "global_step": 153826, "epoch": 3662} {"train_loss": -6.9000420570373535, "global_step": 153827, "epoch": 3662} {"train_loss": -6.94437837600708, "global_step": 153828, "epoch": 3662} {"train_loss": -6.982977390289307, "global_step": 153829, "epoch": 3662} {"train_loss": -6.924319267272949, "global_step": 153830, "epoch": 3662} {"train_loss": -6.8456268310546875, "global_step": 153831, "epoch": 3662} {"train_loss": -6.923527717590332, "global_step": 153832, "epoch": 3662} {"train_loss": -6.894037246704102, "global_step": 153833, "epoch": 3662} {"train_loss": -6.954479217529297, "global_step": 153834, "epoch": 3662} {"train_loss": -6.867345809936523, "global_step": 153835, "epoch": 3662} {"train_loss": -6.902747631072998, "global_step": 153836, "epoch": 3662} {"train_loss": -6.888971328735352, "global_step": 153837, "epoch": 3662} {"train_loss": -6.895552635192871, "global_step": 153838, "epoch": 3662} {"train_loss": -7.035916328430176, "global_step": 153839, "epoch": 3662} {"train_loss": -6.837286472320557, "global_step": 153840, "epoch": 3662} {"train_loss": -6.926739692687988, "global_step": 153841, "epoch": 3662} {"train_loss": -7.007228851318359, "global_step": 153842, "epoch": 3662} {"train_loss": -6.888545513153076, "global_step": 153843, "epoch": 3662} {"train_loss": -6.983827590942383, "global_step": 153844, "epoch": 3662} {"train_loss": -6.906396298181443, "global_step": 153845, "epoch": 3662, "val_loss": 68277.7578125} {"train_loss": -6.845678329467773, "global_step": 153846, "epoch": 3663} {"train_loss": -6.798388481140137, "global_step": 153847, "epoch": 3663} {"train_loss": -6.796648979187012, "global_step": 153848, "epoch": 3663} {"train_loss": -6.7804765701293945, "global_step": 153849, "epoch": 3663} {"train_loss": -6.943739891052246, "global_step": 153850, "epoch": 3663} {"train_loss": -6.7582502365112305, "global_step": 153851, "epoch": 3663} {"train_loss": -6.6885857582092285, "global_step": 153852, "epoch": 3663} {"train_loss": -6.909029006958008, "global_step": 153853, "epoch": 3663} {"train_loss": -6.805275917053223, "global_step": 153854, "epoch": 3663} {"train_loss": -6.851595878601074, "global_step": 153855, "epoch": 3663} {"train_loss": -6.885924339294434, "global_step": 153856, "epoch": 3663} {"train_loss": -6.768353462219238, "global_step": 153857, "epoch": 3663} {"train_loss": -6.863546848297119, "global_step": 153858, "epoch": 3663} {"train_loss": -6.642833709716797, "global_step": 153859, "epoch": 3663} {"train_loss": -6.864595413208008, "global_step": 153860, "epoch": 3663} {"train_loss": -6.753846168518066, "global_step": 153861, "epoch": 3663} {"train_loss": -6.749167442321777, "global_step": 153862, "epoch": 3663} {"train_loss": -6.676812171936035, "global_step": 153863, "epoch": 3663} {"train_loss": -6.871921539306641, "global_step": 153864, "epoch": 3663} {"train_loss": -6.659370422363281, "global_step": 153865, "epoch": 3663} {"train_loss": -6.869009494781494, "global_step": 153866, "epoch": 3663} {"train_loss": -6.811004161834717, "global_step": 153867, "epoch": 3663} {"train_loss": -6.904177665710449, "global_step": 153868, "epoch": 3663} {"train_loss": -6.723719596862793, "global_step": 153869, "epoch": 3663} {"train_loss": -6.867383003234863, "global_step": 153870, "epoch": 3663} {"train_loss": -6.698278427124023, "global_step": 153871, "epoch": 3663} {"train_loss": -6.851987361907959, "global_step": 153872, "epoch": 3663} {"train_loss": -6.90362548828125, "global_step": 153873, "epoch": 3663} {"train_loss": -6.949972152709961, "global_step": 153874, "epoch": 3663} {"train_loss": -6.840112209320068, "global_step": 153875, "epoch": 3663} {"train_loss": -6.9675374031066895, "global_step": 153876, "epoch": 3663} {"train_loss": -6.833628177642822, "global_step": 153877, "epoch": 3663} {"train_loss": -6.832086086273193, "global_step": 153878, "epoch": 3663} {"train_loss": -6.808866024017334, "global_step": 153879, "epoch": 3663} {"train_loss": -6.735834121704102, "global_step": 153880, "epoch": 3663} {"train_loss": -6.924391746520996, "global_step": 153881, "epoch": 3663} {"train_loss": -6.828821182250977, "global_step": 153882, "epoch": 3663} {"train_loss": -6.86905574798584, "global_step": 153883, "epoch": 3663} {"train_loss": -6.719161510467529, "global_step": 153884, "epoch": 3663} {"train_loss": -6.9820237159729, "global_step": 153885, "epoch": 3663} {"train_loss": -6.8074727058410645, "global_step": 153886, "epoch": 3663} {"train_loss": -6.818789050692604, "global_step": 153887, "epoch": 3663, "val_loss": 68367.1796875} {"train_loss": -6.8446364402771, "global_step": 153888, "epoch": 3664} {"train_loss": -6.807122707366943, "global_step": 153889, "epoch": 3664} {"train_loss": -6.8881988525390625, "global_step": 153890, "epoch": 3664} {"train_loss": -6.703669548034668, "global_step": 153891, "epoch": 3664} {"train_loss": -6.8969011306762695, "global_step": 153892, "epoch": 3664} {"train_loss": -6.9526801109313965, "global_step": 153893, "epoch": 3664} {"train_loss": -6.924769401550293, "global_step": 153894, "epoch": 3664} {"train_loss": -6.756689071655273, "global_step": 153895, "epoch": 3664} {"train_loss": -6.838508605957031, "global_step": 153896, "epoch": 3664} {"train_loss": -6.808444976806641, "global_step": 153897, "epoch": 3664} {"train_loss": -6.898454666137695, "global_step": 153898, "epoch": 3664} {"train_loss": -6.835905075073242, "global_step": 153899, "epoch": 3664} {"train_loss": -6.8158769607543945, "global_step": 153900, "epoch": 3664} {"train_loss": -6.847640037536621, "global_step": 153901, "epoch": 3664} {"train_loss": -6.745892524719238, "global_step": 153902, "epoch": 3664} {"train_loss": -6.901352882385254, "global_step": 153903, "epoch": 3664} {"train_loss": -6.923259735107422, "global_step": 153904, "epoch": 3664} {"train_loss": -6.85931396484375, "global_step": 153905, "epoch": 3664} {"train_loss": -6.814581871032715, "global_step": 153906, "epoch": 3664} {"train_loss": -6.8870697021484375, "global_step": 153907, "epoch": 3664} {"train_loss": -6.94176721572876, "global_step": 153908, "epoch": 3664} {"train_loss": -6.815103530883789, "global_step": 153909, "epoch": 3664} {"train_loss": -6.854033470153809, "global_step": 153910, "epoch": 3664} {"train_loss": -6.9732584953308105, "global_step": 153911, "epoch": 3664} {"train_loss": -6.800779819488525, "global_step": 153912, "epoch": 3664} {"train_loss": -6.885691165924072, "global_step": 153913, "epoch": 3664} {"train_loss": -6.912610054016113, "global_step": 153914, "epoch": 3664} {"train_loss": -6.947286128997803, "global_step": 153915, "epoch": 3664} {"train_loss": -6.879511833190918, "global_step": 153916, "epoch": 3664} {"train_loss": -6.836161136627197, "global_step": 153917, "epoch": 3664} {"train_loss": -6.892169952392578, "global_step": 153918, "epoch": 3664} {"train_loss": -7.014858722686768, "global_step": 153919, "epoch": 3664} {"train_loss": -6.894410133361816, "global_step": 153920, "epoch": 3664} {"train_loss": -6.812790870666504, "global_step": 153921, "epoch": 3664} {"train_loss": -7.021771430969238, "global_step": 153922, "epoch": 3664} {"train_loss": -6.898184776306152, "global_step": 153923, "epoch": 3664} {"train_loss": -6.902956485748291, "global_step": 153924, "epoch": 3664} {"train_loss": -6.930014610290527, "global_step": 153925, "epoch": 3664} {"train_loss": -6.876558303833008, "global_step": 153926, "epoch": 3664} {"train_loss": -6.972827911376953, "global_step": 153927, "epoch": 3664} {"train_loss": -6.899874687194824, "global_step": 153928, "epoch": 3664} {"train_loss": -6.875760543914068, "global_step": 153929, "epoch": 3664, "val_loss": 68040.9375} {"train_loss": -7.000826358795166, "global_step": 153930, "epoch": 3665} {"train_loss": -6.927532196044922, "global_step": 153931, "epoch": 3665} {"train_loss": -6.949563980102539, "global_step": 153932, "epoch": 3665} {"train_loss": -6.992608070373535, "global_step": 153933, "epoch": 3665} {"train_loss": -6.926596641540527, "global_step": 153934, "epoch": 3665} {"train_loss": -6.9267072677612305, "global_step": 153935, "epoch": 3665} {"train_loss": -6.988341331481934, "global_step": 153936, "epoch": 3665} {"train_loss": -6.867269039154053, "global_step": 153937, "epoch": 3665} {"train_loss": -6.894827365875244, "global_step": 153938, "epoch": 3665} {"train_loss": -6.834038734436035, "global_step": 153939, "epoch": 3665} {"train_loss": -6.99862003326416, "global_step": 153940, "epoch": 3665} {"train_loss": -6.901004314422607, "global_step": 153941, "epoch": 3665} {"train_loss": -6.912437438964844, "global_step": 153942, "epoch": 3665} {"train_loss": -6.960177421569824, "global_step": 153943, "epoch": 3665} {"train_loss": -6.780850410461426, "global_step": 153944, "epoch": 3665} {"train_loss": -6.757942199707031, "global_step": 153945, "epoch": 3665} {"train_loss": -6.832913398742676, "global_step": 153946, "epoch": 3665} {"train_loss": -6.905661582946777, "global_step": 153947, "epoch": 3665} {"train_loss": -6.930830001831055, "global_step": 153948, "epoch": 3665} {"train_loss": -6.887513160705566, "global_step": 153949, "epoch": 3665} {"train_loss": -7.029027938842773, "global_step": 153950, "epoch": 3665} {"train_loss": -6.952244758605957, "global_step": 153951, "epoch": 3665} {"train_loss": -6.967972755432129, "global_step": 153952, "epoch": 3665} {"train_loss": -6.990339756011963, "global_step": 153953, "epoch": 3665} {"train_loss": -6.889852046966553, "global_step": 153954, "epoch": 3665} {"train_loss": -6.976295471191406, "global_step": 153955, "epoch": 3665} {"train_loss": -6.917369842529297, "global_step": 153956, "epoch": 3665} {"train_loss": -7.113668441772461, "global_step": 153957, "epoch": 3665} {"train_loss": -6.820285797119141, "global_step": 153958, "epoch": 3665} {"train_loss": -6.928828239440918, "global_step": 153959, "epoch": 3665} {"train_loss": -6.937459945678711, "global_step": 153960, "epoch": 3665} {"train_loss": -6.835629463195801, "global_step": 153961, "epoch": 3665} {"train_loss": -6.9308061599731445, "global_step": 153962, "epoch": 3665} {"train_loss": -6.961028099060059, "global_step": 153963, "epoch": 3665} {"train_loss": -6.699694633483887, "global_step": 153964, "epoch": 3665} {"train_loss": -6.782248497009277, "global_step": 153965, "epoch": 3665} {"train_loss": -6.9208550453186035, "global_step": 153966, "epoch": 3665} {"train_loss": -6.904850006103516, "global_step": 153967, "epoch": 3665} {"train_loss": -6.863995552062988, "global_step": 153968, "epoch": 3665} {"train_loss": -6.942593574523926, "global_step": 153969, "epoch": 3665} {"train_loss": -6.892964839935303, "global_step": 153970, "epoch": 3665} {"train_loss": -6.914051112674532, "global_step": 153971, "epoch": 3665, "val_loss": 68273.4921875} {"train_loss": -6.752650737762451, "global_step": 153972, "epoch": 3666} {"train_loss": -6.840357780456543, "global_step": 153973, "epoch": 3666} {"train_loss": -6.8912882804870605, "global_step": 153974, "epoch": 3666} {"train_loss": -6.782290458679199, "global_step": 153975, "epoch": 3666} {"train_loss": -6.85953426361084, "global_step": 153976, "epoch": 3666} {"train_loss": -6.927837371826172, "global_step": 153977, "epoch": 3666} {"train_loss": -6.84349250793457, "global_step": 153978, "epoch": 3666} {"train_loss": -6.783477783203125, "global_step": 153979, "epoch": 3666} {"train_loss": -6.914126396179199, "global_step": 153980, "epoch": 3666} {"train_loss": -6.920176982879639, "global_step": 153981, "epoch": 3666} {"train_loss": -6.888718128204346, "global_step": 153982, "epoch": 3666} {"train_loss": -6.866958141326904, "global_step": 153983, "epoch": 3666} {"train_loss": -6.814154624938965, "global_step": 153984, "epoch": 3666} {"train_loss": -6.916110038757324, "global_step": 153985, "epoch": 3666} {"train_loss": -6.917673587799072, "global_step": 153986, "epoch": 3666} {"train_loss": -7.016098976135254, "global_step": 153987, "epoch": 3666} {"train_loss": -6.886043548583984, "global_step": 153988, "epoch": 3666} {"train_loss": -6.892446517944336, "global_step": 153989, "epoch": 3666} {"train_loss": -6.883664131164551, "global_step": 153990, "epoch": 3666} {"train_loss": -6.828350067138672, "global_step": 153991, "epoch": 3666} {"train_loss": -7.03201961517334, "global_step": 153992, "epoch": 3666} {"train_loss": -6.931989669799805, "global_step": 153993, "epoch": 3666} {"train_loss": -6.9064788818359375, "global_step": 153994, "epoch": 3666} {"train_loss": -6.915144443511963, "global_step": 153995, "epoch": 3666} {"train_loss": -7.011082649230957, "global_step": 153996, "epoch": 3666} {"train_loss": -6.973670959472656, "global_step": 153997, "epoch": 3666} {"train_loss": -6.853817939758301, "global_step": 153998, "epoch": 3666} {"train_loss": -6.917156219482422, "global_step": 153999, "epoch": 3666} {"train_loss": -7.03240442276001, "global_step": 154000, "epoch": 3666} {"train_loss": -6.881879806518555, "global_step": 154001, "epoch": 3666} {"train_loss": -6.901668071746826, "global_step": 154002, "epoch": 3666} {"train_loss": -7.007626533508301, "global_step": 154003, "epoch": 3666} {"train_loss": -7.065258979797363, "global_step": 154004, "epoch": 3666} {"train_loss": -6.942107200622559, "global_step": 154005, "epoch": 3666} {"train_loss": -6.8610968589782715, "global_step": 154006, "epoch": 3666} {"train_loss": -7.007978439331055, "global_step": 154007, "epoch": 3666} {"train_loss": -6.991252899169922, "global_step": 154008, "epoch": 3666} {"train_loss": -6.939483642578125, "global_step": 154009, "epoch": 3666} {"train_loss": -6.95467472076416, "global_step": 154010, "epoch": 3666} {"train_loss": -6.7908759117126465, "global_step": 154011, "epoch": 3666} {"train_loss": -6.906939506530762, "global_step": 154012, "epoch": 3666} {"train_loss": -6.90995158467974, "global_step": 154013, "epoch": 3666, "val_loss": 68271.1953125} {"train_loss": -6.857813835144043, "global_step": 154014, "epoch": 3667} {"train_loss": -6.815074920654297, "global_step": 154015, "epoch": 3667} {"train_loss": -6.8464179039001465, "global_step": 154016, "epoch": 3667} {"train_loss": -6.978494644165039, "global_step": 154017, "epoch": 3667} {"train_loss": -6.962745189666748, "global_step": 154018, "epoch": 3667} {"train_loss": -6.983981132507324, "global_step": 154019, "epoch": 3667} {"train_loss": -6.873488903045654, "global_step": 154020, "epoch": 3667} {"train_loss": -6.952741622924805, "global_step": 154021, "epoch": 3667} {"train_loss": -6.9378557205200195, "global_step": 154022, "epoch": 3667} {"train_loss": -6.960173606872559, "global_step": 154023, "epoch": 3667} {"train_loss": -6.908503532409668, "global_step": 154024, "epoch": 3667} {"train_loss": -6.913268089294434, "global_step": 154025, "epoch": 3667} {"train_loss": -6.8424272537231445, "global_step": 154026, "epoch": 3667} {"train_loss": -6.976951599121094, "global_step": 154027, "epoch": 3667} {"train_loss": -6.8019890785217285, "global_step": 154028, "epoch": 3667} {"train_loss": -6.841419696807861, "global_step": 154029, "epoch": 3667} {"train_loss": -6.95404052734375, "global_step": 154030, "epoch": 3667} {"train_loss": -6.887297630310059, "global_step": 154031, "epoch": 3667} {"train_loss": -6.920057773590088, "global_step": 154032, "epoch": 3667} {"train_loss": -6.976797580718994, "global_step": 154033, "epoch": 3667} {"train_loss": -6.836134433746338, "global_step": 154034, "epoch": 3667} {"train_loss": -6.862704277038574, "global_step": 154035, "epoch": 3667} {"train_loss": -6.861839771270752, "global_step": 154036, "epoch": 3667} {"train_loss": -6.900308609008789, "global_step": 154037, "epoch": 3667} {"train_loss": -6.826972961425781, "global_step": 154038, "epoch": 3667} {"train_loss": -6.795838356018066, "global_step": 154039, "epoch": 3667} {"train_loss": -6.823791980743408, "global_step": 154040, "epoch": 3667} {"train_loss": -6.891881465911865, "global_step": 154041, "epoch": 3667} {"train_loss": -6.787639617919922, "global_step": 154042, "epoch": 3667} {"train_loss": -6.816655158996582, "global_step": 154043, "epoch": 3667} {"train_loss": -6.846360206604004, "global_step": 154044, "epoch": 3667} {"train_loss": -6.688899517059326, "global_step": 154045, "epoch": 3667} {"train_loss": -6.7981390953063965, "global_step": 154046, "epoch": 3667} {"train_loss": -6.693408012390137, "global_step": 154047, "epoch": 3667} {"train_loss": -6.8415913581848145, "global_step": 154048, "epoch": 3667} {"train_loss": -6.796316623687744, "global_step": 154049, "epoch": 3667} {"train_loss": -6.84127950668335, "global_step": 154050, "epoch": 3667} {"train_loss": -6.908090591430664, "global_step": 154051, "epoch": 3667} {"train_loss": -6.75513219833374, "global_step": 154052, "epoch": 3667} {"train_loss": -6.856071472167969, "global_step": 154053, "epoch": 3667} {"train_loss": -6.791559219360352, "global_step": 154054, "epoch": 3667} {"train_loss": -6.865661689213344, "global_step": 154055, "epoch": 3667, "val_loss": 68406.3125} {"train_loss": -6.730234146118164, "global_step": 154056, "epoch": 3668} {"train_loss": -6.842772960662842, "global_step": 154057, "epoch": 3668} {"train_loss": -6.684597015380859, "global_step": 154058, "epoch": 3668} {"train_loss": -6.819559097290039, "global_step": 154059, "epoch": 3668} {"train_loss": -6.8979902267456055, "global_step": 154060, "epoch": 3668} {"train_loss": -6.988491535186768, "global_step": 154061, "epoch": 3668} {"train_loss": -6.92392635345459, "global_step": 154062, "epoch": 3668} {"train_loss": -6.870996475219727, "global_step": 154063, "epoch": 3668} {"train_loss": -7.0186004638671875, "global_step": 154064, "epoch": 3668} {"train_loss": -6.854988098144531, "global_step": 154065, "epoch": 3668} {"train_loss": -6.867591857910156, "global_step": 154066, "epoch": 3668} {"train_loss": -6.892622947692871, "global_step": 154067, "epoch": 3668} {"train_loss": -6.901663780212402, "global_step": 154068, "epoch": 3668} {"train_loss": -6.925295829772949, "global_step": 154069, "epoch": 3668} {"train_loss": -6.8658246994018555, "global_step": 154070, "epoch": 3668} {"train_loss": -6.935818195343018, "global_step": 154071, "epoch": 3668} {"train_loss": -6.825835227966309, "global_step": 154072, "epoch": 3668} {"train_loss": -7.022035121917725, "global_step": 154073, "epoch": 3668} {"train_loss": -6.876086235046387, "global_step": 154074, "epoch": 3668} {"train_loss": -6.912384033203125, "global_step": 154075, "epoch": 3668} {"train_loss": -6.902246475219727, "global_step": 154076, "epoch": 3668} {"train_loss": -6.988183975219727, "global_step": 154077, "epoch": 3668} {"train_loss": -6.906047821044922, "global_step": 154078, "epoch": 3668} {"train_loss": -6.902590274810791, "global_step": 154079, "epoch": 3668} {"train_loss": -6.886384963989258, "global_step": 154080, "epoch": 3668} {"train_loss": -6.887831687927246, "global_step": 154081, "epoch": 3668} {"train_loss": -6.900975227355957, "global_step": 154082, "epoch": 3668} {"train_loss": -6.885560989379883, "global_step": 154083, "epoch": 3668} {"train_loss": -6.875575542449951, "global_step": 154084, "epoch": 3668} {"train_loss": -7.002974510192871, "global_step": 154085, "epoch": 3668} {"train_loss": -6.918905735015869, "global_step": 154086, "epoch": 3668} {"train_loss": -6.810678482055664, "global_step": 154087, "epoch": 3668} {"train_loss": -6.813175201416016, "global_step": 154088, "epoch": 3668} {"train_loss": -6.787357330322266, "global_step": 154089, "epoch": 3668} {"train_loss": -6.904068946838379, "global_step": 154090, "epoch": 3668} {"train_loss": -6.7874603271484375, "global_step": 154091, "epoch": 3668} {"train_loss": -6.931275367736816, "global_step": 154092, "epoch": 3668} {"train_loss": -6.836332321166992, "global_step": 154093, "epoch": 3668} {"train_loss": -6.860910415649414, "global_step": 154094, "epoch": 3668} {"train_loss": -6.979888916015625, "global_step": 154095, "epoch": 3668} {"train_loss": -7.020065784454346, "global_step": 154096, "epoch": 3668} {"train_loss": -6.886223736263457, "global_step": 154097, "epoch": 3668, "val_loss": 68185.109375} {"train_loss": -6.847591876983643, "global_step": 154098, "epoch": 3669} {"train_loss": -6.850811958312988, "global_step": 154099, "epoch": 3669} {"train_loss": -6.843239784240723, "global_step": 154100, "epoch": 3669} {"train_loss": -6.881985664367676, "global_step": 154101, "epoch": 3669} {"train_loss": -6.9750237464904785, "global_step": 154102, "epoch": 3669} {"train_loss": -6.875955581665039, "global_step": 154103, "epoch": 3669} {"train_loss": -6.873293876647949, "global_step": 154104, "epoch": 3669} {"train_loss": -6.955161094665527, "global_step": 154105, "epoch": 3669} {"train_loss": -6.912291526794434, "global_step": 154106, "epoch": 3669} {"train_loss": -6.976240158081055, "global_step": 154107, "epoch": 3669} {"train_loss": -6.86101770401001, "global_step": 154108, "epoch": 3669} {"train_loss": -6.816576957702637, "global_step": 154109, "epoch": 3669} {"train_loss": -6.7242536544799805, "global_step": 154110, "epoch": 3669} {"train_loss": -6.88451623916626, "global_step": 154111, "epoch": 3669} {"train_loss": -6.946982383728027, "global_step": 154112, "epoch": 3669} {"train_loss": -6.75758171081543, "global_step": 154113, "epoch": 3669} {"train_loss": -6.837751865386963, "global_step": 154114, "epoch": 3669} {"train_loss": -6.87592887878418, "global_step": 154115, "epoch": 3669} {"train_loss": -6.85585355758667, "global_step": 154116, "epoch": 3669} {"train_loss": -6.804065704345703, "global_step": 154117, "epoch": 3669} {"train_loss": -7.011934280395508, "global_step": 154118, "epoch": 3669} {"train_loss": -6.83796501159668, "global_step": 154119, "epoch": 3669} {"train_loss": -6.839728355407715, "global_step": 154120, "epoch": 3669} {"train_loss": -6.848940372467041, "global_step": 154121, "epoch": 3669} {"train_loss": -6.845216274261475, "global_step": 154122, "epoch": 3669} {"train_loss": -6.7913818359375, "global_step": 154123, "epoch": 3669} {"train_loss": -6.792442321777344, "global_step": 154124, "epoch": 3669} {"train_loss": -6.833945274353027, "global_step": 154125, "epoch": 3669} {"train_loss": -6.732151985168457, "global_step": 154126, "epoch": 3669} {"train_loss": -6.847764492034912, "global_step": 154127, "epoch": 3669} {"train_loss": -6.953127384185791, "global_step": 154128, "epoch": 3669} {"train_loss": -6.719687461853027, "global_step": 154129, "epoch": 3669} {"train_loss": -6.747587203979492, "global_step": 154130, "epoch": 3669} {"train_loss": -6.9330949783325195, "global_step": 154131, "epoch": 3669} {"train_loss": -6.864699363708496, "global_step": 154132, "epoch": 3669} {"train_loss": -6.926518440246582, "global_step": 154133, "epoch": 3669} {"train_loss": -6.824649810791016, "global_step": 154134, "epoch": 3669} {"train_loss": -6.875685691833496, "global_step": 154135, "epoch": 3669} {"train_loss": -6.865929126739502, "global_step": 154136, "epoch": 3669} {"train_loss": -6.968649387359619, "global_step": 154137, "epoch": 3669} {"train_loss": -6.845951080322266, "global_step": 154138, "epoch": 3669} {"train_loss": -6.860062758127849, "global_step": 154139, "epoch": 3669, "val_loss": 68311.125} {"train_loss": -6.88856315612793, "global_step": 154140, "epoch": 3670} {"train_loss": -6.938549995422363, "global_step": 154141, "epoch": 3670} {"train_loss": -6.856884956359863, "global_step": 154142, "epoch": 3670} {"train_loss": -6.884149551391602, "global_step": 154143, "epoch": 3670} {"train_loss": -6.92718505859375, "global_step": 154144, "epoch": 3670} {"train_loss": -6.939621448516846, "global_step": 154145, "epoch": 3670} {"train_loss": -6.845457553863525, "global_step": 154146, "epoch": 3670} {"train_loss": -6.8747477531433105, "global_step": 154147, "epoch": 3670} {"train_loss": -6.873771667480469, "global_step": 154148, "epoch": 3670} {"train_loss": -6.897784233093262, "global_step": 154149, "epoch": 3670} {"train_loss": -6.968093395233154, "global_step": 154150, "epoch": 3670} {"train_loss": -6.963548183441162, "global_step": 154151, "epoch": 3670} {"train_loss": -6.934577941894531, "global_step": 154152, "epoch": 3670} {"train_loss": -6.743101596832275, "global_step": 154153, "epoch": 3670} {"train_loss": -6.8706512451171875, "global_step": 154154, "epoch": 3670} {"train_loss": -7.033241271972656, "global_step": 154155, "epoch": 3670} {"train_loss": -6.881734848022461, "global_step": 154156, "epoch": 3670} {"train_loss": -6.922300338745117, "global_step": 154157, "epoch": 3670} {"train_loss": -6.952681064605713, "global_step": 154158, "epoch": 3670} {"train_loss": -6.94362735748291, "global_step": 154159, "epoch": 3670} {"train_loss": -6.901777267456055, "global_step": 154160, "epoch": 3670} {"train_loss": -6.8696513175964355, "global_step": 154161, "epoch": 3670} {"train_loss": -6.9857072830200195, "global_step": 154162, "epoch": 3670} {"train_loss": -7.000130653381348, "global_step": 154163, "epoch": 3670} {"train_loss": -7.004014015197754, "global_step": 154164, "epoch": 3670} {"train_loss": -6.949748992919922, "global_step": 154165, "epoch": 3670} {"train_loss": -6.963442325592041, "global_step": 154166, "epoch": 3670} {"train_loss": -6.939841270446777, "global_step": 154167, "epoch": 3670} {"train_loss": -6.875226974487305, "global_step": 154168, "epoch": 3670} {"train_loss": -6.850391864776611, "global_step": 154169, "epoch": 3670} {"train_loss": -6.858513355255127, "global_step": 154170, "epoch": 3670} {"train_loss": -6.950547218322754, "global_step": 154171, "epoch": 3670} {"train_loss": -6.836240768432617, "global_step": 154172, "epoch": 3670} {"train_loss": -6.989924430847168, "global_step": 154173, "epoch": 3670} {"train_loss": -6.925319671630859, "global_step": 154174, "epoch": 3670} {"train_loss": -6.944528102874756, "global_step": 154175, "epoch": 3670} {"train_loss": -6.925896644592285, "global_step": 154176, "epoch": 3670} {"train_loss": -6.955739974975586, "global_step": 154177, "epoch": 3670} {"train_loss": -6.924446105957031, "global_step": 154178, "epoch": 3670} {"train_loss": -6.917296409606934, "global_step": 154179, "epoch": 3670} {"train_loss": -6.929744720458984, "global_step": 154180, "epoch": 3670} {"train_loss": -6.918702636446271, "global_step": 154181, "epoch": 3670, "val_loss": 68177.7890625} {"train_loss": -6.836454391479492, "global_step": 154182, "epoch": 3671} {"train_loss": -6.865434646606445, "global_step": 154183, "epoch": 3671} {"train_loss": -6.99509334564209, "global_step": 154184, "epoch": 3671} {"train_loss": -6.922706604003906, "global_step": 154185, "epoch": 3671} {"train_loss": -6.974203109741211, "global_step": 154186, "epoch": 3671} {"train_loss": -6.873345375061035, "global_step": 154187, "epoch": 3671} {"train_loss": -6.993984222412109, "global_step": 154188, "epoch": 3671} {"train_loss": -6.876870155334473, "global_step": 154189, "epoch": 3671} {"train_loss": -6.816312789916992, "global_step": 154190, "epoch": 3671} {"train_loss": -6.985078811645508, "global_step": 154191, "epoch": 3671} {"train_loss": -6.84556245803833, "global_step": 154192, "epoch": 3671} {"train_loss": -6.845322608947754, "global_step": 154193, "epoch": 3671} {"train_loss": -6.975567817687988, "global_step": 154194, "epoch": 3671} {"train_loss": -6.909509181976318, "global_step": 154195, "epoch": 3671} {"train_loss": -6.996429443359375, "global_step": 154196, "epoch": 3671} {"train_loss": -6.901947021484375, "global_step": 154197, "epoch": 3671} {"train_loss": -6.81225061416626, "global_step": 154198, "epoch": 3671} {"train_loss": -7.023953437805176, "global_step": 154199, "epoch": 3671} {"train_loss": -6.960781574249268, "global_step": 154200, "epoch": 3671} {"train_loss": -6.871555805206299, "global_step": 154201, "epoch": 3671} {"train_loss": -6.895500659942627, "global_step": 154202, "epoch": 3671} {"train_loss": -6.923151016235352, "global_step": 154203, "epoch": 3671} {"train_loss": -6.944814682006836, "global_step": 154204, "epoch": 3671} {"train_loss": -6.932547569274902, "global_step": 154205, "epoch": 3671} {"train_loss": -6.8844404220581055, "global_step": 154206, "epoch": 3671} {"train_loss": -6.952965259552002, "global_step": 154207, "epoch": 3671} {"train_loss": -6.962453365325928, "global_step": 154208, "epoch": 3671} {"train_loss": -6.906316757202148, "global_step": 154209, "epoch": 3671} {"train_loss": -6.930364608764648, "global_step": 154210, "epoch": 3671} {"train_loss": -6.847531795501709, "global_step": 154211, "epoch": 3671} {"train_loss": -6.956055164337158, "global_step": 154212, "epoch": 3671} {"train_loss": -6.88397741317749, "global_step": 154213, "epoch": 3671} {"train_loss": -6.91024112701416, "global_step": 154214, "epoch": 3671} {"train_loss": -6.870274066925049, "global_step": 154215, "epoch": 3671} {"train_loss": -6.936314105987549, "global_step": 154216, "epoch": 3671} {"train_loss": -6.94654655456543, "global_step": 154217, "epoch": 3671} {"train_loss": -6.898527145385742, "global_step": 154218, "epoch": 3671} {"train_loss": -6.868169784545898, "global_step": 154219, "epoch": 3671} {"train_loss": -7.0348100662231445, "global_step": 154220, "epoch": 3671} {"train_loss": -6.821610927581787, "global_step": 154221, "epoch": 3671} {"train_loss": -6.8716511726379395, "global_step": 154222, "epoch": 3671} {"train_loss": -6.911835852123442, "global_step": 154223, "epoch": 3671, "val_loss": 68374.59375} {"train_loss": -6.94791316986084, "global_step": 154224, "epoch": 3672} {"train_loss": -6.7715744972229, "global_step": 154225, "epoch": 3672} {"train_loss": -6.936128616333008, "global_step": 154226, "epoch": 3672} {"train_loss": -6.923280715942383, "global_step": 154227, "epoch": 3672} {"train_loss": -6.970767498016357, "global_step": 154228, "epoch": 3672} {"train_loss": -6.8922247886657715, "global_step": 154229, "epoch": 3672} {"train_loss": -6.86339807510376, "global_step": 154230, "epoch": 3672} {"train_loss": -6.861378192901611, "global_step": 154231, "epoch": 3672} {"train_loss": -6.844815731048584, "global_step": 154232, "epoch": 3672} {"train_loss": -6.989529609680176, "global_step": 154233, "epoch": 3672} {"train_loss": -6.7951765060424805, "global_step": 154234, "epoch": 3672} {"train_loss": -6.848968029022217, "global_step": 154235, "epoch": 3672} {"train_loss": -6.811096668243408, "global_step": 154236, "epoch": 3672} {"train_loss": -6.8692216873168945, "global_step": 154237, "epoch": 3672} {"train_loss": -6.855599403381348, "global_step": 154238, "epoch": 3672} {"train_loss": -6.8524274826049805, "global_step": 154239, "epoch": 3672} {"train_loss": -6.819252967834473, "global_step": 154240, "epoch": 3672} {"train_loss": -7.001056671142578, "global_step": 154241, "epoch": 3672} {"train_loss": -6.873846054077148, "global_step": 154242, "epoch": 3672} {"train_loss": -6.838998794555664, "global_step": 154243, "epoch": 3672} {"train_loss": -6.8753275871276855, "global_step": 154244, "epoch": 3672} {"train_loss": -6.885079383850098, "global_step": 154245, "epoch": 3672} {"train_loss": -6.884430885314941, "global_step": 154246, "epoch": 3672} {"train_loss": -6.857049942016602, "global_step": 154247, "epoch": 3672} {"train_loss": -6.859405517578125, "global_step": 154248, "epoch": 3672} {"train_loss": -6.847653865814209, "global_step": 154249, "epoch": 3672} {"train_loss": -6.849941253662109, "global_step": 154250, "epoch": 3672} {"train_loss": -6.784318923950195, "global_step": 154251, "epoch": 3672} {"train_loss": -6.721495628356934, "global_step": 154252, "epoch": 3672} {"train_loss": -6.855030059814453, "global_step": 154253, "epoch": 3672} {"train_loss": -6.803045749664307, "global_step": 154254, "epoch": 3672} {"train_loss": -6.663175582885742, "global_step": 154255, "epoch": 3672} {"train_loss": -6.849803924560547, "global_step": 154256, "epoch": 3672} {"train_loss": -6.7757463455200195, "global_step": 154257, "epoch": 3672} {"train_loss": -6.738522529602051, "global_step": 154258, "epoch": 3672} {"train_loss": -6.863645076751709, "global_step": 154259, "epoch": 3672} {"train_loss": -6.744907855987549, "global_step": 154260, "epoch": 3672} {"train_loss": -6.780385971069336, "global_step": 154261, "epoch": 3672} {"train_loss": -6.681966781616211, "global_step": 154262, "epoch": 3672} {"train_loss": -6.837190628051758, "global_step": 154263, "epoch": 3672} {"train_loss": -6.771207809448242, "global_step": 154264, "epoch": 3672} {"train_loss": -6.837205659775507, "global_step": 154265, "epoch": 3672, "val_loss": 68292.515625} {"train_loss": -6.9250640869140625, "global_step": 154266, "epoch": 3673} {"train_loss": -6.757376670837402, "global_step": 154267, "epoch": 3673} {"train_loss": -6.909300327301025, "global_step": 154268, "epoch": 3673} {"train_loss": -6.758738040924072, "global_step": 154269, "epoch": 3673} {"train_loss": -6.830190658569336, "global_step": 154270, "epoch": 3673} {"train_loss": -6.736235618591309, "global_step": 154271, "epoch": 3673} {"train_loss": -6.925658226013184, "global_step": 154272, "epoch": 3673} {"train_loss": -6.784692764282227, "global_step": 154273, "epoch": 3673} {"train_loss": -6.850785255432129, "global_step": 154274, "epoch": 3673} {"train_loss": -6.743597984313965, "global_step": 154275, "epoch": 3673} {"train_loss": -6.851219654083252, "global_step": 154276, "epoch": 3673} {"train_loss": -6.824759483337402, "global_step": 154277, "epoch": 3673} {"train_loss": -6.917414665222168, "global_step": 154278, "epoch": 3673} {"train_loss": -6.938211441040039, "global_step": 154279, "epoch": 3673} {"train_loss": -6.7828521728515625, "global_step": 154280, "epoch": 3673} {"train_loss": -6.866100311279297, "global_step": 154281, "epoch": 3673} {"train_loss": -6.862083435058594, "global_step": 154282, "epoch": 3673} {"train_loss": -6.972864151000977, "global_step": 154283, "epoch": 3673} {"train_loss": -6.863963603973389, "global_step": 154284, "epoch": 3673} {"train_loss": -6.813910484313965, "global_step": 154285, "epoch": 3673} {"train_loss": -6.889954566955566, "global_step": 154286, "epoch": 3673} {"train_loss": -6.817689418792725, "global_step": 154287, "epoch": 3673} {"train_loss": -6.918566703796387, "global_step": 154288, "epoch": 3673} {"train_loss": -6.905887126922607, "global_step": 154289, "epoch": 3673} {"train_loss": -6.929130554199219, "global_step": 154290, "epoch": 3673} {"train_loss": -6.733734130859375, "global_step": 154291, "epoch": 3673} {"train_loss": -6.849630355834961, "global_step": 154292, "epoch": 3673} {"train_loss": -6.897536277770996, "global_step": 154293, "epoch": 3673} {"train_loss": -6.860485076904297, "global_step": 154294, "epoch": 3673} {"train_loss": -6.925646781921387, "global_step": 154295, "epoch": 3673} {"train_loss": -6.829254150390625, "global_step": 154296, "epoch": 3673} {"train_loss": -6.820192337036133, "global_step": 154297, "epoch": 3673} {"train_loss": -6.770855903625488, "global_step": 154298, "epoch": 3673} {"train_loss": -6.716152191162109, "global_step": 154299, "epoch": 3673} {"train_loss": -6.940522193908691, "global_step": 154300, "epoch": 3673} {"train_loss": -6.768308162689209, "global_step": 154301, "epoch": 3673} {"train_loss": -6.875042915344238, "global_step": 154302, "epoch": 3673} {"train_loss": -6.894209384918213, "global_step": 154303, "epoch": 3673} {"train_loss": -6.912386894226074, "global_step": 154304, "epoch": 3673} {"train_loss": -6.890711784362793, "global_step": 154305, "epoch": 3673} {"train_loss": -6.831778526306152, "global_step": 154306, "epoch": 3673} {"train_loss": -6.850919632684617, "global_step": 154307, "epoch": 3673, "val_loss": 68282.7109375} {"train_loss": -6.900968551635742, "global_step": 154308, "epoch": 3674} {"train_loss": -6.8860344886779785, "global_step": 154309, "epoch": 3674} {"train_loss": -6.884206295013428, "global_step": 154310, "epoch": 3674} {"train_loss": -6.824168682098389, "global_step": 154311, "epoch": 3674} {"train_loss": -6.925753593444824, "global_step": 154312, "epoch": 3674} {"train_loss": -6.800297737121582, "global_step": 154313, "epoch": 3674} {"train_loss": -6.885849952697754, "global_step": 154314, "epoch": 3674} {"train_loss": -6.873481750488281, "global_step": 154315, "epoch": 3674} {"train_loss": -6.9762043952941895, "global_step": 154316, "epoch": 3674} {"train_loss": -6.994346618652344, "global_step": 154317, "epoch": 3674} {"train_loss": -6.809600830078125, "global_step": 154318, "epoch": 3674} {"train_loss": -7.030418395996094, "global_step": 154319, "epoch": 3674} {"train_loss": -6.864230155944824, "global_step": 154320, "epoch": 3674} {"train_loss": -6.860012054443359, "global_step": 154321, "epoch": 3674} {"train_loss": -6.77907133102417, "global_step": 154322, "epoch": 3674} {"train_loss": -6.813669681549072, "global_step": 154323, "epoch": 3674} {"train_loss": -6.817375659942627, "global_step": 154324, "epoch": 3674} {"train_loss": -6.771268844604492, "global_step": 154325, "epoch": 3674} {"train_loss": -6.934654235839844, "global_step": 154326, "epoch": 3674} {"train_loss": -6.758301258087158, "global_step": 154327, "epoch": 3674} {"train_loss": -6.995669364929199, "global_step": 154328, "epoch": 3674} {"train_loss": -6.937386512756348, "global_step": 154329, "epoch": 3674} {"train_loss": -6.88429594039917, "global_step": 154330, "epoch": 3674} {"train_loss": -6.9223480224609375, "global_step": 154331, "epoch": 3674} {"train_loss": -6.830186367034912, "global_step": 154332, "epoch": 3674} {"train_loss": -6.817194938659668, "global_step": 154333, "epoch": 3674} {"train_loss": -6.8564229011535645, "global_step": 154334, "epoch": 3674} {"train_loss": -7.000785827636719, "global_step": 154335, "epoch": 3674} {"train_loss": -6.948093414306641, "global_step": 154336, "epoch": 3674} {"train_loss": -6.889801025390625, "global_step": 154337, "epoch": 3674} {"train_loss": -6.82473611831665, "global_step": 154338, "epoch": 3674} {"train_loss": -6.857795238494873, "global_step": 154339, "epoch": 3674} {"train_loss": -6.897626876831055, "global_step": 154340, "epoch": 3674} {"train_loss": -6.86094856262207, "global_step": 154341, "epoch": 3674} {"train_loss": -6.946455955505371, "global_step": 154342, "epoch": 3674} {"train_loss": -6.907219409942627, "global_step": 154343, "epoch": 3674} {"train_loss": -6.925570487976074, "global_step": 154344, "epoch": 3674} {"train_loss": -6.802701473236084, "global_step": 154345, "epoch": 3674} {"train_loss": -6.889668941497803, "global_step": 154346, "epoch": 3674} {"train_loss": -6.85154914855957, "global_step": 154347, "epoch": 3674} {"train_loss": -6.8349785804748535, "global_step": 154348, "epoch": 3674} {"train_loss": -6.879763171786354, "global_step": 154349, "epoch": 3674, "val_loss": 68225.921875} {"train_loss": -6.88881778717041, "global_step": 154350, "epoch": 3675} {"train_loss": -6.897528171539307, "global_step": 154351, "epoch": 3675} {"train_loss": -6.902106285095215, "global_step": 154352, "epoch": 3675} {"train_loss": -6.941314697265625, "global_step": 154353, "epoch": 3675} {"train_loss": -6.927732467651367, "global_step": 154354, "epoch": 3675} {"train_loss": -6.905797004699707, "global_step": 154355, "epoch": 3675} {"train_loss": -7.003276348114014, "global_step": 154356, "epoch": 3675} {"train_loss": -6.912412166595459, "global_step": 154357, "epoch": 3675} {"train_loss": -6.842416763305664, "global_step": 154358, "epoch": 3675} {"train_loss": -6.961848735809326, "global_step": 154359, "epoch": 3675} {"train_loss": -6.968666076660156, "global_step": 154360, "epoch": 3675} {"train_loss": -6.927570343017578, "global_step": 154361, "epoch": 3675} {"train_loss": -6.9614667892456055, "global_step": 154362, "epoch": 3675} {"train_loss": -6.888669967651367, "global_step": 154363, "epoch": 3675} {"train_loss": -6.828894138336182, "global_step": 154364, "epoch": 3675} {"train_loss": -6.932644844055176, "global_step": 154365, "epoch": 3675} {"train_loss": -6.976715087890625, "global_step": 154366, "epoch": 3675} {"train_loss": -6.816855430603027, "global_step": 154367, "epoch": 3675} {"train_loss": -6.847756385803223, "global_step": 154368, "epoch": 3675} {"train_loss": -6.924636363983154, "global_step": 154369, "epoch": 3675} {"train_loss": -6.923992156982422, "global_step": 154370, "epoch": 3675} {"train_loss": -6.9291911125183105, "global_step": 154371, "epoch": 3675} {"train_loss": -7.002033710479736, "global_step": 154372, "epoch": 3675} {"train_loss": -6.8867387771606445, "global_step": 154373, "epoch": 3675} {"train_loss": -6.903172492980957, "global_step": 154374, "epoch": 3675} {"train_loss": -6.95766544342041, "global_step": 154375, "epoch": 3675} {"train_loss": -6.856114387512207, "global_step": 154376, "epoch": 3675} {"train_loss": -6.901556968688965, "global_step": 154377, "epoch": 3675} {"train_loss": -6.918096542358398, "global_step": 154378, "epoch": 3675} {"train_loss": -6.93400764465332, "global_step": 154379, "epoch": 3675} {"train_loss": -6.9637298583984375, "global_step": 154380, "epoch": 3675} {"train_loss": -6.878786087036133, "global_step": 154381, "epoch": 3675} {"train_loss": -7.0614399909973145, "global_step": 154382, "epoch": 3675} {"train_loss": -7.048233985900879, "global_step": 154383, "epoch": 3675} {"train_loss": -6.917836666107178, "global_step": 154384, "epoch": 3675} {"train_loss": -6.842189788818359, "global_step": 154385, "epoch": 3675} {"train_loss": -6.977640628814697, "global_step": 154386, "epoch": 3675} {"train_loss": -6.959654331207275, "global_step": 154387, "epoch": 3675} {"train_loss": -6.891486644744873, "global_step": 154388, "epoch": 3675} {"train_loss": -6.9764556884765625, "global_step": 154389, "epoch": 3675} {"train_loss": -6.959040641784668, "global_step": 154390, "epoch": 3675} {"train_loss": -6.924564282099406, "global_step": 154391, "epoch": 3675, "val_loss": 68210.4453125} {"train_loss": -6.934626579284668, "global_step": 154392, "epoch": 3676} {"train_loss": -6.900463581085205, "global_step": 154393, "epoch": 3676} {"train_loss": -6.966957092285156, "global_step": 154394, "epoch": 3676} {"train_loss": -6.884469032287598, "global_step": 154395, "epoch": 3676} {"train_loss": -6.850547790527344, "global_step": 154396, "epoch": 3676} {"train_loss": -6.999311447143555, "global_step": 154397, "epoch": 3676} {"train_loss": -6.781650543212891, "global_step": 154398, "epoch": 3676} {"train_loss": -6.9870758056640625, "global_step": 154399, "epoch": 3676} {"train_loss": -6.806746959686279, "global_step": 154400, "epoch": 3676} {"train_loss": -6.905246734619141, "global_step": 154401, "epoch": 3676} {"train_loss": -6.954482078552246, "global_step": 154402, "epoch": 3676} {"train_loss": -6.94025182723999, "global_step": 154403, "epoch": 3676} {"train_loss": -6.752742767333984, "global_step": 154404, "epoch": 3676} {"train_loss": -6.749122619628906, "global_step": 154405, "epoch": 3676} {"train_loss": -6.818733215332031, "global_step": 154406, "epoch": 3676} {"train_loss": -6.935949802398682, "global_step": 154407, "epoch": 3676} {"train_loss": -6.745924949645996, "global_step": 154408, "epoch": 3676} {"train_loss": -6.870423316955566, "global_step": 154409, "epoch": 3676} {"train_loss": -6.7685956954956055, "global_step": 154410, "epoch": 3676} {"train_loss": -6.739987373352051, "global_step": 154411, "epoch": 3676} {"train_loss": -6.901620864868164, "global_step": 154412, "epoch": 3676} {"train_loss": -6.768580436706543, "global_step": 154413, "epoch": 3676} {"train_loss": -6.87307596206665, "global_step": 154414, "epoch": 3676} {"train_loss": -6.753582000732422, "global_step": 154415, "epoch": 3676} {"train_loss": -6.767891883850098, "global_step": 154416, "epoch": 3676} {"train_loss": -6.810626983642578, "global_step": 154417, "epoch": 3676} {"train_loss": -6.835541248321533, "global_step": 154418, "epoch": 3676} {"train_loss": -6.801570415496826, "global_step": 154419, "epoch": 3676} {"train_loss": -6.8893232345581055, "global_step": 154420, "epoch": 3676} {"train_loss": -6.755376815795898, "global_step": 154421, "epoch": 3676} {"train_loss": -6.9419264793396, "global_step": 154422, "epoch": 3676} {"train_loss": -6.812804222106934, "global_step": 154423, "epoch": 3676} {"train_loss": -6.934582233428955, "global_step": 154424, "epoch": 3676} {"train_loss": -6.928278923034668, "global_step": 154425, "epoch": 3676} {"train_loss": -6.766102313995361, "global_step": 154426, "epoch": 3676} {"train_loss": -6.9212493896484375, "global_step": 154427, "epoch": 3676} {"train_loss": -6.87904167175293, "global_step": 154428, "epoch": 3676} {"train_loss": -6.977092742919922, "global_step": 154429, "epoch": 3676} {"train_loss": -6.951773643493652, "global_step": 154430, "epoch": 3676} {"train_loss": -6.93876314163208, "global_step": 154431, "epoch": 3676} {"train_loss": -6.923464298248291, "global_step": 154432, "epoch": 3676} {"train_loss": -6.863777535302298, "global_step": 154433, "epoch": 3676, "val_loss": 68438.0625} {"train_loss": -6.9142913818359375, "global_step": 154434, "epoch": 3677} {"train_loss": -7.005199432373047, "global_step": 154435, "epoch": 3677} {"train_loss": -6.978886604309082, "global_step": 154436, "epoch": 3677} {"train_loss": -6.940324306488037, "global_step": 154437, "epoch": 3677} {"train_loss": -6.954333782196045, "global_step": 154438, "epoch": 3677} {"train_loss": -6.92464017868042, "global_step": 154439, "epoch": 3677} {"train_loss": -6.970797538757324, "global_step": 154440, "epoch": 3677} {"train_loss": -6.9171013832092285, "global_step": 154441, "epoch": 3677} {"train_loss": -6.904614448547363, "global_step": 154442, "epoch": 3677} {"train_loss": -6.869400501251221, "global_step": 154443, "epoch": 3677} {"train_loss": -7.069467067718506, "global_step": 154444, "epoch": 3677} {"train_loss": -6.942536354064941, "global_step": 154445, "epoch": 3677} {"train_loss": -7.013518333435059, "global_step": 154446, "epoch": 3677} {"train_loss": -7.047418594360352, "global_step": 154447, "epoch": 3677} {"train_loss": -6.8917999267578125, "global_step": 154448, "epoch": 3677} {"train_loss": -6.900241851806641, "global_step": 154449, "epoch": 3677} {"train_loss": -6.923866271972656, "global_step": 154450, "epoch": 3677} {"train_loss": -6.87394905090332, "global_step": 154451, "epoch": 3677} {"train_loss": -6.7225518226623535, "global_step": 154452, "epoch": 3677} {"train_loss": -6.866265296936035, "global_step": 154453, "epoch": 3677} {"train_loss": -6.969475746154785, "global_step": 154454, "epoch": 3677} {"train_loss": -6.700814723968506, "global_step": 154455, "epoch": 3677} {"train_loss": -6.723036766052246, "global_step": 154456, "epoch": 3677} {"train_loss": -6.7732744216918945, "global_step": 154457, "epoch": 3677} {"train_loss": -6.9405317306518555, "global_step": 154458, "epoch": 3677} {"train_loss": -6.8186354637146, "global_step": 154459, "epoch": 3677} {"train_loss": -6.7949981689453125, "global_step": 154460, "epoch": 3677} {"train_loss": -6.858432292938232, "global_step": 154461, "epoch": 3677} {"train_loss": -6.782262802124023, "global_step": 154462, "epoch": 3677} {"train_loss": -6.870644569396973, "global_step": 154463, "epoch": 3677} {"train_loss": -6.848724365234375, "global_step": 154464, "epoch": 3677} {"train_loss": -6.781057357788086, "global_step": 154465, "epoch": 3677} {"train_loss": -6.906734466552734, "global_step": 154466, "epoch": 3677} {"train_loss": -6.866572380065918, "global_step": 154467, "epoch": 3677} {"train_loss": -6.95170259475708, "global_step": 154468, "epoch": 3677} {"train_loss": -6.753805637359619, "global_step": 154469, "epoch": 3677} {"train_loss": -6.99600887298584, "global_step": 154470, "epoch": 3677} {"train_loss": -6.831001281738281, "global_step": 154471, "epoch": 3677} {"train_loss": -6.796311855316162, "global_step": 154472, "epoch": 3677} {"train_loss": -6.952495574951172, "global_step": 154473, "epoch": 3677} {"train_loss": -6.869572162628174, "global_step": 154474, "epoch": 3677} {"train_loss": -6.885965279170445, "global_step": 154475, "epoch": 3677, "val_loss": 68382.6328125} {"train_loss": -6.950182914733887, "global_step": 154476, "epoch": 3678} {"train_loss": -6.795271873474121, "global_step": 154477, "epoch": 3678} {"train_loss": -6.868001461029053, "global_step": 154478, "epoch": 3678} {"train_loss": -6.812405586242676, "global_step": 154479, "epoch": 3678} {"train_loss": -6.8217315673828125, "global_step": 154480, "epoch": 3678} {"train_loss": -6.840670585632324, "global_step": 154481, "epoch": 3678} {"train_loss": -6.8231425285339355, "global_step": 154482, "epoch": 3678} {"train_loss": -6.812644958496094, "global_step": 154483, "epoch": 3678} {"train_loss": -6.762946128845215, "global_step": 154484, "epoch": 3678} {"train_loss": -6.755939483642578, "global_step": 154485, "epoch": 3678} {"train_loss": -6.840810775756836, "global_step": 154486, "epoch": 3678} {"train_loss": -6.897653579711914, "global_step": 154487, "epoch": 3678} {"train_loss": -6.651758193969727, "global_step": 154488, "epoch": 3678} {"train_loss": -6.71120023727417, "global_step": 154489, "epoch": 3678} {"train_loss": -6.919267654418945, "global_step": 154490, "epoch": 3678} {"train_loss": -6.7290496826171875, "global_step": 154491, "epoch": 3678} {"train_loss": -6.875681400299072, "global_step": 154492, "epoch": 3678} {"train_loss": -6.754150390625, "global_step": 154493, "epoch": 3678} {"train_loss": -6.864097595214844, "global_step": 154494, "epoch": 3678} {"train_loss": -6.901043891906738, "global_step": 154495, "epoch": 3678} {"train_loss": -6.800926208496094, "global_step": 154496, "epoch": 3678} {"train_loss": -6.834417819976807, "global_step": 154497, "epoch": 3678} {"train_loss": -6.859102249145508, "global_step": 154498, "epoch": 3678} {"train_loss": -6.854254722595215, "global_step": 154499, "epoch": 3678} {"train_loss": -6.818691253662109, "global_step": 154500, "epoch": 3678} {"train_loss": -6.912991523742676, "global_step": 154501, "epoch": 3678} {"train_loss": -6.963298320770264, "global_step": 154502, "epoch": 3678} {"train_loss": -6.832839488983154, "global_step": 154503, "epoch": 3678} {"train_loss": -6.907819747924805, "global_step": 154504, "epoch": 3678} {"train_loss": -6.880455017089844, "global_step": 154505, "epoch": 3678} {"train_loss": -6.894484519958496, "global_step": 154506, "epoch": 3678} {"train_loss": -7.0133161544799805, "global_step": 154507, "epoch": 3678} {"train_loss": -6.991278171539307, "global_step": 154508, "epoch": 3678} {"train_loss": -6.804207801818848, "global_step": 154509, "epoch": 3678} {"train_loss": -6.933034896850586, "global_step": 154510, "epoch": 3678} {"train_loss": -6.89484977722168, "global_step": 154511, "epoch": 3678} {"train_loss": -6.841838836669922, "global_step": 154512, "epoch": 3678} {"train_loss": -6.940306663513184, "global_step": 154513, "epoch": 3678} {"train_loss": -6.860185623168945, "global_step": 154514, "epoch": 3678} {"train_loss": -6.920592308044434, "global_step": 154515, "epoch": 3678} {"train_loss": -7.042233943939209, "global_step": 154516, "epoch": 3678} {"train_loss": -6.860752026240031, "global_step": 154517, "epoch": 3678, "val_loss": 68154.28125} {"train_loss": -6.872415065765381, "global_step": 154518, "epoch": 3679} {"train_loss": -7.0332231521606445, "global_step": 154519, "epoch": 3679} {"train_loss": -6.863039970397949, "global_step": 154520, "epoch": 3679} {"train_loss": -6.884197235107422, "global_step": 154521, "epoch": 3679} {"train_loss": -6.965871334075928, "global_step": 154522, "epoch": 3679} {"train_loss": -6.918962001800537, "global_step": 154523, "epoch": 3679} {"train_loss": -6.933340549468994, "global_step": 154524, "epoch": 3679} {"train_loss": -6.847877502441406, "global_step": 154525, "epoch": 3679} {"train_loss": -6.9121904373168945, "global_step": 154526, "epoch": 3679} {"train_loss": -6.805655002593994, "global_step": 154527, "epoch": 3679} {"train_loss": -6.911360263824463, "global_step": 154528, "epoch": 3679} {"train_loss": -6.843597888946533, "global_step": 154529, "epoch": 3679} {"train_loss": -6.884742736816406, "global_step": 154530, "epoch": 3679} {"train_loss": -7.024487495422363, "global_step": 154531, "epoch": 3679} {"train_loss": -6.932435035705566, "global_step": 154532, "epoch": 3679} {"train_loss": -6.944663047790527, "global_step": 154533, "epoch": 3679} {"train_loss": -6.947736740112305, "global_step": 154534, "epoch": 3679} {"train_loss": -6.946971893310547, "global_step": 154535, "epoch": 3679} {"train_loss": -6.9119873046875, "global_step": 154536, "epoch": 3679} {"train_loss": -7.005510330200195, "global_step": 154537, "epoch": 3679} {"train_loss": -6.895576477050781, "global_step": 154538, "epoch": 3679} {"train_loss": -6.898024082183838, "global_step": 154539, "epoch": 3679} {"train_loss": -6.857641220092773, "global_step": 154540, "epoch": 3679} {"train_loss": -6.952768802642822, "global_step": 154541, "epoch": 3679} {"train_loss": -6.993561267852783, "global_step": 154542, "epoch": 3679} {"train_loss": -6.932558536529541, "global_step": 154543, "epoch": 3679} {"train_loss": -6.938166618347168, "global_step": 154544, "epoch": 3679} {"train_loss": -7.002072334289551, "global_step": 154545, "epoch": 3679} {"train_loss": -6.8707594871521, "global_step": 154546, "epoch": 3679} {"train_loss": -6.861408710479736, "global_step": 154547, "epoch": 3679} {"train_loss": -6.848567962646484, "global_step": 154548, "epoch": 3679} {"train_loss": -6.852175712585449, "global_step": 154549, "epoch": 3679} {"train_loss": -6.945781230926514, "global_step": 154550, "epoch": 3679} {"train_loss": -6.938802719116211, "global_step": 154551, "epoch": 3679} {"train_loss": -6.959312915802002, "global_step": 154552, "epoch": 3679} {"train_loss": -7.03939151763916, "global_step": 154553, "epoch": 3679} {"train_loss": -6.878379821777344, "global_step": 154554, "epoch": 3679} {"train_loss": -7.041995048522949, "global_step": 154555, "epoch": 3679} {"train_loss": -6.946826457977295, "global_step": 154556, "epoch": 3679} {"train_loss": -6.992833137512207, "global_step": 154557, "epoch": 3679} {"train_loss": -7.027942180633545, "global_step": 154558, "epoch": 3679} {"train_loss": -6.927874383472261, "global_step": 154559, "epoch": 3679, "val_loss": 68115.3828125} {"train_loss": -6.8979949951171875, "global_step": 154560, "epoch": 3680} {"train_loss": -6.949246406555176, "global_step": 154561, "epoch": 3680} {"train_loss": -6.93001651763916, "global_step": 154562, "epoch": 3680} {"train_loss": -6.877473831176758, "global_step": 154563, "epoch": 3680} {"train_loss": -6.804200649261475, "global_step": 154564, "epoch": 3680} {"train_loss": -6.937904357910156, "global_step": 154565, "epoch": 3680} {"train_loss": -6.918457984924316, "global_step": 154566, "epoch": 3680} {"train_loss": -6.878154754638672, "global_step": 154567, "epoch": 3680} {"train_loss": -6.82258939743042, "global_step": 154568, "epoch": 3680} {"train_loss": -6.73919677734375, "global_step": 154569, "epoch": 3680} {"train_loss": -6.949943542480469, "global_step": 154570, "epoch": 3680} {"train_loss": -6.808798789978027, "global_step": 154571, "epoch": 3680} {"train_loss": -6.796299934387207, "global_step": 154572, "epoch": 3680} {"train_loss": -6.753063201904297, "global_step": 154573, "epoch": 3680} {"train_loss": -6.627601623535156, "global_step": 154574, "epoch": 3680} {"train_loss": -6.867396354675293, "global_step": 154575, "epoch": 3680} {"train_loss": -6.9169602394104, "global_step": 154576, "epoch": 3680} {"train_loss": -6.722794532775879, "global_step": 154577, "epoch": 3680} {"train_loss": -6.893181324005127, "global_step": 154578, "epoch": 3680} {"train_loss": -6.781232833862305, "global_step": 154579, "epoch": 3680} {"train_loss": -6.820348739624023, "global_step": 154580, "epoch": 3680} {"train_loss": -6.778980255126953, "global_step": 154581, "epoch": 3680} {"train_loss": -6.776121139526367, "global_step": 154582, "epoch": 3680} {"train_loss": -6.77029275894165, "global_step": 154583, "epoch": 3680} {"train_loss": -6.747747421264648, "global_step": 154584, "epoch": 3680} {"train_loss": -6.829018592834473, "global_step": 154585, "epoch": 3680} {"train_loss": -6.94469690322876, "global_step": 154586, "epoch": 3680} {"train_loss": -6.828469753265381, "global_step": 154587, "epoch": 3680} {"train_loss": -6.931179046630859, "global_step": 154588, "epoch": 3680} {"train_loss": -6.897345066070557, "global_step": 154589, "epoch": 3680} {"train_loss": -6.969396591186523, "global_step": 154590, "epoch": 3680} {"train_loss": -6.858434677124023, "global_step": 154591, "epoch": 3680} {"train_loss": -6.881706237792969, "global_step": 154592, "epoch": 3680} {"train_loss": -6.853879928588867, "global_step": 154593, "epoch": 3680} {"train_loss": -6.850873947143555, "global_step": 154594, "epoch": 3680} {"train_loss": -6.8910980224609375, "global_step": 154595, "epoch": 3680} {"train_loss": -6.8935065269470215, "global_step": 154596, "epoch": 3680} {"train_loss": -6.839939594268799, "global_step": 154597, "epoch": 3680} {"train_loss": -6.8037309646606445, "global_step": 154598, "epoch": 3680} {"train_loss": -6.863772869110107, "global_step": 154599, "epoch": 3680} {"train_loss": -6.889077186584473, "global_step": 154600, "epoch": 3680} {"train_loss": -6.847953444435483, "global_step": 154601, "epoch": 3680, "val_loss": 68311.015625} {"train_loss": -6.905864238739014, "global_step": 154602, "epoch": 3681} {"train_loss": -6.8222126960754395, "global_step": 154603, "epoch": 3681} {"train_loss": -6.891294479370117, "global_step": 154604, "epoch": 3681} {"train_loss": -6.787482261657715, "global_step": 154605, "epoch": 3681} {"train_loss": -6.864140510559082, "global_step": 154606, "epoch": 3681} {"train_loss": -6.844052314758301, "global_step": 154607, "epoch": 3681} {"train_loss": -6.914617538452148, "global_step": 154608, "epoch": 3681} {"train_loss": -6.916600227355957, "global_step": 154609, "epoch": 3681} {"train_loss": -6.792645454406738, "global_step": 154610, "epoch": 3681} {"train_loss": -6.849914073944092, "global_step": 154611, "epoch": 3681} {"train_loss": -6.829402923583984, "global_step": 154612, "epoch": 3681} {"train_loss": -6.845057964324951, "global_step": 154613, "epoch": 3681} {"train_loss": -6.859409332275391, "global_step": 154614, "epoch": 3681} {"train_loss": -6.8681159019470215, "global_step": 154615, "epoch": 3681} {"train_loss": -6.851828575134277, "global_step": 154616, "epoch": 3681} {"train_loss": -6.91563606262207, "global_step": 154617, "epoch": 3681} {"train_loss": -6.885939598083496, "global_step": 154618, "epoch": 3681} {"train_loss": -7.0781569480896, "global_step": 154619, "epoch": 3681} {"train_loss": -6.916337013244629, "global_step": 154620, "epoch": 3681} {"train_loss": -6.948678493499756, "global_step": 154621, "epoch": 3681} {"train_loss": -6.81795072555542, "global_step": 154622, "epoch": 3681} {"train_loss": -7.036368370056152, "global_step": 154623, "epoch": 3681} {"train_loss": -6.831540107727051, "global_step": 154624, "epoch": 3681} {"train_loss": -6.940657138824463, "global_step": 154625, "epoch": 3681} {"train_loss": -6.9480438232421875, "global_step": 154626, "epoch": 3681} {"train_loss": -6.978351593017578, "global_step": 154627, "epoch": 3681} {"train_loss": -6.878012180328369, "global_step": 154628, "epoch": 3681} {"train_loss": -6.980506896972656, "global_step": 154629, "epoch": 3681} {"train_loss": -6.817785263061523, "global_step": 154630, "epoch": 3681} {"train_loss": -6.865857124328613, "global_step": 154631, "epoch": 3681} {"train_loss": -6.978031635284424, "global_step": 154632, "epoch": 3681} {"train_loss": -6.917193412780762, "global_step": 154633, "epoch": 3681} {"train_loss": -6.770416736602783, "global_step": 154634, "epoch": 3681} {"train_loss": -6.93203067779541, "global_step": 154635, "epoch": 3681} {"train_loss": -6.989255428314209, "global_step": 154636, "epoch": 3681} {"train_loss": -6.903382778167725, "global_step": 154637, "epoch": 3681} {"train_loss": -6.840675354003906, "global_step": 154638, "epoch": 3681} {"train_loss": -6.9398651123046875, "global_step": 154639, "epoch": 3681} {"train_loss": -6.7701520919799805, "global_step": 154640, "epoch": 3681} {"train_loss": -6.870444297790527, "global_step": 154641, "epoch": 3681} {"train_loss": -6.92434024810791, "global_step": 154642, "epoch": 3681} {"train_loss": -6.888476723716373, "global_step": 154643, "epoch": 3681, "val_loss": 68113.640625} {"train_loss": -7.003459930419922, "global_step": 154644, "epoch": 3682} {"train_loss": -6.848440170288086, "global_step": 154645, "epoch": 3682} {"train_loss": -6.908785820007324, "global_step": 154646, "epoch": 3682} {"train_loss": -6.990732192993164, "global_step": 154647, "epoch": 3682} {"train_loss": -6.961372375488281, "global_step": 154648, "epoch": 3682} {"train_loss": -6.891165733337402, "global_step": 154649, "epoch": 3682} {"train_loss": -7.013880729675293, "global_step": 154650, "epoch": 3682} {"train_loss": -6.971474647521973, "global_step": 154651, "epoch": 3682} {"train_loss": -6.832084655761719, "global_step": 154652, "epoch": 3682} {"train_loss": -7.043652057647705, "global_step": 154653, "epoch": 3682} {"train_loss": -6.912177085876465, "global_step": 154654, "epoch": 3682} {"train_loss": -6.858316421508789, "global_step": 154655, "epoch": 3682} {"train_loss": -6.957071781158447, "global_step": 154656, "epoch": 3682} {"train_loss": -6.957973003387451, "global_step": 154657, "epoch": 3682} {"train_loss": -6.886913299560547, "global_step": 154658, "epoch": 3682} {"train_loss": -7.041512489318848, "global_step": 154659, "epoch": 3682} {"train_loss": -7.030293941497803, "global_step": 154660, "epoch": 3682} {"train_loss": -6.873651504516602, "global_step": 154661, "epoch": 3682} {"train_loss": -6.931670188903809, "global_step": 154662, "epoch": 3682} {"train_loss": -6.973762035369873, "global_step": 154663, "epoch": 3682} {"train_loss": -6.996315002441406, "global_step": 154664, "epoch": 3682} {"train_loss": -6.954379558563232, "global_step": 154665, "epoch": 3682} {"train_loss": -7.0277886390686035, "global_step": 154666, "epoch": 3682} {"train_loss": -6.978764533996582, "global_step": 154667, "epoch": 3682} {"train_loss": -6.828859329223633, "global_step": 154668, "epoch": 3682} {"train_loss": -6.939128398895264, "global_step": 154669, "epoch": 3682} {"train_loss": -6.981634616851807, "global_step": 154670, "epoch": 3682} {"train_loss": -6.952744960784912, "global_step": 154671, "epoch": 3682} {"train_loss": -6.9826555252075195, "global_step": 154672, "epoch": 3682} {"train_loss": -7.01582670211792, "global_step": 154673, "epoch": 3682} {"train_loss": -6.8707275390625, "global_step": 154674, "epoch": 3682} {"train_loss": -6.894084453582764, "global_step": 154675, "epoch": 3682} {"train_loss": -6.8668599128723145, "global_step": 154676, "epoch": 3682} {"train_loss": -6.80189323425293, "global_step": 154677, "epoch": 3682} {"train_loss": -6.8054094314575195, "global_step": 154678, "epoch": 3682} {"train_loss": -6.850271224975586, "global_step": 154679, "epoch": 3682} {"train_loss": -6.876856327056885, "global_step": 154680, "epoch": 3682} {"train_loss": -6.805114269256592, "global_step": 154681, "epoch": 3682} {"train_loss": -6.906853675842285, "global_step": 154682, "epoch": 3682} {"train_loss": -6.782323360443115, "global_step": 154683, "epoch": 3682} {"train_loss": -6.962983131408691, "global_step": 154684, "epoch": 3682} {"train_loss": -6.922729878198533, "global_step": 154685, "epoch": 3682, "val_loss": 68388.4765625} {"train_loss": -6.792359352111816, "global_step": 154686, "epoch": 3683} {"train_loss": -6.8155035972595215, "global_step": 154687, "epoch": 3683} {"train_loss": -6.767988204956055, "global_step": 154688, "epoch": 3683} {"train_loss": -6.90623664855957, "global_step": 154689, "epoch": 3683} {"train_loss": -6.81009578704834, "global_step": 154690, "epoch": 3683} {"train_loss": -6.8401899337768555, "global_step": 154691, "epoch": 3683} {"train_loss": -6.81431770324707, "global_step": 154692, "epoch": 3683} {"train_loss": -6.936090469360352, "global_step": 154693, "epoch": 3683} {"train_loss": -6.868701934814453, "global_step": 154694, "epoch": 3683} {"train_loss": -6.856964588165283, "global_step": 154695, "epoch": 3683} {"train_loss": -6.88456916809082, "global_step": 154696, "epoch": 3683} {"train_loss": -6.9763712882995605, "global_step": 154697, "epoch": 3683} {"train_loss": -6.846612930297852, "global_step": 154698, "epoch": 3683} {"train_loss": -6.849991798400879, "global_step": 154699, "epoch": 3683} {"train_loss": -6.8753252029418945, "global_step": 154700, "epoch": 3683} {"train_loss": -6.861017227172852, "global_step": 154701, "epoch": 3683} {"train_loss": -6.9367218017578125, "global_step": 154702, "epoch": 3683} {"train_loss": -6.872895240783691, "global_step": 154703, "epoch": 3683} {"train_loss": -6.955467224121094, "global_step": 154704, "epoch": 3683} {"train_loss": -6.965300559997559, "global_step": 154705, "epoch": 3683} {"train_loss": -6.840086936950684, "global_step": 154706, "epoch": 3683} {"train_loss": -6.724583625793457, "global_step": 154707, "epoch": 3683} {"train_loss": -6.808403968811035, "global_step": 154708, "epoch": 3683} {"train_loss": -6.803664207458496, "global_step": 154709, "epoch": 3683} {"train_loss": -6.758014678955078, "global_step": 154710, "epoch": 3683} {"train_loss": -7.034040451049805, "global_step": 154711, "epoch": 3683} {"train_loss": -6.941497802734375, "global_step": 154712, "epoch": 3683} {"train_loss": -6.878162384033203, "global_step": 154713, "epoch": 3683} {"train_loss": -6.877033710479736, "global_step": 154714, "epoch": 3683} {"train_loss": -6.773365020751953, "global_step": 154715, "epoch": 3683} {"train_loss": -6.8998870849609375, "global_step": 154716, "epoch": 3683} {"train_loss": -6.865177154541016, "global_step": 154717, "epoch": 3683} {"train_loss": -6.8335065841674805, "global_step": 154718, "epoch": 3683} {"train_loss": -6.7910966873168945, "global_step": 154719, "epoch": 3683} {"train_loss": -6.838630676269531, "global_step": 154720, "epoch": 3683} {"train_loss": -6.910634517669678, "global_step": 154721, "epoch": 3683} {"train_loss": -6.778871536254883, "global_step": 154722, "epoch": 3683} {"train_loss": -6.968716144561768, "global_step": 154723, "epoch": 3683} {"train_loss": -6.93189811706543, "global_step": 154724, "epoch": 3683} {"train_loss": -6.86830997467041, "global_step": 154725, "epoch": 3683} {"train_loss": -6.796291351318359, "global_step": 154726, "epoch": 3683} {"train_loss": -6.86247874441601, "global_step": 154727, "epoch": 3683, "val_loss": 68384.6171875} {"train_loss": -7.064323425292969, "global_step": 154728, "epoch": 3684} {"train_loss": -6.779827117919922, "global_step": 154729, "epoch": 3684} {"train_loss": -6.8998589515686035, "global_step": 154730, "epoch": 3684} {"train_loss": -6.826505661010742, "global_step": 154731, "epoch": 3684} {"train_loss": -6.96539306640625, "global_step": 154732, "epoch": 3684} {"train_loss": -6.93069314956665, "global_step": 154733, "epoch": 3684} {"train_loss": -6.961766242980957, "global_step": 154734, "epoch": 3684} {"train_loss": -6.903702735900879, "global_step": 154735, "epoch": 3684} {"train_loss": -6.964349746704102, "global_step": 154736, "epoch": 3684} {"train_loss": -6.92418098449707, "global_step": 154737, "epoch": 3684} {"train_loss": -6.924287796020508, "global_step": 154738, "epoch": 3684} {"train_loss": -6.829276084899902, "global_step": 154739, "epoch": 3684} {"train_loss": -6.821155071258545, "global_step": 154740, "epoch": 3684} {"train_loss": -6.889799118041992, "global_step": 154741, "epoch": 3684} {"train_loss": -6.7503156661987305, "global_step": 154742, "epoch": 3684} {"train_loss": -6.844754219055176, "global_step": 154743, "epoch": 3684} {"train_loss": -6.951190948486328, "global_step": 154744, "epoch": 3684} {"train_loss": -6.89539909362793, "global_step": 154745, "epoch": 3684} {"train_loss": -6.9100213050842285, "global_step": 154746, "epoch": 3684} {"train_loss": -6.804749011993408, "global_step": 154747, "epoch": 3684} {"train_loss": -6.951577186584473, "global_step": 154748, "epoch": 3684} {"train_loss": -6.727731227874756, "global_step": 154749, "epoch": 3684} {"train_loss": -6.881201267242432, "global_step": 154750, "epoch": 3684} {"train_loss": -6.769955635070801, "global_step": 154751, "epoch": 3684} {"train_loss": -6.879083633422852, "global_step": 154752, "epoch": 3684} {"train_loss": -6.764654159545898, "global_step": 154753, "epoch": 3684} {"train_loss": -6.844768524169922, "global_step": 154754, "epoch": 3684} {"train_loss": -6.890244960784912, "global_step": 154755, "epoch": 3684} {"train_loss": -6.780593395233154, "global_step": 154756, "epoch": 3684} {"train_loss": -6.9516496658325195, "global_step": 154757, "epoch": 3684} {"train_loss": -6.696855545043945, "global_step": 154758, "epoch": 3684} {"train_loss": -6.8819475173950195, "global_step": 154759, "epoch": 3684} {"train_loss": -6.831423759460449, "global_step": 154760, "epoch": 3684} {"train_loss": -6.723478317260742, "global_step": 154761, "epoch": 3684} {"train_loss": -6.891844749450684, "global_step": 154762, "epoch": 3684} {"train_loss": -6.811344146728516, "global_step": 154763, "epoch": 3684} {"train_loss": -6.863584041595459, "global_step": 154764, "epoch": 3684} {"train_loss": -6.859157562255859, "global_step": 154765, "epoch": 3684} {"train_loss": -6.7567219734191895, "global_step": 154766, "epoch": 3684} {"train_loss": -6.7446393966674805, "global_step": 154767, "epoch": 3684} {"train_loss": -6.796462059020996, "global_step": 154768, "epoch": 3684} {"train_loss": -6.85852787608192, "global_step": 154769, "epoch": 3684, "val_loss": 68408.859375} {"train_loss": -6.834135055541992, "global_step": 154770, "epoch": 3685} {"train_loss": -6.871319770812988, "global_step": 154771, "epoch": 3685} {"train_loss": -6.820066452026367, "global_step": 154772, "epoch": 3685} {"train_loss": -6.939847946166992, "global_step": 154773, "epoch": 3685} {"train_loss": -6.796496391296387, "global_step": 154774, "epoch": 3685} {"train_loss": -6.860312461853027, "global_step": 154775, "epoch": 3685} {"train_loss": -6.999258041381836, "global_step": 154776, "epoch": 3685} {"train_loss": -6.839929580688477, "global_step": 154777, "epoch": 3685} {"train_loss": -6.875367164611816, "global_step": 154778, "epoch": 3685} {"train_loss": -6.935810565948486, "global_step": 154779, "epoch": 3685} {"train_loss": -6.672499656677246, "global_step": 154780, "epoch": 3685} {"train_loss": -6.895216464996338, "global_step": 154781, "epoch": 3685} {"train_loss": -6.713983535766602, "global_step": 154782, "epoch": 3685} {"train_loss": -6.782406330108643, "global_step": 154783, "epoch": 3685} {"train_loss": -6.874614715576172, "global_step": 154784, "epoch": 3685} {"train_loss": -6.643825054168701, "global_step": 154785, "epoch": 3685} {"train_loss": -6.886981964111328, "global_step": 154786, "epoch": 3685} {"train_loss": -6.81178617477417, "global_step": 154787, "epoch": 3685} {"train_loss": -6.910364151000977, "global_step": 154788, "epoch": 3685} {"train_loss": -6.889433860778809, "global_step": 154789, "epoch": 3685} {"train_loss": -6.8694281578063965, "global_step": 154790, "epoch": 3685} {"train_loss": -6.900737285614014, "global_step": 154791, "epoch": 3685} {"train_loss": -6.814343452453613, "global_step": 154792, "epoch": 3685} {"train_loss": -6.840819835662842, "global_step": 154793, "epoch": 3685} {"train_loss": -6.908312797546387, "global_step": 154794, "epoch": 3685} {"train_loss": -6.894018650054932, "global_step": 154795, "epoch": 3685} {"train_loss": -6.9572906494140625, "global_step": 154796, "epoch": 3685} {"train_loss": -6.907039642333984, "global_step": 154797, "epoch": 3685} {"train_loss": -6.922442436218262, "global_step": 154798, "epoch": 3685} {"train_loss": -6.939334869384766, "global_step": 154799, "epoch": 3685} {"train_loss": -6.936016082763672, "global_step": 154800, "epoch": 3685} {"train_loss": -6.779884338378906, "global_step": 154801, "epoch": 3685} {"train_loss": -6.81688928604126, "global_step": 154802, "epoch": 3685} {"train_loss": -6.9047698974609375, "global_step": 154803, "epoch": 3685} {"train_loss": -6.82759952545166, "global_step": 154804, "epoch": 3685} {"train_loss": -6.796886920928955, "global_step": 154805, "epoch": 3685} {"train_loss": -6.84721040725708, "global_step": 154806, "epoch": 3685} {"train_loss": -6.858009338378906, "global_step": 154807, "epoch": 3685} {"train_loss": -6.829236030578613, "global_step": 154808, "epoch": 3685} {"train_loss": -6.92694616317749, "global_step": 154809, "epoch": 3685} {"train_loss": -6.8185529708862305, "global_step": 154810, "epoch": 3685} {"train_loss": -6.857247715904599, "global_step": 154811, "epoch": 3685, "val_loss": 68327.7890625} {"train_loss": -6.813971996307373, "global_step": 154812, "epoch": 3686} {"train_loss": -6.8231024742126465, "global_step": 154813, "epoch": 3686} {"train_loss": -6.8893561363220215, "global_step": 154814, "epoch": 3686} {"train_loss": -6.919100284576416, "global_step": 154815, "epoch": 3686} {"train_loss": -6.819883346557617, "global_step": 154816, "epoch": 3686} {"train_loss": -6.923601150512695, "global_step": 154817, "epoch": 3686} {"train_loss": -6.87957763671875, "global_step": 154818, "epoch": 3686} {"train_loss": -6.79166841506958, "global_step": 154819, "epoch": 3686} {"train_loss": -6.924437046051025, "global_step": 154820, "epoch": 3686} {"train_loss": -6.831220626831055, "global_step": 154821, "epoch": 3686} {"train_loss": -6.884362697601318, "global_step": 154822, "epoch": 3686} {"train_loss": -6.9699625968933105, "global_step": 154823, "epoch": 3686} {"train_loss": -6.7057414054870605, "global_step": 154824, "epoch": 3686} {"train_loss": -6.7978668212890625, "global_step": 154825, "epoch": 3686} {"train_loss": -6.837737083435059, "global_step": 154826, "epoch": 3686} {"train_loss": -6.801732063293457, "global_step": 154827, "epoch": 3686} {"train_loss": -6.756505966186523, "global_step": 154828, "epoch": 3686} {"train_loss": -6.8072614669799805, "global_step": 154829, "epoch": 3686} {"train_loss": -6.928973197937012, "global_step": 154830, "epoch": 3686} {"train_loss": -6.924826622009277, "global_step": 154831, "epoch": 3686} {"train_loss": -6.89488410949707, "global_step": 154832, "epoch": 3686} {"train_loss": -6.818934440612793, "global_step": 154833, "epoch": 3686} {"train_loss": -6.888786792755127, "global_step": 154834, "epoch": 3686} {"train_loss": -6.91486930847168, "global_step": 154835, "epoch": 3686} {"train_loss": -6.885157585144043, "global_step": 154836, "epoch": 3686} {"train_loss": -6.811427593231201, "global_step": 154837, "epoch": 3686} {"train_loss": -6.863564491271973, "global_step": 154838, "epoch": 3686} {"train_loss": -6.890761375427246, "global_step": 154839, "epoch": 3686} {"train_loss": -6.788180828094482, "global_step": 154840, "epoch": 3686} {"train_loss": -6.949044227600098, "global_step": 154841, "epoch": 3686} {"train_loss": -6.795902729034424, "global_step": 154842, "epoch": 3686} {"train_loss": -6.875236511230469, "global_step": 154843, "epoch": 3686} {"train_loss": -6.965921401977539, "global_step": 154844, "epoch": 3686} {"train_loss": -6.942111015319824, "global_step": 154845, "epoch": 3686} {"train_loss": -6.991547584533691, "global_step": 154846, "epoch": 3686} {"train_loss": -7.003615379333496, "global_step": 154847, "epoch": 3686} {"train_loss": -6.939883232116699, "global_step": 154848, "epoch": 3686} {"train_loss": -6.8751702308654785, "global_step": 154849, "epoch": 3686} {"train_loss": -6.900291919708252, "global_step": 154850, "epoch": 3686} {"train_loss": -6.876059055328369, "global_step": 154851, "epoch": 3686} {"train_loss": -6.860028266906738, "global_step": 154852, "epoch": 3686} {"train_loss": -6.874040228979928, "global_step": 154853, "epoch": 3686, "val_loss": 68358.3515625} {"train_loss": -6.9606218338012695, "global_step": 154854, "epoch": 3687} {"train_loss": -6.998369216918945, "global_step": 154855, "epoch": 3687} {"train_loss": -7.023378372192383, "global_step": 154856, "epoch": 3687} {"train_loss": -6.890954971313477, "global_step": 154857, "epoch": 3687} {"train_loss": -6.957686901092529, "global_step": 154858, "epoch": 3687} {"train_loss": -6.88548469543457, "global_step": 154859, "epoch": 3687} {"train_loss": -6.816950798034668, "global_step": 154860, "epoch": 3687} {"train_loss": -6.84498405456543, "global_step": 154861, "epoch": 3687} {"train_loss": -6.884773254394531, "global_step": 154862, "epoch": 3687} {"train_loss": -6.9369707107543945, "global_step": 154863, "epoch": 3687} {"train_loss": -6.780811309814453, "global_step": 154864, "epoch": 3687} {"train_loss": -6.858123779296875, "global_step": 154865, "epoch": 3687} {"train_loss": -6.8770036697387695, "global_step": 154866, "epoch": 3687} {"train_loss": -6.886662483215332, "global_step": 154867, "epoch": 3687} {"train_loss": -6.960447788238525, "global_step": 154868, "epoch": 3687} {"train_loss": -6.984989166259766, "global_step": 154869, "epoch": 3687} {"train_loss": -6.8274688720703125, "global_step": 154870, "epoch": 3687} {"train_loss": -7.056849479675293, "global_step": 154871, "epoch": 3687} {"train_loss": -6.966659069061279, "global_step": 154872, "epoch": 3687} {"train_loss": -6.911600112915039, "global_step": 154873, "epoch": 3687} {"train_loss": -6.916913032531738, "global_step": 154874, "epoch": 3687} {"train_loss": -6.980918884277344, "global_step": 154875, "epoch": 3687} {"train_loss": -6.851333141326904, "global_step": 154876, "epoch": 3687} {"train_loss": -7.04591178894043, "global_step": 154877, "epoch": 3687} {"train_loss": -6.9559221267700195, "global_step": 154878, "epoch": 3687} {"train_loss": -6.926347732543945, "global_step": 154879, "epoch": 3687} {"train_loss": -6.955132007598877, "global_step": 154880, "epoch": 3687} {"train_loss": -6.945289611816406, "global_step": 154881, "epoch": 3687} {"train_loss": -7.071178436279297, "global_step": 154882, "epoch": 3687} {"train_loss": -6.90506649017334, "global_step": 154883, "epoch": 3687} {"train_loss": -6.81276798248291, "global_step": 154884, "epoch": 3687} {"train_loss": -7.116061687469482, "global_step": 154885, "epoch": 3687} {"train_loss": -6.955302715301514, "global_step": 154886, "epoch": 3687} {"train_loss": -6.988421440124512, "global_step": 154887, "epoch": 3687} {"train_loss": -6.9464826583862305, "global_step": 154888, "epoch": 3687} {"train_loss": -6.88286018371582, "global_step": 154889, "epoch": 3687} {"train_loss": -6.925280570983887, "global_step": 154890, "epoch": 3687} {"train_loss": -6.842602729797363, "global_step": 154891, "epoch": 3687} {"train_loss": -6.935640811920166, "global_step": 154892, "epoch": 3687} {"train_loss": -6.806634426116943, "global_step": 154893, "epoch": 3687} {"train_loss": -6.962684154510498, "global_step": 154894, "epoch": 3687} {"train_loss": -6.9282979511079335, "global_step": 154895, "epoch": 3687, "val_loss": 68340.453125} {"train_loss": -6.772542953491211, "global_step": 154896, "epoch": 3688} {"train_loss": -6.940288543701172, "global_step": 154897, "epoch": 3688} {"train_loss": -7.047982215881348, "global_step": 154898, "epoch": 3688} {"train_loss": -6.865610122680664, "global_step": 154899, "epoch": 3688} {"train_loss": -6.919887542724609, "global_step": 154900, "epoch": 3688} {"train_loss": -7.025453567504883, "global_step": 154901, "epoch": 3688} {"train_loss": -6.963652610778809, "global_step": 154902, "epoch": 3688} {"train_loss": -6.894330024719238, "global_step": 154903, "epoch": 3688} {"train_loss": -6.971048831939697, "global_step": 154904, "epoch": 3688} {"train_loss": -6.938421249389648, "global_step": 154905, "epoch": 3688} {"train_loss": -6.969903945922852, "global_step": 154906, "epoch": 3688} {"train_loss": -6.9474334716796875, "global_step": 154907, "epoch": 3688} {"train_loss": -6.863959789276123, "global_step": 154908, "epoch": 3688} {"train_loss": -6.870777130126953, "global_step": 154909, "epoch": 3688} {"train_loss": -6.7374982833862305, "global_step": 154910, "epoch": 3688} {"train_loss": -6.776102066040039, "global_step": 154911, "epoch": 3688} {"train_loss": -6.818160057067871, "global_step": 154912, "epoch": 3688} {"train_loss": -6.857601165771484, "global_step": 154913, "epoch": 3688} {"train_loss": -6.869410991668701, "global_step": 154914, "epoch": 3688} {"train_loss": -6.77124547958374, "global_step": 154915, "epoch": 3688} {"train_loss": -6.7215423583984375, "global_step": 154916, "epoch": 3688} {"train_loss": -6.923404693603516, "global_step": 154917, "epoch": 3688} {"train_loss": -6.718690872192383, "global_step": 154918, "epoch": 3688} {"train_loss": -6.820727825164795, "global_step": 154919, "epoch": 3688} {"train_loss": -6.9242963790893555, "global_step": 154920, "epoch": 3688} {"train_loss": -6.8582329750061035, "global_step": 154921, "epoch": 3688} {"train_loss": -6.814194679260254, "global_step": 154922, "epoch": 3688} {"train_loss": -7.000849723815918, "global_step": 154923, "epoch": 3688} {"train_loss": -6.793940544128418, "global_step": 154924, "epoch": 3688} {"train_loss": -6.918168544769287, "global_step": 154925, "epoch": 3688} {"train_loss": -6.82326602935791, "global_step": 154926, "epoch": 3688} {"train_loss": -6.982219219207764, "global_step": 154927, "epoch": 3688} {"train_loss": -6.93381404876709, "global_step": 154928, "epoch": 3688} {"train_loss": -6.837677478790283, "global_step": 154929, "epoch": 3688} {"train_loss": -6.97592830657959, "global_step": 154930, "epoch": 3688} {"train_loss": -6.836776256561279, "global_step": 154931, "epoch": 3688} {"train_loss": -6.8743133544921875, "global_step": 154932, "epoch": 3688} {"train_loss": -6.893539905548096, "global_step": 154933, "epoch": 3688} {"train_loss": -6.8940653800964355, "global_step": 154934, "epoch": 3688} {"train_loss": -6.825117111206055, "global_step": 154935, "epoch": 3688} {"train_loss": -6.988683223724365, "global_step": 154936, "epoch": 3688} {"train_loss": -6.877233573368618, "global_step": 154937, "epoch": 3688, "val_loss": 68296.8125} {"train_loss": -6.855480670928955, "global_step": 154938, "epoch": 3689} {"train_loss": -6.960635662078857, "global_step": 154939, "epoch": 3689} {"train_loss": -6.888058185577393, "global_step": 154940, "epoch": 3689} {"train_loss": -6.9564337730407715, "global_step": 154941, "epoch": 3689} {"train_loss": -6.8668107986450195, "global_step": 154942, "epoch": 3689} {"train_loss": -6.9342756271362305, "global_step": 154943, "epoch": 3689} {"train_loss": -7.098077774047852, "global_step": 154944, "epoch": 3689} {"train_loss": -6.891461372375488, "global_step": 154945, "epoch": 3689} {"train_loss": -6.983631134033203, "global_step": 154946, "epoch": 3689} {"train_loss": -6.923609256744385, "global_step": 154947, "epoch": 3689} {"train_loss": -7.003727436065674, "global_step": 154948, "epoch": 3689} {"train_loss": -6.973926067352295, "global_step": 154949, "epoch": 3689} {"train_loss": -6.921447277069092, "global_step": 154950, "epoch": 3689} {"train_loss": -6.909704208374023, "global_step": 154951, "epoch": 3689} {"train_loss": -6.896645545959473, "global_step": 154952, "epoch": 3689} {"train_loss": -6.931585311889648, "global_step": 154953, "epoch": 3689} {"train_loss": -6.860421180725098, "global_step": 154954, "epoch": 3689} {"train_loss": -6.874870300292969, "global_step": 154955, "epoch": 3689} {"train_loss": -6.895282745361328, "global_step": 154956, "epoch": 3689} {"train_loss": -6.743185997009277, "global_step": 154957, "epoch": 3689} {"train_loss": -6.72100830078125, "global_step": 154958, "epoch": 3689} {"train_loss": -6.921649932861328, "global_step": 154959, "epoch": 3689} {"train_loss": -6.858730792999268, "global_step": 154960, "epoch": 3689} {"train_loss": -6.752738952636719, "global_step": 154961, "epoch": 3689} {"train_loss": -6.766393661499023, "global_step": 154962, "epoch": 3689} {"train_loss": -6.718730926513672, "global_step": 154963, "epoch": 3689} {"train_loss": -6.607657432556152, "global_step": 154964, "epoch": 3689} {"train_loss": -6.823426246643066, "global_step": 154965, "epoch": 3689} {"train_loss": -6.598034381866455, "global_step": 154966, "epoch": 3689} {"train_loss": -6.935797691345215, "global_step": 154967, "epoch": 3689} {"train_loss": -6.797060012817383, "global_step": 154968, "epoch": 3689} {"train_loss": -6.867305755615234, "global_step": 154969, "epoch": 3689} {"train_loss": -6.802468299865723, "global_step": 154970, "epoch": 3689} {"train_loss": -6.700750827789307, "global_step": 154971, "epoch": 3689} {"train_loss": -6.9145026206970215, "global_step": 154972, "epoch": 3689} {"train_loss": -6.634286403656006, "global_step": 154973, "epoch": 3689} {"train_loss": -6.768007278442383, "global_step": 154974, "epoch": 3689} {"train_loss": -6.762238502502441, "global_step": 154975, "epoch": 3689} {"train_loss": -6.873921871185303, "global_step": 154976, "epoch": 3689} {"train_loss": -6.819589614868164, "global_step": 154977, "epoch": 3689} {"train_loss": -6.791452407836914, "global_step": 154978, "epoch": 3689} {"train_loss": -6.849447273072743, "global_step": 154979, "epoch": 3689, "val_loss": 68288.0078125} {"train_loss": -6.786144256591797, "global_step": 154980, "epoch": 3690} {"train_loss": -6.8009138107299805, "global_step": 154981, "epoch": 3690} {"train_loss": -6.921725273132324, "global_step": 154982, "epoch": 3690} {"train_loss": -6.775760650634766, "global_step": 154983, "epoch": 3690} {"train_loss": -6.795480728149414, "global_step": 154984, "epoch": 3690} {"train_loss": -6.864372253417969, "global_step": 154985, "epoch": 3690} {"train_loss": -6.829171180725098, "global_step": 154986, "epoch": 3690} {"train_loss": -6.956456661224365, "global_step": 154987, "epoch": 3690} {"train_loss": -6.913517951965332, "global_step": 154988, "epoch": 3690} {"train_loss": -6.8657121658325195, "global_step": 154989, "epoch": 3690} {"train_loss": -6.975996971130371, "global_step": 154990, "epoch": 3690} {"train_loss": -6.885913848876953, "global_step": 154991, "epoch": 3690} {"train_loss": -6.917130470275879, "global_step": 154992, "epoch": 3690} {"train_loss": -7.040957927703857, "global_step": 154993, "epoch": 3690} {"train_loss": -6.83139705657959, "global_step": 154994, "epoch": 3690} {"train_loss": -6.88767147064209, "global_step": 154995, "epoch": 3690} {"train_loss": -6.965071678161621, "global_step": 154996, "epoch": 3690} {"train_loss": -6.937636852264404, "global_step": 154997, "epoch": 3690} {"train_loss": -6.884128570556641, "global_step": 154998, "epoch": 3690} {"train_loss": -7.029293537139893, "global_step": 154999, "epoch": 3690} {"train_loss": -6.9664506912231445, "global_step": 155000, "epoch": 3690} {"train_loss": -6.851588249206543, "global_step": 155001, "epoch": 3690} {"train_loss": -6.914503574371338, "global_step": 155002, "epoch": 3690} {"train_loss": -7.017536163330078, "global_step": 155003, "epoch": 3690} {"train_loss": -6.869035720825195, "global_step": 155004, "epoch": 3690} {"train_loss": -6.938394546508789, "global_step": 155005, "epoch": 3690} {"train_loss": -6.890145301818848, "global_step": 155006, "epoch": 3690} {"train_loss": -6.906535625457764, "global_step": 155007, "epoch": 3690} {"train_loss": -6.902617931365967, "global_step": 155008, "epoch": 3690} {"train_loss": -6.782837390899658, "global_step": 155009, "epoch": 3690} {"train_loss": -6.947556018829346, "global_step": 155010, "epoch": 3690} {"train_loss": -6.951864242553711, "global_step": 155011, "epoch": 3690} {"train_loss": -6.9124298095703125, "global_step": 155012, "epoch": 3690} {"train_loss": -6.872463226318359, "global_step": 155013, "epoch": 3690} {"train_loss": -6.84892463684082, "global_step": 155014, "epoch": 3690} {"train_loss": -6.791409492492676, "global_step": 155015, "epoch": 3690} {"train_loss": -6.829814434051514, "global_step": 155016, "epoch": 3690} {"train_loss": -6.942333698272705, "global_step": 155017, "epoch": 3690} {"train_loss": -6.9094743728637695, "global_step": 155018, "epoch": 3690} {"train_loss": -6.859518527984619, "global_step": 155019, "epoch": 3690} {"train_loss": -7.010599136352539, "global_step": 155020, "epoch": 3690} {"train_loss": -6.895245324997675, "global_step": 155021, "epoch": 3690, "val_loss": 68385.5859375} {"train_loss": -6.928736686706543, "global_step": 155022, "epoch": 3691} {"train_loss": -6.93506383895874, "global_step": 155023, "epoch": 3691} {"train_loss": -6.983759880065918, "global_step": 155024, "epoch": 3691} {"train_loss": -6.984715461730957, "global_step": 155025, "epoch": 3691} {"train_loss": -6.962862968444824, "global_step": 155026, "epoch": 3691} {"train_loss": -6.859928131103516, "global_step": 155027, "epoch": 3691} {"train_loss": -6.95490026473999, "global_step": 155028, "epoch": 3691} {"train_loss": -6.8176984786987305, "global_step": 155029, "epoch": 3691} {"train_loss": -6.885950088500977, "global_step": 155030, "epoch": 3691} {"train_loss": -7.013716697692871, "global_step": 155031, "epoch": 3691} {"train_loss": -6.9329633712768555, "global_step": 155032, "epoch": 3691} {"train_loss": -6.887088298797607, "global_step": 155033, "epoch": 3691} {"train_loss": -6.919832706451416, "global_step": 155034, "epoch": 3691} {"train_loss": -6.917779922485352, "global_step": 155035, "epoch": 3691} {"train_loss": -6.840206146240234, "global_step": 155036, "epoch": 3691} {"train_loss": -6.951846122741699, "global_step": 155037, "epoch": 3691} {"train_loss": -6.8632001876831055, "global_step": 155038, "epoch": 3691} {"train_loss": -6.905819892883301, "global_step": 155039, "epoch": 3691} {"train_loss": -7.001474380493164, "global_step": 155040, "epoch": 3691} {"train_loss": -6.926455497741699, "global_step": 155041, "epoch": 3691} {"train_loss": -6.929205894470215, "global_step": 155042, "epoch": 3691} {"train_loss": -6.837413787841797, "global_step": 155043, "epoch": 3691} {"train_loss": -6.82687520980835, "global_step": 155044, "epoch": 3691} {"train_loss": -6.871777534484863, "global_step": 155045, "epoch": 3691} {"train_loss": -6.880894660949707, "global_step": 155046, "epoch": 3691} {"train_loss": -6.843682289123535, "global_step": 155047, "epoch": 3691} {"train_loss": -6.861016273498535, "global_step": 155048, "epoch": 3691} {"train_loss": -6.890570163726807, "global_step": 155049, "epoch": 3691} {"train_loss": -6.955343723297119, "global_step": 155050, "epoch": 3691} {"train_loss": -6.694128513336182, "global_step": 155051, "epoch": 3691} {"train_loss": -6.831145286560059, "global_step": 155052, "epoch": 3691} {"train_loss": -6.85671329498291, "global_step": 155053, "epoch": 3691} {"train_loss": -6.896577835083008, "global_step": 155054, "epoch": 3691} {"train_loss": -6.947954177856445, "global_step": 155055, "epoch": 3691} {"train_loss": -6.876919746398926, "global_step": 155056, "epoch": 3691} {"train_loss": -6.820799827575684, "global_step": 155057, "epoch": 3691} {"train_loss": -6.635335445404053, "global_step": 155058, "epoch": 3691} {"train_loss": -6.858709335327148, "global_step": 155059, "epoch": 3691} {"train_loss": -6.9690446853637695, "global_step": 155060, "epoch": 3691} {"train_loss": -6.867070198059082, "global_step": 155061, "epoch": 3691} {"train_loss": -6.863985061645508, "global_step": 155062, "epoch": 3691} {"train_loss": -6.888763632093157, "global_step": 155063, "epoch": 3691, "val_loss": 68280.671875} {"train_loss": -6.911532878875732, "global_step": 155064, "epoch": 3692} {"train_loss": -6.85233211517334, "global_step": 155065, "epoch": 3692} {"train_loss": -6.830000877380371, "global_step": 155066, "epoch": 3692} {"train_loss": -6.954652786254883, "global_step": 155067, "epoch": 3692} {"train_loss": -6.961102485656738, "global_step": 155068, "epoch": 3692} {"train_loss": -6.879284858703613, "global_step": 155069, "epoch": 3692} {"train_loss": -6.871649265289307, "global_step": 155070, "epoch": 3692} {"train_loss": -6.97515344619751, "global_step": 155071, "epoch": 3692} {"train_loss": -7.0764360427856445, "global_step": 155072, "epoch": 3692} {"train_loss": -6.811790466308594, "global_step": 155073, "epoch": 3692} {"train_loss": -6.947759628295898, "global_step": 155074, "epoch": 3692} {"train_loss": -6.948311805725098, "global_step": 155075, "epoch": 3692} {"train_loss": -6.8407487869262695, "global_step": 155076, "epoch": 3692} {"train_loss": -6.983590126037598, "global_step": 155077, "epoch": 3692} {"train_loss": -6.907536029815674, "global_step": 155078, "epoch": 3692} {"train_loss": -7.004454612731934, "global_step": 155079, "epoch": 3692} {"train_loss": -6.892557144165039, "global_step": 155080, "epoch": 3692} {"train_loss": -6.906866073608398, "global_step": 155081, "epoch": 3692} {"train_loss": -6.91886043548584, "global_step": 155082, "epoch": 3692} {"train_loss": -6.824873924255371, "global_step": 155083, "epoch": 3692} {"train_loss": -6.995660781860352, "global_step": 155084, "epoch": 3692} {"train_loss": -6.905269622802734, "global_step": 155085, "epoch": 3692} {"train_loss": -6.918285369873047, "global_step": 155086, "epoch": 3692} {"train_loss": -6.98022985458374, "global_step": 155087, "epoch": 3692} {"train_loss": -6.960482120513916, "global_step": 155088, "epoch": 3692} {"train_loss": -6.976889133453369, "global_step": 155089, "epoch": 3692} {"train_loss": -6.860118865966797, "global_step": 155090, "epoch": 3692} {"train_loss": -6.867008209228516, "global_step": 155091, "epoch": 3692} {"train_loss": -6.869967460632324, "global_step": 155092, "epoch": 3692} {"train_loss": -6.786464691162109, "global_step": 155093, "epoch": 3692} {"train_loss": -6.850935459136963, "global_step": 155094, "epoch": 3692} {"train_loss": -7.037530899047852, "global_step": 155095, "epoch": 3692} {"train_loss": -6.964932441711426, "global_step": 155096, "epoch": 3692} {"train_loss": -6.835793972015381, "global_step": 155097, "epoch": 3692} {"train_loss": -6.915186882019043, "global_step": 155098, "epoch": 3692} {"train_loss": -6.904273986816406, "global_step": 155099, "epoch": 3692} {"train_loss": -6.810210227966309, "global_step": 155100, "epoch": 3692} {"train_loss": -6.924628257751465, "global_step": 155101, "epoch": 3692} {"train_loss": -6.869509696960449, "global_step": 155102, "epoch": 3692} {"train_loss": -6.91385555267334, "global_step": 155103, "epoch": 3692} {"train_loss": -6.821375846862793, "global_step": 155104, "epoch": 3692} {"train_loss": -6.908195631844657, "global_step": 155105, "epoch": 3692, "val_loss": 68305.4375} {"train_loss": -6.865540504455566, "global_step": 155106, "epoch": 3693} {"train_loss": -6.963983535766602, "global_step": 155107, "epoch": 3693} {"train_loss": -7.000920295715332, "global_step": 155108, "epoch": 3693} {"train_loss": -6.960000038146973, "global_step": 155109, "epoch": 3693} {"train_loss": -6.904569149017334, "global_step": 155110, "epoch": 3693} {"train_loss": -6.900791645050049, "global_step": 155111, "epoch": 3693} {"train_loss": -6.833530426025391, "global_step": 155112, "epoch": 3693} {"train_loss": -6.925505638122559, "global_step": 155113, "epoch": 3693} {"train_loss": -6.904013633728027, "global_step": 155114, "epoch": 3693} {"train_loss": -6.99753999710083, "global_step": 155115, "epoch": 3693} {"train_loss": -6.837002754211426, "global_step": 155116, "epoch": 3693} {"train_loss": -6.861632823944092, "global_step": 155117, "epoch": 3693} {"train_loss": -6.877994060516357, "global_step": 155118, "epoch": 3693} {"train_loss": -6.78908634185791, "global_step": 155119, "epoch": 3693} {"train_loss": -6.956753253936768, "global_step": 155120, "epoch": 3693} {"train_loss": -6.971940517425537, "global_step": 155121, "epoch": 3693} {"train_loss": -6.914162635803223, "global_step": 155122, "epoch": 3693} {"train_loss": -6.875786781311035, "global_step": 155123, "epoch": 3693} {"train_loss": -6.811561584472656, "global_step": 155124, "epoch": 3693} {"train_loss": -6.898610591888428, "global_step": 155125, "epoch": 3693} {"train_loss": -6.964404582977295, "global_step": 155126, "epoch": 3693} {"train_loss": -6.909104824066162, "global_step": 155127, "epoch": 3693} {"train_loss": -6.8875203132629395, "global_step": 155128, "epoch": 3693} {"train_loss": -6.9575090408325195, "global_step": 155129, "epoch": 3693} {"train_loss": -6.826555252075195, "global_step": 155130, "epoch": 3693} {"train_loss": -6.760425567626953, "global_step": 155131, "epoch": 3693} {"train_loss": -6.899478912353516, "global_step": 155132, "epoch": 3693} {"train_loss": -6.841205596923828, "global_step": 155133, "epoch": 3693} {"train_loss": -6.816066265106201, "global_step": 155134, "epoch": 3693} {"train_loss": -6.858952522277832, "global_step": 155135, "epoch": 3693} {"train_loss": -6.811142444610596, "global_step": 155136, "epoch": 3693} {"train_loss": -6.889829158782959, "global_step": 155137, "epoch": 3693} {"train_loss": -6.810210227966309, "global_step": 155138, "epoch": 3693} {"train_loss": -6.854225158691406, "global_step": 155139, "epoch": 3693} {"train_loss": -6.781091690063477, "global_step": 155140, "epoch": 3693} {"train_loss": -6.90374755859375, "global_step": 155141, "epoch": 3693} {"train_loss": -7.041777610778809, "global_step": 155142, "epoch": 3693} {"train_loss": -6.832859992980957, "global_step": 155143, "epoch": 3693} {"train_loss": -6.869014263153076, "global_step": 155144, "epoch": 3693} {"train_loss": -6.871162414550781, "global_step": 155145, "epoch": 3693} {"train_loss": -6.854561805725098, "global_step": 155146, "epoch": 3693} {"train_loss": -6.884982971918015, "global_step": 155147, "epoch": 3693, "val_loss": 68194.5703125} {"train_loss": -6.85835075378418, "global_step": 155148, "epoch": 3694} {"train_loss": -6.904209613800049, "global_step": 155149, "epoch": 3694} {"train_loss": -6.774223327636719, "global_step": 155150, "epoch": 3694} {"train_loss": -6.948823928833008, "global_step": 155151, "epoch": 3694} {"train_loss": -6.882019996643066, "global_step": 155152, "epoch": 3694} {"train_loss": -6.7872772216796875, "global_step": 155153, "epoch": 3694} {"train_loss": -7.031954765319824, "global_step": 155154, "epoch": 3694} {"train_loss": -7.0036444664001465, "global_step": 155155, "epoch": 3694} {"train_loss": -6.961214065551758, "global_step": 155156, "epoch": 3694} {"train_loss": -7.007049083709717, "global_step": 155157, "epoch": 3694} {"train_loss": -6.85379695892334, "global_step": 155158, "epoch": 3694} {"train_loss": -6.817656993865967, "global_step": 155159, "epoch": 3694} {"train_loss": -6.913097381591797, "global_step": 155160, "epoch": 3694} {"train_loss": -6.883652687072754, "global_step": 155161, "epoch": 3694} {"train_loss": -6.8674421310424805, "global_step": 155162, "epoch": 3694} {"train_loss": -6.90474271774292, "global_step": 155163, "epoch": 3694} {"train_loss": -6.917004585266113, "global_step": 155164, "epoch": 3694} {"train_loss": -6.874532699584961, "global_step": 155165, "epoch": 3694} {"train_loss": -6.8630452156066895, "global_step": 155166, "epoch": 3694} {"train_loss": -7.009147644042969, "global_step": 155167, "epoch": 3694} {"train_loss": -6.834595680236816, "global_step": 155168, "epoch": 3694} {"train_loss": -6.880234718322754, "global_step": 155169, "epoch": 3694} {"train_loss": -6.880919456481934, "global_step": 155170, "epoch": 3694} {"train_loss": -6.848601818084717, "global_step": 155171, "epoch": 3694} {"train_loss": -6.907777786254883, "global_step": 155172, "epoch": 3694} {"train_loss": -6.854190826416016, "global_step": 155173, "epoch": 3694} {"train_loss": -6.798210144042969, "global_step": 155174, "epoch": 3694} {"train_loss": -6.790287017822266, "global_step": 155175, "epoch": 3694} {"train_loss": -6.907342910766602, "global_step": 155176, "epoch": 3694} {"train_loss": -6.875153541564941, "global_step": 155177, "epoch": 3694} {"train_loss": -6.890091896057129, "global_step": 155178, "epoch": 3694} {"train_loss": -6.922176361083984, "global_step": 155179, "epoch": 3694} {"train_loss": -6.8993964195251465, "global_step": 155180, "epoch": 3694} {"train_loss": -6.868791580200195, "global_step": 155181, "epoch": 3694} {"train_loss": -6.903102874755859, "global_step": 155182, "epoch": 3694} {"train_loss": -6.774883270263672, "global_step": 155183, "epoch": 3694} {"train_loss": -6.88865852355957, "global_step": 155184, "epoch": 3694} {"train_loss": -6.828307151794434, "global_step": 155185, "epoch": 3694} {"train_loss": -6.901567459106445, "global_step": 155186, "epoch": 3694} {"train_loss": -7.003249168395996, "global_step": 155187, "epoch": 3694} {"train_loss": -6.805872917175293, "global_step": 155188, "epoch": 3694} {"train_loss": -6.886130991436186, "global_step": 155189, "epoch": 3694, "val_loss": 68270.265625} {"train_loss": -6.848085403442383, "global_step": 155190, "epoch": 3695} {"train_loss": -6.91172981262207, "global_step": 155191, "epoch": 3695} {"train_loss": -6.9570231437683105, "global_step": 155192, "epoch": 3695} {"train_loss": -6.784770488739014, "global_step": 155193, "epoch": 3695} {"train_loss": -6.916430950164795, "global_step": 155194, "epoch": 3695} {"train_loss": -6.907958984375, "global_step": 155195, "epoch": 3695} {"train_loss": -6.914007663726807, "global_step": 155196, "epoch": 3695} {"train_loss": -6.967201232910156, "global_step": 155197, "epoch": 3695} {"train_loss": -6.839147090911865, "global_step": 155198, "epoch": 3695} {"train_loss": -6.835737228393555, "global_step": 155199, "epoch": 3695} {"train_loss": -6.806303024291992, "global_step": 155200, "epoch": 3695} {"train_loss": -6.850739479064941, "global_step": 155201, "epoch": 3695} {"train_loss": -6.968848705291748, "global_step": 155202, "epoch": 3695} {"train_loss": -6.849248886108398, "global_step": 155203, "epoch": 3695} {"train_loss": -6.905227184295654, "global_step": 155204, "epoch": 3695} {"train_loss": -6.863750457763672, "global_step": 155205, "epoch": 3695} {"train_loss": -6.898332595825195, "global_step": 155206, "epoch": 3695} {"train_loss": -6.873823165893555, "global_step": 155207, "epoch": 3695} {"train_loss": -6.88979434967041, "global_step": 155208, "epoch": 3695} {"train_loss": -6.962785720825195, "global_step": 155209, "epoch": 3695} {"train_loss": -6.914242744445801, "global_step": 155210, "epoch": 3695} {"train_loss": -6.894920349121094, "global_step": 155211, "epoch": 3695} {"train_loss": -6.950573921203613, "global_step": 155212, "epoch": 3695} {"train_loss": -6.798650741577148, "global_step": 155213, "epoch": 3695} {"train_loss": -6.976659297943115, "global_step": 155214, "epoch": 3695} {"train_loss": -6.874519348144531, "global_step": 155215, "epoch": 3695} {"train_loss": -6.918613433837891, "global_step": 155216, "epoch": 3695} {"train_loss": -7.030457496643066, "global_step": 155217, "epoch": 3695} {"train_loss": -6.860742092132568, "global_step": 155218, "epoch": 3695} {"train_loss": -6.904689788818359, "global_step": 155219, "epoch": 3695} {"train_loss": -6.925173759460449, "global_step": 155220, "epoch": 3695} {"train_loss": -6.920905590057373, "global_step": 155221, "epoch": 3695} {"train_loss": -6.793276786804199, "global_step": 155222, "epoch": 3695} {"train_loss": -6.997005462646484, "global_step": 155223, "epoch": 3695} {"train_loss": -6.801316261291504, "global_step": 155224, "epoch": 3695} {"train_loss": -6.742303848266602, "global_step": 155225, "epoch": 3695} {"train_loss": -6.918905735015869, "global_step": 155226, "epoch": 3695} {"train_loss": -6.577659606933594, "global_step": 155227, "epoch": 3695} {"train_loss": -6.835758686065674, "global_step": 155228, "epoch": 3695} {"train_loss": -6.74904727935791, "global_step": 155229, "epoch": 3695} {"train_loss": -6.801630020141602, "global_step": 155230, "epoch": 3695} {"train_loss": -6.8771390574319025, "global_step": 155231, "epoch": 3695, "val_loss": 68449.640625} {"train_loss": -6.822319507598877, "global_step": 155232, "epoch": 3696} {"train_loss": -6.946959972381592, "global_step": 155233, "epoch": 3696} {"train_loss": -6.888458251953125, "global_step": 155234, "epoch": 3696} {"train_loss": -6.787232398986816, "global_step": 155235, "epoch": 3696} {"train_loss": -6.919352054595947, "global_step": 155236, "epoch": 3696} {"train_loss": -6.90418815612793, "global_step": 155237, "epoch": 3696} {"train_loss": -6.784847736358643, "global_step": 155238, "epoch": 3696} {"train_loss": -6.896821022033691, "global_step": 155239, "epoch": 3696} {"train_loss": -6.898284912109375, "global_step": 155240, "epoch": 3696} {"train_loss": -6.883886814117432, "global_step": 155241, "epoch": 3696} {"train_loss": -6.768950462341309, "global_step": 155242, "epoch": 3696} {"train_loss": -6.950568675994873, "global_step": 155243, "epoch": 3696} {"train_loss": -6.776092529296875, "global_step": 155244, "epoch": 3696} {"train_loss": -6.861932754516602, "global_step": 155245, "epoch": 3696} {"train_loss": -7.007698059082031, "global_step": 155246, "epoch": 3696} {"train_loss": -6.95469856262207, "global_step": 155247, "epoch": 3696} {"train_loss": -6.903565883636475, "global_step": 155248, "epoch": 3696} {"train_loss": -6.77226448059082, "global_step": 155249, "epoch": 3696} {"train_loss": -6.958526611328125, "global_step": 155250, "epoch": 3696} {"train_loss": -6.868527412414551, "global_step": 155251, "epoch": 3696} {"train_loss": -6.78726053237915, "global_step": 155252, "epoch": 3696} {"train_loss": -6.959987640380859, "global_step": 155253, "epoch": 3696} {"train_loss": -6.8075151443481445, "global_step": 155254, "epoch": 3696} {"train_loss": -6.9036054611206055, "global_step": 155255, "epoch": 3696} {"train_loss": -6.887011528015137, "global_step": 155256, "epoch": 3696} {"train_loss": -6.9555344581604, "global_step": 155257, "epoch": 3696} {"train_loss": -6.923004627227783, "global_step": 155258, "epoch": 3696} {"train_loss": -6.867615699768066, "global_step": 155259, "epoch": 3696} {"train_loss": -6.955740928649902, "global_step": 155260, "epoch": 3696} {"train_loss": -6.804082870483398, "global_step": 155261, "epoch": 3696} {"train_loss": -6.903614044189453, "global_step": 155262, "epoch": 3696} {"train_loss": -6.8897833824157715, "global_step": 155263, "epoch": 3696} {"train_loss": -6.979610919952393, "global_step": 155264, "epoch": 3696} {"train_loss": -6.871253490447998, "global_step": 155265, "epoch": 3696} {"train_loss": -6.861713409423828, "global_step": 155266, "epoch": 3696} {"train_loss": -6.996232509613037, "global_step": 155267, "epoch": 3696} {"train_loss": -6.834251403808594, "global_step": 155268, "epoch": 3696} {"train_loss": -6.914607048034668, "global_step": 155269, "epoch": 3696} {"train_loss": -6.932770729064941, "global_step": 155270, "epoch": 3696} {"train_loss": -6.89858865737915, "global_step": 155271, "epoch": 3696} {"train_loss": -6.952163219451904, "global_step": 155272, "epoch": 3696} {"train_loss": -6.889126573290143, "global_step": 155273, "epoch": 3696, "val_loss": 68314.578125} {"train_loss": -6.993835926055908, "global_step": 155274, "epoch": 3697} {"train_loss": -6.84528923034668, "global_step": 155275, "epoch": 3697} {"train_loss": -7.014819145202637, "global_step": 155276, "epoch": 3697} {"train_loss": -6.753047943115234, "global_step": 155277, "epoch": 3697} {"train_loss": -6.7717390060424805, "global_step": 155278, "epoch": 3697} {"train_loss": -6.993701934814453, "global_step": 155279, "epoch": 3697} {"train_loss": -6.856517791748047, "global_step": 155280, "epoch": 3697} {"train_loss": -6.9722900390625, "global_step": 155281, "epoch": 3697} {"train_loss": -6.870424270629883, "global_step": 155282, "epoch": 3697} {"train_loss": -6.981542587280273, "global_step": 155283, "epoch": 3697} {"train_loss": -6.870552062988281, "global_step": 155284, "epoch": 3697} {"train_loss": -6.884090423583984, "global_step": 155285, "epoch": 3697} {"train_loss": -6.873403072357178, "global_step": 155286, "epoch": 3697} {"train_loss": -6.82464599609375, "global_step": 155287, "epoch": 3697} {"train_loss": -6.8679304122924805, "global_step": 155288, "epoch": 3697} {"train_loss": -6.933146953582764, "global_step": 155289, "epoch": 3697} {"train_loss": -6.993955612182617, "global_step": 155290, "epoch": 3697} {"train_loss": -6.8897600173950195, "global_step": 155291, "epoch": 3697} {"train_loss": -6.954951286315918, "global_step": 155292, "epoch": 3697} {"train_loss": -6.910235404968262, "global_step": 155293, "epoch": 3697} {"train_loss": -6.93289852142334, "global_step": 155294, "epoch": 3697} {"train_loss": -6.925212860107422, "global_step": 155295, "epoch": 3697} {"train_loss": -6.971244812011719, "global_step": 155296, "epoch": 3697} {"train_loss": -6.926916599273682, "global_step": 155297, "epoch": 3697} {"train_loss": -6.832742691040039, "global_step": 155298, "epoch": 3697} {"train_loss": -6.873998641967773, "global_step": 155299, "epoch": 3697} {"train_loss": -6.758380889892578, "global_step": 155300, "epoch": 3697} {"train_loss": -6.901019096374512, "global_step": 155301, "epoch": 3697} {"train_loss": -6.892697334289551, "global_step": 155302, "epoch": 3697} {"train_loss": -6.965654373168945, "global_step": 155303, "epoch": 3697} {"train_loss": -6.865856647491455, "global_step": 155304, "epoch": 3697} {"train_loss": -6.864021301269531, "global_step": 155305, "epoch": 3697} {"train_loss": -6.834546089172363, "global_step": 155306, "epoch": 3697} {"train_loss": -7.04364013671875, "global_step": 155307, "epoch": 3697} {"train_loss": -6.988890647888184, "global_step": 155308, "epoch": 3697} {"train_loss": -6.832956314086914, "global_step": 155309, "epoch": 3697} {"train_loss": -6.879013538360596, "global_step": 155310, "epoch": 3697} {"train_loss": -6.878704071044922, "global_step": 155311, "epoch": 3697} {"train_loss": -6.793520927429199, "global_step": 155312, "epoch": 3697} {"train_loss": -6.996054649353027, "global_step": 155313, "epoch": 3697} {"train_loss": -6.792340278625488, "global_step": 155314, "epoch": 3697} {"train_loss": -6.891932839439029, "global_step": 155315, "epoch": 3697, "val_loss": 68376.484375} {"train_loss": -6.939262866973877, "global_step": 155316, "epoch": 3698} {"train_loss": -6.908935546875, "global_step": 155317, "epoch": 3698} {"train_loss": -6.864199638366699, "global_step": 155318, "epoch": 3698} {"train_loss": -6.9857354164123535, "global_step": 155319, "epoch": 3698} {"train_loss": -6.838790416717529, "global_step": 155320, "epoch": 3698} {"train_loss": -6.874385833740234, "global_step": 155321, "epoch": 3698} {"train_loss": -6.869479656219482, "global_step": 155322, "epoch": 3698} {"train_loss": -6.879855155944824, "global_step": 155323, "epoch": 3698} {"train_loss": -6.848824501037598, "global_step": 155324, "epoch": 3698} {"train_loss": -6.830343246459961, "global_step": 155325, "epoch": 3698} {"train_loss": -6.860910415649414, "global_step": 155326, "epoch": 3698} {"train_loss": -6.952933311462402, "global_step": 155327, "epoch": 3698} {"train_loss": -6.871990203857422, "global_step": 155328, "epoch": 3698} {"train_loss": -6.835701942443848, "global_step": 155329, "epoch": 3698} {"train_loss": -6.908974647521973, "global_step": 155330, "epoch": 3698} {"train_loss": -6.827317714691162, "global_step": 155331, "epoch": 3698} {"train_loss": -7.001563549041748, "global_step": 155332, "epoch": 3698} {"train_loss": -6.868958950042725, "global_step": 155333, "epoch": 3698} {"train_loss": -6.979238033294678, "global_step": 155334, "epoch": 3698} {"train_loss": -6.870299339294434, "global_step": 155335, "epoch": 3698} {"train_loss": -6.942838668823242, "global_step": 155336, "epoch": 3698} {"train_loss": -6.933661460876465, "global_step": 155337, "epoch": 3698} {"train_loss": -6.806778907775879, "global_step": 155338, "epoch": 3698} {"train_loss": -6.776097297668457, "global_step": 155339, "epoch": 3698} {"train_loss": -6.890865802764893, "global_step": 155340, "epoch": 3698} {"train_loss": -6.873010158538818, "global_step": 155341, "epoch": 3698} {"train_loss": -6.859392166137695, "global_step": 155342, "epoch": 3698} {"train_loss": -6.9609222412109375, "global_step": 155343, "epoch": 3698} {"train_loss": -6.889995574951172, "global_step": 155344, "epoch": 3698} {"train_loss": -6.970065116882324, "global_step": 155345, "epoch": 3698} {"train_loss": -6.954068183898926, "global_step": 155346, "epoch": 3698} {"train_loss": -6.944896221160889, "global_step": 155347, "epoch": 3698} {"train_loss": -6.8487467765808105, "global_step": 155348, "epoch": 3698} {"train_loss": -7.037542819976807, "global_step": 155349, "epoch": 3698} {"train_loss": -6.997679710388184, "global_step": 155350, "epoch": 3698} {"train_loss": -6.989985466003418, "global_step": 155351, "epoch": 3698} {"train_loss": -6.984350681304932, "global_step": 155352, "epoch": 3698} {"train_loss": -6.940732002258301, "global_step": 155353, "epoch": 3698} {"train_loss": -6.957924842834473, "global_step": 155354, "epoch": 3698} {"train_loss": -6.941959381103516, "global_step": 155355, "epoch": 3698} {"train_loss": -6.893454551696777, "global_step": 155356, "epoch": 3698} {"train_loss": -6.911114272617159, "global_step": 155357, "epoch": 3698, "val_loss": 68315.1875} {"train_loss": -6.960555076599121, "global_step": 155358, "epoch": 3699} {"train_loss": -6.956730842590332, "global_step": 155359, "epoch": 3699} {"train_loss": -6.999711036682129, "global_step": 155360, "epoch": 3699} {"train_loss": -6.978472709655762, "global_step": 155361, "epoch": 3699} {"train_loss": -6.975656986236572, "global_step": 155362, "epoch": 3699} {"train_loss": -6.880038261413574, "global_step": 155363, "epoch": 3699} {"train_loss": -6.899949073791504, "global_step": 155364, "epoch": 3699} {"train_loss": -6.912688732147217, "global_step": 155365, "epoch": 3699} {"train_loss": -6.754810810089111, "global_step": 155366, "epoch": 3699} {"train_loss": -6.921416282653809, "global_step": 155367, "epoch": 3699} {"train_loss": -6.887792587280273, "global_step": 155368, "epoch": 3699} {"train_loss": -6.862561225891113, "global_step": 155369, "epoch": 3699} {"train_loss": -6.728121280670166, "global_step": 155370, "epoch": 3699} {"train_loss": -6.967970848083496, "global_step": 155371, "epoch": 3699} {"train_loss": -6.788857936859131, "global_step": 155372, "epoch": 3699} {"train_loss": -6.77394437789917, "global_step": 155373, "epoch": 3699} {"train_loss": -6.767147064208984, "global_step": 155374, "epoch": 3699} {"train_loss": -6.780368328094482, "global_step": 155375, "epoch": 3699} {"train_loss": -6.799413681030273, "global_step": 155376, "epoch": 3699} {"train_loss": -6.834160804748535, "global_step": 155377, "epoch": 3699} {"train_loss": -6.804442405700684, "global_step": 155378, "epoch": 3699} {"train_loss": -6.887690544128418, "global_step": 155379, "epoch": 3699} {"train_loss": -6.776865482330322, "global_step": 155380, "epoch": 3699} {"train_loss": -6.835253715515137, "global_step": 155381, "epoch": 3699} {"train_loss": -6.784305572509766, "global_step": 155382, "epoch": 3699} {"train_loss": -6.749570369720459, "global_step": 155383, "epoch": 3699} {"train_loss": -6.884647369384766, "global_step": 155384, "epoch": 3699} {"train_loss": -6.8471760749816895, "global_step": 155385, "epoch": 3699} {"train_loss": -6.772493362426758, "global_step": 155386, "epoch": 3699} {"train_loss": -6.855817794799805, "global_step": 155387, "epoch": 3699} {"train_loss": -6.857837677001953, "global_step": 155388, "epoch": 3699} {"train_loss": -6.880920886993408, "global_step": 155389, "epoch": 3699} {"train_loss": -6.857497215270996, "global_step": 155390, "epoch": 3699} {"train_loss": -6.8031840324401855, "global_step": 155391, "epoch": 3699} {"train_loss": -6.899321556091309, "global_step": 155392, "epoch": 3699} {"train_loss": -6.883990287780762, "global_step": 155393, "epoch": 3699} {"train_loss": -6.890506744384766, "global_step": 155394, "epoch": 3699} {"train_loss": -6.977144241333008, "global_step": 155395, "epoch": 3699} {"train_loss": -6.845776081085205, "global_step": 155396, "epoch": 3699} {"train_loss": -6.887309551239014, "global_step": 155397, "epoch": 3699} {"train_loss": -6.935224533081055, "global_step": 155398, "epoch": 3699} {"train_loss": -6.861889521280925, "global_step": 155399, "epoch": 3699, "val_loss": 68295.3828125} {"train_loss": -7.02520751953125, "global_step": 155400, "epoch": 3700} {"train_loss": -6.955898761749268, "global_step": 155401, "epoch": 3700} {"train_loss": -6.982237815856934, "global_step": 155402, "epoch": 3700} {"train_loss": -6.882308483123779, "global_step": 155403, "epoch": 3700} {"train_loss": -6.962614059448242, "global_step": 155404, "epoch": 3700} {"train_loss": -6.856683254241943, "global_step": 155405, "epoch": 3700} {"train_loss": -6.949263095855713, "global_step": 155406, "epoch": 3700} {"train_loss": -6.917311191558838, "global_step": 155407, "epoch": 3700} {"train_loss": -6.819815158843994, "global_step": 155408, "epoch": 3700} {"train_loss": -6.903569221496582, "global_step": 155409, "epoch": 3700} {"train_loss": -6.812928199768066, "global_step": 155410, "epoch": 3700} {"train_loss": -7.025280952453613, "global_step": 155411, "epoch": 3700} {"train_loss": -6.944980621337891, "global_step": 155412, "epoch": 3700} {"train_loss": -6.813690185546875, "global_step": 155413, "epoch": 3700} {"train_loss": -6.924992084503174, "global_step": 155414, "epoch": 3700} {"train_loss": -6.935052871704102, "global_step": 155415, "epoch": 3700} {"train_loss": -6.9804887771606445, "global_step": 155416, "epoch": 3700} {"train_loss": -7.017304420471191, "global_step": 155417, "epoch": 3700} {"train_loss": -6.981790542602539, "global_step": 155418, "epoch": 3700} {"train_loss": -6.9763336181640625, "global_step": 155419, "epoch": 3700} {"train_loss": -6.799457550048828, "global_step": 155420, "epoch": 3700} {"train_loss": -6.94775390625, "global_step": 155421, "epoch": 3700} {"train_loss": -6.756604194641113, "global_step": 155422, "epoch": 3700} {"train_loss": -6.726866722106934, "global_step": 155423, "epoch": 3700} {"train_loss": -6.909387588500977, "global_step": 155424, "epoch": 3700} {"train_loss": -6.731963157653809, "global_step": 155425, "epoch": 3700} {"train_loss": -6.842601776123047, "global_step": 155426, "epoch": 3700} {"train_loss": -6.76564359664917, "global_step": 155427, "epoch": 3700} {"train_loss": -6.719293594360352, "global_step": 155428, "epoch": 3700} {"train_loss": -6.784073352813721, "global_step": 155429, "epoch": 3700} {"train_loss": -6.786184310913086, "global_step": 155430, "epoch": 3700} {"train_loss": -6.858645439147949, "global_step": 155431, "epoch": 3700} {"train_loss": -6.796966552734375, "global_step": 155432, "epoch": 3700} {"train_loss": -6.835536003112793, "global_step": 155433, "epoch": 3700} {"train_loss": -6.9497246742248535, "global_step": 155434, "epoch": 3700} {"train_loss": -6.720897197723389, "global_step": 155435, "epoch": 3700} {"train_loss": -6.870512962341309, "global_step": 155436, "epoch": 3700} {"train_loss": -6.8413238525390625, "global_step": 155437, "epoch": 3700} {"train_loss": -6.9924540519714355, "global_step": 155438, "epoch": 3700} {"train_loss": -6.792957305908203, "global_step": 155439, "epoch": 3700} {"train_loss": -6.988935470581055, "global_step": 155440, "epoch": 3700} {"train_loss": -6.878635871978033, "global_step": 155441, "epoch": 3700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.7520055526832059, "train/sim_max_reward_3": 0.2607589971691499, "train/sim_max_reward_4": 0.956197302282762, "train/sim_max_reward_5": 0.8105647551612761, "test/sim_max_reward_4300000": 0.10938690226765166, "test/sim_max_reward_4300001": 0.5833429946050871, "test/sim_max_reward_4300002": 0.8559001582643002, "test/sim_max_reward_4300003": 0.797185843978995, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9848752402131471, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3200280679636776, "test/sim_max_reward_4300008": 0.43230354940471766, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.3967625737753739, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.4133242239363472, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.982145026968414, "test/sim_max_reward_4300016": 0.06277373853136173, "test/sim_max_reward_4300017": 0.8905565436624584, "test/sim_max_reward_4300018": 0.4539932928053797, "test/sim_max_reward_4300019": 0.18600799843504032, "test/sim_max_reward_4300020": 0.07603323597717945, "test/sim_max_reward_4300021": 0.3124715449736391, "test/sim_max_reward_4300022": 0.9601693910332851, "test/sim_max_reward_4300023": 0.4119193632282843, "test/sim_max_reward_4300024": 0.9896465003651239, "test/sim_max_reward_4300025": 0.8318983349861853, "test/sim_max_reward_4300026": 0.09946825247936952, "test/sim_max_reward_4300027": 0.9598770798893388, "test/sim_max_reward_4300028": 0.9561323663776063, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.11885022159924026, "test/sim_max_reward_4300031": 0.20874825227139415, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.6716889117283875, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 1.0, "test/sim_max_reward_4300036": 0.2059836208992041, "test/sim_max_reward_4300037": 1.0, "test/sim_max_reward_4300038": 0.9661699567958031, "test/sim_max_reward_4300039": 0.9085253286937074, "test/sim_max_reward_4300040": 0.9310760672187114, "test/sim_max_reward_4300041": 0.9797920264512268, "test/sim_max_reward_4300042": 0.4925242507283897, "test/sim_max_reward_4300043": 0.08909079773207466, "test/sim_max_reward_4300044": 0.936976431824421, "test/sim_max_reward_4300045": 0.19319484129649062, "test/sim_max_reward_4300046": 0.9512333073475141, "test/sim_max_reward_4300047": 0.15893476125936865, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.19091814618873215, "train/mean_score": 0.7965877678827323, "test/mean_score": 0.5417148650193183, "val_loss": 68356.8203125} {"train_loss": -7.004215240478516, "global_step": 155442, "epoch": 3701} {"train_loss": -6.967436790466309, "global_step": 155443, "epoch": 3701} {"train_loss": -6.945253372192383, "global_step": 155444, "epoch": 3701} {"train_loss": -6.965332508087158, "global_step": 155445, "epoch": 3701} {"train_loss": -6.9043169021606445, "global_step": 155446, "epoch": 3701} {"train_loss": -6.919310092926025, "global_step": 155447, "epoch": 3701} {"train_loss": -6.867534160614014, "global_step": 155448, "epoch": 3701} {"train_loss": -7.062813758850098, "global_step": 155449, "epoch": 3701} {"train_loss": -6.930851459503174, "global_step": 155450, "epoch": 3701} {"train_loss": -6.954456806182861, "global_step": 155451, "epoch": 3701} {"train_loss": -6.961496353149414, "global_step": 155452, "epoch": 3701} {"train_loss": -6.843459129333496, "global_step": 155453, "epoch": 3701} {"train_loss": -6.8282599449157715, "global_step": 155454, "epoch": 3701} {"train_loss": -6.995400905609131, "global_step": 155455, "epoch": 3701} {"train_loss": -6.9719953536987305, "global_step": 155456, "epoch": 3701} {"train_loss": -6.867228031158447, "global_step": 155457, "epoch": 3701} {"train_loss": -6.909728050231934, "global_step": 155458, "epoch": 3701} {"train_loss": -6.941768646240234, "global_step": 155459, "epoch": 3701} {"train_loss": -6.919588565826416, "global_step": 155460, "epoch": 3701} {"train_loss": -6.893121719360352, "global_step": 155461, "epoch": 3701} {"train_loss": -6.951560974121094, "global_step": 155462, "epoch": 3701} {"train_loss": -6.955782890319824, "global_step": 155463, "epoch": 3701} {"train_loss": -6.9862775802612305, "global_step": 155464, "epoch": 3701} {"train_loss": -7.032817840576172, "global_step": 155465, "epoch": 3701} {"train_loss": -6.978263854980469, "global_step": 155466, "epoch": 3701} {"train_loss": -6.9199724197387695, "global_step": 155467, "epoch": 3701} {"train_loss": -6.8431396484375, "global_step": 155468, "epoch": 3701} {"train_loss": -6.853673458099365, "global_step": 155469, "epoch": 3701} {"train_loss": -7.064153671264648, "global_step": 155470, "epoch": 3701} {"train_loss": -7.0231804847717285, "global_step": 155471, "epoch": 3701} {"train_loss": -6.9976630210876465, "global_step": 155472, "epoch": 3701} {"train_loss": -6.907392978668213, "global_step": 155473, "epoch": 3701} {"train_loss": -6.872291564941406, "global_step": 155474, "epoch": 3701} {"train_loss": -6.935132026672363, "global_step": 155475, "epoch": 3701} {"train_loss": -6.826614856719971, "global_step": 155476, "epoch": 3701} {"train_loss": -6.8887529373168945, "global_step": 155477, "epoch": 3701} {"train_loss": -6.866395473480225, "global_step": 155478, "epoch": 3701} {"train_loss": -6.819750785827637, "global_step": 155479, "epoch": 3701} {"train_loss": -6.8012471199035645, "global_step": 155480, "epoch": 3701} {"train_loss": -6.858316421508789, "global_step": 155481, "epoch": 3701} {"train_loss": -6.908426284790039, "global_step": 155482, "epoch": 3701} {"train_loss": -6.924954017003377, "global_step": 155483, "epoch": 3701, "val_loss": 68202.7890625} {"train_loss": -6.837071418762207, "global_step": 155484, "epoch": 3702} {"train_loss": -6.872746467590332, "global_step": 155485, "epoch": 3702} {"train_loss": -6.812506198883057, "global_step": 155486, "epoch": 3702} {"train_loss": -6.933014392852783, "global_step": 155487, "epoch": 3702} {"train_loss": -6.882596492767334, "global_step": 155488, "epoch": 3702} {"train_loss": -6.7851104736328125, "global_step": 155489, "epoch": 3702} {"train_loss": -6.9107346534729, "global_step": 155490, "epoch": 3702} {"train_loss": -6.807194709777832, "global_step": 155491, "epoch": 3702} {"train_loss": -6.897481918334961, "global_step": 155492, "epoch": 3702} {"train_loss": -6.9441704750061035, "global_step": 155493, "epoch": 3702} {"train_loss": -6.83467960357666, "global_step": 155494, "epoch": 3702} {"train_loss": -6.819466590881348, "global_step": 155495, "epoch": 3702} {"train_loss": -6.842285633087158, "global_step": 155496, "epoch": 3702} {"train_loss": -6.897890567779541, "global_step": 155497, "epoch": 3702} {"train_loss": -6.7951812744140625, "global_step": 155498, "epoch": 3702} {"train_loss": -6.859724998474121, "global_step": 155499, "epoch": 3702} {"train_loss": -6.912021636962891, "global_step": 155500, "epoch": 3702} {"train_loss": -6.874396324157715, "global_step": 155501, "epoch": 3702} {"train_loss": -6.830230712890625, "global_step": 155502, "epoch": 3702} {"train_loss": -6.953254222869873, "global_step": 155503, "epoch": 3702} {"train_loss": -6.9382171630859375, "global_step": 155504, "epoch": 3702} {"train_loss": -6.754045009613037, "global_step": 155505, "epoch": 3702} {"train_loss": -6.912045478820801, "global_step": 155506, "epoch": 3702} {"train_loss": -6.892037391662598, "global_step": 155507, "epoch": 3702} {"train_loss": -6.964841842651367, "global_step": 155508, "epoch": 3702} {"train_loss": -6.959169387817383, "global_step": 155509, "epoch": 3702} {"train_loss": -6.909761905670166, "global_step": 155510, "epoch": 3702} {"train_loss": -6.963123321533203, "global_step": 155511, "epoch": 3702} {"train_loss": -6.915069580078125, "global_step": 155512, "epoch": 3702} {"train_loss": -6.924234867095947, "global_step": 155513, "epoch": 3702} {"train_loss": -6.977419853210449, "global_step": 155514, "epoch": 3702} {"train_loss": -7.045219421386719, "global_step": 155515, "epoch": 3702} {"train_loss": -6.864233016967773, "global_step": 155516, "epoch": 3702} {"train_loss": -6.901246070861816, "global_step": 155517, "epoch": 3702} {"train_loss": -6.991412162780762, "global_step": 155518, "epoch": 3702} {"train_loss": -6.848560333251953, "global_step": 155519, "epoch": 3702} {"train_loss": -7.036310195922852, "global_step": 155520, "epoch": 3702} {"train_loss": -6.932607650756836, "global_step": 155521, "epoch": 3702} {"train_loss": -6.927722930908203, "global_step": 155522, "epoch": 3702} {"train_loss": -6.879090309143066, "global_step": 155523, "epoch": 3702} {"train_loss": -7.039748191833496, "global_step": 155524, "epoch": 3702} {"train_loss": -6.901754731223697, "global_step": 155525, "epoch": 3702, "val_loss": 68284.984375} {"train_loss": -6.965456008911133, "global_step": 155526, "epoch": 3703} {"train_loss": -6.998403549194336, "global_step": 155527, "epoch": 3703} {"train_loss": -6.915729522705078, "global_step": 155528, "epoch": 3703} {"train_loss": -6.878142356872559, "global_step": 155529, "epoch": 3703} {"train_loss": -6.972173690795898, "global_step": 155530, "epoch": 3703} {"train_loss": -6.981919288635254, "global_step": 155531, "epoch": 3703} {"train_loss": -7.024168968200684, "global_step": 155532, "epoch": 3703} {"train_loss": -6.997474193572998, "global_step": 155533, "epoch": 3703} {"train_loss": -6.841160774230957, "global_step": 155534, "epoch": 3703} {"train_loss": -6.922201156616211, "global_step": 155535, "epoch": 3703} {"train_loss": -6.790684700012207, "global_step": 155536, "epoch": 3703} {"train_loss": -6.911101341247559, "global_step": 155537, "epoch": 3703} {"train_loss": -6.825495719909668, "global_step": 155538, "epoch": 3703} {"train_loss": -6.9891252517700195, "global_step": 155539, "epoch": 3703} {"train_loss": -6.915341854095459, "global_step": 155540, "epoch": 3703} {"train_loss": -6.947399616241455, "global_step": 155541, "epoch": 3703} {"train_loss": -7.0421295166015625, "global_step": 155542, "epoch": 3703} {"train_loss": -6.821136474609375, "global_step": 155543, "epoch": 3703} {"train_loss": -6.964287757873535, "global_step": 155544, "epoch": 3703} {"train_loss": -6.933540344238281, "global_step": 155545, "epoch": 3703} {"train_loss": -6.819875240325928, "global_step": 155546, "epoch": 3703} {"train_loss": -7.014646530151367, "global_step": 155547, "epoch": 3703} {"train_loss": -6.924612522125244, "global_step": 155548, "epoch": 3703} {"train_loss": -6.852044582366943, "global_step": 155549, "epoch": 3703} {"train_loss": -7.110476493835449, "global_step": 155550, "epoch": 3703} {"train_loss": -6.830060958862305, "global_step": 155551, "epoch": 3703} {"train_loss": -6.861685752868652, "global_step": 155552, "epoch": 3703} {"train_loss": -7.032553195953369, "global_step": 155553, "epoch": 3703} {"train_loss": -6.982956886291504, "global_step": 155554, "epoch": 3703} {"train_loss": -6.799867630004883, "global_step": 155555, "epoch": 3703} {"train_loss": -6.861061096191406, "global_step": 155556, "epoch": 3703} {"train_loss": -6.869476318359375, "global_step": 155557, "epoch": 3703} {"train_loss": -6.948121070861816, "global_step": 155558, "epoch": 3703} {"train_loss": -6.989253044128418, "global_step": 155559, "epoch": 3703} {"train_loss": -6.847282409667969, "global_step": 155560, "epoch": 3703} {"train_loss": -6.8413591384887695, "global_step": 155561, "epoch": 3703} {"train_loss": -6.891685485839844, "global_step": 155562, "epoch": 3703} {"train_loss": -6.824073314666748, "global_step": 155563, "epoch": 3703} {"train_loss": -6.774730682373047, "global_step": 155564, "epoch": 3703} {"train_loss": -6.9098734855651855, "global_step": 155565, "epoch": 3703} {"train_loss": -6.960291862487793, "global_step": 155566, "epoch": 3703} {"train_loss": -6.915443374997094, "global_step": 155567, "epoch": 3703, "val_loss": 68159.9921875} {"train_loss": -6.971311569213867, "global_step": 155568, "epoch": 3704} {"train_loss": -6.8045854568481445, "global_step": 155569, "epoch": 3704} {"train_loss": -6.73866081237793, "global_step": 155570, "epoch": 3704} {"train_loss": -6.859564304351807, "global_step": 155571, "epoch": 3704} {"train_loss": -7.009596824645996, "global_step": 155572, "epoch": 3704} {"train_loss": -6.880288124084473, "global_step": 155573, "epoch": 3704} {"train_loss": -6.956476211547852, "global_step": 155574, "epoch": 3704} {"train_loss": -6.845362663269043, "global_step": 155575, "epoch": 3704} {"train_loss": -6.796698570251465, "global_step": 155576, "epoch": 3704} {"train_loss": -6.889706611633301, "global_step": 155577, "epoch": 3704} {"train_loss": -6.8697357177734375, "global_step": 155578, "epoch": 3704} {"train_loss": -6.859341144561768, "global_step": 155579, "epoch": 3704} {"train_loss": -6.838886260986328, "global_step": 155580, "epoch": 3704} {"train_loss": -6.835594177246094, "global_step": 155581, "epoch": 3704} {"train_loss": -6.84421968460083, "global_step": 155582, "epoch": 3704} {"train_loss": -6.94244384765625, "global_step": 155583, "epoch": 3704} {"train_loss": -6.888670444488525, "global_step": 155584, "epoch": 3704} {"train_loss": -6.752467155456543, "global_step": 155585, "epoch": 3704} {"train_loss": -6.862471580505371, "global_step": 155586, "epoch": 3704} {"train_loss": -6.964844703674316, "global_step": 155587, "epoch": 3704} {"train_loss": -6.932883262634277, "global_step": 155588, "epoch": 3704} {"train_loss": -6.9127655029296875, "global_step": 155589, "epoch": 3704} {"train_loss": -6.946380615234375, "global_step": 155590, "epoch": 3704} {"train_loss": -6.9453535079956055, "global_step": 155591, "epoch": 3704} {"train_loss": -6.894207000732422, "global_step": 155592, "epoch": 3704} {"train_loss": -6.883983612060547, "global_step": 155593, "epoch": 3704} {"train_loss": -6.7885236740112305, "global_step": 155594, "epoch": 3704} {"train_loss": -6.929878234863281, "global_step": 155595, "epoch": 3704} {"train_loss": -6.911037921905518, "global_step": 155596, "epoch": 3704} {"train_loss": -6.843174457550049, "global_step": 155597, "epoch": 3704} {"train_loss": -6.814366340637207, "global_step": 155598, "epoch": 3704} {"train_loss": -6.990570545196533, "global_step": 155599, "epoch": 3704} {"train_loss": -6.953761100769043, "global_step": 155600, "epoch": 3704} {"train_loss": -6.793914794921875, "global_step": 155601, "epoch": 3704} {"train_loss": -6.899354934692383, "global_step": 155602, "epoch": 3704} {"train_loss": -6.868507385253906, "global_step": 155603, "epoch": 3704} {"train_loss": -6.847240447998047, "global_step": 155604, "epoch": 3704} {"train_loss": -6.899150848388672, "global_step": 155605, "epoch": 3704} {"train_loss": -6.852080345153809, "global_step": 155606, "epoch": 3704} {"train_loss": -7.009900093078613, "global_step": 155607, "epoch": 3704} {"train_loss": -6.913193702697754, "global_step": 155608, "epoch": 3704} {"train_loss": -6.882556563331967, "global_step": 155609, "epoch": 3704, "val_loss": 68302.7109375} {"train_loss": -6.93568229675293, "global_step": 155610, "epoch": 3705} {"train_loss": -6.931819915771484, "global_step": 155611, "epoch": 3705} {"train_loss": -6.776172637939453, "global_step": 155612, "epoch": 3705} {"train_loss": -6.9606547355651855, "global_step": 155613, "epoch": 3705} {"train_loss": -6.885928153991699, "global_step": 155614, "epoch": 3705} {"train_loss": -6.891822814941406, "global_step": 155615, "epoch": 3705} {"train_loss": -6.940869331359863, "global_step": 155616, "epoch": 3705} {"train_loss": -6.898634910583496, "global_step": 155617, "epoch": 3705} {"train_loss": -6.959281921386719, "global_step": 155618, "epoch": 3705} {"train_loss": -6.839103698730469, "global_step": 155619, "epoch": 3705} {"train_loss": -6.977572917938232, "global_step": 155620, "epoch": 3705} {"train_loss": -6.923194885253906, "global_step": 155621, "epoch": 3705} {"train_loss": -6.831932067871094, "global_step": 155622, "epoch": 3705} {"train_loss": -6.924874782562256, "global_step": 155623, "epoch": 3705} {"train_loss": -6.962246417999268, "global_step": 155624, "epoch": 3705} {"train_loss": -6.8770527839660645, "global_step": 155625, "epoch": 3705} {"train_loss": -6.922214508056641, "global_step": 155626, "epoch": 3705} {"train_loss": -6.858966827392578, "global_step": 155627, "epoch": 3705} {"train_loss": -6.882321834564209, "global_step": 155628, "epoch": 3705} {"train_loss": -6.9419708251953125, "global_step": 155629, "epoch": 3705} {"train_loss": -6.857828140258789, "global_step": 155630, "epoch": 3705} {"train_loss": -6.9991044998168945, "global_step": 155631, "epoch": 3705} {"train_loss": -6.807652473449707, "global_step": 155632, "epoch": 3705} {"train_loss": -6.847963333129883, "global_step": 155633, "epoch": 3705} {"train_loss": -6.859334945678711, "global_step": 155634, "epoch": 3705} {"train_loss": -6.781837463378906, "global_step": 155635, "epoch": 3705} {"train_loss": -7.007284164428711, "global_step": 155636, "epoch": 3705} {"train_loss": -6.955255508422852, "global_step": 155637, "epoch": 3705} {"train_loss": -6.90013313293457, "global_step": 155638, "epoch": 3705} {"train_loss": -6.900176048278809, "global_step": 155639, "epoch": 3705} {"train_loss": -6.822639465332031, "global_step": 155640, "epoch": 3705} {"train_loss": -6.9209184646606445, "global_step": 155641, "epoch": 3705} {"train_loss": -6.884343147277832, "global_step": 155642, "epoch": 3705} {"train_loss": -6.896749496459961, "global_step": 155643, "epoch": 3705} {"train_loss": -6.925895690917969, "global_step": 155644, "epoch": 3705} {"train_loss": -6.789423942565918, "global_step": 155645, "epoch": 3705} {"train_loss": -6.910366058349609, "global_step": 155646, "epoch": 3705} {"train_loss": -6.8401031494140625, "global_step": 155647, "epoch": 3705} {"train_loss": -6.862004280090332, "global_step": 155648, "epoch": 3705} {"train_loss": -6.885371208190918, "global_step": 155649, "epoch": 3705} {"train_loss": -6.710212707519531, "global_step": 155650, "epoch": 3705} {"train_loss": -6.888718207677205, "global_step": 155651, "epoch": 3705, "val_loss": 68308.8828125} {"train_loss": -6.906102180480957, "global_step": 155652, "epoch": 3706} {"train_loss": -6.875187873840332, "global_step": 155653, "epoch": 3706} {"train_loss": -6.978167533874512, "global_step": 155654, "epoch": 3706} {"train_loss": -6.8833818435668945, "global_step": 155655, "epoch": 3706} {"train_loss": -6.754604816436768, "global_step": 155656, "epoch": 3706} {"train_loss": -6.998348236083984, "global_step": 155657, "epoch": 3706} {"train_loss": -6.744399070739746, "global_step": 155658, "epoch": 3706} {"train_loss": -6.951940536499023, "global_step": 155659, "epoch": 3706} {"train_loss": -6.994748115539551, "global_step": 155660, "epoch": 3706} {"train_loss": -6.8590087890625, "global_step": 155661, "epoch": 3706} {"train_loss": -6.911826133728027, "global_step": 155662, "epoch": 3706} {"train_loss": -6.902563571929932, "global_step": 155663, "epoch": 3706} {"train_loss": -6.909242630004883, "global_step": 155664, "epoch": 3706} {"train_loss": -6.86748743057251, "global_step": 155665, "epoch": 3706} {"train_loss": -6.844880104064941, "global_step": 155666, "epoch": 3706} {"train_loss": -6.894187927246094, "global_step": 155667, "epoch": 3706} {"train_loss": -6.821135997772217, "global_step": 155668, "epoch": 3706} {"train_loss": -6.911506652832031, "global_step": 155669, "epoch": 3706} {"train_loss": -6.8327460289001465, "global_step": 155670, "epoch": 3706} {"train_loss": -6.961568355560303, "global_step": 155671, "epoch": 3706} {"train_loss": -6.8401312828063965, "global_step": 155672, "epoch": 3706} {"train_loss": -6.887974262237549, "global_step": 155673, "epoch": 3706} {"train_loss": -6.899631500244141, "global_step": 155674, "epoch": 3706} {"train_loss": -6.918065547943115, "global_step": 155675, "epoch": 3706} {"train_loss": -6.8423662185668945, "global_step": 155676, "epoch": 3706} {"train_loss": -6.874612331390381, "global_step": 155677, "epoch": 3706} {"train_loss": -6.944031715393066, "global_step": 155678, "epoch": 3706} {"train_loss": -6.907689094543457, "global_step": 155679, "epoch": 3706} {"train_loss": -7.056230068206787, "global_step": 155680, "epoch": 3706} {"train_loss": -6.910504341125488, "global_step": 155681, "epoch": 3706} {"train_loss": -6.920422554016113, "global_step": 155682, "epoch": 3706} {"train_loss": -6.809091091156006, "global_step": 155683, "epoch": 3706} {"train_loss": -7.030255317687988, "global_step": 155684, "epoch": 3706} {"train_loss": -6.954844951629639, "global_step": 155685, "epoch": 3706} {"train_loss": -6.863595008850098, "global_step": 155686, "epoch": 3706} {"train_loss": -6.895767688751221, "global_step": 155687, "epoch": 3706} {"train_loss": -6.8111114501953125, "global_step": 155688, "epoch": 3706} {"train_loss": -6.836970329284668, "global_step": 155689, "epoch": 3706} {"train_loss": -6.937751770019531, "global_step": 155690, "epoch": 3706} {"train_loss": -6.850533485412598, "global_step": 155691, "epoch": 3706} {"train_loss": -7.099621772766113, "global_step": 155692, "epoch": 3706} {"train_loss": -6.901787837346395, "global_step": 155693, "epoch": 3706, "val_loss": 68324.3359375} {"train_loss": -6.961788654327393, "global_step": 155694, "epoch": 3707} {"train_loss": -6.947505950927734, "global_step": 155695, "epoch": 3707} {"train_loss": -6.963404178619385, "global_step": 155696, "epoch": 3707} {"train_loss": -6.834565162658691, "global_step": 155697, "epoch": 3707} {"train_loss": -6.999317169189453, "global_step": 155698, "epoch": 3707} {"train_loss": -6.859462738037109, "global_step": 155699, "epoch": 3707} {"train_loss": -6.874232769012451, "global_step": 155700, "epoch": 3707} {"train_loss": -7.007685661315918, "global_step": 155701, "epoch": 3707} {"train_loss": -6.962202072143555, "global_step": 155702, "epoch": 3707} {"train_loss": -6.945278644561768, "global_step": 155703, "epoch": 3707} {"train_loss": -6.991181373596191, "global_step": 155704, "epoch": 3707} {"train_loss": -6.957298278808594, "global_step": 155705, "epoch": 3707} {"train_loss": -6.874454021453857, "global_step": 155706, "epoch": 3707} {"train_loss": -7.0514631271362305, "global_step": 155707, "epoch": 3707} {"train_loss": -6.872617721557617, "global_step": 155708, "epoch": 3707} {"train_loss": -6.84438419342041, "global_step": 155709, "epoch": 3707} {"train_loss": -6.915582656860352, "global_step": 155710, "epoch": 3707} {"train_loss": -6.997888565063477, "global_step": 155711, "epoch": 3707} {"train_loss": -6.851396560668945, "global_step": 155712, "epoch": 3707} {"train_loss": -6.842875003814697, "global_step": 155713, "epoch": 3707} {"train_loss": -6.926670551300049, "global_step": 155714, "epoch": 3707} {"train_loss": -6.792386054992676, "global_step": 155715, "epoch": 3707} {"train_loss": -6.909690856933594, "global_step": 155716, "epoch": 3707} {"train_loss": -6.951607704162598, "global_step": 155717, "epoch": 3707} {"train_loss": -6.9404377937316895, "global_step": 155718, "epoch": 3707} {"train_loss": -6.9928741455078125, "global_step": 155719, "epoch": 3707} {"train_loss": -6.970438003540039, "global_step": 155720, "epoch": 3707} {"train_loss": -6.9989728927612305, "global_step": 155721, "epoch": 3707} {"train_loss": -6.811409950256348, "global_step": 155722, "epoch": 3707} {"train_loss": -6.957771301269531, "global_step": 155723, "epoch": 3707} {"train_loss": -6.915026664733887, "global_step": 155724, "epoch": 3707} {"train_loss": -6.864292621612549, "global_step": 155725, "epoch": 3707} {"train_loss": -6.8638410568237305, "global_step": 155726, "epoch": 3707} {"train_loss": -6.823879241943359, "global_step": 155727, "epoch": 3707} {"train_loss": -6.78304386138916, "global_step": 155728, "epoch": 3707} {"train_loss": -6.982963562011719, "global_step": 155729, "epoch": 3707} {"train_loss": -6.944631576538086, "global_step": 155730, "epoch": 3707} {"train_loss": -6.884448051452637, "global_step": 155731, "epoch": 3707} {"train_loss": -6.873833656311035, "global_step": 155732, "epoch": 3707} {"train_loss": -6.899684429168701, "global_step": 155733, "epoch": 3707} {"train_loss": -6.921367645263672, "global_step": 155734, "epoch": 3707} {"train_loss": -6.912401290166946, "global_step": 155735, "epoch": 3707, "val_loss": 68346.1796875} {"train_loss": -6.861301422119141, "global_step": 155736, "epoch": 3708} {"train_loss": -6.660470962524414, "global_step": 155737, "epoch": 3708} {"train_loss": -6.7499566078186035, "global_step": 155738, "epoch": 3708} {"train_loss": -6.88145637512207, "global_step": 155739, "epoch": 3708} {"train_loss": -6.944856643676758, "global_step": 155740, "epoch": 3708} {"train_loss": -6.834784984588623, "global_step": 155741, "epoch": 3708} {"train_loss": -6.8546037673950195, "global_step": 155742, "epoch": 3708} {"train_loss": -6.8500847816467285, "global_step": 155743, "epoch": 3708} {"train_loss": -6.823600769042969, "global_step": 155744, "epoch": 3708} {"train_loss": -6.940594673156738, "global_step": 155745, "epoch": 3708} {"train_loss": -6.83791446685791, "global_step": 155746, "epoch": 3708} {"train_loss": -6.868868827819824, "global_step": 155747, "epoch": 3708} {"train_loss": -6.9680633544921875, "global_step": 155748, "epoch": 3708} {"train_loss": -6.898028373718262, "global_step": 155749, "epoch": 3708} {"train_loss": -6.932252407073975, "global_step": 155750, "epoch": 3708} {"train_loss": -6.864416599273682, "global_step": 155751, "epoch": 3708} {"train_loss": -6.791530609130859, "global_step": 155752, "epoch": 3708} {"train_loss": -6.840976238250732, "global_step": 155753, "epoch": 3708} {"train_loss": -6.859132289886475, "global_step": 155754, "epoch": 3708} {"train_loss": -6.750307083129883, "global_step": 155755, "epoch": 3708} {"train_loss": -6.84511661529541, "global_step": 155756, "epoch": 3708} {"train_loss": -6.824789047241211, "global_step": 155757, "epoch": 3708} {"train_loss": -6.834890842437744, "global_step": 155758, "epoch": 3708} {"train_loss": -6.824261665344238, "global_step": 155759, "epoch": 3708} {"train_loss": -6.806248664855957, "global_step": 155760, "epoch": 3708} {"train_loss": -6.960519313812256, "global_step": 155761, "epoch": 3708} {"train_loss": -6.941559791564941, "global_step": 155762, "epoch": 3708} {"train_loss": -7.01505184173584, "global_step": 155763, "epoch": 3708} {"train_loss": -6.80879020690918, "global_step": 155764, "epoch": 3708} {"train_loss": -6.893309116363525, "global_step": 155765, "epoch": 3708} {"train_loss": -6.931780815124512, "global_step": 155766, "epoch": 3708} {"train_loss": -6.958230495452881, "global_step": 155767, "epoch": 3708} {"train_loss": -6.894868850708008, "global_step": 155768, "epoch": 3708} {"train_loss": -7.040086269378662, "global_step": 155769, "epoch": 3708} {"train_loss": -6.8693742752075195, "global_step": 155770, "epoch": 3708} {"train_loss": -6.962846279144287, "global_step": 155771, "epoch": 3708} {"train_loss": -7.027427673339844, "global_step": 155772, "epoch": 3708} {"train_loss": -6.944851875305176, "global_step": 155773, "epoch": 3708} {"train_loss": -7.0024003982543945, "global_step": 155774, "epoch": 3708} {"train_loss": -6.864389896392822, "global_step": 155775, "epoch": 3708} {"train_loss": -6.951225280761719, "global_step": 155776, "epoch": 3708} {"train_loss": -6.8843190897078745, "global_step": 155777, "epoch": 3708, "val_loss": 68251.6875} {"train_loss": -6.97925329208374, "global_step": 155778, "epoch": 3709} {"train_loss": -6.918474197387695, "global_step": 155779, "epoch": 3709} {"train_loss": -6.869109153747559, "global_step": 155780, "epoch": 3709} {"train_loss": -7.0250067710876465, "global_step": 155781, "epoch": 3709} {"train_loss": -6.970715045928955, "global_step": 155782, "epoch": 3709} {"train_loss": -6.916093826293945, "global_step": 155783, "epoch": 3709} {"train_loss": -6.965924263000488, "global_step": 155784, "epoch": 3709} {"train_loss": -6.902303695678711, "global_step": 155785, "epoch": 3709} {"train_loss": -6.769596099853516, "global_step": 155786, "epoch": 3709} {"train_loss": -6.921439170837402, "global_step": 155787, "epoch": 3709} {"train_loss": -6.816061019897461, "global_step": 155788, "epoch": 3709} {"train_loss": -6.794179916381836, "global_step": 155789, "epoch": 3709} {"train_loss": -6.8830437660217285, "global_step": 155790, "epoch": 3709} {"train_loss": -6.769002914428711, "global_step": 155791, "epoch": 3709} {"train_loss": -6.935722351074219, "global_step": 155792, "epoch": 3709} {"train_loss": -6.790304660797119, "global_step": 155793, "epoch": 3709} {"train_loss": -6.884050369262695, "global_step": 155794, "epoch": 3709} {"train_loss": -6.783847808837891, "global_step": 155795, "epoch": 3709} {"train_loss": -6.854160785675049, "global_step": 155796, "epoch": 3709} {"train_loss": -6.899347305297852, "global_step": 155797, "epoch": 3709} {"train_loss": -6.819515228271484, "global_step": 155798, "epoch": 3709} {"train_loss": -6.750646591186523, "global_step": 155799, "epoch": 3709} {"train_loss": -6.726117134094238, "global_step": 155800, "epoch": 3709} {"train_loss": -6.952083110809326, "global_step": 155801, "epoch": 3709} {"train_loss": -6.708295822143555, "global_step": 155802, "epoch": 3709} {"train_loss": -6.805618762969971, "global_step": 155803, "epoch": 3709} {"train_loss": -6.763639450073242, "global_step": 155804, "epoch": 3709} {"train_loss": -6.711557388305664, "global_step": 155805, "epoch": 3709} {"train_loss": -6.765647888183594, "global_step": 155806, "epoch": 3709} {"train_loss": -6.746329307556152, "global_step": 155807, "epoch": 3709} {"train_loss": -6.757558345794678, "global_step": 155808, "epoch": 3709} {"train_loss": -6.70405387878418, "global_step": 155809, "epoch": 3709} {"train_loss": -6.799966335296631, "global_step": 155810, "epoch": 3709} {"train_loss": -6.934930324554443, "global_step": 155811, "epoch": 3709} {"train_loss": -6.858036994934082, "global_step": 155812, "epoch": 3709} {"train_loss": -6.846553802490234, "global_step": 155813, "epoch": 3709} {"train_loss": -6.866488456726074, "global_step": 155814, "epoch": 3709} {"train_loss": -6.879593849182129, "global_step": 155815, "epoch": 3709} {"train_loss": -6.920001983642578, "global_step": 155816, "epoch": 3709} {"train_loss": -6.952094554901123, "global_step": 155817, "epoch": 3709} {"train_loss": -6.933685779571533, "global_step": 155818, "epoch": 3709} {"train_loss": -6.849139769872029, "global_step": 155819, "epoch": 3709, "val_loss": 68405.046875} {"train_loss": -6.969782829284668, "global_step": 155820, "epoch": 3710} {"train_loss": -6.934989929199219, "global_step": 155821, "epoch": 3710} {"train_loss": -6.957688331604004, "global_step": 155822, "epoch": 3710} {"train_loss": -6.955574035644531, "global_step": 155823, "epoch": 3710} {"train_loss": -7.0360212326049805, "global_step": 155824, "epoch": 3710} {"train_loss": -6.966053009033203, "global_step": 155825, "epoch": 3710} {"train_loss": -6.8587236404418945, "global_step": 155826, "epoch": 3710} {"train_loss": -6.917664051055908, "global_step": 155827, "epoch": 3710} {"train_loss": -6.827193737030029, "global_step": 155828, "epoch": 3710} {"train_loss": -6.9541826248168945, "global_step": 155829, "epoch": 3710} {"train_loss": -6.861942291259766, "global_step": 155830, "epoch": 3710} {"train_loss": -6.886648178100586, "global_step": 155831, "epoch": 3710} {"train_loss": -6.925586700439453, "global_step": 155832, "epoch": 3710} {"train_loss": -6.949496269226074, "global_step": 155833, "epoch": 3710} {"train_loss": -6.870467185974121, "global_step": 155834, "epoch": 3710} {"train_loss": -6.8912458419799805, "global_step": 155835, "epoch": 3710} {"train_loss": -6.884174823760986, "global_step": 155836, "epoch": 3710} {"train_loss": -6.97227668762207, "global_step": 155837, "epoch": 3710} {"train_loss": -6.918196201324463, "global_step": 155838, "epoch": 3710} {"train_loss": -6.888104438781738, "global_step": 155839, "epoch": 3710} {"train_loss": -6.879025459289551, "global_step": 155840, "epoch": 3710} {"train_loss": -6.977804183959961, "global_step": 155841, "epoch": 3710} {"train_loss": -6.853959560394287, "global_step": 155842, "epoch": 3710} {"train_loss": -6.831722259521484, "global_step": 155843, "epoch": 3710} {"train_loss": -6.970852851867676, "global_step": 155844, "epoch": 3710} {"train_loss": -6.895171165466309, "global_step": 155845, "epoch": 3710} {"train_loss": -6.888176918029785, "global_step": 155846, "epoch": 3710} {"train_loss": -6.953122615814209, "global_step": 155847, "epoch": 3710} {"train_loss": -6.770142078399658, "global_step": 155848, "epoch": 3710} {"train_loss": -6.915096282958984, "global_step": 155849, "epoch": 3710} {"train_loss": -6.939082145690918, "global_step": 155850, "epoch": 3710} {"train_loss": -6.986574172973633, "global_step": 155851, "epoch": 3710} {"train_loss": -7.038497447967529, "global_step": 155852, "epoch": 3710} {"train_loss": -6.874389171600342, "global_step": 155853, "epoch": 3710} {"train_loss": -6.9066267013549805, "global_step": 155854, "epoch": 3710} {"train_loss": -6.956085205078125, "global_step": 155855, "epoch": 3710} {"train_loss": -7.0615234375, "global_step": 155856, "epoch": 3710} {"train_loss": -6.944849014282227, "global_step": 155857, "epoch": 3710} {"train_loss": -7.005970001220703, "global_step": 155858, "epoch": 3710} {"train_loss": -6.881912708282471, "global_step": 155859, "epoch": 3710} {"train_loss": -6.973976135253906, "global_step": 155860, "epoch": 3710} {"train_loss": -6.925284362974621, "global_step": 155861, "epoch": 3710, "val_loss": 68221.234375} {"train_loss": -6.964753150939941, "global_step": 155862, "epoch": 3711} {"train_loss": -7.007338047027588, "global_step": 155863, "epoch": 3711} {"train_loss": -6.851560592651367, "global_step": 155864, "epoch": 3711} {"train_loss": -6.881058692932129, "global_step": 155865, "epoch": 3711} {"train_loss": -6.944265365600586, "global_step": 155866, "epoch": 3711} {"train_loss": -6.937809467315674, "global_step": 155867, "epoch": 3711} {"train_loss": -6.785184860229492, "global_step": 155868, "epoch": 3711} {"train_loss": -6.865592956542969, "global_step": 155869, "epoch": 3711} {"train_loss": -6.9213151931762695, "global_step": 155870, "epoch": 3711} {"train_loss": -6.74037504196167, "global_step": 155871, "epoch": 3711} {"train_loss": -6.828161239624023, "global_step": 155872, "epoch": 3711} {"train_loss": -6.875161647796631, "global_step": 155873, "epoch": 3711} {"train_loss": -6.7209625244140625, "global_step": 155874, "epoch": 3711} {"train_loss": -6.760247707366943, "global_step": 155875, "epoch": 3711} {"train_loss": -6.916048049926758, "global_step": 155876, "epoch": 3711} {"train_loss": -6.754037380218506, "global_step": 155877, "epoch": 3711} {"train_loss": -6.862666130065918, "global_step": 155878, "epoch": 3711} {"train_loss": -6.803048133850098, "global_step": 155879, "epoch": 3711} {"train_loss": -6.8805646896362305, "global_step": 155880, "epoch": 3711} {"train_loss": -6.81435489654541, "global_step": 155881, "epoch": 3711} {"train_loss": -6.861668586730957, "global_step": 155882, "epoch": 3711} {"train_loss": -6.9073381423950195, "global_step": 155883, "epoch": 3711} {"train_loss": -6.865517616271973, "global_step": 155884, "epoch": 3711} {"train_loss": -6.8453049659729, "global_step": 155885, "epoch": 3711} {"train_loss": -6.851828575134277, "global_step": 155886, "epoch": 3711} {"train_loss": -6.9282989501953125, "global_step": 155887, "epoch": 3711} {"train_loss": -6.885579586029053, "global_step": 155888, "epoch": 3711} {"train_loss": -6.889921188354492, "global_step": 155889, "epoch": 3711} {"train_loss": -6.86083984375, "global_step": 155890, "epoch": 3711} {"train_loss": -6.8876051902771, "global_step": 155891, "epoch": 3711} {"train_loss": -6.7567458152771, "global_step": 155892, "epoch": 3711} {"train_loss": -6.796191692352295, "global_step": 155893, "epoch": 3711} {"train_loss": -6.889459133148193, "global_step": 155894, "epoch": 3711} {"train_loss": -6.838555335998535, "global_step": 155895, "epoch": 3711} {"train_loss": -6.848514556884766, "global_step": 155896, "epoch": 3711} {"train_loss": -6.740767478942871, "global_step": 155897, "epoch": 3711} {"train_loss": -6.913843631744385, "global_step": 155898, "epoch": 3711} {"train_loss": -6.918900489807129, "global_step": 155899, "epoch": 3711} {"train_loss": -6.845025062561035, "global_step": 155900, "epoch": 3711} {"train_loss": -6.837447643280029, "global_step": 155901, "epoch": 3711} {"train_loss": -6.792088031768799, "global_step": 155902, "epoch": 3711} {"train_loss": -6.855676582881382, "global_step": 155903, "epoch": 3711, "val_loss": 68174.1484375} {"train_loss": -6.97688627243042, "global_step": 155904, "epoch": 3712} {"train_loss": -6.704033851623535, "global_step": 155905, "epoch": 3712} {"train_loss": -6.901916980743408, "global_step": 155906, "epoch": 3712} {"train_loss": -6.921285629272461, "global_step": 155907, "epoch": 3712} {"train_loss": -6.77531623840332, "global_step": 155908, "epoch": 3712} {"train_loss": -6.887723445892334, "global_step": 155909, "epoch": 3712} {"train_loss": -6.696211338043213, "global_step": 155910, "epoch": 3712} {"train_loss": -6.809386253356934, "global_step": 155911, "epoch": 3712} {"train_loss": -6.927346229553223, "global_step": 155912, "epoch": 3712} {"train_loss": -6.7729315757751465, "global_step": 155913, "epoch": 3712} {"train_loss": -6.895505905151367, "global_step": 155914, "epoch": 3712} {"train_loss": -6.946384429931641, "global_step": 155915, "epoch": 3712} {"train_loss": -6.898738861083984, "global_step": 155916, "epoch": 3712} {"train_loss": -6.785568714141846, "global_step": 155917, "epoch": 3712} {"train_loss": -6.995297431945801, "global_step": 155918, "epoch": 3712} {"train_loss": -6.775550842285156, "global_step": 155919, "epoch": 3712} {"train_loss": -6.822693824768066, "global_step": 155920, "epoch": 3712} {"train_loss": -6.956493377685547, "global_step": 155921, "epoch": 3712} {"train_loss": -6.8574419021606445, "global_step": 155922, "epoch": 3712} {"train_loss": -6.845877647399902, "global_step": 155923, "epoch": 3712} {"train_loss": -6.9186625480651855, "global_step": 155924, "epoch": 3712} {"train_loss": -6.926416397094727, "global_step": 155925, "epoch": 3712} {"train_loss": -6.826547622680664, "global_step": 155926, "epoch": 3712} {"train_loss": -6.932498931884766, "global_step": 155927, "epoch": 3712} {"train_loss": -6.933320999145508, "global_step": 155928, "epoch": 3712} {"train_loss": -6.937441825866699, "global_step": 155929, "epoch": 3712} {"train_loss": -6.896202087402344, "global_step": 155930, "epoch": 3712} {"train_loss": -6.918319225311279, "global_step": 155931, "epoch": 3712} {"train_loss": -6.917025089263916, "global_step": 155932, "epoch": 3712} {"train_loss": -6.896203517913818, "global_step": 155933, "epoch": 3712} {"train_loss": -7.03771448135376, "global_step": 155934, "epoch": 3712} {"train_loss": -6.852392196655273, "global_step": 155935, "epoch": 3712} {"train_loss": -6.944284439086914, "global_step": 155936, "epoch": 3712} {"train_loss": -6.951484680175781, "global_step": 155937, "epoch": 3712} {"train_loss": -6.923955917358398, "global_step": 155938, "epoch": 3712} {"train_loss": -6.858658790588379, "global_step": 155939, "epoch": 3712} {"train_loss": -6.851167678833008, "global_step": 155940, "epoch": 3712} {"train_loss": -7.012054920196533, "global_step": 155941, "epoch": 3712} {"train_loss": -6.867536544799805, "global_step": 155942, "epoch": 3712} {"train_loss": -6.951296806335449, "global_step": 155943, "epoch": 3712} {"train_loss": -7.004403114318848, "global_step": 155944, "epoch": 3712} {"train_loss": -6.89411643573216, "global_step": 155945, "epoch": 3712, "val_loss": 68219.0546875} {"train_loss": -6.9486846923828125, "global_step": 155946, "epoch": 3713} {"train_loss": -6.970170974731445, "global_step": 155947, "epoch": 3713} {"train_loss": -6.891316890716553, "global_step": 155948, "epoch": 3713} {"train_loss": -6.939048767089844, "global_step": 155949, "epoch": 3713} {"train_loss": -6.832514762878418, "global_step": 155950, "epoch": 3713} {"train_loss": -6.942295551300049, "global_step": 155951, "epoch": 3713} {"train_loss": -6.825499534606934, "global_step": 155952, "epoch": 3713} {"train_loss": -6.959209442138672, "global_step": 155953, "epoch": 3713} {"train_loss": -6.859447956085205, "global_step": 155954, "epoch": 3713} {"train_loss": -6.922600746154785, "global_step": 155955, "epoch": 3713} {"train_loss": -6.951404571533203, "global_step": 155956, "epoch": 3713} {"train_loss": -6.888847351074219, "global_step": 155957, "epoch": 3713} {"train_loss": -6.867612838745117, "global_step": 155958, "epoch": 3713} {"train_loss": -6.892416954040527, "global_step": 155959, "epoch": 3713} {"train_loss": -6.902247428894043, "global_step": 155960, "epoch": 3713} {"train_loss": -6.944351673126221, "global_step": 155961, "epoch": 3713} {"train_loss": -6.965714454650879, "global_step": 155962, "epoch": 3713} {"train_loss": -6.894279956817627, "global_step": 155963, "epoch": 3713} {"train_loss": -6.9973859786987305, "global_step": 155964, "epoch": 3713} {"train_loss": -6.98005485534668, "global_step": 155965, "epoch": 3713} {"train_loss": -6.951258659362793, "global_step": 155966, "epoch": 3713} {"train_loss": -6.907214164733887, "global_step": 155967, "epoch": 3713} {"train_loss": -6.925444602966309, "global_step": 155968, "epoch": 3713} {"train_loss": -7.036555290222168, "global_step": 155969, "epoch": 3713} {"train_loss": -6.806116104125977, "global_step": 155970, "epoch": 3713} {"train_loss": -6.850701808929443, "global_step": 155971, "epoch": 3713} {"train_loss": -7.0457916259765625, "global_step": 155972, "epoch": 3713} {"train_loss": -6.94444465637207, "global_step": 155973, "epoch": 3713} {"train_loss": -6.959111213684082, "global_step": 155974, "epoch": 3713} {"train_loss": -6.901654243469238, "global_step": 155975, "epoch": 3713} {"train_loss": -6.943753719329834, "global_step": 155976, "epoch": 3713} {"train_loss": -6.837196350097656, "global_step": 155977, "epoch": 3713} {"train_loss": -7.069966793060303, "global_step": 155978, "epoch": 3713} {"train_loss": -6.88530969619751, "global_step": 155979, "epoch": 3713} {"train_loss": -6.910616874694824, "global_step": 155980, "epoch": 3713} {"train_loss": -6.987926959991455, "global_step": 155981, "epoch": 3713} {"train_loss": -6.95591926574707, "global_step": 155982, "epoch": 3713} {"train_loss": -6.911122798919678, "global_step": 155983, "epoch": 3713} {"train_loss": -6.870577335357666, "global_step": 155984, "epoch": 3713} {"train_loss": -6.795064926147461, "global_step": 155985, "epoch": 3713} {"train_loss": -6.826277256011963, "global_step": 155986, "epoch": 3713} {"train_loss": -6.91964814776466, "global_step": 155987, "epoch": 3713, "val_loss": 68327.4609375} {"train_loss": -6.960475444793701, "global_step": 155988, "epoch": 3714} {"train_loss": -6.9622721672058105, "global_step": 155989, "epoch": 3714} {"train_loss": -6.808982849121094, "global_step": 155990, "epoch": 3714} {"train_loss": -6.858443260192871, "global_step": 155991, "epoch": 3714} {"train_loss": -6.884272575378418, "global_step": 155992, "epoch": 3714} {"train_loss": -6.705355644226074, "global_step": 155993, "epoch": 3714} {"train_loss": -6.965792655944824, "global_step": 155994, "epoch": 3714} {"train_loss": -6.877388954162598, "global_step": 155995, "epoch": 3714} {"train_loss": -6.9882049560546875, "global_step": 155996, "epoch": 3714} {"train_loss": -6.8955078125, "global_step": 155997, "epoch": 3714} {"train_loss": -6.94926643371582, "global_step": 155998, "epoch": 3714} {"train_loss": -6.854445934295654, "global_step": 155999, "epoch": 3714} {"train_loss": -6.892852783203125, "global_step": 156000, "epoch": 3714} {"train_loss": -6.951565265655518, "global_step": 156001, "epoch": 3714} {"train_loss": -6.87923526763916, "global_step": 156002, "epoch": 3714} {"train_loss": -6.9688334465026855, "global_step": 156003, "epoch": 3714} {"train_loss": -6.880450248718262, "global_step": 156004, "epoch": 3714} {"train_loss": -6.805905818939209, "global_step": 156005, "epoch": 3714} {"train_loss": -6.896947860717773, "global_step": 156006, "epoch": 3714} {"train_loss": -6.814486503601074, "global_step": 156007, "epoch": 3714} {"train_loss": -6.878740310668945, "global_step": 156008, "epoch": 3714} {"train_loss": -6.886360168457031, "global_step": 156009, "epoch": 3714} {"train_loss": -6.907320022583008, "global_step": 156010, "epoch": 3714} {"train_loss": -7.052865505218506, "global_step": 156011, "epoch": 3714} {"train_loss": -6.958358287811279, "global_step": 156012, "epoch": 3714} {"train_loss": -6.94193172454834, "global_step": 156013, "epoch": 3714} {"train_loss": -6.912961959838867, "global_step": 156014, "epoch": 3714} {"train_loss": -6.90924596786499, "global_step": 156015, "epoch": 3714} {"train_loss": -6.865324020385742, "global_step": 156016, "epoch": 3714} {"train_loss": -6.80673885345459, "global_step": 156017, "epoch": 3714} {"train_loss": -7.002681732177734, "global_step": 156018, "epoch": 3714} {"train_loss": -7.01236629486084, "global_step": 156019, "epoch": 3714} {"train_loss": -6.854389667510986, "global_step": 156020, "epoch": 3714} {"train_loss": -6.901112079620361, "global_step": 156021, "epoch": 3714} {"train_loss": -6.795170783996582, "global_step": 156022, "epoch": 3714} {"train_loss": -6.869002819061279, "global_step": 156023, "epoch": 3714} {"train_loss": -6.8343305587768555, "global_step": 156024, "epoch": 3714} {"train_loss": -6.829732894897461, "global_step": 156025, "epoch": 3714} {"train_loss": -6.970480442047119, "global_step": 156026, "epoch": 3714} {"train_loss": -6.750535011291504, "global_step": 156027, "epoch": 3714} {"train_loss": -6.711761474609375, "global_step": 156028, "epoch": 3714} {"train_loss": -6.889259383791969, "global_step": 156029, "epoch": 3714, "val_loss": 68512.375} {"train_loss": -6.781425476074219, "global_step": 156030, "epoch": 3715} {"train_loss": -6.873622894287109, "global_step": 156031, "epoch": 3715} {"train_loss": -6.966728210449219, "global_step": 156032, "epoch": 3715} {"train_loss": -6.790718078613281, "global_step": 156033, "epoch": 3715} {"train_loss": -6.871225357055664, "global_step": 156034, "epoch": 3715} {"train_loss": -6.816864490509033, "global_step": 156035, "epoch": 3715} {"train_loss": -6.792343616485596, "global_step": 156036, "epoch": 3715} {"train_loss": -6.7990875244140625, "global_step": 156037, "epoch": 3715} {"train_loss": -6.915106773376465, "global_step": 156038, "epoch": 3715} {"train_loss": -6.712817192077637, "global_step": 156039, "epoch": 3715} {"train_loss": -6.899286270141602, "global_step": 156040, "epoch": 3715} {"train_loss": -6.803550720214844, "global_step": 156041, "epoch": 3715} {"train_loss": -6.743298053741455, "global_step": 156042, "epoch": 3715} {"train_loss": -7.034621715545654, "global_step": 156043, "epoch": 3715} {"train_loss": -6.901195526123047, "global_step": 156044, "epoch": 3715} {"train_loss": -6.882257461547852, "global_step": 156045, "epoch": 3715} {"train_loss": -6.765279769897461, "global_step": 156046, "epoch": 3715} {"train_loss": -6.723805904388428, "global_step": 156047, "epoch": 3715} {"train_loss": -6.9784040451049805, "global_step": 156048, "epoch": 3715} {"train_loss": -6.9059062004089355, "global_step": 156049, "epoch": 3715} {"train_loss": -6.820496559143066, "global_step": 156050, "epoch": 3715} {"train_loss": -6.929653167724609, "global_step": 156051, "epoch": 3715} {"train_loss": -6.847612380981445, "global_step": 156052, "epoch": 3715} {"train_loss": -6.847425937652588, "global_step": 156053, "epoch": 3715} {"train_loss": -6.884549140930176, "global_step": 156054, "epoch": 3715} {"train_loss": -6.834157466888428, "global_step": 156055, "epoch": 3715} {"train_loss": -6.895594596862793, "global_step": 156056, "epoch": 3715} {"train_loss": -6.844426155090332, "global_step": 156057, "epoch": 3715} {"train_loss": -6.857064247131348, "global_step": 156058, "epoch": 3715} {"train_loss": -6.936956882476807, "global_step": 156059, "epoch": 3715} {"train_loss": -6.878536224365234, "global_step": 156060, "epoch": 3715} {"train_loss": -6.910399436950684, "global_step": 156061, "epoch": 3715} {"train_loss": -6.940181255340576, "global_step": 156062, "epoch": 3715} {"train_loss": -6.861627101898193, "global_step": 156063, "epoch": 3715} {"train_loss": -6.852547645568848, "global_step": 156064, "epoch": 3715} {"train_loss": -6.9490227699279785, "global_step": 156065, "epoch": 3715} {"train_loss": -7.046748161315918, "global_step": 156066, "epoch": 3715} {"train_loss": -6.954435348510742, "global_step": 156067, "epoch": 3715} {"train_loss": -6.917447566986084, "global_step": 156068, "epoch": 3715} {"train_loss": -7.017930507659912, "global_step": 156069, "epoch": 3715} {"train_loss": -6.89379358291626, "global_step": 156070, "epoch": 3715} {"train_loss": -6.874673525492351, "global_step": 156071, "epoch": 3715, "val_loss": 68217.9453125} {"train_loss": -7.020620346069336, "global_step": 156072, "epoch": 3716} {"train_loss": -6.987354278564453, "global_step": 156073, "epoch": 3716} {"train_loss": -7.056857109069824, "global_step": 156074, "epoch": 3716} {"train_loss": -6.973323822021484, "global_step": 156075, "epoch": 3716} {"train_loss": -6.783751487731934, "global_step": 156076, "epoch": 3716} {"train_loss": -6.836172580718994, "global_step": 156077, "epoch": 3716} {"train_loss": -6.915466785430908, "global_step": 156078, "epoch": 3716} {"train_loss": -6.905306339263916, "global_step": 156079, "epoch": 3716} {"train_loss": -6.9409871101379395, "global_step": 156080, "epoch": 3716} {"train_loss": -6.929865837097168, "global_step": 156081, "epoch": 3716} {"train_loss": -6.846283912658691, "global_step": 156082, "epoch": 3716} {"train_loss": -6.752256870269775, "global_step": 156083, "epoch": 3716} {"train_loss": -6.940016746520996, "global_step": 156084, "epoch": 3716} {"train_loss": -6.8936591148376465, "global_step": 156085, "epoch": 3716} {"train_loss": -6.8779520988464355, "global_step": 156086, "epoch": 3716} {"train_loss": -6.957569122314453, "global_step": 156087, "epoch": 3716} {"train_loss": -6.714298248291016, "global_step": 156088, "epoch": 3716} {"train_loss": -6.881917953491211, "global_step": 156089, "epoch": 3716} {"train_loss": -6.903387546539307, "global_step": 156090, "epoch": 3716} {"train_loss": -6.847705841064453, "global_step": 156091, "epoch": 3716} {"train_loss": -6.84359073638916, "global_step": 156092, "epoch": 3716} {"train_loss": -6.987142562866211, "global_step": 156093, "epoch": 3716} {"train_loss": -6.802948951721191, "global_step": 156094, "epoch": 3716} {"train_loss": -6.929562568664551, "global_step": 156095, "epoch": 3716} {"train_loss": -6.968873023986816, "global_step": 156096, "epoch": 3716} {"train_loss": -6.854475021362305, "global_step": 156097, "epoch": 3716} {"train_loss": -6.840805530548096, "global_step": 156098, "epoch": 3716} {"train_loss": -6.820163726806641, "global_step": 156099, "epoch": 3716} {"train_loss": -6.99256706237793, "global_step": 156100, "epoch": 3716} {"train_loss": -6.9108099937438965, "global_step": 156101, "epoch": 3716} {"train_loss": -6.815062046051025, "global_step": 156102, "epoch": 3716} {"train_loss": -7.03529167175293, "global_step": 156103, "epoch": 3716} {"train_loss": -6.829598903656006, "global_step": 156104, "epoch": 3716} {"train_loss": -6.900892734527588, "global_step": 156105, "epoch": 3716} {"train_loss": -6.830095291137695, "global_step": 156106, "epoch": 3716} {"train_loss": -6.948887348175049, "global_step": 156107, "epoch": 3716} {"train_loss": -6.880096435546875, "global_step": 156108, "epoch": 3716} {"train_loss": -6.930507659912109, "global_step": 156109, "epoch": 3716} {"train_loss": -6.979080677032471, "global_step": 156110, "epoch": 3716} {"train_loss": -6.7890625, "global_step": 156111, "epoch": 3716} {"train_loss": -6.798440456390381, "global_step": 156112, "epoch": 3716} {"train_loss": -6.893439644858951, "global_step": 156113, "epoch": 3716, "val_loss": 68549.15625} {"train_loss": -6.754964828491211, "global_step": 156114, "epoch": 3717} {"train_loss": -6.798112392425537, "global_step": 156115, "epoch": 3717} {"train_loss": -6.942191123962402, "global_step": 156116, "epoch": 3717} {"train_loss": -6.8812150955200195, "global_step": 156117, "epoch": 3717} {"train_loss": -6.7839555740356445, "global_step": 156118, "epoch": 3717} {"train_loss": -6.841447353363037, "global_step": 156119, "epoch": 3717} {"train_loss": -6.887317657470703, "global_step": 156120, "epoch": 3717} {"train_loss": -6.796350955963135, "global_step": 156121, "epoch": 3717} {"train_loss": -6.882440567016602, "global_step": 156122, "epoch": 3717} {"train_loss": -6.792689323425293, "global_step": 156123, "epoch": 3717} {"train_loss": -6.683111190795898, "global_step": 156124, "epoch": 3717} {"train_loss": -6.902698516845703, "global_step": 156125, "epoch": 3717} {"train_loss": -6.849238395690918, "global_step": 156126, "epoch": 3717} {"train_loss": -6.9259538650512695, "global_step": 156127, "epoch": 3717} {"train_loss": -6.88389778137207, "global_step": 156128, "epoch": 3717} {"train_loss": -6.86225700378418, "global_step": 156129, "epoch": 3717} {"train_loss": -6.830049991607666, "global_step": 156130, "epoch": 3717} {"train_loss": -6.997869491577148, "global_step": 156131, "epoch": 3717} {"train_loss": -6.96568489074707, "global_step": 156132, "epoch": 3717} {"train_loss": -6.880701541900635, "global_step": 156133, "epoch": 3717} {"train_loss": -6.907986640930176, "global_step": 156134, "epoch": 3717} {"train_loss": -6.913331985473633, "global_step": 156135, "epoch": 3717} {"train_loss": -6.960240364074707, "global_step": 156136, "epoch": 3717} {"train_loss": -6.841923713684082, "global_step": 156137, "epoch": 3717} {"train_loss": -6.89350700378418, "global_step": 156138, "epoch": 3717} {"train_loss": -6.855425834655762, "global_step": 156139, "epoch": 3717} {"train_loss": -6.9022908210754395, "global_step": 156140, "epoch": 3717} {"train_loss": -7.002810955047607, "global_step": 156141, "epoch": 3717} {"train_loss": -6.927533149719238, "global_step": 156142, "epoch": 3717} {"train_loss": -6.92741584777832, "global_step": 156143, "epoch": 3717} {"train_loss": -7.022960662841797, "global_step": 156144, "epoch": 3717} {"train_loss": -6.997671604156494, "global_step": 156145, "epoch": 3717} {"train_loss": -6.861171722412109, "global_step": 156146, "epoch": 3717} {"train_loss": -6.920112609863281, "global_step": 156147, "epoch": 3717} {"train_loss": -6.832448959350586, "global_step": 156148, "epoch": 3717} {"train_loss": -6.841507911682129, "global_step": 156149, "epoch": 3717} {"train_loss": -6.852259635925293, "global_step": 156150, "epoch": 3717} {"train_loss": -7.014344215393066, "global_step": 156151, "epoch": 3717} {"train_loss": -6.950191497802734, "global_step": 156152, "epoch": 3717} {"train_loss": -6.9703874588012695, "global_step": 156153, "epoch": 3717} {"train_loss": -6.897805213928223, "global_step": 156154, "epoch": 3717} {"train_loss": -6.889682542710077, "global_step": 156155, "epoch": 3717, "val_loss": 68254.1015625} {"train_loss": -6.963356018066406, "global_step": 156156, "epoch": 3718} {"train_loss": -7.032566070556641, "global_step": 156157, "epoch": 3718} {"train_loss": -6.909940242767334, "global_step": 156158, "epoch": 3718} {"train_loss": -6.849758148193359, "global_step": 156159, "epoch": 3718} {"train_loss": -6.9307355880737305, "global_step": 156160, "epoch": 3718} {"train_loss": -6.923218250274658, "global_step": 156161, "epoch": 3718} {"train_loss": -6.922641754150391, "global_step": 156162, "epoch": 3718} {"train_loss": -6.910852432250977, "global_step": 156163, "epoch": 3718} {"train_loss": -6.939546585083008, "global_step": 156164, "epoch": 3718} {"train_loss": -7.048111915588379, "global_step": 156165, "epoch": 3718} {"train_loss": -6.978435039520264, "global_step": 156166, "epoch": 3718} {"train_loss": -6.934640884399414, "global_step": 156167, "epoch": 3718} {"train_loss": -7.0238494873046875, "global_step": 156168, "epoch": 3718} {"train_loss": -6.8265533447265625, "global_step": 156169, "epoch": 3718} {"train_loss": -7.018250465393066, "global_step": 156170, "epoch": 3718} {"train_loss": -6.868464469909668, "global_step": 156171, "epoch": 3718} {"train_loss": -6.997426986694336, "global_step": 156172, "epoch": 3718} {"train_loss": -6.98286247253418, "global_step": 156173, "epoch": 3718} {"train_loss": -6.982219696044922, "global_step": 156174, "epoch": 3718} {"train_loss": -7.004136085510254, "global_step": 156175, "epoch": 3718} {"train_loss": -6.939700126647949, "global_step": 156176, "epoch": 3718} {"train_loss": -6.9652814865112305, "global_step": 156177, "epoch": 3718} {"train_loss": -6.796067714691162, "global_step": 156178, "epoch": 3718} {"train_loss": -6.882396697998047, "global_step": 156179, "epoch": 3718} {"train_loss": -6.901174545288086, "global_step": 156180, "epoch": 3718} {"train_loss": -6.91464900970459, "global_step": 156181, "epoch": 3718} {"train_loss": -6.994089126586914, "global_step": 156182, "epoch": 3718} {"train_loss": -6.953129768371582, "global_step": 156183, "epoch": 3718} {"train_loss": -6.864034175872803, "global_step": 156184, "epoch": 3718} {"train_loss": -6.839266777038574, "global_step": 156185, "epoch": 3718} {"train_loss": -6.956154823303223, "global_step": 156186, "epoch": 3718} {"train_loss": -7.003724098205566, "global_step": 156187, "epoch": 3718} {"train_loss": -6.936214447021484, "global_step": 156188, "epoch": 3718} {"train_loss": -6.912666320800781, "global_step": 156189, "epoch": 3718} {"train_loss": -6.9373345375061035, "global_step": 156190, "epoch": 3718} {"train_loss": -6.964740753173828, "global_step": 156191, "epoch": 3718} {"train_loss": -6.928098678588867, "global_step": 156192, "epoch": 3718} {"train_loss": -6.967036247253418, "global_step": 156193, "epoch": 3718} {"train_loss": -6.883090019226074, "global_step": 156194, "epoch": 3718} {"train_loss": -6.92732048034668, "global_step": 156195, "epoch": 3718} {"train_loss": -6.9299726486206055, "global_step": 156196, "epoch": 3718} {"train_loss": -6.937823715664091, "global_step": 156197, "epoch": 3718, "val_loss": 68280.71875} {"train_loss": -6.921939849853516, "global_step": 156198, "epoch": 3719} {"train_loss": -6.852317810058594, "global_step": 156199, "epoch": 3719} {"train_loss": -6.789740085601807, "global_step": 156200, "epoch": 3719} {"train_loss": -6.873751640319824, "global_step": 156201, "epoch": 3719} {"train_loss": -6.864188194274902, "global_step": 156202, "epoch": 3719} {"train_loss": -6.699904441833496, "global_step": 156203, "epoch": 3719} {"train_loss": -6.930841445922852, "global_step": 156204, "epoch": 3719} {"train_loss": -6.977074146270752, "global_step": 156205, "epoch": 3719} {"train_loss": -6.945230960845947, "global_step": 156206, "epoch": 3719} {"train_loss": -6.889925003051758, "global_step": 156207, "epoch": 3719} {"train_loss": -6.821900844573975, "global_step": 156208, "epoch": 3719} {"train_loss": -6.895503044128418, "global_step": 156209, "epoch": 3719} {"train_loss": -6.8429856300354, "global_step": 156210, "epoch": 3719} {"train_loss": -6.873505592346191, "global_step": 156211, "epoch": 3719} {"train_loss": -6.808333873748779, "global_step": 156212, "epoch": 3719} {"train_loss": -6.820060729980469, "global_step": 156213, "epoch": 3719} {"train_loss": -6.969993591308594, "global_step": 156214, "epoch": 3719} {"train_loss": -6.858963489532471, "global_step": 156215, "epoch": 3719} {"train_loss": -6.88157320022583, "global_step": 156216, "epoch": 3719} {"train_loss": -6.856670379638672, "global_step": 156217, "epoch": 3719} {"train_loss": -6.840663909912109, "global_step": 156218, "epoch": 3719} {"train_loss": -6.9129862785339355, "global_step": 156219, "epoch": 3719} {"train_loss": -6.865013599395752, "global_step": 156220, "epoch": 3719} {"train_loss": -7.00834846496582, "global_step": 156221, "epoch": 3719} {"train_loss": -6.831827640533447, "global_step": 156222, "epoch": 3719} {"train_loss": -6.932785511016846, "global_step": 156223, "epoch": 3719} {"train_loss": -6.938232898712158, "global_step": 156224, "epoch": 3719} {"train_loss": -6.972860813140869, "global_step": 156225, "epoch": 3719} {"train_loss": -6.962951183319092, "global_step": 156226, "epoch": 3719} {"train_loss": -6.768050670623779, "global_step": 156227, "epoch": 3719} {"train_loss": -6.975835800170898, "global_step": 156228, "epoch": 3719} {"train_loss": -6.917725086212158, "global_step": 156229, "epoch": 3719} {"train_loss": -7.079565048217773, "global_step": 156230, "epoch": 3719} {"train_loss": -6.929457664489746, "global_step": 156231, "epoch": 3719} {"train_loss": -6.858720779418945, "global_step": 156232, "epoch": 3719} {"train_loss": -6.961337089538574, "global_step": 156233, "epoch": 3719} {"train_loss": -6.897463798522949, "global_step": 156234, "epoch": 3719} {"train_loss": -6.753304481506348, "global_step": 156235, "epoch": 3719} {"train_loss": -6.801236152648926, "global_step": 156236, "epoch": 3719} {"train_loss": -6.817790985107422, "global_step": 156237, "epoch": 3719} {"train_loss": -6.831442356109619, "global_step": 156238, "epoch": 3719} {"train_loss": -6.883434011822655, "global_step": 156239, "epoch": 3719, "val_loss": 68431.234375} {"train_loss": -6.877976894378662, "global_step": 156240, "epoch": 3720} {"train_loss": -6.790461540222168, "global_step": 156241, "epoch": 3720} {"train_loss": -6.939436912536621, "global_step": 156242, "epoch": 3720} {"train_loss": -6.83915901184082, "global_step": 156243, "epoch": 3720} {"train_loss": -6.805280685424805, "global_step": 156244, "epoch": 3720} {"train_loss": -6.95111083984375, "global_step": 156245, "epoch": 3720} {"train_loss": -7.006278038024902, "global_step": 156246, "epoch": 3720} {"train_loss": -6.8652262687683105, "global_step": 156247, "epoch": 3720} {"train_loss": -6.945171356201172, "global_step": 156248, "epoch": 3720} {"train_loss": -6.890992164611816, "global_step": 156249, "epoch": 3720} {"train_loss": -6.929611682891846, "global_step": 156250, "epoch": 3720} {"train_loss": -6.967646598815918, "global_step": 156251, "epoch": 3720} {"train_loss": -6.972789764404297, "global_step": 156252, "epoch": 3720} {"train_loss": -6.925512790679932, "global_step": 156253, "epoch": 3720} {"train_loss": -6.941291809082031, "global_step": 156254, "epoch": 3720} {"train_loss": -6.94770622253418, "global_step": 156255, "epoch": 3720} {"train_loss": -7.108262062072754, "global_step": 156256, "epoch": 3720} {"train_loss": -6.984214782714844, "global_step": 156257, "epoch": 3720} {"train_loss": -6.964293003082275, "global_step": 156258, "epoch": 3720} {"train_loss": -6.940011024475098, "global_step": 156259, "epoch": 3720} {"train_loss": -6.963838577270508, "global_step": 156260, "epoch": 3720} {"train_loss": -6.807486534118652, "global_step": 156261, "epoch": 3720} {"train_loss": -6.892750263214111, "global_step": 156262, "epoch": 3720} {"train_loss": -6.922107696533203, "global_step": 156263, "epoch": 3720} {"train_loss": -7.0040364265441895, "global_step": 156264, "epoch": 3720} {"train_loss": -6.9340105056762695, "global_step": 156265, "epoch": 3720} {"train_loss": -6.856059551239014, "global_step": 156266, "epoch": 3720} {"train_loss": -6.8161702156066895, "global_step": 156267, "epoch": 3720} {"train_loss": -6.98396110534668, "global_step": 156268, "epoch": 3720} {"train_loss": -7.017599105834961, "global_step": 156269, "epoch": 3720} {"train_loss": -6.881435394287109, "global_step": 156270, "epoch": 3720} {"train_loss": -6.850865364074707, "global_step": 156271, "epoch": 3720} {"train_loss": -6.886884689331055, "global_step": 156272, "epoch": 3720} {"train_loss": -6.955385208129883, "global_step": 156273, "epoch": 3720} {"train_loss": -6.929073810577393, "global_step": 156274, "epoch": 3720} {"train_loss": -6.8861236572265625, "global_step": 156275, "epoch": 3720} {"train_loss": -6.93632173538208, "global_step": 156276, "epoch": 3720} {"train_loss": -6.9287567138671875, "global_step": 156277, "epoch": 3720} {"train_loss": -6.832297325134277, "global_step": 156278, "epoch": 3720} {"train_loss": -6.985857963562012, "global_step": 156279, "epoch": 3720} {"train_loss": -6.943807601928711, "global_step": 156280, "epoch": 3720} {"train_loss": -6.920888594218662, "global_step": 156281, "epoch": 3720, "val_loss": 68279.2421875} {"train_loss": -6.775697708129883, "global_step": 156282, "epoch": 3721} {"train_loss": -6.870640754699707, "global_step": 156283, "epoch": 3721} {"train_loss": -6.925578594207764, "global_step": 156284, "epoch": 3721} {"train_loss": -6.78712797164917, "global_step": 156285, "epoch": 3721} {"train_loss": -6.925620079040527, "global_step": 156286, "epoch": 3721} {"train_loss": -6.873456001281738, "global_step": 156287, "epoch": 3721} {"train_loss": -6.930637359619141, "global_step": 156288, "epoch": 3721} {"train_loss": -6.903524398803711, "global_step": 156289, "epoch": 3721} {"train_loss": -6.894328594207764, "global_step": 156290, "epoch": 3721} {"train_loss": -6.862527847290039, "global_step": 156291, "epoch": 3721} {"train_loss": -6.883456230163574, "global_step": 156292, "epoch": 3721} {"train_loss": -6.930421352386475, "global_step": 156293, "epoch": 3721} {"train_loss": -7.053709506988525, "global_step": 156294, "epoch": 3721} {"train_loss": -6.871535778045654, "global_step": 156295, "epoch": 3721} {"train_loss": -6.926169395446777, "global_step": 156296, "epoch": 3721} {"train_loss": -6.9464263916015625, "global_step": 156297, "epoch": 3721} {"train_loss": -6.888863563537598, "global_step": 156298, "epoch": 3721} {"train_loss": -6.919536590576172, "global_step": 156299, "epoch": 3721} {"train_loss": -6.969124794006348, "global_step": 156300, "epoch": 3721} {"train_loss": -6.961155891418457, "global_step": 156301, "epoch": 3721} {"train_loss": -6.958897590637207, "global_step": 156302, "epoch": 3721} {"train_loss": -6.874192237854004, "global_step": 156303, "epoch": 3721} {"train_loss": -6.930959701538086, "global_step": 156304, "epoch": 3721} {"train_loss": -6.840237617492676, "global_step": 156305, "epoch": 3721} {"train_loss": -7.014917373657227, "global_step": 156306, "epoch": 3721} {"train_loss": -6.999847412109375, "global_step": 156307, "epoch": 3721} {"train_loss": -6.9403886795043945, "global_step": 156308, "epoch": 3721} {"train_loss": -6.928560256958008, "global_step": 156309, "epoch": 3721} {"train_loss": -6.911180019378662, "global_step": 156310, "epoch": 3721} {"train_loss": -6.8952484130859375, "global_step": 156311, "epoch": 3721} {"train_loss": -6.930044651031494, "global_step": 156312, "epoch": 3721} {"train_loss": -6.963084697723389, "global_step": 156313, "epoch": 3721} {"train_loss": -6.967887878417969, "global_step": 156314, "epoch": 3721} {"train_loss": -6.814395904541016, "global_step": 156315, "epoch": 3721} {"train_loss": -6.956653594970703, "global_step": 156316, "epoch": 3721} {"train_loss": -6.873019218444824, "global_step": 156317, "epoch": 3721} {"train_loss": -6.9332275390625, "global_step": 156318, "epoch": 3721} {"train_loss": -6.963033676147461, "global_step": 156319, "epoch": 3721} {"train_loss": -7.016727924346924, "global_step": 156320, "epoch": 3721} {"train_loss": -6.851187705993652, "global_step": 156321, "epoch": 3721} {"train_loss": -6.909295082092285, "global_step": 156322, "epoch": 3721} {"train_loss": -6.917194956824893, "global_step": 156323, "epoch": 3721, "val_loss": 68339.1328125} {"train_loss": -6.989469528198242, "global_step": 156324, "epoch": 3722} {"train_loss": -7.048320293426514, "global_step": 156325, "epoch": 3722} {"train_loss": -6.939897537231445, "global_step": 156326, "epoch": 3722} {"train_loss": -6.9448652267456055, "global_step": 156327, "epoch": 3722} {"train_loss": -6.8942718505859375, "global_step": 156328, "epoch": 3722} {"train_loss": -6.94123649597168, "global_step": 156329, "epoch": 3722} {"train_loss": -6.906440734863281, "global_step": 156330, "epoch": 3722} {"train_loss": -6.910687446594238, "global_step": 156331, "epoch": 3722} {"train_loss": -6.932695388793945, "global_step": 156332, "epoch": 3722} {"train_loss": -6.859159469604492, "global_step": 156333, "epoch": 3722} {"train_loss": -6.929207801818848, "global_step": 156334, "epoch": 3722} {"train_loss": -6.928067207336426, "global_step": 156335, "epoch": 3722} {"train_loss": -6.893833160400391, "global_step": 156336, "epoch": 3722} {"train_loss": -6.871438026428223, "global_step": 156337, "epoch": 3722} {"train_loss": -6.882417678833008, "global_step": 156338, "epoch": 3722} {"train_loss": -7.019571304321289, "global_step": 156339, "epoch": 3722} {"train_loss": -6.990786075592041, "global_step": 156340, "epoch": 3722} {"train_loss": -6.929730415344238, "global_step": 156341, "epoch": 3722} {"train_loss": -6.972451210021973, "global_step": 156342, "epoch": 3722} {"train_loss": -6.907064437866211, "global_step": 156343, "epoch": 3722} {"train_loss": -6.951341152191162, "global_step": 156344, "epoch": 3722} {"train_loss": -6.974296569824219, "global_step": 156345, "epoch": 3722} {"train_loss": -6.9923319816589355, "global_step": 156346, "epoch": 3722} {"train_loss": -6.988067626953125, "global_step": 156347, "epoch": 3722} {"train_loss": -6.872315883636475, "global_step": 156348, "epoch": 3722} {"train_loss": -6.862304210662842, "global_step": 156349, "epoch": 3722} {"train_loss": -6.880424976348877, "global_step": 156350, "epoch": 3722} {"train_loss": -6.967830657958984, "global_step": 156351, "epoch": 3722} {"train_loss": -6.936244010925293, "global_step": 156352, "epoch": 3722} {"train_loss": -6.93827486038208, "global_step": 156353, "epoch": 3722} {"train_loss": -6.855118751525879, "global_step": 156354, "epoch": 3722} {"train_loss": -6.846062660217285, "global_step": 156355, "epoch": 3722} {"train_loss": -6.909855365753174, "global_step": 156356, "epoch": 3722} {"train_loss": -6.916025161743164, "global_step": 156357, "epoch": 3722} {"train_loss": -6.759455680847168, "global_step": 156358, "epoch": 3722} {"train_loss": -6.86572265625, "global_step": 156359, "epoch": 3722} {"train_loss": -6.9001874923706055, "global_step": 156360, "epoch": 3722} {"train_loss": -6.9554595947265625, "global_step": 156361, "epoch": 3722} {"train_loss": -7.0087738037109375, "global_step": 156362, "epoch": 3722} {"train_loss": -6.889990329742432, "global_step": 156363, "epoch": 3722} {"train_loss": -6.993505477905273, "global_step": 156364, "epoch": 3722} {"train_loss": -6.92665635971796, "global_step": 156365, "epoch": 3722, "val_loss": 68528.7734375} {"train_loss": -6.913576126098633, "global_step": 156366, "epoch": 3723} {"train_loss": -6.9211812019348145, "global_step": 156367, "epoch": 3723} {"train_loss": -6.9450788497924805, "global_step": 156368, "epoch": 3723} {"train_loss": -6.947229385375977, "global_step": 156369, "epoch": 3723} {"train_loss": -7.02824068069458, "global_step": 156370, "epoch": 3723} {"train_loss": -7.006477355957031, "global_step": 156371, "epoch": 3723} {"train_loss": -6.908072471618652, "global_step": 156372, "epoch": 3723} {"train_loss": -6.893842697143555, "global_step": 156373, "epoch": 3723} {"train_loss": -6.859096527099609, "global_step": 156374, "epoch": 3723} {"train_loss": -7.027407646179199, "global_step": 156375, "epoch": 3723} {"train_loss": -6.970440864562988, "global_step": 156376, "epoch": 3723} {"train_loss": -6.9766998291015625, "global_step": 156377, "epoch": 3723} {"train_loss": -6.845172882080078, "global_step": 156378, "epoch": 3723} {"train_loss": -6.9047136306762695, "global_step": 156379, "epoch": 3723} {"train_loss": -6.865168571472168, "global_step": 156380, "epoch": 3723} {"train_loss": -6.917165756225586, "global_step": 156381, "epoch": 3723} {"train_loss": -6.837909698486328, "global_step": 156382, "epoch": 3723} {"train_loss": -6.963502883911133, "global_step": 156383, "epoch": 3723} {"train_loss": -6.906149387359619, "global_step": 156384, "epoch": 3723} {"train_loss": -6.8567914962768555, "global_step": 156385, "epoch": 3723} {"train_loss": -6.956143856048584, "global_step": 156386, "epoch": 3723} {"train_loss": -6.932142734527588, "global_step": 156387, "epoch": 3723} {"train_loss": -6.9509782791137695, "global_step": 156388, "epoch": 3723} {"train_loss": -7.083512306213379, "global_step": 156389, "epoch": 3723} {"train_loss": -6.998136520385742, "global_step": 156390, "epoch": 3723} {"train_loss": -6.886834144592285, "global_step": 156391, "epoch": 3723} {"train_loss": -6.8081512451171875, "global_step": 156392, "epoch": 3723} {"train_loss": -7.020485877990723, "global_step": 156393, "epoch": 3723} {"train_loss": -6.899906158447266, "global_step": 156394, "epoch": 3723} {"train_loss": -6.863944053649902, "global_step": 156395, "epoch": 3723} {"train_loss": -6.875655174255371, "global_step": 156396, "epoch": 3723} {"train_loss": -6.754998207092285, "global_step": 156397, "epoch": 3723} {"train_loss": -6.98734712600708, "global_step": 156398, "epoch": 3723} {"train_loss": -6.934760093688965, "global_step": 156399, "epoch": 3723} {"train_loss": -6.780489921569824, "global_step": 156400, "epoch": 3723} {"train_loss": -6.844632148742676, "global_step": 156401, "epoch": 3723} {"train_loss": -6.707869529724121, "global_step": 156402, "epoch": 3723} {"train_loss": -6.877978324890137, "global_step": 156403, "epoch": 3723} {"train_loss": -6.843870162963867, "global_step": 156404, "epoch": 3723} {"train_loss": -6.8282623291015625, "global_step": 156405, "epoch": 3723} {"train_loss": -6.846142768859863, "global_step": 156406, "epoch": 3723} {"train_loss": -6.902434894016811, "global_step": 156407, "epoch": 3723, "val_loss": 68440.546875} {"train_loss": -6.656290531158447, "global_step": 156408, "epoch": 3724} {"train_loss": -6.782093048095703, "global_step": 156409, "epoch": 3724} {"train_loss": -6.762320518493652, "global_step": 156410, "epoch": 3724} {"train_loss": -6.861562728881836, "global_step": 156411, "epoch": 3724} {"train_loss": -6.801015853881836, "global_step": 156412, "epoch": 3724} {"train_loss": -6.713150978088379, "global_step": 156413, "epoch": 3724} {"train_loss": -6.928863048553467, "global_step": 156414, "epoch": 3724} {"train_loss": -6.668057441711426, "global_step": 156415, "epoch": 3724} {"train_loss": -6.83765983581543, "global_step": 156416, "epoch": 3724} {"train_loss": -6.833431243896484, "global_step": 156417, "epoch": 3724} {"train_loss": -6.8004865646362305, "global_step": 156418, "epoch": 3724} {"train_loss": -6.977272987365723, "global_step": 156419, "epoch": 3724} {"train_loss": -6.84295129776001, "global_step": 156420, "epoch": 3724} {"train_loss": -6.865416049957275, "global_step": 156421, "epoch": 3724} {"train_loss": -6.841012954711914, "global_step": 156422, "epoch": 3724} {"train_loss": -6.84702205657959, "global_step": 156423, "epoch": 3724} {"train_loss": -6.836112022399902, "global_step": 156424, "epoch": 3724} {"train_loss": -6.8922529220581055, "global_step": 156425, "epoch": 3724} {"train_loss": -6.9364423751831055, "global_step": 156426, "epoch": 3724} {"train_loss": -6.895379066467285, "global_step": 156427, "epoch": 3724} {"train_loss": -6.9178876876831055, "global_step": 156428, "epoch": 3724} {"train_loss": -6.8737969398498535, "global_step": 156429, "epoch": 3724} {"train_loss": -6.93325138092041, "global_step": 156430, "epoch": 3724} {"train_loss": -6.911299228668213, "global_step": 156431, "epoch": 3724} {"train_loss": -6.891286849975586, "global_step": 156432, "epoch": 3724} {"train_loss": -6.947402000427246, "global_step": 156433, "epoch": 3724} {"train_loss": -6.920706748962402, "global_step": 156434, "epoch": 3724} {"train_loss": -6.960028648376465, "global_step": 156435, "epoch": 3724} {"train_loss": -6.955015182495117, "global_step": 156436, "epoch": 3724} {"train_loss": -6.8493499755859375, "global_step": 156437, "epoch": 3724} {"train_loss": -6.889044284820557, "global_step": 156438, "epoch": 3724} {"train_loss": -6.948022365570068, "global_step": 156439, "epoch": 3724} {"train_loss": -6.888443470001221, "global_step": 156440, "epoch": 3724} {"train_loss": -6.954449653625488, "global_step": 156441, "epoch": 3724} {"train_loss": -6.894891738891602, "global_step": 156442, "epoch": 3724} {"train_loss": -6.833556175231934, "global_step": 156443, "epoch": 3724} {"train_loss": -6.856300354003906, "global_step": 156444, "epoch": 3724} {"train_loss": -6.887067794799805, "global_step": 156445, "epoch": 3724} {"train_loss": -6.8224263191223145, "global_step": 156446, "epoch": 3724} {"train_loss": -6.880336284637451, "global_step": 156447, "epoch": 3724} {"train_loss": -6.934542179107666, "global_step": 156448, "epoch": 3724} {"train_loss": -6.86618987719218, "global_step": 156449, "epoch": 3724, "val_loss": 68325.0078125} {"train_loss": -6.955557823181152, "global_step": 156450, "epoch": 3725} {"train_loss": -6.950695991516113, "global_step": 156451, "epoch": 3725} {"train_loss": -6.893277168273926, "global_step": 156452, "epoch": 3725} {"train_loss": -6.911077976226807, "global_step": 156453, "epoch": 3725} {"train_loss": -6.944045543670654, "global_step": 156454, "epoch": 3725} {"train_loss": -6.928330421447754, "global_step": 156455, "epoch": 3725} {"train_loss": -6.871523857116699, "global_step": 156456, "epoch": 3725} {"train_loss": -6.815980911254883, "global_step": 156457, "epoch": 3725} {"train_loss": -6.850372314453125, "global_step": 156458, "epoch": 3725} {"train_loss": -6.902313232421875, "global_step": 156459, "epoch": 3725} {"train_loss": -6.967211723327637, "global_step": 156460, "epoch": 3725} {"train_loss": -6.720516204833984, "global_step": 156461, "epoch": 3725} {"train_loss": -6.9020233154296875, "global_step": 156462, "epoch": 3725} {"train_loss": -6.912698745727539, "global_step": 156463, "epoch": 3725} {"train_loss": -6.941232681274414, "global_step": 156464, "epoch": 3725} {"train_loss": -6.851864814758301, "global_step": 156465, "epoch": 3725} {"train_loss": -6.996773719787598, "global_step": 156466, "epoch": 3725} {"train_loss": -6.842280387878418, "global_step": 156467, "epoch": 3725} {"train_loss": -6.8090410232543945, "global_step": 156468, "epoch": 3725} {"train_loss": -6.939330101013184, "global_step": 156469, "epoch": 3725} {"train_loss": -6.901312351226807, "global_step": 156470, "epoch": 3725} {"train_loss": -6.932345867156982, "global_step": 156471, "epoch": 3725} {"train_loss": -6.9757399559021, "global_step": 156472, "epoch": 3725} {"train_loss": -6.983608245849609, "global_step": 156473, "epoch": 3725} {"train_loss": -6.928694248199463, "global_step": 156474, "epoch": 3725} {"train_loss": -6.832090377807617, "global_step": 156475, "epoch": 3725} {"train_loss": -6.924262523651123, "global_step": 156476, "epoch": 3725} {"train_loss": -6.9925127029418945, "global_step": 156477, "epoch": 3725} {"train_loss": -6.888518333435059, "global_step": 156478, "epoch": 3725} {"train_loss": -6.957748889923096, "global_step": 156479, "epoch": 3725} {"train_loss": -6.972048759460449, "global_step": 156480, "epoch": 3725} {"train_loss": -7.041903495788574, "global_step": 156481, "epoch": 3725} {"train_loss": -6.931423187255859, "global_step": 156482, "epoch": 3725} {"train_loss": -6.888333320617676, "global_step": 156483, "epoch": 3725} {"train_loss": -6.821706771850586, "global_step": 156484, "epoch": 3725} {"train_loss": -6.982513427734375, "global_step": 156485, "epoch": 3725} {"train_loss": -7.025876045227051, "global_step": 156486, "epoch": 3725} {"train_loss": -6.92271614074707, "global_step": 156487, "epoch": 3725} {"train_loss": -6.896919250488281, "global_step": 156488, "epoch": 3725} {"train_loss": -6.950729846954346, "global_step": 156489, "epoch": 3725} {"train_loss": -6.968644618988037, "global_step": 156490, "epoch": 3725} {"train_loss": -6.91989955447969, "global_step": 156491, "epoch": 3725, "val_loss": 68344.0625} {"train_loss": -6.969253063201904, "global_step": 156492, "epoch": 3726} {"train_loss": -7.029398441314697, "global_step": 156493, "epoch": 3726} {"train_loss": -6.945134162902832, "global_step": 156494, "epoch": 3726} {"train_loss": -6.81346321105957, "global_step": 156495, "epoch": 3726} {"train_loss": -7.012106895446777, "global_step": 156496, "epoch": 3726} {"train_loss": -7.085695743560791, "global_step": 156497, "epoch": 3726} {"train_loss": -6.952040672302246, "global_step": 156498, "epoch": 3726} {"train_loss": -6.942131042480469, "global_step": 156499, "epoch": 3726} {"train_loss": -6.9803547859191895, "global_step": 156500, "epoch": 3726} {"train_loss": -6.96098518371582, "global_step": 156501, "epoch": 3726} {"train_loss": -6.96105432510376, "global_step": 156502, "epoch": 3726} {"train_loss": -6.938232421875, "global_step": 156503, "epoch": 3726} {"train_loss": -6.989371299743652, "global_step": 156504, "epoch": 3726} {"train_loss": -6.906435489654541, "global_step": 156505, "epoch": 3726} {"train_loss": -6.995896339416504, "global_step": 156506, "epoch": 3726} {"train_loss": -7.05826997756958, "global_step": 156507, "epoch": 3726} {"train_loss": -7.010402202606201, "global_step": 156508, "epoch": 3726} {"train_loss": -7.018722057342529, "global_step": 156509, "epoch": 3726} {"train_loss": -6.967932224273682, "global_step": 156510, "epoch": 3726} {"train_loss": -6.89168643951416, "global_step": 156511, "epoch": 3726} {"train_loss": -6.909010887145996, "global_step": 156512, "epoch": 3726} {"train_loss": -6.93011474609375, "global_step": 156513, "epoch": 3726} {"train_loss": -7.00222110748291, "global_step": 156514, "epoch": 3726} {"train_loss": -6.952382564544678, "global_step": 156515, "epoch": 3726} {"train_loss": -6.93002986907959, "global_step": 156516, "epoch": 3726} {"train_loss": -7.009647369384766, "global_step": 156517, "epoch": 3726} {"train_loss": -6.840643882751465, "global_step": 156518, "epoch": 3726} {"train_loss": -6.857513427734375, "global_step": 156519, "epoch": 3726} {"train_loss": -6.885878562927246, "global_step": 156520, "epoch": 3726} {"train_loss": -6.918586730957031, "global_step": 156521, "epoch": 3726} {"train_loss": -6.924490928649902, "global_step": 156522, "epoch": 3726} {"train_loss": -6.994627952575684, "global_step": 156523, "epoch": 3726} {"train_loss": -6.85152530670166, "global_step": 156524, "epoch": 3726} {"train_loss": -6.741347312927246, "global_step": 156525, "epoch": 3726} {"train_loss": -6.844164848327637, "global_step": 156526, "epoch": 3726} {"train_loss": -6.98781681060791, "global_step": 156527, "epoch": 3726} {"train_loss": -6.816471099853516, "global_step": 156528, "epoch": 3726} {"train_loss": -6.871234893798828, "global_step": 156529, "epoch": 3726} {"train_loss": -6.871481895446777, "global_step": 156530, "epoch": 3726} {"train_loss": -6.972149848937988, "global_step": 156531, "epoch": 3726} {"train_loss": -6.814258575439453, "global_step": 156532, "epoch": 3726} {"train_loss": -6.934462785720825, "global_step": 156533, "epoch": 3726, "val_loss": 68507.0} {"train_loss": -6.880046844482422, "global_step": 156534, "epoch": 3727} {"train_loss": -6.913354873657227, "global_step": 156535, "epoch": 3727} {"train_loss": -6.891703128814697, "global_step": 156536, "epoch": 3727} {"train_loss": -6.729825973510742, "global_step": 156537, "epoch": 3727} {"train_loss": -6.941540241241455, "global_step": 156538, "epoch": 3727} {"train_loss": -6.744277000427246, "global_step": 156539, "epoch": 3727} {"train_loss": -6.776276588439941, "global_step": 156540, "epoch": 3727} {"train_loss": -6.7669901847839355, "global_step": 156541, "epoch": 3727} {"train_loss": -6.684259414672852, "global_step": 156542, "epoch": 3727} {"train_loss": -6.827888488769531, "global_step": 156543, "epoch": 3727} {"train_loss": -6.689159870147705, "global_step": 156544, "epoch": 3727} {"train_loss": -6.718008041381836, "global_step": 156545, "epoch": 3727} {"train_loss": -6.892130374908447, "global_step": 156546, "epoch": 3727} {"train_loss": -6.7658281326293945, "global_step": 156547, "epoch": 3727} {"train_loss": -6.981978416442871, "global_step": 156548, "epoch": 3727} {"train_loss": -6.706082344055176, "global_step": 156549, "epoch": 3727} {"train_loss": -6.852466583251953, "global_step": 156550, "epoch": 3727} {"train_loss": -6.943710803985596, "global_step": 156551, "epoch": 3727} {"train_loss": -6.661069393157959, "global_step": 156552, "epoch": 3727} {"train_loss": -6.783126354217529, "global_step": 156553, "epoch": 3727} {"train_loss": -6.806300640106201, "global_step": 156554, "epoch": 3727} {"train_loss": -6.843989849090576, "global_step": 156555, "epoch": 3727} {"train_loss": -6.877628326416016, "global_step": 156556, "epoch": 3727} {"train_loss": -6.91505241394043, "global_step": 156557, "epoch": 3727} {"train_loss": -6.903140544891357, "global_step": 156558, "epoch": 3727} {"train_loss": -6.874200344085693, "global_step": 156559, "epoch": 3727} {"train_loss": -6.957706928253174, "global_step": 156560, "epoch": 3727} {"train_loss": -6.955595016479492, "global_step": 156561, "epoch": 3727} {"train_loss": -6.923262596130371, "global_step": 156562, "epoch": 3727} {"train_loss": -6.938724517822266, "global_step": 156563, "epoch": 3727} {"train_loss": -6.991455078125, "global_step": 156564, "epoch": 3727} {"train_loss": -6.860635757446289, "global_step": 156565, "epoch": 3727} {"train_loss": -6.94210147857666, "global_step": 156566, "epoch": 3727} {"train_loss": -6.867892265319824, "global_step": 156567, "epoch": 3727} {"train_loss": -6.842910289764404, "global_step": 156568, "epoch": 3727} {"train_loss": -6.932634353637695, "global_step": 156569, "epoch": 3727} {"train_loss": -6.837228775024414, "global_step": 156570, "epoch": 3727} {"train_loss": -6.922033786773682, "global_step": 156571, "epoch": 3727} {"train_loss": -6.858308792114258, "global_step": 156572, "epoch": 3727} {"train_loss": -6.792752265930176, "global_step": 156573, "epoch": 3727} {"train_loss": -6.886022090911865, "global_step": 156574, "epoch": 3727} {"train_loss": -6.851217973799932, "global_step": 156575, "epoch": 3727, "val_loss": 68580.921875} {"train_loss": -6.762768745422363, "global_step": 156576, "epoch": 3728} {"train_loss": -6.938874244689941, "global_step": 156577, "epoch": 3728} {"train_loss": -6.800513744354248, "global_step": 156578, "epoch": 3728} {"train_loss": -6.97810697555542, "global_step": 156579, "epoch": 3728} {"train_loss": -6.85141658782959, "global_step": 156580, "epoch": 3728} {"train_loss": -6.799991607666016, "global_step": 156581, "epoch": 3728} {"train_loss": -6.9362359046936035, "global_step": 156582, "epoch": 3728} {"train_loss": -6.87216329574585, "global_step": 156583, "epoch": 3728} {"train_loss": -6.97122859954834, "global_step": 156584, "epoch": 3728} {"train_loss": -6.980584144592285, "global_step": 156585, "epoch": 3728} {"train_loss": -6.85746431350708, "global_step": 156586, "epoch": 3728} {"train_loss": -6.902121543884277, "global_step": 156587, "epoch": 3728} {"train_loss": -6.903791427612305, "global_step": 156588, "epoch": 3728} {"train_loss": -6.87021541595459, "global_step": 156589, "epoch": 3728} {"train_loss": -6.955880165100098, "global_step": 156590, "epoch": 3728} {"train_loss": -6.963824272155762, "global_step": 156591, "epoch": 3728} {"train_loss": -6.89300537109375, "global_step": 156592, "epoch": 3728} {"train_loss": -6.92475700378418, "global_step": 156593, "epoch": 3728} {"train_loss": -6.968715667724609, "global_step": 156594, "epoch": 3728} {"train_loss": -6.982597351074219, "global_step": 156595, "epoch": 3728} {"train_loss": -6.981428623199463, "global_step": 156596, "epoch": 3728} {"train_loss": -6.879953861236572, "global_step": 156597, "epoch": 3728} {"train_loss": -6.9763336181640625, "global_step": 156598, "epoch": 3728} {"train_loss": -6.8918232917785645, "global_step": 156599, "epoch": 3728} {"train_loss": -6.877447128295898, "global_step": 156600, "epoch": 3728} {"train_loss": -7.025998115539551, "global_step": 156601, "epoch": 3728} {"train_loss": -7.040307998657227, "global_step": 156602, "epoch": 3728} {"train_loss": -6.920823097229004, "global_step": 156603, "epoch": 3728} {"train_loss": -6.953973293304443, "global_step": 156604, "epoch": 3728} {"train_loss": -6.932629585266113, "global_step": 156605, "epoch": 3728} {"train_loss": -6.885158538818359, "global_step": 156606, "epoch": 3728} {"train_loss": -6.937012195587158, "global_step": 156607, "epoch": 3728} {"train_loss": -6.964349269866943, "global_step": 156608, "epoch": 3728} {"train_loss": -6.919003963470459, "global_step": 156609, "epoch": 3728} {"train_loss": -6.878273010253906, "global_step": 156610, "epoch": 3728} {"train_loss": -6.934646129608154, "global_step": 156611, "epoch": 3728} {"train_loss": -6.96431827545166, "global_step": 156612, "epoch": 3728} {"train_loss": -6.9737043380737305, "global_step": 156613, "epoch": 3728} {"train_loss": -6.966524124145508, "global_step": 156614, "epoch": 3728} {"train_loss": -6.915489196777344, "global_step": 156615, "epoch": 3728} {"train_loss": -6.9322967529296875, "global_step": 156616, "epoch": 3728} {"train_loss": -6.923025982720511, "global_step": 156617, "epoch": 3728, "val_loss": 68467.671875} {"train_loss": -6.829502582550049, "global_step": 156618, "epoch": 3729} {"train_loss": -6.947151184082031, "global_step": 156619, "epoch": 3729} {"train_loss": -6.929251670837402, "global_step": 156620, "epoch": 3729} {"train_loss": -6.811938285827637, "global_step": 156621, "epoch": 3729} {"train_loss": -6.864063262939453, "global_step": 156622, "epoch": 3729} {"train_loss": -6.9974470138549805, "global_step": 156623, "epoch": 3729} {"train_loss": -6.809787750244141, "global_step": 156624, "epoch": 3729} {"train_loss": -6.90131950378418, "global_step": 156625, "epoch": 3729} {"train_loss": -6.914328575134277, "global_step": 156626, "epoch": 3729} {"train_loss": -6.838537693023682, "global_step": 156627, "epoch": 3729} {"train_loss": -7.016541481018066, "global_step": 156628, "epoch": 3729} {"train_loss": -6.971013069152832, "global_step": 156629, "epoch": 3729} {"train_loss": -7.004634857177734, "global_step": 156630, "epoch": 3729} {"train_loss": -6.916715621948242, "global_step": 156631, "epoch": 3729} {"train_loss": -6.929385185241699, "global_step": 156632, "epoch": 3729} {"train_loss": -6.932573318481445, "global_step": 156633, "epoch": 3729} {"train_loss": -6.823704719543457, "global_step": 156634, "epoch": 3729} {"train_loss": -6.927515983581543, "global_step": 156635, "epoch": 3729} {"train_loss": -6.836849212646484, "global_step": 156636, "epoch": 3729} {"train_loss": -6.844482421875, "global_step": 156637, "epoch": 3729} {"train_loss": -7.020083904266357, "global_step": 156638, "epoch": 3729} {"train_loss": -6.916330337524414, "global_step": 156639, "epoch": 3729} {"train_loss": -7.0091681480407715, "global_step": 156640, "epoch": 3729} {"train_loss": -6.741339683532715, "global_step": 156641, "epoch": 3729} {"train_loss": -6.943881511688232, "global_step": 156642, "epoch": 3729} {"train_loss": -6.992609024047852, "global_step": 156643, "epoch": 3729} {"train_loss": -6.8017706871032715, "global_step": 156644, "epoch": 3729} {"train_loss": -6.881093978881836, "global_step": 156645, "epoch": 3729} {"train_loss": -6.869937896728516, "global_step": 156646, "epoch": 3729} {"train_loss": -6.914988994598389, "global_step": 156647, "epoch": 3729} {"train_loss": -6.7728376388549805, "global_step": 156648, "epoch": 3729} {"train_loss": -6.945233345031738, "global_step": 156649, "epoch": 3729} {"train_loss": -6.893697261810303, "global_step": 156650, "epoch": 3729} {"train_loss": -6.921877384185791, "global_step": 156651, "epoch": 3729} {"train_loss": -7.024153232574463, "global_step": 156652, "epoch": 3729} {"train_loss": -6.9714226722717285, "global_step": 156653, "epoch": 3729} {"train_loss": -6.965712547302246, "global_step": 156654, "epoch": 3729} {"train_loss": -6.90572452545166, "global_step": 156655, "epoch": 3729} {"train_loss": -6.921004295349121, "global_step": 156656, "epoch": 3729} {"train_loss": -6.9120402336120605, "global_step": 156657, "epoch": 3729} {"train_loss": -6.925947189331055, "global_step": 156658, "epoch": 3729} {"train_loss": -6.908824239458356, "global_step": 156659, "epoch": 3729, "val_loss": 68337.3203125} {"train_loss": -6.9151692390441895, "global_step": 156660, "epoch": 3730} {"train_loss": -7.033378601074219, "global_step": 156661, "epoch": 3730} {"train_loss": -6.81913423538208, "global_step": 156662, "epoch": 3730} {"train_loss": -6.951963424682617, "global_step": 156663, "epoch": 3730} {"train_loss": -6.885051250457764, "global_step": 156664, "epoch": 3730} {"train_loss": -6.989296913146973, "global_step": 156665, "epoch": 3730} {"train_loss": -7.022126197814941, "global_step": 156666, "epoch": 3730} {"train_loss": -6.8090620040893555, "global_step": 156667, "epoch": 3730} {"train_loss": -6.921257019042969, "global_step": 156668, "epoch": 3730} {"train_loss": -6.913342475891113, "global_step": 156669, "epoch": 3730} {"train_loss": -6.97274112701416, "global_step": 156670, "epoch": 3730} {"train_loss": -6.796796798706055, "global_step": 156671, "epoch": 3730} {"train_loss": -6.8931989669799805, "global_step": 156672, "epoch": 3730} {"train_loss": -6.972553730010986, "global_step": 156673, "epoch": 3730} {"train_loss": -7.003134727478027, "global_step": 156674, "epoch": 3730} {"train_loss": -6.811697006225586, "global_step": 156675, "epoch": 3730} {"train_loss": -6.964925765991211, "global_step": 156676, "epoch": 3730} {"train_loss": -7.064260482788086, "global_step": 156677, "epoch": 3730} {"train_loss": -6.992574691772461, "global_step": 156678, "epoch": 3730} {"train_loss": -6.957098960876465, "global_step": 156679, "epoch": 3730} {"train_loss": -7.021841049194336, "global_step": 156680, "epoch": 3730} {"train_loss": -6.90512752532959, "global_step": 156681, "epoch": 3730} {"train_loss": -6.859830856323242, "global_step": 156682, "epoch": 3730} {"train_loss": -6.9700093269348145, "global_step": 156683, "epoch": 3730} {"train_loss": -6.943756580352783, "global_step": 156684, "epoch": 3730} {"train_loss": -6.884453773498535, "global_step": 156685, "epoch": 3730} {"train_loss": -6.842790126800537, "global_step": 156686, "epoch": 3730} {"train_loss": -7.021240711212158, "global_step": 156687, "epoch": 3730} {"train_loss": -6.892928123474121, "global_step": 156688, "epoch": 3730} {"train_loss": -6.9231977462768555, "global_step": 156689, "epoch": 3730} {"train_loss": -7.007321357727051, "global_step": 156690, "epoch": 3730} {"train_loss": -6.851352691650391, "global_step": 156691, "epoch": 3730} {"train_loss": -6.912741661071777, "global_step": 156692, "epoch": 3730} {"train_loss": -6.939043998718262, "global_step": 156693, "epoch": 3730} {"train_loss": -7.0243754386901855, "global_step": 156694, "epoch": 3730} {"train_loss": -6.9217963218688965, "global_step": 156695, "epoch": 3730} {"train_loss": -6.986823081970215, "global_step": 156696, "epoch": 3730} {"train_loss": -6.889761924743652, "global_step": 156697, "epoch": 3730} {"train_loss": -6.898675441741943, "global_step": 156698, "epoch": 3730} {"train_loss": -6.9162492752075195, "global_step": 156699, "epoch": 3730} {"train_loss": -7.006712913513184, "global_step": 156700, "epoch": 3730} {"train_loss": -6.934979938325428, "global_step": 156701, "epoch": 3730, "val_loss": 68441.6328125} {"train_loss": -7.027259826660156, "global_step": 156702, "epoch": 3731} {"train_loss": -6.817737102508545, "global_step": 156703, "epoch": 3731} {"train_loss": -6.83502197265625, "global_step": 156704, "epoch": 3731} {"train_loss": -6.842671871185303, "global_step": 156705, "epoch": 3731} {"train_loss": -7.008920669555664, "global_step": 156706, "epoch": 3731} {"train_loss": -6.8019914627075195, "global_step": 156707, "epoch": 3731} {"train_loss": -6.918763160705566, "global_step": 156708, "epoch": 3731} {"train_loss": -6.873214244842529, "global_step": 156709, "epoch": 3731} {"train_loss": -7.007999420166016, "global_step": 156710, "epoch": 3731} {"train_loss": -6.809717178344727, "global_step": 156711, "epoch": 3731} {"train_loss": -6.886537551879883, "global_step": 156712, "epoch": 3731} {"train_loss": -6.992055892944336, "global_step": 156713, "epoch": 3731} {"train_loss": -6.946172714233398, "global_step": 156714, "epoch": 3731} {"train_loss": -6.943598747253418, "global_step": 156715, "epoch": 3731} {"train_loss": -6.943245887756348, "global_step": 156716, "epoch": 3731} {"train_loss": -6.745105743408203, "global_step": 156717, "epoch": 3731} {"train_loss": -6.9004034996032715, "global_step": 156718, "epoch": 3731} {"train_loss": -6.956910610198975, "global_step": 156719, "epoch": 3731} {"train_loss": -6.919247627258301, "global_step": 156720, "epoch": 3731} {"train_loss": -6.813645839691162, "global_step": 156721, "epoch": 3731} {"train_loss": -6.9636311531066895, "global_step": 156722, "epoch": 3731} {"train_loss": -6.926347732543945, "global_step": 156723, "epoch": 3731} {"train_loss": -6.767788887023926, "global_step": 156724, "epoch": 3731} {"train_loss": -6.9360527992248535, "global_step": 156725, "epoch": 3731} {"train_loss": -6.9031782150268555, "global_step": 156726, "epoch": 3731} {"train_loss": -6.870378494262695, "global_step": 156727, "epoch": 3731} {"train_loss": -6.9302849769592285, "global_step": 156728, "epoch": 3731} {"train_loss": -6.939985275268555, "global_step": 156729, "epoch": 3731} {"train_loss": -6.926604270935059, "global_step": 156730, "epoch": 3731} {"train_loss": -7.017238616943359, "global_step": 156731, "epoch": 3731} {"train_loss": -6.780921936035156, "global_step": 156732, "epoch": 3731} {"train_loss": -6.806329727172852, "global_step": 156733, "epoch": 3731} {"train_loss": -6.897747993469238, "global_step": 156734, "epoch": 3731} {"train_loss": -6.790441513061523, "global_step": 156735, "epoch": 3731} {"train_loss": -6.960558891296387, "global_step": 156736, "epoch": 3731} {"train_loss": -6.834494590759277, "global_step": 156737, "epoch": 3731} {"train_loss": -6.978408336639404, "global_step": 156738, "epoch": 3731} {"train_loss": -6.893091201782227, "global_step": 156739, "epoch": 3731} {"train_loss": -6.857804298400879, "global_step": 156740, "epoch": 3731} {"train_loss": -6.847027778625488, "global_step": 156741, "epoch": 3731} {"train_loss": -6.741462707519531, "global_step": 156742, "epoch": 3731} {"train_loss": -6.889882201240177, "global_step": 156743, "epoch": 3731, "val_loss": 68373.3125} {"train_loss": -6.964418888092041, "global_step": 156744, "epoch": 3732} {"train_loss": -6.90154504776001, "global_step": 156745, "epoch": 3732} {"train_loss": -6.871555805206299, "global_step": 156746, "epoch": 3732} {"train_loss": -6.888117790222168, "global_step": 156747, "epoch": 3732} {"train_loss": -6.9531145095825195, "global_step": 156748, "epoch": 3732} {"train_loss": -6.995088577270508, "global_step": 156749, "epoch": 3732} {"train_loss": -6.864742755889893, "global_step": 156750, "epoch": 3732} {"train_loss": -6.887632369995117, "global_step": 156751, "epoch": 3732} {"train_loss": -6.838949680328369, "global_step": 156752, "epoch": 3732} {"train_loss": -6.846543788909912, "global_step": 156753, "epoch": 3732} {"train_loss": -6.849799156188965, "global_step": 156754, "epoch": 3732} {"train_loss": -6.934056282043457, "global_step": 156755, "epoch": 3732} {"train_loss": -6.836037635803223, "global_step": 156756, "epoch": 3732} {"train_loss": -6.9034318923950195, "global_step": 156757, "epoch": 3732} {"train_loss": -6.940677165985107, "global_step": 156758, "epoch": 3732} {"train_loss": -6.939191818237305, "global_step": 156759, "epoch": 3732} {"train_loss": -6.944004058837891, "global_step": 156760, "epoch": 3732} {"train_loss": -6.86073637008667, "global_step": 156761, "epoch": 3732} {"train_loss": -6.93772029876709, "global_step": 156762, "epoch": 3732} {"train_loss": -6.90360164642334, "global_step": 156763, "epoch": 3732} {"train_loss": -6.935340881347656, "global_step": 156764, "epoch": 3732} {"train_loss": -6.930202960968018, "global_step": 156765, "epoch": 3732} {"train_loss": -6.925489902496338, "global_step": 156766, "epoch": 3732} {"train_loss": -6.974828720092773, "global_step": 156767, "epoch": 3732} {"train_loss": -7.019630432128906, "global_step": 156768, "epoch": 3732} {"train_loss": -6.906565189361572, "global_step": 156769, "epoch": 3732} {"train_loss": -6.995328426361084, "global_step": 156770, "epoch": 3732} {"train_loss": -6.939176559448242, "global_step": 156771, "epoch": 3732} {"train_loss": -6.935302734375, "global_step": 156772, "epoch": 3732} {"train_loss": -6.944731712341309, "global_step": 156773, "epoch": 3732} {"train_loss": -7.071501731872559, "global_step": 156774, "epoch": 3732} {"train_loss": -6.945872783660889, "global_step": 156775, "epoch": 3732} {"train_loss": -6.846029758453369, "global_step": 156776, "epoch": 3732} {"train_loss": -7.013731956481934, "global_step": 156777, "epoch": 3732} {"train_loss": -6.9840593338012695, "global_step": 156778, "epoch": 3732} {"train_loss": -6.975504398345947, "global_step": 156779, "epoch": 3732} {"train_loss": -6.996738433837891, "global_step": 156780, "epoch": 3732} {"train_loss": -7.05540657043457, "global_step": 156781, "epoch": 3732} {"train_loss": -6.952090263366699, "global_step": 156782, "epoch": 3732} {"train_loss": -7.070865154266357, "global_step": 156783, "epoch": 3732} {"train_loss": -7.004749298095703, "global_step": 156784, "epoch": 3732} {"train_loss": -6.9384389491308305, "global_step": 156785, "epoch": 3732, "val_loss": 68349.2578125} {"train_loss": -6.936628341674805, "global_step": 156786, "epoch": 3733} {"train_loss": -6.995597839355469, "global_step": 156787, "epoch": 3733} {"train_loss": -7.005782127380371, "global_step": 156788, "epoch": 3733} {"train_loss": -7.041904926300049, "global_step": 156789, "epoch": 3733} {"train_loss": -6.960766792297363, "global_step": 156790, "epoch": 3733} {"train_loss": -6.952313423156738, "global_step": 156791, "epoch": 3733} {"train_loss": -6.891783237457275, "global_step": 156792, "epoch": 3733} {"train_loss": -6.986990928649902, "global_step": 156793, "epoch": 3733} {"train_loss": -6.859704971313477, "global_step": 156794, "epoch": 3733} {"train_loss": -6.8785834312438965, "global_step": 156795, "epoch": 3733} {"train_loss": -7.0160675048828125, "global_step": 156796, "epoch": 3733} {"train_loss": -6.955901145935059, "global_step": 156797, "epoch": 3733} {"train_loss": -6.977817058563232, "global_step": 156798, "epoch": 3733} {"train_loss": -6.954751491546631, "global_step": 156799, "epoch": 3733} {"train_loss": -6.830255508422852, "global_step": 156800, "epoch": 3733} {"train_loss": -6.947021961212158, "global_step": 156801, "epoch": 3733} {"train_loss": -6.98231315612793, "global_step": 156802, "epoch": 3733} {"train_loss": -6.988523483276367, "global_step": 156803, "epoch": 3733} {"train_loss": -6.881594181060791, "global_step": 156804, "epoch": 3733} {"train_loss": -7.0574188232421875, "global_step": 156805, "epoch": 3733} {"train_loss": -6.9250993728637695, "global_step": 156806, "epoch": 3733} {"train_loss": -6.987611293792725, "global_step": 156807, "epoch": 3733} {"train_loss": -6.884540557861328, "global_step": 156808, "epoch": 3733} {"train_loss": -6.98628568649292, "global_step": 156809, "epoch": 3733} {"train_loss": -7.0280985832214355, "global_step": 156810, "epoch": 3733} {"train_loss": -6.838058948516846, "global_step": 156811, "epoch": 3733} {"train_loss": -6.934622287750244, "global_step": 156812, "epoch": 3733} {"train_loss": -6.910173416137695, "global_step": 156813, "epoch": 3733} {"train_loss": -6.898231506347656, "global_step": 156814, "epoch": 3733} {"train_loss": -6.846410751342773, "global_step": 156815, "epoch": 3733} {"train_loss": -6.8611907958984375, "global_step": 156816, "epoch": 3733} {"train_loss": -6.855222702026367, "global_step": 156817, "epoch": 3733} {"train_loss": -6.98913049697876, "global_step": 156818, "epoch": 3733} {"train_loss": -6.8372802734375, "global_step": 156819, "epoch": 3733} {"train_loss": -6.948716163635254, "global_step": 156820, "epoch": 3733} {"train_loss": -6.870964527130127, "global_step": 156821, "epoch": 3733} {"train_loss": -6.953676223754883, "global_step": 156822, "epoch": 3733} {"train_loss": -6.8981218338012695, "global_step": 156823, "epoch": 3733} {"train_loss": -6.8903961181640625, "global_step": 156824, "epoch": 3733} {"train_loss": -7.008756160736084, "global_step": 156825, "epoch": 3733} {"train_loss": -6.840333938598633, "global_step": 156826, "epoch": 3733} {"train_loss": -6.934572651272728, "global_step": 156827, "epoch": 3733, "val_loss": 68275.21875} {"train_loss": -7.012664318084717, "global_step": 156828, "epoch": 3734} {"train_loss": -6.968989372253418, "global_step": 156829, "epoch": 3734} {"train_loss": -6.827723503112793, "global_step": 156830, "epoch": 3734} {"train_loss": -6.901002883911133, "global_step": 156831, "epoch": 3734} {"train_loss": -6.897316932678223, "global_step": 156832, "epoch": 3734} {"train_loss": -6.878992557525635, "global_step": 156833, "epoch": 3734} {"train_loss": -6.858631134033203, "global_step": 156834, "epoch": 3734} {"train_loss": -6.937074661254883, "global_step": 156835, "epoch": 3734} {"train_loss": -6.856303691864014, "global_step": 156836, "epoch": 3734} {"train_loss": -6.899473190307617, "global_step": 156837, "epoch": 3734} {"train_loss": -6.856529235839844, "global_step": 156838, "epoch": 3734} {"train_loss": -6.684723377227783, "global_step": 156839, "epoch": 3734} {"train_loss": -6.829014301300049, "global_step": 156840, "epoch": 3734} {"train_loss": -6.868281841278076, "global_step": 156841, "epoch": 3734} {"train_loss": -6.809317588806152, "global_step": 156842, "epoch": 3734} {"train_loss": -6.785923957824707, "global_step": 156843, "epoch": 3734} {"train_loss": -6.759407043457031, "global_step": 156844, "epoch": 3734} {"train_loss": -6.787130355834961, "global_step": 156845, "epoch": 3734} {"train_loss": -6.812518119812012, "global_step": 156846, "epoch": 3734} {"train_loss": -6.883601665496826, "global_step": 156847, "epoch": 3734} {"train_loss": -6.937424182891846, "global_step": 156848, "epoch": 3734} {"train_loss": -6.879583835601807, "global_step": 156849, "epoch": 3734} {"train_loss": -6.936883926391602, "global_step": 156850, "epoch": 3734} {"train_loss": -6.9172773361206055, "global_step": 156851, "epoch": 3734} {"train_loss": -6.949837684631348, "global_step": 156852, "epoch": 3734} {"train_loss": -6.945956707000732, "global_step": 156853, "epoch": 3734} {"train_loss": -6.9281158447265625, "global_step": 156854, "epoch": 3734} {"train_loss": -6.976456642150879, "global_step": 156855, "epoch": 3734} {"train_loss": -6.9097442626953125, "global_step": 156856, "epoch": 3734} {"train_loss": -6.910332679748535, "global_step": 156857, "epoch": 3734} {"train_loss": -6.982033729553223, "global_step": 156858, "epoch": 3734} {"train_loss": -6.870880603790283, "global_step": 156859, "epoch": 3734} {"train_loss": -6.8431196212768555, "global_step": 156860, "epoch": 3734} {"train_loss": -6.829220294952393, "global_step": 156861, "epoch": 3734} {"train_loss": -6.882762908935547, "global_step": 156862, "epoch": 3734} {"train_loss": -6.887960433959961, "global_step": 156863, "epoch": 3734} {"train_loss": -6.785336971282959, "global_step": 156864, "epoch": 3734} {"train_loss": -6.905091285705566, "global_step": 156865, "epoch": 3734} {"train_loss": -6.841608047485352, "global_step": 156866, "epoch": 3734} {"train_loss": -6.834850311279297, "global_step": 156867, "epoch": 3734} {"train_loss": -6.955132007598877, "global_step": 156868, "epoch": 3734} {"train_loss": -6.879466352008638, "global_step": 156869, "epoch": 3734, "val_loss": 68335.4609375} {"train_loss": -6.873659133911133, "global_step": 156870, "epoch": 3735} {"train_loss": -6.935259819030762, "global_step": 156871, "epoch": 3735} {"train_loss": -6.945021629333496, "global_step": 156872, "epoch": 3735} {"train_loss": -6.800615310668945, "global_step": 156873, "epoch": 3735} {"train_loss": -7.016637802124023, "global_step": 156874, "epoch": 3735} {"train_loss": -6.929828643798828, "global_step": 156875, "epoch": 3735} {"train_loss": -6.961982727050781, "global_step": 156876, "epoch": 3735} {"train_loss": -6.915542125701904, "global_step": 156877, "epoch": 3735} {"train_loss": -6.80380392074585, "global_step": 156878, "epoch": 3735} {"train_loss": -7.052134037017822, "global_step": 156879, "epoch": 3735} {"train_loss": -6.758211135864258, "global_step": 156880, "epoch": 3735} {"train_loss": -6.879697799682617, "global_step": 156881, "epoch": 3735} {"train_loss": -6.917537689208984, "global_step": 156882, "epoch": 3735} {"train_loss": -6.951484680175781, "global_step": 156883, "epoch": 3735} {"train_loss": -6.806597709655762, "global_step": 156884, "epoch": 3735} {"train_loss": -6.866935729980469, "global_step": 156885, "epoch": 3735} {"train_loss": -7.001038074493408, "global_step": 156886, "epoch": 3735} {"train_loss": -6.949063301086426, "global_step": 156887, "epoch": 3735} {"train_loss": -6.866894721984863, "global_step": 156888, "epoch": 3735} {"train_loss": -6.968560218811035, "global_step": 156889, "epoch": 3735} {"train_loss": -6.7776288986206055, "global_step": 156890, "epoch": 3735} {"train_loss": -6.956030368804932, "global_step": 156891, "epoch": 3735} {"train_loss": -6.826394557952881, "global_step": 156892, "epoch": 3735} {"train_loss": -6.881830215454102, "global_step": 156893, "epoch": 3735} {"train_loss": -6.801504611968994, "global_step": 156894, "epoch": 3735} {"train_loss": -6.869638442993164, "global_step": 156895, "epoch": 3735} {"train_loss": -6.7414445877075195, "global_step": 156896, "epoch": 3735} {"train_loss": -6.904571533203125, "global_step": 156897, "epoch": 3735} {"train_loss": -6.7984819412231445, "global_step": 156898, "epoch": 3735} {"train_loss": -6.928361892700195, "global_step": 156899, "epoch": 3735} {"train_loss": -6.936248779296875, "global_step": 156900, "epoch": 3735} {"train_loss": -6.774511814117432, "global_step": 156901, "epoch": 3735} {"train_loss": -6.829468727111816, "global_step": 156902, "epoch": 3735} {"train_loss": -6.785521984100342, "global_step": 156903, "epoch": 3735} {"train_loss": -6.913893222808838, "global_step": 156904, "epoch": 3735} {"train_loss": -6.877541542053223, "global_step": 156905, "epoch": 3735} {"train_loss": -6.902670383453369, "global_step": 156906, "epoch": 3735} {"train_loss": -6.890800476074219, "global_step": 156907, "epoch": 3735} {"train_loss": -6.909377098083496, "global_step": 156908, "epoch": 3735} {"train_loss": -6.855489253997803, "global_step": 156909, "epoch": 3735} {"train_loss": -6.953105449676514, "global_step": 156910, "epoch": 3735} {"train_loss": -6.885562760489328, "global_step": 156911, "epoch": 3735, "val_loss": 68391.2109375} {"train_loss": -6.784764289855957, "global_step": 156912, "epoch": 3736} {"train_loss": -6.960667610168457, "global_step": 156913, "epoch": 3736} {"train_loss": -6.950579643249512, "global_step": 156914, "epoch": 3736} {"train_loss": -6.867003440856934, "global_step": 156915, "epoch": 3736} {"train_loss": -6.904943466186523, "global_step": 156916, "epoch": 3736} {"train_loss": -6.977555751800537, "global_step": 156917, "epoch": 3736} {"train_loss": -6.914323806762695, "global_step": 156918, "epoch": 3736} {"train_loss": -6.835214614868164, "global_step": 156919, "epoch": 3736} {"train_loss": -6.908353805541992, "global_step": 156920, "epoch": 3736} {"train_loss": -6.882882118225098, "global_step": 156921, "epoch": 3736} {"train_loss": -6.881345748901367, "global_step": 156922, "epoch": 3736} {"train_loss": -6.984638214111328, "global_step": 156923, "epoch": 3736} {"train_loss": -6.994767189025879, "global_step": 156924, "epoch": 3736} {"train_loss": -7.0673723220825195, "global_step": 156925, "epoch": 3736} {"train_loss": -6.920841693878174, "global_step": 156926, "epoch": 3736} {"train_loss": -6.993812561035156, "global_step": 156927, "epoch": 3736} {"train_loss": -7.0141730308532715, "global_step": 156928, "epoch": 3736} {"train_loss": -6.772878646850586, "global_step": 156929, "epoch": 3736} {"train_loss": -6.941245079040527, "global_step": 156930, "epoch": 3736} {"train_loss": -6.863698959350586, "global_step": 156931, "epoch": 3736} {"train_loss": -6.9753007888793945, "global_step": 156932, "epoch": 3736} {"train_loss": -6.960062503814697, "global_step": 156933, "epoch": 3736} {"train_loss": -6.911825180053711, "global_step": 156934, "epoch": 3736} {"train_loss": -6.957241535186768, "global_step": 156935, "epoch": 3736} {"train_loss": -7.014657974243164, "global_step": 156936, "epoch": 3736} {"train_loss": -6.899721622467041, "global_step": 156937, "epoch": 3736} {"train_loss": -7.056802749633789, "global_step": 156938, "epoch": 3736} {"train_loss": -6.989521026611328, "global_step": 156939, "epoch": 3736} {"train_loss": -6.91052770614624, "global_step": 156940, "epoch": 3736} {"train_loss": -6.953701019287109, "global_step": 156941, "epoch": 3736} {"train_loss": -6.997585296630859, "global_step": 156942, "epoch": 3736} {"train_loss": -6.966660976409912, "global_step": 156943, "epoch": 3736} {"train_loss": -6.937097549438477, "global_step": 156944, "epoch": 3736} {"train_loss": -6.96325159072876, "global_step": 156945, "epoch": 3736} {"train_loss": -6.941709518432617, "global_step": 156946, "epoch": 3736} {"train_loss": -7.033137321472168, "global_step": 156947, "epoch": 3736} {"train_loss": -6.846961975097656, "global_step": 156948, "epoch": 3736} {"train_loss": -6.94821834564209, "global_step": 156949, "epoch": 3736} {"train_loss": -6.993699550628662, "global_step": 156950, "epoch": 3736} {"train_loss": -6.989287376403809, "global_step": 156951, "epoch": 3736} {"train_loss": -7.029523849487305, "global_step": 156952, "epoch": 3736} {"train_loss": -6.945090452829997, "global_step": 156953, "epoch": 3736, "val_loss": 68561.390625} {"train_loss": -7.049510955810547, "global_step": 156954, "epoch": 3737} {"train_loss": -6.9671525955200195, "global_step": 156955, "epoch": 3737} {"train_loss": -7.007991313934326, "global_step": 156956, "epoch": 3737} {"train_loss": -6.910889625549316, "global_step": 156957, "epoch": 3737} {"train_loss": -7.047850608825684, "global_step": 156958, "epoch": 3737} {"train_loss": -6.996246814727783, "global_step": 156959, "epoch": 3737} {"train_loss": -6.869039058685303, "global_step": 156960, "epoch": 3737} {"train_loss": -6.960622787475586, "global_step": 156961, "epoch": 3737} {"train_loss": -6.964177131652832, "global_step": 156962, "epoch": 3737} {"train_loss": -6.925476551055908, "global_step": 156963, "epoch": 3737} {"train_loss": -6.972662925720215, "global_step": 156964, "epoch": 3737} {"train_loss": -7.005129814147949, "global_step": 156965, "epoch": 3737} {"train_loss": -6.962608814239502, "global_step": 156966, "epoch": 3737} {"train_loss": -7.110172748565674, "global_step": 156967, "epoch": 3737} {"train_loss": -6.952702045440674, "global_step": 156968, "epoch": 3737} {"train_loss": -6.823150157928467, "global_step": 156969, "epoch": 3737} {"train_loss": -7.010953903198242, "global_step": 156970, "epoch": 3737} {"train_loss": -6.999349594116211, "global_step": 156971, "epoch": 3737} {"train_loss": -6.942958831787109, "global_step": 156972, "epoch": 3737} {"train_loss": -6.881197929382324, "global_step": 156973, "epoch": 3737} {"train_loss": -6.943574905395508, "global_step": 156974, "epoch": 3737} {"train_loss": -6.921897888183594, "global_step": 156975, "epoch": 3737} {"train_loss": -6.986401557922363, "global_step": 156976, "epoch": 3737} {"train_loss": -6.999405860900879, "global_step": 156977, "epoch": 3737} {"train_loss": -6.860806465148926, "global_step": 156978, "epoch": 3737} {"train_loss": -6.85508918762207, "global_step": 156979, "epoch": 3737} {"train_loss": -6.975064277648926, "global_step": 156980, "epoch": 3737} {"train_loss": -6.969489097595215, "global_step": 156981, "epoch": 3737} {"train_loss": -6.793437480926514, "global_step": 156982, "epoch": 3737} {"train_loss": -6.952065467834473, "global_step": 156983, "epoch": 3737} {"train_loss": -6.922441005706787, "global_step": 156984, "epoch": 3737} {"train_loss": -6.900360107421875, "global_step": 156985, "epoch": 3737} {"train_loss": -7.080183506011963, "global_step": 156986, "epoch": 3737} {"train_loss": -6.881147384643555, "global_step": 156987, "epoch": 3737} {"train_loss": -6.969356536865234, "global_step": 156988, "epoch": 3737} {"train_loss": -6.936867713928223, "global_step": 156989, "epoch": 3737} {"train_loss": -6.891385078430176, "global_step": 156990, "epoch": 3737} {"train_loss": -6.915273189544678, "global_step": 156991, "epoch": 3737} {"train_loss": -6.899863243103027, "global_step": 156992, "epoch": 3737} {"train_loss": -6.9728617668151855, "global_step": 156993, "epoch": 3737} {"train_loss": -6.971858978271484, "global_step": 156994, "epoch": 3737} {"train_loss": -6.947829677945092, "global_step": 156995, "epoch": 3737, "val_loss": 68293.2578125} {"train_loss": -6.933993816375732, "global_step": 156996, "epoch": 3738} {"train_loss": -6.93742036819458, "global_step": 156997, "epoch": 3738} {"train_loss": -6.858706951141357, "global_step": 156998, "epoch": 3738} {"train_loss": -6.965089797973633, "global_step": 156999, "epoch": 3738} {"train_loss": -6.891629219055176, "global_step": 157000, "epoch": 3738} {"train_loss": -6.841248512268066, "global_step": 157001, "epoch": 3738} {"train_loss": -6.897242546081543, "global_step": 157002, "epoch": 3738} {"train_loss": -6.912476539611816, "global_step": 157003, "epoch": 3738} {"train_loss": -6.821484565734863, "global_step": 157004, "epoch": 3738} {"train_loss": -6.937243461608887, "global_step": 157005, "epoch": 3738} {"train_loss": -6.604877471923828, "global_step": 157006, "epoch": 3738} {"train_loss": -6.87030553817749, "global_step": 157007, "epoch": 3738} {"train_loss": -6.813806533813477, "global_step": 157008, "epoch": 3738} {"train_loss": -6.826607704162598, "global_step": 157009, "epoch": 3738} {"train_loss": -6.861922264099121, "global_step": 157010, "epoch": 3738} {"train_loss": -6.926784515380859, "global_step": 157011, "epoch": 3738} {"train_loss": -6.850043296813965, "global_step": 157012, "epoch": 3738} {"train_loss": -6.9810791015625, "global_step": 157013, "epoch": 3738} {"train_loss": -6.818572998046875, "global_step": 157014, "epoch": 3738} {"train_loss": -6.880087852478027, "global_step": 157015, "epoch": 3738} {"train_loss": -6.871151924133301, "global_step": 157016, "epoch": 3738} {"train_loss": -6.811914920806885, "global_step": 157017, "epoch": 3738} {"train_loss": -6.863292694091797, "global_step": 157018, "epoch": 3738} {"train_loss": -6.8807268142700195, "global_step": 157019, "epoch": 3738} {"train_loss": -6.908491611480713, "global_step": 157020, "epoch": 3738} {"train_loss": -6.779423713684082, "global_step": 157021, "epoch": 3738} {"train_loss": -6.944474220275879, "global_step": 157022, "epoch": 3738} {"train_loss": -6.792647361755371, "global_step": 157023, "epoch": 3738} {"train_loss": -6.817570209503174, "global_step": 157024, "epoch": 3738} {"train_loss": -6.965732574462891, "global_step": 157025, "epoch": 3738} {"train_loss": -6.7669782638549805, "global_step": 157026, "epoch": 3738} {"train_loss": -6.925094127655029, "global_step": 157027, "epoch": 3738} {"train_loss": -6.683587074279785, "global_step": 157028, "epoch": 3738} {"train_loss": -6.978080749511719, "global_step": 157029, "epoch": 3738} {"train_loss": -6.865277290344238, "global_step": 157030, "epoch": 3738} {"train_loss": -6.840552806854248, "global_step": 157031, "epoch": 3738} {"train_loss": -6.823392868041992, "global_step": 157032, "epoch": 3738} {"train_loss": -6.98819637298584, "global_step": 157033, "epoch": 3738} {"train_loss": -6.913096904754639, "global_step": 157034, "epoch": 3738} {"train_loss": -6.843576908111572, "global_step": 157035, "epoch": 3738} {"train_loss": -7.03762674331665, "global_step": 157036, "epoch": 3738} {"train_loss": -6.875755855015346, "global_step": 157037, "epoch": 3738, "val_loss": 68421.65625} {"train_loss": -7.005528450012207, "global_step": 157038, "epoch": 3739} {"train_loss": -6.830920696258545, "global_step": 157039, "epoch": 3739} {"train_loss": -6.99327278137207, "global_step": 157040, "epoch": 3739} {"train_loss": -6.893887519836426, "global_step": 157041, "epoch": 3739} {"train_loss": -6.944299697875977, "global_step": 157042, "epoch": 3739} {"train_loss": -6.851799011230469, "global_step": 157043, "epoch": 3739} {"train_loss": -6.877334117889404, "global_step": 157044, "epoch": 3739} {"train_loss": -6.989295482635498, "global_step": 157045, "epoch": 3739} {"train_loss": -6.96051025390625, "global_step": 157046, "epoch": 3739} {"train_loss": -6.79141902923584, "global_step": 157047, "epoch": 3739} {"train_loss": -6.887731552124023, "global_step": 157048, "epoch": 3739} {"train_loss": -6.839437961578369, "global_step": 157049, "epoch": 3739} {"train_loss": -6.729674339294434, "global_step": 157050, "epoch": 3739} {"train_loss": -6.914523601531982, "global_step": 157051, "epoch": 3739} {"train_loss": -6.882418632507324, "global_step": 157052, "epoch": 3739} {"train_loss": -6.815959930419922, "global_step": 157053, "epoch": 3739} {"train_loss": -6.9252729415893555, "global_step": 157054, "epoch": 3739} {"train_loss": -6.768590927124023, "global_step": 157055, "epoch": 3739} {"train_loss": -6.88621711730957, "global_step": 157056, "epoch": 3739} {"train_loss": -6.856300354003906, "global_step": 157057, "epoch": 3739} {"train_loss": -6.800763130187988, "global_step": 157058, "epoch": 3739} {"train_loss": -6.815861701965332, "global_step": 157059, "epoch": 3739} {"train_loss": -6.6018829345703125, "global_step": 157060, "epoch": 3739} {"train_loss": -6.7432451248168945, "global_step": 157061, "epoch": 3739} {"train_loss": -6.744353294372559, "global_step": 157062, "epoch": 3739} {"train_loss": -6.676949501037598, "global_step": 157063, "epoch": 3739} {"train_loss": -6.7639851570129395, "global_step": 157064, "epoch": 3739} {"train_loss": -6.74509334564209, "global_step": 157065, "epoch": 3739} {"train_loss": -6.875500202178955, "global_step": 157066, "epoch": 3739} {"train_loss": -6.793401718139648, "global_step": 157067, "epoch": 3739} {"train_loss": -6.86562442779541, "global_step": 157068, "epoch": 3739} {"train_loss": -6.701224327087402, "global_step": 157069, "epoch": 3739} {"train_loss": -6.840939521789551, "global_step": 157070, "epoch": 3739} {"train_loss": -6.761781215667725, "global_step": 157071, "epoch": 3739} {"train_loss": -6.830871105194092, "global_step": 157072, "epoch": 3739} {"train_loss": -6.728038787841797, "global_step": 157073, "epoch": 3739} {"train_loss": -6.782139778137207, "global_step": 157074, "epoch": 3739} {"train_loss": -6.80279541015625, "global_step": 157075, "epoch": 3739} {"train_loss": -6.899087905883789, "global_step": 157076, "epoch": 3739} {"train_loss": -6.870710372924805, "global_step": 157077, "epoch": 3739} {"train_loss": -6.840147972106934, "global_step": 157078, "epoch": 3739} {"train_loss": -6.836443867002215, "global_step": 157079, "epoch": 3739, "val_loss": 68462.796875} {"train_loss": -6.9171342849731445, "global_step": 157080, "epoch": 3740} {"train_loss": -6.894927978515625, "global_step": 157081, "epoch": 3740} {"train_loss": -6.735911846160889, "global_step": 157082, "epoch": 3740} {"train_loss": -6.886458873748779, "global_step": 157083, "epoch": 3740} {"train_loss": -6.933361530303955, "global_step": 157084, "epoch": 3740} {"train_loss": -6.979876518249512, "global_step": 157085, "epoch": 3740} {"train_loss": -6.985044002532959, "global_step": 157086, "epoch": 3740} {"train_loss": -6.856708526611328, "global_step": 157087, "epoch": 3740} {"train_loss": -6.969583988189697, "global_step": 157088, "epoch": 3740} {"train_loss": -6.868264198303223, "global_step": 157089, "epoch": 3740} {"train_loss": -6.915223121643066, "global_step": 157090, "epoch": 3740} {"train_loss": -6.886436939239502, "global_step": 157091, "epoch": 3740} {"train_loss": -6.989373207092285, "global_step": 157092, "epoch": 3740} {"train_loss": -6.858549118041992, "global_step": 157093, "epoch": 3740} {"train_loss": -6.862176418304443, "global_step": 157094, "epoch": 3740} {"train_loss": -6.964892864227295, "global_step": 157095, "epoch": 3740} {"train_loss": -6.982349872589111, "global_step": 157096, "epoch": 3740} {"train_loss": -7.034767150878906, "global_step": 157097, "epoch": 3740} {"train_loss": -6.903936386108398, "global_step": 157098, "epoch": 3740} {"train_loss": -7.003330230712891, "global_step": 157099, "epoch": 3740} {"train_loss": -6.934969425201416, "global_step": 157100, "epoch": 3740} {"train_loss": -6.964090347290039, "global_step": 157101, "epoch": 3740} {"train_loss": -7.059589862823486, "global_step": 157102, "epoch": 3740} {"train_loss": -7.006091594696045, "global_step": 157103, "epoch": 3740} {"train_loss": -6.900425910949707, "global_step": 157104, "epoch": 3740} {"train_loss": -7.019955635070801, "global_step": 157105, "epoch": 3740} {"train_loss": -6.959824085235596, "global_step": 157106, "epoch": 3740} {"train_loss": -6.915972709655762, "global_step": 157107, "epoch": 3740} {"train_loss": -6.9733381271362305, "global_step": 157108, "epoch": 3740} {"train_loss": -6.961509704589844, "global_step": 157109, "epoch": 3740} {"train_loss": -7.007556915283203, "global_step": 157110, "epoch": 3740} {"train_loss": -6.945159912109375, "global_step": 157111, "epoch": 3740} {"train_loss": -6.957913398742676, "global_step": 157112, "epoch": 3740} {"train_loss": -7.002493858337402, "global_step": 157113, "epoch": 3740} {"train_loss": -6.965045928955078, "global_step": 157114, "epoch": 3740} {"train_loss": -6.944606781005859, "global_step": 157115, "epoch": 3740} {"train_loss": -6.877307415008545, "global_step": 157116, "epoch": 3740} {"train_loss": -6.902213096618652, "global_step": 157117, "epoch": 3740} {"train_loss": -6.880041122436523, "global_step": 157118, "epoch": 3740} {"train_loss": -6.921478271484375, "global_step": 157119, "epoch": 3740} {"train_loss": -6.815315246582031, "global_step": 157120, "epoch": 3740} {"train_loss": -6.936754351570492, "global_step": 157121, "epoch": 3740, "val_loss": 68295.9609375} {"train_loss": -6.91530704498291, "global_step": 157122, "epoch": 3741} {"train_loss": -6.905677795410156, "global_step": 157123, "epoch": 3741} {"train_loss": -6.85499382019043, "global_step": 157124, "epoch": 3741} {"train_loss": -6.967851638793945, "global_step": 157125, "epoch": 3741} {"train_loss": -6.901190280914307, "global_step": 157126, "epoch": 3741} {"train_loss": -6.857520580291748, "global_step": 157127, "epoch": 3741} {"train_loss": -6.942915916442871, "global_step": 157128, "epoch": 3741} {"train_loss": -6.9791646003723145, "global_step": 157129, "epoch": 3741} {"train_loss": -6.933200836181641, "global_step": 157130, "epoch": 3741} {"train_loss": -6.931395530700684, "global_step": 157131, "epoch": 3741} {"train_loss": -7.018474102020264, "global_step": 157132, "epoch": 3741} {"train_loss": -6.809739112854004, "global_step": 157133, "epoch": 3741} {"train_loss": -6.939614295959473, "global_step": 157134, "epoch": 3741} {"train_loss": -6.897729873657227, "global_step": 157135, "epoch": 3741} {"train_loss": -6.979944229125977, "global_step": 157136, "epoch": 3741} {"train_loss": -6.941510200500488, "global_step": 157137, "epoch": 3741} {"train_loss": -6.926806449890137, "global_step": 157138, "epoch": 3741} {"train_loss": -6.938542366027832, "global_step": 157139, "epoch": 3741} {"train_loss": -6.864193916320801, "global_step": 157140, "epoch": 3741} {"train_loss": -6.89901876449585, "global_step": 157141, "epoch": 3741} {"train_loss": -7.05101203918457, "global_step": 157142, "epoch": 3741} {"train_loss": -6.9165568351745605, "global_step": 157143, "epoch": 3741} {"train_loss": -6.990036964416504, "global_step": 157144, "epoch": 3741} {"train_loss": -6.98468542098999, "global_step": 157145, "epoch": 3741} {"train_loss": -6.807493209838867, "global_step": 157146, "epoch": 3741} {"train_loss": -6.946471214294434, "global_step": 157147, "epoch": 3741} {"train_loss": -6.913998603820801, "global_step": 157148, "epoch": 3741} {"train_loss": -6.862758636474609, "global_step": 157149, "epoch": 3741} {"train_loss": -6.986263275146484, "global_step": 157150, "epoch": 3741} {"train_loss": -6.952030658721924, "global_step": 157151, "epoch": 3741} {"train_loss": -7.004987716674805, "global_step": 157152, "epoch": 3741} {"train_loss": -6.9061431884765625, "global_step": 157153, "epoch": 3741} {"train_loss": -6.851232528686523, "global_step": 157154, "epoch": 3741} {"train_loss": -6.84300422668457, "global_step": 157155, "epoch": 3741} {"train_loss": -6.895865440368652, "global_step": 157156, "epoch": 3741} {"train_loss": -6.992097854614258, "global_step": 157157, "epoch": 3741} {"train_loss": -6.923955917358398, "global_step": 157158, "epoch": 3741} {"train_loss": -6.952977657318115, "global_step": 157159, "epoch": 3741} {"train_loss": -6.851661682128906, "global_step": 157160, "epoch": 3741} {"train_loss": -6.951958656311035, "global_step": 157161, "epoch": 3741} {"train_loss": -6.964301109313965, "global_step": 157162, "epoch": 3741} {"train_loss": -6.926726488840012, "global_step": 157163, "epoch": 3741, "val_loss": 68400.0078125} {"train_loss": -6.941343784332275, "global_step": 157164, "epoch": 3742} {"train_loss": -6.98309326171875, "global_step": 157165, "epoch": 3742} {"train_loss": -6.9363861083984375, "global_step": 157166, "epoch": 3742} {"train_loss": -6.946362495422363, "global_step": 157167, "epoch": 3742} {"train_loss": -6.848546981811523, "global_step": 157168, "epoch": 3742} {"train_loss": -6.961268424987793, "global_step": 157169, "epoch": 3742} {"train_loss": -6.8480424880981445, "global_step": 157170, "epoch": 3742} {"train_loss": -6.838459014892578, "global_step": 157171, "epoch": 3742} {"train_loss": -6.966751575469971, "global_step": 157172, "epoch": 3742} {"train_loss": -6.991568565368652, "global_step": 157173, "epoch": 3742} {"train_loss": -6.767189979553223, "global_step": 157174, "epoch": 3742} {"train_loss": -6.947023391723633, "global_step": 157175, "epoch": 3742} {"train_loss": -6.884402275085449, "global_step": 157176, "epoch": 3742} {"train_loss": -6.711736679077148, "global_step": 157177, "epoch": 3742} {"train_loss": -6.984552383422852, "global_step": 157178, "epoch": 3742} {"train_loss": -6.846741676330566, "global_step": 157179, "epoch": 3742} {"train_loss": -6.737817287445068, "global_step": 157180, "epoch": 3742} {"train_loss": -6.908480644226074, "global_step": 157181, "epoch": 3742} {"train_loss": -6.769883632659912, "global_step": 157182, "epoch": 3742} {"train_loss": -6.85947847366333, "global_step": 157183, "epoch": 3742} {"train_loss": -6.874950408935547, "global_step": 157184, "epoch": 3742} {"train_loss": -6.85983943939209, "global_step": 157185, "epoch": 3742} {"train_loss": -6.8915629386901855, "global_step": 157186, "epoch": 3742} {"train_loss": -6.953834533691406, "global_step": 157187, "epoch": 3742} {"train_loss": -6.776991367340088, "global_step": 157188, "epoch": 3742} {"train_loss": -6.86866569519043, "global_step": 157189, "epoch": 3742} {"train_loss": -6.891404151916504, "global_step": 157190, "epoch": 3742} {"train_loss": -6.910240173339844, "global_step": 157191, "epoch": 3742} {"train_loss": -6.956510066986084, "global_step": 157192, "epoch": 3742} {"train_loss": -6.883615970611572, "global_step": 157193, "epoch": 3742} {"train_loss": -6.896169662475586, "global_step": 157194, "epoch": 3742} {"train_loss": -6.923429489135742, "global_step": 157195, "epoch": 3742} {"train_loss": -6.953668594360352, "global_step": 157196, "epoch": 3742} {"train_loss": -6.92448616027832, "global_step": 157197, "epoch": 3742} {"train_loss": -6.852786064147949, "global_step": 157198, "epoch": 3742} {"train_loss": -6.950805187225342, "global_step": 157199, "epoch": 3742} {"train_loss": -6.916879653930664, "global_step": 157200, "epoch": 3742} {"train_loss": -6.884253025054932, "global_step": 157201, "epoch": 3742} {"train_loss": -7.006148338317871, "global_step": 157202, "epoch": 3742} {"train_loss": -6.848908424377441, "global_step": 157203, "epoch": 3742} {"train_loss": -7.018570423126221, "global_step": 157204, "epoch": 3742} {"train_loss": -6.895862227394467, "global_step": 157205, "epoch": 3742, "val_loss": 68405.9609375} {"train_loss": -6.933903694152832, "global_step": 157206, "epoch": 3743} {"train_loss": -6.9211225509643555, "global_step": 157207, "epoch": 3743} {"train_loss": -6.885354995727539, "global_step": 157208, "epoch": 3743} {"train_loss": -6.919076919555664, "global_step": 157209, "epoch": 3743} {"train_loss": -6.912256240844727, "global_step": 157210, "epoch": 3743} {"train_loss": -6.681704521179199, "global_step": 157211, "epoch": 3743} {"train_loss": -6.883411407470703, "global_step": 157212, "epoch": 3743} {"train_loss": -6.934944152832031, "global_step": 157213, "epoch": 3743} {"train_loss": -6.86403751373291, "global_step": 157214, "epoch": 3743} {"train_loss": -6.943688869476318, "global_step": 157215, "epoch": 3743} {"train_loss": -6.962367057800293, "global_step": 157216, "epoch": 3743} {"train_loss": -6.894852638244629, "global_step": 157217, "epoch": 3743} {"train_loss": -6.816391944885254, "global_step": 157218, "epoch": 3743} {"train_loss": -6.807279109954834, "global_step": 157219, "epoch": 3743} {"train_loss": -6.839970588684082, "global_step": 157220, "epoch": 3743} {"train_loss": -6.750345230102539, "global_step": 157221, "epoch": 3743} {"train_loss": -6.9808878898620605, "global_step": 157222, "epoch": 3743} {"train_loss": -6.81418514251709, "global_step": 157223, "epoch": 3743} {"train_loss": -6.778063774108887, "global_step": 157224, "epoch": 3743} {"train_loss": -6.869235515594482, "global_step": 157225, "epoch": 3743} {"train_loss": -6.72540283203125, "global_step": 157226, "epoch": 3743} {"train_loss": -6.913788795471191, "global_step": 157227, "epoch": 3743} {"train_loss": -6.7616705894470215, "global_step": 157228, "epoch": 3743} {"train_loss": -6.856895446777344, "global_step": 157229, "epoch": 3743} {"train_loss": -6.73832368850708, "global_step": 157230, "epoch": 3743} {"train_loss": -6.805427551269531, "global_step": 157231, "epoch": 3743} {"train_loss": -6.850125312805176, "global_step": 157232, "epoch": 3743} {"train_loss": -6.711971282958984, "global_step": 157233, "epoch": 3743} {"train_loss": -6.9225287437438965, "global_step": 157234, "epoch": 3743} {"train_loss": -6.710515975952148, "global_step": 157235, "epoch": 3743} {"train_loss": -6.832002639770508, "global_step": 157236, "epoch": 3743} {"train_loss": -6.630878448486328, "global_step": 157237, "epoch": 3743} {"train_loss": -6.8597187995910645, "global_step": 157238, "epoch": 3743} {"train_loss": -6.768311500549316, "global_step": 157239, "epoch": 3743} {"train_loss": -6.715384483337402, "global_step": 157240, "epoch": 3743} {"train_loss": -6.77211856842041, "global_step": 157241, "epoch": 3743} {"train_loss": -6.738589286804199, "global_step": 157242, "epoch": 3743} {"train_loss": -6.812655448913574, "global_step": 157243, "epoch": 3743} {"train_loss": -6.892746448516846, "global_step": 157244, "epoch": 3743} {"train_loss": -6.676089286804199, "global_step": 157245, "epoch": 3743} {"train_loss": -6.810741424560547, "global_step": 157246, "epoch": 3743} {"train_loss": -6.823329380580357, "global_step": 157247, "epoch": 3743, "val_loss": 68172.6640625} {"train_loss": -6.764848709106445, "global_step": 157248, "epoch": 3744} {"train_loss": -6.832597732543945, "global_step": 157249, "epoch": 3744} {"train_loss": -6.762148380279541, "global_step": 157250, "epoch": 3744} {"train_loss": -6.85853385925293, "global_step": 157251, "epoch": 3744} {"train_loss": -6.761168479919434, "global_step": 157252, "epoch": 3744} {"train_loss": -6.816495895385742, "global_step": 157253, "epoch": 3744} {"train_loss": -6.763407230377197, "global_step": 157254, "epoch": 3744} {"train_loss": -6.919094085693359, "global_step": 157255, "epoch": 3744} {"train_loss": -6.826119899749756, "global_step": 157256, "epoch": 3744} {"train_loss": -6.722771644592285, "global_step": 157257, "epoch": 3744} {"train_loss": -6.90516471862793, "global_step": 157258, "epoch": 3744} {"train_loss": -6.85346794128418, "global_step": 157259, "epoch": 3744} {"train_loss": -6.903610706329346, "global_step": 157260, "epoch": 3744} {"train_loss": -6.910284996032715, "global_step": 157261, "epoch": 3744} {"train_loss": -6.936452388763428, "global_step": 157262, "epoch": 3744} {"train_loss": -6.924487113952637, "global_step": 157263, "epoch": 3744} {"train_loss": -6.961544036865234, "global_step": 157264, "epoch": 3744} {"train_loss": -6.942716598510742, "global_step": 157265, "epoch": 3744} {"train_loss": -6.969590187072754, "global_step": 157266, "epoch": 3744} {"train_loss": -6.990113735198975, "global_step": 157267, "epoch": 3744} {"train_loss": -6.873668670654297, "global_step": 157268, "epoch": 3744} {"train_loss": -6.875070095062256, "global_step": 157269, "epoch": 3744} {"train_loss": -6.891183376312256, "global_step": 157270, "epoch": 3744} {"train_loss": -6.844544887542725, "global_step": 157271, "epoch": 3744} {"train_loss": -6.922298908233643, "global_step": 157272, "epoch": 3744} {"train_loss": -6.9218621253967285, "global_step": 157273, "epoch": 3744} {"train_loss": -6.901350021362305, "global_step": 157274, "epoch": 3744} {"train_loss": -6.846301078796387, "global_step": 157275, "epoch": 3744} {"train_loss": -6.915344715118408, "global_step": 157276, "epoch": 3744} {"train_loss": -6.893796920776367, "global_step": 157277, "epoch": 3744} {"train_loss": -6.877200126647949, "global_step": 157278, "epoch": 3744} {"train_loss": -6.871651649475098, "global_step": 157279, "epoch": 3744} {"train_loss": -7.076575756072998, "global_step": 157280, "epoch": 3744} {"train_loss": -6.799539566040039, "global_step": 157281, "epoch": 3744} {"train_loss": -6.864731311798096, "global_step": 157282, "epoch": 3744} {"train_loss": -7.027434349060059, "global_step": 157283, "epoch": 3744} {"train_loss": -6.88873291015625, "global_step": 157284, "epoch": 3744} {"train_loss": -6.9365434646606445, "global_step": 157285, "epoch": 3744} {"train_loss": -6.953298091888428, "global_step": 157286, "epoch": 3744} {"train_loss": -6.926708698272705, "global_step": 157287, "epoch": 3744} {"train_loss": -6.976569175720215, "global_step": 157288, "epoch": 3744} {"train_loss": -6.889071203413463, "global_step": 157289, "epoch": 3744, "val_loss": 68321.6875} {"train_loss": -6.9569196701049805, "global_step": 157290, "epoch": 3745} {"train_loss": -6.851360321044922, "global_step": 157291, "epoch": 3745} {"train_loss": -6.911185264587402, "global_step": 157292, "epoch": 3745} {"train_loss": -6.9256134033203125, "global_step": 157293, "epoch": 3745} {"train_loss": -6.8519134521484375, "global_step": 157294, "epoch": 3745} {"train_loss": -6.919223308563232, "global_step": 157295, "epoch": 3745} {"train_loss": -6.911934852600098, "global_step": 157296, "epoch": 3745} {"train_loss": -6.883340835571289, "global_step": 157297, "epoch": 3745} {"train_loss": -7.019021034240723, "global_step": 157298, "epoch": 3745} {"train_loss": -6.9081854820251465, "global_step": 157299, "epoch": 3745} {"train_loss": -6.957882881164551, "global_step": 157300, "epoch": 3745} {"train_loss": -6.925623893737793, "global_step": 157301, "epoch": 3745} {"train_loss": -6.931023597717285, "global_step": 157302, "epoch": 3745} {"train_loss": -7.112730026245117, "global_step": 157303, "epoch": 3745} {"train_loss": -7.019722938537598, "global_step": 157304, "epoch": 3745} {"train_loss": -7.007167816162109, "global_step": 157305, "epoch": 3745} {"train_loss": -6.874149322509766, "global_step": 157306, "epoch": 3745} {"train_loss": -7.009554386138916, "global_step": 157307, "epoch": 3745} {"train_loss": -6.9658002853393555, "global_step": 157308, "epoch": 3745} {"train_loss": -6.923253059387207, "global_step": 157309, "epoch": 3745} {"train_loss": -7.022483825683594, "global_step": 157310, "epoch": 3745} {"train_loss": -7.012416839599609, "global_step": 157311, "epoch": 3745} {"train_loss": -7.074159622192383, "global_step": 157312, "epoch": 3745} {"train_loss": -6.968645095825195, "global_step": 157313, "epoch": 3745} {"train_loss": -7.046767234802246, "global_step": 157314, "epoch": 3745} {"train_loss": -6.945974349975586, "global_step": 157315, "epoch": 3745} {"train_loss": -6.910003662109375, "global_step": 157316, "epoch": 3745} {"train_loss": -6.99029541015625, "global_step": 157317, "epoch": 3745} {"train_loss": -6.95166540145874, "global_step": 157318, "epoch": 3745} {"train_loss": -6.975839614868164, "global_step": 157319, "epoch": 3745} {"train_loss": -6.92392635345459, "global_step": 157320, "epoch": 3745} {"train_loss": -6.979247570037842, "global_step": 157321, "epoch": 3745} {"train_loss": -6.945804119110107, "global_step": 157322, "epoch": 3745} {"train_loss": -6.807836532592773, "global_step": 157323, "epoch": 3745} {"train_loss": -6.897917747497559, "global_step": 157324, "epoch": 3745} {"train_loss": -6.898410320281982, "global_step": 157325, "epoch": 3745} {"train_loss": -6.932436943054199, "global_step": 157326, "epoch": 3745} {"train_loss": -6.917303562164307, "global_step": 157327, "epoch": 3745} {"train_loss": -6.943734169006348, "global_step": 157328, "epoch": 3745} {"train_loss": -6.869469165802002, "global_step": 157329, "epoch": 3745} {"train_loss": -6.867051124572754, "global_step": 157330, "epoch": 3745} {"train_loss": -6.947470846630278, "global_step": 157331, "epoch": 3745, "val_loss": 68419.515625} {"train_loss": -6.968356609344482, "global_step": 157332, "epoch": 3746} {"train_loss": -6.86256217956543, "global_step": 157333, "epoch": 3746} {"train_loss": -6.916364669799805, "global_step": 157334, "epoch": 3746} {"train_loss": -6.962028503417969, "global_step": 157335, "epoch": 3746} {"train_loss": -7.108509063720703, "global_step": 157336, "epoch": 3746} {"train_loss": -7.019452095031738, "global_step": 157337, "epoch": 3746} {"train_loss": -6.942194938659668, "global_step": 157338, "epoch": 3746} {"train_loss": -6.943245887756348, "global_step": 157339, "epoch": 3746} {"train_loss": -6.895303249359131, "global_step": 157340, "epoch": 3746} {"train_loss": -6.908804893493652, "global_step": 157341, "epoch": 3746} {"train_loss": -7.0105485916137695, "global_step": 157342, "epoch": 3746} {"train_loss": -6.9538774490356445, "global_step": 157343, "epoch": 3746} {"train_loss": -6.936149597167969, "global_step": 157344, "epoch": 3746} {"train_loss": -6.908149719238281, "global_step": 157345, "epoch": 3746} {"train_loss": -6.967424392700195, "global_step": 157346, "epoch": 3746} {"train_loss": -6.773536205291748, "global_step": 157347, "epoch": 3746} {"train_loss": -6.832454681396484, "global_step": 157348, "epoch": 3746} {"train_loss": -6.823439598083496, "global_step": 157349, "epoch": 3746} {"train_loss": -6.867552757263184, "global_step": 157350, "epoch": 3746} {"train_loss": -6.9083333015441895, "global_step": 157351, "epoch": 3746} {"train_loss": -6.778820037841797, "global_step": 157352, "epoch": 3746} {"train_loss": -6.977141380310059, "global_step": 157353, "epoch": 3746} {"train_loss": -6.862380504608154, "global_step": 157354, "epoch": 3746} {"train_loss": -6.792326927185059, "global_step": 157355, "epoch": 3746} {"train_loss": -6.9084248542785645, "global_step": 157356, "epoch": 3746} {"train_loss": -6.809040069580078, "global_step": 157357, "epoch": 3746} {"train_loss": -6.951234817504883, "global_step": 157358, "epoch": 3746} {"train_loss": -6.90256929397583, "global_step": 157359, "epoch": 3746} {"train_loss": -6.835626602172852, "global_step": 157360, "epoch": 3746} {"train_loss": -6.852471351623535, "global_step": 157361, "epoch": 3746} {"train_loss": -6.855815410614014, "global_step": 157362, "epoch": 3746} {"train_loss": -6.901821136474609, "global_step": 157363, "epoch": 3746} {"train_loss": -6.7991108894348145, "global_step": 157364, "epoch": 3746} {"train_loss": -6.894586563110352, "global_step": 157365, "epoch": 3746} {"train_loss": -6.922489643096924, "global_step": 157366, "epoch": 3746} {"train_loss": -6.808233737945557, "global_step": 157367, "epoch": 3746} {"train_loss": -6.858051300048828, "global_step": 157368, "epoch": 3746} {"train_loss": -6.893363952636719, "global_step": 157369, "epoch": 3746} {"train_loss": -6.86943244934082, "global_step": 157370, "epoch": 3746} {"train_loss": -6.963744163513184, "global_step": 157371, "epoch": 3746} {"train_loss": -6.981523513793945, "global_step": 157372, "epoch": 3746} {"train_loss": -6.901258264269147, "global_step": 157373, "epoch": 3746, "val_loss": 68509.6953125} {"train_loss": -6.992765426635742, "global_step": 157374, "epoch": 3747} {"train_loss": -6.9763898849487305, "global_step": 157375, "epoch": 3747} {"train_loss": -6.963762283325195, "global_step": 157376, "epoch": 3747} {"train_loss": -6.909419536590576, "global_step": 157377, "epoch": 3747} {"train_loss": -6.920140266418457, "global_step": 157378, "epoch": 3747} {"train_loss": -6.870697021484375, "global_step": 157379, "epoch": 3747} {"train_loss": -6.9437642097473145, "global_step": 157380, "epoch": 3747} {"train_loss": -6.935399055480957, "global_step": 157381, "epoch": 3747} {"train_loss": -6.906558990478516, "global_step": 157382, "epoch": 3747} {"train_loss": -7.120996475219727, "global_step": 157383, "epoch": 3747} {"train_loss": -6.807705879211426, "global_step": 157384, "epoch": 3747} {"train_loss": -7.007800579071045, "global_step": 157385, "epoch": 3747} {"train_loss": -6.92253303527832, "global_step": 157386, "epoch": 3747} {"train_loss": -6.950010776519775, "global_step": 157387, "epoch": 3747} {"train_loss": -6.88161563873291, "global_step": 157388, "epoch": 3747} {"train_loss": -6.975522994995117, "global_step": 157389, "epoch": 3747} {"train_loss": -6.98404598236084, "global_step": 157390, "epoch": 3747} {"train_loss": -7.058711051940918, "global_step": 157391, "epoch": 3747} {"train_loss": -6.854666233062744, "global_step": 157392, "epoch": 3747} {"train_loss": -6.9928693771362305, "global_step": 157393, "epoch": 3747} {"train_loss": -6.853271007537842, "global_step": 157394, "epoch": 3747} {"train_loss": -7.023821830749512, "global_step": 157395, "epoch": 3747} {"train_loss": -7.011817932128906, "global_step": 157396, "epoch": 3747} {"train_loss": -6.979255676269531, "global_step": 157397, "epoch": 3747} {"train_loss": -7.006760597229004, "global_step": 157398, "epoch": 3747} {"train_loss": -6.856832981109619, "global_step": 157399, "epoch": 3747} {"train_loss": -7.063230991363525, "global_step": 157400, "epoch": 3747} {"train_loss": -6.933201789855957, "global_step": 157401, "epoch": 3747} {"train_loss": -7.037230014801025, "global_step": 157402, "epoch": 3747} {"train_loss": -6.812586784362793, "global_step": 157403, "epoch": 3747} {"train_loss": -6.7387800216674805, "global_step": 157404, "epoch": 3747} {"train_loss": -6.8672075271606445, "global_step": 157405, "epoch": 3747} {"train_loss": -6.829128742218018, "global_step": 157406, "epoch": 3747} {"train_loss": -6.799036502838135, "global_step": 157407, "epoch": 3747} {"train_loss": -6.90596866607666, "global_step": 157408, "epoch": 3747} {"train_loss": -6.886252403259277, "global_step": 157409, "epoch": 3747} {"train_loss": -6.869314193725586, "global_step": 157410, "epoch": 3747} {"train_loss": -6.908877372741699, "global_step": 157411, "epoch": 3747} {"train_loss": -6.86390495300293, "global_step": 157412, "epoch": 3747} {"train_loss": -7.000208377838135, "global_step": 157413, "epoch": 3747} {"train_loss": -6.9319915771484375, "global_step": 157414, "epoch": 3747} {"train_loss": -6.931027911958241, "global_step": 157415, "epoch": 3747, "val_loss": 68505.9921875} {"train_loss": -6.856711387634277, "global_step": 157416, "epoch": 3748} {"train_loss": -6.827085971832275, "global_step": 157417, "epoch": 3748} {"train_loss": -6.906519412994385, "global_step": 157418, "epoch": 3748} {"train_loss": -6.9785614013671875, "global_step": 157419, "epoch": 3748} {"train_loss": -6.855145454406738, "global_step": 157420, "epoch": 3748} {"train_loss": -6.809218406677246, "global_step": 157421, "epoch": 3748} {"train_loss": -6.9564208984375, "global_step": 157422, "epoch": 3748} {"train_loss": -6.762885093688965, "global_step": 157423, "epoch": 3748} {"train_loss": -6.9562177658081055, "global_step": 157424, "epoch": 3748} {"train_loss": -6.699709892272949, "global_step": 157425, "epoch": 3748} {"train_loss": -6.856478691101074, "global_step": 157426, "epoch": 3748} {"train_loss": -6.900279521942139, "global_step": 157427, "epoch": 3748} {"train_loss": -6.931535720825195, "global_step": 157428, "epoch": 3748} {"train_loss": -6.75064754486084, "global_step": 157429, "epoch": 3748} {"train_loss": -6.820962429046631, "global_step": 157430, "epoch": 3748} {"train_loss": -6.896251678466797, "global_step": 157431, "epoch": 3748} {"train_loss": -6.899629592895508, "global_step": 157432, "epoch": 3748} {"train_loss": -6.930769920349121, "global_step": 157433, "epoch": 3748} {"train_loss": -6.902600288391113, "global_step": 157434, "epoch": 3748} {"train_loss": -6.937939167022705, "global_step": 157435, "epoch": 3748} {"train_loss": -6.890268325805664, "global_step": 157436, "epoch": 3748} {"train_loss": -6.8890275955200195, "global_step": 157437, "epoch": 3748} {"train_loss": -6.874871253967285, "global_step": 157438, "epoch": 3748} {"train_loss": -6.871736526489258, "global_step": 157439, "epoch": 3748} {"train_loss": -6.808005332946777, "global_step": 157440, "epoch": 3748} {"train_loss": -6.869429588317871, "global_step": 157441, "epoch": 3748} {"train_loss": -6.843973636627197, "global_step": 157442, "epoch": 3748} {"train_loss": -6.8749871253967285, "global_step": 157443, "epoch": 3748} {"train_loss": -6.857928276062012, "global_step": 157444, "epoch": 3748} {"train_loss": -6.983015060424805, "global_step": 157445, "epoch": 3748} {"train_loss": -6.947089195251465, "global_step": 157446, "epoch": 3748} {"train_loss": -6.847123146057129, "global_step": 157447, "epoch": 3748} {"train_loss": -6.925803184509277, "global_step": 157448, "epoch": 3748} {"train_loss": -6.921598434448242, "global_step": 157449, "epoch": 3748} {"train_loss": -6.83267879486084, "global_step": 157450, "epoch": 3748} {"train_loss": -7.037555694580078, "global_step": 157451, "epoch": 3748} {"train_loss": -6.943486213684082, "global_step": 157452, "epoch": 3748} {"train_loss": -6.992894172668457, "global_step": 157453, "epoch": 3748} {"train_loss": -6.888419151306152, "global_step": 157454, "epoch": 3748} {"train_loss": -6.961254119873047, "global_step": 157455, "epoch": 3748} {"train_loss": -6.842990875244141, "global_step": 157456, "epoch": 3748} {"train_loss": -6.888133775620234, "global_step": 157457, "epoch": 3748, "val_loss": 68384.5078125} {"train_loss": -6.991368293762207, "global_step": 157458, "epoch": 3749} {"train_loss": -7.043342590332031, "global_step": 157459, "epoch": 3749} {"train_loss": -6.876757621765137, "global_step": 157460, "epoch": 3749} {"train_loss": -6.953118324279785, "global_step": 157461, "epoch": 3749} {"train_loss": -6.974261283874512, "global_step": 157462, "epoch": 3749} {"train_loss": -7.07327938079834, "global_step": 157463, "epoch": 3749} {"train_loss": -6.898860931396484, "global_step": 157464, "epoch": 3749} {"train_loss": -7.040112495422363, "global_step": 157465, "epoch": 3749} {"train_loss": -7.020274639129639, "global_step": 157466, "epoch": 3749} {"train_loss": -7.039222240447998, "global_step": 157467, "epoch": 3749} {"train_loss": -6.975752830505371, "global_step": 157468, "epoch": 3749} {"train_loss": -6.909499168395996, "global_step": 157469, "epoch": 3749} {"train_loss": -6.872986793518066, "global_step": 157470, "epoch": 3749} {"train_loss": -6.953207969665527, "global_step": 157471, "epoch": 3749} {"train_loss": -7.010679244995117, "global_step": 157472, "epoch": 3749} {"train_loss": -6.944108963012695, "global_step": 157473, "epoch": 3749} {"train_loss": -6.875306129455566, "global_step": 157474, "epoch": 3749} {"train_loss": -6.920270919799805, "global_step": 157475, "epoch": 3749} {"train_loss": -6.948184013366699, "global_step": 157476, "epoch": 3749} {"train_loss": -6.913778781890869, "global_step": 157477, "epoch": 3749} {"train_loss": -7.004389762878418, "global_step": 157478, "epoch": 3749} {"train_loss": -6.969899654388428, "global_step": 157479, "epoch": 3749} {"train_loss": -6.976410388946533, "global_step": 157480, "epoch": 3749} {"train_loss": -7.052931308746338, "global_step": 157481, "epoch": 3749} {"train_loss": -6.9604363441467285, "global_step": 157482, "epoch": 3749} {"train_loss": -6.873435974121094, "global_step": 157483, "epoch": 3749} {"train_loss": -7.046789169311523, "global_step": 157484, "epoch": 3749} {"train_loss": -7.045987129211426, "global_step": 157485, "epoch": 3749} {"train_loss": -6.88081169128418, "global_step": 157486, "epoch": 3749} {"train_loss": -6.917362213134766, "global_step": 157487, "epoch": 3749} {"train_loss": -6.863460540771484, "global_step": 157488, "epoch": 3749} {"train_loss": -6.9903106689453125, "global_step": 157489, "epoch": 3749} {"train_loss": -6.986845016479492, "global_step": 157490, "epoch": 3749} {"train_loss": -6.915693283081055, "global_step": 157491, "epoch": 3749} {"train_loss": -6.984443664550781, "global_step": 157492, "epoch": 3749} {"train_loss": -7.017154693603516, "global_step": 157493, "epoch": 3749} {"train_loss": -6.9023661613464355, "global_step": 157494, "epoch": 3749} {"train_loss": -6.876837730407715, "global_step": 157495, "epoch": 3749} {"train_loss": -6.842770576477051, "global_step": 157496, "epoch": 3749} {"train_loss": -7.070860862731934, "global_step": 157497, "epoch": 3749} {"train_loss": -6.970007419586182, "global_step": 157498, "epoch": 3749} {"train_loss": -6.959712448574248, "global_step": 157499, "epoch": 3749, "val_loss": 68383.6796875} {"train_loss": -7.11868143081665, "global_step": 157500, "epoch": 3750} {"train_loss": -6.910250663757324, "global_step": 157501, "epoch": 3750} {"train_loss": -6.8726091384887695, "global_step": 157502, "epoch": 3750} {"train_loss": -6.972080230712891, "global_step": 157503, "epoch": 3750} {"train_loss": -6.924619674682617, "global_step": 157504, "epoch": 3750} {"train_loss": -6.910473823547363, "global_step": 157505, "epoch": 3750} {"train_loss": -6.917457580566406, "global_step": 157506, "epoch": 3750} {"train_loss": -6.960619926452637, "global_step": 157507, "epoch": 3750} {"train_loss": -6.926510810852051, "global_step": 157508, "epoch": 3750} {"train_loss": -7.009387016296387, "global_step": 157509, "epoch": 3750} {"train_loss": -6.951367378234863, "global_step": 157510, "epoch": 3750} {"train_loss": -6.968411445617676, "global_step": 157511, "epoch": 3750} {"train_loss": -6.9591779708862305, "global_step": 157512, "epoch": 3750} {"train_loss": -7.008695602416992, "global_step": 157513, "epoch": 3750} {"train_loss": -6.963924407958984, "global_step": 157514, "epoch": 3750} {"train_loss": -7.016500949859619, "global_step": 157515, "epoch": 3750} {"train_loss": -6.940528869628906, "global_step": 157516, "epoch": 3750} {"train_loss": -7.012474060058594, "global_step": 157517, "epoch": 3750} {"train_loss": -6.927268981933594, "global_step": 157518, "epoch": 3750} {"train_loss": -7.045624732971191, "global_step": 157519, "epoch": 3750} {"train_loss": -7.026715278625488, "global_step": 157520, "epoch": 3750} {"train_loss": -7.0086846351623535, "global_step": 157521, "epoch": 3750} {"train_loss": -6.969047546386719, "global_step": 157522, "epoch": 3750} {"train_loss": -6.895968437194824, "global_step": 157523, "epoch": 3750} {"train_loss": -6.93108606338501, "global_step": 157524, "epoch": 3750} {"train_loss": -6.844208240509033, "global_step": 157525, "epoch": 3750} {"train_loss": -6.798514366149902, "global_step": 157526, "epoch": 3750} {"train_loss": -6.8362531661987305, "global_step": 157527, "epoch": 3750} {"train_loss": -6.988506317138672, "global_step": 157528, "epoch": 3750} {"train_loss": -6.869515419006348, "global_step": 157529, "epoch": 3750} {"train_loss": -6.9990034103393555, "global_step": 157530, "epoch": 3750} {"train_loss": -7.0572829246521, "global_step": 157531, "epoch": 3750} {"train_loss": -6.9544997215271, "global_step": 157532, "epoch": 3750} {"train_loss": -6.981836318969727, "global_step": 157533, "epoch": 3750} {"train_loss": -6.962989807128906, "global_step": 157534, "epoch": 3750} {"train_loss": -6.848602294921875, "global_step": 157535, "epoch": 3750} {"train_loss": -6.855390548706055, "global_step": 157536, "epoch": 3750} {"train_loss": -7.057181358337402, "global_step": 157537, "epoch": 3750} {"train_loss": -6.949804306030273, "global_step": 157538, "epoch": 3750} {"train_loss": -6.984789848327637, "global_step": 157539, "epoch": 3750} {"train_loss": -7.028158187866211, "global_step": 157540, "epoch": 3750} {"train_loss": -6.956303119659424, "global_step": 157541, "epoch": 3750, "train/sim_max_reward_0": 0.19288815612240448, "train/sim_max_reward_1": 0.9822177707679633, "train/sim_max_reward_2": 0.33896184736063506, "train/sim_max_reward_3": 0.9708972438594421, "train/sim_max_reward_4": 0.9314589870781025, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0, "test/sim_max_reward_4300001": 0.20965767108271588, "test/sim_max_reward_4300002": 0.9674734045125236, "test/sim_max_reward_4300003": 0.9877810348431048, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9647812143265008, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3377493373941959, "test/sim_max_reward_4300008": 0.9654997668365152, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.6645994923709804, "test/sim_max_reward_4300012": 0.783433252473819, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 0.9626654293858548, "test/sim_max_reward_4300015": 0.979799131042093, "test/sim_max_reward_4300016": 0.9137059108242915, "test/sim_max_reward_4300017": 0.8849796712796741, "test/sim_max_reward_4300018": 0.3968998349201434, "test/sim_max_reward_4300019": 0.18526677353710358, "test/sim_max_reward_4300020": 0.27602744706414833, "test/sim_max_reward_4300021": 0.820176022075197, "test/sim_max_reward_4300022": 0.9574052999649032, "test/sim_max_reward_4300023": 0.32876779218988883, "test/sim_max_reward_4300024": 1.0, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.25699408563460513, "test/sim_max_reward_4300027": 0.7751473588151456, "test/sim_max_reward_4300028": 0.3788722121418745, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.1577051411860276, "test/sim_max_reward_4300031": 0.9171688812777397, "test/sim_max_reward_4300032": 0.9833908256034926, "test/sim_max_reward_4300033": 0.6200377496039, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.5216279643976587, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8481804626864272, "test/sim_max_reward_4300038": 0.38364283780393726, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.8412593000863942, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7210400311388696, "test/sim_max_reward_4300043": 0.12308593529371771, "test/sim_max_reward_4300044": 0.9650786182264918, "test/sim_max_reward_4300045": 0.9760607351073397, "test/sim_max_reward_4300046": 0.9612435011125644, "test/sim_max_reward_4300047": 0.19215150953251023, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.22284846529184457, "train/mean_score": 0.6015681274251224, "test/mean_score": 0.5729446464287392, "val_loss": 68215.0859375} {"train_loss": -6.991168022155762, "global_step": 157542, "epoch": 3751} {"train_loss": -7.1358137130737305, "global_step": 157543, "epoch": 3751} {"train_loss": -6.977505683898926, "global_step": 157544, "epoch": 3751} {"train_loss": -7.02581787109375, "global_step": 157545, "epoch": 3751} {"train_loss": -7.031834602355957, "global_step": 157546, "epoch": 3751} {"train_loss": -7.063323974609375, "global_step": 157547, "epoch": 3751} {"train_loss": -6.924338340759277, "global_step": 157548, "epoch": 3751} {"train_loss": -6.956514835357666, "global_step": 157549, "epoch": 3751} {"train_loss": -7.013629913330078, "global_step": 157550, "epoch": 3751} {"train_loss": -6.935846328735352, "global_step": 157551, "epoch": 3751} {"train_loss": -6.9080657958984375, "global_step": 157552, "epoch": 3751} {"train_loss": -7.063044548034668, "global_step": 157553, "epoch": 3751} {"train_loss": -6.962460517883301, "global_step": 157554, "epoch": 3751} {"train_loss": -6.872964859008789, "global_step": 157555, "epoch": 3751} {"train_loss": -7.0118255615234375, "global_step": 157556, "epoch": 3751} {"train_loss": -6.952301979064941, "global_step": 157557, "epoch": 3751} {"train_loss": -6.995223045349121, "global_step": 157558, "epoch": 3751} {"train_loss": -6.988411903381348, "global_step": 157559, "epoch": 3751} {"train_loss": -6.898739814758301, "global_step": 157560, "epoch": 3751} {"train_loss": -7.030204772949219, "global_step": 157561, "epoch": 3751} {"train_loss": -7.008265495300293, "global_step": 157562, "epoch": 3751} {"train_loss": -6.869290351867676, "global_step": 157563, "epoch": 3751} {"train_loss": -6.924772262573242, "global_step": 157564, "epoch": 3751} {"train_loss": -6.815243721008301, "global_step": 157565, "epoch": 3751} {"train_loss": -6.83488655090332, "global_step": 157566, "epoch": 3751} {"train_loss": -6.84470272064209, "global_step": 157567, "epoch": 3751} {"train_loss": -6.956786155700684, "global_step": 157568, "epoch": 3751} {"train_loss": -6.9007744789123535, "global_step": 157569, "epoch": 3751} {"train_loss": -6.886171340942383, "global_step": 157570, "epoch": 3751} {"train_loss": -6.874349594116211, "global_step": 157571, "epoch": 3751} {"train_loss": -6.791888236999512, "global_step": 157572, "epoch": 3751} {"train_loss": -6.955440521240234, "global_step": 157573, "epoch": 3751} {"train_loss": -6.9458417892456055, "global_step": 157574, "epoch": 3751} {"train_loss": -6.962124824523926, "global_step": 157575, "epoch": 3751} {"train_loss": -6.897906303405762, "global_step": 157576, "epoch": 3751} {"train_loss": -6.962265968322754, "global_step": 157577, "epoch": 3751} {"train_loss": -6.911548137664795, "global_step": 157578, "epoch": 3751} {"train_loss": -6.918838977813721, "global_step": 157579, "epoch": 3751} {"train_loss": -6.858452320098877, "global_step": 157580, "epoch": 3751} {"train_loss": -6.920034885406494, "global_step": 157581, "epoch": 3751} {"train_loss": -6.962462425231934, "global_step": 157582, "epoch": 3751} {"train_loss": -6.944948798134213, "global_step": 157583, "epoch": 3751, "val_loss": 68338.7421875} {"train_loss": -6.944573402404785, "global_step": 157584, "epoch": 3752} {"train_loss": -6.974270820617676, "global_step": 157585, "epoch": 3752} {"train_loss": -6.945924758911133, "global_step": 157586, "epoch": 3752} {"train_loss": -7.039499282836914, "global_step": 157587, "epoch": 3752} {"train_loss": -7.020096778869629, "global_step": 157588, "epoch": 3752} {"train_loss": -6.984670639038086, "global_step": 157589, "epoch": 3752} {"train_loss": -6.944300651550293, "global_step": 157590, "epoch": 3752} {"train_loss": -7.031002044677734, "global_step": 157591, "epoch": 3752} {"train_loss": -7.058013916015625, "global_step": 157592, "epoch": 3752} {"train_loss": -6.860671520233154, "global_step": 157593, "epoch": 3752} {"train_loss": -6.848471641540527, "global_step": 157594, "epoch": 3752} {"train_loss": -6.931278228759766, "global_step": 157595, "epoch": 3752} {"train_loss": -6.985291481018066, "global_step": 157596, "epoch": 3752} {"train_loss": -6.907242298126221, "global_step": 157597, "epoch": 3752} {"train_loss": -6.898225784301758, "global_step": 157598, "epoch": 3752} {"train_loss": -6.884274959564209, "global_step": 157599, "epoch": 3752} {"train_loss": -6.91535758972168, "global_step": 157600, "epoch": 3752} {"train_loss": -6.931157112121582, "global_step": 157601, "epoch": 3752} {"train_loss": -6.945505142211914, "global_step": 157602, "epoch": 3752} {"train_loss": -6.929775238037109, "global_step": 157603, "epoch": 3752} {"train_loss": -6.925530910491943, "global_step": 157604, "epoch": 3752} {"train_loss": -6.946211338043213, "global_step": 157605, "epoch": 3752} {"train_loss": -6.888852119445801, "global_step": 157606, "epoch": 3752} {"train_loss": -6.909424781799316, "global_step": 157607, "epoch": 3752} {"train_loss": -6.833591461181641, "global_step": 157608, "epoch": 3752} {"train_loss": -6.882373809814453, "global_step": 157609, "epoch": 3752} {"train_loss": -7.018893241882324, "global_step": 157610, "epoch": 3752} {"train_loss": -6.84858512878418, "global_step": 157611, "epoch": 3752} {"train_loss": -6.937804222106934, "global_step": 157612, "epoch": 3752} {"train_loss": -7.004945755004883, "global_step": 157613, "epoch": 3752} {"train_loss": -6.753862380981445, "global_step": 157614, "epoch": 3752} {"train_loss": -6.973255157470703, "global_step": 157615, "epoch": 3752} {"train_loss": -6.804471492767334, "global_step": 157616, "epoch": 3752} {"train_loss": -6.854111194610596, "global_step": 157617, "epoch": 3752} {"train_loss": -6.879555702209473, "global_step": 157618, "epoch": 3752} {"train_loss": -6.876046180725098, "global_step": 157619, "epoch": 3752} {"train_loss": -7.0109405517578125, "global_step": 157620, "epoch": 3752} {"train_loss": -6.925191402435303, "global_step": 157621, "epoch": 3752} {"train_loss": -7.052809715270996, "global_step": 157622, "epoch": 3752} {"train_loss": -6.98292350769043, "global_step": 157623, "epoch": 3752} {"train_loss": -6.844074249267578, "global_step": 157624, "epoch": 3752} {"train_loss": -6.932427167892456, "global_step": 157625, "epoch": 3752, "val_loss": 68445.6875} {"train_loss": -6.920143127441406, "global_step": 157626, "epoch": 3753} {"train_loss": -6.9361572265625, "global_step": 157627, "epoch": 3753} {"train_loss": -6.974440574645996, "global_step": 157628, "epoch": 3753} {"train_loss": -6.941075325012207, "global_step": 157629, "epoch": 3753} {"train_loss": -6.897332191467285, "global_step": 157630, "epoch": 3753} {"train_loss": -6.890283584594727, "global_step": 157631, "epoch": 3753} {"train_loss": -6.91079044342041, "global_step": 157632, "epoch": 3753} {"train_loss": -6.959416389465332, "global_step": 157633, "epoch": 3753} {"train_loss": -6.993899822235107, "global_step": 157634, "epoch": 3753} {"train_loss": -7.017045021057129, "global_step": 157635, "epoch": 3753} {"train_loss": -7.020831108093262, "global_step": 157636, "epoch": 3753} {"train_loss": -6.8863205909729, "global_step": 157637, "epoch": 3753} {"train_loss": -6.885707378387451, "global_step": 157638, "epoch": 3753} {"train_loss": -6.913875579833984, "global_step": 157639, "epoch": 3753} {"train_loss": -6.903824806213379, "global_step": 157640, "epoch": 3753} {"train_loss": -7.104040622711182, "global_step": 157641, "epoch": 3753} {"train_loss": -6.966606140136719, "global_step": 157642, "epoch": 3753} {"train_loss": -6.83250617980957, "global_step": 157643, "epoch": 3753} {"train_loss": -6.858243465423584, "global_step": 157644, "epoch": 3753} {"train_loss": -7.025097846984863, "global_step": 157645, "epoch": 3753} {"train_loss": -6.947710037231445, "global_step": 157646, "epoch": 3753} {"train_loss": -6.948647499084473, "global_step": 157647, "epoch": 3753} {"train_loss": -6.890077590942383, "global_step": 157648, "epoch": 3753} {"train_loss": -6.974993705749512, "global_step": 157649, "epoch": 3753} {"train_loss": -6.96964693069458, "global_step": 157650, "epoch": 3753} {"train_loss": -6.923418998718262, "global_step": 157651, "epoch": 3753} {"train_loss": -6.8665266036987305, "global_step": 157652, "epoch": 3753} {"train_loss": -6.947356224060059, "global_step": 157653, "epoch": 3753} {"train_loss": -6.749476909637451, "global_step": 157654, "epoch": 3753} {"train_loss": -6.834361553192139, "global_step": 157655, "epoch": 3753} {"train_loss": -6.9631147384643555, "global_step": 157656, "epoch": 3753} {"train_loss": -6.8914103507995605, "global_step": 157657, "epoch": 3753} {"train_loss": -6.89591121673584, "global_step": 157658, "epoch": 3753} {"train_loss": -6.86571741104126, "global_step": 157659, "epoch": 3753} {"train_loss": -7.014822006225586, "global_step": 157660, "epoch": 3753} {"train_loss": -6.962820053100586, "global_step": 157661, "epoch": 3753} {"train_loss": -6.9924116134643555, "global_step": 157662, "epoch": 3753} {"train_loss": -6.941250324249268, "global_step": 157663, "epoch": 3753} {"train_loss": -6.970473766326904, "global_step": 157664, "epoch": 3753} {"train_loss": -6.976025581359863, "global_step": 157665, "epoch": 3753} {"train_loss": -6.824953079223633, "global_step": 157666, "epoch": 3753} {"train_loss": -6.931107691356114, "global_step": 157667, "epoch": 3753, "val_loss": 68522.4453125} {"train_loss": -6.956546783447266, "global_step": 157668, "epoch": 3754} {"train_loss": -6.856972694396973, "global_step": 157669, "epoch": 3754} {"train_loss": -6.9198102951049805, "global_step": 157670, "epoch": 3754} {"train_loss": -6.927921295166016, "global_step": 157671, "epoch": 3754} {"train_loss": -6.957012176513672, "global_step": 157672, "epoch": 3754} {"train_loss": -6.870648384094238, "global_step": 157673, "epoch": 3754} {"train_loss": -6.879630088806152, "global_step": 157674, "epoch": 3754} {"train_loss": -6.908674240112305, "global_step": 157675, "epoch": 3754} {"train_loss": -6.840936660766602, "global_step": 157676, "epoch": 3754} {"train_loss": -6.903317451477051, "global_step": 157677, "epoch": 3754} {"train_loss": -6.906899452209473, "global_step": 157678, "epoch": 3754} {"train_loss": -6.819789886474609, "global_step": 157679, "epoch": 3754} {"train_loss": -6.892544746398926, "global_step": 157680, "epoch": 3754} {"train_loss": -6.908755302429199, "global_step": 157681, "epoch": 3754} {"train_loss": -6.843746185302734, "global_step": 157682, "epoch": 3754} {"train_loss": -6.803586959838867, "global_step": 157683, "epoch": 3754} {"train_loss": -6.9401397705078125, "global_step": 157684, "epoch": 3754} {"train_loss": -6.830321311950684, "global_step": 157685, "epoch": 3754} {"train_loss": -6.938772678375244, "global_step": 157686, "epoch": 3754} {"train_loss": -6.916731834411621, "global_step": 157687, "epoch": 3754} {"train_loss": -6.992622375488281, "global_step": 157688, "epoch": 3754} {"train_loss": -6.966438293457031, "global_step": 157689, "epoch": 3754} {"train_loss": -6.916405200958252, "global_step": 157690, "epoch": 3754} {"train_loss": -6.820302486419678, "global_step": 157691, "epoch": 3754} {"train_loss": -6.850751876831055, "global_step": 157692, "epoch": 3754} {"train_loss": -6.799494743347168, "global_step": 157693, "epoch": 3754} {"train_loss": -6.76033878326416, "global_step": 157694, "epoch": 3754} {"train_loss": -6.970757961273193, "global_step": 157695, "epoch": 3754} {"train_loss": -6.92641544342041, "global_step": 157696, "epoch": 3754} {"train_loss": -6.745572090148926, "global_step": 157697, "epoch": 3754} {"train_loss": -6.942841529846191, "global_step": 157698, "epoch": 3754} {"train_loss": -6.861255645751953, "global_step": 157699, "epoch": 3754} {"train_loss": -6.850897789001465, "global_step": 157700, "epoch": 3754} {"train_loss": -6.977777481079102, "global_step": 157701, "epoch": 3754} {"train_loss": -6.817342758178711, "global_step": 157702, "epoch": 3754} {"train_loss": -6.965394973754883, "global_step": 157703, "epoch": 3754} {"train_loss": -6.8566389083862305, "global_step": 157704, "epoch": 3754} {"train_loss": -6.9465789794921875, "global_step": 157705, "epoch": 3754} {"train_loss": -6.962498664855957, "global_step": 157706, "epoch": 3754} {"train_loss": -6.833325386047363, "global_step": 157707, "epoch": 3754} {"train_loss": -6.998224258422852, "global_step": 157708, "epoch": 3754} {"train_loss": -6.895477215449016, "global_step": 157709, "epoch": 3754, "val_loss": 68521.9140625} {"train_loss": -6.989859580993652, "global_step": 157710, "epoch": 3755} {"train_loss": -6.949965476989746, "global_step": 157711, "epoch": 3755} {"train_loss": -6.954470634460449, "global_step": 157712, "epoch": 3755} {"train_loss": -7.016174793243408, "global_step": 157713, "epoch": 3755} {"train_loss": -6.933592796325684, "global_step": 157714, "epoch": 3755} {"train_loss": -6.938596725463867, "global_step": 157715, "epoch": 3755} {"train_loss": -6.975787162780762, "global_step": 157716, "epoch": 3755} {"train_loss": -6.971550941467285, "global_step": 157717, "epoch": 3755} {"train_loss": -6.903847694396973, "global_step": 157718, "epoch": 3755} {"train_loss": -6.943516731262207, "global_step": 157719, "epoch": 3755} {"train_loss": -6.990898132324219, "global_step": 157720, "epoch": 3755} {"train_loss": -6.924363136291504, "global_step": 157721, "epoch": 3755} {"train_loss": -6.837137699127197, "global_step": 157722, "epoch": 3755} {"train_loss": -6.977712631225586, "global_step": 157723, "epoch": 3755} {"train_loss": -6.943638801574707, "global_step": 157724, "epoch": 3755} {"train_loss": -6.9969587326049805, "global_step": 157725, "epoch": 3755} {"train_loss": -6.904359817504883, "global_step": 157726, "epoch": 3755} {"train_loss": -6.991453170776367, "global_step": 157727, "epoch": 3755} {"train_loss": -6.949638843536377, "global_step": 157728, "epoch": 3755} {"train_loss": -6.984750270843506, "global_step": 157729, "epoch": 3755} {"train_loss": -6.863530158996582, "global_step": 157730, "epoch": 3755} {"train_loss": -6.96672248840332, "global_step": 157731, "epoch": 3755} {"train_loss": -6.898132801055908, "global_step": 157732, "epoch": 3755} {"train_loss": -6.985819339752197, "global_step": 157733, "epoch": 3755} {"train_loss": -6.940899848937988, "global_step": 157734, "epoch": 3755} {"train_loss": -6.976096153259277, "global_step": 157735, "epoch": 3755} {"train_loss": -6.929403305053711, "global_step": 157736, "epoch": 3755} {"train_loss": -6.945169448852539, "global_step": 157737, "epoch": 3755} {"train_loss": -6.883375644683838, "global_step": 157738, "epoch": 3755} {"train_loss": -6.828551292419434, "global_step": 157739, "epoch": 3755} {"train_loss": -7.067778587341309, "global_step": 157740, "epoch": 3755} {"train_loss": -6.830265998840332, "global_step": 157741, "epoch": 3755} {"train_loss": -6.905185699462891, "global_step": 157742, "epoch": 3755} {"train_loss": -6.890252113342285, "global_step": 157743, "epoch": 3755} {"train_loss": -6.843976974487305, "global_step": 157744, "epoch": 3755} {"train_loss": -6.854102611541748, "global_step": 157745, "epoch": 3755} {"train_loss": -6.954793453216553, "global_step": 157746, "epoch": 3755} {"train_loss": -6.810965538024902, "global_step": 157747, "epoch": 3755} {"train_loss": -6.850503921508789, "global_step": 157748, "epoch": 3755} {"train_loss": -6.880713939666748, "global_step": 157749, "epoch": 3755} {"train_loss": -6.921030044555664, "global_step": 157750, "epoch": 3755} {"train_loss": -6.926028001876104, "global_step": 157751, "epoch": 3755, "val_loss": 68489.7890625} {"train_loss": -6.846129417419434, "global_step": 157752, "epoch": 3756} {"train_loss": -6.870383262634277, "global_step": 157753, "epoch": 3756} {"train_loss": -6.676058292388916, "global_step": 157754, "epoch": 3756} {"train_loss": -6.9787821769714355, "global_step": 157755, "epoch": 3756} {"train_loss": -6.7521772384643555, "global_step": 157756, "epoch": 3756} {"train_loss": -6.80355978012085, "global_step": 157757, "epoch": 3756} {"train_loss": -6.8666863441467285, "global_step": 157758, "epoch": 3756} {"train_loss": -6.706245422363281, "global_step": 157759, "epoch": 3756} {"train_loss": -6.818130970001221, "global_step": 157760, "epoch": 3756} {"train_loss": -6.843449115753174, "global_step": 157761, "epoch": 3756} {"train_loss": -6.764505386352539, "global_step": 157762, "epoch": 3756} {"train_loss": -6.781545639038086, "global_step": 157763, "epoch": 3756} {"train_loss": -6.8725786209106445, "global_step": 157764, "epoch": 3756} {"train_loss": -6.890160083770752, "global_step": 157765, "epoch": 3756} {"train_loss": -6.924328327178955, "global_step": 157766, "epoch": 3756} {"train_loss": -6.701898574829102, "global_step": 157767, "epoch": 3756} {"train_loss": -6.7912397384643555, "global_step": 157768, "epoch": 3756} {"train_loss": -6.938848495483398, "global_step": 157769, "epoch": 3756} {"train_loss": -6.76271915435791, "global_step": 157770, "epoch": 3756} {"train_loss": -6.927833080291748, "global_step": 157771, "epoch": 3756} {"train_loss": -6.794353485107422, "global_step": 157772, "epoch": 3756} {"train_loss": -6.913348197937012, "global_step": 157773, "epoch": 3756} {"train_loss": -6.919962406158447, "global_step": 157774, "epoch": 3756} {"train_loss": -6.817992210388184, "global_step": 157775, "epoch": 3756} {"train_loss": -6.914021015167236, "global_step": 157776, "epoch": 3756} {"train_loss": -6.852083683013916, "global_step": 157777, "epoch": 3756} {"train_loss": -6.856015682220459, "global_step": 157778, "epoch": 3756} {"train_loss": -6.892959117889404, "global_step": 157779, "epoch": 3756} {"train_loss": -6.802234172821045, "global_step": 157780, "epoch": 3756} {"train_loss": -6.885348320007324, "global_step": 157781, "epoch": 3756} {"train_loss": -6.929958820343018, "global_step": 157782, "epoch": 3756} {"train_loss": -6.956325054168701, "global_step": 157783, "epoch": 3756} {"train_loss": -6.9356489181518555, "global_step": 157784, "epoch": 3756} {"train_loss": -6.859813690185547, "global_step": 157785, "epoch": 3756} {"train_loss": -6.947667121887207, "global_step": 157786, "epoch": 3756} {"train_loss": -6.967440605163574, "global_step": 157787, "epoch": 3756} {"train_loss": -6.968332767486572, "global_step": 157788, "epoch": 3756} {"train_loss": -6.9618048667907715, "global_step": 157789, "epoch": 3756} {"train_loss": -6.961855888366699, "global_step": 157790, "epoch": 3756} {"train_loss": -6.928524971008301, "global_step": 157791, "epoch": 3756} {"train_loss": -7.017927646636963, "global_step": 157792, "epoch": 3756} {"train_loss": -6.867826529911587, "global_step": 157793, "epoch": 3756, "val_loss": 68450.2734375} {"train_loss": -6.953502655029297, "global_step": 157794, "epoch": 3757} {"train_loss": -6.931122303009033, "global_step": 157795, "epoch": 3757} {"train_loss": -7.024115562438965, "global_step": 157796, "epoch": 3757} {"train_loss": -6.840334892272949, "global_step": 157797, "epoch": 3757} {"train_loss": -6.858989715576172, "global_step": 157798, "epoch": 3757} {"train_loss": -6.853817939758301, "global_step": 157799, "epoch": 3757} {"train_loss": -6.950592041015625, "global_step": 157800, "epoch": 3757} {"train_loss": -6.893685817718506, "global_step": 157801, "epoch": 3757} {"train_loss": -7.000428199768066, "global_step": 157802, "epoch": 3757} {"train_loss": -6.963225841522217, "global_step": 157803, "epoch": 3757} {"train_loss": -6.8972601890563965, "global_step": 157804, "epoch": 3757} {"train_loss": -6.902170181274414, "global_step": 157805, "epoch": 3757} {"train_loss": -7.048479080200195, "global_step": 157806, "epoch": 3757} {"train_loss": -6.997199058532715, "global_step": 157807, "epoch": 3757} {"train_loss": -6.935935020446777, "global_step": 157808, "epoch": 3757} {"train_loss": -6.916450023651123, "global_step": 157809, "epoch": 3757} {"train_loss": -6.9992451667785645, "global_step": 157810, "epoch": 3757} {"train_loss": -6.879466533660889, "global_step": 157811, "epoch": 3757} {"train_loss": -6.783164978027344, "global_step": 157812, "epoch": 3757} {"train_loss": -7.015079975128174, "global_step": 157813, "epoch": 3757} {"train_loss": -6.952888488769531, "global_step": 157814, "epoch": 3757} {"train_loss": -6.929166316986084, "global_step": 157815, "epoch": 3757} {"train_loss": -6.9181742668151855, "global_step": 157816, "epoch": 3757} {"train_loss": -6.914259910583496, "global_step": 157817, "epoch": 3757} {"train_loss": -6.9337053298950195, "global_step": 157818, "epoch": 3757} {"train_loss": -6.885566711425781, "global_step": 157819, "epoch": 3757} {"train_loss": -6.882026672363281, "global_step": 157820, "epoch": 3757} {"train_loss": -6.904813289642334, "global_step": 157821, "epoch": 3757} {"train_loss": -6.937981605529785, "global_step": 157822, "epoch": 3757} {"train_loss": -6.850517749786377, "global_step": 157823, "epoch": 3757} {"train_loss": -6.884972095489502, "global_step": 157824, "epoch": 3757} {"train_loss": -6.893320083618164, "global_step": 157825, "epoch": 3757} {"train_loss": -6.955244541168213, "global_step": 157826, "epoch": 3757} {"train_loss": -6.757739067077637, "global_step": 157827, "epoch": 3757} {"train_loss": -6.804161548614502, "global_step": 157828, "epoch": 3757} {"train_loss": -6.75680685043335, "global_step": 157829, "epoch": 3757} {"train_loss": -6.658267974853516, "global_step": 157830, "epoch": 3757} {"train_loss": -6.8222174644470215, "global_step": 157831, "epoch": 3757} {"train_loss": -6.844256401062012, "global_step": 157832, "epoch": 3757} {"train_loss": -6.920515060424805, "global_step": 157833, "epoch": 3757} {"train_loss": -6.9119439125061035, "global_step": 157834, "epoch": 3757} {"train_loss": -6.8966170606159025, "global_step": 157835, "epoch": 3757, "val_loss": 68403.921875} {"train_loss": -6.990335941314697, "global_step": 157836, "epoch": 3758} {"train_loss": -6.778324604034424, "global_step": 157837, "epoch": 3758} {"train_loss": -6.871701240539551, "global_step": 157838, "epoch": 3758} {"train_loss": -6.736390113830566, "global_step": 157839, "epoch": 3758} {"train_loss": -6.779899597167969, "global_step": 157840, "epoch": 3758} {"train_loss": -6.926729202270508, "global_step": 157841, "epoch": 3758} {"train_loss": -6.6744384765625, "global_step": 157842, "epoch": 3758} {"train_loss": -6.848262786865234, "global_step": 157843, "epoch": 3758} {"train_loss": -6.63309383392334, "global_step": 157844, "epoch": 3758} {"train_loss": -6.882272720336914, "global_step": 157845, "epoch": 3758} {"train_loss": -6.699963569641113, "global_step": 157846, "epoch": 3758} {"train_loss": -6.966245174407959, "global_step": 157847, "epoch": 3758} {"train_loss": -6.897160530090332, "global_step": 157848, "epoch": 3758} {"train_loss": -6.9278364181518555, "global_step": 157849, "epoch": 3758} {"train_loss": -6.876267910003662, "global_step": 157850, "epoch": 3758} {"train_loss": -6.918753623962402, "global_step": 157851, "epoch": 3758} {"train_loss": -6.927080154418945, "global_step": 157852, "epoch": 3758} {"train_loss": -6.912508010864258, "global_step": 157853, "epoch": 3758} {"train_loss": -6.751154899597168, "global_step": 157854, "epoch": 3758} {"train_loss": -6.916505813598633, "global_step": 157855, "epoch": 3758} {"train_loss": -6.812813758850098, "global_step": 157856, "epoch": 3758} {"train_loss": -6.8325910568237305, "global_step": 157857, "epoch": 3758} {"train_loss": -6.990362167358398, "global_step": 157858, "epoch": 3758} {"train_loss": -6.872908592224121, "global_step": 157859, "epoch": 3758} {"train_loss": -6.730932235717773, "global_step": 157860, "epoch": 3758} {"train_loss": -6.816145896911621, "global_step": 157861, "epoch": 3758} {"train_loss": -6.887542724609375, "global_step": 157862, "epoch": 3758} {"train_loss": -6.878687381744385, "global_step": 157863, "epoch": 3758} {"train_loss": -6.835694789886475, "global_step": 157864, "epoch": 3758} {"train_loss": -6.831578731536865, "global_step": 157865, "epoch": 3758} {"train_loss": -6.857257843017578, "global_step": 157866, "epoch": 3758} {"train_loss": -6.941690921783447, "global_step": 157867, "epoch": 3758} {"train_loss": -6.867114543914795, "global_step": 157868, "epoch": 3758} {"train_loss": -6.9358038902282715, "global_step": 157869, "epoch": 3758} {"train_loss": -6.969898223876953, "global_step": 157870, "epoch": 3758} {"train_loss": -6.86588191986084, "global_step": 157871, "epoch": 3758} {"train_loss": -6.977406024932861, "global_step": 157872, "epoch": 3758} {"train_loss": -6.864830017089844, "global_step": 157873, "epoch": 3758} {"train_loss": -6.828998565673828, "global_step": 157874, "epoch": 3758} {"train_loss": -6.819612503051758, "global_step": 157875, "epoch": 3758} {"train_loss": -6.846525192260742, "global_step": 157876, "epoch": 3758} {"train_loss": -6.858197087333316, "global_step": 157877, "epoch": 3758, "val_loss": 68564.7578125} {"train_loss": -6.887684345245361, "global_step": 157878, "epoch": 3759} {"train_loss": -6.82163143157959, "global_step": 157879, "epoch": 3759} {"train_loss": -6.959010124206543, "global_step": 157880, "epoch": 3759} {"train_loss": -6.911128520965576, "global_step": 157881, "epoch": 3759} {"train_loss": -6.832759857177734, "global_step": 157882, "epoch": 3759} {"train_loss": -6.9050397872924805, "global_step": 157883, "epoch": 3759} {"train_loss": -6.903774738311768, "global_step": 157884, "epoch": 3759} {"train_loss": -6.846776008605957, "global_step": 157885, "epoch": 3759} {"train_loss": -6.883058071136475, "global_step": 157886, "epoch": 3759} {"train_loss": -7.0125226974487305, "global_step": 157887, "epoch": 3759} {"train_loss": -6.99822998046875, "global_step": 157888, "epoch": 3759} {"train_loss": -6.964339256286621, "global_step": 157889, "epoch": 3759} {"train_loss": -6.884282112121582, "global_step": 157890, "epoch": 3759} {"train_loss": -6.981741905212402, "global_step": 157891, "epoch": 3759} {"train_loss": -7.018049240112305, "global_step": 157892, "epoch": 3759} {"train_loss": -6.8843889236450195, "global_step": 157893, "epoch": 3759} {"train_loss": -6.900109767913818, "global_step": 157894, "epoch": 3759} {"train_loss": -7.036722183227539, "global_step": 157895, "epoch": 3759} {"train_loss": -6.861337661743164, "global_step": 157896, "epoch": 3759} {"train_loss": -6.953216552734375, "global_step": 157897, "epoch": 3759} {"train_loss": -6.845270156860352, "global_step": 157898, "epoch": 3759} {"train_loss": -6.985074043273926, "global_step": 157899, "epoch": 3759} {"train_loss": -6.828854560852051, "global_step": 157900, "epoch": 3759} {"train_loss": -6.851558685302734, "global_step": 157901, "epoch": 3759} {"train_loss": -7.067617416381836, "global_step": 157902, "epoch": 3759} {"train_loss": -6.9506001472473145, "global_step": 157903, "epoch": 3759} {"train_loss": -7.002353668212891, "global_step": 157904, "epoch": 3759} {"train_loss": -6.9331769943237305, "global_step": 157905, "epoch": 3759} {"train_loss": -6.934660911560059, "global_step": 157906, "epoch": 3759} {"train_loss": -6.897125720977783, "global_step": 157907, "epoch": 3759} {"train_loss": -6.897340774536133, "global_step": 157908, "epoch": 3759} {"train_loss": -6.936859130859375, "global_step": 157909, "epoch": 3759} {"train_loss": -6.961747646331787, "global_step": 157910, "epoch": 3759} {"train_loss": -6.8562421798706055, "global_step": 157911, "epoch": 3759} {"train_loss": -6.864320755004883, "global_step": 157912, "epoch": 3759} {"train_loss": -6.8861985206604, "global_step": 157913, "epoch": 3759} {"train_loss": -6.733835220336914, "global_step": 157914, "epoch": 3759} {"train_loss": -6.928523540496826, "global_step": 157915, "epoch": 3759} {"train_loss": -6.923463344573975, "global_step": 157916, "epoch": 3759} {"train_loss": -6.897652626037598, "global_step": 157917, "epoch": 3759} {"train_loss": -6.9599761962890625, "global_step": 157918, "epoch": 3759} {"train_loss": -6.91631631624131, "global_step": 157919, "epoch": 3759, "val_loss": 68268.0078125} {"train_loss": -6.916154861450195, "global_step": 157920, "epoch": 3760} {"train_loss": -7.102428913116455, "global_step": 157921, "epoch": 3760} {"train_loss": -6.945052146911621, "global_step": 157922, "epoch": 3760} {"train_loss": -7.018196105957031, "global_step": 157923, "epoch": 3760} {"train_loss": -6.8167572021484375, "global_step": 157924, "epoch": 3760} {"train_loss": -6.927746772766113, "global_step": 157925, "epoch": 3760} {"train_loss": -6.959437370300293, "global_step": 157926, "epoch": 3760} {"train_loss": -6.8929219245910645, "global_step": 157927, "epoch": 3760} {"train_loss": -6.989922046661377, "global_step": 157928, "epoch": 3760} {"train_loss": -6.854124546051025, "global_step": 157929, "epoch": 3760} {"train_loss": -6.972789287567139, "global_step": 157930, "epoch": 3760} {"train_loss": -7.012010097503662, "global_step": 157931, "epoch": 3760} {"train_loss": -6.916075706481934, "global_step": 157932, "epoch": 3760} {"train_loss": -7.023677825927734, "global_step": 157933, "epoch": 3760} {"train_loss": -6.942129135131836, "global_step": 157934, "epoch": 3760} {"train_loss": -6.880301475524902, "global_step": 157935, "epoch": 3760} {"train_loss": -7.025054454803467, "global_step": 157936, "epoch": 3760} {"train_loss": -6.8253068923950195, "global_step": 157937, "epoch": 3760} {"train_loss": -6.946806907653809, "global_step": 157938, "epoch": 3760} {"train_loss": -6.940792083740234, "global_step": 157939, "epoch": 3760} {"train_loss": -6.9015116691589355, "global_step": 157940, "epoch": 3760} {"train_loss": -7.034839630126953, "global_step": 157941, "epoch": 3760} {"train_loss": -7.040261268615723, "global_step": 157942, "epoch": 3760} {"train_loss": -6.994977951049805, "global_step": 157943, "epoch": 3760} {"train_loss": -6.839443683624268, "global_step": 157944, "epoch": 3760} {"train_loss": -6.9732561111450195, "global_step": 157945, "epoch": 3760} {"train_loss": -6.976039886474609, "global_step": 157946, "epoch": 3760} {"train_loss": -6.79913854598999, "global_step": 157947, "epoch": 3760} {"train_loss": -6.852309226989746, "global_step": 157948, "epoch": 3760} {"train_loss": -7.019763946533203, "global_step": 157949, "epoch": 3760} {"train_loss": -6.843047142028809, "global_step": 157950, "epoch": 3760} {"train_loss": -6.96087121963501, "global_step": 157951, "epoch": 3760} {"train_loss": -6.914135932922363, "global_step": 157952, "epoch": 3760} {"train_loss": -6.772151470184326, "global_step": 157953, "epoch": 3760} {"train_loss": -6.860384941101074, "global_step": 157954, "epoch": 3760} {"train_loss": -6.864647388458252, "global_step": 157955, "epoch": 3760} {"train_loss": -7.00381326675415, "global_step": 157956, "epoch": 3760} {"train_loss": -6.815364360809326, "global_step": 157957, "epoch": 3760} {"train_loss": -6.7326860427856445, "global_step": 157958, "epoch": 3760} {"train_loss": -6.957212448120117, "global_step": 157959, "epoch": 3760} {"train_loss": -6.881467819213867, "global_step": 157960, "epoch": 3760} {"train_loss": -6.926674070812407, "global_step": 157961, "epoch": 3760, "val_loss": 68496.5390625} {"train_loss": -6.889825820922852, "global_step": 157962, "epoch": 3761} {"train_loss": -6.916111946105957, "global_step": 157963, "epoch": 3761} {"train_loss": -6.880764007568359, "global_step": 157964, "epoch": 3761} {"train_loss": -6.894705295562744, "global_step": 157965, "epoch": 3761} {"train_loss": -6.943535804748535, "global_step": 157966, "epoch": 3761} {"train_loss": -6.82078218460083, "global_step": 157967, "epoch": 3761} {"train_loss": -6.882424354553223, "global_step": 157968, "epoch": 3761} {"train_loss": -6.950233459472656, "global_step": 157969, "epoch": 3761} {"train_loss": -6.8938446044921875, "global_step": 157970, "epoch": 3761} {"train_loss": -6.871150016784668, "global_step": 157971, "epoch": 3761} {"train_loss": -6.929965972900391, "global_step": 157972, "epoch": 3761} {"train_loss": -6.918009281158447, "global_step": 157973, "epoch": 3761} {"train_loss": -7.015435218811035, "global_step": 157974, "epoch": 3761} {"train_loss": -6.909609794616699, "global_step": 157975, "epoch": 3761} {"train_loss": -6.856308937072754, "global_step": 157976, "epoch": 3761} {"train_loss": -6.9558820724487305, "global_step": 157977, "epoch": 3761} {"train_loss": -6.974443435668945, "global_step": 157978, "epoch": 3761} {"train_loss": -7.0223870277404785, "global_step": 157979, "epoch": 3761} {"train_loss": -6.931905746459961, "global_step": 157980, "epoch": 3761} {"train_loss": -6.8231425285339355, "global_step": 157981, "epoch": 3761} {"train_loss": -6.947294235229492, "global_step": 157982, "epoch": 3761} {"train_loss": -6.861682891845703, "global_step": 157983, "epoch": 3761} {"train_loss": -6.930822849273682, "global_step": 157984, "epoch": 3761} {"train_loss": -6.938539981842041, "global_step": 157985, "epoch": 3761} {"train_loss": -6.8118720054626465, "global_step": 157986, "epoch": 3761} {"train_loss": -7.0138702392578125, "global_step": 157987, "epoch": 3761} {"train_loss": -6.819053649902344, "global_step": 157988, "epoch": 3761} {"train_loss": -6.945953845977783, "global_step": 157989, "epoch": 3761} {"train_loss": -7.014655113220215, "global_step": 157990, "epoch": 3761} {"train_loss": -6.835814476013184, "global_step": 157991, "epoch": 3761} {"train_loss": -7.056241035461426, "global_step": 157992, "epoch": 3761} {"train_loss": -6.88823938369751, "global_step": 157993, "epoch": 3761} {"train_loss": -6.916378974914551, "global_step": 157994, "epoch": 3761} {"train_loss": -6.979820728302002, "global_step": 157995, "epoch": 3761} {"train_loss": -6.946311950683594, "global_step": 157996, "epoch": 3761} {"train_loss": -6.884185791015625, "global_step": 157997, "epoch": 3761} {"train_loss": -6.830039978027344, "global_step": 157998, "epoch": 3761} {"train_loss": -6.909618377685547, "global_step": 157999, "epoch": 3761} {"train_loss": -6.986727714538574, "global_step": 158000, "epoch": 3761} {"train_loss": -6.861464500427246, "global_step": 158001, "epoch": 3761} {"train_loss": -6.824270248413086, "global_step": 158002, "epoch": 3761} {"train_loss": -6.916187309083485, "global_step": 158003, "epoch": 3761, "val_loss": 68298.6015625} {"train_loss": -6.9792914390563965, "global_step": 158004, "epoch": 3762} {"train_loss": -6.9018168449401855, "global_step": 158005, "epoch": 3762} {"train_loss": -6.912286758422852, "global_step": 158006, "epoch": 3762} {"train_loss": -6.923816204071045, "global_step": 158007, "epoch": 3762} {"train_loss": -7.009332656860352, "global_step": 158008, "epoch": 3762} {"train_loss": -6.934637069702148, "global_step": 158009, "epoch": 3762} {"train_loss": -6.897525310516357, "global_step": 158010, "epoch": 3762} {"train_loss": -6.849340438842773, "global_step": 158011, "epoch": 3762} {"train_loss": -6.922455787658691, "global_step": 158012, "epoch": 3762} {"train_loss": -7.036148548126221, "global_step": 158013, "epoch": 3762} {"train_loss": -7.018378734588623, "global_step": 158014, "epoch": 3762} {"train_loss": -6.9750518798828125, "global_step": 158015, "epoch": 3762} {"train_loss": -6.964874267578125, "global_step": 158016, "epoch": 3762} {"train_loss": -7.023331642150879, "global_step": 158017, "epoch": 3762} {"train_loss": -7.001624584197998, "global_step": 158018, "epoch": 3762} {"train_loss": -6.94556999206543, "global_step": 158019, "epoch": 3762} {"train_loss": -6.9882941246032715, "global_step": 158020, "epoch": 3762} {"train_loss": -6.924887180328369, "global_step": 158021, "epoch": 3762} {"train_loss": -6.846561908721924, "global_step": 158022, "epoch": 3762} {"train_loss": -6.8705854415893555, "global_step": 158023, "epoch": 3762} {"train_loss": -6.796834945678711, "global_step": 158024, "epoch": 3762} {"train_loss": -6.945102691650391, "global_step": 158025, "epoch": 3762} {"train_loss": -6.907863616943359, "global_step": 158026, "epoch": 3762} {"train_loss": -6.947080612182617, "global_step": 158027, "epoch": 3762} {"train_loss": -7.098903179168701, "global_step": 158028, "epoch": 3762} {"train_loss": -6.95082950592041, "global_step": 158029, "epoch": 3762} {"train_loss": -7.008296966552734, "global_step": 158030, "epoch": 3762} {"train_loss": -7.0213422775268555, "global_step": 158031, "epoch": 3762} {"train_loss": -6.822304725646973, "global_step": 158032, "epoch": 3762} {"train_loss": -7.032387733459473, "global_step": 158033, "epoch": 3762} {"train_loss": -6.884611129760742, "global_step": 158034, "epoch": 3762} {"train_loss": -6.887263298034668, "global_step": 158035, "epoch": 3762} {"train_loss": -6.922210216522217, "global_step": 158036, "epoch": 3762} {"train_loss": -6.952408790588379, "global_step": 158037, "epoch": 3762} {"train_loss": -6.840234756469727, "global_step": 158038, "epoch": 3762} {"train_loss": -6.869976043701172, "global_step": 158039, "epoch": 3762} {"train_loss": -6.87493896484375, "global_step": 158040, "epoch": 3762} {"train_loss": -6.930741786956787, "global_step": 158041, "epoch": 3762} {"train_loss": -7.052639007568359, "global_step": 158042, "epoch": 3762} {"train_loss": -6.893363952636719, "global_step": 158043, "epoch": 3762} {"train_loss": -6.8996195793151855, "global_step": 158044, "epoch": 3762} {"train_loss": -6.937762975692749, "global_step": 158045, "epoch": 3762, "val_loss": 68441.4921875} {"train_loss": -6.767924785614014, "global_step": 158046, "epoch": 3763} {"train_loss": -7.013652801513672, "global_step": 158047, "epoch": 3763} {"train_loss": -7.065122604370117, "global_step": 158048, "epoch": 3763} {"train_loss": -6.996612548828125, "global_step": 158049, "epoch": 3763} {"train_loss": -6.953350067138672, "global_step": 158050, "epoch": 3763} {"train_loss": -6.970831871032715, "global_step": 158051, "epoch": 3763} {"train_loss": -6.979706764221191, "global_step": 158052, "epoch": 3763} {"train_loss": -6.884726524353027, "global_step": 158053, "epoch": 3763} {"train_loss": -6.964572429656982, "global_step": 158054, "epoch": 3763} {"train_loss": -6.8729047775268555, "global_step": 158055, "epoch": 3763} {"train_loss": -6.959166526794434, "global_step": 158056, "epoch": 3763} {"train_loss": -7.024892330169678, "global_step": 158057, "epoch": 3763} {"train_loss": -6.957596778869629, "global_step": 158058, "epoch": 3763} {"train_loss": -7.075352668762207, "global_step": 158059, "epoch": 3763} {"train_loss": -6.9387664794921875, "global_step": 158060, "epoch": 3763} {"train_loss": -7.0144805908203125, "global_step": 158061, "epoch": 3763} {"train_loss": -6.963539123535156, "global_step": 158062, "epoch": 3763} {"train_loss": -6.965307235717773, "global_step": 158063, "epoch": 3763} {"train_loss": -6.918237686157227, "global_step": 158064, "epoch": 3763} {"train_loss": -6.969950199127197, "global_step": 158065, "epoch": 3763} {"train_loss": -6.854085922241211, "global_step": 158066, "epoch": 3763} {"train_loss": -6.932833671569824, "global_step": 158067, "epoch": 3763} {"train_loss": -6.991679668426514, "global_step": 158068, "epoch": 3763} {"train_loss": -6.990063667297363, "global_step": 158069, "epoch": 3763} {"train_loss": -6.967276573181152, "global_step": 158070, "epoch": 3763} {"train_loss": -6.929313659667969, "global_step": 158071, "epoch": 3763} {"train_loss": -6.972716331481934, "global_step": 158072, "epoch": 3763} {"train_loss": -7.134524345397949, "global_step": 158073, "epoch": 3763} {"train_loss": -7.000389575958252, "global_step": 158074, "epoch": 3763} {"train_loss": -6.942047119140625, "global_step": 158075, "epoch": 3763} {"train_loss": -6.992761611938477, "global_step": 158076, "epoch": 3763} {"train_loss": -7.030679702758789, "global_step": 158077, "epoch": 3763} {"train_loss": -6.912376403808594, "global_step": 158078, "epoch": 3763} {"train_loss": -6.940820693969727, "global_step": 158079, "epoch": 3763} {"train_loss": -6.879579544067383, "global_step": 158080, "epoch": 3763} {"train_loss": -6.865453720092773, "global_step": 158081, "epoch": 3763} {"train_loss": -6.846621990203857, "global_step": 158082, "epoch": 3763} {"train_loss": -7.005952835083008, "global_step": 158083, "epoch": 3763} {"train_loss": -6.9164557456970215, "global_step": 158084, "epoch": 3763} {"train_loss": -6.934573173522949, "global_step": 158085, "epoch": 3763} {"train_loss": -7.041356086730957, "global_step": 158086, "epoch": 3763} {"train_loss": -6.96030330657959, "global_step": 158087, "epoch": 3763, "val_loss": 68545.4375} {"train_loss": -6.861789226531982, "global_step": 158088, "epoch": 3764} {"train_loss": -6.851351737976074, "global_step": 158089, "epoch": 3764} {"train_loss": -6.836124897003174, "global_step": 158090, "epoch": 3764} {"train_loss": -6.733621597290039, "global_step": 158091, "epoch": 3764} {"train_loss": -6.866278648376465, "global_step": 158092, "epoch": 3764} {"train_loss": -6.832973480224609, "global_step": 158093, "epoch": 3764} {"train_loss": -6.705624580383301, "global_step": 158094, "epoch": 3764} {"train_loss": -6.984321594238281, "global_step": 158095, "epoch": 3764} {"train_loss": -6.8147969245910645, "global_step": 158096, "epoch": 3764} {"train_loss": -6.763787269592285, "global_step": 158097, "epoch": 3764} {"train_loss": -6.84254264831543, "global_step": 158098, "epoch": 3764} {"train_loss": -6.7709503173828125, "global_step": 158099, "epoch": 3764} {"train_loss": -6.877140045166016, "global_step": 158100, "epoch": 3764} {"train_loss": -6.784763336181641, "global_step": 158101, "epoch": 3764} {"train_loss": -6.733590602874756, "global_step": 158102, "epoch": 3764} {"train_loss": -6.893414497375488, "global_step": 158103, "epoch": 3764} {"train_loss": -7.015654563903809, "global_step": 158104, "epoch": 3764} {"train_loss": -6.8110504150390625, "global_step": 158105, "epoch": 3764} {"train_loss": -6.887448310852051, "global_step": 158106, "epoch": 3764} {"train_loss": -6.896150588989258, "global_step": 158107, "epoch": 3764} {"train_loss": -6.799823760986328, "global_step": 158108, "epoch": 3764} {"train_loss": -6.910967826843262, "global_step": 158109, "epoch": 3764} {"train_loss": -6.903980255126953, "global_step": 158110, "epoch": 3764} {"train_loss": -6.881021976470947, "global_step": 158111, "epoch": 3764} {"train_loss": -6.842302322387695, "global_step": 158112, "epoch": 3764} {"train_loss": -6.911315441131592, "global_step": 158113, "epoch": 3764} {"train_loss": -6.95535945892334, "global_step": 158114, "epoch": 3764} {"train_loss": -6.843536853790283, "global_step": 158115, "epoch": 3764} {"train_loss": -6.989516258239746, "global_step": 158116, "epoch": 3764} {"train_loss": -6.906162261962891, "global_step": 158117, "epoch": 3764} {"train_loss": -6.882650375366211, "global_step": 158118, "epoch": 3764} {"train_loss": -6.990819931030273, "global_step": 158119, "epoch": 3764} {"train_loss": -6.8584794998168945, "global_step": 158120, "epoch": 3764} {"train_loss": -6.98453426361084, "global_step": 158121, "epoch": 3764} {"train_loss": -7.015235424041748, "global_step": 158122, "epoch": 3764} {"train_loss": -7.020895481109619, "global_step": 158123, "epoch": 3764} {"train_loss": -6.956085205078125, "global_step": 158124, "epoch": 3764} {"train_loss": -6.9322309494018555, "global_step": 158125, "epoch": 3764} {"train_loss": -6.937876224517822, "global_step": 158126, "epoch": 3764} {"train_loss": -6.899692058563232, "global_step": 158127, "epoch": 3764} {"train_loss": -6.928199768066406, "global_step": 158128, "epoch": 3764} {"train_loss": -6.880987485249837, "global_step": 158129, "epoch": 3764, "val_loss": 68380.953125} {"train_loss": -7.0022873878479, "global_step": 158130, "epoch": 3765} {"train_loss": -6.892510414123535, "global_step": 158131, "epoch": 3765} {"train_loss": -6.905821323394775, "global_step": 158132, "epoch": 3765} {"train_loss": -6.956126689910889, "global_step": 158133, "epoch": 3765} {"train_loss": -7.012663841247559, "global_step": 158134, "epoch": 3765} {"train_loss": -6.891261577606201, "global_step": 158135, "epoch": 3765} {"train_loss": -6.972169399261475, "global_step": 158136, "epoch": 3765} {"train_loss": -6.85288143157959, "global_step": 158137, "epoch": 3765} {"train_loss": -6.872260570526123, "global_step": 158138, "epoch": 3765} {"train_loss": -6.927179336547852, "global_step": 158139, "epoch": 3765} {"train_loss": -6.78621768951416, "global_step": 158140, "epoch": 3765} {"train_loss": -6.7470479011535645, "global_step": 158141, "epoch": 3765} {"train_loss": -7.015497207641602, "global_step": 158142, "epoch": 3765} {"train_loss": -6.982395172119141, "global_step": 158143, "epoch": 3765} {"train_loss": -6.9226484298706055, "global_step": 158144, "epoch": 3765} {"train_loss": -6.942755699157715, "global_step": 158145, "epoch": 3765} {"train_loss": -6.820047378540039, "global_step": 158146, "epoch": 3765} {"train_loss": -6.994816780090332, "global_step": 158147, "epoch": 3765} {"train_loss": -6.963628768920898, "global_step": 158148, "epoch": 3765} {"train_loss": -6.972450256347656, "global_step": 158149, "epoch": 3765} {"train_loss": -6.959819793701172, "global_step": 158150, "epoch": 3765} {"train_loss": -6.986444473266602, "global_step": 158151, "epoch": 3765} {"train_loss": -6.980869293212891, "global_step": 158152, "epoch": 3765} {"train_loss": -6.97391414642334, "global_step": 158153, "epoch": 3765} {"train_loss": -6.939121246337891, "global_step": 158154, "epoch": 3765} {"train_loss": -6.941312789916992, "global_step": 158155, "epoch": 3765} {"train_loss": -6.747803211212158, "global_step": 158156, "epoch": 3765} {"train_loss": -7.0638628005981445, "global_step": 158157, "epoch": 3765} {"train_loss": -6.925790786743164, "global_step": 158158, "epoch": 3765} {"train_loss": -6.903985500335693, "global_step": 158159, "epoch": 3765} {"train_loss": -6.922945976257324, "global_step": 158160, "epoch": 3765} {"train_loss": -6.91132926940918, "global_step": 158161, "epoch": 3765} {"train_loss": -7.006166458129883, "global_step": 158162, "epoch": 3765} {"train_loss": -7.0084075927734375, "global_step": 158163, "epoch": 3765} {"train_loss": -6.960944175720215, "global_step": 158164, "epoch": 3765} {"train_loss": -6.951136589050293, "global_step": 158165, "epoch": 3765} {"train_loss": -6.895738124847412, "global_step": 158166, "epoch": 3765} {"train_loss": -6.932244777679443, "global_step": 158167, "epoch": 3765} {"train_loss": -6.924661636352539, "global_step": 158168, "epoch": 3765} {"train_loss": -7.009913921356201, "global_step": 158169, "epoch": 3765} {"train_loss": -6.866053581237793, "global_step": 158170, "epoch": 3765} {"train_loss": -6.9337832019442605, "global_step": 158171, "epoch": 3765, "val_loss": 68317.96875} {"train_loss": -7.0086989402771, "global_step": 158172, "epoch": 3766} {"train_loss": -6.974900245666504, "global_step": 158173, "epoch": 3766} {"train_loss": -7.017997741699219, "global_step": 158174, "epoch": 3766} {"train_loss": -6.9673614501953125, "global_step": 158175, "epoch": 3766} {"train_loss": -6.994388580322266, "global_step": 158176, "epoch": 3766} {"train_loss": -6.943638801574707, "global_step": 158177, "epoch": 3766} {"train_loss": -7.054177284240723, "global_step": 158178, "epoch": 3766} {"train_loss": -6.927641868591309, "global_step": 158179, "epoch": 3766} {"train_loss": -7.040947437286377, "global_step": 158180, "epoch": 3766} {"train_loss": -6.941371917724609, "global_step": 158181, "epoch": 3766} {"train_loss": -7.040888786315918, "global_step": 158182, "epoch": 3766} {"train_loss": -6.872631072998047, "global_step": 158183, "epoch": 3766} {"train_loss": -6.946795463562012, "global_step": 158184, "epoch": 3766} {"train_loss": -6.988161563873291, "global_step": 158185, "epoch": 3766} {"train_loss": -7.0315632820129395, "global_step": 158186, "epoch": 3766} {"train_loss": -7.003530502319336, "global_step": 158187, "epoch": 3766} {"train_loss": -7.009848594665527, "global_step": 158188, "epoch": 3766} {"train_loss": -6.945773124694824, "global_step": 158189, "epoch": 3766} {"train_loss": -6.949230670928955, "global_step": 158190, "epoch": 3766} {"train_loss": -6.898983001708984, "global_step": 158191, "epoch": 3766} {"train_loss": -6.94368314743042, "global_step": 158192, "epoch": 3766} {"train_loss": -6.951689720153809, "global_step": 158193, "epoch": 3766} {"train_loss": -6.884228229522705, "global_step": 158194, "epoch": 3766} {"train_loss": -7.072635650634766, "global_step": 158195, "epoch": 3766} {"train_loss": -6.953310012817383, "global_step": 158196, "epoch": 3766} {"train_loss": -6.970746040344238, "global_step": 158197, "epoch": 3766} {"train_loss": -6.877389907836914, "global_step": 158198, "epoch": 3766} {"train_loss": -6.987186431884766, "global_step": 158199, "epoch": 3766} {"train_loss": -7.034512519836426, "global_step": 158200, "epoch": 3766} {"train_loss": -6.912722587585449, "global_step": 158201, "epoch": 3766} {"train_loss": -6.856767654418945, "global_step": 158202, "epoch": 3766} {"train_loss": -6.9179582595825195, "global_step": 158203, "epoch": 3766} {"train_loss": -6.860128402709961, "global_step": 158204, "epoch": 3766} {"train_loss": -6.835760116577148, "global_step": 158205, "epoch": 3766} {"train_loss": -6.945104598999023, "global_step": 158206, "epoch": 3766} {"train_loss": -6.63907527923584, "global_step": 158207, "epoch": 3766} {"train_loss": -6.865689277648926, "global_step": 158208, "epoch": 3766} {"train_loss": -6.603806495666504, "global_step": 158209, "epoch": 3766} {"train_loss": -6.773141384124756, "global_step": 158210, "epoch": 3766} {"train_loss": -6.830508232116699, "global_step": 158211, "epoch": 3766} {"train_loss": -6.729201316833496, "global_step": 158212, "epoch": 3766} {"train_loss": -6.9215619677589055, "global_step": 158213, "epoch": 3766, "val_loss": 68765.4765625} {"train_loss": -6.8274383544921875, "global_step": 158214, "epoch": 3767} {"train_loss": -6.5417070388793945, "global_step": 158215, "epoch": 3767} {"train_loss": -6.848991394042969, "global_step": 158216, "epoch": 3767} {"train_loss": -6.745427131652832, "global_step": 158217, "epoch": 3767} {"train_loss": -6.8323774337768555, "global_step": 158218, "epoch": 3767} {"train_loss": -6.6856489181518555, "global_step": 158219, "epoch": 3767} {"train_loss": -6.725220203399658, "global_step": 158220, "epoch": 3767} {"train_loss": -6.771366596221924, "global_step": 158221, "epoch": 3767} {"train_loss": -6.727348327636719, "global_step": 158222, "epoch": 3767} {"train_loss": -6.858897686004639, "global_step": 158223, "epoch": 3767} {"train_loss": -6.9477667808532715, "global_step": 158224, "epoch": 3767} {"train_loss": -6.896571636199951, "global_step": 158225, "epoch": 3767} {"train_loss": -6.738799095153809, "global_step": 158226, "epoch": 3767} {"train_loss": -6.916680812835693, "global_step": 158227, "epoch": 3767} {"train_loss": -6.919462203979492, "global_step": 158228, "epoch": 3767} {"train_loss": -6.967526435852051, "global_step": 158229, "epoch": 3767} {"train_loss": -6.885561466217041, "global_step": 158230, "epoch": 3767} {"train_loss": -6.837639808654785, "global_step": 158231, "epoch": 3767} {"train_loss": -6.864407062530518, "global_step": 158232, "epoch": 3767} {"train_loss": -6.965485572814941, "global_step": 158233, "epoch": 3767} {"train_loss": -6.833525657653809, "global_step": 158234, "epoch": 3767} {"train_loss": -6.96585750579834, "global_step": 158235, "epoch": 3767} {"train_loss": -6.758220195770264, "global_step": 158236, "epoch": 3767} {"train_loss": -6.894513130187988, "global_step": 158237, "epoch": 3767} {"train_loss": -6.880027770996094, "global_step": 158238, "epoch": 3767} {"train_loss": -6.885626316070557, "global_step": 158239, "epoch": 3767} {"train_loss": -7.015499114990234, "global_step": 158240, "epoch": 3767} {"train_loss": -6.722640514373779, "global_step": 158241, "epoch": 3767} {"train_loss": -6.91885232925415, "global_step": 158242, "epoch": 3767} {"train_loss": -6.966157913208008, "global_step": 158243, "epoch": 3767} {"train_loss": -6.811945915222168, "global_step": 158244, "epoch": 3767} {"train_loss": -6.938483715057373, "global_step": 158245, "epoch": 3767} {"train_loss": -6.8956379890441895, "global_step": 158246, "epoch": 3767} {"train_loss": -6.905454635620117, "global_step": 158247, "epoch": 3767} {"train_loss": -6.9619340896606445, "global_step": 158248, "epoch": 3767} {"train_loss": -6.774234771728516, "global_step": 158249, "epoch": 3767} {"train_loss": -6.803999900817871, "global_step": 158250, "epoch": 3767} {"train_loss": -6.8592329025268555, "global_step": 158251, "epoch": 3767} {"train_loss": -6.912243843078613, "global_step": 158252, "epoch": 3767} {"train_loss": -6.978233814239502, "global_step": 158253, "epoch": 3767} {"train_loss": -6.971586227416992, "global_step": 158254, "epoch": 3767} {"train_loss": -6.860315697533744, "global_step": 158255, "epoch": 3767, "val_loss": 68356.0078125} {"train_loss": -6.960454940795898, "global_step": 158256, "epoch": 3768} {"train_loss": -6.916467666625977, "global_step": 158257, "epoch": 3768} {"train_loss": -7.0088043212890625, "global_step": 158258, "epoch": 3768} {"train_loss": -6.925711631774902, "global_step": 158259, "epoch": 3768} {"train_loss": -6.933149337768555, "global_step": 158260, "epoch": 3768} {"train_loss": -6.983772277832031, "global_step": 158261, "epoch": 3768} {"train_loss": -7.013079643249512, "global_step": 158262, "epoch": 3768} {"train_loss": -6.98024845123291, "global_step": 158263, "epoch": 3768} {"train_loss": -7.067832946777344, "global_step": 158264, "epoch": 3768} {"train_loss": -7.117557525634766, "global_step": 158265, "epoch": 3768} {"train_loss": -6.9285736083984375, "global_step": 158266, "epoch": 3768} {"train_loss": -6.987898826599121, "global_step": 158267, "epoch": 3768} {"train_loss": -7.019057750701904, "global_step": 158268, "epoch": 3768} {"train_loss": -7.133355140686035, "global_step": 158269, "epoch": 3768} {"train_loss": -7.083260536193848, "global_step": 158270, "epoch": 3768} {"train_loss": -7.104609966278076, "global_step": 158271, "epoch": 3768} {"train_loss": -6.95000696182251, "global_step": 158272, "epoch": 3768} {"train_loss": -6.844873428344727, "global_step": 158273, "epoch": 3768} {"train_loss": -6.856122016906738, "global_step": 158274, "epoch": 3768} {"train_loss": -7.040699005126953, "global_step": 158275, "epoch": 3768} {"train_loss": -7.063446044921875, "global_step": 158276, "epoch": 3768} {"train_loss": -6.8683180809021, "global_step": 158277, "epoch": 3768} {"train_loss": -6.980739593505859, "global_step": 158278, "epoch": 3768} {"train_loss": -6.926397800445557, "global_step": 158279, "epoch": 3768} {"train_loss": -7.015763282775879, "global_step": 158280, "epoch": 3768} {"train_loss": -6.853946685791016, "global_step": 158281, "epoch": 3768} {"train_loss": -6.941768646240234, "global_step": 158282, "epoch": 3768} {"train_loss": -6.776975631713867, "global_step": 158283, "epoch": 3768} {"train_loss": -6.973153591156006, "global_step": 158284, "epoch": 3768} {"train_loss": -6.990782737731934, "global_step": 158285, "epoch": 3768} {"train_loss": -6.751630783081055, "global_step": 158286, "epoch": 3768} {"train_loss": -6.95333194732666, "global_step": 158287, "epoch": 3768} {"train_loss": -6.893177032470703, "global_step": 158288, "epoch": 3768} {"train_loss": -6.9469828605651855, "global_step": 158289, "epoch": 3768} {"train_loss": -6.919820785522461, "global_step": 158290, "epoch": 3768} {"train_loss": -7.062314033508301, "global_step": 158291, "epoch": 3768} {"train_loss": -7.030762672424316, "global_step": 158292, "epoch": 3768} {"train_loss": -7.057003974914551, "global_step": 158293, "epoch": 3768} {"train_loss": -6.912091255187988, "global_step": 158294, "epoch": 3768} {"train_loss": -6.883853912353516, "global_step": 158295, "epoch": 3768} {"train_loss": -6.879917621612549, "global_step": 158296, "epoch": 3768} {"train_loss": -6.9619697616213845, "global_step": 158297, "epoch": 3768, "val_loss": 68691.9609375} {"train_loss": -6.86865758895874, "global_step": 158298, "epoch": 3769} {"train_loss": -6.910134315490723, "global_step": 158299, "epoch": 3769} {"train_loss": -6.726102352142334, "global_step": 158300, "epoch": 3769} {"train_loss": -6.934564590454102, "global_step": 158301, "epoch": 3769} {"train_loss": -6.7425994873046875, "global_step": 158302, "epoch": 3769} {"train_loss": -7.006051063537598, "global_step": 158303, "epoch": 3769} {"train_loss": -6.985518455505371, "global_step": 158304, "epoch": 3769} {"train_loss": -6.965395927429199, "global_step": 158305, "epoch": 3769} {"train_loss": -6.994437217712402, "global_step": 158306, "epoch": 3769} {"train_loss": -7.041149139404297, "global_step": 158307, "epoch": 3769} {"train_loss": -6.870392799377441, "global_step": 158308, "epoch": 3769} {"train_loss": -6.844460487365723, "global_step": 158309, "epoch": 3769} {"train_loss": -6.939111232757568, "global_step": 158310, "epoch": 3769} {"train_loss": -7.0084686279296875, "global_step": 158311, "epoch": 3769} {"train_loss": -7.023538112640381, "global_step": 158312, "epoch": 3769} {"train_loss": -7.034323215484619, "global_step": 158313, "epoch": 3769} {"train_loss": -6.924304962158203, "global_step": 158314, "epoch": 3769} {"train_loss": -6.915772438049316, "global_step": 158315, "epoch": 3769} {"train_loss": -6.912752151489258, "global_step": 158316, "epoch": 3769} {"train_loss": -6.915919780731201, "global_step": 158317, "epoch": 3769} {"train_loss": -6.857915878295898, "global_step": 158318, "epoch": 3769} {"train_loss": -7.006377696990967, "global_step": 158319, "epoch": 3769} {"train_loss": -6.872159481048584, "global_step": 158320, "epoch": 3769} {"train_loss": -7.002810478210449, "global_step": 158321, "epoch": 3769} {"train_loss": -6.884915828704834, "global_step": 158322, "epoch": 3769} {"train_loss": -6.89475154876709, "global_step": 158323, "epoch": 3769} {"train_loss": -7.048109531402588, "global_step": 158324, "epoch": 3769} {"train_loss": -6.958315849304199, "global_step": 158325, "epoch": 3769} {"train_loss": -6.923238277435303, "global_step": 158326, "epoch": 3769} {"train_loss": -6.96114444732666, "global_step": 158327, "epoch": 3769} {"train_loss": -6.946750640869141, "global_step": 158328, "epoch": 3769} {"train_loss": -7.026535987854004, "global_step": 158329, "epoch": 3769} {"train_loss": -6.965505599975586, "global_step": 158330, "epoch": 3769} {"train_loss": -6.960285663604736, "global_step": 158331, "epoch": 3769} {"train_loss": -6.991631507873535, "global_step": 158332, "epoch": 3769} {"train_loss": -6.98557186126709, "global_step": 158333, "epoch": 3769} {"train_loss": -7.083653926849365, "global_step": 158334, "epoch": 3769} {"train_loss": -7.038011074066162, "global_step": 158335, "epoch": 3769} {"train_loss": -6.992911338806152, "global_step": 158336, "epoch": 3769} {"train_loss": -7.042058944702148, "global_step": 158337, "epoch": 3769} {"train_loss": -6.888705253601074, "global_step": 158338, "epoch": 3769} {"train_loss": -6.949293681553432, "global_step": 158339, "epoch": 3769, "val_loss": 68467.9375} {"train_loss": -6.978241920471191, "global_step": 158340, "epoch": 3770} {"train_loss": -7.05126953125, "global_step": 158341, "epoch": 3770} {"train_loss": -7.044764518737793, "global_step": 158342, "epoch": 3770} {"train_loss": -6.914342880249023, "global_step": 158343, "epoch": 3770} {"train_loss": -6.893606662750244, "global_step": 158344, "epoch": 3770} {"train_loss": -6.931882381439209, "global_step": 158345, "epoch": 3770} {"train_loss": -6.928832530975342, "global_step": 158346, "epoch": 3770} {"train_loss": -6.903618812561035, "global_step": 158347, "epoch": 3770} {"train_loss": -6.880403995513916, "global_step": 158348, "epoch": 3770} {"train_loss": -6.91622257232666, "global_step": 158349, "epoch": 3770} {"train_loss": -6.846875190734863, "global_step": 158350, "epoch": 3770} {"train_loss": -6.961521148681641, "global_step": 158351, "epoch": 3770} {"train_loss": -6.866634368896484, "global_step": 158352, "epoch": 3770} {"train_loss": -6.887172698974609, "global_step": 158353, "epoch": 3770} {"train_loss": -6.934117794036865, "global_step": 158354, "epoch": 3770} {"train_loss": -6.973045825958252, "global_step": 158355, "epoch": 3770} {"train_loss": -6.962954998016357, "global_step": 158356, "epoch": 3770} {"train_loss": -7.0719757080078125, "global_step": 158357, "epoch": 3770} {"train_loss": -6.971858978271484, "global_step": 158358, "epoch": 3770} {"train_loss": -6.923277378082275, "global_step": 158359, "epoch": 3770} {"train_loss": -6.929152488708496, "global_step": 158360, "epoch": 3770} {"train_loss": -7.0332255363464355, "global_step": 158361, "epoch": 3770} {"train_loss": -7.002610206604004, "global_step": 158362, "epoch": 3770} {"train_loss": -6.998021125793457, "global_step": 158363, "epoch": 3770} {"train_loss": -7.033221244812012, "global_step": 158364, "epoch": 3770} {"train_loss": -6.947591304779053, "global_step": 158365, "epoch": 3770} {"train_loss": -6.914287567138672, "global_step": 158366, "epoch": 3770} {"train_loss": -6.787635803222656, "global_step": 158367, "epoch": 3770} {"train_loss": -6.823966979980469, "global_step": 158368, "epoch": 3770} {"train_loss": -6.94773530960083, "global_step": 158369, "epoch": 3770} {"train_loss": -7.010912895202637, "global_step": 158370, "epoch": 3770} {"train_loss": -6.9266204833984375, "global_step": 158371, "epoch": 3770} {"train_loss": -6.786797523498535, "global_step": 158372, "epoch": 3770} {"train_loss": -6.957907199859619, "global_step": 158373, "epoch": 3770} {"train_loss": -6.946998119354248, "global_step": 158374, "epoch": 3770} {"train_loss": -7.016676902770996, "global_step": 158375, "epoch": 3770} {"train_loss": -6.817377090454102, "global_step": 158376, "epoch": 3770} {"train_loss": -6.940573215484619, "global_step": 158377, "epoch": 3770} {"train_loss": -6.862687110900879, "global_step": 158378, "epoch": 3770} {"train_loss": -6.846284866333008, "global_step": 158379, "epoch": 3770} {"train_loss": -6.888116836547852, "global_step": 158380, "epoch": 3770} {"train_loss": -6.9319223789941695, "global_step": 158381, "epoch": 3770, "val_loss": 68494.734375} {"train_loss": -6.865116119384766, "global_step": 158382, "epoch": 3771} {"train_loss": -6.899901390075684, "global_step": 158383, "epoch": 3771} {"train_loss": -6.729404449462891, "global_step": 158384, "epoch": 3771} {"train_loss": -6.87899112701416, "global_step": 158385, "epoch": 3771} {"train_loss": -6.85920524597168, "global_step": 158386, "epoch": 3771} {"train_loss": -6.9008893966674805, "global_step": 158387, "epoch": 3771} {"train_loss": -6.795240879058838, "global_step": 158388, "epoch": 3771} {"train_loss": -6.8610358238220215, "global_step": 158389, "epoch": 3771} {"train_loss": -6.844305038452148, "global_step": 158390, "epoch": 3771} {"train_loss": -6.796485900878906, "global_step": 158391, "epoch": 3771} {"train_loss": -6.976657390594482, "global_step": 158392, "epoch": 3771} {"train_loss": -6.820641040802002, "global_step": 158393, "epoch": 3771} {"train_loss": -6.88300895690918, "global_step": 158394, "epoch": 3771} {"train_loss": -6.908527374267578, "global_step": 158395, "epoch": 3771} {"train_loss": -6.857203960418701, "global_step": 158396, "epoch": 3771} {"train_loss": -6.93916654586792, "global_step": 158397, "epoch": 3771} {"train_loss": -6.958065986633301, "global_step": 158398, "epoch": 3771} {"train_loss": -7.004415512084961, "global_step": 158399, "epoch": 3771} {"train_loss": -7.001106262207031, "global_step": 158400, "epoch": 3771} {"train_loss": -6.894617080688477, "global_step": 158401, "epoch": 3771} {"train_loss": -6.939138412475586, "global_step": 158402, "epoch": 3771} {"train_loss": -7.071959495544434, "global_step": 158403, "epoch": 3771} {"train_loss": -6.94170618057251, "global_step": 158404, "epoch": 3771} {"train_loss": -6.983785629272461, "global_step": 158405, "epoch": 3771} {"train_loss": -7.036823272705078, "global_step": 158406, "epoch": 3771} {"train_loss": -6.952610969543457, "global_step": 158407, "epoch": 3771} {"train_loss": -7.057616233825684, "global_step": 158408, "epoch": 3771} {"train_loss": -7.038774490356445, "global_step": 158409, "epoch": 3771} {"train_loss": -7.003819465637207, "global_step": 158410, "epoch": 3771} {"train_loss": -7.034432888031006, "global_step": 158411, "epoch": 3771} {"train_loss": -6.977644443511963, "global_step": 158412, "epoch": 3771} {"train_loss": -6.961370944976807, "global_step": 158413, "epoch": 3771} {"train_loss": -6.944262504577637, "global_step": 158414, "epoch": 3771} {"train_loss": -6.991131782531738, "global_step": 158415, "epoch": 3771} {"train_loss": -6.860887050628662, "global_step": 158416, "epoch": 3771} {"train_loss": -6.954127788543701, "global_step": 158417, "epoch": 3771} {"train_loss": -6.94188117980957, "global_step": 158418, "epoch": 3771} {"train_loss": -6.928355693817139, "global_step": 158419, "epoch": 3771} {"train_loss": -6.975983142852783, "global_step": 158420, "epoch": 3771} {"train_loss": -6.875897407531738, "global_step": 158421, "epoch": 3771} {"train_loss": -7.056914329528809, "global_step": 158422, "epoch": 3771} {"train_loss": -6.9328269844963435, "global_step": 158423, "epoch": 3771, "val_loss": 68396.6015625} {"train_loss": -6.968546390533447, "global_step": 158424, "epoch": 3772} {"train_loss": -7.060864448547363, "global_step": 158425, "epoch": 3772} {"train_loss": -6.920532703399658, "global_step": 158426, "epoch": 3772} {"train_loss": -6.908910751342773, "global_step": 158427, "epoch": 3772} {"train_loss": -6.941308975219727, "global_step": 158428, "epoch": 3772} {"train_loss": -6.940996170043945, "global_step": 158429, "epoch": 3772} {"train_loss": -6.954381465911865, "global_step": 158430, "epoch": 3772} {"train_loss": -6.885368347167969, "global_step": 158431, "epoch": 3772} {"train_loss": -6.898846626281738, "global_step": 158432, "epoch": 3772} {"train_loss": -6.926819801330566, "global_step": 158433, "epoch": 3772} {"train_loss": -6.919846534729004, "global_step": 158434, "epoch": 3772} {"train_loss": -6.942724227905273, "global_step": 158435, "epoch": 3772} {"train_loss": -6.965854644775391, "global_step": 158436, "epoch": 3772} {"train_loss": -6.909858226776123, "global_step": 158437, "epoch": 3772} {"train_loss": -6.955565452575684, "global_step": 158438, "epoch": 3772} {"train_loss": -7.007687568664551, "global_step": 158439, "epoch": 3772} {"train_loss": -6.996901512145996, "global_step": 158440, "epoch": 3772} {"train_loss": -6.940511703491211, "global_step": 158441, "epoch": 3772} {"train_loss": -6.908694267272949, "global_step": 158442, "epoch": 3772} {"train_loss": -6.931761741638184, "global_step": 158443, "epoch": 3772} {"train_loss": -7.086174011230469, "global_step": 158444, "epoch": 3772} {"train_loss": -6.964922904968262, "global_step": 158445, "epoch": 3772} {"train_loss": -6.949459552764893, "global_step": 158446, "epoch": 3772} {"train_loss": -7.045032501220703, "global_step": 158447, "epoch": 3772} {"train_loss": -7.032573223114014, "global_step": 158448, "epoch": 3772} {"train_loss": -6.834144115447998, "global_step": 158449, "epoch": 3772} {"train_loss": -6.907037734985352, "global_step": 158450, "epoch": 3772} {"train_loss": -6.928172588348389, "global_step": 158451, "epoch": 3772} {"train_loss": -6.8501434326171875, "global_step": 158452, "epoch": 3772} {"train_loss": -6.8960676193237305, "global_step": 158453, "epoch": 3772} {"train_loss": -6.983419418334961, "global_step": 158454, "epoch": 3772} {"train_loss": -6.936913013458252, "global_step": 158455, "epoch": 3772} {"train_loss": -6.9208269119262695, "global_step": 158456, "epoch": 3772} {"train_loss": -6.852044105529785, "global_step": 158457, "epoch": 3772} {"train_loss": -6.812618732452393, "global_step": 158458, "epoch": 3772} {"train_loss": -6.972173690795898, "global_step": 158459, "epoch": 3772} {"train_loss": -6.961698055267334, "global_step": 158460, "epoch": 3772} {"train_loss": -7.001404762268066, "global_step": 158461, "epoch": 3772} {"train_loss": -6.790104866027832, "global_step": 158462, "epoch": 3772} {"train_loss": -6.97730016708374, "global_step": 158463, "epoch": 3772} {"train_loss": -6.991786479949951, "global_step": 158464, "epoch": 3772} {"train_loss": -6.941366683869135, "global_step": 158465, "epoch": 3772, "val_loss": 68793.140625} {"train_loss": -6.89537239074707, "global_step": 158466, "epoch": 3773} {"train_loss": -7.011346340179443, "global_step": 158467, "epoch": 3773} {"train_loss": -6.938231945037842, "global_step": 158468, "epoch": 3773} {"train_loss": -6.970035552978516, "global_step": 158469, "epoch": 3773} {"train_loss": -6.955913543701172, "global_step": 158470, "epoch": 3773} {"train_loss": -6.9277167320251465, "global_step": 158471, "epoch": 3773} {"train_loss": -7.0301618576049805, "global_step": 158472, "epoch": 3773} {"train_loss": -7.136834144592285, "global_step": 158473, "epoch": 3773} {"train_loss": -6.983524322509766, "global_step": 158474, "epoch": 3773} {"train_loss": -6.9318695068359375, "global_step": 158475, "epoch": 3773} {"train_loss": -7.006497859954834, "global_step": 158476, "epoch": 3773} {"train_loss": -6.880049228668213, "global_step": 158477, "epoch": 3773} {"train_loss": -6.9741973876953125, "global_step": 158478, "epoch": 3773} {"train_loss": -7.020938873291016, "global_step": 158479, "epoch": 3773} {"train_loss": -6.972696304321289, "global_step": 158480, "epoch": 3773} {"train_loss": -6.9225616455078125, "global_step": 158481, "epoch": 3773} {"train_loss": -6.914105415344238, "global_step": 158482, "epoch": 3773} {"train_loss": -6.9770708084106445, "global_step": 158483, "epoch": 3773} {"train_loss": -6.884766578674316, "global_step": 158484, "epoch": 3773} {"train_loss": -6.829907417297363, "global_step": 158485, "epoch": 3773} {"train_loss": -7.046093940734863, "global_step": 158486, "epoch": 3773} {"train_loss": -6.937561511993408, "global_step": 158487, "epoch": 3773} {"train_loss": -6.838052272796631, "global_step": 158488, "epoch": 3773} {"train_loss": -6.816364288330078, "global_step": 158489, "epoch": 3773} {"train_loss": -6.97043514251709, "global_step": 158490, "epoch": 3773} {"train_loss": -6.870367527008057, "global_step": 158491, "epoch": 3773} {"train_loss": -6.891656398773193, "global_step": 158492, "epoch": 3773} {"train_loss": -6.823145866394043, "global_step": 158493, "epoch": 3773} {"train_loss": -6.751041412353516, "global_step": 158494, "epoch": 3773} {"train_loss": -6.816238880157471, "global_step": 158495, "epoch": 3773} {"train_loss": -6.873141288757324, "global_step": 158496, "epoch": 3773} {"train_loss": -6.72140645980835, "global_step": 158497, "epoch": 3773} {"train_loss": -6.871245861053467, "global_step": 158498, "epoch": 3773} {"train_loss": -6.745965003967285, "global_step": 158499, "epoch": 3773} {"train_loss": -6.730706214904785, "global_step": 158500, "epoch": 3773} {"train_loss": -6.799612045288086, "global_step": 158501, "epoch": 3773} {"train_loss": -6.722867965698242, "global_step": 158502, "epoch": 3773} {"train_loss": -6.816135406494141, "global_step": 158503, "epoch": 3773} {"train_loss": -6.640016078948975, "global_step": 158504, "epoch": 3773} {"train_loss": -6.975117206573486, "global_step": 158505, "epoch": 3773} {"train_loss": -6.809822082519531, "global_step": 158506, "epoch": 3773} {"train_loss": -6.890938997268677, "global_step": 158507, "epoch": 3773, "val_loss": 68611.3515625} {"train_loss": -6.903663158416748, "global_step": 158508, "epoch": 3774} {"train_loss": -6.78887939453125, "global_step": 158509, "epoch": 3774} {"train_loss": -6.893887042999268, "global_step": 158510, "epoch": 3774} {"train_loss": -6.759324073791504, "global_step": 158511, "epoch": 3774} {"train_loss": -6.7998247146606445, "global_step": 158512, "epoch": 3774} {"train_loss": -6.836435317993164, "global_step": 158513, "epoch": 3774} {"train_loss": -6.63454532623291, "global_step": 158514, "epoch": 3774} {"train_loss": -6.866888523101807, "global_step": 158515, "epoch": 3774} {"train_loss": -6.760719299316406, "global_step": 158516, "epoch": 3774} {"train_loss": -6.875005722045898, "global_step": 158517, "epoch": 3774} {"train_loss": -6.819129943847656, "global_step": 158518, "epoch": 3774} {"train_loss": -6.802219867706299, "global_step": 158519, "epoch": 3774} {"train_loss": -6.884968280792236, "global_step": 158520, "epoch": 3774} {"train_loss": -6.8617024421691895, "global_step": 158521, "epoch": 3774} {"train_loss": -6.863955020904541, "global_step": 158522, "epoch": 3774} {"train_loss": -6.961645126342773, "global_step": 158523, "epoch": 3774} {"train_loss": -6.912384510040283, "global_step": 158524, "epoch": 3774} {"train_loss": -6.951656341552734, "global_step": 158525, "epoch": 3774} {"train_loss": -7.0236053466796875, "global_step": 158526, "epoch": 3774} {"train_loss": -6.891629219055176, "global_step": 158527, "epoch": 3774} {"train_loss": -6.906783103942871, "global_step": 158528, "epoch": 3774} {"train_loss": -6.902809143066406, "global_step": 158529, "epoch": 3774} {"train_loss": -6.826830863952637, "global_step": 158530, "epoch": 3774} {"train_loss": -6.947627067565918, "global_step": 158531, "epoch": 3774} {"train_loss": -7.067783355712891, "global_step": 158532, "epoch": 3774} {"train_loss": -6.844416618347168, "global_step": 158533, "epoch": 3774} {"train_loss": -7.096840858459473, "global_step": 158534, "epoch": 3774} {"train_loss": -7.028027534484863, "global_step": 158535, "epoch": 3774} {"train_loss": -7.093945026397705, "global_step": 158536, "epoch": 3774} {"train_loss": -6.955895900726318, "global_step": 158537, "epoch": 3774} {"train_loss": -6.912360191345215, "global_step": 158538, "epoch": 3774} {"train_loss": -6.955855846405029, "global_step": 158539, "epoch": 3774} {"train_loss": -7.018211841583252, "global_step": 158540, "epoch": 3774} {"train_loss": -7.004209041595459, "global_step": 158541, "epoch": 3774} {"train_loss": -6.894149303436279, "global_step": 158542, "epoch": 3774} {"train_loss": -6.935898303985596, "global_step": 158543, "epoch": 3774} {"train_loss": -6.983213424682617, "global_step": 158544, "epoch": 3774} {"train_loss": -6.909811019897461, "global_step": 158545, "epoch": 3774} {"train_loss": -6.956573486328125, "global_step": 158546, "epoch": 3774} {"train_loss": -6.979617118835449, "global_step": 158547, "epoch": 3774} {"train_loss": -7.01910924911499, "global_step": 158548, "epoch": 3774} {"train_loss": -6.9103797390347435, "global_step": 158549, "epoch": 3774, "val_loss": 68575.0625} {"train_loss": -7.014936923980713, "global_step": 158550, "epoch": 3775} {"train_loss": -7.07828950881958, "global_step": 158551, "epoch": 3775} {"train_loss": -7.03234338760376, "global_step": 158552, "epoch": 3775} {"train_loss": -7.020094871520996, "global_step": 158553, "epoch": 3775} {"train_loss": -7.0966877937316895, "global_step": 158554, "epoch": 3775} {"train_loss": -7.095543384552002, "global_step": 158555, "epoch": 3775} {"train_loss": -6.964918613433838, "global_step": 158556, "epoch": 3775} {"train_loss": -7.025943756103516, "global_step": 158557, "epoch": 3775} {"train_loss": -6.950074195861816, "global_step": 158558, "epoch": 3775} {"train_loss": -6.954442977905273, "global_step": 158559, "epoch": 3775} {"train_loss": -7.090945243835449, "global_step": 158560, "epoch": 3775} {"train_loss": -6.95939302444458, "global_step": 158561, "epoch": 3775} {"train_loss": -7.034543037414551, "global_step": 158562, "epoch": 3775} {"train_loss": -7.004414081573486, "global_step": 158563, "epoch": 3775} {"train_loss": -6.847362041473389, "global_step": 158564, "epoch": 3775} {"train_loss": -6.912808895111084, "global_step": 158565, "epoch": 3775} {"train_loss": -6.995358467102051, "global_step": 158566, "epoch": 3775} {"train_loss": -6.883157730102539, "global_step": 158567, "epoch": 3775} {"train_loss": -6.954333782196045, "global_step": 158568, "epoch": 3775} {"train_loss": -7.0021867752075195, "global_step": 158569, "epoch": 3775} {"train_loss": -6.8736066818237305, "global_step": 158570, "epoch": 3775} {"train_loss": -6.908165454864502, "global_step": 158571, "epoch": 3775} {"train_loss": -7.059251308441162, "global_step": 158572, "epoch": 3775} {"train_loss": -6.913854122161865, "global_step": 158573, "epoch": 3775} {"train_loss": -6.906278610229492, "global_step": 158574, "epoch": 3775} {"train_loss": -7.041444778442383, "global_step": 158575, "epoch": 3775} {"train_loss": -6.939266681671143, "global_step": 158576, "epoch": 3775} {"train_loss": -6.942139625549316, "global_step": 158577, "epoch": 3775} {"train_loss": -6.973589897155762, "global_step": 158578, "epoch": 3775} {"train_loss": -7.022313117980957, "global_step": 158579, "epoch": 3775} {"train_loss": -6.882926940917969, "global_step": 158580, "epoch": 3775} {"train_loss": -7.025831699371338, "global_step": 158581, "epoch": 3775} {"train_loss": -6.999319076538086, "global_step": 158582, "epoch": 3775} {"train_loss": -6.964398384094238, "global_step": 158583, "epoch": 3775} {"train_loss": -6.89877462387085, "global_step": 158584, "epoch": 3775} {"train_loss": -6.965510845184326, "global_step": 158585, "epoch": 3775} {"train_loss": -6.9673943519592285, "global_step": 158586, "epoch": 3775} {"train_loss": -6.9779582023620605, "global_step": 158587, "epoch": 3775} {"train_loss": -6.827765464782715, "global_step": 158588, "epoch": 3775} {"train_loss": -6.933470249176025, "global_step": 158589, "epoch": 3775} {"train_loss": -6.782388687133789, "global_step": 158590, "epoch": 3775} {"train_loss": -6.963327623548961, "global_step": 158591, "epoch": 3775, "val_loss": 68344.5859375} {"train_loss": -7.0832014083862305, "global_step": 158592, "epoch": 3776} {"train_loss": -6.961036682128906, "global_step": 158593, "epoch": 3776} {"train_loss": -6.9600830078125, "global_step": 158594, "epoch": 3776} {"train_loss": -6.936583518981934, "global_step": 158595, "epoch": 3776} {"train_loss": -6.861842155456543, "global_step": 158596, "epoch": 3776} {"train_loss": -7.005424499511719, "global_step": 158597, "epoch": 3776} {"train_loss": -6.924763202667236, "global_step": 158598, "epoch": 3776} {"train_loss": -6.971314907073975, "global_step": 158599, "epoch": 3776} {"train_loss": -6.792246341705322, "global_step": 158600, "epoch": 3776} {"train_loss": -6.972341060638428, "global_step": 158601, "epoch": 3776} {"train_loss": -6.856442928314209, "global_step": 158602, "epoch": 3776} {"train_loss": -6.963470458984375, "global_step": 158603, "epoch": 3776} {"train_loss": -6.880682468414307, "global_step": 158604, "epoch": 3776} {"train_loss": -6.793170928955078, "global_step": 158605, "epoch": 3776} {"train_loss": -6.781960487365723, "global_step": 158606, "epoch": 3776} {"train_loss": -6.848306655883789, "global_step": 158607, "epoch": 3776} {"train_loss": -6.872813701629639, "global_step": 158608, "epoch": 3776} {"train_loss": -6.8374738693237305, "global_step": 158609, "epoch": 3776} {"train_loss": -6.839900970458984, "global_step": 158610, "epoch": 3776} {"train_loss": -6.926620960235596, "global_step": 158611, "epoch": 3776} {"train_loss": -6.756447792053223, "global_step": 158612, "epoch": 3776} {"train_loss": -6.853333950042725, "global_step": 158613, "epoch": 3776} {"train_loss": -6.826381683349609, "global_step": 158614, "epoch": 3776} {"train_loss": -6.729612350463867, "global_step": 158615, "epoch": 3776} {"train_loss": -6.975171089172363, "global_step": 158616, "epoch": 3776} {"train_loss": -6.866977214813232, "global_step": 158617, "epoch": 3776} {"train_loss": -6.930292129516602, "global_step": 158618, "epoch": 3776} {"train_loss": -6.895142078399658, "global_step": 158619, "epoch": 3776} {"train_loss": -6.92768669128418, "global_step": 158620, "epoch": 3776} {"train_loss": -6.932263374328613, "global_step": 158621, "epoch": 3776} {"train_loss": -6.909733772277832, "global_step": 158622, "epoch": 3776} {"train_loss": -6.90433931350708, "global_step": 158623, "epoch": 3776} {"train_loss": -6.9269304275512695, "global_step": 158624, "epoch": 3776} {"train_loss": -6.85400390625, "global_step": 158625, "epoch": 3776} {"train_loss": -6.980712413787842, "global_step": 158626, "epoch": 3776} {"train_loss": -6.985169410705566, "global_step": 158627, "epoch": 3776} {"train_loss": -6.951911926269531, "global_step": 158628, "epoch": 3776} {"train_loss": -6.901000022888184, "global_step": 158629, "epoch": 3776} {"train_loss": -6.895358562469482, "global_step": 158630, "epoch": 3776} {"train_loss": -6.79817533493042, "global_step": 158631, "epoch": 3776} {"train_loss": -6.920414924621582, "global_step": 158632, "epoch": 3776} {"train_loss": -6.895038661502657, "global_step": 158633, "epoch": 3776, "val_loss": 68571.53125} {"train_loss": -6.681085109710693, "global_step": 158634, "epoch": 3777} {"train_loss": -6.816272258758545, "global_step": 158635, "epoch": 3777} {"train_loss": -6.848293304443359, "global_step": 158636, "epoch": 3777} {"train_loss": -6.757637023925781, "global_step": 158637, "epoch": 3777} {"train_loss": -6.926284313201904, "global_step": 158638, "epoch": 3777} {"train_loss": -6.800595760345459, "global_step": 158639, "epoch": 3777} {"train_loss": -6.871108531951904, "global_step": 158640, "epoch": 3777} {"train_loss": -6.752601623535156, "global_step": 158641, "epoch": 3777} {"train_loss": -6.819788932800293, "global_step": 158642, "epoch": 3777} {"train_loss": -6.898723125457764, "global_step": 158643, "epoch": 3777} {"train_loss": -6.866339683532715, "global_step": 158644, "epoch": 3777} {"train_loss": -6.808505058288574, "global_step": 158645, "epoch": 3777} {"train_loss": -6.8855061531066895, "global_step": 158646, "epoch": 3777} {"train_loss": -6.801461219787598, "global_step": 158647, "epoch": 3777} {"train_loss": -6.861708641052246, "global_step": 158648, "epoch": 3777} {"train_loss": -6.86046028137207, "global_step": 158649, "epoch": 3777} {"train_loss": -6.832056999206543, "global_step": 158650, "epoch": 3777} {"train_loss": -6.874581813812256, "global_step": 158651, "epoch": 3777} {"train_loss": -6.808228492736816, "global_step": 158652, "epoch": 3777} {"train_loss": -6.940347671508789, "global_step": 158653, "epoch": 3777} {"train_loss": -6.889097690582275, "global_step": 158654, "epoch": 3777} {"train_loss": -6.903453826904297, "global_step": 158655, "epoch": 3777} {"train_loss": -6.940998077392578, "global_step": 158656, "epoch": 3777} {"train_loss": -6.873124122619629, "global_step": 158657, "epoch": 3777} {"train_loss": -6.853891372680664, "global_step": 158658, "epoch": 3777} {"train_loss": -6.851531028747559, "global_step": 158659, "epoch": 3777} {"train_loss": -6.907107353210449, "global_step": 158660, "epoch": 3777} {"train_loss": -6.849587440490723, "global_step": 158661, "epoch": 3777} {"train_loss": -6.838719367980957, "global_step": 158662, "epoch": 3777} {"train_loss": -6.968340873718262, "global_step": 158663, "epoch": 3777} {"train_loss": -7.028092384338379, "global_step": 158664, "epoch": 3777} {"train_loss": -6.867319583892822, "global_step": 158665, "epoch": 3777} {"train_loss": -6.927748680114746, "global_step": 158666, "epoch": 3777} {"train_loss": -6.978893756866455, "global_step": 158667, "epoch": 3777} {"train_loss": -6.955161094665527, "global_step": 158668, "epoch": 3777} {"train_loss": -6.850833892822266, "global_step": 158669, "epoch": 3777} {"train_loss": -6.885425090789795, "global_step": 158670, "epoch": 3777} {"train_loss": -6.918566703796387, "global_step": 158671, "epoch": 3777} {"train_loss": -7.085894584655762, "global_step": 158672, "epoch": 3777} {"train_loss": -6.947995185852051, "global_step": 158673, "epoch": 3777} {"train_loss": -6.941803932189941, "global_step": 158674, "epoch": 3777} {"train_loss": -6.8776710941678, "global_step": 158675, "epoch": 3777, "val_loss": 68512.078125} {"train_loss": -6.925168991088867, "global_step": 158676, "epoch": 3778} {"train_loss": -6.858909606933594, "global_step": 158677, "epoch": 3778} {"train_loss": -6.885525226593018, "global_step": 158678, "epoch": 3778} {"train_loss": -6.970712661743164, "global_step": 158679, "epoch": 3778} {"train_loss": -6.845436096191406, "global_step": 158680, "epoch": 3778} {"train_loss": -6.886551856994629, "global_step": 158681, "epoch": 3778} {"train_loss": -6.910651683807373, "global_step": 158682, "epoch": 3778} {"train_loss": -6.876811981201172, "global_step": 158683, "epoch": 3778} {"train_loss": -6.944847106933594, "global_step": 158684, "epoch": 3778} {"train_loss": -6.977880001068115, "global_step": 158685, "epoch": 3778} {"train_loss": -7.070391654968262, "global_step": 158686, "epoch": 3778} {"train_loss": -6.8953857421875, "global_step": 158687, "epoch": 3778} {"train_loss": -6.994728088378906, "global_step": 158688, "epoch": 3778} {"train_loss": -7.051086902618408, "global_step": 158689, "epoch": 3778} {"train_loss": -6.882371425628662, "global_step": 158690, "epoch": 3778} {"train_loss": -7.046576023101807, "global_step": 158691, "epoch": 3778} {"train_loss": -6.872870445251465, "global_step": 158692, "epoch": 3778} {"train_loss": -7.049319267272949, "global_step": 158693, "epoch": 3778} {"train_loss": -7.104194164276123, "global_step": 158694, "epoch": 3778} {"train_loss": -6.968600273132324, "global_step": 158695, "epoch": 3778} {"train_loss": -6.997533798217773, "global_step": 158696, "epoch": 3778} {"train_loss": -6.922743320465088, "global_step": 158697, "epoch": 3778} {"train_loss": -6.985728740692139, "global_step": 158698, "epoch": 3778} {"train_loss": -6.929140090942383, "global_step": 158699, "epoch": 3778} {"train_loss": -7.026715278625488, "global_step": 158700, "epoch": 3778} {"train_loss": -6.983560562133789, "global_step": 158701, "epoch": 3778} {"train_loss": -7.048728942871094, "global_step": 158702, "epoch": 3778} {"train_loss": -6.970816135406494, "global_step": 158703, "epoch": 3778} {"train_loss": -7.066586494445801, "global_step": 158704, "epoch": 3778} {"train_loss": -7.008652687072754, "global_step": 158705, "epoch": 3778} {"train_loss": -6.946364402770996, "global_step": 158706, "epoch": 3778} {"train_loss": -6.893779754638672, "global_step": 158707, "epoch": 3778} {"train_loss": -6.992676734924316, "global_step": 158708, "epoch": 3778} {"train_loss": -6.974305152893066, "global_step": 158709, "epoch": 3778} {"train_loss": -7.0475358963012695, "global_step": 158710, "epoch": 3778} {"train_loss": -7.072997093200684, "global_step": 158711, "epoch": 3778} {"train_loss": -7.0524702072143555, "global_step": 158712, "epoch": 3778} {"train_loss": -6.9346771240234375, "global_step": 158713, "epoch": 3778} {"train_loss": -7.051136016845703, "global_step": 158714, "epoch": 3778} {"train_loss": -6.886685371398926, "global_step": 158715, "epoch": 3778} {"train_loss": -6.864741325378418, "global_step": 158716, "epoch": 3778} {"train_loss": -6.967175358817691, "global_step": 158717, "epoch": 3778, "val_loss": 68557.265625} {"train_loss": -6.9930009841918945, "global_step": 158718, "epoch": 3779} {"train_loss": -6.904670715332031, "global_step": 158719, "epoch": 3779} {"train_loss": -6.980040550231934, "global_step": 158720, "epoch": 3779} {"train_loss": -6.965353965759277, "global_step": 158721, "epoch": 3779} {"train_loss": -6.9441423416137695, "global_step": 158722, "epoch": 3779} {"train_loss": -6.895512580871582, "global_step": 158723, "epoch": 3779} {"train_loss": -6.9829607009887695, "global_step": 158724, "epoch": 3779} {"train_loss": -7.027082443237305, "global_step": 158725, "epoch": 3779} {"train_loss": -6.896745204925537, "global_step": 158726, "epoch": 3779} {"train_loss": -6.896931171417236, "global_step": 158727, "epoch": 3779} {"train_loss": -6.9083380699157715, "global_step": 158728, "epoch": 3779} {"train_loss": -6.978339195251465, "global_step": 158729, "epoch": 3779} {"train_loss": -6.952839374542236, "global_step": 158730, "epoch": 3779} {"train_loss": -6.934840202331543, "global_step": 158731, "epoch": 3779} {"train_loss": -6.855134963989258, "global_step": 158732, "epoch": 3779} {"train_loss": -6.808423042297363, "global_step": 158733, "epoch": 3779} {"train_loss": -6.913677215576172, "global_step": 158734, "epoch": 3779} {"train_loss": -6.729826927185059, "global_step": 158735, "epoch": 3779} {"train_loss": -6.865817070007324, "global_step": 158736, "epoch": 3779} {"train_loss": -6.933021545410156, "global_step": 158737, "epoch": 3779} {"train_loss": -6.758063316345215, "global_step": 158738, "epoch": 3779} {"train_loss": -6.89786434173584, "global_step": 158739, "epoch": 3779} {"train_loss": -6.945855140686035, "global_step": 158740, "epoch": 3779} {"train_loss": -6.772764682769775, "global_step": 158741, "epoch": 3779} {"train_loss": -6.940373420715332, "global_step": 158742, "epoch": 3779} {"train_loss": -6.857561111450195, "global_step": 158743, "epoch": 3779} {"train_loss": -6.800589561462402, "global_step": 158744, "epoch": 3779} {"train_loss": -6.86769962310791, "global_step": 158745, "epoch": 3779} {"train_loss": -6.935998916625977, "global_step": 158746, "epoch": 3779} {"train_loss": -6.948264122009277, "global_step": 158747, "epoch": 3779} {"train_loss": -6.8643927574157715, "global_step": 158748, "epoch": 3779} {"train_loss": -6.870486259460449, "global_step": 158749, "epoch": 3779} {"train_loss": -6.954338550567627, "global_step": 158750, "epoch": 3779} {"train_loss": -6.928748607635498, "global_step": 158751, "epoch": 3779} {"train_loss": -7.005841255187988, "global_step": 158752, "epoch": 3779} {"train_loss": -6.802116870880127, "global_step": 158753, "epoch": 3779} {"train_loss": -7.02398681640625, "global_step": 158754, "epoch": 3779} {"train_loss": -6.962308406829834, "global_step": 158755, "epoch": 3779} {"train_loss": -7.075233459472656, "global_step": 158756, "epoch": 3779} {"train_loss": -6.884746551513672, "global_step": 158757, "epoch": 3779} {"train_loss": -7.030765533447266, "global_step": 158758, "epoch": 3779} {"train_loss": -6.912029266357422, "global_step": 158759, "epoch": 3779, "val_loss": 68462.234375} {"train_loss": -7.027421474456787, "global_step": 158760, "epoch": 3780} {"train_loss": -6.9831647872924805, "global_step": 158761, "epoch": 3780} {"train_loss": -7.003871440887451, "global_step": 158762, "epoch": 3780} {"train_loss": -6.916356086730957, "global_step": 158763, "epoch": 3780} {"train_loss": -6.90712833404541, "global_step": 158764, "epoch": 3780} {"train_loss": -6.982608795166016, "global_step": 158765, "epoch": 3780} {"train_loss": -7.062158107757568, "global_step": 158766, "epoch": 3780} {"train_loss": -6.894963264465332, "global_step": 158767, "epoch": 3780} {"train_loss": -6.957076072692871, "global_step": 158768, "epoch": 3780} {"train_loss": -7.0690388679504395, "global_step": 158769, "epoch": 3780} {"train_loss": -7.023102760314941, "global_step": 158770, "epoch": 3780} {"train_loss": -6.986780166625977, "global_step": 158771, "epoch": 3780} {"train_loss": -7.008443832397461, "global_step": 158772, "epoch": 3780} {"train_loss": -6.939149856567383, "global_step": 158773, "epoch": 3780} {"train_loss": -6.947633743286133, "global_step": 158774, "epoch": 3780} {"train_loss": -7.121655464172363, "global_step": 158775, "epoch": 3780} {"train_loss": -6.8235015869140625, "global_step": 158776, "epoch": 3780} {"train_loss": -6.951809883117676, "global_step": 158777, "epoch": 3780} {"train_loss": -6.974691867828369, "global_step": 158778, "epoch": 3780} {"train_loss": -6.9464311599731445, "global_step": 158779, "epoch": 3780} {"train_loss": -6.928317070007324, "global_step": 158780, "epoch": 3780} {"train_loss": -6.986705303192139, "global_step": 158781, "epoch": 3780} {"train_loss": -6.939599514007568, "global_step": 158782, "epoch": 3780} {"train_loss": -6.959753036499023, "global_step": 158783, "epoch": 3780} {"train_loss": -6.858383655548096, "global_step": 158784, "epoch": 3780} {"train_loss": -6.958357810974121, "global_step": 158785, "epoch": 3780} {"train_loss": -6.947137832641602, "global_step": 158786, "epoch": 3780} {"train_loss": -7.059686660766602, "global_step": 158787, "epoch": 3780} {"train_loss": -7.051595687866211, "global_step": 158788, "epoch": 3780} {"train_loss": -6.97498893737793, "global_step": 158789, "epoch": 3780} {"train_loss": -6.965415954589844, "global_step": 158790, "epoch": 3780} {"train_loss": -6.958510398864746, "global_step": 158791, "epoch": 3780} {"train_loss": -6.874283790588379, "global_step": 158792, "epoch": 3780} {"train_loss": -6.91768217086792, "global_step": 158793, "epoch": 3780} {"train_loss": -7.053554534912109, "global_step": 158794, "epoch": 3780} {"train_loss": -7.035888671875, "global_step": 158795, "epoch": 3780} {"train_loss": -6.9855451583862305, "global_step": 158796, "epoch": 3780} {"train_loss": -6.906907081604004, "global_step": 158797, "epoch": 3780} {"train_loss": -7.08776330947876, "global_step": 158798, "epoch": 3780} {"train_loss": -7.014171600341797, "global_step": 158799, "epoch": 3780} {"train_loss": -7.012475490570068, "global_step": 158800, "epoch": 3780} {"train_loss": -6.977000338690622, "global_step": 158801, "epoch": 3780, "val_loss": 68623.890625} {"train_loss": -6.987015247344971, "global_step": 158802, "epoch": 3781} {"train_loss": -7.0235595703125, "global_step": 158803, "epoch": 3781} {"train_loss": -7.083710670471191, "global_step": 158804, "epoch": 3781} {"train_loss": -6.935269355773926, "global_step": 158805, "epoch": 3781} {"train_loss": -6.992076873779297, "global_step": 158806, "epoch": 3781} {"train_loss": -7.027785301208496, "global_step": 158807, "epoch": 3781} {"train_loss": -7.038287162780762, "global_step": 158808, "epoch": 3781} {"train_loss": -6.807399749755859, "global_step": 158809, "epoch": 3781} {"train_loss": -7.010763168334961, "global_step": 158810, "epoch": 3781} {"train_loss": -6.987831115722656, "global_step": 158811, "epoch": 3781} {"train_loss": -6.9310760498046875, "global_step": 158812, "epoch": 3781} {"train_loss": -6.998885154724121, "global_step": 158813, "epoch": 3781} {"train_loss": -7.082175254821777, "global_step": 158814, "epoch": 3781} {"train_loss": -6.8845295906066895, "global_step": 158815, "epoch": 3781} {"train_loss": -6.8975324630737305, "global_step": 158816, "epoch": 3781} {"train_loss": -6.96196174621582, "global_step": 158817, "epoch": 3781} {"train_loss": -7.006843090057373, "global_step": 158818, "epoch": 3781} {"train_loss": -6.974909782409668, "global_step": 158819, "epoch": 3781} {"train_loss": -6.953188896179199, "global_step": 158820, "epoch": 3781} {"train_loss": -6.980385780334473, "global_step": 158821, "epoch": 3781} {"train_loss": -6.967410087585449, "global_step": 158822, "epoch": 3781} {"train_loss": -7.00045108795166, "global_step": 158823, "epoch": 3781} {"train_loss": -6.935335159301758, "global_step": 158824, "epoch": 3781} {"train_loss": -6.877347946166992, "global_step": 158825, "epoch": 3781} {"train_loss": -6.825292587280273, "global_step": 158826, "epoch": 3781} {"train_loss": -6.916538715362549, "global_step": 158827, "epoch": 3781} {"train_loss": -6.861956596374512, "global_step": 158828, "epoch": 3781} {"train_loss": -6.831234931945801, "global_step": 158829, "epoch": 3781} {"train_loss": -6.884169578552246, "global_step": 158830, "epoch": 3781} {"train_loss": -6.91013240814209, "global_step": 158831, "epoch": 3781} {"train_loss": -6.901220321655273, "global_step": 158832, "epoch": 3781} {"train_loss": -6.869999885559082, "global_step": 158833, "epoch": 3781} {"train_loss": -6.800248146057129, "global_step": 158834, "epoch": 3781} {"train_loss": -6.861327171325684, "global_step": 158835, "epoch": 3781} {"train_loss": -6.864996910095215, "global_step": 158836, "epoch": 3781} {"train_loss": -6.733380317687988, "global_step": 158837, "epoch": 3781} {"train_loss": -6.8226094245910645, "global_step": 158838, "epoch": 3781} {"train_loss": -6.906795501708984, "global_step": 158839, "epoch": 3781} {"train_loss": -6.704483985900879, "global_step": 158840, "epoch": 3781} {"train_loss": -6.966933250427246, "global_step": 158841, "epoch": 3781} {"train_loss": -6.876221656799316, "global_step": 158842, "epoch": 3781} {"train_loss": -6.919138874326434, "global_step": 158843, "epoch": 3781, "val_loss": 68692.8046875} {"train_loss": -6.80488395690918, "global_step": 158844, "epoch": 3782} {"train_loss": -6.871306896209717, "global_step": 158845, "epoch": 3782} {"train_loss": -6.755093574523926, "global_step": 158846, "epoch": 3782} {"train_loss": -6.891359329223633, "global_step": 158847, "epoch": 3782} {"train_loss": -6.857657432556152, "global_step": 158848, "epoch": 3782} {"train_loss": -6.856743812561035, "global_step": 158849, "epoch": 3782} {"train_loss": -6.898000240325928, "global_step": 158850, "epoch": 3782} {"train_loss": -6.842209339141846, "global_step": 158851, "epoch": 3782} {"train_loss": -6.881670951843262, "global_step": 158852, "epoch": 3782} {"train_loss": -6.7498779296875, "global_step": 158853, "epoch": 3782} {"train_loss": -6.934849739074707, "global_step": 158854, "epoch": 3782} {"train_loss": -6.834892272949219, "global_step": 158855, "epoch": 3782} {"train_loss": -6.889951705932617, "global_step": 158856, "epoch": 3782} {"train_loss": -6.933939456939697, "global_step": 158857, "epoch": 3782} {"train_loss": -6.886971473693848, "global_step": 158858, "epoch": 3782} {"train_loss": -6.848714828491211, "global_step": 158859, "epoch": 3782} {"train_loss": -6.8219170570373535, "global_step": 158860, "epoch": 3782} {"train_loss": -6.8127360343933105, "global_step": 158861, "epoch": 3782} {"train_loss": -6.888937950134277, "global_step": 158862, "epoch": 3782} {"train_loss": -6.848446846008301, "global_step": 158863, "epoch": 3782} {"train_loss": -6.800377368927002, "global_step": 158864, "epoch": 3782} {"train_loss": -6.79802942276001, "global_step": 158865, "epoch": 3782} {"train_loss": -6.9255266189575195, "global_step": 158866, "epoch": 3782} {"train_loss": -6.869564533233643, "global_step": 158867, "epoch": 3782} {"train_loss": -6.904455184936523, "global_step": 158868, "epoch": 3782} {"train_loss": -6.843268394470215, "global_step": 158869, "epoch": 3782} {"train_loss": -6.844006538391113, "global_step": 158870, "epoch": 3782} {"train_loss": -6.805086135864258, "global_step": 158871, "epoch": 3782} {"train_loss": -6.9005303382873535, "global_step": 158872, "epoch": 3782} {"train_loss": -6.9695143699646, "global_step": 158873, "epoch": 3782} {"train_loss": -6.850301742553711, "global_step": 158874, "epoch": 3782} {"train_loss": -6.9452433586120605, "global_step": 158875, "epoch": 3782} {"train_loss": -6.83144474029541, "global_step": 158876, "epoch": 3782} {"train_loss": -6.865070819854736, "global_step": 158877, "epoch": 3782} {"train_loss": -6.990453720092773, "global_step": 158878, "epoch": 3782} {"train_loss": -6.835234642028809, "global_step": 158879, "epoch": 3782} {"train_loss": -6.928177356719971, "global_step": 158880, "epoch": 3782} {"train_loss": -6.818820953369141, "global_step": 158881, "epoch": 3782} {"train_loss": -6.9446306228637695, "global_step": 158882, "epoch": 3782} {"train_loss": -6.892770767211914, "global_step": 158883, "epoch": 3782} {"train_loss": -6.949272155761719, "global_step": 158884, "epoch": 3782} {"train_loss": -6.870739187513079, "global_step": 158885, "epoch": 3782, "val_loss": 68345.828125} {"train_loss": -6.97363805770874, "global_step": 158886, "epoch": 3783} {"train_loss": -6.879798889160156, "global_step": 158887, "epoch": 3783} {"train_loss": -6.992402076721191, "global_step": 158888, "epoch": 3783} {"train_loss": -7.003170013427734, "global_step": 158889, "epoch": 3783} {"train_loss": -6.964919567108154, "global_step": 158890, "epoch": 3783} {"train_loss": -7.091097354888916, "global_step": 158891, "epoch": 3783} {"train_loss": -6.900111198425293, "global_step": 158892, "epoch": 3783} {"train_loss": -6.932183265686035, "global_step": 158893, "epoch": 3783} {"train_loss": -7.066155433654785, "global_step": 158894, "epoch": 3783} {"train_loss": -6.946715354919434, "global_step": 158895, "epoch": 3783} {"train_loss": -7.1292243003845215, "global_step": 158896, "epoch": 3783} {"train_loss": -6.957616806030273, "global_step": 158897, "epoch": 3783} {"train_loss": -7.051185607910156, "global_step": 158898, "epoch": 3783} {"train_loss": -6.990392684936523, "global_step": 158899, "epoch": 3783} {"train_loss": -6.968299865722656, "global_step": 158900, "epoch": 3783} {"train_loss": -7.000412464141846, "global_step": 158901, "epoch": 3783} {"train_loss": -6.887764930725098, "global_step": 158902, "epoch": 3783} {"train_loss": -6.98516845703125, "global_step": 158903, "epoch": 3783} {"train_loss": -7.03987979888916, "global_step": 158904, "epoch": 3783} {"train_loss": -6.902910232543945, "global_step": 158905, "epoch": 3783} {"train_loss": -7.0270280838012695, "global_step": 158906, "epoch": 3783} {"train_loss": -6.881300926208496, "global_step": 158907, "epoch": 3783} {"train_loss": -6.902256488800049, "global_step": 158908, "epoch": 3783} {"train_loss": -7.000609874725342, "global_step": 158909, "epoch": 3783} {"train_loss": -6.836612701416016, "global_step": 158910, "epoch": 3783} {"train_loss": -6.997143268585205, "global_step": 158911, "epoch": 3783} {"train_loss": -6.962583065032959, "global_step": 158912, "epoch": 3783} {"train_loss": -7.026785850524902, "global_step": 158913, "epoch": 3783} {"train_loss": -7.013693809509277, "global_step": 158914, "epoch": 3783} {"train_loss": -7.011288166046143, "global_step": 158915, "epoch": 3783} {"train_loss": -6.98242712020874, "global_step": 158916, "epoch": 3783} {"train_loss": -6.966385841369629, "global_step": 158917, "epoch": 3783} {"train_loss": -6.976082801818848, "global_step": 158918, "epoch": 3783} {"train_loss": -6.93817138671875, "global_step": 158919, "epoch": 3783} {"train_loss": -6.9626617431640625, "global_step": 158920, "epoch": 3783} {"train_loss": -6.955793857574463, "global_step": 158921, "epoch": 3783} {"train_loss": -6.977273941040039, "global_step": 158922, "epoch": 3783} {"train_loss": -6.965892791748047, "global_step": 158923, "epoch": 3783} {"train_loss": -6.98997163772583, "global_step": 158924, "epoch": 3783} {"train_loss": -7.079896926879883, "global_step": 158925, "epoch": 3783} {"train_loss": -7.001091957092285, "global_step": 158926, "epoch": 3783} {"train_loss": -6.9769914377303355, "global_step": 158927, "epoch": 3783, "val_loss": 68619.859375} {"train_loss": -6.936470985412598, "global_step": 158928, "epoch": 3784} {"train_loss": -7.087241172790527, "global_step": 158929, "epoch": 3784} {"train_loss": -6.9359540939331055, "global_step": 158930, "epoch": 3784} {"train_loss": -6.979584693908691, "global_step": 158931, "epoch": 3784} {"train_loss": -6.928830146789551, "global_step": 158932, "epoch": 3784} {"train_loss": -6.970954895019531, "global_step": 158933, "epoch": 3784} {"train_loss": -6.895142078399658, "global_step": 158934, "epoch": 3784} {"train_loss": -6.978018760681152, "global_step": 158935, "epoch": 3784} {"train_loss": -6.863432884216309, "global_step": 158936, "epoch": 3784} {"train_loss": -6.901325225830078, "global_step": 158937, "epoch": 3784} {"train_loss": -6.9369096755981445, "global_step": 158938, "epoch": 3784} {"train_loss": -6.888537406921387, "global_step": 158939, "epoch": 3784} {"train_loss": -7.005290985107422, "global_step": 158940, "epoch": 3784} {"train_loss": -7.141786575317383, "global_step": 158941, "epoch": 3784} {"train_loss": -6.929116249084473, "global_step": 158942, "epoch": 3784} {"train_loss": -6.992188453674316, "global_step": 158943, "epoch": 3784} {"train_loss": -6.986681938171387, "global_step": 158944, "epoch": 3784} {"train_loss": -6.861382484436035, "global_step": 158945, "epoch": 3784} {"train_loss": -6.914393424987793, "global_step": 158946, "epoch": 3784} {"train_loss": -6.925989151000977, "global_step": 158947, "epoch": 3784} {"train_loss": -6.952757358551025, "global_step": 158948, "epoch": 3784} {"train_loss": -6.882716178894043, "global_step": 158949, "epoch": 3784} {"train_loss": -6.915743827819824, "global_step": 158950, "epoch": 3784} {"train_loss": -6.970755577087402, "global_step": 158951, "epoch": 3784} {"train_loss": -6.913641929626465, "global_step": 158952, "epoch": 3784} {"train_loss": -6.865777015686035, "global_step": 158953, "epoch": 3784} {"train_loss": -6.944159507751465, "global_step": 158954, "epoch": 3784} {"train_loss": -6.858482360839844, "global_step": 158955, "epoch": 3784} {"train_loss": -6.96492862701416, "global_step": 158956, "epoch": 3784} {"train_loss": -7.080995559692383, "global_step": 158957, "epoch": 3784} {"train_loss": -6.940180778503418, "global_step": 158958, "epoch": 3784} {"train_loss": -7.137452125549316, "global_step": 158959, "epoch": 3784} {"train_loss": -6.991666316986084, "global_step": 158960, "epoch": 3784} {"train_loss": -7.004112243652344, "global_step": 158961, "epoch": 3784} {"train_loss": -7.022928237915039, "global_step": 158962, "epoch": 3784} {"train_loss": -6.886234283447266, "global_step": 158963, "epoch": 3784} {"train_loss": -6.8821539878845215, "global_step": 158964, "epoch": 3784} {"train_loss": -6.887603282928467, "global_step": 158965, "epoch": 3784} {"train_loss": -6.925701141357422, "global_step": 158966, "epoch": 3784} {"train_loss": -6.89072322845459, "global_step": 158967, "epoch": 3784} {"train_loss": -6.93507719039917, "global_step": 158968, "epoch": 3784} {"train_loss": -6.9478590829031805, "global_step": 158969, "epoch": 3784, "val_loss": 68383.078125} {"train_loss": -6.916058540344238, "global_step": 158970, "epoch": 3785} {"train_loss": -6.989481449127197, "global_step": 158971, "epoch": 3785} {"train_loss": -6.930477619171143, "global_step": 158972, "epoch": 3785} {"train_loss": -6.839010238647461, "global_step": 158973, "epoch": 3785} {"train_loss": -7.016167640686035, "global_step": 158974, "epoch": 3785} {"train_loss": -6.951159477233887, "global_step": 158975, "epoch": 3785} {"train_loss": -6.908177375793457, "global_step": 158976, "epoch": 3785} {"train_loss": -6.829119682312012, "global_step": 158977, "epoch": 3785} {"train_loss": -6.968664169311523, "global_step": 158978, "epoch": 3785} {"train_loss": -6.912770748138428, "global_step": 158979, "epoch": 3785} {"train_loss": -6.915677070617676, "global_step": 158980, "epoch": 3785} {"train_loss": -7.007220268249512, "global_step": 158981, "epoch": 3785} {"train_loss": -6.992774963378906, "global_step": 158982, "epoch": 3785} {"train_loss": -6.992962837219238, "global_step": 158983, "epoch": 3785} {"train_loss": -6.981374263763428, "global_step": 158984, "epoch": 3785} {"train_loss": -6.80374002456665, "global_step": 158985, "epoch": 3785} {"train_loss": -6.839644432067871, "global_step": 158986, "epoch": 3785} {"train_loss": -6.990352630615234, "global_step": 158987, "epoch": 3785} {"train_loss": -6.934194087982178, "global_step": 158988, "epoch": 3785} {"train_loss": -6.904707908630371, "global_step": 158989, "epoch": 3785} {"train_loss": -7.013215065002441, "global_step": 158990, "epoch": 3785} {"train_loss": -6.891071319580078, "global_step": 158991, "epoch": 3785} {"train_loss": -6.899518013000488, "global_step": 158992, "epoch": 3785} {"train_loss": -6.839328765869141, "global_step": 158993, "epoch": 3785} {"train_loss": -6.951571941375732, "global_step": 158994, "epoch": 3785} {"train_loss": -6.83448600769043, "global_step": 158995, "epoch": 3785} {"train_loss": -6.987822532653809, "global_step": 158996, "epoch": 3785} {"train_loss": -6.987151145935059, "global_step": 158997, "epoch": 3785} {"train_loss": -6.947171211242676, "global_step": 158998, "epoch": 3785} {"train_loss": -6.96372127532959, "global_step": 158999, "epoch": 3785} {"train_loss": -6.882530212402344, "global_step": 159000, "epoch": 3785} {"train_loss": -6.831964492797852, "global_step": 159001, "epoch": 3785} {"train_loss": -7.026307106018066, "global_step": 159002, "epoch": 3785} {"train_loss": -6.963955402374268, "global_step": 159003, "epoch": 3785} {"train_loss": -6.907041072845459, "global_step": 159004, "epoch": 3785} {"train_loss": -6.935082912445068, "global_step": 159005, "epoch": 3785} {"train_loss": -6.887591361999512, "global_step": 159006, "epoch": 3785} {"train_loss": -6.9749250411987305, "global_step": 159007, "epoch": 3785} {"train_loss": -6.911435127258301, "global_step": 159008, "epoch": 3785} {"train_loss": -6.834486484527588, "global_step": 159009, "epoch": 3785} {"train_loss": -6.846030235290527, "global_step": 159010, "epoch": 3785} {"train_loss": -6.924510808218093, "global_step": 159011, "epoch": 3785, "val_loss": 68509.0546875} {"train_loss": -7.0194268226623535, "global_step": 159012, "epoch": 3786} {"train_loss": -6.843770980834961, "global_step": 159013, "epoch": 3786} {"train_loss": -6.719779014587402, "global_step": 159014, "epoch": 3786} {"train_loss": -6.963307857513428, "global_step": 159015, "epoch": 3786} {"train_loss": -6.793961048126221, "global_step": 159016, "epoch": 3786} {"train_loss": -6.966917037963867, "global_step": 159017, "epoch": 3786} {"train_loss": -6.869124412536621, "global_step": 159018, "epoch": 3786} {"train_loss": -6.874912261962891, "global_step": 159019, "epoch": 3786} {"train_loss": -6.766691207885742, "global_step": 159020, "epoch": 3786} {"train_loss": -6.928859710693359, "global_step": 159021, "epoch": 3786} {"train_loss": -6.894707679748535, "global_step": 159022, "epoch": 3786} {"train_loss": -7.028731346130371, "global_step": 159023, "epoch": 3786} {"train_loss": -6.924627304077148, "global_step": 159024, "epoch": 3786} {"train_loss": -6.925506591796875, "global_step": 159025, "epoch": 3786} {"train_loss": -6.891556739807129, "global_step": 159026, "epoch": 3786} {"train_loss": -6.941798210144043, "global_step": 159027, "epoch": 3786} {"train_loss": -6.8913893699646, "global_step": 159028, "epoch": 3786} {"train_loss": -7.069990158081055, "global_step": 159029, "epoch": 3786} {"train_loss": -6.83768892288208, "global_step": 159030, "epoch": 3786} {"train_loss": -6.966785907745361, "global_step": 159031, "epoch": 3786} {"train_loss": -6.974070072174072, "global_step": 159032, "epoch": 3786} {"train_loss": -6.965505123138428, "global_step": 159033, "epoch": 3786} {"train_loss": -6.980951309204102, "global_step": 159034, "epoch": 3786} {"train_loss": -6.983635425567627, "global_step": 159035, "epoch": 3786} {"train_loss": -6.952137470245361, "global_step": 159036, "epoch": 3786} {"train_loss": -6.94533634185791, "global_step": 159037, "epoch": 3786} {"train_loss": -6.9498491287231445, "global_step": 159038, "epoch": 3786} {"train_loss": -6.895356178283691, "global_step": 159039, "epoch": 3786} {"train_loss": -6.955101013183594, "global_step": 159040, "epoch": 3786} {"train_loss": -6.996129512786865, "global_step": 159041, "epoch": 3786} {"train_loss": -7.079612731933594, "global_step": 159042, "epoch": 3786} {"train_loss": -6.887538909912109, "global_step": 159043, "epoch": 3786} {"train_loss": -6.96700382232666, "global_step": 159044, "epoch": 3786} {"train_loss": -6.904829978942871, "global_step": 159045, "epoch": 3786} {"train_loss": -6.860763072967529, "global_step": 159046, "epoch": 3786} {"train_loss": -6.8386077880859375, "global_step": 159047, "epoch": 3786} {"train_loss": -6.92915153503418, "global_step": 159048, "epoch": 3786} {"train_loss": -6.986171722412109, "global_step": 159049, "epoch": 3786} {"train_loss": -7.045551776885986, "global_step": 159050, "epoch": 3786} {"train_loss": -6.925676345825195, "global_step": 159051, "epoch": 3786} {"train_loss": -6.962541580200195, "global_step": 159052, "epoch": 3786} {"train_loss": -6.931278467178345, "global_step": 159053, "epoch": 3786, "val_loss": 68293.71875} {"train_loss": -7.053732872009277, "global_step": 159054, "epoch": 3787} {"train_loss": -6.991449356079102, "global_step": 159055, "epoch": 3787} {"train_loss": -6.930022239685059, "global_step": 159056, "epoch": 3787} {"train_loss": -6.902911186218262, "global_step": 159057, "epoch": 3787} {"train_loss": -7.022216796875, "global_step": 159058, "epoch": 3787} {"train_loss": -7.037968635559082, "global_step": 159059, "epoch": 3787} {"train_loss": -7.036546230316162, "global_step": 159060, "epoch": 3787} {"train_loss": -6.983019828796387, "global_step": 159061, "epoch": 3787} {"train_loss": -7.010012626647949, "global_step": 159062, "epoch": 3787} {"train_loss": -7.020752429962158, "global_step": 159063, "epoch": 3787} {"train_loss": -7.0025634765625, "global_step": 159064, "epoch": 3787} {"train_loss": -7.0783796310424805, "global_step": 159065, "epoch": 3787} {"train_loss": -7.069491386413574, "global_step": 159066, "epoch": 3787} {"train_loss": -6.960530757904053, "global_step": 159067, "epoch": 3787} {"train_loss": -6.975706577301025, "global_step": 159068, "epoch": 3787} {"train_loss": -6.925135135650635, "global_step": 159069, "epoch": 3787} {"train_loss": -6.918920516967773, "global_step": 159070, "epoch": 3787} {"train_loss": -6.761972427368164, "global_step": 159071, "epoch": 3787} {"train_loss": -6.854564666748047, "global_step": 159072, "epoch": 3787} {"train_loss": -6.9355268478393555, "global_step": 159073, "epoch": 3787} {"train_loss": -6.862463474273682, "global_step": 159074, "epoch": 3787} {"train_loss": -6.962719917297363, "global_step": 159075, "epoch": 3787} {"train_loss": -7.042396068572998, "global_step": 159076, "epoch": 3787} {"train_loss": -7.022284507751465, "global_step": 159077, "epoch": 3787} {"train_loss": -7.03108549118042, "global_step": 159078, "epoch": 3787} {"train_loss": -6.89508056640625, "global_step": 159079, "epoch": 3787} {"train_loss": -7.027646064758301, "global_step": 159080, "epoch": 3787} {"train_loss": -7.014569282531738, "global_step": 159081, "epoch": 3787} {"train_loss": -6.948073387145996, "global_step": 159082, "epoch": 3787} {"train_loss": -6.914313316345215, "global_step": 159083, "epoch": 3787} {"train_loss": -6.985238075256348, "global_step": 159084, "epoch": 3787} {"train_loss": -6.881657123565674, "global_step": 159085, "epoch": 3787} {"train_loss": -7.02234411239624, "global_step": 159086, "epoch": 3787} {"train_loss": -6.960773468017578, "global_step": 159087, "epoch": 3787} {"train_loss": -6.830577850341797, "global_step": 159088, "epoch": 3787} {"train_loss": -6.849424362182617, "global_step": 159089, "epoch": 3787} {"train_loss": -6.9668779373168945, "global_step": 159090, "epoch": 3787} {"train_loss": -6.945544719696045, "global_step": 159091, "epoch": 3787} {"train_loss": -6.928549289703369, "global_step": 159092, "epoch": 3787} {"train_loss": -6.903470039367676, "global_step": 159093, "epoch": 3787} {"train_loss": -6.888760089874268, "global_step": 159094, "epoch": 3787} {"train_loss": -6.961478823707218, "global_step": 159095, "epoch": 3787, "val_loss": 68666.7890625} {"train_loss": -6.987520217895508, "global_step": 159096, "epoch": 3788} {"train_loss": -6.983234405517578, "global_step": 159097, "epoch": 3788} {"train_loss": -6.976179122924805, "global_step": 159098, "epoch": 3788} {"train_loss": -6.961791038513184, "global_step": 159099, "epoch": 3788} {"train_loss": -6.966955661773682, "global_step": 159100, "epoch": 3788} {"train_loss": -6.910432815551758, "global_step": 159101, "epoch": 3788} {"train_loss": -6.916555404663086, "global_step": 159102, "epoch": 3788} {"train_loss": -6.890518665313721, "global_step": 159103, "epoch": 3788} {"train_loss": -6.998592853546143, "global_step": 159104, "epoch": 3788} {"train_loss": -6.90515661239624, "global_step": 159105, "epoch": 3788} {"train_loss": -6.880741119384766, "global_step": 159106, "epoch": 3788} {"train_loss": -6.970047950744629, "global_step": 159107, "epoch": 3788} {"train_loss": -6.837030410766602, "global_step": 159108, "epoch": 3788} {"train_loss": -6.975001811981201, "global_step": 159109, "epoch": 3788} {"train_loss": -6.932703018188477, "global_step": 159110, "epoch": 3788} {"train_loss": -6.957242012023926, "global_step": 159111, "epoch": 3788} {"train_loss": -6.941519737243652, "global_step": 159112, "epoch": 3788} {"train_loss": -7.020711898803711, "global_step": 159113, "epoch": 3788} {"train_loss": -6.90507698059082, "global_step": 159114, "epoch": 3788} {"train_loss": -7.017114639282227, "global_step": 159115, "epoch": 3788} {"train_loss": -6.879517555236816, "global_step": 159116, "epoch": 3788} {"train_loss": -6.895445823669434, "global_step": 159117, "epoch": 3788} {"train_loss": -6.975664138793945, "global_step": 159118, "epoch": 3788} {"train_loss": -6.988965034484863, "global_step": 159119, "epoch": 3788} {"train_loss": -6.900019645690918, "global_step": 159120, "epoch": 3788} {"train_loss": -6.906506538391113, "global_step": 159121, "epoch": 3788} {"train_loss": -6.815463066101074, "global_step": 159122, "epoch": 3788} {"train_loss": -6.958400726318359, "global_step": 159123, "epoch": 3788} {"train_loss": -7.014454364776611, "global_step": 159124, "epoch": 3788} {"train_loss": -6.887882709503174, "global_step": 159125, "epoch": 3788} {"train_loss": -6.905441761016846, "global_step": 159126, "epoch": 3788} {"train_loss": -7.000892162322998, "global_step": 159127, "epoch": 3788} {"train_loss": -7.057229042053223, "global_step": 159128, "epoch": 3788} {"train_loss": -6.9534454345703125, "global_step": 159129, "epoch": 3788} {"train_loss": -6.939430236816406, "global_step": 159130, "epoch": 3788} {"train_loss": -6.8480224609375, "global_step": 159131, "epoch": 3788} {"train_loss": -6.864465713500977, "global_step": 159132, "epoch": 3788} {"train_loss": -6.991560935974121, "global_step": 159133, "epoch": 3788} {"train_loss": -6.803150653839111, "global_step": 159134, "epoch": 3788} {"train_loss": -6.899205207824707, "global_step": 159135, "epoch": 3788} {"train_loss": -6.8812360763549805, "global_step": 159136, "epoch": 3788} {"train_loss": -6.933032138007028, "global_step": 159137, "epoch": 3788, "val_loss": 68606.3515625} {"train_loss": -7.054116249084473, "global_step": 159138, "epoch": 3789} {"train_loss": -6.950447082519531, "global_step": 159139, "epoch": 3789} {"train_loss": -6.957076072692871, "global_step": 159140, "epoch": 3789} {"train_loss": -6.947945594787598, "global_step": 159141, "epoch": 3789} {"train_loss": -6.994277000427246, "global_step": 159142, "epoch": 3789} {"train_loss": -6.939530372619629, "global_step": 159143, "epoch": 3789} {"train_loss": -7.070885181427002, "global_step": 159144, "epoch": 3789} {"train_loss": -6.905821323394775, "global_step": 159145, "epoch": 3789} {"train_loss": -6.978236675262451, "global_step": 159146, "epoch": 3789} {"train_loss": -7.018393516540527, "global_step": 159147, "epoch": 3789} {"train_loss": -6.939214706420898, "global_step": 159148, "epoch": 3789} {"train_loss": -6.9324164390563965, "global_step": 159149, "epoch": 3789} {"train_loss": -6.946905136108398, "global_step": 159150, "epoch": 3789} {"train_loss": -6.922801971435547, "global_step": 159151, "epoch": 3789} {"train_loss": -6.955455780029297, "global_step": 159152, "epoch": 3789} {"train_loss": -7.03507137298584, "global_step": 159153, "epoch": 3789} {"train_loss": -6.996591567993164, "global_step": 159154, "epoch": 3789} {"train_loss": -6.957144737243652, "global_step": 159155, "epoch": 3789} {"train_loss": -7.021971702575684, "global_step": 159156, "epoch": 3789} {"train_loss": -6.890107154846191, "global_step": 159157, "epoch": 3789} {"train_loss": -6.980198383331299, "global_step": 159158, "epoch": 3789} {"train_loss": -6.837005615234375, "global_step": 159159, "epoch": 3789} {"train_loss": -6.887391090393066, "global_step": 159160, "epoch": 3789} {"train_loss": -6.873102188110352, "global_step": 159161, "epoch": 3789} {"train_loss": -6.867592811584473, "global_step": 159162, "epoch": 3789} {"train_loss": -6.9433794021606445, "global_step": 159163, "epoch": 3789} {"train_loss": -6.887136936187744, "global_step": 159164, "epoch": 3789} {"train_loss": -6.956005573272705, "global_step": 159165, "epoch": 3789} {"train_loss": -7.055194854736328, "global_step": 159166, "epoch": 3789} {"train_loss": -6.89069938659668, "global_step": 159167, "epoch": 3789} {"train_loss": -6.951032638549805, "global_step": 159168, "epoch": 3789} {"train_loss": -7.015960693359375, "global_step": 159169, "epoch": 3789} {"train_loss": -6.973888397216797, "global_step": 159170, "epoch": 3789} {"train_loss": -6.979895114898682, "global_step": 159171, "epoch": 3789} {"train_loss": -7.014042854309082, "global_step": 159172, "epoch": 3789} {"train_loss": -6.908637523651123, "global_step": 159173, "epoch": 3789} {"train_loss": -6.866260528564453, "global_step": 159174, "epoch": 3789} {"train_loss": -6.992712020874023, "global_step": 159175, "epoch": 3789} {"train_loss": -6.9073967933654785, "global_step": 159176, "epoch": 3789} {"train_loss": -6.970127105712891, "global_step": 159177, "epoch": 3789} {"train_loss": -7.070372581481934, "global_step": 159178, "epoch": 3789} {"train_loss": -6.958204803012666, "global_step": 159179, "epoch": 3789, "val_loss": 68696.3515625} {"train_loss": -6.915806770324707, "global_step": 159180, "epoch": 3790} {"train_loss": -6.992682456970215, "global_step": 159181, "epoch": 3790} {"train_loss": -6.977739334106445, "global_step": 159182, "epoch": 3790} {"train_loss": -6.953265190124512, "global_step": 159183, "epoch": 3790} {"train_loss": -6.9996466636657715, "global_step": 159184, "epoch": 3790} {"train_loss": -6.923704624176025, "global_step": 159185, "epoch": 3790} {"train_loss": -6.828909873962402, "global_step": 159186, "epoch": 3790} {"train_loss": -6.775412559509277, "global_step": 159187, "epoch": 3790} {"train_loss": -6.919130802154541, "global_step": 159188, "epoch": 3790} {"train_loss": -6.696858882904053, "global_step": 159189, "epoch": 3790} {"train_loss": -6.764385223388672, "global_step": 159190, "epoch": 3790} {"train_loss": -6.772984504699707, "global_step": 159191, "epoch": 3790} {"train_loss": -6.809171676635742, "global_step": 159192, "epoch": 3790} {"train_loss": -6.83021354675293, "global_step": 159193, "epoch": 3790} {"train_loss": -6.740936279296875, "global_step": 159194, "epoch": 3790} {"train_loss": -6.875274181365967, "global_step": 159195, "epoch": 3790} {"train_loss": -6.765583038330078, "global_step": 159196, "epoch": 3790} {"train_loss": -6.869162559509277, "global_step": 159197, "epoch": 3790} {"train_loss": -6.870615005493164, "global_step": 159198, "epoch": 3790} {"train_loss": -6.874294281005859, "global_step": 159199, "epoch": 3790} {"train_loss": -6.939121723175049, "global_step": 159200, "epoch": 3790} {"train_loss": -6.815657138824463, "global_step": 159201, "epoch": 3790} {"train_loss": -6.740602016448975, "global_step": 159202, "epoch": 3790} {"train_loss": -6.819209098815918, "global_step": 159203, "epoch": 3790} {"train_loss": -6.971861839294434, "global_step": 159204, "epoch": 3790} {"train_loss": -6.911705493927002, "global_step": 159205, "epoch": 3790} {"train_loss": -6.788364887237549, "global_step": 159206, "epoch": 3790} {"train_loss": -6.861550331115723, "global_step": 159207, "epoch": 3790} {"train_loss": -6.81591796875, "global_step": 159208, "epoch": 3790} {"train_loss": -6.772880554199219, "global_step": 159209, "epoch": 3790} {"train_loss": -6.8981614112854, "global_step": 159210, "epoch": 3790} {"train_loss": -6.85087776184082, "global_step": 159211, "epoch": 3790} {"train_loss": -6.88306188583374, "global_step": 159212, "epoch": 3790} {"train_loss": -6.998917102813721, "global_step": 159213, "epoch": 3790} {"train_loss": -6.909755706787109, "global_step": 159214, "epoch": 3790} {"train_loss": -6.894744873046875, "global_step": 159215, "epoch": 3790} {"train_loss": -6.741398811340332, "global_step": 159216, "epoch": 3790} {"train_loss": -7.007206916809082, "global_step": 159217, "epoch": 3790} {"train_loss": -6.8279242515563965, "global_step": 159218, "epoch": 3790} {"train_loss": -6.8841753005981445, "global_step": 159219, "epoch": 3790} {"train_loss": -6.928969383239746, "global_step": 159220, "epoch": 3790} {"train_loss": -6.864574545905704, "global_step": 159221, "epoch": 3790, "val_loss": 68627.3046875} {"train_loss": -6.94375467300415, "global_step": 159222, "epoch": 3791} {"train_loss": -6.936822891235352, "global_step": 159223, "epoch": 3791} {"train_loss": -6.859742164611816, "global_step": 159224, "epoch": 3791} {"train_loss": -6.911785125732422, "global_step": 159225, "epoch": 3791} {"train_loss": -6.963814735412598, "global_step": 159226, "epoch": 3791} {"train_loss": -6.847308158874512, "global_step": 159227, "epoch": 3791} {"train_loss": -6.787379264831543, "global_step": 159228, "epoch": 3791} {"train_loss": -6.906987190246582, "global_step": 159229, "epoch": 3791} {"train_loss": -6.8915324211120605, "global_step": 159230, "epoch": 3791} {"train_loss": -6.909401893615723, "global_step": 159231, "epoch": 3791} {"train_loss": -7.0522565841674805, "global_step": 159232, "epoch": 3791} {"train_loss": -6.987836837768555, "global_step": 159233, "epoch": 3791} {"train_loss": -6.913322448730469, "global_step": 159234, "epoch": 3791} {"train_loss": -7.028644561767578, "global_step": 159235, "epoch": 3791} {"train_loss": -7.003748893737793, "global_step": 159236, "epoch": 3791} {"train_loss": -6.963194370269775, "global_step": 159237, "epoch": 3791} {"train_loss": -7.1200714111328125, "global_step": 159238, "epoch": 3791} {"train_loss": -7.013783931732178, "global_step": 159239, "epoch": 3791} {"train_loss": -7.000781059265137, "global_step": 159240, "epoch": 3791} {"train_loss": -7.033064842224121, "global_step": 159241, "epoch": 3791} {"train_loss": -7.062977313995361, "global_step": 159242, "epoch": 3791} {"train_loss": -6.955892086029053, "global_step": 159243, "epoch": 3791} {"train_loss": -6.989418029785156, "global_step": 159244, "epoch": 3791} {"train_loss": -6.758405685424805, "global_step": 159245, "epoch": 3791} {"train_loss": -6.922476768493652, "global_step": 159246, "epoch": 3791} {"train_loss": -6.99842643737793, "global_step": 159247, "epoch": 3791} {"train_loss": -6.990502834320068, "global_step": 159248, "epoch": 3791} {"train_loss": -6.863864421844482, "global_step": 159249, "epoch": 3791} {"train_loss": -6.940203666687012, "global_step": 159250, "epoch": 3791} {"train_loss": -6.922060012817383, "global_step": 159251, "epoch": 3791} {"train_loss": -6.978780746459961, "global_step": 159252, "epoch": 3791} {"train_loss": -6.976780891418457, "global_step": 159253, "epoch": 3791} {"train_loss": -6.931413650512695, "global_step": 159254, "epoch": 3791} {"train_loss": -6.927833557128906, "global_step": 159255, "epoch": 3791} {"train_loss": -6.896550178527832, "global_step": 159256, "epoch": 3791} {"train_loss": -6.944838523864746, "global_step": 159257, "epoch": 3791} {"train_loss": -6.977165699005127, "global_step": 159258, "epoch": 3791} {"train_loss": -6.797814846038818, "global_step": 159259, "epoch": 3791} {"train_loss": -6.944870948791504, "global_step": 159260, "epoch": 3791} {"train_loss": -6.957491874694824, "global_step": 159261, "epoch": 3791} {"train_loss": -6.947770118713379, "global_step": 159262, "epoch": 3791} {"train_loss": -6.9477679161798385, "global_step": 159263, "epoch": 3791, "val_loss": 68443.0390625} {"train_loss": -6.94351863861084, "global_step": 159264, "epoch": 3792} {"train_loss": -6.8936052322387695, "global_step": 159265, "epoch": 3792} {"train_loss": -6.86818790435791, "global_step": 159266, "epoch": 3792} {"train_loss": -6.960489749908447, "global_step": 159267, "epoch": 3792} {"train_loss": -6.73660945892334, "global_step": 159268, "epoch": 3792} {"train_loss": -6.893710613250732, "global_step": 159269, "epoch": 3792} {"train_loss": -6.912529468536377, "global_step": 159270, "epoch": 3792} {"train_loss": -6.833430290222168, "global_step": 159271, "epoch": 3792} {"train_loss": -6.99202823638916, "global_step": 159272, "epoch": 3792} {"train_loss": -6.937691688537598, "global_step": 159273, "epoch": 3792} {"train_loss": -6.897571563720703, "global_step": 159274, "epoch": 3792} {"train_loss": -6.799797058105469, "global_step": 159275, "epoch": 3792} {"train_loss": -6.832995891571045, "global_step": 159276, "epoch": 3792} {"train_loss": -6.870438575744629, "global_step": 159277, "epoch": 3792} {"train_loss": -6.987324237823486, "global_step": 159278, "epoch": 3792} {"train_loss": -6.9281110763549805, "global_step": 159279, "epoch": 3792} {"train_loss": -6.922486305236816, "global_step": 159280, "epoch": 3792} {"train_loss": -6.817042827606201, "global_step": 159281, "epoch": 3792} {"train_loss": -6.919745445251465, "global_step": 159282, "epoch": 3792} {"train_loss": -6.86478328704834, "global_step": 159283, "epoch": 3792} {"train_loss": -6.791701316833496, "global_step": 159284, "epoch": 3792} {"train_loss": -6.926263332366943, "global_step": 159285, "epoch": 3792} {"train_loss": -6.949429988861084, "global_step": 159286, "epoch": 3792} {"train_loss": -7.037347793579102, "global_step": 159287, "epoch": 3792} {"train_loss": -6.94703483581543, "global_step": 159288, "epoch": 3792} {"train_loss": -7.005441665649414, "global_step": 159289, "epoch": 3792} {"train_loss": -6.9812703132629395, "global_step": 159290, "epoch": 3792} {"train_loss": -6.9460978507995605, "global_step": 159291, "epoch": 3792} {"train_loss": -6.952971935272217, "global_step": 159292, "epoch": 3792} {"train_loss": -6.972167015075684, "global_step": 159293, "epoch": 3792} {"train_loss": -7.002326965332031, "global_step": 159294, "epoch": 3792} {"train_loss": -6.796721458435059, "global_step": 159295, "epoch": 3792} {"train_loss": -6.800827980041504, "global_step": 159296, "epoch": 3792} {"train_loss": -6.931081771850586, "global_step": 159297, "epoch": 3792} {"train_loss": -7.044425010681152, "global_step": 159298, "epoch": 3792} {"train_loss": -6.852133750915527, "global_step": 159299, "epoch": 3792} {"train_loss": -6.96925163269043, "global_step": 159300, "epoch": 3792} {"train_loss": -6.952968120574951, "global_step": 159301, "epoch": 3792} {"train_loss": -6.878844738006592, "global_step": 159302, "epoch": 3792} {"train_loss": -6.910918235778809, "global_step": 159303, "epoch": 3792} {"train_loss": -6.888605117797852, "global_step": 159304, "epoch": 3792} {"train_loss": -6.9133033865974065, "global_step": 159305, "epoch": 3792, "val_loss": 68478.421875} {"train_loss": -7.034454345703125, "global_step": 159306, "epoch": 3793} {"train_loss": -6.993696212768555, "global_step": 159307, "epoch": 3793} {"train_loss": -6.957560062408447, "global_step": 159308, "epoch": 3793} {"train_loss": -6.994268894195557, "global_step": 159309, "epoch": 3793} {"train_loss": -6.966241359710693, "global_step": 159310, "epoch": 3793} {"train_loss": -6.891408443450928, "global_step": 159311, "epoch": 3793} {"train_loss": -6.883653163909912, "global_step": 159312, "epoch": 3793} {"train_loss": -6.892636775970459, "global_step": 159313, "epoch": 3793} {"train_loss": -6.936614036560059, "global_step": 159314, "epoch": 3793} {"train_loss": -7.013589859008789, "global_step": 159315, "epoch": 3793} {"train_loss": -6.993194103240967, "global_step": 159316, "epoch": 3793} {"train_loss": -6.983409404754639, "global_step": 159317, "epoch": 3793} {"train_loss": -7.0025177001953125, "global_step": 159318, "epoch": 3793} {"train_loss": -7.036907196044922, "global_step": 159319, "epoch": 3793} {"train_loss": -6.990295886993408, "global_step": 159320, "epoch": 3793} {"train_loss": -7.045068264007568, "global_step": 159321, "epoch": 3793} {"train_loss": -6.9397382736206055, "global_step": 159322, "epoch": 3793} {"train_loss": -6.982507705688477, "global_step": 159323, "epoch": 3793} {"train_loss": -6.957226276397705, "global_step": 159324, "epoch": 3793} {"train_loss": -7.081561088562012, "global_step": 159325, "epoch": 3793} {"train_loss": -6.895158290863037, "global_step": 159326, "epoch": 3793} {"train_loss": -6.919355392456055, "global_step": 159327, "epoch": 3793} {"train_loss": -6.931143760681152, "global_step": 159328, "epoch": 3793} {"train_loss": -6.985729217529297, "global_step": 159329, "epoch": 3793} {"train_loss": -6.99597692489624, "global_step": 159330, "epoch": 3793} {"train_loss": -6.966386318206787, "global_step": 159331, "epoch": 3793} {"train_loss": -6.995656967163086, "global_step": 159332, "epoch": 3793} {"train_loss": -6.971304893493652, "global_step": 159333, "epoch": 3793} {"train_loss": -6.97767972946167, "global_step": 159334, "epoch": 3793} {"train_loss": -6.885278224945068, "global_step": 159335, "epoch": 3793} {"train_loss": -6.882787704467773, "global_step": 159336, "epoch": 3793} {"train_loss": -6.927494049072266, "global_step": 159337, "epoch": 3793} {"train_loss": -6.938861846923828, "global_step": 159338, "epoch": 3793} {"train_loss": -6.920406818389893, "global_step": 159339, "epoch": 3793} {"train_loss": -6.989260196685791, "global_step": 159340, "epoch": 3793} {"train_loss": -6.981883525848389, "global_step": 159341, "epoch": 3793} {"train_loss": -6.855749130249023, "global_step": 159342, "epoch": 3793} {"train_loss": -7.020795822143555, "global_step": 159343, "epoch": 3793} {"train_loss": -6.895234107971191, "global_step": 159344, "epoch": 3793} {"train_loss": -6.761648654937744, "global_step": 159345, "epoch": 3793} {"train_loss": -6.901244163513184, "global_step": 159346, "epoch": 3793} {"train_loss": -6.952507586706252, "global_step": 159347, "epoch": 3793, "val_loss": 68565.3828125} {"train_loss": -7.002455234527588, "global_step": 159348, "epoch": 3794} {"train_loss": -6.962080955505371, "global_step": 159349, "epoch": 3794} {"train_loss": -6.975638389587402, "global_step": 159350, "epoch": 3794} {"train_loss": -6.89288330078125, "global_step": 159351, "epoch": 3794} {"train_loss": -7.001678466796875, "global_step": 159352, "epoch": 3794} {"train_loss": -6.899655342102051, "global_step": 159353, "epoch": 3794} {"train_loss": -6.910383224487305, "global_step": 159354, "epoch": 3794} {"train_loss": -6.85667610168457, "global_step": 159355, "epoch": 3794} {"train_loss": -6.890170097351074, "global_step": 159356, "epoch": 3794} {"train_loss": -7.0547943115234375, "global_step": 159357, "epoch": 3794} {"train_loss": -6.959961414337158, "global_step": 159358, "epoch": 3794} {"train_loss": -6.933664321899414, "global_step": 159359, "epoch": 3794} {"train_loss": -6.862673282623291, "global_step": 159360, "epoch": 3794} {"train_loss": -6.97531795501709, "global_step": 159361, "epoch": 3794} {"train_loss": -7.006800651550293, "global_step": 159362, "epoch": 3794} {"train_loss": -7.006968975067139, "global_step": 159363, "epoch": 3794} {"train_loss": -6.978555202484131, "global_step": 159364, "epoch": 3794} {"train_loss": -6.996981620788574, "global_step": 159365, "epoch": 3794} {"train_loss": -7.0615620613098145, "global_step": 159366, "epoch": 3794} {"train_loss": -6.8946661949157715, "global_step": 159367, "epoch": 3794} {"train_loss": -6.949161529541016, "global_step": 159368, "epoch": 3794} {"train_loss": -6.92151403427124, "global_step": 159369, "epoch": 3794} {"train_loss": -6.967255592346191, "global_step": 159370, "epoch": 3794} {"train_loss": -6.994931221008301, "global_step": 159371, "epoch": 3794} {"train_loss": -6.9611968994140625, "global_step": 159372, "epoch": 3794} {"train_loss": -6.936410903930664, "global_step": 159373, "epoch": 3794} {"train_loss": -7.021724700927734, "global_step": 159374, "epoch": 3794} {"train_loss": -6.860659122467041, "global_step": 159375, "epoch": 3794} {"train_loss": -6.967706203460693, "global_step": 159376, "epoch": 3794} {"train_loss": -6.928289413452148, "global_step": 159377, "epoch": 3794} {"train_loss": -7.000741958618164, "global_step": 159378, "epoch": 3794} {"train_loss": -6.867193222045898, "global_step": 159379, "epoch": 3794} {"train_loss": -6.905390739440918, "global_step": 159380, "epoch": 3794} {"train_loss": -6.9491963386535645, "global_step": 159381, "epoch": 3794} {"train_loss": -6.859927177429199, "global_step": 159382, "epoch": 3794} {"train_loss": -6.987303256988525, "global_step": 159383, "epoch": 3794} {"train_loss": -6.824653625488281, "global_step": 159384, "epoch": 3794} {"train_loss": -6.9127583503723145, "global_step": 159385, "epoch": 3794} {"train_loss": -6.883055686950684, "global_step": 159386, "epoch": 3794} {"train_loss": -6.93675422668457, "global_step": 159387, "epoch": 3794} {"train_loss": -7.006418704986572, "global_step": 159388, "epoch": 3794} {"train_loss": -6.944961820329938, "global_step": 159389, "epoch": 3794, "val_loss": 68633.015625} {"train_loss": -7.084674835205078, "global_step": 159390, "epoch": 3795} {"train_loss": -6.947878360748291, "global_step": 159391, "epoch": 3795} {"train_loss": -7.144392013549805, "global_step": 159392, "epoch": 3795} {"train_loss": -6.963113784790039, "global_step": 159393, "epoch": 3795} {"train_loss": -6.98870849609375, "global_step": 159394, "epoch": 3795} {"train_loss": -7.028365135192871, "global_step": 159395, "epoch": 3795} {"train_loss": -6.979991912841797, "global_step": 159396, "epoch": 3795} {"train_loss": -6.901034355163574, "global_step": 159397, "epoch": 3795} {"train_loss": -6.902302265167236, "global_step": 159398, "epoch": 3795} {"train_loss": -6.864099502563477, "global_step": 159399, "epoch": 3795} {"train_loss": -6.939181327819824, "global_step": 159400, "epoch": 3795} {"train_loss": -6.975600242614746, "global_step": 159401, "epoch": 3795} {"train_loss": -7.024421691894531, "global_step": 159402, "epoch": 3795} {"train_loss": -6.916378021240234, "global_step": 159403, "epoch": 3795} {"train_loss": -6.999205589294434, "global_step": 159404, "epoch": 3795} {"train_loss": -6.991367340087891, "global_step": 159405, "epoch": 3795} {"train_loss": -7.031091690063477, "global_step": 159406, "epoch": 3795} {"train_loss": -6.950453281402588, "global_step": 159407, "epoch": 3795} {"train_loss": -7.035665512084961, "global_step": 159408, "epoch": 3795} {"train_loss": -7.006170272827148, "global_step": 159409, "epoch": 3795} {"train_loss": -6.99787712097168, "global_step": 159410, "epoch": 3795} {"train_loss": -6.9433722496032715, "global_step": 159411, "epoch": 3795} {"train_loss": -7.117734909057617, "global_step": 159412, "epoch": 3795} {"train_loss": -7.075479507446289, "global_step": 159413, "epoch": 3795} {"train_loss": -7.028144359588623, "global_step": 159414, "epoch": 3795} {"train_loss": -6.99656343460083, "global_step": 159415, "epoch": 3795} {"train_loss": -6.98086404800415, "global_step": 159416, "epoch": 3795} {"train_loss": -6.890986442565918, "global_step": 159417, "epoch": 3795} {"train_loss": -6.869422912597656, "global_step": 159418, "epoch": 3795} {"train_loss": -7.007701873779297, "global_step": 159419, "epoch": 3795} {"train_loss": -6.8856611251831055, "global_step": 159420, "epoch": 3795} {"train_loss": -6.993288993835449, "global_step": 159421, "epoch": 3795} {"train_loss": -6.951450347900391, "global_step": 159422, "epoch": 3795} {"train_loss": -6.6930108070373535, "global_step": 159423, "epoch": 3795} {"train_loss": -6.842229843139648, "global_step": 159424, "epoch": 3795} {"train_loss": -6.954868793487549, "global_step": 159425, "epoch": 3795} {"train_loss": -6.770143032073975, "global_step": 159426, "epoch": 3795} {"train_loss": -6.793872833251953, "global_step": 159427, "epoch": 3795} {"train_loss": -7.0107927322387695, "global_step": 159428, "epoch": 3795} {"train_loss": -6.8873677253723145, "global_step": 159429, "epoch": 3795} {"train_loss": -6.930879592895508, "global_step": 159430, "epoch": 3795} {"train_loss": -6.957632076172602, "global_step": 159431, "epoch": 3795, "val_loss": 68415.9609375} {"train_loss": -6.8284687995910645, "global_step": 159432, "epoch": 3796} {"train_loss": -6.922093391418457, "global_step": 159433, "epoch": 3796} {"train_loss": -6.7972412109375, "global_step": 159434, "epoch": 3796} {"train_loss": -6.908509254455566, "global_step": 159435, "epoch": 3796} {"train_loss": -6.734588623046875, "global_step": 159436, "epoch": 3796} {"train_loss": -6.885185718536377, "global_step": 159437, "epoch": 3796} {"train_loss": -6.946340560913086, "global_step": 159438, "epoch": 3796} {"train_loss": -6.749846935272217, "global_step": 159439, "epoch": 3796} {"train_loss": -6.92836856842041, "global_step": 159440, "epoch": 3796} {"train_loss": -6.756380081176758, "global_step": 159441, "epoch": 3796} {"train_loss": -6.800503730773926, "global_step": 159442, "epoch": 3796} {"train_loss": -6.853736877441406, "global_step": 159443, "epoch": 3796} {"train_loss": -6.885475158691406, "global_step": 159444, "epoch": 3796} {"train_loss": -6.813667297363281, "global_step": 159445, "epoch": 3796} {"train_loss": -6.857849597930908, "global_step": 159446, "epoch": 3796} {"train_loss": -6.8357768058776855, "global_step": 159447, "epoch": 3796} {"train_loss": -6.908912181854248, "global_step": 159448, "epoch": 3796} {"train_loss": -6.8898210525512695, "global_step": 159449, "epoch": 3796} {"train_loss": -6.819766998291016, "global_step": 159450, "epoch": 3796} {"train_loss": -6.83868408203125, "global_step": 159451, "epoch": 3796} {"train_loss": -6.735531806945801, "global_step": 159452, "epoch": 3796} {"train_loss": -6.8770904541015625, "global_step": 159453, "epoch": 3796} {"train_loss": -6.831402778625488, "global_step": 159454, "epoch": 3796} {"train_loss": -6.844928741455078, "global_step": 159455, "epoch": 3796} {"train_loss": -6.842898368835449, "global_step": 159456, "epoch": 3796} {"train_loss": -6.884242057800293, "global_step": 159457, "epoch": 3796} {"train_loss": -6.816569805145264, "global_step": 159458, "epoch": 3796} {"train_loss": -6.866575241088867, "global_step": 159459, "epoch": 3796} {"train_loss": -6.841682434082031, "global_step": 159460, "epoch": 3796} {"train_loss": -6.753124713897705, "global_step": 159461, "epoch": 3796} {"train_loss": -6.849320411682129, "global_step": 159462, "epoch": 3796} {"train_loss": -6.883177757263184, "global_step": 159463, "epoch": 3796} {"train_loss": -6.872739791870117, "global_step": 159464, "epoch": 3796} {"train_loss": -6.875304698944092, "global_step": 159465, "epoch": 3796} {"train_loss": -6.916071891784668, "global_step": 159466, "epoch": 3796} {"train_loss": -6.926457405090332, "global_step": 159467, "epoch": 3796} {"train_loss": -6.960658550262451, "global_step": 159468, "epoch": 3796} {"train_loss": -6.890500068664551, "global_step": 159469, "epoch": 3796} {"train_loss": -6.948198318481445, "global_step": 159470, "epoch": 3796} {"train_loss": -6.895597457885742, "global_step": 159471, "epoch": 3796} {"train_loss": -7.010381698608398, "global_step": 159472, "epoch": 3796} {"train_loss": -6.862629493077596, "global_step": 159473, "epoch": 3796, "val_loss": 68393.9140625} {"train_loss": -6.9687395095825195, "global_step": 159474, "epoch": 3797} {"train_loss": -6.905637264251709, "global_step": 159475, "epoch": 3797} {"train_loss": -6.83003044128418, "global_step": 159476, "epoch": 3797} {"train_loss": -6.900132179260254, "global_step": 159477, "epoch": 3797} {"train_loss": -6.9784650802612305, "global_step": 159478, "epoch": 3797} {"train_loss": -6.944394588470459, "global_step": 159479, "epoch": 3797} {"train_loss": -6.940886974334717, "global_step": 159480, "epoch": 3797} {"train_loss": -7.090235233306885, "global_step": 159481, "epoch": 3797} {"train_loss": -6.90713357925415, "global_step": 159482, "epoch": 3797} {"train_loss": -6.9683027267456055, "global_step": 159483, "epoch": 3797} {"train_loss": -7.065935134887695, "global_step": 159484, "epoch": 3797} {"train_loss": -6.950875282287598, "global_step": 159485, "epoch": 3797} {"train_loss": -6.948477745056152, "global_step": 159486, "epoch": 3797} {"train_loss": -6.891444206237793, "global_step": 159487, "epoch": 3797} {"train_loss": -6.9680023193359375, "global_step": 159488, "epoch": 3797} {"train_loss": -7.050660610198975, "global_step": 159489, "epoch": 3797} {"train_loss": -6.914626121520996, "global_step": 159490, "epoch": 3797} {"train_loss": -6.979491710662842, "global_step": 159491, "epoch": 3797} {"train_loss": -6.945303916931152, "global_step": 159492, "epoch": 3797} {"train_loss": -6.959062576293945, "global_step": 159493, "epoch": 3797} {"train_loss": -6.950595855712891, "global_step": 159494, "epoch": 3797} {"train_loss": -6.875087738037109, "global_step": 159495, "epoch": 3797} {"train_loss": -6.862966537475586, "global_step": 159496, "epoch": 3797} {"train_loss": -6.881028175354004, "global_step": 159497, "epoch": 3797} {"train_loss": -6.707569122314453, "global_step": 159498, "epoch": 3797} {"train_loss": -6.927682876586914, "global_step": 159499, "epoch": 3797} {"train_loss": -7.047932147979736, "global_step": 159500, "epoch": 3797} {"train_loss": -6.9613037109375, "global_step": 159501, "epoch": 3797} {"train_loss": -6.902143955230713, "global_step": 159502, "epoch": 3797} {"train_loss": -6.964168071746826, "global_step": 159503, "epoch": 3797} {"train_loss": -6.944524765014648, "global_step": 159504, "epoch": 3797} {"train_loss": -6.841656684875488, "global_step": 159505, "epoch": 3797} {"train_loss": -6.825647354125977, "global_step": 159506, "epoch": 3797} {"train_loss": -6.922998428344727, "global_step": 159507, "epoch": 3797} {"train_loss": -6.891523361206055, "global_step": 159508, "epoch": 3797} {"train_loss": -6.845129489898682, "global_step": 159509, "epoch": 3797} {"train_loss": -6.883303165435791, "global_step": 159510, "epoch": 3797} {"train_loss": -6.960847854614258, "global_step": 159511, "epoch": 3797} {"train_loss": -6.841033935546875, "global_step": 159512, "epoch": 3797} {"train_loss": -7.01154088973999, "global_step": 159513, "epoch": 3797} {"train_loss": -6.9320220947265625, "global_step": 159514, "epoch": 3797} {"train_loss": -6.931002809887841, "global_step": 159515, "epoch": 3797, "val_loss": 68430.0625} {"train_loss": -6.95720100402832, "global_step": 159516, "epoch": 3798} {"train_loss": -6.996063709259033, "global_step": 159517, "epoch": 3798} {"train_loss": -7.003979682922363, "global_step": 159518, "epoch": 3798} {"train_loss": -7.038910865783691, "global_step": 159519, "epoch": 3798} {"train_loss": -7.002721786499023, "global_step": 159520, "epoch": 3798} {"train_loss": -7.050897598266602, "global_step": 159521, "epoch": 3798} {"train_loss": -6.967992305755615, "global_step": 159522, "epoch": 3798} {"train_loss": -7.037254333496094, "global_step": 159523, "epoch": 3798} {"train_loss": -7.003420829772949, "global_step": 159524, "epoch": 3798} {"train_loss": -7.028489589691162, "global_step": 159525, "epoch": 3798} {"train_loss": -6.917262077331543, "global_step": 159526, "epoch": 3798} {"train_loss": -6.9968719482421875, "global_step": 159527, "epoch": 3798} {"train_loss": -7.024281024932861, "global_step": 159528, "epoch": 3798} {"train_loss": -6.966927528381348, "global_step": 159529, "epoch": 3798} {"train_loss": -6.842120170593262, "global_step": 159530, "epoch": 3798} {"train_loss": -6.951678276062012, "global_step": 159531, "epoch": 3798} {"train_loss": -6.90993595123291, "global_step": 159532, "epoch": 3798} {"train_loss": -6.747262001037598, "global_step": 159533, "epoch": 3798} {"train_loss": -6.984755516052246, "global_step": 159534, "epoch": 3798} {"train_loss": -6.839418888092041, "global_step": 159535, "epoch": 3798} {"train_loss": -6.813508987426758, "global_step": 159536, "epoch": 3798} {"train_loss": -6.944002151489258, "global_step": 159537, "epoch": 3798} {"train_loss": -6.925417900085449, "global_step": 159538, "epoch": 3798} {"train_loss": -6.9127960205078125, "global_step": 159539, "epoch": 3798} {"train_loss": -6.89786434173584, "global_step": 159540, "epoch": 3798} {"train_loss": -6.817684173583984, "global_step": 159541, "epoch": 3798} {"train_loss": -6.901396751403809, "global_step": 159542, "epoch": 3798} {"train_loss": -6.817715167999268, "global_step": 159543, "epoch": 3798} {"train_loss": -6.922689437866211, "global_step": 159544, "epoch": 3798} {"train_loss": -6.800778388977051, "global_step": 159545, "epoch": 3798} {"train_loss": -6.848291397094727, "global_step": 159546, "epoch": 3798} {"train_loss": -6.672754287719727, "global_step": 159547, "epoch": 3798} {"train_loss": -6.955709457397461, "global_step": 159548, "epoch": 3798} {"train_loss": -6.683951377868652, "global_step": 159549, "epoch": 3798} {"train_loss": -6.743685245513916, "global_step": 159550, "epoch": 3798} {"train_loss": -6.8828935623168945, "global_step": 159551, "epoch": 3798} {"train_loss": -6.774074077606201, "global_step": 159552, "epoch": 3798} {"train_loss": -6.90799617767334, "global_step": 159553, "epoch": 3798} {"train_loss": -6.72525691986084, "global_step": 159554, "epoch": 3798} {"train_loss": -6.816987037658691, "global_step": 159555, "epoch": 3798} {"train_loss": -6.736772060394287, "global_step": 159556, "epoch": 3798} {"train_loss": -6.899796281542097, "global_step": 159557, "epoch": 3798, "val_loss": 68667.953125} {"train_loss": -6.92667818069458, "global_step": 159558, "epoch": 3799} {"train_loss": -6.811627388000488, "global_step": 159559, "epoch": 3799} {"train_loss": -6.956859111785889, "global_step": 159560, "epoch": 3799} {"train_loss": -6.8495588302612305, "global_step": 159561, "epoch": 3799} {"train_loss": -6.8841753005981445, "global_step": 159562, "epoch": 3799} {"train_loss": -6.713022708892822, "global_step": 159563, "epoch": 3799} {"train_loss": -6.897817134857178, "global_step": 159564, "epoch": 3799} {"train_loss": -6.764959335327148, "global_step": 159565, "epoch": 3799} {"train_loss": -6.819848537445068, "global_step": 159566, "epoch": 3799} {"train_loss": -6.907587051391602, "global_step": 159567, "epoch": 3799} {"train_loss": -6.91322135925293, "global_step": 159568, "epoch": 3799} {"train_loss": -6.873929023742676, "global_step": 159569, "epoch": 3799} {"train_loss": -6.788261413574219, "global_step": 159570, "epoch": 3799} {"train_loss": -6.902797698974609, "global_step": 159571, "epoch": 3799} {"train_loss": -6.914158344268799, "global_step": 159572, "epoch": 3799} {"train_loss": -6.890893936157227, "global_step": 159573, "epoch": 3799} {"train_loss": -6.915196418762207, "global_step": 159574, "epoch": 3799} {"train_loss": -7.01125431060791, "global_step": 159575, "epoch": 3799} {"train_loss": -6.89207649230957, "global_step": 159576, "epoch": 3799} {"train_loss": -6.958036422729492, "global_step": 159577, "epoch": 3799} {"train_loss": -6.864920616149902, "global_step": 159578, "epoch": 3799} {"train_loss": -6.971462249755859, "global_step": 159579, "epoch": 3799} {"train_loss": -7.106472015380859, "global_step": 159580, "epoch": 3799} {"train_loss": -6.914091110229492, "global_step": 159581, "epoch": 3799} {"train_loss": -6.947047710418701, "global_step": 159582, "epoch": 3799} {"train_loss": -6.942532062530518, "global_step": 159583, "epoch": 3799} {"train_loss": -6.904858589172363, "global_step": 159584, "epoch": 3799} {"train_loss": -6.946200370788574, "global_step": 159585, "epoch": 3799} {"train_loss": -7.095952987670898, "global_step": 159586, "epoch": 3799} {"train_loss": -7.120329856872559, "global_step": 159587, "epoch": 3799} {"train_loss": -6.930757522583008, "global_step": 159588, "epoch": 3799} {"train_loss": -7.07169246673584, "global_step": 159589, "epoch": 3799} {"train_loss": -7.001314163208008, "global_step": 159590, "epoch": 3799} {"train_loss": -6.824609756469727, "global_step": 159591, "epoch": 3799} {"train_loss": -6.915838718414307, "global_step": 159592, "epoch": 3799} {"train_loss": -6.852118492126465, "global_step": 159593, "epoch": 3799} {"train_loss": -6.882302761077881, "global_step": 159594, "epoch": 3799} {"train_loss": -6.893089771270752, "global_step": 159595, "epoch": 3799} {"train_loss": -6.943337917327881, "global_step": 159596, "epoch": 3799} {"train_loss": -6.951443672180176, "global_step": 159597, "epoch": 3799} {"train_loss": -6.958895683288574, "global_step": 159598, "epoch": 3799} {"train_loss": -6.916566054026286, "global_step": 159599, "epoch": 3799, "val_loss": 68607.0} {"train_loss": -6.934593200683594, "global_step": 159600, "epoch": 3800} {"train_loss": -6.876434326171875, "global_step": 159601, "epoch": 3800} {"train_loss": -6.909200668334961, "global_step": 159602, "epoch": 3800} {"train_loss": -7.028180122375488, "global_step": 159603, "epoch": 3800} {"train_loss": -6.980460166931152, "global_step": 159604, "epoch": 3800} {"train_loss": -6.897629737854004, "global_step": 159605, "epoch": 3800} {"train_loss": -6.9174346923828125, "global_step": 159606, "epoch": 3800} {"train_loss": -7.0380449295043945, "global_step": 159607, "epoch": 3800} {"train_loss": -7.015052318572998, "global_step": 159608, "epoch": 3800} {"train_loss": -6.9144697189331055, "global_step": 159609, "epoch": 3800} {"train_loss": -6.8518242835998535, "global_step": 159610, "epoch": 3800} {"train_loss": -6.937408447265625, "global_step": 159611, "epoch": 3800} {"train_loss": -6.992310523986816, "global_step": 159612, "epoch": 3800} {"train_loss": -6.942634582519531, "global_step": 159613, "epoch": 3800} {"train_loss": -6.8296613693237305, "global_step": 159614, "epoch": 3800} {"train_loss": -6.6988325119018555, "global_step": 159615, "epoch": 3800} {"train_loss": -6.924354553222656, "global_step": 159616, "epoch": 3800} {"train_loss": -6.961068153381348, "global_step": 159617, "epoch": 3800} {"train_loss": -6.918593406677246, "global_step": 159618, "epoch": 3800} {"train_loss": -6.999629020690918, "global_step": 159619, "epoch": 3800} {"train_loss": -6.888744831085205, "global_step": 159620, "epoch": 3800} {"train_loss": -6.970719337463379, "global_step": 159621, "epoch": 3800} {"train_loss": -6.980958938598633, "global_step": 159622, "epoch": 3800} {"train_loss": -6.897618293762207, "global_step": 159623, "epoch": 3800} {"train_loss": -6.943178176879883, "global_step": 159624, "epoch": 3800} {"train_loss": -6.969453811645508, "global_step": 159625, "epoch": 3800} {"train_loss": -6.846972465515137, "global_step": 159626, "epoch": 3800} {"train_loss": -6.990029335021973, "global_step": 159627, "epoch": 3800} {"train_loss": -6.857447624206543, "global_step": 159628, "epoch": 3800} {"train_loss": -7.001469135284424, "global_step": 159629, "epoch": 3800} {"train_loss": -7.039116859436035, "global_step": 159630, "epoch": 3800} {"train_loss": -6.986748218536377, "global_step": 159631, "epoch": 3800} {"train_loss": -6.8729400634765625, "global_step": 159632, "epoch": 3800} {"train_loss": -6.994250297546387, "global_step": 159633, "epoch": 3800} {"train_loss": -6.936280250549316, "global_step": 159634, "epoch": 3800} {"train_loss": -6.967489242553711, "global_step": 159635, "epoch": 3800} {"train_loss": -6.988153457641602, "global_step": 159636, "epoch": 3800} {"train_loss": -7.061553001403809, "global_step": 159637, "epoch": 3800} {"train_loss": -6.960491180419922, "global_step": 159638, "epoch": 3800} {"train_loss": -7.0843186378479, "global_step": 159639, "epoch": 3800} {"train_loss": -7.016974449157715, "global_step": 159640, "epoch": 3800} {"train_loss": -6.947162015097482, "global_step": 159641, "epoch": 3800, "train/sim_max_reward_0": 0.9160254296761037, "train/sim_max_reward_1": 0.8611980670815057, "train/sim_max_reward_2": 0.6901760140750063, "train/sim_max_reward_3": 0.44403931633106575, "train/sim_max_reward_4": 0.8539236519357427, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8367317048262636, "test/sim_max_reward_4300001": 0.5830675475011525, "test/sim_max_reward_4300002": 0.93975771525521, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9165265530453065, "test/sim_max_reward_4300006": 0.21342984168337154, "test/sim_max_reward_4300007": 0.8626976703285306, "test/sim_max_reward_4300008": 0.8688838681803868, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.9719681162435889, "test/sim_max_reward_4300011": 0.9815704744339376, "test/sim_max_reward_4300012": 0.7965253706558995, "test/sim_max_reward_4300013": 0.82572414090907, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9779244504444892, "test/sim_max_reward_4300016": 0.9127763952204849, "test/sim_max_reward_4300017": 0.3425467385352189, "test/sim_max_reward_4300018": 0.45185672518937126, "test/sim_max_reward_4300019": 0.18364840504493726, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.7439707604287471, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.3687991840681544, "test/sim_max_reward_4300024": 0.3539617450455827, "test/sim_max_reward_4300025": 0.9014003457524182, "test/sim_max_reward_4300026": 0.19840413827675232, "test/sim_max_reward_4300027": 0.9548354214320354, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.12845508764520208, "test/sim_max_reward_4300031": 0.34311843162592953, "test/sim_max_reward_4300032": 0.8782992150790213, "test/sim_max_reward_4300033": 0.692783305066688, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.13015911394196866, "test/sim_max_reward_4300036": 0.19988090579562945, "test/sim_max_reward_4300037": 0.9720132165237766, "test/sim_max_reward_4300038": 0.9618254505211474, "test/sim_max_reward_4300039": 0.9319542932447629, "test/sim_max_reward_4300040": 0.24837439493520017, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7123256560661662, "test/sim_max_reward_4300043": 0.4184335046632822, "test/sim_max_reward_4300044": 1.0, "test/sim_max_reward_4300045": 0.9720250112377671, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.15550039457900597, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.3288512954946342, "train/mean_score": 0.6597245397436019, "test/mean_score": 0.5855368138746075, "val_loss": 68555.625} {"train_loss": -6.980135440826416, "global_step": 159642, "epoch": 3801} {"train_loss": -6.874262809753418, "global_step": 159643, "epoch": 3801} {"train_loss": -7.019033432006836, "global_step": 159644, "epoch": 3801} {"train_loss": -7.060659885406494, "global_step": 159645, "epoch": 3801} {"train_loss": -7.000575065612793, "global_step": 159646, "epoch": 3801} {"train_loss": -6.857443332672119, "global_step": 159647, "epoch": 3801} {"train_loss": -7.021889686584473, "global_step": 159648, "epoch": 3801} {"train_loss": -6.964876174926758, "global_step": 159649, "epoch": 3801} {"train_loss": -6.957688808441162, "global_step": 159650, "epoch": 3801} {"train_loss": -6.944100379943848, "global_step": 159651, "epoch": 3801} {"train_loss": -6.89840030670166, "global_step": 159652, "epoch": 3801} {"train_loss": -7.018164157867432, "global_step": 159653, "epoch": 3801} {"train_loss": -7.082411766052246, "global_step": 159654, "epoch": 3801} {"train_loss": -6.9198713302612305, "global_step": 159655, "epoch": 3801} {"train_loss": -6.973958969116211, "global_step": 159656, "epoch": 3801} {"train_loss": -6.920049667358398, "global_step": 159657, "epoch": 3801} {"train_loss": -6.863101959228516, "global_step": 159658, "epoch": 3801} {"train_loss": -6.8278632164001465, "global_step": 159659, "epoch": 3801} {"train_loss": -6.890434265136719, "global_step": 159660, "epoch": 3801} {"train_loss": -6.746120929718018, "global_step": 159661, "epoch": 3801} {"train_loss": -7.028803825378418, "global_step": 159662, "epoch": 3801} {"train_loss": -6.897250175476074, "global_step": 159663, "epoch": 3801} {"train_loss": -6.863785743713379, "global_step": 159664, "epoch": 3801} {"train_loss": -7.022615432739258, "global_step": 159665, "epoch": 3801} {"train_loss": -6.860874176025391, "global_step": 159666, "epoch": 3801} {"train_loss": -6.902438640594482, "global_step": 159667, "epoch": 3801} {"train_loss": -6.956342697143555, "global_step": 159668, "epoch": 3801} {"train_loss": -6.9677934646606445, "global_step": 159669, "epoch": 3801} {"train_loss": -6.872912406921387, "global_step": 159670, "epoch": 3801} {"train_loss": -6.856011867523193, "global_step": 159671, "epoch": 3801} {"train_loss": -6.962974548339844, "global_step": 159672, "epoch": 3801} {"train_loss": -6.887208938598633, "global_step": 159673, "epoch": 3801} {"train_loss": -6.855447769165039, "global_step": 159674, "epoch": 3801} {"train_loss": -6.9841227531433105, "global_step": 159675, "epoch": 3801} {"train_loss": -6.742121696472168, "global_step": 159676, "epoch": 3801} {"train_loss": -6.918682098388672, "global_step": 159677, "epoch": 3801} {"train_loss": -6.915829658508301, "global_step": 159678, "epoch": 3801} {"train_loss": -6.894000053405762, "global_step": 159679, "epoch": 3801} {"train_loss": -6.809545516967773, "global_step": 159680, "epoch": 3801} {"train_loss": -6.955451488494873, "global_step": 159681, "epoch": 3801} {"train_loss": -6.938955783843994, "global_step": 159682, "epoch": 3801} {"train_loss": -6.923951909655616, "global_step": 159683, "epoch": 3801, "val_loss": 68613.0625} {"train_loss": -6.879108428955078, "global_step": 159684, "epoch": 3802} {"train_loss": -6.918379783630371, "global_step": 159685, "epoch": 3802} {"train_loss": -7.001727104187012, "global_step": 159686, "epoch": 3802} {"train_loss": -6.766378402709961, "global_step": 159687, "epoch": 3802} {"train_loss": -6.982170104980469, "global_step": 159688, "epoch": 3802} {"train_loss": -7.000027656555176, "global_step": 159689, "epoch": 3802} {"train_loss": -6.8304853439331055, "global_step": 159690, "epoch": 3802} {"train_loss": -6.990947723388672, "global_step": 159691, "epoch": 3802} {"train_loss": -6.980871200561523, "global_step": 159692, "epoch": 3802} {"train_loss": -6.965757369995117, "global_step": 159693, "epoch": 3802} {"train_loss": -6.992718696594238, "global_step": 159694, "epoch": 3802} {"train_loss": -6.997403144836426, "global_step": 159695, "epoch": 3802} {"train_loss": -6.901744842529297, "global_step": 159696, "epoch": 3802} {"train_loss": -6.957723140716553, "global_step": 159697, "epoch": 3802} {"train_loss": -7.006195545196533, "global_step": 159698, "epoch": 3802} {"train_loss": -6.960928916931152, "global_step": 159699, "epoch": 3802} {"train_loss": -6.984060764312744, "global_step": 159700, "epoch": 3802} {"train_loss": -6.797922134399414, "global_step": 159701, "epoch": 3802} {"train_loss": -6.93368673324585, "global_step": 159702, "epoch": 3802} {"train_loss": -6.952897071838379, "global_step": 159703, "epoch": 3802} {"train_loss": -6.950357913970947, "global_step": 159704, "epoch": 3802} {"train_loss": -6.7522053718566895, "global_step": 159705, "epoch": 3802} {"train_loss": -6.870166301727295, "global_step": 159706, "epoch": 3802} {"train_loss": -6.956143379211426, "global_step": 159707, "epoch": 3802} {"train_loss": -6.912208557128906, "global_step": 159708, "epoch": 3802} {"train_loss": -7.057512283325195, "global_step": 159709, "epoch": 3802} {"train_loss": -6.818432807922363, "global_step": 159710, "epoch": 3802} {"train_loss": -7.025874137878418, "global_step": 159711, "epoch": 3802} {"train_loss": -6.874067306518555, "global_step": 159712, "epoch": 3802} {"train_loss": -6.983245849609375, "global_step": 159713, "epoch": 3802} {"train_loss": -6.991993427276611, "global_step": 159714, "epoch": 3802} {"train_loss": -6.916416645050049, "global_step": 159715, "epoch": 3802} {"train_loss": -6.9951653480529785, "global_step": 159716, "epoch": 3802} {"train_loss": -6.821452617645264, "global_step": 159717, "epoch": 3802} {"train_loss": -7.027062892913818, "global_step": 159718, "epoch": 3802} {"train_loss": -6.945907115936279, "global_step": 159719, "epoch": 3802} {"train_loss": -7.00982666015625, "global_step": 159720, "epoch": 3802} {"train_loss": -6.967641830444336, "global_step": 159721, "epoch": 3802} {"train_loss": -6.847046852111816, "global_step": 159722, "epoch": 3802} {"train_loss": -6.983861446380615, "global_step": 159723, "epoch": 3802} {"train_loss": -6.9132513999938965, "global_step": 159724, "epoch": 3802} {"train_loss": -6.9366500718253, "global_step": 159725, "epoch": 3802, "val_loss": 68394.421875} {"train_loss": -6.88613748550415, "global_step": 159726, "epoch": 3803} {"train_loss": -6.967802047729492, "global_step": 159727, "epoch": 3803} {"train_loss": -6.966544151306152, "global_step": 159728, "epoch": 3803} {"train_loss": -6.943948745727539, "global_step": 159729, "epoch": 3803} {"train_loss": -6.969932556152344, "global_step": 159730, "epoch": 3803} {"train_loss": -6.945121765136719, "global_step": 159731, "epoch": 3803} {"train_loss": -6.925084114074707, "global_step": 159732, "epoch": 3803} {"train_loss": -7.022839546203613, "global_step": 159733, "epoch": 3803} {"train_loss": -7.041839599609375, "global_step": 159734, "epoch": 3803} {"train_loss": -6.976351737976074, "global_step": 159735, "epoch": 3803} {"train_loss": -7.046433925628662, "global_step": 159736, "epoch": 3803} {"train_loss": -6.955801963806152, "global_step": 159737, "epoch": 3803} {"train_loss": -6.988007068634033, "global_step": 159738, "epoch": 3803} {"train_loss": -7.013540267944336, "global_step": 159739, "epoch": 3803} {"train_loss": -7.017576217651367, "global_step": 159740, "epoch": 3803} {"train_loss": -6.862321853637695, "global_step": 159741, "epoch": 3803} {"train_loss": -6.973774433135986, "global_step": 159742, "epoch": 3803} {"train_loss": -6.953973770141602, "global_step": 159743, "epoch": 3803} {"train_loss": -6.983384609222412, "global_step": 159744, "epoch": 3803} {"train_loss": -6.994279861450195, "global_step": 159745, "epoch": 3803} {"train_loss": -7.040668487548828, "global_step": 159746, "epoch": 3803} {"train_loss": -7.071173667907715, "global_step": 159747, "epoch": 3803} {"train_loss": -6.965152263641357, "global_step": 159748, "epoch": 3803} {"train_loss": -6.9698920249938965, "global_step": 159749, "epoch": 3803} {"train_loss": -6.850986480712891, "global_step": 159750, "epoch": 3803} {"train_loss": -6.99554443359375, "global_step": 159751, "epoch": 3803} {"train_loss": -7.070493221282959, "global_step": 159752, "epoch": 3803} {"train_loss": -6.9706621170043945, "global_step": 159753, "epoch": 3803} {"train_loss": -6.9440107345581055, "global_step": 159754, "epoch": 3803} {"train_loss": -7.050425052642822, "global_step": 159755, "epoch": 3803} {"train_loss": -6.878026008605957, "global_step": 159756, "epoch": 3803} {"train_loss": -7.042176246643066, "global_step": 159757, "epoch": 3803} {"train_loss": -6.95628547668457, "global_step": 159758, "epoch": 3803} {"train_loss": -6.902092933654785, "global_step": 159759, "epoch": 3803} {"train_loss": -6.892638206481934, "global_step": 159760, "epoch": 3803} {"train_loss": -6.902165412902832, "global_step": 159761, "epoch": 3803} {"train_loss": -6.953040599822998, "global_step": 159762, "epoch": 3803} {"train_loss": -6.826004981994629, "global_step": 159763, "epoch": 3803} {"train_loss": -6.9582624435424805, "global_step": 159764, "epoch": 3803} {"train_loss": -7.007370948791504, "global_step": 159765, "epoch": 3803} {"train_loss": -6.929277420043945, "global_step": 159766, "epoch": 3803} {"train_loss": -6.964714527130127, "global_step": 159767, "epoch": 3803, "val_loss": 68447.6796875} {"train_loss": -6.972500801086426, "global_step": 159768, "epoch": 3804} {"train_loss": -6.992630958557129, "global_step": 159769, "epoch": 3804} {"train_loss": -6.9647297859191895, "global_step": 159770, "epoch": 3804} {"train_loss": -6.956306457519531, "global_step": 159771, "epoch": 3804} {"train_loss": -6.957268238067627, "global_step": 159772, "epoch": 3804} {"train_loss": -6.948908805847168, "global_step": 159773, "epoch": 3804} {"train_loss": -6.986090183258057, "global_step": 159774, "epoch": 3804} {"train_loss": -6.920378684997559, "global_step": 159775, "epoch": 3804} {"train_loss": -7.053006172180176, "global_step": 159776, "epoch": 3804} {"train_loss": -7.124410152435303, "global_step": 159777, "epoch": 3804} {"train_loss": -6.980250358581543, "global_step": 159778, "epoch": 3804} {"train_loss": -6.996794700622559, "global_step": 159779, "epoch": 3804} {"train_loss": -6.827958106994629, "global_step": 159780, "epoch": 3804} {"train_loss": -6.92752742767334, "global_step": 159781, "epoch": 3804} {"train_loss": -7.0482048988342285, "global_step": 159782, "epoch": 3804} {"train_loss": -6.855742454528809, "global_step": 159783, "epoch": 3804} {"train_loss": -6.9517502784729, "global_step": 159784, "epoch": 3804} {"train_loss": -6.934609889984131, "global_step": 159785, "epoch": 3804} {"train_loss": -6.891623020172119, "global_step": 159786, "epoch": 3804} {"train_loss": -6.880261421203613, "global_step": 159787, "epoch": 3804} {"train_loss": -7.002692699432373, "global_step": 159788, "epoch": 3804} {"train_loss": -6.955351829528809, "global_step": 159789, "epoch": 3804} {"train_loss": -6.882782936096191, "global_step": 159790, "epoch": 3804} {"train_loss": -6.930173873901367, "global_step": 159791, "epoch": 3804} {"train_loss": -6.942497253417969, "global_step": 159792, "epoch": 3804} {"train_loss": -6.833619117736816, "global_step": 159793, "epoch": 3804} {"train_loss": -6.956606864929199, "global_step": 159794, "epoch": 3804} {"train_loss": -6.975101947784424, "global_step": 159795, "epoch": 3804} {"train_loss": -6.8958048820495605, "global_step": 159796, "epoch": 3804} {"train_loss": -6.77616024017334, "global_step": 159797, "epoch": 3804} {"train_loss": -6.798714637756348, "global_step": 159798, "epoch": 3804} {"train_loss": -6.856281280517578, "global_step": 159799, "epoch": 3804} {"train_loss": -6.847024917602539, "global_step": 159800, "epoch": 3804} {"train_loss": -6.878769874572754, "global_step": 159801, "epoch": 3804} {"train_loss": -6.890789985656738, "global_step": 159802, "epoch": 3804} {"train_loss": -6.910538673400879, "global_step": 159803, "epoch": 3804} {"train_loss": -6.98846435546875, "global_step": 159804, "epoch": 3804} {"train_loss": -6.849468231201172, "global_step": 159805, "epoch": 3804} {"train_loss": -6.901246547698975, "global_step": 159806, "epoch": 3804} {"train_loss": -6.837944030761719, "global_step": 159807, "epoch": 3804} {"train_loss": -6.952580451965332, "global_step": 159808, "epoch": 3804} {"train_loss": -6.922849166960943, "global_step": 159809, "epoch": 3804, "val_loss": 68525.8671875} {"train_loss": -6.911705017089844, "global_step": 159810, "epoch": 3805} {"train_loss": -6.913388252258301, "global_step": 159811, "epoch": 3805} {"train_loss": -6.813257217407227, "global_step": 159812, "epoch": 3805} {"train_loss": -6.877100944519043, "global_step": 159813, "epoch": 3805} {"train_loss": -6.847616672515869, "global_step": 159814, "epoch": 3805} {"train_loss": -6.834575653076172, "global_step": 159815, "epoch": 3805} {"train_loss": -6.868729591369629, "global_step": 159816, "epoch": 3805} {"train_loss": -6.787789344787598, "global_step": 159817, "epoch": 3805} {"train_loss": -6.949550628662109, "global_step": 159818, "epoch": 3805} {"train_loss": -6.76295280456543, "global_step": 159819, "epoch": 3805} {"train_loss": -6.869104862213135, "global_step": 159820, "epoch": 3805} {"train_loss": -6.8457159996032715, "global_step": 159821, "epoch": 3805} {"train_loss": -6.98362922668457, "global_step": 159822, "epoch": 3805} {"train_loss": -6.877072334289551, "global_step": 159823, "epoch": 3805} {"train_loss": -6.9441142082214355, "global_step": 159824, "epoch": 3805} {"train_loss": -6.942537784576416, "global_step": 159825, "epoch": 3805} {"train_loss": -6.8777995109558105, "global_step": 159826, "epoch": 3805} {"train_loss": -6.88658332824707, "global_step": 159827, "epoch": 3805} {"train_loss": -6.962632179260254, "global_step": 159828, "epoch": 3805} {"train_loss": -6.8322649002075195, "global_step": 159829, "epoch": 3805} {"train_loss": -6.971598148345947, "global_step": 159830, "epoch": 3805} {"train_loss": -6.9842753410339355, "global_step": 159831, "epoch": 3805} {"train_loss": -7.070406436920166, "global_step": 159832, "epoch": 3805} {"train_loss": -6.9512224197387695, "global_step": 159833, "epoch": 3805} {"train_loss": -6.99365234375, "global_step": 159834, "epoch": 3805} {"train_loss": -7.093422889709473, "global_step": 159835, "epoch": 3805} {"train_loss": -7.107239723205566, "global_step": 159836, "epoch": 3805} {"train_loss": -6.966900825500488, "global_step": 159837, "epoch": 3805} {"train_loss": -6.945346832275391, "global_step": 159838, "epoch": 3805} {"train_loss": -6.950446605682373, "global_step": 159839, "epoch": 3805} {"train_loss": -6.918137550354004, "global_step": 159840, "epoch": 3805} {"train_loss": -6.93815803527832, "global_step": 159841, "epoch": 3805} {"train_loss": -7.0178117752075195, "global_step": 159842, "epoch": 3805} {"train_loss": -7.02407169342041, "global_step": 159843, "epoch": 3805} {"train_loss": -7.004200458526611, "global_step": 159844, "epoch": 3805} {"train_loss": -6.801455020904541, "global_step": 159845, "epoch": 3805} {"train_loss": -6.832523345947266, "global_step": 159846, "epoch": 3805} {"train_loss": -6.998203277587891, "global_step": 159847, "epoch": 3805} {"train_loss": -6.880878448486328, "global_step": 159848, "epoch": 3805} {"train_loss": -6.827342987060547, "global_step": 159849, "epoch": 3805} {"train_loss": -7.019557476043701, "global_step": 159850, "epoch": 3805} {"train_loss": -6.919219505219233, "global_step": 159851, "epoch": 3805, "val_loss": 68429.109375} {"train_loss": -6.961807727813721, "global_step": 159852, "epoch": 3806} {"train_loss": -6.918697357177734, "global_step": 159853, "epoch": 3806} {"train_loss": -6.806038856506348, "global_step": 159854, "epoch": 3806} {"train_loss": -6.946762561798096, "global_step": 159855, "epoch": 3806} {"train_loss": -6.8460917472839355, "global_step": 159856, "epoch": 3806} {"train_loss": -6.960007190704346, "global_step": 159857, "epoch": 3806} {"train_loss": -6.88408899307251, "global_step": 159858, "epoch": 3806} {"train_loss": -6.890941619873047, "global_step": 159859, "epoch": 3806} {"train_loss": -6.874255180358887, "global_step": 159860, "epoch": 3806} {"train_loss": -6.923924922943115, "global_step": 159861, "epoch": 3806} {"train_loss": -6.842694282531738, "global_step": 159862, "epoch": 3806} {"train_loss": -6.907644271850586, "global_step": 159863, "epoch": 3806} {"train_loss": -6.793546676635742, "global_step": 159864, "epoch": 3806} {"train_loss": -6.808882236480713, "global_step": 159865, "epoch": 3806} {"train_loss": -6.871547698974609, "global_step": 159866, "epoch": 3806} {"train_loss": -6.8553080558776855, "global_step": 159867, "epoch": 3806} {"train_loss": -6.929670333862305, "global_step": 159868, "epoch": 3806} {"train_loss": -6.82952880859375, "global_step": 159869, "epoch": 3806} {"train_loss": -7.01131534576416, "global_step": 159870, "epoch": 3806} {"train_loss": -6.818717956542969, "global_step": 159871, "epoch": 3806} {"train_loss": -6.877973556518555, "global_step": 159872, "epoch": 3806} {"train_loss": -6.714699745178223, "global_step": 159873, "epoch": 3806} {"train_loss": -6.838772773742676, "global_step": 159874, "epoch": 3806} {"train_loss": -6.902880668640137, "global_step": 159875, "epoch": 3806} {"train_loss": -6.64211368560791, "global_step": 159876, "epoch": 3806} {"train_loss": -6.948276996612549, "global_step": 159877, "epoch": 3806} {"train_loss": -6.723265647888184, "global_step": 159878, "epoch": 3806} {"train_loss": -6.871461868286133, "global_step": 159879, "epoch": 3806} {"train_loss": -6.805548191070557, "global_step": 159880, "epoch": 3806} {"train_loss": -6.856940746307373, "global_step": 159881, "epoch": 3806} {"train_loss": -6.942011833190918, "global_step": 159882, "epoch": 3806} {"train_loss": -6.950599193572998, "global_step": 159883, "epoch": 3806} {"train_loss": -6.957493782043457, "global_step": 159884, "epoch": 3806} {"train_loss": -6.858550071716309, "global_step": 159885, "epoch": 3806} {"train_loss": -6.915053367614746, "global_step": 159886, "epoch": 3806} {"train_loss": -6.833232402801514, "global_step": 159887, "epoch": 3806} {"train_loss": -6.894059181213379, "global_step": 159888, "epoch": 3806} {"train_loss": -6.934610366821289, "global_step": 159889, "epoch": 3806} {"train_loss": -6.97713041305542, "global_step": 159890, "epoch": 3806} {"train_loss": -7.019865036010742, "global_step": 159891, "epoch": 3806} {"train_loss": -6.9177045822143555, "global_step": 159892, "epoch": 3806} {"train_loss": -6.881834552401588, "global_step": 159893, "epoch": 3806, "val_loss": 68440.0390625} {"train_loss": -6.977435111999512, "global_step": 159894, "epoch": 3807} {"train_loss": -7.026880741119385, "global_step": 159895, "epoch": 3807} {"train_loss": -6.8966169357299805, "global_step": 159896, "epoch": 3807} {"train_loss": -6.86675500869751, "global_step": 159897, "epoch": 3807} {"train_loss": -6.9636688232421875, "global_step": 159898, "epoch": 3807} {"train_loss": -6.959527969360352, "global_step": 159899, "epoch": 3807} {"train_loss": -6.873119354248047, "global_step": 159900, "epoch": 3807} {"train_loss": -6.946194648742676, "global_step": 159901, "epoch": 3807} {"train_loss": -7.019098281860352, "global_step": 159902, "epoch": 3807} {"train_loss": -7.018047332763672, "global_step": 159903, "epoch": 3807} {"train_loss": -6.990821838378906, "global_step": 159904, "epoch": 3807} {"train_loss": -6.8507609367370605, "global_step": 159905, "epoch": 3807} {"train_loss": -6.965592384338379, "global_step": 159906, "epoch": 3807} {"train_loss": -6.809183597564697, "global_step": 159907, "epoch": 3807} {"train_loss": -6.7759175300598145, "global_step": 159908, "epoch": 3807} {"train_loss": -6.899531364440918, "global_step": 159909, "epoch": 3807} {"train_loss": -6.893147945404053, "global_step": 159910, "epoch": 3807} {"train_loss": -6.746635437011719, "global_step": 159911, "epoch": 3807} {"train_loss": -6.917279243469238, "global_step": 159912, "epoch": 3807} {"train_loss": -6.8173017501831055, "global_step": 159913, "epoch": 3807} {"train_loss": -6.897229194641113, "global_step": 159914, "epoch": 3807} {"train_loss": -6.967323303222656, "global_step": 159915, "epoch": 3807} {"train_loss": -6.709500312805176, "global_step": 159916, "epoch": 3807} {"train_loss": -6.971778869628906, "global_step": 159917, "epoch": 3807} {"train_loss": -6.759189605712891, "global_step": 159918, "epoch": 3807} {"train_loss": -6.902590751647949, "global_step": 159919, "epoch": 3807} {"train_loss": -6.733210563659668, "global_step": 159920, "epoch": 3807} {"train_loss": -6.950689315795898, "global_step": 159921, "epoch": 3807} {"train_loss": -6.866537094116211, "global_step": 159922, "epoch": 3807} {"train_loss": -6.747930526733398, "global_step": 159923, "epoch": 3807} {"train_loss": -6.875792503356934, "global_step": 159924, "epoch": 3807} {"train_loss": -6.752190589904785, "global_step": 159925, "epoch": 3807} {"train_loss": -6.895205020904541, "global_step": 159926, "epoch": 3807} {"train_loss": -6.842303276062012, "global_step": 159927, "epoch": 3807} {"train_loss": -6.835673809051514, "global_step": 159928, "epoch": 3807} {"train_loss": -6.912820339202881, "global_step": 159929, "epoch": 3807} {"train_loss": -7.0150299072265625, "global_step": 159930, "epoch": 3807} {"train_loss": -6.851984024047852, "global_step": 159931, "epoch": 3807} {"train_loss": -7.044535160064697, "global_step": 159932, "epoch": 3807} {"train_loss": -6.849697113037109, "global_step": 159933, "epoch": 3807} {"train_loss": -6.8503594398498535, "global_step": 159934, "epoch": 3807} {"train_loss": -6.888373953955514, "global_step": 159935, "epoch": 3807, "val_loss": 68397.7734375} {"train_loss": -6.9632463455200195, "global_step": 159936, "epoch": 3808} {"train_loss": -6.912028789520264, "global_step": 159937, "epoch": 3808} {"train_loss": -6.908950328826904, "global_step": 159938, "epoch": 3808} {"train_loss": -6.963956832885742, "global_step": 159939, "epoch": 3808} {"train_loss": -7.059104919433594, "global_step": 159940, "epoch": 3808} {"train_loss": -7.0376081466674805, "global_step": 159941, "epoch": 3808} {"train_loss": -6.930209159851074, "global_step": 159942, "epoch": 3808} {"train_loss": -6.932456970214844, "global_step": 159943, "epoch": 3808} {"train_loss": -6.9286651611328125, "global_step": 159944, "epoch": 3808} {"train_loss": -6.928099632263184, "global_step": 159945, "epoch": 3808} {"train_loss": -6.920427322387695, "global_step": 159946, "epoch": 3808} {"train_loss": -6.928157806396484, "global_step": 159947, "epoch": 3808} {"train_loss": -6.896904468536377, "global_step": 159948, "epoch": 3808} {"train_loss": -6.967482566833496, "global_step": 159949, "epoch": 3808} {"train_loss": -6.740264892578125, "global_step": 159950, "epoch": 3808} {"train_loss": -6.97208309173584, "global_step": 159951, "epoch": 3808} {"train_loss": -6.990908622741699, "global_step": 159952, "epoch": 3808} {"train_loss": -7.013383865356445, "global_step": 159953, "epoch": 3808} {"train_loss": -6.839208602905273, "global_step": 159954, "epoch": 3808} {"train_loss": -6.902379989624023, "global_step": 159955, "epoch": 3808} {"train_loss": -6.8576507568359375, "global_step": 159956, "epoch": 3808} {"train_loss": -6.814953327178955, "global_step": 159957, "epoch": 3808} {"train_loss": -6.956734657287598, "global_step": 159958, "epoch": 3808} {"train_loss": -6.858352184295654, "global_step": 159959, "epoch": 3808} {"train_loss": -7.012739181518555, "global_step": 159960, "epoch": 3808} {"train_loss": -6.773233890533447, "global_step": 159961, "epoch": 3808} {"train_loss": -6.90975284576416, "global_step": 159962, "epoch": 3808} {"train_loss": -6.9365129470825195, "global_step": 159963, "epoch": 3808} {"train_loss": -6.938467979431152, "global_step": 159964, "epoch": 3808} {"train_loss": -6.980521202087402, "global_step": 159965, "epoch": 3808} {"train_loss": -6.869011878967285, "global_step": 159966, "epoch": 3808} {"train_loss": -7.013226509094238, "global_step": 159967, "epoch": 3808} {"train_loss": -7.02861213684082, "global_step": 159968, "epoch": 3808} {"train_loss": -6.879783630371094, "global_step": 159969, "epoch": 3808} {"train_loss": -6.928864479064941, "global_step": 159970, "epoch": 3808} {"train_loss": -6.937367916107178, "global_step": 159971, "epoch": 3808} {"train_loss": -6.847142696380615, "global_step": 159972, "epoch": 3808} {"train_loss": -6.941700458526611, "global_step": 159973, "epoch": 3808} {"train_loss": -6.827602386474609, "global_step": 159974, "epoch": 3808} {"train_loss": -6.898714065551758, "global_step": 159975, "epoch": 3808} {"train_loss": -6.945042610168457, "global_step": 159976, "epoch": 3808} {"train_loss": -6.92067950112479, "global_step": 159977, "epoch": 3808, "val_loss": 68526.9609375} {"train_loss": -6.885855674743652, "global_step": 159978, "epoch": 3809} {"train_loss": -6.959863185882568, "global_step": 159979, "epoch": 3809} {"train_loss": -6.7168684005737305, "global_step": 159980, "epoch": 3809} {"train_loss": -7.001481056213379, "global_step": 159981, "epoch": 3809} {"train_loss": -6.921289443969727, "global_step": 159982, "epoch": 3809} {"train_loss": -7.094310283660889, "global_step": 159983, "epoch": 3809} {"train_loss": -6.8764262199401855, "global_step": 159984, "epoch": 3809} {"train_loss": -7.004910469055176, "global_step": 159985, "epoch": 3809} {"train_loss": -6.866368770599365, "global_step": 159986, "epoch": 3809} {"train_loss": -6.93646764755249, "global_step": 159987, "epoch": 3809} {"train_loss": -6.989238739013672, "global_step": 159988, "epoch": 3809} {"train_loss": -6.935515403747559, "global_step": 159989, "epoch": 3809} {"train_loss": -6.760750770568848, "global_step": 159990, "epoch": 3809} {"train_loss": -6.915464401245117, "global_step": 159991, "epoch": 3809} {"train_loss": -6.7587127685546875, "global_step": 159992, "epoch": 3809} {"train_loss": -7.033930778503418, "global_step": 159993, "epoch": 3809} {"train_loss": -6.824346542358398, "global_step": 159994, "epoch": 3809} {"train_loss": -6.900254249572754, "global_step": 159995, "epoch": 3809} {"train_loss": -7.0375213623046875, "global_step": 159996, "epoch": 3809} {"train_loss": -6.9084625244140625, "global_step": 159997, "epoch": 3809} {"train_loss": -6.976649284362793, "global_step": 159998, "epoch": 3809} {"train_loss": -7.011274337768555, "global_step": 159999, "epoch": 3809} {"train_loss": -6.997377395629883, "global_step": 160000, "epoch": 3809} {"train_loss": -6.938480854034424, "global_step": 160001, "epoch": 3809} {"train_loss": -6.963616371154785, "global_step": 160002, "epoch": 3809} {"train_loss": -6.797547817230225, "global_step": 160003, "epoch": 3809} {"train_loss": -6.995905876159668, "global_step": 160004, "epoch": 3809} {"train_loss": -6.827202796936035, "global_step": 160005, "epoch": 3809} {"train_loss": -6.981750011444092, "global_step": 160006, "epoch": 3809} {"train_loss": -6.969703674316406, "global_step": 160007, "epoch": 3809} {"train_loss": -6.795350074768066, "global_step": 160008, "epoch": 3809} {"train_loss": -6.921834945678711, "global_step": 160009, "epoch": 3809} {"train_loss": -6.8526153564453125, "global_step": 160010, "epoch": 3809} {"train_loss": -6.884496688842773, "global_step": 160011, "epoch": 3809} {"train_loss": -7.003966331481934, "global_step": 160012, "epoch": 3809} {"train_loss": -6.824235916137695, "global_step": 160013, "epoch": 3809} {"train_loss": -6.7871503829956055, "global_step": 160014, "epoch": 3809} {"train_loss": -6.904926300048828, "global_step": 160015, "epoch": 3809} {"train_loss": -6.840291500091553, "global_step": 160016, "epoch": 3809} {"train_loss": -6.892658233642578, "global_step": 160017, "epoch": 3809} {"train_loss": -6.872452735900879, "global_step": 160018, "epoch": 3809} {"train_loss": -6.909863982881818, "global_step": 160019, "epoch": 3809, "val_loss": 68641.484375} {"train_loss": -6.925576210021973, "global_step": 160020, "epoch": 3810} {"train_loss": -6.927366256713867, "global_step": 160021, "epoch": 3810} {"train_loss": -6.918088912963867, "global_step": 160022, "epoch": 3810} {"train_loss": -6.99911642074585, "global_step": 160023, "epoch": 3810} {"train_loss": -6.976415634155273, "global_step": 160024, "epoch": 3810} {"train_loss": -6.8892107009887695, "global_step": 160025, "epoch": 3810} {"train_loss": -6.953174591064453, "global_step": 160026, "epoch": 3810} {"train_loss": -6.9499311447143555, "global_step": 160027, "epoch": 3810} {"train_loss": -6.982673645019531, "global_step": 160028, "epoch": 3810} {"train_loss": -6.999123573303223, "global_step": 160029, "epoch": 3810} {"train_loss": -6.824648857116699, "global_step": 160030, "epoch": 3810} {"train_loss": -6.9197096824646, "global_step": 160031, "epoch": 3810} {"train_loss": -6.966501235961914, "global_step": 160032, "epoch": 3810} {"train_loss": -6.937640190124512, "global_step": 160033, "epoch": 3810} {"train_loss": -6.916994094848633, "global_step": 160034, "epoch": 3810} {"train_loss": -6.8884735107421875, "global_step": 160035, "epoch": 3810} {"train_loss": -6.987638473510742, "global_step": 160036, "epoch": 3810} {"train_loss": -7.058994293212891, "global_step": 160037, "epoch": 3810} {"train_loss": -7.0214738845825195, "global_step": 160038, "epoch": 3810} {"train_loss": -7.028431415557861, "global_step": 160039, "epoch": 3810} {"train_loss": -7.042607307434082, "global_step": 160040, "epoch": 3810} {"train_loss": -7.023516654968262, "global_step": 160041, "epoch": 3810} {"train_loss": -7.00346565246582, "global_step": 160042, "epoch": 3810} {"train_loss": -7.027541160583496, "global_step": 160043, "epoch": 3810} {"train_loss": -7.0329461097717285, "global_step": 160044, "epoch": 3810} {"train_loss": -6.98225736618042, "global_step": 160045, "epoch": 3810} {"train_loss": -7.004061222076416, "global_step": 160046, "epoch": 3810} {"train_loss": -7.002349376678467, "global_step": 160047, "epoch": 3810} {"train_loss": -7.153042793273926, "global_step": 160048, "epoch": 3810} {"train_loss": -7.019540309906006, "global_step": 160049, "epoch": 3810} {"train_loss": -6.927326202392578, "global_step": 160050, "epoch": 3810} {"train_loss": -7.083664417266846, "global_step": 160051, "epoch": 3810} {"train_loss": -6.94078254699707, "global_step": 160052, "epoch": 3810} {"train_loss": -6.9278106689453125, "global_step": 160053, "epoch": 3810} {"train_loss": -6.975934028625488, "global_step": 160054, "epoch": 3810} {"train_loss": -6.93785285949707, "global_step": 160055, "epoch": 3810} {"train_loss": -6.895439624786377, "global_step": 160056, "epoch": 3810} {"train_loss": -7.058440208435059, "global_step": 160057, "epoch": 3810} {"train_loss": -7.049142360687256, "global_step": 160058, "epoch": 3810} {"train_loss": -7.049521446228027, "global_step": 160059, "epoch": 3810} {"train_loss": -7.009374618530273, "global_step": 160060, "epoch": 3810} {"train_loss": -6.978674298241025, "global_step": 160061, "epoch": 3810, "val_loss": 68520.4453125} {"train_loss": -6.95990514755249, "global_step": 160062, "epoch": 3811} {"train_loss": -7.019799709320068, "global_step": 160063, "epoch": 3811} {"train_loss": -6.92781925201416, "global_step": 160064, "epoch": 3811} {"train_loss": -7.079558849334717, "global_step": 160065, "epoch": 3811} {"train_loss": -6.967480659484863, "global_step": 160066, "epoch": 3811} {"train_loss": -7.018561840057373, "global_step": 160067, "epoch": 3811} {"train_loss": -6.926364898681641, "global_step": 160068, "epoch": 3811} {"train_loss": -6.892782211303711, "global_step": 160069, "epoch": 3811} {"train_loss": -7.057720184326172, "global_step": 160070, "epoch": 3811} {"train_loss": -7.003121376037598, "global_step": 160071, "epoch": 3811} {"train_loss": -6.91142463684082, "global_step": 160072, "epoch": 3811} {"train_loss": -7.021603107452393, "global_step": 160073, "epoch": 3811} {"train_loss": -6.909954071044922, "global_step": 160074, "epoch": 3811} {"train_loss": -7.012287139892578, "global_step": 160075, "epoch": 3811} {"train_loss": -6.984160423278809, "global_step": 160076, "epoch": 3811} {"train_loss": -6.856165885925293, "global_step": 160077, "epoch": 3811} {"train_loss": -6.967495918273926, "global_step": 160078, "epoch": 3811} {"train_loss": -6.955202579498291, "global_step": 160079, "epoch": 3811} {"train_loss": -6.759596824645996, "global_step": 160080, "epoch": 3811} {"train_loss": -6.939660549163818, "global_step": 160081, "epoch": 3811} {"train_loss": -6.789322853088379, "global_step": 160082, "epoch": 3811} {"train_loss": -6.790681838989258, "global_step": 160083, "epoch": 3811} {"train_loss": -6.783754348754883, "global_step": 160084, "epoch": 3811} {"train_loss": -6.798397064208984, "global_step": 160085, "epoch": 3811} {"train_loss": -6.850166320800781, "global_step": 160086, "epoch": 3811} {"train_loss": -6.633308410644531, "global_step": 160087, "epoch": 3811} {"train_loss": -6.9566450119018555, "global_step": 160088, "epoch": 3811} {"train_loss": -6.764679908752441, "global_step": 160089, "epoch": 3811} {"train_loss": -6.781772613525391, "global_step": 160090, "epoch": 3811} {"train_loss": -6.856629371643066, "global_step": 160091, "epoch": 3811} {"train_loss": -6.83608865737915, "global_step": 160092, "epoch": 3811} {"train_loss": -6.7873854637146, "global_step": 160093, "epoch": 3811} {"train_loss": -6.733909606933594, "global_step": 160094, "epoch": 3811} {"train_loss": -6.879403591156006, "global_step": 160095, "epoch": 3811} {"train_loss": -6.837355613708496, "global_step": 160096, "epoch": 3811} {"train_loss": -6.845329284667969, "global_step": 160097, "epoch": 3811} {"train_loss": -6.844052314758301, "global_step": 160098, "epoch": 3811} {"train_loss": -6.9037322998046875, "global_step": 160099, "epoch": 3811} {"train_loss": -6.852519989013672, "global_step": 160100, "epoch": 3811} {"train_loss": -6.84200382232666, "global_step": 160101, "epoch": 3811} {"train_loss": -6.906830787658691, "global_step": 160102, "epoch": 3811} {"train_loss": -6.890049116952079, "global_step": 160103, "epoch": 3811, "val_loss": 68744.3984375} {"train_loss": -6.880688667297363, "global_step": 160104, "epoch": 3812} {"train_loss": -6.893574237823486, "global_step": 160105, "epoch": 3812} {"train_loss": -6.8955278396606445, "global_step": 160106, "epoch": 3812} {"train_loss": -6.913813591003418, "global_step": 160107, "epoch": 3812} {"train_loss": -6.96007776260376, "global_step": 160108, "epoch": 3812} {"train_loss": -6.956991195678711, "global_step": 160109, "epoch": 3812} {"train_loss": -6.959150791168213, "global_step": 160110, "epoch": 3812} {"train_loss": -6.944673538208008, "global_step": 160111, "epoch": 3812} {"train_loss": -7.018556594848633, "global_step": 160112, "epoch": 3812} {"train_loss": -6.94053316116333, "global_step": 160113, "epoch": 3812} {"train_loss": -7.007453441619873, "global_step": 160114, "epoch": 3812} {"train_loss": -6.904785633087158, "global_step": 160115, "epoch": 3812} {"train_loss": -6.9302520751953125, "global_step": 160116, "epoch": 3812} {"train_loss": -6.82243537902832, "global_step": 160117, "epoch": 3812} {"train_loss": -6.926536560058594, "global_step": 160118, "epoch": 3812} {"train_loss": -7.045224189758301, "global_step": 160119, "epoch": 3812} {"train_loss": -7.006049156188965, "global_step": 160120, "epoch": 3812} {"train_loss": -7.032278537750244, "global_step": 160121, "epoch": 3812} {"train_loss": -6.9921159744262695, "global_step": 160122, "epoch": 3812} {"train_loss": -7.035776138305664, "global_step": 160123, "epoch": 3812} {"train_loss": -7.030299186706543, "global_step": 160124, "epoch": 3812} {"train_loss": -7.02340030670166, "global_step": 160125, "epoch": 3812} {"train_loss": -7.048892974853516, "global_step": 160126, "epoch": 3812} {"train_loss": -7.044564247131348, "global_step": 160127, "epoch": 3812} {"train_loss": -7.016856670379639, "global_step": 160128, "epoch": 3812} {"train_loss": -6.951173305511475, "global_step": 160129, "epoch": 3812} {"train_loss": -7.004153251647949, "global_step": 160130, "epoch": 3812} {"train_loss": -6.935009002685547, "global_step": 160131, "epoch": 3812} {"train_loss": -6.98821496963501, "global_step": 160132, "epoch": 3812} {"train_loss": -6.917325973510742, "global_step": 160133, "epoch": 3812} {"train_loss": -7.102546691894531, "global_step": 160134, "epoch": 3812} {"train_loss": -6.848376274108887, "global_step": 160135, "epoch": 3812} {"train_loss": -6.903534889221191, "global_step": 160136, "epoch": 3812} {"train_loss": -6.905328750610352, "global_step": 160137, "epoch": 3812} {"train_loss": -6.849490165710449, "global_step": 160138, "epoch": 3812} {"train_loss": -6.900594711303711, "global_step": 160139, "epoch": 3812} {"train_loss": -6.894015789031982, "global_step": 160140, "epoch": 3812} {"train_loss": -7.047726631164551, "global_step": 160141, "epoch": 3812} {"train_loss": -6.876852989196777, "global_step": 160142, "epoch": 3812} {"train_loss": -6.919828414916992, "global_step": 160143, "epoch": 3812} {"train_loss": -6.965863227844238, "global_step": 160144, "epoch": 3812} {"train_loss": -6.956742014203753, "global_step": 160145, "epoch": 3812, "val_loss": 68623.4609375} {"train_loss": -7.036280155181885, "global_step": 160146, "epoch": 3813} {"train_loss": -7.0551252365112305, "global_step": 160147, "epoch": 3813} {"train_loss": -6.899448871612549, "global_step": 160148, "epoch": 3813} {"train_loss": -6.9222259521484375, "global_step": 160149, "epoch": 3813} {"train_loss": -6.9508514404296875, "global_step": 160150, "epoch": 3813} {"train_loss": -6.943586349487305, "global_step": 160151, "epoch": 3813} {"train_loss": -7.018614768981934, "global_step": 160152, "epoch": 3813} {"train_loss": -6.954239845275879, "global_step": 160153, "epoch": 3813} {"train_loss": -7.0684428215026855, "global_step": 160154, "epoch": 3813} {"train_loss": -6.968369007110596, "global_step": 160155, "epoch": 3813} {"train_loss": -6.946598052978516, "global_step": 160156, "epoch": 3813} {"train_loss": -6.978489398956299, "global_step": 160157, "epoch": 3813} {"train_loss": -6.980564594268799, "global_step": 160158, "epoch": 3813} {"train_loss": -7.043161392211914, "global_step": 160159, "epoch": 3813} {"train_loss": -6.941176414489746, "global_step": 160160, "epoch": 3813} {"train_loss": -7.061023712158203, "global_step": 160161, "epoch": 3813} {"train_loss": -6.951798439025879, "global_step": 160162, "epoch": 3813} {"train_loss": -7.000360488891602, "global_step": 160163, "epoch": 3813} {"train_loss": -7.005712985992432, "global_step": 160164, "epoch": 3813} {"train_loss": -6.985659122467041, "global_step": 160165, "epoch": 3813} {"train_loss": -7.086012840270996, "global_step": 160166, "epoch": 3813} {"train_loss": -6.949143886566162, "global_step": 160167, "epoch": 3813} {"train_loss": -6.9970703125, "global_step": 160168, "epoch": 3813} {"train_loss": -7.033710479736328, "global_step": 160169, "epoch": 3813} {"train_loss": -6.886641502380371, "global_step": 160170, "epoch": 3813} {"train_loss": -7.019272327423096, "global_step": 160171, "epoch": 3813} {"train_loss": -6.968523025512695, "global_step": 160172, "epoch": 3813} {"train_loss": -6.964023590087891, "global_step": 160173, "epoch": 3813} {"train_loss": -6.938830852508545, "global_step": 160174, "epoch": 3813} {"train_loss": -6.823727130889893, "global_step": 160175, "epoch": 3813} {"train_loss": -6.961938858032227, "global_step": 160176, "epoch": 3813} {"train_loss": -6.921686172485352, "global_step": 160177, "epoch": 3813} {"train_loss": -6.8685173988342285, "global_step": 160178, "epoch": 3813} {"train_loss": -7.092751502990723, "global_step": 160179, "epoch": 3813} {"train_loss": -6.974846839904785, "global_step": 160180, "epoch": 3813} {"train_loss": -6.998048782348633, "global_step": 160181, "epoch": 3813} {"train_loss": -7.010602951049805, "global_step": 160182, "epoch": 3813} {"train_loss": -7.044032096862793, "global_step": 160183, "epoch": 3813} {"train_loss": -7.0216779708862305, "global_step": 160184, "epoch": 3813} {"train_loss": -6.933957576751709, "global_step": 160185, "epoch": 3813} {"train_loss": -6.995925426483154, "global_step": 160186, "epoch": 3813} {"train_loss": -6.984738997050694, "global_step": 160187, "epoch": 3813, "val_loss": 68586.78125} {"train_loss": -6.9677228927612305, "global_step": 160188, "epoch": 3814} {"train_loss": -7.055054187774658, "global_step": 160189, "epoch": 3814} {"train_loss": -6.8867621421813965, "global_step": 160190, "epoch": 3814} {"train_loss": -6.912623405456543, "global_step": 160191, "epoch": 3814} {"train_loss": -6.947279453277588, "global_step": 160192, "epoch": 3814} {"train_loss": -6.98510217666626, "global_step": 160193, "epoch": 3814} {"train_loss": -7.009304046630859, "global_step": 160194, "epoch": 3814} {"train_loss": -6.918359756469727, "global_step": 160195, "epoch": 3814} {"train_loss": -6.945965766906738, "global_step": 160196, "epoch": 3814} {"train_loss": -6.985638618469238, "global_step": 160197, "epoch": 3814} {"train_loss": -7.012693405151367, "global_step": 160198, "epoch": 3814} {"train_loss": -7.1161394119262695, "global_step": 160199, "epoch": 3814} {"train_loss": -6.940638065338135, "global_step": 160200, "epoch": 3814} {"train_loss": -7.005834579467773, "global_step": 160201, "epoch": 3814} {"train_loss": -6.920768737792969, "global_step": 160202, "epoch": 3814} {"train_loss": -7.015656471252441, "global_step": 160203, "epoch": 3814} {"train_loss": -7.098813533782959, "global_step": 160204, "epoch": 3814} {"train_loss": -7.020125389099121, "global_step": 160205, "epoch": 3814} {"train_loss": -7.108572006225586, "global_step": 160206, "epoch": 3814} {"train_loss": -7.011650085449219, "global_step": 160207, "epoch": 3814} {"train_loss": -7.027068614959717, "global_step": 160208, "epoch": 3814} {"train_loss": -6.965639591217041, "global_step": 160209, "epoch": 3814} {"train_loss": -6.942969799041748, "global_step": 160210, "epoch": 3814} {"train_loss": -6.954234600067139, "global_step": 160211, "epoch": 3814} {"train_loss": -6.981797218322754, "global_step": 160212, "epoch": 3814} {"train_loss": -6.907797336578369, "global_step": 160213, "epoch": 3814} {"train_loss": -7.0121846199035645, "global_step": 160214, "epoch": 3814} {"train_loss": -6.921503067016602, "global_step": 160215, "epoch": 3814} {"train_loss": -6.983731269836426, "global_step": 160216, "epoch": 3814} {"train_loss": -6.906191349029541, "global_step": 160217, "epoch": 3814} {"train_loss": -6.973841667175293, "global_step": 160218, "epoch": 3814} {"train_loss": -6.8643341064453125, "global_step": 160219, "epoch": 3814} {"train_loss": -7.093676567077637, "global_step": 160220, "epoch": 3814} {"train_loss": -6.825352668762207, "global_step": 160221, "epoch": 3814} {"train_loss": -6.733832359313965, "global_step": 160222, "epoch": 3814} {"train_loss": -6.966625690460205, "global_step": 160223, "epoch": 3814} {"train_loss": -6.924764633178711, "global_step": 160224, "epoch": 3814} {"train_loss": -6.898674964904785, "global_step": 160225, "epoch": 3814} {"train_loss": -6.950214385986328, "global_step": 160226, "epoch": 3814} {"train_loss": -6.880867958068848, "global_step": 160227, "epoch": 3814} {"train_loss": -6.806058883666992, "global_step": 160228, "epoch": 3814} {"train_loss": -6.9589938549768355, "global_step": 160229, "epoch": 3814, "val_loss": 68546.671875} {"train_loss": -6.973852157592773, "global_step": 160230, "epoch": 3815} {"train_loss": -6.89627742767334, "global_step": 160231, "epoch": 3815} {"train_loss": -6.856914520263672, "global_step": 160232, "epoch": 3815} {"train_loss": -6.74357271194458, "global_step": 160233, "epoch": 3815} {"train_loss": -6.84283447265625, "global_step": 160234, "epoch": 3815} {"train_loss": -6.910151481628418, "global_step": 160235, "epoch": 3815} {"train_loss": -6.8785905838012695, "global_step": 160236, "epoch": 3815} {"train_loss": -6.832393169403076, "global_step": 160237, "epoch": 3815} {"train_loss": -6.933526039123535, "global_step": 160238, "epoch": 3815} {"train_loss": -6.78964900970459, "global_step": 160239, "epoch": 3815} {"train_loss": -6.832857131958008, "global_step": 160240, "epoch": 3815} {"train_loss": -6.950389862060547, "global_step": 160241, "epoch": 3815} {"train_loss": -6.8210368156433105, "global_step": 160242, "epoch": 3815} {"train_loss": -6.77562141418457, "global_step": 160243, "epoch": 3815} {"train_loss": -6.947999000549316, "global_step": 160244, "epoch": 3815} {"train_loss": -6.877777099609375, "global_step": 160245, "epoch": 3815} {"train_loss": -6.8238983154296875, "global_step": 160246, "epoch": 3815} {"train_loss": -6.9037065505981445, "global_step": 160247, "epoch": 3815} {"train_loss": -6.8296074867248535, "global_step": 160248, "epoch": 3815} {"train_loss": -6.996403694152832, "global_step": 160249, "epoch": 3815} {"train_loss": -6.905007362365723, "global_step": 160250, "epoch": 3815} {"train_loss": -6.958442687988281, "global_step": 160251, "epoch": 3815} {"train_loss": -6.911853790283203, "global_step": 160252, "epoch": 3815} {"train_loss": -6.848960876464844, "global_step": 160253, "epoch": 3815} {"train_loss": -6.789423942565918, "global_step": 160254, "epoch": 3815} {"train_loss": -6.899428844451904, "global_step": 160255, "epoch": 3815} {"train_loss": -6.955861568450928, "global_step": 160256, "epoch": 3815} {"train_loss": -6.941655158996582, "global_step": 160257, "epoch": 3815} {"train_loss": -6.857097625732422, "global_step": 160258, "epoch": 3815} {"train_loss": -6.96864128112793, "global_step": 160259, "epoch": 3815} {"train_loss": -6.866449356079102, "global_step": 160260, "epoch": 3815} {"train_loss": -6.8870086669921875, "global_step": 160261, "epoch": 3815} {"train_loss": -6.964177131652832, "global_step": 160262, "epoch": 3815} {"train_loss": -6.973090171813965, "global_step": 160263, "epoch": 3815} {"train_loss": -7.005291938781738, "global_step": 160264, "epoch": 3815} {"train_loss": -6.958530426025391, "global_step": 160265, "epoch": 3815} {"train_loss": -6.869485855102539, "global_step": 160266, "epoch": 3815} {"train_loss": -6.897734642028809, "global_step": 160267, "epoch": 3815} {"train_loss": -6.744096755981445, "global_step": 160268, "epoch": 3815} {"train_loss": -6.983964920043945, "global_step": 160269, "epoch": 3815} {"train_loss": -6.848209857940674, "global_step": 160270, "epoch": 3815} {"train_loss": -6.8870054086049395, "global_step": 160271, "epoch": 3815, "val_loss": 68714.5859375} {"train_loss": -6.891141891479492, "global_step": 160272, "epoch": 3816} {"train_loss": -6.938375473022461, "global_step": 160273, "epoch": 3816} {"train_loss": -6.92540168762207, "global_step": 160274, "epoch": 3816} {"train_loss": -6.883197784423828, "global_step": 160275, "epoch": 3816} {"train_loss": -6.939489364624023, "global_step": 160276, "epoch": 3816} {"train_loss": -6.947526931762695, "global_step": 160277, "epoch": 3816} {"train_loss": -6.924724578857422, "global_step": 160278, "epoch": 3816} {"train_loss": -6.89649772644043, "global_step": 160279, "epoch": 3816} {"train_loss": -6.780850410461426, "global_step": 160280, "epoch": 3816} {"train_loss": -6.865680694580078, "global_step": 160281, "epoch": 3816} {"train_loss": -6.963418006896973, "global_step": 160282, "epoch": 3816} {"train_loss": -6.897296905517578, "global_step": 160283, "epoch": 3816} {"train_loss": -6.963430404663086, "global_step": 160284, "epoch": 3816} {"train_loss": -7.032819747924805, "global_step": 160285, "epoch": 3816} {"train_loss": -6.871339321136475, "global_step": 160286, "epoch": 3816} {"train_loss": -6.911865234375, "global_step": 160287, "epoch": 3816} {"train_loss": -6.909455299377441, "global_step": 160288, "epoch": 3816} {"train_loss": -6.8757123947143555, "global_step": 160289, "epoch": 3816} {"train_loss": -6.97972297668457, "global_step": 160290, "epoch": 3816} {"train_loss": -6.965857028961182, "global_step": 160291, "epoch": 3816} {"train_loss": -6.927667140960693, "global_step": 160292, "epoch": 3816} {"train_loss": -7.0028395652771, "global_step": 160293, "epoch": 3816} {"train_loss": -6.901832580566406, "global_step": 160294, "epoch": 3816} {"train_loss": -6.917029857635498, "global_step": 160295, "epoch": 3816} {"train_loss": -6.930797576904297, "global_step": 160296, "epoch": 3816} {"train_loss": -6.955376148223877, "global_step": 160297, "epoch": 3816} {"train_loss": -6.880073070526123, "global_step": 160298, "epoch": 3816} {"train_loss": -6.934759140014648, "global_step": 160299, "epoch": 3816} {"train_loss": -6.903254508972168, "global_step": 160300, "epoch": 3816} {"train_loss": -6.968597888946533, "global_step": 160301, "epoch": 3816} {"train_loss": -6.951563358306885, "global_step": 160302, "epoch": 3816} {"train_loss": -7.030591011047363, "global_step": 160303, "epoch": 3816} {"train_loss": -6.966498374938965, "global_step": 160304, "epoch": 3816} {"train_loss": -6.922767639160156, "global_step": 160305, "epoch": 3816} {"train_loss": -6.848642826080322, "global_step": 160306, "epoch": 3816} {"train_loss": -6.88284158706665, "global_step": 160307, "epoch": 3816} {"train_loss": -6.989582538604736, "global_step": 160308, "epoch": 3816} {"train_loss": -6.955452919006348, "global_step": 160309, "epoch": 3816} {"train_loss": -7.050834655761719, "global_step": 160310, "epoch": 3816} {"train_loss": -7.057623386383057, "global_step": 160311, "epoch": 3816} {"train_loss": -7.0720744132995605, "global_step": 160312, "epoch": 3816} {"train_loss": -6.936436743963332, "global_step": 160313, "epoch": 3816, "val_loss": 68649.984375} {"train_loss": -6.893767356872559, "global_step": 160314, "epoch": 3817} {"train_loss": -6.968259811401367, "global_step": 160315, "epoch": 3817} {"train_loss": -6.946889400482178, "global_step": 160316, "epoch": 3817} {"train_loss": -6.938565254211426, "global_step": 160317, "epoch": 3817} {"train_loss": -7.0521063804626465, "global_step": 160318, "epoch": 3817} {"train_loss": -6.921497821807861, "global_step": 160319, "epoch": 3817} {"train_loss": -7.049618721008301, "global_step": 160320, "epoch": 3817} {"train_loss": -6.952543258666992, "global_step": 160321, "epoch": 3817} {"train_loss": -7.014782428741455, "global_step": 160322, "epoch": 3817} {"train_loss": -7.00133752822876, "global_step": 160323, "epoch": 3817} {"train_loss": -7.087358474731445, "global_step": 160324, "epoch": 3817} {"train_loss": -6.935997486114502, "global_step": 160325, "epoch": 3817} {"train_loss": -6.868717670440674, "global_step": 160326, "epoch": 3817} {"train_loss": -6.893206596374512, "global_step": 160327, "epoch": 3817} {"train_loss": -7.035906791687012, "global_step": 160328, "epoch": 3817} {"train_loss": -7.0283379554748535, "global_step": 160329, "epoch": 3817} {"train_loss": -7.071588516235352, "global_step": 160330, "epoch": 3817} {"train_loss": -7.0114946365356445, "global_step": 160331, "epoch": 3817} {"train_loss": -7.04063606262207, "global_step": 160332, "epoch": 3817} {"train_loss": -6.961517333984375, "global_step": 160333, "epoch": 3817} {"train_loss": -6.906302452087402, "global_step": 160334, "epoch": 3817} {"train_loss": -6.985080718994141, "global_step": 160335, "epoch": 3817} {"train_loss": -7.060524940490723, "global_step": 160336, "epoch": 3817} {"train_loss": -7.102578163146973, "global_step": 160337, "epoch": 3817} {"train_loss": -7.10496711730957, "global_step": 160338, "epoch": 3817} {"train_loss": -7.070416450500488, "global_step": 160339, "epoch": 3817} {"train_loss": -7.039888381958008, "global_step": 160340, "epoch": 3817} {"train_loss": -7.05339241027832, "global_step": 160341, "epoch": 3817} {"train_loss": -7.052101135253906, "global_step": 160342, "epoch": 3817} {"train_loss": -6.928342819213867, "global_step": 160343, "epoch": 3817} {"train_loss": -6.8714494705200195, "global_step": 160344, "epoch": 3817} {"train_loss": -7.011587142944336, "global_step": 160345, "epoch": 3817} {"train_loss": -6.969422817230225, "global_step": 160346, "epoch": 3817} {"train_loss": -6.911479473114014, "global_step": 160347, "epoch": 3817} {"train_loss": -7.0189738273620605, "global_step": 160348, "epoch": 3817} {"train_loss": -6.83167028427124, "global_step": 160349, "epoch": 3817} {"train_loss": -6.873256683349609, "global_step": 160350, "epoch": 3817} {"train_loss": -6.952092170715332, "global_step": 160351, "epoch": 3817} {"train_loss": -7.026812553405762, "global_step": 160352, "epoch": 3817} {"train_loss": -6.833847522735596, "global_step": 160353, "epoch": 3817} {"train_loss": -6.8614606857299805, "global_step": 160354, "epoch": 3817} {"train_loss": -6.977289642606463, "global_step": 160355, "epoch": 3817, "val_loss": 68823.859375} {"train_loss": -6.9736328125, "global_step": 160356, "epoch": 3818} {"train_loss": -6.820110321044922, "global_step": 160357, "epoch": 3818} {"train_loss": -6.789262771606445, "global_step": 160358, "epoch": 3818} {"train_loss": -6.909646034240723, "global_step": 160359, "epoch": 3818} {"train_loss": -6.891679763793945, "global_step": 160360, "epoch": 3818} {"train_loss": -6.916383266448975, "global_step": 160361, "epoch": 3818} {"train_loss": -6.912796974182129, "global_step": 160362, "epoch": 3818} {"train_loss": -6.905130863189697, "global_step": 160363, "epoch": 3818} {"train_loss": -6.893512725830078, "global_step": 160364, "epoch": 3818} {"train_loss": -6.881594657897949, "global_step": 160365, "epoch": 3818} {"train_loss": -6.890868186950684, "global_step": 160366, "epoch": 3818} {"train_loss": -6.9160685539245605, "global_step": 160367, "epoch": 3818} {"train_loss": -6.920175075531006, "global_step": 160368, "epoch": 3818} {"train_loss": -6.840664386749268, "global_step": 160369, "epoch": 3818} {"train_loss": -6.7952561378479, "global_step": 160370, "epoch": 3818} {"train_loss": -6.898800849914551, "global_step": 160371, "epoch": 3818} {"train_loss": -6.876093864440918, "global_step": 160372, "epoch": 3818} {"train_loss": -6.9671950340271, "global_step": 160373, "epoch": 3818} {"train_loss": -6.989412307739258, "global_step": 160374, "epoch": 3818} {"train_loss": -6.962554454803467, "global_step": 160375, "epoch": 3818} {"train_loss": -6.971067428588867, "global_step": 160376, "epoch": 3818} {"train_loss": -6.989497184753418, "global_step": 160377, "epoch": 3818} {"train_loss": -6.98757266998291, "global_step": 160378, "epoch": 3818} {"train_loss": -7.058383941650391, "global_step": 160379, "epoch": 3818} {"train_loss": -6.952897071838379, "global_step": 160380, "epoch": 3818} {"train_loss": -7.053740501403809, "global_step": 160381, "epoch": 3818} {"train_loss": -6.988475799560547, "global_step": 160382, "epoch": 3818} {"train_loss": -6.9885406494140625, "global_step": 160383, "epoch": 3818} {"train_loss": -7.081560134887695, "global_step": 160384, "epoch": 3818} {"train_loss": -6.916169166564941, "global_step": 160385, "epoch": 3818} {"train_loss": -6.974070072174072, "global_step": 160386, "epoch": 3818} {"train_loss": -7.123133659362793, "global_step": 160387, "epoch": 3818} {"train_loss": -6.9387712478637695, "global_step": 160388, "epoch": 3818} {"train_loss": -6.927264213562012, "global_step": 160389, "epoch": 3818} {"train_loss": -6.964136123657227, "global_step": 160390, "epoch": 3818} {"train_loss": -6.855200290679932, "global_step": 160391, "epoch": 3818} {"train_loss": -6.908517837524414, "global_step": 160392, "epoch": 3818} {"train_loss": -7.0632429122924805, "global_step": 160393, "epoch": 3818} {"train_loss": -6.936132431030273, "global_step": 160394, "epoch": 3818} {"train_loss": -6.926624298095703, "global_step": 160395, "epoch": 3818} {"train_loss": -6.957586288452148, "global_step": 160396, "epoch": 3818} {"train_loss": -6.93829878171285, "global_step": 160397, "epoch": 3818, "val_loss": 68618.421875} {"train_loss": -6.9222259521484375, "global_step": 160398, "epoch": 3819} {"train_loss": -6.922035217285156, "global_step": 160399, "epoch": 3819} {"train_loss": -6.928886413574219, "global_step": 160400, "epoch": 3819} {"train_loss": -6.876229286193848, "global_step": 160401, "epoch": 3819} {"train_loss": -6.782221794128418, "global_step": 160402, "epoch": 3819} {"train_loss": -6.769015312194824, "global_step": 160403, "epoch": 3819} {"train_loss": -6.782172679901123, "global_step": 160404, "epoch": 3819} {"train_loss": -6.80583381652832, "global_step": 160405, "epoch": 3819} {"train_loss": -6.679933071136475, "global_step": 160406, "epoch": 3819} {"train_loss": -6.84880256652832, "global_step": 160407, "epoch": 3819} {"train_loss": -6.680828094482422, "global_step": 160408, "epoch": 3819} {"train_loss": -6.847127914428711, "global_step": 160409, "epoch": 3819} {"train_loss": -6.857911109924316, "global_step": 160410, "epoch": 3819} {"train_loss": -6.745443344116211, "global_step": 160411, "epoch": 3819} {"train_loss": -6.8628740310668945, "global_step": 160412, "epoch": 3819} {"train_loss": -6.739545822143555, "global_step": 160413, "epoch": 3819} {"train_loss": -6.740665912628174, "global_step": 160414, "epoch": 3819} {"train_loss": -6.85687255859375, "global_step": 160415, "epoch": 3819} {"train_loss": -6.736656188964844, "global_step": 160416, "epoch": 3819} {"train_loss": -6.7242631912231445, "global_step": 160417, "epoch": 3819} {"train_loss": -6.93289852142334, "global_step": 160418, "epoch": 3819} {"train_loss": -6.759800910949707, "global_step": 160419, "epoch": 3819} {"train_loss": -6.94354248046875, "global_step": 160420, "epoch": 3819} {"train_loss": -6.909492015838623, "global_step": 160421, "epoch": 3819} {"train_loss": -6.935388088226318, "global_step": 160422, "epoch": 3819} {"train_loss": -6.872922897338867, "global_step": 160423, "epoch": 3819} {"train_loss": -6.911567687988281, "global_step": 160424, "epoch": 3819} {"train_loss": -6.937372207641602, "global_step": 160425, "epoch": 3819} {"train_loss": -6.843472480773926, "global_step": 160426, "epoch": 3819} {"train_loss": -6.906198501586914, "global_step": 160427, "epoch": 3819} {"train_loss": -6.810226917266846, "global_step": 160428, "epoch": 3819} {"train_loss": -7.0062150955200195, "global_step": 160429, "epoch": 3819} {"train_loss": -7.031159400939941, "global_step": 160430, "epoch": 3819} {"train_loss": -6.921525001525879, "global_step": 160431, "epoch": 3819} {"train_loss": -6.844387054443359, "global_step": 160432, "epoch": 3819} {"train_loss": -6.927262783050537, "global_step": 160433, "epoch": 3819} {"train_loss": -6.976624011993408, "global_step": 160434, "epoch": 3819} {"train_loss": -6.857234477996826, "global_step": 160435, "epoch": 3819} {"train_loss": -6.880030155181885, "global_step": 160436, "epoch": 3819} {"train_loss": -6.888008117675781, "global_step": 160437, "epoch": 3819} {"train_loss": -6.952998161315918, "global_step": 160438, "epoch": 3819} {"train_loss": -6.8588184515635175, "global_step": 160439, "epoch": 3819, "val_loss": 68543.109375} {"train_loss": -7.029065132141113, "global_step": 160440, "epoch": 3820} {"train_loss": -6.992628574371338, "global_step": 160441, "epoch": 3820} {"train_loss": -6.909129619598389, "global_step": 160442, "epoch": 3820} {"train_loss": -6.966904640197754, "global_step": 160443, "epoch": 3820} {"train_loss": -6.872164726257324, "global_step": 160444, "epoch": 3820} {"train_loss": -6.945892333984375, "global_step": 160445, "epoch": 3820} {"train_loss": -7.07761812210083, "global_step": 160446, "epoch": 3820} {"train_loss": -6.878073692321777, "global_step": 160447, "epoch": 3820} {"train_loss": -6.905820846557617, "global_step": 160448, "epoch": 3820} {"train_loss": -6.884042739868164, "global_step": 160449, "epoch": 3820} {"train_loss": -6.850764274597168, "global_step": 160450, "epoch": 3820} {"train_loss": -6.866397857666016, "global_step": 160451, "epoch": 3820} {"train_loss": -7.053170204162598, "global_step": 160452, "epoch": 3820} {"train_loss": -6.911696434020996, "global_step": 160453, "epoch": 3820} {"train_loss": -7.058259010314941, "global_step": 160454, "epoch": 3820} {"train_loss": -6.914885520935059, "global_step": 160455, "epoch": 3820} {"train_loss": -6.883312225341797, "global_step": 160456, "epoch": 3820} {"train_loss": -6.998569488525391, "global_step": 160457, "epoch": 3820} {"train_loss": -6.929250717163086, "global_step": 160458, "epoch": 3820} {"train_loss": -6.961773872375488, "global_step": 160459, "epoch": 3820} {"train_loss": -7.0531768798828125, "global_step": 160460, "epoch": 3820} {"train_loss": -7.047550201416016, "global_step": 160461, "epoch": 3820} {"train_loss": -6.988379955291748, "global_step": 160462, "epoch": 3820} {"train_loss": -7.057543754577637, "global_step": 160463, "epoch": 3820} {"train_loss": -6.872479438781738, "global_step": 160464, "epoch": 3820} {"train_loss": -7.000297546386719, "global_step": 160465, "epoch": 3820} {"train_loss": -6.998414516448975, "global_step": 160466, "epoch": 3820} {"train_loss": -6.832659721374512, "global_step": 160467, "epoch": 3820} {"train_loss": -7.06618595123291, "global_step": 160468, "epoch": 3820} {"train_loss": -6.84137487411499, "global_step": 160469, "epoch": 3820} {"train_loss": -6.932445049285889, "global_step": 160470, "epoch": 3820} {"train_loss": -6.9936370849609375, "global_step": 160471, "epoch": 3820} {"train_loss": -6.8730621337890625, "global_step": 160472, "epoch": 3820} {"train_loss": -6.941471099853516, "global_step": 160473, "epoch": 3820} {"train_loss": -7.023557662963867, "global_step": 160474, "epoch": 3820} {"train_loss": -6.7838850021362305, "global_step": 160475, "epoch": 3820} {"train_loss": -6.9770989418029785, "global_step": 160476, "epoch": 3820} {"train_loss": -6.978287696838379, "global_step": 160477, "epoch": 3820} {"train_loss": -6.896003723144531, "global_step": 160478, "epoch": 3820} {"train_loss": -6.982047080993652, "global_step": 160479, "epoch": 3820} {"train_loss": -6.901214599609375, "global_step": 160480, "epoch": 3820} {"train_loss": -6.948352200644357, "global_step": 160481, "epoch": 3820, "val_loss": 68538.2734375} {"train_loss": -7.058320045471191, "global_step": 160482, "epoch": 3821} {"train_loss": -6.946150779724121, "global_step": 160483, "epoch": 3821} {"train_loss": -6.864482879638672, "global_step": 160484, "epoch": 3821} {"train_loss": -6.933773040771484, "global_step": 160485, "epoch": 3821} {"train_loss": -7.010680198669434, "global_step": 160486, "epoch": 3821} {"train_loss": -6.992391586303711, "global_step": 160487, "epoch": 3821} {"train_loss": -7.003696918487549, "global_step": 160488, "epoch": 3821} {"train_loss": -6.975433349609375, "global_step": 160489, "epoch": 3821} {"train_loss": -6.953551292419434, "global_step": 160490, "epoch": 3821} {"train_loss": -7.011000633239746, "global_step": 160491, "epoch": 3821} {"train_loss": -6.971566200256348, "global_step": 160492, "epoch": 3821} {"train_loss": -7.138429164886475, "global_step": 160493, "epoch": 3821} {"train_loss": -7.056035995483398, "global_step": 160494, "epoch": 3821} {"train_loss": -7.0640411376953125, "global_step": 160495, "epoch": 3821} {"train_loss": -7.112907886505127, "global_step": 160496, "epoch": 3821} {"train_loss": -7.010631561279297, "global_step": 160497, "epoch": 3821} {"train_loss": -7.060986518859863, "global_step": 160498, "epoch": 3821} {"train_loss": -7.031181335449219, "global_step": 160499, "epoch": 3821} {"train_loss": -6.941473007202148, "global_step": 160500, "epoch": 3821} {"train_loss": -6.982973575592041, "global_step": 160501, "epoch": 3821} {"train_loss": -7.077569484710693, "global_step": 160502, "epoch": 3821} {"train_loss": -7.027163028717041, "global_step": 160503, "epoch": 3821} {"train_loss": -6.984984874725342, "global_step": 160504, "epoch": 3821} {"train_loss": -6.9616546630859375, "global_step": 160505, "epoch": 3821} {"train_loss": -6.930336952209473, "global_step": 160506, "epoch": 3821} {"train_loss": -6.857450008392334, "global_step": 160507, "epoch": 3821} {"train_loss": -6.993800163269043, "global_step": 160508, "epoch": 3821} {"train_loss": -6.821906566619873, "global_step": 160509, "epoch": 3821} {"train_loss": -6.884251594543457, "global_step": 160510, "epoch": 3821} {"train_loss": -7.009984016418457, "global_step": 160511, "epoch": 3821} {"train_loss": -6.8743157386779785, "global_step": 160512, "epoch": 3821} {"train_loss": -7.073265075683594, "global_step": 160513, "epoch": 3821} {"train_loss": -7.021750450134277, "global_step": 160514, "epoch": 3821} {"train_loss": -6.905342102050781, "global_step": 160515, "epoch": 3821} {"train_loss": -6.9088897705078125, "global_step": 160516, "epoch": 3821} {"train_loss": -6.959480285644531, "global_step": 160517, "epoch": 3821} {"train_loss": -6.867814540863037, "global_step": 160518, "epoch": 3821} {"train_loss": -6.867510795593262, "global_step": 160519, "epoch": 3821} {"train_loss": -6.8926849365234375, "global_step": 160520, "epoch": 3821} {"train_loss": -6.905340194702148, "global_step": 160521, "epoch": 3821} {"train_loss": -7.005946636199951, "global_step": 160522, "epoch": 3821} {"train_loss": -6.973893540246146, "global_step": 160523, "epoch": 3821, "val_loss": 68610.5390625} {"train_loss": -6.825084686279297, "global_step": 160524, "epoch": 3822} {"train_loss": -6.9920244216918945, "global_step": 160525, "epoch": 3822} {"train_loss": -6.948394775390625, "global_step": 160526, "epoch": 3822} {"train_loss": -6.845069885253906, "global_step": 160527, "epoch": 3822} {"train_loss": -6.944222450256348, "global_step": 160528, "epoch": 3822} {"train_loss": -6.9737372398376465, "global_step": 160529, "epoch": 3822} {"train_loss": -6.902728080749512, "global_step": 160530, "epoch": 3822} {"train_loss": -7.051083087921143, "global_step": 160531, "epoch": 3822} {"train_loss": -6.84913444519043, "global_step": 160532, "epoch": 3822} {"train_loss": -6.812211513519287, "global_step": 160533, "epoch": 3822} {"train_loss": -7.062041282653809, "global_step": 160534, "epoch": 3822} {"train_loss": -6.966169357299805, "global_step": 160535, "epoch": 3822} {"train_loss": -6.918769359588623, "global_step": 160536, "epoch": 3822} {"train_loss": -6.979851722717285, "global_step": 160537, "epoch": 3822} {"train_loss": -6.876702785491943, "global_step": 160538, "epoch": 3822} {"train_loss": -6.93347692489624, "global_step": 160539, "epoch": 3822} {"train_loss": -7.081764221191406, "global_step": 160540, "epoch": 3822} {"train_loss": -6.923093795776367, "global_step": 160541, "epoch": 3822} {"train_loss": -7.054297924041748, "global_step": 160542, "epoch": 3822} {"train_loss": -6.849804878234863, "global_step": 160543, "epoch": 3822} {"train_loss": -6.969038009643555, "global_step": 160544, "epoch": 3822} {"train_loss": -6.987274646759033, "global_step": 160545, "epoch": 3822} {"train_loss": -6.87876033782959, "global_step": 160546, "epoch": 3822} {"train_loss": -6.812537670135498, "global_step": 160547, "epoch": 3822} {"train_loss": -6.888420104980469, "global_step": 160548, "epoch": 3822} {"train_loss": -6.851966381072998, "global_step": 160549, "epoch": 3822} {"train_loss": -6.890568733215332, "global_step": 160550, "epoch": 3822} {"train_loss": -6.926308631896973, "global_step": 160551, "epoch": 3822} {"train_loss": -6.884969234466553, "global_step": 160552, "epoch": 3822} {"train_loss": -6.972568511962891, "global_step": 160553, "epoch": 3822} {"train_loss": -6.884798049926758, "global_step": 160554, "epoch": 3822} {"train_loss": -7.012488842010498, "global_step": 160555, "epoch": 3822} {"train_loss": -7.037959098815918, "global_step": 160556, "epoch": 3822} {"train_loss": -6.822852611541748, "global_step": 160557, "epoch": 3822} {"train_loss": -6.972105979919434, "global_step": 160558, "epoch": 3822} {"train_loss": -7.034250736236572, "global_step": 160559, "epoch": 3822} {"train_loss": -6.8347296714782715, "global_step": 160560, "epoch": 3822} {"train_loss": -6.949277877807617, "global_step": 160561, "epoch": 3822} {"train_loss": -7.056507110595703, "global_step": 160562, "epoch": 3822} {"train_loss": -6.99675178527832, "global_step": 160563, "epoch": 3822} {"train_loss": -6.950318813323975, "global_step": 160564, "epoch": 3822} {"train_loss": -6.9386970315660745, "global_step": 160565, "epoch": 3822, "val_loss": 68569.1796875} {"train_loss": -7.094761848449707, "global_step": 160566, "epoch": 3823} {"train_loss": -6.963641166687012, "global_step": 160567, "epoch": 3823} {"train_loss": -7.105982780456543, "global_step": 160568, "epoch": 3823} {"train_loss": -7.052998065948486, "global_step": 160569, "epoch": 3823} {"train_loss": -7.102082252502441, "global_step": 160570, "epoch": 3823} {"train_loss": -7.008199214935303, "global_step": 160571, "epoch": 3823} {"train_loss": -7.025150299072266, "global_step": 160572, "epoch": 3823} {"train_loss": -6.9901227951049805, "global_step": 160573, "epoch": 3823} {"train_loss": -6.893614768981934, "global_step": 160574, "epoch": 3823} {"train_loss": -6.85634708404541, "global_step": 160575, "epoch": 3823} {"train_loss": -7.0058488845825195, "global_step": 160576, "epoch": 3823} {"train_loss": -7.0029706954956055, "global_step": 160577, "epoch": 3823} {"train_loss": -7.079922676086426, "global_step": 160578, "epoch": 3823} {"train_loss": -6.971612930297852, "global_step": 160579, "epoch": 3823} {"train_loss": -7.009809494018555, "global_step": 160580, "epoch": 3823} {"train_loss": -7.064986228942871, "global_step": 160581, "epoch": 3823} {"train_loss": -7.0639448165893555, "global_step": 160582, "epoch": 3823} {"train_loss": -6.975654602050781, "global_step": 160583, "epoch": 3823} {"train_loss": -6.953512668609619, "global_step": 160584, "epoch": 3823} {"train_loss": -6.9649128913879395, "global_step": 160585, "epoch": 3823} {"train_loss": -6.996299743652344, "global_step": 160586, "epoch": 3823} {"train_loss": -6.986169815063477, "global_step": 160587, "epoch": 3823} {"train_loss": -6.985566139221191, "global_step": 160588, "epoch": 3823} {"train_loss": -7.007271766662598, "global_step": 160589, "epoch": 3823} {"train_loss": -7.019575119018555, "global_step": 160590, "epoch": 3823} {"train_loss": -7.007372856140137, "global_step": 160591, "epoch": 3823} {"train_loss": -6.974993705749512, "global_step": 160592, "epoch": 3823} {"train_loss": -7.04905891418457, "global_step": 160593, "epoch": 3823} {"train_loss": -6.955929756164551, "global_step": 160594, "epoch": 3823} {"train_loss": -7.152716636657715, "global_step": 160595, "epoch": 3823} {"train_loss": -6.988933563232422, "global_step": 160596, "epoch": 3823} {"train_loss": -6.880973815917969, "global_step": 160597, "epoch": 3823} {"train_loss": -7.093832492828369, "global_step": 160598, "epoch": 3823} {"train_loss": -7.0123982429504395, "global_step": 160599, "epoch": 3823} {"train_loss": -7.028693675994873, "global_step": 160600, "epoch": 3823} {"train_loss": -7.031693935394287, "global_step": 160601, "epoch": 3823} {"train_loss": -6.971603870391846, "global_step": 160602, "epoch": 3823} {"train_loss": -6.915112495422363, "global_step": 160603, "epoch": 3823} {"train_loss": -6.841984748840332, "global_step": 160604, "epoch": 3823} {"train_loss": -7.037717819213867, "global_step": 160605, "epoch": 3823} {"train_loss": -6.854854583740234, "global_step": 160606, "epoch": 3823} {"train_loss": -6.9943225383758545, "global_step": 160607, "epoch": 3823, "val_loss": 68517.65625} {"train_loss": -6.978841304779053, "global_step": 160608, "epoch": 3824} {"train_loss": -6.947907447814941, "global_step": 160609, "epoch": 3824} {"train_loss": -6.969597816467285, "global_step": 160610, "epoch": 3824} {"train_loss": -6.814047813415527, "global_step": 160611, "epoch": 3824} {"train_loss": -6.911093711853027, "global_step": 160612, "epoch": 3824} {"train_loss": -6.838367462158203, "global_step": 160613, "epoch": 3824} {"train_loss": -6.900627613067627, "global_step": 160614, "epoch": 3824} {"train_loss": -6.779841423034668, "global_step": 160615, "epoch": 3824} {"train_loss": -6.8741865158081055, "global_step": 160616, "epoch": 3824} {"train_loss": -6.984027862548828, "global_step": 160617, "epoch": 3824} {"train_loss": -6.922370433807373, "global_step": 160618, "epoch": 3824} {"train_loss": -6.812079429626465, "global_step": 160619, "epoch": 3824} {"train_loss": -6.908262729644775, "global_step": 160620, "epoch": 3824} {"train_loss": -7.014339923858643, "global_step": 160621, "epoch": 3824} {"train_loss": -6.957477569580078, "global_step": 160622, "epoch": 3824} {"train_loss": -6.970080375671387, "global_step": 160623, "epoch": 3824} {"train_loss": -6.948846340179443, "global_step": 160624, "epoch": 3824} {"train_loss": -6.884984016418457, "global_step": 160625, "epoch": 3824} {"train_loss": -6.942652225494385, "global_step": 160626, "epoch": 3824} {"train_loss": -6.846113204956055, "global_step": 160627, "epoch": 3824} {"train_loss": -6.872429847717285, "global_step": 160628, "epoch": 3824} {"train_loss": -6.979731559753418, "global_step": 160629, "epoch": 3824} {"train_loss": -6.895062446594238, "global_step": 160630, "epoch": 3824} {"train_loss": -6.879081726074219, "global_step": 160631, "epoch": 3824} {"train_loss": -6.936327934265137, "global_step": 160632, "epoch": 3824} {"train_loss": -6.858475685119629, "global_step": 160633, "epoch": 3824} {"train_loss": -6.898029327392578, "global_step": 160634, "epoch": 3824} {"train_loss": -6.919870376586914, "global_step": 160635, "epoch": 3824} {"train_loss": -6.787722587585449, "global_step": 160636, "epoch": 3824} {"train_loss": -6.919419765472412, "global_step": 160637, "epoch": 3824} {"train_loss": -7.013230323791504, "global_step": 160638, "epoch": 3824} {"train_loss": -6.877326965332031, "global_step": 160639, "epoch": 3824} {"train_loss": -6.9684624671936035, "global_step": 160640, "epoch": 3824} {"train_loss": -7.000734806060791, "global_step": 160641, "epoch": 3824} {"train_loss": -6.937918186187744, "global_step": 160642, "epoch": 3824} {"train_loss": -6.897141456604004, "global_step": 160643, "epoch": 3824} {"train_loss": -6.9562482833862305, "global_step": 160644, "epoch": 3824} {"train_loss": -6.932435989379883, "global_step": 160645, "epoch": 3824} {"train_loss": -7.051486968994141, "global_step": 160646, "epoch": 3824} {"train_loss": -7.039229393005371, "global_step": 160647, "epoch": 3824} {"train_loss": -6.9765520095825195, "global_step": 160648, "epoch": 3824} {"train_loss": -6.922520081202189, "global_step": 160649, "epoch": 3824, "val_loss": 68461.1796875} {"train_loss": -7.00880765914917, "global_step": 160650, "epoch": 3825} {"train_loss": -6.837215423583984, "global_step": 160651, "epoch": 3825} {"train_loss": -6.884316444396973, "global_step": 160652, "epoch": 3825} {"train_loss": -7.018752574920654, "global_step": 160653, "epoch": 3825} {"train_loss": -6.851992607116699, "global_step": 160654, "epoch": 3825} {"train_loss": -6.966936111450195, "global_step": 160655, "epoch": 3825} {"train_loss": -6.93458890914917, "global_step": 160656, "epoch": 3825} {"train_loss": -6.900618553161621, "global_step": 160657, "epoch": 3825} {"train_loss": -6.93671178817749, "global_step": 160658, "epoch": 3825} {"train_loss": -6.997025966644287, "global_step": 160659, "epoch": 3825} {"train_loss": -6.895478248596191, "global_step": 160660, "epoch": 3825} {"train_loss": -6.7731781005859375, "global_step": 160661, "epoch": 3825} {"train_loss": -6.921618461608887, "global_step": 160662, "epoch": 3825} {"train_loss": -6.830663204193115, "global_step": 160663, "epoch": 3825} {"train_loss": -6.834217548370361, "global_step": 160664, "epoch": 3825} {"train_loss": -6.934693336486816, "global_step": 160665, "epoch": 3825} {"train_loss": -6.9748148918151855, "global_step": 160666, "epoch": 3825} {"train_loss": -6.916093826293945, "global_step": 160667, "epoch": 3825} {"train_loss": -6.977591037750244, "global_step": 160668, "epoch": 3825} {"train_loss": -6.906733989715576, "global_step": 160669, "epoch": 3825} {"train_loss": -6.934423923492432, "global_step": 160670, "epoch": 3825} {"train_loss": -6.892457962036133, "global_step": 160671, "epoch": 3825} {"train_loss": -6.92579984664917, "global_step": 160672, "epoch": 3825} {"train_loss": -6.8980607986450195, "global_step": 160673, "epoch": 3825} {"train_loss": -6.815031051635742, "global_step": 160674, "epoch": 3825} {"train_loss": -6.851009368896484, "global_step": 160675, "epoch": 3825} {"train_loss": -6.8897013664245605, "global_step": 160676, "epoch": 3825} {"train_loss": -6.812074184417725, "global_step": 160677, "epoch": 3825} {"train_loss": -7.043642044067383, "global_step": 160678, "epoch": 3825} {"train_loss": -6.7130842208862305, "global_step": 160679, "epoch": 3825} {"train_loss": -6.851751804351807, "global_step": 160680, "epoch": 3825} {"train_loss": -6.828249931335449, "global_step": 160681, "epoch": 3825} {"train_loss": -6.800240993499756, "global_step": 160682, "epoch": 3825} {"train_loss": -6.931754112243652, "global_step": 160683, "epoch": 3825} {"train_loss": -6.864326000213623, "global_step": 160684, "epoch": 3825} {"train_loss": -6.916158676147461, "global_step": 160685, "epoch": 3825} {"train_loss": -6.813024520874023, "global_step": 160686, "epoch": 3825} {"train_loss": -6.913680076599121, "global_step": 160687, "epoch": 3825} {"train_loss": -6.8572211265563965, "global_step": 160688, "epoch": 3825} {"train_loss": -6.972675323486328, "global_step": 160689, "epoch": 3825} {"train_loss": -6.907112121582031, "global_step": 160690, "epoch": 3825} {"train_loss": -6.899753036953154, "global_step": 160691, "epoch": 3825, "val_loss": 68621.3125} {"train_loss": -6.938993453979492, "global_step": 160692, "epoch": 3826} {"train_loss": -7.044543743133545, "global_step": 160693, "epoch": 3826} {"train_loss": -7.0699591636657715, "global_step": 160694, "epoch": 3826} {"train_loss": -6.9407854080200195, "global_step": 160695, "epoch": 3826} {"train_loss": -7.0559186935424805, "global_step": 160696, "epoch": 3826} {"train_loss": -6.910667419433594, "global_step": 160697, "epoch": 3826} {"train_loss": -7.023458480834961, "global_step": 160698, "epoch": 3826} {"train_loss": -7.031485557556152, "global_step": 160699, "epoch": 3826} {"train_loss": -7.0255327224731445, "global_step": 160700, "epoch": 3826} {"train_loss": -7.025516033172607, "global_step": 160701, "epoch": 3826} {"train_loss": -7.019064426422119, "global_step": 160702, "epoch": 3826} {"train_loss": -6.943432807922363, "global_step": 160703, "epoch": 3826} {"train_loss": -7.041799545288086, "global_step": 160704, "epoch": 3826} {"train_loss": -7.067011833190918, "global_step": 160705, "epoch": 3826} {"train_loss": -7.030909061431885, "global_step": 160706, "epoch": 3826} {"train_loss": -6.837201118469238, "global_step": 160707, "epoch": 3826} {"train_loss": -6.932676792144775, "global_step": 160708, "epoch": 3826} {"train_loss": -6.913158416748047, "global_step": 160709, "epoch": 3826} {"train_loss": -6.986225128173828, "global_step": 160710, "epoch": 3826} {"train_loss": -6.974550724029541, "global_step": 160711, "epoch": 3826} {"train_loss": -6.8590312004089355, "global_step": 160712, "epoch": 3826} {"train_loss": -6.955601692199707, "global_step": 160713, "epoch": 3826} {"train_loss": -6.912192344665527, "global_step": 160714, "epoch": 3826} {"train_loss": -6.841029167175293, "global_step": 160715, "epoch": 3826} {"train_loss": -6.99415397644043, "global_step": 160716, "epoch": 3826} {"train_loss": -6.966595649719238, "global_step": 160717, "epoch": 3826} {"train_loss": -6.742029190063477, "global_step": 160718, "epoch": 3826} {"train_loss": -6.928174018859863, "global_step": 160719, "epoch": 3826} {"train_loss": -6.83567476272583, "global_step": 160720, "epoch": 3826} {"train_loss": -6.829262733459473, "global_step": 160721, "epoch": 3826} {"train_loss": -7.0018086433410645, "global_step": 160722, "epoch": 3826} {"train_loss": -6.873657703399658, "global_step": 160723, "epoch": 3826} {"train_loss": -6.938441753387451, "global_step": 160724, "epoch": 3826} {"train_loss": -6.912811279296875, "global_step": 160725, "epoch": 3826} {"train_loss": -6.824492454528809, "global_step": 160726, "epoch": 3826} {"train_loss": -6.914618492126465, "global_step": 160727, "epoch": 3826} {"train_loss": -6.899708271026611, "global_step": 160728, "epoch": 3826} {"train_loss": -6.95991325378418, "global_step": 160729, "epoch": 3826} {"train_loss": -6.865501403808594, "global_step": 160730, "epoch": 3826} {"train_loss": -7.031490325927734, "global_step": 160731, "epoch": 3826} {"train_loss": -6.984217166900635, "global_step": 160732, "epoch": 3826} {"train_loss": -6.947860195523217, "global_step": 160733, "epoch": 3826, "val_loss": 68643.921875} {"train_loss": -7.080292701721191, "global_step": 160734, "epoch": 3827} {"train_loss": -6.897543907165527, "global_step": 160735, "epoch": 3827} {"train_loss": -6.892889022827148, "global_step": 160736, "epoch": 3827} {"train_loss": -6.93380069732666, "global_step": 160737, "epoch": 3827} {"train_loss": -6.871115684509277, "global_step": 160738, "epoch": 3827} {"train_loss": -7.028452396392822, "global_step": 160739, "epoch": 3827} {"train_loss": -6.887529373168945, "global_step": 160740, "epoch": 3827} {"train_loss": -7.066895484924316, "global_step": 160741, "epoch": 3827} {"train_loss": -6.971052169799805, "global_step": 160742, "epoch": 3827} {"train_loss": -7.003281593322754, "global_step": 160743, "epoch": 3827} {"train_loss": -6.963832378387451, "global_step": 160744, "epoch": 3827} {"train_loss": -6.954355239868164, "global_step": 160745, "epoch": 3827} {"train_loss": -6.959229946136475, "global_step": 160746, "epoch": 3827} {"train_loss": -6.920650005340576, "global_step": 160747, "epoch": 3827} {"train_loss": -6.921657562255859, "global_step": 160748, "epoch": 3827} {"train_loss": -6.96413516998291, "global_step": 160749, "epoch": 3827} {"train_loss": -6.9347734451293945, "global_step": 160750, "epoch": 3827} {"train_loss": -6.9523115158081055, "global_step": 160751, "epoch": 3827} {"train_loss": -6.876023292541504, "global_step": 160752, "epoch": 3827} {"train_loss": -6.948114395141602, "global_step": 160753, "epoch": 3827} {"train_loss": -7.101586818695068, "global_step": 160754, "epoch": 3827} {"train_loss": -6.946099281311035, "global_step": 160755, "epoch": 3827} {"train_loss": -6.959422588348389, "global_step": 160756, "epoch": 3827} {"train_loss": -7.011483192443848, "global_step": 160757, "epoch": 3827} {"train_loss": -6.855862617492676, "global_step": 160758, "epoch": 3827} {"train_loss": -6.972484588623047, "global_step": 160759, "epoch": 3827} {"train_loss": -6.971879482269287, "global_step": 160760, "epoch": 3827} {"train_loss": -6.989727020263672, "global_step": 160761, "epoch": 3827} {"train_loss": -6.988095760345459, "global_step": 160762, "epoch": 3827} {"train_loss": -7.107206344604492, "global_step": 160763, "epoch": 3827} {"train_loss": -7.107159614562988, "global_step": 160764, "epoch": 3827} {"train_loss": -7.057845592498779, "global_step": 160765, "epoch": 3827} {"train_loss": -6.8986968994140625, "global_step": 160766, "epoch": 3827} {"train_loss": -7.069645881652832, "global_step": 160767, "epoch": 3827} {"train_loss": -6.976650238037109, "global_step": 160768, "epoch": 3827} {"train_loss": -7.007907867431641, "global_step": 160769, "epoch": 3827} {"train_loss": -6.930876731872559, "global_step": 160770, "epoch": 3827} {"train_loss": -7.019587993621826, "global_step": 160771, "epoch": 3827} {"train_loss": -6.9144487380981445, "global_step": 160772, "epoch": 3827} {"train_loss": -7.070138454437256, "global_step": 160773, "epoch": 3827} {"train_loss": -7.019735336303711, "global_step": 160774, "epoch": 3827} {"train_loss": -6.973549138932001, "global_step": 160775, "epoch": 3827, "val_loss": 68642.0703125} {"train_loss": -7.046492576599121, "global_step": 160776, "epoch": 3828} {"train_loss": -6.98652982711792, "global_step": 160777, "epoch": 3828} {"train_loss": -6.925647735595703, "global_step": 160778, "epoch": 3828} {"train_loss": -6.943675994873047, "global_step": 160779, "epoch": 3828} {"train_loss": -7.060775279998779, "global_step": 160780, "epoch": 3828} {"train_loss": -6.873472213745117, "global_step": 160781, "epoch": 3828} {"train_loss": -6.961881637573242, "global_step": 160782, "epoch": 3828} {"train_loss": -7.000107765197754, "global_step": 160783, "epoch": 3828} {"train_loss": -6.882793426513672, "global_step": 160784, "epoch": 3828} {"train_loss": -6.962701797485352, "global_step": 160785, "epoch": 3828} {"train_loss": -6.894280910491943, "global_step": 160786, "epoch": 3828} {"train_loss": -6.897684574127197, "global_step": 160787, "epoch": 3828} {"train_loss": -7.023976802825928, "global_step": 160788, "epoch": 3828} {"train_loss": -6.826510906219482, "global_step": 160789, "epoch": 3828} {"train_loss": -6.899203300476074, "global_step": 160790, "epoch": 3828} {"train_loss": -6.96400260925293, "global_step": 160791, "epoch": 3828} {"train_loss": -6.936583042144775, "global_step": 160792, "epoch": 3828} {"train_loss": -6.95765495300293, "global_step": 160793, "epoch": 3828} {"train_loss": -6.842438697814941, "global_step": 160794, "epoch": 3828} {"train_loss": -6.960452079772949, "global_step": 160795, "epoch": 3828} {"train_loss": -7.022465705871582, "global_step": 160796, "epoch": 3828} {"train_loss": -6.859952926635742, "global_step": 160797, "epoch": 3828} {"train_loss": -7.003146171569824, "global_step": 160798, "epoch": 3828} {"train_loss": -7.032184600830078, "global_step": 160799, "epoch": 3828} {"train_loss": -6.888208389282227, "global_step": 160800, "epoch": 3828} {"train_loss": -7.095129013061523, "global_step": 160801, "epoch": 3828} {"train_loss": -6.961258888244629, "global_step": 160802, "epoch": 3828} {"train_loss": -6.948184013366699, "global_step": 160803, "epoch": 3828} {"train_loss": -6.966584205627441, "global_step": 160804, "epoch": 3828} {"train_loss": -7.010831356048584, "global_step": 160805, "epoch": 3828} {"train_loss": -6.952186584472656, "global_step": 160806, "epoch": 3828} {"train_loss": -6.896315574645996, "global_step": 160807, "epoch": 3828} {"train_loss": -7.124701499938965, "global_step": 160808, "epoch": 3828} {"train_loss": -6.985019683837891, "global_step": 160809, "epoch": 3828} {"train_loss": -7.123353958129883, "global_step": 160810, "epoch": 3828} {"train_loss": -7.078952789306641, "global_step": 160811, "epoch": 3828} {"train_loss": -6.949510097503662, "global_step": 160812, "epoch": 3828} {"train_loss": -7.0040082931518555, "global_step": 160813, "epoch": 3828} {"train_loss": -7.010415077209473, "global_step": 160814, "epoch": 3828} {"train_loss": -6.8539719581604, "global_step": 160815, "epoch": 3828} {"train_loss": -6.968921184539795, "global_step": 160816, "epoch": 3828} {"train_loss": -6.968233630770729, "global_step": 160817, "epoch": 3828, "val_loss": 68741.765625} {"train_loss": -6.827273368835449, "global_step": 160818, "epoch": 3829} {"train_loss": -6.95985221862793, "global_step": 160819, "epoch": 3829} {"train_loss": -7.0033278465271, "global_step": 160820, "epoch": 3829} {"train_loss": -6.861276626586914, "global_step": 160821, "epoch": 3829} {"train_loss": -7.007327079772949, "global_step": 160822, "epoch": 3829} {"train_loss": -7.013060569763184, "global_step": 160823, "epoch": 3829} {"train_loss": -6.825862407684326, "global_step": 160824, "epoch": 3829} {"train_loss": -6.900965690612793, "global_step": 160825, "epoch": 3829} {"train_loss": -6.878061294555664, "global_step": 160826, "epoch": 3829} {"train_loss": -7.006948471069336, "global_step": 160827, "epoch": 3829} {"train_loss": -6.879751205444336, "global_step": 160828, "epoch": 3829} {"train_loss": -7.064304828643799, "global_step": 160829, "epoch": 3829} {"train_loss": -6.897185802459717, "global_step": 160830, "epoch": 3829} {"train_loss": -7.000797271728516, "global_step": 160831, "epoch": 3829} {"train_loss": -6.93454647064209, "global_step": 160832, "epoch": 3829} {"train_loss": -7.025213241577148, "global_step": 160833, "epoch": 3829} {"train_loss": -7.080127239227295, "global_step": 160834, "epoch": 3829} {"train_loss": -6.925585746765137, "global_step": 160835, "epoch": 3829} {"train_loss": -6.818538665771484, "global_step": 160836, "epoch": 3829} {"train_loss": -6.959184646606445, "global_step": 160837, "epoch": 3829} {"train_loss": -6.794002532958984, "global_step": 160838, "epoch": 3829} {"train_loss": -6.80164909362793, "global_step": 160839, "epoch": 3829} {"train_loss": -6.96385383605957, "global_step": 160840, "epoch": 3829} {"train_loss": -6.996879577636719, "global_step": 160841, "epoch": 3829} {"train_loss": -7.04162073135376, "global_step": 160842, "epoch": 3829} {"train_loss": -6.940465927124023, "global_step": 160843, "epoch": 3829} {"train_loss": -6.9519171714782715, "global_step": 160844, "epoch": 3829} {"train_loss": -6.966241836547852, "global_step": 160845, "epoch": 3829} {"train_loss": -6.9936370849609375, "global_step": 160846, "epoch": 3829} {"train_loss": -7.029711723327637, "global_step": 160847, "epoch": 3829} {"train_loss": -6.994106769561768, "global_step": 160848, "epoch": 3829} {"train_loss": -6.94359016418457, "global_step": 160849, "epoch": 3829} {"train_loss": -7.058030605316162, "global_step": 160850, "epoch": 3829} {"train_loss": -7.0007781982421875, "global_step": 160851, "epoch": 3829} {"train_loss": -7.048936367034912, "global_step": 160852, "epoch": 3829} {"train_loss": -7.002197265625, "global_step": 160853, "epoch": 3829} {"train_loss": -6.930699348449707, "global_step": 160854, "epoch": 3829} {"train_loss": -6.989199638366699, "global_step": 160855, "epoch": 3829} {"train_loss": -7.074517250061035, "global_step": 160856, "epoch": 3829} {"train_loss": -6.924534797668457, "global_step": 160857, "epoch": 3829} {"train_loss": -6.957293510437012, "global_step": 160858, "epoch": 3829} {"train_loss": -6.958438362394061, "global_step": 160859, "epoch": 3829, "val_loss": 68546.53125} {"train_loss": -7.018291473388672, "global_step": 160860, "epoch": 3830} {"train_loss": -7.062465190887451, "global_step": 160861, "epoch": 3830} {"train_loss": -6.946176052093506, "global_step": 160862, "epoch": 3830} {"train_loss": -6.9884796142578125, "global_step": 160863, "epoch": 3830} {"train_loss": -6.939209938049316, "global_step": 160864, "epoch": 3830} {"train_loss": -7.004137992858887, "global_step": 160865, "epoch": 3830} {"train_loss": -6.94621467590332, "global_step": 160866, "epoch": 3830} {"train_loss": -7.02855110168457, "global_step": 160867, "epoch": 3830} {"train_loss": -7.039267539978027, "global_step": 160868, "epoch": 3830} {"train_loss": -6.949223518371582, "global_step": 160869, "epoch": 3830} {"train_loss": -6.996331214904785, "global_step": 160870, "epoch": 3830} {"train_loss": -6.897278785705566, "global_step": 160871, "epoch": 3830} {"train_loss": -7.149710178375244, "global_step": 160872, "epoch": 3830} {"train_loss": -7.0385823249816895, "global_step": 160873, "epoch": 3830} {"train_loss": -7.043466567993164, "global_step": 160874, "epoch": 3830} {"train_loss": -6.956533908843994, "global_step": 160875, "epoch": 3830} {"train_loss": -6.915924072265625, "global_step": 160876, "epoch": 3830} {"train_loss": -6.929895401000977, "global_step": 160877, "epoch": 3830} {"train_loss": -7.026350975036621, "global_step": 160878, "epoch": 3830} {"train_loss": -6.99314022064209, "global_step": 160879, "epoch": 3830} {"train_loss": -6.849921226501465, "global_step": 160880, "epoch": 3830} {"train_loss": -6.8992767333984375, "global_step": 160881, "epoch": 3830} {"train_loss": -6.953263282775879, "global_step": 160882, "epoch": 3830} {"train_loss": -6.842662811279297, "global_step": 160883, "epoch": 3830} {"train_loss": -7.032954692840576, "global_step": 160884, "epoch": 3830} {"train_loss": -6.978758811950684, "global_step": 160885, "epoch": 3830} {"train_loss": -6.882690906524658, "global_step": 160886, "epoch": 3830} {"train_loss": -6.932558059692383, "global_step": 160887, "epoch": 3830} {"train_loss": -6.850969314575195, "global_step": 160888, "epoch": 3830} {"train_loss": -6.9550323486328125, "global_step": 160889, "epoch": 3830} {"train_loss": -6.872089385986328, "global_step": 160890, "epoch": 3830} {"train_loss": -6.902046203613281, "global_step": 160891, "epoch": 3830} {"train_loss": -6.939657688140869, "global_step": 160892, "epoch": 3830} {"train_loss": -6.899179935455322, "global_step": 160893, "epoch": 3830} {"train_loss": -6.996766090393066, "global_step": 160894, "epoch": 3830} {"train_loss": -6.920444488525391, "global_step": 160895, "epoch": 3830} {"train_loss": -7.0434064865112305, "global_step": 160896, "epoch": 3830} {"train_loss": -6.990063667297363, "global_step": 160897, "epoch": 3830} {"train_loss": -6.966644763946533, "global_step": 160898, "epoch": 3830} {"train_loss": -7.101229667663574, "global_step": 160899, "epoch": 3830} {"train_loss": -7.026690483093262, "global_step": 160900, "epoch": 3830} {"train_loss": -6.969832692827497, "global_step": 160901, "epoch": 3830, "val_loss": 68533.34375} {"train_loss": -6.891301155090332, "global_step": 160902, "epoch": 3831} {"train_loss": -7.004738807678223, "global_step": 160903, "epoch": 3831} {"train_loss": -6.8609466552734375, "global_step": 160904, "epoch": 3831} {"train_loss": -6.943455219268799, "global_step": 160905, "epoch": 3831} {"train_loss": -6.967411994934082, "global_step": 160906, "epoch": 3831} {"train_loss": -6.947869300842285, "global_step": 160907, "epoch": 3831} {"train_loss": -6.992623805999756, "global_step": 160908, "epoch": 3831} {"train_loss": -6.9390058517456055, "global_step": 160909, "epoch": 3831} {"train_loss": -6.804072380065918, "global_step": 160910, "epoch": 3831} {"train_loss": -6.844463348388672, "global_step": 160911, "epoch": 3831} {"train_loss": -6.92397403717041, "global_step": 160912, "epoch": 3831} {"train_loss": -6.947449207305908, "global_step": 160913, "epoch": 3831} {"train_loss": -6.917950630187988, "global_step": 160914, "epoch": 3831} {"train_loss": -7.0605621337890625, "global_step": 160915, "epoch": 3831} {"train_loss": -6.826148986816406, "global_step": 160916, "epoch": 3831} {"train_loss": -6.967564582824707, "global_step": 160917, "epoch": 3831} {"train_loss": -6.955744743347168, "global_step": 160918, "epoch": 3831} {"train_loss": -7.012172698974609, "global_step": 160919, "epoch": 3831} {"train_loss": -6.957620620727539, "global_step": 160920, "epoch": 3831} {"train_loss": -7.014596939086914, "global_step": 160921, "epoch": 3831} {"train_loss": -6.989845275878906, "global_step": 160922, "epoch": 3831} {"train_loss": -6.953866004943848, "global_step": 160923, "epoch": 3831} {"train_loss": -6.978570938110352, "global_step": 160924, "epoch": 3831} {"train_loss": -6.928162574768066, "global_step": 160925, "epoch": 3831} {"train_loss": -7.040513038635254, "global_step": 160926, "epoch": 3831} {"train_loss": -6.870290756225586, "global_step": 160927, "epoch": 3831} {"train_loss": -6.873773097991943, "global_step": 160928, "epoch": 3831} {"train_loss": -6.893355846405029, "global_step": 160929, "epoch": 3831} {"train_loss": -6.820316314697266, "global_step": 160930, "epoch": 3831} {"train_loss": -6.846893787384033, "global_step": 160931, "epoch": 3831} {"train_loss": -6.816906929016113, "global_step": 160932, "epoch": 3831} {"train_loss": -6.950808525085449, "global_step": 160933, "epoch": 3831} {"train_loss": -6.741567611694336, "global_step": 160934, "epoch": 3831} {"train_loss": -6.8238525390625, "global_step": 160935, "epoch": 3831} {"train_loss": -6.889277458190918, "global_step": 160936, "epoch": 3831} {"train_loss": -6.856790542602539, "global_step": 160937, "epoch": 3831} {"train_loss": -6.918251037597656, "global_step": 160938, "epoch": 3831} {"train_loss": -6.930490970611572, "global_step": 160939, "epoch": 3831} {"train_loss": -6.943566799163818, "global_step": 160940, "epoch": 3831} {"train_loss": -6.967852592468262, "global_step": 160941, "epoch": 3831} {"train_loss": -6.896870136260986, "global_step": 160942, "epoch": 3831} {"train_loss": -6.923114027295794, "global_step": 160943, "epoch": 3831, "val_loss": 68659.1015625} {"train_loss": -7.027950763702393, "global_step": 160944, "epoch": 3832} {"train_loss": -6.9357099533081055, "global_step": 160945, "epoch": 3832} {"train_loss": -7.049334526062012, "global_step": 160946, "epoch": 3832} {"train_loss": -6.956038475036621, "global_step": 160947, "epoch": 3832} {"train_loss": -6.9316205978393555, "global_step": 160948, "epoch": 3832} {"train_loss": -7.03322172164917, "global_step": 160949, "epoch": 3832} {"train_loss": -6.954345703125, "global_step": 160950, "epoch": 3832} {"train_loss": -7.106326103210449, "global_step": 160951, "epoch": 3832} {"train_loss": -6.946100234985352, "global_step": 160952, "epoch": 3832} {"train_loss": -6.976070404052734, "global_step": 160953, "epoch": 3832} {"train_loss": -6.919952392578125, "global_step": 160954, "epoch": 3832} {"train_loss": -7.008903503417969, "global_step": 160955, "epoch": 3832} {"train_loss": -6.907024383544922, "global_step": 160956, "epoch": 3832} {"train_loss": -6.867677211761475, "global_step": 160957, "epoch": 3832} {"train_loss": -7.101932048797607, "global_step": 160958, "epoch": 3832} {"train_loss": -6.9568023681640625, "global_step": 160959, "epoch": 3832} {"train_loss": -6.934259414672852, "global_step": 160960, "epoch": 3832} {"train_loss": -6.988927841186523, "global_step": 160961, "epoch": 3832} {"train_loss": -6.980304718017578, "global_step": 160962, "epoch": 3832} {"train_loss": -6.932211875915527, "global_step": 160963, "epoch": 3832} {"train_loss": -6.860126495361328, "global_step": 160964, "epoch": 3832} {"train_loss": -6.7906494140625, "global_step": 160965, "epoch": 3832} {"train_loss": -6.8852386474609375, "global_step": 160966, "epoch": 3832} {"train_loss": -6.9534406661987305, "global_step": 160967, "epoch": 3832} {"train_loss": -6.93867301940918, "global_step": 160968, "epoch": 3832} {"train_loss": -6.9827680587768555, "global_step": 160969, "epoch": 3832} {"train_loss": -6.962322235107422, "global_step": 160970, "epoch": 3832} {"train_loss": -7.035149097442627, "global_step": 160971, "epoch": 3832} {"train_loss": -7.0003461837768555, "global_step": 160972, "epoch": 3832} {"train_loss": -7.037172794342041, "global_step": 160973, "epoch": 3832} {"train_loss": -6.955636024475098, "global_step": 160974, "epoch": 3832} {"train_loss": -7.031192779541016, "global_step": 160975, "epoch": 3832} {"train_loss": -7.037747383117676, "global_step": 160976, "epoch": 3832} {"train_loss": -6.966423988342285, "global_step": 160977, "epoch": 3832} {"train_loss": -7.024885177612305, "global_step": 160978, "epoch": 3832} {"train_loss": -7.009881019592285, "global_step": 160979, "epoch": 3832} {"train_loss": -7.03593111038208, "global_step": 160980, "epoch": 3832} {"train_loss": -7.040922164916992, "global_step": 160981, "epoch": 3832} {"train_loss": -6.952090263366699, "global_step": 160982, "epoch": 3832} {"train_loss": -7.065617561340332, "global_step": 160983, "epoch": 3832} {"train_loss": -6.9701151847839355, "global_step": 160984, "epoch": 3832} {"train_loss": -6.9778882548922585, "global_step": 160985, "epoch": 3832, "val_loss": 68396.28125} {"train_loss": -7.038262367248535, "global_step": 160986, "epoch": 3833} {"train_loss": -6.92491340637207, "global_step": 160987, "epoch": 3833} {"train_loss": -7.114507675170898, "global_step": 160988, "epoch": 3833} {"train_loss": -7.0077385902404785, "global_step": 160989, "epoch": 3833} {"train_loss": -7.095320224761963, "global_step": 160990, "epoch": 3833} {"train_loss": -7.049537658691406, "global_step": 160991, "epoch": 3833} {"train_loss": -6.949358940124512, "global_step": 160992, "epoch": 3833} {"train_loss": -6.956711769104004, "global_step": 160993, "epoch": 3833} {"train_loss": -7.077900409698486, "global_step": 160994, "epoch": 3833} {"train_loss": -7.109005928039551, "global_step": 160995, "epoch": 3833} {"train_loss": -7.0028228759765625, "global_step": 160996, "epoch": 3833} {"train_loss": -6.983343124389648, "global_step": 160997, "epoch": 3833} {"train_loss": -7.062610626220703, "global_step": 160998, "epoch": 3833} {"train_loss": -6.856417655944824, "global_step": 160999, "epoch": 3833} {"train_loss": -6.887839317321777, "global_step": 161000, "epoch": 3833} {"train_loss": -6.994879722595215, "global_step": 161001, "epoch": 3833} {"train_loss": -6.989353179931641, "global_step": 161002, "epoch": 3833} {"train_loss": -6.853653907775879, "global_step": 161003, "epoch": 3833} {"train_loss": -6.955410003662109, "global_step": 161004, "epoch": 3833} {"train_loss": -6.955826759338379, "global_step": 161005, "epoch": 3833} {"train_loss": -6.897470474243164, "global_step": 161006, "epoch": 3833} {"train_loss": -6.8915324211120605, "global_step": 161007, "epoch": 3833} {"train_loss": -6.864131927490234, "global_step": 161008, "epoch": 3833} {"train_loss": -6.715693473815918, "global_step": 161009, "epoch": 3833} {"train_loss": -6.814321517944336, "global_step": 161010, "epoch": 3833} {"train_loss": -6.902639389038086, "global_step": 161011, "epoch": 3833} {"train_loss": -6.941677093505859, "global_step": 161012, "epoch": 3833} {"train_loss": -6.951562881469727, "global_step": 161013, "epoch": 3833} {"train_loss": -6.926807403564453, "global_step": 161014, "epoch": 3833} {"train_loss": -6.976523399353027, "global_step": 161015, "epoch": 3833} {"train_loss": -7.010167598724365, "global_step": 161016, "epoch": 3833} {"train_loss": -6.992631912231445, "global_step": 161017, "epoch": 3833} {"train_loss": -6.924764633178711, "global_step": 161018, "epoch": 3833} {"train_loss": -6.951684951782227, "global_step": 161019, "epoch": 3833} {"train_loss": -6.782323360443115, "global_step": 161020, "epoch": 3833} {"train_loss": -6.742371559143066, "global_step": 161021, "epoch": 3833} {"train_loss": -6.813838958740234, "global_step": 161022, "epoch": 3833} {"train_loss": -6.815070152282715, "global_step": 161023, "epoch": 3833} {"train_loss": -6.894430160522461, "global_step": 161024, "epoch": 3833} {"train_loss": -6.7772722244262695, "global_step": 161025, "epoch": 3833} {"train_loss": -6.7506256103515625, "global_step": 161026, "epoch": 3833} {"train_loss": -6.933537505921864, "global_step": 161027, "epoch": 3833, "val_loss": 68643.921875} {"train_loss": -6.849936485290527, "global_step": 161028, "epoch": 3834} {"train_loss": -6.91106653213501, "global_step": 161029, "epoch": 3834} {"train_loss": -6.916861534118652, "global_step": 161030, "epoch": 3834} {"train_loss": -6.7935709953308105, "global_step": 161031, "epoch": 3834} {"train_loss": -6.981295585632324, "global_step": 161032, "epoch": 3834} {"train_loss": -6.801262855529785, "global_step": 161033, "epoch": 3834} {"train_loss": -6.991109848022461, "global_step": 161034, "epoch": 3834} {"train_loss": -6.8101701736450195, "global_step": 161035, "epoch": 3834} {"train_loss": -6.928432941436768, "global_step": 161036, "epoch": 3834} {"train_loss": -6.8984375, "global_step": 161037, "epoch": 3834} {"train_loss": -6.8417510986328125, "global_step": 161038, "epoch": 3834} {"train_loss": -7.0196990966796875, "global_step": 161039, "epoch": 3834} {"train_loss": -6.915952682495117, "global_step": 161040, "epoch": 3834} {"train_loss": -6.870244979858398, "global_step": 161041, "epoch": 3834} {"train_loss": -6.979397773742676, "global_step": 161042, "epoch": 3834} {"train_loss": -7.044029712677002, "global_step": 161043, "epoch": 3834} {"train_loss": -6.98158073425293, "global_step": 161044, "epoch": 3834} {"train_loss": -7.0376482009887695, "global_step": 161045, "epoch": 3834} {"train_loss": -6.958920478820801, "global_step": 161046, "epoch": 3834} {"train_loss": -7.032506465911865, "global_step": 161047, "epoch": 3834} {"train_loss": -6.983104228973389, "global_step": 161048, "epoch": 3834} {"train_loss": -7.016242027282715, "global_step": 161049, "epoch": 3834} {"train_loss": -6.851025581359863, "global_step": 161050, "epoch": 3834} {"train_loss": -6.881475448608398, "global_step": 161051, "epoch": 3834} {"train_loss": -7.0593743324279785, "global_step": 161052, "epoch": 3834} {"train_loss": -6.900130748748779, "global_step": 161053, "epoch": 3834} {"train_loss": -7.0889177322387695, "global_step": 161054, "epoch": 3834} {"train_loss": -6.919358253479004, "global_step": 161055, "epoch": 3834} {"train_loss": -6.896681785583496, "global_step": 161056, "epoch": 3834} {"train_loss": -6.8918914794921875, "global_step": 161057, "epoch": 3834} {"train_loss": -6.899367809295654, "global_step": 161058, "epoch": 3834} {"train_loss": -6.809706211090088, "global_step": 161059, "epoch": 3834} {"train_loss": -6.922909736633301, "global_step": 161060, "epoch": 3834} {"train_loss": -6.809018135070801, "global_step": 161061, "epoch": 3834} {"train_loss": -6.856281280517578, "global_step": 161062, "epoch": 3834} {"train_loss": -6.762131690979004, "global_step": 161063, "epoch": 3834} {"train_loss": -6.896328926086426, "global_step": 161064, "epoch": 3834} {"train_loss": -6.887663841247559, "global_step": 161065, "epoch": 3834} {"train_loss": -6.981390953063965, "global_step": 161066, "epoch": 3834} {"train_loss": -6.863186836242676, "global_step": 161067, "epoch": 3834} {"train_loss": -6.922238349914551, "global_step": 161068, "epoch": 3834} {"train_loss": -6.919461602256412, "global_step": 161069, "epoch": 3834, "val_loss": 68663.46875} {"train_loss": -6.982867240905762, "global_step": 161070, "epoch": 3835} {"train_loss": -6.996406078338623, "global_step": 161071, "epoch": 3835} {"train_loss": -7.150149345397949, "global_step": 161072, "epoch": 3835} {"train_loss": -6.977747917175293, "global_step": 161073, "epoch": 3835} {"train_loss": -6.881638050079346, "global_step": 161074, "epoch": 3835} {"train_loss": -6.98312520980835, "global_step": 161075, "epoch": 3835} {"train_loss": -6.922117233276367, "global_step": 161076, "epoch": 3835} {"train_loss": -6.9636030197143555, "global_step": 161077, "epoch": 3835} {"train_loss": -6.9482574462890625, "global_step": 161078, "epoch": 3835} {"train_loss": -6.925389766693115, "global_step": 161079, "epoch": 3835} {"train_loss": -6.906017780303955, "global_step": 161080, "epoch": 3835} {"train_loss": -6.945087909698486, "global_step": 161081, "epoch": 3835} {"train_loss": -7.047756195068359, "global_step": 161082, "epoch": 3835} {"train_loss": -6.957089424133301, "global_step": 161083, "epoch": 3835} {"train_loss": -6.953269004821777, "global_step": 161084, "epoch": 3835} {"train_loss": -6.939004898071289, "global_step": 161085, "epoch": 3835} {"train_loss": -6.918889999389648, "global_step": 161086, "epoch": 3835} {"train_loss": -7.053678035736084, "global_step": 161087, "epoch": 3835} {"train_loss": -6.991237640380859, "global_step": 161088, "epoch": 3835} {"train_loss": -6.864269256591797, "global_step": 161089, "epoch": 3835} {"train_loss": -7.049266815185547, "global_step": 161090, "epoch": 3835} {"train_loss": -6.977997779846191, "global_step": 161091, "epoch": 3835} {"train_loss": -7.009941577911377, "global_step": 161092, "epoch": 3835} {"train_loss": -6.839846611022949, "global_step": 161093, "epoch": 3835} {"train_loss": -6.977980613708496, "global_step": 161094, "epoch": 3835} {"train_loss": -6.928655624389648, "global_step": 161095, "epoch": 3835} {"train_loss": -6.824331283569336, "global_step": 161096, "epoch": 3835} {"train_loss": -6.929512023925781, "global_step": 161097, "epoch": 3835} {"train_loss": -6.8815107345581055, "global_step": 161098, "epoch": 3835} {"train_loss": -6.841332912445068, "global_step": 161099, "epoch": 3835} {"train_loss": -6.931601047515869, "global_step": 161100, "epoch": 3835} {"train_loss": -6.922369956970215, "global_step": 161101, "epoch": 3835} {"train_loss": -6.927626609802246, "global_step": 161102, "epoch": 3835} {"train_loss": -6.8613176345825195, "global_step": 161103, "epoch": 3835} {"train_loss": -6.921727657318115, "global_step": 161104, "epoch": 3835} {"train_loss": -6.856812000274658, "global_step": 161105, "epoch": 3835} {"train_loss": -6.929554462432861, "global_step": 161106, "epoch": 3835} {"train_loss": -6.862303733825684, "global_step": 161107, "epoch": 3835} {"train_loss": -6.841431617736816, "global_step": 161108, "epoch": 3835} {"train_loss": -6.976562023162842, "global_step": 161109, "epoch": 3835} {"train_loss": -6.830206394195557, "global_step": 161110, "epoch": 3835} {"train_loss": -6.93589312689645, "global_step": 161111, "epoch": 3835, "val_loss": 68779.21875} {"train_loss": -6.862856388092041, "global_step": 161112, "epoch": 3836} {"train_loss": -7.014972686767578, "global_step": 161113, "epoch": 3836} {"train_loss": -6.986671447753906, "global_step": 161114, "epoch": 3836} {"train_loss": -6.876431465148926, "global_step": 161115, "epoch": 3836} {"train_loss": -6.956697463989258, "global_step": 161116, "epoch": 3836} {"train_loss": -6.938796043395996, "global_step": 161117, "epoch": 3836} {"train_loss": -6.788050651550293, "global_step": 161118, "epoch": 3836} {"train_loss": -6.88517951965332, "global_step": 161119, "epoch": 3836} {"train_loss": -6.902042388916016, "global_step": 161120, "epoch": 3836} {"train_loss": -6.866594314575195, "global_step": 161121, "epoch": 3836} {"train_loss": -7.042093276977539, "global_step": 161122, "epoch": 3836} {"train_loss": -6.829581260681152, "global_step": 161123, "epoch": 3836} {"train_loss": -6.984550952911377, "global_step": 161124, "epoch": 3836} {"train_loss": -6.806903839111328, "global_step": 161125, "epoch": 3836} {"train_loss": -6.916085720062256, "global_step": 161126, "epoch": 3836} {"train_loss": -6.8274922370910645, "global_step": 161127, "epoch": 3836} {"train_loss": -6.865708351135254, "global_step": 161128, "epoch": 3836} {"train_loss": -6.904891014099121, "global_step": 161129, "epoch": 3836} {"train_loss": -6.897245407104492, "global_step": 161130, "epoch": 3836} {"train_loss": -6.830994606018066, "global_step": 161131, "epoch": 3836} {"train_loss": -6.867010116577148, "global_step": 161132, "epoch": 3836} {"train_loss": -6.909168243408203, "global_step": 161133, "epoch": 3836} {"train_loss": -6.927860260009766, "global_step": 161134, "epoch": 3836} {"train_loss": -6.959773063659668, "global_step": 161135, "epoch": 3836} {"train_loss": -6.979554176330566, "global_step": 161136, "epoch": 3836} {"train_loss": -6.9849348068237305, "global_step": 161137, "epoch": 3836} {"train_loss": -7.0008344650268555, "global_step": 161138, "epoch": 3836} {"train_loss": -6.875359535217285, "global_step": 161139, "epoch": 3836} {"train_loss": -6.883509635925293, "global_step": 161140, "epoch": 3836} {"train_loss": -6.8934526443481445, "global_step": 161141, "epoch": 3836} {"train_loss": -6.906747341156006, "global_step": 161142, "epoch": 3836} {"train_loss": -6.987224578857422, "global_step": 161143, "epoch": 3836} {"train_loss": -6.9413275718688965, "global_step": 161144, "epoch": 3836} {"train_loss": -7.014476776123047, "global_step": 161145, "epoch": 3836} {"train_loss": -6.981764793395996, "global_step": 161146, "epoch": 3836} {"train_loss": -6.920408248901367, "global_step": 161147, "epoch": 3836} {"train_loss": -6.9940385818481445, "global_step": 161148, "epoch": 3836} {"train_loss": -6.972407341003418, "global_step": 161149, "epoch": 3836} {"train_loss": -7.054527759552002, "global_step": 161150, "epoch": 3836} {"train_loss": -6.929754257202148, "global_step": 161151, "epoch": 3836} {"train_loss": -6.986385822296143, "global_step": 161152, "epoch": 3836} {"train_loss": -6.9281026635851175, "global_step": 161153, "epoch": 3836, "val_loss": 68682.4453125} {"train_loss": -6.950986385345459, "global_step": 161154, "epoch": 3837} {"train_loss": -7.030725479125977, "global_step": 161155, "epoch": 3837} {"train_loss": -6.864646911621094, "global_step": 161156, "epoch": 3837} {"train_loss": -7.035673141479492, "global_step": 161157, "epoch": 3837} {"train_loss": -6.996397495269775, "global_step": 161158, "epoch": 3837} {"train_loss": -6.844424247741699, "global_step": 161159, "epoch": 3837} {"train_loss": -7.012617111206055, "global_step": 161160, "epoch": 3837} {"train_loss": -7.020219802856445, "global_step": 161161, "epoch": 3837} {"train_loss": -6.919493675231934, "global_step": 161162, "epoch": 3837} {"train_loss": -7.001312255859375, "global_step": 161163, "epoch": 3837} {"train_loss": -6.858673572540283, "global_step": 161164, "epoch": 3837} {"train_loss": -6.890413284301758, "global_step": 161165, "epoch": 3837} {"train_loss": -7.044073104858398, "global_step": 161166, "epoch": 3837} {"train_loss": -6.860549449920654, "global_step": 161167, "epoch": 3837} {"train_loss": -7.022172927856445, "global_step": 161168, "epoch": 3837} {"train_loss": -6.891953468322754, "global_step": 161169, "epoch": 3837} {"train_loss": -6.913178443908691, "global_step": 161170, "epoch": 3837} {"train_loss": -6.875514507293701, "global_step": 161171, "epoch": 3837} {"train_loss": -6.856756210327148, "global_step": 161172, "epoch": 3837} {"train_loss": -6.943216323852539, "global_step": 161173, "epoch": 3837} {"train_loss": -6.915596961975098, "global_step": 161174, "epoch": 3837} {"train_loss": -7.010698318481445, "global_step": 161175, "epoch": 3837} {"train_loss": -6.998081684112549, "global_step": 161176, "epoch": 3837} {"train_loss": -7.018399238586426, "global_step": 161177, "epoch": 3837} {"train_loss": -6.813528537750244, "global_step": 161178, "epoch": 3837} {"train_loss": -7.029233932495117, "global_step": 161179, "epoch": 3837} {"train_loss": -6.749323844909668, "global_step": 161180, "epoch": 3837} {"train_loss": -6.83759069442749, "global_step": 161181, "epoch": 3837} {"train_loss": -6.934482574462891, "global_step": 161182, "epoch": 3837} {"train_loss": -6.914332866668701, "global_step": 161183, "epoch": 3837} {"train_loss": -6.944404602050781, "global_step": 161184, "epoch": 3837} {"train_loss": -6.891119956970215, "global_step": 161185, "epoch": 3837} {"train_loss": -6.858551025390625, "global_step": 161186, "epoch": 3837} {"train_loss": -6.913646697998047, "global_step": 161187, "epoch": 3837} {"train_loss": -6.818869590759277, "global_step": 161188, "epoch": 3837} {"train_loss": -6.938785076141357, "global_step": 161189, "epoch": 3837} {"train_loss": -6.813333511352539, "global_step": 161190, "epoch": 3837} {"train_loss": -6.980096817016602, "global_step": 161191, "epoch": 3837} {"train_loss": -6.874017715454102, "global_step": 161192, "epoch": 3837} {"train_loss": -6.845521926879883, "global_step": 161193, "epoch": 3837} {"train_loss": -6.849797248840332, "global_step": 161194, "epoch": 3837} {"train_loss": -6.920870644705636, "global_step": 161195, "epoch": 3837, "val_loss": 68768.390625} {"train_loss": -7.02426290512085, "global_step": 161196, "epoch": 3838} {"train_loss": -6.9405131340026855, "global_step": 161197, "epoch": 3838} {"train_loss": -6.958797454833984, "global_step": 161198, "epoch": 3838} {"train_loss": -6.839860916137695, "global_step": 161199, "epoch": 3838} {"train_loss": -6.939571857452393, "global_step": 161200, "epoch": 3838} {"train_loss": -6.977826118469238, "global_step": 161201, "epoch": 3838} {"train_loss": -7.000777721405029, "global_step": 161202, "epoch": 3838} {"train_loss": -6.932812690734863, "global_step": 161203, "epoch": 3838} {"train_loss": -6.936534881591797, "global_step": 161204, "epoch": 3838} {"train_loss": -6.9631876945495605, "global_step": 161205, "epoch": 3838} {"train_loss": -6.934325218200684, "global_step": 161206, "epoch": 3838} {"train_loss": -6.9301300048828125, "global_step": 161207, "epoch": 3838} {"train_loss": -6.805239677429199, "global_step": 161208, "epoch": 3838} {"train_loss": -7.002372741699219, "global_step": 161209, "epoch": 3838} {"train_loss": -6.864101409912109, "global_step": 161210, "epoch": 3838} {"train_loss": -7.021484375, "global_step": 161211, "epoch": 3838} {"train_loss": -6.933592796325684, "global_step": 161212, "epoch": 3838} {"train_loss": -6.934852123260498, "global_step": 161213, "epoch": 3838} {"train_loss": -7.046460151672363, "global_step": 161214, "epoch": 3838} {"train_loss": -7.008406639099121, "global_step": 161215, "epoch": 3838} {"train_loss": -6.948202133178711, "global_step": 161216, "epoch": 3838} {"train_loss": -7.070149898529053, "global_step": 161217, "epoch": 3838} {"train_loss": -6.960066318511963, "global_step": 161218, "epoch": 3838} {"train_loss": -6.99896240234375, "global_step": 161219, "epoch": 3838} {"train_loss": -7.043778419494629, "global_step": 161220, "epoch": 3838} {"train_loss": -6.95113468170166, "global_step": 161221, "epoch": 3838} {"train_loss": -7.011046409606934, "global_step": 161222, "epoch": 3838} {"train_loss": -7.045004844665527, "global_step": 161223, "epoch": 3838} {"train_loss": -7.027040004730225, "global_step": 161224, "epoch": 3838} {"train_loss": -7.011462211608887, "global_step": 161225, "epoch": 3838} {"train_loss": -6.938476085662842, "global_step": 161226, "epoch": 3838} {"train_loss": -7.0203142166137695, "global_step": 161227, "epoch": 3838} {"train_loss": -7.01912260055542, "global_step": 161228, "epoch": 3838} {"train_loss": -6.921978950500488, "global_step": 161229, "epoch": 3838} {"train_loss": -7.008615493774414, "global_step": 161230, "epoch": 3838} {"train_loss": -6.980988025665283, "global_step": 161231, "epoch": 3838} {"train_loss": -7.062999725341797, "global_step": 161232, "epoch": 3838} {"train_loss": -6.989086151123047, "global_step": 161233, "epoch": 3838} {"train_loss": -7.041520118713379, "global_step": 161234, "epoch": 3838} {"train_loss": -7.043798446655273, "global_step": 161235, "epoch": 3838} {"train_loss": -6.975270748138428, "global_step": 161236, "epoch": 3838} {"train_loss": -6.976067338671003, "global_step": 161237, "epoch": 3838, "val_loss": 68517.4375} {"train_loss": -7.125756740570068, "global_step": 161238, "epoch": 3839} {"train_loss": -7.06442928314209, "global_step": 161239, "epoch": 3839} {"train_loss": -7.071588516235352, "global_step": 161240, "epoch": 3839} {"train_loss": -7.04698371887207, "global_step": 161241, "epoch": 3839} {"train_loss": -7.0503315925598145, "global_step": 161242, "epoch": 3839} {"train_loss": -6.937192440032959, "global_step": 161243, "epoch": 3839} {"train_loss": -7.113117694854736, "global_step": 161244, "epoch": 3839} {"train_loss": -6.981510639190674, "global_step": 161245, "epoch": 3839} {"train_loss": -7.030091285705566, "global_step": 161246, "epoch": 3839} {"train_loss": -7.085301399230957, "global_step": 161247, "epoch": 3839} {"train_loss": -7.069730281829834, "global_step": 161248, "epoch": 3839} {"train_loss": -7.0485382080078125, "global_step": 161249, "epoch": 3839} {"train_loss": -7.079139709472656, "global_step": 161250, "epoch": 3839} {"train_loss": -6.940326690673828, "global_step": 161251, "epoch": 3839} {"train_loss": -7.049391269683838, "global_step": 161252, "epoch": 3839} {"train_loss": -6.990077018737793, "global_step": 161253, "epoch": 3839} {"train_loss": -7.08351993560791, "global_step": 161254, "epoch": 3839} {"train_loss": -7.021310806274414, "global_step": 161255, "epoch": 3839} {"train_loss": -6.986969947814941, "global_step": 161256, "epoch": 3839} {"train_loss": -7.018315315246582, "global_step": 161257, "epoch": 3839} {"train_loss": -7.043521404266357, "global_step": 161258, "epoch": 3839} {"train_loss": -6.934833526611328, "global_step": 161259, "epoch": 3839} {"train_loss": -7.036686420440674, "global_step": 161260, "epoch": 3839} {"train_loss": -6.955880165100098, "global_step": 161261, "epoch": 3839} {"train_loss": -6.957302093505859, "global_step": 161262, "epoch": 3839} {"train_loss": -6.989377975463867, "global_step": 161263, "epoch": 3839} {"train_loss": -6.916351318359375, "global_step": 161264, "epoch": 3839} {"train_loss": -6.95827054977417, "global_step": 161265, "epoch": 3839} {"train_loss": -6.905335903167725, "global_step": 161266, "epoch": 3839} {"train_loss": -6.953102111816406, "global_step": 161267, "epoch": 3839} {"train_loss": -7.017457008361816, "global_step": 161268, "epoch": 3839} {"train_loss": -6.940049648284912, "global_step": 161269, "epoch": 3839} {"train_loss": -7.039718151092529, "global_step": 161270, "epoch": 3839} {"train_loss": -7.051736831665039, "global_step": 161271, "epoch": 3839} {"train_loss": -6.993722915649414, "global_step": 161272, "epoch": 3839} {"train_loss": -6.929427146911621, "global_step": 161273, "epoch": 3839} {"train_loss": -7.052613258361816, "global_step": 161274, "epoch": 3839} {"train_loss": -7.01092529296875, "global_step": 161275, "epoch": 3839} {"train_loss": -6.947548866271973, "global_step": 161276, "epoch": 3839} {"train_loss": -7.096900939941406, "global_step": 161277, "epoch": 3839} {"train_loss": -6.982174873352051, "global_step": 161278, "epoch": 3839} {"train_loss": -7.014118626004174, "global_step": 161279, "epoch": 3839, "val_loss": 68666.78125} {"train_loss": -6.9754638671875, "global_step": 161280, "epoch": 3840} {"train_loss": -7.0174126625061035, "global_step": 161281, "epoch": 3840} {"train_loss": -6.847831726074219, "global_step": 161282, "epoch": 3840} {"train_loss": -6.877224922180176, "global_step": 161283, "epoch": 3840} {"train_loss": -6.979048252105713, "global_step": 161284, "epoch": 3840} {"train_loss": -7.100898742675781, "global_step": 161285, "epoch": 3840} {"train_loss": -6.971372604370117, "global_step": 161286, "epoch": 3840} {"train_loss": -6.9187331199646, "global_step": 161287, "epoch": 3840} {"train_loss": -6.880865097045898, "global_step": 161288, "epoch": 3840} {"train_loss": -6.911250591278076, "global_step": 161289, "epoch": 3840} {"train_loss": -7.026445388793945, "global_step": 161290, "epoch": 3840} {"train_loss": -7.035721778869629, "global_step": 161291, "epoch": 3840} {"train_loss": -7.036982536315918, "global_step": 161292, "epoch": 3840} {"train_loss": -6.966564178466797, "global_step": 161293, "epoch": 3840} {"train_loss": -7.035395622253418, "global_step": 161294, "epoch": 3840} {"train_loss": -6.907723903656006, "global_step": 161295, "epoch": 3840} {"train_loss": -7.049901008605957, "global_step": 161296, "epoch": 3840} {"train_loss": -7.018919944763184, "global_step": 161297, "epoch": 3840} {"train_loss": -6.925662994384766, "global_step": 161298, "epoch": 3840} {"train_loss": -6.890185832977295, "global_step": 161299, "epoch": 3840} {"train_loss": -6.959278583526611, "global_step": 161300, "epoch": 3840} {"train_loss": -6.923820495605469, "global_step": 161301, "epoch": 3840} {"train_loss": -6.921736240386963, "global_step": 161302, "epoch": 3840} {"train_loss": -6.966148853302002, "global_step": 161303, "epoch": 3840} {"train_loss": -6.951584815979004, "global_step": 161304, "epoch": 3840} {"train_loss": -6.902264595031738, "global_step": 161305, "epoch": 3840} {"train_loss": -7.04710578918457, "global_step": 161306, "epoch": 3840} {"train_loss": -6.985440254211426, "global_step": 161307, "epoch": 3840} {"train_loss": -6.999086856842041, "global_step": 161308, "epoch": 3840} {"train_loss": -7.047072410583496, "global_step": 161309, "epoch": 3840} {"train_loss": -7.0047712326049805, "global_step": 161310, "epoch": 3840} {"train_loss": -6.8709516525268555, "global_step": 161311, "epoch": 3840} {"train_loss": -7.051098823547363, "global_step": 161312, "epoch": 3840} {"train_loss": -6.862325191497803, "global_step": 161313, "epoch": 3840} {"train_loss": -6.897662162780762, "global_step": 161314, "epoch": 3840} {"train_loss": -7.007975101470947, "global_step": 161315, "epoch": 3840} {"train_loss": -7.082561492919922, "global_step": 161316, "epoch": 3840} {"train_loss": -6.948770046234131, "global_step": 161317, "epoch": 3840} {"train_loss": -6.9426774978637695, "global_step": 161318, "epoch": 3840} {"train_loss": -6.987261772155762, "global_step": 161319, "epoch": 3840} {"train_loss": -6.884490013122559, "global_step": 161320, "epoch": 3840} {"train_loss": -6.964734997068133, "global_step": 161321, "epoch": 3840, "val_loss": 68571.8125} {"train_loss": -6.8895063400268555, "global_step": 161322, "epoch": 3841} {"train_loss": -6.825304985046387, "global_step": 161323, "epoch": 3841} {"train_loss": -6.999098777770996, "global_step": 161324, "epoch": 3841} {"train_loss": -6.783854961395264, "global_step": 161325, "epoch": 3841} {"train_loss": -7.041247367858887, "global_step": 161326, "epoch": 3841} {"train_loss": -6.786447525024414, "global_step": 161327, "epoch": 3841} {"train_loss": -6.720385551452637, "global_step": 161328, "epoch": 3841} {"train_loss": -6.900371074676514, "global_step": 161329, "epoch": 3841} {"train_loss": -6.869075775146484, "global_step": 161330, "epoch": 3841} {"train_loss": -6.812082290649414, "global_step": 161331, "epoch": 3841} {"train_loss": -6.8972697257995605, "global_step": 161332, "epoch": 3841} {"train_loss": -6.982735633850098, "global_step": 161333, "epoch": 3841} {"train_loss": -6.757800102233887, "global_step": 161334, "epoch": 3841} {"train_loss": -6.8554558753967285, "global_step": 161335, "epoch": 3841} {"train_loss": -6.894553184509277, "global_step": 161336, "epoch": 3841} {"train_loss": -6.781911373138428, "global_step": 161337, "epoch": 3841} {"train_loss": -6.848177909851074, "global_step": 161338, "epoch": 3841} {"train_loss": -6.76273250579834, "global_step": 161339, "epoch": 3841} {"train_loss": -7.019284248352051, "global_step": 161340, "epoch": 3841} {"train_loss": -6.886070251464844, "global_step": 161341, "epoch": 3841} {"train_loss": -6.923786163330078, "global_step": 161342, "epoch": 3841} {"train_loss": -6.860003471374512, "global_step": 161343, "epoch": 3841} {"train_loss": -6.844079971313477, "global_step": 161344, "epoch": 3841} {"train_loss": -6.919528007507324, "global_step": 161345, "epoch": 3841} {"train_loss": -6.799197196960449, "global_step": 161346, "epoch": 3841} {"train_loss": -6.94047212600708, "global_step": 161347, "epoch": 3841} {"train_loss": -6.90981388092041, "global_step": 161348, "epoch": 3841} {"train_loss": -6.964061737060547, "global_step": 161349, "epoch": 3841} {"train_loss": -6.796769618988037, "global_step": 161350, "epoch": 3841} {"train_loss": -7.012031555175781, "global_step": 161351, "epoch": 3841} {"train_loss": -6.933096885681152, "global_step": 161352, "epoch": 3841} {"train_loss": -6.899328231811523, "global_step": 161353, "epoch": 3841} {"train_loss": -6.988348007202148, "global_step": 161354, "epoch": 3841} {"train_loss": -6.925902366638184, "global_step": 161355, "epoch": 3841} {"train_loss": -6.983436584472656, "global_step": 161356, "epoch": 3841} {"train_loss": -7.00204610824585, "global_step": 161357, "epoch": 3841} {"train_loss": -6.964231491088867, "global_step": 161358, "epoch": 3841} {"train_loss": -7.003517150878906, "global_step": 161359, "epoch": 3841} {"train_loss": -6.979891777038574, "global_step": 161360, "epoch": 3841} {"train_loss": -6.991944313049316, "global_step": 161361, "epoch": 3841} {"train_loss": -6.999420166015625, "global_step": 161362, "epoch": 3841} {"train_loss": -6.899728809084211, "global_step": 161363, "epoch": 3841, "val_loss": 68472.1640625} {"train_loss": -7.133177280426025, "global_step": 161364, "epoch": 3842} {"train_loss": -6.811649799346924, "global_step": 161365, "epoch": 3842} {"train_loss": -6.919160842895508, "global_step": 161366, "epoch": 3842} {"train_loss": -7.00877571105957, "global_step": 161367, "epoch": 3842} {"train_loss": -6.931327819824219, "global_step": 161368, "epoch": 3842} {"train_loss": -6.891896724700928, "global_step": 161369, "epoch": 3842} {"train_loss": -6.954129219055176, "global_step": 161370, "epoch": 3842} {"train_loss": -6.896665573120117, "global_step": 161371, "epoch": 3842} {"train_loss": -6.854954719543457, "global_step": 161372, "epoch": 3842} {"train_loss": -6.974396705627441, "global_step": 161373, "epoch": 3842} {"train_loss": -6.954128742218018, "global_step": 161374, "epoch": 3842} {"train_loss": -7.023292064666748, "global_step": 161375, "epoch": 3842} {"train_loss": -6.921816349029541, "global_step": 161376, "epoch": 3842} {"train_loss": -6.928752899169922, "global_step": 161377, "epoch": 3842} {"train_loss": -7.002419948577881, "global_step": 161378, "epoch": 3842} {"train_loss": -7.071498870849609, "global_step": 161379, "epoch": 3842} {"train_loss": -6.8521223068237305, "global_step": 161380, "epoch": 3842} {"train_loss": -7.014822959899902, "global_step": 161381, "epoch": 3842} {"train_loss": -6.944221496582031, "global_step": 161382, "epoch": 3842} {"train_loss": -6.961979389190674, "global_step": 161383, "epoch": 3842} {"train_loss": -6.859526634216309, "global_step": 161384, "epoch": 3842} {"train_loss": -6.894946098327637, "global_step": 161385, "epoch": 3842} {"train_loss": -6.932730674743652, "global_step": 161386, "epoch": 3842} {"train_loss": -6.921967506408691, "global_step": 161387, "epoch": 3842} {"train_loss": -6.902239799499512, "global_step": 161388, "epoch": 3842} {"train_loss": -7.056727409362793, "global_step": 161389, "epoch": 3842} {"train_loss": -6.9686126708984375, "global_step": 161390, "epoch": 3842} {"train_loss": -6.853792667388916, "global_step": 161391, "epoch": 3842} {"train_loss": -6.909631729125977, "global_step": 161392, "epoch": 3842} {"train_loss": -6.918645858764648, "global_step": 161393, "epoch": 3842} {"train_loss": -7.060571670532227, "global_step": 161394, "epoch": 3842} {"train_loss": -6.954180717468262, "global_step": 161395, "epoch": 3842} {"train_loss": -6.917025566101074, "global_step": 161396, "epoch": 3842} {"train_loss": -6.854007720947266, "global_step": 161397, "epoch": 3842} {"train_loss": -6.895115852355957, "global_step": 161398, "epoch": 3842} {"train_loss": -6.927697658538818, "global_step": 161399, "epoch": 3842} {"train_loss": -6.833963394165039, "global_step": 161400, "epoch": 3842} {"train_loss": -7.010588645935059, "global_step": 161401, "epoch": 3842} {"train_loss": -6.831057071685791, "global_step": 161402, "epoch": 3842} {"train_loss": -6.909411430358887, "global_step": 161403, "epoch": 3842} {"train_loss": -6.935361862182617, "global_step": 161404, "epoch": 3842} {"train_loss": -6.937558503378005, "global_step": 161405, "epoch": 3842, "val_loss": 68651.9609375} {"train_loss": -6.924613952636719, "global_step": 161406, "epoch": 3843} {"train_loss": -6.833957672119141, "global_step": 161407, "epoch": 3843} {"train_loss": -6.8688435554504395, "global_step": 161408, "epoch": 3843} {"train_loss": -6.955532550811768, "global_step": 161409, "epoch": 3843} {"train_loss": -6.940977573394775, "global_step": 161410, "epoch": 3843} {"train_loss": -7.008889198303223, "global_step": 161411, "epoch": 3843} {"train_loss": -6.940391540527344, "global_step": 161412, "epoch": 3843} {"train_loss": -7.046266555786133, "global_step": 161413, "epoch": 3843} {"train_loss": -6.947652339935303, "global_step": 161414, "epoch": 3843} {"train_loss": -6.803673267364502, "global_step": 161415, "epoch": 3843} {"train_loss": -6.915554046630859, "global_step": 161416, "epoch": 3843} {"train_loss": -7.028041839599609, "global_step": 161417, "epoch": 3843} {"train_loss": -7.031639099121094, "global_step": 161418, "epoch": 3843} {"train_loss": -6.911390781402588, "global_step": 161419, "epoch": 3843} {"train_loss": -6.854610443115234, "global_step": 161420, "epoch": 3843} {"train_loss": -7.0498223304748535, "global_step": 161421, "epoch": 3843} {"train_loss": -6.952683448791504, "global_step": 161422, "epoch": 3843} {"train_loss": -6.957187175750732, "global_step": 161423, "epoch": 3843} {"train_loss": -6.9899678230285645, "global_step": 161424, "epoch": 3843} {"train_loss": -6.965676307678223, "global_step": 161425, "epoch": 3843} {"train_loss": -7.0001935958862305, "global_step": 161426, "epoch": 3843} {"train_loss": -7.033908843994141, "global_step": 161427, "epoch": 3843} {"train_loss": -6.984502792358398, "global_step": 161428, "epoch": 3843} {"train_loss": -6.951015472412109, "global_step": 161429, "epoch": 3843} {"train_loss": -6.9241719245910645, "global_step": 161430, "epoch": 3843} {"train_loss": -6.920724868774414, "global_step": 161431, "epoch": 3843} {"train_loss": -6.7489213943481445, "global_step": 161432, "epoch": 3843} {"train_loss": -7.022252082824707, "global_step": 161433, "epoch": 3843} {"train_loss": -7.004726409912109, "global_step": 161434, "epoch": 3843} {"train_loss": -7.071664810180664, "global_step": 161435, "epoch": 3843} {"train_loss": -7.035219669342041, "global_step": 161436, "epoch": 3843} {"train_loss": -6.850716590881348, "global_step": 161437, "epoch": 3843} {"train_loss": -6.898769378662109, "global_step": 161438, "epoch": 3843} {"train_loss": -6.973760604858398, "global_step": 161439, "epoch": 3843} {"train_loss": -6.96335506439209, "global_step": 161440, "epoch": 3843} {"train_loss": -6.889189720153809, "global_step": 161441, "epoch": 3843} {"train_loss": -7.0210280418396, "global_step": 161442, "epoch": 3843} {"train_loss": -6.9204487800598145, "global_step": 161443, "epoch": 3843} {"train_loss": -6.9899678230285645, "global_step": 161444, "epoch": 3843} {"train_loss": -7.028623104095459, "global_step": 161445, "epoch": 3843} {"train_loss": -6.887111663818359, "global_step": 161446, "epoch": 3843} {"train_loss": -6.952714136668614, "global_step": 161447, "epoch": 3843, "val_loss": 68604.375} {"train_loss": -6.933324813842773, "global_step": 161448, "epoch": 3844} {"train_loss": -6.9539995193481445, "global_step": 161449, "epoch": 3844} {"train_loss": -7.042048454284668, "global_step": 161450, "epoch": 3844} {"train_loss": -6.939922332763672, "global_step": 161451, "epoch": 3844} {"train_loss": -6.842794418334961, "global_step": 161452, "epoch": 3844} {"train_loss": -6.965376853942871, "global_step": 161453, "epoch": 3844} {"train_loss": -6.813034534454346, "global_step": 161454, "epoch": 3844} {"train_loss": -6.907193183898926, "global_step": 161455, "epoch": 3844} {"train_loss": -6.97686243057251, "global_step": 161456, "epoch": 3844} {"train_loss": -6.9072136878967285, "global_step": 161457, "epoch": 3844} {"train_loss": -7.058882236480713, "global_step": 161458, "epoch": 3844} {"train_loss": -6.949457168579102, "global_step": 161459, "epoch": 3844} {"train_loss": -6.911733627319336, "global_step": 161460, "epoch": 3844} {"train_loss": -6.87946891784668, "global_step": 161461, "epoch": 3844} {"train_loss": -6.901828289031982, "global_step": 161462, "epoch": 3844} {"train_loss": -7.020529747009277, "global_step": 161463, "epoch": 3844} {"train_loss": -6.989696025848389, "global_step": 161464, "epoch": 3844} {"train_loss": -6.901283264160156, "global_step": 161465, "epoch": 3844} {"train_loss": -6.999152183532715, "global_step": 161466, "epoch": 3844} {"train_loss": -6.930079460144043, "global_step": 161467, "epoch": 3844} {"train_loss": -6.99698543548584, "global_step": 161468, "epoch": 3844} {"train_loss": -6.899727821350098, "global_step": 161469, "epoch": 3844} {"train_loss": -6.992879867553711, "global_step": 161470, "epoch": 3844} {"train_loss": -7.054057598114014, "global_step": 161471, "epoch": 3844} {"train_loss": -6.915299892425537, "global_step": 161472, "epoch": 3844} {"train_loss": -6.91344690322876, "global_step": 161473, "epoch": 3844} {"train_loss": -6.964486122131348, "global_step": 161474, "epoch": 3844} {"train_loss": -6.973106384277344, "global_step": 161475, "epoch": 3844} {"train_loss": -6.981453895568848, "global_step": 161476, "epoch": 3844} {"train_loss": -6.822519302368164, "global_step": 161477, "epoch": 3844} {"train_loss": -7.010148525238037, "global_step": 161478, "epoch": 3844} {"train_loss": -6.900137901306152, "global_step": 161479, "epoch": 3844} {"train_loss": -6.9727277755737305, "global_step": 161480, "epoch": 3844} {"train_loss": -6.994685173034668, "global_step": 161481, "epoch": 3844} {"train_loss": -6.98554801940918, "global_step": 161482, "epoch": 3844} {"train_loss": -7.034689903259277, "global_step": 161483, "epoch": 3844} {"train_loss": -6.989819526672363, "global_step": 161484, "epoch": 3844} {"train_loss": -6.986760139465332, "global_step": 161485, "epoch": 3844} {"train_loss": -6.957180023193359, "global_step": 161486, "epoch": 3844} {"train_loss": -6.980582237243652, "global_step": 161487, "epoch": 3844} {"train_loss": -6.913271427154541, "global_step": 161488, "epoch": 3844} {"train_loss": -6.95127180644444, "global_step": 161489, "epoch": 3844, "val_loss": 68639.2578125} {"train_loss": -6.975198745727539, "global_step": 161490, "epoch": 3845} {"train_loss": -7.021209716796875, "global_step": 161491, "epoch": 3845} {"train_loss": -6.983133316040039, "global_step": 161492, "epoch": 3845} {"train_loss": -6.912105560302734, "global_step": 161493, "epoch": 3845} {"train_loss": -6.91971492767334, "global_step": 161494, "epoch": 3845} {"train_loss": -7.012704849243164, "global_step": 161495, "epoch": 3845} {"train_loss": -6.977583885192871, "global_step": 161496, "epoch": 3845} {"train_loss": -6.981740951538086, "global_step": 161497, "epoch": 3845} {"train_loss": -6.981996536254883, "global_step": 161498, "epoch": 3845} {"train_loss": -7.035443305969238, "global_step": 161499, "epoch": 3845} {"train_loss": -6.980712890625, "global_step": 161500, "epoch": 3845} {"train_loss": -6.967134952545166, "global_step": 161501, "epoch": 3845} {"train_loss": -7.002213954925537, "global_step": 161502, "epoch": 3845} {"train_loss": -6.910698890686035, "global_step": 161503, "epoch": 3845} {"train_loss": -7.003137588500977, "global_step": 161504, "epoch": 3845} {"train_loss": -7.009742736816406, "global_step": 161505, "epoch": 3845} {"train_loss": -6.916136264801025, "global_step": 161506, "epoch": 3845} {"train_loss": -6.930403709411621, "global_step": 161507, "epoch": 3845} {"train_loss": -6.849481582641602, "global_step": 161508, "epoch": 3845} {"train_loss": -7.045212268829346, "global_step": 161509, "epoch": 3845} {"train_loss": -6.902496337890625, "global_step": 161510, "epoch": 3845} {"train_loss": -7.008472919464111, "global_step": 161511, "epoch": 3845} {"train_loss": -6.951417922973633, "global_step": 161512, "epoch": 3845} {"train_loss": -6.969803810119629, "global_step": 161513, "epoch": 3845} {"train_loss": -7.052802562713623, "global_step": 161514, "epoch": 3845} {"train_loss": -6.847064971923828, "global_step": 161515, "epoch": 3845} {"train_loss": -6.928539276123047, "global_step": 161516, "epoch": 3845} {"train_loss": -7.019023895263672, "global_step": 161517, "epoch": 3845} {"train_loss": -6.9902801513671875, "global_step": 161518, "epoch": 3845} {"train_loss": -7.024102210998535, "global_step": 161519, "epoch": 3845} {"train_loss": -6.975975036621094, "global_step": 161520, "epoch": 3845} {"train_loss": -6.808355331420898, "global_step": 161521, "epoch": 3845} {"train_loss": -6.9432830810546875, "global_step": 161522, "epoch": 3845} {"train_loss": -6.995566368103027, "global_step": 161523, "epoch": 3845} {"train_loss": -6.977949142456055, "global_step": 161524, "epoch": 3845} {"train_loss": -6.896990776062012, "global_step": 161525, "epoch": 3845} {"train_loss": -6.956254959106445, "global_step": 161526, "epoch": 3845} {"train_loss": -6.936990737915039, "global_step": 161527, "epoch": 3845} {"train_loss": -6.969799518585205, "global_step": 161528, "epoch": 3845} {"train_loss": -6.989988327026367, "global_step": 161529, "epoch": 3845} {"train_loss": -6.950272560119629, "global_step": 161530, "epoch": 3845} {"train_loss": -6.962744724182856, "global_step": 161531, "epoch": 3845, "val_loss": 68688.234375} {"train_loss": -7.108500957489014, "global_step": 161532, "epoch": 3846} {"train_loss": -7.068995475769043, "global_step": 161533, "epoch": 3846} {"train_loss": -6.985100746154785, "global_step": 161534, "epoch": 3846} {"train_loss": -7.0617899894714355, "global_step": 161535, "epoch": 3846} {"train_loss": -6.920567989349365, "global_step": 161536, "epoch": 3846} {"train_loss": -6.970395088195801, "global_step": 161537, "epoch": 3846} {"train_loss": -7.038614273071289, "global_step": 161538, "epoch": 3846} {"train_loss": -6.8766632080078125, "global_step": 161539, "epoch": 3846} {"train_loss": -6.949883937835693, "global_step": 161540, "epoch": 3846} {"train_loss": -6.974678039550781, "global_step": 161541, "epoch": 3846} {"train_loss": -6.956099510192871, "global_step": 161542, "epoch": 3846} {"train_loss": -6.998697280883789, "global_step": 161543, "epoch": 3846} {"train_loss": -7.015178680419922, "global_step": 161544, "epoch": 3846} {"train_loss": -6.888372421264648, "global_step": 161545, "epoch": 3846} {"train_loss": -6.9737114906311035, "global_step": 161546, "epoch": 3846} {"train_loss": -7.021538734436035, "global_step": 161547, "epoch": 3846} {"train_loss": -6.96849250793457, "global_step": 161548, "epoch": 3846} {"train_loss": -7.022980690002441, "global_step": 161549, "epoch": 3846} {"train_loss": -6.956932067871094, "global_step": 161550, "epoch": 3846} {"train_loss": -7.089972972869873, "global_step": 161551, "epoch": 3846} {"train_loss": -6.895936012268066, "global_step": 161552, "epoch": 3846} {"train_loss": -7.075935363769531, "global_step": 161553, "epoch": 3846} {"train_loss": -7.039830207824707, "global_step": 161554, "epoch": 3846} {"train_loss": -6.922611236572266, "global_step": 161555, "epoch": 3846} {"train_loss": -6.977189540863037, "global_step": 161556, "epoch": 3846} {"train_loss": -6.928426742553711, "global_step": 161557, "epoch": 3846} {"train_loss": -6.799568176269531, "global_step": 161558, "epoch": 3846} {"train_loss": -6.96353006362915, "global_step": 161559, "epoch": 3846} {"train_loss": -6.979327201843262, "global_step": 161560, "epoch": 3846} {"train_loss": -6.917185306549072, "global_step": 161561, "epoch": 3846} {"train_loss": -6.917358875274658, "global_step": 161562, "epoch": 3846} {"train_loss": -6.85360050201416, "global_step": 161563, "epoch": 3846} {"train_loss": -6.986392498016357, "global_step": 161564, "epoch": 3846} {"train_loss": -6.696379661560059, "global_step": 161565, "epoch": 3846} {"train_loss": -6.920105934143066, "global_step": 161566, "epoch": 3846} {"train_loss": -6.757881164550781, "global_step": 161567, "epoch": 3846} {"train_loss": -6.936687469482422, "global_step": 161568, "epoch": 3846} {"train_loss": -6.788702487945557, "global_step": 161569, "epoch": 3846} {"train_loss": -6.866245746612549, "global_step": 161570, "epoch": 3846} {"train_loss": -6.829899787902832, "global_step": 161571, "epoch": 3846} {"train_loss": -6.823349475860596, "global_step": 161572, "epoch": 3846} {"train_loss": -6.946840184075492, "global_step": 161573, "epoch": 3846, "val_loss": 68667.1953125} {"train_loss": -6.759016036987305, "global_step": 161574, "epoch": 3847} {"train_loss": -6.864136695861816, "global_step": 161575, "epoch": 3847} {"train_loss": -6.932435989379883, "global_step": 161576, "epoch": 3847} {"train_loss": -6.964818000793457, "global_step": 161577, "epoch": 3847} {"train_loss": -7.045041084289551, "global_step": 161578, "epoch": 3847} {"train_loss": -6.987404823303223, "global_step": 161579, "epoch": 3847} {"train_loss": -6.958475112915039, "global_step": 161580, "epoch": 3847} {"train_loss": -6.9443745613098145, "global_step": 161581, "epoch": 3847} {"train_loss": -6.93206787109375, "global_step": 161582, "epoch": 3847} {"train_loss": -6.917794227600098, "global_step": 161583, "epoch": 3847} {"train_loss": -7.026274681091309, "global_step": 161584, "epoch": 3847} {"train_loss": -6.992565155029297, "global_step": 161585, "epoch": 3847} {"train_loss": -6.991066932678223, "global_step": 161586, "epoch": 3847} {"train_loss": -7.027351379394531, "global_step": 161587, "epoch": 3847} {"train_loss": -6.970106601715088, "global_step": 161588, "epoch": 3847} {"train_loss": -7.018558025360107, "global_step": 161589, "epoch": 3847} {"train_loss": -7.050104141235352, "global_step": 161590, "epoch": 3847} {"train_loss": -7.050114154815674, "global_step": 161591, "epoch": 3847} {"train_loss": -6.8923492431640625, "global_step": 161592, "epoch": 3847} {"train_loss": -7.012959957122803, "global_step": 161593, "epoch": 3847} {"train_loss": -6.992422103881836, "global_step": 161594, "epoch": 3847} {"train_loss": -6.950232982635498, "global_step": 161595, "epoch": 3847} {"train_loss": -6.975478172302246, "global_step": 161596, "epoch": 3847} {"train_loss": -7.112595558166504, "global_step": 161597, "epoch": 3847} {"train_loss": -7.021413803100586, "global_step": 161598, "epoch": 3847} {"train_loss": -6.988589763641357, "global_step": 161599, "epoch": 3847} {"train_loss": -6.987240791320801, "global_step": 161600, "epoch": 3847} {"train_loss": -7.037137031555176, "global_step": 161601, "epoch": 3847} {"train_loss": -7.095713138580322, "global_step": 161602, "epoch": 3847} {"train_loss": -6.933032512664795, "global_step": 161603, "epoch": 3847} {"train_loss": -7.010924339294434, "global_step": 161604, "epoch": 3847} {"train_loss": -6.942497253417969, "global_step": 161605, "epoch": 3847} {"train_loss": -6.939422607421875, "global_step": 161606, "epoch": 3847} {"train_loss": -7.010180473327637, "global_step": 161607, "epoch": 3847} {"train_loss": -6.950571060180664, "global_step": 161608, "epoch": 3847} {"train_loss": -6.878913879394531, "global_step": 161609, "epoch": 3847} {"train_loss": -6.953174591064453, "global_step": 161610, "epoch": 3847} {"train_loss": -7.003630638122559, "global_step": 161611, "epoch": 3847} {"train_loss": -6.898746490478516, "global_step": 161612, "epoch": 3847} {"train_loss": -6.957575798034668, "global_step": 161613, "epoch": 3847} {"train_loss": -6.9942779541015625, "global_step": 161614, "epoch": 3847} {"train_loss": -6.976014455159505, "global_step": 161615, "epoch": 3847, "val_loss": 68633.1640625} {"train_loss": -7.1065993309021, "global_step": 161616, "epoch": 3848} {"train_loss": -6.88908576965332, "global_step": 161617, "epoch": 3848} {"train_loss": -7.021900653839111, "global_step": 161618, "epoch": 3848} {"train_loss": -6.865461349487305, "global_step": 161619, "epoch": 3848} {"train_loss": -6.983672142028809, "global_step": 161620, "epoch": 3848} {"train_loss": -6.91286563873291, "global_step": 161621, "epoch": 3848} {"train_loss": -6.905311584472656, "global_step": 161622, "epoch": 3848} {"train_loss": -7.009284973144531, "global_step": 161623, "epoch": 3848} {"train_loss": -6.880610942840576, "global_step": 161624, "epoch": 3848} {"train_loss": -6.886364459991455, "global_step": 161625, "epoch": 3848} {"train_loss": -7.007240295410156, "global_step": 161626, "epoch": 3848} {"train_loss": -6.864184379577637, "global_step": 161627, "epoch": 3848} {"train_loss": -6.8707275390625, "global_step": 161628, "epoch": 3848} {"train_loss": -6.881508827209473, "global_step": 161629, "epoch": 3848} {"train_loss": -6.912908554077148, "global_step": 161630, "epoch": 3848} {"train_loss": -6.826365947723389, "global_step": 161631, "epoch": 3848} {"train_loss": -6.875510215759277, "global_step": 161632, "epoch": 3848} {"train_loss": -6.871580600738525, "global_step": 161633, "epoch": 3848} {"train_loss": -6.854015350341797, "global_step": 161634, "epoch": 3848} {"train_loss": -6.874899864196777, "global_step": 161635, "epoch": 3848} {"train_loss": -6.928857326507568, "global_step": 161636, "epoch": 3848} {"train_loss": -6.963014602661133, "global_step": 161637, "epoch": 3848} {"train_loss": -6.86370849609375, "global_step": 161638, "epoch": 3848} {"train_loss": -6.860222816467285, "global_step": 161639, "epoch": 3848} {"train_loss": -6.870926856994629, "global_step": 161640, "epoch": 3848} {"train_loss": -6.9036760330200195, "global_step": 161641, "epoch": 3848} {"train_loss": -6.937722206115723, "global_step": 161642, "epoch": 3848} {"train_loss": -6.817623615264893, "global_step": 161643, "epoch": 3848} {"train_loss": -6.976977348327637, "global_step": 161644, "epoch": 3848} {"train_loss": -6.701135635375977, "global_step": 161645, "epoch": 3848} {"train_loss": -6.775647163391113, "global_step": 161646, "epoch": 3848} {"train_loss": -6.916855335235596, "global_step": 161647, "epoch": 3848} {"train_loss": -6.678595542907715, "global_step": 161648, "epoch": 3848} {"train_loss": -6.915907859802246, "global_step": 161649, "epoch": 3848} {"train_loss": -6.764778137207031, "global_step": 161650, "epoch": 3848} {"train_loss": -6.969632625579834, "global_step": 161651, "epoch": 3848} {"train_loss": -6.830750942230225, "global_step": 161652, "epoch": 3848} {"train_loss": -6.889509677886963, "global_step": 161653, "epoch": 3848} {"train_loss": -6.843128204345703, "global_step": 161654, "epoch": 3848} {"train_loss": -6.856437683105469, "global_step": 161655, "epoch": 3848} {"train_loss": -6.955120086669922, "global_step": 161656, "epoch": 3848} {"train_loss": -6.889687231608799, "global_step": 161657, "epoch": 3848, "val_loss": 68600.8984375} {"train_loss": -7.001695156097412, "global_step": 161658, "epoch": 3849} {"train_loss": -6.957944869995117, "global_step": 161659, "epoch": 3849} {"train_loss": -6.933016777038574, "global_step": 161660, "epoch": 3849} {"train_loss": -6.994675636291504, "global_step": 161661, "epoch": 3849} {"train_loss": -7.009448528289795, "global_step": 161662, "epoch": 3849} {"train_loss": -6.982983589172363, "global_step": 161663, "epoch": 3849} {"train_loss": -7.03027868270874, "global_step": 161664, "epoch": 3849} {"train_loss": -6.944775581359863, "global_step": 161665, "epoch": 3849} {"train_loss": -6.926470756530762, "global_step": 161666, "epoch": 3849} {"train_loss": -7.05405855178833, "global_step": 161667, "epoch": 3849} {"train_loss": -6.927867412567139, "global_step": 161668, "epoch": 3849} {"train_loss": -7.046634674072266, "global_step": 161669, "epoch": 3849} {"train_loss": -6.967327117919922, "global_step": 161670, "epoch": 3849} {"train_loss": -7.022454261779785, "global_step": 161671, "epoch": 3849} {"train_loss": -6.936537742614746, "global_step": 161672, "epoch": 3849} {"train_loss": -6.972271919250488, "global_step": 161673, "epoch": 3849} {"train_loss": -6.952352523803711, "global_step": 161674, "epoch": 3849} {"train_loss": -7.03210973739624, "global_step": 161675, "epoch": 3849} {"train_loss": -7.0625786781311035, "global_step": 161676, "epoch": 3849} {"train_loss": -6.801577568054199, "global_step": 161677, "epoch": 3849} {"train_loss": -6.963280200958252, "global_step": 161678, "epoch": 3849} {"train_loss": -6.928404808044434, "global_step": 161679, "epoch": 3849} {"train_loss": -6.869815349578857, "global_step": 161680, "epoch": 3849} {"train_loss": -6.93220853805542, "global_step": 161681, "epoch": 3849} {"train_loss": -6.9292097091674805, "global_step": 161682, "epoch": 3849} {"train_loss": -6.94911527633667, "global_step": 161683, "epoch": 3849} {"train_loss": -7.065703392028809, "global_step": 161684, "epoch": 3849} {"train_loss": -6.922308921813965, "global_step": 161685, "epoch": 3849} {"train_loss": -7.028125762939453, "global_step": 161686, "epoch": 3849} {"train_loss": -6.925817966461182, "global_step": 161687, "epoch": 3849} {"train_loss": -7.013631820678711, "global_step": 161688, "epoch": 3849} {"train_loss": -6.965917110443115, "global_step": 161689, "epoch": 3849} {"train_loss": -6.870895862579346, "global_step": 161690, "epoch": 3849} {"train_loss": -7.031869411468506, "global_step": 161691, "epoch": 3849} {"train_loss": -6.9246745109558105, "global_step": 161692, "epoch": 3849} {"train_loss": -7.040331840515137, "global_step": 161693, "epoch": 3849} {"train_loss": -6.958000183105469, "global_step": 161694, "epoch": 3849} {"train_loss": -6.959288597106934, "global_step": 161695, "epoch": 3849} {"train_loss": -6.974296569824219, "global_step": 161696, "epoch": 3849} {"train_loss": -6.957921981811523, "global_step": 161697, "epoch": 3849} {"train_loss": -6.884133338928223, "global_step": 161698, "epoch": 3849} {"train_loss": -6.966950439271473, "global_step": 161699, "epoch": 3849, "val_loss": 68561.9921875} {"train_loss": -6.841274738311768, "global_step": 161700, "epoch": 3850} {"train_loss": -6.983670711517334, "global_step": 161701, "epoch": 3850} {"train_loss": -6.887507915496826, "global_step": 161702, "epoch": 3850} {"train_loss": -6.883322715759277, "global_step": 161703, "epoch": 3850} {"train_loss": -6.972487449645996, "global_step": 161704, "epoch": 3850} {"train_loss": -6.914658069610596, "global_step": 161705, "epoch": 3850} {"train_loss": -6.943426132202148, "global_step": 161706, "epoch": 3850} {"train_loss": -6.889039993286133, "global_step": 161707, "epoch": 3850} {"train_loss": -6.98013973236084, "global_step": 161708, "epoch": 3850} {"train_loss": -6.966130256652832, "global_step": 161709, "epoch": 3850} {"train_loss": -7.0184502601623535, "global_step": 161710, "epoch": 3850} {"train_loss": -7.079766750335693, "global_step": 161711, "epoch": 3850} {"train_loss": -6.846963882446289, "global_step": 161712, "epoch": 3850} {"train_loss": -6.872173309326172, "global_step": 161713, "epoch": 3850} {"train_loss": -6.938732147216797, "global_step": 161714, "epoch": 3850} {"train_loss": -6.955347061157227, "global_step": 161715, "epoch": 3850} {"train_loss": -7.025651931762695, "global_step": 161716, "epoch": 3850} {"train_loss": -6.959907531738281, "global_step": 161717, "epoch": 3850} {"train_loss": -6.987078666687012, "global_step": 161718, "epoch": 3850} {"train_loss": -6.950419902801514, "global_step": 161719, "epoch": 3850} {"train_loss": -6.974626064300537, "global_step": 161720, "epoch": 3850} {"train_loss": -6.980442047119141, "global_step": 161721, "epoch": 3850} {"train_loss": -7.030573844909668, "global_step": 161722, "epoch": 3850} {"train_loss": -7.128923416137695, "global_step": 161723, "epoch": 3850} {"train_loss": -7.156133651733398, "global_step": 161724, "epoch": 3850} {"train_loss": -7.0293169021606445, "global_step": 161725, "epoch": 3850} {"train_loss": -7.052909851074219, "global_step": 161726, "epoch": 3850} {"train_loss": -6.990825653076172, "global_step": 161727, "epoch": 3850} {"train_loss": -6.948907852172852, "global_step": 161728, "epoch": 3850} {"train_loss": -7.066051483154297, "global_step": 161729, "epoch": 3850} {"train_loss": -7.0048065185546875, "global_step": 161730, "epoch": 3850} {"train_loss": -7.040693283081055, "global_step": 161731, "epoch": 3850} {"train_loss": -6.994712829589844, "global_step": 161732, "epoch": 3850} {"train_loss": -7.037593841552734, "global_step": 161733, "epoch": 3850} {"train_loss": -7.002348899841309, "global_step": 161734, "epoch": 3850} {"train_loss": -6.971212863922119, "global_step": 161735, "epoch": 3850} {"train_loss": -7.013400077819824, "global_step": 161736, "epoch": 3850} {"train_loss": -7.0026350021362305, "global_step": 161737, "epoch": 3850} {"train_loss": -6.802892684936523, "global_step": 161738, "epoch": 3850} {"train_loss": -6.959184646606445, "global_step": 161739, "epoch": 3850} {"train_loss": -6.912302017211914, "global_step": 161740, "epoch": 3850} {"train_loss": -6.973425842466808, "global_step": 161741, "epoch": 3850, "train/sim_max_reward_0": 0.37210085626066214, "train/sim_max_reward_1": 0.7048848234728597, "train/sim_max_reward_2": 0.8708936681299406, "train/sim_max_reward_3": 0.39671042428775327, "train/sim_max_reward_4": 0.7924428488456424, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.0013542850565730453, "test/sim_max_reward_4300001": 0.40569281787328426, "test/sim_max_reward_4300002": 0.8218231105429951, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9944668258522175, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.6683609625650979, "test/sim_max_reward_4300008": 0.9882719930492061, "test/sim_max_reward_4300009": 0.8862494695935258, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9320079715430288, "test/sim_max_reward_4300012": 0.9140296369710447, "test/sim_max_reward_4300013": 0.9711139161146018, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.3919012557908242, "test/sim_max_reward_4300019": 0.18591986951504158, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8979612508976702, "test/sim_max_reward_4300022": 0.9435124004699389, "test/sim_max_reward_4300023": 0.32769301339129364, "test/sim_max_reward_4300024": 0.9609848997415429, "test/sim_max_reward_4300025": 0.9214095591306053, "test/sim_max_reward_4300026": 0.16398623925312847, "test/sim_max_reward_4300027": 1.0, "test/sim_max_reward_4300028": 0.8805871913946556, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.1333402939039833, "test/sim_max_reward_4300031": 0.21071215433381868, "test/sim_max_reward_4300032": 0.9367963466953115, "test/sim_max_reward_4300033": 0.7169527524133136, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.48686102131942466, "test/sim_max_reward_4300036": 0.25397009026350753, "test/sim_max_reward_4300037": 1.0, "test/sim_max_reward_4300038": 0.02992939717989305, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.37776665923459535, "test/sim_max_reward_4300041": 0.9608642125011635, "test/sim_max_reward_4300042": 0.5169043894861058, "test/sim_max_reward_4300043": 0.15926517329602757, "test/sim_max_reward_4300044": 0.8412571976905124, "test/sim_max_reward_4300045": 0.9634921545272076, "test/sim_max_reward_4300046": 0.9649624960531479, "test/sim_max_reward_4300047": 0.14566044639571532, "test/sim_max_reward_4300048": 0.9221621413201786, "test/sim_max_reward_4300049": 0.1008699002422548, "train/mean_score": 0.5550028967265076, "test/mean_score": 0.5798985520082345, "val_loss": 68640.625} {"train_loss": -7.040727615356445, "global_step": 161742, "epoch": 3851} {"train_loss": -6.985378265380859, "global_step": 161743, "epoch": 3851} {"train_loss": -6.826054573059082, "global_step": 161744, "epoch": 3851} {"train_loss": -6.924416542053223, "global_step": 161745, "epoch": 3851} {"train_loss": -6.930471420288086, "global_step": 161746, "epoch": 3851} {"train_loss": -6.850907325744629, "global_step": 161747, "epoch": 3851} {"train_loss": -6.954348564147949, "global_step": 161748, "epoch": 3851} {"train_loss": -6.718077182769775, "global_step": 161749, "epoch": 3851} {"train_loss": -6.853161811828613, "global_step": 161750, "epoch": 3851} {"train_loss": -6.8305864334106445, "global_step": 161751, "epoch": 3851} {"train_loss": -6.955373764038086, "global_step": 161752, "epoch": 3851} {"train_loss": -7.000997543334961, "global_step": 161753, "epoch": 3851} {"train_loss": -6.974323749542236, "global_step": 161754, "epoch": 3851} {"train_loss": -7.042380332946777, "global_step": 161755, "epoch": 3851} {"train_loss": -6.897088050842285, "global_step": 161756, "epoch": 3851} {"train_loss": -6.948095798492432, "global_step": 161757, "epoch": 3851} {"train_loss": -7.075869083404541, "global_step": 161758, "epoch": 3851} {"train_loss": -6.91813850402832, "global_step": 161759, "epoch": 3851} {"train_loss": -7.0824079513549805, "global_step": 161760, "epoch": 3851} {"train_loss": -6.98805046081543, "global_step": 161761, "epoch": 3851} {"train_loss": -6.867937088012695, "global_step": 161762, "epoch": 3851} {"train_loss": -7.023386001586914, "global_step": 161763, "epoch": 3851} {"train_loss": -7.021991729736328, "global_step": 161764, "epoch": 3851} {"train_loss": -7.006153106689453, "global_step": 161765, "epoch": 3851} {"train_loss": -6.980910301208496, "global_step": 161766, "epoch": 3851} {"train_loss": -6.941219806671143, "global_step": 161767, "epoch": 3851} {"train_loss": -6.931015968322754, "global_step": 161768, "epoch": 3851} {"train_loss": -7.009576797485352, "global_step": 161769, "epoch": 3851} {"train_loss": -7.14076042175293, "global_step": 161770, "epoch": 3851} {"train_loss": -6.976063251495361, "global_step": 161771, "epoch": 3851} {"train_loss": -6.891839981079102, "global_step": 161772, "epoch": 3851} {"train_loss": -6.9551215171813965, "global_step": 161773, "epoch": 3851} {"train_loss": -6.928402900695801, "global_step": 161774, "epoch": 3851} {"train_loss": -7.071140289306641, "global_step": 161775, "epoch": 3851} {"train_loss": -7.079422950744629, "global_step": 161776, "epoch": 3851} {"train_loss": -6.7996063232421875, "global_step": 161777, "epoch": 3851} {"train_loss": -6.913741111755371, "global_step": 161778, "epoch": 3851} {"train_loss": -7.014338493347168, "global_step": 161779, "epoch": 3851} {"train_loss": -7.001230239868164, "global_step": 161780, "epoch": 3851} {"train_loss": -6.950331211090088, "global_step": 161781, "epoch": 3851} {"train_loss": -6.993834495544434, "global_step": 161782, "epoch": 3851} {"train_loss": -6.959175893238613, "global_step": 161783, "epoch": 3851, "val_loss": 68767.375} {"train_loss": -7.032047748565674, "global_step": 161784, "epoch": 3852} {"train_loss": -7.029294967651367, "global_step": 161785, "epoch": 3852} {"train_loss": -7.033302307128906, "global_step": 161786, "epoch": 3852} {"train_loss": -6.929813385009766, "global_step": 161787, "epoch": 3852} {"train_loss": -7.019900321960449, "global_step": 161788, "epoch": 3852} {"train_loss": -7.028831481933594, "global_step": 161789, "epoch": 3852} {"train_loss": -6.940202236175537, "global_step": 161790, "epoch": 3852} {"train_loss": -7.0764079093933105, "global_step": 161791, "epoch": 3852} {"train_loss": -6.954200744628906, "global_step": 161792, "epoch": 3852} {"train_loss": -6.916478157043457, "global_step": 161793, "epoch": 3852} {"train_loss": -6.911447048187256, "global_step": 161794, "epoch": 3852} {"train_loss": -6.979679107666016, "global_step": 161795, "epoch": 3852} {"train_loss": -6.896351337432861, "global_step": 161796, "epoch": 3852} {"train_loss": -7.069986343383789, "global_step": 161797, "epoch": 3852} {"train_loss": -6.969731330871582, "global_step": 161798, "epoch": 3852} {"train_loss": -6.9878411293029785, "global_step": 161799, "epoch": 3852} {"train_loss": -6.970932960510254, "global_step": 161800, "epoch": 3852} {"train_loss": -6.932798862457275, "global_step": 161801, "epoch": 3852} {"train_loss": -6.9395647048950195, "global_step": 161802, "epoch": 3852} {"train_loss": -6.994086742401123, "global_step": 161803, "epoch": 3852} {"train_loss": -6.898962020874023, "global_step": 161804, "epoch": 3852} {"train_loss": -6.993887901306152, "global_step": 161805, "epoch": 3852} {"train_loss": -7.047686576843262, "global_step": 161806, "epoch": 3852} {"train_loss": -7.031351566314697, "global_step": 161807, "epoch": 3852} {"train_loss": -6.955143451690674, "global_step": 161808, "epoch": 3852} {"train_loss": -6.977090835571289, "global_step": 161809, "epoch": 3852} {"train_loss": -7.093994140625, "global_step": 161810, "epoch": 3852} {"train_loss": -6.944906234741211, "global_step": 161811, "epoch": 3852} {"train_loss": -7.009509086608887, "global_step": 161812, "epoch": 3852} {"train_loss": -6.986444473266602, "global_step": 161813, "epoch": 3852} {"train_loss": -7.082895278930664, "global_step": 161814, "epoch": 3852} {"train_loss": -6.953125, "global_step": 161815, "epoch": 3852} {"train_loss": -6.901967525482178, "global_step": 161816, "epoch": 3852} {"train_loss": -6.9101881980896, "global_step": 161817, "epoch": 3852} {"train_loss": -6.9673357009887695, "global_step": 161818, "epoch": 3852} {"train_loss": -6.987105369567871, "global_step": 161819, "epoch": 3852} {"train_loss": -6.880517959594727, "global_step": 161820, "epoch": 3852} {"train_loss": -6.9432172775268555, "global_step": 161821, "epoch": 3852} {"train_loss": -6.993378639221191, "global_step": 161822, "epoch": 3852} {"train_loss": -7.045382499694824, "global_step": 161823, "epoch": 3852} {"train_loss": -6.83992862701416, "global_step": 161824, "epoch": 3852} {"train_loss": -6.974952640987578, "global_step": 161825, "epoch": 3852, "val_loss": 68593.9609375} {"train_loss": -6.9601311683654785, "global_step": 161826, "epoch": 3853} {"train_loss": -6.799153804779053, "global_step": 161827, "epoch": 3853} {"train_loss": -6.92789363861084, "global_step": 161828, "epoch": 3853} {"train_loss": -6.969119071960449, "global_step": 161829, "epoch": 3853} {"train_loss": -6.748435974121094, "global_step": 161830, "epoch": 3853} {"train_loss": -6.9859466552734375, "global_step": 161831, "epoch": 3853} {"train_loss": -6.7884063720703125, "global_step": 161832, "epoch": 3853} {"train_loss": -6.950623035430908, "global_step": 161833, "epoch": 3853} {"train_loss": -6.843470096588135, "global_step": 161834, "epoch": 3853} {"train_loss": -6.90061616897583, "global_step": 161835, "epoch": 3853} {"train_loss": -7.010218143463135, "global_step": 161836, "epoch": 3853} {"train_loss": -6.974514007568359, "global_step": 161837, "epoch": 3853} {"train_loss": -6.972208023071289, "global_step": 161838, "epoch": 3853} {"train_loss": -6.8710198402404785, "global_step": 161839, "epoch": 3853} {"train_loss": -6.987704277038574, "global_step": 161840, "epoch": 3853} {"train_loss": -6.962204456329346, "global_step": 161841, "epoch": 3853} {"train_loss": -6.939043998718262, "global_step": 161842, "epoch": 3853} {"train_loss": -7.0118608474731445, "global_step": 161843, "epoch": 3853} {"train_loss": -6.993072986602783, "global_step": 161844, "epoch": 3853} {"train_loss": -7.057921886444092, "global_step": 161845, "epoch": 3853} {"train_loss": -7.00868034362793, "global_step": 161846, "epoch": 3853} {"train_loss": -6.972372055053711, "global_step": 161847, "epoch": 3853} {"train_loss": -7.088474273681641, "global_step": 161848, "epoch": 3853} {"train_loss": -7.035175800323486, "global_step": 161849, "epoch": 3853} {"train_loss": -7.071742057800293, "global_step": 161850, "epoch": 3853} {"train_loss": -6.946363925933838, "global_step": 161851, "epoch": 3853} {"train_loss": -6.918468952178955, "global_step": 161852, "epoch": 3853} {"train_loss": -6.913320541381836, "global_step": 161853, "epoch": 3853} {"train_loss": -6.864940643310547, "global_step": 161854, "epoch": 3853} {"train_loss": -7.032083511352539, "global_step": 161855, "epoch": 3853} {"train_loss": -6.913239479064941, "global_step": 161856, "epoch": 3853} {"train_loss": -6.85595703125, "global_step": 161857, "epoch": 3853} {"train_loss": -6.856205463409424, "global_step": 161858, "epoch": 3853} {"train_loss": -6.919832706451416, "global_step": 161859, "epoch": 3853} {"train_loss": -6.956934928894043, "global_step": 161860, "epoch": 3853} {"train_loss": -6.933053016662598, "global_step": 161861, "epoch": 3853} {"train_loss": -6.903521537780762, "global_step": 161862, "epoch": 3853} {"train_loss": -6.955451488494873, "global_step": 161863, "epoch": 3853} {"train_loss": -6.890449523925781, "global_step": 161864, "epoch": 3853} {"train_loss": -6.83713436126709, "global_step": 161865, "epoch": 3853} {"train_loss": -6.82366943359375, "global_step": 161866, "epoch": 3853} {"train_loss": -6.933679603395008, "global_step": 161867, "epoch": 3853, "val_loss": 68659.140625} {"train_loss": -7.024999618530273, "global_step": 161868, "epoch": 3854} {"train_loss": -6.883186340332031, "global_step": 161869, "epoch": 3854} {"train_loss": -6.955161094665527, "global_step": 161870, "epoch": 3854} {"train_loss": -7.027164936065674, "global_step": 161871, "epoch": 3854} {"train_loss": -6.953893184661865, "global_step": 161872, "epoch": 3854} {"train_loss": -7.025038719177246, "global_step": 161873, "epoch": 3854} {"train_loss": -6.985647678375244, "global_step": 161874, "epoch": 3854} {"train_loss": -7.012683868408203, "global_step": 161875, "epoch": 3854} {"train_loss": -6.981377601623535, "global_step": 161876, "epoch": 3854} {"train_loss": -6.939550876617432, "global_step": 161877, "epoch": 3854} {"train_loss": -6.969399452209473, "global_step": 161878, "epoch": 3854} {"train_loss": -6.870561599731445, "global_step": 161879, "epoch": 3854} {"train_loss": -7.010678768157959, "global_step": 161880, "epoch": 3854} {"train_loss": -6.951747894287109, "global_step": 161881, "epoch": 3854} {"train_loss": -6.880255222320557, "global_step": 161882, "epoch": 3854} {"train_loss": -7.009472846984863, "global_step": 161883, "epoch": 3854} {"train_loss": -6.840400695800781, "global_step": 161884, "epoch": 3854} {"train_loss": -7.071303367614746, "global_step": 161885, "epoch": 3854} {"train_loss": -6.969422817230225, "global_step": 161886, "epoch": 3854} {"train_loss": -7.013008117675781, "global_step": 161887, "epoch": 3854} {"train_loss": -6.935776710510254, "global_step": 161888, "epoch": 3854} {"train_loss": -7.001137733459473, "global_step": 161889, "epoch": 3854} {"train_loss": -6.882705211639404, "global_step": 161890, "epoch": 3854} {"train_loss": -6.771500587463379, "global_step": 161891, "epoch": 3854} {"train_loss": -6.965532302856445, "global_step": 161892, "epoch": 3854} {"train_loss": -6.86299991607666, "global_step": 161893, "epoch": 3854} {"train_loss": -6.952426433563232, "global_step": 161894, "epoch": 3854} {"train_loss": -6.985505104064941, "global_step": 161895, "epoch": 3854} {"train_loss": -6.858691215515137, "global_step": 161896, "epoch": 3854} {"train_loss": -6.930904388427734, "global_step": 161897, "epoch": 3854} {"train_loss": -7.052981376647949, "global_step": 161898, "epoch": 3854} {"train_loss": -6.873487949371338, "global_step": 161899, "epoch": 3854} {"train_loss": -6.949642658233643, "global_step": 161900, "epoch": 3854} {"train_loss": -7.025489330291748, "global_step": 161901, "epoch": 3854} {"train_loss": -6.840869426727295, "global_step": 161902, "epoch": 3854} {"train_loss": -6.963723182678223, "global_step": 161903, "epoch": 3854} {"train_loss": -6.9626312255859375, "global_step": 161904, "epoch": 3854} {"train_loss": -6.856632709503174, "global_step": 161905, "epoch": 3854} {"train_loss": -6.889472961425781, "global_step": 161906, "epoch": 3854} {"train_loss": -6.924734592437744, "global_step": 161907, "epoch": 3854} {"train_loss": -6.996981143951416, "global_step": 161908, "epoch": 3854} {"train_loss": -6.9465267317635675, "global_step": 161909, "epoch": 3854, "val_loss": 68477.234375} {"train_loss": -6.906284332275391, "global_step": 161910, "epoch": 3855} {"train_loss": -6.982355117797852, "global_step": 161911, "epoch": 3855} {"train_loss": -6.979957580566406, "global_step": 161912, "epoch": 3855} {"train_loss": -6.970923900604248, "global_step": 161913, "epoch": 3855} {"train_loss": -6.966335296630859, "global_step": 161914, "epoch": 3855} {"train_loss": -6.919716835021973, "global_step": 161915, "epoch": 3855} {"train_loss": -7.003894805908203, "global_step": 161916, "epoch": 3855} {"train_loss": -6.979567527770996, "global_step": 161917, "epoch": 3855} {"train_loss": -6.968317031860352, "global_step": 161918, "epoch": 3855} {"train_loss": -6.926702499389648, "global_step": 161919, "epoch": 3855} {"train_loss": -6.900433540344238, "global_step": 161920, "epoch": 3855} {"train_loss": -6.954925060272217, "global_step": 161921, "epoch": 3855} {"train_loss": -6.840790748596191, "global_step": 161922, "epoch": 3855} {"train_loss": -6.97353458404541, "global_step": 161923, "epoch": 3855} {"train_loss": -6.958240032196045, "global_step": 161924, "epoch": 3855} {"train_loss": -6.97271728515625, "global_step": 161925, "epoch": 3855} {"train_loss": -6.931125164031982, "global_step": 161926, "epoch": 3855} {"train_loss": -6.912794589996338, "global_step": 161927, "epoch": 3855} {"train_loss": -6.923993110656738, "global_step": 161928, "epoch": 3855} {"train_loss": -6.980581283569336, "global_step": 161929, "epoch": 3855} {"train_loss": -7.021152496337891, "global_step": 161930, "epoch": 3855} {"train_loss": -6.8791704177856445, "global_step": 161931, "epoch": 3855} {"train_loss": -6.895930767059326, "global_step": 161932, "epoch": 3855} {"train_loss": -6.809816837310791, "global_step": 161933, "epoch": 3855} {"train_loss": -6.836480140686035, "global_step": 161934, "epoch": 3855} {"train_loss": -6.904447078704834, "global_step": 161935, "epoch": 3855} {"train_loss": -6.819850921630859, "global_step": 161936, "epoch": 3855} {"train_loss": -6.814896583557129, "global_step": 161937, "epoch": 3855} {"train_loss": -6.984457015991211, "global_step": 161938, "epoch": 3855} {"train_loss": -6.874993324279785, "global_step": 161939, "epoch": 3855} {"train_loss": -6.880475044250488, "global_step": 161940, "epoch": 3855} {"train_loss": -6.86395263671875, "global_step": 161941, "epoch": 3855} {"train_loss": -6.862558364868164, "global_step": 161942, "epoch": 3855} {"train_loss": -6.965126991271973, "global_step": 161943, "epoch": 3855} {"train_loss": -6.917518615722656, "global_step": 161944, "epoch": 3855} {"train_loss": -6.914755821228027, "global_step": 161945, "epoch": 3855} {"train_loss": -6.836053848266602, "global_step": 161946, "epoch": 3855} {"train_loss": -6.844911098480225, "global_step": 161947, "epoch": 3855} {"train_loss": -6.931245803833008, "global_step": 161948, "epoch": 3855} {"train_loss": -6.827058792114258, "global_step": 161949, "epoch": 3855} {"train_loss": -6.892642498016357, "global_step": 161950, "epoch": 3855} {"train_loss": -6.91507575625465, "global_step": 161951, "epoch": 3855, "val_loss": 68802.9453125} {"train_loss": -6.933697700500488, "global_step": 161952, "epoch": 3856} {"train_loss": -6.961177825927734, "global_step": 161953, "epoch": 3856} {"train_loss": -6.856238842010498, "global_step": 161954, "epoch": 3856} {"train_loss": -7.053136825561523, "global_step": 161955, "epoch": 3856} {"train_loss": -6.949618816375732, "global_step": 161956, "epoch": 3856} {"train_loss": -6.921690940856934, "global_step": 161957, "epoch": 3856} {"train_loss": -6.995822906494141, "global_step": 161958, "epoch": 3856} {"train_loss": -6.917274475097656, "global_step": 161959, "epoch": 3856} {"train_loss": -7.018484115600586, "global_step": 161960, "epoch": 3856} {"train_loss": -6.976080894470215, "global_step": 161961, "epoch": 3856} {"train_loss": -6.988219738006592, "global_step": 161962, "epoch": 3856} {"train_loss": -7.111772060394287, "global_step": 161963, "epoch": 3856} {"train_loss": -6.933543682098389, "global_step": 161964, "epoch": 3856} {"train_loss": -7.083446025848389, "global_step": 161965, "epoch": 3856} {"train_loss": -7.0231828689575195, "global_step": 161966, "epoch": 3856} {"train_loss": -6.984455585479736, "global_step": 161967, "epoch": 3856} {"train_loss": -6.976655006408691, "global_step": 161968, "epoch": 3856} {"train_loss": -6.95684814453125, "global_step": 161969, "epoch": 3856} {"train_loss": -7.062268257141113, "global_step": 161970, "epoch": 3856} {"train_loss": -7.015484809875488, "global_step": 161971, "epoch": 3856} {"train_loss": -6.913835048675537, "global_step": 161972, "epoch": 3856} {"train_loss": -6.9585065841674805, "global_step": 161973, "epoch": 3856} {"train_loss": -6.825280666351318, "global_step": 161974, "epoch": 3856} {"train_loss": -6.898064136505127, "global_step": 161975, "epoch": 3856} {"train_loss": -7.023168563842773, "global_step": 161976, "epoch": 3856} {"train_loss": -6.815761566162109, "global_step": 161977, "epoch": 3856} {"train_loss": -7.0604400634765625, "global_step": 161978, "epoch": 3856} {"train_loss": -7.001702785491943, "global_step": 161979, "epoch": 3856} {"train_loss": -6.836763381958008, "global_step": 161980, "epoch": 3856} {"train_loss": -6.921163558959961, "global_step": 161981, "epoch": 3856} {"train_loss": -6.944770812988281, "global_step": 161982, "epoch": 3856} {"train_loss": -6.815892219543457, "global_step": 161983, "epoch": 3856} {"train_loss": -7.012365341186523, "global_step": 161984, "epoch": 3856} {"train_loss": -6.80573844909668, "global_step": 161985, "epoch": 3856} {"train_loss": -6.952136993408203, "global_step": 161986, "epoch": 3856} {"train_loss": -6.865278720855713, "global_step": 161987, "epoch": 3856} {"train_loss": -6.823358058929443, "global_step": 161988, "epoch": 3856} {"train_loss": -7.01186466217041, "global_step": 161989, "epoch": 3856} {"train_loss": -6.803442001342773, "global_step": 161990, "epoch": 3856} {"train_loss": -6.92825984954834, "global_step": 161991, "epoch": 3856} {"train_loss": -6.9051833152771, "global_step": 161992, "epoch": 3856} {"train_loss": -6.947449638730004, "global_step": 161993, "epoch": 3856, "val_loss": 68820.21875} {"train_loss": -6.972323417663574, "global_step": 161994, "epoch": 3857} {"train_loss": -6.73987340927124, "global_step": 161995, "epoch": 3857} {"train_loss": -6.878996849060059, "global_step": 161996, "epoch": 3857} {"train_loss": -6.931366920471191, "global_step": 161997, "epoch": 3857} {"train_loss": -6.95078182220459, "global_step": 161998, "epoch": 3857} {"train_loss": -6.844978332519531, "global_step": 161999, "epoch": 3857} {"train_loss": -6.9596147537231445, "global_step": 162000, "epoch": 3857} {"train_loss": -6.857680320739746, "global_step": 162001, "epoch": 3857} {"train_loss": -6.838568687438965, "global_step": 162002, "epoch": 3857} {"train_loss": -6.880723476409912, "global_step": 162003, "epoch": 3857} {"train_loss": -6.9469194412231445, "global_step": 162004, "epoch": 3857} {"train_loss": -6.978866100311279, "global_step": 162005, "epoch": 3857} {"train_loss": -6.919328689575195, "global_step": 162006, "epoch": 3857} {"train_loss": -6.987271308898926, "global_step": 162007, "epoch": 3857} {"train_loss": -6.941122055053711, "global_step": 162008, "epoch": 3857} {"train_loss": -6.898652076721191, "global_step": 162009, "epoch": 3857} {"train_loss": -6.983675003051758, "global_step": 162010, "epoch": 3857} {"train_loss": -6.823304653167725, "global_step": 162011, "epoch": 3857} {"train_loss": -7.012235164642334, "global_step": 162012, "epoch": 3857} {"train_loss": -7.092387676239014, "global_step": 162013, "epoch": 3857} {"train_loss": -6.959171772003174, "global_step": 162014, "epoch": 3857} {"train_loss": -6.9930219650268555, "global_step": 162015, "epoch": 3857} {"train_loss": -7.012709617614746, "global_step": 162016, "epoch": 3857} {"train_loss": -6.995771408081055, "global_step": 162017, "epoch": 3857} {"train_loss": -6.903918266296387, "global_step": 162018, "epoch": 3857} {"train_loss": -7.010022163391113, "global_step": 162019, "epoch": 3857} {"train_loss": -6.983591079711914, "global_step": 162020, "epoch": 3857} {"train_loss": -6.809089660644531, "global_step": 162021, "epoch": 3857} {"train_loss": -6.9681901931762695, "global_step": 162022, "epoch": 3857} {"train_loss": -6.888919830322266, "global_step": 162023, "epoch": 3857} {"train_loss": -6.902204513549805, "global_step": 162024, "epoch": 3857} {"train_loss": -6.984404563903809, "global_step": 162025, "epoch": 3857} {"train_loss": -7.000031471252441, "global_step": 162026, "epoch": 3857} {"train_loss": -7.001549243927002, "global_step": 162027, "epoch": 3857} {"train_loss": -6.848886966705322, "global_step": 162028, "epoch": 3857} {"train_loss": -7.003124713897705, "global_step": 162029, "epoch": 3857} {"train_loss": -6.9312968254089355, "global_step": 162030, "epoch": 3857} {"train_loss": -6.843749046325684, "global_step": 162031, "epoch": 3857} {"train_loss": -7.053292751312256, "global_step": 162032, "epoch": 3857} {"train_loss": -6.989095211029053, "global_step": 162033, "epoch": 3857} {"train_loss": -7.016596794128418, "global_step": 162034, "epoch": 3857} {"train_loss": -6.941408157348633, "global_step": 162035, "epoch": 3857, "val_loss": 68808.3125} {"train_loss": -6.894768714904785, "global_step": 162036, "epoch": 3858} {"train_loss": -6.951602935791016, "global_step": 162037, "epoch": 3858} {"train_loss": -7.061921119689941, "global_step": 162038, "epoch": 3858} {"train_loss": -7.053006649017334, "global_step": 162039, "epoch": 3858} {"train_loss": -7.084122657775879, "global_step": 162040, "epoch": 3858} {"train_loss": -7.123859405517578, "global_step": 162041, "epoch": 3858} {"train_loss": -6.967123508453369, "global_step": 162042, "epoch": 3858} {"train_loss": -7.005475044250488, "global_step": 162043, "epoch": 3858} {"train_loss": -6.965909004211426, "global_step": 162044, "epoch": 3858} {"train_loss": -7.010439872741699, "global_step": 162045, "epoch": 3858} {"train_loss": -6.888457298278809, "global_step": 162046, "epoch": 3858} {"train_loss": -6.952934741973877, "global_step": 162047, "epoch": 3858} {"train_loss": -6.97515344619751, "global_step": 162048, "epoch": 3858} {"train_loss": -6.693192005157471, "global_step": 162049, "epoch": 3858} {"train_loss": -6.560628890991211, "global_step": 162050, "epoch": 3858} {"train_loss": -7.0501861572265625, "global_step": 162051, "epoch": 3858} {"train_loss": -6.87713623046875, "global_step": 162052, "epoch": 3858} {"train_loss": -6.924749374389648, "global_step": 162053, "epoch": 3858} {"train_loss": -6.8729095458984375, "global_step": 162054, "epoch": 3858} {"train_loss": -6.886924743652344, "global_step": 162055, "epoch": 3858} {"train_loss": -6.963944435119629, "global_step": 162056, "epoch": 3858} {"train_loss": -6.854692459106445, "global_step": 162057, "epoch": 3858} {"train_loss": -6.854055404663086, "global_step": 162058, "epoch": 3858} {"train_loss": -6.979139804840088, "global_step": 162059, "epoch": 3858} {"train_loss": -6.863447189331055, "global_step": 162060, "epoch": 3858} {"train_loss": -6.894556045532227, "global_step": 162061, "epoch": 3858} {"train_loss": -6.954389572143555, "global_step": 162062, "epoch": 3858} {"train_loss": -6.887701034545898, "global_step": 162063, "epoch": 3858} {"train_loss": -6.907975196838379, "global_step": 162064, "epoch": 3858} {"train_loss": -6.906966209411621, "global_step": 162065, "epoch": 3858} {"train_loss": -6.94641637802124, "global_step": 162066, "epoch": 3858} {"train_loss": -6.976979732513428, "global_step": 162067, "epoch": 3858} {"train_loss": -6.908031463623047, "global_step": 162068, "epoch": 3858} {"train_loss": -6.806301116943359, "global_step": 162069, "epoch": 3858} {"train_loss": -6.895169258117676, "global_step": 162070, "epoch": 3858} {"train_loss": -6.950511455535889, "global_step": 162071, "epoch": 3858} {"train_loss": -6.885931015014648, "global_step": 162072, "epoch": 3858} {"train_loss": -6.893373489379883, "global_step": 162073, "epoch": 3858} {"train_loss": -6.926033973693848, "global_step": 162074, "epoch": 3858} {"train_loss": -6.956317901611328, "global_step": 162075, "epoch": 3858} {"train_loss": -7.043466567993164, "global_step": 162076, "epoch": 3858} {"train_loss": -6.928191491535732, "global_step": 162077, "epoch": 3858, "val_loss": 68480.7734375} {"train_loss": -7.020875930786133, "global_step": 162078, "epoch": 3859} {"train_loss": -7.004080772399902, "global_step": 162079, "epoch": 3859} {"train_loss": -6.943871974945068, "global_step": 162080, "epoch": 3859} {"train_loss": -6.930367469787598, "global_step": 162081, "epoch": 3859} {"train_loss": -6.967548847198486, "global_step": 162082, "epoch": 3859} {"train_loss": -7.077585220336914, "global_step": 162083, "epoch": 3859} {"train_loss": -7.058825969696045, "global_step": 162084, "epoch": 3859} {"train_loss": -6.872533798217773, "global_step": 162085, "epoch": 3859} {"train_loss": -7.033184051513672, "global_step": 162086, "epoch": 3859} {"train_loss": -7.071105480194092, "global_step": 162087, "epoch": 3859} {"train_loss": -6.973086833953857, "global_step": 162088, "epoch": 3859} {"train_loss": -6.96409273147583, "global_step": 162089, "epoch": 3859} {"train_loss": -6.943756103515625, "global_step": 162090, "epoch": 3859} {"train_loss": -6.9863457679748535, "global_step": 162091, "epoch": 3859} {"train_loss": -6.871767044067383, "global_step": 162092, "epoch": 3859} {"train_loss": -6.933570384979248, "global_step": 162093, "epoch": 3859} {"train_loss": -7.027885913848877, "global_step": 162094, "epoch": 3859} {"train_loss": -6.818207740783691, "global_step": 162095, "epoch": 3859} {"train_loss": -6.967325210571289, "global_step": 162096, "epoch": 3859} {"train_loss": -6.878605365753174, "global_step": 162097, "epoch": 3859} {"train_loss": -6.954380035400391, "global_step": 162098, "epoch": 3859} {"train_loss": -6.990105628967285, "global_step": 162099, "epoch": 3859} {"train_loss": -6.949098587036133, "global_step": 162100, "epoch": 3859} {"train_loss": -6.997744560241699, "global_step": 162101, "epoch": 3859} {"train_loss": -6.914910793304443, "global_step": 162102, "epoch": 3859} {"train_loss": -6.8441925048828125, "global_step": 162103, "epoch": 3859} {"train_loss": -6.846304893493652, "global_step": 162104, "epoch": 3859} {"train_loss": -6.879683494567871, "global_step": 162105, "epoch": 3859} {"train_loss": -6.9308624267578125, "global_step": 162106, "epoch": 3859} {"train_loss": -7.012146949768066, "global_step": 162107, "epoch": 3859} {"train_loss": -6.977558612823486, "global_step": 162108, "epoch": 3859} {"train_loss": -6.972507476806641, "global_step": 162109, "epoch": 3859} {"train_loss": -6.950039863586426, "global_step": 162110, "epoch": 3859} {"train_loss": -6.92243766784668, "global_step": 162111, "epoch": 3859} {"train_loss": -6.925387382507324, "global_step": 162112, "epoch": 3859} {"train_loss": -6.90834903717041, "global_step": 162113, "epoch": 3859} {"train_loss": -7.130867004394531, "global_step": 162114, "epoch": 3859} {"train_loss": -7.030392646789551, "global_step": 162115, "epoch": 3859} {"train_loss": -7.0588698387146, "global_step": 162116, "epoch": 3859} {"train_loss": -6.990047454833984, "global_step": 162117, "epoch": 3859} {"train_loss": -6.997066497802734, "global_step": 162118, "epoch": 3859} {"train_loss": -6.962010394959223, "global_step": 162119, "epoch": 3859, "val_loss": 68601.46875} {"train_loss": -6.939870834350586, "global_step": 162120, "epoch": 3860} {"train_loss": -6.875110626220703, "global_step": 162121, "epoch": 3860} {"train_loss": -6.948631763458252, "global_step": 162122, "epoch": 3860} {"train_loss": -7.0853118896484375, "global_step": 162123, "epoch": 3860} {"train_loss": -6.968239784240723, "global_step": 162124, "epoch": 3860} {"train_loss": -7.095595359802246, "global_step": 162125, "epoch": 3860} {"train_loss": -6.930517196655273, "global_step": 162126, "epoch": 3860} {"train_loss": -7.0259904861450195, "global_step": 162127, "epoch": 3860} {"train_loss": -6.983503818511963, "global_step": 162128, "epoch": 3860} {"train_loss": -7.031832218170166, "global_step": 162129, "epoch": 3860} {"train_loss": -6.922316551208496, "global_step": 162130, "epoch": 3860} {"train_loss": -7.02772855758667, "global_step": 162131, "epoch": 3860} {"train_loss": -7.032121181488037, "global_step": 162132, "epoch": 3860} {"train_loss": -6.967547416687012, "global_step": 162133, "epoch": 3860} {"train_loss": -7.115857124328613, "global_step": 162134, "epoch": 3860} {"train_loss": -7.0383501052856445, "global_step": 162135, "epoch": 3860} {"train_loss": -7.017085552215576, "global_step": 162136, "epoch": 3860} {"train_loss": -7.095277309417725, "global_step": 162137, "epoch": 3860} {"train_loss": -6.949620246887207, "global_step": 162138, "epoch": 3860} {"train_loss": -7.042900085449219, "global_step": 162139, "epoch": 3860} {"train_loss": -7.01308012008667, "global_step": 162140, "epoch": 3860} {"train_loss": -7.018664836883545, "global_step": 162141, "epoch": 3860} {"train_loss": -6.931851863861084, "global_step": 162142, "epoch": 3860} {"train_loss": -7.044539928436279, "global_step": 162143, "epoch": 3860} {"train_loss": -6.8504838943481445, "global_step": 162144, "epoch": 3860} {"train_loss": -6.977128028869629, "global_step": 162145, "epoch": 3860} {"train_loss": -6.920022964477539, "global_step": 162146, "epoch": 3860} {"train_loss": -7.072901725769043, "global_step": 162147, "epoch": 3860} {"train_loss": -6.953324317932129, "global_step": 162148, "epoch": 3860} {"train_loss": -7.03555965423584, "global_step": 162149, "epoch": 3860} {"train_loss": -7.088502407073975, "global_step": 162150, "epoch": 3860} {"train_loss": -6.941972732543945, "global_step": 162151, "epoch": 3860} {"train_loss": -6.91435432434082, "global_step": 162152, "epoch": 3860} {"train_loss": -6.962430000305176, "global_step": 162153, "epoch": 3860} {"train_loss": -6.9398908615112305, "global_step": 162154, "epoch": 3860} {"train_loss": -6.908825874328613, "global_step": 162155, "epoch": 3860} {"train_loss": -6.984692096710205, "global_step": 162156, "epoch": 3860} {"train_loss": -7.081880569458008, "global_step": 162157, "epoch": 3860} {"train_loss": -6.991296291351318, "global_step": 162158, "epoch": 3860} {"train_loss": -7.0393781661987305, "global_step": 162159, "epoch": 3860} {"train_loss": -6.920249938964844, "global_step": 162160, "epoch": 3860} {"train_loss": -6.992368471054804, "global_step": 162161, "epoch": 3860, "val_loss": 68649.765625} {"train_loss": -7.02921199798584, "global_step": 162162, "epoch": 3861} {"train_loss": -7.041319847106934, "global_step": 162163, "epoch": 3861} {"train_loss": -6.983903408050537, "global_step": 162164, "epoch": 3861} {"train_loss": -7.048222064971924, "global_step": 162165, "epoch": 3861} {"train_loss": -7.031575679779053, "global_step": 162166, "epoch": 3861} {"train_loss": -6.959822654724121, "global_step": 162167, "epoch": 3861} {"train_loss": -6.941598892211914, "global_step": 162168, "epoch": 3861} {"train_loss": -6.904726028442383, "global_step": 162169, "epoch": 3861} {"train_loss": -6.929157257080078, "global_step": 162170, "epoch": 3861} {"train_loss": -6.966818332672119, "global_step": 162171, "epoch": 3861} {"train_loss": -6.982481002807617, "global_step": 162172, "epoch": 3861} {"train_loss": -6.79081916809082, "global_step": 162173, "epoch": 3861} {"train_loss": -6.9885993003845215, "global_step": 162174, "epoch": 3861} {"train_loss": -6.878939628601074, "global_step": 162175, "epoch": 3861} {"train_loss": -6.893185615539551, "global_step": 162176, "epoch": 3861} {"train_loss": -7.083454132080078, "global_step": 162177, "epoch": 3861} {"train_loss": -6.878291130065918, "global_step": 162178, "epoch": 3861} {"train_loss": -6.9343085289001465, "global_step": 162179, "epoch": 3861} {"train_loss": -6.9538679122924805, "global_step": 162180, "epoch": 3861} {"train_loss": -6.8295769691467285, "global_step": 162181, "epoch": 3861} {"train_loss": -6.954187393188477, "global_step": 162182, "epoch": 3861} {"train_loss": -7.054688930511475, "global_step": 162183, "epoch": 3861} {"train_loss": -6.822681427001953, "global_step": 162184, "epoch": 3861} {"train_loss": -6.921726703643799, "global_step": 162185, "epoch": 3861} {"train_loss": -6.912440776824951, "global_step": 162186, "epoch": 3861} {"train_loss": -6.897372722625732, "global_step": 162187, "epoch": 3861} {"train_loss": -6.90516996383667, "global_step": 162188, "epoch": 3861} {"train_loss": -6.844289779663086, "global_step": 162189, "epoch": 3861} {"train_loss": -6.96531867980957, "global_step": 162190, "epoch": 3861} {"train_loss": -6.858128070831299, "global_step": 162191, "epoch": 3861} {"train_loss": -7.114319801330566, "global_step": 162192, "epoch": 3861} {"train_loss": -6.943338871002197, "global_step": 162193, "epoch": 3861} {"train_loss": -6.887943267822266, "global_step": 162194, "epoch": 3861} {"train_loss": -6.86165714263916, "global_step": 162195, "epoch": 3861} {"train_loss": -6.892646789550781, "global_step": 162196, "epoch": 3861} {"train_loss": -6.93594217300415, "global_step": 162197, "epoch": 3861} {"train_loss": -6.924097061157227, "global_step": 162198, "epoch": 3861} {"train_loss": -6.877630710601807, "global_step": 162199, "epoch": 3861} {"train_loss": -6.873746871948242, "global_step": 162200, "epoch": 3861} {"train_loss": -6.762334823608398, "global_step": 162201, "epoch": 3861} {"train_loss": -6.981950759887695, "global_step": 162202, "epoch": 3861} {"train_loss": -6.931616124652681, "global_step": 162203, "epoch": 3861, "val_loss": 68854.4609375} {"train_loss": -6.86450719833374, "global_step": 162204, "epoch": 3862} {"train_loss": -6.925414085388184, "global_step": 162205, "epoch": 3862} {"train_loss": -6.753102779388428, "global_step": 162206, "epoch": 3862} {"train_loss": -7.023986339569092, "global_step": 162207, "epoch": 3862} {"train_loss": -6.93013334274292, "global_step": 162208, "epoch": 3862} {"train_loss": -6.9450364112854, "global_step": 162209, "epoch": 3862} {"train_loss": -6.976850986480713, "global_step": 162210, "epoch": 3862} {"train_loss": -6.939330101013184, "global_step": 162211, "epoch": 3862} {"train_loss": -6.898803234100342, "global_step": 162212, "epoch": 3862} {"train_loss": -7.005936622619629, "global_step": 162213, "epoch": 3862} {"train_loss": -6.97431755065918, "global_step": 162214, "epoch": 3862} {"train_loss": -6.904606819152832, "global_step": 162215, "epoch": 3862} {"train_loss": -6.912256240844727, "global_step": 162216, "epoch": 3862} {"train_loss": -6.995656967163086, "global_step": 162217, "epoch": 3862} {"train_loss": -7.033138751983643, "global_step": 162218, "epoch": 3862} {"train_loss": -6.997246742248535, "global_step": 162219, "epoch": 3862} {"train_loss": -6.9990997314453125, "global_step": 162220, "epoch": 3862} {"train_loss": -6.940840721130371, "global_step": 162221, "epoch": 3862} {"train_loss": -6.934567451477051, "global_step": 162222, "epoch": 3862} {"train_loss": -6.982538223266602, "global_step": 162223, "epoch": 3862} {"train_loss": -6.989213943481445, "global_step": 162224, "epoch": 3862} {"train_loss": -7.014182090759277, "global_step": 162225, "epoch": 3862} {"train_loss": -7.005990505218506, "global_step": 162226, "epoch": 3862} {"train_loss": -6.8907976150512695, "global_step": 162227, "epoch": 3862} {"train_loss": -7.132733345031738, "global_step": 162228, "epoch": 3862} {"train_loss": -7.0332136154174805, "global_step": 162229, "epoch": 3862} {"train_loss": -6.986110687255859, "global_step": 162230, "epoch": 3862} {"train_loss": -6.995275974273682, "global_step": 162231, "epoch": 3862} {"train_loss": -6.981569290161133, "global_step": 162232, "epoch": 3862} {"train_loss": -6.903637886047363, "global_step": 162233, "epoch": 3862} {"train_loss": -7.150110244750977, "global_step": 162234, "epoch": 3862} {"train_loss": -7.090519905090332, "global_step": 162235, "epoch": 3862} {"train_loss": -7.005800247192383, "global_step": 162236, "epoch": 3862} {"train_loss": -7.045660972595215, "global_step": 162237, "epoch": 3862} {"train_loss": -7.111222743988037, "global_step": 162238, "epoch": 3862} {"train_loss": -6.983613967895508, "global_step": 162239, "epoch": 3862} {"train_loss": -7.00417423248291, "global_step": 162240, "epoch": 3862} {"train_loss": -7.065302848815918, "global_step": 162241, "epoch": 3862} {"train_loss": -7.038542747497559, "global_step": 162242, "epoch": 3862} {"train_loss": -7.106303691864014, "global_step": 162243, "epoch": 3862} {"train_loss": -6.976077079772949, "global_step": 162244, "epoch": 3862} {"train_loss": -6.985693193617321, "global_step": 162245, "epoch": 3862, "val_loss": 68423.78125} {"train_loss": -7.099855899810791, "global_step": 162246, "epoch": 3863} {"train_loss": -6.946990966796875, "global_step": 162247, "epoch": 3863} {"train_loss": -7.0083723068237305, "global_step": 162248, "epoch": 3863} {"train_loss": -6.906647682189941, "global_step": 162249, "epoch": 3863} {"train_loss": -7.128807544708252, "global_step": 162250, "epoch": 3863} {"train_loss": -6.94746732711792, "global_step": 162251, "epoch": 3863} {"train_loss": -6.934001445770264, "global_step": 162252, "epoch": 3863} {"train_loss": -6.971426486968994, "global_step": 162253, "epoch": 3863} {"train_loss": -6.996509552001953, "global_step": 162254, "epoch": 3863} {"train_loss": -6.983459949493408, "global_step": 162255, "epoch": 3863} {"train_loss": -7.036426544189453, "global_step": 162256, "epoch": 3863} {"train_loss": -7.038449287414551, "global_step": 162257, "epoch": 3863} {"train_loss": -7.0459208488464355, "global_step": 162258, "epoch": 3863} {"train_loss": -6.999358177185059, "global_step": 162259, "epoch": 3863} {"train_loss": -6.945757865905762, "global_step": 162260, "epoch": 3863} {"train_loss": -6.901826858520508, "global_step": 162261, "epoch": 3863} {"train_loss": -7.025189399719238, "global_step": 162262, "epoch": 3863} {"train_loss": -7.084208965301514, "global_step": 162263, "epoch": 3863} {"train_loss": -6.959799766540527, "global_step": 162264, "epoch": 3863} {"train_loss": -7.012085437774658, "global_step": 162265, "epoch": 3863} {"train_loss": -6.857680320739746, "global_step": 162266, "epoch": 3863} {"train_loss": -7.053064346313477, "global_step": 162267, "epoch": 3863} {"train_loss": -7.016922473907471, "global_step": 162268, "epoch": 3863} {"train_loss": -6.9981689453125, "global_step": 162269, "epoch": 3863} {"train_loss": -6.972452640533447, "global_step": 162270, "epoch": 3863} {"train_loss": -6.89669132232666, "global_step": 162271, "epoch": 3863} {"train_loss": -6.955362796783447, "global_step": 162272, "epoch": 3863} {"train_loss": -7.12734842300415, "global_step": 162273, "epoch": 3863} {"train_loss": -6.940674304962158, "global_step": 162274, "epoch": 3863} {"train_loss": -7.091048240661621, "global_step": 162275, "epoch": 3863} {"train_loss": -6.997827529907227, "global_step": 162276, "epoch": 3863} {"train_loss": -6.937166690826416, "global_step": 162277, "epoch": 3863} {"train_loss": -7.057076930999756, "global_step": 162278, "epoch": 3863} {"train_loss": -6.95004940032959, "global_step": 162279, "epoch": 3863} {"train_loss": -7.015964508056641, "global_step": 162280, "epoch": 3863} {"train_loss": -7.0629987716674805, "global_step": 162281, "epoch": 3863} {"train_loss": -7.097470283508301, "global_step": 162282, "epoch": 3863} {"train_loss": -7.065502166748047, "global_step": 162283, "epoch": 3863} {"train_loss": -7.135396957397461, "global_step": 162284, "epoch": 3863} {"train_loss": -7.117636203765869, "global_step": 162285, "epoch": 3863} {"train_loss": -6.9788103103637695, "global_step": 162286, "epoch": 3863} {"train_loss": -7.0101709479377385, "global_step": 162287, "epoch": 3863, "val_loss": 68732.7890625} {"train_loss": -6.989694595336914, "global_step": 162288, "epoch": 3864} {"train_loss": -6.955034255981445, "global_step": 162289, "epoch": 3864} {"train_loss": -7.038626670837402, "global_step": 162290, "epoch": 3864} {"train_loss": -7.046637058258057, "global_step": 162291, "epoch": 3864} {"train_loss": -7.0778093338012695, "global_step": 162292, "epoch": 3864} {"train_loss": -7.006913661956787, "global_step": 162293, "epoch": 3864} {"train_loss": -6.933078765869141, "global_step": 162294, "epoch": 3864} {"train_loss": -7.115799427032471, "global_step": 162295, "epoch": 3864} {"train_loss": -7.061956405639648, "global_step": 162296, "epoch": 3864} {"train_loss": -6.933632850646973, "global_step": 162297, "epoch": 3864} {"train_loss": -6.992742538452148, "global_step": 162298, "epoch": 3864} {"train_loss": -6.993005752563477, "global_step": 162299, "epoch": 3864} {"train_loss": -6.999655246734619, "global_step": 162300, "epoch": 3864} {"train_loss": -7.055552005767822, "global_step": 162301, "epoch": 3864} {"train_loss": -7.030421257019043, "global_step": 162302, "epoch": 3864} {"train_loss": -7.01477575302124, "global_step": 162303, "epoch": 3864} {"train_loss": -7.004559516906738, "global_step": 162304, "epoch": 3864} {"train_loss": -6.937346458435059, "global_step": 162305, "epoch": 3864} {"train_loss": -6.999826431274414, "global_step": 162306, "epoch": 3864} {"train_loss": -6.965446472167969, "global_step": 162307, "epoch": 3864} {"train_loss": -6.9641900062561035, "global_step": 162308, "epoch": 3864} {"train_loss": -7.003780841827393, "global_step": 162309, "epoch": 3864} {"train_loss": -7.027890205383301, "global_step": 162310, "epoch": 3864} {"train_loss": -6.9422760009765625, "global_step": 162311, "epoch": 3864} {"train_loss": -7.00749397277832, "global_step": 162312, "epoch": 3864} {"train_loss": -6.920764923095703, "global_step": 162313, "epoch": 3864} {"train_loss": -6.927054405212402, "global_step": 162314, "epoch": 3864} {"train_loss": -6.9612135887146, "global_step": 162315, "epoch": 3864} {"train_loss": -6.868922233581543, "global_step": 162316, "epoch": 3864} {"train_loss": -6.998956203460693, "global_step": 162317, "epoch": 3864} {"train_loss": -6.9473443031311035, "global_step": 162318, "epoch": 3864} {"train_loss": -6.809606552124023, "global_step": 162319, "epoch": 3864} {"train_loss": -7.015528678894043, "global_step": 162320, "epoch": 3864} {"train_loss": -6.956888675689697, "global_step": 162321, "epoch": 3864} {"train_loss": -6.804232120513916, "global_step": 162322, "epoch": 3864} {"train_loss": -6.9623212814331055, "global_step": 162323, "epoch": 3864} {"train_loss": -6.883758068084717, "global_step": 162324, "epoch": 3864} {"train_loss": -6.856461524963379, "global_step": 162325, "epoch": 3864} {"train_loss": -6.920175075531006, "global_step": 162326, "epoch": 3864} {"train_loss": -6.872990608215332, "global_step": 162327, "epoch": 3864} {"train_loss": -6.974656105041504, "global_step": 162328, "epoch": 3864} {"train_loss": -6.966403813589187, "global_step": 162329, "epoch": 3864, "val_loss": 68380.78125} {"train_loss": -6.881095886230469, "global_step": 162330, "epoch": 3865} {"train_loss": -6.7985734939575195, "global_step": 162331, "epoch": 3865} {"train_loss": -6.924105167388916, "global_step": 162332, "epoch": 3865} {"train_loss": -6.828332901000977, "global_step": 162333, "epoch": 3865} {"train_loss": -6.935965538024902, "global_step": 162334, "epoch": 3865} {"train_loss": -6.922269344329834, "global_step": 162335, "epoch": 3865} {"train_loss": -6.925261497497559, "global_step": 162336, "epoch": 3865} {"train_loss": -6.9078569412231445, "global_step": 162337, "epoch": 3865} {"train_loss": -6.8239850997924805, "global_step": 162338, "epoch": 3865} {"train_loss": -6.9214253425598145, "global_step": 162339, "epoch": 3865} {"train_loss": -6.916154861450195, "global_step": 162340, "epoch": 3865} {"train_loss": -6.890722274780273, "global_step": 162341, "epoch": 3865} {"train_loss": -6.935520172119141, "global_step": 162342, "epoch": 3865} {"train_loss": -6.8051629066467285, "global_step": 162343, "epoch": 3865} {"train_loss": -6.940995216369629, "global_step": 162344, "epoch": 3865} {"train_loss": -6.949173450469971, "global_step": 162345, "epoch": 3865} {"train_loss": -6.888523101806641, "global_step": 162346, "epoch": 3865} {"train_loss": -6.944236755371094, "global_step": 162347, "epoch": 3865} {"train_loss": -6.901213645935059, "global_step": 162348, "epoch": 3865} {"train_loss": -6.9092512130737305, "global_step": 162349, "epoch": 3865} {"train_loss": -7.014831066131592, "global_step": 162350, "epoch": 3865} {"train_loss": -6.843454360961914, "global_step": 162351, "epoch": 3865} {"train_loss": -6.865708827972412, "global_step": 162352, "epoch": 3865} {"train_loss": -6.909220218658447, "global_step": 162353, "epoch": 3865} {"train_loss": -6.908601760864258, "global_step": 162354, "epoch": 3865} {"train_loss": -6.871756553649902, "global_step": 162355, "epoch": 3865} {"train_loss": -6.975432395935059, "global_step": 162356, "epoch": 3865} {"train_loss": -6.862575531005859, "global_step": 162357, "epoch": 3865} {"train_loss": -6.938593864440918, "global_step": 162358, "epoch": 3865} {"train_loss": -6.993459224700928, "global_step": 162359, "epoch": 3865} {"train_loss": -6.870112419128418, "global_step": 162360, "epoch": 3865} {"train_loss": -6.926481246948242, "global_step": 162361, "epoch": 3865} {"train_loss": -6.966284275054932, "global_step": 162362, "epoch": 3865} {"train_loss": -6.731781482696533, "global_step": 162363, "epoch": 3865} {"train_loss": -6.871485710144043, "global_step": 162364, "epoch": 3865} {"train_loss": -7.006436347961426, "global_step": 162365, "epoch": 3865} {"train_loss": -6.9177069664001465, "global_step": 162366, "epoch": 3865} {"train_loss": -6.938248157501221, "global_step": 162367, "epoch": 3865} {"train_loss": -6.962451934814453, "global_step": 162368, "epoch": 3865} {"train_loss": -6.9569196701049805, "global_step": 162369, "epoch": 3865} {"train_loss": -6.993486404418945, "global_step": 162370, "epoch": 3865} {"train_loss": -6.909980081376576, "global_step": 162371, "epoch": 3865, "val_loss": 68628.1875} {"train_loss": -6.968696594238281, "global_step": 162372, "epoch": 3866} {"train_loss": -6.787213325500488, "global_step": 162373, "epoch": 3866} {"train_loss": -6.962379455566406, "global_step": 162374, "epoch": 3866} {"train_loss": -6.958173751831055, "global_step": 162375, "epoch": 3866} {"train_loss": -6.957915306091309, "global_step": 162376, "epoch": 3866} {"train_loss": -6.945973873138428, "global_step": 162377, "epoch": 3866} {"train_loss": -6.857203483581543, "global_step": 162378, "epoch": 3866} {"train_loss": -7.010141372680664, "global_step": 162379, "epoch": 3866} {"train_loss": -6.995728492736816, "global_step": 162380, "epoch": 3866} {"train_loss": -7.010735511779785, "global_step": 162381, "epoch": 3866} {"train_loss": -6.840813636779785, "global_step": 162382, "epoch": 3866} {"train_loss": -7.088902473449707, "global_step": 162383, "epoch": 3866} {"train_loss": -7.000718116760254, "global_step": 162384, "epoch": 3866} {"train_loss": -6.905835151672363, "global_step": 162385, "epoch": 3866} {"train_loss": -6.840024948120117, "global_step": 162386, "epoch": 3866} {"train_loss": -7.009461402893066, "global_step": 162387, "epoch": 3866} {"train_loss": -6.878688812255859, "global_step": 162388, "epoch": 3866} {"train_loss": -6.917891502380371, "global_step": 162389, "epoch": 3866} {"train_loss": -6.9989800453186035, "global_step": 162390, "epoch": 3866} {"train_loss": -7.058164596557617, "global_step": 162391, "epoch": 3866} {"train_loss": -6.905097007751465, "global_step": 162392, "epoch": 3866} {"train_loss": -6.9151506423950195, "global_step": 162393, "epoch": 3866} {"train_loss": -7.064129829406738, "global_step": 162394, "epoch": 3866} {"train_loss": -7.042959690093994, "global_step": 162395, "epoch": 3866} {"train_loss": -7.056632995605469, "global_step": 162396, "epoch": 3866} {"train_loss": -7.048897743225098, "global_step": 162397, "epoch": 3866} {"train_loss": -7.060730457305908, "global_step": 162398, "epoch": 3866} {"train_loss": -7.002906799316406, "global_step": 162399, "epoch": 3866} {"train_loss": -6.956812858581543, "global_step": 162400, "epoch": 3866} {"train_loss": -6.959709167480469, "global_step": 162401, "epoch": 3866} {"train_loss": -7.041329383850098, "global_step": 162402, "epoch": 3866} {"train_loss": -6.99749755859375, "global_step": 162403, "epoch": 3866} {"train_loss": -7.023785591125488, "global_step": 162404, "epoch": 3866} {"train_loss": -6.986262321472168, "global_step": 162405, "epoch": 3866} {"train_loss": -7.0186543464660645, "global_step": 162406, "epoch": 3866} {"train_loss": -7.050898551940918, "global_step": 162407, "epoch": 3866} {"train_loss": -7.0079240798950195, "global_step": 162408, "epoch": 3866} {"train_loss": -7.010012626647949, "global_step": 162409, "epoch": 3866} {"train_loss": -6.950766086578369, "global_step": 162410, "epoch": 3866} {"train_loss": -6.981372833251953, "global_step": 162411, "epoch": 3866} {"train_loss": -6.938058853149414, "global_step": 162412, "epoch": 3866} {"train_loss": -6.97681280544826, "global_step": 162413, "epoch": 3866, "val_loss": 68572.53125} {"train_loss": -6.977535247802734, "global_step": 162414, "epoch": 3867} {"train_loss": -7.060279369354248, "global_step": 162415, "epoch": 3867} {"train_loss": -7.054098129272461, "global_step": 162416, "epoch": 3867} {"train_loss": -6.976434707641602, "global_step": 162417, "epoch": 3867} {"train_loss": -6.991765022277832, "global_step": 162418, "epoch": 3867} {"train_loss": -6.9602370262146, "global_step": 162419, "epoch": 3867} {"train_loss": -7.111651420593262, "global_step": 162420, "epoch": 3867} {"train_loss": -7.023529052734375, "global_step": 162421, "epoch": 3867} {"train_loss": -7.086252689361572, "global_step": 162422, "epoch": 3867} {"train_loss": -7.004108905792236, "global_step": 162423, "epoch": 3867} {"train_loss": -6.964674472808838, "global_step": 162424, "epoch": 3867} {"train_loss": -7.0157365798950195, "global_step": 162425, "epoch": 3867} {"train_loss": -6.981412410736084, "global_step": 162426, "epoch": 3867} {"train_loss": -6.995351791381836, "global_step": 162427, "epoch": 3867} {"train_loss": -6.985954761505127, "global_step": 162428, "epoch": 3867} {"train_loss": -6.824634075164795, "global_step": 162429, "epoch": 3867} {"train_loss": -7.0305047035217285, "global_step": 162430, "epoch": 3867} {"train_loss": -6.953924179077148, "global_step": 162431, "epoch": 3867} {"train_loss": -7.0381622314453125, "global_step": 162432, "epoch": 3867} {"train_loss": -6.987103462219238, "global_step": 162433, "epoch": 3867} {"train_loss": -6.918490409851074, "global_step": 162434, "epoch": 3867} {"train_loss": -6.951407432556152, "global_step": 162435, "epoch": 3867} {"train_loss": -6.977012634277344, "global_step": 162436, "epoch": 3867} {"train_loss": -6.881757736206055, "global_step": 162437, "epoch": 3867} {"train_loss": -6.871037483215332, "global_step": 162438, "epoch": 3867} {"train_loss": -6.928589820861816, "global_step": 162439, "epoch": 3867} {"train_loss": -6.749059677124023, "global_step": 162440, "epoch": 3867} {"train_loss": -6.979009628295898, "global_step": 162441, "epoch": 3867} {"train_loss": -7.017484188079834, "global_step": 162442, "epoch": 3867} {"train_loss": -6.97710657119751, "global_step": 162443, "epoch": 3867} {"train_loss": -7.001614570617676, "global_step": 162444, "epoch": 3867} {"train_loss": -6.911273956298828, "global_step": 162445, "epoch": 3867} {"train_loss": -6.8506364822387695, "global_step": 162446, "epoch": 3867} {"train_loss": -6.939896106719971, "global_step": 162447, "epoch": 3867} {"train_loss": -6.864635467529297, "global_step": 162448, "epoch": 3867} {"train_loss": -6.927202224731445, "global_step": 162449, "epoch": 3867} {"train_loss": -6.851726531982422, "global_step": 162450, "epoch": 3867} {"train_loss": -7.025512218475342, "global_step": 162451, "epoch": 3867} {"train_loss": -6.914823532104492, "global_step": 162452, "epoch": 3867} {"train_loss": -6.964699745178223, "global_step": 162453, "epoch": 3867} {"train_loss": -6.946043968200684, "global_step": 162454, "epoch": 3867} {"train_loss": -6.962332305454073, "global_step": 162455, "epoch": 3867, "val_loss": 68683.7109375} {"train_loss": -6.963484764099121, "global_step": 162456, "epoch": 3868} {"train_loss": -6.948258876800537, "global_step": 162457, "epoch": 3868} {"train_loss": -6.932031631469727, "global_step": 162458, "epoch": 3868} {"train_loss": -7.079707145690918, "global_step": 162459, "epoch": 3868} {"train_loss": -6.95018196105957, "global_step": 162460, "epoch": 3868} {"train_loss": -6.98440408706665, "global_step": 162461, "epoch": 3868} {"train_loss": -7.0563812255859375, "global_step": 162462, "epoch": 3868} {"train_loss": -7.038673400878906, "global_step": 162463, "epoch": 3868} {"train_loss": -7.038227081298828, "global_step": 162464, "epoch": 3868} {"train_loss": -7.003154754638672, "global_step": 162465, "epoch": 3868} {"train_loss": -7.154600143432617, "global_step": 162466, "epoch": 3868} {"train_loss": -6.922675132751465, "global_step": 162467, "epoch": 3868} {"train_loss": -6.970926284790039, "global_step": 162468, "epoch": 3868} {"train_loss": -7.081862449645996, "global_step": 162469, "epoch": 3868} {"train_loss": -6.891628742218018, "global_step": 162470, "epoch": 3868} {"train_loss": -7.039112567901611, "global_step": 162471, "epoch": 3868} {"train_loss": -7.066664218902588, "global_step": 162472, "epoch": 3868} {"train_loss": -7.075270652770996, "global_step": 162473, "epoch": 3868} {"train_loss": -6.945782661437988, "global_step": 162474, "epoch": 3868} {"train_loss": -7.003127098083496, "global_step": 162475, "epoch": 3868} {"train_loss": -6.970417022705078, "global_step": 162476, "epoch": 3868} {"train_loss": -6.965361595153809, "global_step": 162477, "epoch": 3868} {"train_loss": -6.963756561279297, "global_step": 162478, "epoch": 3868} {"train_loss": -6.713920593261719, "global_step": 162479, "epoch": 3868} {"train_loss": -7.003815174102783, "global_step": 162480, "epoch": 3868} {"train_loss": -6.8697829246521, "global_step": 162481, "epoch": 3868} {"train_loss": -6.821413516998291, "global_step": 162482, "epoch": 3868} {"train_loss": -6.907485485076904, "global_step": 162483, "epoch": 3868} {"train_loss": -6.869098663330078, "global_step": 162484, "epoch": 3868} {"train_loss": -6.7923994064331055, "global_step": 162485, "epoch": 3868} {"train_loss": -6.870489120483398, "global_step": 162486, "epoch": 3868} {"train_loss": -6.954533576965332, "global_step": 162487, "epoch": 3868} {"train_loss": -6.789763450622559, "global_step": 162488, "epoch": 3868} {"train_loss": -6.787158966064453, "global_step": 162489, "epoch": 3868} {"train_loss": -6.742714881896973, "global_step": 162490, "epoch": 3868} {"train_loss": -6.872119903564453, "global_step": 162491, "epoch": 3868} {"train_loss": -6.850569725036621, "global_step": 162492, "epoch": 3868} {"train_loss": -6.838044166564941, "global_step": 162493, "epoch": 3868} {"train_loss": -6.738801956176758, "global_step": 162494, "epoch": 3868} {"train_loss": -6.968166828155518, "global_step": 162495, "epoch": 3868} {"train_loss": -6.9077558517456055, "global_step": 162496, "epoch": 3868} {"train_loss": -6.9335529917762395, "global_step": 162497, "epoch": 3868, "val_loss": 68690.9609375} {"train_loss": -7.014382362365723, "global_step": 162498, "epoch": 3869} {"train_loss": -6.763429641723633, "global_step": 162499, "epoch": 3869} {"train_loss": -6.861382961273193, "global_step": 162500, "epoch": 3869} {"train_loss": -6.98537540435791, "global_step": 162501, "epoch": 3869} {"train_loss": -6.926545143127441, "global_step": 162502, "epoch": 3869} {"train_loss": -6.814899444580078, "global_step": 162503, "epoch": 3869} {"train_loss": -6.829434871673584, "global_step": 162504, "epoch": 3869} {"train_loss": -6.8664021492004395, "global_step": 162505, "epoch": 3869} {"train_loss": -7.021027088165283, "global_step": 162506, "epoch": 3869} {"train_loss": -6.705432891845703, "global_step": 162507, "epoch": 3869} {"train_loss": -6.856958389282227, "global_step": 162508, "epoch": 3869} {"train_loss": -6.890024185180664, "global_step": 162509, "epoch": 3869} {"train_loss": -6.880476951599121, "global_step": 162510, "epoch": 3869} {"train_loss": -6.971037864685059, "global_step": 162511, "epoch": 3869} {"train_loss": -6.892850875854492, "global_step": 162512, "epoch": 3869} {"train_loss": -6.890913963317871, "global_step": 162513, "epoch": 3869} {"train_loss": -6.734140872955322, "global_step": 162514, "epoch": 3869} {"train_loss": -6.924043655395508, "global_step": 162515, "epoch": 3869} {"train_loss": -6.895452976226807, "global_step": 162516, "epoch": 3869} {"train_loss": -6.938529968261719, "global_step": 162517, "epoch": 3869} {"train_loss": -7.043752670288086, "global_step": 162518, "epoch": 3869} {"train_loss": -6.846776008605957, "global_step": 162519, "epoch": 3869} {"train_loss": -7.002069473266602, "global_step": 162520, "epoch": 3869} {"train_loss": -7.009451389312744, "global_step": 162521, "epoch": 3869} {"train_loss": -7.010502815246582, "global_step": 162522, "epoch": 3869} {"train_loss": -7.007923126220703, "global_step": 162523, "epoch": 3869} {"train_loss": -6.947484970092773, "global_step": 162524, "epoch": 3869} {"train_loss": -7.0000901222229, "global_step": 162525, "epoch": 3869} {"train_loss": -6.941463470458984, "global_step": 162526, "epoch": 3869} {"train_loss": -6.964548110961914, "global_step": 162527, "epoch": 3869} {"train_loss": -6.999011993408203, "global_step": 162528, "epoch": 3869} {"train_loss": -6.9537153244018555, "global_step": 162529, "epoch": 3869} {"train_loss": -7.068099021911621, "global_step": 162530, "epoch": 3869} {"train_loss": -6.891055583953857, "global_step": 162531, "epoch": 3869} {"train_loss": -6.963625907897949, "global_step": 162532, "epoch": 3869} {"train_loss": -7.043695449829102, "global_step": 162533, "epoch": 3869} {"train_loss": -7.038263320922852, "global_step": 162534, "epoch": 3869} {"train_loss": -6.931775093078613, "global_step": 162535, "epoch": 3869} {"train_loss": -7.051886081695557, "global_step": 162536, "epoch": 3869} {"train_loss": -6.970439434051514, "global_step": 162537, "epoch": 3869} {"train_loss": -6.932347297668457, "global_step": 162538, "epoch": 3869} {"train_loss": -6.934742030643282, "global_step": 162539, "epoch": 3869, "val_loss": 68749.5859375} {"train_loss": -6.987566947937012, "global_step": 162540, "epoch": 3870} {"train_loss": -6.933688163757324, "global_step": 162541, "epoch": 3870} {"train_loss": -6.90056037902832, "global_step": 162542, "epoch": 3870} {"train_loss": -6.9461588859558105, "global_step": 162543, "epoch": 3870} {"train_loss": -7.034911632537842, "global_step": 162544, "epoch": 3870} {"train_loss": -7.03528356552124, "global_step": 162545, "epoch": 3870} {"train_loss": -7.048771858215332, "global_step": 162546, "epoch": 3870} {"train_loss": -7.033529758453369, "global_step": 162547, "epoch": 3870} {"train_loss": -7.021963119506836, "global_step": 162548, "epoch": 3870} {"train_loss": -7.0074782371521, "global_step": 162549, "epoch": 3870} {"train_loss": -6.9674835205078125, "global_step": 162550, "epoch": 3870} {"train_loss": -7.125852584838867, "global_step": 162551, "epoch": 3870} {"train_loss": -7.089069366455078, "global_step": 162552, "epoch": 3870} {"train_loss": -7.08211088180542, "global_step": 162553, "epoch": 3870} {"train_loss": -7.094880104064941, "global_step": 162554, "epoch": 3870} {"train_loss": -6.949002265930176, "global_step": 162555, "epoch": 3870} {"train_loss": -6.889516830444336, "global_step": 162556, "epoch": 3870} {"train_loss": -6.952544212341309, "global_step": 162557, "epoch": 3870} {"train_loss": -7.109710693359375, "global_step": 162558, "epoch": 3870} {"train_loss": -6.992070198059082, "global_step": 162559, "epoch": 3870} {"train_loss": -6.9210309982299805, "global_step": 162560, "epoch": 3870} {"train_loss": -6.92122745513916, "global_step": 162561, "epoch": 3870} {"train_loss": -7.016231536865234, "global_step": 162562, "epoch": 3870} {"train_loss": -6.950704097747803, "global_step": 162563, "epoch": 3870} {"train_loss": -7.000272274017334, "global_step": 162564, "epoch": 3870} {"train_loss": -6.928439617156982, "global_step": 162565, "epoch": 3870} {"train_loss": -6.876376152038574, "global_step": 162566, "epoch": 3870} {"train_loss": -6.992284774780273, "global_step": 162567, "epoch": 3870} {"train_loss": -6.932780742645264, "global_step": 162568, "epoch": 3870} {"train_loss": -6.96955680847168, "global_step": 162569, "epoch": 3870} {"train_loss": -6.943520545959473, "global_step": 162570, "epoch": 3870} {"train_loss": -6.825024604797363, "global_step": 162571, "epoch": 3870} {"train_loss": -6.935096263885498, "global_step": 162572, "epoch": 3870} {"train_loss": -7.013553619384766, "global_step": 162573, "epoch": 3870} {"train_loss": -6.899746894836426, "global_step": 162574, "epoch": 3870} {"train_loss": -7.02077579498291, "global_step": 162575, "epoch": 3870} {"train_loss": -6.989187240600586, "global_step": 162576, "epoch": 3870} {"train_loss": -6.902535438537598, "global_step": 162577, "epoch": 3870} {"train_loss": -7.009387969970703, "global_step": 162578, "epoch": 3870} {"train_loss": -6.952383041381836, "global_step": 162579, "epoch": 3870} {"train_loss": -6.848136901855469, "global_step": 162580, "epoch": 3870} {"train_loss": -6.9747557867141, "global_step": 162581, "epoch": 3870, "val_loss": 68652.421875} {"train_loss": -6.8155694007873535, "global_step": 162582, "epoch": 3871} {"train_loss": -6.893235206604004, "global_step": 162583, "epoch": 3871} {"train_loss": -6.900607585906982, "global_step": 162584, "epoch": 3871} {"train_loss": -6.852463722229004, "global_step": 162585, "epoch": 3871} {"train_loss": -6.84991979598999, "global_step": 162586, "epoch": 3871} {"train_loss": -6.935539245605469, "global_step": 162587, "epoch": 3871} {"train_loss": -6.863615989685059, "global_step": 162588, "epoch": 3871} {"train_loss": -6.730264663696289, "global_step": 162589, "epoch": 3871} {"train_loss": -6.767128944396973, "global_step": 162590, "epoch": 3871} {"train_loss": -6.976108074188232, "global_step": 162591, "epoch": 3871} {"train_loss": -6.8416666984558105, "global_step": 162592, "epoch": 3871} {"train_loss": -6.823220252990723, "global_step": 162593, "epoch": 3871} {"train_loss": -6.902201175689697, "global_step": 162594, "epoch": 3871} {"train_loss": -6.908397674560547, "global_step": 162595, "epoch": 3871} {"train_loss": -6.970139503479004, "global_step": 162596, "epoch": 3871} {"train_loss": -7.027097225189209, "global_step": 162597, "epoch": 3871} {"train_loss": -6.9569830894470215, "global_step": 162598, "epoch": 3871} {"train_loss": -6.984292030334473, "global_step": 162599, "epoch": 3871} {"train_loss": -6.899623870849609, "global_step": 162600, "epoch": 3871} {"train_loss": -6.944140434265137, "global_step": 162601, "epoch": 3871} {"train_loss": -6.9914445877075195, "global_step": 162602, "epoch": 3871} {"train_loss": -6.9711408615112305, "global_step": 162603, "epoch": 3871} {"train_loss": -6.8170366287231445, "global_step": 162604, "epoch": 3871} {"train_loss": -6.9478278160095215, "global_step": 162605, "epoch": 3871} {"train_loss": -6.989124298095703, "global_step": 162606, "epoch": 3871} {"train_loss": -6.9197893142700195, "global_step": 162607, "epoch": 3871} {"train_loss": -6.918622016906738, "global_step": 162608, "epoch": 3871} {"train_loss": -6.95911169052124, "global_step": 162609, "epoch": 3871} {"train_loss": -6.990246295928955, "global_step": 162610, "epoch": 3871} {"train_loss": -6.96700382232666, "global_step": 162611, "epoch": 3871} {"train_loss": -6.933736801147461, "global_step": 162612, "epoch": 3871} {"train_loss": -7.031737804412842, "global_step": 162613, "epoch": 3871} {"train_loss": -6.921001434326172, "global_step": 162614, "epoch": 3871} {"train_loss": -6.935338497161865, "global_step": 162615, "epoch": 3871} {"train_loss": -7.003004550933838, "global_step": 162616, "epoch": 3871} {"train_loss": -6.985678195953369, "global_step": 162617, "epoch": 3871} {"train_loss": -6.9647979736328125, "global_step": 162618, "epoch": 3871} {"train_loss": -7.03438663482666, "global_step": 162619, "epoch": 3871} {"train_loss": -7.1133317947387695, "global_step": 162620, "epoch": 3871} {"train_loss": -6.94354248046875, "global_step": 162621, "epoch": 3871} {"train_loss": -6.973948955535889, "global_step": 162622, "epoch": 3871} {"train_loss": -6.931765454156058, "global_step": 162623, "epoch": 3871, "val_loss": 68452.59375} {"train_loss": -7.032318115234375, "global_step": 162624, "epoch": 3872} {"train_loss": -7.061115264892578, "global_step": 162625, "epoch": 3872} {"train_loss": -7.028312683105469, "global_step": 162626, "epoch": 3872} {"train_loss": -6.917416572570801, "global_step": 162627, "epoch": 3872} {"train_loss": -6.943246364593506, "global_step": 162628, "epoch": 3872} {"train_loss": -7.039502143859863, "global_step": 162629, "epoch": 3872} {"train_loss": -6.885190963745117, "global_step": 162630, "epoch": 3872} {"train_loss": -7.021144866943359, "global_step": 162631, "epoch": 3872} {"train_loss": -6.978235721588135, "global_step": 162632, "epoch": 3872} {"train_loss": -6.959192752838135, "global_step": 162633, "epoch": 3872} {"train_loss": -6.939505577087402, "global_step": 162634, "epoch": 3872} {"train_loss": -6.958722114562988, "global_step": 162635, "epoch": 3872} {"train_loss": -7.020054817199707, "global_step": 162636, "epoch": 3872} {"train_loss": -6.875814437866211, "global_step": 162637, "epoch": 3872} {"train_loss": -6.999521255493164, "global_step": 162638, "epoch": 3872} {"train_loss": -7.016353130340576, "global_step": 162639, "epoch": 3872} {"train_loss": -6.918098449707031, "global_step": 162640, "epoch": 3872} {"train_loss": -6.920226097106934, "global_step": 162641, "epoch": 3872} {"train_loss": -6.935441970825195, "global_step": 162642, "epoch": 3872} {"train_loss": -6.962841033935547, "global_step": 162643, "epoch": 3872} {"train_loss": -6.9681525230407715, "global_step": 162644, "epoch": 3872} {"train_loss": -6.96171760559082, "global_step": 162645, "epoch": 3872} {"train_loss": -6.9922685623168945, "global_step": 162646, "epoch": 3872} {"train_loss": -6.926436901092529, "global_step": 162647, "epoch": 3872} {"train_loss": -6.963619232177734, "global_step": 162648, "epoch": 3872} {"train_loss": -6.974371433258057, "global_step": 162649, "epoch": 3872} {"train_loss": -7.004884243011475, "global_step": 162650, "epoch": 3872} {"train_loss": -6.926037788391113, "global_step": 162651, "epoch": 3872} {"train_loss": -6.906668663024902, "global_step": 162652, "epoch": 3872} {"train_loss": -6.967375755310059, "global_step": 162653, "epoch": 3872} {"train_loss": -6.9782209396362305, "global_step": 162654, "epoch": 3872} {"train_loss": -6.701481819152832, "global_step": 162655, "epoch": 3872} {"train_loss": -7.019959449768066, "global_step": 162656, "epoch": 3872} {"train_loss": -6.907298564910889, "global_step": 162657, "epoch": 3872} {"train_loss": -6.8912224769592285, "global_step": 162658, "epoch": 3872} {"train_loss": -6.980171203613281, "global_step": 162659, "epoch": 3872} {"train_loss": -6.866628646850586, "global_step": 162660, "epoch": 3872} {"train_loss": -7.02846622467041, "global_step": 162661, "epoch": 3872} {"train_loss": -6.954189300537109, "global_step": 162662, "epoch": 3872} {"train_loss": -6.959346771240234, "global_step": 162663, "epoch": 3872} {"train_loss": -6.934563636779785, "global_step": 162664, "epoch": 3872} {"train_loss": -6.957443566549392, "global_step": 162665, "epoch": 3872, "val_loss": 68714.6953125} {"train_loss": -6.922327041625977, "global_step": 162666, "epoch": 3873} {"train_loss": -6.984079837799072, "global_step": 162667, "epoch": 3873} {"train_loss": -6.897103309631348, "global_step": 162668, "epoch": 3873} {"train_loss": -7.0029497146606445, "global_step": 162669, "epoch": 3873} {"train_loss": -7.02681827545166, "global_step": 162670, "epoch": 3873} {"train_loss": -6.985776901245117, "global_step": 162671, "epoch": 3873} {"train_loss": -6.95866060256958, "global_step": 162672, "epoch": 3873} {"train_loss": -7.077430725097656, "global_step": 162673, "epoch": 3873} {"train_loss": -7.066168785095215, "global_step": 162674, "epoch": 3873} {"train_loss": -6.950864315032959, "global_step": 162675, "epoch": 3873} {"train_loss": -7.066555976867676, "global_step": 162676, "epoch": 3873} {"train_loss": -7.027103424072266, "global_step": 162677, "epoch": 3873} {"train_loss": -6.925335884094238, "global_step": 162678, "epoch": 3873} {"train_loss": -7.012475967407227, "global_step": 162679, "epoch": 3873} {"train_loss": -6.981146812438965, "global_step": 162680, "epoch": 3873} {"train_loss": -7.053587913513184, "global_step": 162681, "epoch": 3873} {"train_loss": -7.0943684577941895, "global_step": 162682, "epoch": 3873} {"train_loss": -6.980993747711182, "global_step": 162683, "epoch": 3873} {"train_loss": -6.89600944519043, "global_step": 162684, "epoch": 3873} {"train_loss": -6.915028095245361, "global_step": 162685, "epoch": 3873} {"train_loss": -6.954154014587402, "global_step": 162686, "epoch": 3873} {"train_loss": -6.9718732833862305, "global_step": 162687, "epoch": 3873} {"train_loss": -6.9689202308654785, "global_step": 162688, "epoch": 3873} {"train_loss": -6.820359706878662, "global_step": 162689, "epoch": 3873} {"train_loss": -7.037273406982422, "global_step": 162690, "epoch": 3873} {"train_loss": -6.961415767669678, "global_step": 162691, "epoch": 3873} {"train_loss": -6.970508098602295, "global_step": 162692, "epoch": 3873} {"train_loss": -6.953771591186523, "global_step": 162693, "epoch": 3873} {"train_loss": -6.959136962890625, "global_step": 162694, "epoch": 3873} {"train_loss": -6.891328811645508, "global_step": 162695, "epoch": 3873} {"train_loss": -6.939574241638184, "global_step": 162696, "epoch": 3873} {"train_loss": -6.899985313415527, "global_step": 162697, "epoch": 3873} {"train_loss": -6.824752330780029, "global_step": 162698, "epoch": 3873} {"train_loss": -6.835147857666016, "global_step": 162699, "epoch": 3873} {"train_loss": -6.886065483093262, "global_step": 162700, "epoch": 3873} {"train_loss": -6.8189496994018555, "global_step": 162701, "epoch": 3873} {"train_loss": -6.785675048828125, "global_step": 162702, "epoch": 3873} {"train_loss": -6.9249162673950195, "global_step": 162703, "epoch": 3873} {"train_loss": -6.986656188964844, "global_step": 162704, "epoch": 3873} {"train_loss": -6.919566631317139, "global_step": 162705, "epoch": 3873} {"train_loss": -6.857893943786621, "global_step": 162706, "epoch": 3873} {"train_loss": -6.952423107056391, "global_step": 162707, "epoch": 3873, "val_loss": 68807.5} {"train_loss": -6.864089012145996, "global_step": 162708, "epoch": 3874} {"train_loss": -6.899961471557617, "global_step": 162709, "epoch": 3874} {"train_loss": -6.995437145233154, "global_step": 162710, "epoch": 3874} {"train_loss": -6.934966564178467, "global_step": 162711, "epoch": 3874} {"train_loss": -6.771904468536377, "global_step": 162712, "epoch": 3874} {"train_loss": -6.928610801696777, "global_step": 162713, "epoch": 3874} {"train_loss": -6.962795734405518, "global_step": 162714, "epoch": 3874} {"train_loss": -6.92137336730957, "global_step": 162715, "epoch": 3874} {"train_loss": -6.859953880310059, "global_step": 162716, "epoch": 3874} {"train_loss": -6.916632652282715, "global_step": 162717, "epoch": 3874} {"train_loss": -6.968613624572754, "global_step": 162718, "epoch": 3874} {"train_loss": -6.932522773742676, "global_step": 162719, "epoch": 3874} {"train_loss": -6.979980945587158, "global_step": 162720, "epoch": 3874} {"train_loss": -6.951791763305664, "global_step": 162721, "epoch": 3874} {"train_loss": -6.955023765563965, "global_step": 162722, "epoch": 3874} {"train_loss": -6.94731330871582, "global_step": 162723, "epoch": 3874} {"train_loss": -6.894780158996582, "global_step": 162724, "epoch": 3874} {"train_loss": -6.967383861541748, "global_step": 162725, "epoch": 3874} {"train_loss": -6.886171817779541, "global_step": 162726, "epoch": 3874} {"train_loss": -6.88931941986084, "global_step": 162727, "epoch": 3874} {"train_loss": -6.834973335266113, "global_step": 162728, "epoch": 3874} {"train_loss": -6.671575546264648, "global_step": 162729, "epoch": 3874} {"train_loss": -6.939159393310547, "global_step": 162730, "epoch": 3874} {"train_loss": -6.9552083015441895, "global_step": 162731, "epoch": 3874} {"train_loss": -6.782482624053955, "global_step": 162732, "epoch": 3874} {"train_loss": -6.923696517944336, "global_step": 162733, "epoch": 3874} {"train_loss": -6.897318363189697, "global_step": 162734, "epoch": 3874} {"train_loss": -6.844050407409668, "global_step": 162735, "epoch": 3874} {"train_loss": -6.8670854568481445, "global_step": 162736, "epoch": 3874} {"train_loss": -6.84848690032959, "global_step": 162737, "epoch": 3874} {"train_loss": -7.0063886642456055, "global_step": 162738, "epoch": 3874} {"train_loss": -6.958090305328369, "global_step": 162739, "epoch": 3874} {"train_loss": -6.785781383514404, "global_step": 162740, "epoch": 3874} {"train_loss": -7.032761573791504, "global_step": 162741, "epoch": 3874} {"train_loss": -6.906144142150879, "global_step": 162742, "epoch": 3874} {"train_loss": -6.8667144775390625, "global_step": 162743, "epoch": 3874} {"train_loss": -6.800804615020752, "global_step": 162744, "epoch": 3874} {"train_loss": -6.939162254333496, "global_step": 162745, "epoch": 3874} {"train_loss": -6.982412338256836, "global_step": 162746, "epoch": 3874} {"train_loss": -6.853952407836914, "global_step": 162747, "epoch": 3874} {"train_loss": -6.900053977966309, "global_step": 162748, "epoch": 3874} {"train_loss": -6.905212481816609, "global_step": 162749, "epoch": 3874, "val_loss": 68713.8046875} {"train_loss": -6.932791709899902, "global_step": 162750, "epoch": 3875} {"train_loss": -6.945674896240234, "global_step": 162751, "epoch": 3875} {"train_loss": -6.850951194763184, "global_step": 162752, "epoch": 3875} {"train_loss": -6.925464153289795, "global_step": 162753, "epoch": 3875} {"train_loss": -6.846129417419434, "global_step": 162754, "epoch": 3875} {"train_loss": -6.9661688804626465, "global_step": 162755, "epoch": 3875} {"train_loss": -6.936208724975586, "global_step": 162756, "epoch": 3875} {"train_loss": -6.800840377807617, "global_step": 162757, "epoch": 3875} {"train_loss": -6.901074409484863, "global_step": 162758, "epoch": 3875} {"train_loss": -6.933445930480957, "global_step": 162759, "epoch": 3875} {"train_loss": -6.8632001876831055, "global_step": 162760, "epoch": 3875} {"train_loss": -6.803558349609375, "global_step": 162761, "epoch": 3875} {"train_loss": -6.879899024963379, "global_step": 162762, "epoch": 3875} {"train_loss": -6.689137935638428, "global_step": 162763, "epoch": 3875} {"train_loss": -6.944000244140625, "global_step": 162764, "epoch": 3875} {"train_loss": -6.737107276916504, "global_step": 162765, "epoch": 3875} {"train_loss": -6.800947189331055, "global_step": 162766, "epoch": 3875} {"train_loss": -6.700788497924805, "global_step": 162767, "epoch": 3875} {"train_loss": -6.915060520172119, "global_step": 162768, "epoch": 3875} {"train_loss": -6.857163429260254, "global_step": 162769, "epoch": 3875} {"train_loss": -6.759738922119141, "global_step": 162770, "epoch": 3875} {"train_loss": -6.829837322235107, "global_step": 162771, "epoch": 3875} {"train_loss": -6.8442888259887695, "global_step": 162772, "epoch": 3875} {"train_loss": -6.958427429199219, "global_step": 162773, "epoch": 3875} {"train_loss": -6.912875652313232, "global_step": 162774, "epoch": 3875} {"train_loss": -6.864494323730469, "global_step": 162775, "epoch": 3875} {"train_loss": -7.0655059814453125, "global_step": 162776, "epoch": 3875} {"train_loss": -6.909669876098633, "global_step": 162777, "epoch": 3875} {"train_loss": -6.978519916534424, "global_step": 162778, "epoch": 3875} {"train_loss": -6.939243316650391, "global_step": 162779, "epoch": 3875} {"train_loss": -6.997427463531494, "global_step": 162780, "epoch": 3875} {"train_loss": -7.004575729370117, "global_step": 162781, "epoch": 3875} {"train_loss": -6.981961727142334, "global_step": 162782, "epoch": 3875} {"train_loss": -6.861993312835693, "global_step": 162783, "epoch": 3875} {"train_loss": -6.971256732940674, "global_step": 162784, "epoch": 3875} {"train_loss": -7.123661041259766, "global_step": 162785, "epoch": 3875} {"train_loss": -7.005746841430664, "global_step": 162786, "epoch": 3875} {"train_loss": -6.998661994934082, "global_step": 162787, "epoch": 3875} {"train_loss": -7.033707618713379, "global_step": 162788, "epoch": 3875} {"train_loss": -6.920513153076172, "global_step": 162789, "epoch": 3875} {"train_loss": -7.027944564819336, "global_step": 162790, "epoch": 3875} {"train_loss": -6.909500689733596, "global_step": 162791, "epoch": 3875, "val_loss": 68908.4453125} {"train_loss": -6.8664960861206055, "global_step": 162792, "epoch": 3876} {"train_loss": -7.035041809082031, "global_step": 162793, "epoch": 3876} {"train_loss": -7.070281505584717, "global_step": 162794, "epoch": 3876} {"train_loss": -6.9393110275268555, "global_step": 162795, "epoch": 3876} {"train_loss": -7.112314224243164, "global_step": 162796, "epoch": 3876} {"train_loss": -7.039496421813965, "global_step": 162797, "epoch": 3876} {"train_loss": -7.059963703155518, "global_step": 162798, "epoch": 3876} {"train_loss": -6.977015495300293, "global_step": 162799, "epoch": 3876} {"train_loss": -7.046533107757568, "global_step": 162800, "epoch": 3876} {"train_loss": -6.9582109451293945, "global_step": 162801, "epoch": 3876} {"train_loss": -7.019808292388916, "global_step": 162802, "epoch": 3876} {"train_loss": -7.109004020690918, "global_step": 162803, "epoch": 3876} {"train_loss": -7.121211051940918, "global_step": 162804, "epoch": 3876} {"train_loss": -7.089907169342041, "global_step": 162805, "epoch": 3876} {"train_loss": -7.024906635284424, "global_step": 162806, "epoch": 3876} {"train_loss": -6.998085021972656, "global_step": 162807, "epoch": 3876} {"train_loss": -7.043732643127441, "global_step": 162808, "epoch": 3876} {"train_loss": -7.038769721984863, "global_step": 162809, "epoch": 3876} {"train_loss": -7.024172782897949, "global_step": 162810, "epoch": 3876} {"train_loss": -7.034235000610352, "global_step": 162811, "epoch": 3876} {"train_loss": -6.965505599975586, "global_step": 162812, "epoch": 3876} {"train_loss": -7.008369445800781, "global_step": 162813, "epoch": 3876} {"train_loss": -7.027061462402344, "global_step": 162814, "epoch": 3876} {"train_loss": -6.990068435668945, "global_step": 162815, "epoch": 3876} {"train_loss": -7.1133856773376465, "global_step": 162816, "epoch": 3876} {"train_loss": -7.073756217956543, "global_step": 162817, "epoch": 3876} {"train_loss": -6.9898505210876465, "global_step": 162818, "epoch": 3876} {"train_loss": -7.075814247131348, "global_step": 162819, "epoch": 3876} {"train_loss": -6.971059322357178, "global_step": 162820, "epoch": 3876} {"train_loss": -7.021722316741943, "global_step": 162821, "epoch": 3876} {"train_loss": -7.037272930145264, "global_step": 162822, "epoch": 3876} {"train_loss": -6.936715126037598, "global_step": 162823, "epoch": 3876} {"train_loss": -6.948759078979492, "global_step": 162824, "epoch": 3876} {"train_loss": -6.944558143615723, "global_step": 162825, "epoch": 3876} {"train_loss": -7.019280910491943, "global_step": 162826, "epoch": 3876} {"train_loss": -6.922366142272949, "global_step": 162827, "epoch": 3876} {"train_loss": -6.99022102355957, "global_step": 162828, "epoch": 3876} {"train_loss": -6.975067138671875, "global_step": 162829, "epoch": 3876} {"train_loss": -7.031589508056641, "global_step": 162830, "epoch": 3876} {"train_loss": -6.984884262084961, "global_step": 162831, "epoch": 3876} {"train_loss": -6.857991695404053, "global_step": 162832, "epoch": 3876} {"train_loss": -7.0147087914603095, "global_step": 162833, "epoch": 3876, "val_loss": 68792.828125} {"train_loss": -7.050370216369629, "global_step": 162834, "epoch": 3877} {"train_loss": -6.978109359741211, "global_step": 162835, "epoch": 3877} {"train_loss": -6.920900821685791, "global_step": 162836, "epoch": 3877} {"train_loss": -6.899680137634277, "global_step": 162837, "epoch": 3877} {"train_loss": -6.914909839630127, "global_step": 162838, "epoch": 3877} {"train_loss": -6.9492340087890625, "global_step": 162839, "epoch": 3877} {"train_loss": -7.052622318267822, "global_step": 162840, "epoch": 3877} {"train_loss": -7.113403797149658, "global_step": 162841, "epoch": 3877} {"train_loss": -7.056510925292969, "global_step": 162842, "epoch": 3877} {"train_loss": -7.090510845184326, "global_step": 162843, "epoch": 3877} {"train_loss": -6.960943698883057, "global_step": 162844, "epoch": 3877} {"train_loss": -6.950275421142578, "global_step": 162845, "epoch": 3877} {"train_loss": -7.044621467590332, "global_step": 162846, "epoch": 3877} {"train_loss": -7.061241149902344, "global_step": 162847, "epoch": 3877} {"train_loss": -7.01328182220459, "global_step": 162848, "epoch": 3877} {"train_loss": -6.939301490783691, "global_step": 162849, "epoch": 3877} {"train_loss": -7.033999443054199, "global_step": 162850, "epoch": 3877} {"train_loss": -6.8989105224609375, "global_step": 162851, "epoch": 3877} {"train_loss": -6.983659267425537, "global_step": 162852, "epoch": 3877} {"train_loss": -7.1587700843811035, "global_step": 162853, "epoch": 3877} {"train_loss": -6.989726543426514, "global_step": 162854, "epoch": 3877} {"train_loss": -7.048498153686523, "global_step": 162855, "epoch": 3877} {"train_loss": -6.915511131286621, "global_step": 162856, "epoch": 3877} {"train_loss": -6.864605903625488, "global_step": 162857, "epoch": 3877} {"train_loss": -7.0545549392700195, "global_step": 162858, "epoch": 3877} {"train_loss": -6.951054573059082, "global_step": 162859, "epoch": 3877} {"train_loss": -6.856489658355713, "global_step": 162860, "epoch": 3877} {"train_loss": -6.907299041748047, "global_step": 162861, "epoch": 3877} {"train_loss": -6.783865451812744, "global_step": 162862, "epoch": 3877} {"train_loss": -6.949394226074219, "global_step": 162863, "epoch": 3877} {"train_loss": -6.770567893981934, "global_step": 162864, "epoch": 3877} {"train_loss": -6.8110761642456055, "global_step": 162865, "epoch": 3877} {"train_loss": -6.958200454711914, "global_step": 162866, "epoch": 3877} {"train_loss": -6.7805047035217285, "global_step": 162867, "epoch": 3877} {"train_loss": -6.835268497467041, "global_step": 162868, "epoch": 3877} {"train_loss": -6.971231937408447, "global_step": 162869, "epoch": 3877} {"train_loss": -6.776543617248535, "global_step": 162870, "epoch": 3877} {"train_loss": -6.80497932434082, "global_step": 162871, "epoch": 3877} {"train_loss": -6.893631935119629, "global_step": 162872, "epoch": 3877} {"train_loss": -6.739018440246582, "global_step": 162873, "epoch": 3877} {"train_loss": -6.832625389099121, "global_step": 162874, "epoch": 3877} {"train_loss": -6.936659574508667, "global_step": 162875, "epoch": 3877, "val_loss": 68778.8203125} {"train_loss": -6.928377628326416, "global_step": 162876, "epoch": 3878} {"train_loss": -6.8977508544921875, "global_step": 162877, "epoch": 3878} {"train_loss": -6.871315956115723, "global_step": 162878, "epoch": 3878} {"train_loss": -6.794222831726074, "global_step": 162879, "epoch": 3878} {"train_loss": -6.91859769821167, "global_step": 162880, "epoch": 3878} {"train_loss": -6.85797643661499, "global_step": 162881, "epoch": 3878} {"train_loss": -6.9590911865234375, "global_step": 162882, "epoch": 3878} {"train_loss": -6.895516395568848, "global_step": 162883, "epoch": 3878} {"train_loss": -6.898305892944336, "global_step": 162884, "epoch": 3878} {"train_loss": -6.881405830383301, "global_step": 162885, "epoch": 3878} {"train_loss": -6.807435512542725, "global_step": 162886, "epoch": 3878} {"train_loss": -6.846280574798584, "global_step": 162887, "epoch": 3878} {"train_loss": -6.962765216827393, "global_step": 162888, "epoch": 3878} {"train_loss": -6.8624114990234375, "global_step": 162889, "epoch": 3878} {"train_loss": -7.066119194030762, "global_step": 162890, "epoch": 3878} {"train_loss": -6.895226955413818, "global_step": 162891, "epoch": 3878} {"train_loss": -6.88819694519043, "global_step": 162892, "epoch": 3878} {"train_loss": -6.948473930358887, "global_step": 162893, "epoch": 3878} {"train_loss": -6.847322940826416, "global_step": 162894, "epoch": 3878} {"train_loss": -6.875610828399658, "global_step": 162895, "epoch": 3878} {"train_loss": -6.966212272644043, "global_step": 162896, "epoch": 3878} {"train_loss": -6.942540168762207, "global_step": 162897, "epoch": 3878} {"train_loss": -6.9957594871521, "global_step": 162898, "epoch": 3878} {"train_loss": -6.957450866699219, "global_step": 162899, "epoch": 3878} {"train_loss": -6.963891983032227, "global_step": 162900, "epoch": 3878} {"train_loss": -6.893592834472656, "global_step": 162901, "epoch": 3878} {"train_loss": -6.80143404006958, "global_step": 162902, "epoch": 3878} {"train_loss": -6.885862350463867, "global_step": 162903, "epoch": 3878} {"train_loss": -6.928820610046387, "global_step": 162904, "epoch": 3878} {"train_loss": -6.8891282081604, "global_step": 162905, "epoch": 3878} {"train_loss": -6.878205299377441, "global_step": 162906, "epoch": 3878} {"train_loss": -6.957361221313477, "global_step": 162907, "epoch": 3878} {"train_loss": -6.886460304260254, "global_step": 162908, "epoch": 3878} {"train_loss": -6.891373634338379, "global_step": 162909, "epoch": 3878} {"train_loss": -6.851662635803223, "global_step": 162910, "epoch": 3878} {"train_loss": -7.092529296875, "global_step": 162911, "epoch": 3878} {"train_loss": -6.891393184661865, "global_step": 162912, "epoch": 3878} {"train_loss": -6.838752746582031, "global_step": 162913, "epoch": 3878} {"train_loss": -7.059274196624756, "global_step": 162914, "epoch": 3878} {"train_loss": -6.87753963470459, "global_step": 162915, "epoch": 3878} {"train_loss": -6.925543785095215, "global_step": 162916, "epoch": 3878} {"train_loss": -6.910907313937233, "global_step": 162917, "epoch": 3878, "val_loss": 68703.109375} {"train_loss": -6.996120452880859, "global_step": 162918, "epoch": 3879} {"train_loss": -6.902891635894775, "global_step": 162919, "epoch": 3879} {"train_loss": -6.752005100250244, "global_step": 162920, "epoch": 3879} {"train_loss": -6.949063301086426, "global_step": 162921, "epoch": 3879} {"train_loss": -6.874337196350098, "global_step": 162922, "epoch": 3879} {"train_loss": -6.903242588043213, "global_step": 162923, "epoch": 3879} {"train_loss": -6.985480308532715, "global_step": 162924, "epoch": 3879} {"train_loss": -7.073333740234375, "global_step": 162925, "epoch": 3879} {"train_loss": -7.078549861907959, "global_step": 162926, "epoch": 3879} {"train_loss": -6.912909030914307, "global_step": 162927, "epoch": 3879} {"train_loss": -6.911530494689941, "global_step": 162928, "epoch": 3879} {"train_loss": -6.759961128234863, "global_step": 162929, "epoch": 3879} {"train_loss": -6.931591033935547, "global_step": 162930, "epoch": 3879} {"train_loss": -6.99224853515625, "global_step": 162931, "epoch": 3879} {"train_loss": -6.880241870880127, "global_step": 162932, "epoch": 3879} {"train_loss": -7.033888339996338, "global_step": 162933, "epoch": 3879} {"train_loss": -6.889321804046631, "global_step": 162934, "epoch": 3879} {"train_loss": -6.916003227233887, "global_step": 162935, "epoch": 3879} {"train_loss": -7.04394006729126, "global_step": 162936, "epoch": 3879} {"train_loss": -6.832133769989014, "global_step": 162937, "epoch": 3879} {"train_loss": -6.950390815734863, "global_step": 162938, "epoch": 3879} {"train_loss": -6.948319911956787, "global_step": 162939, "epoch": 3879} {"train_loss": -7.004697799682617, "global_step": 162940, "epoch": 3879} {"train_loss": -6.9404096603393555, "global_step": 162941, "epoch": 3879} {"train_loss": -6.870814800262451, "global_step": 162942, "epoch": 3879} {"train_loss": -7.058356761932373, "global_step": 162943, "epoch": 3879} {"train_loss": -6.870121002197266, "global_step": 162944, "epoch": 3879} {"train_loss": -6.947220325469971, "global_step": 162945, "epoch": 3879} {"train_loss": -6.835362434387207, "global_step": 162946, "epoch": 3879} {"train_loss": -6.881830215454102, "global_step": 162947, "epoch": 3879} {"train_loss": -7.020247936248779, "global_step": 162948, "epoch": 3879} {"train_loss": -6.8744916915893555, "global_step": 162949, "epoch": 3879} {"train_loss": -7.051119804382324, "global_step": 162950, "epoch": 3879} {"train_loss": -6.898345947265625, "global_step": 162951, "epoch": 3879} {"train_loss": -7.005366325378418, "global_step": 162952, "epoch": 3879} {"train_loss": -6.971182823181152, "global_step": 162953, "epoch": 3879} {"train_loss": -6.932353973388672, "global_step": 162954, "epoch": 3879} {"train_loss": -6.904706001281738, "global_step": 162955, "epoch": 3879} {"train_loss": -6.949680328369141, "global_step": 162956, "epoch": 3879} {"train_loss": -7.027139186859131, "global_step": 162957, "epoch": 3879} {"train_loss": -6.887359142303467, "global_step": 162958, "epoch": 3879} {"train_loss": -6.937461455663045, "global_step": 162959, "epoch": 3879, "val_loss": 68826.4453125} {"train_loss": -7.031872749328613, "global_step": 162960, "epoch": 3880} {"train_loss": -6.996547698974609, "global_step": 162961, "epoch": 3880} {"train_loss": -6.928372383117676, "global_step": 162962, "epoch": 3880} {"train_loss": -6.987117290496826, "global_step": 162963, "epoch": 3880} {"train_loss": -6.991503715515137, "global_step": 162964, "epoch": 3880} {"train_loss": -6.9165754318237305, "global_step": 162965, "epoch": 3880} {"train_loss": -7.075867652893066, "global_step": 162966, "epoch": 3880} {"train_loss": -7.036187648773193, "global_step": 162967, "epoch": 3880} {"train_loss": -7.009607315063477, "global_step": 162968, "epoch": 3880} {"train_loss": -6.949204921722412, "global_step": 162969, "epoch": 3880} {"train_loss": -7.065563201904297, "global_step": 162970, "epoch": 3880} {"train_loss": -6.957995414733887, "global_step": 162971, "epoch": 3880} {"train_loss": -7.108737945556641, "global_step": 162972, "epoch": 3880} {"train_loss": -6.94417667388916, "global_step": 162973, "epoch": 3880} {"train_loss": -6.944880485534668, "global_step": 162974, "epoch": 3880} {"train_loss": -7.129697322845459, "global_step": 162975, "epoch": 3880} {"train_loss": -7.012104034423828, "global_step": 162976, "epoch": 3880} {"train_loss": -7.017190933227539, "global_step": 162977, "epoch": 3880} {"train_loss": -7.0324201583862305, "global_step": 162978, "epoch": 3880} {"train_loss": -6.935163974761963, "global_step": 162979, "epoch": 3880} {"train_loss": -7.090357780456543, "global_step": 162980, "epoch": 3880} {"train_loss": -6.960665225982666, "global_step": 162981, "epoch": 3880} {"train_loss": -6.913522720336914, "global_step": 162982, "epoch": 3880} {"train_loss": -7.024160385131836, "global_step": 162983, "epoch": 3880} {"train_loss": -6.91871976852417, "global_step": 162984, "epoch": 3880} {"train_loss": -6.8572492599487305, "global_step": 162985, "epoch": 3880} {"train_loss": -7.099708080291748, "global_step": 162986, "epoch": 3880} {"train_loss": -6.974569797515869, "global_step": 162987, "epoch": 3880} {"train_loss": -6.981027126312256, "global_step": 162988, "epoch": 3880} {"train_loss": -7.038577079772949, "global_step": 162989, "epoch": 3880} {"train_loss": -7.053043842315674, "global_step": 162990, "epoch": 3880} {"train_loss": -6.90809965133667, "global_step": 162991, "epoch": 3880} {"train_loss": -6.931555271148682, "global_step": 162992, "epoch": 3880} {"train_loss": -7.0433878898620605, "global_step": 162993, "epoch": 3880} {"train_loss": -7.017511367797852, "global_step": 162994, "epoch": 3880} {"train_loss": -6.940299034118652, "global_step": 162995, "epoch": 3880} {"train_loss": -7.064753532409668, "global_step": 162996, "epoch": 3880} {"train_loss": -6.937901973724365, "global_step": 162997, "epoch": 3880} {"train_loss": -7.077812671661377, "global_step": 162998, "epoch": 3880} {"train_loss": -7.075780868530273, "global_step": 162999, "epoch": 3880} {"train_loss": -6.932476043701172, "global_step": 163000, "epoch": 3880} {"train_loss": -6.995691855748494, "global_step": 163001, "epoch": 3880, "val_loss": 68630.3359375} {"train_loss": -6.955646514892578, "global_step": 163002, "epoch": 3881} {"train_loss": -6.961421012878418, "global_step": 163003, "epoch": 3881} {"train_loss": -6.9982008934021, "global_step": 163004, "epoch": 3881} {"train_loss": -7.007626056671143, "global_step": 163005, "epoch": 3881} {"train_loss": -6.976295471191406, "global_step": 163006, "epoch": 3881} {"train_loss": -6.956782817840576, "global_step": 163007, "epoch": 3881} {"train_loss": -7.034520149230957, "global_step": 163008, "epoch": 3881} {"train_loss": -6.931974411010742, "global_step": 163009, "epoch": 3881} {"train_loss": -7.029550075531006, "global_step": 163010, "epoch": 3881} {"train_loss": -7.117565631866455, "global_step": 163011, "epoch": 3881} {"train_loss": -7.005485534667969, "global_step": 163012, "epoch": 3881} {"train_loss": -6.977821350097656, "global_step": 163013, "epoch": 3881} {"train_loss": -6.837604522705078, "global_step": 163014, "epoch": 3881} {"train_loss": -7.04799222946167, "global_step": 163015, "epoch": 3881} {"train_loss": -7.003793716430664, "global_step": 163016, "epoch": 3881} {"train_loss": -7.052668571472168, "global_step": 163017, "epoch": 3881} {"train_loss": -7.042849540710449, "global_step": 163018, "epoch": 3881} {"train_loss": -7.082764625549316, "global_step": 163019, "epoch": 3881} {"train_loss": -6.961337089538574, "global_step": 163020, "epoch": 3881} {"train_loss": -7.077535629272461, "global_step": 163021, "epoch": 3881} {"train_loss": -6.90595817565918, "global_step": 163022, "epoch": 3881} {"train_loss": -7.106764793395996, "global_step": 163023, "epoch": 3881} {"train_loss": -7.116832256317139, "global_step": 163024, "epoch": 3881} {"train_loss": -7.026656627655029, "global_step": 163025, "epoch": 3881} {"train_loss": -6.990937232971191, "global_step": 163026, "epoch": 3881} {"train_loss": -7.014359474182129, "global_step": 163027, "epoch": 3881} {"train_loss": -6.797891616821289, "global_step": 163028, "epoch": 3881} {"train_loss": -6.909341812133789, "global_step": 163029, "epoch": 3881} {"train_loss": -6.90953254699707, "global_step": 163030, "epoch": 3881} {"train_loss": -6.875013828277588, "global_step": 163031, "epoch": 3881} {"train_loss": -7.085488319396973, "global_step": 163032, "epoch": 3881} {"train_loss": -6.852553367614746, "global_step": 163033, "epoch": 3881} {"train_loss": -6.9773430824279785, "global_step": 163034, "epoch": 3881} {"train_loss": -6.847875595092773, "global_step": 163035, "epoch": 3881} {"train_loss": -6.868215560913086, "global_step": 163036, "epoch": 3881} {"train_loss": -6.958483695983887, "global_step": 163037, "epoch": 3881} {"train_loss": -6.9281086921691895, "global_step": 163038, "epoch": 3881} {"train_loss": -6.903062343597412, "global_step": 163039, "epoch": 3881} {"train_loss": -6.836534023284912, "global_step": 163040, "epoch": 3881} {"train_loss": -6.955521106719971, "global_step": 163041, "epoch": 3881} {"train_loss": -6.774983882904053, "global_step": 163042, "epoch": 3881} {"train_loss": -6.967446406682332, "global_step": 163043, "epoch": 3881, "val_loss": 68844.4765625} {"train_loss": -6.99368143081665, "global_step": 163044, "epoch": 3882} {"train_loss": -6.845888137817383, "global_step": 163045, "epoch": 3882} {"train_loss": -7.004807472229004, "global_step": 163046, "epoch": 3882} {"train_loss": -6.900398254394531, "global_step": 163047, "epoch": 3882} {"train_loss": -6.885187149047852, "global_step": 163048, "epoch": 3882} {"train_loss": -7.008805751800537, "global_step": 163049, "epoch": 3882} {"train_loss": -6.90976619720459, "global_step": 163050, "epoch": 3882} {"train_loss": -7.0099334716796875, "global_step": 163051, "epoch": 3882} {"train_loss": -6.967774391174316, "global_step": 163052, "epoch": 3882} {"train_loss": -6.900040149688721, "global_step": 163053, "epoch": 3882} {"train_loss": -6.964344501495361, "global_step": 163054, "epoch": 3882} {"train_loss": -6.889608383178711, "global_step": 163055, "epoch": 3882} {"train_loss": -6.827741622924805, "global_step": 163056, "epoch": 3882} {"train_loss": -6.836625576019287, "global_step": 163057, "epoch": 3882} {"train_loss": -6.792191505432129, "global_step": 163058, "epoch": 3882} {"train_loss": -6.887022495269775, "global_step": 163059, "epoch": 3882} {"train_loss": -6.788098335266113, "global_step": 163060, "epoch": 3882} {"train_loss": -6.74273157119751, "global_step": 163061, "epoch": 3882} {"train_loss": -7.003300189971924, "global_step": 163062, "epoch": 3882} {"train_loss": -6.831094264984131, "global_step": 163063, "epoch": 3882} {"train_loss": -6.972720623016357, "global_step": 163064, "epoch": 3882} {"train_loss": -6.998147010803223, "global_step": 163065, "epoch": 3882} {"train_loss": -6.789507865905762, "global_step": 163066, "epoch": 3882} {"train_loss": -6.9114909172058105, "global_step": 163067, "epoch": 3882} {"train_loss": -6.83984375, "global_step": 163068, "epoch": 3882} {"train_loss": -6.990063190460205, "global_step": 163069, "epoch": 3882} {"train_loss": -6.798161506652832, "global_step": 163070, "epoch": 3882} {"train_loss": -6.751221656799316, "global_step": 163071, "epoch": 3882} {"train_loss": -6.963693141937256, "global_step": 163072, "epoch": 3882} {"train_loss": -6.699209213256836, "global_step": 163073, "epoch": 3882} {"train_loss": -6.985806465148926, "global_step": 163074, "epoch": 3882} {"train_loss": -6.825033187866211, "global_step": 163075, "epoch": 3882} {"train_loss": -6.9382195472717285, "global_step": 163076, "epoch": 3882} {"train_loss": -6.898330211639404, "global_step": 163077, "epoch": 3882} {"train_loss": -6.940716743469238, "global_step": 163078, "epoch": 3882} {"train_loss": -6.91972541809082, "global_step": 163079, "epoch": 3882} {"train_loss": -6.848729610443115, "global_step": 163080, "epoch": 3882} {"train_loss": -6.882813453674316, "global_step": 163081, "epoch": 3882} {"train_loss": -6.947014331817627, "global_step": 163082, "epoch": 3882} {"train_loss": -6.8308610916137695, "global_step": 163083, "epoch": 3882} {"train_loss": -6.831180572509766, "global_step": 163084, "epoch": 3882} {"train_loss": -6.889424528394427, "global_step": 163085, "epoch": 3882, "val_loss": 68701.078125} {"train_loss": -6.874697685241699, "global_step": 163086, "epoch": 3883} {"train_loss": -6.946651458740234, "global_step": 163087, "epoch": 3883} {"train_loss": -6.750994682312012, "global_step": 163088, "epoch": 3883} {"train_loss": -6.881431579589844, "global_step": 163089, "epoch": 3883} {"train_loss": -6.857024669647217, "global_step": 163090, "epoch": 3883} {"train_loss": -6.759577751159668, "global_step": 163091, "epoch": 3883} {"train_loss": -6.942108154296875, "global_step": 163092, "epoch": 3883} {"train_loss": -6.758488655090332, "global_step": 163093, "epoch": 3883} {"train_loss": -6.780396461486816, "global_step": 163094, "epoch": 3883} {"train_loss": -6.916944980621338, "global_step": 163095, "epoch": 3883} {"train_loss": -6.7681169509887695, "global_step": 163096, "epoch": 3883} {"train_loss": -6.980931758880615, "global_step": 163097, "epoch": 3883} {"train_loss": -6.7795867919921875, "global_step": 163098, "epoch": 3883} {"train_loss": -6.785858154296875, "global_step": 163099, "epoch": 3883} {"train_loss": -6.903460502624512, "global_step": 163100, "epoch": 3883} {"train_loss": -6.896448135375977, "global_step": 163101, "epoch": 3883} {"train_loss": -6.987091064453125, "global_step": 163102, "epoch": 3883} {"train_loss": -6.715335845947266, "global_step": 163103, "epoch": 3883} {"train_loss": -6.980475425720215, "global_step": 163104, "epoch": 3883} {"train_loss": -6.936022758483887, "global_step": 163105, "epoch": 3883} {"train_loss": -6.854963302612305, "global_step": 163106, "epoch": 3883} {"train_loss": -6.841897964477539, "global_step": 163107, "epoch": 3883} {"train_loss": -6.832277297973633, "global_step": 163108, "epoch": 3883} {"train_loss": -6.848183631896973, "global_step": 163109, "epoch": 3883} {"train_loss": -6.979963302612305, "global_step": 163110, "epoch": 3883} {"train_loss": -6.749729156494141, "global_step": 163111, "epoch": 3883} {"train_loss": -6.8982625007629395, "global_step": 163112, "epoch": 3883} {"train_loss": -7.007723331451416, "global_step": 163113, "epoch": 3883} {"train_loss": -6.829663276672363, "global_step": 163114, "epoch": 3883} {"train_loss": -7.014181137084961, "global_step": 163115, "epoch": 3883} {"train_loss": -6.923295021057129, "global_step": 163116, "epoch": 3883} {"train_loss": -6.879828453063965, "global_step": 163117, "epoch": 3883} {"train_loss": -7.035558223724365, "global_step": 163118, "epoch": 3883} {"train_loss": -7.0927019119262695, "global_step": 163119, "epoch": 3883} {"train_loss": -6.934587001800537, "global_step": 163120, "epoch": 3883} {"train_loss": -6.972187042236328, "global_step": 163121, "epoch": 3883} {"train_loss": -6.9535627365112305, "global_step": 163122, "epoch": 3883} {"train_loss": -6.994799613952637, "global_step": 163123, "epoch": 3883} {"train_loss": -6.997986793518066, "global_step": 163124, "epoch": 3883} {"train_loss": -7.055548191070557, "global_step": 163125, "epoch": 3883} {"train_loss": -7.021899223327637, "global_step": 163126, "epoch": 3883} {"train_loss": -6.90212557429359, "global_step": 163127, "epoch": 3883, "val_loss": 68712.890625} {"train_loss": -6.9615068435668945, "global_step": 163128, "epoch": 3884} {"train_loss": -7.0048346519470215, "global_step": 163129, "epoch": 3884} {"train_loss": -7.001930236816406, "global_step": 163130, "epoch": 3884} {"train_loss": -7.03196907043457, "global_step": 163131, "epoch": 3884} {"train_loss": -6.979546546936035, "global_step": 163132, "epoch": 3884} {"train_loss": -7.035743713378906, "global_step": 163133, "epoch": 3884} {"train_loss": -7.058992385864258, "global_step": 163134, "epoch": 3884} {"train_loss": -6.9679274559021, "global_step": 163135, "epoch": 3884} {"train_loss": -7.099306583404541, "global_step": 163136, "epoch": 3884} {"train_loss": -6.917085647583008, "global_step": 163137, "epoch": 3884} {"train_loss": -7.018286228179932, "global_step": 163138, "epoch": 3884} {"train_loss": -7.039777755737305, "global_step": 163139, "epoch": 3884} {"train_loss": -7.000611305236816, "global_step": 163140, "epoch": 3884} {"train_loss": -6.968655586242676, "global_step": 163141, "epoch": 3884} {"train_loss": -6.996410369873047, "global_step": 163142, "epoch": 3884} {"train_loss": -6.927646636962891, "global_step": 163143, "epoch": 3884} {"train_loss": -7.120572090148926, "global_step": 163144, "epoch": 3884} {"train_loss": -7.0060038566589355, "global_step": 163145, "epoch": 3884} {"train_loss": -6.866812705993652, "global_step": 163146, "epoch": 3884} {"train_loss": -6.973263740539551, "global_step": 163147, "epoch": 3884} {"train_loss": -6.973238945007324, "global_step": 163148, "epoch": 3884} {"train_loss": -7.0058674812316895, "global_step": 163149, "epoch": 3884} {"train_loss": -7.07859992980957, "global_step": 163150, "epoch": 3884} {"train_loss": -7.087807655334473, "global_step": 163151, "epoch": 3884} {"train_loss": -6.957390785217285, "global_step": 163152, "epoch": 3884} {"train_loss": -7.0484442710876465, "global_step": 163153, "epoch": 3884} {"train_loss": -6.918160915374756, "global_step": 163154, "epoch": 3884} {"train_loss": -6.928841590881348, "global_step": 163155, "epoch": 3884} {"train_loss": -6.984681129455566, "global_step": 163156, "epoch": 3884} {"train_loss": -7.011516094207764, "global_step": 163157, "epoch": 3884} {"train_loss": -6.922120571136475, "global_step": 163158, "epoch": 3884} {"train_loss": -7.077617168426514, "global_step": 163159, "epoch": 3884} {"train_loss": -6.993106842041016, "global_step": 163160, "epoch": 3884} {"train_loss": -7.070967197418213, "global_step": 163161, "epoch": 3884} {"train_loss": -6.9531450271606445, "global_step": 163162, "epoch": 3884} {"train_loss": -7.036746025085449, "global_step": 163163, "epoch": 3884} {"train_loss": -7.0245819091796875, "global_step": 163164, "epoch": 3884} {"train_loss": -7.007124900817871, "global_step": 163165, "epoch": 3884} {"train_loss": -6.933584213256836, "global_step": 163166, "epoch": 3884} {"train_loss": -7.0377302169799805, "global_step": 163167, "epoch": 3884} {"train_loss": -6.964683532714844, "global_step": 163168, "epoch": 3884} {"train_loss": -7.000385011945452, "global_step": 163169, "epoch": 3884, "val_loss": 68674.53125} {"train_loss": -7.168351173400879, "global_step": 163170, "epoch": 3885} {"train_loss": -7.0111403465271, "global_step": 163171, "epoch": 3885} {"train_loss": -6.959375381469727, "global_step": 163172, "epoch": 3885} {"train_loss": -7.005764484405518, "global_step": 163173, "epoch": 3885} {"train_loss": -6.966361045837402, "global_step": 163174, "epoch": 3885} {"train_loss": -6.992563724517822, "global_step": 163175, "epoch": 3885} {"train_loss": -7.097304344177246, "global_step": 163176, "epoch": 3885} {"train_loss": -6.998429298400879, "global_step": 163177, "epoch": 3885} {"train_loss": -6.996988296508789, "global_step": 163178, "epoch": 3885} {"train_loss": -7.075013637542725, "global_step": 163179, "epoch": 3885} {"train_loss": -7.049415588378906, "global_step": 163180, "epoch": 3885} {"train_loss": -7.022453308105469, "global_step": 163181, "epoch": 3885} {"train_loss": -6.955756187438965, "global_step": 163182, "epoch": 3885} {"train_loss": -6.998480796813965, "global_step": 163183, "epoch": 3885} {"train_loss": -6.9997382164001465, "global_step": 163184, "epoch": 3885} {"train_loss": -6.99794340133667, "global_step": 163185, "epoch": 3885} {"train_loss": -6.894520282745361, "global_step": 163186, "epoch": 3885} {"train_loss": -6.97933292388916, "global_step": 163187, "epoch": 3885} {"train_loss": -6.979614734649658, "global_step": 163188, "epoch": 3885} {"train_loss": -7.053201675415039, "global_step": 163189, "epoch": 3885} {"train_loss": -6.931355953216553, "global_step": 163190, "epoch": 3885} {"train_loss": -6.935329914093018, "global_step": 163191, "epoch": 3885} {"train_loss": -6.941382884979248, "global_step": 163192, "epoch": 3885} {"train_loss": -7.071402549743652, "global_step": 163193, "epoch": 3885} {"train_loss": -6.914908409118652, "global_step": 163194, "epoch": 3885} {"train_loss": -7.079935073852539, "global_step": 163195, "epoch": 3885} {"train_loss": -7.018174171447754, "global_step": 163196, "epoch": 3885} {"train_loss": -6.798812389373779, "global_step": 163197, "epoch": 3885} {"train_loss": -7.1237921714782715, "global_step": 163198, "epoch": 3885} {"train_loss": -7.060161113739014, "global_step": 163199, "epoch": 3885} {"train_loss": -7.112872123718262, "global_step": 163200, "epoch": 3885} {"train_loss": -6.992853164672852, "global_step": 163201, "epoch": 3885} {"train_loss": -6.971283435821533, "global_step": 163202, "epoch": 3885} {"train_loss": -7.026056289672852, "global_step": 163203, "epoch": 3885} {"train_loss": -7.02963924407959, "global_step": 163204, "epoch": 3885} {"train_loss": -6.9942426681518555, "global_step": 163205, "epoch": 3885} {"train_loss": -6.924019813537598, "global_step": 163206, "epoch": 3885} {"train_loss": -6.962405204772949, "global_step": 163207, "epoch": 3885} {"train_loss": -7.070923805236816, "global_step": 163208, "epoch": 3885} {"train_loss": -6.972026824951172, "global_step": 163209, "epoch": 3885} {"train_loss": -6.954193115234375, "global_step": 163210, "epoch": 3885} {"train_loss": -7.003589119229998, "global_step": 163211, "epoch": 3885, "val_loss": 68715.7421875} {"train_loss": -7.041659355163574, "global_step": 163212, "epoch": 3886} {"train_loss": -7.086582183837891, "global_step": 163213, "epoch": 3886} {"train_loss": -7.074636459350586, "global_step": 163214, "epoch": 3886} {"train_loss": -6.992654323577881, "global_step": 163215, "epoch": 3886} {"train_loss": -7.080683708190918, "global_step": 163216, "epoch": 3886} {"train_loss": -6.932773113250732, "global_step": 163217, "epoch": 3886} {"train_loss": -6.80213737487793, "global_step": 163218, "epoch": 3886} {"train_loss": -7.055527210235596, "global_step": 163219, "epoch": 3886} {"train_loss": -6.915541648864746, "global_step": 163220, "epoch": 3886} {"train_loss": -7.034355163574219, "global_step": 163221, "epoch": 3886} {"train_loss": -6.959986686706543, "global_step": 163222, "epoch": 3886} {"train_loss": -6.920615196228027, "global_step": 163223, "epoch": 3886} {"train_loss": -6.992719650268555, "global_step": 163224, "epoch": 3886} {"train_loss": -6.972090721130371, "global_step": 163225, "epoch": 3886} {"train_loss": -7.005758762359619, "global_step": 163226, "epoch": 3886} {"train_loss": -6.905076026916504, "global_step": 163227, "epoch": 3886} {"train_loss": -6.954965114593506, "global_step": 163228, "epoch": 3886} {"train_loss": -6.877231121063232, "global_step": 163229, "epoch": 3886} {"train_loss": -6.951177597045898, "global_step": 163230, "epoch": 3886} {"train_loss": -6.9321489334106445, "global_step": 163231, "epoch": 3886} {"train_loss": -6.786202907562256, "global_step": 163232, "epoch": 3886} {"train_loss": -6.973773002624512, "global_step": 163233, "epoch": 3886} {"train_loss": -6.910749435424805, "global_step": 163234, "epoch": 3886} {"train_loss": -6.804736614227295, "global_step": 163235, "epoch": 3886} {"train_loss": -6.812255859375, "global_step": 163236, "epoch": 3886} {"train_loss": -6.839779376983643, "global_step": 163237, "epoch": 3886} {"train_loss": -6.921652793884277, "global_step": 163238, "epoch": 3886} {"train_loss": -7.013299942016602, "global_step": 163239, "epoch": 3886} {"train_loss": -7.008612155914307, "global_step": 163240, "epoch": 3886} {"train_loss": -7.011268615722656, "global_step": 163241, "epoch": 3886} {"train_loss": -6.957512855529785, "global_step": 163242, "epoch": 3886} {"train_loss": -6.942080497741699, "global_step": 163243, "epoch": 3886} {"train_loss": -6.996899604797363, "global_step": 163244, "epoch": 3886} {"train_loss": -6.872505187988281, "global_step": 163245, "epoch": 3886} {"train_loss": -7.039016246795654, "global_step": 163246, "epoch": 3886} {"train_loss": -6.8748040199279785, "global_step": 163247, "epoch": 3886} {"train_loss": -6.882786750793457, "global_step": 163248, "epoch": 3886} {"train_loss": -6.961519241333008, "global_step": 163249, "epoch": 3886} {"train_loss": -6.893279552459717, "global_step": 163250, "epoch": 3886} {"train_loss": -6.87528133392334, "global_step": 163251, "epoch": 3886} {"train_loss": -6.99353551864624, "global_step": 163252, "epoch": 3886} {"train_loss": -6.945310569944835, "global_step": 163253, "epoch": 3886, "val_loss": 68768.171875} {"train_loss": -6.955855369567871, "global_step": 163254, "epoch": 3887} {"train_loss": -6.890171051025391, "global_step": 163255, "epoch": 3887} {"train_loss": -6.93265438079834, "global_step": 163256, "epoch": 3887} {"train_loss": -6.916104316711426, "global_step": 163257, "epoch": 3887} {"train_loss": -7.028310775756836, "global_step": 163258, "epoch": 3887} {"train_loss": -6.964303016662598, "global_step": 163259, "epoch": 3887} {"train_loss": -7.026597023010254, "global_step": 163260, "epoch": 3887} {"train_loss": -7.003650665283203, "global_step": 163261, "epoch": 3887} {"train_loss": -6.938345909118652, "global_step": 163262, "epoch": 3887} {"train_loss": -6.959676742553711, "global_step": 163263, "epoch": 3887} {"train_loss": -6.962449073791504, "global_step": 163264, "epoch": 3887} {"train_loss": -7.007404327392578, "global_step": 163265, "epoch": 3887} {"train_loss": -7.0132832527160645, "global_step": 163266, "epoch": 3887} {"train_loss": -6.921207427978516, "global_step": 163267, "epoch": 3887} {"train_loss": -6.81838846206665, "global_step": 163268, "epoch": 3887} {"train_loss": -6.881546497344971, "global_step": 163269, "epoch": 3887} {"train_loss": -7.023967742919922, "global_step": 163270, "epoch": 3887} {"train_loss": -6.920840263366699, "global_step": 163271, "epoch": 3887} {"train_loss": -7.000710964202881, "global_step": 163272, "epoch": 3887} {"train_loss": -6.969419479370117, "global_step": 163273, "epoch": 3887} {"train_loss": -6.844978332519531, "global_step": 163274, "epoch": 3887} {"train_loss": -6.827004432678223, "global_step": 163275, "epoch": 3887} {"train_loss": -7.000298976898193, "global_step": 163276, "epoch": 3887} {"train_loss": -6.953530788421631, "global_step": 163277, "epoch": 3887} {"train_loss": -6.885518550872803, "global_step": 163278, "epoch": 3887} {"train_loss": -6.944859504699707, "global_step": 163279, "epoch": 3887} {"train_loss": -6.783239364624023, "global_step": 163280, "epoch": 3887} {"train_loss": -6.992614269256592, "global_step": 163281, "epoch": 3887} {"train_loss": -6.880890846252441, "global_step": 163282, "epoch": 3887} {"train_loss": -6.9824652671813965, "global_step": 163283, "epoch": 3887} {"train_loss": -6.9272894859313965, "global_step": 163284, "epoch": 3887} {"train_loss": -7.021054744720459, "global_step": 163285, "epoch": 3887} {"train_loss": -6.983524322509766, "global_step": 163286, "epoch": 3887} {"train_loss": -6.845280647277832, "global_step": 163287, "epoch": 3887} {"train_loss": -6.954839706420898, "global_step": 163288, "epoch": 3887} {"train_loss": -6.991484642028809, "global_step": 163289, "epoch": 3887} {"train_loss": -6.987380027770996, "global_step": 163290, "epoch": 3887} {"train_loss": -7.032983779907227, "global_step": 163291, "epoch": 3887} {"train_loss": -7.003918647766113, "global_step": 163292, "epoch": 3887} {"train_loss": -7.029976844787598, "global_step": 163293, "epoch": 3887} {"train_loss": -7.057439804077148, "global_step": 163294, "epoch": 3887} {"train_loss": -6.9546388785044355, "global_step": 163295, "epoch": 3887, "val_loss": 68535.078125} {"train_loss": -7.085556983947754, "global_step": 163296, "epoch": 3888} {"train_loss": -7.034936904907227, "global_step": 163297, "epoch": 3888} {"train_loss": -6.9585957527160645, "global_step": 163298, "epoch": 3888} {"train_loss": -7.089653015136719, "global_step": 163299, "epoch": 3888} {"train_loss": -7.050137519836426, "global_step": 163300, "epoch": 3888} {"train_loss": -6.888649940490723, "global_step": 163301, "epoch": 3888} {"train_loss": -7.035370826721191, "global_step": 163302, "epoch": 3888} {"train_loss": -6.9914703369140625, "global_step": 163303, "epoch": 3888} {"train_loss": -6.926849365234375, "global_step": 163304, "epoch": 3888} {"train_loss": -7.022394180297852, "global_step": 163305, "epoch": 3888} {"train_loss": -6.913699150085449, "global_step": 163306, "epoch": 3888} {"train_loss": -6.878839492797852, "global_step": 163307, "epoch": 3888} {"train_loss": -6.920892715454102, "global_step": 163308, "epoch": 3888} {"train_loss": -6.975873947143555, "global_step": 163309, "epoch": 3888} {"train_loss": -6.914087295532227, "global_step": 163310, "epoch": 3888} {"train_loss": -6.863442420959473, "global_step": 163311, "epoch": 3888} {"train_loss": -6.946149826049805, "global_step": 163312, "epoch": 3888} {"train_loss": -6.853363037109375, "global_step": 163313, "epoch": 3888} {"train_loss": -6.897371292114258, "global_step": 163314, "epoch": 3888} {"train_loss": -7.0231852531433105, "global_step": 163315, "epoch": 3888} {"train_loss": -6.8612165451049805, "global_step": 163316, "epoch": 3888} {"train_loss": -6.998552322387695, "global_step": 163317, "epoch": 3888} {"train_loss": -6.987270355224609, "global_step": 163318, "epoch": 3888} {"train_loss": -6.956604957580566, "global_step": 163319, "epoch": 3888} {"train_loss": -7.088305473327637, "global_step": 163320, "epoch": 3888} {"train_loss": -7.027195930480957, "global_step": 163321, "epoch": 3888} {"train_loss": -6.896196365356445, "global_step": 163322, "epoch": 3888} {"train_loss": -6.959460735321045, "global_step": 163323, "epoch": 3888} {"train_loss": -6.959161758422852, "global_step": 163324, "epoch": 3888} {"train_loss": -6.815676689147949, "global_step": 163325, "epoch": 3888} {"train_loss": -6.954905033111572, "global_step": 163326, "epoch": 3888} {"train_loss": -6.958393096923828, "global_step": 163327, "epoch": 3888} {"train_loss": -6.909433364868164, "global_step": 163328, "epoch": 3888} {"train_loss": -7.032587051391602, "global_step": 163329, "epoch": 3888} {"train_loss": -6.8249664306640625, "global_step": 163330, "epoch": 3888} {"train_loss": -6.941962242126465, "global_step": 163331, "epoch": 3888} {"train_loss": -7.013157844543457, "global_step": 163332, "epoch": 3888} {"train_loss": -6.946567058563232, "global_step": 163333, "epoch": 3888} {"train_loss": -6.9554924964904785, "global_step": 163334, "epoch": 3888} {"train_loss": -6.89632511138916, "global_step": 163335, "epoch": 3888} {"train_loss": -7.028620719909668, "global_step": 163336, "epoch": 3888} {"train_loss": -6.955908366612026, "global_step": 163337, "epoch": 3888, "val_loss": 68525.578125} {"train_loss": -6.9966206550598145, "global_step": 163338, "epoch": 3889} {"train_loss": -6.992641448974609, "global_step": 163339, "epoch": 3889} {"train_loss": -6.955440044403076, "global_step": 163340, "epoch": 3889} {"train_loss": -6.919387340545654, "global_step": 163341, "epoch": 3889} {"train_loss": -7.017526626586914, "global_step": 163342, "epoch": 3889} {"train_loss": -7.002969264984131, "global_step": 163343, "epoch": 3889} {"train_loss": -6.997600078582764, "global_step": 163344, "epoch": 3889} {"train_loss": -6.931983947753906, "global_step": 163345, "epoch": 3889} {"train_loss": -6.9816484451293945, "global_step": 163346, "epoch": 3889} {"train_loss": -6.9256486892700195, "global_step": 163347, "epoch": 3889} {"train_loss": -6.982382774353027, "global_step": 163348, "epoch": 3889} {"train_loss": -6.938057899475098, "global_step": 163349, "epoch": 3889} {"train_loss": -6.840716361999512, "global_step": 163350, "epoch": 3889} {"train_loss": -7.047651290893555, "global_step": 163351, "epoch": 3889} {"train_loss": -6.882679462432861, "global_step": 163352, "epoch": 3889} {"train_loss": -6.829286575317383, "global_step": 163353, "epoch": 3889} {"train_loss": -7.071166515350342, "global_step": 163354, "epoch": 3889} {"train_loss": -6.827040195465088, "global_step": 163355, "epoch": 3889} {"train_loss": -7.078681945800781, "global_step": 163356, "epoch": 3889} {"train_loss": -6.929251194000244, "global_step": 163357, "epoch": 3889} {"train_loss": -6.934537887573242, "global_step": 163358, "epoch": 3889} {"train_loss": -6.90758752822876, "global_step": 163359, "epoch": 3889} {"train_loss": -6.915053367614746, "global_step": 163360, "epoch": 3889} {"train_loss": -7.041419982910156, "global_step": 163361, "epoch": 3889} {"train_loss": -6.875618934631348, "global_step": 163362, "epoch": 3889} {"train_loss": -6.935940742492676, "global_step": 163363, "epoch": 3889} {"train_loss": -6.880107879638672, "global_step": 163364, "epoch": 3889} {"train_loss": -6.959233283996582, "global_step": 163365, "epoch": 3889} {"train_loss": -6.927206516265869, "global_step": 163366, "epoch": 3889} {"train_loss": -6.873261451721191, "global_step": 163367, "epoch": 3889} {"train_loss": -7.014143943786621, "global_step": 163368, "epoch": 3889} {"train_loss": -7.011397361755371, "global_step": 163369, "epoch": 3889} {"train_loss": -6.9246931076049805, "global_step": 163370, "epoch": 3889} {"train_loss": -6.9701619148254395, "global_step": 163371, "epoch": 3889} {"train_loss": -7.033939838409424, "global_step": 163372, "epoch": 3889} {"train_loss": -6.764494895935059, "global_step": 163373, "epoch": 3889} {"train_loss": -7.008584022521973, "global_step": 163374, "epoch": 3889} {"train_loss": -6.839503765106201, "global_step": 163375, "epoch": 3889} {"train_loss": -6.919852256774902, "global_step": 163376, "epoch": 3889} {"train_loss": -6.946462631225586, "global_step": 163377, "epoch": 3889} {"train_loss": -6.968966960906982, "global_step": 163378, "epoch": 3889} {"train_loss": -6.946590366817656, "global_step": 163379, "epoch": 3889, "val_loss": 68896.5234375} {"train_loss": -6.660327434539795, "global_step": 163380, "epoch": 3890} {"train_loss": -6.886013031005859, "global_step": 163381, "epoch": 3890} {"train_loss": -6.670026779174805, "global_step": 163382, "epoch": 3890} {"train_loss": -6.809523105621338, "global_step": 163383, "epoch": 3890} {"train_loss": -6.819637298583984, "global_step": 163384, "epoch": 3890} {"train_loss": -6.792140483856201, "global_step": 163385, "epoch": 3890} {"train_loss": -6.874472618103027, "global_step": 163386, "epoch": 3890} {"train_loss": -6.742956161499023, "global_step": 163387, "epoch": 3890} {"train_loss": -7.018575668334961, "global_step": 163388, "epoch": 3890} {"train_loss": -6.829092979431152, "global_step": 163389, "epoch": 3890} {"train_loss": -6.84512996673584, "global_step": 163390, "epoch": 3890} {"train_loss": -6.821849346160889, "global_step": 163391, "epoch": 3890} {"train_loss": -6.914497375488281, "global_step": 163392, "epoch": 3890} {"train_loss": -6.967714309692383, "global_step": 163393, "epoch": 3890} {"train_loss": -6.851385116577148, "global_step": 163394, "epoch": 3890} {"train_loss": -6.910357475280762, "global_step": 163395, "epoch": 3890} {"train_loss": -6.920315742492676, "global_step": 163396, "epoch": 3890} {"train_loss": -6.966311454772949, "global_step": 163397, "epoch": 3890} {"train_loss": -6.90980339050293, "global_step": 163398, "epoch": 3890} {"train_loss": -6.972997665405273, "global_step": 163399, "epoch": 3890} {"train_loss": -6.998838424682617, "global_step": 163400, "epoch": 3890} {"train_loss": -6.986150741577148, "global_step": 163401, "epoch": 3890} {"train_loss": -6.888775825500488, "global_step": 163402, "epoch": 3890} {"train_loss": -7.0471367835998535, "global_step": 163403, "epoch": 3890} {"train_loss": -6.994165420532227, "global_step": 163404, "epoch": 3890} {"train_loss": -6.973505973815918, "global_step": 163405, "epoch": 3890} {"train_loss": -6.990511894226074, "global_step": 163406, "epoch": 3890} {"train_loss": -6.910647392272949, "global_step": 163407, "epoch": 3890} {"train_loss": -7.025750160217285, "global_step": 163408, "epoch": 3890} {"train_loss": -6.894821643829346, "global_step": 163409, "epoch": 3890} {"train_loss": -7.0152201652526855, "global_step": 163410, "epoch": 3890} {"train_loss": -6.967949867248535, "global_step": 163411, "epoch": 3890} {"train_loss": -7.003209114074707, "global_step": 163412, "epoch": 3890} {"train_loss": -7.065476894378662, "global_step": 163413, "epoch": 3890} {"train_loss": -7.005924224853516, "global_step": 163414, "epoch": 3890} {"train_loss": -7.0240607261657715, "global_step": 163415, "epoch": 3890} {"train_loss": -7.093420505523682, "global_step": 163416, "epoch": 3890} {"train_loss": -7.048612594604492, "global_step": 163417, "epoch": 3890} {"train_loss": -7.002380847930908, "global_step": 163418, "epoch": 3890} {"train_loss": -6.979493141174316, "global_step": 163419, "epoch": 3890} {"train_loss": -6.998276710510254, "global_step": 163420, "epoch": 3890} {"train_loss": -6.931049744288127, "global_step": 163421, "epoch": 3890, "val_loss": 68597.546875} {"train_loss": -6.86361026763916, "global_step": 163422, "epoch": 3891} {"train_loss": -7.100214004516602, "global_step": 163423, "epoch": 3891} {"train_loss": -6.932123184204102, "global_step": 163424, "epoch": 3891} {"train_loss": -6.8413190841674805, "global_step": 163425, "epoch": 3891} {"train_loss": -6.996304035186768, "global_step": 163426, "epoch": 3891} {"train_loss": -6.796669960021973, "global_step": 163427, "epoch": 3891} {"train_loss": -6.91329288482666, "global_step": 163428, "epoch": 3891} {"train_loss": -6.8521270751953125, "global_step": 163429, "epoch": 3891} {"train_loss": -6.836184978485107, "global_step": 163430, "epoch": 3891} {"train_loss": -6.929196834564209, "global_step": 163431, "epoch": 3891} {"train_loss": -6.8731584548950195, "global_step": 163432, "epoch": 3891} {"train_loss": -6.9132161140441895, "global_step": 163433, "epoch": 3891} {"train_loss": -6.903595924377441, "global_step": 163434, "epoch": 3891} {"train_loss": -6.940884590148926, "global_step": 163435, "epoch": 3891} {"train_loss": -7.012049674987793, "global_step": 163436, "epoch": 3891} {"train_loss": -6.978708267211914, "global_step": 163437, "epoch": 3891} {"train_loss": -6.930981159210205, "global_step": 163438, "epoch": 3891} {"train_loss": -7.002071380615234, "global_step": 163439, "epoch": 3891} {"train_loss": -6.95164680480957, "global_step": 163440, "epoch": 3891} {"train_loss": -6.867631912231445, "global_step": 163441, "epoch": 3891} {"train_loss": -7.005949974060059, "global_step": 163442, "epoch": 3891} {"train_loss": -7.009035110473633, "global_step": 163443, "epoch": 3891} {"train_loss": -6.968690872192383, "global_step": 163444, "epoch": 3891} {"train_loss": -7.121960163116455, "global_step": 163445, "epoch": 3891} {"train_loss": -6.969236373901367, "global_step": 163446, "epoch": 3891} {"train_loss": -6.938992023468018, "global_step": 163447, "epoch": 3891} {"train_loss": -6.991322994232178, "global_step": 163448, "epoch": 3891} {"train_loss": -6.958993434906006, "global_step": 163449, "epoch": 3891} {"train_loss": -7.005771636962891, "global_step": 163450, "epoch": 3891} {"train_loss": -6.944131851196289, "global_step": 163451, "epoch": 3891} {"train_loss": -7.071062088012695, "global_step": 163452, "epoch": 3891} {"train_loss": -6.990772247314453, "global_step": 163453, "epoch": 3891} {"train_loss": -7.050411224365234, "global_step": 163454, "epoch": 3891} {"train_loss": -7.005719184875488, "global_step": 163455, "epoch": 3891} {"train_loss": -6.993819236755371, "global_step": 163456, "epoch": 3891} {"train_loss": -7.080844879150391, "global_step": 163457, "epoch": 3891} {"train_loss": -7.006861686706543, "global_step": 163458, "epoch": 3891} {"train_loss": -7.07199764251709, "global_step": 163459, "epoch": 3891} {"train_loss": -7.077489852905273, "global_step": 163460, "epoch": 3891} {"train_loss": -7.074450969696045, "global_step": 163461, "epoch": 3891} {"train_loss": -7.0066304206848145, "global_step": 163462, "epoch": 3891} {"train_loss": -6.9721510637374156, "global_step": 163463, "epoch": 3891, "val_loss": 68620.5625} {"train_loss": -7.062743186950684, "global_step": 163464, "epoch": 3892} {"train_loss": -7.082208633422852, "global_step": 163465, "epoch": 3892} {"train_loss": -7.07729434967041, "global_step": 163466, "epoch": 3892} {"train_loss": -6.985062599182129, "global_step": 163467, "epoch": 3892} {"train_loss": -7.057050704956055, "global_step": 163468, "epoch": 3892} {"train_loss": -7.174185752868652, "global_step": 163469, "epoch": 3892} {"train_loss": -7.101870536804199, "global_step": 163470, "epoch": 3892} {"train_loss": -6.990880966186523, "global_step": 163471, "epoch": 3892} {"train_loss": -7.008252143859863, "global_step": 163472, "epoch": 3892} {"train_loss": -6.92390251159668, "global_step": 163473, "epoch": 3892} {"train_loss": -6.880466938018799, "global_step": 163474, "epoch": 3892} {"train_loss": -7.08193302154541, "global_step": 163475, "epoch": 3892} {"train_loss": -6.903279781341553, "global_step": 163476, "epoch": 3892} {"train_loss": -6.969278335571289, "global_step": 163477, "epoch": 3892} {"train_loss": -7.089888095855713, "global_step": 163478, "epoch": 3892} {"train_loss": -7.05534553527832, "global_step": 163479, "epoch": 3892} {"train_loss": -6.926581382751465, "global_step": 163480, "epoch": 3892} {"train_loss": -6.901433944702148, "global_step": 163481, "epoch": 3892} {"train_loss": -7.038360118865967, "global_step": 163482, "epoch": 3892} {"train_loss": -7.043166160583496, "global_step": 163483, "epoch": 3892} {"train_loss": -7.079952716827393, "global_step": 163484, "epoch": 3892} {"train_loss": -7.063717842102051, "global_step": 163485, "epoch": 3892} {"train_loss": -6.982044219970703, "global_step": 163486, "epoch": 3892} {"train_loss": -6.998347759246826, "global_step": 163487, "epoch": 3892} {"train_loss": -7.039977073669434, "global_step": 163488, "epoch": 3892} {"train_loss": -6.928063869476318, "global_step": 163489, "epoch": 3892} {"train_loss": -6.966311454772949, "global_step": 163490, "epoch": 3892} {"train_loss": -7.029468536376953, "global_step": 163491, "epoch": 3892} {"train_loss": -6.94928503036499, "global_step": 163492, "epoch": 3892} {"train_loss": -7.04218053817749, "global_step": 163493, "epoch": 3892} {"train_loss": -6.968099594116211, "global_step": 163494, "epoch": 3892} {"train_loss": -7.125673294067383, "global_step": 163495, "epoch": 3892} {"train_loss": -7.034247398376465, "global_step": 163496, "epoch": 3892} {"train_loss": -7.00217342376709, "global_step": 163497, "epoch": 3892} {"train_loss": -6.950684547424316, "global_step": 163498, "epoch": 3892} {"train_loss": -6.945469856262207, "global_step": 163499, "epoch": 3892} {"train_loss": -7.082016944885254, "global_step": 163500, "epoch": 3892} {"train_loss": -6.890993118286133, "global_step": 163501, "epoch": 3892} {"train_loss": -7.065629959106445, "global_step": 163502, "epoch": 3892} {"train_loss": -6.945216178894043, "global_step": 163503, "epoch": 3892} {"train_loss": -7.0481977462768555, "global_step": 163504, "epoch": 3892} {"train_loss": -7.010584036509196, "global_step": 163505, "epoch": 3892, "val_loss": 69087.7734375} {"train_loss": -6.9939093589782715, "global_step": 163506, "epoch": 3893} {"train_loss": -6.843868255615234, "global_step": 163507, "epoch": 3893} {"train_loss": -6.962983131408691, "global_step": 163508, "epoch": 3893} {"train_loss": -6.948565483093262, "global_step": 163509, "epoch": 3893} {"train_loss": -7.018910884857178, "global_step": 163510, "epoch": 3893} {"train_loss": -7.022725582122803, "global_step": 163511, "epoch": 3893} {"train_loss": -7.0106000900268555, "global_step": 163512, "epoch": 3893} {"train_loss": -6.916421890258789, "global_step": 163513, "epoch": 3893} {"train_loss": -7.019828796386719, "global_step": 163514, "epoch": 3893} {"train_loss": -6.970852851867676, "global_step": 163515, "epoch": 3893} {"train_loss": -6.928114891052246, "global_step": 163516, "epoch": 3893} {"train_loss": -6.983166694641113, "global_step": 163517, "epoch": 3893} {"train_loss": -6.998654365539551, "global_step": 163518, "epoch": 3893} {"train_loss": -6.90519905090332, "global_step": 163519, "epoch": 3893} {"train_loss": -6.86734676361084, "global_step": 163520, "epoch": 3893} {"train_loss": -7.0320940017700195, "global_step": 163521, "epoch": 3893} {"train_loss": -6.855340003967285, "global_step": 163522, "epoch": 3893} {"train_loss": -6.895365238189697, "global_step": 163523, "epoch": 3893} {"train_loss": -6.937394142150879, "global_step": 163524, "epoch": 3893} {"train_loss": -6.995904922485352, "global_step": 163525, "epoch": 3893} {"train_loss": -6.85224723815918, "global_step": 163526, "epoch": 3893} {"train_loss": -7.107987403869629, "global_step": 163527, "epoch": 3893} {"train_loss": -7.030045032501221, "global_step": 163528, "epoch": 3893} {"train_loss": -7.1314239501953125, "global_step": 163529, "epoch": 3893} {"train_loss": -7.065311431884766, "global_step": 163530, "epoch": 3893} {"train_loss": -7.026406764984131, "global_step": 163531, "epoch": 3893} {"train_loss": -7.044524192810059, "global_step": 163532, "epoch": 3893} {"train_loss": -6.982301712036133, "global_step": 163533, "epoch": 3893} {"train_loss": -6.890175819396973, "global_step": 163534, "epoch": 3893} {"train_loss": -7.001559734344482, "global_step": 163535, "epoch": 3893} {"train_loss": -6.989015579223633, "global_step": 163536, "epoch": 3893} {"train_loss": -7.0204997062683105, "global_step": 163537, "epoch": 3893} {"train_loss": -7.041570663452148, "global_step": 163538, "epoch": 3893} {"train_loss": -7.049949645996094, "global_step": 163539, "epoch": 3893} {"train_loss": -7.001034736633301, "global_step": 163540, "epoch": 3893} {"train_loss": -7.055864334106445, "global_step": 163541, "epoch": 3893} {"train_loss": -6.952284812927246, "global_step": 163542, "epoch": 3893} {"train_loss": -6.994444847106934, "global_step": 163543, "epoch": 3893} {"train_loss": -7.053606986999512, "global_step": 163544, "epoch": 3893} {"train_loss": -6.917612075805664, "global_step": 163545, "epoch": 3893} {"train_loss": -6.970735549926758, "global_step": 163546, "epoch": 3893} {"train_loss": -6.9825442518506735, "global_step": 163547, "epoch": 3893, "val_loss": 68673.5078125} {"train_loss": -7.005892753601074, "global_step": 163548, "epoch": 3894} {"train_loss": -6.990830421447754, "global_step": 163549, "epoch": 3894} {"train_loss": -6.9910149574279785, "global_step": 163550, "epoch": 3894} {"train_loss": -7.107465744018555, "global_step": 163551, "epoch": 3894} {"train_loss": -6.927554130554199, "global_step": 163552, "epoch": 3894} {"train_loss": -7.054685592651367, "global_step": 163553, "epoch": 3894} {"train_loss": -6.935208320617676, "global_step": 163554, "epoch": 3894} {"train_loss": -6.997176170349121, "global_step": 163555, "epoch": 3894} {"train_loss": -6.90745735168457, "global_step": 163556, "epoch": 3894} {"train_loss": -6.932082176208496, "global_step": 163557, "epoch": 3894} {"train_loss": -7.016358375549316, "global_step": 163558, "epoch": 3894} {"train_loss": -6.951879501342773, "global_step": 163559, "epoch": 3894} {"train_loss": -6.92517614364624, "global_step": 163560, "epoch": 3894} {"train_loss": -6.996110439300537, "global_step": 163561, "epoch": 3894} {"train_loss": -6.889742374420166, "global_step": 163562, "epoch": 3894} {"train_loss": -6.9365034103393555, "global_step": 163563, "epoch": 3894} {"train_loss": -7.035597324371338, "global_step": 163564, "epoch": 3894} {"train_loss": -6.91162109375, "global_step": 163565, "epoch": 3894} {"train_loss": -6.953090667724609, "global_step": 163566, "epoch": 3894} {"train_loss": -6.933853626251221, "global_step": 163567, "epoch": 3894} {"train_loss": -7.086365699768066, "global_step": 163568, "epoch": 3894} {"train_loss": -6.981015205383301, "global_step": 163569, "epoch": 3894} {"train_loss": -6.9135236740112305, "global_step": 163570, "epoch": 3894} {"train_loss": -7.045231342315674, "global_step": 163571, "epoch": 3894} {"train_loss": -7.012988090515137, "global_step": 163572, "epoch": 3894} {"train_loss": -7.027901649475098, "global_step": 163573, "epoch": 3894} {"train_loss": -6.9445013999938965, "global_step": 163574, "epoch": 3894} {"train_loss": -7.153131484985352, "global_step": 163575, "epoch": 3894} {"train_loss": -6.942717552185059, "global_step": 163576, "epoch": 3894} {"train_loss": -6.893187522888184, "global_step": 163577, "epoch": 3894} {"train_loss": -7.06894588470459, "global_step": 163578, "epoch": 3894} {"train_loss": -6.974976539611816, "global_step": 163579, "epoch": 3894} {"train_loss": -6.866696357727051, "global_step": 163580, "epoch": 3894} {"train_loss": -6.974416255950928, "global_step": 163581, "epoch": 3894} {"train_loss": -6.9750261306762695, "global_step": 163582, "epoch": 3894} {"train_loss": -6.952032089233398, "global_step": 163583, "epoch": 3894} {"train_loss": -6.947701454162598, "global_step": 163584, "epoch": 3894} {"train_loss": -6.970585823059082, "global_step": 163585, "epoch": 3894} {"train_loss": -6.879815578460693, "global_step": 163586, "epoch": 3894} {"train_loss": -6.833006858825684, "global_step": 163587, "epoch": 3894} {"train_loss": -6.780282974243164, "global_step": 163588, "epoch": 3894} {"train_loss": -6.96572969073341, "global_step": 163589, "epoch": 3894, "val_loss": 68767.9609375} {"train_loss": -6.89223051071167, "global_step": 163590, "epoch": 3895} {"train_loss": -6.846714973449707, "global_step": 163591, "epoch": 3895} {"train_loss": -6.875600814819336, "global_step": 163592, "epoch": 3895} {"train_loss": -6.9476518630981445, "global_step": 163593, "epoch": 3895} {"train_loss": -6.888101577758789, "global_step": 163594, "epoch": 3895} {"train_loss": -6.90635347366333, "global_step": 163595, "epoch": 3895} {"train_loss": -6.936577320098877, "global_step": 163596, "epoch": 3895} {"train_loss": -6.938851356506348, "global_step": 163597, "epoch": 3895} {"train_loss": -6.928225517272949, "global_step": 163598, "epoch": 3895} {"train_loss": -6.963129997253418, "global_step": 163599, "epoch": 3895} {"train_loss": -6.9407758712768555, "global_step": 163600, "epoch": 3895} {"train_loss": -7.051881790161133, "global_step": 163601, "epoch": 3895} {"train_loss": -6.923399925231934, "global_step": 163602, "epoch": 3895} {"train_loss": -7.057156562805176, "global_step": 163603, "epoch": 3895} {"train_loss": -7.064637660980225, "global_step": 163604, "epoch": 3895} {"train_loss": -7.010034084320068, "global_step": 163605, "epoch": 3895} {"train_loss": -6.959961891174316, "global_step": 163606, "epoch": 3895} {"train_loss": -7.006897926330566, "global_step": 163607, "epoch": 3895} {"train_loss": -7.13084602355957, "global_step": 163608, "epoch": 3895} {"train_loss": -6.967977523803711, "global_step": 163609, "epoch": 3895} {"train_loss": -6.994429111480713, "global_step": 163610, "epoch": 3895} {"train_loss": -7.087540149688721, "global_step": 163611, "epoch": 3895} {"train_loss": -6.9368977546691895, "global_step": 163612, "epoch": 3895} {"train_loss": -6.992195129394531, "global_step": 163613, "epoch": 3895} {"train_loss": -6.923466205596924, "global_step": 163614, "epoch": 3895} {"train_loss": -6.899685859680176, "global_step": 163615, "epoch": 3895} {"train_loss": -6.947404861450195, "global_step": 163616, "epoch": 3895} {"train_loss": -6.966132164001465, "global_step": 163617, "epoch": 3895} {"train_loss": -7.010504722595215, "global_step": 163618, "epoch": 3895} {"train_loss": -7.042483329772949, "global_step": 163619, "epoch": 3895} {"train_loss": -6.979304313659668, "global_step": 163620, "epoch": 3895} {"train_loss": -6.9815168380737305, "global_step": 163621, "epoch": 3895} {"train_loss": -7.061457633972168, "global_step": 163622, "epoch": 3895} {"train_loss": -6.93208122253418, "global_step": 163623, "epoch": 3895} {"train_loss": -7.007146835327148, "global_step": 163624, "epoch": 3895} {"train_loss": -7.083277702331543, "global_step": 163625, "epoch": 3895} {"train_loss": -7.00473690032959, "global_step": 163626, "epoch": 3895} {"train_loss": -7.074436187744141, "global_step": 163627, "epoch": 3895} {"train_loss": -7.1033453941345215, "global_step": 163628, "epoch": 3895} {"train_loss": -6.960786819458008, "global_step": 163629, "epoch": 3895} {"train_loss": -6.999936103820801, "global_step": 163630, "epoch": 3895} {"train_loss": -6.979940437135243, "global_step": 163631, "epoch": 3895, "val_loss": 68611.859375} {"train_loss": -6.987363815307617, "global_step": 163632, "epoch": 3896} {"train_loss": -7.041037559509277, "global_step": 163633, "epoch": 3896} {"train_loss": -6.964542388916016, "global_step": 163634, "epoch": 3896} {"train_loss": -6.943530082702637, "global_step": 163635, "epoch": 3896} {"train_loss": -6.9801154136657715, "global_step": 163636, "epoch": 3896} {"train_loss": -7.074378967285156, "global_step": 163637, "epoch": 3896} {"train_loss": -6.9990386962890625, "global_step": 163638, "epoch": 3896} {"train_loss": -7.032045841217041, "global_step": 163639, "epoch": 3896} {"train_loss": -7.006114482879639, "global_step": 163640, "epoch": 3896} {"train_loss": -6.970221042633057, "global_step": 163641, "epoch": 3896} {"train_loss": -6.967443943023682, "global_step": 163642, "epoch": 3896} {"train_loss": -6.91909646987915, "global_step": 163643, "epoch": 3896} {"train_loss": -6.942320823669434, "global_step": 163644, "epoch": 3896} {"train_loss": -6.996047019958496, "global_step": 163645, "epoch": 3896} {"train_loss": -7.100711822509766, "global_step": 163646, "epoch": 3896} {"train_loss": -6.963151454925537, "global_step": 163647, "epoch": 3896} {"train_loss": -7.001499176025391, "global_step": 163648, "epoch": 3896} {"train_loss": -6.989730358123779, "global_step": 163649, "epoch": 3896} {"train_loss": -6.94521427154541, "global_step": 163650, "epoch": 3896} {"train_loss": -6.972224235534668, "global_step": 163651, "epoch": 3896} {"train_loss": -7.006474018096924, "global_step": 163652, "epoch": 3896} {"train_loss": -6.861830234527588, "global_step": 163653, "epoch": 3896} {"train_loss": -6.898870944976807, "global_step": 163654, "epoch": 3896} {"train_loss": -7.061093807220459, "global_step": 163655, "epoch": 3896} {"train_loss": -6.958172798156738, "global_step": 163656, "epoch": 3896} {"train_loss": -6.9936933517456055, "global_step": 163657, "epoch": 3896} {"train_loss": -6.984013557434082, "global_step": 163658, "epoch": 3896} {"train_loss": -6.960653305053711, "global_step": 163659, "epoch": 3896} {"train_loss": -6.945898056030273, "global_step": 163660, "epoch": 3896} {"train_loss": -7.006191730499268, "global_step": 163661, "epoch": 3896} {"train_loss": -7.00613260269165, "global_step": 163662, "epoch": 3896} {"train_loss": -7.035239219665527, "global_step": 163663, "epoch": 3896} {"train_loss": -6.984210014343262, "global_step": 163664, "epoch": 3896} {"train_loss": -6.987546920776367, "global_step": 163665, "epoch": 3896} {"train_loss": -7.060148239135742, "global_step": 163666, "epoch": 3896} {"train_loss": -6.922377109527588, "global_step": 163667, "epoch": 3896} {"train_loss": -7.049546241760254, "global_step": 163668, "epoch": 3896} {"train_loss": -7.019046783447266, "global_step": 163669, "epoch": 3896} {"train_loss": -6.988718509674072, "global_step": 163670, "epoch": 3896} {"train_loss": -6.96433162689209, "global_step": 163671, "epoch": 3896} {"train_loss": -6.974331855773926, "global_step": 163672, "epoch": 3896} {"train_loss": -6.988393976574852, "global_step": 163673, "epoch": 3896, "val_loss": 68618.09375} {"train_loss": -7.039999485015869, "global_step": 163674, "epoch": 3897} {"train_loss": -7.03434944152832, "global_step": 163675, "epoch": 3897} {"train_loss": -7.043286323547363, "global_step": 163676, "epoch": 3897} {"train_loss": -7.030121803283691, "global_step": 163677, "epoch": 3897} {"train_loss": -6.989362716674805, "global_step": 163678, "epoch": 3897} {"train_loss": -6.996277332305908, "global_step": 163679, "epoch": 3897} {"train_loss": -7.026226043701172, "global_step": 163680, "epoch": 3897} {"train_loss": -7.0655975341796875, "global_step": 163681, "epoch": 3897} {"train_loss": -7.02901554107666, "global_step": 163682, "epoch": 3897} {"train_loss": -6.96864128112793, "global_step": 163683, "epoch": 3897} {"train_loss": -7.088457107543945, "global_step": 163684, "epoch": 3897} {"train_loss": -7.065496444702148, "global_step": 163685, "epoch": 3897} {"train_loss": -7.06193208694458, "global_step": 163686, "epoch": 3897} {"train_loss": -7.002372741699219, "global_step": 163687, "epoch": 3897} {"train_loss": -6.905572891235352, "global_step": 163688, "epoch": 3897} {"train_loss": -7.049093723297119, "global_step": 163689, "epoch": 3897} {"train_loss": -6.910009384155273, "global_step": 163690, "epoch": 3897} {"train_loss": -6.861140727996826, "global_step": 163691, "epoch": 3897} {"train_loss": -7.0104594230651855, "global_step": 163692, "epoch": 3897} {"train_loss": -7.045469284057617, "global_step": 163693, "epoch": 3897} {"train_loss": -7.010538578033447, "global_step": 163694, "epoch": 3897} {"train_loss": -7.187955379486084, "global_step": 163695, "epoch": 3897} {"train_loss": -6.948563575744629, "global_step": 163696, "epoch": 3897} {"train_loss": -6.954648494720459, "global_step": 163697, "epoch": 3897} {"train_loss": -6.950473785400391, "global_step": 163698, "epoch": 3897} {"train_loss": -7.030895233154297, "global_step": 163699, "epoch": 3897} {"train_loss": -6.929683685302734, "global_step": 163700, "epoch": 3897} {"train_loss": -7.050337314605713, "global_step": 163701, "epoch": 3897} {"train_loss": -6.989749908447266, "global_step": 163702, "epoch": 3897} {"train_loss": -6.966841697692871, "global_step": 163703, "epoch": 3897} {"train_loss": -7.052798271179199, "global_step": 163704, "epoch": 3897} {"train_loss": -7.026744365692139, "global_step": 163705, "epoch": 3897} {"train_loss": -6.968930244445801, "global_step": 163706, "epoch": 3897} {"train_loss": -6.935927391052246, "global_step": 163707, "epoch": 3897} {"train_loss": -7.023344993591309, "global_step": 163708, "epoch": 3897} {"train_loss": -7.0352630615234375, "global_step": 163709, "epoch": 3897} {"train_loss": -6.961939811706543, "global_step": 163710, "epoch": 3897} {"train_loss": -7.018266201019287, "global_step": 163711, "epoch": 3897} {"train_loss": -6.986109256744385, "global_step": 163712, "epoch": 3897} {"train_loss": -6.933713436126709, "global_step": 163713, "epoch": 3897} {"train_loss": -6.956750869750977, "global_step": 163714, "epoch": 3897} {"train_loss": -6.99817555291312, "global_step": 163715, "epoch": 3897, "val_loss": 68763.7578125} {"train_loss": -7.0649919509887695, "global_step": 163716, "epoch": 3898} {"train_loss": -6.987960338592529, "global_step": 163717, "epoch": 3898} {"train_loss": -6.914594650268555, "global_step": 163718, "epoch": 3898} {"train_loss": -6.989716529846191, "global_step": 163719, "epoch": 3898} {"train_loss": -7.004543304443359, "global_step": 163720, "epoch": 3898} {"train_loss": -7.0202860832214355, "global_step": 163721, "epoch": 3898} {"train_loss": -6.938549995422363, "global_step": 163722, "epoch": 3898} {"train_loss": -6.975283145904541, "global_step": 163723, "epoch": 3898} {"train_loss": -7.025893211364746, "global_step": 163724, "epoch": 3898} {"train_loss": -7.030848979949951, "global_step": 163725, "epoch": 3898} {"train_loss": -7.039214134216309, "global_step": 163726, "epoch": 3898} {"train_loss": -7.00764799118042, "global_step": 163727, "epoch": 3898} {"train_loss": -6.959872722625732, "global_step": 163728, "epoch": 3898} {"train_loss": -6.976004600524902, "global_step": 163729, "epoch": 3898} {"train_loss": -6.941203594207764, "global_step": 163730, "epoch": 3898} {"train_loss": -6.85247802734375, "global_step": 163731, "epoch": 3898} {"train_loss": -6.973068714141846, "global_step": 163732, "epoch": 3898} {"train_loss": -7.027677059173584, "global_step": 163733, "epoch": 3898} {"train_loss": -7.04012393951416, "global_step": 163734, "epoch": 3898} {"train_loss": -6.975558280944824, "global_step": 163735, "epoch": 3898} {"train_loss": -6.948565483093262, "global_step": 163736, "epoch": 3898} {"train_loss": -6.985386371612549, "global_step": 163737, "epoch": 3898} {"train_loss": -6.92668342590332, "global_step": 163738, "epoch": 3898} {"train_loss": -6.919023513793945, "global_step": 163739, "epoch": 3898} {"train_loss": -7.037897109985352, "global_step": 163740, "epoch": 3898} {"train_loss": -6.941656589508057, "global_step": 163741, "epoch": 3898} {"train_loss": -7.009143352508545, "global_step": 163742, "epoch": 3898} {"train_loss": -7.120797157287598, "global_step": 163743, "epoch": 3898} {"train_loss": -6.929282188415527, "global_step": 163744, "epoch": 3898} {"train_loss": -7.007858753204346, "global_step": 163745, "epoch": 3898} {"train_loss": -7.015201568603516, "global_step": 163746, "epoch": 3898} {"train_loss": -6.824708461761475, "global_step": 163747, "epoch": 3898} {"train_loss": -7.012176990509033, "global_step": 163748, "epoch": 3898} {"train_loss": -6.9640913009643555, "global_step": 163749, "epoch": 3898} {"train_loss": -6.876748085021973, "global_step": 163750, "epoch": 3898} {"train_loss": -6.926998138427734, "global_step": 163751, "epoch": 3898} {"train_loss": -7.029470443725586, "global_step": 163752, "epoch": 3898} {"train_loss": -6.977766036987305, "global_step": 163753, "epoch": 3898} {"train_loss": -6.92535400390625, "global_step": 163754, "epoch": 3898} {"train_loss": -7.024984836578369, "global_step": 163755, "epoch": 3898} {"train_loss": -6.963160514831543, "global_step": 163756, "epoch": 3898} {"train_loss": -6.9773261092958, "global_step": 163757, "epoch": 3898, "val_loss": 68685.28125} {"train_loss": -7.003159523010254, "global_step": 163758, "epoch": 3899} {"train_loss": -7.053707122802734, "global_step": 163759, "epoch": 3899} {"train_loss": -6.979748249053955, "global_step": 163760, "epoch": 3899} {"train_loss": -7.0175018310546875, "global_step": 163761, "epoch": 3899} {"train_loss": -7.037403106689453, "global_step": 163762, "epoch": 3899} {"train_loss": -6.933987617492676, "global_step": 163763, "epoch": 3899} {"train_loss": -7.047068119049072, "global_step": 163764, "epoch": 3899} {"train_loss": -7.03156042098999, "global_step": 163765, "epoch": 3899} {"train_loss": -6.973030090332031, "global_step": 163766, "epoch": 3899} {"train_loss": -6.966971397399902, "global_step": 163767, "epoch": 3899} {"train_loss": -6.965089797973633, "global_step": 163768, "epoch": 3899} {"train_loss": -6.8622822761535645, "global_step": 163769, "epoch": 3899} {"train_loss": -6.904142379760742, "global_step": 163770, "epoch": 3899} {"train_loss": -7.0335917472839355, "global_step": 163771, "epoch": 3899} {"train_loss": -6.9680585861206055, "global_step": 163772, "epoch": 3899} {"train_loss": -6.821401596069336, "global_step": 163773, "epoch": 3899} {"train_loss": -6.984452247619629, "global_step": 163774, "epoch": 3899} {"train_loss": -6.852258205413818, "global_step": 163775, "epoch": 3899} {"train_loss": -6.917597770690918, "global_step": 163776, "epoch": 3899} {"train_loss": -6.901590347290039, "global_step": 163777, "epoch": 3899} {"train_loss": -6.897242546081543, "global_step": 163778, "epoch": 3899} {"train_loss": -6.971129417419434, "global_step": 163779, "epoch": 3899} {"train_loss": -6.9016313552856445, "global_step": 163780, "epoch": 3899} {"train_loss": -6.897215843200684, "global_step": 163781, "epoch": 3899} {"train_loss": -6.966133117675781, "global_step": 163782, "epoch": 3899} {"train_loss": -6.790286064147949, "global_step": 163783, "epoch": 3899} {"train_loss": -6.887082099914551, "global_step": 163784, "epoch": 3899} {"train_loss": -6.989361763000488, "global_step": 163785, "epoch": 3899} {"train_loss": -7.053378105163574, "global_step": 163786, "epoch": 3899} {"train_loss": -6.838322162628174, "global_step": 163787, "epoch": 3899} {"train_loss": -7.064251899719238, "global_step": 163788, "epoch": 3899} {"train_loss": -7.077269554138184, "global_step": 163789, "epoch": 3899} {"train_loss": -7.0179338455200195, "global_step": 163790, "epoch": 3899} {"train_loss": -7.017688751220703, "global_step": 163791, "epoch": 3899} {"train_loss": -6.8967132568359375, "global_step": 163792, "epoch": 3899} {"train_loss": -6.964920997619629, "global_step": 163793, "epoch": 3899} {"train_loss": -6.894652366638184, "global_step": 163794, "epoch": 3899} {"train_loss": -6.853180885314941, "global_step": 163795, "epoch": 3899} {"train_loss": -6.9694013595581055, "global_step": 163796, "epoch": 3899} {"train_loss": -6.973446846008301, "global_step": 163797, "epoch": 3899} {"train_loss": -6.992387771606445, "global_step": 163798, "epoch": 3899} {"train_loss": -6.957303444544475, "global_step": 163799, "epoch": 3899, "val_loss": 68711.3125} {"train_loss": -6.972636699676514, "global_step": 163800, "epoch": 3900} {"train_loss": -7.020404815673828, "global_step": 163801, "epoch": 3900} {"train_loss": -7.054397106170654, "global_step": 163802, "epoch": 3900} {"train_loss": -7.11531400680542, "global_step": 163803, "epoch": 3900} {"train_loss": -6.903547286987305, "global_step": 163804, "epoch": 3900} {"train_loss": -6.991391181945801, "global_step": 163805, "epoch": 3900} {"train_loss": -7.084652900695801, "global_step": 163806, "epoch": 3900} {"train_loss": -6.894601345062256, "global_step": 163807, "epoch": 3900} {"train_loss": -6.9957170486450195, "global_step": 163808, "epoch": 3900} {"train_loss": -6.971282005310059, "global_step": 163809, "epoch": 3900} {"train_loss": -6.826615333557129, "global_step": 163810, "epoch": 3900} {"train_loss": -6.907384395599365, "global_step": 163811, "epoch": 3900} {"train_loss": -6.960562705993652, "global_step": 163812, "epoch": 3900} {"train_loss": -6.975467681884766, "global_step": 163813, "epoch": 3900} {"train_loss": -6.925261497497559, "global_step": 163814, "epoch": 3900} {"train_loss": -6.884021759033203, "global_step": 163815, "epoch": 3900} {"train_loss": -6.999451637268066, "global_step": 163816, "epoch": 3900} {"train_loss": -6.82513427734375, "global_step": 163817, "epoch": 3900} {"train_loss": -6.89884090423584, "global_step": 163818, "epoch": 3900} {"train_loss": -6.919065952301025, "global_step": 163819, "epoch": 3900} {"train_loss": -6.89963436126709, "global_step": 163820, "epoch": 3900} {"train_loss": -6.957695960998535, "global_step": 163821, "epoch": 3900} {"train_loss": -7.032609939575195, "global_step": 163822, "epoch": 3900} {"train_loss": -7.040196418762207, "global_step": 163823, "epoch": 3900} {"train_loss": -7.055295944213867, "global_step": 163824, "epoch": 3900} {"train_loss": -6.839773178100586, "global_step": 163825, "epoch": 3900} {"train_loss": -7.023554801940918, "global_step": 163826, "epoch": 3900} {"train_loss": -7.039936542510986, "global_step": 163827, "epoch": 3900} {"train_loss": -6.8909502029418945, "global_step": 163828, "epoch": 3900} {"train_loss": -7.005853176116943, "global_step": 163829, "epoch": 3900} {"train_loss": -6.977529048919678, "global_step": 163830, "epoch": 3900} {"train_loss": -6.942412853240967, "global_step": 163831, "epoch": 3900} {"train_loss": -7.169783592224121, "global_step": 163832, "epoch": 3900} {"train_loss": -6.932554721832275, "global_step": 163833, "epoch": 3900} {"train_loss": -6.939493179321289, "global_step": 163834, "epoch": 3900} {"train_loss": -7.028292655944824, "global_step": 163835, "epoch": 3900} {"train_loss": -6.982627868652344, "global_step": 163836, "epoch": 3900} {"train_loss": -6.8979291915893555, "global_step": 163837, "epoch": 3900} {"train_loss": -6.9916181564331055, "global_step": 163838, "epoch": 3900} {"train_loss": -7.023118495941162, "global_step": 163839, "epoch": 3900} {"train_loss": -6.962925910949707, "global_step": 163840, "epoch": 3900} {"train_loss": -6.973430134001232, "global_step": 163841, "epoch": 3900, "train/sim_max_reward_0": 0.19641217551262144, "train/sim_max_reward_1": 0.9806073047834573, "train/sim_max_reward_2": 0.9953475811172756, "train/sim_max_reward_3": 0.40237279828173533, "train/sim_max_reward_4": 0.9909805957698804, "train/sim_max_reward_5": 0.8833417236064177, "test/sim_max_reward_4300000": 0.9039169386989886, "test/sim_max_reward_4300001": 0.5463669900866862, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.8814816905474673, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9966789119536521, "test/sim_max_reward_4300008": 0.9375127321077235, "test/sim_max_reward_4300009": 0.9569129290570749, "test/sim_max_reward_4300010": 0.7266099740027714, "test/sim_max_reward_4300011": 0.9919185294736025, "test/sim_max_reward_4300012": 0.8435783868399892, "test/sim_max_reward_4300013": 0.933156793344149, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.936830271326915, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.3982300485193239, "test/sim_max_reward_4300018": 0.3981028468342981, "test/sim_max_reward_4300019": 0.18348629038279646, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8774141312636737, "test/sim_max_reward_4300022": 0.8611674661441943, "test/sim_max_reward_4300023": 0.7151767552209906, "test/sim_max_reward_4300024": 0.8128632683672912, "test/sim_max_reward_4300025": 0.8566894158545887, "test/sim_max_reward_4300026": 0.050878423390650566, "test/sim_max_reward_4300027": 0.83114730623947, "test/sim_max_reward_4300028": 0.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.10466815628357377, "test/sim_max_reward_4300031": 0.20919249314771218, "test/sim_max_reward_4300032": 0.901375596118841, "test/sim_max_reward_4300033": 1.0, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.940237903169971, "test/sim_max_reward_4300036": 0.22458930519062129, "test/sim_max_reward_4300037": 0.8648011052462194, "test/sim_max_reward_4300038": 0.9892505049504486, "test/sim_max_reward_4300039": 0.7726873256484437, "test/sim_max_reward_4300040": 1.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.4524250436589697, "test/sim_max_reward_4300043": 0.01912165197990456, "test/sim_max_reward_4300044": 0.9794074586125089, "test/sim_max_reward_4300045": 0.8857979605105382, "test/sim_max_reward_4300046": 0.15336814872229648, "test/sim_max_reward_4300047": 0.16633330796389675, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.26039154332330244, "train/mean_score": 0.7415103631785646, "test/mean_score": 0.5715920341798566, "val_loss": 68687.234375} {"train_loss": -6.949812889099121, "global_step": 163842, "epoch": 3901} {"train_loss": -7.142640590667725, "global_step": 163843, "epoch": 3901} {"train_loss": -7.083460330963135, "global_step": 163844, "epoch": 3901} {"train_loss": -7.084482192993164, "global_step": 163845, "epoch": 3901} {"train_loss": -6.988334655761719, "global_step": 163846, "epoch": 3901} {"train_loss": -6.983170032501221, "global_step": 163847, "epoch": 3901} {"train_loss": -7.104190349578857, "global_step": 163848, "epoch": 3901} {"train_loss": -7.008444786071777, "global_step": 163849, "epoch": 3901} {"train_loss": -6.938769340515137, "global_step": 163850, "epoch": 3901} {"train_loss": -7.0267333984375, "global_step": 163851, "epoch": 3901} {"train_loss": -6.958647727966309, "global_step": 163852, "epoch": 3901} {"train_loss": -7.034902095794678, "global_step": 163853, "epoch": 3901} {"train_loss": -7.090259075164795, "global_step": 163854, "epoch": 3901} {"train_loss": -7.06881856918335, "global_step": 163855, "epoch": 3901} {"train_loss": -7.012964725494385, "global_step": 163856, "epoch": 3901} {"train_loss": -7.011239528656006, "global_step": 163857, "epoch": 3901} {"train_loss": -7.035530090332031, "global_step": 163858, "epoch": 3901} {"train_loss": -7.123451232910156, "global_step": 163859, "epoch": 3901} {"train_loss": -7.0756611824035645, "global_step": 163860, "epoch": 3901} {"train_loss": -7.0657196044921875, "global_step": 163861, "epoch": 3901} {"train_loss": -6.968572616577148, "global_step": 163862, "epoch": 3901} {"train_loss": -7.017939567565918, "global_step": 163863, "epoch": 3901} {"train_loss": -6.926799774169922, "global_step": 163864, "epoch": 3901} {"train_loss": -6.996286392211914, "global_step": 163865, "epoch": 3901} {"train_loss": -7.085726737976074, "global_step": 163866, "epoch": 3901} {"train_loss": -7.084283828735352, "global_step": 163867, "epoch": 3901} {"train_loss": -7.018568992614746, "global_step": 163868, "epoch": 3901} {"train_loss": -7.010012626647949, "global_step": 163869, "epoch": 3901} {"train_loss": -7.004161834716797, "global_step": 163870, "epoch": 3901} {"train_loss": -7.081494331359863, "global_step": 163871, "epoch": 3901} {"train_loss": -6.951260566711426, "global_step": 163872, "epoch": 3901} {"train_loss": -7.009059906005859, "global_step": 163873, "epoch": 3901} {"train_loss": -6.950631618499756, "global_step": 163874, "epoch": 3901} {"train_loss": -7.100975036621094, "global_step": 163875, "epoch": 3901} {"train_loss": -7.005542278289795, "global_step": 163876, "epoch": 3901} {"train_loss": -7.009173393249512, "global_step": 163877, "epoch": 3901} {"train_loss": -7.044230937957764, "global_step": 163878, "epoch": 3901} {"train_loss": -7.074334144592285, "global_step": 163879, "epoch": 3901} {"train_loss": -6.99415922164917, "global_step": 163880, "epoch": 3901} {"train_loss": -6.843084335327148, "global_step": 163881, "epoch": 3901} {"train_loss": -6.950227737426758, "global_step": 163882, "epoch": 3901} {"train_loss": -7.021237555004301, "global_step": 163883, "epoch": 3901, "val_loss": 68843.5078125} {"train_loss": -6.835312843322754, "global_step": 163884, "epoch": 3902} {"train_loss": -6.702913761138916, "global_step": 163885, "epoch": 3902} {"train_loss": -6.95670747756958, "global_step": 163886, "epoch": 3902} {"train_loss": -6.887829303741455, "global_step": 163887, "epoch": 3902} {"train_loss": -6.616971969604492, "global_step": 163888, "epoch": 3902} {"train_loss": -7.140236854553223, "global_step": 163889, "epoch": 3902} {"train_loss": -6.873830318450928, "global_step": 163890, "epoch": 3902} {"train_loss": -6.857542037963867, "global_step": 163891, "epoch": 3902} {"train_loss": -6.901432037353516, "global_step": 163892, "epoch": 3902} {"train_loss": -6.992190361022949, "global_step": 163893, "epoch": 3902} {"train_loss": -6.8293352127075195, "global_step": 163894, "epoch": 3902} {"train_loss": -6.8616156578063965, "global_step": 163895, "epoch": 3902} {"train_loss": -6.871907711029053, "global_step": 163896, "epoch": 3902} {"train_loss": -6.686851501464844, "global_step": 163897, "epoch": 3902} {"train_loss": -6.95173454284668, "global_step": 163898, "epoch": 3902} {"train_loss": -6.695333957672119, "global_step": 163899, "epoch": 3902} {"train_loss": -6.876169681549072, "global_step": 163900, "epoch": 3902} {"train_loss": -6.826647758483887, "global_step": 163901, "epoch": 3902} {"train_loss": -6.942600250244141, "global_step": 163902, "epoch": 3902} {"train_loss": -6.877910614013672, "global_step": 163903, "epoch": 3902} {"train_loss": -6.895016670227051, "global_step": 163904, "epoch": 3902} {"train_loss": -6.9421772956848145, "global_step": 163905, "epoch": 3902} {"train_loss": -6.912648677825928, "global_step": 163906, "epoch": 3902} {"train_loss": -7.03080415725708, "global_step": 163907, "epoch": 3902} {"train_loss": -7.048189640045166, "global_step": 163908, "epoch": 3902} {"train_loss": -6.864174842834473, "global_step": 163909, "epoch": 3902} {"train_loss": -7.012509346008301, "global_step": 163910, "epoch": 3902} {"train_loss": -6.9120049476623535, "global_step": 163911, "epoch": 3902} {"train_loss": -6.897658348083496, "global_step": 163912, "epoch": 3902} {"train_loss": -6.918276786804199, "global_step": 163913, "epoch": 3902} {"train_loss": -6.884255409240723, "global_step": 163914, "epoch": 3902} {"train_loss": -6.898540019989014, "global_step": 163915, "epoch": 3902} {"train_loss": -6.837126731872559, "global_step": 163916, "epoch": 3902} {"train_loss": -6.853619575500488, "global_step": 163917, "epoch": 3902} {"train_loss": -7.01298713684082, "global_step": 163918, "epoch": 3902} {"train_loss": -6.981950759887695, "global_step": 163919, "epoch": 3902} {"train_loss": -6.90059757232666, "global_step": 163920, "epoch": 3902} {"train_loss": -6.998445510864258, "global_step": 163921, "epoch": 3902} {"train_loss": -7.018462181091309, "global_step": 163922, "epoch": 3902} {"train_loss": -6.957782745361328, "global_step": 163923, "epoch": 3902} {"train_loss": -7.011836528778076, "global_step": 163924, "epoch": 3902} {"train_loss": -6.9024962811242965, "global_step": 163925, "epoch": 3902, "val_loss": 68685.0703125} {"train_loss": -6.99501895904541, "global_step": 163926, "epoch": 3903} {"train_loss": -6.971319198608398, "global_step": 163927, "epoch": 3903} {"train_loss": -6.943489074707031, "global_step": 163928, "epoch": 3903} {"train_loss": -7.04833984375, "global_step": 163929, "epoch": 3903} {"train_loss": -6.9445881843566895, "global_step": 163930, "epoch": 3903} {"train_loss": -6.937880992889404, "global_step": 163931, "epoch": 3903} {"train_loss": -7.088462829589844, "global_step": 163932, "epoch": 3903} {"train_loss": -7.005254745483398, "global_step": 163933, "epoch": 3903} {"train_loss": -6.931437015533447, "global_step": 163934, "epoch": 3903} {"train_loss": -7.047458648681641, "global_step": 163935, "epoch": 3903} {"train_loss": -6.968331336975098, "global_step": 163936, "epoch": 3903} {"train_loss": -7.074892997741699, "global_step": 163937, "epoch": 3903} {"train_loss": -7.0240373611450195, "global_step": 163938, "epoch": 3903} {"train_loss": -6.8601861000061035, "global_step": 163939, "epoch": 3903} {"train_loss": -7.047137260437012, "global_step": 163940, "epoch": 3903} {"train_loss": -6.951871395111084, "global_step": 163941, "epoch": 3903} {"train_loss": -7.09002685546875, "global_step": 163942, "epoch": 3903} {"train_loss": -7.025627136230469, "global_step": 163943, "epoch": 3903} {"train_loss": -7.0321946144104, "global_step": 163944, "epoch": 3903} {"train_loss": -6.990971088409424, "global_step": 163945, "epoch": 3903} {"train_loss": -6.978510856628418, "global_step": 163946, "epoch": 3903} {"train_loss": -6.941076755523682, "global_step": 163947, "epoch": 3903} {"train_loss": -6.995989799499512, "global_step": 163948, "epoch": 3903} {"train_loss": -6.93778133392334, "global_step": 163949, "epoch": 3903} {"train_loss": -7.100689888000488, "global_step": 163950, "epoch": 3903} {"train_loss": -7.029294967651367, "global_step": 163951, "epoch": 3903} {"train_loss": -6.967631816864014, "global_step": 163952, "epoch": 3903} {"train_loss": -6.921996116638184, "global_step": 163953, "epoch": 3903} {"train_loss": -7.009180068969727, "global_step": 163954, "epoch": 3903} {"train_loss": -7.016826152801514, "global_step": 163955, "epoch": 3903} {"train_loss": -6.997452259063721, "global_step": 163956, "epoch": 3903} {"train_loss": -7.008010387420654, "global_step": 163957, "epoch": 3903} {"train_loss": -7.006227970123291, "global_step": 163958, "epoch": 3903} {"train_loss": -6.984407901763916, "global_step": 163959, "epoch": 3903} {"train_loss": -7.031488418579102, "global_step": 163960, "epoch": 3903} {"train_loss": -6.9926629066467285, "global_step": 163961, "epoch": 3903} {"train_loss": -6.908016681671143, "global_step": 163962, "epoch": 3903} {"train_loss": -7.03786039352417, "global_step": 163963, "epoch": 3903} {"train_loss": -6.93472957611084, "global_step": 163964, "epoch": 3903} {"train_loss": -7.041220664978027, "global_step": 163965, "epoch": 3903} {"train_loss": -7.035992622375488, "global_step": 163966, "epoch": 3903} {"train_loss": -6.996249403272357, "global_step": 163967, "epoch": 3903, "val_loss": 68767.125} {"train_loss": -7.019556999206543, "global_step": 163968, "epoch": 3904} {"train_loss": -7.05363655090332, "global_step": 163969, "epoch": 3904} {"train_loss": -6.988778114318848, "global_step": 163970, "epoch": 3904} {"train_loss": -7.167287826538086, "global_step": 163971, "epoch": 3904} {"train_loss": -7.102641582489014, "global_step": 163972, "epoch": 3904} {"train_loss": -7.103991985321045, "global_step": 163973, "epoch": 3904} {"train_loss": -7.064558029174805, "global_step": 163974, "epoch": 3904} {"train_loss": -7.056907653808594, "global_step": 163975, "epoch": 3904} {"train_loss": -7.026773452758789, "global_step": 163976, "epoch": 3904} {"train_loss": -7.0230865478515625, "global_step": 163977, "epoch": 3904} {"train_loss": -6.996664047241211, "global_step": 163978, "epoch": 3904} {"train_loss": -6.946193695068359, "global_step": 163979, "epoch": 3904} {"train_loss": -6.940154552459717, "global_step": 163980, "epoch": 3904} {"train_loss": -7.019103050231934, "global_step": 163981, "epoch": 3904} {"train_loss": -7.11735200881958, "global_step": 163982, "epoch": 3904} {"train_loss": -7.018779754638672, "global_step": 163983, "epoch": 3904} {"train_loss": -6.947839736938477, "global_step": 163984, "epoch": 3904} {"train_loss": -6.9926228523254395, "global_step": 163985, "epoch": 3904} {"train_loss": -7.022304534912109, "global_step": 163986, "epoch": 3904} {"train_loss": -6.974398136138916, "global_step": 163987, "epoch": 3904} {"train_loss": -7.066844940185547, "global_step": 163988, "epoch": 3904} {"train_loss": -7.020041465759277, "global_step": 163989, "epoch": 3904} {"train_loss": -7.076848030090332, "global_step": 163990, "epoch": 3904} {"train_loss": -6.928974151611328, "global_step": 163991, "epoch": 3904} {"train_loss": -7.057178497314453, "global_step": 163992, "epoch": 3904} {"train_loss": -7.145488739013672, "global_step": 163993, "epoch": 3904} {"train_loss": -6.980752944946289, "global_step": 163994, "epoch": 3904} {"train_loss": -7.034570693969727, "global_step": 163995, "epoch": 3904} {"train_loss": -7.052823066711426, "global_step": 163996, "epoch": 3904} {"train_loss": -7.045133113861084, "global_step": 163997, "epoch": 3904} {"train_loss": -6.94708251953125, "global_step": 163998, "epoch": 3904} {"train_loss": -7.0104780197143555, "global_step": 163999, "epoch": 3904} {"train_loss": -6.938488960266113, "global_step": 164000, "epoch": 3904} {"train_loss": -6.953746795654297, "global_step": 164001, "epoch": 3904} {"train_loss": -6.993369102478027, "global_step": 164002, "epoch": 3904} {"train_loss": -7.018884181976318, "global_step": 164003, "epoch": 3904} {"train_loss": -7.0405497550964355, "global_step": 164004, "epoch": 3904} {"train_loss": -7.146236419677734, "global_step": 164005, "epoch": 3904} {"train_loss": -7.0299530029296875, "global_step": 164006, "epoch": 3904} {"train_loss": -6.981925010681152, "global_step": 164007, "epoch": 3904} {"train_loss": -6.9903950691223145, "global_step": 164008, "epoch": 3904} {"train_loss": -7.0237915970030285, "global_step": 164009, "epoch": 3904, "val_loss": 68774.71875} {"train_loss": -6.9631500244140625, "global_step": 164010, "epoch": 3905} {"train_loss": -7.011575222015381, "global_step": 164011, "epoch": 3905} {"train_loss": -7.037929534912109, "global_step": 164012, "epoch": 3905} {"train_loss": -7.08870792388916, "global_step": 164013, "epoch": 3905} {"train_loss": -7.001188278198242, "global_step": 164014, "epoch": 3905} {"train_loss": -7.0437140464782715, "global_step": 164015, "epoch": 3905} {"train_loss": -6.920574188232422, "global_step": 164016, "epoch": 3905} {"train_loss": -6.95816707611084, "global_step": 164017, "epoch": 3905} {"train_loss": -7.140007019042969, "global_step": 164018, "epoch": 3905} {"train_loss": -7.024302005767822, "global_step": 164019, "epoch": 3905} {"train_loss": -7.103370189666748, "global_step": 164020, "epoch": 3905} {"train_loss": -6.951512813568115, "global_step": 164021, "epoch": 3905} {"train_loss": -6.953211784362793, "global_step": 164022, "epoch": 3905} {"train_loss": -6.9671950340271, "global_step": 164023, "epoch": 3905} {"train_loss": -7.0696282386779785, "global_step": 164024, "epoch": 3905} {"train_loss": -7.070107936859131, "global_step": 164025, "epoch": 3905} {"train_loss": -7.014767169952393, "global_step": 164026, "epoch": 3905} {"train_loss": -7.113253593444824, "global_step": 164027, "epoch": 3905} {"train_loss": -6.938114643096924, "global_step": 164028, "epoch": 3905} {"train_loss": -6.8347883224487305, "global_step": 164029, "epoch": 3905} {"train_loss": -7.051843643188477, "global_step": 164030, "epoch": 3905} {"train_loss": -6.959699630737305, "global_step": 164031, "epoch": 3905} {"train_loss": -6.831456184387207, "global_step": 164032, "epoch": 3905} {"train_loss": -6.909358501434326, "global_step": 164033, "epoch": 3905} {"train_loss": -6.910701751708984, "global_step": 164034, "epoch": 3905} {"train_loss": -6.962533950805664, "global_step": 164035, "epoch": 3905} {"train_loss": -6.875619411468506, "global_step": 164036, "epoch": 3905} {"train_loss": -6.922544479370117, "global_step": 164037, "epoch": 3905} {"train_loss": -6.966941833496094, "global_step": 164038, "epoch": 3905} {"train_loss": -6.968267440795898, "global_step": 164039, "epoch": 3905} {"train_loss": -6.943406105041504, "global_step": 164040, "epoch": 3905} {"train_loss": -6.90372371673584, "global_step": 164041, "epoch": 3905} {"train_loss": -7.069593906402588, "global_step": 164042, "epoch": 3905} {"train_loss": -7.025292873382568, "global_step": 164043, "epoch": 3905} {"train_loss": -7.091176509857178, "global_step": 164044, "epoch": 3905} {"train_loss": -6.98542594909668, "global_step": 164045, "epoch": 3905} {"train_loss": -6.902924537658691, "global_step": 164046, "epoch": 3905} {"train_loss": -6.972680568695068, "global_step": 164047, "epoch": 3905} {"train_loss": -7.019473075866699, "global_step": 164048, "epoch": 3905} {"train_loss": -6.916881561279297, "global_step": 164049, "epoch": 3905} {"train_loss": -7.073426723480225, "global_step": 164050, "epoch": 3905} {"train_loss": -6.985654808226085, "global_step": 164051, "epoch": 3905, "val_loss": 68954.1640625} {"train_loss": -7.057525157928467, "global_step": 164052, "epoch": 3906} {"train_loss": -7.00369930267334, "global_step": 164053, "epoch": 3906} {"train_loss": -6.9708147048950195, "global_step": 164054, "epoch": 3906} {"train_loss": -6.988425254821777, "global_step": 164055, "epoch": 3906} {"train_loss": -6.961307525634766, "global_step": 164056, "epoch": 3906} {"train_loss": -6.982787609100342, "global_step": 164057, "epoch": 3906} {"train_loss": -6.868898868560791, "global_step": 164058, "epoch": 3906} {"train_loss": -6.900225639343262, "global_step": 164059, "epoch": 3906} {"train_loss": -6.8230791091918945, "global_step": 164060, "epoch": 3906} {"train_loss": -6.975227355957031, "global_step": 164061, "epoch": 3906} {"train_loss": -6.762170791625977, "global_step": 164062, "epoch": 3906} {"train_loss": -7.080109596252441, "global_step": 164063, "epoch": 3906} {"train_loss": -6.940917491912842, "global_step": 164064, "epoch": 3906} {"train_loss": -6.813800811767578, "global_step": 164065, "epoch": 3906} {"train_loss": -6.893592357635498, "global_step": 164066, "epoch": 3906} {"train_loss": -6.844301223754883, "global_step": 164067, "epoch": 3906} {"train_loss": -6.916134834289551, "global_step": 164068, "epoch": 3906} {"train_loss": -6.787020206451416, "global_step": 164069, "epoch": 3906} {"train_loss": -6.947272777557373, "global_step": 164070, "epoch": 3906} {"train_loss": -7.069449424743652, "global_step": 164071, "epoch": 3906} {"train_loss": -7.04512357711792, "global_step": 164072, "epoch": 3906} {"train_loss": -6.920748233795166, "global_step": 164073, "epoch": 3906} {"train_loss": -6.980131149291992, "global_step": 164074, "epoch": 3906} {"train_loss": -6.890895366668701, "global_step": 164075, "epoch": 3906} {"train_loss": -6.939833641052246, "global_step": 164076, "epoch": 3906} {"train_loss": -6.934106826782227, "global_step": 164077, "epoch": 3906} {"train_loss": -7.042386531829834, "global_step": 164078, "epoch": 3906} {"train_loss": -6.963376045227051, "global_step": 164079, "epoch": 3906} {"train_loss": -7.166529655456543, "global_step": 164080, "epoch": 3906} {"train_loss": -6.88275146484375, "global_step": 164081, "epoch": 3906} {"train_loss": -6.956068515777588, "global_step": 164082, "epoch": 3906} {"train_loss": -6.9743332862854, "global_step": 164083, "epoch": 3906} {"train_loss": -7.040205478668213, "global_step": 164084, "epoch": 3906} {"train_loss": -6.819150447845459, "global_step": 164085, "epoch": 3906} {"train_loss": -6.941096305847168, "global_step": 164086, "epoch": 3906} {"train_loss": -6.970388412475586, "global_step": 164087, "epoch": 3906} {"train_loss": -6.992320537567139, "global_step": 164088, "epoch": 3906} {"train_loss": -6.833601474761963, "global_step": 164089, "epoch": 3906} {"train_loss": -7.034493446350098, "global_step": 164090, "epoch": 3906} {"train_loss": -6.850435733795166, "global_step": 164091, "epoch": 3906} {"train_loss": -6.935391426086426, "global_step": 164092, "epoch": 3906} {"train_loss": -6.943849756604149, "global_step": 164093, "epoch": 3906, "val_loss": 68813.6796875} {"train_loss": -6.9527788162231445, "global_step": 164094, "epoch": 3907} {"train_loss": -6.991050720214844, "global_step": 164095, "epoch": 3907} {"train_loss": -6.913217067718506, "global_step": 164096, "epoch": 3907} {"train_loss": -6.9918413162231445, "global_step": 164097, "epoch": 3907} {"train_loss": -6.890328407287598, "global_step": 164098, "epoch": 3907} {"train_loss": -7.064910411834717, "global_step": 164099, "epoch": 3907} {"train_loss": -7.1003499031066895, "global_step": 164100, "epoch": 3907} {"train_loss": -6.9561309814453125, "global_step": 164101, "epoch": 3907} {"train_loss": -7.03555965423584, "global_step": 164102, "epoch": 3907} {"train_loss": -7.089901924133301, "global_step": 164103, "epoch": 3907} {"train_loss": -6.978506565093994, "global_step": 164104, "epoch": 3907} {"train_loss": -7.001785755157471, "global_step": 164105, "epoch": 3907} {"train_loss": -7.107178688049316, "global_step": 164106, "epoch": 3907} {"train_loss": -6.9787445068359375, "global_step": 164107, "epoch": 3907} {"train_loss": -6.895452499389648, "global_step": 164108, "epoch": 3907} {"train_loss": -6.990698337554932, "global_step": 164109, "epoch": 3907} {"train_loss": -6.9848175048828125, "global_step": 164110, "epoch": 3907} {"train_loss": -6.9835100173950195, "global_step": 164111, "epoch": 3907} {"train_loss": -7.066290378570557, "global_step": 164112, "epoch": 3907} {"train_loss": -6.908562660217285, "global_step": 164113, "epoch": 3907} {"train_loss": -7.038914203643799, "global_step": 164114, "epoch": 3907} {"train_loss": -7.105494976043701, "global_step": 164115, "epoch": 3907} {"train_loss": -7.114568710327148, "global_step": 164116, "epoch": 3907} {"train_loss": -7.05739688873291, "global_step": 164117, "epoch": 3907} {"train_loss": -6.989630222320557, "global_step": 164118, "epoch": 3907} {"train_loss": -7.019981384277344, "global_step": 164119, "epoch": 3907} {"train_loss": -7.005368232727051, "global_step": 164120, "epoch": 3907} {"train_loss": -7.012298583984375, "global_step": 164121, "epoch": 3907} {"train_loss": -7.00685453414917, "global_step": 164122, "epoch": 3907} {"train_loss": -7.072467803955078, "global_step": 164123, "epoch": 3907} {"train_loss": -7.019480228424072, "global_step": 164124, "epoch": 3907} {"train_loss": -7.017442226409912, "global_step": 164125, "epoch": 3907} {"train_loss": -6.88088321685791, "global_step": 164126, "epoch": 3907} {"train_loss": -6.840526103973389, "global_step": 164127, "epoch": 3907} {"train_loss": -7.0000410079956055, "global_step": 164128, "epoch": 3907} {"train_loss": -6.899987697601318, "global_step": 164129, "epoch": 3907} {"train_loss": -6.869604587554932, "global_step": 164130, "epoch": 3907} {"train_loss": -6.949113845825195, "global_step": 164131, "epoch": 3907} {"train_loss": -7.024636268615723, "global_step": 164132, "epoch": 3907} {"train_loss": -6.9218316078186035, "global_step": 164133, "epoch": 3907} {"train_loss": -6.908066749572754, "global_step": 164134, "epoch": 3907} {"train_loss": -6.992662055151803, "global_step": 164135, "epoch": 3907, "val_loss": 68761.9140625} {"train_loss": -6.960395812988281, "global_step": 164136, "epoch": 3908} {"train_loss": -6.961458206176758, "global_step": 164137, "epoch": 3908} {"train_loss": -6.836678504943848, "global_step": 164138, "epoch": 3908} {"train_loss": -7.068145275115967, "global_step": 164139, "epoch": 3908} {"train_loss": -7.028353214263916, "global_step": 164140, "epoch": 3908} {"train_loss": -7.11257266998291, "global_step": 164141, "epoch": 3908} {"train_loss": -7.045426368713379, "global_step": 164142, "epoch": 3908} {"train_loss": -6.983510971069336, "global_step": 164143, "epoch": 3908} {"train_loss": -6.9539289474487305, "global_step": 164144, "epoch": 3908} {"train_loss": -7.090249061584473, "global_step": 164145, "epoch": 3908} {"train_loss": -6.971478462219238, "global_step": 164146, "epoch": 3908} {"train_loss": -6.920342922210693, "global_step": 164147, "epoch": 3908} {"train_loss": -7.011720657348633, "global_step": 164148, "epoch": 3908} {"train_loss": -6.977416038513184, "global_step": 164149, "epoch": 3908} {"train_loss": -6.965611457824707, "global_step": 164150, "epoch": 3908} {"train_loss": -7.029475688934326, "global_step": 164151, "epoch": 3908} {"train_loss": -6.993241786956787, "global_step": 164152, "epoch": 3908} {"train_loss": -6.885538578033447, "global_step": 164153, "epoch": 3908} {"train_loss": -6.927845478057861, "global_step": 164154, "epoch": 3908} {"train_loss": -7.016641616821289, "global_step": 164155, "epoch": 3908} {"train_loss": -7.071380615234375, "global_step": 164156, "epoch": 3908} {"train_loss": -7.060587406158447, "global_step": 164157, "epoch": 3908} {"train_loss": -6.9908270835876465, "global_step": 164158, "epoch": 3908} {"train_loss": -7.056877613067627, "global_step": 164159, "epoch": 3908} {"train_loss": -7.053004264831543, "global_step": 164160, "epoch": 3908} {"train_loss": -7.088205814361572, "global_step": 164161, "epoch": 3908} {"train_loss": -7.023781776428223, "global_step": 164162, "epoch": 3908} {"train_loss": -7.045234203338623, "global_step": 164163, "epoch": 3908} {"train_loss": -6.962984085083008, "global_step": 164164, "epoch": 3908} {"train_loss": -6.985111236572266, "global_step": 164165, "epoch": 3908} {"train_loss": -6.945148468017578, "global_step": 164166, "epoch": 3908} {"train_loss": -7.044961929321289, "global_step": 164167, "epoch": 3908} {"train_loss": -7.0168609619140625, "global_step": 164168, "epoch": 3908} {"train_loss": -6.904526710510254, "global_step": 164169, "epoch": 3908} {"train_loss": -7.060622215270996, "global_step": 164170, "epoch": 3908} {"train_loss": -6.988519191741943, "global_step": 164171, "epoch": 3908} {"train_loss": -6.935809135437012, "global_step": 164172, "epoch": 3908} {"train_loss": -6.939552307128906, "global_step": 164173, "epoch": 3908} {"train_loss": -6.938073635101318, "global_step": 164174, "epoch": 3908} {"train_loss": -6.945172309875488, "global_step": 164175, "epoch": 3908} {"train_loss": -7.079917907714844, "global_step": 164176, "epoch": 3908} {"train_loss": -6.999642690022786, "global_step": 164177, "epoch": 3908, "val_loss": 68877.59375} {"train_loss": -7.098505973815918, "global_step": 164178, "epoch": 3909} {"train_loss": -6.959190368652344, "global_step": 164179, "epoch": 3909} {"train_loss": -6.935942649841309, "global_step": 164180, "epoch": 3909} {"train_loss": -6.8034820556640625, "global_step": 164181, "epoch": 3909} {"train_loss": -6.984455585479736, "global_step": 164182, "epoch": 3909} {"train_loss": -6.979062080383301, "global_step": 164183, "epoch": 3909} {"train_loss": -6.9161057472229, "global_step": 164184, "epoch": 3909} {"train_loss": -6.855586051940918, "global_step": 164185, "epoch": 3909} {"train_loss": -7.002014636993408, "global_step": 164186, "epoch": 3909} {"train_loss": -6.884552001953125, "global_step": 164187, "epoch": 3909} {"train_loss": -6.904706954956055, "global_step": 164188, "epoch": 3909} {"train_loss": -6.874811172485352, "global_step": 164189, "epoch": 3909} {"train_loss": -6.861001014709473, "global_step": 164190, "epoch": 3909} {"train_loss": -7.018870830535889, "global_step": 164191, "epoch": 3909} {"train_loss": -6.809361457824707, "global_step": 164192, "epoch": 3909} {"train_loss": -6.826496601104736, "global_step": 164193, "epoch": 3909} {"train_loss": -6.952898979187012, "global_step": 164194, "epoch": 3909} {"train_loss": -6.859183311462402, "global_step": 164195, "epoch": 3909} {"train_loss": -7.013381004333496, "global_step": 164196, "epoch": 3909} {"train_loss": -6.970432281494141, "global_step": 164197, "epoch": 3909} {"train_loss": -6.9635009765625, "global_step": 164198, "epoch": 3909} {"train_loss": -6.992530345916748, "global_step": 164199, "epoch": 3909} {"train_loss": -6.991100788116455, "global_step": 164200, "epoch": 3909} {"train_loss": -7.027935028076172, "global_step": 164201, "epoch": 3909} {"train_loss": -6.899567604064941, "global_step": 164202, "epoch": 3909} {"train_loss": -6.914239883422852, "global_step": 164203, "epoch": 3909} {"train_loss": -6.756831645965576, "global_step": 164204, "epoch": 3909} {"train_loss": -6.923511028289795, "global_step": 164205, "epoch": 3909} {"train_loss": -6.854612827301025, "global_step": 164206, "epoch": 3909} {"train_loss": -6.947117805480957, "global_step": 164207, "epoch": 3909} {"train_loss": -6.976210117340088, "global_step": 164208, "epoch": 3909} {"train_loss": -6.7481231689453125, "global_step": 164209, "epoch": 3909} {"train_loss": -6.9629011154174805, "global_step": 164210, "epoch": 3909} {"train_loss": -6.8845415115356445, "global_step": 164211, "epoch": 3909} {"train_loss": -6.927467346191406, "global_step": 164212, "epoch": 3909} {"train_loss": -6.99267053604126, "global_step": 164213, "epoch": 3909} {"train_loss": -6.945662498474121, "global_step": 164214, "epoch": 3909} {"train_loss": -6.7718048095703125, "global_step": 164215, "epoch": 3909} {"train_loss": -6.817174434661865, "global_step": 164216, "epoch": 3909} {"train_loss": -6.803287506103516, "global_step": 164217, "epoch": 3909} {"train_loss": -6.732943534851074, "global_step": 164218, "epoch": 3909} {"train_loss": -6.90956829843067, "global_step": 164219, "epoch": 3909, "val_loss": 68659.765625} {"train_loss": -6.79144287109375, "global_step": 164220, "epoch": 3910} {"train_loss": -6.815578460693359, "global_step": 164221, "epoch": 3910} {"train_loss": -6.9707794189453125, "global_step": 164222, "epoch": 3910} {"train_loss": -6.9872541427612305, "global_step": 164223, "epoch": 3910} {"train_loss": -6.788433074951172, "global_step": 164224, "epoch": 3910} {"train_loss": -6.89830207824707, "global_step": 164225, "epoch": 3910} {"train_loss": -6.811389923095703, "global_step": 164226, "epoch": 3910} {"train_loss": -6.937056541442871, "global_step": 164227, "epoch": 3910} {"train_loss": -6.854426860809326, "global_step": 164228, "epoch": 3910} {"train_loss": -6.938610076904297, "global_step": 164229, "epoch": 3910} {"train_loss": -6.867770195007324, "global_step": 164230, "epoch": 3910} {"train_loss": -6.9963698387146, "global_step": 164231, "epoch": 3910} {"train_loss": -6.819104194641113, "global_step": 164232, "epoch": 3910} {"train_loss": -6.838702201843262, "global_step": 164233, "epoch": 3910} {"train_loss": -6.887059211730957, "global_step": 164234, "epoch": 3910} {"train_loss": -6.960258483886719, "global_step": 164235, "epoch": 3910} {"train_loss": -6.878326416015625, "global_step": 164236, "epoch": 3910} {"train_loss": -7.009979248046875, "global_step": 164237, "epoch": 3910} {"train_loss": -6.876547813415527, "global_step": 164238, "epoch": 3910} {"train_loss": -6.801661491394043, "global_step": 164239, "epoch": 3910} {"train_loss": -6.925853729248047, "global_step": 164240, "epoch": 3910} {"train_loss": -6.832339763641357, "global_step": 164241, "epoch": 3910} {"train_loss": -6.822858810424805, "global_step": 164242, "epoch": 3910} {"train_loss": -6.874658584594727, "global_step": 164243, "epoch": 3910} {"train_loss": -6.843563079833984, "global_step": 164244, "epoch": 3910} {"train_loss": -6.848963737487793, "global_step": 164245, "epoch": 3910} {"train_loss": -6.949484825134277, "global_step": 164246, "epoch": 3910} {"train_loss": -6.883465766906738, "global_step": 164247, "epoch": 3910} {"train_loss": -7.011558532714844, "global_step": 164248, "epoch": 3910} {"train_loss": -6.888374328613281, "global_step": 164249, "epoch": 3910} {"train_loss": -6.991706848144531, "global_step": 164250, "epoch": 3910} {"train_loss": -6.9044342041015625, "global_step": 164251, "epoch": 3910} {"train_loss": -6.8552069664001465, "global_step": 164252, "epoch": 3910} {"train_loss": -7.056221961975098, "global_step": 164253, "epoch": 3910} {"train_loss": -6.902411460876465, "global_step": 164254, "epoch": 3910} {"train_loss": -6.770552635192871, "global_step": 164255, "epoch": 3910} {"train_loss": -7.080026149749756, "global_step": 164256, "epoch": 3910} {"train_loss": -6.8620710372924805, "global_step": 164257, "epoch": 3910} {"train_loss": -6.826507568359375, "global_step": 164258, "epoch": 3910} {"train_loss": -6.839896202087402, "global_step": 164259, "epoch": 3910} {"train_loss": -6.88136625289917, "global_step": 164260, "epoch": 3910} {"train_loss": -6.895758492606027, "global_step": 164261, "epoch": 3910, "val_loss": 69042.671875} {"train_loss": -6.789153575897217, "global_step": 164262, "epoch": 3911} {"train_loss": -6.897436141967773, "global_step": 164263, "epoch": 3911} {"train_loss": -6.892394065856934, "global_step": 164264, "epoch": 3911} {"train_loss": -6.983823776245117, "global_step": 164265, "epoch": 3911} {"train_loss": -6.898545742034912, "global_step": 164266, "epoch": 3911} {"train_loss": -6.863958835601807, "global_step": 164267, "epoch": 3911} {"train_loss": -6.927896499633789, "global_step": 164268, "epoch": 3911} {"train_loss": -6.991352081298828, "global_step": 164269, "epoch": 3911} {"train_loss": -6.872661113739014, "global_step": 164270, "epoch": 3911} {"train_loss": -6.929722309112549, "global_step": 164271, "epoch": 3911} {"train_loss": -6.7482829093933105, "global_step": 164272, "epoch": 3911} {"train_loss": -6.818050384521484, "global_step": 164273, "epoch": 3911} {"train_loss": -6.705175399780273, "global_step": 164274, "epoch": 3911} {"train_loss": -6.7198262214660645, "global_step": 164275, "epoch": 3911} {"train_loss": -6.942580223083496, "global_step": 164276, "epoch": 3911} {"train_loss": -6.928559303283691, "global_step": 164277, "epoch": 3911} {"train_loss": -6.9264421463012695, "global_step": 164278, "epoch": 3911} {"train_loss": -6.741199493408203, "global_step": 164279, "epoch": 3911} {"train_loss": -6.89656925201416, "global_step": 164280, "epoch": 3911} {"train_loss": -6.812997817993164, "global_step": 164281, "epoch": 3911} {"train_loss": -6.930262565612793, "global_step": 164282, "epoch": 3911} {"train_loss": -7.029445171356201, "global_step": 164283, "epoch": 3911} {"train_loss": -7.020907402038574, "global_step": 164284, "epoch": 3911} {"train_loss": -6.924136161804199, "global_step": 164285, "epoch": 3911} {"train_loss": -6.999402046203613, "global_step": 164286, "epoch": 3911} {"train_loss": -6.904304504394531, "global_step": 164287, "epoch": 3911} {"train_loss": -6.939607620239258, "global_step": 164288, "epoch": 3911} {"train_loss": -7.034435272216797, "global_step": 164289, "epoch": 3911} {"train_loss": -6.922707557678223, "global_step": 164290, "epoch": 3911} {"train_loss": -7.060372352600098, "global_step": 164291, "epoch": 3911} {"train_loss": -7.069741249084473, "global_step": 164292, "epoch": 3911} {"train_loss": -7.07966947555542, "global_step": 164293, "epoch": 3911} {"train_loss": -7.002033233642578, "global_step": 164294, "epoch": 3911} {"train_loss": -7.007203102111816, "global_step": 164295, "epoch": 3911} {"train_loss": -6.934021949768066, "global_step": 164296, "epoch": 3911} {"train_loss": -7.093957424163818, "global_step": 164297, "epoch": 3911} {"train_loss": -6.9850945472717285, "global_step": 164298, "epoch": 3911} {"train_loss": -7.033529281616211, "global_step": 164299, "epoch": 3911} {"train_loss": -7.074215888977051, "global_step": 164300, "epoch": 3911} {"train_loss": -7.131466865539551, "global_step": 164301, "epoch": 3911} {"train_loss": -7.051530838012695, "global_step": 164302, "epoch": 3911} {"train_loss": -6.943071853546869, "global_step": 164303, "epoch": 3911, "val_loss": 68756.890625} {"train_loss": -7.118093490600586, "global_step": 164304, "epoch": 3912} {"train_loss": -7.120046138763428, "global_step": 164305, "epoch": 3912} {"train_loss": -7.067977428436279, "global_step": 164306, "epoch": 3912} {"train_loss": -7.050414085388184, "global_step": 164307, "epoch": 3912} {"train_loss": -7.014848709106445, "global_step": 164308, "epoch": 3912} {"train_loss": -7.001228332519531, "global_step": 164309, "epoch": 3912} {"train_loss": -7.09637975692749, "global_step": 164310, "epoch": 3912} {"train_loss": -7.130475044250488, "global_step": 164311, "epoch": 3912} {"train_loss": -7.10175895690918, "global_step": 164312, "epoch": 3912} {"train_loss": -7.127617835998535, "global_step": 164313, "epoch": 3912} {"train_loss": -7.129828453063965, "global_step": 164314, "epoch": 3912} {"train_loss": -7.046497344970703, "global_step": 164315, "epoch": 3912} {"train_loss": -6.967164039611816, "global_step": 164316, "epoch": 3912} {"train_loss": -6.996556282043457, "global_step": 164317, "epoch": 3912} {"train_loss": -7.008079528808594, "global_step": 164318, "epoch": 3912} {"train_loss": -6.912336349487305, "global_step": 164319, "epoch": 3912} {"train_loss": -6.971272945404053, "global_step": 164320, "epoch": 3912} {"train_loss": -6.973676681518555, "global_step": 164321, "epoch": 3912} {"train_loss": -6.987536430358887, "global_step": 164322, "epoch": 3912} {"train_loss": -7.132333278656006, "global_step": 164323, "epoch": 3912} {"train_loss": -6.952291488647461, "global_step": 164324, "epoch": 3912} {"train_loss": -6.978004455566406, "global_step": 164325, "epoch": 3912} {"train_loss": -7.063072204589844, "global_step": 164326, "epoch": 3912} {"train_loss": -7.062864303588867, "global_step": 164327, "epoch": 3912} {"train_loss": -7.034256935119629, "global_step": 164328, "epoch": 3912} {"train_loss": -6.984369277954102, "global_step": 164329, "epoch": 3912} {"train_loss": -6.9387102127075195, "global_step": 164330, "epoch": 3912} {"train_loss": -6.876999855041504, "global_step": 164331, "epoch": 3912} {"train_loss": -6.924227237701416, "global_step": 164332, "epoch": 3912} {"train_loss": -6.8888959884643555, "global_step": 164333, "epoch": 3912} {"train_loss": -7.011134624481201, "global_step": 164334, "epoch": 3912} {"train_loss": -7.083977222442627, "global_step": 164335, "epoch": 3912} {"train_loss": -6.915223121643066, "global_step": 164336, "epoch": 3912} {"train_loss": -6.9341912269592285, "global_step": 164337, "epoch": 3912} {"train_loss": -7.0351972579956055, "global_step": 164338, "epoch": 3912} {"train_loss": -6.836112976074219, "global_step": 164339, "epoch": 3912} {"train_loss": -6.89469575881958, "global_step": 164340, "epoch": 3912} {"train_loss": -7.015336036682129, "global_step": 164341, "epoch": 3912} {"train_loss": -6.8197784423828125, "global_step": 164342, "epoch": 3912} {"train_loss": -6.8057403564453125, "global_step": 164343, "epoch": 3912} {"train_loss": -6.9636077880859375, "global_step": 164344, "epoch": 3912} {"train_loss": -6.996382543018886, "global_step": 164345, "epoch": 3912, "val_loss": 68662.3359375} {"train_loss": -7.025754928588867, "global_step": 164346, "epoch": 3913} {"train_loss": -6.903621673583984, "global_step": 164347, "epoch": 3913} {"train_loss": -6.98426628112793, "global_step": 164348, "epoch": 3913} {"train_loss": -7.041250228881836, "global_step": 164349, "epoch": 3913} {"train_loss": -6.89896297454834, "global_step": 164350, "epoch": 3913} {"train_loss": -6.8622965812683105, "global_step": 164351, "epoch": 3913} {"train_loss": -6.866415023803711, "global_step": 164352, "epoch": 3913} {"train_loss": -6.894720077514648, "global_step": 164353, "epoch": 3913} {"train_loss": -6.951106071472168, "global_step": 164354, "epoch": 3913} {"train_loss": -6.986150741577148, "global_step": 164355, "epoch": 3913} {"train_loss": -6.921291351318359, "global_step": 164356, "epoch": 3913} {"train_loss": -6.893682479858398, "global_step": 164357, "epoch": 3913} {"train_loss": -6.907533645629883, "global_step": 164358, "epoch": 3913} {"train_loss": -6.9046630859375, "global_step": 164359, "epoch": 3913} {"train_loss": -7.02011775970459, "global_step": 164360, "epoch": 3913} {"train_loss": -6.890402793884277, "global_step": 164361, "epoch": 3913} {"train_loss": -6.875475883483887, "global_step": 164362, "epoch": 3913} {"train_loss": -7.02784538269043, "global_step": 164363, "epoch": 3913} {"train_loss": -6.912636756896973, "global_step": 164364, "epoch": 3913} {"train_loss": -6.907069206237793, "global_step": 164365, "epoch": 3913} {"train_loss": -6.940123558044434, "global_step": 164366, "epoch": 3913} {"train_loss": -6.905187129974365, "global_step": 164367, "epoch": 3913} {"train_loss": -6.96222448348999, "global_step": 164368, "epoch": 3913} {"train_loss": -6.872222900390625, "global_step": 164369, "epoch": 3913} {"train_loss": -6.799671173095703, "global_step": 164370, "epoch": 3913} {"train_loss": -7.01979398727417, "global_step": 164371, "epoch": 3913} {"train_loss": -6.976342678070068, "global_step": 164372, "epoch": 3913} {"train_loss": -6.936459541320801, "global_step": 164373, "epoch": 3913} {"train_loss": -6.993975639343262, "global_step": 164374, "epoch": 3913} {"train_loss": -6.958174705505371, "global_step": 164375, "epoch": 3913} {"train_loss": -6.978792190551758, "global_step": 164376, "epoch": 3913} {"train_loss": -6.866053581237793, "global_step": 164377, "epoch": 3913} {"train_loss": -7.0669403076171875, "global_step": 164378, "epoch": 3913} {"train_loss": -6.86442232131958, "global_step": 164379, "epoch": 3913} {"train_loss": -6.926064491271973, "global_step": 164380, "epoch": 3913} {"train_loss": -6.93182373046875, "global_step": 164381, "epoch": 3913} {"train_loss": -6.7834882736206055, "global_step": 164382, "epoch": 3913} {"train_loss": -7.048620223999023, "global_step": 164383, "epoch": 3913} {"train_loss": -6.938068389892578, "global_step": 164384, "epoch": 3913} {"train_loss": -6.9085588455200195, "global_step": 164385, "epoch": 3913} {"train_loss": -6.971830368041992, "global_step": 164386, "epoch": 3913} {"train_loss": -6.93405142284575, "global_step": 164387, "epoch": 3913, "val_loss": 68870.7109375} {"train_loss": -6.9277753829956055, "global_step": 164388, "epoch": 3914} {"train_loss": -6.819160461425781, "global_step": 164389, "epoch": 3914} {"train_loss": -6.879178047180176, "global_step": 164390, "epoch": 3914} {"train_loss": -6.788821220397949, "global_step": 164391, "epoch": 3914} {"train_loss": -7.015894889831543, "global_step": 164392, "epoch": 3914} {"train_loss": -6.766498565673828, "global_step": 164393, "epoch": 3914} {"train_loss": -6.739080905914307, "global_step": 164394, "epoch": 3914} {"train_loss": -6.9061279296875, "global_step": 164395, "epoch": 3914} {"train_loss": -6.762279510498047, "global_step": 164396, "epoch": 3914} {"train_loss": -7.002954006195068, "global_step": 164397, "epoch": 3914} {"train_loss": -6.777028560638428, "global_step": 164398, "epoch": 3914} {"train_loss": -7.006709098815918, "global_step": 164399, "epoch": 3914} {"train_loss": -6.893822193145752, "global_step": 164400, "epoch": 3914} {"train_loss": -6.862156867980957, "global_step": 164401, "epoch": 3914} {"train_loss": -6.989678382873535, "global_step": 164402, "epoch": 3914} {"train_loss": -7.059996604919434, "global_step": 164403, "epoch": 3914} {"train_loss": -6.936059951782227, "global_step": 164404, "epoch": 3914} {"train_loss": -7.034766674041748, "global_step": 164405, "epoch": 3914} {"train_loss": -7.017660617828369, "global_step": 164406, "epoch": 3914} {"train_loss": -6.947170257568359, "global_step": 164407, "epoch": 3914} {"train_loss": -6.949397087097168, "global_step": 164408, "epoch": 3914} {"train_loss": -6.937612056732178, "global_step": 164409, "epoch": 3914} {"train_loss": -6.906589508056641, "global_step": 164410, "epoch": 3914} {"train_loss": -7.015893936157227, "global_step": 164411, "epoch": 3914} {"train_loss": -7.058889865875244, "global_step": 164412, "epoch": 3914} {"train_loss": -7.0037522315979, "global_step": 164413, "epoch": 3914} {"train_loss": -7.027320861816406, "global_step": 164414, "epoch": 3914} {"train_loss": -6.913219451904297, "global_step": 164415, "epoch": 3914} {"train_loss": -7.019933700561523, "global_step": 164416, "epoch": 3914} {"train_loss": -6.989795207977295, "global_step": 164417, "epoch": 3914} {"train_loss": -7.007637023925781, "global_step": 164418, "epoch": 3914} {"train_loss": -7.13926887512207, "global_step": 164419, "epoch": 3914} {"train_loss": -6.985746383666992, "global_step": 164420, "epoch": 3914} {"train_loss": -7.1468825340271, "global_step": 164421, "epoch": 3914} {"train_loss": -7.065730571746826, "global_step": 164422, "epoch": 3914} {"train_loss": -7.068516254425049, "global_step": 164423, "epoch": 3914} {"train_loss": -7.035313606262207, "global_step": 164424, "epoch": 3914} {"train_loss": -7.014026641845703, "global_step": 164425, "epoch": 3914} {"train_loss": -6.971997261047363, "global_step": 164426, "epoch": 3914} {"train_loss": -7.00830078125, "global_step": 164427, "epoch": 3914} {"train_loss": -7.127732753753662, "global_step": 164428, "epoch": 3914} {"train_loss": -6.962966691879999, "global_step": 164429, "epoch": 3914, "val_loss": 68788.5703125} {"train_loss": -7.055150508880615, "global_step": 164430, "epoch": 3915} {"train_loss": -7.082010746002197, "global_step": 164431, "epoch": 3915} {"train_loss": -7.037935733795166, "global_step": 164432, "epoch": 3915} {"train_loss": -7.007240295410156, "global_step": 164433, "epoch": 3915} {"train_loss": -6.971979141235352, "global_step": 164434, "epoch": 3915} {"train_loss": -6.945023536682129, "global_step": 164435, "epoch": 3915} {"train_loss": -7.151528835296631, "global_step": 164436, "epoch": 3915} {"train_loss": -6.949469566345215, "global_step": 164437, "epoch": 3915} {"train_loss": -7.028949737548828, "global_step": 164438, "epoch": 3915} {"train_loss": -7.100065231323242, "global_step": 164439, "epoch": 3915} {"train_loss": -7.101176738739014, "global_step": 164440, "epoch": 3915} {"train_loss": -7.105263710021973, "global_step": 164441, "epoch": 3915} {"train_loss": -7.0259246826171875, "global_step": 164442, "epoch": 3915} {"train_loss": -6.9866943359375, "global_step": 164443, "epoch": 3915} {"train_loss": -6.979413986206055, "global_step": 164444, "epoch": 3915} {"train_loss": -7.0760722160339355, "global_step": 164445, "epoch": 3915} {"train_loss": -6.978583335876465, "global_step": 164446, "epoch": 3915} {"train_loss": -6.921377182006836, "global_step": 164447, "epoch": 3915} {"train_loss": -7.03045654296875, "global_step": 164448, "epoch": 3915} {"train_loss": -6.839773178100586, "global_step": 164449, "epoch": 3915} {"train_loss": -7.038137435913086, "global_step": 164450, "epoch": 3915} {"train_loss": -7.03009033203125, "global_step": 164451, "epoch": 3915} {"train_loss": -6.953768730163574, "global_step": 164452, "epoch": 3915} {"train_loss": -6.989568710327148, "global_step": 164453, "epoch": 3915} {"train_loss": -6.851583003997803, "global_step": 164454, "epoch": 3915} {"train_loss": -7.069098949432373, "global_step": 164455, "epoch": 3915} {"train_loss": -6.796394348144531, "global_step": 164456, "epoch": 3915} {"train_loss": -6.894772052764893, "global_step": 164457, "epoch": 3915} {"train_loss": -6.945168495178223, "global_step": 164458, "epoch": 3915} {"train_loss": -6.893228530883789, "global_step": 164459, "epoch": 3915} {"train_loss": -6.9551496505737305, "global_step": 164460, "epoch": 3915} {"train_loss": -6.861995697021484, "global_step": 164461, "epoch": 3915} {"train_loss": -6.938885688781738, "global_step": 164462, "epoch": 3915} {"train_loss": -6.948657035827637, "global_step": 164463, "epoch": 3915} {"train_loss": -6.915186882019043, "global_step": 164464, "epoch": 3915} {"train_loss": -6.959419250488281, "global_step": 164465, "epoch": 3915} {"train_loss": -6.846558570861816, "global_step": 164466, "epoch": 3915} {"train_loss": -7.03944206237793, "global_step": 164467, "epoch": 3915} {"train_loss": -6.919660568237305, "global_step": 164468, "epoch": 3915} {"train_loss": -6.982749938964844, "global_step": 164469, "epoch": 3915} {"train_loss": -6.997722625732422, "global_step": 164470, "epoch": 3915} {"train_loss": -6.982083570389521, "global_step": 164471, "epoch": 3915, "val_loss": 68662.5546875} {"train_loss": -6.909087181091309, "global_step": 164472, "epoch": 3916} {"train_loss": -6.876035690307617, "global_step": 164473, "epoch": 3916} {"train_loss": -6.886223316192627, "global_step": 164474, "epoch": 3916} {"train_loss": -7.013546943664551, "global_step": 164475, "epoch": 3916} {"train_loss": -7.039761543273926, "global_step": 164476, "epoch": 3916} {"train_loss": -6.888361930847168, "global_step": 164477, "epoch": 3916} {"train_loss": -6.9873247146606445, "global_step": 164478, "epoch": 3916} {"train_loss": -6.991927623748779, "global_step": 164479, "epoch": 3916} {"train_loss": -6.937726974487305, "global_step": 164480, "epoch": 3916} {"train_loss": -6.989085674285889, "global_step": 164481, "epoch": 3916} {"train_loss": -7.06256628036499, "global_step": 164482, "epoch": 3916} {"train_loss": -6.992002487182617, "global_step": 164483, "epoch": 3916} {"train_loss": -6.974847316741943, "global_step": 164484, "epoch": 3916} {"train_loss": -7.002938747406006, "global_step": 164485, "epoch": 3916} {"train_loss": -6.91977071762085, "global_step": 164486, "epoch": 3916} {"train_loss": -7.091622829437256, "global_step": 164487, "epoch": 3916} {"train_loss": -7.031853675842285, "global_step": 164488, "epoch": 3916} {"train_loss": -6.9665021896362305, "global_step": 164489, "epoch": 3916} {"train_loss": -6.906415939331055, "global_step": 164490, "epoch": 3916} {"train_loss": -6.991386413574219, "global_step": 164491, "epoch": 3916} {"train_loss": -6.85059928894043, "global_step": 164492, "epoch": 3916} {"train_loss": -7.021204471588135, "global_step": 164493, "epoch": 3916} {"train_loss": -7.069416046142578, "global_step": 164494, "epoch": 3916} {"train_loss": -7.099819660186768, "global_step": 164495, "epoch": 3916} {"train_loss": -6.961447715759277, "global_step": 164496, "epoch": 3916} {"train_loss": -7.005631923675537, "global_step": 164497, "epoch": 3916} {"train_loss": -6.966065406799316, "global_step": 164498, "epoch": 3916} {"train_loss": -7.058245658874512, "global_step": 164499, "epoch": 3916} {"train_loss": -7.059850692749023, "global_step": 164500, "epoch": 3916} {"train_loss": -6.938239097595215, "global_step": 164501, "epoch": 3916} {"train_loss": -6.937147617340088, "global_step": 164502, "epoch": 3916} {"train_loss": -6.973183631896973, "global_step": 164503, "epoch": 3916} {"train_loss": -7.134389877319336, "global_step": 164504, "epoch": 3916} {"train_loss": -7.014786720275879, "global_step": 164505, "epoch": 3916} {"train_loss": -6.9422478675842285, "global_step": 164506, "epoch": 3916} {"train_loss": -7.070838928222656, "global_step": 164507, "epoch": 3916} {"train_loss": -7.095494270324707, "global_step": 164508, "epoch": 3916} {"train_loss": -6.932366371154785, "global_step": 164509, "epoch": 3916} {"train_loss": -7.02916145324707, "global_step": 164510, "epoch": 3916} {"train_loss": -7.015490531921387, "global_step": 164511, "epoch": 3916} {"train_loss": -7.041833877563477, "global_step": 164512, "epoch": 3916} {"train_loss": -6.993044399079823, "global_step": 164513, "epoch": 3916, "val_loss": 68613.265625} {"train_loss": -7.103184700012207, "global_step": 164514, "epoch": 3917} {"train_loss": -6.984086990356445, "global_step": 164515, "epoch": 3917} {"train_loss": -7.0538105964660645, "global_step": 164516, "epoch": 3917} {"train_loss": -7.040562629699707, "global_step": 164517, "epoch": 3917} {"train_loss": -6.936514854431152, "global_step": 164518, "epoch": 3917} {"train_loss": -7.135494232177734, "global_step": 164519, "epoch": 3917} {"train_loss": -6.943906784057617, "global_step": 164520, "epoch": 3917} {"train_loss": -6.967033386230469, "global_step": 164521, "epoch": 3917} {"train_loss": -7.014461517333984, "global_step": 164522, "epoch": 3917} {"train_loss": -6.937920570373535, "global_step": 164523, "epoch": 3917} {"train_loss": -6.968693256378174, "global_step": 164524, "epoch": 3917} {"train_loss": -6.979263782501221, "global_step": 164525, "epoch": 3917} {"train_loss": -7.000734806060791, "global_step": 164526, "epoch": 3917} {"train_loss": -7.155895233154297, "global_step": 164527, "epoch": 3917} {"train_loss": -6.971823692321777, "global_step": 164528, "epoch": 3917} {"train_loss": -6.892674922943115, "global_step": 164529, "epoch": 3917} {"train_loss": -6.977054119110107, "global_step": 164530, "epoch": 3917} {"train_loss": -7.084853172302246, "global_step": 164531, "epoch": 3917} {"train_loss": -7.104361534118652, "global_step": 164532, "epoch": 3917} {"train_loss": -6.996955394744873, "global_step": 164533, "epoch": 3917} {"train_loss": -7.031520843505859, "global_step": 164534, "epoch": 3917} {"train_loss": -7.009509086608887, "global_step": 164535, "epoch": 3917} {"train_loss": -6.9668288230896, "global_step": 164536, "epoch": 3917} {"train_loss": -6.975388526916504, "global_step": 164537, "epoch": 3917} {"train_loss": -6.97602653503418, "global_step": 164538, "epoch": 3917} {"train_loss": -7.050800323486328, "global_step": 164539, "epoch": 3917} {"train_loss": -6.899415493011475, "global_step": 164540, "epoch": 3917} {"train_loss": -6.913442611694336, "global_step": 164541, "epoch": 3917} {"train_loss": -7.013664245605469, "global_step": 164542, "epoch": 3917} {"train_loss": -6.944716930389404, "global_step": 164543, "epoch": 3917} {"train_loss": -6.897823333740234, "global_step": 164544, "epoch": 3917} {"train_loss": -7.057343482971191, "global_step": 164545, "epoch": 3917} {"train_loss": -7.00253963470459, "global_step": 164546, "epoch": 3917} {"train_loss": -7.00892448425293, "global_step": 164547, "epoch": 3917} {"train_loss": -7.056970119476318, "global_step": 164548, "epoch": 3917} {"train_loss": -6.986372470855713, "global_step": 164549, "epoch": 3917} {"train_loss": -6.835587501525879, "global_step": 164550, "epoch": 3917} {"train_loss": -6.959497928619385, "global_step": 164551, "epoch": 3917} {"train_loss": -7.099430561065674, "global_step": 164552, "epoch": 3917} {"train_loss": -6.922137260437012, "global_step": 164553, "epoch": 3917} {"train_loss": -6.939363479614258, "global_step": 164554, "epoch": 3917} {"train_loss": -6.993335099447341, "global_step": 164555, "epoch": 3917, "val_loss": 68804.8359375} {"train_loss": -6.910234451293945, "global_step": 164556, "epoch": 3918} {"train_loss": -7.026192665100098, "global_step": 164557, "epoch": 3918} {"train_loss": -7.001420974731445, "global_step": 164558, "epoch": 3918} {"train_loss": -7.067862510681152, "global_step": 164559, "epoch": 3918} {"train_loss": -7.104903221130371, "global_step": 164560, "epoch": 3918} {"train_loss": -6.947513103485107, "global_step": 164561, "epoch": 3918} {"train_loss": -7.090141773223877, "global_step": 164562, "epoch": 3918} {"train_loss": -7.073993682861328, "global_step": 164563, "epoch": 3918} {"train_loss": -6.8693037033081055, "global_step": 164564, "epoch": 3918} {"train_loss": -6.946354389190674, "global_step": 164565, "epoch": 3918} {"train_loss": -7.076859474182129, "global_step": 164566, "epoch": 3918} {"train_loss": -6.972677707672119, "global_step": 164567, "epoch": 3918} {"train_loss": -7.073808670043945, "global_step": 164568, "epoch": 3918} {"train_loss": -6.9457292556762695, "global_step": 164569, "epoch": 3918} {"train_loss": -7.090333938598633, "global_step": 164570, "epoch": 3918} {"train_loss": -7.022258758544922, "global_step": 164571, "epoch": 3918} {"train_loss": -7.010915279388428, "global_step": 164572, "epoch": 3918} {"train_loss": -6.9207444190979, "global_step": 164573, "epoch": 3918} {"train_loss": -7.001533508300781, "global_step": 164574, "epoch": 3918} {"train_loss": -6.964923858642578, "global_step": 164575, "epoch": 3918} {"train_loss": -6.819650650024414, "global_step": 164576, "epoch": 3918} {"train_loss": -6.867342948913574, "global_step": 164577, "epoch": 3918} {"train_loss": -7.101872444152832, "global_step": 164578, "epoch": 3918} {"train_loss": -6.730160713195801, "global_step": 164579, "epoch": 3918} {"train_loss": -6.93780517578125, "global_step": 164580, "epoch": 3918} {"train_loss": -6.826846122741699, "global_step": 164581, "epoch": 3918} {"train_loss": -6.971407413482666, "global_step": 164582, "epoch": 3918} {"train_loss": -6.986880302429199, "global_step": 164583, "epoch": 3918} {"train_loss": -6.877500057220459, "global_step": 164584, "epoch": 3918} {"train_loss": -7.007773399353027, "global_step": 164585, "epoch": 3918} {"train_loss": -7.006703853607178, "global_step": 164586, "epoch": 3918} {"train_loss": -6.925793647766113, "global_step": 164587, "epoch": 3918} {"train_loss": -6.942818641662598, "global_step": 164588, "epoch": 3918} {"train_loss": -7.041666030883789, "global_step": 164589, "epoch": 3918} {"train_loss": -6.979587554931641, "global_step": 164590, "epoch": 3918} {"train_loss": -6.867738723754883, "global_step": 164591, "epoch": 3918} {"train_loss": -7.087209701538086, "global_step": 164592, "epoch": 3918} {"train_loss": -7.0674638748168945, "global_step": 164593, "epoch": 3918} {"train_loss": -6.953603744506836, "global_step": 164594, "epoch": 3918} {"train_loss": -7.006728172302246, "global_step": 164595, "epoch": 3918} {"train_loss": -6.895474910736084, "global_step": 164596, "epoch": 3918} {"train_loss": -6.976333220799764, "global_step": 164597, "epoch": 3918, "val_loss": 68641.6953125} {"train_loss": -6.942698001861572, "global_step": 164598, "epoch": 3919} {"train_loss": -6.981375217437744, "global_step": 164599, "epoch": 3919} {"train_loss": -6.916318893432617, "global_step": 164600, "epoch": 3919} {"train_loss": -7.0311970710754395, "global_step": 164601, "epoch": 3919} {"train_loss": -6.945515155792236, "global_step": 164602, "epoch": 3919} {"train_loss": -7.029966831207275, "global_step": 164603, "epoch": 3919} {"train_loss": -6.907965660095215, "global_step": 164604, "epoch": 3919} {"train_loss": -7.0126447677612305, "global_step": 164605, "epoch": 3919} {"train_loss": -6.924282073974609, "global_step": 164606, "epoch": 3919} {"train_loss": -7.066025257110596, "global_step": 164607, "epoch": 3919} {"train_loss": -7.155493259429932, "global_step": 164608, "epoch": 3919} {"train_loss": -7.007938861846924, "global_step": 164609, "epoch": 3919} {"train_loss": -7.0290446281433105, "global_step": 164610, "epoch": 3919} {"train_loss": -6.95945930480957, "global_step": 164611, "epoch": 3919} {"train_loss": -6.952960014343262, "global_step": 164612, "epoch": 3919} {"train_loss": -6.83979606628418, "global_step": 164613, "epoch": 3919} {"train_loss": -7.00171422958374, "global_step": 164614, "epoch": 3919} {"train_loss": -6.911776542663574, "global_step": 164615, "epoch": 3919} {"train_loss": -6.763708114624023, "global_step": 164616, "epoch": 3919} {"train_loss": -6.907291889190674, "global_step": 164617, "epoch": 3919} {"train_loss": -6.928427219390869, "global_step": 164618, "epoch": 3919} {"train_loss": -6.873681545257568, "global_step": 164619, "epoch": 3919} {"train_loss": -6.912384986877441, "global_step": 164620, "epoch": 3919} {"train_loss": -6.804299354553223, "global_step": 164621, "epoch": 3919} {"train_loss": -6.88804292678833, "global_step": 164622, "epoch": 3919} {"train_loss": -6.829373836517334, "global_step": 164623, "epoch": 3919} {"train_loss": -6.693443775177002, "global_step": 164624, "epoch": 3919} {"train_loss": -7.004101753234863, "global_step": 164625, "epoch": 3919} {"train_loss": -6.739727020263672, "global_step": 164626, "epoch": 3919} {"train_loss": -6.955252647399902, "global_step": 164627, "epoch": 3919} {"train_loss": -6.630937576293945, "global_step": 164628, "epoch": 3919} {"train_loss": -6.83554220199585, "global_step": 164629, "epoch": 3919} {"train_loss": -6.632343292236328, "global_step": 164630, "epoch": 3919} {"train_loss": -6.830914497375488, "global_step": 164631, "epoch": 3919} {"train_loss": -6.855236053466797, "global_step": 164632, "epoch": 3919} {"train_loss": -6.793666839599609, "global_step": 164633, "epoch": 3919} {"train_loss": -6.894582748413086, "global_step": 164634, "epoch": 3919} {"train_loss": -6.84837532043457, "global_step": 164635, "epoch": 3919} {"train_loss": -6.972766876220703, "global_step": 164636, "epoch": 3919} {"train_loss": -6.9305596351623535, "global_step": 164637, "epoch": 3919} {"train_loss": -6.8797736167907715, "global_step": 164638, "epoch": 3919} {"train_loss": -6.900300570896694, "global_step": 164639, "epoch": 3919, "val_loss": 68592.28125} {"train_loss": -6.965728282928467, "global_step": 164640, "epoch": 3920} {"train_loss": -6.842668533325195, "global_step": 164641, "epoch": 3920} {"train_loss": -6.902584075927734, "global_step": 164642, "epoch": 3920} {"train_loss": -6.899044036865234, "global_step": 164643, "epoch": 3920} {"train_loss": -6.8838605880737305, "global_step": 164644, "epoch": 3920} {"train_loss": -6.844485759735107, "global_step": 164645, "epoch": 3920} {"train_loss": -6.928707122802734, "global_step": 164646, "epoch": 3920} {"train_loss": -6.875404357910156, "global_step": 164647, "epoch": 3920} {"train_loss": -6.82236385345459, "global_step": 164648, "epoch": 3920} {"train_loss": -7.021823883056641, "global_step": 164649, "epoch": 3920} {"train_loss": -6.86351203918457, "global_step": 164650, "epoch": 3920} {"train_loss": -7.008500099182129, "global_step": 164651, "epoch": 3920} {"train_loss": -6.929790496826172, "global_step": 164652, "epoch": 3920} {"train_loss": -6.943538188934326, "global_step": 164653, "epoch": 3920} {"train_loss": -7.008581638336182, "global_step": 164654, "epoch": 3920} {"train_loss": -6.894506454467773, "global_step": 164655, "epoch": 3920} {"train_loss": -6.951160430908203, "global_step": 164656, "epoch": 3920} {"train_loss": -6.967071056365967, "global_step": 164657, "epoch": 3920} {"train_loss": -7.016434192657471, "global_step": 164658, "epoch": 3920} {"train_loss": -6.992452144622803, "global_step": 164659, "epoch": 3920} {"train_loss": -6.925004959106445, "global_step": 164660, "epoch": 3920} {"train_loss": -7.057931900024414, "global_step": 164661, "epoch": 3920} {"train_loss": -6.889163017272949, "global_step": 164662, "epoch": 3920} {"train_loss": -7.0817108154296875, "global_step": 164663, "epoch": 3920} {"train_loss": -6.894066333770752, "global_step": 164664, "epoch": 3920} {"train_loss": -7.0235772132873535, "global_step": 164665, "epoch": 3920} {"train_loss": -7.021204948425293, "global_step": 164666, "epoch": 3920} {"train_loss": -6.992844104766846, "global_step": 164667, "epoch": 3920} {"train_loss": -6.891703128814697, "global_step": 164668, "epoch": 3920} {"train_loss": -7.014969825744629, "global_step": 164669, "epoch": 3920} {"train_loss": -6.99797248840332, "global_step": 164670, "epoch": 3920} {"train_loss": -7.034156799316406, "global_step": 164671, "epoch": 3920} {"train_loss": -6.96987771987915, "global_step": 164672, "epoch": 3920} {"train_loss": -7.059199333190918, "global_step": 164673, "epoch": 3920} {"train_loss": -7.042782783508301, "global_step": 164674, "epoch": 3920} {"train_loss": -6.961302757263184, "global_step": 164675, "epoch": 3920} {"train_loss": -6.987303256988525, "global_step": 164676, "epoch": 3920} {"train_loss": -6.963491439819336, "global_step": 164677, "epoch": 3920} {"train_loss": -6.994990825653076, "global_step": 164678, "epoch": 3920} {"train_loss": -6.882299900054932, "global_step": 164679, "epoch": 3920} {"train_loss": -7.138400077819824, "global_step": 164680, "epoch": 3920} {"train_loss": -6.960905041013445, "global_step": 164681, "epoch": 3920, "val_loss": 68773.90625} {"train_loss": -7.00788688659668, "global_step": 164682, "epoch": 3921} {"train_loss": -7.0146379470825195, "global_step": 164683, "epoch": 3921} {"train_loss": -6.979588508605957, "global_step": 164684, "epoch": 3921} {"train_loss": -7.0009870529174805, "global_step": 164685, "epoch": 3921} {"train_loss": -7.0398406982421875, "global_step": 164686, "epoch": 3921} {"train_loss": -7.026418209075928, "global_step": 164687, "epoch": 3921} {"train_loss": -7.025581359863281, "global_step": 164688, "epoch": 3921} {"train_loss": -7.0036725997924805, "global_step": 164689, "epoch": 3921} {"train_loss": -6.972323417663574, "global_step": 164690, "epoch": 3921} {"train_loss": -6.9596099853515625, "global_step": 164691, "epoch": 3921} {"train_loss": -6.993412971496582, "global_step": 164692, "epoch": 3921} {"train_loss": -6.939865589141846, "global_step": 164693, "epoch": 3921} {"train_loss": -6.949541091918945, "global_step": 164694, "epoch": 3921} {"train_loss": -6.964409828186035, "global_step": 164695, "epoch": 3921} {"train_loss": -6.903000831604004, "global_step": 164696, "epoch": 3921} {"train_loss": -6.8271870613098145, "global_step": 164697, "epoch": 3921} {"train_loss": -6.993697643280029, "global_step": 164698, "epoch": 3921} {"train_loss": -6.994664192199707, "global_step": 164699, "epoch": 3921} {"train_loss": -7.021002292633057, "global_step": 164700, "epoch": 3921} {"train_loss": -7.016772747039795, "global_step": 164701, "epoch": 3921} {"train_loss": -6.944703102111816, "global_step": 164702, "epoch": 3921} {"train_loss": -6.971920013427734, "global_step": 164703, "epoch": 3921} {"train_loss": -6.952333450317383, "global_step": 164704, "epoch": 3921} {"train_loss": -6.941584587097168, "global_step": 164705, "epoch": 3921} {"train_loss": -7.062390327453613, "global_step": 164706, "epoch": 3921} {"train_loss": -6.863041877746582, "global_step": 164707, "epoch": 3921} {"train_loss": -7.067607879638672, "global_step": 164708, "epoch": 3921} {"train_loss": -6.9232072830200195, "global_step": 164709, "epoch": 3921} {"train_loss": -6.901333808898926, "global_step": 164710, "epoch": 3921} {"train_loss": -7.04844856262207, "global_step": 164711, "epoch": 3921} {"train_loss": -6.931045055389404, "global_step": 164712, "epoch": 3921} {"train_loss": -7.0195465087890625, "global_step": 164713, "epoch": 3921} {"train_loss": -6.858673095703125, "global_step": 164714, "epoch": 3921} {"train_loss": -7.039716720581055, "global_step": 164715, "epoch": 3921} {"train_loss": -7.063885688781738, "global_step": 164716, "epoch": 3921} {"train_loss": -6.950200080871582, "global_step": 164717, "epoch": 3921} {"train_loss": -7.08378791809082, "global_step": 164718, "epoch": 3921} {"train_loss": -6.860931396484375, "global_step": 164719, "epoch": 3921} {"train_loss": -6.977894306182861, "global_step": 164720, "epoch": 3921} {"train_loss": -7.035789966583252, "global_step": 164721, "epoch": 3921} {"train_loss": -6.958806991577148, "global_step": 164722, "epoch": 3921} {"train_loss": -6.978146995816912, "global_step": 164723, "epoch": 3921, "val_loss": 68745.4296875} {"train_loss": -6.960724830627441, "global_step": 164724, "epoch": 3922} {"train_loss": -6.945511817932129, "global_step": 164725, "epoch": 3922} {"train_loss": -7.051340103149414, "global_step": 164726, "epoch": 3922} {"train_loss": -6.871830940246582, "global_step": 164727, "epoch": 3922} {"train_loss": -7.081930160522461, "global_step": 164728, "epoch": 3922} {"train_loss": -6.975973606109619, "global_step": 164729, "epoch": 3922} {"train_loss": -7.0514092445373535, "global_step": 164730, "epoch": 3922} {"train_loss": -7.024463653564453, "global_step": 164731, "epoch": 3922} {"train_loss": -7.051692008972168, "global_step": 164732, "epoch": 3922} {"train_loss": -6.9052348136901855, "global_step": 164733, "epoch": 3922} {"train_loss": -6.935750961303711, "global_step": 164734, "epoch": 3922} {"train_loss": -7.046672344207764, "global_step": 164735, "epoch": 3922} {"train_loss": -6.953399181365967, "global_step": 164736, "epoch": 3922} {"train_loss": -6.963357448577881, "global_step": 164737, "epoch": 3922} {"train_loss": -6.921568870544434, "global_step": 164738, "epoch": 3922} {"train_loss": -7.00677490234375, "global_step": 164739, "epoch": 3922} {"train_loss": -6.940950393676758, "global_step": 164740, "epoch": 3922} {"train_loss": -7.065700531005859, "global_step": 164741, "epoch": 3922} {"train_loss": -7.002841949462891, "global_step": 164742, "epoch": 3922} {"train_loss": -6.9046630859375, "global_step": 164743, "epoch": 3922} {"train_loss": -6.975798606872559, "global_step": 164744, "epoch": 3922} {"train_loss": -6.970667839050293, "global_step": 164745, "epoch": 3922} {"train_loss": -7.072093963623047, "global_step": 164746, "epoch": 3922} {"train_loss": -6.950397491455078, "global_step": 164747, "epoch": 3922} {"train_loss": -7.001251697540283, "global_step": 164748, "epoch": 3922} {"train_loss": -6.956596851348877, "global_step": 164749, "epoch": 3922} {"train_loss": -7.00825309753418, "global_step": 164750, "epoch": 3922} {"train_loss": -7.000213623046875, "global_step": 164751, "epoch": 3922} {"train_loss": -6.95503044128418, "global_step": 164752, "epoch": 3922} {"train_loss": -6.9649457931518555, "global_step": 164753, "epoch": 3922} {"train_loss": -6.855432033538818, "global_step": 164754, "epoch": 3922} {"train_loss": -6.982736587524414, "global_step": 164755, "epoch": 3922} {"train_loss": -7.042678356170654, "global_step": 164756, "epoch": 3922} {"train_loss": -7.0257720947265625, "global_step": 164757, "epoch": 3922} {"train_loss": -7.071432113647461, "global_step": 164758, "epoch": 3922} {"train_loss": -6.989326477050781, "global_step": 164759, "epoch": 3922} {"train_loss": -6.9208221435546875, "global_step": 164760, "epoch": 3922} {"train_loss": -6.9470319747924805, "global_step": 164761, "epoch": 3922} {"train_loss": -7.031763553619385, "global_step": 164762, "epoch": 3922} {"train_loss": -6.967194557189941, "global_step": 164763, "epoch": 3922} {"train_loss": -6.956943035125732, "global_step": 164764, "epoch": 3922} {"train_loss": -6.9829225313095815, "global_step": 164765, "epoch": 3922, "val_loss": 68814.421875} {"train_loss": -7.038392066955566, "global_step": 164766, "epoch": 3923} {"train_loss": -6.957731246948242, "global_step": 164767, "epoch": 3923} {"train_loss": -7.026694297790527, "global_step": 164768, "epoch": 3923} {"train_loss": -6.908950328826904, "global_step": 164769, "epoch": 3923} {"train_loss": -6.954317092895508, "global_step": 164770, "epoch": 3923} {"train_loss": -7.050555229187012, "global_step": 164771, "epoch": 3923} {"train_loss": -7.11760139465332, "global_step": 164772, "epoch": 3923} {"train_loss": -7.1081647872924805, "global_step": 164773, "epoch": 3923} {"train_loss": -7.1099443435668945, "global_step": 164774, "epoch": 3923} {"train_loss": -7.059917449951172, "global_step": 164775, "epoch": 3923} {"train_loss": -6.995175361633301, "global_step": 164776, "epoch": 3923} {"train_loss": -6.997962951660156, "global_step": 164777, "epoch": 3923} {"train_loss": -7.019155025482178, "global_step": 164778, "epoch": 3923} {"train_loss": -7.03593635559082, "global_step": 164779, "epoch": 3923} {"train_loss": -7.128325939178467, "global_step": 164780, "epoch": 3923} {"train_loss": -7.107106685638428, "global_step": 164781, "epoch": 3923} {"train_loss": -7.117356300354004, "global_step": 164782, "epoch": 3923} {"train_loss": -6.9737396240234375, "global_step": 164783, "epoch": 3923} {"train_loss": -6.985302925109863, "global_step": 164784, "epoch": 3923} {"train_loss": -6.977229118347168, "global_step": 164785, "epoch": 3923} {"train_loss": -7.045476913452148, "global_step": 164786, "epoch": 3923} {"train_loss": -7.0258941650390625, "global_step": 164787, "epoch": 3923} {"train_loss": -7.009363174438477, "global_step": 164788, "epoch": 3923} {"train_loss": -7.16739559173584, "global_step": 164789, "epoch": 3923} {"train_loss": -7.075984954833984, "global_step": 164790, "epoch": 3923} {"train_loss": -7.02577018737793, "global_step": 164791, "epoch": 3923} {"train_loss": -7.045166015625, "global_step": 164792, "epoch": 3923} {"train_loss": -7.030470848083496, "global_step": 164793, "epoch": 3923} {"train_loss": -7.1204376220703125, "global_step": 164794, "epoch": 3923} {"train_loss": -6.999682426452637, "global_step": 164795, "epoch": 3923} {"train_loss": -6.939841270446777, "global_step": 164796, "epoch": 3923} {"train_loss": -7.0248541831970215, "global_step": 164797, "epoch": 3923} {"train_loss": -7.110385894775391, "global_step": 164798, "epoch": 3923} {"train_loss": -7.099000930786133, "global_step": 164799, "epoch": 3923} {"train_loss": -6.874050140380859, "global_step": 164800, "epoch": 3923} {"train_loss": -7.085287570953369, "global_step": 164801, "epoch": 3923} {"train_loss": -7.044013500213623, "global_step": 164802, "epoch": 3923} {"train_loss": -7.053170680999756, "global_step": 164803, "epoch": 3923} {"train_loss": -6.955737113952637, "global_step": 164804, "epoch": 3923} {"train_loss": -6.944415092468262, "global_step": 164805, "epoch": 3923} {"train_loss": -6.98112154006958, "global_step": 164806, "epoch": 3923} {"train_loss": -7.029482898258028, "global_step": 164807, "epoch": 3923, "val_loss": 68660.4375} {"train_loss": -7.041584014892578, "global_step": 164808, "epoch": 3924} {"train_loss": -7.121236324310303, "global_step": 164809, "epoch": 3924} {"train_loss": -6.865455627441406, "global_step": 164810, "epoch": 3924} {"train_loss": -7.003157615661621, "global_step": 164811, "epoch": 3924} {"train_loss": -6.957027435302734, "global_step": 164812, "epoch": 3924} {"train_loss": -6.975759506225586, "global_step": 164813, "epoch": 3924} {"train_loss": -7.024806499481201, "global_step": 164814, "epoch": 3924} {"train_loss": -7.045198440551758, "global_step": 164815, "epoch": 3924} {"train_loss": -6.951943397521973, "global_step": 164816, "epoch": 3924} {"train_loss": -7.000271797180176, "global_step": 164817, "epoch": 3924} {"train_loss": -7.063630104064941, "global_step": 164818, "epoch": 3924} {"train_loss": -6.857975482940674, "global_step": 164819, "epoch": 3924} {"train_loss": -6.992465019226074, "global_step": 164820, "epoch": 3924} {"train_loss": -6.942846298217773, "global_step": 164821, "epoch": 3924} {"train_loss": -6.89951753616333, "global_step": 164822, "epoch": 3924} {"train_loss": -7.05239200592041, "global_step": 164823, "epoch": 3924} {"train_loss": -7.10686731338501, "global_step": 164824, "epoch": 3924} {"train_loss": -6.838091850280762, "global_step": 164825, "epoch": 3924} {"train_loss": -7.019534111022949, "global_step": 164826, "epoch": 3924} {"train_loss": -7.055539131164551, "global_step": 164827, "epoch": 3924} {"train_loss": -6.987853527069092, "global_step": 164828, "epoch": 3924} {"train_loss": -6.972451686859131, "global_step": 164829, "epoch": 3924} {"train_loss": -7.123509407043457, "global_step": 164830, "epoch": 3924} {"train_loss": -7.080394268035889, "global_step": 164831, "epoch": 3924} {"train_loss": -7.097442150115967, "global_step": 164832, "epoch": 3924} {"train_loss": -7.074624061584473, "global_step": 164833, "epoch": 3924} {"train_loss": -7.049393177032471, "global_step": 164834, "epoch": 3924} {"train_loss": -7.027911186218262, "global_step": 164835, "epoch": 3924} {"train_loss": -7.122173309326172, "global_step": 164836, "epoch": 3924} {"train_loss": -7.1307806968688965, "global_step": 164837, "epoch": 3924} {"train_loss": -6.993255138397217, "global_step": 164838, "epoch": 3924} {"train_loss": -6.973104000091553, "global_step": 164839, "epoch": 3924} {"train_loss": -6.985180854797363, "global_step": 164840, "epoch": 3924} {"train_loss": -6.978724479675293, "global_step": 164841, "epoch": 3924} {"train_loss": -6.90342378616333, "global_step": 164842, "epoch": 3924} {"train_loss": -6.933231353759766, "global_step": 164843, "epoch": 3924} {"train_loss": -7.09486198425293, "global_step": 164844, "epoch": 3924} {"train_loss": -6.944275856018066, "global_step": 164845, "epoch": 3924} {"train_loss": -6.934864521026611, "global_step": 164846, "epoch": 3924} {"train_loss": -7.054573059082031, "global_step": 164847, "epoch": 3924} {"train_loss": -7.034658432006836, "global_step": 164848, "epoch": 3924} {"train_loss": -7.008006425130935, "global_step": 164849, "epoch": 3924, "val_loss": 68644.7265625} {"train_loss": -7.059298992156982, "global_step": 164850, "epoch": 3925} {"train_loss": -7.050732612609863, "global_step": 164851, "epoch": 3925} {"train_loss": -7.020023345947266, "global_step": 164852, "epoch": 3925} {"train_loss": -6.868316650390625, "global_step": 164853, "epoch": 3925} {"train_loss": -7.037345886230469, "global_step": 164854, "epoch": 3925} {"train_loss": -7.002760887145996, "global_step": 164855, "epoch": 3925} {"train_loss": -6.975395679473877, "global_step": 164856, "epoch": 3925} {"train_loss": -6.872367858886719, "global_step": 164857, "epoch": 3925} {"train_loss": -7.010417938232422, "global_step": 164858, "epoch": 3925} {"train_loss": -6.8194684982299805, "global_step": 164859, "epoch": 3925} {"train_loss": -7.0008225440979, "global_step": 164860, "epoch": 3925} {"train_loss": -7.0600905418396, "global_step": 164861, "epoch": 3925} {"train_loss": -6.901031017303467, "global_step": 164862, "epoch": 3925} {"train_loss": -6.938027858734131, "global_step": 164863, "epoch": 3925} {"train_loss": -6.942967414855957, "global_step": 164864, "epoch": 3925} {"train_loss": -6.909815788269043, "global_step": 164865, "epoch": 3925} {"train_loss": -7.01039981842041, "global_step": 164866, "epoch": 3925} {"train_loss": -6.9474029541015625, "global_step": 164867, "epoch": 3925} {"train_loss": -6.918449401855469, "global_step": 164868, "epoch": 3925} {"train_loss": -6.929367542266846, "global_step": 164869, "epoch": 3925} {"train_loss": -6.884374618530273, "global_step": 164870, "epoch": 3925} {"train_loss": -7.039359092712402, "global_step": 164871, "epoch": 3925} {"train_loss": -6.869387626647949, "global_step": 164872, "epoch": 3925} {"train_loss": -6.891554832458496, "global_step": 164873, "epoch": 3925} {"train_loss": -6.8906025886535645, "global_step": 164874, "epoch": 3925} {"train_loss": -6.676277160644531, "global_step": 164875, "epoch": 3925} {"train_loss": -6.964022159576416, "global_step": 164876, "epoch": 3925} {"train_loss": -6.842313766479492, "global_step": 164877, "epoch": 3925} {"train_loss": -6.894808769226074, "global_step": 164878, "epoch": 3925} {"train_loss": -6.832294464111328, "global_step": 164879, "epoch": 3925} {"train_loss": -6.948399066925049, "global_step": 164880, "epoch": 3925} {"train_loss": -6.973862648010254, "global_step": 164881, "epoch": 3925} {"train_loss": -6.821321964263916, "global_step": 164882, "epoch": 3925} {"train_loss": -7.094137668609619, "global_step": 164883, "epoch": 3925} {"train_loss": -6.954474925994873, "global_step": 164884, "epoch": 3925} {"train_loss": -7.008048057556152, "global_step": 164885, "epoch": 3925} {"train_loss": -6.88401985168457, "global_step": 164886, "epoch": 3925} {"train_loss": -6.9824934005737305, "global_step": 164887, "epoch": 3925} {"train_loss": -7.013791561126709, "global_step": 164888, "epoch": 3925} {"train_loss": -6.995366096496582, "global_step": 164889, "epoch": 3925} {"train_loss": -6.912599086761475, "global_step": 164890, "epoch": 3925} {"train_loss": -6.942720594860258, "global_step": 164891, "epoch": 3925, "val_loss": 68592.515625} {"train_loss": -6.969414710998535, "global_step": 164892, "epoch": 3926} {"train_loss": -7.0800065994262695, "global_step": 164893, "epoch": 3926} {"train_loss": -6.966817378997803, "global_step": 164894, "epoch": 3926} {"train_loss": -6.966371059417725, "global_step": 164895, "epoch": 3926} {"train_loss": -7.023798942565918, "global_step": 164896, "epoch": 3926} {"train_loss": -6.891838073730469, "global_step": 164897, "epoch": 3926} {"train_loss": -7.0668230056762695, "global_step": 164898, "epoch": 3926} {"train_loss": -7.129488468170166, "global_step": 164899, "epoch": 3926} {"train_loss": -6.862545490264893, "global_step": 164900, "epoch": 3926} {"train_loss": -7.096441268920898, "global_step": 164901, "epoch": 3926} {"train_loss": -6.966599941253662, "global_step": 164902, "epoch": 3926} {"train_loss": -6.9892497062683105, "global_step": 164903, "epoch": 3926} {"train_loss": -7.138602256774902, "global_step": 164904, "epoch": 3926} {"train_loss": -6.949388027191162, "global_step": 164905, "epoch": 3926} {"train_loss": -6.958260536193848, "global_step": 164906, "epoch": 3926} {"train_loss": -7.108401775360107, "global_step": 164907, "epoch": 3926} {"train_loss": -7.066625595092773, "global_step": 164908, "epoch": 3926} {"train_loss": -6.876556396484375, "global_step": 164909, "epoch": 3926} {"train_loss": -7.1122355461120605, "global_step": 164910, "epoch": 3926} {"train_loss": -7.065321922302246, "global_step": 164911, "epoch": 3926} {"train_loss": -7.043193817138672, "global_step": 164912, "epoch": 3926} {"train_loss": -7.091170310974121, "global_step": 164913, "epoch": 3926} {"train_loss": -7.051460266113281, "global_step": 164914, "epoch": 3926} {"train_loss": -7.056784629821777, "global_step": 164915, "epoch": 3926} {"train_loss": -6.949338436126709, "global_step": 164916, "epoch": 3926} {"train_loss": -6.922513008117676, "global_step": 164917, "epoch": 3926} {"train_loss": -7.023774147033691, "global_step": 164918, "epoch": 3926} {"train_loss": -6.909735202789307, "global_step": 164919, "epoch": 3926} {"train_loss": -7.022495269775391, "global_step": 164920, "epoch": 3926} {"train_loss": -6.898688316345215, "global_step": 164921, "epoch": 3926} {"train_loss": -6.998478412628174, "global_step": 164922, "epoch": 3926} {"train_loss": -6.96193265914917, "global_step": 164923, "epoch": 3926} {"train_loss": -7.08164644241333, "global_step": 164924, "epoch": 3926} {"train_loss": -6.972043991088867, "global_step": 164925, "epoch": 3926} {"train_loss": -6.893421649932861, "global_step": 164926, "epoch": 3926} {"train_loss": -7.057626724243164, "global_step": 164927, "epoch": 3926} {"train_loss": -6.944019317626953, "global_step": 164928, "epoch": 3926} {"train_loss": -6.87117338180542, "global_step": 164929, "epoch": 3926} {"train_loss": -7.01405143737793, "global_step": 164930, "epoch": 3926} {"train_loss": -6.966794013977051, "global_step": 164931, "epoch": 3926} {"train_loss": -7.087038516998291, "global_step": 164932, "epoch": 3926} {"train_loss": -7.00127895673116, "global_step": 164933, "epoch": 3926, "val_loss": 68801.578125} {"train_loss": -7.068404197692871, "global_step": 164934, "epoch": 3927} {"train_loss": -7.064745903015137, "global_step": 164935, "epoch": 3927} {"train_loss": -7.098062515258789, "global_step": 164936, "epoch": 3927} {"train_loss": -6.8929443359375, "global_step": 164937, "epoch": 3927} {"train_loss": -7.030735015869141, "global_step": 164938, "epoch": 3927} {"train_loss": -6.916279315948486, "global_step": 164939, "epoch": 3927} {"train_loss": -6.914168834686279, "global_step": 164940, "epoch": 3927} {"train_loss": -6.8697733879089355, "global_step": 164941, "epoch": 3927} {"train_loss": -7.0601606369018555, "global_step": 164942, "epoch": 3927} {"train_loss": -7.016210556030273, "global_step": 164943, "epoch": 3927} {"train_loss": -7.045816421508789, "global_step": 164944, "epoch": 3927} {"train_loss": -6.8929338455200195, "global_step": 164945, "epoch": 3927} {"train_loss": -7.0139970779418945, "global_step": 164946, "epoch": 3927} {"train_loss": -7.030521392822266, "global_step": 164947, "epoch": 3927} {"train_loss": -6.958347797393799, "global_step": 164948, "epoch": 3927} {"train_loss": -6.97586727142334, "global_step": 164949, "epoch": 3927} {"train_loss": -7.093745231628418, "global_step": 164950, "epoch": 3927} {"train_loss": -6.911519527435303, "global_step": 164951, "epoch": 3927} {"train_loss": -6.867109298706055, "global_step": 164952, "epoch": 3927} {"train_loss": -7.053279399871826, "global_step": 164953, "epoch": 3927} {"train_loss": -6.968642234802246, "global_step": 164954, "epoch": 3927} {"train_loss": -6.989480972290039, "global_step": 164955, "epoch": 3927} {"train_loss": -6.975707054138184, "global_step": 164956, "epoch": 3927} {"train_loss": -7.038309097290039, "global_step": 164957, "epoch": 3927} {"train_loss": -6.992490768432617, "global_step": 164958, "epoch": 3927} {"train_loss": -7.046971321105957, "global_step": 164959, "epoch": 3927} {"train_loss": -7.0433349609375, "global_step": 164960, "epoch": 3927} {"train_loss": -7.061097621917725, "global_step": 164961, "epoch": 3927} {"train_loss": -7.095062732696533, "global_step": 164962, "epoch": 3927} {"train_loss": -7.002959728240967, "global_step": 164963, "epoch": 3927} {"train_loss": -7.02971887588501, "global_step": 164964, "epoch": 3927} {"train_loss": -7.009442329406738, "global_step": 164965, "epoch": 3927} {"train_loss": -6.97502326965332, "global_step": 164966, "epoch": 3927} {"train_loss": -7.084639549255371, "global_step": 164967, "epoch": 3927} {"train_loss": -7.054840087890625, "global_step": 164968, "epoch": 3927} {"train_loss": -6.9481940269470215, "global_step": 164969, "epoch": 3927} {"train_loss": -7.013364791870117, "global_step": 164970, "epoch": 3927} {"train_loss": -6.987083435058594, "global_step": 164971, "epoch": 3927} {"train_loss": -6.9844160079956055, "global_step": 164972, "epoch": 3927} {"train_loss": -6.931377410888672, "global_step": 164973, "epoch": 3927} {"train_loss": -6.993268013000488, "global_step": 164974, "epoch": 3927} {"train_loss": -7.001011803036644, "global_step": 164975, "epoch": 3927, "val_loss": 68687.75} {"train_loss": -7.001564025878906, "global_step": 164976, "epoch": 3928} {"train_loss": -6.960935592651367, "global_step": 164977, "epoch": 3928} {"train_loss": -6.921664714813232, "global_step": 164978, "epoch": 3928} {"train_loss": -7.002100944519043, "global_step": 164979, "epoch": 3928} {"train_loss": -6.958481788635254, "global_step": 164980, "epoch": 3928} {"train_loss": -6.907550811767578, "global_step": 164981, "epoch": 3928} {"train_loss": -7.102980613708496, "global_step": 164982, "epoch": 3928} {"train_loss": -6.792135238647461, "global_step": 164983, "epoch": 3928} {"train_loss": -6.734316825866699, "global_step": 164984, "epoch": 3928} {"train_loss": -7.070137023925781, "global_step": 164985, "epoch": 3928} {"train_loss": -7.025270938873291, "global_step": 164986, "epoch": 3928} {"train_loss": -7.020017623901367, "global_step": 164987, "epoch": 3928} {"train_loss": -7.05229377746582, "global_step": 164988, "epoch": 3928} {"train_loss": -6.997354507446289, "global_step": 164989, "epoch": 3928} {"train_loss": -7.059737205505371, "global_step": 164990, "epoch": 3928} {"train_loss": -6.9503374099731445, "global_step": 164991, "epoch": 3928} {"train_loss": -6.982161521911621, "global_step": 164992, "epoch": 3928} {"train_loss": -7.034590721130371, "global_step": 164993, "epoch": 3928} {"train_loss": -7.030684471130371, "global_step": 164994, "epoch": 3928} {"train_loss": -6.946626663208008, "global_step": 164995, "epoch": 3928} {"train_loss": -6.976943016052246, "global_step": 164996, "epoch": 3928} {"train_loss": -7.094518184661865, "global_step": 164997, "epoch": 3928} {"train_loss": -6.986019611358643, "global_step": 164998, "epoch": 3928} {"train_loss": -6.978550910949707, "global_step": 164999, "epoch": 3928} {"train_loss": -7.003406524658203, "global_step": 165000, "epoch": 3928} {"train_loss": -6.990887641906738, "global_step": 165001, "epoch": 3928} {"train_loss": -6.968971252441406, "global_step": 165002, "epoch": 3928} {"train_loss": -6.943253993988037, "global_step": 165003, "epoch": 3928} {"train_loss": -6.958836555480957, "global_step": 165004, "epoch": 3928} {"train_loss": -6.868294715881348, "global_step": 165005, "epoch": 3928} {"train_loss": -7.010957717895508, "global_step": 165006, "epoch": 3928} {"train_loss": -6.994095802307129, "global_step": 165007, "epoch": 3928} {"train_loss": -7.053048610687256, "global_step": 165008, "epoch": 3928} {"train_loss": -6.955423355102539, "global_step": 165009, "epoch": 3928} {"train_loss": -7.017218589782715, "global_step": 165010, "epoch": 3928} {"train_loss": -6.928623676300049, "global_step": 165011, "epoch": 3928} {"train_loss": -6.876389980316162, "global_step": 165012, "epoch": 3928} {"train_loss": -7.012214660644531, "global_step": 165013, "epoch": 3928} {"train_loss": -7.061707973480225, "global_step": 165014, "epoch": 3928} {"train_loss": -6.999927520751953, "global_step": 165015, "epoch": 3928} {"train_loss": -7.020245552062988, "global_step": 165016, "epoch": 3928} {"train_loss": -6.9790621030898325, "global_step": 165017, "epoch": 3928, "val_loss": 68978.7578125} {"train_loss": -6.892155647277832, "global_step": 165018, "epoch": 3929} {"train_loss": -6.872098445892334, "global_step": 165019, "epoch": 3929} {"train_loss": -7.054311752319336, "global_step": 165020, "epoch": 3929} {"train_loss": -6.899822235107422, "global_step": 165021, "epoch": 3929} {"train_loss": -6.882936954498291, "global_step": 165022, "epoch": 3929} {"train_loss": -7.017236709594727, "global_step": 165023, "epoch": 3929} {"train_loss": -6.7604570388793945, "global_step": 165024, "epoch": 3929} {"train_loss": -6.808115005493164, "global_step": 165025, "epoch": 3929} {"train_loss": -7.026587963104248, "global_step": 165026, "epoch": 3929} {"train_loss": -6.863445281982422, "global_step": 165027, "epoch": 3929} {"train_loss": -6.931317329406738, "global_step": 165028, "epoch": 3929} {"train_loss": -6.933993339538574, "global_step": 165029, "epoch": 3929} {"train_loss": -6.979361057281494, "global_step": 165030, "epoch": 3929} {"train_loss": -6.979125022888184, "global_step": 165031, "epoch": 3929} {"train_loss": -6.898978233337402, "global_step": 165032, "epoch": 3929} {"train_loss": -7.018331527709961, "global_step": 165033, "epoch": 3929} {"train_loss": -6.940896987915039, "global_step": 165034, "epoch": 3929} {"train_loss": -6.9860358238220215, "global_step": 165035, "epoch": 3929} {"train_loss": -6.884320259094238, "global_step": 165036, "epoch": 3929} {"train_loss": -6.992337703704834, "global_step": 165037, "epoch": 3929} {"train_loss": -6.980769157409668, "global_step": 165038, "epoch": 3929} {"train_loss": -6.922128677368164, "global_step": 165039, "epoch": 3929} {"train_loss": -6.843322277069092, "global_step": 165040, "epoch": 3929} {"train_loss": -7.097477436065674, "global_step": 165041, "epoch": 3929} {"train_loss": -6.937138557434082, "global_step": 165042, "epoch": 3929} {"train_loss": -6.984151840209961, "global_step": 165043, "epoch": 3929} {"train_loss": -6.8880791664123535, "global_step": 165044, "epoch": 3929} {"train_loss": -6.960476398468018, "global_step": 165045, "epoch": 3929} {"train_loss": -7.0274658203125, "global_step": 165046, "epoch": 3929} {"train_loss": -6.8770270347595215, "global_step": 165047, "epoch": 3929} {"train_loss": -6.960723876953125, "global_step": 165048, "epoch": 3929} {"train_loss": -6.798794746398926, "global_step": 165049, "epoch": 3929} {"train_loss": -6.943107604980469, "global_step": 165050, "epoch": 3929} {"train_loss": -6.9446306228637695, "global_step": 165051, "epoch": 3929} {"train_loss": -6.947289943695068, "global_step": 165052, "epoch": 3929} {"train_loss": -6.984988212585449, "global_step": 165053, "epoch": 3929} {"train_loss": -6.9812517166137695, "global_step": 165054, "epoch": 3929} {"train_loss": -6.9891557693481445, "global_step": 165055, "epoch": 3929} {"train_loss": -6.992188453674316, "global_step": 165056, "epoch": 3929} {"train_loss": -6.916048049926758, "global_step": 165057, "epoch": 3929} {"train_loss": -6.982877731323242, "global_step": 165058, "epoch": 3929} {"train_loss": -6.944361561820621, "global_step": 165059, "epoch": 3929, "val_loss": 68886.2734375} {"train_loss": -6.953095436096191, "global_step": 165060, "epoch": 3930} {"train_loss": -6.953191757202148, "global_step": 165061, "epoch": 3930} {"train_loss": -6.923120975494385, "global_step": 165062, "epoch": 3930} {"train_loss": -7.093132972717285, "global_step": 165063, "epoch": 3930} {"train_loss": -6.9876708984375, "global_step": 165064, "epoch": 3930} {"train_loss": -6.969963073730469, "global_step": 165065, "epoch": 3930} {"train_loss": -6.989543914794922, "global_step": 165066, "epoch": 3930} {"train_loss": -6.860149383544922, "global_step": 165067, "epoch": 3930} {"train_loss": -7.056576728820801, "global_step": 165068, "epoch": 3930} {"train_loss": -6.935676097869873, "global_step": 165069, "epoch": 3930} {"train_loss": -6.844298362731934, "global_step": 165070, "epoch": 3930} {"train_loss": -6.9735565185546875, "global_step": 165071, "epoch": 3930} {"train_loss": -6.989850997924805, "global_step": 165072, "epoch": 3930} {"train_loss": -6.970249652862549, "global_step": 165073, "epoch": 3930} {"train_loss": -7.014172554016113, "global_step": 165074, "epoch": 3930} {"train_loss": -6.974164962768555, "global_step": 165075, "epoch": 3930} {"train_loss": -6.993065357208252, "global_step": 165076, "epoch": 3930} {"train_loss": -6.865720748901367, "global_step": 165077, "epoch": 3930} {"train_loss": -6.959280014038086, "global_step": 165078, "epoch": 3930} {"train_loss": -6.888617515563965, "global_step": 165079, "epoch": 3930} {"train_loss": -7.033764839172363, "global_step": 165080, "epoch": 3930} {"train_loss": -6.959475517272949, "global_step": 165081, "epoch": 3930} {"train_loss": -6.852080821990967, "global_step": 165082, "epoch": 3930} {"train_loss": -6.855218887329102, "global_step": 165083, "epoch": 3930} {"train_loss": -6.7623748779296875, "global_step": 165084, "epoch": 3930} {"train_loss": -7.014713287353516, "global_step": 165085, "epoch": 3930} {"train_loss": -6.97999906539917, "global_step": 165086, "epoch": 3930} {"train_loss": -6.964959144592285, "global_step": 165087, "epoch": 3930} {"train_loss": -6.96444034576416, "global_step": 165088, "epoch": 3930} {"train_loss": -6.965567111968994, "global_step": 165089, "epoch": 3930} {"train_loss": -7.042417526245117, "global_step": 165090, "epoch": 3930} {"train_loss": -7.06850004196167, "global_step": 165091, "epoch": 3930} {"train_loss": -7.006577491760254, "global_step": 165092, "epoch": 3930} {"train_loss": -6.969306945800781, "global_step": 165093, "epoch": 3930} {"train_loss": -6.940250396728516, "global_step": 165094, "epoch": 3930} {"train_loss": -6.86264705657959, "global_step": 165095, "epoch": 3930} {"train_loss": -6.987483978271484, "global_step": 165096, "epoch": 3930} {"train_loss": -6.881695747375488, "global_step": 165097, "epoch": 3930} {"train_loss": -6.940182685852051, "global_step": 165098, "epoch": 3930} {"train_loss": -6.891597270965576, "global_step": 165099, "epoch": 3930} {"train_loss": -7.016594886779785, "global_step": 165100, "epoch": 3930} {"train_loss": -6.954614003499349, "global_step": 165101, "epoch": 3930, "val_loss": 69001.671875} {"train_loss": -6.896514415740967, "global_step": 165102, "epoch": 3931} {"train_loss": -6.978066444396973, "global_step": 165103, "epoch": 3931} {"train_loss": -6.987085342407227, "global_step": 165104, "epoch": 3931} {"train_loss": -6.9459547996521, "global_step": 165105, "epoch": 3931} {"train_loss": -6.895890235900879, "global_step": 165106, "epoch": 3931} {"train_loss": -7.0446248054504395, "global_step": 165107, "epoch": 3931} {"train_loss": -6.947262763977051, "global_step": 165108, "epoch": 3931} {"train_loss": -6.946104526519775, "global_step": 165109, "epoch": 3931} {"train_loss": -7.009156227111816, "global_step": 165110, "epoch": 3931} {"train_loss": -6.991094589233398, "global_step": 165111, "epoch": 3931} {"train_loss": -6.949298858642578, "global_step": 165112, "epoch": 3931} {"train_loss": -6.988925457000732, "global_step": 165113, "epoch": 3931} {"train_loss": -6.999703884124756, "global_step": 165114, "epoch": 3931} {"train_loss": -7.087194919586182, "global_step": 165115, "epoch": 3931} {"train_loss": -7.039191246032715, "global_step": 165116, "epoch": 3931} {"train_loss": -6.99919319152832, "global_step": 165117, "epoch": 3931} {"train_loss": -7.054219722747803, "global_step": 165118, "epoch": 3931} {"train_loss": -7.015430450439453, "global_step": 165119, "epoch": 3931} {"train_loss": -7.064462661743164, "global_step": 165120, "epoch": 3931} {"train_loss": -7.032749176025391, "global_step": 165121, "epoch": 3931} {"train_loss": -7.016593933105469, "global_step": 165122, "epoch": 3931} {"train_loss": -7.001765727996826, "global_step": 165123, "epoch": 3931} {"train_loss": -7.006577968597412, "global_step": 165124, "epoch": 3931} {"train_loss": -7.010764122009277, "global_step": 165125, "epoch": 3931} {"train_loss": -7.012627601623535, "global_step": 165126, "epoch": 3931} {"train_loss": -7.083493232727051, "global_step": 165127, "epoch": 3931} {"train_loss": -6.911241054534912, "global_step": 165128, "epoch": 3931} {"train_loss": -6.95866060256958, "global_step": 165129, "epoch": 3931} {"train_loss": -7.006247520446777, "global_step": 165130, "epoch": 3931} {"train_loss": -6.951043605804443, "global_step": 165131, "epoch": 3931} {"train_loss": -7.107966899871826, "global_step": 165132, "epoch": 3931} {"train_loss": -7.03194522857666, "global_step": 165133, "epoch": 3931} {"train_loss": -7.090328693389893, "global_step": 165134, "epoch": 3931} {"train_loss": -7.057122707366943, "global_step": 165135, "epoch": 3931} {"train_loss": -7.019405364990234, "global_step": 165136, "epoch": 3931} {"train_loss": -6.9562788009643555, "global_step": 165137, "epoch": 3931} {"train_loss": -7.107264041900635, "global_step": 165138, "epoch": 3931} {"train_loss": -7.0539093017578125, "global_step": 165139, "epoch": 3931} {"train_loss": -7.093148708343506, "global_step": 165140, "epoch": 3931} {"train_loss": -7.1453704833984375, "global_step": 165141, "epoch": 3931} {"train_loss": -7.053921222686768, "global_step": 165142, "epoch": 3931} {"train_loss": -7.012836626597813, "global_step": 165143, "epoch": 3931, "val_loss": 68695.9140625} {"train_loss": -7.001996040344238, "global_step": 165144, "epoch": 3932} {"train_loss": -6.992142677307129, "global_step": 165145, "epoch": 3932} {"train_loss": -7.031101226806641, "global_step": 165146, "epoch": 3932} {"train_loss": -7.032186508178711, "global_step": 165147, "epoch": 3932} {"train_loss": -7.136458873748779, "global_step": 165148, "epoch": 3932} {"train_loss": -6.981759071350098, "global_step": 165149, "epoch": 3932} {"train_loss": -6.980489253997803, "global_step": 165150, "epoch": 3932} {"train_loss": -7.036487102508545, "global_step": 165151, "epoch": 3932} {"train_loss": -7.09063720703125, "global_step": 165152, "epoch": 3932} {"train_loss": -7.021849155426025, "global_step": 165153, "epoch": 3932} {"train_loss": -7.088662147521973, "global_step": 165154, "epoch": 3932} {"train_loss": -7.002782344818115, "global_step": 165155, "epoch": 3932} {"train_loss": -7.082914352416992, "global_step": 165156, "epoch": 3932} {"train_loss": -7.051149368286133, "global_step": 165157, "epoch": 3932} {"train_loss": -7.0077691078186035, "global_step": 165158, "epoch": 3932} {"train_loss": -6.9594902992248535, "global_step": 165159, "epoch": 3932} {"train_loss": -7.059910774230957, "global_step": 165160, "epoch": 3932} {"train_loss": -7.04502534866333, "global_step": 165161, "epoch": 3932} {"train_loss": -6.885553359985352, "global_step": 165162, "epoch": 3932} {"train_loss": -7.035301685333252, "global_step": 165163, "epoch": 3932} {"train_loss": -6.927506923675537, "global_step": 165164, "epoch": 3932} {"train_loss": -6.867109298706055, "global_step": 165165, "epoch": 3932} {"train_loss": -6.983457565307617, "global_step": 165166, "epoch": 3932} {"train_loss": -6.876590728759766, "global_step": 165167, "epoch": 3932} {"train_loss": -6.9758477210998535, "global_step": 165168, "epoch": 3932} {"train_loss": -7.050942897796631, "global_step": 165169, "epoch": 3932} {"train_loss": -6.961343765258789, "global_step": 165170, "epoch": 3932} {"train_loss": -6.971070289611816, "global_step": 165171, "epoch": 3932} {"train_loss": -6.858362197875977, "global_step": 165172, "epoch": 3932} {"train_loss": -6.8269147872924805, "global_step": 165173, "epoch": 3932} {"train_loss": -6.968266487121582, "global_step": 165174, "epoch": 3932} {"train_loss": -6.8560285568237305, "global_step": 165175, "epoch": 3932} {"train_loss": -6.843246936798096, "global_step": 165176, "epoch": 3932} {"train_loss": -6.834229469299316, "global_step": 165177, "epoch": 3932} {"train_loss": -6.794524669647217, "global_step": 165178, "epoch": 3932} {"train_loss": -6.905911922454834, "global_step": 165179, "epoch": 3932} {"train_loss": -6.800318241119385, "global_step": 165180, "epoch": 3932} {"train_loss": -6.8092193603515625, "global_step": 165181, "epoch": 3932} {"train_loss": -6.808553695678711, "global_step": 165182, "epoch": 3932} {"train_loss": -6.810186386108398, "global_step": 165183, "epoch": 3932} {"train_loss": -6.855040550231934, "global_step": 165184, "epoch": 3932} {"train_loss": -6.945969751902989, "global_step": 165185, "epoch": 3932, "val_loss": 68799.7109375} {"train_loss": -6.800985336303711, "global_step": 165186, "epoch": 3933} {"train_loss": -6.82113790512085, "global_step": 165187, "epoch": 3933} {"train_loss": -6.968008041381836, "global_step": 165188, "epoch": 3933} {"train_loss": -6.82984733581543, "global_step": 165189, "epoch": 3933} {"train_loss": -6.890454292297363, "global_step": 165190, "epoch": 3933} {"train_loss": -6.921597957611084, "global_step": 165191, "epoch": 3933} {"train_loss": -6.927200794219971, "global_step": 165192, "epoch": 3933} {"train_loss": -6.837932109832764, "global_step": 165193, "epoch": 3933} {"train_loss": -7.028909206390381, "global_step": 165194, "epoch": 3933} {"train_loss": -6.917668342590332, "global_step": 165195, "epoch": 3933} {"train_loss": -6.992805480957031, "global_step": 165196, "epoch": 3933} {"train_loss": -6.962000846862793, "global_step": 165197, "epoch": 3933} {"train_loss": -6.975742816925049, "global_step": 165198, "epoch": 3933} {"train_loss": -6.925172805786133, "global_step": 165199, "epoch": 3933} {"train_loss": -7.001704692840576, "global_step": 165200, "epoch": 3933} {"train_loss": -6.907710075378418, "global_step": 165201, "epoch": 3933} {"train_loss": -6.98793363571167, "global_step": 165202, "epoch": 3933} {"train_loss": -6.8817138671875, "global_step": 165203, "epoch": 3933} {"train_loss": -7.048218727111816, "global_step": 165204, "epoch": 3933} {"train_loss": -6.979387283325195, "global_step": 165205, "epoch": 3933} {"train_loss": -6.911914825439453, "global_step": 165206, "epoch": 3933} {"train_loss": -6.92955207824707, "global_step": 165207, "epoch": 3933} {"train_loss": -6.953614234924316, "global_step": 165208, "epoch": 3933} {"train_loss": -7.067605972290039, "global_step": 165209, "epoch": 3933} {"train_loss": -7.047023296356201, "global_step": 165210, "epoch": 3933} {"train_loss": -6.972442626953125, "global_step": 165211, "epoch": 3933} {"train_loss": -6.889925479888916, "global_step": 165212, "epoch": 3933} {"train_loss": -6.950649261474609, "global_step": 165213, "epoch": 3933} {"train_loss": -7.011674880981445, "global_step": 165214, "epoch": 3933} {"train_loss": -7.056162357330322, "global_step": 165215, "epoch": 3933} {"train_loss": -6.863234519958496, "global_step": 165216, "epoch": 3933} {"train_loss": -7.026165008544922, "global_step": 165217, "epoch": 3933} {"train_loss": -7.004951477050781, "global_step": 165218, "epoch": 3933} {"train_loss": -6.9932379722595215, "global_step": 165219, "epoch": 3933} {"train_loss": -7.033714294433594, "global_step": 165220, "epoch": 3933} {"train_loss": -7.0492706298828125, "global_step": 165221, "epoch": 3933} {"train_loss": -7.023459434509277, "global_step": 165222, "epoch": 3933} {"train_loss": -7.0100297927856445, "global_step": 165223, "epoch": 3933} {"train_loss": -7.018240928649902, "global_step": 165224, "epoch": 3933} {"train_loss": -7.079578399658203, "global_step": 165225, "epoch": 3933} {"train_loss": -6.980399131774902, "global_step": 165226, "epoch": 3933} {"train_loss": -6.966939971560524, "global_step": 165227, "epoch": 3933, "val_loss": 68715.4140625} {"train_loss": -7.124411582946777, "global_step": 165228, "epoch": 3934} {"train_loss": -6.988641738891602, "global_step": 165229, "epoch": 3934} {"train_loss": -6.977347373962402, "global_step": 165230, "epoch": 3934} {"train_loss": -7.000251293182373, "global_step": 165231, "epoch": 3934} {"train_loss": -7.077340602874756, "global_step": 165232, "epoch": 3934} {"train_loss": -7.185759544372559, "global_step": 165233, "epoch": 3934} {"train_loss": -7.051379203796387, "global_step": 165234, "epoch": 3934} {"train_loss": -7.064332008361816, "global_step": 165235, "epoch": 3934} {"train_loss": -7.057153701782227, "global_step": 165236, "epoch": 3934} {"train_loss": -6.981305122375488, "global_step": 165237, "epoch": 3934} {"train_loss": -6.9757490158081055, "global_step": 165238, "epoch": 3934} {"train_loss": -7.054417133331299, "global_step": 165239, "epoch": 3934} {"train_loss": -7.042568683624268, "global_step": 165240, "epoch": 3934} {"train_loss": -6.969996452331543, "global_step": 165241, "epoch": 3934} {"train_loss": -7.073487758636475, "global_step": 165242, "epoch": 3934} {"train_loss": -6.9195966720581055, "global_step": 165243, "epoch": 3934} {"train_loss": -7.055208683013916, "global_step": 165244, "epoch": 3934} {"train_loss": -7.07830810546875, "global_step": 165245, "epoch": 3934} {"train_loss": -7.004005432128906, "global_step": 165246, "epoch": 3934} {"train_loss": -7.025722026824951, "global_step": 165247, "epoch": 3934} {"train_loss": -7.042876243591309, "global_step": 165248, "epoch": 3934} {"train_loss": -7.176137924194336, "global_step": 165249, "epoch": 3934} {"train_loss": -7.153043746948242, "global_step": 165250, "epoch": 3934} {"train_loss": -7.094446182250977, "global_step": 165251, "epoch": 3934} {"train_loss": -7.015995979309082, "global_step": 165252, "epoch": 3934} {"train_loss": -7.050119400024414, "global_step": 165253, "epoch": 3934} {"train_loss": -7.162859916687012, "global_step": 165254, "epoch": 3934} {"train_loss": -7.03132438659668, "global_step": 165255, "epoch": 3934} {"train_loss": -7.081263542175293, "global_step": 165256, "epoch": 3934} {"train_loss": -7.097567081451416, "global_step": 165257, "epoch": 3934} {"train_loss": -7.013457775115967, "global_step": 165258, "epoch": 3934} {"train_loss": -6.9726643562316895, "global_step": 165259, "epoch": 3934} {"train_loss": -6.961573600769043, "global_step": 165260, "epoch": 3934} {"train_loss": -6.8300018310546875, "global_step": 165261, "epoch": 3934} {"train_loss": -6.925209999084473, "global_step": 165262, "epoch": 3934} {"train_loss": -6.8323774337768555, "global_step": 165263, "epoch": 3934} {"train_loss": -6.869345188140869, "global_step": 165264, "epoch": 3934} {"train_loss": -6.9688520431518555, "global_step": 165265, "epoch": 3934} {"train_loss": -6.83879280090332, "global_step": 165266, "epoch": 3934} {"train_loss": -6.910083770751953, "global_step": 165267, "epoch": 3934} {"train_loss": -6.953027725219727, "global_step": 165268, "epoch": 3934} {"train_loss": -7.016393604732695, "global_step": 165269, "epoch": 3934, "val_loss": 68863.125} {"train_loss": -7.040398120880127, "global_step": 165270, "epoch": 3935} {"train_loss": -6.920967102050781, "global_step": 165271, "epoch": 3935} {"train_loss": -6.974123001098633, "global_step": 165272, "epoch": 3935} {"train_loss": -6.900218963623047, "global_step": 165273, "epoch": 3935} {"train_loss": -6.899369239807129, "global_step": 165274, "epoch": 3935} {"train_loss": -7.018411636352539, "global_step": 165275, "epoch": 3935} {"train_loss": -6.930200576782227, "global_step": 165276, "epoch": 3935} {"train_loss": -6.966744422912598, "global_step": 165277, "epoch": 3935} {"train_loss": -7.014530181884766, "global_step": 165278, "epoch": 3935} {"train_loss": -6.959917068481445, "global_step": 165279, "epoch": 3935} {"train_loss": -7.062448501586914, "global_step": 165280, "epoch": 3935} {"train_loss": -7.001570701599121, "global_step": 165281, "epoch": 3935} {"train_loss": -6.998467445373535, "global_step": 165282, "epoch": 3935} {"train_loss": -7.079676628112793, "global_step": 165283, "epoch": 3935} {"train_loss": -7.039374828338623, "global_step": 165284, "epoch": 3935} {"train_loss": -7.040352821350098, "global_step": 165285, "epoch": 3935} {"train_loss": -7.000012397766113, "global_step": 165286, "epoch": 3935} {"train_loss": -7.035585403442383, "global_step": 165287, "epoch": 3935} {"train_loss": -6.8860979080200195, "global_step": 165288, "epoch": 3935} {"train_loss": -7.0293684005737305, "global_step": 165289, "epoch": 3935} {"train_loss": -7.099055290222168, "global_step": 165290, "epoch": 3935} {"train_loss": -6.975269794464111, "global_step": 165291, "epoch": 3935} {"train_loss": -7.13362979888916, "global_step": 165292, "epoch": 3935} {"train_loss": -7.064986705780029, "global_step": 165293, "epoch": 3935} {"train_loss": -7.105307579040527, "global_step": 165294, "epoch": 3935} {"train_loss": -6.996228218078613, "global_step": 165295, "epoch": 3935} {"train_loss": -6.942814826965332, "global_step": 165296, "epoch": 3935} {"train_loss": -7.031191825866699, "global_step": 165297, "epoch": 3935} {"train_loss": -7.06558895111084, "global_step": 165298, "epoch": 3935} {"train_loss": -6.891360282897949, "global_step": 165299, "epoch": 3935} {"train_loss": -6.966180801391602, "global_step": 165300, "epoch": 3935} {"train_loss": -7.027546405792236, "global_step": 165301, "epoch": 3935} {"train_loss": -6.996630668640137, "global_step": 165302, "epoch": 3935} {"train_loss": -7.178518295288086, "global_step": 165303, "epoch": 3935} {"train_loss": -6.902949810028076, "global_step": 165304, "epoch": 3935} {"train_loss": -7.047557830810547, "global_step": 165305, "epoch": 3935} {"train_loss": -7.072112560272217, "global_step": 165306, "epoch": 3935} {"train_loss": -7.012347221374512, "global_step": 165307, "epoch": 3935} {"train_loss": -6.990787982940674, "global_step": 165308, "epoch": 3935} {"train_loss": -7.0206522941589355, "global_step": 165309, "epoch": 3935} {"train_loss": -7.171215057373047, "global_step": 165310, "epoch": 3935} {"train_loss": -7.009994450069609, "global_step": 165311, "epoch": 3935, "val_loss": 68824.109375} {"train_loss": -7.008485317230225, "global_step": 165312, "epoch": 3936} {"train_loss": -6.9614105224609375, "global_step": 165313, "epoch": 3936} {"train_loss": -6.979000091552734, "global_step": 165314, "epoch": 3936} {"train_loss": -7.0704522132873535, "global_step": 165315, "epoch": 3936} {"train_loss": -7.015399932861328, "global_step": 165316, "epoch": 3936} {"train_loss": -7.080144882202148, "global_step": 165317, "epoch": 3936} {"train_loss": -7.053961753845215, "global_step": 165318, "epoch": 3936} {"train_loss": -7.0061163902282715, "global_step": 165319, "epoch": 3936} {"train_loss": -6.857999801635742, "global_step": 165320, "epoch": 3936} {"train_loss": -6.94134521484375, "global_step": 165321, "epoch": 3936} {"train_loss": -7.001038074493408, "global_step": 165322, "epoch": 3936} {"train_loss": -6.935545444488525, "global_step": 165323, "epoch": 3936} {"train_loss": -7.088888168334961, "global_step": 165324, "epoch": 3936} {"train_loss": -7.038560390472412, "global_step": 165325, "epoch": 3936} {"train_loss": -7.019462585449219, "global_step": 165326, "epoch": 3936} {"train_loss": -6.89209508895874, "global_step": 165327, "epoch": 3936} {"train_loss": -7.040163516998291, "global_step": 165328, "epoch": 3936} {"train_loss": -6.957499980926514, "global_step": 165329, "epoch": 3936} {"train_loss": -7.120329856872559, "global_step": 165330, "epoch": 3936} {"train_loss": -7.084756851196289, "global_step": 165331, "epoch": 3936} {"train_loss": -7.021890640258789, "global_step": 165332, "epoch": 3936} {"train_loss": -7.177580833435059, "global_step": 165333, "epoch": 3936} {"train_loss": -7.061379432678223, "global_step": 165334, "epoch": 3936} {"train_loss": -7.00216007232666, "global_step": 165335, "epoch": 3936} {"train_loss": -7.0404052734375, "global_step": 165336, "epoch": 3936} {"train_loss": -7.111802577972412, "global_step": 165337, "epoch": 3936} {"train_loss": -7.076006889343262, "global_step": 165338, "epoch": 3936} {"train_loss": -7.013016700744629, "global_step": 165339, "epoch": 3936} {"train_loss": -6.986875534057617, "global_step": 165340, "epoch": 3936} {"train_loss": -7.050466060638428, "global_step": 165341, "epoch": 3936} {"train_loss": -7.145413398742676, "global_step": 165342, "epoch": 3936} {"train_loss": -7.007068634033203, "global_step": 165343, "epoch": 3936} {"train_loss": -7.043670654296875, "global_step": 165344, "epoch": 3936} {"train_loss": -7.135819435119629, "global_step": 165345, "epoch": 3936} {"train_loss": -7.006583213806152, "global_step": 165346, "epoch": 3936} {"train_loss": -6.865757465362549, "global_step": 165347, "epoch": 3936} {"train_loss": -7.014089584350586, "global_step": 165348, "epoch": 3936} {"train_loss": -6.966205596923828, "global_step": 165349, "epoch": 3936} {"train_loss": -6.995025634765625, "global_step": 165350, "epoch": 3936} {"train_loss": -7.009805679321289, "global_step": 165351, "epoch": 3936} {"train_loss": -6.95635461807251, "global_step": 165352, "epoch": 3936} {"train_loss": -7.0186284610203336, "global_step": 165353, "epoch": 3936, "val_loss": 68815.796875} {"train_loss": -6.84609317779541, "global_step": 165354, "epoch": 3937} {"train_loss": -6.908368110656738, "global_step": 165355, "epoch": 3937} {"train_loss": -6.953324794769287, "global_step": 165356, "epoch": 3937} {"train_loss": -6.720470905303955, "global_step": 165357, "epoch": 3937} {"train_loss": -6.871264457702637, "global_step": 165358, "epoch": 3937} {"train_loss": -6.882318019866943, "global_step": 165359, "epoch": 3937} {"train_loss": -6.761008262634277, "global_step": 165360, "epoch": 3937} {"train_loss": -7.019644737243652, "global_step": 165361, "epoch": 3937} {"train_loss": -6.810384273529053, "global_step": 165362, "epoch": 3937} {"train_loss": -6.83785343170166, "global_step": 165363, "epoch": 3937} {"train_loss": -6.994409084320068, "global_step": 165364, "epoch": 3937} {"train_loss": -6.7629804611206055, "global_step": 165365, "epoch": 3937} {"train_loss": -6.924239158630371, "global_step": 165366, "epoch": 3937} {"train_loss": -6.79920768737793, "global_step": 165367, "epoch": 3937} {"train_loss": -6.958864212036133, "global_step": 165368, "epoch": 3937} {"train_loss": -6.9822773933410645, "global_step": 165369, "epoch": 3937} {"train_loss": -6.940790176391602, "global_step": 165370, "epoch": 3937} {"train_loss": -6.964899063110352, "global_step": 165371, "epoch": 3937} {"train_loss": -6.904014587402344, "global_step": 165372, "epoch": 3937} {"train_loss": -6.87191104888916, "global_step": 165373, "epoch": 3937} {"train_loss": -6.873038291931152, "global_step": 165374, "epoch": 3937} {"train_loss": -6.98274040222168, "global_step": 165375, "epoch": 3937} {"train_loss": -6.819025039672852, "global_step": 165376, "epoch": 3937} {"train_loss": -6.937674522399902, "global_step": 165377, "epoch": 3937} {"train_loss": -6.960512161254883, "global_step": 165378, "epoch": 3937} {"train_loss": -6.770986557006836, "global_step": 165379, "epoch": 3937} {"train_loss": -6.963845252990723, "global_step": 165380, "epoch": 3937} {"train_loss": -6.929144382476807, "global_step": 165381, "epoch": 3937} {"train_loss": -6.976046562194824, "global_step": 165382, "epoch": 3937} {"train_loss": -6.981451034545898, "global_step": 165383, "epoch": 3937} {"train_loss": -6.877656936645508, "global_step": 165384, "epoch": 3937} {"train_loss": -6.878596305847168, "global_step": 165385, "epoch": 3937} {"train_loss": -6.969439506530762, "global_step": 165386, "epoch": 3937} {"train_loss": -6.957550048828125, "global_step": 165387, "epoch": 3937} {"train_loss": -6.898070812225342, "global_step": 165388, "epoch": 3937} {"train_loss": -6.915112495422363, "global_step": 165389, "epoch": 3937} {"train_loss": -6.966330528259277, "global_step": 165390, "epoch": 3937} {"train_loss": -6.894454479217529, "global_step": 165391, "epoch": 3937} {"train_loss": -7.04293155670166, "global_step": 165392, "epoch": 3937} {"train_loss": -7.010051250457764, "global_step": 165393, "epoch": 3937} {"train_loss": -6.812035083770752, "global_step": 165394, "epoch": 3937} {"train_loss": -6.908839997791109, "global_step": 165395, "epoch": 3937, "val_loss": 68855.2265625} {"train_loss": -6.909277439117432, "global_step": 165396, "epoch": 3938} {"train_loss": -7.0322957038879395, "global_step": 165397, "epoch": 3938} {"train_loss": -6.979159832000732, "global_step": 165398, "epoch": 3938} {"train_loss": -7.035431385040283, "global_step": 165399, "epoch": 3938} {"train_loss": -6.925455093383789, "global_step": 165400, "epoch": 3938} {"train_loss": -6.915545463562012, "global_step": 165401, "epoch": 3938} {"train_loss": -6.927474021911621, "global_step": 165402, "epoch": 3938} {"train_loss": -6.94721794128418, "global_step": 165403, "epoch": 3938} {"train_loss": -6.953150749206543, "global_step": 165404, "epoch": 3938} {"train_loss": -6.940720558166504, "global_step": 165405, "epoch": 3938} {"train_loss": -7.017487525939941, "global_step": 165406, "epoch": 3938} {"train_loss": -6.949123859405518, "global_step": 165407, "epoch": 3938} {"train_loss": -6.986504077911377, "global_step": 165408, "epoch": 3938} {"train_loss": -6.9156904220581055, "global_step": 165409, "epoch": 3938} {"train_loss": -6.986786365509033, "global_step": 165410, "epoch": 3938} {"train_loss": -6.789429664611816, "global_step": 165411, "epoch": 3938} {"train_loss": -6.940311908721924, "global_step": 165412, "epoch": 3938} {"train_loss": -6.770498752593994, "global_step": 165413, "epoch": 3938} {"train_loss": -7.029662609100342, "global_step": 165414, "epoch": 3938} {"train_loss": -6.866551876068115, "global_step": 165415, "epoch": 3938} {"train_loss": -6.740837097167969, "global_step": 165416, "epoch": 3938} {"train_loss": -6.983540058135986, "global_step": 165417, "epoch": 3938} {"train_loss": -6.770481109619141, "global_step": 165418, "epoch": 3938} {"train_loss": -6.947404861450195, "global_step": 165419, "epoch": 3938} {"train_loss": -6.915323734283447, "global_step": 165420, "epoch": 3938} {"train_loss": -6.858896255493164, "global_step": 165421, "epoch": 3938} {"train_loss": -6.897067070007324, "global_step": 165422, "epoch": 3938} {"train_loss": -7.022612571716309, "global_step": 165423, "epoch": 3938} {"train_loss": -6.864656925201416, "global_step": 165424, "epoch": 3938} {"train_loss": -7.015419960021973, "global_step": 165425, "epoch": 3938} {"train_loss": -7.052757263183594, "global_step": 165426, "epoch": 3938} {"train_loss": -6.897668838500977, "global_step": 165427, "epoch": 3938} {"train_loss": -6.902460098266602, "global_step": 165428, "epoch": 3938} {"train_loss": -7.008065700531006, "global_step": 165429, "epoch": 3938} {"train_loss": -6.995924949645996, "global_step": 165430, "epoch": 3938} {"train_loss": -6.955418109893799, "global_step": 165431, "epoch": 3938} {"train_loss": -6.938351154327393, "global_step": 165432, "epoch": 3938} {"train_loss": -6.958200454711914, "global_step": 165433, "epoch": 3938} {"train_loss": -7.016059875488281, "global_step": 165434, "epoch": 3938} {"train_loss": -6.988973617553711, "global_step": 165435, "epoch": 3938} {"train_loss": -7.016386985778809, "global_step": 165436, "epoch": 3938} {"train_loss": -6.941308407556443, "global_step": 165437, "epoch": 3938, "val_loss": 68792.328125} {"train_loss": -6.961235046386719, "global_step": 165438, "epoch": 3939} {"train_loss": -7.071925163269043, "global_step": 165439, "epoch": 3939} {"train_loss": -7.064791679382324, "global_step": 165440, "epoch": 3939} {"train_loss": -6.935945510864258, "global_step": 165441, "epoch": 3939} {"train_loss": -7.067999839782715, "global_step": 165442, "epoch": 3939} {"train_loss": -7.032605171203613, "global_step": 165443, "epoch": 3939} {"train_loss": -6.9731597900390625, "global_step": 165444, "epoch": 3939} {"train_loss": -6.991972923278809, "global_step": 165445, "epoch": 3939} {"train_loss": -6.950082778930664, "global_step": 165446, "epoch": 3939} {"train_loss": -6.90488338470459, "global_step": 165447, "epoch": 3939} {"train_loss": -6.905420780181885, "global_step": 165448, "epoch": 3939} {"train_loss": -6.889586925506592, "global_step": 165449, "epoch": 3939} {"train_loss": -6.8394880294799805, "global_step": 165450, "epoch": 3939} {"train_loss": -6.951789855957031, "global_step": 165451, "epoch": 3939} {"train_loss": -6.843107223510742, "global_step": 165452, "epoch": 3939} {"train_loss": -6.943968296051025, "global_step": 165453, "epoch": 3939} {"train_loss": -6.702908039093018, "global_step": 165454, "epoch": 3939} {"train_loss": -6.83161735534668, "global_step": 165455, "epoch": 3939} {"train_loss": -6.916598796844482, "global_step": 165456, "epoch": 3939} {"train_loss": -6.719918727874756, "global_step": 165457, "epoch": 3939} {"train_loss": -6.866393089294434, "global_step": 165458, "epoch": 3939} {"train_loss": -6.950339317321777, "global_step": 165459, "epoch": 3939} {"train_loss": -6.936535358428955, "global_step": 165460, "epoch": 3939} {"train_loss": -6.842013359069824, "global_step": 165461, "epoch": 3939} {"train_loss": -6.913124084472656, "global_step": 165462, "epoch": 3939} {"train_loss": -6.947720527648926, "global_step": 165463, "epoch": 3939} {"train_loss": -6.888219833374023, "global_step": 165464, "epoch": 3939} {"train_loss": -7.047568321228027, "global_step": 165465, "epoch": 3939} {"train_loss": -6.8534650802612305, "global_step": 165466, "epoch": 3939} {"train_loss": -6.992559432983398, "global_step": 165467, "epoch": 3939} {"train_loss": -6.980804443359375, "global_step": 165468, "epoch": 3939} {"train_loss": -6.917137145996094, "global_step": 165469, "epoch": 3939} {"train_loss": -6.84910774230957, "global_step": 165470, "epoch": 3939} {"train_loss": -6.847929000854492, "global_step": 165471, "epoch": 3939} {"train_loss": -6.917239189147949, "global_step": 165472, "epoch": 3939} {"train_loss": -6.952061653137207, "global_step": 165473, "epoch": 3939} {"train_loss": -6.90721321105957, "global_step": 165474, "epoch": 3939} {"train_loss": -7.089532852172852, "global_step": 165475, "epoch": 3939} {"train_loss": -7.0010175704956055, "global_step": 165476, "epoch": 3939} {"train_loss": -7.010896682739258, "global_step": 165477, "epoch": 3939} {"train_loss": -6.967267036437988, "global_step": 165478, "epoch": 3939} {"train_loss": -6.933259612038022, "global_step": 165479, "epoch": 3939, "val_loss": 68867.0234375} {"train_loss": -7.017195701599121, "global_step": 165480, "epoch": 3940} {"train_loss": -7.057818412780762, "global_step": 165481, "epoch": 3940} {"train_loss": -6.966297626495361, "global_step": 165482, "epoch": 3940} {"train_loss": -6.9410905838012695, "global_step": 165483, "epoch": 3940} {"train_loss": -6.8706159591674805, "global_step": 165484, "epoch": 3940} {"train_loss": -7.011746883392334, "global_step": 165485, "epoch": 3940} {"train_loss": -6.844667434692383, "global_step": 165486, "epoch": 3940} {"train_loss": -6.956412315368652, "global_step": 165487, "epoch": 3940} {"train_loss": -6.975546836853027, "global_step": 165488, "epoch": 3940} {"train_loss": -6.9181227684021, "global_step": 165489, "epoch": 3940} {"train_loss": -6.8815813064575195, "global_step": 165490, "epoch": 3940} {"train_loss": -6.9866509437561035, "global_step": 165491, "epoch": 3940} {"train_loss": -6.9381513595581055, "global_step": 165492, "epoch": 3940} {"train_loss": -6.886429786682129, "global_step": 165493, "epoch": 3940} {"train_loss": -6.946951866149902, "global_step": 165494, "epoch": 3940} {"train_loss": -6.988779067993164, "global_step": 165495, "epoch": 3940} {"train_loss": -6.9372758865356445, "global_step": 165496, "epoch": 3940} {"train_loss": -6.946925640106201, "global_step": 165497, "epoch": 3940} {"train_loss": -7.026662826538086, "global_step": 165498, "epoch": 3940} {"train_loss": -7.039464473724365, "global_step": 165499, "epoch": 3940} {"train_loss": -7.022207260131836, "global_step": 165500, "epoch": 3940} {"train_loss": -7.006039619445801, "global_step": 165501, "epoch": 3940} {"train_loss": -6.991252899169922, "global_step": 165502, "epoch": 3940} {"train_loss": -6.96537971496582, "global_step": 165503, "epoch": 3940} {"train_loss": -6.986623764038086, "global_step": 165504, "epoch": 3940} {"train_loss": -7.0122880935668945, "global_step": 165505, "epoch": 3940} {"train_loss": -7.021608352661133, "global_step": 165506, "epoch": 3940} {"train_loss": -6.963301181793213, "global_step": 165507, "epoch": 3940} {"train_loss": -7.05251407623291, "global_step": 165508, "epoch": 3940} {"train_loss": -6.945307731628418, "global_step": 165509, "epoch": 3940} {"train_loss": -6.969311714172363, "global_step": 165510, "epoch": 3940} {"train_loss": -6.9833831787109375, "global_step": 165511, "epoch": 3940} {"train_loss": -6.979872703552246, "global_step": 165512, "epoch": 3940} {"train_loss": -6.902936935424805, "global_step": 165513, "epoch": 3940} {"train_loss": -7.013971328735352, "global_step": 165514, "epoch": 3940} {"train_loss": -7.03900146484375, "global_step": 165515, "epoch": 3940} {"train_loss": -6.887548446655273, "global_step": 165516, "epoch": 3940} {"train_loss": -7.052111625671387, "global_step": 165517, "epoch": 3940} {"train_loss": -6.874332427978516, "global_step": 165518, "epoch": 3940} {"train_loss": -6.910159111022949, "global_step": 165519, "epoch": 3940} {"train_loss": -6.968213081359863, "global_step": 165520, "epoch": 3940} {"train_loss": -6.968695742743356, "global_step": 165521, "epoch": 3940, "val_loss": 68923.234375} {"train_loss": -6.942082405090332, "global_step": 165522, "epoch": 3941} {"train_loss": -6.9404754638671875, "global_step": 165523, "epoch": 3941} {"train_loss": -6.922852516174316, "global_step": 165524, "epoch": 3941} {"train_loss": -6.953322887420654, "global_step": 165525, "epoch": 3941} {"train_loss": -7.014218330383301, "global_step": 165526, "epoch": 3941} {"train_loss": -6.890861988067627, "global_step": 165527, "epoch": 3941} {"train_loss": -6.978409767150879, "global_step": 165528, "epoch": 3941} {"train_loss": -7.008245468139648, "global_step": 165529, "epoch": 3941} {"train_loss": -7.008182525634766, "global_step": 165530, "epoch": 3941} {"train_loss": -6.933198928833008, "global_step": 165531, "epoch": 3941} {"train_loss": -7.0726637840271, "global_step": 165532, "epoch": 3941} {"train_loss": -7.142459869384766, "global_step": 165533, "epoch": 3941} {"train_loss": -7.105401039123535, "global_step": 165534, "epoch": 3941} {"train_loss": -7.1172871589660645, "global_step": 165535, "epoch": 3941} {"train_loss": -7.092164039611816, "global_step": 165536, "epoch": 3941} {"train_loss": -6.986687660217285, "global_step": 165537, "epoch": 3941} {"train_loss": -7.046202659606934, "global_step": 165538, "epoch": 3941} {"train_loss": -6.970528602600098, "global_step": 165539, "epoch": 3941} {"train_loss": -6.985007286071777, "global_step": 165540, "epoch": 3941} {"train_loss": -6.993198871612549, "global_step": 165541, "epoch": 3941} {"train_loss": -7.088696479797363, "global_step": 165542, "epoch": 3941} {"train_loss": -7.058234214782715, "global_step": 165543, "epoch": 3941} {"train_loss": -6.989232063293457, "global_step": 165544, "epoch": 3941} {"train_loss": -6.945129871368408, "global_step": 165545, "epoch": 3941} {"train_loss": -7.142738342285156, "global_step": 165546, "epoch": 3941} {"train_loss": -7.023902893066406, "global_step": 165547, "epoch": 3941} {"train_loss": -6.990354537963867, "global_step": 165548, "epoch": 3941} {"train_loss": -7.016685962677002, "global_step": 165549, "epoch": 3941} {"train_loss": -7.036840915679932, "global_step": 165550, "epoch": 3941} {"train_loss": -7.093486785888672, "global_step": 165551, "epoch": 3941} {"train_loss": -6.9738006591796875, "global_step": 165552, "epoch": 3941} {"train_loss": -7.092923164367676, "global_step": 165553, "epoch": 3941} {"train_loss": -7.028381824493408, "global_step": 165554, "epoch": 3941} {"train_loss": -7.0512847900390625, "global_step": 165555, "epoch": 3941} {"train_loss": -7.10873556137085, "global_step": 165556, "epoch": 3941} {"train_loss": -6.9405364990234375, "global_step": 165557, "epoch": 3941} {"train_loss": -7.034885406494141, "global_step": 165558, "epoch": 3941} {"train_loss": -7.011300086975098, "global_step": 165559, "epoch": 3941} {"train_loss": -7.001348495483398, "global_step": 165560, "epoch": 3941} {"train_loss": -6.900507926940918, "global_step": 165561, "epoch": 3941} {"train_loss": -6.941124439239502, "global_step": 165562, "epoch": 3941} {"train_loss": -7.012145519256592, "global_step": 165563, "epoch": 3941, "val_loss": 68751.390625} {"train_loss": -6.940879821777344, "global_step": 165564, "epoch": 3942} {"train_loss": -7.0601911544799805, "global_step": 165565, "epoch": 3942} {"train_loss": -6.718775749206543, "global_step": 165566, "epoch": 3942} {"train_loss": -6.961287498474121, "global_step": 165567, "epoch": 3942} {"train_loss": -7.038127899169922, "global_step": 165568, "epoch": 3942} {"train_loss": -7.022299766540527, "global_step": 165569, "epoch": 3942} {"train_loss": -7.1214704513549805, "global_step": 165570, "epoch": 3942} {"train_loss": -7.127284049987793, "global_step": 165571, "epoch": 3942} {"train_loss": -6.89866828918457, "global_step": 165572, "epoch": 3942} {"train_loss": -6.943389892578125, "global_step": 165573, "epoch": 3942} {"train_loss": -7.0458831787109375, "global_step": 165574, "epoch": 3942} {"train_loss": -7.050580024719238, "global_step": 165575, "epoch": 3942} {"train_loss": -6.979413032531738, "global_step": 165576, "epoch": 3942} {"train_loss": -7.082775592803955, "global_step": 165577, "epoch": 3942} {"train_loss": -6.966854572296143, "global_step": 165578, "epoch": 3942} {"train_loss": -6.919744968414307, "global_step": 165579, "epoch": 3942} {"train_loss": -6.919496536254883, "global_step": 165580, "epoch": 3942} {"train_loss": -6.879810333251953, "global_step": 165581, "epoch": 3942} {"train_loss": -6.907778263092041, "global_step": 165582, "epoch": 3942} {"train_loss": -6.906209945678711, "global_step": 165583, "epoch": 3942} {"train_loss": -6.855050086975098, "global_step": 165584, "epoch": 3942} {"train_loss": -7.041775226593018, "global_step": 165585, "epoch": 3942} {"train_loss": -6.9256134033203125, "global_step": 165586, "epoch": 3942} {"train_loss": -6.826506614685059, "global_step": 165587, "epoch": 3942} {"train_loss": -7.005576133728027, "global_step": 165588, "epoch": 3942} {"train_loss": -6.820943832397461, "global_step": 165589, "epoch": 3942} {"train_loss": -6.980018615722656, "global_step": 165590, "epoch": 3942} {"train_loss": -6.984653949737549, "global_step": 165591, "epoch": 3942} {"train_loss": -6.90848970413208, "global_step": 165592, "epoch": 3942} {"train_loss": -7.034572601318359, "global_step": 165593, "epoch": 3942} {"train_loss": -6.778045177459717, "global_step": 165594, "epoch": 3942} {"train_loss": -6.849623203277588, "global_step": 165595, "epoch": 3942} {"train_loss": -6.9445037841796875, "global_step": 165596, "epoch": 3942} {"train_loss": -6.912014007568359, "global_step": 165597, "epoch": 3942} {"train_loss": -6.918449401855469, "global_step": 165598, "epoch": 3942} {"train_loss": -6.844191551208496, "global_step": 165599, "epoch": 3942} {"train_loss": -6.965301990509033, "global_step": 165600, "epoch": 3942} {"train_loss": -6.933365821838379, "global_step": 165601, "epoch": 3942} {"train_loss": -7.112701892852783, "global_step": 165602, "epoch": 3942} {"train_loss": -7.032057762145996, "global_step": 165603, "epoch": 3942} {"train_loss": -6.839200019836426, "global_step": 165604, "epoch": 3942} {"train_loss": -6.951505286352975, "global_step": 165605, "epoch": 3942, "val_loss": 68791.3046875} {"train_loss": -6.936891555786133, "global_step": 165606, "epoch": 3943} {"train_loss": -7.067654609680176, "global_step": 165607, "epoch": 3943} {"train_loss": -7.022082805633545, "global_step": 165608, "epoch": 3943} {"train_loss": -7.0778303146362305, "global_step": 165609, "epoch": 3943} {"train_loss": -6.949924468994141, "global_step": 165610, "epoch": 3943} {"train_loss": -6.877806186676025, "global_step": 165611, "epoch": 3943} {"train_loss": -6.880280494689941, "global_step": 165612, "epoch": 3943} {"train_loss": -7.075684547424316, "global_step": 165613, "epoch": 3943} {"train_loss": -7.080667972564697, "global_step": 165614, "epoch": 3943} {"train_loss": -6.968595504760742, "global_step": 165615, "epoch": 3943} {"train_loss": -7.103213787078857, "global_step": 165616, "epoch": 3943} {"train_loss": -6.906766891479492, "global_step": 165617, "epoch": 3943} {"train_loss": -6.930905342102051, "global_step": 165618, "epoch": 3943} {"train_loss": -6.861614227294922, "global_step": 165619, "epoch": 3943} {"train_loss": -6.926462650299072, "global_step": 165620, "epoch": 3943} {"train_loss": -7.024154186248779, "global_step": 165621, "epoch": 3943} {"train_loss": -6.913591384887695, "global_step": 165622, "epoch": 3943} {"train_loss": -6.98975944519043, "global_step": 165623, "epoch": 3943} {"train_loss": -7.030703067779541, "global_step": 165624, "epoch": 3943} {"train_loss": -7.010628700256348, "global_step": 165625, "epoch": 3943} {"train_loss": -6.940572738647461, "global_step": 165626, "epoch": 3943} {"train_loss": -7.040565490722656, "global_step": 165627, "epoch": 3943} {"train_loss": -6.968847751617432, "global_step": 165628, "epoch": 3943} {"train_loss": -6.891320705413818, "global_step": 165629, "epoch": 3943} {"train_loss": -6.88596248626709, "global_step": 165630, "epoch": 3943} {"train_loss": -6.839170455932617, "global_step": 165631, "epoch": 3943} {"train_loss": -6.939670562744141, "global_step": 165632, "epoch": 3943} {"train_loss": -6.92037296295166, "global_step": 165633, "epoch": 3943} {"train_loss": -6.843339920043945, "global_step": 165634, "epoch": 3943} {"train_loss": -6.934420585632324, "global_step": 165635, "epoch": 3943} {"train_loss": -6.949636459350586, "global_step": 165636, "epoch": 3943} {"train_loss": -6.972872734069824, "global_step": 165637, "epoch": 3943} {"train_loss": -6.954136371612549, "global_step": 165638, "epoch": 3943} {"train_loss": -6.828631401062012, "global_step": 165639, "epoch": 3943} {"train_loss": -6.922970771789551, "global_step": 165640, "epoch": 3943} {"train_loss": -6.970983505249023, "global_step": 165641, "epoch": 3943} {"train_loss": -6.908133029937744, "global_step": 165642, "epoch": 3943} {"train_loss": -6.901777267456055, "global_step": 165643, "epoch": 3943} {"train_loss": -6.916563987731934, "global_step": 165644, "epoch": 3943} {"train_loss": -7.0209550857543945, "global_step": 165645, "epoch": 3943} {"train_loss": -6.828306198120117, "global_step": 165646, "epoch": 3943} {"train_loss": -6.948930524644398, "global_step": 165647, "epoch": 3943, "val_loss": 68722.3125} {"train_loss": -6.985922813415527, "global_step": 165648, "epoch": 3944} {"train_loss": -6.950425148010254, "global_step": 165649, "epoch": 3944} {"train_loss": -6.944530487060547, "global_step": 165650, "epoch": 3944} {"train_loss": -6.981212615966797, "global_step": 165651, "epoch": 3944} {"train_loss": -6.903865337371826, "global_step": 165652, "epoch": 3944} {"train_loss": -7.036902904510498, "global_step": 165653, "epoch": 3944} {"train_loss": -7.01318883895874, "global_step": 165654, "epoch": 3944} {"train_loss": -7.109111785888672, "global_step": 165655, "epoch": 3944} {"train_loss": -7.002972602844238, "global_step": 165656, "epoch": 3944} {"train_loss": -7.022902488708496, "global_step": 165657, "epoch": 3944} {"train_loss": -7.024359226226807, "global_step": 165658, "epoch": 3944} {"train_loss": -7.002506732940674, "global_step": 165659, "epoch": 3944} {"train_loss": -7.013389587402344, "global_step": 165660, "epoch": 3944} {"train_loss": -7.0164794921875, "global_step": 165661, "epoch": 3944} {"train_loss": -7.106396198272705, "global_step": 165662, "epoch": 3944} {"train_loss": -7.0220746994018555, "global_step": 165663, "epoch": 3944} {"train_loss": -6.9874138832092285, "global_step": 165664, "epoch": 3944} {"train_loss": -6.977132797241211, "global_step": 165665, "epoch": 3944} {"train_loss": -6.95441198348999, "global_step": 165666, "epoch": 3944} {"train_loss": -6.964883327484131, "global_step": 165667, "epoch": 3944} {"train_loss": -7.0884552001953125, "global_step": 165668, "epoch": 3944} {"train_loss": -7.124939918518066, "global_step": 165669, "epoch": 3944} {"train_loss": -7.041342258453369, "global_step": 165670, "epoch": 3944} {"train_loss": -7.107717037200928, "global_step": 165671, "epoch": 3944} {"train_loss": -6.969333648681641, "global_step": 165672, "epoch": 3944} {"train_loss": -6.993143558502197, "global_step": 165673, "epoch": 3944} {"train_loss": -7.077219009399414, "global_step": 165674, "epoch": 3944} {"train_loss": -7.03961181640625, "global_step": 165675, "epoch": 3944} {"train_loss": -7.013678550720215, "global_step": 165676, "epoch": 3944} {"train_loss": -7.023391246795654, "global_step": 165677, "epoch": 3944} {"train_loss": -7.101681709289551, "global_step": 165678, "epoch": 3944} {"train_loss": -7.101350784301758, "global_step": 165679, "epoch": 3944} {"train_loss": -6.969317436218262, "global_step": 165680, "epoch": 3944} {"train_loss": -7.043859481811523, "global_step": 165681, "epoch": 3944} {"train_loss": -7.015050888061523, "global_step": 165682, "epoch": 3944} {"train_loss": -7.087841033935547, "global_step": 165683, "epoch": 3944} {"train_loss": -7.068841457366943, "global_step": 165684, "epoch": 3944} {"train_loss": -7.062420845031738, "global_step": 165685, "epoch": 3944} {"train_loss": -7.055326461791992, "global_step": 165686, "epoch": 3944} {"train_loss": -6.991507530212402, "global_step": 165687, "epoch": 3944} {"train_loss": -6.884333610534668, "global_step": 165688, "epoch": 3944} {"train_loss": -7.018856241589501, "global_step": 165689, "epoch": 3944, "val_loss": 68727.8203125} {"train_loss": -6.883242607116699, "global_step": 165690, "epoch": 3945} {"train_loss": -6.926044464111328, "global_step": 165691, "epoch": 3945} {"train_loss": -7.027554512023926, "global_step": 165692, "epoch": 3945} {"train_loss": -6.925015449523926, "global_step": 165693, "epoch": 3945} {"train_loss": -6.9005937576293945, "global_step": 165694, "epoch": 3945} {"train_loss": -6.952209949493408, "global_step": 165695, "epoch": 3945} {"train_loss": -6.933721542358398, "global_step": 165696, "epoch": 3945} {"train_loss": -6.886509895324707, "global_step": 165697, "epoch": 3945} {"train_loss": -6.963670253753662, "global_step": 165698, "epoch": 3945} {"train_loss": -7.100500106811523, "global_step": 165699, "epoch": 3945} {"train_loss": -6.963716506958008, "global_step": 165700, "epoch": 3945} {"train_loss": -6.959284782409668, "global_step": 165701, "epoch": 3945} {"train_loss": -6.98015832901001, "global_step": 165702, "epoch": 3945} {"train_loss": -6.903774261474609, "global_step": 165703, "epoch": 3945} {"train_loss": -6.898123264312744, "global_step": 165704, "epoch": 3945} {"train_loss": -6.913607120513916, "global_step": 165705, "epoch": 3945} {"train_loss": -7.090779781341553, "global_step": 165706, "epoch": 3945} {"train_loss": -6.943236351013184, "global_step": 165707, "epoch": 3945} {"train_loss": -6.912740707397461, "global_step": 165708, "epoch": 3945} {"train_loss": -6.945581436157227, "global_step": 165709, "epoch": 3945} {"train_loss": -6.867517471313477, "global_step": 165710, "epoch": 3945} {"train_loss": -7.062539577484131, "global_step": 165711, "epoch": 3945} {"train_loss": -7.017822265625, "global_step": 165712, "epoch": 3945} {"train_loss": -6.889296531677246, "global_step": 165713, "epoch": 3945} {"train_loss": -6.991471767425537, "global_step": 165714, "epoch": 3945} {"train_loss": -6.985528469085693, "global_step": 165715, "epoch": 3945} {"train_loss": -6.902336120605469, "global_step": 165716, "epoch": 3945} {"train_loss": -6.941392421722412, "global_step": 165717, "epoch": 3945} {"train_loss": -7.085858345031738, "global_step": 165718, "epoch": 3945} {"train_loss": -6.888751029968262, "global_step": 165719, "epoch": 3945} {"train_loss": -6.957896709442139, "global_step": 165720, "epoch": 3945} {"train_loss": -7.107382774353027, "global_step": 165721, "epoch": 3945} {"train_loss": -6.999523162841797, "global_step": 165722, "epoch": 3945} {"train_loss": -7.070250511169434, "global_step": 165723, "epoch": 3945} {"train_loss": -6.994985580444336, "global_step": 165724, "epoch": 3945} {"train_loss": -7.091139316558838, "global_step": 165725, "epoch": 3945} {"train_loss": -7.095653533935547, "global_step": 165726, "epoch": 3945} {"train_loss": -7.054253578186035, "global_step": 165727, "epoch": 3945} {"train_loss": -7.040052890777588, "global_step": 165728, "epoch": 3945} {"train_loss": -7.024879455566406, "global_step": 165729, "epoch": 3945} {"train_loss": -7.1425323486328125, "global_step": 165730, "epoch": 3945} {"train_loss": -6.982066177186512, "global_step": 165731, "epoch": 3945, "val_loss": 68901.1328125} {"train_loss": -7.086010456085205, "global_step": 165732, "epoch": 3946} {"train_loss": -7.035826683044434, "global_step": 165733, "epoch": 3946} {"train_loss": -6.963386535644531, "global_step": 165734, "epoch": 3946} {"train_loss": -7.061251640319824, "global_step": 165735, "epoch": 3946} {"train_loss": -7.094934463500977, "global_step": 165736, "epoch": 3946} {"train_loss": -6.942227840423584, "global_step": 165737, "epoch": 3946} {"train_loss": -6.954845905303955, "global_step": 165738, "epoch": 3946} {"train_loss": -7.009088516235352, "global_step": 165739, "epoch": 3946} {"train_loss": -6.951225280761719, "global_step": 165740, "epoch": 3946} {"train_loss": -7.044271469116211, "global_step": 165741, "epoch": 3946} {"train_loss": -7.020654678344727, "global_step": 165742, "epoch": 3946} {"train_loss": -7.073148727416992, "global_step": 165743, "epoch": 3946} {"train_loss": -7.143245697021484, "global_step": 165744, "epoch": 3946} {"train_loss": -6.917014122009277, "global_step": 165745, "epoch": 3946} {"train_loss": -6.89368200302124, "global_step": 165746, "epoch": 3946} {"train_loss": -7.060687065124512, "global_step": 165747, "epoch": 3946} {"train_loss": -7.068877696990967, "global_step": 165748, "epoch": 3946} {"train_loss": -7.077237129211426, "global_step": 165749, "epoch": 3946} {"train_loss": -7.083447456359863, "global_step": 165750, "epoch": 3946} {"train_loss": -7.0448808670043945, "global_step": 165751, "epoch": 3946} {"train_loss": -7.1073222160339355, "global_step": 165752, "epoch": 3946} {"train_loss": -7.0396857261657715, "global_step": 165753, "epoch": 3946} {"train_loss": -6.975668907165527, "global_step": 165754, "epoch": 3946} {"train_loss": -7.055692195892334, "global_step": 165755, "epoch": 3946} {"train_loss": -7.054785251617432, "global_step": 165756, "epoch": 3946} {"train_loss": -7.017484188079834, "global_step": 165757, "epoch": 3946} {"train_loss": -7.02289342880249, "global_step": 165758, "epoch": 3946} {"train_loss": -6.959463119506836, "global_step": 165759, "epoch": 3946} {"train_loss": -6.993632793426514, "global_step": 165760, "epoch": 3946} {"train_loss": -7.011211395263672, "global_step": 165761, "epoch": 3946} {"train_loss": -7.060140609741211, "global_step": 165762, "epoch": 3946} {"train_loss": -6.993310451507568, "global_step": 165763, "epoch": 3946} {"train_loss": -6.9850287437438965, "global_step": 165764, "epoch": 3946} {"train_loss": -6.960364818572998, "global_step": 165765, "epoch": 3946} {"train_loss": -6.993664741516113, "global_step": 165766, "epoch": 3946} {"train_loss": -6.998835563659668, "global_step": 165767, "epoch": 3946} {"train_loss": -7.104866027832031, "global_step": 165768, "epoch": 3946} {"train_loss": -7.082610607147217, "global_step": 165769, "epoch": 3946} {"train_loss": -7.030435562133789, "global_step": 165770, "epoch": 3946} {"train_loss": -7.0477375984191895, "global_step": 165771, "epoch": 3946} {"train_loss": -7.115321636199951, "global_step": 165772, "epoch": 3946} {"train_loss": -7.024704217910767, "global_step": 165773, "epoch": 3946, "val_loss": 68707.6171875} {"train_loss": -7.1742777824401855, "global_step": 165774, "epoch": 3947} {"train_loss": -6.90593147277832, "global_step": 165775, "epoch": 3947} {"train_loss": -6.845406532287598, "global_step": 165776, "epoch": 3947} {"train_loss": -6.962094306945801, "global_step": 165777, "epoch": 3947} {"train_loss": -6.807472229003906, "global_step": 165778, "epoch": 3947} {"train_loss": -7.001154899597168, "global_step": 165779, "epoch": 3947} {"train_loss": -6.8783416748046875, "global_step": 165780, "epoch": 3947} {"train_loss": -6.89729642868042, "global_step": 165781, "epoch": 3947} {"train_loss": -6.943819999694824, "global_step": 165782, "epoch": 3947} {"train_loss": -6.79617977142334, "global_step": 165783, "epoch": 3947} {"train_loss": -6.919395923614502, "global_step": 165784, "epoch": 3947} {"train_loss": -6.944660186767578, "global_step": 165785, "epoch": 3947} {"train_loss": -6.877383232116699, "global_step": 165786, "epoch": 3947} {"train_loss": -6.949993133544922, "global_step": 165787, "epoch": 3947} {"train_loss": -6.883281707763672, "global_step": 165788, "epoch": 3947} {"train_loss": -6.912727355957031, "global_step": 165789, "epoch": 3947} {"train_loss": -7.000725269317627, "global_step": 165790, "epoch": 3947} {"train_loss": -6.804564476013184, "global_step": 165791, "epoch": 3947} {"train_loss": -7.030799865722656, "global_step": 165792, "epoch": 3947} {"train_loss": -6.8521857261657715, "global_step": 165793, "epoch": 3947} {"train_loss": -6.884706497192383, "global_step": 165794, "epoch": 3947} {"train_loss": -6.966883659362793, "global_step": 165795, "epoch": 3947} {"train_loss": -6.908243179321289, "global_step": 165796, "epoch": 3947} {"train_loss": -6.9995622634887695, "global_step": 165797, "epoch": 3947} {"train_loss": -6.976800918579102, "global_step": 165798, "epoch": 3947} {"train_loss": -6.974564552307129, "global_step": 165799, "epoch": 3947} {"train_loss": -6.8413896560668945, "global_step": 165800, "epoch": 3947} {"train_loss": -6.953948020935059, "global_step": 165801, "epoch": 3947} {"train_loss": -6.879578590393066, "global_step": 165802, "epoch": 3947} {"train_loss": -6.996621131896973, "global_step": 165803, "epoch": 3947} {"train_loss": -6.956051349639893, "global_step": 165804, "epoch": 3947} {"train_loss": -6.91240119934082, "global_step": 165805, "epoch": 3947} {"train_loss": -6.9425883293151855, "global_step": 165806, "epoch": 3947} {"train_loss": -6.929149627685547, "global_step": 165807, "epoch": 3947} {"train_loss": -6.935192108154297, "global_step": 165808, "epoch": 3947} {"train_loss": -6.9528679847717285, "global_step": 165809, "epoch": 3947} {"train_loss": -7.016143798828125, "global_step": 165810, "epoch": 3947} {"train_loss": -6.9996538162231445, "global_step": 165811, "epoch": 3947} {"train_loss": -7.098657131195068, "global_step": 165812, "epoch": 3947} {"train_loss": -6.931136131286621, "global_step": 165813, "epoch": 3947} {"train_loss": -7.085896968841553, "global_step": 165814, "epoch": 3947} {"train_loss": -6.940047264099121, "global_step": 165815, "epoch": 3947, "val_loss": 68804.5859375} {"train_loss": -7.084949970245361, "global_step": 165816, "epoch": 3948} {"train_loss": -6.952648162841797, "global_step": 165817, "epoch": 3948} {"train_loss": -7.10248327255249, "global_step": 165818, "epoch": 3948} {"train_loss": -7.0055155754089355, "global_step": 165819, "epoch": 3948} {"train_loss": -6.9520368576049805, "global_step": 165820, "epoch": 3948} {"train_loss": -6.957364082336426, "global_step": 165821, "epoch": 3948} {"train_loss": -6.977553367614746, "global_step": 165822, "epoch": 3948} {"train_loss": -7.009676456451416, "global_step": 165823, "epoch": 3948} {"train_loss": -6.960384368896484, "global_step": 165824, "epoch": 3948} {"train_loss": -6.898395538330078, "global_step": 165825, "epoch": 3948} {"train_loss": -7.0326738357543945, "global_step": 165826, "epoch": 3948} {"train_loss": -7.0490217208862305, "global_step": 165827, "epoch": 3948} {"train_loss": -7.028436183929443, "global_step": 165828, "epoch": 3948} {"train_loss": -7.078996658325195, "global_step": 165829, "epoch": 3948} {"train_loss": -7.081187725067139, "global_step": 165830, "epoch": 3948} {"train_loss": -7.046259880065918, "global_step": 165831, "epoch": 3948} {"train_loss": -6.893693447113037, "global_step": 165832, "epoch": 3948} {"train_loss": -7.105389595031738, "global_step": 165833, "epoch": 3948} {"train_loss": -6.978255271911621, "global_step": 165834, "epoch": 3948} {"train_loss": -7.081547737121582, "global_step": 165835, "epoch": 3948} {"train_loss": -6.928240776062012, "global_step": 165836, "epoch": 3948} {"train_loss": -6.9991455078125, "global_step": 165837, "epoch": 3948} {"train_loss": -7.042994499206543, "global_step": 165838, "epoch": 3948} {"train_loss": -6.949143409729004, "global_step": 165839, "epoch": 3948} {"train_loss": -6.992209434509277, "global_step": 165840, "epoch": 3948} {"train_loss": -6.81764030456543, "global_step": 165841, "epoch": 3948} {"train_loss": -7.013166427612305, "global_step": 165842, "epoch": 3948} {"train_loss": -6.8836469650268555, "global_step": 165843, "epoch": 3948} {"train_loss": -6.860666275024414, "global_step": 165844, "epoch": 3948} {"train_loss": -7.004897117614746, "global_step": 165845, "epoch": 3948} {"train_loss": -6.85606050491333, "global_step": 165846, "epoch": 3948} {"train_loss": -7.0439910888671875, "global_step": 165847, "epoch": 3948} {"train_loss": -7.01904296875, "global_step": 165848, "epoch": 3948} {"train_loss": -7.009487152099609, "global_step": 165849, "epoch": 3948} {"train_loss": -7.039740085601807, "global_step": 165850, "epoch": 3948} {"train_loss": -6.894283771514893, "global_step": 165851, "epoch": 3948} {"train_loss": -6.838592529296875, "global_step": 165852, "epoch": 3948} {"train_loss": -7.019684791564941, "global_step": 165853, "epoch": 3948} {"train_loss": -6.880033493041992, "global_step": 165854, "epoch": 3948} {"train_loss": -7.068488121032715, "global_step": 165855, "epoch": 3948} {"train_loss": -6.93283748626709, "global_step": 165856, "epoch": 3948} {"train_loss": -6.984500101634434, "global_step": 165857, "epoch": 3948, "val_loss": 68918.6015625} {"train_loss": -7.103649139404297, "global_step": 165858, "epoch": 3949} {"train_loss": -6.727779388427734, "global_step": 165859, "epoch": 3949} {"train_loss": -7.02001428604126, "global_step": 165860, "epoch": 3949} {"train_loss": -6.987598896026611, "global_step": 165861, "epoch": 3949} {"train_loss": -6.973669528961182, "global_step": 165862, "epoch": 3949} {"train_loss": -7.030930519104004, "global_step": 165863, "epoch": 3949} {"train_loss": -6.951653957366943, "global_step": 165864, "epoch": 3949} {"train_loss": -6.80924129486084, "global_step": 165865, "epoch": 3949} {"train_loss": -6.941682815551758, "global_step": 165866, "epoch": 3949} {"train_loss": -6.953671932220459, "global_step": 165867, "epoch": 3949} {"train_loss": -6.906010627746582, "global_step": 165868, "epoch": 3949} {"train_loss": -6.969162464141846, "global_step": 165869, "epoch": 3949} {"train_loss": -6.999029636383057, "global_step": 165870, "epoch": 3949} {"train_loss": -6.9354023933410645, "global_step": 165871, "epoch": 3949} {"train_loss": -6.994747638702393, "global_step": 165872, "epoch": 3949} {"train_loss": -7.082729816436768, "global_step": 165873, "epoch": 3949} {"train_loss": -7.055108070373535, "global_step": 165874, "epoch": 3949} {"train_loss": -7.0099406242370605, "global_step": 165875, "epoch": 3949} {"train_loss": -7.072441101074219, "global_step": 165876, "epoch": 3949} {"train_loss": -7.061270713806152, "global_step": 165877, "epoch": 3949} {"train_loss": -6.959592342376709, "global_step": 165878, "epoch": 3949} {"train_loss": -7.025860786437988, "global_step": 165879, "epoch": 3949} {"train_loss": -7.0027971267700195, "global_step": 165880, "epoch": 3949} {"train_loss": -7.062458038330078, "global_step": 165881, "epoch": 3949} {"train_loss": -7.008006572723389, "global_step": 165882, "epoch": 3949} {"train_loss": -6.991764545440674, "global_step": 165883, "epoch": 3949} {"train_loss": -6.894756317138672, "global_step": 165884, "epoch": 3949} {"train_loss": -6.970279216766357, "global_step": 165885, "epoch": 3949} {"train_loss": -6.963903427124023, "global_step": 165886, "epoch": 3949} {"train_loss": -6.912975311279297, "global_step": 165887, "epoch": 3949} {"train_loss": -6.98552131652832, "global_step": 165888, "epoch": 3949} {"train_loss": -6.86693000793457, "global_step": 165889, "epoch": 3949} {"train_loss": -7.047954082489014, "global_step": 165890, "epoch": 3949} {"train_loss": -7.027287006378174, "global_step": 165891, "epoch": 3949} {"train_loss": -6.912878513336182, "global_step": 165892, "epoch": 3949} {"train_loss": -6.960183143615723, "global_step": 165893, "epoch": 3949} {"train_loss": -6.9640421867370605, "global_step": 165894, "epoch": 3949} {"train_loss": -6.970654487609863, "global_step": 165895, "epoch": 3949} {"train_loss": -6.981954574584961, "global_step": 165896, "epoch": 3949} {"train_loss": -6.9182963371276855, "global_step": 165897, "epoch": 3949} {"train_loss": -6.9754252433776855, "global_step": 165898, "epoch": 3949} {"train_loss": -6.976028181257702, "global_step": 165899, "epoch": 3949, "val_loss": 69078.1953125} {"train_loss": -6.892238616943359, "global_step": 165900, "epoch": 3950} {"train_loss": -7.016332626342773, "global_step": 165901, "epoch": 3950} {"train_loss": -6.992979049682617, "global_step": 165902, "epoch": 3950} {"train_loss": -6.954120635986328, "global_step": 165903, "epoch": 3950} {"train_loss": -7.000983715057373, "global_step": 165904, "epoch": 3950} {"train_loss": -6.960362434387207, "global_step": 165905, "epoch": 3950} {"train_loss": -6.96573543548584, "global_step": 165906, "epoch": 3950} {"train_loss": -7.022581100463867, "global_step": 165907, "epoch": 3950} {"train_loss": -6.894637584686279, "global_step": 165908, "epoch": 3950} {"train_loss": -7.127533435821533, "global_step": 165909, "epoch": 3950} {"train_loss": -6.971789360046387, "global_step": 165910, "epoch": 3950} {"train_loss": -6.946260929107666, "global_step": 165911, "epoch": 3950} {"train_loss": -6.9698381423950195, "global_step": 165912, "epoch": 3950} {"train_loss": -6.895454406738281, "global_step": 165913, "epoch": 3950} {"train_loss": -6.989736080169678, "global_step": 165914, "epoch": 3950} {"train_loss": -6.972591400146484, "global_step": 165915, "epoch": 3950} {"train_loss": -7.035652160644531, "global_step": 165916, "epoch": 3950} {"train_loss": -7.069082260131836, "global_step": 165917, "epoch": 3950} {"train_loss": -7.058809280395508, "global_step": 165918, "epoch": 3950} {"train_loss": -6.92898416519165, "global_step": 165919, "epoch": 3950} {"train_loss": -6.8451056480407715, "global_step": 165920, "epoch": 3950} {"train_loss": -6.8798065185546875, "global_step": 165921, "epoch": 3950} {"train_loss": -6.947945594787598, "global_step": 165922, "epoch": 3950} {"train_loss": -6.939077377319336, "global_step": 165923, "epoch": 3950} {"train_loss": -6.981066703796387, "global_step": 165924, "epoch": 3950} {"train_loss": -7.018270969390869, "global_step": 165925, "epoch": 3950} {"train_loss": -7.011382102966309, "global_step": 165926, "epoch": 3950} {"train_loss": -6.938828468322754, "global_step": 165927, "epoch": 3950} {"train_loss": -6.934861183166504, "global_step": 165928, "epoch": 3950} {"train_loss": -6.879759311676025, "global_step": 165929, "epoch": 3950} {"train_loss": -6.929013252258301, "global_step": 165930, "epoch": 3950} {"train_loss": -7.003510475158691, "global_step": 165931, "epoch": 3950} {"train_loss": -7.025001525878906, "global_step": 165932, "epoch": 3950} {"train_loss": -6.895216464996338, "global_step": 165933, "epoch": 3950} {"train_loss": -6.94666051864624, "global_step": 165934, "epoch": 3950} {"train_loss": -7.028280735015869, "global_step": 165935, "epoch": 3950} {"train_loss": -6.905359745025635, "global_step": 165936, "epoch": 3950} {"train_loss": -6.913669586181641, "global_step": 165937, "epoch": 3950} {"train_loss": -7.024051666259766, "global_step": 165938, "epoch": 3950} {"train_loss": -6.892163276672363, "global_step": 165939, "epoch": 3950} {"train_loss": -6.992836952209473, "global_step": 165940, "epoch": 3950} {"train_loss": -6.967386370613461, "global_step": 165941, "epoch": 3950, "train/sim_max_reward_0": 0.9320732754341727, "train/sim_max_reward_1": 0.8910935761334448, "train/sim_max_reward_2": 0.5431031599790085, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.9197835704175003, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4300000": 0.01734050794164764, "test/sim_max_reward_4300001": 0.36585586639254897, "test/sim_max_reward_4300002": 0.8839140249662105, "test/sim_max_reward_4300003": 0.9627054712853484, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9781483217632986, "test/sim_max_reward_4300006": 0.8902709347731527, "test/sim_max_reward_4300007": 0.9266205358360741, "test/sim_max_reward_4300008": 1.0, "test/sim_max_reward_4300009": 0.9476416308982852, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.9721470044800089, "test/sim_max_reward_4300013": 0.9604212611106523, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.9391744055112851, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.4009727842255066, "test/sim_max_reward_4300019": 0.1859882165736861, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.3337993831447895, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.9506797470879426, "test/sim_max_reward_4300024": 0.6421974416267688, "test/sim_max_reward_4300025": 0.832436030489636, "test/sim_max_reward_4300026": 0.050878423390650566, "test/sim_max_reward_4300027": 0.8856567440553772, "test/sim_max_reward_4300028": 0.0014307349343027796, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.2748853352144964, "test/sim_max_reward_4300031": 0.22496733857474926, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.9651520946764776, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.8986291206558767, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.9254250283221427, "test/sim_max_reward_4300038": 0.9989963673530807, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.5621008146507397, "test/sim_max_reward_4300041": 0.8672204593096176, "test/sim_max_reward_4300042": 0.46577058346039124, "test/sim_max_reward_4300043": 0.14271749074417045, "test/sim_max_reward_4300044": 1.0, "test/sim_max_reward_4300045": 0.9767399681197836, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.12594344683075015, "test/sim_max_reward_4300048": 7.4404412196472e-05, "test/sim_max_reward_4300049": 0.18340136616983635, "train/mean_score": 0.8810089303273544, "test/mean_score": 0.6191066301870849, "val_loss": 68801.859375} {"train_loss": -6.974995136260986, "global_step": 165942, "epoch": 3951} {"train_loss": -7.018184661865234, "global_step": 165943, "epoch": 3951} {"train_loss": -7.019060134887695, "global_step": 165944, "epoch": 3951} {"train_loss": -7.022615432739258, "global_step": 165945, "epoch": 3951} {"train_loss": -6.878481864929199, "global_step": 165946, "epoch": 3951} {"train_loss": -7.173090934753418, "global_step": 165947, "epoch": 3951} {"train_loss": -7.007139682769775, "global_step": 165948, "epoch": 3951} {"train_loss": -7.002621650695801, "global_step": 165949, "epoch": 3951} {"train_loss": -7.068524360656738, "global_step": 165950, "epoch": 3951} {"train_loss": -7.140244483947754, "global_step": 165951, "epoch": 3951} {"train_loss": -7.13519287109375, "global_step": 165952, "epoch": 3951} {"train_loss": -6.995303630828857, "global_step": 165953, "epoch": 3951} {"train_loss": -7.072658061981201, "global_step": 165954, "epoch": 3951} {"train_loss": -7.020829677581787, "global_step": 165955, "epoch": 3951} {"train_loss": -7.046549320220947, "global_step": 165956, "epoch": 3951} {"train_loss": -7.0498576164245605, "global_step": 165957, "epoch": 3951} {"train_loss": -6.951030731201172, "global_step": 165958, "epoch": 3951} {"train_loss": -7.0246477127075195, "global_step": 165959, "epoch": 3951} {"train_loss": -7.084736347198486, "global_step": 165960, "epoch": 3951} {"train_loss": -7.1899003982543945, "global_step": 165961, "epoch": 3951} {"train_loss": -7.084604263305664, "global_step": 165962, "epoch": 3951} {"train_loss": -7.063197135925293, "global_step": 165963, "epoch": 3951} {"train_loss": -6.983154296875, "global_step": 165964, "epoch": 3951} {"train_loss": -6.919623374938965, "global_step": 165965, "epoch": 3951} {"train_loss": -7.077057361602783, "global_step": 165966, "epoch": 3951} {"train_loss": -6.876955986022949, "global_step": 165967, "epoch": 3951} {"train_loss": -7.107500076293945, "global_step": 165968, "epoch": 3951} {"train_loss": -7.040966987609863, "global_step": 165969, "epoch": 3951} {"train_loss": -6.970159530639648, "global_step": 165970, "epoch": 3951} {"train_loss": -7.063871383666992, "global_step": 165971, "epoch": 3951} {"train_loss": -6.932767868041992, "global_step": 165972, "epoch": 3951} {"train_loss": -7.008613586425781, "global_step": 165973, "epoch": 3951} {"train_loss": -6.915369510650635, "global_step": 165974, "epoch": 3951} {"train_loss": -6.990959167480469, "global_step": 165975, "epoch": 3951} {"train_loss": -6.988969326019287, "global_step": 165976, "epoch": 3951} {"train_loss": -6.92791223526001, "global_step": 165977, "epoch": 3951} {"train_loss": -6.901571273803711, "global_step": 165978, "epoch": 3951} {"train_loss": -6.946407318115234, "global_step": 165979, "epoch": 3951} {"train_loss": -7.023196697235107, "global_step": 165980, "epoch": 3951} {"train_loss": -6.917342185974121, "global_step": 165981, "epoch": 3951} {"train_loss": -7.074587821960449, "global_step": 165982, "epoch": 3951} {"train_loss": -7.015502520969936, "global_step": 165983, "epoch": 3951, "val_loss": 68872.2265625} {"train_loss": -6.964498519897461, "global_step": 165984, "epoch": 3952} {"train_loss": -6.914475917816162, "global_step": 165985, "epoch": 3952} {"train_loss": -6.853363990783691, "global_step": 165986, "epoch": 3952} {"train_loss": -6.943351745605469, "global_step": 165987, "epoch": 3952} {"train_loss": -6.863507270812988, "global_step": 165988, "epoch": 3952} {"train_loss": -6.95578670501709, "global_step": 165989, "epoch": 3952} {"train_loss": -6.973590850830078, "global_step": 165990, "epoch": 3952} {"train_loss": -6.899364471435547, "global_step": 165991, "epoch": 3952} {"train_loss": -7.07924747467041, "global_step": 165992, "epoch": 3952} {"train_loss": -6.887157440185547, "global_step": 165993, "epoch": 3952} {"train_loss": -7.025533199310303, "global_step": 165994, "epoch": 3952} {"train_loss": -6.946105480194092, "global_step": 165995, "epoch": 3952} {"train_loss": -6.985847473144531, "global_step": 165996, "epoch": 3952} {"train_loss": -6.942926406860352, "global_step": 165997, "epoch": 3952} {"train_loss": -6.923954963684082, "global_step": 165998, "epoch": 3952} {"train_loss": -6.899137496948242, "global_step": 165999, "epoch": 3952} {"train_loss": -6.853935241699219, "global_step": 166000, "epoch": 3952} {"train_loss": -7.05546760559082, "global_step": 166001, "epoch": 3952} {"train_loss": -6.985917091369629, "global_step": 166002, "epoch": 3952} {"train_loss": -7.001461029052734, "global_step": 166003, "epoch": 3952} {"train_loss": -6.938000202178955, "global_step": 166004, "epoch": 3952} {"train_loss": -7.01936149597168, "global_step": 166005, "epoch": 3952} {"train_loss": -7.067696571350098, "global_step": 166006, "epoch": 3952} {"train_loss": -6.942599296569824, "global_step": 166007, "epoch": 3952} {"train_loss": -6.947717666625977, "global_step": 166008, "epoch": 3952} {"train_loss": -7.002844333648682, "global_step": 166009, "epoch": 3952} {"train_loss": -7.0062360763549805, "global_step": 166010, "epoch": 3952} {"train_loss": -7.063467979431152, "global_step": 166011, "epoch": 3952} {"train_loss": -7.064866542816162, "global_step": 166012, "epoch": 3952} {"train_loss": -7.063861846923828, "global_step": 166013, "epoch": 3952} {"train_loss": -7.07652473449707, "global_step": 166014, "epoch": 3952} {"train_loss": -6.956866264343262, "global_step": 166015, "epoch": 3952} {"train_loss": -7.053014755249023, "global_step": 166016, "epoch": 3952} {"train_loss": -6.999176979064941, "global_step": 166017, "epoch": 3952} {"train_loss": -7.066466331481934, "global_step": 166018, "epoch": 3952} {"train_loss": -7.118985176086426, "global_step": 166019, "epoch": 3952} {"train_loss": -7.020805835723877, "global_step": 166020, "epoch": 3952} {"train_loss": -7.007067680358887, "global_step": 166021, "epoch": 3952} {"train_loss": -6.953718662261963, "global_step": 166022, "epoch": 3952} {"train_loss": -6.961990833282471, "global_step": 166023, "epoch": 3952} {"train_loss": -6.9578328132629395, "global_step": 166024, "epoch": 3952} {"train_loss": -6.982504765192668, "global_step": 166025, "epoch": 3952, "val_loss": 68728.4609375} {"train_loss": -6.900258541107178, "global_step": 166026, "epoch": 3953} {"train_loss": -6.910162448883057, "global_step": 166027, "epoch": 3953} {"train_loss": -6.944692134857178, "global_step": 166028, "epoch": 3953} {"train_loss": -6.962734222412109, "global_step": 166029, "epoch": 3953} {"train_loss": -7.094460964202881, "global_step": 166030, "epoch": 3953} {"train_loss": -6.818415641784668, "global_step": 166031, "epoch": 3953} {"train_loss": -6.917778491973877, "global_step": 166032, "epoch": 3953} {"train_loss": -6.912990570068359, "global_step": 166033, "epoch": 3953} {"train_loss": -6.860274314880371, "global_step": 166034, "epoch": 3953} {"train_loss": -7.009639739990234, "global_step": 166035, "epoch": 3953} {"train_loss": -6.810009479522705, "global_step": 166036, "epoch": 3953} {"train_loss": -6.9713640213012695, "global_step": 166037, "epoch": 3953} {"train_loss": -7.090004920959473, "global_step": 166038, "epoch": 3953} {"train_loss": -6.878625869750977, "global_step": 166039, "epoch": 3953} {"train_loss": -6.966635704040527, "global_step": 166040, "epoch": 3953} {"train_loss": -6.883129119873047, "global_step": 166041, "epoch": 3953} {"train_loss": -7.011958122253418, "global_step": 166042, "epoch": 3953} {"train_loss": -6.958248138427734, "global_step": 166043, "epoch": 3953} {"train_loss": -6.981649398803711, "global_step": 166044, "epoch": 3953} {"train_loss": -7.024024963378906, "global_step": 166045, "epoch": 3953} {"train_loss": -6.970949172973633, "global_step": 166046, "epoch": 3953} {"train_loss": -6.920614719390869, "global_step": 166047, "epoch": 3953} {"train_loss": -6.926385402679443, "global_step": 166048, "epoch": 3953} {"train_loss": -6.965039253234863, "global_step": 166049, "epoch": 3953} {"train_loss": -6.889464855194092, "global_step": 166050, "epoch": 3953} {"train_loss": -6.846468448638916, "global_step": 166051, "epoch": 3953} {"train_loss": -6.929643630981445, "global_step": 166052, "epoch": 3953} {"train_loss": -6.95336389541626, "global_step": 166053, "epoch": 3953} {"train_loss": -6.89936637878418, "global_step": 166054, "epoch": 3953} {"train_loss": -6.953728675842285, "global_step": 166055, "epoch": 3953} {"train_loss": -6.973963737487793, "global_step": 166056, "epoch": 3953} {"train_loss": -6.957491397857666, "global_step": 166057, "epoch": 3953} {"train_loss": -6.910125732421875, "global_step": 166058, "epoch": 3953} {"train_loss": -6.965177059173584, "global_step": 166059, "epoch": 3953} {"train_loss": -7.004386901855469, "global_step": 166060, "epoch": 3953} {"train_loss": -6.779016017913818, "global_step": 166061, "epoch": 3953} {"train_loss": -6.986117362976074, "global_step": 166062, "epoch": 3953} {"train_loss": -6.952895164489746, "global_step": 166063, "epoch": 3953} {"train_loss": -6.900510787963867, "global_step": 166064, "epoch": 3953} {"train_loss": -6.82783317565918, "global_step": 166065, "epoch": 3953} {"train_loss": -6.924039840698242, "global_step": 166066, "epoch": 3953} {"train_loss": -6.935206277029855, "global_step": 166067, "epoch": 3953, "val_loss": 68526.1640625} {"train_loss": -6.8731255531311035, "global_step": 166068, "epoch": 3954} {"train_loss": -6.953009128570557, "global_step": 166069, "epoch": 3954} {"train_loss": -6.811786651611328, "global_step": 166070, "epoch": 3954} {"train_loss": -6.960470676422119, "global_step": 166071, "epoch": 3954} {"train_loss": -6.879365921020508, "global_step": 166072, "epoch": 3954} {"train_loss": -6.952467918395996, "global_step": 166073, "epoch": 3954} {"train_loss": -6.872724533081055, "global_step": 166074, "epoch": 3954} {"train_loss": -6.90524435043335, "global_step": 166075, "epoch": 3954} {"train_loss": -6.980868339538574, "global_step": 166076, "epoch": 3954} {"train_loss": -7.05781364440918, "global_step": 166077, "epoch": 3954} {"train_loss": -6.84202241897583, "global_step": 166078, "epoch": 3954} {"train_loss": -6.967368125915527, "global_step": 166079, "epoch": 3954} {"train_loss": -7.023483753204346, "global_step": 166080, "epoch": 3954} {"train_loss": -6.951662063598633, "global_step": 166081, "epoch": 3954} {"train_loss": -6.961591720581055, "global_step": 166082, "epoch": 3954} {"train_loss": -6.999264717102051, "global_step": 166083, "epoch": 3954} {"train_loss": -6.874443054199219, "global_step": 166084, "epoch": 3954} {"train_loss": -6.940731525421143, "global_step": 166085, "epoch": 3954} {"train_loss": -6.848580360412598, "global_step": 166086, "epoch": 3954} {"train_loss": -7.089774131774902, "global_step": 166087, "epoch": 3954} {"train_loss": -6.870878219604492, "global_step": 166088, "epoch": 3954} {"train_loss": -7.018251419067383, "global_step": 166089, "epoch": 3954} {"train_loss": -6.971842288970947, "global_step": 166090, "epoch": 3954} {"train_loss": -6.947453498840332, "global_step": 166091, "epoch": 3954} {"train_loss": -7.036972999572754, "global_step": 166092, "epoch": 3954} {"train_loss": -6.927057266235352, "global_step": 166093, "epoch": 3954} {"train_loss": -6.9152512550354, "global_step": 166094, "epoch": 3954} {"train_loss": -7.035322189331055, "global_step": 166095, "epoch": 3954} {"train_loss": -6.852267265319824, "global_step": 166096, "epoch": 3954} {"train_loss": -6.987709045410156, "global_step": 166097, "epoch": 3954} {"train_loss": -6.944804668426514, "global_step": 166098, "epoch": 3954} {"train_loss": -6.837627410888672, "global_step": 166099, "epoch": 3954} {"train_loss": -6.867087364196777, "global_step": 166100, "epoch": 3954} {"train_loss": -6.991909027099609, "global_step": 166101, "epoch": 3954} {"train_loss": -6.951422691345215, "global_step": 166102, "epoch": 3954} {"train_loss": -6.968319416046143, "global_step": 166103, "epoch": 3954} {"train_loss": -6.976305961608887, "global_step": 166104, "epoch": 3954} {"train_loss": -6.830885887145996, "global_step": 166105, "epoch": 3954} {"train_loss": -7.007342338562012, "global_step": 166106, "epoch": 3954} {"train_loss": -6.909319877624512, "global_step": 166107, "epoch": 3954} {"train_loss": -6.838834762573242, "global_step": 166108, "epoch": 3954} {"train_loss": -6.937866460709345, "global_step": 166109, "epoch": 3954, "val_loss": 68788.234375} {"train_loss": -6.902070045471191, "global_step": 166110, "epoch": 3955} {"train_loss": -6.985814094543457, "global_step": 166111, "epoch": 3955} {"train_loss": -7.071784496307373, "global_step": 166112, "epoch": 3955} {"train_loss": -6.861081123352051, "global_step": 166113, "epoch": 3955} {"train_loss": -6.962712287902832, "global_step": 166114, "epoch": 3955} {"train_loss": -6.94904088973999, "global_step": 166115, "epoch": 3955} {"train_loss": -6.952203750610352, "global_step": 166116, "epoch": 3955} {"train_loss": -7.112098217010498, "global_step": 166117, "epoch": 3955} {"train_loss": -7.007120132446289, "global_step": 166118, "epoch": 3955} {"train_loss": -6.963838577270508, "global_step": 166119, "epoch": 3955} {"train_loss": -6.968491554260254, "global_step": 166120, "epoch": 3955} {"train_loss": -6.930204391479492, "global_step": 166121, "epoch": 3955} {"train_loss": -7.069650650024414, "global_step": 166122, "epoch": 3955} {"train_loss": -6.959439277648926, "global_step": 166123, "epoch": 3955} {"train_loss": -7.041506767272949, "global_step": 166124, "epoch": 3955} {"train_loss": -6.922950744628906, "global_step": 166125, "epoch": 3955} {"train_loss": -7.215001106262207, "global_step": 166126, "epoch": 3955} {"train_loss": -6.973972320556641, "global_step": 166127, "epoch": 3955} {"train_loss": -7.044977188110352, "global_step": 166128, "epoch": 3955} {"train_loss": -6.955348491668701, "global_step": 166129, "epoch": 3955} {"train_loss": -6.967148303985596, "global_step": 166130, "epoch": 3955} {"train_loss": -6.956205368041992, "global_step": 166131, "epoch": 3955} {"train_loss": -7.121547222137451, "global_step": 166132, "epoch": 3955} {"train_loss": -6.989997386932373, "global_step": 166133, "epoch": 3955} {"train_loss": -6.9833269119262695, "global_step": 166134, "epoch": 3955} {"train_loss": -6.996579170227051, "global_step": 166135, "epoch": 3955} {"train_loss": -7.1104736328125, "global_step": 166136, "epoch": 3955} {"train_loss": -6.948925495147705, "global_step": 166137, "epoch": 3955} {"train_loss": -6.976993560791016, "global_step": 166138, "epoch": 3955} {"train_loss": -7.01895809173584, "global_step": 166139, "epoch": 3955} {"train_loss": -6.9370269775390625, "global_step": 166140, "epoch": 3955} {"train_loss": -6.9849748611450195, "global_step": 166141, "epoch": 3955} {"train_loss": -6.969222068786621, "global_step": 166142, "epoch": 3955} {"train_loss": -6.990389823913574, "global_step": 166143, "epoch": 3955} {"train_loss": -6.985137939453125, "global_step": 166144, "epoch": 3955} {"train_loss": -6.990400791168213, "global_step": 166145, "epoch": 3955} {"train_loss": -7.094846725463867, "global_step": 166146, "epoch": 3955} {"train_loss": -6.991565704345703, "global_step": 166147, "epoch": 3955} {"train_loss": -7.068973541259766, "global_step": 166148, "epoch": 3955} {"train_loss": -7.029821395874023, "global_step": 166149, "epoch": 3955} {"train_loss": -7.11312198638916, "global_step": 166150, "epoch": 3955} {"train_loss": -7.001691080275036, "global_step": 166151, "epoch": 3955, "val_loss": 68840.765625} {"train_loss": -7.117585182189941, "global_step": 166152, "epoch": 3956} {"train_loss": -7.138894081115723, "global_step": 166153, "epoch": 3956} {"train_loss": -7.088112831115723, "global_step": 166154, "epoch": 3956} {"train_loss": -6.9742865562438965, "global_step": 166155, "epoch": 3956} {"train_loss": -7.011275291442871, "global_step": 166156, "epoch": 3956} {"train_loss": -7.092249870300293, "global_step": 166157, "epoch": 3956} {"train_loss": -7.054943561553955, "global_step": 166158, "epoch": 3956} {"train_loss": -6.960724830627441, "global_step": 166159, "epoch": 3956} {"train_loss": -7.068807125091553, "global_step": 166160, "epoch": 3956} {"train_loss": -7.008368015289307, "global_step": 166161, "epoch": 3956} {"train_loss": -7.074843883514404, "global_step": 166162, "epoch": 3956} {"train_loss": -7.042470455169678, "global_step": 166163, "epoch": 3956} {"train_loss": -6.9205780029296875, "global_step": 166164, "epoch": 3956} {"train_loss": -7.053323745727539, "global_step": 166165, "epoch": 3956} {"train_loss": -7.0954742431640625, "global_step": 166166, "epoch": 3956} {"train_loss": -6.996852874755859, "global_step": 166167, "epoch": 3956} {"train_loss": -6.999546527862549, "global_step": 166168, "epoch": 3956} {"train_loss": -7.019670009613037, "global_step": 166169, "epoch": 3956} {"train_loss": -7.157177925109863, "global_step": 166170, "epoch": 3956} {"train_loss": -7.119484901428223, "global_step": 166171, "epoch": 3956} {"train_loss": -7.029231071472168, "global_step": 166172, "epoch": 3956} {"train_loss": -6.993338584899902, "global_step": 166173, "epoch": 3956} {"train_loss": -7.021248817443848, "global_step": 166174, "epoch": 3956} {"train_loss": -6.887073516845703, "global_step": 166175, "epoch": 3956} {"train_loss": -6.957610130310059, "global_step": 166176, "epoch": 3956} {"train_loss": -6.971755027770996, "global_step": 166177, "epoch": 3956} {"train_loss": -7.131223201751709, "global_step": 166178, "epoch": 3956} {"train_loss": -7.01007080078125, "global_step": 166179, "epoch": 3956} {"train_loss": -6.887707710266113, "global_step": 166180, "epoch": 3956} {"train_loss": -7.110473155975342, "global_step": 166181, "epoch": 3956} {"train_loss": -7.029949188232422, "global_step": 166182, "epoch": 3956} {"train_loss": -6.985764503479004, "global_step": 166183, "epoch": 3956} {"train_loss": -7.10137939453125, "global_step": 166184, "epoch": 3956} {"train_loss": -6.941030025482178, "global_step": 166185, "epoch": 3956} {"train_loss": -7.031528949737549, "global_step": 166186, "epoch": 3956} {"train_loss": -7.022438049316406, "global_step": 166187, "epoch": 3956} {"train_loss": -6.990453720092773, "global_step": 166188, "epoch": 3956} {"train_loss": -7.069874286651611, "global_step": 166189, "epoch": 3956} {"train_loss": -6.988924503326416, "global_step": 166190, "epoch": 3956} {"train_loss": -6.920716762542725, "global_step": 166191, "epoch": 3956} {"train_loss": -7.0279645919799805, "global_step": 166192, "epoch": 3956} {"train_loss": -7.02752997761681, "global_step": 166193, "epoch": 3956, "val_loss": 68905.609375} {"train_loss": -7.032353401184082, "global_step": 166194, "epoch": 3957} {"train_loss": -7.016297340393066, "global_step": 166195, "epoch": 3957} {"train_loss": -7.056193828582764, "global_step": 166196, "epoch": 3957} {"train_loss": -6.94981575012207, "global_step": 166197, "epoch": 3957} {"train_loss": -7.002017021179199, "global_step": 166198, "epoch": 3957} {"train_loss": -7.001713752746582, "global_step": 166199, "epoch": 3957} {"train_loss": -7.005171775817871, "global_step": 166200, "epoch": 3957} {"train_loss": -6.924770355224609, "global_step": 166201, "epoch": 3957} {"train_loss": -6.9488630294799805, "global_step": 166202, "epoch": 3957} {"train_loss": -7.052154541015625, "global_step": 166203, "epoch": 3957} {"train_loss": -7.128149032592773, "global_step": 166204, "epoch": 3957} {"train_loss": -6.990571975708008, "global_step": 166205, "epoch": 3957} {"train_loss": -7.030007362365723, "global_step": 166206, "epoch": 3957} {"train_loss": -7.09505558013916, "global_step": 166207, "epoch": 3957} {"train_loss": -7.1196441650390625, "global_step": 166208, "epoch": 3957} {"train_loss": -7.0839409828186035, "global_step": 166209, "epoch": 3957} {"train_loss": -7.014212608337402, "global_step": 166210, "epoch": 3957} {"train_loss": -7.005497932434082, "global_step": 166211, "epoch": 3957} {"train_loss": -7.09824275970459, "global_step": 166212, "epoch": 3957} {"train_loss": -7.153555870056152, "global_step": 166213, "epoch": 3957} {"train_loss": -7.06112003326416, "global_step": 166214, "epoch": 3957} {"train_loss": -7.0785369873046875, "global_step": 166215, "epoch": 3957} {"train_loss": -7.024538993835449, "global_step": 166216, "epoch": 3957} {"train_loss": -7.10209846496582, "global_step": 166217, "epoch": 3957} {"train_loss": -7.109989643096924, "global_step": 166218, "epoch": 3957} {"train_loss": -7.051021575927734, "global_step": 166219, "epoch": 3957} {"train_loss": -7.050413131713867, "global_step": 166220, "epoch": 3957} {"train_loss": -7.128331184387207, "global_step": 166221, "epoch": 3957} {"train_loss": -7.056926727294922, "global_step": 166222, "epoch": 3957} {"train_loss": -7.054800033569336, "global_step": 166223, "epoch": 3957} {"train_loss": -7.047384738922119, "global_step": 166224, "epoch": 3957} {"train_loss": -7.033084869384766, "global_step": 166225, "epoch": 3957} {"train_loss": -7.096766948699951, "global_step": 166226, "epoch": 3957} {"train_loss": -6.895890712738037, "global_step": 166227, "epoch": 3957} {"train_loss": -7.054044723510742, "global_step": 166228, "epoch": 3957} {"train_loss": -7.129707336425781, "global_step": 166229, "epoch": 3957} {"train_loss": -7.11373233795166, "global_step": 166230, "epoch": 3957} {"train_loss": -6.949026107788086, "global_step": 166231, "epoch": 3957} {"train_loss": -6.923661231994629, "global_step": 166232, "epoch": 3957} {"train_loss": -7.0423688888549805, "global_step": 166233, "epoch": 3957} {"train_loss": -7.01857328414917, "global_step": 166234, "epoch": 3957} {"train_loss": -7.041248741604033, "global_step": 166235, "epoch": 3957, "val_loss": 68779.21875} {"train_loss": -7.067134857177734, "global_step": 166236, "epoch": 3958} {"train_loss": -7.011148452758789, "global_step": 166237, "epoch": 3958} {"train_loss": -7.029113292694092, "global_step": 166238, "epoch": 3958} {"train_loss": -7.124752044677734, "global_step": 166239, "epoch": 3958} {"train_loss": -7.093626022338867, "global_step": 166240, "epoch": 3958} {"train_loss": -7.005455493927002, "global_step": 166241, "epoch": 3958} {"train_loss": -6.999273300170898, "global_step": 166242, "epoch": 3958} {"train_loss": -6.974618434906006, "global_step": 166243, "epoch": 3958} {"train_loss": -6.951492786407471, "global_step": 166244, "epoch": 3958} {"train_loss": -7.024301528930664, "global_step": 166245, "epoch": 3958} {"train_loss": -6.98387336730957, "global_step": 166246, "epoch": 3958} {"train_loss": -7.131929874420166, "global_step": 166247, "epoch": 3958} {"train_loss": -7.071023941040039, "global_step": 166248, "epoch": 3958} {"train_loss": -7.021690368652344, "global_step": 166249, "epoch": 3958} {"train_loss": -7.030816078186035, "global_step": 166250, "epoch": 3958} {"train_loss": -6.944644451141357, "global_step": 166251, "epoch": 3958} {"train_loss": -7.077662467956543, "global_step": 166252, "epoch": 3958} {"train_loss": -7.077229022979736, "global_step": 166253, "epoch": 3958} {"train_loss": -7.210175514221191, "global_step": 166254, "epoch": 3958} {"train_loss": -7.023112773895264, "global_step": 166255, "epoch": 3958} {"train_loss": -7.041757583618164, "global_step": 166256, "epoch": 3958} {"train_loss": -6.950719833374023, "global_step": 166257, "epoch": 3958} {"train_loss": -7.1350531578063965, "global_step": 166258, "epoch": 3958} {"train_loss": -7.050284385681152, "global_step": 166259, "epoch": 3958} {"train_loss": -7.071171283721924, "global_step": 166260, "epoch": 3958} {"train_loss": -6.949930191040039, "global_step": 166261, "epoch": 3958} {"train_loss": -6.993717670440674, "global_step": 166262, "epoch": 3958} {"train_loss": -7.037386894226074, "global_step": 166263, "epoch": 3958} {"train_loss": -6.973264694213867, "global_step": 166264, "epoch": 3958} {"train_loss": -6.934046745300293, "global_step": 166265, "epoch": 3958} {"train_loss": -6.968659400939941, "global_step": 166266, "epoch": 3958} {"train_loss": -7.069347381591797, "global_step": 166267, "epoch": 3958} {"train_loss": -7.113914966583252, "global_step": 166268, "epoch": 3958} {"train_loss": -6.951467514038086, "global_step": 166269, "epoch": 3958} {"train_loss": -6.988030910491943, "global_step": 166270, "epoch": 3958} {"train_loss": -7.02579927444458, "global_step": 166271, "epoch": 3958} {"train_loss": -6.966562747955322, "global_step": 166272, "epoch": 3958} {"train_loss": -7.121660232543945, "global_step": 166273, "epoch": 3958} {"train_loss": -7.003688812255859, "global_step": 166274, "epoch": 3958} {"train_loss": -6.882228851318359, "global_step": 166275, "epoch": 3958} {"train_loss": -7.0921430587768555, "global_step": 166276, "epoch": 3958} {"train_loss": -7.0318660622551326, "global_step": 166277, "epoch": 3958, "val_loss": 68800.578125} {"train_loss": -7.014646530151367, "global_step": 166278, "epoch": 3959} {"train_loss": -7.02581787109375, "global_step": 166279, "epoch": 3959} {"train_loss": -6.956254005432129, "global_step": 166280, "epoch": 3959} {"train_loss": -7.100154399871826, "global_step": 166281, "epoch": 3959} {"train_loss": -6.980939865112305, "global_step": 166282, "epoch": 3959} {"train_loss": -6.959687232971191, "global_step": 166283, "epoch": 3959} {"train_loss": -7.0894975662231445, "global_step": 166284, "epoch": 3959} {"train_loss": -6.923168182373047, "global_step": 166285, "epoch": 3959} {"train_loss": -7.014121055603027, "global_step": 166286, "epoch": 3959} {"train_loss": -7.121769905090332, "global_step": 166287, "epoch": 3959} {"train_loss": -6.999551773071289, "global_step": 166288, "epoch": 3959} {"train_loss": -6.82943058013916, "global_step": 166289, "epoch": 3959} {"train_loss": -6.966695785522461, "global_step": 166290, "epoch": 3959} {"train_loss": -6.763552188873291, "global_step": 166291, "epoch": 3959} {"train_loss": -6.941370010375977, "global_step": 166292, "epoch": 3959} {"train_loss": -6.850966930389404, "global_step": 166293, "epoch": 3959} {"train_loss": -6.946595668792725, "global_step": 166294, "epoch": 3959} {"train_loss": -6.930739402770996, "global_step": 166295, "epoch": 3959} {"train_loss": -6.869579792022705, "global_step": 166296, "epoch": 3959} {"train_loss": -7.019387245178223, "global_step": 166297, "epoch": 3959} {"train_loss": -6.97604513168335, "global_step": 166298, "epoch": 3959} {"train_loss": -6.904119968414307, "global_step": 166299, "epoch": 3959} {"train_loss": -6.926497936248779, "global_step": 166300, "epoch": 3959} {"train_loss": -6.984967231750488, "global_step": 166301, "epoch": 3959} {"train_loss": -6.962007999420166, "global_step": 166302, "epoch": 3959} {"train_loss": -7.017355918884277, "global_step": 166303, "epoch": 3959} {"train_loss": -7.047340393066406, "global_step": 166304, "epoch": 3959} {"train_loss": -6.947098731994629, "global_step": 166305, "epoch": 3959} {"train_loss": -6.831463813781738, "global_step": 166306, "epoch": 3959} {"train_loss": -6.944149494171143, "global_step": 166307, "epoch": 3959} {"train_loss": -7.029397010803223, "global_step": 166308, "epoch": 3959} {"train_loss": -6.999671936035156, "global_step": 166309, "epoch": 3959} {"train_loss": -6.859650611877441, "global_step": 166310, "epoch": 3959} {"train_loss": -6.866808891296387, "global_step": 166311, "epoch": 3959} {"train_loss": -6.889269828796387, "global_step": 166312, "epoch": 3959} {"train_loss": -6.974753379821777, "global_step": 166313, "epoch": 3959} {"train_loss": -6.9869489669799805, "global_step": 166314, "epoch": 3959} {"train_loss": -7.01835823059082, "global_step": 166315, "epoch": 3959} {"train_loss": -7.028987407684326, "global_step": 166316, "epoch": 3959} {"train_loss": -6.961271286010742, "global_step": 166317, "epoch": 3959} {"train_loss": -6.980043888092041, "global_step": 166318, "epoch": 3959} {"train_loss": -6.962501900536673, "global_step": 166319, "epoch": 3959, "val_loss": 68962.1875} {"train_loss": -6.8902587890625, "global_step": 166320, "epoch": 3960} {"train_loss": -6.993321418762207, "global_step": 166321, "epoch": 3960} {"train_loss": -6.982892990112305, "global_step": 166322, "epoch": 3960} {"train_loss": -6.99934720993042, "global_step": 166323, "epoch": 3960} {"train_loss": -7.000225067138672, "global_step": 166324, "epoch": 3960} {"train_loss": -6.931818962097168, "global_step": 166325, "epoch": 3960} {"train_loss": -6.940794944763184, "global_step": 166326, "epoch": 3960} {"train_loss": -7.050348281860352, "global_step": 166327, "epoch": 3960} {"train_loss": -6.982499122619629, "global_step": 166328, "epoch": 3960} {"train_loss": -7.026684284210205, "global_step": 166329, "epoch": 3960} {"train_loss": -6.907757759094238, "global_step": 166330, "epoch": 3960} {"train_loss": -7.0119171142578125, "global_step": 166331, "epoch": 3960} {"train_loss": -7.0180559158325195, "global_step": 166332, "epoch": 3960} {"train_loss": -7.0004048347473145, "global_step": 166333, "epoch": 3960} {"train_loss": -7.037230968475342, "global_step": 166334, "epoch": 3960} {"train_loss": -6.961342811584473, "global_step": 166335, "epoch": 3960} {"train_loss": -6.934234619140625, "global_step": 166336, "epoch": 3960} {"train_loss": -7.018906593322754, "global_step": 166337, "epoch": 3960} {"train_loss": -7.034862041473389, "global_step": 166338, "epoch": 3960} {"train_loss": -7.091923236846924, "global_step": 166339, "epoch": 3960} {"train_loss": -6.975972652435303, "global_step": 166340, "epoch": 3960} {"train_loss": -6.814194679260254, "global_step": 166341, "epoch": 3960} {"train_loss": -6.843395233154297, "global_step": 166342, "epoch": 3960} {"train_loss": -6.84333610534668, "global_step": 166343, "epoch": 3960} {"train_loss": -6.757786273956299, "global_step": 166344, "epoch": 3960} {"train_loss": -6.937655448913574, "global_step": 166345, "epoch": 3960} {"train_loss": -6.779178619384766, "global_step": 166346, "epoch": 3960} {"train_loss": -6.646097660064697, "global_step": 166347, "epoch": 3960} {"train_loss": -6.830510139465332, "global_step": 166348, "epoch": 3960} {"train_loss": -6.693061828613281, "global_step": 166349, "epoch": 3960} {"train_loss": -6.857648849487305, "global_step": 166350, "epoch": 3960} {"train_loss": -6.726407051086426, "global_step": 166351, "epoch": 3960} {"train_loss": -7.004715919494629, "global_step": 166352, "epoch": 3960} {"train_loss": -6.766192436218262, "global_step": 166353, "epoch": 3960} {"train_loss": -6.872260570526123, "global_step": 166354, "epoch": 3960} {"train_loss": -6.696642875671387, "global_step": 166355, "epoch": 3960} {"train_loss": -6.941427707672119, "global_step": 166356, "epoch": 3960} {"train_loss": -6.844498634338379, "global_step": 166357, "epoch": 3960} {"train_loss": -6.907578468322754, "global_step": 166358, "epoch": 3960} {"train_loss": -6.86573600769043, "global_step": 166359, "epoch": 3960} {"train_loss": -6.962732791900635, "global_step": 166360, "epoch": 3960} {"train_loss": -6.909913539886475, "global_step": 166361, "epoch": 3960, "val_loss": 68739.0546875} {"train_loss": -6.889854431152344, "global_step": 166362, "epoch": 3961} {"train_loss": -6.9025983810424805, "global_step": 166363, "epoch": 3961} {"train_loss": -7.011035442352295, "global_step": 166364, "epoch": 3961} {"train_loss": -6.855535984039307, "global_step": 166365, "epoch": 3961} {"train_loss": -6.930302619934082, "global_step": 166366, "epoch": 3961} {"train_loss": -6.837128162384033, "global_step": 166367, "epoch": 3961} {"train_loss": -6.955508708953857, "global_step": 166368, "epoch": 3961} {"train_loss": -6.900030136108398, "global_step": 166369, "epoch": 3961} {"train_loss": -6.995815277099609, "global_step": 166370, "epoch": 3961} {"train_loss": -7.11681604385376, "global_step": 166371, "epoch": 3961} {"train_loss": -7.009947299957275, "global_step": 166372, "epoch": 3961} {"train_loss": -6.961846351623535, "global_step": 166373, "epoch": 3961} {"train_loss": -6.879544258117676, "global_step": 166374, "epoch": 3961} {"train_loss": -7.006623268127441, "global_step": 166375, "epoch": 3961} {"train_loss": -6.8649139404296875, "global_step": 166376, "epoch": 3961} {"train_loss": -6.920072555541992, "global_step": 166377, "epoch": 3961} {"train_loss": -6.948690891265869, "global_step": 166378, "epoch": 3961} {"train_loss": -6.967400550842285, "global_step": 166379, "epoch": 3961} {"train_loss": -6.816978454589844, "global_step": 166380, "epoch": 3961} {"train_loss": -6.8945698738098145, "global_step": 166381, "epoch": 3961} {"train_loss": -6.855489253997803, "global_step": 166382, "epoch": 3961} {"train_loss": -7.005119323730469, "global_step": 166383, "epoch": 3961} {"train_loss": -6.864806175231934, "global_step": 166384, "epoch": 3961} {"train_loss": -6.928194999694824, "global_step": 166385, "epoch": 3961} {"train_loss": -7.020355224609375, "global_step": 166386, "epoch": 3961} {"train_loss": -6.923922538757324, "global_step": 166387, "epoch": 3961} {"train_loss": -6.970090389251709, "global_step": 166388, "epoch": 3961} {"train_loss": -6.954305171966553, "global_step": 166389, "epoch": 3961} {"train_loss": -7.004709243774414, "global_step": 166390, "epoch": 3961} {"train_loss": -6.893038749694824, "global_step": 166391, "epoch": 3961} {"train_loss": -7.023664474487305, "global_step": 166392, "epoch": 3961} {"train_loss": -6.870155334472656, "global_step": 166393, "epoch": 3961} {"train_loss": -6.869306564331055, "global_step": 166394, "epoch": 3961} {"train_loss": -6.938637733459473, "global_step": 166395, "epoch": 3961} {"train_loss": -6.939072608947754, "global_step": 166396, "epoch": 3961} {"train_loss": -6.895445823669434, "global_step": 166397, "epoch": 3961} {"train_loss": -7.015422821044922, "global_step": 166398, "epoch": 3961} {"train_loss": -6.97327995300293, "global_step": 166399, "epoch": 3961} {"train_loss": -6.9344563484191895, "global_step": 166400, "epoch": 3961} {"train_loss": -7.13058614730835, "global_step": 166401, "epoch": 3961} {"train_loss": -7.000002861022949, "global_step": 166402, "epoch": 3961} {"train_loss": -6.943381264096215, "global_step": 166403, "epoch": 3961, "val_loss": 69021.9609375} {"train_loss": -6.967530727386475, "global_step": 166404, "epoch": 3962} {"train_loss": -7.081790447235107, "global_step": 166405, "epoch": 3962} {"train_loss": -6.866298675537109, "global_step": 166406, "epoch": 3962} {"train_loss": -6.97429895401001, "global_step": 166407, "epoch": 3962} {"train_loss": -7.050174713134766, "global_step": 166408, "epoch": 3962} {"train_loss": -7.051654815673828, "global_step": 166409, "epoch": 3962} {"train_loss": -6.951617240905762, "global_step": 166410, "epoch": 3962} {"train_loss": -6.9345808029174805, "global_step": 166411, "epoch": 3962} {"train_loss": -7.0219950675964355, "global_step": 166412, "epoch": 3962} {"train_loss": -6.950464248657227, "global_step": 166413, "epoch": 3962} {"train_loss": -6.965709686279297, "global_step": 166414, "epoch": 3962} {"train_loss": -6.8965535163879395, "global_step": 166415, "epoch": 3962} {"train_loss": -6.904274940490723, "global_step": 166416, "epoch": 3962} {"train_loss": -6.990616321563721, "global_step": 166417, "epoch": 3962} {"train_loss": -6.639801025390625, "global_step": 166418, "epoch": 3962} {"train_loss": -7.0034589767456055, "global_step": 166419, "epoch": 3962} {"train_loss": -6.853520393371582, "global_step": 166420, "epoch": 3962} {"train_loss": -6.750433921813965, "global_step": 166421, "epoch": 3962} {"train_loss": -6.854893684387207, "global_step": 166422, "epoch": 3962} {"train_loss": -6.8127312660217285, "global_step": 166423, "epoch": 3962} {"train_loss": -6.760609149932861, "global_step": 166424, "epoch": 3962} {"train_loss": -6.979466438293457, "global_step": 166425, "epoch": 3962} {"train_loss": -6.8039703369140625, "global_step": 166426, "epoch": 3962} {"train_loss": -6.880593776702881, "global_step": 166427, "epoch": 3962} {"train_loss": -7.02684211730957, "global_step": 166428, "epoch": 3962} {"train_loss": -6.999676704406738, "global_step": 166429, "epoch": 3962} {"train_loss": -6.911172866821289, "global_step": 166430, "epoch": 3962} {"train_loss": -6.951813697814941, "global_step": 166431, "epoch": 3962} {"train_loss": -6.978806972503662, "global_step": 166432, "epoch": 3962} {"train_loss": -6.906839847564697, "global_step": 166433, "epoch": 3962} {"train_loss": -6.970942974090576, "global_step": 166434, "epoch": 3962} {"train_loss": -6.9258713722229, "global_step": 166435, "epoch": 3962} {"train_loss": -7.0336480140686035, "global_step": 166436, "epoch": 3962} {"train_loss": -7.0540618896484375, "global_step": 166437, "epoch": 3962} {"train_loss": -7.064400672912598, "global_step": 166438, "epoch": 3962} {"train_loss": -7.040613174438477, "global_step": 166439, "epoch": 3962} {"train_loss": -7.019567489624023, "global_step": 166440, "epoch": 3962} {"train_loss": -7.027828216552734, "global_step": 166441, "epoch": 3962} {"train_loss": -6.973818302154541, "global_step": 166442, "epoch": 3962} {"train_loss": -7.007597923278809, "global_step": 166443, "epoch": 3962} {"train_loss": -7.045706748962402, "global_step": 166444, "epoch": 3962} {"train_loss": -6.947538409914289, "global_step": 166445, "epoch": 3962, "val_loss": 68680.5390625} {"train_loss": -7.053017616271973, "global_step": 166446, "epoch": 3963} {"train_loss": -6.9380598068237305, "global_step": 166447, "epoch": 3963} {"train_loss": -7.0890278816223145, "global_step": 166448, "epoch": 3963} {"train_loss": -7.053466796875, "global_step": 166449, "epoch": 3963} {"train_loss": -7.030420780181885, "global_step": 166450, "epoch": 3963} {"train_loss": -7.074368476867676, "global_step": 166451, "epoch": 3963} {"train_loss": -7.215441703796387, "global_step": 166452, "epoch": 3963} {"train_loss": -6.9908857345581055, "global_step": 166453, "epoch": 3963} {"train_loss": -7.186532020568848, "global_step": 166454, "epoch": 3963} {"train_loss": -7.0263495445251465, "global_step": 166455, "epoch": 3963} {"train_loss": -6.982365608215332, "global_step": 166456, "epoch": 3963} {"train_loss": -7.078366279602051, "global_step": 166457, "epoch": 3963} {"train_loss": -7.005870819091797, "global_step": 166458, "epoch": 3963} {"train_loss": -7.065021514892578, "global_step": 166459, "epoch": 3963} {"train_loss": -7.0234479904174805, "global_step": 166460, "epoch": 3963} {"train_loss": -7.087488174438477, "global_step": 166461, "epoch": 3963} {"train_loss": -6.968573570251465, "global_step": 166462, "epoch": 3963} {"train_loss": -7.029457092285156, "global_step": 166463, "epoch": 3963} {"train_loss": -7.138823509216309, "global_step": 166464, "epoch": 3963} {"train_loss": -7.040998458862305, "global_step": 166465, "epoch": 3963} {"train_loss": -7.011707782745361, "global_step": 166466, "epoch": 3963} {"train_loss": -6.98378849029541, "global_step": 166467, "epoch": 3963} {"train_loss": -7.205223083496094, "global_step": 166468, "epoch": 3963} {"train_loss": -7.219473361968994, "global_step": 166469, "epoch": 3963} {"train_loss": -7.096222877502441, "global_step": 166470, "epoch": 3963} {"train_loss": -7.119534492492676, "global_step": 166471, "epoch": 3963} {"train_loss": -6.932344436645508, "global_step": 166472, "epoch": 3963} {"train_loss": -7.074202060699463, "global_step": 166473, "epoch": 3963} {"train_loss": -7.09505033493042, "global_step": 166474, "epoch": 3963} {"train_loss": -6.9420166015625, "global_step": 166475, "epoch": 3963} {"train_loss": -7.091247081756592, "global_step": 166476, "epoch": 3963} {"train_loss": -7.092648506164551, "global_step": 166477, "epoch": 3963} {"train_loss": -6.922863960266113, "global_step": 166478, "epoch": 3963} {"train_loss": -6.923286437988281, "global_step": 166479, "epoch": 3963} {"train_loss": -7.072171688079834, "global_step": 166480, "epoch": 3963} {"train_loss": -6.955080032348633, "global_step": 166481, "epoch": 3963} {"train_loss": -7.003331184387207, "global_step": 166482, "epoch": 3963} {"train_loss": -7.01676082611084, "global_step": 166483, "epoch": 3963} {"train_loss": -6.972407341003418, "global_step": 166484, "epoch": 3963} {"train_loss": -6.858278274536133, "global_step": 166485, "epoch": 3963} {"train_loss": -7.026613712310791, "global_step": 166486, "epoch": 3963} {"train_loss": -7.04134886605399, "global_step": 166487, "epoch": 3963, "val_loss": 68861.921875} {"train_loss": -6.935196876525879, "global_step": 166488, "epoch": 3964} {"train_loss": -6.9235405921936035, "global_step": 166489, "epoch": 3964} {"train_loss": -7.023824691772461, "global_step": 166490, "epoch": 3964} {"train_loss": -7.058138847351074, "global_step": 166491, "epoch": 3964} {"train_loss": -7.101048469543457, "global_step": 166492, "epoch": 3964} {"train_loss": -6.989665985107422, "global_step": 166493, "epoch": 3964} {"train_loss": -7.094353199005127, "global_step": 166494, "epoch": 3964} {"train_loss": -7.063697814941406, "global_step": 166495, "epoch": 3964} {"train_loss": -7.021042346954346, "global_step": 166496, "epoch": 3964} {"train_loss": -6.977423191070557, "global_step": 166497, "epoch": 3964} {"train_loss": -7.089057922363281, "global_step": 166498, "epoch": 3964} {"train_loss": -7.030620098114014, "global_step": 166499, "epoch": 3964} {"train_loss": -6.896130084991455, "global_step": 166500, "epoch": 3964} {"train_loss": -6.955469608306885, "global_step": 166501, "epoch": 3964} {"train_loss": -6.982099533081055, "global_step": 166502, "epoch": 3964} {"train_loss": -6.890937805175781, "global_step": 166503, "epoch": 3964} {"train_loss": -6.987789154052734, "global_step": 166504, "epoch": 3964} {"train_loss": -6.991989612579346, "global_step": 166505, "epoch": 3964} {"train_loss": -6.904350757598877, "global_step": 166506, "epoch": 3964} {"train_loss": -6.909335136413574, "global_step": 166507, "epoch": 3964} {"train_loss": -7.036708831787109, "global_step": 166508, "epoch": 3964} {"train_loss": -6.885533332824707, "global_step": 166509, "epoch": 3964} {"train_loss": -7.006277561187744, "global_step": 166510, "epoch": 3964} {"train_loss": -6.9567341804504395, "global_step": 166511, "epoch": 3964} {"train_loss": -6.8345513343811035, "global_step": 166512, "epoch": 3964} {"train_loss": -6.899340629577637, "global_step": 166513, "epoch": 3964} {"train_loss": -6.839303016662598, "global_step": 166514, "epoch": 3964} {"train_loss": -6.955819606781006, "global_step": 166515, "epoch": 3964} {"train_loss": -6.889492988586426, "global_step": 166516, "epoch": 3964} {"train_loss": -6.83428955078125, "global_step": 166517, "epoch": 3964} {"train_loss": -6.8776140213012695, "global_step": 166518, "epoch": 3964} {"train_loss": -6.864198207855225, "global_step": 166519, "epoch": 3964} {"train_loss": -7.083939552307129, "global_step": 166520, "epoch": 3964} {"train_loss": -6.878259658813477, "global_step": 166521, "epoch": 3964} {"train_loss": -6.94330358505249, "global_step": 166522, "epoch": 3964} {"train_loss": -6.912215232849121, "global_step": 166523, "epoch": 3964} {"train_loss": -6.993577003479004, "global_step": 166524, "epoch": 3964} {"train_loss": -6.86762809753418, "global_step": 166525, "epoch": 3964} {"train_loss": -6.963776588439941, "global_step": 166526, "epoch": 3964} {"train_loss": -6.984992980957031, "global_step": 166527, "epoch": 3964} {"train_loss": -7.04575252532959, "global_step": 166528, "epoch": 3964} {"train_loss": -6.9599503221965975, "global_step": 166529, "epoch": 3964, "val_loss": 68842.953125} {"train_loss": -6.778693199157715, "global_step": 166530, "epoch": 3965} {"train_loss": -6.914212226867676, "global_step": 166531, "epoch": 3965} {"train_loss": -6.8891730308532715, "global_step": 166532, "epoch": 3965} {"train_loss": -6.921276569366455, "global_step": 166533, "epoch": 3965} {"train_loss": -6.911995887756348, "global_step": 166534, "epoch": 3965} {"train_loss": -6.940493583679199, "global_step": 166535, "epoch": 3965} {"train_loss": -7.013505935668945, "global_step": 166536, "epoch": 3965} {"train_loss": -6.9857378005981445, "global_step": 166537, "epoch": 3965} {"train_loss": -6.991786956787109, "global_step": 166538, "epoch": 3965} {"train_loss": -7.068734169006348, "global_step": 166539, "epoch": 3965} {"train_loss": -7.043033599853516, "global_step": 166540, "epoch": 3965} {"train_loss": -7.045130729675293, "global_step": 166541, "epoch": 3965} {"train_loss": -7.1446661949157715, "global_step": 166542, "epoch": 3965} {"train_loss": -7.112070560455322, "global_step": 166543, "epoch": 3965} {"train_loss": -7.144116401672363, "global_step": 166544, "epoch": 3965} {"train_loss": -6.966402053833008, "global_step": 166545, "epoch": 3965} {"train_loss": -6.955140113830566, "global_step": 166546, "epoch": 3965} {"train_loss": -6.942230224609375, "global_step": 166547, "epoch": 3965} {"train_loss": -7.056290626525879, "global_step": 166548, "epoch": 3965} {"train_loss": -6.980091094970703, "global_step": 166549, "epoch": 3965} {"train_loss": -7.064452171325684, "global_step": 166550, "epoch": 3965} {"train_loss": -7.133673667907715, "global_step": 166551, "epoch": 3965} {"train_loss": -7.048516750335693, "global_step": 166552, "epoch": 3965} {"train_loss": -7.004046440124512, "global_step": 166553, "epoch": 3965} {"train_loss": -6.908390522003174, "global_step": 166554, "epoch": 3965} {"train_loss": -7.043907165527344, "global_step": 166555, "epoch": 3965} {"train_loss": -7.008464813232422, "global_step": 166556, "epoch": 3965} {"train_loss": -7.008961200714111, "global_step": 166557, "epoch": 3965} {"train_loss": -6.9917426109313965, "global_step": 166558, "epoch": 3965} {"train_loss": -6.899949550628662, "global_step": 166559, "epoch": 3965} {"train_loss": -7.036410331726074, "global_step": 166560, "epoch": 3965} {"train_loss": -6.943305492401123, "global_step": 166561, "epoch": 3965} {"train_loss": -6.964847564697266, "global_step": 166562, "epoch": 3965} {"train_loss": -6.939545631408691, "global_step": 166563, "epoch": 3965} {"train_loss": -7.003602981567383, "global_step": 166564, "epoch": 3965} {"train_loss": -6.940864562988281, "global_step": 166565, "epoch": 3965} {"train_loss": -6.851274013519287, "global_step": 166566, "epoch": 3965} {"train_loss": -6.838695526123047, "global_step": 166567, "epoch": 3965} {"train_loss": -6.9845733642578125, "global_step": 166568, "epoch": 3965} {"train_loss": -6.825399398803711, "global_step": 166569, "epoch": 3965} {"train_loss": -6.921091556549072, "global_step": 166570, "epoch": 3965} {"train_loss": -6.97754488672529, "global_step": 166571, "epoch": 3965, "val_loss": 68922.5390625} {"train_loss": -7.032973766326904, "global_step": 166572, "epoch": 3966} {"train_loss": -6.950221061706543, "global_step": 166573, "epoch": 3966} {"train_loss": -6.906239986419678, "global_step": 166574, "epoch": 3966} {"train_loss": -6.999236583709717, "global_step": 166575, "epoch": 3966} {"train_loss": -6.9697041511535645, "global_step": 166576, "epoch": 3966} {"train_loss": -6.950628280639648, "global_step": 166577, "epoch": 3966} {"train_loss": -7.020840644836426, "global_step": 166578, "epoch": 3966} {"train_loss": -7.064562797546387, "global_step": 166579, "epoch": 3966} {"train_loss": -7.047491550445557, "global_step": 166580, "epoch": 3966} {"train_loss": -6.956489562988281, "global_step": 166581, "epoch": 3966} {"train_loss": -6.902395248413086, "global_step": 166582, "epoch": 3966} {"train_loss": -6.952269554138184, "global_step": 166583, "epoch": 3966} {"train_loss": -6.921679496765137, "global_step": 166584, "epoch": 3966} {"train_loss": -6.968735694885254, "global_step": 166585, "epoch": 3966} {"train_loss": -6.777588367462158, "global_step": 166586, "epoch": 3966} {"train_loss": -7.017936706542969, "global_step": 166587, "epoch": 3966} {"train_loss": -7.00537109375, "global_step": 166588, "epoch": 3966} {"train_loss": -6.991543292999268, "global_step": 166589, "epoch": 3966} {"train_loss": -6.9541449546813965, "global_step": 166590, "epoch": 3966} {"train_loss": -7.0503034591674805, "global_step": 166591, "epoch": 3966} {"train_loss": -6.737293243408203, "global_step": 166592, "epoch": 3966} {"train_loss": -6.978233337402344, "global_step": 166593, "epoch": 3966} {"train_loss": -6.988652229309082, "global_step": 166594, "epoch": 3966} {"train_loss": -6.876555442810059, "global_step": 166595, "epoch": 3966} {"train_loss": -6.9857378005981445, "global_step": 166596, "epoch": 3966} {"train_loss": -7.016378879547119, "global_step": 166597, "epoch": 3966} {"train_loss": -6.964809417724609, "global_step": 166598, "epoch": 3966} {"train_loss": -6.929978847503662, "global_step": 166599, "epoch": 3966} {"train_loss": -6.96242618560791, "global_step": 166600, "epoch": 3966} {"train_loss": -6.951775550842285, "global_step": 166601, "epoch": 3966} {"train_loss": -6.923001766204834, "global_step": 166602, "epoch": 3966} {"train_loss": -7.004888534545898, "global_step": 166603, "epoch": 3966} {"train_loss": -6.986754417419434, "global_step": 166604, "epoch": 3966} {"train_loss": -7.08021879196167, "global_step": 166605, "epoch": 3966} {"train_loss": -7.119100570678711, "global_step": 166606, "epoch": 3966} {"train_loss": -6.902042388916016, "global_step": 166607, "epoch": 3966} {"train_loss": -6.8761444091796875, "global_step": 166608, "epoch": 3966} {"train_loss": -7.016983985900879, "global_step": 166609, "epoch": 3966} {"train_loss": -6.913224697113037, "global_step": 166610, "epoch": 3966} {"train_loss": -6.9576568603515625, "global_step": 166611, "epoch": 3966} {"train_loss": -7.03422737121582, "global_step": 166612, "epoch": 3966} {"train_loss": -6.967130274999709, "global_step": 166613, "epoch": 3966, "val_loss": 68781.90625} {"train_loss": -6.94215726852417, "global_step": 166614, "epoch": 3967} {"train_loss": -7.03886079788208, "global_step": 166615, "epoch": 3967} {"train_loss": -6.970203399658203, "global_step": 166616, "epoch": 3967} {"train_loss": -6.977829933166504, "global_step": 166617, "epoch": 3967} {"train_loss": -6.974791526794434, "global_step": 166618, "epoch": 3967} {"train_loss": -7.012325286865234, "global_step": 166619, "epoch": 3967} {"train_loss": -7.02268123626709, "global_step": 166620, "epoch": 3967} {"train_loss": -7.039281368255615, "global_step": 166621, "epoch": 3967} {"train_loss": -6.96905517578125, "global_step": 166622, "epoch": 3967} {"train_loss": -6.982912063598633, "global_step": 166623, "epoch": 3967} {"train_loss": -7.022994518280029, "global_step": 166624, "epoch": 3967} {"train_loss": -6.9430036544799805, "global_step": 166625, "epoch": 3967} {"train_loss": -6.953725814819336, "global_step": 166626, "epoch": 3967} {"train_loss": -7.06562614440918, "global_step": 166627, "epoch": 3967} {"train_loss": -7.145228385925293, "global_step": 166628, "epoch": 3967} {"train_loss": -7.056731700897217, "global_step": 166629, "epoch": 3967} {"train_loss": -7.026681423187256, "global_step": 166630, "epoch": 3967} {"train_loss": -7.046715259552002, "global_step": 166631, "epoch": 3967} {"train_loss": -7.048300743103027, "global_step": 166632, "epoch": 3967} {"train_loss": -6.991004943847656, "global_step": 166633, "epoch": 3967} {"train_loss": -6.996132850646973, "global_step": 166634, "epoch": 3967} {"train_loss": -7.1945624351501465, "global_step": 166635, "epoch": 3967} {"train_loss": -6.904428482055664, "global_step": 166636, "epoch": 3967} {"train_loss": -7.0081915855407715, "global_step": 166637, "epoch": 3967} {"train_loss": -7.065404415130615, "global_step": 166638, "epoch": 3967} {"train_loss": -6.937190055847168, "global_step": 166639, "epoch": 3967} {"train_loss": -7.004146575927734, "global_step": 166640, "epoch": 3967} {"train_loss": -6.986677169799805, "global_step": 166641, "epoch": 3967} {"train_loss": -7.059083938598633, "global_step": 166642, "epoch": 3967} {"train_loss": -7.006818771362305, "global_step": 166643, "epoch": 3967} {"train_loss": -7.14614725112915, "global_step": 166644, "epoch": 3967} {"train_loss": -7.042016983032227, "global_step": 166645, "epoch": 3967} {"train_loss": -6.989260673522949, "global_step": 166646, "epoch": 3967} {"train_loss": -7.030412673950195, "global_step": 166647, "epoch": 3967} {"train_loss": -7.023249626159668, "global_step": 166648, "epoch": 3967} {"train_loss": -7.027063369750977, "global_step": 166649, "epoch": 3967} {"train_loss": -7.043617248535156, "global_step": 166650, "epoch": 3967} {"train_loss": -7.064478397369385, "global_step": 166651, "epoch": 3967} {"train_loss": -7.007230281829834, "global_step": 166652, "epoch": 3967} {"train_loss": -7.020937919616699, "global_step": 166653, "epoch": 3967} {"train_loss": -7.100289344787598, "global_step": 166654, "epoch": 3967} {"train_loss": -7.022095316932315, "global_step": 166655, "epoch": 3967, "val_loss": 68763.828125} {"train_loss": -6.974041938781738, "global_step": 166656, "epoch": 3968} {"train_loss": -7.039471626281738, "global_step": 166657, "epoch": 3968} {"train_loss": -7.040742874145508, "global_step": 166658, "epoch": 3968} {"train_loss": -6.982039451599121, "global_step": 166659, "epoch": 3968} {"train_loss": -6.918881416320801, "global_step": 166660, "epoch": 3968} {"train_loss": -7.071761131286621, "global_step": 166661, "epoch": 3968} {"train_loss": -6.982337951660156, "global_step": 166662, "epoch": 3968} {"train_loss": -7.123353004455566, "global_step": 166663, "epoch": 3968} {"train_loss": -7.093320846557617, "global_step": 166664, "epoch": 3968} {"train_loss": -7.039737701416016, "global_step": 166665, "epoch": 3968} {"train_loss": -6.99189567565918, "global_step": 166666, "epoch": 3968} {"train_loss": -7.154928207397461, "global_step": 166667, "epoch": 3968} {"train_loss": -6.977333068847656, "global_step": 166668, "epoch": 3968} {"train_loss": -7.155345916748047, "global_step": 166669, "epoch": 3968} {"train_loss": -6.979931831359863, "global_step": 166670, "epoch": 3968} {"train_loss": -7.090994358062744, "global_step": 166671, "epoch": 3968} {"train_loss": -6.96877384185791, "global_step": 166672, "epoch": 3968} {"train_loss": -7.155184745788574, "global_step": 166673, "epoch": 3968} {"train_loss": -7.144883155822754, "global_step": 166674, "epoch": 3968} {"train_loss": -7.077154159545898, "global_step": 166675, "epoch": 3968} {"train_loss": -7.17717170715332, "global_step": 166676, "epoch": 3968} {"train_loss": -6.957864761352539, "global_step": 166677, "epoch": 3968} {"train_loss": -7.074314117431641, "global_step": 166678, "epoch": 3968} {"train_loss": -7.072546005249023, "global_step": 166679, "epoch": 3968} {"train_loss": -7.070825576782227, "global_step": 166680, "epoch": 3968} {"train_loss": -7.095791816711426, "global_step": 166681, "epoch": 3968} {"train_loss": -6.980284214019775, "global_step": 166682, "epoch": 3968} {"train_loss": -7.12524938583374, "global_step": 166683, "epoch": 3968} {"train_loss": -7.093604564666748, "global_step": 166684, "epoch": 3968} {"train_loss": -7.09929084777832, "global_step": 166685, "epoch": 3968} {"train_loss": -7.069149017333984, "global_step": 166686, "epoch": 3968} {"train_loss": -7.020386219024658, "global_step": 166687, "epoch": 3968} {"train_loss": -7.144411563873291, "global_step": 166688, "epoch": 3968} {"train_loss": -7.049277305603027, "global_step": 166689, "epoch": 3968} {"train_loss": -7.066332817077637, "global_step": 166690, "epoch": 3968} {"train_loss": -7.043769836425781, "global_step": 166691, "epoch": 3968} {"train_loss": -7.065594673156738, "global_step": 166692, "epoch": 3968} {"train_loss": -7.045957088470459, "global_step": 166693, "epoch": 3968} {"train_loss": -7.047878265380859, "global_step": 166694, "epoch": 3968} {"train_loss": -7.009159564971924, "global_step": 166695, "epoch": 3968} {"train_loss": -7.079127311706543, "global_step": 166696, "epoch": 3968} {"train_loss": -7.057792845226469, "global_step": 166697, "epoch": 3968, "val_loss": 68898.515625} {"train_loss": -6.991283416748047, "global_step": 166698, "epoch": 3969} {"train_loss": -7.081088542938232, "global_step": 166699, "epoch": 3969} {"train_loss": -7.029962062835693, "global_step": 166700, "epoch": 3969} {"train_loss": -6.983166694641113, "global_step": 166701, "epoch": 3969} {"train_loss": -7.115662574768066, "global_step": 166702, "epoch": 3969} {"train_loss": -6.952294826507568, "global_step": 166703, "epoch": 3969} {"train_loss": -6.877194404602051, "global_step": 166704, "epoch": 3969} {"train_loss": -7.03187370300293, "global_step": 166705, "epoch": 3969} {"train_loss": -6.835213661193848, "global_step": 166706, "epoch": 3969} {"train_loss": -6.951678276062012, "global_step": 166707, "epoch": 3969} {"train_loss": -6.953432559967041, "global_step": 166708, "epoch": 3969} {"train_loss": -6.847916126251221, "global_step": 166709, "epoch": 3969} {"train_loss": -7.038939476013184, "global_step": 166710, "epoch": 3969} {"train_loss": -6.9573516845703125, "global_step": 166711, "epoch": 3969} {"train_loss": -6.955371379852295, "global_step": 166712, "epoch": 3969} {"train_loss": -6.929171562194824, "global_step": 166713, "epoch": 3969} {"train_loss": -7.021317481994629, "global_step": 166714, "epoch": 3969} {"train_loss": -6.941065311431885, "global_step": 166715, "epoch": 3969} {"train_loss": -6.833128452301025, "global_step": 166716, "epoch": 3969} {"train_loss": -6.8630571365356445, "global_step": 166717, "epoch": 3969} {"train_loss": -6.9614057540893555, "global_step": 166718, "epoch": 3969} {"train_loss": -6.99359655380249, "global_step": 166719, "epoch": 3969} {"train_loss": -6.979659557342529, "global_step": 166720, "epoch": 3969} {"train_loss": -6.963045120239258, "global_step": 166721, "epoch": 3969} {"train_loss": -6.920443534851074, "global_step": 166722, "epoch": 3969} {"train_loss": -6.943615913391113, "global_step": 166723, "epoch": 3969} {"train_loss": -6.991783142089844, "global_step": 166724, "epoch": 3969} {"train_loss": -6.988873481750488, "global_step": 166725, "epoch": 3969} {"train_loss": -6.949152946472168, "global_step": 166726, "epoch": 3969} {"train_loss": -6.95195198059082, "global_step": 166727, "epoch": 3969} {"train_loss": -7.042006492614746, "global_step": 166728, "epoch": 3969} {"train_loss": -6.990018844604492, "global_step": 166729, "epoch": 3969} {"train_loss": -6.943060874938965, "global_step": 166730, "epoch": 3969} {"train_loss": -7.058138847351074, "global_step": 166731, "epoch": 3969} {"train_loss": -7.052855014801025, "global_step": 166732, "epoch": 3969} {"train_loss": -7.029016971588135, "global_step": 166733, "epoch": 3969} {"train_loss": -7.063579082489014, "global_step": 166734, "epoch": 3969} {"train_loss": -7.082192420959473, "global_step": 166735, "epoch": 3969} {"train_loss": -7.013851165771484, "global_step": 166736, "epoch": 3969} {"train_loss": -6.997983932495117, "global_step": 166737, "epoch": 3969} {"train_loss": -6.82618522644043, "global_step": 166738, "epoch": 3969} {"train_loss": -6.973229533150082, "global_step": 166739, "epoch": 3969, "val_loss": 68999.3984375} {"train_loss": -7.014342784881592, "global_step": 166740, "epoch": 3970} {"train_loss": -6.841088771820068, "global_step": 166741, "epoch": 3970} {"train_loss": -6.952690124511719, "global_step": 166742, "epoch": 3970} {"train_loss": -6.7845458984375, "global_step": 166743, "epoch": 3970} {"train_loss": -6.893091201782227, "global_step": 166744, "epoch": 3970} {"train_loss": -6.9261932373046875, "global_step": 166745, "epoch": 3970} {"train_loss": -6.838497638702393, "global_step": 166746, "epoch": 3970} {"train_loss": -6.941238880157471, "global_step": 166747, "epoch": 3970} {"train_loss": -6.897543907165527, "global_step": 166748, "epoch": 3970} {"train_loss": -7.001359939575195, "global_step": 166749, "epoch": 3970} {"train_loss": -6.8663129806518555, "global_step": 166750, "epoch": 3970} {"train_loss": -6.923742294311523, "global_step": 166751, "epoch": 3970} {"train_loss": -6.824825286865234, "global_step": 166752, "epoch": 3970} {"train_loss": -6.964858531951904, "global_step": 166753, "epoch": 3970} {"train_loss": -6.96600341796875, "global_step": 166754, "epoch": 3970} {"train_loss": -6.904226779937744, "global_step": 166755, "epoch": 3970} {"train_loss": -6.99278450012207, "global_step": 166756, "epoch": 3970} {"train_loss": -6.956829071044922, "global_step": 166757, "epoch": 3970} {"train_loss": -6.946284294128418, "global_step": 166758, "epoch": 3970} {"train_loss": -6.915524482727051, "global_step": 166759, "epoch": 3970} {"train_loss": -7.040867328643799, "global_step": 166760, "epoch": 3970} {"train_loss": -6.90598201751709, "global_step": 166761, "epoch": 3970} {"train_loss": -6.934089660644531, "global_step": 166762, "epoch": 3970} {"train_loss": -6.99290132522583, "global_step": 166763, "epoch": 3970} {"train_loss": -6.8663835525512695, "global_step": 166764, "epoch": 3970} {"train_loss": -6.996438026428223, "global_step": 166765, "epoch": 3970} {"train_loss": -7.031827926635742, "global_step": 166766, "epoch": 3970} {"train_loss": -7.033207893371582, "global_step": 166767, "epoch": 3970} {"train_loss": -7.021623134613037, "global_step": 166768, "epoch": 3970} {"train_loss": -7.01900577545166, "global_step": 166769, "epoch": 3970} {"train_loss": -6.968827247619629, "global_step": 166770, "epoch": 3970} {"train_loss": -6.975940227508545, "global_step": 166771, "epoch": 3970} {"train_loss": -6.973879337310791, "global_step": 166772, "epoch": 3970} {"train_loss": -7.0390448570251465, "global_step": 166773, "epoch": 3970} {"train_loss": -6.904555320739746, "global_step": 166774, "epoch": 3970} {"train_loss": -6.989328384399414, "global_step": 166775, "epoch": 3970} {"train_loss": -6.971945762634277, "global_step": 166776, "epoch": 3970} {"train_loss": -6.950291633605957, "global_step": 166777, "epoch": 3970} {"train_loss": -6.680153846740723, "global_step": 166778, "epoch": 3970} {"train_loss": -6.9058122634887695, "global_step": 166779, "epoch": 3970} {"train_loss": -6.919538974761963, "global_step": 166780, "epoch": 3970} {"train_loss": -6.939682040895734, "global_step": 166781, "epoch": 3970, "val_loss": 68963.859375} {"train_loss": -6.963251113891602, "global_step": 166782, "epoch": 3971} {"train_loss": -6.86436653137207, "global_step": 166783, "epoch": 3971} {"train_loss": -6.951998710632324, "global_step": 166784, "epoch": 3971} {"train_loss": -6.856294631958008, "global_step": 166785, "epoch": 3971} {"train_loss": -6.883081436157227, "global_step": 166786, "epoch": 3971} {"train_loss": -7.018143177032471, "global_step": 166787, "epoch": 3971} {"train_loss": -6.919163703918457, "global_step": 166788, "epoch": 3971} {"train_loss": -6.950761795043945, "global_step": 166789, "epoch": 3971} {"train_loss": -6.8837480545043945, "global_step": 166790, "epoch": 3971} {"train_loss": -6.814614772796631, "global_step": 166791, "epoch": 3971} {"train_loss": -6.852710723876953, "global_step": 166792, "epoch": 3971} {"train_loss": -6.894898414611816, "global_step": 166793, "epoch": 3971} {"train_loss": -6.892754554748535, "global_step": 166794, "epoch": 3971} {"train_loss": -6.7945237159729, "global_step": 166795, "epoch": 3971} {"train_loss": -6.7665252685546875, "global_step": 166796, "epoch": 3971} {"train_loss": -6.778717041015625, "global_step": 166797, "epoch": 3971} {"train_loss": -6.756837844848633, "global_step": 166798, "epoch": 3971} {"train_loss": -6.786623001098633, "global_step": 166799, "epoch": 3971} {"train_loss": -6.98630952835083, "global_step": 166800, "epoch": 3971} {"train_loss": -6.7855658531188965, "global_step": 166801, "epoch": 3971} {"train_loss": -6.879707336425781, "global_step": 166802, "epoch": 3971} {"train_loss": -6.6824517250061035, "global_step": 166803, "epoch": 3971} {"train_loss": -6.921581268310547, "global_step": 166804, "epoch": 3971} {"train_loss": -6.873312950134277, "global_step": 166805, "epoch": 3971} {"train_loss": -6.943743705749512, "global_step": 166806, "epoch": 3971} {"train_loss": -7.005159854888916, "global_step": 166807, "epoch": 3971} {"train_loss": -6.965709686279297, "global_step": 166808, "epoch": 3971} {"train_loss": -6.972148895263672, "global_step": 166809, "epoch": 3971} {"train_loss": -6.979770183563232, "global_step": 166810, "epoch": 3971} {"train_loss": -6.929843902587891, "global_step": 166811, "epoch": 3971} {"train_loss": -7.034872055053711, "global_step": 166812, "epoch": 3971} {"train_loss": -6.950050354003906, "global_step": 166813, "epoch": 3971} {"train_loss": -7.018068313598633, "global_step": 166814, "epoch": 3971} {"train_loss": -7.04412317276001, "global_step": 166815, "epoch": 3971} {"train_loss": -6.962047100067139, "global_step": 166816, "epoch": 3971} {"train_loss": -6.955508708953857, "global_step": 166817, "epoch": 3971} {"train_loss": -7.05413293838501, "global_step": 166818, "epoch": 3971} {"train_loss": -7.061490058898926, "global_step": 166819, "epoch": 3971} {"train_loss": -6.810437202453613, "global_step": 166820, "epoch": 3971} {"train_loss": -7.080328464508057, "global_step": 166821, "epoch": 3971} {"train_loss": -6.977311611175537, "global_step": 166822, "epoch": 3971} {"train_loss": -6.915575981140137, "global_step": 166823, "epoch": 3971, "val_loss": 68895.421875} {"train_loss": -6.921964645385742, "global_step": 166824, "epoch": 3972} {"train_loss": -7.064846992492676, "global_step": 166825, "epoch": 3972} {"train_loss": -6.951361656188965, "global_step": 166826, "epoch": 3972} {"train_loss": -7.003318786621094, "global_step": 166827, "epoch": 3972} {"train_loss": -7.1433000564575195, "global_step": 166828, "epoch": 3972} {"train_loss": -7.000581741333008, "global_step": 166829, "epoch": 3972} {"train_loss": -6.977410316467285, "global_step": 166830, "epoch": 3972} {"train_loss": -7.056269645690918, "global_step": 166831, "epoch": 3972} {"train_loss": -7.039361953735352, "global_step": 166832, "epoch": 3972} {"train_loss": -7.142032623291016, "global_step": 166833, "epoch": 3972} {"train_loss": -6.900710105895996, "global_step": 166834, "epoch": 3972} {"train_loss": -6.991572380065918, "global_step": 166835, "epoch": 3972} {"train_loss": -7.057027816772461, "global_step": 166836, "epoch": 3972} {"train_loss": -6.9938249588012695, "global_step": 166837, "epoch": 3972} {"train_loss": -7.014695644378662, "global_step": 166838, "epoch": 3972} {"train_loss": -6.96728515625, "global_step": 166839, "epoch": 3972} {"train_loss": -6.98873233795166, "global_step": 166840, "epoch": 3972} {"train_loss": -7.040520668029785, "global_step": 166841, "epoch": 3972} {"train_loss": -6.954084396362305, "global_step": 166842, "epoch": 3972} {"train_loss": -7.007336139678955, "global_step": 166843, "epoch": 3972} {"train_loss": -6.952881813049316, "global_step": 166844, "epoch": 3972} {"train_loss": -6.971039295196533, "global_step": 166845, "epoch": 3972} {"train_loss": -6.931143760681152, "global_step": 166846, "epoch": 3972} {"train_loss": -7.160854816436768, "global_step": 166847, "epoch": 3972} {"train_loss": -6.926536560058594, "global_step": 166848, "epoch": 3972} {"train_loss": -7.021880626678467, "global_step": 166849, "epoch": 3972} {"train_loss": -6.992969512939453, "global_step": 166850, "epoch": 3972} {"train_loss": -6.846225738525391, "global_step": 166851, "epoch": 3972} {"train_loss": -7.078899383544922, "global_step": 166852, "epoch": 3972} {"train_loss": -6.891363143920898, "global_step": 166853, "epoch": 3972} {"train_loss": -6.809513092041016, "global_step": 166854, "epoch": 3972} {"train_loss": -6.9482316970825195, "global_step": 166855, "epoch": 3972} {"train_loss": -6.800002098083496, "global_step": 166856, "epoch": 3972} {"train_loss": -6.792562484741211, "global_step": 166857, "epoch": 3972} {"train_loss": -6.948486328125, "global_step": 166858, "epoch": 3972} {"train_loss": -6.722400188446045, "global_step": 166859, "epoch": 3972} {"train_loss": -6.9548139572143555, "global_step": 166860, "epoch": 3972} {"train_loss": -6.782033920288086, "global_step": 166861, "epoch": 3972} {"train_loss": -7.054782867431641, "global_step": 166862, "epoch": 3972} {"train_loss": -6.942994594573975, "global_step": 166863, "epoch": 3972} {"train_loss": -7.111845970153809, "global_step": 166864, "epoch": 3972} {"train_loss": -6.973504566010975, "global_step": 166865, "epoch": 3972, "val_loss": 69029.8125} {"train_loss": -6.8500075340271, "global_step": 166866, "epoch": 3973} {"train_loss": -7.004336833953857, "global_step": 166867, "epoch": 3973} {"train_loss": -6.9874348640441895, "global_step": 166868, "epoch": 3973} {"train_loss": -7.0196027755737305, "global_step": 166869, "epoch": 3973} {"train_loss": -6.994741439819336, "global_step": 166870, "epoch": 3973} {"train_loss": -7.036194801330566, "global_step": 166871, "epoch": 3973} {"train_loss": -7.042722702026367, "global_step": 166872, "epoch": 3973} {"train_loss": -7.058793067932129, "global_step": 166873, "epoch": 3973} {"train_loss": -7.042308807373047, "global_step": 166874, "epoch": 3973} {"train_loss": -6.965896129608154, "global_step": 166875, "epoch": 3973} {"train_loss": -7.1347880363464355, "global_step": 166876, "epoch": 3973} {"train_loss": -6.93992280960083, "global_step": 166877, "epoch": 3973} {"train_loss": -6.99450159072876, "global_step": 166878, "epoch": 3973} {"train_loss": -7.160260200500488, "global_step": 166879, "epoch": 3973} {"train_loss": -6.949311256408691, "global_step": 166880, "epoch": 3973} {"train_loss": -7.01699161529541, "global_step": 166881, "epoch": 3973} {"train_loss": -6.973475933074951, "global_step": 166882, "epoch": 3973} {"train_loss": -7.073480129241943, "global_step": 166883, "epoch": 3973} {"train_loss": -7.010866641998291, "global_step": 166884, "epoch": 3973} {"train_loss": -7.059496879577637, "global_step": 166885, "epoch": 3973} {"train_loss": -6.872490882873535, "global_step": 166886, "epoch": 3973} {"train_loss": -6.9320173263549805, "global_step": 166887, "epoch": 3973} {"train_loss": -7.013251304626465, "global_step": 166888, "epoch": 3973} {"train_loss": -6.890944004058838, "global_step": 166889, "epoch": 3973} {"train_loss": -6.928047180175781, "global_step": 166890, "epoch": 3973} {"train_loss": -6.91533088684082, "global_step": 166891, "epoch": 3973} {"train_loss": -7.05549430847168, "global_step": 166892, "epoch": 3973} {"train_loss": -7.014806747436523, "global_step": 166893, "epoch": 3973} {"train_loss": -7.025026321411133, "global_step": 166894, "epoch": 3973} {"train_loss": -7.089003562927246, "global_step": 166895, "epoch": 3973} {"train_loss": -6.977296829223633, "global_step": 166896, "epoch": 3973} {"train_loss": -7.068506240844727, "global_step": 166897, "epoch": 3973} {"train_loss": -6.991066932678223, "global_step": 166898, "epoch": 3973} {"train_loss": -6.93532657623291, "global_step": 166899, "epoch": 3973} {"train_loss": -7.024871826171875, "global_step": 166900, "epoch": 3973} {"train_loss": -6.947925567626953, "global_step": 166901, "epoch": 3973} {"train_loss": -7.053497314453125, "global_step": 166902, "epoch": 3973} {"train_loss": -6.929863929748535, "global_step": 166903, "epoch": 3973} {"train_loss": -6.930908203125, "global_step": 166904, "epoch": 3973} {"train_loss": -6.984643936157227, "global_step": 166905, "epoch": 3973} {"train_loss": -7.014315605163574, "global_step": 166906, "epoch": 3973} {"train_loss": -6.997848942166283, "global_step": 166907, "epoch": 3973, "val_loss": 68950.0390625} {"train_loss": -6.8970842361450195, "global_step": 166908, "epoch": 3974} {"train_loss": -6.990385055541992, "global_step": 166909, "epoch": 3974} {"train_loss": -7.052571773529053, "global_step": 166910, "epoch": 3974} {"train_loss": -6.9626359939575195, "global_step": 166911, "epoch": 3974} {"train_loss": -7.031084060668945, "global_step": 166912, "epoch": 3974} {"train_loss": -6.918604850769043, "global_step": 166913, "epoch": 3974} {"train_loss": -6.868374824523926, "global_step": 166914, "epoch": 3974} {"train_loss": -6.978292465209961, "global_step": 166915, "epoch": 3974} {"train_loss": -7.052539348602295, "global_step": 166916, "epoch": 3974} {"train_loss": -7.007240295410156, "global_step": 166917, "epoch": 3974} {"train_loss": -6.928496360778809, "global_step": 166918, "epoch": 3974} {"train_loss": -6.855882167816162, "global_step": 166919, "epoch": 3974} {"train_loss": -7.0540289878845215, "global_step": 166920, "epoch": 3974} {"train_loss": -6.868786811828613, "global_step": 166921, "epoch": 3974} {"train_loss": -6.867889404296875, "global_step": 166922, "epoch": 3974} {"train_loss": -7.134020805358887, "global_step": 166923, "epoch": 3974} {"train_loss": -7.004572868347168, "global_step": 166924, "epoch": 3974} {"train_loss": -6.85478401184082, "global_step": 166925, "epoch": 3974} {"train_loss": -7.005405426025391, "global_step": 166926, "epoch": 3974} {"train_loss": -6.843987941741943, "global_step": 166927, "epoch": 3974} {"train_loss": -6.97744083404541, "global_step": 166928, "epoch": 3974} {"train_loss": -6.991464138031006, "global_step": 166929, "epoch": 3974} {"train_loss": -6.859457492828369, "global_step": 166930, "epoch": 3974} {"train_loss": -6.942841529846191, "global_step": 166931, "epoch": 3974} {"train_loss": -6.930496692657471, "global_step": 166932, "epoch": 3974} {"train_loss": -6.897319793701172, "global_step": 166933, "epoch": 3974} {"train_loss": -7.0087127685546875, "global_step": 166934, "epoch": 3974} {"train_loss": -6.818753242492676, "global_step": 166935, "epoch": 3974} {"train_loss": -6.981328010559082, "global_step": 166936, "epoch": 3974} {"train_loss": -6.963985443115234, "global_step": 166937, "epoch": 3974} {"train_loss": -7.06074333190918, "global_step": 166938, "epoch": 3974} {"train_loss": -6.998204708099365, "global_step": 166939, "epoch": 3974} {"train_loss": -6.849501609802246, "global_step": 166940, "epoch": 3974} {"train_loss": -7.02073860168457, "global_step": 166941, "epoch": 3974} {"train_loss": -7.0048089027404785, "global_step": 166942, "epoch": 3974} {"train_loss": -7.04579496383667, "global_step": 166943, "epoch": 3974} {"train_loss": -6.97573184967041, "global_step": 166944, "epoch": 3974} {"train_loss": -7.074969291687012, "global_step": 166945, "epoch": 3974} {"train_loss": -6.9826979637146, "global_step": 166946, "epoch": 3974} {"train_loss": -7.0132904052734375, "global_step": 166947, "epoch": 3974} {"train_loss": -6.953670024871826, "global_step": 166948, "epoch": 3974} {"train_loss": -6.9673775604793, "global_step": 166949, "epoch": 3974, "val_loss": 68953.4609375} {"train_loss": -7.069436073303223, "global_step": 166950, "epoch": 3975} {"train_loss": -7.090275287628174, "global_step": 166951, "epoch": 3975} {"train_loss": -7.092837333679199, "global_step": 166952, "epoch": 3975} {"train_loss": -7.05612850189209, "global_step": 166953, "epoch": 3975} {"train_loss": -7.12818717956543, "global_step": 166954, "epoch": 3975} {"train_loss": -6.985438346862793, "global_step": 166955, "epoch": 3975} {"train_loss": -7.101771354675293, "global_step": 166956, "epoch": 3975} {"train_loss": -7.1702375411987305, "global_step": 166957, "epoch": 3975} {"train_loss": -7.077990531921387, "global_step": 166958, "epoch": 3975} {"train_loss": -7.099953651428223, "global_step": 166959, "epoch": 3975} {"train_loss": -7.115476131439209, "global_step": 166960, "epoch": 3975} {"train_loss": -7.045562267303467, "global_step": 166961, "epoch": 3975} {"train_loss": -7.070987701416016, "global_step": 166962, "epoch": 3975} {"train_loss": -7.013915061950684, "global_step": 166963, "epoch": 3975} {"train_loss": -6.9958391189575195, "global_step": 166964, "epoch": 3975} {"train_loss": -7.0886054039001465, "global_step": 166965, "epoch": 3975} {"train_loss": -6.908195495605469, "global_step": 166966, "epoch": 3975} {"train_loss": -7.049460411071777, "global_step": 166967, "epoch": 3975} {"train_loss": -6.867741584777832, "global_step": 166968, "epoch": 3975} {"train_loss": -6.9372639656066895, "global_step": 166969, "epoch": 3975} {"train_loss": -6.893459320068359, "global_step": 166970, "epoch": 3975} {"train_loss": -7.019017219543457, "global_step": 166971, "epoch": 3975} {"train_loss": -6.881350994110107, "global_step": 166972, "epoch": 3975} {"train_loss": -6.93533992767334, "global_step": 166973, "epoch": 3975} {"train_loss": -6.973933219909668, "global_step": 166974, "epoch": 3975} {"train_loss": -7.049732208251953, "global_step": 166975, "epoch": 3975} {"train_loss": -6.967057228088379, "global_step": 166976, "epoch": 3975} {"train_loss": -6.809360027313232, "global_step": 166977, "epoch": 3975} {"train_loss": -6.886767387390137, "global_step": 166978, "epoch": 3975} {"train_loss": -6.873262405395508, "global_step": 166979, "epoch": 3975} {"train_loss": -7.0835371017456055, "global_step": 166980, "epoch": 3975} {"train_loss": -6.939761161804199, "global_step": 166981, "epoch": 3975} {"train_loss": -6.8650665283203125, "global_step": 166982, "epoch": 3975} {"train_loss": -6.896014213562012, "global_step": 166983, "epoch": 3975} {"train_loss": -6.868334770202637, "global_step": 166984, "epoch": 3975} {"train_loss": -7.004017353057861, "global_step": 166985, "epoch": 3975} {"train_loss": -6.876676559448242, "global_step": 166986, "epoch": 3975} {"train_loss": -6.858362197875977, "global_step": 166987, "epoch": 3975} {"train_loss": -6.941784858703613, "global_step": 166988, "epoch": 3975} {"train_loss": -6.980887413024902, "global_step": 166989, "epoch": 3975} {"train_loss": -6.9655632972717285, "global_step": 166990, "epoch": 3975} {"train_loss": -6.989926133837018, "global_step": 166991, "epoch": 3975, "val_loss": 68817.078125} {"train_loss": -6.978809356689453, "global_step": 166992, "epoch": 3976} {"train_loss": -6.94731330871582, "global_step": 166993, "epoch": 3976} {"train_loss": -7.049663543701172, "global_step": 166994, "epoch": 3976} {"train_loss": -7.053243637084961, "global_step": 166995, "epoch": 3976} {"train_loss": -6.997348785400391, "global_step": 166996, "epoch": 3976} {"train_loss": -7.069234371185303, "global_step": 166997, "epoch": 3976} {"train_loss": -6.903714179992676, "global_step": 166998, "epoch": 3976} {"train_loss": -6.948809623718262, "global_step": 166999, "epoch": 3976} {"train_loss": -6.994471549987793, "global_step": 167000, "epoch": 3976} {"train_loss": -6.965132713317871, "global_step": 167001, "epoch": 3976} {"train_loss": -6.999209403991699, "global_step": 167002, "epoch": 3976} {"train_loss": -7.0299248695373535, "global_step": 167003, "epoch": 3976} {"train_loss": -7.0069169998168945, "global_step": 167004, "epoch": 3976} {"train_loss": -7.120813369750977, "global_step": 167005, "epoch": 3976} {"train_loss": -7.045235633850098, "global_step": 167006, "epoch": 3976} {"train_loss": -7.019008159637451, "global_step": 167007, "epoch": 3976} {"train_loss": -7.018681049346924, "global_step": 167008, "epoch": 3976} {"train_loss": -7.085540771484375, "global_step": 167009, "epoch": 3976} {"train_loss": -7.069492340087891, "global_step": 167010, "epoch": 3976} {"train_loss": -7.1159987449646, "global_step": 167011, "epoch": 3976} {"train_loss": -7.153580665588379, "global_step": 167012, "epoch": 3976} {"train_loss": -7.082677364349365, "global_step": 167013, "epoch": 3976} {"train_loss": -6.9937744140625, "global_step": 167014, "epoch": 3976} {"train_loss": -7.006052017211914, "global_step": 167015, "epoch": 3976} {"train_loss": -7.063562393188477, "global_step": 167016, "epoch": 3976} {"train_loss": -7.052787780761719, "global_step": 167017, "epoch": 3976} {"train_loss": -7.085702896118164, "global_step": 167018, "epoch": 3976} {"train_loss": -7.048172950744629, "global_step": 167019, "epoch": 3976} {"train_loss": -7.007766246795654, "global_step": 167020, "epoch": 3976} {"train_loss": -7.0889177322387695, "global_step": 167021, "epoch": 3976} {"train_loss": -7.015897750854492, "global_step": 167022, "epoch": 3976} {"train_loss": -6.99003267288208, "global_step": 167023, "epoch": 3976} {"train_loss": -7.015858173370361, "global_step": 167024, "epoch": 3976} {"train_loss": -7.06714391708374, "global_step": 167025, "epoch": 3976} {"train_loss": -6.998517990112305, "global_step": 167026, "epoch": 3976} {"train_loss": -6.992616653442383, "global_step": 167027, "epoch": 3976} {"train_loss": -6.945734024047852, "global_step": 167028, "epoch": 3976} {"train_loss": -6.991680145263672, "global_step": 167029, "epoch": 3976} {"train_loss": -7.024609565734863, "global_step": 167030, "epoch": 3976} {"train_loss": -7.012845516204834, "global_step": 167031, "epoch": 3976} {"train_loss": -6.981542587280273, "global_step": 167032, "epoch": 3976} {"train_loss": -7.021485521679833, "global_step": 167033, "epoch": 3976, "val_loss": 69003.4296875} {"train_loss": -6.879417896270752, "global_step": 167034, "epoch": 3977} {"train_loss": -6.898244857788086, "global_step": 167035, "epoch": 3977} {"train_loss": -6.968710422515869, "global_step": 167036, "epoch": 3977} {"train_loss": -6.9835004806518555, "global_step": 167037, "epoch": 3977} {"train_loss": -6.775757789611816, "global_step": 167038, "epoch": 3977} {"train_loss": -6.872835159301758, "global_step": 167039, "epoch": 3977} {"train_loss": -6.968847274780273, "global_step": 167040, "epoch": 3977} {"train_loss": -6.99617862701416, "global_step": 167041, "epoch": 3977} {"train_loss": -6.925766944885254, "global_step": 167042, "epoch": 3977} {"train_loss": -7.038022994995117, "global_step": 167043, "epoch": 3977} {"train_loss": -7.077284812927246, "global_step": 167044, "epoch": 3977} {"train_loss": -6.92167854309082, "global_step": 167045, "epoch": 3977} {"train_loss": -6.947478771209717, "global_step": 167046, "epoch": 3977} {"train_loss": -7.074434757232666, "global_step": 167047, "epoch": 3977} {"train_loss": -7.020656585693359, "global_step": 167048, "epoch": 3977} {"train_loss": -7.146465301513672, "global_step": 167049, "epoch": 3977} {"train_loss": -7.101137638092041, "global_step": 167050, "epoch": 3977} {"train_loss": -7.123879909515381, "global_step": 167051, "epoch": 3977} {"train_loss": -7.022123336791992, "global_step": 167052, "epoch": 3977} {"train_loss": -7.018643379211426, "global_step": 167053, "epoch": 3977} {"train_loss": -6.977147579193115, "global_step": 167054, "epoch": 3977} {"train_loss": -7.0152997970581055, "global_step": 167055, "epoch": 3977} {"train_loss": -7.007077217102051, "global_step": 167056, "epoch": 3977} {"train_loss": -6.942226409912109, "global_step": 167057, "epoch": 3977} {"train_loss": -7.099247455596924, "global_step": 167058, "epoch": 3977} {"train_loss": -6.972798824310303, "global_step": 167059, "epoch": 3977} {"train_loss": -6.940429210662842, "global_step": 167060, "epoch": 3977} {"train_loss": -6.976430892944336, "global_step": 167061, "epoch": 3977} {"train_loss": -7.0208940505981445, "global_step": 167062, "epoch": 3977} {"train_loss": -6.977655410766602, "global_step": 167063, "epoch": 3977} {"train_loss": -7.011075496673584, "global_step": 167064, "epoch": 3977} {"train_loss": -6.922000885009766, "global_step": 167065, "epoch": 3977} {"train_loss": -7.050751686096191, "global_step": 167066, "epoch": 3977} {"train_loss": -7.089663505554199, "global_step": 167067, "epoch": 3977} {"train_loss": -7.012382984161377, "global_step": 167068, "epoch": 3977} {"train_loss": -7.089459419250488, "global_step": 167069, "epoch": 3977} {"train_loss": -6.954372882843018, "global_step": 167070, "epoch": 3977} {"train_loss": -7.107341766357422, "global_step": 167071, "epoch": 3977} {"train_loss": -7.119295120239258, "global_step": 167072, "epoch": 3977} {"train_loss": -7.147622108459473, "global_step": 167073, "epoch": 3977} {"train_loss": -7.11107063293457, "global_step": 167074, "epoch": 3977} {"train_loss": -7.007092021760487, "global_step": 167075, "epoch": 3977, "val_loss": 68804.4140625} {"train_loss": -7.101548671722412, "global_step": 167076, "epoch": 3978} {"train_loss": -7.042200088500977, "global_step": 167077, "epoch": 3978} {"train_loss": -7.095571041107178, "global_step": 167078, "epoch": 3978} {"train_loss": -7.125695705413818, "global_step": 167079, "epoch": 3978} {"train_loss": -7.119234085083008, "global_step": 167080, "epoch": 3978} {"train_loss": -7.113742828369141, "global_step": 167081, "epoch": 3978} {"train_loss": -7.092144966125488, "global_step": 167082, "epoch": 3978} {"train_loss": -7.10219669342041, "global_step": 167083, "epoch": 3978} {"train_loss": -7.19596004486084, "global_step": 167084, "epoch": 3978} {"train_loss": -7.058839321136475, "global_step": 167085, "epoch": 3978} {"train_loss": -7.137087345123291, "global_step": 167086, "epoch": 3978} {"train_loss": -7.056802749633789, "global_step": 167087, "epoch": 3978} {"train_loss": -7.150401592254639, "global_step": 167088, "epoch": 3978} {"train_loss": -7.103503227233887, "global_step": 167089, "epoch": 3978} {"train_loss": -7.101837158203125, "global_step": 167090, "epoch": 3978} {"train_loss": -7.150561809539795, "global_step": 167091, "epoch": 3978} {"train_loss": -7.081345558166504, "global_step": 167092, "epoch": 3978} {"train_loss": -6.995135307312012, "global_step": 167093, "epoch": 3978} {"train_loss": -7.002248764038086, "global_step": 167094, "epoch": 3978} {"train_loss": -7.069573879241943, "global_step": 167095, "epoch": 3978} {"train_loss": -7.280797004699707, "global_step": 167096, "epoch": 3978} {"train_loss": -7.115734577178955, "global_step": 167097, "epoch": 3978} {"train_loss": -6.98129940032959, "global_step": 167098, "epoch": 3978} {"train_loss": -6.958559036254883, "global_step": 167099, "epoch": 3978} {"train_loss": -7.0226521492004395, "global_step": 167100, "epoch": 3978} {"train_loss": -7.07608699798584, "global_step": 167101, "epoch": 3978} {"train_loss": -6.8974103927612305, "global_step": 167102, "epoch": 3978} {"train_loss": -6.981294631958008, "global_step": 167103, "epoch": 3978} {"train_loss": -7.066542625427246, "global_step": 167104, "epoch": 3978} {"train_loss": -6.997414588928223, "global_step": 167105, "epoch": 3978} {"train_loss": -6.955556869506836, "global_step": 167106, "epoch": 3978} {"train_loss": -7.00346565246582, "global_step": 167107, "epoch": 3978} {"train_loss": -7.039897441864014, "global_step": 167108, "epoch": 3978} {"train_loss": -6.98084831237793, "global_step": 167109, "epoch": 3978} {"train_loss": -6.977877140045166, "global_step": 167110, "epoch": 3978} {"train_loss": -7.1196088790893555, "global_step": 167111, "epoch": 3978} {"train_loss": -7.028356552124023, "global_step": 167112, "epoch": 3978} {"train_loss": -6.839599609375, "global_step": 167113, "epoch": 3978} {"train_loss": -7.006159782409668, "global_step": 167114, "epoch": 3978} {"train_loss": -7.109516620635986, "global_step": 167115, "epoch": 3978} {"train_loss": -6.974947452545166, "global_step": 167116, "epoch": 3978} {"train_loss": -7.054293802806309, "global_step": 167117, "epoch": 3978, "val_loss": 68957.1875} {"train_loss": -6.978614807128906, "global_step": 167118, "epoch": 3979} {"train_loss": -6.8916544914245605, "global_step": 167119, "epoch": 3979} {"train_loss": -7.033733367919922, "global_step": 167120, "epoch": 3979} {"train_loss": -6.974460601806641, "global_step": 167121, "epoch": 3979} {"train_loss": -6.844852447509766, "global_step": 167122, "epoch": 3979} {"train_loss": -6.8641157150268555, "global_step": 167123, "epoch": 3979} {"train_loss": -6.918036460876465, "global_step": 167124, "epoch": 3979} {"train_loss": -6.869297027587891, "global_step": 167125, "epoch": 3979} {"train_loss": -6.873142719268799, "global_step": 167126, "epoch": 3979} {"train_loss": -6.828396797180176, "global_step": 167127, "epoch": 3979} {"train_loss": -6.8786468505859375, "global_step": 167128, "epoch": 3979} {"train_loss": -6.91251277923584, "global_step": 167129, "epoch": 3979} {"train_loss": -6.913790702819824, "global_step": 167130, "epoch": 3979} {"train_loss": -6.894927978515625, "global_step": 167131, "epoch": 3979} {"train_loss": -6.89907169342041, "global_step": 167132, "epoch": 3979} {"train_loss": -7.090699195861816, "global_step": 167133, "epoch": 3979} {"train_loss": -6.907557487487793, "global_step": 167134, "epoch": 3979} {"train_loss": -6.952348709106445, "global_step": 167135, "epoch": 3979} {"train_loss": -7.004958629608154, "global_step": 167136, "epoch": 3979} {"train_loss": -6.970853805541992, "global_step": 167137, "epoch": 3979} {"train_loss": -7.085902214050293, "global_step": 167138, "epoch": 3979} {"train_loss": -6.951206207275391, "global_step": 167139, "epoch": 3979} {"train_loss": -6.936952590942383, "global_step": 167140, "epoch": 3979} {"train_loss": -6.984148025512695, "global_step": 167141, "epoch": 3979} {"train_loss": -6.951174259185791, "global_step": 167142, "epoch": 3979} {"train_loss": -6.988731384277344, "global_step": 167143, "epoch": 3979} {"train_loss": -6.98576545715332, "global_step": 167144, "epoch": 3979} {"train_loss": -7.083159446716309, "global_step": 167145, "epoch": 3979} {"train_loss": -7.0677571296691895, "global_step": 167146, "epoch": 3979} {"train_loss": -7.116346836090088, "global_step": 167147, "epoch": 3979} {"train_loss": -7.024627685546875, "global_step": 167148, "epoch": 3979} {"train_loss": -7.068395614624023, "global_step": 167149, "epoch": 3979} {"train_loss": -6.984726905822754, "global_step": 167150, "epoch": 3979} {"train_loss": -6.9580583572387695, "global_step": 167151, "epoch": 3979} {"train_loss": -6.9630126953125, "global_step": 167152, "epoch": 3979} {"train_loss": -6.931290626525879, "global_step": 167153, "epoch": 3979} {"train_loss": -6.989771842956543, "global_step": 167154, "epoch": 3979} {"train_loss": -7.031656265258789, "global_step": 167155, "epoch": 3979} {"train_loss": -7.064670085906982, "global_step": 167156, "epoch": 3979} {"train_loss": -6.7499895095825195, "global_step": 167157, "epoch": 3979} {"train_loss": -6.972315788269043, "global_step": 167158, "epoch": 3979} {"train_loss": -6.959727173759823, "global_step": 167159, "epoch": 3979, "val_loss": 68996.2421875} {"train_loss": -6.870366096496582, "global_step": 167160, "epoch": 3980} {"train_loss": -6.9289751052856445, "global_step": 167161, "epoch": 3980} {"train_loss": -6.881581783294678, "global_step": 167162, "epoch": 3980} {"train_loss": -6.945664405822754, "global_step": 167163, "epoch": 3980} {"train_loss": -6.957369804382324, "global_step": 167164, "epoch": 3980} {"train_loss": -6.854351997375488, "global_step": 167165, "epoch": 3980} {"train_loss": -7.002324104309082, "global_step": 167166, "epoch": 3980} {"train_loss": -6.867837905883789, "global_step": 167167, "epoch": 3980} {"train_loss": -6.845304489135742, "global_step": 167168, "epoch": 3980} {"train_loss": -7.034939765930176, "global_step": 167169, "epoch": 3980} {"train_loss": -6.913883209228516, "global_step": 167170, "epoch": 3980} {"train_loss": -6.9143452644348145, "global_step": 167171, "epoch": 3980} {"train_loss": -7.02161979675293, "global_step": 167172, "epoch": 3980} {"train_loss": -6.897761344909668, "global_step": 167173, "epoch": 3980} {"train_loss": -6.974155902862549, "global_step": 167174, "epoch": 3980} {"train_loss": -6.954929351806641, "global_step": 167175, "epoch": 3980} {"train_loss": -6.962847709655762, "global_step": 167176, "epoch": 3980} {"train_loss": -6.944493293762207, "global_step": 167177, "epoch": 3980} {"train_loss": -6.949182033538818, "global_step": 167178, "epoch": 3980} {"train_loss": -7.041153430938721, "global_step": 167179, "epoch": 3980} {"train_loss": -6.936488628387451, "global_step": 167180, "epoch": 3980} {"train_loss": -7.068401336669922, "global_step": 167181, "epoch": 3980} {"train_loss": -7.045255184173584, "global_step": 167182, "epoch": 3980} {"train_loss": -6.938464641571045, "global_step": 167183, "epoch": 3980} {"train_loss": -7.1291656494140625, "global_step": 167184, "epoch": 3980} {"train_loss": -7.0286865234375, "global_step": 167185, "epoch": 3980} {"train_loss": -7.037191867828369, "global_step": 167186, "epoch": 3980} {"train_loss": -6.989058971405029, "global_step": 167187, "epoch": 3980} {"train_loss": -7.002562522888184, "global_step": 167188, "epoch": 3980} {"train_loss": -7.016179084777832, "global_step": 167189, "epoch": 3980} {"train_loss": -7.054323673248291, "global_step": 167190, "epoch": 3980} {"train_loss": -6.989245891571045, "global_step": 167191, "epoch": 3980} {"train_loss": -7.056419372558594, "global_step": 167192, "epoch": 3980} {"train_loss": -7.02010440826416, "global_step": 167193, "epoch": 3980} {"train_loss": -7.084569931030273, "global_step": 167194, "epoch": 3980} {"train_loss": -7.026778221130371, "global_step": 167195, "epoch": 3980} {"train_loss": -7.093122959136963, "global_step": 167196, "epoch": 3980} {"train_loss": -7.043973922729492, "global_step": 167197, "epoch": 3980} {"train_loss": -7.055743217468262, "global_step": 167198, "epoch": 3980} {"train_loss": -7.044308662414551, "global_step": 167199, "epoch": 3980} {"train_loss": -6.917599678039551, "global_step": 167200, "epoch": 3980} {"train_loss": -6.985193581808181, "global_step": 167201, "epoch": 3980, "val_loss": 68850.859375} {"train_loss": -6.9999799728393555, "global_step": 167202, "epoch": 3981} {"train_loss": -7.0650177001953125, "global_step": 167203, "epoch": 3981} {"train_loss": -6.9843831062316895, "global_step": 167204, "epoch": 3981} {"train_loss": -7.016604423522949, "global_step": 167205, "epoch": 3981} {"train_loss": -7.065954685211182, "global_step": 167206, "epoch": 3981} {"train_loss": -7.064429759979248, "global_step": 167207, "epoch": 3981} {"train_loss": -6.9477620124816895, "global_step": 167208, "epoch": 3981} {"train_loss": -6.9745259284973145, "global_step": 167209, "epoch": 3981} {"train_loss": -7.058749198913574, "global_step": 167210, "epoch": 3981} {"train_loss": -7.025813102722168, "global_step": 167211, "epoch": 3981} {"train_loss": -7.05325984954834, "global_step": 167212, "epoch": 3981} {"train_loss": -6.968216896057129, "global_step": 167213, "epoch": 3981} {"train_loss": -7.059861183166504, "global_step": 167214, "epoch": 3981} {"train_loss": -7.062566757202148, "global_step": 167215, "epoch": 3981} {"train_loss": -7.014032363891602, "global_step": 167216, "epoch": 3981} {"train_loss": -7.060518264770508, "global_step": 167217, "epoch": 3981} {"train_loss": -7.072167873382568, "global_step": 167218, "epoch": 3981} {"train_loss": -7.0021071434021, "global_step": 167219, "epoch": 3981} {"train_loss": -6.984687805175781, "global_step": 167220, "epoch": 3981} {"train_loss": -7.105671405792236, "global_step": 167221, "epoch": 3981} {"train_loss": -7.0305047035217285, "global_step": 167222, "epoch": 3981} {"train_loss": -6.971806526184082, "global_step": 167223, "epoch": 3981} {"train_loss": -7.163366317749023, "global_step": 167224, "epoch": 3981} {"train_loss": -6.984559059143066, "global_step": 167225, "epoch": 3981} {"train_loss": -6.938589572906494, "global_step": 167226, "epoch": 3981} {"train_loss": -6.987545013427734, "global_step": 167227, "epoch": 3981} {"train_loss": -7.026971817016602, "global_step": 167228, "epoch": 3981} {"train_loss": -7.135220050811768, "global_step": 167229, "epoch": 3981} {"train_loss": -7.042363166809082, "global_step": 167230, "epoch": 3981} {"train_loss": -7.072782516479492, "global_step": 167231, "epoch": 3981} {"train_loss": -6.9919209480285645, "global_step": 167232, "epoch": 3981} {"train_loss": -7.062259197235107, "global_step": 167233, "epoch": 3981} {"train_loss": -6.940681457519531, "global_step": 167234, "epoch": 3981} {"train_loss": -7.003066539764404, "global_step": 167235, "epoch": 3981} {"train_loss": -6.969212532043457, "global_step": 167236, "epoch": 3981} {"train_loss": -7.070230484008789, "global_step": 167237, "epoch": 3981} {"train_loss": -7.069908142089844, "global_step": 167238, "epoch": 3981} {"train_loss": -6.9030866622924805, "global_step": 167239, "epoch": 3981} {"train_loss": -7.150500297546387, "global_step": 167240, "epoch": 3981} {"train_loss": -6.99301815032959, "global_step": 167241, "epoch": 3981} {"train_loss": -6.982244491577148, "global_step": 167242, "epoch": 3981} {"train_loss": -7.025938737960089, "global_step": 167243, "epoch": 3981, "val_loss": 68950.0546875} {"train_loss": -7.079482078552246, "global_step": 167244, "epoch": 3982} {"train_loss": -7.010190963745117, "global_step": 167245, "epoch": 3982} {"train_loss": -7.029738426208496, "global_step": 167246, "epoch": 3982} {"train_loss": -7.07869815826416, "global_step": 167247, "epoch": 3982} {"train_loss": -6.892877578735352, "global_step": 167248, "epoch": 3982} {"train_loss": -7.108851432800293, "global_step": 167249, "epoch": 3982} {"train_loss": -7.133419990539551, "global_step": 167250, "epoch": 3982} {"train_loss": -7.082046985626221, "global_step": 167251, "epoch": 3982} {"train_loss": -7.005031585693359, "global_step": 167252, "epoch": 3982} {"train_loss": -6.891778469085693, "global_step": 167253, "epoch": 3982} {"train_loss": -7.148465156555176, "global_step": 167254, "epoch": 3982} {"train_loss": -6.990520477294922, "global_step": 167255, "epoch": 3982} {"train_loss": -7.030168533325195, "global_step": 167256, "epoch": 3982} {"train_loss": -7.011776924133301, "global_step": 167257, "epoch": 3982} {"train_loss": -6.965219020843506, "global_step": 167258, "epoch": 3982} {"train_loss": -7.1318793296813965, "global_step": 167259, "epoch": 3982} {"train_loss": -6.996827125549316, "global_step": 167260, "epoch": 3982} {"train_loss": -6.932840347290039, "global_step": 167261, "epoch": 3982} {"train_loss": -7.041705131530762, "global_step": 167262, "epoch": 3982} {"train_loss": -6.847803115844727, "global_step": 167263, "epoch": 3982} {"train_loss": -6.978816986083984, "global_step": 167264, "epoch": 3982} {"train_loss": -7.0088419914245605, "global_step": 167265, "epoch": 3982} {"train_loss": -7.107775688171387, "global_step": 167266, "epoch": 3982} {"train_loss": -7.095829486846924, "global_step": 167267, "epoch": 3982} {"train_loss": -6.946291923522949, "global_step": 167268, "epoch": 3982} {"train_loss": -7.080804347991943, "global_step": 167269, "epoch": 3982} {"train_loss": -6.997119903564453, "global_step": 167270, "epoch": 3982} {"train_loss": -6.962651252746582, "global_step": 167271, "epoch": 3982} {"train_loss": -6.998578071594238, "global_step": 167272, "epoch": 3982} {"train_loss": -7.062609672546387, "global_step": 167273, "epoch": 3982} {"train_loss": -7.054985046386719, "global_step": 167274, "epoch": 3982} {"train_loss": -7.031265735626221, "global_step": 167275, "epoch": 3982} {"train_loss": -7.152041912078857, "global_step": 167276, "epoch": 3982} {"train_loss": -6.97110652923584, "global_step": 167277, "epoch": 3982} {"train_loss": -7.0116987228393555, "global_step": 167278, "epoch": 3982} {"train_loss": -7.133575439453125, "global_step": 167279, "epoch": 3982} {"train_loss": -7.067379951477051, "global_step": 167280, "epoch": 3982} {"train_loss": -7.072244644165039, "global_step": 167281, "epoch": 3982} {"train_loss": -7.127518177032471, "global_step": 167282, "epoch": 3982} {"train_loss": -7.102634429931641, "global_step": 167283, "epoch": 3982} {"train_loss": -6.835504531860352, "global_step": 167284, "epoch": 3982} {"train_loss": -7.02806145804269, "global_step": 167285, "epoch": 3982, "val_loss": 69025.53125} {"train_loss": -7.063364028930664, "global_step": 167286, "epoch": 3983} {"train_loss": -7.010530471801758, "global_step": 167287, "epoch": 3983} {"train_loss": -7.00316047668457, "global_step": 167288, "epoch": 3983} {"train_loss": -6.90997314453125, "global_step": 167289, "epoch": 3983} {"train_loss": -7.056519508361816, "global_step": 167290, "epoch": 3983} {"train_loss": -7.02378511428833, "global_step": 167291, "epoch": 3983} {"train_loss": -6.97147798538208, "global_step": 167292, "epoch": 3983} {"train_loss": -7.040096282958984, "global_step": 167293, "epoch": 3983} {"train_loss": -6.974885940551758, "global_step": 167294, "epoch": 3983} {"train_loss": -6.820872783660889, "global_step": 167295, "epoch": 3983} {"train_loss": -6.905170440673828, "global_step": 167296, "epoch": 3983} {"train_loss": -6.95374870300293, "global_step": 167297, "epoch": 3983} {"train_loss": -6.800029277801514, "global_step": 167298, "epoch": 3983} {"train_loss": -6.8344011306762695, "global_step": 167299, "epoch": 3983} {"train_loss": -7.00612735748291, "global_step": 167300, "epoch": 3983} {"train_loss": -6.8114213943481445, "global_step": 167301, "epoch": 3983} {"train_loss": -6.970834732055664, "global_step": 167302, "epoch": 3983} {"train_loss": -6.694191932678223, "global_step": 167303, "epoch": 3983} {"train_loss": -6.901108741760254, "global_step": 167304, "epoch": 3983} {"train_loss": -6.95371150970459, "global_step": 167305, "epoch": 3983} {"train_loss": -7.026162147521973, "global_step": 167306, "epoch": 3983} {"train_loss": -6.973782539367676, "global_step": 167307, "epoch": 3983} {"train_loss": -6.931574821472168, "global_step": 167308, "epoch": 3983} {"train_loss": -6.899117946624756, "global_step": 167309, "epoch": 3983} {"train_loss": -6.949378967285156, "global_step": 167310, "epoch": 3983} {"train_loss": -6.981127738952637, "global_step": 167311, "epoch": 3983} {"train_loss": -6.980161190032959, "global_step": 167312, "epoch": 3983} {"train_loss": -6.944967269897461, "global_step": 167313, "epoch": 3983} {"train_loss": -6.835233688354492, "global_step": 167314, "epoch": 3983} {"train_loss": -6.917678356170654, "global_step": 167315, "epoch": 3983} {"train_loss": -6.985915660858154, "global_step": 167316, "epoch": 3983} {"train_loss": -6.9121012687683105, "global_step": 167317, "epoch": 3983} {"train_loss": -7.0692138671875, "global_step": 167318, "epoch": 3983} {"train_loss": -6.910373210906982, "global_step": 167319, "epoch": 3983} {"train_loss": -6.795724868774414, "global_step": 167320, "epoch": 3983} {"train_loss": -7.025722980499268, "global_step": 167321, "epoch": 3983} {"train_loss": -6.723802089691162, "global_step": 167322, "epoch": 3983} {"train_loss": -6.9202775955200195, "global_step": 167323, "epoch": 3983} {"train_loss": -7.030012607574463, "global_step": 167324, "epoch": 3983} {"train_loss": -6.870728969573975, "global_step": 167325, "epoch": 3983} {"train_loss": -6.994440078735352, "global_step": 167326, "epoch": 3983} {"train_loss": -6.93513298034668, "global_step": 167327, "epoch": 3983, "val_loss": 68986.3125} {"train_loss": -6.92325496673584, "global_step": 167328, "epoch": 3984} {"train_loss": -7.012213706970215, "global_step": 167329, "epoch": 3984} {"train_loss": -6.8469390869140625, "global_step": 167330, "epoch": 3984} {"train_loss": -6.94976806640625, "global_step": 167331, "epoch": 3984} {"train_loss": -6.928230285644531, "global_step": 167332, "epoch": 3984} {"train_loss": -6.91642427444458, "global_step": 167333, "epoch": 3984} {"train_loss": -6.826155185699463, "global_step": 167334, "epoch": 3984} {"train_loss": -6.880353927612305, "global_step": 167335, "epoch": 3984} {"train_loss": -6.796222686767578, "global_step": 167336, "epoch": 3984} {"train_loss": -6.984683036804199, "global_step": 167337, "epoch": 3984} {"train_loss": -6.966750144958496, "global_step": 167338, "epoch": 3984} {"train_loss": -6.908162593841553, "global_step": 167339, "epoch": 3984} {"train_loss": -6.879485130310059, "global_step": 167340, "epoch": 3984} {"train_loss": -6.9131646156311035, "global_step": 167341, "epoch": 3984} {"train_loss": -7.047871112823486, "global_step": 167342, "epoch": 3984} {"train_loss": -6.964146614074707, "global_step": 167343, "epoch": 3984} {"train_loss": -6.874872207641602, "global_step": 167344, "epoch": 3984} {"train_loss": -6.902823448181152, "global_step": 167345, "epoch": 3984} {"train_loss": -6.960262775421143, "global_step": 167346, "epoch": 3984} {"train_loss": -7.020885467529297, "global_step": 167347, "epoch": 3984} {"train_loss": -6.923469543457031, "global_step": 167348, "epoch": 3984} {"train_loss": -6.853133201599121, "global_step": 167349, "epoch": 3984} {"train_loss": -6.944059371948242, "global_step": 167350, "epoch": 3984} {"train_loss": -6.921596527099609, "global_step": 167351, "epoch": 3984} {"train_loss": -6.9849853515625, "global_step": 167352, "epoch": 3984} {"train_loss": -6.950104713439941, "global_step": 167353, "epoch": 3984} {"train_loss": -6.919085502624512, "global_step": 167354, "epoch": 3984} {"train_loss": -7.006947994232178, "global_step": 167355, "epoch": 3984} {"train_loss": -6.9979400634765625, "global_step": 167356, "epoch": 3984} {"train_loss": -7.021275520324707, "global_step": 167357, "epoch": 3984} {"train_loss": -6.902654647827148, "global_step": 167358, "epoch": 3984} {"train_loss": -7.064120292663574, "global_step": 167359, "epoch": 3984} {"train_loss": -6.944980621337891, "global_step": 167360, "epoch": 3984} {"train_loss": -7.044390678405762, "global_step": 167361, "epoch": 3984} {"train_loss": -6.900545120239258, "global_step": 167362, "epoch": 3984} {"train_loss": -7.026839733123779, "global_step": 167363, "epoch": 3984} {"train_loss": -7.087294578552246, "global_step": 167364, "epoch": 3984} {"train_loss": -6.894550800323486, "global_step": 167365, "epoch": 3984} {"train_loss": -7.043699264526367, "global_step": 167366, "epoch": 3984} {"train_loss": -6.9553399085998535, "global_step": 167367, "epoch": 3984} {"train_loss": -7.083799362182617, "global_step": 167368, "epoch": 3984} {"train_loss": -6.9495238690149215, "global_step": 167369, "epoch": 3984, "val_loss": 68903.1015625} {"train_loss": -7.017126083374023, "global_step": 167370, "epoch": 3985} {"train_loss": -6.998869895935059, "global_step": 167371, "epoch": 3985} {"train_loss": -6.955183982849121, "global_step": 167372, "epoch": 3985} {"train_loss": -6.986340522766113, "global_step": 167373, "epoch": 3985} {"train_loss": -7.006034851074219, "global_step": 167374, "epoch": 3985} {"train_loss": -7.0502119064331055, "global_step": 167375, "epoch": 3985} {"train_loss": -7.032975196838379, "global_step": 167376, "epoch": 3985} {"train_loss": -6.873347282409668, "global_step": 167377, "epoch": 3985} {"train_loss": -7.099384784698486, "global_step": 167378, "epoch": 3985} {"train_loss": -6.986759662628174, "global_step": 167379, "epoch": 3985} {"train_loss": -7.178215980529785, "global_step": 167380, "epoch": 3985} {"train_loss": -6.798642158508301, "global_step": 167381, "epoch": 3985} {"train_loss": -7.085330009460449, "global_step": 167382, "epoch": 3985} {"train_loss": -7.0703535079956055, "global_step": 167383, "epoch": 3985} {"train_loss": -7.050294876098633, "global_step": 167384, "epoch": 3985} {"train_loss": -7.043817043304443, "global_step": 167385, "epoch": 3985} {"train_loss": -6.992180347442627, "global_step": 167386, "epoch": 3985} {"train_loss": -7.146981239318848, "global_step": 167387, "epoch": 3985} {"train_loss": -6.944492340087891, "global_step": 167388, "epoch": 3985} {"train_loss": -7.113431930541992, "global_step": 167389, "epoch": 3985} {"train_loss": -7.027692794799805, "global_step": 167390, "epoch": 3985} {"train_loss": -7.0742998123168945, "global_step": 167391, "epoch": 3985} {"train_loss": -7.002590179443359, "global_step": 167392, "epoch": 3985} {"train_loss": -6.98704719543457, "global_step": 167393, "epoch": 3985} {"train_loss": -7.031241416931152, "global_step": 167394, "epoch": 3985} {"train_loss": -7.074405670166016, "global_step": 167395, "epoch": 3985} {"train_loss": -7.048471450805664, "global_step": 167396, "epoch": 3985} {"train_loss": -7.073059558868408, "global_step": 167397, "epoch": 3985} {"train_loss": -7.193398475646973, "global_step": 167398, "epoch": 3985} {"train_loss": -7.0711469650268555, "global_step": 167399, "epoch": 3985} {"train_loss": -7.123355388641357, "global_step": 167400, "epoch": 3985} {"train_loss": -7.042340278625488, "global_step": 167401, "epoch": 3985} {"train_loss": -7.0677490234375, "global_step": 167402, "epoch": 3985} {"train_loss": -7.074893474578857, "global_step": 167403, "epoch": 3985} {"train_loss": -7.104105472564697, "global_step": 167404, "epoch": 3985} {"train_loss": -6.969974040985107, "global_step": 167405, "epoch": 3985} {"train_loss": -6.9927544593811035, "global_step": 167406, "epoch": 3985} {"train_loss": -6.994953632354736, "global_step": 167407, "epoch": 3985} {"train_loss": -7.031002998352051, "global_step": 167408, "epoch": 3985} {"train_loss": -7.0460405349731445, "global_step": 167409, "epoch": 3985} {"train_loss": -7.047917366027832, "global_step": 167410, "epoch": 3985} {"train_loss": -7.036279258273897, "global_step": 167411, "epoch": 3985, "val_loss": 68978.0078125} {"train_loss": -7.054288864135742, "global_step": 167412, "epoch": 3986} {"train_loss": -7.016411781311035, "global_step": 167413, "epoch": 3986} {"train_loss": -6.913461208343506, "global_step": 167414, "epoch": 3986} {"train_loss": -7.037330627441406, "global_step": 167415, "epoch": 3986} {"train_loss": -6.998822212219238, "global_step": 167416, "epoch": 3986} {"train_loss": -7.046436309814453, "global_step": 167417, "epoch": 3986} {"train_loss": -7.047987461090088, "global_step": 167418, "epoch": 3986} {"train_loss": -7.092252254486084, "global_step": 167419, "epoch": 3986} {"train_loss": -6.991540908813477, "global_step": 167420, "epoch": 3986} {"train_loss": -7.048212051391602, "global_step": 167421, "epoch": 3986} {"train_loss": -6.862785816192627, "global_step": 167422, "epoch": 3986} {"train_loss": -7.050428867340088, "global_step": 167423, "epoch": 3986} {"train_loss": -7.119173526763916, "global_step": 167424, "epoch": 3986} {"train_loss": -7.154547691345215, "global_step": 167425, "epoch": 3986} {"train_loss": -7.075082778930664, "global_step": 167426, "epoch": 3986} {"train_loss": -6.99654483795166, "global_step": 167427, "epoch": 3986} {"train_loss": -7.020041465759277, "global_step": 167428, "epoch": 3986} {"train_loss": -6.990896701812744, "global_step": 167429, "epoch": 3986} {"train_loss": -6.833744049072266, "global_step": 167430, "epoch": 3986} {"train_loss": -6.937349319458008, "global_step": 167431, "epoch": 3986} {"train_loss": -7.06198787689209, "global_step": 167432, "epoch": 3986} {"train_loss": -6.897266387939453, "global_step": 167433, "epoch": 3986} {"train_loss": -6.942000389099121, "global_step": 167434, "epoch": 3986} {"train_loss": -7.006340026855469, "global_step": 167435, "epoch": 3986} {"train_loss": -6.99445104598999, "global_step": 167436, "epoch": 3986} {"train_loss": -6.946600914001465, "global_step": 167437, "epoch": 3986} {"train_loss": -6.91950798034668, "global_step": 167438, "epoch": 3986} {"train_loss": -6.741677761077881, "global_step": 167439, "epoch": 3986} {"train_loss": -6.903592109680176, "global_step": 167440, "epoch": 3986} {"train_loss": -6.917698860168457, "global_step": 167441, "epoch": 3986} {"train_loss": -6.850655555725098, "global_step": 167442, "epoch": 3986} {"train_loss": -6.86702823638916, "global_step": 167443, "epoch": 3986} {"train_loss": -6.8809814453125, "global_step": 167444, "epoch": 3986} {"train_loss": -6.956776142120361, "global_step": 167445, "epoch": 3986} {"train_loss": -6.933521270751953, "global_step": 167446, "epoch": 3986} {"train_loss": -7.004315376281738, "global_step": 167447, "epoch": 3986} {"train_loss": -6.893301486968994, "global_step": 167448, "epoch": 3986} {"train_loss": -6.929269313812256, "global_step": 167449, "epoch": 3986} {"train_loss": -6.905196666717529, "global_step": 167450, "epoch": 3986} {"train_loss": -6.9156413078308105, "global_step": 167451, "epoch": 3986} {"train_loss": -7.016956806182861, "global_step": 167452, "epoch": 3986} {"train_loss": -6.970517771584647, "global_step": 167453, "epoch": 3986, "val_loss": 68881.859375} {"train_loss": -6.886332988739014, "global_step": 167454, "epoch": 3987} {"train_loss": -6.87012243270874, "global_step": 167455, "epoch": 3987} {"train_loss": -6.9088897705078125, "global_step": 167456, "epoch": 3987} {"train_loss": -6.761538505554199, "global_step": 167457, "epoch": 3987} {"train_loss": -6.951686859130859, "global_step": 167458, "epoch": 3987} {"train_loss": -6.913119316101074, "global_step": 167459, "epoch": 3987} {"train_loss": -6.694253921508789, "global_step": 167460, "epoch": 3987} {"train_loss": -6.951525688171387, "global_step": 167461, "epoch": 3987} {"train_loss": -6.8128509521484375, "global_step": 167462, "epoch": 3987} {"train_loss": -6.869865417480469, "global_step": 167463, "epoch": 3987} {"train_loss": -6.979293346405029, "global_step": 167464, "epoch": 3987} {"train_loss": -6.782557487487793, "global_step": 167465, "epoch": 3987} {"train_loss": -6.933455944061279, "global_step": 167466, "epoch": 3987} {"train_loss": -7.055362701416016, "global_step": 167467, "epoch": 3987} {"train_loss": -6.892792224884033, "global_step": 167468, "epoch": 3987} {"train_loss": -6.9581403732299805, "global_step": 167469, "epoch": 3987} {"train_loss": -7.005704879760742, "global_step": 167470, "epoch": 3987} {"train_loss": -7.021148681640625, "global_step": 167471, "epoch": 3987} {"train_loss": -6.901659965515137, "global_step": 167472, "epoch": 3987} {"train_loss": -6.965618133544922, "global_step": 167473, "epoch": 3987} {"train_loss": -6.927065849304199, "global_step": 167474, "epoch": 3987} {"train_loss": -6.997438430786133, "global_step": 167475, "epoch": 3987} {"train_loss": -7.0486860275268555, "global_step": 167476, "epoch": 3987} {"train_loss": -7.045395374298096, "global_step": 167477, "epoch": 3987} {"train_loss": -7.099088191986084, "global_step": 167478, "epoch": 3987} {"train_loss": -7.033818244934082, "global_step": 167479, "epoch": 3987} {"train_loss": -7.034293174743652, "global_step": 167480, "epoch": 3987} {"train_loss": -7.1285176277160645, "global_step": 167481, "epoch": 3987} {"train_loss": -7.057270050048828, "global_step": 167482, "epoch": 3987} {"train_loss": -7.0694732666015625, "global_step": 167483, "epoch": 3987} {"train_loss": -7.027588844299316, "global_step": 167484, "epoch": 3987} {"train_loss": -7.0189666748046875, "global_step": 167485, "epoch": 3987} {"train_loss": -7.072091579437256, "global_step": 167486, "epoch": 3987} {"train_loss": -6.964223384857178, "global_step": 167487, "epoch": 3987} {"train_loss": -7.212431907653809, "global_step": 167488, "epoch": 3987} {"train_loss": -7.130142688751221, "global_step": 167489, "epoch": 3987} {"train_loss": -6.904081344604492, "global_step": 167490, "epoch": 3987} {"train_loss": -6.9933271408081055, "global_step": 167491, "epoch": 3987} {"train_loss": -7.082622528076172, "global_step": 167492, "epoch": 3987} {"train_loss": -6.9154205322265625, "global_step": 167493, "epoch": 3987} {"train_loss": -7.006345272064209, "global_step": 167494, "epoch": 3987} {"train_loss": -6.9727390720730735, "global_step": 167495, "epoch": 3987, "val_loss": 68956.75} {"train_loss": -7.055710792541504, "global_step": 167496, "epoch": 3988} {"train_loss": -6.949759483337402, "global_step": 167497, "epoch": 3988} {"train_loss": -7.0249128341674805, "global_step": 167498, "epoch": 3988} {"train_loss": -7.145476341247559, "global_step": 167499, "epoch": 3988} {"train_loss": -7.098734378814697, "global_step": 167500, "epoch": 3988} {"train_loss": -7.004034042358398, "global_step": 167501, "epoch": 3988} {"train_loss": -6.99892520904541, "global_step": 167502, "epoch": 3988} {"train_loss": -6.992701530456543, "global_step": 167503, "epoch": 3988} {"train_loss": -7.024028301239014, "global_step": 167504, "epoch": 3988} {"train_loss": -7.0958251953125, "global_step": 167505, "epoch": 3988} {"train_loss": -6.959868907928467, "global_step": 167506, "epoch": 3988} {"train_loss": -7.096598148345947, "global_step": 167507, "epoch": 3988} {"train_loss": -7.048774719238281, "global_step": 167508, "epoch": 3988} {"train_loss": -6.963594913482666, "global_step": 167509, "epoch": 3988} {"train_loss": -7.186568260192871, "global_step": 167510, "epoch": 3988} {"train_loss": -7.006157398223877, "global_step": 167511, "epoch": 3988} {"train_loss": -6.989384651184082, "global_step": 167512, "epoch": 3988} {"train_loss": -7.04829216003418, "global_step": 167513, "epoch": 3988} {"train_loss": -7.026390552520752, "global_step": 167514, "epoch": 3988} {"train_loss": -6.877371311187744, "global_step": 167515, "epoch": 3988} {"train_loss": -7.055087089538574, "global_step": 167516, "epoch": 3988} {"train_loss": -6.959927082061768, "global_step": 167517, "epoch": 3988} {"train_loss": -6.875995635986328, "global_step": 167518, "epoch": 3988} {"train_loss": -7.09441614151001, "global_step": 167519, "epoch": 3988} {"train_loss": -6.89710807800293, "global_step": 167520, "epoch": 3988} {"train_loss": -6.9439520835876465, "global_step": 167521, "epoch": 3988} {"train_loss": -6.913227081298828, "global_step": 167522, "epoch": 3988} {"train_loss": -6.966202735900879, "global_step": 167523, "epoch": 3988} {"train_loss": -6.900522232055664, "global_step": 167524, "epoch": 3988} {"train_loss": -7.082907199859619, "global_step": 167525, "epoch": 3988} {"train_loss": -6.950915336608887, "global_step": 167526, "epoch": 3988} {"train_loss": -6.983806610107422, "global_step": 167527, "epoch": 3988} {"train_loss": -7.018529415130615, "global_step": 167528, "epoch": 3988} {"train_loss": -7.039220809936523, "global_step": 167529, "epoch": 3988} {"train_loss": -6.986275672912598, "global_step": 167530, "epoch": 3988} {"train_loss": -6.99513578414917, "global_step": 167531, "epoch": 3988} {"train_loss": -6.906933784484863, "global_step": 167532, "epoch": 3988} {"train_loss": -7.004621505737305, "global_step": 167533, "epoch": 3988} {"train_loss": -6.8896942138671875, "global_step": 167534, "epoch": 3988} {"train_loss": -6.982217788696289, "global_step": 167535, "epoch": 3988} {"train_loss": -6.911913871765137, "global_step": 167536, "epoch": 3988} {"train_loss": -6.997914439155942, "global_step": 167537, "epoch": 3988, "val_loss": 69080.3359375} {"train_loss": -6.875204563140869, "global_step": 167538, "epoch": 3989} {"train_loss": -6.934831619262695, "global_step": 167539, "epoch": 3989} {"train_loss": -6.913850784301758, "global_step": 167540, "epoch": 3989} {"train_loss": -6.843654632568359, "global_step": 167541, "epoch": 3989} {"train_loss": -7.007370948791504, "global_step": 167542, "epoch": 3989} {"train_loss": -7.19970703125, "global_step": 167543, "epoch": 3989} {"train_loss": -6.908092498779297, "global_step": 167544, "epoch": 3989} {"train_loss": -6.8620500564575195, "global_step": 167545, "epoch": 3989} {"train_loss": -6.981685638427734, "global_step": 167546, "epoch": 3989} {"train_loss": -6.839833736419678, "global_step": 167547, "epoch": 3989} {"train_loss": -6.907251358032227, "global_step": 167548, "epoch": 3989} {"train_loss": -7.00464391708374, "global_step": 167549, "epoch": 3989} {"train_loss": -6.88356876373291, "global_step": 167550, "epoch": 3989} {"train_loss": -6.895222187042236, "global_step": 167551, "epoch": 3989} {"train_loss": -6.906290054321289, "global_step": 167552, "epoch": 3989} {"train_loss": -6.821312427520752, "global_step": 167553, "epoch": 3989} {"train_loss": -6.918510913848877, "global_step": 167554, "epoch": 3989} {"train_loss": -6.874393463134766, "global_step": 167555, "epoch": 3989} {"train_loss": -7.010032653808594, "global_step": 167556, "epoch": 3989} {"train_loss": -6.892309665679932, "global_step": 167557, "epoch": 3989} {"train_loss": -7.059759140014648, "global_step": 167558, "epoch": 3989} {"train_loss": -6.948246479034424, "global_step": 167559, "epoch": 3989} {"train_loss": -7.017289161682129, "global_step": 167560, "epoch": 3989} {"train_loss": -6.853603839874268, "global_step": 167561, "epoch": 3989} {"train_loss": -6.8999834060668945, "global_step": 167562, "epoch": 3989} {"train_loss": -6.972587585449219, "global_step": 167563, "epoch": 3989} {"train_loss": -6.854438781738281, "global_step": 167564, "epoch": 3989} {"train_loss": -6.987854957580566, "global_step": 167565, "epoch": 3989} {"train_loss": -6.9518280029296875, "global_step": 167566, "epoch": 3989} {"train_loss": -6.8928141593933105, "global_step": 167567, "epoch": 3989} {"train_loss": -6.972810745239258, "global_step": 167568, "epoch": 3989} {"train_loss": -6.916072368621826, "global_step": 167569, "epoch": 3989} {"train_loss": -7.043917655944824, "global_step": 167570, "epoch": 3989} {"train_loss": -6.951898574829102, "global_step": 167571, "epoch": 3989} {"train_loss": -6.933645248413086, "global_step": 167572, "epoch": 3989} {"train_loss": -7.085317611694336, "global_step": 167573, "epoch": 3989} {"train_loss": -6.952272891998291, "global_step": 167574, "epoch": 3989} {"train_loss": -6.966958522796631, "global_step": 167575, "epoch": 3989} {"train_loss": -7.0223894119262695, "global_step": 167576, "epoch": 3989} {"train_loss": -7.0713605880737305, "global_step": 167577, "epoch": 3989} {"train_loss": -7.0116705894470215, "global_step": 167578, "epoch": 3989} {"train_loss": -6.95158364659264, "global_step": 167579, "epoch": 3989, "val_loss": 68985.9375} {"train_loss": -6.987564563751221, "global_step": 167580, "epoch": 3990} {"train_loss": -7.168183326721191, "global_step": 167581, "epoch": 3990} {"train_loss": -7.014763832092285, "global_step": 167582, "epoch": 3990} {"train_loss": -7.040559768676758, "global_step": 167583, "epoch": 3990} {"train_loss": -7.044953346252441, "global_step": 167584, "epoch": 3990} {"train_loss": -6.93528413772583, "global_step": 167585, "epoch": 3990} {"train_loss": -6.930879592895508, "global_step": 167586, "epoch": 3990} {"train_loss": -6.895015239715576, "global_step": 167587, "epoch": 3990} {"train_loss": -7.00672721862793, "global_step": 167588, "epoch": 3990} {"train_loss": -7.066054344177246, "global_step": 167589, "epoch": 3990} {"train_loss": -7.068948745727539, "global_step": 167590, "epoch": 3990} {"train_loss": -7.0643839836120605, "global_step": 167591, "epoch": 3990} {"train_loss": -6.980354309082031, "global_step": 167592, "epoch": 3990} {"train_loss": -6.849701881408691, "global_step": 167593, "epoch": 3990} {"train_loss": -7.013798713684082, "global_step": 167594, "epoch": 3990} {"train_loss": -6.944981575012207, "global_step": 167595, "epoch": 3990} {"train_loss": -7.027753829956055, "global_step": 167596, "epoch": 3990} {"train_loss": -6.946717262268066, "global_step": 167597, "epoch": 3990} {"train_loss": -6.989801406860352, "global_step": 167598, "epoch": 3990} {"train_loss": -7.008822917938232, "global_step": 167599, "epoch": 3990} {"train_loss": -6.853611946105957, "global_step": 167600, "epoch": 3990} {"train_loss": -6.9369797706604, "global_step": 167601, "epoch": 3990} {"train_loss": -6.958916664123535, "global_step": 167602, "epoch": 3990} {"train_loss": -7.033703327178955, "global_step": 167603, "epoch": 3990} {"train_loss": -6.940526962280273, "global_step": 167604, "epoch": 3990} {"train_loss": -6.897308349609375, "global_step": 167605, "epoch": 3990} {"train_loss": -6.921273231506348, "global_step": 167606, "epoch": 3990} {"train_loss": -6.964818954467773, "global_step": 167607, "epoch": 3990} {"train_loss": -6.963912010192871, "global_step": 167608, "epoch": 3990} {"train_loss": -7.039444446563721, "global_step": 167609, "epoch": 3990} {"train_loss": -7.004900932312012, "global_step": 167610, "epoch": 3990} {"train_loss": -7.033644199371338, "global_step": 167611, "epoch": 3990} {"train_loss": -6.936973571777344, "global_step": 167612, "epoch": 3990} {"train_loss": -6.931357383728027, "global_step": 167613, "epoch": 3990} {"train_loss": -6.92965030670166, "global_step": 167614, "epoch": 3990} {"train_loss": -6.868373870849609, "global_step": 167615, "epoch": 3990} {"train_loss": -7.034905433654785, "global_step": 167616, "epoch": 3990} {"train_loss": -6.966165542602539, "global_step": 167617, "epoch": 3990} {"train_loss": -7.041325569152832, "global_step": 167618, "epoch": 3990} {"train_loss": -7.061713218688965, "global_step": 167619, "epoch": 3990} {"train_loss": -6.976480484008789, "global_step": 167620, "epoch": 3990} {"train_loss": -6.982162407466343, "global_step": 167621, "epoch": 3990, "val_loss": 68933.9921875} {"train_loss": -7.067643642425537, "global_step": 167622, "epoch": 3991} {"train_loss": -7.001454830169678, "global_step": 167623, "epoch": 3991} {"train_loss": -7.070087432861328, "global_step": 167624, "epoch": 3991} {"train_loss": -6.934014320373535, "global_step": 167625, "epoch": 3991} {"train_loss": -6.926854133605957, "global_step": 167626, "epoch": 3991} {"train_loss": -6.949790000915527, "global_step": 167627, "epoch": 3991} {"train_loss": -7.088720321655273, "global_step": 167628, "epoch": 3991} {"train_loss": -7.009710311889648, "global_step": 167629, "epoch": 3991} {"train_loss": -6.881247043609619, "global_step": 167630, "epoch": 3991} {"train_loss": -7.02805233001709, "global_step": 167631, "epoch": 3991} {"train_loss": -7.060516357421875, "global_step": 167632, "epoch": 3991} {"train_loss": -7.026654243469238, "global_step": 167633, "epoch": 3991} {"train_loss": -7.005606651306152, "global_step": 167634, "epoch": 3991} {"train_loss": -7.053354740142822, "global_step": 167635, "epoch": 3991} {"train_loss": -6.870951175689697, "global_step": 167636, "epoch": 3991} {"train_loss": -7.02097749710083, "global_step": 167637, "epoch": 3991} {"train_loss": -7.007144927978516, "global_step": 167638, "epoch": 3991} {"train_loss": -7.117216110229492, "global_step": 167639, "epoch": 3991} {"train_loss": -7.030806064605713, "global_step": 167640, "epoch": 3991} {"train_loss": -7.03046989440918, "global_step": 167641, "epoch": 3991} {"train_loss": -7.050516605377197, "global_step": 167642, "epoch": 3991} {"train_loss": -6.940777778625488, "global_step": 167643, "epoch": 3991} {"train_loss": -7.161966800689697, "global_step": 167644, "epoch": 3991} {"train_loss": -7.048026084899902, "global_step": 167645, "epoch": 3991} {"train_loss": -6.949593544006348, "global_step": 167646, "epoch": 3991} {"train_loss": -7.120753765106201, "global_step": 167647, "epoch": 3991} {"train_loss": -7.014278411865234, "global_step": 167648, "epoch": 3991} {"train_loss": -6.946547508239746, "global_step": 167649, "epoch": 3991} {"train_loss": -6.983092308044434, "global_step": 167650, "epoch": 3991} {"train_loss": -7.033830165863037, "global_step": 167651, "epoch": 3991} {"train_loss": -7.022717475891113, "global_step": 167652, "epoch": 3991} {"train_loss": -7.057678699493408, "global_step": 167653, "epoch": 3991} {"train_loss": -7.0509819984436035, "global_step": 167654, "epoch": 3991} {"train_loss": -6.987329483032227, "global_step": 167655, "epoch": 3991} {"train_loss": -6.948829174041748, "global_step": 167656, "epoch": 3991} {"train_loss": -7.035149574279785, "global_step": 167657, "epoch": 3991} {"train_loss": -6.969738483428955, "global_step": 167658, "epoch": 3991} {"train_loss": -7.09401273727417, "global_step": 167659, "epoch": 3991} {"train_loss": -7.029191970825195, "global_step": 167660, "epoch": 3991} {"train_loss": -6.8365678787231445, "global_step": 167661, "epoch": 3991} {"train_loss": -6.923013687133789, "global_step": 167662, "epoch": 3991} {"train_loss": -7.006709462120419, "global_step": 167663, "epoch": 3991, "val_loss": 68878.4765625} {"train_loss": -6.8432793617248535, "global_step": 167664, "epoch": 3992} {"train_loss": -7.044200897216797, "global_step": 167665, "epoch": 3992} {"train_loss": -6.964766502380371, "global_step": 167666, "epoch": 3992} {"train_loss": -7.014695167541504, "global_step": 167667, "epoch": 3992} {"train_loss": -6.822293281555176, "global_step": 167668, "epoch": 3992} {"train_loss": -6.929271697998047, "global_step": 167669, "epoch": 3992} {"train_loss": -7.023853778839111, "global_step": 167670, "epoch": 3992} {"train_loss": -6.797158241271973, "global_step": 167671, "epoch": 3992} {"train_loss": -7.07255744934082, "global_step": 167672, "epoch": 3992} {"train_loss": -6.929779529571533, "global_step": 167673, "epoch": 3992} {"train_loss": -6.960500717163086, "global_step": 167674, "epoch": 3992} {"train_loss": -7.06108283996582, "global_step": 167675, "epoch": 3992} {"train_loss": -6.843160629272461, "global_step": 167676, "epoch": 3992} {"train_loss": -6.974345684051514, "global_step": 167677, "epoch": 3992} {"train_loss": -6.9656171798706055, "global_step": 167678, "epoch": 3992} {"train_loss": -7.04259729385376, "global_step": 167679, "epoch": 3992} {"train_loss": -6.973433017730713, "global_step": 167680, "epoch": 3992} {"train_loss": -6.995753288269043, "global_step": 167681, "epoch": 3992} {"train_loss": -7.08158540725708, "global_step": 167682, "epoch": 3992} {"train_loss": -6.939303874969482, "global_step": 167683, "epoch": 3992} {"train_loss": -6.996247291564941, "global_step": 167684, "epoch": 3992} {"train_loss": -7.0484209060668945, "global_step": 167685, "epoch": 3992} {"train_loss": -7.047981262207031, "global_step": 167686, "epoch": 3992} {"train_loss": -7.062270164489746, "global_step": 167687, "epoch": 3992} {"train_loss": -6.957234859466553, "global_step": 167688, "epoch": 3992} {"train_loss": -7.059256553649902, "global_step": 167689, "epoch": 3992} {"train_loss": -7.067885875701904, "global_step": 167690, "epoch": 3992} {"train_loss": -7.006841659545898, "global_step": 167691, "epoch": 3992} {"train_loss": -7.081554412841797, "global_step": 167692, "epoch": 3992} {"train_loss": -6.949583530426025, "global_step": 167693, "epoch": 3992} {"train_loss": -6.984445095062256, "global_step": 167694, "epoch": 3992} {"train_loss": -7.064153671264648, "global_step": 167695, "epoch": 3992} {"train_loss": -6.839550018310547, "global_step": 167696, "epoch": 3992} {"train_loss": -7.11715030670166, "global_step": 167697, "epoch": 3992} {"train_loss": -6.990504264831543, "global_step": 167698, "epoch": 3992} {"train_loss": -7.09657096862793, "global_step": 167699, "epoch": 3992} {"train_loss": -7.052068710327148, "global_step": 167700, "epoch": 3992} {"train_loss": -6.927257537841797, "global_step": 167701, "epoch": 3992} {"train_loss": -7.1211442947387695, "global_step": 167702, "epoch": 3992} {"train_loss": -7.081311225891113, "global_step": 167703, "epoch": 3992} {"train_loss": -7.092413902282715, "global_step": 167704, "epoch": 3992} {"train_loss": -6.998417377471924, "global_step": 167705, "epoch": 3992, "val_loss": 68771.5859375} {"train_loss": -7.064373970031738, "global_step": 167706, "epoch": 3993} {"train_loss": -7.012470245361328, "global_step": 167707, "epoch": 3993} {"train_loss": -6.985875129699707, "global_step": 167708, "epoch": 3993} {"train_loss": -6.827330589294434, "global_step": 167709, "epoch": 3993} {"train_loss": -7.108887672424316, "global_step": 167710, "epoch": 3993} {"train_loss": -6.99832010269165, "global_step": 167711, "epoch": 3993} {"train_loss": -6.950936317443848, "global_step": 167712, "epoch": 3993} {"train_loss": -6.999820232391357, "global_step": 167713, "epoch": 3993} {"train_loss": -6.694047927856445, "global_step": 167714, "epoch": 3993} {"train_loss": -7.081390380859375, "global_step": 167715, "epoch": 3993} {"train_loss": -6.989371299743652, "global_step": 167716, "epoch": 3993} {"train_loss": -6.987142562866211, "global_step": 167717, "epoch": 3993} {"train_loss": -6.9898552894592285, "global_step": 167718, "epoch": 3993} {"train_loss": -6.9403581619262695, "global_step": 167719, "epoch": 3993} {"train_loss": -6.935781955718994, "global_step": 167720, "epoch": 3993} {"train_loss": -7.012927055358887, "global_step": 167721, "epoch": 3993} {"train_loss": -7.036005973815918, "global_step": 167722, "epoch": 3993} {"train_loss": -6.966640472412109, "global_step": 167723, "epoch": 3993} {"train_loss": -6.957676887512207, "global_step": 167724, "epoch": 3993} {"train_loss": -6.947906494140625, "global_step": 167725, "epoch": 3993} {"train_loss": -7.023556709289551, "global_step": 167726, "epoch": 3993} {"train_loss": -7.095302581787109, "global_step": 167727, "epoch": 3993} {"train_loss": -6.932855606079102, "global_step": 167728, "epoch": 3993} {"train_loss": -7.083439350128174, "global_step": 167729, "epoch": 3993} {"train_loss": -7.107798099517822, "global_step": 167730, "epoch": 3993} {"train_loss": -7.02610445022583, "global_step": 167731, "epoch": 3993} {"train_loss": -7.099318981170654, "global_step": 167732, "epoch": 3993} {"train_loss": -7.0479230880737305, "global_step": 167733, "epoch": 3993} {"train_loss": -7.134490013122559, "global_step": 167734, "epoch": 3993} {"train_loss": -7.043756008148193, "global_step": 167735, "epoch": 3993} {"train_loss": -7.082627296447754, "global_step": 167736, "epoch": 3993} {"train_loss": -6.9744768142700195, "global_step": 167737, "epoch": 3993} {"train_loss": -7.062578201293945, "global_step": 167738, "epoch": 3993} {"train_loss": -7.04625129699707, "global_step": 167739, "epoch": 3993} {"train_loss": -6.940986633300781, "global_step": 167740, "epoch": 3993} {"train_loss": -7.009321212768555, "global_step": 167741, "epoch": 3993} {"train_loss": -6.998554229736328, "global_step": 167742, "epoch": 3993} {"train_loss": -6.988716125488281, "global_step": 167743, "epoch": 3993} {"train_loss": -7.118769645690918, "global_step": 167744, "epoch": 3993} {"train_loss": -7.055992126464844, "global_step": 167745, "epoch": 3993} {"train_loss": -6.927188873291016, "global_step": 167746, "epoch": 3993} {"train_loss": -7.009215059734526, "global_step": 167747, "epoch": 3993, "val_loss": 68814.0859375} {"train_loss": -6.88668155670166, "global_step": 167748, "epoch": 3994} {"train_loss": -7.045209884643555, "global_step": 167749, "epoch": 3994} {"train_loss": -6.928155422210693, "global_step": 167750, "epoch": 3994} {"train_loss": -6.947564125061035, "global_step": 167751, "epoch": 3994} {"train_loss": -6.995207786560059, "global_step": 167752, "epoch": 3994} {"train_loss": -6.972919940948486, "global_step": 167753, "epoch": 3994} {"train_loss": -6.936491012573242, "global_step": 167754, "epoch": 3994} {"train_loss": -6.8676652908325195, "global_step": 167755, "epoch": 3994} {"train_loss": -6.998008728027344, "global_step": 167756, "epoch": 3994} {"train_loss": -7.040415287017822, "global_step": 167757, "epoch": 3994} {"train_loss": -6.888759613037109, "global_step": 167758, "epoch": 3994} {"train_loss": -6.928707122802734, "global_step": 167759, "epoch": 3994} {"train_loss": -7.064176559448242, "global_step": 167760, "epoch": 3994} {"train_loss": -7.006956577301025, "global_step": 167761, "epoch": 3994} {"train_loss": -6.966670989990234, "global_step": 167762, "epoch": 3994} {"train_loss": -7.044419288635254, "global_step": 167763, "epoch": 3994} {"train_loss": -7.015446662902832, "global_step": 167764, "epoch": 3994} {"train_loss": -7.004354476928711, "global_step": 167765, "epoch": 3994} {"train_loss": -7.0534820556640625, "global_step": 167766, "epoch": 3994} {"train_loss": -7.124514579772949, "global_step": 167767, "epoch": 3994} {"train_loss": -7.124916076660156, "global_step": 167768, "epoch": 3994} {"train_loss": -6.974497318267822, "global_step": 167769, "epoch": 3994} {"train_loss": -7.060945987701416, "global_step": 167770, "epoch": 3994} {"train_loss": -7.003826141357422, "global_step": 167771, "epoch": 3994} {"train_loss": -6.89796257019043, "global_step": 167772, "epoch": 3994} {"train_loss": -7.1443986892700195, "global_step": 167773, "epoch": 3994} {"train_loss": -7.1336588859558105, "global_step": 167774, "epoch": 3994} {"train_loss": -7.014817237854004, "global_step": 167775, "epoch": 3994} {"train_loss": -7.042019844055176, "global_step": 167776, "epoch": 3994} {"train_loss": -7.007421493530273, "global_step": 167777, "epoch": 3994} {"train_loss": -7.0697855949401855, "global_step": 167778, "epoch": 3994} {"train_loss": -7.040839195251465, "global_step": 167779, "epoch": 3994} {"train_loss": -6.9871392250061035, "global_step": 167780, "epoch": 3994} {"train_loss": -7.009937286376953, "global_step": 167781, "epoch": 3994} {"train_loss": -7.038622856140137, "global_step": 167782, "epoch": 3994} {"train_loss": -7.08828067779541, "global_step": 167783, "epoch": 3994} {"train_loss": -7.055700778961182, "global_step": 167784, "epoch": 3994} {"train_loss": -7.0455241203308105, "global_step": 167785, "epoch": 3994} {"train_loss": -7.0920844078063965, "global_step": 167786, "epoch": 3994} {"train_loss": -7.057374954223633, "global_step": 167787, "epoch": 3994} {"train_loss": -7.103149890899658, "global_step": 167788, "epoch": 3994} {"train_loss": -7.017021860395159, "global_step": 167789, "epoch": 3994, "val_loss": 68915.515625} {"train_loss": -7.055734634399414, "global_step": 167790, "epoch": 3995} {"train_loss": -6.945612907409668, "global_step": 167791, "epoch": 3995} {"train_loss": -7.112389087677002, "global_step": 167792, "epoch": 3995} {"train_loss": -6.917279243469238, "global_step": 167793, "epoch": 3995} {"train_loss": -7.039033889770508, "global_step": 167794, "epoch": 3995} {"train_loss": -7.006403923034668, "global_step": 167795, "epoch": 3995} {"train_loss": -7.06261682510376, "global_step": 167796, "epoch": 3995} {"train_loss": -6.945804595947266, "global_step": 167797, "epoch": 3995} {"train_loss": -7.093497276306152, "global_step": 167798, "epoch": 3995} {"train_loss": -7.123491287231445, "global_step": 167799, "epoch": 3995} {"train_loss": -6.9097089767456055, "global_step": 167800, "epoch": 3995} {"train_loss": -6.849520683288574, "global_step": 167801, "epoch": 3995} {"train_loss": -6.99611759185791, "global_step": 167802, "epoch": 3995} {"train_loss": -6.9010009765625, "global_step": 167803, "epoch": 3995} {"train_loss": -6.866389274597168, "global_step": 167804, "epoch": 3995} {"train_loss": -6.967351913452148, "global_step": 167805, "epoch": 3995} {"train_loss": -6.863271713256836, "global_step": 167806, "epoch": 3995} {"train_loss": -7.004878044128418, "global_step": 167807, "epoch": 3995} {"train_loss": -6.925450801849365, "global_step": 167808, "epoch": 3995} {"train_loss": -6.903268814086914, "global_step": 167809, "epoch": 3995} {"train_loss": -6.98304557800293, "global_step": 167810, "epoch": 3995} {"train_loss": -7.028783798217773, "global_step": 167811, "epoch": 3995} {"train_loss": -7.046675682067871, "global_step": 167812, "epoch": 3995} {"train_loss": -6.98032283782959, "global_step": 167813, "epoch": 3995} {"train_loss": -7.067331314086914, "global_step": 167814, "epoch": 3995} {"train_loss": -6.990176200866699, "global_step": 167815, "epoch": 3995} {"train_loss": -7.01483154296875, "global_step": 167816, "epoch": 3995} {"train_loss": -7.030896186828613, "global_step": 167817, "epoch": 3995} {"train_loss": -6.853819847106934, "global_step": 167818, "epoch": 3995} {"train_loss": -7.160550594329834, "global_step": 167819, "epoch": 3995} {"train_loss": -6.9401092529296875, "global_step": 167820, "epoch": 3995} {"train_loss": -7.018195152282715, "global_step": 167821, "epoch": 3995} {"train_loss": -7.016083717346191, "global_step": 167822, "epoch": 3995} {"train_loss": -6.976298809051514, "global_step": 167823, "epoch": 3995} {"train_loss": -7.020318508148193, "global_step": 167824, "epoch": 3995} {"train_loss": -6.977446556091309, "global_step": 167825, "epoch": 3995} {"train_loss": -7.031998634338379, "global_step": 167826, "epoch": 3995} {"train_loss": -7.0823540687561035, "global_step": 167827, "epoch": 3995} {"train_loss": -6.935075283050537, "global_step": 167828, "epoch": 3995} {"train_loss": -7.037629127502441, "global_step": 167829, "epoch": 3995} {"train_loss": -6.983101844787598, "global_step": 167830, "epoch": 3995} {"train_loss": -6.992038522447858, "global_step": 167831, "epoch": 3995, "val_loss": 68824.125} {"train_loss": -7.004556655883789, "global_step": 167832, "epoch": 3996} {"train_loss": -7.117932319641113, "global_step": 167833, "epoch": 3996} {"train_loss": -7.046474933624268, "global_step": 167834, "epoch": 3996} {"train_loss": -7.054804801940918, "global_step": 167835, "epoch": 3996} {"train_loss": -7.127899169921875, "global_step": 167836, "epoch": 3996} {"train_loss": -7.0467143058776855, "global_step": 167837, "epoch": 3996} {"train_loss": -7.15791130065918, "global_step": 167838, "epoch": 3996} {"train_loss": -6.971652030944824, "global_step": 167839, "epoch": 3996} {"train_loss": -7.075225353240967, "global_step": 167840, "epoch": 3996} {"train_loss": -6.95247220993042, "global_step": 167841, "epoch": 3996} {"train_loss": -6.979840278625488, "global_step": 167842, "epoch": 3996} {"train_loss": -7.066971778869629, "global_step": 167843, "epoch": 3996} {"train_loss": -6.942578315734863, "global_step": 167844, "epoch": 3996} {"train_loss": -7.088020324707031, "global_step": 167845, "epoch": 3996} {"train_loss": -7.1882219314575195, "global_step": 167846, "epoch": 3996} {"train_loss": -7.082324028015137, "global_step": 167847, "epoch": 3996} {"train_loss": -7.069849967956543, "global_step": 167848, "epoch": 3996} {"train_loss": -7.015329360961914, "global_step": 167849, "epoch": 3996} {"train_loss": -7.0598554611206055, "global_step": 167850, "epoch": 3996} {"train_loss": -6.989020347595215, "global_step": 167851, "epoch": 3996} {"train_loss": -6.990974426269531, "global_step": 167852, "epoch": 3996} {"train_loss": -6.989265441894531, "global_step": 167853, "epoch": 3996} {"train_loss": -7.008835315704346, "global_step": 167854, "epoch": 3996} {"train_loss": -7.0539727210998535, "global_step": 167855, "epoch": 3996} {"train_loss": -7.090357780456543, "global_step": 167856, "epoch": 3996} {"train_loss": -7.153743267059326, "global_step": 167857, "epoch": 3996} {"train_loss": -7.050856113433838, "global_step": 167858, "epoch": 3996} {"train_loss": -7.004484176635742, "global_step": 167859, "epoch": 3996} {"train_loss": -7.160992622375488, "global_step": 167860, "epoch": 3996} {"train_loss": -6.987349033355713, "global_step": 167861, "epoch": 3996} {"train_loss": -7.100401401519775, "global_step": 167862, "epoch": 3996} {"train_loss": -7.088823318481445, "global_step": 167863, "epoch": 3996} {"train_loss": -7.081703186035156, "global_step": 167864, "epoch": 3996} {"train_loss": -7.1433868408203125, "global_step": 167865, "epoch": 3996} {"train_loss": -7.005542755126953, "global_step": 167866, "epoch": 3996} {"train_loss": -7.018634796142578, "global_step": 167867, "epoch": 3996} {"train_loss": -7.015920639038086, "global_step": 167868, "epoch": 3996} {"train_loss": -6.922569274902344, "global_step": 167869, "epoch": 3996} {"train_loss": -7.0430707931518555, "global_step": 167870, "epoch": 3996} {"train_loss": -7.105917453765869, "global_step": 167871, "epoch": 3996} {"train_loss": -7.074721336364746, "global_step": 167872, "epoch": 3996} {"train_loss": -7.050925209408715, "global_step": 167873, "epoch": 3996, "val_loss": 68895.7421875} {"train_loss": -7.140230178833008, "global_step": 167874, "epoch": 3997} {"train_loss": -7.085988998413086, "global_step": 167875, "epoch": 3997} {"train_loss": -7.136299133300781, "global_step": 167876, "epoch": 3997} {"train_loss": -6.897644996643066, "global_step": 167877, "epoch": 3997} {"train_loss": -6.985713958740234, "global_step": 167878, "epoch": 3997} {"train_loss": -6.901621341705322, "global_step": 167879, "epoch": 3997} {"train_loss": -6.977168083190918, "global_step": 167880, "epoch": 3997} {"train_loss": -6.988494873046875, "global_step": 167881, "epoch": 3997} {"train_loss": -7.0356903076171875, "global_step": 167882, "epoch": 3997} {"train_loss": -6.890431880950928, "global_step": 167883, "epoch": 3997} {"train_loss": -6.949987411499023, "global_step": 167884, "epoch": 3997} {"train_loss": -6.991616249084473, "global_step": 167885, "epoch": 3997} {"train_loss": -6.958517074584961, "global_step": 167886, "epoch": 3997} {"train_loss": -7.065564155578613, "global_step": 167887, "epoch": 3997} {"train_loss": -6.946375846862793, "global_step": 167888, "epoch": 3997} {"train_loss": -7.00208854675293, "global_step": 167889, "epoch": 3997} {"train_loss": -7.039796352386475, "global_step": 167890, "epoch": 3997} {"train_loss": -6.981061935424805, "global_step": 167891, "epoch": 3997} {"train_loss": -7.0254621505737305, "global_step": 167892, "epoch": 3997} {"train_loss": -7.025284290313721, "global_step": 167893, "epoch": 3997} {"train_loss": -7.157907485961914, "global_step": 167894, "epoch": 3997} {"train_loss": -6.98784065246582, "global_step": 167895, "epoch": 3997} {"train_loss": -7.132044792175293, "global_step": 167896, "epoch": 3997} {"train_loss": -6.987772464752197, "global_step": 167897, "epoch": 3997} {"train_loss": -7.102795600891113, "global_step": 167898, "epoch": 3997} {"train_loss": -6.965319633483887, "global_step": 167899, "epoch": 3997} {"train_loss": -7.078649044036865, "global_step": 167900, "epoch": 3997} {"train_loss": -7.0963850021362305, "global_step": 167901, "epoch": 3997} {"train_loss": -7.060253143310547, "global_step": 167902, "epoch": 3997} {"train_loss": -7.12407112121582, "global_step": 167903, "epoch": 3997} {"train_loss": -7.01928186416626, "global_step": 167904, "epoch": 3997} {"train_loss": -6.958404541015625, "global_step": 167905, "epoch": 3997} {"train_loss": -7.039264678955078, "global_step": 167906, "epoch": 3997} {"train_loss": -7.0213704109191895, "global_step": 167907, "epoch": 3997} {"train_loss": -7.001105308532715, "global_step": 167908, "epoch": 3997} {"train_loss": -6.917238712310791, "global_step": 167909, "epoch": 3997} {"train_loss": -6.902742385864258, "global_step": 167910, "epoch": 3997} {"train_loss": -7.077070713043213, "global_step": 167911, "epoch": 3997} {"train_loss": -7.027359962463379, "global_step": 167912, "epoch": 3997} {"train_loss": -6.923103332519531, "global_step": 167913, "epoch": 3997} {"train_loss": -6.929511070251465, "global_step": 167914, "epoch": 3997} {"train_loss": -7.012495336078462, "global_step": 167915, "epoch": 3997, "val_loss": 68842.6640625} {"train_loss": -7.016308307647705, "global_step": 167916, "epoch": 3998} {"train_loss": -6.918023586273193, "global_step": 167917, "epoch": 3998} {"train_loss": -7.098794937133789, "global_step": 167918, "epoch": 3998} {"train_loss": -6.871881008148193, "global_step": 167919, "epoch": 3998} {"train_loss": -6.952022552490234, "global_step": 167920, "epoch": 3998} {"train_loss": -6.997008323669434, "global_step": 167921, "epoch": 3998} {"train_loss": -7.007265567779541, "global_step": 167922, "epoch": 3998} {"train_loss": -6.970798969268799, "global_step": 167923, "epoch": 3998} {"train_loss": -6.954081058502197, "global_step": 167924, "epoch": 3998} {"train_loss": -6.984345436096191, "global_step": 167925, "epoch": 3998} {"train_loss": -6.876058578491211, "global_step": 167926, "epoch": 3998} {"train_loss": -6.914266586303711, "global_step": 167927, "epoch": 3998} {"train_loss": -7.095609188079834, "global_step": 167928, "epoch": 3998} {"train_loss": -6.882376670837402, "global_step": 167929, "epoch": 3998} {"train_loss": -6.9435930252075195, "global_step": 167930, "epoch": 3998} {"train_loss": -7.016204833984375, "global_step": 167931, "epoch": 3998} {"train_loss": -6.923630714416504, "global_step": 167932, "epoch": 3998} {"train_loss": -6.796422004699707, "global_step": 167933, "epoch": 3998} {"train_loss": -6.927138805389404, "global_step": 167934, "epoch": 3998} {"train_loss": -6.963400840759277, "global_step": 167935, "epoch": 3998} {"train_loss": -6.9350056648254395, "global_step": 167936, "epoch": 3998} {"train_loss": -6.932508945465088, "global_step": 167937, "epoch": 3998} {"train_loss": -7.046415328979492, "global_step": 167938, "epoch": 3998} {"train_loss": -7.074306011199951, "global_step": 167939, "epoch": 3998} {"train_loss": -6.940489768981934, "global_step": 167940, "epoch": 3998} {"train_loss": -7.022760391235352, "global_step": 167941, "epoch": 3998} {"train_loss": -6.928851127624512, "global_step": 167942, "epoch": 3998} {"train_loss": -7.021954536437988, "global_step": 167943, "epoch": 3998} {"train_loss": -6.999505996704102, "global_step": 167944, "epoch": 3998} {"train_loss": -6.884293079376221, "global_step": 167945, "epoch": 3998} {"train_loss": -7.0136799812316895, "global_step": 167946, "epoch": 3998} {"train_loss": -6.9679670333862305, "global_step": 167947, "epoch": 3998} {"train_loss": -6.980758190155029, "global_step": 167948, "epoch": 3998} {"train_loss": -7.068996429443359, "global_step": 167949, "epoch": 3998} {"train_loss": -6.883098125457764, "global_step": 167950, "epoch": 3998} {"train_loss": -7.136292457580566, "global_step": 167951, "epoch": 3998} {"train_loss": -6.981627464294434, "global_step": 167952, "epoch": 3998} {"train_loss": -7.017767906188965, "global_step": 167953, "epoch": 3998} {"train_loss": -6.965763092041016, "global_step": 167954, "epoch": 3998} {"train_loss": -7.031212329864502, "global_step": 167955, "epoch": 3998} {"train_loss": -7.007776737213135, "global_step": 167956, "epoch": 3998} {"train_loss": -6.976413091023763, "global_step": 167957, "epoch": 3998, "val_loss": 68966.4296875} {"train_loss": -6.998660087585449, "global_step": 167958, "epoch": 3999} {"train_loss": -7.0739240646362305, "global_step": 167959, "epoch": 3999} {"train_loss": -7.072817802429199, "global_step": 167960, "epoch": 3999} {"train_loss": -6.840813159942627, "global_step": 167961, "epoch": 3999} {"train_loss": -7.054940223693848, "global_step": 167962, "epoch": 3999} {"train_loss": -7.054899215698242, "global_step": 167963, "epoch": 3999} {"train_loss": -7.020651340484619, "global_step": 167964, "epoch": 3999} {"train_loss": -7.020597457885742, "global_step": 167965, "epoch": 3999} {"train_loss": -6.968454837799072, "global_step": 167966, "epoch": 3999} {"train_loss": -6.9673542976379395, "global_step": 167967, "epoch": 3999} {"train_loss": -7.10213565826416, "global_step": 167968, "epoch": 3999} {"train_loss": -6.915666103363037, "global_step": 167969, "epoch": 3999} {"train_loss": -6.956118106842041, "global_step": 167970, "epoch": 3999} {"train_loss": -7.024777889251709, "global_step": 167971, "epoch": 3999} {"train_loss": -6.980583190917969, "global_step": 167972, "epoch": 3999} {"train_loss": -7.043633937835693, "global_step": 167973, "epoch": 3999} {"train_loss": -6.911984443664551, "global_step": 167974, "epoch": 3999} {"train_loss": -7.077456474304199, "global_step": 167975, "epoch": 3999} {"train_loss": -7.030828952789307, "global_step": 167976, "epoch": 3999} {"train_loss": -6.847595691680908, "global_step": 167977, "epoch": 3999} {"train_loss": -6.993450164794922, "global_step": 167978, "epoch": 3999} {"train_loss": -6.92362117767334, "global_step": 167979, "epoch": 3999} {"train_loss": -6.963451385498047, "global_step": 167980, "epoch": 3999} {"train_loss": -6.937817096710205, "global_step": 167981, "epoch": 3999} {"train_loss": -7.123240947723389, "global_step": 167982, "epoch": 3999} {"train_loss": -6.958545207977295, "global_step": 167983, "epoch": 3999} {"train_loss": -6.94866943359375, "global_step": 167984, "epoch": 3999} {"train_loss": -6.776879787445068, "global_step": 167985, "epoch": 3999} {"train_loss": -6.964187145233154, "global_step": 167986, "epoch": 3999} {"train_loss": -7.066249847412109, "global_step": 167987, "epoch": 3999} {"train_loss": -7.0383100509643555, "global_step": 167988, "epoch": 3999} {"train_loss": -6.941386699676514, "global_step": 167989, "epoch": 3999} {"train_loss": -6.984602451324463, "global_step": 167990, "epoch": 3999} {"train_loss": -6.986516952514648, "global_step": 167991, "epoch": 3999} {"train_loss": -7.135639667510986, "global_step": 167992, "epoch": 3999} {"train_loss": -6.945246696472168, "global_step": 167993, "epoch": 3999} {"train_loss": -6.935413360595703, "global_step": 167994, "epoch": 3999} {"train_loss": -6.928324222564697, "global_step": 167995, "epoch": 3999} {"train_loss": -7.077470779418945, "global_step": 167996, "epoch": 3999} {"train_loss": -7.109197616577148, "global_step": 167997, "epoch": 3999} {"train_loss": -7.03452205657959, "global_step": 167998, "epoch": 3999} {"train_loss": -6.994053874697004, "global_step": 167999, "epoch": 3999, "val_loss": 68840.390625} {"train_loss": -6.985309600830078, "global_step": 168000, "epoch": 4000} {"train_loss": -7.009096145629883, "global_step": 168001, "epoch": 4000} {"train_loss": -7.059509754180908, "global_step": 168002, "epoch": 4000} {"train_loss": -7.034322738647461, "global_step": 168003, "epoch": 4000} {"train_loss": -7.029644012451172, "global_step": 168004, "epoch": 4000} {"train_loss": -6.932114601135254, "global_step": 168005, "epoch": 4000} {"train_loss": -6.957188606262207, "global_step": 168006, "epoch": 4000} {"train_loss": -7.0012383460998535, "global_step": 168007, "epoch": 4000} {"train_loss": -6.992245674133301, "global_step": 168008, "epoch": 4000} {"train_loss": -6.950869083404541, "global_step": 168009, "epoch": 4000} {"train_loss": -7.071081161499023, "global_step": 168010, "epoch": 4000} {"train_loss": -7.085928440093994, "global_step": 168011, "epoch": 4000} {"train_loss": -7.127038955688477, "global_step": 168012, "epoch": 4000} {"train_loss": -7.031821250915527, "global_step": 168013, "epoch": 4000} {"train_loss": -7.0053019523620605, "global_step": 168014, "epoch": 4000} {"train_loss": -7.063196182250977, "global_step": 168015, "epoch": 4000} {"train_loss": -7.052780628204346, "global_step": 168016, "epoch": 4000} {"train_loss": -7.13565731048584, "global_step": 168017, "epoch": 4000} {"train_loss": -6.999965667724609, "global_step": 168018, "epoch": 4000} {"train_loss": -7.054217338562012, "global_step": 168019, "epoch": 4000} {"train_loss": -7.021927833557129, "global_step": 168020, "epoch": 4000} {"train_loss": -7.003177642822266, "global_step": 168021, "epoch": 4000} {"train_loss": -7.074037075042725, "global_step": 168022, "epoch": 4000} {"train_loss": -7.1362504959106445, "global_step": 168023, "epoch": 4000} {"train_loss": -7.036637306213379, "global_step": 168024, "epoch": 4000} {"train_loss": -7.138657093048096, "global_step": 168025, "epoch": 4000} {"train_loss": -7.102018356323242, "global_step": 168026, "epoch": 4000} {"train_loss": -7.089509963989258, "global_step": 168027, "epoch": 4000} {"train_loss": -7.100485801696777, "global_step": 168028, "epoch": 4000} {"train_loss": -7.207077980041504, "global_step": 168029, "epoch": 4000} {"train_loss": -6.9997148513793945, "global_step": 168030, "epoch": 4000} {"train_loss": -7.069120407104492, "global_step": 168031, "epoch": 4000} {"train_loss": -7.04440450668335, "global_step": 168032, "epoch": 4000} {"train_loss": -7.02453088760376, "global_step": 168033, "epoch": 4000} {"train_loss": -7.056005954742432, "global_step": 168034, "epoch": 4000} {"train_loss": -6.998734474182129, "global_step": 168035, "epoch": 4000} {"train_loss": -7.006247520446777, "global_step": 168036, "epoch": 4000} {"train_loss": -7.001380920410156, "global_step": 168037, "epoch": 4000} {"train_loss": -7.00675106048584, "global_step": 168038, "epoch": 4000} {"train_loss": -6.987363338470459, "global_step": 168039, "epoch": 4000} {"train_loss": -7.031729698181152, "global_step": 168040, "epoch": 4000} {"train_loss": -7.039933113824754, "global_step": 168041, "epoch": 4000, "train/sim_max_reward_0": 0.19261258872876097, "train/sim_max_reward_1": 0.9520613190604501, "train/sim_max_reward_2": 0.4653267270839971, "train/sim_max_reward_3": 0.993542814364235, "train/sim_max_reward_4": 0.9821935602197178, "train/sim_max_reward_5": 0.22213157279897394, "test/sim_max_reward_4300000": 0.2106961803280016, "test/sim_max_reward_4300001": 0.5235211101858603, "test/sim_max_reward_4300002": 0.9530543287502341, "test/sim_max_reward_4300003": 0.997779794565786, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8023139414986238, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 1.0, "test/sim_max_reward_4300008": 0.9360194560539511, "test/sim_max_reward_4300009": 0.9863076299064565, "test/sim_max_reward_4300010": 0.9329179162630681, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.967408705749757, "test/sim_max_reward_4300013": 0.4044959581120971, "test/sim_max_reward_4300014": 0.9942745585243804, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 1.0, "test/sim_max_reward_4300017": 0.6838442325515481, "test/sim_max_reward_4300018": 0.4016682024006327, "test/sim_max_reward_4300019": 0.18590318120870106, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.98642634053469, "test/sim_max_reward_4300022": 0.9244212352522905, "test/sim_max_reward_4300023": 0.32935934736316413, "test/sim_max_reward_4300024": 0.9544696178161454, "test/sim_max_reward_4300025": 0.3189094456641599, "test/sim_max_reward_4300026": 0.9223390893523395, "test/sim_max_reward_4300027": 0.9486522647231127, "test/sim_max_reward_4300028": 0.8943019685081615, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.16863980011131136, "test/sim_max_reward_4300031": 0.30202645448748106, "test/sim_max_reward_4300032": 0.9174363490093571, "test/sim_max_reward_4300033": 0.9485435126457196, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.41559538753374486, "test/sim_max_reward_4300036": 0.2069880100011738, "test/sim_max_reward_4300037": 0.7700723114426716, "test/sim_max_reward_4300038": 0.7529795032374111, "test/sim_max_reward_4300039": 0.9623496936031937, "test/sim_max_reward_4300040": 0.9132874204126868, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.9331347299586829, "test/sim_max_reward_4300043": 0.16056365056138844, "test/sim_max_reward_4300044": 0.8958611173912747, "test/sim_max_reward_4300045": 0.19416459164283215, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.10304359218094275, "test/sim_max_reward_4300048": 0.414173054795449, "test/sim_max_reward_4300049": 0.29994917780028235, "train/mean_score": 0.6346447637093559, "test/mean_score": 0.612674539338761, "val_loss": 69046.0703125} {"train_loss": -7.107505798339844, "global_step": 168042, "epoch": 4001} {"train_loss": -6.980564594268799, "global_step": 168043, "epoch": 4001} {"train_loss": -7.136965751647949, "global_step": 168044, "epoch": 4001} {"train_loss": -7.062880039215088, "global_step": 168045, "epoch": 4001} {"train_loss": -7.049422264099121, "global_step": 168046, "epoch": 4001} {"train_loss": -7.116057395935059, "global_step": 168047, "epoch": 4001} {"train_loss": -7.058560371398926, "global_step": 168048, "epoch": 4001} {"train_loss": -7.079287528991699, "global_step": 168049, "epoch": 4001} {"train_loss": -6.962398529052734, "global_step": 168050, "epoch": 4001} {"train_loss": -6.92092227935791, "global_step": 168051, "epoch": 4001} {"train_loss": -7.067314624786377, "global_step": 168052, "epoch": 4001} {"train_loss": -7.112471580505371, "global_step": 168053, "epoch": 4001} {"train_loss": -6.9938249588012695, "global_step": 168054, "epoch": 4001} {"train_loss": -7.073635101318359, "global_step": 168055, "epoch": 4001} {"train_loss": -7.052734375, "global_step": 168056, "epoch": 4001} {"train_loss": -7.056560516357422, "global_step": 168057, "epoch": 4001} {"train_loss": -7.055917739868164, "global_step": 168058, "epoch": 4001} {"train_loss": -7.045271873474121, "global_step": 168059, "epoch": 4001} {"train_loss": -7.031944274902344, "global_step": 168060, "epoch": 4001} {"train_loss": -7.017058849334717, "global_step": 168061, "epoch": 4001} {"train_loss": -7.1374735832214355, "global_step": 168062, "epoch": 4001} {"train_loss": -7.052430152893066, "global_step": 168063, "epoch": 4001} {"train_loss": -6.915529727935791, "global_step": 168064, "epoch": 4001} {"train_loss": -7.003026962280273, "global_step": 168065, "epoch": 4001} {"train_loss": -6.911654472351074, "global_step": 168066, "epoch": 4001} {"train_loss": -6.99269962310791, "global_step": 168067, "epoch": 4001} {"train_loss": -7.107780933380127, "global_step": 168068, "epoch": 4001} {"train_loss": -6.9148125648498535, "global_step": 168069, "epoch": 4001} {"train_loss": -6.860035419464111, "global_step": 168070, "epoch": 4001} {"train_loss": -7.163373947143555, "global_step": 168071, "epoch": 4001} {"train_loss": -7.01009464263916, "global_step": 168072, "epoch": 4001} {"train_loss": -6.9640421867370605, "global_step": 168073, "epoch": 4001} {"train_loss": -7.076883792877197, "global_step": 168074, "epoch": 4001} {"train_loss": -6.986833572387695, "global_step": 168075, "epoch": 4001} {"train_loss": -7.0476226806640625, "global_step": 168076, "epoch": 4001} {"train_loss": -7.13726806640625, "global_step": 168077, "epoch": 4001} {"train_loss": -7.218482971191406, "global_step": 168078, "epoch": 4001} {"train_loss": -6.995849132537842, "global_step": 168079, "epoch": 4001} {"train_loss": -7.044894218444824, "global_step": 168080, "epoch": 4001} {"train_loss": -7.091673851013184, "global_step": 168081, "epoch": 4001} {"train_loss": -7.1451263427734375, "global_step": 168082, "epoch": 4001} {"train_loss": -7.040553933098202, "global_step": 168083, "epoch": 4001, "val_loss": 68928.4375} {"train_loss": -7.016968250274658, "global_step": 168084, "epoch": 4002} {"train_loss": -6.971101760864258, "global_step": 168085, "epoch": 4002} {"train_loss": -7.107141494750977, "global_step": 168086, "epoch": 4002} {"train_loss": -7.047311305999756, "global_step": 168087, "epoch": 4002} {"train_loss": -7.064019680023193, "global_step": 168088, "epoch": 4002} {"train_loss": -7.108654022216797, "global_step": 168089, "epoch": 4002} {"train_loss": -7.0974273681640625, "global_step": 168090, "epoch": 4002} {"train_loss": -7.171162128448486, "global_step": 168091, "epoch": 4002} {"train_loss": -7.098907947540283, "global_step": 168092, "epoch": 4002} {"train_loss": -6.985201358795166, "global_step": 168093, "epoch": 4002} {"train_loss": -7.060687065124512, "global_step": 168094, "epoch": 4002} {"train_loss": -7.047773838043213, "global_step": 168095, "epoch": 4002} {"train_loss": -6.971103668212891, "global_step": 168096, "epoch": 4002} {"train_loss": -7.019129276275635, "global_step": 168097, "epoch": 4002} {"train_loss": -6.982123374938965, "global_step": 168098, "epoch": 4002} {"train_loss": -6.861001014709473, "global_step": 168099, "epoch": 4002} {"train_loss": -6.961662292480469, "global_step": 168100, "epoch": 4002} {"train_loss": -6.927463531494141, "global_step": 168101, "epoch": 4002} {"train_loss": -7.0246076583862305, "global_step": 168102, "epoch": 4002} {"train_loss": -7.089025497436523, "global_step": 168103, "epoch": 4002} {"train_loss": -6.993914604187012, "global_step": 168104, "epoch": 4002} {"train_loss": -6.885400772094727, "global_step": 168105, "epoch": 4002} {"train_loss": -7.081957817077637, "global_step": 168106, "epoch": 4002} {"train_loss": -6.929977893829346, "global_step": 168107, "epoch": 4002} {"train_loss": -6.928124904632568, "global_step": 168108, "epoch": 4002} {"train_loss": -7.123500823974609, "global_step": 168109, "epoch": 4002} {"train_loss": -6.87841796875, "global_step": 168110, "epoch": 4002} {"train_loss": -7.010679721832275, "global_step": 168111, "epoch": 4002} {"train_loss": -6.9155049324035645, "global_step": 168112, "epoch": 4002} {"train_loss": -6.836822509765625, "global_step": 168113, "epoch": 4002} {"train_loss": -6.9871015548706055, "global_step": 168114, "epoch": 4002} {"train_loss": -6.871710300445557, "global_step": 168115, "epoch": 4002} {"train_loss": -6.90434455871582, "global_step": 168116, "epoch": 4002} {"train_loss": -6.920836448669434, "global_step": 168117, "epoch": 4002} {"train_loss": -6.989410400390625, "global_step": 168118, "epoch": 4002} {"train_loss": -6.995471954345703, "global_step": 168119, "epoch": 4002} {"train_loss": -6.948997974395752, "global_step": 168120, "epoch": 4002} {"train_loss": -6.971395492553711, "global_step": 168121, "epoch": 4002} {"train_loss": -6.885425567626953, "global_step": 168122, "epoch": 4002} {"train_loss": -6.932502746582031, "global_step": 168123, "epoch": 4002} {"train_loss": -6.948794364929199, "global_step": 168124, "epoch": 4002} {"train_loss": -6.986676885968163, "global_step": 168125, "epoch": 4002, "val_loss": 69013.484375} {"train_loss": -6.976685523986816, "global_step": 168126, "epoch": 4003} {"train_loss": -6.999449253082275, "global_step": 168127, "epoch": 4003} {"train_loss": -7.0038981437683105, "global_step": 168128, "epoch": 4003} {"train_loss": -6.88472843170166, "global_step": 168129, "epoch": 4003} {"train_loss": -6.987215518951416, "global_step": 168130, "epoch": 4003} {"train_loss": -6.903590202331543, "global_step": 168131, "epoch": 4003} {"train_loss": -6.852873802185059, "global_step": 168132, "epoch": 4003} {"train_loss": -6.955432415008545, "global_step": 168133, "epoch": 4003} {"train_loss": -6.964570045471191, "global_step": 168134, "epoch": 4003} {"train_loss": -6.886619567871094, "global_step": 168135, "epoch": 4003} {"train_loss": -7.01418399810791, "global_step": 168136, "epoch": 4003} {"train_loss": -6.943872451782227, "global_step": 168137, "epoch": 4003} {"train_loss": -7.056910514831543, "global_step": 168138, "epoch": 4003} {"train_loss": -7.023211479187012, "global_step": 168139, "epoch": 4003} {"train_loss": -6.986313819885254, "global_step": 168140, "epoch": 4003} {"train_loss": -7.036959648132324, "global_step": 168141, "epoch": 4003} {"train_loss": -6.941635608673096, "global_step": 168142, "epoch": 4003} {"train_loss": -7.130486488342285, "global_step": 168143, "epoch": 4003} {"train_loss": -7.042841911315918, "global_step": 168144, "epoch": 4003} {"train_loss": -7.005617141723633, "global_step": 168145, "epoch": 4003} {"train_loss": -7.019116401672363, "global_step": 168146, "epoch": 4003} {"train_loss": -6.995161533355713, "global_step": 168147, "epoch": 4003} {"train_loss": -7.0569610595703125, "global_step": 168148, "epoch": 4003} {"train_loss": -7.033389091491699, "global_step": 168149, "epoch": 4003} {"train_loss": -6.957581520080566, "global_step": 168150, "epoch": 4003} {"train_loss": -7.051413536071777, "global_step": 168151, "epoch": 4003} {"train_loss": -6.912848949432373, "global_step": 168152, "epoch": 4003} {"train_loss": -6.981578826904297, "global_step": 168153, "epoch": 4003} {"train_loss": -7.002015113830566, "global_step": 168154, "epoch": 4003} {"train_loss": -7.0164384841918945, "global_step": 168155, "epoch": 4003} {"train_loss": -6.974635124206543, "global_step": 168156, "epoch": 4003} {"train_loss": -6.929166793823242, "global_step": 168157, "epoch": 4003} {"train_loss": -6.935402870178223, "global_step": 168158, "epoch": 4003} {"train_loss": -7.063396453857422, "global_step": 168159, "epoch": 4003} {"train_loss": -7.034592628479004, "global_step": 168160, "epoch": 4003} {"train_loss": -7.055810928344727, "global_step": 168161, "epoch": 4003} {"train_loss": -7.090482234954834, "global_step": 168162, "epoch": 4003} {"train_loss": -6.971877098083496, "global_step": 168163, "epoch": 4003} {"train_loss": -6.933651924133301, "global_step": 168164, "epoch": 4003} {"train_loss": -6.892767906188965, "global_step": 168165, "epoch": 4003} {"train_loss": -7.019959449768066, "global_step": 168166, "epoch": 4003} {"train_loss": -6.9844284284682505, "global_step": 168167, "epoch": 4003, "val_loss": 68967.5546875} {"train_loss": -6.79575252532959, "global_step": 168168, "epoch": 4004} {"train_loss": -6.831758975982666, "global_step": 168169, "epoch": 4004} {"train_loss": -6.631183624267578, "global_step": 168170, "epoch": 4004} {"train_loss": -6.868012428283691, "global_step": 168171, "epoch": 4004} {"train_loss": -6.571272850036621, "global_step": 168172, "epoch": 4004} {"train_loss": -6.777682304382324, "global_step": 168173, "epoch": 4004} {"train_loss": -6.623079299926758, "global_step": 168174, "epoch": 4004} {"train_loss": -6.780406475067139, "global_step": 168175, "epoch": 4004} {"train_loss": -6.801307678222656, "global_step": 168176, "epoch": 4004} {"train_loss": -6.893115043640137, "global_step": 168177, "epoch": 4004} {"train_loss": -6.805763244628906, "global_step": 168178, "epoch": 4004} {"train_loss": -6.850472927093506, "global_step": 168179, "epoch": 4004} {"train_loss": -6.823148250579834, "global_step": 168180, "epoch": 4004} {"train_loss": -6.997640132904053, "global_step": 168181, "epoch": 4004} {"train_loss": -6.902039527893066, "global_step": 168182, "epoch": 4004} {"train_loss": -6.948232650756836, "global_step": 168183, "epoch": 4004} {"train_loss": -6.861950397491455, "global_step": 168184, "epoch": 4004} {"train_loss": -6.996328830718994, "global_step": 168185, "epoch": 4004} {"train_loss": -6.901590347290039, "global_step": 168186, "epoch": 4004} {"train_loss": -6.997448921203613, "global_step": 168187, "epoch": 4004} {"train_loss": -6.896453380584717, "global_step": 168188, "epoch": 4004} {"train_loss": -6.912253379821777, "global_step": 168189, "epoch": 4004} {"train_loss": -6.945704936981201, "global_step": 168190, "epoch": 4004} {"train_loss": -6.912234306335449, "global_step": 168191, "epoch": 4004} {"train_loss": -6.967846393585205, "global_step": 168192, "epoch": 4004} {"train_loss": -6.916942119598389, "global_step": 168193, "epoch": 4004} {"train_loss": -6.977542400360107, "global_step": 168194, "epoch": 4004} {"train_loss": -6.92142391204834, "global_step": 168195, "epoch": 4004} {"train_loss": -6.926874160766602, "global_step": 168196, "epoch": 4004} {"train_loss": -6.94647741317749, "global_step": 168197, "epoch": 4004} {"train_loss": -7.01418399810791, "global_step": 168198, "epoch": 4004} {"train_loss": -7.067575454711914, "global_step": 168199, "epoch": 4004} {"train_loss": -6.986183166503906, "global_step": 168200, "epoch": 4004} {"train_loss": -7.001977920532227, "global_step": 168201, "epoch": 4004} {"train_loss": -6.941037654876709, "global_step": 168202, "epoch": 4004} {"train_loss": -6.995532035827637, "global_step": 168203, "epoch": 4004} {"train_loss": -7.093388557434082, "global_step": 168204, "epoch": 4004} {"train_loss": -7.008419990539551, "global_step": 168205, "epoch": 4004} {"train_loss": -6.9561920166015625, "global_step": 168206, "epoch": 4004} {"train_loss": -7.063579559326172, "global_step": 168207, "epoch": 4004} {"train_loss": -7.025599956512451, "global_step": 168208, "epoch": 4004} {"train_loss": -6.908749421437581, "global_step": 168209, "epoch": 4004, "val_loss": 68920.203125} {"train_loss": -7.113592147827148, "global_step": 168210, "epoch": 4005} {"train_loss": -6.955539226531982, "global_step": 168211, "epoch": 4005} {"train_loss": -7.060323715209961, "global_step": 168212, "epoch": 4005} {"train_loss": -6.955438613891602, "global_step": 168213, "epoch": 4005} {"train_loss": -7.027065277099609, "global_step": 168214, "epoch": 4005} {"train_loss": -7.0719194412231445, "global_step": 168215, "epoch": 4005} {"train_loss": -6.913168907165527, "global_step": 168216, "epoch": 4005} {"train_loss": -7.045425891876221, "global_step": 168217, "epoch": 4005} {"train_loss": -6.95497465133667, "global_step": 168218, "epoch": 4005} {"train_loss": -6.945810317993164, "global_step": 168219, "epoch": 4005} {"train_loss": -6.97028923034668, "global_step": 168220, "epoch": 4005} {"train_loss": -7.1553778648376465, "global_step": 168221, "epoch": 4005} {"train_loss": -6.907035827636719, "global_step": 168222, "epoch": 4005} {"train_loss": -6.995181560516357, "global_step": 168223, "epoch": 4005} {"train_loss": -6.918150901794434, "global_step": 168224, "epoch": 4005} {"train_loss": -7.192085266113281, "global_step": 168225, "epoch": 4005} {"train_loss": -7.098406791687012, "global_step": 168226, "epoch": 4005} {"train_loss": -7.057398796081543, "global_step": 168227, "epoch": 4005} {"train_loss": -7.114849090576172, "global_step": 168228, "epoch": 4005} {"train_loss": -7.050993919372559, "global_step": 168229, "epoch": 4005} {"train_loss": -7.096870422363281, "global_step": 168230, "epoch": 4005} {"train_loss": -6.998518943786621, "global_step": 168231, "epoch": 4005} {"train_loss": -7.069644927978516, "global_step": 168232, "epoch": 4005} {"train_loss": -7.12802791595459, "global_step": 168233, "epoch": 4005} {"train_loss": -6.968482971191406, "global_step": 168234, "epoch": 4005} {"train_loss": -7.108447074890137, "global_step": 168235, "epoch": 4005} {"train_loss": -7.088972568511963, "global_step": 168236, "epoch": 4005} {"train_loss": -7.055243968963623, "global_step": 168237, "epoch": 4005} {"train_loss": -7.017735958099365, "global_step": 168238, "epoch": 4005} {"train_loss": -7.164821624755859, "global_step": 168239, "epoch": 4005} {"train_loss": -7.0324883460998535, "global_step": 168240, "epoch": 4005} {"train_loss": -6.941652297973633, "global_step": 168241, "epoch": 4005} {"train_loss": -7.063621520996094, "global_step": 168242, "epoch": 4005} {"train_loss": -7.069777488708496, "global_step": 168243, "epoch": 4005} {"train_loss": -7.1432390213012695, "global_step": 168244, "epoch": 4005} {"train_loss": -7.168893814086914, "global_step": 168245, "epoch": 4005} {"train_loss": -7.123542785644531, "global_step": 168246, "epoch": 4005} {"train_loss": -7.11689567565918, "global_step": 168247, "epoch": 4005} {"train_loss": -7.0949554443359375, "global_step": 168248, "epoch": 4005} {"train_loss": -7.075462341308594, "global_step": 168249, "epoch": 4005} {"train_loss": -7.069847106933594, "global_step": 168250, "epoch": 4005} {"train_loss": -7.051400059745426, "global_step": 168251, "epoch": 4005, "val_loss": 68787.5390625} {"train_loss": -6.998589515686035, "global_step": 168252, "epoch": 4006} {"train_loss": -7.115963935852051, "global_step": 168253, "epoch": 4006} {"train_loss": -7.204136848449707, "global_step": 168254, "epoch": 4006} {"train_loss": -7.059171676635742, "global_step": 168255, "epoch": 4006} {"train_loss": -7.071043968200684, "global_step": 168256, "epoch": 4006} {"train_loss": -7.136695384979248, "global_step": 168257, "epoch": 4006} {"train_loss": -6.977838039398193, "global_step": 168258, "epoch": 4006} {"train_loss": -7.04303503036499, "global_step": 168259, "epoch": 4006} {"train_loss": -7.022139549255371, "global_step": 168260, "epoch": 4006} {"train_loss": -6.973888874053955, "global_step": 168261, "epoch": 4006} {"train_loss": -7.088985919952393, "global_step": 168262, "epoch": 4006} {"train_loss": -7.083548545837402, "global_step": 168263, "epoch": 4006} {"train_loss": -7.057923316955566, "global_step": 168264, "epoch": 4006} {"train_loss": -7.0660400390625, "global_step": 168265, "epoch": 4006} {"train_loss": -6.9304962158203125, "global_step": 168266, "epoch": 4006} {"train_loss": -6.994983673095703, "global_step": 168267, "epoch": 4006} {"train_loss": -6.880921363830566, "global_step": 168268, "epoch": 4006} {"train_loss": -6.901504993438721, "global_step": 168269, "epoch": 4006} {"train_loss": -6.986761093139648, "global_step": 168270, "epoch": 4006} {"train_loss": -6.9606757164001465, "global_step": 168271, "epoch": 4006} {"train_loss": -6.675065040588379, "global_step": 168272, "epoch": 4006} {"train_loss": -6.925195693969727, "global_step": 168273, "epoch": 4006} {"train_loss": -6.665402889251709, "global_step": 168274, "epoch": 4006} {"train_loss": -6.8473591804504395, "global_step": 168275, "epoch": 4006} {"train_loss": -6.835511207580566, "global_step": 168276, "epoch": 4006} {"train_loss": -6.618430137634277, "global_step": 168277, "epoch": 4006} {"train_loss": -6.874534606933594, "global_step": 168278, "epoch": 4006} {"train_loss": -6.579682350158691, "global_step": 168279, "epoch": 4006} {"train_loss": -6.92300271987915, "global_step": 168280, "epoch": 4006} {"train_loss": -6.796298027038574, "global_step": 168281, "epoch": 4006} {"train_loss": -6.9472174644470215, "global_step": 168282, "epoch": 4006} {"train_loss": -6.7430419921875, "global_step": 168283, "epoch": 4006} {"train_loss": -6.893258094787598, "global_step": 168284, "epoch": 4006} {"train_loss": -6.915151596069336, "global_step": 168285, "epoch": 4006} {"train_loss": -6.923774719238281, "global_step": 168286, "epoch": 4006} {"train_loss": -6.850571155548096, "global_step": 168287, "epoch": 4006} {"train_loss": -6.969081878662109, "global_step": 168288, "epoch": 4006} {"train_loss": -6.959623336791992, "global_step": 168289, "epoch": 4006} {"train_loss": -7.042028427124023, "global_step": 168290, "epoch": 4006} {"train_loss": -6.8692827224731445, "global_step": 168291, "epoch": 4006} {"train_loss": -6.971136569976807, "global_step": 168292, "epoch": 4006} {"train_loss": -6.938069150561378, "global_step": 168293, "epoch": 4006, "val_loss": 68953.765625} {"train_loss": -7.0072808265686035, "global_step": 168294, "epoch": 4007} {"train_loss": -6.880936622619629, "global_step": 168295, "epoch": 4007} {"train_loss": -6.948440074920654, "global_step": 168296, "epoch": 4007} {"train_loss": -6.920626640319824, "global_step": 168297, "epoch": 4007} {"train_loss": -6.9744768142700195, "global_step": 168298, "epoch": 4007} {"train_loss": -6.9572272300720215, "global_step": 168299, "epoch": 4007} {"train_loss": -6.965408802032471, "global_step": 168300, "epoch": 4007} {"train_loss": -7.0787177085876465, "global_step": 168301, "epoch": 4007} {"train_loss": -6.962697505950928, "global_step": 168302, "epoch": 4007} {"train_loss": -7.08153772354126, "global_step": 168303, "epoch": 4007} {"train_loss": -6.914267539978027, "global_step": 168304, "epoch": 4007} {"train_loss": -6.897884368896484, "global_step": 168305, "epoch": 4007} {"train_loss": -7.082769393920898, "global_step": 168306, "epoch": 4007} {"train_loss": -6.96732234954834, "global_step": 168307, "epoch": 4007} {"train_loss": -6.958439826965332, "global_step": 168308, "epoch": 4007} {"train_loss": -7.06218147277832, "global_step": 168309, "epoch": 4007} {"train_loss": -7.059329509735107, "global_step": 168310, "epoch": 4007} {"train_loss": -6.932440280914307, "global_step": 168311, "epoch": 4007} {"train_loss": -7.0432047843933105, "global_step": 168312, "epoch": 4007} {"train_loss": -6.981668472290039, "global_step": 168313, "epoch": 4007} {"train_loss": -6.886134147644043, "global_step": 168314, "epoch": 4007} {"train_loss": -7.026602745056152, "global_step": 168315, "epoch": 4007} {"train_loss": -7.067403316497803, "global_step": 168316, "epoch": 4007} {"train_loss": -7.041112899780273, "global_step": 168317, "epoch": 4007} {"train_loss": -7.027281761169434, "global_step": 168318, "epoch": 4007} {"train_loss": -7.101896286010742, "global_step": 168319, "epoch": 4007} {"train_loss": -7.038856506347656, "global_step": 168320, "epoch": 4007} {"train_loss": -7.007970809936523, "global_step": 168321, "epoch": 4007} {"train_loss": -7.02861213684082, "global_step": 168322, "epoch": 4007} {"train_loss": -6.915309429168701, "global_step": 168323, "epoch": 4007} {"train_loss": -6.997508525848389, "global_step": 168324, "epoch": 4007} {"train_loss": -7.085865497589111, "global_step": 168325, "epoch": 4007} {"train_loss": -6.988539218902588, "global_step": 168326, "epoch": 4007} {"train_loss": -6.951178550720215, "global_step": 168327, "epoch": 4007} {"train_loss": -7.033134460449219, "global_step": 168328, "epoch": 4007} {"train_loss": -7.017327308654785, "global_step": 168329, "epoch": 4007} {"train_loss": -7.0102081298828125, "global_step": 168330, "epoch": 4007} {"train_loss": -7.003775119781494, "global_step": 168331, "epoch": 4007} {"train_loss": -6.966485023498535, "global_step": 168332, "epoch": 4007} {"train_loss": -7.005497932434082, "global_step": 168333, "epoch": 4007} {"train_loss": -7.07275915145874, "global_step": 168334, "epoch": 4007} {"train_loss": -7.00242018699646, "global_step": 168335, "epoch": 4007, "val_loss": 68851.984375} {"train_loss": -7.022661209106445, "global_step": 168336, "epoch": 4008} {"train_loss": -6.980210304260254, "global_step": 168337, "epoch": 4008} {"train_loss": -7.050737380981445, "global_step": 168338, "epoch": 4008} {"train_loss": -6.987658500671387, "global_step": 168339, "epoch": 4008} {"train_loss": -7.077991485595703, "global_step": 168340, "epoch": 4008} {"train_loss": -7.012202262878418, "global_step": 168341, "epoch": 4008} {"train_loss": -7.0479230880737305, "global_step": 168342, "epoch": 4008} {"train_loss": -7.175061225891113, "global_step": 168343, "epoch": 4008} {"train_loss": -6.964757442474365, "global_step": 168344, "epoch": 4008} {"train_loss": -6.984428405761719, "global_step": 168345, "epoch": 4008} {"train_loss": -7.179573059082031, "global_step": 168346, "epoch": 4008} {"train_loss": -6.991853713989258, "global_step": 168347, "epoch": 4008} {"train_loss": -7.070156574249268, "global_step": 168348, "epoch": 4008} {"train_loss": -7.139194011688232, "global_step": 168349, "epoch": 4008} {"train_loss": -7.031253814697266, "global_step": 168350, "epoch": 4008} {"train_loss": -7.029806137084961, "global_step": 168351, "epoch": 4008} {"train_loss": -6.9956536293029785, "global_step": 168352, "epoch": 4008} {"train_loss": -6.994447708129883, "global_step": 168353, "epoch": 4008} {"train_loss": -6.996056079864502, "global_step": 168354, "epoch": 4008} {"train_loss": -7.049062728881836, "global_step": 168355, "epoch": 4008} {"train_loss": -7.021716117858887, "global_step": 168356, "epoch": 4008} {"train_loss": -7.123182773590088, "global_step": 168357, "epoch": 4008} {"train_loss": -7.115795612335205, "global_step": 168358, "epoch": 4008} {"train_loss": -6.864659309387207, "global_step": 168359, "epoch": 4008} {"train_loss": -6.963841438293457, "global_step": 168360, "epoch": 4008} {"train_loss": -7.0633745193481445, "global_step": 168361, "epoch": 4008} {"train_loss": -6.878406524658203, "global_step": 168362, "epoch": 4008} {"train_loss": -7.070766448974609, "global_step": 168363, "epoch": 4008} {"train_loss": -6.917614936828613, "global_step": 168364, "epoch": 4008} {"train_loss": -6.9463911056518555, "global_step": 168365, "epoch": 4008} {"train_loss": -7.0073089599609375, "global_step": 168366, "epoch": 4008} {"train_loss": -7.061978340148926, "global_step": 168367, "epoch": 4008} {"train_loss": -7.022879123687744, "global_step": 168368, "epoch": 4008} {"train_loss": -7.049245834350586, "global_step": 168369, "epoch": 4008} {"train_loss": -6.983264446258545, "global_step": 168370, "epoch": 4008} {"train_loss": -6.9084577560424805, "global_step": 168371, "epoch": 4008} {"train_loss": -7.053380489349365, "global_step": 168372, "epoch": 4008} {"train_loss": -6.958130359649658, "global_step": 168373, "epoch": 4008} {"train_loss": -6.9610490798950195, "global_step": 168374, "epoch": 4008} {"train_loss": -6.8972368240356445, "global_step": 168375, "epoch": 4008} {"train_loss": -6.984856605529785, "global_step": 168376, "epoch": 4008} {"train_loss": -7.016786450431461, "global_step": 168377, "epoch": 4008, "val_loss": 68700.8515625} {"train_loss": -6.883603096008301, "global_step": 168378, "epoch": 4009} {"train_loss": -7.009520530700684, "global_step": 168379, "epoch": 4009} {"train_loss": -6.901484966278076, "global_step": 168380, "epoch": 4009} {"train_loss": -6.944737434387207, "global_step": 168381, "epoch": 4009} {"train_loss": -6.926443099975586, "global_step": 168382, "epoch": 4009} {"train_loss": -6.923493385314941, "global_step": 168383, "epoch": 4009} {"train_loss": -7.092013359069824, "global_step": 168384, "epoch": 4009} {"train_loss": -6.891774654388428, "global_step": 168385, "epoch": 4009} {"train_loss": -7.007443904876709, "global_step": 168386, "epoch": 4009} {"train_loss": -7.017595291137695, "global_step": 168387, "epoch": 4009} {"train_loss": -6.957832336425781, "global_step": 168388, "epoch": 4009} {"train_loss": -6.966651916503906, "global_step": 168389, "epoch": 4009} {"train_loss": -6.956496238708496, "global_step": 168390, "epoch": 4009} {"train_loss": -6.96666145324707, "global_step": 168391, "epoch": 4009} {"train_loss": -7.07342004776001, "global_step": 168392, "epoch": 4009} {"train_loss": -7.077570915222168, "global_step": 168393, "epoch": 4009} {"train_loss": -6.955697536468506, "global_step": 168394, "epoch": 4009} {"train_loss": -7.078046798706055, "global_step": 168395, "epoch": 4009} {"train_loss": -7.089092254638672, "global_step": 168396, "epoch": 4009} {"train_loss": -7.03671932220459, "global_step": 168397, "epoch": 4009} {"train_loss": -7.08784294128418, "global_step": 168398, "epoch": 4009} {"train_loss": -6.97738790512085, "global_step": 168399, "epoch": 4009} {"train_loss": -7.078454971313477, "global_step": 168400, "epoch": 4009} {"train_loss": -7.019791603088379, "global_step": 168401, "epoch": 4009} {"train_loss": -6.923519134521484, "global_step": 168402, "epoch": 4009} {"train_loss": -6.976639270782471, "global_step": 168403, "epoch": 4009} {"train_loss": -6.937108516693115, "global_step": 168404, "epoch": 4009} {"train_loss": -6.952099323272705, "global_step": 168405, "epoch": 4009} {"train_loss": -6.967668533325195, "global_step": 168406, "epoch": 4009} {"train_loss": -6.981996536254883, "global_step": 168407, "epoch": 4009} {"train_loss": -6.956027984619141, "global_step": 168408, "epoch": 4009} {"train_loss": -6.971151351928711, "global_step": 168409, "epoch": 4009} {"train_loss": -7.070210933685303, "global_step": 168410, "epoch": 4009} {"train_loss": -7.060741424560547, "global_step": 168411, "epoch": 4009} {"train_loss": -7.041754245758057, "global_step": 168412, "epoch": 4009} {"train_loss": -6.949038028717041, "global_step": 168413, "epoch": 4009} {"train_loss": -6.954168319702148, "global_step": 168414, "epoch": 4009} {"train_loss": -7.091339111328125, "global_step": 168415, "epoch": 4009} {"train_loss": -7.0312933921813965, "global_step": 168416, "epoch": 4009} {"train_loss": -6.882299423217773, "global_step": 168417, "epoch": 4009} {"train_loss": -7.140970230102539, "global_step": 168418, "epoch": 4009} {"train_loss": -6.996709040233067, "global_step": 168419, "epoch": 4009, "val_loss": 68866.3984375} {"train_loss": -7.135587215423584, "global_step": 168420, "epoch": 4010} {"train_loss": -7.088205337524414, "global_step": 168421, "epoch": 4010} {"train_loss": -6.982265949249268, "global_step": 168422, "epoch": 4010} {"train_loss": -7.091300010681152, "global_step": 168423, "epoch": 4010} {"train_loss": -7.116406440734863, "global_step": 168424, "epoch": 4010} {"train_loss": -7.155409336090088, "global_step": 168425, "epoch": 4010} {"train_loss": -7.102780818939209, "global_step": 168426, "epoch": 4010} {"train_loss": -7.087289810180664, "global_step": 168427, "epoch": 4010} {"train_loss": -7.1375908851623535, "global_step": 168428, "epoch": 4010} {"train_loss": -7.104765892028809, "global_step": 168429, "epoch": 4010} {"train_loss": -7.080635070800781, "global_step": 168430, "epoch": 4010} {"train_loss": -7.012121200561523, "global_step": 168431, "epoch": 4010} {"train_loss": -7.11595344543457, "global_step": 168432, "epoch": 4010} {"train_loss": -7.104755878448486, "global_step": 168433, "epoch": 4010} {"train_loss": -7.023585319519043, "global_step": 168434, "epoch": 4010} {"train_loss": -7.004993438720703, "global_step": 168435, "epoch": 4010} {"train_loss": -7.064572334289551, "global_step": 168436, "epoch": 4010} {"train_loss": -7.239398002624512, "global_step": 168437, "epoch": 4010} {"train_loss": -7.124576091766357, "global_step": 168438, "epoch": 4010} {"train_loss": -7.212636947631836, "global_step": 168439, "epoch": 4010} {"train_loss": -7.082570552825928, "global_step": 168440, "epoch": 4010} {"train_loss": -7.059370040893555, "global_step": 168441, "epoch": 4010} {"train_loss": -7.1116132736206055, "global_step": 168442, "epoch": 4010} {"train_loss": -7.013850212097168, "global_step": 168443, "epoch": 4010} {"train_loss": -7.126800537109375, "global_step": 168444, "epoch": 4010} {"train_loss": -6.990121364593506, "global_step": 168445, "epoch": 4010} {"train_loss": -6.998229026794434, "global_step": 168446, "epoch": 4010} {"train_loss": -7.1651811599731445, "global_step": 168447, "epoch": 4010} {"train_loss": -7.043435096740723, "global_step": 168448, "epoch": 4010} {"train_loss": -7.0280046463012695, "global_step": 168449, "epoch": 4010} {"train_loss": -7.078812599182129, "global_step": 168450, "epoch": 4010} {"train_loss": -7.0285210609436035, "global_step": 168451, "epoch": 4010} {"train_loss": -6.897341728210449, "global_step": 168452, "epoch": 4010} {"train_loss": -7.023432731628418, "global_step": 168453, "epoch": 4010} {"train_loss": -6.993749141693115, "global_step": 168454, "epoch": 4010} {"train_loss": -7.044315338134766, "global_step": 168455, "epoch": 4010} {"train_loss": -7.0628838539123535, "global_step": 168456, "epoch": 4010} {"train_loss": -6.98707389831543, "global_step": 168457, "epoch": 4010} {"train_loss": -6.961480617523193, "global_step": 168458, "epoch": 4010} {"train_loss": -7.066108703613281, "global_step": 168459, "epoch": 4010} {"train_loss": -6.989537715911865, "global_step": 168460, "epoch": 4010} {"train_loss": -7.065546103886196, "global_step": 168461, "epoch": 4010, "val_loss": 68801.2578125} {"train_loss": -7.086261749267578, "global_step": 168462, "epoch": 4011} {"train_loss": -6.889878273010254, "global_step": 168463, "epoch": 4011} {"train_loss": -7.0522260665893555, "global_step": 168464, "epoch": 4011} {"train_loss": -7.011502265930176, "global_step": 168465, "epoch": 4011} {"train_loss": -7.01181697845459, "global_step": 168466, "epoch": 4011} {"train_loss": -7.1071977615356445, "global_step": 168467, "epoch": 4011} {"train_loss": -7.117531776428223, "global_step": 168468, "epoch": 4011} {"train_loss": -7.058419227600098, "global_step": 168469, "epoch": 4011} {"train_loss": -7.090890884399414, "global_step": 168470, "epoch": 4011} {"train_loss": -6.930487632751465, "global_step": 168471, "epoch": 4011} {"train_loss": -6.79896354675293, "global_step": 168472, "epoch": 4011} {"train_loss": -6.87660551071167, "global_step": 168473, "epoch": 4011} {"train_loss": -6.871260643005371, "global_step": 168474, "epoch": 4011} {"train_loss": -6.852934837341309, "global_step": 168475, "epoch": 4011} {"train_loss": -6.930375099182129, "global_step": 168476, "epoch": 4011} {"train_loss": -7.051858901977539, "global_step": 168477, "epoch": 4011} {"train_loss": -6.99704122543335, "global_step": 168478, "epoch": 4011} {"train_loss": -6.906214714050293, "global_step": 168479, "epoch": 4011} {"train_loss": -7.011710166931152, "global_step": 168480, "epoch": 4011} {"train_loss": -7.043028831481934, "global_step": 168481, "epoch": 4011} {"train_loss": -7.028885364532471, "global_step": 168482, "epoch": 4011} {"train_loss": -7.049827575683594, "global_step": 168483, "epoch": 4011} {"train_loss": -7.003307819366455, "global_step": 168484, "epoch": 4011} {"train_loss": -7.04287576675415, "global_step": 168485, "epoch": 4011} {"train_loss": -7.037039756774902, "global_step": 168486, "epoch": 4011} {"train_loss": -7.002902984619141, "global_step": 168487, "epoch": 4011} {"train_loss": -6.964953422546387, "global_step": 168488, "epoch": 4011} {"train_loss": -7.099634170532227, "global_step": 168489, "epoch": 4011} {"train_loss": -7.1283769607543945, "global_step": 168490, "epoch": 4011} {"train_loss": -7.032621383666992, "global_step": 168491, "epoch": 4011} {"train_loss": -7.079756259918213, "global_step": 168492, "epoch": 4011} {"train_loss": -7.122115135192871, "global_step": 168493, "epoch": 4011} {"train_loss": -7.043560981750488, "global_step": 168494, "epoch": 4011} {"train_loss": -7.047951698303223, "global_step": 168495, "epoch": 4011} {"train_loss": -7.0946455001831055, "global_step": 168496, "epoch": 4011} {"train_loss": -7.146263122558594, "global_step": 168497, "epoch": 4011} {"train_loss": -7.096706390380859, "global_step": 168498, "epoch": 4011} {"train_loss": -6.931703567504883, "global_step": 168499, "epoch": 4011} {"train_loss": -7.0888166427612305, "global_step": 168500, "epoch": 4011} {"train_loss": -7.104530334472656, "global_step": 168501, "epoch": 4011} {"train_loss": -7.0070905685424805, "global_step": 168502, "epoch": 4011} {"train_loss": -7.02239111491612, "global_step": 168503, "epoch": 4011, "val_loss": 68809.0625} {"train_loss": -7.1544294357299805, "global_step": 168504, "epoch": 4012} {"train_loss": -7.110841751098633, "global_step": 168505, "epoch": 4012} {"train_loss": -7.073456287384033, "global_step": 168506, "epoch": 4012} {"train_loss": -7.082354545593262, "global_step": 168507, "epoch": 4012} {"train_loss": -7.0244951248168945, "global_step": 168508, "epoch": 4012} {"train_loss": -7.083132743835449, "global_step": 168509, "epoch": 4012} {"train_loss": -7.12459659576416, "global_step": 168510, "epoch": 4012} {"train_loss": -7.060922622680664, "global_step": 168511, "epoch": 4012} {"train_loss": -7.085879325866699, "global_step": 168512, "epoch": 4012} {"train_loss": -7.041173934936523, "global_step": 168513, "epoch": 4012} {"train_loss": -7.0709614753723145, "global_step": 168514, "epoch": 4012} {"train_loss": -6.99161434173584, "global_step": 168515, "epoch": 4012} {"train_loss": -7.0238189697265625, "global_step": 168516, "epoch": 4012} {"train_loss": -7.0740556716918945, "global_step": 168517, "epoch": 4012} {"train_loss": -7.054542541503906, "global_step": 168518, "epoch": 4012} {"train_loss": -7.01612663269043, "global_step": 168519, "epoch": 4012} {"train_loss": -7.108550071716309, "global_step": 168520, "epoch": 4012} {"train_loss": -7.116565704345703, "global_step": 168521, "epoch": 4012} {"train_loss": -7.045729637145996, "global_step": 168522, "epoch": 4012} {"train_loss": -6.917389869689941, "global_step": 168523, "epoch": 4012} {"train_loss": -6.932181358337402, "global_step": 168524, "epoch": 4012} {"train_loss": -7.059351921081543, "global_step": 168525, "epoch": 4012} {"train_loss": -6.917003154754639, "global_step": 168526, "epoch": 4012} {"train_loss": -6.942949295043945, "global_step": 168527, "epoch": 4012} {"train_loss": -7.034285068511963, "global_step": 168528, "epoch": 4012} {"train_loss": -6.968801498413086, "global_step": 168529, "epoch": 4012} {"train_loss": -6.925543308258057, "global_step": 168530, "epoch": 4012} {"train_loss": -6.859582901000977, "global_step": 168531, "epoch": 4012} {"train_loss": -7.0884246826171875, "global_step": 168532, "epoch": 4012} {"train_loss": -6.809385299682617, "global_step": 168533, "epoch": 4012} {"train_loss": -7.022136211395264, "global_step": 168534, "epoch": 4012} {"train_loss": -6.949193954467773, "global_step": 168535, "epoch": 4012} {"train_loss": -6.882417678833008, "global_step": 168536, "epoch": 4012} {"train_loss": -7.006168842315674, "global_step": 168537, "epoch": 4012} {"train_loss": -6.975780010223389, "global_step": 168538, "epoch": 4012} {"train_loss": -7.004553318023682, "global_step": 168539, "epoch": 4012} {"train_loss": -6.8682732582092285, "global_step": 168540, "epoch": 4012} {"train_loss": -6.994668960571289, "global_step": 168541, "epoch": 4012} {"train_loss": -6.962079048156738, "global_step": 168542, "epoch": 4012} {"train_loss": -7.015969753265381, "global_step": 168543, "epoch": 4012} {"train_loss": -7.003788948059082, "global_step": 168544, "epoch": 4012} {"train_loss": -7.009179648898897, "global_step": 168545, "epoch": 4012, "val_loss": 69088.6953125} {"train_loss": -7.120650291442871, "global_step": 168546, "epoch": 4013} {"train_loss": -6.8862528800964355, "global_step": 168547, "epoch": 4013} {"train_loss": -7.062277317047119, "global_step": 168548, "epoch": 4013} {"train_loss": -7.108634948730469, "global_step": 168549, "epoch": 4013} {"train_loss": -6.983155727386475, "global_step": 168550, "epoch": 4013} {"train_loss": -7.007322788238525, "global_step": 168551, "epoch": 4013} {"train_loss": -7.0349016189575195, "global_step": 168552, "epoch": 4013} {"train_loss": -6.990555286407471, "global_step": 168553, "epoch": 4013} {"train_loss": -7.0717878341674805, "global_step": 168554, "epoch": 4013} {"train_loss": -6.988508224487305, "global_step": 168555, "epoch": 4013} {"train_loss": -6.936318397521973, "global_step": 168556, "epoch": 4013} {"train_loss": -6.913978576660156, "global_step": 168557, "epoch": 4013} {"train_loss": -6.977445602416992, "global_step": 168558, "epoch": 4013} {"train_loss": -7.005266189575195, "global_step": 168559, "epoch": 4013} {"train_loss": -6.973360538482666, "global_step": 168560, "epoch": 4013} {"train_loss": -7.023486137390137, "global_step": 168561, "epoch": 4013} {"train_loss": -6.954170227050781, "global_step": 168562, "epoch": 4013} {"train_loss": -6.943564414978027, "global_step": 168563, "epoch": 4013} {"train_loss": -6.972920894622803, "global_step": 168564, "epoch": 4013} {"train_loss": -6.935729026794434, "global_step": 168565, "epoch": 4013} {"train_loss": -6.983478546142578, "global_step": 168566, "epoch": 4013} {"train_loss": -6.975749969482422, "global_step": 168567, "epoch": 4013} {"train_loss": -7.0860676765441895, "global_step": 168568, "epoch": 4013} {"train_loss": -6.940871715545654, "global_step": 168569, "epoch": 4013} {"train_loss": -7.007692337036133, "global_step": 168570, "epoch": 4013} {"train_loss": -7.025210380554199, "global_step": 168571, "epoch": 4013} {"train_loss": -7.109396457672119, "global_step": 168572, "epoch": 4013} {"train_loss": -7.109942436218262, "global_step": 168573, "epoch": 4013} {"train_loss": -6.935420989990234, "global_step": 168574, "epoch": 4013} {"train_loss": -6.945907115936279, "global_step": 168575, "epoch": 4013} {"train_loss": -6.978994369506836, "global_step": 168576, "epoch": 4013} {"train_loss": -6.9583916664123535, "global_step": 168577, "epoch": 4013} {"train_loss": -7.090339660644531, "global_step": 168578, "epoch": 4013} {"train_loss": -7.038219451904297, "global_step": 168579, "epoch": 4013} {"train_loss": -6.984988212585449, "global_step": 168580, "epoch": 4013} {"train_loss": -7.057631015777588, "global_step": 168581, "epoch": 4013} {"train_loss": -7.119712829589844, "global_step": 168582, "epoch": 4013} {"train_loss": -6.970722198486328, "global_step": 168583, "epoch": 4013} {"train_loss": -7.064872741699219, "global_step": 168584, "epoch": 4013} {"train_loss": -7.048043727874756, "global_step": 168585, "epoch": 4013} {"train_loss": -7.059316635131836, "global_step": 168586, "epoch": 4013} {"train_loss": -7.009033486956642, "global_step": 168587, "epoch": 4013, "val_loss": 68924.03125} {"train_loss": -7.081218719482422, "global_step": 168588, "epoch": 4014} {"train_loss": -7.017329216003418, "global_step": 168589, "epoch": 4014} {"train_loss": -7.049661636352539, "global_step": 168590, "epoch": 4014} {"train_loss": -6.953910827636719, "global_step": 168591, "epoch": 4014} {"train_loss": -7.037402153015137, "global_step": 168592, "epoch": 4014} {"train_loss": -7.042022705078125, "global_step": 168593, "epoch": 4014} {"train_loss": -6.980215549468994, "global_step": 168594, "epoch": 4014} {"train_loss": -7.0290117263793945, "global_step": 168595, "epoch": 4014} {"train_loss": -6.867229461669922, "global_step": 168596, "epoch": 4014} {"train_loss": -7.0711517333984375, "global_step": 168597, "epoch": 4014} {"train_loss": -7.019359111785889, "global_step": 168598, "epoch": 4014} {"train_loss": -6.947660446166992, "global_step": 168599, "epoch": 4014} {"train_loss": -7.054948806762695, "global_step": 168600, "epoch": 4014} {"train_loss": -7.102640151977539, "global_step": 168601, "epoch": 4014} {"train_loss": -7.035717010498047, "global_step": 168602, "epoch": 4014} {"train_loss": -6.989678859710693, "global_step": 168603, "epoch": 4014} {"train_loss": -7.060024261474609, "global_step": 168604, "epoch": 4014} {"train_loss": -7.103899955749512, "global_step": 168605, "epoch": 4014} {"train_loss": -7.009269714355469, "global_step": 168606, "epoch": 4014} {"train_loss": -7.058626174926758, "global_step": 168607, "epoch": 4014} {"train_loss": -6.780967712402344, "global_step": 168608, "epoch": 4014} {"train_loss": -6.9027509689331055, "global_step": 168609, "epoch": 4014} {"train_loss": -7.098455429077148, "global_step": 168610, "epoch": 4014} {"train_loss": -6.972403526306152, "global_step": 168611, "epoch": 4014} {"train_loss": -6.972204685211182, "global_step": 168612, "epoch": 4014} {"train_loss": -6.998605728149414, "global_step": 168613, "epoch": 4014} {"train_loss": -6.987763404846191, "global_step": 168614, "epoch": 4014} {"train_loss": -6.986780166625977, "global_step": 168615, "epoch": 4014} {"train_loss": -7.031394958496094, "global_step": 168616, "epoch": 4014} {"train_loss": -6.900705337524414, "global_step": 168617, "epoch": 4014} {"train_loss": -7.030125141143799, "global_step": 168618, "epoch": 4014} {"train_loss": -7.031811714172363, "global_step": 168619, "epoch": 4014} {"train_loss": -6.916376113891602, "global_step": 168620, "epoch": 4014} {"train_loss": -6.963996410369873, "global_step": 168621, "epoch": 4014} {"train_loss": -6.929514408111572, "global_step": 168622, "epoch": 4014} {"train_loss": -6.976790428161621, "global_step": 168623, "epoch": 4014} {"train_loss": -6.950528144836426, "global_step": 168624, "epoch": 4014} {"train_loss": -6.932336807250977, "global_step": 168625, "epoch": 4014} {"train_loss": -6.947484016418457, "global_step": 168626, "epoch": 4014} {"train_loss": -7.015632152557373, "global_step": 168627, "epoch": 4014} {"train_loss": -6.912014007568359, "global_step": 168628, "epoch": 4014} {"train_loss": -6.99071817171006, "global_step": 168629, "epoch": 4014, "val_loss": 69195.0234375} {"train_loss": -6.914793968200684, "global_step": 168630, "epoch": 4015} {"train_loss": -6.855585098266602, "global_step": 168631, "epoch": 4015} {"train_loss": -7.036245822906494, "global_step": 168632, "epoch": 4015} {"train_loss": -6.793440818786621, "global_step": 168633, "epoch": 4015} {"train_loss": -6.8115692138671875, "global_step": 168634, "epoch": 4015} {"train_loss": -6.97977352142334, "global_step": 168635, "epoch": 4015} {"train_loss": -6.549299240112305, "global_step": 168636, "epoch": 4015} {"train_loss": -6.969083309173584, "global_step": 168637, "epoch": 4015} {"train_loss": -6.914259433746338, "global_step": 168638, "epoch": 4015} {"train_loss": -7.097987174987793, "global_step": 168639, "epoch": 4015} {"train_loss": -7.024223804473877, "global_step": 168640, "epoch": 4015} {"train_loss": -6.923269271850586, "global_step": 168641, "epoch": 4015} {"train_loss": -6.865588188171387, "global_step": 168642, "epoch": 4015} {"train_loss": -7.007962226867676, "global_step": 168643, "epoch": 4015} {"train_loss": -6.994708061218262, "global_step": 168644, "epoch": 4015} {"train_loss": -6.929815292358398, "global_step": 168645, "epoch": 4015} {"train_loss": -7.07303524017334, "global_step": 168646, "epoch": 4015} {"train_loss": -6.981235504150391, "global_step": 168647, "epoch": 4015} {"train_loss": -6.855439186096191, "global_step": 168648, "epoch": 4015} {"train_loss": -7.031432151794434, "global_step": 168649, "epoch": 4015} {"train_loss": -7.0425872802734375, "global_step": 168650, "epoch": 4015} {"train_loss": -7.043302536010742, "global_step": 168651, "epoch": 4015} {"train_loss": -7.112998962402344, "global_step": 168652, "epoch": 4015} {"train_loss": -7.108477592468262, "global_step": 168653, "epoch": 4015} {"train_loss": -7.073369979858398, "global_step": 168654, "epoch": 4015} {"train_loss": -6.998199462890625, "global_step": 168655, "epoch": 4015} {"train_loss": -7.067914962768555, "global_step": 168656, "epoch": 4015} {"train_loss": -7.103947639465332, "global_step": 168657, "epoch": 4015} {"train_loss": -6.988035678863525, "global_step": 168658, "epoch": 4015} {"train_loss": -7.08562707901001, "global_step": 168659, "epoch": 4015} {"train_loss": -7.080799579620361, "global_step": 168660, "epoch": 4015} {"train_loss": -7.010329723358154, "global_step": 168661, "epoch": 4015} {"train_loss": -6.987332344055176, "global_step": 168662, "epoch": 4015} {"train_loss": -6.999227523803711, "global_step": 168663, "epoch": 4015} {"train_loss": -7.071462631225586, "global_step": 168664, "epoch": 4015} {"train_loss": -6.97084903717041, "global_step": 168665, "epoch": 4015} {"train_loss": -6.953230381011963, "global_step": 168666, "epoch": 4015} {"train_loss": -7.023338317871094, "global_step": 168667, "epoch": 4015} {"train_loss": -7.009180068969727, "global_step": 168668, "epoch": 4015} {"train_loss": -6.977888107299805, "global_step": 168669, "epoch": 4015} {"train_loss": -7.009769439697266, "global_step": 168670, "epoch": 4015} {"train_loss": -6.986553771155221, "global_step": 168671, "epoch": 4015, "val_loss": 68884.625} {"train_loss": -6.951801300048828, "global_step": 168672, "epoch": 4016} {"train_loss": -7.073227405548096, "global_step": 168673, "epoch": 4016} {"train_loss": -7.046768665313721, "global_step": 168674, "epoch": 4016} {"train_loss": -7.019503593444824, "global_step": 168675, "epoch": 4016} {"train_loss": -6.964364528656006, "global_step": 168676, "epoch": 4016} {"train_loss": -6.983458518981934, "global_step": 168677, "epoch": 4016} {"train_loss": -7.039639472961426, "global_step": 168678, "epoch": 4016} {"train_loss": -6.9407548904418945, "global_step": 168679, "epoch": 4016} {"train_loss": -7.013309001922607, "global_step": 168680, "epoch": 4016} {"train_loss": -6.884535312652588, "global_step": 168681, "epoch": 4016} {"train_loss": -7.062067031860352, "global_step": 168682, "epoch": 4016} {"train_loss": -6.925224781036377, "global_step": 168683, "epoch": 4016} {"train_loss": -6.871935844421387, "global_step": 168684, "epoch": 4016} {"train_loss": -6.959963798522949, "global_step": 168685, "epoch": 4016} {"train_loss": -7.068993091583252, "global_step": 168686, "epoch": 4016} {"train_loss": -6.746526718139648, "global_step": 168687, "epoch": 4016} {"train_loss": -6.95644474029541, "global_step": 168688, "epoch": 4016} {"train_loss": -6.7941083908081055, "global_step": 168689, "epoch": 4016} {"train_loss": -7.005299091339111, "global_step": 168690, "epoch": 4016} {"train_loss": -6.935803413391113, "global_step": 168691, "epoch": 4016} {"train_loss": -7.025656700134277, "global_step": 168692, "epoch": 4016} {"train_loss": -6.99544620513916, "global_step": 168693, "epoch": 4016} {"train_loss": -6.97368860244751, "global_step": 168694, "epoch": 4016} {"train_loss": -7.014495849609375, "global_step": 168695, "epoch": 4016} {"train_loss": -6.954360485076904, "global_step": 168696, "epoch": 4016} {"train_loss": -6.939221382141113, "global_step": 168697, "epoch": 4016} {"train_loss": -7.031152725219727, "global_step": 168698, "epoch": 4016} {"train_loss": -6.913645267486572, "global_step": 168699, "epoch": 4016} {"train_loss": -7.040083885192871, "global_step": 168700, "epoch": 4016} {"train_loss": -6.853382110595703, "global_step": 168701, "epoch": 4016} {"train_loss": -7.106163501739502, "global_step": 168702, "epoch": 4016} {"train_loss": -6.912802696228027, "global_step": 168703, "epoch": 4016} {"train_loss": -6.973018646240234, "global_step": 168704, "epoch": 4016} {"train_loss": -6.874973297119141, "global_step": 168705, "epoch": 4016} {"train_loss": -6.963680744171143, "global_step": 168706, "epoch": 4016} {"train_loss": -6.946288585662842, "global_step": 168707, "epoch": 4016} {"train_loss": -6.948003768920898, "global_step": 168708, "epoch": 4016} {"train_loss": -6.959840774536133, "global_step": 168709, "epoch": 4016} {"train_loss": -7.074098587036133, "global_step": 168710, "epoch": 4016} {"train_loss": -7.060638427734375, "global_step": 168711, "epoch": 4016} {"train_loss": -7.072298049926758, "global_step": 168712, "epoch": 4016} {"train_loss": -6.972622031257266, "global_step": 168713, "epoch": 4016, "val_loss": 68889.3125} {"train_loss": -7.054473400115967, "global_step": 168714, "epoch": 4017} {"train_loss": -6.9571943283081055, "global_step": 168715, "epoch": 4017} {"train_loss": -7.112876892089844, "global_step": 168716, "epoch": 4017} {"train_loss": -7.065141677856445, "global_step": 168717, "epoch": 4017} {"train_loss": -7.042494773864746, "global_step": 168718, "epoch": 4017} {"train_loss": -7.089186191558838, "global_step": 168719, "epoch": 4017} {"train_loss": -6.9975762367248535, "global_step": 168720, "epoch": 4017} {"train_loss": -7.112766265869141, "global_step": 168721, "epoch": 4017} {"train_loss": -7.120456695556641, "global_step": 168722, "epoch": 4017} {"train_loss": -7.01388692855835, "global_step": 168723, "epoch": 4017} {"train_loss": -7.058929443359375, "global_step": 168724, "epoch": 4017} {"train_loss": -7.067586898803711, "global_step": 168725, "epoch": 4017} {"train_loss": -7.077540397644043, "global_step": 168726, "epoch": 4017} {"train_loss": -6.947080612182617, "global_step": 168727, "epoch": 4017} {"train_loss": -6.915543079376221, "global_step": 168728, "epoch": 4017} {"train_loss": -7.109917163848877, "global_step": 168729, "epoch": 4017} {"train_loss": -6.941033840179443, "global_step": 168730, "epoch": 4017} {"train_loss": -6.951874256134033, "global_step": 168731, "epoch": 4017} {"train_loss": -7.0318756103515625, "global_step": 168732, "epoch": 4017} {"train_loss": -7.011538982391357, "global_step": 168733, "epoch": 4017} {"train_loss": -6.917839050292969, "global_step": 168734, "epoch": 4017} {"train_loss": -6.927781105041504, "global_step": 168735, "epoch": 4017} {"train_loss": -7.019026756286621, "global_step": 168736, "epoch": 4017} {"train_loss": -6.944878578186035, "global_step": 168737, "epoch": 4017} {"train_loss": -6.816556930541992, "global_step": 168738, "epoch": 4017} {"train_loss": -7.042253494262695, "global_step": 168739, "epoch": 4017} {"train_loss": -6.879335880279541, "global_step": 168740, "epoch": 4017} {"train_loss": -7.007829666137695, "global_step": 168741, "epoch": 4017} {"train_loss": -6.958547115325928, "global_step": 168742, "epoch": 4017} {"train_loss": -6.887569427490234, "global_step": 168743, "epoch": 4017} {"train_loss": -7.023110389709473, "global_step": 168744, "epoch": 4017} {"train_loss": -6.838249206542969, "global_step": 168745, "epoch": 4017} {"train_loss": -7.011849403381348, "global_step": 168746, "epoch": 4017} {"train_loss": -6.86527156829834, "global_step": 168747, "epoch": 4017} {"train_loss": -6.980036735534668, "global_step": 168748, "epoch": 4017} {"train_loss": -7.001180648803711, "global_step": 168749, "epoch": 4017} {"train_loss": -6.922154426574707, "global_step": 168750, "epoch": 4017} {"train_loss": -6.942286014556885, "global_step": 168751, "epoch": 4017} {"train_loss": -6.943540573120117, "global_step": 168752, "epoch": 4017} {"train_loss": -7.077120780944824, "global_step": 168753, "epoch": 4017} {"train_loss": -6.883411407470703, "global_step": 168754, "epoch": 4017} {"train_loss": -6.992094210215977, "global_step": 168755, "epoch": 4017, "val_loss": 68832.4375} {"train_loss": -6.908699035644531, "global_step": 168756, "epoch": 4018} {"train_loss": -6.902226448059082, "global_step": 168757, "epoch": 4018} {"train_loss": -6.664179801940918, "global_step": 168758, "epoch": 4018} {"train_loss": -7.084780693054199, "global_step": 168759, "epoch": 4018} {"train_loss": -6.986678123474121, "global_step": 168760, "epoch": 4018} {"train_loss": -6.863827705383301, "global_step": 168761, "epoch": 4018} {"train_loss": -6.8733015060424805, "global_step": 168762, "epoch": 4018} {"train_loss": -6.970601558685303, "global_step": 168763, "epoch": 4018} {"train_loss": -6.834986209869385, "global_step": 168764, "epoch": 4018} {"train_loss": -6.829799652099609, "global_step": 168765, "epoch": 4018} {"train_loss": -6.898548126220703, "global_step": 168766, "epoch": 4018} {"train_loss": -7.002821922302246, "global_step": 168767, "epoch": 4018} {"train_loss": -6.9991254806518555, "global_step": 168768, "epoch": 4018} {"train_loss": -7.00248384475708, "global_step": 168769, "epoch": 4018} {"train_loss": -6.881773948669434, "global_step": 168770, "epoch": 4018} {"train_loss": -6.9216179847717285, "global_step": 168771, "epoch": 4018} {"train_loss": -6.907031059265137, "global_step": 168772, "epoch": 4018} {"train_loss": -6.861440181732178, "global_step": 168773, "epoch": 4018} {"train_loss": -6.978493690490723, "global_step": 168774, "epoch": 4018} {"train_loss": -6.852714538574219, "global_step": 168775, "epoch": 4018} {"train_loss": -6.909882068634033, "global_step": 168776, "epoch": 4018} {"train_loss": -6.939830303192139, "global_step": 168777, "epoch": 4018} {"train_loss": -6.987919807434082, "global_step": 168778, "epoch": 4018} {"train_loss": -6.91389274597168, "global_step": 168779, "epoch": 4018} {"train_loss": -7.10243034362793, "global_step": 168780, "epoch": 4018} {"train_loss": -6.845476150512695, "global_step": 168781, "epoch": 4018} {"train_loss": -6.954575538635254, "global_step": 168782, "epoch": 4018} {"train_loss": -6.913209915161133, "global_step": 168783, "epoch": 4018} {"train_loss": -6.980172157287598, "global_step": 168784, "epoch": 4018} {"train_loss": -6.741543769836426, "global_step": 168785, "epoch": 4018} {"train_loss": -7.012184143066406, "global_step": 168786, "epoch": 4018} {"train_loss": -6.753963470458984, "global_step": 168787, "epoch": 4018} {"train_loss": -7.020890235900879, "global_step": 168788, "epoch": 4018} {"train_loss": -7.002036094665527, "global_step": 168789, "epoch": 4018} {"train_loss": -7.018329620361328, "global_step": 168790, "epoch": 4018} {"train_loss": -6.959934711456299, "global_step": 168791, "epoch": 4018} {"train_loss": -7.027154922485352, "global_step": 168792, "epoch": 4018} {"train_loss": -6.916715621948242, "global_step": 168793, "epoch": 4018} {"train_loss": -7.054635047912598, "global_step": 168794, "epoch": 4018} {"train_loss": -6.9827680587768555, "global_step": 168795, "epoch": 4018} {"train_loss": -6.937575340270996, "global_step": 168796, "epoch": 4018} {"train_loss": -6.932340360823131, "global_step": 168797, "epoch": 4018, "val_loss": 68850.78125} {"train_loss": -7.090470314025879, "global_step": 168798, "epoch": 4019} {"train_loss": -7.042691230773926, "global_step": 168799, "epoch": 4019} {"train_loss": -7.019863605499268, "global_step": 168800, "epoch": 4019} {"train_loss": -6.92977237701416, "global_step": 168801, "epoch": 4019} {"train_loss": -6.944144248962402, "global_step": 168802, "epoch": 4019} {"train_loss": -7.0938720703125, "global_step": 168803, "epoch": 4019} {"train_loss": -7.122153282165527, "global_step": 168804, "epoch": 4019} {"train_loss": -7.1641974449157715, "global_step": 168805, "epoch": 4019} {"train_loss": -7.083740234375, "global_step": 168806, "epoch": 4019} {"train_loss": -7.065982818603516, "global_step": 168807, "epoch": 4019} {"train_loss": -7.015991687774658, "global_step": 168808, "epoch": 4019} {"train_loss": -7.113155841827393, "global_step": 168809, "epoch": 4019} {"train_loss": -7.069149017333984, "global_step": 168810, "epoch": 4019} {"train_loss": -7.0194902420043945, "global_step": 168811, "epoch": 4019} {"train_loss": -7.145862579345703, "global_step": 168812, "epoch": 4019} {"train_loss": -7.137537479400635, "global_step": 168813, "epoch": 4019} {"train_loss": -7.0500688552856445, "global_step": 168814, "epoch": 4019} {"train_loss": -7.010870933532715, "global_step": 168815, "epoch": 4019} {"train_loss": -7.124296188354492, "global_step": 168816, "epoch": 4019} {"train_loss": -7.062740325927734, "global_step": 168817, "epoch": 4019} {"train_loss": -6.983977317810059, "global_step": 168818, "epoch": 4019} {"train_loss": -7.058680534362793, "global_step": 168819, "epoch": 4019} {"train_loss": -7.086100101470947, "global_step": 168820, "epoch": 4019} {"train_loss": -7.037895202636719, "global_step": 168821, "epoch": 4019} {"train_loss": -7.0756449699401855, "global_step": 168822, "epoch": 4019} {"train_loss": -7.130751609802246, "global_step": 168823, "epoch": 4019} {"train_loss": -6.973825454711914, "global_step": 168824, "epoch": 4019} {"train_loss": -7.021565914154053, "global_step": 168825, "epoch": 4019} {"train_loss": -7.098444938659668, "global_step": 168826, "epoch": 4019} {"train_loss": -6.889987945556641, "global_step": 168827, "epoch": 4019} {"train_loss": -7.021270751953125, "global_step": 168828, "epoch": 4019} {"train_loss": -7.1248273849487305, "global_step": 168829, "epoch": 4019} {"train_loss": -6.96390438079834, "global_step": 168830, "epoch": 4019} {"train_loss": -6.9297590255737305, "global_step": 168831, "epoch": 4019} {"train_loss": -6.920058250427246, "global_step": 168832, "epoch": 4019} {"train_loss": -7.091025352478027, "global_step": 168833, "epoch": 4019} {"train_loss": -6.853086471557617, "global_step": 168834, "epoch": 4019} {"train_loss": -7.0140604972839355, "global_step": 168835, "epoch": 4019} {"train_loss": -6.98311185836792, "global_step": 168836, "epoch": 4019} {"train_loss": -6.830558776855469, "global_step": 168837, "epoch": 4019} {"train_loss": -7.018892288208008, "global_step": 168838, "epoch": 4019} {"train_loss": -7.034254312515259, "global_step": 168839, "epoch": 4019, "val_loss": 69006.890625} {"train_loss": -6.898648262023926, "global_step": 168840, "epoch": 4020} {"train_loss": -6.987408638000488, "global_step": 168841, "epoch": 4020} {"train_loss": -6.929969310760498, "global_step": 168842, "epoch": 4020} {"train_loss": -7.07255744934082, "global_step": 168843, "epoch": 4020} {"train_loss": -6.910789489746094, "global_step": 168844, "epoch": 4020} {"train_loss": -6.950640678405762, "global_step": 168845, "epoch": 4020} {"train_loss": -6.987992286682129, "global_step": 168846, "epoch": 4020} {"train_loss": -7.004131317138672, "global_step": 168847, "epoch": 4020} {"train_loss": -7.098114013671875, "global_step": 168848, "epoch": 4020} {"train_loss": -6.954217910766602, "global_step": 168849, "epoch": 4020} {"train_loss": -6.999044418334961, "global_step": 168850, "epoch": 4020} {"train_loss": -6.8104248046875, "global_step": 168851, "epoch": 4020} {"train_loss": -6.963354587554932, "global_step": 168852, "epoch": 4020} {"train_loss": -6.885482311248779, "global_step": 168853, "epoch": 4020} {"train_loss": -6.879087448120117, "global_step": 168854, "epoch": 4020} {"train_loss": -7.090163230895996, "global_step": 168855, "epoch": 4020} {"train_loss": -6.912437438964844, "global_step": 168856, "epoch": 4020} {"train_loss": -7.044083595275879, "global_step": 168857, "epoch": 4020} {"train_loss": -7.0055460929870605, "global_step": 168858, "epoch": 4020} {"train_loss": -7.071150779724121, "global_step": 168859, "epoch": 4020} {"train_loss": -7.09670877456665, "global_step": 168860, "epoch": 4020} {"train_loss": -6.885156631469727, "global_step": 168861, "epoch": 4020} {"train_loss": -6.9644389152526855, "global_step": 168862, "epoch": 4020} {"train_loss": -7.038646697998047, "global_step": 168863, "epoch": 4020} {"train_loss": -7.012038230895996, "global_step": 168864, "epoch": 4020} {"train_loss": -6.8819379806518555, "global_step": 168865, "epoch": 4020} {"train_loss": -6.966678142547607, "global_step": 168866, "epoch": 4020} {"train_loss": -7.082345962524414, "global_step": 168867, "epoch": 4020} {"train_loss": -6.763734817504883, "global_step": 168868, "epoch": 4020} {"train_loss": -6.97558069229126, "global_step": 168869, "epoch": 4020} {"train_loss": -7.022593975067139, "global_step": 168870, "epoch": 4020} {"train_loss": -6.893835067749023, "global_step": 168871, "epoch": 4020} {"train_loss": -7.026852607727051, "global_step": 168872, "epoch": 4020} {"train_loss": -6.901571273803711, "global_step": 168873, "epoch": 4020} {"train_loss": -6.884049415588379, "global_step": 168874, "epoch": 4020} {"train_loss": -7.034148216247559, "global_step": 168875, "epoch": 4020} {"train_loss": -6.900787353515625, "global_step": 168876, "epoch": 4020} {"train_loss": -6.979121208190918, "global_step": 168877, "epoch": 4020} {"train_loss": -6.913213729858398, "global_step": 168878, "epoch": 4020} {"train_loss": -6.882110595703125, "global_step": 168879, "epoch": 4020} {"train_loss": -6.955575942993164, "global_step": 168880, "epoch": 4020} {"train_loss": -6.962367159979684, "global_step": 168881, "epoch": 4020, "val_loss": 69071.3203125} {"train_loss": -6.866057872772217, "global_step": 168882, "epoch": 4021} {"train_loss": -6.980651378631592, "global_step": 168883, "epoch": 4021} {"train_loss": -6.935626029968262, "global_step": 168884, "epoch": 4021} {"train_loss": -6.961535453796387, "global_step": 168885, "epoch": 4021} {"train_loss": -6.908962726593018, "global_step": 168886, "epoch": 4021} {"train_loss": -6.913966655731201, "global_step": 168887, "epoch": 4021} {"train_loss": -6.843043804168701, "global_step": 168888, "epoch": 4021} {"train_loss": -7.010858058929443, "global_step": 168889, "epoch": 4021} {"train_loss": -6.95745849609375, "global_step": 168890, "epoch": 4021} {"train_loss": -6.983095169067383, "global_step": 168891, "epoch": 4021} {"train_loss": -6.905786514282227, "global_step": 168892, "epoch": 4021} {"train_loss": -6.933742523193359, "global_step": 168893, "epoch": 4021} {"train_loss": -6.843232154846191, "global_step": 168894, "epoch": 4021} {"train_loss": -6.875122547149658, "global_step": 168895, "epoch": 4021} {"train_loss": -6.989513397216797, "global_step": 168896, "epoch": 4021} {"train_loss": -6.9892730712890625, "global_step": 168897, "epoch": 4021} {"train_loss": -6.980345726013184, "global_step": 168898, "epoch": 4021} {"train_loss": -6.957039833068848, "global_step": 168899, "epoch": 4021} {"train_loss": -6.9034905433654785, "global_step": 168900, "epoch": 4021} {"train_loss": -7.0276923179626465, "global_step": 168901, "epoch": 4021} {"train_loss": -6.868361949920654, "global_step": 168902, "epoch": 4021} {"train_loss": -6.92515754699707, "global_step": 168903, "epoch": 4021} {"train_loss": -6.884439945220947, "global_step": 168904, "epoch": 4021} {"train_loss": -6.964001655578613, "global_step": 168905, "epoch": 4021} {"train_loss": -6.929746627807617, "global_step": 168906, "epoch": 4021} {"train_loss": -6.934319496154785, "global_step": 168907, "epoch": 4021} {"train_loss": -7.045668125152588, "global_step": 168908, "epoch": 4021} {"train_loss": -6.896388053894043, "global_step": 168909, "epoch": 4021} {"train_loss": -6.926662921905518, "global_step": 168910, "epoch": 4021} {"train_loss": -6.982210159301758, "global_step": 168911, "epoch": 4021} {"train_loss": -6.936836242675781, "global_step": 168912, "epoch": 4021} {"train_loss": -6.947880744934082, "global_step": 168913, "epoch": 4021} {"train_loss": -6.8901567459106445, "global_step": 168914, "epoch": 4021} {"train_loss": -7.031162261962891, "global_step": 168915, "epoch": 4021} {"train_loss": -7.0485615730285645, "global_step": 168916, "epoch": 4021} {"train_loss": -6.955746173858643, "global_step": 168917, "epoch": 4021} {"train_loss": -6.990670204162598, "global_step": 168918, "epoch": 4021} {"train_loss": -6.987340927124023, "global_step": 168919, "epoch": 4021} {"train_loss": -7.115850448608398, "global_step": 168920, "epoch": 4021} {"train_loss": -7.070244789123535, "global_step": 168921, "epoch": 4021} {"train_loss": -7.060452938079834, "global_step": 168922, "epoch": 4021} {"train_loss": -6.957578511465163, "global_step": 168923, "epoch": 4021, "val_loss": 69053.3046875} {"train_loss": -7.078348159790039, "global_step": 168924, "epoch": 4022} {"train_loss": -6.95194673538208, "global_step": 168925, "epoch": 4022} {"train_loss": -7.036158561706543, "global_step": 168926, "epoch": 4022} {"train_loss": -6.943902492523193, "global_step": 168927, "epoch": 4022} {"train_loss": -7.1655449867248535, "global_step": 168928, "epoch": 4022} {"train_loss": -6.943159103393555, "global_step": 168929, "epoch": 4022} {"train_loss": -7.0311737060546875, "global_step": 168930, "epoch": 4022} {"train_loss": -7.066194534301758, "global_step": 168931, "epoch": 4022} {"train_loss": -7.0491743087768555, "global_step": 168932, "epoch": 4022} {"train_loss": -7.1200032234191895, "global_step": 168933, "epoch": 4022} {"train_loss": -7.019927978515625, "global_step": 168934, "epoch": 4022} {"train_loss": -6.913565635681152, "global_step": 168935, "epoch": 4022} {"train_loss": -7.044388294219971, "global_step": 168936, "epoch": 4022} {"train_loss": -7.165977478027344, "global_step": 168937, "epoch": 4022} {"train_loss": -7.053281784057617, "global_step": 168938, "epoch": 4022} {"train_loss": -7.1708455085754395, "global_step": 168939, "epoch": 4022} {"train_loss": -6.948223114013672, "global_step": 168940, "epoch": 4022} {"train_loss": -7.11198616027832, "global_step": 168941, "epoch": 4022} {"train_loss": -7.048862934112549, "global_step": 168942, "epoch": 4022} {"train_loss": -7.049766540527344, "global_step": 168943, "epoch": 4022} {"train_loss": -7.061934947967529, "global_step": 168944, "epoch": 4022} {"train_loss": -7.006462097167969, "global_step": 168945, "epoch": 4022} {"train_loss": -7.009156227111816, "global_step": 168946, "epoch": 4022} {"train_loss": -7.130263328552246, "global_step": 168947, "epoch": 4022} {"train_loss": -7.07419490814209, "global_step": 168948, "epoch": 4022} {"train_loss": -7.041207313537598, "global_step": 168949, "epoch": 4022} {"train_loss": -7.106106758117676, "global_step": 168950, "epoch": 4022} {"train_loss": -7.099429130554199, "global_step": 168951, "epoch": 4022} {"train_loss": -7.116955757141113, "global_step": 168952, "epoch": 4022} {"train_loss": -7.090236186981201, "global_step": 168953, "epoch": 4022} {"train_loss": -7.133910655975342, "global_step": 168954, "epoch": 4022} {"train_loss": -7.115170478820801, "global_step": 168955, "epoch": 4022} {"train_loss": -7.044842720031738, "global_step": 168956, "epoch": 4022} {"train_loss": -7.143244743347168, "global_step": 168957, "epoch": 4022} {"train_loss": -7.1320929527282715, "global_step": 168958, "epoch": 4022} {"train_loss": -7.128935813903809, "global_step": 168959, "epoch": 4022} {"train_loss": -7.114367485046387, "global_step": 168960, "epoch": 4022} {"train_loss": -7.001868724822998, "global_step": 168961, "epoch": 4022} {"train_loss": -7.128944396972656, "global_step": 168962, "epoch": 4022} {"train_loss": -7.211438179016113, "global_step": 168963, "epoch": 4022} {"train_loss": -7.074099063873291, "global_step": 168964, "epoch": 4022} {"train_loss": -7.0717840648832775, "global_step": 168965, "epoch": 4022, "val_loss": 68993.78125} {"train_loss": -7.147943019866943, "global_step": 168966, "epoch": 4023} {"train_loss": -7.082122325897217, "global_step": 168967, "epoch": 4023} {"train_loss": -7.149893760681152, "global_step": 168968, "epoch": 4023} {"train_loss": -7.209922790527344, "global_step": 168969, "epoch": 4023} {"train_loss": -6.9943766593933105, "global_step": 168970, "epoch": 4023} {"train_loss": -7.1108832359313965, "global_step": 168971, "epoch": 4023} {"train_loss": -7.023542404174805, "global_step": 168972, "epoch": 4023} {"train_loss": -7.069823265075684, "global_step": 168973, "epoch": 4023} {"train_loss": -7.170797348022461, "global_step": 168974, "epoch": 4023} {"train_loss": -7.244840621948242, "global_step": 168975, "epoch": 4023} {"train_loss": -7.037688255310059, "global_step": 168976, "epoch": 4023} {"train_loss": -7.02640438079834, "global_step": 168977, "epoch": 4023} {"train_loss": -7.12858772277832, "global_step": 168978, "epoch": 4023} {"train_loss": -7.183248519897461, "global_step": 168979, "epoch": 4023} {"train_loss": -7.026020050048828, "global_step": 168980, "epoch": 4023} {"train_loss": -7.072413921356201, "global_step": 168981, "epoch": 4023} {"train_loss": -7.068288326263428, "global_step": 168982, "epoch": 4023} {"train_loss": -7.013038635253906, "global_step": 168983, "epoch": 4023} {"train_loss": -6.976629734039307, "global_step": 168984, "epoch": 4023} {"train_loss": -7.070345401763916, "global_step": 168985, "epoch": 4023} {"train_loss": -7.12211799621582, "global_step": 168986, "epoch": 4023} {"train_loss": -7.13897705078125, "global_step": 168987, "epoch": 4023} {"train_loss": -6.957406044006348, "global_step": 168988, "epoch": 4023} {"train_loss": -7.015087127685547, "global_step": 168989, "epoch": 4023} {"train_loss": -7.009539604187012, "global_step": 168990, "epoch": 4023} {"train_loss": -7.0549468994140625, "global_step": 168991, "epoch": 4023} {"train_loss": -6.995868682861328, "global_step": 168992, "epoch": 4023} {"train_loss": -7.060308933258057, "global_step": 168993, "epoch": 4023} {"train_loss": -7.178142547607422, "global_step": 168994, "epoch": 4023} {"train_loss": -6.99109411239624, "global_step": 168995, "epoch": 4023} {"train_loss": -6.962773323059082, "global_step": 168996, "epoch": 4023} {"train_loss": -6.931788921356201, "global_step": 168997, "epoch": 4023} {"train_loss": -6.99551248550415, "global_step": 168998, "epoch": 4023} {"train_loss": -7.006569862365723, "global_step": 168999, "epoch": 4023} {"train_loss": -7.010221004486084, "global_step": 169000, "epoch": 4023} {"train_loss": -6.924106597900391, "global_step": 169001, "epoch": 4023} {"train_loss": -6.946264266967773, "global_step": 169002, "epoch": 4023} {"train_loss": -6.925276279449463, "global_step": 169003, "epoch": 4023} {"train_loss": -6.976330757141113, "global_step": 169004, "epoch": 4023} {"train_loss": -6.996656894683838, "global_step": 169005, "epoch": 4023} {"train_loss": -6.808384895324707, "global_step": 169006, "epoch": 4023} {"train_loss": -7.041922433035714, "global_step": 169007, "epoch": 4023, "val_loss": 68818.0390625} {"train_loss": -6.866332530975342, "global_step": 169008, "epoch": 4024} {"train_loss": -6.91793155670166, "global_step": 169009, "epoch": 4024} {"train_loss": -7.012677192687988, "global_step": 169010, "epoch": 4024} {"train_loss": -6.91017484664917, "global_step": 169011, "epoch": 4024} {"train_loss": -6.952086448669434, "global_step": 169012, "epoch": 4024} {"train_loss": -6.806270122528076, "global_step": 169013, "epoch": 4024} {"train_loss": -6.993957996368408, "global_step": 169014, "epoch": 4024} {"train_loss": -6.910580158233643, "global_step": 169015, "epoch": 4024} {"train_loss": -7.044242858886719, "global_step": 169016, "epoch": 4024} {"train_loss": -6.948712348937988, "global_step": 169017, "epoch": 4024} {"train_loss": -6.986548900604248, "global_step": 169018, "epoch": 4024} {"train_loss": -6.992728233337402, "global_step": 169019, "epoch": 4024} {"train_loss": -7.0330305099487305, "global_step": 169020, "epoch": 4024} {"train_loss": -6.8732452392578125, "global_step": 169021, "epoch": 4024} {"train_loss": -6.973523139953613, "global_step": 169022, "epoch": 4024} {"train_loss": -6.912940979003906, "global_step": 169023, "epoch": 4024} {"train_loss": -6.974616050720215, "global_step": 169024, "epoch": 4024} {"train_loss": -6.937183856964111, "global_step": 169025, "epoch": 4024} {"train_loss": -7.019940376281738, "global_step": 169026, "epoch": 4024} {"train_loss": -6.997705459594727, "global_step": 169027, "epoch": 4024} {"train_loss": -6.865258693695068, "global_step": 169028, "epoch": 4024} {"train_loss": -6.868056774139404, "global_step": 169029, "epoch": 4024} {"train_loss": -6.9266133308410645, "global_step": 169030, "epoch": 4024} {"train_loss": -6.984066963195801, "global_step": 169031, "epoch": 4024} {"train_loss": -6.973601341247559, "global_step": 169032, "epoch": 4024} {"train_loss": -6.944859504699707, "global_step": 169033, "epoch": 4024} {"train_loss": -7.044173717498779, "global_step": 169034, "epoch": 4024} {"train_loss": -6.943389892578125, "global_step": 169035, "epoch": 4024} {"train_loss": -7.0069427490234375, "global_step": 169036, "epoch": 4024} {"train_loss": -6.953686714172363, "global_step": 169037, "epoch": 4024} {"train_loss": -6.993133544921875, "global_step": 169038, "epoch": 4024} {"train_loss": -7.119171142578125, "global_step": 169039, "epoch": 4024} {"train_loss": -6.98201847076416, "global_step": 169040, "epoch": 4024} {"train_loss": -7.0070295333862305, "global_step": 169041, "epoch": 4024} {"train_loss": -7.089658737182617, "global_step": 169042, "epoch": 4024} {"train_loss": -7.073688983917236, "global_step": 169043, "epoch": 4024} {"train_loss": -7.051791667938232, "global_step": 169044, "epoch": 4024} {"train_loss": -7.006307601928711, "global_step": 169045, "epoch": 4024} {"train_loss": -6.990630149841309, "global_step": 169046, "epoch": 4024} {"train_loss": -7.084968566894531, "global_step": 169047, "epoch": 4024} {"train_loss": -7.032999038696289, "global_step": 169048, "epoch": 4024} {"train_loss": -6.97655523390997, "global_step": 169049, "epoch": 4024, "val_loss": 68986.7578125} {"train_loss": -7.167670726776123, "global_step": 169050, "epoch": 4025} {"train_loss": -7.034647464752197, "global_step": 169051, "epoch": 4025} {"train_loss": -7.006453514099121, "global_step": 169052, "epoch": 4025} {"train_loss": -7.211344242095947, "global_step": 169053, "epoch": 4025} {"train_loss": -6.962177276611328, "global_step": 169054, "epoch": 4025} {"train_loss": -7.0929059982299805, "global_step": 169055, "epoch": 4025} {"train_loss": -7.015133380889893, "global_step": 169056, "epoch": 4025} {"train_loss": -6.9745683670043945, "global_step": 169057, "epoch": 4025} {"train_loss": -6.971516132354736, "global_step": 169058, "epoch": 4025} {"train_loss": -7.000282287597656, "global_step": 169059, "epoch": 4025} {"train_loss": -7.070542812347412, "global_step": 169060, "epoch": 4025} {"train_loss": -7.007406234741211, "global_step": 169061, "epoch": 4025} {"train_loss": -7.038503646850586, "global_step": 169062, "epoch": 4025} {"train_loss": -6.976698875427246, "global_step": 169063, "epoch": 4025} {"train_loss": -7.017312526702881, "global_step": 169064, "epoch": 4025} {"train_loss": -7.166992664337158, "global_step": 169065, "epoch": 4025} {"train_loss": -7.070188522338867, "global_step": 169066, "epoch": 4025} {"train_loss": -7.099407196044922, "global_step": 169067, "epoch": 4025} {"train_loss": -7.08942174911499, "global_step": 169068, "epoch": 4025} {"train_loss": -7.145350456237793, "global_step": 169069, "epoch": 4025} {"train_loss": -7.162951946258545, "global_step": 169070, "epoch": 4025} {"train_loss": -7.063156604766846, "global_step": 169071, "epoch": 4025} {"train_loss": -6.951040267944336, "global_step": 169072, "epoch": 4025} {"train_loss": -7.013053894042969, "global_step": 169073, "epoch": 4025} {"train_loss": -7.112309455871582, "global_step": 169074, "epoch": 4025} {"train_loss": -6.999031066894531, "global_step": 169075, "epoch": 4025} {"train_loss": -7.062412261962891, "global_step": 169076, "epoch": 4025} {"train_loss": -7.122098445892334, "global_step": 169077, "epoch": 4025} {"train_loss": -6.99815559387207, "global_step": 169078, "epoch": 4025} {"train_loss": -7.132720947265625, "global_step": 169079, "epoch": 4025} {"train_loss": -6.906142711639404, "global_step": 169080, "epoch": 4025} {"train_loss": -7.029016494750977, "global_step": 169081, "epoch": 4025} {"train_loss": -7.156036853790283, "global_step": 169082, "epoch": 4025} {"train_loss": -6.903243541717529, "global_step": 169083, "epoch": 4025} {"train_loss": -6.897177696228027, "global_step": 169084, "epoch": 4025} {"train_loss": -7.008091926574707, "global_step": 169085, "epoch": 4025} {"train_loss": -7.037075996398926, "global_step": 169086, "epoch": 4025} {"train_loss": -7.200259208679199, "global_step": 169087, "epoch": 4025} {"train_loss": -7.047934532165527, "global_step": 169088, "epoch": 4025} {"train_loss": -7.012565612792969, "global_step": 169089, "epoch": 4025} {"train_loss": -7.096628189086914, "global_step": 169090, "epoch": 4025} {"train_loss": -7.049067871911185, "global_step": 169091, "epoch": 4025, "val_loss": 68936.2890625} {"train_loss": -7.013669967651367, "global_step": 169092, "epoch": 4026} {"train_loss": -6.996743202209473, "global_step": 169093, "epoch": 4026} {"train_loss": -7.177924156188965, "global_step": 169094, "epoch": 4026} {"train_loss": -7.055747032165527, "global_step": 169095, "epoch": 4026} {"train_loss": -7.1270904541015625, "global_step": 169096, "epoch": 4026} {"train_loss": -6.978532314300537, "global_step": 169097, "epoch": 4026} {"train_loss": -7.124588966369629, "global_step": 169098, "epoch": 4026} {"train_loss": -7.100040912628174, "global_step": 169099, "epoch": 4026} {"train_loss": -7.073402404785156, "global_step": 169100, "epoch": 4026} {"train_loss": -7.040605068206787, "global_step": 169101, "epoch": 4026} {"train_loss": -7.072513580322266, "global_step": 169102, "epoch": 4026} {"train_loss": -6.9941935539245605, "global_step": 169103, "epoch": 4026} {"train_loss": -7.1483564376831055, "global_step": 169104, "epoch": 4026} {"train_loss": -7.051539897918701, "global_step": 169105, "epoch": 4026} {"train_loss": -7.073720932006836, "global_step": 169106, "epoch": 4026} {"train_loss": -7.014192581176758, "global_step": 169107, "epoch": 4026} {"train_loss": -7.050480842590332, "global_step": 169108, "epoch": 4026} {"train_loss": -7.200718402862549, "global_step": 169109, "epoch": 4026} {"train_loss": -7.083686828613281, "global_step": 169110, "epoch": 4026} {"train_loss": -7.0412821769714355, "global_step": 169111, "epoch": 4026} {"train_loss": -7.160437107086182, "global_step": 169112, "epoch": 4026} {"train_loss": -6.997560501098633, "global_step": 169113, "epoch": 4026} {"train_loss": -7.020495891571045, "global_step": 169114, "epoch": 4026} {"train_loss": -7.095239639282227, "global_step": 169115, "epoch": 4026} {"train_loss": -6.96513032913208, "global_step": 169116, "epoch": 4026} {"train_loss": -6.996218681335449, "global_step": 169117, "epoch": 4026} {"train_loss": -7.094146728515625, "global_step": 169118, "epoch": 4026} {"train_loss": -7.041010856628418, "global_step": 169119, "epoch": 4026} {"train_loss": -7.019496917724609, "global_step": 169120, "epoch": 4026} {"train_loss": -6.919587135314941, "global_step": 169121, "epoch": 4026} {"train_loss": -7.048467636108398, "global_step": 169122, "epoch": 4026} {"train_loss": -7.061620235443115, "global_step": 169123, "epoch": 4026} {"train_loss": -7.0520477294921875, "global_step": 169124, "epoch": 4026} {"train_loss": -6.964343070983887, "global_step": 169125, "epoch": 4026} {"train_loss": -7.065096378326416, "global_step": 169126, "epoch": 4026} {"train_loss": -6.914655685424805, "global_step": 169127, "epoch": 4026} {"train_loss": -7.092621803283691, "global_step": 169128, "epoch": 4026} {"train_loss": -6.905366897583008, "global_step": 169129, "epoch": 4026} {"train_loss": -7.099532604217529, "global_step": 169130, "epoch": 4026} {"train_loss": -7.103417873382568, "global_step": 169131, "epoch": 4026} {"train_loss": -7.061253547668457, "global_step": 169132, "epoch": 4026} {"train_loss": -7.050606421061924, "global_step": 169133, "epoch": 4026, "val_loss": 68838.0078125} {"train_loss": -7.0088605880737305, "global_step": 169134, "epoch": 4027} {"train_loss": -7.05265998840332, "global_step": 169135, "epoch": 4027} {"train_loss": -7.1083526611328125, "global_step": 169136, "epoch": 4027} {"train_loss": -7.035543441772461, "global_step": 169137, "epoch": 4027} {"train_loss": -7.018383026123047, "global_step": 169138, "epoch": 4027} {"train_loss": -6.9935173988342285, "global_step": 169139, "epoch": 4027} {"train_loss": -7.0179033279418945, "global_step": 169140, "epoch": 4027} {"train_loss": -6.906421661376953, "global_step": 169141, "epoch": 4027} {"train_loss": -7.02606201171875, "global_step": 169142, "epoch": 4027} {"train_loss": -6.813967704772949, "global_step": 169143, "epoch": 4027} {"train_loss": -6.979612350463867, "global_step": 169144, "epoch": 4027} {"train_loss": -7.017637729644775, "global_step": 169145, "epoch": 4027} {"train_loss": -6.884269714355469, "global_step": 169146, "epoch": 4027} {"train_loss": -6.912707805633545, "global_step": 169147, "epoch": 4027} {"train_loss": -6.991154670715332, "global_step": 169148, "epoch": 4027} {"train_loss": -6.926641464233398, "global_step": 169149, "epoch": 4027} {"train_loss": -6.895195007324219, "global_step": 169150, "epoch": 4027} {"train_loss": -6.914243698120117, "global_step": 169151, "epoch": 4027} {"train_loss": -6.981485366821289, "global_step": 169152, "epoch": 4027} {"train_loss": -6.862102031707764, "global_step": 169153, "epoch": 4027} {"train_loss": -7.031185150146484, "global_step": 169154, "epoch": 4027} {"train_loss": -7.0013346672058105, "global_step": 169155, "epoch": 4027} {"train_loss": -6.932550430297852, "global_step": 169156, "epoch": 4027} {"train_loss": -6.985235691070557, "global_step": 169157, "epoch": 4027} {"train_loss": -6.857187271118164, "global_step": 169158, "epoch": 4027} {"train_loss": -6.984724044799805, "global_step": 169159, "epoch": 4027} {"train_loss": -6.950930118560791, "global_step": 169160, "epoch": 4027} {"train_loss": -7.021537780761719, "global_step": 169161, "epoch": 4027} {"train_loss": -7.027411460876465, "global_step": 169162, "epoch": 4027} {"train_loss": -6.905423164367676, "global_step": 169163, "epoch": 4027} {"train_loss": -6.986234664916992, "global_step": 169164, "epoch": 4027} {"train_loss": -6.932991981506348, "global_step": 169165, "epoch": 4027} {"train_loss": -7.008975505828857, "global_step": 169166, "epoch": 4027} {"train_loss": -7.005779266357422, "global_step": 169167, "epoch": 4027} {"train_loss": -6.863778114318848, "global_step": 169168, "epoch": 4027} {"train_loss": -7.0116167068481445, "global_step": 169169, "epoch": 4027} {"train_loss": -7.00345516204834, "global_step": 169170, "epoch": 4027} {"train_loss": -6.907879829406738, "global_step": 169171, "epoch": 4027} {"train_loss": -7.064210414886475, "global_step": 169172, "epoch": 4027} {"train_loss": -6.906171798706055, "global_step": 169173, "epoch": 4027} {"train_loss": -6.992936134338379, "global_step": 169174, "epoch": 4027} {"train_loss": -6.967325233277821, "global_step": 169175, "epoch": 4027, "val_loss": 69052.6171875} {"train_loss": -6.9218878746032715, "global_step": 169176, "epoch": 4028} {"train_loss": -6.887957572937012, "global_step": 169177, "epoch": 4028} {"train_loss": -6.9526872634887695, "global_step": 169178, "epoch": 4028} {"train_loss": -7.072531700134277, "global_step": 169179, "epoch": 4028} {"train_loss": -6.909562110900879, "global_step": 169180, "epoch": 4028} {"train_loss": -6.968081474304199, "global_step": 169181, "epoch": 4028} {"train_loss": -6.868747711181641, "global_step": 169182, "epoch": 4028} {"train_loss": -6.849608421325684, "global_step": 169183, "epoch": 4028} {"train_loss": -6.9498796463012695, "global_step": 169184, "epoch": 4028} {"train_loss": -6.893828392028809, "global_step": 169185, "epoch": 4028} {"train_loss": -6.977478504180908, "global_step": 169186, "epoch": 4028} {"train_loss": -6.987264633178711, "global_step": 169187, "epoch": 4028} {"train_loss": -7.024491310119629, "global_step": 169188, "epoch": 4028} {"train_loss": -6.994605541229248, "global_step": 169189, "epoch": 4028} {"train_loss": -6.986212253570557, "global_step": 169190, "epoch": 4028} {"train_loss": -7.022891998291016, "global_step": 169191, "epoch": 4028} {"train_loss": -7.028067588806152, "global_step": 169192, "epoch": 4028} {"train_loss": -7.0504841804504395, "global_step": 169193, "epoch": 4028} {"train_loss": -7.0046539306640625, "global_step": 169194, "epoch": 4028} {"train_loss": -6.957681655883789, "global_step": 169195, "epoch": 4028} {"train_loss": -7.0394721031188965, "global_step": 169196, "epoch": 4028} {"train_loss": -6.957582473754883, "global_step": 169197, "epoch": 4028} {"train_loss": -7.156072616577148, "global_step": 169198, "epoch": 4028} {"train_loss": -7.007316589355469, "global_step": 169199, "epoch": 4028} {"train_loss": -7.005618095397949, "global_step": 169200, "epoch": 4028} {"train_loss": -7.161950588226318, "global_step": 169201, "epoch": 4028} {"train_loss": -7.085033416748047, "global_step": 169202, "epoch": 4028} {"train_loss": -7.028090953826904, "global_step": 169203, "epoch": 4028} {"train_loss": -7.022488594055176, "global_step": 169204, "epoch": 4028} {"train_loss": -7.039952278137207, "global_step": 169205, "epoch": 4028} {"train_loss": -7.044030666351318, "global_step": 169206, "epoch": 4028} {"train_loss": -6.9402546882629395, "global_step": 169207, "epoch": 4028} {"train_loss": -6.944058895111084, "global_step": 169208, "epoch": 4028} {"train_loss": -6.959015846252441, "global_step": 169209, "epoch": 4028} {"train_loss": -6.971894264221191, "global_step": 169210, "epoch": 4028} {"train_loss": -6.9487409591674805, "global_step": 169211, "epoch": 4028} {"train_loss": -7.019384384155273, "global_step": 169212, "epoch": 4028} {"train_loss": -6.819118499755859, "global_step": 169213, "epoch": 4028} {"train_loss": -7.060002326965332, "global_step": 169214, "epoch": 4028} {"train_loss": -7.036740303039551, "global_step": 169215, "epoch": 4028} {"train_loss": -6.878985404968262, "global_step": 169216, "epoch": 4028} {"train_loss": -6.98710678872608, "global_step": 169217, "epoch": 4028, "val_loss": 69038.5390625} {"train_loss": -7.011174201965332, "global_step": 169218, "epoch": 4029} {"train_loss": -6.944931983947754, "global_step": 169219, "epoch": 4029} {"train_loss": -7.059178829193115, "global_step": 169220, "epoch": 4029} {"train_loss": -6.890551567077637, "global_step": 169221, "epoch": 4029} {"train_loss": -7.0553693771362305, "global_step": 169222, "epoch": 4029} {"train_loss": -6.939003944396973, "global_step": 169223, "epoch": 4029} {"train_loss": -6.931197643280029, "global_step": 169224, "epoch": 4029} {"train_loss": -6.922882080078125, "global_step": 169225, "epoch": 4029} {"train_loss": -6.934972763061523, "global_step": 169226, "epoch": 4029} {"train_loss": -7.147989273071289, "global_step": 169227, "epoch": 4029} {"train_loss": -6.943188190460205, "global_step": 169228, "epoch": 4029} {"train_loss": -7.050411224365234, "global_step": 169229, "epoch": 4029} {"train_loss": -6.973844051361084, "global_step": 169230, "epoch": 4029} {"train_loss": -7.017159461975098, "global_step": 169231, "epoch": 4029} {"train_loss": -7.15789270401001, "global_step": 169232, "epoch": 4029} {"train_loss": -6.918045997619629, "global_step": 169233, "epoch": 4029} {"train_loss": -6.86363410949707, "global_step": 169234, "epoch": 4029} {"train_loss": -7.043412208557129, "global_step": 169235, "epoch": 4029} {"train_loss": -6.921909332275391, "global_step": 169236, "epoch": 4029} {"train_loss": -7.042309761047363, "global_step": 169237, "epoch": 4029} {"train_loss": -7.057921409606934, "global_step": 169238, "epoch": 4029} {"train_loss": -6.92258882522583, "global_step": 169239, "epoch": 4029} {"train_loss": -6.924896240234375, "global_step": 169240, "epoch": 4029} {"train_loss": -7.065145492553711, "global_step": 169241, "epoch": 4029} {"train_loss": -6.9699201583862305, "global_step": 169242, "epoch": 4029} {"train_loss": -7.126909255981445, "global_step": 169243, "epoch": 4029} {"train_loss": -7.096001625061035, "global_step": 169244, "epoch": 4029} {"train_loss": -7.136363506317139, "global_step": 169245, "epoch": 4029} {"train_loss": -7.065232276916504, "global_step": 169246, "epoch": 4029} {"train_loss": -6.9459028244018555, "global_step": 169247, "epoch": 4029} {"train_loss": -7.079480171203613, "global_step": 169248, "epoch": 4029} {"train_loss": -7.041829586029053, "global_step": 169249, "epoch": 4029} {"train_loss": -7.0138654708862305, "global_step": 169250, "epoch": 4029} {"train_loss": -6.974160194396973, "global_step": 169251, "epoch": 4029} {"train_loss": -6.955371856689453, "global_step": 169252, "epoch": 4029} {"train_loss": -6.955591678619385, "global_step": 169253, "epoch": 4029} {"train_loss": -7.011099815368652, "global_step": 169254, "epoch": 4029} {"train_loss": -6.881119728088379, "global_step": 169255, "epoch": 4029} {"train_loss": -6.924919128417969, "global_step": 169256, "epoch": 4029} {"train_loss": -7.009383678436279, "global_step": 169257, "epoch": 4029} {"train_loss": -6.993330001831055, "global_step": 169258, "epoch": 4029} {"train_loss": -6.999410958517165, "global_step": 169259, "epoch": 4029, "val_loss": 69025.4453125} {"train_loss": -6.952958106994629, "global_step": 169260, "epoch": 4030} {"train_loss": -6.9770917892456055, "global_step": 169261, "epoch": 4030} {"train_loss": -6.987822532653809, "global_step": 169262, "epoch": 4030} {"train_loss": -6.909789562225342, "global_step": 169263, "epoch": 4030} {"train_loss": -7.144661903381348, "global_step": 169264, "epoch": 4030} {"train_loss": -7.080507278442383, "global_step": 169265, "epoch": 4030} {"train_loss": -7.0212602615356445, "global_step": 169266, "epoch": 4030} {"train_loss": -6.961493015289307, "global_step": 169267, "epoch": 4030} {"train_loss": -7.068436622619629, "global_step": 169268, "epoch": 4030} {"train_loss": -6.92408561706543, "global_step": 169269, "epoch": 4030} {"train_loss": -7.057322025299072, "global_step": 169270, "epoch": 4030} {"train_loss": -6.974913120269775, "global_step": 169271, "epoch": 4030} {"train_loss": -6.841121196746826, "global_step": 169272, "epoch": 4030} {"train_loss": -6.975954532623291, "global_step": 169273, "epoch": 4030} {"train_loss": -6.866881370544434, "global_step": 169274, "epoch": 4030} {"train_loss": -6.8856072425842285, "global_step": 169275, "epoch": 4030} {"train_loss": -7.079509735107422, "global_step": 169276, "epoch": 4030} {"train_loss": -6.991561412811279, "global_step": 169277, "epoch": 4030} {"train_loss": -7.043768882751465, "global_step": 169278, "epoch": 4030} {"train_loss": -7.15828800201416, "global_step": 169279, "epoch": 4030} {"train_loss": -7.071022033691406, "global_step": 169280, "epoch": 4030} {"train_loss": -7.016287803649902, "global_step": 169281, "epoch": 4030} {"train_loss": -7.045758247375488, "global_step": 169282, "epoch": 4030} {"train_loss": -7.03305721282959, "global_step": 169283, "epoch": 4030} {"train_loss": -7.020995140075684, "global_step": 169284, "epoch": 4030} {"train_loss": -6.971347808837891, "global_step": 169285, "epoch": 4030} {"train_loss": -6.961267948150635, "global_step": 169286, "epoch": 4030} {"train_loss": -6.970337867736816, "global_step": 169287, "epoch": 4030} {"train_loss": -7.04176139831543, "global_step": 169288, "epoch": 4030} {"train_loss": -7.140671730041504, "global_step": 169289, "epoch": 4030} {"train_loss": -7.081454753875732, "global_step": 169290, "epoch": 4030} {"train_loss": -7.001770496368408, "global_step": 169291, "epoch": 4030} {"train_loss": -7.104144096374512, "global_step": 169292, "epoch": 4030} {"train_loss": -7.083295822143555, "global_step": 169293, "epoch": 4030} {"train_loss": -7.047137260437012, "global_step": 169294, "epoch": 4030} {"train_loss": -7.073145389556885, "global_step": 169295, "epoch": 4030} {"train_loss": -7.095750331878662, "global_step": 169296, "epoch": 4030} {"train_loss": -7.003739833831787, "global_step": 169297, "epoch": 4030} {"train_loss": -6.97171688079834, "global_step": 169298, "epoch": 4030} {"train_loss": -6.978719234466553, "global_step": 169299, "epoch": 4030} {"train_loss": -6.94183349609375, "global_step": 169300, "epoch": 4030} {"train_loss": -7.013999689192999, "global_step": 169301, "epoch": 4030, "val_loss": 68956.609375} {"train_loss": -7.08278226852417, "global_step": 169302, "epoch": 4031} {"train_loss": -6.949686527252197, "global_step": 169303, "epoch": 4031} {"train_loss": -7.101500511169434, "global_step": 169304, "epoch": 4031} {"train_loss": -7.041419982910156, "global_step": 169305, "epoch": 4031} {"train_loss": -6.902078628540039, "global_step": 169306, "epoch": 4031} {"train_loss": -7.1676435470581055, "global_step": 169307, "epoch": 4031} {"train_loss": -7.115612030029297, "global_step": 169308, "epoch": 4031} {"train_loss": -7.011651992797852, "global_step": 169309, "epoch": 4031} {"train_loss": -7.034037113189697, "global_step": 169310, "epoch": 4031} {"train_loss": -6.999459266662598, "global_step": 169311, "epoch": 4031} {"train_loss": -7.072047710418701, "global_step": 169312, "epoch": 4031} {"train_loss": -7.150077819824219, "global_step": 169313, "epoch": 4031} {"train_loss": -7.033659934997559, "global_step": 169314, "epoch": 4031} {"train_loss": -7.051826477050781, "global_step": 169315, "epoch": 4031} {"train_loss": -7.009862899780273, "global_step": 169316, "epoch": 4031} {"train_loss": -7.082878589630127, "global_step": 169317, "epoch": 4031} {"train_loss": -6.946674346923828, "global_step": 169318, "epoch": 4031} {"train_loss": -6.973447322845459, "global_step": 169319, "epoch": 4031} {"train_loss": -6.991972923278809, "global_step": 169320, "epoch": 4031} {"train_loss": -6.957862377166748, "global_step": 169321, "epoch": 4031} {"train_loss": -6.9344377517700195, "global_step": 169322, "epoch": 4031} {"train_loss": -6.968415260314941, "global_step": 169323, "epoch": 4031} {"train_loss": -7.02207612991333, "global_step": 169324, "epoch": 4031} {"train_loss": -6.966026306152344, "global_step": 169325, "epoch": 4031} {"train_loss": -7.00396203994751, "global_step": 169326, "epoch": 4031} {"train_loss": -6.938859462738037, "global_step": 169327, "epoch": 4031} {"train_loss": -6.986544609069824, "global_step": 169328, "epoch": 4031} {"train_loss": -7.026893138885498, "global_step": 169329, "epoch": 4031} {"train_loss": -6.981624603271484, "global_step": 169330, "epoch": 4031} {"train_loss": -6.995959281921387, "global_step": 169331, "epoch": 4031} {"train_loss": -7.103139400482178, "global_step": 169332, "epoch": 4031} {"train_loss": -7.023534774780273, "global_step": 169333, "epoch": 4031} {"train_loss": -7.085369110107422, "global_step": 169334, "epoch": 4031} {"train_loss": -7.072494029998779, "global_step": 169335, "epoch": 4031} {"train_loss": -7.047774791717529, "global_step": 169336, "epoch": 4031} {"train_loss": -7.003786087036133, "global_step": 169337, "epoch": 4031} {"train_loss": -7.061969757080078, "global_step": 169338, "epoch": 4031} {"train_loss": -6.799274444580078, "global_step": 169339, "epoch": 4031} {"train_loss": -6.963774681091309, "global_step": 169340, "epoch": 4031} {"train_loss": -7.031682014465332, "global_step": 169341, "epoch": 4031} {"train_loss": -6.967742443084717, "global_step": 169342, "epoch": 4031} {"train_loss": -7.014595360982986, "global_step": 169343, "epoch": 4031, "val_loss": 69107.5390625} {"train_loss": -7.03688383102417, "global_step": 169344, "epoch": 4032} {"train_loss": -6.923427581787109, "global_step": 169345, "epoch": 4032} {"train_loss": -7.062802791595459, "global_step": 169346, "epoch": 4032} {"train_loss": -7.127019882202148, "global_step": 169347, "epoch": 4032} {"train_loss": -6.957761764526367, "global_step": 169348, "epoch": 4032} {"train_loss": -7.064153671264648, "global_step": 169349, "epoch": 4032} {"train_loss": -7.0905585289001465, "global_step": 169350, "epoch": 4032} {"train_loss": -7.021665096282959, "global_step": 169351, "epoch": 4032} {"train_loss": -6.883816242218018, "global_step": 169352, "epoch": 4032} {"train_loss": -7.062248706817627, "global_step": 169353, "epoch": 4032} {"train_loss": -6.9473137855529785, "global_step": 169354, "epoch": 4032} {"train_loss": -6.918534278869629, "global_step": 169355, "epoch": 4032} {"train_loss": -6.94529914855957, "global_step": 169356, "epoch": 4032} {"train_loss": -6.964659690856934, "global_step": 169357, "epoch": 4032} {"train_loss": -6.918952941894531, "global_step": 169358, "epoch": 4032} {"train_loss": -7.0558271408081055, "global_step": 169359, "epoch": 4032} {"train_loss": -6.927849292755127, "global_step": 169360, "epoch": 4032} {"train_loss": -7.024949073791504, "global_step": 169361, "epoch": 4032} {"train_loss": -7.072583198547363, "global_step": 169362, "epoch": 4032} {"train_loss": -7.04661226272583, "global_step": 169363, "epoch": 4032} {"train_loss": -7.008092403411865, "global_step": 169364, "epoch": 4032} {"train_loss": -6.840781211853027, "global_step": 169365, "epoch": 4032} {"train_loss": -6.999812602996826, "global_step": 169366, "epoch": 4032} {"train_loss": -6.917721271514893, "global_step": 169367, "epoch": 4032} {"train_loss": -6.966209411621094, "global_step": 169368, "epoch": 4032} {"train_loss": -6.99973201751709, "global_step": 169369, "epoch": 4032} {"train_loss": -6.981259346008301, "global_step": 169370, "epoch": 4032} {"train_loss": -7.055169105529785, "global_step": 169371, "epoch": 4032} {"train_loss": -6.963534832000732, "global_step": 169372, "epoch": 4032} {"train_loss": -7.051834583282471, "global_step": 169373, "epoch": 4032} {"train_loss": -7.015406131744385, "global_step": 169374, "epoch": 4032} {"train_loss": -6.923877716064453, "global_step": 169375, "epoch": 4032} {"train_loss": -6.946442604064941, "global_step": 169376, "epoch": 4032} {"train_loss": -7.065718650817871, "global_step": 169377, "epoch": 4032} {"train_loss": -6.998645782470703, "global_step": 169378, "epoch": 4032} {"train_loss": -6.946950912475586, "global_step": 169379, "epoch": 4032} {"train_loss": -7.011795997619629, "global_step": 169380, "epoch": 4032} {"train_loss": -6.874080657958984, "global_step": 169381, "epoch": 4032} {"train_loss": -7.040299892425537, "global_step": 169382, "epoch": 4032} {"train_loss": -7.046785354614258, "global_step": 169383, "epoch": 4032} {"train_loss": -7.062448024749756, "global_step": 169384, "epoch": 4032} {"train_loss": -6.996481009892055, "global_step": 169385, "epoch": 4032, "val_loss": 68854.765625} {"train_loss": -6.964422225952148, "global_step": 169386, "epoch": 4033} {"train_loss": -6.99139404296875, "global_step": 169387, "epoch": 4033} {"train_loss": -7.043267250061035, "global_step": 169388, "epoch": 4033} {"train_loss": -6.955135345458984, "global_step": 169389, "epoch": 4033} {"train_loss": -7.060595989227295, "global_step": 169390, "epoch": 4033} {"train_loss": -6.956298351287842, "global_step": 169391, "epoch": 4033} {"train_loss": -7.006149768829346, "global_step": 169392, "epoch": 4033} {"train_loss": -6.966906547546387, "global_step": 169393, "epoch": 4033} {"train_loss": -6.976626873016357, "global_step": 169394, "epoch": 4033} {"train_loss": -6.980868816375732, "global_step": 169395, "epoch": 4033} {"train_loss": -6.994076728820801, "global_step": 169396, "epoch": 4033} {"train_loss": -7.071248531341553, "global_step": 169397, "epoch": 4033} {"train_loss": -7.021323204040527, "global_step": 169398, "epoch": 4033} {"train_loss": -7.018424987792969, "global_step": 169399, "epoch": 4033} {"train_loss": -6.961655616760254, "global_step": 169400, "epoch": 4033} {"train_loss": -7.083181858062744, "global_step": 169401, "epoch": 4033} {"train_loss": -7.080313682556152, "global_step": 169402, "epoch": 4033} {"train_loss": -7.046263694763184, "global_step": 169403, "epoch": 4033} {"train_loss": -6.993593215942383, "global_step": 169404, "epoch": 4033} {"train_loss": -7.076390266418457, "global_step": 169405, "epoch": 4033} {"train_loss": -7.085253715515137, "global_step": 169406, "epoch": 4033} {"train_loss": -7.055861949920654, "global_step": 169407, "epoch": 4033} {"train_loss": -7.072487831115723, "global_step": 169408, "epoch": 4033} {"train_loss": -6.975110054016113, "global_step": 169409, "epoch": 4033} {"train_loss": -6.99862003326416, "global_step": 169410, "epoch": 4033} {"train_loss": -7.092453956604004, "global_step": 169411, "epoch": 4033} {"train_loss": -6.987868785858154, "global_step": 169412, "epoch": 4033} {"train_loss": -6.935226917266846, "global_step": 169413, "epoch": 4033} {"train_loss": -7.008977890014648, "global_step": 169414, "epoch": 4033} {"train_loss": -6.785496234893799, "global_step": 169415, "epoch": 4033} {"train_loss": -7.006155014038086, "global_step": 169416, "epoch": 4033} {"train_loss": -6.88399600982666, "global_step": 169417, "epoch": 4033} {"train_loss": -6.902091979980469, "global_step": 169418, "epoch": 4033} {"train_loss": -7.146050930023193, "global_step": 169419, "epoch": 4033} {"train_loss": -6.925141334533691, "global_step": 169420, "epoch": 4033} {"train_loss": -7.0515899658203125, "global_step": 169421, "epoch": 4033} {"train_loss": -6.917479991912842, "global_step": 169422, "epoch": 4033} {"train_loss": -7.038675785064697, "global_step": 169423, "epoch": 4033} {"train_loss": -6.986485481262207, "global_step": 169424, "epoch": 4033} {"train_loss": -7.072098255157471, "global_step": 169425, "epoch": 4033} {"train_loss": -6.991071701049805, "global_step": 169426, "epoch": 4033} {"train_loss": -7.002972795849755, "global_step": 169427, "epoch": 4033, "val_loss": 68844.40625} {"train_loss": -7.042883396148682, "global_step": 169428, "epoch": 4034} {"train_loss": -7.015823841094971, "global_step": 169429, "epoch": 4034} {"train_loss": -6.961278915405273, "global_step": 169430, "epoch": 4034} {"train_loss": -7.10860538482666, "global_step": 169431, "epoch": 4034} {"train_loss": -7.020401477813721, "global_step": 169432, "epoch": 4034} {"train_loss": -7.1128153800964355, "global_step": 169433, "epoch": 4034} {"train_loss": -7.028905868530273, "global_step": 169434, "epoch": 4034} {"train_loss": -7.008098125457764, "global_step": 169435, "epoch": 4034} {"train_loss": -6.9706573486328125, "global_step": 169436, "epoch": 4034} {"train_loss": -6.98284387588501, "global_step": 169437, "epoch": 4034} {"train_loss": -7.023139953613281, "global_step": 169438, "epoch": 4034} {"train_loss": -7.024871349334717, "global_step": 169439, "epoch": 4034} {"train_loss": -6.990748882293701, "global_step": 169440, "epoch": 4034} {"train_loss": -6.949314594268799, "global_step": 169441, "epoch": 4034} {"train_loss": -7.006502628326416, "global_step": 169442, "epoch": 4034} {"train_loss": -6.951635360717773, "global_step": 169443, "epoch": 4034} {"train_loss": -6.98970890045166, "global_step": 169444, "epoch": 4034} {"train_loss": -7.1044840812683105, "global_step": 169445, "epoch": 4034} {"train_loss": -6.954670429229736, "global_step": 169446, "epoch": 4034} {"train_loss": -6.950997352600098, "global_step": 169447, "epoch": 4034} {"train_loss": -6.901053428649902, "global_step": 169448, "epoch": 4034} {"train_loss": -6.9955058097839355, "global_step": 169449, "epoch": 4034} {"train_loss": -6.982461929321289, "global_step": 169450, "epoch": 4034} {"train_loss": -7.047686576843262, "global_step": 169451, "epoch": 4034} {"train_loss": -7.143224716186523, "global_step": 169452, "epoch": 4034} {"train_loss": -6.890358924865723, "global_step": 169453, "epoch": 4034} {"train_loss": -6.949624061584473, "global_step": 169454, "epoch": 4034} {"train_loss": -6.905619144439697, "global_step": 169455, "epoch": 4034} {"train_loss": -6.894383430480957, "global_step": 169456, "epoch": 4034} {"train_loss": -7.111950874328613, "global_step": 169457, "epoch": 4034} {"train_loss": -6.88890266418457, "global_step": 169458, "epoch": 4034} {"train_loss": -7.073060035705566, "global_step": 169459, "epoch": 4034} {"train_loss": -6.945488929748535, "global_step": 169460, "epoch": 4034} {"train_loss": -7.019477844238281, "global_step": 169461, "epoch": 4034} {"train_loss": -7.039018630981445, "global_step": 169462, "epoch": 4034} {"train_loss": -6.929703712463379, "global_step": 169463, "epoch": 4034} {"train_loss": -7.031863212585449, "global_step": 169464, "epoch": 4034} {"train_loss": -6.957927703857422, "global_step": 169465, "epoch": 4034} {"train_loss": -7.025075435638428, "global_step": 169466, "epoch": 4034} {"train_loss": -7.13809871673584, "global_step": 169467, "epoch": 4034} {"train_loss": -6.974914073944092, "global_step": 169468, "epoch": 4034} {"train_loss": -7.0027257942018055, "global_step": 169469, "epoch": 4034, "val_loss": 69106.6015625} {"train_loss": -6.971035480499268, "global_step": 169470, "epoch": 4035} {"train_loss": -7.019826889038086, "global_step": 169471, "epoch": 4035} {"train_loss": -6.8522467613220215, "global_step": 169472, "epoch": 4035} {"train_loss": -6.9991559982299805, "global_step": 169473, "epoch": 4035} {"train_loss": -7.013497352600098, "global_step": 169474, "epoch": 4035} {"train_loss": -7.0149030685424805, "global_step": 169475, "epoch": 4035} {"train_loss": -7.023120880126953, "global_step": 169476, "epoch": 4035} {"train_loss": -6.753210067749023, "global_step": 169477, "epoch": 4035} {"train_loss": -7.115314960479736, "global_step": 169478, "epoch": 4035} {"train_loss": -6.95583438873291, "global_step": 169479, "epoch": 4035} {"train_loss": -6.887811183929443, "global_step": 169480, "epoch": 4035} {"train_loss": -7.0582594871521, "global_step": 169481, "epoch": 4035} {"train_loss": -7.017257213592529, "global_step": 169482, "epoch": 4035} {"train_loss": -6.974731922149658, "global_step": 169483, "epoch": 4035} {"train_loss": -6.996486186981201, "global_step": 169484, "epoch": 4035} {"train_loss": -6.947298049926758, "global_step": 169485, "epoch": 4035} {"train_loss": -6.976667404174805, "global_step": 169486, "epoch": 4035} {"train_loss": -7.013420581817627, "global_step": 169487, "epoch": 4035} {"train_loss": -7.03731632232666, "global_step": 169488, "epoch": 4035} {"train_loss": -7.079747200012207, "global_step": 169489, "epoch": 4035} {"train_loss": -7.07540225982666, "global_step": 169490, "epoch": 4035} {"train_loss": -7.045131683349609, "global_step": 169491, "epoch": 4035} {"train_loss": -7.0962395668029785, "global_step": 169492, "epoch": 4035} {"train_loss": -7.088486671447754, "global_step": 169493, "epoch": 4035} {"train_loss": -6.967742443084717, "global_step": 169494, "epoch": 4035} {"train_loss": -7.02998161315918, "global_step": 169495, "epoch": 4035} {"train_loss": -7.019112586975098, "global_step": 169496, "epoch": 4035} {"train_loss": -7.026012897491455, "global_step": 169497, "epoch": 4035} {"train_loss": -7.082521915435791, "global_step": 169498, "epoch": 4035} {"train_loss": -6.895686149597168, "global_step": 169499, "epoch": 4035} {"train_loss": -6.952423095703125, "global_step": 169500, "epoch": 4035} {"train_loss": -7.064211845397949, "global_step": 169501, "epoch": 4035} {"train_loss": -6.98715877532959, "global_step": 169502, "epoch": 4035} {"train_loss": -7.12568473815918, "global_step": 169503, "epoch": 4035} {"train_loss": -6.8561787605285645, "global_step": 169504, "epoch": 4035} {"train_loss": -6.823390960693359, "global_step": 169505, "epoch": 4035} {"train_loss": -6.970505237579346, "global_step": 169506, "epoch": 4035} {"train_loss": -6.801813125610352, "global_step": 169507, "epoch": 4035} {"train_loss": -7.047961235046387, "global_step": 169508, "epoch": 4035} {"train_loss": -6.902284145355225, "global_step": 169509, "epoch": 4035} {"train_loss": -7.054338455200195, "global_step": 169510, "epoch": 4035} {"train_loss": -6.992649691445487, "global_step": 169511, "epoch": 4035, "val_loss": 68905.6015625} {"train_loss": -7.054245948791504, "global_step": 169512, "epoch": 4036} {"train_loss": -6.921572685241699, "global_step": 169513, "epoch": 4036} {"train_loss": -7.028543472290039, "global_step": 169514, "epoch": 4036} {"train_loss": -6.956609725952148, "global_step": 169515, "epoch": 4036} {"train_loss": -6.933549404144287, "global_step": 169516, "epoch": 4036} {"train_loss": -7.022133827209473, "global_step": 169517, "epoch": 4036} {"train_loss": -6.989457607269287, "global_step": 169518, "epoch": 4036} {"train_loss": -6.949522018432617, "global_step": 169519, "epoch": 4036} {"train_loss": -7.136358261108398, "global_step": 169520, "epoch": 4036} {"train_loss": -6.911717414855957, "global_step": 169521, "epoch": 4036} {"train_loss": -7.047394752502441, "global_step": 169522, "epoch": 4036} {"train_loss": -7.013265132904053, "global_step": 169523, "epoch": 4036} {"train_loss": -7.038119316101074, "global_step": 169524, "epoch": 4036} {"train_loss": -7.026297092437744, "global_step": 169525, "epoch": 4036} {"train_loss": -6.949130058288574, "global_step": 169526, "epoch": 4036} {"train_loss": -6.9928436279296875, "global_step": 169527, "epoch": 4036} {"train_loss": -7.0761308670043945, "global_step": 169528, "epoch": 4036} {"train_loss": -7.095089435577393, "global_step": 169529, "epoch": 4036} {"train_loss": -7.0358452796936035, "global_step": 169530, "epoch": 4036} {"train_loss": -7.060800552368164, "global_step": 169531, "epoch": 4036} {"train_loss": -7.028555393218994, "global_step": 169532, "epoch": 4036} {"train_loss": -7.035278797149658, "global_step": 169533, "epoch": 4036} {"train_loss": -7.078646659851074, "global_step": 169534, "epoch": 4036} {"train_loss": -6.984253406524658, "global_step": 169535, "epoch": 4036} {"train_loss": -7.047361850738525, "global_step": 169536, "epoch": 4036} {"train_loss": -7.040887832641602, "global_step": 169537, "epoch": 4036} {"train_loss": -7.086091995239258, "global_step": 169538, "epoch": 4036} {"train_loss": -7.108105182647705, "global_step": 169539, "epoch": 4036} {"train_loss": -6.994379997253418, "global_step": 169540, "epoch": 4036} {"train_loss": -7.099669456481934, "global_step": 169541, "epoch": 4036} {"train_loss": -7.070208549499512, "global_step": 169542, "epoch": 4036} {"train_loss": -7.1531829833984375, "global_step": 169543, "epoch": 4036} {"train_loss": -6.895200252532959, "global_step": 169544, "epoch": 4036} {"train_loss": -6.95391845703125, "global_step": 169545, "epoch": 4036} {"train_loss": -7.078638076782227, "global_step": 169546, "epoch": 4036} {"train_loss": -6.986317157745361, "global_step": 169547, "epoch": 4036} {"train_loss": -7.009400844573975, "global_step": 169548, "epoch": 4036} {"train_loss": -7.01676607131958, "global_step": 169549, "epoch": 4036} {"train_loss": -7.012948989868164, "global_step": 169550, "epoch": 4036} {"train_loss": -7.033564567565918, "global_step": 169551, "epoch": 4036} {"train_loss": -7.016437530517578, "global_step": 169552, "epoch": 4036} {"train_loss": -7.022701422373454, "global_step": 169553, "epoch": 4036, "val_loss": 69315.0} {"train_loss": -7.060248851776123, "global_step": 169554, "epoch": 4037} {"train_loss": -7.070308208465576, "global_step": 169555, "epoch": 4037} {"train_loss": -7.030549049377441, "global_step": 169556, "epoch": 4037} {"train_loss": -6.932560920715332, "global_step": 169557, "epoch": 4037} {"train_loss": -6.932164669036865, "global_step": 169558, "epoch": 4037} {"train_loss": -6.91254997253418, "global_step": 169559, "epoch": 4037} {"train_loss": -7.065770626068115, "global_step": 169560, "epoch": 4037} {"train_loss": -6.885534763336182, "global_step": 169561, "epoch": 4037} {"train_loss": -7.0821428298950195, "global_step": 169562, "epoch": 4037} {"train_loss": -7.053473949432373, "global_step": 169563, "epoch": 4037} {"train_loss": -7.067093849182129, "global_step": 169564, "epoch": 4037} {"train_loss": -6.995467185974121, "global_step": 169565, "epoch": 4037} {"train_loss": -6.905942916870117, "global_step": 169566, "epoch": 4037} {"train_loss": -7.104352951049805, "global_step": 169567, "epoch": 4037} {"train_loss": -7.003195762634277, "global_step": 169568, "epoch": 4037} {"train_loss": -6.841030120849609, "global_step": 169569, "epoch": 4037} {"train_loss": -7.064513206481934, "global_step": 169570, "epoch": 4037} {"train_loss": -6.9028239250183105, "global_step": 169571, "epoch": 4037} {"train_loss": -6.8302764892578125, "global_step": 169572, "epoch": 4037} {"train_loss": -7.027182579040527, "global_step": 169573, "epoch": 4037} {"train_loss": -7.0456953048706055, "global_step": 169574, "epoch": 4037} {"train_loss": -6.84495735168457, "global_step": 169575, "epoch": 4037} {"train_loss": -6.872178554534912, "global_step": 169576, "epoch": 4037} {"train_loss": -6.868744850158691, "global_step": 169577, "epoch": 4037} {"train_loss": -6.798583030700684, "global_step": 169578, "epoch": 4037} {"train_loss": -6.9973883628845215, "global_step": 169579, "epoch": 4037} {"train_loss": -6.89840030670166, "global_step": 169580, "epoch": 4037} {"train_loss": -7.049139976501465, "global_step": 169581, "epoch": 4037} {"train_loss": -6.9185380935668945, "global_step": 169582, "epoch": 4037} {"train_loss": -7.051889419555664, "global_step": 169583, "epoch": 4037} {"train_loss": -7.040686130523682, "global_step": 169584, "epoch": 4037} {"train_loss": -6.9413557052612305, "global_step": 169585, "epoch": 4037} {"train_loss": -7.109361171722412, "global_step": 169586, "epoch": 4037} {"train_loss": -6.942931652069092, "global_step": 169587, "epoch": 4037} {"train_loss": -7.084695816040039, "global_step": 169588, "epoch": 4037} {"train_loss": -7.032164573669434, "global_step": 169589, "epoch": 4037} {"train_loss": -6.910312652587891, "global_step": 169590, "epoch": 4037} {"train_loss": -6.883430480957031, "global_step": 169591, "epoch": 4037} {"train_loss": -7.089389801025391, "global_step": 169592, "epoch": 4037} {"train_loss": -6.917563438415527, "global_step": 169593, "epoch": 4037} {"train_loss": -6.871912956237793, "global_step": 169594, "epoch": 4037} {"train_loss": -6.972912186668033, "global_step": 169595, "epoch": 4037, "val_loss": 68928.4453125} {"train_loss": -7.035608291625977, "global_step": 169596, "epoch": 4038} {"train_loss": -6.857451438903809, "global_step": 169597, "epoch": 4038} {"train_loss": -6.853394508361816, "global_step": 169598, "epoch": 4038} {"train_loss": -6.970743656158447, "global_step": 169599, "epoch": 4038} {"train_loss": -6.810608863830566, "global_step": 169600, "epoch": 4038} {"train_loss": -6.890189170837402, "global_step": 169601, "epoch": 4038} {"train_loss": -6.72733211517334, "global_step": 169602, "epoch": 4038} {"train_loss": -6.926907539367676, "global_step": 169603, "epoch": 4038} {"train_loss": -6.8552327156066895, "global_step": 169604, "epoch": 4038} {"train_loss": -6.879373550415039, "global_step": 169605, "epoch": 4038} {"train_loss": -6.791464805603027, "global_step": 169606, "epoch": 4038} {"train_loss": -6.937172889709473, "global_step": 169607, "epoch": 4038} {"train_loss": -6.802518844604492, "global_step": 169608, "epoch": 4038} {"train_loss": -6.926890850067139, "global_step": 169609, "epoch": 4038} {"train_loss": -6.847318649291992, "global_step": 169610, "epoch": 4038} {"train_loss": -6.83762264251709, "global_step": 169611, "epoch": 4038} {"train_loss": -6.90280818939209, "global_step": 169612, "epoch": 4038} {"train_loss": -6.938158988952637, "global_step": 169613, "epoch": 4038} {"train_loss": -6.970793724060059, "global_step": 169614, "epoch": 4038} {"train_loss": -6.879079818725586, "global_step": 169615, "epoch": 4038} {"train_loss": -6.9689531326293945, "global_step": 169616, "epoch": 4038} {"train_loss": -6.949798107147217, "global_step": 169617, "epoch": 4038} {"train_loss": -6.966780662536621, "global_step": 169618, "epoch": 4038} {"train_loss": -6.927824974060059, "global_step": 169619, "epoch": 4038} {"train_loss": -6.941551208496094, "global_step": 169620, "epoch": 4038} {"train_loss": -6.847586154937744, "global_step": 169621, "epoch": 4038} {"train_loss": -6.9967241287231445, "global_step": 169622, "epoch": 4038} {"train_loss": -6.841428279876709, "global_step": 169623, "epoch": 4038} {"train_loss": -7.01011323928833, "global_step": 169624, "epoch": 4038} {"train_loss": -6.993742942810059, "global_step": 169625, "epoch": 4038} {"train_loss": -6.953783988952637, "global_step": 169626, "epoch": 4038} {"train_loss": -6.991361618041992, "global_step": 169627, "epoch": 4038} {"train_loss": -7.032817840576172, "global_step": 169628, "epoch": 4038} {"train_loss": -6.955105304718018, "global_step": 169629, "epoch": 4038} {"train_loss": -7.109786510467529, "global_step": 169630, "epoch": 4038} {"train_loss": -7.059418678283691, "global_step": 169631, "epoch": 4038} {"train_loss": -7.043706893920898, "global_step": 169632, "epoch": 4038} {"train_loss": -6.941315650939941, "global_step": 169633, "epoch": 4038} {"train_loss": -6.996492385864258, "global_step": 169634, "epoch": 4038} {"train_loss": -7.001315116882324, "global_step": 169635, "epoch": 4038} {"train_loss": -7.138503074645996, "global_step": 169636, "epoch": 4038} {"train_loss": -6.938412121364048, "global_step": 169637, "epoch": 4038, "val_loss": 68959.109375} {"train_loss": -7.134424209594727, "global_step": 169638, "epoch": 4039} {"train_loss": -7.154046058654785, "global_step": 169639, "epoch": 4039} {"train_loss": -7.117825508117676, "global_step": 169640, "epoch": 4039} {"train_loss": -7.127791404724121, "global_step": 169641, "epoch": 4039} {"train_loss": -7.1313157081604, "global_step": 169642, "epoch": 4039} {"train_loss": -7.118438243865967, "global_step": 169643, "epoch": 4039} {"train_loss": -7.126323699951172, "global_step": 169644, "epoch": 4039} {"train_loss": -7.145355224609375, "global_step": 169645, "epoch": 4039} {"train_loss": -7.09394645690918, "global_step": 169646, "epoch": 4039} {"train_loss": -7.134521484375, "global_step": 169647, "epoch": 4039} {"train_loss": -7.058748722076416, "global_step": 169648, "epoch": 4039} {"train_loss": -7.093754768371582, "global_step": 169649, "epoch": 4039} {"train_loss": -7.1362810134887695, "global_step": 169650, "epoch": 4039} {"train_loss": -7.074629783630371, "global_step": 169651, "epoch": 4039} {"train_loss": -6.976419925689697, "global_step": 169652, "epoch": 4039} {"train_loss": -6.987953186035156, "global_step": 169653, "epoch": 4039} {"train_loss": -7.156522274017334, "global_step": 169654, "epoch": 4039} {"train_loss": -7.044539451599121, "global_step": 169655, "epoch": 4039} {"train_loss": -7.000492095947266, "global_step": 169656, "epoch": 4039} {"train_loss": -7.0599684715271, "global_step": 169657, "epoch": 4039} {"train_loss": -7.118566036224365, "global_step": 169658, "epoch": 4039} {"train_loss": -7.114872455596924, "global_step": 169659, "epoch": 4039} {"train_loss": -7.024415493011475, "global_step": 169660, "epoch": 4039} {"train_loss": -7.137800216674805, "global_step": 169661, "epoch": 4039} {"train_loss": -7.070448875427246, "global_step": 169662, "epoch": 4039} {"train_loss": -7.1086297035217285, "global_step": 169663, "epoch": 4039} {"train_loss": -7.089393615722656, "global_step": 169664, "epoch": 4039} {"train_loss": -7.04372501373291, "global_step": 169665, "epoch": 4039} {"train_loss": -7.295337677001953, "global_step": 169666, "epoch": 4039} {"train_loss": -7.02842903137207, "global_step": 169667, "epoch": 4039} {"train_loss": -7.0240325927734375, "global_step": 169668, "epoch": 4039} {"train_loss": -7.157426834106445, "global_step": 169669, "epoch": 4039} {"train_loss": -7.025813579559326, "global_step": 169670, "epoch": 4039} {"train_loss": -7.117620468139648, "global_step": 169671, "epoch": 4039} {"train_loss": -7.149691104888916, "global_step": 169672, "epoch": 4039} {"train_loss": -7.0734758377075195, "global_step": 169673, "epoch": 4039} {"train_loss": -7.040828227996826, "global_step": 169674, "epoch": 4039} {"train_loss": -7.162078857421875, "global_step": 169675, "epoch": 4039} {"train_loss": -7.041354179382324, "global_step": 169676, "epoch": 4039} {"train_loss": -6.996471405029297, "global_step": 169677, "epoch": 4039} {"train_loss": -7.036691665649414, "global_step": 169678, "epoch": 4039} {"train_loss": -7.0918943881988525, "global_step": 169679, "epoch": 4039, "val_loss": 68791.0} {"train_loss": -7.102388381958008, "global_step": 169680, "epoch": 4040} {"train_loss": -7.176695823669434, "global_step": 169681, "epoch": 4040} {"train_loss": -7.1908721923828125, "global_step": 169682, "epoch": 4040} {"train_loss": -7.17321252822876, "global_step": 169683, "epoch": 4040} {"train_loss": -7.131421089172363, "global_step": 169684, "epoch": 4040} {"train_loss": -7.009930610656738, "global_step": 169685, "epoch": 4040} {"train_loss": -6.923625946044922, "global_step": 169686, "epoch": 4040} {"train_loss": -7.115083694458008, "global_step": 169687, "epoch": 4040} {"train_loss": -6.8808064460754395, "global_step": 169688, "epoch": 4040} {"train_loss": -7.016077041625977, "global_step": 169689, "epoch": 4040} {"train_loss": -6.927835464477539, "global_step": 169690, "epoch": 4040} {"train_loss": -6.883863925933838, "global_step": 169691, "epoch": 4040} {"train_loss": -6.85772705078125, "global_step": 169692, "epoch": 4040} {"train_loss": -6.837404251098633, "global_step": 169693, "epoch": 4040} {"train_loss": -6.910588264465332, "global_step": 169694, "epoch": 4040} {"train_loss": -6.879913330078125, "global_step": 169695, "epoch": 4040} {"train_loss": -6.971480369567871, "global_step": 169696, "epoch": 4040} {"train_loss": -7.024205207824707, "global_step": 169697, "epoch": 4040} {"train_loss": -7.0511250495910645, "global_step": 169698, "epoch": 4040} {"train_loss": -7.01713752746582, "global_step": 169699, "epoch": 4040} {"train_loss": -7.060456275939941, "global_step": 169700, "epoch": 4040} {"train_loss": -6.942226886749268, "global_step": 169701, "epoch": 4040} {"train_loss": -7.001779556274414, "global_step": 169702, "epoch": 4040} {"train_loss": -6.916743278503418, "global_step": 169703, "epoch": 4040} {"train_loss": -7.045779228210449, "global_step": 169704, "epoch": 4040} {"train_loss": -6.932462215423584, "global_step": 169705, "epoch": 4040} {"train_loss": -7.0239129066467285, "global_step": 169706, "epoch": 4040} {"train_loss": -6.91664981842041, "global_step": 169707, "epoch": 4040} {"train_loss": -6.956984519958496, "global_step": 169708, "epoch": 4040} {"train_loss": -6.969069480895996, "global_step": 169709, "epoch": 4040} {"train_loss": -6.985563278198242, "global_step": 169710, "epoch": 4040} {"train_loss": -6.933132648468018, "global_step": 169711, "epoch": 4040} {"train_loss": -6.950360298156738, "global_step": 169712, "epoch": 4040} {"train_loss": -6.925908088684082, "global_step": 169713, "epoch": 4040} {"train_loss": -6.991367340087891, "global_step": 169714, "epoch": 4040} {"train_loss": -6.891488075256348, "global_step": 169715, "epoch": 4040} {"train_loss": -7.021343231201172, "global_step": 169716, "epoch": 4040} {"train_loss": -6.829591751098633, "global_step": 169717, "epoch": 4040} {"train_loss": -6.935471057891846, "global_step": 169718, "epoch": 4040} {"train_loss": -7.013588905334473, "global_step": 169719, "epoch": 4040} {"train_loss": -7.051095485687256, "global_step": 169720, "epoch": 4040} {"train_loss": -6.985171590532575, "global_step": 169721, "epoch": 4040, "val_loss": 68697.359375} {"train_loss": -6.985478401184082, "global_step": 169722, "epoch": 4041} {"train_loss": -6.997563362121582, "global_step": 169723, "epoch": 4041} {"train_loss": -7.0143585205078125, "global_step": 169724, "epoch": 4041} {"train_loss": -6.9767069816589355, "global_step": 169725, "epoch": 4041} {"train_loss": -7.063515663146973, "global_step": 169726, "epoch": 4041} {"train_loss": -6.941139221191406, "global_step": 169727, "epoch": 4041} {"train_loss": -6.950686931610107, "global_step": 169728, "epoch": 4041} {"train_loss": -6.949455738067627, "global_step": 169729, "epoch": 4041} {"train_loss": -6.958514213562012, "global_step": 169730, "epoch": 4041} {"train_loss": -7.003294944763184, "global_step": 169731, "epoch": 4041} {"train_loss": -6.961576461791992, "global_step": 169732, "epoch": 4041} {"train_loss": -6.955476760864258, "global_step": 169733, "epoch": 4041} {"train_loss": -7.016118049621582, "global_step": 169734, "epoch": 4041} {"train_loss": -6.9820990562438965, "global_step": 169735, "epoch": 4041} {"train_loss": -6.981889247894287, "global_step": 169736, "epoch": 4041} {"train_loss": -7.129843235015869, "global_step": 169737, "epoch": 4041} {"train_loss": -6.941838264465332, "global_step": 169738, "epoch": 4041} {"train_loss": -6.947581768035889, "global_step": 169739, "epoch": 4041} {"train_loss": -7.013690948486328, "global_step": 169740, "epoch": 4041} {"train_loss": -7.003481864929199, "global_step": 169741, "epoch": 4041} {"train_loss": -7.0531415939331055, "global_step": 169742, "epoch": 4041} {"train_loss": -6.973580360412598, "global_step": 169743, "epoch": 4041} {"train_loss": -6.786317825317383, "global_step": 169744, "epoch": 4041} {"train_loss": -6.996747970581055, "global_step": 169745, "epoch": 4041} {"train_loss": -6.918670654296875, "global_step": 169746, "epoch": 4041} {"train_loss": -6.889214515686035, "global_step": 169747, "epoch": 4041} {"train_loss": -6.985177993774414, "global_step": 169748, "epoch": 4041} {"train_loss": -6.833193302154541, "global_step": 169749, "epoch": 4041} {"train_loss": -7.021892547607422, "global_step": 169750, "epoch": 4041} {"train_loss": -6.878710746765137, "global_step": 169751, "epoch": 4041} {"train_loss": -6.979290962219238, "global_step": 169752, "epoch": 4041} {"train_loss": -6.941135406494141, "global_step": 169753, "epoch": 4041} {"train_loss": -6.97260856628418, "global_step": 169754, "epoch": 4041} {"train_loss": -7.104105472564697, "global_step": 169755, "epoch": 4041} {"train_loss": -7.02165412902832, "global_step": 169756, "epoch": 4041} {"train_loss": -7.0822272300720215, "global_step": 169757, "epoch": 4041} {"train_loss": -7.050593376159668, "global_step": 169758, "epoch": 4041} {"train_loss": -6.998584270477295, "global_step": 169759, "epoch": 4041} {"train_loss": -6.940662860870361, "global_step": 169760, "epoch": 4041} {"train_loss": -6.952711582183838, "global_step": 169761, "epoch": 4041} {"train_loss": -7.028428554534912, "global_step": 169762, "epoch": 4041} {"train_loss": -6.982283683050246, "global_step": 169763, "epoch": 4041, "val_loss": 68873.2109375} {"train_loss": -6.939225673675537, "global_step": 169764, "epoch": 4042} {"train_loss": -6.925202369689941, "global_step": 169765, "epoch": 4042} {"train_loss": -6.862527847290039, "global_step": 169766, "epoch": 4042} {"train_loss": -7.099236011505127, "global_step": 169767, "epoch": 4042} {"train_loss": -6.900653839111328, "global_step": 169768, "epoch": 4042} {"train_loss": -7.1106486320495605, "global_step": 169769, "epoch": 4042} {"train_loss": -6.969991683959961, "global_step": 169770, "epoch": 4042} {"train_loss": -7.041787147521973, "global_step": 169771, "epoch": 4042} {"train_loss": -7.052548408508301, "global_step": 169772, "epoch": 4042} {"train_loss": -6.981811046600342, "global_step": 169773, "epoch": 4042} {"train_loss": -7.064326286315918, "global_step": 169774, "epoch": 4042} {"train_loss": -7.074424743652344, "global_step": 169775, "epoch": 4042} {"train_loss": -7.104269027709961, "global_step": 169776, "epoch": 4042} {"train_loss": -7.197537422180176, "global_step": 169777, "epoch": 4042} {"train_loss": -7.099583625793457, "global_step": 169778, "epoch": 4042} {"train_loss": -7.097230434417725, "global_step": 169779, "epoch": 4042} {"train_loss": -7.064873218536377, "global_step": 169780, "epoch": 4042} {"train_loss": -7.102886199951172, "global_step": 169781, "epoch": 4042} {"train_loss": -7.003664970397949, "global_step": 169782, "epoch": 4042} {"train_loss": -7.050002574920654, "global_step": 169783, "epoch": 4042} {"train_loss": -7.057178974151611, "global_step": 169784, "epoch": 4042} {"train_loss": -7.158843040466309, "global_step": 169785, "epoch": 4042} {"train_loss": -7.050230026245117, "global_step": 169786, "epoch": 4042} {"train_loss": -7.01434326171875, "global_step": 169787, "epoch": 4042} {"train_loss": -6.992786407470703, "global_step": 169788, "epoch": 4042} {"train_loss": -7.055965900421143, "global_step": 169789, "epoch": 4042} {"train_loss": -6.9049787521362305, "global_step": 169790, "epoch": 4042} {"train_loss": -6.917561054229736, "global_step": 169791, "epoch": 4042} {"train_loss": -7.107630729675293, "global_step": 169792, "epoch": 4042} {"train_loss": -6.969834327697754, "global_step": 169793, "epoch": 4042} {"train_loss": -7.057153224945068, "global_step": 169794, "epoch": 4042} {"train_loss": -6.930446624755859, "global_step": 169795, "epoch": 4042} {"train_loss": -6.910146713256836, "global_step": 169796, "epoch": 4042} {"train_loss": -7.0376996994018555, "global_step": 169797, "epoch": 4042} {"train_loss": -6.877209663391113, "global_step": 169798, "epoch": 4042} {"train_loss": -6.940439224243164, "global_step": 169799, "epoch": 4042} {"train_loss": -6.9826531410217285, "global_step": 169800, "epoch": 4042} {"train_loss": -7.021003723144531, "global_step": 169801, "epoch": 4042} {"train_loss": -7.016376972198486, "global_step": 169802, "epoch": 4042} {"train_loss": -6.993539333343506, "global_step": 169803, "epoch": 4042} {"train_loss": -6.988084316253662, "global_step": 169804, "epoch": 4042} {"train_loss": -7.012677828470866, "global_step": 169805, "epoch": 4042, "val_loss": 68992.921875} {"train_loss": -7.048939228057861, "global_step": 169806, "epoch": 4043} {"train_loss": -6.95826530456543, "global_step": 169807, "epoch": 4043} {"train_loss": -6.954505920410156, "global_step": 169808, "epoch": 4043} {"train_loss": -6.977607727050781, "global_step": 169809, "epoch": 4043} {"train_loss": -6.979546070098877, "global_step": 169810, "epoch": 4043} {"train_loss": -7.071115970611572, "global_step": 169811, "epoch": 4043} {"train_loss": -7.016785144805908, "global_step": 169812, "epoch": 4043} {"train_loss": -6.966597557067871, "global_step": 169813, "epoch": 4043} {"train_loss": -7.090828895568848, "global_step": 169814, "epoch": 4043} {"train_loss": -7.012408256530762, "global_step": 169815, "epoch": 4043} {"train_loss": -7.121417999267578, "global_step": 169816, "epoch": 4043} {"train_loss": -6.927751541137695, "global_step": 169817, "epoch": 4043} {"train_loss": -7.117824554443359, "global_step": 169818, "epoch": 4043} {"train_loss": -7.0148606300354, "global_step": 169819, "epoch": 4043} {"train_loss": -7.072628021240234, "global_step": 169820, "epoch": 4043} {"train_loss": -7.018918037414551, "global_step": 169821, "epoch": 4043} {"train_loss": -7.080023765563965, "global_step": 169822, "epoch": 4043} {"train_loss": -7.042502403259277, "global_step": 169823, "epoch": 4043} {"train_loss": -7.042479515075684, "global_step": 169824, "epoch": 4043} {"train_loss": -7.030099868774414, "global_step": 169825, "epoch": 4043} {"train_loss": -7.010124206542969, "global_step": 169826, "epoch": 4043} {"train_loss": -7.104055404663086, "global_step": 169827, "epoch": 4043} {"train_loss": -7.041481018066406, "global_step": 169828, "epoch": 4043} {"train_loss": -7.132281303405762, "global_step": 169829, "epoch": 4043} {"train_loss": -6.979674339294434, "global_step": 169830, "epoch": 4043} {"train_loss": -7.074532508850098, "global_step": 169831, "epoch": 4043} {"train_loss": -6.974122047424316, "global_step": 169832, "epoch": 4043} {"train_loss": -7.035640239715576, "global_step": 169833, "epoch": 4043} {"train_loss": -7.14213752746582, "global_step": 169834, "epoch": 4043} {"train_loss": -7.026334762573242, "global_step": 169835, "epoch": 4043} {"train_loss": -7.005476951599121, "global_step": 169836, "epoch": 4043} {"train_loss": -7.067045211791992, "global_step": 169837, "epoch": 4043} {"train_loss": -6.975597858428955, "global_step": 169838, "epoch": 4043} {"train_loss": -7.059831619262695, "global_step": 169839, "epoch": 4043} {"train_loss": -7.10873556137085, "global_step": 169840, "epoch": 4043} {"train_loss": -7.013184070587158, "global_step": 169841, "epoch": 4043} {"train_loss": -7.006645679473877, "global_step": 169842, "epoch": 4043} {"train_loss": -7.020942211151123, "global_step": 169843, "epoch": 4043} {"train_loss": -6.9784321784973145, "global_step": 169844, "epoch": 4043} {"train_loss": -6.9972429275512695, "global_step": 169845, "epoch": 4043} {"train_loss": -6.877292633056641, "global_step": 169846, "epoch": 4043} {"train_loss": -7.030700411115374, "global_step": 169847, "epoch": 4043, "val_loss": 68924.4375} {"train_loss": -6.9573893547058105, "global_step": 169848, "epoch": 4044} {"train_loss": -6.985138893127441, "global_step": 169849, "epoch": 4044} {"train_loss": -7.000205039978027, "global_step": 169850, "epoch": 4044} {"train_loss": -6.934957981109619, "global_step": 169851, "epoch": 4044} {"train_loss": -7.023028373718262, "global_step": 169852, "epoch": 4044} {"train_loss": -6.9944963455200195, "global_step": 169853, "epoch": 4044} {"train_loss": -7.037967205047607, "global_step": 169854, "epoch": 4044} {"train_loss": -7.026590347290039, "global_step": 169855, "epoch": 4044} {"train_loss": -7.033581733703613, "global_step": 169856, "epoch": 4044} {"train_loss": -7.016080856323242, "global_step": 169857, "epoch": 4044} {"train_loss": -6.959705352783203, "global_step": 169858, "epoch": 4044} {"train_loss": -7.003021717071533, "global_step": 169859, "epoch": 4044} {"train_loss": -7.000357151031494, "global_step": 169860, "epoch": 4044} {"train_loss": -7.0461626052856445, "global_step": 169861, "epoch": 4044} {"train_loss": -7.019895553588867, "global_step": 169862, "epoch": 4044} {"train_loss": -7.006173133850098, "global_step": 169863, "epoch": 4044} {"train_loss": -6.973945617675781, "global_step": 169864, "epoch": 4044} {"train_loss": -7.073652267456055, "global_step": 169865, "epoch": 4044} {"train_loss": -7.003630638122559, "global_step": 169866, "epoch": 4044} {"train_loss": -7.055796146392822, "global_step": 169867, "epoch": 4044} {"train_loss": -7.089941024780273, "global_step": 169868, "epoch": 4044} {"train_loss": -7.10823917388916, "global_step": 169869, "epoch": 4044} {"train_loss": -7.148521423339844, "global_step": 169870, "epoch": 4044} {"train_loss": -6.959111213684082, "global_step": 169871, "epoch": 4044} {"train_loss": -7.074662208557129, "global_step": 169872, "epoch": 4044} {"train_loss": -7.016366004943848, "global_step": 169873, "epoch": 4044} {"train_loss": -7.027041435241699, "global_step": 169874, "epoch": 4044} {"train_loss": -7.065847396850586, "global_step": 169875, "epoch": 4044} {"train_loss": -7.0160651206970215, "global_step": 169876, "epoch": 4044} {"train_loss": -7.024868011474609, "global_step": 169877, "epoch": 4044} {"train_loss": -6.9717817306518555, "global_step": 169878, "epoch": 4044} {"train_loss": -7.164789199829102, "global_step": 169879, "epoch": 4044} {"train_loss": -7.022672653198242, "global_step": 169880, "epoch": 4044} {"train_loss": -6.978470802307129, "global_step": 169881, "epoch": 4044} {"train_loss": -7.008031845092773, "global_step": 169882, "epoch": 4044} {"train_loss": -6.992866516113281, "global_step": 169883, "epoch": 4044} {"train_loss": -7.0258989334106445, "global_step": 169884, "epoch": 4044} {"train_loss": -7.039288520812988, "global_step": 169885, "epoch": 4044} {"train_loss": -7.0414018630981445, "global_step": 169886, "epoch": 4044} {"train_loss": -7.066863059997559, "global_step": 169887, "epoch": 4044} {"train_loss": -7.044618129730225, "global_step": 169888, "epoch": 4044} {"train_loss": -7.02691514151437, "global_step": 169889, "epoch": 4044, "val_loss": 69091.2734375} {"train_loss": -7.077380180358887, "global_step": 169890, "epoch": 4045} {"train_loss": -7.0865020751953125, "global_step": 169891, "epoch": 4045} {"train_loss": -7.044287204742432, "global_step": 169892, "epoch": 4045} {"train_loss": -7.089117050170898, "global_step": 169893, "epoch": 4045} {"train_loss": -6.977396488189697, "global_step": 169894, "epoch": 4045} {"train_loss": -7.0492682456970215, "global_step": 169895, "epoch": 4045} {"train_loss": -7.040533542633057, "global_step": 169896, "epoch": 4045} {"train_loss": -6.89004373550415, "global_step": 169897, "epoch": 4045} {"train_loss": -7.020233631134033, "global_step": 169898, "epoch": 4045} {"train_loss": -7.007874488830566, "global_step": 169899, "epoch": 4045} {"train_loss": -6.923038482666016, "global_step": 169900, "epoch": 4045} {"train_loss": -7.0500030517578125, "global_step": 169901, "epoch": 4045} {"train_loss": -6.793313026428223, "global_step": 169902, "epoch": 4045} {"train_loss": -6.877095699310303, "global_step": 169903, "epoch": 4045} {"train_loss": -7.025728225708008, "global_step": 169904, "epoch": 4045} {"train_loss": -6.907556056976318, "global_step": 169905, "epoch": 4045} {"train_loss": -7.013679027557373, "global_step": 169906, "epoch": 4045} {"train_loss": -6.950203895568848, "global_step": 169907, "epoch": 4045} {"train_loss": -6.905640602111816, "global_step": 169908, "epoch": 4045} {"train_loss": -6.954467296600342, "global_step": 169909, "epoch": 4045} {"train_loss": -6.9108147621154785, "global_step": 169910, "epoch": 4045} {"train_loss": -7.099599361419678, "global_step": 169911, "epoch": 4045} {"train_loss": -7.056345462799072, "global_step": 169912, "epoch": 4045} {"train_loss": -6.929091930389404, "global_step": 169913, "epoch": 4045} {"train_loss": -7.101816177368164, "global_step": 169914, "epoch": 4045} {"train_loss": -7.051822662353516, "global_step": 169915, "epoch": 4045} {"train_loss": -7.053337574005127, "global_step": 169916, "epoch": 4045} {"train_loss": -6.975979804992676, "global_step": 169917, "epoch": 4045} {"train_loss": -6.951815128326416, "global_step": 169918, "epoch": 4045} {"train_loss": -7.195549488067627, "global_step": 169919, "epoch": 4045} {"train_loss": -6.961994171142578, "global_step": 169920, "epoch": 4045} {"train_loss": -7.071506500244141, "global_step": 169921, "epoch": 4045} {"train_loss": -7.029116630554199, "global_step": 169922, "epoch": 4045} {"train_loss": -6.981795787811279, "global_step": 169923, "epoch": 4045} {"train_loss": -7.066320419311523, "global_step": 169924, "epoch": 4045} {"train_loss": -7.078192710876465, "global_step": 169925, "epoch": 4045} {"train_loss": -7.058704376220703, "global_step": 169926, "epoch": 4045} {"train_loss": -6.935050964355469, "global_step": 169927, "epoch": 4045} {"train_loss": -7.149260520935059, "global_step": 169928, "epoch": 4045} {"train_loss": -7.067447185516357, "global_step": 169929, "epoch": 4045} {"train_loss": -6.970775127410889, "global_step": 169930, "epoch": 4045} {"train_loss": -7.011664651689076, "global_step": 169931, "epoch": 4045, "val_loss": 68886.2265625} {"train_loss": -7.112080097198486, "global_step": 169932, "epoch": 4046} {"train_loss": -7.104097366333008, "global_step": 169933, "epoch": 4046} {"train_loss": -7.139339447021484, "global_step": 169934, "epoch": 4046} {"train_loss": -7.076731204986572, "global_step": 169935, "epoch": 4046} {"train_loss": -7.141421794891357, "global_step": 169936, "epoch": 4046} {"train_loss": -7.115316390991211, "global_step": 169937, "epoch": 4046} {"train_loss": -7.078289031982422, "global_step": 169938, "epoch": 4046} {"train_loss": -7.022083282470703, "global_step": 169939, "epoch": 4046} {"train_loss": -7.003091812133789, "global_step": 169940, "epoch": 4046} {"train_loss": -7.044753074645996, "global_step": 169941, "epoch": 4046} {"train_loss": -7.050004482269287, "global_step": 169942, "epoch": 4046} {"train_loss": -7.047024726867676, "global_step": 169943, "epoch": 4046} {"train_loss": -7.130502700805664, "global_step": 169944, "epoch": 4046} {"train_loss": -7.038235664367676, "global_step": 169945, "epoch": 4046} {"train_loss": -6.986148834228516, "global_step": 169946, "epoch": 4046} {"train_loss": -6.968480110168457, "global_step": 169947, "epoch": 4046} {"train_loss": -6.888455390930176, "global_step": 169948, "epoch": 4046} {"train_loss": -6.932018280029297, "global_step": 169949, "epoch": 4046} {"train_loss": -7.000890731811523, "global_step": 169950, "epoch": 4046} {"train_loss": -7.019461631774902, "global_step": 169951, "epoch": 4046} {"train_loss": -7.031700134277344, "global_step": 169952, "epoch": 4046} {"train_loss": -7.092041015625, "global_step": 169953, "epoch": 4046} {"train_loss": -7.140169143676758, "global_step": 169954, "epoch": 4046} {"train_loss": -6.965010643005371, "global_step": 169955, "epoch": 4046} {"train_loss": -6.9831647872924805, "global_step": 169956, "epoch": 4046} {"train_loss": -6.959124565124512, "global_step": 169957, "epoch": 4046} {"train_loss": -7.033482551574707, "global_step": 169958, "epoch": 4046} {"train_loss": -6.942420959472656, "global_step": 169959, "epoch": 4046} {"train_loss": -6.984783172607422, "global_step": 169960, "epoch": 4046} {"train_loss": -7.032964706420898, "global_step": 169961, "epoch": 4046} {"train_loss": -7.044613361358643, "global_step": 169962, "epoch": 4046} {"train_loss": -7.007633209228516, "global_step": 169963, "epoch": 4046} {"train_loss": -7.014352798461914, "global_step": 169964, "epoch": 4046} {"train_loss": -7.127715110778809, "global_step": 169965, "epoch": 4046} {"train_loss": -6.966963291168213, "global_step": 169966, "epoch": 4046} {"train_loss": -6.924898147583008, "global_step": 169967, "epoch": 4046} {"train_loss": -7.08258056640625, "global_step": 169968, "epoch": 4046} {"train_loss": -6.901017665863037, "global_step": 169969, "epoch": 4046} {"train_loss": -7.0342888832092285, "global_step": 169970, "epoch": 4046} {"train_loss": -7.044674873352051, "global_step": 169971, "epoch": 4046} {"train_loss": -6.9845476150512695, "global_step": 169972, "epoch": 4046} {"train_loss": -7.030183848880586, "global_step": 169973, "epoch": 4046, "val_loss": 68752.6953125} {"train_loss": -6.977928161621094, "global_step": 169974, "epoch": 4047} {"train_loss": -7.035677909851074, "global_step": 169975, "epoch": 4047} {"train_loss": -6.976125717163086, "global_step": 169976, "epoch": 4047} {"train_loss": -7.026893615722656, "global_step": 169977, "epoch": 4047} {"train_loss": -6.908348083496094, "global_step": 169978, "epoch": 4047} {"train_loss": -7.043745517730713, "global_step": 169979, "epoch": 4047} {"train_loss": -6.967883110046387, "global_step": 169980, "epoch": 4047} {"train_loss": -6.9494781494140625, "global_step": 169981, "epoch": 4047} {"train_loss": -6.990445137023926, "global_step": 169982, "epoch": 4047} {"train_loss": -6.895343780517578, "global_step": 169983, "epoch": 4047} {"train_loss": -6.933901309967041, "global_step": 169984, "epoch": 4047} {"train_loss": -7.049102783203125, "global_step": 169985, "epoch": 4047} {"train_loss": -6.834104537963867, "global_step": 169986, "epoch": 4047} {"train_loss": -6.8887128829956055, "global_step": 169987, "epoch": 4047} {"train_loss": -6.915721893310547, "global_step": 169988, "epoch": 4047} {"train_loss": -6.921267986297607, "global_step": 169989, "epoch": 4047} {"train_loss": -7.0387139320373535, "global_step": 169990, "epoch": 4047} {"train_loss": -7.044185638427734, "global_step": 169991, "epoch": 4047} {"train_loss": -6.785224914550781, "global_step": 169992, "epoch": 4047} {"train_loss": -6.908734321594238, "global_step": 169993, "epoch": 4047} {"train_loss": -6.93202018737793, "global_step": 169994, "epoch": 4047} {"train_loss": -6.913618087768555, "global_step": 169995, "epoch": 4047} {"train_loss": -7.068225860595703, "global_step": 169996, "epoch": 4047} {"train_loss": -6.929830074310303, "global_step": 169997, "epoch": 4047} {"train_loss": -6.983410835266113, "global_step": 169998, "epoch": 4047} {"train_loss": -6.9458513259887695, "global_step": 169999, "epoch": 4047} {"train_loss": -6.9410176277160645, "global_step": 170000, "epoch": 4047} {"train_loss": -6.900413513183594, "global_step": 170001, "epoch": 4047} {"train_loss": -7.01674747467041, "global_step": 170002, "epoch": 4047} {"train_loss": -7.011513710021973, "global_step": 170003, "epoch": 4047} {"train_loss": -7.000845909118652, "global_step": 170004, "epoch": 4047} {"train_loss": -6.988805294036865, "global_step": 170005, "epoch": 4047} {"train_loss": -7.071467399597168, "global_step": 170006, "epoch": 4047} {"train_loss": -7.036574363708496, "global_step": 170007, "epoch": 4047} {"train_loss": -6.946498870849609, "global_step": 170008, "epoch": 4047} {"train_loss": -6.937273979187012, "global_step": 170009, "epoch": 4047} {"train_loss": -6.738565444946289, "global_step": 170010, "epoch": 4047} {"train_loss": -6.925874710083008, "global_step": 170011, "epoch": 4047} {"train_loss": -6.99293327331543, "global_step": 170012, "epoch": 4047} {"train_loss": -6.982448101043701, "global_step": 170013, "epoch": 4047} {"train_loss": -7.059550762176514, "global_step": 170014, "epoch": 4047} {"train_loss": -6.963196425210862, "global_step": 170015, "epoch": 4047, "val_loss": 68777.359375} {"train_loss": -6.899082183837891, "global_step": 170016, "epoch": 4048} {"train_loss": -7.107535362243652, "global_step": 170017, "epoch": 4048} {"train_loss": -6.96285343170166, "global_step": 170018, "epoch": 4048} {"train_loss": -7.029415130615234, "global_step": 170019, "epoch": 4048} {"train_loss": -6.925793170928955, "global_step": 170020, "epoch": 4048} {"train_loss": -7.055530548095703, "global_step": 170021, "epoch": 4048} {"train_loss": -7.063185691833496, "global_step": 170022, "epoch": 4048} {"train_loss": -7.044801712036133, "global_step": 170023, "epoch": 4048} {"train_loss": -7.0123701095581055, "global_step": 170024, "epoch": 4048} {"train_loss": -6.85038423538208, "global_step": 170025, "epoch": 4048} {"train_loss": -6.968297004699707, "global_step": 170026, "epoch": 4048} {"train_loss": -6.825954437255859, "global_step": 170027, "epoch": 4048} {"train_loss": -7.063778877258301, "global_step": 170028, "epoch": 4048} {"train_loss": -7.001062393188477, "global_step": 170029, "epoch": 4048} {"train_loss": -6.950176239013672, "global_step": 170030, "epoch": 4048} {"train_loss": -6.910102367401123, "global_step": 170031, "epoch": 4048} {"train_loss": -6.898575305938721, "global_step": 170032, "epoch": 4048} {"train_loss": -6.83743953704834, "global_step": 170033, "epoch": 4048} {"train_loss": -7.041936874389648, "global_step": 170034, "epoch": 4048} {"train_loss": -7.06552791595459, "global_step": 170035, "epoch": 4048} {"train_loss": -6.995625972747803, "global_step": 170036, "epoch": 4048} {"train_loss": -7.039219856262207, "global_step": 170037, "epoch": 4048} {"train_loss": -6.97938346862793, "global_step": 170038, "epoch": 4048} {"train_loss": -6.957208156585693, "global_step": 170039, "epoch": 4048} {"train_loss": -6.980020046234131, "global_step": 170040, "epoch": 4048} {"train_loss": -7.021481513977051, "global_step": 170041, "epoch": 4048} {"train_loss": -7.080047607421875, "global_step": 170042, "epoch": 4048} {"train_loss": -6.953123092651367, "global_step": 170043, "epoch": 4048} {"train_loss": -7.0137715339660645, "global_step": 170044, "epoch": 4048} {"train_loss": -6.995472431182861, "global_step": 170045, "epoch": 4048} {"train_loss": -6.941051959991455, "global_step": 170046, "epoch": 4048} {"train_loss": -6.937941551208496, "global_step": 170047, "epoch": 4048} {"train_loss": -6.929142475128174, "global_step": 170048, "epoch": 4048} {"train_loss": -6.930294990539551, "global_step": 170049, "epoch": 4048} {"train_loss": -7.025263786315918, "global_step": 170050, "epoch": 4048} {"train_loss": -7.006848335266113, "global_step": 170051, "epoch": 4048} {"train_loss": -6.964451313018799, "global_step": 170052, "epoch": 4048} {"train_loss": -7.037447929382324, "global_step": 170053, "epoch": 4048} {"train_loss": -7.0203351974487305, "global_step": 170054, "epoch": 4048} {"train_loss": -6.97374963760376, "global_step": 170055, "epoch": 4048} {"train_loss": -6.909871578216553, "global_step": 170056, "epoch": 4048} {"train_loss": -6.979070515859695, "global_step": 170057, "epoch": 4048, "val_loss": 69091.6953125} {"train_loss": -7.008092880249023, "global_step": 170058, "epoch": 4049} {"train_loss": -6.975409984588623, "global_step": 170059, "epoch": 4049} {"train_loss": -7.059948921203613, "global_step": 170060, "epoch": 4049} {"train_loss": -7.028678894042969, "global_step": 170061, "epoch": 4049} {"train_loss": -6.995965957641602, "global_step": 170062, "epoch": 4049} {"train_loss": -7.024141311645508, "global_step": 170063, "epoch": 4049} {"train_loss": -6.952756404876709, "global_step": 170064, "epoch": 4049} {"train_loss": -6.96165657043457, "global_step": 170065, "epoch": 4049} {"train_loss": -7.089147567749023, "global_step": 170066, "epoch": 4049} {"train_loss": -6.9678826332092285, "global_step": 170067, "epoch": 4049} {"train_loss": -7.0509233474731445, "global_step": 170068, "epoch": 4049} {"train_loss": -7.046555995941162, "global_step": 170069, "epoch": 4049} {"train_loss": -6.939173221588135, "global_step": 170070, "epoch": 4049} {"train_loss": -6.984907150268555, "global_step": 170071, "epoch": 4049} {"train_loss": -7.041965007781982, "global_step": 170072, "epoch": 4049} {"train_loss": -6.9628400802612305, "global_step": 170073, "epoch": 4049} {"train_loss": -7.036436080932617, "global_step": 170074, "epoch": 4049} {"train_loss": -6.940363883972168, "global_step": 170075, "epoch": 4049} {"train_loss": -7.04982852935791, "global_step": 170076, "epoch": 4049} {"train_loss": -6.999885082244873, "global_step": 170077, "epoch": 4049} {"train_loss": -6.953056335449219, "global_step": 170078, "epoch": 4049} {"train_loss": -7.145003795623779, "global_step": 170079, "epoch": 4049} {"train_loss": -7.002521514892578, "global_step": 170080, "epoch": 4049} {"train_loss": -7.068087577819824, "global_step": 170081, "epoch": 4049} {"train_loss": -6.910736083984375, "global_step": 170082, "epoch": 4049} {"train_loss": -7.00208044052124, "global_step": 170083, "epoch": 4049} {"train_loss": -7.054429054260254, "global_step": 170084, "epoch": 4049} {"train_loss": -7.08972692489624, "global_step": 170085, "epoch": 4049} {"train_loss": -6.9614081382751465, "global_step": 170086, "epoch": 4049} {"train_loss": -7.017793655395508, "global_step": 170087, "epoch": 4049} {"train_loss": -6.824804306030273, "global_step": 170088, "epoch": 4049} {"train_loss": -6.966113567352295, "global_step": 170089, "epoch": 4049} {"train_loss": -6.9977288246154785, "global_step": 170090, "epoch": 4049} {"train_loss": -7.033116817474365, "global_step": 170091, "epoch": 4049} {"train_loss": -7.046715259552002, "global_step": 170092, "epoch": 4049} {"train_loss": -7.043409824371338, "global_step": 170093, "epoch": 4049} {"train_loss": -7.021806716918945, "global_step": 170094, "epoch": 4049} {"train_loss": -7.009793281555176, "global_step": 170095, "epoch": 4049} {"train_loss": -6.979617118835449, "global_step": 170096, "epoch": 4049} {"train_loss": -6.954521179199219, "global_step": 170097, "epoch": 4049} {"train_loss": -7.070980072021484, "global_step": 170098, "epoch": 4049} {"train_loss": -7.005974042983282, "global_step": 170099, "epoch": 4049, "val_loss": 68926.8671875} {"train_loss": -6.925769805908203, "global_step": 170100, "epoch": 4050} {"train_loss": -7.028746128082275, "global_step": 170101, "epoch": 4050} {"train_loss": -6.922975540161133, "global_step": 170102, "epoch": 4050} {"train_loss": -6.983354091644287, "global_step": 170103, "epoch": 4050} {"train_loss": -6.979994773864746, "global_step": 170104, "epoch": 4050} {"train_loss": -7.0127482414245605, "global_step": 170105, "epoch": 4050} {"train_loss": -6.956399917602539, "global_step": 170106, "epoch": 4050} {"train_loss": -7.156293869018555, "global_step": 170107, "epoch": 4050} {"train_loss": -6.956877708435059, "global_step": 170108, "epoch": 4050} {"train_loss": -6.956365585327148, "global_step": 170109, "epoch": 4050} {"train_loss": -7.045060634613037, "global_step": 170110, "epoch": 4050} {"train_loss": -7.133691310882568, "global_step": 170111, "epoch": 4050} {"train_loss": -6.987926959991455, "global_step": 170112, "epoch": 4050} {"train_loss": -7.042795181274414, "global_step": 170113, "epoch": 4050} {"train_loss": -6.975594520568848, "global_step": 170114, "epoch": 4050} {"train_loss": -7.023830413818359, "global_step": 170115, "epoch": 4050} {"train_loss": -7.001870155334473, "global_step": 170116, "epoch": 4050} {"train_loss": -7.0881171226501465, "global_step": 170117, "epoch": 4050} {"train_loss": -7.079405784606934, "global_step": 170118, "epoch": 4050} {"train_loss": -7.104397773742676, "global_step": 170119, "epoch": 4050} {"train_loss": -7.049541473388672, "global_step": 170120, "epoch": 4050} {"train_loss": -6.965850830078125, "global_step": 170121, "epoch": 4050} {"train_loss": -7.114720344543457, "global_step": 170122, "epoch": 4050} {"train_loss": -7.07169246673584, "global_step": 170123, "epoch": 4050} {"train_loss": -7.0344367027282715, "global_step": 170124, "epoch": 4050} {"train_loss": -7.017158031463623, "global_step": 170125, "epoch": 4050} {"train_loss": -7.069673538208008, "global_step": 170126, "epoch": 4050} {"train_loss": -7.081568717956543, "global_step": 170127, "epoch": 4050} {"train_loss": -6.8856201171875, "global_step": 170128, "epoch": 4050} {"train_loss": -7.0152482986450195, "global_step": 170129, "epoch": 4050} {"train_loss": -6.971232891082764, "global_step": 170130, "epoch": 4050} {"train_loss": -6.998228073120117, "global_step": 170131, "epoch": 4050} {"train_loss": -6.90349006652832, "global_step": 170132, "epoch": 4050} {"train_loss": -6.952559471130371, "global_step": 170133, "epoch": 4050} {"train_loss": -7.00724983215332, "global_step": 170134, "epoch": 4050} {"train_loss": -6.97657585144043, "global_step": 170135, "epoch": 4050} {"train_loss": -7.116890907287598, "global_step": 170136, "epoch": 4050} {"train_loss": -6.996500015258789, "global_step": 170137, "epoch": 4050} {"train_loss": -6.961188316345215, "global_step": 170138, "epoch": 4050} {"train_loss": -7.084394931793213, "global_step": 170139, "epoch": 4050} {"train_loss": -7.099127292633057, "global_step": 170140, "epoch": 4050} {"train_loss": -7.016667570386614, "global_step": 170141, "epoch": 4050, "train/sim_max_reward_0": 0.5891573741349708, "train/sim_max_reward_1": 0.9378038571404749, "train/sim_max_reward_2": 0.9211557346310515, "train/sim_max_reward_3": 0.38371731063201237, "train/sim_max_reward_4": 0.9638649737484192, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.9984584548641735, "test/sim_max_reward_4300001": 0.8870332140149566, "test/sim_max_reward_4300002": 0.9591819980094666, "test/sim_max_reward_4300003": 0.8454321764139255, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.7259957177396107, "test/sim_max_reward_4300006": 0.9554181784512727, "test/sim_max_reward_4300007": 1.0, "test/sim_max_reward_4300008": 1.0, "test/sim_max_reward_4300009": 0.9591502752980581, "test/sim_max_reward_4300010": 0.9913731282923237, "test/sim_max_reward_4300011": 0.9223904829995052, "test/sim_max_reward_4300012": 0.9451972599526907, "test/sim_max_reward_4300013": 0.4033546510309547, "test/sim_max_reward_4300014": 0.9659413447947397, "test/sim_max_reward_4300015": 0.9283344938185515, "test/sim_max_reward_4300016": 0.8962852877377125, "test/sim_max_reward_4300017": 0.9372063272631532, "test/sim_max_reward_4300018": 0.40562548525444586, "test/sim_max_reward_4300019": 0.1860460881279548, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9667905743998639, "test/sim_max_reward_4300022": 0.8056439513995911, "test/sim_max_reward_4300023": 0.7533838698174287, "test/sim_max_reward_4300024": 1.0, "test/sim_max_reward_4300025": 0.8476313911070236, "test/sim_max_reward_4300026": 0.17421064508854914, "test/sim_max_reward_4300027": 0.9195410806077768, "test/sim_max_reward_4300028": 0.0583474879759581, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.007331619368324528, "test/sim_max_reward_4300031": 0.49036750567090115, "test/sim_max_reward_4300032": 0.9575336062216727, "test/sim_max_reward_4300033": 0.6505036126015743, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.33032546189046036, "test/sim_max_reward_4300036": 0.20191719830678337, "test/sim_max_reward_4300037": 0.6720071334346364, "test/sim_max_reward_4300038": 0.8043392265321307, "test/sim_max_reward_4300039": 0.9905313361388277, "test/sim_max_reward_4300040": 0.9888463702312731, "test/sim_max_reward_4300041": 0.7662916138663867, "test/sim_max_reward_4300042": 0.940211110567036, "test/sim_max_reward_4300043": 0.13696879985733104, "test/sim_max_reward_4300044": 0.8248551743667826, "test/sim_max_reward_4300045": 0.9731071331508367, "test/sim_max_reward_4300046": 0.9401549172692877, "test/sim_max_reward_4300047": 0.6769275800486705, "test/sim_max_reward_4300048": 0.955235463165897, "test/sim_max_reward_4300049": 0.25013317675814356, "train/mean_score": 0.6647806682748527, "test/mean_score": 0.6802279141743185, "val_loss": 68914.25} {"train_loss": -7.043948650360107, "global_step": 170142, "epoch": 4051} {"train_loss": -7.0704545974731445, "global_step": 170143, "epoch": 4051} {"train_loss": -7.041945457458496, "global_step": 170144, "epoch": 4051} {"train_loss": -6.974878787994385, "global_step": 170145, "epoch": 4051} {"train_loss": -7.034346580505371, "global_step": 170146, "epoch": 4051} {"train_loss": -6.938005447387695, "global_step": 170147, "epoch": 4051} {"train_loss": -7.035962104797363, "global_step": 170148, "epoch": 4051} {"train_loss": -7.060886383056641, "global_step": 170149, "epoch": 4051} {"train_loss": -7.040356636047363, "global_step": 170150, "epoch": 4051} {"train_loss": -6.9003496170043945, "global_step": 170151, "epoch": 4051} {"train_loss": -6.963475704193115, "global_step": 170152, "epoch": 4051} {"train_loss": -6.957894802093506, "global_step": 170153, "epoch": 4051} {"train_loss": -7.005523681640625, "global_step": 170154, "epoch": 4051} {"train_loss": -7.049016952514648, "global_step": 170155, "epoch": 4051} {"train_loss": -7.0352044105529785, "global_step": 170156, "epoch": 4051} {"train_loss": -7.01185417175293, "global_step": 170157, "epoch": 4051} {"train_loss": -7.071929454803467, "global_step": 170158, "epoch": 4051} {"train_loss": -7.023248195648193, "global_step": 170159, "epoch": 4051} {"train_loss": -7.006040573120117, "global_step": 170160, "epoch": 4051} {"train_loss": -7.115166664123535, "global_step": 170161, "epoch": 4051} {"train_loss": -7.051739692687988, "global_step": 170162, "epoch": 4051} {"train_loss": -7.036923408508301, "global_step": 170163, "epoch": 4051} {"train_loss": -7.06938362121582, "global_step": 170164, "epoch": 4051} {"train_loss": -7.096270561218262, "global_step": 170165, "epoch": 4051} {"train_loss": -7.046933174133301, "global_step": 170166, "epoch": 4051} {"train_loss": -7.027218818664551, "global_step": 170167, "epoch": 4051} {"train_loss": -6.96928596496582, "global_step": 170168, "epoch": 4051} {"train_loss": -6.98085355758667, "global_step": 170169, "epoch": 4051} {"train_loss": -6.8157267570495605, "global_step": 170170, "epoch": 4051} {"train_loss": -6.914642810821533, "global_step": 170171, "epoch": 4051} {"train_loss": -6.859004974365234, "global_step": 170172, "epoch": 4051} {"train_loss": -6.968313694000244, "global_step": 170173, "epoch": 4051} {"train_loss": -6.944119453430176, "global_step": 170174, "epoch": 4051} {"train_loss": -6.910805702209473, "global_step": 170175, "epoch": 4051} {"train_loss": -6.918683052062988, "global_step": 170176, "epoch": 4051} {"train_loss": -6.9672980308532715, "global_step": 170177, "epoch": 4051} {"train_loss": -6.96634578704834, "global_step": 170178, "epoch": 4051} {"train_loss": -6.9012041091918945, "global_step": 170179, "epoch": 4051} {"train_loss": -6.981368541717529, "global_step": 170180, "epoch": 4051} {"train_loss": -6.970213890075684, "global_step": 170181, "epoch": 4051} {"train_loss": -6.811129093170166, "global_step": 170182, "epoch": 4051} {"train_loss": -6.98622499193464, "global_step": 170183, "epoch": 4051, "val_loss": 68864.7421875} {"train_loss": -6.95156192779541, "global_step": 170184, "epoch": 4052} {"train_loss": -6.922459602355957, "global_step": 170185, "epoch": 4052} {"train_loss": -6.934364318847656, "global_step": 170186, "epoch": 4052} {"train_loss": -6.963917255401611, "global_step": 170187, "epoch": 4052} {"train_loss": -7.026557922363281, "global_step": 170188, "epoch": 4052} {"train_loss": -6.9862589836120605, "global_step": 170189, "epoch": 4052} {"train_loss": -7.0689191818237305, "global_step": 170190, "epoch": 4052} {"train_loss": -6.88638973236084, "global_step": 170191, "epoch": 4052} {"train_loss": -6.9430341720581055, "global_step": 170192, "epoch": 4052} {"train_loss": -6.962287425994873, "global_step": 170193, "epoch": 4052} {"train_loss": -6.8765058517456055, "global_step": 170194, "epoch": 4052} {"train_loss": -6.949762344360352, "global_step": 170195, "epoch": 4052} {"train_loss": -6.878823280334473, "global_step": 170196, "epoch": 4052} {"train_loss": -6.950556755065918, "global_step": 170197, "epoch": 4052} {"train_loss": -6.9447832107543945, "global_step": 170198, "epoch": 4052} {"train_loss": -6.893919944763184, "global_step": 170199, "epoch": 4052} {"train_loss": -6.931457042694092, "global_step": 170200, "epoch": 4052} {"train_loss": -6.99014949798584, "global_step": 170201, "epoch": 4052} {"train_loss": -6.968661785125732, "global_step": 170202, "epoch": 4052} {"train_loss": -7.005533695220947, "global_step": 170203, "epoch": 4052} {"train_loss": -6.972657680511475, "global_step": 170204, "epoch": 4052} {"train_loss": -6.887159824371338, "global_step": 170205, "epoch": 4052} {"train_loss": -7.011343002319336, "global_step": 170206, "epoch": 4052} {"train_loss": -7.086237907409668, "global_step": 170207, "epoch": 4052} {"train_loss": -6.987766742706299, "global_step": 170208, "epoch": 4052} {"train_loss": -7.014320373535156, "global_step": 170209, "epoch": 4052} {"train_loss": -7.078819274902344, "global_step": 170210, "epoch": 4052} {"train_loss": -7.112824440002441, "global_step": 170211, "epoch": 4052} {"train_loss": -7.0055999755859375, "global_step": 170212, "epoch": 4052} {"train_loss": -7.042344093322754, "global_step": 170213, "epoch": 4052} {"train_loss": -7.063462257385254, "global_step": 170214, "epoch": 4052} {"train_loss": -7.014801979064941, "global_step": 170215, "epoch": 4052} {"train_loss": -7.057727813720703, "global_step": 170216, "epoch": 4052} {"train_loss": -6.956963539123535, "global_step": 170217, "epoch": 4052} {"train_loss": -7.028015613555908, "global_step": 170218, "epoch": 4052} {"train_loss": -6.867804050445557, "global_step": 170219, "epoch": 4052} {"train_loss": -7.123638153076172, "global_step": 170220, "epoch": 4052} {"train_loss": -7.055121898651123, "global_step": 170221, "epoch": 4052} {"train_loss": -6.977026462554932, "global_step": 170222, "epoch": 4052} {"train_loss": -7.112958908081055, "global_step": 170223, "epoch": 4052} {"train_loss": -6.983474254608154, "global_step": 170224, "epoch": 4052} {"train_loss": -6.990040790467035, "global_step": 170225, "epoch": 4052, "val_loss": 68974.375} {"train_loss": -7.026378631591797, "global_step": 170226, "epoch": 4053} {"train_loss": -7.104196548461914, "global_step": 170227, "epoch": 4053} {"train_loss": -7.058615207672119, "global_step": 170228, "epoch": 4053} {"train_loss": -6.8595476150512695, "global_step": 170229, "epoch": 4053} {"train_loss": -7.051487445831299, "global_step": 170230, "epoch": 4053} {"train_loss": -6.956532001495361, "global_step": 170231, "epoch": 4053} {"train_loss": -7.02030086517334, "global_step": 170232, "epoch": 4053} {"train_loss": -6.982832908630371, "global_step": 170233, "epoch": 4053} {"train_loss": -6.91628885269165, "global_step": 170234, "epoch": 4053} {"train_loss": -6.927717685699463, "global_step": 170235, "epoch": 4053} {"train_loss": -6.9542646408081055, "global_step": 170236, "epoch": 4053} {"train_loss": -6.921429634094238, "global_step": 170237, "epoch": 4053} {"train_loss": -6.962724208831787, "global_step": 170238, "epoch": 4053} {"train_loss": -6.890071392059326, "global_step": 170239, "epoch": 4053} {"train_loss": -7.083120822906494, "global_step": 170240, "epoch": 4053} {"train_loss": -6.972674369812012, "global_step": 170241, "epoch": 4053} {"train_loss": -6.9050469398498535, "global_step": 170242, "epoch": 4053} {"train_loss": -6.972043514251709, "global_step": 170243, "epoch": 4053} {"train_loss": -6.93220329284668, "global_step": 170244, "epoch": 4053} {"train_loss": -6.963006973266602, "global_step": 170245, "epoch": 4053} {"train_loss": -7.057424545288086, "global_step": 170246, "epoch": 4053} {"train_loss": -6.892971992492676, "global_step": 170247, "epoch": 4053} {"train_loss": -7.041825294494629, "global_step": 170248, "epoch": 4053} {"train_loss": -7.012672424316406, "global_step": 170249, "epoch": 4053} {"train_loss": -6.959411144256592, "global_step": 170250, "epoch": 4053} {"train_loss": -7.073200702667236, "global_step": 170251, "epoch": 4053} {"train_loss": -6.967987060546875, "global_step": 170252, "epoch": 4053} {"train_loss": -7.0015974044799805, "global_step": 170253, "epoch": 4053} {"train_loss": -7.08101749420166, "global_step": 170254, "epoch": 4053} {"train_loss": -6.957581520080566, "global_step": 170255, "epoch": 4053} {"train_loss": -6.948918342590332, "global_step": 170256, "epoch": 4053} {"train_loss": -7.006326675415039, "global_step": 170257, "epoch": 4053} {"train_loss": -7.019272804260254, "global_step": 170258, "epoch": 4053} {"train_loss": -6.904168128967285, "global_step": 170259, "epoch": 4053} {"train_loss": -7.032999038696289, "global_step": 170260, "epoch": 4053} {"train_loss": -6.9505615234375, "global_step": 170261, "epoch": 4053} {"train_loss": -7.099880218505859, "global_step": 170262, "epoch": 4053} {"train_loss": -6.82521915435791, "global_step": 170263, "epoch": 4053} {"train_loss": -6.78472375869751, "global_step": 170264, "epoch": 4053} {"train_loss": -7.0176801681518555, "global_step": 170265, "epoch": 4053} {"train_loss": -6.820803642272949, "global_step": 170266, "epoch": 4053} {"train_loss": -6.976342655363537, "global_step": 170267, "epoch": 4053, "val_loss": 69301.484375} {"train_loss": -6.8731303215026855, "global_step": 170268, "epoch": 4054} {"train_loss": -6.978277206420898, "global_step": 170269, "epoch": 4054} {"train_loss": -6.801212787628174, "global_step": 170270, "epoch": 4054} {"train_loss": -7.00291109085083, "global_step": 170271, "epoch": 4054} {"train_loss": -6.856849670410156, "global_step": 170272, "epoch": 4054} {"train_loss": -6.905341148376465, "global_step": 170273, "epoch": 4054} {"train_loss": -7.027472496032715, "global_step": 170274, "epoch": 4054} {"train_loss": -6.994813919067383, "global_step": 170275, "epoch": 4054} {"train_loss": -6.946788787841797, "global_step": 170276, "epoch": 4054} {"train_loss": -6.974592208862305, "global_step": 170277, "epoch": 4054} {"train_loss": -6.910060882568359, "global_step": 170278, "epoch": 4054} {"train_loss": -6.995396614074707, "global_step": 170279, "epoch": 4054} {"train_loss": -7.050534248352051, "global_step": 170280, "epoch": 4054} {"train_loss": -7.082785129547119, "global_step": 170281, "epoch": 4054} {"train_loss": -6.945248603820801, "global_step": 170282, "epoch": 4054} {"train_loss": -6.9805192947387695, "global_step": 170283, "epoch": 4054} {"train_loss": -7.095667362213135, "global_step": 170284, "epoch": 4054} {"train_loss": -6.969152450561523, "global_step": 170285, "epoch": 4054} {"train_loss": -7.07530403137207, "global_step": 170286, "epoch": 4054} {"train_loss": -6.960904121398926, "global_step": 170287, "epoch": 4054} {"train_loss": -7.0316267013549805, "global_step": 170288, "epoch": 4054} {"train_loss": -7.0478386878967285, "global_step": 170289, "epoch": 4054} {"train_loss": -7.021746635437012, "global_step": 170290, "epoch": 4054} {"train_loss": -7.048225402832031, "global_step": 170291, "epoch": 4054} {"train_loss": -7.089694499969482, "global_step": 170292, "epoch": 4054} {"train_loss": -7.024311065673828, "global_step": 170293, "epoch": 4054} {"train_loss": -7.003998756408691, "global_step": 170294, "epoch": 4054} {"train_loss": -7.09589147567749, "global_step": 170295, "epoch": 4054} {"train_loss": -7.017196178436279, "global_step": 170296, "epoch": 4054} {"train_loss": -7.061157703399658, "global_step": 170297, "epoch": 4054} {"train_loss": -6.974466323852539, "global_step": 170298, "epoch": 4054} {"train_loss": -7.034460067749023, "global_step": 170299, "epoch": 4054} {"train_loss": -7.036186218261719, "global_step": 170300, "epoch": 4054} {"train_loss": -7.050384521484375, "global_step": 170301, "epoch": 4054} {"train_loss": -7.044904708862305, "global_step": 170302, "epoch": 4054} {"train_loss": -7.010427951812744, "global_step": 170303, "epoch": 4054} {"train_loss": -7.092680931091309, "global_step": 170304, "epoch": 4054} {"train_loss": -7.099822998046875, "global_step": 170305, "epoch": 4054} {"train_loss": -7.003452777862549, "global_step": 170306, "epoch": 4054} {"train_loss": -7.086198329925537, "global_step": 170307, "epoch": 4054} {"train_loss": -7.033555507659912, "global_step": 170308, "epoch": 4054} {"train_loss": -7.0099362305232455, "global_step": 170309, "epoch": 4054, "val_loss": 68912.5390625} {"train_loss": -7.084540367126465, "global_step": 170310, "epoch": 4055} {"train_loss": -7.121529579162598, "global_step": 170311, "epoch": 4055} {"train_loss": -7.157015800476074, "global_step": 170312, "epoch": 4055} {"train_loss": -7.108368873596191, "global_step": 170313, "epoch": 4055} {"train_loss": -7.03272008895874, "global_step": 170314, "epoch": 4055} {"train_loss": -7.105127334594727, "global_step": 170315, "epoch": 4055} {"train_loss": -7.032559394836426, "global_step": 170316, "epoch": 4055} {"train_loss": -7.074276924133301, "global_step": 170317, "epoch": 4055} {"train_loss": -6.999820709228516, "global_step": 170318, "epoch": 4055} {"train_loss": -6.999479293823242, "global_step": 170319, "epoch": 4055} {"train_loss": -6.9570465087890625, "global_step": 170320, "epoch": 4055} {"train_loss": -7.2134904861450195, "global_step": 170321, "epoch": 4055} {"train_loss": -7.107295036315918, "global_step": 170322, "epoch": 4055} {"train_loss": -7.111160755157471, "global_step": 170323, "epoch": 4055} {"train_loss": -7.071347236633301, "global_step": 170324, "epoch": 4055} {"train_loss": -7.066537857055664, "global_step": 170325, "epoch": 4055} {"train_loss": -6.982423305511475, "global_step": 170326, "epoch": 4055} {"train_loss": -7.074085712432861, "global_step": 170327, "epoch": 4055} {"train_loss": -7.076389312744141, "global_step": 170328, "epoch": 4055} {"train_loss": -7.016478538513184, "global_step": 170329, "epoch": 4055} {"train_loss": -7.06381368637085, "global_step": 170330, "epoch": 4055} {"train_loss": -7.044217109680176, "global_step": 170331, "epoch": 4055} {"train_loss": -7.115597724914551, "global_step": 170332, "epoch": 4055} {"train_loss": -7.062862396240234, "global_step": 170333, "epoch": 4055} {"train_loss": -7.185517311096191, "global_step": 170334, "epoch": 4055} {"train_loss": -7.023687362670898, "global_step": 170335, "epoch": 4055} {"train_loss": -7.098264217376709, "global_step": 170336, "epoch": 4055} {"train_loss": -7.077201843261719, "global_step": 170337, "epoch": 4055} {"train_loss": -7.1152801513671875, "global_step": 170338, "epoch": 4055} {"train_loss": -7.188882350921631, "global_step": 170339, "epoch": 4055} {"train_loss": -7.093132019042969, "global_step": 170340, "epoch": 4055} {"train_loss": -7.134920120239258, "global_step": 170341, "epoch": 4055} {"train_loss": -7.074236869812012, "global_step": 170342, "epoch": 4055} {"train_loss": -7.040445327758789, "global_step": 170343, "epoch": 4055} {"train_loss": -7.098466396331787, "global_step": 170344, "epoch": 4055} {"train_loss": -7.013730049133301, "global_step": 170345, "epoch": 4055} {"train_loss": -7.052445888519287, "global_step": 170346, "epoch": 4055} {"train_loss": -7.147249221801758, "global_step": 170347, "epoch": 4055} {"train_loss": -7.201817989349365, "global_step": 170348, "epoch": 4055} {"train_loss": -7.1402058601379395, "global_step": 170349, "epoch": 4055} {"train_loss": -7.127115249633789, "global_step": 170350, "epoch": 4055} {"train_loss": -7.0848852679842995, "global_step": 170351, "epoch": 4055, "val_loss": 68895.890625} {"train_loss": -7.093047142028809, "global_step": 170352, "epoch": 4056} {"train_loss": -7.090070724487305, "global_step": 170353, "epoch": 4056} {"train_loss": -7.093769550323486, "global_step": 170354, "epoch": 4056} {"train_loss": -6.975205421447754, "global_step": 170355, "epoch": 4056} {"train_loss": -7.287812232971191, "global_step": 170356, "epoch": 4056} {"train_loss": -7.0863494873046875, "global_step": 170357, "epoch": 4056} {"train_loss": -7.164510726928711, "global_step": 170358, "epoch": 4056} {"train_loss": -7.029444694519043, "global_step": 170359, "epoch": 4056} {"train_loss": -7.045714378356934, "global_step": 170360, "epoch": 4056} {"train_loss": -7.195329189300537, "global_step": 170361, "epoch": 4056} {"train_loss": -6.976309299468994, "global_step": 170362, "epoch": 4056} {"train_loss": -7.077421188354492, "global_step": 170363, "epoch": 4056} {"train_loss": -7.088044166564941, "global_step": 170364, "epoch": 4056} {"train_loss": -7.154117584228516, "global_step": 170365, "epoch": 4056} {"train_loss": -7.182136535644531, "global_step": 170366, "epoch": 4056} {"train_loss": -7.073925018310547, "global_step": 170367, "epoch": 4056} {"train_loss": -7.049768447875977, "global_step": 170368, "epoch": 4056} {"train_loss": -7.177652359008789, "global_step": 170369, "epoch": 4056} {"train_loss": -7.001816749572754, "global_step": 170370, "epoch": 4056} {"train_loss": -7.123812675476074, "global_step": 170371, "epoch": 4056} {"train_loss": -7.149097919464111, "global_step": 170372, "epoch": 4056} {"train_loss": -7.046513557434082, "global_step": 170373, "epoch": 4056} {"train_loss": -7.125326156616211, "global_step": 170374, "epoch": 4056} {"train_loss": -7.0170207023620605, "global_step": 170375, "epoch": 4056} {"train_loss": -7.077175140380859, "global_step": 170376, "epoch": 4056} {"train_loss": -7.152538299560547, "global_step": 170377, "epoch": 4056} {"train_loss": -7.018937110900879, "global_step": 170378, "epoch": 4056} {"train_loss": -6.966732501983643, "global_step": 170379, "epoch": 4056} {"train_loss": -7.047275543212891, "global_step": 170380, "epoch": 4056} {"train_loss": -7.159771919250488, "global_step": 170381, "epoch": 4056} {"train_loss": -7.141172409057617, "global_step": 170382, "epoch": 4056} {"train_loss": -7.17106294631958, "global_step": 170383, "epoch": 4056} {"train_loss": -7.0293731689453125, "global_step": 170384, "epoch": 4056} {"train_loss": -6.974011421203613, "global_step": 170385, "epoch": 4056} {"train_loss": -7.101581573486328, "global_step": 170386, "epoch": 4056} {"train_loss": -7.179289817810059, "global_step": 170387, "epoch": 4056} {"train_loss": -7.213084697723389, "global_step": 170388, "epoch": 4056} {"train_loss": -7.107766151428223, "global_step": 170389, "epoch": 4056} {"train_loss": -7.097017765045166, "global_step": 170390, "epoch": 4056} {"train_loss": -7.015748023986816, "global_step": 170391, "epoch": 4056} {"train_loss": -7.051477432250977, "global_step": 170392, "epoch": 4056} {"train_loss": -7.094705808730352, "global_step": 170393, "epoch": 4056, "val_loss": 68934.015625} {"train_loss": -6.979622840881348, "global_step": 170394, "epoch": 4057} {"train_loss": -7.024722099304199, "global_step": 170395, "epoch": 4057} {"train_loss": -7.153946876525879, "global_step": 170396, "epoch": 4057} {"train_loss": -6.8322038650512695, "global_step": 170397, "epoch": 4057} {"train_loss": -6.923740863800049, "global_step": 170398, "epoch": 4057} {"train_loss": -7.00568151473999, "global_step": 170399, "epoch": 4057} {"train_loss": -7.037469863891602, "global_step": 170400, "epoch": 4057} {"train_loss": -6.920976161956787, "global_step": 170401, "epoch": 4057} {"train_loss": -6.936089515686035, "global_step": 170402, "epoch": 4057} {"train_loss": -6.913234710693359, "global_step": 170403, "epoch": 4057} {"train_loss": -6.957578659057617, "global_step": 170404, "epoch": 4057} {"train_loss": -7.074653148651123, "global_step": 170405, "epoch": 4057} {"train_loss": -6.881842136383057, "global_step": 170406, "epoch": 4057} {"train_loss": -7.081335544586182, "global_step": 170407, "epoch": 4057} {"train_loss": -7.034024238586426, "global_step": 170408, "epoch": 4057} {"train_loss": -6.786933422088623, "global_step": 170409, "epoch": 4057} {"train_loss": -7.045567035675049, "global_step": 170410, "epoch": 4057} {"train_loss": -6.965670585632324, "global_step": 170411, "epoch": 4057} {"train_loss": -6.906765460968018, "global_step": 170412, "epoch": 4057} {"train_loss": -6.957130432128906, "global_step": 170413, "epoch": 4057} {"train_loss": -6.982744216918945, "global_step": 170414, "epoch": 4057} {"train_loss": -7.008608818054199, "global_step": 170415, "epoch": 4057} {"train_loss": -6.960212707519531, "global_step": 170416, "epoch": 4057} {"train_loss": -6.936442852020264, "global_step": 170417, "epoch": 4057} {"train_loss": -6.90172815322876, "global_step": 170418, "epoch": 4057} {"train_loss": -6.968034267425537, "global_step": 170419, "epoch": 4057} {"train_loss": -6.9875664710998535, "global_step": 170420, "epoch": 4057} {"train_loss": -6.989503860473633, "global_step": 170421, "epoch": 4057} {"train_loss": -6.911155700683594, "global_step": 170422, "epoch": 4057} {"train_loss": -6.924431800842285, "global_step": 170423, "epoch": 4057} {"train_loss": -7.020312309265137, "global_step": 170424, "epoch": 4057} {"train_loss": -7.045588970184326, "global_step": 170425, "epoch": 4057} {"train_loss": -7.015965461730957, "global_step": 170426, "epoch": 4057} {"train_loss": -7.0968241691589355, "global_step": 170427, "epoch": 4057} {"train_loss": -6.955719470977783, "global_step": 170428, "epoch": 4057} {"train_loss": -7.030987739562988, "global_step": 170429, "epoch": 4057} {"train_loss": -7.042431831359863, "global_step": 170430, "epoch": 4057} {"train_loss": -7.0699310302734375, "global_step": 170431, "epoch": 4057} {"train_loss": -7.049155235290527, "global_step": 170432, "epoch": 4057} {"train_loss": -7.097902297973633, "global_step": 170433, "epoch": 4057} {"train_loss": -7.075484275817871, "global_step": 170434, "epoch": 4057} {"train_loss": -6.988752331052508, "global_step": 170435, "epoch": 4057, "val_loss": 69080.1640625} {"train_loss": -7.008462905883789, "global_step": 170436, "epoch": 4058} {"train_loss": -7.111003398895264, "global_step": 170437, "epoch": 4058} {"train_loss": -7.0355024337768555, "global_step": 170438, "epoch": 4058} {"train_loss": -7.095824241638184, "global_step": 170439, "epoch": 4058} {"train_loss": -6.970102310180664, "global_step": 170440, "epoch": 4058} {"train_loss": -6.93599796295166, "global_step": 170441, "epoch": 4058} {"train_loss": -6.9914984703063965, "global_step": 170442, "epoch": 4058} {"train_loss": -7.038870811462402, "global_step": 170443, "epoch": 4058} {"train_loss": -7.064431667327881, "global_step": 170444, "epoch": 4058} {"train_loss": -7.0370049476623535, "global_step": 170445, "epoch": 4058} {"train_loss": -7.012560844421387, "global_step": 170446, "epoch": 4058} {"train_loss": -7.029907703399658, "global_step": 170447, "epoch": 4058} {"train_loss": -7.174868583679199, "global_step": 170448, "epoch": 4058} {"train_loss": -7.060695648193359, "global_step": 170449, "epoch": 4058} {"train_loss": -6.962925434112549, "global_step": 170450, "epoch": 4058} {"train_loss": -7.015037536621094, "global_step": 170451, "epoch": 4058} {"train_loss": -7.0530242919921875, "global_step": 170452, "epoch": 4058} {"train_loss": -7.089941024780273, "global_step": 170453, "epoch": 4058} {"train_loss": -6.993096351623535, "global_step": 170454, "epoch": 4058} {"train_loss": -6.966043472290039, "global_step": 170455, "epoch": 4058} {"train_loss": -7.210745811462402, "global_step": 170456, "epoch": 4058} {"train_loss": -6.961479187011719, "global_step": 170457, "epoch": 4058} {"train_loss": -7.001999855041504, "global_step": 170458, "epoch": 4058} {"train_loss": -7.01250696182251, "global_step": 170459, "epoch": 4058} {"train_loss": -6.940253257751465, "global_step": 170460, "epoch": 4058} {"train_loss": -7.038507461547852, "global_step": 170461, "epoch": 4058} {"train_loss": -7.0710906982421875, "global_step": 170462, "epoch": 4058} {"train_loss": -7.0640668869018555, "global_step": 170463, "epoch": 4058} {"train_loss": -7.106620788574219, "global_step": 170464, "epoch": 4058} {"train_loss": -6.971583366394043, "global_step": 170465, "epoch": 4058} {"train_loss": -6.921797752380371, "global_step": 170466, "epoch": 4058} {"train_loss": -7.089944362640381, "global_step": 170467, "epoch": 4058} {"train_loss": -6.993340492248535, "global_step": 170468, "epoch": 4058} {"train_loss": -7.007807731628418, "global_step": 170469, "epoch": 4058} {"train_loss": -7.070504188537598, "global_step": 170470, "epoch": 4058} {"train_loss": -7.087468147277832, "global_step": 170471, "epoch": 4058} {"train_loss": -7.042201042175293, "global_step": 170472, "epoch": 4058} {"train_loss": -7.072427272796631, "global_step": 170473, "epoch": 4058} {"train_loss": -7.089375019073486, "global_step": 170474, "epoch": 4058} {"train_loss": -7.147765159606934, "global_step": 170475, "epoch": 4058} {"train_loss": -6.993004322052002, "global_step": 170476, "epoch": 4058} {"train_loss": -7.03636984598069, "global_step": 170477, "epoch": 4058, "val_loss": 68974.875} {"train_loss": -7.115769386291504, "global_step": 170478, "epoch": 4059} {"train_loss": -7.055041313171387, "global_step": 170479, "epoch": 4059} {"train_loss": -7.190605163574219, "global_step": 170480, "epoch": 4059} {"train_loss": -7.16385555267334, "global_step": 170481, "epoch": 4059} {"train_loss": -7.022826194763184, "global_step": 170482, "epoch": 4059} {"train_loss": -7.108498573303223, "global_step": 170483, "epoch": 4059} {"train_loss": -7.142963886260986, "global_step": 170484, "epoch": 4059} {"train_loss": -7.091697692871094, "global_step": 170485, "epoch": 4059} {"train_loss": -7.159799575805664, "global_step": 170486, "epoch": 4059} {"train_loss": -7.099889278411865, "global_step": 170487, "epoch": 4059} {"train_loss": -7.042413234710693, "global_step": 170488, "epoch": 4059} {"train_loss": -7.171072006225586, "global_step": 170489, "epoch": 4059} {"train_loss": -7.044206619262695, "global_step": 170490, "epoch": 4059} {"train_loss": -7.208532333374023, "global_step": 170491, "epoch": 4059} {"train_loss": -7.0551652908325195, "global_step": 170492, "epoch": 4059} {"train_loss": -7.076532363891602, "global_step": 170493, "epoch": 4059} {"train_loss": -7.090428352355957, "global_step": 170494, "epoch": 4059} {"train_loss": -7.234626770019531, "global_step": 170495, "epoch": 4059} {"train_loss": -7.123600959777832, "global_step": 170496, "epoch": 4059} {"train_loss": -7.06276798248291, "global_step": 170497, "epoch": 4059} {"train_loss": -7.098479747772217, "global_step": 170498, "epoch": 4059} {"train_loss": -7.151129722595215, "global_step": 170499, "epoch": 4059} {"train_loss": -7.090325832366943, "global_step": 170500, "epoch": 4059} {"train_loss": -7.137423992156982, "global_step": 170501, "epoch": 4059} {"train_loss": -7.141073226928711, "global_step": 170502, "epoch": 4059} {"train_loss": -7.170028209686279, "global_step": 170503, "epoch": 4059} {"train_loss": -7.031594276428223, "global_step": 170504, "epoch": 4059} {"train_loss": -7.06920051574707, "global_step": 170505, "epoch": 4059} {"train_loss": -7.056053161621094, "global_step": 170506, "epoch": 4059} {"train_loss": -7.079010963439941, "global_step": 170507, "epoch": 4059} {"train_loss": -6.931311130523682, "global_step": 170508, "epoch": 4059} {"train_loss": -7.078765869140625, "global_step": 170509, "epoch": 4059} {"train_loss": -6.992432594299316, "global_step": 170510, "epoch": 4059} {"train_loss": -7.027838706970215, "global_step": 170511, "epoch": 4059} {"train_loss": -7.048334121704102, "global_step": 170512, "epoch": 4059} {"train_loss": -7.103268623352051, "global_step": 170513, "epoch": 4059} {"train_loss": -6.912372589111328, "global_step": 170514, "epoch": 4059} {"train_loss": -7.02030086517334, "global_step": 170515, "epoch": 4059} {"train_loss": -7.069642066955566, "global_step": 170516, "epoch": 4059} {"train_loss": -6.994229793548584, "global_step": 170517, "epoch": 4059} {"train_loss": -7.0266876220703125, "global_step": 170518, "epoch": 4059} {"train_loss": -7.084370772043864, "global_step": 170519, "epoch": 4059, "val_loss": 69076.15625} {"train_loss": -7.0375895500183105, "global_step": 170520, "epoch": 4060} {"train_loss": -7.003926753997803, "global_step": 170521, "epoch": 4060} {"train_loss": -7.076937198638916, "global_step": 170522, "epoch": 4060} {"train_loss": -6.937307357788086, "global_step": 170523, "epoch": 4060} {"train_loss": -7.063067436218262, "global_step": 170524, "epoch": 4060} {"train_loss": -6.943987846374512, "global_step": 170525, "epoch": 4060} {"train_loss": -6.996092796325684, "global_step": 170526, "epoch": 4060} {"train_loss": -7.0800676345825195, "global_step": 170527, "epoch": 4060} {"train_loss": -7.021389007568359, "global_step": 170528, "epoch": 4060} {"train_loss": -7.078126907348633, "global_step": 170529, "epoch": 4060} {"train_loss": -6.962253570556641, "global_step": 170530, "epoch": 4060} {"train_loss": -7.1761674880981445, "global_step": 170531, "epoch": 4060} {"train_loss": -7.06897497177124, "global_step": 170532, "epoch": 4060} {"train_loss": -7.017782211303711, "global_step": 170533, "epoch": 4060} {"train_loss": -7.140202522277832, "global_step": 170534, "epoch": 4060} {"train_loss": -7.037435531616211, "global_step": 170535, "epoch": 4060} {"train_loss": -7.042369842529297, "global_step": 170536, "epoch": 4060} {"train_loss": -7.06733512878418, "global_step": 170537, "epoch": 4060} {"train_loss": -6.960270404815674, "global_step": 170538, "epoch": 4060} {"train_loss": -7.109618186950684, "global_step": 170539, "epoch": 4060} {"train_loss": -7.021548271179199, "global_step": 170540, "epoch": 4060} {"train_loss": -7.021968841552734, "global_step": 170541, "epoch": 4060} {"train_loss": -7.018130302429199, "global_step": 170542, "epoch": 4060} {"train_loss": -7.118735313415527, "global_step": 170543, "epoch": 4060} {"train_loss": -6.8979692459106445, "global_step": 170544, "epoch": 4060} {"train_loss": -7.090672492980957, "global_step": 170545, "epoch": 4060} {"train_loss": -6.991813659667969, "global_step": 170546, "epoch": 4060} {"train_loss": -6.909574508666992, "global_step": 170547, "epoch": 4060} {"train_loss": -7.121781349182129, "global_step": 170548, "epoch": 4060} {"train_loss": -7.085972785949707, "global_step": 170549, "epoch": 4060} {"train_loss": -7.093718528747559, "global_step": 170550, "epoch": 4060} {"train_loss": -7.044710636138916, "global_step": 170551, "epoch": 4060} {"train_loss": -7.031223773956299, "global_step": 170552, "epoch": 4060} {"train_loss": -6.966477870941162, "global_step": 170553, "epoch": 4060} {"train_loss": -7.05903434753418, "global_step": 170554, "epoch": 4060} {"train_loss": -6.9390482902526855, "global_step": 170555, "epoch": 4060} {"train_loss": -7.08554744720459, "global_step": 170556, "epoch": 4060} {"train_loss": -7.084397315979004, "global_step": 170557, "epoch": 4060} {"train_loss": -6.897737503051758, "global_step": 170558, "epoch": 4060} {"train_loss": -7.007634162902832, "global_step": 170559, "epoch": 4060} {"train_loss": -7.056458473205566, "global_step": 170560, "epoch": 4060} {"train_loss": -7.030897208622524, "global_step": 170561, "epoch": 4060, "val_loss": 68871.546875} {"train_loss": -7.043150424957275, "global_step": 170562, "epoch": 4061} {"train_loss": -6.9134721755981445, "global_step": 170563, "epoch": 4061} {"train_loss": -6.934300899505615, "global_step": 170564, "epoch": 4061} {"train_loss": -6.954616069793701, "global_step": 170565, "epoch": 4061} {"train_loss": -7.085409641265869, "global_step": 170566, "epoch": 4061} {"train_loss": -6.999205589294434, "global_step": 170567, "epoch": 4061} {"train_loss": -7.126152038574219, "global_step": 170568, "epoch": 4061} {"train_loss": -7.059133052825928, "global_step": 170569, "epoch": 4061} {"train_loss": -7.0755615234375, "global_step": 170570, "epoch": 4061} {"train_loss": -7.1018877029418945, "global_step": 170571, "epoch": 4061} {"train_loss": -7.139858245849609, "global_step": 170572, "epoch": 4061} {"train_loss": -7.0331339836120605, "global_step": 170573, "epoch": 4061} {"train_loss": -6.994465351104736, "global_step": 170574, "epoch": 4061} {"train_loss": -7.103828430175781, "global_step": 170575, "epoch": 4061} {"train_loss": -7.041081428527832, "global_step": 170576, "epoch": 4061} {"train_loss": -6.968530654907227, "global_step": 170577, "epoch": 4061} {"train_loss": -7.10603141784668, "global_step": 170578, "epoch": 4061} {"train_loss": -7.028229713439941, "global_step": 170579, "epoch": 4061} {"train_loss": -7.093194007873535, "global_step": 170580, "epoch": 4061} {"train_loss": -6.9178619384765625, "global_step": 170581, "epoch": 4061} {"train_loss": -6.910308837890625, "global_step": 170582, "epoch": 4061} {"train_loss": -7.061947822570801, "global_step": 170583, "epoch": 4061} {"train_loss": -6.9922990798950195, "global_step": 170584, "epoch": 4061} {"train_loss": -6.947024345397949, "global_step": 170585, "epoch": 4061} {"train_loss": -6.902312755584717, "global_step": 170586, "epoch": 4061} {"train_loss": -7.005313396453857, "global_step": 170587, "epoch": 4061} {"train_loss": -6.943247318267822, "global_step": 170588, "epoch": 4061} {"train_loss": -7.007041931152344, "global_step": 170589, "epoch": 4061} {"train_loss": -7.042798042297363, "global_step": 170590, "epoch": 4061} {"train_loss": -6.889630317687988, "global_step": 170591, "epoch": 4061} {"train_loss": -7.025022029876709, "global_step": 170592, "epoch": 4061} {"train_loss": -7.0477070808410645, "global_step": 170593, "epoch": 4061} {"train_loss": -7.046257495880127, "global_step": 170594, "epoch": 4061} {"train_loss": -7.059515476226807, "global_step": 170595, "epoch": 4061} {"train_loss": -6.933404445648193, "global_step": 170596, "epoch": 4061} {"train_loss": -6.946221351623535, "global_step": 170597, "epoch": 4061} {"train_loss": -6.964134693145752, "global_step": 170598, "epoch": 4061} {"train_loss": -7.056639671325684, "global_step": 170599, "epoch": 4061} {"train_loss": -6.985012531280518, "global_step": 170600, "epoch": 4061} {"train_loss": -7.023285865783691, "global_step": 170601, "epoch": 4061} {"train_loss": -7.022708892822266, "global_step": 170602, "epoch": 4061} {"train_loss": -7.014367126283192, "global_step": 170603, "epoch": 4061, "val_loss": 69110.515625} {"train_loss": -7.166316509246826, "global_step": 170604, "epoch": 4062} {"train_loss": -7.135280609130859, "global_step": 170605, "epoch": 4062} {"train_loss": -7.118503570556641, "global_step": 170606, "epoch": 4062} {"train_loss": -6.985744953155518, "global_step": 170607, "epoch": 4062} {"train_loss": -7.233593940734863, "global_step": 170608, "epoch": 4062} {"train_loss": -7.097051620483398, "global_step": 170609, "epoch": 4062} {"train_loss": -7.130251884460449, "global_step": 170610, "epoch": 4062} {"train_loss": -7.014540195465088, "global_step": 170611, "epoch": 4062} {"train_loss": -7.03783655166626, "global_step": 170612, "epoch": 4062} {"train_loss": -7.0872955322265625, "global_step": 170613, "epoch": 4062} {"train_loss": -7.0708770751953125, "global_step": 170614, "epoch": 4062} {"train_loss": -6.971596717834473, "global_step": 170615, "epoch": 4062} {"train_loss": -7.113833427429199, "global_step": 170616, "epoch": 4062} {"train_loss": -6.9318718910217285, "global_step": 170617, "epoch": 4062} {"train_loss": -6.982926368713379, "global_step": 170618, "epoch": 4062} {"train_loss": -7.000070571899414, "global_step": 170619, "epoch": 4062} {"train_loss": -7.023850440979004, "global_step": 170620, "epoch": 4062} {"train_loss": -7.03580904006958, "global_step": 170621, "epoch": 4062} {"train_loss": -7.08397102355957, "global_step": 170622, "epoch": 4062} {"train_loss": -6.8821306228637695, "global_step": 170623, "epoch": 4062} {"train_loss": -7.099546909332275, "global_step": 170624, "epoch": 4062} {"train_loss": -7.088403701782227, "global_step": 170625, "epoch": 4062} {"train_loss": -7.015379428863525, "global_step": 170626, "epoch": 4062} {"train_loss": -6.942980766296387, "global_step": 170627, "epoch": 4062} {"train_loss": -6.956521987915039, "global_step": 170628, "epoch": 4062} {"train_loss": -6.945066928863525, "global_step": 170629, "epoch": 4062} {"train_loss": -6.730375289916992, "global_step": 170630, "epoch": 4062} {"train_loss": -7.014032363891602, "global_step": 170631, "epoch": 4062} {"train_loss": -7.063170433044434, "global_step": 170632, "epoch": 4062} {"train_loss": -7.016994476318359, "global_step": 170633, "epoch": 4062} {"train_loss": -6.9928131103515625, "global_step": 170634, "epoch": 4062} {"train_loss": -7.011497974395752, "global_step": 170635, "epoch": 4062} {"train_loss": -6.915585517883301, "global_step": 170636, "epoch": 4062} {"train_loss": -6.993346214294434, "global_step": 170637, "epoch": 4062} {"train_loss": -7.015835285186768, "global_step": 170638, "epoch": 4062} {"train_loss": -6.945829391479492, "global_step": 170639, "epoch": 4062} {"train_loss": -6.8454670906066895, "global_step": 170640, "epoch": 4062} {"train_loss": -6.899379730224609, "global_step": 170641, "epoch": 4062} {"train_loss": -6.940881729125977, "global_step": 170642, "epoch": 4062} {"train_loss": -7.078860282897949, "global_step": 170643, "epoch": 4062} {"train_loss": -6.953823566436768, "global_step": 170644, "epoch": 4062} {"train_loss": -7.013282639639718, "global_step": 170645, "epoch": 4062, "val_loss": 68925.34375} {"train_loss": -7.059854507446289, "global_step": 170646, "epoch": 4063} {"train_loss": -6.899152755737305, "global_step": 170647, "epoch": 4063} {"train_loss": -7.044086456298828, "global_step": 170648, "epoch": 4063} {"train_loss": -7.027020454406738, "global_step": 170649, "epoch": 4063} {"train_loss": -7.037256240844727, "global_step": 170650, "epoch": 4063} {"train_loss": -6.87286901473999, "global_step": 170651, "epoch": 4063} {"train_loss": -7.018681049346924, "global_step": 170652, "epoch": 4063} {"train_loss": -7.0686798095703125, "global_step": 170653, "epoch": 4063} {"train_loss": -7.012066841125488, "global_step": 170654, "epoch": 4063} {"train_loss": -7.017311096191406, "global_step": 170655, "epoch": 4063} {"train_loss": -7.072015762329102, "global_step": 170656, "epoch": 4063} {"train_loss": -7.076026439666748, "global_step": 170657, "epoch": 4063} {"train_loss": -6.898290634155273, "global_step": 170658, "epoch": 4063} {"train_loss": -6.794887065887451, "global_step": 170659, "epoch": 4063} {"train_loss": -7.008734703063965, "global_step": 170660, "epoch": 4063} {"train_loss": -6.796540260314941, "global_step": 170661, "epoch": 4063} {"train_loss": -6.897696018218994, "global_step": 170662, "epoch": 4063} {"train_loss": -6.9297099113464355, "global_step": 170663, "epoch": 4063} {"train_loss": -6.9848737716674805, "global_step": 170664, "epoch": 4063} {"train_loss": -7.061694622039795, "global_step": 170665, "epoch": 4063} {"train_loss": -6.935129165649414, "global_step": 170666, "epoch": 4063} {"train_loss": -6.966756820678711, "global_step": 170667, "epoch": 4063} {"train_loss": -6.873633861541748, "global_step": 170668, "epoch": 4063} {"train_loss": -6.944879055023193, "global_step": 170669, "epoch": 4063} {"train_loss": -6.994643688201904, "global_step": 170670, "epoch": 4063} {"train_loss": -7.0455002784729, "global_step": 170671, "epoch": 4063} {"train_loss": -7.0873589515686035, "global_step": 170672, "epoch": 4063} {"train_loss": -7.1041154861450195, "global_step": 170673, "epoch": 4063} {"train_loss": -6.972853183746338, "global_step": 170674, "epoch": 4063} {"train_loss": -7.053664207458496, "global_step": 170675, "epoch": 4063} {"train_loss": -7.02146577835083, "global_step": 170676, "epoch": 4063} {"train_loss": -7.002151012420654, "global_step": 170677, "epoch": 4063} {"train_loss": -7.071717262268066, "global_step": 170678, "epoch": 4063} {"train_loss": -7.164063453674316, "global_step": 170679, "epoch": 4063} {"train_loss": -7.0644941329956055, "global_step": 170680, "epoch": 4063} {"train_loss": -7.067953109741211, "global_step": 170681, "epoch": 4063} {"train_loss": -7.107349395751953, "global_step": 170682, "epoch": 4063} {"train_loss": -7.080544471740723, "global_step": 170683, "epoch": 4063} {"train_loss": -7.049686431884766, "global_step": 170684, "epoch": 4063} {"train_loss": -7.165248870849609, "global_step": 170685, "epoch": 4063} {"train_loss": -6.992860317230225, "global_step": 170686, "epoch": 4063} {"train_loss": -7.009168375106085, "global_step": 170687, "epoch": 4063, "val_loss": 68840.7578125} {"train_loss": -7.022051811218262, "global_step": 170688, "epoch": 4064} {"train_loss": -7.143801689147949, "global_step": 170689, "epoch": 4064} {"train_loss": -7.120258331298828, "global_step": 170690, "epoch": 4064} {"train_loss": -7.012639999389648, "global_step": 170691, "epoch": 4064} {"train_loss": -7.007199287414551, "global_step": 170692, "epoch": 4064} {"train_loss": -7.0195770263671875, "global_step": 170693, "epoch": 4064} {"train_loss": -7.144657611846924, "global_step": 170694, "epoch": 4064} {"train_loss": -7.04836368560791, "global_step": 170695, "epoch": 4064} {"train_loss": -6.917280197143555, "global_step": 170696, "epoch": 4064} {"train_loss": -7.12817907333374, "global_step": 170697, "epoch": 4064} {"train_loss": -7.19359016418457, "global_step": 170698, "epoch": 4064} {"train_loss": -7.051427841186523, "global_step": 170699, "epoch": 4064} {"train_loss": -7.083489418029785, "global_step": 170700, "epoch": 4064} {"train_loss": -7.113665580749512, "global_step": 170701, "epoch": 4064} {"train_loss": -7.011681079864502, "global_step": 170702, "epoch": 4064} {"train_loss": -7.024658203125, "global_step": 170703, "epoch": 4064} {"train_loss": -7.120903015136719, "global_step": 170704, "epoch": 4064} {"train_loss": -7.102440357208252, "global_step": 170705, "epoch": 4064} {"train_loss": -7.125004291534424, "global_step": 170706, "epoch": 4064} {"train_loss": -7.054141998291016, "global_step": 170707, "epoch": 4064} {"train_loss": -7.135337829589844, "global_step": 170708, "epoch": 4064} {"train_loss": -7.212211608886719, "global_step": 170709, "epoch": 4064} {"train_loss": -7.02440071105957, "global_step": 170710, "epoch": 4064} {"train_loss": -7.131851673126221, "global_step": 170711, "epoch": 4064} {"train_loss": -7.170260429382324, "global_step": 170712, "epoch": 4064} {"train_loss": -7.133082389831543, "global_step": 170713, "epoch": 4064} {"train_loss": -7.15938663482666, "global_step": 170714, "epoch": 4064} {"train_loss": -7.153959274291992, "global_step": 170715, "epoch": 4064} {"train_loss": -7.06474494934082, "global_step": 170716, "epoch": 4064} {"train_loss": -6.924638271331787, "global_step": 170717, "epoch": 4064} {"train_loss": -7.148345947265625, "global_step": 170718, "epoch": 4064} {"train_loss": -6.968194007873535, "global_step": 170719, "epoch": 4064} {"train_loss": -6.996066570281982, "global_step": 170720, "epoch": 4064} {"train_loss": -7.046977519989014, "global_step": 170721, "epoch": 4064} {"train_loss": -7.129083633422852, "global_step": 170722, "epoch": 4064} {"train_loss": -7.045785903930664, "global_step": 170723, "epoch": 4064} {"train_loss": -7.065579414367676, "global_step": 170724, "epoch": 4064} {"train_loss": -7.0366668701171875, "global_step": 170725, "epoch": 4064} {"train_loss": -7.044896125793457, "global_step": 170726, "epoch": 4064} {"train_loss": -7.123815536499023, "global_step": 170727, "epoch": 4064} {"train_loss": -7.06779670715332, "global_step": 170728, "epoch": 4064} {"train_loss": -7.078813371204195, "global_step": 170729, "epoch": 4064, "val_loss": 68965.1640625} {"train_loss": -7.022578239440918, "global_step": 170730, "epoch": 4065} {"train_loss": -7.1529436111450195, "global_step": 170731, "epoch": 4065} {"train_loss": -6.939659118652344, "global_step": 170732, "epoch": 4065} {"train_loss": -7.128778457641602, "global_step": 170733, "epoch": 4065} {"train_loss": -6.873991012573242, "global_step": 170734, "epoch": 4065} {"train_loss": -6.931340217590332, "global_step": 170735, "epoch": 4065} {"train_loss": -7.038086891174316, "global_step": 170736, "epoch": 4065} {"train_loss": -6.915475368499756, "global_step": 170737, "epoch": 4065} {"train_loss": -6.983258247375488, "global_step": 170738, "epoch": 4065} {"train_loss": -6.88599967956543, "global_step": 170739, "epoch": 4065} {"train_loss": -6.944849967956543, "global_step": 170740, "epoch": 4065} {"train_loss": -6.916505336761475, "global_step": 170741, "epoch": 4065} {"train_loss": -6.866537570953369, "global_step": 170742, "epoch": 4065} {"train_loss": -7.035182952880859, "global_step": 170743, "epoch": 4065} {"train_loss": -6.929521560668945, "global_step": 170744, "epoch": 4065} {"train_loss": -6.859786033630371, "global_step": 170745, "epoch": 4065} {"train_loss": -7.007326126098633, "global_step": 170746, "epoch": 4065} {"train_loss": -6.901137828826904, "global_step": 170747, "epoch": 4065} {"train_loss": -6.97506856918335, "global_step": 170748, "epoch": 4065} {"train_loss": -7.015320777893066, "global_step": 170749, "epoch": 4065} {"train_loss": -6.944470405578613, "global_step": 170750, "epoch": 4065} {"train_loss": -7.077128887176514, "global_step": 170751, "epoch": 4065} {"train_loss": -6.96980094909668, "global_step": 170752, "epoch": 4065} {"train_loss": -6.977818489074707, "global_step": 170753, "epoch": 4065} {"train_loss": -7.008625030517578, "global_step": 170754, "epoch": 4065} {"train_loss": -6.901948928833008, "global_step": 170755, "epoch": 4065} {"train_loss": -7.040345668792725, "global_step": 170756, "epoch": 4065} {"train_loss": -6.95438289642334, "global_step": 170757, "epoch": 4065} {"train_loss": -7.01729154586792, "global_step": 170758, "epoch": 4065} {"train_loss": -7.034523010253906, "global_step": 170759, "epoch": 4065} {"train_loss": -6.934712886810303, "global_step": 170760, "epoch": 4065} {"train_loss": -6.928272247314453, "global_step": 170761, "epoch": 4065} {"train_loss": -6.980064392089844, "global_step": 170762, "epoch": 4065} {"train_loss": -7.005282402038574, "global_step": 170763, "epoch": 4065} {"train_loss": -6.941099166870117, "global_step": 170764, "epoch": 4065} {"train_loss": -6.929181098937988, "global_step": 170765, "epoch": 4065} {"train_loss": -6.93406867980957, "global_step": 170766, "epoch": 4065} {"train_loss": -7.005955696105957, "global_step": 170767, "epoch": 4065} {"train_loss": -6.998517036437988, "global_step": 170768, "epoch": 4065} {"train_loss": -6.954092025756836, "global_step": 170769, "epoch": 4065} {"train_loss": -6.985821723937988, "global_step": 170770, "epoch": 4065} {"train_loss": -6.9753444875989645, "global_step": 170771, "epoch": 4065, "val_loss": 68862.7421875} {"train_loss": -7.10833740234375, "global_step": 170772, "epoch": 4066} {"train_loss": -7.0970635414123535, "global_step": 170773, "epoch": 4066} {"train_loss": -7.076756477355957, "global_step": 170774, "epoch": 4066} {"train_loss": -7.022293567657471, "global_step": 170775, "epoch": 4066} {"train_loss": -7.138904571533203, "global_step": 170776, "epoch": 4066} {"train_loss": -7.0686936378479, "global_step": 170777, "epoch": 4066} {"train_loss": -7.175898551940918, "global_step": 170778, "epoch": 4066} {"train_loss": -7.065155029296875, "global_step": 170779, "epoch": 4066} {"train_loss": -7.031497001647949, "global_step": 170780, "epoch": 4066} {"train_loss": -7.072222709655762, "global_step": 170781, "epoch": 4066} {"train_loss": -6.946152687072754, "global_step": 170782, "epoch": 4066} {"train_loss": -7.0281853675842285, "global_step": 170783, "epoch": 4066} {"train_loss": -6.943755149841309, "global_step": 170784, "epoch": 4066} {"train_loss": -7.059160232543945, "global_step": 170785, "epoch": 4066} {"train_loss": -7.048173904418945, "global_step": 170786, "epoch": 4066} {"train_loss": -6.975061416625977, "global_step": 170787, "epoch": 4066} {"train_loss": -7.151611804962158, "global_step": 170788, "epoch": 4066} {"train_loss": -7.031538009643555, "global_step": 170789, "epoch": 4066} {"train_loss": -7.039621829986572, "global_step": 170790, "epoch": 4066} {"train_loss": -6.959409236907959, "global_step": 170791, "epoch": 4066} {"train_loss": -6.899015426635742, "global_step": 170792, "epoch": 4066} {"train_loss": -7.043459415435791, "global_step": 170793, "epoch": 4066} {"train_loss": -6.90272855758667, "global_step": 170794, "epoch": 4066} {"train_loss": -6.919101238250732, "global_step": 170795, "epoch": 4066} {"train_loss": -6.917740821838379, "global_step": 170796, "epoch": 4066} {"train_loss": -7.112174034118652, "global_step": 170797, "epoch": 4066} {"train_loss": -6.948992729187012, "global_step": 170798, "epoch": 4066} {"train_loss": -6.940650463104248, "global_step": 170799, "epoch": 4066} {"train_loss": -7.064995765686035, "global_step": 170800, "epoch": 4066} {"train_loss": -6.948927402496338, "global_step": 170801, "epoch": 4066} {"train_loss": -6.946999549865723, "global_step": 170802, "epoch": 4066} {"train_loss": -7.023012161254883, "global_step": 170803, "epoch": 4066} {"train_loss": -7.020408630371094, "global_step": 170804, "epoch": 4066} {"train_loss": -7.033771514892578, "global_step": 170805, "epoch": 4066} {"train_loss": -7.1311445236206055, "global_step": 170806, "epoch": 4066} {"train_loss": -7.089798927307129, "global_step": 170807, "epoch": 4066} {"train_loss": -6.997611045837402, "global_step": 170808, "epoch": 4066} {"train_loss": -7.036795139312744, "global_step": 170809, "epoch": 4066} {"train_loss": -7.158601760864258, "global_step": 170810, "epoch": 4066} {"train_loss": -7.033437728881836, "global_step": 170811, "epoch": 4066} {"train_loss": -6.941460132598877, "global_step": 170812, "epoch": 4066} {"train_loss": -7.032583123161679, "global_step": 170813, "epoch": 4066, "val_loss": 69020.5234375} {"train_loss": -7.056604385375977, "global_step": 170814, "epoch": 4067} {"train_loss": -7.118579864501953, "global_step": 170815, "epoch": 4067} {"train_loss": -7.013277053833008, "global_step": 170816, "epoch": 4067} {"train_loss": -7.117060661315918, "global_step": 170817, "epoch": 4067} {"train_loss": -6.983778953552246, "global_step": 170818, "epoch": 4067} {"train_loss": -7.179760932922363, "global_step": 170819, "epoch": 4067} {"train_loss": -7.126426696777344, "global_step": 170820, "epoch": 4067} {"train_loss": -7.063006401062012, "global_step": 170821, "epoch": 4067} {"train_loss": -7.085536003112793, "global_step": 170822, "epoch": 4067} {"train_loss": -7.034855842590332, "global_step": 170823, "epoch": 4067} {"train_loss": -7.016573905944824, "global_step": 170824, "epoch": 4067} {"train_loss": -7.074470043182373, "global_step": 170825, "epoch": 4067} {"train_loss": -7.104992866516113, "global_step": 170826, "epoch": 4067} {"train_loss": -7.008572101593018, "global_step": 170827, "epoch": 4067} {"train_loss": -7.143012046813965, "global_step": 170828, "epoch": 4067} {"train_loss": -7.068017959594727, "global_step": 170829, "epoch": 4067} {"train_loss": -7.024265289306641, "global_step": 170830, "epoch": 4067} {"train_loss": -6.818685531616211, "global_step": 170831, "epoch": 4067} {"train_loss": -7.091167449951172, "global_step": 170832, "epoch": 4067} {"train_loss": -6.931615829467773, "global_step": 170833, "epoch": 4067} {"train_loss": -6.965240478515625, "global_step": 170834, "epoch": 4067} {"train_loss": -6.9425201416015625, "global_step": 170835, "epoch": 4067} {"train_loss": -6.968701362609863, "global_step": 170836, "epoch": 4067} {"train_loss": -7.000637531280518, "global_step": 170837, "epoch": 4067} {"train_loss": -7.032722473144531, "global_step": 170838, "epoch": 4067} {"train_loss": -6.872939109802246, "global_step": 170839, "epoch": 4067} {"train_loss": -7.118577003479004, "global_step": 170840, "epoch": 4067} {"train_loss": -6.95212459564209, "global_step": 170841, "epoch": 4067} {"train_loss": -6.972143650054932, "global_step": 170842, "epoch": 4067} {"train_loss": -7.106393814086914, "global_step": 170843, "epoch": 4067} {"train_loss": -6.849375247955322, "global_step": 170844, "epoch": 4067} {"train_loss": -7.019814491271973, "global_step": 170845, "epoch": 4067} {"train_loss": -7.062981605529785, "global_step": 170846, "epoch": 4067} {"train_loss": -7.068931579589844, "global_step": 170847, "epoch": 4067} {"train_loss": -7.034209251403809, "global_step": 170848, "epoch": 4067} {"train_loss": -6.948448181152344, "global_step": 170849, "epoch": 4067} {"train_loss": -6.956287384033203, "global_step": 170850, "epoch": 4067} {"train_loss": -7.091835021972656, "global_step": 170851, "epoch": 4067} {"train_loss": -6.946412086486816, "global_step": 170852, "epoch": 4067} {"train_loss": -7.040912628173828, "global_step": 170853, "epoch": 4067} {"train_loss": -7.029433250427246, "global_step": 170854, "epoch": 4067} {"train_loss": -7.024457375208537, "global_step": 170855, "epoch": 4067, "val_loss": 69013.2890625} {"train_loss": -7.0527849197387695, "global_step": 170856, "epoch": 4068} {"train_loss": -7.1050872802734375, "global_step": 170857, "epoch": 4068} {"train_loss": -7.0947184562683105, "global_step": 170858, "epoch": 4068} {"train_loss": -7.046028137207031, "global_step": 170859, "epoch": 4068} {"train_loss": -7.102644443511963, "global_step": 170860, "epoch": 4068} {"train_loss": -7.044346809387207, "global_step": 170861, "epoch": 4068} {"train_loss": -7.017306804656982, "global_step": 170862, "epoch": 4068} {"train_loss": -7.129308700561523, "global_step": 170863, "epoch": 4068} {"train_loss": -7.157257080078125, "global_step": 170864, "epoch": 4068} {"train_loss": -7.073451042175293, "global_step": 170865, "epoch": 4068} {"train_loss": -7.048618316650391, "global_step": 170866, "epoch": 4068} {"train_loss": -7.1465044021606445, "global_step": 170867, "epoch": 4068} {"train_loss": -7.080965995788574, "global_step": 170868, "epoch": 4068} {"train_loss": -6.954276084899902, "global_step": 170869, "epoch": 4068} {"train_loss": -7.038357734680176, "global_step": 170870, "epoch": 4068} {"train_loss": -7.095699310302734, "global_step": 170871, "epoch": 4068} {"train_loss": -7.074477195739746, "global_step": 170872, "epoch": 4068} {"train_loss": -7.048222541809082, "global_step": 170873, "epoch": 4068} {"train_loss": -7.068281650543213, "global_step": 170874, "epoch": 4068} {"train_loss": -7.012655258178711, "global_step": 170875, "epoch": 4068} {"train_loss": -7.0315046310424805, "global_step": 170876, "epoch": 4068} {"train_loss": -6.944253921508789, "global_step": 170877, "epoch": 4068} {"train_loss": -7.028242111206055, "global_step": 170878, "epoch": 4068} {"train_loss": -6.914920806884766, "global_step": 170879, "epoch": 4068} {"train_loss": -6.970697402954102, "global_step": 170880, "epoch": 4068} {"train_loss": -7.003205299377441, "global_step": 170881, "epoch": 4068} {"train_loss": -6.969657897949219, "global_step": 170882, "epoch": 4068} {"train_loss": -7.07396125793457, "global_step": 170883, "epoch": 4068} {"train_loss": -6.953029632568359, "global_step": 170884, "epoch": 4068} {"train_loss": -7.001108169555664, "global_step": 170885, "epoch": 4068} {"train_loss": -7.012942790985107, "global_step": 170886, "epoch": 4068} {"train_loss": -6.881982803344727, "global_step": 170887, "epoch": 4068} {"train_loss": -6.93635368347168, "global_step": 170888, "epoch": 4068} {"train_loss": -6.955511093139648, "global_step": 170889, "epoch": 4068} {"train_loss": -6.90355920791626, "global_step": 170890, "epoch": 4068} {"train_loss": -6.9766998291015625, "global_step": 170891, "epoch": 4068} {"train_loss": -6.976591110229492, "global_step": 170892, "epoch": 4068} {"train_loss": -6.942305088043213, "global_step": 170893, "epoch": 4068} {"train_loss": -7.021629333496094, "global_step": 170894, "epoch": 4068} {"train_loss": -6.93037223815918, "global_step": 170895, "epoch": 4068} {"train_loss": -7.030483245849609, "global_step": 170896, "epoch": 4068} {"train_loss": -7.020104453677223, "global_step": 170897, "epoch": 4068, "val_loss": 69144.765625} {"train_loss": -6.9691691398620605, "global_step": 170898, "epoch": 4069} {"train_loss": -6.8715596199035645, "global_step": 170899, "epoch": 4069} {"train_loss": -6.9699811935424805, "global_step": 170900, "epoch": 4069} {"train_loss": -7.009443283081055, "global_step": 170901, "epoch": 4069} {"train_loss": -6.967930793762207, "global_step": 170902, "epoch": 4069} {"train_loss": -6.909106731414795, "global_step": 170903, "epoch": 4069} {"train_loss": -7.028359889984131, "global_step": 170904, "epoch": 4069} {"train_loss": -6.936455726623535, "global_step": 170905, "epoch": 4069} {"train_loss": -7.064181327819824, "global_step": 170906, "epoch": 4069} {"train_loss": -6.970016956329346, "global_step": 170907, "epoch": 4069} {"train_loss": -7.019584655761719, "global_step": 170908, "epoch": 4069} {"train_loss": -7.042417049407959, "global_step": 170909, "epoch": 4069} {"train_loss": -7.031459331512451, "global_step": 170910, "epoch": 4069} {"train_loss": -7.06773567199707, "global_step": 170911, "epoch": 4069} {"train_loss": -7.01561164855957, "global_step": 170912, "epoch": 4069} {"train_loss": -6.995079517364502, "global_step": 170913, "epoch": 4069} {"train_loss": -7.031317710876465, "global_step": 170914, "epoch": 4069} {"train_loss": -7.076374053955078, "global_step": 170915, "epoch": 4069} {"train_loss": -7.075835704803467, "global_step": 170916, "epoch": 4069} {"train_loss": -7.072626113891602, "global_step": 170917, "epoch": 4069} {"train_loss": -7.011843204498291, "global_step": 170918, "epoch": 4069} {"train_loss": -7.088621616363525, "global_step": 170919, "epoch": 4069} {"train_loss": -7.060299396514893, "global_step": 170920, "epoch": 4069} {"train_loss": -7.090564727783203, "global_step": 170921, "epoch": 4069} {"train_loss": -7.28355598449707, "global_step": 170922, "epoch": 4069} {"train_loss": -7.043055534362793, "global_step": 170923, "epoch": 4069} {"train_loss": -7.066890716552734, "global_step": 170924, "epoch": 4069} {"train_loss": -7.052175521850586, "global_step": 170925, "epoch": 4069} {"train_loss": -6.929385185241699, "global_step": 170926, "epoch": 4069} {"train_loss": -7.093771934509277, "global_step": 170927, "epoch": 4069} {"train_loss": -7.120131492614746, "global_step": 170928, "epoch": 4069} {"train_loss": -7.010941028594971, "global_step": 170929, "epoch": 4069} {"train_loss": -7.009997367858887, "global_step": 170930, "epoch": 4069} {"train_loss": -7.079668998718262, "global_step": 170931, "epoch": 4069} {"train_loss": -7.060352325439453, "global_step": 170932, "epoch": 4069} {"train_loss": -7.05985164642334, "global_step": 170933, "epoch": 4069} {"train_loss": -7.088713645935059, "global_step": 170934, "epoch": 4069} {"train_loss": -7.032853126525879, "global_step": 170935, "epoch": 4069} {"train_loss": -7.060596466064453, "global_step": 170936, "epoch": 4069} {"train_loss": -6.9583868980407715, "global_step": 170937, "epoch": 4069} {"train_loss": -7.134571075439453, "global_step": 170938, "epoch": 4069} {"train_loss": -7.035958880469913, "global_step": 170939, "epoch": 4069, "val_loss": 68891.6875} {"train_loss": -7.122371673583984, "global_step": 170940, "epoch": 4070} {"train_loss": -7.1071929931640625, "global_step": 170941, "epoch": 4070} {"train_loss": -7.130489349365234, "global_step": 170942, "epoch": 4070} {"train_loss": -7.110850811004639, "global_step": 170943, "epoch": 4070} {"train_loss": -7.102843761444092, "global_step": 170944, "epoch": 4070} {"train_loss": -7.156646728515625, "global_step": 170945, "epoch": 4070} {"train_loss": -7.143908500671387, "global_step": 170946, "epoch": 4070} {"train_loss": -7.139585494995117, "global_step": 170947, "epoch": 4070} {"train_loss": -7.024094581604004, "global_step": 170948, "epoch": 4070} {"train_loss": -7.008148670196533, "global_step": 170949, "epoch": 4070} {"train_loss": -7.119998931884766, "global_step": 170950, "epoch": 4070} {"train_loss": -7.116905689239502, "global_step": 170951, "epoch": 4070} {"train_loss": -7.035769462585449, "global_step": 170952, "epoch": 4070} {"train_loss": -7.033641815185547, "global_step": 170953, "epoch": 4070} {"train_loss": -7.014983177185059, "global_step": 170954, "epoch": 4070} {"train_loss": -7.176756858825684, "global_step": 170955, "epoch": 4070} {"train_loss": -7.101479530334473, "global_step": 170956, "epoch": 4070} {"train_loss": -7.035794734954834, "global_step": 170957, "epoch": 4070} {"train_loss": -7.148782730102539, "global_step": 170958, "epoch": 4070} {"train_loss": -7.144932270050049, "global_step": 170959, "epoch": 4070} {"train_loss": -7.160046100616455, "global_step": 170960, "epoch": 4070} {"train_loss": -7.164295196533203, "global_step": 170961, "epoch": 4070} {"train_loss": -7.101244926452637, "global_step": 170962, "epoch": 4070} {"train_loss": -7.042830467224121, "global_step": 170963, "epoch": 4070} {"train_loss": -7.075848579406738, "global_step": 170964, "epoch": 4070} {"train_loss": -7.11244010925293, "global_step": 170965, "epoch": 4070} {"train_loss": -7.080666542053223, "global_step": 170966, "epoch": 4070} {"train_loss": -7.1047821044921875, "global_step": 170967, "epoch": 4070} {"train_loss": -7.168554306030273, "global_step": 170968, "epoch": 4070} {"train_loss": -7.126507759094238, "global_step": 170969, "epoch": 4070} {"train_loss": -7.103551864624023, "global_step": 170970, "epoch": 4070} {"train_loss": -7.086130142211914, "global_step": 170971, "epoch": 4070} {"train_loss": -7.048640251159668, "global_step": 170972, "epoch": 4070} {"train_loss": -6.984348773956299, "global_step": 170973, "epoch": 4070} {"train_loss": -6.93212890625, "global_step": 170974, "epoch": 4070} {"train_loss": -7.0116376876831055, "global_step": 170975, "epoch": 4070} {"train_loss": -7.080120086669922, "global_step": 170976, "epoch": 4070} {"train_loss": -7.028476715087891, "global_step": 170977, "epoch": 4070} {"train_loss": -7.054105758666992, "global_step": 170978, "epoch": 4070} {"train_loss": -6.970839023590088, "global_step": 170979, "epoch": 4070} {"train_loss": -6.91323184967041, "global_step": 170980, "epoch": 4070} {"train_loss": -7.077811649867466, "global_step": 170981, "epoch": 4070, "val_loss": 69086.03125} {"train_loss": -6.927689552307129, "global_step": 170982, "epoch": 4071} {"train_loss": -7.058908462524414, "global_step": 170983, "epoch": 4071} {"train_loss": -6.999932765960693, "global_step": 170984, "epoch": 4071} {"train_loss": -6.884420394897461, "global_step": 170985, "epoch": 4071} {"train_loss": -6.871036529541016, "global_step": 170986, "epoch": 4071} {"train_loss": -6.727663516998291, "global_step": 170987, "epoch": 4071} {"train_loss": -6.880198001861572, "global_step": 170988, "epoch": 4071} {"train_loss": -6.814593315124512, "global_step": 170989, "epoch": 4071} {"train_loss": -6.825283050537109, "global_step": 170990, "epoch": 4071} {"train_loss": -7.008052349090576, "global_step": 170991, "epoch": 4071} {"train_loss": -6.834331512451172, "global_step": 170992, "epoch": 4071} {"train_loss": -7.119204044342041, "global_step": 170993, "epoch": 4071} {"train_loss": -6.95107364654541, "global_step": 170994, "epoch": 4071} {"train_loss": -6.969265460968018, "global_step": 170995, "epoch": 4071} {"train_loss": -6.9034318923950195, "global_step": 170996, "epoch": 4071} {"train_loss": -6.945493698120117, "global_step": 170997, "epoch": 4071} {"train_loss": -7.003556251525879, "global_step": 170998, "epoch": 4071} {"train_loss": -6.990259647369385, "global_step": 170999, "epoch": 4071} {"train_loss": -6.999691009521484, "global_step": 171000, "epoch": 4071} {"train_loss": -6.920021057128906, "global_step": 171001, "epoch": 4071} {"train_loss": -7.01025915145874, "global_step": 171002, "epoch": 4071} {"train_loss": -6.981318473815918, "global_step": 171003, "epoch": 4071} {"train_loss": -7.042622089385986, "global_step": 171004, "epoch": 4071} {"train_loss": -7.01397705078125, "global_step": 171005, "epoch": 4071} {"train_loss": -7.1282548904418945, "global_step": 171006, "epoch": 4071} {"train_loss": -6.984343528747559, "global_step": 171007, "epoch": 4071} {"train_loss": -7.071034908294678, "global_step": 171008, "epoch": 4071} {"train_loss": -7.096341133117676, "global_step": 171009, "epoch": 4071} {"train_loss": -7.058725357055664, "global_step": 171010, "epoch": 4071} {"train_loss": -7.157792568206787, "global_step": 171011, "epoch": 4071} {"train_loss": -7.073979377746582, "global_step": 171012, "epoch": 4071} {"train_loss": -6.992827892303467, "global_step": 171013, "epoch": 4071} {"train_loss": -6.961400508880615, "global_step": 171014, "epoch": 4071} {"train_loss": -7.05193567276001, "global_step": 171015, "epoch": 4071} {"train_loss": -7.005974292755127, "global_step": 171016, "epoch": 4071} {"train_loss": -7.003796577453613, "global_step": 171017, "epoch": 4071} {"train_loss": -7.082448959350586, "global_step": 171018, "epoch": 4071} {"train_loss": -7.058417320251465, "global_step": 171019, "epoch": 4071} {"train_loss": -6.96169900894165, "global_step": 171020, "epoch": 4071} {"train_loss": -7.101195335388184, "global_step": 171021, "epoch": 4071} {"train_loss": -7.0228590965271, "global_step": 171022, "epoch": 4071} {"train_loss": -6.98872725168864, "global_step": 171023, "epoch": 4071, "val_loss": 69156.7890625} {"train_loss": -7.139483451843262, "global_step": 171024, "epoch": 4072} {"train_loss": -6.9168267250061035, "global_step": 171025, "epoch": 4072} {"train_loss": -7.027678489685059, "global_step": 171026, "epoch": 4072} {"train_loss": -6.964112281799316, "global_step": 171027, "epoch": 4072} {"train_loss": -6.835064888000488, "global_step": 171028, "epoch": 4072} {"train_loss": -7.124401092529297, "global_step": 171029, "epoch": 4072} {"train_loss": -6.982093334197998, "global_step": 171030, "epoch": 4072} {"train_loss": -6.997934341430664, "global_step": 171031, "epoch": 4072} {"train_loss": -6.958144187927246, "global_step": 171032, "epoch": 4072} {"train_loss": -6.879574775695801, "global_step": 171033, "epoch": 4072} {"train_loss": -7.065211772918701, "global_step": 171034, "epoch": 4072} {"train_loss": -6.988193511962891, "global_step": 171035, "epoch": 4072} {"train_loss": -6.90179443359375, "global_step": 171036, "epoch": 4072} {"train_loss": -7.1087517738342285, "global_step": 171037, "epoch": 4072} {"train_loss": -6.980454921722412, "global_step": 171038, "epoch": 4072} {"train_loss": -7.023951530456543, "global_step": 171039, "epoch": 4072} {"train_loss": -7.128923416137695, "global_step": 171040, "epoch": 4072} {"train_loss": -6.896710395812988, "global_step": 171041, "epoch": 4072} {"train_loss": -6.97167444229126, "global_step": 171042, "epoch": 4072} {"train_loss": -7.066861152648926, "global_step": 171043, "epoch": 4072} {"train_loss": -7.03336238861084, "global_step": 171044, "epoch": 4072} {"train_loss": -6.967816352844238, "global_step": 171045, "epoch": 4072} {"train_loss": -7.027137756347656, "global_step": 171046, "epoch": 4072} {"train_loss": -7.1274614334106445, "global_step": 171047, "epoch": 4072} {"train_loss": -7.030369281768799, "global_step": 171048, "epoch": 4072} {"train_loss": -6.976308345794678, "global_step": 171049, "epoch": 4072} {"train_loss": -7.157070636749268, "global_step": 171050, "epoch": 4072} {"train_loss": -7.182559967041016, "global_step": 171051, "epoch": 4072} {"train_loss": -7.0180277824401855, "global_step": 171052, "epoch": 4072} {"train_loss": -7.054427146911621, "global_step": 171053, "epoch": 4072} {"train_loss": -7.015521049499512, "global_step": 171054, "epoch": 4072} {"train_loss": -7.011030197143555, "global_step": 171055, "epoch": 4072} {"train_loss": -6.9627227783203125, "global_step": 171056, "epoch": 4072} {"train_loss": -7.055618762969971, "global_step": 171057, "epoch": 4072} {"train_loss": -6.861605644226074, "global_step": 171058, "epoch": 4072} {"train_loss": -7.142097473144531, "global_step": 171059, "epoch": 4072} {"train_loss": -7.175169944763184, "global_step": 171060, "epoch": 4072} {"train_loss": -6.9642744064331055, "global_step": 171061, "epoch": 4072} {"train_loss": -7.084396839141846, "global_step": 171062, "epoch": 4072} {"train_loss": -6.943219184875488, "global_step": 171063, "epoch": 4072} {"train_loss": -7.04331111907959, "global_step": 171064, "epoch": 4072} {"train_loss": -7.018575350443522, "global_step": 171065, "epoch": 4072, "val_loss": 68900.8671875} {"train_loss": -7.045970916748047, "global_step": 171066, "epoch": 4073} {"train_loss": -7.202208995819092, "global_step": 171067, "epoch": 4073} {"train_loss": -7.059595108032227, "global_step": 171068, "epoch": 4073} {"train_loss": -7.071468830108643, "global_step": 171069, "epoch": 4073} {"train_loss": -7.126002311706543, "global_step": 171070, "epoch": 4073} {"train_loss": -7.123706340789795, "global_step": 171071, "epoch": 4073} {"train_loss": -7.043286323547363, "global_step": 171072, "epoch": 4073} {"train_loss": -7.023855686187744, "global_step": 171073, "epoch": 4073} {"train_loss": -7.062229633331299, "global_step": 171074, "epoch": 4073} {"train_loss": -6.920654296875, "global_step": 171075, "epoch": 4073} {"train_loss": -7.074143409729004, "global_step": 171076, "epoch": 4073} {"train_loss": -7.063883304595947, "global_step": 171077, "epoch": 4073} {"train_loss": -6.990188121795654, "global_step": 171078, "epoch": 4073} {"train_loss": -7.104712963104248, "global_step": 171079, "epoch": 4073} {"train_loss": -6.931052207946777, "global_step": 171080, "epoch": 4073} {"train_loss": -6.981633186340332, "global_step": 171081, "epoch": 4073} {"train_loss": -7.065773963928223, "global_step": 171082, "epoch": 4073} {"train_loss": -7.013307094573975, "global_step": 171083, "epoch": 4073} {"train_loss": -6.975747108459473, "global_step": 171084, "epoch": 4073} {"train_loss": -7.102433204650879, "global_step": 171085, "epoch": 4073} {"train_loss": -6.919395923614502, "global_step": 171086, "epoch": 4073} {"train_loss": -7.1917314529418945, "global_step": 171087, "epoch": 4073} {"train_loss": -6.931796073913574, "global_step": 171088, "epoch": 4073} {"train_loss": -7.040637016296387, "global_step": 171089, "epoch": 4073} {"train_loss": -7.066707134246826, "global_step": 171090, "epoch": 4073} {"train_loss": -7.013332366943359, "global_step": 171091, "epoch": 4073} {"train_loss": -6.982804298400879, "global_step": 171092, "epoch": 4073} {"train_loss": -7.053619384765625, "global_step": 171093, "epoch": 4073} {"train_loss": -6.851875305175781, "global_step": 171094, "epoch": 4073} {"train_loss": -7.076415538787842, "global_step": 171095, "epoch": 4073} {"train_loss": -6.930935859680176, "global_step": 171096, "epoch": 4073} {"train_loss": -7.048307418823242, "global_step": 171097, "epoch": 4073} {"train_loss": -7.001853942871094, "global_step": 171098, "epoch": 4073} {"train_loss": -6.95163106918335, "global_step": 171099, "epoch": 4073} {"train_loss": -6.988700866699219, "global_step": 171100, "epoch": 4073} {"train_loss": -7.020744800567627, "global_step": 171101, "epoch": 4073} {"train_loss": -6.9772629737854, "global_step": 171102, "epoch": 4073} {"train_loss": -6.967411518096924, "global_step": 171103, "epoch": 4073} {"train_loss": -7.084062576293945, "global_step": 171104, "epoch": 4073} {"train_loss": -6.975955009460449, "global_step": 171105, "epoch": 4073} {"train_loss": -7.089191913604736, "global_step": 171106, "epoch": 4073} {"train_loss": -7.030907403855097, "global_step": 171107, "epoch": 4073, "val_loss": 68848.875} {"train_loss": -6.906322002410889, "global_step": 171108, "epoch": 4074} {"train_loss": -7.012884140014648, "global_step": 171109, "epoch": 4074} {"train_loss": -7.085503101348877, "global_step": 171110, "epoch": 4074} {"train_loss": -6.931369304656982, "global_step": 171111, "epoch": 4074} {"train_loss": -7.0056610107421875, "global_step": 171112, "epoch": 4074} {"train_loss": -6.834482192993164, "global_step": 171113, "epoch": 4074} {"train_loss": -6.9480204582214355, "global_step": 171114, "epoch": 4074} {"train_loss": -7.0134968757629395, "global_step": 171115, "epoch": 4074} {"train_loss": -6.953370094299316, "global_step": 171116, "epoch": 4074} {"train_loss": -6.996087074279785, "global_step": 171117, "epoch": 4074} {"train_loss": -7.007946014404297, "global_step": 171118, "epoch": 4074} {"train_loss": -6.947535514831543, "global_step": 171119, "epoch": 4074} {"train_loss": -7.052159786224365, "global_step": 171120, "epoch": 4074} {"train_loss": -6.9363322257995605, "global_step": 171121, "epoch": 4074} {"train_loss": -7.063415050506592, "global_step": 171122, "epoch": 4074} {"train_loss": -6.939284801483154, "global_step": 171123, "epoch": 4074} {"train_loss": -6.941187858581543, "global_step": 171124, "epoch": 4074} {"train_loss": -6.864216327667236, "global_step": 171125, "epoch": 4074} {"train_loss": -6.861825466156006, "global_step": 171126, "epoch": 4074} {"train_loss": -7.102557182312012, "global_step": 171127, "epoch": 4074} {"train_loss": -6.960220813751221, "global_step": 171128, "epoch": 4074} {"train_loss": -6.896852493286133, "global_step": 171129, "epoch": 4074} {"train_loss": -6.981190204620361, "global_step": 171130, "epoch": 4074} {"train_loss": -6.858364582061768, "global_step": 171131, "epoch": 4074} {"train_loss": -7.012190341949463, "global_step": 171132, "epoch": 4074} {"train_loss": -6.892616271972656, "global_step": 171133, "epoch": 4074} {"train_loss": -6.838775634765625, "global_step": 171134, "epoch": 4074} {"train_loss": -6.980088710784912, "global_step": 171135, "epoch": 4074} {"train_loss": -6.919814109802246, "global_step": 171136, "epoch": 4074} {"train_loss": -7.0079731941223145, "global_step": 171137, "epoch": 4074} {"train_loss": -6.920111656188965, "global_step": 171138, "epoch": 4074} {"train_loss": -6.878963947296143, "global_step": 171139, "epoch": 4074} {"train_loss": -7.180412292480469, "global_step": 171140, "epoch": 4074} {"train_loss": -7.026983261108398, "global_step": 171141, "epoch": 4074} {"train_loss": -7.012455463409424, "global_step": 171142, "epoch": 4074} {"train_loss": -7.008545875549316, "global_step": 171143, "epoch": 4074} {"train_loss": -6.901822090148926, "global_step": 171144, "epoch": 4074} {"train_loss": -6.968456268310547, "global_step": 171145, "epoch": 4074} {"train_loss": -7.022470951080322, "global_step": 171146, "epoch": 4074} {"train_loss": -7.047802448272705, "global_step": 171147, "epoch": 4074} {"train_loss": -7.067899227142334, "global_step": 171148, "epoch": 4074} {"train_loss": -6.971941527866182, "global_step": 171149, "epoch": 4074, "val_loss": 69044.3984375} {"train_loss": -7.024809837341309, "global_step": 171150, "epoch": 4075} {"train_loss": -7.111546516418457, "global_step": 171151, "epoch": 4075} {"train_loss": -7.072803020477295, "global_step": 171152, "epoch": 4075} {"train_loss": -7.065909385681152, "global_step": 171153, "epoch": 4075} {"train_loss": -7.134129524230957, "global_step": 171154, "epoch": 4075} {"train_loss": -6.897312164306641, "global_step": 171155, "epoch": 4075} {"train_loss": -7.081235408782959, "global_step": 171156, "epoch": 4075} {"train_loss": -7.065524101257324, "global_step": 171157, "epoch": 4075} {"train_loss": -6.995622158050537, "global_step": 171158, "epoch": 4075} {"train_loss": -7.073668479919434, "global_step": 171159, "epoch": 4075} {"train_loss": -6.904211044311523, "global_step": 171160, "epoch": 4075} {"train_loss": -6.932685852050781, "global_step": 171161, "epoch": 4075} {"train_loss": -7.049941062927246, "global_step": 171162, "epoch": 4075} {"train_loss": -7.008288860321045, "global_step": 171163, "epoch": 4075} {"train_loss": -7.084762096405029, "global_step": 171164, "epoch": 4075} {"train_loss": -6.894133567810059, "global_step": 171165, "epoch": 4075} {"train_loss": -7.0492401123046875, "global_step": 171166, "epoch": 4075} {"train_loss": -6.974651336669922, "global_step": 171167, "epoch": 4075} {"train_loss": -7.041646957397461, "global_step": 171168, "epoch": 4075} {"train_loss": -6.971835136413574, "global_step": 171169, "epoch": 4075} {"train_loss": -6.9823503494262695, "global_step": 171170, "epoch": 4075} {"train_loss": -7.059668064117432, "global_step": 171171, "epoch": 4075} {"train_loss": -7.121457099914551, "global_step": 171172, "epoch": 4075} {"train_loss": -6.970582962036133, "global_step": 171173, "epoch": 4075} {"train_loss": -6.935471534729004, "global_step": 171174, "epoch": 4075} {"train_loss": -7.002352237701416, "global_step": 171175, "epoch": 4075} {"train_loss": -6.984493732452393, "global_step": 171176, "epoch": 4075} {"train_loss": -6.971011161804199, "global_step": 171177, "epoch": 4075} {"train_loss": -7.054325103759766, "global_step": 171178, "epoch": 4075} {"train_loss": -6.889148712158203, "global_step": 171179, "epoch": 4075} {"train_loss": -6.898927688598633, "global_step": 171180, "epoch": 4075} {"train_loss": -7.07457160949707, "global_step": 171181, "epoch": 4075} {"train_loss": -7.051684379577637, "global_step": 171182, "epoch": 4075} {"train_loss": -7.065751075744629, "global_step": 171183, "epoch": 4075} {"train_loss": -7.017860412597656, "global_step": 171184, "epoch": 4075} {"train_loss": -7.002098560333252, "global_step": 171185, "epoch": 4075} {"train_loss": -7.039581298828125, "global_step": 171186, "epoch": 4075} {"train_loss": -7.045722961425781, "global_step": 171187, "epoch": 4075} {"train_loss": -7.075497150421143, "global_step": 171188, "epoch": 4075} {"train_loss": -7.081087589263916, "global_step": 171189, "epoch": 4075} {"train_loss": -7.150715351104736, "global_step": 171190, "epoch": 4075} {"train_loss": -7.021571443194435, "global_step": 171191, "epoch": 4075, "val_loss": 68806.8125} {"train_loss": -6.971097946166992, "global_step": 171192, "epoch": 4076} {"train_loss": -7.042409420013428, "global_step": 171193, "epoch": 4076} {"train_loss": -7.017814636230469, "global_step": 171194, "epoch": 4076} {"train_loss": -7.1268510818481445, "global_step": 171195, "epoch": 4076} {"train_loss": -7.067749500274658, "global_step": 171196, "epoch": 4076} {"train_loss": -6.969850540161133, "global_step": 171197, "epoch": 4076} {"train_loss": -7.031706809997559, "global_step": 171198, "epoch": 4076} {"train_loss": -7.07929801940918, "global_step": 171199, "epoch": 4076} {"train_loss": -7.109800338745117, "global_step": 171200, "epoch": 4076} {"train_loss": -6.987061977386475, "global_step": 171201, "epoch": 4076} {"train_loss": -7.0116400718688965, "global_step": 171202, "epoch": 4076} {"train_loss": -6.86640739440918, "global_step": 171203, "epoch": 4076} {"train_loss": -7.060749530792236, "global_step": 171204, "epoch": 4076} {"train_loss": -6.992319107055664, "global_step": 171205, "epoch": 4076} {"train_loss": -6.89617919921875, "global_step": 171206, "epoch": 4076} {"train_loss": -6.997725963592529, "global_step": 171207, "epoch": 4076} {"train_loss": -6.954360008239746, "global_step": 171208, "epoch": 4076} {"train_loss": -7.000312805175781, "global_step": 171209, "epoch": 4076} {"train_loss": -6.947723388671875, "global_step": 171210, "epoch": 4076} {"train_loss": -6.8773512840271, "global_step": 171211, "epoch": 4076} {"train_loss": -7.014021873474121, "global_step": 171212, "epoch": 4076} {"train_loss": -6.779128074645996, "global_step": 171213, "epoch": 4076} {"train_loss": -7.030718803405762, "global_step": 171214, "epoch": 4076} {"train_loss": -6.9277520179748535, "global_step": 171215, "epoch": 4076} {"train_loss": -6.916547775268555, "global_step": 171216, "epoch": 4076} {"train_loss": -6.962849140167236, "global_step": 171217, "epoch": 4076} {"train_loss": -6.8900041580200195, "global_step": 171218, "epoch": 4076} {"train_loss": -6.964166641235352, "global_step": 171219, "epoch": 4076} {"train_loss": -6.789675712585449, "global_step": 171220, "epoch": 4076} {"train_loss": -7.032308101654053, "global_step": 171221, "epoch": 4076} {"train_loss": -6.848325252532959, "global_step": 171222, "epoch": 4076} {"train_loss": -6.856025695800781, "global_step": 171223, "epoch": 4076} {"train_loss": -6.926703929901123, "global_step": 171224, "epoch": 4076} {"train_loss": -6.85609245300293, "global_step": 171225, "epoch": 4076} {"train_loss": -6.991316795349121, "global_step": 171226, "epoch": 4076} {"train_loss": -6.7512664794921875, "global_step": 171227, "epoch": 4076} {"train_loss": -6.9956159591674805, "global_step": 171228, "epoch": 4076} {"train_loss": -6.8062744140625, "global_step": 171229, "epoch": 4076} {"train_loss": -6.990300178527832, "global_step": 171230, "epoch": 4076} {"train_loss": -6.848474979400635, "global_step": 171231, "epoch": 4076} {"train_loss": -6.936392784118652, "global_step": 171232, "epoch": 4076} {"train_loss": -6.954160883313134, "global_step": 171233, "epoch": 4076, "val_loss": 69148.0} {"train_loss": -7.057047367095947, "global_step": 171234, "epoch": 4077} {"train_loss": -6.875364303588867, "global_step": 171235, "epoch": 4077} {"train_loss": -7.085766792297363, "global_step": 171236, "epoch": 4077} {"train_loss": -6.956911563873291, "global_step": 171237, "epoch": 4077} {"train_loss": -7.00037145614624, "global_step": 171238, "epoch": 4077} {"train_loss": -7.142027854919434, "global_step": 171239, "epoch": 4077} {"train_loss": -6.965295791625977, "global_step": 171240, "epoch": 4077} {"train_loss": -7.007662296295166, "global_step": 171241, "epoch": 4077} {"train_loss": -6.998076438903809, "global_step": 171242, "epoch": 4077} {"train_loss": -7.095340728759766, "global_step": 171243, "epoch": 4077} {"train_loss": -7.0431671142578125, "global_step": 171244, "epoch": 4077} {"train_loss": -6.957170486450195, "global_step": 171245, "epoch": 4077} {"train_loss": -7.139743804931641, "global_step": 171246, "epoch": 4077} {"train_loss": -7.0292768478393555, "global_step": 171247, "epoch": 4077} {"train_loss": -6.909795761108398, "global_step": 171248, "epoch": 4077} {"train_loss": -6.974390983581543, "global_step": 171249, "epoch": 4077} {"train_loss": -7.072652816772461, "global_step": 171250, "epoch": 4077} {"train_loss": -6.958649635314941, "global_step": 171251, "epoch": 4077} {"train_loss": -7.028662204742432, "global_step": 171252, "epoch": 4077} {"train_loss": -7.039336681365967, "global_step": 171253, "epoch": 4077} {"train_loss": -6.957111358642578, "global_step": 171254, "epoch": 4077} {"train_loss": -7.038152694702148, "global_step": 171255, "epoch": 4077} {"train_loss": -6.9794511795043945, "global_step": 171256, "epoch": 4077} {"train_loss": -7.016211032867432, "global_step": 171257, "epoch": 4077} {"train_loss": -7.1487627029418945, "global_step": 171258, "epoch": 4077} {"train_loss": -7.156174659729004, "global_step": 171259, "epoch": 4077} {"train_loss": -6.897172927856445, "global_step": 171260, "epoch": 4077} {"train_loss": -7.083786964416504, "global_step": 171261, "epoch": 4077} {"train_loss": -7.094132423400879, "global_step": 171262, "epoch": 4077} {"train_loss": -7.049258232116699, "global_step": 171263, "epoch": 4077} {"train_loss": -7.140954971313477, "global_step": 171264, "epoch": 4077} {"train_loss": -7.010333061218262, "global_step": 171265, "epoch": 4077} {"train_loss": -7.110807418823242, "global_step": 171266, "epoch": 4077} {"train_loss": -7.15065860748291, "global_step": 171267, "epoch": 4077} {"train_loss": -7.027842998504639, "global_step": 171268, "epoch": 4077} {"train_loss": -6.99157190322876, "global_step": 171269, "epoch": 4077} {"train_loss": -7.09352970123291, "global_step": 171270, "epoch": 4077} {"train_loss": -7.06071138381958, "global_step": 171271, "epoch": 4077} {"train_loss": -7.075544357299805, "global_step": 171272, "epoch": 4077} {"train_loss": -7.057177543640137, "global_step": 171273, "epoch": 4077} {"train_loss": -7.016166687011719, "global_step": 171274, "epoch": 4077} {"train_loss": -7.036224853424799, "global_step": 171275, "epoch": 4077, "val_loss": 68924.984375} {"train_loss": -6.961635589599609, "global_step": 171276, "epoch": 4078} {"train_loss": -7.038485050201416, "global_step": 171277, "epoch": 4078} {"train_loss": -7.0739898681640625, "global_step": 171278, "epoch": 4078} {"train_loss": -7.084045886993408, "global_step": 171279, "epoch": 4078} {"train_loss": -7.070022106170654, "global_step": 171280, "epoch": 4078} {"train_loss": -7.00546932220459, "global_step": 171281, "epoch": 4078} {"train_loss": -7.112222671508789, "global_step": 171282, "epoch": 4078} {"train_loss": -6.93090295791626, "global_step": 171283, "epoch": 4078} {"train_loss": -7.12489652633667, "global_step": 171284, "epoch": 4078} {"train_loss": -7.188192367553711, "global_step": 171285, "epoch": 4078} {"train_loss": -7.043850898742676, "global_step": 171286, "epoch": 4078} {"train_loss": -7.067354679107666, "global_step": 171287, "epoch": 4078} {"train_loss": -7.109228134155273, "global_step": 171288, "epoch": 4078} {"train_loss": -7.029825210571289, "global_step": 171289, "epoch": 4078} {"train_loss": -7.081648826599121, "global_step": 171290, "epoch": 4078} {"train_loss": -7.013584136962891, "global_step": 171291, "epoch": 4078} {"train_loss": -7.06069278717041, "global_step": 171292, "epoch": 4078} {"train_loss": -6.978964805603027, "global_step": 171293, "epoch": 4078} {"train_loss": -7.15566349029541, "global_step": 171294, "epoch": 4078} {"train_loss": -7.111634254455566, "global_step": 171295, "epoch": 4078} {"train_loss": -7.1413164138793945, "global_step": 171296, "epoch": 4078} {"train_loss": -7.012294769287109, "global_step": 171297, "epoch": 4078} {"train_loss": -7.172236442565918, "global_step": 171298, "epoch": 4078} {"train_loss": -7.158314228057861, "global_step": 171299, "epoch": 4078} {"train_loss": -7.109665393829346, "global_step": 171300, "epoch": 4078} {"train_loss": -7.143110275268555, "global_step": 171301, "epoch": 4078} {"train_loss": -7.055598258972168, "global_step": 171302, "epoch": 4078} {"train_loss": -7.046815872192383, "global_step": 171303, "epoch": 4078} {"train_loss": -7.074980735778809, "global_step": 171304, "epoch": 4078} {"train_loss": -7.128999710083008, "global_step": 171305, "epoch": 4078} {"train_loss": -7.094090461730957, "global_step": 171306, "epoch": 4078} {"train_loss": -7.149104595184326, "global_step": 171307, "epoch": 4078} {"train_loss": -7.107596397399902, "global_step": 171308, "epoch": 4078} {"train_loss": -7.055559158325195, "global_step": 171309, "epoch": 4078} {"train_loss": -7.138935565948486, "global_step": 171310, "epoch": 4078} {"train_loss": -7.083855152130127, "global_step": 171311, "epoch": 4078} {"train_loss": -7.097331523895264, "global_step": 171312, "epoch": 4078} {"train_loss": -7.0123209953308105, "global_step": 171313, "epoch": 4078} {"train_loss": -7.145463943481445, "global_step": 171314, "epoch": 4078} {"train_loss": -7.107514381408691, "global_step": 171315, "epoch": 4078} {"train_loss": -7.044212818145752, "global_step": 171316, "epoch": 4078} {"train_loss": -7.081143084026518, "global_step": 171317, "epoch": 4078, "val_loss": 68973.578125} {"train_loss": -6.999568939208984, "global_step": 171318, "epoch": 4079} {"train_loss": -6.991481781005859, "global_step": 171319, "epoch": 4079} {"train_loss": -6.993090629577637, "global_step": 171320, "epoch": 4079} {"train_loss": -6.8833441734313965, "global_step": 171321, "epoch": 4079} {"train_loss": -7.142755508422852, "global_step": 171322, "epoch": 4079} {"train_loss": -7.079390048980713, "global_step": 171323, "epoch": 4079} {"train_loss": -6.986174583435059, "global_step": 171324, "epoch": 4079} {"train_loss": -7.119398593902588, "global_step": 171325, "epoch": 4079} {"train_loss": -7.001247406005859, "global_step": 171326, "epoch": 4079} {"train_loss": -7.050936222076416, "global_step": 171327, "epoch": 4079} {"train_loss": -7.035789966583252, "global_step": 171328, "epoch": 4079} {"train_loss": -6.935832977294922, "global_step": 171329, "epoch": 4079} {"train_loss": -6.983315467834473, "global_step": 171330, "epoch": 4079} {"train_loss": -7.078051567077637, "global_step": 171331, "epoch": 4079} {"train_loss": -7.009477615356445, "global_step": 171332, "epoch": 4079} {"train_loss": -7.127401351928711, "global_step": 171333, "epoch": 4079} {"train_loss": -6.996994972229004, "global_step": 171334, "epoch": 4079} {"train_loss": -6.944476127624512, "global_step": 171335, "epoch": 4079} {"train_loss": -7.072103977203369, "global_step": 171336, "epoch": 4079} {"train_loss": -6.987646102905273, "global_step": 171337, "epoch": 4079} {"train_loss": -7.070955753326416, "global_step": 171338, "epoch": 4079} {"train_loss": -7.03069543838501, "global_step": 171339, "epoch": 4079} {"train_loss": -7.049571990966797, "global_step": 171340, "epoch": 4079} {"train_loss": -6.999133586883545, "global_step": 171341, "epoch": 4079} {"train_loss": -7.048038005828857, "global_step": 171342, "epoch": 4079} {"train_loss": -7.045384407043457, "global_step": 171343, "epoch": 4079} {"train_loss": -7.14113187789917, "global_step": 171344, "epoch": 4079} {"train_loss": -7.152665138244629, "global_step": 171345, "epoch": 4079} {"train_loss": -7.140476226806641, "global_step": 171346, "epoch": 4079} {"train_loss": -7.0127434730529785, "global_step": 171347, "epoch": 4079} {"train_loss": -7.092424392700195, "global_step": 171348, "epoch": 4079} {"train_loss": -7.013233184814453, "global_step": 171349, "epoch": 4079} {"train_loss": -6.964189529418945, "global_step": 171350, "epoch": 4079} {"train_loss": -7.012415409088135, "global_step": 171351, "epoch": 4079} {"train_loss": -7.1469526290893555, "global_step": 171352, "epoch": 4079} {"train_loss": -7.123213291168213, "global_step": 171353, "epoch": 4079} {"train_loss": -7.088741779327393, "global_step": 171354, "epoch": 4079} {"train_loss": -7.067715644836426, "global_step": 171355, "epoch": 4079} {"train_loss": -7.0339155197143555, "global_step": 171356, "epoch": 4079} {"train_loss": -6.988616466522217, "global_step": 171357, "epoch": 4079} {"train_loss": -7.024580955505371, "global_step": 171358, "epoch": 4079} {"train_loss": -7.040717965080624, "global_step": 171359, "epoch": 4079, "val_loss": 68896.984375} {"train_loss": -7.025305271148682, "global_step": 171360, "epoch": 4080} {"train_loss": -7.007231712341309, "global_step": 171361, "epoch": 4080} {"train_loss": -7.129733085632324, "global_step": 171362, "epoch": 4080} {"train_loss": -7.085862159729004, "global_step": 171363, "epoch": 4080} {"train_loss": -7.033400535583496, "global_step": 171364, "epoch": 4080} {"train_loss": -7.1213555335998535, "global_step": 171365, "epoch": 4080} {"train_loss": -7.128808975219727, "global_step": 171366, "epoch": 4080} {"train_loss": -7.126086235046387, "global_step": 171367, "epoch": 4080} {"train_loss": -7.063718795776367, "global_step": 171368, "epoch": 4080} {"train_loss": -6.9818010330200195, "global_step": 171369, "epoch": 4080} {"train_loss": -7.1219258308410645, "global_step": 171370, "epoch": 4080} {"train_loss": -7.129391670227051, "global_step": 171371, "epoch": 4080} {"train_loss": -7.130239963531494, "global_step": 171372, "epoch": 4080} {"train_loss": -7.0899152755737305, "global_step": 171373, "epoch": 4080} {"train_loss": -7.10592794418335, "global_step": 171374, "epoch": 4080} {"train_loss": -7.008414268493652, "global_step": 171375, "epoch": 4080} {"train_loss": -7.132277488708496, "global_step": 171376, "epoch": 4080} {"train_loss": -6.977479934692383, "global_step": 171377, "epoch": 4080} {"train_loss": -7.204492568969727, "global_step": 171378, "epoch": 4080} {"train_loss": -7.053408622741699, "global_step": 171379, "epoch": 4080} {"train_loss": -6.967074394226074, "global_step": 171380, "epoch": 4080} {"train_loss": -7.11617374420166, "global_step": 171381, "epoch": 4080} {"train_loss": -7.143001079559326, "global_step": 171382, "epoch": 4080} {"train_loss": -7.0283355712890625, "global_step": 171383, "epoch": 4080} {"train_loss": -7.012570381164551, "global_step": 171384, "epoch": 4080} {"train_loss": -7.110856056213379, "global_step": 171385, "epoch": 4080} {"train_loss": -7.193380355834961, "global_step": 171386, "epoch": 4080} {"train_loss": -7.155909538269043, "global_step": 171387, "epoch": 4080} {"train_loss": -7.086365699768066, "global_step": 171388, "epoch": 4080} {"train_loss": -7.071979999542236, "global_step": 171389, "epoch": 4080} {"train_loss": -7.095246315002441, "global_step": 171390, "epoch": 4080} {"train_loss": -6.9941864013671875, "global_step": 171391, "epoch": 4080} {"train_loss": -7.092505931854248, "global_step": 171392, "epoch": 4080} {"train_loss": -7.0727081298828125, "global_step": 171393, "epoch": 4080} {"train_loss": -7.111762046813965, "global_step": 171394, "epoch": 4080} {"train_loss": -7.114376068115234, "global_step": 171395, "epoch": 4080} {"train_loss": -6.9647674560546875, "global_step": 171396, "epoch": 4080} {"train_loss": -7.032050132751465, "global_step": 171397, "epoch": 4080} {"train_loss": -7.0803680419921875, "global_step": 171398, "epoch": 4080} {"train_loss": -6.990958213806152, "global_step": 171399, "epoch": 4080} {"train_loss": -7.018089294433594, "global_step": 171400, "epoch": 4080} {"train_loss": -7.075169472467332, "global_step": 171401, "epoch": 4080, "val_loss": 69160.8984375} {"train_loss": -6.9818525314331055, "global_step": 171402, "epoch": 4081} {"train_loss": -6.952541351318359, "global_step": 171403, "epoch": 4081} {"train_loss": -7.074406147003174, "global_step": 171404, "epoch": 4081} {"train_loss": -6.916038513183594, "global_step": 171405, "epoch": 4081} {"train_loss": -6.98283052444458, "global_step": 171406, "epoch": 4081} {"train_loss": -6.987710952758789, "global_step": 171407, "epoch": 4081} {"train_loss": -6.8903985023498535, "global_step": 171408, "epoch": 4081} {"train_loss": -7.005194664001465, "global_step": 171409, "epoch": 4081} {"train_loss": -6.981398105621338, "global_step": 171410, "epoch": 4081} {"train_loss": -6.9164628982543945, "global_step": 171411, "epoch": 4081} {"train_loss": -6.946690559387207, "global_step": 171412, "epoch": 4081} {"train_loss": -6.901567459106445, "global_step": 171413, "epoch": 4081} {"train_loss": -7.0709404945373535, "global_step": 171414, "epoch": 4081} {"train_loss": -7.061343669891357, "global_step": 171415, "epoch": 4081} {"train_loss": -6.9133501052856445, "global_step": 171416, "epoch": 4081} {"train_loss": -6.951848030090332, "global_step": 171417, "epoch": 4081} {"train_loss": -6.8872175216674805, "global_step": 171418, "epoch": 4081} {"train_loss": -6.988306999206543, "global_step": 171419, "epoch": 4081} {"train_loss": -7.058802604675293, "global_step": 171420, "epoch": 4081} {"train_loss": -7.004698276519775, "global_step": 171421, "epoch": 4081} {"train_loss": -7.100771903991699, "global_step": 171422, "epoch": 4081} {"train_loss": -7.095002174377441, "global_step": 171423, "epoch": 4081} {"train_loss": -6.824700355529785, "global_step": 171424, "epoch": 4081} {"train_loss": -7.042117118835449, "global_step": 171425, "epoch": 4081} {"train_loss": -7.081105709075928, "global_step": 171426, "epoch": 4081} {"train_loss": -6.926698207855225, "global_step": 171427, "epoch": 4081} {"train_loss": -7.1104416847229, "global_step": 171428, "epoch": 4081} {"train_loss": -7.058933734893799, "global_step": 171429, "epoch": 4081} {"train_loss": -7.057399749755859, "global_step": 171430, "epoch": 4081} {"train_loss": -6.970550537109375, "global_step": 171431, "epoch": 4081} {"train_loss": -6.951291561126709, "global_step": 171432, "epoch": 4081} {"train_loss": -7.066019535064697, "global_step": 171433, "epoch": 4081} {"train_loss": -7.069194793701172, "global_step": 171434, "epoch": 4081} {"train_loss": -6.958786964416504, "global_step": 171435, "epoch": 4081} {"train_loss": -7.105091094970703, "global_step": 171436, "epoch": 4081} {"train_loss": -7.044124603271484, "global_step": 171437, "epoch": 4081} {"train_loss": -7.112545013427734, "global_step": 171438, "epoch": 4081} {"train_loss": -7.14965295791626, "global_step": 171439, "epoch": 4081} {"train_loss": -6.971066951751709, "global_step": 171440, "epoch": 4081} {"train_loss": -7.011660575866699, "global_step": 171441, "epoch": 4081} {"train_loss": -7.107061862945557, "global_step": 171442, "epoch": 4081} {"train_loss": -7.0054612046196345, "global_step": 171443, "epoch": 4081, "val_loss": 69028.65625} {"train_loss": -7.00443696975708, "global_step": 171444, "epoch": 4082} {"train_loss": -7.107539653778076, "global_step": 171445, "epoch": 4082} {"train_loss": -7.0845537185668945, "global_step": 171446, "epoch": 4082} {"train_loss": -6.963285446166992, "global_step": 171447, "epoch": 4082} {"train_loss": -7.068253040313721, "global_step": 171448, "epoch": 4082} {"train_loss": -7.096148490905762, "global_step": 171449, "epoch": 4082} {"train_loss": -6.995965003967285, "global_step": 171450, "epoch": 4082} {"train_loss": -7.052867889404297, "global_step": 171451, "epoch": 4082} {"train_loss": -7.035426616668701, "global_step": 171452, "epoch": 4082} {"train_loss": -7.0540771484375, "global_step": 171453, "epoch": 4082} {"train_loss": -6.968844413757324, "global_step": 171454, "epoch": 4082} {"train_loss": -7.013664722442627, "global_step": 171455, "epoch": 4082} {"train_loss": -6.897111892700195, "global_step": 171456, "epoch": 4082} {"train_loss": -6.982424736022949, "global_step": 171457, "epoch": 4082} {"train_loss": -7.035757541656494, "global_step": 171458, "epoch": 4082} {"train_loss": -6.955436706542969, "global_step": 171459, "epoch": 4082} {"train_loss": -6.982515335083008, "global_step": 171460, "epoch": 4082} {"train_loss": -7.038843154907227, "global_step": 171461, "epoch": 4082} {"train_loss": -6.936078071594238, "global_step": 171462, "epoch": 4082} {"train_loss": -7.010746002197266, "global_step": 171463, "epoch": 4082} {"train_loss": -6.892822742462158, "global_step": 171464, "epoch": 4082} {"train_loss": -6.987906455993652, "global_step": 171465, "epoch": 4082} {"train_loss": -7.003721237182617, "global_step": 171466, "epoch": 4082} {"train_loss": -6.878235340118408, "global_step": 171467, "epoch": 4082} {"train_loss": -7.113223552703857, "global_step": 171468, "epoch": 4082} {"train_loss": -6.856450080871582, "global_step": 171469, "epoch": 4082} {"train_loss": -6.923945426940918, "global_step": 171470, "epoch": 4082} {"train_loss": -6.992160320281982, "global_step": 171471, "epoch": 4082} {"train_loss": -6.987299919128418, "global_step": 171472, "epoch": 4082} {"train_loss": -6.948357582092285, "global_step": 171473, "epoch": 4082} {"train_loss": -6.98448371887207, "global_step": 171474, "epoch": 4082} {"train_loss": -6.937503814697266, "global_step": 171475, "epoch": 4082} {"train_loss": -7.019770622253418, "global_step": 171476, "epoch": 4082} {"train_loss": -7.068337440490723, "global_step": 171477, "epoch": 4082} {"train_loss": -7.043024063110352, "global_step": 171478, "epoch": 4082} {"train_loss": -6.983044624328613, "global_step": 171479, "epoch": 4082} {"train_loss": -6.967738151550293, "global_step": 171480, "epoch": 4082} {"train_loss": -7.038822174072266, "global_step": 171481, "epoch": 4082} {"train_loss": -7.020571708679199, "global_step": 171482, "epoch": 4082} {"train_loss": -7.018691062927246, "global_step": 171483, "epoch": 4082} {"train_loss": -7.050734519958496, "global_step": 171484, "epoch": 4082} {"train_loss": -7.001877092179798, "global_step": 171485, "epoch": 4082, "val_loss": 69145.0078125} {"train_loss": -6.9002685546875, "global_step": 171486, "epoch": 4083} {"train_loss": -6.948624610900879, "global_step": 171487, "epoch": 4083} {"train_loss": -7.02287483215332, "global_step": 171488, "epoch": 4083} {"train_loss": -6.9556498527526855, "global_step": 171489, "epoch": 4083} {"train_loss": -7.063939094543457, "global_step": 171490, "epoch": 4083} {"train_loss": -7.046810626983643, "global_step": 171491, "epoch": 4083} {"train_loss": -7.041788101196289, "global_step": 171492, "epoch": 4083} {"train_loss": -6.989670753479004, "global_step": 171493, "epoch": 4083} {"train_loss": -7.0225138664245605, "global_step": 171494, "epoch": 4083} {"train_loss": -7.031949043273926, "global_step": 171495, "epoch": 4083} {"train_loss": -7.156641006469727, "global_step": 171496, "epoch": 4083} {"train_loss": -7.003915786743164, "global_step": 171497, "epoch": 4083} {"train_loss": -6.976326942443848, "global_step": 171498, "epoch": 4083} {"train_loss": -7.0836968421936035, "global_step": 171499, "epoch": 4083} {"train_loss": -6.989441871643066, "global_step": 171500, "epoch": 4083} {"train_loss": -7.0683207511901855, "global_step": 171501, "epoch": 4083} {"train_loss": -7.083835124969482, "global_step": 171502, "epoch": 4083} {"train_loss": -6.952053070068359, "global_step": 171503, "epoch": 4083} {"train_loss": -7.078340530395508, "global_step": 171504, "epoch": 4083} {"train_loss": -6.935113906860352, "global_step": 171505, "epoch": 4083} {"train_loss": -7.000097274780273, "global_step": 171506, "epoch": 4083} {"train_loss": -7.076467514038086, "global_step": 171507, "epoch": 4083} {"train_loss": -7.051352024078369, "global_step": 171508, "epoch": 4083} {"train_loss": -6.9640212059021, "global_step": 171509, "epoch": 4083} {"train_loss": -7.113440036773682, "global_step": 171510, "epoch": 4083} {"train_loss": -6.9366631507873535, "global_step": 171511, "epoch": 4083} {"train_loss": -7.110675811767578, "global_step": 171512, "epoch": 4083} {"train_loss": -7.084806442260742, "global_step": 171513, "epoch": 4083} {"train_loss": -7.095563888549805, "global_step": 171514, "epoch": 4083} {"train_loss": -7.033262252807617, "global_step": 171515, "epoch": 4083} {"train_loss": -7.051003932952881, "global_step": 171516, "epoch": 4083} {"train_loss": -7.096562385559082, "global_step": 171517, "epoch": 4083} {"train_loss": -7.115966320037842, "global_step": 171518, "epoch": 4083} {"train_loss": -7.045564651489258, "global_step": 171519, "epoch": 4083} {"train_loss": -7.056652545928955, "global_step": 171520, "epoch": 4083} {"train_loss": -7.127778053283691, "global_step": 171521, "epoch": 4083} {"train_loss": -7.146589279174805, "global_step": 171522, "epoch": 4083} {"train_loss": -7.128592014312744, "global_step": 171523, "epoch": 4083} {"train_loss": -7.094872951507568, "global_step": 171524, "epoch": 4083} {"train_loss": -7.057339191436768, "global_step": 171525, "epoch": 4083} {"train_loss": -7.1242475509643555, "global_step": 171526, "epoch": 4083} {"train_loss": -7.047561656861078, "global_step": 171527, "epoch": 4083, "val_loss": 68983.484375} {"train_loss": -7.16534423828125, "global_step": 171528, "epoch": 4084} {"train_loss": -7.192546367645264, "global_step": 171529, "epoch": 4084} {"train_loss": -7.155513763427734, "global_step": 171530, "epoch": 4084} {"train_loss": -6.870326042175293, "global_step": 171531, "epoch": 4084} {"train_loss": -7.140345573425293, "global_step": 171532, "epoch": 4084} {"train_loss": -7.070093154907227, "global_step": 171533, "epoch": 4084} {"train_loss": -7.069058418273926, "global_step": 171534, "epoch": 4084} {"train_loss": -7.118616580963135, "global_step": 171535, "epoch": 4084} {"train_loss": -7.04817533493042, "global_step": 171536, "epoch": 4084} {"train_loss": -7.017345428466797, "global_step": 171537, "epoch": 4084} {"train_loss": -7.182652473449707, "global_step": 171538, "epoch": 4084} {"train_loss": -7.117940902709961, "global_step": 171539, "epoch": 4084} {"train_loss": -7.011097431182861, "global_step": 171540, "epoch": 4084} {"train_loss": -7.076414108276367, "global_step": 171541, "epoch": 4084} {"train_loss": -6.951061248779297, "global_step": 171542, "epoch": 4084} {"train_loss": -7.124761581420898, "global_step": 171543, "epoch": 4084} {"train_loss": -6.978946685791016, "global_step": 171544, "epoch": 4084} {"train_loss": -7.027415752410889, "global_step": 171545, "epoch": 4084} {"train_loss": -7.1966447830200195, "global_step": 171546, "epoch": 4084} {"train_loss": -7.092243194580078, "global_step": 171547, "epoch": 4084} {"train_loss": -7.075532913208008, "global_step": 171548, "epoch": 4084} {"train_loss": -6.976379871368408, "global_step": 171549, "epoch": 4084} {"train_loss": -6.907684803009033, "global_step": 171550, "epoch": 4084} {"train_loss": -7.028578281402588, "global_step": 171551, "epoch": 4084} {"train_loss": -7.133907318115234, "global_step": 171552, "epoch": 4084} {"train_loss": -6.937336444854736, "global_step": 171553, "epoch": 4084} {"train_loss": -7.08795166015625, "global_step": 171554, "epoch": 4084} {"train_loss": -6.908834457397461, "global_step": 171555, "epoch": 4084} {"train_loss": -7.07968807220459, "global_step": 171556, "epoch": 4084} {"train_loss": -6.989436149597168, "global_step": 171557, "epoch": 4084} {"train_loss": -6.966238021850586, "global_step": 171558, "epoch": 4084} {"train_loss": -7.122723579406738, "global_step": 171559, "epoch": 4084} {"train_loss": -6.8794450759887695, "global_step": 171560, "epoch": 4084} {"train_loss": -7.019242286682129, "global_step": 171561, "epoch": 4084} {"train_loss": -7.022348880767822, "global_step": 171562, "epoch": 4084} {"train_loss": -6.917585372924805, "global_step": 171563, "epoch": 4084} {"train_loss": -7.0427470207214355, "global_step": 171564, "epoch": 4084} {"train_loss": -6.885792255401611, "global_step": 171565, "epoch": 4084} {"train_loss": -7.0442304611206055, "global_step": 171566, "epoch": 4084} {"train_loss": -6.891772270202637, "global_step": 171567, "epoch": 4084} {"train_loss": -6.988334655761719, "global_step": 171568, "epoch": 4084} {"train_loss": -7.036935908453805, "global_step": 171569, "epoch": 4084, "val_loss": 69052.171875} {"train_loss": -6.808753967285156, "global_step": 171570, "epoch": 4085} {"train_loss": -6.834688186645508, "global_step": 171571, "epoch": 4085} {"train_loss": -6.966888427734375, "global_step": 171572, "epoch": 4085} {"train_loss": -6.828412055969238, "global_step": 171573, "epoch": 4085} {"train_loss": -6.991876602172852, "global_step": 171574, "epoch": 4085} {"train_loss": -6.9784626960754395, "global_step": 171575, "epoch": 4085} {"train_loss": -6.961304664611816, "global_step": 171576, "epoch": 4085} {"train_loss": -6.99875545501709, "global_step": 171577, "epoch": 4085} {"train_loss": -7.054009914398193, "global_step": 171578, "epoch": 4085} {"train_loss": -6.877881050109863, "global_step": 171579, "epoch": 4085} {"train_loss": -6.935912132263184, "global_step": 171580, "epoch": 4085} {"train_loss": -7.077686786651611, "global_step": 171581, "epoch": 4085} {"train_loss": -7.114928245544434, "global_step": 171582, "epoch": 4085} {"train_loss": -7.0251946449279785, "global_step": 171583, "epoch": 4085} {"train_loss": -6.929110050201416, "global_step": 171584, "epoch": 4085} {"train_loss": -7.031721115112305, "global_step": 171585, "epoch": 4085} {"train_loss": -6.874347686767578, "global_step": 171586, "epoch": 4085} {"train_loss": -6.938827991485596, "global_step": 171587, "epoch": 4085} {"train_loss": -6.965851783752441, "global_step": 171588, "epoch": 4085} {"train_loss": -7.06370210647583, "global_step": 171589, "epoch": 4085} {"train_loss": -6.942453384399414, "global_step": 171590, "epoch": 4085} {"train_loss": -6.879429817199707, "global_step": 171591, "epoch": 4085} {"train_loss": -7.011775970458984, "global_step": 171592, "epoch": 4085} {"train_loss": -6.944580078125, "global_step": 171593, "epoch": 4085} {"train_loss": -7.195470809936523, "global_step": 171594, "epoch": 4085} {"train_loss": -6.883172035217285, "global_step": 171595, "epoch": 4085} {"train_loss": -6.894033908843994, "global_step": 171596, "epoch": 4085} {"train_loss": -7.005858421325684, "global_step": 171597, "epoch": 4085} {"train_loss": -6.80372953414917, "global_step": 171598, "epoch": 4085} {"train_loss": -7.003127098083496, "global_step": 171599, "epoch": 4085} {"train_loss": -6.904486656188965, "global_step": 171600, "epoch": 4085} {"train_loss": -6.860292434692383, "global_step": 171601, "epoch": 4085} {"train_loss": -6.987972259521484, "global_step": 171602, "epoch": 4085} {"train_loss": -6.9237565994262695, "global_step": 171603, "epoch": 4085} {"train_loss": -7.035100936889648, "global_step": 171604, "epoch": 4085} {"train_loss": -7.069332599639893, "global_step": 171605, "epoch": 4085} {"train_loss": -6.959271430969238, "global_step": 171606, "epoch": 4085} {"train_loss": -6.980764389038086, "global_step": 171607, "epoch": 4085} {"train_loss": -7.053286552429199, "global_step": 171608, "epoch": 4085} {"train_loss": -7.017819404602051, "global_step": 171609, "epoch": 4085} {"train_loss": -6.866490364074707, "global_step": 171610, "epoch": 4085} {"train_loss": -6.963293279920306, "global_step": 171611, "epoch": 4085, "val_loss": 69080.203125} {"train_loss": -6.936698913574219, "global_step": 171612, "epoch": 4086} {"train_loss": -7.080126762390137, "global_step": 171613, "epoch": 4086} {"train_loss": -6.951122283935547, "global_step": 171614, "epoch": 4086} {"train_loss": -6.9218430519104, "global_step": 171615, "epoch": 4086} {"train_loss": -7.019352912902832, "global_step": 171616, "epoch": 4086} {"train_loss": -7.104684829711914, "global_step": 171617, "epoch": 4086} {"train_loss": -7.007084846496582, "global_step": 171618, "epoch": 4086} {"train_loss": -6.972406387329102, "global_step": 171619, "epoch": 4086} {"train_loss": -7.035778999328613, "global_step": 171620, "epoch": 4086} {"train_loss": -7.035024166107178, "global_step": 171621, "epoch": 4086} {"train_loss": -7.114744663238525, "global_step": 171622, "epoch": 4086} {"train_loss": -6.992396354675293, "global_step": 171623, "epoch": 4086} {"train_loss": -7.075672626495361, "global_step": 171624, "epoch": 4086} {"train_loss": -7.031219482421875, "global_step": 171625, "epoch": 4086} {"train_loss": -7.093268394470215, "global_step": 171626, "epoch": 4086} {"train_loss": -6.97128438949585, "global_step": 171627, "epoch": 4086} {"train_loss": -6.944077014923096, "global_step": 171628, "epoch": 4086} {"train_loss": -6.974179267883301, "global_step": 171629, "epoch": 4086} {"train_loss": -7.019247055053711, "global_step": 171630, "epoch": 4086} {"train_loss": -7.109736919403076, "global_step": 171631, "epoch": 4086} {"train_loss": -6.998683929443359, "global_step": 171632, "epoch": 4086} {"train_loss": -7.079695701599121, "global_step": 171633, "epoch": 4086} {"train_loss": -7.021936893463135, "global_step": 171634, "epoch": 4086} {"train_loss": -7.066576957702637, "global_step": 171635, "epoch": 4086} {"train_loss": -7.082300662994385, "global_step": 171636, "epoch": 4086} {"train_loss": -6.929713249206543, "global_step": 171637, "epoch": 4086} {"train_loss": -7.073328495025635, "global_step": 171638, "epoch": 4086} {"train_loss": -7.058865547180176, "global_step": 171639, "epoch": 4086} {"train_loss": -6.944276332855225, "global_step": 171640, "epoch": 4086} {"train_loss": -7.019717216491699, "global_step": 171641, "epoch": 4086} {"train_loss": -7.000619888305664, "global_step": 171642, "epoch": 4086} {"train_loss": -6.941314697265625, "global_step": 171643, "epoch": 4086} {"train_loss": -6.965095520019531, "global_step": 171644, "epoch": 4086} {"train_loss": -6.87894344329834, "global_step": 171645, "epoch": 4086} {"train_loss": -7.067791938781738, "global_step": 171646, "epoch": 4086} {"train_loss": -7.013160705566406, "global_step": 171647, "epoch": 4086} {"train_loss": -6.996801853179932, "global_step": 171648, "epoch": 4086} {"train_loss": -7.0269269943237305, "global_step": 171649, "epoch": 4086} {"train_loss": -7.026481628417969, "global_step": 171650, "epoch": 4086} {"train_loss": -6.853353977203369, "global_step": 171651, "epoch": 4086} {"train_loss": -7.017417907714844, "global_step": 171652, "epoch": 4086} {"train_loss": -7.007274468739827, "global_step": 171653, "epoch": 4086, "val_loss": 69071.375} {"train_loss": -6.819576263427734, "global_step": 171654, "epoch": 4087} {"train_loss": -7.060126781463623, "global_step": 171655, "epoch": 4087} {"train_loss": -6.837663650512695, "global_step": 171656, "epoch": 4087} {"train_loss": -7.081281661987305, "global_step": 171657, "epoch": 4087} {"train_loss": -7.027976036071777, "global_step": 171658, "epoch": 4087} {"train_loss": -6.900246620178223, "global_step": 171659, "epoch": 4087} {"train_loss": -6.849143028259277, "global_step": 171660, "epoch": 4087} {"train_loss": -6.93429708480835, "global_step": 171661, "epoch": 4087} {"train_loss": -6.929450035095215, "global_step": 171662, "epoch": 4087} {"train_loss": -7.0897321701049805, "global_step": 171663, "epoch": 4087} {"train_loss": -6.829761028289795, "global_step": 171664, "epoch": 4087} {"train_loss": -6.985084533691406, "global_step": 171665, "epoch": 4087} {"train_loss": -7.078874588012695, "global_step": 171666, "epoch": 4087} {"train_loss": -7.102450370788574, "global_step": 171667, "epoch": 4087} {"train_loss": -7.003574371337891, "global_step": 171668, "epoch": 4087} {"train_loss": -7.10862398147583, "global_step": 171669, "epoch": 4087} {"train_loss": -6.975676536560059, "global_step": 171670, "epoch": 4087} {"train_loss": -7.1471757888793945, "global_step": 171671, "epoch": 4087} {"train_loss": -7.058737754821777, "global_step": 171672, "epoch": 4087} {"train_loss": -7.0574188232421875, "global_step": 171673, "epoch": 4087} {"train_loss": -7.04408073425293, "global_step": 171674, "epoch": 4087} {"train_loss": -7.018916130065918, "global_step": 171675, "epoch": 4087} {"train_loss": -7.015554428100586, "global_step": 171676, "epoch": 4087} {"train_loss": -7.149658679962158, "global_step": 171677, "epoch": 4087} {"train_loss": -7.0713348388671875, "global_step": 171678, "epoch": 4087} {"train_loss": -7.02855920791626, "global_step": 171679, "epoch": 4087} {"train_loss": -7.000362396240234, "global_step": 171680, "epoch": 4087} {"train_loss": -6.986331939697266, "global_step": 171681, "epoch": 4087} {"train_loss": -7.071523666381836, "global_step": 171682, "epoch": 4087} {"train_loss": -7.101477146148682, "global_step": 171683, "epoch": 4087} {"train_loss": -6.951107978820801, "global_step": 171684, "epoch": 4087} {"train_loss": -6.984264373779297, "global_step": 171685, "epoch": 4087} {"train_loss": -6.989025592803955, "global_step": 171686, "epoch": 4087} {"train_loss": -7.108150482177734, "global_step": 171687, "epoch": 4087} {"train_loss": -6.922131538391113, "global_step": 171688, "epoch": 4087} {"train_loss": -6.936999797821045, "global_step": 171689, "epoch": 4087} {"train_loss": -6.896517753601074, "global_step": 171690, "epoch": 4087} {"train_loss": -6.890769004821777, "global_step": 171691, "epoch": 4087} {"train_loss": -7.091955184936523, "global_step": 171692, "epoch": 4087} {"train_loss": -6.85266637802124, "global_step": 171693, "epoch": 4087} {"train_loss": -7.002172470092773, "global_step": 171694, "epoch": 4087} {"train_loss": -6.999485515412831, "global_step": 171695, "epoch": 4087, "val_loss": 68974.171875} {"train_loss": -6.8376922607421875, "global_step": 171696, "epoch": 4088} {"train_loss": -6.96436882019043, "global_step": 171697, "epoch": 4088} {"train_loss": -7.063656806945801, "global_step": 171698, "epoch": 4088} {"train_loss": -6.915289878845215, "global_step": 171699, "epoch": 4088} {"train_loss": -7.102200984954834, "global_step": 171700, "epoch": 4088} {"train_loss": -6.91650390625, "global_step": 171701, "epoch": 4088} {"train_loss": -6.987858295440674, "global_step": 171702, "epoch": 4088} {"train_loss": -7.078981876373291, "global_step": 171703, "epoch": 4088} {"train_loss": -7.120375633239746, "global_step": 171704, "epoch": 4088} {"train_loss": -6.991024494171143, "global_step": 171705, "epoch": 4088} {"train_loss": -7.006959438323975, "global_step": 171706, "epoch": 4088} {"train_loss": -7.070817947387695, "global_step": 171707, "epoch": 4088} {"train_loss": -7.058041095733643, "global_step": 171708, "epoch": 4088} {"train_loss": -6.963849067687988, "global_step": 171709, "epoch": 4088} {"train_loss": -7.057412147521973, "global_step": 171710, "epoch": 4088} {"train_loss": -7.042436122894287, "global_step": 171711, "epoch": 4088} {"train_loss": -7.085002899169922, "global_step": 171712, "epoch": 4088} {"train_loss": -6.897059440612793, "global_step": 171713, "epoch": 4088} {"train_loss": -7.054078578948975, "global_step": 171714, "epoch": 4088} {"train_loss": -7.0221967697143555, "global_step": 171715, "epoch": 4088} {"train_loss": -7.111457824707031, "global_step": 171716, "epoch": 4088} {"train_loss": -6.9532341957092285, "global_step": 171717, "epoch": 4088} {"train_loss": -7.112804889678955, "global_step": 171718, "epoch": 4088} {"train_loss": -6.977376937866211, "global_step": 171719, "epoch": 4088} {"train_loss": -6.92342472076416, "global_step": 171720, "epoch": 4088} {"train_loss": -7.026849746704102, "global_step": 171721, "epoch": 4088} {"train_loss": -6.955624580383301, "global_step": 171722, "epoch": 4088} {"train_loss": -7.058568000793457, "global_step": 171723, "epoch": 4088} {"train_loss": -6.974244117736816, "global_step": 171724, "epoch": 4088} {"train_loss": -7.047345161437988, "global_step": 171725, "epoch": 4088} {"train_loss": -7.010380744934082, "global_step": 171726, "epoch": 4088} {"train_loss": -7.063343048095703, "global_step": 171727, "epoch": 4088} {"train_loss": -7.033799648284912, "global_step": 171728, "epoch": 4088} {"train_loss": -7.022111892700195, "global_step": 171729, "epoch": 4088} {"train_loss": -7.154406547546387, "global_step": 171730, "epoch": 4088} {"train_loss": -6.995059967041016, "global_step": 171731, "epoch": 4088} {"train_loss": -7.047384262084961, "global_step": 171732, "epoch": 4088} {"train_loss": -7.055088996887207, "global_step": 171733, "epoch": 4088} {"train_loss": -7.104480743408203, "global_step": 171734, "epoch": 4088} {"train_loss": -6.968092918395996, "global_step": 171735, "epoch": 4088} {"train_loss": -7.1364641189575195, "global_step": 171736, "epoch": 4088} {"train_loss": -7.0275537967681885, "global_step": 171737, "epoch": 4088, "val_loss": 68953.5625} {"train_loss": -7.09415864944458, "global_step": 171738, "epoch": 4089} {"train_loss": -7.20911169052124, "global_step": 171739, "epoch": 4089} {"train_loss": -7.104457855224609, "global_step": 171740, "epoch": 4089} {"train_loss": -7.160976886749268, "global_step": 171741, "epoch": 4089} {"train_loss": -7.161243438720703, "global_step": 171742, "epoch": 4089} {"train_loss": -7.1208295822143555, "global_step": 171743, "epoch": 4089} {"train_loss": -7.127223014831543, "global_step": 171744, "epoch": 4089} {"train_loss": -7.118840217590332, "global_step": 171745, "epoch": 4089} {"train_loss": -7.045722484588623, "global_step": 171746, "epoch": 4089} {"train_loss": -7.1063361167907715, "global_step": 171747, "epoch": 4089} {"train_loss": -7.186960697174072, "global_step": 171748, "epoch": 4089} {"train_loss": -7.140488624572754, "global_step": 171749, "epoch": 4089} {"train_loss": -7.034946918487549, "global_step": 171750, "epoch": 4089} {"train_loss": -7.06353235244751, "global_step": 171751, "epoch": 4089} {"train_loss": -7.173537254333496, "global_step": 171752, "epoch": 4089} {"train_loss": -7.113002777099609, "global_step": 171753, "epoch": 4089} {"train_loss": -7.098694324493408, "global_step": 171754, "epoch": 4089} {"train_loss": -7.060218334197998, "global_step": 171755, "epoch": 4089} {"train_loss": -7.008932113647461, "global_step": 171756, "epoch": 4089} {"train_loss": -7.2320098876953125, "global_step": 171757, "epoch": 4089} {"train_loss": -7.180763244628906, "global_step": 171758, "epoch": 4089} {"train_loss": -7.212652206420898, "global_step": 171759, "epoch": 4089} {"train_loss": -7.138689994812012, "global_step": 171760, "epoch": 4089} {"train_loss": -7.028521537780762, "global_step": 171761, "epoch": 4089} {"train_loss": -7.0529046058654785, "global_step": 171762, "epoch": 4089} {"train_loss": -7.066682815551758, "global_step": 171763, "epoch": 4089} {"train_loss": -7.071500778198242, "global_step": 171764, "epoch": 4089} {"train_loss": -7.0736002922058105, "global_step": 171765, "epoch": 4089} {"train_loss": -7.1854095458984375, "global_step": 171766, "epoch": 4089} {"train_loss": -7.098541259765625, "global_step": 171767, "epoch": 4089} {"train_loss": -7.059760093688965, "global_step": 171768, "epoch": 4089} {"train_loss": -7.148708343505859, "global_step": 171769, "epoch": 4089} {"train_loss": -7.073057174682617, "global_step": 171770, "epoch": 4089} {"train_loss": -7.082313060760498, "global_step": 171771, "epoch": 4089} {"train_loss": -7.003671646118164, "global_step": 171772, "epoch": 4089} {"train_loss": -7.0242695808410645, "global_step": 171773, "epoch": 4089} {"train_loss": -7.112311363220215, "global_step": 171774, "epoch": 4089} {"train_loss": -6.989099979400635, "global_step": 171775, "epoch": 4089} {"train_loss": -7.09413480758667, "global_step": 171776, "epoch": 4089} {"train_loss": -6.979953289031982, "global_step": 171777, "epoch": 4089} {"train_loss": -7.141655921936035, "global_step": 171778, "epoch": 4089} {"train_loss": -7.103813398452032, "global_step": 171779, "epoch": 4089, "val_loss": 68930.2578125} {"train_loss": -7.042223930358887, "global_step": 171780, "epoch": 4090} {"train_loss": -7.129588603973389, "global_step": 171781, "epoch": 4090} {"train_loss": -7.209578037261963, "global_step": 171782, "epoch": 4090} {"train_loss": -7.08551025390625, "global_step": 171783, "epoch": 4090} {"train_loss": -7.105254173278809, "global_step": 171784, "epoch": 4090} {"train_loss": -7.135345458984375, "global_step": 171785, "epoch": 4090} {"train_loss": -7.072965145111084, "global_step": 171786, "epoch": 4090} {"train_loss": -7.08327579498291, "global_step": 171787, "epoch": 4090} {"train_loss": -7.035730838775635, "global_step": 171788, "epoch": 4090} {"train_loss": -7.180051803588867, "global_step": 171789, "epoch": 4090} {"train_loss": -7.113367080688477, "global_step": 171790, "epoch": 4090} {"train_loss": -7.100704193115234, "global_step": 171791, "epoch": 4090} {"train_loss": -7.046997547149658, "global_step": 171792, "epoch": 4090} {"train_loss": -7.080832481384277, "global_step": 171793, "epoch": 4090} {"train_loss": -6.957278251647949, "global_step": 171794, "epoch": 4090} {"train_loss": -6.956875801086426, "global_step": 171795, "epoch": 4090} {"train_loss": -7.118579387664795, "global_step": 171796, "epoch": 4090} {"train_loss": -7.005765914916992, "global_step": 171797, "epoch": 4090} {"train_loss": -6.954239845275879, "global_step": 171798, "epoch": 4090} {"train_loss": -6.960540771484375, "global_step": 171799, "epoch": 4090} {"train_loss": -7.180664539337158, "global_step": 171800, "epoch": 4090} {"train_loss": -7.074450969696045, "global_step": 171801, "epoch": 4090} {"train_loss": -7.130430221557617, "global_step": 171802, "epoch": 4090} {"train_loss": -7.169948101043701, "global_step": 171803, "epoch": 4090} {"train_loss": -7.024321556091309, "global_step": 171804, "epoch": 4090} {"train_loss": -6.916533946990967, "global_step": 171805, "epoch": 4090} {"train_loss": -7.052348613739014, "global_step": 171806, "epoch": 4090} {"train_loss": -7.0138044357299805, "global_step": 171807, "epoch": 4090} {"train_loss": -6.989789962768555, "global_step": 171808, "epoch": 4090} {"train_loss": -7.04832649230957, "global_step": 171809, "epoch": 4090} {"train_loss": -7.065906524658203, "global_step": 171810, "epoch": 4090} {"train_loss": -7.067285537719727, "global_step": 171811, "epoch": 4090} {"train_loss": -7.13521146774292, "global_step": 171812, "epoch": 4090} {"train_loss": -7.081040382385254, "global_step": 171813, "epoch": 4090} {"train_loss": -7.072501182556152, "global_step": 171814, "epoch": 4090} {"train_loss": -7.092513084411621, "global_step": 171815, "epoch": 4090} {"train_loss": -7.022022247314453, "global_step": 171816, "epoch": 4090} {"train_loss": -7.025651931762695, "global_step": 171817, "epoch": 4090} {"train_loss": -7.0682759284973145, "global_step": 171818, "epoch": 4090} {"train_loss": -6.990893363952637, "global_step": 171819, "epoch": 4090} {"train_loss": -7.015526294708252, "global_step": 171820, "epoch": 4090} {"train_loss": -7.062014636539278, "global_step": 171821, "epoch": 4090, "val_loss": 68796.328125} {"train_loss": -7.205381393432617, "global_step": 171822, "epoch": 4091} {"train_loss": -7.066366672515869, "global_step": 171823, "epoch": 4091} {"train_loss": -6.869160175323486, "global_step": 171824, "epoch": 4091} {"train_loss": -6.896917819976807, "global_step": 171825, "epoch": 4091} {"train_loss": -7.0772271156311035, "global_step": 171826, "epoch": 4091} {"train_loss": -6.946164131164551, "global_step": 171827, "epoch": 4091} {"train_loss": -6.892297744750977, "global_step": 171828, "epoch": 4091} {"train_loss": -7.046018600463867, "global_step": 171829, "epoch": 4091} {"train_loss": -6.912899971008301, "global_step": 171830, "epoch": 4091} {"train_loss": -7.017816066741943, "global_step": 171831, "epoch": 4091} {"train_loss": -7.008232116699219, "global_step": 171832, "epoch": 4091} {"train_loss": -7.091446876525879, "global_step": 171833, "epoch": 4091} {"train_loss": -7.073221206665039, "global_step": 171834, "epoch": 4091} {"train_loss": -6.945065498352051, "global_step": 171835, "epoch": 4091} {"train_loss": -7.019067287445068, "global_step": 171836, "epoch": 4091} {"train_loss": -7.046999931335449, "global_step": 171837, "epoch": 4091} {"train_loss": -6.997763156890869, "global_step": 171838, "epoch": 4091} {"train_loss": -6.931778907775879, "global_step": 171839, "epoch": 4091} {"train_loss": -6.828754425048828, "global_step": 171840, "epoch": 4091} {"train_loss": -7.076127529144287, "global_step": 171841, "epoch": 4091} {"train_loss": -6.827178478240967, "global_step": 171842, "epoch": 4091} {"train_loss": -6.989551067352295, "global_step": 171843, "epoch": 4091} {"train_loss": -6.952116012573242, "global_step": 171844, "epoch": 4091} {"train_loss": -6.989416122436523, "global_step": 171845, "epoch": 4091} {"train_loss": -6.928414344787598, "global_step": 171846, "epoch": 4091} {"train_loss": -6.930788040161133, "global_step": 171847, "epoch": 4091} {"train_loss": -6.985771179199219, "global_step": 171848, "epoch": 4091} {"train_loss": -6.8961076736450195, "global_step": 171849, "epoch": 4091} {"train_loss": -7.112526893615723, "global_step": 171850, "epoch": 4091} {"train_loss": -6.949998378753662, "global_step": 171851, "epoch": 4091} {"train_loss": -7.076874732971191, "global_step": 171852, "epoch": 4091} {"train_loss": -6.885697841644287, "global_step": 171853, "epoch": 4091} {"train_loss": -7.0576324462890625, "global_step": 171854, "epoch": 4091} {"train_loss": -7.026049613952637, "global_step": 171855, "epoch": 4091} {"train_loss": -6.884529113769531, "global_step": 171856, "epoch": 4091} {"train_loss": -6.876136779785156, "global_step": 171857, "epoch": 4091} {"train_loss": -6.922677993774414, "global_step": 171858, "epoch": 4091} {"train_loss": -7.059293270111084, "global_step": 171859, "epoch": 4091} {"train_loss": -6.82789421081543, "global_step": 171860, "epoch": 4091} {"train_loss": -7.028680801391602, "global_step": 171861, "epoch": 4091} {"train_loss": -6.98322057723999, "global_step": 171862, "epoch": 4091} {"train_loss": -6.979496819632394, "global_step": 171863, "epoch": 4091, "val_loss": 69125.4453125} {"train_loss": -6.987481117248535, "global_step": 171864, "epoch": 4092} {"train_loss": -7.041982650756836, "global_step": 171865, "epoch": 4092} {"train_loss": -7.057924747467041, "global_step": 171866, "epoch": 4092} {"train_loss": -7.0111470222473145, "global_step": 171867, "epoch": 4092} {"train_loss": -7.035789489746094, "global_step": 171868, "epoch": 4092} {"train_loss": -6.8953328132629395, "global_step": 171869, "epoch": 4092} {"train_loss": -6.992044448852539, "global_step": 171870, "epoch": 4092} {"train_loss": -6.907947540283203, "global_step": 171871, "epoch": 4092} {"train_loss": -7.035205364227295, "global_step": 171872, "epoch": 4092} {"train_loss": -7.00247049331665, "global_step": 171873, "epoch": 4092} {"train_loss": -6.985129356384277, "global_step": 171874, "epoch": 4092} {"train_loss": -6.96146297454834, "global_step": 171875, "epoch": 4092} {"train_loss": -6.9633026123046875, "global_step": 171876, "epoch": 4092} {"train_loss": -6.9859514236450195, "global_step": 171877, "epoch": 4092} {"train_loss": -6.928638458251953, "global_step": 171878, "epoch": 4092} {"train_loss": -6.986173629760742, "global_step": 171879, "epoch": 4092} {"train_loss": -6.924569606781006, "global_step": 171880, "epoch": 4092} {"train_loss": -6.999960422515869, "global_step": 171881, "epoch": 4092} {"train_loss": -7.013118267059326, "global_step": 171882, "epoch": 4092} {"train_loss": -7.014864921569824, "global_step": 171883, "epoch": 4092} {"train_loss": -6.889471054077148, "global_step": 171884, "epoch": 4092} {"train_loss": -6.885447978973389, "global_step": 171885, "epoch": 4092} {"train_loss": -6.939509868621826, "global_step": 171886, "epoch": 4092} {"train_loss": -6.933582305908203, "global_step": 171887, "epoch": 4092} {"train_loss": -6.845789909362793, "global_step": 171888, "epoch": 4092} {"train_loss": -7.001214027404785, "global_step": 171889, "epoch": 4092} {"train_loss": -7.023637771606445, "global_step": 171890, "epoch": 4092} {"train_loss": -7.022019863128662, "global_step": 171891, "epoch": 4092} {"train_loss": -7.0346527099609375, "global_step": 171892, "epoch": 4092} {"train_loss": -7.042423248291016, "global_step": 171893, "epoch": 4092} {"train_loss": -7.061234474182129, "global_step": 171894, "epoch": 4092} {"train_loss": -7.104976654052734, "global_step": 171895, "epoch": 4092} {"train_loss": -6.97619104385376, "global_step": 171896, "epoch": 4092} {"train_loss": -7.015327453613281, "global_step": 171897, "epoch": 4092} {"train_loss": -7.152371406555176, "global_step": 171898, "epoch": 4092} {"train_loss": -7.0074639320373535, "global_step": 171899, "epoch": 4092} {"train_loss": -6.915858268737793, "global_step": 171900, "epoch": 4092} {"train_loss": -7.0216217041015625, "global_step": 171901, "epoch": 4092} {"train_loss": -7.10322380065918, "global_step": 171902, "epoch": 4092} {"train_loss": -7.097004413604736, "global_step": 171903, "epoch": 4092} {"train_loss": -7.044445991516113, "global_step": 171904, "epoch": 4092} {"train_loss": -6.997944434483846, "global_step": 171905, "epoch": 4092, "val_loss": 69007.03125} {"train_loss": -7.080781936645508, "global_step": 171906, "epoch": 4093} {"train_loss": -7.010965347290039, "global_step": 171907, "epoch": 4093} {"train_loss": -7.1495819091796875, "global_step": 171908, "epoch": 4093} {"train_loss": -7.199131965637207, "global_step": 171909, "epoch": 4093} {"train_loss": -7.067221641540527, "global_step": 171910, "epoch": 4093} {"train_loss": -7.13682746887207, "global_step": 171911, "epoch": 4093} {"train_loss": -7.087551116943359, "global_step": 171912, "epoch": 4093} {"train_loss": -7.012792587280273, "global_step": 171913, "epoch": 4093} {"train_loss": -7.1466474533081055, "global_step": 171914, "epoch": 4093} {"train_loss": -7.098968505859375, "global_step": 171915, "epoch": 4093} {"train_loss": -7.031278610229492, "global_step": 171916, "epoch": 4093} {"train_loss": -7.200965881347656, "global_step": 171917, "epoch": 4093} {"train_loss": -7.118937015533447, "global_step": 171918, "epoch": 4093} {"train_loss": -7.000341892242432, "global_step": 171919, "epoch": 4093} {"train_loss": -7.140418529510498, "global_step": 171920, "epoch": 4093} {"train_loss": -7.089849472045898, "global_step": 171921, "epoch": 4093} {"train_loss": -7.03956937789917, "global_step": 171922, "epoch": 4093} {"train_loss": -7.043159484863281, "global_step": 171923, "epoch": 4093} {"train_loss": -7.104231834411621, "global_step": 171924, "epoch": 4093} {"train_loss": -7.00776481628418, "global_step": 171925, "epoch": 4093} {"train_loss": -7.017268180847168, "global_step": 171926, "epoch": 4093} {"train_loss": -7.049046516418457, "global_step": 171927, "epoch": 4093} {"train_loss": -7.08488655090332, "global_step": 171928, "epoch": 4093} {"train_loss": -7.008955478668213, "global_step": 171929, "epoch": 4093} {"train_loss": -7.090314865112305, "global_step": 171930, "epoch": 4093} {"train_loss": -6.974753379821777, "global_step": 171931, "epoch": 4093} {"train_loss": -6.9609575271606445, "global_step": 171932, "epoch": 4093} {"train_loss": -7.050760269165039, "global_step": 171933, "epoch": 4093} {"train_loss": -6.961257457733154, "global_step": 171934, "epoch": 4093} {"train_loss": -7.068833351135254, "global_step": 171935, "epoch": 4093} {"train_loss": -7.004932403564453, "global_step": 171936, "epoch": 4093} {"train_loss": -7.041881561279297, "global_step": 171937, "epoch": 4093} {"train_loss": -7.024288654327393, "global_step": 171938, "epoch": 4093} {"train_loss": -7.018588066101074, "global_step": 171939, "epoch": 4093} {"train_loss": -7.029118537902832, "global_step": 171940, "epoch": 4093} {"train_loss": -7.026455879211426, "global_step": 171941, "epoch": 4093} {"train_loss": -6.938877582550049, "global_step": 171942, "epoch": 4093} {"train_loss": -6.942594051361084, "global_step": 171943, "epoch": 4093} {"train_loss": -6.844367027282715, "global_step": 171944, "epoch": 4093} {"train_loss": -6.986198425292969, "global_step": 171945, "epoch": 4093} {"train_loss": -7.046214580535889, "global_step": 171946, "epoch": 4093} {"train_loss": -7.046016534169515, "global_step": 171947, "epoch": 4093, "val_loss": 69143.71875} {"train_loss": -7.085123062133789, "global_step": 171948, "epoch": 4094} {"train_loss": -7.128421306610107, "global_step": 171949, "epoch": 4094} {"train_loss": -6.898493766784668, "global_step": 171950, "epoch": 4094} {"train_loss": -7.06874942779541, "global_step": 171951, "epoch": 4094} {"train_loss": -7.054624080657959, "global_step": 171952, "epoch": 4094} {"train_loss": -6.850257873535156, "global_step": 171953, "epoch": 4094} {"train_loss": -6.956641674041748, "global_step": 171954, "epoch": 4094} {"train_loss": -7.018597602844238, "global_step": 171955, "epoch": 4094} {"train_loss": -7.007279396057129, "global_step": 171956, "epoch": 4094} {"train_loss": -7.070773124694824, "global_step": 171957, "epoch": 4094} {"train_loss": -6.996912956237793, "global_step": 171958, "epoch": 4094} {"train_loss": -7.060331344604492, "global_step": 171959, "epoch": 4094} {"train_loss": -6.972796440124512, "global_step": 171960, "epoch": 4094} {"train_loss": -6.903759956359863, "global_step": 171961, "epoch": 4094} {"train_loss": -6.8519062995910645, "global_step": 171962, "epoch": 4094} {"train_loss": -7.09596061706543, "global_step": 171963, "epoch": 4094} {"train_loss": -7.117101669311523, "global_step": 171964, "epoch": 4094} {"train_loss": -6.995329856872559, "global_step": 171965, "epoch": 4094} {"train_loss": -7.033421993255615, "global_step": 171966, "epoch": 4094} {"train_loss": -6.985599994659424, "global_step": 171967, "epoch": 4094} {"train_loss": -7.050859451293945, "global_step": 171968, "epoch": 4094} {"train_loss": -7.1070380210876465, "global_step": 171969, "epoch": 4094} {"train_loss": -7.073463439941406, "global_step": 171970, "epoch": 4094} {"train_loss": -7.006708145141602, "global_step": 171971, "epoch": 4094} {"train_loss": -7.086308479309082, "global_step": 171972, "epoch": 4094} {"train_loss": -7.078213691711426, "global_step": 171973, "epoch": 4094} {"train_loss": -7.085128307342529, "global_step": 171974, "epoch": 4094} {"train_loss": -7.120406150817871, "global_step": 171975, "epoch": 4094} {"train_loss": -6.921174049377441, "global_step": 171976, "epoch": 4094} {"train_loss": -7.031130790710449, "global_step": 171977, "epoch": 4094} {"train_loss": -7.007587909698486, "global_step": 171978, "epoch": 4094} {"train_loss": -6.872485160827637, "global_step": 171979, "epoch": 4094} {"train_loss": -7.039885997772217, "global_step": 171980, "epoch": 4094} {"train_loss": -7.01522159576416, "global_step": 171981, "epoch": 4094} {"train_loss": -6.990654945373535, "global_step": 171982, "epoch": 4094} {"train_loss": -7.037448406219482, "global_step": 171983, "epoch": 4094} {"train_loss": -6.976949691772461, "global_step": 171984, "epoch": 4094} {"train_loss": -7.060161590576172, "global_step": 171985, "epoch": 4094} {"train_loss": -6.956469535827637, "global_step": 171986, "epoch": 4094} {"train_loss": -7.098354816436768, "global_step": 171987, "epoch": 4094} {"train_loss": -6.980684757232666, "global_step": 171988, "epoch": 4094} {"train_loss": -7.019242899758475, "global_step": 171989, "epoch": 4094, "val_loss": 69092.640625} {"train_loss": -7.092418670654297, "global_step": 171990, "epoch": 4095} {"train_loss": -7.011862754821777, "global_step": 171991, "epoch": 4095} {"train_loss": -7.079745292663574, "global_step": 171992, "epoch": 4095} {"train_loss": -7.149343013763428, "global_step": 171993, "epoch": 4095} {"train_loss": -6.923873424530029, "global_step": 171994, "epoch": 4095} {"train_loss": -7.074803352355957, "global_step": 171995, "epoch": 4095} {"train_loss": -7.07437801361084, "global_step": 171996, "epoch": 4095} {"train_loss": -7.0942559242248535, "global_step": 171997, "epoch": 4095} {"train_loss": -7.038724899291992, "global_step": 171998, "epoch": 4095} {"train_loss": -7.133833408355713, "global_step": 171999, "epoch": 4095} {"train_loss": -7.067384243011475, "global_step": 172000, "epoch": 4095} {"train_loss": -7.040020942687988, "global_step": 172001, "epoch": 4095} {"train_loss": -6.943574905395508, "global_step": 172002, "epoch": 4095} {"train_loss": -7.086952209472656, "global_step": 172003, "epoch": 4095} {"train_loss": -7.144163131713867, "global_step": 172004, "epoch": 4095} {"train_loss": -7.034907341003418, "global_step": 172005, "epoch": 4095} {"train_loss": -7.105648994445801, "global_step": 172006, "epoch": 4095} {"train_loss": -7.055320739746094, "global_step": 172007, "epoch": 4095} {"train_loss": -7.091734886169434, "global_step": 172008, "epoch": 4095} {"train_loss": -7.21793270111084, "global_step": 172009, "epoch": 4095} {"train_loss": -7.1044602394104, "global_step": 172010, "epoch": 4095} {"train_loss": -6.983222484588623, "global_step": 172011, "epoch": 4095} {"train_loss": -7.039727687835693, "global_step": 172012, "epoch": 4095} {"train_loss": -7.154623508453369, "global_step": 172013, "epoch": 4095} {"train_loss": -7.009241104125977, "global_step": 172014, "epoch": 4095} {"train_loss": -7.074619293212891, "global_step": 172015, "epoch": 4095} {"train_loss": -7.079805850982666, "global_step": 172016, "epoch": 4095} {"train_loss": -7.06801176071167, "global_step": 172017, "epoch": 4095} {"train_loss": -7.025474548339844, "global_step": 172018, "epoch": 4095} {"train_loss": -7.112998008728027, "global_step": 172019, "epoch": 4095} {"train_loss": -7.129580020904541, "global_step": 172020, "epoch": 4095} {"train_loss": -7.047149181365967, "global_step": 172021, "epoch": 4095} {"train_loss": -7.0525288581848145, "global_step": 172022, "epoch": 4095} {"train_loss": -7.077969074249268, "global_step": 172023, "epoch": 4095} {"train_loss": -6.9820356369018555, "global_step": 172024, "epoch": 4095} {"train_loss": -7.024445056915283, "global_step": 172025, "epoch": 4095} {"train_loss": -6.878146171569824, "global_step": 172026, "epoch": 4095} {"train_loss": -6.998807907104492, "global_step": 172027, "epoch": 4095} {"train_loss": -7.049269676208496, "global_step": 172028, "epoch": 4095} {"train_loss": -7.04271125793457, "global_step": 172029, "epoch": 4095} {"train_loss": -7.043963432312012, "global_step": 172030, "epoch": 4095} {"train_loss": -7.061679340544201, "global_step": 172031, "epoch": 4095, "val_loss": 69261.4140625} {"train_loss": -6.932090759277344, "global_step": 172032, "epoch": 4096} {"train_loss": -7.0833234786987305, "global_step": 172033, "epoch": 4096} {"train_loss": -6.777815818786621, "global_step": 172034, "epoch": 4096} {"train_loss": -6.999788284301758, "global_step": 172035, "epoch": 4096} {"train_loss": -7.053606986999512, "global_step": 172036, "epoch": 4096} {"train_loss": -7.082162857055664, "global_step": 172037, "epoch": 4096} {"train_loss": -7.087125301361084, "global_step": 172038, "epoch": 4096} {"train_loss": -7.046446800231934, "global_step": 172039, "epoch": 4096} {"train_loss": -7.084715843200684, "global_step": 172040, "epoch": 4096} {"train_loss": -7.078049659729004, "global_step": 172041, "epoch": 4096} {"train_loss": -6.9605913162231445, "global_step": 172042, "epoch": 4096} {"train_loss": -7.101888179779053, "global_step": 172043, "epoch": 4096} {"train_loss": -7.071506023406982, "global_step": 172044, "epoch": 4096} {"train_loss": -7.05522346496582, "global_step": 172045, "epoch": 4096} {"train_loss": -6.9038496017456055, "global_step": 172046, "epoch": 4096} {"train_loss": -7.069954872131348, "global_step": 172047, "epoch": 4096} {"train_loss": -7.021566867828369, "global_step": 172048, "epoch": 4096} {"train_loss": -7.048776626586914, "global_step": 172049, "epoch": 4096} {"train_loss": -7.234969139099121, "global_step": 172050, "epoch": 4096} {"train_loss": -7.087350845336914, "global_step": 172051, "epoch": 4096} {"train_loss": -7.01650857925415, "global_step": 172052, "epoch": 4096} {"train_loss": -7.04600191116333, "global_step": 172053, "epoch": 4096} {"train_loss": -7.137077808380127, "global_step": 172054, "epoch": 4096} {"train_loss": -7.047344207763672, "global_step": 172055, "epoch": 4096} {"train_loss": -7.13170051574707, "global_step": 172056, "epoch": 4096} {"train_loss": -7.085615158081055, "global_step": 172057, "epoch": 4096} {"train_loss": -7.129983901977539, "global_step": 172058, "epoch": 4096} {"train_loss": -6.956042289733887, "global_step": 172059, "epoch": 4096} {"train_loss": -6.972252368927002, "global_step": 172060, "epoch": 4096} {"train_loss": -7.10343074798584, "global_step": 172061, "epoch": 4096} {"train_loss": -7.154089450836182, "global_step": 172062, "epoch": 4096} {"train_loss": -7.109587669372559, "global_step": 172063, "epoch": 4096} {"train_loss": -7.139391899108887, "global_step": 172064, "epoch": 4096} {"train_loss": -7.219224452972412, "global_step": 172065, "epoch": 4096} {"train_loss": -7.129117965698242, "global_step": 172066, "epoch": 4096} {"train_loss": -7.0527496337890625, "global_step": 172067, "epoch": 4096} {"train_loss": -7.163244247436523, "global_step": 172068, "epoch": 4096} {"train_loss": -7.162672996520996, "global_step": 172069, "epoch": 4096} {"train_loss": -7.06103515625, "global_step": 172070, "epoch": 4096} {"train_loss": -7.0968122482299805, "global_step": 172071, "epoch": 4096} {"train_loss": -7.176275253295898, "global_step": 172072, "epoch": 4096} {"train_loss": -7.0693204289390925, "global_step": 172073, "epoch": 4096, "val_loss": 69177.078125} {"train_loss": -7.030716896057129, "global_step": 172074, "epoch": 4097} {"train_loss": -7.201963424682617, "global_step": 172075, "epoch": 4097} {"train_loss": -7.065439224243164, "global_step": 172076, "epoch": 4097} {"train_loss": -6.995881080627441, "global_step": 172077, "epoch": 4097} {"train_loss": -7.036037445068359, "global_step": 172078, "epoch": 4097} {"train_loss": -6.99554967880249, "global_step": 172079, "epoch": 4097} {"train_loss": -7.029448509216309, "global_step": 172080, "epoch": 4097} {"train_loss": -7.074346542358398, "global_step": 172081, "epoch": 4097} {"train_loss": -7.09500789642334, "global_step": 172082, "epoch": 4097} {"train_loss": -7.032284736633301, "global_step": 172083, "epoch": 4097} {"train_loss": -6.944454193115234, "global_step": 172084, "epoch": 4097} {"train_loss": -6.9484710693359375, "global_step": 172085, "epoch": 4097} {"train_loss": -7.095608234405518, "global_step": 172086, "epoch": 4097} {"train_loss": -6.844414710998535, "global_step": 172087, "epoch": 4097} {"train_loss": -6.905961990356445, "global_step": 172088, "epoch": 4097} {"train_loss": -7.147273540496826, "global_step": 172089, "epoch": 4097} {"train_loss": -7.047823905944824, "global_step": 172090, "epoch": 4097} {"train_loss": -6.887269020080566, "global_step": 172091, "epoch": 4097} {"train_loss": -7.0193705558776855, "global_step": 172092, "epoch": 4097} {"train_loss": -7.011259078979492, "global_step": 172093, "epoch": 4097} {"train_loss": -6.985291481018066, "global_step": 172094, "epoch": 4097} {"train_loss": -7.072989463806152, "global_step": 172095, "epoch": 4097} {"train_loss": -7.086822032928467, "global_step": 172096, "epoch": 4097} {"train_loss": -7.014122486114502, "global_step": 172097, "epoch": 4097} {"train_loss": -7.0152130126953125, "global_step": 172098, "epoch": 4097} {"train_loss": -7.0756120681762695, "global_step": 172099, "epoch": 4097} {"train_loss": -7.018002510070801, "global_step": 172100, "epoch": 4097} {"train_loss": -7.097607612609863, "global_step": 172101, "epoch": 4097} {"train_loss": -7.165120601654053, "global_step": 172102, "epoch": 4097} {"train_loss": -7.066244602203369, "global_step": 172103, "epoch": 4097} {"train_loss": -7.141887664794922, "global_step": 172104, "epoch": 4097} {"train_loss": -7.0937652587890625, "global_step": 172105, "epoch": 4097} {"train_loss": -7.072244644165039, "global_step": 172106, "epoch": 4097} {"train_loss": -7.08853816986084, "global_step": 172107, "epoch": 4097} {"train_loss": -7.084224700927734, "global_step": 172108, "epoch": 4097} {"train_loss": -7.098995685577393, "global_step": 172109, "epoch": 4097} {"train_loss": -7.128568172454834, "global_step": 172110, "epoch": 4097} {"train_loss": -7.094346523284912, "global_step": 172111, "epoch": 4097} {"train_loss": -7.142401695251465, "global_step": 172112, "epoch": 4097} {"train_loss": -7.196775436401367, "global_step": 172113, "epoch": 4097} {"train_loss": -6.989223003387451, "global_step": 172114, "epoch": 4097} {"train_loss": -7.051354521796817, "global_step": 172115, "epoch": 4097, "val_loss": 68931.671875} {"train_loss": -7.020742416381836, "global_step": 172116, "epoch": 4098} {"train_loss": -7.207229137420654, "global_step": 172117, "epoch": 4098} {"train_loss": -7.039445400238037, "global_step": 172118, "epoch": 4098} {"train_loss": -7.0679168701171875, "global_step": 172119, "epoch": 4098} {"train_loss": -7.059053421020508, "global_step": 172120, "epoch": 4098} {"train_loss": -7.00298547744751, "global_step": 172121, "epoch": 4098} {"train_loss": -6.963861465454102, "global_step": 172122, "epoch": 4098} {"train_loss": -7.063047885894775, "global_step": 172123, "epoch": 4098} {"train_loss": -7.202863693237305, "global_step": 172124, "epoch": 4098} {"train_loss": -6.992641448974609, "global_step": 172125, "epoch": 4098} {"train_loss": -6.913921356201172, "global_step": 172126, "epoch": 4098} {"train_loss": -7.0911712646484375, "global_step": 172127, "epoch": 4098} {"train_loss": -6.982186794281006, "global_step": 172128, "epoch": 4098} {"train_loss": -7.185610771179199, "global_step": 172129, "epoch": 4098} {"train_loss": -7.055795669555664, "global_step": 172130, "epoch": 4098} {"train_loss": -7.109645366668701, "global_step": 172131, "epoch": 4098} {"train_loss": -7.129915714263916, "global_step": 172132, "epoch": 4098} {"train_loss": -7.154391288757324, "global_step": 172133, "epoch": 4098} {"train_loss": -7.0334577560424805, "global_step": 172134, "epoch": 4098} {"train_loss": -7.049857139587402, "global_step": 172135, "epoch": 4098} {"train_loss": -7.050319671630859, "global_step": 172136, "epoch": 4098} {"train_loss": -7.0110979080200195, "global_step": 172137, "epoch": 4098} {"train_loss": -6.993975639343262, "global_step": 172138, "epoch": 4098} {"train_loss": -7.053389072418213, "global_step": 172139, "epoch": 4098} {"train_loss": -6.9250593185424805, "global_step": 172140, "epoch": 4098} {"train_loss": -6.892178535461426, "global_step": 172141, "epoch": 4098} {"train_loss": -6.943206787109375, "global_step": 172142, "epoch": 4098} {"train_loss": -6.960353851318359, "global_step": 172143, "epoch": 4098} {"train_loss": -6.967451572418213, "global_step": 172144, "epoch": 4098} {"train_loss": -7.080915451049805, "global_step": 172145, "epoch": 4098} {"train_loss": -6.7775044441223145, "global_step": 172146, "epoch": 4098} {"train_loss": -6.903929233551025, "global_step": 172147, "epoch": 4098} {"train_loss": -6.86990213394165, "global_step": 172148, "epoch": 4098} {"train_loss": -6.986238479614258, "global_step": 172149, "epoch": 4098} {"train_loss": -6.895384311676025, "global_step": 172150, "epoch": 4098} {"train_loss": -6.889930725097656, "global_step": 172151, "epoch": 4098} {"train_loss": -6.932751655578613, "global_step": 172152, "epoch": 4098} {"train_loss": -6.901710033416748, "global_step": 172153, "epoch": 4098} {"train_loss": -7.013341903686523, "global_step": 172154, "epoch": 4098} {"train_loss": -6.88642692565918, "global_step": 172155, "epoch": 4098} {"train_loss": -6.963714599609375, "global_step": 172156, "epoch": 4098} {"train_loss": -7.0071144217536565, "global_step": 172157, "epoch": 4098, "val_loss": 69098.140625} {"train_loss": -7.080971717834473, "global_step": 172158, "epoch": 4099} {"train_loss": -7.00740385055542, "global_step": 172159, "epoch": 4099} {"train_loss": -7.051238536834717, "global_step": 172160, "epoch": 4099} {"train_loss": -7.057310104370117, "global_step": 172161, "epoch": 4099} {"train_loss": -7.038333892822266, "global_step": 172162, "epoch": 4099} {"train_loss": -6.9762067794799805, "global_step": 172163, "epoch": 4099} {"train_loss": -7.008443832397461, "global_step": 172164, "epoch": 4099} {"train_loss": -7.004758834838867, "global_step": 172165, "epoch": 4099} {"train_loss": -7.048576354980469, "global_step": 172166, "epoch": 4099} {"train_loss": -7.088379383087158, "global_step": 172167, "epoch": 4099} {"train_loss": -7.075897693634033, "global_step": 172168, "epoch": 4099} {"train_loss": -6.99031925201416, "global_step": 172169, "epoch": 4099} {"train_loss": -7.071026802062988, "global_step": 172170, "epoch": 4099} {"train_loss": -7.025698661804199, "global_step": 172171, "epoch": 4099} {"train_loss": -6.975668907165527, "global_step": 172172, "epoch": 4099} {"train_loss": -6.967071533203125, "global_step": 172173, "epoch": 4099} {"train_loss": -6.987205982208252, "global_step": 172174, "epoch": 4099} {"train_loss": -7.056260585784912, "global_step": 172175, "epoch": 4099} {"train_loss": -7.135390281677246, "global_step": 172176, "epoch": 4099} {"train_loss": -7.0980224609375, "global_step": 172177, "epoch": 4099} {"train_loss": -7.0325608253479, "global_step": 172178, "epoch": 4099} {"train_loss": -6.944307327270508, "global_step": 172179, "epoch": 4099} {"train_loss": -7.099802017211914, "global_step": 172180, "epoch": 4099} {"train_loss": -6.975847244262695, "global_step": 172181, "epoch": 4099} {"train_loss": -7.017829895019531, "global_step": 172182, "epoch": 4099} {"train_loss": -6.992654323577881, "global_step": 172183, "epoch": 4099} {"train_loss": -7.080041885375977, "global_step": 172184, "epoch": 4099} {"train_loss": -7.0306572914123535, "global_step": 172185, "epoch": 4099} {"train_loss": -7.0234599113464355, "global_step": 172186, "epoch": 4099} {"train_loss": -6.991413593292236, "global_step": 172187, "epoch": 4099} {"train_loss": -7.058344841003418, "global_step": 172188, "epoch": 4099} {"train_loss": -7.000929355621338, "global_step": 172189, "epoch": 4099} {"train_loss": -7.023411273956299, "global_step": 172190, "epoch": 4099} {"train_loss": -7.0647382736206055, "global_step": 172191, "epoch": 4099} {"train_loss": -6.983406066894531, "global_step": 172192, "epoch": 4099} {"train_loss": -7.106680870056152, "global_step": 172193, "epoch": 4099} {"train_loss": -6.993526935577393, "global_step": 172194, "epoch": 4099} {"train_loss": -7.027931213378906, "global_step": 172195, "epoch": 4099} {"train_loss": -7.0524373054504395, "global_step": 172196, "epoch": 4099} {"train_loss": -6.870090484619141, "global_step": 172197, "epoch": 4099} {"train_loss": -7.048118591308594, "global_step": 172198, "epoch": 4099} {"train_loss": -7.02799425806318, "global_step": 172199, "epoch": 4099, "val_loss": 68907.84375} {"train_loss": -7.07728910446167, "global_step": 172200, "epoch": 4100} {"train_loss": -7.102869987487793, "global_step": 172201, "epoch": 4100} {"train_loss": -7.085993766784668, "global_step": 172202, "epoch": 4100} {"train_loss": -7.0612077713012695, "global_step": 172203, "epoch": 4100} {"train_loss": -6.968493461608887, "global_step": 172204, "epoch": 4100} {"train_loss": -7.035213470458984, "global_step": 172205, "epoch": 4100} {"train_loss": -7.051964282989502, "global_step": 172206, "epoch": 4100} {"train_loss": -6.972352981567383, "global_step": 172207, "epoch": 4100} {"train_loss": -6.992877006530762, "global_step": 172208, "epoch": 4100} {"train_loss": -7.104158401489258, "global_step": 172209, "epoch": 4100} {"train_loss": -6.923007965087891, "global_step": 172210, "epoch": 4100} {"train_loss": -7.044455528259277, "global_step": 172211, "epoch": 4100} {"train_loss": -6.944759368896484, "global_step": 172212, "epoch": 4100} {"train_loss": -6.9963297843933105, "global_step": 172213, "epoch": 4100} {"train_loss": -7.021378040313721, "global_step": 172214, "epoch": 4100} {"train_loss": -6.968958854675293, "global_step": 172215, "epoch": 4100} {"train_loss": -6.9899187088012695, "global_step": 172216, "epoch": 4100} {"train_loss": -6.978986740112305, "global_step": 172217, "epoch": 4100} {"train_loss": -7.027161121368408, "global_step": 172218, "epoch": 4100} {"train_loss": -6.9358673095703125, "global_step": 172219, "epoch": 4100} {"train_loss": -7.034938812255859, "global_step": 172220, "epoch": 4100} {"train_loss": -7.040406227111816, "global_step": 172221, "epoch": 4100} {"train_loss": -6.979012966156006, "global_step": 172222, "epoch": 4100} {"train_loss": -7.129347801208496, "global_step": 172223, "epoch": 4100} {"train_loss": -7.016230583190918, "global_step": 172224, "epoch": 4100} {"train_loss": -7.027569770812988, "global_step": 172225, "epoch": 4100} {"train_loss": -7.057040214538574, "global_step": 172226, "epoch": 4100} {"train_loss": -7.084817886352539, "global_step": 172227, "epoch": 4100} {"train_loss": -7.045459747314453, "global_step": 172228, "epoch": 4100} {"train_loss": -7.025035858154297, "global_step": 172229, "epoch": 4100} {"train_loss": -7.140511512756348, "global_step": 172230, "epoch": 4100} {"train_loss": -7.023880958557129, "global_step": 172231, "epoch": 4100} {"train_loss": -7.0132317543029785, "global_step": 172232, "epoch": 4100} {"train_loss": -7.162296772003174, "global_step": 172233, "epoch": 4100} {"train_loss": -7.011880874633789, "global_step": 172234, "epoch": 4100} {"train_loss": -7.0613603591918945, "global_step": 172235, "epoch": 4100} {"train_loss": -6.9713969230651855, "global_step": 172236, "epoch": 4100} {"train_loss": -7.11646032333374, "global_step": 172237, "epoch": 4100} {"train_loss": -7.025569915771484, "global_step": 172238, "epoch": 4100} {"train_loss": -7.092996597290039, "global_step": 172239, "epoch": 4100} {"train_loss": -7.136926174163818, "global_step": 172240, "epoch": 4100} {"train_loss": -7.0393446286519366, "global_step": 172241, "epoch": 4100, "train/sim_max_reward_0": 0.20081252576423753, "train/sim_max_reward_1": 0.9601480430515154, "train/sim_max_reward_2": 0.9194522731480561, "train/sim_max_reward_3": 0.13600016096008036, "train/sim_max_reward_4": 0.9589616178488811, "train/sim_max_reward_5": 0.9615010118616846, "test/sim_max_reward_4300000": 0.13276817308430547, "test/sim_max_reward_4300001": 0.5365770177264956, "test/sim_max_reward_4300002": 0.9920062133621587, "test/sim_max_reward_4300003": 0.9600854614465432, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8437571671777712, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9729899131815938, "test/sim_max_reward_4300008": 0.46735163296664534, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.40723262723882375, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.13095236618716674, "test/sim_max_reward_4300017": 0.9699703066777425, "test/sim_max_reward_4300018": 0.31356986692992084, "test/sim_max_reward_4300019": 0.18611283365940134, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9281071213125086, "test/sim_max_reward_4300022": 0.8745411091647616, "test/sim_max_reward_4300023": 0.8349711432616015, "test/sim_max_reward_4300024": 0.6040271638522989, "test/sim_max_reward_4300025": 0.8696228736113806, "test/sim_max_reward_4300026": 0.050878423390650566, "test/sim_max_reward_4300027": 0.8771631944869174, "test/sim_max_reward_4300028": 1.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.23242677217369648, "test/sim_max_reward_4300031": 0.208923955348928, "test/sim_max_reward_4300032": 0.9976095853432565, "test/sim_max_reward_4300033": 1.0, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.8406220346586389, "test/sim_max_reward_4300036": 0.20031857848833742, "test/sim_max_reward_4300037": 0.8186990393483141, "test/sim_max_reward_4300038": 1.0, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.7830963859449392, "test/sim_max_reward_4300041": 0.9155939027797062, "test/sim_max_reward_4300042": 0.6971796954606132, "test/sim_max_reward_4300043": 0.12741307895030277, "test/sim_max_reward_4300044": 1.0, "test/sim_max_reward_4300045": 0.9495742613501822, "test/sim_max_reward_4300046": 0.9009012088776011, "test/sim_max_reward_4300047": 0.1645292465509047, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.2577443099944225, "train/mean_score": 0.6894792721057424, "test/mean_score": 0.6012630153759563, "val_loss": 69012.1015625} {"train_loss": -7.079421043395996, "global_step": 172242, "epoch": 4101} {"train_loss": -7.099973678588867, "global_step": 172243, "epoch": 4101} {"train_loss": -7.102337837219238, "global_step": 172244, "epoch": 4101} {"train_loss": -7.076375961303711, "global_step": 172245, "epoch": 4101} {"train_loss": -7.184440612792969, "global_step": 172246, "epoch": 4101} {"train_loss": -7.083695411682129, "global_step": 172247, "epoch": 4101} {"train_loss": -7.051770210266113, "global_step": 172248, "epoch": 4101} {"train_loss": -7.209522247314453, "global_step": 172249, "epoch": 4101} {"train_loss": -7.114620685577393, "global_step": 172250, "epoch": 4101} {"train_loss": -7.0168657302856445, "global_step": 172251, "epoch": 4101} {"train_loss": -7.207618713378906, "global_step": 172252, "epoch": 4101} {"train_loss": -7.099926471710205, "global_step": 172253, "epoch": 4101} {"train_loss": -7.158816337585449, "global_step": 172254, "epoch": 4101} {"train_loss": -7.125157833099365, "global_step": 172255, "epoch": 4101} {"train_loss": -7.15859317779541, "global_step": 172256, "epoch": 4101} {"train_loss": -7.138392925262451, "global_step": 172257, "epoch": 4101} {"train_loss": -7.132040023803711, "global_step": 172258, "epoch": 4101} {"train_loss": -7.112699508666992, "global_step": 172259, "epoch": 4101} {"train_loss": -7.125741004943848, "global_step": 172260, "epoch": 4101} {"train_loss": -7.06052827835083, "global_step": 172261, "epoch": 4101} {"train_loss": -7.170499801635742, "global_step": 172262, "epoch": 4101} {"train_loss": -7.000387191772461, "global_step": 172263, "epoch": 4101} {"train_loss": -7.055912017822266, "global_step": 172264, "epoch": 4101} {"train_loss": -7.1121826171875, "global_step": 172265, "epoch": 4101} {"train_loss": -7.148975372314453, "global_step": 172266, "epoch": 4101} {"train_loss": -7.113825798034668, "global_step": 172267, "epoch": 4101} {"train_loss": -6.991124153137207, "global_step": 172268, "epoch": 4101} {"train_loss": -7.157190322875977, "global_step": 172269, "epoch": 4101} {"train_loss": -6.9622931480407715, "global_step": 172270, "epoch": 4101} {"train_loss": -6.933568954467773, "global_step": 172271, "epoch": 4101} {"train_loss": -6.865133285522461, "global_step": 172272, "epoch": 4101} {"train_loss": -7.055117130279541, "global_step": 172273, "epoch": 4101} {"train_loss": -6.895107746124268, "global_step": 172274, "epoch": 4101} {"train_loss": -6.960906028747559, "global_step": 172275, "epoch": 4101} {"train_loss": -7.012895584106445, "global_step": 172276, "epoch": 4101} {"train_loss": -6.81027364730835, "global_step": 172277, "epoch": 4101} {"train_loss": -6.955150127410889, "global_step": 172278, "epoch": 4101} {"train_loss": -6.9428019523620605, "global_step": 172279, "epoch": 4101} {"train_loss": -6.99241828918457, "global_step": 172280, "epoch": 4101} {"train_loss": -6.991937637329102, "global_step": 172281, "epoch": 4101} {"train_loss": -6.963006973266602, "global_step": 172282, "epoch": 4101} {"train_loss": -7.055389120465233, "global_step": 172283, "epoch": 4101, "val_loss": 69090.8515625} {"train_loss": -6.853412628173828, "global_step": 172284, "epoch": 4102} {"train_loss": -7.051005840301514, "global_step": 172285, "epoch": 4102} {"train_loss": -6.9056854248046875, "global_step": 172286, "epoch": 4102} {"train_loss": -6.967103481292725, "global_step": 172287, "epoch": 4102} {"train_loss": -6.930678844451904, "global_step": 172288, "epoch": 4102} {"train_loss": -7.014901161193848, "global_step": 172289, "epoch": 4102} {"train_loss": -6.940723419189453, "global_step": 172290, "epoch": 4102} {"train_loss": -7.017734527587891, "global_step": 172291, "epoch": 4102} {"train_loss": -6.994936943054199, "global_step": 172292, "epoch": 4102} {"train_loss": -6.980069160461426, "global_step": 172293, "epoch": 4102} {"train_loss": -7.075592994689941, "global_step": 172294, "epoch": 4102} {"train_loss": -7.0702996253967285, "global_step": 172295, "epoch": 4102} {"train_loss": -7.039782524108887, "global_step": 172296, "epoch": 4102} {"train_loss": -6.944771766662598, "global_step": 172297, "epoch": 4102} {"train_loss": -6.9895782470703125, "global_step": 172298, "epoch": 4102} {"train_loss": -7.021153450012207, "global_step": 172299, "epoch": 4102} {"train_loss": -6.964838981628418, "global_step": 172300, "epoch": 4102} {"train_loss": -6.926851749420166, "global_step": 172301, "epoch": 4102} {"train_loss": -6.928323268890381, "global_step": 172302, "epoch": 4102} {"train_loss": -6.999695301055908, "global_step": 172303, "epoch": 4102} {"train_loss": -6.913653373718262, "global_step": 172304, "epoch": 4102} {"train_loss": -6.9733452796936035, "global_step": 172305, "epoch": 4102} {"train_loss": -6.986075401306152, "global_step": 172306, "epoch": 4102} {"train_loss": -6.954409599304199, "global_step": 172307, "epoch": 4102} {"train_loss": -7.009943962097168, "global_step": 172308, "epoch": 4102} {"train_loss": -7.099893569946289, "global_step": 172309, "epoch": 4102} {"train_loss": -7.055438995361328, "global_step": 172310, "epoch": 4102} {"train_loss": -7.000997066497803, "global_step": 172311, "epoch": 4102} {"train_loss": -7.087886810302734, "global_step": 172312, "epoch": 4102} {"train_loss": -7.065616607666016, "global_step": 172313, "epoch": 4102} {"train_loss": -7.0688371658325195, "global_step": 172314, "epoch": 4102} {"train_loss": -7.064925193786621, "global_step": 172315, "epoch": 4102} {"train_loss": -7.106544017791748, "global_step": 172316, "epoch": 4102} {"train_loss": -7.001397609710693, "global_step": 172317, "epoch": 4102} {"train_loss": -7.129531383514404, "global_step": 172318, "epoch": 4102} {"train_loss": -7.030243873596191, "global_step": 172319, "epoch": 4102} {"train_loss": -7.009539604187012, "global_step": 172320, "epoch": 4102} {"train_loss": -7.053799629211426, "global_step": 172321, "epoch": 4102} {"train_loss": -7.060366630554199, "global_step": 172322, "epoch": 4102} {"train_loss": -7.151693344116211, "global_step": 172323, "epoch": 4102} {"train_loss": -7.056797027587891, "global_step": 172324, "epoch": 4102} {"train_loss": -7.015034176054455, "global_step": 172325, "epoch": 4102, "val_loss": 69077.859375} {"train_loss": -7.059320449829102, "global_step": 172326, "epoch": 4103} {"train_loss": -7.1669511795043945, "global_step": 172327, "epoch": 4103} {"train_loss": -7.13835334777832, "global_step": 172328, "epoch": 4103} {"train_loss": -7.111663818359375, "global_step": 172329, "epoch": 4103} {"train_loss": -7.105260848999023, "global_step": 172330, "epoch": 4103} {"train_loss": -7.07214879989624, "global_step": 172331, "epoch": 4103} {"train_loss": -7.007366180419922, "global_step": 172332, "epoch": 4103} {"train_loss": -7.0197577476501465, "global_step": 172333, "epoch": 4103} {"train_loss": -7.1016764640808105, "global_step": 172334, "epoch": 4103} {"train_loss": -7.092256546020508, "global_step": 172335, "epoch": 4103} {"train_loss": -7.070765972137451, "global_step": 172336, "epoch": 4103} {"train_loss": -7.02742862701416, "global_step": 172337, "epoch": 4103} {"train_loss": -7.142563343048096, "global_step": 172338, "epoch": 4103} {"train_loss": -7.003889560699463, "global_step": 172339, "epoch": 4103} {"train_loss": -7.157009124755859, "global_step": 172340, "epoch": 4103} {"train_loss": -7.093649864196777, "global_step": 172341, "epoch": 4103} {"train_loss": -6.978454113006592, "global_step": 172342, "epoch": 4103} {"train_loss": -7.025640487670898, "global_step": 172343, "epoch": 4103} {"train_loss": -6.955592632293701, "global_step": 172344, "epoch": 4103} {"train_loss": -6.970429420471191, "global_step": 172345, "epoch": 4103} {"train_loss": -7.084542274475098, "global_step": 172346, "epoch": 4103} {"train_loss": -6.958386421203613, "global_step": 172347, "epoch": 4103} {"train_loss": -7.039426803588867, "global_step": 172348, "epoch": 4103} {"train_loss": -7.025340557098389, "global_step": 172349, "epoch": 4103} {"train_loss": -7.129964828491211, "global_step": 172350, "epoch": 4103} {"train_loss": -6.998046398162842, "global_step": 172351, "epoch": 4103} {"train_loss": -7.014253616333008, "global_step": 172352, "epoch": 4103} {"train_loss": -7.125295639038086, "global_step": 172353, "epoch": 4103} {"train_loss": -6.97274112701416, "global_step": 172354, "epoch": 4103} {"train_loss": -7.160257339477539, "global_step": 172355, "epoch": 4103} {"train_loss": -6.9459075927734375, "global_step": 172356, "epoch": 4103} {"train_loss": -7.094385147094727, "global_step": 172357, "epoch": 4103} {"train_loss": -7.073017597198486, "global_step": 172358, "epoch": 4103} {"train_loss": -7.037214279174805, "global_step": 172359, "epoch": 4103} {"train_loss": -7.052801132202148, "global_step": 172360, "epoch": 4103} {"train_loss": -7.014253616333008, "global_step": 172361, "epoch": 4103} {"train_loss": -7.057794094085693, "global_step": 172362, "epoch": 4103} {"train_loss": -7.034049987792969, "global_step": 172363, "epoch": 4103} {"train_loss": -6.897800922393799, "global_step": 172364, "epoch": 4103} {"train_loss": -7.125298500061035, "global_step": 172365, "epoch": 4103} {"train_loss": -6.990672588348389, "global_step": 172366, "epoch": 4103} {"train_loss": -7.051371154331026, "global_step": 172367, "epoch": 4103, "val_loss": 68926.09375} {"train_loss": -7.076457977294922, "global_step": 172368, "epoch": 4104} {"train_loss": -7.098038673400879, "global_step": 172369, "epoch": 4104} {"train_loss": -6.989657402038574, "global_step": 172370, "epoch": 4104} {"train_loss": -7.103705883026123, "global_step": 172371, "epoch": 4104} {"train_loss": -7.099860191345215, "global_step": 172372, "epoch": 4104} {"train_loss": -6.927609920501709, "global_step": 172373, "epoch": 4104} {"train_loss": -7.139015197753906, "global_step": 172374, "epoch": 4104} {"train_loss": -7.135044574737549, "global_step": 172375, "epoch": 4104} {"train_loss": -7.15008544921875, "global_step": 172376, "epoch": 4104} {"train_loss": -7.103973388671875, "global_step": 172377, "epoch": 4104} {"train_loss": -7.141889572143555, "global_step": 172378, "epoch": 4104} {"train_loss": -7.0845136642456055, "global_step": 172379, "epoch": 4104} {"train_loss": -7.065644264221191, "global_step": 172380, "epoch": 4104} {"train_loss": -7.069436550140381, "global_step": 172381, "epoch": 4104} {"train_loss": -7.121441841125488, "global_step": 172382, "epoch": 4104} {"train_loss": -7.214086532592773, "global_step": 172383, "epoch": 4104} {"train_loss": -7.045511245727539, "global_step": 172384, "epoch": 4104} {"train_loss": -7.123754501342773, "global_step": 172385, "epoch": 4104} {"train_loss": -7.195635795593262, "global_step": 172386, "epoch": 4104} {"train_loss": -7.236228942871094, "global_step": 172387, "epoch": 4104} {"train_loss": -7.017807960510254, "global_step": 172388, "epoch": 4104} {"train_loss": -7.147700309753418, "global_step": 172389, "epoch": 4104} {"train_loss": -7.20119047164917, "global_step": 172390, "epoch": 4104} {"train_loss": -7.116252422332764, "global_step": 172391, "epoch": 4104} {"train_loss": -7.149173259735107, "global_step": 172392, "epoch": 4104} {"train_loss": -7.137444019317627, "global_step": 172393, "epoch": 4104} {"train_loss": -7.109220504760742, "global_step": 172394, "epoch": 4104} {"train_loss": -7.078773021697998, "global_step": 172395, "epoch": 4104} {"train_loss": -7.186192512512207, "global_step": 172396, "epoch": 4104} {"train_loss": -7.044672966003418, "global_step": 172397, "epoch": 4104} {"train_loss": -6.977766036987305, "global_step": 172398, "epoch": 4104} {"train_loss": -7.160930633544922, "global_step": 172399, "epoch": 4104} {"train_loss": -6.979824066162109, "global_step": 172400, "epoch": 4104} {"train_loss": -7.124579906463623, "global_step": 172401, "epoch": 4104} {"train_loss": -7.096499919891357, "global_step": 172402, "epoch": 4104} {"train_loss": -7.095905303955078, "global_step": 172403, "epoch": 4104} {"train_loss": -7.034411430358887, "global_step": 172404, "epoch": 4104} {"train_loss": -6.975047588348389, "global_step": 172405, "epoch": 4104} {"train_loss": -7.079667091369629, "global_step": 172406, "epoch": 4104} {"train_loss": -7.208508491516113, "global_step": 172407, "epoch": 4104} {"train_loss": -7.260025978088379, "global_step": 172408, "epoch": 4104} {"train_loss": -7.10414871715364, "global_step": 172409, "epoch": 4104, "val_loss": 69095.4375} {"train_loss": -7.014759063720703, "global_step": 172410, "epoch": 4105} {"train_loss": -7.095548629760742, "global_step": 172411, "epoch": 4105} {"train_loss": -7.0937604904174805, "global_step": 172412, "epoch": 4105} {"train_loss": -7.073179244995117, "global_step": 172413, "epoch": 4105} {"train_loss": -7.113926887512207, "global_step": 172414, "epoch": 4105} {"train_loss": -7.086406707763672, "global_step": 172415, "epoch": 4105} {"train_loss": -6.869088649749756, "global_step": 172416, "epoch": 4105} {"train_loss": -7.122647285461426, "global_step": 172417, "epoch": 4105} {"train_loss": -6.993098258972168, "global_step": 172418, "epoch": 4105} {"train_loss": -7.159843921661377, "global_step": 172419, "epoch": 4105} {"train_loss": -7.041569232940674, "global_step": 172420, "epoch": 4105} {"train_loss": -6.934966087341309, "global_step": 172421, "epoch": 4105} {"train_loss": -7.054542064666748, "global_step": 172422, "epoch": 4105} {"train_loss": -6.957389831542969, "global_step": 172423, "epoch": 4105} {"train_loss": -7.087881088256836, "global_step": 172424, "epoch": 4105} {"train_loss": -7.074159622192383, "global_step": 172425, "epoch": 4105} {"train_loss": -6.964500427246094, "global_step": 172426, "epoch": 4105} {"train_loss": -6.975016117095947, "global_step": 172427, "epoch": 4105} {"train_loss": -6.899984359741211, "global_step": 172428, "epoch": 4105} {"train_loss": -7.156696319580078, "global_step": 172429, "epoch": 4105} {"train_loss": -7.04605770111084, "global_step": 172430, "epoch": 4105} {"train_loss": -7.165471076965332, "global_step": 172431, "epoch": 4105} {"train_loss": -7.100862503051758, "global_step": 172432, "epoch": 4105} {"train_loss": -7.205233573913574, "global_step": 172433, "epoch": 4105} {"train_loss": -7.094321250915527, "global_step": 172434, "epoch": 4105} {"train_loss": -7.062661170959473, "global_step": 172435, "epoch": 4105} {"train_loss": -6.962820529937744, "global_step": 172436, "epoch": 4105} {"train_loss": -7.014029502868652, "global_step": 172437, "epoch": 4105} {"train_loss": -7.0614142417907715, "global_step": 172438, "epoch": 4105} {"train_loss": -6.884500026702881, "global_step": 172439, "epoch": 4105} {"train_loss": -7.013452529907227, "global_step": 172440, "epoch": 4105} {"train_loss": -6.956376075744629, "global_step": 172441, "epoch": 4105} {"train_loss": -6.944045066833496, "global_step": 172442, "epoch": 4105} {"train_loss": -7.010523796081543, "global_step": 172443, "epoch": 4105} {"train_loss": -6.9449849128723145, "global_step": 172444, "epoch": 4105} {"train_loss": -7.038212299346924, "global_step": 172445, "epoch": 4105} {"train_loss": -6.996606826782227, "global_step": 172446, "epoch": 4105} {"train_loss": -6.906109809875488, "global_step": 172447, "epoch": 4105} {"train_loss": -7.087602615356445, "global_step": 172448, "epoch": 4105} {"train_loss": -7.034774303436279, "global_step": 172449, "epoch": 4105} {"train_loss": -7.087409973144531, "global_step": 172450, "epoch": 4105} {"train_loss": -7.03173245702471, "global_step": 172451, "epoch": 4105, "val_loss": 69264.9765625} {"train_loss": -7.039705753326416, "global_step": 172452, "epoch": 4106} {"train_loss": -6.9877119064331055, "global_step": 172453, "epoch": 4106} {"train_loss": -6.980672836303711, "global_step": 172454, "epoch": 4106} {"train_loss": -7.072020530700684, "global_step": 172455, "epoch": 4106} {"train_loss": -6.995173454284668, "global_step": 172456, "epoch": 4106} {"train_loss": -6.954120635986328, "global_step": 172457, "epoch": 4106} {"train_loss": -6.941290378570557, "global_step": 172458, "epoch": 4106} {"train_loss": -7.1701202392578125, "global_step": 172459, "epoch": 4106} {"train_loss": -6.936145782470703, "global_step": 172460, "epoch": 4106} {"train_loss": -7.049325942993164, "global_step": 172461, "epoch": 4106} {"train_loss": -7.005726337432861, "global_step": 172462, "epoch": 4106} {"train_loss": -7.085390090942383, "global_step": 172463, "epoch": 4106} {"train_loss": -7.01388692855835, "global_step": 172464, "epoch": 4106} {"train_loss": -7.106794834136963, "global_step": 172465, "epoch": 4106} {"train_loss": -7.082180976867676, "global_step": 172466, "epoch": 4106} {"train_loss": -7.087275505065918, "global_step": 172467, "epoch": 4106} {"train_loss": -7.103490829467773, "global_step": 172468, "epoch": 4106} {"train_loss": -7.1041717529296875, "global_step": 172469, "epoch": 4106} {"train_loss": -7.181264400482178, "global_step": 172470, "epoch": 4106} {"train_loss": -7.094825744628906, "global_step": 172471, "epoch": 4106} {"train_loss": -7.077393054962158, "global_step": 172472, "epoch": 4106} {"train_loss": -7.012876510620117, "global_step": 172473, "epoch": 4106} {"train_loss": -7.0896406173706055, "global_step": 172474, "epoch": 4106} {"train_loss": -7.006331443786621, "global_step": 172475, "epoch": 4106} {"train_loss": -7.122296333312988, "global_step": 172476, "epoch": 4106} {"train_loss": -7.069759368896484, "global_step": 172477, "epoch": 4106} {"train_loss": -7.086484909057617, "global_step": 172478, "epoch": 4106} {"train_loss": -7.106749057769775, "global_step": 172479, "epoch": 4106} {"train_loss": -7.003218650817871, "global_step": 172480, "epoch": 4106} {"train_loss": -7.068643569946289, "global_step": 172481, "epoch": 4106} {"train_loss": -7.146177768707275, "global_step": 172482, "epoch": 4106} {"train_loss": -7.03965950012207, "global_step": 172483, "epoch": 4106} {"train_loss": -7.215915203094482, "global_step": 172484, "epoch": 4106} {"train_loss": -7.058754920959473, "global_step": 172485, "epoch": 4106} {"train_loss": -7.1195783615112305, "global_step": 172486, "epoch": 4106} {"train_loss": -7.083950519561768, "global_step": 172487, "epoch": 4106} {"train_loss": -7.075236797332764, "global_step": 172488, "epoch": 4106} {"train_loss": -7.087050914764404, "global_step": 172489, "epoch": 4106} {"train_loss": -7.228482246398926, "global_step": 172490, "epoch": 4106} {"train_loss": -7.066216468811035, "global_step": 172491, "epoch": 4106} {"train_loss": -7.096792697906494, "global_step": 172492, "epoch": 4106} {"train_loss": -7.071405864897228, "global_step": 172493, "epoch": 4106, "val_loss": 68890.375} {"train_loss": -7.085241794586182, "global_step": 172494, "epoch": 4107} {"train_loss": -6.954678535461426, "global_step": 172495, "epoch": 4107} {"train_loss": -7.117188453674316, "global_step": 172496, "epoch": 4107} {"train_loss": -7.075091361999512, "global_step": 172497, "epoch": 4107} {"train_loss": -7.105990409851074, "global_step": 172498, "epoch": 4107} {"train_loss": -7.001015663146973, "global_step": 172499, "epoch": 4107} {"train_loss": -7.013628005981445, "global_step": 172500, "epoch": 4107} {"train_loss": -7.000231742858887, "global_step": 172501, "epoch": 4107} {"train_loss": -7.0461883544921875, "global_step": 172502, "epoch": 4107} {"train_loss": -7.0020751953125, "global_step": 172503, "epoch": 4107} {"train_loss": -7.136594772338867, "global_step": 172504, "epoch": 4107} {"train_loss": -7.172908782958984, "global_step": 172505, "epoch": 4107} {"train_loss": -7.061163425445557, "global_step": 172506, "epoch": 4107} {"train_loss": -7.142267227172852, "global_step": 172507, "epoch": 4107} {"train_loss": -7.14992618560791, "global_step": 172508, "epoch": 4107} {"train_loss": -7.117911338806152, "global_step": 172509, "epoch": 4107} {"train_loss": -7.075735092163086, "global_step": 172510, "epoch": 4107} {"train_loss": -6.895001411437988, "global_step": 172511, "epoch": 4107} {"train_loss": -7.025750637054443, "global_step": 172512, "epoch": 4107} {"train_loss": -7.11918830871582, "global_step": 172513, "epoch": 4107} {"train_loss": -6.980701923370361, "global_step": 172514, "epoch": 4107} {"train_loss": -6.987707138061523, "global_step": 172515, "epoch": 4107} {"train_loss": -6.95154333114624, "global_step": 172516, "epoch": 4107} {"train_loss": -7.030219078063965, "global_step": 172517, "epoch": 4107} {"train_loss": -6.912036418914795, "global_step": 172518, "epoch": 4107} {"train_loss": -6.739124298095703, "global_step": 172519, "epoch": 4107} {"train_loss": -6.925530433654785, "global_step": 172520, "epoch": 4107} {"train_loss": -6.844263076782227, "global_step": 172521, "epoch": 4107} {"train_loss": -6.872742652893066, "global_step": 172522, "epoch": 4107} {"train_loss": -6.891165256500244, "global_step": 172523, "epoch": 4107} {"train_loss": -6.942449569702148, "global_step": 172524, "epoch": 4107} {"train_loss": -6.925176620483398, "global_step": 172525, "epoch": 4107} {"train_loss": -6.898954391479492, "global_step": 172526, "epoch": 4107} {"train_loss": -6.849264144897461, "global_step": 172527, "epoch": 4107} {"train_loss": -6.967179775238037, "global_step": 172528, "epoch": 4107} {"train_loss": -6.880279541015625, "global_step": 172529, "epoch": 4107} {"train_loss": -7.013517379760742, "global_step": 172530, "epoch": 4107} {"train_loss": -6.913321495056152, "global_step": 172531, "epoch": 4107} {"train_loss": -7.00577449798584, "global_step": 172532, "epoch": 4107} {"train_loss": -7.015360355377197, "global_step": 172533, "epoch": 4107} {"train_loss": -6.936019420623779, "global_step": 172534, "epoch": 4107} {"train_loss": -6.993095273063297, "global_step": 172535, "epoch": 4107, "val_loss": 69251.0703125} {"train_loss": -7.070082187652588, "global_step": 172536, "epoch": 4108} {"train_loss": -6.839112281799316, "global_step": 172537, "epoch": 4108} {"train_loss": -6.981078147888184, "global_step": 172538, "epoch": 4108} {"train_loss": -7.015512466430664, "global_step": 172539, "epoch": 4108} {"train_loss": -7.0444488525390625, "global_step": 172540, "epoch": 4108} {"train_loss": -7.049105644226074, "global_step": 172541, "epoch": 4108} {"train_loss": -6.919530868530273, "global_step": 172542, "epoch": 4108} {"train_loss": -7.050963878631592, "global_step": 172543, "epoch": 4108} {"train_loss": -7.085202217102051, "global_step": 172544, "epoch": 4108} {"train_loss": -7.096507549285889, "global_step": 172545, "epoch": 4108} {"train_loss": -7.047264099121094, "global_step": 172546, "epoch": 4108} {"train_loss": -7.013873100280762, "global_step": 172547, "epoch": 4108} {"train_loss": -7.136183738708496, "global_step": 172548, "epoch": 4108} {"train_loss": -7.0623369216918945, "global_step": 172549, "epoch": 4108} {"train_loss": -7.076379776000977, "global_step": 172550, "epoch": 4108} {"train_loss": -7.023898601531982, "global_step": 172551, "epoch": 4108} {"train_loss": -7.003212928771973, "global_step": 172552, "epoch": 4108} {"train_loss": -7.110057830810547, "global_step": 172553, "epoch": 4108} {"train_loss": -6.942286491394043, "global_step": 172554, "epoch": 4108} {"train_loss": -7.0305585861206055, "global_step": 172555, "epoch": 4108} {"train_loss": -7.160968780517578, "global_step": 172556, "epoch": 4108} {"train_loss": -7.102201461791992, "global_step": 172557, "epoch": 4108} {"train_loss": -7.141146183013916, "global_step": 172558, "epoch": 4108} {"train_loss": -7.06782865524292, "global_step": 172559, "epoch": 4108} {"train_loss": -7.107278823852539, "global_step": 172560, "epoch": 4108} {"train_loss": -7.003129959106445, "global_step": 172561, "epoch": 4108} {"train_loss": -7.031854629516602, "global_step": 172562, "epoch": 4108} {"train_loss": -7.1156768798828125, "global_step": 172563, "epoch": 4108} {"train_loss": -7.105960369110107, "global_step": 172564, "epoch": 4108} {"train_loss": -7.164956092834473, "global_step": 172565, "epoch": 4108} {"train_loss": -7.060332775115967, "global_step": 172566, "epoch": 4108} {"train_loss": -7.115810394287109, "global_step": 172567, "epoch": 4108} {"train_loss": -7.013737201690674, "global_step": 172568, "epoch": 4108} {"train_loss": -7.034309387207031, "global_step": 172569, "epoch": 4108} {"train_loss": -7.02081298828125, "global_step": 172570, "epoch": 4108} {"train_loss": -7.038106918334961, "global_step": 172571, "epoch": 4108} {"train_loss": -6.9555182456970215, "global_step": 172572, "epoch": 4108} {"train_loss": -7.108356475830078, "global_step": 172573, "epoch": 4108} {"train_loss": -7.027230739593506, "global_step": 172574, "epoch": 4108} {"train_loss": -6.855468273162842, "global_step": 172575, "epoch": 4108} {"train_loss": -7.068853378295898, "global_step": 172576, "epoch": 4108} {"train_loss": -7.0442967755453925, "global_step": 172577, "epoch": 4108, "val_loss": 68888.703125} {"train_loss": -6.946183204650879, "global_step": 172578, "epoch": 4109} {"train_loss": -7.075535297393799, "global_step": 172579, "epoch": 4109} {"train_loss": -6.9806671142578125, "global_step": 172580, "epoch": 4109} {"train_loss": -7.078747272491455, "global_step": 172581, "epoch": 4109} {"train_loss": -7.013368129730225, "global_step": 172582, "epoch": 4109} {"train_loss": -6.936257362365723, "global_step": 172583, "epoch": 4109} {"train_loss": -7.042754173278809, "global_step": 172584, "epoch": 4109} {"train_loss": -6.958858013153076, "global_step": 172585, "epoch": 4109} {"train_loss": -7.00321626663208, "global_step": 172586, "epoch": 4109} {"train_loss": -6.963056564331055, "global_step": 172587, "epoch": 4109} {"train_loss": -7.046111106872559, "global_step": 172588, "epoch": 4109} {"train_loss": -7.084280014038086, "global_step": 172589, "epoch": 4109} {"train_loss": -6.874975204467773, "global_step": 172590, "epoch": 4109} {"train_loss": -7.000898361206055, "global_step": 172591, "epoch": 4109} {"train_loss": -7.077549457550049, "global_step": 172592, "epoch": 4109} {"train_loss": -6.970574378967285, "global_step": 172593, "epoch": 4109} {"train_loss": -7.135615348815918, "global_step": 172594, "epoch": 4109} {"train_loss": -7.071854114532471, "global_step": 172595, "epoch": 4109} {"train_loss": -7.021956443786621, "global_step": 172596, "epoch": 4109} {"train_loss": -6.983975410461426, "global_step": 172597, "epoch": 4109} {"train_loss": -6.966826438903809, "global_step": 172598, "epoch": 4109} {"train_loss": -7.006554126739502, "global_step": 172599, "epoch": 4109} {"train_loss": -6.861598014831543, "global_step": 172600, "epoch": 4109} {"train_loss": -7.0912675857543945, "global_step": 172601, "epoch": 4109} {"train_loss": -7.006758689880371, "global_step": 172602, "epoch": 4109} {"train_loss": -6.828904151916504, "global_step": 172603, "epoch": 4109} {"train_loss": -7.003530502319336, "global_step": 172604, "epoch": 4109} {"train_loss": -6.775023460388184, "global_step": 172605, "epoch": 4109} {"train_loss": -6.877475261688232, "global_step": 172606, "epoch": 4109} {"train_loss": -6.882414817810059, "global_step": 172607, "epoch": 4109} {"train_loss": -6.8137335777282715, "global_step": 172608, "epoch": 4109} {"train_loss": -6.960991382598877, "global_step": 172609, "epoch": 4109} {"train_loss": -6.795743465423584, "global_step": 172610, "epoch": 4109} {"train_loss": -6.98323917388916, "global_step": 172611, "epoch": 4109} {"train_loss": -6.787252426147461, "global_step": 172612, "epoch": 4109} {"train_loss": -6.942758560180664, "global_step": 172613, "epoch": 4109} {"train_loss": -6.98142671585083, "global_step": 172614, "epoch": 4109} {"train_loss": -6.989361763000488, "global_step": 172615, "epoch": 4109} {"train_loss": -6.8759989738464355, "global_step": 172616, "epoch": 4109} {"train_loss": -6.808694362640381, "global_step": 172617, "epoch": 4109} {"train_loss": -6.9109649658203125, "global_step": 172618, "epoch": 4109} {"train_loss": -6.960315534046718, "global_step": 172619, "epoch": 4109, "val_loss": 69064.0078125} {"train_loss": -7.039288520812988, "global_step": 172620, "epoch": 4110} {"train_loss": -6.945508003234863, "global_step": 172621, "epoch": 4110} {"train_loss": -6.960422515869141, "global_step": 172622, "epoch": 4110} {"train_loss": -6.978728771209717, "global_step": 172623, "epoch": 4110} {"train_loss": -6.9121904373168945, "global_step": 172624, "epoch": 4110} {"train_loss": -6.876289367675781, "global_step": 172625, "epoch": 4110} {"train_loss": -6.941976547241211, "global_step": 172626, "epoch": 4110} {"train_loss": -7.076539039611816, "global_step": 172627, "epoch": 4110} {"train_loss": -6.9928789138793945, "global_step": 172628, "epoch": 4110} {"train_loss": -7.035919189453125, "global_step": 172629, "epoch": 4110} {"train_loss": -7.001566410064697, "global_step": 172630, "epoch": 4110} {"train_loss": -6.992110252380371, "global_step": 172631, "epoch": 4110} {"train_loss": -7.060579299926758, "global_step": 172632, "epoch": 4110} {"train_loss": -7.0654096603393555, "global_step": 172633, "epoch": 4110} {"train_loss": -7.068408966064453, "global_step": 172634, "epoch": 4110} {"train_loss": -7.022299766540527, "global_step": 172635, "epoch": 4110} {"train_loss": -7.067531585693359, "global_step": 172636, "epoch": 4110} {"train_loss": -6.988039970397949, "global_step": 172637, "epoch": 4110} {"train_loss": -7.107547760009766, "global_step": 172638, "epoch": 4110} {"train_loss": -6.918490886688232, "global_step": 172639, "epoch": 4110} {"train_loss": -7.179283618927002, "global_step": 172640, "epoch": 4110} {"train_loss": -7.187838554382324, "global_step": 172641, "epoch": 4110} {"train_loss": -7.099579811096191, "global_step": 172642, "epoch": 4110} {"train_loss": -7.078949928283691, "global_step": 172643, "epoch": 4110} {"train_loss": -7.119416236877441, "global_step": 172644, "epoch": 4110} {"train_loss": -7.198343753814697, "global_step": 172645, "epoch": 4110} {"train_loss": -7.1339335441589355, "global_step": 172646, "epoch": 4110} {"train_loss": -7.0434675216674805, "global_step": 172647, "epoch": 4110} {"train_loss": -7.179258346557617, "global_step": 172648, "epoch": 4110} {"train_loss": -7.1142578125, "global_step": 172649, "epoch": 4110} {"train_loss": -7.088204383850098, "global_step": 172650, "epoch": 4110} {"train_loss": -7.0222554206848145, "global_step": 172651, "epoch": 4110} {"train_loss": -7.1375932693481445, "global_step": 172652, "epoch": 4110} {"train_loss": -7.041314601898193, "global_step": 172653, "epoch": 4110} {"train_loss": -7.171157360076904, "global_step": 172654, "epoch": 4110} {"train_loss": -7.068842887878418, "global_step": 172655, "epoch": 4110} {"train_loss": -7.092501163482666, "global_step": 172656, "epoch": 4110} {"train_loss": -7.10668420791626, "global_step": 172657, "epoch": 4110} {"train_loss": -7.123842239379883, "global_step": 172658, "epoch": 4110} {"train_loss": -6.961446762084961, "global_step": 172659, "epoch": 4110} {"train_loss": -7.080069065093994, "global_step": 172660, "epoch": 4110} {"train_loss": -7.0526541982378275, "global_step": 172661, "epoch": 4110, "val_loss": 69156.34375} {"train_loss": -6.949930191040039, "global_step": 172662, "epoch": 4111} {"train_loss": -7.100122928619385, "global_step": 172663, "epoch": 4111} {"train_loss": -6.905910968780518, "global_step": 172664, "epoch": 4111} {"train_loss": -6.945171356201172, "global_step": 172665, "epoch": 4111} {"train_loss": -7.059319496154785, "global_step": 172666, "epoch": 4111} {"train_loss": -7.009119033813477, "global_step": 172667, "epoch": 4111} {"train_loss": -7.15736198425293, "global_step": 172668, "epoch": 4111} {"train_loss": -7.013917922973633, "global_step": 172669, "epoch": 4111} {"train_loss": -7.007236480712891, "global_step": 172670, "epoch": 4111} {"train_loss": -7.059657573699951, "global_step": 172671, "epoch": 4111} {"train_loss": -7.025168418884277, "global_step": 172672, "epoch": 4111} {"train_loss": -7.038381576538086, "global_step": 172673, "epoch": 4111} {"train_loss": -7.207995414733887, "global_step": 172674, "epoch": 4111} {"train_loss": -6.919572830200195, "global_step": 172675, "epoch": 4111} {"train_loss": -7.035545825958252, "global_step": 172676, "epoch": 4111} {"train_loss": -7.049067497253418, "global_step": 172677, "epoch": 4111} {"train_loss": -7.0610551834106445, "global_step": 172678, "epoch": 4111} {"train_loss": -7.04000186920166, "global_step": 172679, "epoch": 4111} {"train_loss": -6.971646785736084, "global_step": 172680, "epoch": 4111} {"train_loss": -6.972146987915039, "global_step": 172681, "epoch": 4111} {"train_loss": -7.055464744567871, "global_step": 172682, "epoch": 4111} {"train_loss": -7.026898384094238, "global_step": 172683, "epoch": 4111} {"train_loss": -7.016335487365723, "global_step": 172684, "epoch": 4111} {"train_loss": -7.0799336433410645, "global_step": 172685, "epoch": 4111} {"train_loss": -6.996447563171387, "global_step": 172686, "epoch": 4111} {"train_loss": -6.970697402954102, "global_step": 172687, "epoch": 4111} {"train_loss": -7.067378997802734, "global_step": 172688, "epoch": 4111} {"train_loss": -7.031325340270996, "global_step": 172689, "epoch": 4111} {"train_loss": -6.999140739440918, "global_step": 172690, "epoch": 4111} {"train_loss": -7.040575981140137, "global_step": 172691, "epoch": 4111} {"train_loss": -7.137668609619141, "global_step": 172692, "epoch": 4111} {"train_loss": -7.026088714599609, "global_step": 172693, "epoch": 4111} {"train_loss": -7.097235679626465, "global_step": 172694, "epoch": 4111} {"train_loss": -7.019347190856934, "global_step": 172695, "epoch": 4111} {"train_loss": -7.024040222167969, "global_step": 172696, "epoch": 4111} {"train_loss": -7.1151251792907715, "global_step": 172697, "epoch": 4111} {"train_loss": -7.12111759185791, "global_step": 172698, "epoch": 4111} {"train_loss": -7.1996307373046875, "global_step": 172699, "epoch": 4111} {"train_loss": -7.12497091293335, "global_step": 172700, "epoch": 4111} {"train_loss": -7.023896217346191, "global_step": 172701, "epoch": 4111} {"train_loss": -6.902796268463135, "global_step": 172702, "epoch": 4111} {"train_loss": -7.042505945478167, "global_step": 172703, "epoch": 4111, "val_loss": 69061.8359375} {"train_loss": -7.093051910400391, "global_step": 172704, "epoch": 4112} {"train_loss": -7.079259872436523, "global_step": 172705, "epoch": 4112} {"train_loss": -7.179783344268799, "global_step": 172706, "epoch": 4112} {"train_loss": -7.104920387268066, "global_step": 172707, "epoch": 4112} {"train_loss": -7.088177680969238, "global_step": 172708, "epoch": 4112} {"train_loss": -7.056033134460449, "global_step": 172709, "epoch": 4112} {"train_loss": -6.924543380737305, "global_step": 172710, "epoch": 4112} {"train_loss": -7.11331033706665, "global_step": 172711, "epoch": 4112} {"train_loss": -7.136961460113525, "global_step": 172712, "epoch": 4112} {"train_loss": -7.087454795837402, "global_step": 172713, "epoch": 4112} {"train_loss": -6.972835063934326, "global_step": 172714, "epoch": 4112} {"train_loss": -7.115453720092773, "global_step": 172715, "epoch": 4112} {"train_loss": -7.098090171813965, "global_step": 172716, "epoch": 4112} {"train_loss": -7.043135643005371, "global_step": 172717, "epoch": 4112} {"train_loss": -7.057082653045654, "global_step": 172718, "epoch": 4112} {"train_loss": -7.014631271362305, "global_step": 172719, "epoch": 4112} {"train_loss": -7.044685363769531, "global_step": 172720, "epoch": 4112} {"train_loss": -7.0345048904418945, "global_step": 172721, "epoch": 4112} {"train_loss": -7.082221984863281, "global_step": 172722, "epoch": 4112} {"train_loss": -6.999829292297363, "global_step": 172723, "epoch": 4112} {"train_loss": -7.011589050292969, "global_step": 172724, "epoch": 4112} {"train_loss": -7.136559963226318, "global_step": 172725, "epoch": 4112} {"train_loss": -6.957556247711182, "global_step": 172726, "epoch": 4112} {"train_loss": -7.097879409790039, "global_step": 172727, "epoch": 4112} {"train_loss": -7.119474411010742, "global_step": 172728, "epoch": 4112} {"train_loss": -7.006389617919922, "global_step": 172729, "epoch": 4112} {"train_loss": -7.0353193283081055, "global_step": 172730, "epoch": 4112} {"train_loss": -7.005419731140137, "global_step": 172731, "epoch": 4112} {"train_loss": -7.003763675689697, "global_step": 172732, "epoch": 4112} {"train_loss": -7.097202301025391, "global_step": 172733, "epoch": 4112} {"train_loss": -7.005420207977295, "global_step": 172734, "epoch": 4112} {"train_loss": -6.995163440704346, "global_step": 172735, "epoch": 4112} {"train_loss": -7.015770435333252, "global_step": 172736, "epoch": 4112} {"train_loss": -6.964109420776367, "global_step": 172737, "epoch": 4112} {"train_loss": -6.937684535980225, "global_step": 172738, "epoch": 4112} {"train_loss": -7.10647439956665, "global_step": 172739, "epoch": 4112} {"train_loss": -6.969433784484863, "global_step": 172740, "epoch": 4112} {"train_loss": -7.066074848175049, "global_step": 172741, "epoch": 4112} {"train_loss": -7.083406925201416, "global_step": 172742, "epoch": 4112} {"train_loss": -7.056771755218506, "global_step": 172743, "epoch": 4112} {"train_loss": -7.088356971740723, "global_step": 172744, "epoch": 4112} {"train_loss": -7.051555440539405, "global_step": 172745, "epoch": 4112, "val_loss": 69005.265625} {"train_loss": -6.999786376953125, "global_step": 172746, "epoch": 4113} {"train_loss": -7.005996227264404, "global_step": 172747, "epoch": 4113} {"train_loss": -7.074112892150879, "global_step": 172748, "epoch": 4113} {"train_loss": -7.119516372680664, "global_step": 172749, "epoch": 4113} {"train_loss": -7.027862548828125, "global_step": 172750, "epoch": 4113} {"train_loss": -7.001584529876709, "global_step": 172751, "epoch": 4113} {"train_loss": -7.127231597900391, "global_step": 172752, "epoch": 4113} {"train_loss": -7.030867576599121, "global_step": 172753, "epoch": 4113} {"train_loss": -6.921794891357422, "global_step": 172754, "epoch": 4113} {"train_loss": -7.063432693481445, "global_step": 172755, "epoch": 4113} {"train_loss": -7.133554458618164, "global_step": 172756, "epoch": 4113} {"train_loss": -7.102553844451904, "global_step": 172757, "epoch": 4113} {"train_loss": -7.062509536743164, "global_step": 172758, "epoch": 4113} {"train_loss": -7.097883224487305, "global_step": 172759, "epoch": 4113} {"train_loss": -7.0644001960754395, "global_step": 172760, "epoch": 4113} {"train_loss": -7.030711650848389, "global_step": 172761, "epoch": 4113} {"train_loss": -7.046560764312744, "global_step": 172762, "epoch": 4113} {"train_loss": -7.061809062957764, "global_step": 172763, "epoch": 4113} {"train_loss": -6.9992499351501465, "global_step": 172764, "epoch": 4113} {"train_loss": -7.088259696960449, "global_step": 172765, "epoch": 4113} {"train_loss": -6.856043338775635, "global_step": 172766, "epoch": 4113} {"train_loss": -6.986884117126465, "global_step": 172767, "epoch": 4113} {"train_loss": -7.04586935043335, "global_step": 172768, "epoch": 4113} {"train_loss": -7.098127365112305, "global_step": 172769, "epoch": 4113} {"train_loss": -7.03072452545166, "global_step": 172770, "epoch": 4113} {"train_loss": -7.039377212524414, "global_step": 172771, "epoch": 4113} {"train_loss": -7.067845344543457, "global_step": 172772, "epoch": 4113} {"train_loss": -7.085838317871094, "global_step": 172773, "epoch": 4113} {"train_loss": -7.0701904296875, "global_step": 172774, "epoch": 4113} {"train_loss": -7.100953102111816, "global_step": 172775, "epoch": 4113} {"train_loss": -7.029196739196777, "global_step": 172776, "epoch": 4113} {"train_loss": -7.057669639587402, "global_step": 172777, "epoch": 4113} {"train_loss": -6.990418434143066, "global_step": 172778, "epoch": 4113} {"train_loss": -7.11492919921875, "global_step": 172779, "epoch": 4113} {"train_loss": -7.00969934463501, "global_step": 172780, "epoch": 4113} {"train_loss": -7.030210494995117, "global_step": 172781, "epoch": 4113} {"train_loss": -7.112857818603516, "global_step": 172782, "epoch": 4113} {"train_loss": -7.045466899871826, "global_step": 172783, "epoch": 4113} {"train_loss": -7.094076156616211, "global_step": 172784, "epoch": 4113} {"train_loss": -7.072422981262207, "global_step": 172785, "epoch": 4113} {"train_loss": -7.095252513885498, "global_step": 172786, "epoch": 4113} {"train_loss": -7.054288035347348, "global_step": 172787, "epoch": 4113, "val_loss": 69003.6640625} {"train_loss": -7.014238357543945, "global_step": 172788, "epoch": 4114} {"train_loss": -7.152766227722168, "global_step": 172789, "epoch": 4114} {"train_loss": -7.285515785217285, "global_step": 172790, "epoch": 4114} {"train_loss": -7.182926177978516, "global_step": 172791, "epoch": 4114} {"train_loss": -7.148233890533447, "global_step": 172792, "epoch": 4114} {"train_loss": -7.126290798187256, "global_step": 172793, "epoch": 4114} {"train_loss": -7.140832424163818, "global_step": 172794, "epoch": 4114} {"train_loss": -7.064063549041748, "global_step": 172795, "epoch": 4114} {"train_loss": -7.151578903198242, "global_step": 172796, "epoch": 4114} {"train_loss": -7.098923683166504, "global_step": 172797, "epoch": 4114} {"train_loss": -7.093869209289551, "global_step": 172798, "epoch": 4114} {"train_loss": -7.022208213806152, "global_step": 172799, "epoch": 4114} {"train_loss": -7.005940914154053, "global_step": 172800, "epoch": 4114} {"train_loss": -7.019280910491943, "global_step": 172801, "epoch": 4114} {"train_loss": -6.920310020446777, "global_step": 172802, "epoch": 4114} {"train_loss": -7.037394046783447, "global_step": 172803, "epoch": 4114} {"train_loss": -6.9004740715026855, "global_step": 172804, "epoch": 4114} {"train_loss": -6.967740535736084, "global_step": 172805, "epoch": 4114} {"train_loss": -7.162803649902344, "global_step": 172806, "epoch": 4114} {"train_loss": -6.9641032218933105, "global_step": 172807, "epoch": 4114} {"train_loss": -7.019286155700684, "global_step": 172808, "epoch": 4114} {"train_loss": -7.084070205688477, "global_step": 172809, "epoch": 4114} {"train_loss": -7.08711051940918, "global_step": 172810, "epoch": 4114} {"train_loss": -7.150223255157471, "global_step": 172811, "epoch": 4114} {"train_loss": -6.974071502685547, "global_step": 172812, "epoch": 4114} {"train_loss": -6.981973648071289, "global_step": 172813, "epoch": 4114} {"train_loss": -7.085369110107422, "global_step": 172814, "epoch": 4114} {"train_loss": -6.957043170928955, "global_step": 172815, "epoch": 4114} {"train_loss": -6.96904182434082, "global_step": 172816, "epoch": 4114} {"train_loss": -6.943635940551758, "global_step": 172817, "epoch": 4114} {"train_loss": -6.984933853149414, "global_step": 172818, "epoch": 4114} {"train_loss": -7.01528787612915, "global_step": 172819, "epoch": 4114} {"train_loss": -6.997499465942383, "global_step": 172820, "epoch": 4114} {"train_loss": -7.054724216461182, "global_step": 172821, "epoch": 4114} {"train_loss": -6.992801189422607, "global_step": 172822, "epoch": 4114} {"train_loss": -6.963000774383545, "global_step": 172823, "epoch": 4114} {"train_loss": -6.979903697967529, "global_step": 172824, "epoch": 4114} {"train_loss": -7.037965297698975, "global_step": 172825, "epoch": 4114} {"train_loss": -6.9712653160095215, "global_step": 172826, "epoch": 4114} {"train_loss": -6.976613998413086, "global_step": 172827, "epoch": 4114} {"train_loss": -7.0400190353393555, "global_step": 172828, "epoch": 4114} {"train_loss": -7.038854496819632, "global_step": 172829, "epoch": 4114, "val_loss": 69430.4140625} {"train_loss": -7.004071235656738, "global_step": 172830, "epoch": 4115} {"train_loss": -7.005218505859375, "global_step": 172831, "epoch": 4115} {"train_loss": -7.062582969665527, "global_step": 172832, "epoch": 4115} {"train_loss": -7.055443286895752, "global_step": 172833, "epoch": 4115} {"train_loss": -7.110842704772949, "global_step": 172834, "epoch": 4115} {"train_loss": -7.062079429626465, "global_step": 172835, "epoch": 4115} {"train_loss": -6.950531005859375, "global_step": 172836, "epoch": 4115} {"train_loss": -7.1078996658325195, "global_step": 172837, "epoch": 4115} {"train_loss": -7.0346832275390625, "global_step": 172838, "epoch": 4115} {"train_loss": -7.032628059387207, "global_step": 172839, "epoch": 4115} {"train_loss": -7.075933456420898, "global_step": 172840, "epoch": 4115} {"train_loss": -7.0227952003479, "global_step": 172841, "epoch": 4115} {"train_loss": -7.029497146606445, "global_step": 172842, "epoch": 4115} {"train_loss": -6.937784194946289, "global_step": 172843, "epoch": 4115} {"train_loss": -6.970545768737793, "global_step": 172844, "epoch": 4115} {"train_loss": -6.964132308959961, "global_step": 172845, "epoch": 4115} {"train_loss": -7.020846366882324, "global_step": 172846, "epoch": 4115} {"train_loss": -7.008902072906494, "global_step": 172847, "epoch": 4115} {"train_loss": -7.003201484680176, "global_step": 172848, "epoch": 4115} {"train_loss": -7.05728816986084, "global_step": 172849, "epoch": 4115} {"train_loss": -7.057343006134033, "global_step": 172850, "epoch": 4115} {"train_loss": -7.015902519226074, "global_step": 172851, "epoch": 4115} {"train_loss": -7.030765533447266, "global_step": 172852, "epoch": 4115} {"train_loss": -7.028417110443115, "global_step": 172853, "epoch": 4115} {"train_loss": -7.081610679626465, "global_step": 172854, "epoch": 4115} {"train_loss": -7.154945373535156, "global_step": 172855, "epoch": 4115} {"train_loss": -7.204311370849609, "global_step": 172856, "epoch": 4115} {"train_loss": -7.079624176025391, "global_step": 172857, "epoch": 4115} {"train_loss": -7.031081676483154, "global_step": 172858, "epoch": 4115} {"train_loss": -7.109189033508301, "global_step": 172859, "epoch": 4115} {"train_loss": -7.0816850662231445, "global_step": 172860, "epoch": 4115} {"train_loss": -7.128702163696289, "global_step": 172861, "epoch": 4115} {"train_loss": -7.11630916595459, "global_step": 172862, "epoch": 4115} {"train_loss": -6.945687770843506, "global_step": 172863, "epoch": 4115} {"train_loss": -7.0944976806640625, "global_step": 172864, "epoch": 4115} {"train_loss": -7.02141809463501, "global_step": 172865, "epoch": 4115} {"train_loss": -7.135429382324219, "global_step": 172866, "epoch": 4115} {"train_loss": -7.193947792053223, "global_step": 172867, "epoch": 4115} {"train_loss": -6.917119026184082, "global_step": 172868, "epoch": 4115} {"train_loss": -7.095395088195801, "global_step": 172869, "epoch": 4115} {"train_loss": -6.943668365478516, "global_step": 172870, "epoch": 4115} {"train_loss": -7.047054574603126, "global_step": 172871, "epoch": 4115, "val_loss": 69047.6015625} {"train_loss": -6.91566276550293, "global_step": 172872, "epoch": 4116} {"train_loss": -7.077348709106445, "global_step": 172873, "epoch": 4116} {"train_loss": -7.035270690917969, "global_step": 172874, "epoch": 4116} {"train_loss": -6.958320617675781, "global_step": 172875, "epoch": 4116} {"train_loss": -6.976532936096191, "global_step": 172876, "epoch": 4116} {"train_loss": -7.00704288482666, "global_step": 172877, "epoch": 4116} {"train_loss": -7.072877883911133, "global_step": 172878, "epoch": 4116} {"train_loss": -7.014400959014893, "global_step": 172879, "epoch": 4116} {"train_loss": -7.033489227294922, "global_step": 172880, "epoch": 4116} {"train_loss": -6.994625091552734, "global_step": 172881, "epoch": 4116} {"train_loss": -7.16095495223999, "global_step": 172882, "epoch": 4116} {"train_loss": -6.86993408203125, "global_step": 172883, "epoch": 4116} {"train_loss": -7.000122547149658, "global_step": 172884, "epoch": 4116} {"train_loss": -7.031411647796631, "global_step": 172885, "epoch": 4116} {"train_loss": -7.029365539550781, "global_step": 172886, "epoch": 4116} {"train_loss": -7.048203945159912, "global_step": 172887, "epoch": 4116} {"train_loss": -7.004502296447754, "global_step": 172888, "epoch": 4116} {"train_loss": -7.034672737121582, "global_step": 172889, "epoch": 4116} {"train_loss": -6.987070560455322, "global_step": 172890, "epoch": 4116} {"train_loss": -7.026495456695557, "global_step": 172891, "epoch": 4116} {"train_loss": -6.971235275268555, "global_step": 172892, "epoch": 4116} {"train_loss": -7.005073070526123, "global_step": 172893, "epoch": 4116} {"train_loss": -6.991744041442871, "global_step": 172894, "epoch": 4116} {"train_loss": -7.057801246643066, "global_step": 172895, "epoch": 4116} {"train_loss": -7.015280723571777, "global_step": 172896, "epoch": 4116} {"train_loss": -6.970925331115723, "global_step": 172897, "epoch": 4116} {"train_loss": -6.953269958496094, "global_step": 172898, "epoch": 4116} {"train_loss": -6.945876598358154, "global_step": 172899, "epoch": 4116} {"train_loss": -6.967120170593262, "global_step": 172900, "epoch": 4116} {"train_loss": -7.006557464599609, "global_step": 172901, "epoch": 4116} {"train_loss": -7.074926376342773, "global_step": 172902, "epoch": 4116} {"train_loss": -6.96414852142334, "global_step": 172903, "epoch": 4116} {"train_loss": -7.013017654418945, "global_step": 172904, "epoch": 4116} {"train_loss": -7.091413974761963, "global_step": 172905, "epoch": 4116} {"train_loss": -7.042294502258301, "global_step": 172906, "epoch": 4116} {"train_loss": -7.112794399261475, "global_step": 172907, "epoch": 4116} {"train_loss": -7.016883373260498, "global_step": 172908, "epoch": 4116} {"train_loss": -7.051424026489258, "global_step": 172909, "epoch": 4116} {"train_loss": -7.077394485473633, "global_step": 172910, "epoch": 4116} {"train_loss": -6.982224464416504, "global_step": 172911, "epoch": 4116} {"train_loss": -7.111537933349609, "global_step": 172912, "epoch": 4116} {"train_loss": -7.0188102040972025, "global_step": 172913, "epoch": 4116, "val_loss": 69158.71875} {"train_loss": -7.085366249084473, "global_step": 172914, "epoch": 4117} {"train_loss": -6.978384017944336, "global_step": 172915, "epoch": 4117} {"train_loss": -6.874929904937744, "global_step": 172916, "epoch": 4117} {"train_loss": -7.029767036437988, "global_step": 172917, "epoch": 4117} {"train_loss": -7.078517913818359, "global_step": 172918, "epoch": 4117} {"train_loss": -7.140226364135742, "global_step": 172919, "epoch": 4117} {"train_loss": -7.125636100769043, "global_step": 172920, "epoch": 4117} {"train_loss": -7.014915466308594, "global_step": 172921, "epoch": 4117} {"train_loss": -7.087975025177002, "global_step": 172922, "epoch": 4117} {"train_loss": -7.165590286254883, "global_step": 172923, "epoch": 4117} {"train_loss": -6.9557342529296875, "global_step": 172924, "epoch": 4117} {"train_loss": -6.996764183044434, "global_step": 172925, "epoch": 4117} {"train_loss": -6.988064765930176, "global_step": 172926, "epoch": 4117} {"train_loss": -7.078219413757324, "global_step": 172927, "epoch": 4117} {"train_loss": -7.090270042419434, "global_step": 172928, "epoch": 4117} {"train_loss": -7.143337726593018, "global_step": 172929, "epoch": 4117} {"train_loss": -7.0605573654174805, "global_step": 172930, "epoch": 4117} {"train_loss": -6.937448501586914, "global_step": 172931, "epoch": 4117} {"train_loss": -7.081039905548096, "global_step": 172932, "epoch": 4117} {"train_loss": -7.140041351318359, "global_step": 172933, "epoch": 4117} {"train_loss": -7.059259414672852, "global_step": 172934, "epoch": 4117} {"train_loss": -7.053953170776367, "global_step": 172935, "epoch": 4117} {"train_loss": -7.059775352478027, "global_step": 172936, "epoch": 4117} {"train_loss": -7.098753929138184, "global_step": 172937, "epoch": 4117} {"train_loss": -7.003166675567627, "global_step": 172938, "epoch": 4117} {"train_loss": -7.042644500732422, "global_step": 172939, "epoch": 4117} {"train_loss": -7.158332824707031, "global_step": 172940, "epoch": 4117} {"train_loss": -7.0156636238098145, "global_step": 172941, "epoch": 4117} {"train_loss": -7.122668743133545, "global_step": 172942, "epoch": 4117} {"train_loss": -7.089219093322754, "global_step": 172943, "epoch": 4117} {"train_loss": -7.12562370300293, "global_step": 172944, "epoch": 4117} {"train_loss": -7.192948818206787, "global_step": 172945, "epoch": 4117} {"train_loss": -7.119813919067383, "global_step": 172946, "epoch": 4117} {"train_loss": -7.096139907836914, "global_step": 172947, "epoch": 4117} {"train_loss": -7.120926856994629, "global_step": 172948, "epoch": 4117} {"train_loss": -6.96986722946167, "global_step": 172949, "epoch": 4117} {"train_loss": -7.0917463302612305, "global_step": 172950, "epoch": 4117} {"train_loss": -7.030393600463867, "global_step": 172951, "epoch": 4117} {"train_loss": -7.093354225158691, "global_step": 172952, "epoch": 4117} {"train_loss": -7.131237983703613, "global_step": 172953, "epoch": 4117} {"train_loss": -7.115898609161377, "global_step": 172954, "epoch": 4117} {"train_loss": -7.070518300646827, "global_step": 172955, "epoch": 4117, "val_loss": 69003.5546875} {"train_loss": -7.207065105438232, "global_step": 172956, "epoch": 4118} {"train_loss": -7.11259651184082, "global_step": 172957, "epoch": 4118} {"train_loss": -7.062078475952148, "global_step": 172958, "epoch": 4118} {"train_loss": -7.023317337036133, "global_step": 172959, "epoch": 4118} {"train_loss": -7.179888725280762, "global_step": 172960, "epoch": 4118} {"train_loss": -7.0805983543396, "global_step": 172961, "epoch": 4118} {"train_loss": -7.172557830810547, "global_step": 172962, "epoch": 4118} {"train_loss": -7.187465190887451, "global_step": 172963, "epoch": 4118} {"train_loss": -7.068803787231445, "global_step": 172964, "epoch": 4118} {"train_loss": -7.158854007720947, "global_step": 172965, "epoch": 4118} {"train_loss": -7.127040386199951, "global_step": 172966, "epoch": 4118} {"train_loss": -7.114551067352295, "global_step": 172967, "epoch": 4118} {"train_loss": -7.164877891540527, "global_step": 172968, "epoch": 4118} {"train_loss": -7.214916229248047, "global_step": 172969, "epoch": 4118} {"train_loss": -7.08669376373291, "global_step": 172970, "epoch": 4118} {"train_loss": -7.181206226348877, "global_step": 172971, "epoch": 4118} {"train_loss": -7.027562141418457, "global_step": 172972, "epoch": 4118} {"train_loss": -7.020567417144775, "global_step": 172973, "epoch": 4118} {"train_loss": -7.102692604064941, "global_step": 172974, "epoch": 4118} {"train_loss": -7.076154708862305, "global_step": 172975, "epoch": 4118} {"train_loss": -6.9827470779418945, "global_step": 172976, "epoch": 4118} {"train_loss": -7.055401802062988, "global_step": 172977, "epoch": 4118} {"train_loss": -7.117147445678711, "global_step": 172978, "epoch": 4118} {"train_loss": -6.847087860107422, "global_step": 172979, "epoch": 4118} {"train_loss": -7.098146438598633, "global_step": 172980, "epoch": 4118} {"train_loss": -6.992010593414307, "global_step": 172981, "epoch": 4118} {"train_loss": -6.91343879699707, "global_step": 172982, "epoch": 4118} {"train_loss": -7.087553977966309, "global_step": 172983, "epoch": 4118} {"train_loss": -6.924932479858398, "global_step": 172984, "epoch": 4118} {"train_loss": -6.982935905456543, "global_step": 172985, "epoch": 4118} {"train_loss": -7.084000110626221, "global_step": 172986, "epoch": 4118} {"train_loss": -6.986347198486328, "global_step": 172987, "epoch": 4118} {"train_loss": -6.950778007507324, "global_step": 172988, "epoch": 4118} {"train_loss": -6.995098114013672, "global_step": 172989, "epoch": 4118} {"train_loss": -6.849520683288574, "global_step": 172990, "epoch": 4118} {"train_loss": -6.980725288391113, "global_step": 172991, "epoch": 4118} {"train_loss": -6.87290620803833, "global_step": 172992, "epoch": 4118} {"train_loss": -7.021297454833984, "global_step": 172993, "epoch": 4118} {"train_loss": -6.898932933807373, "global_step": 172994, "epoch": 4118} {"train_loss": -6.9149980545043945, "global_step": 172995, "epoch": 4118} {"train_loss": -6.967349052429199, "global_step": 172996, "epoch": 4118} {"train_loss": -7.042587938762846, "global_step": 172997, "epoch": 4118, "val_loss": 69397.375} {"train_loss": -6.99787712097168, "global_step": 172998, "epoch": 4119} {"train_loss": -7.002485275268555, "global_step": 172999, "epoch": 4119} {"train_loss": -6.951420783996582, "global_step": 173000, "epoch": 4119} {"train_loss": -7.003192901611328, "global_step": 173001, "epoch": 4119} {"train_loss": -7.07366418838501, "global_step": 173002, "epoch": 4119} {"train_loss": -6.92875862121582, "global_step": 173003, "epoch": 4119} {"train_loss": -7.114077568054199, "global_step": 173004, "epoch": 4119} {"train_loss": -7.0539960861206055, "global_step": 173005, "epoch": 4119} {"train_loss": -7.048361301422119, "global_step": 173006, "epoch": 4119} {"train_loss": -7.073615550994873, "global_step": 173007, "epoch": 4119} {"train_loss": -7.008963584899902, "global_step": 173008, "epoch": 4119} {"train_loss": -6.984359264373779, "global_step": 173009, "epoch": 4119} {"train_loss": -6.990935802459717, "global_step": 173010, "epoch": 4119} {"train_loss": -7.1130266189575195, "global_step": 173011, "epoch": 4119} {"train_loss": -7.066269397735596, "global_step": 173012, "epoch": 4119} {"train_loss": -6.957400798797607, "global_step": 173013, "epoch": 4119} {"train_loss": -6.969132423400879, "global_step": 173014, "epoch": 4119} {"train_loss": -6.971071243286133, "global_step": 173015, "epoch": 4119} {"train_loss": -7.038089752197266, "global_step": 173016, "epoch": 4119} {"train_loss": -7.131078720092773, "global_step": 173017, "epoch": 4119} {"train_loss": -7.068563938140869, "global_step": 173018, "epoch": 4119} {"train_loss": -7.102557182312012, "global_step": 173019, "epoch": 4119} {"train_loss": -7.032600402832031, "global_step": 173020, "epoch": 4119} {"train_loss": -7.040104866027832, "global_step": 173021, "epoch": 4119} {"train_loss": -7.085057258605957, "global_step": 173022, "epoch": 4119} {"train_loss": -7.123291015625, "global_step": 173023, "epoch": 4119} {"train_loss": -7.113657474517822, "global_step": 173024, "epoch": 4119} {"train_loss": -7.132245063781738, "global_step": 173025, "epoch": 4119} {"train_loss": -7.1672563552856445, "global_step": 173026, "epoch": 4119} {"train_loss": -7.121699810028076, "global_step": 173027, "epoch": 4119} {"train_loss": -7.081108093261719, "global_step": 173028, "epoch": 4119} {"train_loss": -7.082103729248047, "global_step": 173029, "epoch": 4119} {"train_loss": -7.084067344665527, "global_step": 173030, "epoch": 4119} {"train_loss": -7.168831825256348, "global_step": 173031, "epoch": 4119} {"train_loss": -7.074223518371582, "global_step": 173032, "epoch": 4119} {"train_loss": -6.912572860717773, "global_step": 173033, "epoch": 4119} {"train_loss": -7.010346412658691, "global_step": 173034, "epoch": 4119} {"train_loss": -7.119887828826904, "global_step": 173035, "epoch": 4119} {"train_loss": -6.8600263595581055, "global_step": 173036, "epoch": 4119} {"train_loss": -7.123603343963623, "global_step": 173037, "epoch": 4119} {"train_loss": -7.021604537963867, "global_step": 173038, "epoch": 4119} {"train_loss": -7.045957849139259, "global_step": 173039, "epoch": 4119, "val_loss": 68988.859375} {"train_loss": -7.069919109344482, "global_step": 173040, "epoch": 4120} {"train_loss": -6.895441055297852, "global_step": 173041, "epoch": 4120} {"train_loss": -6.996600151062012, "global_step": 173042, "epoch": 4120} {"train_loss": -6.968043327331543, "global_step": 173043, "epoch": 4120} {"train_loss": -6.815900802612305, "global_step": 173044, "epoch": 4120} {"train_loss": -7.1204833984375, "global_step": 173045, "epoch": 4120} {"train_loss": -6.778013229370117, "global_step": 173046, "epoch": 4120} {"train_loss": -7.002931594848633, "global_step": 173047, "epoch": 4120} {"train_loss": -6.727256774902344, "global_step": 173048, "epoch": 4120} {"train_loss": -6.891998291015625, "global_step": 173049, "epoch": 4120} {"train_loss": -6.902499198913574, "global_step": 173050, "epoch": 4120} {"train_loss": -6.81320858001709, "global_step": 173051, "epoch": 4120} {"train_loss": -6.986531734466553, "global_step": 173052, "epoch": 4120} {"train_loss": -7.016698837280273, "global_step": 173053, "epoch": 4120} {"train_loss": -6.928519248962402, "global_step": 173054, "epoch": 4120} {"train_loss": -7.029547691345215, "global_step": 173055, "epoch": 4120} {"train_loss": -7.006746292114258, "global_step": 173056, "epoch": 4120} {"train_loss": -6.853248596191406, "global_step": 173057, "epoch": 4120} {"train_loss": -6.8627214431762695, "global_step": 173058, "epoch": 4120} {"train_loss": -6.956973075866699, "global_step": 173059, "epoch": 4120} {"train_loss": -6.953602313995361, "global_step": 173060, "epoch": 4120} {"train_loss": -7.027489185333252, "global_step": 173061, "epoch": 4120} {"train_loss": -7.01814603805542, "global_step": 173062, "epoch": 4120} {"train_loss": -7.00963020324707, "global_step": 173063, "epoch": 4120} {"train_loss": -7.055129051208496, "global_step": 173064, "epoch": 4120} {"train_loss": -6.916261196136475, "global_step": 173065, "epoch": 4120} {"train_loss": -6.915387153625488, "global_step": 173066, "epoch": 4120} {"train_loss": -6.98854923248291, "global_step": 173067, "epoch": 4120} {"train_loss": -7.007403373718262, "global_step": 173068, "epoch": 4120} {"train_loss": -6.915152072906494, "global_step": 173069, "epoch": 4120} {"train_loss": -7.074494361877441, "global_step": 173070, "epoch": 4120} {"train_loss": -7.007369041442871, "global_step": 173071, "epoch": 4120} {"train_loss": -7.035411834716797, "global_step": 173072, "epoch": 4120} {"train_loss": -6.998859405517578, "global_step": 173073, "epoch": 4120} {"train_loss": -7.037134170532227, "global_step": 173074, "epoch": 4120} {"train_loss": -7.059012413024902, "global_step": 173075, "epoch": 4120} {"train_loss": -7.079051971435547, "global_step": 173076, "epoch": 4120} {"train_loss": -7.064003944396973, "global_step": 173077, "epoch": 4120} {"train_loss": -7.1056952476501465, "global_step": 173078, "epoch": 4120} {"train_loss": -7.205133438110352, "global_step": 173079, "epoch": 4120} {"train_loss": -7.124404430389404, "global_step": 173080, "epoch": 4120} {"train_loss": -6.984612112953549, "global_step": 173081, "epoch": 4120, "val_loss": 68931.9140625} {"train_loss": -7.150280475616455, "global_step": 173082, "epoch": 4121} {"train_loss": -7.106389045715332, "global_step": 173083, "epoch": 4121} {"train_loss": -7.067109107971191, "global_step": 173084, "epoch": 4121} {"train_loss": -7.162858009338379, "global_step": 173085, "epoch": 4121} {"train_loss": -7.077347278594971, "global_step": 173086, "epoch": 4121} {"train_loss": -7.039697647094727, "global_step": 173087, "epoch": 4121} {"train_loss": -7.075748920440674, "global_step": 173088, "epoch": 4121} {"train_loss": -7.0307159423828125, "global_step": 173089, "epoch": 4121} {"train_loss": -7.155055999755859, "global_step": 173090, "epoch": 4121} {"train_loss": -7.09250545501709, "global_step": 173091, "epoch": 4121} {"train_loss": -7.052105903625488, "global_step": 173092, "epoch": 4121} {"train_loss": -7.051924705505371, "global_step": 173093, "epoch": 4121} {"train_loss": -7.130800247192383, "global_step": 173094, "epoch": 4121} {"train_loss": -7.192546367645264, "global_step": 173095, "epoch": 4121} {"train_loss": -7.119063854217529, "global_step": 173096, "epoch": 4121} {"train_loss": -7.039434432983398, "global_step": 173097, "epoch": 4121} {"train_loss": -7.136230945587158, "global_step": 173098, "epoch": 4121} {"train_loss": -6.896859169006348, "global_step": 173099, "epoch": 4121} {"train_loss": -7.047183036804199, "global_step": 173100, "epoch": 4121} {"train_loss": -7.0511698722839355, "global_step": 173101, "epoch": 4121} {"train_loss": -6.965691566467285, "global_step": 173102, "epoch": 4121} {"train_loss": -7.087417125701904, "global_step": 173103, "epoch": 4121} {"train_loss": -6.890027046203613, "global_step": 173104, "epoch": 4121} {"train_loss": -7.080394744873047, "global_step": 173105, "epoch": 4121} {"train_loss": -7.0764479637146, "global_step": 173106, "epoch": 4121} {"train_loss": -7.102513313293457, "global_step": 173107, "epoch": 4121} {"train_loss": -7.125833988189697, "global_step": 173108, "epoch": 4121} {"train_loss": -7.1525750160217285, "global_step": 173109, "epoch": 4121} {"train_loss": -7.0374040603637695, "global_step": 173110, "epoch": 4121} {"train_loss": -7.031939506530762, "global_step": 173111, "epoch": 4121} {"train_loss": -7.196623802185059, "global_step": 173112, "epoch": 4121} {"train_loss": -6.979406833648682, "global_step": 173113, "epoch": 4121} {"train_loss": -7.110719680786133, "global_step": 173114, "epoch": 4121} {"train_loss": -7.10749626159668, "global_step": 173115, "epoch": 4121} {"train_loss": -6.990272521972656, "global_step": 173116, "epoch": 4121} {"train_loss": -7.119231224060059, "global_step": 173117, "epoch": 4121} {"train_loss": -7.04276704788208, "global_step": 173118, "epoch": 4121} {"train_loss": -7.146923542022705, "global_step": 173119, "epoch": 4121} {"train_loss": -7.159873962402344, "global_step": 173120, "epoch": 4121} {"train_loss": -7.0671586990356445, "global_step": 173121, "epoch": 4121} {"train_loss": -7.159379482269287, "global_step": 173122, "epoch": 4121} {"train_loss": -7.082449742725918, "global_step": 173123, "epoch": 4121, "val_loss": 69089.6640625} {"train_loss": -7.099032402038574, "global_step": 173124, "epoch": 4122} {"train_loss": -7.171483039855957, "global_step": 173125, "epoch": 4122} {"train_loss": -7.171442031860352, "global_step": 173126, "epoch": 4122} {"train_loss": -7.119471549987793, "global_step": 173127, "epoch": 4122} {"train_loss": -7.203771591186523, "global_step": 173128, "epoch": 4122} {"train_loss": -7.120297431945801, "global_step": 173129, "epoch": 4122} {"train_loss": -6.9722089767456055, "global_step": 173130, "epoch": 4122} {"train_loss": -7.147877216339111, "global_step": 173131, "epoch": 4122} {"train_loss": -7.2478814125061035, "global_step": 173132, "epoch": 4122} {"train_loss": -7.0474371910095215, "global_step": 173133, "epoch": 4122} {"train_loss": -7.076168060302734, "global_step": 173134, "epoch": 4122} {"train_loss": -7.053906440734863, "global_step": 173135, "epoch": 4122} {"train_loss": -7.205192565917969, "global_step": 173136, "epoch": 4122} {"train_loss": -7.107913017272949, "global_step": 173137, "epoch": 4122} {"train_loss": -7.076992034912109, "global_step": 173138, "epoch": 4122} {"train_loss": -6.98006010055542, "global_step": 173139, "epoch": 4122} {"train_loss": -7.032266139984131, "global_step": 173140, "epoch": 4122} {"train_loss": -7.043599605560303, "global_step": 173141, "epoch": 4122} {"train_loss": -7.094526290893555, "global_step": 173142, "epoch": 4122} {"train_loss": -7.207284450531006, "global_step": 173143, "epoch": 4122} {"train_loss": -7.097295761108398, "global_step": 173144, "epoch": 4122} {"train_loss": -7.139407634735107, "global_step": 173145, "epoch": 4122} {"train_loss": -7.047432899475098, "global_step": 173146, "epoch": 4122} {"train_loss": -7.005460262298584, "global_step": 173147, "epoch": 4122} {"train_loss": -7.11686897277832, "global_step": 173148, "epoch": 4122} {"train_loss": -7.0987958908081055, "global_step": 173149, "epoch": 4122} {"train_loss": -7.176530361175537, "global_step": 173150, "epoch": 4122} {"train_loss": -7.062550067901611, "global_step": 173151, "epoch": 4122} {"train_loss": -7.17545747756958, "global_step": 173152, "epoch": 4122} {"train_loss": -7.051497459411621, "global_step": 173153, "epoch": 4122} {"train_loss": -7.093852519989014, "global_step": 173154, "epoch": 4122} {"train_loss": -7.084788799285889, "global_step": 173155, "epoch": 4122} {"train_loss": -6.976528644561768, "global_step": 173156, "epoch": 4122} {"train_loss": -7.2136149406433105, "global_step": 173157, "epoch": 4122} {"train_loss": -7.092290878295898, "global_step": 173158, "epoch": 4122} {"train_loss": -6.95999002456665, "global_step": 173159, "epoch": 4122} {"train_loss": -7.126921653747559, "global_step": 173160, "epoch": 4122} {"train_loss": -7.01462984085083, "global_step": 173161, "epoch": 4122} {"train_loss": -6.901914596557617, "global_step": 173162, "epoch": 4122} {"train_loss": -7.059453964233398, "global_step": 173163, "epoch": 4122} {"train_loss": -7.119728088378906, "global_step": 173164, "epoch": 4122} {"train_loss": -7.092489185787382, "global_step": 173165, "epoch": 4122, "val_loss": 69113.484375} {"train_loss": -6.973328590393066, "global_step": 173166, "epoch": 4123} {"train_loss": -7.094142913818359, "global_step": 173167, "epoch": 4123} {"train_loss": -7.079537391662598, "global_step": 173168, "epoch": 4123} {"train_loss": -7.217677116394043, "global_step": 173169, "epoch": 4123} {"train_loss": -7.061407089233398, "global_step": 173170, "epoch": 4123} {"train_loss": -7.115652561187744, "global_step": 173171, "epoch": 4123} {"train_loss": -7.108261585235596, "global_step": 173172, "epoch": 4123} {"train_loss": -7.095766544342041, "global_step": 173173, "epoch": 4123} {"train_loss": -6.973480224609375, "global_step": 173174, "epoch": 4123} {"train_loss": -7.0546135902404785, "global_step": 173175, "epoch": 4123} {"train_loss": -7.070981502532959, "global_step": 173176, "epoch": 4123} {"train_loss": -6.966883182525635, "global_step": 173177, "epoch": 4123} {"train_loss": -7.065011978149414, "global_step": 173178, "epoch": 4123} {"train_loss": -6.9287896156311035, "global_step": 173179, "epoch": 4123} {"train_loss": -6.960934638977051, "global_step": 173180, "epoch": 4123} {"train_loss": -7.052605628967285, "global_step": 173181, "epoch": 4123} {"train_loss": -7.079958915710449, "global_step": 173182, "epoch": 4123} {"train_loss": -7.013443946838379, "global_step": 173183, "epoch": 4123} {"train_loss": -7.122842788696289, "global_step": 173184, "epoch": 4123} {"train_loss": -6.945073127746582, "global_step": 173185, "epoch": 4123} {"train_loss": -7.0774736404418945, "global_step": 173186, "epoch": 4123} {"train_loss": -6.9553422927856445, "global_step": 173187, "epoch": 4123} {"train_loss": -7.00281286239624, "global_step": 173188, "epoch": 4123} {"train_loss": -7.067492485046387, "global_step": 173189, "epoch": 4123} {"train_loss": -7.068055152893066, "global_step": 173190, "epoch": 4123} {"train_loss": -7.035285472869873, "global_step": 173191, "epoch": 4123} {"train_loss": -7.007969856262207, "global_step": 173192, "epoch": 4123} {"train_loss": -6.985276222229004, "global_step": 173193, "epoch": 4123} {"train_loss": -7.029139518737793, "global_step": 173194, "epoch": 4123} {"train_loss": -7.089975357055664, "global_step": 173195, "epoch": 4123} {"train_loss": -6.980647563934326, "global_step": 173196, "epoch": 4123} {"train_loss": -6.9278669357299805, "global_step": 173197, "epoch": 4123} {"train_loss": -6.956229209899902, "global_step": 173198, "epoch": 4123} {"train_loss": -7.045263767242432, "global_step": 173199, "epoch": 4123} {"train_loss": -7.028494358062744, "global_step": 173200, "epoch": 4123} {"train_loss": -6.888930797576904, "global_step": 173201, "epoch": 4123} {"train_loss": -7.078846454620361, "global_step": 173202, "epoch": 4123} {"train_loss": -7.141051292419434, "global_step": 173203, "epoch": 4123} {"train_loss": -7.009141445159912, "global_step": 173204, "epoch": 4123} {"train_loss": -7.004312515258789, "global_step": 173205, "epoch": 4123} {"train_loss": -6.994283199310303, "global_step": 173206, "epoch": 4123} {"train_loss": -7.033785581588745, "global_step": 173207, "epoch": 4123, "val_loss": 68951.515625} {"train_loss": -7.051645278930664, "global_step": 173208, "epoch": 4124} {"train_loss": -7.079071521759033, "global_step": 173209, "epoch": 4124} {"train_loss": -7.060451030731201, "global_step": 173210, "epoch": 4124} {"train_loss": -7.12632417678833, "global_step": 173211, "epoch": 4124} {"train_loss": -6.99440860748291, "global_step": 173212, "epoch": 4124} {"train_loss": -7.1206536293029785, "global_step": 173213, "epoch": 4124} {"train_loss": -7.075303077697754, "global_step": 173214, "epoch": 4124} {"train_loss": -7.0328826904296875, "global_step": 173215, "epoch": 4124} {"train_loss": -7.119680404663086, "global_step": 173216, "epoch": 4124} {"train_loss": -7.14698600769043, "global_step": 173217, "epoch": 4124} {"train_loss": -7.052777290344238, "global_step": 173218, "epoch": 4124} {"train_loss": -7.074644088745117, "global_step": 173219, "epoch": 4124} {"train_loss": -7.038403511047363, "global_step": 173220, "epoch": 4124} {"train_loss": -6.913021087646484, "global_step": 173221, "epoch": 4124} {"train_loss": -7.139176368713379, "global_step": 173222, "epoch": 4124} {"train_loss": -6.975290298461914, "global_step": 173223, "epoch": 4124} {"train_loss": -6.933780670166016, "global_step": 173224, "epoch": 4124} {"train_loss": -7.1005401611328125, "global_step": 173225, "epoch": 4124} {"train_loss": -7.072739601135254, "global_step": 173226, "epoch": 4124} {"train_loss": -6.879045486450195, "global_step": 173227, "epoch": 4124} {"train_loss": -7.085684776306152, "global_step": 173228, "epoch": 4124} {"train_loss": -7.067556381225586, "global_step": 173229, "epoch": 4124} {"train_loss": -7.034838676452637, "global_step": 173230, "epoch": 4124} {"train_loss": -6.8580641746521, "global_step": 173231, "epoch": 4124} {"train_loss": -6.902324199676514, "global_step": 173232, "epoch": 4124} {"train_loss": -7.099662780761719, "global_step": 173233, "epoch": 4124} {"train_loss": -6.987619400024414, "global_step": 173234, "epoch": 4124} {"train_loss": -6.878264427185059, "global_step": 173235, "epoch": 4124} {"train_loss": -7.082923889160156, "global_step": 173236, "epoch": 4124} {"train_loss": -7.008823394775391, "global_step": 173237, "epoch": 4124} {"train_loss": -7.017848491668701, "global_step": 173238, "epoch": 4124} {"train_loss": -7.023985862731934, "global_step": 173239, "epoch": 4124} {"train_loss": -6.963176727294922, "global_step": 173240, "epoch": 4124} {"train_loss": -6.987278461456299, "global_step": 173241, "epoch": 4124} {"train_loss": -6.833242416381836, "global_step": 173242, "epoch": 4124} {"train_loss": -6.849411964416504, "global_step": 173243, "epoch": 4124} {"train_loss": -7.00100564956665, "global_step": 173244, "epoch": 4124} {"train_loss": -6.668639659881592, "global_step": 173245, "epoch": 4124} {"train_loss": -6.783169746398926, "global_step": 173246, "epoch": 4124} {"train_loss": -6.708729267120361, "global_step": 173247, "epoch": 4124} {"train_loss": -6.862641334533691, "global_step": 173248, "epoch": 4124} {"train_loss": -6.988887275968279, "global_step": 173249, "epoch": 4124, "val_loss": 69307.4921875} {"train_loss": -6.841048240661621, "global_step": 173250, "epoch": 4125} {"train_loss": -6.758975028991699, "global_step": 173251, "epoch": 4125} {"train_loss": -6.8829731941223145, "global_step": 173252, "epoch": 4125} {"train_loss": -6.960304260253906, "global_step": 173253, "epoch": 4125} {"train_loss": -6.927820205688477, "global_step": 173254, "epoch": 4125} {"train_loss": -6.810323715209961, "global_step": 173255, "epoch": 4125} {"train_loss": -6.913197040557861, "global_step": 173256, "epoch": 4125} {"train_loss": -6.837218761444092, "global_step": 173257, "epoch": 4125} {"train_loss": -6.9645795822143555, "global_step": 173258, "epoch": 4125} {"train_loss": -6.858695030212402, "global_step": 173259, "epoch": 4125} {"train_loss": -7.0156378746032715, "global_step": 173260, "epoch": 4125} {"train_loss": -6.8573198318481445, "global_step": 173261, "epoch": 4125} {"train_loss": -6.9207539558410645, "global_step": 173262, "epoch": 4125} {"train_loss": -6.973217964172363, "global_step": 173263, "epoch": 4125} {"train_loss": -6.947432518005371, "global_step": 173264, "epoch": 4125} {"train_loss": -6.924050331115723, "global_step": 173265, "epoch": 4125} {"train_loss": -6.996118545532227, "global_step": 173266, "epoch": 4125} {"train_loss": -7.070171356201172, "global_step": 173267, "epoch": 4125} {"train_loss": -7.02419376373291, "global_step": 173268, "epoch": 4125} {"train_loss": -6.988061904907227, "global_step": 173269, "epoch": 4125} {"train_loss": -7.005605220794678, "global_step": 173270, "epoch": 4125} {"train_loss": -6.931666374206543, "global_step": 173271, "epoch": 4125} {"train_loss": -6.985716819763184, "global_step": 173272, "epoch": 4125} {"train_loss": -6.972784042358398, "global_step": 173273, "epoch": 4125} {"train_loss": -7.022824764251709, "global_step": 173274, "epoch": 4125} {"train_loss": -7.075483798980713, "global_step": 173275, "epoch": 4125} {"train_loss": -6.865545749664307, "global_step": 173276, "epoch": 4125} {"train_loss": -7.10681676864624, "global_step": 173277, "epoch": 4125} {"train_loss": -7.075287342071533, "global_step": 173278, "epoch": 4125} {"train_loss": -6.9603166580200195, "global_step": 173279, "epoch": 4125} {"train_loss": -6.946802616119385, "global_step": 173280, "epoch": 4125} {"train_loss": -7.021208763122559, "global_step": 173281, "epoch": 4125} {"train_loss": -6.97210693359375, "global_step": 173282, "epoch": 4125} {"train_loss": -6.914065361022949, "global_step": 173283, "epoch": 4125} {"train_loss": -7.112857818603516, "global_step": 173284, "epoch": 4125} {"train_loss": -6.818811893463135, "global_step": 173285, "epoch": 4125} {"train_loss": -6.938232421875, "global_step": 173286, "epoch": 4125} {"train_loss": -6.8884477615356445, "global_step": 173287, "epoch": 4125} {"train_loss": -7.001662254333496, "global_step": 173288, "epoch": 4125} {"train_loss": -7.094804286956787, "global_step": 173289, "epoch": 4125} {"train_loss": -6.9223432540893555, "global_step": 173290, "epoch": 4125} {"train_loss": -6.9573557149796255, "global_step": 173291, "epoch": 4125, "val_loss": 69080.4609375} {"train_loss": -6.944526672363281, "global_step": 173292, "epoch": 4126} {"train_loss": -7.053741455078125, "global_step": 173293, "epoch": 4126} {"train_loss": -7.183855056762695, "global_step": 173294, "epoch": 4126} {"train_loss": -7.144108295440674, "global_step": 173295, "epoch": 4126} {"train_loss": -7.166784286499023, "global_step": 173296, "epoch": 4126} {"train_loss": -7.106784820556641, "global_step": 173297, "epoch": 4126} {"train_loss": -7.152490615844727, "global_step": 173298, "epoch": 4126} {"train_loss": -7.115534782409668, "global_step": 173299, "epoch": 4126} {"train_loss": -7.016761779785156, "global_step": 173300, "epoch": 4126} {"train_loss": -7.142263412475586, "global_step": 173301, "epoch": 4126} {"train_loss": -7.147047996520996, "global_step": 173302, "epoch": 4126} {"train_loss": -7.187321662902832, "global_step": 173303, "epoch": 4126} {"train_loss": -7.052489280700684, "global_step": 173304, "epoch": 4126} {"train_loss": -7.103367805480957, "global_step": 173305, "epoch": 4126} {"train_loss": -7.0732421875, "global_step": 173306, "epoch": 4126} {"train_loss": -7.168453216552734, "global_step": 173307, "epoch": 4126} {"train_loss": -7.054324150085449, "global_step": 173308, "epoch": 4126} {"train_loss": -7.152489185333252, "global_step": 173309, "epoch": 4126} {"train_loss": -7.168697357177734, "global_step": 173310, "epoch": 4126} {"train_loss": -7.075941562652588, "global_step": 173311, "epoch": 4126} {"train_loss": -7.072503089904785, "global_step": 173312, "epoch": 4126} {"train_loss": -7.006553649902344, "global_step": 173313, "epoch": 4126} {"train_loss": -7.114354133605957, "global_step": 173314, "epoch": 4126} {"train_loss": -7.057754993438721, "global_step": 173315, "epoch": 4126} {"train_loss": -7.034004211425781, "global_step": 173316, "epoch": 4126} {"train_loss": -7.047170162200928, "global_step": 173317, "epoch": 4126} {"train_loss": -7.087255477905273, "global_step": 173318, "epoch": 4126} {"train_loss": -7.098240852355957, "global_step": 173319, "epoch": 4126} {"train_loss": -7.022931098937988, "global_step": 173320, "epoch": 4126} {"train_loss": -7.1350626945495605, "global_step": 173321, "epoch": 4126} {"train_loss": -7.1337175369262695, "global_step": 173322, "epoch": 4126} {"train_loss": -7.103102684020996, "global_step": 173323, "epoch": 4126} {"train_loss": -7.126721382141113, "global_step": 173324, "epoch": 4126} {"train_loss": -6.97202205657959, "global_step": 173325, "epoch": 4126} {"train_loss": -7.124217510223389, "global_step": 173326, "epoch": 4126} {"train_loss": -6.986557483673096, "global_step": 173327, "epoch": 4126} {"train_loss": -6.913247585296631, "global_step": 173328, "epoch": 4126} {"train_loss": -7.140447616577148, "global_step": 173329, "epoch": 4126} {"train_loss": -6.940934181213379, "global_step": 173330, "epoch": 4126} {"train_loss": -6.919195175170898, "global_step": 173331, "epoch": 4126} {"train_loss": -7.0160393714904785, "global_step": 173332, "epoch": 4126} {"train_loss": -7.075390758968535, "global_step": 173333, "epoch": 4126, "val_loss": 69144.0390625} {"train_loss": -7.11809778213501, "global_step": 173334, "epoch": 4127} {"train_loss": -7.088761329650879, "global_step": 173335, "epoch": 4127} {"train_loss": -7.140718936920166, "global_step": 173336, "epoch": 4127} {"train_loss": -7.008091926574707, "global_step": 173337, "epoch": 4127} {"train_loss": -7.07930850982666, "global_step": 173338, "epoch": 4127} {"train_loss": -7.092679977416992, "global_step": 173339, "epoch": 4127} {"train_loss": -6.957710266113281, "global_step": 173340, "epoch": 4127} {"train_loss": -7.009634017944336, "global_step": 173341, "epoch": 4127} {"train_loss": -7.086777210235596, "global_step": 173342, "epoch": 4127} {"train_loss": -6.951850891113281, "global_step": 173343, "epoch": 4127} {"train_loss": -7.019700050354004, "global_step": 173344, "epoch": 4127} {"train_loss": -7.123614311218262, "global_step": 173345, "epoch": 4127} {"train_loss": -7.055281639099121, "global_step": 173346, "epoch": 4127} {"train_loss": -7.158923149108887, "global_step": 173347, "epoch": 4127} {"train_loss": -7.033699035644531, "global_step": 173348, "epoch": 4127} {"train_loss": -7.073348522186279, "global_step": 173349, "epoch": 4127} {"train_loss": -7.050978660583496, "global_step": 173350, "epoch": 4127} {"train_loss": -7.0472211837768555, "global_step": 173351, "epoch": 4127} {"train_loss": -7.13472318649292, "global_step": 173352, "epoch": 4127} {"train_loss": -7.126906394958496, "global_step": 173353, "epoch": 4127} {"train_loss": -7.065369606018066, "global_step": 173354, "epoch": 4127} {"train_loss": -7.168241500854492, "global_step": 173355, "epoch": 4127} {"train_loss": -7.098079681396484, "global_step": 173356, "epoch": 4127} {"train_loss": -7.2277631759643555, "global_step": 173357, "epoch": 4127} {"train_loss": -7.18450927734375, "global_step": 173358, "epoch": 4127} {"train_loss": -7.0419535636901855, "global_step": 173359, "epoch": 4127} {"train_loss": -6.92128849029541, "global_step": 173360, "epoch": 4127} {"train_loss": -7.027402400970459, "global_step": 173361, "epoch": 4127} {"train_loss": -6.939700126647949, "global_step": 173362, "epoch": 4127} {"train_loss": -7.027681350708008, "global_step": 173363, "epoch": 4127} {"train_loss": -7.114601135253906, "global_step": 173364, "epoch": 4127} {"train_loss": -6.909057140350342, "global_step": 173365, "epoch": 4127} {"train_loss": -7.0783257484436035, "global_step": 173366, "epoch": 4127} {"train_loss": -6.935183525085449, "global_step": 173367, "epoch": 4127} {"train_loss": -6.9859819412231445, "global_step": 173368, "epoch": 4127} {"train_loss": -7.066941261291504, "global_step": 173369, "epoch": 4127} {"train_loss": -7.030421257019043, "global_step": 173370, "epoch": 4127} {"train_loss": -7.028613090515137, "global_step": 173371, "epoch": 4127} {"train_loss": -6.991382598876953, "global_step": 173372, "epoch": 4127} {"train_loss": -7.042239189147949, "global_step": 173373, "epoch": 4127} {"train_loss": -7.123755931854248, "global_step": 173374, "epoch": 4127} {"train_loss": -7.0574402922675725, "global_step": 173375, "epoch": 4127, "val_loss": 68986.890625} {"train_loss": -7.215271949768066, "global_step": 173376, "epoch": 4128} {"train_loss": -7.017120838165283, "global_step": 173377, "epoch": 4128} {"train_loss": -7.141929626464844, "global_step": 173378, "epoch": 4128} {"train_loss": -7.229704856872559, "global_step": 173379, "epoch": 4128} {"train_loss": -7.061732292175293, "global_step": 173380, "epoch": 4128} {"train_loss": -7.086370468139648, "global_step": 173381, "epoch": 4128} {"train_loss": -7.0457329750061035, "global_step": 173382, "epoch": 4128} {"train_loss": -7.06020450592041, "global_step": 173383, "epoch": 4128} {"train_loss": -7.132877826690674, "global_step": 173384, "epoch": 4128} {"train_loss": -7.007098197937012, "global_step": 173385, "epoch": 4128} {"train_loss": -7.07005500793457, "global_step": 173386, "epoch": 4128} {"train_loss": -7.111149787902832, "global_step": 173387, "epoch": 4128} {"train_loss": -7.067071914672852, "global_step": 173388, "epoch": 4128} {"train_loss": -7.059384346008301, "global_step": 173389, "epoch": 4128} {"train_loss": -7.109841346740723, "global_step": 173390, "epoch": 4128} {"train_loss": -7.128866195678711, "global_step": 173391, "epoch": 4128} {"train_loss": -7.116732597351074, "global_step": 173392, "epoch": 4128} {"train_loss": -7.085965156555176, "global_step": 173393, "epoch": 4128} {"train_loss": -7.03440523147583, "global_step": 173394, "epoch": 4128} {"train_loss": -7.22728967666626, "global_step": 173395, "epoch": 4128} {"train_loss": -6.924152374267578, "global_step": 173396, "epoch": 4128} {"train_loss": -7.042489051818848, "global_step": 173397, "epoch": 4128} {"train_loss": -7.06195068359375, "global_step": 173398, "epoch": 4128} {"train_loss": -7.049985885620117, "global_step": 173399, "epoch": 4128} {"train_loss": -6.9395036697387695, "global_step": 173400, "epoch": 4128} {"train_loss": -7.085598468780518, "global_step": 173401, "epoch": 4128} {"train_loss": -7.12265682220459, "global_step": 173402, "epoch": 4128} {"train_loss": -7.016887664794922, "global_step": 173403, "epoch": 4128} {"train_loss": -7.088078498840332, "global_step": 173404, "epoch": 4128} {"train_loss": -7.0473127365112305, "global_step": 173405, "epoch": 4128} {"train_loss": -7.049983024597168, "global_step": 173406, "epoch": 4128} {"train_loss": -7.095367908477783, "global_step": 173407, "epoch": 4128} {"train_loss": -7.192962646484375, "global_step": 173408, "epoch": 4128} {"train_loss": -6.964513301849365, "global_step": 173409, "epoch": 4128} {"train_loss": -6.981982231140137, "global_step": 173410, "epoch": 4128} {"train_loss": -7.079942226409912, "global_step": 173411, "epoch": 4128} {"train_loss": -7.029983997344971, "global_step": 173412, "epoch": 4128} {"train_loss": -7.11297607421875, "global_step": 173413, "epoch": 4128} {"train_loss": -7.157304763793945, "global_step": 173414, "epoch": 4128} {"train_loss": -7.046803951263428, "global_step": 173415, "epoch": 4128} {"train_loss": -6.973729610443115, "global_step": 173416, "epoch": 4128} {"train_loss": -7.073848213468279, "global_step": 173417, "epoch": 4128, "val_loss": 69254.71875} {"train_loss": -6.934520721435547, "global_step": 173418, "epoch": 4129} {"train_loss": -6.842567443847656, "global_step": 173419, "epoch": 4129} {"train_loss": -7.022389888763428, "global_step": 173420, "epoch": 4129} {"train_loss": -7.07720947265625, "global_step": 173421, "epoch": 4129} {"train_loss": -6.962831974029541, "global_step": 173422, "epoch": 4129} {"train_loss": -6.879518985748291, "global_step": 173423, "epoch": 4129} {"train_loss": -6.886194229125977, "global_step": 173424, "epoch": 4129} {"train_loss": -6.958004951477051, "global_step": 173425, "epoch": 4129} {"train_loss": -6.818782806396484, "global_step": 173426, "epoch": 4129} {"train_loss": -7.024388313293457, "global_step": 173427, "epoch": 4129} {"train_loss": -6.992477893829346, "global_step": 173428, "epoch": 4129} {"train_loss": -6.833156108856201, "global_step": 173429, "epoch": 4129} {"train_loss": -6.848590850830078, "global_step": 173430, "epoch": 4129} {"train_loss": -6.906970024108887, "global_step": 173431, "epoch": 4129} {"train_loss": -7.09052848815918, "global_step": 173432, "epoch": 4129} {"train_loss": -6.901959419250488, "global_step": 173433, "epoch": 4129} {"train_loss": -6.983294486999512, "global_step": 173434, "epoch": 4129} {"train_loss": -7.008645057678223, "global_step": 173435, "epoch": 4129} {"train_loss": -6.98348331451416, "global_step": 173436, "epoch": 4129} {"train_loss": -6.893247604370117, "global_step": 173437, "epoch": 4129} {"train_loss": -7.077852249145508, "global_step": 173438, "epoch": 4129} {"train_loss": -6.851041793823242, "global_step": 173439, "epoch": 4129} {"train_loss": -6.981000900268555, "global_step": 173440, "epoch": 4129} {"train_loss": -6.959062576293945, "global_step": 173441, "epoch": 4129} {"train_loss": -7.027618408203125, "global_step": 173442, "epoch": 4129} {"train_loss": -6.989869117736816, "global_step": 173443, "epoch": 4129} {"train_loss": -6.949243545532227, "global_step": 173444, "epoch": 4129} {"train_loss": -6.871894359588623, "global_step": 173445, "epoch": 4129} {"train_loss": -6.9700422286987305, "global_step": 173446, "epoch": 4129} {"train_loss": -6.984867095947266, "global_step": 173447, "epoch": 4129} {"train_loss": -6.971735000610352, "global_step": 173448, "epoch": 4129} {"train_loss": -7.028605937957764, "global_step": 173449, "epoch": 4129} {"train_loss": -7.049666404724121, "global_step": 173450, "epoch": 4129} {"train_loss": -7.015781402587891, "global_step": 173451, "epoch": 4129} {"train_loss": -7.109138011932373, "global_step": 173452, "epoch": 4129} {"train_loss": -6.922771453857422, "global_step": 173453, "epoch": 4129} {"train_loss": -7.10703182220459, "global_step": 173454, "epoch": 4129} {"train_loss": -7.0387187004089355, "global_step": 173455, "epoch": 4129} {"train_loss": -6.982569694519043, "global_step": 173456, "epoch": 4129} {"train_loss": -7.11152458190918, "global_step": 173457, "epoch": 4129} {"train_loss": -7.091607570648193, "global_step": 173458, "epoch": 4129} {"train_loss": -6.977374723979405, "global_step": 173459, "epoch": 4129, "val_loss": 69146.3515625} {"train_loss": -7.016332626342773, "global_step": 173460, "epoch": 4130} {"train_loss": -7.036487579345703, "global_step": 173461, "epoch": 4130} {"train_loss": -6.908648490905762, "global_step": 173462, "epoch": 4130} {"train_loss": -7.061031341552734, "global_step": 173463, "epoch": 4130} {"train_loss": -7.140410423278809, "global_step": 173464, "epoch": 4130} {"train_loss": -7.115748882293701, "global_step": 173465, "epoch": 4130} {"train_loss": -7.077770233154297, "global_step": 173466, "epoch": 4130} {"train_loss": -7.144896507263184, "global_step": 173467, "epoch": 4130} {"train_loss": -7.120955467224121, "global_step": 173468, "epoch": 4130} {"train_loss": -7.123708724975586, "global_step": 173469, "epoch": 4130} {"train_loss": -7.1312456130981445, "global_step": 173470, "epoch": 4130} {"train_loss": -7.092947959899902, "global_step": 173471, "epoch": 4130} {"train_loss": -7.122075080871582, "global_step": 173472, "epoch": 4130} {"train_loss": -7.0615129470825195, "global_step": 173473, "epoch": 4130} {"train_loss": -7.1022419929504395, "global_step": 173474, "epoch": 4130} {"train_loss": -7.120115280151367, "global_step": 173475, "epoch": 4130} {"train_loss": -7.053277015686035, "global_step": 173476, "epoch": 4130} {"train_loss": -7.13151216506958, "global_step": 173477, "epoch": 4130} {"train_loss": -6.962003707885742, "global_step": 173478, "epoch": 4130} {"train_loss": -7.0916595458984375, "global_step": 173479, "epoch": 4130} {"train_loss": -7.1611833572387695, "global_step": 173480, "epoch": 4130} {"train_loss": -7.030287265777588, "global_step": 173481, "epoch": 4130} {"train_loss": -7.043802261352539, "global_step": 173482, "epoch": 4130} {"train_loss": -6.964912414550781, "global_step": 173483, "epoch": 4130} {"train_loss": -7.061387062072754, "global_step": 173484, "epoch": 4130} {"train_loss": -7.037444591522217, "global_step": 173485, "epoch": 4130} {"train_loss": -7.04537296295166, "global_step": 173486, "epoch": 4130} {"train_loss": -7.061201095581055, "global_step": 173487, "epoch": 4130} {"train_loss": -7.003582000732422, "global_step": 173488, "epoch": 4130} {"train_loss": -7.096867561340332, "global_step": 173489, "epoch": 4130} {"train_loss": -7.111192226409912, "global_step": 173490, "epoch": 4130} {"train_loss": -7.073609828948975, "global_step": 173491, "epoch": 4130} {"train_loss": -7.05424165725708, "global_step": 173492, "epoch": 4130} {"train_loss": -7.047984600067139, "global_step": 173493, "epoch": 4130} {"train_loss": -7.1532206535339355, "global_step": 173494, "epoch": 4130} {"train_loss": -6.984928131103516, "global_step": 173495, "epoch": 4130} {"train_loss": -7.090625762939453, "global_step": 173496, "epoch": 4130} {"train_loss": -6.979494571685791, "global_step": 173497, "epoch": 4130} {"train_loss": -7.110283374786377, "global_step": 173498, "epoch": 4130} {"train_loss": -6.868875503540039, "global_step": 173499, "epoch": 4130} {"train_loss": -7.063482284545898, "global_step": 173500, "epoch": 4130} {"train_loss": -7.062546514329457, "global_step": 173501, "epoch": 4130, "val_loss": 69369.5703125} {"train_loss": -7.0554046630859375, "global_step": 173502, "epoch": 4131} {"train_loss": -6.968284606933594, "global_step": 173503, "epoch": 4131} {"train_loss": -6.778684616088867, "global_step": 173504, "epoch": 4131} {"train_loss": -6.8530683517456055, "global_step": 173505, "epoch": 4131} {"train_loss": -7.056879043579102, "global_step": 173506, "epoch": 4131} {"train_loss": -6.829153060913086, "global_step": 173507, "epoch": 4131} {"train_loss": -6.9591193199157715, "global_step": 173508, "epoch": 4131} {"train_loss": -6.877844333648682, "global_step": 173509, "epoch": 4131} {"train_loss": -7.082970142364502, "global_step": 173510, "epoch": 4131} {"train_loss": -6.94844913482666, "global_step": 173511, "epoch": 4131} {"train_loss": -6.8752946853637695, "global_step": 173512, "epoch": 4131} {"train_loss": -6.800426483154297, "global_step": 173513, "epoch": 4131} {"train_loss": -6.9827117919921875, "global_step": 173514, "epoch": 4131} {"train_loss": -6.939798355102539, "global_step": 173515, "epoch": 4131} {"train_loss": -6.928947448730469, "global_step": 173516, "epoch": 4131} {"train_loss": -6.997367858886719, "global_step": 173517, "epoch": 4131} {"train_loss": -7.0288496017456055, "global_step": 173518, "epoch": 4131} {"train_loss": -6.960646152496338, "global_step": 173519, "epoch": 4131} {"train_loss": -7.0438995361328125, "global_step": 173520, "epoch": 4131} {"train_loss": -7.037994384765625, "global_step": 173521, "epoch": 4131} {"train_loss": -6.850630283355713, "global_step": 173522, "epoch": 4131} {"train_loss": -6.924581527709961, "global_step": 173523, "epoch": 4131} {"train_loss": -6.832436561584473, "global_step": 173524, "epoch": 4131} {"train_loss": -6.908143520355225, "global_step": 173525, "epoch": 4131} {"train_loss": -6.979287147521973, "global_step": 173526, "epoch": 4131} {"train_loss": -7.100317001342773, "global_step": 173527, "epoch": 4131} {"train_loss": -7.016663551330566, "global_step": 173528, "epoch": 4131} {"train_loss": -6.9291486740112305, "global_step": 173529, "epoch": 4131} {"train_loss": -7.151325702667236, "global_step": 173530, "epoch": 4131} {"train_loss": -6.833693027496338, "global_step": 173531, "epoch": 4131} {"train_loss": -7.071907997131348, "global_step": 173532, "epoch": 4131} {"train_loss": -7.122243404388428, "global_step": 173533, "epoch": 4131} {"train_loss": -7.050077438354492, "global_step": 173534, "epoch": 4131} {"train_loss": -7.078862190246582, "global_step": 173535, "epoch": 4131} {"train_loss": -7.086099624633789, "global_step": 173536, "epoch": 4131} {"train_loss": -7.052781105041504, "global_step": 173537, "epoch": 4131} {"train_loss": -7.065958023071289, "global_step": 173538, "epoch": 4131} {"train_loss": -6.894854545593262, "global_step": 173539, "epoch": 4131} {"train_loss": -7.135267734527588, "global_step": 173540, "epoch": 4131} {"train_loss": -7.0001630783081055, "global_step": 173541, "epoch": 4131} {"train_loss": -7.043498992919922, "global_step": 173542, "epoch": 4131} {"train_loss": -6.981814032509213, "global_step": 173543, "epoch": 4131, "val_loss": 68929.109375} {"train_loss": -7.0921220779418945, "global_step": 173544, "epoch": 4132} {"train_loss": -7.225356578826904, "global_step": 173545, "epoch": 4132} {"train_loss": -7.0094757080078125, "global_step": 173546, "epoch": 4132} {"train_loss": -7.209734916687012, "global_step": 173547, "epoch": 4132} {"train_loss": -7.210696697235107, "global_step": 173548, "epoch": 4132} {"train_loss": -6.973770618438721, "global_step": 173549, "epoch": 4132} {"train_loss": -7.117525577545166, "global_step": 173550, "epoch": 4132} {"train_loss": -7.060478210449219, "global_step": 173551, "epoch": 4132} {"train_loss": -6.995209217071533, "global_step": 173552, "epoch": 4132} {"train_loss": -7.022782325744629, "global_step": 173553, "epoch": 4132} {"train_loss": -7.01534366607666, "global_step": 173554, "epoch": 4132} {"train_loss": -6.998384952545166, "global_step": 173555, "epoch": 4132} {"train_loss": -7.058125019073486, "global_step": 173556, "epoch": 4132} {"train_loss": -7.131916046142578, "global_step": 173557, "epoch": 4132} {"train_loss": -7.077363967895508, "global_step": 173558, "epoch": 4132} {"train_loss": -7.104178428649902, "global_step": 173559, "epoch": 4132} {"train_loss": -7.142789363861084, "global_step": 173560, "epoch": 4132} {"train_loss": -7.110093116760254, "global_step": 173561, "epoch": 4132} {"train_loss": -7.112611770629883, "global_step": 173562, "epoch": 4132} {"train_loss": -7.052273750305176, "global_step": 173563, "epoch": 4132} {"train_loss": -7.149272441864014, "global_step": 173564, "epoch": 4132} {"train_loss": -7.1736626625061035, "global_step": 173565, "epoch": 4132} {"train_loss": -7.174836158752441, "global_step": 173566, "epoch": 4132} {"train_loss": -7.142576217651367, "global_step": 173567, "epoch": 4132} {"train_loss": -7.150889873504639, "global_step": 173568, "epoch": 4132} {"train_loss": -7.111569881439209, "global_step": 173569, "epoch": 4132} {"train_loss": -7.111579418182373, "global_step": 173570, "epoch": 4132} {"train_loss": -7.114253997802734, "global_step": 173571, "epoch": 4132} {"train_loss": -6.986170768737793, "global_step": 173572, "epoch": 4132} {"train_loss": -7.11426305770874, "global_step": 173573, "epoch": 4132} {"train_loss": -7.073941230773926, "global_step": 173574, "epoch": 4132} {"train_loss": -7.088354110717773, "global_step": 173575, "epoch": 4132} {"train_loss": -6.851511001586914, "global_step": 173576, "epoch": 4132} {"train_loss": -7.094531059265137, "global_step": 173577, "epoch": 4132} {"train_loss": -6.946414947509766, "global_step": 173578, "epoch": 4132} {"train_loss": -6.947229385375977, "global_step": 173579, "epoch": 4132} {"train_loss": -6.945576190948486, "global_step": 173580, "epoch": 4132} {"train_loss": -6.828521728515625, "global_step": 173581, "epoch": 4132} {"train_loss": -6.960139274597168, "global_step": 173582, "epoch": 4132} {"train_loss": -7.032808303833008, "global_step": 173583, "epoch": 4132} {"train_loss": -6.8221588134765625, "global_step": 173584, "epoch": 4132} {"train_loss": -7.061778170721872, "global_step": 173585, "epoch": 4132, "val_loss": 68908.109375} {"train_loss": -7.056979179382324, "global_step": 173586, "epoch": 4133} {"train_loss": -6.972768306732178, "global_step": 173587, "epoch": 4133} {"train_loss": -7.0479841232299805, "global_step": 173588, "epoch": 4133} {"train_loss": -7.0601606369018555, "global_step": 173589, "epoch": 4133} {"train_loss": -6.867938041687012, "global_step": 173590, "epoch": 4133} {"train_loss": -7.015926361083984, "global_step": 173591, "epoch": 4133} {"train_loss": -6.982080459594727, "global_step": 173592, "epoch": 4133} {"train_loss": -6.907553672790527, "global_step": 173593, "epoch": 4133} {"train_loss": -7.035048484802246, "global_step": 173594, "epoch": 4133} {"train_loss": -7.180867671966553, "global_step": 173595, "epoch": 4133} {"train_loss": -6.986559867858887, "global_step": 173596, "epoch": 4133} {"train_loss": -6.970603942871094, "global_step": 173597, "epoch": 4133} {"train_loss": -7.031578063964844, "global_step": 173598, "epoch": 4133} {"train_loss": -6.896007537841797, "global_step": 173599, "epoch": 4133} {"train_loss": -6.92778205871582, "global_step": 173600, "epoch": 4133} {"train_loss": -7.012101650238037, "global_step": 173601, "epoch": 4133} {"train_loss": -6.941169738769531, "global_step": 173602, "epoch": 4133} {"train_loss": -7.043783664703369, "global_step": 173603, "epoch": 4133} {"train_loss": -6.962038040161133, "global_step": 173604, "epoch": 4133} {"train_loss": -7.06404972076416, "global_step": 173605, "epoch": 4133} {"train_loss": -6.975930690765381, "global_step": 173606, "epoch": 4133} {"train_loss": -7.052348613739014, "global_step": 173607, "epoch": 4133} {"train_loss": -7.059438705444336, "global_step": 173608, "epoch": 4133} {"train_loss": -7.037014961242676, "global_step": 173609, "epoch": 4133} {"train_loss": -7.01548957824707, "global_step": 173610, "epoch": 4133} {"train_loss": -7.050369739532471, "global_step": 173611, "epoch": 4133} {"train_loss": -7.1114702224731445, "global_step": 173612, "epoch": 4133} {"train_loss": -6.924651145935059, "global_step": 173613, "epoch": 4133} {"train_loss": -7.016041278839111, "global_step": 173614, "epoch": 4133} {"train_loss": -6.8880486488342285, "global_step": 173615, "epoch": 4133} {"train_loss": -6.981403350830078, "global_step": 173616, "epoch": 4133} {"train_loss": -7.07135009765625, "global_step": 173617, "epoch": 4133} {"train_loss": -6.905534744262695, "global_step": 173618, "epoch": 4133} {"train_loss": -7.028365612030029, "global_step": 173619, "epoch": 4133} {"train_loss": -7.12104606628418, "global_step": 173620, "epoch": 4133} {"train_loss": -7.056951999664307, "global_step": 173621, "epoch": 4133} {"train_loss": -6.991830825805664, "global_step": 173622, "epoch": 4133} {"train_loss": -7.069921970367432, "global_step": 173623, "epoch": 4133} {"train_loss": -7.1467390060424805, "global_step": 173624, "epoch": 4133} {"train_loss": -7.003614902496338, "global_step": 173625, "epoch": 4133} {"train_loss": -7.116148948669434, "global_step": 173626, "epoch": 4133} {"train_loss": -7.0134235336667015, "global_step": 173627, "epoch": 4133, "val_loss": 69164.7421875} {"train_loss": -7.072866439819336, "global_step": 173628, "epoch": 4134} {"train_loss": -6.932135581970215, "global_step": 173629, "epoch": 4134} {"train_loss": -7.021103858947754, "global_step": 173630, "epoch": 4134} {"train_loss": -7.009468078613281, "global_step": 173631, "epoch": 4134} {"train_loss": -7.212395668029785, "global_step": 173632, "epoch": 4134} {"train_loss": -6.9369049072265625, "global_step": 173633, "epoch": 4134} {"train_loss": -6.996552467346191, "global_step": 173634, "epoch": 4134} {"train_loss": -7.060329437255859, "global_step": 173635, "epoch": 4134} {"train_loss": -7.023678779602051, "global_step": 173636, "epoch": 4134} {"train_loss": -7.014997482299805, "global_step": 173637, "epoch": 4134} {"train_loss": -6.995814323425293, "global_step": 173638, "epoch": 4134} {"train_loss": -7.110397815704346, "global_step": 173639, "epoch": 4134} {"train_loss": -7.019711017608643, "global_step": 173640, "epoch": 4134} {"train_loss": -6.9720940589904785, "global_step": 173641, "epoch": 4134} {"train_loss": -6.927746772766113, "global_step": 173642, "epoch": 4134} {"train_loss": -7.019975662231445, "global_step": 173643, "epoch": 4134} {"train_loss": -6.949006080627441, "global_step": 173644, "epoch": 4134} {"train_loss": -6.999523639678955, "global_step": 173645, "epoch": 4134} {"train_loss": -6.9407477378845215, "global_step": 173646, "epoch": 4134} {"train_loss": -6.94638204574585, "global_step": 173647, "epoch": 4134} {"train_loss": -7.0655436515808105, "global_step": 173648, "epoch": 4134} {"train_loss": -6.959175109863281, "global_step": 173649, "epoch": 4134} {"train_loss": -7.128361701965332, "global_step": 173650, "epoch": 4134} {"train_loss": -7.080327033996582, "global_step": 173651, "epoch": 4134} {"train_loss": -7.059318542480469, "global_step": 173652, "epoch": 4134} {"train_loss": -7.113791465759277, "global_step": 173653, "epoch": 4134} {"train_loss": -7.08189582824707, "global_step": 173654, "epoch": 4134} {"train_loss": -7.121335506439209, "global_step": 173655, "epoch": 4134} {"train_loss": -7.128942966461182, "global_step": 173656, "epoch": 4134} {"train_loss": -7.146874904632568, "global_step": 173657, "epoch": 4134} {"train_loss": -7.176689624786377, "global_step": 173658, "epoch": 4134} {"train_loss": -7.061033248901367, "global_step": 173659, "epoch": 4134} {"train_loss": -7.106667518615723, "global_step": 173660, "epoch": 4134} {"train_loss": -7.022619247436523, "global_step": 173661, "epoch": 4134} {"train_loss": -6.977633953094482, "global_step": 173662, "epoch": 4134} {"train_loss": -7.041332244873047, "global_step": 173663, "epoch": 4134} {"train_loss": -6.982098579406738, "global_step": 173664, "epoch": 4134} {"train_loss": -7.073568344116211, "global_step": 173665, "epoch": 4134} {"train_loss": -6.952702522277832, "global_step": 173666, "epoch": 4134} {"train_loss": -7.068298816680908, "global_step": 173667, "epoch": 4134} {"train_loss": -7.222577095031738, "global_step": 173668, "epoch": 4134} {"train_loss": -7.041415089652652, "global_step": 173669, "epoch": 4134, "val_loss": 69076.1796875} {"train_loss": -7.0613508224487305, "global_step": 173670, "epoch": 4135} {"train_loss": -7.172490119934082, "global_step": 173671, "epoch": 4135} {"train_loss": -7.083627700805664, "global_step": 173672, "epoch": 4135} {"train_loss": -7.124948978424072, "global_step": 173673, "epoch": 4135} {"train_loss": -7.003996849060059, "global_step": 173674, "epoch": 4135} {"train_loss": -7.110755920410156, "global_step": 173675, "epoch": 4135} {"train_loss": -6.995598316192627, "global_step": 173676, "epoch": 4135} {"train_loss": -7.091163635253906, "global_step": 173677, "epoch": 4135} {"train_loss": -7.184757232666016, "global_step": 173678, "epoch": 4135} {"train_loss": -7.070918083190918, "global_step": 173679, "epoch": 4135} {"train_loss": -7.079599380493164, "global_step": 173680, "epoch": 4135} {"train_loss": -7.080545902252197, "global_step": 173681, "epoch": 4135} {"train_loss": -7.059698581695557, "global_step": 173682, "epoch": 4135} {"train_loss": -7.061802387237549, "global_step": 173683, "epoch": 4135} {"train_loss": -7.079128265380859, "global_step": 173684, "epoch": 4135} {"train_loss": -7.178496360778809, "global_step": 173685, "epoch": 4135} {"train_loss": -6.967512130737305, "global_step": 173686, "epoch": 4135} {"train_loss": -7.033161640167236, "global_step": 173687, "epoch": 4135} {"train_loss": -7.0306267738342285, "global_step": 173688, "epoch": 4135} {"train_loss": -7.1849446296691895, "global_step": 173689, "epoch": 4135} {"train_loss": -7.038570404052734, "global_step": 173690, "epoch": 4135} {"train_loss": -7.029080867767334, "global_step": 173691, "epoch": 4135} {"train_loss": -7.181112289428711, "global_step": 173692, "epoch": 4135} {"train_loss": -7.0825605392456055, "global_step": 173693, "epoch": 4135} {"train_loss": -7.188422679901123, "global_step": 173694, "epoch": 4135} {"train_loss": -7.045605182647705, "global_step": 173695, "epoch": 4135} {"train_loss": -7.0597734451293945, "global_step": 173696, "epoch": 4135} {"train_loss": -7.178751468658447, "global_step": 173697, "epoch": 4135} {"train_loss": -7.103386878967285, "global_step": 173698, "epoch": 4135} {"train_loss": -7.153707504272461, "global_step": 173699, "epoch": 4135} {"train_loss": -7.197206974029541, "global_step": 173700, "epoch": 4135} {"train_loss": -7.09036111831665, "global_step": 173701, "epoch": 4135} {"train_loss": -7.092459678649902, "global_step": 173702, "epoch": 4135} {"train_loss": -7.256059169769287, "global_step": 173703, "epoch": 4135} {"train_loss": -7.07337760925293, "global_step": 173704, "epoch": 4135} {"train_loss": -7.204741954803467, "global_step": 173705, "epoch": 4135} {"train_loss": -7.132718086242676, "global_step": 173706, "epoch": 4135} {"train_loss": -7.093243598937988, "global_step": 173707, "epoch": 4135} {"train_loss": -7.056705951690674, "global_step": 173708, "epoch": 4135} {"train_loss": -7.1147141456604, "global_step": 173709, "epoch": 4135} {"train_loss": -7.109135150909424, "global_step": 173710, "epoch": 4135} {"train_loss": -7.10124489239284, "global_step": 173711, "epoch": 4135, "val_loss": 69117.8828125} {"train_loss": -7.084745407104492, "global_step": 173712, "epoch": 4136} {"train_loss": -7.212026596069336, "global_step": 173713, "epoch": 4136} {"train_loss": -7.063558578491211, "global_step": 173714, "epoch": 4136} {"train_loss": -7.1545562744140625, "global_step": 173715, "epoch": 4136} {"train_loss": -6.929974555969238, "global_step": 173716, "epoch": 4136} {"train_loss": -7.026703357696533, "global_step": 173717, "epoch": 4136} {"train_loss": -7.030940532684326, "global_step": 173718, "epoch": 4136} {"train_loss": -7.107008934020996, "global_step": 173719, "epoch": 4136} {"train_loss": -6.945742607116699, "global_step": 173720, "epoch": 4136} {"train_loss": -7.098292827606201, "global_step": 173721, "epoch": 4136} {"train_loss": -7.071679592132568, "global_step": 173722, "epoch": 4136} {"train_loss": -6.970705032348633, "global_step": 173723, "epoch": 4136} {"train_loss": -7.015071868896484, "global_step": 173724, "epoch": 4136} {"train_loss": -7.075896263122559, "global_step": 173725, "epoch": 4136} {"train_loss": -6.925736427307129, "global_step": 173726, "epoch": 4136} {"train_loss": -7.095839500427246, "global_step": 173727, "epoch": 4136} {"train_loss": -7.085314750671387, "global_step": 173728, "epoch": 4136} {"train_loss": -6.965762615203857, "global_step": 173729, "epoch": 4136} {"train_loss": -7.082010269165039, "global_step": 173730, "epoch": 4136} {"train_loss": -7.036181926727295, "global_step": 173731, "epoch": 4136} {"train_loss": -6.941337585449219, "global_step": 173732, "epoch": 4136} {"train_loss": -6.888317584991455, "global_step": 173733, "epoch": 4136} {"train_loss": -7.00814151763916, "global_step": 173734, "epoch": 4136} {"train_loss": -6.807819366455078, "global_step": 173735, "epoch": 4136} {"train_loss": -6.809459686279297, "global_step": 173736, "epoch": 4136} {"train_loss": -6.961019515991211, "global_step": 173737, "epoch": 4136} {"train_loss": -6.7420244216918945, "global_step": 173738, "epoch": 4136} {"train_loss": -7.039270401000977, "global_step": 173739, "epoch": 4136} {"train_loss": -6.788954734802246, "global_step": 173740, "epoch": 4136} {"train_loss": -6.936798095703125, "global_step": 173741, "epoch": 4136} {"train_loss": -6.906561851501465, "global_step": 173742, "epoch": 4136} {"train_loss": -6.850470542907715, "global_step": 173743, "epoch": 4136} {"train_loss": -6.859145164489746, "global_step": 173744, "epoch": 4136} {"train_loss": -6.949895858764648, "global_step": 173745, "epoch": 4136} {"train_loss": -6.901371955871582, "global_step": 173746, "epoch": 4136} {"train_loss": -6.932743549346924, "global_step": 173747, "epoch": 4136} {"train_loss": -6.811928749084473, "global_step": 173748, "epoch": 4136} {"train_loss": -7.0774102210998535, "global_step": 173749, "epoch": 4136} {"train_loss": -6.917238712310791, "global_step": 173750, "epoch": 4136} {"train_loss": -6.91515588760376, "global_step": 173751, "epoch": 4136} {"train_loss": -6.9485979080200195, "global_step": 173752, "epoch": 4136} {"train_loss": -6.97627870241801, "global_step": 173753, "epoch": 4136, "val_loss": 68953.265625} {"train_loss": -6.958726406097412, "global_step": 173754, "epoch": 4137} {"train_loss": -6.985641002655029, "global_step": 173755, "epoch": 4137} {"train_loss": -7.038359642028809, "global_step": 173756, "epoch": 4137} {"train_loss": -6.982845306396484, "global_step": 173757, "epoch": 4137} {"train_loss": -7.050265312194824, "global_step": 173758, "epoch": 4137} {"train_loss": -7.037493705749512, "global_step": 173759, "epoch": 4137} {"train_loss": -7.010509490966797, "global_step": 173760, "epoch": 4137} {"train_loss": -7.105695724487305, "global_step": 173761, "epoch": 4137} {"train_loss": -7.007390975952148, "global_step": 173762, "epoch": 4137} {"train_loss": -7.0426740646362305, "global_step": 173763, "epoch": 4137} {"train_loss": -7.027557373046875, "global_step": 173764, "epoch": 4137} {"train_loss": -6.925018310546875, "global_step": 173765, "epoch": 4137} {"train_loss": -6.925205707550049, "global_step": 173766, "epoch": 4137} {"train_loss": -7.171527862548828, "global_step": 173767, "epoch": 4137} {"train_loss": -7.075922012329102, "global_step": 173768, "epoch": 4137} {"train_loss": -7.117386817932129, "global_step": 173769, "epoch": 4137} {"train_loss": -6.953963279724121, "global_step": 173770, "epoch": 4137} {"train_loss": -7.0476908683776855, "global_step": 173771, "epoch": 4137} {"train_loss": -7.089190483093262, "global_step": 173772, "epoch": 4137} {"train_loss": -6.963923454284668, "global_step": 173773, "epoch": 4137} {"train_loss": -6.900591850280762, "global_step": 173774, "epoch": 4137} {"train_loss": -7.081506729125977, "global_step": 173775, "epoch": 4137} {"train_loss": -6.897924423217773, "global_step": 173776, "epoch": 4137} {"train_loss": -7.080348968505859, "global_step": 173777, "epoch": 4137} {"train_loss": -6.87814998626709, "global_step": 173778, "epoch": 4137} {"train_loss": -7.049901008605957, "global_step": 173779, "epoch": 4137} {"train_loss": -7.064565181732178, "global_step": 173780, "epoch": 4137} {"train_loss": -6.980982780456543, "global_step": 173781, "epoch": 4137} {"train_loss": -7.002312660217285, "global_step": 173782, "epoch": 4137} {"train_loss": -6.970044136047363, "global_step": 173783, "epoch": 4137} {"train_loss": -7.048943996429443, "global_step": 173784, "epoch": 4137} {"train_loss": -6.919462203979492, "global_step": 173785, "epoch": 4137} {"train_loss": -6.999043941497803, "global_step": 173786, "epoch": 4137} {"train_loss": -7.004261493682861, "global_step": 173787, "epoch": 4137} {"train_loss": -7.078908920288086, "global_step": 173788, "epoch": 4137} {"train_loss": -7.0646071434021, "global_step": 173789, "epoch": 4137} {"train_loss": -6.984230041503906, "global_step": 173790, "epoch": 4137} {"train_loss": -7.184727668762207, "global_step": 173791, "epoch": 4137} {"train_loss": -7.131836891174316, "global_step": 173792, "epoch": 4137} {"train_loss": -6.9822540283203125, "global_step": 173793, "epoch": 4137} {"train_loss": -7.015937805175781, "global_step": 173794, "epoch": 4137} {"train_loss": -7.020694471540905, "global_step": 173795, "epoch": 4137, "val_loss": 68778.2578125} {"train_loss": -6.987462997436523, "global_step": 173796, "epoch": 4138} {"train_loss": -7.0831122398376465, "global_step": 173797, "epoch": 4138} {"train_loss": -7.108772277832031, "global_step": 173798, "epoch": 4138} {"train_loss": -7.126113414764404, "global_step": 173799, "epoch": 4138} {"train_loss": -7.000560283660889, "global_step": 173800, "epoch": 4138} {"train_loss": -7.0373101234436035, "global_step": 173801, "epoch": 4138} {"train_loss": -7.036468029022217, "global_step": 173802, "epoch": 4138} {"train_loss": -7.024601936340332, "global_step": 173803, "epoch": 4138} {"train_loss": -7.1833906173706055, "global_step": 173804, "epoch": 4138} {"train_loss": -6.996935844421387, "global_step": 173805, "epoch": 4138} {"train_loss": -7.033702850341797, "global_step": 173806, "epoch": 4138} {"train_loss": -7.135102272033691, "global_step": 173807, "epoch": 4138} {"train_loss": -7.101631164550781, "global_step": 173808, "epoch": 4138} {"train_loss": -7.085717678070068, "global_step": 173809, "epoch": 4138} {"train_loss": -7.29917049407959, "global_step": 173810, "epoch": 4138} {"train_loss": -6.951860427856445, "global_step": 173811, "epoch": 4138} {"train_loss": -6.982411861419678, "global_step": 173812, "epoch": 4138} {"train_loss": -7.062941551208496, "global_step": 173813, "epoch": 4138} {"train_loss": -7.176449775695801, "global_step": 173814, "epoch": 4138} {"train_loss": -7.075236797332764, "global_step": 173815, "epoch": 4138} {"train_loss": -7.072903633117676, "global_step": 173816, "epoch": 4138} {"train_loss": -7.109773635864258, "global_step": 173817, "epoch": 4138} {"train_loss": -7.076727867126465, "global_step": 173818, "epoch": 4138} {"train_loss": -7.087801933288574, "global_step": 173819, "epoch": 4138} {"train_loss": -7.162483215332031, "global_step": 173820, "epoch": 4138} {"train_loss": -7.047168731689453, "global_step": 173821, "epoch": 4138} {"train_loss": -6.774023056030273, "global_step": 173822, "epoch": 4138} {"train_loss": -6.97846794128418, "global_step": 173823, "epoch": 4138} {"train_loss": -7.042942047119141, "global_step": 173824, "epoch": 4138} {"train_loss": -6.942068099975586, "global_step": 173825, "epoch": 4138} {"train_loss": -6.947554588317871, "global_step": 173826, "epoch": 4138} {"train_loss": -7.1154398918151855, "global_step": 173827, "epoch": 4138} {"train_loss": -6.961122035980225, "global_step": 173828, "epoch": 4138} {"train_loss": -6.943162441253662, "global_step": 173829, "epoch": 4138} {"train_loss": -6.981671333312988, "global_step": 173830, "epoch": 4138} {"train_loss": -6.969578266143799, "global_step": 173831, "epoch": 4138} {"train_loss": -7.013004302978516, "global_step": 173832, "epoch": 4138} {"train_loss": -6.913930416107178, "global_step": 173833, "epoch": 4138} {"train_loss": -7.023948669433594, "global_step": 173834, "epoch": 4138} {"train_loss": -6.823179244995117, "global_step": 173835, "epoch": 4138} {"train_loss": -6.908424377441406, "global_step": 173836, "epoch": 4138} {"train_loss": -7.0328521728515625, "global_step": 173837, "epoch": 4138, "val_loss": 69237.9453125} {"train_loss": -7.002445220947266, "global_step": 173838, "epoch": 4139} {"train_loss": -6.8704071044921875, "global_step": 173839, "epoch": 4139} {"train_loss": -7.0639872550964355, "global_step": 173840, "epoch": 4139} {"train_loss": -6.936602592468262, "global_step": 173841, "epoch": 4139} {"train_loss": -6.899761199951172, "global_step": 173842, "epoch": 4139} {"train_loss": -7.093197822570801, "global_step": 173843, "epoch": 4139} {"train_loss": -6.858787536621094, "global_step": 173844, "epoch": 4139} {"train_loss": -6.9454731941223145, "global_step": 173845, "epoch": 4139} {"train_loss": -6.968687057495117, "global_step": 173846, "epoch": 4139} {"train_loss": -6.937162399291992, "global_step": 173847, "epoch": 4139} {"train_loss": -6.9557342529296875, "global_step": 173848, "epoch": 4139} {"train_loss": -7.095040321350098, "global_step": 173849, "epoch": 4139} {"train_loss": -6.885101318359375, "global_step": 173850, "epoch": 4139} {"train_loss": -7.011198043823242, "global_step": 173851, "epoch": 4139} {"train_loss": -6.894426345825195, "global_step": 173852, "epoch": 4139} {"train_loss": -6.963679313659668, "global_step": 173853, "epoch": 4139} {"train_loss": -6.887098789215088, "global_step": 173854, "epoch": 4139} {"train_loss": -6.9270195960998535, "global_step": 173855, "epoch": 4139} {"train_loss": -7.051555633544922, "global_step": 173856, "epoch": 4139} {"train_loss": -6.902366638183594, "global_step": 173857, "epoch": 4139} {"train_loss": -7.050438404083252, "global_step": 173858, "epoch": 4139} {"train_loss": -6.938135147094727, "global_step": 173859, "epoch": 4139} {"train_loss": -6.9075775146484375, "global_step": 173860, "epoch": 4139} {"train_loss": -6.890206336975098, "global_step": 173861, "epoch": 4139} {"train_loss": -6.770608901977539, "global_step": 173862, "epoch": 4139} {"train_loss": -6.931020736694336, "global_step": 173863, "epoch": 4139} {"train_loss": -6.8420209884643555, "global_step": 173864, "epoch": 4139} {"train_loss": -6.787172317504883, "global_step": 173865, "epoch": 4139} {"train_loss": -6.9962005615234375, "global_step": 173866, "epoch": 4139} {"train_loss": -6.838122844696045, "global_step": 173867, "epoch": 4139} {"train_loss": -6.7943220138549805, "global_step": 173868, "epoch": 4139} {"train_loss": -6.837268829345703, "global_step": 173869, "epoch": 4139} {"train_loss": -6.8191328048706055, "global_step": 173870, "epoch": 4139} {"train_loss": -6.855122089385986, "global_step": 173871, "epoch": 4139} {"train_loss": -6.871884346008301, "global_step": 173872, "epoch": 4139} {"train_loss": -6.876037120819092, "global_step": 173873, "epoch": 4139} {"train_loss": -6.989969730377197, "global_step": 173874, "epoch": 4139} {"train_loss": -6.975709915161133, "global_step": 173875, "epoch": 4139} {"train_loss": -6.854848384857178, "global_step": 173876, "epoch": 4139} {"train_loss": -6.978508949279785, "global_step": 173877, "epoch": 4139} {"train_loss": -6.943674087524414, "global_step": 173878, "epoch": 4139} {"train_loss": -6.92365821202596, "global_step": 173879, "epoch": 4139, "val_loss": 68934.6484375} {"train_loss": -6.979263782501221, "global_step": 173880, "epoch": 4140} {"train_loss": -7.062355995178223, "global_step": 173881, "epoch": 4140} {"train_loss": -7.033823490142822, "global_step": 173882, "epoch": 4140} {"train_loss": -7.100805282592773, "global_step": 173883, "epoch": 4140} {"train_loss": -6.942008972167969, "global_step": 173884, "epoch": 4140} {"train_loss": -6.939723014831543, "global_step": 173885, "epoch": 4140} {"train_loss": -7.124875068664551, "global_step": 173886, "epoch": 4140} {"train_loss": -6.938299655914307, "global_step": 173887, "epoch": 4140} {"train_loss": -7.066164016723633, "global_step": 173888, "epoch": 4140} {"train_loss": -7.129956245422363, "global_step": 173889, "epoch": 4140} {"train_loss": -7.060041427612305, "global_step": 173890, "epoch": 4140} {"train_loss": -7.121281147003174, "global_step": 173891, "epoch": 4140} {"train_loss": -7.077275276184082, "global_step": 173892, "epoch": 4140} {"train_loss": -7.167223930358887, "global_step": 173893, "epoch": 4140} {"train_loss": -7.1637725830078125, "global_step": 173894, "epoch": 4140} {"train_loss": -7.106286525726318, "global_step": 173895, "epoch": 4140} {"train_loss": -7.152886390686035, "global_step": 173896, "epoch": 4140} {"train_loss": -7.023230075836182, "global_step": 173897, "epoch": 4140} {"train_loss": -7.119974613189697, "global_step": 173898, "epoch": 4140} {"train_loss": -7.119146347045898, "global_step": 173899, "epoch": 4140} {"train_loss": -7.079831123352051, "global_step": 173900, "epoch": 4140} {"train_loss": -7.142788410186768, "global_step": 173901, "epoch": 4140} {"train_loss": -7.036367416381836, "global_step": 173902, "epoch": 4140} {"train_loss": -7.129079818725586, "global_step": 173903, "epoch": 4140} {"train_loss": -7.119187355041504, "global_step": 173904, "epoch": 4140} {"train_loss": -7.037931442260742, "global_step": 173905, "epoch": 4140} {"train_loss": -7.0605645179748535, "global_step": 173906, "epoch": 4140} {"train_loss": -7.104104995727539, "global_step": 173907, "epoch": 4140} {"train_loss": -7.033113479614258, "global_step": 173908, "epoch": 4140} {"train_loss": -6.986268043518066, "global_step": 173909, "epoch": 4140} {"train_loss": -7.068144798278809, "global_step": 173910, "epoch": 4140} {"train_loss": -7.054836273193359, "global_step": 173911, "epoch": 4140} {"train_loss": -7.029843330383301, "global_step": 173912, "epoch": 4140} {"train_loss": -7.067666053771973, "global_step": 173913, "epoch": 4140} {"train_loss": -7.089794635772705, "global_step": 173914, "epoch": 4140} {"train_loss": -6.918718338012695, "global_step": 173915, "epoch": 4140} {"train_loss": -7.140662670135498, "global_step": 173916, "epoch": 4140} {"train_loss": -7.094979286193848, "global_step": 173917, "epoch": 4140} {"train_loss": -7.021234035491943, "global_step": 173918, "epoch": 4140} {"train_loss": -7.152842044830322, "global_step": 173919, "epoch": 4140} {"train_loss": -6.933635711669922, "global_step": 173920, "epoch": 4140} {"train_loss": -7.065537600290208, "global_step": 173921, "epoch": 4140, "val_loss": 69104.65625} {"train_loss": -7.022109508514404, "global_step": 173922, "epoch": 4141} {"train_loss": -7.19818115234375, "global_step": 173923, "epoch": 4141} {"train_loss": -7.052344799041748, "global_step": 173924, "epoch": 4141} {"train_loss": -6.999507904052734, "global_step": 173925, "epoch": 4141} {"train_loss": -7.070640563964844, "global_step": 173926, "epoch": 4141} {"train_loss": -7.045004844665527, "global_step": 173927, "epoch": 4141} {"train_loss": -7.1420488357543945, "global_step": 173928, "epoch": 4141} {"train_loss": -7.051109313964844, "global_step": 173929, "epoch": 4141} {"train_loss": -7.022941589355469, "global_step": 173930, "epoch": 4141} {"train_loss": -7.043287754058838, "global_step": 173931, "epoch": 4141} {"train_loss": -7.048304557800293, "global_step": 173932, "epoch": 4141} {"train_loss": -7.03195858001709, "global_step": 173933, "epoch": 4141} {"train_loss": -7.1555304527282715, "global_step": 173934, "epoch": 4141} {"train_loss": -7.027843952178955, "global_step": 173935, "epoch": 4141} {"train_loss": -6.947238922119141, "global_step": 173936, "epoch": 4141} {"train_loss": -6.959850311279297, "global_step": 173937, "epoch": 4141} {"train_loss": -7.148303031921387, "global_step": 173938, "epoch": 4141} {"train_loss": -6.972063064575195, "global_step": 173939, "epoch": 4141} {"train_loss": -7.135807991027832, "global_step": 173940, "epoch": 4141} {"train_loss": -6.939009666442871, "global_step": 173941, "epoch": 4141} {"train_loss": -7.000649452209473, "global_step": 173942, "epoch": 4141} {"train_loss": -7.111503601074219, "global_step": 173943, "epoch": 4141} {"train_loss": -6.966304779052734, "global_step": 173944, "epoch": 4141} {"train_loss": -6.9559173583984375, "global_step": 173945, "epoch": 4141} {"train_loss": -6.9818572998046875, "global_step": 173946, "epoch": 4141} {"train_loss": -6.6858811378479, "global_step": 173947, "epoch": 4141} {"train_loss": -6.968935489654541, "global_step": 173948, "epoch": 4141} {"train_loss": -6.944806098937988, "global_step": 173949, "epoch": 4141} {"train_loss": -6.843052864074707, "global_step": 173950, "epoch": 4141} {"train_loss": -7.064969539642334, "global_step": 173951, "epoch": 4141} {"train_loss": -6.866197109222412, "global_step": 173952, "epoch": 4141} {"train_loss": -6.986420631408691, "global_step": 173953, "epoch": 4141} {"train_loss": -6.943268775939941, "global_step": 173954, "epoch": 4141} {"train_loss": -6.909111976623535, "global_step": 173955, "epoch": 4141} {"train_loss": -6.929778575897217, "global_step": 173956, "epoch": 4141} {"train_loss": -6.933233261108398, "global_step": 173957, "epoch": 4141} {"train_loss": -6.939217567443848, "global_step": 173958, "epoch": 4141} {"train_loss": -6.946636199951172, "global_step": 173959, "epoch": 4141} {"train_loss": -6.920167922973633, "global_step": 173960, "epoch": 4141} {"train_loss": -6.992366790771484, "global_step": 173961, "epoch": 4141} {"train_loss": -6.888060569763184, "global_step": 173962, "epoch": 4141} {"train_loss": -6.9962434995742075, "global_step": 173963, "epoch": 4141, "val_loss": 69118.0625} {"train_loss": -6.850708484649658, "global_step": 173964, "epoch": 4142} {"train_loss": -6.933316230773926, "global_step": 173965, "epoch": 4142} {"train_loss": -7.106078147888184, "global_step": 173966, "epoch": 4142} {"train_loss": -6.978682994842529, "global_step": 173967, "epoch": 4142} {"train_loss": -7.087118625640869, "global_step": 173968, "epoch": 4142} {"train_loss": -6.94584846496582, "global_step": 173969, "epoch": 4142} {"train_loss": -7.022995948791504, "global_step": 173970, "epoch": 4142} {"train_loss": -7.029193878173828, "global_step": 173971, "epoch": 4142} {"train_loss": -7.049154281616211, "global_step": 173972, "epoch": 4142} {"train_loss": -7.126161575317383, "global_step": 173973, "epoch": 4142} {"train_loss": -7.042458534240723, "global_step": 173974, "epoch": 4142} {"train_loss": -7.031716346740723, "global_step": 173975, "epoch": 4142} {"train_loss": -7.2052741050720215, "global_step": 173976, "epoch": 4142} {"train_loss": -6.986800670623779, "global_step": 173977, "epoch": 4142} {"train_loss": -7.112116813659668, "global_step": 173978, "epoch": 4142} {"train_loss": -7.182401657104492, "global_step": 173979, "epoch": 4142} {"train_loss": -7.096393585205078, "global_step": 173980, "epoch": 4142} {"train_loss": -7.072812080383301, "global_step": 173981, "epoch": 4142} {"train_loss": -7.142223358154297, "global_step": 173982, "epoch": 4142} {"train_loss": -7.096771240234375, "global_step": 173983, "epoch": 4142} {"train_loss": -7.127004146575928, "global_step": 173984, "epoch": 4142} {"train_loss": -7.216079235076904, "global_step": 173985, "epoch": 4142} {"train_loss": -7.116364479064941, "global_step": 173986, "epoch": 4142} {"train_loss": -7.010235786437988, "global_step": 173987, "epoch": 4142} {"train_loss": -7.086897850036621, "global_step": 173988, "epoch": 4142} {"train_loss": -7.1163716316223145, "global_step": 173989, "epoch": 4142} {"train_loss": -7.134129524230957, "global_step": 173990, "epoch": 4142} {"train_loss": -7.210378170013428, "global_step": 173991, "epoch": 4142} {"train_loss": -7.031144618988037, "global_step": 173992, "epoch": 4142} {"train_loss": -7.072985649108887, "global_step": 173993, "epoch": 4142} {"train_loss": -7.247324466705322, "global_step": 173994, "epoch": 4142} {"train_loss": -7.15610408782959, "global_step": 173995, "epoch": 4142} {"train_loss": -7.158161640167236, "global_step": 173996, "epoch": 4142} {"train_loss": -7.1872029304504395, "global_step": 173997, "epoch": 4142} {"train_loss": -7.054014205932617, "global_step": 173998, "epoch": 4142} {"train_loss": -7.105677604675293, "global_step": 173999, "epoch": 4142} {"train_loss": -7.152056694030762, "global_step": 174000, "epoch": 4142} {"train_loss": -7.158063888549805, "global_step": 174001, "epoch": 4142} {"train_loss": -7.136927604675293, "global_step": 174002, "epoch": 4142} {"train_loss": -7.190551280975342, "global_step": 174003, "epoch": 4142} {"train_loss": -7.086299896240234, "global_step": 174004, "epoch": 4142} {"train_loss": -7.095323233377366, "global_step": 174005, "epoch": 4142, "val_loss": 68984.6484375} {"train_loss": -7.154695510864258, "global_step": 174006, "epoch": 4143} {"train_loss": -7.091978073120117, "global_step": 174007, "epoch": 4143} {"train_loss": -7.214623928070068, "global_step": 174008, "epoch": 4143} {"train_loss": -7.194765090942383, "global_step": 174009, "epoch": 4143} {"train_loss": -7.177313327789307, "global_step": 174010, "epoch": 4143} {"train_loss": -7.157607555389404, "global_step": 174011, "epoch": 4143} {"train_loss": -7.1395697593688965, "global_step": 174012, "epoch": 4143} {"train_loss": -7.177964210510254, "global_step": 174013, "epoch": 4143} {"train_loss": -7.159296035766602, "global_step": 174014, "epoch": 4143} {"train_loss": -7.065681457519531, "global_step": 174015, "epoch": 4143} {"train_loss": -7.147711277008057, "global_step": 174016, "epoch": 4143} {"train_loss": -7.187130451202393, "global_step": 174017, "epoch": 4143} {"train_loss": -7.0991339683532715, "global_step": 174018, "epoch": 4143} {"train_loss": -7.172167778015137, "global_step": 174019, "epoch": 4143} {"train_loss": -7.178112030029297, "global_step": 174020, "epoch": 4143} {"train_loss": -7.17764949798584, "global_step": 174021, "epoch": 4143} {"train_loss": -7.1428046226501465, "global_step": 174022, "epoch": 4143} {"train_loss": -7.170318603515625, "global_step": 174023, "epoch": 4143} {"train_loss": -7.003225803375244, "global_step": 174024, "epoch": 4143} {"train_loss": -7.0735979080200195, "global_step": 174025, "epoch": 4143} {"train_loss": -7.008890151977539, "global_step": 174026, "epoch": 4143} {"train_loss": -7.027247428894043, "global_step": 174027, "epoch": 4143} {"train_loss": -6.951857566833496, "global_step": 174028, "epoch": 4143} {"train_loss": -6.976739883422852, "global_step": 174029, "epoch": 4143} {"train_loss": -7.127100944519043, "global_step": 174030, "epoch": 4143} {"train_loss": -6.990478992462158, "global_step": 174031, "epoch": 4143} {"train_loss": -7.011040210723877, "global_step": 174032, "epoch": 4143} {"train_loss": -7.001396179199219, "global_step": 174033, "epoch": 4143} {"train_loss": -6.923696517944336, "global_step": 174034, "epoch": 4143} {"train_loss": -7.141023635864258, "global_step": 174035, "epoch": 4143} {"train_loss": -7.053160667419434, "global_step": 174036, "epoch": 4143} {"train_loss": -7.013487339019775, "global_step": 174037, "epoch": 4143} {"train_loss": -7.14755916595459, "global_step": 174038, "epoch": 4143} {"train_loss": -7.070295333862305, "global_step": 174039, "epoch": 4143} {"train_loss": -7.085616111755371, "global_step": 174040, "epoch": 4143} {"train_loss": -7.120485305786133, "global_step": 174041, "epoch": 4143} {"train_loss": -6.922451972961426, "global_step": 174042, "epoch": 4143} {"train_loss": -7.039252281188965, "global_step": 174043, "epoch": 4143} {"train_loss": -7.057953834533691, "global_step": 174044, "epoch": 4143} {"train_loss": -6.94697380065918, "global_step": 174045, "epoch": 4143} {"train_loss": -7.116546630859375, "global_step": 174046, "epoch": 4143} {"train_loss": -7.085184494654338, "global_step": 174047, "epoch": 4143, "val_loss": 69179.1640625} {"train_loss": -7.035674095153809, "global_step": 174048, "epoch": 4144} {"train_loss": -6.99835729598999, "global_step": 174049, "epoch": 4144} {"train_loss": -6.967054843902588, "global_step": 174050, "epoch": 4144} {"train_loss": -7.047432899475098, "global_step": 174051, "epoch": 4144} {"train_loss": -7.087416648864746, "global_step": 174052, "epoch": 4144} {"train_loss": -6.877507209777832, "global_step": 174053, "epoch": 4144} {"train_loss": -7.059826850891113, "global_step": 174054, "epoch": 4144} {"train_loss": -6.981069087982178, "global_step": 174055, "epoch": 4144} {"train_loss": -6.90367317199707, "global_step": 174056, "epoch": 4144} {"train_loss": -6.949162006378174, "global_step": 174057, "epoch": 4144} {"train_loss": -7.080555438995361, "global_step": 174058, "epoch": 4144} {"train_loss": -6.992951393127441, "global_step": 174059, "epoch": 4144} {"train_loss": -6.998296737670898, "global_step": 174060, "epoch": 4144} {"train_loss": -7.0593461990356445, "global_step": 174061, "epoch": 4144} {"train_loss": -7.0329718589782715, "global_step": 174062, "epoch": 4144} {"train_loss": -7.04364013671875, "global_step": 174063, "epoch": 4144} {"train_loss": -7.034124374389648, "global_step": 174064, "epoch": 4144} {"train_loss": -7.033784866333008, "global_step": 174065, "epoch": 4144} {"train_loss": -7.121301174163818, "global_step": 174066, "epoch": 4144} {"train_loss": -7.053623199462891, "global_step": 174067, "epoch": 4144} {"train_loss": -7.10599422454834, "global_step": 174068, "epoch": 4144} {"train_loss": -7.109396934509277, "global_step": 174069, "epoch": 4144} {"train_loss": -7.2042646408081055, "global_step": 174070, "epoch": 4144} {"train_loss": -7.118851661682129, "global_step": 174071, "epoch": 4144} {"train_loss": -7.1441192626953125, "global_step": 174072, "epoch": 4144} {"train_loss": -7.062770843505859, "global_step": 174073, "epoch": 4144} {"train_loss": -7.036537170410156, "global_step": 174074, "epoch": 4144} {"train_loss": -7.234026908874512, "global_step": 174075, "epoch": 4144} {"train_loss": -7.139447212219238, "global_step": 174076, "epoch": 4144} {"train_loss": -7.120089530944824, "global_step": 174077, "epoch": 4144} {"train_loss": -7.015311241149902, "global_step": 174078, "epoch": 4144} {"train_loss": -7.116824626922607, "global_step": 174079, "epoch": 4144} {"train_loss": -7.03185510635376, "global_step": 174080, "epoch": 4144} {"train_loss": -7.099558353424072, "global_step": 174081, "epoch": 4144} {"train_loss": -7.112801551818848, "global_step": 174082, "epoch": 4144} {"train_loss": -7.120883941650391, "global_step": 174083, "epoch": 4144} {"train_loss": -7.034204483032227, "global_step": 174084, "epoch": 4144} {"train_loss": -7.012869834899902, "global_step": 174085, "epoch": 4144} {"train_loss": -7.024649143218994, "global_step": 174086, "epoch": 4144} {"train_loss": -7.118939399719238, "global_step": 174087, "epoch": 4144} {"train_loss": -7.128547191619873, "global_step": 174088, "epoch": 4144} {"train_loss": -7.057431062062581, "global_step": 174089, "epoch": 4144, "val_loss": 69187.859375} {"train_loss": -7.195491790771484, "global_step": 174090, "epoch": 4145} {"train_loss": -7.121448516845703, "global_step": 174091, "epoch": 4145} {"train_loss": -7.1944804191589355, "global_step": 174092, "epoch": 4145} {"train_loss": -7.3195719718933105, "global_step": 174093, "epoch": 4145} {"train_loss": -7.153364181518555, "global_step": 174094, "epoch": 4145} {"train_loss": -7.13109827041626, "global_step": 174095, "epoch": 4145} {"train_loss": -6.979898929595947, "global_step": 174096, "epoch": 4145} {"train_loss": -7.242346286773682, "global_step": 174097, "epoch": 4145} {"train_loss": -7.102388381958008, "global_step": 174098, "epoch": 4145} {"train_loss": -7.070875644683838, "global_step": 174099, "epoch": 4145} {"train_loss": -7.0781755447387695, "global_step": 174100, "epoch": 4145} {"train_loss": -7.1349897384643555, "global_step": 174101, "epoch": 4145} {"train_loss": -7.157312393188477, "global_step": 174102, "epoch": 4145} {"train_loss": -7.16448450088501, "global_step": 174103, "epoch": 4145} {"train_loss": -7.057670593261719, "global_step": 174104, "epoch": 4145} {"train_loss": -7.056657791137695, "global_step": 174105, "epoch": 4145} {"train_loss": -7.155388832092285, "global_step": 174106, "epoch": 4145} {"train_loss": -7.198505401611328, "global_step": 174107, "epoch": 4145} {"train_loss": -7.069735527038574, "global_step": 174108, "epoch": 4145} {"train_loss": -7.120264053344727, "global_step": 174109, "epoch": 4145} {"train_loss": -7.240599632263184, "global_step": 174110, "epoch": 4145} {"train_loss": -7.111799240112305, "global_step": 174111, "epoch": 4145} {"train_loss": -7.068842887878418, "global_step": 174112, "epoch": 4145} {"train_loss": -7.057727336883545, "global_step": 174113, "epoch": 4145} {"train_loss": -6.992623329162598, "global_step": 174114, "epoch": 4145} {"train_loss": -7.005958557128906, "global_step": 174115, "epoch": 4145} {"train_loss": -6.998780250549316, "global_step": 174116, "epoch": 4145} {"train_loss": -7.078153610229492, "global_step": 174117, "epoch": 4145} {"train_loss": -6.958075046539307, "global_step": 174118, "epoch": 4145} {"train_loss": -7.099409103393555, "global_step": 174119, "epoch": 4145} {"train_loss": -7.073081016540527, "global_step": 174120, "epoch": 4145} {"train_loss": -7.204680442810059, "global_step": 174121, "epoch": 4145} {"train_loss": -7.030284881591797, "global_step": 174122, "epoch": 4145} {"train_loss": -7.123204231262207, "global_step": 174123, "epoch": 4145} {"train_loss": -7.129917144775391, "global_step": 174124, "epoch": 4145} {"train_loss": -7.17441987991333, "global_step": 174125, "epoch": 4145} {"train_loss": -7.081372261047363, "global_step": 174126, "epoch": 4145} {"train_loss": -7.038900375366211, "global_step": 174127, "epoch": 4145} {"train_loss": -7.06116247177124, "global_step": 174128, "epoch": 4145} {"train_loss": -7.0660295486450195, "global_step": 174129, "epoch": 4145} {"train_loss": -7.063407897949219, "global_step": 174130, "epoch": 4145} {"train_loss": -7.103323754810152, "global_step": 174131, "epoch": 4145, "val_loss": 69108.3515625} {"train_loss": -7.1347761154174805, "global_step": 174132, "epoch": 4146} {"train_loss": -6.997925281524658, "global_step": 174133, "epoch": 4146} {"train_loss": -7.03997802734375, "global_step": 174134, "epoch": 4146} {"train_loss": -6.950272560119629, "global_step": 174135, "epoch": 4146} {"train_loss": -7.052773952484131, "global_step": 174136, "epoch": 4146} {"train_loss": -7.040236949920654, "global_step": 174137, "epoch": 4146} {"train_loss": -7.039046287536621, "global_step": 174138, "epoch": 4146} {"train_loss": -6.865746974945068, "global_step": 174139, "epoch": 4146} {"train_loss": -7.117824077606201, "global_step": 174140, "epoch": 4146} {"train_loss": -6.97613000869751, "global_step": 174141, "epoch": 4146} {"train_loss": -7.006497383117676, "global_step": 174142, "epoch": 4146} {"train_loss": -7.058079242706299, "global_step": 174143, "epoch": 4146} {"train_loss": -7.066531181335449, "global_step": 174144, "epoch": 4146} {"train_loss": -7.122209548950195, "global_step": 174145, "epoch": 4146} {"train_loss": -7.051933288574219, "global_step": 174146, "epoch": 4146} {"train_loss": -7.106734275817871, "global_step": 174147, "epoch": 4146} {"train_loss": -7.082879066467285, "global_step": 174148, "epoch": 4146} {"train_loss": -7.042611122131348, "global_step": 174149, "epoch": 4146} {"train_loss": -7.014964580535889, "global_step": 174150, "epoch": 4146} {"train_loss": -7.06171989440918, "global_step": 174151, "epoch": 4146} {"train_loss": -7.055805206298828, "global_step": 174152, "epoch": 4146} {"train_loss": -6.898581504821777, "global_step": 174153, "epoch": 4146} {"train_loss": -7.101004600524902, "global_step": 174154, "epoch": 4146} {"train_loss": -7.1254425048828125, "global_step": 174155, "epoch": 4146} {"train_loss": -7.158018589019775, "global_step": 174156, "epoch": 4146} {"train_loss": -7.134572982788086, "global_step": 174157, "epoch": 4146} {"train_loss": -7.0338287353515625, "global_step": 174158, "epoch": 4146} {"train_loss": -7.08934211730957, "global_step": 174159, "epoch": 4146} {"train_loss": -7.062355041503906, "global_step": 174160, "epoch": 4146} {"train_loss": -7.086648941040039, "global_step": 174161, "epoch": 4146} {"train_loss": -7.060998916625977, "global_step": 174162, "epoch": 4146} {"train_loss": -7.006006240844727, "global_step": 174163, "epoch": 4146} {"train_loss": -7.068055152893066, "global_step": 174164, "epoch": 4146} {"train_loss": -7.1110992431640625, "global_step": 174165, "epoch": 4146} {"train_loss": -7.202487945556641, "global_step": 174166, "epoch": 4146} {"train_loss": -7.025777339935303, "global_step": 174167, "epoch": 4146} {"train_loss": -7.057201385498047, "global_step": 174168, "epoch": 4146} {"train_loss": -7.08186149597168, "global_step": 174169, "epoch": 4146} {"train_loss": -7.086769104003906, "global_step": 174170, "epoch": 4146} {"train_loss": -7.126665115356445, "global_step": 174171, "epoch": 4146} {"train_loss": -7.1820068359375, "global_step": 174172, "epoch": 4146} {"train_loss": -7.063713073730469, "global_step": 174173, "epoch": 4146, "val_loss": 68898.9921875} {"train_loss": -7.085200309753418, "global_step": 174174, "epoch": 4147} {"train_loss": -7.0274810791015625, "global_step": 174175, "epoch": 4147} {"train_loss": -6.868207931518555, "global_step": 174176, "epoch": 4147} {"train_loss": -7.030874252319336, "global_step": 174177, "epoch": 4147} {"train_loss": -7.145258903503418, "global_step": 174178, "epoch": 4147} {"train_loss": -6.977617263793945, "global_step": 174179, "epoch": 4147} {"train_loss": -7.031036853790283, "global_step": 174180, "epoch": 4147} {"train_loss": -6.958088397979736, "global_step": 174181, "epoch": 4147} {"train_loss": -7.1522603034973145, "global_step": 174182, "epoch": 4147} {"train_loss": -7.146431922912598, "global_step": 174183, "epoch": 4147} {"train_loss": -6.955514907836914, "global_step": 174184, "epoch": 4147} {"train_loss": -7.082849502563477, "global_step": 174185, "epoch": 4147} {"train_loss": -7.09982967376709, "global_step": 174186, "epoch": 4147} {"train_loss": -6.885125160217285, "global_step": 174187, "epoch": 4147} {"train_loss": -7.133296966552734, "global_step": 174188, "epoch": 4147} {"train_loss": -6.977563858032227, "global_step": 174189, "epoch": 4147} {"train_loss": -6.931073188781738, "global_step": 174190, "epoch": 4147} {"train_loss": -7.0413055419921875, "global_step": 174191, "epoch": 4147} {"train_loss": -6.898293495178223, "global_step": 174192, "epoch": 4147} {"train_loss": -7.028486728668213, "global_step": 174193, "epoch": 4147} {"train_loss": -7.003697395324707, "global_step": 174194, "epoch": 4147} {"train_loss": -6.987113952636719, "global_step": 174195, "epoch": 4147} {"train_loss": -6.988747596740723, "global_step": 174196, "epoch": 4147} {"train_loss": -6.9491190910339355, "global_step": 174197, "epoch": 4147} {"train_loss": -6.897887229919434, "global_step": 174198, "epoch": 4147} {"train_loss": -7.082923412322998, "global_step": 174199, "epoch": 4147} {"train_loss": -6.9211506843566895, "global_step": 174200, "epoch": 4147} {"train_loss": -7.074836730957031, "global_step": 174201, "epoch": 4147} {"train_loss": -7.120361804962158, "global_step": 174202, "epoch": 4147} {"train_loss": -7.035084247589111, "global_step": 174203, "epoch": 4147} {"train_loss": -7.015904426574707, "global_step": 174204, "epoch": 4147} {"train_loss": -7.0765862464904785, "global_step": 174205, "epoch": 4147} {"train_loss": -7.0488433837890625, "global_step": 174206, "epoch": 4147} {"train_loss": -7.078217506408691, "global_step": 174207, "epoch": 4147} {"train_loss": -7.068977355957031, "global_step": 174208, "epoch": 4147} {"train_loss": -7.136474609375, "global_step": 174209, "epoch": 4147} {"train_loss": -7.107912540435791, "global_step": 174210, "epoch": 4147} {"train_loss": -7.141641616821289, "global_step": 174211, "epoch": 4147} {"train_loss": -7.051487445831299, "global_step": 174212, "epoch": 4147} {"train_loss": -7.129137992858887, "global_step": 174213, "epoch": 4147} {"train_loss": -7.035450458526611, "global_step": 174214, "epoch": 4147} {"train_loss": -7.031509842191424, "global_step": 174215, "epoch": 4147, "val_loss": 69031.5859375} {"train_loss": -7.140348434448242, "global_step": 174216, "epoch": 4148} {"train_loss": -7.0589752197265625, "global_step": 174217, "epoch": 4148} {"train_loss": -7.089338302612305, "global_step": 174218, "epoch": 4148} {"train_loss": -7.071739196777344, "global_step": 174219, "epoch": 4148} {"train_loss": -7.057453155517578, "global_step": 174220, "epoch": 4148} {"train_loss": -7.165938377380371, "global_step": 174221, "epoch": 4148} {"train_loss": -7.065127372741699, "global_step": 174222, "epoch": 4148} {"train_loss": -7.104518413543701, "global_step": 174223, "epoch": 4148} {"train_loss": -6.979193687438965, "global_step": 174224, "epoch": 4148} {"train_loss": -7.121640682220459, "global_step": 174225, "epoch": 4148} {"train_loss": -7.088627815246582, "global_step": 174226, "epoch": 4148} {"train_loss": -7.061223983764648, "global_step": 174227, "epoch": 4148} {"train_loss": -7.1893086433410645, "global_step": 174228, "epoch": 4148} {"train_loss": -7.114880561828613, "global_step": 174229, "epoch": 4148} {"train_loss": -7.044571876525879, "global_step": 174230, "epoch": 4148} {"train_loss": -7.229962348937988, "global_step": 174231, "epoch": 4148} {"train_loss": -7.137941360473633, "global_step": 174232, "epoch": 4148} {"train_loss": -7.056633949279785, "global_step": 174233, "epoch": 4148} {"train_loss": -7.17592716217041, "global_step": 174234, "epoch": 4148} {"train_loss": -7.02742338180542, "global_step": 174235, "epoch": 4148} {"train_loss": -7.134215354919434, "global_step": 174236, "epoch": 4148} {"train_loss": -7.1468682289123535, "global_step": 174237, "epoch": 4148} {"train_loss": -7.119552135467529, "global_step": 174238, "epoch": 4148} {"train_loss": -7.057158470153809, "global_step": 174239, "epoch": 4148} {"train_loss": -7.003145217895508, "global_step": 174240, "epoch": 4148} {"train_loss": -7.054826736450195, "global_step": 174241, "epoch": 4148} {"train_loss": -7.117514610290527, "global_step": 174242, "epoch": 4148} {"train_loss": -7.021679878234863, "global_step": 174243, "epoch": 4148} {"train_loss": -6.913830757141113, "global_step": 174244, "epoch": 4148} {"train_loss": -7.079824924468994, "global_step": 174245, "epoch": 4148} {"train_loss": -7.020069122314453, "global_step": 174246, "epoch": 4148} {"train_loss": -7.011980056762695, "global_step": 174247, "epoch": 4148} {"train_loss": -7.073001861572266, "global_step": 174248, "epoch": 4148} {"train_loss": -6.938141822814941, "global_step": 174249, "epoch": 4148} {"train_loss": -7.1008758544921875, "global_step": 174250, "epoch": 4148} {"train_loss": -7.094363212585449, "global_step": 174251, "epoch": 4148} {"train_loss": -7.028187274932861, "global_step": 174252, "epoch": 4148} {"train_loss": -7.032353401184082, "global_step": 174253, "epoch": 4148} {"train_loss": -7.072937965393066, "global_step": 174254, "epoch": 4148} {"train_loss": -7.024465560913086, "global_step": 174255, "epoch": 4148} {"train_loss": -6.883695602416992, "global_step": 174256, "epoch": 4148} {"train_loss": -7.069320031574795, "global_step": 174257, "epoch": 4148, "val_loss": 69084.2421875} {"train_loss": -6.9638495445251465, "global_step": 174258, "epoch": 4149} {"train_loss": -6.957979202270508, "global_step": 174259, "epoch": 4149} {"train_loss": -6.913904190063477, "global_step": 174260, "epoch": 4149} {"train_loss": -7.099725246429443, "global_step": 174261, "epoch": 4149} {"train_loss": -6.960738182067871, "global_step": 174262, "epoch": 4149} {"train_loss": -6.859546184539795, "global_step": 174263, "epoch": 4149} {"train_loss": -6.903408527374268, "global_step": 174264, "epoch": 4149} {"train_loss": -7.002300262451172, "global_step": 174265, "epoch": 4149} {"train_loss": -6.975214958190918, "global_step": 174266, "epoch": 4149} {"train_loss": -6.955533981323242, "global_step": 174267, "epoch": 4149} {"train_loss": -6.872769355773926, "global_step": 174268, "epoch": 4149} {"train_loss": -6.962146759033203, "global_step": 174269, "epoch": 4149} {"train_loss": -6.964210510253906, "global_step": 174270, "epoch": 4149} {"train_loss": -7.010617733001709, "global_step": 174271, "epoch": 4149} {"train_loss": -6.954534530639648, "global_step": 174272, "epoch": 4149} {"train_loss": -7.054638862609863, "global_step": 174273, "epoch": 4149} {"train_loss": -7.027098655700684, "global_step": 174274, "epoch": 4149} {"train_loss": -6.9842705726623535, "global_step": 174275, "epoch": 4149} {"train_loss": -7.122065544128418, "global_step": 174276, "epoch": 4149} {"train_loss": -6.941365718841553, "global_step": 174277, "epoch": 4149} {"train_loss": -7.015224456787109, "global_step": 174278, "epoch": 4149} {"train_loss": -7.030297756195068, "global_step": 174279, "epoch": 4149} {"train_loss": -6.947162628173828, "global_step": 174280, "epoch": 4149} {"train_loss": -7.1226067543029785, "global_step": 174281, "epoch": 4149} {"train_loss": -6.889958381652832, "global_step": 174282, "epoch": 4149} {"train_loss": -6.936850547790527, "global_step": 174283, "epoch": 4149} {"train_loss": -7.049752235412598, "global_step": 174284, "epoch": 4149} {"train_loss": -6.98263692855835, "global_step": 174285, "epoch": 4149} {"train_loss": -6.979430675506592, "global_step": 174286, "epoch": 4149} {"train_loss": -7.001513481140137, "global_step": 174287, "epoch": 4149} {"train_loss": -7.048259735107422, "global_step": 174288, "epoch": 4149} {"train_loss": -7.086836814880371, "global_step": 174289, "epoch": 4149} {"train_loss": -7.132250785827637, "global_step": 174290, "epoch": 4149} {"train_loss": -7.107421875, "global_step": 174291, "epoch": 4149} {"train_loss": -7.054160118103027, "global_step": 174292, "epoch": 4149} {"train_loss": -7.161770820617676, "global_step": 174293, "epoch": 4149} {"train_loss": -7.032304763793945, "global_step": 174294, "epoch": 4149} {"train_loss": -7.125705242156982, "global_step": 174295, "epoch": 4149} {"train_loss": -7.062547206878662, "global_step": 174296, "epoch": 4149} {"train_loss": -7.071486473083496, "global_step": 174297, "epoch": 4149} {"train_loss": -7.123225688934326, "global_step": 174298, "epoch": 4149} {"train_loss": -7.0122348581041605, "global_step": 174299, "epoch": 4149, "val_loss": 69007.6796875} {"train_loss": -7.014272212982178, "global_step": 174300, "epoch": 4150} {"train_loss": -7.070770263671875, "global_step": 174301, "epoch": 4150} {"train_loss": -7.072347640991211, "global_step": 174302, "epoch": 4150} {"train_loss": -7.051183700561523, "global_step": 174303, "epoch": 4150} {"train_loss": -7.029960632324219, "global_step": 174304, "epoch": 4150} {"train_loss": -7.195955753326416, "global_step": 174305, "epoch": 4150} {"train_loss": -7.082257270812988, "global_step": 174306, "epoch": 4150} {"train_loss": -7.037481784820557, "global_step": 174307, "epoch": 4150} {"train_loss": -7.065268516540527, "global_step": 174308, "epoch": 4150} {"train_loss": -7.123346328735352, "global_step": 174309, "epoch": 4150} {"train_loss": -7.096778392791748, "global_step": 174310, "epoch": 4150} {"train_loss": -7.112957954406738, "global_step": 174311, "epoch": 4150} {"train_loss": -6.984129905700684, "global_step": 174312, "epoch": 4150} {"train_loss": -7.112959384918213, "global_step": 174313, "epoch": 4150} {"train_loss": -7.148581504821777, "global_step": 174314, "epoch": 4150} {"train_loss": -7.091952323913574, "global_step": 174315, "epoch": 4150} {"train_loss": -7.104730129241943, "global_step": 174316, "epoch": 4150} {"train_loss": -7.085732460021973, "global_step": 174317, "epoch": 4150} {"train_loss": -6.984807968139648, "global_step": 174318, "epoch": 4150} {"train_loss": -7.097654819488525, "global_step": 174319, "epoch": 4150} {"train_loss": -7.060548782348633, "global_step": 174320, "epoch": 4150} {"train_loss": -6.978376388549805, "global_step": 174321, "epoch": 4150} {"train_loss": -7.197617530822754, "global_step": 174322, "epoch": 4150} {"train_loss": -7.016095161437988, "global_step": 174323, "epoch": 4150} {"train_loss": -7.101378440856934, "global_step": 174324, "epoch": 4150} {"train_loss": -7.116117477416992, "global_step": 174325, "epoch": 4150} {"train_loss": -7.025162696838379, "global_step": 174326, "epoch": 4150} {"train_loss": -7.038299083709717, "global_step": 174327, "epoch": 4150} {"train_loss": -6.97631311416626, "global_step": 174328, "epoch": 4150} {"train_loss": -7.094291687011719, "global_step": 174329, "epoch": 4150} {"train_loss": -7.017584800720215, "global_step": 174330, "epoch": 4150} {"train_loss": -7.045714378356934, "global_step": 174331, "epoch": 4150} {"train_loss": -7.068264007568359, "global_step": 174332, "epoch": 4150} {"train_loss": -7.025693416595459, "global_step": 174333, "epoch": 4150} {"train_loss": -7.084317684173584, "global_step": 174334, "epoch": 4150} {"train_loss": -7.133145332336426, "global_step": 174335, "epoch": 4150} {"train_loss": -7.002359390258789, "global_step": 174336, "epoch": 4150} {"train_loss": -6.987786293029785, "global_step": 174337, "epoch": 4150} {"train_loss": -7.078400611877441, "global_step": 174338, "epoch": 4150} {"train_loss": -7.13704776763916, "global_step": 174339, "epoch": 4150} {"train_loss": -7.062475681304932, "global_step": 174340, "epoch": 4150} {"train_loss": -7.06946587562561, "global_step": 174341, "epoch": 4150, "train/sim_max_reward_0": 0.8807393747569187, "train/sim_max_reward_1": 0.7315243086749588, "train/sim_max_reward_2": 0.7001831313045589, "train/sim_max_reward_3": 0.9787318589333264, "train/sim_max_reward_4": 0.9833798744496318, "train/sim_max_reward_5": 0.8970335548800277, "test/sim_max_reward_4300000": 0.7278928025662756, "test/sim_max_reward_4300001": 0.4371280578888722, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9575516380111684, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3244690568127945, "test/sim_max_reward_4300008": 1.0, "test/sim_max_reward_4300009": 0.8768711909198965, "test/sim_max_reward_4300010": 1.0, "test/sim_max_reward_4300011": 0.6429097707082946, "test/sim_max_reward_4300012": 0.8636934190129772, "test/sim_max_reward_4300013": 0.8787300832555626, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9848627769871144, "test/sim_max_reward_4300016": 1.0, "test/sim_max_reward_4300017": 0.9100429429112393, "test/sim_max_reward_4300018": 0.40295692867257793, "test/sim_max_reward_4300019": 0.1860273389921517, "test/sim_max_reward_4300020": 0.004934028119203437, "test/sim_max_reward_4300021": 0.9917137141835184, "test/sim_max_reward_4300022": 0.9652263780148689, "test/sim_max_reward_4300023": 0.7350209828406821, "test/sim_max_reward_4300024": 1.0, "test/sim_max_reward_4300025": 0.9843194909138253, "test/sim_max_reward_4300026": 0.08310898186605874, "test/sim_max_reward_4300027": 0.9246993276968289, "test/sim_max_reward_4300028": 0.08294085715828702, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.2931891041623217, "test/sim_max_reward_4300031": 0.6446661403519546, "test/sim_max_reward_4300032": 0.947853617212256, "test/sim_max_reward_4300033": 1.0, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.9411440759995696, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.8769004388296946, "test/sim_max_reward_4300038": 0.5748328517132888, "test/sim_max_reward_4300039": 0.8027435915763204, "test/sim_max_reward_4300040": 0.7671845712235609, "test/sim_max_reward_4300041": 0.9066218050172095, "test/sim_max_reward_4300042": 0.477105117553513, "test/sim_max_reward_4300043": 0.01912165197990456, "test/sim_max_reward_4300044": 0.915487044878626, "test/sim_max_reward_4300045": 0.17831221852617676, "test/sim_max_reward_4300046": 0.16069392896571805, "test/sim_max_reward_4300047": 0.20179867315030212, "test/sim_max_reward_4300048": 0.8430239156809284, "test/sim_max_reward_4300049": 0.2551944876741402, "train/mean_score": 0.8619320171665703, "test/mean_score": 0.6197200244480089, "val_loss": 69211.703125} {"train_loss": -6.9452643394470215, "global_step": 174342, "epoch": 4151} {"train_loss": -7.0744428634643555, "global_step": 174343, "epoch": 4151} {"train_loss": -7.1089982986450195, "global_step": 174344, "epoch": 4151} {"train_loss": -7.110832214355469, "global_step": 174345, "epoch": 4151} {"train_loss": -7.0029802322387695, "global_step": 174346, "epoch": 4151} {"train_loss": -7.0617570877075195, "global_step": 174347, "epoch": 4151} {"train_loss": -6.9896135330200195, "global_step": 174348, "epoch": 4151} {"train_loss": -7.092857837677002, "global_step": 174349, "epoch": 4151} {"train_loss": -7.0737104415893555, "global_step": 174350, "epoch": 4151} {"train_loss": -7.147397041320801, "global_step": 174351, "epoch": 4151} {"train_loss": -7.125632286071777, "global_step": 174352, "epoch": 4151} {"train_loss": -7.0516886711120605, "global_step": 174353, "epoch": 4151} {"train_loss": -7.0371928215026855, "global_step": 174354, "epoch": 4151} {"train_loss": -6.926793098449707, "global_step": 174355, "epoch": 4151} {"train_loss": -7.06480073928833, "global_step": 174356, "epoch": 4151} {"train_loss": -6.901808738708496, "global_step": 174357, "epoch": 4151} {"train_loss": -6.954014778137207, "global_step": 174358, "epoch": 4151} {"train_loss": -6.964731216430664, "global_step": 174359, "epoch": 4151} {"train_loss": -6.985207557678223, "global_step": 174360, "epoch": 4151} {"train_loss": -6.994373321533203, "global_step": 174361, "epoch": 4151} {"train_loss": -6.980874061584473, "global_step": 174362, "epoch": 4151} {"train_loss": -7.017395496368408, "global_step": 174363, "epoch": 4151} {"train_loss": -7.043068885803223, "global_step": 174364, "epoch": 4151} {"train_loss": -7.00295352935791, "global_step": 174365, "epoch": 4151} {"train_loss": -7.052960395812988, "global_step": 174366, "epoch": 4151} {"train_loss": -7.027697563171387, "global_step": 174367, "epoch": 4151} {"train_loss": -7.002419471740723, "global_step": 174368, "epoch": 4151} {"train_loss": -7.083000183105469, "global_step": 174369, "epoch": 4151} {"train_loss": -7.072283744812012, "global_step": 174370, "epoch": 4151} {"train_loss": -7.052746295928955, "global_step": 174371, "epoch": 4151} {"train_loss": -7.012629508972168, "global_step": 174372, "epoch": 4151} {"train_loss": -6.99885368347168, "global_step": 174373, "epoch": 4151} {"train_loss": -7.034521102905273, "global_step": 174374, "epoch": 4151} {"train_loss": -6.909677028656006, "global_step": 174375, "epoch": 4151} {"train_loss": -7.054900646209717, "global_step": 174376, "epoch": 4151} {"train_loss": -7.123390197753906, "global_step": 174377, "epoch": 4151} {"train_loss": -7.043577671051025, "global_step": 174378, "epoch": 4151} {"train_loss": -7.080131530761719, "global_step": 174379, "epoch": 4151} {"train_loss": -7.074073791503906, "global_step": 174380, "epoch": 4151} {"train_loss": -7.168705463409424, "global_step": 174381, "epoch": 4151} {"train_loss": -7.084001064300537, "global_step": 174382, "epoch": 4151} {"train_loss": -7.037488721665882, "global_step": 174383, "epoch": 4151, "val_loss": 69224.578125} {"train_loss": -7.158371925354004, "global_step": 174384, "epoch": 4152} {"train_loss": -7.0290327072143555, "global_step": 174385, "epoch": 4152} {"train_loss": -7.156824111938477, "global_step": 174386, "epoch": 4152} {"train_loss": -7.012542724609375, "global_step": 174387, "epoch": 4152} {"train_loss": -7.061121940612793, "global_step": 174388, "epoch": 4152} {"train_loss": -7.1195502281188965, "global_step": 174389, "epoch": 4152} {"train_loss": -7.086719512939453, "global_step": 174390, "epoch": 4152} {"train_loss": -7.088052749633789, "global_step": 174391, "epoch": 4152} {"train_loss": -7.11934757232666, "global_step": 174392, "epoch": 4152} {"train_loss": -7.037474632263184, "global_step": 174393, "epoch": 4152} {"train_loss": -7.093960762023926, "global_step": 174394, "epoch": 4152} {"train_loss": -7.072658538818359, "global_step": 174395, "epoch": 4152} {"train_loss": -6.948371410369873, "global_step": 174396, "epoch": 4152} {"train_loss": -6.93860387802124, "global_step": 174397, "epoch": 4152} {"train_loss": -7.096901893615723, "global_step": 174398, "epoch": 4152} {"train_loss": -7.061466217041016, "global_step": 174399, "epoch": 4152} {"train_loss": -6.968494415283203, "global_step": 174400, "epoch": 4152} {"train_loss": -7.084805011749268, "global_step": 174401, "epoch": 4152} {"train_loss": -6.998111248016357, "global_step": 174402, "epoch": 4152} {"train_loss": -7.064383029937744, "global_step": 174403, "epoch": 4152} {"train_loss": -7.0054426193237305, "global_step": 174404, "epoch": 4152} {"train_loss": -6.963034629821777, "global_step": 174405, "epoch": 4152} {"train_loss": -7.076803207397461, "global_step": 174406, "epoch": 4152} {"train_loss": -7.032690525054932, "global_step": 174407, "epoch": 4152} {"train_loss": -7.042959213256836, "global_step": 174408, "epoch": 4152} {"train_loss": -7.082045078277588, "global_step": 174409, "epoch": 4152} {"train_loss": -7.003498077392578, "global_step": 174410, "epoch": 4152} {"train_loss": -7.090246200561523, "global_step": 174411, "epoch": 4152} {"train_loss": -7.0176544189453125, "global_step": 174412, "epoch": 4152} {"train_loss": -7.062900543212891, "global_step": 174413, "epoch": 4152} {"train_loss": -7.1090006828308105, "global_step": 174414, "epoch": 4152} {"train_loss": -6.991293907165527, "global_step": 174415, "epoch": 4152} {"train_loss": -6.999591827392578, "global_step": 174416, "epoch": 4152} {"train_loss": -7.022112846374512, "global_step": 174417, "epoch": 4152} {"train_loss": -6.99456262588501, "global_step": 174418, "epoch": 4152} {"train_loss": -6.994738578796387, "global_step": 174419, "epoch": 4152} {"train_loss": -6.995535850524902, "global_step": 174420, "epoch": 4152} {"train_loss": -7.102394104003906, "global_step": 174421, "epoch": 4152} {"train_loss": -7.036601543426514, "global_step": 174422, "epoch": 4152} {"train_loss": -7.0072808265686035, "global_step": 174423, "epoch": 4152} {"train_loss": -7.1148295402526855, "global_step": 174424, "epoch": 4152} {"train_loss": -7.046342293421428, "global_step": 174425, "epoch": 4152, "val_loss": 69149.765625} {"train_loss": -7.063048839569092, "global_step": 174426, "epoch": 4153} {"train_loss": -7.034520626068115, "global_step": 174427, "epoch": 4153} {"train_loss": -7.022096633911133, "global_step": 174428, "epoch": 4153} {"train_loss": -7.198373794555664, "global_step": 174429, "epoch": 4153} {"train_loss": -7.0179667472839355, "global_step": 174430, "epoch": 4153} {"train_loss": -7.074682235717773, "global_step": 174431, "epoch": 4153} {"train_loss": -7.045968055725098, "global_step": 174432, "epoch": 4153} {"train_loss": -7.079493045806885, "global_step": 174433, "epoch": 4153} {"train_loss": -7.042635917663574, "global_step": 174434, "epoch": 4153} {"train_loss": -7.116564750671387, "global_step": 174435, "epoch": 4153} {"train_loss": -7.031038761138916, "global_step": 174436, "epoch": 4153} {"train_loss": -7.067836761474609, "global_step": 174437, "epoch": 4153} {"train_loss": -7.065267562866211, "global_step": 174438, "epoch": 4153} {"train_loss": -7.0612921714782715, "global_step": 174439, "epoch": 4153} {"train_loss": -7.122217178344727, "global_step": 174440, "epoch": 4153} {"train_loss": -7.090612411499023, "global_step": 174441, "epoch": 4153} {"train_loss": -7.063220024108887, "global_step": 174442, "epoch": 4153} {"train_loss": -7.068037033081055, "global_step": 174443, "epoch": 4153} {"train_loss": -7.033034324645996, "global_step": 174444, "epoch": 4153} {"train_loss": -7.181563377380371, "global_step": 174445, "epoch": 4153} {"train_loss": -7.0674519538879395, "global_step": 174446, "epoch": 4153} {"train_loss": -7.1354217529296875, "global_step": 174447, "epoch": 4153} {"train_loss": -7.085454940795898, "global_step": 174448, "epoch": 4153} {"train_loss": -7.134570121765137, "global_step": 174449, "epoch": 4153} {"train_loss": -7.138687610626221, "global_step": 174450, "epoch": 4153} {"train_loss": -7.022371768951416, "global_step": 174451, "epoch": 4153} {"train_loss": -7.198553085327148, "global_step": 174452, "epoch": 4153} {"train_loss": -7.006613254547119, "global_step": 174453, "epoch": 4153} {"train_loss": -7.04947566986084, "global_step": 174454, "epoch": 4153} {"train_loss": -6.960958957672119, "global_step": 174455, "epoch": 4153} {"train_loss": -7.1242995262146, "global_step": 174456, "epoch": 4153} {"train_loss": -7.06129264831543, "global_step": 174457, "epoch": 4153} {"train_loss": -7.117470741271973, "global_step": 174458, "epoch": 4153} {"train_loss": -7.124055862426758, "global_step": 174459, "epoch": 4153} {"train_loss": -6.992895603179932, "global_step": 174460, "epoch": 4153} {"train_loss": -7.14335298538208, "global_step": 174461, "epoch": 4153} {"train_loss": -6.972901344299316, "global_step": 174462, "epoch": 4153} {"train_loss": -7.0183539390563965, "global_step": 174463, "epoch": 4153} {"train_loss": -7.095760345458984, "global_step": 174464, "epoch": 4153} {"train_loss": -7.0447235107421875, "global_step": 174465, "epoch": 4153} {"train_loss": -7.129005432128906, "global_step": 174466, "epoch": 4153} {"train_loss": -7.076407546088809, "global_step": 174467, "epoch": 4153, "val_loss": 69001.9375} {"train_loss": -7.049682140350342, "global_step": 174468, "epoch": 4154} {"train_loss": -7.088863372802734, "global_step": 174469, "epoch": 4154} {"train_loss": -7.086185455322266, "global_step": 174470, "epoch": 4154} {"train_loss": -7.022339820861816, "global_step": 174471, "epoch": 4154} {"train_loss": -7.1326446533203125, "global_step": 174472, "epoch": 4154} {"train_loss": -7.058934211730957, "global_step": 174473, "epoch": 4154} {"train_loss": -6.874311447143555, "global_step": 174474, "epoch": 4154} {"train_loss": -7.136685371398926, "global_step": 174475, "epoch": 4154} {"train_loss": -6.999181270599365, "global_step": 174476, "epoch": 4154} {"train_loss": -7.029173374176025, "global_step": 174477, "epoch": 4154} {"train_loss": -7.115470886230469, "global_step": 174478, "epoch": 4154} {"train_loss": -7.050063610076904, "global_step": 174479, "epoch": 4154} {"train_loss": -6.941477298736572, "global_step": 174480, "epoch": 4154} {"train_loss": -7.004639625549316, "global_step": 174481, "epoch": 4154} {"train_loss": -7.011261940002441, "global_step": 174482, "epoch": 4154} {"train_loss": -7.082029342651367, "global_step": 174483, "epoch": 4154} {"train_loss": -7.048381328582764, "global_step": 174484, "epoch": 4154} {"train_loss": -7.044861793518066, "global_step": 174485, "epoch": 4154} {"train_loss": -7.053902626037598, "global_step": 174486, "epoch": 4154} {"train_loss": -6.985048294067383, "global_step": 174487, "epoch": 4154} {"train_loss": -7.11583948135376, "global_step": 174488, "epoch": 4154} {"train_loss": -7.034201145172119, "global_step": 174489, "epoch": 4154} {"train_loss": -6.990528106689453, "global_step": 174490, "epoch": 4154} {"train_loss": -7.09419584274292, "global_step": 174491, "epoch": 4154} {"train_loss": -6.963692665100098, "global_step": 174492, "epoch": 4154} {"train_loss": -6.935545921325684, "global_step": 174493, "epoch": 4154} {"train_loss": -6.982409954071045, "global_step": 174494, "epoch": 4154} {"train_loss": -7.017765045166016, "global_step": 174495, "epoch": 4154} {"train_loss": -6.884398460388184, "global_step": 174496, "epoch": 4154} {"train_loss": -6.973553657531738, "global_step": 174497, "epoch": 4154} {"train_loss": -6.902841567993164, "global_step": 174498, "epoch": 4154} {"train_loss": -6.900753021240234, "global_step": 174499, "epoch": 4154} {"train_loss": -6.920285224914551, "global_step": 174500, "epoch": 4154} {"train_loss": -6.884113311767578, "global_step": 174501, "epoch": 4154} {"train_loss": -7.048615455627441, "global_step": 174502, "epoch": 4154} {"train_loss": -6.911325454711914, "global_step": 174503, "epoch": 4154} {"train_loss": -6.935130596160889, "global_step": 174504, "epoch": 4154} {"train_loss": -6.980515480041504, "global_step": 174505, "epoch": 4154} {"train_loss": -6.913302421569824, "global_step": 174506, "epoch": 4154} {"train_loss": -7.020226001739502, "global_step": 174507, "epoch": 4154} {"train_loss": -7.000051975250244, "global_step": 174508, "epoch": 4154} {"train_loss": -7.006960880188715, "global_step": 174509, "epoch": 4154, "val_loss": 69181.1875} {"train_loss": -7.057937145233154, "global_step": 174510, "epoch": 4155} {"train_loss": -6.923259735107422, "global_step": 174511, "epoch": 4155} {"train_loss": -7.062536239624023, "global_step": 174512, "epoch": 4155} {"train_loss": -7.060702800750732, "global_step": 174513, "epoch": 4155} {"train_loss": -6.987572193145752, "global_step": 174514, "epoch": 4155} {"train_loss": -6.977331161499023, "global_step": 174515, "epoch": 4155} {"train_loss": -6.873686790466309, "global_step": 174516, "epoch": 4155} {"train_loss": -7.106194972991943, "global_step": 174517, "epoch": 4155} {"train_loss": -7.053310394287109, "global_step": 174518, "epoch": 4155} {"train_loss": -7.003631591796875, "global_step": 174519, "epoch": 4155} {"train_loss": -7.061951637268066, "global_step": 174520, "epoch": 4155} {"train_loss": -6.98662805557251, "global_step": 174521, "epoch": 4155} {"train_loss": -7.030877590179443, "global_step": 174522, "epoch": 4155} {"train_loss": -7.022757530212402, "global_step": 174523, "epoch": 4155} {"train_loss": -7.0256476402282715, "global_step": 174524, "epoch": 4155} {"train_loss": -7.012208461761475, "global_step": 174525, "epoch": 4155} {"train_loss": -6.943441390991211, "global_step": 174526, "epoch": 4155} {"train_loss": -7.102301120758057, "global_step": 174527, "epoch": 4155} {"train_loss": -6.914650917053223, "global_step": 174528, "epoch": 4155} {"train_loss": -7.021633148193359, "global_step": 174529, "epoch": 4155} {"train_loss": -7.018951416015625, "global_step": 174530, "epoch": 4155} {"train_loss": -6.92467737197876, "global_step": 174531, "epoch": 4155} {"train_loss": -6.977376461029053, "global_step": 174532, "epoch": 4155} {"train_loss": -7.090909004211426, "global_step": 174533, "epoch": 4155} {"train_loss": -7.077103614807129, "global_step": 174534, "epoch": 4155} {"train_loss": -6.971826553344727, "global_step": 174535, "epoch": 4155} {"train_loss": -7.165520668029785, "global_step": 174536, "epoch": 4155} {"train_loss": -6.9936981201171875, "global_step": 174537, "epoch": 4155} {"train_loss": -7.0534234046936035, "global_step": 174538, "epoch": 4155} {"train_loss": -7.159234046936035, "global_step": 174539, "epoch": 4155} {"train_loss": -6.8887038230896, "global_step": 174540, "epoch": 4155} {"train_loss": -7.109749794006348, "global_step": 174541, "epoch": 4155} {"train_loss": -6.973012924194336, "global_step": 174542, "epoch": 4155} {"train_loss": -6.92470645904541, "global_step": 174543, "epoch": 4155} {"train_loss": -7.085178375244141, "global_step": 174544, "epoch": 4155} {"train_loss": -6.877773761749268, "global_step": 174545, "epoch": 4155} {"train_loss": -7.143815517425537, "global_step": 174546, "epoch": 4155} {"train_loss": -6.914623737335205, "global_step": 174547, "epoch": 4155} {"train_loss": -6.974931716918945, "global_step": 174548, "epoch": 4155} {"train_loss": -7.101920127868652, "global_step": 174549, "epoch": 4155} {"train_loss": -7.008774757385254, "global_step": 174550, "epoch": 4155} {"train_loss": -7.017183599017915, "global_step": 174551, "epoch": 4155, "val_loss": 69246.328125} {"train_loss": -7.1028337478637695, "global_step": 174552, "epoch": 4156} {"train_loss": -7.123786926269531, "global_step": 174553, "epoch": 4156} {"train_loss": -7.071797847747803, "global_step": 174554, "epoch": 4156} {"train_loss": -7.108743190765381, "global_step": 174555, "epoch": 4156} {"train_loss": -7.093774795532227, "global_step": 174556, "epoch": 4156} {"train_loss": -7.057414531707764, "global_step": 174557, "epoch": 4156} {"train_loss": -7.021684169769287, "global_step": 174558, "epoch": 4156} {"train_loss": -7.124058723449707, "global_step": 174559, "epoch": 4156} {"train_loss": -7.099714279174805, "global_step": 174560, "epoch": 4156} {"train_loss": -7.096449375152588, "global_step": 174561, "epoch": 4156} {"train_loss": -7.059142589569092, "global_step": 174562, "epoch": 4156} {"train_loss": -6.997492790222168, "global_step": 174563, "epoch": 4156} {"train_loss": -7.082757949829102, "global_step": 174564, "epoch": 4156} {"train_loss": -7.119643211364746, "global_step": 174565, "epoch": 4156} {"train_loss": -7.035408020019531, "global_step": 174566, "epoch": 4156} {"train_loss": -7.124458312988281, "global_step": 174567, "epoch": 4156} {"train_loss": -6.971643447875977, "global_step": 174568, "epoch": 4156} {"train_loss": -7.12696647644043, "global_step": 174569, "epoch": 4156} {"train_loss": -6.966989994049072, "global_step": 174570, "epoch": 4156} {"train_loss": -6.962869167327881, "global_step": 174571, "epoch": 4156} {"train_loss": -6.945258617401123, "global_step": 174572, "epoch": 4156} {"train_loss": -7.032909870147705, "global_step": 174573, "epoch": 4156} {"train_loss": -6.972376346588135, "global_step": 174574, "epoch": 4156} {"train_loss": -7.009045124053955, "global_step": 174575, "epoch": 4156} {"train_loss": -7.203510761260986, "global_step": 174576, "epoch": 4156} {"train_loss": -7.032909870147705, "global_step": 174577, "epoch": 4156} {"train_loss": -6.904943466186523, "global_step": 174578, "epoch": 4156} {"train_loss": -7.053732872009277, "global_step": 174579, "epoch": 4156} {"train_loss": -6.997775554656982, "global_step": 174580, "epoch": 4156} {"train_loss": -6.97737979888916, "global_step": 174581, "epoch": 4156} {"train_loss": -6.982446193695068, "global_step": 174582, "epoch": 4156} {"train_loss": -6.928592681884766, "global_step": 174583, "epoch": 4156} {"train_loss": -7.132716178894043, "global_step": 174584, "epoch": 4156} {"train_loss": -6.905143737792969, "global_step": 174585, "epoch": 4156} {"train_loss": -6.902835845947266, "global_step": 174586, "epoch": 4156} {"train_loss": -7.037761688232422, "global_step": 174587, "epoch": 4156} {"train_loss": -6.917080879211426, "global_step": 174588, "epoch": 4156} {"train_loss": -7.078142166137695, "global_step": 174589, "epoch": 4156} {"train_loss": -6.946989059448242, "global_step": 174590, "epoch": 4156} {"train_loss": -7.030051231384277, "global_step": 174591, "epoch": 4156} {"train_loss": -7.069435119628906, "global_step": 174592, "epoch": 4156} {"train_loss": -7.033218020484561, "global_step": 174593, "epoch": 4156, "val_loss": 69218.078125} {"train_loss": -7.144391059875488, "global_step": 174594, "epoch": 4157} {"train_loss": -6.977519989013672, "global_step": 174595, "epoch": 4157} {"train_loss": -7.171628952026367, "global_step": 174596, "epoch": 4157} {"train_loss": -7.06646728515625, "global_step": 174597, "epoch": 4157} {"train_loss": -7.09159517288208, "global_step": 174598, "epoch": 4157} {"train_loss": -7.197111129760742, "global_step": 174599, "epoch": 4157} {"train_loss": -7.025208473205566, "global_step": 174600, "epoch": 4157} {"train_loss": -7.140563011169434, "global_step": 174601, "epoch": 4157} {"train_loss": -7.076666355133057, "global_step": 174602, "epoch": 4157} {"train_loss": -7.0751166343688965, "global_step": 174603, "epoch": 4157} {"train_loss": -7.1176862716674805, "global_step": 174604, "epoch": 4157} {"train_loss": -7.155814170837402, "global_step": 174605, "epoch": 4157} {"train_loss": -7.020132064819336, "global_step": 174606, "epoch": 4157} {"train_loss": -7.045939922332764, "global_step": 174607, "epoch": 4157} {"train_loss": -7.102969169616699, "global_step": 174608, "epoch": 4157} {"train_loss": -7.1033172607421875, "global_step": 174609, "epoch": 4157} {"train_loss": -7.023128509521484, "global_step": 174610, "epoch": 4157} {"train_loss": -7.142929553985596, "global_step": 174611, "epoch": 4157} {"train_loss": -7.104279518127441, "global_step": 174612, "epoch": 4157} {"train_loss": -7.098352432250977, "global_step": 174613, "epoch": 4157} {"train_loss": -7.097203254699707, "global_step": 174614, "epoch": 4157} {"train_loss": -7.007605075836182, "global_step": 174615, "epoch": 4157} {"train_loss": -7.0651421546936035, "global_step": 174616, "epoch": 4157} {"train_loss": -7.090186595916748, "global_step": 174617, "epoch": 4157} {"train_loss": -7.088670253753662, "global_step": 174618, "epoch": 4157} {"train_loss": -6.95897912979126, "global_step": 174619, "epoch": 4157} {"train_loss": -7.079489707946777, "global_step": 174620, "epoch": 4157} {"train_loss": -7.2463603019714355, "global_step": 174621, "epoch": 4157} {"train_loss": -7.018016815185547, "global_step": 174622, "epoch": 4157} {"train_loss": -6.986777305603027, "global_step": 174623, "epoch": 4157} {"train_loss": -7.121592998504639, "global_step": 174624, "epoch": 4157} {"train_loss": -7.066271781921387, "global_step": 174625, "epoch": 4157} {"train_loss": -7.067105293273926, "global_step": 174626, "epoch": 4157} {"train_loss": -7.1397552490234375, "global_step": 174627, "epoch": 4157} {"train_loss": -7.102710247039795, "global_step": 174628, "epoch": 4157} {"train_loss": -7.084444046020508, "global_step": 174629, "epoch": 4157} {"train_loss": -6.940369129180908, "global_step": 174630, "epoch": 4157} {"train_loss": -7.12209415435791, "global_step": 174631, "epoch": 4157} {"train_loss": -7.1200714111328125, "global_step": 174632, "epoch": 4157} {"train_loss": -6.998068809509277, "global_step": 174633, "epoch": 4157} {"train_loss": -7.109944820404053, "global_step": 174634, "epoch": 4157} {"train_loss": -7.081909191040766, "global_step": 174635, "epoch": 4157, "val_loss": 69144.59375} {"train_loss": -7.067480087280273, "global_step": 174636, "epoch": 4158} {"train_loss": -7.161861419677734, "global_step": 174637, "epoch": 4158} {"train_loss": -7.052661895751953, "global_step": 174638, "epoch": 4158} {"train_loss": -7.022019863128662, "global_step": 174639, "epoch": 4158} {"train_loss": -7.056927680969238, "global_step": 174640, "epoch": 4158} {"train_loss": -6.954032897949219, "global_step": 174641, "epoch": 4158} {"train_loss": -6.984380722045898, "global_step": 174642, "epoch": 4158} {"train_loss": -7.170483112335205, "global_step": 174643, "epoch": 4158} {"train_loss": -7.023064613342285, "global_step": 174644, "epoch": 4158} {"train_loss": -7.076490879058838, "global_step": 174645, "epoch": 4158} {"train_loss": -7.059587478637695, "global_step": 174646, "epoch": 4158} {"train_loss": -7.01253080368042, "global_step": 174647, "epoch": 4158} {"train_loss": -6.9637346267700195, "global_step": 174648, "epoch": 4158} {"train_loss": -6.858285903930664, "global_step": 174649, "epoch": 4158} {"train_loss": -7.006333827972412, "global_step": 174650, "epoch": 4158} {"train_loss": -7.117165565490723, "global_step": 174651, "epoch": 4158} {"train_loss": -6.840730667114258, "global_step": 174652, "epoch": 4158} {"train_loss": -7.067440509796143, "global_step": 174653, "epoch": 4158} {"train_loss": -7.006662368774414, "global_step": 174654, "epoch": 4158} {"train_loss": -6.936578750610352, "global_step": 174655, "epoch": 4158} {"train_loss": -7.098112106323242, "global_step": 174656, "epoch": 4158} {"train_loss": -7.062232971191406, "global_step": 174657, "epoch": 4158} {"train_loss": -7.020071029663086, "global_step": 174658, "epoch": 4158} {"train_loss": -7.074490547180176, "global_step": 174659, "epoch": 4158} {"train_loss": -6.964097023010254, "global_step": 174660, "epoch": 4158} {"train_loss": -6.931628227233887, "global_step": 174661, "epoch": 4158} {"train_loss": -7.0333404541015625, "global_step": 174662, "epoch": 4158} {"train_loss": -6.969452857971191, "global_step": 174663, "epoch": 4158} {"train_loss": -7.06074333190918, "global_step": 174664, "epoch": 4158} {"train_loss": -6.957892417907715, "global_step": 174665, "epoch": 4158} {"train_loss": -7.071523666381836, "global_step": 174666, "epoch": 4158} {"train_loss": -6.962571144104004, "global_step": 174667, "epoch": 4158} {"train_loss": -7.025730133056641, "global_step": 174668, "epoch": 4158} {"train_loss": -7.014287948608398, "global_step": 174669, "epoch": 4158} {"train_loss": -7.031826019287109, "global_step": 174670, "epoch": 4158} {"train_loss": -7.11125373840332, "global_step": 174671, "epoch": 4158} {"train_loss": -7.041864395141602, "global_step": 174672, "epoch": 4158} {"train_loss": -7.027735710144043, "global_step": 174673, "epoch": 4158} {"train_loss": -6.992972373962402, "global_step": 174674, "epoch": 4158} {"train_loss": -7.194451332092285, "global_step": 174675, "epoch": 4158} {"train_loss": -7.078229904174805, "global_step": 174676, "epoch": 4158} {"train_loss": -7.029903911408924, "global_step": 174677, "epoch": 4158, "val_loss": 69031.515625} {"train_loss": -7.1350250244140625, "global_step": 174678, "epoch": 4159} {"train_loss": -7.106910705566406, "global_step": 174679, "epoch": 4159} {"train_loss": -7.145465850830078, "global_step": 174680, "epoch": 4159} {"train_loss": -6.996898174285889, "global_step": 174681, "epoch": 4159} {"train_loss": -7.152219295501709, "global_step": 174682, "epoch": 4159} {"train_loss": -7.094365119934082, "global_step": 174683, "epoch": 4159} {"train_loss": -7.09930419921875, "global_step": 174684, "epoch": 4159} {"train_loss": -7.140929222106934, "global_step": 174685, "epoch": 4159} {"train_loss": -7.109458923339844, "global_step": 174686, "epoch": 4159} {"train_loss": -7.015730381011963, "global_step": 174687, "epoch": 4159} {"train_loss": -7.102273941040039, "global_step": 174688, "epoch": 4159} {"train_loss": -6.991950035095215, "global_step": 174689, "epoch": 4159} {"train_loss": -7.0391740798950195, "global_step": 174690, "epoch": 4159} {"train_loss": -7.025581359863281, "global_step": 174691, "epoch": 4159} {"train_loss": -6.992372512817383, "global_step": 174692, "epoch": 4159} {"train_loss": -7.173814296722412, "global_step": 174693, "epoch": 4159} {"train_loss": -7.019713401794434, "global_step": 174694, "epoch": 4159} {"train_loss": -7.029354095458984, "global_step": 174695, "epoch": 4159} {"train_loss": -7.077915668487549, "global_step": 174696, "epoch": 4159} {"train_loss": -6.959555625915527, "global_step": 174697, "epoch": 4159} {"train_loss": -7.095429420471191, "global_step": 174698, "epoch": 4159} {"train_loss": -7.197360992431641, "global_step": 174699, "epoch": 4159} {"train_loss": -7.029502868652344, "global_step": 174700, "epoch": 4159} {"train_loss": -6.961916923522949, "global_step": 174701, "epoch": 4159} {"train_loss": -6.963713645935059, "global_step": 174702, "epoch": 4159} {"train_loss": -7.015693664550781, "global_step": 174703, "epoch": 4159} {"train_loss": -7.0043158531188965, "global_step": 174704, "epoch": 4159} {"train_loss": -6.931182861328125, "global_step": 174705, "epoch": 4159} {"train_loss": -7.130180358886719, "global_step": 174706, "epoch": 4159} {"train_loss": -7.008315086364746, "global_step": 174707, "epoch": 4159} {"train_loss": -7.160922050476074, "global_step": 174708, "epoch": 4159} {"train_loss": -7.0692243576049805, "global_step": 174709, "epoch": 4159} {"train_loss": -7.059288024902344, "global_step": 174710, "epoch": 4159} {"train_loss": -7.04304313659668, "global_step": 174711, "epoch": 4159} {"train_loss": -7.020484447479248, "global_step": 174712, "epoch": 4159} {"train_loss": -7.173096656799316, "global_step": 174713, "epoch": 4159} {"train_loss": -7.089297294616699, "global_step": 174714, "epoch": 4159} {"train_loss": -7.182825565338135, "global_step": 174715, "epoch": 4159} {"train_loss": -7.197187900543213, "global_step": 174716, "epoch": 4159} {"train_loss": -7.111815452575684, "global_step": 174717, "epoch": 4159} {"train_loss": -7.216391563415527, "global_step": 174718, "epoch": 4159} {"train_loss": -7.076527618226551, "global_step": 174719, "epoch": 4159, "val_loss": 68961.3828125} {"train_loss": -7.164335250854492, "global_step": 174720, "epoch": 4160} {"train_loss": -7.196295261383057, "global_step": 174721, "epoch": 4160} {"train_loss": -7.13964319229126, "global_step": 174722, "epoch": 4160} {"train_loss": -7.139946460723877, "global_step": 174723, "epoch": 4160} {"train_loss": -7.161342620849609, "global_step": 174724, "epoch": 4160} {"train_loss": -7.267430782318115, "global_step": 174725, "epoch": 4160} {"train_loss": -7.112415313720703, "global_step": 174726, "epoch": 4160} {"train_loss": -7.069361686706543, "global_step": 174727, "epoch": 4160} {"train_loss": -7.0884480476379395, "global_step": 174728, "epoch": 4160} {"train_loss": -7.186758518218994, "global_step": 174729, "epoch": 4160} {"train_loss": -7.129312515258789, "global_step": 174730, "epoch": 4160} {"train_loss": -7.0237016677856445, "global_step": 174731, "epoch": 4160} {"train_loss": -7.203115463256836, "global_step": 174732, "epoch": 4160} {"train_loss": -7.084880352020264, "global_step": 174733, "epoch": 4160} {"train_loss": -7.1036458015441895, "global_step": 174734, "epoch": 4160} {"train_loss": -7.028783798217773, "global_step": 174735, "epoch": 4160} {"train_loss": -7.072579383850098, "global_step": 174736, "epoch": 4160} {"train_loss": -7.047677516937256, "global_step": 174737, "epoch": 4160} {"train_loss": -7.059307098388672, "global_step": 174738, "epoch": 4160} {"train_loss": -7.1244354248046875, "global_step": 174739, "epoch": 4160} {"train_loss": -7.2473673820495605, "global_step": 174740, "epoch": 4160} {"train_loss": -7.038139820098877, "global_step": 174741, "epoch": 4160} {"train_loss": -7.010962963104248, "global_step": 174742, "epoch": 4160} {"train_loss": -7.065962791442871, "global_step": 174743, "epoch": 4160} {"train_loss": -7.033693313598633, "global_step": 174744, "epoch": 4160} {"train_loss": -7.071974754333496, "global_step": 174745, "epoch": 4160} {"train_loss": -7.14711332321167, "global_step": 174746, "epoch": 4160} {"train_loss": -7.013077259063721, "global_step": 174747, "epoch": 4160} {"train_loss": -7.115983963012695, "global_step": 174748, "epoch": 4160} {"train_loss": -7.081340789794922, "global_step": 174749, "epoch": 4160} {"train_loss": -6.93882942199707, "global_step": 174750, "epoch": 4160} {"train_loss": -7.07141637802124, "global_step": 174751, "epoch": 4160} {"train_loss": -6.93749475479126, "global_step": 174752, "epoch": 4160} {"train_loss": -7.028443336486816, "global_step": 174753, "epoch": 4160} {"train_loss": -7.029562950134277, "global_step": 174754, "epoch": 4160} {"train_loss": -7.015997886657715, "global_step": 174755, "epoch": 4160} {"train_loss": -7.056036949157715, "global_step": 174756, "epoch": 4160} {"train_loss": -6.937629699707031, "global_step": 174757, "epoch": 4160} {"train_loss": -7.0038628578186035, "global_step": 174758, "epoch": 4160} {"train_loss": -6.970671653747559, "global_step": 174759, "epoch": 4160} {"train_loss": -6.799655437469482, "global_step": 174760, "epoch": 4160} {"train_loss": -7.073219219843547, "global_step": 174761, "epoch": 4160, "val_loss": 69275.140625} {"train_loss": -6.852566242218018, "global_step": 174762, "epoch": 4161} {"train_loss": -7.020213603973389, "global_step": 174763, "epoch": 4161} {"train_loss": -6.964264869689941, "global_step": 174764, "epoch": 4161} {"train_loss": -7.041960716247559, "global_step": 174765, "epoch": 4161} {"train_loss": -7.055302619934082, "global_step": 174766, "epoch": 4161} {"train_loss": -7.103127956390381, "global_step": 174767, "epoch": 4161} {"train_loss": -6.97803258895874, "global_step": 174768, "epoch": 4161} {"train_loss": -6.98626708984375, "global_step": 174769, "epoch": 4161} {"train_loss": -6.969383239746094, "global_step": 174770, "epoch": 4161} {"train_loss": -6.951491355895996, "global_step": 174771, "epoch": 4161} {"train_loss": -7.086467742919922, "global_step": 174772, "epoch": 4161} {"train_loss": -7.001955986022949, "global_step": 174773, "epoch": 4161} {"train_loss": -7.074172019958496, "global_step": 174774, "epoch": 4161} {"train_loss": -6.960564613342285, "global_step": 174775, "epoch": 4161} {"train_loss": -7.148756980895996, "global_step": 174776, "epoch": 4161} {"train_loss": -7.022917747497559, "global_step": 174777, "epoch": 4161} {"train_loss": -7.142083168029785, "global_step": 174778, "epoch": 4161} {"train_loss": -7.024231910705566, "global_step": 174779, "epoch": 4161} {"train_loss": -7.060703277587891, "global_step": 174780, "epoch": 4161} {"train_loss": -6.984797954559326, "global_step": 174781, "epoch": 4161} {"train_loss": -6.974968910217285, "global_step": 174782, "epoch": 4161} {"train_loss": -7.0871076583862305, "global_step": 174783, "epoch": 4161} {"train_loss": -7.008050441741943, "global_step": 174784, "epoch": 4161} {"train_loss": -6.9717912673950195, "global_step": 174785, "epoch": 4161} {"train_loss": -7.048988342285156, "global_step": 174786, "epoch": 4161} {"train_loss": -7.099544525146484, "global_step": 174787, "epoch": 4161} {"train_loss": -7.038970470428467, "global_step": 174788, "epoch": 4161} {"train_loss": -6.947329521179199, "global_step": 174789, "epoch": 4161} {"train_loss": -7.140177249908447, "global_step": 174790, "epoch": 4161} {"train_loss": -6.977083683013916, "global_step": 174791, "epoch": 4161} {"train_loss": -6.971898078918457, "global_step": 174792, "epoch": 4161} {"train_loss": -7.166053295135498, "global_step": 174793, "epoch": 4161} {"train_loss": -7.109188079833984, "global_step": 174794, "epoch": 4161} {"train_loss": -7.031896591186523, "global_step": 174795, "epoch": 4161} {"train_loss": -6.960519790649414, "global_step": 174796, "epoch": 4161} {"train_loss": -6.889646530151367, "global_step": 174797, "epoch": 4161} {"train_loss": -7.099782943725586, "global_step": 174798, "epoch": 4161} {"train_loss": -6.858581066131592, "global_step": 174799, "epoch": 4161} {"train_loss": -6.890446662902832, "global_step": 174800, "epoch": 4161} {"train_loss": -7.015854358673096, "global_step": 174801, "epoch": 4161} {"train_loss": -6.986452102661133, "global_step": 174802, "epoch": 4161} {"train_loss": -7.016363813763573, "global_step": 174803, "epoch": 4161, "val_loss": 69202.109375} {"train_loss": -6.708826065063477, "global_step": 174804, "epoch": 4162} {"train_loss": -6.8906965255737305, "global_step": 174805, "epoch": 4162} {"train_loss": -6.885016441345215, "global_step": 174806, "epoch": 4162} {"train_loss": -7.022845268249512, "global_step": 174807, "epoch": 4162} {"train_loss": -6.95781946182251, "global_step": 174808, "epoch": 4162} {"train_loss": -7.046647071838379, "global_step": 174809, "epoch": 4162} {"train_loss": -7.008345603942871, "global_step": 174810, "epoch": 4162} {"train_loss": -6.928078651428223, "global_step": 174811, "epoch": 4162} {"train_loss": -6.959106922149658, "global_step": 174812, "epoch": 4162} {"train_loss": -7.025974273681641, "global_step": 174813, "epoch": 4162} {"train_loss": -6.891022682189941, "global_step": 174814, "epoch": 4162} {"train_loss": -6.929586410522461, "global_step": 174815, "epoch": 4162} {"train_loss": -7.012993812561035, "global_step": 174816, "epoch": 4162} {"train_loss": -6.887975215911865, "global_step": 174817, "epoch": 4162} {"train_loss": -7.006402969360352, "global_step": 174818, "epoch": 4162} {"train_loss": -6.872602462768555, "global_step": 174819, "epoch": 4162} {"train_loss": -7.050230026245117, "global_step": 174820, "epoch": 4162} {"train_loss": -7.053313255310059, "global_step": 174821, "epoch": 4162} {"train_loss": -7.050598621368408, "global_step": 174822, "epoch": 4162} {"train_loss": -7.013318061828613, "global_step": 174823, "epoch": 4162} {"train_loss": -7.1256866455078125, "global_step": 174824, "epoch": 4162} {"train_loss": -6.820635795593262, "global_step": 174825, "epoch": 4162} {"train_loss": -6.978092193603516, "global_step": 174826, "epoch": 4162} {"train_loss": -6.88324499130249, "global_step": 174827, "epoch": 4162} {"train_loss": -6.925227642059326, "global_step": 174828, "epoch": 4162} {"train_loss": -6.933411598205566, "global_step": 174829, "epoch": 4162} {"train_loss": -6.89801025390625, "global_step": 174830, "epoch": 4162} {"train_loss": -7.154130458831787, "global_step": 174831, "epoch": 4162} {"train_loss": -6.8527607917785645, "global_step": 174832, "epoch": 4162} {"train_loss": -7.187124729156494, "global_step": 174833, "epoch": 4162} {"train_loss": -6.920269966125488, "global_step": 174834, "epoch": 4162} {"train_loss": -7.02994441986084, "global_step": 174835, "epoch": 4162} {"train_loss": -6.962101459503174, "global_step": 174836, "epoch": 4162} {"train_loss": -7.036314964294434, "global_step": 174837, "epoch": 4162} {"train_loss": -6.945294380187988, "global_step": 174838, "epoch": 4162} {"train_loss": -7.127750396728516, "global_step": 174839, "epoch": 4162} {"train_loss": -6.864686012268066, "global_step": 174840, "epoch": 4162} {"train_loss": -6.985126495361328, "global_step": 174841, "epoch": 4162} {"train_loss": -6.833808898925781, "global_step": 174842, "epoch": 4162} {"train_loss": -6.883092880249023, "global_step": 174843, "epoch": 4162} {"train_loss": -6.961339950561523, "global_step": 174844, "epoch": 4162} {"train_loss": -6.961969477789743, "global_step": 174845, "epoch": 4162, "val_loss": 69204.515625} {"train_loss": -6.983165740966797, "global_step": 174846, "epoch": 4163} {"train_loss": -6.998932838439941, "global_step": 174847, "epoch": 4163} {"train_loss": -6.960906982421875, "global_step": 174848, "epoch": 4163} {"train_loss": -6.944161415100098, "global_step": 174849, "epoch": 4163} {"train_loss": -6.908676624298096, "global_step": 174850, "epoch": 4163} {"train_loss": -6.996424198150635, "global_step": 174851, "epoch": 4163} {"train_loss": -7.054707050323486, "global_step": 174852, "epoch": 4163} {"train_loss": -7.046999931335449, "global_step": 174853, "epoch": 4163} {"train_loss": -7.153402328491211, "global_step": 174854, "epoch": 4163} {"train_loss": -7.031447410583496, "global_step": 174855, "epoch": 4163} {"train_loss": -7.064682960510254, "global_step": 174856, "epoch": 4163} {"train_loss": -7.089371204376221, "global_step": 174857, "epoch": 4163} {"train_loss": -6.992459297180176, "global_step": 174858, "epoch": 4163} {"train_loss": -7.197847366333008, "global_step": 174859, "epoch": 4163} {"train_loss": -7.172933578491211, "global_step": 174860, "epoch": 4163} {"train_loss": -7.075175762176514, "global_step": 174861, "epoch": 4163} {"train_loss": -6.994194507598877, "global_step": 174862, "epoch": 4163} {"train_loss": -7.033111572265625, "global_step": 174863, "epoch": 4163} {"train_loss": -7.043128490447998, "global_step": 174864, "epoch": 4163} {"train_loss": -7.021995544433594, "global_step": 174865, "epoch": 4163} {"train_loss": -7.101681709289551, "global_step": 174866, "epoch": 4163} {"train_loss": -7.021836280822754, "global_step": 174867, "epoch": 4163} {"train_loss": -6.938759803771973, "global_step": 174868, "epoch": 4163} {"train_loss": -7.024169921875, "global_step": 174869, "epoch": 4163} {"train_loss": -6.869717597961426, "global_step": 174870, "epoch": 4163} {"train_loss": -7.0017194747924805, "global_step": 174871, "epoch": 4163} {"train_loss": -7.075666904449463, "global_step": 174872, "epoch": 4163} {"train_loss": -6.872005462646484, "global_step": 174873, "epoch": 4163} {"train_loss": -7.045042991638184, "global_step": 174874, "epoch": 4163} {"train_loss": -7.131641387939453, "global_step": 174875, "epoch": 4163} {"train_loss": -7.00777530670166, "global_step": 174876, "epoch": 4163} {"train_loss": -6.9314680099487305, "global_step": 174877, "epoch": 4163} {"train_loss": -7.062450408935547, "global_step": 174878, "epoch": 4163} {"train_loss": -7.065998077392578, "global_step": 174879, "epoch": 4163} {"train_loss": -7.019301414489746, "global_step": 174880, "epoch": 4163} {"train_loss": -7.08349084854126, "global_step": 174881, "epoch": 4163} {"train_loss": -6.952567100524902, "global_step": 174882, "epoch": 4163} {"train_loss": -7.101626396179199, "global_step": 174883, "epoch": 4163} {"train_loss": -7.014422416687012, "global_step": 174884, "epoch": 4163} {"train_loss": -6.951434135437012, "global_step": 174885, "epoch": 4163} {"train_loss": -6.950738906860352, "global_step": 174886, "epoch": 4163} {"train_loss": -7.023646286555699, "global_step": 174887, "epoch": 4163, "val_loss": 68887.75} {"train_loss": -7.074689865112305, "global_step": 174888, "epoch": 4164} {"train_loss": -7.037234306335449, "global_step": 174889, "epoch": 4164} {"train_loss": -7.162300109863281, "global_step": 174890, "epoch": 4164} {"train_loss": -7.065263748168945, "global_step": 174891, "epoch": 4164} {"train_loss": -7.071202278137207, "global_step": 174892, "epoch": 4164} {"train_loss": -7.157114028930664, "global_step": 174893, "epoch": 4164} {"train_loss": -7.176349639892578, "global_step": 174894, "epoch": 4164} {"train_loss": -7.163018226623535, "global_step": 174895, "epoch": 4164} {"train_loss": -7.056992530822754, "global_step": 174896, "epoch": 4164} {"train_loss": -7.1831583976745605, "global_step": 174897, "epoch": 4164} {"train_loss": -7.019947052001953, "global_step": 174898, "epoch": 4164} {"train_loss": -7.072259902954102, "global_step": 174899, "epoch": 4164} {"train_loss": -7.092039585113525, "global_step": 174900, "epoch": 4164} {"train_loss": -7.013799667358398, "global_step": 174901, "epoch": 4164} {"train_loss": -7.0924072265625, "global_step": 174902, "epoch": 4164} {"train_loss": -7.048828601837158, "global_step": 174903, "epoch": 4164} {"train_loss": -6.979369163513184, "global_step": 174904, "epoch": 4164} {"train_loss": -7.005345821380615, "global_step": 174905, "epoch": 4164} {"train_loss": -7.0726118087768555, "global_step": 174906, "epoch": 4164} {"train_loss": -7.121609687805176, "global_step": 174907, "epoch": 4164} {"train_loss": -7.037962436676025, "global_step": 174908, "epoch": 4164} {"train_loss": -7.111225605010986, "global_step": 174909, "epoch": 4164} {"train_loss": -6.965123653411865, "global_step": 174910, "epoch": 4164} {"train_loss": -6.872183322906494, "global_step": 174911, "epoch": 4164} {"train_loss": -6.965177059173584, "global_step": 174912, "epoch": 4164} {"train_loss": -6.946623802185059, "global_step": 174913, "epoch": 4164} {"train_loss": -7.050266265869141, "global_step": 174914, "epoch": 4164} {"train_loss": -7.027830123901367, "global_step": 174915, "epoch": 4164} {"train_loss": -7.019164085388184, "global_step": 174916, "epoch": 4164} {"train_loss": -7.072107791900635, "global_step": 174917, "epoch": 4164} {"train_loss": -7.0562896728515625, "global_step": 174918, "epoch": 4164} {"train_loss": -7.046109199523926, "global_step": 174919, "epoch": 4164} {"train_loss": -7.11314058303833, "global_step": 174920, "epoch": 4164} {"train_loss": -7.0259857177734375, "global_step": 174921, "epoch": 4164} {"train_loss": -7.0749831199646, "global_step": 174922, "epoch": 4164} {"train_loss": -7.0422773361206055, "global_step": 174923, "epoch": 4164} {"train_loss": -7.059350967407227, "global_step": 174924, "epoch": 4164} {"train_loss": -7.10366678237915, "global_step": 174925, "epoch": 4164} {"train_loss": -7.012945175170898, "global_step": 174926, "epoch": 4164} {"train_loss": -7.22940731048584, "global_step": 174927, "epoch": 4164} {"train_loss": -7.070289611816406, "global_step": 174928, "epoch": 4164} {"train_loss": -7.064148130871001, "global_step": 174929, "epoch": 4164, "val_loss": 69101.265625} {"train_loss": -7.06655216217041, "global_step": 174930, "epoch": 4165} {"train_loss": -7.17933464050293, "global_step": 174931, "epoch": 4165} {"train_loss": -7.023797512054443, "global_step": 174932, "epoch": 4165} {"train_loss": -7.185133457183838, "global_step": 174933, "epoch": 4165} {"train_loss": -7.096957206726074, "global_step": 174934, "epoch": 4165} {"train_loss": -7.1649322509765625, "global_step": 174935, "epoch": 4165} {"train_loss": -7.128090858459473, "global_step": 174936, "epoch": 4165} {"train_loss": -7.191946983337402, "global_step": 174937, "epoch": 4165} {"train_loss": -7.149592399597168, "global_step": 174938, "epoch": 4165} {"train_loss": -7.12094783782959, "global_step": 174939, "epoch": 4165} {"train_loss": -7.175777435302734, "global_step": 174940, "epoch": 4165} {"train_loss": -7.021458625793457, "global_step": 174941, "epoch": 4165} {"train_loss": -7.106665134429932, "global_step": 174942, "epoch": 4165} {"train_loss": -7.052250862121582, "global_step": 174943, "epoch": 4165} {"train_loss": -7.054740905761719, "global_step": 174944, "epoch": 4165} {"train_loss": -7.201803207397461, "global_step": 174945, "epoch": 4165} {"train_loss": -7.124786376953125, "global_step": 174946, "epoch": 4165} {"train_loss": -7.181262016296387, "global_step": 174947, "epoch": 4165} {"train_loss": -7.046751976013184, "global_step": 174948, "epoch": 4165} {"train_loss": -7.19431734085083, "global_step": 174949, "epoch": 4165} {"train_loss": -7.219175338745117, "global_step": 174950, "epoch": 4165} {"train_loss": -7.196704864501953, "global_step": 174951, "epoch": 4165} {"train_loss": -7.192119598388672, "global_step": 174952, "epoch": 4165} {"train_loss": -7.071803092956543, "global_step": 174953, "epoch": 4165} {"train_loss": -7.036821365356445, "global_step": 174954, "epoch": 4165} {"train_loss": -7.073033332824707, "global_step": 174955, "epoch": 4165} {"train_loss": -7.14651346206665, "global_step": 174956, "epoch": 4165} {"train_loss": -7.120396614074707, "global_step": 174957, "epoch": 4165} {"train_loss": -7.225736618041992, "global_step": 174958, "epoch": 4165} {"train_loss": -7.057822227478027, "global_step": 174959, "epoch": 4165} {"train_loss": -7.097761154174805, "global_step": 174960, "epoch": 4165} {"train_loss": -7.092318534851074, "global_step": 174961, "epoch": 4165} {"train_loss": -7.095495700836182, "global_step": 174962, "epoch": 4165} {"train_loss": -7.119220733642578, "global_step": 174963, "epoch": 4165} {"train_loss": -6.968316078186035, "global_step": 174964, "epoch": 4165} {"train_loss": -7.09931755065918, "global_step": 174965, "epoch": 4165} {"train_loss": -7.129611015319824, "global_step": 174966, "epoch": 4165} {"train_loss": -6.963369369506836, "global_step": 174967, "epoch": 4165} {"train_loss": -7.1293253898620605, "global_step": 174968, "epoch": 4165} {"train_loss": -7.134518623352051, "global_step": 174969, "epoch": 4165} {"train_loss": -7.082592964172363, "global_step": 174970, "epoch": 4165} {"train_loss": -7.1107257434300015, "global_step": 174971, "epoch": 4165, "val_loss": 69139.0859375} {"train_loss": -6.996391296386719, "global_step": 174972, "epoch": 4166} {"train_loss": -7.101068019866943, "global_step": 174973, "epoch": 4166} {"train_loss": -6.981524467468262, "global_step": 174974, "epoch": 4166} {"train_loss": -7.009270191192627, "global_step": 174975, "epoch": 4166} {"train_loss": -7.061471462249756, "global_step": 174976, "epoch": 4166} {"train_loss": -7.013818264007568, "global_step": 174977, "epoch": 4166} {"train_loss": -7.133566856384277, "global_step": 174978, "epoch": 4166} {"train_loss": -7.084929466247559, "global_step": 174979, "epoch": 4166} {"train_loss": -7.130043983459473, "global_step": 174980, "epoch": 4166} {"train_loss": -7.026510238647461, "global_step": 174981, "epoch": 4166} {"train_loss": -7.069487571716309, "global_step": 174982, "epoch": 4166} {"train_loss": -7.074853897094727, "global_step": 174983, "epoch": 4166} {"train_loss": -7.07656717300415, "global_step": 174984, "epoch": 4166} {"train_loss": -7.051973342895508, "global_step": 174985, "epoch": 4166} {"train_loss": -7.092109680175781, "global_step": 174986, "epoch": 4166} {"train_loss": -6.952851295471191, "global_step": 174987, "epoch": 4166} {"train_loss": -7.05504846572876, "global_step": 174988, "epoch": 4166} {"train_loss": -7.083908557891846, "global_step": 174989, "epoch": 4166} {"train_loss": -7.040891647338867, "global_step": 174990, "epoch": 4166} {"train_loss": -6.980412483215332, "global_step": 174991, "epoch": 4166} {"train_loss": -6.992877960205078, "global_step": 174992, "epoch": 4166} {"train_loss": -7.085506439208984, "global_step": 174993, "epoch": 4166} {"train_loss": -7.036721229553223, "global_step": 174994, "epoch": 4166} {"train_loss": -6.9744553565979, "global_step": 174995, "epoch": 4166} {"train_loss": -7.157876968383789, "global_step": 174996, "epoch": 4166} {"train_loss": -7.169724941253662, "global_step": 174997, "epoch": 4166} {"train_loss": -7.116262912750244, "global_step": 174998, "epoch": 4166} {"train_loss": -7.168877124786377, "global_step": 174999, "epoch": 4166} {"train_loss": -7.051235675811768, "global_step": 175000, "epoch": 4166} {"train_loss": -7.037551403045654, "global_step": 175001, "epoch": 4166} {"train_loss": -7.083131790161133, "global_step": 175002, "epoch": 4166} {"train_loss": -7.049743175506592, "global_step": 175003, "epoch": 4166} {"train_loss": -7.0937700271606445, "global_step": 175004, "epoch": 4166} {"train_loss": -7.06281852722168, "global_step": 175005, "epoch": 4166} {"train_loss": -7.113205909729004, "global_step": 175006, "epoch": 4166} {"train_loss": -7.0137505531311035, "global_step": 175007, "epoch": 4166} {"train_loss": -7.073722839355469, "global_step": 175008, "epoch": 4166} {"train_loss": -7.056719779968262, "global_step": 175009, "epoch": 4166} {"train_loss": -7.0319719314575195, "global_step": 175010, "epoch": 4166} {"train_loss": -6.9465532302856445, "global_step": 175011, "epoch": 4166} {"train_loss": -7.0677642822265625, "global_step": 175012, "epoch": 4166} {"train_loss": -7.059180974960327, "global_step": 175013, "epoch": 4166, "val_loss": 69179.578125} {"train_loss": -7.1540679931640625, "global_step": 175014, "epoch": 4167} {"train_loss": -6.967178821563721, "global_step": 175015, "epoch": 4167} {"train_loss": -7.034786224365234, "global_step": 175016, "epoch": 4167} {"train_loss": -7.038722515106201, "global_step": 175017, "epoch": 4167} {"train_loss": -6.894833564758301, "global_step": 175018, "epoch": 4167} {"train_loss": -6.998993873596191, "global_step": 175019, "epoch": 4167} {"train_loss": -6.992079734802246, "global_step": 175020, "epoch": 4167} {"train_loss": -6.962018966674805, "global_step": 175021, "epoch": 4167} {"train_loss": -7.038370609283447, "global_step": 175022, "epoch": 4167} {"train_loss": -6.978744983673096, "global_step": 175023, "epoch": 4167} {"train_loss": -7.03234338760376, "global_step": 175024, "epoch": 4167} {"train_loss": -6.94722318649292, "global_step": 175025, "epoch": 4167} {"train_loss": -6.970337867736816, "global_step": 175026, "epoch": 4167} {"train_loss": -6.973541259765625, "global_step": 175027, "epoch": 4167} {"train_loss": -6.9344024658203125, "global_step": 175028, "epoch": 4167} {"train_loss": -7.154282569885254, "global_step": 175029, "epoch": 4167} {"train_loss": -7.133381366729736, "global_step": 175030, "epoch": 4167} {"train_loss": -7.070070266723633, "global_step": 175031, "epoch": 4167} {"train_loss": -7.02752685546875, "global_step": 175032, "epoch": 4167} {"train_loss": -7.031530380249023, "global_step": 175033, "epoch": 4167} {"train_loss": -7.076850891113281, "global_step": 175034, "epoch": 4167} {"train_loss": -7.056657314300537, "global_step": 175035, "epoch": 4167} {"train_loss": -7.0349931716918945, "global_step": 175036, "epoch": 4167} {"train_loss": -7.025172233581543, "global_step": 175037, "epoch": 4167} {"train_loss": -6.970547676086426, "global_step": 175038, "epoch": 4167} {"train_loss": -6.977191925048828, "global_step": 175039, "epoch": 4167} {"train_loss": -7.031724452972412, "global_step": 175040, "epoch": 4167} {"train_loss": -7.042116641998291, "global_step": 175041, "epoch": 4167} {"train_loss": -7.074310302734375, "global_step": 175042, "epoch": 4167} {"train_loss": -6.840859889984131, "global_step": 175043, "epoch": 4167} {"train_loss": -7.070433139801025, "global_step": 175044, "epoch": 4167} {"train_loss": -7.030401229858398, "global_step": 175045, "epoch": 4167} {"train_loss": -7.171176910400391, "global_step": 175046, "epoch": 4167} {"train_loss": -7.0829925537109375, "global_step": 175047, "epoch": 4167} {"train_loss": -7.028711318969727, "global_step": 175048, "epoch": 4167} {"train_loss": -7.172540664672852, "global_step": 175049, "epoch": 4167} {"train_loss": -7.136308670043945, "global_step": 175050, "epoch": 4167} {"train_loss": -7.079868316650391, "global_step": 175051, "epoch": 4167} {"train_loss": -7.143110275268555, "global_step": 175052, "epoch": 4167} {"train_loss": -7.120863914489746, "global_step": 175053, "epoch": 4167} {"train_loss": -7.0140862464904785, "global_step": 175054, "epoch": 4167} {"train_loss": -7.039428949356079, "global_step": 175055, "epoch": 4167, "val_loss": 69057.9375} {"train_loss": -7.253947734832764, "global_step": 175056, "epoch": 4168} {"train_loss": -7.0897698402404785, "global_step": 175057, "epoch": 4168} {"train_loss": -7.054195404052734, "global_step": 175058, "epoch": 4168} {"train_loss": -7.087979793548584, "global_step": 175059, "epoch": 4168} {"train_loss": -7.094755172729492, "global_step": 175060, "epoch": 4168} {"train_loss": -7.082123756408691, "global_step": 175061, "epoch": 4168} {"train_loss": -7.19407844543457, "global_step": 175062, "epoch": 4168} {"train_loss": -7.033031463623047, "global_step": 175063, "epoch": 4168} {"train_loss": -7.220525741577148, "global_step": 175064, "epoch": 4168} {"train_loss": -7.163713455200195, "global_step": 175065, "epoch": 4168} {"train_loss": -6.97389554977417, "global_step": 175066, "epoch": 4168} {"train_loss": -7.062752723693848, "global_step": 175067, "epoch": 4168} {"train_loss": -7.006557464599609, "global_step": 175068, "epoch": 4168} {"train_loss": -7.057132720947266, "global_step": 175069, "epoch": 4168} {"train_loss": -7.170139312744141, "global_step": 175070, "epoch": 4168} {"train_loss": -7.1031694412231445, "global_step": 175071, "epoch": 4168} {"train_loss": -7.084076881408691, "global_step": 175072, "epoch": 4168} {"train_loss": -7.133583068847656, "global_step": 175073, "epoch": 4168} {"train_loss": -7.093857288360596, "global_step": 175074, "epoch": 4168} {"train_loss": -7.164659023284912, "global_step": 175075, "epoch": 4168} {"train_loss": -7.0329484939575195, "global_step": 175076, "epoch": 4168} {"train_loss": -7.07667350769043, "global_step": 175077, "epoch": 4168} {"train_loss": -7.157966613769531, "global_step": 175078, "epoch": 4168} {"train_loss": -7.0628252029418945, "global_step": 175079, "epoch": 4168} {"train_loss": -7.142892837524414, "global_step": 175080, "epoch": 4168} {"train_loss": -7.2681379318237305, "global_step": 175081, "epoch": 4168} {"train_loss": -7.134944915771484, "global_step": 175082, "epoch": 4168} {"train_loss": -7.289106369018555, "global_step": 175083, "epoch": 4168} {"train_loss": -7.0947265625, "global_step": 175084, "epoch": 4168} {"train_loss": -7.126107215881348, "global_step": 175085, "epoch": 4168} {"train_loss": -7.0855817794799805, "global_step": 175086, "epoch": 4168} {"train_loss": -7.074347496032715, "global_step": 175087, "epoch": 4168} {"train_loss": -7.114346027374268, "global_step": 175088, "epoch": 4168} {"train_loss": -7.121264934539795, "global_step": 175089, "epoch": 4168} {"train_loss": -7.0969648361206055, "global_step": 175090, "epoch": 4168} {"train_loss": -7.194894790649414, "global_step": 175091, "epoch": 4168} {"train_loss": -7.0913543701171875, "global_step": 175092, "epoch": 4168} {"train_loss": -6.927463054656982, "global_step": 175093, "epoch": 4168} {"train_loss": -7.120518684387207, "global_step": 175094, "epoch": 4168} {"train_loss": -6.961134910583496, "global_step": 175095, "epoch": 4168} {"train_loss": -7.094210624694824, "global_step": 175096, "epoch": 4168} {"train_loss": -7.109183742886498, "global_step": 175097, "epoch": 4168, "val_loss": 68949.640625} {"train_loss": -7.104938983917236, "global_step": 175098, "epoch": 4169} {"train_loss": -7.026272296905518, "global_step": 175099, "epoch": 4169} {"train_loss": -7.0692877769470215, "global_step": 175100, "epoch": 4169} {"train_loss": -7.117083549499512, "global_step": 175101, "epoch": 4169} {"train_loss": -7.2585954666137695, "global_step": 175102, "epoch": 4169} {"train_loss": -7.112874984741211, "global_step": 175103, "epoch": 4169} {"train_loss": -7.181904315948486, "global_step": 175104, "epoch": 4169} {"train_loss": -7.09991455078125, "global_step": 175105, "epoch": 4169} {"train_loss": -7.087737560272217, "global_step": 175106, "epoch": 4169} {"train_loss": -7.066232681274414, "global_step": 175107, "epoch": 4169} {"train_loss": -7.070877552032471, "global_step": 175108, "epoch": 4169} {"train_loss": -7.024275779724121, "global_step": 175109, "epoch": 4169} {"train_loss": -7.061619758605957, "global_step": 175110, "epoch": 4169} {"train_loss": -7.155115127563477, "global_step": 175111, "epoch": 4169} {"train_loss": -7.011139869689941, "global_step": 175112, "epoch": 4169} {"train_loss": -7.064810752868652, "global_step": 175113, "epoch": 4169} {"train_loss": -7.1202192306518555, "global_step": 175114, "epoch": 4169} {"train_loss": -7.028292655944824, "global_step": 175115, "epoch": 4169} {"train_loss": -7.01970100402832, "global_step": 175116, "epoch": 4169} {"train_loss": -6.961874008178711, "global_step": 175117, "epoch": 4169} {"train_loss": -7.148118019104004, "global_step": 175118, "epoch": 4169} {"train_loss": -7.04202938079834, "global_step": 175119, "epoch": 4169} {"train_loss": -7.079608917236328, "global_step": 175120, "epoch": 4169} {"train_loss": -6.889240264892578, "global_step": 175121, "epoch": 4169} {"train_loss": -7.024448394775391, "global_step": 175122, "epoch": 4169} {"train_loss": -7.09095573425293, "global_step": 175123, "epoch": 4169} {"train_loss": -6.995301246643066, "global_step": 175124, "epoch": 4169} {"train_loss": -7.0963263511657715, "global_step": 175125, "epoch": 4169} {"train_loss": -7.044661521911621, "global_step": 175126, "epoch": 4169} {"train_loss": -6.984445571899414, "global_step": 175127, "epoch": 4169} {"train_loss": -6.884357452392578, "global_step": 175128, "epoch": 4169} {"train_loss": -7.016913414001465, "global_step": 175129, "epoch": 4169} {"train_loss": -7.026860237121582, "global_step": 175130, "epoch": 4169} {"train_loss": -6.984662055969238, "global_step": 175131, "epoch": 4169} {"train_loss": -6.994663715362549, "global_step": 175132, "epoch": 4169} {"train_loss": -6.8075056076049805, "global_step": 175133, "epoch": 4169} {"train_loss": -6.965996742248535, "global_step": 175134, "epoch": 4169} {"train_loss": -6.9828996658325195, "global_step": 175135, "epoch": 4169} {"train_loss": -7.0144805908203125, "global_step": 175136, "epoch": 4169} {"train_loss": -7.021718502044678, "global_step": 175137, "epoch": 4169} {"train_loss": -7.044855117797852, "global_step": 175138, "epoch": 4169} {"train_loss": -7.042153165453956, "global_step": 175139, "epoch": 4169, "val_loss": 69225.3984375} {"train_loss": -7.165747165679932, "global_step": 175140, "epoch": 4170} {"train_loss": -6.976777076721191, "global_step": 175141, "epoch": 4170} {"train_loss": -6.923130035400391, "global_step": 175142, "epoch": 4170} {"train_loss": -7.041644096374512, "global_step": 175143, "epoch": 4170} {"train_loss": -6.896556854248047, "global_step": 175144, "epoch": 4170} {"train_loss": -6.957238674163818, "global_step": 175145, "epoch": 4170} {"train_loss": -6.897516250610352, "global_step": 175146, "epoch": 4170} {"train_loss": -7.082783222198486, "global_step": 175147, "epoch": 4170} {"train_loss": -6.988455772399902, "global_step": 175148, "epoch": 4170} {"train_loss": -7.081826686859131, "global_step": 175149, "epoch": 4170} {"train_loss": -7.019887924194336, "global_step": 175150, "epoch": 4170} {"train_loss": -7.0785932540893555, "global_step": 175151, "epoch": 4170} {"train_loss": -7.046846389770508, "global_step": 175152, "epoch": 4170} {"train_loss": -7.042691707611084, "global_step": 175153, "epoch": 4170} {"train_loss": -7.1327972412109375, "global_step": 175154, "epoch": 4170} {"train_loss": -7.048974990844727, "global_step": 175155, "epoch": 4170} {"train_loss": -6.97361946105957, "global_step": 175156, "epoch": 4170} {"train_loss": -6.983800888061523, "global_step": 175157, "epoch": 4170} {"train_loss": -7.116701126098633, "global_step": 175158, "epoch": 4170} {"train_loss": -7.033881187438965, "global_step": 175159, "epoch": 4170} {"train_loss": -7.145413875579834, "global_step": 175160, "epoch": 4170} {"train_loss": -7.0911478996276855, "global_step": 175161, "epoch": 4170} {"train_loss": -7.020255088806152, "global_step": 175162, "epoch": 4170} {"train_loss": -7.058797836303711, "global_step": 175163, "epoch": 4170} {"train_loss": -7.063174247741699, "global_step": 175164, "epoch": 4170} {"train_loss": -7.0090131759643555, "global_step": 175165, "epoch": 4170} {"train_loss": -7.104640007019043, "global_step": 175166, "epoch": 4170} {"train_loss": -7.005876064300537, "global_step": 175167, "epoch": 4170} {"train_loss": -6.992303848266602, "global_step": 175168, "epoch": 4170} {"train_loss": -7.0179033279418945, "global_step": 175169, "epoch": 4170} {"train_loss": -7.09097957611084, "global_step": 175170, "epoch": 4170} {"train_loss": -7.057093620300293, "global_step": 175171, "epoch": 4170} {"train_loss": -7.038969039916992, "global_step": 175172, "epoch": 4170} {"train_loss": -7.114526748657227, "global_step": 175173, "epoch": 4170} {"train_loss": -6.990296363830566, "global_step": 175174, "epoch": 4170} {"train_loss": -7.094364643096924, "global_step": 175175, "epoch": 4170} {"train_loss": -7.033902645111084, "global_step": 175176, "epoch": 4170} {"train_loss": -7.1034440994262695, "global_step": 175177, "epoch": 4170} {"train_loss": -7.098901748657227, "global_step": 175178, "epoch": 4170} {"train_loss": -7.119978427886963, "global_step": 175179, "epoch": 4170} {"train_loss": -7.121172904968262, "global_step": 175180, "epoch": 4170} {"train_loss": -7.046843767166138, "global_step": 175181, "epoch": 4170, "val_loss": 69100.5078125} {"train_loss": -7.109177589416504, "global_step": 175182, "epoch": 4171} {"train_loss": -7.024402618408203, "global_step": 175183, "epoch": 4171} {"train_loss": -7.122003555297852, "global_step": 175184, "epoch": 4171} {"train_loss": -7.166802406311035, "global_step": 175185, "epoch": 4171} {"train_loss": -7.06242036819458, "global_step": 175186, "epoch": 4171} {"train_loss": -7.1972503662109375, "global_step": 175187, "epoch": 4171} {"train_loss": -7.173337936401367, "global_step": 175188, "epoch": 4171} {"train_loss": -7.203460693359375, "global_step": 175189, "epoch": 4171} {"train_loss": -7.105025291442871, "global_step": 175190, "epoch": 4171} {"train_loss": -7.160675048828125, "global_step": 175191, "epoch": 4171} {"train_loss": -7.091231822967529, "global_step": 175192, "epoch": 4171} {"train_loss": -7.096315383911133, "global_step": 175193, "epoch": 4171} {"train_loss": -7.144344329833984, "global_step": 175194, "epoch": 4171} {"train_loss": -7.064558029174805, "global_step": 175195, "epoch": 4171} {"train_loss": -7.182748794555664, "global_step": 175196, "epoch": 4171} {"train_loss": -7.1632232666015625, "global_step": 175197, "epoch": 4171} {"train_loss": -7.178536891937256, "global_step": 175198, "epoch": 4171} {"train_loss": -7.090709686279297, "global_step": 175199, "epoch": 4171} {"train_loss": -7.039182186126709, "global_step": 175200, "epoch": 4171} {"train_loss": -7.046113967895508, "global_step": 175201, "epoch": 4171} {"train_loss": -7.189338684082031, "global_step": 175202, "epoch": 4171} {"train_loss": -7.129230976104736, "global_step": 175203, "epoch": 4171} {"train_loss": -7.095917701721191, "global_step": 175204, "epoch": 4171} {"train_loss": -7.161155700683594, "global_step": 175205, "epoch": 4171} {"train_loss": -7.110579013824463, "global_step": 175206, "epoch": 4171} {"train_loss": -7.081901550292969, "global_step": 175207, "epoch": 4171} {"train_loss": -7.08721923828125, "global_step": 175208, "epoch": 4171} {"train_loss": -7.14250373840332, "global_step": 175209, "epoch": 4171} {"train_loss": -6.994260787963867, "global_step": 175210, "epoch": 4171} {"train_loss": -7.094333648681641, "global_step": 175211, "epoch": 4171} {"train_loss": -7.131713390350342, "global_step": 175212, "epoch": 4171} {"train_loss": -7.102893352508545, "global_step": 175213, "epoch": 4171} {"train_loss": -7.242680072784424, "global_step": 175214, "epoch": 4171} {"train_loss": -7.174505233764648, "global_step": 175215, "epoch": 4171} {"train_loss": -7.143167495727539, "global_step": 175216, "epoch": 4171} {"train_loss": -7.19450569152832, "global_step": 175217, "epoch": 4171} {"train_loss": -7.076932907104492, "global_step": 175218, "epoch": 4171} {"train_loss": -7.094038963317871, "global_step": 175219, "epoch": 4171} {"train_loss": -7.16011905670166, "global_step": 175220, "epoch": 4171} {"train_loss": -7.19596004486084, "global_step": 175221, "epoch": 4171} {"train_loss": -7.068482875823975, "global_step": 175222, "epoch": 4171} {"train_loss": -7.1229928107488725, "global_step": 175223, "epoch": 4171, "val_loss": 69081.5546875} {"train_loss": -7.103890419006348, "global_step": 175224, "epoch": 4172} {"train_loss": -7.077042579650879, "global_step": 175225, "epoch": 4172} {"train_loss": -7.135807037353516, "global_step": 175226, "epoch": 4172} {"train_loss": -7.113704681396484, "global_step": 175227, "epoch": 4172} {"train_loss": -7.064260482788086, "global_step": 175228, "epoch": 4172} {"train_loss": -7.26827335357666, "global_step": 175229, "epoch": 4172} {"train_loss": -7.054009437561035, "global_step": 175230, "epoch": 4172} {"train_loss": -7.158478736877441, "global_step": 175231, "epoch": 4172} {"train_loss": -7.123012542724609, "global_step": 175232, "epoch": 4172} {"train_loss": -7.0680317878723145, "global_step": 175233, "epoch": 4172} {"train_loss": -7.120798587799072, "global_step": 175234, "epoch": 4172} {"train_loss": -7.099806785583496, "global_step": 175235, "epoch": 4172} {"train_loss": -6.948871612548828, "global_step": 175236, "epoch": 4172} {"train_loss": -7.123135566711426, "global_step": 175237, "epoch": 4172} {"train_loss": -7.032890319824219, "global_step": 175238, "epoch": 4172} {"train_loss": -6.9414753913879395, "global_step": 175239, "epoch": 4172} {"train_loss": -7.0674543380737305, "global_step": 175240, "epoch": 4172} {"train_loss": -7.0750250816345215, "global_step": 175241, "epoch": 4172} {"train_loss": -7.040157318115234, "global_step": 175242, "epoch": 4172} {"train_loss": -7.013625621795654, "global_step": 175243, "epoch": 4172} {"train_loss": -7.021292686462402, "global_step": 175244, "epoch": 4172} {"train_loss": -6.936399459838867, "global_step": 175245, "epoch": 4172} {"train_loss": -7.039168834686279, "global_step": 175246, "epoch": 4172} {"train_loss": -6.962871551513672, "global_step": 175247, "epoch": 4172} {"train_loss": -6.9625043869018555, "global_step": 175248, "epoch": 4172} {"train_loss": -6.979666709899902, "global_step": 175249, "epoch": 4172} {"train_loss": -7.010262966156006, "global_step": 175250, "epoch": 4172} {"train_loss": -7.071990013122559, "global_step": 175251, "epoch": 4172} {"train_loss": -6.998388767242432, "global_step": 175252, "epoch": 4172} {"train_loss": -7.08198356628418, "global_step": 175253, "epoch": 4172} {"train_loss": -7.115673065185547, "global_step": 175254, "epoch": 4172} {"train_loss": -7.03953742980957, "global_step": 175255, "epoch": 4172} {"train_loss": -7.132293701171875, "global_step": 175256, "epoch": 4172} {"train_loss": -6.904106140136719, "global_step": 175257, "epoch": 4172} {"train_loss": -7.109764099121094, "global_step": 175258, "epoch": 4172} {"train_loss": -6.951731204986572, "global_step": 175259, "epoch": 4172} {"train_loss": -7.1784138679504395, "global_step": 175260, "epoch": 4172} {"train_loss": -6.986416339874268, "global_step": 175261, "epoch": 4172} {"train_loss": -7.071075439453125, "global_step": 175262, "epoch": 4172} {"train_loss": -7.050376892089844, "global_step": 175263, "epoch": 4172} {"train_loss": -7.031585693359375, "global_step": 175264, "epoch": 4172} {"train_loss": -7.056779407319569, "global_step": 175265, "epoch": 4172, "val_loss": 69052.2734375} {"train_loss": -7.213710308074951, "global_step": 175266, "epoch": 4173} {"train_loss": -7.154035568237305, "global_step": 175267, "epoch": 4173} {"train_loss": -7.058441162109375, "global_step": 175268, "epoch": 4173} {"train_loss": -7.119448661804199, "global_step": 175269, "epoch": 4173} {"train_loss": -7.071168899536133, "global_step": 175270, "epoch": 4173} {"train_loss": -6.9871931076049805, "global_step": 175271, "epoch": 4173} {"train_loss": -7.061532020568848, "global_step": 175272, "epoch": 4173} {"train_loss": -7.001090049743652, "global_step": 175273, "epoch": 4173} {"train_loss": -7.113536834716797, "global_step": 175274, "epoch": 4173} {"train_loss": -7.055603504180908, "global_step": 175275, "epoch": 4173} {"train_loss": -6.909109115600586, "global_step": 175276, "epoch": 4173} {"train_loss": -7.109817028045654, "global_step": 175277, "epoch": 4173} {"train_loss": -6.9611968994140625, "global_step": 175278, "epoch": 4173} {"train_loss": -7.032830715179443, "global_step": 175279, "epoch": 4173} {"train_loss": -7.067681312561035, "global_step": 175280, "epoch": 4173} {"train_loss": -7.007616996765137, "global_step": 175281, "epoch": 4173} {"train_loss": -7.0991997718811035, "global_step": 175282, "epoch": 4173} {"train_loss": -6.941617012023926, "global_step": 175283, "epoch": 4173} {"train_loss": -7.020577430725098, "global_step": 175284, "epoch": 4173} {"train_loss": -7.086041450500488, "global_step": 175285, "epoch": 4173} {"train_loss": -6.8977742195129395, "global_step": 175286, "epoch": 4173} {"train_loss": -7.08013916015625, "global_step": 175287, "epoch": 4173} {"train_loss": -7.049103736877441, "global_step": 175288, "epoch": 4173} {"train_loss": -7.026799201965332, "global_step": 175289, "epoch": 4173} {"train_loss": -7.018875598907471, "global_step": 175290, "epoch": 4173} {"train_loss": -6.94871711730957, "global_step": 175291, "epoch": 4173} {"train_loss": -7.183464050292969, "global_step": 175292, "epoch": 4173} {"train_loss": -6.991154670715332, "global_step": 175293, "epoch": 4173} {"train_loss": -6.973666667938232, "global_step": 175294, "epoch": 4173} {"train_loss": -7.069505214691162, "global_step": 175295, "epoch": 4173} {"train_loss": -6.804862022399902, "global_step": 175296, "epoch": 4173} {"train_loss": -7.103915691375732, "global_step": 175297, "epoch": 4173} {"train_loss": -7.0604448318481445, "global_step": 175298, "epoch": 4173} {"train_loss": -7.007389068603516, "global_step": 175299, "epoch": 4173} {"train_loss": -7.095344543457031, "global_step": 175300, "epoch": 4173} {"train_loss": -6.985210418701172, "global_step": 175301, "epoch": 4173} {"train_loss": -6.979617595672607, "global_step": 175302, "epoch": 4173} {"train_loss": -7.067790985107422, "global_step": 175303, "epoch": 4173} {"train_loss": -6.8200178146362305, "global_step": 175304, "epoch": 4173} {"train_loss": -7.116554260253906, "global_step": 175305, "epoch": 4173} {"train_loss": -7.136602401733398, "global_step": 175306, "epoch": 4173} {"train_loss": -7.036543778010777, "global_step": 175307, "epoch": 4173, "val_loss": 69091.3515625} {"train_loss": -7.161151885986328, "global_step": 175308, "epoch": 4174} {"train_loss": -7.030097007751465, "global_step": 175309, "epoch": 4174} {"train_loss": -7.096283912658691, "global_step": 175310, "epoch": 4174} {"train_loss": -7.12686824798584, "global_step": 175311, "epoch": 4174} {"train_loss": -7.085865020751953, "global_step": 175312, "epoch": 4174} {"train_loss": -7.105035305023193, "global_step": 175313, "epoch": 4174} {"train_loss": -6.946897506713867, "global_step": 175314, "epoch": 4174} {"train_loss": -7.134995460510254, "global_step": 175315, "epoch": 4174} {"train_loss": -7.028044700622559, "global_step": 175316, "epoch": 4174} {"train_loss": -6.895768642425537, "global_step": 175317, "epoch": 4174} {"train_loss": -7.052889823913574, "global_step": 175318, "epoch": 4174} {"train_loss": -6.870216369628906, "global_step": 175319, "epoch": 4174} {"train_loss": -7.048859596252441, "global_step": 175320, "epoch": 4174} {"train_loss": -6.967540740966797, "global_step": 175321, "epoch": 4174} {"train_loss": -6.8561110496521, "global_step": 175322, "epoch": 4174} {"train_loss": -7.014957427978516, "global_step": 175323, "epoch": 4174} {"train_loss": -6.757491111755371, "global_step": 175324, "epoch": 4174} {"train_loss": -6.96480655670166, "global_step": 175325, "epoch": 4174} {"train_loss": -6.64501953125, "global_step": 175326, "epoch": 4174} {"train_loss": -6.893765449523926, "global_step": 175327, "epoch": 4174} {"train_loss": -6.862168312072754, "global_step": 175328, "epoch": 4174} {"train_loss": -6.864264488220215, "global_step": 175329, "epoch": 4174} {"train_loss": -6.908836364746094, "global_step": 175330, "epoch": 4174} {"train_loss": -6.88071346282959, "global_step": 175331, "epoch": 4174} {"train_loss": -7.043200969696045, "global_step": 175332, "epoch": 4174} {"train_loss": -6.889794826507568, "global_step": 175333, "epoch": 4174} {"train_loss": -6.985560417175293, "global_step": 175334, "epoch": 4174} {"train_loss": -7.000797271728516, "global_step": 175335, "epoch": 4174} {"train_loss": -6.91169548034668, "global_step": 175336, "epoch": 4174} {"train_loss": -6.878295421600342, "global_step": 175337, "epoch": 4174} {"train_loss": -7.035519123077393, "global_step": 175338, "epoch": 4174} {"train_loss": -6.935652732849121, "global_step": 175339, "epoch": 4174} {"train_loss": -7.0162200927734375, "global_step": 175340, "epoch": 4174} {"train_loss": -6.872108459472656, "global_step": 175341, "epoch": 4174} {"train_loss": -7.015997409820557, "global_step": 175342, "epoch": 4174} {"train_loss": -6.895223617553711, "global_step": 175343, "epoch": 4174} {"train_loss": -6.979122638702393, "global_step": 175344, "epoch": 4174} {"train_loss": -6.998172283172607, "global_step": 175345, "epoch": 4174} {"train_loss": -6.944944381713867, "global_step": 175346, "epoch": 4174} {"train_loss": -6.963736534118652, "global_step": 175347, "epoch": 4174} {"train_loss": -7.070908069610596, "global_step": 175348, "epoch": 4174} {"train_loss": -6.966649418785458, "global_step": 175349, "epoch": 4174, "val_loss": 69120.28125} {"train_loss": -7.040244102478027, "global_step": 175350, "epoch": 4175} {"train_loss": -6.953939437866211, "global_step": 175351, "epoch": 4175} {"train_loss": -7.053804397583008, "global_step": 175352, "epoch": 4175} {"train_loss": -7.083266258239746, "global_step": 175353, "epoch": 4175} {"train_loss": -7.199095726013184, "global_step": 175354, "epoch": 4175} {"train_loss": -7.138980865478516, "global_step": 175355, "epoch": 4175} {"train_loss": -6.968986511230469, "global_step": 175356, "epoch": 4175} {"train_loss": -7.0705485343933105, "global_step": 175357, "epoch": 4175} {"train_loss": -7.128354072570801, "global_step": 175358, "epoch": 4175} {"train_loss": -7.056541442871094, "global_step": 175359, "epoch": 4175} {"train_loss": -7.087413311004639, "global_step": 175360, "epoch": 4175} {"train_loss": -7.0448808670043945, "global_step": 175361, "epoch": 4175} {"train_loss": -7.0827813148498535, "global_step": 175362, "epoch": 4175} {"train_loss": -7.100069999694824, "global_step": 175363, "epoch": 4175} {"train_loss": -7.156210899353027, "global_step": 175364, "epoch": 4175} {"train_loss": -7.0374040603637695, "global_step": 175365, "epoch": 4175} {"train_loss": -7.059689044952393, "global_step": 175366, "epoch": 4175} {"train_loss": -7.047496318817139, "global_step": 175367, "epoch": 4175} {"train_loss": -6.994719505310059, "global_step": 175368, "epoch": 4175} {"train_loss": -7.05739164352417, "global_step": 175369, "epoch": 4175} {"train_loss": -7.102110862731934, "global_step": 175370, "epoch": 4175} {"train_loss": -6.972119331359863, "global_step": 175371, "epoch": 4175} {"train_loss": -7.0372700691223145, "global_step": 175372, "epoch": 4175} {"train_loss": -7.03065299987793, "global_step": 175373, "epoch": 4175} {"train_loss": -7.0577392578125, "global_step": 175374, "epoch": 4175} {"train_loss": -7.140089988708496, "global_step": 175375, "epoch": 4175} {"train_loss": -7.106432914733887, "global_step": 175376, "epoch": 4175} {"train_loss": -7.135441303253174, "global_step": 175377, "epoch": 4175} {"train_loss": -7.184135437011719, "global_step": 175378, "epoch": 4175} {"train_loss": -7.076542377471924, "global_step": 175379, "epoch": 4175} {"train_loss": -7.09751033782959, "global_step": 175380, "epoch": 4175} {"train_loss": -6.976585388183594, "global_step": 175381, "epoch": 4175} {"train_loss": -7.133759021759033, "global_step": 175382, "epoch": 4175} {"train_loss": -7.056719779968262, "global_step": 175383, "epoch": 4175} {"train_loss": -7.174936294555664, "global_step": 175384, "epoch": 4175} {"train_loss": -7.183671474456787, "global_step": 175385, "epoch": 4175} {"train_loss": -7.031316757202148, "global_step": 175386, "epoch": 4175} {"train_loss": -7.136926651000977, "global_step": 175387, "epoch": 4175} {"train_loss": -7.265066146850586, "global_step": 175388, "epoch": 4175} {"train_loss": -7.185711860656738, "global_step": 175389, "epoch": 4175} {"train_loss": -7.112507343292236, "global_step": 175390, "epoch": 4175} {"train_loss": -7.086852754865374, "global_step": 175391, "epoch": 4175, "val_loss": 69225.8671875} {"train_loss": -7.221917152404785, "global_step": 175392, "epoch": 4176} {"train_loss": -7.169012069702148, "global_step": 175393, "epoch": 4176} {"train_loss": -7.028703212738037, "global_step": 175394, "epoch": 4176} {"train_loss": -7.168045520782471, "global_step": 175395, "epoch": 4176} {"train_loss": -7.117430686950684, "global_step": 175396, "epoch": 4176} {"train_loss": -7.085384368896484, "global_step": 175397, "epoch": 4176} {"train_loss": -7.044702529907227, "global_step": 175398, "epoch": 4176} {"train_loss": -7.108096122741699, "global_step": 175399, "epoch": 4176} {"train_loss": -7.141812324523926, "global_step": 175400, "epoch": 4176} {"train_loss": -7.171025276184082, "global_step": 175401, "epoch": 4176} {"train_loss": -7.110659122467041, "global_step": 175402, "epoch": 4176} {"train_loss": -7.175030708312988, "global_step": 175403, "epoch": 4176} {"train_loss": -7.1543731689453125, "global_step": 175404, "epoch": 4176} {"train_loss": -7.222569942474365, "global_step": 175405, "epoch": 4176} {"train_loss": -7.063779830932617, "global_step": 175406, "epoch": 4176} {"train_loss": -7.024860382080078, "global_step": 175407, "epoch": 4176} {"train_loss": -6.973845481872559, "global_step": 175408, "epoch": 4176} {"train_loss": -7.119019508361816, "global_step": 175409, "epoch": 4176} {"train_loss": -7.029481887817383, "global_step": 175410, "epoch": 4176} {"train_loss": -7.112553596496582, "global_step": 175411, "epoch": 4176} {"train_loss": -7.076689720153809, "global_step": 175412, "epoch": 4176} {"train_loss": -7.092364311218262, "global_step": 175413, "epoch": 4176} {"train_loss": -7.085550308227539, "global_step": 175414, "epoch": 4176} {"train_loss": -7.076666355133057, "global_step": 175415, "epoch": 4176} {"train_loss": -7.031391143798828, "global_step": 175416, "epoch": 4176} {"train_loss": -7.121846675872803, "global_step": 175417, "epoch": 4176} {"train_loss": -7.060258865356445, "global_step": 175418, "epoch": 4176} {"train_loss": -7.065778732299805, "global_step": 175419, "epoch": 4176} {"train_loss": -7.051115989685059, "global_step": 175420, "epoch": 4176} {"train_loss": -7.197109699249268, "global_step": 175421, "epoch": 4176} {"train_loss": -7.030723571777344, "global_step": 175422, "epoch": 4176} {"train_loss": -7.19070291519165, "global_step": 175423, "epoch": 4176} {"train_loss": -7.129213333129883, "global_step": 175424, "epoch": 4176} {"train_loss": -7.118467330932617, "global_step": 175425, "epoch": 4176} {"train_loss": -7.180386543273926, "global_step": 175426, "epoch": 4176} {"train_loss": -7.109342575073242, "global_step": 175427, "epoch": 4176} {"train_loss": -7.041665077209473, "global_step": 175428, "epoch": 4176} {"train_loss": -7.049476623535156, "global_step": 175429, "epoch": 4176} {"train_loss": -7.162468433380127, "global_step": 175430, "epoch": 4176} {"train_loss": -7.189741134643555, "global_step": 175431, "epoch": 4176} {"train_loss": -7.148137092590332, "global_step": 175432, "epoch": 4176} {"train_loss": -7.106907583418346, "global_step": 175433, "epoch": 4176, "val_loss": 69157.6953125} {"train_loss": -7.167000770568848, "global_step": 175434, "epoch": 4177} {"train_loss": -7.112113952636719, "global_step": 175435, "epoch": 4177} {"train_loss": -7.208920478820801, "global_step": 175436, "epoch": 4177} {"train_loss": -7.154592037200928, "global_step": 175437, "epoch": 4177} {"train_loss": -7.151801586151123, "global_step": 175438, "epoch": 4177} {"train_loss": -7.11357307434082, "global_step": 175439, "epoch": 4177} {"train_loss": -7.222934246063232, "global_step": 175440, "epoch": 4177} {"train_loss": -7.127255439758301, "global_step": 175441, "epoch": 4177} {"train_loss": -7.062670707702637, "global_step": 175442, "epoch": 4177} {"train_loss": -7.196798324584961, "global_step": 175443, "epoch": 4177} {"train_loss": -7.086255073547363, "global_step": 175444, "epoch": 4177} {"train_loss": -7.1229472160339355, "global_step": 175445, "epoch": 4177} {"train_loss": -7.20617151260376, "global_step": 175446, "epoch": 4177} {"train_loss": -7.0477094650268555, "global_step": 175447, "epoch": 4177} {"train_loss": -7.113301753997803, "global_step": 175448, "epoch": 4177} {"train_loss": -7.107478141784668, "global_step": 175449, "epoch": 4177} {"train_loss": -7.159010410308838, "global_step": 175450, "epoch": 4177} {"train_loss": -7.082630157470703, "global_step": 175451, "epoch": 4177} {"train_loss": -7.155002593994141, "global_step": 175452, "epoch": 4177} {"train_loss": -7.08760929107666, "global_step": 175453, "epoch": 4177} {"train_loss": -7.026607036590576, "global_step": 175454, "epoch": 4177} {"train_loss": -7.160503387451172, "global_step": 175455, "epoch": 4177} {"train_loss": -7.058265686035156, "global_step": 175456, "epoch": 4177} {"train_loss": -6.8997297286987305, "global_step": 175457, "epoch": 4177} {"train_loss": -7.065825462341309, "global_step": 175458, "epoch": 4177} {"train_loss": -7.071078300476074, "global_step": 175459, "epoch": 4177} {"train_loss": -6.96780252456665, "global_step": 175460, "epoch": 4177} {"train_loss": -7.039548873901367, "global_step": 175461, "epoch": 4177} {"train_loss": -7.030451774597168, "global_step": 175462, "epoch": 4177} {"train_loss": -7.048488616943359, "global_step": 175463, "epoch": 4177} {"train_loss": -7.0767292976379395, "global_step": 175464, "epoch": 4177} {"train_loss": -7.054664611816406, "global_step": 175465, "epoch": 4177} {"train_loss": -7.038652420043945, "global_step": 175466, "epoch": 4177} {"train_loss": -7.0545220375061035, "global_step": 175467, "epoch": 4177} {"train_loss": -7.053293704986572, "global_step": 175468, "epoch": 4177} {"train_loss": -6.951902389526367, "global_step": 175469, "epoch": 4177} {"train_loss": -7.110747814178467, "global_step": 175470, "epoch": 4177} {"train_loss": -7.113617897033691, "global_step": 175471, "epoch": 4177} {"train_loss": -6.962627410888672, "global_step": 175472, "epoch": 4177} {"train_loss": -7.098783016204834, "global_step": 175473, "epoch": 4177} {"train_loss": -7.083654403686523, "global_step": 175474, "epoch": 4177} {"train_loss": -7.085875670115153, "global_step": 175475, "epoch": 4177, "val_loss": 69153.359375} {"train_loss": -7.103377342224121, "global_step": 175476, "epoch": 4178} {"train_loss": -6.966890335083008, "global_step": 175477, "epoch": 4178} {"train_loss": -6.930542945861816, "global_step": 175478, "epoch": 4178} {"train_loss": -7.0544633865356445, "global_step": 175479, "epoch": 4178} {"train_loss": -6.984665870666504, "global_step": 175480, "epoch": 4178} {"train_loss": -7.063103199005127, "global_step": 175481, "epoch": 4178} {"train_loss": -6.999156951904297, "global_step": 175482, "epoch": 4178} {"train_loss": -7.145545959472656, "global_step": 175483, "epoch": 4178} {"train_loss": -7.0194091796875, "global_step": 175484, "epoch": 4178} {"train_loss": -7.054416179656982, "global_step": 175485, "epoch": 4178} {"train_loss": -7.125607490539551, "global_step": 175486, "epoch": 4178} {"train_loss": -7.072296619415283, "global_step": 175487, "epoch": 4178} {"train_loss": -7.1464080810546875, "global_step": 175488, "epoch": 4178} {"train_loss": -7.052772521972656, "global_step": 175489, "epoch": 4178} {"train_loss": -7.080752849578857, "global_step": 175490, "epoch": 4178} {"train_loss": -7.126918315887451, "global_step": 175491, "epoch": 4178} {"train_loss": -7.052223205566406, "global_step": 175492, "epoch": 4178} {"train_loss": -7.165834903717041, "global_step": 175493, "epoch": 4178} {"train_loss": -7.074618816375732, "global_step": 175494, "epoch": 4178} {"train_loss": -7.137626647949219, "global_step": 175495, "epoch": 4178} {"train_loss": -7.118625640869141, "global_step": 175496, "epoch": 4178} {"train_loss": -7.045511245727539, "global_step": 175497, "epoch": 4178} {"train_loss": -7.057424545288086, "global_step": 175498, "epoch": 4178} {"train_loss": -6.906481742858887, "global_step": 175499, "epoch": 4178} {"train_loss": -7.079104900360107, "global_step": 175500, "epoch": 4178} {"train_loss": -7.073129653930664, "global_step": 175501, "epoch": 4178} {"train_loss": -7.063371658325195, "global_step": 175502, "epoch": 4178} {"train_loss": -7.055951118469238, "global_step": 175503, "epoch": 4178} {"train_loss": -7.006349563598633, "global_step": 175504, "epoch": 4178} {"train_loss": -6.971859931945801, "global_step": 175505, "epoch": 4178} {"train_loss": -6.835453510284424, "global_step": 175506, "epoch": 4178} {"train_loss": -7.026471138000488, "global_step": 175507, "epoch": 4178} {"train_loss": -6.957408428192139, "global_step": 175508, "epoch": 4178} {"train_loss": -7.064859867095947, "global_step": 175509, "epoch": 4178} {"train_loss": -6.787297248840332, "global_step": 175510, "epoch": 4178} {"train_loss": -6.792110443115234, "global_step": 175511, "epoch": 4178} {"train_loss": -7.010622024536133, "global_step": 175512, "epoch": 4178} {"train_loss": -6.8452959060668945, "global_step": 175513, "epoch": 4178} {"train_loss": -7.00620174407959, "global_step": 175514, "epoch": 4178} {"train_loss": -6.902280330657959, "global_step": 175515, "epoch": 4178} {"train_loss": -6.962284088134766, "global_step": 175516, "epoch": 4178} {"train_loss": -7.015715553646996, "global_step": 175517, "epoch": 4178, "val_loss": 69119.078125} {"train_loss": -6.979339122772217, "global_step": 175518, "epoch": 4179} {"train_loss": -7.009331226348877, "global_step": 175519, "epoch": 4179} {"train_loss": -7.001893997192383, "global_step": 175520, "epoch": 4179} {"train_loss": -7.080015659332275, "global_step": 175521, "epoch": 4179} {"train_loss": -7.043526649475098, "global_step": 175522, "epoch": 4179} {"train_loss": -6.862781524658203, "global_step": 175523, "epoch": 4179} {"train_loss": -7.086285591125488, "global_step": 175524, "epoch": 4179} {"train_loss": -7.034794330596924, "global_step": 175525, "epoch": 4179} {"train_loss": -7.0999860763549805, "global_step": 175526, "epoch": 4179} {"train_loss": -6.9778313636779785, "global_step": 175527, "epoch": 4179} {"train_loss": -7.079599380493164, "global_step": 175528, "epoch": 4179} {"train_loss": -7.053877353668213, "global_step": 175529, "epoch": 4179} {"train_loss": -7.14184045791626, "global_step": 175530, "epoch": 4179} {"train_loss": -7.175930976867676, "global_step": 175531, "epoch": 4179} {"train_loss": -7.123716354370117, "global_step": 175532, "epoch": 4179} {"train_loss": -7.111692428588867, "global_step": 175533, "epoch": 4179} {"train_loss": -6.991721153259277, "global_step": 175534, "epoch": 4179} {"train_loss": -7.151479721069336, "global_step": 175535, "epoch": 4179} {"train_loss": -7.093221664428711, "global_step": 175536, "epoch": 4179} {"train_loss": -7.115733623504639, "global_step": 175537, "epoch": 4179} {"train_loss": -7.225466728210449, "global_step": 175538, "epoch": 4179} {"train_loss": -7.112130641937256, "global_step": 175539, "epoch": 4179} {"train_loss": -7.088451385498047, "global_step": 175540, "epoch": 4179} {"train_loss": -7.068062782287598, "global_step": 175541, "epoch": 4179} {"train_loss": -7.054460525512695, "global_step": 175542, "epoch": 4179} {"train_loss": -7.082530975341797, "global_step": 175543, "epoch": 4179} {"train_loss": -7.237752437591553, "global_step": 175544, "epoch": 4179} {"train_loss": -7.100878715515137, "global_step": 175545, "epoch": 4179} {"train_loss": -7.106082439422607, "global_step": 175546, "epoch": 4179} {"train_loss": -7.0644450187683105, "global_step": 175547, "epoch": 4179} {"train_loss": -7.132937431335449, "global_step": 175548, "epoch": 4179} {"train_loss": -7.1094489097595215, "global_step": 175549, "epoch": 4179} {"train_loss": -7.131885051727295, "global_step": 175550, "epoch": 4179} {"train_loss": -7.233620643615723, "global_step": 175551, "epoch": 4179} {"train_loss": -7.149943828582764, "global_step": 175552, "epoch": 4179} {"train_loss": -7.151996612548828, "global_step": 175553, "epoch": 4179} {"train_loss": -7.183921813964844, "global_step": 175554, "epoch": 4179} {"train_loss": -7.007097244262695, "global_step": 175555, "epoch": 4179} {"train_loss": -7.02786922454834, "global_step": 175556, "epoch": 4179} {"train_loss": -7.072392463684082, "global_step": 175557, "epoch": 4179} {"train_loss": -7.111872673034668, "global_step": 175558, "epoch": 4179} {"train_loss": -7.08922096661159, "global_step": 175559, "epoch": 4179, "val_loss": 69267.6015625} {"train_loss": -7.039905071258545, "global_step": 175560, "epoch": 4180} {"train_loss": -7.138428688049316, "global_step": 175561, "epoch": 4180} {"train_loss": -7.246185302734375, "global_step": 175562, "epoch": 4180} {"train_loss": -7.204626083374023, "global_step": 175563, "epoch": 4180} {"train_loss": -7.225325584411621, "global_step": 175564, "epoch": 4180} {"train_loss": -7.236976146697998, "global_step": 175565, "epoch": 4180} {"train_loss": -7.12227201461792, "global_step": 175566, "epoch": 4180} {"train_loss": -7.128273010253906, "global_step": 175567, "epoch": 4180} {"train_loss": -7.17995548248291, "global_step": 175568, "epoch": 4180} {"train_loss": -7.171872615814209, "global_step": 175569, "epoch": 4180} {"train_loss": -7.129515647888184, "global_step": 175570, "epoch": 4180} {"train_loss": -7.072044372558594, "global_step": 175571, "epoch": 4180} {"train_loss": -7.140989303588867, "global_step": 175572, "epoch": 4180} {"train_loss": -7.0968122482299805, "global_step": 175573, "epoch": 4180} {"train_loss": -7.060981750488281, "global_step": 175574, "epoch": 4180} {"train_loss": -6.953210353851318, "global_step": 175575, "epoch": 4180} {"train_loss": -7.0874834060668945, "global_step": 175576, "epoch": 4180} {"train_loss": -7.080193042755127, "global_step": 175577, "epoch": 4180} {"train_loss": -7.08286190032959, "global_step": 175578, "epoch": 4180} {"train_loss": -6.974846839904785, "global_step": 175579, "epoch": 4180} {"train_loss": -7.0143632888793945, "global_step": 175580, "epoch": 4180} {"train_loss": -7.048221588134766, "global_step": 175581, "epoch": 4180} {"train_loss": -7.1613383293151855, "global_step": 175582, "epoch": 4180} {"train_loss": -7.061954498291016, "global_step": 175583, "epoch": 4180} {"train_loss": -7.140917778015137, "global_step": 175584, "epoch": 4180} {"train_loss": -7.120705604553223, "global_step": 175585, "epoch": 4180} {"train_loss": -7.132716178894043, "global_step": 175586, "epoch": 4180} {"train_loss": -7.101944923400879, "global_step": 175587, "epoch": 4180} {"train_loss": -7.122710227966309, "global_step": 175588, "epoch": 4180} {"train_loss": -7.079468727111816, "global_step": 175589, "epoch": 4180} {"train_loss": -7.087316036224365, "global_step": 175590, "epoch": 4180} {"train_loss": -7.055914878845215, "global_step": 175591, "epoch": 4180} {"train_loss": -7.139406681060791, "global_step": 175592, "epoch": 4180} {"train_loss": -7.092109203338623, "global_step": 175593, "epoch": 4180} {"train_loss": -7.068081855773926, "global_step": 175594, "epoch": 4180} {"train_loss": -7.060314178466797, "global_step": 175595, "epoch": 4180} {"train_loss": -7.036380767822266, "global_step": 175596, "epoch": 4180} {"train_loss": -7.139839172363281, "global_step": 175597, "epoch": 4180} {"train_loss": -7.158283233642578, "global_step": 175598, "epoch": 4180} {"train_loss": -7.119809150695801, "global_step": 175599, "epoch": 4180} {"train_loss": -7.142707824707031, "global_step": 175600, "epoch": 4180} {"train_loss": -7.10830705506461, "global_step": 175601, "epoch": 4180, "val_loss": 69221.0234375} {"train_loss": -7.155908584594727, "global_step": 175602, "epoch": 4181} {"train_loss": -7.123775005340576, "global_step": 175603, "epoch": 4181} {"train_loss": -7.2638163566589355, "global_step": 175604, "epoch": 4181} {"train_loss": -7.174012660980225, "global_step": 175605, "epoch": 4181} {"train_loss": -7.112649440765381, "global_step": 175606, "epoch": 4181} {"train_loss": -7.035778522491455, "global_step": 175607, "epoch": 4181} {"train_loss": -7.180188179016113, "global_step": 175608, "epoch": 4181} {"train_loss": -7.111274719238281, "global_step": 175609, "epoch": 4181} {"train_loss": -7.099658012390137, "global_step": 175610, "epoch": 4181} {"train_loss": -7.166603088378906, "global_step": 175611, "epoch": 4181} {"train_loss": -7.169976711273193, "global_step": 175612, "epoch": 4181} {"train_loss": -7.16338586807251, "global_step": 175613, "epoch": 4181} {"train_loss": -7.177702903747559, "global_step": 175614, "epoch": 4181} {"train_loss": -7.192866325378418, "global_step": 175615, "epoch": 4181} {"train_loss": -7.0449676513671875, "global_step": 175616, "epoch": 4181} {"train_loss": -7.085328578948975, "global_step": 175617, "epoch": 4181} {"train_loss": -7.04194450378418, "global_step": 175618, "epoch": 4181} {"train_loss": -7.118095397949219, "global_step": 175619, "epoch": 4181} {"train_loss": -7.071310520172119, "global_step": 175620, "epoch": 4181} {"train_loss": -6.94534969329834, "global_step": 175621, "epoch": 4181} {"train_loss": -7.058201789855957, "global_step": 175622, "epoch": 4181} {"train_loss": -6.935866832733154, "global_step": 175623, "epoch": 4181} {"train_loss": -6.798684120178223, "global_step": 175624, "epoch": 4181} {"train_loss": -6.7559051513671875, "global_step": 175625, "epoch": 4181} {"train_loss": -7.12521505355835, "global_step": 175626, "epoch": 4181} {"train_loss": -6.777508735656738, "global_step": 175627, "epoch": 4181} {"train_loss": -7.070751190185547, "global_step": 175628, "epoch": 4181} {"train_loss": -6.828232765197754, "global_step": 175629, "epoch": 4181} {"train_loss": -7.0138959884643555, "global_step": 175630, "epoch": 4181} {"train_loss": -7.013463973999023, "global_step": 175631, "epoch": 4181} {"train_loss": -6.96926736831665, "global_step": 175632, "epoch": 4181} {"train_loss": -7.044222831726074, "global_step": 175633, "epoch": 4181} {"train_loss": -6.9665937423706055, "global_step": 175634, "epoch": 4181} {"train_loss": -6.974659442901611, "global_step": 175635, "epoch": 4181} {"train_loss": -7.028387069702148, "global_step": 175636, "epoch": 4181} {"train_loss": -6.988457679748535, "global_step": 175637, "epoch": 4181} {"train_loss": -6.9462175369262695, "global_step": 175638, "epoch": 4181} {"train_loss": -6.995845794677734, "global_step": 175639, "epoch": 4181} {"train_loss": -6.975881099700928, "global_step": 175640, "epoch": 4181} {"train_loss": -7.104836940765381, "global_step": 175641, "epoch": 4181} {"train_loss": -7.065743923187256, "global_step": 175642, "epoch": 4181} {"train_loss": -7.0419937542506625, "global_step": 175643, "epoch": 4181, "val_loss": 69312.46875} {"train_loss": -6.883030891418457, "global_step": 175644, "epoch": 4182} {"train_loss": -7.098372459411621, "global_step": 175645, "epoch": 4182} {"train_loss": -7.005766868591309, "global_step": 175646, "epoch": 4182} {"train_loss": -6.936210632324219, "global_step": 175647, "epoch": 4182} {"train_loss": -7.03672456741333, "global_step": 175648, "epoch": 4182} {"train_loss": -7.105025291442871, "global_step": 175649, "epoch": 4182} {"train_loss": -7.098267078399658, "global_step": 175650, "epoch": 4182} {"train_loss": -7.03480339050293, "global_step": 175651, "epoch": 4182} {"train_loss": -7.170969009399414, "global_step": 175652, "epoch": 4182} {"train_loss": -7.015422821044922, "global_step": 175653, "epoch": 4182} {"train_loss": -7.124922752380371, "global_step": 175654, "epoch": 4182} {"train_loss": -7.127319812774658, "global_step": 175655, "epoch": 4182} {"train_loss": -7.061511993408203, "global_step": 175656, "epoch": 4182} {"train_loss": -7.0502424240112305, "global_step": 175657, "epoch": 4182} {"train_loss": -7.201285362243652, "global_step": 175658, "epoch": 4182} {"train_loss": -7.006649971008301, "global_step": 175659, "epoch": 4182} {"train_loss": -6.974104881286621, "global_step": 175660, "epoch": 4182} {"train_loss": -7.002191543579102, "global_step": 175661, "epoch": 4182} {"train_loss": -7.14909553527832, "global_step": 175662, "epoch": 4182} {"train_loss": -7.152437686920166, "global_step": 175663, "epoch": 4182} {"train_loss": -6.98918342590332, "global_step": 175664, "epoch": 4182} {"train_loss": -7.106513500213623, "global_step": 175665, "epoch": 4182} {"train_loss": -6.996736526489258, "global_step": 175666, "epoch": 4182} {"train_loss": -7.132866859436035, "global_step": 175667, "epoch": 4182} {"train_loss": -7.095636367797852, "global_step": 175668, "epoch": 4182} {"train_loss": -6.951426982879639, "global_step": 175669, "epoch": 4182} {"train_loss": -7.043674468994141, "global_step": 175670, "epoch": 4182} {"train_loss": -6.9268975257873535, "global_step": 175671, "epoch": 4182} {"train_loss": -7.159972190856934, "global_step": 175672, "epoch": 4182} {"train_loss": -7.0961151123046875, "global_step": 175673, "epoch": 4182} {"train_loss": -7.092729568481445, "global_step": 175674, "epoch": 4182} {"train_loss": -7.142838478088379, "global_step": 175675, "epoch": 4182} {"train_loss": -7.075304985046387, "global_step": 175676, "epoch": 4182} {"train_loss": -7.125618934631348, "global_step": 175677, "epoch": 4182} {"train_loss": -7.105249404907227, "global_step": 175678, "epoch": 4182} {"train_loss": -7.080202102661133, "global_step": 175679, "epoch": 4182} {"train_loss": -7.2366790771484375, "global_step": 175680, "epoch": 4182} {"train_loss": -7.185391902923584, "global_step": 175681, "epoch": 4182} {"train_loss": -7.162002086639404, "global_step": 175682, "epoch": 4182} {"train_loss": -7.180174827575684, "global_step": 175683, "epoch": 4182} {"train_loss": -7.112730026245117, "global_step": 175684, "epoch": 4182} {"train_loss": -7.076781954084124, "global_step": 175685, "epoch": 4182, "val_loss": 68932.4375} {"train_loss": -7.150139331817627, "global_step": 175686, "epoch": 4183} {"train_loss": -7.124148368835449, "global_step": 175687, "epoch": 4183} {"train_loss": -7.254798412322998, "global_step": 175688, "epoch": 4183} {"train_loss": -7.115079879760742, "global_step": 175689, "epoch": 4183} {"train_loss": -7.143209934234619, "global_step": 175690, "epoch": 4183} {"train_loss": -7.089853286743164, "global_step": 175691, "epoch": 4183} {"train_loss": -7.2049150466918945, "global_step": 175692, "epoch": 4183} {"train_loss": -7.1029253005981445, "global_step": 175693, "epoch": 4183} {"train_loss": -7.10044002532959, "global_step": 175694, "epoch": 4183} {"train_loss": -7.080056190490723, "global_step": 175695, "epoch": 4183} {"train_loss": -7.0112786293029785, "global_step": 175696, "epoch": 4183} {"train_loss": -7.280304908752441, "global_step": 175697, "epoch": 4183} {"train_loss": -7.100512981414795, "global_step": 175698, "epoch": 4183} {"train_loss": -7.059385299682617, "global_step": 175699, "epoch": 4183} {"train_loss": -6.969449996948242, "global_step": 175700, "epoch": 4183} {"train_loss": -7.182111740112305, "global_step": 175701, "epoch": 4183} {"train_loss": -7.045781135559082, "global_step": 175702, "epoch": 4183} {"train_loss": -7.026208877563477, "global_step": 175703, "epoch": 4183} {"train_loss": -7.143290042877197, "global_step": 175704, "epoch": 4183} {"train_loss": -7.05150032043457, "global_step": 175705, "epoch": 4183} {"train_loss": -6.968080997467041, "global_step": 175706, "epoch": 4183} {"train_loss": -7.0992937088012695, "global_step": 175707, "epoch": 4183} {"train_loss": -6.971035003662109, "global_step": 175708, "epoch": 4183} {"train_loss": -7.076426029205322, "global_step": 175709, "epoch": 4183} {"train_loss": -7.041274070739746, "global_step": 175710, "epoch": 4183} {"train_loss": -7.005967140197754, "global_step": 175711, "epoch": 4183} {"train_loss": -7.079878807067871, "global_step": 175712, "epoch": 4183} {"train_loss": -7.2159504890441895, "global_step": 175713, "epoch": 4183} {"train_loss": -7.082322120666504, "global_step": 175714, "epoch": 4183} {"train_loss": -7.136447429656982, "global_step": 175715, "epoch": 4183} {"train_loss": -7.077345848083496, "global_step": 175716, "epoch": 4183} {"train_loss": -7.0295729637146, "global_step": 175717, "epoch": 4183} {"train_loss": -7.159285068511963, "global_step": 175718, "epoch": 4183} {"train_loss": -7.089751243591309, "global_step": 175719, "epoch": 4183} {"train_loss": -7.012692451477051, "global_step": 175720, "epoch": 4183} {"train_loss": -7.148923873901367, "global_step": 175721, "epoch": 4183} {"train_loss": -6.998979568481445, "global_step": 175722, "epoch": 4183} {"train_loss": -7.042185306549072, "global_step": 175723, "epoch": 4183} {"train_loss": -7.185878753662109, "global_step": 175724, "epoch": 4183} {"train_loss": -7.01612663269043, "global_step": 175725, "epoch": 4183} {"train_loss": -7.054044723510742, "global_step": 175726, "epoch": 4183} {"train_loss": -7.09110148747762, "global_step": 175727, "epoch": 4183, "val_loss": 69187.7421875} {"train_loss": -7.063087463378906, "global_step": 175728, "epoch": 4184} {"train_loss": -7.003104209899902, "global_step": 175729, "epoch": 4184} {"train_loss": -7.137663841247559, "global_step": 175730, "epoch": 4184} {"train_loss": -6.907142639160156, "global_step": 175731, "epoch": 4184} {"train_loss": -6.89835786819458, "global_step": 175732, "epoch": 4184} {"train_loss": -7.149833679199219, "global_step": 175733, "epoch": 4184} {"train_loss": -7.049232006072998, "global_step": 175734, "epoch": 4184} {"train_loss": -6.925798416137695, "global_step": 175735, "epoch": 4184} {"train_loss": -7.128964424133301, "global_step": 175736, "epoch": 4184} {"train_loss": -6.974006652832031, "global_step": 175737, "epoch": 4184} {"train_loss": -7.103823661804199, "global_step": 175738, "epoch": 4184} {"train_loss": -7.145211219787598, "global_step": 175739, "epoch": 4184} {"train_loss": -6.911667346954346, "global_step": 175740, "epoch": 4184} {"train_loss": -7.040417671203613, "global_step": 175741, "epoch": 4184} {"train_loss": -7.046289443969727, "global_step": 175742, "epoch": 4184} {"train_loss": -6.9649977684021, "global_step": 175743, "epoch": 4184} {"train_loss": -7.082774639129639, "global_step": 175744, "epoch": 4184} {"train_loss": -7.019559383392334, "global_step": 175745, "epoch": 4184} {"train_loss": -7.000978469848633, "global_step": 175746, "epoch": 4184} {"train_loss": -7.083040237426758, "global_step": 175747, "epoch": 4184} {"train_loss": -6.983083724975586, "global_step": 175748, "epoch": 4184} {"train_loss": -7.065708637237549, "global_step": 175749, "epoch": 4184} {"train_loss": -7.080474853515625, "global_step": 175750, "epoch": 4184} {"train_loss": -7.030689716339111, "global_step": 175751, "epoch": 4184} {"train_loss": -6.997300624847412, "global_step": 175752, "epoch": 4184} {"train_loss": -7.082901477813721, "global_step": 175753, "epoch": 4184} {"train_loss": -7.132175445556641, "global_step": 175754, "epoch": 4184} {"train_loss": -7.112996578216553, "global_step": 175755, "epoch": 4184} {"train_loss": -7.148155689239502, "global_step": 175756, "epoch": 4184} {"train_loss": -7.0552568435668945, "global_step": 175757, "epoch": 4184} {"train_loss": -7.0897979736328125, "global_step": 175758, "epoch": 4184} {"train_loss": -7.087715148925781, "global_step": 175759, "epoch": 4184} {"train_loss": -7.1183319091796875, "global_step": 175760, "epoch": 4184} {"train_loss": -7.197127342224121, "global_step": 175761, "epoch": 4184} {"train_loss": -7.011990547180176, "global_step": 175762, "epoch": 4184} {"train_loss": -7.202687740325928, "global_step": 175763, "epoch": 4184} {"train_loss": -7.048559188842773, "global_step": 175764, "epoch": 4184} {"train_loss": -7.045853614807129, "global_step": 175765, "epoch": 4184} {"train_loss": -7.153970241546631, "global_step": 175766, "epoch": 4184} {"train_loss": -7.142899513244629, "global_step": 175767, "epoch": 4184} {"train_loss": -7.17448091506958, "global_step": 175768, "epoch": 4184} {"train_loss": -7.068323158082508, "global_step": 175769, "epoch": 4184, "val_loss": 69356.78125} {"train_loss": -7.092895030975342, "global_step": 175770, "epoch": 4185} {"train_loss": -7.131970405578613, "global_step": 175771, "epoch": 4185} {"train_loss": -7.055907726287842, "global_step": 175772, "epoch": 4185} {"train_loss": -7.08901309967041, "global_step": 175773, "epoch": 4185} {"train_loss": -7.074665546417236, "global_step": 175774, "epoch": 4185} {"train_loss": -7.0925092697143555, "global_step": 175775, "epoch": 4185} {"train_loss": -7.102317810058594, "global_step": 175776, "epoch": 4185} {"train_loss": -6.999645233154297, "global_step": 175777, "epoch": 4185} {"train_loss": -7.119575500488281, "global_step": 175778, "epoch": 4185} {"train_loss": -7.120242118835449, "global_step": 175779, "epoch": 4185} {"train_loss": -7.011261940002441, "global_step": 175780, "epoch": 4185} {"train_loss": -7.2258830070495605, "global_step": 175781, "epoch": 4185} {"train_loss": -7.2096781730651855, "global_step": 175782, "epoch": 4185} {"train_loss": -7.122280120849609, "global_step": 175783, "epoch": 4185} {"train_loss": -7.221782207489014, "global_step": 175784, "epoch": 4185} {"train_loss": -7.025790214538574, "global_step": 175785, "epoch": 4185} {"train_loss": -7.159903049468994, "global_step": 175786, "epoch": 4185} {"train_loss": -7.10455322265625, "global_step": 175787, "epoch": 4185} {"train_loss": -7.160373687744141, "global_step": 175788, "epoch": 4185} {"train_loss": -7.238085746765137, "global_step": 175789, "epoch": 4185} {"train_loss": -7.044105052947998, "global_step": 175790, "epoch": 4185} {"train_loss": -7.166831016540527, "global_step": 175791, "epoch": 4185} {"train_loss": -7.096190929412842, "global_step": 175792, "epoch": 4185} {"train_loss": -7.019902229309082, "global_step": 175793, "epoch": 4185} {"train_loss": -7.018735885620117, "global_step": 175794, "epoch": 4185} {"train_loss": -7.011392593383789, "global_step": 175795, "epoch": 4185} {"train_loss": -7.1108856201171875, "global_step": 175796, "epoch": 4185} {"train_loss": -7.096193790435791, "global_step": 175797, "epoch": 4185} {"train_loss": -6.990299224853516, "global_step": 175798, "epoch": 4185} {"train_loss": -7.051767349243164, "global_step": 175799, "epoch": 4185} {"train_loss": -7.248909950256348, "global_step": 175800, "epoch": 4185} {"train_loss": -7.074909210205078, "global_step": 175801, "epoch": 4185} {"train_loss": -7.092667102813721, "global_step": 175802, "epoch": 4185} {"train_loss": -7.112452507019043, "global_step": 175803, "epoch": 4185} {"train_loss": -7.002705097198486, "global_step": 175804, "epoch": 4185} {"train_loss": -6.960135459899902, "global_step": 175805, "epoch": 4185} {"train_loss": -7.0749125480651855, "global_step": 175806, "epoch": 4185} {"train_loss": -7.1098151206970215, "global_step": 175807, "epoch": 4185} {"train_loss": -6.9661664962768555, "global_step": 175808, "epoch": 4185} {"train_loss": -7.118674278259277, "global_step": 175809, "epoch": 4185} {"train_loss": -7.133549690246582, "global_step": 175810, "epoch": 4185} {"train_loss": -7.094391584396362, "global_step": 175811, "epoch": 4185, "val_loss": 69078.515625} {"train_loss": -7.010746955871582, "global_step": 175812, "epoch": 4186} {"train_loss": -7.093832015991211, "global_step": 175813, "epoch": 4186} {"train_loss": -7.1400227546691895, "global_step": 175814, "epoch": 4186} {"train_loss": -7.121402740478516, "global_step": 175815, "epoch": 4186} {"train_loss": -7.126911640167236, "global_step": 175816, "epoch": 4186} {"train_loss": -7.0714287757873535, "global_step": 175817, "epoch": 4186} {"train_loss": -7.035841941833496, "global_step": 175818, "epoch": 4186} {"train_loss": -6.9998650550842285, "global_step": 175819, "epoch": 4186} {"train_loss": -7.0150628089904785, "global_step": 175820, "epoch": 4186} {"train_loss": -7.100847244262695, "global_step": 175821, "epoch": 4186} {"train_loss": -7.040470123291016, "global_step": 175822, "epoch": 4186} {"train_loss": -7.093764781951904, "global_step": 175823, "epoch": 4186} {"train_loss": -7.082335948944092, "global_step": 175824, "epoch": 4186} {"train_loss": -7.110074043273926, "global_step": 175825, "epoch": 4186} {"train_loss": -7.118321895599365, "global_step": 175826, "epoch": 4186} {"train_loss": -7.1194047927856445, "global_step": 175827, "epoch": 4186} {"train_loss": -7.080911636352539, "global_step": 175828, "epoch": 4186} {"train_loss": -7.155682563781738, "global_step": 175829, "epoch": 4186} {"train_loss": -7.142210960388184, "global_step": 175830, "epoch": 4186} {"train_loss": -7.121774673461914, "global_step": 175831, "epoch": 4186} {"train_loss": -7.057194709777832, "global_step": 175832, "epoch": 4186} {"train_loss": -7.047946453094482, "global_step": 175833, "epoch": 4186} {"train_loss": -7.143880844116211, "global_step": 175834, "epoch": 4186} {"train_loss": -6.992982387542725, "global_step": 175835, "epoch": 4186} {"train_loss": -7.116581916809082, "global_step": 175836, "epoch": 4186} {"train_loss": -7.050187587738037, "global_step": 175837, "epoch": 4186} {"train_loss": -7.069662570953369, "global_step": 175838, "epoch": 4186} {"train_loss": -7.033858299255371, "global_step": 175839, "epoch": 4186} {"train_loss": -7.107384204864502, "global_step": 175840, "epoch": 4186} {"train_loss": -7.076498031616211, "global_step": 175841, "epoch": 4186} {"train_loss": -7.053549289703369, "global_step": 175842, "epoch": 4186} {"train_loss": -7.064075946807861, "global_step": 175843, "epoch": 4186} {"train_loss": -6.980319023132324, "global_step": 175844, "epoch": 4186} {"train_loss": -7.033351421356201, "global_step": 175845, "epoch": 4186} {"train_loss": -7.084836006164551, "global_step": 175846, "epoch": 4186} {"train_loss": -6.894981384277344, "global_step": 175847, "epoch": 4186} {"train_loss": -7.049039840698242, "global_step": 175848, "epoch": 4186} {"train_loss": -7.1055521965026855, "global_step": 175849, "epoch": 4186} {"train_loss": -6.9069085121154785, "global_step": 175850, "epoch": 4186} {"train_loss": -7.107728958129883, "global_step": 175851, "epoch": 4186} {"train_loss": -7.0178937911987305, "global_step": 175852, "epoch": 4186} {"train_loss": -7.065950881867182, "global_step": 175853, "epoch": 4186, "val_loss": 69165.53125} {"train_loss": -7.0315680503845215, "global_step": 175854, "epoch": 4187} {"train_loss": -6.928056240081787, "global_step": 175855, "epoch": 4187} {"train_loss": -7.024477005004883, "global_step": 175856, "epoch": 4187} {"train_loss": -7.069818496704102, "global_step": 175857, "epoch": 4187} {"train_loss": -6.851571083068848, "global_step": 175858, "epoch": 4187} {"train_loss": -7.060948371887207, "global_step": 175859, "epoch": 4187} {"train_loss": -6.868333339691162, "global_step": 175860, "epoch": 4187} {"train_loss": -6.883446216583252, "global_step": 175861, "epoch": 4187} {"train_loss": -6.970623016357422, "global_step": 175862, "epoch": 4187} {"train_loss": -6.901357650756836, "global_step": 175863, "epoch": 4187} {"train_loss": -6.954275131225586, "global_step": 175864, "epoch": 4187} {"train_loss": -7.012006759643555, "global_step": 175865, "epoch": 4187} {"train_loss": -7.088561058044434, "global_step": 175866, "epoch": 4187} {"train_loss": -7.021633625030518, "global_step": 175867, "epoch": 4187} {"train_loss": -7.029156684875488, "global_step": 175868, "epoch": 4187} {"train_loss": -7.251053333282471, "global_step": 175869, "epoch": 4187} {"train_loss": -7.074906349182129, "global_step": 175870, "epoch": 4187} {"train_loss": -7.129980087280273, "global_step": 175871, "epoch": 4187} {"train_loss": -7.241203308105469, "global_step": 175872, "epoch": 4187} {"train_loss": -7.016672134399414, "global_step": 175873, "epoch": 4187} {"train_loss": -7.144094467163086, "global_step": 175874, "epoch": 4187} {"train_loss": -7.19797945022583, "global_step": 175875, "epoch": 4187} {"train_loss": -7.1439409255981445, "global_step": 175876, "epoch": 4187} {"train_loss": -7.179789066314697, "global_step": 175877, "epoch": 4187} {"train_loss": -7.114104270935059, "global_step": 175878, "epoch": 4187} {"train_loss": -7.201115608215332, "global_step": 175879, "epoch": 4187} {"train_loss": -7.207427024841309, "global_step": 175880, "epoch": 4187} {"train_loss": -7.157338619232178, "global_step": 175881, "epoch": 4187} {"train_loss": -7.134174346923828, "global_step": 175882, "epoch": 4187} {"train_loss": -7.102849960327148, "global_step": 175883, "epoch": 4187} {"train_loss": -7.1356000900268555, "global_step": 175884, "epoch": 4187} {"train_loss": -7.146238327026367, "global_step": 175885, "epoch": 4187} {"train_loss": -7.117980003356934, "global_step": 175886, "epoch": 4187} {"train_loss": -7.087372779846191, "global_step": 175887, "epoch": 4187} {"train_loss": -7.200071334838867, "global_step": 175888, "epoch": 4187} {"train_loss": -7.04783821105957, "global_step": 175889, "epoch": 4187} {"train_loss": -7.2083845138549805, "global_step": 175890, "epoch": 4187} {"train_loss": -7.155883312225342, "global_step": 175891, "epoch": 4187} {"train_loss": -7.134574890136719, "global_step": 175892, "epoch": 4187} {"train_loss": -7.027356147766113, "global_step": 175893, "epoch": 4187} {"train_loss": -7.212514877319336, "global_step": 175894, "epoch": 4187} {"train_loss": -7.086876290185111, "global_step": 175895, "epoch": 4187, "val_loss": 69299.7421875} {"train_loss": -7.034661769866943, "global_step": 175896, "epoch": 4188} {"train_loss": -7.1857147216796875, "global_step": 175897, "epoch": 4188} {"train_loss": -7.300107955932617, "global_step": 175898, "epoch": 4188} {"train_loss": -7.054113388061523, "global_step": 175899, "epoch": 4188} {"train_loss": -7.187220573425293, "global_step": 175900, "epoch": 4188} {"train_loss": -7.208603858947754, "global_step": 175901, "epoch": 4188} {"train_loss": -7.112059593200684, "global_step": 175902, "epoch": 4188} {"train_loss": -7.212578773498535, "global_step": 175903, "epoch": 4188} {"train_loss": -7.165539741516113, "global_step": 175904, "epoch": 4188} {"train_loss": -7.206882953643799, "global_step": 175905, "epoch": 4188} {"train_loss": -7.0840959548950195, "global_step": 175906, "epoch": 4188} {"train_loss": -7.14693546295166, "global_step": 175907, "epoch": 4188} {"train_loss": -7.108773231506348, "global_step": 175908, "epoch": 4188} {"train_loss": -7.096036911010742, "global_step": 175909, "epoch": 4188} {"train_loss": -7.130060195922852, "global_step": 175910, "epoch": 4188} {"train_loss": -7.205876350402832, "global_step": 175911, "epoch": 4188} {"train_loss": -7.092001914978027, "global_step": 175912, "epoch": 4188} {"train_loss": -7.130794048309326, "global_step": 175913, "epoch": 4188} {"train_loss": -7.196911811828613, "global_step": 175914, "epoch": 4188} {"train_loss": -7.0444817543029785, "global_step": 175915, "epoch": 4188} {"train_loss": -7.100555419921875, "global_step": 175916, "epoch": 4188} {"train_loss": -7.020031929016113, "global_step": 175917, "epoch": 4188} {"train_loss": -7.067840576171875, "global_step": 175918, "epoch": 4188} {"train_loss": -7.115443706512451, "global_step": 175919, "epoch": 4188} {"train_loss": -7.057887077331543, "global_step": 175920, "epoch": 4188} {"train_loss": -6.9403181076049805, "global_step": 175921, "epoch": 4188} {"train_loss": -6.910226345062256, "global_step": 175922, "epoch": 4188} {"train_loss": -6.991491794586182, "global_step": 175923, "epoch": 4188} {"train_loss": -7.131358623504639, "global_step": 175924, "epoch": 4188} {"train_loss": -7.039094924926758, "global_step": 175925, "epoch": 4188} {"train_loss": -7.115168571472168, "global_step": 175926, "epoch": 4188} {"train_loss": -7.206562042236328, "global_step": 175927, "epoch": 4188} {"train_loss": -7.01954984664917, "global_step": 175928, "epoch": 4188} {"train_loss": -7.051981449127197, "global_step": 175929, "epoch": 4188} {"train_loss": -6.919408321380615, "global_step": 175930, "epoch": 4188} {"train_loss": -7.188936233520508, "global_step": 175931, "epoch": 4188} {"train_loss": -7.002058982849121, "global_step": 175932, "epoch": 4188} {"train_loss": -7.0517964363098145, "global_step": 175933, "epoch": 4188} {"train_loss": -7.106771469116211, "global_step": 175934, "epoch": 4188} {"train_loss": -7.05527400970459, "global_step": 175935, "epoch": 4188} {"train_loss": -6.986910820007324, "global_step": 175936, "epoch": 4188} {"train_loss": -7.096448262532552, "global_step": 175937, "epoch": 4188, "val_loss": 69164.7890625} {"train_loss": -7.0352983474731445, "global_step": 175938, "epoch": 4189} {"train_loss": -7.153298377990723, "global_step": 175939, "epoch": 4189} {"train_loss": -7.049700736999512, "global_step": 175940, "epoch": 4189} {"train_loss": -7.0821943283081055, "global_step": 175941, "epoch": 4189} {"train_loss": -7.029373645782471, "global_step": 175942, "epoch": 4189} {"train_loss": -6.970767974853516, "global_step": 175943, "epoch": 4189} {"train_loss": -7.046566009521484, "global_step": 175944, "epoch": 4189} {"train_loss": -7.104088306427002, "global_step": 175945, "epoch": 4189} {"train_loss": -7.218716621398926, "global_step": 175946, "epoch": 4189} {"train_loss": -7.1339945793151855, "global_step": 175947, "epoch": 4189} {"train_loss": -7.030375957489014, "global_step": 175948, "epoch": 4189} {"train_loss": -7.0560479164123535, "global_step": 175949, "epoch": 4189} {"train_loss": -7.12478494644165, "global_step": 175950, "epoch": 4189} {"train_loss": -7.174543857574463, "global_step": 175951, "epoch": 4189} {"train_loss": -7.174436092376709, "global_step": 175952, "epoch": 4189} {"train_loss": -7.0449748039245605, "global_step": 175953, "epoch": 4189} {"train_loss": -7.137688159942627, "global_step": 175954, "epoch": 4189} {"train_loss": -6.936395645141602, "global_step": 175955, "epoch": 4189} {"train_loss": -7.075313568115234, "global_step": 175956, "epoch": 4189} {"train_loss": -6.9876532554626465, "global_step": 175957, "epoch": 4189} {"train_loss": -7.129005432128906, "global_step": 175958, "epoch": 4189} {"train_loss": -6.988715171813965, "global_step": 175959, "epoch": 4189} {"train_loss": -6.897424697875977, "global_step": 175960, "epoch": 4189} {"train_loss": -6.984118461608887, "global_step": 175961, "epoch": 4189} {"train_loss": -6.971219062805176, "global_step": 175962, "epoch": 4189} {"train_loss": -6.872424602508545, "global_step": 175963, "epoch": 4189} {"train_loss": -7.0244669914245605, "global_step": 175964, "epoch": 4189} {"train_loss": -6.860357284545898, "global_step": 175965, "epoch": 4189} {"train_loss": -6.826208114624023, "global_step": 175966, "epoch": 4189} {"train_loss": -6.967211723327637, "global_step": 175967, "epoch": 4189} {"train_loss": -6.968472480773926, "global_step": 175968, "epoch": 4189} {"train_loss": -6.894613265991211, "global_step": 175969, "epoch": 4189} {"train_loss": -7.0708160400390625, "global_step": 175970, "epoch": 4189} {"train_loss": -6.939929008483887, "global_step": 175971, "epoch": 4189} {"train_loss": -7.0452117919921875, "global_step": 175972, "epoch": 4189} {"train_loss": -6.9191484451293945, "global_step": 175973, "epoch": 4189} {"train_loss": -6.978891372680664, "global_step": 175974, "epoch": 4189} {"train_loss": -7.067108154296875, "global_step": 175975, "epoch": 4189} {"train_loss": -6.936553955078125, "global_step": 175976, "epoch": 4189} {"train_loss": -7.057557582855225, "global_step": 175977, "epoch": 4189} {"train_loss": -7.050464630126953, "global_step": 175978, "epoch": 4189} {"train_loss": -7.023978324163528, "global_step": 175979, "epoch": 4189, "val_loss": 69171.453125} {"train_loss": -7.029737949371338, "global_step": 175980, "epoch": 4190} {"train_loss": -7.115850925445557, "global_step": 175981, "epoch": 4190} {"train_loss": -7.125017166137695, "global_step": 175982, "epoch": 4190} {"train_loss": -7.0499067306518555, "global_step": 175983, "epoch": 4190} {"train_loss": -7.016467094421387, "global_step": 175984, "epoch": 4190} {"train_loss": -7.038843631744385, "global_step": 175985, "epoch": 4190} {"train_loss": -7.0541181564331055, "global_step": 175986, "epoch": 4190} {"train_loss": -7.069766998291016, "global_step": 175987, "epoch": 4190} {"train_loss": -7.1346354484558105, "global_step": 175988, "epoch": 4190} {"train_loss": -7.179482936859131, "global_step": 175989, "epoch": 4190} {"train_loss": -7.196971893310547, "global_step": 175990, "epoch": 4190} {"train_loss": -7.072032928466797, "global_step": 175991, "epoch": 4190} {"train_loss": -7.058608055114746, "global_step": 175992, "epoch": 4190} {"train_loss": -6.971767425537109, "global_step": 175993, "epoch": 4190} {"train_loss": -6.994046211242676, "global_step": 175994, "epoch": 4190} {"train_loss": -7.020267486572266, "global_step": 175995, "epoch": 4190} {"train_loss": -7.178711414337158, "global_step": 175996, "epoch": 4190} {"train_loss": -7.105003833770752, "global_step": 175997, "epoch": 4190} {"train_loss": -6.972102642059326, "global_step": 175998, "epoch": 4190} {"train_loss": -7.0674896240234375, "global_step": 175999, "epoch": 4190} {"train_loss": -7.1072282791137695, "global_step": 176000, "epoch": 4190} {"train_loss": -7.053862571716309, "global_step": 176001, "epoch": 4190} {"train_loss": -7.103120803833008, "global_step": 176002, "epoch": 4190} {"train_loss": -7.220266342163086, "global_step": 176003, "epoch": 4190} {"train_loss": -7.088396072387695, "global_step": 176004, "epoch": 4190} {"train_loss": -7.084117889404297, "global_step": 176005, "epoch": 4190} {"train_loss": -7.00305700302124, "global_step": 176006, "epoch": 4190} {"train_loss": -7.13069486618042, "global_step": 176007, "epoch": 4190} {"train_loss": -7.006740570068359, "global_step": 176008, "epoch": 4190} {"train_loss": -6.945951461791992, "global_step": 176009, "epoch": 4190} {"train_loss": -7.018260955810547, "global_step": 176010, "epoch": 4190} {"train_loss": -6.874487400054932, "global_step": 176011, "epoch": 4190} {"train_loss": -6.934755802154541, "global_step": 176012, "epoch": 4190} {"train_loss": -7.0193562507629395, "global_step": 176013, "epoch": 4190} {"train_loss": -6.985260009765625, "global_step": 176014, "epoch": 4190} {"train_loss": -6.9901862144470215, "global_step": 176015, "epoch": 4190} {"train_loss": -7.038861274719238, "global_step": 176016, "epoch": 4190} {"train_loss": -6.933877944946289, "global_step": 176017, "epoch": 4190} {"train_loss": -7.13350772857666, "global_step": 176018, "epoch": 4190} {"train_loss": -7.017149448394775, "global_step": 176019, "epoch": 4190} {"train_loss": -7.089700698852539, "global_step": 176020, "epoch": 4190} {"train_loss": -7.055056980678013, "global_step": 176021, "epoch": 4190, "val_loss": 69336.21875} {"train_loss": -7.084376811981201, "global_step": 176022, "epoch": 4191} {"train_loss": -7.09477424621582, "global_step": 176023, "epoch": 4191} {"train_loss": -7.063984394073486, "global_step": 176024, "epoch": 4191} {"train_loss": -6.955214023590088, "global_step": 176025, "epoch": 4191} {"train_loss": -6.9893622398376465, "global_step": 176026, "epoch": 4191} {"train_loss": -6.955696105957031, "global_step": 176027, "epoch": 4191} {"train_loss": -7.053230285644531, "global_step": 176028, "epoch": 4191} {"train_loss": -7.099831581115723, "global_step": 176029, "epoch": 4191} {"train_loss": -6.9555535316467285, "global_step": 176030, "epoch": 4191} {"train_loss": -6.981144905090332, "global_step": 176031, "epoch": 4191} {"train_loss": -6.997363567352295, "global_step": 176032, "epoch": 4191} {"train_loss": -6.99318790435791, "global_step": 176033, "epoch": 4191} {"train_loss": -7.121572494506836, "global_step": 176034, "epoch": 4191} {"train_loss": -7.022412300109863, "global_step": 176035, "epoch": 4191} {"train_loss": -7.0015459060668945, "global_step": 176036, "epoch": 4191} {"train_loss": -7.052786350250244, "global_step": 176037, "epoch": 4191} {"train_loss": -6.994470596313477, "global_step": 176038, "epoch": 4191} {"train_loss": -6.909250259399414, "global_step": 176039, "epoch": 4191} {"train_loss": -7.068524360656738, "global_step": 176040, "epoch": 4191} {"train_loss": -7.000558853149414, "global_step": 176041, "epoch": 4191} {"train_loss": -7.020297527313232, "global_step": 176042, "epoch": 4191} {"train_loss": -6.959569931030273, "global_step": 176043, "epoch": 4191} {"train_loss": -6.976107597351074, "global_step": 176044, "epoch": 4191} {"train_loss": -6.999422073364258, "global_step": 176045, "epoch": 4191} {"train_loss": -7.010257720947266, "global_step": 176046, "epoch": 4191} {"train_loss": -7.089791297912598, "global_step": 176047, "epoch": 4191} {"train_loss": -7.03627872467041, "global_step": 176048, "epoch": 4191} {"train_loss": -7.127638816833496, "global_step": 176049, "epoch": 4191} {"train_loss": -7.071778774261475, "global_step": 176050, "epoch": 4191} {"train_loss": -7.094388484954834, "global_step": 176051, "epoch": 4191} {"train_loss": -7.158596038818359, "global_step": 176052, "epoch": 4191} {"train_loss": -7.0283203125, "global_step": 176053, "epoch": 4191} {"train_loss": -7.0541253089904785, "global_step": 176054, "epoch": 4191} {"train_loss": -6.9053120613098145, "global_step": 176055, "epoch": 4191} {"train_loss": -7.025173187255859, "global_step": 176056, "epoch": 4191} {"train_loss": -7.079420566558838, "global_step": 176057, "epoch": 4191} {"train_loss": -7.066011428833008, "global_step": 176058, "epoch": 4191} {"train_loss": -6.942134857177734, "global_step": 176059, "epoch": 4191} {"train_loss": -6.981039047241211, "global_step": 176060, "epoch": 4191} {"train_loss": -7.013967037200928, "global_step": 176061, "epoch": 4191} {"train_loss": -7.198418617248535, "global_step": 176062, "epoch": 4191} {"train_loss": -7.028048140662057, "global_step": 176063, "epoch": 4191, "val_loss": 69357.4765625} {"train_loss": -7.047857284545898, "global_step": 176064, "epoch": 4192} {"train_loss": -7.054100036621094, "global_step": 176065, "epoch": 4192} {"train_loss": -6.9915547370910645, "global_step": 176066, "epoch": 4192} {"train_loss": -7.04927396774292, "global_step": 176067, "epoch": 4192} {"train_loss": -7.104790687561035, "global_step": 176068, "epoch": 4192} {"train_loss": -7.094298839569092, "global_step": 176069, "epoch": 4192} {"train_loss": -7.15383768081665, "global_step": 176070, "epoch": 4192} {"train_loss": -7.0021562576293945, "global_step": 176071, "epoch": 4192} {"train_loss": -7.0812764167785645, "global_step": 176072, "epoch": 4192} {"train_loss": -7.057439804077148, "global_step": 176073, "epoch": 4192} {"train_loss": -7.05407190322876, "global_step": 176074, "epoch": 4192} {"train_loss": -7.181827545166016, "global_step": 176075, "epoch": 4192} {"train_loss": -7.123312950134277, "global_step": 176076, "epoch": 4192} {"train_loss": -7.0405168533325195, "global_step": 176077, "epoch": 4192} {"train_loss": -7.136421203613281, "global_step": 176078, "epoch": 4192} {"train_loss": -7.066132068634033, "global_step": 176079, "epoch": 4192} {"train_loss": -7.041274070739746, "global_step": 176080, "epoch": 4192} {"train_loss": -7.138189315795898, "global_step": 176081, "epoch": 4192} {"train_loss": -7.098211288452148, "global_step": 176082, "epoch": 4192} {"train_loss": -7.093603134155273, "global_step": 176083, "epoch": 4192} {"train_loss": -7.0861968994140625, "global_step": 176084, "epoch": 4192} {"train_loss": -7.082484722137451, "global_step": 176085, "epoch": 4192} {"train_loss": -7.019874095916748, "global_step": 176086, "epoch": 4192} {"train_loss": -7.018952369689941, "global_step": 176087, "epoch": 4192} {"train_loss": -7.059362411499023, "global_step": 176088, "epoch": 4192} {"train_loss": -6.913439750671387, "global_step": 176089, "epoch": 4192} {"train_loss": -6.957087516784668, "global_step": 176090, "epoch": 4192} {"train_loss": -7.000252723693848, "global_step": 176091, "epoch": 4192} {"train_loss": -6.91370964050293, "global_step": 176092, "epoch": 4192} {"train_loss": -6.912822723388672, "global_step": 176093, "epoch": 4192} {"train_loss": -6.928524017333984, "global_step": 176094, "epoch": 4192} {"train_loss": -7.009575843811035, "global_step": 176095, "epoch": 4192} {"train_loss": -6.849814414978027, "global_step": 176096, "epoch": 4192} {"train_loss": -6.960490703582764, "global_step": 176097, "epoch": 4192} {"train_loss": -6.849762916564941, "global_step": 176098, "epoch": 4192} {"train_loss": -6.993651390075684, "global_step": 176099, "epoch": 4192} {"train_loss": -7.021705627441406, "global_step": 176100, "epoch": 4192} {"train_loss": -7.138017654418945, "global_step": 176101, "epoch": 4192} {"train_loss": -7.103475570678711, "global_step": 176102, "epoch": 4192} {"train_loss": -7.043354034423828, "global_step": 176103, "epoch": 4192} {"train_loss": -7.033908843994141, "global_step": 176104, "epoch": 4192} {"train_loss": -7.036042905989147, "global_step": 176105, "epoch": 4192, "val_loss": 69135.375} {"train_loss": -6.967299938201904, "global_step": 176106, "epoch": 4193} {"train_loss": -7.1911091804504395, "global_step": 176107, "epoch": 4193} {"train_loss": -7.023896217346191, "global_step": 176108, "epoch": 4193} {"train_loss": -7.056612491607666, "global_step": 176109, "epoch": 4193} {"train_loss": -7.048107147216797, "global_step": 176110, "epoch": 4193} {"train_loss": -6.9935688972473145, "global_step": 176111, "epoch": 4193} {"train_loss": -7.134692192077637, "global_step": 176112, "epoch": 4193} {"train_loss": -6.98759651184082, "global_step": 176113, "epoch": 4193} {"train_loss": -7.080965518951416, "global_step": 176114, "epoch": 4193} {"train_loss": -7.016330718994141, "global_step": 176115, "epoch": 4193} {"train_loss": -7.037849426269531, "global_step": 176116, "epoch": 4193} {"train_loss": -6.869815826416016, "global_step": 176117, "epoch": 4193} {"train_loss": -7.004605293273926, "global_step": 176118, "epoch": 4193} {"train_loss": -6.955933094024658, "global_step": 176119, "epoch": 4193} {"train_loss": -7.056882381439209, "global_step": 176120, "epoch": 4193} {"train_loss": -7.068448543548584, "global_step": 176121, "epoch": 4193} {"train_loss": -7.11260461807251, "global_step": 176122, "epoch": 4193} {"train_loss": -7.0620551109313965, "global_step": 176123, "epoch": 4193} {"train_loss": -7.083312034606934, "global_step": 176124, "epoch": 4193} {"train_loss": -7.013125419616699, "global_step": 176125, "epoch": 4193} {"train_loss": -6.991747856140137, "global_step": 176126, "epoch": 4193} {"train_loss": -7.132608413696289, "global_step": 176127, "epoch": 4193} {"train_loss": -7.023986339569092, "global_step": 176128, "epoch": 4193} {"train_loss": -7.104195594787598, "global_step": 176129, "epoch": 4193} {"train_loss": -6.990413188934326, "global_step": 176130, "epoch": 4193} {"train_loss": -7.043552398681641, "global_step": 176131, "epoch": 4193} {"train_loss": -7.027492046356201, "global_step": 176132, "epoch": 4193} {"train_loss": -6.998808860778809, "global_step": 176133, "epoch": 4193} {"train_loss": -7.095768928527832, "global_step": 176134, "epoch": 4193} {"train_loss": -7.022434711456299, "global_step": 176135, "epoch": 4193} {"train_loss": -7.071206092834473, "global_step": 176136, "epoch": 4193} {"train_loss": -6.932192802429199, "global_step": 176137, "epoch": 4193} {"train_loss": -7.166330814361572, "global_step": 176138, "epoch": 4193} {"train_loss": -6.900185585021973, "global_step": 176139, "epoch": 4193} {"train_loss": -7.0359907150268555, "global_step": 176140, "epoch": 4193} {"train_loss": -7.119868278503418, "global_step": 176141, "epoch": 4193} {"train_loss": -7.073003768920898, "global_step": 176142, "epoch": 4193} {"train_loss": -7.118986129760742, "global_step": 176143, "epoch": 4193} {"train_loss": -7.054441452026367, "global_step": 176144, "epoch": 4193} {"train_loss": -7.099333763122559, "global_step": 176145, "epoch": 4193} {"train_loss": -7.103321552276611, "global_step": 176146, "epoch": 4193} {"train_loss": -7.048658234732492, "global_step": 176147, "epoch": 4193, "val_loss": 69215.671875} {"train_loss": -7.139001369476318, "global_step": 176148, "epoch": 4194} {"train_loss": -7.018779277801514, "global_step": 176149, "epoch": 4194} {"train_loss": -7.241938591003418, "global_step": 176150, "epoch": 4194} {"train_loss": -7.0790510177612305, "global_step": 176151, "epoch": 4194} {"train_loss": -7.132208824157715, "global_step": 176152, "epoch": 4194} {"train_loss": -7.154201507568359, "global_step": 176153, "epoch": 4194} {"train_loss": -7.130260467529297, "global_step": 176154, "epoch": 4194} {"train_loss": -7.086845397949219, "global_step": 176155, "epoch": 4194} {"train_loss": -7.078708171844482, "global_step": 176156, "epoch": 4194} {"train_loss": -7.0431976318359375, "global_step": 176157, "epoch": 4194} {"train_loss": -7.10130500793457, "global_step": 176158, "epoch": 4194} {"train_loss": -7.099445343017578, "global_step": 176159, "epoch": 4194} {"train_loss": -7.062750816345215, "global_step": 176160, "epoch": 4194} {"train_loss": -7.055097579956055, "global_step": 176161, "epoch": 4194} {"train_loss": -7.046275615692139, "global_step": 176162, "epoch": 4194} {"train_loss": -7.010133743286133, "global_step": 176163, "epoch": 4194} {"train_loss": -7.1658034324646, "global_step": 176164, "epoch": 4194} {"train_loss": -7.060884475708008, "global_step": 176165, "epoch": 4194} {"train_loss": -7.066988468170166, "global_step": 176166, "epoch": 4194} {"train_loss": -7.088350296020508, "global_step": 176167, "epoch": 4194} {"train_loss": -7.102363586425781, "global_step": 176168, "epoch": 4194} {"train_loss": -7.104046821594238, "global_step": 176169, "epoch": 4194} {"train_loss": -7.018499374389648, "global_step": 176170, "epoch": 4194} {"train_loss": -7.211954116821289, "global_step": 176171, "epoch": 4194} {"train_loss": -7.113263130187988, "global_step": 176172, "epoch": 4194} {"train_loss": -7.082660675048828, "global_step": 176173, "epoch": 4194} {"train_loss": -7.1431450843811035, "global_step": 176174, "epoch": 4194} {"train_loss": -7.153351783752441, "global_step": 176175, "epoch": 4194} {"train_loss": -7.137580871582031, "global_step": 176176, "epoch": 4194} {"train_loss": -7.155522346496582, "global_step": 176177, "epoch": 4194} {"train_loss": -7.171946048736572, "global_step": 176178, "epoch": 4194} {"train_loss": -7.073780536651611, "global_step": 176179, "epoch": 4194} {"train_loss": -7.029884338378906, "global_step": 176180, "epoch": 4194} {"train_loss": -7.0191850662231445, "global_step": 176181, "epoch": 4194} {"train_loss": -7.149662971496582, "global_step": 176182, "epoch": 4194} {"train_loss": -7.128653526306152, "global_step": 176183, "epoch": 4194} {"train_loss": -7.167341232299805, "global_step": 176184, "epoch": 4194} {"train_loss": -6.996700286865234, "global_step": 176185, "epoch": 4194} {"train_loss": -7.1746110916137695, "global_step": 176186, "epoch": 4194} {"train_loss": -6.898972034454346, "global_step": 176187, "epoch": 4194} {"train_loss": -6.986337661743164, "global_step": 176188, "epoch": 4194} {"train_loss": -7.095329897744315, "global_step": 176189, "epoch": 4194, "val_loss": 69137.3359375} {"train_loss": -6.954123020172119, "global_step": 176190, "epoch": 4195} {"train_loss": -6.930353164672852, "global_step": 176191, "epoch": 4195} {"train_loss": -7.053371429443359, "global_step": 176192, "epoch": 4195} {"train_loss": -6.887874603271484, "global_step": 176193, "epoch": 4195} {"train_loss": -7.091428279876709, "global_step": 176194, "epoch": 4195} {"train_loss": -7.171723365783691, "global_step": 176195, "epoch": 4195} {"train_loss": -6.983038902282715, "global_step": 176196, "epoch": 4195} {"train_loss": -7.169285774230957, "global_step": 176197, "epoch": 4195} {"train_loss": -6.929827690124512, "global_step": 176198, "epoch": 4195} {"train_loss": -7.094264030456543, "global_step": 176199, "epoch": 4195} {"train_loss": -6.984490394592285, "global_step": 176200, "epoch": 4195} {"train_loss": -7.008338928222656, "global_step": 176201, "epoch": 4195} {"train_loss": -6.981747150421143, "global_step": 176202, "epoch": 4195} {"train_loss": -7.051620960235596, "global_step": 176203, "epoch": 4195} {"train_loss": -6.955256462097168, "global_step": 176204, "epoch": 4195} {"train_loss": -7.071796417236328, "global_step": 176205, "epoch": 4195} {"train_loss": -7.156110763549805, "global_step": 176206, "epoch": 4195} {"train_loss": -7.1279754638671875, "global_step": 176207, "epoch": 4195} {"train_loss": -7.135308742523193, "global_step": 176208, "epoch": 4195} {"train_loss": -7.090813636779785, "global_step": 176209, "epoch": 4195} {"train_loss": -7.083552360534668, "global_step": 176210, "epoch": 4195} {"train_loss": -7.064149856567383, "global_step": 176211, "epoch": 4195} {"train_loss": -7.054776191711426, "global_step": 176212, "epoch": 4195} {"train_loss": -7.069844722747803, "global_step": 176213, "epoch": 4195} {"train_loss": -7.157205104827881, "global_step": 176214, "epoch": 4195} {"train_loss": -6.964478015899658, "global_step": 176215, "epoch": 4195} {"train_loss": -7.180389404296875, "global_step": 176216, "epoch": 4195} {"train_loss": -7.193417549133301, "global_step": 176217, "epoch": 4195} {"train_loss": -7.12456750869751, "global_step": 176218, "epoch": 4195} {"train_loss": -7.124747276306152, "global_step": 176219, "epoch": 4195} {"train_loss": -7.17048978805542, "global_step": 176220, "epoch": 4195} {"train_loss": -7.145087242126465, "global_step": 176221, "epoch": 4195} {"train_loss": -7.059202194213867, "global_step": 176222, "epoch": 4195} {"train_loss": -7.080669403076172, "global_step": 176223, "epoch": 4195} {"train_loss": -7.062926769256592, "global_step": 176224, "epoch": 4195} {"train_loss": -7.095162391662598, "global_step": 176225, "epoch": 4195} {"train_loss": -7.120178699493408, "global_step": 176226, "epoch": 4195} {"train_loss": -7.073777198791504, "global_step": 176227, "epoch": 4195} {"train_loss": -7.203921318054199, "global_step": 176228, "epoch": 4195} {"train_loss": -7.113578796386719, "global_step": 176229, "epoch": 4195} {"train_loss": -7.1719441413879395, "global_step": 176230, "epoch": 4195} {"train_loss": -7.075844537644159, "global_step": 176231, "epoch": 4195, "val_loss": 69187.328125} {"train_loss": -7.092280864715576, "global_step": 176232, "epoch": 4196} {"train_loss": -7.165424346923828, "global_step": 176233, "epoch": 4196} {"train_loss": -7.182396411895752, "global_step": 176234, "epoch": 4196} {"train_loss": -7.051843643188477, "global_step": 176235, "epoch": 4196} {"train_loss": -7.233080863952637, "global_step": 176236, "epoch": 4196} {"train_loss": -7.232983589172363, "global_step": 176237, "epoch": 4196} {"train_loss": -7.262684345245361, "global_step": 176238, "epoch": 4196} {"train_loss": -7.123495101928711, "global_step": 176239, "epoch": 4196} {"train_loss": -7.1403398513793945, "global_step": 176240, "epoch": 4196} {"train_loss": -6.969144344329834, "global_step": 176241, "epoch": 4196} {"train_loss": -7.021365642547607, "global_step": 176242, "epoch": 4196} {"train_loss": -7.138141632080078, "global_step": 176243, "epoch": 4196} {"train_loss": -7.098196029663086, "global_step": 176244, "epoch": 4196} {"train_loss": -7.0659589767456055, "global_step": 176245, "epoch": 4196} {"train_loss": -7.118771553039551, "global_step": 176246, "epoch": 4196} {"train_loss": -7.199913024902344, "global_step": 176247, "epoch": 4196} {"train_loss": -7.185755729675293, "global_step": 176248, "epoch": 4196} {"train_loss": -7.164764404296875, "global_step": 176249, "epoch": 4196} {"train_loss": -7.158476829528809, "global_step": 176250, "epoch": 4196} {"train_loss": -7.101455211639404, "global_step": 176251, "epoch": 4196} {"train_loss": -7.082062721252441, "global_step": 176252, "epoch": 4196} {"train_loss": -7.206521987915039, "global_step": 176253, "epoch": 4196} {"train_loss": -7.191887378692627, "global_step": 176254, "epoch": 4196} {"train_loss": -7.126584529876709, "global_step": 176255, "epoch": 4196} {"train_loss": -7.087776184082031, "global_step": 176256, "epoch": 4196} {"train_loss": -7.085365295410156, "global_step": 176257, "epoch": 4196} {"train_loss": -7.024936199188232, "global_step": 176258, "epoch": 4196} {"train_loss": -7.108040809631348, "global_step": 176259, "epoch": 4196} {"train_loss": -7.127330780029297, "global_step": 176260, "epoch": 4196} {"train_loss": -7.1201348304748535, "global_step": 176261, "epoch": 4196} {"train_loss": -7.080953598022461, "global_step": 176262, "epoch": 4196} {"train_loss": -7.165164947509766, "global_step": 176263, "epoch": 4196} {"train_loss": -7.125186920166016, "global_step": 176264, "epoch": 4196} {"train_loss": -7.093961715698242, "global_step": 176265, "epoch": 4196} {"train_loss": -7.113097667694092, "global_step": 176266, "epoch": 4196} {"train_loss": -7.073199272155762, "global_step": 176267, "epoch": 4196} {"train_loss": -7.100427627563477, "global_step": 176268, "epoch": 4196} {"train_loss": -7.1368279457092285, "global_step": 176269, "epoch": 4196} {"train_loss": -7.18098258972168, "global_step": 176270, "epoch": 4196} {"train_loss": -7.042000770568848, "global_step": 176271, "epoch": 4196} {"train_loss": -7.049488067626953, "global_step": 176272, "epoch": 4196} {"train_loss": -7.1213002772558305, "global_step": 176273, "epoch": 4196, "val_loss": 69280.328125} {"train_loss": -7.0416951179504395, "global_step": 176274, "epoch": 4197} {"train_loss": -7.118542671203613, "global_step": 176275, "epoch": 4197} {"train_loss": -7.192598819732666, "global_step": 176276, "epoch": 4197} {"train_loss": -7.120429515838623, "global_step": 176277, "epoch": 4197} {"train_loss": -7.138659477233887, "global_step": 176278, "epoch": 4197} {"train_loss": -7.140286922454834, "global_step": 176279, "epoch": 4197} {"train_loss": -7.142226696014404, "global_step": 176280, "epoch": 4197} {"train_loss": -7.165580749511719, "global_step": 176281, "epoch": 4197} {"train_loss": -7.004609107971191, "global_step": 176282, "epoch": 4197} {"train_loss": -7.160216331481934, "global_step": 176283, "epoch": 4197} {"train_loss": -7.1461381912231445, "global_step": 176284, "epoch": 4197} {"train_loss": -7.15534782409668, "global_step": 176285, "epoch": 4197} {"train_loss": -7.139804840087891, "global_step": 176286, "epoch": 4197} {"train_loss": -7.117987632751465, "global_step": 176287, "epoch": 4197} {"train_loss": -7.110788822174072, "global_step": 176288, "epoch": 4197} {"train_loss": -7.0446085929870605, "global_step": 176289, "epoch": 4197} {"train_loss": -7.004124641418457, "global_step": 176290, "epoch": 4197} {"train_loss": -7.090870380401611, "global_step": 176291, "epoch": 4197} {"train_loss": -7.124989986419678, "global_step": 176292, "epoch": 4197} {"train_loss": -7.0627851486206055, "global_step": 176293, "epoch": 4197} {"train_loss": -7.102813720703125, "global_step": 176294, "epoch": 4197} {"train_loss": -6.897212028503418, "global_step": 176295, "epoch": 4197} {"train_loss": -7.216248512268066, "global_step": 176296, "epoch": 4197} {"train_loss": -7.16048526763916, "global_step": 176297, "epoch": 4197} {"train_loss": -7.031798362731934, "global_step": 176298, "epoch": 4197} {"train_loss": -7.153346538543701, "global_step": 176299, "epoch": 4197} {"train_loss": -7.138054370880127, "global_step": 176300, "epoch": 4197} {"train_loss": -6.944348335266113, "global_step": 176301, "epoch": 4197} {"train_loss": -7.080821514129639, "global_step": 176302, "epoch": 4197} {"train_loss": -7.131008148193359, "global_step": 176303, "epoch": 4197} {"train_loss": -6.99237060546875, "global_step": 176304, "epoch": 4197} {"train_loss": -7.051923751831055, "global_step": 176305, "epoch": 4197} {"train_loss": -7.009977340698242, "global_step": 176306, "epoch": 4197} {"train_loss": -6.965351104736328, "global_step": 176307, "epoch": 4197} {"train_loss": -7.102715015411377, "global_step": 176308, "epoch": 4197} {"train_loss": -6.950674057006836, "global_step": 176309, "epoch": 4197} {"train_loss": -7.0411481857299805, "global_step": 176310, "epoch": 4197} {"train_loss": -7.0020036697387695, "global_step": 176311, "epoch": 4197} {"train_loss": -7.043341636657715, "global_step": 176312, "epoch": 4197} {"train_loss": -6.992387294769287, "global_step": 176313, "epoch": 4197} {"train_loss": -6.962091445922852, "global_step": 176314, "epoch": 4197} {"train_loss": -7.077740078880673, "global_step": 176315, "epoch": 4197, "val_loss": 69140.6953125} {"train_loss": -6.952897548675537, "global_step": 176316, "epoch": 4198} {"train_loss": -7.0375657081604, "global_step": 176317, "epoch": 4198} {"train_loss": -7.062949180603027, "global_step": 176318, "epoch": 4198} {"train_loss": -7.114136695861816, "global_step": 176319, "epoch": 4198} {"train_loss": -7.053625106811523, "global_step": 176320, "epoch": 4198} {"train_loss": -7.008093357086182, "global_step": 176321, "epoch": 4198} {"train_loss": -7.092159271240234, "global_step": 176322, "epoch": 4198} {"train_loss": -7.09309196472168, "global_step": 176323, "epoch": 4198} {"train_loss": -7.112883567810059, "global_step": 176324, "epoch": 4198} {"train_loss": -7.08477258682251, "global_step": 176325, "epoch": 4198} {"train_loss": -7.169256687164307, "global_step": 176326, "epoch": 4198} {"train_loss": -7.038236618041992, "global_step": 176327, "epoch": 4198} {"train_loss": -7.129199981689453, "global_step": 176328, "epoch": 4198} {"train_loss": -7.062906265258789, "global_step": 176329, "epoch": 4198} {"train_loss": -7.161135673522949, "global_step": 176330, "epoch": 4198} {"train_loss": -7.081567287445068, "global_step": 176331, "epoch": 4198} {"train_loss": -7.080941677093506, "global_step": 176332, "epoch": 4198} {"train_loss": -7.1337738037109375, "global_step": 176333, "epoch": 4198} {"train_loss": -7.142671585083008, "global_step": 176334, "epoch": 4198} {"train_loss": -7.112889289855957, "global_step": 176335, "epoch": 4198} {"train_loss": -7.093962669372559, "global_step": 176336, "epoch": 4198} {"train_loss": -6.99317741394043, "global_step": 176337, "epoch": 4198} {"train_loss": -7.134313583374023, "global_step": 176338, "epoch": 4198} {"train_loss": -7.06987190246582, "global_step": 176339, "epoch": 4198} {"train_loss": -7.098474502563477, "global_step": 176340, "epoch": 4198} {"train_loss": -7.13789701461792, "global_step": 176341, "epoch": 4198} {"train_loss": -7.239116668701172, "global_step": 176342, "epoch": 4198} {"train_loss": -7.095731735229492, "global_step": 176343, "epoch": 4198} {"train_loss": -7.051877498626709, "global_step": 176344, "epoch": 4198} {"train_loss": -7.139127731323242, "global_step": 176345, "epoch": 4198} {"train_loss": -7.143922805786133, "global_step": 176346, "epoch": 4198} {"train_loss": -7.064201354980469, "global_step": 176347, "epoch": 4198} {"train_loss": -7.080628871917725, "global_step": 176348, "epoch": 4198} {"train_loss": -7.133939743041992, "global_step": 176349, "epoch": 4198} {"train_loss": -7.212677001953125, "global_step": 176350, "epoch": 4198} {"train_loss": -7.137718200683594, "global_step": 176351, "epoch": 4198} {"train_loss": -7.1184868812561035, "global_step": 176352, "epoch": 4198} {"train_loss": -7.2028608322143555, "global_step": 176353, "epoch": 4198} {"train_loss": -7.189903259277344, "global_step": 176354, "epoch": 4198} {"train_loss": -7.163424491882324, "global_step": 176355, "epoch": 4198} {"train_loss": -7.0206427574157715, "global_step": 176356, "epoch": 4198} {"train_loss": -7.104094005766369, "global_step": 176357, "epoch": 4198, "val_loss": 69266.015625} {"train_loss": -7.071838855743408, "global_step": 176358, "epoch": 4199} {"train_loss": -6.958199501037598, "global_step": 176359, "epoch": 4199} {"train_loss": -6.974031925201416, "global_step": 176360, "epoch": 4199} {"train_loss": -7.030799865722656, "global_step": 176361, "epoch": 4199} {"train_loss": -6.946062088012695, "global_step": 176362, "epoch": 4199} {"train_loss": -6.938072204589844, "global_step": 176363, "epoch": 4199} {"train_loss": -7.132909774780273, "global_step": 176364, "epoch": 4199} {"train_loss": -6.934334754943848, "global_step": 176365, "epoch": 4199} {"train_loss": -7.044593334197998, "global_step": 176366, "epoch": 4199} {"train_loss": -7.061792373657227, "global_step": 176367, "epoch": 4199} {"train_loss": -6.937363624572754, "global_step": 176368, "epoch": 4199} {"train_loss": -7.087759017944336, "global_step": 176369, "epoch": 4199} {"train_loss": -6.970980644226074, "global_step": 176370, "epoch": 4199} {"train_loss": -7.013457298278809, "global_step": 176371, "epoch": 4199} {"train_loss": -7.044991493225098, "global_step": 176372, "epoch": 4199} {"train_loss": -7.087505340576172, "global_step": 176373, "epoch": 4199} {"train_loss": -7.095363616943359, "global_step": 176374, "epoch": 4199} {"train_loss": -7.066832542419434, "global_step": 176375, "epoch": 4199} {"train_loss": -7.053115367889404, "global_step": 176376, "epoch": 4199} {"train_loss": -7.0350165367126465, "global_step": 176377, "epoch": 4199} {"train_loss": -7.011960029602051, "global_step": 176378, "epoch": 4199} {"train_loss": -7.03751277923584, "global_step": 176379, "epoch": 4199} {"train_loss": -7.019671440124512, "global_step": 176380, "epoch": 4199} {"train_loss": -7.1568756103515625, "global_step": 176381, "epoch": 4199} {"train_loss": -7.016508102416992, "global_step": 176382, "epoch": 4199} {"train_loss": -7.125240325927734, "global_step": 176383, "epoch": 4199} {"train_loss": -7.105355262756348, "global_step": 176384, "epoch": 4199} {"train_loss": -7.134774208068848, "global_step": 176385, "epoch": 4199} {"train_loss": -7.085606575012207, "global_step": 176386, "epoch": 4199} {"train_loss": -7.067079544067383, "global_step": 176387, "epoch": 4199} {"train_loss": -7.130827903747559, "global_step": 176388, "epoch": 4199} {"train_loss": -7.123204708099365, "global_step": 176389, "epoch": 4199} {"train_loss": -7.182427406311035, "global_step": 176390, "epoch": 4199} {"train_loss": -7.155490875244141, "global_step": 176391, "epoch": 4199} {"train_loss": -7.114139556884766, "global_step": 176392, "epoch": 4199} {"train_loss": -7.125334739685059, "global_step": 176393, "epoch": 4199} {"train_loss": -7.171104431152344, "global_step": 176394, "epoch": 4199} {"train_loss": -7.090705394744873, "global_step": 176395, "epoch": 4199} {"train_loss": -7.158376216888428, "global_step": 176396, "epoch": 4199} {"train_loss": -7.148296356201172, "global_step": 176397, "epoch": 4199} {"train_loss": -7.102344036102295, "global_step": 176398, "epoch": 4199} {"train_loss": -7.065963461285546, "global_step": 176399, "epoch": 4199, "val_loss": 69364.953125} {"train_loss": -7.042150497436523, "global_step": 176400, "epoch": 4200} {"train_loss": -6.952343940734863, "global_step": 176401, "epoch": 4200} {"train_loss": -7.026060104370117, "global_step": 176402, "epoch": 4200} {"train_loss": -7.214732646942139, "global_step": 176403, "epoch": 4200} {"train_loss": -7.131537437438965, "global_step": 176404, "epoch": 4200} {"train_loss": -7.224603652954102, "global_step": 176405, "epoch": 4200} {"train_loss": -7.104473114013672, "global_step": 176406, "epoch": 4200} {"train_loss": -7.058119773864746, "global_step": 176407, "epoch": 4200} {"train_loss": -7.062007904052734, "global_step": 176408, "epoch": 4200} {"train_loss": -7.042602062225342, "global_step": 176409, "epoch": 4200} {"train_loss": -7.029916286468506, "global_step": 176410, "epoch": 4200} {"train_loss": -7.069395542144775, "global_step": 176411, "epoch": 4200} {"train_loss": -7.005118370056152, "global_step": 176412, "epoch": 4200} {"train_loss": -7.082550048828125, "global_step": 176413, "epoch": 4200} {"train_loss": -7.151423454284668, "global_step": 176414, "epoch": 4200} {"train_loss": -6.926382541656494, "global_step": 176415, "epoch": 4200} {"train_loss": -6.86274528503418, "global_step": 176416, "epoch": 4200} {"train_loss": -7.0656843185424805, "global_step": 176417, "epoch": 4200} {"train_loss": -6.884372711181641, "global_step": 176418, "epoch": 4200} {"train_loss": -6.917685031890869, "global_step": 176419, "epoch": 4200} {"train_loss": -7.091423988342285, "global_step": 176420, "epoch": 4200} {"train_loss": -7.104976654052734, "global_step": 176421, "epoch": 4200} {"train_loss": -7.088357925415039, "global_step": 176422, "epoch": 4200} {"train_loss": -7.198575019836426, "global_step": 176423, "epoch": 4200} {"train_loss": -7.036800384521484, "global_step": 176424, "epoch": 4200} {"train_loss": -7.091073989868164, "global_step": 176425, "epoch": 4200} {"train_loss": -7.140664100646973, "global_step": 176426, "epoch": 4200} {"train_loss": -7.180552959442139, "global_step": 176427, "epoch": 4200} {"train_loss": -7.078351974487305, "global_step": 176428, "epoch": 4200} {"train_loss": -7.0233917236328125, "global_step": 176429, "epoch": 4200} {"train_loss": -7.114755630493164, "global_step": 176430, "epoch": 4200} {"train_loss": -7.138223171234131, "global_step": 176431, "epoch": 4200} {"train_loss": -7.117730140686035, "global_step": 176432, "epoch": 4200} {"train_loss": -7.151745796203613, "global_step": 176433, "epoch": 4200} {"train_loss": -7.012241363525391, "global_step": 176434, "epoch": 4200} {"train_loss": -7.115636348724365, "global_step": 176435, "epoch": 4200} {"train_loss": -7.179010391235352, "global_step": 176436, "epoch": 4200} {"train_loss": -7.089896202087402, "global_step": 176437, "epoch": 4200} {"train_loss": -7.130328178405762, "global_step": 176438, "epoch": 4200} {"train_loss": -7.103318214416504, "global_step": 176439, "epoch": 4200} {"train_loss": -7.089108467102051, "global_step": 176440, "epoch": 4200} {"train_loss": -7.075470072882516, "global_step": 176441, "epoch": 4200, "train/sim_max_reward_0": 0.8834689936185466, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.572079523885662, "train/sim_max_reward_3": 0.13240110395443075, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.944623652970374, "test/sim_max_reward_4300001": 0.5141952187643465, "test/sim_max_reward_4300002": 0.9378100698398484, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8490310084952557, "test/sim_max_reward_4300006": 0.6884096720434959, "test/sim_max_reward_4300007": 0.17048035828444186, "test/sim_max_reward_4300008": 0.9135630912199415, "test/sim_max_reward_4300009": 0.9406260299143694, "test/sim_max_reward_4300010": 0.9681182228507141, "test/sim_max_reward_4300011": 0.9869830324953787, "test/sim_max_reward_4300012": 0.9547021274399223, "test/sim_max_reward_4300013": 0.4035636659681807, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9903280029043818, "test/sim_max_reward_4300016": 0.700681556506292, "test/sim_max_reward_4300017": 0.9266813881730015, "test/sim_max_reward_4300018": 0.39226262895862374, "test/sim_max_reward_4300019": 0.18579541379777262, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9284001653986144, "test/sim_max_reward_4300022": 0.8494970385771679, "test/sim_max_reward_4300023": 1.0, "test/sim_max_reward_4300024": 0.3951413947074557, "test/sim_max_reward_4300025": 0.9708822633431552, "test/sim_max_reward_4300026": 0.19045021758761987, "test/sim_max_reward_4300027": 0.9136053911488385, "test/sim_max_reward_4300028": 1.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.30070194817340873, "test/sim_max_reward_4300031": 0.20858878065105282, "test/sim_max_reward_4300032": 0.9039612273242853, "test/sim_max_reward_4300033": 0.6575686394304452, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.3892967932971555, "test/sim_max_reward_4300036": 0.22654534212275385, "test/sim_max_reward_4300037": 0.6602499278191089, "test/sim_max_reward_4300038": 0.9082194935995503, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.9453060492164171, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.4861732550441108, "test/sim_max_reward_4300043": 0.1432208708241308, "test/sim_max_reward_4300044": 0.7796962998343171, "test/sim_max_reward_4300045": 0.9737181137803272, "test/sim_max_reward_4300046": 0.9891818278945764, "test/sim_max_reward_4300047": 0.12305289750495414, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.2435958940262865, "train/mean_score": 0.6301557301368045, "test/mean_score": 0.6134148615348272, "val_loss": 69239.0859375} {"train_loss": -7.186491012573242, "global_step": 176442, "epoch": 4201} {"train_loss": -7.144850730895996, "global_step": 176443, "epoch": 4201} {"train_loss": -7.131947040557861, "global_step": 176444, "epoch": 4201} {"train_loss": -7.054383277893066, "global_step": 176445, "epoch": 4201} {"train_loss": -7.082060813903809, "global_step": 176446, "epoch": 4201} {"train_loss": -7.120649337768555, "global_step": 176447, "epoch": 4201} {"train_loss": -7.053849220275879, "global_step": 176448, "epoch": 4201} {"train_loss": -7.086580276489258, "global_step": 176449, "epoch": 4201} {"train_loss": -7.043932914733887, "global_step": 176450, "epoch": 4201} {"train_loss": -7.019274711608887, "global_step": 176451, "epoch": 4201} {"train_loss": -7.151510715484619, "global_step": 176452, "epoch": 4201} {"train_loss": -7.017734527587891, "global_step": 176453, "epoch": 4201} {"train_loss": -7.034426689147949, "global_step": 176454, "epoch": 4201} {"train_loss": -6.983513832092285, "global_step": 176455, "epoch": 4201} {"train_loss": -6.9798126220703125, "global_step": 176456, "epoch": 4201} {"train_loss": -7.027998924255371, "global_step": 176457, "epoch": 4201} {"train_loss": -7.0315961837768555, "global_step": 176458, "epoch": 4201} {"train_loss": -7.015893459320068, "global_step": 176459, "epoch": 4201} {"train_loss": -7.17265510559082, "global_step": 176460, "epoch": 4201} {"train_loss": -6.99559211730957, "global_step": 176461, "epoch": 4201} {"train_loss": -7.028080940246582, "global_step": 176462, "epoch": 4201} {"train_loss": -7.093642234802246, "global_step": 176463, "epoch": 4201} {"train_loss": -7.105476379394531, "global_step": 176464, "epoch": 4201} {"train_loss": -7.12158203125, "global_step": 176465, "epoch": 4201} {"train_loss": -7.079855918884277, "global_step": 176466, "epoch": 4201} {"train_loss": -6.994328498840332, "global_step": 176467, "epoch": 4201} {"train_loss": -7.18325138092041, "global_step": 176468, "epoch": 4201} {"train_loss": -6.9799065589904785, "global_step": 176469, "epoch": 4201} {"train_loss": -7.055121421813965, "global_step": 176470, "epoch": 4201} {"train_loss": -6.969606876373291, "global_step": 176471, "epoch": 4201} {"train_loss": -7.052708625793457, "global_step": 176472, "epoch": 4201} {"train_loss": -7.045660972595215, "global_step": 176473, "epoch": 4201} {"train_loss": -7.01072883605957, "global_step": 176474, "epoch": 4201} {"train_loss": -7.025731563568115, "global_step": 176475, "epoch": 4201} {"train_loss": -6.954765319824219, "global_step": 176476, "epoch": 4201} {"train_loss": -7.144397735595703, "global_step": 176477, "epoch": 4201} {"train_loss": -7.111796855926514, "global_step": 176478, "epoch": 4201} {"train_loss": -7.031940460205078, "global_step": 176479, "epoch": 4201} {"train_loss": -7.040521621704102, "global_step": 176480, "epoch": 4201} {"train_loss": -6.953982353210449, "global_step": 176481, "epoch": 4201} {"train_loss": -7.021987438201904, "global_step": 176482, "epoch": 4201} {"train_loss": -7.0580928439185735, "global_step": 176483, "epoch": 4201, "val_loss": 69350.875} {"train_loss": -6.969689846038818, "global_step": 176484, "epoch": 4202} {"train_loss": -7.0539422035217285, "global_step": 176485, "epoch": 4202} {"train_loss": -6.940272331237793, "global_step": 176486, "epoch": 4202} {"train_loss": -7.036077499389648, "global_step": 176487, "epoch": 4202} {"train_loss": -7.104968070983887, "global_step": 176488, "epoch": 4202} {"train_loss": -7.023809909820557, "global_step": 176489, "epoch": 4202} {"train_loss": -7.002473831176758, "global_step": 176490, "epoch": 4202} {"train_loss": -7.081999778747559, "global_step": 176491, "epoch": 4202} {"train_loss": -7.014368057250977, "global_step": 176492, "epoch": 4202} {"train_loss": -7.0995306968688965, "global_step": 176493, "epoch": 4202} {"train_loss": -7.042348861694336, "global_step": 176494, "epoch": 4202} {"train_loss": -7.110969066619873, "global_step": 176495, "epoch": 4202} {"train_loss": -7.180874824523926, "global_step": 176496, "epoch": 4202} {"train_loss": -7.012788772583008, "global_step": 176497, "epoch": 4202} {"train_loss": -7.058980941772461, "global_step": 176498, "epoch": 4202} {"train_loss": -7.1666741371154785, "global_step": 176499, "epoch": 4202} {"train_loss": -7.078429222106934, "global_step": 176500, "epoch": 4202} {"train_loss": -7.088369369506836, "global_step": 176501, "epoch": 4202} {"train_loss": -7.131041526794434, "global_step": 176502, "epoch": 4202} {"train_loss": -7.047849655151367, "global_step": 176503, "epoch": 4202} {"train_loss": -7.051093101501465, "global_step": 176504, "epoch": 4202} {"train_loss": -7.05709981918335, "global_step": 176505, "epoch": 4202} {"train_loss": -6.987675189971924, "global_step": 176506, "epoch": 4202} {"train_loss": -7.056097984313965, "global_step": 176507, "epoch": 4202} {"train_loss": -7.166059494018555, "global_step": 176508, "epoch": 4202} {"train_loss": -7.009974479675293, "global_step": 176509, "epoch": 4202} {"train_loss": -7.039811611175537, "global_step": 176510, "epoch": 4202} {"train_loss": -7.116475582122803, "global_step": 176511, "epoch": 4202} {"train_loss": -6.9454498291015625, "global_step": 176512, "epoch": 4202} {"train_loss": -7.0893378257751465, "global_step": 176513, "epoch": 4202} {"train_loss": -7.13910436630249, "global_step": 176514, "epoch": 4202} {"train_loss": -6.990981101989746, "global_step": 176515, "epoch": 4202} {"train_loss": -7.000869274139404, "global_step": 176516, "epoch": 4202} {"train_loss": -7.116046905517578, "global_step": 176517, "epoch": 4202} {"train_loss": -7.069246292114258, "global_step": 176518, "epoch": 4202} {"train_loss": -7.037168502807617, "global_step": 176519, "epoch": 4202} {"train_loss": -6.940053939819336, "global_step": 176520, "epoch": 4202} {"train_loss": -7.031018257141113, "global_step": 176521, "epoch": 4202} {"train_loss": -7.043108940124512, "global_step": 176522, "epoch": 4202} {"train_loss": -7.078271389007568, "global_step": 176523, "epoch": 4202} {"train_loss": -6.929324150085449, "global_step": 176524, "epoch": 4202} {"train_loss": -7.0520455950782415, "global_step": 176525, "epoch": 4202, "val_loss": 69242.390625} {"train_loss": -7.200090408325195, "global_step": 176526, "epoch": 4203} {"train_loss": -7.082469940185547, "global_step": 176527, "epoch": 4203} {"train_loss": -7.037781715393066, "global_step": 176528, "epoch": 4203} {"train_loss": -7.141730308532715, "global_step": 176529, "epoch": 4203} {"train_loss": -7.009512901306152, "global_step": 176530, "epoch": 4203} {"train_loss": -7.130112171173096, "global_step": 176531, "epoch": 4203} {"train_loss": -7.059372901916504, "global_step": 176532, "epoch": 4203} {"train_loss": -7.141083717346191, "global_step": 176533, "epoch": 4203} {"train_loss": -7.027683258056641, "global_step": 176534, "epoch": 4203} {"train_loss": -7.186222553253174, "global_step": 176535, "epoch": 4203} {"train_loss": -7.096545696258545, "global_step": 176536, "epoch": 4203} {"train_loss": -7.0104265213012695, "global_step": 176537, "epoch": 4203} {"train_loss": -7.008481979370117, "global_step": 176538, "epoch": 4203} {"train_loss": -7.150534629821777, "global_step": 176539, "epoch": 4203} {"train_loss": -6.9947075843811035, "global_step": 176540, "epoch": 4203} {"train_loss": -7.179262638092041, "global_step": 176541, "epoch": 4203} {"train_loss": -7.145749092102051, "global_step": 176542, "epoch": 4203} {"train_loss": -6.988423824310303, "global_step": 176543, "epoch": 4203} {"train_loss": -6.952694416046143, "global_step": 176544, "epoch": 4203} {"train_loss": -7.078069686889648, "global_step": 176545, "epoch": 4203} {"train_loss": -7.011538505554199, "global_step": 176546, "epoch": 4203} {"train_loss": -7.057173728942871, "global_step": 176547, "epoch": 4203} {"train_loss": -7.119567394256592, "global_step": 176548, "epoch": 4203} {"train_loss": -7.134660720825195, "global_step": 176549, "epoch": 4203} {"train_loss": -7.033535957336426, "global_step": 176550, "epoch": 4203} {"train_loss": -7.030322074890137, "global_step": 176551, "epoch": 4203} {"train_loss": -7.101805686950684, "global_step": 176552, "epoch": 4203} {"train_loss": -7.015398025512695, "global_step": 176553, "epoch": 4203} {"train_loss": -6.866236209869385, "global_step": 176554, "epoch": 4203} {"train_loss": -7.069591999053955, "global_step": 176555, "epoch": 4203} {"train_loss": -6.92825984954834, "global_step": 176556, "epoch": 4203} {"train_loss": -7.026579856872559, "global_step": 176557, "epoch": 4203} {"train_loss": -7.101400852203369, "global_step": 176558, "epoch": 4203} {"train_loss": -7.0984978675842285, "global_step": 176559, "epoch": 4203} {"train_loss": -6.881742477416992, "global_step": 176560, "epoch": 4203} {"train_loss": -7.078287124633789, "global_step": 176561, "epoch": 4203} {"train_loss": -7.042959213256836, "global_step": 176562, "epoch": 4203} {"train_loss": -7.052404403686523, "global_step": 176563, "epoch": 4203} {"train_loss": -6.9856109619140625, "global_step": 176564, "epoch": 4203} {"train_loss": -7.007568836212158, "global_step": 176565, "epoch": 4203} {"train_loss": -7.105130195617676, "global_step": 176566, "epoch": 4203} {"train_loss": -7.055516867410569, "global_step": 176567, "epoch": 4203, "val_loss": 69340.078125} {"train_loss": -7.1340460777282715, "global_step": 176568, "epoch": 4204} {"train_loss": -7.142546653747559, "global_step": 176569, "epoch": 4204} {"train_loss": -7.019771575927734, "global_step": 176570, "epoch": 4204} {"train_loss": -7.174576282501221, "global_step": 176571, "epoch": 4204} {"train_loss": -7.054730415344238, "global_step": 176572, "epoch": 4204} {"train_loss": -7.120362281799316, "global_step": 176573, "epoch": 4204} {"train_loss": -7.076279163360596, "global_step": 176574, "epoch": 4204} {"train_loss": -7.164311408996582, "global_step": 176575, "epoch": 4204} {"train_loss": -7.034146308898926, "global_step": 176576, "epoch": 4204} {"train_loss": -7.034224510192871, "global_step": 176577, "epoch": 4204} {"train_loss": -7.018435955047607, "global_step": 176578, "epoch": 4204} {"train_loss": -7.0132951736450195, "global_step": 176579, "epoch": 4204} {"train_loss": -7.1576690673828125, "global_step": 176580, "epoch": 4204} {"train_loss": -7.059847831726074, "global_step": 176581, "epoch": 4204} {"train_loss": -7.027591705322266, "global_step": 176582, "epoch": 4204} {"train_loss": -7.116613388061523, "global_step": 176583, "epoch": 4204} {"train_loss": -6.993099689483643, "global_step": 176584, "epoch": 4204} {"train_loss": -7.123409271240234, "global_step": 176585, "epoch": 4204} {"train_loss": -7.105012893676758, "global_step": 176586, "epoch": 4204} {"train_loss": -7.02338981628418, "global_step": 176587, "epoch": 4204} {"train_loss": -7.233998775482178, "global_step": 176588, "epoch": 4204} {"train_loss": -7.1059160232543945, "global_step": 176589, "epoch": 4204} {"train_loss": -7.185437202453613, "global_step": 176590, "epoch": 4204} {"train_loss": -7.12005615234375, "global_step": 176591, "epoch": 4204} {"train_loss": -7.121383190155029, "global_step": 176592, "epoch": 4204} {"train_loss": -7.073319911956787, "global_step": 176593, "epoch": 4204} {"train_loss": -6.940435409545898, "global_step": 176594, "epoch": 4204} {"train_loss": -7.078469276428223, "global_step": 176595, "epoch": 4204} {"train_loss": -7.095673084259033, "global_step": 176596, "epoch": 4204} {"train_loss": -7.046281337738037, "global_step": 176597, "epoch": 4204} {"train_loss": -7.091599464416504, "global_step": 176598, "epoch": 4204} {"train_loss": -7.073162078857422, "global_step": 176599, "epoch": 4204} {"train_loss": -7.087166786193848, "global_step": 176600, "epoch": 4204} {"train_loss": -7.068552494049072, "global_step": 176601, "epoch": 4204} {"train_loss": -7.055395603179932, "global_step": 176602, "epoch": 4204} {"train_loss": -7.171291351318359, "global_step": 176603, "epoch": 4204} {"train_loss": -6.898294925689697, "global_step": 176604, "epoch": 4204} {"train_loss": -7.166943073272705, "global_step": 176605, "epoch": 4204} {"train_loss": -7.069696426391602, "global_step": 176606, "epoch": 4204} {"train_loss": -6.993371963500977, "global_step": 176607, "epoch": 4204} {"train_loss": -7.138327121734619, "global_step": 176608, "epoch": 4204} {"train_loss": -7.081261146636236, "global_step": 176609, "epoch": 4204, "val_loss": 69123.59375} {"train_loss": -7.024049282073975, "global_step": 176610, "epoch": 4205} {"train_loss": -7.146617889404297, "global_step": 176611, "epoch": 4205} {"train_loss": -7.0455498695373535, "global_step": 176612, "epoch": 4205} {"train_loss": -6.992288589477539, "global_step": 176613, "epoch": 4205} {"train_loss": -7.03885555267334, "global_step": 176614, "epoch": 4205} {"train_loss": -7.02114200592041, "global_step": 176615, "epoch": 4205} {"train_loss": -7.04716682434082, "global_step": 176616, "epoch": 4205} {"train_loss": -6.937156677246094, "global_step": 176617, "epoch": 4205} {"train_loss": -6.976986408233643, "global_step": 176618, "epoch": 4205} {"train_loss": -7.057099342346191, "global_step": 176619, "epoch": 4205} {"train_loss": -6.918872833251953, "global_step": 176620, "epoch": 4205} {"train_loss": -7.120718002319336, "global_step": 176621, "epoch": 4205} {"train_loss": -6.999594211578369, "global_step": 176622, "epoch": 4205} {"train_loss": -6.988189697265625, "global_step": 176623, "epoch": 4205} {"train_loss": -7.093822002410889, "global_step": 176624, "epoch": 4205} {"train_loss": -6.92812967300415, "global_step": 176625, "epoch": 4205} {"train_loss": -7.051965713500977, "global_step": 176626, "epoch": 4205} {"train_loss": -7.071319103240967, "global_step": 176627, "epoch": 4205} {"train_loss": -7.008672714233398, "global_step": 176628, "epoch": 4205} {"train_loss": -7.042975425720215, "global_step": 176629, "epoch": 4205} {"train_loss": -7.097987174987793, "global_step": 176630, "epoch": 4205} {"train_loss": -7.053918838500977, "global_step": 176631, "epoch": 4205} {"train_loss": -7.0238823890686035, "global_step": 176632, "epoch": 4205} {"train_loss": -7.022370338439941, "global_step": 176633, "epoch": 4205} {"train_loss": -7.000088691711426, "global_step": 176634, "epoch": 4205} {"train_loss": -7.034039497375488, "global_step": 176635, "epoch": 4205} {"train_loss": -7.105019569396973, "global_step": 176636, "epoch": 4205} {"train_loss": -7.122720718383789, "global_step": 176637, "epoch": 4205} {"train_loss": -7.088230133056641, "global_step": 176638, "epoch": 4205} {"train_loss": -7.1443023681640625, "global_step": 176639, "epoch": 4205} {"train_loss": -7.068852424621582, "global_step": 176640, "epoch": 4205} {"train_loss": -7.107251167297363, "global_step": 176641, "epoch": 4205} {"train_loss": -7.062498569488525, "global_step": 176642, "epoch": 4205} {"train_loss": -7.214529514312744, "global_step": 176643, "epoch": 4205} {"train_loss": -7.184439182281494, "global_step": 176644, "epoch": 4205} {"train_loss": -7.111216068267822, "global_step": 176645, "epoch": 4205} {"train_loss": -7.023138999938965, "global_step": 176646, "epoch": 4205} {"train_loss": -7.025512218475342, "global_step": 176647, "epoch": 4205} {"train_loss": -7.029270648956299, "global_step": 176648, "epoch": 4205} {"train_loss": -7.105415344238281, "global_step": 176649, "epoch": 4205} {"train_loss": -7.075765609741211, "global_step": 176650, "epoch": 4205} {"train_loss": -7.052663541975475, "global_step": 176651, "epoch": 4205, "val_loss": 69297.9765625} {"train_loss": -7.126945495605469, "global_step": 176652, "epoch": 4206} {"train_loss": -7.147120475769043, "global_step": 176653, "epoch": 4206} {"train_loss": -7.1172614097595215, "global_step": 176654, "epoch": 4206} {"train_loss": -7.216986179351807, "global_step": 176655, "epoch": 4206} {"train_loss": -7.118730068206787, "global_step": 176656, "epoch": 4206} {"train_loss": -7.1661787033081055, "global_step": 176657, "epoch": 4206} {"train_loss": -7.1598615646362305, "global_step": 176658, "epoch": 4206} {"train_loss": -7.10653018951416, "global_step": 176659, "epoch": 4206} {"train_loss": -7.073064804077148, "global_step": 176660, "epoch": 4206} {"train_loss": -7.069024085998535, "global_step": 176661, "epoch": 4206} {"train_loss": -7.126025676727295, "global_step": 176662, "epoch": 4206} {"train_loss": -7.1237077713012695, "global_step": 176663, "epoch": 4206} {"train_loss": -7.0614333152771, "global_step": 176664, "epoch": 4206} {"train_loss": -7.147607326507568, "global_step": 176665, "epoch": 4206} {"train_loss": -7.171195030212402, "global_step": 176666, "epoch": 4206} {"train_loss": -6.9522786140441895, "global_step": 176667, "epoch": 4206} {"train_loss": -7.036387920379639, "global_step": 176668, "epoch": 4206} {"train_loss": -7.035525321960449, "global_step": 176669, "epoch": 4206} {"train_loss": -7.097620010375977, "global_step": 176670, "epoch": 4206} {"train_loss": -7.0895490646362305, "global_step": 176671, "epoch": 4206} {"train_loss": -7.095412254333496, "global_step": 176672, "epoch": 4206} {"train_loss": -6.888622760772705, "global_step": 176673, "epoch": 4206} {"train_loss": -7.105563163757324, "global_step": 176674, "epoch": 4206} {"train_loss": -6.955379962921143, "global_step": 176675, "epoch": 4206} {"train_loss": -7.139118671417236, "global_step": 176676, "epoch": 4206} {"train_loss": -6.970155715942383, "global_step": 176677, "epoch": 4206} {"train_loss": -7.103574752807617, "global_step": 176678, "epoch": 4206} {"train_loss": -7.037242889404297, "global_step": 176679, "epoch": 4206} {"train_loss": -6.991924285888672, "global_step": 176680, "epoch": 4206} {"train_loss": -7.095030784606934, "global_step": 176681, "epoch": 4206} {"train_loss": -6.986665725708008, "global_step": 176682, "epoch": 4206} {"train_loss": -7.003271579742432, "global_step": 176683, "epoch": 4206} {"train_loss": -7.047122001647949, "global_step": 176684, "epoch": 4206} {"train_loss": -6.968697547912598, "global_step": 176685, "epoch": 4206} {"train_loss": -7.073247909545898, "global_step": 176686, "epoch": 4206} {"train_loss": -6.900465965270996, "global_step": 176687, "epoch": 4206} {"train_loss": -7.061419486999512, "global_step": 176688, "epoch": 4206} {"train_loss": -7.084963798522949, "global_step": 176689, "epoch": 4206} {"train_loss": -7.130259037017822, "global_step": 176690, "epoch": 4206} {"train_loss": -7.0089240074157715, "global_step": 176691, "epoch": 4206} {"train_loss": -7.065243721008301, "global_step": 176692, "epoch": 4206} {"train_loss": -7.06788892973037, "global_step": 176693, "epoch": 4206, "val_loss": 69229.8515625} {"train_loss": -7.004641532897949, "global_step": 176694, "epoch": 4207} {"train_loss": -7.194301605224609, "global_step": 176695, "epoch": 4207} {"train_loss": -7.154635429382324, "global_step": 176696, "epoch": 4207} {"train_loss": -7.032841682434082, "global_step": 176697, "epoch": 4207} {"train_loss": -7.135961055755615, "global_step": 176698, "epoch": 4207} {"train_loss": -7.045639991760254, "global_step": 176699, "epoch": 4207} {"train_loss": -7.2484283447265625, "global_step": 176700, "epoch": 4207} {"train_loss": -7.138052940368652, "global_step": 176701, "epoch": 4207} {"train_loss": -7.153398513793945, "global_step": 176702, "epoch": 4207} {"train_loss": -7.04793643951416, "global_step": 176703, "epoch": 4207} {"train_loss": -7.147879600524902, "global_step": 176704, "epoch": 4207} {"train_loss": -7.046982765197754, "global_step": 176705, "epoch": 4207} {"train_loss": -7.175011157989502, "global_step": 176706, "epoch": 4207} {"train_loss": -7.068234443664551, "global_step": 176707, "epoch": 4207} {"train_loss": -6.998842239379883, "global_step": 176708, "epoch": 4207} {"train_loss": -7.185928821563721, "global_step": 176709, "epoch": 4207} {"train_loss": -7.139709949493408, "global_step": 176710, "epoch": 4207} {"train_loss": -7.122909069061279, "global_step": 176711, "epoch": 4207} {"train_loss": -7.131213188171387, "global_step": 176712, "epoch": 4207} {"train_loss": -7.11074686050415, "global_step": 176713, "epoch": 4207} {"train_loss": -7.191620826721191, "global_step": 176714, "epoch": 4207} {"train_loss": -7.136703968048096, "global_step": 176715, "epoch": 4207} {"train_loss": -6.971138954162598, "global_step": 176716, "epoch": 4207} {"train_loss": -7.158811569213867, "global_step": 176717, "epoch": 4207} {"train_loss": -7.152316093444824, "global_step": 176718, "epoch": 4207} {"train_loss": -7.019754409790039, "global_step": 176719, "epoch": 4207} {"train_loss": -7.116340160369873, "global_step": 176720, "epoch": 4207} {"train_loss": -6.965235710144043, "global_step": 176721, "epoch": 4207} {"train_loss": -7.036188125610352, "global_step": 176722, "epoch": 4207} {"train_loss": -6.838797569274902, "global_step": 176723, "epoch": 4207} {"train_loss": -7.034982204437256, "global_step": 176724, "epoch": 4207} {"train_loss": -6.985367774963379, "global_step": 176725, "epoch": 4207} {"train_loss": -7.013186931610107, "global_step": 176726, "epoch": 4207} {"train_loss": -7.011700630187988, "global_step": 176727, "epoch": 4207} {"train_loss": -6.757912635803223, "global_step": 176728, "epoch": 4207} {"train_loss": -7.043824672698975, "global_step": 176729, "epoch": 4207} {"train_loss": -7.011541843414307, "global_step": 176730, "epoch": 4207} {"train_loss": -7.038965225219727, "global_step": 176731, "epoch": 4207} {"train_loss": -7.011124610900879, "global_step": 176732, "epoch": 4207} {"train_loss": -6.930190563201904, "global_step": 176733, "epoch": 4207} {"train_loss": -7.021430015563965, "global_step": 176734, "epoch": 4207} {"train_loss": -7.066091934839885, "global_step": 176735, "epoch": 4207, "val_loss": 69217.609375} {"train_loss": -7.162517547607422, "global_step": 176736, "epoch": 4208} {"train_loss": -7.033045768737793, "global_step": 176737, "epoch": 4208} {"train_loss": -7.046885013580322, "global_step": 176738, "epoch": 4208} {"train_loss": -7.028811454772949, "global_step": 176739, "epoch": 4208} {"train_loss": -6.989227294921875, "global_step": 176740, "epoch": 4208} {"train_loss": -7.102450370788574, "global_step": 176741, "epoch": 4208} {"train_loss": -7.139124870300293, "global_step": 176742, "epoch": 4208} {"train_loss": -7.1270270347595215, "global_step": 176743, "epoch": 4208} {"train_loss": -7.113352298736572, "global_step": 176744, "epoch": 4208} {"train_loss": -7.088458061218262, "global_step": 176745, "epoch": 4208} {"train_loss": -7.128300189971924, "global_step": 176746, "epoch": 4208} {"train_loss": -7.079914569854736, "global_step": 176747, "epoch": 4208} {"train_loss": -7.032145023345947, "global_step": 176748, "epoch": 4208} {"train_loss": -7.127370834350586, "global_step": 176749, "epoch": 4208} {"train_loss": -7.037830829620361, "global_step": 176750, "epoch": 4208} {"train_loss": -7.195647716522217, "global_step": 176751, "epoch": 4208} {"train_loss": -7.187555313110352, "global_step": 176752, "epoch": 4208} {"train_loss": -7.14054012298584, "global_step": 176753, "epoch": 4208} {"train_loss": -6.976345062255859, "global_step": 176754, "epoch": 4208} {"train_loss": -7.119916915893555, "global_step": 176755, "epoch": 4208} {"train_loss": -6.96852445602417, "global_step": 176756, "epoch": 4208} {"train_loss": -6.726595878601074, "global_step": 176757, "epoch": 4208} {"train_loss": -6.986418724060059, "global_step": 176758, "epoch": 4208} {"train_loss": -7.167885780334473, "global_step": 176759, "epoch": 4208} {"train_loss": -6.931443691253662, "global_step": 176760, "epoch": 4208} {"train_loss": -7.0157880783081055, "global_step": 176761, "epoch": 4208} {"train_loss": -6.934684753417969, "global_step": 176762, "epoch": 4208} {"train_loss": -6.971898078918457, "global_step": 176763, "epoch": 4208} {"train_loss": -7.003655433654785, "global_step": 176764, "epoch": 4208} {"train_loss": -6.890176773071289, "global_step": 176765, "epoch": 4208} {"train_loss": -6.917259693145752, "global_step": 176766, "epoch": 4208} {"train_loss": -6.978057861328125, "global_step": 176767, "epoch": 4208} {"train_loss": -7.046644687652588, "global_step": 176768, "epoch": 4208} {"train_loss": -7.035524845123291, "global_step": 176769, "epoch": 4208} {"train_loss": -6.996502876281738, "global_step": 176770, "epoch": 4208} {"train_loss": -6.969231605529785, "global_step": 176771, "epoch": 4208} {"train_loss": -7.028413772583008, "global_step": 176772, "epoch": 4208} {"train_loss": -7.095131874084473, "global_step": 176773, "epoch": 4208} {"train_loss": -6.988835334777832, "global_step": 176774, "epoch": 4208} {"train_loss": -6.997834205627441, "global_step": 176775, "epoch": 4208} {"train_loss": -6.961338996887207, "global_step": 176776, "epoch": 4208} {"train_loss": -7.034872827075777, "global_step": 176777, "epoch": 4208, "val_loss": 69236.3671875} {"train_loss": -7.0371317863464355, "global_step": 176778, "epoch": 4209} {"train_loss": -7.0875630378723145, "global_step": 176779, "epoch": 4209} {"train_loss": -7.027884006500244, "global_step": 176780, "epoch": 4209} {"train_loss": -7.035041809082031, "global_step": 176781, "epoch": 4209} {"train_loss": -7.081780433654785, "global_step": 176782, "epoch": 4209} {"train_loss": -6.99207878112793, "global_step": 176783, "epoch": 4209} {"train_loss": -6.970346450805664, "global_step": 176784, "epoch": 4209} {"train_loss": -7.066229820251465, "global_step": 176785, "epoch": 4209} {"train_loss": -7.064138412475586, "global_step": 176786, "epoch": 4209} {"train_loss": -6.9808454513549805, "global_step": 176787, "epoch": 4209} {"train_loss": -7.012372970581055, "global_step": 176788, "epoch": 4209} {"train_loss": -6.961884498596191, "global_step": 176789, "epoch": 4209} {"train_loss": -7.055697917938232, "global_step": 176790, "epoch": 4209} {"train_loss": -6.964128494262695, "global_step": 176791, "epoch": 4209} {"train_loss": -7.050626754760742, "global_step": 176792, "epoch": 4209} {"train_loss": -7.138503551483154, "global_step": 176793, "epoch": 4209} {"train_loss": -7.030311584472656, "global_step": 176794, "epoch": 4209} {"train_loss": -7.012657165527344, "global_step": 176795, "epoch": 4209} {"train_loss": -6.966458320617676, "global_step": 176796, "epoch": 4209} {"train_loss": -7.060120105743408, "global_step": 176797, "epoch": 4209} {"train_loss": -7.046455383300781, "global_step": 176798, "epoch": 4209} {"train_loss": -7.02669620513916, "global_step": 176799, "epoch": 4209} {"train_loss": -6.992580413818359, "global_step": 176800, "epoch": 4209} {"train_loss": -7.010006904602051, "global_step": 176801, "epoch": 4209} {"train_loss": -7.093792915344238, "global_step": 176802, "epoch": 4209} {"train_loss": -7.02766227722168, "global_step": 176803, "epoch": 4209} {"train_loss": -7.117685794830322, "global_step": 176804, "epoch": 4209} {"train_loss": -7.222704887390137, "global_step": 176805, "epoch": 4209} {"train_loss": -7.103097438812256, "global_step": 176806, "epoch": 4209} {"train_loss": -7.086248397827148, "global_step": 176807, "epoch": 4209} {"train_loss": -7.049373149871826, "global_step": 176808, "epoch": 4209} {"train_loss": -7.085569381713867, "global_step": 176809, "epoch": 4209} {"train_loss": -7.105240821838379, "global_step": 176810, "epoch": 4209} {"train_loss": -7.1255903244018555, "global_step": 176811, "epoch": 4209} {"train_loss": -7.042365550994873, "global_step": 176812, "epoch": 4209} {"train_loss": -7.17617654800415, "global_step": 176813, "epoch": 4209} {"train_loss": -7.062119960784912, "global_step": 176814, "epoch": 4209} {"train_loss": -7.0659403800964355, "global_step": 176815, "epoch": 4209} {"train_loss": -7.159303665161133, "global_step": 176816, "epoch": 4209} {"train_loss": -7.152971267700195, "global_step": 176817, "epoch": 4209} {"train_loss": -7.1236371994018555, "global_step": 176818, "epoch": 4209} {"train_loss": -7.062128918511527, "global_step": 176819, "epoch": 4209, "val_loss": 69131.8515625} {"train_loss": -7.132844924926758, "global_step": 176820, "epoch": 4210} {"train_loss": -7.0661725997924805, "global_step": 176821, "epoch": 4210} {"train_loss": -7.180042266845703, "global_step": 176822, "epoch": 4210} {"train_loss": -7.102513313293457, "global_step": 176823, "epoch": 4210} {"train_loss": -7.0903544425964355, "global_step": 176824, "epoch": 4210} {"train_loss": -7.307037353515625, "global_step": 176825, "epoch": 4210} {"train_loss": -7.197325706481934, "global_step": 176826, "epoch": 4210} {"train_loss": -7.163376808166504, "global_step": 176827, "epoch": 4210} {"train_loss": -7.100939750671387, "global_step": 176828, "epoch": 4210} {"train_loss": -7.073306560516357, "global_step": 176829, "epoch": 4210} {"train_loss": -7.084634780883789, "global_step": 176830, "epoch": 4210} {"train_loss": -7.087945938110352, "global_step": 176831, "epoch": 4210} {"train_loss": -7.114794731140137, "global_step": 176832, "epoch": 4210} {"train_loss": -7.1182541847229, "global_step": 176833, "epoch": 4210} {"train_loss": -7.154709339141846, "global_step": 176834, "epoch": 4210} {"train_loss": -7.123266696929932, "global_step": 176835, "epoch": 4210} {"train_loss": -7.16464900970459, "global_step": 176836, "epoch": 4210} {"train_loss": -7.146575927734375, "global_step": 176837, "epoch": 4210} {"train_loss": -7.107836723327637, "global_step": 176838, "epoch": 4210} {"train_loss": -7.14323091506958, "global_step": 176839, "epoch": 4210} {"train_loss": -7.037538528442383, "global_step": 176840, "epoch": 4210} {"train_loss": -7.02012300491333, "global_step": 176841, "epoch": 4210} {"train_loss": -7.105096340179443, "global_step": 176842, "epoch": 4210} {"train_loss": -7.051491737365723, "global_step": 176843, "epoch": 4210} {"train_loss": -7.092499256134033, "global_step": 176844, "epoch": 4210} {"train_loss": -7.012580871582031, "global_step": 176845, "epoch": 4210} {"train_loss": -7.058528900146484, "global_step": 176846, "epoch": 4210} {"train_loss": -6.9930830001831055, "global_step": 176847, "epoch": 4210} {"train_loss": -7.100536346435547, "global_step": 176848, "epoch": 4210} {"train_loss": -7.1365580558776855, "global_step": 176849, "epoch": 4210} {"train_loss": -7.119257926940918, "global_step": 176850, "epoch": 4210} {"train_loss": -7.173460960388184, "global_step": 176851, "epoch": 4210} {"train_loss": -7.103669166564941, "global_step": 176852, "epoch": 4210} {"train_loss": -7.160877227783203, "global_step": 176853, "epoch": 4210} {"train_loss": -7.046578407287598, "global_step": 176854, "epoch": 4210} {"train_loss": -7.110978126525879, "global_step": 176855, "epoch": 4210} {"train_loss": -6.993022918701172, "global_step": 176856, "epoch": 4210} {"train_loss": -7.089603424072266, "global_step": 176857, "epoch": 4210} {"train_loss": -7.078169822692871, "global_step": 176858, "epoch": 4210} {"train_loss": -7.126316070556641, "global_step": 176859, "epoch": 4210} {"train_loss": -7.178659439086914, "global_step": 176860, "epoch": 4210} {"train_loss": -7.109628393536522, "global_step": 176861, "epoch": 4210, "val_loss": 69105.7265625} {"train_loss": -7.150503635406494, "global_step": 176862, "epoch": 4211} {"train_loss": -7.130857467651367, "global_step": 176863, "epoch": 4211} {"train_loss": -7.134889602661133, "global_step": 176864, "epoch": 4211} {"train_loss": -7.01482629776001, "global_step": 176865, "epoch": 4211} {"train_loss": -7.066364288330078, "global_step": 176866, "epoch": 4211} {"train_loss": -6.958776473999023, "global_step": 176867, "epoch": 4211} {"train_loss": -7.157917022705078, "global_step": 176868, "epoch": 4211} {"train_loss": -7.1017165184021, "global_step": 176869, "epoch": 4211} {"train_loss": -7.010814666748047, "global_step": 176870, "epoch": 4211} {"train_loss": -7.051641941070557, "global_step": 176871, "epoch": 4211} {"train_loss": -6.951693534851074, "global_step": 176872, "epoch": 4211} {"train_loss": -7.135441303253174, "global_step": 176873, "epoch": 4211} {"train_loss": -7.118479251861572, "global_step": 176874, "epoch": 4211} {"train_loss": -6.891971588134766, "global_step": 176875, "epoch": 4211} {"train_loss": -6.99488639831543, "global_step": 176876, "epoch": 4211} {"train_loss": -6.987024784088135, "global_step": 176877, "epoch": 4211} {"train_loss": -6.96641731262207, "global_step": 176878, "epoch": 4211} {"train_loss": -7.137165546417236, "global_step": 176879, "epoch": 4211} {"train_loss": -6.966520309448242, "global_step": 176880, "epoch": 4211} {"train_loss": -7.1381330490112305, "global_step": 176881, "epoch": 4211} {"train_loss": -7.078731060028076, "global_step": 176882, "epoch": 4211} {"train_loss": -6.919471263885498, "global_step": 176883, "epoch": 4211} {"train_loss": -7.097908973693848, "global_step": 176884, "epoch": 4211} {"train_loss": -7.030307769775391, "global_step": 176885, "epoch": 4211} {"train_loss": -6.993236064910889, "global_step": 176886, "epoch": 4211} {"train_loss": -7.1055426597595215, "global_step": 176887, "epoch": 4211} {"train_loss": -7.028231620788574, "global_step": 176888, "epoch": 4211} {"train_loss": -7.033910751342773, "global_step": 176889, "epoch": 4211} {"train_loss": -7.1020379066467285, "global_step": 176890, "epoch": 4211} {"train_loss": -7.074501037597656, "global_step": 176891, "epoch": 4211} {"train_loss": -6.97928524017334, "global_step": 176892, "epoch": 4211} {"train_loss": -7.14859676361084, "global_step": 176893, "epoch": 4211} {"train_loss": -6.992729187011719, "global_step": 176894, "epoch": 4211} {"train_loss": -7.027375221252441, "global_step": 176895, "epoch": 4211} {"train_loss": -7.103058338165283, "global_step": 176896, "epoch": 4211} {"train_loss": -7.127508163452148, "global_step": 176897, "epoch": 4211} {"train_loss": -7.175334930419922, "global_step": 176898, "epoch": 4211} {"train_loss": -7.033935546875, "global_step": 176899, "epoch": 4211} {"train_loss": -7.123631477355957, "global_step": 176900, "epoch": 4211} {"train_loss": -7.217028617858887, "global_step": 176901, "epoch": 4211} {"train_loss": -7.1347150802612305, "global_step": 176902, "epoch": 4211} {"train_loss": -7.064441045125325, "global_step": 176903, "epoch": 4211, "val_loss": 69061.71875} {"train_loss": -7.062127113342285, "global_step": 176904, "epoch": 4212} {"train_loss": -7.121163368225098, "global_step": 176905, "epoch": 4212} {"train_loss": -7.119360446929932, "global_step": 176906, "epoch": 4212} {"train_loss": -7.053714752197266, "global_step": 176907, "epoch": 4212} {"train_loss": -7.009580612182617, "global_step": 176908, "epoch": 4212} {"train_loss": -7.112441062927246, "global_step": 176909, "epoch": 4212} {"train_loss": -7.112588882446289, "global_step": 176910, "epoch": 4212} {"train_loss": -7.0766425132751465, "global_step": 176911, "epoch": 4212} {"train_loss": -7.128120422363281, "global_step": 176912, "epoch": 4212} {"train_loss": -6.976005554199219, "global_step": 176913, "epoch": 4212} {"train_loss": -7.092777252197266, "global_step": 176914, "epoch": 4212} {"train_loss": -6.989005088806152, "global_step": 176915, "epoch": 4212} {"train_loss": -7.002185344696045, "global_step": 176916, "epoch": 4212} {"train_loss": -7.122310638427734, "global_step": 176917, "epoch": 4212} {"train_loss": -7.028305530548096, "global_step": 176918, "epoch": 4212} {"train_loss": -7.138217926025391, "global_step": 176919, "epoch": 4212} {"train_loss": -6.939569473266602, "global_step": 176920, "epoch": 4212} {"train_loss": -7.02293586730957, "global_step": 176921, "epoch": 4212} {"train_loss": -6.864531517028809, "global_step": 176922, "epoch": 4212} {"train_loss": -6.91765022277832, "global_step": 176923, "epoch": 4212} {"train_loss": -6.921361446380615, "global_step": 176924, "epoch": 4212} {"train_loss": -6.978215217590332, "global_step": 176925, "epoch": 4212} {"train_loss": -7.0003275871276855, "global_step": 176926, "epoch": 4212} {"train_loss": -6.908341407775879, "global_step": 176927, "epoch": 4212} {"train_loss": -7.064943790435791, "global_step": 176928, "epoch": 4212} {"train_loss": -6.871305465698242, "global_step": 176929, "epoch": 4212} {"train_loss": -7.090457916259766, "global_step": 176930, "epoch": 4212} {"train_loss": -7.00894832611084, "global_step": 176931, "epoch": 4212} {"train_loss": -7.106961250305176, "global_step": 176932, "epoch": 4212} {"train_loss": -7.163023948669434, "global_step": 176933, "epoch": 4212} {"train_loss": -7.091975212097168, "global_step": 176934, "epoch": 4212} {"train_loss": -7.116397857666016, "global_step": 176935, "epoch": 4212} {"train_loss": -7.0583977699279785, "global_step": 176936, "epoch": 4212} {"train_loss": -7.034305095672607, "global_step": 176937, "epoch": 4212} {"train_loss": -7.0769171714782715, "global_step": 176938, "epoch": 4212} {"train_loss": -6.979758262634277, "global_step": 176939, "epoch": 4212} {"train_loss": -7.033177852630615, "global_step": 176940, "epoch": 4212} {"train_loss": -7.105410099029541, "global_step": 176941, "epoch": 4212} {"train_loss": -7.0541672706604, "global_step": 176942, "epoch": 4212} {"train_loss": -7.061916351318359, "global_step": 176943, "epoch": 4212} {"train_loss": -7.093752384185791, "global_step": 176944, "epoch": 4212} {"train_loss": -7.041515543347313, "global_step": 176945, "epoch": 4212, "val_loss": 69137.7890625} {"train_loss": -7.06895637512207, "global_step": 176946, "epoch": 4213} {"train_loss": -7.203516006469727, "global_step": 176947, "epoch": 4213} {"train_loss": -7.123802661895752, "global_step": 176948, "epoch": 4213} {"train_loss": -7.064014434814453, "global_step": 176949, "epoch": 4213} {"train_loss": -7.145045280456543, "global_step": 176950, "epoch": 4213} {"train_loss": -7.220322608947754, "global_step": 176951, "epoch": 4213} {"train_loss": -7.0673980712890625, "global_step": 176952, "epoch": 4213} {"train_loss": -7.107160568237305, "global_step": 176953, "epoch": 4213} {"train_loss": -7.175004959106445, "global_step": 176954, "epoch": 4213} {"train_loss": -7.169822692871094, "global_step": 176955, "epoch": 4213} {"train_loss": -7.0728535652160645, "global_step": 176956, "epoch": 4213} {"train_loss": -7.033085823059082, "global_step": 176957, "epoch": 4213} {"train_loss": -7.194714546203613, "global_step": 176958, "epoch": 4213} {"train_loss": -7.17459774017334, "global_step": 176959, "epoch": 4213} {"train_loss": -7.186844348907471, "global_step": 176960, "epoch": 4213} {"train_loss": -7.123438835144043, "global_step": 176961, "epoch": 4213} {"train_loss": -7.04151725769043, "global_step": 176962, "epoch": 4213} {"train_loss": -7.162995338439941, "global_step": 176963, "epoch": 4213} {"train_loss": -7.078426361083984, "global_step": 176964, "epoch": 4213} {"train_loss": -7.025260925292969, "global_step": 176965, "epoch": 4213} {"train_loss": -7.15771484375, "global_step": 176966, "epoch": 4213} {"train_loss": -7.063201904296875, "global_step": 176967, "epoch": 4213} {"train_loss": -7.078861236572266, "global_step": 176968, "epoch": 4213} {"train_loss": -7.065404891967773, "global_step": 176969, "epoch": 4213} {"train_loss": -7.136451721191406, "global_step": 176970, "epoch": 4213} {"train_loss": -7.061736106872559, "global_step": 176971, "epoch": 4213} {"train_loss": -6.987248420715332, "global_step": 176972, "epoch": 4213} {"train_loss": -7.080963134765625, "global_step": 176973, "epoch": 4213} {"train_loss": -7.078296661376953, "global_step": 176974, "epoch": 4213} {"train_loss": -7.138154029846191, "global_step": 176975, "epoch": 4213} {"train_loss": -7.123563766479492, "global_step": 176976, "epoch": 4213} {"train_loss": -7.098888874053955, "global_step": 176977, "epoch": 4213} {"train_loss": -7.14012336730957, "global_step": 176978, "epoch": 4213} {"train_loss": -7.176371097564697, "global_step": 176979, "epoch": 4213} {"train_loss": -7.128610134124756, "global_step": 176980, "epoch": 4213} {"train_loss": -7.2060747146606445, "global_step": 176981, "epoch": 4213} {"train_loss": -7.105870246887207, "global_step": 176982, "epoch": 4213} {"train_loss": -7.1264824867248535, "global_step": 176983, "epoch": 4213} {"train_loss": -7.1346940994262695, "global_step": 176984, "epoch": 4213} {"train_loss": -7.087037086486816, "global_step": 176985, "epoch": 4213} {"train_loss": -7.193483352661133, "global_step": 176986, "epoch": 4213} {"train_loss": -7.11543793905349, "global_step": 176987, "epoch": 4213, "val_loss": 69169.625} {"train_loss": -7.120839595794678, "global_step": 176988, "epoch": 4214} {"train_loss": -7.092257499694824, "global_step": 176989, "epoch": 4214} {"train_loss": -7.200492858886719, "global_step": 176990, "epoch": 4214} {"train_loss": -7.08890438079834, "global_step": 176991, "epoch": 4214} {"train_loss": -7.15897798538208, "global_step": 176992, "epoch": 4214} {"train_loss": -7.002184867858887, "global_step": 176993, "epoch": 4214} {"train_loss": -7.103946208953857, "global_step": 176994, "epoch": 4214} {"train_loss": -7.181386947631836, "global_step": 176995, "epoch": 4214} {"train_loss": -7.090104103088379, "global_step": 176996, "epoch": 4214} {"train_loss": -7.001958847045898, "global_step": 176997, "epoch": 4214} {"train_loss": -7.059196472167969, "global_step": 176998, "epoch": 4214} {"train_loss": -7.139094352722168, "global_step": 176999, "epoch": 4214} {"train_loss": -6.993085861206055, "global_step": 177000, "epoch": 4214} {"train_loss": -7.107230186462402, "global_step": 177001, "epoch": 4214} {"train_loss": -7.025886058807373, "global_step": 177002, "epoch": 4214} {"train_loss": -7.048440456390381, "global_step": 177003, "epoch": 4214} {"train_loss": -7.085458755493164, "global_step": 177004, "epoch": 4214} {"train_loss": -7.147219657897949, "global_step": 177005, "epoch": 4214} {"train_loss": -7.020839691162109, "global_step": 177006, "epoch": 4214} {"train_loss": -7.121817111968994, "global_step": 177007, "epoch": 4214} {"train_loss": -6.979537010192871, "global_step": 177008, "epoch": 4214} {"train_loss": -6.948333740234375, "global_step": 177009, "epoch": 4214} {"train_loss": -7.024530410766602, "global_step": 177010, "epoch": 4214} {"train_loss": -6.8749871253967285, "global_step": 177011, "epoch": 4214} {"train_loss": -7.046998977661133, "global_step": 177012, "epoch": 4214} {"train_loss": -7.113456726074219, "global_step": 177013, "epoch": 4214} {"train_loss": -6.8839616775512695, "global_step": 177014, "epoch": 4214} {"train_loss": -7.118873596191406, "global_step": 177015, "epoch": 4214} {"train_loss": -6.992419242858887, "global_step": 177016, "epoch": 4214} {"train_loss": -7.029520511627197, "global_step": 177017, "epoch": 4214} {"train_loss": -7.0149688720703125, "global_step": 177018, "epoch": 4214} {"train_loss": -6.991480827331543, "global_step": 177019, "epoch": 4214} {"train_loss": -7.113146781921387, "global_step": 177020, "epoch": 4214} {"train_loss": -7.092798233032227, "global_step": 177021, "epoch": 4214} {"train_loss": -7.0870137214660645, "global_step": 177022, "epoch": 4214} {"train_loss": -7.078141689300537, "global_step": 177023, "epoch": 4214} {"train_loss": -7.099996089935303, "global_step": 177024, "epoch": 4214} {"train_loss": -7.0725226402282715, "global_step": 177025, "epoch": 4214} {"train_loss": -7.070110321044922, "global_step": 177026, "epoch": 4214} {"train_loss": -7.159290313720703, "global_step": 177027, "epoch": 4214} {"train_loss": -7.080775260925293, "global_step": 177028, "epoch": 4214} {"train_loss": -7.0665702138628275, "global_step": 177029, "epoch": 4214, "val_loss": 69205.4140625} {"train_loss": -7.1724467277526855, "global_step": 177030, "epoch": 4215} {"train_loss": -7.1294355392456055, "global_step": 177031, "epoch": 4215} {"train_loss": -7.158062934875488, "global_step": 177032, "epoch": 4215} {"train_loss": -7.09968376159668, "global_step": 177033, "epoch": 4215} {"train_loss": -7.190960884094238, "global_step": 177034, "epoch": 4215} {"train_loss": -7.2311859130859375, "global_step": 177035, "epoch": 4215} {"train_loss": -7.105310916900635, "global_step": 177036, "epoch": 4215} {"train_loss": -7.0895843505859375, "global_step": 177037, "epoch": 4215} {"train_loss": -7.1352691650390625, "global_step": 177038, "epoch": 4215} {"train_loss": -7.10893440246582, "global_step": 177039, "epoch": 4215} {"train_loss": -7.117374897003174, "global_step": 177040, "epoch": 4215} {"train_loss": -7.137617111206055, "global_step": 177041, "epoch": 4215} {"train_loss": -7.114558219909668, "global_step": 177042, "epoch": 4215} {"train_loss": -7.1466898918151855, "global_step": 177043, "epoch": 4215} {"train_loss": -7.110870838165283, "global_step": 177044, "epoch": 4215} {"train_loss": -7.196941375732422, "global_step": 177045, "epoch": 4215} {"train_loss": -7.113046646118164, "global_step": 177046, "epoch": 4215} {"train_loss": -6.990780830383301, "global_step": 177047, "epoch": 4215} {"train_loss": -7.159010887145996, "global_step": 177048, "epoch": 4215} {"train_loss": -7.060640811920166, "global_step": 177049, "epoch": 4215} {"train_loss": -6.830196380615234, "global_step": 177050, "epoch": 4215} {"train_loss": -7.00404691696167, "global_step": 177051, "epoch": 4215} {"train_loss": -7.118744850158691, "global_step": 177052, "epoch": 4215} {"train_loss": -6.8446784019470215, "global_step": 177053, "epoch": 4215} {"train_loss": -6.975151538848877, "global_step": 177054, "epoch": 4215} {"train_loss": -6.870905876159668, "global_step": 177055, "epoch": 4215} {"train_loss": -6.843889236450195, "global_step": 177056, "epoch": 4215} {"train_loss": -6.999186038970947, "global_step": 177057, "epoch": 4215} {"train_loss": -6.941332817077637, "global_step": 177058, "epoch": 4215} {"train_loss": -6.8737335205078125, "global_step": 177059, "epoch": 4215} {"train_loss": -7.031188011169434, "global_step": 177060, "epoch": 4215} {"train_loss": -6.841707229614258, "global_step": 177061, "epoch": 4215} {"train_loss": -6.929914474487305, "global_step": 177062, "epoch": 4215} {"train_loss": -7.104338645935059, "global_step": 177063, "epoch": 4215} {"train_loss": -7.0521345138549805, "global_step": 177064, "epoch": 4215} {"train_loss": -7.003336429595947, "global_step": 177065, "epoch": 4215} {"train_loss": -7.057493686676025, "global_step": 177066, "epoch": 4215} {"train_loss": -6.971407890319824, "global_step": 177067, "epoch": 4215} {"train_loss": -7.106391429901123, "global_step": 177068, "epoch": 4215} {"train_loss": -7.157365798950195, "global_step": 177069, "epoch": 4215} {"train_loss": -7.065499782562256, "global_step": 177070, "epoch": 4215} {"train_loss": -7.052873736336117, "global_step": 177071, "epoch": 4215, "val_loss": 69077.84375} {"train_loss": -7.074523448944092, "global_step": 177072, "epoch": 4216} {"train_loss": -7.092824935913086, "global_step": 177073, "epoch": 4216} {"train_loss": -7.038724422454834, "global_step": 177074, "epoch": 4216} {"train_loss": -7.199251651763916, "global_step": 177075, "epoch": 4216} {"train_loss": -7.145359516143799, "global_step": 177076, "epoch": 4216} {"train_loss": -7.0744547843933105, "global_step": 177077, "epoch": 4216} {"train_loss": -7.203501224517822, "global_step": 177078, "epoch": 4216} {"train_loss": -7.160489082336426, "global_step": 177079, "epoch": 4216} {"train_loss": -7.1292829513549805, "global_step": 177080, "epoch": 4216} {"train_loss": -7.134688854217529, "global_step": 177081, "epoch": 4216} {"train_loss": -7.000356674194336, "global_step": 177082, "epoch": 4216} {"train_loss": -7.131577968597412, "global_step": 177083, "epoch": 4216} {"train_loss": -7.063724040985107, "global_step": 177084, "epoch": 4216} {"train_loss": -7.130778789520264, "global_step": 177085, "epoch": 4216} {"train_loss": -7.14110803604126, "global_step": 177086, "epoch": 4216} {"train_loss": -7.187506198883057, "global_step": 177087, "epoch": 4216} {"train_loss": -7.205531597137451, "global_step": 177088, "epoch": 4216} {"train_loss": -7.259373664855957, "global_step": 177089, "epoch": 4216} {"train_loss": -7.147306442260742, "global_step": 177090, "epoch": 4216} {"train_loss": -7.141047954559326, "global_step": 177091, "epoch": 4216} {"train_loss": -7.188080787658691, "global_step": 177092, "epoch": 4216} {"train_loss": -7.181081771850586, "global_step": 177093, "epoch": 4216} {"train_loss": -7.039053916931152, "global_step": 177094, "epoch": 4216} {"train_loss": -6.957004070281982, "global_step": 177095, "epoch": 4216} {"train_loss": -7.165496826171875, "global_step": 177096, "epoch": 4216} {"train_loss": -7.051477909088135, "global_step": 177097, "epoch": 4216} {"train_loss": -7.084724426269531, "global_step": 177098, "epoch": 4216} {"train_loss": -7.264806747436523, "global_step": 177099, "epoch": 4216} {"train_loss": -7.112404823303223, "global_step": 177100, "epoch": 4216} {"train_loss": -7.0949201583862305, "global_step": 177101, "epoch": 4216} {"train_loss": -7.237384796142578, "global_step": 177102, "epoch": 4216} {"train_loss": -7.118639945983887, "global_step": 177103, "epoch": 4216} {"train_loss": -7.095405578613281, "global_step": 177104, "epoch": 4216} {"train_loss": -7.139919281005859, "global_step": 177105, "epoch": 4216} {"train_loss": -7.073174953460693, "global_step": 177106, "epoch": 4216} {"train_loss": -7.073614120483398, "global_step": 177107, "epoch": 4216} {"train_loss": -7.248117446899414, "global_step": 177108, "epoch": 4216} {"train_loss": -7.043791770935059, "global_step": 177109, "epoch": 4216} {"train_loss": -7.056442737579346, "global_step": 177110, "epoch": 4216} {"train_loss": -7.001001834869385, "global_step": 177111, "epoch": 4216} {"train_loss": -7.124589920043945, "global_step": 177112, "epoch": 4216} {"train_loss": -7.120094469615391, "global_step": 177113, "epoch": 4216, "val_loss": 69257.21875} {"train_loss": -7.0400543212890625, "global_step": 177114, "epoch": 4217} {"train_loss": -7.09967041015625, "global_step": 177115, "epoch": 4217} {"train_loss": -7.107562065124512, "global_step": 177116, "epoch": 4217} {"train_loss": -7.120370864868164, "global_step": 177117, "epoch": 4217} {"train_loss": -7.191195487976074, "global_step": 177118, "epoch": 4217} {"train_loss": -7.08031702041626, "global_step": 177119, "epoch": 4217} {"train_loss": -7.002986907958984, "global_step": 177120, "epoch": 4217} {"train_loss": -7.035242080688477, "global_step": 177121, "epoch": 4217} {"train_loss": -7.055478096008301, "global_step": 177122, "epoch": 4217} {"train_loss": -7.121851921081543, "global_step": 177123, "epoch": 4217} {"train_loss": -7.008873462677002, "global_step": 177124, "epoch": 4217} {"train_loss": -7.071905136108398, "global_step": 177125, "epoch": 4217} {"train_loss": -6.972094535827637, "global_step": 177126, "epoch": 4217} {"train_loss": -7.0251641273498535, "global_step": 177127, "epoch": 4217} {"train_loss": -7.095170021057129, "global_step": 177128, "epoch": 4217} {"train_loss": -7.036444664001465, "global_step": 177129, "epoch": 4217} {"train_loss": -7.113845348358154, "global_step": 177130, "epoch": 4217} {"train_loss": -7.133134365081787, "global_step": 177131, "epoch": 4217} {"train_loss": -7.068789958953857, "global_step": 177132, "epoch": 4217} {"train_loss": -7.185938358306885, "global_step": 177133, "epoch": 4217} {"train_loss": -7.003419399261475, "global_step": 177134, "epoch": 4217} {"train_loss": -7.080810546875, "global_step": 177135, "epoch": 4217} {"train_loss": -7.096210956573486, "global_step": 177136, "epoch": 4217} {"train_loss": -7.02786111831665, "global_step": 177137, "epoch": 4217} {"train_loss": -7.16506290435791, "global_step": 177138, "epoch": 4217} {"train_loss": -7.148614883422852, "global_step": 177139, "epoch": 4217} {"train_loss": -7.0779924392700195, "global_step": 177140, "epoch": 4217} {"train_loss": -7.100004196166992, "global_step": 177141, "epoch": 4217} {"train_loss": -7.134256362915039, "global_step": 177142, "epoch": 4217} {"train_loss": -7.137472629547119, "global_step": 177143, "epoch": 4217} {"train_loss": -7.190133571624756, "global_step": 177144, "epoch": 4217} {"train_loss": -7.266842842102051, "global_step": 177145, "epoch": 4217} {"train_loss": -7.161361217498779, "global_step": 177146, "epoch": 4217} {"train_loss": -7.137542724609375, "global_step": 177147, "epoch": 4217} {"train_loss": -7.16149377822876, "global_step": 177148, "epoch": 4217} {"train_loss": -7.137033462524414, "global_step": 177149, "epoch": 4217} {"train_loss": -7.198807716369629, "global_step": 177150, "epoch": 4217} {"train_loss": -7.157018661499023, "global_step": 177151, "epoch": 4217} {"train_loss": -7.02700662612915, "global_step": 177152, "epoch": 4217} {"train_loss": -7.140525817871094, "global_step": 177153, "epoch": 4217} {"train_loss": -7.11958646774292, "global_step": 177154, "epoch": 4217} {"train_loss": -7.102716173444476, "global_step": 177155, "epoch": 4217, "val_loss": 69528.953125} {"train_loss": -6.9030985832214355, "global_step": 177156, "epoch": 4218} {"train_loss": -7.149336338043213, "global_step": 177157, "epoch": 4218} {"train_loss": -7.17147159576416, "global_step": 177158, "epoch": 4218} {"train_loss": -6.975233554840088, "global_step": 177159, "epoch": 4218} {"train_loss": -7.163427352905273, "global_step": 177160, "epoch": 4218} {"train_loss": -7.240188121795654, "global_step": 177161, "epoch": 4218} {"train_loss": -7.103878021240234, "global_step": 177162, "epoch": 4218} {"train_loss": -7.124905586242676, "global_step": 177163, "epoch": 4218} {"train_loss": -7.111494064331055, "global_step": 177164, "epoch": 4218} {"train_loss": -7.135581970214844, "global_step": 177165, "epoch": 4218} {"train_loss": -7.093104362487793, "global_step": 177166, "epoch": 4218} {"train_loss": -7.049615859985352, "global_step": 177167, "epoch": 4218} {"train_loss": -7.06325626373291, "global_step": 177168, "epoch": 4218} {"train_loss": -7.195263862609863, "global_step": 177169, "epoch": 4218} {"train_loss": -7.061104774475098, "global_step": 177170, "epoch": 4218} {"train_loss": -7.154967308044434, "global_step": 177171, "epoch": 4218} {"train_loss": -7.050220489501953, "global_step": 177172, "epoch": 4218} {"train_loss": -7.1530303955078125, "global_step": 177173, "epoch": 4218} {"train_loss": -7.0327301025390625, "global_step": 177174, "epoch": 4218} {"train_loss": -7.0935282707214355, "global_step": 177175, "epoch": 4218} {"train_loss": -7.096945762634277, "global_step": 177176, "epoch": 4218} {"train_loss": -7.1395111083984375, "global_step": 177177, "epoch": 4218} {"train_loss": -7.064129829406738, "global_step": 177178, "epoch": 4218} {"train_loss": -7.095241546630859, "global_step": 177179, "epoch": 4218} {"train_loss": -6.958512306213379, "global_step": 177180, "epoch": 4218} {"train_loss": -6.929594039916992, "global_step": 177181, "epoch": 4218} {"train_loss": -7.010435581207275, "global_step": 177182, "epoch": 4218} {"train_loss": -7.0066304206848145, "global_step": 177183, "epoch": 4218} {"train_loss": -6.931014060974121, "global_step": 177184, "epoch": 4218} {"train_loss": -7.055610656738281, "global_step": 177185, "epoch": 4218} {"train_loss": -6.917300224304199, "global_step": 177186, "epoch": 4218} {"train_loss": -7.020408630371094, "global_step": 177187, "epoch": 4218} {"train_loss": -6.985517501831055, "global_step": 177188, "epoch": 4218} {"train_loss": -6.8612284660339355, "global_step": 177189, "epoch": 4218} {"train_loss": -7.020352840423584, "global_step": 177190, "epoch": 4218} {"train_loss": -6.827446937561035, "global_step": 177191, "epoch": 4218} {"train_loss": -7.106484413146973, "global_step": 177192, "epoch": 4218} {"train_loss": -6.929624557495117, "global_step": 177193, "epoch": 4218} {"train_loss": -6.951303958892822, "global_step": 177194, "epoch": 4218} {"train_loss": -7.027478218078613, "global_step": 177195, "epoch": 4218} {"train_loss": -6.991093158721924, "global_step": 177196, "epoch": 4218} {"train_loss": -7.045643488566081, "global_step": 177197, "epoch": 4218, "val_loss": 69197.796875} {"train_loss": -7.012637615203857, "global_step": 177198, "epoch": 4219} {"train_loss": -6.942074775695801, "global_step": 177199, "epoch": 4219} {"train_loss": -7.1098480224609375, "global_step": 177200, "epoch": 4219} {"train_loss": -7.013430595397949, "global_step": 177201, "epoch": 4219} {"train_loss": -6.9054107666015625, "global_step": 177202, "epoch": 4219} {"train_loss": -7.0059404373168945, "global_step": 177203, "epoch": 4219} {"train_loss": -6.96177339553833, "global_step": 177204, "epoch": 4219} {"train_loss": -7.142195701599121, "global_step": 177205, "epoch": 4219} {"train_loss": -7.105083465576172, "global_step": 177206, "epoch": 4219} {"train_loss": -7.119414329528809, "global_step": 177207, "epoch": 4219} {"train_loss": -7.027500152587891, "global_step": 177208, "epoch": 4219} {"train_loss": -7.059791564941406, "global_step": 177209, "epoch": 4219} {"train_loss": -6.943231582641602, "global_step": 177210, "epoch": 4219} {"train_loss": -7.080204486846924, "global_step": 177211, "epoch": 4219} {"train_loss": -7.1016106605529785, "global_step": 177212, "epoch": 4219} {"train_loss": -7.062555313110352, "global_step": 177213, "epoch": 4219} {"train_loss": -6.983664512634277, "global_step": 177214, "epoch": 4219} {"train_loss": -7.010634422302246, "global_step": 177215, "epoch": 4219} {"train_loss": -7.01781702041626, "global_step": 177216, "epoch": 4219} {"train_loss": -6.9492034912109375, "global_step": 177217, "epoch": 4219} {"train_loss": -7.006161689758301, "global_step": 177218, "epoch": 4219} {"train_loss": -7.021612167358398, "global_step": 177219, "epoch": 4219} {"train_loss": -6.97510290145874, "global_step": 177220, "epoch": 4219} {"train_loss": -7.066323280334473, "global_step": 177221, "epoch": 4219} {"train_loss": -7.115995407104492, "global_step": 177222, "epoch": 4219} {"train_loss": -7.094820022583008, "global_step": 177223, "epoch": 4219} {"train_loss": -7.038543701171875, "global_step": 177224, "epoch": 4219} {"train_loss": -7.109677314758301, "global_step": 177225, "epoch": 4219} {"train_loss": -7.0685930252075195, "global_step": 177226, "epoch": 4219} {"train_loss": -7.113073348999023, "global_step": 177227, "epoch": 4219} {"train_loss": -7.185817241668701, "global_step": 177228, "epoch": 4219} {"train_loss": -7.012035846710205, "global_step": 177229, "epoch": 4219} {"train_loss": -7.21062707901001, "global_step": 177230, "epoch": 4219} {"train_loss": -7.071834564208984, "global_step": 177231, "epoch": 4219} {"train_loss": -7.072015762329102, "global_step": 177232, "epoch": 4219} {"train_loss": -7.0554118156433105, "global_step": 177233, "epoch": 4219} {"train_loss": -6.922155380249023, "global_step": 177234, "epoch": 4219} {"train_loss": -6.956255912780762, "global_step": 177235, "epoch": 4219} {"train_loss": -7.059975624084473, "global_step": 177236, "epoch": 4219} {"train_loss": -6.998177528381348, "global_step": 177237, "epoch": 4219} {"train_loss": -6.955528259277344, "global_step": 177238, "epoch": 4219} {"train_loss": -7.043389604205177, "global_step": 177239, "epoch": 4219, "val_loss": 69045.359375} {"train_loss": -7.070934772491455, "global_step": 177240, "epoch": 4220} {"train_loss": -7.08944034576416, "global_step": 177241, "epoch": 4220} {"train_loss": -7.034441947937012, "global_step": 177242, "epoch": 4220} {"train_loss": -7.112684726715088, "global_step": 177243, "epoch": 4220} {"train_loss": -6.997442245483398, "global_step": 177244, "epoch": 4220} {"train_loss": -7.068955421447754, "global_step": 177245, "epoch": 4220} {"train_loss": -7.133496284484863, "global_step": 177246, "epoch": 4220} {"train_loss": -7.149563789367676, "global_step": 177247, "epoch": 4220} {"train_loss": -7.070246696472168, "global_step": 177248, "epoch": 4220} {"train_loss": -7.064348220825195, "global_step": 177249, "epoch": 4220} {"train_loss": -7.143324375152588, "global_step": 177250, "epoch": 4220} {"train_loss": -7.071565628051758, "global_step": 177251, "epoch": 4220} {"train_loss": -7.0765228271484375, "global_step": 177252, "epoch": 4220} {"train_loss": -7.08718204498291, "global_step": 177253, "epoch": 4220} {"train_loss": -7.168022155761719, "global_step": 177254, "epoch": 4220} {"train_loss": -7.085146903991699, "global_step": 177255, "epoch": 4220} {"train_loss": -7.150813579559326, "global_step": 177256, "epoch": 4220} {"train_loss": -7.1219940185546875, "global_step": 177257, "epoch": 4220} {"train_loss": -7.072652816772461, "global_step": 177258, "epoch": 4220} {"train_loss": -7.087738513946533, "global_step": 177259, "epoch": 4220} {"train_loss": -7.1464338302612305, "global_step": 177260, "epoch": 4220} {"train_loss": -7.2114949226379395, "global_step": 177261, "epoch": 4220} {"train_loss": -7.082274436950684, "global_step": 177262, "epoch": 4220} {"train_loss": -7.184042930603027, "global_step": 177263, "epoch": 4220} {"train_loss": -7.097107887268066, "global_step": 177264, "epoch": 4220} {"train_loss": -7.07399845123291, "global_step": 177265, "epoch": 4220} {"train_loss": -7.134444236755371, "global_step": 177266, "epoch": 4220} {"train_loss": -7.190483093261719, "global_step": 177267, "epoch": 4220} {"train_loss": -7.076111793518066, "global_step": 177268, "epoch": 4220} {"train_loss": -7.184806823730469, "global_step": 177269, "epoch": 4220} {"train_loss": -7.104006290435791, "global_step": 177270, "epoch": 4220} {"train_loss": -7.172603607177734, "global_step": 177271, "epoch": 4220} {"train_loss": -7.014125347137451, "global_step": 177272, "epoch": 4220} {"train_loss": -7.0818305015563965, "global_step": 177273, "epoch": 4220} {"train_loss": -7.104994773864746, "global_step": 177274, "epoch": 4220} {"train_loss": -7.0673370361328125, "global_step": 177275, "epoch": 4220} {"train_loss": -7.145282745361328, "global_step": 177276, "epoch": 4220} {"train_loss": -7.0778913497924805, "global_step": 177277, "epoch": 4220} {"train_loss": -7.096297264099121, "global_step": 177278, "epoch": 4220} {"train_loss": -7.095525741577148, "global_step": 177279, "epoch": 4220} {"train_loss": -7.077481269836426, "global_step": 177280, "epoch": 4220} {"train_loss": -7.103047416323707, "global_step": 177281, "epoch": 4220, "val_loss": 69236.875} {"train_loss": -7.06291389465332, "global_step": 177282, "epoch": 4221} {"train_loss": -7.073965072631836, "global_step": 177283, "epoch": 4221} {"train_loss": -7.135062217712402, "global_step": 177284, "epoch": 4221} {"train_loss": -7.136463165283203, "global_step": 177285, "epoch": 4221} {"train_loss": -7.148600101470947, "global_step": 177286, "epoch": 4221} {"train_loss": -7.1543288230896, "global_step": 177287, "epoch": 4221} {"train_loss": -7.228344917297363, "global_step": 177288, "epoch": 4221} {"train_loss": -7.003154754638672, "global_step": 177289, "epoch": 4221} {"train_loss": -7.129553318023682, "global_step": 177290, "epoch": 4221} {"train_loss": -7.132486820220947, "global_step": 177291, "epoch": 4221} {"train_loss": -7.1400628089904785, "global_step": 177292, "epoch": 4221} {"train_loss": -7.092052459716797, "global_step": 177293, "epoch": 4221} {"train_loss": -7.115479469299316, "global_step": 177294, "epoch": 4221} {"train_loss": -7.082408905029297, "global_step": 177295, "epoch": 4221} {"train_loss": -7.183755874633789, "global_step": 177296, "epoch": 4221} {"train_loss": -7.227881908416748, "global_step": 177297, "epoch": 4221} {"train_loss": -7.059957504272461, "global_step": 177298, "epoch": 4221} {"train_loss": -7.110663414001465, "global_step": 177299, "epoch": 4221} {"train_loss": -7.113029479980469, "global_step": 177300, "epoch": 4221} {"train_loss": -7.119692802429199, "global_step": 177301, "epoch": 4221} {"train_loss": -7.141409873962402, "global_step": 177302, "epoch": 4221} {"train_loss": -7.002577781677246, "global_step": 177303, "epoch": 4221} {"train_loss": -7.218249320983887, "global_step": 177304, "epoch": 4221} {"train_loss": -7.133752822875977, "global_step": 177305, "epoch": 4221} {"train_loss": -6.976045608520508, "global_step": 177306, "epoch": 4221} {"train_loss": -7.129879474639893, "global_step": 177307, "epoch": 4221} {"train_loss": -7.154128551483154, "global_step": 177308, "epoch": 4221} {"train_loss": -7.1374335289001465, "global_step": 177309, "epoch": 4221} {"train_loss": -7.068674087524414, "global_step": 177310, "epoch": 4221} {"train_loss": -7.072177886962891, "global_step": 177311, "epoch": 4221} {"train_loss": -7.0093207359313965, "global_step": 177312, "epoch": 4221} {"train_loss": -7.148303985595703, "global_step": 177313, "epoch": 4221} {"train_loss": -7.1456146240234375, "global_step": 177314, "epoch": 4221} {"train_loss": -7.188261985778809, "global_step": 177315, "epoch": 4221} {"train_loss": -6.9873175621032715, "global_step": 177316, "epoch": 4221} {"train_loss": -6.999175548553467, "global_step": 177317, "epoch": 4221} {"train_loss": -7.1417107582092285, "global_step": 177318, "epoch": 4221} {"train_loss": -6.996914863586426, "global_step": 177319, "epoch": 4221} {"train_loss": -6.887897491455078, "global_step": 177320, "epoch": 4221} {"train_loss": -7.140293598175049, "global_step": 177321, "epoch": 4221} {"train_loss": -7.014212608337402, "global_step": 177322, "epoch": 4221} {"train_loss": -7.101918697357178, "global_step": 177323, "epoch": 4221, "val_loss": 69238.125} {"train_loss": -7.0829267501831055, "global_step": 177324, "epoch": 4222} {"train_loss": -7.0041961669921875, "global_step": 177325, "epoch": 4222} {"train_loss": -6.963757514953613, "global_step": 177326, "epoch": 4222} {"train_loss": -7.00546407699585, "global_step": 177327, "epoch": 4222} {"train_loss": -7.0495686531066895, "global_step": 177328, "epoch": 4222} {"train_loss": -7.014859199523926, "global_step": 177329, "epoch": 4222} {"train_loss": -7.1175971031188965, "global_step": 177330, "epoch": 4222} {"train_loss": -7.095186710357666, "global_step": 177331, "epoch": 4222} {"train_loss": -7.0264201164245605, "global_step": 177332, "epoch": 4222} {"train_loss": -6.976090431213379, "global_step": 177333, "epoch": 4222} {"train_loss": -6.970439910888672, "global_step": 177334, "epoch": 4222} {"train_loss": -7.072947025299072, "global_step": 177335, "epoch": 4222} {"train_loss": -7.0225090980529785, "global_step": 177336, "epoch": 4222} {"train_loss": -7.048468589782715, "global_step": 177337, "epoch": 4222} {"train_loss": -7.078152656555176, "global_step": 177338, "epoch": 4222} {"train_loss": -7.032378196716309, "global_step": 177339, "epoch": 4222} {"train_loss": -7.158876419067383, "global_step": 177340, "epoch": 4222} {"train_loss": -7.114403247833252, "global_step": 177341, "epoch": 4222} {"train_loss": -7.1566572189331055, "global_step": 177342, "epoch": 4222} {"train_loss": -6.976293563842773, "global_step": 177343, "epoch": 4222} {"train_loss": -7.109645366668701, "global_step": 177344, "epoch": 4222} {"train_loss": -7.114961624145508, "global_step": 177345, "epoch": 4222} {"train_loss": -7.153751373291016, "global_step": 177346, "epoch": 4222} {"train_loss": -7.025149345397949, "global_step": 177347, "epoch": 4222} {"train_loss": -7.12103796005249, "global_step": 177348, "epoch": 4222} {"train_loss": -7.1454572677612305, "global_step": 177349, "epoch": 4222} {"train_loss": -7.161110877990723, "global_step": 177350, "epoch": 4222} {"train_loss": -7.161611557006836, "global_step": 177351, "epoch": 4222} {"train_loss": -7.151818752288818, "global_step": 177352, "epoch": 4222} {"train_loss": -7.096250534057617, "global_step": 177353, "epoch": 4222} {"train_loss": -7.1646904945373535, "global_step": 177354, "epoch": 4222} {"train_loss": -7.141066074371338, "global_step": 177355, "epoch": 4222} {"train_loss": -7.153816223144531, "global_step": 177356, "epoch": 4222} {"train_loss": -7.149191856384277, "global_step": 177357, "epoch": 4222} {"train_loss": -7.023890972137451, "global_step": 177358, "epoch": 4222} {"train_loss": -6.985233306884766, "global_step": 177359, "epoch": 4222} {"train_loss": -7.045778274536133, "global_step": 177360, "epoch": 4222} {"train_loss": -7.102643013000488, "global_step": 177361, "epoch": 4222} {"train_loss": -7.006077766418457, "global_step": 177362, "epoch": 4222} {"train_loss": -7.1409196853637695, "global_step": 177363, "epoch": 4222} {"train_loss": -7.1199164390563965, "global_step": 177364, "epoch": 4222} {"train_loss": -7.076701221011934, "global_step": 177365, "epoch": 4222, "val_loss": 69338.875} {"train_loss": -7.015209197998047, "global_step": 177366, "epoch": 4223} {"train_loss": -7.1135945320129395, "global_step": 177367, "epoch": 4223} {"train_loss": -7.045876502990723, "global_step": 177368, "epoch": 4223} {"train_loss": -6.984130859375, "global_step": 177369, "epoch": 4223} {"train_loss": -7.066205978393555, "global_step": 177370, "epoch": 4223} {"train_loss": -7.015052795410156, "global_step": 177371, "epoch": 4223} {"train_loss": -7.048702239990234, "global_step": 177372, "epoch": 4223} {"train_loss": -6.955061912536621, "global_step": 177373, "epoch": 4223} {"train_loss": -7.01498556137085, "global_step": 177374, "epoch": 4223} {"train_loss": -7.12396764755249, "global_step": 177375, "epoch": 4223} {"train_loss": -7.0519304275512695, "global_step": 177376, "epoch": 4223} {"train_loss": -7.0859575271606445, "global_step": 177377, "epoch": 4223} {"train_loss": -6.987983703613281, "global_step": 177378, "epoch": 4223} {"train_loss": -7.055569171905518, "global_step": 177379, "epoch": 4223} {"train_loss": -7.138053894042969, "global_step": 177380, "epoch": 4223} {"train_loss": -7.148407936096191, "global_step": 177381, "epoch": 4223} {"train_loss": -7.145449638366699, "global_step": 177382, "epoch": 4223} {"train_loss": -7.074386119842529, "global_step": 177383, "epoch": 4223} {"train_loss": -7.061330795288086, "global_step": 177384, "epoch": 4223} {"train_loss": -7.052187919616699, "global_step": 177385, "epoch": 4223} {"train_loss": -6.995410919189453, "global_step": 177386, "epoch": 4223} {"train_loss": -6.925577640533447, "global_step": 177387, "epoch": 4223} {"train_loss": -7.132646083831787, "global_step": 177388, "epoch": 4223} {"train_loss": -7.093480587005615, "global_step": 177389, "epoch": 4223} {"train_loss": -7.098781108856201, "global_step": 177390, "epoch": 4223} {"train_loss": -7.007100582122803, "global_step": 177391, "epoch": 4223} {"train_loss": -7.061785697937012, "global_step": 177392, "epoch": 4223} {"train_loss": -7.091714859008789, "global_step": 177393, "epoch": 4223} {"train_loss": -7.083912372589111, "global_step": 177394, "epoch": 4223} {"train_loss": -7.040309906005859, "global_step": 177395, "epoch": 4223} {"train_loss": -6.951560020446777, "global_step": 177396, "epoch": 4223} {"train_loss": -7.156270980834961, "global_step": 177397, "epoch": 4223} {"train_loss": -7.055034637451172, "global_step": 177398, "epoch": 4223} {"train_loss": -7.099794387817383, "global_step": 177399, "epoch": 4223} {"train_loss": -7.083418846130371, "global_step": 177400, "epoch": 4223} {"train_loss": -7.125133514404297, "global_step": 177401, "epoch": 4223} {"train_loss": -7.064019203186035, "global_step": 177402, "epoch": 4223} {"train_loss": -7.037336826324463, "global_step": 177403, "epoch": 4223} {"train_loss": -6.940959930419922, "global_step": 177404, "epoch": 4223} {"train_loss": -7.032773971557617, "global_step": 177405, "epoch": 4223} {"train_loss": -7.015292167663574, "global_step": 177406, "epoch": 4223} {"train_loss": -7.057615677515666, "global_step": 177407, "epoch": 4223, "val_loss": 69285.2578125} {"train_loss": -7.097655296325684, "global_step": 177408, "epoch": 4224} {"train_loss": -6.983083248138428, "global_step": 177409, "epoch": 4224} {"train_loss": -6.960111618041992, "global_step": 177410, "epoch": 4224} {"train_loss": -7.071063041687012, "global_step": 177411, "epoch": 4224} {"train_loss": -6.900444984436035, "global_step": 177412, "epoch": 4224} {"train_loss": -7.0734758377075195, "global_step": 177413, "epoch": 4224} {"train_loss": -7.0916666984558105, "global_step": 177414, "epoch": 4224} {"train_loss": -6.946420669555664, "global_step": 177415, "epoch": 4224} {"train_loss": -7.01190185546875, "global_step": 177416, "epoch": 4224} {"train_loss": -7.070065975189209, "global_step": 177417, "epoch": 4224} {"train_loss": -7.134696960449219, "global_step": 177418, "epoch": 4224} {"train_loss": -7.0054931640625, "global_step": 177419, "epoch": 4224} {"train_loss": -7.021301746368408, "global_step": 177420, "epoch": 4224} {"train_loss": -7.069089889526367, "global_step": 177421, "epoch": 4224} {"train_loss": -7.007781982421875, "global_step": 177422, "epoch": 4224} {"train_loss": -7.114974021911621, "global_step": 177423, "epoch": 4224} {"train_loss": -7.073921203613281, "global_step": 177424, "epoch": 4224} {"train_loss": -6.984549522399902, "global_step": 177425, "epoch": 4224} {"train_loss": -6.915396690368652, "global_step": 177426, "epoch": 4224} {"train_loss": -6.862580299377441, "global_step": 177427, "epoch": 4224} {"train_loss": -6.994368553161621, "global_step": 177428, "epoch": 4224} {"train_loss": -6.984218597412109, "global_step": 177429, "epoch": 4224} {"train_loss": -6.78734016418457, "global_step": 177430, "epoch": 4224} {"train_loss": -6.95977258682251, "global_step": 177431, "epoch": 4224} {"train_loss": -7.011160850524902, "global_step": 177432, "epoch": 4224} {"train_loss": -6.9348626136779785, "global_step": 177433, "epoch": 4224} {"train_loss": -7.01438045501709, "global_step": 177434, "epoch": 4224} {"train_loss": -6.792657375335693, "global_step": 177435, "epoch": 4224} {"train_loss": -6.762739181518555, "global_step": 177436, "epoch": 4224} {"train_loss": -6.951181411743164, "global_step": 177437, "epoch": 4224} {"train_loss": -6.856776237487793, "global_step": 177438, "epoch": 4224} {"train_loss": -6.899957180023193, "global_step": 177439, "epoch": 4224} {"train_loss": -7.102196216583252, "global_step": 177440, "epoch": 4224} {"train_loss": -7.009001731872559, "global_step": 177441, "epoch": 4224} {"train_loss": -6.980221271514893, "global_step": 177442, "epoch": 4224} {"train_loss": -7.107340335845947, "global_step": 177443, "epoch": 4224} {"train_loss": -6.995576858520508, "global_step": 177444, "epoch": 4224} {"train_loss": -7.059521198272705, "global_step": 177445, "epoch": 4224} {"train_loss": -6.994794845581055, "global_step": 177446, "epoch": 4224} {"train_loss": -7.144783973693848, "global_step": 177447, "epoch": 4224} {"train_loss": -6.961447715759277, "global_step": 177448, "epoch": 4224} {"train_loss": -6.992982762200492, "global_step": 177449, "epoch": 4224, "val_loss": 69240.6875} {"train_loss": -6.966509819030762, "global_step": 177450, "epoch": 4225} {"train_loss": -7.063037872314453, "global_step": 177451, "epoch": 4225} {"train_loss": -7.049727439880371, "global_step": 177452, "epoch": 4225} {"train_loss": -7.037350654602051, "global_step": 177453, "epoch": 4225} {"train_loss": -6.9962873458862305, "global_step": 177454, "epoch": 4225} {"train_loss": -7.127281665802002, "global_step": 177455, "epoch": 4225} {"train_loss": -6.983579635620117, "global_step": 177456, "epoch": 4225} {"train_loss": -7.145740985870361, "global_step": 177457, "epoch": 4225} {"train_loss": -7.083528518676758, "global_step": 177458, "epoch": 4225} {"train_loss": -6.970992565155029, "global_step": 177459, "epoch": 4225} {"train_loss": -7.10381555557251, "global_step": 177460, "epoch": 4225} {"train_loss": -6.854902267456055, "global_step": 177461, "epoch": 4225} {"train_loss": -6.844581604003906, "global_step": 177462, "epoch": 4225} {"train_loss": -7.109855651855469, "global_step": 177463, "epoch": 4225} {"train_loss": -6.970877170562744, "global_step": 177464, "epoch": 4225} {"train_loss": -7.086062431335449, "global_step": 177465, "epoch": 4225} {"train_loss": -7.030479431152344, "global_step": 177466, "epoch": 4225} {"train_loss": -7.012231349945068, "global_step": 177467, "epoch": 4225} {"train_loss": -6.976856231689453, "global_step": 177468, "epoch": 4225} {"train_loss": -6.977530002593994, "global_step": 177469, "epoch": 4225} {"train_loss": -7.081968307495117, "global_step": 177470, "epoch": 4225} {"train_loss": -6.927373886108398, "global_step": 177471, "epoch": 4225} {"train_loss": -6.891880035400391, "global_step": 177472, "epoch": 4225} {"train_loss": -6.9850592613220215, "global_step": 177473, "epoch": 4225} {"train_loss": -6.969142913818359, "global_step": 177474, "epoch": 4225} {"train_loss": -7.004776954650879, "global_step": 177475, "epoch": 4225} {"train_loss": -6.968923091888428, "global_step": 177476, "epoch": 4225} {"train_loss": -6.976895332336426, "global_step": 177477, "epoch": 4225} {"train_loss": -7.047675132751465, "global_step": 177478, "epoch": 4225} {"train_loss": -7.1199140548706055, "global_step": 177479, "epoch": 4225} {"train_loss": -7.024471282958984, "global_step": 177480, "epoch": 4225} {"train_loss": -7.1214919090271, "global_step": 177481, "epoch": 4225} {"train_loss": -7.066261291503906, "global_step": 177482, "epoch": 4225} {"train_loss": -7.066806793212891, "global_step": 177483, "epoch": 4225} {"train_loss": -7.105464935302734, "global_step": 177484, "epoch": 4225} {"train_loss": -7.130127906799316, "global_step": 177485, "epoch": 4225} {"train_loss": -7.267570495605469, "global_step": 177486, "epoch": 4225} {"train_loss": -7.147263526916504, "global_step": 177487, "epoch": 4225} {"train_loss": -7.171595573425293, "global_step": 177488, "epoch": 4225} {"train_loss": -7.017111778259277, "global_step": 177489, "epoch": 4225} {"train_loss": -7.137089729309082, "global_step": 177490, "epoch": 4225} {"train_loss": -7.039476462772915, "global_step": 177491, "epoch": 4225, "val_loss": 69231.8984375} {"train_loss": -7.13232946395874, "global_step": 177492, "epoch": 4226} {"train_loss": -7.207083702087402, "global_step": 177493, "epoch": 4226} {"train_loss": -7.128098011016846, "global_step": 177494, "epoch": 4226} {"train_loss": -7.138894557952881, "global_step": 177495, "epoch": 4226} {"train_loss": -7.183436393737793, "global_step": 177496, "epoch": 4226} {"train_loss": -7.127165794372559, "global_step": 177497, "epoch": 4226} {"train_loss": -7.131958961486816, "global_step": 177498, "epoch": 4226} {"train_loss": -7.239509582519531, "global_step": 177499, "epoch": 4226} {"train_loss": -7.157454967498779, "global_step": 177500, "epoch": 4226} {"train_loss": -7.161297798156738, "global_step": 177501, "epoch": 4226} {"train_loss": -7.172009468078613, "global_step": 177502, "epoch": 4226} {"train_loss": -7.071228981018066, "global_step": 177503, "epoch": 4226} {"train_loss": -7.175685882568359, "global_step": 177504, "epoch": 4226} {"train_loss": -7.110592365264893, "global_step": 177505, "epoch": 4226} {"train_loss": -7.132524490356445, "global_step": 177506, "epoch": 4226} {"train_loss": -7.179757118225098, "global_step": 177507, "epoch": 4226} {"train_loss": -7.2221760749816895, "global_step": 177508, "epoch": 4226} {"train_loss": -7.144611358642578, "global_step": 177509, "epoch": 4226} {"train_loss": -7.091490745544434, "global_step": 177510, "epoch": 4226} {"train_loss": -7.041687965393066, "global_step": 177511, "epoch": 4226} {"train_loss": -7.185949325561523, "global_step": 177512, "epoch": 4226} {"train_loss": -7.166994094848633, "global_step": 177513, "epoch": 4226} {"train_loss": -7.03926420211792, "global_step": 177514, "epoch": 4226} {"train_loss": -7.162888050079346, "global_step": 177515, "epoch": 4226} {"train_loss": -7.127105712890625, "global_step": 177516, "epoch": 4226} {"train_loss": -7.150235652923584, "global_step": 177517, "epoch": 4226} {"train_loss": -7.1039323806762695, "global_step": 177518, "epoch": 4226} {"train_loss": -7.201008319854736, "global_step": 177519, "epoch": 4226} {"train_loss": -7.172161102294922, "global_step": 177520, "epoch": 4226} {"train_loss": -7.0352067947387695, "global_step": 177521, "epoch": 4226} {"train_loss": -7.040438652038574, "global_step": 177522, "epoch": 4226} {"train_loss": -7.153212547302246, "global_step": 177523, "epoch": 4226} {"train_loss": -7.154420852661133, "global_step": 177524, "epoch": 4226} {"train_loss": -7.129456520080566, "global_step": 177525, "epoch": 4226} {"train_loss": -7.237719535827637, "global_step": 177526, "epoch": 4226} {"train_loss": -7.11325216293335, "global_step": 177527, "epoch": 4226} {"train_loss": -7.112604141235352, "global_step": 177528, "epoch": 4226} {"train_loss": -7.122304916381836, "global_step": 177529, "epoch": 4226} {"train_loss": -7.155529022216797, "global_step": 177530, "epoch": 4226} {"train_loss": -7.128710746765137, "global_step": 177531, "epoch": 4226} {"train_loss": -7.151861190795898, "global_step": 177532, "epoch": 4226} {"train_loss": -7.142932903198969, "global_step": 177533, "epoch": 4226, "val_loss": 69104.78125} {"train_loss": -7.215045928955078, "global_step": 177534, "epoch": 4227} {"train_loss": -7.092367172241211, "global_step": 177535, "epoch": 4227} {"train_loss": -7.14285135269165, "global_step": 177536, "epoch": 4227} {"train_loss": -7.272981643676758, "global_step": 177537, "epoch": 4227} {"train_loss": -7.100956916809082, "global_step": 177538, "epoch": 4227} {"train_loss": -7.213897705078125, "global_step": 177539, "epoch": 4227} {"train_loss": -7.059844017028809, "global_step": 177540, "epoch": 4227} {"train_loss": -7.175447940826416, "global_step": 177541, "epoch": 4227} {"train_loss": -7.135698318481445, "global_step": 177542, "epoch": 4227} {"train_loss": -7.235215187072754, "global_step": 177543, "epoch": 4227} {"train_loss": -7.057019233703613, "global_step": 177544, "epoch": 4227} {"train_loss": -7.176906585693359, "global_step": 177545, "epoch": 4227} {"train_loss": -7.097682476043701, "global_step": 177546, "epoch": 4227} {"train_loss": -7.031796932220459, "global_step": 177547, "epoch": 4227} {"train_loss": -7.25079345703125, "global_step": 177548, "epoch": 4227} {"train_loss": -7.17720365524292, "global_step": 177549, "epoch": 4227} {"train_loss": -7.1798200607299805, "global_step": 177550, "epoch": 4227} {"train_loss": -7.1434197425842285, "global_step": 177551, "epoch": 4227} {"train_loss": -7.114532947540283, "global_step": 177552, "epoch": 4227} {"train_loss": -6.99412727355957, "global_step": 177553, "epoch": 4227} {"train_loss": -7.158987998962402, "global_step": 177554, "epoch": 4227} {"train_loss": -7.077304840087891, "global_step": 177555, "epoch": 4227} {"train_loss": -6.7433061599731445, "global_step": 177556, "epoch": 4227} {"train_loss": -7.121109962463379, "global_step": 177557, "epoch": 4227} {"train_loss": -7.049724102020264, "global_step": 177558, "epoch": 4227} {"train_loss": -6.940005302429199, "global_step": 177559, "epoch": 4227} {"train_loss": -7.0148468017578125, "global_step": 177560, "epoch": 4227} {"train_loss": -7.139754295349121, "global_step": 177561, "epoch": 4227} {"train_loss": -7.135044574737549, "global_step": 177562, "epoch": 4227} {"train_loss": -7.0826263427734375, "global_step": 177563, "epoch": 4227} {"train_loss": -7.03623104095459, "global_step": 177564, "epoch": 4227} {"train_loss": -7.137523651123047, "global_step": 177565, "epoch": 4227} {"train_loss": -7.073484420776367, "global_step": 177566, "epoch": 4227} {"train_loss": -7.025040626525879, "global_step": 177567, "epoch": 4227} {"train_loss": -7.03084659576416, "global_step": 177568, "epoch": 4227} {"train_loss": -6.967360019683838, "global_step": 177569, "epoch": 4227} {"train_loss": -7.127259254455566, "global_step": 177570, "epoch": 4227} {"train_loss": -7.009564399719238, "global_step": 177571, "epoch": 4227} {"train_loss": -7.159809589385986, "global_step": 177572, "epoch": 4227} {"train_loss": -7.129265785217285, "global_step": 177573, "epoch": 4227} {"train_loss": -6.997909069061279, "global_step": 177574, "epoch": 4227} {"train_loss": -7.098143384570167, "global_step": 177575, "epoch": 4227, "val_loss": 69245.015625} {"train_loss": -7.165903568267822, "global_step": 177576, "epoch": 4228} {"train_loss": -6.959622383117676, "global_step": 177577, "epoch": 4228} {"train_loss": -7.106175422668457, "global_step": 177578, "epoch": 4228} {"train_loss": -7.005524635314941, "global_step": 177579, "epoch": 4228} {"train_loss": -7.106858253479004, "global_step": 177580, "epoch": 4228} {"train_loss": -7.169350624084473, "global_step": 177581, "epoch": 4228} {"train_loss": -7.040772438049316, "global_step": 177582, "epoch": 4228} {"train_loss": -7.080974102020264, "global_step": 177583, "epoch": 4228} {"train_loss": -7.053091526031494, "global_step": 177584, "epoch": 4228} {"train_loss": -6.964362144470215, "global_step": 177585, "epoch": 4228} {"train_loss": -7.185894966125488, "global_step": 177586, "epoch": 4228} {"train_loss": -6.949011325836182, "global_step": 177587, "epoch": 4228} {"train_loss": -7.079827308654785, "global_step": 177588, "epoch": 4228} {"train_loss": -7.11091423034668, "global_step": 177589, "epoch": 4228} {"train_loss": -6.889840126037598, "global_step": 177590, "epoch": 4228} {"train_loss": -7.007586479187012, "global_step": 177591, "epoch": 4228} {"train_loss": -6.903636932373047, "global_step": 177592, "epoch": 4228} {"train_loss": -6.940891742706299, "global_step": 177593, "epoch": 4228} {"train_loss": -7.093016147613525, "global_step": 177594, "epoch": 4228} {"train_loss": -7.065673828125, "global_step": 177595, "epoch": 4228} {"train_loss": -7.087736129760742, "global_step": 177596, "epoch": 4228} {"train_loss": -7.001646041870117, "global_step": 177597, "epoch": 4228} {"train_loss": -7.09013032913208, "global_step": 177598, "epoch": 4228} {"train_loss": -7.060819625854492, "global_step": 177599, "epoch": 4228} {"train_loss": -7.065469264984131, "global_step": 177600, "epoch": 4228} {"train_loss": -7.091490268707275, "global_step": 177601, "epoch": 4228} {"train_loss": -7.062160491943359, "global_step": 177602, "epoch": 4228} {"train_loss": -7.093850135803223, "global_step": 177603, "epoch": 4228} {"train_loss": -6.983366012573242, "global_step": 177604, "epoch": 4228} {"train_loss": -6.902157783508301, "global_step": 177605, "epoch": 4228} {"train_loss": -7.030396461486816, "global_step": 177606, "epoch": 4228} {"train_loss": -6.902688026428223, "global_step": 177607, "epoch": 4228} {"train_loss": -6.961745262145996, "global_step": 177608, "epoch": 4228} {"train_loss": -7.082035064697266, "global_step": 177609, "epoch": 4228} {"train_loss": -7.011809349060059, "global_step": 177610, "epoch": 4228} {"train_loss": -7.010201454162598, "global_step": 177611, "epoch": 4228} {"train_loss": -7.259708404541016, "global_step": 177612, "epoch": 4228} {"train_loss": -7.057146072387695, "global_step": 177613, "epoch": 4228} {"train_loss": -7.0837016105651855, "global_step": 177614, "epoch": 4228} {"train_loss": -7.065946578979492, "global_step": 177615, "epoch": 4228} {"train_loss": -7.080784797668457, "global_step": 177616, "epoch": 4228} {"train_loss": -7.047918796539307, "global_step": 177617, "epoch": 4228, "val_loss": 69405.53125} {"train_loss": -7.0914306640625, "global_step": 177618, "epoch": 4229} {"train_loss": -7.125205039978027, "global_step": 177619, "epoch": 4229} {"train_loss": -7.120862007141113, "global_step": 177620, "epoch": 4229} {"train_loss": -6.96150016784668, "global_step": 177621, "epoch": 4229} {"train_loss": -7.196760654449463, "global_step": 177622, "epoch": 4229} {"train_loss": -7.1997270584106445, "global_step": 177623, "epoch": 4229} {"train_loss": -7.1770124435424805, "global_step": 177624, "epoch": 4229} {"train_loss": -7.0649871826171875, "global_step": 177625, "epoch": 4229} {"train_loss": -7.148496627807617, "global_step": 177626, "epoch": 4229} {"train_loss": -7.213265895843506, "global_step": 177627, "epoch": 4229} {"train_loss": -7.168824195861816, "global_step": 177628, "epoch": 4229} {"train_loss": -7.0671281814575195, "global_step": 177629, "epoch": 4229} {"train_loss": -7.108979225158691, "global_step": 177630, "epoch": 4229} {"train_loss": -7.0964179039001465, "global_step": 177631, "epoch": 4229} {"train_loss": -7.215028762817383, "global_step": 177632, "epoch": 4229} {"train_loss": -7.10639762878418, "global_step": 177633, "epoch": 4229} {"train_loss": -7.053241729736328, "global_step": 177634, "epoch": 4229} {"train_loss": -7.114026069641113, "global_step": 177635, "epoch": 4229} {"train_loss": -7.102893829345703, "global_step": 177636, "epoch": 4229} {"train_loss": -7.114636421203613, "global_step": 177637, "epoch": 4229} {"train_loss": -7.150057792663574, "global_step": 177638, "epoch": 4229} {"train_loss": -7.045165061950684, "global_step": 177639, "epoch": 4229} {"train_loss": -7.144026279449463, "global_step": 177640, "epoch": 4229} {"train_loss": -7.153902530670166, "global_step": 177641, "epoch": 4229} {"train_loss": -7.025358200073242, "global_step": 177642, "epoch": 4229} {"train_loss": -7.073003768920898, "global_step": 177643, "epoch": 4229} {"train_loss": -7.089944839477539, "global_step": 177644, "epoch": 4229} {"train_loss": -7.0305938720703125, "global_step": 177645, "epoch": 4229} {"train_loss": -7.125778675079346, "global_step": 177646, "epoch": 4229} {"train_loss": -7.035634994506836, "global_step": 177647, "epoch": 4229} {"train_loss": -7.07493257522583, "global_step": 177648, "epoch": 4229} {"train_loss": -7.120849609375, "global_step": 177649, "epoch": 4229} {"train_loss": -7.121173858642578, "global_step": 177650, "epoch": 4229} {"train_loss": -7.155252456665039, "global_step": 177651, "epoch": 4229} {"train_loss": -7.151869773864746, "global_step": 177652, "epoch": 4229} {"train_loss": -7.0845465660095215, "global_step": 177653, "epoch": 4229} {"train_loss": -7.214155197143555, "global_step": 177654, "epoch": 4229} {"train_loss": -7.219099998474121, "global_step": 177655, "epoch": 4229} {"train_loss": -7.2149810791015625, "global_step": 177656, "epoch": 4229} {"train_loss": -7.294751167297363, "global_step": 177657, "epoch": 4229} {"train_loss": -7.177877902984619, "global_step": 177658, "epoch": 4229} {"train_loss": -7.12447316305978, "global_step": 177659, "epoch": 4229, "val_loss": 69189.875} {"train_loss": -7.301266670227051, "global_step": 177660, "epoch": 4230} {"train_loss": -6.983928680419922, "global_step": 177661, "epoch": 4230} {"train_loss": -7.162275791168213, "global_step": 177662, "epoch": 4230} {"train_loss": -7.084904670715332, "global_step": 177663, "epoch": 4230} {"train_loss": -6.946099281311035, "global_step": 177664, "epoch": 4230} {"train_loss": -6.936551094055176, "global_step": 177665, "epoch": 4230} {"train_loss": -7.025806427001953, "global_step": 177666, "epoch": 4230} {"train_loss": -6.937285423278809, "global_step": 177667, "epoch": 4230} {"train_loss": -6.960017204284668, "global_step": 177668, "epoch": 4230} {"train_loss": -7.075263977050781, "global_step": 177669, "epoch": 4230} {"train_loss": -7.034599304199219, "global_step": 177670, "epoch": 4230} {"train_loss": -6.907896041870117, "global_step": 177671, "epoch": 4230} {"train_loss": -7.036562442779541, "global_step": 177672, "epoch": 4230} {"train_loss": -7.0294060707092285, "global_step": 177673, "epoch": 4230} {"train_loss": -7.039604663848877, "global_step": 177674, "epoch": 4230} {"train_loss": -7.04902982711792, "global_step": 177675, "epoch": 4230} {"train_loss": -6.964048385620117, "global_step": 177676, "epoch": 4230} {"train_loss": -7.055727005004883, "global_step": 177677, "epoch": 4230} {"train_loss": -6.903501033782959, "global_step": 177678, "epoch": 4230} {"train_loss": -7.125523567199707, "global_step": 177679, "epoch": 4230} {"train_loss": -6.950958728790283, "global_step": 177680, "epoch": 4230} {"train_loss": -7.078662872314453, "global_step": 177681, "epoch": 4230} {"train_loss": -7.016107559204102, "global_step": 177682, "epoch": 4230} {"train_loss": -7.100508689880371, "global_step": 177683, "epoch": 4230} {"train_loss": -7.061777591705322, "global_step": 177684, "epoch": 4230} {"train_loss": -7.070852279663086, "global_step": 177685, "epoch": 4230} {"train_loss": -7.014095306396484, "global_step": 177686, "epoch": 4230} {"train_loss": -6.974147319793701, "global_step": 177687, "epoch": 4230} {"train_loss": -7.135859489440918, "global_step": 177688, "epoch": 4230} {"train_loss": -7.053030967712402, "global_step": 177689, "epoch": 4230} {"train_loss": -6.9735260009765625, "global_step": 177690, "epoch": 4230} {"train_loss": -7.000246047973633, "global_step": 177691, "epoch": 4230} {"train_loss": -7.047539710998535, "global_step": 177692, "epoch": 4230} {"train_loss": -7.183474540710449, "global_step": 177693, "epoch": 4230} {"train_loss": -7.011777400970459, "global_step": 177694, "epoch": 4230} {"train_loss": -6.928696632385254, "global_step": 177695, "epoch": 4230} {"train_loss": -7.047119140625, "global_step": 177696, "epoch": 4230} {"train_loss": -7.056717395782471, "global_step": 177697, "epoch": 4230} {"train_loss": -7.098608016967773, "global_step": 177698, "epoch": 4230} {"train_loss": -7.170417785644531, "global_step": 177699, "epoch": 4230} {"train_loss": -6.911463737487793, "global_step": 177700, "epoch": 4230} {"train_loss": -7.034183445430937, "global_step": 177701, "epoch": 4230, "val_loss": 69285.0390625} {"train_loss": -7.158574104309082, "global_step": 177702, "epoch": 4231} {"train_loss": -7.077014923095703, "global_step": 177703, "epoch": 4231} {"train_loss": -7.05848503112793, "global_step": 177704, "epoch": 4231} {"train_loss": -7.027774810791016, "global_step": 177705, "epoch": 4231} {"train_loss": -7.142152786254883, "global_step": 177706, "epoch": 4231} {"train_loss": -7.193151473999023, "global_step": 177707, "epoch": 4231} {"train_loss": -7.206899166107178, "global_step": 177708, "epoch": 4231} {"train_loss": -7.190365314483643, "global_step": 177709, "epoch": 4231} {"train_loss": -7.137421131134033, "global_step": 177710, "epoch": 4231} {"train_loss": -7.101166248321533, "global_step": 177711, "epoch": 4231} {"train_loss": -7.18629264831543, "global_step": 177712, "epoch": 4231} {"train_loss": -7.136941909790039, "global_step": 177713, "epoch": 4231} {"train_loss": -7.2229108810424805, "global_step": 177714, "epoch": 4231} {"train_loss": -7.059959411621094, "global_step": 177715, "epoch": 4231} {"train_loss": -7.004631996154785, "global_step": 177716, "epoch": 4231} {"train_loss": -7.07936954498291, "global_step": 177717, "epoch": 4231} {"train_loss": -7.098239898681641, "global_step": 177718, "epoch": 4231} {"train_loss": -7.0083746910095215, "global_step": 177719, "epoch": 4231} {"train_loss": -7.212054252624512, "global_step": 177720, "epoch": 4231} {"train_loss": -7.12722110748291, "global_step": 177721, "epoch": 4231} {"train_loss": -7.055496692657471, "global_step": 177722, "epoch": 4231} {"train_loss": -7.066457748413086, "global_step": 177723, "epoch": 4231} {"train_loss": -7.184587001800537, "global_step": 177724, "epoch": 4231} {"train_loss": -7.167361259460449, "global_step": 177725, "epoch": 4231} {"train_loss": -7.03973388671875, "global_step": 177726, "epoch": 4231} {"train_loss": -7.248040199279785, "global_step": 177727, "epoch": 4231} {"train_loss": -7.232840538024902, "global_step": 177728, "epoch": 4231} {"train_loss": -7.124472618103027, "global_step": 177729, "epoch": 4231} {"train_loss": -7.185720443725586, "global_step": 177730, "epoch": 4231} {"train_loss": -7.212567329406738, "global_step": 177731, "epoch": 4231} {"train_loss": -7.118659496307373, "global_step": 177732, "epoch": 4231} {"train_loss": -7.231860160827637, "global_step": 177733, "epoch": 4231} {"train_loss": -7.1681060791015625, "global_step": 177734, "epoch": 4231} {"train_loss": -7.186503887176514, "global_step": 177735, "epoch": 4231} {"train_loss": -7.171849250793457, "global_step": 177736, "epoch": 4231} {"train_loss": -7.118452548980713, "global_step": 177737, "epoch": 4231} {"train_loss": -7.119498252868652, "global_step": 177738, "epoch": 4231} {"train_loss": -7.1212310791015625, "global_step": 177739, "epoch": 4231} {"train_loss": -7.074805736541748, "global_step": 177740, "epoch": 4231} {"train_loss": -7.169648170471191, "global_step": 177741, "epoch": 4231} {"train_loss": -7.209646224975586, "global_step": 177742, "epoch": 4231} {"train_loss": -7.137891746702648, "global_step": 177743, "epoch": 4231, "val_loss": 69339.484375} {"train_loss": -7.038906574249268, "global_step": 177744, "epoch": 4232} {"train_loss": -7.193473815917969, "global_step": 177745, "epoch": 4232} {"train_loss": -7.284183502197266, "global_step": 177746, "epoch": 4232} {"train_loss": -7.086907863616943, "global_step": 177747, "epoch": 4232} {"train_loss": -7.060483932495117, "global_step": 177748, "epoch": 4232} {"train_loss": -7.122696876525879, "global_step": 177749, "epoch": 4232} {"train_loss": -7.192315101623535, "global_step": 177750, "epoch": 4232} {"train_loss": -7.061797618865967, "global_step": 177751, "epoch": 4232} {"train_loss": -7.1244635581970215, "global_step": 177752, "epoch": 4232} {"train_loss": -7.165401458740234, "global_step": 177753, "epoch": 4232} {"train_loss": -7.134344100952148, "global_step": 177754, "epoch": 4232} {"train_loss": -7.173088550567627, "global_step": 177755, "epoch": 4232} {"train_loss": -7.0905938148498535, "global_step": 177756, "epoch": 4232} {"train_loss": -7.223832130432129, "global_step": 177757, "epoch": 4232} {"train_loss": -7.091526031494141, "global_step": 177758, "epoch": 4232} {"train_loss": -7.076578617095947, "global_step": 177759, "epoch": 4232} {"train_loss": -7.1687726974487305, "global_step": 177760, "epoch": 4232} {"train_loss": -7.001178741455078, "global_step": 177761, "epoch": 4232} {"train_loss": -7.102777481079102, "global_step": 177762, "epoch": 4232} {"train_loss": -7.076934337615967, "global_step": 177763, "epoch": 4232} {"train_loss": -7.02818489074707, "global_step": 177764, "epoch": 4232} {"train_loss": -7.022360801696777, "global_step": 177765, "epoch": 4232} {"train_loss": -7.1586809158325195, "global_step": 177766, "epoch": 4232} {"train_loss": -6.938760280609131, "global_step": 177767, "epoch": 4232} {"train_loss": -6.997653961181641, "global_step": 177768, "epoch": 4232} {"train_loss": -7.254175186157227, "global_step": 177769, "epoch": 4232} {"train_loss": -6.953446388244629, "global_step": 177770, "epoch": 4232} {"train_loss": -7.122056007385254, "global_step": 177771, "epoch": 4232} {"train_loss": -7.139366149902344, "global_step": 177772, "epoch": 4232} {"train_loss": -7.0773234367370605, "global_step": 177773, "epoch": 4232} {"train_loss": -7.131437301635742, "global_step": 177774, "epoch": 4232} {"train_loss": -7.161111831665039, "global_step": 177775, "epoch": 4232} {"train_loss": -6.968339443206787, "global_step": 177776, "epoch": 4232} {"train_loss": -7.04567813873291, "global_step": 177777, "epoch": 4232} {"train_loss": -6.983196258544922, "global_step": 177778, "epoch": 4232} {"train_loss": -7.028876781463623, "global_step": 177779, "epoch": 4232} {"train_loss": -7.278125286102295, "global_step": 177780, "epoch": 4232} {"train_loss": -7.076184272766113, "global_step": 177781, "epoch": 4232} {"train_loss": -7.119381904602051, "global_step": 177782, "epoch": 4232} {"train_loss": -7.148155212402344, "global_step": 177783, "epoch": 4232} {"train_loss": -6.973064422607422, "global_step": 177784, "epoch": 4232} {"train_loss": -7.100026119323004, "global_step": 177785, "epoch": 4232, "val_loss": 69238.1484375} {"train_loss": -7.169695854187012, "global_step": 177786, "epoch": 4233} {"train_loss": -7.205398082733154, "global_step": 177787, "epoch": 4233} {"train_loss": -7.141853332519531, "global_step": 177788, "epoch": 4233} {"train_loss": -7.158125877380371, "global_step": 177789, "epoch": 4233} {"train_loss": -7.090506553649902, "global_step": 177790, "epoch": 4233} {"train_loss": -7.122557640075684, "global_step": 177791, "epoch": 4233} {"train_loss": -7.068090438842773, "global_step": 177792, "epoch": 4233} {"train_loss": -7.194229602813721, "global_step": 177793, "epoch": 4233} {"train_loss": -7.093070983886719, "global_step": 177794, "epoch": 4233} {"train_loss": -7.2223052978515625, "global_step": 177795, "epoch": 4233} {"train_loss": -7.151866912841797, "global_step": 177796, "epoch": 4233} {"train_loss": -7.182048797607422, "global_step": 177797, "epoch": 4233} {"train_loss": -7.049144744873047, "global_step": 177798, "epoch": 4233} {"train_loss": -7.218224048614502, "global_step": 177799, "epoch": 4233} {"train_loss": -7.11082649230957, "global_step": 177800, "epoch": 4233} {"train_loss": -7.148571491241455, "global_step": 177801, "epoch": 4233} {"train_loss": -7.250711917877197, "global_step": 177802, "epoch": 4233} {"train_loss": -7.124879837036133, "global_step": 177803, "epoch": 4233} {"train_loss": -7.193315505981445, "global_step": 177804, "epoch": 4233} {"train_loss": -7.1245341300964355, "global_step": 177805, "epoch": 4233} {"train_loss": -7.048010349273682, "global_step": 177806, "epoch": 4233} {"train_loss": -7.211391448974609, "global_step": 177807, "epoch": 4233} {"train_loss": -7.1453328132629395, "global_step": 177808, "epoch": 4233} {"train_loss": -7.104062080383301, "global_step": 177809, "epoch": 4233} {"train_loss": -7.238747596740723, "global_step": 177810, "epoch": 4233} {"train_loss": -7.110677242279053, "global_step": 177811, "epoch": 4233} {"train_loss": -7.116720199584961, "global_step": 177812, "epoch": 4233} {"train_loss": -7.1181321144104, "global_step": 177813, "epoch": 4233} {"train_loss": -6.991590976715088, "global_step": 177814, "epoch": 4233} {"train_loss": -7.029815673828125, "global_step": 177815, "epoch": 4233} {"train_loss": -7.078683853149414, "global_step": 177816, "epoch": 4233} {"train_loss": -7.061995506286621, "global_step": 177817, "epoch": 4233} {"train_loss": -7.215339660644531, "global_step": 177818, "epoch": 4233} {"train_loss": -6.956504821777344, "global_step": 177819, "epoch": 4233} {"train_loss": -7.098067283630371, "global_step": 177820, "epoch": 4233} {"train_loss": -7.015412330627441, "global_step": 177821, "epoch": 4233} {"train_loss": -7.033505439758301, "global_step": 177822, "epoch": 4233} {"train_loss": -7.154419898986816, "global_step": 177823, "epoch": 4233} {"train_loss": -7.015519142150879, "global_step": 177824, "epoch": 4233} {"train_loss": -7.1474223136901855, "global_step": 177825, "epoch": 4233} {"train_loss": -7.117454528808594, "global_step": 177826, "epoch": 4233} {"train_loss": -7.122651406696865, "global_step": 177827, "epoch": 4233, "val_loss": 69161.921875} {"train_loss": -7.065293788909912, "global_step": 177828, "epoch": 4234} {"train_loss": -7.147319316864014, "global_step": 177829, "epoch": 4234} {"train_loss": -7.020235538482666, "global_step": 177830, "epoch": 4234} {"train_loss": -7.065518856048584, "global_step": 177831, "epoch": 4234} {"train_loss": -7.216815948486328, "global_step": 177832, "epoch": 4234} {"train_loss": -7.0156097412109375, "global_step": 177833, "epoch": 4234} {"train_loss": -7.062355995178223, "global_step": 177834, "epoch": 4234} {"train_loss": -7.223304748535156, "global_step": 177835, "epoch": 4234} {"train_loss": -7.108186721801758, "global_step": 177836, "epoch": 4234} {"train_loss": -7.119420051574707, "global_step": 177837, "epoch": 4234} {"train_loss": -7.096222877502441, "global_step": 177838, "epoch": 4234} {"train_loss": -7.184240341186523, "global_step": 177839, "epoch": 4234} {"train_loss": -7.09346866607666, "global_step": 177840, "epoch": 4234} {"train_loss": -7.057633876800537, "global_step": 177841, "epoch": 4234} {"train_loss": -7.217124938964844, "global_step": 177842, "epoch": 4234} {"train_loss": -7.297719478607178, "global_step": 177843, "epoch": 4234} {"train_loss": -7.14683198928833, "global_step": 177844, "epoch": 4234} {"train_loss": -7.218102931976318, "global_step": 177845, "epoch": 4234} {"train_loss": -7.109018325805664, "global_step": 177846, "epoch": 4234} {"train_loss": -7.108325004577637, "global_step": 177847, "epoch": 4234} {"train_loss": -7.180255889892578, "global_step": 177848, "epoch": 4234} {"train_loss": -7.063971519470215, "global_step": 177849, "epoch": 4234} {"train_loss": -7.061593532562256, "global_step": 177850, "epoch": 4234} {"train_loss": -7.065618515014648, "global_step": 177851, "epoch": 4234} {"train_loss": -7.025979518890381, "global_step": 177852, "epoch": 4234} {"train_loss": -7.0245280265808105, "global_step": 177853, "epoch": 4234} {"train_loss": -7.022477626800537, "global_step": 177854, "epoch": 4234} {"train_loss": -7.106293678283691, "global_step": 177855, "epoch": 4234} {"train_loss": -7.069159030914307, "global_step": 177856, "epoch": 4234} {"train_loss": -7.038805961608887, "global_step": 177857, "epoch": 4234} {"train_loss": -7.073894023895264, "global_step": 177858, "epoch": 4234} {"train_loss": -7.067112922668457, "global_step": 177859, "epoch": 4234} {"train_loss": -7.06525182723999, "global_step": 177860, "epoch": 4234} {"train_loss": -7.070661544799805, "global_step": 177861, "epoch": 4234} {"train_loss": -7.044849872589111, "global_step": 177862, "epoch": 4234} {"train_loss": -7.078806400299072, "global_step": 177863, "epoch": 4234} {"train_loss": -7.0848493576049805, "global_step": 177864, "epoch": 4234} {"train_loss": -7.141977787017822, "global_step": 177865, "epoch": 4234} {"train_loss": -7.054024696350098, "global_step": 177866, "epoch": 4234} {"train_loss": -7.163840293884277, "global_step": 177867, "epoch": 4234} {"train_loss": -7.214899063110352, "global_step": 177868, "epoch": 4234} {"train_loss": -7.103284279505412, "global_step": 177869, "epoch": 4234, "val_loss": 69253.2421875} {"train_loss": -7.119479179382324, "global_step": 177870, "epoch": 4235} {"train_loss": -7.039643287658691, "global_step": 177871, "epoch": 4235} {"train_loss": -7.06532096862793, "global_step": 177872, "epoch": 4235} {"train_loss": -7.023900032043457, "global_step": 177873, "epoch": 4235} {"train_loss": -7.074385166168213, "global_step": 177874, "epoch": 4235} {"train_loss": -7.022946834564209, "global_step": 177875, "epoch": 4235} {"train_loss": -7.006427764892578, "global_step": 177876, "epoch": 4235} {"train_loss": -7.067694664001465, "global_step": 177877, "epoch": 4235} {"train_loss": -6.960415840148926, "global_step": 177878, "epoch": 4235} {"train_loss": -7.0272722244262695, "global_step": 177879, "epoch": 4235} {"train_loss": -6.974634170532227, "global_step": 177880, "epoch": 4235} {"train_loss": -6.953869819641113, "global_step": 177881, "epoch": 4235} {"train_loss": -7.012720108032227, "global_step": 177882, "epoch": 4235} {"train_loss": -6.91752815246582, "global_step": 177883, "epoch": 4235} {"train_loss": -7.035876274108887, "global_step": 177884, "epoch": 4235} {"train_loss": -7.0071001052856445, "global_step": 177885, "epoch": 4235} {"train_loss": -7.039087772369385, "global_step": 177886, "epoch": 4235} {"train_loss": -7.0713090896606445, "global_step": 177887, "epoch": 4235} {"train_loss": -7.028641700744629, "global_step": 177888, "epoch": 4235} {"train_loss": -7.057068824768066, "global_step": 177889, "epoch": 4235} {"train_loss": -7.0372748374938965, "global_step": 177890, "epoch": 4235} {"train_loss": -7.090586185455322, "global_step": 177891, "epoch": 4235} {"train_loss": -7.046950340270996, "global_step": 177892, "epoch": 4235} {"train_loss": -7.179378986358643, "global_step": 177893, "epoch": 4235} {"train_loss": -7.053124904632568, "global_step": 177894, "epoch": 4235} {"train_loss": -7.097017288208008, "global_step": 177895, "epoch": 4235} {"train_loss": -7.157068252563477, "global_step": 177896, "epoch": 4235} {"train_loss": -7.1330485343933105, "global_step": 177897, "epoch": 4235} {"train_loss": -7.129334449768066, "global_step": 177898, "epoch": 4235} {"train_loss": -7.032620906829834, "global_step": 177899, "epoch": 4235} {"train_loss": -7.0240068435668945, "global_step": 177900, "epoch": 4235} {"train_loss": -7.038913249969482, "global_step": 177901, "epoch": 4235} {"train_loss": -7.0430006980896, "global_step": 177902, "epoch": 4235} {"train_loss": -6.993622779846191, "global_step": 177903, "epoch": 4235} {"train_loss": -7.164223670959473, "global_step": 177904, "epoch": 4235} {"train_loss": -7.036513328552246, "global_step": 177905, "epoch": 4235} {"train_loss": -7.013130187988281, "global_step": 177906, "epoch": 4235} {"train_loss": -7.110103130340576, "global_step": 177907, "epoch": 4235} {"train_loss": -7.015824317932129, "global_step": 177908, "epoch": 4235} {"train_loss": -7.042068004608154, "global_step": 177909, "epoch": 4235} {"train_loss": -6.991091728210449, "global_step": 177910, "epoch": 4235} {"train_loss": -7.0472228072938465, "global_step": 177911, "epoch": 4235, "val_loss": 69225.2109375} {"train_loss": -7.016201972961426, "global_step": 177912, "epoch": 4236} {"train_loss": -6.997351169586182, "global_step": 177913, "epoch": 4236} {"train_loss": -7.020730495452881, "global_step": 177914, "epoch": 4236} {"train_loss": -7.06070613861084, "global_step": 177915, "epoch": 4236} {"train_loss": -7.105145454406738, "global_step": 177916, "epoch": 4236} {"train_loss": -7.126270294189453, "global_step": 177917, "epoch": 4236} {"train_loss": -7.0690484046936035, "global_step": 177918, "epoch": 4236} {"train_loss": -7.119897842407227, "global_step": 177919, "epoch": 4236} {"train_loss": -7.186897277832031, "global_step": 177920, "epoch": 4236} {"train_loss": -7.125738143920898, "global_step": 177921, "epoch": 4236} {"train_loss": -7.159416198730469, "global_step": 177922, "epoch": 4236} {"train_loss": -7.1219353675842285, "global_step": 177923, "epoch": 4236} {"train_loss": -7.106743812561035, "global_step": 177924, "epoch": 4236} {"train_loss": -7.056090354919434, "global_step": 177925, "epoch": 4236} {"train_loss": -7.159286022186279, "global_step": 177926, "epoch": 4236} {"train_loss": -7.237941265106201, "global_step": 177927, "epoch": 4236} {"train_loss": -7.133856296539307, "global_step": 177928, "epoch": 4236} {"train_loss": -7.162038803100586, "global_step": 177929, "epoch": 4236} {"train_loss": -7.043248176574707, "global_step": 177930, "epoch": 4236} {"train_loss": -7.215169906616211, "global_step": 177931, "epoch": 4236} {"train_loss": -7.148727893829346, "global_step": 177932, "epoch": 4236} {"train_loss": -7.073670387268066, "global_step": 177933, "epoch": 4236} {"train_loss": -7.089288234710693, "global_step": 177934, "epoch": 4236} {"train_loss": -7.106269836425781, "global_step": 177935, "epoch": 4236} {"train_loss": -7.0288190841674805, "global_step": 177936, "epoch": 4236} {"train_loss": -7.1212029457092285, "global_step": 177937, "epoch": 4236} {"train_loss": -7.043041706085205, "global_step": 177938, "epoch": 4236} {"train_loss": -7.170398712158203, "global_step": 177939, "epoch": 4236} {"train_loss": -7.142309665679932, "global_step": 177940, "epoch": 4236} {"train_loss": -7.083070278167725, "global_step": 177941, "epoch": 4236} {"train_loss": -7.022319316864014, "global_step": 177942, "epoch": 4236} {"train_loss": -7.113480567932129, "global_step": 177943, "epoch": 4236} {"train_loss": -7.1041412353515625, "global_step": 177944, "epoch": 4236} {"train_loss": -7.12273645401001, "global_step": 177945, "epoch": 4236} {"train_loss": -7.045773506164551, "global_step": 177946, "epoch": 4236} {"train_loss": -7.040037155151367, "global_step": 177947, "epoch": 4236} {"train_loss": -7.108616352081299, "global_step": 177948, "epoch": 4236} {"train_loss": -7.1878662109375, "global_step": 177949, "epoch": 4236} {"train_loss": -7.158980846405029, "global_step": 177950, "epoch": 4236} {"train_loss": -7.071247100830078, "global_step": 177951, "epoch": 4236} {"train_loss": -7.073266983032227, "global_step": 177952, "epoch": 4236} {"train_loss": -7.105151653289795, "global_step": 177953, "epoch": 4236, "val_loss": 69285.1484375} {"train_loss": -7.0715012550354, "global_step": 177954, "epoch": 4237} {"train_loss": -7.0078864097595215, "global_step": 177955, "epoch": 4237} {"train_loss": -7.024544715881348, "global_step": 177956, "epoch": 4237} {"train_loss": -7.126171112060547, "global_step": 177957, "epoch": 4237} {"train_loss": -7.128686428070068, "global_step": 177958, "epoch": 4237} {"train_loss": -7.100811004638672, "global_step": 177959, "epoch": 4237} {"train_loss": -7.122561454772949, "global_step": 177960, "epoch": 4237} {"train_loss": -7.116479396820068, "global_step": 177961, "epoch": 4237} {"train_loss": -7.191458225250244, "global_step": 177962, "epoch": 4237} {"train_loss": -7.118449687957764, "global_step": 177963, "epoch": 4237} {"train_loss": -7.144569396972656, "global_step": 177964, "epoch": 4237} {"train_loss": -7.176956653594971, "global_step": 177965, "epoch": 4237} {"train_loss": -7.236692905426025, "global_step": 177966, "epoch": 4237} {"train_loss": -7.00272798538208, "global_step": 177967, "epoch": 4237} {"train_loss": -7.100543975830078, "global_step": 177968, "epoch": 4237} {"train_loss": -7.176095962524414, "global_step": 177969, "epoch": 4237} {"train_loss": -7.04721736907959, "global_step": 177970, "epoch": 4237} {"train_loss": -7.092190742492676, "global_step": 177971, "epoch": 4237} {"train_loss": -7.043622970581055, "global_step": 177972, "epoch": 4237} {"train_loss": -7.107479572296143, "global_step": 177973, "epoch": 4237} {"train_loss": -7.054210186004639, "global_step": 177974, "epoch": 4237} {"train_loss": -7.153616428375244, "global_step": 177975, "epoch": 4237} {"train_loss": -7.099380016326904, "global_step": 177976, "epoch": 4237} {"train_loss": -7.118273735046387, "global_step": 177977, "epoch": 4237} {"train_loss": -6.986189365386963, "global_step": 177978, "epoch": 4237} {"train_loss": -7.154436111450195, "global_step": 177979, "epoch": 4237} {"train_loss": -7.096607685089111, "global_step": 177980, "epoch": 4237} {"train_loss": -7.173371315002441, "global_step": 177981, "epoch": 4237} {"train_loss": -7.059207916259766, "global_step": 177982, "epoch": 4237} {"train_loss": -7.147579669952393, "global_step": 177983, "epoch": 4237} {"train_loss": -7.2037506103515625, "global_step": 177984, "epoch": 4237} {"train_loss": -7.115149974822998, "global_step": 177985, "epoch": 4237} {"train_loss": -7.159066200256348, "global_step": 177986, "epoch": 4237} {"train_loss": -7.162215232849121, "global_step": 177987, "epoch": 4237} {"train_loss": -7.206570625305176, "global_step": 177988, "epoch": 4237} {"train_loss": -7.170504570007324, "global_step": 177989, "epoch": 4237} {"train_loss": -7.1797404289245605, "global_step": 177990, "epoch": 4237} {"train_loss": -7.07523250579834, "global_step": 177991, "epoch": 4237} {"train_loss": -7.221047878265381, "global_step": 177992, "epoch": 4237} {"train_loss": -7.238674163818359, "global_step": 177993, "epoch": 4237} {"train_loss": -7.2173261642456055, "global_step": 177994, "epoch": 4237} {"train_loss": -7.122760761351812, "global_step": 177995, "epoch": 4237, "val_loss": 69166.8046875} {"train_loss": -7.1541900634765625, "global_step": 177996, "epoch": 4238} {"train_loss": -7.153388977050781, "global_step": 177997, "epoch": 4238} {"train_loss": -7.2004899978637695, "global_step": 177998, "epoch": 4238} {"train_loss": -7.20467472076416, "global_step": 177999, "epoch": 4238} {"train_loss": -7.1550517082214355, "global_step": 178000, "epoch": 4238} {"train_loss": -7.113348484039307, "global_step": 178001, "epoch": 4238} {"train_loss": -6.979290008544922, "global_step": 178002, "epoch": 4238} {"train_loss": -7.062125205993652, "global_step": 178003, "epoch": 4238} {"train_loss": -7.108748912811279, "global_step": 178004, "epoch": 4238} {"train_loss": -6.991487503051758, "global_step": 178005, "epoch": 4238} {"train_loss": -7.062297821044922, "global_step": 178006, "epoch": 4238} {"train_loss": -7.067708969116211, "global_step": 178007, "epoch": 4238} {"train_loss": -6.986220836639404, "global_step": 178008, "epoch": 4238} {"train_loss": -6.905580520629883, "global_step": 178009, "epoch": 4238} {"train_loss": -7.0643205642700195, "global_step": 178010, "epoch": 4238} {"train_loss": -7.077253341674805, "global_step": 178011, "epoch": 4238} {"train_loss": -7.179003715515137, "global_step": 178012, "epoch": 4238} {"train_loss": -7.157495975494385, "global_step": 178013, "epoch": 4238} {"train_loss": -7.056872367858887, "global_step": 178014, "epoch": 4238} {"train_loss": -7.159493923187256, "global_step": 178015, "epoch": 4238} {"train_loss": -7.039784908294678, "global_step": 178016, "epoch": 4238} {"train_loss": -7.067751884460449, "global_step": 178017, "epoch": 4238} {"train_loss": -7.116174697875977, "global_step": 178018, "epoch": 4238} {"train_loss": -7.064988136291504, "global_step": 178019, "epoch": 4238} {"train_loss": -7.131215572357178, "global_step": 178020, "epoch": 4238} {"train_loss": -7.124752998352051, "global_step": 178021, "epoch": 4238} {"train_loss": -7.140541076660156, "global_step": 178022, "epoch": 4238} {"train_loss": -7.089857578277588, "global_step": 178023, "epoch": 4238} {"train_loss": -7.087015628814697, "global_step": 178024, "epoch": 4238} {"train_loss": -7.117912769317627, "global_step": 178025, "epoch": 4238} {"train_loss": -7.050214767456055, "global_step": 178026, "epoch": 4238} {"train_loss": -7.1125993728637695, "global_step": 178027, "epoch": 4238} {"train_loss": -7.126587390899658, "global_step": 178028, "epoch": 4238} {"train_loss": -7.1438398361206055, "global_step": 178029, "epoch": 4238} {"train_loss": -7.101738929748535, "global_step": 178030, "epoch": 4238} {"train_loss": -7.17179536819458, "global_step": 178031, "epoch": 4238} {"train_loss": -7.167610168457031, "global_step": 178032, "epoch": 4238} {"train_loss": -7.163078784942627, "global_step": 178033, "epoch": 4238} {"train_loss": -7.111918926239014, "global_step": 178034, "epoch": 4238} {"train_loss": -7.114014625549316, "global_step": 178035, "epoch": 4238} {"train_loss": -7.176616668701172, "global_step": 178036, "epoch": 4238} {"train_loss": -7.105025507154918, "global_step": 178037, "epoch": 4238, "val_loss": 69272.1875} {"train_loss": -7.153172969818115, "global_step": 178038, "epoch": 4239} {"train_loss": -7.221047878265381, "global_step": 178039, "epoch": 4239} {"train_loss": -7.0822062492370605, "global_step": 178040, "epoch": 4239} {"train_loss": -7.166772842407227, "global_step": 178041, "epoch": 4239} {"train_loss": -7.17477560043335, "global_step": 178042, "epoch": 4239} {"train_loss": -7.23326301574707, "global_step": 178043, "epoch": 4239} {"train_loss": -7.052659034729004, "global_step": 178044, "epoch": 4239} {"train_loss": -7.170105457305908, "global_step": 178045, "epoch": 4239} {"train_loss": -7.121703624725342, "global_step": 178046, "epoch": 4239} {"train_loss": -7.2352118492126465, "global_step": 178047, "epoch": 4239} {"train_loss": -7.196594715118408, "global_step": 178048, "epoch": 4239} {"train_loss": -7.139019966125488, "global_step": 178049, "epoch": 4239} {"train_loss": -7.180515766143799, "global_step": 178050, "epoch": 4239} {"train_loss": -7.099071502685547, "global_step": 178051, "epoch": 4239} {"train_loss": -7.073345184326172, "global_step": 178052, "epoch": 4239} {"train_loss": -7.155559539794922, "global_step": 178053, "epoch": 4239} {"train_loss": -7.090510368347168, "global_step": 178054, "epoch": 4239} {"train_loss": -7.065540313720703, "global_step": 178055, "epoch": 4239} {"train_loss": -7.011777877807617, "global_step": 178056, "epoch": 4239} {"train_loss": -7.170469284057617, "global_step": 178057, "epoch": 4239} {"train_loss": -7.071457386016846, "global_step": 178058, "epoch": 4239} {"train_loss": -6.929414749145508, "global_step": 178059, "epoch": 4239} {"train_loss": -7.195441722869873, "global_step": 178060, "epoch": 4239} {"train_loss": -6.989539623260498, "global_step": 178061, "epoch": 4239} {"train_loss": -6.916940689086914, "global_step": 178062, "epoch": 4239} {"train_loss": -7.115556716918945, "global_step": 178063, "epoch": 4239} {"train_loss": -6.946002960205078, "global_step": 178064, "epoch": 4239} {"train_loss": -7.056494235992432, "global_step": 178065, "epoch": 4239} {"train_loss": -6.949432373046875, "global_step": 178066, "epoch": 4239} {"train_loss": -6.816120147705078, "global_step": 178067, "epoch": 4239} {"train_loss": -7.083597183227539, "global_step": 178068, "epoch": 4239} {"train_loss": -6.929032325744629, "global_step": 178069, "epoch": 4239} {"train_loss": -7.010010719299316, "global_step": 178070, "epoch": 4239} {"train_loss": -7.010148048400879, "global_step": 178071, "epoch": 4239} {"train_loss": -6.992617607116699, "global_step": 178072, "epoch": 4239} {"train_loss": -6.914515018463135, "global_step": 178073, "epoch": 4239} {"train_loss": -7.111690044403076, "global_step": 178074, "epoch": 4239} {"train_loss": -6.858546257019043, "global_step": 178075, "epoch": 4239} {"train_loss": -6.957313537597656, "global_step": 178076, "epoch": 4239} {"train_loss": -6.914623260498047, "global_step": 178077, "epoch": 4239} {"train_loss": -6.934568405151367, "global_step": 178078, "epoch": 4239} {"train_loss": -7.060144197373163, "global_step": 178079, "epoch": 4239, "val_loss": 69305.9765625} {"train_loss": -6.970916748046875, "global_step": 178080, "epoch": 4240} {"train_loss": -7.095623970031738, "global_step": 178081, "epoch": 4240} {"train_loss": -6.881191730499268, "global_step": 178082, "epoch": 4240} {"train_loss": -7.048953056335449, "global_step": 178083, "epoch": 4240} {"train_loss": -6.967869758605957, "global_step": 178084, "epoch": 4240} {"train_loss": -7.038874626159668, "global_step": 178085, "epoch": 4240} {"train_loss": -7.017520904541016, "global_step": 178086, "epoch": 4240} {"train_loss": -7.103762149810791, "global_step": 178087, "epoch": 4240} {"train_loss": -7.031674385070801, "global_step": 178088, "epoch": 4240} {"train_loss": -7.015546798706055, "global_step": 178089, "epoch": 4240} {"train_loss": -7.125028610229492, "global_step": 178090, "epoch": 4240} {"train_loss": -6.976884365081787, "global_step": 178091, "epoch": 4240} {"train_loss": -7.116787910461426, "global_step": 178092, "epoch": 4240} {"train_loss": -7.066653251647949, "global_step": 178093, "epoch": 4240} {"train_loss": -7.107836723327637, "global_step": 178094, "epoch": 4240} {"train_loss": -7.022161483764648, "global_step": 178095, "epoch": 4240} {"train_loss": -7.203680515289307, "global_step": 178096, "epoch": 4240} {"train_loss": -7.118744850158691, "global_step": 178097, "epoch": 4240} {"train_loss": -7.162806034088135, "global_step": 178098, "epoch": 4240} {"train_loss": -7.22287654876709, "global_step": 178099, "epoch": 4240} {"train_loss": -7.227241039276123, "global_step": 178100, "epoch": 4240} {"train_loss": -7.129968643188477, "global_step": 178101, "epoch": 4240} {"train_loss": -7.0063157081604, "global_step": 178102, "epoch": 4240} {"train_loss": -7.156859874725342, "global_step": 178103, "epoch": 4240} {"train_loss": -7.091195106506348, "global_step": 178104, "epoch": 4240} {"train_loss": -7.029144287109375, "global_step": 178105, "epoch": 4240} {"train_loss": -7.149216651916504, "global_step": 178106, "epoch": 4240} {"train_loss": -7.147149085998535, "global_step": 178107, "epoch": 4240} {"train_loss": -7.08595085144043, "global_step": 178108, "epoch": 4240} {"train_loss": -7.170279502868652, "global_step": 178109, "epoch": 4240} {"train_loss": -7.1308770179748535, "global_step": 178110, "epoch": 4240} {"train_loss": -7.17100715637207, "global_step": 178111, "epoch": 4240} {"train_loss": -7.108654022216797, "global_step": 178112, "epoch": 4240} {"train_loss": -7.134149074554443, "global_step": 178113, "epoch": 4240} {"train_loss": -7.241580963134766, "global_step": 178114, "epoch": 4240} {"train_loss": -7.240477561950684, "global_step": 178115, "epoch": 4240} {"train_loss": -7.138305187225342, "global_step": 178116, "epoch": 4240} {"train_loss": -7.043397903442383, "global_step": 178117, "epoch": 4240} {"train_loss": -7.092820167541504, "global_step": 178118, "epoch": 4240} {"train_loss": -7.248582363128662, "global_step": 178119, "epoch": 4240} {"train_loss": -7.155613899230957, "global_step": 178120, "epoch": 4240} {"train_loss": -7.10311348097665, "global_step": 178121, "epoch": 4240, "val_loss": 69221.3203125} {"train_loss": -7.19844388961792, "global_step": 178122, "epoch": 4241} {"train_loss": -6.953199863433838, "global_step": 178123, "epoch": 4241} {"train_loss": -7.171272277832031, "global_step": 178124, "epoch": 4241} {"train_loss": -7.103952407836914, "global_step": 178125, "epoch": 4241} {"train_loss": -6.9756693840026855, "global_step": 178126, "epoch": 4241} {"train_loss": -7.076158046722412, "global_step": 178127, "epoch": 4241} {"train_loss": -7.113912582397461, "global_step": 178128, "epoch": 4241} {"train_loss": -7.0829973220825195, "global_step": 178129, "epoch": 4241} {"train_loss": -7.08143424987793, "global_step": 178130, "epoch": 4241} {"train_loss": -7.139403343200684, "global_step": 178131, "epoch": 4241} {"train_loss": -7.122828483581543, "global_step": 178132, "epoch": 4241} {"train_loss": -7.080667495727539, "global_step": 178133, "epoch": 4241} {"train_loss": -7.138799667358398, "global_step": 178134, "epoch": 4241} {"train_loss": -7.107877254486084, "global_step": 178135, "epoch": 4241} {"train_loss": -7.004000663757324, "global_step": 178136, "epoch": 4241} {"train_loss": -7.067959785461426, "global_step": 178137, "epoch": 4241} {"train_loss": -7.084165573120117, "global_step": 178138, "epoch": 4241} {"train_loss": -6.985761642456055, "global_step": 178139, "epoch": 4241} {"train_loss": -7.1371684074401855, "global_step": 178140, "epoch": 4241} {"train_loss": -6.927970886230469, "global_step": 178141, "epoch": 4241} {"train_loss": -7.076828956604004, "global_step": 178142, "epoch": 4241} {"train_loss": -7.148073196411133, "global_step": 178143, "epoch": 4241} {"train_loss": -7.0174102783203125, "global_step": 178144, "epoch": 4241} {"train_loss": -6.9836812019348145, "global_step": 178145, "epoch": 4241} {"train_loss": -7.177450180053711, "global_step": 178146, "epoch": 4241} {"train_loss": -6.974301815032959, "global_step": 178147, "epoch": 4241} {"train_loss": -6.973980903625488, "global_step": 178148, "epoch": 4241} {"train_loss": -7.118701934814453, "global_step": 178149, "epoch": 4241} {"train_loss": -7.072614669799805, "global_step": 178150, "epoch": 4241} {"train_loss": -6.985358238220215, "global_step": 178151, "epoch": 4241} {"train_loss": -7.073814392089844, "global_step": 178152, "epoch": 4241} {"train_loss": -6.964071750640869, "global_step": 178153, "epoch": 4241} {"train_loss": -7.096613883972168, "global_step": 178154, "epoch": 4241} {"train_loss": -7.040189266204834, "global_step": 178155, "epoch": 4241} {"train_loss": -6.98496150970459, "global_step": 178156, "epoch": 4241} {"train_loss": -7.020374774932861, "global_step": 178157, "epoch": 4241} {"train_loss": -7.008311748504639, "global_step": 178158, "epoch": 4241} {"train_loss": -7.057417869567871, "global_step": 178159, "epoch": 4241} {"train_loss": -6.9713134765625, "global_step": 178160, "epoch": 4241} {"train_loss": -6.992112636566162, "global_step": 178161, "epoch": 4241} {"train_loss": -6.97995662689209, "global_step": 178162, "epoch": 4241} {"train_loss": -7.053734654471988, "global_step": 178163, "epoch": 4241, "val_loss": 69220.7578125} {"train_loss": -7.03754997253418, "global_step": 178164, "epoch": 4242} {"train_loss": -6.900060653686523, "global_step": 178165, "epoch": 4242} {"train_loss": -7.040195465087891, "global_step": 178166, "epoch": 4242} {"train_loss": -7.053934097290039, "global_step": 178167, "epoch": 4242} {"train_loss": -7.060452938079834, "global_step": 178168, "epoch": 4242} {"train_loss": -6.950983047485352, "global_step": 178169, "epoch": 4242} {"train_loss": -7.076343536376953, "global_step": 178170, "epoch": 4242} {"train_loss": -6.889002323150635, "global_step": 178171, "epoch": 4242} {"train_loss": -7.014466762542725, "global_step": 178172, "epoch": 4242} {"train_loss": -6.915104866027832, "global_step": 178173, "epoch": 4242} {"train_loss": -7.07526969909668, "global_step": 178174, "epoch": 4242} {"train_loss": -7.121798038482666, "global_step": 178175, "epoch": 4242} {"train_loss": -7.107083797454834, "global_step": 178176, "epoch": 4242} {"train_loss": -7.112090110778809, "global_step": 178177, "epoch": 4242} {"train_loss": -7.062349796295166, "global_step": 178178, "epoch": 4242} {"train_loss": -7.15769100189209, "global_step": 178179, "epoch": 4242} {"train_loss": -7.155619144439697, "global_step": 178180, "epoch": 4242} {"train_loss": -7.114339828491211, "global_step": 178181, "epoch": 4242} {"train_loss": -7.106832504272461, "global_step": 178182, "epoch": 4242} {"train_loss": -7.13566255569458, "global_step": 178183, "epoch": 4242} {"train_loss": -7.119397163391113, "global_step": 178184, "epoch": 4242} {"train_loss": -7.1329665184021, "global_step": 178185, "epoch": 4242} {"train_loss": -7.149853706359863, "global_step": 178186, "epoch": 4242} {"train_loss": -7.12846565246582, "global_step": 178187, "epoch": 4242} {"train_loss": -7.102972984313965, "global_step": 178188, "epoch": 4242} {"train_loss": -7.050826549530029, "global_step": 178189, "epoch": 4242} {"train_loss": -7.106634616851807, "global_step": 178190, "epoch": 4242} {"train_loss": -7.048027038574219, "global_step": 178191, "epoch": 4242} {"train_loss": -7.113516330718994, "global_step": 178192, "epoch": 4242} {"train_loss": -7.077971935272217, "global_step": 178193, "epoch": 4242} {"train_loss": -7.057574272155762, "global_step": 178194, "epoch": 4242} {"train_loss": -7.146487236022949, "global_step": 178195, "epoch": 4242} {"train_loss": -6.931427001953125, "global_step": 178196, "epoch": 4242} {"train_loss": -7.180596351623535, "global_step": 178197, "epoch": 4242} {"train_loss": -7.021354675292969, "global_step": 178198, "epoch": 4242} {"train_loss": -7.0091729164123535, "global_step": 178199, "epoch": 4242} {"train_loss": -7.06978702545166, "global_step": 178200, "epoch": 4242} {"train_loss": -7.1336493492126465, "global_step": 178201, "epoch": 4242} {"train_loss": -7.158291816711426, "global_step": 178202, "epoch": 4242} {"train_loss": -7.123723030090332, "global_step": 178203, "epoch": 4242} {"train_loss": -7.126453399658203, "global_step": 178204, "epoch": 4242} {"train_loss": -7.07451655751183, "global_step": 178205, "epoch": 4242, "val_loss": 68995.3671875} {"train_loss": -7.156240463256836, "global_step": 178206, "epoch": 4243} {"train_loss": -7.1950860023498535, "global_step": 178207, "epoch": 4243} {"train_loss": -7.195927619934082, "global_step": 178208, "epoch": 4243} {"train_loss": -7.188056945800781, "global_step": 178209, "epoch": 4243} {"train_loss": -7.200551986694336, "global_step": 178210, "epoch": 4243} {"train_loss": -7.162190914154053, "global_step": 178211, "epoch": 4243} {"train_loss": -7.083432197570801, "global_step": 178212, "epoch": 4243} {"train_loss": -7.155519008636475, "global_step": 178213, "epoch": 4243} {"train_loss": -7.098893165588379, "global_step": 178214, "epoch": 4243} {"train_loss": -7.053442478179932, "global_step": 178215, "epoch": 4243} {"train_loss": -7.047067165374756, "global_step": 178216, "epoch": 4243} {"train_loss": -7.137938499450684, "global_step": 178217, "epoch": 4243} {"train_loss": -7.168753623962402, "global_step": 178218, "epoch": 4243} {"train_loss": -7.076761245727539, "global_step": 178219, "epoch": 4243} {"train_loss": -7.009139060974121, "global_step": 178220, "epoch": 4243} {"train_loss": -7.027848720550537, "global_step": 178221, "epoch": 4243} {"train_loss": -7.180476665496826, "global_step": 178222, "epoch": 4243} {"train_loss": -7.069606781005859, "global_step": 178223, "epoch": 4243} {"train_loss": -7.090088844299316, "global_step": 178224, "epoch": 4243} {"train_loss": -7.180246353149414, "global_step": 178225, "epoch": 4243} {"train_loss": -6.975171089172363, "global_step": 178226, "epoch": 4243} {"train_loss": -7.117000579833984, "global_step": 178227, "epoch": 4243} {"train_loss": -7.119709491729736, "global_step": 178228, "epoch": 4243} {"train_loss": -7.094846725463867, "global_step": 178229, "epoch": 4243} {"train_loss": -7.039628982543945, "global_step": 178230, "epoch": 4243} {"train_loss": -7.015655517578125, "global_step": 178231, "epoch": 4243} {"train_loss": -7.044620990753174, "global_step": 178232, "epoch": 4243} {"train_loss": -6.979345321655273, "global_step": 178233, "epoch": 4243} {"train_loss": -7.063873291015625, "global_step": 178234, "epoch": 4243} {"train_loss": -7.026913166046143, "global_step": 178235, "epoch": 4243} {"train_loss": -6.9754228591918945, "global_step": 178236, "epoch": 4243} {"train_loss": -7.051109313964844, "global_step": 178237, "epoch": 4243} {"train_loss": -6.96111536026001, "global_step": 178238, "epoch": 4243} {"train_loss": -7.003927230834961, "global_step": 178239, "epoch": 4243} {"train_loss": -7.063074111938477, "global_step": 178240, "epoch": 4243} {"train_loss": -6.9759111404418945, "global_step": 178241, "epoch": 4243} {"train_loss": -7.0581817626953125, "global_step": 178242, "epoch": 4243} {"train_loss": -7.06672477722168, "global_step": 178243, "epoch": 4243} {"train_loss": -6.902174949645996, "global_step": 178244, "epoch": 4243} {"train_loss": -7.145172119140625, "global_step": 178245, "epoch": 4243} {"train_loss": -7.067712306976318, "global_step": 178246, "epoch": 4243} {"train_loss": -7.081838085537865, "global_step": 178247, "epoch": 4243, "val_loss": 69348.203125} {"train_loss": -7.1689133644104, "global_step": 178248, "epoch": 4244} {"train_loss": -6.998076915740967, "global_step": 178249, "epoch": 4244} {"train_loss": -6.995062828063965, "global_step": 178250, "epoch": 4244} {"train_loss": -7.153255462646484, "global_step": 178251, "epoch": 4244} {"train_loss": -6.859369277954102, "global_step": 178252, "epoch": 4244} {"train_loss": -7.115619659423828, "global_step": 178253, "epoch": 4244} {"train_loss": -7.043322563171387, "global_step": 178254, "epoch": 4244} {"train_loss": -6.848710060119629, "global_step": 178255, "epoch": 4244} {"train_loss": -7.060108184814453, "global_step": 178256, "epoch": 4244} {"train_loss": -6.974828720092773, "global_step": 178257, "epoch": 4244} {"train_loss": -6.834922790527344, "global_step": 178258, "epoch": 4244} {"train_loss": -7.019646644592285, "global_step": 178259, "epoch": 4244} {"train_loss": -7.013606071472168, "global_step": 178260, "epoch": 4244} {"train_loss": -7.01499605178833, "global_step": 178261, "epoch": 4244} {"train_loss": -7.1118879318237305, "global_step": 178262, "epoch": 4244} {"train_loss": -7.02900505065918, "global_step": 178263, "epoch": 4244} {"train_loss": -7.058034896850586, "global_step": 178264, "epoch": 4244} {"train_loss": -7.107546329498291, "global_step": 178265, "epoch": 4244} {"train_loss": -7.087176322937012, "global_step": 178266, "epoch": 4244} {"train_loss": -7.020818710327148, "global_step": 178267, "epoch": 4244} {"train_loss": -7.076255798339844, "global_step": 178268, "epoch": 4244} {"train_loss": -7.04721736907959, "global_step": 178269, "epoch": 4244} {"train_loss": -7.0230817794799805, "global_step": 178270, "epoch": 4244} {"train_loss": -7.035358428955078, "global_step": 178271, "epoch": 4244} {"train_loss": -7.085914611816406, "global_step": 178272, "epoch": 4244} {"train_loss": -7.096657752990723, "global_step": 178273, "epoch": 4244} {"train_loss": -7.146389961242676, "global_step": 178274, "epoch": 4244} {"train_loss": -7.12162971496582, "global_step": 178275, "epoch": 4244} {"train_loss": -7.107769966125488, "global_step": 178276, "epoch": 4244} {"train_loss": -7.101426124572754, "global_step": 178277, "epoch": 4244} {"train_loss": -7.138284206390381, "global_step": 178278, "epoch": 4244} {"train_loss": -7.152333736419678, "global_step": 178279, "epoch": 4244} {"train_loss": -7.165062427520752, "global_step": 178280, "epoch": 4244} {"train_loss": -7.084202766418457, "global_step": 178281, "epoch": 4244} {"train_loss": -7.196209907531738, "global_step": 178282, "epoch": 4244} {"train_loss": -7.165499210357666, "global_step": 178283, "epoch": 4244} {"train_loss": -7.071529388427734, "global_step": 178284, "epoch": 4244} {"train_loss": -7.202359676361084, "global_step": 178285, "epoch": 4244} {"train_loss": -7.161579132080078, "global_step": 178286, "epoch": 4244} {"train_loss": -7.099194526672363, "global_step": 178287, "epoch": 4244} {"train_loss": -7.261134147644043, "global_step": 178288, "epoch": 4244} {"train_loss": -7.074514854521978, "global_step": 178289, "epoch": 4244, "val_loss": 69065.921875} {"train_loss": -7.110793113708496, "global_step": 178290, "epoch": 4245} {"train_loss": -7.236085891723633, "global_step": 178291, "epoch": 4245} {"train_loss": -7.142047882080078, "global_step": 178292, "epoch": 4245} {"train_loss": -7.184370994567871, "global_step": 178293, "epoch": 4245} {"train_loss": -7.083791732788086, "global_step": 178294, "epoch": 4245} {"train_loss": -7.161121368408203, "global_step": 178295, "epoch": 4245} {"train_loss": -7.142117500305176, "global_step": 178296, "epoch": 4245} {"train_loss": -7.117398738861084, "global_step": 178297, "epoch": 4245} {"train_loss": -7.1486358642578125, "global_step": 178298, "epoch": 4245} {"train_loss": -7.2227349281311035, "global_step": 178299, "epoch": 4245} {"train_loss": -7.21576452255249, "global_step": 178300, "epoch": 4245} {"train_loss": -7.170285224914551, "global_step": 178301, "epoch": 4245} {"train_loss": -7.107194900512695, "global_step": 178302, "epoch": 4245} {"train_loss": -7.164938926696777, "global_step": 178303, "epoch": 4245} {"train_loss": -7.033740997314453, "global_step": 178304, "epoch": 4245} {"train_loss": -7.128050327301025, "global_step": 178305, "epoch": 4245} {"train_loss": -7.148190498352051, "global_step": 178306, "epoch": 4245} {"train_loss": -7.13464879989624, "global_step": 178307, "epoch": 4245} {"train_loss": -7.133740425109863, "global_step": 178308, "epoch": 4245} {"train_loss": -7.251657962799072, "global_step": 178309, "epoch": 4245} {"train_loss": -7.063015937805176, "global_step": 178310, "epoch": 4245} {"train_loss": -7.096083641052246, "global_step": 178311, "epoch": 4245} {"train_loss": -7.343729496002197, "global_step": 178312, "epoch": 4245} {"train_loss": -7.1862030029296875, "global_step": 178313, "epoch": 4245} {"train_loss": -7.142394065856934, "global_step": 178314, "epoch": 4245} {"train_loss": -7.090040683746338, "global_step": 178315, "epoch": 4245} {"train_loss": -7.051748275756836, "global_step": 178316, "epoch": 4245} {"train_loss": -7.120168209075928, "global_step": 178317, "epoch": 4245} {"train_loss": -7.049097061157227, "global_step": 178318, "epoch": 4245} {"train_loss": -7.184286117553711, "global_step": 178319, "epoch": 4245} {"train_loss": -7.139291763305664, "global_step": 178320, "epoch": 4245} {"train_loss": -7.144033432006836, "global_step": 178321, "epoch": 4245} {"train_loss": -7.133092880249023, "global_step": 178322, "epoch": 4245} {"train_loss": -7.099983215332031, "global_step": 178323, "epoch": 4245} {"train_loss": -7.042656421661377, "global_step": 178324, "epoch": 4245} {"train_loss": -7.117645263671875, "global_step": 178325, "epoch": 4245} {"train_loss": -6.9571990966796875, "global_step": 178326, "epoch": 4245} {"train_loss": -7.0107316970825195, "global_step": 178327, "epoch": 4245} {"train_loss": -7.0464582443237305, "global_step": 178328, "epoch": 4245} {"train_loss": -6.951874732971191, "global_step": 178329, "epoch": 4245} {"train_loss": -7.006834030151367, "global_step": 178330, "epoch": 4245} {"train_loss": -7.119648286274502, "global_step": 178331, "epoch": 4245, "val_loss": 69125.234375} {"train_loss": -6.931976318359375, "global_step": 178332, "epoch": 4246} {"train_loss": -7.0140533447265625, "global_step": 178333, "epoch": 4246} {"train_loss": -6.833690643310547, "global_step": 178334, "epoch": 4246} {"train_loss": -7.0715107917785645, "global_step": 178335, "epoch": 4246} {"train_loss": -7.046186923980713, "global_step": 178336, "epoch": 4246} {"train_loss": -6.955882549285889, "global_step": 178337, "epoch": 4246} {"train_loss": -6.947580337524414, "global_step": 178338, "epoch": 4246} {"train_loss": -7.025025367736816, "global_step": 178339, "epoch": 4246} {"train_loss": -6.892331123352051, "global_step": 178340, "epoch": 4246} {"train_loss": -7.076929569244385, "global_step": 178341, "epoch": 4246} {"train_loss": -7.039480209350586, "global_step": 178342, "epoch": 4246} {"train_loss": -7.011923313140869, "global_step": 178343, "epoch": 4246} {"train_loss": -7.031152725219727, "global_step": 178344, "epoch": 4246} {"train_loss": -7.076385498046875, "global_step": 178345, "epoch": 4246} {"train_loss": -7.026588439941406, "global_step": 178346, "epoch": 4246} {"train_loss": -6.97918701171875, "global_step": 178347, "epoch": 4246} {"train_loss": -7.096782207489014, "global_step": 178348, "epoch": 4246} {"train_loss": -7.060436248779297, "global_step": 178349, "epoch": 4246} {"train_loss": -7.177828311920166, "global_step": 178350, "epoch": 4246} {"train_loss": -7.087038993835449, "global_step": 178351, "epoch": 4246} {"train_loss": -7.12172269821167, "global_step": 178352, "epoch": 4246} {"train_loss": -7.1249189376831055, "global_step": 178353, "epoch": 4246} {"train_loss": -7.114476203918457, "global_step": 178354, "epoch": 4246} {"train_loss": -7.184516906738281, "global_step": 178355, "epoch": 4246} {"train_loss": -7.0807695388793945, "global_step": 178356, "epoch": 4246} {"train_loss": -7.108377456665039, "global_step": 178357, "epoch": 4246} {"train_loss": -7.119450569152832, "global_step": 178358, "epoch": 4246} {"train_loss": -7.151844024658203, "global_step": 178359, "epoch": 4246} {"train_loss": -7.160276412963867, "global_step": 178360, "epoch": 4246} {"train_loss": -7.150077819824219, "global_step": 178361, "epoch": 4246} {"train_loss": -7.219575881958008, "global_step": 178362, "epoch": 4246} {"train_loss": -7.050748825073242, "global_step": 178363, "epoch": 4246} {"train_loss": -7.118754863739014, "global_step": 178364, "epoch": 4246} {"train_loss": -7.106498718261719, "global_step": 178365, "epoch": 4246} {"train_loss": -7.114691257476807, "global_step": 178366, "epoch": 4246} {"train_loss": -7.072843551635742, "global_step": 178367, "epoch": 4246} {"train_loss": -7.082529544830322, "global_step": 178368, "epoch": 4246} {"train_loss": -7.054175853729248, "global_step": 178369, "epoch": 4246} {"train_loss": -7.1352128982543945, "global_step": 178370, "epoch": 4246} {"train_loss": -7.189637184143066, "global_step": 178371, "epoch": 4246} {"train_loss": -7.069600582122803, "global_step": 178372, "epoch": 4246} {"train_loss": -7.071610189619518, "global_step": 178373, "epoch": 4246, "val_loss": 69233.609375} {"train_loss": -7.047898292541504, "global_step": 178374, "epoch": 4247} {"train_loss": -6.863539695739746, "global_step": 178375, "epoch": 4247} {"train_loss": -7.042779922485352, "global_step": 178376, "epoch": 4247} {"train_loss": -6.8771443367004395, "global_step": 178377, "epoch": 4247} {"train_loss": -7.0249552726745605, "global_step": 178378, "epoch": 4247} {"train_loss": -7.088888168334961, "global_step": 178379, "epoch": 4247} {"train_loss": -6.9968581199646, "global_step": 178380, "epoch": 4247} {"train_loss": -7.140937805175781, "global_step": 178381, "epoch": 4247} {"train_loss": -7.055591583251953, "global_step": 178382, "epoch": 4247} {"train_loss": -6.953274726867676, "global_step": 178383, "epoch": 4247} {"train_loss": -7.1075358390808105, "global_step": 178384, "epoch": 4247} {"train_loss": -7.106992721557617, "global_step": 178385, "epoch": 4247} {"train_loss": -6.869111061096191, "global_step": 178386, "epoch": 4247} {"train_loss": -7.025958061218262, "global_step": 178387, "epoch": 4247} {"train_loss": -6.943090915679932, "global_step": 178388, "epoch": 4247} {"train_loss": -6.867481708526611, "global_step": 178389, "epoch": 4247} {"train_loss": -7.190847396850586, "global_step": 178390, "epoch": 4247} {"train_loss": -7.011484146118164, "global_step": 178391, "epoch": 4247} {"train_loss": -7.070815563201904, "global_step": 178392, "epoch": 4247} {"train_loss": -7.1325273513793945, "global_step": 178393, "epoch": 4247} {"train_loss": -7.001636505126953, "global_step": 178394, "epoch": 4247} {"train_loss": -7.177816867828369, "global_step": 178395, "epoch": 4247} {"train_loss": -7.046111106872559, "global_step": 178396, "epoch": 4247} {"train_loss": -7.133276462554932, "global_step": 178397, "epoch": 4247} {"train_loss": -7.084524154663086, "global_step": 178398, "epoch": 4247} {"train_loss": -7.127020835876465, "global_step": 178399, "epoch": 4247} {"train_loss": -7.166892051696777, "global_step": 178400, "epoch": 4247} {"train_loss": -6.988864421844482, "global_step": 178401, "epoch": 4247} {"train_loss": -7.124063491821289, "global_step": 178402, "epoch": 4247} {"train_loss": -7.20430850982666, "global_step": 178403, "epoch": 4247} {"train_loss": -7.022345066070557, "global_step": 178404, "epoch": 4247} {"train_loss": -7.054187297821045, "global_step": 178405, "epoch": 4247} {"train_loss": -7.162799835205078, "global_step": 178406, "epoch": 4247} {"train_loss": -7.121330261230469, "global_step": 178407, "epoch": 4247} {"train_loss": -7.241635322570801, "global_step": 178408, "epoch": 4247} {"train_loss": -7.142314910888672, "global_step": 178409, "epoch": 4247} {"train_loss": -7.24411153793335, "global_step": 178410, "epoch": 4247} {"train_loss": -7.150035858154297, "global_step": 178411, "epoch": 4247} {"train_loss": -7.137569427490234, "global_step": 178412, "epoch": 4247} {"train_loss": -7.122068881988525, "global_step": 178413, "epoch": 4247} {"train_loss": -7.143136024475098, "global_step": 178414, "epoch": 4247} {"train_loss": -7.0766443865639825, "global_step": 178415, "epoch": 4247, "val_loss": 69074.125} {"train_loss": -7.129408836364746, "global_step": 178416, "epoch": 4248} {"train_loss": -7.173307418823242, "global_step": 178417, "epoch": 4248} {"train_loss": -7.259058475494385, "global_step": 178418, "epoch": 4248} {"train_loss": -7.194767951965332, "global_step": 178419, "epoch": 4248} {"train_loss": -7.1872711181640625, "global_step": 178420, "epoch": 4248} {"train_loss": -7.086297988891602, "global_step": 178421, "epoch": 4248} {"train_loss": -7.023972511291504, "global_step": 178422, "epoch": 4248} {"train_loss": -7.263665199279785, "global_step": 178423, "epoch": 4248} {"train_loss": -7.145174980163574, "global_step": 178424, "epoch": 4248} {"train_loss": -7.073507308959961, "global_step": 178425, "epoch": 4248} {"train_loss": -7.1487016677856445, "global_step": 178426, "epoch": 4248} {"train_loss": -7.1667890548706055, "global_step": 178427, "epoch": 4248} {"train_loss": -7.111931324005127, "global_step": 178428, "epoch": 4248} {"train_loss": -7.058107852935791, "global_step": 178429, "epoch": 4248} {"train_loss": -7.094537734985352, "global_step": 178430, "epoch": 4248} {"train_loss": -7.170720100402832, "global_step": 178431, "epoch": 4248} {"train_loss": -7.043333530426025, "global_step": 178432, "epoch": 4248} {"train_loss": -7.15194034576416, "global_step": 178433, "epoch": 4248} {"train_loss": -7.036984443664551, "global_step": 178434, "epoch": 4248} {"train_loss": -7.148298263549805, "global_step": 178435, "epoch": 4248} {"train_loss": -7.1214213371276855, "global_step": 178436, "epoch": 4248} {"train_loss": -7.1609039306640625, "global_step": 178437, "epoch": 4248} {"train_loss": -7.151645183563232, "global_step": 178438, "epoch": 4248} {"train_loss": -7.096169471740723, "global_step": 178439, "epoch": 4248} {"train_loss": -7.171753883361816, "global_step": 178440, "epoch": 4248} {"train_loss": -7.200272083282471, "global_step": 178441, "epoch": 4248} {"train_loss": -7.1671576499938965, "global_step": 178442, "epoch": 4248} {"train_loss": -7.1147284507751465, "global_step": 178443, "epoch": 4248} {"train_loss": -7.201246738433838, "global_step": 178444, "epoch": 4248} {"train_loss": -7.037558078765869, "global_step": 178445, "epoch": 4248} {"train_loss": -7.062836170196533, "global_step": 178446, "epoch": 4248} {"train_loss": -7.183326721191406, "global_step": 178447, "epoch": 4248} {"train_loss": -7.121466159820557, "global_step": 178448, "epoch": 4248} {"train_loss": -7.035626411437988, "global_step": 178449, "epoch": 4248} {"train_loss": -7.059218883514404, "global_step": 178450, "epoch": 4248} {"train_loss": -6.874655246734619, "global_step": 178451, "epoch": 4248} {"train_loss": -7.091219902038574, "global_step": 178452, "epoch": 4248} {"train_loss": -6.928280353546143, "global_step": 178453, "epoch": 4248} {"train_loss": -6.881190776824951, "global_step": 178454, "epoch": 4248} {"train_loss": -7.054338455200195, "global_step": 178455, "epoch": 4248} {"train_loss": -7.009461402893066, "global_step": 178456, "epoch": 4248} {"train_loss": -7.104965425672985, "global_step": 178457, "epoch": 4248, "val_loss": 69474.03125} {"train_loss": -7.0907793045043945, "global_step": 178458, "epoch": 4249} {"train_loss": -6.995074272155762, "global_step": 178459, "epoch": 4249} {"train_loss": -7.022217273712158, "global_step": 178460, "epoch": 4249} {"train_loss": -7.059450149536133, "global_step": 178461, "epoch": 4249} {"train_loss": -7.042020797729492, "global_step": 178462, "epoch": 4249} {"train_loss": -7.092449188232422, "global_step": 178463, "epoch": 4249} {"train_loss": -7.106104850769043, "global_step": 178464, "epoch": 4249} {"train_loss": -7.100816249847412, "global_step": 178465, "epoch": 4249} {"train_loss": -7.285793781280518, "global_step": 178466, "epoch": 4249} {"train_loss": -7.0928874015808105, "global_step": 178467, "epoch": 4249} {"train_loss": -7.1509222984313965, "global_step": 178468, "epoch": 4249} {"train_loss": -7.069777488708496, "global_step": 178469, "epoch": 4249} {"train_loss": -7.112932205200195, "global_step": 178470, "epoch": 4249} {"train_loss": -7.183690071105957, "global_step": 178471, "epoch": 4249} {"train_loss": -7.076466083526611, "global_step": 178472, "epoch": 4249} {"train_loss": -7.153988838195801, "global_step": 178473, "epoch": 4249} {"train_loss": -7.153400421142578, "global_step": 178474, "epoch": 4249} {"train_loss": -7.158150672912598, "global_step": 178475, "epoch": 4249} {"train_loss": -7.174954414367676, "global_step": 178476, "epoch": 4249} {"train_loss": -7.137938499450684, "global_step": 178477, "epoch": 4249} {"train_loss": -7.156846046447754, "global_step": 178478, "epoch": 4249} {"train_loss": -7.241337776184082, "global_step": 178479, "epoch": 4249} {"train_loss": -7.106584072113037, "global_step": 178480, "epoch": 4249} {"train_loss": -7.206296920776367, "global_step": 178481, "epoch": 4249} {"train_loss": -7.027019500732422, "global_step": 178482, "epoch": 4249} {"train_loss": -7.0676589012146, "global_step": 178483, "epoch": 4249} {"train_loss": -7.212014198303223, "global_step": 178484, "epoch": 4249} {"train_loss": -7.12876033782959, "global_step": 178485, "epoch": 4249} {"train_loss": -7.214444637298584, "global_step": 178486, "epoch": 4249} {"train_loss": -7.210329055786133, "global_step": 178487, "epoch": 4249} {"train_loss": -7.036910057067871, "global_step": 178488, "epoch": 4249} {"train_loss": -7.200883865356445, "global_step": 178489, "epoch": 4249} {"train_loss": -7.058518886566162, "global_step": 178490, "epoch": 4249} {"train_loss": -7.040168762207031, "global_step": 178491, "epoch": 4249} {"train_loss": -6.99899959564209, "global_step": 178492, "epoch": 4249} {"train_loss": -7.0614166259765625, "global_step": 178493, "epoch": 4249} {"train_loss": -7.026611804962158, "global_step": 178494, "epoch": 4249} {"train_loss": -7.038825988769531, "global_step": 178495, "epoch": 4249} {"train_loss": -7.106729507446289, "global_step": 178496, "epoch": 4249} {"train_loss": -7.114058494567871, "global_step": 178497, "epoch": 4249} {"train_loss": -7.054416179656982, "global_step": 178498, "epoch": 4249} {"train_loss": -7.1110782736823674, "global_step": 178499, "epoch": 4249, "val_loss": 69355.2578125} {"train_loss": -7.181924819946289, "global_step": 178500, "epoch": 4250} {"train_loss": -7.0537261962890625, "global_step": 178501, "epoch": 4250} {"train_loss": -7.17866325378418, "global_step": 178502, "epoch": 4250} {"train_loss": -7.1212158203125, "global_step": 178503, "epoch": 4250} {"train_loss": -7.133409023284912, "global_step": 178504, "epoch": 4250} {"train_loss": -7.10725212097168, "global_step": 178505, "epoch": 4250} {"train_loss": -7.180222511291504, "global_step": 178506, "epoch": 4250} {"train_loss": -7.09122371673584, "global_step": 178507, "epoch": 4250} {"train_loss": -7.051190376281738, "global_step": 178508, "epoch": 4250} {"train_loss": -7.138364791870117, "global_step": 178509, "epoch": 4250} {"train_loss": -7.110749244689941, "global_step": 178510, "epoch": 4250} {"train_loss": -7.176669120788574, "global_step": 178511, "epoch": 4250} {"train_loss": -7.07588005065918, "global_step": 178512, "epoch": 4250} {"train_loss": -7.124368190765381, "global_step": 178513, "epoch": 4250} {"train_loss": -7.029367923736572, "global_step": 178514, "epoch": 4250} {"train_loss": -7.183912754058838, "global_step": 178515, "epoch": 4250} {"train_loss": -7.181240081787109, "global_step": 178516, "epoch": 4250} {"train_loss": -7.222784519195557, "global_step": 178517, "epoch": 4250} {"train_loss": -7.126864433288574, "global_step": 178518, "epoch": 4250} {"train_loss": -7.2716264724731445, "global_step": 178519, "epoch": 4250} {"train_loss": -7.089624881744385, "global_step": 178520, "epoch": 4250} {"train_loss": -7.20907735824585, "global_step": 178521, "epoch": 4250} {"train_loss": -7.174783706665039, "global_step": 178522, "epoch": 4250} {"train_loss": -7.162799835205078, "global_step": 178523, "epoch": 4250} {"train_loss": -7.156549453735352, "global_step": 178524, "epoch": 4250} {"train_loss": -7.090010166168213, "global_step": 178525, "epoch": 4250} {"train_loss": -7.168902397155762, "global_step": 178526, "epoch": 4250} {"train_loss": -7.136224746704102, "global_step": 178527, "epoch": 4250} {"train_loss": -7.047306060791016, "global_step": 178528, "epoch": 4250} {"train_loss": -7.09437894821167, "global_step": 178529, "epoch": 4250} {"train_loss": -7.16701602935791, "global_step": 178530, "epoch": 4250} {"train_loss": -7.085789680480957, "global_step": 178531, "epoch": 4250} {"train_loss": -6.974937915802002, "global_step": 178532, "epoch": 4250} {"train_loss": -7.059764385223389, "global_step": 178533, "epoch": 4250} {"train_loss": -6.98427152633667, "global_step": 178534, "epoch": 4250} {"train_loss": -6.950343132019043, "global_step": 178535, "epoch": 4250} {"train_loss": -7.153285980224609, "global_step": 178536, "epoch": 4250} {"train_loss": -7.065709590911865, "global_step": 178537, "epoch": 4250} {"train_loss": -6.878753185272217, "global_step": 178538, "epoch": 4250} {"train_loss": -7.010447025299072, "global_step": 178539, "epoch": 4250} {"train_loss": -6.990283012390137, "global_step": 178540, "epoch": 4250} {"train_loss": -7.107477278936477, "global_step": 178541, "epoch": 4250, "train/sim_max_reward_0": 0.19050896077491392, "train/sim_max_reward_1": 0.4590578249995358, "train/sim_max_reward_2": 0.8660789416143051, "train/sim_max_reward_3": 0.9482963097869994, "train/sim_max_reward_4": 0.885032228651061, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8438476220355209, "test/sim_max_reward_4300001": 0.6019857212919519, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.961419519694425, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9921969741616126, "test/sim_max_reward_4300006": 0.9652297625907481, "test/sim_max_reward_4300007": 0.8537680024085098, "test/sim_max_reward_4300008": 0.97800534113139, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.9457537931284051, "test/sim_max_reward_4300011": 0.9958993887813689, "test/sim_max_reward_4300012": 0.8968372542859485, "test/sim_max_reward_4300013": 0.40334365015098356, "test/sim_max_reward_4300014": 0.9929566712418335, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.8548951165601109, "test/sim_max_reward_4300017": 0.40627206668936605, "test/sim_max_reward_4300018": 0.37499114036279135, "test/sim_max_reward_4300019": 0.18605428969243992, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9843681969781656, "test/sim_max_reward_4300022": 0.9929318311453884, "test/sim_max_reward_4300023": 0.9958708388545743, "test/sim_max_reward_4300024": 0.6623210210830326, "test/sim_max_reward_4300025": 0.9184315549561968, "test/sim_max_reward_4300026": 0.7629034926973465, "test/sim_max_reward_4300027": 0.9594977684614442, "test/sim_max_reward_4300028": 0.9004419135034276, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.9861700542855933, "test/sim_max_reward_4300031": 0.35716662844066555, "test/sim_max_reward_4300032": 0.989302987410133, "test/sim_max_reward_4300033": 0.9545733552761168, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.4650803642349304, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 1.0, "test/sim_max_reward_4300038": 0.38171640859330824, "test/sim_max_reward_4300039": 0.960245677541674, "test/sim_max_reward_4300040": 0.5504804805823243, "test/sim_max_reward_4300041": 0.39068466957185705, "test/sim_max_reward_4300042": 0.7049328952389918, "test/sim_max_reward_4300043": 0.144605605435894, "test/sim_max_reward_4300044": 0.9874691432916158, "test/sim_max_reward_4300045": 0.9710079135441783, "test/sim_max_reward_4300046": 0.8337230170948662, "test/sim_max_reward_4300047": 0.12932362032830932, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 1.0, "train/mean_score": 0.5903265041981671, "test/mean_score": 0.6890346794626041, "val_loss": 69159.28125} {"train_loss": -7.240617752075195, "global_step": 178542, "epoch": 4251} {"train_loss": -6.987536430358887, "global_step": 178543, "epoch": 4251} {"train_loss": -6.883506774902344, "global_step": 178544, "epoch": 4251} {"train_loss": -7.05173397064209, "global_step": 178545, "epoch": 4251} {"train_loss": -7.114527225494385, "global_step": 178546, "epoch": 4251} {"train_loss": -7.083643913269043, "global_step": 178547, "epoch": 4251} {"train_loss": -7.119969367980957, "global_step": 178548, "epoch": 4251} {"train_loss": -7.026944160461426, "global_step": 178549, "epoch": 4251} {"train_loss": -6.983840465545654, "global_step": 178550, "epoch": 4251} {"train_loss": -7.123009204864502, "global_step": 178551, "epoch": 4251} {"train_loss": -7.0466837882995605, "global_step": 178552, "epoch": 4251} {"train_loss": -7.127318382263184, "global_step": 178553, "epoch": 4251} {"train_loss": -7.053863048553467, "global_step": 178554, "epoch": 4251} {"train_loss": -6.999393939971924, "global_step": 178555, "epoch": 4251} {"train_loss": -7.022966384887695, "global_step": 178556, "epoch": 4251} {"train_loss": -6.945893287658691, "global_step": 178557, "epoch": 4251} {"train_loss": -7.034632682800293, "global_step": 178558, "epoch": 4251} {"train_loss": -7.188565731048584, "global_step": 178559, "epoch": 4251} {"train_loss": -7.045869827270508, "global_step": 178560, "epoch": 4251} {"train_loss": -7.041904926300049, "global_step": 178561, "epoch": 4251} {"train_loss": -7.166938781738281, "global_step": 178562, "epoch": 4251} {"train_loss": -7.111647605895996, "global_step": 178563, "epoch": 4251} {"train_loss": -7.011777877807617, "global_step": 178564, "epoch": 4251} {"train_loss": -7.2047119140625, "global_step": 178565, "epoch": 4251} {"train_loss": -7.074881553649902, "global_step": 178566, "epoch": 4251} {"train_loss": -7.014886379241943, "global_step": 178567, "epoch": 4251} {"train_loss": -7.206882476806641, "global_step": 178568, "epoch": 4251} {"train_loss": -7.117069244384766, "global_step": 178569, "epoch": 4251} {"train_loss": -7.004390239715576, "global_step": 178570, "epoch": 4251} {"train_loss": -7.132359027862549, "global_step": 178571, "epoch": 4251} {"train_loss": -7.0643391609191895, "global_step": 178572, "epoch": 4251} {"train_loss": -7.062798500061035, "global_step": 178573, "epoch": 4251} {"train_loss": -6.989606857299805, "global_step": 178574, "epoch": 4251} {"train_loss": -7.050187110900879, "global_step": 178575, "epoch": 4251} {"train_loss": -6.938056945800781, "global_step": 178576, "epoch": 4251} {"train_loss": -6.954838752746582, "global_step": 178577, "epoch": 4251} {"train_loss": -7.058596611022949, "global_step": 178578, "epoch": 4251} {"train_loss": -7.015417098999023, "global_step": 178579, "epoch": 4251} {"train_loss": -7.102103233337402, "global_step": 178580, "epoch": 4251} {"train_loss": -6.917716026306152, "global_step": 178581, "epoch": 4251} {"train_loss": -7.134095191955566, "global_step": 178582, "epoch": 4251} {"train_loss": -7.0583763009025935, "global_step": 178583, "epoch": 4251, "val_loss": 69484.21875} {"train_loss": -7.082254409790039, "global_step": 178584, "epoch": 4252} {"train_loss": -6.985513210296631, "global_step": 178585, "epoch": 4252} {"train_loss": -6.808566093444824, "global_step": 178586, "epoch": 4252} {"train_loss": -6.803841590881348, "global_step": 178587, "epoch": 4252} {"train_loss": -6.8569536209106445, "global_step": 178588, "epoch": 4252} {"train_loss": -6.983110427856445, "global_step": 178589, "epoch": 4252} {"train_loss": -7.002694129943848, "global_step": 178590, "epoch": 4252} {"train_loss": -6.899402618408203, "global_step": 178591, "epoch": 4252} {"train_loss": -7.044318199157715, "global_step": 178592, "epoch": 4252} {"train_loss": -6.924795627593994, "global_step": 178593, "epoch": 4252} {"train_loss": -7.014303207397461, "global_step": 178594, "epoch": 4252} {"train_loss": -6.9564361572265625, "global_step": 178595, "epoch": 4252} {"train_loss": -7.096344470977783, "global_step": 178596, "epoch": 4252} {"train_loss": -7.007925987243652, "global_step": 178597, "epoch": 4252} {"train_loss": -7.008419036865234, "global_step": 178598, "epoch": 4252} {"train_loss": -7.024351119995117, "global_step": 178599, "epoch": 4252} {"train_loss": -7.150196075439453, "global_step": 178600, "epoch": 4252} {"train_loss": -7.075193405151367, "global_step": 178601, "epoch": 4252} {"train_loss": -6.917302131652832, "global_step": 178602, "epoch": 4252} {"train_loss": -7.155627250671387, "global_step": 178603, "epoch": 4252} {"train_loss": -7.1237897872924805, "global_step": 178604, "epoch": 4252} {"train_loss": -7.093511581420898, "global_step": 178605, "epoch": 4252} {"train_loss": -7.079647541046143, "global_step": 178606, "epoch": 4252} {"train_loss": -7.1013898849487305, "global_step": 178607, "epoch": 4252} {"train_loss": -7.184530258178711, "global_step": 178608, "epoch": 4252} {"train_loss": -7.159232139587402, "global_step": 178609, "epoch": 4252} {"train_loss": -7.145070552825928, "global_step": 178610, "epoch": 4252} {"train_loss": -7.223817348480225, "global_step": 178611, "epoch": 4252} {"train_loss": -7.0833845138549805, "global_step": 178612, "epoch": 4252} {"train_loss": -7.043810844421387, "global_step": 178613, "epoch": 4252} {"train_loss": -7.130108833312988, "global_step": 178614, "epoch": 4252} {"train_loss": -7.208902359008789, "global_step": 178615, "epoch": 4252} {"train_loss": -7.121797561645508, "global_step": 178616, "epoch": 4252} {"train_loss": -7.120761871337891, "global_step": 178617, "epoch": 4252} {"train_loss": -7.130644798278809, "global_step": 178618, "epoch": 4252} {"train_loss": -6.95832633972168, "global_step": 178619, "epoch": 4252} {"train_loss": -7.032514572143555, "global_step": 178620, "epoch": 4252} {"train_loss": -7.088335990905762, "global_step": 178621, "epoch": 4252} {"train_loss": -7.081879615783691, "global_step": 178622, "epoch": 4252} {"train_loss": -7.125744819641113, "global_step": 178623, "epoch": 4252} {"train_loss": -7.091755390167236, "global_step": 178624, "epoch": 4252} {"train_loss": -7.0520567780449275, "global_step": 178625, "epoch": 4252, "val_loss": 69405.7578125} {"train_loss": -7.10027551651001, "global_step": 178626, "epoch": 4253} {"train_loss": -7.1369428634643555, "global_step": 178627, "epoch": 4253} {"train_loss": -7.181343078613281, "global_step": 178628, "epoch": 4253} {"train_loss": -6.987138271331787, "global_step": 178629, "epoch": 4253} {"train_loss": -7.133474349975586, "global_step": 178630, "epoch": 4253} {"train_loss": -7.082972526550293, "global_step": 178631, "epoch": 4253} {"train_loss": -6.893157005310059, "global_step": 178632, "epoch": 4253} {"train_loss": -7.17232084274292, "global_step": 178633, "epoch": 4253} {"train_loss": -7.010825157165527, "global_step": 178634, "epoch": 4253} {"train_loss": -7.0966081619262695, "global_step": 178635, "epoch": 4253} {"train_loss": -6.954278945922852, "global_step": 178636, "epoch": 4253} {"train_loss": -7.0104169845581055, "global_step": 178637, "epoch": 4253} {"train_loss": -7.036527156829834, "global_step": 178638, "epoch": 4253} {"train_loss": -7.022387981414795, "global_step": 178639, "epoch": 4253} {"train_loss": -7.104465961456299, "global_step": 178640, "epoch": 4253} {"train_loss": -7.133927345275879, "global_step": 178641, "epoch": 4253} {"train_loss": -7.024066925048828, "global_step": 178642, "epoch": 4253} {"train_loss": -6.959946632385254, "global_step": 178643, "epoch": 4253} {"train_loss": -6.861825942993164, "global_step": 178644, "epoch": 4253} {"train_loss": -7.02115535736084, "global_step": 178645, "epoch": 4253} {"train_loss": -6.937530040740967, "global_step": 178646, "epoch": 4253} {"train_loss": -6.967743396759033, "global_step": 178647, "epoch": 4253} {"train_loss": -6.904813289642334, "global_step": 178648, "epoch": 4253} {"train_loss": -6.891536235809326, "global_step": 178649, "epoch": 4253} {"train_loss": -7.02700662612915, "global_step": 178650, "epoch": 4253} {"train_loss": -7.072524070739746, "global_step": 178651, "epoch": 4253} {"train_loss": -6.981764793395996, "global_step": 178652, "epoch": 4253} {"train_loss": -7.116851806640625, "global_step": 178653, "epoch": 4253} {"train_loss": -6.922799110412598, "global_step": 178654, "epoch": 4253} {"train_loss": -7.151163578033447, "global_step": 178655, "epoch": 4253} {"train_loss": -6.990752220153809, "global_step": 178656, "epoch": 4253} {"train_loss": -7.092210292816162, "global_step": 178657, "epoch": 4253} {"train_loss": -7.023663520812988, "global_step": 178658, "epoch": 4253} {"train_loss": -7.114326477050781, "global_step": 178659, "epoch": 4253} {"train_loss": -6.963461875915527, "global_step": 178660, "epoch": 4253} {"train_loss": -7.063872337341309, "global_step": 178661, "epoch": 4253} {"train_loss": -7.018004417419434, "global_step": 178662, "epoch": 4253} {"train_loss": -7.010101318359375, "global_step": 178663, "epoch": 4253} {"train_loss": -7.067806720733643, "global_step": 178664, "epoch": 4253} {"train_loss": -6.866166114807129, "global_step": 178665, "epoch": 4253} {"train_loss": -7.198180675506592, "global_step": 178666, "epoch": 4253} {"train_loss": -7.031561170305524, "global_step": 178667, "epoch": 4253, "val_loss": 69244.875} {"train_loss": -7.0579915046691895, "global_step": 178668, "epoch": 4254} {"train_loss": -7.013399600982666, "global_step": 178669, "epoch": 4254} {"train_loss": -7.008620262145996, "global_step": 178670, "epoch": 4254} {"train_loss": -7.060066223144531, "global_step": 178671, "epoch": 4254} {"train_loss": -7.076565742492676, "global_step": 178672, "epoch": 4254} {"train_loss": -7.082362651824951, "global_step": 178673, "epoch": 4254} {"train_loss": -7.117705345153809, "global_step": 178674, "epoch": 4254} {"train_loss": -7.05767822265625, "global_step": 178675, "epoch": 4254} {"train_loss": -7.12033224105835, "global_step": 178676, "epoch": 4254} {"train_loss": -7.06027364730835, "global_step": 178677, "epoch": 4254} {"train_loss": -7.157166481018066, "global_step": 178678, "epoch": 4254} {"train_loss": -7.165503978729248, "global_step": 178679, "epoch": 4254} {"train_loss": -7.173064231872559, "global_step": 178680, "epoch": 4254} {"train_loss": -7.108757019042969, "global_step": 178681, "epoch": 4254} {"train_loss": -7.0759382247924805, "global_step": 178682, "epoch": 4254} {"train_loss": -7.141939163208008, "global_step": 178683, "epoch": 4254} {"train_loss": -7.225069999694824, "global_step": 178684, "epoch": 4254} {"train_loss": -7.145406723022461, "global_step": 178685, "epoch": 4254} {"train_loss": -7.145151138305664, "global_step": 178686, "epoch": 4254} {"train_loss": -7.084892272949219, "global_step": 178687, "epoch": 4254} {"train_loss": -7.176444053649902, "global_step": 178688, "epoch": 4254} {"train_loss": -7.11484432220459, "global_step": 178689, "epoch": 4254} {"train_loss": -7.199084281921387, "global_step": 178690, "epoch": 4254} {"train_loss": -7.219332695007324, "global_step": 178691, "epoch": 4254} {"train_loss": -7.257669925689697, "global_step": 178692, "epoch": 4254} {"train_loss": -7.028132438659668, "global_step": 178693, "epoch": 4254} {"train_loss": -7.096752166748047, "global_step": 178694, "epoch": 4254} {"train_loss": -7.218879699707031, "global_step": 178695, "epoch": 4254} {"train_loss": -7.010833740234375, "global_step": 178696, "epoch": 4254} {"train_loss": -7.132000923156738, "global_step": 178697, "epoch": 4254} {"train_loss": -7.025485992431641, "global_step": 178698, "epoch": 4254} {"train_loss": -7.073978900909424, "global_step": 178699, "epoch": 4254} {"train_loss": -7.100996971130371, "global_step": 178700, "epoch": 4254} {"train_loss": -7.113465309143066, "global_step": 178701, "epoch": 4254} {"train_loss": -7.21451473236084, "global_step": 178702, "epoch": 4254} {"train_loss": -7.124874114990234, "global_step": 178703, "epoch": 4254} {"train_loss": -7.134832382202148, "global_step": 178704, "epoch": 4254} {"train_loss": -7.157414436340332, "global_step": 178705, "epoch": 4254} {"train_loss": -7.172747611999512, "global_step": 178706, "epoch": 4254} {"train_loss": -7.063912868499756, "global_step": 178707, "epoch": 4254} {"train_loss": -7.1829023361206055, "global_step": 178708, "epoch": 4254} {"train_loss": -7.120008230209351, "global_step": 178709, "epoch": 4254, "val_loss": 69125.4921875} {"train_loss": -7.160803318023682, "global_step": 178710, "epoch": 4255} {"train_loss": -7.1789350509643555, "global_step": 178711, "epoch": 4255} {"train_loss": -7.178753852844238, "global_step": 178712, "epoch": 4255} {"train_loss": -7.102775573730469, "global_step": 178713, "epoch": 4255} {"train_loss": -7.215028762817383, "global_step": 178714, "epoch": 4255} {"train_loss": -7.145908832550049, "global_step": 178715, "epoch": 4255} {"train_loss": -7.130307197570801, "global_step": 178716, "epoch": 4255} {"train_loss": -7.271276473999023, "global_step": 178717, "epoch": 4255} {"train_loss": -7.221051216125488, "global_step": 178718, "epoch": 4255} {"train_loss": -7.056563377380371, "global_step": 178719, "epoch": 4255} {"train_loss": -7.243503570556641, "global_step": 178720, "epoch": 4255} {"train_loss": -7.246642589569092, "global_step": 178721, "epoch": 4255} {"train_loss": -7.157573223114014, "global_step": 178722, "epoch": 4255} {"train_loss": -7.208733558654785, "global_step": 178723, "epoch": 4255} {"train_loss": -7.099549770355225, "global_step": 178724, "epoch": 4255} {"train_loss": -7.128520965576172, "global_step": 178725, "epoch": 4255} {"train_loss": -7.165693283081055, "global_step": 178726, "epoch": 4255} {"train_loss": -7.142224311828613, "global_step": 178727, "epoch": 4255} {"train_loss": -7.161793231964111, "global_step": 178728, "epoch": 4255} {"train_loss": -7.299739360809326, "global_step": 178729, "epoch": 4255} {"train_loss": -7.264190673828125, "global_step": 178730, "epoch": 4255} {"train_loss": -7.075178146362305, "global_step": 178731, "epoch": 4255} {"train_loss": -7.219573020935059, "global_step": 178732, "epoch": 4255} {"train_loss": -7.179117202758789, "global_step": 178733, "epoch": 4255} {"train_loss": -7.1370134353637695, "global_step": 178734, "epoch": 4255} {"train_loss": -7.2388739585876465, "global_step": 178735, "epoch": 4255} {"train_loss": -7.163701057434082, "global_step": 178736, "epoch": 4255} {"train_loss": -7.279477119445801, "global_step": 178737, "epoch": 4255} {"train_loss": -7.1084065437316895, "global_step": 178738, "epoch": 4255} {"train_loss": -7.164752006530762, "global_step": 178739, "epoch": 4255} {"train_loss": -7.185970306396484, "global_step": 178740, "epoch": 4255} {"train_loss": -7.186121463775635, "global_step": 178741, "epoch": 4255} {"train_loss": -7.247128009796143, "global_step": 178742, "epoch": 4255} {"train_loss": -7.214062213897705, "global_step": 178743, "epoch": 4255} {"train_loss": -7.118620872497559, "global_step": 178744, "epoch": 4255} {"train_loss": -7.224566459655762, "global_step": 178745, "epoch": 4255} {"train_loss": -7.076282978057861, "global_step": 178746, "epoch": 4255} {"train_loss": -7.301866054534912, "global_step": 178747, "epoch": 4255} {"train_loss": -7.026899337768555, "global_step": 178748, "epoch": 4255} {"train_loss": -7.050116062164307, "global_step": 178749, "epoch": 4255} {"train_loss": -7.1383209228515625, "global_step": 178750, "epoch": 4255} {"train_loss": -7.17269964445205, "global_step": 178751, "epoch": 4255, "val_loss": 69175.640625} {"train_loss": -7.130815505981445, "global_step": 178752, "epoch": 4256} {"train_loss": -7.210482597351074, "global_step": 178753, "epoch": 4256} {"train_loss": -7.033343315124512, "global_step": 178754, "epoch": 4256} {"train_loss": -7.134553909301758, "global_step": 178755, "epoch": 4256} {"train_loss": -7.213312149047852, "global_step": 178756, "epoch": 4256} {"train_loss": -7.097761154174805, "global_step": 178757, "epoch": 4256} {"train_loss": -6.987447738647461, "global_step": 178758, "epoch": 4256} {"train_loss": -7.047452449798584, "global_step": 178759, "epoch": 4256} {"train_loss": -7.111842632293701, "global_step": 178760, "epoch": 4256} {"train_loss": -7.108050346374512, "global_step": 178761, "epoch": 4256} {"train_loss": -7.161293983459473, "global_step": 178762, "epoch": 4256} {"train_loss": -7.096173286437988, "global_step": 178763, "epoch": 4256} {"train_loss": -7.041435241699219, "global_step": 178764, "epoch": 4256} {"train_loss": -7.117269515991211, "global_step": 178765, "epoch": 4256} {"train_loss": -7.09848165512085, "global_step": 178766, "epoch": 4256} {"train_loss": -7.131412982940674, "global_step": 178767, "epoch": 4256} {"train_loss": -7.144909858703613, "global_step": 178768, "epoch": 4256} {"train_loss": -7.07523775100708, "global_step": 178769, "epoch": 4256} {"train_loss": -7.091641902923584, "global_step": 178770, "epoch": 4256} {"train_loss": -7.001440048217773, "global_step": 178771, "epoch": 4256} {"train_loss": -6.972992897033691, "global_step": 178772, "epoch": 4256} {"train_loss": -7.004490852355957, "global_step": 178773, "epoch": 4256} {"train_loss": -7.065569877624512, "global_step": 178774, "epoch": 4256} {"train_loss": -7.124239921569824, "global_step": 178775, "epoch": 4256} {"train_loss": -7.17116117477417, "global_step": 178776, "epoch": 4256} {"train_loss": -6.9571990966796875, "global_step": 178777, "epoch": 4256} {"train_loss": -7.040046691894531, "global_step": 178778, "epoch": 4256} {"train_loss": -6.985057830810547, "global_step": 178779, "epoch": 4256} {"train_loss": -7.013951301574707, "global_step": 178780, "epoch": 4256} {"train_loss": -7.021590232849121, "global_step": 178781, "epoch": 4256} {"train_loss": -6.938907623291016, "global_step": 178782, "epoch": 4256} {"train_loss": -6.9352335929870605, "global_step": 178783, "epoch": 4256} {"train_loss": -6.914275646209717, "global_step": 178784, "epoch": 4256} {"train_loss": -6.905369758605957, "global_step": 178785, "epoch": 4256} {"train_loss": -7.016020774841309, "global_step": 178786, "epoch": 4256} {"train_loss": -6.769096851348877, "global_step": 178787, "epoch": 4256} {"train_loss": -7.002439975738525, "global_step": 178788, "epoch": 4256} {"train_loss": -6.855039596557617, "global_step": 178789, "epoch": 4256} {"train_loss": -6.959582328796387, "global_step": 178790, "epoch": 4256} {"train_loss": -6.976407527923584, "global_step": 178791, "epoch": 4256} {"train_loss": -6.984156608581543, "global_step": 178792, "epoch": 4256} {"train_loss": -7.040745814641316, "global_step": 178793, "epoch": 4256, "val_loss": 69286.4375} {"train_loss": -6.90570068359375, "global_step": 178794, "epoch": 4257} {"train_loss": -6.955909729003906, "global_step": 178795, "epoch": 4257} {"train_loss": -6.960719585418701, "global_step": 178796, "epoch": 4257} {"train_loss": -6.974653244018555, "global_step": 178797, "epoch": 4257} {"train_loss": -7.078533172607422, "global_step": 178798, "epoch": 4257} {"train_loss": -7.018777847290039, "global_step": 178799, "epoch": 4257} {"train_loss": -7.018111228942871, "global_step": 178800, "epoch": 4257} {"train_loss": -7.067322254180908, "global_step": 178801, "epoch": 4257} {"train_loss": -6.975612640380859, "global_step": 178802, "epoch": 4257} {"train_loss": -6.973071098327637, "global_step": 178803, "epoch": 4257} {"train_loss": -6.951948165893555, "global_step": 178804, "epoch": 4257} {"train_loss": -7.0314435958862305, "global_step": 178805, "epoch": 4257} {"train_loss": -7.122042655944824, "global_step": 178806, "epoch": 4257} {"train_loss": -7.030282974243164, "global_step": 178807, "epoch": 4257} {"train_loss": -6.95420503616333, "global_step": 178808, "epoch": 4257} {"train_loss": -7.085016250610352, "global_step": 178809, "epoch": 4257} {"train_loss": -7.091019630432129, "global_step": 178810, "epoch": 4257} {"train_loss": -7.128540992736816, "global_step": 178811, "epoch": 4257} {"train_loss": -6.969541549682617, "global_step": 178812, "epoch": 4257} {"train_loss": -6.994938373565674, "global_step": 178813, "epoch": 4257} {"train_loss": -7.162294387817383, "global_step": 178814, "epoch": 4257} {"train_loss": -7.151518821716309, "global_step": 178815, "epoch": 4257} {"train_loss": -7.196542263031006, "global_step": 178816, "epoch": 4257} {"train_loss": -7.1728620529174805, "global_step": 178817, "epoch": 4257} {"train_loss": -7.128551006317139, "global_step": 178818, "epoch": 4257} {"train_loss": -7.07650089263916, "global_step": 178819, "epoch": 4257} {"train_loss": -7.140692710876465, "global_step": 178820, "epoch": 4257} {"train_loss": -7.133512020111084, "global_step": 178821, "epoch": 4257} {"train_loss": -7.148656845092773, "global_step": 178822, "epoch": 4257} {"train_loss": -7.018120765686035, "global_step": 178823, "epoch": 4257} {"train_loss": -7.237142562866211, "global_step": 178824, "epoch": 4257} {"train_loss": -7.069769859313965, "global_step": 178825, "epoch": 4257} {"train_loss": -7.2583513259887695, "global_step": 178826, "epoch": 4257} {"train_loss": -7.202948570251465, "global_step": 178827, "epoch": 4257} {"train_loss": -7.249856948852539, "global_step": 178828, "epoch": 4257} {"train_loss": -7.190308570861816, "global_step": 178829, "epoch": 4257} {"train_loss": -7.20902681350708, "global_step": 178830, "epoch": 4257} {"train_loss": -7.054770469665527, "global_step": 178831, "epoch": 4257} {"train_loss": -7.128403186798096, "global_step": 178832, "epoch": 4257} {"train_loss": -7.17880392074585, "global_step": 178833, "epoch": 4257} {"train_loss": -7.102710247039795, "global_step": 178834, "epoch": 4257} {"train_loss": -7.084025314876011, "global_step": 178835, "epoch": 4257, "val_loss": 69172.8984375} {"train_loss": -7.303755760192871, "global_step": 178836, "epoch": 4258} {"train_loss": -7.238787651062012, "global_step": 178837, "epoch": 4258} {"train_loss": -7.125906467437744, "global_step": 178838, "epoch": 4258} {"train_loss": -7.086994647979736, "global_step": 178839, "epoch": 4258} {"train_loss": -7.115485191345215, "global_step": 178840, "epoch": 4258} {"train_loss": -7.089101791381836, "global_step": 178841, "epoch": 4258} {"train_loss": -7.213898658752441, "global_step": 178842, "epoch": 4258} {"train_loss": -7.076478958129883, "global_step": 178843, "epoch": 4258} {"train_loss": -7.124861717224121, "global_step": 178844, "epoch": 4258} {"train_loss": -7.255201816558838, "global_step": 178845, "epoch": 4258} {"train_loss": -7.108160972595215, "global_step": 178846, "epoch": 4258} {"train_loss": -7.264533996582031, "global_step": 178847, "epoch": 4258} {"train_loss": -7.161964416503906, "global_step": 178848, "epoch": 4258} {"train_loss": -7.102267265319824, "global_step": 178849, "epoch": 4258} {"train_loss": -7.012076377868652, "global_step": 178850, "epoch": 4258} {"train_loss": -7.181652069091797, "global_step": 178851, "epoch": 4258} {"train_loss": -7.104212760925293, "global_step": 178852, "epoch": 4258} {"train_loss": -7.056422710418701, "global_step": 178853, "epoch": 4258} {"train_loss": -7.210707187652588, "global_step": 178854, "epoch": 4258} {"train_loss": -7.135099411010742, "global_step": 178855, "epoch": 4258} {"train_loss": -7.063324451446533, "global_step": 178856, "epoch": 4258} {"train_loss": -7.075829029083252, "global_step": 178857, "epoch": 4258} {"train_loss": -7.169534206390381, "global_step": 178858, "epoch": 4258} {"train_loss": -7.177639961242676, "global_step": 178859, "epoch": 4258} {"train_loss": -7.182307243347168, "global_step": 178860, "epoch": 4258} {"train_loss": -7.144612789154053, "global_step": 178861, "epoch": 4258} {"train_loss": -7.151655673980713, "global_step": 178862, "epoch": 4258} {"train_loss": -7.099318504333496, "global_step": 178863, "epoch": 4258} {"train_loss": -7.129575729370117, "global_step": 178864, "epoch": 4258} {"train_loss": -7.116209030151367, "global_step": 178865, "epoch": 4258} {"train_loss": -7.037718296051025, "global_step": 178866, "epoch": 4258} {"train_loss": -7.211536884307861, "global_step": 178867, "epoch": 4258} {"train_loss": -7.006281852722168, "global_step": 178868, "epoch": 4258} {"train_loss": -7.073592185974121, "global_step": 178869, "epoch": 4258} {"train_loss": -7.098879814147949, "global_step": 178870, "epoch": 4258} {"train_loss": -7.034519195556641, "global_step": 178871, "epoch": 4258} {"train_loss": -7.087037563323975, "global_step": 178872, "epoch": 4258} {"train_loss": -7.043701648712158, "global_step": 178873, "epoch": 4258} {"train_loss": -6.806403160095215, "global_step": 178874, "epoch": 4258} {"train_loss": -7.098016738891602, "global_step": 178875, "epoch": 4258} {"train_loss": -7.115322113037109, "global_step": 178876, "epoch": 4258} {"train_loss": -7.114706516265869, "global_step": 178877, "epoch": 4258, "val_loss": 69273.453125} {"train_loss": -7.067695617675781, "global_step": 178878, "epoch": 4259} {"train_loss": -6.946468353271484, "global_step": 178879, "epoch": 4259} {"train_loss": -6.930883407592773, "global_step": 178880, "epoch": 4259} {"train_loss": -7.061929702758789, "global_step": 178881, "epoch": 4259} {"train_loss": -7.009283065795898, "global_step": 178882, "epoch": 4259} {"train_loss": -7.142909049987793, "global_step": 178883, "epoch": 4259} {"train_loss": -7.074528694152832, "global_step": 178884, "epoch": 4259} {"train_loss": -7.046852111816406, "global_step": 178885, "epoch": 4259} {"train_loss": -7.113546371459961, "global_step": 178886, "epoch": 4259} {"train_loss": -7.060983657836914, "global_step": 178887, "epoch": 4259} {"train_loss": -7.099462985992432, "global_step": 178888, "epoch": 4259} {"train_loss": -7.074338912963867, "global_step": 178889, "epoch": 4259} {"train_loss": -7.047118663787842, "global_step": 178890, "epoch": 4259} {"train_loss": -7.127266883850098, "global_step": 178891, "epoch": 4259} {"train_loss": -7.0111494064331055, "global_step": 178892, "epoch": 4259} {"train_loss": -7.215390205383301, "global_step": 178893, "epoch": 4259} {"train_loss": -7.067444324493408, "global_step": 178894, "epoch": 4259} {"train_loss": -7.122157573699951, "global_step": 178895, "epoch": 4259} {"train_loss": -7.171355724334717, "global_step": 178896, "epoch": 4259} {"train_loss": -7.143542289733887, "global_step": 178897, "epoch": 4259} {"train_loss": -7.136020660400391, "global_step": 178898, "epoch": 4259} {"train_loss": -7.085206031799316, "global_step": 178899, "epoch": 4259} {"train_loss": -6.963875770568848, "global_step": 178900, "epoch": 4259} {"train_loss": -7.083891868591309, "global_step": 178901, "epoch": 4259} {"train_loss": -7.176758289337158, "global_step": 178902, "epoch": 4259} {"train_loss": -7.0687055587768555, "global_step": 178903, "epoch": 4259} {"train_loss": -7.051837921142578, "global_step": 178904, "epoch": 4259} {"train_loss": -7.05512809753418, "global_step": 178905, "epoch": 4259} {"train_loss": -7.04651403427124, "global_step": 178906, "epoch": 4259} {"train_loss": -7.0813493728637695, "global_step": 178907, "epoch": 4259} {"train_loss": -7.079609394073486, "global_step": 178908, "epoch": 4259} {"train_loss": -7.068398475646973, "global_step": 178909, "epoch": 4259} {"train_loss": -7.11688232421875, "global_step": 178910, "epoch": 4259} {"train_loss": -7.102799415588379, "global_step": 178911, "epoch": 4259} {"train_loss": -6.9609055519104, "global_step": 178912, "epoch": 4259} {"train_loss": -7.055310249328613, "global_step": 178913, "epoch": 4259} {"train_loss": -7.19065523147583, "global_step": 178914, "epoch": 4259} {"train_loss": -7.085113048553467, "global_step": 178915, "epoch": 4259} {"train_loss": -7.133051872253418, "global_step": 178916, "epoch": 4259} {"train_loss": -7.183099746704102, "global_step": 178917, "epoch": 4259} {"train_loss": -7.057459354400635, "global_step": 178918, "epoch": 4259} {"train_loss": -7.079907678422474, "global_step": 178919, "epoch": 4259, "val_loss": 69333.2734375} {"train_loss": -7.004709243774414, "global_step": 178920, "epoch": 4260} {"train_loss": -6.998856544494629, "global_step": 178921, "epoch": 4260} {"train_loss": -7.038506507873535, "global_step": 178922, "epoch": 4260} {"train_loss": -6.971465110778809, "global_step": 178923, "epoch": 4260} {"train_loss": -7.05949068069458, "global_step": 178924, "epoch": 4260} {"train_loss": -7.117838382720947, "global_step": 178925, "epoch": 4260} {"train_loss": -7.0684356689453125, "global_step": 178926, "epoch": 4260} {"train_loss": -7.07621431350708, "global_step": 178927, "epoch": 4260} {"train_loss": -7.002995014190674, "global_step": 178928, "epoch": 4260} {"train_loss": -7.175395488739014, "global_step": 178929, "epoch": 4260} {"train_loss": -7.064912796020508, "global_step": 178930, "epoch": 4260} {"train_loss": -7.1631879806518555, "global_step": 178931, "epoch": 4260} {"train_loss": -7.070574760437012, "global_step": 178932, "epoch": 4260} {"train_loss": -7.087891578674316, "global_step": 178933, "epoch": 4260} {"train_loss": -7.043595790863037, "global_step": 178934, "epoch": 4260} {"train_loss": -7.144608497619629, "global_step": 178935, "epoch": 4260} {"train_loss": -6.942938327789307, "global_step": 178936, "epoch": 4260} {"train_loss": -7.046719074249268, "global_step": 178937, "epoch": 4260} {"train_loss": -7.095646858215332, "global_step": 178938, "epoch": 4260} {"train_loss": -6.998786926269531, "global_step": 178939, "epoch": 4260} {"train_loss": -7.018653392791748, "global_step": 178940, "epoch": 4260} {"train_loss": -7.023857116699219, "global_step": 178941, "epoch": 4260} {"train_loss": -7.0985107421875, "global_step": 178942, "epoch": 4260} {"train_loss": -7.080905437469482, "global_step": 178943, "epoch": 4260} {"train_loss": -7.048172950744629, "global_step": 178944, "epoch": 4260} {"train_loss": -7.081408500671387, "global_step": 178945, "epoch": 4260} {"train_loss": -7.083163261413574, "global_step": 178946, "epoch": 4260} {"train_loss": -7.0134148597717285, "global_step": 178947, "epoch": 4260} {"train_loss": -7.21387243270874, "global_step": 178948, "epoch": 4260} {"train_loss": -7.0558929443359375, "global_step": 178949, "epoch": 4260} {"train_loss": -7.067922592163086, "global_step": 178950, "epoch": 4260} {"train_loss": -7.132271766662598, "global_step": 178951, "epoch": 4260} {"train_loss": -7.101518154144287, "global_step": 178952, "epoch": 4260} {"train_loss": -7.128908157348633, "global_step": 178953, "epoch": 4260} {"train_loss": -7.1271820068359375, "global_step": 178954, "epoch": 4260} {"train_loss": -7.179728984832764, "global_step": 178955, "epoch": 4260} {"train_loss": -7.26885986328125, "global_step": 178956, "epoch": 4260} {"train_loss": -7.243661403656006, "global_step": 178957, "epoch": 4260} {"train_loss": -7.126631259918213, "global_step": 178958, "epoch": 4260} {"train_loss": -7.236449718475342, "global_step": 178959, "epoch": 4260} {"train_loss": -7.1908650398254395, "global_step": 178960, "epoch": 4260} {"train_loss": -7.0917856352669855, "global_step": 178961, "epoch": 4260, "val_loss": 69183.0859375} {"train_loss": -7.120492458343506, "global_step": 178962, "epoch": 4261} {"train_loss": -7.149176597595215, "global_step": 178963, "epoch": 4261} {"train_loss": -7.143179893493652, "global_step": 178964, "epoch": 4261} {"train_loss": -7.139270782470703, "global_step": 178965, "epoch": 4261} {"train_loss": -7.18735408782959, "global_step": 178966, "epoch": 4261} {"train_loss": -7.205994606018066, "global_step": 178967, "epoch": 4261} {"train_loss": -7.1235198974609375, "global_step": 178968, "epoch": 4261} {"train_loss": -7.074799537658691, "global_step": 178969, "epoch": 4261} {"train_loss": -7.064701557159424, "global_step": 178970, "epoch": 4261} {"train_loss": -7.188963890075684, "global_step": 178971, "epoch": 4261} {"train_loss": -7.109999656677246, "global_step": 178972, "epoch": 4261} {"train_loss": -7.231639862060547, "global_step": 178973, "epoch": 4261} {"train_loss": -7.13529634475708, "global_step": 178974, "epoch": 4261} {"train_loss": -7.189267158508301, "global_step": 178975, "epoch": 4261} {"train_loss": -7.232452392578125, "global_step": 178976, "epoch": 4261} {"train_loss": -7.176377296447754, "global_step": 178977, "epoch": 4261} {"train_loss": -7.016277313232422, "global_step": 178978, "epoch": 4261} {"train_loss": -7.210599422454834, "global_step": 178979, "epoch": 4261} {"train_loss": -7.0976762771606445, "global_step": 178980, "epoch": 4261} {"train_loss": -7.2375993728637695, "global_step": 178981, "epoch": 4261} {"train_loss": -7.067609786987305, "global_step": 178982, "epoch": 4261} {"train_loss": -7.139366149902344, "global_step": 178983, "epoch": 4261} {"train_loss": -7.13701057434082, "global_step": 178984, "epoch": 4261} {"train_loss": -7.128260612487793, "global_step": 178985, "epoch": 4261} {"train_loss": -7.135010719299316, "global_step": 178986, "epoch": 4261} {"train_loss": -7.019218921661377, "global_step": 178987, "epoch": 4261} {"train_loss": -7.113835334777832, "global_step": 178988, "epoch": 4261} {"train_loss": -7.146238327026367, "global_step": 178989, "epoch": 4261} {"train_loss": -7.080430030822754, "global_step": 178990, "epoch": 4261} {"train_loss": -7.0895094871521, "global_step": 178991, "epoch": 4261} {"train_loss": -7.134454250335693, "global_step": 178992, "epoch": 4261} {"train_loss": -7.182168960571289, "global_step": 178993, "epoch": 4261} {"train_loss": -7.075466156005859, "global_step": 178994, "epoch": 4261} {"train_loss": -7.161590576171875, "global_step": 178995, "epoch": 4261} {"train_loss": -7.058084487915039, "global_step": 178996, "epoch": 4261} {"train_loss": -7.085601806640625, "global_step": 178997, "epoch": 4261} {"train_loss": -6.980676174163818, "global_step": 178998, "epoch": 4261} {"train_loss": -6.933138847351074, "global_step": 178999, "epoch": 4261} {"train_loss": -7.120723724365234, "global_step": 179000, "epoch": 4261} {"train_loss": -7.104821681976318, "global_step": 179001, "epoch": 4261} {"train_loss": -7.096107006072998, "global_step": 179002, "epoch": 4261} {"train_loss": -7.120166744504656, "global_step": 179003, "epoch": 4261, "val_loss": 69407.046875} {"train_loss": -7.077286243438721, "global_step": 179004, "epoch": 4262} {"train_loss": -7.13223934173584, "global_step": 179005, "epoch": 4262} {"train_loss": -7.003124237060547, "global_step": 179006, "epoch": 4262} {"train_loss": -7.046847343444824, "global_step": 179007, "epoch": 4262} {"train_loss": -7.166128158569336, "global_step": 179008, "epoch": 4262} {"train_loss": -7.166054725646973, "global_step": 179009, "epoch": 4262} {"train_loss": -7.136446952819824, "global_step": 179010, "epoch": 4262} {"train_loss": -7.230280876159668, "global_step": 179011, "epoch": 4262} {"train_loss": -7.082212448120117, "global_step": 179012, "epoch": 4262} {"train_loss": -7.199701309204102, "global_step": 179013, "epoch": 4262} {"train_loss": -7.026750564575195, "global_step": 179014, "epoch": 4262} {"train_loss": -7.208908557891846, "global_step": 179015, "epoch": 4262} {"train_loss": -7.053237438201904, "global_step": 179016, "epoch": 4262} {"train_loss": -7.115375995635986, "global_step": 179017, "epoch": 4262} {"train_loss": -6.970820426940918, "global_step": 179018, "epoch": 4262} {"train_loss": -7.039900779724121, "global_step": 179019, "epoch": 4262} {"train_loss": -7.17250919342041, "global_step": 179020, "epoch": 4262} {"train_loss": -7.058548927307129, "global_step": 179021, "epoch": 4262} {"train_loss": -7.1296892166137695, "global_step": 179022, "epoch": 4262} {"train_loss": -7.228611946105957, "global_step": 179023, "epoch": 4262} {"train_loss": -7.042845726013184, "global_step": 179024, "epoch": 4262} {"train_loss": -7.197004795074463, "global_step": 179025, "epoch": 4262} {"train_loss": -7.163686275482178, "global_step": 179026, "epoch": 4262} {"train_loss": -7.226099967956543, "global_step": 179027, "epoch": 4262} {"train_loss": -7.142446517944336, "global_step": 179028, "epoch": 4262} {"train_loss": -7.075765132904053, "global_step": 179029, "epoch": 4262} {"train_loss": -7.019796371459961, "global_step": 179030, "epoch": 4262} {"train_loss": -7.182979583740234, "global_step": 179031, "epoch": 4262} {"train_loss": -7.130809783935547, "global_step": 179032, "epoch": 4262} {"train_loss": -7.043049335479736, "global_step": 179033, "epoch": 4262} {"train_loss": -7.046405792236328, "global_step": 179034, "epoch": 4262} {"train_loss": -7.08656120300293, "global_step": 179035, "epoch": 4262} {"train_loss": -7.191106796264648, "global_step": 179036, "epoch": 4262} {"train_loss": -7.158501148223877, "global_step": 179037, "epoch": 4262} {"train_loss": -7.092738628387451, "global_step": 179038, "epoch": 4262} {"train_loss": -7.100709915161133, "global_step": 179039, "epoch": 4262} {"train_loss": -7.05977725982666, "global_step": 179040, "epoch": 4262} {"train_loss": -6.991559982299805, "global_step": 179041, "epoch": 4262} {"train_loss": -7.0765380859375, "global_step": 179042, "epoch": 4262} {"train_loss": -7.134982109069824, "global_step": 179043, "epoch": 4262} {"train_loss": -7.098898887634277, "global_step": 179044, "epoch": 4262} {"train_loss": -7.109573057719639, "global_step": 179045, "epoch": 4262, "val_loss": 69330.7890625} {"train_loss": -7.127079963684082, "global_step": 179046, "epoch": 4263} {"train_loss": -7.079753875732422, "global_step": 179047, "epoch": 4263} {"train_loss": -7.015105724334717, "global_step": 179048, "epoch": 4263} {"train_loss": -7.16926383972168, "global_step": 179049, "epoch": 4263} {"train_loss": -7.16890811920166, "global_step": 179050, "epoch": 4263} {"train_loss": -7.12151575088501, "global_step": 179051, "epoch": 4263} {"train_loss": -7.138532638549805, "global_step": 179052, "epoch": 4263} {"train_loss": -7.0760040283203125, "global_step": 179053, "epoch": 4263} {"train_loss": -7.299628257751465, "global_step": 179054, "epoch": 4263} {"train_loss": -7.00542688369751, "global_step": 179055, "epoch": 4263} {"train_loss": -7.102035999298096, "global_step": 179056, "epoch": 4263} {"train_loss": -7.119207859039307, "global_step": 179057, "epoch": 4263} {"train_loss": -7.113901138305664, "global_step": 179058, "epoch": 4263} {"train_loss": -7.054030418395996, "global_step": 179059, "epoch": 4263} {"train_loss": -7.088640213012695, "global_step": 179060, "epoch": 4263} {"train_loss": -7.210720062255859, "global_step": 179061, "epoch": 4263} {"train_loss": -7.079541206359863, "global_step": 179062, "epoch": 4263} {"train_loss": -7.095135688781738, "global_step": 179063, "epoch": 4263} {"train_loss": -7.071566104888916, "global_step": 179064, "epoch": 4263} {"train_loss": -7.079703330993652, "global_step": 179065, "epoch": 4263} {"train_loss": -7.16566276550293, "global_step": 179066, "epoch": 4263} {"train_loss": -7.134537696838379, "global_step": 179067, "epoch": 4263} {"train_loss": -7.155339241027832, "global_step": 179068, "epoch": 4263} {"train_loss": -7.173564434051514, "global_step": 179069, "epoch": 4263} {"train_loss": -6.9835991859436035, "global_step": 179070, "epoch": 4263} {"train_loss": -7.050149917602539, "global_step": 179071, "epoch": 4263} {"train_loss": -7.098738193511963, "global_step": 179072, "epoch": 4263} {"train_loss": -7.0938615798950195, "global_step": 179073, "epoch": 4263} {"train_loss": -7.111264228820801, "global_step": 179074, "epoch": 4263} {"train_loss": -7.019669532775879, "global_step": 179075, "epoch": 4263} {"train_loss": -7.0595293045043945, "global_step": 179076, "epoch": 4263} {"train_loss": -7.149480819702148, "global_step": 179077, "epoch": 4263} {"train_loss": -7.177874565124512, "global_step": 179078, "epoch": 4263} {"train_loss": -7.0826921463012695, "global_step": 179079, "epoch": 4263} {"train_loss": -7.12866735458374, "global_step": 179080, "epoch": 4263} {"train_loss": -7.089344501495361, "global_step": 179081, "epoch": 4263} {"train_loss": -7.082197189331055, "global_step": 179082, "epoch": 4263} {"train_loss": -7.1317362785339355, "global_step": 179083, "epoch": 4263} {"train_loss": -7.093877792358398, "global_step": 179084, "epoch": 4263} {"train_loss": -7.129540920257568, "global_step": 179085, "epoch": 4263} {"train_loss": -7.219963073730469, "global_step": 179086, "epoch": 4263} {"train_loss": -7.108843667166574, "global_step": 179087, "epoch": 4263, "val_loss": 69346.5} {"train_loss": -7.159111976623535, "global_step": 179088, "epoch": 4264} {"train_loss": -7.222877502441406, "global_step": 179089, "epoch": 4264} {"train_loss": -7.161880016326904, "global_step": 179090, "epoch": 4264} {"train_loss": -7.187230110168457, "global_step": 179091, "epoch": 4264} {"train_loss": -7.08604621887207, "global_step": 179092, "epoch": 4264} {"train_loss": -7.086517333984375, "global_step": 179093, "epoch": 4264} {"train_loss": -7.229681968688965, "global_step": 179094, "epoch": 4264} {"train_loss": -7.192902565002441, "global_step": 179095, "epoch": 4264} {"train_loss": -7.1616716384887695, "global_step": 179096, "epoch": 4264} {"train_loss": -7.2034196853637695, "global_step": 179097, "epoch": 4264} {"train_loss": -7.152313232421875, "global_step": 179098, "epoch": 4264} {"train_loss": -7.146918296813965, "global_step": 179099, "epoch": 4264} {"train_loss": -7.125608444213867, "global_step": 179100, "epoch": 4264} {"train_loss": -7.241703033447266, "global_step": 179101, "epoch": 4264} {"train_loss": -7.120322227478027, "global_step": 179102, "epoch": 4264} {"train_loss": -7.096187591552734, "global_step": 179103, "epoch": 4264} {"train_loss": -7.056571960449219, "global_step": 179104, "epoch": 4264} {"train_loss": -7.082616806030273, "global_step": 179105, "epoch": 4264} {"train_loss": -7.1195526123046875, "global_step": 179106, "epoch": 4264} {"train_loss": -7.100833892822266, "global_step": 179107, "epoch": 4264} {"train_loss": -7.094815254211426, "global_step": 179108, "epoch": 4264} {"train_loss": -7.0809736251831055, "global_step": 179109, "epoch": 4264} {"train_loss": -7.2393622398376465, "global_step": 179110, "epoch": 4264} {"train_loss": -7.057185173034668, "global_step": 179111, "epoch": 4264} {"train_loss": -7.272554397583008, "global_step": 179112, "epoch": 4264} {"train_loss": -7.105817794799805, "global_step": 179113, "epoch": 4264} {"train_loss": -7.108311653137207, "global_step": 179114, "epoch": 4264} {"train_loss": -7.133342742919922, "global_step": 179115, "epoch": 4264} {"train_loss": -7.161352634429932, "global_step": 179116, "epoch": 4264} {"train_loss": -7.219037055969238, "global_step": 179117, "epoch": 4264} {"train_loss": -7.103961944580078, "global_step": 179118, "epoch": 4264} {"train_loss": -7.016449451446533, "global_step": 179119, "epoch": 4264} {"train_loss": -7.127922058105469, "global_step": 179120, "epoch": 4264} {"train_loss": -7.182622909545898, "global_step": 179121, "epoch": 4264} {"train_loss": -7.182831764221191, "global_step": 179122, "epoch": 4264} {"train_loss": -7.120702743530273, "global_step": 179123, "epoch": 4264} {"train_loss": -7.1190996170043945, "global_step": 179124, "epoch": 4264} {"train_loss": -7.129802703857422, "global_step": 179125, "epoch": 4264} {"train_loss": -7.2004899978637695, "global_step": 179126, "epoch": 4264} {"train_loss": -7.187849044799805, "global_step": 179127, "epoch": 4264} {"train_loss": -6.977311134338379, "global_step": 179128, "epoch": 4264} {"train_loss": -7.141207649594262, "global_step": 179129, "epoch": 4264, "val_loss": 69292.5703125} {"train_loss": -7.083061218261719, "global_step": 179130, "epoch": 4265} {"train_loss": -7.094181537628174, "global_step": 179131, "epoch": 4265} {"train_loss": -7.075187683105469, "global_step": 179132, "epoch": 4265} {"train_loss": -7.103795051574707, "global_step": 179133, "epoch": 4265} {"train_loss": -7.133919715881348, "global_step": 179134, "epoch": 4265} {"train_loss": -7.27618932723999, "global_step": 179135, "epoch": 4265} {"train_loss": -7.07606315612793, "global_step": 179136, "epoch": 4265} {"train_loss": -7.0730133056640625, "global_step": 179137, "epoch": 4265} {"train_loss": -7.160576820373535, "global_step": 179138, "epoch": 4265} {"train_loss": -7.157571792602539, "global_step": 179139, "epoch": 4265} {"train_loss": -7.076915740966797, "global_step": 179140, "epoch": 4265} {"train_loss": -7.093958854675293, "global_step": 179141, "epoch": 4265} {"train_loss": -7.040748596191406, "global_step": 179142, "epoch": 4265} {"train_loss": -7.023155689239502, "global_step": 179143, "epoch": 4265} {"train_loss": -7.053005695343018, "global_step": 179144, "epoch": 4265} {"train_loss": -7.187198162078857, "global_step": 179145, "epoch": 4265} {"train_loss": -7.179058074951172, "global_step": 179146, "epoch": 4265} {"train_loss": -7.093196868896484, "global_step": 179147, "epoch": 4265} {"train_loss": -7.185007572174072, "global_step": 179148, "epoch": 4265} {"train_loss": -7.0910115242004395, "global_step": 179149, "epoch": 4265} {"train_loss": -7.158450126647949, "global_step": 179150, "epoch": 4265} {"train_loss": -7.021280288696289, "global_step": 179151, "epoch": 4265} {"train_loss": -7.1346354484558105, "global_step": 179152, "epoch": 4265} {"train_loss": -7.121776103973389, "global_step": 179153, "epoch": 4265} {"train_loss": -7.06578254699707, "global_step": 179154, "epoch": 4265} {"train_loss": -7.116739273071289, "global_step": 179155, "epoch": 4265} {"train_loss": -7.205539226531982, "global_step": 179156, "epoch": 4265} {"train_loss": -7.071134567260742, "global_step": 179157, "epoch": 4265} {"train_loss": -7.155594825744629, "global_step": 179158, "epoch": 4265} {"train_loss": -7.057881832122803, "global_step": 179159, "epoch": 4265} {"train_loss": -7.129427909851074, "global_step": 179160, "epoch": 4265} {"train_loss": -7.085208415985107, "global_step": 179161, "epoch": 4265} {"train_loss": -7.043770790100098, "global_step": 179162, "epoch": 4265} {"train_loss": -7.041034698486328, "global_step": 179163, "epoch": 4265} {"train_loss": -7.0196733474731445, "global_step": 179164, "epoch": 4265} {"train_loss": -7.041518688201904, "global_step": 179165, "epoch": 4265} {"train_loss": -6.814723968505859, "global_step": 179166, "epoch": 4265} {"train_loss": -6.9805450439453125, "global_step": 179167, "epoch": 4265} {"train_loss": -7.102924346923828, "global_step": 179168, "epoch": 4265} {"train_loss": -6.999595642089844, "global_step": 179169, "epoch": 4265} {"train_loss": -7.139581203460693, "global_step": 179170, "epoch": 4265} {"train_loss": -7.086751268023536, "global_step": 179171, "epoch": 4265, "val_loss": 69473.390625} {"train_loss": -7.067153453826904, "global_step": 179172, "epoch": 4266} {"train_loss": -7.047954082489014, "global_step": 179173, "epoch": 4266} {"train_loss": -6.999263286590576, "global_step": 179174, "epoch": 4266} {"train_loss": -7.100536823272705, "global_step": 179175, "epoch": 4266} {"train_loss": -7.069660663604736, "global_step": 179176, "epoch": 4266} {"train_loss": -6.985770225524902, "global_step": 179177, "epoch": 4266} {"train_loss": -7.121824264526367, "global_step": 179178, "epoch": 4266} {"train_loss": -7.08408260345459, "global_step": 179179, "epoch": 4266} {"train_loss": -7.000866889953613, "global_step": 179180, "epoch": 4266} {"train_loss": -6.938859939575195, "global_step": 179181, "epoch": 4266} {"train_loss": -7.117169380187988, "global_step": 179182, "epoch": 4266} {"train_loss": -7.072257995605469, "global_step": 179183, "epoch": 4266} {"train_loss": -7.0584259033203125, "global_step": 179184, "epoch": 4266} {"train_loss": -7.0578107833862305, "global_step": 179185, "epoch": 4266} {"train_loss": -7.07739782333374, "global_step": 179186, "epoch": 4266} {"train_loss": -7.0874762535095215, "global_step": 179187, "epoch": 4266} {"train_loss": -7.079938888549805, "global_step": 179188, "epoch": 4266} {"train_loss": -7.030768871307373, "global_step": 179189, "epoch": 4266} {"train_loss": -7.019350051879883, "global_step": 179190, "epoch": 4266} {"train_loss": -7.1525983810424805, "global_step": 179191, "epoch": 4266} {"train_loss": -7.082705974578857, "global_step": 179192, "epoch": 4266} {"train_loss": -7.231224060058594, "global_step": 179193, "epoch": 4266} {"train_loss": -7.1212663650512695, "global_step": 179194, "epoch": 4266} {"train_loss": -7.112113952636719, "global_step": 179195, "epoch": 4266} {"train_loss": -7.144387245178223, "global_step": 179196, "epoch": 4266} {"train_loss": -7.1103105545043945, "global_step": 179197, "epoch": 4266} {"train_loss": -7.116741180419922, "global_step": 179198, "epoch": 4266} {"train_loss": -7.162517547607422, "global_step": 179199, "epoch": 4266} {"train_loss": -7.183189392089844, "global_step": 179200, "epoch": 4266} {"train_loss": -7.128493309020996, "global_step": 179201, "epoch": 4266} {"train_loss": -7.141711235046387, "global_step": 179202, "epoch": 4266} {"train_loss": -7.148592948913574, "global_step": 179203, "epoch": 4266} {"train_loss": -7.103923797607422, "global_step": 179204, "epoch": 4266} {"train_loss": -7.096532821655273, "global_step": 179205, "epoch": 4266} {"train_loss": -7.140185356140137, "global_step": 179206, "epoch": 4266} {"train_loss": -7.034625053405762, "global_step": 179207, "epoch": 4266} {"train_loss": -7.146234512329102, "global_step": 179208, "epoch": 4266} {"train_loss": -7.174469470977783, "global_step": 179209, "epoch": 4266} {"train_loss": -7.148687362670898, "global_step": 179210, "epoch": 4266} {"train_loss": -7.2144880294799805, "global_step": 179211, "epoch": 4266} {"train_loss": -7.142274856567383, "global_step": 179212, "epoch": 4266} {"train_loss": -7.100322484970093, "global_step": 179213, "epoch": 4266, "val_loss": 69400.6171875} {"train_loss": -7.1739373207092285, "global_step": 179214, "epoch": 4267} {"train_loss": -7.135284423828125, "global_step": 179215, "epoch": 4267} {"train_loss": -7.162425994873047, "global_step": 179216, "epoch": 4267} {"train_loss": -7.0572099685668945, "global_step": 179217, "epoch": 4267} {"train_loss": -7.125722885131836, "global_step": 179218, "epoch": 4267} {"train_loss": -7.099368095397949, "global_step": 179219, "epoch": 4267} {"train_loss": -7.1296491622924805, "global_step": 179220, "epoch": 4267} {"train_loss": -7.087650299072266, "global_step": 179221, "epoch": 4267} {"train_loss": -6.9158430099487305, "global_step": 179222, "epoch": 4267} {"train_loss": -6.9749345779418945, "global_step": 179223, "epoch": 4267} {"train_loss": -7.099308013916016, "global_step": 179224, "epoch": 4267} {"train_loss": -6.869064807891846, "global_step": 179225, "epoch": 4267} {"train_loss": -7.1669721603393555, "global_step": 179226, "epoch": 4267} {"train_loss": -7.143802642822266, "global_step": 179227, "epoch": 4267} {"train_loss": -7.154776096343994, "global_step": 179228, "epoch": 4267} {"train_loss": -7.1608381271362305, "global_step": 179229, "epoch": 4267} {"train_loss": -7.194068908691406, "global_step": 179230, "epoch": 4267} {"train_loss": -7.131258487701416, "global_step": 179231, "epoch": 4267} {"train_loss": -7.011142730712891, "global_step": 179232, "epoch": 4267} {"train_loss": -7.05013370513916, "global_step": 179233, "epoch": 4267} {"train_loss": -7.076549530029297, "global_step": 179234, "epoch": 4267} {"train_loss": -7.052104949951172, "global_step": 179235, "epoch": 4267} {"train_loss": -6.9767961502075195, "global_step": 179236, "epoch": 4267} {"train_loss": -7.095350742340088, "global_step": 179237, "epoch": 4267} {"train_loss": -6.956219673156738, "global_step": 179238, "epoch": 4267} {"train_loss": -6.901517868041992, "global_step": 179239, "epoch": 4267} {"train_loss": -7.061955451965332, "global_step": 179240, "epoch": 4267} {"train_loss": -7.04383659362793, "global_step": 179241, "epoch": 4267} {"train_loss": -7.08510684967041, "global_step": 179242, "epoch": 4267} {"train_loss": -7.080428123474121, "global_step": 179243, "epoch": 4267} {"train_loss": -7.065826416015625, "global_step": 179244, "epoch": 4267} {"train_loss": -7.077263832092285, "global_step": 179245, "epoch": 4267} {"train_loss": -6.975983619689941, "global_step": 179246, "epoch": 4267} {"train_loss": -6.961480617523193, "global_step": 179247, "epoch": 4267} {"train_loss": -7.134777069091797, "global_step": 179248, "epoch": 4267} {"train_loss": -7.059086322784424, "global_step": 179249, "epoch": 4267} {"train_loss": -7.060583114624023, "global_step": 179250, "epoch": 4267} {"train_loss": -7.0783233642578125, "global_step": 179251, "epoch": 4267} {"train_loss": -7.0300140380859375, "global_step": 179252, "epoch": 4267} {"train_loss": -7.052297115325928, "global_step": 179253, "epoch": 4267} {"train_loss": -6.926468372344971, "global_step": 179254, "epoch": 4267} {"train_loss": -7.0634019147782094, "global_step": 179255, "epoch": 4267, "val_loss": 69258.3046875} {"train_loss": -7.015882968902588, "global_step": 179256, "epoch": 4268} {"train_loss": -7.12747049331665, "global_step": 179257, "epoch": 4268} {"train_loss": -6.974686145782471, "global_step": 179258, "epoch": 4268} {"train_loss": -7.12385892868042, "global_step": 179259, "epoch": 4268} {"train_loss": -7.082829475402832, "global_step": 179260, "epoch": 4268} {"train_loss": -7.0849761962890625, "global_step": 179261, "epoch": 4268} {"train_loss": -7.0966997146606445, "global_step": 179262, "epoch": 4268} {"train_loss": -7.20643424987793, "global_step": 179263, "epoch": 4268} {"train_loss": -6.950427055358887, "global_step": 179264, "epoch": 4268} {"train_loss": -7.197749137878418, "global_step": 179265, "epoch": 4268} {"train_loss": -7.083044052124023, "global_step": 179266, "epoch": 4268} {"train_loss": -6.933028697967529, "global_step": 179267, "epoch": 4268} {"train_loss": -7.232314109802246, "global_step": 179268, "epoch": 4268} {"train_loss": -7.10775089263916, "global_step": 179269, "epoch": 4268} {"train_loss": -7.201018810272217, "global_step": 179270, "epoch": 4268} {"train_loss": -7.018625736236572, "global_step": 179271, "epoch": 4268} {"train_loss": -7.1935319900512695, "global_step": 179272, "epoch": 4268} {"train_loss": -7.199344635009766, "global_step": 179273, "epoch": 4268} {"train_loss": -7.142335891723633, "global_step": 179274, "epoch": 4268} {"train_loss": -7.139670372009277, "global_step": 179275, "epoch": 4268} {"train_loss": -7.132785797119141, "global_step": 179276, "epoch": 4268} {"train_loss": -7.120403289794922, "global_step": 179277, "epoch": 4268} {"train_loss": -7.062450408935547, "global_step": 179278, "epoch": 4268} {"train_loss": -7.101302146911621, "global_step": 179279, "epoch": 4268} {"train_loss": -7.07688045501709, "global_step": 179280, "epoch": 4268} {"train_loss": -7.0004682540893555, "global_step": 179281, "epoch": 4268} {"train_loss": -7.0557661056518555, "global_step": 179282, "epoch": 4268} {"train_loss": -7.197585105895996, "global_step": 179283, "epoch": 4268} {"train_loss": -7.102123260498047, "global_step": 179284, "epoch": 4268} {"train_loss": -7.145451545715332, "global_step": 179285, "epoch": 4268} {"train_loss": -7.110197067260742, "global_step": 179286, "epoch": 4268} {"train_loss": -7.023349761962891, "global_step": 179287, "epoch": 4268} {"train_loss": -7.17891263961792, "global_step": 179288, "epoch": 4268} {"train_loss": -7.09090518951416, "global_step": 179289, "epoch": 4268} {"train_loss": -7.116375923156738, "global_step": 179290, "epoch": 4268} {"train_loss": -7.082712650299072, "global_step": 179291, "epoch": 4268} {"train_loss": -7.133325576782227, "global_step": 179292, "epoch": 4268} {"train_loss": -7.158747673034668, "global_step": 179293, "epoch": 4268} {"train_loss": -7.106019020080566, "global_step": 179294, "epoch": 4268} {"train_loss": -7.109724998474121, "global_step": 179295, "epoch": 4268} {"train_loss": -7.124947547912598, "global_step": 179296, "epoch": 4268} {"train_loss": -7.1055155254545665, "global_step": 179297, "epoch": 4268, "val_loss": 69169.8203125} {"train_loss": -7.159481048583984, "global_step": 179298, "epoch": 4269} {"train_loss": -7.178555488586426, "global_step": 179299, "epoch": 4269} {"train_loss": -7.129504203796387, "global_step": 179300, "epoch": 4269} {"train_loss": -7.090605735778809, "global_step": 179301, "epoch": 4269} {"train_loss": -7.203108787536621, "global_step": 179302, "epoch": 4269} {"train_loss": -7.1510772705078125, "global_step": 179303, "epoch": 4269} {"train_loss": -7.159369468688965, "global_step": 179304, "epoch": 4269} {"train_loss": -7.146017074584961, "global_step": 179305, "epoch": 4269} {"train_loss": -7.104545593261719, "global_step": 179306, "epoch": 4269} {"train_loss": -7.121892929077148, "global_step": 179307, "epoch": 4269} {"train_loss": -7.191672325134277, "global_step": 179308, "epoch": 4269} {"train_loss": -7.123826026916504, "global_step": 179309, "epoch": 4269} {"train_loss": -7.124141693115234, "global_step": 179310, "epoch": 4269} {"train_loss": -7.087068557739258, "global_step": 179311, "epoch": 4269} {"train_loss": -7.118922233581543, "global_step": 179312, "epoch": 4269} {"train_loss": -7.215843200683594, "global_step": 179313, "epoch": 4269} {"train_loss": -7.164926528930664, "global_step": 179314, "epoch": 4269} {"train_loss": -7.096375465393066, "global_step": 179315, "epoch": 4269} {"train_loss": -7.115521430969238, "global_step": 179316, "epoch": 4269} {"train_loss": -7.125643253326416, "global_step": 179317, "epoch": 4269} {"train_loss": -7.1693878173828125, "global_step": 179318, "epoch": 4269} {"train_loss": -7.169862270355225, "global_step": 179319, "epoch": 4269} {"train_loss": -7.225783348083496, "global_step": 179320, "epoch": 4269} {"train_loss": -7.196284770965576, "global_step": 179321, "epoch": 4269} {"train_loss": -7.125453948974609, "global_step": 179322, "epoch": 4269} {"train_loss": -7.1742963790893555, "global_step": 179323, "epoch": 4269} {"train_loss": -7.227378845214844, "global_step": 179324, "epoch": 4269} {"train_loss": -7.17413330078125, "global_step": 179325, "epoch": 4269} {"train_loss": -7.0029215812683105, "global_step": 179326, "epoch": 4269} {"train_loss": -7.181350231170654, "global_step": 179327, "epoch": 4269} {"train_loss": -7.2574639320373535, "global_step": 179328, "epoch": 4269} {"train_loss": -7.088384628295898, "global_step": 179329, "epoch": 4269} {"train_loss": -7.1444244384765625, "global_step": 179330, "epoch": 4269} {"train_loss": -7.190301418304443, "global_step": 179331, "epoch": 4269} {"train_loss": -7.080303192138672, "global_step": 179332, "epoch": 4269} {"train_loss": -7.193438529968262, "global_step": 179333, "epoch": 4269} {"train_loss": -7.246772766113281, "global_step": 179334, "epoch": 4269} {"train_loss": -7.125863075256348, "global_step": 179335, "epoch": 4269} {"train_loss": -7.17021369934082, "global_step": 179336, "epoch": 4269} {"train_loss": -7.126581192016602, "global_step": 179337, "epoch": 4269} {"train_loss": -7.098528861999512, "global_step": 179338, "epoch": 4269} {"train_loss": -7.150192862465268, "global_step": 179339, "epoch": 4269, "val_loss": 69185.4296875} {"train_loss": -7.172971248626709, "global_step": 179340, "epoch": 4270} {"train_loss": -7.1372880935668945, "global_step": 179341, "epoch": 4270} {"train_loss": -7.110781669616699, "global_step": 179342, "epoch": 4270} {"train_loss": -7.119612216949463, "global_step": 179343, "epoch": 4270} {"train_loss": -7.0616135597229, "global_step": 179344, "epoch": 4270} {"train_loss": -6.890983581542969, "global_step": 179345, "epoch": 4270} {"train_loss": -7.003609657287598, "global_step": 179346, "epoch": 4270} {"train_loss": -7.136908054351807, "global_step": 179347, "epoch": 4270} {"train_loss": -7.038863182067871, "global_step": 179348, "epoch": 4270} {"train_loss": -7.156648635864258, "global_step": 179349, "epoch": 4270} {"train_loss": -7.047950744628906, "global_step": 179350, "epoch": 4270} {"train_loss": -6.853125095367432, "global_step": 179351, "epoch": 4270} {"train_loss": -6.956617832183838, "global_step": 179352, "epoch": 4270} {"train_loss": -7.0211687088012695, "global_step": 179353, "epoch": 4270} {"train_loss": -6.838752746582031, "global_step": 179354, "epoch": 4270} {"train_loss": -7.078039169311523, "global_step": 179355, "epoch": 4270} {"train_loss": -6.901444435119629, "global_step": 179356, "epoch": 4270} {"train_loss": -6.992378234863281, "global_step": 179357, "epoch": 4270} {"train_loss": -6.96461296081543, "global_step": 179358, "epoch": 4270} {"train_loss": -6.963352203369141, "global_step": 179359, "epoch": 4270} {"train_loss": -6.9507904052734375, "global_step": 179360, "epoch": 4270} {"train_loss": -6.963218688964844, "global_step": 179361, "epoch": 4270} {"train_loss": -7.04253625869751, "global_step": 179362, "epoch": 4270} {"train_loss": -7.053343296051025, "global_step": 179363, "epoch": 4270} {"train_loss": -7.008726596832275, "global_step": 179364, "epoch": 4270} {"train_loss": -7.063531875610352, "global_step": 179365, "epoch": 4270} {"train_loss": -7.045577526092529, "global_step": 179366, "epoch": 4270} {"train_loss": -6.9990553855896, "global_step": 179367, "epoch": 4270} {"train_loss": -7.052855968475342, "global_step": 179368, "epoch": 4270} {"train_loss": -7.030801773071289, "global_step": 179369, "epoch": 4270} {"train_loss": -7.037599563598633, "global_step": 179370, "epoch": 4270} {"train_loss": -7.042884349822998, "global_step": 179371, "epoch": 4270} {"train_loss": -6.96002197265625, "global_step": 179372, "epoch": 4270} {"train_loss": -6.981370449066162, "global_step": 179373, "epoch": 4270} {"train_loss": -7.118176460266113, "global_step": 179374, "epoch": 4270} {"train_loss": -6.9510650634765625, "global_step": 179375, "epoch": 4270} {"train_loss": -7.057977676391602, "global_step": 179376, "epoch": 4270} {"train_loss": -7.071016788482666, "global_step": 179377, "epoch": 4270} {"train_loss": -7.117817401885986, "global_step": 179378, "epoch": 4270} {"train_loss": -7.011161804199219, "global_step": 179379, "epoch": 4270} {"train_loss": -7.181364059448242, "global_step": 179380, "epoch": 4270} {"train_loss": -7.026886758350191, "global_step": 179381, "epoch": 4270, "val_loss": 69305.9375} {"train_loss": -6.998183727264404, "global_step": 179382, "epoch": 4271} {"train_loss": -7.026715278625488, "global_step": 179383, "epoch": 4271} {"train_loss": -7.121180057525635, "global_step": 179384, "epoch": 4271} {"train_loss": -7.143914222717285, "global_step": 179385, "epoch": 4271} {"train_loss": -7.009941577911377, "global_step": 179386, "epoch": 4271} {"train_loss": -7.057978630065918, "global_step": 179387, "epoch": 4271} {"train_loss": -7.040961265563965, "global_step": 179388, "epoch": 4271} {"train_loss": -7.097403526306152, "global_step": 179389, "epoch": 4271} {"train_loss": -7.147175312042236, "global_step": 179390, "epoch": 4271} {"train_loss": -7.226472854614258, "global_step": 179391, "epoch": 4271} {"train_loss": -7.141942024230957, "global_step": 179392, "epoch": 4271} {"train_loss": -7.09749698638916, "global_step": 179393, "epoch": 4271} {"train_loss": -7.168137073516846, "global_step": 179394, "epoch": 4271} {"train_loss": -7.137093544006348, "global_step": 179395, "epoch": 4271} {"train_loss": -7.180264949798584, "global_step": 179396, "epoch": 4271} {"train_loss": -7.070539474487305, "global_step": 179397, "epoch": 4271} {"train_loss": -7.196104049682617, "global_step": 179398, "epoch": 4271} {"train_loss": -7.269926071166992, "global_step": 179399, "epoch": 4271} {"train_loss": -7.031574249267578, "global_step": 179400, "epoch": 4271} {"train_loss": -7.091261863708496, "global_step": 179401, "epoch": 4271} {"train_loss": -7.2368268966674805, "global_step": 179402, "epoch": 4271} {"train_loss": -7.048702239990234, "global_step": 179403, "epoch": 4271} {"train_loss": -7.107302665710449, "global_step": 179404, "epoch": 4271} {"train_loss": -7.18094539642334, "global_step": 179405, "epoch": 4271} {"train_loss": -7.077576637268066, "global_step": 179406, "epoch": 4271} {"train_loss": -7.13841438293457, "global_step": 179407, "epoch": 4271} {"train_loss": -7.153111457824707, "global_step": 179408, "epoch": 4271} {"train_loss": -7.207790374755859, "global_step": 179409, "epoch": 4271} {"train_loss": -7.204673767089844, "global_step": 179410, "epoch": 4271} {"train_loss": -7.171915531158447, "global_step": 179411, "epoch": 4271} {"train_loss": -7.225826263427734, "global_step": 179412, "epoch": 4271} {"train_loss": -7.000452995300293, "global_step": 179413, "epoch": 4271} {"train_loss": -6.933410167694092, "global_step": 179414, "epoch": 4271} {"train_loss": -7.1119890213012695, "global_step": 179415, "epoch": 4271} {"train_loss": -7.071065902709961, "global_step": 179416, "epoch": 4271} {"train_loss": -7.0826416015625, "global_step": 179417, "epoch": 4271} {"train_loss": -7.058248519897461, "global_step": 179418, "epoch": 4271} {"train_loss": -7.157972812652588, "global_step": 179419, "epoch": 4271} {"train_loss": -6.98392391204834, "global_step": 179420, "epoch": 4271} {"train_loss": -7.207245349884033, "global_step": 179421, "epoch": 4271} {"train_loss": -7.119990348815918, "global_step": 179422, "epoch": 4271} {"train_loss": -7.114092281886509, "global_step": 179423, "epoch": 4271, "val_loss": 69293.4921875} {"train_loss": -7.156987190246582, "global_step": 179424, "epoch": 4272} {"train_loss": -7.027478218078613, "global_step": 179425, "epoch": 4272} {"train_loss": -7.136557579040527, "global_step": 179426, "epoch": 4272} {"train_loss": -7.094940662384033, "global_step": 179427, "epoch": 4272} {"train_loss": -7.085738658905029, "global_step": 179428, "epoch": 4272} {"train_loss": -7.095619201660156, "global_step": 179429, "epoch": 4272} {"train_loss": -7.042363166809082, "global_step": 179430, "epoch": 4272} {"train_loss": -7.048079490661621, "global_step": 179431, "epoch": 4272} {"train_loss": -6.956977844238281, "global_step": 179432, "epoch": 4272} {"train_loss": -7.04611873626709, "global_step": 179433, "epoch": 4272} {"train_loss": -6.976280689239502, "global_step": 179434, "epoch": 4272} {"train_loss": -7.050873756408691, "global_step": 179435, "epoch": 4272} {"train_loss": -7.190274715423584, "global_step": 179436, "epoch": 4272} {"train_loss": -7.045654296875, "global_step": 179437, "epoch": 4272} {"train_loss": -7.0700883865356445, "global_step": 179438, "epoch": 4272} {"train_loss": -7.077598571777344, "global_step": 179439, "epoch": 4272} {"train_loss": -7.032918930053711, "global_step": 179440, "epoch": 4272} {"train_loss": -7.028142929077148, "global_step": 179441, "epoch": 4272} {"train_loss": -7.181160926818848, "global_step": 179442, "epoch": 4272} {"train_loss": -7.076350212097168, "global_step": 179443, "epoch": 4272} {"train_loss": -7.194411754608154, "global_step": 179444, "epoch": 4272} {"train_loss": -7.076175212860107, "global_step": 179445, "epoch": 4272} {"train_loss": -7.10396671295166, "global_step": 179446, "epoch": 4272} {"train_loss": -7.121546268463135, "global_step": 179447, "epoch": 4272} {"train_loss": -7.097237586975098, "global_step": 179448, "epoch": 4272} {"train_loss": -7.137394428253174, "global_step": 179449, "epoch": 4272} {"train_loss": -7.143987655639648, "global_step": 179450, "epoch": 4272} {"train_loss": -7.127995491027832, "global_step": 179451, "epoch": 4272} {"train_loss": -7.034905433654785, "global_step": 179452, "epoch": 4272} {"train_loss": -7.096132755279541, "global_step": 179453, "epoch": 4272} {"train_loss": -7.159350872039795, "global_step": 179454, "epoch": 4272} {"train_loss": -7.046449661254883, "global_step": 179455, "epoch": 4272} {"train_loss": -6.993376731872559, "global_step": 179456, "epoch": 4272} {"train_loss": -7.132524490356445, "global_step": 179457, "epoch": 4272} {"train_loss": -7.040444374084473, "global_step": 179458, "epoch": 4272} {"train_loss": -7.0239362716674805, "global_step": 179459, "epoch": 4272} {"train_loss": -7.056301593780518, "global_step": 179460, "epoch": 4272} {"train_loss": -7.057589054107666, "global_step": 179461, "epoch": 4272} {"train_loss": -7.083636283874512, "global_step": 179462, "epoch": 4272} {"train_loss": -7.069914817810059, "global_step": 179463, "epoch": 4272} {"train_loss": -7.165273189544678, "global_step": 179464, "epoch": 4272} {"train_loss": -7.082768644605364, "global_step": 179465, "epoch": 4272, "val_loss": 69394.1015625} {"train_loss": -7.26803731918335, "global_step": 179466, "epoch": 4273} {"train_loss": -6.962590217590332, "global_step": 179467, "epoch": 4273} {"train_loss": -7.146371841430664, "global_step": 179468, "epoch": 4273} {"train_loss": -6.904836654663086, "global_step": 179469, "epoch": 4273} {"train_loss": -6.842299461364746, "global_step": 179470, "epoch": 4273} {"train_loss": -7.019817352294922, "global_step": 179471, "epoch": 4273} {"train_loss": -6.971424102783203, "global_step": 179472, "epoch": 4273} {"train_loss": -7.048118591308594, "global_step": 179473, "epoch": 4273} {"train_loss": -6.954648971557617, "global_step": 179474, "epoch": 4273} {"train_loss": -6.985963344573975, "global_step": 179475, "epoch": 4273} {"train_loss": -7.010721206665039, "global_step": 179476, "epoch": 4273} {"train_loss": -6.993623733520508, "global_step": 179477, "epoch": 4273} {"train_loss": -6.933802604675293, "global_step": 179478, "epoch": 4273} {"train_loss": -7.13947057723999, "global_step": 179479, "epoch": 4273} {"train_loss": -7.061408519744873, "global_step": 179480, "epoch": 4273} {"train_loss": -7.08812141418457, "global_step": 179481, "epoch": 4273} {"train_loss": -7.086991310119629, "global_step": 179482, "epoch": 4273} {"train_loss": -6.964600086212158, "global_step": 179483, "epoch": 4273} {"train_loss": -7.039841651916504, "global_step": 179484, "epoch": 4273} {"train_loss": -7.089883804321289, "global_step": 179485, "epoch": 4273} {"train_loss": -7.017266750335693, "global_step": 179486, "epoch": 4273} {"train_loss": -7.0195794105529785, "global_step": 179487, "epoch": 4273} {"train_loss": -7.021602630615234, "global_step": 179488, "epoch": 4273} {"train_loss": -7.07092809677124, "global_step": 179489, "epoch": 4273} {"train_loss": -7.084989070892334, "global_step": 179490, "epoch": 4273} {"train_loss": -7.030594825744629, "global_step": 179491, "epoch": 4273} {"train_loss": -7.05698299407959, "global_step": 179492, "epoch": 4273} {"train_loss": -7.0314860343933105, "global_step": 179493, "epoch": 4273} {"train_loss": -6.875178337097168, "global_step": 179494, "epoch": 4273} {"train_loss": -7.216575622558594, "global_step": 179495, "epoch": 4273} {"train_loss": -6.91252326965332, "global_step": 179496, "epoch": 4273} {"train_loss": -7.03460693359375, "global_step": 179497, "epoch": 4273} {"train_loss": -7.1213250160217285, "global_step": 179498, "epoch": 4273} {"train_loss": -7.16061544418335, "global_step": 179499, "epoch": 4273} {"train_loss": -7.0429277420043945, "global_step": 179500, "epoch": 4273} {"train_loss": -7.017855644226074, "global_step": 179501, "epoch": 4273} {"train_loss": -7.205099582672119, "global_step": 179502, "epoch": 4273} {"train_loss": -7.127777099609375, "global_step": 179503, "epoch": 4273} {"train_loss": -7.143617630004883, "global_step": 179504, "epoch": 4273} {"train_loss": -7.144827842712402, "global_step": 179505, "epoch": 4273} {"train_loss": -7.076650619506836, "global_step": 179506, "epoch": 4273} {"train_loss": -7.046725942974999, "global_step": 179507, "epoch": 4273, "val_loss": 69247.984375} {"train_loss": -7.219791412353516, "global_step": 179508, "epoch": 4274} {"train_loss": -7.214257717132568, "global_step": 179509, "epoch": 4274} {"train_loss": -7.226183891296387, "global_step": 179510, "epoch": 4274} {"train_loss": -7.17247200012207, "global_step": 179511, "epoch": 4274} {"train_loss": -7.174437522888184, "global_step": 179512, "epoch": 4274} {"train_loss": -7.132833957672119, "global_step": 179513, "epoch": 4274} {"train_loss": -7.130288124084473, "global_step": 179514, "epoch": 4274} {"train_loss": -7.165412902832031, "global_step": 179515, "epoch": 4274} {"train_loss": -7.133005142211914, "global_step": 179516, "epoch": 4274} {"train_loss": -7.211302757263184, "global_step": 179517, "epoch": 4274} {"train_loss": -7.114312648773193, "global_step": 179518, "epoch": 4274} {"train_loss": -7.239140510559082, "global_step": 179519, "epoch": 4274} {"train_loss": -7.090598106384277, "global_step": 179520, "epoch": 4274} {"train_loss": -7.162649154663086, "global_step": 179521, "epoch": 4274} {"train_loss": -7.229691505432129, "global_step": 179522, "epoch": 4274} {"train_loss": -7.119878768920898, "global_step": 179523, "epoch": 4274} {"train_loss": -7.052551746368408, "global_step": 179524, "epoch": 4274} {"train_loss": -7.144837379455566, "global_step": 179525, "epoch": 4274} {"train_loss": -7.117351531982422, "global_step": 179526, "epoch": 4274} {"train_loss": -7.127956390380859, "global_step": 179527, "epoch": 4274} {"train_loss": -7.087169647216797, "global_step": 179528, "epoch": 4274} {"train_loss": -7.072965621948242, "global_step": 179529, "epoch": 4274} {"train_loss": -7.228443145751953, "global_step": 179530, "epoch": 4274} {"train_loss": -7.162334442138672, "global_step": 179531, "epoch": 4274} {"train_loss": -7.089326858520508, "global_step": 179532, "epoch": 4274} {"train_loss": -7.074619293212891, "global_step": 179533, "epoch": 4274} {"train_loss": -7.092465400695801, "global_step": 179534, "epoch": 4274} {"train_loss": -7.198301315307617, "global_step": 179535, "epoch": 4274} {"train_loss": -7.116052627563477, "global_step": 179536, "epoch": 4274} {"train_loss": -7.159931182861328, "global_step": 179537, "epoch": 4274} {"train_loss": -7.124224662780762, "global_step": 179538, "epoch": 4274} {"train_loss": -7.107194423675537, "global_step": 179539, "epoch": 4274} {"train_loss": -6.984705448150635, "global_step": 179540, "epoch": 4274} {"train_loss": -7.0520477294921875, "global_step": 179541, "epoch": 4274} {"train_loss": -7.01677131652832, "global_step": 179542, "epoch": 4274} {"train_loss": -6.91536808013916, "global_step": 179543, "epoch": 4274} {"train_loss": -7.189126491546631, "global_step": 179544, "epoch": 4274} {"train_loss": -7.0746917724609375, "global_step": 179545, "epoch": 4274} {"train_loss": -7.139524459838867, "global_step": 179546, "epoch": 4274} {"train_loss": -7.148866653442383, "global_step": 179547, "epoch": 4274} {"train_loss": -7.086225509643555, "global_step": 179548, "epoch": 4274} {"train_loss": -7.126513640085856, "global_step": 179549, "epoch": 4274, "val_loss": 69279.3671875} {"train_loss": -7.149960517883301, "global_step": 179550, "epoch": 4275} {"train_loss": -7.0566816329956055, "global_step": 179551, "epoch": 4275} {"train_loss": -7.163250923156738, "global_step": 179552, "epoch": 4275} {"train_loss": -7.116446495056152, "global_step": 179553, "epoch": 4275} {"train_loss": -6.936769962310791, "global_step": 179554, "epoch": 4275} {"train_loss": -7.207761764526367, "global_step": 179555, "epoch": 4275} {"train_loss": -7.133269309997559, "global_step": 179556, "epoch": 4275} {"train_loss": -7.031119346618652, "global_step": 179557, "epoch": 4275} {"train_loss": -7.212057113647461, "global_step": 179558, "epoch": 4275} {"train_loss": -7.031650066375732, "global_step": 179559, "epoch": 4275} {"train_loss": -7.114419937133789, "global_step": 179560, "epoch": 4275} {"train_loss": -7.187745094299316, "global_step": 179561, "epoch": 4275} {"train_loss": -7.096917152404785, "global_step": 179562, "epoch": 4275} {"train_loss": -7.09352970123291, "global_step": 179563, "epoch": 4275} {"train_loss": -7.075168132781982, "global_step": 179564, "epoch": 4275} {"train_loss": -7.246818542480469, "global_step": 179565, "epoch": 4275} {"train_loss": -7.161086082458496, "global_step": 179566, "epoch": 4275} {"train_loss": -7.151793956756592, "global_step": 179567, "epoch": 4275} {"train_loss": -7.15477991104126, "global_step": 179568, "epoch": 4275} {"train_loss": -7.036111354827881, "global_step": 179569, "epoch": 4275} {"train_loss": -7.076790809631348, "global_step": 179570, "epoch": 4275} {"train_loss": -7.132964134216309, "global_step": 179571, "epoch": 4275} {"train_loss": -6.942892551422119, "global_step": 179572, "epoch": 4275} {"train_loss": -7.142431259155273, "global_step": 179573, "epoch": 4275} {"train_loss": -7.0718488693237305, "global_step": 179574, "epoch": 4275} {"train_loss": -6.970858097076416, "global_step": 179575, "epoch": 4275} {"train_loss": -6.975029945373535, "global_step": 179576, "epoch": 4275} {"train_loss": -7.042110443115234, "global_step": 179577, "epoch": 4275} {"train_loss": -6.924611568450928, "global_step": 179578, "epoch": 4275} {"train_loss": -7.030525207519531, "global_step": 179579, "epoch": 4275} {"train_loss": -7.004158973693848, "global_step": 179580, "epoch": 4275} {"train_loss": -6.957842826843262, "global_step": 179581, "epoch": 4275} {"train_loss": -7.039697647094727, "global_step": 179582, "epoch": 4275} {"train_loss": -7.047683238983154, "global_step": 179583, "epoch": 4275} {"train_loss": -7.090163230895996, "global_step": 179584, "epoch": 4275} {"train_loss": -7.097299575805664, "global_step": 179585, "epoch": 4275} {"train_loss": -7.042707920074463, "global_step": 179586, "epoch": 4275} {"train_loss": -7.085092544555664, "global_step": 179587, "epoch": 4275} {"train_loss": -7.0149407386779785, "global_step": 179588, "epoch": 4275} {"train_loss": -7.121466159820557, "global_step": 179589, "epoch": 4275} {"train_loss": -7.055666923522949, "global_step": 179590, "epoch": 4275} {"train_loss": -7.075893481572469, "global_step": 179591, "epoch": 4275, "val_loss": 69262.2734375} {"train_loss": -7.044998645782471, "global_step": 179592, "epoch": 4276} {"train_loss": -7.075016021728516, "global_step": 179593, "epoch": 4276} {"train_loss": -7.055018424987793, "global_step": 179594, "epoch": 4276} {"train_loss": -7.088597297668457, "global_step": 179595, "epoch": 4276} {"train_loss": -7.057906150817871, "global_step": 179596, "epoch": 4276} {"train_loss": -7.029733657836914, "global_step": 179597, "epoch": 4276} {"train_loss": -7.06131649017334, "global_step": 179598, "epoch": 4276} {"train_loss": -7.197518348693848, "global_step": 179599, "epoch": 4276} {"train_loss": -7.0228271484375, "global_step": 179600, "epoch": 4276} {"train_loss": -7.153260707855225, "global_step": 179601, "epoch": 4276} {"train_loss": -7.2480363845825195, "global_step": 179602, "epoch": 4276} {"train_loss": -7.107178688049316, "global_step": 179603, "epoch": 4276} {"train_loss": -7.161993980407715, "global_step": 179604, "epoch": 4276} {"train_loss": -7.090242385864258, "global_step": 179605, "epoch": 4276} {"train_loss": -7.091987133026123, "global_step": 179606, "epoch": 4276} {"train_loss": -7.134202003479004, "global_step": 179607, "epoch": 4276} {"train_loss": -7.160070419311523, "global_step": 179608, "epoch": 4276} {"train_loss": -7.086178779602051, "global_step": 179609, "epoch": 4276} {"train_loss": -7.210121154785156, "global_step": 179610, "epoch": 4276} {"train_loss": -7.061975479125977, "global_step": 179611, "epoch": 4276} {"train_loss": -7.154888153076172, "global_step": 179612, "epoch": 4276} {"train_loss": -7.212421894073486, "global_step": 179613, "epoch": 4276} {"train_loss": -7.016788482666016, "global_step": 179614, "epoch": 4276} {"train_loss": -7.223891258239746, "global_step": 179615, "epoch": 4276} {"train_loss": -7.072730541229248, "global_step": 179616, "epoch": 4276} {"train_loss": -7.16586971282959, "global_step": 179617, "epoch": 4276} {"train_loss": -7.089437961578369, "global_step": 179618, "epoch": 4276} {"train_loss": -7.049944877624512, "global_step": 179619, "epoch": 4276} {"train_loss": -7.118461608886719, "global_step": 179620, "epoch": 4276} {"train_loss": -7.218042373657227, "global_step": 179621, "epoch": 4276} {"train_loss": -7.032648086547852, "global_step": 179622, "epoch": 4276} {"train_loss": -7.013833045959473, "global_step": 179623, "epoch": 4276} {"train_loss": -7.129009246826172, "global_step": 179624, "epoch": 4276} {"train_loss": -7.046627044677734, "global_step": 179625, "epoch": 4276} {"train_loss": -7.139669418334961, "global_step": 179626, "epoch": 4276} {"train_loss": -7.1747002601623535, "global_step": 179627, "epoch": 4276} {"train_loss": -7.107542991638184, "global_step": 179628, "epoch": 4276} {"train_loss": -7.0403571128845215, "global_step": 179629, "epoch": 4276} {"train_loss": -7.031340599060059, "global_step": 179630, "epoch": 4276} {"train_loss": -7.015870094299316, "global_step": 179631, "epoch": 4276} {"train_loss": -6.951045036315918, "global_step": 179632, "epoch": 4276} {"train_loss": -7.103089752651396, "global_step": 179633, "epoch": 4276, "val_loss": 69316.828125} {"train_loss": -7.1547980308532715, "global_step": 179634, "epoch": 4277} {"train_loss": -7.124856472015381, "global_step": 179635, "epoch": 4277} {"train_loss": -7.092996597290039, "global_step": 179636, "epoch": 4277} {"train_loss": -7.120661735534668, "global_step": 179637, "epoch": 4277} {"train_loss": -7.0948052406311035, "global_step": 179638, "epoch": 4277} {"train_loss": -7.16333532333374, "global_step": 179639, "epoch": 4277} {"train_loss": -7.059127330780029, "global_step": 179640, "epoch": 4277} {"train_loss": -7.050861358642578, "global_step": 179641, "epoch": 4277} {"train_loss": -7.2301836013793945, "global_step": 179642, "epoch": 4277} {"train_loss": -7.0965189933776855, "global_step": 179643, "epoch": 4277} {"train_loss": -7.063311576843262, "global_step": 179644, "epoch": 4277} {"train_loss": -7.101038932800293, "global_step": 179645, "epoch": 4277} {"train_loss": -6.990522384643555, "global_step": 179646, "epoch": 4277} {"train_loss": -7.039572715759277, "global_step": 179647, "epoch": 4277} {"train_loss": -7.053070068359375, "global_step": 179648, "epoch": 4277} {"train_loss": -6.958585262298584, "global_step": 179649, "epoch": 4277} {"train_loss": -7.098827362060547, "global_step": 179650, "epoch": 4277} {"train_loss": -6.987618446350098, "global_step": 179651, "epoch": 4277} {"train_loss": -6.949723243713379, "global_step": 179652, "epoch": 4277} {"train_loss": -7.15714168548584, "global_step": 179653, "epoch": 4277} {"train_loss": -7.031894683837891, "global_step": 179654, "epoch": 4277} {"train_loss": -7.019438743591309, "global_step": 179655, "epoch": 4277} {"train_loss": -7.145289421081543, "global_step": 179656, "epoch": 4277} {"train_loss": -7.027996063232422, "global_step": 179657, "epoch": 4277} {"train_loss": -7.125792503356934, "global_step": 179658, "epoch": 4277} {"train_loss": -7.193213939666748, "global_step": 179659, "epoch": 4277} {"train_loss": -6.959160804748535, "global_step": 179660, "epoch": 4277} {"train_loss": -7.064723968505859, "global_step": 179661, "epoch": 4277} {"train_loss": -7.102977752685547, "global_step": 179662, "epoch": 4277} {"train_loss": -7.0970964431762695, "global_step": 179663, "epoch": 4277} {"train_loss": -7.151144027709961, "global_step": 179664, "epoch": 4277} {"train_loss": -7.162033557891846, "global_step": 179665, "epoch": 4277} {"train_loss": -7.077143669128418, "global_step": 179666, "epoch": 4277} {"train_loss": -7.228235244750977, "global_step": 179667, "epoch": 4277} {"train_loss": -7.151276111602783, "global_step": 179668, "epoch": 4277} {"train_loss": -7.206923961639404, "global_step": 179669, "epoch": 4277} {"train_loss": -7.112216472625732, "global_step": 179670, "epoch": 4277} {"train_loss": -7.213740825653076, "global_step": 179671, "epoch": 4277} {"train_loss": -7.175110340118408, "global_step": 179672, "epoch": 4277} {"train_loss": -7.115408897399902, "global_step": 179673, "epoch": 4277} {"train_loss": -7.205853462219238, "global_step": 179674, "epoch": 4277} {"train_loss": -7.1046439579554965, "global_step": 179675, "epoch": 4277, "val_loss": 69184.03125} {"train_loss": -7.149016380310059, "global_step": 179676, "epoch": 4278} {"train_loss": -7.10985803604126, "global_step": 179677, "epoch": 4278} {"train_loss": -7.146021842956543, "global_step": 179678, "epoch": 4278} {"train_loss": -6.978828430175781, "global_step": 179679, "epoch": 4278} {"train_loss": -7.273197650909424, "global_step": 179680, "epoch": 4278} {"train_loss": -7.140052318572998, "global_step": 179681, "epoch": 4278} {"train_loss": -7.112524032592773, "global_step": 179682, "epoch": 4278} {"train_loss": -7.250593185424805, "global_step": 179683, "epoch": 4278} {"train_loss": -7.204052925109863, "global_step": 179684, "epoch": 4278} {"train_loss": -7.103212356567383, "global_step": 179685, "epoch": 4278} {"train_loss": -7.0365214347839355, "global_step": 179686, "epoch": 4278} {"train_loss": -7.1017351150512695, "global_step": 179687, "epoch": 4278} {"train_loss": -6.915411949157715, "global_step": 179688, "epoch": 4278} {"train_loss": -7.1474199295043945, "global_step": 179689, "epoch": 4278} {"train_loss": -6.983933448791504, "global_step": 179690, "epoch": 4278} {"train_loss": -6.9292402267456055, "global_step": 179691, "epoch": 4278} {"train_loss": -7.182185173034668, "global_step": 179692, "epoch": 4278} {"train_loss": -6.899502754211426, "global_step": 179693, "epoch": 4278} {"train_loss": -7.111910820007324, "global_step": 179694, "epoch": 4278} {"train_loss": -7.095034122467041, "global_step": 179695, "epoch": 4278} {"train_loss": -6.963510990142822, "global_step": 179696, "epoch": 4278} {"train_loss": -7.169610977172852, "global_step": 179697, "epoch": 4278} {"train_loss": -7.1104021072387695, "global_step": 179698, "epoch": 4278} {"train_loss": -7.085731506347656, "global_step": 179699, "epoch": 4278} {"train_loss": -7.0241923332214355, "global_step": 179700, "epoch": 4278} {"train_loss": -7.12442684173584, "global_step": 179701, "epoch": 4278} {"train_loss": -7.054080963134766, "global_step": 179702, "epoch": 4278} {"train_loss": -7.110305309295654, "global_step": 179703, "epoch": 4278} {"train_loss": -7.125930309295654, "global_step": 179704, "epoch": 4278} {"train_loss": -7.213964462280273, "global_step": 179705, "epoch": 4278} {"train_loss": -7.034449577331543, "global_step": 179706, "epoch": 4278} {"train_loss": -6.9547038078308105, "global_step": 179707, "epoch": 4278} {"train_loss": -7.118438243865967, "global_step": 179708, "epoch": 4278} {"train_loss": -7.038332939147949, "global_step": 179709, "epoch": 4278} {"train_loss": -7.088596343994141, "global_step": 179710, "epoch": 4278} {"train_loss": -7.033225059509277, "global_step": 179711, "epoch": 4278} {"train_loss": -7.2165446281433105, "global_step": 179712, "epoch": 4278} {"train_loss": -7.070400238037109, "global_step": 179713, "epoch": 4278} {"train_loss": -7.053813457489014, "global_step": 179714, "epoch": 4278} {"train_loss": -7.119533538818359, "global_step": 179715, "epoch": 4278} {"train_loss": -7.034579753875732, "global_step": 179716, "epoch": 4278} {"train_loss": -7.087807235263643, "global_step": 179717, "epoch": 4278, "val_loss": 69417.21875} {"train_loss": -7.085937023162842, "global_step": 179718, "epoch": 4279} {"train_loss": -6.9584856033325195, "global_step": 179719, "epoch": 4279} {"train_loss": -7.061392784118652, "global_step": 179720, "epoch": 4279} {"train_loss": -6.950651168823242, "global_step": 179721, "epoch": 4279} {"train_loss": -7.052258491516113, "global_step": 179722, "epoch": 4279} {"train_loss": -7.042141914367676, "global_step": 179723, "epoch": 4279} {"train_loss": -6.942755699157715, "global_step": 179724, "epoch": 4279} {"train_loss": -7.237821578979492, "global_step": 179725, "epoch": 4279} {"train_loss": -7.026346206665039, "global_step": 179726, "epoch": 4279} {"train_loss": -7.087460517883301, "global_step": 179727, "epoch": 4279} {"train_loss": -7.1666669845581055, "global_step": 179728, "epoch": 4279} {"train_loss": -7.16245698928833, "global_step": 179729, "epoch": 4279} {"train_loss": -7.127763748168945, "global_step": 179730, "epoch": 4279} {"train_loss": -7.181011199951172, "global_step": 179731, "epoch": 4279} {"train_loss": -7.112270832061768, "global_step": 179732, "epoch": 4279} {"train_loss": -7.315522193908691, "global_step": 179733, "epoch": 4279} {"train_loss": -7.109985828399658, "global_step": 179734, "epoch": 4279} {"train_loss": -7.1046247482299805, "global_step": 179735, "epoch": 4279} {"train_loss": -7.197793483734131, "global_step": 179736, "epoch": 4279} {"train_loss": -7.1583662033081055, "global_step": 179737, "epoch": 4279} {"train_loss": -7.152543067932129, "global_step": 179738, "epoch": 4279} {"train_loss": -7.097502708435059, "global_step": 179739, "epoch": 4279} {"train_loss": -7.178267955780029, "global_step": 179740, "epoch": 4279} {"train_loss": -7.136170387268066, "global_step": 179741, "epoch": 4279} {"train_loss": -7.146681308746338, "global_step": 179742, "epoch": 4279} {"train_loss": -7.166414260864258, "global_step": 179743, "epoch": 4279} {"train_loss": -7.089944839477539, "global_step": 179744, "epoch": 4279} {"train_loss": -7.156550407409668, "global_step": 179745, "epoch": 4279} {"train_loss": -7.188061714172363, "global_step": 179746, "epoch": 4279} {"train_loss": -7.1824750900268555, "global_step": 179747, "epoch": 4279} {"train_loss": -6.972420692443848, "global_step": 179748, "epoch": 4279} {"train_loss": -7.010265350341797, "global_step": 179749, "epoch": 4279} {"train_loss": -7.058594226837158, "global_step": 179750, "epoch": 4279} {"train_loss": -7.136092185974121, "global_step": 179751, "epoch": 4279} {"train_loss": -7.096743583679199, "global_step": 179752, "epoch": 4279} {"train_loss": -7.223732948303223, "global_step": 179753, "epoch": 4279} {"train_loss": -7.105470180511475, "global_step": 179754, "epoch": 4279} {"train_loss": -7.244813919067383, "global_step": 179755, "epoch": 4279} {"train_loss": -7.115593910217285, "global_step": 179756, "epoch": 4279} {"train_loss": -7.178182601928711, "global_step": 179757, "epoch": 4279} {"train_loss": -7.070047855377197, "global_step": 179758, "epoch": 4279} {"train_loss": -7.116725331261044, "global_step": 179759, "epoch": 4279, "val_loss": 69418.3828125} {"train_loss": -7.27048921585083, "global_step": 179760, "epoch": 4280} {"train_loss": -7.097107887268066, "global_step": 179761, "epoch": 4280} {"train_loss": -7.180354118347168, "global_step": 179762, "epoch": 4280} {"train_loss": -7.118986129760742, "global_step": 179763, "epoch": 4280} {"train_loss": -7.124953269958496, "global_step": 179764, "epoch": 4280} {"train_loss": -7.1869707107543945, "global_step": 179765, "epoch": 4280} {"train_loss": -7.110693454742432, "global_step": 179766, "epoch": 4280} {"train_loss": -7.105483055114746, "global_step": 179767, "epoch": 4280} {"train_loss": -7.150008201599121, "global_step": 179768, "epoch": 4280} {"train_loss": -7.117171764373779, "global_step": 179769, "epoch": 4280} {"train_loss": -7.084061622619629, "global_step": 179770, "epoch": 4280} {"train_loss": -7.206229209899902, "global_step": 179771, "epoch": 4280} {"train_loss": -7.156930446624756, "global_step": 179772, "epoch": 4280} {"train_loss": -7.179599761962891, "global_step": 179773, "epoch": 4280} {"train_loss": -7.154609203338623, "global_step": 179774, "epoch": 4280} {"train_loss": -7.080222129821777, "global_step": 179775, "epoch": 4280} {"train_loss": -7.077077865600586, "global_step": 179776, "epoch": 4280} {"train_loss": -7.127288818359375, "global_step": 179777, "epoch": 4280} {"train_loss": -7.177794933319092, "global_step": 179778, "epoch": 4280} {"train_loss": -7.060422420501709, "global_step": 179779, "epoch": 4280} {"train_loss": -7.072937965393066, "global_step": 179780, "epoch": 4280} {"train_loss": -7.125398635864258, "global_step": 179781, "epoch": 4280} {"train_loss": -7.229407787322998, "global_step": 179782, "epoch": 4280} {"train_loss": -7.037700653076172, "global_step": 179783, "epoch": 4280} {"train_loss": -7.167801856994629, "global_step": 179784, "epoch": 4280} {"train_loss": -7.211124420166016, "global_step": 179785, "epoch": 4280} {"train_loss": -7.068385124206543, "global_step": 179786, "epoch": 4280} {"train_loss": -7.080792427062988, "global_step": 179787, "epoch": 4280} {"train_loss": -7.144369602203369, "global_step": 179788, "epoch": 4280} {"train_loss": -7.141891002655029, "global_step": 179789, "epoch": 4280} {"train_loss": -7.111201763153076, "global_step": 179790, "epoch": 4280} {"train_loss": -7.121267795562744, "global_step": 179791, "epoch": 4280} {"train_loss": -7.12274169921875, "global_step": 179792, "epoch": 4280} {"train_loss": -7.063657760620117, "global_step": 179793, "epoch": 4280} {"train_loss": -7.094480037689209, "global_step": 179794, "epoch": 4280} {"train_loss": -7.111659049987793, "global_step": 179795, "epoch": 4280} {"train_loss": -7.114296913146973, "global_step": 179796, "epoch": 4280} {"train_loss": -7.144716739654541, "global_step": 179797, "epoch": 4280} {"train_loss": -7.162286758422852, "global_step": 179798, "epoch": 4280} {"train_loss": -7.068872928619385, "global_step": 179799, "epoch": 4280} {"train_loss": -7.131381034851074, "global_step": 179800, "epoch": 4280} {"train_loss": -7.127413136618478, "global_step": 179801, "epoch": 4280, "val_loss": 69584.1640625} {"train_loss": -6.947267532348633, "global_step": 179802, "epoch": 4281} {"train_loss": -7.111415863037109, "global_step": 179803, "epoch": 4281} {"train_loss": -7.220480918884277, "global_step": 179804, "epoch": 4281} {"train_loss": -7.117108345031738, "global_step": 179805, "epoch": 4281} {"train_loss": -7.155981540679932, "global_step": 179806, "epoch": 4281} {"train_loss": -7.209786415100098, "global_step": 179807, "epoch": 4281} {"train_loss": -7.078700065612793, "global_step": 179808, "epoch": 4281} {"train_loss": -7.136807441711426, "global_step": 179809, "epoch": 4281} {"train_loss": -7.067409038543701, "global_step": 179810, "epoch": 4281} {"train_loss": -7.117383003234863, "global_step": 179811, "epoch": 4281} {"train_loss": -7.066291809082031, "global_step": 179812, "epoch": 4281} {"train_loss": -7.038987159729004, "global_step": 179813, "epoch": 4281} {"train_loss": -7.10923957824707, "global_step": 179814, "epoch": 4281} {"train_loss": -6.973365783691406, "global_step": 179815, "epoch": 4281} {"train_loss": -7.064867973327637, "global_step": 179816, "epoch": 4281} {"train_loss": -6.924407005310059, "global_step": 179817, "epoch": 4281} {"train_loss": -7.06834602355957, "global_step": 179818, "epoch": 4281} {"train_loss": -7.088788032531738, "global_step": 179819, "epoch": 4281} {"train_loss": -7.022858142852783, "global_step": 179820, "epoch": 4281} {"train_loss": -7.164512634277344, "global_step": 179821, "epoch": 4281} {"train_loss": -7.0749053955078125, "global_step": 179822, "epoch": 4281} {"train_loss": -7.006217956542969, "global_step": 179823, "epoch": 4281} {"train_loss": -7.056288242340088, "global_step": 179824, "epoch": 4281} {"train_loss": -7.057492256164551, "global_step": 179825, "epoch": 4281} {"train_loss": -7.028215408325195, "global_step": 179826, "epoch": 4281} {"train_loss": -7.169242858886719, "global_step": 179827, "epoch": 4281} {"train_loss": -7.185670852661133, "global_step": 179828, "epoch": 4281} {"train_loss": -7.132962703704834, "global_step": 179829, "epoch": 4281} {"train_loss": -7.114537239074707, "global_step": 179830, "epoch": 4281} {"train_loss": -7.147101402282715, "global_step": 179831, "epoch": 4281} {"train_loss": -7.06505012512207, "global_step": 179832, "epoch": 4281} {"train_loss": -7.055019855499268, "global_step": 179833, "epoch": 4281} {"train_loss": -7.159969806671143, "global_step": 179834, "epoch": 4281} {"train_loss": -7.136236667633057, "global_step": 179835, "epoch": 4281} {"train_loss": -7.1112141609191895, "global_step": 179836, "epoch": 4281} {"train_loss": -7.147332191467285, "global_step": 179837, "epoch": 4281} {"train_loss": -7.046545028686523, "global_step": 179838, "epoch": 4281} {"train_loss": -7.047496318817139, "global_step": 179839, "epoch": 4281} {"train_loss": -7.038475036621094, "global_step": 179840, "epoch": 4281} {"train_loss": -7.0332489013671875, "global_step": 179841, "epoch": 4281} {"train_loss": -7.059516429901123, "global_step": 179842, "epoch": 4281} {"train_loss": -7.086951153618949, "global_step": 179843, "epoch": 4281, "val_loss": 69577.6171875} {"train_loss": -7.150265693664551, "global_step": 179844, "epoch": 4282} {"train_loss": -7.161800384521484, "global_step": 179845, "epoch": 4282} {"train_loss": -7.1308746337890625, "global_step": 179846, "epoch": 4282} {"train_loss": -7.286767959594727, "global_step": 179847, "epoch": 4282} {"train_loss": -7.177757740020752, "global_step": 179848, "epoch": 4282} {"train_loss": -7.168610572814941, "global_step": 179849, "epoch": 4282} {"train_loss": -7.067307472229004, "global_step": 179850, "epoch": 4282} {"train_loss": -7.101825714111328, "global_step": 179851, "epoch": 4282} {"train_loss": -7.193877220153809, "global_step": 179852, "epoch": 4282} {"train_loss": -7.232190132141113, "global_step": 179853, "epoch": 4282} {"train_loss": -7.079797744750977, "global_step": 179854, "epoch": 4282} {"train_loss": -7.236146450042725, "global_step": 179855, "epoch": 4282} {"train_loss": -7.202578067779541, "global_step": 179856, "epoch": 4282} {"train_loss": -7.109953880310059, "global_step": 179857, "epoch": 4282} {"train_loss": -7.075033187866211, "global_step": 179858, "epoch": 4282} {"train_loss": -7.175424098968506, "global_step": 179859, "epoch": 4282} {"train_loss": -7.110640525817871, "global_step": 179860, "epoch": 4282} {"train_loss": -7.129176139831543, "global_step": 179861, "epoch": 4282} {"train_loss": -7.091090679168701, "global_step": 179862, "epoch": 4282} {"train_loss": -7.129153251647949, "global_step": 179863, "epoch": 4282} {"train_loss": -7.097929954528809, "global_step": 179864, "epoch": 4282} {"train_loss": -7.066581726074219, "global_step": 179865, "epoch": 4282} {"train_loss": -7.006965637207031, "global_step": 179866, "epoch": 4282} {"train_loss": -7.114744186401367, "global_step": 179867, "epoch": 4282} {"train_loss": -7.016846656799316, "global_step": 179868, "epoch": 4282} {"train_loss": -7.077586650848389, "global_step": 179869, "epoch": 4282} {"train_loss": -6.996481895446777, "global_step": 179870, "epoch": 4282} {"train_loss": -6.924353122711182, "global_step": 179871, "epoch": 4282} {"train_loss": -6.975179672241211, "global_step": 179872, "epoch": 4282} {"train_loss": -6.9573445320129395, "global_step": 179873, "epoch": 4282} {"train_loss": -6.8043532371521, "global_step": 179874, "epoch": 4282} {"train_loss": -6.6945905685424805, "global_step": 179875, "epoch": 4282} {"train_loss": -6.863927841186523, "global_step": 179876, "epoch": 4282} {"train_loss": -6.909911155700684, "global_step": 179877, "epoch": 4282} {"train_loss": -7.016358375549316, "global_step": 179878, "epoch": 4282} {"train_loss": -6.932448387145996, "global_step": 179879, "epoch": 4282} {"train_loss": -7.033836364746094, "global_step": 179880, "epoch": 4282} {"train_loss": -6.903940677642822, "global_step": 179881, "epoch": 4282} {"train_loss": -6.989480972290039, "global_step": 179882, "epoch": 4282} {"train_loss": -7.07699728012085, "global_step": 179883, "epoch": 4282} {"train_loss": -6.992441654205322, "global_step": 179884, "epoch": 4282} {"train_loss": -7.060489677247547, "global_step": 179885, "epoch": 4282, "val_loss": 69485.8515625} {"train_loss": -7.152916431427002, "global_step": 179886, "epoch": 4283} {"train_loss": -7.094357013702393, "global_step": 179887, "epoch": 4283} {"train_loss": -7.017612457275391, "global_step": 179888, "epoch": 4283} {"train_loss": -7.101718425750732, "global_step": 179889, "epoch": 4283} {"train_loss": -7.037442207336426, "global_step": 179890, "epoch": 4283} {"train_loss": -7.161181449890137, "global_step": 179891, "epoch": 4283} {"train_loss": -7.091667175292969, "global_step": 179892, "epoch": 4283} {"train_loss": -7.1184844970703125, "global_step": 179893, "epoch": 4283} {"train_loss": -7.019655227661133, "global_step": 179894, "epoch": 4283} {"train_loss": -7.103263854980469, "global_step": 179895, "epoch": 4283} {"train_loss": -7.176201343536377, "global_step": 179896, "epoch": 4283} {"train_loss": -7.054605484008789, "global_step": 179897, "epoch": 4283} {"train_loss": -7.099851608276367, "global_step": 179898, "epoch": 4283} {"train_loss": -7.083709239959717, "global_step": 179899, "epoch": 4283} {"train_loss": -7.0388288497924805, "global_step": 179900, "epoch": 4283} {"train_loss": -7.006462097167969, "global_step": 179901, "epoch": 4283} {"train_loss": -7.221723556518555, "global_step": 179902, "epoch": 4283} {"train_loss": -7.034212112426758, "global_step": 179903, "epoch": 4283} {"train_loss": -7.10426139831543, "global_step": 179904, "epoch": 4283} {"train_loss": -6.96080207824707, "global_step": 179905, "epoch": 4283} {"train_loss": -6.898514747619629, "global_step": 179906, "epoch": 4283} {"train_loss": -7.055622577667236, "global_step": 179907, "epoch": 4283} {"train_loss": -6.887426376342773, "global_step": 179908, "epoch": 4283} {"train_loss": -7.1252899169921875, "global_step": 179909, "epoch": 4283} {"train_loss": -7.011425971984863, "global_step": 179910, "epoch": 4283} {"train_loss": -6.890582084655762, "global_step": 179911, "epoch": 4283} {"train_loss": -6.978854179382324, "global_step": 179912, "epoch": 4283} {"train_loss": -7.09494686126709, "global_step": 179913, "epoch": 4283} {"train_loss": -6.983826160430908, "global_step": 179914, "epoch": 4283} {"train_loss": -7.1230645179748535, "global_step": 179915, "epoch": 4283} {"train_loss": -7.096895694732666, "global_step": 179916, "epoch": 4283} {"train_loss": -7.007241725921631, "global_step": 179917, "epoch": 4283} {"train_loss": -7.0649094581604, "global_step": 179918, "epoch": 4283} {"train_loss": -7.060074329376221, "global_step": 179919, "epoch": 4283} {"train_loss": -7.116201400756836, "global_step": 179920, "epoch": 4283} {"train_loss": -6.979619979858398, "global_step": 179921, "epoch": 4283} {"train_loss": -7.054741859436035, "global_step": 179922, "epoch": 4283} {"train_loss": -7.027376174926758, "global_step": 179923, "epoch": 4283} {"train_loss": -7.065362453460693, "global_step": 179924, "epoch": 4283} {"train_loss": -7.215507507324219, "global_step": 179925, "epoch": 4283} {"train_loss": -7.139009475708008, "global_step": 179926, "epoch": 4283} {"train_loss": -7.064355157670521, "global_step": 179927, "epoch": 4283, "val_loss": 69313.578125} {"train_loss": -7.125699043273926, "global_step": 179928, "epoch": 4284} {"train_loss": -7.131802082061768, "global_step": 179929, "epoch": 4284} {"train_loss": -7.249387741088867, "global_step": 179930, "epoch": 4284} {"train_loss": -7.101285934448242, "global_step": 179931, "epoch": 4284} {"train_loss": -7.069813251495361, "global_step": 179932, "epoch": 4284} {"train_loss": -7.253714561462402, "global_step": 179933, "epoch": 4284} {"train_loss": -7.144129276275635, "global_step": 179934, "epoch": 4284} {"train_loss": -7.224321365356445, "global_step": 179935, "epoch": 4284} {"train_loss": -7.119877815246582, "global_step": 179936, "epoch": 4284} {"train_loss": -7.255002498626709, "global_step": 179937, "epoch": 4284} {"train_loss": -7.371145248413086, "global_step": 179938, "epoch": 4284} {"train_loss": -7.0402326583862305, "global_step": 179939, "epoch": 4284} {"train_loss": -7.1430745124816895, "global_step": 179940, "epoch": 4284} {"train_loss": -7.1718573570251465, "global_step": 179941, "epoch": 4284} {"train_loss": -7.202700138092041, "global_step": 179942, "epoch": 4284} {"train_loss": -7.161810874938965, "global_step": 179943, "epoch": 4284} {"train_loss": -7.235783576965332, "global_step": 179944, "epoch": 4284} {"train_loss": -7.2735066413879395, "global_step": 179945, "epoch": 4284} {"train_loss": -7.145705223083496, "global_step": 179946, "epoch": 4284} {"train_loss": -7.096665382385254, "global_step": 179947, "epoch": 4284} {"train_loss": -7.056059837341309, "global_step": 179948, "epoch": 4284} {"train_loss": -7.079164981842041, "global_step": 179949, "epoch": 4284} {"train_loss": -7.1377668380737305, "global_step": 179950, "epoch": 4284} {"train_loss": -7.103461265563965, "global_step": 179951, "epoch": 4284} {"train_loss": -7.200509071350098, "global_step": 179952, "epoch": 4284} {"train_loss": -7.212769031524658, "global_step": 179953, "epoch": 4284} {"train_loss": -7.135882377624512, "global_step": 179954, "epoch": 4284} {"train_loss": -7.072315216064453, "global_step": 179955, "epoch": 4284} {"train_loss": -7.187639236450195, "global_step": 179956, "epoch": 4284} {"train_loss": -7.164076805114746, "global_step": 179957, "epoch": 4284} {"train_loss": -7.132080078125, "global_step": 179958, "epoch": 4284} {"train_loss": -7.2158308029174805, "global_step": 179959, "epoch": 4284} {"train_loss": -7.165338516235352, "global_step": 179960, "epoch": 4284} {"train_loss": -7.081042766571045, "global_step": 179961, "epoch": 4284} {"train_loss": -7.129973411560059, "global_step": 179962, "epoch": 4284} {"train_loss": -7.205163955688477, "global_step": 179963, "epoch": 4284} {"train_loss": -7.244236946105957, "global_step": 179964, "epoch": 4284} {"train_loss": -7.11785888671875, "global_step": 179965, "epoch": 4284} {"train_loss": -7.181219577789307, "global_step": 179966, "epoch": 4284} {"train_loss": -7.205731391906738, "global_step": 179967, "epoch": 4284} {"train_loss": -7.180692672729492, "global_step": 179968, "epoch": 4284} {"train_loss": -7.160895495187669, "global_step": 179969, "epoch": 4284, "val_loss": 69438.3359375} {"train_loss": -7.1482062339782715, "global_step": 179970, "epoch": 4285} {"train_loss": -7.058426380157471, "global_step": 179971, "epoch": 4285} {"train_loss": -7.10471773147583, "global_step": 179972, "epoch": 4285} {"train_loss": -7.295056343078613, "global_step": 179973, "epoch": 4285} {"train_loss": -7.190121173858643, "global_step": 179974, "epoch": 4285} {"train_loss": -7.06417179107666, "global_step": 179975, "epoch": 4285} {"train_loss": -7.157859802246094, "global_step": 179976, "epoch": 4285} {"train_loss": -7.084568977355957, "global_step": 179977, "epoch": 4285} {"train_loss": -7.011985778808594, "global_step": 179978, "epoch": 4285} {"train_loss": -7.101968288421631, "global_step": 179979, "epoch": 4285} {"train_loss": -7.033867359161377, "global_step": 179980, "epoch": 4285} {"train_loss": -6.990647315979004, "global_step": 179981, "epoch": 4285} {"train_loss": -7.111380577087402, "global_step": 179982, "epoch": 4285} {"train_loss": -6.833031177520752, "global_step": 179983, "epoch": 4285} {"train_loss": -6.793593406677246, "global_step": 179984, "epoch": 4285} {"train_loss": -7.085014343261719, "global_step": 179985, "epoch": 4285} {"train_loss": -6.846088409423828, "global_step": 179986, "epoch": 4285} {"train_loss": -6.963521957397461, "global_step": 179987, "epoch": 4285} {"train_loss": -6.962202072143555, "global_step": 179988, "epoch": 4285} {"train_loss": -6.878072261810303, "global_step": 179989, "epoch": 4285} {"train_loss": -6.9815168380737305, "global_step": 179990, "epoch": 4285} {"train_loss": -6.89534854888916, "global_step": 179991, "epoch": 4285} {"train_loss": -7.02251672744751, "global_step": 179992, "epoch": 4285} {"train_loss": -6.966799736022949, "global_step": 179993, "epoch": 4285} {"train_loss": -6.964291572570801, "global_step": 179994, "epoch": 4285} {"train_loss": -6.945117950439453, "global_step": 179995, "epoch": 4285} {"train_loss": -6.91773796081543, "global_step": 179996, "epoch": 4285} {"train_loss": -6.9851484298706055, "global_step": 179997, "epoch": 4285} {"train_loss": -6.965109348297119, "global_step": 179998, "epoch": 4285} {"train_loss": -7.139878273010254, "global_step": 179999, "epoch": 4285} {"train_loss": -7.036281108856201, "global_step": 180000, "epoch": 4285} {"train_loss": -7.154818058013916, "global_step": 180001, "epoch": 4285} {"train_loss": -7.069200038909912, "global_step": 180002, "epoch": 4285} {"train_loss": -7.101644515991211, "global_step": 180003, "epoch": 4285} {"train_loss": -7.000741004943848, "global_step": 180004, "epoch": 4285} {"train_loss": -6.989823341369629, "global_step": 180005, "epoch": 4285} {"train_loss": -7.118624210357666, "global_step": 180006, "epoch": 4285} {"train_loss": -7.092709064483643, "global_step": 180007, "epoch": 4285} {"train_loss": -7.137323379516602, "global_step": 180008, "epoch": 4285} {"train_loss": -6.987927436828613, "global_step": 180009, "epoch": 4285} {"train_loss": -6.96281623840332, "global_step": 180010, "epoch": 4285} {"train_loss": -7.030707506906419, "global_step": 180011, "epoch": 4285, "val_loss": 69266.7109375} {"train_loss": -6.9901909828186035, "global_step": 180012, "epoch": 4286} {"train_loss": -6.983735084533691, "global_step": 180013, "epoch": 4286} {"train_loss": -7.205744743347168, "global_step": 180014, "epoch": 4286} {"train_loss": -6.989316940307617, "global_step": 180015, "epoch": 4286} {"train_loss": -7.205285549163818, "global_step": 180016, "epoch": 4286} {"train_loss": -7.124044418334961, "global_step": 180017, "epoch": 4286} {"train_loss": -7.024466037750244, "global_step": 180018, "epoch": 4286} {"train_loss": -7.11648416519165, "global_step": 180019, "epoch": 4286} {"train_loss": -7.077789783477783, "global_step": 180020, "epoch": 4286} {"train_loss": -7.119729995727539, "global_step": 180021, "epoch": 4286} {"train_loss": -7.13417911529541, "global_step": 180022, "epoch": 4286} {"train_loss": -6.976797580718994, "global_step": 180023, "epoch": 4286} {"train_loss": -7.1226725578308105, "global_step": 180024, "epoch": 4286} {"train_loss": -7.054300308227539, "global_step": 180025, "epoch": 4286} {"train_loss": -7.134372711181641, "global_step": 180026, "epoch": 4286} {"train_loss": -7.068437576293945, "global_step": 180027, "epoch": 4286} {"train_loss": -7.194931983947754, "global_step": 180028, "epoch": 4286} {"train_loss": -7.21844482421875, "global_step": 180029, "epoch": 4286} {"train_loss": -7.0172271728515625, "global_step": 180030, "epoch": 4286} {"train_loss": -7.260778427124023, "global_step": 180031, "epoch": 4286} {"train_loss": -6.9895219802856445, "global_step": 180032, "epoch": 4286} {"train_loss": -7.004230499267578, "global_step": 180033, "epoch": 4286} {"train_loss": -7.202354907989502, "global_step": 180034, "epoch": 4286} {"train_loss": -6.999396324157715, "global_step": 180035, "epoch": 4286} {"train_loss": -7.183168411254883, "global_step": 180036, "epoch": 4286} {"train_loss": -7.185361385345459, "global_step": 180037, "epoch": 4286} {"train_loss": -6.931122303009033, "global_step": 180038, "epoch": 4286} {"train_loss": -7.084039688110352, "global_step": 180039, "epoch": 4286} {"train_loss": -6.99736213684082, "global_step": 180040, "epoch": 4286} {"train_loss": -7.013973236083984, "global_step": 180041, "epoch": 4286} {"train_loss": -7.2058305740356445, "global_step": 180042, "epoch": 4286} {"train_loss": -7.075301170349121, "global_step": 180043, "epoch": 4286} {"train_loss": -6.982367992401123, "global_step": 180044, "epoch": 4286} {"train_loss": -7.011528015136719, "global_step": 180045, "epoch": 4286} {"train_loss": -6.952543258666992, "global_step": 180046, "epoch": 4286} {"train_loss": -7.1294355392456055, "global_step": 180047, "epoch": 4286} {"train_loss": -7.152039527893066, "global_step": 180048, "epoch": 4286} {"train_loss": -7.059141159057617, "global_step": 180049, "epoch": 4286} {"train_loss": -7.109339714050293, "global_step": 180050, "epoch": 4286} {"train_loss": -7.0573601722717285, "global_step": 180051, "epoch": 4286} {"train_loss": -7.114920616149902, "global_step": 180052, "epoch": 4286} {"train_loss": -7.0853690419878275, "global_step": 180053, "epoch": 4286, "val_loss": 69401.5390625} {"train_loss": -7.0906829833984375, "global_step": 180054, "epoch": 4287} {"train_loss": -6.998469829559326, "global_step": 180055, "epoch": 4287} {"train_loss": -7.044393539428711, "global_step": 180056, "epoch": 4287} {"train_loss": -7.191040992736816, "global_step": 180057, "epoch": 4287} {"train_loss": -7.041202545166016, "global_step": 180058, "epoch": 4287} {"train_loss": -7.152962684631348, "global_step": 180059, "epoch": 4287} {"train_loss": -7.092379570007324, "global_step": 180060, "epoch": 4287} {"train_loss": -7.107381820678711, "global_step": 180061, "epoch": 4287} {"train_loss": -7.034921646118164, "global_step": 180062, "epoch": 4287} {"train_loss": -6.966056823730469, "global_step": 180063, "epoch": 4287} {"train_loss": -7.0909552574157715, "global_step": 180064, "epoch": 4287} {"train_loss": -7.0908589363098145, "global_step": 180065, "epoch": 4287} {"train_loss": -7.0548095703125, "global_step": 180066, "epoch": 4287} {"train_loss": -7.112199783325195, "global_step": 180067, "epoch": 4287} {"train_loss": -7.167792320251465, "global_step": 180068, "epoch": 4287} {"train_loss": -7.321364402770996, "global_step": 180069, "epoch": 4287} {"train_loss": -7.073293209075928, "global_step": 180070, "epoch": 4287} {"train_loss": -7.1602277755737305, "global_step": 180071, "epoch": 4287} {"train_loss": -7.222794532775879, "global_step": 180072, "epoch": 4287} {"train_loss": -7.081950664520264, "global_step": 180073, "epoch": 4287} {"train_loss": -7.135258197784424, "global_step": 180074, "epoch": 4287} {"train_loss": -7.1781229972839355, "global_step": 180075, "epoch": 4287} {"train_loss": -7.031761169433594, "global_step": 180076, "epoch": 4287} {"train_loss": -7.183931350708008, "global_step": 180077, "epoch": 4287} {"train_loss": -7.051712989807129, "global_step": 180078, "epoch": 4287} {"train_loss": -7.221541404724121, "global_step": 180079, "epoch": 4287} {"train_loss": -7.085844993591309, "global_step": 180080, "epoch": 4287} {"train_loss": -7.105727195739746, "global_step": 180081, "epoch": 4287} {"train_loss": -7.053652763366699, "global_step": 180082, "epoch": 4287} {"train_loss": -7.102025985717773, "global_step": 180083, "epoch": 4287} {"train_loss": -7.1382832527160645, "global_step": 180084, "epoch": 4287} {"train_loss": -7.054308891296387, "global_step": 180085, "epoch": 4287} {"train_loss": -7.019172191619873, "global_step": 180086, "epoch": 4287} {"train_loss": -7.245850086212158, "global_step": 180087, "epoch": 4287} {"train_loss": -7.184776306152344, "global_step": 180088, "epoch": 4287} {"train_loss": -7.243229866027832, "global_step": 180089, "epoch": 4287} {"train_loss": -7.114360332489014, "global_step": 180090, "epoch": 4287} {"train_loss": -7.1630539894104, "global_step": 180091, "epoch": 4287} {"train_loss": -7.193924427032471, "global_step": 180092, "epoch": 4287} {"train_loss": -7.199862480163574, "global_step": 180093, "epoch": 4287} {"train_loss": -7.152621269226074, "global_step": 180094, "epoch": 4287} {"train_loss": -7.123541684377761, "global_step": 180095, "epoch": 4287, "val_loss": 69334.53125} {"train_loss": -7.242240905761719, "global_step": 180096, "epoch": 4288} {"train_loss": -7.184191703796387, "global_step": 180097, "epoch": 4288} {"train_loss": -7.080501079559326, "global_step": 180098, "epoch": 4288} {"train_loss": -7.17819881439209, "global_step": 180099, "epoch": 4288} {"train_loss": -7.183685302734375, "global_step": 180100, "epoch": 4288} {"train_loss": -7.224834442138672, "global_step": 180101, "epoch": 4288} {"train_loss": -7.116388320922852, "global_step": 180102, "epoch": 4288} {"train_loss": -7.2182159423828125, "global_step": 180103, "epoch": 4288} {"train_loss": -7.247359275817871, "global_step": 180104, "epoch": 4288} {"train_loss": -7.1736626625061035, "global_step": 180105, "epoch": 4288} {"train_loss": -7.281871318817139, "global_step": 180106, "epoch": 4288} {"train_loss": -7.100645065307617, "global_step": 180107, "epoch": 4288} {"train_loss": -7.1463823318481445, "global_step": 180108, "epoch": 4288} {"train_loss": -7.138999938964844, "global_step": 180109, "epoch": 4288} {"train_loss": -7.132020950317383, "global_step": 180110, "epoch": 4288} {"train_loss": -7.174191474914551, "global_step": 180111, "epoch": 4288} {"train_loss": -7.086200714111328, "global_step": 180112, "epoch": 4288} {"train_loss": -7.215997695922852, "global_step": 180113, "epoch": 4288} {"train_loss": -7.181934356689453, "global_step": 180114, "epoch": 4288} {"train_loss": -7.087880611419678, "global_step": 180115, "epoch": 4288} {"train_loss": -7.091070652008057, "global_step": 180116, "epoch": 4288} {"train_loss": -7.174277305603027, "global_step": 180117, "epoch": 4288} {"train_loss": -7.000608444213867, "global_step": 180118, "epoch": 4288} {"train_loss": -7.108731269836426, "global_step": 180119, "epoch": 4288} {"train_loss": -7.022994518280029, "global_step": 180120, "epoch": 4288} {"train_loss": -7.02857780456543, "global_step": 180121, "epoch": 4288} {"train_loss": -7.201046943664551, "global_step": 180122, "epoch": 4288} {"train_loss": -7.186392784118652, "global_step": 180123, "epoch": 4288} {"train_loss": -7.015964984893799, "global_step": 180124, "epoch": 4288} {"train_loss": -7.125128746032715, "global_step": 180125, "epoch": 4288} {"train_loss": -6.939266204833984, "global_step": 180126, "epoch": 4288} {"train_loss": -7.096062660217285, "global_step": 180127, "epoch": 4288} {"train_loss": -7.144434928894043, "global_step": 180128, "epoch": 4288} {"train_loss": -7.118720054626465, "global_step": 180129, "epoch": 4288} {"train_loss": -7.1247453689575195, "global_step": 180130, "epoch": 4288} {"train_loss": -7.085465431213379, "global_step": 180131, "epoch": 4288} {"train_loss": -6.966444969177246, "global_step": 180132, "epoch": 4288} {"train_loss": -6.832156658172607, "global_step": 180133, "epoch": 4288} {"train_loss": -6.938664436340332, "global_step": 180134, "epoch": 4288} {"train_loss": -7.106544494628906, "global_step": 180135, "epoch": 4288} {"train_loss": -6.912387847900391, "global_step": 180136, "epoch": 4288} {"train_loss": -7.109602110726493, "global_step": 180137, "epoch": 4288, "val_loss": 69288.2265625} {"train_loss": -6.9637908935546875, "global_step": 180138, "epoch": 4289} {"train_loss": -7.019739151000977, "global_step": 180139, "epoch": 4289} {"train_loss": -6.95820951461792, "global_step": 180140, "epoch": 4289} {"train_loss": -7.051109313964844, "global_step": 180141, "epoch": 4289} {"train_loss": -7.147456645965576, "global_step": 180142, "epoch": 4289} {"train_loss": -6.897011756896973, "global_step": 180143, "epoch": 4289} {"train_loss": -7.02288818359375, "global_step": 180144, "epoch": 4289} {"train_loss": -6.927188873291016, "global_step": 180145, "epoch": 4289} {"train_loss": -6.917198181152344, "global_step": 180146, "epoch": 4289} {"train_loss": -7.062739372253418, "global_step": 180147, "epoch": 4289} {"train_loss": -6.967011451721191, "global_step": 180148, "epoch": 4289} {"train_loss": -6.9942827224731445, "global_step": 180149, "epoch": 4289} {"train_loss": -6.938800811767578, "global_step": 180150, "epoch": 4289} {"train_loss": -7.065219879150391, "global_step": 180151, "epoch": 4289} {"train_loss": -7.041062355041504, "global_step": 180152, "epoch": 4289} {"train_loss": -6.997305870056152, "global_step": 180153, "epoch": 4289} {"train_loss": -7.000938415527344, "global_step": 180154, "epoch": 4289} {"train_loss": -7.093637466430664, "global_step": 180155, "epoch": 4289} {"train_loss": -7.071794509887695, "global_step": 180156, "epoch": 4289} {"train_loss": -7.078430652618408, "global_step": 180157, "epoch": 4289} {"train_loss": -7.125992298126221, "global_step": 180158, "epoch": 4289} {"train_loss": -7.065037250518799, "global_step": 180159, "epoch": 4289} {"train_loss": -7.040355682373047, "global_step": 180160, "epoch": 4289} {"train_loss": -7.039908409118652, "global_step": 180161, "epoch": 4289} {"train_loss": -7.074339389801025, "global_step": 180162, "epoch": 4289} {"train_loss": -6.890847206115723, "global_step": 180163, "epoch": 4289} {"train_loss": -7.075466156005859, "global_step": 180164, "epoch": 4289} {"train_loss": -6.956845760345459, "global_step": 180165, "epoch": 4289} {"train_loss": -6.913898944854736, "global_step": 180166, "epoch": 4289} {"train_loss": -7.018377304077148, "global_step": 180167, "epoch": 4289} {"train_loss": -7.092028617858887, "global_step": 180168, "epoch": 4289} {"train_loss": -7.005036354064941, "global_step": 180169, "epoch": 4289} {"train_loss": -7.197969436645508, "global_step": 180170, "epoch": 4289} {"train_loss": -7.1385345458984375, "global_step": 180171, "epoch": 4289} {"train_loss": -7.030210494995117, "global_step": 180172, "epoch": 4289} {"train_loss": -7.105715274810791, "global_step": 180173, "epoch": 4289} {"train_loss": -7.069745063781738, "global_step": 180174, "epoch": 4289} {"train_loss": -7.067558288574219, "global_step": 180175, "epoch": 4289} {"train_loss": -7.1489176750183105, "global_step": 180176, "epoch": 4289} {"train_loss": -7.096755504608154, "global_step": 180177, "epoch": 4289} {"train_loss": -7.179380416870117, "global_step": 180178, "epoch": 4289} {"train_loss": -7.04125265848069, "global_step": 180179, "epoch": 4289, "val_loss": 69265.4140625} {"train_loss": -7.05256986618042, "global_step": 180180, "epoch": 4290} {"train_loss": -7.040163993835449, "global_step": 180181, "epoch": 4290} {"train_loss": -7.130629539489746, "global_step": 180182, "epoch": 4290} {"train_loss": -7.119629859924316, "global_step": 180183, "epoch": 4290} {"train_loss": -7.102330207824707, "global_step": 180184, "epoch": 4290} {"train_loss": -7.070417404174805, "global_step": 180185, "epoch": 4290} {"train_loss": -7.234312534332275, "global_step": 180186, "epoch": 4290} {"train_loss": -7.201898574829102, "global_step": 180187, "epoch": 4290} {"train_loss": -7.198676109313965, "global_step": 180188, "epoch": 4290} {"train_loss": -7.109645843505859, "global_step": 180189, "epoch": 4290} {"train_loss": -7.121760368347168, "global_step": 180190, "epoch": 4290} {"train_loss": -7.1218719482421875, "global_step": 180191, "epoch": 4290} {"train_loss": -7.083674907684326, "global_step": 180192, "epoch": 4290} {"train_loss": -7.140225887298584, "global_step": 180193, "epoch": 4290} {"train_loss": -7.1715898513793945, "global_step": 180194, "epoch": 4290} {"train_loss": -7.280008792877197, "global_step": 180195, "epoch": 4290} {"train_loss": -7.193897247314453, "global_step": 180196, "epoch": 4290} {"train_loss": -7.087393760681152, "global_step": 180197, "epoch": 4290} {"train_loss": -7.164759635925293, "global_step": 180198, "epoch": 4290} {"train_loss": -7.130053520202637, "global_step": 180199, "epoch": 4290} {"train_loss": -7.117197513580322, "global_step": 180200, "epoch": 4290} {"train_loss": -7.116786956787109, "global_step": 180201, "epoch": 4290} {"train_loss": -7.171660423278809, "global_step": 180202, "epoch": 4290} {"train_loss": -7.107595443725586, "global_step": 180203, "epoch": 4290} {"train_loss": -7.117074966430664, "global_step": 180204, "epoch": 4290} {"train_loss": -7.106298446655273, "global_step": 180205, "epoch": 4290} {"train_loss": -6.941243648529053, "global_step": 180206, "epoch": 4290} {"train_loss": -7.085585594177246, "global_step": 180207, "epoch": 4290} {"train_loss": -7.081714630126953, "global_step": 180208, "epoch": 4290} {"train_loss": -7.1466217041015625, "global_step": 180209, "epoch": 4290} {"train_loss": -6.9844970703125, "global_step": 180210, "epoch": 4290} {"train_loss": -6.989741802215576, "global_step": 180211, "epoch": 4290} {"train_loss": -7.110734939575195, "global_step": 180212, "epoch": 4290} {"train_loss": -6.950137138366699, "global_step": 180213, "epoch": 4290} {"train_loss": -6.987817764282227, "global_step": 180214, "epoch": 4290} {"train_loss": -6.977755546569824, "global_step": 180215, "epoch": 4290} {"train_loss": -6.97623348236084, "global_step": 180216, "epoch": 4290} {"train_loss": -6.903328895568848, "global_step": 180217, "epoch": 4290} {"train_loss": -7.035351753234863, "global_step": 180218, "epoch": 4290} {"train_loss": -6.9863386154174805, "global_step": 180219, "epoch": 4290} {"train_loss": -7.053754806518555, "global_step": 180220, "epoch": 4290} {"train_loss": -7.087921585355486, "global_step": 180221, "epoch": 4290, "val_loss": 69320.1875} {"train_loss": -6.832291603088379, "global_step": 180222, "epoch": 4291} {"train_loss": -7.043044090270996, "global_step": 180223, "epoch": 4291} {"train_loss": -6.907293319702148, "global_step": 180224, "epoch": 4291} {"train_loss": -7.025071144104004, "global_step": 180225, "epoch": 4291} {"train_loss": -7.027547836303711, "global_step": 180226, "epoch": 4291} {"train_loss": -6.935837268829346, "global_step": 180227, "epoch": 4291} {"train_loss": -7.072789192199707, "global_step": 180228, "epoch": 4291} {"train_loss": -7.197486877441406, "global_step": 180229, "epoch": 4291} {"train_loss": -7.052406311035156, "global_step": 180230, "epoch": 4291} {"train_loss": -7.139707565307617, "global_step": 180231, "epoch": 4291} {"train_loss": -6.909933567047119, "global_step": 180232, "epoch": 4291} {"train_loss": -6.983738899230957, "global_step": 180233, "epoch": 4291} {"train_loss": -7.084090709686279, "global_step": 180234, "epoch": 4291} {"train_loss": -6.90908145904541, "global_step": 180235, "epoch": 4291} {"train_loss": -6.963089942932129, "global_step": 180236, "epoch": 4291} {"train_loss": -7.140608310699463, "global_step": 180237, "epoch": 4291} {"train_loss": -7.033730506896973, "global_step": 180238, "epoch": 4291} {"train_loss": -6.924522399902344, "global_step": 180239, "epoch": 4291} {"train_loss": -7.1487884521484375, "global_step": 180240, "epoch": 4291} {"train_loss": -6.924049377441406, "global_step": 180241, "epoch": 4291} {"train_loss": -6.982120037078857, "global_step": 180242, "epoch": 4291} {"train_loss": -7.019746780395508, "global_step": 180243, "epoch": 4291} {"train_loss": -7.011870861053467, "global_step": 180244, "epoch": 4291} {"train_loss": -7.1020097732543945, "global_step": 180245, "epoch": 4291} {"train_loss": -7.1074910163879395, "global_step": 180246, "epoch": 4291} {"train_loss": -7.024795055389404, "global_step": 180247, "epoch": 4291} {"train_loss": -7.147336006164551, "global_step": 180248, "epoch": 4291} {"train_loss": -7.076417922973633, "global_step": 180249, "epoch": 4291} {"train_loss": -7.096827507019043, "global_step": 180250, "epoch": 4291} {"train_loss": -7.140072345733643, "global_step": 180251, "epoch": 4291} {"train_loss": -6.879363059997559, "global_step": 180252, "epoch": 4291} {"train_loss": -7.119937419891357, "global_step": 180253, "epoch": 4291} {"train_loss": -7.084586143493652, "global_step": 180254, "epoch": 4291} {"train_loss": -7.061954975128174, "global_step": 180255, "epoch": 4291} {"train_loss": -7.0226287841796875, "global_step": 180256, "epoch": 4291} {"train_loss": -7.105590343475342, "global_step": 180257, "epoch": 4291} {"train_loss": -7.192718982696533, "global_step": 180258, "epoch": 4291} {"train_loss": -7.069800853729248, "global_step": 180259, "epoch": 4291} {"train_loss": -7.144881248474121, "global_step": 180260, "epoch": 4291} {"train_loss": -7.013067245483398, "global_step": 180261, "epoch": 4291} {"train_loss": -7.063286781311035, "global_step": 180262, "epoch": 4291} {"train_loss": -7.042890525999523, "global_step": 180263, "epoch": 4291, "val_loss": 69377.734375} {"train_loss": -7.07970666885376, "global_step": 180264, "epoch": 4292} {"train_loss": -7.110581398010254, "global_step": 180265, "epoch": 4292} {"train_loss": -7.0086870193481445, "global_step": 180266, "epoch": 4292} {"train_loss": -7.18302583694458, "global_step": 180267, "epoch": 4292} {"train_loss": -7.061918258666992, "global_step": 180268, "epoch": 4292} {"train_loss": -7.159759521484375, "global_step": 180269, "epoch": 4292} {"train_loss": -7.1786627769470215, "global_step": 180270, "epoch": 4292} {"train_loss": -7.07798957824707, "global_step": 180271, "epoch": 4292} {"train_loss": -7.108006954193115, "global_step": 180272, "epoch": 4292} {"train_loss": -7.130012512207031, "global_step": 180273, "epoch": 4292} {"train_loss": -7.130770683288574, "global_step": 180274, "epoch": 4292} {"train_loss": -7.243388652801514, "global_step": 180275, "epoch": 4292} {"train_loss": -7.14687967300415, "global_step": 180276, "epoch": 4292} {"train_loss": -7.26664924621582, "global_step": 180277, "epoch": 4292} {"train_loss": -7.041056156158447, "global_step": 180278, "epoch": 4292} {"train_loss": -7.130558490753174, "global_step": 180279, "epoch": 4292} {"train_loss": -7.0742387771606445, "global_step": 180280, "epoch": 4292} {"train_loss": -7.155943393707275, "global_step": 180281, "epoch": 4292} {"train_loss": -7.180600643157959, "global_step": 180282, "epoch": 4292} {"train_loss": -7.096445083618164, "global_step": 180283, "epoch": 4292} {"train_loss": -7.190284729003906, "global_step": 180284, "epoch": 4292} {"train_loss": -7.163482666015625, "global_step": 180285, "epoch": 4292} {"train_loss": -7.176613807678223, "global_step": 180286, "epoch": 4292} {"train_loss": -7.1566619873046875, "global_step": 180287, "epoch": 4292} {"train_loss": -7.087957859039307, "global_step": 180288, "epoch": 4292} {"train_loss": -7.041337013244629, "global_step": 180289, "epoch": 4292} {"train_loss": -7.097755432128906, "global_step": 180290, "epoch": 4292} {"train_loss": -7.117067337036133, "global_step": 180291, "epoch": 4292} {"train_loss": -7.0852251052856445, "global_step": 180292, "epoch": 4292} {"train_loss": -7.065057754516602, "global_step": 180293, "epoch": 4292} {"train_loss": -7.138827323913574, "global_step": 180294, "epoch": 4292} {"train_loss": -7.0445990562438965, "global_step": 180295, "epoch": 4292} {"train_loss": -7.06494140625, "global_step": 180296, "epoch": 4292} {"train_loss": -7.101398468017578, "global_step": 180297, "epoch": 4292} {"train_loss": -7.049379825592041, "global_step": 180298, "epoch": 4292} {"train_loss": -7.1206254959106445, "global_step": 180299, "epoch": 4292} {"train_loss": -7.017484188079834, "global_step": 180300, "epoch": 4292} {"train_loss": -7.134592056274414, "global_step": 180301, "epoch": 4292} {"train_loss": -7.0318498611450195, "global_step": 180302, "epoch": 4292} {"train_loss": -7.102072715759277, "global_step": 180303, "epoch": 4292} {"train_loss": -7.1263604164123535, "global_step": 180304, "epoch": 4292} {"train_loss": -7.115843511763073, "global_step": 180305, "epoch": 4292, "val_loss": 69434.953125} {"train_loss": -7.072526931762695, "global_step": 180306, "epoch": 4293} {"train_loss": -7.190795421600342, "global_step": 180307, "epoch": 4293} {"train_loss": -7.059375286102295, "global_step": 180308, "epoch": 4293} {"train_loss": -7.025156021118164, "global_step": 180309, "epoch": 4293} {"train_loss": -7.057476997375488, "global_step": 180310, "epoch": 4293} {"train_loss": -7.048581123352051, "global_step": 180311, "epoch": 4293} {"train_loss": -7.109377861022949, "global_step": 180312, "epoch": 4293} {"train_loss": -7.126477241516113, "global_step": 180313, "epoch": 4293} {"train_loss": -7.085144996643066, "global_step": 180314, "epoch": 4293} {"train_loss": -7.103015899658203, "global_step": 180315, "epoch": 4293} {"train_loss": -7.073741912841797, "global_step": 180316, "epoch": 4293} {"train_loss": -7.052620887756348, "global_step": 180317, "epoch": 4293} {"train_loss": -7.012223720550537, "global_step": 180318, "epoch": 4293} {"train_loss": -7.236785411834717, "global_step": 180319, "epoch": 4293} {"train_loss": -7.146167755126953, "global_step": 180320, "epoch": 4293} {"train_loss": -7.189816474914551, "global_step": 180321, "epoch": 4293} {"train_loss": -7.154815673828125, "global_step": 180322, "epoch": 4293} {"train_loss": -7.161374568939209, "global_step": 180323, "epoch": 4293} {"train_loss": -7.068324089050293, "global_step": 180324, "epoch": 4293} {"train_loss": -7.194937705993652, "global_step": 180325, "epoch": 4293} {"train_loss": -7.18930721282959, "global_step": 180326, "epoch": 4293} {"train_loss": -7.132468223571777, "global_step": 180327, "epoch": 4293} {"train_loss": -7.122992992401123, "global_step": 180328, "epoch": 4293} {"train_loss": -7.130558967590332, "global_step": 180329, "epoch": 4293} {"train_loss": -7.217290878295898, "global_step": 180330, "epoch": 4293} {"train_loss": -7.194786548614502, "global_step": 180331, "epoch": 4293} {"train_loss": -7.19393253326416, "global_step": 180332, "epoch": 4293} {"train_loss": -7.10058069229126, "global_step": 180333, "epoch": 4293} {"train_loss": -7.069401741027832, "global_step": 180334, "epoch": 4293} {"train_loss": -7.163519859313965, "global_step": 180335, "epoch": 4293} {"train_loss": -7.081507682800293, "global_step": 180336, "epoch": 4293} {"train_loss": -7.072025299072266, "global_step": 180337, "epoch": 4293} {"train_loss": -7.217629909515381, "global_step": 180338, "epoch": 4293} {"train_loss": -7.184507846832275, "global_step": 180339, "epoch": 4293} {"train_loss": -7.108620643615723, "global_step": 180340, "epoch": 4293} {"train_loss": -7.192111968994141, "global_step": 180341, "epoch": 4293} {"train_loss": -7.241390228271484, "global_step": 180342, "epoch": 4293} {"train_loss": -7.214902877807617, "global_step": 180343, "epoch": 4293} {"train_loss": -7.165987968444824, "global_step": 180344, "epoch": 4293} {"train_loss": -7.196606636047363, "global_step": 180345, "epoch": 4293} {"train_loss": -7.162091255187988, "global_step": 180346, "epoch": 4293} {"train_loss": -7.13219674428304, "global_step": 180347, "epoch": 4293, "val_loss": 69207.1953125} {"train_loss": -7.174843788146973, "global_step": 180348, "epoch": 4294} {"train_loss": -7.236122131347656, "global_step": 180349, "epoch": 4294} {"train_loss": -7.194546699523926, "global_step": 180350, "epoch": 4294} {"train_loss": -7.1246819496154785, "global_step": 180351, "epoch": 4294} {"train_loss": -7.000368595123291, "global_step": 180352, "epoch": 4294} {"train_loss": -6.964433670043945, "global_step": 180353, "epoch": 4294} {"train_loss": -7.095746994018555, "global_step": 180354, "epoch": 4294} {"train_loss": -7.045917510986328, "global_step": 180355, "epoch": 4294} {"train_loss": -7.049642562866211, "global_step": 180356, "epoch": 4294} {"train_loss": -7.039713382720947, "global_step": 180357, "epoch": 4294} {"train_loss": -7.025414943695068, "global_step": 180358, "epoch": 4294} {"train_loss": -6.952552795410156, "global_step": 180359, "epoch": 4294} {"train_loss": -7.027771949768066, "global_step": 180360, "epoch": 4294} {"train_loss": -7.13163423538208, "global_step": 180361, "epoch": 4294} {"train_loss": -7.061221122741699, "global_step": 180362, "epoch": 4294} {"train_loss": -7.136700630187988, "global_step": 180363, "epoch": 4294} {"train_loss": -6.969382286071777, "global_step": 180364, "epoch": 4294} {"train_loss": -7.079399108886719, "global_step": 180365, "epoch": 4294} {"train_loss": -7.0982160568237305, "global_step": 180366, "epoch": 4294} {"train_loss": -6.98670768737793, "global_step": 180367, "epoch": 4294} {"train_loss": -7.209711074829102, "global_step": 180368, "epoch": 4294} {"train_loss": -7.106234073638916, "global_step": 180369, "epoch": 4294} {"train_loss": -7.144232749938965, "global_step": 180370, "epoch": 4294} {"train_loss": -7.099576950073242, "global_step": 180371, "epoch": 4294} {"train_loss": -7.150489807128906, "global_step": 180372, "epoch": 4294} {"train_loss": -7.118776321411133, "global_step": 180373, "epoch": 4294} {"train_loss": -7.165277481079102, "global_step": 180374, "epoch": 4294} {"train_loss": -7.092660903930664, "global_step": 180375, "epoch": 4294} {"train_loss": -7.16707706451416, "global_step": 180376, "epoch": 4294} {"train_loss": -7.123044013977051, "global_step": 180377, "epoch": 4294} {"train_loss": -7.058325290679932, "global_step": 180378, "epoch": 4294} {"train_loss": -7.097478866577148, "global_step": 180379, "epoch": 4294} {"train_loss": -7.142920970916748, "global_step": 180380, "epoch": 4294} {"train_loss": -7.0530686378479, "global_step": 180381, "epoch": 4294} {"train_loss": -7.231406211853027, "global_step": 180382, "epoch": 4294} {"train_loss": -7.275148868560791, "global_step": 180383, "epoch": 4294} {"train_loss": -7.151271820068359, "global_step": 180384, "epoch": 4294} {"train_loss": -7.0683393478393555, "global_step": 180385, "epoch": 4294} {"train_loss": -7.213338375091553, "global_step": 180386, "epoch": 4294} {"train_loss": -7.182509422302246, "global_step": 180387, "epoch": 4294} {"train_loss": -7.059678554534912, "global_step": 180388, "epoch": 4294} {"train_loss": -7.10747994695391, "global_step": 180389, "epoch": 4294, "val_loss": 69270.6953125} {"train_loss": -7.188667297363281, "global_step": 180390, "epoch": 4295} {"train_loss": -7.0969038009643555, "global_step": 180391, "epoch": 4295} {"train_loss": -7.034933090209961, "global_step": 180392, "epoch": 4295} {"train_loss": -7.113350868225098, "global_step": 180393, "epoch": 4295} {"train_loss": -7.211254119873047, "global_step": 180394, "epoch": 4295} {"train_loss": -7.095171928405762, "global_step": 180395, "epoch": 4295} {"train_loss": -7.041277885437012, "global_step": 180396, "epoch": 4295} {"train_loss": -7.162822246551514, "global_step": 180397, "epoch": 4295} {"train_loss": -7.155512809753418, "global_step": 180398, "epoch": 4295} {"train_loss": -7.101889133453369, "global_step": 180399, "epoch": 4295} {"train_loss": -7.213136196136475, "global_step": 180400, "epoch": 4295} {"train_loss": -6.946198463439941, "global_step": 180401, "epoch": 4295} {"train_loss": -7.011147499084473, "global_step": 180402, "epoch": 4295} {"train_loss": -7.091975212097168, "global_step": 180403, "epoch": 4295} {"train_loss": -7.081208229064941, "global_step": 180404, "epoch": 4295} {"train_loss": -7.136145114898682, "global_step": 180405, "epoch": 4295} {"train_loss": -7.162269115447998, "global_step": 180406, "epoch": 4295} {"train_loss": -7.094444274902344, "global_step": 180407, "epoch": 4295} {"train_loss": -7.225656509399414, "global_step": 180408, "epoch": 4295} {"train_loss": -7.161338806152344, "global_step": 180409, "epoch": 4295} {"train_loss": -7.073215961456299, "global_step": 180410, "epoch": 4295} {"train_loss": -7.121273040771484, "global_step": 180411, "epoch": 4295} {"train_loss": -7.214364051818848, "global_step": 180412, "epoch": 4295} {"train_loss": -7.053554534912109, "global_step": 180413, "epoch": 4295} {"train_loss": -7.197754859924316, "global_step": 180414, "epoch": 4295} {"train_loss": -6.973209381103516, "global_step": 180415, "epoch": 4295} {"train_loss": -7.253607749938965, "global_step": 180416, "epoch": 4295} {"train_loss": -7.14185905456543, "global_step": 180417, "epoch": 4295} {"train_loss": -7.194024085998535, "global_step": 180418, "epoch": 4295} {"train_loss": -7.072518348693848, "global_step": 180419, "epoch": 4295} {"train_loss": -7.124375343322754, "global_step": 180420, "epoch": 4295} {"train_loss": -7.154101371765137, "global_step": 180421, "epoch": 4295} {"train_loss": -6.949184417724609, "global_step": 180422, "epoch": 4295} {"train_loss": -7.150163173675537, "global_step": 180423, "epoch": 4295} {"train_loss": -7.100898742675781, "global_step": 180424, "epoch": 4295} {"train_loss": -7.111067295074463, "global_step": 180425, "epoch": 4295} {"train_loss": -7.106637954711914, "global_step": 180426, "epoch": 4295} {"train_loss": -7.095520973205566, "global_step": 180427, "epoch": 4295} {"train_loss": -7.209382057189941, "global_step": 180428, "epoch": 4295} {"train_loss": -7.107454776763916, "global_step": 180429, "epoch": 4295} {"train_loss": -7.150210380554199, "global_step": 180430, "epoch": 4295} {"train_loss": -7.116912489845639, "global_step": 180431, "epoch": 4295, "val_loss": 69442.4140625} {"train_loss": -7.1404829025268555, "global_step": 180432, "epoch": 4296} {"train_loss": -7.059870719909668, "global_step": 180433, "epoch": 4296} {"train_loss": -7.053460121154785, "global_step": 180434, "epoch": 4296} {"train_loss": -7.128445625305176, "global_step": 180435, "epoch": 4296} {"train_loss": -7.088350296020508, "global_step": 180436, "epoch": 4296} {"train_loss": -6.998100757598877, "global_step": 180437, "epoch": 4296} {"train_loss": -7.138396263122559, "global_step": 180438, "epoch": 4296} {"train_loss": -6.945527076721191, "global_step": 180439, "epoch": 4296} {"train_loss": -6.977931976318359, "global_step": 180440, "epoch": 4296} {"train_loss": -7.068790435791016, "global_step": 180441, "epoch": 4296} {"train_loss": -7.104111194610596, "global_step": 180442, "epoch": 4296} {"train_loss": -7.158754348754883, "global_step": 180443, "epoch": 4296} {"train_loss": -7.1569061279296875, "global_step": 180444, "epoch": 4296} {"train_loss": -7.010255813598633, "global_step": 180445, "epoch": 4296} {"train_loss": -7.167782783508301, "global_step": 180446, "epoch": 4296} {"train_loss": -6.979035377502441, "global_step": 180447, "epoch": 4296} {"train_loss": -7.0993452072143555, "global_step": 180448, "epoch": 4296} {"train_loss": -7.098921775817871, "global_step": 180449, "epoch": 4296} {"train_loss": -7.096624374389648, "global_step": 180450, "epoch": 4296} {"train_loss": -7.1074018478393555, "global_step": 180451, "epoch": 4296} {"train_loss": -6.963857173919678, "global_step": 180452, "epoch": 4296} {"train_loss": -7.097918510437012, "global_step": 180453, "epoch": 4296} {"train_loss": -7.201910018920898, "global_step": 180454, "epoch": 4296} {"train_loss": -7.083204746246338, "global_step": 180455, "epoch": 4296} {"train_loss": -7.090763092041016, "global_step": 180456, "epoch": 4296} {"train_loss": -7.12023401260376, "global_step": 180457, "epoch": 4296} {"train_loss": -7.169281959533691, "global_step": 180458, "epoch": 4296} {"train_loss": -7.072147846221924, "global_step": 180459, "epoch": 4296} {"train_loss": -7.159563064575195, "global_step": 180460, "epoch": 4296} {"train_loss": -7.086218357086182, "global_step": 180461, "epoch": 4296} {"train_loss": -7.22432804107666, "global_step": 180462, "epoch": 4296} {"train_loss": -7.103233337402344, "global_step": 180463, "epoch": 4296} {"train_loss": -7.072201728820801, "global_step": 180464, "epoch": 4296} {"train_loss": -7.181053638458252, "global_step": 180465, "epoch": 4296} {"train_loss": -7.081210136413574, "global_step": 180466, "epoch": 4296} {"train_loss": -7.150135040283203, "global_step": 180467, "epoch": 4296} {"train_loss": -7.10269832611084, "global_step": 180468, "epoch": 4296} {"train_loss": -7.0931572914123535, "global_step": 180469, "epoch": 4296} {"train_loss": -7.0129289627075195, "global_step": 180470, "epoch": 4296} {"train_loss": -7.163066864013672, "global_step": 180471, "epoch": 4296} {"train_loss": -7.214513301849365, "global_step": 180472, "epoch": 4296} {"train_loss": -7.099550814855666, "global_step": 180473, "epoch": 4296, "val_loss": 69358.9921875} {"train_loss": -7.072664737701416, "global_step": 180474, "epoch": 4297} {"train_loss": -7.09260368347168, "global_step": 180475, "epoch": 4297} {"train_loss": -7.1345696449279785, "global_step": 180476, "epoch": 4297} {"train_loss": -7.204862594604492, "global_step": 180477, "epoch": 4297} {"train_loss": -7.033546447753906, "global_step": 180478, "epoch": 4297} {"train_loss": -7.048120975494385, "global_step": 180479, "epoch": 4297} {"train_loss": -7.141539573669434, "global_step": 180480, "epoch": 4297} {"train_loss": -7.080437660217285, "global_step": 180481, "epoch": 4297} {"train_loss": -7.126311302185059, "global_step": 180482, "epoch": 4297} {"train_loss": -7.125348091125488, "global_step": 180483, "epoch": 4297} {"train_loss": -7.051609516143799, "global_step": 180484, "epoch": 4297} {"train_loss": -6.956748008728027, "global_step": 180485, "epoch": 4297} {"train_loss": -7.193120002746582, "global_step": 180486, "epoch": 4297} {"train_loss": -6.9554033279418945, "global_step": 180487, "epoch": 4297} {"train_loss": -7.07905387878418, "global_step": 180488, "epoch": 4297} {"train_loss": -7.073709964752197, "global_step": 180489, "epoch": 4297} {"train_loss": -7.021135330200195, "global_step": 180490, "epoch": 4297} {"train_loss": -7.067826271057129, "global_step": 180491, "epoch": 4297} {"train_loss": -7.156275272369385, "global_step": 180492, "epoch": 4297} {"train_loss": -7.123797416687012, "global_step": 180493, "epoch": 4297} {"train_loss": -7.137655258178711, "global_step": 180494, "epoch": 4297} {"train_loss": -7.141210556030273, "global_step": 180495, "epoch": 4297} {"train_loss": -7.1985344886779785, "global_step": 180496, "epoch": 4297} {"train_loss": -7.044654369354248, "global_step": 180497, "epoch": 4297} {"train_loss": -7.045114517211914, "global_step": 180498, "epoch": 4297} {"train_loss": -7.139055252075195, "global_step": 180499, "epoch": 4297} {"train_loss": -7.096261024475098, "global_step": 180500, "epoch": 4297} {"train_loss": -7.19204044342041, "global_step": 180501, "epoch": 4297} {"train_loss": -7.1114702224731445, "global_step": 180502, "epoch": 4297} {"train_loss": -7.0023274421691895, "global_step": 180503, "epoch": 4297} {"train_loss": -7.020969390869141, "global_step": 180504, "epoch": 4297} {"train_loss": -6.994915962219238, "global_step": 180505, "epoch": 4297} {"train_loss": -7.0134663581848145, "global_step": 180506, "epoch": 4297} {"train_loss": -7.023325443267822, "global_step": 180507, "epoch": 4297} {"train_loss": -6.885642051696777, "global_step": 180508, "epoch": 4297} {"train_loss": -6.907435417175293, "global_step": 180509, "epoch": 4297} {"train_loss": -7.115558624267578, "global_step": 180510, "epoch": 4297} {"train_loss": -7.047359466552734, "global_step": 180511, "epoch": 4297} {"train_loss": -7.079614162445068, "global_step": 180512, "epoch": 4297} {"train_loss": -7.083014965057373, "global_step": 180513, "epoch": 4297} {"train_loss": -7.103048324584961, "global_step": 180514, "epoch": 4297} {"train_loss": -7.078268334979103, "global_step": 180515, "epoch": 4297, "val_loss": 69424.3046875} {"train_loss": -7.1729021072387695, "global_step": 180516, "epoch": 4298} {"train_loss": -7.129162788391113, "global_step": 180517, "epoch": 4298} {"train_loss": -7.167821407318115, "global_step": 180518, "epoch": 4298} {"train_loss": -7.157321929931641, "global_step": 180519, "epoch": 4298} {"train_loss": -7.219117641448975, "global_step": 180520, "epoch": 4298} {"train_loss": -7.074734210968018, "global_step": 180521, "epoch": 4298} {"train_loss": -7.130727291107178, "global_step": 180522, "epoch": 4298} {"train_loss": -7.218792915344238, "global_step": 180523, "epoch": 4298} {"train_loss": -7.150851249694824, "global_step": 180524, "epoch": 4298} {"train_loss": -7.1079583168029785, "global_step": 180525, "epoch": 4298} {"train_loss": -7.088435173034668, "global_step": 180526, "epoch": 4298} {"train_loss": -7.104794025421143, "global_step": 180527, "epoch": 4298} {"train_loss": -7.178789138793945, "global_step": 180528, "epoch": 4298} {"train_loss": -7.152299880981445, "global_step": 180529, "epoch": 4298} {"train_loss": -7.144201278686523, "global_step": 180530, "epoch": 4298} {"train_loss": -7.14169979095459, "global_step": 180531, "epoch": 4298} {"train_loss": -7.178828239440918, "global_step": 180532, "epoch": 4298} {"train_loss": -6.9868669509887695, "global_step": 180533, "epoch": 4298} {"train_loss": -7.146363258361816, "global_step": 180534, "epoch": 4298} {"train_loss": -7.002010345458984, "global_step": 180535, "epoch": 4298} {"train_loss": -6.851414203643799, "global_step": 180536, "epoch": 4298} {"train_loss": -6.778053283691406, "global_step": 180537, "epoch": 4298} {"train_loss": -7.074862003326416, "global_step": 180538, "epoch": 4298} {"train_loss": -6.666558265686035, "global_step": 180539, "epoch": 4298} {"train_loss": -6.947079181671143, "global_step": 180540, "epoch": 4298} {"train_loss": -6.891430854797363, "global_step": 180541, "epoch": 4298} {"train_loss": -6.750858306884766, "global_step": 180542, "epoch": 4298} {"train_loss": -7.057432651519775, "global_step": 180543, "epoch": 4298} {"train_loss": -6.969882965087891, "global_step": 180544, "epoch": 4298} {"train_loss": -7.025690078735352, "global_step": 180545, "epoch": 4298} {"train_loss": -6.993252754211426, "global_step": 180546, "epoch": 4298} {"train_loss": -6.986870765686035, "global_step": 180547, "epoch": 4298} {"train_loss": -7.124456405639648, "global_step": 180548, "epoch": 4298} {"train_loss": -7.130956172943115, "global_step": 180549, "epoch": 4298} {"train_loss": -7.026645183563232, "global_step": 180550, "epoch": 4298} {"train_loss": -7.140351295471191, "global_step": 180551, "epoch": 4298} {"train_loss": -7.161070823669434, "global_step": 180552, "epoch": 4298} {"train_loss": -7.001527786254883, "global_step": 180553, "epoch": 4298} {"train_loss": -7.049251556396484, "global_step": 180554, "epoch": 4298} {"train_loss": -7.075961112976074, "global_step": 180555, "epoch": 4298} {"train_loss": -6.9733991622924805, "global_step": 180556, "epoch": 4298} {"train_loss": -7.055742422739665, "global_step": 180557, "epoch": 4298, "val_loss": 69281.609375} {"train_loss": -7.121232032775879, "global_step": 180558, "epoch": 4299} {"train_loss": -7.237648963928223, "global_step": 180559, "epoch": 4299} {"train_loss": -7.172898292541504, "global_step": 180560, "epoch": 4299} {"train_loss": -7.186750411987305, "global_step": 180561, "epoch": 4299} {"train_loss": -7.1115875244140625, "global_step": 180562, "epoch": 4299} {"train_loss": -7.138844013214111, "global_step": 180563, "epoch": 4299} {"train_loss": -7.230712890625, "global_step": 180564, "epoch": 4299} {"train_loss": -7.178890705108643, "global_step": 180565, "epoch": 4299} {"train_loss": -7.181459426879883, "global_step": 180566, "epoch": 4299} {"train_loss": -7.141331195831299, "global_step": 180567, "epoch": 4299} {"train_loss": -7.123446464538574, "global_step": 180568, "epoch": 4299} {"train_loss": -7.148279190063477, "global_step": 180569, "epoch": 4299} {"train_loss": -7.017301559448242, "global_step": 180570, "epoch": 4299} {"train_loss": -7.1897993087768555, "global_step": 180571, "epoch": 4299} {"train_loss": -7.198365211486816, "global_step": 180572, "epoch": 4299} {"train_loss": -7.269179344177246, "global_step": 180573, "epoch": 4299} {"train_loss": -7.09744930267334, "global_step": 180574, "epoch": 4299} {"train_loss": -7.042178630828857, "global_step": 180575, "epoch": 4299} {"train_loss": -7.232052803039551, "global_step": 180576, "epoch": 4299} {"train_loss": -7.13485860824585, "global_step": 180577, "epoch": 4299} {"train_loss": -7.111432075500488, "global_step": 180578, "epoch": 4299} {"train_loss": -7.182274341583252, "global_step": 180579, "epoch": 4299} {"train_loss": -7.033115386962891, "global_step": 180580, "epoch": 4299} {"train_loss": -7.255373477935791, "global_step": 180581, "epoch": 4299} {"train_loss": -7.177462577819824, "global_step": 180582, "epoch": 4299} {"train_loss": -7.101579189300537, "global_step": 180583, "epoch": 4299} {"train_loss": -7.171248435974121, "global_step": 180584, "epoch": 4299} {"train_loss": -7.167415618896484, "global_step": 180585, "epoch": 4299} {"train_loss": -7.198648452758789, "global_step": 180586, "epoch": 4299} {"train_loss": -7.006340980529785, "global_step": 180587, "epoch": 4299} {"train_loss": -7.145112991333008, "global_step": 180588, "epoch": 4299} {"train_loss": -7.110537528991699, "global_step": 180589, "epoch": 4299} {"train_loss": -7.103919506072998, "global_step": 180590, "epoch": 4299} {"train_loss": -7.126406669616699, "global_step": 180591, "epoch": 4299} {"train_loss": -6.958409786224365, "global_step": 180592, "epoch": 4299} {"train_loss": -7.126726150512695, "global_step": 180593, "epoch": 4299} {"train_loss": -7.023407936096191, "global_step": 180594, "epoch": 4299} {"train_loss": -7.060018539428711, "global_step": 180595, "epoch": 4299} {"train_loss": -7.169681072235107, "global_step": 180596, "epoch": 4299} {"train_loss": -7.172659397125244, "global_step": 180597, "epoch": 4299} {"train_loss": -7.019777774810791, "global_step": 180598, "epoch": 4299} {"train_loss": -7.133945782979329, "global_step": 180599, "epoch": 4299, "val_loss": 69398.125} {"train_loss": -7.048103332519531, "global_step": 180600, "epoch": 4300} {"train_loss": -7.1650848388671875, "global_step": 180601, "epoch": 4300} {"train_loss": -6.960140228271484, "global_step": 180602, "epoch": 4300} {"train_loss": -7.104599952697754, "global_step": 180603, "epoch": 4300} {"train_loss": -7.091384410858154, "global_step": 180604, "epoch": 4300} {"train_loss": -7.081730842590332, "global_step": 180605, "epoch": 4300} {"train_loss": -7.097607612609863, "global_step": 180606, "epoch": 4300} {"train_loss": -6.89801549911499, "global_step": 180607, "epoch": 4300} {"train_loss": -7.092058181762695, "global_step": 180608, "epoch": 4300} {"train_loss": -6.963830947875977, "global_step": 180609, "epoch": 4300} {"train_loss": -6.997622489929199, "global_step": 180610, "epoch": 4300} {"train_loss": -7.1477813720703125, "global_step": 180611, "epoch": 4300} {"train_loss": -7.022154808044434, "global_step": 180612, "epoch": 4300} {"train_loss": -7.16392183303833, "global_step": 180613, "epoch": 4300} {"train_loss": -7.050528526306152, "global_step": 180614, "epoch": 4300} {"train_loss": -7.086028099060059, "global_step": 180615, "epoch": 4300} {"train_loss": -6.963925838470459, "global_step": 180616, "epoch": 4300} {"train_loss": -7.065183639526367, "global_step": 180617, "epoch": 4300} {"train_loss": -7.119515419006348, "global_step": 180618, "epoch": 4300} {"train_loss": -6.98729133605957, "global_step": 180619, "epoch": 4300} {"train_loss": -7.034677982330322, "global_step": 180620, "epoch": 4300} {"train_loss": -7.1411638259887695, "global_step": 180621, "epoch": 4300} {"train_loss": -7.136786460876465, "global_step": 180622, "epoch": 4300} {"train_loss": -7.036612510681152, "global_step": 180623, "epoch": 4300} {"train_loss": -7.162088871002197, "global_step": 180624, "epoch": 4300} {"train_loss": -7.1588969230651855, "global_step": 180625, "epoch": 4300} {"train_loss": -7.158660888671875, "global_step": 180626, "epoch": 4300} {"train_loss": -7.111616134643555, "global_step": 180627, "epoch": 4300} {"train_loss": -7.009815216064453, "global_step": 180628, "epoch": 4300} {"train_loss": -7.020509719848633, "global_step": 180629, "epoch": 4300} {"train_loss": -7.091615676879883, "global_step": 180630, "epoch": 4300} {"train_loss": -7.12309455871582, "global_step": 180631, "epoch": 4300} {"train_loss": -7.104077339172363, "global_step": 180632, "epoch": 4300} {"train_loss": -7.078075408935547, "global_step": 180633, "epoch": 4300} {"train_loss": -7.119839668273926, "global_step": 180634, "epoch": 4300} {"train_loss": -7.126794815063477, "global_step": 180635, "epoch": 4300} {"train_loss": -7.032773971557617, "global_step": 180636, "epoch": 4300} {"train_loss": -7.077657222747803, "global_step": 180637, "epoch": 4300} {"train_loss": -7.030916690826416, "global_step": 180638, "epoch": 4300} {"train_loss": -7.122714042663574, "global_step": 180639, "epoch": 4300} {"train_loss": -7.081982612609863, "global_step": 180640, "epoch": 4300} {"train_loss": -7.074245963777814, "global_step": 180641, "epoch": 4300, "train/sim_max_reward_0": 0.19573482261689337, "train/sim_max_reward_1": 0.9126378235078703, "train/sim_max_reward_2": 0.673179826775528, "train/sim_max_reward_3": 0.9779921354823943, "train/sim_max_reward_4": 0.9984967277835576, "train/sim_max_reward_5": 0.9550199056437582, "test/sim_max_reward_4300000": 0.8577794563469497, "test/sim_max_reward_4300001": 0.5555555345222609, "test/sim_max_reward_4300002": 0.9094143244439127, "test/sim_max_reward_4300003": 0.9942614311643758, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9344595471364597, "test/sim_max_reward_4300008": 0.28885218786708333, "test/sim_max_reward_4300009": 0.8566813592675718, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.5273249731703373, "test/sim_max_reward_4300012": 0.9619504258061108, "test/sim_max_reward_4300013": 0.8226124469659863, "test/sim_max_reward_4300014": 0.9956270975103948, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.0014415597887647577, "test/sim_max_reward_4300017": 0.8999668921171421, "test/sim_max_reward_4300018": 0.37786110147634683, "test/sim_max_reward_4300019": 0.18611377305629534, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9215623044783499, "test/sim_max_reward_4300022": 0.9279532063982351, "test/sim_max_reward_4300023": 0.939476076535028, "test/sim_max_reward_4300024": 0.4835266133130353, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.9788736183632497, "test/sim_max_reward_4300027": 0.9483131710320128, "test/sim_max_reward_4300028": 0.9277795629137663, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.25537331576713146, "test/sim_max_reward_4300031": 0.24027857643083345, "test/sim_max_reward_4300032": 0.9576741203343505, "test/sim_max_reward_4300033": 0.916147353595072, "test/sim_max_reward_4300034": 0.3563469893002779, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.20839943748990397, "test/sim_max_reward_4300037": 0.8610706166352426, "test/sim_max_reward_4300038": 0.9760317390721754, "test/sim_max_reward_4300039": 0.8715889689736863, "test/sim_max_reward_4300040": 0.9887384137342736, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7058641289508729, "test/sim_max_reward_4300043": 0.10647179625949231, "test/sim_max_reward_4300044": 0.8255474401108355, "test/sim_max_reward_4300045": 0.9654343014220191, "test/sim_max_reward_4300046": 0.7480639749480011, "test/sim_max_reward_4300047": 0.16968839913509579, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.12965824579307902, "train/mean_score": 0.7855102069683336, "test/mean_score": 0.5919119717287059, "val_loss": 69270.9140625} {"train_loss": -7.174921989440918, "global_step": 180642, "epoch": 4301} {"train_loss": -7.043833255767822, "global_step": 180643, "epoch": 4301} {"train_loss": -7.036033630371094, "global_step": 180644, "epoch": 4301} {"train_loss": -7.093311309814453, "global_step": 180645, "epoch": 4301} {"train_loss": -7.076817512512207, "global_step": 180646, "epoch": 4301} {"train_loss": -7.062419891357422, "global_step": 180647, "epoch": 4301} {"train_loss": -7.132390022277832, "global_step": 180648, "epoch": 4301} {"train_loss": -7.083782196044922, "global_step": 180649, "epoch": 4301} {"train_loss": -7.077157497406006, "global_step": 180650, "epoch": 4301} {"train_loss": -7.08077335357666, "global_step": 180651, "epoch": 4301} {"train_loss": -7.0888237953186035, "global_step": 180652, "epoch": 4301} {"train_loss": -7.099477291107178, "global_step": 180653, "epoch": 4301} {"train_loss": -7.156455993652344, "global_step": 180654, "epoch": 4301} {"train_loss": -7.085582733154297, "global_step": 180655, "epoch": 4301} {"train_loss": -7.161181449890137, "global_step": 180656, "epoch": 4301} {"train_loss": -7.049761772155762, "global_step": 180657, "epoch": 4301} {"train_loss": -7.010778427124023, "global_step": 180658, "epoch": 4301} {"train_loss": -7.104427814483643, "global_step": 180659, "epoch": 4301} {"train_loss": -7.067562103271484, "global_step": 180660, "epoch": 4301} {"train_loss": -7.1170573234558105, "global_step": 180661, "epoch": 4301} {"train_loss": -7.064040184020996, "global_step": 180662, "epoch": 4301} {"train_loss": -7.1798176765441895, "global_step": 180663, "epoch": 4301} {"train_loss": -7.0882792472839355, "global_step": 180664, "epoch": 4301} {"train_loss": -7.182933807373047, "global_step": 180665, "epoch": 4301} {"train_loss": -7.130849361419678, "global_step": 180666, "epoch": 4301} {"train_loss": -7.058853626251221, "global_step": 180667, "epoch": 4301} {"train_loss": -7.094968318939209, "global_step": 180668, "epoch": 4301} {"train_loss": -7.252536296844482, "global_step": 180669, "epoch": 4301} {"train_loss": -7.082228183746338, "global_step": 180670, "epoch": 4301} {"train_loss": -7.0541462898254395, "global_step": 180671, "epoch": 4301} {"train_loss": -7.041754722595215, "global_step": 180672, "epoch": 4301} {"train_loss": -7.048853874206543, "global_step": 180673, "epoch": 4301} {"train_loss": -7.112128257751465, "global_step": 180674, "epoch": 4301} {"train_loss": -7.129657745361328, "global_step": 180675, "epoch": 4301} {"train_loss": -7.086913585662842, "global_step": 180676, "epoch": 4301} {"train_loss": -7.130298614501953, "global_step": 180677, "epoch": 4301} {"train_loss": -7.116665840148926, "global_step": 180678, "epoch": 4301} {"train_loss": -7.198392391204834, "global_step": 180679, "epoch": 4301} {"train_loss": -7.244287014007568, "global_step": 180680, "epoch": 4301} {"train_loss": -7.090643405914307, "global_step": 180681, "epoch": 4301} {"train_loss": -7.139848709106445, "global_step": 180682, "epoch": 4301} {"train_loss": -7.106098106929234, "global_step": 180683, "epoch": 4301, "val_loss": 69353.0} {"train_loss": -7.269769668579102, "global_step": 180684, "epoch": 4302} {"train_loss": -7.3268256187438965, "global_step": 180685, "epoch": 4302} {"train_loss": -7.1104559898376465, "global_step": 180686, "epoch": 4302} {"train_loss": -7.134213447570801, "global_step": 180687, "epoch": 4302} {"train_loss": -7.18173885345459, "global_step": 180688, "epoch": 4302} {"train_loss": -7.17414665222168, "global_step": 180689, "epoch": 4302} {"train_loss": -7.089898109436035, "global_step": 180690, "epoch": 4302} {"train_loss": -7.24840784072876, "global_step": 180691, "epoch": 4302} {"train_loss": -7.212567329406738, "global_step": 180692, "epoch": 4302} {"train_loss": -7.183104515075684, "global_step": 180693, "epoch": 4302} {"train_loss": -7.1247639656066895, "global_step": 180694, "epoch": 4302} {"train_loss": -7.130719184875488, "global_step": 180695, "epoch": 4302} {"train_loss": -7.239017963409424, "global_step": 180696, "epoch": 4302} {"train_loss": -7.177268981933594, "global_step": 180697, "epoch": 4302} {"train_loss": -7.125550270080566, "global_step": 180698, "epoch": 4302} {"train_loss": -7.120279312133789, "global_step": 180699, "epoch": 4302} {"train_loss": -7.160039901733398, "global_step": 180700, "epoch": 4302} {"train_loss": -7.190492153167725, "global_step": 180701, "epoch": 4302} {"train_loss": -7.201804161071777, "global_step": 180702, "epoch": 4302} {"train_loss": -7.133697509765625, "global_step": 180703, "epoch": 4302} {"train_loss": -7.210951805114746, "global_step": 180704, "epoch": 4302} {"train_loss": -7.230205535888672, "global_step": 180705, "epoch": 4302} {"train_loss": -7.139129638671875, "global_step": 180706, "epoch": 4302} {"train_loss": -7.3519439697265625, "global_step": 180707, "epoch": 4302} {"train_loss": -7.2668561935424805, "global_step": 180708, "epoch": 4302} {"train_loss": -7.122164726257324, "global_step": 180709, "epoch": 4302} {"train_loss": -7.232690811157227, "global_step": 180710, "epoch": 4302} {"train_loss": -7.125785827636719, "global_step": 180711, "epoch": 4302} {"train_loss": -7.058689594268799, "global_step": 180712, "epoch": 4302} {"train_loss": -7.224379539489746, "global_step": 180713, "epoch": 4302} {"train_loss": -7.172801971435547, "global_step": 180714, "epoch": 4302} {"train_loss": -7.2394866943359375, "global_step": 180715, "epoch": 4302} {"train_loss": -7.1764678955078125, "global_step": 180716, "epoch": 4302} {"train_loss": -7.082786560058594, "global_step": 180717, "epoch": 4302} {"train_loss": -7.101553440093994, "global_step": 180718, "epoch": 4302} {"train_loss": -7.1416015625, "global_step": 180719, "epoch": 4302} {"train_loss": -7.053591251373291, "global_step": 180720, "epoch": 4302} {"train_loss": -7.141018867492676, "global_step": 180721, "epoch": 4302} {"train_loss": -7.159697532653809, "global_step": 180722, "epoch": 4302} {"train_loss": -7.167644023895264, "global_step": 180723, "epoch": 4302} {"train_loss": -7.147952079772949, "global_step": 180724, "epoch": 4302} {"train_loss": -7.171989191146124, "global_step": 180725, "epoch": 4302, "val_loss": 69306.8046875} {"train_loss": -7.1795735359191895, "global_step": 180726, "epoch": 4303} {"train_loss": -7.182456970214844, "global_step": 180727, "epoch": 4303} {"train_loss": -7.155941963195801, "global_step": 180728, "epoch": 4303} {"train_loss": -7.201910972595215, "global_step": 180729, "epoch": 4303} {"train_loss": -7.1634321212768555, "global_step": 180730, "epoch": 4303} {"train_loss": -7.253437042236328, "global_step": 180731, "epoch": 4303} {"train_loss": -7.0300469398498535, "global_step": 180732, "epoch": 4303} {"train_loss": -7.176642894744873, "global_step": 180733, "epoch": 4303} {"train_loss": -7.099470138549805, "global_step": 180734, "epoch": 4303} {"train_loss": -6.998462677001953, "global_step": 180735, "epoch": 4303} {"train_loss": -7.143518447875977, "global_step": 180736, "epoch": 4303} {"train_loss": -7.188265800476074, "global_step": 180737, "epoch": 4303} {"train_loss": -7.073536396026611, "global_step": 180738, "epoch": 4303} {"train_loss": -7.096527099609375, "global_step": 180739, "epoch": 4303} {"train_loss": -7.074407577514648, "global_step": 180740, "epoch": 4303} {"train_loss": -7.045653343200684, "global_step": 180741, "epoch": 4303} {"train_loss": -7.054753303527832, "global_step": 180742, "epoch": 4303} {"train_loss": -7.113550186157227, "global_step": 180743, "epoch": 4303} {"train_loss": -7.1689629554748535, "global_step": 180744, "epoch": 4303} {"train_loss": -7.161470413208008, "global_step": 180745, "epoch": 4303} {"train_loss": -6.92323112487793, "global_step": 180746, "epoch": 4303} {"train_loss": -7.015007972717285, "global_step": 180747, "epoch": 4303} {"train_loss": -7.116559982299805, "global_step": 180748, "epoch": 4303} {"train_loss": -6.939540386199951, "global_step": 180749, "epoch": 4303} {"train_loss": -7.1212005615234375, "global_step": 180750, "epoch": 4303} {"train_loss": -7.101042747497559, "global_step": 180751, "epoch": 4303} {"train_loss": -7.06166410446167, "global_step": 180752, "epoch": 4303} {"train_loss": -7.0186872482299805, "global_step": 180753, "epoch": 4303} {"train_loss": -7.161700248718262, "global_step": 180754, "epoch": 4303} {"train_loss": -7.058708190917969, "global_step": 180755, "epoch": 4303} {"train_loss": -7.140744209289551, "global_step": 180756, "epoch": 4303} {"train_loss": -7.1312456130981445, "global_step": 180757, "epoch": 4303} {"train_loss": -7.008956432342529, "global_step": 180758, "epoch": 4303} {"train_loss": -7.123661041259766, "global_step": 180759, "epoch": 4303} {"train_loss": -7.028252124786377, "global_step": 180760, "epoch": 4303} {"train_loss": -7.090515613555908, "global_step": 180761, "epoch": 4303} {"train_loss": -7.099994659423828, "global_step": 180762, "epoch": 4303} {"train_loss": -7.080382347106934, "global_step": 180763, "epoch": 4303} {"train_loss": -7.13587760925293, "global_step": 180764, "epoch": 4303} {"train_loss": -7.044877529144287, "global_step": 180765, "epoch": 4303} {"train_loss": -7.028305530548096, "global_step": 180766, "epoch": 4303} {"train_loss": -7.097729251498268, "global_step": 180767, "epoch": 4303, "val_loss": 69234.40625} {"train_loss": -7.006068706512451, "global_step": 180768, "epoch": 4304} {"train_loss": -7.090152263641357, "global_step": 180769, "epoch": 4304} {"train_loss": -7.14534330368042, "global_step": 180770, "epoch": 4304} {"train_loss": -6.955624580383301, "global_step": 180771, "epoch": 4304} {"train_loss": -7.098938941955566, "global_step": 180772, "epoch": 4304} {"train_loss": -7.000274181365967, "global_step": 180773, "epoch": 4304} {"train_loss": -6.957527160644531, "global_step": 180774, "epoch": 4304} {"train_loss": -7.190003395080566, "global_step": 180775, "epoch": 4304} {"train_loss": -7.05704402923584, "global_step": 180776, "epoch": 4304} {"train_loss": -7.030228614807129, "global_step": 180777, "epoch": 4304} {"train_loss": -7.227950096130371, "global_step": 180778, "epoch": 4304} {"train_loss": -7.15479850769043, "global_step": 180779, "epoch": 4304} {"train_loss": -7.0496978759765625, "global_step": 180780, "epoch": 4304} {"train_loss": -7.103246688842773, "global_step": 180781, "epoch": 4304} {"train_loss": -7.139960289001465, "global_step": 180782, "epoch": 4304} {"train_loss": -7.15097713470459, "global_step": 180783, "epoch": 4304} {"train_loss": -7.019253730773926, "global_step": 180784, "epoch": 4304} {"train_loss": -7.169642448425293, "global_step": 180785, "epoch": 4304} {"train_loss": -7.172871112823486, "global_step": 180786, "epoch": 4304} {"train_loss": -7.022234916687012, "global_step": 180787, "epoch": 4304} {"train_loss": -7.171406269073486, "global_step": 180788, "epoch": 4304} {"train_loss": -7.151667594909668, "global_step": 180789, "epoch": 4304} {"train_loss": -7.118265628814697, "global_step": 180790, "epoch": 4304} {"train_loss": -7.108222007751465, "global_step": 180791, "epoch": 4304} {"train_loss": -7.218197822570801, "global_step": 180792, "epoch": 4304} {"train_loss": -7.098651885986328, "global_step": 180793, "epoch": 4304} {"train_loss": -7.013686180114746, "global_step": 180794, "epoch": 4304} {"train_loss": -7.124513149261475, "global_step": 180795, "epoch": 4304} {"train_loss": -7.076533794403076, "global_step": 180796, "epoch": 4304} {"train_loss": -7.117746353149414, "global_step": 180797, "epoch": 4304} {"train_loss": -7.160529136657715, "global_step": 180798, "epoch": 4304} {"train_loss": -7.021178245544434, "global_step": 180799, "epoch": 4304} {"train_loss": -7.104334831237793, "global_step": 180800, "epoch": 4304} {"train_loss": -7.108954429626465, "global_step": 180801, "epoch": 4304} {"train_loss": -7.1625189781188965, "global_step": 180802, "epoch": 4304} {"train_loss": -7.03819465637207, "global_step": 180803, "epoch": 4304} {"train_loss": -7.164215087890625, "global_step": 180804, "epoch": 4304} {"train_loss": -7.17856502532959, "global_step": 180805, "epoch": 4304} {"train_loss": -7.092291831970215, "global_step": 180806, "epoch": 4304} {"train_loss": -7.205456733703613, "global_step": 180807, "epoch": 4304} {"train_loss": -7.0206804275512695, "global_step": 180808, "epoch": 4304} {"train_loss": -7.103794722330003, "global_step": 180809, "epoch": 4304, "val_loss": 69400.921875} {"train_loss": -7.2782464027404785, "global_step": 180810, "epoch": 4305} {"train_loss": -7.215737342834473, "global_step": 180811, "epoch": 4305} {"train_loss": -7.288173675537109, "global_step": 180812, "epoch": 4305} {"train_loss": -7.2043280601501465, "global_step": 180813, "epoch": 4305} {"train_loss": -7.1828765869140625, "global_step": 180814, "epoch": 4305} {"train_loss": -7.1560187339782715, "global_step": 180815, "epoch": 4305} {"train_loss": -7.18739128112793, "global_step": 180816, "epoch": 4305} {"train_loss": -7.214581489562988, "global_step": 180817, "epoch": 4305} {"train_loss": -7.039776802062988, "global_step": 180818, "epoch": 4305} {"train_loss": -7.0955352783203125, "global_step": 180819, "epoch": 4305} {"train_loss": -7.2658257484436035, "global_step": 180820, "epoch": 4305} {"train_loss": -7.064164161682129, "global_step": 180821, "epoch": 4305} {"train_loss": -7.170246124267578, "global_step": 180822, "epoch": 4305} {"train_loss": -7.16938591003418, "global_step": 180823, "epoch": 4305} {"train_loss": -7.164032936096191, "global_step": 180824, "epoch": 4305} {"train_loss": -7.086716651916504, "global_step": 180825, "epoch": 4305} {"train_loss": -7.124191761016846, "global_step": 180826, "epoch": 4305} {"train_loss": -7.2708892822265625, "global_step": 180827, "epoch": 4305} {"train_loss": -7.231310844421387, "global_step": 180828, "epoch": 4305} {"train_loss": -7.054178237915039, "global_step": 180829, "epoch": 4305} {"train_loss": -7.026208877563477, "global_step": 180830, "epoch": 4305} {"train_loss": -7.165241241455078, "global_step": 180831, "epoch": 4305} {"train_loss": -7.122515678405762, "global_step": 180832, "epoch": 4305} {"train_loss": -7.134565830230713, "global_step": 180833, "epoch": 4305} {"train_loss": -7.096821308135986, "global_step": 180834, "epoch": 4305} {"train_loss": -7.082910537719727, "global_step": 180835, "epoch": 4305} {"train_loss": -7.0040740966796875, "global_step": 180836, "epoch": 4305} {"train_loss": -7.157381057739258, "global_step": 180837, "epoch": 4305} {"train_loss": -7.198134422302246, "global_step": 180838, "epoch": 4305} {"train_loss": -7.136460304260254, "global_step": 180839, "epoch": 4305} {"train_loss": -7.104048728942871, "global_step": 180840, "epoch": 4305} {"train_loss": -7.181112289428711, "global_step": 180841, "epoch": 4305} {"train_loss": -7.0427961349487305, "global_step": 180842, "epoch": 4305} {"train_loss": -7.105278968811035, "global_step": 180843, "epoch": 4305} {"train_loss": -7.1740593910217285, "global_step": 180844, "epoch": 4305} {"train_loss": -7.083372592926025, "global_step": 180845, "epoch": 4305} {"train_loss": -7.126171588897705, "global_step": 180846, "epoch": 4305} {"train_loss": -7.166450500488281, "global_step": 180847, "epoch": 4305} {"train_loss": -7.041098117828369, "global_step": 180848, "epoch": 4305} {"train_loss": -7.110141754150391, "global_step": 180849, "epoch": 4305} {"train_loss": -7.075827598571777, "global_step": 180850, "epoch": 4305} {"train_loss": -7.142682245799473, "global_step": 180851, "epoch": 4305, "val_loss": 69264.7109375} {"train_loss": -7.1244306564331055, "global_step": 180852, "epoch": 4306} {"train_loss": -7.1620192527771, "global_step": 180853, "epoch": 4306} {"train_loss": -7.150867462158203, "global_step": 180854, "epoch": 4306} {"train_loss": -7.140916347503662, "global_step": 180855, "epoch": 4306} {"train_loss": -7.179290771484375, "global_step": 180856, "epoch": 4306} {"train_loss": -7.133056640625, "global_step": 180857, "epoch": 4306} {"train_loss": -7.031454086303711, "global_step": 180858, "epoch": 4306} {"train_loss": -7.101006031036377, "global_step": 180859, "epoch": 4306} {"train_loss": -7.074610233306885, "global_step": 180860, "epoch": 4306} {"train_loss": -7.1803879737854, "global_step": 180861, "epoch": 4306} {"train_loss": -7.253024578094482, "global_step": 180862, "epoch": 4306} {"train_loss": -6.9864583015441895, "global_step": 180863, "epoch": 4306} {"train_loss": -7.0462541580200195, "global_step": 180864, "epoch": 4306} {"train_loss": -7.1719865798950195, "global_step": 180865, "epoch": 4306} {"train_loss": -7.0684919357299805, "global_step": 180866, "epoch": 4306} {"train_loss": -7.04689884185791, "global_step": 180867, "epoch": 4306} {"train_loss": -7.036827564239502, "global_step": 180868, "epoch": 4306} {"train_loss": -7.064194679260254, "global_step": 180869, "epoch": 4306} {"train_loss": -6.986163139343262, "global_step": 180870, "epoch": 4306} {"train_loss": -7.173315525054932, "global_step": 180871, "epoch": 4306} {"train_loss": -7.058518409729004, "global_step": 180872, "epoch": 4306} {"train_loss": -7.047998428344727, "global_step": 180873, "epoch": 4306} {"train_loss": -7.0454301834106445, "global_step": 180874, "epoch": 4306} {"train_loss": -7.132894039154053, "global_step": 180875, "epoch": 4306} {"train_loss": -7.111084461212158, "global_step": 180876, "epoch": 4306} {"train_loss": -7.090099811553955, "global_step": 180877, "epoch": 4306} {"train_loss": -7.163609504699707, "global_step": 180878, "epoch": 4306} {"train_loss": -7.168312072753906, "global_step": 180879, "epoch": 4306} {"train_loss": -7.183462619781494, "global_step": 180880, "epoch": 4306} {"train_loss": -7.125845909118652, "global_step": 180881, "epoch": 4306} {"train_loss": -7.121949672698975, "global_step": 180882, "epoch": 4306} {"train_loss": -7.18819522857666, "global_step": 180883, "epoch": 4306} {"train_loss": -7.106590747833252, "global_step": 180884, "epoch": 4306} {"train_loss": -7.170957088470459, "global_step": 180885, "epoch": 4306} {"train_loss": -7.157852649688721, "global_step": 180886, "epoch": 4306} {"train_loss": -7.265244007110596, "global_step": 180887, "epoch": 4306} {"train_loss": -7.180825233459473, "global_step": 180888, "epoch": 4306} {"train_loss": -7.154544830322266, "global_step": 180889, "epoch": 4306} {"train_loss": -7.102272033691406, "global_step": 180890, "epoch": 4306} {"train_loss": -7.092837333679199, "global_step": 180891, "epoch": 4306} {"train_loss": -7.211211681365967, "global_step": 180892, "epoch": 4306} {"train_loss": -7.119580915996006, "global_step": 180893, "epoch": 4306, "val_loss": 69304.390625} {"train_loss": -7.188075542449951, "global_step": 180894, "epoch": 4307} {"train_loss": -7.157502174377441, "global_step": 180895, "epoch": 4307} {"train_loss": -6.915327072143555, "global_step": 180896, "epoch": 4307} {"train_loss": -7.016655921936035, "global_step": 180897, "epoch": 4307} {"train_loss": -7.088831901550293, "global_step": 180898, "epoch": 4307} {"train_loss": -6.980886459350586, "global_step": 180899, "epoch": 4307} {"train_loss": -7.052392482757568, "global_step": 180900, "epoch": 4307} {"train_loss": -6.975594520568848, "global_step": 180901, "epoch": 4307} {"train_loss": -7.025083541870117, "global_step": 180902, "epoch": 4307} {"train_loss": -6.988639831542969, "global_step": 180903, "epoch": 4307} {"train_loss": -7.032155990600586, "global_step": 180904, "epoch": 4307} {"train_loss": -6.859339714050293, "global_step": 180905, "epoch": 4307} {"train_loss": -6.799617767333984, "global_step": 180906, "epoch": 4307} {"train_loss": -6.913148880004883, "global_step": 180907, "epoch": 4307} {"train_loss": -6.8723673820495605, "global_step": 180908, "epoch": 4307} {"train_loss": -7.023168563842773, "global_step": 180909, "epoch": 4307} {"train_loss": -6.861623764038086, "global_step": 180910, "epoch": 4307} {"train_loss": -7.110352516174316, "global_step": 180911, "epoch": 4307} {"train_loss": -6.9878997802734375, "global_step": 180912, "epoch": 4307} {"train_loss": -7.030949592590332, "global_step": 180913, "epoch": 4307} {"train_loss": -6.911128997802734, "global_step": 180914, "epoch": 4307} {"train_loss": -6.951845169067383, "global_step": 180915, "epoch": 4307} {"train_loss": -6.997228145599365, "global_step": 180916, "epoch": 4307} {"train_loss": -6.973447799682617, "global_step": 180917, "epoch": 4307} {"train_loss": -6.983299255371094, "global_step": 180918, "epoch": 4307} {"train_loss": -7.0847673416137695, "global_step": 180919, "epoch": 4307} {"train_loss": -6.904228210449219, "global_step": 180920, "epoch": 4307} {"train_loss": -7.052522659301758, "global_step": 180921, "epoch": 4307} {"train_loss": -7.017691612243652, "global_step": 180922, "epoch": 4307} {"train_loss": -7.021096229553223, "global_step": 180923, "epoch": 4307} {"train_loss": -6.858247756958008, "global_step": 180924, "epoch": 4307} {"train_loss": -7.1460185050964355, "global_step": 180925, "epoch": 4307} {"train_loss": -7.139837265014648, "global_step": 180926, "epoch": 4307} {"train_loss": -7.0737433433532715, "global_step": 180927, "epoch": 4307} {"train_loss": -7.118513584136963, "global_step": 180928, "epoch": 4307} {"train_loss": -6.975743293762207, "global_step": 180929, "epoch": 4307} {"train_loss": -7.051154136657715, "global_step": 180930, "epoch": 4307} {"train_loss": -6.964122772216797, "global_step": 180931, "epoch": 4307} {"train_loss": -7.104270935058594, "global_step": 180932, "epoch": 4307} {"train_loss": -7.0350823402404785, "global_step": 180933, "epoch": 4307} {"train_loss": -7.145665168762207, "global_step": 180934, "epoch": 4307} {"train_loss": -7.009906439554124, "global_step": 180935, "epoch": 4307, "val_loss": 69318.78125} {"train_loss": -7.075772285461426, "global_step": 180936, "epoch": 4308} {"train_loss": -7.056883335113525, "global_step": 180937, "epoch": 4308} {"train_loss": -7.123427867889404, "global_step": 180938, "epoch": 4308} {"train_loss": -7.082133769989014, "global_step": 180939, "epoch": 4308} {"train_loss": -7.106315612792969, "global_step": 180940, "epoch": 4308} {"train_loss": -7.150623798370361, "global_step": 180941, "epoch": 4308} {"train_loss": -7.225033760070801, "global_step": 180942, "epoch": 4308} {"train_loss": -7.015725135803223, "global_step": 180943, "epoch": 4308} {"train_loss": -7.193092346191406, "global_step": 180944, "epoch": 4308} {"train_loss": -7.055363178253174, "global_step": 180945, "epoch": 4308} {"train_loss": -7.12958288192749, "global_step": 180946, "epoch": 4308} {"train_loss": -7.11138391494751, "global_step": 180947, "epoch": 4308} {"train_loss": -7.134515762329102, "global_step": 180948, "epoch": 4308} {"train_loss": -7.165771961212158, "global_step": 180949, "epoch": 4308} {"train_loss": -7.177743911743164, "global_step": 180950, "epoch": 4308} {"train_loss": -7.171389102935791, "global_step": 180951, "epoch": 4308} {"train_loss": -7.130082607269287, "global_step": 180952, "epoch": 4308} {"train_loss": -7.280921459197998, "global_step": 180953, "epoch": 4308} {"train_loss": -7.0247650146484375, "global_step": 180954, "epoch": 4308} {"train_loss": -7.144230842590332, "global_step": 180955, "epoch": 4308} {"train_loss": -7.120503902435303, "global_step": 180956, "epoch": 4308} {"train_loss": -7.180338382720947, "global_step": 180957, "epoch": 4308} {"train_loss": -7.19818115234375, "global_step": 180958, "epoch": 4308} {"train_loss": -7.140584945678711, "global_step": 180959, "epoch": 4308} {"train_loss": -7.100870609283447, "global_step": 180960, "epoch": 4308} {"train_loss": -7.136166572570801, "global_step": 180961, "epoch": 4308} {"train_loss": -7.159234046936035, "global_step": 180962, "epoch": 4308} {"train_loss": -7.146686553955078, "global_step": 180963, "epoch": 4308} {"train_loss": -7.349839210510254, "global_step": 180964, "epoch": 4308} {"train_loss": -7.133938789367676, "global_step": 180965, "epoch": 4308} {"train_loss": -7.240288734436035, "global_step": 180966, "epoch": 4308} {"train_loss": -7.080876350402832, "global_step": 180967, "epoch": 4308} {"train_loss": -7.053725242614746, "global_step": 180968, "epoch": 4308} {"train_loss": -7.246136665344238, "global_step": 180969, "epoch": 4308} {"train_loss": -7.115451812744141, "global_step": 180970, "epoch": 4308} {"train_loss": -7.056817054748535, "global_step": 180971, "epoch": 4308} {"train_loss": -7.1623921394348145, "global_step": 180972, "epoch": 4308} {"train_loss": -7.078523635864258, "global_step": 180973, "epoch": 4308} {"train_loss": -7.017269611358643, "global_step": 180974, "epoch": 4308} {"train_loss": -7.161849498748779, "global_step": 180975, "epoch": 4308} {"train_loss": -7.1068806648254395, "global_step": 180976, "epoch": 4308} {"train_loss": -7.135112376440139, "global_step": 180977, "epoch": 4308, "val_loss": 69367.3125} {"train_loss": -7.147136688232422, "global_step": 180978, "epoch": 4309} {"train_loss": -7.251709461212158, "global_step": 180979, "epoch": 4309} {"train_loss": -7.143144130706787, "global_step": 180980, "epoch": 4309} {"train_loss": -7.215503692626953, "global_step": 180981, "epoch": 4309} {"train_loss": -6.949728488922119, "global_step": 180982, "epoch": 4309} {"train_loss": -7.185100078582764, "global_step": 180983, "epoch": 4309} {"train_loss": -7.191967010498047, "global_step": 180984, "epoch": 4309} {"train_loss": -7.216462135314941, "global_step": 180985, "epoch": 4309} {"train_loss": -7.121416091918945, "global_step": 180986, "epoch": 4309} {"train_loss": -7.0845947265625, "global_step": 180987, "epoch": 4309} {"train_loss": -7.064390659332275, "global_step": 180988, "epoch": 4309} {"train_loss": -7.212973594665527, "global_step": 180989, "epoch": 4309} {"train_loss": -7.215717792510986, "global_step": 180990, "epoch": 4309} {"train_loss": -7.214747428894043, "global_step": 180991, "epoch": 4309} {"train_loss": -7.197055816650391, "global_step": 180992, "epoch": 4309} {"train_loss": -7.232578277587891, "global_step": 180993, "epoch": 4309} {"train_loss": -7.226284027099609, "global_step": 180994, "epoch": 4309} {"train_loss": -7.220306396484375, "global_step": 180995, "epoch": 4309} {"train_loss": -7.132284641265869, "global_step": 180996, "epoch": 4309} {"train_loss": -7.06567907333374, "global_step": 180997, "epoch": 4309} {"train_loss": -7.230737686157227, "global_step": 180998, "epoch": 4309} {"train_loss": -6.994714736938477, "global_step": 180999, "epoch": 4309} {"train_loss": -7.109827041625977, "global_step": 181000, "epoch": 4309} {"train_loss": -7.017836093902588, "global_step": 181001, "epoch": 4309} {"train_loss": -6.992923736572266, "global_step": 181002, "epoch": 4309} {"train_loss": -7.101705074310303, "global_step": 181003, "epoch": 4309} {"train_loss": -7.20646333694458, "global_step": 181004, "epoch": 4309} {"train_loss": -7.09876012802124, "global_step": 181005, "epoch": 4309} {"train_loss": -7.113195419311523, "global_step": 181006, "epoch": 4309} {"train_loss": -7.0705108642578125, "global_step": 181007, "epoch": 4309} {"train_loss": -6.997037887573242, "global_step": 181008, "epoch": 4309} {"train_loss": -7.152361869812012, "global_step": 181009, "epoch": 4309} {"train_loss": -6.979001998901367, "global_step": 181010, "epoch": 4309} {"train_loss": -6.995382308959961, "global_step": 181011, "epoch": 4309} {"train_loss": -7.100714206695557, "global_step": 181012, "epoch": 4309} {"train_loss": -6.8891682624816895, "global_step": 181013, "epoch": 4309} {"train_loss": -7.036720275878906, "global_step": 181014, "epoch": 4309} {"train_loss": -7.1302361488342285, "global_step": 181015, "epoch": 4309} {"train_loss": -7.060299873352051, "global_step": 181016, "epoch": 4309} {"train_loss": -6.970488548278809, "global_step": 181017, "epoch": 4309} {"train_loss": -7.063539505004883, "global_step": 181018, "epoch": 4309} {"train_loss": -7.111903213319325, "global_step": 181019, "epoch": 4309, "val_loss": 69324.828125} {"train_loss": -7.115146160125732, "global_step": 181020, "epoch": 4310} {"train_loss": -7.12716817855835, "global_step": 181021, "epoch": 4310} {"train_loss": -7.070230960845947, "global_step": 181022, "epoch": 4310} {"train_loss": -7.103604316711426, "global_step": 181023, "epoch": 4310} {"train_loss": -7.107742786407471, "global_step": 181024, "epoch": 4310} {"train_loss": -7.167015075683594, "global_step": 181025, "epoch": 4310} {"train_loss": -7.090979099273682, "global_step": 181026, "epoch": 4310} {"train_loss": -7.248232841491699, "global_step": 181027, "epoch": 4310} {"train_loss": -7.145524978637695, "global_step": 181028, "epoch": 4310} {"train_loss": -7.113837718963623, "global_step": 181029, "epoch": 4310} {"train_loss": -7.134395599365234, "global_step": 181030, "epoch": 4310} {"train_loss": -7.115355491638184, "global_step": 181031, "epoch": 4310} {"train_loss": -7.177163124084473, "global_step": 181032, "epoch": 4310} {"train_loss": -7.114109992980957, "global_step": 181033, "epoch": 4310} {"train_loss": -7.159893989562988, "global_step": 181034, "epoch": 4310} {"train_loss": -7.245464324951172, "global_step": 181035, "epoch": 4310} {"train_loss": -7.137887954711914, "global_step": 181036, "epoch": 4310} {"train_loss": -7.191354751586914, "global_step": 181037, "epoch": 4310} {"train_loss": -7.111699104309082, "global_step": 181038, "epoch": 4310} {"train_loss": -7.107431411743164, "global_step": 181039, "epoch": 4310} {"train_loss": -7.074983596801758, "global_step": 181040, "epoch": 4310} {"train_loss": -7.139044761657715, "global_step": 181041, "epoch": 4310} {"train_loss": -7.182461738586426, "global_step": 181042, "epoch": 4310} {"train_loss": -7.171840667724609, "global_step": 181043, "epoch": 4310} {"train_loss": -7.034963130950928, "global_step": 181044, "epoch": 4310} {"train_loss": -7.175379753112793, "global_step": 181045, "epoch": 4310} {"train_loss": -7.019340515136719, "global_step": 181046, "epoch": 4310} {"train_loss": -7.086606025695801, "global_step": 181047, "epoch": 4310} {"train_loss": -7.120758056640625, "global_step": 181048, "epoch": 4310} {"train_loss": -7.053878307342529, "global_step": 181049, "epoch": 4310} {"train_loss": -6.994997978210449, "global_step": 181050, "epoch": 4310} {"train_loss": -7.066622257232666, "global_step": 181051, "epoch": 4310} {"train_loss": -7.141844749450684, "global_step": 181052, "epoch": 4310} {"train_loss": -7.018052101135254, "global_step": 181053, "epoch": 4310} {"train_loss": -7.020352840423584, "global_step": 181054, "epoch": 4310} {"train_loss": -7.090514659881592, "global_step": 181055, "epoch": 4310} {"train_loss": -7.024050235748291, "global_step": 181056, "epoch": 4310} {"train_loss": -7.015100002288818, "global_step": 181057, "epoch": 4310} {"train_loss": -7.090693950653076, "global_step": 181058, "epoch": 4310} {"train_loss": -6.9724884033203125, "global_step": 181059, "epoch": 4310} {"train_loss": -7.175899505615234, "global_step": 181060, "epoch": 4310} {"train_loss": -7.1090924853370305, "global_step": 181061, "epoch": 4310, "val_loss": 69236.828125} {"train_loss": -7.058465957641602, "global_step": 181062, "epoch": 4311} {"train_loss": -7.098625659942627, "global_step": 181063, "epoch": 4311} {"train_loss": -6.981416702270508, "global_step": 181064, "epoch": 4311} {"train_loss": -7.07304573059082, "global_step": 181065, "epoch": 4311} {"train_loss": -7.003320693969727, "global_step": 181066, "epoch": 4311} {"train_loss": -7.115492820739746, "global_step": 181067, "epoch": 4311} {"train_loss": -7.071927547454834, "global_step": 181068, "epoch": 4311} {"train_loss": -7.044354438781738, "global_step": 181069, "epoch": 4311} {"train_loss": -7.162333965301514, "global_step": 181070, "epoch": 4311} {"train_loss": -7.132062911987305, "global_step": 181071, "epoch": 4311} {"train_loss": -7.169239044189453, "global_step": 181072, "epoch": 4311} {"train_loss": -7.157061576843262, "global_step": 181073, "epoch": 4311} {"train_loss": -7.147904396057129, "global_step": 181074, "epoch": 4311} {"train_loss": -7.052764892578125, "global_step": 181075, "epoch": 4311} {"train_loss": -7.0579962730407715, "global_step": 181076, "epoch": 4311} {"train_loss": -7.103937149047852, "global_step": 181077, "epoch": 4311} {"train_loss": -7.084312438964844, "global_step": 181078, "epoch": 4311} {"train_loss": -7.065549850463867, "global_step": 181079, "epoch": 4311} {"train_loss": -7.127736568450928, "global_step": 181080, "epoch": 4311} {"train_loss": -7.0651702880859375, "global_step": 181081, "epoch": 4311} {"train_loss": -7.126892566680908, "global_step": 181082, "epoch": 4311} {"train_loss": -7.161673545837402, "global_step": 181083, "epoch": 4311} {"train_loss": -7.101090431213379, "global_step": 181084, "epoch": 4311} {"train_loss": -7.035574913024902, "global_step": 181085, "epoch": 4311} {"train_loss": -7.187671661376953, "global_step": 181086, "epoch": 4311} {"train_loss": -7.02665901184082, "global_step": 181087, "epoch": 4311} {"train_loss": -7.209257125854492, "global_step": 181088, "epoch": 4311} {"train_loss": -7.171807765960693, "global_step": 181089, "epoch": 4311} {"train_loss": -7.0779829025268555, "global_step": 181090, "epoch": 4311} {"train_loss": -6.977221965789795, "global_step": 181091, "epoch": 4311} {"train_loss": -7.138324737548828, "global_step": 181092, "epoch": 4311} {"train_loss": -7.110482215881348, "global_step": 181093, "epoch": 4311} {"train_loss": -7.0925188064575195, "global_step": 181094, "epoch": 4311} {"train_loss": -7.107906341552734, "global_step": 181095, "epoch": 4311} {"train_loss": -6.970149040222168, "global_step": 181096, "epoch": 4311} {"train_loss": -6.95390510559082, "global_step": 181097, "epoch": 4311} {"train_loss": -7.081087112426758, "global_step": 181098, "epoch": 4311} {"train_loss": -7.151241779327393, "global_step": 181099, "epoch": 4311} {"train_loss": -7.157524108886719, "global_step": 181100, "epoch": 4311} {"train_loss": -7.128313064575195, "global_step": 181101, "epoch": 4311} {"train_loss": -7.205535411834717, "global_step": 181102, "epoch": 4311} {"train_loss": -7.097681068238758, "global_step": 181103, "epoch": 4311, "val_loss": 69292.9921875} {"train_loss": -7.1243510246276855, "global_step": 181104, "epoch": 4312} {"train_loss": -7.240904808044434, "global_step": 181105, "epoch": 4312} {"train_loss": -7.160382270812988, "global_step": 181106, "epoch": 4312} {"train_loss": -7.088905334472656, "global_step": 181107, "epoch": 4312} {"train_loss": -7.235003471374512, "global_step": 181108, "epoch": 4312} {"train_loss": -7.085367202758789, "global_step": 181109, "epoch": 4312} {"train_loss": -7.120858192443848, "global_step": 181110, "epoch": 4312} {"train_loss": -7.2384419441223145, "global_step": 181111, "epoch": 4312} {"train_loss": -7.174858570098877, "global_step": 181112, "epoch": 4312} {"train_loss": -7.178393363952637, "global_step": 181113, "epoch": 4312} {"train_loss": -7.141406059265137, "global_step": 181114, "epoch": 4312} {"train_loss": -7.169905662536621, "global_step": 181115, "epoch": 4312} {"train_loss": -7.172726631164551, "global_step": 181116, "epoch": 4312} {"train_loss": -7.179001808166504, "global_step": 181117, "epoch": 4312} {"train_loss": -7.14292049407959, "global_step": 181118, "epoch": 4312} {"train_loss": -7.140101432800293, "global_step": 181119, "epoch": 4312} {"train_loss": -7.1248250007629395, "global_step": 181120, "epoch": 4312} {"train_loss": -7.2224907875061035, "global_step": 181121, "epoch": 4312} {"train_loss": -7.098959922790527, "global_step": 181122, "epoch": 4312} {"train_loss": -7.124955654144287, "global_step": 181123, "epoch": 4312} {"train_loss": -7.067383766174316, "global_step": 181124, "epoch": 4312} {"train_loss": -7.0193023681640625, "global_step": 181125, "epoch": 4312} {"train_loss": -7.039009094238281, "global_step": 181126, "epoch": 4312} {"train_loss": -7.052310466766357, "global_step": 181127, "epoch": 4312} {"train_loss": -7.035073757171631, "global_step": 181128, "epoch": 4312} {"train_loss": -7.16440486907959, "global_step": 181129, "epoch": 4312} {"train_loss": -7.131753921508789, "global_step": 181130, "epoch": 4312} {"train_loss": -7.076633930206299, "global_step": 181131, "epoch": 4312} {"train_loss": -7.135128974914551, "global_step": 181132, "epoch": 4312} {"train_loss": -6.996121406555176, "global_step": 181133, "epoch": 4312} {"train_loss": -7.116610527038574, "global_step": 181134, "epoch": 4312} {"train_loss": -7.072505474090576, "global_step": 181135, "epoch": 4312} {"train_loss": -6.991851806640625, "global_step": 181136, "epoch": 4312} {"train_loss": -7.072147846221924, "global_step": 181137, "epoch": 4312} {"train_loss": -7.144829750061035, "global_step": 181138, "epoch": 4312} {"train_loss": -6.9837799072265625, "global_step": 181139, "epoch": 4312} {"train_loss": -7.044337749481201, "global_step": 181140, "epoch": 4312} {"train_loss": -7.098827362060547, "global_step": 181141, "epoch": 4312} {"train_loss": -6.987879753112793, "global_step": 181142, "epoch": 4312} {"train_loss": -7.036012649536133, "global_step": 181143, "epoch": 4312} {"train_loss": -7.024559020996094, "global_step": 181144, "epoch": 4312} {"train_loss": -7.1083957354227705, "global_step": 181145, "epoch": 4312, "val_loss": 69235.125} {"train_loss": -7.056013107299805, "global_step": 181146, "epoch": 4313} {"train_loss": -7.062723159790039, "global_step": 181147, "epoch": 4313} {"train_loss": -7.0912861824035645, "global_step": 181148, "epoch": 4313} {"train_loss": -7.090746879577637, "global_step": 181149, "epoch": 4313} {"train_loss": -7.150362968444824, "global_step": 181150, "epoch": 4313} {"train_loss": -7.112823486328125, "global_step": 181151, "epoch": 4313} {"train_loss": -6.93514347076416, "global_step": 181152, "epoch": 4313} {"train_loss": -7.066600799560547, "global_step": 181153, "epoch": 4313} {"train_loss": -7.119578838348389, "global_step": 181154, "epoch": 4313} {"train_loss": -7.109951019287109, "global_step": 181155, "epoch": 4313} {"train_loss": -7.045065879821777, "global_step": 181156, "epoch": 4313} {"train_loss": -7.120272636413574, "global_step": 181157, "epoch": 4313} {"train_loss": -7.053190231323242, "global_step": 181158, "epoch": 4313} {"train_loss": -7.005627632141113, "global_step": 181159, "epoch": 4313} {"train_loss": -7.12691068649292, "global_step": 181160, "epoch": 4313} {"train_loss": -6.955323219299316, "global_step": 181161, "epoch": 4313} {"train_loss": -7.1418914794921875, "global_step": 181162, "epoch": 4313} {"train_loss": -7.143919944763184, "global_step": 181163, "epoch": 4313} {"train_loss": -7.258511543273926, "global_step": 181164, "epoch": 4313} {"train_loss": -7.155974864959717, "global_step": 181165, "epoch": 4313} {"train_loss": -7.0887017250061035, "global_step": 181166, "epoch": 4313} {"train_loss": -7.1940741539001465, "global_step": 181167, "epoch": 4313} {"train_loss": -7.2128071784973145, "global_step": 181168, "epoch": 4313} {"train_loss": -7.166779041290283, "global_step": 181169, "epoch": 4313} {"train_loss": -7.253992557525635, "global_step": 181170, "epoch": 4313} {"train_loss": -7.03071403503418, "global_step": 181171, "epoch": 4313} {"train_loss": -7.118700981140137, "global_step": 181172, "epoch": 4313} {"train_loss": -7.048592567443848, "global_step": 181173, "epoch": 4313} {"train_loss": -7.132105827331543, "global_step": 181174, "epoch": 4313} {"train_loss": -7.159638404846191, "global_step": 181175, "epoch": 4313} {"train_loss": -7.028364658355713, "global_step": 181176, "epoch": 4313} {"train_loss": -7.079787254333496, "global_step": 181177, "epoch": 4313} {"train_loss": -7.0788164138793945, "global_step": 181178, "epoch": 4313} {"train_loss": -7.244868278503418, "global_step": 181179, "epoch": 4313} {"train_loss": -7.18962287902832, "global_step": 181180, "epoch": 4313} {"train_loss": -7.096872806549072, "global_step": 181181, "epoch": 4313} {"train_loss": -7.111185550689697, "global_step": 181182, "epoch": 4313} {"train_loss": -7.1058220863342285, "global_step": 181183, "epoch": 4313} {"train_loss": -7.125879287719727, "global_step": 181184, "epoch": 4313} {"train_loss": -7.21754264831543, "global_step": 181185, "epoch": 4313} {"train_loss": -7.111273765563965, "global_step": 181186, "epoch": 4313} {"train_loss": -7.112444230488369, "global_step": 181187, "epoch": 4313, "val_loss": 69527.2578125} {"train_loss": -7.251056671142578, "global_step": 181188, "epoch": 4314} {"train_loss": -7.177329063415527, "global_step": 181189, "epoch": 4314} {"train_loss": -7.1045050621032715, "global_step": 181190, "epoch": 4314} {"train_loss": -7.1391191482543945, "global_step": 181191, "epoch": 4314} {"train_loss": -7.098957538604736, "global_step": 181192, "epoch": 4314} {"train_loss": -7.22929573059082, "global_step": 181193, "epoch": 4314} {"train_loss": -7.092228889465332, "global_step": 181194, "epoch": 4314} {"train_loss": -7.10849666595459, "global_step": 181195, "epoch": 4314} {"train_loss": -7.235008239746094, "global_step": 181196, "epoch": 4314} {"train_loss": -7.218062877655029, "global_step": 181197, "epoch": 4314} {"train_loss": -7.148712158203125, "global_step": 181198, "epoch": 4314} {"train_loss": -7.142134189605713, "global_step": 181199, "epoch": 4314} {"train_loss": -7.07560920715332, "global_step": 181200, "epoch": 4314} {"train_loss": -7.1702446937561035, "global_step": 181201, "epoch": 4314} {"train_loss": -7.023270130157471, "global_step": 181202, "epoch": 4314} {"train_loss": -7.091485977172852, "global_step": 181203, "epoch": 4314} {"train_loss": -7.162144184112549, "global_step": 181204, "epoch": 4314} {"train_loss": -7.008275032043457, "global_step": 181205, "epoch": 4314} {"train_loss": -7.07054328918457, "global_step": 181206, "epoch": 4314} {"train_loss": -7.194092750549316, "global_step": 181207, "epoch": 4314} {"train_loss": -6.953108787536621, "global_step": 181208, "epoch": 4314} {"train_loss": -6.967277526855469, "global_step": 181209, "epoch": 4314} {"train_loss": -7.106807708740234, "global_step": 181210, "epoch": 4314} {"train_loss": -7.026000022888184, "global_step": 181211, "epoch": 4314} {"train_loss": -6.99553108215332, "global_step": 181212, "epoch": 4314} {"train_loss": -7.058905601501465, "global_step": 181213, "epoch": 4314} {"train_loss": -6.899937629699707, "global_step": 181214, "epoch": 4314} {"train_loss": -6.894219875335693, "global_step": 181215, "epoch": 4314} {"train_loss": -7.106472015380859, "global_step": 181216, "epoch": 4314} {"train_loss": -6.922667026519775, "global_step": 181217, "epoch": 4314} {"train_loss": -7.05463981628418, "global_step": 181218, "epoch": 4314} {"train_loss": -6.946292877197266, "global_step": 181219, "epoch": 4314} {"train_loss": -6.889203071594238, "global_step": 181220, "epoch": 4314} {"train_loss": -7.006366729736328, "global_step": 181221, "epoch": 4314} {"train_loss": -7.045041561126709, "global_step": 181222, "epoch": 4314} {"train_loss": -7.117952346801758, "global_step": 181223, "epoch": 4314} {"train_loss": -7.040577411651611, "global_step": 181224, "epoch": 4314} {"train_loss": -7.006464004516602, "global_step": 181225, "epoch": 4314} {"train_loss": -7.056037902832031, "global_step": 181226, "epoch": 4314} {"train_loss": -7.088630199432373, "global_step": 181227, "epoch": 4314} {"train_loss": -7.053159713745117, "global_step": 181228, "epoch": 4314} {"train_loss": -7.071936868485951, "global_step": 181229, "epoch": 4314, "val_loss": 69370.0078125} {"train_loss": -7.018632411956787, "global_step": 181230, "epoch": 4315} {"train_loss": -7.077643394470215, "global_step": 181231, "epoch": 4315} {"train_loss": -7.1045684814453125, "global_step": 181232, "epoch": 4315} {"train_loss": -7.056532859802246, "global_step": 181233, "epoch": 4315} {"train_loss": -7.168956279754639, "global_step": 181234, "epoch": 4315} {"train_loss": -7.111776828765869, "global_step": 181235, "epoch": 4315} {"train_loss": -7.1255903244018555, "global_step": 181236, "epoch": 4315} {"train_loss": -7.21737003326416, "global_step": 181237, "epoch": 4315} {"train_loss": -7.106801986694336, "global_step": 181238, "epoch": 4315} {"train_loss": -7.114868640899658, "global_step": 181239, "epoch": 4315} {"train_loss": -7.1097412109375, "global_step": 181240, "epoch": 4315} {"train_loss": -7.118515968322754, "global_step": 181241, "epoch": 4315} {"train_loss": -7.102506637573242, "global_step": 181242, "epoch": 4315} {"train_loss": -6.975305557250977, "global_step": 181243, "epoch": 4315} {"train_loss": -7.170391082763672, "global_step": 181244, "epoch": 4315} {"train_loss": -7.054614067077637, "global_step": 181245, "epoch": 4315} {"train_loss": -6.977823257446289, "global_step": 181246, "epoch": 4315} {"train_loss": -7.137951850891113, "global_step": 181247, "epoch": 4315} {"train_loss": -7.110169410705566, "global_step": 181248, "epoch": 4315} {"train_loss": -7.161993503570557, "global_step": 181249, "epoch": 4315} {"train_loss": -7.018703460693359, "global_step": 181250, "epoch": 4315} {"train_loss": -7.070127964019775, "global_step": 181251, "epoch": 4315} {"train_loss": -7.14114236831665, "global_step": 181252, "epoch": 4315} {"train_loss": -7.082555770874023, "global_step": 181253, "epoch": 4315} {"train_loss": -7.150818824768066, "global_step": 181254, "epoch": 4315} {"train_loss": -7.095519542694092, "global_step": 181255, "epoch": 4315} {"train_loss": -7.066950798034668, "global_step": 181256, "epoch": 4315} {"train_loss": -7.138636112213135, "global_step": 181257, "epoch": 4315} {"train_loss": -6.946858882904053, "global_step": 181258, "epoch": 4315} {"train_loss": -7.085602760314941, "global_step": 181259, "epoch": 4315} {"train_loss": -7.11402702331543, "global_step": 181260, "epoch": 4315} {"train_loss": -7.0935540199279785, "global_step": 181261, "epoch": 4315} {"train_loss": -7.216368675231934, "global_step": 181262, "epoch": 4315} {"train_loss": -7.132843971252441, "global_step": 181263, "epoch": 4315} {"train_loss": -7.208855628967285, "global_step": 181264, "epoch": 4315} {"train_loss": -7.177966594696045, "global_step": 181265, "epoch": 4315} {"train_loss": -7.111248970031738, "global_step": 181266, "epoch": 4315} {"train_loss": -7.201569557189941, "global_step": 181267, "epoch": 4315} {"train_loss": -7.1551408767700195, "global_step": 181268, "epoch": 4315} {"train_loss": -7.095033645629883, "global_step": 181269, "epoch": 4315} {"train_loss": -7.174127101898193, "global_step": 181270, "epoch": 4315} {"train_loss": -7.106128669920421, "global_step": 181271, "epoch": 4315, "val_loss": 69277.875} {"train_loss": -7.130073070526123, "global_step": 181272, "epoch": 4316} {"train_loss": -7.240164756774902, "global_step": 181273, "epoch": 4316} {"train_loss": -7.0806684494018555, "global_step": 181274, "epoch": 4316} {"train_loss": -7.004443168640137, "global_step": 181275, "epoch": 4316} {"train_loss": -7.193668365478516, "global_step": 181276, "epoch": 4316} {"train_loss": -7.051385879516602, "global_step": 181277, "epoch": 4316} {"train_loss": -6.929047584533691, "global_step": 181278, "epoch": 4316} {"train_loss": -6.986438751220703, "global_step": 181279, "epoch": 4316} {"train_loss": -7.10421895980835, "global_step": 181280, "epoch": 4316} {"train_loss": -7.021530628204346, "global_step": 181281, "epoch": 4316} {"train_loss": -7.070449352264404, "global_step": 181282, "epoch": 4316} {"train_loss": -7.035580635070801, "global_step": 181283, "epoch": 4316} {"train_loss": -6.995394706726074, "global_step": 181284, "epoch": 4316} {"train_loss": -7.119399070739746, "global_step": 181285, "epoch": 4316} {"train_loss": -7.147437572479248, "global_step": 181286, "epoch": 4316} {"train_loss": -7.208312034606934, "global_step": 181287, "epoch": 4316} {"train_loss": -7.012694835662842, "global_step": 181288, "epoch": 4316} {"train_loss": -7.142341613769531, "global_step": 181289, "epoch": 4316} {"train_loss": -7.085222244262695, "global_step": 181290, "epoch": 4316} {"train_loss": -7.184927463531494, "global_step": 181291, "epoch": 4316} {"train_loss": -7.036369800567627, "global_step": 181292, "epoch": 4316} {"train_loss": -7.069103717803955, "global_step": 181293, "epoch": 4316} {"train_loss": -7.0574750900268555, "global_step": 181294, "epoch": 4316} {"train_loss": -7.0645928382873535, "global_step": 181295, "epoch": 4316} {"train_loss": -7.146757125854492, "global_step": 181296, "epoch": 4316} {"train_loss": -7.141547203063965, "global_step": 181297, "epoch": 4316} {"train_loss": -7.034643173217773, "global_step": 181298, "epoch": 4316} {"train_loss": -7.184841156005859, "global_step": 181299, "epoch": 4316} {"train_loss": -7.187665939331055, "global_step": 181300, "epoch": 4316} {"train_loss": -7.097556114196777, "global_step": 181301, "epoch": 4316} {"train_loss": -7.127434730529785, "global_step": 181302, "epoch": 4316} {"train_loss": -7.089787483215332, "global_step": 181303, "epoch": 4316} {"train_loss": -7.115609169006348, "global_step": 181304, "epoch": 4316} {"train_loss": -7.188403129577637, "global_step": 181305, "epoch": 4316} {"train_loss": -7.033337593078613, "global_step": 181306, "epoch": 4316} {"train_loss": -7.203885078430176, "global_step": 181307, "epoch": 4316} {"train_loss": -7.057912349700928, "global_step": 181308, "epoch": 4316} {"train_loss": -7.064180374145508, "global_step": 181309, "epoch": 4316} {"train_loss": -7.207566261291504, "global_step": 181310, "epoch": 4316} {"train_loss": -6.980597496032715, "global_step": 181311, "epoch": 4316} {"train_loss": -7.187499046325684, "global_step": 181312, "epoch": 4316} {"train_loss": -7.095399584089007, "global_step": 181313, "epoch": 4316, "val_loss": 69238.515625} {"train_loss": -7.118905067443848, "global_step": 181314, "epoch": 4317} {"train_loss": -6.986898422241211, "global_step": 181315, "epoch": 4317} {"train_loss": -7.153191566467285, "global_step": 181316, "epoch": 4317} {"train_loss": -7.170162677764893, "global_step": 181317, "epoch": 4317} {"train_loss": -7.115951061248779, "global_step": 181318, "epoch": 4317} {"train_loss": -7.263148784637451, "global_step": 181319, "epoch": 4317} {"train_loss": -7.062470436096191, "global_step": 181320, "epoch": 4317} {"train_loss": -7.095326900482178, "global_step": 181321, "epoch": 4317} {"train_loss": -7.150671482086182, "global_step": 181322, "epoch": 4317} {"train_loss": -7.149785995483398, "global_step": 181323, "epoch": 4317} {"train_loss": -7.2198615074157715, "global_step": 181324, "epoch": 4317} {"train_loss": -7.21258544921875, "global_step": 181325, "epoch": 4317} {"train_loss": -7.312935829162598, "global_step": 181326, "epoch": 4317} {"train_loss": -7.268134593963623, "global_step": 181327, "epoch": 4317} {"train_loss": -7.1889567375183105, "global_step": 181328, "epoch": 4317} {"train_loss": -7.050276279449463, "global_step": 181329, "epoch": 4317} {"train_loss": -7.122320652008057, "global_step": 181330, "epoch": 4317} {"train_loss": -7.22562313079834, "global_step": 181331, "epoch": 4317} {"train_loss": -7.080955505371094, "global_step": 181332, "epoch": 4317} {"train_loss": -7.109073638916016, "global_step": 181333, "epoch": 4317} {"train_loss": -7.212573528289795, "global_step": 181334, "epoch": 4317} {"train_loss": -7.188441276550293, "global_step": 181335, "epoch": 4317} {"train_loss": -7.16294002532959, "global_step": 181336, "epoch": 4317} {"train_loss": -7.054669380187988, "global_step": 181337, "epoch": 4317} {"train_loss": -7.161426544189453, "global_step": 181338, "epoch": 4317} {"train_loss": -6.974332332611084, "global_step": 181339, "epoch": 4317} {"train_loss": -7.060146331787109, "global_step": 181340, "epoch": 4317} {"train_loss": -7.21338415145874, "global_step": 181341, "epoch": 4317} {"train_loss": -6.867861747741699, "global_step": 181342, "epoch": 4317} {"train_loss": -7.180403709411621, "global_step": 181343, "epoch": 4317} {"train_loss": -6.996220588684082, "global_step": 181344, "epoch": 4317} {"train_loss": -7.012238502502441, "global_step": 181345, "epoch": 4317} {"train_loss": -7.07143497467041, "global_step": 181346, "epoch": 4317} {"train_loss": -6.748504638671875, "global_step": 181347, "epoch": 4317} {"train_loss": -7.117593288421631, "global_step": 181348, "epoch": 4317} {"train_loss": -6.964968681335449, "global_step": 181349, "epoch": 4317} {"train_loss": -7.020049095153809, "global_step": 181350, "epoch": 4317} {"train_loss": -6.9547505378723145, "global_step": 181351, "epoch": 4317} {"train_loss": -7.024117469787598, "global_step": 181352, "epoch": 4317} {"train_loss": -7.02094841003418, "global_step": 181353, "epoch": 4317} {"train_loss": -7.034751892089844, "global_step": 181354, "epoch": 4317} {"train_loss": -7.101554302942185, "global_step": 181355, "epoch": 4317, "val_loss": 69592.75} {"train_loss": -7.036019802093506, "global_step": 181356, "epoch": 4318} {"train_loss": -7.032357215881348, "global_step": 181357, "epoch": 4318} {"train_loss": -7.030437469482422, "global_step": 181358, "epoch": 4318} {"train_loss": -7.103525161743164, "global_step": 181359, "epoch": 4318} {"train_loss": -7.01751708984375, "global_step": 181360, "epoch": 4318} {"train_loss": -7.093595504760742, "global_step": 181361, "epoch": 4318} {"train_loss": -7.031987190246582, "global_step": 181362, "epoch": 4318} {"train_loss": -7.104450225830078, "global_step": 181363, "epoch": 4318} {"train_loss": -7.009264945983887, "global_step": 181364, "epoch": 4318} {"train_loss": -7.164812088012695, "global_step": 181365, "epoch": 4318} {"train_loss": -7.064726829528809, "global_step": 181366, "epoch": 4318} {"train_loss": -7.1275315284729, "global_step": 181367, "epoch": 4318} {"train_loss": -6.9380269050598145, "global_step": 181368, "epoch": 4318} {"train_loss": -6.955188274383545, "global_step": 181369, "epoch": 4318} {"train_loss": -7.08000373840332, "global_step": 181370, "epoch": 4318} {"train_loss": -7.160444736480713, "global_step": 181371, "epoch": 4318} {"train_loss": -6.9893646240234375, "global_step": 181372, "epoch": 4318} {"train_loss": -6.977692604064941, "global_step": 181373, "epoch": 4318} {"train_loss": -7.07966423034668, "global_step": 181374, "epoch": 4318} {"train_loss": -7.0164642333984375, "global_step": 181375, "epoch": 4318} {"train_loss": -7.01631498336792, "global_step": 181376, "epoch": 4318} {"train_loss": -7.173959732055664, "global_step": 181377, "epoch": 4318} {"train_loss": -7.169798851013184, "global_step": 181378, "epoch": 4318} {"train_loss": -6.891951560974121, "global_step": 181379, "epoch": 4318} {"train_loss": -7.074321746826172, "global_step": 181380, "epoch": 4318} {"train_loss": -7.049098014831543, "global_step": 181381, "epoch": 4318} {"train_loss": -7.063094615936279, "global_step": 181382, "epoch": 4318} {"train_loss": -6.9868292808532715, "global_step": 181383, "epoch": 4318} {"train_loss": -7.003842353820801, "global_step": 181384, "epoch": 4318} {"train_loss": -7.093886375427246, "global_step": 181385, "epoch": 4318} {"train_loss": -6.820415496826172, "global_step": 181386, "epoch": 4318} {"train_loss": -7.031403541564941, "global_step": 181387, "epoch": 4318} {"train_loss": -6.909963607788086, "global_step": 181388, "epoch": 4318} {"train_loss": -6.986347198486328, "global_step": 181389, "epoch": 4318} {"train_loss": -7.043391704559326, "global_step": 181390, "epoch": 4318} {"train_loss": -6.968326568603516, "global_step": 181391, "epoch": 4318} {"train_loss": -6.99395227432251, "global_step": 181392, "epoch": 4318} {"train_loss": -6.887707710266113, "global_step": 181393, "epoch": 4318} {"train_loss": -7.006922245025635, "global_step": 181394, "epoch": 4318} {"train_loss": -6.972540378570557, "global_step": 181395, "epoch": 4318} {"train_loss": -7.002493858337402, "global_step": 181396, "epoch": 4318} {"train_loss": -7.02831845056443, "global_step": 181397, "epoch": 4318, "val_loss": 69462.4140625} {"train_loss": -6.965723037719727, "global_step": 181398, "epoch": 4319} {"train_loss": -7.020602226257324, "global_step": 181399, "epoch": 4319} {"train_loss": -7.070004463195801, "global_step": 181400, "epoch": 4319} {"train_loss": -6.997673034667969, "global_step": 181401, "epoch": 4319} {"train_loss": -6.999070644378662, "global_step": 181402, "epoch": 4319} {"train_loss": -7.039325714111328, "global_step": 181403, "epoch": 4319} {"train_loss": -7.080268859863281, "global_step": 181404, "epoch": 4319} {"train_loss": -6.971547603607178, "global_step": 181405, "epoch": 4319} {"train_loss": -6.978213787078857, "global_step": 181406, "epoch": 4319} {"train_loss": -7.056164264678955, "global_step": 181407, "epoch": 4319} {"train_loss": -6.943037986755371, "global_step": 181408, "epoch": 4319} {"train_loss": -7.014805793762207, "global_step": 181409, "epoch": 4319} {"train_loss": -7.122200965881348, "global_step": 181410, "epoch": 4319} {"train_loss": -7.099492073059082, "global_step": 181411, "epoch": 4319} {"train_loss": -7.126898765563965, "global_step": 181412, "epoch": 4319} {"train_loss": -7.174617767333984, "global_step": 181413, "epoch": 4319} {"train_loss": -7.165951728820801, "global_step": 181414, "epoch": 4319} {"train_loss": -7.1261444091796875, "global_step": 181415, "epoch": 4319} {"train_loss": -7.1818528175354, "global_step": 181416, "epoch": 4319} {"train_loss": -7.149356842041016, "global_step": 181417, "epoch": 4319} {"train_loss": -7.110285758972168, "global_step": 181418, "epoch": 4319} {"train_loss": -7.082206726074219, "global_step": 181419, "epoch": 4319} {"train_loss": -7.12747049331665, "global_step": 181420, "epoch": 4319} {"train_loss": -7.191265106201172, "global_step": 181421, "epoch": 4319} {"train_loss": -7.105813026428223, "global_step": 181422, "epoch": 4319} {"train_loss": -7.156661033630371, "global_step": 181423, "epoch": 4319} {"train_loss": -7.102102279663086, "global_step": 181424, "epoch": 4319} {"train_loss": -7.193591117858887, "global_step": 181425, "epoch": 4319} {"train_loss": -7.146346092224121, "global_step": 181426, "epoch": 4319} {"train_loss": -7.1041975021362305, "global_step": 181427, "epoch": 4319} {"train_loss": -7.193262100219727, "global_step": 181428, "epoch": 4319} {"train_loss": -7.202975749969482, "global_step": 181429, "epoch": 4319} {"train_loss": -7.195700168609619, "global_step": 181430, "epoch": 4319} {"train_loss": -7.234653472900391, "global_step": 181431, "epoch": 4319} {"train_loss": -7.249769687652588, "global_step": 181432, "epoch": 4319} {"train_loss": -7.23820161819458, "global_step": 181433, "epoch": 4319} {"train_loss": -7.1035990715026855, "global_step": 181434, "epoch": 4319} {"train_loss": -7.139764785766602, "global_step": 181435, "epoch": 4319} {"train_loss": -7.100029468536377, "global_step": 181436, "epoch": 4319} {"train_loss": -7.264671802520752, "global_step": 181437, "epoch": 4319} {"train_loss": -7.202160358428955, "global_step": 181438, "epoch": 4319} {"train_loss": -7.116075050263178, "global_step": 181439, "epoch": 4319, "val_loss": 69182.0546875} {"train_loss": -7.116689682006836, "global_step": 181440, "epoch": 4320} {"train_loss": -7.135408401489258, "global_step": 181441, "epoch": 4320} {"train_loss": -7.012316703796387, "global_step": 181442, "epoch": 4320} {"train_loss": -7.274223327636719, "global_step": 181443, "epoch": 4320} {"train_loss": -7.132099151611328, "global_step": 181444, "epoch": 4320} {"train_loss": -7.013881206512451, "global_step": 181445, "epoch": 4320} {"train_loss": -7.145881175994873, "global_step": 181446, "epoch": 4320} {"train_loss": -7.094677448272705, "global_step": 181447, "epoch": 4320} {"train_loss": -6.935904502868652, "global_step": 181448, "epoch": 4320} {"train_loss": -7.21768045425415, "global_step": 181449, "epoch": 4320} {"train_loss": -7.200735092163086, "global_step": 181450, "epoch": 4320} {"train_loss": -7.161552429199219, "global_step": 181451, "epoch": 4320} {"train_loss": -7.1166157722473145, "global_step": 181452, "epoch": 4320} {"train_loss": -7.130178928375244, "global_step": 181453, "epoch": 4320} {"train_loss": -7.043642520904541, "global_step": 181454, "epoch": 4320} {"train_loss": -7.233734130859375, "global_step": 181455, "epoch": 4320} {"train_loss": -7.0906982421875, "global_step": 181456, "epoch": 4320} {"train_loss": -7.043385028839111, "global_step": 181457, "epoch": 4320} {"train_loss": -7.153871536254883, "global_step": 181458, "epoch": 4320} {"train_loss": -6.919042587280273, "global_step": 181459, "epoch": 4320} {"train_loss": -7.091926574707031, "global_step": 181460, "epoch": 4320} {"train_loss": -7.0861382484436035, "global_step": 181461, "epoch": 4320} {"train_loss": -7.132444858551025, "global_step": 181462, "epoch": 4320} {"train_loss": -7.1832427978515625, "global_step": 181463, "epoch": 4320} {"train_loss": -7.040952682495117, "global_step": 181464, "epoch": 4320} {"train_loss": -7.187370300292969, "global_step": 181465, "epoch": 4320} {"train_loss": -7.14988374710083, "global_step": 181466, "epoch": 4320} {"train_loss": -7.105715274810791, "global_step": 181467, "epoch": 4320} {"train_loss": -7.194377422332764, "global_step": 181468, "epoch": 4320} {"train_loss": -7.082546710968018, "global_step": 181469, "epoch": 4320} {"train_loss": -7.11985969543457, "global_step": 181470, "epoch": 4320} {"train_loss": -7.152870178222656, "global_step": 181471, "epoch": 4320} {"train_loss": -6.994876861572266, "global_step": 181472, "epoch": 4320} {"train_loss": -7.056406497955322, "global_step": 181473, "epoch": 4320} {"train_loss": -7.1766815185546875, "global_step": 181474, "epoch": 4320} {"train_loss": -7.124547004699707, "global_step": 181475, "epoch": 4320} {"train_loss": -7.018339157104492, "global_step": 181476, "epoch": 4320} {"train_loss": -7.260065078735352, "global_step": 181477, "epoch": 4320} {"train_loss": -7.129502296447754, "global_step": 181478, "epoch": 4320} {"train_loss": -7.0671186447143555, "global_step": 181479, "epoch": 4320} {"train_loss": -7.16655158996582, "global_step": 181480, "epoch": 4320} {"train_loss": -7.112828368232364, "global_step": 181481, "epoch": 4320, "val_loss": 69163.3125} {"train_loss": -7.12241792678833, "global_step": 181482, "epoch": 4321} {"train_loss": -7.132017135620117, "global_step": 181483, "epoch": 4321} {"train_loss": -7.030641078948975, "global_step": 181484, "epoch": 4321} {"train_loss": -6.996574878692627, "global_step": 181485, "epoch": 4321} {"train_loss": -7.083654880523682, "global_step": 181486, "epoch": 4321} {"train_loss": -7.053702354431152, "global_step": 181487, "epoch": 4321} {"train_loss": -7.119456768035889, "global_step": 181488, "epoch": 4321} {"train_loss": -7.023797035217285, "global_step": 181489, "epoch": 4321} {"train_loss": -6.902648448944092, "global_step": 181490, "epoch": 4321} {"train_loss": -7.088594436645508, "global_step": 181491, "epoch": 4321} {"train_loss": -7.0428385734558105, "global_step": 181492, "epoch": 4321} {"train_loss": -7.175759792327881, "global_step": 181493, "epoch": 4321} {"train_loss": -7.0460100173950195, "global_step": 181494, "epoch": 4321} {"train_loss": -7.088789939880371, "global_step": 181495, "epoch": 4321} {"train_loss": -7.013650894165039, "global_step": 181496, "epoch": 4321} {"train_loss": -6.995589733123779, "global_step": 181497, "epoch": 4321} {"train_loss": -7.213929653167725, "global_step": 181498, "epoch": 4321} {"train_loss": -6.987916946411133, "global_step": 181499, "epoch": 4321} {"train_loss": -7.0989789962768555, "global_step": 181500, "epoch": 4321} {"train_loss": -7.0551958084106445, "global_step": 181501, "epoch": 4321} {"train_loss": -7.1409077644348145, "global_step": 181502, "epoch": 4321} {"train_loss": -7.0865583419799805, "global_step": 181503, "epoch": 4321} {"train_loss": -7.037755489349365, "global_step": 181504, "epoch": 4321} {"train_loss": -7.0248212814331055, "global_step": 181505, "epoch": 4321} {"train_loss": -7.135610580444336, "global_step": 181506, "epoch": 4321} {"train_loss": -7.079477787017822, "global_step": 181507, "epoch": 4321} {"train_loss": -7.087366580963135, "global_step": 181508, "epoch": 4321} {"train_loss": -7.106257438659668, "global_step": 181509, "epoch": 4321} {"train_loss": -7.138484954833984, "global_step": 181510, "epoch": 4321} {"train_loss": -7.194004058837891, "global_step": 181511, "epoch": 4321} {"train_loss": -7.100563049316406, "global_step": 181512, "epoch": 4321} {"train_loss": -7.067248821258545, "global_step": 181513, "epoch": 4321} {"train_loss": -7.103304862976074, "global_step": 181514, "epoch": 4321} {"train_loss": -7.1020097732543945, "global_step": 181515, "epoch": 4321} {"train_loss": -7.060972213745117, "global_step": 181516, "epoch": 4321} {"train_loss": -7.149549961090088, "global_step": 181517, "epoch": 4321} {"train_loss": -7.116174697875977, "global_step": 181518, "epoch": 4321} {"train_loss": -7.184241771697998, "global_step": 181519, "epoch": 4321} {"train_loss": -7.117631912231445, "global_step": 181520, "epoch": 4321} {"train_loss": -7.060986042022705, "global_step": 181521, "epoch": 4321} {"train_loss": -7.229240417480469, "global_step": 181522, "epoch": 4321} {"train_loss": -7.089678866522653, "global_step": 181523, "epoch": 4321, "val_loss": 69186.1484375} {"train_loss": -7.106716632843018, "global_step": 181524, "epoch": 4322} {"train_loss": -7.133829116821289, "global_step": 181525, "epoch": 4322} {"train_loss": -7.146734714508057, "global_step": 181526, "epoch": 4322} {"train_loss": -7.027471542358398, "global_step": 181527, "epoch": 4322} {"train_loss": -7.1758599281311035, "global_step": 181528, "epoch": 4322} {"train_loss": -7.086794376373291, "global_step": 181529, "epoch": 4322} {"train_loss": -7.204632759094238, "global_step": 181530, "epoch": 4322} {"train_loss": -7.094290733337402, "global_step": 181531, "epoch": 4322} {"train_loss": -6.981647968292236, "global_step": 181532, "epoch": 4322} {"train_loss": -7.075738906860352, "global_step": 181533, "epoch": 4322} {"train_loss": -7.139723777770996, "global_step": 181534, "epoch": 4322} {"train_loss": -7.144439220428467, "global_step": 181535, "epoch": 4322} {"train_loss": -7.137365818023682, "global_step": 181536, "epoch": 4322} {"train_loss": -7.1830949783325195, "global_step": 181537, "epoch": 4322} {"train_loss": -7.113112449645996, "global_step": 181538, "epoch": 4322} {"train_loss": -7.065956115722656, "global_step": 181539, "epoch": 4322} {"train_loss": -7.095921993255615, "global_step": 181540, "epoch": 4322} {"train_loss": -7.250496864318848, "global_step": 181541, "epoch": 4322} {"train_loss": -7.077879905700684, "global_step": 181542, "epoch": 4322} {"train_loss": -7.180221080780029, "global_step": 181543, "epoch": 4322} {"train_loss": -7.212767601013184, "global_step": 181544, "epoch": 4322} {"train_loss": -7.210720062255859, "global_step": 181545, "epoch": 4322} {"train_loss": -7.196999549865723, "global_step": 181546, "epoch": 4322} {"train_loss": -7.188781261444092, "global_step": 181547, "epoch": 4322} {"train_loss": -7.205003261566162, "global_step": 181548, "epoch": 4322} {"train_loss": -7.168008327484131, "global_step": 181549, "epoch": 4322} {"train_loss": -7.260004043579102, "global_step": 181550, "epoch": 4322} {"train_loss": -7.130319118499756, "global_step": 181551, "epoch": 4322} {"train_loss": -7.1260576248168945, "global_step": 181552, "epoch": 4322} {"train_loss": -7.259977340698242, "global_step": 181553, "epoch": 4322} {"train_loss": -7.167763710021973, "global_step": 181554, "epoch": 4322} {"train_loss": -7.140397548675537, "global_step": 181555, "epoch": 4322} {"train_loss": -7.0861124992370605, "global_step": 181556, "epoch": 4322} {"train_loss": -7.256199836730957, "global_step": 181557, "epoch": 4322} {"train_loss": -7.161113739013672, "global_step": 181558, "epoch": 4322} {"train_loss": -7.245240211486816, "global_step": 181559, "epoch": 4322} {"train_loss": -7.144228458404541, "global_step": 181560, "epoch": 4322} {"train_loss": -7.144992351531982, "global_step": 181561, "epoch": 4322} {"train_loss": -7.148881912231445, "global_step": 181562, "epoch": 4322} {"train_loss": -7.146785736083984, "global_step": 181563, "epoch": 4322} {"train_loss": -7.200965881347656, "global_step": 181564, "epoch": 4322} {"train_loss": -7.1515622820172995, "global_step": 181565, "epoch": 4322, "val_loss": 69276.9453125} {"train_loss": -7.206153869628906, "global_step": 181566, "epoch": 4323} {"train_loss": -7.110018253326416, "global_step": 181567, "epoch": 4323} {"train_loss": -7.047883987426758, "global_step": 181568, "epoch": 4323} {"train_loss": -7.104034423828125, "global_step": 181569, "epoch": 4323} {"train_loss": -7.077822208404541, "global_step": 181570, "epoch": 4323} {"train_loss": -6.914725303649902, "global_step": 181571, "epoch": 4323} {"train_loss": -6.975419044494629, "global_step": 181572, "epoch": 4323} {"train_loss": -7.0498504638671875, "global_step": 181573, "epoch": 4323} {"train_loss": -6.8285813331604, "global_step": 181574, "epoch": 4323} {"train_loss": -7.047123908996582, "global_step": 181575, "epoch": 4323} {"train_loss": -7.014889717102051, "global_step": 181576, "epoch": 4323} {"train_loss": -6.94826602935791, "global_step": 181577, "epoch": 4323} {"train_loss": -6.903942584991455, "global_step": 181578, "epoch": 4323} {"train_loss": -6.977569103240967, "global_step": 181579, "epoch": 4323} {"train_loss": -7.102585792541504, "global_step": 181580, "epoch": 4323} {"train_loss": -6.92413330078125, "global_step": 181581, "epoch": 4323} {"train_loss": -7.023382186889648, "global_step": 181582, "epoch": 4323} {"train_loss": -6.914193153381348, "global_step": 181583, "epoch": 4323} {"train_loss": -7.1108479499816895, "global_step": 181584, "epoch": 4323} {"train_loss": -7.065310478210449, "global_step": 181585, "epoch": 4323} {"train_loss": -7.0260725021362305, "global_step": 181586, "epoch": 4323} {"train_loss": -7.09334135055542, "global_step": 181587, "epoch": 4323} {"train_loss": -7.123833656311035, "global_step": 181588, "epoch": 4323} {"train_loss": -6.981720924377441, "global_step": 181589, "epoch": 4323} {"train_loss": -7.171349048614502, "global_step": 181590, "epoch": 4323} {"train_loss": -7.013530731201172, "global_step": 181591, "epoch": 4323} {"train_loss": -7.005631446838379, "global_step": 181592, "epoch": 4323} {"train_loss": -7.060873508453369, "global_step": 181593, "epoch": 4323} {"train_loss": -6.972784519195557, "global_step": 181594, "epoch": 4323} {"train_loss": -6.973105430603027, "global_step": 181595, "epoch": 4323} {"train_loss": -7.103116035461426, "global_step": 181596, "epoch": 4323} {"train_loss": -6.913153648376465, "global_step": 181597, "epoch": 4323} {"train_loss": -6.985663414001465, "global_step": 181598, "epoch": 4323} {"train_loss": -7.042524814605713, "global_step": 181599, "epoch": 4323} {"train_loss": -6.991119861602783, "global_step": 181600, "epoch": 4323} {"train_loss": -7.009405136108398, "global_step": 181601, "epoch": 4323} {"train_loss": -7.099249839782715, "global_step": 181602, "epoch": 4323} {"train_loss": -6.960429668426514, "global_step": 181603, "epoch": 4323} {"train_loss": -7.023563385009766, "global_step": 181604, "epoch": 4323} {"train_loss": -7.061872482299805, "global_step": 181605, "epoch": 4323} {"train_loss": -7.093421936035156, "global_step": 181606, "epoch": 4323} {"train_loss": -7.022774389811924, "global_step": 181607, "epoch": 4323, "val_loss": 69451.578125} {"train_loss": -7.197203636169434, "global_step": 181608, "epoch": 4324} {"train_loss": -7.05744743347168, "global_step": 181609, "epoch": 4324} {"train_loss": -7.104137420654297, "global_step": 181610, "epoch": 4324} {"train_loss": -7.069279193878174, "global_step": 181611, "epoch": 4324} {"train_loss": -7.101445198059082, "global_step": 181612, "epoch": 4324} {"train_loss": -7.052630424499512, "global_step": 181613, "epoch": 4324} {"train_loss": -7.05155086517334, "global_step": 181614, "epoch": 4324} {"train_loss": -7.117377281188965, "global_step": 181615, "epoch": 4324} {"train_loss": -7.200742721557617, "global_step": 181616, "epoch": 4324} {"train_loss": -7.056332588195801, "global_step": 181617, "epoch": 4324} {"train_loss": -7.130308628082275, "global_step": 181618, "epoch": 4324} {"train_loss": -7.0126190185546875, "global_step": 181619, "epoch": 4324} {"train_loss": -7.1260199546813965, "global_step": 181620, "epoch": 4324} {"train_loss": -7.1702680587768555, "global_step": 181621, "epoch": 4324} {"train_loss": -7.07940149307251, "global_step": 181622, "epoch": 4324} {"train_loss": -7.207428455352783, "global_step": 181623, "epoch": 4324} {"train_loss": -7.10585880279541, "global_step": 181624, "epoch": 4324} {"train_loss": -7.188109397888184, "global_step": 181625, "epoch": 4324} {"train_loss": -7.058262825012207, "global_step": 181626, "epoch": 4324} {"train_loss": -7.191737174987793, "global_step": 181627, "epoch": 4324} {"train_loss": -7.2387895584106445, "global_step": 181628, "epoch": 4324} {"train_loss": -7.025301933288574, "global_step": 181629, "epoch": 4324} {"train_loss": -7.132493495941162, "global_step": 181630, "epoch": 4324} {"train_loss": -6.951033115386963, "global_step": 181631, "epoch": 4324} {"train_loss": -7.166563510894775, "global_step": 181632, "epoch": 4324} {"train_loss": -7.304437160491943, "global_step": 181633, "epoch": 4324} {"train_loss": -7.290517807006836, "global_step": 181634, "epoch": 4324} {"train_loss": -7.162062644958496, "global_step": 181635, "epoch": 4324} {"train_loss": -7.128904819488525, "global_step": 181636, "epoch": 4324} {"train_loss": -7.149853706359863, "global_step": 181637, "epoch": 4324} {"train_loss": -7.153411388397217, "global_step": 181638, "epoch": 4324} {"train_loss": -7.181729316711426, "global_step": 181639, "epoch": 4324} {"train_loss": -7.144629001617432, "global_step": 181640, "epoch": 4324} {"train_loss": -7.239939212799072, "global_step": 181641, "epoch": 4324} {"train_loss": -7.26005744934082, "global_step": 181642, "epoch": 4324} {"train_loss": -7.208836555480957, "global_step": 181643, "epoch": 4324} {"train_loss": -7.292680740356445, "global_step": 181644, "epoch": 4324} {"train_loss": -7.199845790863037, "global_step": 181645, "epoch": 4324} {"train_loss": -7.258272647857666, "global_step": 181646, "epoch": 4324} {"train_loss": -7.333633899688721, "global_step": 181647, "epoch": 4324} {"train_loss": -7.226958274841309, "global_step": 181648, "epoch": 4324} {"train_loss": -7.156510693686349, "global_step": 181649, "epoch": 4324, "val_loss": 69351.3203125} {"train_loss": -7.266395568847656, "global_step": 181650, "epoch": 4325} {"train_loss": -7.282730579376221, "global_step": 181651, "epoch": 4325} {"train_loss": -7.201441764831543, "global_step": 181652, "epoch": 4325} {"train_loss": -7.10251522064209, "global_step": 181653, "epoch": 4325} {"train_loss": -7.129819393157959, "global_step": 181654, "epoch": 4325} {"train_loss": -7.152990341186523, "global_step": 181655, "epoch": 4325} {"train_loss": -7.084964752197266, "global_step": 181656, "epoch": 4325} {"train_loss": -7.1631903648376465, "global_step": 181657, "epoch": 4325} {"train_loss": -7.164045333862305, "global_step": 181658, "epoch": 4325} {"train_loss": -7.1403350830078125, "global_step": 181659, "epoch": 4325} {"train_loss": -7.0838446617126465, "global_step": 181660, "epoch": 4325} {"train_loss": -7.122937202453613, "global_step": 181661, "epoch": 4325} {"train_loss": -7.0664801597595215, "global_step": 181662, "epoch": 4325} {"train_loss": -7.159912109375, "global_step": 181663, "epoch": 4325} {"train_loss": -7.075005531311035, "global_step": 181664, "epoch": 4325} {"train_loss": -7.18585205078125, "global_step": 181665, "epoch": 4325} {"train_loss": -7.252973556518555, "global_step": 181666, "epoch": 4325} {"train_loss": -7.182710647583008, "global_step": 181667, "epoch": 4325} {"train_loss": -7.060672760009766, "global_step": 181668, "epoch": 4325} {"train_loss": -7.179807186126709, "global_step": 181669, "epoch": 4325} {"train_loss": -7.094490051269531, "global_step": 181670, "epoch": 4325} {"train_loss": -7.15423059463501, "global_step": 181671, "epoch": 4325} {"train_loss": -7.227784156799316, "global_step": 181672, "epoch": 4325} {"train_loss": -7.168613433837891, "global_step": 181673, "epoch": 4325} {"train_loss": -7.0360798835754395, "global_step": 181674, "epoch": 4325} {"train_loss": -7.173402786254883, "global_step": 181675, "epoch": 4325} {"train_loss": -7.13594913482666, "global_step": 181676, "epoch": 4325} {"train_loss": -7.080543518066406, "global_step": 181677, "epoch": 4325} {"train_loss": -7.045331954956055, "global_step": 181678, "epoch": 4325} {"train_loss": -7.0928874015808105, "global_step": 181679, "epoch": 4325} {"train_loss": -6.972489356994629, "global_step": 181680, "epoch": 4325} {"train_loss": -7.169942855834961, "global_step": 181681, "epoch": 4325} {"train_loss": -7.106180191040039, "global_step": 181682, "epoch": 4325} {"train_loss": -7.068542957305908, "global_step": 181683, "epoch": 4325} {"train_loss": -7.1997833251953125, "global_step": 181684, "epoch": 4325} {"train_loss": -7.0915751457214355, "global_step": 181685, "epoch": 4325} {"train_loss": -7.1171674728393555, "global_step": 181686, "epoch": 4325} {"train_loss": -7.07002592086792, "global_step": 181687, "epoch": 4325} {"train_loss": -7.0656914710998535, "global_step": 181688, "epoch": 4325} {"train_loss": -6.997283458709717, "global_step": 181689, "epoch": 4325} {"train_loss": -7.059004306793213, "global_step": 181690, "epoch": 4325} {"train_loss": -7.124246937888009, "global_step": 181691, "epoch": 4325, "val_loss": 69367.515625} {"train_loss": -7.045754432678223, "global_step": 181692, "epoch": 4326} {"train_loss": -7.108808517456055, "global_step": 181693, "epoch": 4326} {"train_loss": -7.0022172927856445, "global_step": 181694, "epoch": 4326} {"train_loss": -6.9726762771606445, "global_step": 181695, "epoch": 4326} {"train_loss": -6.993554592132568, "global_step": 181696, "epoch": 4326} {"train_loss": -6.9679718017578125, "global_step": 181697, "epoch": 4326} {"train_loss": -7.095396995544434, "global_step": 181698, "epoch": 4326} {"train_loss": -6.99882698059082, "global_step": 181699, "epoch": 4326} {"train_loss": -6.986737251281738, "global_step": 181700, "epoch": 4326} {"train_loss": -6.949221611022949, "global_step": 181701, "epoch": 4326} {"train_loss": -6.988777160644531, "global_step": 181702, "epoch": 4326} {"train_loss": -7.027861595153809, "global_step": 181703, "epoch": 4326} {"train_loss": -7.0134758949279785, "global_step": 181704, "epoch": 4326} {"train_loss": -7.008312702178955, "global_step": 181705, "epoch": 4326} {"train_loss": -7.018962383270264, "global_step": 181706, "epoch": 4326} {"train_loss": -7.125661373138428, "global_step": 181707, "epoch": 4326} {"train_loss": -7.0272216796875, "global_step": 181708, "epoch": 4326} {"train_loss": -7.069910049438477, "global_step": 181709, "epoch": 4326} {"train_loss": -7.056187629699707, "global_step": 181710, "epoch": 4326} {"train_loss": -6.961687088012695, "global_step": 181711, "epoch": 4326} {"train_loss": -7.060445308685303, "global_step": 181712, "epoch": 4326} {"train_loss": -7.035686016082764, "global_step": 181713, "epoch": 4326} {"train_loss": -6.91474723815918, "global_step": 181714, "epoch": 4326} {"train_loss": -6.96236515045166, "global_step": 181715, "epoch": 4326} {"train_loss": -7.087507724761963, "global_step": 181716, "epoch": 4326} {"train_loss": -7.097973346710205, "global_step": 181717, "epoch": 4326} {"train_loss": -7.0058913230896, "global_step": 181718, "epoch": 4326} {"train_loss": -7.051698684692383, "global_step": 181719, "epoch": 4326} {"train_loss": -7.179322719573975, "global_step": 181720, "epoch": 4326} {"train_loss": -7.120413780212402, "global_step": 181721, "epoch": 4326} {"train_loss": -7.121875762939453, "global_step": 181722, "epoch": 4326} {"train_loss": -7.01701545715332, "global_step": 181723, "epoch": 4326} {"train_loss": -7.125059127807617, "global_step": 181724, "epoch": 4326} {"train_loss": -7.106656551361084, "global_step": 181725, "epoch": 4326} {"train_loss": -7.019905090332031, "global_step": 181726, "epoch": 4326} {"train_loss": -7.147916793823242, "global_step": 181727, "epoch": 4326} {"train_loss": -6.97700309753418, "global_step": 181728, "epoch": 4326} {"train_loss": -7.124764442443848, "global_step": 181729, "epoch": 4326} {"train_loss": -7.154170989990234, "global_step": 181730, "epoch": 4326} {"train_loss": -7.128873348236084, "global_step": 181731, "epoch": 4326} {"train_loss": -7.125851631164551, "global_step": 181732, "epoch": 4326} {"train_loss": -7.046488353184292, "global_step": 181733, "epoch": 4326, "val_loss": 69332.4765625} {"train_loss": -7.117165565490723, "global_step": 181734, "epoch": 4327} {"train_loss": -7.203989028930664, "global_step": 181735, "epoch": 4327} {"train_loss": -7.091268539428711, "global_step": 181736, "epoch": 4327} {"train_loss": -7.119672775268555, "global_step": 181737, "epoch": 4327} {"train_loss": -7.140127182006836, "global_step": 181738, "epoch": 4327} {"train_loss": -7.132335662841797, "global_step": 181739, "epoch": 4327} {"train_loss": -7.184168815612793, "global_step": 181740, "epoch": 4327} {"train_loss": -7.128258228302002, "global_step": 181741, "epoch": 4327} {"train_loss": -7.051426410675049, "global_step": 181742, "epoch": 4327} {"train_loss": -7.015625476837158, "global_step": 181743, "epoch": 4327} {"train_loss": -7.202466011047363, "global_step": 181744, "epoch": 4327} {"train_loss": -7.153294563293457, "global_step": 181745, "epoch": 4327} {"train_loss": -7.198024749755859, "global_step": 181746, "epoch": 4327} {"train_loss": -7.211197853088379, "global_step": 181747, "epoch": 4327} {"train_loss": -7.142063140869141, "global_step": 181748, "epoch": 4327} {"train_loss": -7.10230827331543, "global_step": 181749, "epoch": 4327} {"train_loss": -7.241087913513184, "global_step": 181750, "epoch": 4327} {"train_loss": -7.223273277282715, "global_step": 181751, "epoch": 4327} {"train_loss": -7.145642280578613, "global_step": 181752, "epoch": 4327} {"train_loss": -7.107446670532227, "global_step": 181753, "epoch": 4327} {"train_loss": -7.157948970794678, "global_step": 181754, "epoch": 4327} {"train_loss": -7.2154221534729, "global_step": 181755, "epoch": 4327} {"train_loss": -6.926591396331787, "global_step": 181756, "epoch": 4327} {"train_loss": -7.098050594329834, "global_step": 181757, "epoch": 4327} {"train_loss": -7.007726669311523, "global_step": 181758, "epoch": 4327} {"train_loss": -7.054771423339844, "global_step": 181759, "epoch": 4327} {"train_loss": -7.133481025695801, "global_step": 181760, "epoch": 4327} {"train_loss": -7.087685585021973, "global_step": 181761, "epoch": 4327} {"train_loss": -7.0600481033325195, "global_step": 181762, "epoch": 4327} {"train_loss": -7.13528299331665, "global_step": 181763, "epoch": 4327} {"train_loss": -6.940743923187256, "global_step": 181764, "epoch": 4327} {"train_loss": -7.038417816162109, "global_step": 181765, "epoch": 4327} {"train_loss": -7.067897319793701, "global_step": 181766, "epoch": 4327} {"train_loss": -7.1992340087890625, "global_step": 181767, "epoch": 4327} {"train_loss": -7.1341633796691895, "global_step": 181768, "epoch": 4327} {"train_loss": -7.140852928161621, "global_step": 181769, "epoch": 4327} {"train_loss": -6.959938049316406, "global_step": 181770, "epoch": 4327} {"train_loss": -7.214245796203613, "global_step": 181771, "epoch": 4327} {"train_loss": -7.176300048828125, "global_step": 181772, "epoch": 4327} {"train_loss": -7.076186180114746, "global_step": 181773, "epoch": 4327} {"train_loss": -6.997555255889893, "global_step": 181774, "epoch": 4327} {"train_loss": -7.1148983637491865, "global_step": 181775, "epoch": 4327, "val_loss": 69323.296875} {"train_loss": -7.166782379150391, "global_step": 181776, "epoch": 4328} {"train_loss": -7.057811737060547, "global_step": 181777, "epoch": 4328} {"train_loss": -7.040234565734863, "global_step": 181778, "epoch": 4328} {"train_loss": -7.1674675941467285, "global_step": 181779, "epoch": 4328} {"train_loss": -7.127825736999512, "global_step": 181780, "epoch": 4328} {"train_loss": -7.100767135620117, "global_step": 181781, "epoch": 4328} {"train_loss": -7.095219135284424, "global_step": 181782, "epoch": 4328} {"train_loss": -7.104169845581055, "global_step": 181783, "epoch": 4328} {"train_loss": -7.107982635498047, "global_step": 181784, "epoch": 4328} {"train_loss": -7.105283260345459, "global_step": 181785, "epoch": 4328} {"train_loss": -7.093005180358887, "global_step": 181786, "epoch": 4328} {"train_loss": -7.137329578399658, "global_step": 181787, "epoch": 4328} {"train_loss": -7.081904888153076, "global_step": 181788, "epoch": 4328} {"train_loss": -7.067558765411377, "global_step": 181789, "epoch": 4328} {"train_loss": -7.0898542404174805, "global_step": 181790, "epoch": 4328} {"train_loss": -7.019323348999023, "global_step": 181791, "epoch": 4328} {"train_loss": -7.15887451171875, "global_step": 181792, "epoch": 4328} {"train_loss": -7.157876968383789, "global_step": 181793, "epoch": 4328} {"train_loss": -7.082281589508057, "global_step": 181794, "epoch": 4328} {"train_loss": -7.2160491943359375, "global_step": 181795, "epoch": 4328} {"train_loss": -7.203365802764893, "global_step": 181796, "epoch": 4328} {"train_loss": -7.18280553817749, "global_step": 181797, "epoch": 4328} {"train_loss": -7.1374969482421875, "global_step": 181798, "epoch": 4328} {"train_loss": -7.145380020141602, "global_step": 181799, "epoch": 4328} {"train_loss": -7.1167755126953125, "global_step": 181800, "epoch": 4328} {"train_loss": -7.127264022827148, "global_step": 181801, "epoch": 4328} {"train_loss": -7.213375091552734, "global_step": 181802, "epoch": 4328} {"train_loss": -7.046304702758789, "global_step": 181803, "epoch": 4328} {"train_loss": -7.103025436401367, "global_step": 181804, "epoch": 4328} {"train_loss": -7.215104103088379, "global_step": 181805, "epoch": 4328} {"train_loss": -7.104121208190918, "global_step": 181806, "epoch": 4328} {"train_loss": -7.077031135559082, "global_step": 181807, "epoch": 4328} {"train_loss": -7.026717662811279, "global_step": 181808, "epoch": 4328} {"train_loss": -7.219076156616211, "global_step": 181809, "epoch": 4328} {"train_loss": -7.119600296020508, "global_step": 181810, "epoch": 4328} {"train_loss": -7.212759494781494, "global_step": 181811, "epoch": 4328} {"train_loss": -7.08335542678833, "global_step": 181812, "epoch": 4328} {"train_loss": -7.034280776977539, "global_step": 181813, "epoch": 4328} {"train_loss": -7.270658493041992, "global_step": 181814, "epoch": 4328} {"train_loss": -6.930206298828125, "global_step": 181815, "epoch": 4328} {"train_loss": -7.0485358238220215, "global_step": 181816, "epoch": 4328} {"train_loss": -7.116636843908401, "global_step": 181817, "epoch": 4328, "val_loss": 69291.859375} {"train_loss": -7.1124067306518555, "global_step": 181818, "epoch": 4329} {"train_loss": -7.094952583312988, "global_step": 181819, "epoch": 4329} {"train_loss": -7.155126571655273, "global_step": 181820, "epoch": 4329} {"train_loss": -7.187121391296387, "global_step": 181821, "epoch": 4329} {"train_loss": -7.083812713623047, "global_step": 181822, "epoch": 4329} {"train_loss": -6.994960784912109, "global_step": 181823, "epoch": 4329} {"train_loss": -7.181666374206543, "global_step": 181824, "epoch": 4329} {"train_loss": -7.049421310424805, "global_step": 181825, "epoch": 4329} {"train_loss": -7.072134971618652, "global_step": 181826, "epoch": 4329} {"train_loss": -7.159674644470215, "global_step": 181827, "epoch": 4329} {"train_loss": -7.008512496948242, "global_step": 181828, "epoch": 4329} {"train_loss": -7.123403549194336, "global_step": 181829, "epoch": 4329} {"train_loss": -7.1355671882629395, "global_step": 181830, "epoch": 4329} {"train_loss": -6.913171768188477, "global_step": 181831, "epoch": 4329} {"train_loss": -7.201780319213867, "global_step": 181832, "epoch": 4329} {"train_loss": -6.957448959350586, "global_step": 181833, "epoch": 4329} {"train_loss": -7.008129596710205, "global_step": 181834, "epoch": 4329} {"train_loss": -7.0517401695251465, "global_step": 181835, "epoch": 4329} {"train_loss": -6.956362247467041, "global_step": 181836, "epoch": 4329} {"train_loss": -6.996218681335449, "global_step": 181837, "epoch": 4329} {"train_loss": -7.014065742492676, "global_step": 181838, "epoch": 4329} {"train_loss": -7.037143707275391, "global_step": 181839, "epoch": 4329} {"train_loss": -7.010783672332764, "global_step": 181840, "epoch": 4329} {"train_loss": -7.0143842697143555, "global_step": 181841, "epoch": 4329} {"train_loss": -7.0337347984313965, "global_step": 181842, "epoch": 4329} {"train_loss": -7.107737064361572, "global_step": 181843, "epoch": 4329} {"train_loss": -6.998134136199951, "global_step": 181844, "epoch": 4329} {"train_loss": -6.986601829528809, "global_step": 181845, "epoch": 4329} {"train_loss": -7.141143798828125, "global_step": 181846, "epoch": 4329} {"train_loss": -7.0139665603637695, "global_step": 181847, "epoch": 4329} {"train_loss": -6.952358245849609, "global_step": 181848, "epoch": 4329} {"train_loss": -7.050691604614258, "global_step": 181849, "epoch": 4329} {"train_loss": -6.91694450378418, "global_step": 181850, "epoch": 4329} {"train_loss": -7.141181468963623, "global_step": 181851, "epoch": 4329} {"train_loss": -7.147485256195068, "global_step": 181852, "epoch": 4329} {"train_loss": -7.062880516052246, "global_step": 181853, "epoch": 4329} {"train_loss": -7.1880269050598145, "global_step": 181854, "epoch": 4329} {"train_loss": -7.0990891456604, "global_step": 181855, "epoch": 4329} {"train_loss": -7.018238067626953, "global_step": 181856, "epoch": 4329} {"train_loss": -7.112271308898926, "global_step": 181857, "epoch": 4329} {"train_loss": -7.174787998199463, "global_step": 181858, "epoch": 4329} {"train_loss": -7.064990543183827, "global_step": 181859, "epoch": 4329, "val_loss": 69341.3046875} {"train_loss": -7.03029203414917, "global_step": 181860, "epoch": 4330} {"train_loss": -7.036538124084473, "global_step": 181861, "epoch": 4330} {"train_loss": -7.142702102661133, "global_step": 181862, "epoch": 4330} {"train_loss": -7.181225299835205, "global_step": 181863, "epoch": 4330} {"train_loss": -7.050100326538086, "global_step": 181864, "epoch": 4330} {"train_loss": -7.143752574920654, "global_step": 181865, "epoch": 4330} {"train_loss": -7.081496238708496, "global_step": 181866, "epoch": 4330} {"train_loss": -7.143899917602539, "global_step": 181867, "epoch": 4330} {"train_loss": -7.176523208618164, "global_step": 181868, "epoch": 4330} {"train_loss": -7.091413497924805, "global_step": 181869, "epoch": 4330} {"train_loss": -7.289241313934326, "global_step": 181870, "epoch": 4330} {"train_loss": -7.23727560043335, "global_step": 181871, "epoch": 4330} {"train_loss": -7.089531421661377, "global_step": 181872, "epoch": 4330} {"train_loss": -7.103753566741943, "global_step": 181873, "epoch": 4330} {"train_loss": -7.1388092041015625, "global_step": 181874, "epoch": 4330} {"train_loss": -7.192002296447754, "global_step": 181875, "epoch": 4330} {"train_loss": -7.240034103393555, "global_step": 181876, "epoch": 4330} {"train_loss": -7.147463798522949, "global_step": 181877, "epoch": 4330} {"train_loss": -7.086167335510254, "global_step": 181878, "epoch": 4330} {"train_loss": -7.1586151123046875, "global_step": 181879, "epoch": 4330} {"train_loss": -7.128134727478027, "global_step": 181880, "epoch": 4330} {"train_loss": -7.029801845550537, "global_step": 181881, "epoch": 4330} {"train_loss": -7.071468353271484, "global_step": 181882, "epoch": 4330} {"train_loss": -7.077090263366699, "global_step": 181883, "epoch": 4330} {"train_loss": -7.031523704528809, "global_step": 181884, "epoch": 4330} {"train_loss": -7.236628532409668, "global_step": 181885, "epoch": 4330} {"train_loss": -7.07814359664917, "global_step": 181886, "epoch": 4330} {"train_loss": -7.177716255187988, "global_step": 181887, "epoch": 4330} {"train_loss": -7.087977409362793, "global_step": 181888, "epoch": 4330} {"train_loss": -7.089050769805908, "global_step": 181889, "epoch": 4330} {"train_loss": -6.99248743057251, "global_step": 181890, "epoch": 4330} {"train_loss": -7.182155609130859, "global_step": 181891, "epoch": 4330} {"train_loss": -7.087125301361084, "global_step": 181892, "epoch": 4330} {"train_loss": -7.097902297973633, "global_step": 181893, "epoch": 4330} {"train_loss": -7.131270408630371, "global_step": 181894, "epoch": 4330} {"train_loss": -7.124566078186035, "global_step": 181895, "epoch": 4330} {"train_loss": -7.1406450271606445, "global_step": 181896, "epoch": 4330} {"train_loss": -7.062696933746338, "global_step": 181897, "epoch": 4330} {"train_loss": -7.161539077758789, "global_step": 181898, "epoch": 4330} {"train_loss": -7.186147212982178, "global_step": 181899, "epoch": 4330} {"train_loss": -7.227428436279297, "global_step": 181900, "epoch": 4330} {"train_loss": -7.126548415138608, "global_step": 181901, "epoch": 4330, "val_loss": 69387.8359375} {"train_loss": -7.125079154968262, "global_step": 181902, "epoch": 4331} {"train_loss": -7.122537612915039, "global_step": 181903, "epoch": 4331} {"train_loss": -7.20942497253418, "global_step": 181904, "epoch": 4331} {"train_loss": -7.159183979034424, "global_step": 181905, "epoch": 4331} {"train_loss": -7.2755818367004395, "global_step": 181906, "epoch": 4331} {"train_loss": -7.2298479080200195, "global_step": 181907, "epoch": 4331} {"train_loss": -7.100485801696777, "global_step": 181908, "epoch": 4331} {"train_loss": -7.18520975112915, "global_step": 181909, "epoch": 4331} {"train_loss": -7.130438327789307, "global_step": 181910, "epoch": 4331} {"train_loss": -7.170077323913574, "global_step": 181911, "epoch": 4331} {"train_loss": -7.120586395263672, "global_step": 181912, "epoch": 4331} {"train_loss": -7.258457183837891, "global_step": 181913, "epoch": 4331} {"train_loss": -7.165741443634033, "global_step": 181914, "epoch": 4331} {"train_loss": -7.1806111335754395, "global_step": 181915, "epoch": 4331} {"train_loss": -7.1116132736206055, "global_step": 181916, "epoch": 4331} {"train_loss": -7.071699142456055, "global_step": 181917, "epoch": 4331} {"train_loss": -7.158059120178223, "global_step": 181918, "epoch": 4331} {"train_loss": -7.1856842041015625, "global_step": 181919, "epoch": 4331} {"train_loss": -7.0869340896606445, "global_step": 181920, "epoch": 4331} {"train_loss": -7.026358604431152, "global_step": 181921, "epoch": 4331} {"train_loss": -7.115345001220703, "global_step": 181922, "epoch": 4331} {"train_loss": -7.289613723754883, "global_step": 181923, "epoch": 4331} {"train_loss": -7.133913040161133, "global_step": 181924, "epoch": 4331} {"train_loss": -7.208632469177246, "global_step": 181925, "epoch": 4331} {"train_loss": -7.116480350494385, "global_step": 181926, "epoch": 4331} {"train_loss": -7.3184380531311035, "global_step": 181927, "epoch": 4331} {"train_loss": -7.216386318206787, "global_step": 181928, "epoch": 4331} {"train_loss": -7.124914646148682, "global_step": 181929, "epoch": 4331} {"train_loss": -7.022920608520508, "global_step": 181930, "epoch": 4331} {"train_loss": -7.028629302978516, "global_step": 181931, "epoch": 4331} {"train_loss": -7.3173370361328125, "global_step": 181932, "epoch": 4331} {"train_loss": -7.065238952636719, "global_step": 181933, "epoch": 4331} {"train_loss": -7.20888614654541, "global_step": 181934, "epoch": 4331} {"train_loss": -7.270432472229004, "global_step": 181935, "epoch": 4331} {"train_loss": -7.071885108947754, "global_step": 181936, "epoch": 4331} {"train_loss": -7.200606346130371, "global_step": 181937, "epoch": 4331} {"train_loss": -7.131924629211426, "global_step": 181938, "epoch": 4331} {"train_loss": -7.167391777038574, "global_step": 181939, "epoch": 4331} {"train_loss": -7.134097576141357, "global_step": 181940, "epoch": 4331} {"train_loss": -7.166374683380127, "global_step": 181941, "epoch": 4331} {"train_loss": -7.1028218269348145, "global_step": 181942, "epoch": 4331} {"train_loss": -7.15409981636774, "global_step": 181943, "epoch": 4331, "val_loss": 69356.984375} {"train_loss": -7.21392297744751, "global_step": 181944, "epoch": 4332} {"train_loss": -7.015448570251465, "global_step": 181945, "epoch": 4332} {"train_loss": -7.1488423347473145, "global_step": 181946, "epoch": 4332} {"train_loss": -7.154449462890625, "global_step": 181947, "epoch": 4332} {"train_loss": -7.12211799621582, "global_step": 181948, "epoch": 4332} {"train_loss": -7.226171970367432, "global_step": 181949, "epoch": 4332} {"train_loss": -7.048614501953125, "global_step": 181950, "epoch": 4332} {"train_loss": -7.212091445922852, "global_step": 181951, "epoch": 4332} {"train_loss": -7.2285919189453125, "global_step": 181952, "epoch": 4332} {"train_loss": -7.113929748535156, "global_step": 181953, "epoch": 4332} {"train_loss": -7.267658233642578, "global_step": 181954, "epoch": 4332} {"train_loss": -7.164180278778076, "global_step": 181955, "epoch": 4332} {"train_loss": -7.405908584594727, "global_step": 181956, "epoch": 4332} {"train_loss": -7.184605121612549, "global_step": 181957, "epoch": 4332} {"train_loss": -7.293793201446533, "global_step": 181958, "epoch": 4332} {"train_loss": -7.208192825317383, "global_step": 181959, "epoch": 4332} {"train_loss": -7.107975006103516, "global_step": 181960, "epoch": 4332} {"train_loss": -7.078913688659668, "global_step": 181961, "epoch": 4332} {"train_loss": -7.222596168518066, "global_step": 181962, "epoch": 4332} {"train_loss": -6.891993522644043, "global_step": 181963, "epoch": 4332} {"train_loss": -7.0435919761657715, "global_step": 181964, "epoch": 4332} {"train_loss": -7.169822692871094, "global_step": 181965, "epoch": 4332} {"train_loss": -7.0120649337768555, "global_step": 181966, "epoch": 4332} {"train_loss": -7.1097822189331055, "global_step": 181967, "epoch": 4332} {"train_loss": -7.109289169311523, "global_step": 181968, "epoch": 4332} {"train_loss": -7.0736541748046875, "global_step": 181969, "epoch": 4332} {"train_loss": -7.1515936851501465, "global_step": 181970, "epoch": 4332} {"train_loss": -7.079686164855957, "global_step": 181971, "epoch": 4332} {"train_loss": -7.19798469543457, "global_step": 181972, "epoch": 4332} {"train_loss": -7.083473205566406, "global_step": 181973, "epoch": 4332} {"train_loss": -7.144501686096191, "global_step": 181974, "epoch": 4332} {"train_loss": -7.266523838043213, "global_step": 181975, "epoch": 4332} {"train_loss": -7.105194091796875, "global_step": 181976, "epoch": 4332} {"train_loss": -7.097632884979248, "global_step": 181977, "epoch": 4332} {"train_loss": -7.154426574707031, "global_step": 181978, "epoch": 4332} {"train_loss": -7.228743553161621, "global_step": 181979, "epoch": 4332} {"train_loss": -7.105121612548828, "global_step": 181980, "epoch": 4332} {"train_loss": -7.176792144775391, "global_step": 181981, "epoch": 4332} {"train_loss": -7.25235652923584, "global_step": 181982, "epoch": 4332} {"train_loss": -7.143626689910889, "global_step": 181983, "epoch": 4332} {"train_loss": -7.213564395904541, "global_step": 181984, "epoch": 4332} {"train_loss": -7.151951426551456, "global_step": 181985, "epoch": 4332, "val_loss": 69418.0625} {"train_loss": -7.167486190795898, "global_step": 181986, "epoch": 4333} {"train_loss": -7.1884002685546875, "global_step": 181987, "epoch": 4333} {"train_loss": -7.185608863830566, "global_step": 181988, "epoch": 4333} {"train_loss": -7.0119404792785645, "global_step": 181989, "epoch": 4333} {"train_loss": -7.101756572723389, "global_step": 181990, "epoch": 4333} {"train_loss": -7.076594352722168, "global_step": 181991, "epoch": 4333} {"train_loss": -7.041233062744141, "global_step": 181992, "epoch": 4333} {"train_loss": -7.133197784423828, "global_step": 181993, "epoch": 4333} {"train_loss": -7.088289260864258, "global_step": 181994, "epoch": 4333} {"train_loss": -7.036452293395996, "global_step": 181995, "epoch": 4333} {"train_loss": -7.101785659790039, "global_step": 181996, "epoch": 4333} {"train_loss": -6.940281867980957, "global_step": 181997, "epoch": 4333} {"train_loss": -7.099712371826172, "global_step": 181998, "epoch": 4333} {"train_loss": -7.002098083496094, "global_step": 181999, "epoch": 4333} {"train_loss": -7.050310134887695, "global_step": 182000, "epoch": 4333} {"train_loss": -7.027435779571533, "global_step": 182001, "epoch": 4333} {"train_loss": -7.00614070892334, "global_step": 182002, "epoch": 4333} {"train_loss": -7.283324718475342, "global_step": 182003, "epoch": 4333} {"train_loss": -7.19667911529541, "global_step": 182004, "epoch": 4333} {"train_loss": -7.123634338378906, "global_step": 182005, "epoch": 4333} {"train_loss": -7.096831321716309, "global_step": 182006, "epoch": 4333} {"train_loss": -6.969796180725098, "global_step": 182007, "epoch": 4333} {"train_loss": -7.062941551208496, "global_step": 182008, "epoch": 4333} {"train_loss": -7.054394721984863, "global_step": 182009, "epoch": 4333} {"train_loss": -7.155820846557617, "global_step": 182010, "epoch": 4333} {"train_loss": -7.154131889343262, "global_step": 182011, "epoch": 4333} {"train_loss": -7.070384502410889, "global_step": 182012, "epoch": 4333} {"train_loss": -7.014843463897705, "global_step": 182013, "epoch": 4333} {"train_loss": -7.214670658111572, "global_step": 182014, "epoch": 4333} {"train_loss": -7.175043106079102, "global_step": 182015, "epoch": 4333} {"train_loss": -6.976367950439453, "global_step": 182016, "epoch": 4333} {"train_loss": -7.030751705169678, "global_step": 182017, "epoch": 4333} {"train_loss": -7.0907979011535645, "global_step": 182018, "epoch": 4333} {"train_loss": -7.0477800369262695, "global_step": 182019, "epoch": 4333} {"train_loss": -7.064462661743164, "global_step": 182020, "epoch": 4333} {"train_loss": -7.193565368652344, "global_step": 182021, "epoch": 4333} {"train_loss": -7.067512512207031, "global_step": 182022, "epoch": 4333} {"train_loss": -7.156347274780273, "global_step": 182023, "epoch": 4333} {"train_loss": -7.082035064697266, "global_step": 182024, "epoch": 4333} {"train_loss": -7.079577445983887, "global_step": 182025, "epoch": 4333} {"train_loss": -7.009415149688721, "global_step": 182026, "epoch": 4333} {"train_loss": -7.082566931134179, "global_step": 182027, "epoch": 4333, "val_loss": 69537.9765625} {"train_loss": -7.131566524505615, "global_step": 182028, "epoch": 4334} {"train_loss": -7.101585388183594, "global_step": 182029, "epoch": 4334} {"train_loss": -7.004195690155029, "global_step": 182030, "epoch": 4334} {"train_loss": -7.062145709991455, "global_step": 182031, "epoch": 4334} {"train_loss": -6.96202278137207, "global_step": 182032, "epoch": 4334} {"train_loss": -6.926919937133789, "global_step": 182033, "epoch": 4334} {"train_loss": -7.135464668273926, "global_step": 182034, "epoch": 4334} {"train_loss": -6.99473762512207, "global_step": 182035, "epoch": 4334} {"train_loss": -7.033802509307861, "global_step": 182036, "epoch": 4334} {"train_loss": -7.076010704040527, "global_step": 182037, "epoch": 4334} {"train_loss": -7.132604598999023, "global_step": 182038, "epoch": 4334} {"train_loss": -7.068972587585449, "global_step": 182039, "epoch": 4334} {"train_loss": -7.023009300231934, "global_step": 182040, "epoch": 4334} {"train_loss": -7.201435089111328, "global_step": 182041, "epoch": 4334} {"train_loss": -7.191741943359375, "global_step": 182042, "epoch": 4334} {"train_loss": -7.076839923858643, "global_step": 182043, "epoch": 4334} {"train_loss": -7.083896636962891, "global_step": 182044, "epoch": 4334} {"train_loss": -7.072978973388672, "global_step": 182045, "epoch": 4334} {"train_loss": -7.1465535163879395, "global_step": 182046, "epoch": 4334} {"train_loss": -7.159631729125977, "global_step": 182047, "epoch": 4334} {"train_loss": -7.197315692901611, "global_step": 182048, "epoch": 4334} {"train_loss": -7.169427871704102, "global_step": 182049, "epoch": 4334} {"train_loss": -7.117179870605469, "global_step": 182050, "epoch": 4334} {"train_loss": -7.209684371948242, "global_step": 182051, "epoch": 4334} {"train_loss": -7.182429313659668, "global_step": 182052, "epoch": 4334} {"train_loss": -7.104543685913086, "global_step": 182053, "epoch": 4334} {"train_loss": -7.173775672912598, "global_step": 182054, "epoch": 4334} {"train_loss": -7.132884979248047, "global_step": 182055, "epoch": 4334} {"train_loss": -7.248877048492432, "global_step": 182056, "epoch": 4334} {"train_loss": -7.254530906677246, "global_step": 182057, "epoch": 4334} {"train_loss": -7.155556678771973, "global_step": 182058, "epoch": 4334} {"train_loss": -7.237445831298828, "global_step": 182059, "epoch": 4334} {"train_loss": -7.14046573638916, "global_step": 182060, "epoch": 4334} {"train_loss": -7.236532688140869, "global_step": 182061, "epoch": 4334} {"train_loss": -7.118921279907227, "global_step": 182062, "epoch": 4334} {"train_loss": -7.13795280456543, "global_step": 182063, "epoch": 4334} {"train_loss": -7.131638526916504, "global_step": 182064, "epoch": 4334} {"train_loss": -7.261132717132568, "global_step": 182065, "epoch": 4334} {"train_loss": -7.088291168212891, "global_step": 182066, "epoch": 4334} {"train_loss": -7.264334678649902, "global_step": 182067, "epoch": 4334} {"train_loss": -7.145332336425781, "global_step": 182068, "epoch": 4334} {"train_loss": -7.129318555196126, "global_step": 182069, "epoch": 4334, "val_loss": 69474.2578125} {"train_loss": -7.0909929275512695, "global_step": 182070, "epoch": 4335} {"train_loss": -7.242493152618408, "global_step": 182071, "epoch": 4335} {"train_loss": -7.0945940017700195, "global_step": 182072, "epoch": 4335} {"train_loss": -7.2156982421875, "global_step": 182073, "epoch": 4335} {"train_loss": -7.154992580413818, "global_step": 182074, "epoch": 4335} {"train_loss": -7.169859409332275, "global_step": 182075, "epoch": 4335} {"train_loss": -7.203241348266602, "global_step": 182076, "epoch": 4335} {"train_loss": -7.068484783172607, "global_step": 182077, "epoch": 4335} {"train_loss": -7.292200565338135, "global_step": 182078, "epoch": 4335} {"train_loss": -7.223682403564453, "global_step": 182079, "epoch": 4335} {"train_loss": -7.0993804931640625, "global_step": 182080, "epoch": 4335} {"train_loss": -7.2223310470581055, "global_step": 182081, "epoch": 4335} {"train_loss": -7.110721588134766, "global_step": 182082, "epoch": 4335} {"train_loss": -7.118952751159668, "global_step": 182083, "epoch": 4335} {"train_loss": -7.289306640625, "global_step": 182084, "epoch": 4335} {"train_loss": -7.090058326721191, "global_step": 182085, "epoch": 4335} {"train_loss": -7.073801040649414, "global_step": 182086, "epoch": 4335} {"train_loss": -7.189216136932373, "global_step": 182087, "epoch": 4335} {"train_loss": -7.109752655029297, "global_step": 182088, "epoch": 4335} {"train_loss": -7.16861629486084, "global_step": 182089, "epoch": 4335} {"train_loss": -7.085565567016602, "global_step": 182090, "epoch": 4335} {"train_loss": -7.092865943908691, "global_step": 182091, "epoch": 4335} {"train_loss": -7.090112209320068, "global_step": 182092, "epoch": 4335} {"train_loss": -7.204122543334961, "global_step": 182093, "epoch": 4335} {"train_loss": -7.135290145874023, "global_step": 182094, "epoch": 4335} {"train_loss": -7.170231819152832, "global_step": 182095, "epoch": 4335} {"train_loss": -7.141238212585449, "global_step": 182096, "epoch": 4335} {"train_loss": -7.123822212219238, "global_step": 182097, "epoch": 4335} {"train_loss": -7.121596336364746, "global_step": 182098, "epoch": 4335} {"train_loss": -7.1421427726745605, "global_step": 182099, "epoch": 4335} {"train_loss": -7.054211139678955, "global_step": 182100, "epoch": 4335} {"train_loss": -7.030977249145508, "global_step": 182101, "epoch": 4335} {"train_loss": -7.016877174377441, "global_step": 182102, "epoch": 4335} {"train_loss": -7.231980323791504, "global_step": 182103, "epoch": 4335} {"train_loss": -7.077108860015869, "global_step": 182104, "epoch": 4335} {"train_loss": -7.094742298126221, "global_step": 182105, "epoch": 4335} {"train_loss": -7.147490501403809, "global_step": 182106, "epoch": 4335} {"train_loss": -7.090527534484863, "global_step": 182107, "epoch": 4335} {"train_loss": -7.138565540313721, "global_step": 182108, "epoch": 4335} {"train_loss": -7.132152557373047, "global_step": 182109, "epoch": 4335} {"train_loss": -6.9810943603515625, "global_step": 182110, "epoch": 4335} {"train_loss": -7.135270618257069, "global_step": 182111, "epoch": 4335, "val_loss": 69387.9375} {"train_loss": -7.1220703125, "global_step": 182112, "epoch": 4336} {"train_loss": -7.029558181762695, "global_step": 182113, "epoch": 4336} {"train_loss": -7.108591556549072, "global_step": 182114, "epoch": 4336} {"train_loss": -7.06484317779541, "global_step": 182115, "epoch": 4336} {"train_loss": -7.060859680175781, "global_step": 182116, "epoch": 4336} {"train_loss": -7.1802473068237305, "global_step": 182117, "epoch": 4336} {"train_loss": -7.106993198394775, "global_step": 182118, "epoch": 4336} {"train_loss": -7.148141860961914, "global_step": 182119, "epoch": 4336} {"train_loss": -7.192660331726074, "global_step": 182120, "epoch": 4336} {"train_loss": -7.08596134185791, "global_step": 182121, "epoch": 4336} {"train_loss": -7.1704511642456055, "global_step": 182122, "epoch": 4336} {"train_loss": -7.054859161376953, "global_step": 182123, "epoch": 4336} {"train_loss": -7.0834527015686035, "global_step": 182124, "epoch": 4336} {"train_loss": -7.261087417602539, "global_step": 182125, "epoch": 4336} {"train_loss": -7.062887191772461, "global_step": 182126, "epoch": 4336} {"train_loss": -7.038602828979492, "global_step": 182127, "epoch": 4336} {"train_loss": -7.185388565063477, "global_step": 182128, "epoch": 4336} {"train_loss": -7.0580596923828125, "global_step": 182129, "epoch": 4336} {"train_loss": -7.16340446472168, "global_step": 182130, "epoch": 4336} {"train_loss": -7.0999603271484375, "global_step": 182131, "epoch": 4336} {"train_loss": -7.054508209228516, "global_step": 182132, "epoch": 4336} {"train_loss": -7.062289237976074, "global_step": 182133, "epoch": 4336} {"train_loss": -7.041060447692871, "global_step": 182134, "epoch": 4336} {"train_loss": -7.085331439971924, "global_step": 182135, "epoch": 4336} {"train_loss": -7.108469009399414, "global_step": 182136, "epoch": 4336} {"train_loss": -7.283679008483887, "global_step": 182137, "epoch": 4336} {"train_loss": -7.140069484710693, "global_step": 182138, "epoch": 4336} {"train_loss": -7.238417148590088, "global_step": 182139, "epoch": 4336} {"train_loss": -7.1562819480896, "global_step": 182140, "epoch": 4336} {"train_loss": -7.244779586791992, "global_step": 182141, "epoch": 4336} {"train_loss": -7.167577743530273, "global_step": 182142, "epoch": 4336} {"train_loss": -7.190889358520508, "global_step": 182143, "epoch": 4336} {"train_loss": -7.031187057495117, "global_step": 182144, "epoch": 4336} {"train_loss": -7.177707672119141, "global_step": 182145, "epoch": 4336} {"train_loss": -7.223287105560303, "global_step": 182146, "epoch": 4336} {"train_loss": -7.194052219390869, "global_step": 182147, "epoch": 4336} {"train_loss": -7.059659004211426, "global_step": 182148, "epoch": 4336} {"train_loss": -7.118206977844238, "global_step": 182149, "epoch": 4336} {"train_loss": -7.107440948486328, "global_step": 182150, "epoch": 4336} {"train_loss": -6.951699256896973, "global_step": 182151, "epoch": 4336} {"train_loss": -6.9915618896484375, "global_step": 182152, "epoch": 4336} {"train_loss": -7.120141392662411, "global_step": 182153, "epoch": 4336, "val_loss": 69363.765625} {"train_loss": -7.19329309463501, "global_step": 182154, "epoch": 4337} {"train_loss": -7.125008583068848, "global_step": 182155, "epoch": 4337} {"train_loss": -7.169414043426514, "global_step": 182156, "epoch": 4337} {"train_loss": -7.204496383666992, "global_step": 182157, "epoch": 4337} {"train_loss": -7.109013080596924, "global_step": 182158, "epoch": 4337} {"train_loss": -7.142998695373535, "global_step": 182159, "epoch": 4337} {"train_loss": -7.111000061035156, "global_step": 182160, "epoch": 4337} {"train_loss": -7.028810501098633, "global_step": 182161, "epoch": 4337} {"train_loss": -7.165334701538086, "global_step": 182162, "epoch": 4337} {"train_loss": -7.105911731719971, "global_step": 182163, "epoch": 4337} {"train_loss": -7.206120491027832, "global_step": 182164, "epoch": 4337} {"train_loss": -7.086236953735352, "global_step": 182165, "epoch": 4337} {"train_loss": -7.085052967071533, "global_step": 182166, "epoch": 4337} {"train_loss": -6.965291976928711, "global_step": 182167, "epoch": 4337} {"train_loss": -7.017849445343018, "global_step": 182168, "epoch": 4337} {"train_loss": -7.177830696105957, "global_step": 182169, "epoch": 4337} {"train_loss": -7.018915176391602, "global_step": 182170, "epoch": 4337} {"train_loss": -7.126858234405518, "global_step": 182171, "epoch": 4337} {"train_loss": -7.0510454177856445, "global_step": 182172, "epoch": 4337} {"train_loss": -7.113242149353027, "global_step": 182173, "epoch": 4337} {"train_loss": -7.136256217956543, "global_step": 182174, "epoch": 4337} {"train_loss": -6.915904998779297, "global_step": 182175, "epoch": 4337} {"train_loss": -7.101115703582764, "global_step": 182176, "epoch": 4337} {"train_loss": -7.027655601501465, "global_step": 182177, "epoch": 4337} {"train_loss": -7.153687953948975, "global_step": 182178, "epoch": 4337} {"train_loss": -7.141952991485596, "global_step": 182179, "epoch": 4337} {"train_loss": -7.051865577697754, "global_step": 182180, "epoch": 4337} {"train_loss": -7.170916557312012, "global_step": 182181, "epoch": 4337} {"train_loss": -6.984803676605225, "global_step": 182182, "epoch": 4337} {"train_loss": -7.159338474273682, "global_step": 182183, "epoch": 4337} {"train_loss": -7.061781883239746, "global_step": 182184, "epoch": 4337} {"train_loss": -7.141082763671875, "global_step": 182185, "epoch": 4337} {"train_loss": -7.070023536682129, "global_step": 182186, "epoch": 4337} {"train_loss": -7.017995834350586, "global_step": 182187, "epoch": 4337} {"train_loss": -7.090666770935059, "global_step": 182188, "epoch": 4337} {"train_loss": -6.971043586730957, "global_step": 182189, "epoch": 4337} {"train_loss": -7.016664981842041, "global_step": 182190, "epoch": 4337} {"train_loss": -7.087222099304199, "global_step": 182191, "epoch": 4337} {"train_loss": -7.138896942138672, "global_step": 182192, "epoch": 4337} {"train_loss": -7.133440971374512, "global_step": 182193, "epoch": 4337} {"train_loss": -7.042101860046387, "global_step": 182194, "epoch": 4337} {"train_loss": -7.0921897093455, "global_step": 182195, "epoch": 4337, "val_loss": 69318.0234375} {"train_loss": -7.138388633728027, "global_step": 182196, "epoch": 4338} {"train_loss": -7.144190311431885, "global_step": 182197, "epoch": 4338} {"train_loss": -7.092543601989746, "global_step": 182198, "epoch": 4338} {"train_loss": -7.182990550994873, "global_step": 182199, "epoch": 4338} {"train_loss": -7.057992935180664, "global_step": 182200, "epoch": 4338} {"train_loss": -7.156252384185791, "global_step": 182201, "epoch": 4338} {"train_loss": -7.11248254776001, "global_step": 182202, "epoch": 4338} {"train_loss": -7.176552772521973, "global_step": 182203, "epoch": 4338} {"train_loss": -7.171860218048096, "global_step": 182204, "epoch": 4338} {"train_loss": -7.104743480682373, "global_step": 182205, "epoch": 4338} {"train_loss": -6.976711750030518, "global_step": 182206, "epoch": 4338} {"train_loss": -7.107571601867676, "global_step": 182207, "epoch": 4338} {"train_loss": -7.05958366394043, "global_step": 182208, "epoch": 4338} {"train_loss": -7.020150661468506, "global_step": 182209, "epoch": 4338} {"train_loss": -7.1097564697265625, "global_step": 182210, "epoch": 4338} {"train_loss": -7.137988090515137, "global_step": 182211, "epoch": 4338} {"train_loss": -7.198225021362305, "global_step": 182212, "epoch": 4338} {"train_loss": -7.199361801147461, "global_step": 182213, "epoch": 4338} {"train_loss": -7.084330081939697, "global_step": 182214, "epoch": 4338} {"train_loss": -7.148820877075195, "global_step": 182215, "epoch": 4338} {"train_loss": -7.117639541625977, "global_step": 182216, "epoch": 4338} {"train_loss": -7.150167465209961, "global_step": 182217, "epoch": 4338} {"train_loss": -7.125819206237793, "global_step": 182218, "epoch": 4338} {"train_loss": -7.089754581451416, "global_step": 182219, "epoch": 4338} {"train_loss": -7.235470771789551, "global_step": 182220, "epoch": 4338} {"train_loss": -7.119184970855713, "global_step": 182221, "epoch": 4338} {"train_loss": -7.076234340667725, "global_step": 182222, "epoch": 4338} {"train_loss": -7.144400596618652, "global_step": 182223, "epoch": 4338} {"train_loss": -6.906933784484863, "global_step": 182224, "epoch": 4338} {"train_loss": -7.112081527709961, "global_step": 182225, "epoch": 4338} {"train_loss": -7.032440185546875, "global_step": 182226, "epoch": 4338} {"train_loss": -7.047057628631592, "global_step": 182227, "epoch": 4338} {"train_loss": -7.1660661697387695, "global_step": 182228, "epoch": 4338} {"train_loss": -7.0375800132751465, "global_step": 182229, "epoch": 4338} {"train_loss": -7.1930999755859375, "global_step": 182230, "epoch": 4338} {"train_loss": -7.0028767585754395, "global_step": 182231, "epoch": 4338} {"train_loss": -7.167888641357422, "global_step": 182232, "epoch": 4338} {"train_loss": -7.162744522094727, "global_step": 182233, "epoch": 4338} {"train_loss": -7.079760551452637, "global_step": 182234, "epoch": 4338} {"train_loss": -7.129756927490234, "global_step": 182235, "epoch": 4338} {"train_loss": -7.066811561584473, "global_step": 182236, "epoch": 4338} {"train_loss": -7.1111493564787365, "global_step": 182237, "epoch": 4338, "val_loss": 69208.8203125} {"train_loss": -7.188486099243164, "global_step": 182238, "epoch": 4339} {"train_loss": -7.161170959472656, "global_step": 182239, "epoch": 4339} {"train_loss": -7.211435794830322, "global_step": 182240, "epoch": 4339} {"train_loss": -7.140813827514648, "global_step": 182241, "epoch": 4339} {"train_loss": -7.139639854431152, "global_step": 182242, "epoch": 4339} {"train_loss": -7.076183795928955, "global_step": 182243, "epoch": 4339} {"train_loss": -7.040641784667969, "global_step": 182244, "epoch": 4339} {"train_loss": -7.031587600708008, "global_step": 182245, "epoch": 4339} {"train_loss": -7.072785377502441, "global_step": 182246, "epoch": 4339} {"train_loss": -7.025289535522461, "global_step": 182247, "epoch": 4339} {"train_loss": -7.097294330596924, "global_step": 182248, "epoch": 4339} {"train_loss": -7.144528865814209, "global_step": 182249, "epoch": 4339} {"train_loss": -7.117693901062012, "global_step": 182250, "epoch": 4339} {"train_loss": -7.119585037231445, "global_step": 182251, "epoch": 4339} {"train_loss": -7.0373005867004395, "global_step": 182252, "epoch": 4339} {"train_loss": -7.165866851806641, "global_step": 182253, "epoch": 4339} {"train_loss": -7.17286491394043, "global_step": 182254, "epoch": 4339} {"train_loss": -7.061087131500244, "global_step": 182255, "epoch": 4339} {"train_loss": -7.181948661804199, "global_step": 182256, "epoch": 4339} {"train_loss": -7.116299152374268, "global_step": 182257, "epoch": 4339} {"train_loss": -7.109790325164795, "global_step": 182258, "epoch": 4339} {"train_loss": -7.158539772033691, "global_step": 182259, "epoch": 4339} {"train_loss": -7.064706802368164, "global_step": 182260, "epoch": 4339} {"train_loss": -7.3072075843811035, "global_step": 182261, "epoch": 4339} {"train_loss": -7.122204780578613, "global_step": 182262, "epoch": 4339} {"train_loss": -6.9554219245910645, "global_step": 182263, "epoch": 4339} {"train_loss": -7.065755844116211, "global_step": 182264, "epoch": 4339} {"train_loss": -7.056643486022949, "global_step": 182265, "epoch": 4339} {"train_loss": -7.118903160095215, "global_step": 182266, "epoch": 4339} {"train_loss": -6.960362434387207, "global_step": 182267, "epoch": 4339} {"train_loss": -7.103919506072998, "global_step": 182268, "epoch": 4339} {"train_loss": -6.974597930908203, "global_step": 182269, "epoch": 4339} {"train_loss": -7.1843061447143555, "global_step": 182270, "epoch": 4339} {"train_loss": -7.208720684051514, "global_step": 182271, "epoch": 4339} {"train_loss": -7.136411666870117, "global_step": 182272, "epoch": 4339} {"train_loss": -7.247348785400391, "global_step": 182273, "epoch": 4339} {"train_loss": -6.947527885437012, "global_step": 182274, "epoch": 4339} {"train_loss": -7.204334259033203, "global_step": 182275, "epoch": 4339} {"train_loss": -7.02977180480957, "global_step": 182276, "epoch": 4339} {"train_loss": -7.047013759613037, "global_step": 182277, "epoch": 4339} {"train_loss": -7.087404251098633, "global_step": 182278, "epoch": 4339} {"train_loss": -7.1057060446058005, "global_step": 182279, "epoch": 4339, "val_loss": 69434.1015625} {"train_loss": -7.157943248748779, "global_step": 182280, "epoch": 4340} {"train_loss": -7.030228614807129, "global_step": 182281, "epoch": 4340} {"train_loss": -7.106326103210449, "global_step": 182282, "epoch": 4340} {"train_loss": -7.101859092712402, "global_step": 182283, "epoch": 4340} {"train_loss": -7.109701156616211, "global_step": 182284, "epoch": 4340} {"train_loss": -7.155165195465088, "global_step": 182285, "epoch": 4340} {"train_loss": -7.0394086837768555, "global_step": 182286, "epoch": 4340} {"train_loss": -7.0716352462768555, "global_step": 182287, "epoch": 4340} {"train_loss": -7.150033950805664, "global_step": 182288, "epoch": 4340} {"train_loss": -7.171503067016602, "global_step": 182289, "epoch": 4340} {"train_loss": -7.040185928344727, "global_step": 182290, "epoch": 4340} {"train_loss": -7.065103530883789, "global_step": 182291, "epoch": 4340} {"train_loss": -7.085927963256836, "global_step": 182292, "epoch": 4340} {"train_loss": -7.1050028800964355, "global_step": 182293, "epoch": 4340} {"train_loss": -7.085692882537842, "global_step": 182294, "epoch": 4340} {"train_loss": -6.982918739318848, "global_step": 182295, "epoch": 4340} {"train_loss": -7.018134593963623, "global_step": 182296, "epoch": 4340} {"train_loss": -7.070583820343018, "global_step": 182297, "epoch": 4340} {"train_loss": -7.151699066162109, "global_step": 182298, "epoch": 4340} {"train_loss": -7.1932220458984375, "global_step": 182299, "epoch": 4340} {"train_loss": -7.0939483642578125, "global_step": 182300, "epoch": 4340} {"train_loss": -7.0327324867248535, "global_step": 182301, "epoch": 4340} {"train_loss": -7.063752174377441, "global_step": 182302, "epoch": 4340} {"train_loss": -7.076657295227051, "global_step": 182303, "epoch": 4340} {"train_loss": -7.152320861816406, "global_step": 182304, "epoch": 4340} {"train_loss": -7.207874298095703, "global_step": 182305, "epoch": 4340} {"train_loss": -7.106721878051758, "global_step": 182306, "epoch": 4340} {"train_loss": -7.134439468383789, "global_step": 182307, "epoch": 4340} {"train_loss": -7.129250526428223, "global_step": 182308, "epoch": 4340} {"train_loss": -7.206341743469238, "global_step": 182309, "epoch": 4340} {"train_loss": -7.120231628417969, "global_step": 182310, "epoch": 4340} {"train_loss": -7.096953868865967, "global_step": 182311, "epoch": 4340} {"train_loss": -7.159287452697754, "global_step": 182312, "epoch": 4340} {"train_loss": -7.152235984802246, "global_step": 182313, "epoch": 4340} {"train_loss": -7.15371036529541, "global_step": 182314, "epoch": 4340} {"train_loss": -7.179555892944336, "global_step": 182315, "epoch": 4340} {"train_loss": -7.075745582580566, "global_step": 182316, "epoch": 4340} {"train_loss": -7.1904377937316895, "global_step": 182317, "epoch": 4340} {"train_loss": -7.199404716491699, "global_step": 182318, "epoch": 4340} {"train_loss": -7.219377517700195, "global_step": 182319, "epoch": 4340} {"train_loss": -7.164246082305908, "global_step": 182320, "epoch": 4340} {"train_loss": -7.11997788293021, "global_step": 182321, "epoch": 4340, "val_loss": 69181.1796875} {"train_loss": -7.133825302124023, "global_step": 182322, "epoch": 4341} {"train_loss": -7.138374328613281, "global_step": 182323, "epoch": 4341} {"train_loss": -7.253735542297363, "global_step": 182324, "epoch": 4341} {"train_loss": -7.190967559814453, "global_step": 182325, "epoch": 4341} {"train_loss": -7.140301704406738, "global_step": 182326, "epoch": 4341} {"train_loss": -7.036540985107422, "global_step": 182327, "epoch": 4341} {"train_loss": -7.122125625610352, "global_step": 182328, "epoch": 4341} {"train_loss": -7.206948280334473, "global_step": 182329, "epoch": 4341} {"train_loss": -6.993049144744873, "global_step": 182330, "epoch": 4341} {"train_loss": -6.9691925048828125, "global_step": 182331, "epoch": 4341} {"train_loss": -7.037472724914551, "global_step": 182332, "epoch": 4341} {"train_loss": -7.044893741607666, "global_step": 182333, "epoch": 4341} {"train_loss": -7.082629680633545, "global_step": 182334, "epoch": 4341} {"train_loss": -7.26734733581543, "global_step": 182335, "epoch": 4341} {"train_loss": -7.173264503479004, "global_step": 182336, "epoch": 4341} {"train_loss": -7.117116928100586, "global_step": 182337, "epoch": 4341} {"train_loss": -7.161359786987305, "global_step": 182338, "epoch": 4341} {"train_loss": -7.215095043182373, "global_step": 182339, "epoch": 4341} {"train_loss": -7.240678787231445, "global_step": 182340, "epoch": 4341} {"train_loss": -7.2238287925720215, "global_step": 182341, "epoch": 4341} {"train_loss": -7.260831356048584, "global_step": 182342, "epoch": 4341} {"train_loss": -7.099658012390137, "global_step": 182343, "epoch": 4341} {"train_loss": -7.173346519470215, "global_step": 182344, "epoch": 4341} {"train_loss": -7.140642166137695, "global_step": 182345, "epoch": 4341} {"train_loss": -7.124463081359863, "global_step": 182346, "epoch": 4341} {"train_loss": -7.032046318054199, "global_step": 182347, "epoch": 4341} {"train_loss": -7.238192558288574, "global_step": 182348, "epoch": 4341} {"train_loss": -7.11464786529541, "global_step": 182349, "epoch": 4341} {"train_loss": -7.255147933959961, "global_step": 182350, "epoch": 4341} {"train_loss": -7.099428653717041, "global_step": 182351, "epoch": 4341} {"train_loss": -7.1835246086120605, "global_step": 182352, "epoch": 4341} {"train_loss": -7.188961505889893, "global_step": 182353, "epoch": 4341} {"train_loss": -7.1245341300964355, "global_step": 182354, "epoch": 4341} {"train_loss": -7.171089172363281, "global_step": 182355, "epoch": 4341} {"train_loss": -7.0358428955078125, "global_step": 182356, "epoch": 4341} {"train_loss": -7.252976894378662, "global_step": 182357, "epoch": 4341} {"train_loss": -7.181290626525879, "global_step": 182358, "epoch": 4341} {"train_loss": -7.105600357055664, "global_step": 182359, "epoch": 4341} {"train_loss": -7.185020446777344, "global_step": 182360, "epoch": 4341} {"train_loss": -7.168449878692627, "global_step": 182361, "epoch": 4341} {"train_loss": -7.152983665466309, "global_step": 182362, "epoch": 4341} {"train_loss": -7.146757125854492, "global_step": 182363, "epoch": 4341, "val_loss": 69334.7109375} {"train_loss": -7.040363311767578, "global_step": 182364, "epoch": 4342} {"train_loss": -7.141009330749512, "global_step": 182365, "epoch": 4342} {"train_loss": -7.076630592346191, "global_step": 182366, "epoch": 4342} {"train_loss": -7.042965888977051, "global_step": 182367, "epoch": 4342} {"train_loss": -7.093044281005859, "global_step": 182368, "epoch": 4342} {"train_loss": -7.011172294616699, "global_step": 182369, "epoch": 4342} {"train_loss": -7.16774845123291, "global_step": 182370, "epoch": 4342} {"train_loss": -7.124819755554199, "global_step": 182371, "epoch": 4342} {"train_loss": -7.146931171417236, "global_step": 182372, "epoch": 4342} {"train_loss": -7.198976993560791, "global_step": 182373, "epoch": 4342} {"train_loss": -7.205313682556152, "global_step": 182374, "epoch": 4342} {"train_loss": -7.181950569152832, "global_step": 182375, "epoch": 4342} {"train_loss": -7.075140953063965, "global_step": 182376, "epoch": 4342} {"train_loss": -7.0157060623168945, "global_step": 182377, "epoch": 4342} {"train_loss": -7.208352565765381, "global_step": 182378, "epoch": 4342} {"train_loss": -7.123740196228027, "global_step": 182379, "epoch": 4342} {"train_loss": -7.078670978546143, "global_step": 182380, "epoch": 4342} {"train_loss": -7.153083324432373, "global_step": 182381, "epoch": 4342} {"train_loss": -7.099826335906982, "global_step": 182382, "epoch": 4342} {"train_loss": -7.089645862579346, "global_step": 182383, "epoch": 4342} {"train_loss": -7.157873153686523, "global_step": 182384, "epoch": 4342} {"train_loss": -7.087540626525879, "global_step": 182385, "epoch": 4342} {"train_loss": -7.2326555252075195, "global_step": 182386, "epoch": 4342} {"train_loss": -7.112401008605957, "global_step": 182387, "epoch": 4342} {"train_loss": -7.104755401611328, "global_step": 182388, "epoch": 4342} {"train_loss": -7.2163310050964355, "global_step": 182389, "epoch": 4342} {"train_loss": -7.0261945724487305, "global_step": 182390, "epoch": 4342} {"train_loss": -7.112767219543457, "global_step": 182391, "epoch": 4342} {"train_loss": -7.087012767791748, "global_step": 182392, "epoch": 4342} {"train_loss": -6.994300365447998, "global_step": 182393, "epoch": 4342} {"train_loss": -7.077325820922852, "global_step": 182394, "epoch": 4342} {"train_loss": -7.114466190338135, "global_step": 182395, "epoch": 4342} {"train_loss": -6.955539703369141, "global_step": 182396, "epoch": 4342} {"train_loss": -7.130228042602539, "global_step": 182397, "epoch": 4342} {"train_loss": -7.1124958992004395, "global_step": 182398, "epoch": 4342} {"train_loss": -7.126526832580566, "global_step": 182399, "epoch": 4342} {"train_loss": -7.082432746887207, "global_step": 182400, "epoch": 4342} {"train_loss": -7.056878089904785, "global_step": 182401, "epoch": 4342} {"train_loss": -6.904499053955078, "global_step": 182402, "epoch": 4342} {"train_loss": -7.111675262451172, "global_step": 182403, "epoch": 4342} {"train_loss": -6.9974846839904785, "global_step": 182404, "epoch": 4342} {"train_loss": -7.097728036698841, "global_step": 182405, "epoch": 4342, "val_loss": 69222.984375} {"train_loss": -6.9492902755737305, "global_step": 182406, "epoch": 4343} {"train_loss": -7.139017581939697, "global_step": 182407, "epoch": 4343} {"train_loss": -7.140944480895996, "global_step": 182408, "epoch": 4343} {"train_loss": -7.189236640930176, "global_step": 182409, "epoch": 4343} {"train_loss": -7.022703170776367, "global_step": 182410, "epoch": 4343} {"train_loss": -7.05637788772583, "global_step": 182411, "epoch": 4343} {"train_loss": -7.009626388549805, "global_step": 182412, "epoch": 4343} {"train_loss": -7.08377742767334, "global_step": 182413, "epoch": 4343} {"train_loss": -7.164340019226074, "global_step": 182414, "epoch": 4343} {"train_loss": -7.048131942749023, "global_step": 182415, "epoch": 4343} {"train_loss": -6.974881172180176, "global_step": 182416, "epoch": 4343} {"train_loss": -7.105934143066406, "global_step": 182417, "epoch": 4343} {"train_loss": -7.087660312652588, "global_step": 182418, "epoch": 4343} {"train_loss": -7.124819755554199, "global_step": 182419, "epoch": 4343} {"train_loss": -7.185394763946533, "global_step": 182420, "epoch": 4343} {"train_loss": -7.282559871673584, "global_step": 182421, "epoch": 4343} {"train_loss": -7.0869903564453125, "global_step": 182422, "epoch": 4343} {"train_loss": -7.1090240478515625, "global_step": 182423, "epoch": 4343} {"train_loss": -7.057944297790527, "global_step": 182424, "epoch": 4343} {"train_loss": -7.152868747711182, "global_step": 182425, "epoch": 4343} {"train_loss": -7.021027565002441, "global_step": 182426, "epoch": 4343} {"train_loss": -7.054433822631836, "global_step": 182427, "epoch": 4343} {"train_loss": -7.067556381225586, "global_step": 182428, "epoch": 4343} {"train_loss": -6.982536315917969, "global_step": 182429, "epoch": 4343} {"train_loss": -7.124100208282471, "global_step": 182430, "epoch": 4343} {"train_loss": -7.055379390716553, "global_step": 182431, "epoch": 4343} {"train_loss": -7.118104934692383, "global_step": 182432, "epoch": 4343} {"train_loss": -7.098420143127441, "global_step": 182433, "epoch": 4343} {"train_loss": -7.123600959777832, "global_step": 182434, "epoch": 4343} {"train_loss": -7.134703636169434, "global_step": 182435, "epoch": 4343} {"train_loss": -7.2375946044921875, "global_step": 182436, "epoch": 4343} {"train_loss": -7.07936429977417, "global_step": 182437, "epoch": 4343} {"train_loss": -7.099682331085205, "global_step": 182438, "epoch": 4343} {"train_loss": -7.148482799530029, "global_step": 182439, "epoch": 4343} {"train_loss": -7.186148643493652, "global_step": 182440, "epoch": 4343} {"train_loss": -7.032027244567871, "global_step": 182441, "epoch": 4343} {"train_loss": -7.072648048400879, "global_step": 182442, "epoch": 4343} {"train_loss": -7.0838823318481445, "global_step": 182443, "epoch": 4343} {"train_loss": -7.12385368347168, "global_step": 182444, "epoch": 4343} {"train_loss": -7.0967206954956055, "global_step": 182445, "epoch": 4343} {"train_loss": -7.143118858337402, "global_step": 182446, "epoch": 4343} {"train_loss": -7.097677798498244, "global_step": 182447, "epoch": 4343, "val_loss": 69330.7578125} {"train_loss": -7.174123764038086, "global_step": 182448, "epoch": 4344} {"train_loss": -7.188494682312012, "global_step": 182449, "epoch": 4344} {"train_loss": -7.255168914794922, "global_step": 182450, "epoch": 4344} {"train_loss": -7.200867652893066, "global_step": 182451, "epoch": 4344} {"train_loss": -7.294422149658203, "global_step": 182452, "epoch": 4344} {"train_loss": -7.119778156280518, "global_step": 182453, "epoch": 4344} {"train_loss": -7.150012493133545, "global_step": 182454, "epoch": 4344} {"train_loss": -7.174178600311279, "global_step": 182455, "epoch": 4344} {"train_loss": -7.063236236572266, "global_step": 182456, "epoch": 4344} {"train_loss": -7.151836395263672, "global_step": 182457, "epoch": 4344} {"train_loss": -7.081836223602295, "global_step": 182458, "epoch": 4344} {"train_loss": -7.176597595214844, "global_step": 182459, "epoch": 4344} {"train_loss": -7.076436996459961, "global_step": 182460, "epoch": 4344} {"train_loss": -7.153042793273926, "global_step": 182461, "epoch": 4344} {"train_loss": -7.088024616241455, "global_step": 182462, "epoch": 4344} {"train_loss": -7.106720924377441, "global_step": 182463, "epoch": 4344} {"train_loss": -7.0358686447143555, "global_step": 182464, "epoch": 4344} {"train_loss": -7.075352668762207, "global_step": 182465, "epoch": 4344} {"train_loss": -7.159461975097656, "global_step": 182466, "epoch": 4344} {"train_loss": -7.195136070251465, "global_step": 182467, "epoch": 4344} {"train_loss": -7.270490646362305, "global_step": 182468, "epoch": 4344} {"train_loss": -7.119414329528809, "global_step": 182469, "epoch": 4344} {"train_loss": -7.193975448608398, "global_step": 182470, "epoch": 4344} {"train_loss": -7.210762977600098, "global_step": 182471, "epoch": 4344} {"train_loss": -7.072246551513672, "global_step": 182472, "epoch": 4344} {"train_loss": -7.129805088043213, "global_step": 182473, "epoch": 4344} {"train_loss": -7.163265228271484, "global_step": 182474, "epoch": 4344} {"train_loss": -7.053157806396484, "global_step": 182475, "epoch": 4344} {"train_loss": -7.230885028839111, "global_step": 182476, "epoch": 4344} {"train_loss": -7.247923374176025, "global_step": 182477, "epoch": 4344} {"train_loss": -7.1289753913879395, "global_step": 182478, "epoch": 4344} {"train_loss": -7.302859783172607, "global_step": 182479, "epoch": 4344} {"train_loss": -7.202944755554199, "global_step": 182480, "epoch": 4344} {"train_loss": -7.252140045166016, "global_step": 182481, "epoch": 4344} {"train_loss": -7.141088485717773, "global_step": 182482, "epoch": 4344} {"train_loss": -7.0393266677856445, "global_step": 182483, "epoch": 4344} {"train_loss": -7.173762321472168, "global_step": 182484, "epoch": 4344} {"train_loss": -7.197303771972656, "global_step": 182485, "epoch": 4344} {"train_loss": -7.1312408447265625, "global_step": 182486, "epoch": 4344} {"train_loss": -7.120261192321777, "global_step": 182487, "epoch": 4344} {"train_loss": -7.2137651443481445, "global_step": 182488, "epoch": 4344} {"train_loss": -7.160307793390183, "global_step": 182489, "epoch": 4344, "val_loss": 69413.390625} {"train_loss": -7.166651725769043, "global_step": 182490, "epoch": 4345} {"train_loss": -7.2430524826049805, "global_step": 182491, "epoch": 4345} {"train_loss": -7.190533638000488, "global_step": 182492, "epoch": 4345} {"train_loss": -7.138994216918945, "global_step": 182493, "epoch": 4345} {"train_loss": -7.145456314086914, "global_step": 182494, "epoch": 4345} {"train_loss": -7.20290470123291, "global_step": 182495, "epoch": 4345} {"train_loss": -7.029433250427246, "global_step": 182496, "epoch": 4345} {"train_loss": -7.082204341888428, "global_step": 182497, "epoch": 4345} {"train_loss": -7.135460376739502, "global_step": 182498, "epoch": 4345} {"train_loss": -6.959372520446777, "global_step": 182499, "epoch": 4345} {"train_loss": -6.997318744659424, "global_step": 182500, "epoch": 4345} {"train_loss": -7.156349182128906, "global_step": 182501, "epoch": 4345} {"train_loss": -6.983811855316162, "global_step": 182502, "epoch": 4345} {"train_loss": -7.004886627197266, "global_step": 182503, "epoch": 4345} {"train_loss": -7.158377647399902, "global_step": 182504, "epoch": 4345} {"train_loss": -7.091749668121338, "global_step": 182505, "epoch": 4345} {"train_loss": -7.086833953857422, "global_step": 182506, "epoch": 4345} {"train_loss": -7.094934463500977, "global_step": 182507, "epoch": 4345} {"train_loss": -7.135900974273682, "global_step": 182508, "epoch": 4345} {"train_loss": -7.037066459655762, "global_step": 182509, "epoch": 4345} {"train_loss": -7.066150665283203, "global_step": 182510, "epoch": 4345} {"train_loss": -7.075685977935791, "global_step": 182511, "epoch": 4345} {"train_loss": -7.1192450523376465, "global_step": 182512, "epoch": 4345} {"train_loss": -7.190860748291016, "global_step": 182513, "epoch": 4345} {"train_loss": -7.095314979553223, "global_step": 182514, "epoch": 4345} {"train_loss": -7.064715385437012, "global_step": 182515, "epoch": 4345} {"train_loss": -7.0611748695373535, "global_step": 182516, "epoch": 4345} {"train_loss": -7.104948043823242, "global_step": 182517, "epoch": 4345} {"train_loss": -7.0938005447387695, "global_step": 182518, "epoch": 4345} {"train_loss": -7.06298303604126, "global_step": 182519, "epoch": 4345} {"train_loss": -7.13255500793457, "global_step": 182520, "epoch": 4345} {"train_loss": -7.153552055358887, "global_step": 182521, "epoch": 4345} {"train_loss": -7.153425216674805, "global_step": 182522, "epoch": 4345} {"train_loss": -7.0120649337768555, "global_step": 182523, "epoch": 4345} {"train_loss": -7.147449493408203, "global_step": 182524, "epoch": 4345} {"train_loss": -7.012968063354492, "global_step": 182525, "epoch": 4345} {"train_loss": -7.047492980957031, "global_step": 182526, "epoch": 4345} {"train_loss": -7.144726276397705, "global_step": 182527, "epoch": 4345} {"train_loss": -7.1056718826293945, "global_step": 182528, "epoch": 4345} {"train_loss": -7.083315849304199, "global_step": 182529, "epoch": 4345} {"train_loss": -6.946549415588379, "global_step": 182530, "epoch": 4345} {"train_loss": -7.095215366000221, "global_step": 182531, "epoch": 4345, "val_loss": 69586.390625} {"train_loss": -7.126284599304199, "global_step": 182532, "epoch": 4346} {"train_loss": -7.134618759155273, "global_step": 182533, "epoch": 4346} {"train_loss": -6.985218048095703, "global_step": 182534, "epoch": 4346} {"train_loss": -7.078151226043701, "global_step": 182535, "epoch": 4346} {"train_loss": -7.077014446258545, "global_step": 182536, "epoch": 4346} {"train_loss": -7.04417610168457, "global_step": 182537, "epoch": 4346} {"train_loss": -7.152373313903809, "global_step": 182538, "epoch": 4346} {"train_loss": -7.13504695892334, "global_step": 182539, "epoch": 4346} {"train_loss": -7.07569694519043, "global_step": 182540, "epoch": 4346} {"train_loss": -7.08658504486084, "global_step": 182541, "epoch": 4346} {"train_loss": -7.145669937133789, "global_step": 182542, "epoch": 4346} {"train_loss": -7.034672737121582, "global_step": 182543, "epoch": 4346} {"train_loss": -7.100434303283691, "global_step": 182544, "epoch": 4346} {"train_loss": -7.142989158630371, "global_step": 182545, "epoch": 4346} {"train_loss": -7.269490718841553, "global_step": 182546, "epoch": 4346} {"train_loss": -7.014216423034668, "global_step": 182547, "epoch": 4346} {"train_loss": -7.121313095092773, "global_step": 182548, "epoch": 4346} {"train_loss": -7.02669095993042, "global_step": 182549, "epoch": 4346} {"train_loss": -7.0711236000061035, "global_step": 182550, "epoch": 4346} {"train_loss": -7.030097961425781, "global_step": 182551, "epoch": 4346} {"train_loss": -7.046505928039551, "global_step": 182552, "epoch": 4346} {"train_loss": -6.988582611083984, "global_step": 182553, "epoch": 4346} {"train_loss": -7.084001541137695, "global_step": 182554, "epoch": 4346} {"train_loss": -7.064924716949463, "global_step": 182555, "epoch": 4346} {"train_loss": -6.962502479553223, "global_step": 182556, "epoch": 4346} {"train_loss": -7.070998191833496, "global_step": 182557, "epoch": 4346} {"train_loss": -6.974147319793701, "global_step": 182558, "epoch": 4346} {"train_loss": -7.221671104431152, "global_step": 182559, "epoch": 4346} {"train_loss": -7.107852458953857, "global_step": 182560, "epoch": 4346} {"train_loss": -7.038928031921387, "global_step": 182561, "epoch": 4346} {"train_loss": -7.184556007385254, "global_step": 182562, "epoch": 4346} {"train_loss": -7.11612606048584, "global_step": 182563, "epoch": 4346} {"train_loss": -7.105894088745117, "global_step": 182564, "epoch": 4346} {"train_loss": -7.114458084106445, "global_step": 182565, "epoch": 4346} {"train_loss": -7.160280704498291, "global_step": 182566, "epoch": 4346} {"train_loss": -7.026866912841797, "global_step": 182567, "epoch": 4346} {"train_loss": -6.992912292480469, "global_step": 182568, "epoch": 4346} {"train_loss": -6.937739849090576, "global_step": 182569, "epoch": 4346} {"train_loss": -6.951018333435059, "global_step": 182570, "epoch": 4346} {"train_loss": -7.0630106925964355, "global_step": 182571, "epoch": 4346} {"train_loss": -6.9051032066345215, "global_step": 182572, "epoch": 4346} {"train_loss": -7.071469159353347, "global_step": 182573, "epoch": 4346, "val_loss": 69566.6640625} {"train_loss": -7.023421287536621, "global_step": 182574, "epoch": 4347} {"train_loss": -6.917576789855957, "global_step": 182575, "epoch": 4347} {"train_loss": -7.093179702758789, "global_step": 182576, "epoch": 4347} {"train_loss": -7.024222373962402, "global_step": 182577, "epoch": 4347} {"train_loss": -7.017947196960449, "global_step": 182578, "epoch": 4347} {"train_loss": -7.083647727966309, "global_step": 182579, "epoch": 4347} {"train_loss": -6.945582866668701, "global_step": 182580, "epoch": 4347} {"train_loss": -7.0368170738220215, "global_step": 182581, "epoch": 4347} {"train_loss": -7.024374961853027, "global_step": 182582, "epoch": 4347} {"train_loss": -7.054718017578125, "global_step": 182583, "epoch": 4347} {"train_loss": -7.058798789978027, "global_step": 182584, "epoch": 4347} {"train_loss": -7.084837913513184, "global_step": 182585, "epoch": 4347} {"train_loss": -7.136733055114746, "global_step": 182586, "epoch": 4347} {"train_loss": -7.15059757232666, "global_step": 182587, "epoch": 4347} {"train_loss": -7.028221130371094, "global_step": 182588, "epoch": 4347} {"train_loss": -7.192559719085693, "global_step": 182589, "epoch": 4347} {"train_loss": -7.058073043823242, "global_step": 182590, "epoch": 4347} {"train_loss": -7.124085426330566, "global_step": 182591, "epoch": 4347} {"train_loss": -7.02128267288208, "global_step": 182592, "epoch": 4347} {"train_loss": -6.9933013916015625, "global_step": 182593, "epoch": 4347} {"train_loss": -7.179437637329102, "global_step": 182594, "epoch": 4347} {"train_loss": -7.097856044769287, "global_step": 182595, "epoch": 4347} {"train_loss": -7.080425262451172, "global_step": 182596, "epoch": 4347} {"train_loss": -7.149295806884766, "global_step": 182597, "epoch": 4347} {"train_loss": -7.081601142883301, "global_step": 182598, "epoch": 4347} {"train_loss": -7.127817630767822, "global_step": 182599, "epoch": 4347} {"train_loss": -7.021361351013184, "global_step": 182600, "epoch": 4347} {"train_loss": -7.0728912353515625, "global_step": 182601, "epoch": 4347} {"train_loss": -7.213024139404297, "global_step": 182602, "epoch": 4347} {"train_loss": -7.029778480529785, "global_step": 182603, "epoch": 4347} {"train_loss": -7.257326602935791, "global_step": 182604, "epoch": 4347} {"train_loss": -7.149963855743408, "global_step": 182605, "epoch": 4347} {"train_loss": -7.12408447265625, "global_step": 182606, "epoch": 4347} {"train_loss": -7.168745040893555, "global_step": 182607, "epoch": 4347} {"train_loss": -7.103350639343262, "global_step": 182608, "epoch": 4347} {"train_loss": -7.135076999664307, "global_step": 182609, "epoch": 4347} {"train_loss": -7.146157264709473, "global_step": 182610, "epoch": 4347} {"train_loss": -7.175745010375977, "global_step": 182611, "epoch": 4347} {"train_loss": -7.2304887771606445, "global_step": 182612, "epoch": 4347} {"train_loss": -7.066420555114746, "global_step": 182613, "epoch": 4347} {"train_loss": -7.074100494384766, "global_step": 182614, "epoch": 4347} {"train_loss": -7.093691757747105, "global_step": 182615, "epoch": 4347, "val_loss": 69365.4140625} {"train_loss": -7.120185852050781, "global_step": 182616, "epoch": 4348} {"train_loss": -7.157238960266113, "global_step": 182617, "epoch": 4348} {"train_loss": -7.208569049835205, "global_step": 182618, "epoch": 4348} {"train_loss": -7.200384140014648, "global_step": 182619, "epoch": 4348} {"train_loss": -7.098085403442383, "global_step": 182620, "epoch": 4348} {"train_loss": -7.08695125579834, "global_step": 182621, "epoch": 4348} {"train_loss": -7.009127140045166, "global_step": 182622, "epoch": 4348} {"train_loss": -7.060868263244629, "global_step": 182623, "epoch": 4348} {"train_loss": -7.092108249664307, "global_step": 182624, "epoch": 4348} {"train_loss": -7.101352691650391, "global_step": 182625, "epoch": 4348} {"train_loss": -7.130223274230957, "global_step": 182626, "epoch": 4348} {"train_loss": -7.125336647033691, "global_step": 182627, "epoch": 4348} {"train_loss": -7.122591972351074, "global_step": 182628, "epoch": 4348} {"train_loss": -7.051054954528809, "global_step": 182629, "epoch": 4348} {"train_loss": -7.156965255737305, "global_step": 182630, "epoch": 4348} {"train_loss": -7.2672882080078125, "global_step": 182631, "epoch": 4348} {"train_loss": -7.066224098205566, "global_step": 182632, "epoch": 4348} {"train_loss": -7.134364128112793, "global_step": 182633, "epoch": 4348} {"train_loss": -7.102457523345947, "global_step": 182634, "epoch": 4348} {"train_loss": -6.983046531677246, "global_step": 182635, "epoch": 4348} {"train_loss": -7.0912885665893555, "global_step": 182636, "epoch": 4348} {"train_loss": -7.035574436187744, "global_step": 182637, "epoch": 4348} {"train_loss": -7.08829402923584, "global_step": 182638, "epoch": 4348} {"train_loss": -7.002625465393066, "global_step": 182639, "epoch": 4348} {"train_loss": -7.147408485412598, "global_step": 182640, "epoch": 4348} {"train_loss": -6.99346923828125, "global_step": 182641, "epoch": 4348} {"train_loss": -7.185905933380127, "global_step": 182642, "epoch": 4348} {"train_loss": -7.070496082305908, "global_step": 182643, "epoch": 4348} {"train_loss": -7.076327323913574, "global_step": 182644, "epoch": 4348} {"train_loss": -7.122916221618652, "global_step": 182645, "epoch": 4348} {"train_loss": -7.036208152770996, "global_step": 182646, "epoch": 4348} {"train_loss": -7.103874206542969, "global_step": 182647, "epoch": 4348} {"train_loss": -7.271502494812012, "global_step": 182648, "epoch": 4348} {"train_loss": -7.115999221801758, "global_step": 182649, "epoch": 4348} {"train_loss": -7.103518962860107, "global_step": 182650, "epoch": 4348} {"train_loss": -7.120471954345703, "global_step": 182651, "epoch": 4348} {"train_loss": -7.079385280609131, "global_step": 182652, "epoch": 4348} {"train_loss": -7.064183712005615, "global_step": 182653, "epoch": 4348} {"train_loss": -7.131056308746338, "global_step": 182654, "epoch": 4348} {"train_loss": -7.048697471618652, "global_step": 182655, "epoch": 4348} {"train_loss": -7.197314739227295, "global_step": 182656, "epoch": 4348} {"train_loss": -7.106420516967773, "global_step": 182657, "epoch": 4348, "val_loss": 69334.0625} {"train_loss": -7.15294075012207, "global_step": 182658, "epoch": 4349} {"train_loss": -7.150661945343018, "global_step": 182659, "epoch": 4349} {"train_loss": -7.087492942810059, "global_step": 182660, "epoch": 4349} {"train_loss": -7.150332450866699, "global_step": 182661, "epoch": 4349} {"train_loss": -7.177612781524658, "global_step": 182662, "epoch": 4349} {"train_loss": -7.150959014892578, "global_step": 182663, "epoch": 4349} {"train_loss": -7.128485679626465, "global_step": 182664, "epoch": 4349} {"train_loss": -7.143985748291016, "global_step": 182665, "epoch": 4349} {"train_loss": -7.151393890380859, "global_step": 182666, "epoch": 4349} {"train_loss": -7.194661617279053, "global_step": 182667, "epoch": 4349} {"train_loss": -7.095213890075684, "global_step": 182668, "epoch": 4349} {"train_loss": -7.238039970397949, "global_step": 182669, "epoch": 4349} {"train_loss": -7.022403717041016, "global_step": 182670, "epoch": 4349} {"train_loss": -7.142319679260254, "global_step": 182671, "epoch": 4349} {"train_loss": -7.138962745666504, "global_step": 182672, "epoch": 4349} {"train_loss": -7.148615837097168, "global_step": 182673, "epoch": 4349} {"train_loss": -7.165839195251465, "global_step": 182674, "epoch": 4349} {"train_loss": -7.127784252166748, "global_step": 182675, "epoch": 4349} {"train_loss": -7.10599946975708, "global_step": 182676, "epoch": 4349} {"train_loss": -7.072545051574707, "global_step": 182677, "epoch": 4349} {"train_loss": -7.117173194885254, "global_step": 182678, "epoch": 4349} {"train_loss": -7.109576225280762, "global_step": 182679, "epoch": 4349} {"train_loss": -7.053295135498047, "global_step": 182680, "epoch": 4349} {"train_loss": -7.12259578704834, "global_step": 182681, "epoch": 4349} {"train_loss": -7.171092987060547, "global_step": 182682, "epoch": 4349} {"train_loss": -7.195821762084961, "global_step": 182683, "epoch": 4349} {"train_loss": -7.044250011444092, "global_step": 182684, "epoch": 4349} {"train_loss": -7.126104354858398, "global_step": 182685, "epoch": 4349} {"train_loss": -7.211228847503662, "global_step": 182686, "epoch": 4349} {"train_loss": -7.1604695320129395, "global_step": 182687, "epoch": 4349} {"train_loss": -7.119341850280762, "global_step": 182688, "epoch": 4349} {"train_loss": -7.1577043533325195, "global_step": 182689, "epoch": 4349} {"train_loss": -7.057100772857666, "global_step": 182690, "epoch": 4349} {"train_loss": -7.1219258308410645, "global_step": 182691, "epoch": 4349} {"train_loss": -7.145230293273926, "global_step": 182692, "epoch": 4349} {"train_loss": -7.219132423400879, "global_step": 182693, "epoch": 4349} {"train_loss": -7.076915740966797, "global_step": 182694, "epoch": 4349} {"train_loss": -7.202193260192871, "global_step": 182695, "epoch": 4349} {"train_loss": -7.093646049499512, "global_step": 182696, "epoch": 4349} {"train_loss": -7.154752731323242, "global_step": 182697, "epoch": 4349} {"train_loss": -7.24367618560791, "global_step": 182698, "epoch": 4349} {"train_loss": -7.136725017002651, "global_step": 182699, "epoch": 4349, "val_loss": 69178.4921875} {"train_loss": -7.183614730834961, "global_step": 182700, "epoch": 4350} {"train_loss": -7.173312664031982, "global_step": 182701, "epoch": 4350} {"train_loss": -7.21074104309082, "global_step": 182702, "epoch": 4350} {"train_loss": -7.1484174728393555, "global_step": 182703, "epoch": 4350} {"train_loss": -7.1417717933654785, "global_step": 182704, "epoch": 4350} {"train_loss": -7.254768371582031, "global_step": 182705, "epoch": 4350} {"train_loss": -7.136277675628662, "global_step": 182706, "epoch": 4350} {"train_loss": -7.177188396453857, "global_step": 182707, "epoch": 4350} {"train_loss": -7.199517250061035, "global_step": 182708, "epoch": 4350} {"train_loss": -7.122420310974121, "global_step": 182709, "epoch": 4350} {"train_loss": -7.29863166809082, "global_step": 182710, "epoch": 4350} {"train_loss": -7.220181941986084, "global_step": 182711, "epoch": 4350} {"train_loss": -7.216345310211182, "global_step": 182712, "epoch": 4350} {"train_loss": -7.1397294998168945, "global_step": 182713, "epoch": 4350} {"train_loss": -7.1411638259887695, "global_step": 182714, "epoch": 4350} {"train_loss": -7.236967086791992, "global_step": 182715, "epoch": 4350} {"train_loss": -7.118775367736816, "global_step": 182716, "epoch": 4350} {"train_loss": -7.280317306518555, "global_step": 182717, "epoch": 4350} {"train_loss": -7.166158199310303, "global_step": 182718, "epoch": 4350} {"train_loss": -7.024370193481445, "global_step": 182719, "epoch": 4350} {"train_loss": -7.195483207702637, "global_step": 182720, "epoch": 4350} {"train_loss": -7.110528469085693, "global_step": 182721, "epoch": 4350} {"train_loss": -7.16080379486084, "global_step": 182722, "epoch": 4350} {"train_loss": -7.024295806884766, "global_step": 182723, "epoch": 4350} {"train_loss": -7.220090866088867, "global_step": 182724, "epoch": 4350} {"train_loss": -7.136288642883301, "global_step": 182725, "epoch": 4350} {"train_loss": -7.0030837059021, "global_step": 182726, "epoch": 4350} {"train_loss": -7.100404739379883, "global_step": 182727, "epoch": 4350} {"train_loss": -6.889135360717773, "global_step": 182728, "epoch": 4350} {"train_loss": -7.080836296081543, "global_step": 182729, "epoch": 4350} {"train_loss": -6.966142654418945, "global_step": 182730, "epoch": 4350} {"train_loss": -7.078094005584717, "global_step": 182731, "epoch": 4350} {"train_loss": -6.900958061218262, "global_step": 182732, "epoch": 4350} {"train_loss": -7.043493747711182, "global_step": 182733, "epoch": 4350} {"train_loss": -7.054906845092773, "global_step": 182734, "epoch": 4350} {"train_loss": -6.900114059448242, "global_step": 182735, "epoch": 4350} {"train_loss": -7.109283924102783, "global_step": 182736, "epoch": 4350} {"train_loss": -6.963913440704346, "global_step": 182737, "epoch": 4350} {"train_loss": -6.970237731933594, "global_step": 182738, "epoch": 4350} {"train_loss": -6.988637924194336, "global_step": 182739, "epoch": 4350} {"train_loss": -6.9747724533081055, "global_step": 182740, "epoch": 4350} {"train_loss": -7.108798583348592, "global_step": 182741, "epoch": 4350, "train/sim_max_reward_0": 0.19778712528170064, "train/sim_max_reward_1": 0.5027509298782845, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.3828674969940972, "train/sim_max_reward_4": 0.9390816816456681, "train/sim_max_reward_5": 0.9395997290254307, "test/sim_max_reward_4300000": 0.8994731209027789, "test/sim_max_reward_4300001": 0.5603803001112715, "test/sim_max_reward_4300002": 0.9073595944979403, "test/sim_max_reward_4300003": 0.9901898471666224, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 1.0, "test/sim_max_reward_4300007": 0.9023158386977433, "test/sim_max_reward_4300008": 0.9794020187817813, "test/sim_max_reward_4300009": 0.9589868988041893, "test/sim_max_reward_4300010": 0.9513372456727762, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.8971770112869893, "test/sim_max_reward_4300013": 0.40717079479741736, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.10326298073484784, "test/sim_max_reward_4300017": 0.8780722118961033, "test/sim_max_reward_4300018": 0.399774826995181, "test/sim_max_reward_4300019": 0.18610984464100386, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 1.0, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.9370065208653106, "test/sim_max_reward_4300024": 0.7157093887903542, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.9767189295769317, "test/sim_max_reward_4300027": 0.9214710065563638, "test/sim_max_reward_4300028": 0.9700827293564388, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.4535356296038744, "test/sim_max_reward_4300031": 0.22137200295599488, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.686134270850667, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.9971895403082067, "test/sim_max_reward_4300036": 0.2004138758690891, "test/sim_max_reward_4300037": 1.0, "test/sim_max_reward_4300038": 0.918628202924034, "test/sim_max_reward_4300039": 0.995581361232566, "test/sim_max_reward_4300040": 0.9782583376931905, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7241404390013383, "test/sim_max_reward_4300043": 0.1026097166705852, "test/sim_max_reward_4300044": 0.9938049930133038, "test/sim_max_reward_4300045": 0.18913873142700124, "test/sim_max_reward_4300046": 0.9511019891296932, "test/sim_max_reward_4300047": 0.1953623683181364, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.11206227936180889, "train/mean_score": 0.6603478271375302, "test/mean_score": 0.6655433790660163, "val_loss": 69634.7890625} {"train_loss": -7.0161333084106445, "global_step": 182742, "epoch": 4351} {"train_loss": -6.976641654968262, "global_step": 182743, "epoch": 4351} {"train_loss": -7.110034942626953, "global_step": 182744, "epoch": 4351} {"train_loss": -7.0165205001831055, "global_step": 182745, "epoch": 4351} {"train_loss": -7.093618392944336, "global_step": 182746, "epoch": 4351} {"train_loss": -7.132838249206543, "global_step": 182747, "epoch": 4351} {"train_loss": -7.167236328125, "global_step": 182748, "epoch": 4351} {"train_loss": -7.188122749328613, "global_step": 182749, "epoch": 4351} {"train_loss": -7.051488876342773, "global_step": 182750, "epoch": 4351} {"train_loss": -7.062483787536621, "global_step": 182751, "epoch": 4351} {"train_loss": -7.037850856781006, "global_step": 182752, "epoch": 4351} {"train_loss": -7.108699798583984, "global_step": 182753, "epoch": 4351} {"train_loss": -7.1616315841674805, "global_step": 182754, "epoch": 4351} {"train_loss": -7.187157154083252, "global_step": 182755, "epoch": 4351} {"train_loss": -7.143628120422363, "global_step": 182756, "epoch": 4351} {"train_loss": -7.107604026794434, "global_step": 182757, "epoch": 4351} {"train_loss": -7.14949369430542, "global_step": 182758, "epoch": 4351} {"train_loss": -7.072007656097412, "global_step": 182759, "epoch": 4351} {"train_loss": -7.175165176391602, "global_step": 182760, "epoch": 4351} {"train_loss": -7.185449600219727, "global_step": 182761, "epoch": 4351} {"train_loss": -7.175481796264648, "global_step": 182762, "epoch": 4351} {"train_loss": -7.156466960906982, "global_step": 182763, "epoch": 4351} {"train_loss": -7.227723598480225, "global_step": 182764, "epoch": 4351} {"train_loss": -7.225249290466309, "global_step": 182765, "epoch": 4351} {"train_loss": -7.167003154754639, "global_step": 182766, "epoch": 4351} {"train_loss": -7.339405536651611, "global_step": 182767, "epoch": 4351} {"train_loss": -7.101508140563965, "global_step": 182768, "epoch": 4351} {"train_loss": -7.100700855255127, "global_step": 182769, "epoch": 4351} {"train_loss": -7.153051376342773, "global_step": 182770, "epoch": 4351} {"train_loss": -7.2898054122924805, "global_step": 182771, "epoch": 4351} {"train_loss": -7.120988368988037, "global_step": 182772, "epoch": 4351} {"train_loss": -7.1709418296813965, "global_step": 182773, "epoch": 4351} {"train_loss": -7.129697799682617, "global_step": 182774, "epoch": 4351} {"train_loss": -7.220853805541992, "global_step": 182775, "epoch": 4351} {"train_loss": -7.127665042877197, "global_step": 182776, "epoch": 4351} {"train_loss": -7.096177577972412, "global_step": 182777, "epoch": 4351} {"train_loss": -7.219397068023682, "global_step": 182778, "epoch": 4351} {"train_loss": -7.17026948928833, "global_step": 182779, "epoch": 4351} {"train_loss": -7.2019572257995605, "global_step": 182780, "epoch": 4351} {"train_loss": -7.161896705627441, "global_step": 182781, "epoch": 4351} {"train_loss": -7.2054338455200195, "global_step": 182782, "epoch": 4351} {"train_loss": -7.146086261385963, "global_step": 182783, "epoch": 4351, "val_loss": 69322.5078125} {"train_loss": -7.198695182800293, "global_step": 182784, "epoch": 4352} {"train_loss": -7.233522415161133, "global_step": 182785, "epoch": 4352} {"train_loss": -7.22249174118042, "global_step": 182786, "epoch": 4352} {"train_loss": -7.207495212554932, "global_step": 182787, "epoch": 4352} {"train_loss": -7.110167503356934, "global_step": 182788, "epoch": 4352} {"train_loss": -7.2314629554748535, "global_step": 182789, "epoch": 4352} {"train_loss": -7.149291038513184, "global_step": 182790, "epoch": 4352} {"train_loss": -7.144259929656982, "global_step": 182791, "epoch": 4352} {"train_loss": -7.1281843185424805, "global_step": 182792, "epoch": 4352} {"train_loss": -7.1801252365112305, "global_step": 182793, "epoch": 4352} {"train_loss": -7.111301422119141, "global_step": 182794, "epoch": 4352} {"train_loss": -7.073856353759766, "global_step": 182795, "epoch": 4352} {"train_loss": -6.978641033172607, "global_step": 182796, "epoch": 4352} {"train_loss": -7.119365692138672, "global_step": 182797, "epoch": 4352} {"train_loss": -7.136045455932617, "global_step": 182798, "epoch": 4352} {"train_loss": -6.990487098693848, "global_step": 182799, "epoch": 4352} {"train_loss": -7.216296672821045, "global_step": 182800, "epoch": 4352} {"train_loss": -6.982722759246826, "global_step": 182801, "epoch": 4352} {"train_loss": -7.085813045501709, "global_step": 182802, "epoch": 4352} {"train_loss": -7.170382499694824, "global_step": 182803, "epoch": 4352} {"train_loss": -7.039567947387695, "global_step": 182804, "epoch": 4352} {"train_loss": -7.193912029266357, "global_step": 182805, "epoch": 4352} {"train_loss": -7.04437255859375, "global_step": 182806, "epoch": 4352} {"train_loss": -7.136295318603516, "global_step": 182807, "epoch": 4352} {"train_loss": -7.041965484619141, "global_step": 182808, "epoch": 4352} {"train_loss": -7.002387046813965, "global_step": 182809, "epoch": 4352} {"train_loss": -7.22918176651001, "global_step": 182810, "epoch": 4352} {"train_loss": -7.110294342041016, "global_step": 182811, "epoch": 4352} {"train_loss": -7.193660259246826, "global_step": 182812, "epoch": 4352} {"train_loss": -7.2035627365112305, "global_step": 182813, "epoch": 4352} {"train_loss": -7.061798095703125, "global_step": 182814, "epoch": 4352} {"train_loss": -7.12359619140625, "global_step": 182815, "epoch": 4352} {"train_loss": -7.05964994430542, "global_step": 182816, "epoch": 4352} {"train_loss": -7.102411270141602, "global_step": 182817, "epoch": 4352} {"train_loss": -7.12164306640625, "global_step": 182818, "epoch": 4352} {"train_loss": -7.010626792907715, "global_step": 182819, "epoch": 4352} {"train_loss": -7.063706398010254, "global_step": 182820, "epoch": 4352} {"train_loss": -7.034348011016846, "global_step": 182821, "epoch": 4352} {"train_loss": -7.098258018493652, "global_step": 182822, "epoch": 4352} {"train_loss": -7.029667854309082, "global_step": 182823, "epoch": 4352} {"train_loss": -7.095579147338867, "global_step": 182824, "epoch": 4352} {"train_loss": -7.114931787763323, "global_step": 182825, "epoch": 4352, "val_loss": 69338.390625} {"train_loss": -7.106040000915527, "global_step": 182826, "epoch": 4353} {"train_loss": -7.085551738739014, "global_step": 182827, "epoch": 4353} {"train_loss": -7.122393608093262, "global_step": 182828, "epoch": 4353} {"train_loss": -7.102877616882324, "global_step": 182829, "epoch": 4353} {"train_loss": -7.113591194152832, "global_step": 182830, "epoch": 4353} {"train_loss": -7.196169853210449, "global_step": 182831, "epoch": 4353} {"train_loss": -7.146737575531006, "global_step": 182832, "epoch": 4353} {"train_loss": -7.118334770202637, "global_step": 182833, "epoch": 4353} {"train_loss": -7.183135986328125, "global_step": 182834, "epoch": 4353} {"train_loss": -7.074692726135254, "global_step": 182835, "epoch": 4353} {"train_loss": -7.090900421142578, "global_step": 182836, "epoch": 4353} {"train_loss": -7.168219566345215, "global_step": 182837, "epoch": 4353} {"train_loss": -7.086719512939453, "global_step": 182838, "epoch": 4353} {"train_loss": -7.084648132324219, "global_step": 182839, "epoch": 4353} {"train_loss": -7.136958122253418, "global_step": 182840, "epoch": 4353} {"train_loss": -7.035983085632324, "global_step": 182841, "epoch": 4353} {"train_loss": -7.136627674102783, "global_step": 182842, "epoch": 4353} {"train_loss": -7.200346946716309, "global_step": 182843, "epoch": 4353} {"train_loss": -7.144765853881836, "global_step": 182844, "epoch": 4353} {"train_loss": -7.111252784729004, "global_step": 182845, "epoch": 4353} {"train_loss": -7.243778705596924, "global_step": 182846, "epoch": 4353} {"train_loss": -7.131011962890625, "global_step": 182847, "epoch": 4353} {"train_loss": -7.132532119750977, "global_step": 182848, "epoch": 4353} {"train_loss": -7.203617572784424, "global_step": 182849, "epoch": 4353} {"train_loss": -7.092437267303467, "global_step": 182850, "epoch": 4353} {"train_loss": -7.0894269943237305, "global_step": 182851, "epoch": 4353} {"train_loss": -7.052011489868164, "global_step": 182852, "epoch": 4353} {"train_loss": -6.9542646408081055, "global_step": 182853, "epoch": 4353} {"train_loss": -7.230319976806641, "global_step": 182854, "epoch": 4353} {"train_loss": -6.96246862411499, "global_step": 182855, "epoch": 4353} {"train_loss": -7.098167896270752, "global_step": 182856, "epoch": 4353} {"train_loss": -7.1902031898498535, "global_step": 182857, "epoch": 4353} {"train_loss": -7.057828903198242, "global_step": 182858, "epoch": 4353} {"train_loss": -7.075830936431885, "global_step": 182859, "epoch": 4353} {"train_loss": -7.100876808166504, "global_step": 182860, "epoch": 4353} {"train_loss": -7.145595550537109, "global_step": 182861, "epoch": 4353} {"train_loss": -7.112236022949219, "global_step": 182862, "epoch": 4353} {"train_loss": -7.078658103942871, "global_step": 182863, "epoch": 4353} {"train_loss": -7.158716678619385, "global_step": 182864, "epoch": 4353} {"train_loss": -7.046822547912598, "global_step": 182865, "epoch": 4353} {"train_loss": -7.077004432678223, "global_step": 182866, "epoch": 4353} {"train_loss": -7.113482997530983, "global_step": 182867, "epoch": 4353, "val_loss": 69385.3359375} {"train_loss": -7.207590103149414, "global_step": 182868, "epoch": 4354} {"train_loss": -7.109160423278809, "global_step": 182869, "epoch": 4354} {"train_loss": -7.191507339477539, "global_step": 182870, "epoch": 4354} {"train_loss": -7.191756248474121, "global_step": 182871, "epoch": 4354} {"train_loss": -7.137827396392822, "global_step": 182872, "epoch": 4354} {"train_loss": -7.250580310821533, "global_step": 182873, "epoch": 4354} {"train_loss": -7.268099784851074, "global_step": 182874, "epoch": 4354} {"train_loss": -7.294273853302002, "global_step": 182875, "epoch": 4354} {"train_loss": -7.175586223602295, "global_step": 182876, "epoch": 4354} {"train_loss": -7.185441970825195, "global_step": 182877, "epoch": 4354} {"train_loss": -7.217197418212891, "global_step": 182878, "epoch": 4354} {"train_loss": -7.143499374389648, "global_step": 182879, "epoch": 4354} {"train_loss": -7.232445240020752, "global_step": 182880, "epoch": 4354} {"train_loss": -7.118934154510498, "global_step": 182881, "epoch": 4354} {"train_loss": -7.283330917358398, "global_step": 182882, "epoch": 4354} {"train_loss": -7.188236713409424, "global_step": 182883, "epoch": 4354} {"train_loss": -7.11366081237793, "global_step": 182884, "epoch": 4354} {"train_loss": -7.271573066711426, "global_step": 182885, "epoch": 4354} {"train_loss": -7.10255241394043, "global_step": 182886, "epoch": 4354} {"train_loss": -7.1308441162109375, "global_step": 182887, "epoch": 4354} {"train_loss": -7.133268356323242, "global_step": 182888, "epoch": 4354} {"train_loss": -7.065752983093262, "global_step": 182889, "epoch": 4354} {"train_loss": -7.1454572677612305, "global_step": 182890, "epoch": 4354} {"train_loss": -7.129206657409668, "global_step": 182891, "epoch": 4354} {"train_loss": -7.101927757263184, "global_step": 182892, "epoch": 4354} {"train_loss": -7.163630962371826, "global_step": 182893, "epoch": 4354} {"train_loss": -7.191649436950684, "global_step": 182894, "epoch": 4354} {"train_loss": -7.142024517059326, "global_step": 182895, "epoch": 4354} {"train_loss": -7.18284797668457, "global_step": 182896, "epoch": 4354} {"train_loss": -7.191851615905762, "global_step": 182897, "epoch": 4354} {"train_loss": -7.265275001525879, "global_step": 182898, "epoch": 4354} {"train_loss": -7.278055667877197, "global_step": 182899, "epoch": 4354} {"train_loss": -7.287831783294678, "global_step": 182900, "epoch": 4354} {"train_loss": -7.29239559173584, "global_step": 182901, "epoch": 4354} {"train_loss": -7.227502822875977, "global_step": 182902, "epoch": 4354} {"train_loss": -7.254250526428223, "global_step": 182903, "epoch": 4354} {"train_loss": -7.299250602722168, "global_step": 182904, "epoch": 4354} {"train_loss": -7.265814781188965, "global_step": 182905, "epoch": 4354} {"train_loss": -7.127264022827148, "global_step": 182906, "epoch": 4354} {"train_loss": -7.149550437927246, "global_step": 182907, "epoch": 4354} {"train_loss": -7.226583480834961, "global_step": 182908, "epoch": 4354} {"train_loss": -7.19545977456229, "global_step": 182909, "epoch": 4354, "val_loss": 69189.8203125} {"train_loss": -7.201261520385742, "global_step": 182910, "epoch": 4355} {"train_loss": -7.265185356140137, "global_step": 182911, "epoch": 4355} {"train_loss": -7.324869155883789, "global_step": 182912, "epoch": 4355} {"train_loss": -7.217336177825928, "global_step": 182913, "epoch": 4355} {"train_loss": -7.201294898986816, "global_step": 182914, "epoch": 4355} {"train_loss": -7.219248294830322, "global_step": 182915, "epoch": 4355} {"train_loss": -7.203203201293945, "global_step": 182916, "epoch": 4355} {"train_loss": -7.157127857208252, "global_step": 182917, "epoch": 4355} {"train_loss": -7.211427688598633, "global_step": 182918, "epoch": 4355} {"train_loss": -7.086350917816162, "global_step": 182919, "epoch": 4355} {"train_loss": -7.155069351196289, "global_step": 182920, "epoch": 4355} {"train_loss": -7.156754493713379, "global_step": 182921, "epoch": 4355} {"train_loss": -7.2195210456848145, "global_step": 182922, "epoch": 4355} {"train_loss": -7.2305827140808105, "global_step": 182923, "epoch": 4355} {"train_loss": -6.994030952453613, "global_step": 182924, "epoch": 4355} {"train_loss": -7.1969170570373535, "global_step": 182925, "epoch": 4355} {"train_loss": -7.086014270782471, "global_step": 182926, "epoch": 4355} {"train_loss": -7.129532814025879, "global_step": 182927, "epoch": 4355} {"train_loss": -7.223066329956055, "global_step": 182928, "epoch": 4355} {"train_loss": -7.201961040496826, "global_step": 182929, "epoch": 4355} {"train_loss": -7.180461883544922, "global_step": 182930, "epoch": 4355} {"train_loss": -7.067502498626709, "global_step": 182931, "epoch": 4355} {"train_loss": -7.177265167236328, "global_step": 182932, "epoch": 4355} {"train_loss": -7.0969085693359375, "global_step": 182933, "epoch": 4355} {"train_loss": -7.07363224029541, "global_step": 182934, "epoch": 4355} {"train_loss": -7.043554306030273, "global_step": 182935, "epoch": 4355} {"train_loss": -7.168745994567871, "global_step": 182936, "epoch": 4355} {"train_loss": -7.057216167449951, "global_step": 182937, "epoch": 4355} {"train_loss": -7.262906551361084, "global_step": 182938, "epoch": 4355} {"train_loss": -7.148408889770508, "global_step": 182939, "epoch": 4355} {"train_loss": -7.100830554962158, "global_step": 182940, "epoch": 4355} {"train_loss": -7.080460071563721, "global_step": 182941, "epoch": 4355} {"train_loss": -7.12221622467041, "global_step": 182942, "epoch": 4355} {"train_loss": -6.99462366104126, "global_step": 182943, "epoch": 4355} {"train_loss": -7.100811958312988, "global_step": 182944, "epoch": 4355} {"train_loss": -7.105939865112305, "global_step": 182945, "epoch": 4355} {"train_loss": -7.0137152671813965, "global_step": 182946, "epoch": 4355} {"train_loss": -7.070671081542969, "global_step": 182947, "epoch": 4355} {"train_loss": -7.07476806640625, "global_step": 182948, "epoch": 4355} {"train_loss": -7.0761919021606445, "global_step": 182949, "epoch": 4355} {"train_loss": -7.111979961395264, "global_step": 182950, "epoch": 4355} {"train_loss": -7.139108237766084, "global_step": 182951, "epoch": 4355, "val_loss": 69297.625} {"train_loss": -7.032937526702881, "global_step": 182952, "epoch": 4356} {"train_loss": -6.950706481933594, "global_step": 182953, "epoch": 4356} {"train_loss": -7.01470947265625, "global_step": 182954, "epoch": 4356} {"train_loss": -7.0585808753967285, "global_step": 182955, "epoch": 4356} {"train_loss": -6.860252380371094, "global_step": 182956, "epoch": 4356} {"train_loss": -7.045065879821777, "global_step": 182957, "epoch": 4356} {"train_loss": -6.942806720733643, "global_step": 182958, "epoch": 4356} {"train_loss": -7.13564395904541, "global_step": 182959, "epoch": 4356} {"train_loss": -7.01148796081543, "global_step": 182960, "epoch": 4356} {"train_loss": -7.003655910491943, "global_step": 182961, "epoch": 4356} {"train_loss": -7.068619251251221, "global_step": 182962, "epoch": 4356} {"train_loss": -7.121152877807617, "global_step": 182963, "epoch": 4356} {"train_loss": -6.954944610595703, "global_step": 182964, "epoch": 4356} {"train_loss": -7.013551712036133, "global_step": 182965, "epoch": 4356} {"train_loss": -7.104714393615723, "global_step": 182966, "epoch": 4356} {"train_loss": -7.079768180847168, "global_step": 182967, "epoch": 4356} {"train_loss": -7.10377836227417, "global_step": 182968, "epoch": 4356} {"train_loss": -7.251502513885498, "global_step": 182969, "epoch": 4356} {"train_loss": -7.0522356033325195, "global_step": 182970, "epoch": 4356} {"train_loss": -7.2292304039001465, "global_step": 182971, "epoch": 4356} {"train_loss": -7.105435848236084, "global_step": 182972, "epoch": 4356} {"train_loss": -7.171570301055908, "global_step": 182973, "epoch": 4356} {"train_loss": -7.094444751739502, "global_step": 182974, "epoch": 4356} {"train_loss": -7.182581424713135, "global_step": 182975, "epoch": 4356} {"train_loss": -6.990797996520996, "global_step": 182976, "epoch": 4356} {"train_loss": -7.148619651794434, "global_step": 182977, "epoch": 4356} {"train_loss": -7.003684043884277, "global_step": 182978, "epoch": 4356} {"train_loss": -7.061312198638916, "global_step": 182979, "epoch": 4356} {"train_loss": -7.182751655578613, "global_step": 182980, "epoch": 4356} {"train_loss": -7.094202518463135, "global_step": 182981, "epoch": 4356} {"train_loss": -7.067634582519531, "global_step": 182982, "epoch": 4356} {"train_loss": -7.075348854064941, "global_step": 182983, "epoch": 4356} {"train_loss": -7.123979568481445, "global_step": 182984, "epoch": 4356} {"train_loss": -6.977293491363525, "global_step": 182985, "epoch": 4356} {"train_loss": -7.042384147644043, "global_step": 182986, "epoch": 4356} {"train_loss": -6.987522602081299, "global_step": 182987, "epoch": 4356} {"train_loss": -6.986576557159424, "global_step": 182988, "epoch": 4356} {"train_loss": -7.076052665710449, "global_step": 182989, "epoch": 4356} {"train_loss": -7.030273914337158, "global_step": 182990, "epoch": 4356} {"train_loss": -7.03954553604126, "global_step": 182991, "epoch": 4356} {"train_loss": -7.1067399978637695, "global_step": 182992, "epoch": 4356} {"train_loss": -7.060415233884539, "global_step": 182993, "epoch": 4356, "val_loss": 69498.3359375} {"train_loss": -7.031085014343262, "global_step": 182994, "epoch": 4357} {"train_loss": -7.004183769226074, "global_step": 182995, "epoch": 4357} {"train_loss": -7.031492233276367, "global_step": 182996, "epoch": 4357} {"train_loss": -6.961577415466309, "global_step": 182997, "epoch": 4357} {"train_loss": -6.9092864990234375, "global_step": 182998, "epoch": 4357} {"train_loss": -7.041966438293457, "global_step": 182999, "epoch": 4357} {"train_loss": -6.965142726898193, "global_step": 183000, "epoch": 4357} {"train_loss": -7.037759780883789, "global_step": 183001, "epoch": 4357} {"train_loss": -6.986062526702881, "global_step": 183002, "epoch": 4357} {"train_loss": -7.061792373657227, "global_step": 183003, "epoch": 4357} {"train_loss": -7.039862155914307, "global_step": 183004, "epoch": 4357} {"train_loss": -7.02669620513916, "global_step": 183005, "epoch": 4357} {"train_loss": -7.019219398498535, "global_step": 183006, "epoch": 4357} {"train_loss": -7.008126258850098, "global_step": 183007, "epoch": 4357} {"train_loss": -6.964732646942139, "global_step": 183008, "epoch": 4357} {"train_loss": -6.986600875854492, "global_step": 183009, "epoch": 4357} {"train_loss": -7.125762939453125, "global_step": 183010, "epoch": 4357} {"train_loss": -6.894315242767334, "global_step": 183011, "epoch": 4357} {"train_loss": -7.090904235839844, "global_step": 183012, "epoch": 4357} {"train_loss": -7.074742317199707, "global_step": 183013, "epoch": 4357} {"train_loss": -6.874975681304932, "global_step": 183014, "epoch": 4357} {"train_loss": -6.952691555023193, "global_step": 183015, "epoch": 4357} {"train_loss": -7.062577247619629, "global_step": 183016, "epoch": 4357} {"train_loss": -7.034947395324707, "global_step": 183017, "epoch": 4357} {"train_loss": -7.023165702819824, "global_step": 183018, "epoch": 4357} {"train_loss": -7.057505130767822, "global_step": 183019, "epoch": 4357} {"train_loss": -7.057285308837891, "global_step": 183020, "epoch": 4357} {"train_loss": -7.017293930053711, "global_step": 183021, "epoch": 4357} {"train_loss": -6.995238780975342, "global_step": 183022, "epoch": 4357} {"train_loss": -6.991602897644043, "global_step": 183023, "epoch": 4357} {"train_loss": -7.123735427856445, "global_step": 183024, "epoch": 4357} {"train_loss": -7.086358547210693, "global_step": 183025, "epoch": 4357} {"train_loss": -7.175896167755127, "global_step": 183026, "epoch": 4357} {"train_loss": -7.223979473114014, "global_step": 183027, "epoch": 4357} {"train_loss": -7.303156852722168, "global_step": 183028, "epoch": 4357} {"train_loss": -7.2393927574157715, "global_step": 183029, "epoch": 4357} {"train_loss": -7.173198223114014, "global_step": 183030, "epoch": 4357} {"train_loss": -7.244656562805176, "global_step": 183031, "epoch": 4357} {"train_loss": -7.1273956298828125, "global_step": 183032, "epoch": 4357} {"train_loss": -7.064169883728027, "global_step": 183033, "epoch": 4357} {"train_loss": -7.139760971069336, "global_step": 183034, "epoch": 4357} {"train_loss": -7.0567077568599155, "global_step": 183035, "epoch": 4357, "val_loss": 69417.7734375} {"train_loss": -7.151264190673828, "global_step": 183036, "epoch": 4358} {"train_loss": -7.230859279632568, "global_step": 183037, "epoch": 4358} {"train_loss": -7.226346015930176, "global_step": 183038, "epoch": 4358} {"train_loss": -7.231202125549316, "global_step": 183039, "epoch": 4358} {"train_loss": -7.243744850158691, "global_step": 183040, "epoch": 4358} {"train_loss": -7.048205852508545, "global_step": 183041, "epoch": 4358} {"train_loss": -7.182450294494629, "global_step": 183042, "epoch": 4358} {"train_loss": -7.199371337890625, "global_step": 183043, "epoch": 4358} {"train_loss": -7.153173446655273, "global_step": 183044, "epoch": 4358} {"train_loss": -7.233989715576172, "global_step": 183045, "epoch": 4358} {"train_loss": -7.1013336181640625, "global_step": 183046, "epoch": 4358} {"train_loss": -7.2505292892456055, "global_step": 183047, "epoch": 4358} {"train_loss": -7.1851396560668945, "global_step": 183048, "epoch": 4358} {"train_loss": -7.198394775390625, "global_step": 183049, "epoch": 4358} {"train_loss": -7.2394304275512695, "global_step": 183050, "epoch": 4358} {"train_loss": -7.158051490783691, "global_step": 183051, "epoch": 4358} {"train_loss": -7.138350486755371, "global_step": 183052, "epoch": 4358} {"train_loss": -7.197607517242432, "global_step": 183053, "epoch": 4358} {"train_loss": -7.256592750549316, "global_step": 183054, "epoch": 4358} {"train_loss": -7.103000640869141, "global_step": 183055, "epoch": 4358} {"train_loss": -7.157155513763428, "global_step": 183056, "epoch": 4358} {"train_loss": -7.2192792892456055, "global_step": 183057, "epoch": 4358} {"train_loss": -7.161162376403809, "global_step": 183058, "epoch": 4358} {"train_loss": -7.1715803146362305, "global_step": 183059, "epoch": 4358} {"train_loss": -7.1915283203125, "global_step": 183060, "epoch": 4358} {"train_loss": -7.152792930603027, "global_step": 183061, "epoch": 4358} {"train_loss": -7.110797882080078, "global_step": 183062, "epoch": 4358} {"train_loss": -7.26169490814209, "global_step": 183063, "epoch": 4358} {"train_loss": -7.110982894897461, "global_step": 183064, "epoch": 4358} {"train_loss": -7.05288028717041, "global_step": 183065, "epoch": 4358} {"train_loss": -7.181699752807617, "global_step": 183066, "epoch": 4358} {"train_loss": -7.183112144470215, "global_step": 183067, "epoch": 4358} {"train_loss": -7.209727764129639, "global_step": 183068, "epoch": 4358} {"train_loss": -7.047133445739746, "global_step": 183069, "epoch": 4358} {"train_loss": -7.033304214477539, "global_step": 183070, "epoch": 4358} {"train_loss": -7.133726596832275, "global_step": 183071, "epoch": 4358} {"train_loss": -7.197616100311279, "global_step": 183072, "epoch": 4358} {"train_loss": -7.194460391998291, "global_step": 183073, "epoch": 4358} {"train_loss": -7.215268135070801, "global_step": 183074, "epoch": 4358} {"train_loss": -7.069107532501221, "global_step": 183075, "epoch": 4358} {"train_loss": -7.008890151977539, "global_step": 183076, "epoch": 4358} {"train_loss": -7.166679393677485, "global_step": 183077, "epoch": 4358, "val_loss": 69269.890625} {"train_loss": -6.8916096687316895, "global_step": 183078, "epoch": 4359} {"train_loss": -7.139275550842285, "global_step": 183079, "epoch": 4359} {"train_loss": -7.083656311035156, "global_step": 183080, "epoch": 4359} {"train_loss": -7.052419662475586, "global_step": 183081, "epoch": 4359} {"train_loss": -6.972282409667969, "global_step": 183082, "epoch": 4359} {"train_loss": -7.056167125701904, "global_step": 183083, "epoch": 4359} {"train_loss": -7.140739440917969, "global_step": 183084, "epoch": 4359} {"train_loss": -7.029349327087402, "global_step": 183085, "epoch": 4359} {"train_loss": -7.122486114501953, "global_step": 183086, "epoch": 4359} {"train_loss": -7.082901954650879, "global_step": 183087, "epoch": 4359} {"train_loss": -6.989280700683594, "global_step": 183088, "epoch": 4359} {"train_loss": -7.034505844116211, "global_step": 183089, "epoch": 4359} {"train_loss": -7.0759172439575195, "global_step": 183090, "epoch": 4359} {"train_loss": -7.0114946365356445, "global_step": 183091, "epoch": 4359} {"train_loss": -7.060519218444824, "global_step": 183092, "epoch": 4359} {"train_loss": -7.147463321685791, "global_step": 183093, "epoch": 4359} {"train_loss": -7.113740921020508, "global_step": 183094, "epoch": 4359} {"train_loss": -7.069112300872803, "global_step": 183095, "epoch": 4359} {"train_loss": -7.085773468017578, "global_step": 183096, "epoch": 4359} {"train_loss": -7.068979263305664, "global_step": 183097, "epoch": 4359} {"train_loss": -7.121993064880371, "global_step": 183098, "epoch": 4359} {"train_loss": -7.083772659301758, "global_step": 183099, "epoch": 4359} {"train_loss": -7.234813690185547, "global_step": 183100, "epoch": 4359} {"train_loss": -7.168106555938721, "global_step": 183101, "epoch": 4359} {"train_loss": -7.118167877197266, "global_step": 183102, "epoch": 4359} {"train_loss": -7.104761123657227, "global_step": 183103, "epoch": 4359} {"train_loss": -7.1840009689331055, "global_step": 183104, "epoch": 4359} {"train_loss": -7.224433898925781, "global_step": 183105, "epoch": 4359} {"train_loss": -7.145347595214844, "global_step": 183106, "epoch": 4359} {"train_loss": -7.121697902679443, "global_step": 183107, "epoch": 4359} {"train_loss": -6.970582485198975, "global_step": 183108, "epoch": 4359} {"train_loss": -7.026960372924805, "global_step": 183109, "epoch": 4359} {"train_loss": -7.073326587677002, "global_step": 183110, "epoch": 4359} {"train_loss": -6.983364105224609, "global_step": 183111, "epoch": 4359} {"train_loss": -7.131435871124268, "global_step": 183112, "epoch": 4359} {"train_loss": -7.086786270141602, "global_step": 183113, "epoch": 4359} {"train_loss": -6.964086055755615, "global_step": 183114, "epoch": 4359} {"train_loss": -7.119155406951904, "global_step": 183115, "epoch": 4359} {"train_loss": -6.96682071685791, "global_step": 183116, "epoch": 4359} {"train_loss": -7.073331832885742, "global_step": 183117, "epoch": 4359} {"train_loss": -7.0879011154174805, "global_step": 183118, "epoch": 4359} {"train_loss": -7.0791221005575995, "global_step": 183119, "epoch": 4359, "val_loss": 69481.3515625} {"train_loss": -7.222722053527832, "global_step": 183120, "epoch": 4360} {"train_loss": -7.119231700897217, "global_step": 183121, "epoch": 4360} {"train_loss": -7.082093238830566, "global_step": 183122, "epoch": 4360} {"train_loss": -7.1570024490356445, "global_step": 183123, "epoch": 4360} {"train_loss": -7.181832790374756, "global_step": 183124, "epoch": 4360} {"train_loss": -7.149768352508545, "global_step": 183125, "epoch": 4360} {"train_loss": -7.149572372436523, "global_step": 183126, "epoch": 4360} {"train_loss": -7.121753692626953, "global_step": 183127, "epoch": 4360} {"train_loss": -7.16749382019043, "global_step": 183128, "epoch": 4360} {"train_loss": -7.277087688446045, "global_step": 183129, "epoch": 4360} {"train_loss": -7.1026082038879395, "global_step": 183130, "epoch": 4360} {"train_loss": -7.085973262786865, "global_step": 183131, "epoch": 4360} {"train_loss": -7.241615295410156, "global_step": 183132, "epoch": 4360} {"train_loss": -7.186823844909668, "global_step": 183133, "epoch": 4360} {"train_loss": -7.17448091506958, "global_step": 183134, "epoch": 4360} {"train_loss": -7.066202163696289, "global_step": 183135, "epoch": 4360} {"train_loss": -7.130306720733643, "global_step": 183136, "epoch": 4360} {"train_loss": -7.158749580383301, "global_step": 183137, "epoch": 4360} {"train_loss": -7.156806945800781, "global_step": 183138, "epoch": 4360} {"train_loss": -7.099804878234863, "global_step": 183139, "epoch": 4360} {"train_loss": -7.144930839538574, "global_step": 183140, "epoch": 4360} {"train_loss": -7.125082969665527, "global_step": 183141, "epoch": 4360} {"train_loss": -7.138197898864746, "global_step": 183142, "epoch": 4360} {"train_loss": -7.150473594665527, "global_step": 183143, "epoch": 4360} {"train_loss": -7.118974685668945, "global_step": 183144, "epoch": 4360} {"train_loss": -7.102235794067383, "global_step": 183145, "epoch": 4360} {"train_loss": -7.139839172363281, "global_step": 183146, "epoch": 4360} {"train_loss": -7.185639381408691, "global_step": 183147, "epoch": 4360} {"train_loss": -7.218823432922363, "global_step": 183148, "epoch": 4360} {"train_loss": -7.102906227111816, "global_step": 183149, "epoch": 4360} {"train_loss": -7.112638473510742, "global_step": 183150, "epoch": 4360} {"train_loss": -7.103347301483154, "global_step": 183151, "epoch": 4360} {"train_loss": -7.058579921722412, "global_step": 183152, "epoch": 4360} {"train_loss": -7.171810626983643, "global_step": 183153, "epoch": 4360} {"train_loss": -7.219829559326172, "global_step": 183154, "epoch": 4360} {"train_loss": -7.154695510864258, "global_step": 183155, "epoch": 4360} {"train_loss": -7.1857500076293945, "global_step": 183156, "epoch": 4360} {"train_loss": -7.178637504577637, "global_step": 183157, "epoch": 4360} {"train_loss": -6.981622219085693, "global_step": 183158, "epoch": 4360} {"train_loss": -7.052305221557617, "global_step": 183159, "epoch": 4360} {"train_loss": -7.141566276550293, "global_step": 183160, "epoch": 4360} {"train_loss": -7.144839797701154, "global_step": 183161, "epoch": 4360, "val_loss": 69405.2421875} {"train_loss": -6.992011547088623, "global_step": 183162, "epoch": 4361} {"train_loss": -7.195927143096924, "global_step": 183163, "epoch": 4361} {"train_loss": -7.200685501098633, "global_step": 183164, "epoch": 4361} {"train_loss": -7.124267578125, "global_step": 183165, "epoch": 4361} {"train_loss": -7.094721794128418, "global_step": 183166, "epoch": 4361} {"train_loss": -7.134376049041748, "global_step": 183167, "epoch": 4361} {"train_loss": -7.113257884979248, "global_step": 183168, "epoch": 4361} {"train_loss": -7.149991035461426, "global_step": 183169, "epoch": 4361} {"train_loss": -7.178099155426025, "global_step": 183170, "epoch": 4361} {"train_loss": -7.114578723907471, "global_step": 183171, "epoch": 4361} {"train_loss": -7.002288818359375, "global_step": 183172, "epoch": 4361} {"train_loss": -7.192811012268066, "global_step": 183173, "epoch": 4361} {"train_loss": -7.102540969848633, "global_step": 183174, "epoch": 4361} {"train_loss": -7.006817817687988, "global_step": 183175, "epoch": 4361} {"train_loss": -7.18095064163208, "global_step": 183176, "epoch": 4361} {"train_loss": -7.131740570068359, "global_step": 183177, "epoch": 4361} {"train_loss": -7.198058605194092, "global_step": 183178, "epoch": 4361} {"train_loss": -7.1305389404296875, "global_step": 183179, "epoch": 4361} {"train_loss": -7.043048858642578, "global_step": 183180, "epoch": 4361} {"train_loss": -7.191893577575684, "global_step": 183181, "epoch": 4361} {"train_loss": -6.974360466003418, "global_step": 183182, "epoch": 4361} {"train_loss": -7.2020955085754395, "global_step": 183183, "epoch": 4361} {"train_loss": -7.036330223083496, "global_step": 183184, "epoch": 4361} {"train_loss": -7.053718566894531, "global_step": 183185, "epoch": 4361} {"train_loss": -7.14035701751709, "global_step": 183186, "epoch": 4361} {"train_loss": -7.0423994064331055, "global_step": 183187, "epoch": 4361} {"train_loss": -7.053124904632568, "global_step": 183188, "epoch": 4361} {"train_loss": -6.936145782470703, "global_step": 183189, "epoch": 4361} {"train_loss": -7.113550186157227, "global_step": 183190, "epoch": 4361} {"train_loss": -7.102667331695557, "global_step": 183191, "epoch": 4361} {"train_loss": -7.046439170837402, "global_step": 183192, "epoch": 4361} {"train_loss": -7.109304428100586, "global_step": 183193, "epoch": 4361} {"train_loss": -7.092752933502197, "global_step": 183194, "epoch": 4361} {"train_loss": -7.045985221862793, "global_step": 183195, "epoch": 4361} {"train_loss": -7.0756025314331055, "global_step": 183196, "epoch": 4361} {"train_loss": -7.082821846008301, "global_step": 183197, "epoch": 4361} {"train_loss": -7.072757720947266, "global_step": 183198, "epoch": 4361} {"train_loss": -7.141051292419434, "global_step": 183199, "epoch": 4361} {"train_loss": -7.057465553283691, "global_step": 183200, "epoch": 4361} {"train_loss": -6.920236587524414, "global_step": 183201, "epoch": 4361} {"train_loss": -7.1957597732543945, "global_step": 183202, "epoch": 4361} {"train_loss": -7.097949788683937, "global_step": 183203, "epoch": 4361, "val_loss": 69571.9140625} {"train_loss": -7.139405250549316, "global_step": 183204, "epoch": 4362} {"train_loss": -7.145685195922852, "global_step": 183205, "epoch": 4362} {"train_loss": -7.010498046875, "global_step": 183206, "epoch": 4362} {"train_loss": -7.071817398071289, "global_step": 183207, "epoch": 4362} {"train_loss": -7.0416717529296875, "global_step": 183208, "epoch": 4362} {"train_loss": -7.089320182800293, "global_step": 183209, "epoch": 4362} {"train_loss": -7.159576416015625, "global_step": 183210, "epoch": 4362} {"train_loss": -7.166635990142822, "global_step": 183211, "epoch": 4362} {"train_loss": -7.155482769012451, "global_step": 183212, "epoch": 4362} {"train_loss": -7.129843711853027, "global_step": 183213, "epoch": 4362} {"train_loss": -7.119093418121338, "global_step": 183214, "epoch": 4362} {"train_loss": -7.089797496795654, "global_step": 183215, "epoch": 4362} {"train_loss": -7.238193511962891, "global_step": 183216, "epoch": 4362} {"train_loss": -7.081528663635254, "global_step": 183217, "epoch": 4362} {"train_loss": -7.0809736251831055, "global_step": 183218, "epoch": 4362} {"train_loss": -7.112338066101074, "global_step": 183219, "epoch": 4362} {"train_loss": -7.128482818603516, "global_step": 183220, "epoch": 4362} {"train_loss": -7.097764015197754, "global_step": 183221, "epoch": 4362} {"train_loss": -7.069815158843994, "global_step": 183222, "epoch": 4362} {"train_loss": -7.084882736206055, "global_step": 183223, "epoch": 4362} {"train_loss": -7.108238220214844, "global_step": 183224, "epoch": 4362} {"train_loss": -7.118515491485596, "global_step": 183225, "epoch": 4362} {"train_loss": -7.207772731781006, "global_step": 183226, "epoch": 4362} {"train_loss": -7.207320213317871, "global_step": 183227, "epoch": 4362} {"train_loss": -7.094413757324219, "global_step": 183228, "epoch": 4362} {"train_loss": -7.108396530151367, "global_step": 183229, "epoch": 4362} {"train_loss": -7.0937089920043945, "global_step": 183230, "epoch": 4362} {"train_loss": -7.077762603759766, "global_step": 183231, "epoch": 4362} {"train_loss": -7.080842018127441, "global_step": 183232, "epoch": 4362} {"train_loss": -7.212940692901611, "global_step": 183233, "epoch": 4362} {"train_loss": -7.155938625335693, "global_step": 183234, "epoch": 4362} {"train_loss": -7.26150369644165, "global_step": 183235, "epoch": 4362} {"train_loss": -7.143579959869385, "global_step": 183236, "epoch": 4362} {"train_loss": -7.202906608581543, "global_step": 183237, "epoch": 4362} {"train_loss": -7.118021488189697, "global_step": 183238, "epoch": 4362} {"train_loss": -7.061570167541504, "global_step": 183239, "epoch": 4362} {"train_loss": -7.216090202331543, "global_step": 183240, "epoch": 4362} {"train_loss": -7.040102958679199, "global_step": 183241, "epoch": 4362} {"train_loss": -7.109416484832764, "global_step": 183242, "epoch": 4362} {"train_loss": -7.173807144165039, "global_step": 183243, "epoch": 4362} {"train_loss": -7.120051383972168, "global_step": 183244, "epoch": 4362} {"train_loss": -7.124812489464169, "global_step": 183245, "epoch": 4362, "val_loss": 69492.4140625} {"train_loss": -7.22565221786499, "global_step": 183246, "epoch": 4363} {"train_loss": -7.135095119476318, "global_step": 183247, "epoch": 4363} {"train_loss": -7.195513725280762, "global_step": 183248, "epoch": 4363} {"train_loss": -7.186211585998535, "global_step": 183249, "epoch": 4363} {"train_loss": -7.228938102722168, "global_step": 183250, "epoch": 4363} {"train_loss": -7.170071601867676, "global_step": 183251, "epoch": 4363} {"train_loss": -7.172430038452148, "global_step": 183252, "epoch": 4363} {"train_loss": -7.138761043548584, "global_step": 183253, "epoch": 4363} {"train_loss": -7.21574068069458, "global_step": 183254, "epoch": 4363} {"train_loss": -7.133000373840332, "global_step": 183255, "epoch": 4363} {"train_loss": -7.138652801513672, "global_step": 183256, "epoch": 4363} {"train_loss": -7.2467522621154785, "global_step": 183257, "epoch": 4363} {"train_loss": -7.198967456817627, "global_step": 183258, "epoch": 4363} {"train_loss": -7.143648624420166, "global_step": 183259, "epoch": 4363} {"train_loss": -7.2127485275268555, "global_step": 183260, "epoch": 4363} {"train_loss": -7.163247108459473, "global_step": 183261, "epoch": 4363} {"train_loss": -7.090428352355957, "global_step": 183262, "epoch": 4363} {"train_loss": -7.107712745666504, "global_step": 183263, "epoch": 4363} {"train_loss": -7.258542060852051, "global_step": 183264, "epoch": 4363} {"train_loss": -7.263924598693848, "global_step": 183265, "epoch": 4363} {"train_loss": -7.110403060913086, "global_step": 183266, "epoch": 4363} {"train_loss": -7.107304573059082, "global_step": 183267, "epoch": 4363} {"train_loss": -7.200771808624268, "global_step": 183268, "epoch": 4363} {"train_loss": -7.235282897949219, "global_step": 183269, "epoch": 4363} {"train_loss": -7.156944751739502, "global_step": 183270, "epoch": 4363} {"train_loss": -7.176648139953613, "global_step": 183271, "epoch": 4363} {"train_loss": -7.161266803741455, "global_step": 183272, "epoch": 4363} {"train_loss": -7.142088413238525, "global_step": 183273, "epoch": 4363} {"train_loss": -7.206695079803467, "global_step": 183274, "epoch": 4363} {"train_loss": -7.2510762214660645, "global_step": 183275, "epoch": 4363} {"train_loss": -7.1710309982299805, "global_step": 183276, "epoch": 4363} {"train_loss": -7.0983991622924805, "global_step": 183277, "epoch": 4363} {"train_loss": -7.0911865234375, "global_step": 183278, "epoch": 4363} {"train_loss": -7.171873092651367, "global_step": 183279, "epoch": 4363} {"train_loss": -7.19355583190918, "global_step": 183280, "epoch": 4363} {"train_loss": -7.1566667556762695, "global_step": 183281, "epoch": 4363} {"train_loss": -7.2451910972595215, "global_step": 183282, "epoch": 4363} {"train_loss": -7.290576934814453, "global_step": 183283, "epoch": 4363} {"train_loss": -7.221722602844238, "global_step": 183284, "epoch": 4363} {"train_loss": -7.17941951751709, "global_step": 183285, "epoch": 4363} {"train_loss": -7.25020694732666, "global_step": 183286, "epoch": 4363} {"train_loss": -7.182830765133812, "global_step": 183287, "epoch": 4363, "val_loss": 69538.125} {"train_loss": -7.184153079986572, "global_step": 183288, "epoch": 4364} {"train_loss": -7.1799163818359375, "global_step": 183289, "epoch": 4364} {"train_loss": -7.150289058685303, "global_step": 183290, "epoch": 4364} {"train_loss": -7.298813819885254, "global_step": 183291, "epoch": 4364} {"train_loss": -7.177382946014404, "global_step": 183292, "epoch": 4364} {"train_loss": -7.119566917419434, "global_step": 183293, "epoch": 4364} {"train_loss": -7.15469217300415, "global_step": 183294, "epoch": 4364} {"train_loss": -7.181452751159668, "global_step": 183295, "epoch": 4364} {"train_loss": -7.0321197509765625, "global_step": 183296, "epoch": 4364} {"train_loss": -7.178526401519775, "global_step": 183297, "epoch": 4364} {"train_loss": -7.154178619384766, "global_step": 183298, "epoch": 4364} {"train_loss": -7.148033142089844, "global_step": 183299, "epoch": 4364} {"train_loss": -7.255337715148926, "global_step": 183300, "epoch": 4364} {"train_loss": -7.131274223327637, "global_step": 183301, "epoch": 4364} {"train_loss": -7.311479091644287, "global_step": 183302, "epoch": 4364} {"train_loss": -7.226297855377197, "global_step": 183303, "epoch": 4364} {"train_loss": -7.163222312927246, "global_step": 183304, "epoch": 4364} {"train_loss": -7.226858139038086, "global_step": 183305, "epoch": 4364} {"train_loss": -7.123964786529541, "global_step": 183306, "epoch": 4364} {"train_loss": -7.081098556518555, "global_step": 183307, "epoch": 4364} {"train_loss": -7.184239387512207, "global_step": 183308, "epoch": 4364} {"train_loss": -7.080630302429199, "global_step": 183309, "epoch": 4364} {"train_loss": -7.154265880584717, "global_step": 183310, "epoch": 4364} {"train_loss": -7.02871561050415, "global_step": 183311, "epoch": 4364} {"train_loss": -7.131999969482422, "global_step": 183312, "epoch": 4364} {"train_loss": -7.119970321655273, "global_step": 183313, "epoch": 4364} {"train_loss": -7.07945442199707, "global_step": 183314, "epoch": 4364} {"train_loss": -7.1160078048706055, "global_step": 183315, "epoch": 4364} {"train_loss": -7.123544216156006, "global_step": 183316, "epoch": 4364} {"train_loss": -7.035953521728516, "global_step": 183317, "epoch": 4364} {"train_loss": -7.215669631958008, "global_step": 183318, "epoch": 4364} {"train_loss": -7.020752906799316, "global_step": 183319, "epoch": 4364} {"train_loss": -7.147229194641113, "global_step": 183320, "epoch": 4364} {"train_loss": -7.115042209625244, "global_step": 183321, "epoch": 4364} {"train_loss": -7.030341148376465, "global_step": 183322, "epoch": 4364} {"train_loss": -7.069529056549072, "global_step": 183323, "epoch": 4364} {"train_loss": -7.116778373718262, "global_step": 183324, "epoch": 4364} {"train_loss": -7.195538520812988, "global_step": 183325, "epoch": 4364} {"train_loss": -6.9832763671875, "global_step": 183326, "epoch": 4364} {"train_loss": -7.16980504989624, "global_step": 183327, "epoch": 4364} {"train_loss": -7.113408088684082, "global_step": 183328, "epoch": 4364} {"train_loss": -7.135267836706979, "global_step": 183329, "epoch": 4364, "val_loss": 69524.4609375} {"train_loss": -7.110806465148926, "global_step": 183330, "epoch": 4365} {"train_loss": -6.941762924194336, "global_step": 183331, "epoch": 4365} {"train_loss": -7.032598495483398, "global_step": 183332, "epoch": 4365} {"train_loss": -7.047687530517578, "global_step": 183333, "epoch": 4365} {"train_loss": -7.122973442077637, "global_step": 183334, "epoch": 4365} {"train_loss": -7.047310829162598, "global_step": 183335, "epoch": 4365} {"train_loss": -7.181430816650391, "global_step": 183336, "epoch": 4365} {"train_loss": -7.070769309997559, "global_step": 183337, "epoch": 4365} {"train_loss": -6.970759391784668, "global_step": 183338, "epoch": 4365} {"train_loss": -6.993086814880371, "global_step": 183339, "epoch": 4365} {"train_loss": -6.9466753005981445, "global_step": 183340, "epoch": 4365} {"train_loss": -7.213942527770996, "global_step": 183341, "epoch": 4365} {"train_loss": -7.039437294006348, "global_step": 183342, "epoch": 4365} {"train_loss": -6.995503902435303, "global_step": 183343, "epoch": 4365} {"train_loss": -6.968255043029785, "global_step": 183344, "epoch": 4365} {"train_loss": -7.004376411437988, "global_step": 183345, "epoch": 4365} {"train_loss": -7.076449394226074, "global_step": 183346, "epoch": 4365} {"train_loss": -7.03371524810791, "global_step": 183347, "epoch": 4365} {"train_loss": -7.129448890686035, "global_step": 183348, "epoch": 4365} {"train_loss": -6.945487022399902, "global_step": 183349, "epoch": 4365} {"train_loss": -7.109435081481934, "global_step": 183350, "epoch": 4365} {"train_loss": -7.049994468688965, "global_step": 183351, "epoch": 4365} {"train_loss": -6.9846510887146, "global_step": 183352, "epoch": 4365} {"train_loss": -7.048383712768555, "global_step": 183353, "epoch": 4365} {"train_loss": -7.177135944366455, "global_step": 183354, "epoch": 4365} {"train_loss": -7.163229465484619, "global_step": 183355, "epoch": 4365} {"train_loss": -7.060749053955078, "global_step": 183356, "epoch": 4365} {"train_loss": -7.091283798217773, "global_step": 183357, "epoch": 4365} {"train_loss": -7.152383804321289, "global_step": 183358, "epoch": 4365} {"train_loss": -7.110230445861816, "global_step": 183359, "epoch": 4365} {"train_loss": -7.128277778625488, "global_step": 183360, "epoch": 4365} {"train_loss": -7.134306907653809, "global_step": 183361, "epoch": 4365} {"train_loss": -7.0523481369018555, "global_step": 183362, "epoch": 4365} {"train_loss": -7.05782413482666, "global_step": 183363, "epoch": 4365} {"train_loss": -7.113898754119873, "global_step": 183364, "epoch": 4365} {"train_loss": -7.19912052154541, "global_step": 183365, "epoch": 4365} {"train_loss": -7.129233360290527, "global_step": 183366, "epoch": 4365} {"train_loss": -7.0334672927856445, "global_step": 183367, "epoch": 4365} {"train_loss": -7.056741237640381, "global_step": 183368, "epoch": 4365} {"train_loss": -7.081005096435547, "global_step": 183369, "epoch": 4365} {"train_loss": -7.005217552185059, "global_step": 183370, "epoch": 4365} {"train_loss": -7.069249436968849, "global_step": 183371, "epoch": 4365, "val_loss": 69590.6171875} {"train_loss": -7.15999174118042, "global_step": 183372, "epoch": 4366} {"train_loss": -7.001577854156494, "global_step": 183373, "epoch": 4366} {"train_loss": -7.171257972717285, "global_step": 183374, "epoch": 4366} {"train_loss": -7.151503562927246, "global_step": 183375, "epoch": 4366} {"train_loss": -7.102410793304443, "global_step": 183376, "epoch": 4366} {"train_loss": -7.195802688598633, "global_step": 183377, "epoch": 4366} {"train_loss": -7.157112121582031, "global_step": 183378, "epoch": 4366} {"train_loss": -7.144811630249023, "global_step": 183379, "epoch": 4366} {"train_loss": -7.1746826171875, "global_step": 183380, "epoch": 4366} {"train_loss": -7.103185176849365, "global_step": 183381, "epoch": 4366} {"train_loss": -7.242145538330078, "global_step": 183382, "epoch": 4366} {"train_loss": -7.1757402420043945, "global_step": 183383, "epoch": 4366} {"train_loss": -7.09160041809082, "global_step": 183384, "epoch": 4366} {"train_loss": -7.072659969329834, "global_step": 183385, "epoch": 4366} {"train_loss": -7.125817775726318, "global_step": 183386, "epoch": 4366} {"train_loss": -7.113933563232422, "global_step": 183387, "epoch": 4366} {"train_loss": -7.07940673828125, "global_step": 183388, "epoch": 4366} {"train_loss": -7.091154098510742, "global_step": 183389, "epoch": 4366} {"train_loss": -7.13169002532959, "global_step": 183390, "epoch": 4366} {"train_loss": -7.16072940826416, "global_step": 183391, "epoch": 4366} {"train_loss": -7.149797439575195, "global_step": 183392, "epoch": 4366} {"train_loss": -7.269299507141113, "global_step": 183393, "epoch": 4366} {"train_loss": -7.245632171630859, "global_step": 183394, "epoch": 4366} {"train_loss": -7.196322441101074, "global_step": 183395, "epoch": 4366} {"train_loss": -7.289021015167236, "global_step": 183396, "epoch": 4366} {"train_loss": -7.0742387771606445, "global_step": 183397, "epoch": 4366} {"train_loss": -7.135647296905518, "global_step": 183398, "epoch": 4366} {"train_loss": -7.154288291931152, "global_step": 183399, "epoch": 4366} {"train_loss": -7.200558662414551, "global_step": 183400, "epoch": 4366} {"train_loss": -7.155115127563477, "global_step": 183401, "epoch": 4366} {"train_loss": -7.154707908630371, "global_step": 183402, "epoch": 4366} {"train_loss": -7.033742904663086, "global_step": 183403, "epoch": 4366} {"train_loss": -6.9758620262146, "global_step": 183404, "epoch": 4366} {"train_loss": -7.0465288162231445, "global_step": 183405, "epoch": 4366} {"train_loss": -7.0838751792907715, "global_step": 183406, "epoch": 4366} {"train_loss": -7.083672523498535, "global_step": 183407, "epoch": 4366} {"train_loss": -7.076894760131836, "global_step": 183408, "epoch": 4366} {"train_loss": -7.072098731994629, "global_step": 183409, "epoch": 4366} {"train_loss": -7.0990729331970215, "global_step": 183410, "epoch": 4366} {"train_loss": -7.205977916717529, "global_step": 183411, "epoch": 4366} {"train_loss": -7.065460205078125, "global_step": 183412, "epoch": 4366} {"train_loss": -7.130496195384434, "global_step": 183413, "epoch": 4366, "val_loss": 69325.828125} {"train_loss": -7.09014368057251, "global_step": 183414, "epoch": 4367} {"train_loss": -7.1800384521484375, "global_step": 183415, "epoch": 4367} {"train_loss": -7.084485054016113, "global_step": 183416, "epoch": 4367} {"train_loss": -7.211451530456543, "global_step": 183417, "epoch": 4367} {"train_loss": -7.113015651702881, "global_step": 183418, "epoch": 4367} {"train_loss": -7.108026504516602, "global_step": 183419, "epoch": 4367} {"train_loss": -7.184659481048584, "global_step": 183420, "epoch": 4367} {"train_loss": -7.141304969787598, "global_step": 183421, "epoch": 4367} {"train_loss": -7.134666919708252, "global_step": 183422, "epoch": 4367} {"train_loss": -7.22097110748291, "global_step": 183423, "epoch": 4367} {"train_loss": -7.120522975921631, "global_step": 183424, "epoch": 4367} {"train_loss": -7.297535419464111, "global_step": 183425, "epoch": 4367} {"train_loss": -7.094465732574463, "global_step": 183426, "epoch": 4367} {"train_loss": -7.062195777893066, "global_step": 183427, "epoch": 4367} {"train_loss": -7.176350116729736, "global_step": 183428, "epoch": 4367} {"train_loss": -7.156318187713623, "global_step": 183429, "epoch": 4367} {"train_loss": -7.067442893981934, "global_step": 183430, "epoch": 4367} {"train_loss": -7.092203140258789, "global_step": 183431, "epoch": 4367} {"train_loss": -7.194714546203613, "global_step": 183432, "epoch": 4367} {"train_loss": -7.292563438415527, "global_step": 183433, "epoch": 4367} {"train_loss": -7.083146095275879, "global_step": 183434, "epoch": 4367} {"train_loss": -7.11842155456543, "global_step": 183435, "epoch": 4367} {"train_loss": -7.100677013397217, "global_step": 183436, "epoch": 4367} {"train_loss": -7.121356964111328, "global_step": 183437, "epoch": 4367} {"train_loss": -6.9509172439575195, "global_step": 183438, "epoch": 4367} {"train_loss": -7.02032470703125, "global_step": 183439, "epoch": 4367} {"train_loss": -7.109264373779297, "global_step": 183440, "epoch": 4367} {"train_loss": -7.066348075866699, "global_step": 183441, "epoch": 4367} {"train_loss": -7.148980617523193, "global_step": 183442, "epoch": 4367} {"train_loss": -7.124844551086426, "global_step": 183443, "epoch": 4367} {"train_loss": -6.903947353363037, "global_step": 183444, "epoch": 4367} {"train_loss": -7.099776268005371, "global_step": 183445, "epoch": 4367} {"train_loss": -7.0415167808532715, "global_step": 183446, "epoch": 4367} {"train_loss": -7.1919403076171875, "global_step": 183447, "epoch": 4367} {"train_loss": -7.108701705932617, "global_step": 183448, "epoch": 4367} {"train_loss": -7.067689895629883, "global_step": 183449, "epoch": 4367} {"train_loss": -7.156283378601074, "global_step": 183450, "epoch": 4367} {"train_loss": -7.107311725616455, "global_step": 183451, "epoch": 4367} {"train_loss": -7.057489395141602, "global_step": 183452, "epoch": 4367} {"train_loss": -7.051684856414795, "global_step": 183453, "epoch": 4367} {"train_loss": -7.006032943725586, "global_step": 183454, "epoch": 4367} {"train_loss": -7.113634098143804, "global_step": 183455, "epoch": 4367, "val_loss": 69633.71875} {"train_loss": -7.127233505249023, "global_step": 183456, "epoch": 4368} {"train_loss": -7.069889545440674, "global_step": 183457, "epoch": 4368} {"train_loss": -7.1296844482421875, "global_step": 183458, "epoch": 4368} {"train_loss": -7.190652847290039, "global_step": 183459, "epoch": 4368} {"train_loss": -7.038934707641602, "global_step": 183460, "epoch": 4368} {"train_loss": -7.150299549102783, "global_step": 183461, "epoch": 4368} {"train_loss": -7.192727088928223, "global_step": 183462, "epoch": 4368} {"train_loss": -7.161159515380859, "global_step": 183463, "epoch": 4368} {"train_loss": -7.182775497436523, "global_step": 183464, "epoch": 4368} {"train_loss": -7.140775680541992, "global_step": 183465, "epoch": 4368} {"train_loss": -7.082387924194336, "global_step": 183466, "epoch": 4368} {"train_loss": -7.040933609008789, "global_step": 183467, "epoch": 4368} {"train_loss": -7.106631278991699, "global_step": 183468, "epoch": 4368} {"train_loss": -7.016470432281494, "global_step": 183469, "epoch": 4368} {"train_loss": -7.126110076904297, "global_step": 183470, "epoch": 4368} {"train_loss": -7.118528366088867, "global_step": 183471, "epoch": 4368} {"train_loss": -7.144297122955322, "global_step": 183472, "epoch": 4368} {"train_loss": -7.049800872802734, "global_step": 183473, "epoch": 4368} {"train_loss": -7.1690192222595215, "global_step": 183474, "epoch": 4368} {"train_loss": -7.1093339920043945, "global_step": 183475, "epoch": 4368} {"train_loss": -7.209410667419434, "global_step": 183476, "epoch": 4368} {"train_loss": -7.128270149230957, "global_step": 183477, "epoch": 4368} {"train_loss": -7.016444206237793, "global_step": 183478, "epoch": 4368} {"train_loss": -7.094755172729492, "global_step": 183479, "epoch": 4368} {"train_loss": -7.043598651885986, "global_step": 183480, "epoch": 4368} {"train_loss": -7.103176116943359, "global_step": 183481, "epoch": 4368} {"train_loss": -7.1627326011657715, "global_step": 183482, "epoch": 4368} {"train_loss": -6.981584548950195, "global_step": 183483, "epoch": 4368} {"train_loss": -7.172994613647461, "global_step": 183484, "epoch": 4368} {"train_loss": -7.069478988647461, "global_step": 183485, "epoch": 4368} {"train_loss": -7.040143966674805, "global_step": 183486, "epoch": 4368} {"train_loss": -7.117318153381348, "global_step": 183487, "epoch": 4368} {"train_loss": -7.170982360839844, "global_step": 183488, "epoch": 4368} {"train_loss": -7.064266204833984, "global_step": 183489, "epoch": 4368} {"train_loss": -7.1136932373046875, "global_step": 183490, "epoch": 4368} {"train_loss": -7.06789493560791, "global_step": 183491, "epoch": 4368} {"train_loss": -7.1195573806762695, "global_step": 183492, "epoch": 4368} {"train_loss": -7.212944030761719, "global_step": 183493, "epoch": 4368} {"train_loss": -7.120297431945801, "global_step": 183494, "epoch": 4368} {"train_loss": -7.177463531494141, "global_step": 183495, "epoch": 4368} {"train_loss": -7.194672107696533, "global_step": 183496, "epoch": 4368} {"train_loss": -7.114380541301909, "global_step": 183497, "epoch": 4368, "val_loss": 69344.8359375} {"train_loss": -7.155759811401367, "global_step": 183498, "epoch": 4369} {"train_loss": -7.132057189941406, "global_step": 183499, "epoch": 4369} {"train_loss": -7.251062393188477, "global_step": 183500, "epoch": 4369} {"train_loss": -7.075257301330566, "global_step": 183501, "epoch": 4369} {"train_loss": -7.205677032470703, "global_step": 183502, "epoch": 4369} {"train_loss": -7.213910102844238, "global_step": 183503, "epoch": 4369} {"train_loss": -7.1969451904296875, "global_step": 183504, "epoch": 4369} {"train_loss": -7.208184242248535, "global_step": 183505, "epoch": 4369} {"train_loss": -7.149020671844482, "global_step": 183506, "epoch": 4369} {"train_loss": -7.196258544921875, "global_step": 183507, "epoch": 4369} {"train_loss": -7.203927993774414, "global_step": 183508, "epoch": 4369} {"train_loss": -7.144131660461426, "global_step": 183509, "epoch": 4369} {"train_loss": -7.291417121887207, "global_step": 183510, "epoch": 4369} {"train_loss": -7.289891242980957, "global_step": 183511, "epoch": 4369} {"train_loss": -7.1127705574035645, "global_step": 183512, "epoch": 4369} {"train_loss": -7.156577110290527, "global_step": 183513, "epoch": 4369} {"train_loss": -7.196785926818848, "global_step": 183514, "epoch": 4369} {"train_loss": -7.107570648193359, "global_step": 183515, "epoch": 4369} {"train_loss": -7.151426315307617, "global_step": 183516, "epoch": 4369} {"train_loss": -7.137474060058594, "global_step": 183517, "epoch": 4369} {"train_loss": -7.236751556396484, "global_step": 183518, "epoch": 4369} {"train_loss": -7.23356294631958, "global_step": 183519, "epoch": 4369} {"train_loss": -7.181666374206543, "global_step": 183520, "epoch": 4369} {"train_loss": -7.2335968017578125, "global_step": 183521, "epoch": 4369} {"train_loss": -7.1228437423706055, "global_step": 183522, "epoch": 4369} {"train_loss": -7.065520286560059, "global_step": 183523, "epoch": 4369} {"train_loss": -7.182866096496582, "global_step": 183524, "epoch": 4369} {"train_loss": -7.178206443786621, "global_step": 183525, "epoch": 4369} {"train_loss": -7.180665969848633, "global_step": 183526, "epoch": 4369} {"train_loss": -7.082135200500488, "global_step": 183527, "epoch": 4369} {"train_loss": -7.173450469970703, "global_step": 183528, "epoch": 4369} {"train_loss": -7.1665191650390625, "global_step": 183529, "epoch": 4369} {"train_loss": -7.09456729888916, "global_step": 183530, "epoch": 4369} {"train_loss": -7.046220302581787, "global_step": 183531, "epoch": 4369} {"train_loss": -7.092416763305664, "global_step": 183532, "epoch": 4369} {"train_loss": -7.28980016708374, "global_step": 183533, "epoch": 4369} {"train_loss": -6.850050926208496, "global_step": 183534, "epoch": 4369} {"train_loss": -7.014548301696777, "global_step": 183535, "epoch": 4369} {"train_loss": -6.978492259979248, "global_step": 183536, "epoch": 4369} {"train_loss": -7.059385299682617, "global_step": 183537, "epoch": 4369} {"train_loss": -7.0361104011535645, "global_step": 183538, "epoch": 4369} {"train_loss": -7.148645616713024, "global_step": 183539, "epoch": 4369, "val_loss": 69513.8515625} {"train_loss": -7.053926944732666, "global_step": 183540, "epoch": 4370} {"train_loss": -6.861782550811768, "global_step": 183541, "epoch": 4370} {"train_loss": -7.202633857727051, "global_step": 183542, "epoch": 4370} {"train_loss": -6.8619465827941895, "global_step": 183543, "epoch": 4370} {"train_loss": -6.800061225891113, "global_step": 183544, "epoch": 4370} {"train_loss": -7.015637397766113, "global_step": 183545, "epoch": 4370} {"train_loss": -6.764557361602783, "global_step": 183546, "epoch": 4370} {"train_loss": -6.998783588409424, "global_step": 183547, "epoch": 4370} {"train_loss": -6.958261489868164, "global_step": 183548, "epoch": 4370} {"train_loss": -6.92985200881958, "global_step": 183549, "epoch": 4370} {"train_loss": -7.010246753692627, "global_step": 183550, "epoch": 4370} {"train_loss": -6.914815425872803, "global_step": 183551, "epoch": 4370} {"train_loss": -7.066774368286133, "global_step": 183552, "epoch": 4370} {"train_loss": -7.065877914428711, "global_step": 183553, "epoch": 4370} {"train_loss": -7.072763919830322, "global_step": 183554, "epoch": 4370} {"train_loss": -7.075953006744385, "global_step": 183555, "epoch": 4370} {"train_loss": -7.100265026092529, "global_step": 183556, "epoch": 4370} {"train_loss": -7.199536323547363, "global_step": 183557, "epoch": 4370} {"train_loss": -7.155076026916504, "global_step": 183558, "epoch": 4370} {"train_loss": -7.151026248931885, "global_step": 183559, "epoch": 4370} {"train_loss": -7.017389297485352, "global_step": 183560, "epoch": 4370} {"train_loss": -7.159833908081055, "global_step": 183561, "epoch": 4370} {"train_loss": -7.1332244873046875, "global_step": 183562, "epoch": 4370} {"train_loss": -7.142568588256836, "global_step": 183563, "epoch": 4370} {"train_loss": -7.118350982666016, "global_step": 183564, "epoch": 4370} {"train_loss": -7.2640156745910645, "global_step": 183565, "epoch": 4370} {"train_loss": -7.219574928283691, "global_step": 183566, "epoch": 4370} {"train_loss": -7.173685073852539, "global_step": 183567, "epoch": 4370} {"train_loss": -7.15523624420166, "global_step": 183568, "epoch": 4370} {"train_loss": -7.113633155822754, "global_step": 183569, "epoch": 4370} {"train_loss": -7.1258134841918945, "global_step": 183570, "epoch": 4370} {"train_loss": -7.137707233428955, "global_step": 183571, "epoch": 4370} {"train_loss": -7.0464067459106445, "global_step": 183572, "epoch": 4370} {"train_loss": -7.1821818351745605, "global_step": 183573, "epoch": 4370} {"train_loss": -7.04655122756958, "global_step": 183574, "epoch": 4370} {"train_loss": -7.048296928405762, "global_step": 183575, "epoch": 4370} {"train_loss": -7.160793304443359, "global_step": 183576, "epoch": 4370} {"train_loss": -7.173749923706055, "global_step": 183577, "epoch": 4370} {"train_loss": -7.137181282043457, "global_step": 183578, "epoch": 4370} {"train_loss": -7.113574981689453, "global_step": 183579, "epoch": 4370} {"train_loss": -7.164295196533203, "global_step": 183580, "epoch": 4370} {"train_loss": -7.077179397855486, "global_step": 183581, "epoch": 4370, "val_loss": 69484.890625} {"train_loss": -7.092424392700195, "global_step": 183582, "epoch": 4371} {"train_loss": -7.13984489440918, "global_step": 183583, "epoch": 4371} {"train_loss": -7.043806076049805, "global_step": 183584, "epoch": 4371} {"train_loss": -7.03727912902832, "global_step": 183585, "epoch": 4371} {"train_loss": -7.238290786743164, "global_step": 183586, "epoch": 4371} {"train_loss": -7.080306053161621, "global_step": 183587, "epoch": 4371} {"train_loss": -7.088800430297852, "global_step": 183588, "epoch": 4371} {"train_loss": -7.1564741134643555, "global_step": 183589, "epoch": 4371} {"train_loss": -6.95326042175293, "global_step": 183590, "epoch": 4371} {"train_loss": -7.111880302429199, "global_step": 183591, "epoch": 4371} {"train_loss": -7.1236982345581055, "global_step": 183592, "epoch": 4371} {"train_loss": -7.16560173034668, "global_step": 183593, "epoch": 4371} {"train_loss": -7.053784370422363, "global_step": 183594, "epoch": 4371} {"train_loss": -7.118695259094238, "global_step": 183595, "epoch": 4371} {"train_loss": -7.199039459228516, "global_step": 183596, "epoch": 4371} {"train_loss": -7.112421989440918, "global_step": 183597, "epoch": 4371} {"train_loss": -7.1680121421813965, "global_step": 183598, "epoch": 4371} {"train_loss": -7.171862602233887, "global_step": 183599, "epoch": 4371} {"train_loss": -7.256111145019531, "global_step": 183600, "epoch": 4371} {"train_loss": -7.046291828155518, "global_step": 183601, "epoch": 4371} {"train_loss": -7.110919952392578, "global_step": 183602, "epoch": 4371} {"train_loss": -7.04995059967041, "global_step": 183603, "epoch": 4371} {"train_loss": -7.0654401779174805, "global_step": 183604, "epoch": 4371} {"train_loss": -7.04248046875, "global_step": 183605, "epoch": 4371} {"train_loss": -7.174575328826904, "global_step": 183606, "epoch": 4371} {"train_loss": -7.007061004638672, "global_step": 183607, "epoch": 4371} {"train_loss": -7.151654243469238, "global_step": 183608, "epoch": 4371} {"train_loss": -7.1656413078308105, "global_step": 183609, "epoch": 4371} {"train_loss": -6.962741374969482, "global_step": 183610, "epoch": 4371} {"train_loss": -7.0627946853637695, "global_step": 183611, "epoch": 4371} {"train_loss": -7.0649495124816895, "global_step": 183612, "epoch": 4371} {"train_loss": -7.028417587280273, "global_step": 183613, "epoch": 4371} {"train_loss": -7.076725959777832, "global_step": 183614, "epoch": 4371} {"train_loss": -6.910717487335205, "global_step": 183615, "epoch": 4371} {"train_loss": -7.13615608215332, "global_step": 183616, "epoch": 4371} {"train_loss": -7.033871650695801, "global_step": 183617, "epoch": 4371} {"train_loss": -6.948782920837402, "global_step": 183618, "epoch": 4371} {"train_loss": -7.188726425170898, "global_step": 183619, "epoch": 4371} {"train_loss": -7.030335426330566, "global_step": 183620, "epoch": 4371} {"train_loss": -7.067005634307861, "global_step": 183621, "epoch": 4371} {"train_loss": -7.003265857696533, "global_step": 183622, "epoch": 4371} {"train_loss": -7.090309971854801, "global_step": 183623, "epoch": 4371, "val_loss": 69669.8984375} {"train_loss": -6.953800201416016, "global_step": 183624, "epoch": 4372} {"train_loss": -7.155782699584961, "global_step": 183625, "epoch": 4372} {"train_loss": -7.152788162231445, "global_step": 183626, "epoch": 4372} {"train_loss": -7.072942733764648, "global_step": 183627, "epoch": 4372} {"train_loss": -7.145720481872559, "global_step": 183628, "epoch": 4372} {"train_loss": -7.05112886428833, "global_step": 183629, "epoch": 4372} {"train_loss": -7.121842384338379, "global_step": 183630, "epoch": 4372} {"train_loss": -7.136025428771973, "global_step": 183631, "epoch": 4372} {"train_loss": -7.236824989318848, "global_step": 183632, "epoch": 4372} {"train_loss": -7.130121231079102, "global_step": 183633, "epoch": 4372} {"train_loss": -7.110976696014404, "global_step": 183634, "epoch": 4372} {"train_loss": -7.039832592010498, "global_step": 183635, "epoch": 4372} {"train_loss": -7.177314758300781, "global_step": 183636, "epoch": 4372} {"train_loss": -7.13925313949585, "global_step": 183637, "epoch": 4372} {"train_loss": -7.0723137855529785, "global_step": 183638, "epoch": 4372} {"train_loss": -7.186145782470703, "global_step": 183639, "epoch": 4372} {"train_loss": -7.085418701171875, "global_step": 183640, "epoch": 4372} {"train_loss": -7.199731826782227, "global_step": 183641, "epoch": 4372} {"train_loss": -7.069370746612549, "global_step": 183642, "epoch": 4372} {"train_loss": -7.111146450042725, "global_step": 183643, "epoch": 4372} {"train_loss": -7.044939041137695, "global_step": 183644, "epoch": 4372} {"train_loss": -7.159141540527344, "global_step": 183645, "epoch": 4372} {"train_loss": -7.117952346801758, "global_step": 183646, "epoch": 4372} {"train_loss": -7.080676078796387, "global_step": 183647, "epoch": 4372} {"train_loss": -7.146904945373535, "global_step": 183648, "epoch": 4372} {"train_loss": -7.1820068359375, "global_step": 183649, "epoch": 4372} {"train_loss": -7.270819664001465, "global_step": 183650, "epoch": 4372} {"train_loss": -7.20306396484375, "global_step": 183651, "epoch": 4372} {"train_loss": -7.1791229248046875, "global_step": 183652, "epoch": 4372} {"train_loss": -7.090873718261719, "global_step": 183653, "epoch": 4372} {"train_loss": -7.207978248596191, "global_step": 183654, "epoch": 4372} {"train_loss": -7.118873596191406, "global_step": 183655, "epoch": 4372} {"train_loss": -7.223105430603027, "global_step": 183656, "epoch": 4372} {"train_loss": -7.1411566734313965, "global_step": 183657, "epoch": 4372} {"train_loss": -7.107865333557129, "global_step": 183658, "epoch": 4372} {"train_loss": -7.133970737457275, "global_step": 183659, "epoch": 4372} {"train_loss": -7.287134170532227, "global_step": 183660, "epoch": 4372} {"train_loss": -7.038674354553223, "global_step": 183661, "epoch": 4372} {"train_loss": -7.109997749328613, "global_step": 183662, "epoch": 4372} {"train_loss": -7.233080863952637, "global_step": 183663, "epoch": 4372} {"train_loss": -7.130666732788086, "global_step": 183664, "epoch": 4372} {"train_loss": -7.133660918190365, "global_step": 183665, "epoch": 4372, "val_loss": 69485.875} {"train_loss": -7.095305442810059, "global_step": 183666, "epoch": 4373} {"train_loss": -7.110771179199219, "global_step": 183667, "epoch": 4373} {"train_loss": -7.00856876373291, "global_step": 183668, "epoch": 4373} {"train_loss": -7.166344165802002, "global_step": 183669, "epoch": 4373} {"train_loss": -7.06144380569458, "global_step": 183670, "epoch": 4373} {"train_loss": -7.099691867828369, "global_step": 183671, "epoch": 4373} {"train_loss": -7.111929893493652, "global_step": 183672, "epoch": 4373} {"train_loss": -7.177982807159424, "global_step": 183673, "epoch": 4373} {"train_loss": -7.146205902099609, "global_step": 183674, "epoch": 4373} {"train_loss": -7.046590805053711, "global_step": 183675, "epoch": 4373} {"train_loss": -7.166472434997559, "global_step": 183676, "epoch": 4373} {"train_loss": -7.1718902587890625, "global_step": 183677, "epoch": 4373} {"train_loss": -7.2969865798950195, "global_step": 183678, "epoch": 4373} {"train_loss": -7.006714820861816, "global_step": 183679, "epoch": 4373} {"train_loss": -7.114331245422363, "global_step": 183680, "epoch": 4373} {"train_loss": -7.241806983947754, "global_step": 183681, "epoch": 4373} {"train_loss": -6.991808891296387, "global_step": 183682, "epoch": 4373} {"train_loss": -7.146836280822754, "global_step": 183683, "epoch": 4373} {"train_loss": -7.154791355133057, "global_step": 183684, "epoch": 4373} {"train_loss": -7.133179187774658, "global_step": 183685, "epoch": 4373} {"train_loss": -7.1830220222473145, "global_step": 183686, "epoch": 4373} {"train_loss": -7.174574375152588, "global_step": 183687, "epoch": 4373} {"train_loss": -7.181950569152832, "global_step": 183688, "epoch": 4373} {"train_loss": -7.349308967590332, "global_step": 183689, "epoch": 4373} {"train_loss": -7.2270660400390625, "global_step": 183690, "epoch": 4373} {"train_loss": -7.181880474090576, "global_step": 183691, "epoch": 4373} {"train_loss": -7.239021301269531, "global_step": 183692, "epoch": 4373} {"train_loss": -7.156152725219727, "global_step": 183693, "epoch": 4373} {"train_loss": -7.171261310577393, "global_step": 183694, "epoch": 4373} {"train_loss": -7.260714054107666, "global_step": 183695, "epoch": 4373} {"train_loss": -7.208042144775391, "global_step": 183696, "epoch": 4373} {"train_loss": -7.180588722229004, "global_step": 183697, "epoch": 4373} {"train_loss": -7.1555681228637695, "global_step": 183698, "epoch": 4373} {"train_loss": -7.136848449707031, "global_step": 183699, "epoch": 4373} {"train_loss": -7.1616950035095215, "global_step": 183700, "epoch": 4373} {"train_loss": -7.116703033447266, "global_step": 183701, "epoch": 4373} {"train_loss": -7.107187747955322, "global_step": 183702, "epoch": 4373} {"train_loss": -7.003483772277832, "global_step": 183703, "epoch": 4373} {"train_loss": -7.069262504577637, "global_step": 183704, "epoch": 4373} {"train_loss": -7.10763692855835, "global_step": 183705, "epoch": 4373} {"train_loss": -7.1069793701171875, "global_step": 183706, "epoch": 4373} {"train_loss": -7.146234841573806, "global_step": 183707, "epoch": 4373, "val_loss": 69284.6171875} {"train_loss": -7.157612323760986, "global_step": 183708, "epoch": 4374} {"train_loss": -7.183450698852539, "global_step": 183709, "epoch": 4374} {"train_loss": -7.032886505126953, "global_step": 183710, "epoch": 4374} {"train_loss": -7.088710308074951, "global_step": 183711, "epoch": 4374} {"train_loss": -7.161704063415527, "global_step": 183712, "epoch": 4374} {"train_loss": -7.123666763305664, "global_step": 183713, "epoch": 4374} {"train_loss": -7.0620951652526855, "global_step": 183714, "epoch": 4374} {"train_loss": -7.206239700317383, "global_step": 183715, "epoch": 4374} {"train_loss": -7.153407096862793, "global_step": 183716, "epoch": 4374} {"train_loss": -7.191110610961914, "global_step": 183717, "epoch": 4374} {"train_loss": -7.058794021606445, "global_step": 183718, "epoch": 4374} {"train_loss": -6.966391563415527, "global_step": 183719, "epoch": 4374} {"train_loss": -7.124149322509766, "global_step": 183720, "epoch": 4374} {"train_loss": -6.997739315032959, "global_step": 183721, "epoch": 4374} {"train_loss": -6.968118667602539, "global_step": 183722, "epoch": 4374} {"train_loss": -6.97595739364624, "global_step": 183723, "epoch": 4374} {"train_loss": -7.0725016593933105, "global_step": 183724, "epoch": 4374} {"train_loss": -7.070466995239258, "global_step": 183725, "epoch": 4374} {"train_loss": -7.13908052444458, "global_step": 183726, "epoch": 4374} {"train_loss": -7.053402900695801, "global_step": 183727, "epoch": 4374} {"train_loss": -7.044117450714111, "global_step": 183728, "epoch": 4374} {"train_loss": -7.100561141967773, "global_step": 183729, "epoch": 4374} {"train_loss": -7.078487396240234, "global_step": 183730, "epoch": 4374} {"train_loss": -7.182192325592041, "global_step": 183731, "epoch": 4374} {"train_loss": -7.0284528732299805, "global_step": 183732, "epoch": 4374} {"train_loss": -7.104761600494385, "global_step": 183733, "epoch": 4374} {"train_loss": -7.069151878356934, "global_step": 183734, "epoch": 4374} {"train_loss": -7.056008338928223, "global_step": 183735, "epoch": 4374} {"train_loss": -7.130770683288574, "global_step": 183736, "epoch": 4374} {"train_loss": -7.131070137023926, "global_step": 183737, "epoch": 4374} {"train_loss": -7.024111747741699, "global_step": 183738, "epoch": 4374} {"train_loss": -6.988716125488281, "global_step": 183739, "epoch": 4374} {"train_loss": -7.114681243896484, "global_step": 183740, "epoch": 4374} {"train_loss": -7.068136215209961, "global_step": 183741, "epoch": 4374} {"train_loss": -7.076447010040283, "global_step": 183742, "epoch": 4374} {"train_loss": -7.090167999267578, "global_step": 183743, "epoch": 4374} {"train_loss": -7.145908355712891, "global_step": 183744, "epoch": 4374} {"train_loss": -7.119042873382568, "global_step": 183745, "epoch": 4374} {"train_loss": -7.195174217224121, "global_step": 183746, "epoch": 4374} {"train_loss": -7.22114372253418, "global_step": 183747, "epoch": 4374} {"train_loss": -7.234057903289795, "global_step": 183748, "epoch": 4374} {"train_loss": -7.100857530321393, "global_step": 183749, "epoch": 4374, "val_loss": 69364.875} {"train_loss": -7.100347518920898, "global_step": 183750, "epoch": 4375} {"train_loss": -7.13794469833374, "global_step": 183751, "epoch": 4375} {"train_loss": -7.1122002601623535, "global_step": 183752, "epoch": 4375} {"train_loss": -7.137650489807129, "global_step": 183753, "epoch": 4375} {"train_loss": -7.153810024261475, "global_step": 183754, "epoch": 4375} {"train_loss": -7.184746742248535, "global_step": 183755, "epoch": 4375} {"train_loss": -7.230942726135254, "global_step": 183756, "epoch": 4375} {"train_loss": -7.245822906494141, "global_step": 183757, "epoch": 4375} {"train_loss": -7.205496788024902, "global_step": 183758, "epoch": 4375} {"train_loss": -7.134270668029785, "global_step": 183759, "epoch": 4375} {"train_loss": -7.175586223602295, "global_step": 183760, "epoch": 4375} {"train_loss": -7.133184432983398, "global_step": 183761, "epoch": 4375} {"train_loss": -7.1814656257629395, "global_step": 183762, "epoch": 4375} {"train_loss": -7.13104248046875, "global_step": 183763, "epoch": 4375} {"train_loss": -7.150318145751953, "global_step": 183764, "epoch": 4375} {"train_loss": -7.200425148010254, "global_step": 183765, "epoch": 4375} {"train_loss": -7.196136474609375, "global_step": 183766, "epoch": 4375} {"train_loss": -7.197066307067871, "global_step": 183767, "epoch": 4375} {"train_loss": -7.174184799194336, "global_step": 183768, "epoch": 4375} {"train_loss": -7.13662052154541, "global_step": 183769, "epoch": 4375} {"train_loss": -7.028541564941406, "global_step": 183770, "epoch": 4375} {"train_loss": -7.160571098327637, "global_step": 183771, "epoch": 4375} {"train_loss": -7.172057151794434, "global_step": 183772, "epoch": 4375} {"train_loss": -7.169122219085693, "global_step": 183773, "epoch": 4375} {"train_loss": -7.1866559982299805, "global_step": 183774, "epoch": 4375} {"train_loss": -6.926086902618408, "global_step": 183775, "epoch": 4375} {"train_loss": -7.16105318069458, "global_step": 183776, "epoch": 4375} {"train_loss": -7.015038967132568, "global_step": 183777, "epoch": 4375} {"train_loss": -6.974211692810059, "global_step": 183778, "epoch": 4375} {"train_loss": -7.218620777130127, "global_step": 183779, "epoch": 4375} {"train_loss": -6.998928546905518, "global_step": 183780, "epoch": 4375} {"train_loss": -7.108428001403809, "global_step": 183781, "epoch": 4375} {"train_loss": -7.10789680480957, "global_step": 183782, "epoch": 4375} {"train_loss": -7.127077579498291, "global_step": 183783, "epoch": 4375} {"train_loss": -7.104055404663086, "global_step": 183784, "epoch": 4375} {"train_loss": -7.174837589263916, "global_step": 183785, "epoch": 4375} {"train_loss": -7.108701229095459, "global_step": 183786, "epoch": 4375} {"train_loss": -7.169122695922852, "global_step": 183787, "epoch": 4375} {"train_loss": -7.119340896606445, "global_step": 183788, "epoch": 4375} {"train_loss": -7.211010456085205, "global_step": 183789, "epoch": 4375} {"train_loss": -7.212136268615723, "global_step": 183790, "epoch": 4375} {"train_loss": -7.142028717767625, "global_step": 183791, "epoch": 4375, "val_loss": 69510.359375} {"train_loss": -7.22263240814209, "global_step": 183792, "epoch": 4376} {"train_loss": -7.098881721496582, "global_step": 183793, "epoch": 4376} {"train_loss": -7.12812614440918, "global_step": 183794, "epoch": 4376} {"train_loss": -7.20319128036499, "global_step": 183795, "epoch": 4376} {"train_loss": -7.05073356628418, "global_step": 183796, "epoch": 4376} {"train_loss": -7.123129844665527, "global_step": 183797, "epoch": 4376} {"train_loss": -7.159045696258545, "global_step": 183798, "epoch": 4376} {"train_loss": -7.1922383308410645, "global_step": 183799, "epoch": 4376} {"train_loss": -7.19492244720459, "global_step": 183800, "epoch": 4376} {"train_loss": -7.186802864074707, "global_step": 183801, "epoch": 4376} {"train_loss": -7.119260787963867, "global_step": 183802, "epoch": 4376} {"train_loss": -7.10895299911499, "global_step": 183803, "epoch": 4376} {"train_loss": -7.123472213745117, "global_step": 183804, "epoch": 4376} {"train_loss": -7.215949058532715, "global_step": 183805, "epoch": 4376} {"train_loss": -7.247529029846191, "global_step": 183806, "epoch": 4376} {"train_loss": -7.230842590332031, "global_step": 183807, "epoch": 4376} {"train_loss": -7.23723030090332, "global_step": 183808, "epoch": 4376} {"train_loss": -7.244073390960693, "global_step": 183809, "epoch": 4376} {"train_loss": -7.098413944244385, "global_step": 183810, "epoch": 4376} {"train_loss": -7.295181751251221, "global_step": 183811, "epoch": 4376} {"train_loss": -7.188785552978516, "global_step": 183812, "epoch": 4376} {"train_loss": -7.13917350769043, "global_step": 183813, "epoch": 4376} {"train_loss": -7.259810447692871, "global_step": 183814, "epoch": 4376} {"train_loss": -7.187441825866699, "global_step": 183815, "epoch": 4376} {"train_loss": -6.893686294555664, "global_step": 183816, "epoch": 4376} {"train_loss": -6.998980522155762, "global_step": 183817, "epoch": 4376} {"train_loss": -6.993078231811523, "global_step": 183818, "epoch": 4376} {"train_loss": -6.7841997146606445, "global_step": 183819, "epoch": 4376} {"train_loss": -7.08748722076416, "global_step": 183820, "epoch": 4376} {"train_loss": -6.9141764640808105, "global_step": 183821, "epoch": 4376} {"train_loss": -6.998649597167969, "global_step": 183822, "epoch": 4376} {"train_loss": -7.053633689880371, "global_step": 183823, "epoch": 4376} {"train_loss": -6.902297496795654, "global_step": 183824, "epoch": 4376} {"train_loss": -7.008584022521973, "global_step": 183825, "epoch": 4376} {"train_loss": -6.949835777282715, "global_step": 183826, "epoch": 4376} {"train_loss": -7.190728187561035, "global_step": 183827, "epoch": 4376} {"train_loss": -6.916982650756836, "global_step": 183828, "epoch": 4376} {"train_loss": -7.119912624359131, "global_step": 183829, "epoch": 4376} {"train_loss": -6.957712650299072, "global_step": 183830, "epoch": 4376} {"train_loss": -6.965311527252197, "global_step": 183831, "epoch": 4376} {"train_loss": -7.058145999908447, "global_step": 183832, "epoch": 4376} {"train_loss": -7.097115403129941, "global_step": 183833, "epoch": 4376, "val_loss": 69460.0} {"train_loss": -7.184632301330566, "global_step": 183834, "epoch": 4377} {"train_loss": -7.147730350494385, "global_step": 183835, "epoch": 4377} {"train_loss": -7.05794095993042, "global_step": 183836, "epoch": 4377} {"train_loss": -7.056525707244873, "global_step": 183837, "epoch": 4377} {"train_loss": -7.110617637634277, "global_step": 183838, "epoch": 4377} {"train_loss": -7.152386665344238, "global_step": 183839, "epoch": 4377} {"train_loss": -7.1907877922058105, "global_step": 183840, "epoch": 4377} {"train_loss": -7.0355730056762695, "global_step": 183841, "epoch": 4377} {"train_loss": -7.0820817947387695, "global_step": 183842, "epoch": 4377} {"train_loss": -7.216657638549805, "global_step": 183843, "epoch": 4377} {"train_loss": -7.20902156829834, "global_step": 183844, "epoch": 4377} {"train_loss": -7.093113422393799, "global_step": 183845, "epoch": 4377} {"train_loss": -7.140525817871094, "global_step": 183846, "epoch": 4377} {"train_loss": -7.318702697753906, "global_step": 183847, "epoch": 4377} {"train_loss": -7.126159191131592, "global_step": 183848, "epoch": 4377} {"train_loss": -7.104884147644043, "global_step": 183849, "epoch": 4377} {"train_loss": -7.152215003967285, "global_step": 183850, "epoch": 4377} {"train_loss": -7.2619099617004395, "global_step": 183851, "epoch": 4377} {"train_loss": -7.108013153076172, "global_step": 183852, "epoch": 4377} {"train_loss": -7.159684181213379, "global_step": 183853, "epoch": 4377} {"train_loss": -7.108222961425781, "global_step": 183854, "epoch": 4377} {"train_loss": -7.113238334655762, "global_step": 183855, "epoch": 4377} {"train_loss": -7.162222385406494, "global_step": 183856, "epoch": 4377} {"train_loss": -7.201942443847656, "global_step": 183857, "epoch": 4377} {"train_loss": -7.150867462158203, "global_step": 183858, "epoch": 4377} {"train_loss": -7.103537559509277, "global_step": 183859, "epoch": 4377} {"train_loss": -7.225578784942627, "global_step": 183860, "epoch": 4377} {"train_loss": -7.235444068908691, "global_step": 183861, "epoch": 4377} {"train_loss": -7.183697700500488, "global_step": 183862, "epoch": 4377} {"train_loss": -7.272981643676758, "global_step": 183863, "epoch": 4377} {"train_loss": -7.195204734802246, "global_step": 183864, "epoch": 4377} {"train_loss": -7.152613639831543, "global_step": 183865, "epoch": 4377} {"train_loss": -7.193621635437012, "global_step": 183866, "epoch": 4377} {"train_loss": -7.115380764007568, "global_step": 183867, "epoch": 4377} {"train_loss": -7.204555034637451, "global_step": 183868, "epoch": 4377} {"train_loss": -7.100869178771973, "global_step": 183869, "epoch": 4377} {"train_loss": -7.2596564292907715, "global_step": 183870, "epoch": 4377} {"train_loss": -7.090836524963379, "global_step": 183871, "epoch": 4377} {"train_loss": -7.167401313781738, "global_step": 183872, "epoch": 4377} {"train_loss": -7.093057632446289, "global_step": 183873, "epoch": 4377} {"train_loss": -7.036041259765625, "global_step": 183874, "epoch": 4377} {"train_loss": -7.151050363268171, "global_step": 183875, "epoch": 4377, "val_loss": 69523.53125} {"train_loss": -7.09716796875, "global_step": 183876, "epoch": 4378} {"train_loss": -6.995988368988037, "global_step": 183877, "epoch": 4378} {"train_loss": -7.08200740814209, "global_step": 183878, "epoch": 4378} {"train_loss": -7.1103010177612305, "global_step": 183879, "epoch": 4378} {"train_loss": -7.095972061157227, "global_step": 183880, "epoch": 4378} {"train_loss": -6.994503021240234, "global_step": 183881, "epoch": 4378} {"train_loss": -6.928397178649902, "global_step": 183882, "epoch": 4378} {"train_loss": -7.12319278717041, "global_step": 183883, "epoch": 4378} {"train_loss": -7.071746826171875, "global_step": 183884, "epoch": 4378} {"train_loss": -7.051955223083496, "global_step": 183885, "epoch": 4378} {"train_loss": -7.2094926834106445, "global_step": 183886, "epoch": 4378} {"train_loss": -7.041215896606445, "global_step": 183887, "epoch": 4378} {"train_loss": -7.181100845336914, "global_step": 183888, "epoch": 4378} {"train_loss": -7.026717185974121, "global_step": 183889, "epoch": 4378} {"train_loss": -7.052973747253418, "global_step": 183890, "epoch": 4378} {"train_loss": -7.0492777824401855, "global_step": 183891, "epoch": 4378} {"train_loss": -7.052969932556152, "global_step": 183892, "epoch": 4378} {"train_loss": -6.961026191711426, "global_step": 183893, "epoch": 4378} {"train_loss": -7.058943748474121, "global_step": 183894, "epoch": 4378} {"train_loss": -7.077247619628906, "global_step": 183895, "epoch": 4378} {"train_loss": -7.191364765167236, "global_step": 183896, "epoch": 4378} {"train_loss": -7.0441436767578125, "global_step": 183897, "epoch": 4378} {"train_loss": -7.1518096923828125, "global_step": 183898, "epoch": 4378} {"train_loss": -7.165849685668945, "global_step": 183899, "epoch": 4378} {"train_loss": -7.094514846801758, "global_step": 183900, "epoch": 4378} {"train_loss": -7.014928817749023, "global_step": 183901, "epoch": 4378} {"train_loss": -7.154563903808594, "global_step": 183902, "epoch": 4378} {"train_loss": -7.176900386810303, "global_step": 183903, "epoch": 4378} {"train_loss": -7.144877910614014, "global_step": 183904, "epoch": 4378} {"train_loss": -7.136239051818848, "global_step": 183905, "epoch": 4378} {"train_loss": -7.176386833190918, "global_step": 183906, "epoch": 4378} {"train_loss": -7.1028289794921875, "global_step": 183907, "epoch": 4378} {"train_loss": -7.134909629821777, "global_step": 183908, "epoch": 4378} {"train_loss": -7.2665581703186035, "global_step": 183909, "epoch": 4378} {"train_loss": -7.0590362548828125, "global_step": 183910, "epoch": 4378} {"train_loss": -7.136307239532471, "global_step": 183911, "epoch": 4378} {"train_loss": -7.229942321777344, "global_step": 183912, "epoch": 4378} {"train_loss": -7.155040740966797, "global_step": 183913, "epoch": 4378} {"train_loss": -7.1490583419799805, "global_step": 183914, "epoch": 4378} {"train_loss": -7.04368782043457, "global_step": 183915, "epoch": 4378} {"train_loss": -7.191038131713867, "global_step": 183916, "epoch": 4378} {"train_loss": -7.103247358685448, "global_step": 183917, "epoch": 4378, "val_loss": 69445.7265625} {"train_loss": -7.185644149780273, "global_step": 183918, "epoch": 4379} {"train_loss": -7.132701396942139, "global_step": 183919, "epoch": 4379} {"train_loss": -7.1357245445251465, "global_step": 183920, "epoch": 4379} {"train_loss": -7.211809158325195, "global_step": 183921, "epoch": 4379} {"train_loss": -7.3071088790893555, "global_step": 183922, "epoch": 4379} {"train_loss": -7.1353840827941895, "global_step": 183923, "epoch": 4379} {"train_loss": -7.277427673339844, "global_step": 183924, "epoch": 4379} {"train_loss": -7.212621688842773, "global_step": 183925, "epoch": 4379} {"train_loss": -7.286470890045166, "global_step": 183926, "epoch": 4379} {"train_loss": -7.236870765686035, "global_step": 183927, "epoch": 4379} {"train_loss": -7.135656356811523, "global_step": 183928, "epoch": 4379} {"train_loss": -7.193915367126465, "global_step": 183929, "epoch": 4379} {"train_loss": -7.299469470977783, "global_step": 183930, "epoch": 4379} {"train_loss": -7.093113422393799, "global_step": 183931, "epoch": 4379} {"train_loss": -7.204987049102783, "global_step": 183932, "epoch": 4379} {"train_loss": -7.229804515838623, "global_step": 183933, "epoch": 4379} {"train_loss": -7.0436320304870605, "global_step": 183934, "epoch": 4379} {"train_loss": -7.076567649841309, "global_step": 183935, "epoch": 4379} {"train_loss": -7.082135200500488, "global_step": 183936, "epoch": 4379} {"train_loss": -7.021468162536621, "global_step": 183937, "epoch": 4379} {"train_loss": -7.348193168640137, "global_step": 183938, "epoch": 4379} {"train_loss": -7.086868762969971, "global_step": 183939, "epoch": 4379} {"train_loss": -7.06547737121582, "global_step": 183940, "epoch": 4379} {"train_loss": -7.194364070892334, "global_step": 183941, "epoch": 4379} {"train_loss": -7.177502632141113, "global_step": 183942, "epoch": 4379} {"train_loss": -7.1115241050720215, "global_step": 183943, "epoch": 4379} {"train_loss": -7.101639270782471, "global_step": 183944, "epoch": 4379} {"train_loss": -7.1866865158081055, "global_step": 183945, "epoch": 4379} {"train_loss": -7.176178455352783, "global_step": 183946, "epoch": 4379} {"train_loss": -7.060697555541992, "global_step": 183947, "epoch": 4379} {"train_loss": -7.124688148498535, "global_step": 183948, "epoch": 4379} {"train_loss": -7.085829257965088, "global_step": 183949, "epoch": 4379} {"train_loss": -7.229126930236816, "global_step": 183950, "epoch": 4379} {"train_loss": -7.2183098793029785, "global_step": 183951, "epoch": 4379} {"train_loss": -7.076821327209473, "global_step": 183952, "epoch": 4379} {"train_loss": -7.113855361938477, "global_step": 183953, "epoch": 4379} {"train_loss": -7.1512556076049805, "global_step": 183954, "epoch": 4379} {"train_loss": -7.232295036315918, "global_step": 183955, "epoch": 4379} {"train_loss": -7.130247116088867, "global_step": 183956, "epoch": 4379} {"train_loss": -7.241932392120361, "global_step": 183957, "epoch": 4379} {"train_loss": -7.138187885284424, "global_step": 183958, "epoch": 4379} {"train_loss": -7.1633124351501465, "global_step": 183959, "epoch": 4379, "val_loss": 69418.453125} {"train_loss": -7.200068950653076, "global_step": 183960, "epoch": 4380} {"train_loss": -7.226842880249023, "global_step": 183961, "epoch": 4380} {"train_loss": -7.270347595214844, "global_step": 183962, "epoch": 4380} {"train_loss": -7.23737907409668, "global_step": 183963, "epoch": 4380} {"train_loss": -7.093608856201172, "global_step": 183964, "epoch": 4380} {"train_loss": -7.1736741065979, "global_step": 183965, "epoch": 4380} {"train_loss": -7.249642372131348, "global_step": 183966, "epoch": 4380} {"train_loss": -7.344692230224609, "global_step": 183967, "epoch": 4380} {"train_loss": -7.258578300476074, "global_step": 183968, "epoch": 4380} {"train_loss": -7.151125907897949, "global_step": 183969, "epoch": 4380} {"train_loss": -7.244515895843506, "global_step": 183970, "epoch": 4380} {"train_loss": -7.185755729675293, "global_step": 183971, "epoch": 4380} {"train_loss": -7.1107611656188965, "global_step": 183972, "epoch": 4380} {"train_loss": -7.085480690002441, "global_step": 183973, "epoch": 4380} {"train_loss": -7.170348644256592, "global_step": 183974, "epoch": 4380} {"train_loss": -7.136247634887695, "global_step": 183975, "epoch": 4380} {"train_loss": -7.1772871017456055, "global_step": 183976, "epoch": 4380} {"train_loss": -7.227377891540527, "global_step": 183977, "epoch": 4380} {"train_loss": -7.170238494873047, "global_step": 183978, "epoch": 4380} {"train_loss": -7.028929710388184, "global_step": 183979, "epoch": 4380} {"train_loss": -7.140078544616699, "global_step": 183980, "epoch": 4380} {"train_loss": -6.992112159729004, "global_step": 183981, "epoch": 4380} {"train_loss": -7.0831756591796875, "global_step": 183982, "epoch": 4380} {"train_loss": -7.180359840393066, "global_step": 183983, "epoch": 4380} {"train_loss": -7.079225063323975, "global_step": 183984, "epoch": 4380} {"train_loss": -7.142483711242676, "global_step": 183985, "epoch": 4380} {"train_loss": -7.0543060302734375, "global_step": 183986, "epoch": 4380} {"train_loss": -7.005470275878906, "global_step": 183987, "epoch": 4380} {"train_loss": -7.053004264831543, "global_step": 183988, "epoch": 4380} {"train_loss": -6.91615104675293, "global_step": 183989, "epoch": 4380} {"train_loss": -7.199182510375977, "global_step": 183990, "epoch": 4380} {"train_loss": -6.972136974334717, "global_step": 183991, "epoch": 4380} {"train_loss": -6.928853988647461, "global_step": 183992, "epoch": 4380} {"train_loss": -7.072248935699463, "global_step": 183993, "epoch": 4380} {"train_loss": -6.9706854820251465, "global_step": 183994, "epoch": 4380} {"train_loss": -6.958040237426758, "global_step": 183995, "epoch": 4380} {"train_loss": -7.0132551193237305, "global_step": 183996, "epoch": 4380} {"train_loss": -7.067831039428711, "global_step": 183997, "epoch": 4380} {"train_loss": -7.00419807434082, "global_step": 183998, "epoch": 4380} {"train_loss": -6.836865425109863, "global_step": 183999, "epoch": 4380} {"train_loss": -7.065323829650879, "global_step": 184000, "epoch": 4380} {"train_loss": -7.106926055181594, "global_step": 184001, "epoch": 4380, "val_loss": 69388.6640625} {"train_loss": -7.052935600280762, "global_step": 184002, "epoch": 4381} {"train_loss": -7.04472541809082, "global_step": 184003, "epoch": 4381} {"train_loss": -7.192743301391602, "global_step": 184004, "epoch": 4381} {"train_loss": -7.043869972229004, "global_step": 184005, "epoch": 4381} {"train_loss": -7.166651248931885, "global_step": 184006, "epoch": 4381} {"train_loss": -7.001289367675781, "global_step": 184007, "epoch": 4381} {"train_loss": -7.0193772315979, "global_step": 184008, "epoch": 4381} {"train_loss": -7.095564365386963, "global_step": 184009, "epoch": 4381} {"train_loss": -7.094340801239014, "global_step": 184010, "epoch": 4381} {"train_loss": -7.154719352722168, "global_step": 184011, "epoch": 4381} {"train_loss": -7.004831314086914, "global_step": 184012, "epoch": 4381} {"train_loss": -7.109842777252197, "global_step": 184013, "epoch": 4381} {"train_loss": -7.087597846984863, "global_step": 184014, "epoch": 4381} {"train_loss": -7.06083345413208, "global_step": 184015, "epoch": 4381} {"train_loss": -7.072381973266602, "global_step": 184016, "epoch": 4381} {"train_loss": -7.07128381729126, "global_step": 184017, "epoch": 4381} {"train_loss": -7.0386152267456055, "global_step": 184018, "epoch": 4381} {"train_loss": -7.221137523651123, "global_step": 184019, "epoch": 4381} {"train_loss": -7.117743492126465, "global_step": 184020, "epoch": 4381} {"train_loss": -7.253352165222168, "global_step": 184021, "epoch": 4381} {"train_loss": -7.074342727661133, "global_step": 184022, "epoch": 4381} {"train_loss": -7.110088348388672, "global_step": 184023, "epoch": 4381} {"train_loss": -7.176693439483643, "global_step": 184024, "epoch": 4381} {"train_loss": -7.154671669006348, "global_step": 184025, "epoch": 4381} {"train_loss": -7.132718563079834, "global_step": 184026, "epoch": 4381} {"train_loss": -7.185403347015381, "global_step": 184027, "epoch": 4381} {"train_loss": -7.246105670928955, "global_step": 184028, "epoch": 4381} {"train_loss": -7.189467430114746, "global_step": 184029, "epoch": 4381} {"train_loss": -7.142027854919434, "global_step": 184030, "epoch": 4381} {"train_loss": -7.201333999633789, "global_step": 184031, "epoch": 4381} {"train_loss": -7.145626544952393, "global_step": 184032, "epoch": 4381} {"train_loss": -7.127179145812988, "global_step": 184033, "epoch": 4381} {"train_loss": -7.074731826782227, "global_step": 184034, "epoch": 4381} {"train_loss": -6.9636335372924805, "global_step": 184035, "epoch": 4381} {"train_loss": -7.197627067565918, "global_step": 184036, "epoch": 4381} {"train_loss": -7.1147284507751465, "global_step": 184037, "epoch": 4381} {"train_loss": -7.086332321166992, "global_step": 184038, "epoch": 4381} {"train_loss": -7.2408127784729, "global_step": 184039, "epoch": 4381} {"train_loss": -7.077963829040527, "global_step": 184040, "epoch": 4381} {"train_loss": -7.006009578704834, "global_step": 184041, "epoch": 4381} {"train_loss": -7.123564720153809, "global_step": 184042, "epoch": 4381} {"train_loss": -7.112487679436093, "global_step": 184043, "epoch": 4381, "val_loss": 69370.171875} {"train_loss": -7.078567028045654, "global_step": 184044, "epoch": 4382} {"train_loss": -7.016149520874023, "global_step": 184045, "epoch": 4382} {"train_loss": -7.226311683654785, "global_step": 184046, "epoch": 4382} {"train_loss": -7.031760215759277, "global_step": 184047, "epoch": 4382} {"train_loss": -7.069324970245361, "global_step": 184048, "epoch": 4382} {"train_loss": -7.14912223815918, "global_step": 184049, "epoch": 4382} {"train_loss": -6.992559432983398, "global_step": 184050, "epoch": 4382} {"train_loss": -7.021557807922363, "global_step": 184051, "epoch": 4382} {"train_loss": -7.078960418701172, "global_step": 184052, "epoch": 4382} {"train_loss": -7.14720344543457, "global_step": 184053, "epoch": 4382} {"train_loss": -7.217487812042236, "global_step": 184054, "epoch": 4382} {"train_loss": -7.154372692108154, "global_step": 184055, "epoch": 4382} {"train_loss": -7.159669876098633, "global_step": 184056, "epoch": 4382} {"train_loss": -7.138596534729004, "global_step": 184057, "epoch": 4382} {"train_loss": -7.085441589355469, "global_step": 184058, "epoch": 4382} {"train_loss": -7.1683759689331055, "global_step": 184059, "epoch": 4382} {"train_loss": -7.127513408660889, "global_step": 184060, "epoch": 4382} {"train_loss": -7.213802337646484, "global_step": 184061, "epoch": 4382} {"train_loss": -7.158051013946533, "global_step": 184062, "epoch": 4382} {"train_loss": -7.202124118804932, "global_step": 184063, "epoch": 4382} {"train_loss": -7.172512531280518, "global_step": 184064, "epoch": 4382} {"train_loss": -7.215119361877441, "global_step": 184065, "epoch": 4382} {"train_loss": -7.127573490142822, "global_step": 184066, "epoch": 4382} {"train_loss": -7.13983154296875, "global_step": 184067, "epoch": 4382} {"train_loss": -7.19551420211792, "global_step": 184068, "epoch": 4382} {"train_loss": -7.133303642272949, "global_step": 184069, "epoch": 4382} {"train_loss": -7.026312828063965, "global_step": 184070, "epoch": 4382} {"train_loss": -7.1456804275512695, "global_step": 184071, "epoch": 4382} {"train_loss": -7.161498546600342, "global_step": 184072, "epoch": 4382} {"train_loss": -7.151818752288818, "global_step": 184073, "epoch": 4382} {"train_loss": -7.070779800415039, "global_step": 184074, "epoch": 4382} {"train_loss": -7.036130428314209, "global_step": 184075, "epoch": 4382} {"train_loss": -7.112882614135742, "global_step": 184076, "epoch": 4382} {"train_loss": -7.060070037841797, "global_step": 184077, "epoch": 4382} {"train_loss": -7.079556465148926, "global_step": 184078, "epoch": 4382} {"train_loss": -7.100505352020264, "global_step": 184079, "epoch": 4382} {"train_loss": -7.162364959716797, "global_step": 184080, "epoch": 4382} {"train_loss": -7.093809127807617, "global_step": 184081, "epoch": 4382} {"train_loss": -7.2273335456848145, "global_step": 184082, "epoch": 4382} {"train_loss": -7.060685634613037, "global_step": 184083, "epoch": 4382} {"train_loss": -7.0855302810668945, "global_step": 184084, "epoch": 4382} {"train_loss": -7.1185609840211415, "global_step": 184085, "epoch": 4382, "val_loss": 69418.8671875} {"train_loss": -7.161357402801514, "global_step": 184086, "epoch": 4383} {"train_loss": -7.319120407104492, "global_step": 184087, "epoch": 4383} {"train_loss": -7.238600254058838, "global_step": 184088, "epoch": 4383} {"train_loss": -7.152433395385742, "global_step": 184089, "epoch": 4383} {"train_loss": -7.142155170440674, "global_step": 184090, "epoch": 4383} {"train_loss": -7.169835090637207, "global_step": 184091, "epoch": 4383} {"train_loss": -7.181877613067627, "global_step": 184092, "epoch": 4383} {"train_loss": -7.114959716796875, "global_step": 184093, "epoch": 4383} {"train_loss": -7.065847873687744, "global_step": 184094, "epoch": 4383} {"train_loss": -7.1044721603393555, "global_step": 184095, "epoch": 4383} {"train_loss": -7.066393852233887, "global_step": 184096, "epoch": 4383} {"train_loss": -7.105716228485107, "global_step": 184097, "epoch": 4383} {"train_loss": -7.124631881713867, "global_step": 184098, "epoch": 4383} {"train_loss": -7.054872035980225, "global_step": 184099, "epoch": 4383} {"train_loss": -7.154993057250977, "global_step": 184100, "epoch": 4383} {"train_loss": -7.114779472351074, "global_step": 184101, "epoch": 4383} {"train_loss": -7.034482955932617, "global_step": 184102, "epoch": 4383} {"train_loss": -7.098219394683838, "global_step": 184103, "epoch": 4383} {"train_loss": -7.122342586517334, "global_step": 184104, "epoch": 4383} {"train_loss": -7.100860118865967, "global_step": 184105, "epoch": 4383} {"train_loss": -7.085685729980469, "global_step": 184106, "epoch": 4383} {"train_loss": -7.115119934082031, "global_step": 184107, "epoch": 4383} {"train_loss": -7.050127029418945, "global_step": 184108, "epoch": 4383} {"train_loss": -7.071138381958008, "global_step": 184109, "epoch": 4383} {"train_loss": -7.115203857421875, "global_step": 184110, "epoch": 4383} {"train_loss": -7.109828948974609, "global_step": 184111, "epoch": 4383} {"train_loss": -7.0938591957092285, "global_step": 184112, "epoch": 4383} {"train_loss": -7.084300518035889, "global_step": 184113, "epoch": 4383} {"train_loss": -7.140423774719238, "global_step": 184114, "epoch": 4383} {"train_loss": -7.117281436920166, "global_step": 184115, "epoch": 4383} {"train_loss": -7.147546291351318, "global_step": 184116, "epoch": 4383} {"train_loss": -7.150180816650391, "global_step": 184117, "epoch": 4383} {"train_loss": -7.280698776245117, "global_step": 184118, "epoch": 4383} {"train_loss": -7.184022903442383, "global_step": 184119, "epoch": 4383} {"train_loss": -7.072832107543945, "global_step": 184120, "epoch": 4383} {"train_loss": -7.211888313293457, "global_step": 184121, "epoch": 4383} {"train_loss": -7.0918073654174805, "global_step": 184122, "epoch": 4383} {"train_loss": -7.086400985717773, "global_step": 184123, "epoch": 4383} {"train_loss": -7.166338920593262, "global_step": 184124, "epoch": 4383} {"train_loss": -7.166094779968262, "global_step": 184125, "epoch": 4383} {"train_loss": -7.08425760269165, "global_step": 184126, "epoch": 4383} {"train_loss": -7.124991280691964, "global_step": 184127, "epoch": 4383, "val_loss": 69332.7734375} {"train_loss": -7.1018805503845215, "global_step": 184128, "epoch": 4384} {"train_loss": -6.985634803771973, "global_step": 184129, "epoch": 4384} {"train_loss": -7.077703475952148, "global_step": 184130, "epoch": 4384} {"train_loss": -7.012758731842041, "global_step": 184131, "epoch": 4384} {"train_loss": -6.953736305236816, "global_step": 184132, "epoch": 4384} {"train_loss": -7.112907409667969, "global_step": 184133, "epoch": 4384} {"train_loss": -6.940490245819092, "global_step": 184134, "epoch": 4384} {"train_loss": -7.10383939743042, "global_step": 184135, "epoch": 4384} {"train_loss": -7.1185760498046875, "global_step": 184136, "epoch": 4384} {"train_loss": -7.034864902496338, "global_step": 184137, "epoch": 4384} {"train_loss": -7.083578109741211, "global_step": 184138, "epoch": 4384} {"train_loss": -6.882711410522461, "global_step": 184139, "epoch": 4384} {"train_loss": -7.132694244384766, "global_step": 184140, "epoch": 4384} {"train_loss": -7.0161848068237305, "global_step": 184141, "epoch": 4384} {"train_loss": -7.006808280944824, "global_step": 184142, "epoch": 4384} {"train_loss": -7.017178535461426, "global_step": 184143, "epoch": 4384} {"train_loss": -6.955049514770508, "global_step": 184144, "epoch": 4384} {"train_loss": -7.188021659851074, "global_step": 184145, "epoch": 4384} {"train_loss": -6.9309539794921875, "global_step": 184146, "epoch": 4384} {"train_loss": -7.091375827789307, "global_step": 184147, "epoch": 4384} {"train_loss": -7.14341926574707, "global_step": 184148, "epoch": 4384} {"train_loss": -6.99100399017334, "global_step": 184149, "epoch": 4384} {"train_loss": -7.097910404205322, "global_step": 184150, "epoch": 4384} {"train_loss": -7.044703006744385, "global_step": 184151, "epoch": 4384} {"train_loss": -6.963006973266602, "global_step": 184152, "epoch": 4384} {"train_loss": -7.036599159240723, "global_step": 184153, "epoch": 4384} {"train_loss": -7.145992279052734, "global_step": 184154, "epoch": 4384} {"train_loss": -7.054572105407715, "global_step": 184155, "epoch": 4384} {"train_loss": -7.071756839752197, "global_step": 184156, "epoch": 4384} {"train_loss": -7.093059062957764, "global_step": 184157, "epoch": 4384} {"train_loss": -6.964169979095459, "global_step": 184158, "epoch": 4384} {"train_loss": -7.030570030212402, "global_step": 184159, "epoch": 4384} {"train_loss": -7.075634479522705, "global_step": 184160, "epoch": 4384} {"train_loss": -7.0055155754089355, "global_step": 184161, "epoch": 4384} {"train_loss": -7.094603538513184, "global_step": 184162, "epoch": 4384} {"train_loss": -7.0994181632995605, "global_step": 184163, "epoch": 4384} {"train_loss": -7.094295501708984, "global_step": 184164, "epoch": 4384} {"train_loss": -7.146045207977295, "global_step": 184165, "epoch": 4384} {"train_loss": -7.120960235595703, "global_step": 184166, "epoch": 4384} {"train_loss": -7.0554680824279785, "global_step": 184167, "epoch": 4384} {"train_loss": -7.124429225921631, "global_step": 184168, "epoch": 4384} {"train_loss": -7.054289023081462, "global_step": 184169, "epoch": 4384, "val_loss": 69239.8203125} {"train_loss": -7.232419013977051, "global_step": 184170, "epoch": 4385} {"train_loss": -7.0574951171875, "global_step": 184171, "epoch": 4385} {"train_loss": -7.259345054626465, "global_step": 184172, "epoch": 4385} {"train_loss": -7.0234832763671875, "global_step": 184173, "epoch": 4385} {"train_loss": -7.069792747497559, "global_step": 184174, "epoch": 4385} {"train_loss": -7.178656578063965, "global_step": 184175, "epoch": 4385} {"train_loss": -6.987248420715332, "global_step": 184176, "epoch": 4385} {"train_loss": -7.136787414550781, "global_step": 184177, "epoch": 4385} {"train_loss": -7.080924034118652, "global_step": 184178, "epoch": 4385} {"train_loss": -7.058398246765137, "global_step": 184179, "epoch": 4385} {"train_loss": -7.071892738342285, "global_step": 184180, "epoch": 4385} {"train_loss": -7.0904717445373535, "global_step": 184181, "epoch": 4385} {"train_loss": -6.970178604125977, "global_step": 184182, "epoch": 4385} {"train_loss": -7.018294334411621, "global_step": 184183, "epoch": 4385} {"train_loss": -7.020208835601807, "global_step": 184184, "epoch": 4385} {"train_loss": -7.042412281036377, "global_step": 184185, "epoch": 4385} {"train_loss": -7.139437675476074, "global_step": 184186, "epoch": 4385} {"train_loss": -7.082543849945068, "global_step": 184187, "epoch": 4385} {"train_loss": -7.241085052490234, "global_step": 184188, "epoch": 4385} {"train_loss": -7.237644195556641, "global_step": 184189, "epoch": 4385} {"train_loss": -7.118149280548096, "global_step": 184190, "epoch": 4385} {"train_loss": -7.181919097900391, "global_step": 184191, "epoch": 4385} {"train_loss": -7.02458381652832, "global_step": 184192, "epoch": 4385} {"train_loss": -7.188714504241943, "global_step": 184193, "epoch": 4385} {"train_loss": -7.224435806274414, "global_step": 184194, "epoch": 4385} {"train_loss": -7.177618980407715, "global_step": 184195, "epoch": 4385} {"train_loss": -7.207042694091797, "global_step": 184196, "epoch": 4385} {"train_loss": -7.183023452758789, "global_step": 184197, "epoch": 4385} {"train_loss": -7.153457164764404, "global_step": 184198, "epoch": 4385} {"train_loss": -7.108609199523926, "global_step": 184199, "epoch": 4385} {"train_loss": -7.195001602172852, "global_step": 184200, "epoch": 4385} {"train_loss": -7.171645164489746, "global_step": 184201, "epoch": 4385} {"train_loss": -7.283395767211914, "global_step": 184202, "epoch": 4385} {"train_loss": -7.206785202026367, "global_step": 184203, "epoch": 4385} {"train_loss": -7.098468780517578, "global_step": 184204, "epoch": 4385} {"train_loss": -7.240001201629639, "global_step": 184205, "epoch": 4385} {"train_loss": -7.1561174392700195, "global_step": 184206, "epoch": 4385} {"train_loss": -7.093025207519531, "global_step": 184207, "epoch": 4385} {"train_loss": -7.177623748779297, "global_step": 184208, "epoch": 4385} {"train_loss": -7.20456600189209, "global_step": 184209, "epoch": 4385} {"train_loss": -7.104957580566406, "global_step": 184210, "epoch": 4385} {"train_loss": -7.130761521203177, "global_step": 184211, "epoch": 4385, "val_loss": 69454.8203125} {"train_loss": -7.231732368469238, "global_step": 184212, "epoch": 4386} {"train_loss": -7.18072509765625, "global_step": 184213, "epoch": 4386} {"train_loss": -7.200566291809082, "global_step": 184214, "epoch": 4386} {"train_loss": -7.213354110717773, "global_step": 184215, "epoch": 4386} {"train_loss": -7.290848731994629, "global_step": 184216, "epoch": 4386} {"train_loss": -7.197659492492676, "global_step": 184217, "epoch": 4386} {"train_loss": -7.157813549041748, "global_step": 184218, "epoch": 4386} {"train_loss": -7.154499053955078, "global_step": 184219, "epoch": 4386} {"train_loss": -7.195928573608398, "global_step": 184220, "epoch": 4386} {"train_loss": -7.176684379577637, "global_step": 184221, "epoch": 4386} {"train_loss": -7.161043167114258, "global_step": 184222, "epoch": 4386} {"train_loss": -7.211190700531006, "global_step": 184223, "epoch": 4386} {"train_loss": -7.221628665924072, "global_step": 184224, "epoch": 4386} {"train_loss": -7.080988883972168, "global_step": 184225, "epoch": 4386} {"train_loss": -7.225879669189453, "global_step": 184226, "epoch": 4386} {"train_loss": -7.27764368057251, "global_step": 184227, "epoch": 4386} {"train_loss": -7.1691060066223145, "global_step": 184228, "epoch": 4386} {"train_loss": -7.257390022277832, "global_step": 184229, "epoch": 4386} {"train_loss": -7.1948442459106445, "global_step": 184230, "epoch": 4386} {"train_loss": -7.018496990203857, "global_step": 184231, "epoch": 4386} {"train_loss": -7.197212219238281, "global_step": 184232, "epoch": 4386} {"train_loss": -7.270057678222656, "global_step": 184233, "epoch": 4386} {"train_loss": -7.0639214515686035, "global_step": 184234, "epoch": 4386} {"train_loss": -7.1468305587768555, "global_step": 184235, "epoch": 4386} {"train_loss": -7.108899116516113, "global_step": 184236, "epoch": 4386} {"train_loss": -7.112739086151123, "global_step": 184237, "epoch": 4386} {"train_loss": -7.015697479248047, "global_step": 184238, "epoch": 4386} {"train_loss": -7.278065204620361, "global_step": 184239, "epoch": 4386} {"train_loss": -7.089614391326904, "global_step": 184240, "epoch": 4386} {"train_loss": -7.082287311553955, "global_step": 184241, "epoch": 4386} {"train_loss": -7.117439270019531, "global_step": 184242, "epoch": 4386} {"train_loss": -6.984637260437012, "global_step": 184243, "epoch": 4386} {"train_loss": -7.023355484008789, "global_step": 184244, "epoch": 4386} {"train_loss": -7.2539567947387695, "global_step": 184245, "epoch": 4386} {"train_loss": -7.1039605140686035, "global_step": 184246, "epoch": 4386} {"train_loss": -7.142941474914551, "global_step": 184247, "epoch": 4386} {"train_loss": -7.158927917480469, "global_step": 184248, "epoch": 4386} {"train_loss": -7.052620887756348, "global_step": 184249, "epoch": 4386} {"train_loss": -7.163106918334961, "global_step": 184250, "epoch": 4386} {"train_loss": -7.031845569610596, "global_step": 184251, "epoch": 4386} {"train_loss": -7.183619022369385, "global_step": 184252, "epoch": 4386} {"train_loss": -7.156773964564006, "global_step": 184253, "epoch": 4386, "val_loss": 69563.9921875} {"train_loss": -7.110154628753662, "global_step": 184254, "epoch": 4387} {"train_loss": -7.1977643966674805, "global_step": 184255, "epoch": 4387} {"train_loss": -6.937399387359619, "global_step": 184256, "epoch": 4387} {"train_loss": -7.047138214111328, "global_step": 184257, "epoch": 4387} {"train_loss": -7.139939308166504, "global_step": 184258, "epoch": 4387} {"train_loss": -7.0600433349609375, "global_step": 184259, "epoch": 4387} {"train_loss": -7.1392059326171875, "global_step": 184260, "epoch": 4387} {"train_loss": -7.160953044891357, "global_step": 184261, "epoch": 4387} {"train_loss": -7.110921859741211, "global_step": 184262, "epoch": 4387} {"train_loss": -7.023619651794434, "global_step": 184263, "epoch": 4387} {"train_loss": -7.128415107727051, "global_step": 184264, "epoch": 4387} {"train_loss": -7.152894020080566, "global_step": 184265, "epoch": 4387} {"train_loss": -7.053279876708984, "global_step": 184266, "epoch": 4387} {"train_loss": -7.183986663818359, "global_step": 184267, "epoch": 4387} {"train_loss": -7.202495574951172, "global_step": 184268, "epoch": 4387} {"train_loss": -6.908339500427246, "global_step": 184269, "epoch": 4387} {"train_loss": -7.056694507598877, "global_step": 184270, "epoch": 4387} {"train_loss": -7.052934169769287, "global_step": 184271, "epoch": 4387} {"train_loss": -7.091088771820068, "global_step": 184272, "epoch": 4387} {"train_loss": -7.140431880950928, "global_step": 184273, "epoch": 4387} {"train_loss": -7.117738246917725, "global_step": 184274, "epoch": 4387} {"train_loss": -7.109160423278809, "global_step": 184275, "epoch": 4387} {"train_loss": -7.172101974487305, "global_step": 184276, "epoch": 4387} {"train_loss": -7.133855819702148, "global_step": 184277, "epoch": 4387} {"train_loss": -7.04130744934082, "global_step": 184278, "epoch": 4387} {"train_loss": -7.192163467407227, "global_step": 184279, "epoch": 4387} {"train_loss": -7.057900428771973, "global_step": 184280, "epoch": 4387} {"train_loss": -7.133822917938232, "global_step": 184281, "epoch": 4387} {"train_loss": -7.059589862823486, "global_step": 184282, "epoch": 4387} {"train_loss": -7.240534782409668, "global_step": 184283, "epoch": 4387} {"train_loss": -7.112734317779541, "global_step": 184284, "epoch": 4387} {"train_loss": -7.069680213928223, "global_step": 184285, "epoch": 4387} {"train_loss": -7.255544185638428, "global_step": 184286, "epoch": 4387} {"train_loss": -7.216799259185791, "global_step": 184287, "epoch": 4387} {"train_loss": -7.198397636413574, "global_step": 184288, "epoch": 4387} {"train_loss": -7.066948890686035, "global_step": 184289, "epoch": 4387} {"train_loss": -7.137477874755859, "global_step": 184290, "epoch": 4387} {"train_loss": -7.250874996185303, "global_step": 184291, "epoch": 4387} {"train_loss": -7.08305549621582, "global_step": 184292, "epoch": 4387} {"train_loss": -6.9607696533203125, "global_step": 184293, "epoch": 4387} {"train_loss": -7.095669746398926, "global_step": 184294, "epoch": 4387} {"train_loss": -7.113375845409575, "global_step": 184295, "epoch": 4387, "val_loss": 69522.8046875} {"train_loss": -7.135125637054443, "global_step": 184296, "epoch": 4388} {"train_loss": -7.149454116821289, "global_step": 184297, "epoch": 4388} {"train_loss": -7.134951591491699, "global_step": 184298, "epoch": 4388} {"train_loss": -7.227375030517578, "global_step": 184299, "epoch": 4388} {"train_loss": -7.17349910736084, "global_step": 184300, "epoch": 4388} {"train_loss": -7.1059417724609375, "global_step": 184301, "epoch": 4388} {"train_loss": -7.134868144989014, "global_step": 184302, "epoch": 4388} {"train_loss": -7.093541145324707, "global_step": 184303, "epoch": 4388} {"train_loss": -7.250105381011963, "global_step": 184304, "epoch": 4388} {"train_loss": -7.072737216949463, "global_step": 184305, "epoch": 4388} {"train_loss": -7.102819442749023, "global_step": 184306, "epoch": 4388} {"train_loss": -7.137434482574463, "global_step": 184307, "epoch": 4388} {"train_loss": -7.191831588745117, "global_step": 184308, "epoch": 4388} {"train_loss": -7.122409820556641, "global_step": 184309, "epoch": 4388} {"train_loss": -7.120506763458252, "global_step": 184310, "epoch": 4388} {"train_loss": -7.091158866882324, "global_step": 184311, "epoch": 4388} {"train_loss": -7.0709547996521, "global_step": 184312, "epoch": 4388} {"train_loss": -7.107506275177002, "global_step": 184313, "epoch": 4388} {"train_loss": -7.18659782409668, "global_step": 184314, "epoch": 4388} {"train_loss": -7.103140830993652, "global_step": 184315, "epoch": 4388} {"train_loss": -7.135793209075928, "global_step": 184316, "epoch": 4388} {"train_loss": -7.004622936248779, "global_step": 184317, "epoch": 4388} {"train_loss": -7.13502311706543, "global_step": 184318, "epoch": 4388} {"train_loss": -7.046205997467041, "global_step": 184319, "epoch": 4388} {"train_loss": -7.011780738830566, "global_step": 184320, "epoch": 4388} {"train_loss": -7.072028636932373, "global_step": 184321, "epoch": 4388} {"train_loss": -7.127248764038086, "global_step": 184322, "epoch": 4388} {"train_loss": -7.209816932678223, "global_step": 184323, "epoch": 4388} {"train_loss": -7.091093063354492, "global_step": 184324, "epoch": 4388} {"train_loss": -7.223579406738281, "global_step": 184325, "epoch": 4388} {"train_loss": -7.125655174255371, "global_step": 184326, "epoch": 4388} {"train_loss": -7.1300201416015625, "global_step": 184327, "epoch": 4388} {"train_loss": -7.016731262207031, "global_step": 184328, "epoch": 4388} {"train_loss": -7.081035614013672, "global_step": 184329, "epoch": 4388} {"train_loss": -7.056547164916992, "global_step": 184330, "epoch": 4388} {"train_loss": -7.042097091674805, "global_step": 184331, "epoch": 4388} {"train_loss": -7.202459812164307, "global_step": 184332, "epoch": 4388} {"train_loss": -7.121914863586426, "global_step": 184333, "epoch": 4388} {"train_loss": -7.091640949249268, "global_step": 184334, "epoch": 4388} {"train_loss": -7.192552089691162, "global_step": 184335, "epoch": 4388} {"train_loss": -7.155740737915039, "global_step": 184336, "epoch": 4388} {"train_loss": -7.124655485153198, "global_step": 184337, "epoch": 4388, "val_loss": 69386.34375} {"train_loss": -7.1337480545043945, "global_step": 184338, "epoch": 4389} {"train_loss": -7.282680511474609, "global_step": 184339, "epoch": 4389} {"train_loss": -7.180120468139648, "global_step": 184340, "epoch": 4389} {"train_loss": -7.1560797691345215, "global_step": 184341, "epoch": 4389} {"train_loss": -7.120571136474609, "global_step": 184342, "epoch": 4389} {"train_loss": -7.240012168884277, "global_step": 184343, "epoch": 4389} {"train_loss": -7.25354528427124, "global_step": 184344, "epoch": 4389} {"train_loss": -7.226590156555176, "global_step": 184345, "epoch": 4389} {"train_loss": -7.144135475158691, "global_step": 184346, "epoch": 4389} {"train_loss": -7.37113094329834, "global_step": 184347, "epoch": 4389} {"train_loss": -7.225241661071777, "global_step": 184348, "epoch": 4389} {"train_loss": -7.151044845581055, "global_step": 184349, "epoch": 4389} {"train_loss": -7.259078025817871, "global_step": 184350, "epoch": 4389} {"train_loss": -7.251153469085693, "global_step": 184351, "epoch": 4389} {"train_loss": -7.253324508666992, "global_step": 184352, "epoch": 4389} {"train_loss": -7.231258392333984, "global_step": 184353, "epoch": 4389} {"train_loss": -7.149276256561279, "global_step": 184354, "epoch": 4389} {"train_loss": -7.327666282653809, "global_step": 184355, "epoch": 4389} {"train_loss": -7.03093957901001, "global_step": 184356, "epoch": 4389} {"train_loss": -7.1710405349731445, "global_step": 184357, "epoch": 4389} {"train_loss": -7.172139644622803, "global_step": 184358, "epoch": 4389} {"train_loss": -7.077463626861572, "global_step": 184359, "epoch": 4389} {"train_loss": -7.170877933502197, "global_step": 184360, "epoch": 4389} {"train_loss": -7.146056175231934, "global_step": 184361, "epoch": 4389} {"train_loss": -7.237812519073486, "global_step": 184362, "epoch": 4389} {"train_loss": -6.979739189147949, "global_step": 184363, "epoch": 4389} {"train_loss": -7.138210296630859, "global_step": 184364, "epoch": 4389} {"train_loss": -6.97570276260376, "global_step": 184365, "epoch": 4389} {"train_loss": -6.909837245941162, "global_step": 184366, "epoch": 4389} {"train_loss": -7.049096584320068, "global_step": 184367, "epoch": 4389} {"train_loss": -6.96718168258667, "global_step": 184368, "epoch": 4389} {"train_loss": -7.00532865524292, "global_step": 184369, "epoch": 4389} {"train_loss": -6.947272300720215, "global_step": 184370, "epoch": 4389} {"train_loss": -7.124750137329102, "global_step": 184371, "epoch": 4389} {"train_loss": -7.071363925933838, "global_step": 184372, "epoch": 4389} {"train_loss": -7.037508964538574, "global_step": 184373, "epoch": 4389} {"train_loss": -7.149298191070557, "global_step": 184374, "epoch": 4389} {"train_loss": -7.154780864715576, "global_step": 184375, "epoch": 4389} {"train_loss": -7.162817478179932, "global_step": 184376, "epoch": 4389} {"train_loss": -7.02967643737793, "global_step": 184377, "epoch": 4389} {"train_loss": -7.076176643371582, "global_step": 184378, "epoch": 4389} {"train_loss": -7.142085677101498, "global_step": 184379, "epoch": 4389, "val_loss": 69269.421875} {"train_loss": -7.125497817993164, "global_step": 184380, "epoch": 4390} {"train_loss": -7.145729064941406, "global_step": 184381, "epoch": 4390} {"train_loss": -7.327077865600586, "global_step": 184382, "epoch": 4390} {"train_loss": -7.086182594299316, "global_step": 184383, "epoch": 4390} {"train_loss": -7.188352108001709, "global_step": 184384, "epoch": 4390} {"train_loss": -7.018065452575684, "global_step": 184385, "epoch": 4390} {"train_loss": -7.141495704650879, "global_step": 184386, "epoch": 4390} {"train_loss": -6.981263637542725, "global_step": 184387, "epoch": 4390} {"train_loss": -6.994885444641113, "global_step": 184388, "epoch": 4390} {"train_loss": -7.1090474128723145, "global_step": 184389, "epoch": 4390} {"train_loss": -7.119174003601074, "global_step": 184390, "epoch": 4390} {"train_loss": -7.113338470458984, "global_step": 184391, "epoch": 4390} {"train_loss": -7.04067325592041, "global_step": 184392, "epoch": 4390} {"train_loss": -7.118715286254883, "global_step": 184393, "epoch": 4390} {"train_loss": -7.194340705871582, "global_step": 184394, "epoch": 4390} {"train_loss": -7.110655784606934, "global_step": 184395, "epoch": 4390} {"train_loss": -7.1406049728393555, "global_step": 184396, "epoch": 4390} {"train_loss": -7.1697611808776855, "global_step": 184397, "epoch": 4390} {"train_loss": -7.042453765869141, "global_step": 184398, "epoch": 4390} {"train_loss": -7.122847557067871, "global_step": 184399, "epoch": 4390} {"train_loss": -7.26633358001709, "global_step": 184400, "epoch": 4390} {"train_loss": -7.202671051025391, "global_step": 184401, "epoch": 4390} {"train_loss": -7.096997261047363, "global_step": 184402, "epoch": 4390} {"train_loss": -7.1987762451171875, "global_step": 184403, "epoch": 4390} {"train_loss": -7.1290178298950195, "global_step": 184404, "epoch": 4390} {"train_loss": -7.1435346603393555, "global_step": 184405, "epoch": 4390} {"train_loss": -7.249246597290039, "global_step": 184406, "epoch": 4390} {"train_loss": -7.1824116706848145, "global_step": 184407, "epoch": 4390} {"train_loss": -7.276053428649902, "global_step": 184408, "epoch": 4390} {"train_loss": -7.219280242919922, "global_step": 184409, "epoch": 4390} {"train_loss": -7.200368404388428, "global_step": 184410, "epoch": 4390} {"train_loss": -7.262080669403076, "global_step": 184411, "epoch": 4390} {"train_loss": -7.1600542068481445, "global_step": 184412, "epoch": 4390} {"train_loss": -7.195735931396484, "global_step": 184413, "epoch": 4390} {"train_loss": -7.139435768127441, "global_step": 184414, "epoch": 4390} {"train_loss": -7.1101226806640625, "global_step": 184415, "epoch": 4390} {"train_loss": -7.238053798675537, "global_step": 184416, "epoch": 4390} {"train_loss": -7.216896057128906, "global_step": 184417, "epoch": 4390} {"train_loss": -7.197186470031738, "global_step": 184418, "epoch": 4390} {"train_loss": -7.273056983947754, "global_step": 184419, "epoch": 4390} {"train_loss": -7.200655937194824, "global_step": 184420, "epoch": 4390} {"train_loss": -7.1575052965255015, "global_step": 184421, "epoch": 4390, "val_loss": 69444.1953125} {"train_loss": -7.224752426147461, "global_step": 184422, "epoch": 4391} {"train_loss": -7.096714019775391, "global_step": 184423, "epoch": 4391} {"train_loss": -7.0980224609375, "global_step": 184424, "epoch": 4391} {"train_loss": -7.275414943695068, "global_step": 184425, "epoch": 4391} {"train_loss": -7.168004035949707, "global_step": 184426, "epoch": 4391} {"train_loss": -7.077891826629639, "global_step": 184427, "epoch": 4391} {"train_loss": -7.15524435043335, "global_step": 184428, "epoch": 4391} {"train_loss": -7.161072731018066, "global_step": 184429, "epoch": 4391} {"train_loss": -7.125688552856445, "global_step": 184430, "epoch": 4391} {"train_loss": -7.154435634613037, "global_step": 184431, "epoch": 4391} {"train_loss": -7.110575199127197, "global_step": 184432, "epoch": 4391} {"train_loss": -7.175403594970703, "global_step": 184433, "epoch": 4391} {"train_loss": -7.120616912841797, "global_step": 184434, "epoch": 4391} {"train_loss": -6.951210975646973, "global_step": 184435, "epoch": 4391} {"train_loss": -7.111690521240234, "global_step": 184436, "epoch": 4391} {"train_loss": -6.883482933044434, "global_step": 184437, "epoch": 4391} {"train_loss": -7.131541728973389, "global_step": 184438, "epoch": 4391} {"train_loss": -7.147912979125977, "global_step": 184439, "epoch": 4391} {"train_loss": -6.9705424308776855, "global_step": 184440, "epoch": 4391} {"train_loss": -7.208131790161133, "global_step": 184441, "epoch": 4391} {"train_loss": -7.092277526855469, "global_step": 184442, "epoch": 4391} {"train_loss": -7.103872776031494, "global_step": 184443, "epoch": 4391} {"train_loss": -7.009411334991455, "global_step": 184444, "epoch": 4391} {"train_loss": -7.06550407409668, "global_step": 184445, "epoch": 4391} {"train_loss": -7.134115695953369, "global_step": 184446, "epoch": 4391} {"train_loss": -6.827998161315918, "global_step": 184447, "epoch": 4391} {"train_loss": -6.951925277709961, "global_step": 184448, "epoch": 4391} {"train_loss": -7.061642646789551, "global_step": 184449, "epoch": 4391} {"train_loss": -7.041553497314453, "global_step": 184450, "epoch": 4391} {"train_loss": -7.011681079864502, "global_step": 184451, "epoch": 4391} {"train_loss": -7.1408162117004395, "global_step": 184452, "epoch": 4391} {"train_loss": -7.124284744262695, "global_step": 184453, "epoch": 4391} {"train_loss": -7.102843284606934, "global_step": 184454, "epoch": 4391} {"train_loss": -7.090304374694824, "global_step": 184455, "epoch": 4391} {"train_loss": -7.199251174926758, "global_step": 184456, "epoch": 4391} {"train_loss": -7.032189846038818, "global_step": 184457, "epoch": 4391} {"train_loss": -7.16309928894043, "global_step": 184458, "epoch": 4391} {"train_loss": -7.150317192077637, "global_step": 184459, "epoch": 4391} {"train_loss": -7.158109664916992, "global_step": 184460, "epoch": 4391} {"train_loss": -7.089683532714844, "global_step": 184461, "epoch": 4391} {"train_loss": -7.20846700668335, "global_step": 184462, "epoch": 4391} {"train_loss": -7.103734368369693, "global_step": 184463, "epoch": 4391, "val_loss": 69502.0859375} {"train_loss": -7.161075115203857, "global_step": 184464, "epoch": 4392} {"train_loss": -6.939817428588867, "global_step": 184465, "epoch": 4392} {"train_loss": -7.213678359985352, "global_step": 184466, "epoch": 4392} {"train_loss": -7.081293106079102, "global_step": 184467, "epoch": 4392} {"train_loss": -7.1478376388549805, "global_step": 184468, "epoch": 4392} {"train_loss": -7.149418830871582, "global_step": 184469, "epoch": 4392} {"train_loss": -7.076610565185547, "global_step": 184470, "epoch": 4392} {"train_loss": -7.151894569396973, "global_step": 184471, "epoch": 4392} {"train_loss": -7.169773578643799, "global_step": 184472, "epoch": 4392} {"train_loss": -7.213564872741699, "global_step": 184473, "epoch": 4392} {"train_loss": -7.151215076446533, "global_step": 184474, "epoch": 4392} {"train_loss": -7.064486503601074, "global_step": 184475, "epoch": 4392} {"train_loss": -7.169151306152344, "global_step": 184476, "epoch": 4392} {"train_loss": -7.109649658203125, "global_step": 184477, "epoch": 4392} {"train_loss": -7.13508415222168, "global_step": 184478, "epoch": 4392} {"train_loss": -7.185819149017334, "global_step": 184479, "epoch": 4392} {"train_loss": -7.210047245025635, "global_step": 184480, "epoch": 4392} {"train_loss": -7.186697959899902, "global_step": 184481, "epoch": 4392} {"train_loss": -7.146890640258789, "global_step": 184482, "epoch": 4392} {"train_loss": -7.225017547607422, "global_step": 184483, "epoch": 4392} {"train_loss": -7.209945201873779, "global_step": 184484, "epoch": 4392} {"train_loss": -7.312180519104004, "global_step": 184485, "epoch": 4392} {"train_loss": -7.165210247039795, "global_step": 184486, "epoch": 4392} {"train_loss": -7.179634094238281, "global_step": 184487, "epoch": 4392} {"train_loss": -7.173792839050293, "global_step": 184488, "epoch": 4392} {"train_loss": -7.242278099060059, "global_step": 184489, "epoch": 4392} {"train_loss": -7.15153169631958, "global_step": 184490, "epoch": 4392} {"train_loss": -7.170491695404053, "global_step": 184491, "epoch": 4392} {"train_loss": -7.0885009765625, "global_step": 184492, "epoch": 4392} {"train_loss": -7.251662254333496, "global_step": 184493, "epoch": 4392} {"train_loss": -7.174713134765625, "global_step": 184494, "epoch": 4392} {"train_loss": -7.111932754516602, "global_step": 184495, "epoch": 4392} {"train_loss": -7.138654708862305, "global_step": 184496, "epoch": 4392} {"train_loss": -7.161689758300781, "global_step": 184497, "epoch": 4392} {"train_loss": -7.176749229431152, "global_step": 184498, "epoch": 4392} {"train_loss": -7.178691864013672, "global_step": 184499, "epoch": 4392} {"train_loss": -7.122244358062744, "global_step": 184500, "epoch": 4392} {"train_loss": -7.206626892089844, "global_step": 184501, "epoch": 4392} {"train_loss": -7.375036716461182, "global_step": 184502, "epoch": 4392} {"train_loss": -7.200076103210449, "global_step": 184503, "epoch": 4392} {"train_loss": -7.150557518005371, "global_step": 184504, "epoch": 4392} {"train_loss": -7.168735345204671, "global_step": 184505, "epoch": 4392, "val_loss": 69345.4921875} {"train_loss": -7.16690731048584, "global_step": 184506, "epoch": 4393} {"train_loss": -7.147618293762207, "global_step": 184507, "epoch": 4393} {"train_loss": -7.230912208557129, "global_step": 184508, "epoch": 4393} {"train_loss": -7.2031145095825195, "global_step": 184509, "epoch": 4393} {"train_loss": -7.235379219055176, "global_step": 184510, "epoch": 4393} {"train_loss": -7.092113494873047, "global_step": 184511, "epoch": 4393} {"train_loss": -7.308812141418457, "global_step": 184512, "epoch": 4393} {"train_loss": -7.2262468338012695, "global_step": 184513, "epoch": 4393} {"train_loss": -7.173859596252441, "global_step": 184514, "epoch": 4393} {"train_loss": -7.235049247741699, "global_step": 184515, "epoch": 4393} {"train_loss": -7.212522983551025, "global_step": 184516, "epoch": 4393} {"train_loss": -7.163777828216553, "global_step": 184517, "epoch": 4393} {"train_loss": -7.250391006469727, "global_step": 184518, "epoch": 4393} {"train_loss": -7.183671474456787, "global_step": 184519, "epoch": 4393} {"train_loss": -7.166347503662109, "global_step": 184520, "epoch": 4393} {"train_loss": -7.164867401123047, "global_step": 184521, "epoch": 4393} {"train_loss": -7.163364410400391, "global_step": 184522, "epoch": 4393} {"train_loss": -7.254487991333008, "global_step": 184523, "epoch": 4393} {"train_loss": -7.208342552185059, "global_step": 184524, "epoch": 4393} {"train_loss": -7.28776216506958, "global_step": 184525, "epoch": 4393} {"train_loss": -7.152950286865234, "global_step": 184526, "epoch": 4393} {"train_loss": -7.154137134552002, "global_step": 184527, "epoch": 4393} {"train_loss": -7.237263202667236, "global_step": 184528, "epoch": 4393} {"train_loss": -7.2374348640441895, "global_step": 184529, "epoch": 4393} {"train_loss": -7.215462684631348, "global_step": 184530, "epoch": 4393} {"train_loss": -7.168972015380859, "global_step": 184531, "epoch": 4393} {"train_loss": -7.160369873046875, "global_step": 184532, "epoch": 4393} {"train_loss": -7.104667663574219, "global_step": 184533, "epoch": 4393} {"train_loss": -7.119807243347168, "global_step": 184534, "epoch": 4393} {"train_loss": -7.252243518829346, "global_step": 184535, "epoch": 4393} {"train_loss": -7.204969882965088, "global_step": 184536, "epoch": 4393} {"train_loss": -7.190046787261963, "global_step": 184537, "epoch": 4393} {"train_loss": -7.137041091918945, "global_step": 184538, "epoch": 4393} {"train_loss": -7.03318977355957, "global_step": 184539, "epoch": 4393} {"train_loss": -7.200251579284668, "global_step": 184540, "epoch": 4393} {"train_loss": -6.953083038330078, "global_step": 184541, "epoch": 4393} {"train_loss": -7.008844375610352, "global_step": 184542, "epoch": 4393} {"train_loss": -7.181828498840332, "global_step": 184543, "epoch": 4393} {"train_loss": -7.119686126708984, "global_step": 184544, "epoch": 4393} {"train_loss": -6.978021621704102, "global_step": 184545, "epoch": 4393} {"train_loss": -7.1813154220581055, "global_step": 184546, "epoch": 4393} {"train_loss": -7.172260659081595, "global_step": 184547, "epoch": 4393, "val_loss": 69399.9375} {"train_loss": -7.074626922607422, "global_step": 184548, "epoch": 4394} {"train_loss": -7.199364185333252, "global_step": 184549, "epoch": 4394} {"train_loss": -7.065986633300781, "global_step": 184550, "epoch": 4394} {"train_loss": -7.162876129150391, "global_step": 184551, "epoch": 4394} {"train_loss": -7.198261260986328, "global_step": 184552, "epoch": 4394} {"train_loss": -7.101255416870117, "global_step": 184553, "epoch": 4394} {"train_loss": -7.143087387084961, "global_step": 184554, "epoch": 4394} {"train_loss": -7.1164045333862305, "global_step": 184555, "epoch": 4394} {"train_loss": -7.150629043579102, "global_step": 184556, "epoch": 4394} {"train_loss": -7.1712799072265625, "global_step": 184557, "epoch": 4394} {"train_loss": -7.085573673248291, "global_step": 184558, "epoch": 4394} {"train_loss": -7.2437520027160645, "global_step": 184559, "epoch": 4394} {"train_loss": -7.148974418640137, "global_step": 184560, "epoch": 4394} {"train_loss": -7.111441612243652, "global_step": 184561, "epoch": 4394} {"train_loss": -7.213390350341797, "global_step": 184562, "epoch": 4394} {"train_loss": -7.264257431030273, "global_step": 184563, "epoch": 4394} {"train_loss": -7.158803939819336, "global_step": 184564, "epoch": 4394} {"train_loss": -7.20032262802124, "global_step": 184565, "epoch": 4394} {"train_loss": -7.1196794509887695, "global_step": 184566, "epoch": 4394} {"train_loss": -7.238400459289551, "global_step": 184567, "epoch": 4394} {"train_loss": -7.105073928833008, "global_step": 184568, "epoch": 4394} {"train_loss": -7.063885688781738, "global_step": 184569, "epoch": 4394} {"train_loss": -7.102905750274658, "global_step": 184570, "epoch": 4394} {"train_loss": -7.074357986450195, "global_step": 184571, "epoch": 4394} {"train_loss": -7.035521030426025, "global_step": 184572, "epoch": 4394} {"train_loss": -7.02301549911499, "global_step": 184573, "epoch": 4394} {"train_loss": -7.151022911071777, "global_step": 184574, "epoch": 4394} {"train_loss": -7.056439399719238, "global_step": 184575, "epoch": 4394} {"train_loss": -6.924782752990723, "global_step": 184576, "epoch": 4394} {"train_loss": -7.089892387390137, "global_step": 184577, "epoch": 4394} {"train_loss": -7.032549858093262, "global_step": 184578, "epoch": 4394} {"train_loss": -6.919058799743652, "global_step": 184579, "epoch": 4394} {"train_loss": -7.063717365264893, "global_step": 184580, "epoch": 4394} {"train_loss": -6.908560752868652, "global_step": 184581, "epoch": 4394} {"train_loss": -7.134696960449219, "global_step": 184582, "epoch": 4394} {"train_loss": -7.027766227722168, "global_step": 184583, "epoch": 4394} {"train_loss": -7.016441822052002, "global_step": 184584, "epoch": 4394} {"train_loss": -7.203672409057617, "global_step": 184585, "epoch": 4394} {"train_loss": -7.019839286804199, "global_step": 184586, "epoch": 4394} {"train_loss": -7.184831619262695, "global_step": 184587, "epoch": 4394} {"train_loss": -7.069797515869141, "global_step": 184588, "epoch": 4394} {"train_loss": -7.107148579188755, "global_step": 184589, "epoch": 4394, "val_loss": 69532.921875} {"train_loss": -7.126623630523682, "global_step": 184590, "epoch": 4395} {"train_loss": -7.1086106300354, "global_step": 184591, "epoch": 4395} {"train_loss": -7.135180473327637, "global_step": 184592, "epoch": 4395} {"train_loss": -6.974287986755371, "global_step": 184593, "epoch": 4395} {"train_loss": -7.0899200439453125, "global_step": 184594, "epoch": 4395} {"train_loss": -7.107367515563965, "global_step": 184595, "epoch": 4395} {"train_loss": -7.089895248413086, "global_step": 184596, "epoch": 4395} {"train_loss": -7.0845746994018555, "global_step": 184597, "epoch": 4395} {"train_loss": -7.165158748626709, "global_step": 184598, "epoch": 4395} {"train_loss": -7.123534202575684, "global_step": 184599, "epoch": 4395} {"train_loss": -7.160372734069824, "global_step": 184600, "epoch": 4395} {"train_loss": -7.132564544677734, "global_step": 184601, "epoch": 4395} {"train_loss": -7.030117511749268, "global_step": 184602, "epoch": 4395} {"train_loss": -7.156889915466309, "global_step": 184603, "epoch": 4395} {"train_loss": -7.18828010559082, "global_step": 184604, "epoch": 4395} {"train_loss": -7.107729911804199, "global_step": 184605, "epoch": 4395} {"train_loss": -7.25691032409668, "global_step": 184606, "epoch": 4395} {"train_loss": -7.213696479797363, "global_step": 184607, "epoch": 4395} {"train_loss": -7.206538677215576, "global_step": 184608, "epoch": 4395} {"train_loss": -7.148957252502441, "global_step": 184609, "epoch": 4395} {"train_loss": -7.179454803466797, "global_step": 184610, "epoch": 4395} {"train_loss": -7.120995998382568, "global_step": 184611, "epoch": 4395} {"train_loss": -7.176350116729736, "global_step": 184612, "epoch": 4395} {"train_loss": -6.999787330627441, "global_step": 184613, "epoch": 4395} {"train_loss": -7.192902565002441, "global_step": 184614, "epoch": 4395} {"train_loss": -7.154174327850342, "global_step": 184615, "epoch": 4395} {"train_loss": -7.070154190063477, "global_step": 184616, "epoch": 4395} {"train_loss": -7.125092506408691, "global_step": 184617, "epoch": 4395} {"train_loss": -7.196712493896484, "global_step": 184618, "epoch": 4395} {"train_loss": -7.079890251159668, "global_step": 184619, "epoch": 4395} {"train_loss": -7.154206275939941, "global_step": 184620, "epoch": 4395} {"train_loss": -7.150550842285156, "global_step": 184621, "epoch": 4395} {"train_loss": -7.1395111083984375, "global_step": 184622, "epoch": 4395} {"train_loss": -7.201748847961426, "global_step": 184623, "epoch": 4395} {"train_loss": -7.145318508148193, "global_step": 184624, "epoch": 4395} {"train_loss": -7.041755676269531, "global_step": 184625, "epoch": 4395} {"train_loss": -7.1092023849487305, "global_step": 184626, "epoch": 4395} {"train_loss": -7.077528953552246, "global_step": 184627, "epoch": 4395} {"train_loss": -7.213685989379883, "global_step": 184628, "epoch": 4395} {"train_loss": -7.053851127624512, "global_step": 184629, "epoch": 4395} {"train_loss": -7.187870502471924, "global_step": 184630, "epoch": 4395} {"train_loss": -7.1322839714231945, "global_step": 184631, "epoch": 4395, "val_loss": 69477.671875} {"train_loss": -7.1657304763793945, "global_step": 184632, "epoch": 4396} {"train_loss": -7.159829616546631, "global_step": 184633, "epoch": 4396} {"train_loss": -7.149031162261963, "global_step": 184634, "epoch": 4396} {"train_loss": -7.110894203186035, "global_step": 184635, "epoch": 4396} {"train_loss": -7.131534576416016, "global_step": 184636, "epoch": 4396} {"train_loss": -7.202754497528076, "global_step": 184637, "epoch": 4396} {"train_loss": -7.173149585723877, "global_step": 184638, "epoch": 4396} {"train_loss": -7.236420154571533, "global_step": 184639, "epoch": 4396} {"train_loss": -7.248043060302734, "global_step": 184640, "epoch": 4396} {"train_loss": -7.124434471130371, "global_step": 184641, "epoch": 4396} {"train_loss": -7.247152328491211, "global_step": 184642, "epoch": 4396} {"train_loss": -7.206257343292236, "global_step": 184643, "epoch": 4396} {"train_loss": -7.105828285217285, "global_step": 184644, "epoch": 4396} {"train_loss": -7.252105712890625, "global_step": 184645, "epoch": 4396} {"train_loss": -7.264107704162598, "global_step": 184646, "epoch": 4396} {"train_loss": -7.145355701446533, "global_step": 184647, "epoch": 4396} {"train_loss": -7.17561149597168, "global_step": 184648, "epoch": 4396} {"train_loss": -7.09315299987793, "global_step": 184649, "epoch": 4396} {"train_loss": -7.157464504241943, "global_step": 184650, "epoch": 4396} {"train_loss": -7.241859436035156, "global_step": 184651, "epoch": 4396} {"train_loss": -7.108338356018066, "global_step": 184652, "epoch": 4396} {"train_loss": -7.1752238273620605, "global_step": 184653, "epoch": 4396} {"train_loss": -7.200831413269043, "global_step": 184654, "epoch": 4396} {"train_loss": -7.251477241516113, "global_step": 184655, "epoch": 4396} {"train_loss": -7.153809547424316, "global_step": 184656, "epoch": 4396} {"train_loss": -7.101781368255615, "global_step": 184657, "epoch": 4396} {"train_loss": -7.189558982849121, "global_step": 184658, "epoch": 4396} {"train_loss": -7.159405708312988, "global_step": 184659, "epoch": 4396} {"train_loss": -7.238224983215332, "global_step": 184660, "epoch": 4396} {"train_loss": -7.203713417053223, "global_step": 184661, "epoch": 4396} {"train_loss": -7.154962539672852, "global_step": 184662, "epoch": 4396} {"train_loss": -7.155486106872559, "global_step": 184663, "epoch": 4396} {"train_loss": -7.082617282867432, "global_step": 184664, "epoch": 4396} {"train_loss": -7.208721160888672, "global_step": 184665, "epoch": 4396} {"train_loss": -7.182172775268555, "global_step": 184666, "epoch": 4396} {"train_loss": -7.207999229431152, "global_step": 184667, "epoch": 4396} {"train_loss": -7.154437065124512, "global_step": 184668, "epoch": 4396} {"train_loss": -7.073182106018066, "global_step": 184669, "epoch": 4396} {"train_loss": -7.067244529724121, "global_step": 184670, "epoch": 4396} {"train_loss": -7.08287239074707, "global_step": 184671, "epoch": 4396} {"train_loss": -7.227022171020508, "global_step": 184672, "epoch": 4396} {"train_loss": -7.166052466347104, "global_step": 184673, "epoch": 4396, "val_loss": 69571.2734375} {"train_loss": -7.114274978637695, "global_step": 184674, "epoch": 4397} {"train_loss": -7.1556396484375, "global_step": 184675, "epoch": 4397} {"train_loss": -7.0992865562438965, "global_step": 184676, "epoch": 4397} {"train_loss": -7.214622497558594, "global_step": 184677, "epoch": 4397} {"train_loss": -7.1142473220825195, "global_step": 184678, "epoch": 4397} {"train_loss": -7.089144229888916, "global_step": 184679, "epoch": 4397} {"train_loss": -7.252479553222656, "global_step": 184680, "epoch": 4397} {"train_loss": -7.074568748474121, "global_step": 184681, "epoch": 4397} {"train_loss": -7.071536064147949, "global_step": 184682, "epoch": 4397} {"train_loss": -7.1543450355529785, "global_step": 184683, "epoch": 4397} {"train_loss": -7.168758392333984, "global_step": 184684, "epoch": 4397} {"train_loss": -7.056418418884277, "global_step": 184685, "epoch": 4397} {"train_loss": -7.056957244873047, "global_step": 184686, "epoch": 4397} {"train_loss": -7.080798149108887, "global_step": 184687, "epoch": 4397} {"train_loss": -7.178767204284668, "global_step": 184688, "epoch": 4397} {"train_loss": -7.113688945770264, "global_step": 184689, "epoch": 4397} {"train_loss": -7.188748359680176, "global_step": 184690, "epoch": 4397} {"train_loss": -7.216115951538086, "global_step": 184691, "epoch": 4397} {"train_loss": -7.220456123352051, "global_step": 184692, "epoch": 4397} {"train_loss": -7.130656719207764, "global_step": 184693, "epoch": 4397} {"train_loss": -7.224291801452637, "global_step": 184694, "epoch": 4397} {"train_loss": -7.185764789581299, "global_step": 184695, "epoch": 4397} {"train_loss": -7.194973468780518, "global_step": 184696, "epoch": 4397} {"train_loss": -7.187175273895264, "global_step": 184697, "epoch": 4397} {"train_loss": -7.12738037109375, "global_step": 184698, "epoch": 4397} {"train_loss": -7.150880336761475, "global_step": 184699, "epoch": 4397} {"train_loss": -7.0506062507629395, "global_step": 184700, "epoch": 4397} {"train_loss": -7.214073181152344, "global_step": 184701, "epoch": 4397} {"train_loss": -7.114847183227539, "global_step": 184702, "epoch": 4397} {"train_loss": -6.975002765655518, "global_step": 184703, "epoch": 4397} {"train_loss": -7.003146648406982, "global_step": 184704, "epoch": 4397} {"train_loss": -6.905858516693115, "global_step": 184705, "epoch": 4397} {"train_loss": -7.070988178253174, "global_step": 184706, "epoch": 4397} {"train_loss": -7.192448616027832, "global_step": 184707, "epoch": 4397} {"train_loss": -7.02717399597168, "global_step": 184708, "epoch": 4397} {"train_loss": -6.953309535980225, "global_step": 184709, "epoch": 4397} {"train_loss": -7.149771690368652, "global_step": 184710, "epoch": 4397} {"train_loss": -7.001477241516113, "global_step": 184711, "epoch": 4397} {"train_loss": -7.0773420333862305, "global_step": 184712, "epoch": 4397} {"train_loss": -6.916440963745117, "global_step": 184713, "epoch": 4397} {"train_loss": -7.098313808441162, "global_step": 184714, "epoch": 4397} {"train_loss": -7.107579288028536, "global_step": 184715, "epoch": 4397, "val_loss": 69666.5546875} {"train_loss": -6.916332721710205, "global_step": 184716, "epoch": 4398} {"train_loss": -7.163174629211426, "global_step": 184717, "epoch": 4398} {"train_loss": -7.078944206237793, "global_step": 184718, "epoch": 4398} {"train_loss": -7.046234130859375, "global_step": 184719, "epoch": 4398} {"train_loss": -7.050926685333252, "global_step": 184720, "epoch": 4398} {"train_loss": -6.955540180206299, "global_step": 184721, "epoch": 4398} {"train_loss": -7.134275436401367, "global_step": 184722, "epoch": 4398} {"train_loss": -7.1050286293029785, "global_step": 184723, "epoch": 4398} {"train_loss": -7.230550765991211, "global_step": 184724, "epoch": 4398} {"train_loss": -7.100550174713135, "global_step": 184725, "epoch": 4398} {"train_loss": -7.147187232971191, "global_step": 184726, "epoch": 4398} {"train_loss": -7.138041019439697, "global_step": 184727, "epoch": 4398} {"train_loss": -7.164216041564941, "global_step": 184728, "epoch": 4398} {"train_loss": -7.150920867919922, "global_step": 184729, "epoch": 4398} {"train_loss": -7.051323413848877, "global_step": 184730, "epoch": 4398} {"train_loss": -7.032435417175293, "global_step": 184731, "epoch": 4398} {"train_loss": -7.177273750305176, "global_step": 184732, "epoch": 4398} {"train_loss": -6.958704948425293, "global_step": 184733, "epoch": 4398} {"train_loss": -7.141975402832031, "global_step": 184734, "epoch": 4398} {"train_loss": -7.059954643249512, "global_step": 184735, "epoch": 4398} {"train_loss": -7.124005317687988, "global_step": 184736, "epoch": 4398} {"train_loss": -7.1132493019104, "global_step": 184737, "epoch": 4398} {"train_loss": -7.180686950683594, "global_step": 184738, "epoch": 4398} {"train_loss": -7.233968257904053, "global_step": 184739, "epoch": 4398} {"train_loss": -7.21082878112793, "global_step": 184740, "epoch": 4398} {"train_loss": -7.273327350616455, "global_step": 184741, "epoch": 4398} {"train_loss": -7.119892120361328, "global_step": 184742, "epoch": 4398} {"train_loss": -7.1682820320129395, "global_step": 184743, "epoch": 4398} {"train_loss": -7.349496841430664, "global_step": 184744, "epoch": 4398} {"train_loss": -7.244553089141846, "global_step": 184745, "epoch": 4398} {"train_loss": -7.203893661499023, "global_step": 184746, "epoch": 4398} {"train_loss": -7.15131950378418, "global_step": 184747, "epoch": 4398} {"train_loss": -7.108020782470703, "global_step": 184748, "epoch": 4398} {"train_loss": -7.167689800262451, "global_step": 184749, "epoch": 4398} {"train_loss": -7.249136924743652, "global_step": 184750, "epoch": 4398} {"train_loss": -7.167352199554443, "global_step": 184751, "epoch": 4398} {"train_loss": -7.211594581604004, "global_step": 184752, "epoch": 4398} {"train_loss": -7.277225494384766, "global_step": 184753, "epoch": 4398} {"train_loss": -7.12341833114624, "global_step": 184754, "epoch": 4398} {"train_loss": -7.191594123840332, "global_step": 184755, "epoch": 4398} {"train_loss": -7.093811988830566, "global_step": 184756, "epoch": 4398} {"train_loss": -7.139083464940389, "global_step": 184757, "epoch": 4398, "val_loss": 69403.609375} {"train_loss": -7.167293548583984, "global_step": 184758, "epoch": 4399} {"train_loss": -7.17398738861084, "global_step": 184759, "epoch": 4399} {"train_loss": -7.191455364227295, "global_step": 184760, "epoch": 4399} {"train_loss": -7.094573020935059, "global_step": 184761, "epoch": 4399} {"train_loss": -7.221672058105469, "global_step": 184762, "epoch": 4399} {"train_loss": -7.180445194244385, "global_step": 184763, "epoch": 4399} {"train_loss": -7.149993896484375, "global_step": 184764, "epoch": 4399} {"train_loss": -7.205410957336426, "global_step": 184765, "epoch": 4399} {"train_loss": -7.122375011444092, "global_step": 184766, "epoch": 4399} {"train_loss": -7.184035301208496, "global_step": 184767, "epoch": 4399} {"train_loss": -7.125334739685059, "global_step": 184768, "epoch": 4399} {"train_loss": -7.169194221496582, "global_step": 184769, "epoch": 4399} {"train_loss": -7.156955718994141, "global_step": 184770, "epoch": 4399} {"train_loss": -7.2116498947143555, "global_step": 184771, "epoch": 4399} {"train_loss": -7.1820268630981445, "global_step": 184772, "epoch": 4399} {"train_loss": -7.148136615753174, "global_step": 184773, "epoch": 4399} {"train_loss": -7.2443318367004395, "global_step": 184774, "epoch": 4399} {"train_loss": -7.148894309997559, "global_step": 184775, "epoch": 4399} {"train_loss": -7.095680236816406, "global_step": 184776, "epoch": 4399} {"train_loss": -7.1426286697387695, "global_step": 184777, "epoch": 4399} {"train_loss": -7.119999885559082, "global_step": 184778, "epoch": 4399} {"train_loss": -7.048254489898682, "global_step": 184779, "epoch": 4399} {"train_loss": -7.238171577453613, "global_step": 184780, "epoch": 4399} {"train_loss": -7.145303726196289, "global_step": 184781, "epoch": 4399} {"train_loss": -7.105949401855469, "global_step": 184782, "epoch": 4399} {"train_loss": -6.89459228515625, "global_step": 184783, "epoch": 4399} {"train_loss": -6.935304641723633, "global_step": 184784, "epoch": 4399} {"train_loss": -7.179280757904053, "global_step": 184785, "epoch": 4399} {"train_loss": -7.102696418762207, "global_step": 184786, "epoch": 4399} {"train_loss": -7.050769329071045, "global_step": 184787, "epoch": 4399} {"train_loss": -7.111759185791016, "global_step": 184788, "epoch": 4399} {"train_loss": -7.0279130935668945, "global_step": 184789, "epoch": 4399} {"train_loss": -7.004539489746094, "global_step": 184790, "epoch": 4399} {"train_loss": -7.1710286140441895, "global_step": 184791, "epoch": 4399} {"train_loss": -7.124822616577148, "global_step": 184792, "epoch": 4399} {"train_loss": -7.134804725646973, "global_step": 184793, "epoch": 4399} {"train_loss": -6.930580139160156, "global_step": 184794, "epoch": 4399} {"train_loss": -6.982478618621826, "global_step": 184795, "epoch": 4399} {"train_loss": -7.00419807434082, "global_step": 184796, "epoch": 4399} {"train_loss": -7.121695041656494, "global_step": 184797, "epoch": 4399} {"train_loss": -7.065975666046143, "global_step": 184798, "epoch": 4399} {"train_loss": -7.116155874161493, "global_step": 184799, "epoch": 4399, "val_loss": 69630.0078125} {"train_loss": -7.052076816558838, "global_step": 184800, "epoch": 4400} {"train_loss": -7.123767852783203, "global_step": 184801, "epoch": 4400} {"train_loss": -7.035165786743164, "global_step": 184802, "epoch": 4400} {"train_loss": -7.171950340270996, "global_step": 184803, "epoch": 4400} {"train_loss": -7.158581256866455, "global_step": 184804, "epoch": 4400} {"train_loss": -7.060009956359863, "global_step": 184805, "epoch": 4400} {"train_loss": -7.205188274383545, "global_step": 184806, "epoch": 4400} {"train_loss": -7.145176887512207, "global_step": 184807, "epoch": 4400} {"train_loss": -7.013673782348633, "global_step": 184808, "epoch": 4400} {"train_loss": -7.104742050170898, "global_step": 184809, "epoch": 4400} {"train_loss": -7.058760643005371, "global_step": 184810, "epoch": 4400} {"train_loss": -7.132587432861328, "global_step": 184811, "epoch": 4400} {"train_loss": -7.095775127410889, "global_step": 184812, "epoch": 4400} {"train_loss": -7.029692649841309, "global_step": 184813, "epoch": 4400} {"train_loss": -7.125941753387451, "global_step": 184814, "epoch": 4400} {"train_loss": -7.017577171325684, "global_step": 184815, "epoch": 4400} {"train_loss": -7.122564315795898, "global_step": 184816, "epoch": 4400} {"train_loss": -6.9973907470703125, "global_step": 184817, "epoch": 4400} {"train_loss": -7.080323696136475, "global_step": 184818, "epoch": 4400} {"train_loss": -7.021303176879883, "global_step": 184819, "epoch": 4400} {"train_loss": -7.158576011657715, "global_step": 184820, "epoch": 4400} {"train_loss": -7.091242790222168, "global_step": 184821, "epoch": 4400} {"train_loss": -7.167272567749023, "global_step": 184822, "epoch": 4400} {"train_loss": -7.067120552062988, "global_step": 184823, "epoch": 4400} {"train_loss": -7.172792434692383, "global_step": 184824, "epoch": 4400} {"train_loss": -7.073488235473633, "global_step": 184825, "epoch": 4400} {"train_loss": -7.113045692443848, "global_step": 184826, "epoch": 4400} {"train_loss": -7.227849960327148, "global_step": 184827, "epoch": 4400} {"train_loss": -7.11306095123291, "global_step": 184828, "epoch": 4400} {"train_loss": -6.986309051513672, "global_step": 184829, "epoch": 4400} {"train_loss": -7.041302680969238, "global_step": 184830, "epoch": 4400} {"train_loss": -7.085690975189209, "global_step": 184831, "epoch": 4400} {"train_loss": -7.081684112548828, "global_step": 184832, "epoch": 4400} {"train_loss": -7.137783050537109, "global_step": 184833, "epoch": 4400} {"train_loss": -7.330240249633789, "global_step": 184834, "epoch": 4400} {"train_loss": -7.099165439605713, "global_step": 184835, "epoch": 4400} {"train_loss": -7.149456024169922, "global_step": 184836, "epoch": 4400} {"train_loss": -7.105042457580566, "global_step": 184837, "epoch": 4400} {"train_loss": -6.989641189575195, "global_step": 184838, "epoch": 4400} {"train_loss": -7.128447532653809, "global_step": 184839, "epoch": 4400} {"train_loss": -7.200646877288818, "global_step": 184840, "epoch": 4400} {"train_loss": -7.104055938266573, "global_step": 184841, "epoch": 4400, "train/sim_max_reward_0": 0.7083611267185493, "train/sim_max_reward_1": 0.8545423289473457, "train/sim_max_reward_2": 0.4453460445358769, "train/sim_max_reward_3": 0.9123329563522373, "train/sim_max_reward_4": 0.9062542841527066, "train/sim_max_reward_5": 0.8601103564061753, "test/sim_max_reward_4300000": 0.9360394549231903, "test/sim_max_reward_4300001": 0.6932090863114733, "test/sim_max_reward_4300002": 0.8630938548688677, "test/sim_max_reward_4300003": 0.889889641034109, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.6834458142152678, "test/sim_max_reward_4300008": 0.7565390015015886, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.9016792500443234, "test/sim_max_reward_4300011": 0.9824205522343915, "test/sim_max_reward_4300012": 0.9457059448270627, "test/sim_max_reward_4300013": 0.40319438569913996, "test/sim_max_reward_4300014": 0.9080175145015816, "test/sim_max_reward_4300015": 0.9182725760602186, "test/sim_max_reward_4300016": 0.0, "test/sim_max_reward_4300017": 0.4096808997817595, "test/sim_max_reward_4300018": 0.3457543612305965, "test/sim_max_reward_4300019": 0.18577318032171455, "test/sim_max_reward_4300020": 0.0723020660552248, "test/sim_max_reward_4300021": 0.3600945345657214, "test/sim_max_reward_4300022": 0.9678778467631896, "test/sim_max_reward_4300023": 0.32579269023454216, "test/sim_max_reward_4300024": 1.0, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.22102036925591576, "test/sim_max_reward_4300027": 0.9111128214182173, "test/sim_max_reward_4300028": 0.9060499479453417, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.20453359862732257, "test/sim_max_reward_4300031": 0.4323066299521545, "test/sim_max_reward_4300032": 0.8994412780408966, "test/sim_max_reward_4300033": 0.9345815614551066, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.8424646830293266, "test/sim_max_reward_4300036": 0.22045308976609404, "test/sim_max_reward_4300037": 0.7503911305150668, "test/sim_max_reward_4300038": 0.8439943622709298, "test/sim_max_reward_4300039": 0.9969683716217398, "test/sim_max_reward_4300040": 0.9862640133221673, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7079313891314595, "test/sim_max_reward_4300043": 0.16092337129128245, "test/sim_max_reward_4300044": 0.9119686681799051, "test/sim_max_reward_4300045": 0.19407494030317177, "test/sim_max_reward_4300046": 0.9450260832509387, "test/sim_max_reward_4300047": 0.09732418338042066, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.18189971429545904, "train/mean_score": 0.7811578495188152, "test/mean_score": 0.5782669393407233, "val_loss": 69461.03125} {"train_loss": -7.060657501220703, "global_step": 184842, "epoch": 4401} {"train_loss": -7.18123722076416, "global_step": 184843, "epoch": 4401} {"train_loss": -7.130344390869141, "global_step": 184844, "epoch": 4401} {"train_loss": -7.1733856201171875, "global_step": 184845, "epoch": 4401} {"train_loss": -7.033957481384277, "global_step": 184846, "epoch": 4401} {"train_loss": -7.165499687194824, "global_step": 184847, "epoch": 4401} {"train_loss": -7.151803970336914, "global_step": 184848, "epoch": 4401} {"train_loss": -7.092169284820557, "global_step": 184849, "epoch": 4401} {"train_loss": -7.0629425048828125, "global_step": 184850, "epoch": 4401} {"train_loss": -7.075192928314209, "global_step": 184851, "epoch": 4401} {"train_loss": -7.100440979003906, "global_step": 184852, "epoch": 4401} {"train_loss": -7.161920547485352, "global_step": 184853, "epoch": 4401} {"train_loss": -7.016846656799316, "global_step": 184854, "epoch": 4401} {"train_loss": -7.160085201263428, "global_step": 184855, "epoch": 4401} {"train_loss": -7.206268787384033, "global_step": 184856, "epoch": 4401} {"train_loss": -6.945603370666504, "global_step": 184857, "epoch": 4401} {"train_loss": -7.1881303787231445, "global_step": 184858, "epoch": 4401} {"train_loss": -6.988654613494873, "global_step": 184859, "epoch": 4401} {"train_loss": -7.133844375610352, "global_step": 184860, "epoch": 4401} {"train_loss": -6.975069046020508, "global_step": 184861, "epoch": 4401} {"train_loss": -7.1661272048950195, "global_step": 184862, "epoch": 4401} {"train_loss": -7.004324436187744, "global_step": 184863, "epoch": 4401} {"train_loss": -7.076338768005371, "global_step": 184864, "epoch": 4401} {"train_loss": -7.076025485992432, "global_step": 184865, "epoch": 4401} {"train_loss": -7.14742374420166, "global_step": 184866, "epoch": 4401} {"train_loss": -7.128767013549805, "global_step": 184867, "epoch": 4401} {"train_loss": -7.069813251495361, "global_step": 184868, "epoch": 4401} {"train_loss": -7.245322227478027, "global_step": 184869, "epoch": 4401} {"train_loss": -7.086166858673096, "global_step": 184870, "epoch": 4401} {"train_loss": -7.128329277038574, "global_step": 184871, "epoch": 4401} {"train_loss": -7.194186687469482, "global_step": 184872, "epoch": 4401} {"train_loss": -7.173758506774902, "global_step": 184873, "epoch": 4401} {"train_loss": -7.177985191345215, "global_step": 184874, "epoch": 4401} {"train_loss": -7.132245063781738, "global_step": 184875, "epoch": 4401} {"train_loss": -7.138890266418457, "global_step": 184876, "epoch": 4401} {"train_loss": -7.117877006530762, "global_step": 184877, "epoch": 4401} {"train_loss": -7.21149206161499, "global_step": 184878, "epoch": 4401} {"train_loss": -7.031749725341797, "global_step": 184879, "epoch": 4401} {"train_loss": -7.146944999694824, "global_step": 184880, "epoch": 4401} {"train_loss": -7.165964126586914, "global_step": 184881, "epoch": 4401} {"train_loss": -6.99965763092041, "global_step": 184882, "epoch": 4401} {"train_loss": -7.113245464506603, "global_step": 184883, "epoch": 4401, "val_loss": 69579.28125} {"train_loss": -7.135846138000488, "global_step": 184884, "epoch": 4402} {"train_loss": -7.021275997161865, "global_step": 184885, "epoch": 4402} {"train_loss": -7.24423360824585, "global_step": 184886, "epoch": 4402} {"train_loss": -7.099029541015625, "global_step": 184887, "epoch": 4402} {"train_loss": -6.9022979736328125, "global_step": 184888, "epoch": 4402} {"train_loss": -7.100415229797363, "global_step": 184889, "epoch": 4402} {"train_loss": -7.120853424072266, "global_step": 184890, "epoch": 4402} {"train_loss": -7.121150493621826, "global_step": 184891, "epoch": 4402} {"train_loss": -7.098758697509766, "global_step": 184892, "epoch": 4402} {"train_loss": -6.968155860900879, "global_step": 184893, "epoch": 4402} {"train_loss": -7.163652420043945, "global_step": 184894, "epoch": 4402} {"train_loss": -7.136384010314941, "global_step": 184895, "epoch": 4402} {"train_loss": -7.224493980407715, "global_step": 184896, "epoch": 4402} {"train_loss": -7.11529541015625, "global_step": 184897, "epoch": 4402} {"train_loss": -7.190976142883301, "global_step": 184898, "epoch": 4402} {"train_loss": -7.2177629470825195, "global_step": 184899, "epoch": 4402} {"train_loss": -7.102367401123047, "global_step": 184900, "epoch": 4402} {"train_loss": -7.111632347106934, "global_step": 184901, "epoch": 4402} {"train_loss": -7.053494453430176, "global_step": 184902, "epoch": 4402} {"train_loss": -7.171573162078857, "global_step": 184903, "epoch": 4402} {"train_loss": -7.131361961364746, "global_step": 184904, "epoch": 4402} {"train_loss": -7.08928108215332, "global_step": 184905, "epoch": 4402} {"train_loss": -7.127624988555908, "global_step": 184906, "epoch": 4402} {"train_loss": -6.961584568023682, "global_step": 184907, "epoch": 4402} {"train_loss": -7.041067123413086, "global_step": 184908, "epoch": 4402} {"train_loss": -7.137777328491211, "global_step": 184909, "epoch": 4402} {"train_loss": -7.130926132202148, "global_step": 184910, "epoch": 4402} {"train_loss": -7.145076274871826, "global_step": 184911, "epoch": 4402} {"train_loss": -7.201788425445557, "global_step": 184912, "epoch": 4402} {"train_loss": -6.956439971923828, "global_step": 184913, "epoch": 4402} {"train_loss": -7.017762660980225, "global_step": 184914, "epoch": 4402} {"train_loss": -7.2082977294921875, "global_step": 184915, "epoch": 4402} {"train_loss": -7.165395259857178, "global_step": 184916, "epoch": 4402} {"train_loss": -7.052094459533691, "global_step": 184917, "epoch": 4402} {"train_loss": -7.187376499176025, "global_step": 184918, "epoch": 4402} {"train_loss": -7.193652629852295, "global_step": 184919, "epoch": 4402} {"train_loss": -7.040661334991455, "global_step": 184920, "epoch": 4402} {"train_loss": -7.076589584350586, "global_step": 184921, "epoch": 4402} {"train_loss": -7.164439678192139, "global_step": 184922, "epoch": 4402} {"train_loss": -7.144278526306152, "global_step": 184923, "epoch": 4402} {"train_loss": -7.224058151245117, "global_step": 184924, "epoch": 4402} {"train_loss": -7.1132509254273915, "global_step": 184925, "epoch": 4402, "val_loss": 69463.59375} {"train_loss": -7.247612953186035, "global_step": 184926, "epoch": 4403} {"train_loss": -7.25568962097168, "global_step": 184927, "epoch": 4403} {"train_loss": -7.2221174240112305, "global_step": 184928, "epoch": 4403} {"train_loss": -7.204936981201172, "global_step": 184929, "epoch": 4403} {"train_loss": -7.202671051025391, "global_step": 184930, "epoch": 4403} {"train_loss": -7.109284400939941, "global_step": 184931, "epoch": 4403} {"train_loss": -7.202174186706543, "global_step": 184932, "epoch": 4403} {"train_loss": -7.177691459655762, "global_step": 184933, "epoch": 4403} {"train_loss": -7.079037666320801, "global_step": 184934, "epoch": 4403} {"train_loss": -7.198585510253906, "global_step": 184935, "epoch": 4403} {"train_loss": -7.1368327140808105, "global_step": 184936, "epoch": 4403} {"train_loss": -7.259756565093994, "global_step": 184937, "epoch": 4403} {"train_loss": -7.1577229499816895, "global_step": 184938, "epoch": 4403} {"train_loss": -7.134286880493164, "global_step": 184939, "epoch": 4403} {"train_loss": -7.207771301269531, "global_step": 184940, "epoch": 4403} {"train_loss": -7.288145065307617, "global_step": 184941, "epoch": 4403} {"train_loss": -7.184088230133057, "global_step": 184942, "epoch": 4403} {"train_loss": -7.146473407745361, "global_step": 184943, "epoch": 4403} {"train_loss": -7.255644798278809, "global_step": 184944, "epoch": 4403} {"train_loss": -7.10601806640625, "global_step": 184945, "epoch": 4403} {"train_loss": -7.044458866119385, "global_step": 184946, "epoch": 4403} {"train_loss": -7.188619613647461, "global_step": 184947, "epoch": 4403} {"train_loss": -7.168126106262207, "global_step": 184948, "epoch": 4403} {"train_loss": -7.232987403869629, "global_step": 184949, "epoch": 4403} {"train_loss": -7.26065731048584, "global_step": 184950, "epoch": 4403} {"train_loss": -7.213611602783203, "global_step": 184951, "epoch": 4403} {"train_loss": -7.19802188873291, "global_step": 184952, "epoch": 4403} {"train_loss": -7.097373008728027, "global_step": 184953, "epoch": 4403} {"train_loss": -7.244891166687012, "global_step": 184954, "epoch": 4403} {"train_loss": -7.196451187133789, "global_step": 184955, "epoch": 4403} {"train_loss": -7.22895622253418, "global_step": 184956, "epoch": 4403} {"train_loss": -7.245003700256348, "global_step": 184957, "epoch": 4403} {"train_loss": -7.110036373138428, "global_step": 184958, "epoch": 4403} {"train_loss": -7.120973110198975, "global_step": 184959, "epoch": 4403} {"train_loss": -7.060888767242432, "global_step": 184960, "epoch": 4403} {"train_loss": -7.182340145111084, "global_step": 184961, "epoch": 4403} {"train_loss": -7.093408584594727, "global_step": 184962, "epoch": 4403} {"train_loss": -7.1710357666015625, "global_step": 184963, "epoch": 4403} {"train_loss": -7.205635070800781, "global_step": 184964, "epoch": 4403} {"train_loss": -7.019593715667725, "global_step": 184965, "epoch": 4403} {"train_loss": -7.16603946685791, "global_step": 184966, "epoch": 4403} {"train_loss": -7.173572063446045, "global_step": 184967, "epoch": 4403, "val_loss": 69623.125} {"train_loss": -6.963291645050049, "global_step": 184968, "epoch": 4404} {"train_loss": -7.131706714630127, "global_step": 184969, "epoch": 4404} {"train_loss": -7.246908187866211, "global_step": 184970, "epoch": 4404} {"train_loss": -7.119028091430664, "global_step": 184971, "epoch": 4404} {"train_loss": -7.197784423828125, "global_step": 184972, "epoch": 4404} {"train_loss": -7.163867950439453, "global_step": 184973, "epoch": 4404} {"train_loss": -7.1388654708862305, "global_step": 184974, "epoch": 4404} {"train_loss": -7.114096641540527, "global_step": 184975, "epoch": 4404} {"train_loss": -7.2232208251953125, "global_step": 184976, "epoch": 4404} {"train_loss": -7.1738996505737305, "global_step": 184977, "epoch": 4404} {"train_loss": -7.181117057800293, "global_step": 184978, "epoch": 4404} {"train_loss": -7.190062046051025, "global_step": 184979, "epoch": 4404} {"train_loss": -7.168475151062012, "global_step": 184980, "epoch": 4404} {"train_loss": -7.354872703552246, "global_step": 184981, "epoch": 4404} {"train_loss": -7.202441215515137, "global_step": 184982, "epoch": 4404} {"train_loss": -7.224799633026123, "global_step": 184983, "epoch": 4404} {"train_loss": -7.265270233154297, "global_step": 184984, "epoch": 4404} {"train_loss": -7.285900115966797, "global_step": 184985, "epoch": 4404} {"train_loss": -7.152111053466797, "global_step": 184986, "epoch": 4404} {"train_loss": -7.3026018142700195, "global_step": 184987, "epoch": 4404} {"train_loss": -7.217789649963379, "global_step": 184988, "epoch": 4404} {"train_loss": -7.218221664428711, "global_step": 184989, "epoch": 4404} {"train_loss": -7.259713172912598, "global_step": 184990, "epoch": 4404} {"train_loss": -7.17177677154541, "global_step": 184991, "epoch": 4404} {"train_loss": -7.140048980712891, "global_step": 184992, "epoch": 4404} {"train_loss": -7.283786773681641, "global_step": 184993, "epoch": 4404} {"train_loss": -7.25557804107666, "global_step": 184994, "epoch": 4404} {"train_loss": -7.196540355682373, "global_step": 184995, "epoch": 4404} {"train_loss": -7.260406494140625, "global_step": 184996, "epoch": 4404} {"train_loss": -7.065726280212402, "global_step": 184997, "epoch": 4404} {"train_loss": -7.249747276306152, "global_step": 184998, "epoch": 4404} {"train_loss": -7.271876335144043, "global_step": 184999, "epoch": 4404} {"train_loss": -7.284064769744873, "global_step": 185000, "epoch": 4404} {"train_loss": -7.1994547843933105, "global_step": 185001, "epoch": 4404} {"train_loss": -7.097378730773926, "global_step": 185002, "epoch": 4404} {"train_loss": -7.114358901977539, "global_step": 185003, "epoch": 4404} {"train_loss": -7.18900203704834, "global_step": 185004, "epoch": 4404} {"train_loss": -7.148390769958496, "global_step": 185005, "epoch": 4404} {"train_loss": -7.172604560852051, "global_step": 185006, "epoch": 4404} {"train_loss": -7.133822917938232, "global_step": 185007, "epoch": 4404} {"train_loss": -7.228108882904053, "global_step": 185008, "epoch": 4404} {"train_loss": -7.1899875572749545, "global_step": 185009, "epoch": 4404, "val_loss": 69436.015625} {"train_loss": -7.173590660095215, "global_step": 185010, "epoch": 4405} {"train_loss": -7.248730659484863, "global_step": 185011, "epoch": 4405} {"train_loss": -7.225298881530762, "global_step": 185012, "epoch": 4405} {"train_loss": -7.198041915893555, "global_step": 185013, "epoch": 4405} {"train_loss": -7.280285358428955, "global_step": 185014, "epoch": 4405} {"train_loss": -7.158535003662109, "global_step": 185015, "epoch": 4405} {"train_loss": -7.173807621002197, "global_step": 185016, "epoch": 4405} {"train_loss": -7.255882263183594, "global_step": 185017, "epoch": 4405} {"train_loss": -7.127257347106934, "global_step": 185018, "epoch": 4405} {"train_loss": -7.163623332977295, "global_step": 185019, "epoch": 4405} {"train_loss": -7.26050329208374, "global_step": 185020, "epoch": 4405} {"train_loss": -7.12373685836792, "global_step": 185021, "epoch": 4405} {"train_loss": -7.03223180770874, "global_step": 185022, "epoch": 4405} {"train_loss": -7.0604352951049805, "global_step": 185023, "epoch": 4405} {"train_loss": -7.020359516143799, "global_step": 185024, "epoch": 4405} {"train_loss": -6.9626312255859375, "global_step": 185025, "epoch": 4405} {"train_loss": -7.1823272705078125, "global_step": 185026, "epoch": 4405} {"train_loss": -7.012316703796387, "global_step": 185027, "epoch": 4405} {"train_loss": -7.234759330749512, "global_step": 185028, "epoch": 4405} {"train_loss": -7.015194892883301, "global_step": 185029, "epoch": 4405} {"train_loss": -7.1024675369262695, "global_step": 185030, "epoch": 4405} {"train_loss": -7.126214027404785, "global_step": 185031, "epoch": 4405} {"train_loss": -7.061888217926025, "global_step": 185032, "epoch": 4405} {"train_loss": -7.111838340759277, "global_step": 185033, "epoch": 4405} {"train_loss": -7.023292541503906, "global_step": 185034, "epoch": 4405} {"train_loss": -7.255242347717285, "global_step": 185035, "epoch": 4405} {"train_loss": -7.204536437988281, "global_step": 185036, "epoch": 4405} {"train_loss": -7.206264495849609, "global_step": 185037, "epoch": 4405} {"train_loss": -7.20206356048584, "global_step": 185038, "epoch": 4405} {"train_loss": -7.112610340118408, "global_step": 185039, "epoch": 4405} {"train_loss": -7.177908897399902, "global_step": 185040, "epoch": 4405} {"train_loss": -7.175556182861328, "global_step": 185041, "epoch": 4405} {"train_loss": -7.196295738220215, "global_step": 185042, "epoch": 4405} {"train_loss": -7.155829906463623, "global_step": 185043, "epoch": 4405} {"train_loss": -7.255971908569336, "global_step": 185044, "epoch": 4405} {"train_loss": -7.154587268829346, "global_step": 185045, "epoch": 4405} {"train_loss": -7.196768760681152, "global_step": 185046, "epoch": 4405} {"train_loss": -7.160139083862305, "global_step": 185047, "epoch": 4405} {"train_loss": -7.186595916748047, "global_step": 185048, "epoch": 4405} {"train_loss": -7.321449279785156, "global_step": 185049, "epoch": 4405} {"train_loss": -7.187745571136475, "global_step": 185050, "epoch": 4405} {"train_loss": -7.15876198950268, "global_step": 185051, "epoch": 4405, "val_loss": 69598.5625} {"train_loss": -7.123646259307861, "global_step": 185052, "epoch": 4406} {"train_loss": -7.256412029266357, "global_step": 185053, "epoch": 4406} {"train_loss": -7.2920966148376465, "global_step": 185054, "epoch": 4406} {"train_loss": -7.2666473388671875, "global_step": 185055, "epoch": 4406} {"train_loss": -7.234928607940674, "global_step": 185056, "epoch": 4406} {"train_loss": -7.194392204284668, "global_step": 185057, "epoch": 4406} {"train_loss": -7.274043560028076, "global_step": 185058, "epoch": 4406} {"train_loss": -7.2126874923706055, "global_step": 185059, "epoch": 4406} {"train_loss": -7.1997270584106445, "global_step": 185060, "epoch": 4406} {"train_loss": -7.216334819793701, "global_step": 185061, "epoch": 4406} {"train_loss": -7.31382942199707, "global_step": 185062, "epoch": 4406} {"train_loss": -7.116599082946777, "global_step": 185063, "epoch": 4406} {"train_loss": -7.177860736846924, "global_step": 185064, "epoch": 4406} {"train_loss": -7.096772193908691, "global_step": 185065, "epoch": 4406} {"train_loss": -7.116412162780762, "global_step": 185066, "epoch": 4406} {"train_loss": -7.070460319519043, "global_step": 185067, "epoch": 4406} {"train_loss": -7.08102560043335, "global_step": 185068, "epoch": 4406} {"train_loss": -7.1842041015625, "global_step": 185069, "epoch": 4406} {"train_loss": -7.09359073638916, "global_step": 185070, "epoch": 4406} {"train_loss": -7.1660966873168945, "global_step": 185071, "epoch": 4406} {"train_loss": -7.220767974853516, "global_step": 185072, "epoch": 4406} {"train_loss": -7.037200450897217, "global_step": 185073, "epoch": 4406} {"train_loss": -7.191490173339844, "global_step": 185074, "epoch": 4406} {"train_loss": -7.27353572845459, "global_step": 185075, "epoch": 4406} {"train_loss": -7.0793962478637695, "global_step": 185076, "epoch": 4406} {"train_loss": -7.116879463195801, "global_step": 185077, "epoch": 4406} {"train_loss": -7.281659126281738, "global_step": 185078, "epoch": 4406} {"train_loss": -7.032347679138184, "global_step": 185079, "epoch": 4406} {"train_loss": -7.158111572265625, "global_step": 185080, "epoch": 4406} {"train_loss": -7.260455131530762, "global_step": 185081, "epoch": 4406} {"train_loss": -7.144458293914795, "global_step": 185082, "epoch": 4406} {"train_loss": -7.190471649169922, "global_step": 185083, "epoch": 4406} {"train_loss": -7.20625638961792, "global_step": 185084, "epoch": 4406} {"train_loss": -7.223354339599609, "global_step": 185085, "epoch": 4406} {"train_loss": -7.188563346862793, "global_step": 185086, "epoch": 4406} {"train_loss": -7.1779985427856445, "global_step": 185087, "epoch": 4406} {"train_loss": -7.069021701812744, "global_step": 185088, "epoch": 4406} {"train_loss": -7.094446659088135, "global_step": 185089, "epoch": 4406} {"train_loss": -7.119957447052002, "global_step": 185090, "epoch": 4406} {"train_loss": -7.004244804382324, "global_step": 185091, "epoch": 4406} {"train_loss": -7.118269920349121, "global_step": 185092, "epoch": 4406} {"train_loss": -7.1657013438996815, "global_step": 185093, "epoch": 4406, "val_loss": 69495.390625} {"train_loss": -7.053884983062744, "global_step": 185094, "epoch": 4407} {"train_loss": -7.1369524002075195, "global_step": 185095, "epoch": 4407} {"train_loss": -6.951980113983154, "global_step": 185096, "epoch": 4407} {"train_loss": -6.965849876403809, "global_step": 185097, "epoch": 4407} {"train_loss": -7.19588041305542, "global_step": 185098, "epoch": 4407} {"train_loss": -7.187047481536865, "global_step": 185099, "epoch": 4407} {"train_loss": -6.943631172180176, "global_step": 185100, "epoch": 4407} {"train_loss": -7.069430351257324, "global_step": 185101, "epoch": 4407} {"train_loss": -7.086874961853027, "global_step": 185102, "epoch": 4407} {"train_loss": -7.086938381195068, "global_step": 185103, "epoch": 4407} {"train_loss": -7.112975120544434, "global_step": 185104, "epoch": 4407} {"train_loss": -7.057432174682617, "global_step": 185105, "epoch": 4407} {"train_loss": -7.1143388748168945, "global_step": 185106, "epoch": 4407} {"train_loss": -7.0620832443237305, "global_step": 185107, "epoch": 4407} {"train_loss": -7.071994304656982, "global_step": 185108, "epoch": 4407} {"train_loss": -7.108731269836426, "global_step": 185109, "epoch": 4407} {"train_loss": -7.133546352386475, "global_step": 185110, "epoch": 4407} {"train_loss": -7.054643630981445, "global_step": 185111, "epoch": 4407} {"train_loss": -7.159860610961914, "global_step": 185112, "epoch": 4407} {"train_loss": -6.966297149658203, "global_step": 185113, "epoch": 4407} {"train_loss": -7.125909805297852, "global_step": 185114, "epoch": 4407} {"train_loss": -7.11440372467041, "global_step": 185115, "epoch": 4407} {"train_loss": -7.023741722106934, "global_step": 185116, "epoch": 4407} {"train_loss": -7.055976867675781, "global_step": 185117, "epoch": 4407} {"train_loss": -7.150084018707275, "global_step": 185118, "epoch": 4407} {"train_loss": -7.1688923835754395, "global_step": 185119, "epoch": 4407} {"train_loss": -7.020326137542725, "global_step": 185120, "epoch": 4407} {"train_loss": -7.162149906158447, "global_step": 185121, "epoch": 4407} {"train_loss": -7.224160194396973, "global_step": 185122, "epoch": 4407} {"train_loss": -7.262032508850098, "global_step": 185123, "epoch": 4407} {"train_loss": -7.221130847930908, "global_step": 185124, "epoch": 4407} {"train_loss": -7.376873970031738, "global_step": 185125, "epoch": 4407} {"train_loss": -7.0987701416015625, "global_step": 185126, "epoch": 4407} {"train_loss": -7.213301658630371, "global_step": 185127, "epoch": 4407} {"train_loss": -7.252262592315674, "global_step": 185128, "epoch": 4407} {"train_loss": -7.145866394042969, "global_step": 185129, "epoch": 4407} {"train_loss": -7.259894371032715, "global_step": 185130, "epoch": 4407} {"train_loss": -7.05982780456543, "global_step": 185131, "epoch": 4407} {"train_loss": -7.104276657104492, "global_step": 185132, "epoch": 4407} {"train_loss": -7.077876091003418, "global_step": 185133, "epoch": 4407} {"train_loss": -7.18465518951416, "global_step": 185134, "epoch": 4407} {"train_loss": -7.117836202893939, "global_step": 185135, "epoch": 4407, "val_loss": 69421.765625} {"train_loss": -7.094618797302246, "global_step": 185136, "epoch": 4408} {"train_loss": -7.220264434814453, "global_step": 185137, "epoch": 4408} {"train_loss": -7.04343318939209, "global_step": 185138, "epoch": 4408} {"train_loss": -7.0265021324157715, "global_step": 185139, "epoch": 4408} {"train_loss": -7.206792831420898, "global_step": 185140, "epoch": 4408} {"train_loss": -7.086700916290283, "global_step": 185141, "epoch": 4408} {"train_loss": -7.182934284210205, "global_step": 185142, "epoch": 4408} {"train_loss": -7.2597975730896, "global_step": 185143, "epoch": 4408} {"train_loss": -7.10020637512207, "global_step": 185144, "epoch": 4408} {"train_loss": -7.217991828918457, "global_step": 185145, "epoch": 4408} {"train_loss": -7.113833427429199, "global_step": 185146, "epoch": 4408} {"train_loss": -7.200576305389404, "global_step": 185147, "epoch": 4408} {"train_loss": -7.041250228881836, "global_step": 185148, "epoch": 4408} {"train_loss": -7.074760437011719, "global_step": 185149, "epoch": 4408} {"train_loss": -7.304797172546387, "global_step": 185150, "epoch": 4408} {"train_loss": -7.203322410583496, "global_step": 185151, "epoch": 4408} {"train_loss": -7.109004020690918, "global_step": 185152, "epoch": 4408} {"train_loss": -7.280266761779785, "global_step": 185153, "epoch": 4408} {"train_loss": -7.207967758178711, "global_step": 185154, "epoch": 4408} {"train_loss": -7.105989456176758, "global_step": 185155, "epoch": 4408} {"train_loss": -7.191150188446045, "global_step": 185156, "epoch": 4408} {"train_loss": -7.124302864074707, "global_step": 185157, "epoch": 4408} {"train_loss": -7.156491279602051, "global_step": 185158, "epoch": 4408} {"train_loss": -7.138570308685303, "global_step": 185159, "epoch": 4408} {"train_loss": -7.3437652587890625, "global_step": 185160, "epoch": 4408} {"train_loss": -7.189266204833984, "global_step": 185161, "epoch": 4408} {"train_loss": -7.169289588928223, "global_step": 185162, "epoch": 4408} {"train_loss": -7.2757673263549805, "global_step": 185163, "epoch": 4408} {"train_loss": -7.113974571228027, "global_step": 185164, "epoch": 4408} {"train_loss": -7.131155014038086, "global_step": 185165, "epoch": 4408} {"train_loss": -7.217135429382324, "global_step": 185166, "epoch": 4408} {"train_loss": -7.135107040405273, "global_step": 185167, "epoch": 4408} {"train_loss": -7.056370735168457, "global_step": 185168, "epoch": 4408} {"train_loss": -7.178516387939453, "global_step": 185169, "epoch": 4408} {"train_loss": -7.233266830444336, "global_step": 185170, "epoch": 4408} {"train_loss": -7.219430923461914, "global_step": 185171, "epoch": 4408} {"train_loss": -7.215543270111084, "global_step": 185172, "epoch": 4408} {"train_loss": -7.165672302246094, "global_step": 185173, "epoch": 4408} {"train_loss": -7.167382717132568, "global_step": 185174, "epoch": 4408} {"train_loss": -7.093585968017578, "global_step": 185175, "epoch": 4408} {"train_loss": -7.169593811035156, "global_step": 185176, "epoch": 4408} {"train_loss": -7.165973799569266, "global_step": 185177, "epoch": 4408, "val_loss": 69366.640625} {"train_loss": -7.165546417236328, "global_step": 185178, "epoch": 4409} {"train_loss": -7.134827613830566, "global_step": 185179, "epoch": 4409} {"train_loss": -7.229114532470703, "global_step": 185180, "epoch": 4409} {"train_loss": -7.193275451660156, "global_step": 185181, "epoch": 4409} {"train_loss": -7.182351589202881, "global_step": 185182, "epoch": 4409} {"train_loss": -7.095980167388916, "global_step": 185183, "epoch": 4409} {"train_loss": -7.121774673461914, "global_step": 185184, "epoch": 4409} {"train_loss": -7.231772422790527, "global_step": 185185, "epoch": 4409} {"train_loss": -7.200499534606934, "global_step": 185186, "epoch": 4409} {"train_loss": -7.158016204833984, "global_step": 185187, "epoch": 4409} {"train_loss": -7.2538580894470215, "global_step": 185188, "epoch": 4409} {"train_loss": -7.2274932861328125, "global_step": 185189, "epoch": 4409} {"train_loss": -7.201316833496094, "global_step": 185190, "epoch": 4409} {"train_loss": -7.140215873718262, "global_step": 185191, "epoch": 4409} {"train_loss": -7.2012939453125, "global_step": 185192, "epoch": 4409} {"train_loss": -7.164610862731934, "global_step": 185193, "epoch": 4409} {"train_loss": -7.079826831817627, "global_step": 185194, "epoch": 4409} {"train_loss": -7.197368144989014, "global_step": 185195, "epoch": 4409} {"train_loss": -6.974880695343018, "global_step": 185196, "epoch": 4409} {"train_loss": -7.11760139465332, "global_step": 185197, "epoch": 4409} {"train_loss": -7.12359619140625, "global_step": 185198, "epoch": 4409} {"train_loss": -7.026337623596191, "global_step": 185199, "epoch": 4409} {"train_loss": -7.080655097961426, "global_step": 185200, "epoch": 4409} {"train_loss": -7.169662952423096, "global_step": 185201, "epoch": 4409} {"train_loss": -7.122828006744385, "global_step": 185202, "epoch": 4409} {"train_loss": -7.140624046325684, "global_step": 185203, "epoch": 4409} {"train_loss": -6.954202175140381, "global_step": 185204, "epoch": 4409} {"train_loss": -7.102534294128418, "global_step": 185205, "epoch": 4409} {"train_loss": -7.093727111816406, "global_step": 185206, "epoch": 4409} {"train_loss": -7.016086578369141, "global_step": 185207, "epoch": 4409} {"train_loss": -7.114882946014404, "global_step": 185208, "epoch": 4409} {"train_loss": -7.154108047485352, "global_step": 185209, "epoch": 4409} {"train_loss": -7.096730709075928, "global_step": 185210, "epoch": 4409} {"train_loss": -7.093274116516113, "global_step": 185211, "epoch": 4409} {"train_loss": -7.287352561950684, "global_step": 185212, "epoch": 4409} {"train_loss": -7.142953872680664, "global_step": 185213, "epoch": 4409} {"train_loss": -7.11940860748291, "global_step": 185214, "epoch": 4409} {"train_loss": -7.226649284362793, "global_step": 185215, "epoch": 4409} {"train_loss": -7.083339691162109, "global_step": 185216, "epoch": 4409} {"train_loss": -7.167087554931641, "global_step": 185217, "epoch": 4409} {"train_loss": -7.189110279083252, "global_step": 185218, "epoch": 4409} {"train_loss": -7.140514986855643, "global_step": 185219, "epoch": 4409, "val_loss": 69517.984375} {"train_loss": -7.071342468261719, "global_step": 185220, "epoch": 4410} {"train_loss": -7.182741165161133, "global_step": 185221, "epoch": 4410} {"train_loss": -7.205462455749512, "global_step": 185222, "epoch": 4410} {"train_loss": -7.207281112670898, "global_step": 185223, "epoch": 4410} {"train_loss": -6.982665061950684, "global_step": 185224, "epoch": 4410} {"train_loss": -7.226348400115967, "global_step": 185225, "epoch": 4410} {"train_loss": -7.084097385406494, "global_step": 185226, "epoch": 4410} {"train_loss": -7.169475555419922, "global_step": 185227, "epoch": 4410} {"train_loss": -7.158645153045654, "global_step": 185228, "epoch": 4410} {"train_loss": -7.076186180114746, "global_step": 185229, "epoch": 4410} {"train_loss": -7.164956092834473, "global_step": 185230, "epoch": 4410} {"train_loss": -7.257885932922363, "global_step": 185231, "epoch": 4410} {"train_loss": -7.03548002243042, "global_step": 185232, "epoch": 4410} {"train_loss": -7.0283918380737305, "global_step": 185233, "epoch": 4410} {"train_loss": -7.016300201416016, "global_step": 185234, "epoch": 4410} {"train_loss": -6.939386367797852, "global_step": 185235, "epoch": 4410} {"train_loss": -7.1749091148376465, "global_step": 185236, "epoch": 4410} {"train_loss": -7.078517913818359, "global_step": 185237, "epoch": 4410} {"train_loss": -7.02168083190918, "global_step": 185238, "epoch": 4410} {"train_loss": -7.075537204742432, "global_step": 185239, "epoch": 4410} {"train_loss": -7.047334671020508, "global_step": 185240, "epoch": 4410} {"train_loss": -7.148761749267578, "global_step": 185241, "epoch": 4410} {"train_loss": -7.048391342163086, "global_step": 185242, "epoch": 4410} {"train_loss": -7.082612037658691, "global_step": 185243, "epoch": 4410} {"train_loss": -7.067959785461426, "global_step": 185244, "epoch": 4410} {"train_loss": -7.055091857910156, "global_step": 185245, "epoch": 4410} {"train_loss": -7.088290214538574, "global_step": 185246, "epoch": 4410} {"train_loss": -7.08998966217041, "global_step": 185247, "epoch": 4410} {"train_loss": -6.998631954193115, "global_step": 185248, "epoch": 4410} {"train_loss": -7.106989860534668, "global_step": 185249, "epoch": 4410} {"train_loss": -7.109645366668701, "global_step": 185250, "epoch": 4410} {"train_loss": -7.147818565368652, "global_step": 185251, "epoch": 4410} {"train_loss": -7.102779388427734, "global_step": 185252, "epoch": 4410} {"train_loss": -6.994142532348633, "global_step": 185253, "epoch": 4410} {"train_loss": -7.123626232147217, "global_step": 185254, "epoch": 4410} {"train_loss": -7.003333568572998, "global_step": 185255, "epoch": 4410} {"train_loss": -6.991662502288818, "global_step": 185256, "epoch": 4410} {"train_loss": -6.979288101196289, "global_step": 185257, "epoch": 4410} {"train_loss": -7.112614154815674, "global_step": 185258, "epoch": 4410} {"train_loss": -7.038485527038574, "global_step": 185259, "epoch": 4410} {"train_loss": -7.214579105377197, "global_step": 185260, "epoch": 4410} {"train_loss": -7.089875130426316, "global_step": 185261, "epoch": 4410, "val_loss": 69349.859375} {"train_loss": -7.112934112548828, "global_step": 185262, "epoch": 4411} {"train_loss": -7.184645652770996, "global_step": 185263, "epoch": 4411} {"train_loss": -7.068506240844727, "global_step": 185264, "epoch": 4411} {"train_loss": -7.096881866455078, "global_step": 185265, "epoch": 4411} {"train_loss": -7.1255693435668945, "global_step": 185266, "epoch": 4411} {"train_loss": -7.208249092102051, "global_step": 185267, "epoch": 4411} {"train_loss": -7.097843170166016, "global_step": 185268, "epoch": 4411} {"train_loss": -7.1500244140625, "global_step": 185269, "epoch": 4411} {"train_loss": -6.913204193115234, "global_step": 185270, "epoch": 4411} {"train_loss": -7.18880558013916, "global_step": 185271, "epoch": 4411} {"train_loss": -7.099692344665527, "global_step": 185272, "epoch": 4411} {"train_loss": -7.170515537261963, "global_step": 185273, "epoch": 4411} {"train_loss": -7.181052207946777, "global_step": 185274, "epoch": 4411} {"train_loss": -6.983851432800293, "global_step": 185275, "epoch": 4411} {"train_loss": -7.17938232421875, "global_step": 185276, "epoch": 4411} {"train_loss": -7.185094356536865, "global_step": 185277, "epoch": 4411} {"train_loss": -7.181277275085449, "global_step": 185278, "epoch": 4411} {"train_loss": -7.0417866706848145, "global_step": 185279, "epoch": 4411} {"train_loss": -7.235131740570068, "global_step": 185280, "epoch": 4411} {"train_loss": -7.128355979919434, "global_step": 185281, "epoch": 4411} {"train_loss": -7.168831825256348, "global_step": 185282, "epoch": 4411} {"train_loss": -7.06095552444458, "global_step": 185283, "epoch": 4411} {"train_loss": -7.119381904602051, "global_step": 185284, "epoch": 4411} {"train_loss": -7.145901679992676, "global_step": 185285, "epoch": 4411} {"train_loss": -7.092571258544922, "global_step": 185286, "epoch": 4411} {"train_loss": -7.19854211807251, "global_step": 185287, "epoch": 4411} {"train_loss": -7.249701499938965, "global_step": 185288, "epoch": 4411} {"train_loss": -7.175497531890869, "global_step": 185289, "epoch": 4411} {"train_loss": -7.204777717590332, "global_step": 185290, "epoch": 4411} {"train_loss": -7.123077392578125, "global_step": 185291, "epoch": 4411} {"train_loss": -7.12067174911499, "global_step": 185292, "epoch": 4411} {"train_loss": -7.113811492919922, "global_step": 185293, "epoch": 4411} {"train_loss": -7.183494567871094, "global_step": 185294, "epoch": 4411} {"train_loss": -7.219524383544922, "global_step": 185295, "epoch": 4411} {"train_loss": -7.2080793380737305, "global_step": 185296, "epoch": 4411} {"train_loss": -7.036866188049316, "global_step": 185297, "epoch": 4411} {"train_loss": -7.170949935913086, "global_step": 185298, "epoch": 4411} {"train_loss": -7.067807197570801, "global_step": 185299, "epoch": 4411} {"train_loss": -7.138963222503662, "global_step": 185300, "epoch": 4411} {"train_loss": -7.157705307006836, "global_step": 185301, "epoch": 4411} {"train_loss": -7.104227542877197, "global_step": 185302, "epoch": 4411} {"train_loss": -7.1349182696569535, "global_step": 185303, "epoch": 4411, "val_loss": 69566.46875} {"train_loss": -7.263551235198975, "global_step": 185304, "epoch": 4412} {"train_loss": -7.1926116943359375, "global_step": 185305, "epoch": 4412} {"train_loss": -7.097576141357422, "global_step": 185306, "epoch": 4412} {"train_loss": -7.189953804016113, "global_step": 185307, "epoch": 4412} {"train_loss": -7.116671562194824, "global_step": 185308, "epoch": 4412} {"train_loss": -7.151656150817871, "global_step": 185309, "epoch": 4412} {"train_loss": -7.262746810913086, "global_step": 185310, "epoch": 4412} {"train_loss": -7.1098127365112305, "global_step": 185311, "epoch": 4412} {"train_loss": -7.184399127960205, "global_step": 185312, "epoch": 4412} {"train_loss": -7.134316444396973, "global_step": 185313, "epoch": 4412} {"train_loss": -7.263849258422852, "global_step": 185314, "epoch": 4412} {"train_loss": -7.166400909423828, "global_step": 185315, "epoch": 4412} {"train_loss": -7.1830902099609375, "global_step": 185316, "epoch": 4412} {"train_loss": -7.25059700012207, "global_step": 185317, "epoch": 4412} {"train_loss": -7.182133674621582, "global_step": 185318, "epoch": 4412} {"train_loss": -7.141721248626709, "global_step": 185319, "epoch": 4412} {"train_loss": -7.139336585998535, "global_step": 185320, "epoch": 4412} {"train_loss": -7.090410232543945, "global_step": 185321, "epoch": 4412} {"train_loss": -7.117184638977051, "global_step": 185322, "epoch": 4412} {"train_loss": -7.1898932456970215, "global_step": 185323, "epoch": 4412} {"train_loss": -7.320706367492676, "global_step": 185324, "epoch": 4412} {"train_loss": -7.214564800262451, "global_step": 185325, "epoch": 4412} {"train_loss": -7.115169048309326, "global_step": 185326, "epoch": 4412} {"train_loss": -7.199377059936523, "global_step": 185327, "epoch": 4412} {"train_loss": -7.150331974029541, "global_step": 185328, "epoch": 4412} {"train_loss": -7.1415696144104, "global_step": 185329, "epoch": 4412} {"train_loss": -7.064173698425293, "global_step": 185330, "epoch": 4412} {"train_loss": -7.148111343383789, "global_step": 185331, "epoch": 4412} {"train_loss": -7.073276519775391, "global_step": 185332, "epoch": 4412} {"train_loss": -7.120173931121826, "global_step": 185333, "epoch": 4412} {"train_loss": -7.042966842651367, "global_step": 185334, "epoch": 4412} {"train_loss": -6.952031135559082, "global_step": 185335, "epoch": 4412} {"train_loss": -7.0753374099731445, "global_step": 185336, "epoch": 4412} {"train_loss": -7.079867362976074, "global_step": 185337, "epoch": 4412} {"train_loss": -7.152640342712402, "global_step": 185338, "epoch": 4412} {"train_loss": -7.029323577880859, "global_step": 185339, "epoch": 4412} {"train_loss": -6.8895392417907715, "global_step": 185340, "epoch": 4412} {"train_loss": -7.033666610717773, "global_step": 185341, "epoch": 4412} {"train_loss": -7.075484275817871, "global_step": 185342, "epoch": 4412} {"train_loss": -7.094402313232422, "global_step": 185343, "epoch": 4412} {"train_loss": -7.184100151062012, "global_step": 185344, "epoch": 4412} {"train_loss": -7.137373311179025, "global_step": 185345, "epoch": 4412, "val_loss": 69612.234375} {"train_loss": -7.066032409667969, "global_step": 185346, "epoch": 4413} {"train_loss": -7.072212219238281, "global_step": 185347, "epoch": 4413} {"train_loss": -7.183967590332031, "global_step": 185348, "epoch": 4413} {"train_loss": -7.0825300216674805, "global_step": 185349, "epoch": 4413} {"train_loss": -7.107763290405273, "global_step": 185350, "epoch": 4413} {"train_loss": -7.146365165710449, "global_step": 185351, "epoch": 4413} {"train_loss": -7.1160149574279785, "global_step": 185352, "epoch": 4413} {"train_loss": -7.229379653930664, "global_step": 185353, "epoch": 4413} {"train_loss": -7.105748176574707, "global_step": 185354, "epoch": 4413} {"train_loss": -7.2025041580200195, "global_step": 185355, "epoch": 4413} {"train_loss": -7.178993225097656, "global_step": 185356, "epoch": 4413} {"train_loss": -7.175954341888428, "global_step": 185357, "epoch": 4413} {"train_loss": -7.192633628845215, "global_step": 185358, "epoch": 4413} {"train_loss": -7.156696796417236, "global_step": 185359, "epoch": 4413} {"train_loss": -7.117722511291504, "global_step": 185360, "epoch": 4413} {"train_loss": -6.995900630950928, "global_step": 185361, "epoch": 4413} {"train_loss": -7.132408142089844, "global_step": 185362, "epoch": 4413} {"train_loss": -7.070383548736572, "global_step": 185363, "epoch": 4413} {"train_loss": -7.162137985229492, "global_step": 185364, "epoch": 4413} {"train_loss": -6.981123924255371, "global_step": 185365, "epoch": 4413} {"train_loss": -7.203390598297119, "global_step": 185366, "epoch": 4413} {"train_loss": -7.0577826499938965, "global_step": 185367, "epoch": 4413} {"train_loss": -7.083872318267822, "global_step": 185368, "epoch": 4413} {"train_loss": -7.130461692810059, "global_step": 185369, "epoch": 4413} {"train_loss": -7.007874965667725, "global_step": 185370, "epoch": 4413} {"train_loss": -7.23215389251709, "global_step": 185371, "epoch": 4413} {"train_loss": -6.990706443786621, "global_step": 185372, "epoch": 4413} {"train_loss": -7.0300750732421875, "global_step": 185373, "epoch": 4413} {"train_loss": -7.162149906158447, "global_step": 185374, "epoch": 4413} {"train_loss": -7.085522174835205, "global_step": 185375, "epoch": 4413} {"train_loss": -7.023490905761719, "global_step": 185376, "epoch": 4413} {"train_loss": -7.028683662414551, "global_step": 185377, "epoch": 4413} {"train_loss": -6.984898567199707, "global_step": 185378, "epoch": 4413} {"train_loss": -7.199275016784668, "global_step": 185379, "epoch": 4413} {"train_loss": -7.106546401977539, "global_step": 185380, "epoch": 4413} {"train_loss": -7.032253742218018, "global_step": 185381, "epoch": 4413} {"train_loss": -7.201332092285156, "global_step": 185382, "epoch": 4413} {"train_loss": -7.0442070960998535, "global_step": 185383, "epoch": 4413} {"train_loss": -7.146503448486328, "global_step": 185384, "epoch": 4413} {"train_loss": -7.075397491455078, "global_step": 185385, "epoch": 4413} {"train_loss": -6.9966535568237305, "global_step": 185386, "epoch": 4413} {"train_loss": -7.107924075353713, "global_step": 185387, "epoch": 4413, "val_loss": 69394.609375} {"train_loss": -7.134653091430664, "global_step": 185388, "epoch": 4414} {"train_loss": -7.174871444702148, "global_step": 185389, "epoch": 4414} {"train_loss": -7.220948219299316, "global_step": 185390, "epoch": 4414} {"train_loss": -7.094906806945801, "global_step": 185391, "epoch": 4414} {"train_loss": -7.1171345710754395, "global_step": 185392, "epoch": 4414} {"train_loss": -6.988493919372559, "global_step": 185393, "epoch": 4414} {"train_loss": -7.060873985290527, "global_step": 185394, "epoch": 4414} {"train_loss": -6.9667744636535645, "global_step": 185395, "epoch": 4414} {"train_loss": -7.129369735717773, "global_step": 185396, "epoch": 4414} {"train_loss": -7.107968807220459, "global_step": 185397, "epoch": 4414} {"train_loss": -7.268261909484863, "global_step": 185398, "epoch": 4414} {"train_loss": -7.101241111755371, "global_step": 185399, "epoch": 4414} {"train_loss": -7.120717525482178, "global_step": 185400, "epoch": 4414} {"train_loss": -7.191140174865723, "global_step": 185401, "epoch": 4414} {"train_loss": -7.144485950469971, "global_step": 185402, "epoch": 4414} {"train_loss": -7.233475208282471, "global_step": 185403, "epoch": 4414} {"train_loss": -7.208919525146484, "global_step": 185404, "epoch": 4414} {"train_loss": -7.09406042098999, "global_step": 185405, "epoch": 4414} {"train_loss": -7.14089298248291, "global_step": 185406, "epoch": 4414} {"train_loss": -7.198252201080322, "global_step": 185407, "epoch": 4414} {"train_loss": -7.14518928527832, "global_step": 185408, "epoch": 4414} {"train_loss": -7.2399115562438965, "global_step": 185409, "epoch": 4414} {"train_loss": -7.137745380401611, "global_step": 185410, "epoch": 4414} {"train_loss": -7.1283369064331055, "global_step": 185411, "epoch": 4414} {"train_loss": -7.087530612945557, "global_step": 185412, "epoch": 4414} {"train_loss": -7.119387626647949, "global_step": 185413, "epoch": 4414} {"train_loss": -7.1057562828063965, "global_step": 185414, "epoch": 4414} {"train_loss": -7.18770170211792, "global_step": 185415, "epoch": 4414} {"train_loss": -7.189445495605469, "global_step": 185416, "epoch": 4414} {"train_loss": -7.333743095397949, "global_step": 185417, "epoch": 4414} {"train_loss": -7.175999164581299, "global_step": 185418, "epoch": 4414} {"train_loss": -7.130220413208008, "global_step": 185419, "epoch": 4414} {"train_loss": -7.135519981384277, "global_step": 185420, "epoch": 4414} {"train_loss": -7.037245750427246, "global_step": 185421, "epoch": 4414} {"train_loss": -7.237172603607178, "global_step": 185422, "epoch": 4414} {"train_loss": -7.188785076141357, "global_step": 185423, "epoch": 4414} {"train_loss": -7.1601176261901855, "global_step": 185424, "epoch": 4414} {"train_loss": -7.131680965423584, "global_step": 185425, "epoch": 4414} {"train_loss": -7.168670654296875, "global_step": 185426, "epoch": 4414} {"train_loss": -7.159012794494629, "global_step": 185427, "epoch": 4414} {"train_loss": -7.21455192565918, "global_step": 185428, "epoch": 4414} {"train_loss": -7.151631661823818, "global_step": 185429, "epoch": 4414, "val_loss": 69418.5546875} {"train_loss": -7.15195894241333, "global_step": 185430, "epoch": 4415} {"train_loss": -7.176985263824463, "global_step": 185431, "epoch": 4415} {"train_loss": -7.119865894317627, "global_step": 185432, "epoch": 4415} {"train_loss": -7.276942253112793, "global_step": 185433, "epoch": 4415} {"train_loss": -7.255392551422119, "global_step": 185434, "epoch": 4415} {"train_loss": -7.1804022789001465, "global_step": 185435, "epoch": 4415} {"train_loss": -7.2478837966918945, "global_step": 185436, "epoch": 4415} {"train_loss": -7.169773101806641, "global_step": 185437, "epoch": 4415} {"train_loss": -7.062848091125488, "global_step": 185438, "epoch": 4415} {"train_loss": -7.099029541015625, "global_step": 185439, "epoch": 4415} {"train_loss": -7.127237319946289, "global_step": 185440, "epoch": 4415} {"train_loss": -7.323587894439697, "global_step": 185441, "epoch": 4415} {"train_loss": -7.13778829574585, "global_step": 185442, "epoch": 4415} {"train_loss": -7.238764762878418, "global_step": 185443, "epoch": 4415} {"train_loss": -7.266627311706543, "global_step": 185444, "epoch": 4415} {"train_loss": -7.1262054443359375, "global_step": 185445, "epoch": 4415} {"train_loss": -6.975390911102295, "global_step": 185446, "epoch": 4415} {"train_loss": -7.14893913269043, "global_step": 185447, "epoch": 4415} {"train_loss": -7.125526428222656, "global_step": 185448, "epoch": 4415} {"train_loss": -7.132327079772949, "global_step": 185449, "epoch": 4415} {"train_loss": -7.153716087341309, "global_step": 185450, "epoch": 4415} {"train_loss": -7.182679653167725, "global_step": 185451, "epoch": 4415} {"train_loss": -7.171199798583984, "global_step": 185452, "epoch": 4415} {"train_loss": -7.1761369705200195, "global_step": 185453, "epoch": 4415} {"train_loss": -7.090468883514404, "global_step": 185454, "epoch": 4415} {"train_loss": -7.150137901306152, "global_step": 185455, "epoch": 4415} {"train_loss": -7.164101600646973, "global_step": 185456, "epoch": 4415} {"train_loss": -6.972662448883057, "global_step": 185457, "epoch": 4415} {"train_loss": -7.187164783477783, "global_step": 185458, "epoch": 4415} {"train_loss": -7.094426155090332, "global_step": 185459, "epoch": 4415} {"train_loss": -7.081316947937012, "global_step": 185460, "epoch": 4415} {"train_loss": -7.254273414611816, "global_step": 185461, "epoch": 4415} {"train_loss": -7.064982891082764, "global_step": 185462, "epoch": 4415} {"train_loss": -7.122197151184082, "global_step": 185463, "epoch": 4415} {"train_loss": -7.194979667663574, "global_step": 185464, "epoch": 4415} {"train_loss": -7.10506534576416, "global_step": 185465, "epoch": 4415} {"train_loss": -7.174223899841309, "global_step": 185466, "epoch": 4415} {"train_loss": -7.27101469039917, "global_step": 185467, "epoch": 4415} {"train_loss": -7.2244062423706055, "global_step": 185468, "epoch": 4415} {"train_loss": -7.191816329956055, "global_step": 185469, "epoch": 4415} {"train_loss": -7.22062873840332, "global_step": 185470, "epoch": 4415} {"train_loss": -7.15917782556443, "global_step": 185471, "epoch": 4415, "val_loss": 69534.8515625} {"train_loss": -7.193285942077637, "global_step": 185472, "epoch": 4416} {"train_loss": -7.233163356781006, "global_step": 185473, "epoch": 4416} {"train_loss": -7.1914567947387695, "global_step": 185474, "epoch": 4416} {"train_loss": -7.182929992675781, "global_step": 185475, "epoch": 4416} {"train_loss": -7.179909706115723, "global_step": 185476, "epoch": 4416} {"train_loss": -7.237590312957764, "global_step": 185477, "epoch": 4416} {"train_loss": -7.083067893981934, "global_step": 185478, "epoch": 4416} {"train_loss": -7.144057750701904, "global_step": 185479, "epoch": 4416} {"train_loss": -7.209112644195557, "global_step": 185480, "epoch": 4416} {"train_loss": -7.099318027496338, "global_step": 185481, "epoch": 4416} {"train_loss": -7.098282337188721, "global_step": 185482, "epoch": 4416} {"train_loss": -7.23612117767334, "global_step": 185483, "epoch": 4416} {"train_loss": -7.193910598754883, "global_step": 185484, "epoch": 4416} {"train_loss": -7.174467086791992, "global_step": 185485, "epoch": 4416} {"train_loss": -7.199079990386963, "global_step": 185486, "epoch": 4416} {"train_loss": -7.196838855743408, "global_step": 185487, "epoch": 4416} {"train_loss": -7.1752119064331055, "global_step": 185488, "epoch": 4416} {"train_loss": -7.231717109680176, "global_step": 185489, "epoch": 4416} {"train_loss": -7.2739715576171875, "global_step": 185490, "epoch": 4416} {"train_loss": -7.128355503082275, "global_step": 185491, "epoch": 4416} {"train_loss": -7.176026344299316, "global_step": 185492, "epoch": 4416} {"train_loss": -7.277790546417236, "global_step": 185493, "epoch": 4416} {"train_loss": -7.265384674072266, "global_step": 185494, "epoch": 4416} {"train_loss": -7.335955619812012, "global_step": 185495, "epoch": 4416} {"train_loss": -7.1954755783081055, "global_step": 185496, "epoch": 4416} {"train_loss": -7.190656661987305, "global_step": 185497, "epoch": 4416} {"train_loss": -7.23360013961792, "global_step": 185498, "epoch": 4416} {"train_loss": -7.152609348297119, "global_step": 185499, "epoch": 4416} {"train_loss": -7.140522480010986, "global_step": 185500, "epoch": 4416} {"train_loss": -7.139867782592773, "global_step": 185501, "epoch": 4416} {"train_loss": -7.158594131469727, "global_step": 185502, "epoch": 4416} {"train_loss": -7.308262825012207, "global_step": 185503, "epoch": 4416} {"train_loss": -7.201536655426025, "global_step": 185504, "epoch": 4416} {"train_loss": -7.1824564933776855, "global_step": 185505, "epoch": 4416} {"train_loss": -7.260087013244629, "global_step": 185506, "epoch": 4416} {"train_loss": -7.263530254364014, "global_step": 185507, "epoch": 4416} {"train_loss": -7.160934925079346, "global_step": 185508, "epoch": 4416} {"train_loss": -7.157456398010254, "global_step": 185509, "epoch": 4416} {"train_loss": -7.147280216217041, "global_step": 185510, "epoch": 4416} {"train_loss": -7.054622173309326, "global_step": 185511, "epoch": 4416} {"train_loss": -7.000280857086182, "global_step": 185512, "epoch": 4416} {"train_loss": -7.1878385203225275, "global_step": 185513, "epoch": 4416, "val_loss": 69600.5234375} {"train_loss": -7.0987548828125, "global_step": 185514, "epoch": 4417} {"train_loss": -7.093840599060059, "global_step": 185515, "epoch": 4417} {"train_loss": -7.140100479125977, "global_step": 185516, "epoch": 4417} {"train_loss": -7.115052223205566, "global_step": 185517, "epoch": 4417} {"train_loss": -7.054627895355225, "global_step": 185518, "epoch": 4417} {"train_loss": -7.205275535583496, "global_step": 185519, "epoch": 4417} {"train_loss": -7.14774751663208, "global_step": 185520, "epoch": 4417} {"train_loss": -7.032101631164551, "global_step": 185521, "epoch": 4417} {"train_loss": -7.137425899505615, "global_step": 185522, "epoch": 4417} {"train_loss": -7.079944133758545, "global_step": 185523, "epoch": 4417} {"train_loss": -7.144744873046875, "global_step": 185524, "epoch": 4417} {"train_loss": -7.088409423828125, "global_step": 185525, "epoch": 4417} {"train_loss": -7.141683578491211, "global_step": 185526, "epoch": 4417} {"train_loss": -7.153024673461914, "global_step": 185527, "epoch": 4417} {"train_loss": -7.079153537750244, "global_step": 185528, "epoch": 4417} {"train_loss": -7.150473594665527, "global_step": 185529, "epoch": 4417} {"train_loss": -7.120037078857422, "global_step": 185530, "epoch": 4417} {"train_loss": -7.07951545715332, "global_step": 185531, "epoch": 4417} {"train_loss": -7.038876533508301, "global_step": 185532, "epoch": 4417} {"train_loss": -7.1193037033081055, "global_step": 185533, "epoch": 4417} {"train_loss": -7.160391807556152, "global_step": 185534, "epoch": 4417} {"train_loss": -7.115292549133301, "global_step": 185535, "epoch": 4417} {"train_loss": -7.184762001037598, "global_step": 185536, "epoch": 4417} {"train_loss": -7.191878795623779, "global_step": 185537, "epoch": 4417} {"train_loss": -7.206964492797852, "global_step": 185538, "epoch": 4417} {"train_loss": -7.17192268371582, "global_step": 185539, "epoch": 4417} {"train_loss": -7.051984786987305, "global_step": 185540, "epoch": 4417} {"train_loss": -7.218276023864746, "global_step": 185541, "epoch": 4417} {"train_loss": -7.253104209899902, "global_step": 185542, "epoch": 4417} {"train_loss": -7.065171718597412, "global_step": 185543, "epoch": 4417} {"train_loss": -7.097224235534668, "global_step": 185544, "epoch": 4417} {"train_loss": -7.155788898468018, "global_step": 185545, "epoch": 4417} {"train_loss": -7.095576286315918, "global_step": 185546, "epoch": 4417} {"train_loss": -6.966062068939209, "global_step": 185547, "epoch": 4417} {"train_loss": -7.17327880859375, "global_step": 185548, "epoch": 4417} {"train_loss": -6.84638786315918, "global_step": 185549, "epoch": 4417} {"train_loss": -7.0280046463012695, "global_step": 185550, "epoch": 4417} {"train_loss": -6.895049095153809, "global_step": 185551, "epoch": 4417} {"train_loss": -6.871533393859863, "global_step": 185552, "epoch": 4417} {"train_loss": -7.037505149841309, "global_step": 185553, "epoch": 4417} {"train_loss": -6.871097087860107, "global_step": 185554, "epoch": 4417} {"train_loss": -7.093342678887503, "global_step": 185555, "epoch": 4417, "val_loss": 69806.640625} {"train_loss": -6.967071533203125, "global_step": 185556, "epoch": 4418} {"train_loss": -7.091156005859375, "global_step": 185557, "epoch": 4418} {"train_loss": -6.869556427001953, "global_step": 185558, "epoch": 4418} {"train_loss": -7.052199840545654, "global_step": 185559, "epoch": 4418} {"train_loss": -6.997188568115234, "global_step": 185560, "epoch": 4418} {"train_loss": -7.121072769165039, "global_step": 185561, "epoch": 4418} {"train_loss": -6.992899417877197, "global_step": 185562, "epoch": 4418} {"train_loss": -7.005842208862305, "global_step": 185563, "epoch": 4418} {"train_loss": -7.051938533782959, "global_step": 185564, "epoch": 4418} {"train_loss": -7.035464286804199, "global_step": 185565, "epoch": 4418} {"train_loss": -7.053558349609375, "global_step": 185566, "epoch": 4418} {"train_loss": -7.057302474975586, "global_step": 185567, "epoch": 4418} {"train_loss": -7.169207572937012, "global_step": 185568, "epoch": 4418} {"train_loss": -7.023525238037109, "global_step": 185569, "epoch": 4418} {"train_loss": -7.111119270324707, "global_step": 185570, "epoch": 4418} {"train_loss": -7.20778751373291, "global_step": 185571, "epoch": 4418} {"train_loss": -7.147961616516113, "global_step": 185572, "epoch": 4418} {"train_loss": -7.1406426429748535, "global_step": 185573, "epoch": 4418} {"train_loss": -7.123624801635742, "global_step": 185574, "epoch": 4418} {"train_loss": -7.17884635925293, "global_step": 185575, "epoch": 4418} {"train_loss": -7.183766841888428, "global_step": 185576, "epoch": 4418} {"train_loss": -7.1069655418396, "global_step": 185577, "epoch": 4418} {"train_loss": -7.070869445800781, "global_step": 185578, "epoch": 4418} {"train_loss": -7.159623146057129, "global_step": 185579, "epoch": 4418} {"train_loss": -7.119268894195557, "global_step": 185580, "epoch": 4418} {"train_loss": -7.187093257904053, "global_step": 185581, "epoch": 4418} {"train_loss": -7.154242038726807, "global_step": 185582, "epoch": 4418} {"train_loss": -7.152290344238281, "global_step": 185583, "epoch": 4418} {"train_loss": -7.136744499206543, "global_step": 185584, "epoch": 4418} {"train_loss": -7.144071578979492, "global_step": 185585, "epoch": 4418} {"train_loss": -7.036538124084473, "global_step": 185586, "epoch": 4418} {"train_loss": -7.179288387298584, "global_step": 185587, "epoch": 4418} {"train_loss": -7.215127944946289, "global_step": 185588, "epoch": 4418} {"train_loss": -7.152850151062012, "global_step": 185589, "epoch": 4418} {"train_loss": -7.190582752227783, "global_step": 185590, "epoch": 4418} {"train_loss": -7.169504165649414, "global_step": 185591, "epoch": 4418} {"train_loss": -7.070461750030518, "global_step": 185592, "epoch": 4418} {"train_loss": -7.052889347076416, "global_step": 185593, "epoch": 4418} {"train_loss": -7.212677955627441, "global_step": 185594, "epoch": 4418} {"train_loss": -7.234246253967285, "global_step": 185595, "epoch": 4418} {"train_loss": -7.177482604980469, "global_step": 185596, "epoch": 4418} {"train_loss": -7.113358906337193, "global_step": 185597, "epoch": 4418, "val_loss": 69524.5546875} {"train_loss": -7.287976264953613, "global_step": 185598, "epoch": 4419} {"train_loss": -7.278599262237549, "global_step": 185599, "epoch": 4419} {"train_loss": -7.185523986816406, "global_step": 185600, "epoch": 4419} {"train_loss": -7.216395378112793, "global_step": 185601, "epoch": 4419} {"train_loss": -7.239410877227783, "global_step": 185602, "epoch": 4419} {"train_loss": -7.128358840942383, "global_step": 185603, "epoch": 4419} {"train_loss": -7.111687660217285, "global_step": 185604, "epoch": 4419} {"train_loss": -7.093709945678711, "global_step": 185605, "epoch": 4419} {"train_loss": -7.164401531219482, "global_step": 185606, "epoch": 4419} {"train_loss": -7.1009202003479, "global_step": 185607, "epoch": 4419} {"train_loss": -7.093723297119141, "global_step": 185608, "epoch": 4419} {"train_loss": -7.141338348388672, "global_step": 185609, "epoch": 4419} {"train_loss": -7.245711326599121, "global_step": 185610, "epoch": 4419} {"train_loss": -7.046102523803711, "global_step": 185611, "epoch": 4419} {"train_loss": -7.188510894775391, "global_step": 185612, "epoch": 4419} {"train_loss": -7.1148529052734375, "global_step": 185613, "epoch": 4419} {"train_loss": -7.205324172973633, "global_step": 185614, "epoch": 4419} {"train_loss": -7.120241165161133, "global_step": 185615, "epoch": 4419} {"train_loss": -7.1642560958862305, "global_step": 185616, "epoch": 4419} {"train_loss": -7.088470458984375, "global_step": 185617, "epoch": 4419} {"train_loss": -7.165457248687744, "global_step": 185618, "epoch": 4419} {"train_loss": -7.011484146118164, "global_step": 185619, "epoch": 4419} {"train_loss": -7.053297996520996, "global_step": 185620, "epoch": 4419} {"train_loss": -7.186380386352539, "global_step": 185621, "epoch": 4419} {"train_loss": -7.224421977996826, "global_step": 185622, "epoch": 4419} {"train_loss": -7.18728494644165, "global_step": 185623, "epoch": 4419} {"train_loss": -7.122632026672363, "global_step": 185624, "epoch": 4419} {"train_loss": -7.041294574737549, "global_step": 185625, "epoch": 4419} {"train_loss": -7.145380020141602, "global_step": 185626, "epoch": 4419} {"train_loss": -7.11995792388916, "global_step": 185627, "epoch": 4419} {"train_loss": -7.08128023147583, "global_step": 185628, "epoch": 4419} {"train_loss": -7.165503025054932, "global_step": 185629, "epoch": 4419} {"train_loss": -7.029878616333008, "global_step": 185630, "epoch": 4419} {"train_loss": -7.01011848449707, "global_step": 185631, "epoch": 4419} {"train_loss": -7.119609832763672, "global_step": 185632, "epoch": 4419} {"train_loss": -7.150684356689453, "global_step": 185633, "epoch": 4419} {"train_loss": -7.06721830368042, "global_step": 185634, "epoch": 4419} {"train_loss": -7.093270301818848, "global_step": 185635, "epoch": 4419} {"train_loss": -7.155864715576172, "global_step": 185636, "epoch": 4419} {"train_loss": -7.107546806335449, "global_step": 185637, "epoch": 4419} {"train_loss": -7.080095291137695, "global_step": 185638, "epoch": 4419} {"train_loss": -7.1362891764867875, "global_step": 185639, "epoch": 4419, "val_loss": 69427.671875} {"train_loss": -7.088910102844238, "global_step": 185640, "epoch": 4420} {"train_loss": -7.24907112121582, "global_step": 185641, "epoch": 4420} {"train_loss": -7.114779472351074, "global_step": 185642, "epoch": 4420} {"train_loss": -7.151271820068359, "global_step": 185643, "epoch": 4420} {"train_loss": -7.153212547302246, "global_step": 185644, "epoch": 4420} {"train_loss": -7.241103649139404, "global_step": 185645, "epoch": 4420} {"train_loss": -7.121838569641113, "global_step": 185646, "epoch": 4420} {"train_loss": -7.210201263427734, "global_step": 185647, "epoch": 4420} {"train_loss": -7.085671424865723, "global_step": 185648, "epoch": 4420} {"train_loss": -7.175829887390137, "global_step": 185649, "epoch": 4420} {"train_loss": -7.137340545654297, "global_step": 185650, "epoch": 4420} {"train_loss": -7.118396282196045, "global_step": 185651, "epoch": 4420} {"train_loss": -7.149022579193115, "global_step": 185652, "epoch": 4420} {"train_loss": -7.144587516784668, "global_step": 185653, "epoch": 4420} {"train_loss": -7.23454475402832, "global_step": 185654, "epoch": 4420} {"train_loss": -7.133430480957031, "global_step": 185655, "epoch": 4420} {"train_loss": -7.188203811645508, "global_step": 185656, "epoch": 4420} {"train_loss": -7.133448600769043, "global_step": 185657, "epoch": 4420} {"train_loss": -7.174985408782959, "global_step": 185658, "epoch": 4420} {"train_loss": -7.080913543701172, "global_step": 185659, "epoch": 4420} {"train_loss": -7.177194595336914, "global_step": 185660, "epoch": 4420} {"train_loss": -7.154988765716553, "global_step": 185661, "epoch": 4420} {"train_loss": -7.21533203125, "global_step": 185662, "epoch": 4420} {"train_loss": -7.169218063354492, "global_step": 185663, "epoch": 4420} {"train_loss": -7.173395156860352, "global_step": 185664, "epoch": 4420} {"train_loss": -7.187760353088379, "global_step": 185665, "epoch": 4420} {"train_loss": -7.114690780639648, "global_step": 185666, "epoch": 4420} {"train_loss": -7.211724758148193, "global_step": 185667, "epoch": 4420} {"train_loss": -7.2089972496032715, "global_step": 185668, "epoch": 4420} {"train_loss": -7.116600036621094, "global_step": 185669, "epoch": 4420} {"train_loss": -7.220892429351807, "global_step": 185670, "epoch": 4420} {"train_loss": -7.0545654296875, "global_step": 185671, "epoch": 4420} {"train_loss": -7.166046619415283, "global_step": 185672, "epoch": 4420} {"train_loss": -7.150671005249023, "global_step": 185673, "epoch": 4420} {"train_loss": -7.16396951675415, "global_step": 185674, "epoch": 4420} {"train_loss": -6.929698467254639, "global_step": 185675, "epoch": 4420} {"train_loss": -7.0755414962768555, "global_step": 185676, "epoch": 4420} {"train_loss": -7.192373275756836, "global_step": 185677, "epoch": 4420} {"train_loss": -7.062847137451172, "global_step": 185678, "epoch": 4420} {"train_loss": -7.163666725158691, "global_step": 185679, "epoch": 4420} {"train_loss": -7.081122875213623, "global_step": 185680, "epoch": 4420} {"train_loss": -7.147685505094982, "global_step": 185681, "epoch": 4420, "val_loss": 69448.046875} {"train_loss": -7.2320637702941895, "global_step": 185682, "epoch": 4421} {"train_loss": -7.020887851715088, "global_step": 185683, "epoch": 4421} {"train_loss": -7.108329772949219, "global_step": 185684, "epoch": 4421} {"train_loss": -7.145363807678223, "global_step": 185685, "epoch": 4421} {"train_loss": -7.090909957885742, "global_step": 185686, "epoch": 4421} {"train_loss": -7.071418762207031, "global_step": 185687, "epoch": 4421} {"train_loss": -7.083783149719238, "global_step": 185688, "epoch": 4421} {"train_loss": -7.199734210968018, "global_step": 185689, "epoch": 4421} {"train_loss": -7.155577659606934, "global_step": 185690, "epoch": 4421} {"train_loss": -7.104506492614746, "global_step": 185691, "epoch": 4421} {"train_loss": -7.179939270019531, "global_step": 185692, "epoch": 4421} {"train_loss": -7.069198131561279, "global_step": 185693, "epoch": 4421} {"train_loss": -7.140974044799805, "global_step": 185694, "epoch": 4421} {"train_loss": -7.146665573120117, "global_step": 185695, "epoch": 4421} {"train_loss": -7.139893531799316, "global_step": 185696, "epoch": 4421} {"train_loss": -7.105852127075195, "global_step": 185697, "epoch": 4421} {"train_loss": -7.151479721069336, "global_step": 185698, "epoch": 4421} {"train_loss": -7.146717071533203, "global_step": 185699, "epoch": 4421} {"train_loss": -7.289334297180176, "global_step": 185700, "epoch": 4421} {"train_loss": -7.180879592895508, "global_step": 185701, "epoch": 4421} {"train_loss": -7.209342956542969, "global_step": 185702, "epoch": 4421} {"train_loss": -7.246274948120117, "global_step": 185703, "epoch": 4421} {"train_loss": -7.123027801513672, "global_step": 185704, "epoch": 4421} {"train_loss": -7.338611602783203, "global_step": 185705, "epoch": 4421} {"train_loss": -7.360589981079102, "global_step": 185706, "epoch": 4421} {"train_loss": -7.2308454513549805, "global_step": 185707, "epoch": 4421} {"train_loss": -7.2331438064575195, "global_step": 185708, "epoch": 4421} {"train_loss": -7.240886211395264, "global_step": 185709, "epoch": 4421} {"train_loss": -7.331535339355469, "global_step": 185710, "epoch": 4421} {"train_loss": -7.218792915344238, "global_step": 185711, "epoch": 4421} {"train_loss": -7.343952655792236, "global_step": 185712, "epoch": 4421} {"train_loss": -7.244165897369385, "global_step": 185713, "epoch": 4421} {"train_loss": -7.2067952156066895, "global_step": 185714, "epoch": 4421} {"train_loss": -7.144576549530029, "global_step": 185715, "epoch": 4421} {"train_loss": -7.238353252410889, "global_step": 185716, "epoch": 4421} {"train_loss": -7.2766008377075195, "global_step": 185717, "epoch": 4421} {"train_loss": -7.321203231811523, "global_step": 185718, "epoch": 4421} {"train_loss": -7.237229824066162, "global_step": 185719, "epoch": 4421} {"train_loss": -7.25654411315918, "global_step": 185720, "epoch": 4421} {"train_loss": -7.337287902832031, "global_step": 185721, "epoch": 4421} {"train_loss": -7.197973251342773, "global_step": 185722, "epoch": 4421} {"train_loss": -7.19566703978039, "global_step": 185723, "epoch": 4421, "val_loss": 69428.578125} {"train_loss": -7.11208438873291, "global_step": 185724, "epoch": 4422} {"train_loss": -7.252202987670898, "global_step": 185725, "epoch": 4422} {"train_loss": -7.144199848175049, "global_step": 185726, "epoch": 4422} {"train_loss": -7.18498420715332, "global_step": 185727, "epoch": 4422} {"train_loss": -7.2467546463012695, "global_step": 185728, "epoch": 4422} {"train_loss": -7.274590492248535, "global_step": 185729, "epoch": 4422} {"train_loss": -7.1942338943481445, "global_step": 185730, "epoch": 4422} {"train_loss": -7.129456520080566, "global_step": 185731, "epoch": 4422} {"train_loss": -7.172601699829102, "global_step": 185732, "epoch": 4422} {"train_loss": -7.175480842590332, "global_step": 185733, "epoch": 4422} {"train_loss": -7.14057731628418, "global_step": 185734, "epoch": 4422} {"train_loss": -7.094656944274902, "global_step": 185735, "epoch": 4422} {"train_loss": -7.1492085456848145, "global_step": 185736, "epoch": 4422} {"train_loss": -7.293856620788574, "global_step": 185737, "epoch": 4422} {"train_loss": -7.124114990234375, "global_step": 185738, "epoch": 4422} {"train_loss": -7.1732330322265625, "global_step": 185739, "epoch": 4422} {"train_loss": -7.160674095153809, "global_step": 185740, "epoch": 4422} {"train_loss": -7.095078468322754, "global_step": 185741, "epoch": 4422} {"train_loss": -7.122568130493164, "global_step": 185742, "epoch": 4422} {"train_loss": -7.234199523925781, "global_step": 185743, "epoch": 4422} {"train_loss": -7.162446975708008, "global_step": 185744, "epoch": 4422} {"train_loss": -7.0941009521484375, "global_step": 185745, "epoch": 4422} {"train_loss": -7.122625350952148, "global_step": 185746, "epoch": 4422} {"train_loss": -7.117764949798584, "global_step": 185747, "epoch": 4422} {"train_loss": -7.205294609069824, "global_step": 185748, "epoch": 4422} {"train_loss": -7.131615161895752, "global_step": 185749, "epoch": 4422} {"train_loss": -7.2166314125061035, "global_step": 185750, "epoch": 4422} {"train_loss": -7.122149467468262, "global_step": 185751, "epoch": 4422} {"train_loss": -7.112887382507324, "global_step": 185752, "epoch": 4422} {"train_loss": -7.163140773773193, "global_step": 185753, "epoch": 4422} {"train_loss": -7.099720478057861, "global_step": 185754, "epoch": 4422} {"train_loss": -7.095437526702881, "global_step": 185755, "epoch": 4422} {"train_loss": -7.1129889488220215, "global_step": 185756, "epoch": 4422} {"train_loss": -7.12430477142334, "global_step": 185757, "epoch": 4422} {"train_loss": -7.185677528381348, "global_step": 185758, "epoch": 4422} {"train_loss": -7.196955680847168, "global_step": 185759, "epoch": 4422} {"train_loss": -7.089637756347656, "global_step": 185760, "epoch": 4422} {"train_loss": -7.191854476928711, "global_step": 185761, "epoch": 4422} {"train_loss": -7.200007438659668, "global_step": 185762, "epoch": 4422} {"train_loss": -7.108665466308594, "global_step": 185763, "epoch": 4422} {"train_loss": -7.135386943817139, "global_step": 185764, "epoch": 4422} {"train_loss": -7.158497299466815, "global_step": 185765, "epoch": 4422, "val_loss": 69422.3671875} {"train_loss": -7.205575942993164, "global_step": 185766, "epoch": 4423} {"train_loss": -7.116252422332764, "global_step": 185767, "epoch": 4423} {"train_loss": -7.1170759201049805, "global_step": 185768, "epoch": 4423} {"train_loss": -7.148272514343262, "global_step": 185769, "epoch": 4423} {"train_loss": -7.143628120422363, "global_step": 185770, "epoch": 4423} {"train_loss": -7.070634365081787, "global_step": 185771, "epoch": 4423} {"train_loss": -7.213632583618164, "global_step": 185772, "epoch": 4423} {"train_loss": -7.162222862243652, "global_step": 185773, "epoch": 4423} {"train_loss": -7.082644462585449, "global_step": 185774, "epoch": 4423} {"train_loss": -7.228388786315918, "global_step": 185775, "epoch": 4423} {"train_loss": -7.065084457397461, "global_step": 185776, "epoch": 4423} {"train_loss": -7.208606719970703, "global_step": 185777, "epoch": 4423} {"train_loss": -7.090529441833496, "global_step": 185778, "epoch": 4423} {"train_loss": -7.238441467285156, "global_step": 185779, "epoch": 4423} {"train_loss": -7.244542121887207, "global_step": 185780, "epoch": 4423} {"train_loss": -7.166114330291748, "global_step": 185781, "epoch": 4423} {"train_loss": -7.086321830749512, "global_step": 185782, "epoch": 4423} {"train_loss": -7.261264801025391, "global_step": 185783, "epoch": 4423} {"train_loss": -7.096907615661621, "global_step": 185784, "epoch": 4423} {"train_loss": -7.207842826843262, "global_step": 185785, "epoch": 4423} {"train_loss": -7.195837497711182, "global_step": 185786, "epoch": 4423} {"train_loss": -7.123719692230225, "global_step": 185787, "epoch": 4423} {"train_loss": -7.228996276855469, "global_step": 185788, "epoch": 4423} {"train_loss": -7.247096061706543, "global_step": 185789, "epoch": 4423} {"train_loss": -7.1464385986328125, "global_step": 185790, "epoch": 4423} {"train_loss": -7.132768154144287, "global_step": 185791, "epoch": 4423} {"train_loss": -7.157876014709473, "global_step": 185792, "epoch": 4423} {"train_loss": -7.162731170654297, "global_step": 185793, "epoch": 4423} {"train_loss": -7.062489032745361, "global_step": 185794, "epoch": 4423} {"train_loss": -7.218081474304199, "global_step": 185795, "epoch": 4423} {"train_loss": -7.159268379211426, "global_step": 185796, "epoch": 4423} {"train_loss": -7.110729217529297, "global_step": 185797, "epoch": 4423} {"train_loss": -7.090068817138672, "global_step": 185798, "epoch": 4423} {"train_loss": -7.206628322601318, "global_step": 185799, "epoch": 4423} {"train_loss": -7.150087356567383, "global_step": 185800, "epoch": 4423} {"train_loss": -7.189023494720459, "global_step": 185801, "epoch": 4423} {"train_loss": -7.116812705993652, "global_step": 185802, "epoch": 4423} {"train_loss": -7.135799884796143, "global_step": 185803, "epoch": 4423} {"train_loss": -7.1296305656433105, "global_step": 185804, "epoch": 4423} {"train_loss": -7.1391215324401855, "global_step": 185805, "epoch": 4423} {"train_loss": -7.170348167419434, "global_step": 185806, "epoch": 4423} {"train_loss": -7.15601753053211, "global_step": 185807, "epoch": 4423, "val_loss": 69491.4609375} {"train_loss": -7.16274356842041, "global_step": 185808, "epoch": 4424} {"train_loss": -7.320158004760742, "global_step": 185809, "epoch": 4424} {"train_loss": -7.178846836090088, "global_step": 185810, "epoch": 4424} {"train_loss": -7.16560697555542, "global_step": 185811, "epoch": 4424} {"train_loss": -7.074563026428223, "global_step": 185812, "epoch": 4424} {"train_loss": -7.184076309204102, "global_step": 185813, "epoch": 4424} {"train_loss": -7.199405670166016, "global_step": 185814, "epoch": 4424} {"train_loss": -7.183645248413086, "global_step": 185815, "epoch": 4424} {"train_loss": -7.152085781097412, "global_step": 185816, "epoch": 4424} {"train_loss": -7.159494400024414, "global_step": 185817, "epoch": 4424} {"train_loss": -7.2427873611450195, "global_step": 185818, "epoch": 4424} {"train_loss": -7.167219638824463, "global_step": 185819, "epoch": 4424} {"train_loss": -7.08264684677124, "global_step": 185820, "epoch": 4424} {"train_loss": -7.211199760437012, "global_step": 185821, "epoch": 4424} {"train_loss": -7.22603702545166, "global_step": 185822, "epoch": 4424} {"train_loss": -7.165497779846191, "global_step": 185823, "epoch": 4424} {"train_loss": -7.056229591369629, "global_step": 185824, "epoch": 4424} {"train_loss": -7.203885555267334, "global_step": 185825, "epoch": 4424} {"train_loss": -7.082549095153809, "global_step": 185826, "epoch": 4424} {"train_loss": -7.193531513214111, "global_step": 185827, "epoch": 4424} {"train_loss": -7.176731109619141, "global_step": 185828, "epoch": 4424} {"train_loss": -7.16793966293335, "global_step": 185829, "epoch": 4424} {"train_loss": -7.183008193969727, "global_step": 185830, "epoch": 4424} {"train_loss": -7.193816184997559, "global_step": 185831, "epoch": 4424} {"train_loss": -7.185454368591309, "global_step": 185832, "epoch": 4424} {"train_loss": -7.077419757843018, "global_step": 185833, "epoch": 4424} {"train_loss": -7.131168365478516, "global_step": 185834, "epoch": 4424} {"train_loss": -7.179773330688477, "global_step": 185835, "epoch": 4424} {"train_loss": -7.135307788848877, "global_step": 185836, "epoch": 4424} {"train_loss": -7.083930969238281, "global_step": 185837, "epoch": 4424} {"train_loss": -7.132433891296387, "global_step": 185838, "epoch": 4424} {"train_loss": -7.22715950012207, "global_step": 185839, "epoch": 4424} {"train_loss": -7.165338039398193, "global_step": 185840, "epoch": 4424} {"train_loss": -7.136406421661377, "global_step": 185841, "epoch": 4424} {"train_loss": -7.042522430419922, "global_step": 185842, "epoch": 4424} {"train_loss": -7.031320095062256, "global_step": 185843, "epoch": 4424} {"train_loss": -7.038747787475586, "global_step": 185844, "epoch": 4424} {"train_loss": -7.196910858154297, "global_step": 185845, "epoch": 4424} {"train_loss": -7.145176410675049, "global_step": 185846, "epoch": 4424} {"train_loss": -7.118281364440918, "global_step": 185847, "epoch": 4424} {"train_loss": -7.2049736976623535, "global_step": 185848, "epoch": 4424} {"train_loss": -7.1564087981269475, "global_step": 185849, "epoch": 4424, "val_loss": 69533.4609375} {"train_loss": -7.2241740226745605, "global_step": 185850, "epoch": 4425} {"train_loss": -7.179390907287598, "global_step": 185851, "epoch": 4425} {"train_loss": -7.122369766235352, "global_step": 185852, "epoch": 4425} {"train_loss": -7.092782497406006, "global_step": 185853, "epoch": 4425} {"train_loss": -7.184284210205078, "global_step": 185854, "epoch": 4425} {"train_loss": -7.198134422302246, "global_step": 185855, "epoch": 4425} {"train_loss": -7.037216663360596, "global_step": 185856, "epoch": 4425} {"train_loss": -7.2527875900268555, "global_step": 185857, "epoch": 4425} {"train_loss": -7.1154022216796875, "global_step": 185858, "epoch": 4425} {"train_loss": -7.229004383087158, "global_step": 185859, "epoch": 4425} {"train_loss": -7.07496452331543, "global_step": 185860, "epoch": 4425} {"train_loss": -7.114363193511963, "global_step": 185861, "epoch": 4425} {"train_loss": -7.1530351638793945, "global_step": 185862, "epoch": 4425} {"train_loss": -7.13188362121582, "global_step": 185863, "epoch": 4425} {"train_loss": -7.172945022583008, "global_step": 185864, "epoch": 4425} {"train_loss": -7.217782974243164, "global_step": 185865, "epoch": 4425} {"train_loss": -7.225851058959961, "global_step": 185866, "epoch": 4425} {"train_loss": -7.10527229309082, "global_step": 185867, "epoch": 4425} {"train_loss": -7.021117210388184, "global_step": 185868, "epoch": 4425} {"train_loss": -7.046148300170898, "global_step": 185869, "epoch": 4425} {"train_loss": -7.2962260246276855, "global_step": 185870, "epoch": 4425} {"train_loss": -6.955606460571289, "global_step": 185871, "epoch": 4425} {"train_loss": -7.192914962768555, "global_step": 185872, "epoch": 4425} {"train_loss": -7.133678436279297, "global_step": 185873, "epoch": 4425} {"train_loss": -6.97670316696167, "global_step": 185874, "epoch": 4425} {"train_loss": -7.222294807434082, "global_step": 185875, "epoch": 4425} {"train_loss": -7.088682174682617, "global_step": 185876, "epoch": 4425} {"train_loss": -7.125636100769043, "global_step": 185877, "epoch": 4425} {"train_loss": -7.093667984008789, "global_step": 185878, "epoch": 4425} {"train_loss": -7.113034248352051, "global_step": 185879, "epoch": 4425} {"train_loss": -7.06089973449707, "global_step": 185880, "epoch": 4425} {"train_loss": -7.110518932342529, "global_step": 185881, "epoch": 4425} {"train_loss": -7.178779125213623, "global_step": 185882, "epoch": 4425} {"train_loss": -7.162477016448975, "global_step": 185883, "epoch": 4425} {"train_loss": -7.257850170135498, "global_step": 185884, "epoch": 4425} {"train_loss": -7.122707843780518, "global_step": 185885, "epoch": 4425} {"train_loss": -7.161147594451904, "global_step": 185886, "epoch": 4425} {"train_loss": -7.091269493103027, "global_step": 185887, "epoch": 4425} {"train_loss": -7.098492622375488, "global_step": 185888, "epoch": 4425} {"train_loss": -7.118523597717285, "global_step": 185889, "epoch": 4425} {"train_loss": -7.214365005493164, "global_step": 185890, "epoch": 4425} {"train_loss": -7.133953332901001, "global_step": 185891, "epoch": 4425, "val_loss": 69649.828125} {"train_loss": -7.059601306915283, "global_step": 185892, "epoch": 4426} {"train_loss": -7.206549644470215, "global_step": 185893, "epoch": 4426} {"train_loss": -7.112580299377441, "global_step": 185894, "epoch": 4426} {"train_loss": -7.087752342224121, "global_step": 185895, "epoch": 4426} {"train_loss": -7.195173263549805, "global_step": 185896, "epoch": 4426} {"train_loss": -7.208449363708496, "global_step": 185897, "epoch": 4426} {"train_loss": -7.029058456420898, "global_step": 185898, "epoch": 4426} {"train_loss": -7.2426981925964355, "global_step": 185899, "epoch": 4426} {"train_loss": -7.098943710327148, "global_step": 185900, "epoch": 4426} {"train_loss": -7.092438697814941, "global_step": 185901, "epoch": 4426} {"train_loss": -7.119411468505859, "global_step": 185902, "epoch": 4426} {"train_loss": -7.044137954711914, "global_step": 185903, "epoch": 4426} {"train_loss": -7.0127410888671875, "global_step": 185904, "epoch": 4426} {"train_loss": -7.229334354400635, "global_step": 185905, "epoch": 4426} {"train_loss": -7.1222944259643555, "global_step": 185906, "epoch": 4426} {"train_loss": -7.183323383331299, "global_step": 185907, "epoch": 4426} {"train_loss": -7.203499794006348, "global_step": 185908, "epoch": 4426} {"train_loss": -7.123695373535156, "global_step": 185909, "epoch": 4426} {"train_loss": -7.16656494140625, "global_step": 185910, "epoch": 4426} {"train_loss": -7.195927619934082, "global_step": 185911, "epoch": 4426} {"train_loss": -7.08976936340332, "global_step": 185912, "epoch": 4426} {"train_loss": -7.039987564086914, "global_step": 185913, "epoch": 4426} {"train_loss": -7.130616188049316, "global_step": 185914, "epoch": 4426} {"train_loss": -7.024549961090088, "global_step": 185915, "epoch": 4426} {"train_loss": -7.139918327331543, "global_step": 185916, "epoch": 4426} {"train_loss": -7.150087356567383, "global_step": 185917, "epoch": 4426} {"train_loss": -7.117802143096924, "global_step": 185918, "epoch": 4426} {"train_loss": -6.8895745277404785, "global_step": 185919, "epoch": 4426} {"train_loss": -7.054001808166504, "global_step": 185920, "epoch": 4426} {"train_loss": -7.081719875335693, "global_step": 185921, "epoch": 4426} {"train_loss": -6.921584129333496, "global_step": 185922, "epoch": 4426} {"train_loss": -7.112354278564453, "global_step": 185923, "epoch": 4426} {"train_loss": -7.013036251068115, "global_step": 185924, "epoch": 4426} {"train_loss": -7.086334228515625, "global_step": 185925, "epoch": 4426} {"train_loss": -6.982753753662109, "global_step": 185926, "epoch": 4426} {"train_loss": -7.196394920349121, "global_step": 185927, "epoch": 4426} {"train_loss": -7.038173675537109, "global_step": 185928, "epoch": 4426} {"train_loss": -7.049422264099121, "global_step": 185929, "epoch": 4426} {"train_loss": -7.12525749206543, "global_step": 185930, "epoch": 4426} {"train_loss": -7.113790035247803, "global_step": 185931, "epoch": 4426} {"train_loss": -6.919948577880859, "global_step": 185932, "epoch": 4426} {"train_loss": -7.09987701688494, "global_step": 185933, "epoch": 4426, "val_loss": 69622.34375} {"train_loss": -7.164002418518066, "global_step": 185934, "epoch": 4427} {"train_loss": -7.077119827270508, "global_step": 185935, "epoch": 4427} {"train_loss": -7.060483455657959, "global_step": 185936, "epoch": 4427} {"train_loss": -7.123355865478516, "global_step": 185937, "epoch": 4427} {"train_loss": -7.033006191253662, "global_step": 185938, "epoch": 4427} {"train_loss": -7.049487113952637, "global_step": 185939, "epoch": 4427} {"train_loss": -7.234236717224121, "global_step": 185940, "epoch": 4427} {"train_loss": -7.129456520080566, "global_step": 185941, "epoch": 4427} {"train_loss": -7.192788600921631, "global_step": 185942, "epoch": 4427} {"train_loss": -7.059017181396484, "global_step": 185943, "epoch": 4427} {"train_loss": -7.268198013305664, "global_step": 185944, "epoch": 4427} {"train_loss": -7.208359718322754, "global_step": 185945, "epoch": 4427} {"train_loss": -7.218244552612305, "global_step": 185946, "epoch": 4427} {"train_loss": -7.264439582824707, "global_step": 185947, "epoch": 4427} {"train_loss": -7.138158321380615, "global_step": 185948, "epoch": 4427} {"train_loss": -7.108805179595947, "global_step": 185949, "epoch": 4427} {"train_loss": -7.14776086807251, "global_step": 185950, "epoch": 4427} {"train_loss": -7.1438775062561035, "global_step": 185951, "epoch": 4427} {"train_loss": -7.069589614868164, "global_step": 185952, "epoch": 4427} {"train_loss": -7.2703447341918945, "global_step": 185953, "epoch": 4427} {"train_loss": -7.274894714355469, "global_step": 185954, "epoch": 4427} {"train_loss": -7.186279296875, "global_step": 185955, "epoch": 4427} {"train_loss": -7.201129913330078, "global_step": 185956, "epoch": 4427} {"train_loss": -7.221674919128418, "global_step": 185957, "epoch": 4427} {"train_loss": -7.266585350036621, "global_step": 185958, "epoch": 4427} {"train_loss": -7.1476850509643555, "global_step": 185959, "epoch": 4427} {"train_loss": -7.168460845947266, "global_step": 185960, "epoch": 4427} {"train_loss": -7.155895233154297, "global_step": 185961, "epoch": 4427} {"train_loss": -7.147909164428711, "global_step": 185962, "epoch": 4427} {"train_loss": -7.14448356628418, "global_step": 185963, "epoch": 4427} {"train_loss": -7.278557777404785, "global_step": 185964, "epoch": 4427} {"train_loss": -7.214939117431641, "global_step": 185965, "epoch": 4427} {"train_loss": -7.2396087646484375, "global_step": 185966, "epoch": 4427} {"train_loss": -7.169713020324707, "global_step": 185967, "epoch": 4427} {"train_loss": -7.239562511444092, "global_step": 185968, "epoch": 4427} {"train_loss": -7.1260294914245605, "global_step": 185969, "epoch": 4427} {"train_loss": -7.1950178146362305, "global_step": 185970, "epoch": 4427} {"train_loss": -7.146788597106934, "global_step": 185971, "epoch": 4427} {"train_loss": -7.1574296951293945, "global_step": 185972, "epoch": 4427} {"train_loss": -7.191272735595703, "global_step": 185973, "epoch": 4427} {"train_loss": -7.241827964782715, "global_step": 185974, "epoch": 4427} {"train_loss": -7.172667991547358, "global_step": 185975, "epoch": 4427, "val_loss": 69479.0234375} {"train_loss": -7.224944114685059, "global_step": 185976, "epoch": 4428} {"train_loss": -7.1645402908325195, "global_step": 185977, "epoch": 4428} {"train_loss": -7.309206485748291, "global_step": 185978, "epoch": 4428} {"train_loss": -7.125006198883057, "global_step": 185979, "epoch": 4428} {"train_loss": -7.164806842803955, "global_step": 185980, "epoch": 4428} {"train_loss": -7.172198295593262, "global_step": 185981, "epoch": 4428} {"train_loss": -7.124412536621094, "global_step": 185982, "epoch": 4428} {"train_loss": -7.132987976074219, "global_step": 185983, "epoch": 4428} {"train_loss": -7.114290237426758, "global_step": 185984, "epoch": 4428} {"train_loss": -7.394941806793213, "global_step": 185985, "epoch": 4428} {"train_loss": -7.118651390075684, "global_step": 185986, "epoch": 4428} {"train_loss": -7.1982927322387695, "global_step": 185987, "epoch": 4428} {"train_loss": -7.0591020584106445, "global_step": 185988, "epoch": 4428} {"train_loss": -7.259320259094238, "global_step": 185989, "epoch": 4428} {"train_loss": -7.103819370269775, "global_step": 185990, "epoch": 4428} {"train_loss": -7.258924961090088, "global_step": 185991, "epoch": 4428} {"train_loss": -7.1455278396606445, "global_step": 185992, "epoch": 4428} {"train_loss": -7.247837543487549, "global_step": 185993, "epoch": 4428} {"train_loss": -7.157735824584961, "global_step": 185994, "epoch": 4428} {"train_loss": -7.174427509307861, "global_step": 185995, "epoch": 4428} {"train_loss": -7.264317512512207, "global_step": 185996, "epoch": 4428} {"train_loss": -7.257664680480957, "global_step": 185997, "epoch": 4428} {"train_loss": -7.277295112609863, "global_step": 185998, "epoch": 4428} {"train_loss": -7.196008682250977, "global_step": 185999, "epoch": 4428} {"train_loss": -7.122795104980469, "global_step": 186000, "epoch": 4428} {"train_loss": -7.117210388183594, "global_step": 186001, "epoch": 4428} {"train_loss": -7.245031356811523, "global_step": 186002, "epoch": 4428} {"train_loss": -7.233994007110596, "global_step": 186003, "epoch": 4428} {"train_loss": -7.210546493530273, "global_step": 186004, "epoch": 4428} {"train_loss": -7.2249345779418945, "global_step": 186005, "epoch": 4428} {"train_loss": -7.18797492980957, "global_step": 186006, "epoch": 4428} {"train_loss": -7.239552021026611, "global_step": 186007, "epoch": 4428} {"train_loss": -7.130744457244873, "global_step": 186008, "epoch": 4428} {"train_loss": -7.1450090408325195, "global_step": 186009, "epoch": 4428} {"train_loss": -7.207093238830566, "global_step": 186010, "epoch": 4428} {"train_loss": -7.102023601531982, "global_step": 186011, "epoch": 4428} {"train_loss": -7.130599021911621, "global_step": 186012, "epoch": 4428} {"train_loss": -7.238705635070801, "global_step": 186013, "epoch": 4428} {"train_loss": -7.130348205566406, "global_step": 186014, "epoch": 4428} {"train_loss": -7.179554462432861, "global_step": 186015, "epoch": 4428} {"train_loss": -7.182012557983398, "global_step": 186016, "epoch": 4428} {"train_loss": -7.188001712163289, "global_step": 186017, "epoch": 4428, "val_loss": 69468.421875} {"train_loss": -7.16402530670166, "global_step": 186018, "epoch": 4429} {"train_loss": -7.168041706085205, "global_step": 186019, "epoch": 4429} {"train_loss": -7.208251953125, "global_step": 186020, "epoch": 4429} {"train_loss": -7.020757675170898, "global_step": 186021, "epoch": 4429} {"train_loss": -7.06623649597168, "global_step": 186022, "epoch": 4429} {"train_loss": -7.07346248626709, "global_step": 186023, "epoch": 4429} {"train_loss": -7.005332946777344, "global_step": 186024, "epoch": 4429} {"train_loss": -7.125914096832275, "global_step": 186025, "epoch": 4429} {"train_loss": -7.098087310791016, "global_step": 186026, "epoch": 4429} {"train_loss": -7.009530544281006, "global_step": 186027, "epoch": 4429} {"train_loss": -7.1004133224487305, "global_step": 186028, "epoch": 4429} {"train_loss": -7.178927421569824, "global_step": 186029, "epoch": 4429} {"train_loss": -7.103872776031494, "global_step": 186030, "epoch": 4429} {"train_loss": -7.1738152503967285, "global_step": 186031, "epoch": 4429} {"train_loss": -7.009976387023926, "global_step": 186032, "epoch": 4429} {"train_loss": -7.141427993774414, "global_step": 186033, "epoch": 4429} {"train_loss": -7.095474720001221, "global_step": 186034, "epoch": 4429} {"train_loss": -7.211892127990723, "global_step": 186035, "epoch": 4429} {"train_loss": -7.005180835723877, "global_step": 186036, "epoch": 4429} {"train_loss": -6.954523086547852, "global_step": 186037, "epoch": 4429} {"train_loss": -7.085175514221191, "global_step": 186038, "epoch": 4429} {"train_loss": -7.087155342102051, "global_step": 186039, "epoch": 4429} {"train_loss": -7.26647424697876, "global_step": 186040, "epoch": 4429} {"train_loss": -7.08868408203125, "global_step": 186041, "epoch": 4429} {"train_loss": -7.186637878417969, "global_step": 186042, "epoch": 4429} {"train_loss": -7.07033634185791, "global_step": 186043, "epoch": 4429} {"train_loss": -7.125250816345215, "global_step": 186044, "epoch": 4429} {"train_loss": -7.066450119018555, "global_step": 186045, "epoch": 4429} {"train_loss": -7.124006271362305, "global_step": 186046, "epoch": 4429} {"train_loss": -7.1996331214904785, "global_step": 186047, "epoch": 4429} {"train_loss": -7.134469985961914, "global_step": 186048, "epoch": 4429} {"train_loss": -7.08383846282959, "global_step": 186049, "epoch": 4429} {"train_loss": -7.210943222045898, "global_step": 186050, "epoch": 4429} {"train_loss": -7.15471076965332, "global_step": 186051, "epoch": 4429} {"train_loss": -7.2252326011657715, "global_step": 186052, "epoch": 4429} {"train_loss": -7.14060115814209, "global_step": 186053, "epoch": 4429} {"train_loss": -7.129561901092529, "global_step": 186054, "epoch": 4429} {"train_loss": -7.1306328773498535, "global_step": 186055, "epoch": 4429} {"train_loss": -7.1202497482299805, "global_step": 186056, "epoch": 4429} {"train_loss": -7.074735641479492, "global_step": 186057, "epoch": 4429} {"train_loss": -7.139129638671875, "global_step": 186058, "epoch": 4429} {"train_loss": -7.117198660260155, "global_step": 186059, "epoch": 4429, "val_loss": 69646.421875} {"train_loss": -7.094864845275879, "global_step": 186060, "epoch": 4430} {"train_loss": -7.171614646911621, "global_step": 186061, "epoch": 4430} {"train_loss": -7.154079914093018, "global_step": 186062, "epoch": 4430} {"train_loss": -7.025050163269043, "global_step": 186063, "epoch": 4430} {"train_loss": -7.201382637023926, "global_step": 186064, "epoch": 4430} {"train_loss": -7.163451194763184, "global_step": 186065, "epoch": 4430} {"train_loss": -7.127036094665527, "global_step": 186066, "epoch": 4430} {"train_loss": -7.111568927764893, "global_step": 186067, "epoch": 4430} {"train_loss": -7.177152633666992, "global_step": 186068, "epoch": 4430} {"train_loss": -6.955241680145264, "global_step": 186069, "epoch": 4430} {"train_loss": -7.128748893737793, "global_step": 186070, "epoch": 4430} {"train_loss": -7.115932464599609, "global_step": 186071, "epoch": 4430} {"train_loss": -7.121375560760498, "global_step": 186072, "epoch": 4430} {"train_loss": -7.071083068847656, "global_step": 186073, "epoch": 4430} {"train_loss": -7.1054534912109375, "global_step": 186074, "epoch": 4430} {"train_loss": -7.217626094818115, "global_step": 186075, "epoch": 4430} {"train_loss": -7.125729084014893, "global_step": 186076, "epoch": 4430} {"train_loss": -7.169803619384766, "global_step": 186077, "epoch": 4430} {"train_loss": -7.2312164306640625, "global_step": 186078, "epoch": 4430} {"train_loss": -7.163271903991699, "global_step": 186079, "epoch": 4430} {"train_loss": -7.242208003997803, "global_step": 186080, "epoch": 4430} {"train_loss": -7.110238552093506, "global_step": 186081, "epoch": 4430} {"train_loss": -7.1455583572387695, "global_step": 186082, "epoch": 4430} {"train_loss": -7.206785678863525, "global_step": 186083, "epoch": 4430} {"train_loss": -7.008994102478027, "global_step": 186084, "epoch": 4430} {"train_loss": -7.185813903808594, "global_step": 186085, "epoch": 4430} {"train_loss": -7.214511394500732, "global_step": 186086, "epoch": 4430} {"train_loss": -7.218691349029541, "global_step": 186087, "epoch": 4430} {"train_loss": -7.185641288757324, "global_step": 186088, "epoch": 4430} {"train_loss": -7.1389055252075195, "global_step": 186089, "epoch": 4430} {"train_loss": -7.164529800415039, "global_step": 186090, "epoch": 4430} {"train_loss": -7.174548149108887, "global_step": 186091, "epoch": 4430} {"train_loss": -7.298647403717041, "global_step": 186092, "epoch": 4430} {"train_loss": -7.1284990310668945, "global_step": 186093, "epoch": 4430} {"train_loss": -7.187370300292969, "global_step": 186094, "epoch": 4430} {"train_loss": -7.180967807769775, "global_step": 186095, "epoch": 4430} {"train_loss": -7.133655548095703, "global_step": 186096, "epoch": 4430} {"train_loss": -7.219769477844238, "global_step": 186097, "epoch": 4430} {"train_loss": -7.201050758361816, "global_step": 186098, "epoch": 4430} {"train_loss": -7.152449131011963, "global_step": 186099, "epoch": 4430} {"train_loss": -7.107683181762695, "global_step": 186100, "epoch": 4430} {"train_loss": -7.151538701284499, "global_step": 186101, "epoch": 4430, "val_loss": 69359.375} {"train_loss": -7.180643558502197, "global_step": 186102, "epoch": 4431} {"train_loss": -7.150953769683838, "global_step": 186103, "epoch": 4431} {"train_loss": -7.256106376647949, "global_step": 186104, "epoch": 4431} {"train_loss": -7.202266693115234, "global_step": 186105, "epoch": 4431} {"train_loss": -7.160050868988037, "global_step": 186106, "epoch": 4431} {"train_loss": -7.230522155761719, "global_step": 186107, "epoch": 4431} {"train_loss": -7.173283576965332, "global_step": 186108, "epoch": 4431} {"train_loss": -7.206944942474365, "global_step": 186109, "epoch": 4431} {"train_loss": -7.207735538482666, "global_step": 186110, "epoch": 4431} {"train_loss": -7.278744697570801, "global_step": 186111, "epoch": 4431} {"train_loss": -7.220834732055664, "global_step": 186112, "epoch": 4431} {"train_loss": -7.260288238525391, "global_step": 186113, "epoch": 4431} {"train_loss": -7.2050957679748535, "global_step": 186114, "epoch": 4431} {"train_loss": -7.207085609436035, "global_step": 186115, "epoch": 4431} {"train_loss": -7.222517013549805, "global_step": 186116, "epoch": 4431} {"train_loss": -7.225984573364258, "global_step": 186117, "epoch": 4431} {"train_loss": -7.244471549987793, "global_step": 186118, "epoch": 4431} {"train_loss": -7.218771934509277, "global_step": 186119, "epoch": 4431} {"train_loss": -7.200722694396973, "global_step": 186120, "epoch": 4431} {"train_loss": -7.18525505065918, "global_step": 186121, "epoch": 4431} {"train_loss": -7.337529182434082, "global_step": 186122, "epoch": 4431} {"train_loss": -7.21364688873291, "global_step": 186123, "epoch": 4431} {"train_loss": -7.219718933105469, "global_step": 186124, "epoch": 4431} {"train_loss": -7.237231254577637, "global_step": 186125, "epoch": 4431} {"train_loss": -7.193982124328613, "global_step": 186126, "epoch": 4431} {"train_loss": -7.204896450042725, "global_step": 186127, "epoch": 4431} {"train_loss": -7.089296817779541, "global_step": 186128, "epoch": 4431} {"train_loss": -7.189082145690918, "global_step": 186129, "epoch": 4431} {"train_loss": -7.191667556762695, "global_step": 186130, "epoch": 4431} {"train_loss": -7.221003532409668, "global_step": 186131, "epoch": 4431} {"train_loss": -7.213170051574707, "global_step": 186132, "epoch": 4431} {"train_loss": -7.1150221824646, "global_step": 186133, "epoch": 4431} {"train_loss": -7.108396053314209, "global_step": 186134, "epoch": 4431} {"train_loss": -7.216036319732666, "global_step": 186135, "epoch": 4431} {"train_loss": -7.136959075927734, "global_step": 186136, "epoch": 4431} {"train_loss": -7.148946762084961, "global_step": 186137, "epoch": 4431} {"train_loss": -6.9452948570251465, "global_step": 186138, "epoch": 4431} {"train_loss": -7.012753963470459, "global_step": 186139, "epoch": 4431} {"train_loss": -7.100028991699219, "global_step": 186140, "epoch": 4431} {"train_loss": -7.104230880737305, "global_step": 186141, "epoch": 4431} {"train_loss": -7.2048749923706055, "global_step": 186142, "epoch": 4431} {"train_loss": -7.18450056938898, "global_step": 186143, "epoch": 4431, "val_loss": 69604.453125} {"train_loss": -7.123444080352783, "global_step": 186144, "epoch": 4432} {"train_loss": -7.023246765136719, "global_step": 186145, "epoch": 4432} {"train_loss": -7.101834774017334, "global_step": 186146, "epoch": 4432} {"train_loss": -7.037714958190918, "global_step": 186147, "epoch": 4432} {"train_loss": -7.182730197906494, "global_step": 186148, "epoch": 4432} {"train_loss": -7.068052768707275, "global_step": 186149, "epoch": 4432} {"train_loss": -7.1188530921936035, "global_step": 186150, "epoch": 4432} {"train_loss": -7.044731140136719, "global_step": 186151, "epoch": 4432} {"train_loss": -7.111944198608398, "global_step": 186152, "epoch": 4432} {"train_loss": -7.034412384033203, "global_step": 186153, "epoch": 4432} {"train_loss": -7.025334358215332, "global_step": 186154, "epoch": 4432} {"train_loss": -7.031780242919922, "global_step": 186155, "epoch": 4432} {"train_loss": -7.017112731933594, "global_step": 186156, "epoch": 4432} {"train_loss": -7.155302047729492, "global_step": 186157, "epoch": 4432} {"train_loss": -6.99642276763916, "global_step": 186158, "epoch": 4432} {"train_loss": -7.0846710205078125, "global_step": 186159, "epoch": 4432} {"train_loss": -6.969112873077393, "global_step": 186160, "epoch": 4432} {"train_loss": -6.9855241775512695, "global_step": 186161, "epoch": 4432} {"train_loss": -7.099847793579102, "global_step": 186162, "epoch": 4432} {"train_loss": -7.098822116851807, "global_step": 186163, "epoch": 4432} {"train_loss": -7.138187885284424, "global_step": 186164, "epoch": 4432} {"train_loss": -7.0286431312561035, "global_step": 186165, "epoch": 4432} {"train_loss": -7.176860809326172, "global_step": 186166, "epoch": 4432} {"train_loss": -7.000056266784668, "global_step": 186167, "epoch": 4432} {"train_loss": -7.157040596008301, "global_step": 186168, "epoch": 4432} {"train_loss": -7.123897075653076, "global_step": 186169, "epoch": 4432} {"train_loss": -7.140663146972656, "global_step": 186170, "epoch": 4432} {"train_loss": -7.0647430419921875, "global_step": 186171, "epoch": 4432} {"train_loss": -7.077603340148926, "global_step": 186172, "epoch": 4432} {"train_loss": -7.213162422180176, "global_step": 186173, "epoch": 4432} {"train_loss": -7.198422908782959, "global_step": 186174, "epoch": 4432} {"train_loss": -7.129768371582031, "global_step": 186175, "epoch": 4432} {"train_loss": -7.1455841064453125, "global_step": 186176, "epoch": 4432} {"train_loss": -7.082571983337402, "global_step": 186177, "epoch": 4432} {"train_loss": -7.138249397277832, "global_step": 186178, "epoch": 4432} {"train_loss": -7.097034454345703, "global_step": 186179, "epoch": 4432} {"train_loss": -7.08639669418335, "global_step": 186180, "epoch": 4432} {"train_loss": -7.164229393005371, "global_step": 186181, "epoch": 4432} {"train_loss": -7.153459548950195, "global_step": 186182, "epoch": 4432} {"train_loss": -7.128865718841553, "global_step": 186183, "epoch": 4432} {"train_loss": -7.086054801940918, "global_step": 186184, "epoch": 4432} {"train_loss": -7.094000157855806, "global_step": 186185, "epoch": 4432, "val_loss": 69426.046875} {"train_loss": -7.088204383850098, "global_step": 186186, "epoch": 4433} {"train_loss": -7.1511735916137695, "global_step": 186187, "epoch": 4433} {"train_loss": -7.068114757537842, "global_step": 186188, "epoch": 4433} {"train_loss": -7.190572261810303, "global_step": 186189, "epoch": 4433} {"train_loss": -7.209901809692383, "global_step": 186190, "epoch": 4433} {"train_loss": -7.208415508270264, "global_step": 186191, "epoch": 4433} {"train_loss": -7.172704696655273, "global_step": 186192, "epoch": 4433} {"train_loss": -7.201452255249023, "global_step": 186193, "epoch": 4433} {"train_loss": -7.232452392578125, "global_step": 186194, "epoch": 4433} {"train_loss": -7.3106369972229, "global_step": 186195, "epoch": 4433} {"train_loss": -7.247830390930176, "global_step": 186196, "epoch": 4433} {"train_loss": -7.259014129638672, "global_step": 186197, "epoch": 4433} {"train_loss": -7.191710472106934, "global_step": 186198, "epoch": 4433} {"train_loss": -7.145259857177734, "global_step": 186199, "epoch": 4433} {"train_loss": -7.204921722412109, "global_step": 186200, "epoch": 4433} {"train_loss": -7.245617866516113, "global_step": 186201, "epoch": 4433} {"train_loss": -7.103207111358643, "global_step": 186202, "epoch": 4433} {"train_loss": -7.311427116394043, "global_step": 186203, "epoch": 4433} {"train_loss": -7.29328727722168, "global_step": 186204, "epoch": 4433} {"train_loss": -7.2186760902404785, "global_step": 186205, "epoch": 4433} {"train_loss": -7.345150947570801, "global_step": 186206, "epoch": 4433} {"train_loss": -7.226965427398682, "global_step": 186207, "epoch": 4433} {"train_loss": -7.116301536560059, "global_step": 186208, "epoch": 4433} {"train_loss": -7.334390163421631, "global_step": 186209, "epoch": 4433} {"train_loss": -7.251629829406738, "global_step": 186210, "epoch": 4433} {"train_loss": -7.059782981872559, "global_step": 186211, "epoch": 4433} {"train_loss": -7.273639678955078, "global_step": 186212, "epoch": 4433} {"train_loss": -7.160407066345215, "global_step": 186213, "epoch": 4433} {"train_loss": -7.221597671508789, "global_step": 186214, "epoch": 4433} {"train_loss": -7.223470211029053, "global_step": 186215, "epoch": 4433} {"train_loss": -7.149618625640869, "global_step": 186216, "epoch": 4433} {"train_loss": -7.183624267578125, "global_step": 186217, "epoch": 4433} {"train_loss": -7.2901763916015625, "global_step": 186218, "epoch": 4433} {"train_loss": -7.242371559143066, "global_step": 186219, "epoch": 4433} {"train_loss": -7.219854831695557, "global_step": 186220, "epoch": 4433} {"train_loss": -7.255853652954102, "global_step": 186221, "epoch": 4433} {"train_loss": -7.216166019439697, "global_step": 186222, "epoch": 4433} {"train_loss": -7.2369184494018555, "global_step": 186223, "epoch": 4433} {"train_loss": -7.273979187011719, "global_step": 186224, "epoch": 4433} {"train_loss": -7.257826805114746, "global_step": 186225, "epoch": 4433} {"train_loss": -7.179778099060059, "global_step": 186226, "epoch": 4433} {"train_loss": -7.2139456158592585, "global_step": 186227, "epoch": 4433, "val_loss": 69399.046875} {"train_loss": -7.33371639251709, "global_step": 186228, "epoch": 4434} {"train_loss": -7.216731548309326, "global_step": 186229, "epoch": 4434} {"train_loss": -7.246101379394531, "global_step": 186230, "epoch": 4434} {"train_loss": -7.145880699157715, "global_step": 186231, "epoch": 4434} {"train_loss": -7.154627323150635, "global_step": 186232, "epoch": 4434} {"train_loss": -7.219424247741699, "global_step": 186233, "epoch": 4434} {"train_loss": -7.183802604675293, "global_step": 186234, "epoch": 4434} {"train_loss": -7.189953804016113, "global_step": 186235, "epoch": 4434} {"train_loss": -7.050711154937744, "global_step": 186236, "epoch": 4434} {"train_loss": -7.157926559448242, "global_step": 186237, "epoch": 4434} {"train_loss": -7.264786720275879, "global_step": 186238, "epoch": 4434} {"train_loss": -7.123022079467773, "global_step": 186239, "epoch": 4434} {"train_loss": -7.286656379699707, "global_step": 186240, "epoch": 4434} {"train_loss": -7.197383880615234, "global_step": 186241, "epoch": 4434} {"train_loss": -7.151886940002441, "global_step": 186242, "epoch": 4434} {"train_loss": -7.246984958648682, "global_step": 186243, "epoch": 4434} {"train_loss": -7.0728960037231445, "global_step": 186244, "epoch": 4434} {"train_loss": -7.143946647644043, "global_step": 186245, "epoch": 4434} {"train_loss": -7.183856964111328, "global_step": 186246, "epoch": 4434} {"train_loss": -7.212189674377441, "global_step": 186247, "epoch": 4434} {"train_loss": -7.191445827484131, "global_step": 186248, "epoch": 4434} {"train_loss": -7.21645450592041, "global_step": 186249, "epoch": 4434} {"train_loss": -7.241713047027588, "global_step": 186250, "epoch": 4434} {"train_loss": -7.289973258972168, "global_step": 186251, "epoch": 4434} {"train_loss": -7.1100921630859375, "global_step": 186252, "epoch": 4434} {"train_loss": -7.308764457702637, "global_step": 186253, "epoch": 4434} {"train_loss": -7.051519393920898, "global_step": 186254, "epoch": 4434} {"train_loss": -7.104888916015625, "global_step": 186255, "epoch": 4434} {"train_loss": -7.191354751586914, "global_step": 186256, "epoch": 4434} {"train_loss": -7.113438606262207, "global_step": 186257, "epoch": 4434} {"train_loss": -6.981042861938477, "global_step": 186258, "epoch": 4434} {"train_loss": -7.119821071624756, "global_step": 186259, "epoch": 4434} {"train_loss": -7.127481937408447, "global_step": 186260, "epoch": 4434} {"train_loss": -7.1130266189575195, "global_step": 186261, "epoch": 4434} {"train_loss": -7.171300888061523, "global_step": 186262, "epoch": 4434} {"train_loss": -7.086775302886963, "global_step": 186263, "epoch": 4434} {"train_loss": -7.048801898956299, "global_step": 186264, "epoch": 4434} {"train_loss": -7.125064849853516, "global_step": 186265, "epoch": 4434} {"train_loss": -6.938045978546143, "global_step": 186266, "epoch": 4434} {"train_loss": -7.04448127746582, "global_step": 186267, "epoch": 4434} {"train_loss": -7.112039089202881, "global_step": 186268, "epoch": 4434} {"train_loss": -7.154380026317778, "global_step": 186269, "epoch": 4434, "val_loss": 69785.4921875} {"train_loss": -7.048522472381592, "global_step": 186270, "epoch": 4435} {"train_loss": -7.067959308624268, "global_step": 186271, "epoch": 4435} {"train_loss": -7.126302719116211, "global_step": 186272, "epoch": 4435} {"train_loss": -7.006611347198486, "global_step": 186273, "epoch": 4435} {"train_loss": -7.132841110229492, "global_step": 186274, "epoch": 4435} {"train_loss": -7.109964370727539, "global_step": 186275, "epoch": 4435} {"train_loss": -7.019674301147461, "global_step": 186276, "epoch": 4435} {"train_loss": -7.002896308898926, "global_step": 186277, "epoch": 4435} {"train_loss": -7.115175247192383, "global_step": 186278, "epoch": 4435} {"train_loss": -7.102725982666016, "global_step": 186279, "epoch": 4435} {"train_loss": -7.0146870613098145, "global_step": 186280, "epoch": 4435} {"train_loss": -7.116157531738281, "global_step": 186281, "epoch": 4435} {"train_loss": -7.0616912841796875, "global_step": 186282, "epoch": 4435} {"train_loss": -7.164969444274902, "global_step": 186283, "epoch": 4435} {"train_loss": -7.143681049346924, "global_step": 186284, "epoch": 4435} {"train_loss": -7.128129959106445, "global_step": 186285, "epoch": 4435} {"train_loss": -7.079638481140137, "global_step": 186286, "epoch": 4435} {"train_loss": -7.13551139831543, "global_step": 186287, "epoch": 4435} {"train_loss": -7.134524345397949, "global_step": 186288, "epoch": 4435} {"train_loss": -7.166436672210693, "global_step": 186289, "epoch": 4435} {"train_loss": -7.14405632019043, "global_step": 186290, "epoch": 4435} {"train_loss": -7.131656646728516, "global_step": 186291, "epoch": 4435} {"train_loss": -7.165256977081299, "global_step": 186292, "epoch": 4435} {"train_loss": -7.155643463134766, "global_step": 186293, "epoch": 4435} {"train_loss": -7.041501045227051, "global_step": 186294, "epoch": 4435} {"train_loss": -7.098603248596191, "global_step": 186295, "epoch": 4435} {"train_loss": -7.152998924255371, "global_step": 186296, "epoch": 4435} {"train_loss": -7.12249755859375, "global_step": 186297, "epoch": 4435} {"train_loss": -7.053372383117676, "global_step": 186298, "epoch": 4435} {"train_loss": -7.108617782592773, "global_step": 186299, "epoch": 4435} {"train_loss": -7.116381645202637, "global_step": 186300, "epoch": 4435} {"train_loss": -7.100603103637695, "global_step": 186301, "epoch": 4435} {"train_loss": -7.020448207855225, "global_step": 186302, "epoch": 4435} {"train_loss": -7.184604644775391, "global_step": 186303, "epoch": 4435} {"train_loss": -7.159132480621338, "global_step": 186304, "epoch": 4435} {"train_loss": -7.135974884033203, "global_step": 186305, "epoch": 4435} {"train_loss": -7.1149725914001465, "global_step": 186306, "epoch": 4435} {"train_loss": -7.083057880401611, "global_step": 186307, "epoch": 4435} {"train_loss": -7.111678123474121, "global_step": 186308, "epoch": 4435} {"train_loss": -7.2152099609375, "global_step": 186309, "epoch": 4435} {"train_loss": -7.080687046051025, "global_step": 186310, "epoch": 4435} {"train_loss": -7.107377619970412, "global_step": 186311, "epoch": 4435, "val_loss": 69470.25} {"train_loss": -7.115981101989746, "global_step": 186312, "epoch": 4436} {"train_loss": -7.218825340270996, "global_step": 186313, "epoch": 4436} {"train_loss": -7.092392921447754, "global_step": 186314, "epoch": 4436} {"train_loss": -7.094947338104248, "global_step": 186315, "epoch": 4436} {"train_loss": -7.095237731933594, "global_step": 186316, "epoch": 4436} {"train_loss": -7.248786926269531, "global_step": 186317, "epoch": 4436} {"train_loss": -7.134050369262695, "global_step": 186318, "epoch": 4436} {"train_loss": -7.127976417541504, "global_step": 186319, "epoch": 4436} {"train_loss": -7.195782661437988, "global_step": 186320, "epoch": 4436} {"train_loss": -7.17486572265625, "global_step": 186321, "epoch": 4436} {"train_loss": -7.299790859222412, "global_step": 186322, "epoch": 4436} {"train_loss": -7.194976806640625, "global_step": 186323, "epoch": 4436} {"train_loss": -7.228151321411133, "global_step": 186324, "epoch": 4436} {"train_loss": -7.2145280838012695, "global_step": 186325, "epoch": 4436} {"train_loss": -7.193469524383545, "global_step": 186326, "epoch": 4436} {"train_loss": -7.2472076416015625, "global_step": 186327, "epoch": 4436} {"train_loss": -7.273223876953125, "global_step": 186328, "epoch": 4436} {"train_loss": -7.219609260559082, "global_step": 186329, "epoch": 4436} {"train_loss": -7.0664472579956055, "global_step": 186330, "epoch": 4436} {"train_loss": -7.128300666809082, "global_step": 186331, "epoch": 4436} {"train_loss": -7.229592800140381, "global_step": 186332, "epoch": 4436} {"train_loss": -7.072615146636963, "global_step": 186333, "epoch": 4436} {"train_loss": -7.20380973815918, "global_step": 186334, "epoch": 4436} {"train_loss": -7.202172756195068, "global_step": 186335, "epoch": 4436} {"train_loss": -7.07127571105957, "global_step": 186336, "epoch": 4436} {"train_loss": -7.204130172729492, "global_step": 186337, "epoch": 4436} {"train_loss": -7.138382911682129, "global_step": 186338, "epoch": 4436} {"train_loss": -7.071099281311035, "global_step": 186339, "epoch": 4436} {"train_loss": -7.180246353149414, "global_step": 186340, "epoch": 4436} {"train_loss": -7.174210548400879, "global_step": 186341, "epoch": 4436} {"train_loss": -7.128831386566162, "global_step": 186342, "epoch": 4436} {"train_loss": -7.090161323547363, "global_step": 186343, "epoch": 4436} {"train_loss": -6.918079376220703, "global_step": 186344, "epoch": 4436} {"train_loss": -7.132086753845215, "global_step": 186345, "epoch": 4436} {"train_loss": -7.00242805480957, "global_step": 186346, "epoch": 4436} {"train_loss": -7.122509002685547, "global_step": 186347, "epoch": 4436} {"train_loss": -7.137028217315674, "global_step": 186348, "epoch": 4436} {"train_loss": -6.916535377502441, "global_step": 186349, "epoch": 4436} {"train_loss": -7.109590530395508, "global_step": 186350, "epoch": 4436} {"train_loss": -7.034780502319336, "global_step": 186351, "epoch": 4436} {"train_loss": -7.0591230392456055, "global_step": 186352, "epoch": 4436} {"train_loss": -7.1356723081497915, "global_step": 186353, "epoch": 4436, "val_loss": 69512.6953125} {"train_loss": -7.133677005767822, "global_step": 186354, "epoch": 4437} {"train_loss": -7.070430755615234, "global_step": 186355, "epoch": 4437} {"train_loss": -7.2089009284973145, "global_step": 186356, "epoch": 4437} {"train_loss": -7.1183271408081055, "global_step": 186357, "epoch": 4437} {"train_loss": -7.170943260192871, "global_step": 186358, "epoch": 4437} {"train_loss": -7.130314826965332, "global_step": 186359, "epoch": 4437} {"train_loss": -7.154239654541016, "global_step": 186360, "epoch": 4437} {"train_loss": -7.181992530822754, "global_step": 186361, "epoch": 4437} {"train_loss": -7.095418930053711, "global_step": 186362, "epoch": 4437} {"train_loss": -7.24393367767334, "global_step": 186363, "epoch": 4437} {"train_loss": -7.184195518493652, "global_step": 186364, "epoch": 4437} {"train_loss": -7.193256378173828, "global_step": 186365, "epoch": 4437} {"train_loss": -7.165469646453857, "global_step": 186366, "epoch": 4437} {"train_loss": -7.168448448181152, "global_step": 186367, "epoch": 4437} {"train_loss": -7.182812690734863, "global_step": 186368, "epoch": 4437} {"train_loss": -7.145085334777832, "global_step": 186369, "epoch": 4437} {"train_loss": -7.216279983520508, "global_step": 186370, "epoch": 4437} {"train_loss": -7.133175849914551, "global_step": 186371, "epoch": 4437} {"train_loss": -7.151844501495361, "global_step": 186372, "epoch": 4437} {"train_loss": -7.068496227264404, "global_step": 186373, "epoch": 4437} {"train_loss": -7.145383834838867, "global_step": 186374, "epoch": 4437} {"train_loss": -7.213605880737305, "global_step": 186375, "epoch": 4437} {"train_loss": -7.127541542053223, "global_step": 186376, "epoch": 4437} {"train_loss": -7.073467254638672, "global_step": 186377, "epoch": 4437} {"train_loss": -7.233360290527344, "global_step": 186378, "epoch": 4437} {"train_loss": -7.195732593536377, "global_step": 186379, "epoch": 4437} {"train_loss": -7.096513748168945, "global_step": 186380, "epoch": 4437} {"train_loss": -7.114923477172852, "global_step": 186381, "epoch": 4437} {"train_loss": -7.140851974487305, "global_step": 186382, "epoch": 4437} {"train_loss": -7.101097106933594, "global_step": 186383, "epoch": 4437} {"train_loss": -7.1853108406066895, "global_step": 186384, "epoch": 4437} {"train_loss": -7.031368255615234, "global_step": 186385, "epoch": 4437} {"train_loss": -7.145083427429199, "global_step": 186386, "epoch": 4437} {"train_loss": -7.145729064941406, "global_step": 186387, "epoch": 4437} {"train_loss": -7.190542697906494, "global_step": 186388, "epoch": 4437} {"train_loss": -7.194910049438477, "global_step": 186389, "epoch": 4437} {"train_loss": -7.122543811798096, "global_step": 186390, "epoch": 4437} {"train_loss": -7.156847953796387, "global_step": 186391, "epoch": 4437} {"train_loss": -7.1159515380859375, "global_step": 186392, "epoch": 4437} {"train_loss": -7.145644187927246, "global_step": 186393, "epoch": 4437} {"train_loss": -7.1463942527771, "global_step": 186394, "epoch": 4437} {"train_loss": -7.151943774450393, "global_step": 186395, "epoch": 4437, "val_loss": 69456.7421875} {"train_loss": -7.209218978881836, "global_step": 186396, "epoch": 4438} {"train_loss": -7.195001125335693, "global_step": 186397, "epoch": 4438} {"train_loss": -7.074967384338379, "global_step": 186398, "epoch": 4438} {"train_loss": -7.1811323165893555, "global_step": 186399, "epoch": 4438} {"train_loss": -7.052939414978027, "global_step": 186400, "epoch": 4438} {"train_loss": -7.128749370574951, "global_step": 186401, "epoch": 4438} {"train_loss": -7.210792541503906, "global_step": 186402, "epoch": 4438} {"train_loss": -7.192485809326172, "global_step": 186403, "epoch": 4438} {"train_loss": -7.222679615020752, "global_step": 186404, "epoch": 4438} {"train_loss": -7.089201927185059, "global_step": 186405, "epoch": 4438} {"train_loss": -7.140108108520508, "global_step": 186406, "epoch": 4438} {"train_loss": -7.199910640716553, "global_step": 186407, "epoch": 4438} {"train_loss": -7.108463287353516, "global_step": 186408, "epoch": 4438} {"train_loss": -7.1042985916137695, "global_step": 186409, "epoch": 4438} {"train_loss": -7.085350036621094, "global_step": 186410, "epoch": 4438} {"train_loss": -7.051480770111084, "global_step": 186411, "epoch": 4438} {"train_loss": -7.076457977294922, "global_step": 186412, "epoch": 4438} {"train_loss": -7.086455345153809, "global_step": 186413, "epoch": 4438} {"train_loss": -6.821911811828613, "global_step": 186414, "epoch": 4438} {"train_loss": -6.699458122253418, "global_step": 186415, "epoch": 4438} {"train_loss": -6.999415397644043, "global_step": 186416, "epoch": 4438} {"train_loss": -6.831203937530518, "global_step": 186417, "epoch": 4438} {"train_loss": -6.992189884185791, "global_step": 186418, "epoch": 4438} {"train_loss": -6.936520576477051, "global_step": 186419, "epoch": 4438} {"train_loss": -6.943584442138672, "global_step": 186420, "epoch": 4438} {"train_loss": -6.99838399887085, "global_step": 186421, "epoch": 4438} {"train_loss": -7.1250529289245605, "global_step": 186422, "epoch": 4438} {"train_loss": -7.04002571105957, "global_step": 186423, "epoch": 4438} {"train_loss": -7.049549102783203, "global_step": 186424, "epoch": 4438} {"train_loss": -6.90153694152832, "global_step": 186425, "epoch": 4438} {"train_loss": -7.069137096405029, "global_step": 186426, "epoch": 4438} {"train_loss": -7.05087423324585, "global_step": 186427, "epoch": 4438} {"train_loss": -7.043330669403076, "global_step": 186428, "epoch": 4438} {"train_loss": -6.966371536254883, "global_step": 186429, "epoch": 4438} {"train_loss": -6.879306793212891, "global_step": 186430, "epoch": 4438} {"train_loss": -7.0421977043151855, "global_step": 186431, "epoch": 4438} {"train_loss": -6.981579780578613, "global_step": 186432, "epoch": 4438} {"train_loss": -7.00631046295166, "global_step": 186433, "epoch": 4438} {"train_loss": -6.905369281768799, "global_step": 186434, "epoch": 4438} {"train_loss": -6.924968719482422, "global_step": 186435, "epoch": 4438} {"train_loss": -6.931944847106934, "global_step": 186436, "epoch": 4438} {"train_loss": -7.031568663460868, "global_step": 186437, "epoch": 4438, "val_loss": 69470.625} {"train_loss": -7.04304313659668, "global_step": 186438, "epoch": 4439} {"train_loss": -7.025169849395752, "global_step": 186439, "epoch": 4439} {"train_loss": -7.02139949798584, "global_step": 186440, "epoch": 4439} {"train_loss": -6.897767543792725, "global_step": 186441, "epoch": 4439} {"train_loss": -7.041623592376709, "global_step": 186442, "epoch": 4439} {"train_loss": -6.942838668823242, "global_step": 186443, "epoch": 4439} {"train_loss": -6.943332672119141, "global_step": 186444, "epoch": 4439} {"train_loss": -7.052504062652588, "global_step": 186445, "epoch": 4439} {"train_loss": -6.992633819580078, "global_step": 186446, "epoch": 4439} {"train_loss": -7.0403900146484375, "global_step": 186447, "epoch": 4439} {"train_loss": -7.0042009353637695, "global_step": 186448, "epoch": 4439} {"train_loss": -6.985892295837402, "global_step": 186449, "epoch": 4439} {"train_loss": -7.023237705230713, "global_step": 186450, "epoch": 4439} {"train_loss": -7.045161247253418, "global_step": 186451, "epoch": 4439} {"train_loss": -7.066471099853516, "global_step": 186452, "epoch": 4439} {"train_loss": -7.045836448669434, "global_step": 186453, "epoch": 4439} {"train_loss": -7.059774398803711, "global_step": 186454, "epoch": 4439} {"train_loss": -7.023534774780273, "global_step": 186455, "epoch": 4439} {"train_loss": -7.125823974609375, "global_step": 186456, "epoch": 4439} {"train_loss": -7.049561500549316, "global_step": 186457, "epoch": 4439} {"train_loss": -7.193280220031738, "global_step": 186458, "epoch": 4439} {"train_loss": -7.140899658203125, "global_step": 186459, "epoch": 4439} {"train_loss": -7.147246360778809, "global_step": 186460, "epoch": 4439} {"train_loss": -7.15242338180542, "global_step": 186461, "epoch": 4439} {"train_loss": -7.12992000579834, "global_step": 186462, "epoch": 4439} {"train_loss": -7.223255157470703, "global_step": 186463, "epoch": 4439} {"train_loss": -7.160893440246582, "global_step": 186464, "epoch": 4439} {"train_loss": -7.232542991638184, "global_step": 186465, "epoch": 4439} {"train_loss": -7.113124370574951, "global_step": 186466, "epoch": 4439} {"train_loss": -7.180513858795166, "global_step": 186467, "epoch": 4439} {"train_loss": -7.152656555175781, "global_step": 186468, "epoch": 4439} {"train_loss": -7.24251127243042, "global_step": 186469, "epoch": 4439} {"train_loss": -7.145882606506348, "global_step": 186470, "epoch": 4439} {"train_loss": -7.119494438171387, "global_step": 186471, "epoch": 4439} {"train_loss": -7.1821417808532715, "global_step": 186472, "epoch": 4439} {"train_loss": -7.0816240310668945, "global_step": 186473, "epoch": 4439} {"train_loss": -7.208799362182617, "global_step": 186474, "epoch": 4439} {"train_loss": -7.258744239807129, "global_step": 186475, "epoch": 4439} {"train_loss": -7.194664001464844, "global_step": 186476, "epoch": 4439} {"train_loss": -7.236018657684326, "global_step": 186477, "epoch": 4439} {"train_loss": -7.223020076751709, "global_step": 186478, "epoch": 4439} {"train_loss": -7.103642543156941, "global_step": 186479, "epoch": 4439, "val_loss": 69433.015625} {"train_loss": -7.212691783905029, "global_step": 186480, "epoch": 4440} {"train_loss": -7.170233726501465, "global_step": 186481, "epoch": 4440} {"train_loss": -7.2228288650512695, "global_step": 186482, "epoch": 4440} {"train_loss": -7.1311421394348145, "global_step": 186483, "epoch": 4440} {"train_loss": -7.175944805145264, "global_step": 186484, "epoch": 4440} {"train_loss": -7.201891899108887, "global_step": 186485, "epoch": 4440} {"train_loss": -7.143745422363281, "global_step": 186486, "epoch": 4440} {"train_loss": -7.058754920959473, "global_step": 186487, "epoch": 4440} {"train_loss": -7.243277549743652, "global_step": 186488, "epoch": 4440} {"train_loss": -7.180904388427734, "global_step": 186489, "epoch": 4440} {"train_loss": -7.1156182289123535, "global_step": 186490, "epoch": 4440} {"train_loss": -7.166843414306641, "global_step": 186491, "epoch": 4440} {"train_loss": -7.152841567993164, "global_step": 186492, "epoch": 4440} {"train_loss": -7.1654558181762695, "global_step": 186493, "epoch": 4440} {"train_loss": -7.087920188903809, "global_step": 186494, "epoch": 4440} {"train_loss": -7.044277191162109, "global_step": 186495, "epoch": 4440} {"train_loss": -7.164401054382324, "global_step": 186496, "epoch": 4440} {"train_loss": -7.086476802825928, "global_step": 186497, "epoch": 4440} {"train_loss": -7.3300347328186035, "global_step": 186498, "epoch": 4440} {"train_loss": -7.171777248382568, "global_step": 186499, "epoch": 4440} {"train_loss": -7.093009948730469, "global_step": 186500, "epoch": 4440} {"train_loss": -7.135402679443359, "global_step": 186501, "epoch": 4440} {"train_loss": -7.107529640197754, "global_step": 186502, "epoch": 4440} {"train_loss": -7.180098533630371, "global_step": 186503, "epoch": 4440} {"train_loss": -7.124933242797852, "global_step": 186504, "epoch": 4440} {"train_loss": -7.156383037567139, "global_step": 186505, "epoch": 4440} {"train_loss": -7.189358711242676, "global_step": 186506, "epoch": 4440} {"train_loss": -7.227066993713379, "global_step": 186507, "epoch": 4440} {"train_loss": -7.125027179718018, "global_step": 186508, "epoch": 4440} {"train_loss": -7.1814470291137695, "global_step": 186509, "epoch": 4440} {"train_loss": -7.258752822875977, "global_step": 186510, "epoch": 4440} {"train_loss": -7.034853935241699, "global_step": 186511, "epoch": 4440} {"train_loss": -7.157492637634277, "global_step": 186512, "epoch": 4440} {"train_loss": -7.0692315101623535, "global_step": 186513, "epoch": 4440} {"train_loss": -7.075193405151367, "global_step": 186514, "epoch": 4440} {"train_loss": -7.109330177307129, "global_step": 186515, "epoch": 4440} {"train_loss": -7.195105075836182, "global_step": 186516, "epoch": 4440} {"train_loss": -7.164315223693848, "global_step": 186517, "epoch": 4440} {"train_loss": -7.198558330535889, "global_step": 186518, "epoch": 4440} {"train_loss": -7.2975687980651855, "global_step": 186519, "epoch": 4440} {"train_loss": -7.101162910461426, "global_step": 186520, "epoch": 4440} {"train_loss": -7.159010092417399, "global_step": 186521, "epoch": 4440, "val_loss": 69303.25} {"train_loss": -7.258662223815918, "global_step": 186522, "epoch": 4441} {"train_loss": -7.226624011993408, "global_step": 186523, "epoch": 4441} {"train_loss": -7.241647720336914, "global_step": 186524, "epoch": 4441} {"train_loss": -7.137673377990723, "global_step": 186525, "epoch": 4441} {"train_loss": -7.239400863647461, "global_step": 186526, "epoch": 4441} {"train_loss": -7.3053436279296875, "global_step": 186527, "epoch": 4441} {"train_loss": -7.285312175750732, "global_step": 186528, "epoch": 4441} {"train_loss": -7.191576957702637, "global_step": 186529, "epoch": 4441} {"train_loss": -7.1297807693481445, "global_step": 186530, "epoch": 4441} {"train_loss": -7.329442977905273, "global_step": 186531, "epoch": 4441} {"train_loss": -7.154114723205566, "global_step": 186532, "epoch": 4441} {"train_loss": -7.260032653808594, "global_step": 186533, "epoch": 4441} {"train_loss": -7.1652960777282715, "global_step": 186534, "epoch": 4441} {"train_loss": -7.201831817626953, "global_step": 186535, "epoch": 4441} {"train_loss": -7.2276835441589355, "global_step": 186536, "epoch": 4441} {"train_loss": -7.111091613769531, "global_step": 186537, "epoch": 4441} {"train_loss": -7.315265655517578, "global_step": 186538, "epoch": 4441} {"train_loss": -7.172414302825928, "global_step": 186539, "epoch": 4441} {"train_loss": -7.156002044677734, "global_step": 186540, "epoch": 4441} {"train_loss": -7.068079948425293, "global_step": 186541, "epoch": 4441} {"train_loss": -7.243129730224609, "global_step": 186542, "epoch": 4441} {"train_loss": -7.169739723205566, "global_step": 186543, "epoch": 4441} {"train_loss": -7.1929779052734375, "global_step": 186544, "epoch": 4441} {"train_loss": -7.317063808441162, "global_step": 186545, "epoch": 4441} {"train_loss": -7.11009407043457, "global_step": 186546, "epoch": 4441} {"train_loss": -7.072637557983398, "global_step": 186547, "epoch": 4441} {"train_loss": -7.186621189117432, "global_step": 186548, "epoch": 4441} {"train_loss": -7.093652725219727, "global_step": 186549, "epoch": 4441} {"train_loss": -7.065550804138184, "global_step": 186550, "epoch": 4441} {"train_loss": -7.142708778381348, "global_step": 186551, "epoch": 4441} {"train_loss": -6.979846954345703, "global_step": 186552, "epoch": 4441} {"train_loss": -7.218987464904785, "global_step": 186553, "epoch": 4441} {"train_loss": -7.020770072937012, "global_step": 186554, "epoch": 4441} {"train_loss": -7.049526214599609, "global_step": 186555, "epoch": 4441} {"train_loss": -7.0735697746276855, "global_step": 186556, "epoch": 4441} {"train_loss": -7.080121040344238, "global_step": 186557, "epoch": 4441} {"train_loss": -7.041974067687988, "global_step": 186558, "epoch": 4441} {"train_loss": -7.050850868225098, "global_step": 186559, "epoch": 4441} {"train_loss": -7.149842739105225, "global_step": 186560, "epoch": 4441} {"train_loss": -7.211394786834717, "global_step": 186561, "epoch": 4441} {"train_loss": -7.123100280761719, "global_step": 186562, "epoch": 4441} {"train_loss": -7.165530556724185, "global_step": 186563, "epoch": 4441, "val_loss": 69608.3203125} {"train_loss": -7.081026077270508, "global_step": 186564, "epoch": 4442} {"train_loss": -7.114684104919434, "global_step": 186565, "epoch": 4442} {"train_loss": -7.148870468139648, "global_step": 186566, "epoch": 4442} {"train_loss": -7.096887588500977, "global_step": 186567, "epoch": 4442} {"train_loss": -7.110074996948242, "global_step": 186568, "epoch": 4442} {"train_loss": -7.150494575500488, "global_step": 186569, "epoch": 4442} {"train_loss": -7.209538459777832, "global_step": 186570, "epoch": 4442} {"train_loss": -7.118661403656006, "global_step": 186571, "epoch": 4442} {"train_loss": -7.124566555023193, "global_step": 186572, "epoch": 4442} {"train_loss": -7.174681663513184, "global_step": 186573, "epoch": 4442} {"train_loss": -7.239212989807129, "global_step": 186574, "epoch": 4442} {"train_loss": -7.079864978790283, "global_step": 186575, "epoch": 4442} {"train_loss": -7.169340133666992, "global_step": 186576, "epoch": 4442} {"train_loss": -7.153415679931641, "global_step": 186577, "epoch": 4442} {"train_loss": -7.359548568725586, "global_step": 186578, "epoch": 4442} {"train_loss": -7.108968257904053, "global_step": 186579, "epoch": 4442} {"train_loss": -7.216422080993652, "global_step": 186580, "epoch": 4442} {"train_loss": -7.16274356842041, "global_step": 186581, "epoch": 4442} {"train_loss": -7.235195159912109, "global_step": 186582, "epoch": 4442} {"train_loss": -7.13728141784668, "global_step": 186583, "epoch": 4442} {"train_loss": -7.120437145233154, "global_step": 186584, "epoch": 4442} {"train_loss": -7.091195106506348, "global_step": 186585, "epoch": 4442} {"train_loss": -7.098177909851074, "global_step": 186586, "epoch": 4442} {"train_loss": -7.041265487670898, "global_step": 186587, "epoch": 4442} {"train_loss": -7.1453447341918945, "global_step": 186588, "epoch": 4442} {"train_loss": -7.046091079711914, "global_step": 186589, "epoch": 4442} {"train_loss": -7.1233720779418945, "global_step": 186590, "epoch": 4442} {"train_loss": -7.0164666175842285, "global_step": 186591, "epoch": 4442} {"train_loss": -7.034624099731445, "global_step": 186592, "epoch": 4442} {"train_loss": -7.237152099609375, "global_step": 186593, "epoch": 4442} {"train_loss": -7.179518699645996, "global_step": 186594, "epoch": 4442} {"train_loss": -7.126675605773926, "global_step": 186595, "epoch": 4442} {"train_loss": -7.145781517028809, "global_step": 186596, "epoch": 4442} {"train_loss": -7.194497585296631, "global_step": 186597, "epoch": 4442} {"train_loss": -7.153512954711914, "global_step": 186598, "epoch": 4442} {"train_loss": -7.301841735839844, "global_step": 186599, "epoch": 4442} {"train_loss": -7.1658735275268555, "global_step": 186600, "epoch": 4442} {"train_loss": -7.319113731384277, "global_step": 186601, "epoch": 4442} {"train_loss": -7.090492248535156, "global_step": 186602, "epoch": 4442} {"train_loss": -7.173318386077881, "global_step": 186603, "epoch": 4442} {"train_loss": -7.082711696624756, "global_step": 186604, "epoch": 4442} {"train_loss": -7.1503545216151645, "global_step": 186605, "epoch": 4442, "val_loss": 69349.421875} {"train_loss": -7.227046966552734, "global_step": 186606, "epoch": 4443} {"train_loss": -7.262454032897949, "global_step": 186607, "epoch": 4443} {"train_loss": -7.189306259155273, "global_step": 186608, "epoch": 4443} {"train_loss": -7.065223217010498, "global_step": 186609, "epoch": 4443} {"train_loss": -7.177999496459961, "global_step": 186610, "epoch": 4443} {"train_loss": -7.335939407348633, "global_step": 186611, "epoch": 4443} {"train_loss": -7.164130210876465, "global_step": 186612, "epoch": 4443} {"train_loss": -7.18939208984375, "global_step": 186613, "epoch": 4443} {"train_loss": -7.202191352844238, "global_step": 186614, "epoch": 4443} {"train_loss": -7.025595664978027, "global_step": 186615, "epoch": 4443} {"train_loss": -7.13167142868042, "global_step": 186616, "epoch": 4443} {"train_loss": -7.172738075256348, "global_step": 186617, "epoch": 4443} {"train_loss": -6.909848213195801, "global_step": 186618, "epoch": 4443} {"train_loss": -7.099063873291016, "global_step": 186619, "epoch": 4443} {"train_loss": -7.173673152923584, "global_step": 186620, "epoch": 4443} {"train_loss": -7.0384931564331055, "global_step": 186621, "epoch": 4443} {"train_loss": -7.131548881530762, "global_step": 186622, "epoch": 4443} {"train_loss": -7.118051528930664, "global_step": 186623, "epoch": 4443} {"train_loss": -7.187722206115723, "global_step": 186624, "epoch": 4443} {"train_loss": -7.15584659576416, "global_step": 186625, "epoch": 4443} {"train_loss": -7.181687355041504, "global_step": 186626, "epoch": 4443} {"train_loss": -7.2292022705078125, "global_step": 186627, "epoch": 4443} {"train_loss": -7.2197136878967285, "global_step": 186628, "epoch": 4443} {"train_loss": -7.258432388305664, "global_step": 186629, "epoch": 4443} {"train_loss": -7.139270782470703, "global_step": 186630, "epoch": 4443} {"train_loss": -7.205632209777832, "global_step": 186631, "epoch": 4443} {"train_loss": -7.173388481140137, "global_step": 186632, "epoch": 4443} {"train_loss": -7.141725063323975, "global_step": 186633, "epoch": 4443} {"train_loss": -7.176657199859619, "global_step": 186634, "epoch": 4443} {"train_loss": -7.2387518882751465, "global_step": 186635, "epoch": 4443} {"train_loss": -7.227712631225586, "global_step": 186636, "epoch": 4443} {"train_loss": -7.159184455871582, "global_step": 186637, "epoch": 4443} {"train_loss": -7.266392707824707, "global_step": 186638, "epoch": 4443} {"train_loss": -7.159928321838379, "global_step": 186639, "epoch": 4443} {"train_loss": -7.11519718170166, "global_step": 186640, "epoch": 4443} {"train_loss": -7.174731254577637, "global_step": 186641, "epoch": 4443} {"train_loss": -7.145650863647461, "global_step": 186642, "epoch": 4443} {"train_loss": -7.1425652503967285, "global_step": 186643, "epoch": 4443} {"train_loss": -7.039764881134033, "global_step": 186644, "epoch": 4443} {"train_loss": -7.1287946701049805, "global_step": 186645, "epoch": 4443} {"train_loss": -7.052327632904053, "global_step": 186646, "epoch": 4443} {"train_loss": -7.159422329493931, "global_step": 186647, "epoch": 4443, "val_loss": 69410.515625} {"train_loss": -7.133907318115234, "global_step": 186648, "epoch": 4444} {"train_loss": -7.209239482879639, "global_step": 186649, "epoch": 4444} {"train_loss": -7.26682186126709, "global_step": 186650, "epoch": 4444} {"train_loss": -7.1581854820251465, "global_step": 186651, "epoch": 4444} {"train_loss": -7.224325180053711, "global_step": 186652, "epoch": 4444} {"train_loss": -7.132816791534424, "global_step": 186653, "epoch": 4444} {"train_loss": -7.161191940307617, "global_step": 186654, "epoch": 4444} {"train_loss": -7.159935474395752, "global_step": 186655, "epoch": 4444} {"train_loss": -7.115163803100586, "global_step": 186656, "epoch": 4444} {"train_loss": -7.0327606201171875, "global_step": 186657, "epoch": 4444} {"train_loss": -7.176496505737305, "global_step": 186658, "epoch": 4444} {"train_loss": -7.014571666717529, "global_step": 186659, "epoch": 4444} {"train_loss": -7.166417598724365, "global_step": 186660, "epoch": 4444} {"train_loss": -7.099870681762695, "global_step": 186661, "epoch": 4444} {"train_loss": -7.133127689361572, "global_step": 186662, "epoch": 4444} {"train_loss": -7.056883811950684, "global_step": 186663, "epoch": 4444} {"train_loss": -7.146883964538574, "global_step": 186664, "epoch": 4444} {"train_loss": -7.274993896484375, "global_step": 186665, "epoch": 4444} {"train_loss": -7.105537414550781, "global_step": 186666, "epoch": 4444} {"train_loss": -7.209157943725586, "global_step": 186667, "epoch": 4444} {"train_loss": -7.180240154266357, "global_step": 186668, "epoch": 4444} {"train_loss": -7.193758964538574, "global_step": 186669, "epoch": 4444} {"train_loss": -7.235813140869141, "global_step": 186670, "epoch": 4444} {"train_loss": -7.337779998779297, "global_step": 186671, "epoch": 4444} {"train_loss": -7.191506385803223, "global_step": 186672, "epoch": 4444} {"train_loss": -7.140122890472412, "global_step": 186673, "epoch": 4444} {"train_loss": -7.251440525054932, "global_step": 186674, "epoch": 4444} {"train_loss": -7.150969982147217, "global_step": 186675, "epoch": 4444} {"train_loss": -7.130525588989258, "global_step": 186676, "epoch": 4444} {"train_loss": -7.105227470397949, "global_step": 186677, "epoch": 4444} {"train_loss": -7.098085403442383, "global_step": 186678, "epoch": 4444} {"train_loss": -7.233658790588379, "global_step": 186679, "epoch": 4444} {"train_loss": -7.2865166664123535, "global_step": 186680, "epoch": 4444} {"train_loss": -7.107622146606445, "global_step": 186681, "epoch": 4444} {"train_loss": -7.255928039550781, "global_step": 186682, "epoch": 4444} {"train_loss": -7.1763763427734375, "global_step": 186683, "epoch": 4444} {"train_loss": -7.091371059417725, "global_step": 186684, "epoch": 4444} {"train_loss": -7.174098968505859, "global_step": 186685, "epoch": 4444} {"train_loss": -7.249213218688965, "global_step": 186686, "epoch": 4444} {"train_loss": -7.112342834472656, "global_step": 186687, "epoch": 4444} {"train_loss": -7.195716857910156, "global_step": 186688, "epoch": 4444} {"train_loss": -7.1689565408797495, "global_step": 186689, "epoch": 4444, "val_loss": 69428.3125} {"train_loss": -7.356148719787598, "global_step": 186690, "epoch": 4445} {"train_loss": -7.194850444793701, "global_step": 186691, "epoch": 4445} {"train_loss": -7.148438453674316, "global_step": 186692, "epoch": 4445} {"train_loss": -7.242112159729004, "global_step": 186693, "epoch": 4445} {"train_loss": -7.268977642059326, "global_step": 186694, "epoch": 4445} {"train_loss": -7.232826232910156, "global_step": 186695, "epoch": 4445} {"train_loss": -7.094022274017334, "global_step": 186696, "epoch": 4445} {"train_loss": -7.061407089233398, "global_step": 186697, "epoch": 4445} {"train_loss": -7.251969814300537, "global_step": 186698, "epoch": 4445} {"train_loss": -7.129874229431152, "global_step": 186699, "epoch": 4445} {"train_loss": -7.229096412658691, "global_step": 186700, "epoch": 4445} {"train_loss": -7.1065874099731445, "global_step": 186701, "epoch": 4445} {"train_loss": -7.172390937805176, "global_step": 186702, "epoch": 4445} {"train_loss": -7.113746166229248, "global_step": 186703, "epoch": 4445} {"train_loss": -7.051782608032227, "global_step": 186704, "epoch": 4445} {"train_loss": -7.148479461669922, "global_step": 186705, "epoch": 4445} {"train_loss": -7.044044494628906, "global_step": 186706, "epoch": 4445} {"train_loss": -7.1345133781433105, "global_step": 186707, "epoch": 4445} {"train_loss": -7.029024600982666, "global_step": 186708, "epoch": 4445} {"train_loss": -7.1172332763671875, "global_step": 186709, "epoch": 4445} {"train_loss": -7.085078239440918, "global_step": 186710, "epoch": 4445} {"train_loss": -7.049783706665039, "global_step": 186711, "epoch": 4445} {"train_loss": -7.151300430297852, "global_step": 186712, "epoch": 4445} {"train_loss": -7.069543838500977, "global_step": 186713, "epoch": 4445} {"train_loss": -7.022980690002441, "global_step": 186714, "epoch": 4445} {"train_loss": -7.058978080749512, "global_step": 186715, "epoch": 4445} {"train_loss": -7.081955909729004, "global_step": 186716, "epoch": 4445} {"train_loss": -7.084205150604248, "global_step": 186717, "epoch": 4445} {"train_loss": -7.06254768371582, "global_step": 186718, "epoch": 4445} {"train_loss": -7.075172424316406, "global_step": 186719, "epoch": 4445} {"train_loss": -6.907538890838623, "global_step": 186720, "epoch": 4445} {"train_loss": -6.955745220184326, "global_step": 186721, "epoch": 4445} {"train_loss": -7.091845512390137, "global_step": 186722, "epoch": 4445} {"train_loss": -6.977715492248535, "global_step": 186723, "epoch": 4445} {"train_loss": -7.118679046630859, "global_step": 186724, "epoch": 4445} {"train_loss": -6.981088161468506, "global_step": 186725, "epoch": 4445} {"train_loss": -7.109403610229492, "global_step": 186726, "epoch": 4445} {"train_loss": -6.889045715332031, "global_step": 186727, "epoch": 4445} {"train_loss": -6.969700813293457, "global_step": 186728, "epoch": 4445} {"train_loss": -7.069436073303223, "global_step": 186729, "epoch": 4445} {"train_loss": -7.072098731994629, "global_step": 186730, "epoch": 4445} {"train_loss": -7.094915310541789, "global_step": 186731, "epoch": 4445, "val_loss": 69370.0859375} {"train_loss": -7.062941551208496, "global_step": 186732, "epoch": 4446} {"train_loss": -7.138360500335693, "global_step": 186733, "epoch": 4446} {"train_loss": -7.119054794311523, "global_step": 186734, "epoch": 4446} {"train_loss": -7.020502090454102, "global_step": 186735, "epoch": 4446} {"train_loss": -7.27292537689209, "global_step": 186736, "epoch": 4446} {"train_loss": -7.163471698760986, "global_step": 186737, "epoch": 4446} {"train_loss": -7.1664042472839355, "global_step": 186738, "epoch": 4446} {"train_loss": -7.190807819366455, "global_step": 186739, "epoch": 4446} {"train_loss": -7.193570137023926, "global_step": 186740, "epoch": 4446} {"train_loss": -7.155238628387451, "global_step": 186741, "epoch": 4446} {"train_loss": -7.177807807922363, "global_step": 186742, "epoch": 4446} {"train_loss": -7.089105606079102, "global_step": 186743, "epoch": 4446} {"train_loss": -7.117985725402832, "global_step": 186744, "epoch": 4446} {"train_loss": -7.180727958679199, "global_step": 186745, "epoch": 4446} {"train_loss": -7.2855072021484375, "global_step": 186746, "epoch": 4446} {"train_loss": -7.227909564971924, "global_step": 186747, "epoch": 4446} {"train_loss": -7.072391033172607, "global_step": 186748, "epoch": 4446} {"train_loss": -7.215494632720947, "global_step": 186749, "epoch": 4446} {"train_loss": -7.264854431152344, "global_step": 186750, "epoch": 4446} {"train_loss": -7.197565078735352, "global_step": 186751, "epoch": 4446} {"train_loss": -7.102570533752441, "global_step": 186752, "epoch": 4446} {"train_loss": -7.090459823608398, "global_step": 186753, "epoch": 4446} {"train_loss": -7.183979034423828, "global_step": 186754, "epoch": 4446} {"train_loss": -7.189096450805664, "global_step": 186755, "epoch": 4446} {"train_loss": -7.117857933044434, "global_step": 186756, "epoch": 4446} {"train_loss": -7.266088485717773, "global_step": 186757, "epoch": 4446} {"train_loss": -7.08465576171875, "global_step": 186758, "epoch": 4446} {"train_loss": -7.190247535705566, "global_step": 186759, "epoch": 4446} {"train_loss": -7.222005844116211, "global_step": 186760, "epoch": 4446} {"train_loss": -7.032462120056152, "global_step": 186761, "epoch": 4446} {"train_loss": -7.2671918869018555, "global_step": 186762, "epoch": 4446} {"train_loss": -7.02455997467041, "global_step": 186763, "epoch": 4446} {"train_loss": -7.126945972442627, "global_step": 186764, "epoch": 4446} {"train_loss": -7.069194793701172, "global_step": 186765, "epoch": 4446} {"train_loss": -7.145321846008301, "global_step": 186766, "epoch": 4446} {"train_loss": -7.138874530792236, "global_step": 186767, "epoch": 4446} {"train_loss": -7.0356035232543945, "global_step": 186768, "epoch": 4446} {"train_loss": -7.159881591796875, "global_step": 186769, "epoch": 4446} {"train_loss": -7.139987945556641, "global_step": 186770, "epoch": 4446} {"train_loss": -7.097444534301758, "global_step": 186771, "epoch": 4446} {"train_loss": -6.9445037841796875, "global_step": 186772, "epoch": 4446} {"train_loss": -7.143475736890521, "global_step": 186773, "epoch": 4446, "val_loss": 69517.640625} {"train_loss": -7.110990524291992, "global_step": 186774, "epoch": 4447} {"train_loss": -7.195309638977051, "global_step": 186775, "epoch": 4447} {"train_loss": -7.055624008178711, "global_step": 186776, "epoch": 4447} {"train_loss": -7.163312911987305, "global_step": 186777, "epoch": 4447} {"train_loss": -7.12602424621582, "global_step": 186778, "epoch": 4447} {"train_loss": -7.15109920501709, "global_step": 186779, "epoch": 4447} {"train_loss": -7.177770614624023, "global_step": 186780, "epoch": 4447} {"train_loss": -7.024993896484375, "global_step": 186781, "epoch": 4447} {"train_loss": -7.1765265464782715, "global_step": 186782, "epoch": 4447} {"train_loss": -7.20607328414917, "global_step": 186783, "epoch": 4447} {"train_loss": -7.138767719268799, "global_step": 186784, "epoch": 4447} {"train_loss": -7.18412971496582, "global_step": 186785, "epoch": 4447} {"train_loss": -7.135197162628174, "global_step": 186786, "epoch": 4447} {"train_loss": -7.095852851867676, "global_step": 186787, "epoch": 4447} {"train_loss": -7.262458801269531, "global_step": 186788, "epoch": 4447} {"train_loss": -7.220421314239502, "global_step": 186789, "epoch": 4447} {"train_loss": -7.0958709716796875, "global_step": 186790, "epoch": 4447} {"train_loss": -7.065008163452148, "global_step": 186791, "epoch": 4447} {"train_loss": -7.058036804199219, "global_step": 186792, "epoch": 4447} {"train_loss": -7.055849552154541, "global_step": 186793, "epoch": 4447} {"train_loss": -6.994856834411621, "global_step": 186794, "epoch": 4447} {"train_loss": -7.150921821594238, "global_step": 186795, "epoch": 4447} {"train_loss": -7.164405822753906, "global_step": 186796, "epoch": 4447} {"train_loss": -6.997877597808838, "global_step": 186797, "epoch": 4447} {"train_loss": -7.1702561378479, "global_step": 186798, "epoch": 4447} {"train_loss": -7.068819999694824, "global_step": 186799, "epoch": 4447} {"train_loss": -7.043207168579102, "global_step": 186800, "epoch": 4447} {"train_loss": -7.163083076477051, "global_step": 186801, "epoch": 4447} {"train_loss": -7.0588059425354, "global_step": 186802, "epoch": 4447} {"train_loss": -7.10615348815918, "global_step": 186803, "epoch": 4447} {"train_loss": -7.17192268371582, "global_step": 186804, "epoch": 4447} {"train_loss": -7.097563743591309, "global_step": 186805, "epoch": 4447} {"train_loss": -7.1627068519592285, "global_step": 186806, "epoch": 4447} {"train_loss": -7.058234691619873, "global_step": 186807, "epoch": 4447} {"train_loss": -7.094923973083496, "global_step": 186808, "epoch": 4447} {"train_loss": -7.150434494018555, "global_step": 186809, "epoch": 4447} {"train_loss": -7.084472179412842, "global_step": 186810, "epoch": 4447} {"train_loss": -7.077481746673584, "global_step": 186811, "epoch": 4447} {"train_loss": -7.0434160232543945, "global_step": 186812, "epoch": 4447} {"train_loss": -7.110951900482178, "global_step": 186813, "epoch": 4447} {"train_loss": -7.29018497467041, "global_step": 186814, "epoch": 4447} {"train_loss": -7.121829907099406, "global_step": 186815, "epoch": 4447, "val_loss": 69483.78125} {"train_loss": -7.188548564910889, "global_step": 186816, "epoch": 4448} {"train_loss": -7.1462602615356445, "global_step": 186817, "epoch": 4448} {"train_loss": -7.107192039489746, "global_step": 186818, "epoch": 4448} {"train_loss": -7.164644718170166, "global_step": 186819, "epoch": 4448} {"train_loss": -7.048879623413086, "global_step": 186820, "epoch": 4448} {"train_loss": -7.1769514083862305, "global_step": 186821, "epoch": 4448} {"train_loss": -7.1313982009887695, "global_step": 186822, "epoch": 4448} {"train_loss": -7.1423234939575195, "global_step": 186823, "epoch": 4448} {"train_loss": -7.271015167236328, "global_step": 186824, "epoch": 4448} {"train_loss": -7.161306381225586, "global_step": 186825, "epoch": 4448} {"train_loss": -7.174456596374512, "global_step": 186826, "epoch": 4448} {"train_loss": -7.21583366394043, "global_step": 186827, "epoch": 4448} {"train_loss": -7.246367931365967, "global_step": 186828, "epoch": 4448} {"train_loss": -7.1894097328186035, "global_step": 186829, "epoch": 4448} {"train_loss": -7.005539894104004, "global_step": 186830, "epoch": 4448} {"train_loss": -7.221637725830078, "global_step": 186831, "epoch": 4448} {"train_loss": -7.062839508056641, "global_step": 186832, "epoch": 4448} {"train_loss": -7.087066173553467, "global_step": 186833, "epoch": 4448} {"train_loss": -7.037775039672852, "global_step": 186834, "epoch": 4448} {"train_loss": -7.0654730796813965, "global_step": 186835, "epoch": 4448} {"train_loss": -7.232085227966309, "global_step": 186836, "epoch": 4448} {"train_loss": -7.1057281494140625, "global_step": 186837, "epoch": 4448} {"train_loss": -7.006068229675293, "global_step": 186838, "epoch": 4448} {"train_loss": -7.070626735687256, "global_step": 186839, "epoch": 4448} {"train_loss": -7.106977939605713, "global_step": 186840, "epoch": 4448} {"train_loss": -7.215781211853027, "global_step": 186841, "epoch": 4448} {"train_loss": -7.148893356323242, "global_step": 186842, "epoch": 4448} {"train_loss": -7.033845901489258, "global_step": 186843, "epoch": 4448} {"train_loss": -7.037674427032471, "global_step": 186844, "epoch": 4448} {"train_loss": -7.19514274597168, "global_step": 186845, "epoch": 4448} {"train_loss": -7.1140923500061035, "global_step": 186846, "epoch": 4448} {"train_loss": -7.15521764755249, "global_step": 186847, "epoch": 4448} {"train_loss": -7.1410112380981445, "global_step": 186848, "epoch": 4448} {"train_loss": -7.057191848754883, "global_step": 186849, "epoch": 4448} {"train_loss": -7.151638984680176, "global_step": 186850, "epoch": 4448} {"train_loss": -7.054966926574707, "global_step": 186851, "epoch": 4448} {"train_loss": -7.130910873413086, "global_step": 186852, "epoch": 4448} {"train_loss": -7.091464042663574, "global_step": 186853, "epoch": 4448} {"train_loss": -7.0545244216918945, "global_step": 186854, "epoch": 4448} {"train_loss": -7.0570268630981445, "global_step": 186855, "epoch": 4448} {"train_loss": -7.053264617919922, "global_step": 186856, "epoch": 4448} {"train_loss": -7.1206398123786565, "global_step": 186857, "epoch": 4448, "val_loss": 69480.96875} {"train_loss": -6.965540885925293, "global_step": 186858, "epoch": 4449} {"train_loss": -6.983938217163086, "global_step": 186859, "epoch": 4449} {"train_loss": -6.925260543823242, "global_step": 186860, "epoch": 4449} {"train_loss": -6.999392986297607, "global_step": 186861, "epoch": 4449} {"train_loss": -7.209475040435791, "global_step": 186862, "epoch": 4449} {"train_loss": -6.908140182495117, "global_step": 186863, "epoch": 4449} {"train_loss": -7.097080230712891, "global_step": 186864, "epoch": 4449} {"train_loss": -7.0064263343811035, "global_step": 186865, "epoch": 4449} {"train_loss": -7.005127429962158, "global_step": 186866, "epoch": 4449} {"train_loss": -6.899273872375488, "global_step": 186867, "epoch": 4449} {"train_loss": -7.131893157958984, "global_step": 186868, "epoch": 4449} {"train_loss": -7.021081447601318, "global_step": 186869, "epoch": 4449} {"train_loss": -7.15285587310791, "global_step": 186870, "epoch": 4449} {"train_loss": -6.966620445251465, "global_step": 186871, "epoch": 4449} {"train_loss": -7.043745994567871, "global_step": 186872, "epoch": 4449} {"train_loss": -7.094735622406006, "global_step": 186873, "epoch": 4449} {"train_loss": -7.058985233306885, "global_step": 186874, "epoch": 4449} {"train_loss": -7.239466667175293, "global_step": 186875, "epoch": 4449} {"train_loss": -7.0657734870910645, "global_step": 186876, "epoch": 4449} {"train_loss": -7.04804801940918, "global_step": 186877, "epoch": 4449} {"train_loss": -7.080879211425781, "global_step": 186878, "epoch": 4449} {"train_loss": -7.20851469039917, "global_step": 186879, "epoch": 4449} {"train_loss": -7.086291313171387, "global_step": 186880, "epoch": 4449} {"train_loss": -7.077288627624512, "global_step": 186881, "epoch": 4449} {"train_loss": -7.192024230957031, "global_step": 186882, "epoch": 4449} {"train_loss": -7.179228782653809, "global_step": 186883, "epoch": 4449} {"train_loss": -7.100773811340332, "global_step": 186884, "epoch": 4449} {"train_loss": -7.25267219543457, "global_step": 186885, "epoch": 4449} {"train_loss": -7.202236652374268, "global_step": 186886, "epoch": 4449} {"train_loss": -7.20434045791626, "global_step": 186887, "epoch": 4449} {"train_loss": -7.168889045715332, "global_step": 186888, "epoch": 4449} {"train_loss": -7.218953609466553, "global_step": 186889, "epoch": 4449} {"train_loss": -7.127297401428223, "global_step": 186890, "epoch": 4449} {"train_loss": -7.1508612632751465, "global_step": 186891, "epoch": 4449} {"train_loss": -7.236258506774902, "global_step": 186892, "epoch": 4449} {"train_loss": -7.163419246673584, "global_step": 186893, "epoch": 4449} {"train_loss": -7.19686222076416, "global_step": 186894, "epoch": 4449} {"train_loss": -7.0775909423828125, "global_step": 186895, "epoch": 4449} {"train_loss": -7.162983417510986, "global_step": 186896, "epoch": 4449} {"train_loss": -7.093358993530273, "global_step": 186897, "epoch": 4449} {"train_loss": -7.157505512237549, "global_step": 186898, "epoch": 4449} {"train_loss": -7.103809095564342, "global_step": 186899, "epoch": 4449, "val_loss": 69368.46875} {"train_loss": -7.133520126342773, "global_step": 186900, "epoch": 4450} {"train_loss": -7.126927375793457, "global_step": 186901, "epoch": 4450} {"train_loss": -7.024536609649658, "global_step": 186902, "epoch": 4450} {"train_loss": -7.316224098205566, "global_step": 186903, "epoch": 4450} {"train_loss": -7.1699018478393555, "global_step": 186904, "epoch": 4450} {"train_loss": -7.01779842376709, "global_step": 186905, "epoch": 4450} {"train_loss": -7.130880832672119, "global_step": 186906, "epoch": 4450} {"train_loss": -7.029897689819336, "global_step": 186907, "epoch": 4450} {"train_loss": -7.145089149475098, "global_step": 186908, "epoch": 4450} {"train_loss": -7.157362937927246, "global_step": 186909, "epoch": 4450} {"train_loss": -7.171178817749023, "global_step": 186910, "epoch": 4450} {"train_loss": -7.126122951507568, "global_step": 186911, "epoch": 4450} {"train_loss": -7.145526885986328, "global_step": 186912, "epoch": 4450} {"train_loss": -7.223713397979736, "global_step": 186913, "epoch": 4450} {"train_loss": -7.168065071105957, "global_step": 186914, "epoch": 4450} {"train_loss": -7.1244001388549805, "global_step": 186915, "epoch": 4450} {"train_loss": -7.085251808166504, "global_step": 186916, "epoch": 4450} {"train_loss": -7.176338195800781, "global_step": 186917, "epoch": 4450} {"train_loss": -7.254176139831543, "global_step": 186918, "epoch": 4450} {"train_loss": -7.153459072113037, "global_step": 186919, "epoch": 4450} {"train_loss": -7.161924362182617, "global_step": 186920, "epoch": 4450} {"train_loss": -7.256275177001953, "global_step": 186921, "epoch": 4450} {"train_loss": -7.1402740478515625, "global_step": 186922, "epoch": 4450} {"train_loss": -7.255167007446289, "global_step": 186923, "epoch": 4450} {"train_loss": -7.193521499633789, "global_step": 186924, "epoch": 4450} {"train_loss": -7.101483345031738, "global_step": 186925, "epoch": 4450} {"train_loss": -7.1727495193481445, "global_step": 186926, "epoch": 4450} {"train_loss": -7.21298885345459, "global_step": 186927, "epoch": 4450} {"train_loss": -7.045698642730713, "global_step": 186928, "epoch": 4450} {"train_loss": -7.124753475189209, "global_step": 186929, "epoch": 4450} {"train_loss": -7.190182685852051, "global_step": 186930, "epoch": 4450} {"train_loss": -7.152525424957275, "global_step": 186931, "epoch": 4450} {"train_loss": -7.247257709503174, "global_step": 186932, "epoch": 4450} {"train_loss": -7.2538886070251465, "global_step": 186933, "epoch": 4450} {"train_loss": -7.2527594566345215, "global_step": 186934, "epoch": 4450} {"train_loss": -7.208423614501953, "global_step": 186935, "epoch": 4450} {"train_loss": -7.251385688781738, "global_step": 186936, "epoch": 4450} {"train_loss": -7.174411296844482, "global_step": 186937, "epoch": 4450} {"train_loss": -7.238826751708984, "global_step": 186938, "epoch": 4450} {"train_loss": -7.298148155212402, "global_step": 186939, "epoch": 4450} {"train_loss": -7.141304016113281, "global_step": 186940, "epoch": 4450} {"train_loss": -7.169369584038144, "global_step": 186941, "epoch": 4450, "train/sim_max_reward_0": 0.38204820332103906, "train/sim_max_reward_1": 0.65205380976916, "train/sim_max_reward_2": 0.7710237904676808, "train/sim_max_reward_3": 0.4029155962910986, "train/sim_max_reward_4": 0.9697042695378583, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8961792438333313, "test/sim_max_reward_4300001": 0.5716103527356509, "test/sim_max_reward_4300002": 0.9907722409095556, "test/sim_max_reward_4300003": 0.9923725044117995, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.827342887437094, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.4655276799481324, "test/sim_max_reward_4300008": 0.9934053477784477, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.9698604868783204, "test/sim_max_reward_4300011": 0.9368103945516826, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.40195518034535516, "test/sim_max_reward_4300014": 0.9648651433664326, "test/sim_max_reward_4300015": 0.8911041152234855, "test/sim_max_reward_4300016": 0.8739452815835295, "test/sim_max_reward_4300017": 0.8676760303400554, "test/sim_max_reward_4300018": 0.3989496081133657, "test/sim_max_reward_4300019": 0.18601568010174008, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8233997833950393, "test/sim_max_reward_4300022": 0.937945261878038, "test/sim_max_reward_4300023": 0.8545079695207103, "test/sim_max_reward_4300024": 0.6793532805435841, "test/sim_max_reward_4300025": 0.8066656532549852, "test/sim_max_reward_4300026": 0.1759396903304668, "test/sim_max_reward_4300027": 0.9327178510070465, "test/sim_max_reward_4300028": 0.07842138483816632, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.16060615813473259, "test/sim_max_reward_4300031": 0.21899280584986705, "test/sim_max_reward_4300032": 0.9471974077958398, "test/sim_max_reward_4300033": 0.9902309377692263, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.5741821129930347, "test/sim_max_reward_4300036": 0.20304756138308575, "test/sim_max_reward_4300037": 0.865948118021824, "test/sim_max_reward_4300038": 0.9845079550783831, "test/sim_max_reward_4300039": 0.7478393497742121, "test/sim_max_reward_4300040": 0.94673816215175, "test/sim_max_reward_4300041": 0.9613325397518058, "test/sim_max_reward_4300042": 0.8525097595822207, "test/sim_max_reward_4300043": 0.1369465960128634, "test/sim_max_reward_4300044": 0.8021146471312421, "test/sim_max_reward_4300045": 0.8884067940766739, "test/sim_max_reward_4300046": 0.9323623347375156, "test/sim_max_reward_4300047": 0.15527312533427448, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.09664190744809423, "train/mean_score": 0.5617884047915039, "test/mean_score": 0.6199611086032389, "val_loss": 69527.5390625} {"train_loss": -7.25318717956543, "global_step": 186942, "epoch": 4451} {"train_loss": -7.168525695800781, "global_step": 186943, "epoch": 4451} {"train_loss": -7.1830620765686035, "global_step": 186944, "epoch": 4451} {"train_loss": -7.177699565887451, "global_step": 186945, "epoch": 4451} {"train_loss": -7.172735691070557, "global_step": 186946, "epoch": 4451} {"train_loss": -7.146711826324463, "global_step": 186947, "epoch": 4451} {"train_loss": -7.224262237548828, "global_step": 186948, "epoch": 4451} {"train_loss": -7.325488567352295, "global_step": 186949, "epoch": 4451} {"train_loss": -7.324394702911377, "global_step": 186950, "epoch": 4451} {"train_loss": -7.017972469329834, "global_step": 186951, "epoch": 4451} {"train_loss": -7.155642986297607, "global_step": 186952, "epoch": 4451} {"train_loss": -7.179455757141113, "global_step": 186953, "epoch": 4451} {"train_loss": -7.105901718139648, "global_step": 186954, "epoch": 4451} {"train_loss": -7.24677848815918, "global_step": 186955, "epoch": 4451} {"train_loss": -7.054262161254883, "global_step": 186956, "epoch": 4451} {"train_loss": -7.1734161376953125, "global_step": 186957, "epoch": 4451} {"train_loss": -7.025452613830566, "global_step": 186958, "epoch": 4451} {"train_loss": -7.137652397155762, "global_step": 186959, "epoch": 4451} {"train_loss": -7.009510040283203, "global_step": 186960, "epoch": 4451} {"train_loss": -7.036970615386963, "global_step": 186961, "epoch": 4451} {"train_loss": -7.224539756774902, "global_step": 186962, "epoch": 4451} {"train_loss": -7.221276760101318, "global_step": 186963, "epoch": 4451} {"train_loss": -7.093477725982666, "global_step": 186964, "epoch": 4451} {"train_loss": -7.14580774307251, "global_step": 186965, "epoch": 4451} {"train_loss": -7.220771312713623, "global_step": 186966, "epoch": 4451} {"train_loss": -7.135418891906738, "global_step": 186967, "epoch": 4451} {"train_loss": -7.181874752044678, "global_step": 186968, "epoch": 4451} {"train_loss": -7.225358486175537, "global_step": 186969, "epoch": 4451} {"train_loss": -7.222210884094238, "global_step": 186970, "epoch": 4451} {"train_loss": -7.0640974044799805, "global_step": 186971, "epoch": 4451} {"train_loss": -7.065860271453857, "global_step": 186972, "epoch": 4451} {"train_loss": -7.241167068481445, "global_step": 186973, "epoch": 4451} {"train_loss": -7.149672985076904, "global_step": 186974, "epoch": 4451} {"train_loss": -7.022850036621094, "global_step": 186975, "epoch": 4451} {"train_loss": -7.2339935302734375, "global_step": 186976, "epoch": 4451} {"train_loss": -7.180347442626953, "global_step": 186977, "epoch": 4451} {"train_loss": -7.194390773773193, "global_step": 186978, "epoch": 4451} {"train_loss": -7.19459342956543, "global_step": 186979, "epoch": 4451} {"train_loss": -7.069955825805664, "global_step": 186980, "epoch": 4451} {"train_loss": -7.233363151550293, "global_step": 186981, "epoch": 4451} {"train_loss": -7.243518829345703, "global_step": 186982, "epoch": 4451} {"train_loss": -7.1652689434233165, "global_step": 186983, "epoch": 4451, "val_loss": 69313.109375} {"train_loss": -7.237441062927246, "global_step": 186984, "epoch": 4452} {"train_loss": -7.2090888023376465, "global_step": 186985, "epoch": 4452} {"train_loss": -7.232650279998779, "global_step": 186986, "epoch": 4452} {"train_loss": -7.059602737426758, "global_step": 186987, "epoch": 4452} {"train_loss": -7.148849010467529, "global_step": 186988, "epoch": 4452} {"train_loss": -7.148898124694824, "global_step": 186989, "epoch": 4452} {"train_loss": -7.107011795043945, "global_step": 186990, "epoch": 4452} {"train_loss": -7.060190200805664, "global_step": 186991, "epoch": 4452} {"train_loss": -7.157150745391846, "global_step": 186992, "epoch": 4452} {"train_loss": -7.1049580574035645, "global_step": 186993, "epoch": 4452} {"train_loss": -7.204497814178467, "global_step": 186994, "epoch": 4452} {"train_loss": -7.075831413269043, "global_step": 186995, "epoch": 4452} {"train_loss": -7.21682071685791, "global_step": 186996, "epoch": 4452} {"train_loss": -7.241720199584961, "global_step": 186997, "epoch": 4452} {"train_loss": -7.103366851806641, "global_step": 186998, "epoch": 4452} {"train_loss": -7.088308811187744, "global_step": 186999, "epoch": 4452} {"train_loss": -7.254820346832275, "global_step": 187000, "epoch": 4452} {"train_loss": -7.171150207519531, "global_step": 187001, "epoch": 4452} {"train_loss": -7.246797561645508, "global_step": 187002, "epoch": 4452} {"train_loss": -7.19423770904541, "global_step": 187003, "epoch": 4452} {"train_loss": -7.211794376373291, "global_step": 187004, "epoch": 4452} {"train_loss": -7.177876949310303, "global_step": 187005, "epoch": 4452} {"train_loss": -7.156611442565918, "global_step": 187006, "epoch": 4452} {"train_loss": -7.1699538230896, "global_step": 187007, "epoch": 4452} {"train_loss": -7.207631587982178, "global_step": 187008, "epoch": 4452} {"train_loss": -7.22564697265625, "global_step": 187009, "epoch": 4452} {"train_loss": -7.119248390197754, "global_step": 187010, "epoch": 4452} {"train_loss": -7.216693878173828, "global_step": 187011, "epoch": 4452} {"train_loss": -7.146090507507324, "global_step": 187012, "epoch": 4452} {"train_loss": -7.129461288452148, "global_step": 187013, "epoch": 4452} {"train_loss": -7.344752311706543, "global_step": 187014, "epoch": 4452} {"train_loss": -6.951837062835693, "global_step": 187015, "epoch": 4452} {"train_loss": -7.175532341003418, "global_step": 187016, "epoch": 4452} {"train_loss": -7.011875152587891, "global_step": 187017, "epoch": 4452} {"train_loss": -7.15513277053833, "global_step": 187018, "epoch": 4452} {"train_loss": -7.246206283569336, "global_step": 187019, "epoch": 4452} {"train_loss": -7.002650260925293, "global_step": 187020, "epoch": 4452} {"train_loss": -7.1478590965271, "global_step": 187021, "epoch": 4452} {"train_loss": -6.844736099243164, "global_step": 187022, "epoch": 4452} {"train_loss": -7.046634674072266, "global_step": 187023, "epoch": 4452} {"train_loss": -7.055437088012695, "global_step": 187024, "epoch": 4452} {"train_loss": -7.144989978699457, "global_step": 187025, "epoch": 4452, "val_loss": 69469.9375} {"train_loss": -7.120765686035156, "global_step": 187026, "epoch": 4453} {"train_loss": -6.9606218338012695, "global_step": 187027, "epoch": 4453} {"train_loss": -7.164212703704834, "global_step": 187028, "epoch": 4453} {"train_loss": -7.153749465942383, "global_step": 187029, "epoch": 4453} {"train_loss": -7.105133533477783, "global_step": 187030, "epoch": 4453} {"train_loss": -7.112285137176514, "global_step": 187031, "epoch": 4453} {"train_loss": -7.294816970825195, "global_step": 187032, "epoch": 4453} {"train_loss": -7.2184672355651855, "global_step": 187033, "epoch": 4453} {"train_loss": -7.133596420288086, "global_step": 187034, "epoch": 4453} {"train_loss": -7.025449752807617, "global_step": 187035, "epoch": 4453} {"train_loss": -7.25960636138916, "global_step": 187036, "epoch": 4453} {"train_loss": -7.115400791168213, "global_step": 187037, "epoch": 4453} {"train_loss": -7.14710807800293, "global_step": 187038, "epoch": 4453} {"train_loss": -7.167064666748047, "global_step": 187039, "epoch": 4453} {"train_loss": -7.119825839996338, "global_step": 187040, "epoch": 4453} {"train_loss": -7.238706588745117, "global_step": 187041, "epoch": 4453} {"train_loss": -7.063431739807129, "global_step": 187042, "epoch": 4453} {"train_loss": -7.184713363647461, "global_step": 187043, "epoch": 4453} {"train_loss": -7.21124267578125, "global_step": 187044, "epoch": 4453} {"train_loss": -7.057492256164551, "global_step": 187045, "epoch": 4453} {"train_loss": -7.138710021972656, "global_step": 187046, "epoch": 4453} {"train_loss": -7.1913371086120605, "global_step": 187047, "epoch": 4453} {"train_loss": -7.065552711486816, "global_step": 187048, "epoch": 4453} {"train_loss": -7.159979820251465, "global_step": 187049, "epoch": 4453} {"train_loss": -7.160392761230469, "global_step": 187050, "epoch": 4453} {"train_loss": -7.001899719238281, "global_step": 187051, "epoch": 4453} {"train_loss": -7.075152397155762, "global_step": 187052, "epoch": 4453} {"train_loss": -7.0179595947265625, "global_step": 187053, "epoch": 4453} {"train_loss": -7.134378433227539, "global_step": 187054, "epoch": 4453} {"train_loss": -7.1701226234436035, "global_step": 187055, "epoch": 4453} {"train_loss": -7.065183639526367, "global_step": 187056, "epoch": 4453} {"train_loss": -7.207388877868652, "global_step": 187057, "epoch": 4453} {"train_loss": -7.178323745727539, "global_step": 187058, "epoch": 4453} {"train_loss": -7.148566246032715, "global_step": 187059, "epoch": 4453} {"train_loss": -7.1525444984436035, "global_step": 187060, "epoch": 4453} {"train_loss": -7.1361985206604, "global_step": 187061, "epoch": 4453} {"train_loss": -7.02558708190918, "global_step": 187062, "epoch": 4453} {"train_loss": -7.2412519454956055, "global_step": 187063, "epoch": 4453} {"train_loss": -7.176491737365723, "global_step": 187064, "epoch": 4453} {"train_loss": -7.107475757598877, "global_step": 187065, "epoch": 4453} {"train_loss": -7.191720962524414, "global_step": 187066, "epoch": 4453} {"train_loss": -7.135309491838727, "global_step": 187067, "epoch": 4453, "val_loss": 69407.7890625} {"train_loss": -7.128897666931152, "global_step": 187068, "epoch": 4454} {"train_loss": -7.284479141235352, "global_step": 187069, "epoch": 4454} {"train_loss": -7.094451904296875, "global_step": 187070, "epoch": 4454} {"train_loss": -7.2119951248168945, "global_step": 187071, "epoch": 4454} {"train_loss": -7.304717063903809, "global_step": 187072, "epoch": 4454} {"train_loss": -7.211167335510254, "global_step": 187073, "epoch": 4454} {"train_loss": -7.287074565887451, "global_step": 187074, "epoch": 4454} {"train_loss": -7.222864151000977, "global_step": 187075, "epoch": 4454} {"train_loss": -7.220990180969238, "global_step": 187076, "epoch": 4454} {"train_loss": -7.106487274169922, "global_step": 187077, "epoch": 4454} {"train_loss": -7.155460357666016, "global_step": 187078, "epoch": 4454} {"train_loss": -7.172749042510986, "global_step": 187079, "epoch": 4454} {"train_loss": -7.258942127227783, "global_step": 187080, "epoch": 4454} {"train_loss": -7.134022235870361, "global_step": 187081, "epoch": 4454} {"train_loss": -7.225468635559082, "global_step": 187082, "epoch": 4454} {"train_loss": -7.1907758712768555, "global_step": 187083, "epoch": 4454} {"train_loss": -6.988490104675293, "global_step": 187084, "epoch": 4454} {"train_loss": -7.063950538635254, "global_step": 187085, "epoch": 4454} {"train_loss": -7.077216148376465, "global_step": 187086, "epoch": 4454} {"train_loss": -7.126197338104248, "global_step": 187087, "epoch": 4454} {"train_loss": -7.19098424911499, "global_step": 187088, "epoch": 4454} {"train_loss": -7.14327335357666, "global_step": 187089, "epoch": 4454} {"train_loss": -7.153873443603516, "global_step": 187090, "epoch": 4454} {"train_loss": -7.154041767120361, "global_step": 187091, "epoch": 4454} {"train_loss": -7.033875465393066, "global_step": 187092, "epoch": 4454} {"train_loss": -7.140028953552246, "global_step": 187093, "epoch": 4454} {"train_loss": -7.110307216644287, "global_step": 187094, "epoch": 4454} {"train_loss": -7.127136707305908, "global_step": 187095, "epoch": 4454} {"train_loss": -7.138205051422119, "global_step": 187096, "epoch": 4454} {"train_loss": -7.204928874969482, "global_step": 187097, "epoch": 4454} {"train_loss": -7.087959289550781, "global_step": 187098, "epoch": 4454} {"train_loss": -7.12321662902832, "global_step": 187099, "epoch": 4454} {"train_loss": -7.068322658538818, "global_step": 187100, "epoch": 4454} {"train_loss": -7.176127910614014, "global_step": 187101, "epoch": 4454} {"train_loss": -7.071577072143555, "global_step": 187102, "epoch": 4454} {"train_loss": -7.092095375061035, "global_step": 187103, "epoch": 4454} {"train_loss": -7.194746971130371, "global_step": 187104, "epoch": 4454} {"train_loss": -7.155276298522949, "global_step": 187105, "epoch": 4454} {"train_loss": -7.073248386383057, "global_step": 187106, "epoch": 4454} {"train_loss": -7.180617332458496, "global_step": 187107, "epoch": 4454} {"train_loss": -7.0966033935546875, "global_step": 187108, "epoch": 4454} {"train_loss": -7.149089722406297, "global_step": 187109, "epoch": 4454, "val_loss": 69505.171875} {"train_loss": -7.16892147064209, "global_step": 187110, "epoch": 4455} {"train_loss": -7.082144737243652, "global_step": 187111, "epoch": 4455} {"train_loss": -7.258047580718994, "global_step": 187112, "epoch": 4455} {"train_loss": -7.2251811027526855, "global_step": 187113, "epoch": 4455} {"train_loss": -7.108058929443359, "global_step": 187114, "epoch": 4455} {"train_loss": -7.078715801239014, "global_step": 187115, "epoch": 4455} {"train_loss": -7.277178764343262, "global_step": 187116, "epoch": 4455} {"train_loss": -7.1793999671936035, "global_step": 187117, "epoch": 4455} {"train_loss": -7.177341461181641, "global_step": 187118, "epoch": 4455} {"train_loss": -7.209566116333008, "global_step": 187119, "epoch": 4455} {"train_loss": -7.098794937133789, "global_step": 187120, "epoch": 4455} {"train_loss": -7.173976898193359, "global_step": 187121, "epoch": 4455} {"train_loss": -7.161795139312744, "global_step": 187122, "epoch": 4455} {"train_loss": -7.216248035430908, "global_step": 187123, "epoch": 4455} {"train_loss": -7.183439254760742, "global_step": 187124, "epoch": 4455} {"train_loss": -7.185551166534424, "global_step": 187125, "epoch": 4455} {"train_loss": -7.266439437866211, "global_step": 187126, "epoch": 4455} {"train_loss": -7.094376564025879, "global_step": 187127, "epoch": 4455} {"train_loss": -7.218052864074707, "global_step": 187128, "epoch": 4455} {"train_loss": -7.184297561645508, "global_step": 187129, "epoch": 4455} {"train_loss": -7.195089340209961, "global_step": 187130, "epoch": 4455} {"train_loss": -7.225899696350098, "global_step": 187131, "epoch": 4455} {"train_loss": -7.1572265625, "global_step": 187132, "epoch": 4455} {"train_loss": -7.284986972808838, "global_step": 187133, "epoch": 4455} {"train_loss": -7.280444145202637, "global_step": 187134, "epoch": 4455} {"train_loss": -7.116573333740234, "global_step": 187135, "epoch": 4455} {"train_loss": -7.192632675170898, "global_step": 187136, "epoch": 4455} {"train_loss": -7.1675920486450195, "global_step": 187137, "epoch": 4455} {"train_loss": -6.956664085388184, "global_step": 187138, "epoch": 4455} {"train_loss": -7.079194068908691, "global_step": 187139, "epoch": 4455} {"train_loss": -7.091711044311523, "global_step": 187140, "epoch": 4455} {"train_loss": -7.140670299530029, "global_step": 187141, "epoch": 4455} {"train_loss": -7.070527076721191, "global_step": 187142, "epoch": 4455} {"train_loss": -6.97032356262207, "global_step": 187143, "epoch": 4455} {"train_loss": -7.048819541931152, "global_step": 187144, "epoch": 4455} {"train_loss": -7.177484035491943, "global_step": 187145, "epoch": 4455} {"train_loss": -7.02260160446167, "global_step": 187146, "epoch": 4455} {"train_loss": -7.235263347625732, "global_step": 187147, "epoch": 4455} {"train_loss": -7.044426918029785, "global_step": 187148, "epoch": 4455} {"train_loss": -7.075168132781982, "global_step": 187149, "epoch": 4455} {"train_loss": -7.148347854614258, "global_step": 187150, "epoch": 4455} {"train_loss": -7.152021419434321, "global_step": 187151, "epoch": 4455, "val_loss": 69697.9453125} {"train_loss": -7.0935378074646, "global_step": 187152, "epoch": 4456} {"train_loss": -7.24716329574585, "global_step": 187153, "epoch": 4456} {"train_loss": -7.1288557052612305, "global_step": 187154, "epoch": 4456} {"train_loss": -7.171380996704102, "global_step": 187155, "epoch": 4456} {"train_loss": -7.191555500030518, "global_step": 187156, "epoch": 4456} {"train_loss": -7.159960746765137, "global_step": 187157, "epoch": 4456} {"train_loss": -7.063044548034668, "global_step": 187158, "epoch": 4456} {"train_loss": -7.033470630645752, "global_step": 187159, "epoch": 4456} {"train_loss": -7.154688358306885, "global_step": 187160, "epoch": 4456} {"train_loss": -7.105047702789307, "global_step": 187161, "epoch": 4456} {"train_loss": -7.251104354858398, "global_step": 187162, "epoch": 4456} {"train_loss": -7.099020004272461, "global_step": 187163, "epoch": 4456} {"train_loss": -7.0859527587890625, "global_step": 187164, "epoch": 4456} {"train_loss": -7.042234420776367, "global_step": 187165, "epoch": 4456} {"train_loss": -7.118249416351318, "global_step": 187166, "epoch": 4456} {"train_loss": -7.18328332901001, "global_step": 187167, "epoch": 4456} {"train_loss": -7.207170486450195, "global_step": 187168, "epoch": 4456} {"train_loss": -7.06510066986084, "global_step": 187169, "epoch": 4456} {"train_loss": -7.145319938659668, "global_step": 187170, "epoch": 4456} {"train_loss": -7.048297882080078, "global_step": 187171, "epoch": 4456} {"train_loss": -7.094631671905518, "global_step": 187172, "epoch": 4456} {"train_loss": -7.05124568939209, "global_step": 187173, "epoch": 4456} {"train_loss": -7.135998249053955, "global_step": 187174, "epoch": 4456} {"train_loss": -7.195426940917969, "global_step": 187175, "epoch": 4456} {"train_loss": -7.183676719665527, "global_step": 187176, "epoch": 4456} {"train_loss": -7.144000053405762, "global_step": 187177, "epoch": 4456} {"train_loss": -6.998530864715576, "global_step": 187178, "epoch": 4456} {"train_loss": -7.105297088623047, "global_step": 187179, "epoch": 4456} {"train_loss": -7.1434431076049805, "global_step": 187180, "epoch": 4456} {"train_loss": -7.120706081390381, "global_step": 187181, "epoch": 4456} {"train_loss": -7.0570454597473145, "global_step": 187182, "epoch": 4456} {"train_loss": -7.198840141296387, "global_step": 187183, "epoch": 4456} {"train_loss": -7.171594619750977, "global_step": 187184, "epoch": 4456} {"train_loss": -7.102540016174316, "global_step": 187185, "epoch": 4456} {"train_loss": -7.095719814300537, "global_step": 187186, "epoch": 4456} {"train_loss": -7.125753402709961, "global_step": 187187, "epoch": 4456} {"train_loss": -7.089239597320557, "global_step": 187188, "epoch": 4456} {"train_loss": -7.08541202545166, "global_step": 187189, "epoch": 4456} {"train_loss": -7.288219928741455, "global_step": 187190, "epoch": 4456} {"train_loss": -7.158904075622559, "global_step": 187191, "epoch": 4456} {"train_loss": -7.080327987670898, "global_step": 187192, "epoch": 4456} {"train_loss": -7.128181968416486, "global_step": 187193, "epoch": 4456, "val_loss": 69430.234375} {"train_loss": -7.1306047439575195, "global_step": 187194, "epoch": 4457} {"train_loss": -7.174442768096924, "global_step": 187195, "epoch": 4457} {"train_loss": -7.1850433349609375, "global_step": 187196, "epoch": 4457} {"train_loss": -7.001051425933838, "global_step": 187197, "epoch": 4457} {"train_loss": -7.282103061676025, "global_step": 187198, "epoch": 4457} {"train_loss": -7.1380157470703125, "global_step": 187199, "epoch": 4457} {"train_loss": -7.2160797119140625, "global_step": 187200, "epoch": 4457} {"train_loss": -7.1737871170043945, "global_step": 187201, "epoch": 4457} {"train_loss": -7.236981391906738, "global_step": 187202, "epoch": 4457} {"train_loss": -7.121198654174805, "global_step": 187203, "epoch": 4457} {"train_loss": -7.257970333099365, "global_step": 187204, "epoch": 4457} {"train_loss": -7.213139533996582, "global_step": 187205, "epoch": 4457} {"train_loss": -7.2586870193481445, "global_step": 187206, "epoch": 4457} {"train_loss": -7.3053998947143555, "global_step": 187207, "epoch": 4457} {"train_loss": -7.287938594818115, "global_step": 187208, "epoch": 4457} {"train_loss": -7.247066497802734, "global_step": 187209, "epoch": 4457} {"train_loss": -7.267797470092773, "global_step": 187210, "epoch": 4457} {"train_loss": -7.148002624511719, "global_step": 187211, "epoch": 4457} {"train_loss": -7.289748191833496, "global_step": 187212, "epoch": 4457} {"train_loss": -7.208034992218018, "global_step": 187213, "epoch": 4457} {"train_loss": -7.1921281814575195, "global_step": 187214, "epoch": 4457} {"train_loss": -7.125347137451172, "global_step": 187215, "epoch": 4457} {"train_loss": -7.290886878967285, "global_step": 187216, "epoch": 4457} {"train_loss": -7.199943542480469, "global_step": 187217, "epoch": 4457} {"train_loss": -7.193293571472168, "global_step": 187218, "epoch": 4457} {"train_loss": -7.164802551269531, "global_step": 187219, "epoch": 4457} {"train_loss": -7.228719711303711, "global_step": 187220, "epoch": 4457} {"train_loss": -7.1886396408081055, "global_step": 187221, "epoch": 4457} {"train_loss": -7.191650390625, "global_step": 187222, "epoch": 4457} {"train_loss": -7.241916656494141, "global_step": 187223, "epoch": 4457} {"train_loss": -7.113836288452148, "global_step": 187224, "epoch": 4457} {"train_loss": -7.123316287994385, "global_step": 187225, "epoch": 4457} {"train_loss": -7.181670188903809, "global_step": 187226, "epoch": 4457} {"train_loss": -7.171271324157715, "global_step": 187227, "epoch": 4457} {"train_loss": -7.043255805969238, "global_step": 187228, "epoch": 4457} {"train_loss": -7.06272029876709, "global_step": 187229, "epoch": 4457} {"train_loss": -7.077889442443848, "global_step": 187230, "epoch": 4457} {"train_loss": -7.019030570983887, "global_step": 187231, "epoch": 4457} {"train_loss": -7.213276386260986, "global_step": 187232, "epoch": 4457} {"train_loss": -7.066051959991455, "global_step": 187233, "epoch": 4457} {"train_loss": -7.075948238372803, "global_step": 187234, "epoch": 4457} {"train_loss": -7.176657495044527, "global_step": 187235, "epoch": 4457, "val_loss": 69669.3203125} {"train_loss": -7.129583358764648, "global_step": 187236, "epoch": 4458} {"train_loss": -7.217731952667236, "global_step": 187237, "epoch": 4458} {"train_loss": -7.00222635269165, "global_step": 187238, "epoch": 4458} {"train_loss": -7.114964485168457, "global_step": 187239, "epoch": 4458} {"train_loss": -7.164127349853516, "global_step": 187240, "epoch": 4458} {"train_loss": -7.235107898712158, "global_step": 187241, "epoch": 4458} {"train_loss": -7.161669731140137, "global_step": 187242, "epoch": 4458} {"train_loss": -7.1434807777404785, "global_step": 187243, "epoch": 4458} {"train_loss": -7.200993537902832, "global_step": 187244, "epoch": 4458} {"train_loss": -7.191051006317139, "global_step": 187245, "epoch": 4458} {"train_loss": -7.105738639831543, "global_step": 187246, "epoch": 4458} {"train_loss": -7.25185489654541, "global_step": 187247, "epoch": 4458} {"train_loss": -7.214906692504883, "global_step": 187248, "epoch": 4458} {"train_loss": -7.126237869262695, "global_step": 187249, "epoch": 4458} {"train_loss": -7.185839653015137, "global_step": 187250, "epoch": 4458} {"train_loss": -7.137072563171387, "global_step": 187251, "epoch": 4458} {"train_loss": -7.217397689819336, "global_step": 187252, "epoch": 4458} {"train_loss": -7.242778778076172, "global_step": 187253, "epoch": 4458} {"train_loss": -7.091067790985107, "global_step": 187254, "epoch": 4458} {"train_loss": -7.145707130432129, "global_step": 187255, "epoch": 4458} {"train_loss": -7.11838436126709, "global_step": 187256, "epoch": 4458} {"train_loss": -7.259666442871094, "global_step": 187257, "epoch": 4458} {"train_loss": -7.172691345214844, "global_step": 187258, "epoch": 4458} {"train_loss": -7.236146450042725, "global_step": 187259, "epoch": 4458} {"train_loss": -7.1883955001831055, "global_step": 187260, "epoch": 4458} {"train_loss": -7.1927714347839355, "global_step": 187261, "epoch": 4458} {"train_loss": -7.249378681182861, "global_step": 187262, "epoch": 4458} {"train_loss": -7.102383613586426, "global_step": 187263, "epoch": 4458} {"train_loss": -7.189585208892822, "global_step": 187264, "epoch": 4458} {"train_loss": -7.257739067077637, "global_step": 187265, "epoch": 4458} {"train_loss": -7.028769016265869, "global_step": 187266, "epoch": 4458} {"train_loss": -7.093413829803467, "global_step": 187267, "epoch": 4458} {"train_loss": -7.15739631652832, "global_step": 187268, "epoch": 4458} {"train_loss": -7.160881996154785, "global_step": 187269, "epoch": 4458} {"train_loss": -7.25815486907959, "global_step": 187270, "epoch": 4458} {"train_loss": -7.247415542602539, "global_step": 187271, "epoch": 4458} {"train_loss": -7.0692949295043945, "global_step": 187272, "epoch": 4458} {"train_loss": -7.065398216247559, "global_step": 187273, "epoch": 4458} {"train_loss": -7.180935382843018, "global_step": 187274, "epoch": 4458} {"train_loss": -7.0453104972839355, "global_step": 187275, "epoch": 4458} {"train_loss": -7.2052788734436035, "global_step": 187276, "epoch": 4458} {"train_loss": -7.1619165397825695, "global_step": 187277, "epoch": 4458, "val_loss": 69734.8046875} {"train_loss": -7.06367301940918, "global_step": 187278, "epoch": 4459} {"train_loss": -7.221012115478516, "global_step": 187279, "epoch": 4459} {"train_loss": -7.172511100769043, "global_step": 187280, "epoch": 4459} {"train_loss": -7.220436096191406, "global_step": 187281, "epoch": 4459} {"train_loss": -7.0857648849487305, "global_step": 187282, "epoch": 4459} {"train_loss": -7.142580509185791, "global_step": 187283, "epoch": 4459} {"train_loss": -7.07417631149292, "global_step": 187284, "epoch": 4459} {"train_loss": -7.104523658752441, "global_step": 187285, "epoch": 4459} {"train_loss": -7.171738624572754, "global_step": 187286, "epoch": 4459} {"train_loss": -7.149225234985352, "global_step": 187287, "epoch": 4459} {"train_loss": -7.126481533050537, "global_step": 187288, "epoch": 4459} {"train_loss": -7.148889541625977, "global_step": 187289, "epoch": 4459} {"train_loss": -7.1827192306518555, "global_step": 187290, "epoch": 4459} {"train_loss": -7.141947269439697, "global_step": 187291, "epoch": 4459} {"train_loss": -7.195696830749512, "global_step": 187292, "epoch": 4459} {"train_loss": -7.130430698394775, "global_step": 187293, "epoch": 4459} {"train_loss": -7.104788303375244, "global_step": 187294, "epoch": 4459} {"train_loss": -7.245743751525879, "global_step": 187295, "epoch": 4459} {"train_loss": -7.136115550994873, "global_step": 187296, "epoch": 4459} {"train_loss": -7.036191463470459, "global_step": 187297, "epoch": 4459} {"train_loss": -7.2222137451171875, "global_step": 187298, "epoch": 4459} {"train_loss": -7.04290771484375, "global_step": 187299, "epoch": 4459} {"train_loss": -6.97421407699585, "global_step": 187300, "epoch": 4459} {"train_loss": -7.171955108642578, "global_step": 187301, "epoch": 4459} {"train_loss": -7.001880168914795, "global_step": 187302, "epoch": 4459} {"train_loss": -7.242856025695801, "global_step": 187303, "epoch": 4459} {"train_loss": -7.13810920715332, "global_step": 187304, "epoch": 4459} {"train_loss": -7.082940101623535, "global_step": 187305, "epoch": 4459} {"train_loss": -7.011519908905029, "global_step": 187306, "epoch": 4459} {"train_loss": -7.086544513702393, "global_step": 187307, "epoch": 4459} {"train_loss": -7.148960113525391, "global_step": 187308, "epoch": 4459} {"train_loss": -7.119333744049072, "global_step": 187309, "epoch": 4459} {"train_loss": -7.087829113006592, "global_step": 187310, "epoch": 4459} {"train_loss": -6.96350622177124, "global_step": 187311, "epoch": 4459} {"train_loss": -7.156131744384766, "global_step": 187312, "epoch": 4459} {"train_loss": -7.181282997131348, "global_step": 187313, "epoch": 4459} {"train_loss": -7.045988082885742, "global_step": 187314, "epoch": 4459} {"train_loss": -7.1414995193481445, "global_step": 187315, "epoch": 4459} {"train_loss": -7.063048362731934, "global_step": 187316, "epoch": 4459} {"train_loss": -7.100952625274658, "global_step": 187317, "epoch": 4459} {"train_loss": -7.0840349197387695, "global_step": 187318, "epoch": 4459} {"train_loss": -7.1207847481682185, "global_step": 187319, "epoch": 4459, "val_loss": 69449.3984375} {"train_loss": -7.09738826751709, "global_step": 187320, "epoch": 4460} {"train_loss": -7.129276275634766, "global_step": 187321, "epoch": 4460} {"train_loss": -7.121642112731934, "global_step": 187322, "epoch": 4460} {"train_loss": -7.106624603271484, "global_step": 187323, "epoch": 4460} {"train_loss": -7.18747091293335, "global_step": 187324, "epoch": 4460} {"train_loss": -7.205169677734375, "global_step": 187325, "epoch": 4460} {"train_loss": -7.165093421936035, "global_step": 187326, "epoch": 4460} {"train_loss": -7.120434761047363, "global_step": 187327, "epoch": 4460} {"train_loss": -7.207192420959473, "global_step": 187328, "epoch": 4460} {"train_loss": -7.152587413787842, "global_step": 187329, "epoch": 4460} {"train_loss": -6.9673871994018555, "global_step": 187330, "epoch": 4460} {"train_loss": -7.053211212158203, "global_step": 187331, "epoch": 4460} {"train_loss": -7.167742729187012, "global_step": 187332, "epoch": 4460} {"train_loss": -7.071386814117432, "global_step": 187333, "epoch": 4460} {"train_loss": -6.989701271057129, "global_step": 187334, "epoch": 4460} {"train_loss": -7.195427894592285, "global_step": 187335, "epoch": 4460} {"train_loss": -7.083270072937012, "global_step": 187336, "epoch": 4460} {"train_loss": -7.079463481903076, "global_step": 187337, "epoch": 4460} {"train_loss": -7.178065299987793, "global_step": 187338, "epoch": 4460} {"train_loss": -7.181854248046875, "global_step": 187339, "epoch": 4460} {"train_loss": -7.110507011413574, "global_step": 187340, "epoch": 4460} {"train_loss": -7.07765531539917, "global_step": 187341, "epoch": 4460} {"train_loss": -7.074226379394531, "global_step": 187342, "epoch": 4460} {"train_loss": -7.153898239135742, "global_step": 187343, "epoch": 4460} {"train_loss": -7.270899772644043, "global_step": 187344, "epoch": 4460} {"train_loss": -7.078141212463379, "global_step": 187345, "epoch": 4460} {"train_loss": -7.12973690032959, "global_step": 187346, "epoch": 4460} {"train_loss": -6.999073028564453, "global_step": 187347, "epoch": 4460} {"train_loss": -7.16868257522583, "global_step": 187348, "epoch": 4460} {"train_loss": -7.078370094299316, "global_step": 187349, "epoch": 4460} {"train_loss": -7.177183151245117, "global_step": 187350, "epoch": 4460} {"train_loss": -7.17000150680542, "global_step": 187351, "epoch": 4460} {"train_loss": -7.084168434143066, "global_step": 187352, "epoch": 4460} {"train_loss": -7.192547798156738, "global_step": 187353, "epoch": 4460} {"train_loss": -7.1211347579956055, "global_step": 187354, "epoch": 4460} {"train_loss": -7.078531265258789, "global_step": 187355, "epoch": 4460} {"train_loss": -7.120053768157959, "global_step": 187356, "epoch": 4460} {"train_loss": -7.09597110748291, "global_step": 187357, "epoch": 4460} {"train_loss": -7.124065399169922, "global_step": 187358, "epoch": 4460} {"train_loss": -7.302250385284424, "global_step": 187359, "epoch": 4460} {"train_loss": -7.171640872955322, "global_step": 187360, "epoch": 4460} {"train_loss": -7.130812315713792, "global_step": 187361, "epoch": 4460, "val_loss": 69444.4375} {"train_loss": -7.217755317687988, "global_step": 187362, "epoch": 4461} {"train_loss": -7.190891265869141, "global_step": 187363, "epoch": 4461} {"train_loss": -7.2815117835998535, "global_step": 187364, "epoch": 4461} {"train_loss": -7.2289652824401855, "global_step": 187365, "epoch": 4461} {"train_loss": -7.336373329162598, "global_step": 187366, "epoch": 4461} {"train_loss": -7.218657493591309, "global_step": 187367, "epoch": 4461} {"train_loss": -7.233606338500977, "global_step": 187368, "epoch": 4461} {"train_loss": -7.195822715759277, "global_step": 187369, "epoch": 4461} {"train_loss": -7.265353202819824, "global_step": 187370, "epoch": 4461} {"train_loss": -7.184618949890137, "global_step": 187371, "epoch": 4461} {"train_loss": -7.286831378936768, "global_step": 187372, "epoch": 4461} {"train_loss": -7.304542541503906, "global_step": 187373, "epoch": 4461} {"train_loss": -7.248333930969238, "global_step": 187374, "epoch": 4461} {"train_loss": -7.141674041748047, "global_step": 187375, "epoch": 4461} {"train_loss": -7.353140830993652, "global_step": 187376, "epoch": 4461} {"train_loss": -7.138406753540039, "global_step": 187377, "epoch": 4461} {"train_loss": -7.278614044189453, "global_step": 187378, "epoch": 4461} {"train_loss": -7.27211856842041, "global_step": 187379, "epoch": 4461} {"train_loss": -7.164337635040283, "global_step": 187380, "epoch": 4461} {"train_loss": -7.380739688873291, "global_step": 187381, "epoch": 4461} {"train_loss": -7.270651817321777, "global_step": 187382, "epoch": 4461} {"train_loss": -7.2637505531311035, "global_step": 187383, "epoch": 4461} {"train_loss": -7.243047714233398, "global_step": 187384, "epoch": 4461} {"train_loss": -7.227457046508789, "global_step": 187385, "epoch": 4461} {"train_loss": -7.126641750335693, "global_step": 187386, "epoch": 4461} {"train_loss": -7.065859317779541, "global_step": 187387, "epoch": 4461} {"train_loss": -7.051800727844238, "global_step": 187388, "epoch": 4461} {"train_loss": -7.232507705688477, "global_step": 187389, "epoch": 4461} {"train_loss": -7.092690467834473, "global_step": 187390, "epoch": 4461} {"train_loss": -7.221016883850098, "global_step": 187391, "epoch": 4461} {"train_loss": -7.322404861450195, "global_step": 187392, "epoch": 4461} {"train_loss": -7.141161918640137, "global_step": 187393, "epoch": 4461} {"train_loss": -7.035885810852051, "global_step": 187394, "epoch": 4461} {"train_loss": -7.157270431518555, "global_step": 187395, "epoch": 4461} {"train_loss": -7.151585578918457, "global_step": 187396, "epoch": 4461} {"train_loss": -7.119897842407227, "global_step": 187397, "epoch": 4461} {"train_loss": -7.220674991607666, "global_step": 187398, "epoch": 4461} {"train_loss": -7.1331281661987305, "global_step": 187399, "epoch": 4461} {"train_loss": -7.113786697387695, "global_step": 187400, "epoch": 4461} {"train_loss": -7.145907402038574, "global_step": 187401, "epoch": 4461} {"train_loss": -7.128810882568359, "global_step": 187402, "epoch": 4461} {"train_loss": -7.203567107518514, "global_step": 187403, "epoch": 4461, "val_loss": 69637.6953125} {"train_loss": -7.23612642288208, "global_step": 187404, "epoch": 4462} {"train_loss": -7.15704870223999, "global_step": 187405, "epoch": 4462} {"train_loss": -7.133461952209473, "global_step": 187406, "epoch": 4462} {"train_loss": -7.149899482727051, "global_step": 187407, "epoch": 4462} {"train_loss": -7.215856075286865, "global_step": 187408, "epoch": 4462} {"train_loss": -7.217772483825684, "global_step": 187409, "epoch": 4462} {"train_loss": -7.1394758224487305, "global_step": 187410, "epoch": 4462} {"train_loss": -7.342344284057617, "global_step": 187411, "epoch": 4462} {"train_loss": -7.221351623535156, "global_step": 187412, "epoch": 4462} {"train_loss": -7.099771499633789, "global_step": 187413, "epoch": 4462} {"train_loss": -7.1645917892456055, "global_step": 187414, "epoch": 4462} {"train_loss": -7.083996772766113, "global_step": 187415, "epoch": 4462} {"train_loss": -7.234580039978027, "global_step": 187416, "epoch": 4462} {"train_loss": -7.232048988342285, "global_step": 187417, "epoch": 4462} {"train_loss": -7.267285346984863, "global_step": 187418, "epoch": 4462} {"train_loss": -7.063508987426758, "global_step": 187419, "epoch": 4462} {"train_loss": -7.184088706970215, "global_step": 187420, "epoch": 4462} {"train_loss": -7.167972564697266, "global_step": 187421, "epoch": 4462} {"train_loss": -7.244601249694824, "global_step": 187422, "epoch": 4462} {"train_loss": -7.112322807312012, "global_step": 187423, "epoch": 4462} {"train_loss": -7.244930267333984, "global_step": 187424, "epoch": 4462} {"train_loss": -7.098738193511963, "global_step": 187425, "epoch": 4462} {"train_loss": -7.072653293609619, "global_step": 187426, "epoch": 4462} {"train_loss": -7.095913887023926, "global_step": 187427, "epoch": 4462} {"train_loss": -6.988986015319824, "global_step": 187428, "epoch": 4462} {"train_loss": -7.018103122711182, "global_step": 187429, "epoch": 4462} {"train_loss": -7.098886013031006, "global_step": 187430, "epoch": 4462} {"train_loss": -7.072544097900391, "global_step": 187431, "epoch": 4462} {"train_loss": -6.94722318649292, "global_step": 187432, "epoch": 4462} {"train_loss": -7.1455183029174805, "global_step": 187433, "epoch": 4462} {"train_loss": -7.004443645477295, "global_step": 187434, "epoch": 4462} {"train_loss": -7.142675876617432, "global_step": 187435, "epoch": 4462} {"train_loss": -7.117124557495117, "global_step": 187436, "epoch": 4462} {"train_loss": -7.0548248291015625, "global_step": 187437, "epoch": 4462} {"train_loss": -7.252228260040283, "global_step": 187438, "epoch": 4462} {"train_loss": -7.091328144073486, "global_step": 187439, "epoch": 4462} {"train_loss": -7.139390468597412, "global_step": 187440, "epoch": 4462} {"train_loss": -7.164674282073975, "global_step": 187441, "epoch": 4462} {"train_loss": -7.173788547515869, "global_step": 187442, "epoch": 4462} {"train_loss": -7.131839752197266, "global_step": 187443, "epoch": 4462} {"train_loss": -7.226626873016357, "global_step": 187444, "epoch": 4462} {"train_loss": -7.144716898600261, "global_step": 187445, "epoch": 4462, "val_loss": 69383.203125} {"train_loss": -7.2148051261901855, "global_step": 187446, "epoch": 4463} {"train_loss": -7.138313293457031, "global_step": 187447, "epoch": 4463} {"train_loss": -7.162336349487305, "global_step": 187448, "epoch": 4463} {"train_loss": -7.194196701049805, "global_step": 187449, "epoch": 4463} {"train_loss": -7.240120887756348, "global_step": 187450, "epoch": 4463} {"train_loss": -7.216252326965332, "global_step": 187451, "epoch": 4463} {"train_loss": -7.217568397521973, "global_step": 187452, "epoch": 4463} {"train_loss": -7.189879894256592, "global_step": 187453, "epoch": 4463} {"train_loss": -7.260044097900391, "global_step": 187454, "epoch": 4463} {"train_loss": -7.117955207824707, "global_step": 187455, "epoch": 4463} {"train_loss": -7.206263542175293, "global_step": 187456, "epoch": 4463} {"train_loss": -7.159201145172119, "global_step": 187457, "epoch": 4463} {"train_loss": -7.273416996002197, "global_step": 187458, "epoch": 4463} {"train_loss": -7.239443778991699, "global_step": 187459, "epoch": 4463} {"train_loss": -7.190879821777344, "global_step": 187460, "epoch": 4463} {"train_loss": -7.264097690582275, "global_step": 187461, "epoch": 4463} {"train_loss": -7.152463912963867, "global_step": 187462, "epoch": 4463} {"train_loss": -7.139453887939453, "global_step": 187463, "epoch": 4463} {"train_loss": -7.251652240753174, "global_step": 187464, "epoch": 4463} {"train_loss": -7.133088111877441, "global_step": 187465, "epoch": 4463} {"train_loss": -7.172821521759033, "global_step": 187466, "epoch": 4463} {"train_loss": -6.972517967224121, "global_step": 187467, "epoch": 4463} {"train_loss": -7.204039573669434, "global_step": 187468, "epoch": 4463} {"train_loss": -7.10603141784668, "global_step": 187469, "epoch": 4463} {"train_loss": -6.982563018798828, "global_step": 187470, "epoch": 4463} {"train_loss": -7.167135238647461, "global_step": 187471, "epoch": 4463} {"train_loss": -6.963397026062012, "global_step": 187472, "epoch": 4463} {"train_loss": -7.0683746337890625, "global_step": 187473, "epoch": 4463} {"train_loss": -7.18669319152832, "global_step": 187474, "epoch": 4463} {"train_loss": -7.112837314605713, "global_step": 187475, "epoch": 4463} {"train_loss": -7.142232418060303, "global_step": 187476, "epoch": 4463} {"train_loss": -7.091376304626465, "global_step": 187477, "epoch": 4463} {"train_loss": -7.187615871429443, "global_step": 187478, "epoch": 4463} {"train_loss": -7.237459182739258, "global_step": 187479, "epoch": 4463} {"train_loss": -7.200000762939453, "global_step": 187480, "epoch": 4463} {"train_loss": -7.221566200256348, "global_step": 187481, "epoch": 4463} {"train_loss": -7.219817638397217, "global_step": 187482, "epoch": 4463} {"train_loss": -7.253955841064453, "global_step": 187483, "epoch": 4463} {"train_loss": -7.177910804748535, "global_step": 187484, "epoch": 4463} {"train_loss": -7.259172439575195, "global_step": 187485, "epoch": 4463} {"train_loss": -7.191255569458008, "global_step": 187486, "epoch": 4463} {"train_loss": -7.174024820327759, "global_step": 187487, "epoch": 4463, "val_loss": 69601.171875} {"train_loss": -7.271209716796875, "global_step": 187488, "epoch": 4464} {"train_loss": -7.2006072998046875, "global_step": 187489, "epoch": 4464} {"train_loss": -7.3355607986450195, "global_step": 187490, "epoch": 4464} {"train_loss": -7.057835578918457, "global_step": 187491, "epoch": 4464} {"train_loss": -7.269068717956543, "global_step": 187492, "epoch": 4464} {"train_loss": -7.114722728729248, "global_step": 187493, "epoch": 4464} {"train_loss": -7.044684410095215, "global_step": 187494, "epoch": 4464} {"train_loss": -7.066573143005371, "global_step": 187495, "epoch": 4464} {"train_loss": -7.130716323852539, "global_step": 187496, "epoch": 4464} {"train_loss": -7.031222343444824, "global_step": 187497, "epoch": 4464} {"train_loss": -7.071584701538086, "global_step": 187498, "epoch": 4464} {"train_loss": -7.169403076171875, "global_step": 187499, "epoch": 4464} {"train_loss": -6.969480037689209, "global_step": 187500, "epoch": 4464} {"train_loss": -7.253312110900879, "global_step": 187501, "epoch": 4464} {"train_loss": -7.220748424530029, "global_step": 187502, "epoch": 4464} {"train_loss": -7.2614665031433105, "global_step": 187503, "epoch": 4464} {"train_loss": -7.120030403137207, "global_step": 187504, "epoch": 4464} {"train_loss": -7.199885845184326, "global_step": 187505, "epoch": 4464} {"train_loss": -7.217770099639893, "global_step": 187506, "epoch": 4464} {"train_loss": -7.205059051513672, "global_step": 187507, "epoch": 4464} {"train_loss": -7.108759880065918, "global_step": 187508, "epoch": 4464} {"train_loss": -7.10884428024292, "global_step": 187509, "epoch": 4464} {"train_loss": -7.351104259490967, "global_step": 187510, "epoch": 4464} {"train_loss": -7.019510746002197, "global_step": 187511, "epoch": 4464} {"train_loss": -7.139923095703125, "global_step": 187512, "epoch": 4464} {"train_loss": -7.216401100158691, "global_step": 187513, "epoch": 4464} {"train_loss": -7.1037139892578125, "global_step": 187514, "epoch": 4464} {"train_loss": -7.037866592407227, "global_step": 187515, "epoch": 4464} {"train_loss": -7.146390914916992, "global_step": 187516, "epoch": 4464} {"train_loss": -7.022317886352539, "global_step": 187517, "epoch": 4464} {"train_loss": -7.150836944580078, "global_step": 187518, "epoch": 4464} {"train_loss": -7.192399978637695, "global_step": 187519, "epoch": 4464} {"train_loss": -7.098320484161377, "global_step": 187520, "epoch": 4464} {"train_loss": -7.237812519073486, "global_step": 187521, "epoch": 4464} {"train_loss": -7.071241855621338, "global_step": 187522, "epoch": 4464} {"train_loss": -7.145994186401367, "global_step": 187523, "epoch": 4464} {"train_loss": -7.138898849487305, "global_step": 187524, "epoch": 4464} {"train_loss": -7.2002668380737305, "global_step": 187525, "epoch": 4464} {"train_loss": -7.206319808959961, "global_step": 187526, "epoch": 4464} {"train_loss": -7.139483451843262, "global_step": 187527, "epoch": 4464} {"train_loss": -7.094088554382324, "global_step": 187528, "epoch": 4464} {"train_loss": -7.150141454878307, "global_step": 187529, "epoch": 4464, "val_loss": 69600.265625} {"train_loss": -7.154618740081787, "global_step": 187530, "epoch": 4465} {"train_loss": -7.039891242980957, "global_step": 187531, "epoch": 4465} {"train_loss": -6.984476566314697, "global_step": 187532, "epoch": 4465} {"train_loss": -7.12434196472168, "global_step": 187533, "epoch": 4465} {"train_loss": -7.15538215637207, "global_step": 187534, "epoch": 4465} {"train_loss": -7.077385902404785, "global_step": 187535, "epoch": 4465} {"train_loss": -7.246598720550537, "global_step": 187536, "epoch": 4465} {"train_loss": -7.0793328285217285, "global_step": 187537, "epoch": 4465} {"train_loss": -7.194047927856445, "global_step": 187538, "epoch": 4465} {"train_loss": -7.192204475402832, "global_step": 187539, "epoch": 4465} {"train_loss": -7.051910877227783, "global_step": 187540, "epoch": 4465} {"train_loss": -7.130898475646973, "global_step": 187541, "epoch": 4465} {"train_loss": -7.167094707489014, "global_step": 187542, "epoch": 4465} {"train_loss": -7.12908935546875, "global_step": 187543, "epoch": 4465} {"train_loss": -7.285716533660889, "global_step": 187544, "epoch": 4465} {"train_loss": -7.209160804748535, "global_step": 187545, "epoch": 4465} {"train_loss": -7.218443870544434, "global_step": 187546, "epoch": 4465} {"train_loss": -7.214142799377441, "global_step": 187547, "epoch": 4465} {"train_loss": -7.224197864532471, "global_step": 187548, "epoch": 4465} {"train_loss": -7.211313247680664, "global_step": 187549, "epoch": 4465} {"train_loss": -7.233695983886719, "global_step": 187550, "epoch": 4465} {"train_loss": -7.18920373916626, "global_step": 187551, "epoch": 4465} {"train_loss": -7.261162757873535, "global_step": 187552, "epoch": 4465} {"train_loss": -7.236089706420898, "global_step": 187553, "epoch": 4465} {"train_loss": -7.270877838134766, "global_step": 187554, "epoch": 4465} {"train_loss": -7.207242012023926, "global_step": 187555, "epoch": 4465} {"train_loss": -7.242440223693848, "global_step": 187556, "epoch": 4465} {"train_loss": -7.126257419586182, "global_step": 187557, "epoch": 4465} {"train_loss": -7.213437080383301, "global_step": 187558, "epoch": 4465} {"train_loss": -7.152131080627441, "global_step": 187559, "epoch": 4465} {"train_loss": -7.232202053070068, "global_step": 187560, "epoch": 4465} {"train_loss": -7.212475776672363, "global_step": 187561, "epoch": 4465} {"train_loss": -7.223564147949219, "global_step": 187562, "epoch": 4465} {"train_loss": -7.213659286499023, "global_step": 187563, "epoch": 4465} {"train_loss": -7.156528472900391, "global_step": 187564, "epoch": 4465} {"train_loss": -7.1827898025512695, "global_step": 187565, "epoch": 4465} {"train_loss": -7.218317031860352, "global_step": 187566, "epoch": 4465} {"train_loss": -7.109866619110107, "global_step": 187567, "epoch": 4465} {"train_loss": -7.210365295410156, "global_step": 187568, "epoch": 4465} {"train_loss": -7.202986717224121, "global_step": 187569, "epoch": 4465} {"train_loss": -7.32291316986084, "global_step": 187570, "epoch": 4465} {"train_loss": -7.18470025062561, "global_step": 187571, "epoch": 4465, "val_loss": 69533.2890625} {"train_loss": -7.113909721374512, "global_step": 187572, "epoch": 4466} {"train_loss": -7.167665481567383, "global_step": 187573, "epoch": 4466} {"train_loss": -7.271417617797852, "global_step": 187574, "epoch": 4466} {"train_loss": -7.066799640655518, "global_step": 187575, "epoch": 4466} {"train_loss": -7.141008377075195, "global_step": 187576, "epoch": 4466} {"train_loss": -7.211065769195557, "global_step": 187577, "epoch": 4466} {"train_loss": -7.338688850402832, "global_step": 187578, "epoch": 4466} {"train_loss": -7.227545261383057, "global_step": 187579, "epoch": 4466} {"train_loss": -7.189023494720459, "global_step": 187580, "epoch": 4466} {"train_loss": -7.174285888671875, "global_step": 187581, "epoch": 4466} {"train_loss": -7.265315055847168, "global_step": 187582, "epoch": 4466} {"train_loss": -7.155656814575195, "global_step": 187583, "epoch": 4466} {"train_loss": -7.236640930175781, "global_step": 187584, "epoch": 4466} {"train_loss": -7.2601318359375, "global_step": 187585, "epoch": 4466} {"train_loss": -7.291413307189941, "global_step": 187586, "epoch": 4466} {"train_loss": -7.184883117675781, "global_step": 187587, "epoch": 4466} {"train_loss": -7.142620086669922, "global_step": 187588, "epoch": 4466} {"train_loss": -7.187170028686523, "global_step": 187589, "epoch": 4466} {"train_loss": -7.204116344451904, "global_step": 187590, "epoch": 4466} {"train_loss": -7.101430892944336, "global_step": 187591, "epoch": 4466} {"train_loss": -7.21803092956543, "global_step": 187592, "epoch": 4466} {"train_loss": -7.206488609313965, "global_step": 187593, "epoch": 4466} {"train_loss": -7.211116790771484, "global_step": 187594, "epoch": 4466} {"train_loss": -7.136186599731445, "global_step": 187595, "epoch": 4466} {"train_loss": -7.2704362869262695, "global_step": 187596, "epoch": 4466} {"train_loss": -7.226884365081787, "global_step": 187597, "epoch": 4466} {"train_loss": -7.33770751953125, "global_step": 187598, "epoch": 4466} {"train_loss": -7.215519905090332, "global_step": 187599, "epoch": 4466} {"train_loss": -7.0865325927734375, "global_step": 187600, "epoch": 4466} {"train_loss": -7.213126182556152, "global_step": 187601, "epoch": 4466} {"train_loss": -7.091050148010254, "global_step": 187602, "epoch": 4466} {"train_loss": -7.196985721588135, "global_step": 187603, "epoch": 4466} {"train_loss": -7.286121368408203, "global_step": 187604, "epoch": 4466} {"train_loss": -7.171056747436523, "global_step": 187605, "epoch": 4466} {"train_loss": -7.143385887145996, "global_step": 187606, "epoch": 4466} {"train_loss": -7.266556739807129, "global_step": 187607, "epoch": 4466} {"train_loss": -7.1912384033203125, "global_step": 187608, "epoch": 4466} {"train_loss": -7.216818809509277, "global_step": 187609, "epoch": 4466} {"train_loss": -7.147037506103516, "global_step": 187610, "epoch": 4466} {"train_loss": -7.077642440795898, "global_step": 187611, "epoch": 4466} {"train_loss": -7.149676322937012, "global_step": 187612, "epoch": 4466} {"train_loss": -7.195144346782139, "global_step": 187613, "epoch": 4466, "val_loss": 69593.8046875} {"train_loss": -7.085846900939941, "global_step": 187614, "epoch": 4467} {"train_loss": -6.898375511169434, "global_step": 187615, "epoch": 4467} {"train_loss": -7.2774152755737305, "global_step": 187616, "epoch": 4467} {"train_loss": -7.136325836181641, "global_step": 187617, "epoch": 4467} {"train_loss": -7.148358345031738, "global_step": 187618, "epoch": 4467} {"train_loss": -7.215311527252197, "global_step": 187619, "epoch": 4467} {"train_loss": -7.046874046325684, "global_step": 187620, "epoch": 4467} {"train_loss": -7.127466201782227, "global_step": 187621, "epoch": 4467} {"train_loss": -7.08422327041626, "global_step": 187622, "epoch": 4467} {"train_loss": -7.01286506652832, "global_step": 187623, "epoch": 4467} {"train_loss": -7.097354888916016, "global_step": 187624, "epoch": 4467} {"train_loss": -7.031340599060059, "global_step": 187625, "epoch": 4467} {"train_loss": -7.086913585662842, "global_step": 187626, "epoch": 4467} {"train_loss": -7.071691513061523, "global_step": 187627, "epoch": 4467} {"train_loss": -7.093697547912598, "global_step": 187628, "epoch": 4467} {"train_loss": -7.075137138366699, "global_step": 187629, "epoch": 4467} {"train_loss": -7.064120292663574, "global_step": 187630, "epoch": 4467} {"train_loss": -7.2183332443237305, "global_step": 187631, "epoch": 4467} {"train_loss": -7.038776397705078, "global_step": 187632, "epoch": 4467} {"train_loss": -7.15196418762207, "global_step": 187633, "epoch": 4467} {"train_loss": -7.30621337890625, "global_step": 187634, "epoch": 4467} {"train_loss": -7.032814979553223, "global_step": 187635, "epoch": 4467} {"train_loss": -7.115384101867676, "global_step": 187636, "epoch": 4467} {"train_loss": -7.206978797912598, "global_step": 187637, "epoch": 4467} {"train_loss": -7.1370344161987305, "global_step": 187638, "epoch": 4467} {"train_loss": -7.120938301086426, "global_step": 187639, "epoch": 4467} {"train_loss": -7.11857795715332, "global_step": 187640, "epoch": 4467} {"train_loss": -7.274033546447754, "global_step": 187641, "epoch": 4467} {"train_loss": -7.090034484863281, "global_step": 187642, "epoch": 4467} {"train_loss": -7.199859619140625, "global_step": 187643, "epoch": 4467} {"train_loss": -7.294279098510742, "global_step": 187644, "epoch": 4467} {"train_loss": -7.096338272094727, "global_step": 187645, "epoch": 4467} {"train_loss": -7.2353973388671875, "global_step": 187646, "epoch": 4467} {"train_loss": -7.245041847229004, "global_step": 187647, "epoch": 4467} {"train_loss": -7.073413848876953, "global_step": 187648, "epoch": 4467} {"train_loss": -7.2295002937316895, "global_step": 187649, "epoch": 4467} {"train_loss": -7.10630464553833, "global_step": 187650, "epoch": 4467} {"train_loss": -7.138550758361816, "global_step": 187651, "epoch": 4467} {"train_loss": -7.113382816314697, "global_step": 187652, "epoch": 4467} {"train_loss": -7.217796325683594, "global_step": 187653, "epoch": 4467} {"train_loss": -7.200199127197266, "global_step": 187654, "epoch": 4467} {"train_loss": -7.134408666974022, "global_step": 187655, "epoch": 4467, "val_loss": 69280.546875} {"train_loss": -7.237642765045166, "global_step": 187656, "epoch": 4468} {"train_loss": -7.196829319000244, "global_step": 187657, "epoch": 4468} {"train_loss": -7.205165863037109, "global_step": 187658, "epoch": 4468} {"train_loss": -7.1972174644470215, "global_step": 187659, "epoch": 4468} {"train_loss": -7.282670974731445, "global_step": 187660, "epoch": 4468} {"train_loss": -7.218194484710693, "global_step": 187661, "epoch": 4468} {"train_loss": -7.1662068367004395, "global_step": 187662, "epoch": 4468} {"train_loss": -7.151473522186279, "global_step": 187663, "epoch": 4468} {"train_loss": -7.223589897155762, "global_step": 187664, "epoch": 4468} {"train_loss": -7.129103183746338, "global_step": 187665, "epoch": 4468} {"train_loss": -7.178188800811768, "global_step": 187666, "epoch": 4468} {"train_loss": -7.11776065826416, "global_step": 187667, "epoch": 4468} {"train_loss": -7.133436679840088, "global_step": 187668, "epoch": 4468} {"train_loss": -7.173165798187256, "global_step": 187669, "epoch": 4468} {"train_loss": -7.172840118408203, "global_step": 187670, "epoch": 4468} {"train_loss": -7.18030309677124, "global_step": 187671, "epoch": 4468} {"train_loss": -7.14421272277832, "global_step": 187672, "epoch": 4468} {"train_loss": -7.051344394683838, "global_step": 187673, "epoch": 4468} {"train_loss": -7.106339454650879, "global_step": 187674, "epoch": 4468} {"train_loss": -7.132699966430664, "global_step": 187675, "epoch": 4468} {"train_loss": -7.04591703414917, "global_step": 187676, "epoch": 4468} {"train_loss": -7.25145959854126, "global_step": 187677, "epoch": 4468} {"train_loss": -7.154886722564697, "global_step": 187678, "epoch": 4468} {"train_loss": -7.129533767700195, "global_step": 187679, "epoch": 4468} {"train_loss": -7.165628433227539, "global_step": 187680, "epoch": 4468} {"train_loss": -7.23292350769043, "global_step": 187681, "epoch": 4468} {"train_loss": -7.205816268920898, "global_step": 187682, "epoch": 4468} {"train_loss": -7.25083065032959, "global_step": 187683, "epoch": 4468} {"train_loss": -7.162472724914551, "global_step": 187684, "epoch": 4468} {"train_loss": -7.223620414733887, "global_step": 187685, "epoch": 4468} {"train_loss": -7.075542449951172, "global_step": 187686, "epoch": 4468} {"train_loss": -7.186187744140625, "global_step": 187687, "epoch": 4468} {"train_loss": -7.214704513549805, "global_step": 187688, "epoch": 4468} {"train_loss": -7.132357597351074, "global_step": 187689, "epoch": 4468} {"train_loss": -7.3061723709106445, "global_step": 187690, "epoch": 4468} {"train_loss": -7.203779697418213, "global_step": 187691, "epoch": 4468} {"train_loss": -7.192501068115234, "global_step": 187692, "epoch": 4468} {"train_loss": -7.21490478515625, "global_step": 187693, "epoch": 4468} {"train_loss": -7.206521987915039, "global_step": 187694, "epoch": 4468} {"train_loss": -7.185829162597656, "global_step": 187695, "epoch": 4468} {"train_loss": -7.2146406173706055, "global_step": 187696, "epoch": 4468} {"train_loss": -7.182271083196004, "global_step": 187697, "epoch": 4468, "val_loss": 69582.28125} {"train_loss": -7.275386810302734, "global_step": 187698, "epoch": 4469} {"train_loss": -7.292314052581787, "global_step": 187699, "epoch": 4469} {"train_loss": -7.246231555938721, "global_step": 187700, "epoch": 4469} {"train_loss": -7.226850986480713, "global_step": 187701, "epoch": 4469} {"train_loss": -7.2632222175598145, "global_step": 187702, "epoch": 4469} {"train_loss": -7.309866428375244, "global_step": 187703, "epoch": 4469} {"train_loss": -7.2290849685668945, "global_step": 187704, "epoch": 4469} {"train_loss": -7.177080154418945, "global_step": 187705, "epoch": 4469} {"train_loss": -7.213393688201904, "global_step": 187706, "epoch": 4469} {"train_loss": -7.2757768630981445, "global_step": 187707, "epoch": 4469} {"train_loss": -7.36588191986084, "global_step": 187708, "epoch": 4469} {"train_loss": -7.291103839874268, "global_step": 187709, "epoch": 4469} {"train_loss": -7.20999813079834, "global_step": 187710, "epoch": 4469} {"train_loss": -7.173789024353027, "global_step": 187711, "epoch": 4469} {"train_loss": -7.266350746154785, "global_step": 187712, "epoch": 4469} {"train_loss": -7.2596259117126465, "global_step": 187713, "epoch": 4469} {"train_loss": -7.241550922393799, "global_step": 187714, "epoch": 4469} {"train_loss": -7.274161338806152, "global_step": 187715, "epoch": 4469} {"train_loss": -7.171786308288574, "global_step": 187716, "epoch": 4469} {"train_loss": -7.255690574645996, "global_step": 187717, "epoch": 4469} {"train_loss": -7.201519966125488, "global_step": 187718, "epoch": 4469} {"train_loss": -7.235645294189453, "global_step": 187719, "epoch": 4469} {"train_loss": -7.2433762550354, "global_step": 187720, "epoch": 4469} {"train_loss": -7.242312431335449, "global_step": 187721, "epoch": 4469} {"train_loss": -7.264101982116699, "global_step": 187722, "epoch": 4469} {"train_loss": -7.198252201080322, "global_step": 187723, "epoch": 4469} {"train_loss": -7.284309387207031, "global_step": 187724, "epoch": 4469} {"train_loss": -7.192727088928223, "global_step": 187725, "epoch": 4469} {"train_loss": -7.144317626953125, "global_step": 187726, "epoch": 4469} {"train_loss": -7.083747863769531, "global_step": 187727, "epoch": 4469} {"train_loss": -7.1795854568481445, "global_step": 187728, "epoch": 4469} {"train_loss": -7.149092674255371, "global_step": 187729, "epoch": 4469} {"train_loss": -7.263668060302734, "global_step": 187730, "epoch": 4469} {"train_loss": -7.1238603591918945, "global_step": 187731, "epoch": 4469} {"train_loss": -7.198451042175293, "global_step": 187732, "epoch": 4469} {"train_loss": -7.136233329772949, "global_step": 187733, "epoch": 4469} {"train_loss": -7.196247100830078, "global_step": 187734, "epoch": 4469} {"train_loss": -7.171417236328125, "global_step": 187735, "epoch": 4469} {"train_loss": -7.210399627685547, "global_step": 187736, "epoch": 4469} {"train_loss": -7.17737340927124, "global_step": 187737, "epoch": 4469} {"train_loss": -7.291602611541748, "global_step": 187738, "epoch": 4469} {"train_loss": -7.22555965468997, "global_step": 187739, "epoch": 4469, "val_loss": 69433.109375} {"train_loss": -7.320588111877441, "global_step": 187740, "epoch": 4470} {"train_loss": -7.204463958740234, "global_step": 187741, "epoch": 4470} {"train_loss": -7.196412086486816, "global_step": 187742, "epoch": 4470} {"train_loss": -7.3528852462768555, "global_step": 187743, "epoch": 4470} {"train_loss": -7.176290512084961, "global_step": 187744, "epoch": 4470} {"train_loss": -7.32351541519165, "global_step": 187745, "epoch": 4470} {"train_loss": -7.360663414001465, "global_step": 187746, "epoch": 4470} {"train_loss": -7.198481559753418, "global_step": 187747, "epoch": 4470} {"train_loss": -7.233728885650635, "global_step": 187748, "epoch": 4470} {"train_loss": -7.248754501342773, "global_step": 187749, "epoch": 4470} {"train_loss": -7.273322582244873, "global_step": 187750, "epoch": 4470} {"train_loss": -7.138774871826172, "global_step": 187751, "epoch": 4470} {"train_loss": -7.231257438659668, "global_step": 187752, "epoch": 4470} {"train_loss": -7.061817169189453, "global_step": 187753, "epoch": 4470} {"train_loss": -7.227962970733643, "global_step": 187754, "epoch": 4470} {"train_loss": -7.247063636779785, "global_step": 187755, "epoch": 4470} {"train_loss": -7.136946678161621, "global_step": 187756, "epoch": 4470} {"train_loss": -7.239498138427734, "global_step": 187757, "epoch": 4470} {"train_loss": -7.029083251953125, "global_step": 187758, "epoch": 4470} {"train_loss": -7.137190341949463, "global_step": 187759, "epoch": 4470} {"train_loss": -7.221615791320801, "global_step": 187760, "epoch": 4470} {"train_loss": -7.009550094604492, "global_step": 187761, "epoch": 4470} {"train_loss": -7.111100673675537, "global_step": 187762, "epoch": 4470} {"train_loss": -7.210355281829834, "global_step": 187763, "epoch": 4470} {"train_loss": -7.060052394866943, "global_step": 187764, "epoch": 4470} {"train_loss": -7.121506214141846, "global_step": 187765, "epoch": 4470} {"train_loss": -7.243096351623535, "global_step": 187766, "epoch": 4470} {"train_loss": -7.133218765258789, "global_step": 187767, "epoch": 4470} {"train_loss": -6.960114002227783, "global_step": 187768, "epoch": 4470} {"train_loss": -7.1380085945129395, "global_step": 187769, "epoch": 4470} {"train_loss": -6.945635795593262, "global_step": 187770, "epoch": 4470} {"train_loss": -6.898418426513672, "global_step": 187771, "epoch": 4470} {"train_loss": -7.079401969909668, "global_step": 187772, "epoch": 4470} {"train_loss": -7.06257438659668, "global_step": 187773, "epoch": 4470} {"train_loss": -7.020750522613525, "global_step": 187774, "epoch": 4470} {"train_loss": -7.039124011993408, "global_step": 187775, "epoch": 4470} {"train_loss": -6.924813747406006, "global_step": 187776, "epoch": 4470} {"train_loss": -7.016464710235596, "global_step": 187777, "epoch": 4470} {"train_loss": -6.849515438079834, "global_step": 187778, "epoch": 4470} {"train_loss": -6.948746681213379, "global_step": 187779, "epoch": 4470} {"train_loss": -6.983954906463623, "global_step": 187780, "epoch": 4470} {"train_loss": -7.126117274874733, "global_step": 187781, "epoch": 4470, "val_loss": 69424.390625} {"train_loss": -7.040668964385986, "global_step": 187782, "epoch": 4471} {"train_loss": -7.009559631347656, "global_step": 187783, "epoch": 4471} {"train_loss": -7.078734874725342, "global_step": 187784, "epoch": 4471} {"train_loss": -6.968743324279785, "global_step": 187785, "epoch": 4471} {"train_loss": -7.051059722900391, "global_step": 187786, "epoch": 4471} {"train_loss": -7.12600564956665, "global_step": 187787, "epoch": 4471} {"train_loss": -7.057997703552246, "global_step": 187788, "epoch": 4471} {"train_loss": -7.167121410369873, "global_step": 187789, "epoch": 4471} {"train_loss": -7.115053176879883, "global_step": 187790, "epoch": 4471} {"train_loss": -7.051318168640137, "global_step": 187791, "epoch": 4471} {"train_loss": -7.153964996337891, "global_step": 187792, "epoch": 4471} {"train_loss": -7.113474369049072, "global_step": 187793, "epoch": 4471} {"train_loss": -7.076125144958496, "global_step": 187794, "epoch": 4471} {"train_loss": -7.0118536949157715, "global_step": 187795, "epoch": 4471} {"train_loss": -7.054225921630859, "global_step": 187796, "epoch": 4471} {"train_loss": -7.095102310180664, "global_step": 187797, "epoch": 4471} {"train_loss": -7.254489898681641, "global_step": 187798, "epoch": 4471} {"train_loss": -7.141188621520996, "global_step": 187799, "epoch": 4471} {"train_loss": -7.212020397186279, "global_step": 187800, "epoch": 4471} {"train_loss": -7.194919586181641, "global_step": 187801, "epoch": 4471} {"train_loss": -7.226805210113525, "global_step": 187802, "epoch": 4471} {"train_loss": -7.204314231872559, "global_step": 187803, "epoch": 4471} {"train_loss": -7.013799667358398, "global_step": 187804, "epoch": 4471} {"train_loss": -7.275254249572754, "global_step": 187805, "epoch": 4471} {"train_loss": -7.130758285522461, "global_step": 187806, "epoch": 4471} {"train_loss": -7.079624176025391, "global_step": 187807, "epoch": 4471} {"train_loss": -7.189169883728027, "global_step": 187808, "epoch": 4471} {"train_loss": -7.097024917602539, "global_step": 187809, "epoch": 4471} {"train_loss": -7.097352981567383, "global_step": 187810, "epoch": 4471} {"train_loss": -7.1750664710998535, "global_step": 187811, "epoch": 4471} {"train_loss": -7.188589572906494, "global_step": 187812, "epoch": 4471} {"train_loss": -7.169349670410156, "global_step": 187813, "epoch": 4471} {"train_loss": -7.144585132598877, "global_step": 187814, "epoch": 4471} {"train_loss": -7.118661880493164, "global_step": 187815, "epoch": 4471} {"train_loss": -7.123695373535156, "global_step": 187816, "epoch": 4471} {"train_loss": -7.224039554595947, "global_step": 187817, "epoch": 4471} {"train_loss": -7.093565464019775, "global_step": 187818, "epoch": 4471} {"train_loss": -7.078200340270996, "global_step": 187819, "epoch": 4471} {"train_loss": -7.248725414276123, "global_step": 187820, "epoch": 4471} {"train_loss": -7.135262489318848, "global_step": 187821, "epoch": 4471} {"train_loss": -7.235997200012207, "global_step": 187822, "epoch": 4471} {"train_loss": -7.126011360259283, "global_step": 187823, "epoch": 4471, "val_loss": 69470.5859375} {"train_loss": -7.351537227630615, "global_step": 187824, "epoch": 4472} {"train_loss": -7.153098106384277, "global_step": 187825, "epoch": 4472} {"train_loss": -7.09929084777832, "global_step": 187826, "epoch": 4472} {"train_loss": -7.169873237609863, "global_step": 187827, "epoch": 4472} {"train_loss": -7.110884189605713, "global_step": 187828, "epoch": 4472} {"train_loss": -7.064431667327881, "global_step": 187829, "epoch": 4472} {"train_loss": -7.195507049560547, "global_step": 187830, "epoch": 4472} {"train_loss": -7.136661529541016, "global_step": 187831, "epoch": 4472} {"train_loss": -7.104772567749023, "global_step": 187832, "epoch": 4472} {"train_loss": -7.273704528808594, "global_step": 187833, "epoch": 4472} {"train_loss": -7.102900981903076, "global_step": 187834, "epoch": 4472} {"train_loss": -7.227972984313965, "global_step": 187835, "epoch": 4472} {"train_loss": -7.158927917480469, "global_step": 187836, "epoch": 4472} {"train_loss": -7.18878173828125, "global_step": 187837, "epoch": 4472} {"train_loss": -7.2465620040893555, "global_step": 187838, "epoch": 4472} {"train_loss": -7.280068397521973, "global_step": 187839, "epoch": 4472} {"train_loss": -7.2191033363342285, "global_step": 187840, "epoch": 4472} {"train_loss": -7.12192440032959, "global_step": 187841, "epoch": 4472} {"train_loss": -7.220685958862305, "global_step": 187842, "epoch": 4472} {"train_loss": -7.0956220626831055, "global_step": 187843, "epoch": 4472} {"train_loss": -7.105883598327637, "global_step": 187844, "epoch": 4472} {"train_loss": -7.178125381469727, "global_step": 187845, "epoch": 4472} {"train_loss": -7.172758102416992, "global_step": 187846, "epoch": 4472} {"train_loss": -7.134039402008057, "global_step": 187847, "epoch": 4472} {"train_loss": -7.239175319671631, "global_step": 187848, "epoch": 4472} {"train_loss": -7.1228227615356445, "global_step": 187849, "epoch": 4472} {"train_loss": -7.0235395431518555, "global_step": 187850, "epoch": 4472} {"train_loss": -7.069269180297852, "global_step": 187851, "epoch": 4472} {"train_loss": -7.263186454772949, "global_step": 187852, "epoch": 4472} {"train_loss": -7.156522750854492, "global_step": 187853, "epoch": 4472} {"train_loss": -7.070524215698242, "global_step": 187854, "epoch": 4472} {"train_loss": -7.125444412231445, "global_step": 187855, "epoch": 4472} {"train_loss": -7.111127853393555, "global_step": 187856, "epoch": 4472} {"train_loss": -7.0835723876953125, "global_step": 187857, "epoch": 4472} {"train_loss": -7.188037872314453, "global_step": 187858, "epoch": 4472} {"train_loss": -7.08266544342041, "global_step": 187859, "epoch": 4472} {"train_loss": -7.067885398864746, "global_step": 187860, "epoch": 4472} {"train_loss": -7.026425361633301, "global_step": 187861, "epoch": 4472} {"train_loss": -7.070531845092773, "global_step": 187862, "epoch": 4472} {"train_loss": -7.090507507324219, "global_step": 187863, "epoch": 4472} {"train_loss": -7.133588790893555, "global_step": 187864, "epoch": 4472} {"train_loss": -7.1492632911318825, "global_step": 187865, "epoch": 4472, "val_loss": 69710.8125} {"train_loss": -7.207920074462891, "global_step": 187866, "epoch": 4473} {"train_loss": -7.119675636291504, "global_step": 187867, "epoch": 4473} {"train_loss": -7.27264928817749, "global_step": 187868, "epoch": 4473} {"train_loss": -7.174285411834717, "global_step": 187869, "epoch": 4473} {"train_loss": -7.155569076538086, "global_step": 187870, "epoch": 4473} {"train_loss": -7.246569633483887, "global_step": 187871, "epoch": 4473} {"train_loss": -7.177670001983643, "global_step": 187872, "epoch": 4473} {"train_loss": -7.187018871307373, "global_step": 187873, "epoch": 4473} {"train_loss": -7.190296173095703, "global_step": 187874, "epoch": 4473} {"train_loss": -7.113900184631348, "global_step": 187875, "epoch": 4473} {"train_loss": -7.0605854988098145, "global_step": 187876, "epoch": 4473} {"train_loss": -7.173467636108398, "global_step": 187877, "epoch": 4473} {"train_loss": -7.123989105224609, "global_step": 187878, "epoch": 4473} {"train_loss": -7.212778091430664, "global_step": 187879, "epoch": 4473} {"train_loss": -7.089966773986816, "global_step": 187880, "epoch": 4473} {"train_loss": -7.023373603820801, "global_step": 187881, "epoch": 4473} {"train_loss": -7.1541852951049805, "global_step": 187882, "epoch": 4473} {"train_loss": -7.34065055847168, "global_step": 187883, "epoch": 4473} {"train_loss": -7.191572666168213, "global_step": 187884, "epoch": 4473} {"train_loss": -7.261050224304199, "global_step": 187885, "epoch": 4473} {"train_loss": -7.172645568847656, "global_step": 187886, "epoch": 4473} {"train_loss": -7.29397439956665, "global_step": 187887, "epoch": 4473} {"train_loss": -7.22576904296875, "global_step": 187888, "epoch": 4473} {"train_loss": -7.104207992553711, "global_step": 187889, "epoch": 4473} {"train_loss": -7.097784042358398, "global_step": 187890, "epoch": 4473} {"train_loss": -7.171571731567383, "global_step": 187891, "epoch": 4473} {"train_loss": -7.176916122436523, "global_step": 187892, "epoch": 4473} {"train_loss": -7.012686252593994, "global_step": 187893, "epoch": 4473} {"train_loss": -7.030440330505371, "global_step": 187894, "epoch": 4473} {"train_loss": -7.283109188079834, "global_step": 187895, "epoch": 4473} {"train_loss": -7.123035907745361, "global_step": 187896, "epoch": 4473} {"train_loss": -7.202545642852783, "global_step": 187897, "epoch": 4473} {"train_loss": -7.231741905212402, "global_step": 187898, "epoch": 4473} {"train_loss": -7.071455001831055, "global_step": 187899, "epoch": 4473} {"train_loss": -7.196805000305176, "global_step": 187900, "epoch": 4473} {"train_loss": -7.167266845703125, "global_step": 187901, "epoch": 4473} {"train_loss": -7.222878456115723, "global_step": 187902, "epoch": 4473} {"train_loss": -7.2651824951171875, "global_step": 187903, "epoch": 4473} {"train_loss": -7.293751239776611, "global_step": 187904, "epoch": 4473} {"train_loss": -7.150347709655762, "global_step": 187905, "epoch": 4473} {"train_loss": -7.181609630584717, "global_step": 187906, "epoch": 4473} {"train_loss": -7.17594145593189, "global_step": 187907, "epoch": 4473, "val_loss": 69522.40625} {"train_loss": -7.198432922363281, "global_step": 187908, "epoch": 4474} {"train_loss": -7.198991775512695, "global_step": 187909, "epoch": 4474} {"train_loss": -7.172360897064209, "global_step": 187910, "epoch": 4474} {"train_loss": -7.281257629394531, "global_step": 187911, "epoch": 4474} {"train_loss": -7.257734298706055, "global_step": 187912, "epoch": 4474} {"train_loss": -7.261618137359619, "global_step": 187913, "epoch": 4474} {"train_loss": -7.257094383239746, "global_step": 187914, "epoch": 4474} {"train_loss": -7.207464218139648, "global_step": 187915, "epoch": 4474} {"train_loss": -7.200604438781738, "global_step": 187916, "epoch": 4474} {"train_loss": -7.177577018737793, "global_step": 187917, "epoch": 4474} {"train_loss": -7.2187347412109375, "global_step": 187918, "epoch": 4474} {"train_loss": -7.20736837387085, "global_step": 187919, "epoch": 4474} {"train_loss": -7.107049465179443, "global_step": 187920, "epoch": 4474} {"train_loss": -7.258481502532959, "global_step": 187921, "epoch": 4474} {"train_loss": -7.25788688659668, "global_step": 187922, "epoch": 4474} {"train_loss": -7.195355415344238, "global_step": 187923, "epoch": 4474} {"train_loss": -7.216485023498535, "global_step": 187924, "epoch": 4474} {"train_loss": -7.181703567504883, "global_step": 187925, "epoch": 4474} {"train_loss": -7.212520599365234, "global_step": 187926, "epoch": 4474} {"train_loss": -7.144133567810059, "global_step": 187927, "epoch": 4474} {"train_loss": -7.333576679229736, "global_step": 187928, "epoch": 4474} {"train_loss": -7.190325736999512, "global_step": 187929, "epoch": 4474} {"train_loss": -7.224127769470215, "global_step": 187930, "epoch": 4474} {"train_loss": -7.21284294128418, "global_step": 187931, "epoch": 4474} {"train_loss": -7.177989959716797, "global_step": 187932, "epoch": 4474} {"train_loss": -7.310208320617676, "global_step": 187933, "epoch": 4474} {"train_loss": -7.282713413238525, "global_step": 187934, "epoch": 4474} {"train_loss": -7.33398962020874, "global_step": 187935, "epoch": 4474} {"train_loss": -7.157692909240723, "global_step": 187936, "epoch": 4474} {"train_loss": -7.346606731414795, "global_step": 187937, "epoch": 4474} {"train_loss": -7.202053070068359, "global_step": 187938, "epoch": 4474} {"train_loss": -7.30855655670166, "global_step": 187939, "epoch": 4474} {"train_loss": -7.299437522888184, "global_step": 187940, "epoch": 4474} {"train_loss": -7.21354866027832, "global_step": 187941, "epoch": 4474} {"train_loss": -7.252766132354736, "global_step": 187942, "epoch": 4474} {"train_loss": -7.1269378662109375, "global_step": 187943, "epoch": 4474} {"train_loss": -7.270654678344727, "global_step": 187944, "epoch": 4474} {"train_loss": -7.1335577964782715, "global_step": 187945, "epoch": 4474} {"train_loss": -7.285710334777832, "global_step": 187946, "epoch": 4474} {"train_loss": -7.140838623046875, "global_step": 187947, "epoch": 4474} {"train_loss": -7.13580322265625, "global_step": 187948, "epoch": 4474} {"train_loss": -7.221204383032663, "global_step": 187949, "epoch": 4474, "val_loss": 69615.9609375} {"train_loss": -7.267440319061279, "global_step": 187950, "epoch": 4475} {"train_loss": -7.1656084060668945, "global_step": 187951, "epoch": 4475} {"train_loss": -7.265420436859131, "global_step": 187952, "epoch": 4475} {"train_loss": -7.371286869049072, "global_step": 187953, "epoch": 4475} {"train_loss": -7.331230163574219, "global_step": 187954, "epoch": 4475} {"train_loss": -7.151127815246582, "global_step": 187955, "epoch": 4475} {"train_loss": -7.144515037536621, "global_step": 187956, "epoch": 4475} {"train_loss": -7.270753860473633, "global_step": 187957, "epoch": 4475} {"train_loss": -7.277504920959473, "global_step": 187958, "epoch": 4475} {"train_loss": -7.20789909362793, "global_step": 187959, "epoch": 4475} {"train_loss": -7.248978614807129, "global_step": 187960, "epoch": 4475} {"train_loss": -7.230267524719238, "global_step": 187961, "epoch": 4475} {"train_loss": -7.211345672607422, "global_step": 187962, "epoch": 4475} {"train_loss": -7.140783309936523, "global_step": 187963, "epoch": 4475} {"train_loss": -7.25095272064209, "global_step": 187964, "epoch": 4475} {"train_loss": -7.217781066894531, "global_step": 187965, "epoch": 4475} {"train_loss": -7.277535438537598, "global_step": 187966, "epoch": 4475} {"train_loss": -7.231034278869629, "global_step": 187967, "epoch": 4475} {"train_loss": -7.255068302154541, "global_step": 187968, "epoch": 4475} {"train_loss": -7.154150009155273, "global_step": 187969, "epoch": 4475} {"train_loss": -7.27485466003418, "global_step": 187970, "epoch": 4475} {"train_loss": -7.170061111450195, "global_step": 187971, "epoch": 4475} {"train_loss": -7.19526481628418, "global_step": 187972, "epoch": 4475} {"train_loss": -7.213185787200928, "global_step": 187973, "epoch": 4475} {"train_loss": -7.180656433105469, "global_step": 187974, "epoch": 4475} {"train_loss": -7.2398529052734375, "global_step": 187975, "epoch": 4475} {"train_loss": -7.279632568359375, "global_step": 187976, "epoch": 4475} {"train_loss": -7.257773399353027, "global_step": 187977, "epoch": 4475} {"train_loss": -7.176671028137207, "global_step": 187978, "epoch": 4475} {"train_loss": -7.237926006317139, "global_step": 187979, "epoch": 4475} {"train_loss": -7.1362810134887695, "global_step": 187980, "epoch": 4475} {"train_loss": -7.171677589416504, "global_step": 187981, "epoch": 4475} {"train_loss": -7.13714599609375, "global_step": 187982, "epoch": 4475} {"train_loss": -7.156649589538574, "global_step": 187983, "epoch": 4475} {"train_loss": -7.204805374145508, "global_step": 187984, "epoch": 4475} {"train_loss": -7.075098037719727, "global_step": 187985, "epoch": 4475} {"train_loss": -7.196174621582031, "global_step": 187986, "epoch": 4475} {"train_loss": -7.223594665527344, "global_step": 187987, "epoch": 4475} {"train_loss": -6.9921040534973145, "global_step": 187988, "epoch": 4475} {"train_loss": -7.17008638381958, "global_step": 187989, "epoch": 4475} {"train_loss": -7.051419734954834, "global_step": 187990, "epoch": 4475} {"train_loss": -7.198061341331119, "global_step": 187991, "epoch": 4475, "val_loss": 69505.96875} {"train_loss": -7.064927101135254, "global_step": 187992, "epoch": 4476} {"train_loss": -7.126461029052734, "global_step": 187993, "epoch": 4476} {"train_loss": -7.006969928741455, "global_step": 187994, "epoch": 4476} {"train_loss": -7.173114776611328, "global_step": 187995, "epoch": 4476} {"train_loss": -7.1029815673828125, "global_step": 187996, "epoch": 4476} {"train_loss": -7.099758148193359, "global_step": 187997, "epoch": 4476} {"train_loss": -7.2109375, "global_step": 187998, "epoch": 4476} {"train_loss": -7.039062976837158, "global_step": 187999, "epoch": 4476} {"train_loss": -7.1534271240234375, "global_step": 188000, "epoch": 4476} {"train_loss": -7.069589614868164, "global_step": 188001, "epoch": 4476} {"train_loss": -7.0648393630981445, "global_step": 188002, "epoch": 4476} {"train_loss": -7.114706516265869, "global_step": 188003, "epoch": 4476} {"train_loss": -7.185201644897461, "global_step": 188004, "epoch": 4476} {"train_loss": -7.179836750030518, "global_step": 188005, "epoch": 4476} {"train_loss": -7.0625505447387695, "global_step": 188006, "epoch": 4476} {"train_loss": -7.251569747924805, "global_step": 188007, "epoch": 4476} {"train_loss": -7.235593795776367, "global_step": 188008, "epoch": 4476} {"train_loss": -7.175187110900879, "global_step": 188009, "epoch": 4476} {"train_loss": -7.207960605621338, "global_step": 188010, "epoch": 4476} {"train_loss": -7.267091274261475, "global_step": 188011, "epoch": 4476} {"train_loss": -7.2143168449401855, "global_step": 188012, "epoch": 4476} {"train_loss": -7.138176918029785, "global_step": 188013, "epoch": 4476} {"train_loss": -7.255402565002441, "global_step": 188014, "epoch": 4476} {"train_loss": -7.335371017456055, "global_step": 188015, "epoch": 4476} {"train_loss": -7.231206893920898, "global_step": 188016, "epoch": 4476} {"train_loss": -7.220309257507324, "global_step": 188017, "epoch": 4476} {"train_loss": -7.217055320739746, "global_step": 188018, "epoch": 4476} {"train_loss": -7.266812324523926, "global_step": 188019, "epoch": 4476} {"train_loss": -7.143376350402832, "global_step": 188020, "epoch": 4476} {"train_loss": -7.219478607177734, "global_step": 188021, "epoch": 4476} {"train_loss": -7.136719703674316, "global_step": 188022, "epoch": 4476} {"train_loss": -7.161235809326172, "global_step": 188023, "epoch": 4476} {"train_loss": -7.194807052612305, "global_step": 188024, "epoch": 4476} {"train_loss": -7.2572832107543945, "global_step": 188025, "epoch": 4476} {"train_loss": -7.239227294921875, "global_step": 188026, "epoch": 4476} {"train_loss": -7.078516960144043, "global_step": 188027, "epoch": 4476} {"train_loss": -7.166102409362793, "global_step": 188028, "epoch": 4476} {"train_loss": -7.0052080154418945, "global_step": 188029, "epoch": 4476} {"train_loss": -6.978498458862305, "global_step": 188030, "epoch": 4476} {"train_loss": -7.203023433685303, "global_step": 188031, "epoch": 4476} {"train_loss": -7.033870220184326, "global_step": 188032, "epoch": 4476} {"train_loss": -7.155639603024437, "global_step": 188033, "epoch": 4476, "val_loss": 69625.9921875} {"train_loss": -7.262709140777588, "global_step": 188034, "epoch": 4477} {"train_loss": -7.03165340423584, "global_step": 188035, "epoch": 4477} {"train_loss": -7.158141136169434, "global_step": 188036, "epoch": 4477} {"train_loss": -7.154574394226074, "global_step": 188037, "epoch": 4477} {"train_loss": -7.12095832824707, "global_step": 188038, "epoch": 4477} {"train_loss": -7.182636260986328, "global_step": 188039, "epoch": 4477} {"train_loss": -7.2594523429870605, "global_step": 188040, "epoch": 4477} {"train_loss": -7.125937461853027, "global_step": 188041, "epoch": 4477} {"train_loss": -7.144917011260986, "global_step": 188042, "epoch": 4477} {"train_loss": -7.158144474029541, "global_step": 188043, "epoch": 4477} {"train_loss": -7.143251895904541, "global_step": 188044, "epoch": 4477} {"train_loss": -7.218638896942139, "global_step": 188045, "epoch": 4477} {"train_loss": -7.183811187744141, "global_step": 188046, "epoch": 4477} {"train_loss": -7.159997940063477, "global_step": 188047, "epoch": 4477} {"train_loss": -7.144284725189209, "global_step": 188048, "epoch": 4477} {"train_loss": -7.036133289337158, "global_step": 188049, "epoch": 4477} {"train_loss": -7.108219146728516, "global_step": 188050, "epoch": 4477} {"train_loss": -7.254289627075195, "global_step": 188051, "epoch": 4477} {"train_loss": -7.048572540283203, "global_step": 188052, "epoch": 4477} {"train_loss": -7.114463806152344, "global_step": 188053, "epoch": 4477} {"train_loss": -7.070752143859863, "global_step": 188054, "epoch": 4477} {"train_loss": -7.178193092346191, "global_step": 188055, "epoch": 4477} {"train_loss": -7.087655067443848, "global_step": 188056, "epoch": 4477} {"train_loss": -7.121496677398682, "global_step": 188057, "epoch": 4477} {"train_loss": -7.159207820892334, "global_step": 188058, "epoch": 4477} {"train_loss": -7.038243293762207, "global_step": 188059, "epoch": 4477} {"train_loss": -7.138706207275391, "global_step": 188060, "epoch": 4477} {"train_loss": -7.169921875, "global_step": 188061, "epoch": 4477} {"train_loss": -7.181199073791504, "global_step": 188062, "epoch": 4477} {"train_loss": -7.049482345581055, "global_step": 188063, "epoch": 4477} {"train_loss": -7.144868850708008, "global_step": 188064, "epoch": 4477} {"train_loss": -7.044076919555664, "global_step": 188065, "epoch": 4477} {"train_loss": -7.162562370300293, "global_step": 188066, "epoch": 4477} {"train_loss": -7.162781238555908, "global_step": 188067, "epoch": 4477} {"train_loss": -7.068030834197998, "global_step": 188068, "epoch": 4477} {"train_loss": -7.133324146270752, "global_step": 188069, "epoch": 4477} {"train_loss": -7.214014053344727, "global_step": 188070, "epoch": 4477} {"train_loss": -7.154906749725342, "global_step": 188071, "epoch": 4477} {"train_loss": -7.038532257080078, "global_step": 188072, "epoch": 4477} {"train_loss": -7.154060363769531, "global_step": 188073, "epoch": 4477} {"train_loss": -7.165586948394775, "global_step": 188074, "epoch": 4477} {"train_loss": -7.139353218532744, "global_step": 188075, "epoch": 4477, "val_loss": 69424.484375} {"train_loss": -7.178073406219482, "global_step": 188076, "epoch": 4478} {"train_loss": -7.179986000061035, "global_step": 188077, "epoch": 4478} {"train_loss": -7.183588027954102, "global_step": 188078, "epoch": 4478} {"train_loss": -7.175805568695068, "global_step": 188079, "epoch": 4478} {"train_loss": -7.2050275802612305, "global_step": 188080, "epoch": 4478} {"train_loss": -7.248467445373535, "global_step": 188081, "epoch": 4478} {"train_loss": -7.195612907409668, "global_step": 188082, "epoch": 4478} {"train_loss": -7.243886470794678, "global_step": 188083, "epoch": 4478} {"train_loss": -7.276205062866211, "global_step": 188084, "epoch": 4478} {"train_loss": -7.188624382019043, "global_step": 188085, "epoch": 4478} {"train_loss": -7.195287704467773, "global_step": 188086, "epoch": 4478} {"train_loss": -7.252270698547363, "global_step": 188087, "epoch": 4478} {"train_loss": -7.263411998748779, "global_step": 188088, "epoch": 4478} {"train_loss": -7.2318925857543945, "global_step": 188089, "epoch": 4478} {"train_loss": -7.205981731414795, "global_step": 188090, "epoch": 4478} {"train_loss": -7.306013584136963, "global_step": 188091, "epoch": 4478} {"train_loss": -7.203582763671875, "global_step": 188092, "epoch": 4478} {"train_loss": -7.261535167694092, "global_step": 188093, "epoch": 4478} {"train_loss": -7.2075653076171875, "global_step": 188094, "epoch": 4478} {"train_loss": -7.215211868286133, "global_step": 188095, "epoch": 4478} {"train_loss": -7.247040271759033, "global_step": 188096, "epoch": 4478} {"train_loss": -7.193115711212158, "global_step": 188097, "epoch": 4478} {"train_loss": -7.203088283538818, "global_step": 188098, "epoch": 4478} {"train_loss": -7.203925132751465, "global_step": 188099, "epoch": 4478} {"train_loss": -7.110530853271484, "global_step": 188100, "epoch": 4478} {"train_loss": -7.347109794616699, "global_step": 188101, "epoch": 4478} {"train_loss": -7.140502452850342, "global_step": 188102, "epoch": 4478} {"train_loss": -7.069801330566406, "global_step": 188103, "epoch": 4478} {"train_loss": -7.2829270362854, "global_step": 188104, "epoch": 4478} {"train_loss": -7.183626174926758, "global_step": 188105, "epoch": 4478} {"train_loss": -7.176579475402832, "global_step": 188106, "epoch": 4478} {"train_loss": -7.263189792633057, "global_step": 188107, "epoch": 4478} {"train_loss": -7.188390731811523, "global_step": 188108, "epoch": 4478} {"train_loss": -7.244471549987793, "global_step": 188109, "epoch": 4478} {"train_loss": -7.161635875701904, "global_step": 188110, "epoch": 4478} {"train_loss": -7.196435928344727, "global_step": 188111, "epoch": 4478} {"train_loss": -7.180084705352783, "global_step": 188112, "epoch": 4478} {"train_loss": -7.330224990844727, "global_step": 188113, "epoch": 4478} {"train_loss": -7.265754222869873, "global_step": 188114, "epoch": 4478} {"train_loss": -7.165395259857178, "global_step": 188115, "epoch": 4478} {"train_loss": -7.105413436889648, "global_step": 188116, "epoch": 4478} {"train_loss": -7.213088796252296, "global_step": 188117, "epoch": 4478, "val_loss": 69634.375} {"train_loss": -6.96303653717041, "global_step": 188118, "epoch": 4479} {"train_loss": -7.2404069900512695, "global_step": 188119, "epoch": 4479} {"train_loss": -7.1521196365356445, "global_step": 188120, "epoch": 4479} {"train_loss": -7.089733123779297, "global_step": 188121, "epoch": 4479} {"train_loss": -7.159383773803711, "global_step": 188122, "epoch": 4479} {"train_loss": -7.25208854675293, "global_step": 188123, "epoch": 4479} {"train_loss": -7.1506853103637695, "global_step": 188124, "epoch": 4479} {"train_loss": -7.222413063049316, "global_step": 188125, "epoch": 4479} {"train_loss": -7.109999179840088, "global_step": 188126, "epoch": 4479} {"train_loss": -7.104832649230957, "global_step": 188127, "epoch": 4479} {"train_loss": -7.307389259338379, "global_step": 188128, "epoch": 4479} {"train_loss": -7.115303039550781, "global_step": 188129, "epoch": 4479} {"train_loss": -7.167867660522461, "global_step": 188130, "epoch": 4479} {"train_loss": -7.177148342132568, "global_step": 188131, "epoch": 4479} {"train_loss": -7.227077484130859, "global_step": 188132, "epoch": 4479} {"train_loss": -7.228636741638184, "global_step": 188133, "epoch": 4479} {"train_loss": -7.238222122192383, "global_step": 188134, "epoch": 4479} {"train_loss": -7.209685802459717, "global_step": 188135, "epoch": 4479} {"train_loss": -7.218591690063477, "global_step": 188136, "epoch": 4479} {"train_loss": -7.22841215133667, "global_step": 188137, "epoch": 4479} {"train_loss": -7.193769454956055, "global_step": 188138, "epoch": 4479} {"train_loss": -7.298589706420898, "global_step": 188139, "epoch": 4479} {"train_loss": -7.229586124420166, "global_step": 188140, "epoch": 4479} {"train_loss": -7.195064067840576, "global_step": 188141, "epoch": 4479} {"train_loss": -7.2324981689453125, "global_step": 188142, "epoch": 4479} {"train_loss": -7.070281982421875, "global_step": 188143, "epoch": 4479} {"train_loss": -7.127924919128418, "global_step": 188144, "epoch": 4479} {"train_loss": -7.164856433868408, "global_step": 188145, "epoch": 4479} {"train_loss": -7.0625762939453125, "global_step": 188146, "epoch": 4479} {"train_loss": -7.051308631896973, "global_step": 188147, "epoch": 4479} {"train_loss": -7.052734375, "global_step": 188148, "epoch": 4479} {"train_loss": -7.166923522949219, "global_step": 188149, "epoch": 4479} {"train_loss": -7.056649684906006, "global_step": 188150, "epoch": 4479} {"train_loss": -7.1650614738464355, "global_step": 188151, "epoch": 4479} {"train_loss": -7.184106826782227, "global_step": 188152, "epoch": 4479} {"train_loss": -7.144579887390137, "global_step": 188153, "epoch": 4479} {"train_loss": -7.02341365814209, "global_step": 188154, "epoch": 4479} {"train_loss": -7.091102600097656, "global_step": 188155, "epoch": 4479} {"train_loss": -7.046937465667725, "global_step": 188156, "epoch": 4479} {"train_loss": -7.181017875671387, "global_step": 188157, "epoch": 4479} {"train_loss": -7.089670181274414, "global_step": 188158, "epoch": 4479} {"train_loss": -7.153823069163731, "global_step": 188159, "epoch": 4479, "val_loss": 69597.3671875} {"train_loss": -7.200579643249512, "global_step": 188160, "epoch": 4480} {"train_loss": -7.150014877319336, "global_step": 188161, "epoch": 4480} {"train_loss": -7.133936882019043, "global_step": 188162, "epoch": 4480} {"train_loss": -7.1042070388793945, "global_step": 188163, "epoch": 4480} {"train_loss": -7.248133659362793, "global_step": 188164, "epoch": 4480} {"train_loss": -7.18192720413208, "global_step": 188165, "epoch": 4480} {"train_loss": -7.0536789894104, "global_step": 188166, "epoch": 4480} {"train_loss": -7.159152030944824, "global_step": 188167, "epoch": 4480} {"train_loss": -7.100088119506836, "global_step": 188168, "epoch": 4480} {"train_loss": -7.270153522491455, "global_step": 188169, "epoch": 4480} {"train_loss": -7.125282287597656, "global_step": 188170, "epoch": 4480} {"train_loss": -7.179720878601074, "global_step": 188171, "epoch": 4480} {"train_loss": -7.133620262145996, "global_step": 188172, "epoch": 4480} {"train_loss": -7.197484970092773, "global_step": 188173, "epoch": 4480} {"train_loss": -7.137334823608398, "global_step": 188174, "epoch": 4480} {"train_loss": -7.143052101135254, "global_step": 188175, "epoch": 4480} {"train_loss": -7.181703090667725, "global_step": 188176, "epoch": 4480} {"train_loss": -7.097230434417725, "global_step": 188177, "epoch": 4480} {"train_loss": -7.128271579742432, "global_step": 188178, "epoch": 4480} {"train_loss": -7.150356292724609, "global_step": 188179, "epoch": 4480} {"train_loss": -7.196252822875977, "global_step": 188180, "epoch": 4480} {"train_loss": -7.185212135314941, "global_step": 188181, "epoch": 4480} {"train_loss": -7.13502311706543, "global_step": 188182, "epoch": 4480} {"train_loss": -7.284493446350098, "global_step": 188183, "epoch": 4480} {"train_loss": -7.26417875289917, "global_step": 188184, "epoch": 4480} {"train_loss": -7.121294021606445, "global_step": 188185, "epoch": 4480} {"train_loss": -7.106389999389648, "global_step": 188186, "epoch": 4480} {"train_loss": -7.051419258117676, "global_step": 188187, "epoch": 4480} {"train_loss": -7.230230808258057, "global_step": 188188, "epoch": 4480} {"train_loss": -7.219374656677246, "global_step": 188189, "epoch": 4480} {"train_loss": -7.225146770477295, "global_step": 188190, "epoch": 4480} {"train_loss": -7.303922176361084, "global_step": 188191, "epoch": 4480} {"train_loss": -7.205414295196533, "global_step": 188192, "epoch": 4480} {"train_loss": -7.134792327880859, "global_step": 188193, "epoch": 4480} {"train_loss": -7.26460599899292, "global_step": 188194, "epoch": 4480} {"train_loss": -7.099939346313477, "global_step": 188195, "epoch": 4480} {"train_loss": -7.197719573974609, "global_step": 188196, "epoch": 4480} {"train_loss": -7.173610687255859, "global_step": 188197, "epoch": 4480} {"train_loss": -7.139739990234375, "global_step": 188198, "epoch": 4480} {"train_loss": -7.137199401855469, "global_step": 188199, "epoch": 4480} {"train_loss": -7.11972188949585, "global_step": 188200, "epoch": 4480} {"train_loss": -7.168611583255586, "global_step": 188201, "epoch": 4480, "val_loss": 69576.265625} {"train_loss": -7.310182571411133, "global_step": 188202, "epoch": 4481} {"train_loss": -7.036139011383057, "global_step": 188203, "epoch": 4481} {"train_loss": -7.168036460876465, "global_step": 188204, "epoch": 4481} {"train_loss": -7.142573356628418, "global_step": 188205, "epoch": 4481} {"train_loss": -7.203946590423584, "global_step": 188206, "epoch": 4481} {"train_loss": -7.004037380218506, "global_step": 188207, "epoch": 4481} {"train_loss": -7.136449813842773, "global_step": 188208, "epoch": 4481} {"train_loss": -7.059516906738281, "global_step": 188209, "epoch": 4481} {"train_loss": -7.190860748291016, "global_step": 188210, "epoch": 4481} {"train_loss": -7.148242950439453, "global_step": 188211, "epoch": 4481} {"train_loss": -7.139969825744629, "global_step": 188212, "epoch": 4481} {"train_loss": -7.181793212890625, "global_step": 188213, "epoch": 4481} {"train_loss": -7.1316680908203125, "global_step": 188214, "epoch": 4481} {"train_loss": -7.263150215148926, "global_step": 188215, "epoch": 4481} {"train_loss": -7.2632246017456055, "global_step": 188216, "epoch": 4481} {"train_loss": -7.115248680114746, "global_step": 188217, "epoch": 4481} {"train_loss": -7.172679901123047, "global_step": 188218, "epoch": 4481} {"train_loss": -7.359697341918945, "global_step": 188219, "epoch": 4481} {"train_loss": -7.174911022186279, "global_step": 188220, "epoch": 4481} {"train_loss": -7.295339584350586, "global_step": 188221, "epoch": 4481} {"train_loss": -7.140002250671387, "global_step": 188222, "epoch": 4481} {"train_loss": -7.201811790466309, "global_step": 188223, "epoch": 4481} {"train_loss": -7.203901290893555, "global_step": 188224, "epoch": 4481} {"train_loss": -7.213802337646484, "global_step": 188225, "epoch": 4481} {"train_loss": -7.145160675048828, "global_step": 188226, "epoch": 4481} {"train_loss": -7.2032575607299805, "global_step": 188227, "epoch": 4481} {"train_loss": -7.129776954650879, "global_step": 188228, "epoch": 4481} {"train_loss": -7.236819267272949, "global_step": 188229, "epoch": 4481} {"train_loss": -7.253286838531494, "global_step": 188230, "epoch": 4481} {"train_loss": -7.156237602233887, "global_step": 188231, "epoch": 4481} {"train_loss": -7.197710990905762, "global_step": 188232, "epoch": 4481} {"train_loss": -7.230709075927734, "global_step": 188233, "epoch": 4481} {"train_loss": -7.201136112213135, "global_step": 188234, "epoch": 4481} {"train_loss": -7.116275787353516, "global_step": 188235, "epoch": 4481} {"train_loss": -7.240322113037109, "global_step": 188236, "epoch": 4481} {"train_loss": -7.068403244018555, "global_step": 188237, "epoch": 4481} {"train_loss": -7.058711051940918, "global_step": 188238, "epoch": 4481} {"train_loss": -7.234447956085205, "global_step": 188239, "epoch": 4481} {"train_loss": -6.875495433807373, "global_step": 188240, "epoch": 4481} {"train_loss": -7.07564640045166, "global_step": 188241, "epoch": 4481} {"train_loss": -7.197691917419434, "global_step": 188242, "epoch": 4481} {"train_loss": -7.161532640457153, "global_step": 188243, "epoch": 4481, "val_loss": 69452.078125} {"train_loss": -7.044818878173828, "global_step": 188244, "epoch": 4482} {"train_loss": -6.906572341918945, "global_step": 188245, "epoch": 4482} {"train_loss": -7.002881050109863, "global_step": 188246, "epoch": 4482} {"train_loss": -7.098045825958252, "global_step": 188247, "epoch": 4482} {"train_loss": -6.923218727111816, "global_step": 188248, "epoch": 4482} {"train_loss": -7.07244873046875, "global_step": 188249, "epoch": 4482} {"train_loss": -7.122742176055908, "global_step": 188250, "epoch": 4482} {"train_loss": -7.093056678771973, "global_step": 188251, "epoch": 4482} {"train_loss": -7.086345195770264, "global_step": 188252, "epoch": 4482} {"train_loss": -7.144735336303711, "global_step": 188253, "epoch": 4482} {"train_loss": -7.041994094848633, "global_step": 188254, "epoch": 4482} {"train_loss": -7.194984436035156, "global_step": 188255, "epoch": 4482} {"train_loss": -7.166728496551514, "global_step": 188256, "epoch": 4482} {"train_loss": -7.1492767333984375, "global_step": 188257, "epoch": 4482} {"train_loss": -7.154959678649902, "global_step": 188258, "epoch": 4482} {"train_loss": -7.091480255126953, "global_step": 188259, "epoch": 4482} {"train_loss": -7.165292739868164, "global_step": 188260, "epoch": 4482} {"train_loss": -7.110908508300781, "global_step": 188261, "epoch": 4482} {"train_loss": -7.062444686889648, "global_step": 188262, "epoch": 4482} {"train_loss": -7.065119743347168, "global_step": 188263, "epoch": 4482} {"train_loss": -7.056346893310547, "global_step": 188264, "epoch": 4482} {"train_loss": -7.118078708648682, "global_step": 188265, "epoch": 4482} {"train_loss": -7.299008369445801, "global_step": 188266, "epoch": 4482} {"train_loss": -7.12430477142334, "global_step": 188267, "epoch": 4482} {"train_loss": -7.125189781188965, "global_step": 188268, "epoch": 4482} {"train_loss": -7.285355567932129, "global_step": 188269, "epoch": 4482} {"train_loss": -7.135446548461914, "global_step": 188270, "epoch": 4482} {"train_loss": -7.213634490966797, "global_step": 188271, "epoch": 4482} {"train_loss": -7.112104415893555, "global_step": 188272, "epoch": 4482} {"train_loss": -7.133703231811523, "global_step": 188273, "epoch": 4482} {"train_loss": -7.168081283569336, "global_step": 188274, "epoch": 4482} {"train_loss": -7.239434242248535, "global_step": 188275, "epoch": 4482} {"train_loss": -7.154911041259766, "global_step": 188276, "epoch": 4482} {"train_loss": -7.28785514831543, "global_step": 188277, "epoch": 4482} {"train_loss": -7.099217414855957, "global_step": 188278, "epoch": 4482} {"train_loss": -7.103515625, "global_step": 188279, "epoch": 4482} {"train_loss": -7.198359489440918, "global_step": 188280, "epoch": 4482} {"train_loss": -7.229226589202881, "global_step": 188281, "epoch": 4482} {"train_loss": -7.22901725769043, "global_step": 188282, "epoch": 4482} {"train_loss": -7.269853591918945, "global_step": 188283, "epoch": 4482} {"train_loss": -7.17697811126709, "global_step": 188284, "epoch": 4482} {"train_loss": -7.136002438408988, "global_step": 188285, "epoch": 4482, "val_loss": 69436.2734375} {"train_loss": -7.320148468017578, "global_step": 188286, "epoch": 4483} {"train_loss": -7.236226558685303, "global_step": 188287, "epoch": 4483} {"train_loss": -7.247110366821289, "global_step": 188288, "epoch": 4483} {"train_loss": -7.200406074523926, "global_step": 188289, "epoch": 4483} {"train_loss": -7.197396278381348, "global_step": 188290, "epoch": 4483} {"train_loss": -7.163297176361084, "global_step": 188291, "epoch": 4483} {"train_loss": -7.154746055603027, "global_step": 188292, "epoch": 4483} {"train_loss": -7.221407890319824, "global_step": 188293, "epoch": 4483} {"train_loss": -7.1693339347839355, "global_step": 188294, "epoch": 4483} {"train_loss": -7.2432403564453125, "global_step": 188295, "epoch": 4483} {"train_loss": -7.209343910217285, "global_step": 188296, "epoch": 4483} {"train_loss": -7.290329933166504, "global_step": 188297, "epoch": 4483} {"train_loss": -7.084895133972168, "global_step": 188298, "epoch": 4483} {"train_loss": -7.219353675842285, "global_step": 188299, "epoch": 4483} {"train_loss": -7.345065593719482, "global_step": 188300, "epoch": 4483} {"train_loss": -7.265474319458008, "global_step": 188301, "epoch": 4483} {"train_loss": -7.2250213623046875, "global_step": 188302, "epoch": 4483} {"train_loss": -7.140219688415527, "global_step": 188303, "epoch": 4483} {"train_loss": -7.191323280334473, "global_step": 188304, "epoch": 4483} {"train_loss": -7.210646152496338, "global_step": 188305, "epoch": 4483} {"train_loss": -7.23056697845459, "global_step": 188306, "epoch": 4483} {"train_loss": -7.197412014007568, "global_step": 188307, "epoch": 4483} {"train_loss": -7.181200981140137, "global_step": 188308, "epoch": 4483} {"train_loss": -7.184030055999756, "global_step": 188309, "epoch": 4483} {"train_loss": -7.2346954345703125, "global_step": 188310, "epoch": 4483} {"train_loss": -7.091418743133545, "global_step": 188311, "epoch": 4483} {"train_loss": -7.274252891540527, "global_step": 188312, "epoch": 4483} {"train_loss": -7.260340213775635, "global_step": 188313, "epoch": 4483} {"train_loss": -7.06136417388916, "global_step": 188314, "epoch": 4483} {"train_loss": -7.2911882400512695, "global_step": 188315, "epoch": 4483} {"train_loss": -7.167147636413574, "global_step": 188316, "epoch": 4483} {"train_loss": -7.083858013153076, "global_step": 188317, "epoch": 4483} {"train_loss": -7.216366767883301, "global_step": 188318, "epoch": 4483} {"train_loss": -7.135017395019531, "global_step": 188319, "epoch": 4483} {"train_loss": -7.167789936065674, "global_step": 188320, "epoch": 4483} {"train_loss": -7.2724504470825195, "global_step": 188321, "epoch": 4483} {"train_loss": -7.206643104553223, "global_step": 188322, "epoch": 4483} {"train_loss": -7.147523403167725, "global_step": 188323, "epoch": 4483} {"train_loss": -7.125012397766113, "global_step": 188324, "epoch": 4483} {"train_loss": -7.21931266784668, "global_step": 188325, "epoch": 4483} {"train_loss": -7.308719158172607, "global_step": 188326, "epoch": 4483} {"train_loss": -7.205001433690389, "global_step": 188327, "epoch": 4483, "val_loss": 69352.8359375} {"train_loss": -7.237225532531738, "global_step": 188328, "epoch": 4484} {"train_loss": -7.268671989440918, "global_step": 188329, "epoch": 4484} {"train_loss": -7.164222717285156, "global_step": 188330, "epoch": 4484} {"train_loss": -7.228715896606445, "global_step": 188331, "epoch": 4484} {"train_loss": -7.258913040161133, "global_step": 188332, "epoch": 4484} {"train_loss": -7.246851921081543, "global_step": 188333, "epoch": 4484} {"train_loss": -7.10914421081543, "global_step": 188334, "epoch": 4484} {"train_loss": -6.989425182342529, "global_step": 188335, "epoch": 4484} {"train_loss": -7.1006388664245605, "global_step": 188336, "epoch": 4484} {"train_loss": -7.137115478515625, "global_step": 188337, "epoch": 4484} {"train_loss": -7.126725673675537, "global_step": 188338, "epoch": 4484} {"train_loss": -7.108504295349121, "global_step": 188339, "epoch": 4484} {"train_loss": -7.162590026855469, "global_step": 188340, "epoch": 4484} {"train_loss": -7.225282669067383, "global_step": 188341, "epoch": 4484} {"train_loss": -7.197700500488281, "global_step": 188342, "epoch": 4484} {"train_loss": -7.037509918212891, "global_step": 188343, "epoch": 4484} {"train_loss": -7.3230299949646, "global_step": 188344, "epoch": 4484} {"train_loss": -7.1683549880981445, "global_step": 188345, "epoch": 4484} {"train_loss": -7.116735458374023, "global_step": 188346, "epoch": 4484} {"train_loss": -7.202093601226807, "global_step": 188347, "epoch": 4484} {"train_loss": -7.175370216369629, "global_step": 188348, "epoch": 4484} {"train_loss": -7.182356834411621, "global_step": 188349, "epoch": 4484} {"train_loss": -7.36808443069458, "global_step": 188350, "epoch": 4484} {"train_loss": -7.180527687072754, "global_step": 188351, "epoch": 4484} {"train_loss": -7.164529800415039, "global_step": 188352, "epoch": 4484} {"train_loss": -7.098964691162109, "global_step": 188353, "epoch": 4484} {"train_loss": -7.0975422859191895, "global_step": 188354, "epoch": 4484} {"train_loss": -7.276549816131592, "global_step": 188355, "epoch": 4484} {"train_loss": -7.170927047729492, "global_step": 188356, "epoch": 4484} {"train_loss": -7.147613525390625, "global_step": 188357, "epoch": 4484} {"train_loss": -7.352534294128418, "global_step": 188358, "epoch": 4484} {"train_loss": -7.263261318206787, "global_step": 188359, "epoch": 4484} {"train_loss": -7.247785568237305, "global_step": 188360, "epoch": 4484} {"train_loss": -7.141952991485596, "global_step": 188361, "epoch": 4484} {"train_loss": -7.074983596801758, "global_step": 188362, "epoch": 4484} {"train_loss": -7.10097599029541, "global_step": 188363, "epoch": 4484} {"train_loss": -7.186699390411377, "global_step": 188364, "epoch": 4484} {"train_loss": -7.280333995819092, "global_step": 188365, "epoch": 4484} {"train_loss": -7.137117862701416, "global_step": 188366, "epoch": 4484} {"train_loss": -7.223409652709961, "global_step": 188367, "epoch": 4484} {"train_loss": -6.999548435211182, "global_step": 188368, "epoch": 4484} {"train_loss": -7.173677887235369, "global_step": 188369, "epoch": 4484, "val_loss": 69363.3046875} {"train_loss": -7.043262004852295, "global_step": 188370, "epoch": 4485} {"train_loss": -7.138359546661377, "global_step": 188371, "epoch": 4485} {"train_loss": -6.9802751541137695, "global_step": 188372, "epoch": 4485} {"train_loss": -7.107114315032959, "global_step": 188373, "epoch": 4485} {"train_loss": -7.135168552398682, "global_step": 188374, "epoch": 4485} {"train_loss": -7.117497444152832, "global_step": 188375, "epoch": 4485} {"train_loss": -7.249738693237305, "global_step": 188376, "epoch": 4485} {"train_loss": -7.089345455169678, "global_step": 188377, "epoch": 4485} {"train_loss": -7.226061820983887, "global_step": 188378, "epoch": 4485} {"train_loss": -7.271028518676758, "global_step": 188379, "epoch": 4485} {"train_loss": -7.150120735168457, "global_step": 188380, "epoch": 4485} {"train_loss": -7.280717849731445, "global_step": 188381, "epoch": 4485} {"train_loss": -7.195065021514893, "global_step": 188382, "epoch": 4485} {"train_loss": -7.188580513000488, "global_step": 188383, "epoch": 4485} {"train_loss": -7.138647079467773, "global_step": 188384, "epoch": 4485} {"train_loss": -7.192681312561035, "global_step": 188385, "epoch": 4485} {"train_loss": -7.257454872131348, "global_step": 188386, "epoch": 4485} {"train_loss": -7.120298385620117, "global_step": 188387, "epoch": 4485} {"train_loss": -7.219976425170898, "global_step": 188388, "epoch": 4485} {"train_loss": -7.217935562133789, "global_step": 188389, "epoch": 4485} {"train_loss": -7.1448540687561035, "global_step": 188390, "epoch": 4485} {"train_loss": -7.172767162322998, "global_step": 188391, "epoch": 4485} {"train_loss": -7.282662391662598, "global_step": 188392, "epoch": 4485} {"train_loss": -7.275175094604492, "global_step": 188393, "epoch": 4485} {"train_loss": -7.170482635498047, "global_step": 188394, "epoch": 4485} {"train_loss": -6.904285430908203, "global_step": 188395, "epoch": 4485} {"train_loss": -7.034775257110596, "global_step": 188396, "epoch": 4485} {"train_loss": -7.105438232421875, "global_step": 188397, "epoch": 4485} {"train_loss": -7.1893768310546875, "global_step": 188398, "epoch": 4485} {"train_loss": -7.001401424407959, "global_step": 188399, "epoch": 4485} {"train_loss": -7.174943447113037, "global_step": 188400, "epoch": 4485} {"train_loss": -7.1650848388671875, "global_step": 188401, "epoch": 4485} {"train_loss": -7.139634132385254, "global_step": 188402, "epoch": 4485} {"train_loss": -7.157464027404785, "global_step": 188403, "epoch": 4485} {"train_loss": -7.200267314910889, "global_step": 188404, "epoch": 4485} {"train_loss": -7.203791618347168, "global_step": 188405, "epoch": 4485} {"train_loss": -7.107069492340088, "global_step": 188406, "epoch": 4485} {"train_loss": -7.139328956604004, "global_step": 188407, "epoch": 4485} {"train_loss": -7.183298110961914, "global_step": 188408, "epoch": 4485} {"train_loss": -7.221953868865967, "global_step": 188409, "epoch": 4485} {"train_loss": -6.94778299331665, "global_step": 188410, "epoch": 4485} {"train_loss": -7.151823111942837, "global_step": 188411, "epoch": 4485, "val_loss": 69582.171875} {"train_loss": -7.155004501342773, "global_step": 188412, "epoch": 4486} {"train_loss": -7.1166486740112305, "global_step": 188413, "epoch": 4486} {"train_loss": -7.146852493286133, "global_step": 188414, "epoch": 4486} {"train_loss": -7.185527324676514, "global_step": 188415, "epoch": 4486} {"train_loss": -7.1522393226623535, "global_step": 188416, "epoch": 4486} {"train_loss": -7.1535515785217285, "global_step": 188417, "epoch": 4486} {"train_loss": -7.093280792236328, "global_step": 188418, "epoch": 4486} {"train_loss": -7.211490631103516, "global_step": 188419, "epoch": 4486} {"train_loss": -7.123340129852295, "global_step": 188420, "epoch": 4486} {"train_loss": -7.158248424530029, "global_step": 188421, "epoch": 4486} {"train_loss": -7.230855941772461, "global_step": 188422, "epoch": 4486} {"train_loss": -7.219398498535156, "global_step": 188423, "epoch": 4486} {"train_loss": -7.105831623077393, "global_step": 188424, "epoch": 4486} {"train_loss": -7.165562629699707, "global_step": 188425, "epoch": 4486} {"train_loss": -7.276495933532715, "global_step": 188426, "epoch": 4486} {"train_loss": -7.1873955726623535, "global_step": 188427, "epoch": 4486} {"train_loss": -7.225317478179932, "global_step": 188428, "epoch": 4486} {"train_loss": -7.194646835327148, "global_step": 188429, "epoch": 4486} {"train_loss": -7.149786472320557, "global_step": 188430, "epoch": 4486} {"train_loss": -7.2145891189575195, "global_step": 188431, "epoch": 4486} {"train_loss": -7.064143180847168, "global_step": 188432, "epoch": 4486} {"train_loss": -7.333955764770508, "global_step": 188433, "epoch": 4486} {"train_loss": -7.244623184204102, "global_step": 188434, "epoch": 4486} {"train_loss": -7.2676682472229, "global_step": 188435, "epoch": 4486} {"train_loss": -7.164695739746094, "global_step": 188436, "epoch": 4486} {"train_loss": -7.272439956665039, "global_step": 188437, "epoch": 4486} {"train_loss": -7.144283771514893, "global_step": 188438, "epoch": 4486} {"train_loss": -7.203118801116943, "global_step": 188439, "epoch": 4486} {"train_loss": -7.151712417602539, "global_step": 188440, "epoch": 4486} {"train_loss": -7.223618507385254, "global_step": 188441, "epoch": 4486} {"train_loss": -7.067643165588379, "global_step": 188442, "epoch": 4486} {"train_loss": -7.022680759429932, "global_step": 188443, "epoch": 4486} {"train_loss": -7.250638961791992, "global_step": 188444, "epoch": 4486} {"train_loss": -6.87221622467041, "global_step": 188445, "epoch": 4486} {"train_loss": -6.955483436584473, "global_step": 188446, "epoch": 4486} {"train_loss": -6.964602947235107, "global_step": 188447, "epoch": 4486} {"train_loss": -7.02915620803833, "global_step": 188448, "epoch": 4486} {"train_loss": -7.089646816253662, "global_step": 188449, "epoch": 4486} {"train_loss": -6.996039867401123, "global_step": 188450, "epoch": 4486} {"train_loss": -7.108962059020996, "global_step": 188451, "epoch": 4486} {"train_loss": -7.195072174072266, "global_step": 188452, "epoch": 4486} {"train_loss": -7.146016461508615, "global_step": 188453, "epoch": 4486, "val_loss": 69402.6015625} {"train_loss": -7.17391300201416, "global_step": 188454, "epoch": 4487} {"train_loss": -7.12093448638916, "global_step": 188455, "epoch": 4487} {"train_loss": -7.125231742858887, "global_step": 188456, "epoch": 4487} {"train_loss": -7.0597825050354, "global_step": 188457, "epoch": 4487} {"train_loss": -7.2209062576293945, "global_step": 188458, "epoch": 4487} {"train_loss": -7.192079544067383, "global_step": 188459, "epoch": 4487} {"train_loss": -7.091221809387207, "global_step": 188460, "epoch": 4487} {"train_loss": -7.232480049133301, "global_step": 188461, "epoch": 4487} {"train_loss": -7.133303642272949, "global_step": 188462, "epoch": 4487} {"train_loss": -7.12865686416626, "global_step": 188463, "epoch": 4487} {"train_loss": -7.092190742492676, "global_step": 188464, "epoch": 4487} {"train_loss": -7.198349952697754, "global_step": 188465, "epoch": 4487} {"train_loss": -7.272018909454346, "global_step": 188466, "epoch": 4487} {"train_loss": -7.330582618713379, "global_step": 188467, "epoch": 4487} {"train_loss": -7.137252330780029, "global_step": 188468, "epoch": 4487} {"train_loss": -7.208123207092285, "global_step": 188469, "epoch": 4487} {"train_loss": -7.2524261474609375, "global_step": 188470, "epoch": 4487} {"train_loss": -7.233190536499023, "global_step": 188471, "epoch": 4487} {"train_loss": -7.226877689361572, "global_step": 188472, "epoch": 4487} {"train_loss": -7.344052314758301, "global_step": 188473, "epoch": 4487} {"train_loss": -7.102817535400391, "global_step": 188474, "epoch": 4487} {"train_loss": -7.270487308502197, "global_step": 188475, "epoch": 4487} {"train_loss": -7.284074783325195, "global_step": 188476, "epoch": 4487} {"train_loss": -7.245511531829834, "global_step": 188477, "epoch": 4487} {"train_loss": -7.241703510284424, "global_step": 188478, "epoch": 4487} {"train_loss": -7.232257843017578, "global_step": 188479, "epoch": 4487} {"train_loss": -7.1639533042907715, "global_step": 188480, "epoch": 4487} {"train_loss": -7.162527561187744, "global_step": 188481, "epoch": 4487} {"train_loss": -7.140132904052734, "global_step": 188482, "epoch": 4487} {"train_loss": -7.119575500488281, "global_step": 188483, "epoch": 4487} {"train_loss": -7.216368675231934, "global_step": 188484, "epoch": 4487} {"train_loss": -7.13483190536499, "global_step": 188485, "epoch": 4487} {"train_loss": -7.213006019592285, "global_step": 188486, "epoch": 4487} {"train_loss": -7.287965774536133, "global_step": 188487, "epoch": 4487} {"train_loss": -7.042490005493164, "global_step": 188488, "epoch": 4487} {"train_loss": -7.036073207855225, "global_step": 188489, "epoch": 4487} {"train_loss": -7.202924728393555, "global_step": 188490, "epoch": 4487} {"train_loss": -7.13245964050293, "global_step": 188491, "epoch": 4487} {"train_loss": -7.040609836578369, "global_step": 188492, "epoch": 4487} {"train_loss": -7.10852575302124, "global_step": 188493, "epoch": 4487} {"train_loss": -7.021586894989014, "global_step": 188494, "epoch": 4487} {"train_loss": -7.174765007836478, "global_step": 188495, "epoch": 4487, "val_loss": 70031.7109375} {"train_loss": -7.089387893676758, "global_step": 188496, "epoch": 4488} {"train_loss": -7.167555809020996, "global_step": 188497, "epoch": 4488} {"train_loss": -7.1551899909973145, "global_step": 188498, "epoch": 4488} {"train_loss": -7.115589141845703, "global_step": 188499, "epoch": 4488} {"train_loss": -7.150517463684082, "global_step": 188500, "epoch": 4488} {"train_loss": -6.965809345245361, "global_step": 188501, "epoch": 4488} {"train_loss": -7.157621383666992, "global_step": 188502, "epoch": 4488} {"train_loss": -7.045804023742676, "global_step": 188503, "epoch": 4488} {"train_loss": -7.110213279724121, "global_step": 188504, "epoch": 4488} {"train_loss": -7.100381374359131, "global_step": 188505, "epoch": 4488} {"train_loss": -7.098545074462891, "global_step": 188506, "epoch": 4488} {"train_loss": -7.114853858947754, "global_step": 188507, "epoch": 4488} {"train_loss": -7.081370830535889, "global_step": 188508, "epoch": 4488} {"train_loss": -7.1349334716796875, "global_step": 188509, "epoch": 4488} {"train_loss": -7.130047798156738, "global_step": 188510, "epoch": 4488} {"train_loss": -7.065113067626953, "global_step": 188511, "epoch": 4488} {"train_loss": -7.050327301025391, "global_step": 188512, "epoch": 4488} {"train_loss": -7.124862194061279, "global_step": 188513, "epoch": 4488} {"train_loss": -7.153996467590332, "global_step": 188514, "epoch": 4488} {"train_loss": -7.048889636993408, "global_step": 188515, "epoch": 4488} {"train_loss": -7.113110065460205, "global_step": 188516, "epoch": 4488} {"train_loss": -7.148916244506836, "global_step": 188517, "epoch": 4488} {"train_loss": -7.04871940612793, "global_step": 188518, "epoch": 4488} {"train_loss": -7.217273712158203, "global_step": 188519, "epoch": 4488} {"train_loss": -7.031489372253418, "global_step": 188520, "epoch": 4488} {"train_loss": -7.273564338684082, "global_step": 188521, "epoch": 4488} {"train_loss": -7.140481472015381, "global_step": 188522, "epoch": 4488} {"train_loss": -7.213207721710205, "global_step": 188523, "epoch": 4488} {"train_loss": -7.18557596206665, "global_step": 188524, "epoch": 4488} {"train_loss": -7.186664581298828, "global_step": 188525, "epoch": 4488} {"train_loss": -7.104595184326172, "global_step": 188526, "epoch": 4488} {"train_loss": -7.144276142120361, "global_step": 188527, "epoch": 4488} {"train_loss": -7.2079010009765625, "global_step": 188528, "epoch": 4488} {"train_loss": -7.146653175354004, "global_step": 188529, "epoch": 4488} {"train_loss": -7.21036434173584, "global_step": 188530, "epoch": 4488} {"train_loss": -7.292764663696289, "global_step": 188531, "epoch": 4488} {"train_loss": -7.192756652832031, "global_step": 188532, "epoch": 4488} {"train_loss": -7.2361249923706055, "global_step": 188533, "epoch": 4488} {"train_loss": -7.283966064453125, "global_step": 188534, "epoch": 4488} {"train_loss": -7.2359466552734375, "global_step": 188535, "epoch": 4488} {"train_loss": -7.270718574523926, "global_step": 188536, "epoch": 4488} {"train_loss": -7.145533970424107, "global_step": 188537, "epoch": 4488, "val_loss": 69514.8359375} {"train_loss": -7.284707546234131, "global_step": 188538, "epoch": 4489} {"train_loss": -7.286257743835449, "global_step": 188539, "epoch": 4489} {"train_loss": -7.259800910949707, "global_step": 188540, "epoch": 4489} {"train_loss": -7.313996315002441, "global_step": 188541, "epoch": 4489} {"train_loss": -7.300276756286621, "global_step": 188542, "epoch": 4489} {"train_loss": -7.332727432250977, "global_step": 188543, "epoch": 4489} {"train_loss": -7.327592849731445, "global_step": 188544, "epoch": 4489} {"train_loss": -7.396224021911621, "global_step": 188545, "epoch": 4489} {"train_loss": -7.16826057434082, "global_step": 188546, "epoch": 4489} {"train_loss": -7.229208946228027, "global_step": 188547, "epoch": 4489} {"train_loss": -7.2773027420043945, "global_step": 188548, "epoch": 4489} {"train_loss": -7.199856758117676, "global_step": 188549, "epoch": 4489} {"train_loss": -7.185033798217773, "global_step": 188550, "epoch": 4489} {"train_loss": -7.1340227127075195, "global_step": 188551, "epoch": 4489} {"train_loss": -7.098268032073975, "global_step": 188552, "epoch": 4489} {"train_loss": -7.082719802856445, "global_step": 188553, "epoch": 4489} {"train_loss": -7.202428817749023, "global_step": 188554, "epoch": 4489} {"train_loss": -7.287569046020508, "global_step": 188555, "epoch": 4489} {"train_loss": -7.208700180053711, "global_step": 188556, "epoch": 4489} {"train_loss": -7.165563583374023, "global_step": 188557, "epoch": 4489} {"train_loss": -7.120887279510498, "global_step": 188558, "epoch": 4489} {"train_loss": -7.119467735290527, "global_step": 188559, "epoch": 4489} {"train_loss": -7.236050605773926, "global_step": 188560, "epoch": 4489} {"train_loss": -7.212865829467773, "global_step": 188561, "epoch": 4489} {"train_loss": -7.121284484863281, "global_step": 188562, "epoch": 4489} {"train_loss": -7.146627902984619, "global_step": 188563, "epoch": 4489} {"train_loss": -7.218064308166504, "global_step": 188564, "epoch": 4489} {"train_loss": -7.191257476806641, "global_step": 188565, "epoch": 4489} {"train_loss": -7.032379627227783, "global_step": 188566, "epoch": 4489} {"train_loss": -7.183450698852539, "global_step": 188567, "epoch": 4489} {"train_loss": -7.177257537841797, "global_step": 188568, "epoch": 4489} {"train_loss": -7.1378984451293945, "global_step": 188569, "epoch": 4489} {"train_loss": -7.100778579711914, "global_step": 188570, "epoch": 4489} {"train_loss": -7.282578945159912, "global_step": 188571, "epoch": 4489} {"train_loss": -7.298822402954102, "global_step": 188572, "epoch": 4489} {"train_loss": -7.150868892669678, "global_step": 188573, "epoch": 4489} {"train_loss": -7.149636745452881, "global_step": 188574, "epoch": 4489} {"train_loss": -7.353971481323242, "global_step": 188575, "epoch": 4489} {"train_loss": -7.101893424987793, "global_step": 188576, "epoch": 4489} {"train_loss": -7.181797027587891, "global_step": 188577, "epoch": 4489} {"train_loss": -7.127003192901611, "global_step": 188578, "epoch": 4489} {"train_loss": -7.205780256362188, "global_step": 188579, "epoch": 4489, "val_loss": 69540.4609375} {"train_loss": -7.174363136291504, "global_step": 188580, "epoch": 4490} {"train_loss": -7.2449541091918945, "global_step": 188581, "epoch": 4490} {"train_loss": -7.241220474243164, "global_step": 188582, "epoch": 4490} {"train_loss": -7.167762756347656, "global_step": 188583, "epoch": 4490} {"train_loss": -7.158069133758545, "global_step": 188584, "epoch": 4490} {"train_loss": -7.189873695373535, "global_step": 188585, "epoch": 4490} {"train_loss": -7.216527938842773, "global_step": 188586, "epoch": 4490} {"train_loss": -7.117352485656738, "global_step": 188587, "epoch": 4490} {"train_loss": -7.171020030975342, "global_step": 188588, "epoch": 4490} {"train_loss": -7.256951332092285, "global_step": 188589, "epoch": 4490} {"train_loss": -7.195562839508057, "global_step": 188590, "epoch": 4490} {"train_loss": -7.217645168304443, "global_step": 188591, "epoch": 4490} {"train_loss": -7.258208274841309, "global_step": 188592, "epoch": 4490} {"train_loss": -7.186601638793945, "global_step": 188593, "epoch": 4490} {"train_loss": -7.123721599578857, "global_step": 188594, "epoch": 4490} {"train_loss": -7.212389945983887, "global_step": 188595, "epoch": 4490} {"train_loss": -7.162417411804199, "global_step": 188596, "epoch": 4490} {"train_loss": -7.090247631072998, "global_step": 188597, "epoch": 4490} {"train_loss": -7.100274085998535, "global_step": 188598, "epoch": 4490} {"train_loss": -7.16878604888916, "global_step": 188599, "epoch": 4490} {"train_loss": -7.310230255126953, "global_step": 188600, "epoch": 4490} {"train_loss": -7.078238010406494, "global_step": 188601, "epoch": 4490} {"train_loss": -7.07349967956543, "global_step": 188602, "epoch": 4490} {"train_loss": -7.123104572296143, "global_step": 188603, "epoch": 4490} {"train_loss": -7.068259239196777, "global_step": 188604, "epoch": 4490} {"train_loss": -7.225402355194092, "global_step": 188605, "epoch": 4490} {"train_loss": -7.220555305480957, "global_step": 188606, "epoch": 4490} {"train_loss": -7.166196823120117, "global_step": 188607, "epoch": 4490} {"train_loss": -7.172825813293457, "global_step": 188608, "epoch": 4490} {"train_loss": -7.245519161224365, "global_step": 188609, "epoch": 4490} {"train_loss": -7.215677261352539, "global_step": 188610, "epoch": 4490} {"train_loss": -7.12841796875, "global_step": 188611, "epoch": 4490} {"train_loss": -7.226860523223877, "global_step": 188612, "epoch": 4490} {"train_loss": -7.203908920288086, "global_step": 188613, "epoch": 4490} {"train_loss": -7.214044570922852, "global_step": 188614, "epoch": 4490} {"train_loss": -7.232675552368164, "global_step": 188615, "epoch": 4490} {"train_loss": -7.187785625457764, "global_step": 188616, "epoch": 4490} {"train_loss": -7.116710662841797, "global_step": 188617, "epoch": 4490} {"train_loss": -7.257542133331299, "global_step": 188618, "epoch": 4490} {"train_loss": -7.198465824127197, "global_step": 188619, "epoch": 4490} {"train_loss": -7.10957145690918, "global_step": 188620, "epoch": 4490} {"train_loss": -7.182748442604428, "global_step": 188621, "epoch": 4490, "val_loss": 69474.5078125} {"train_loss": -7.20371150970459, "global_step": 188622, "epoch": 4491} {"train_loss": -7.1647539138793945, "global_step": 188623, "epoch": 4491} {"train_loss": -7.310028553009033, "global_step": 188624, "epoch": 4491} {"train_loss": -7.293972492218018, "global_step": 188625, "epoch": 4491} {"train_loss": -7.122784614562988, "global_step": 188626, "epoch": 4491} {"train_loss": -7.133039474487305, "global_step": 188627, "epoch": 4491} {"train_loss": -7.119731426239014, "global_step": 188628, "epoch": 4491} {"train_loss": -7.26336145401001, "global_step": 188629, "epoch": 4491} {"train_loss": -7.341373920440674, "global_step": 188630, "epoch": 4491} {"train_loss": -7.182455062866211, "global_step": 188631, "epoch": 4491} {"train_loss": -7.135166645050049, "global_step": 188632, "epoch": 4491} {"train_loss": -7.316269397735596, "global_step": 188633, "epoch": 4491} {"train_loss": -7.1918230056762695, "global_step": 188634, "epoch": 4491} {"train_loss": -7.096077919006348, "global_step": 188635, "epoch": 4491} {"train_loss": -7.289429664611816, "global_step": 188636, "epoch": 4491} {"train_loss": -7.193869590759277, "global_step": 188637, "epoch": 4491} {"train_loss": -7.2070770263671875, "global_step": 188638, "epoch": 4491} {"train_loss": -6.977419376373291, "global_step": 188639, "epoch": 4491} {"train_loss": -7.18791389465332, "global_step": 188640, "epoch": 4491} {"train_loss": -7.121496200561523, "global_step": 188641, "epoch": 4491} {"train_loss": -7.070732593536377, "global_step": 188642, "epoch": 4491} {"train_loss": -7.116535663604736, "global_step": 188643, "epoch": 4491} {"train_loss": -6.964289665222168, "global_step": 188644, "epoch": 4491} {"train_loss": -7.149227619171143, "global_step": 188645, "epoch": 4491} {"train_loss": -7.063182830810547, "global_step": 188646, "epoch": 4491} {"train_loss": -7.164236545562744, "global_step": 188647, "epoch": 4491} {"train_loss": -7.261219024658203, "global_step": 188648, "epoch": 4491} {"train_loss": -7.096063613891602, "global_step": 188649, "epoch": 4491} {"train_loss": -7.152004718780518, "global_step": 188650, "epoch": 4491} {"train_loss": -7.095364570617676, "global_step": 188651, "epoch": 4491} {"train_loss": -7.158185005187988, "global_step": 188652, "epoch": 4491} {"train_loss": -7.19654655456543, "global_step": 188653, "epoch": 4491} {"train_loss": -7.159488677978516, "global_step": 188654, "epoch": 4491} {"train_loss": -7.264891624450684, "global_step": 188655, "epoch": 4491} {"train_loss": -7.196877479553223, "global_step": 188656, "epoch": 4491} {"train_loss": -7.11093282699585, "global_step": 188657, "epoch": 4491} {"train_loss": -7.112168312072754, "global_step": 188658, "epoch": 4491} {"train_loss": -7.173033237457275, "global_step": 188659, "epoch": 4491} {"train_loss": -7.134864807128906, "global_step": 188660, "epoch": 4491} {"train_loss": -7.036667823791504, "global_step": 188661, "epoch": 4491} {"train_loss": -7.144330978393555, "global_step": 188662, "epoch": 4491} {"train_loss": -7.162946212859381, "global_step": 188663, "epoch": 4491, "val_loss": 69548.9921875} {"train_loss": -7.201085567474365, "global_step": 188664, "epoch": 4492} {"train_loss": -7.140778541564941, "global_step": 188665, "epoch": 4492} {"train_loss": -7.071921348571777, "global_step": 188666, "epoch": 4492} {"train_loss": -7.200245380401611, "global_step": 188667, "epoch": 4492} {"train_loss": -7.128443717956543, "global_step": 188668, "epoch": 4492} {"train_loss": -7.224076271057129, "global_step": 188669, "epoch": 4492} {"train_loss": -7.28956937789917, "global_step": 188670, "epoch": 4492} {"train_loss": -7.189820289611816, "global_step": 188671, "epoch": 4492} {"train_loss": -7.276121616363525, "global_step": 188672, "epoch": 4492} {"train_loss": -7.21916389465332, "global_step": 188673, "epoch": 4492} {"train_loss": -7.2353057861328125, "global_step": 188674, "epoch": 4492} {"train_loss": -7.186947822570801, "global_step": 188675, "epoch": 4492} {"train_loss": -7.258437633514404, "global_step": 188676, "epoch": 4492} {"train_loss": -7.287478923797607, "global_step": 188677, "epoch": 4492} {"train_loss": -7.288120269775391, "global_step": 188678, "epoch": 4492} {"train_loss": -7.2227983474731445, "global_step": 188679, "epoch": 4492} {"train_loss": -7.242938041687012, "global_step": 188680, "epoch": 4492} {"train_loss": -7.313636779785156, "global_step": 188681, "epoch": 4492} {"train_loss": -7.206592559814453, "global_step": 188682, "epoch": 4492} {"train_loss": -7.140427589416504, "global_step": 188683, "epoch": 4492} {"train_loss": -7.224277496337891, "global_step": 188684, "epoch": 4492} {"train_loss": -7.336960792541504, "global_step": 188685, "epoch": 4492} {"train_loss": -7.243264198303223, "global_step": 188686, "epoch": 4492} {"train_loss": -7.265619277954102, "global_step": 188687, "epoch": 4492} {"train_loss": -7.214749813079834, "global_step": 188688, "epoch": 4492} {"train_loss": -7.222233772277832, "global_step": 188689, "epoch": 4492} {"train_loss": -7.16450309753418, "global_step": 188690, "epoch": 4492} {"train_loss": -7.076079368591309, "global_step": 188691, "epoch": 4492} {"train_loss": -7.140252590179443, "global_step": 188692, "epoch": 4492} {"train_loss": -7.235433578491211, "global_step": 188693, "epoch": 4492} {"train_loss": -7.146489143371582, "global_step": 188694, "epoch": 4492} {"train_loss": -7.183107376098633, "global_step": 188695, "epoch": 4492} {"train_loss": -7.027435302734375, "global_step": 188696, "epoch": 4492} {"train_loss": -7.200847148895264, "global_step": 188697, "epoch": 4492} {"train_loss": -7.108534336090088, "global_step": 188698, "epoch": 4492} {"train_loss": -7.140294075012207, "global_step": 188699, "epoch": 4492} {"train_loss": -7.136087894439697, "global_step": 188700, "epoch": 4492} {"train_loss": -7.248273849487305, "global_step": 188701, "epoch": 4492} {"train_loss": -7.144107341766357, "global_step": 188702, "epoch": 4492} {"train_loss": -7.22471809387207, "global_step": 188703, "epoch": 4492} {"train_loss": -7.153341770172119, "global_step": 188704, "epoch": 4492} {"train_loss": -7.1963753927321665, "global_step": 188705, "epoch": 4492, "val_loss": 69554.390625} {"train_loss": -7.163482666015625, "global_step": 188706, "epoch": 4493} {"train_loss": -7.126813888549805, "global_step": 188707, "epoch": 4493} {"train_loss": -7.089366436004639, "global_step": 188708, "epoch": 4493} {"train_loss": -7.109074592590332, "global_step": 188709, "epoch": 4493} {"train_loss": -6.924957275390625, "global_step": 188710, "epoch": 4493} {"train_loss": -7.002580642700195, "global_step": 188711, "epoch": 4493} {"train_loss": -7.104897499084473, "global_step": 188712, "epoch": 4493} {"train_loss": -7.054331302642822, "global_step": 188713, "epoch": 4493} {"train_loss": -7.065016746520996, "global_step": 188714, "epoch": 4493} {"train_loss": -7.113142490386963, "global_step": 188715, "epoch": 4493} {"train_loss": -6.997704982757568, "global_step": 188716, "epoch": 4493} {"train_loss": -7.043989658355713, "global_step": 188717, "epoch": 4493} {"train_loss": -7.042597770690918, "global_step": 188718, "epoch": 4493} {"train_loss": -7.083390235900879, "global_step": 188719, "epoch": 4493} {"train_loss": -7.036144733428955, "global_step": 188720, "epoch": 4493} {"train_loss": -7.109218597412109, "global_step": 188721, "epoch": 4493} {"train_loss": -7.0846266746521, "global_step": 188722, "epoch": 4493} {"train_loss": -7.1036376953125, "global_step": 188723, "epoch": 4493} {"train_loss": -7.208414077758789, "global_step": 188724, "epoch": 4493} {"train_loss": -7.072700500488281, "global_step": 188725, "epoch": 4493} {"train_loss": -7.151473045349121, "global_step": 188726, "epoch": 4493} {"train_loss": -7.2748332023620605, "global_step": 188727, "epoch": 4493} {"train_loss": -7.189663887023926, "global_step": 188728, "epoch": 4493} {"train_loss": -7.166149139404297, "global_step": 188729, "epoch": 4493} {"train_loss": -7.188779830932617, "global_step": 188730, "epoch": 4493} {"train_loss": -7.114418983459473, "global_step": 188731, "epoch": 4493} {"train_loss": -7.04797887802124, "global_step": 188732, "epoch": 4493} {"train_loss": -7.170169830322266, "global_step": 188733, "epoch": 4493} {"train_loss": -7.141528129577637, "global_step": 188734, "epoch": 4493} {"train_loss": -7.124888896942139, "global_step": 188735, "epoch": 4493} {"train_loss": -7.142805099487305, "global_step": 188736, "epoch": 4493} {"train_loss": -7.133191108703613, "global_step": 188737, "epoch": 4493} {"train_loss": -7.2278971672058105, "global_step": 188738, "epoch": 4493} {"train_loss": -7.291201591491699, "global_step": 188739, "epoch": 4493} {"train_loss": -7.255762100219727, "global_step": 188740, "epoch": 4493} {"train_loss": -7.037242412567139, "global_step": 188741, "epoch": 4493} {"train_loss": -7.305992126464844, "global_step": 188742, "epoch": 4493} {"train_loss": -7.220041751861572, "global_step": 188743, "epoch": 4493} {"train_loss": -7.248513221740723, "global_step": 188744, "epoch": 4493} {"train_loss": -7.203740119934082, "global_step": 188745, "epoch": 4493} {"train_loss": -7.301755905151367, "global_step": 188746, "epoch": 4493} {"train_loss": -7.134751229059129, "global_step": 188747, "epoch": 4493, "val_loss": 69396.3515625} {"train_loss": -7.158478736877441, "global_step": 188748, "epoch": 4494} {"train_loss": -7.335904121398926, "global_step": 188749, "epoch": 4494} {"train_loss": -7.159001350402832, "global_step": 188750, "epoch": 4494} {"train_loss": -7.13651180267334, "global_step": 188751, "epoch": 4494} {"train_loss": -7.2305827140808105, "global_step": 188752, "epoch": 4494} {"train_loss": -7.209752082824707, "global_step": 188753, "epoch": 4494} {"train_loss": -7.287590980529785, "global_step": 188754, "epoch": 4494} {"train_loss": -7.246843338012695, "global_step": 188755, "epoch": 4494} {"train_loss": -7.204860687255859, "global_step": 188756, "epoch": 4494} {"train_loss": -7.214413642883301, "global_step": 188757, "epoch": 4494} {"train_loss": -7.157340049743652, "global_step": 188758, "epoch": 4494} {"train_loss": -7.249603271484375, "global_step": 188759, "epoch": 4494} {"train_loss": -7.167857646942139, "global_step": 188760, "epoch": 4494} {"train_loss": -7.151889324188232, "global_step": 188761, "epoch": 4494} {"train_loss": -7.230247497558594, "global_step": 188762, "epoch": 4494} {"train_loss": -7.323760032653809, "global_step": 188763, "epoch": 4494} {"train_loss": -7.212555885314941, "global_step": 188764, "epoch": 4494} {"train_loss": -7.251991271972656, "global_step": 188765, "epoch": 4494} {"train_loss": -7.270915985107422, "global_step": 188766, "epoch": 4494} {"train_loss": -7.077728748321533, "global_step": 188767, "epoch": 4494} {"train_loss": -7.154882431030273, "global_step": 188768, "epoch": 4494} {"train_loss": -7.02203369140625, "global_step": 188769, "epoch": 4494} {"train_loss": -7.201727867126465, "global_step": 188770, "epoch": 4494} {"train_loss": -7.020681381225586, "global_step": 188771, "epoch": 4494} {"train_loss": -7.206600189208984, "global_step": 188772, "epoch": 4494} {"train_loss": -7.112841606140137, "global_step": 188773, "epoch": 4494} {"train_loss": -6.982099533081055, "global_step": 188774, "epoch": 4494} {"train_loss": -7.183204174041748, "global_step": 188775, "epoch": 4494} {"train_loss": -6.983458995819092, "global_step": 188776, "epoch": 4494} {"train_loss": -7.106655597686768, "global_step": 188777, "epoch": 4494} {"train_loss": -7.162256240844727, "global_step": 188778, "epoch": 4494} {"train_loss": -7.09462833404541, "global_step": 188779, "epoch": 4494} {"train_loss": -7.071331977844238, "global_step": 188780, "epoch": 4494} {"train_loss": -7.159651756286621, "global_step": 188781, "epoch": 4494} {"train_loss": -7.150649547576904, "global_step": 188782, "epoch": 4494} {"train_loss": -7.254146575927734, "global_step": 188783, "epoch": 4494} {"train_loss": -7.220945358276367, "global_step": 188784, "epoch": 4494} {"train_loss": -7.141198635101318, "global_step": 188785, "epoch": 4494} {"train_loss": -7.276532173156738, "global_step": 188786, "epoch": 4494} {"train_loss": -7.229371547698975, "global_step": 188787, "epoch": 4494} {"train_loss": -7.17716121673584, "global_step": 188788, "epoch": 4494} {"train_loss": -7.176898343222482, "global_step": 188789, "epoch": 4494, "val_loss": 69591.5390625} {"train_loss": -7.231877326965332, "global_step": 188790, "epoch": 4495} {"train_loss": -7.1542510986328125, "global_step": 188791, "epoch": 4495} {"train_loss": -7.22806978225708, "global_step": 188792, "epoch": 4495} {"train_loss": -7.181699752807617, "global_step": 188793, "epoch": 4495} {"train_loss": -7.197767734527588, "global_step": 188794, "epoch": 4495} {"train_loss": -7.172101020812988, "global_step": 188795, "epoch": 4495} {"train_loss": -7.191670894622803, "global_step": 188796, "epoch": 4495} {"train_loss": -7.200274467468262, "global_step": 188797, "epoch": 4495} {"train_loss": -7.263747215270996, "global_step": 188798, "epoch": 4495} {"train_loss": -7.083085060119629, "global_step": 188799, "epoch": 4495} {"train_loss": -7.291151523590088, "global_step": 188800, "epoch": 4495} {"train_loss": -7.222405910491943, "global_step": 188801, "epoch": 4495} {"train_loss": -7.224120140075684, "global_step": 188802, "epoch": 4495} {"train_loss": -7.343559265136719, "global_step": 188803, "epoch": 4495} {"train_loss": -7.1668500900268555, "global_step": 188804, "epoch": 4495} {"train_loss": -7.200447082519531, "global_step": 188805, "epoch": 4495} {"train_loss": -7.185921669006348, "global_step": 188806, "epoch": 4495} {"train_loss": -7.2040910720825195, "global_step": 188807, "epoch": 4495} {"train_loss": -7.255873680114746, "global_step": 188808, "epoch": 4495} {"train_loss": -7.26566743850708, "global_step": 188809, "epoch": 4495} {"train_loss": -7.206600189208984, "global_step": 188810, "epoch": 4495} {"train_loss": -7.218510627746582, "global_step": 188811, "epoch": 4495} {"train_loss": -7.18647575378418, "global_step": 188812, "epoch": 4495} {"train_loss": -7.168299674987793, "global_step": 188813, "epoch": 4495} {"train_loss": -7.093106269836426, "global_step": 188814, "epoch": 4495} {"train_loss": -7.24210262298584, "global_step": 188815, "epoch": 4495} {"train_loss": -7.073602676391602, "global_step": 188816, "epoch": 4495} {"train_loss": -7.143786430358887, "global_step": 188817, "epoch": 4495} {"train_loss": -7.06285285949707, "global_step": 188818, "epoch": 4495} {"train_loss": -7.010749816894531, "global_step": 188819, "epoch": 4495} {"train_loss": -7.057692050933838, "global_step": 188820, "epoch": 4495} {"train_loss": -7.1200175285339355, "global_step": 188821, "epoch": 4495} {"train_loss": -7.199074745178223, "global_step": 188822, "epoch": 4495} {"train_loss": -7.191466808319092, "global_step": 188823, "epoch": 4495} {"train_loss": -7.137093544006348, "global_step": 188824, "epoch": 4495} {"train_loss": -7.100830078125, "global_step": 188825, "epoch": 4495} {"train_loss": -7.178781509399414, "global_step": 188826, "epoch": 4495} {"train_loss": -7.180389404296875, "global_step": 188827, "epoch": 4495} {"train_loss": -7.073958873748779, "global_step": 188828, "epoch": 4495} {"train_loss": -7.1280107498168945, "global_step": 188829, "epoch": 4495} {"train_loss": -7.1806488037109375, "global_step": 188830, "epoch": 4495} {"train_loss": -7.174534650076003, "global_step": 188831, "epoch": 4495, "val_loss": 69775.25} {"train_loss": -7.143143177032471, "global_step": 188832, "epoch": 4496} {"train_loss": -7.319958686828613, "global_step": 188833, "epoch": 4496} {"train_loss": -7.087067604064941, "global_step": 188834, "epoch": 4496} {"train_loss": -7.231666564941406, "global_step": 188835, "epoch": 4496} {"train_loss": -7.189602375030518, "global_step": 188836, "epoch": 4496} {"train_loss": -7.097667694091797, "global_step": 188837, "epoch": 4496} {"train_loss": -7.159304141998291, "global_step": 188838, "epoch": 4496} {"train_loss": -7.072163105010986, "global_step": 188839, "epoch": 4496} {"train_loss": -7.209928512573242, "global_step": 188840, "epoch": 4496} {"train_loss": -7.175079345703125, "global_step": 188841, "epoch": 4496} {"train_loss": -7.2264404296875, "global_step": 188842, "epoch": 4496} {"train_loss": -7.172305107116699, "global_step": 188843, "epoch": 4496} {"train_loss": -7.129588603973389, "global_step": 188844, "epoch": 4496} {"train_loss": -7.340656280517578, "global_step": 188845, "epoch": 4496} {"train_loss": -7.202472686767578, "global_step": 188846, "epoch": 4496} {"train_loss": -7.202349662780762, "global_step": 188847, "epoch": 4496} {"train_loss": -7.173843860626221, "global_step": 188848, "epoch": 4496} {"train_loss": -7.287829875946045, "global_step": 188849, "epoch": 4496} {"train_loss": -7.178131103515625, "global_step": 188850, "epoch": 4496} {"train_loss": -7.265486717224121, "global_step": 188851, "epoch": 4496} {"train_loss": -7.2922163009643555, "global_step": 188852, "epoch": 4496} {"train_loss": -7.20168399810791, "global_step": 188853, "epoch": 4496} {"train_loss": -7.124506950378418, "global_step": 188854, "epoch": 4496} {"train_loss": -7.140380859375, "global_step": 188855, "epoch": 4496} {"train_loss": -7.2459611892700195, "global_step": 188856, "epoch": 4496} {"train_loss": -7.228344917297363, "global_step": 188857, "epoch": 4496} {"train_loss": -7.158376693725586, "global_step": 188858, "epoch": 4496} {"train_loss": -7.301541805267334, "global_step": 188859, "epoch": 4496} {"train_loss": -7.212827682495117, "global_step": 188860, "epoch": 4496} {"train_loss": -7.237453460693359, "global_step": 188861, "epoch": 4496} {"train_loss": -7.194159507751465, "global_step": 188862, "epoch": 4496} {"train_loss": -7.175883769989014, "global_step": 188863, "epoch": 4496} {"train_loss": -7.110921859741211, "global_step": 188864, "epoch": 4496} {"train_loss": -7.175352096557617, "global_step": 188865, "epoch": 4496} {"train_loss": -7.224118232727051, "global_step": 188866, "epoch": 4496} {"train_loss": -7.236982345581055, "global_step": 188867, "epoch": 4496} {"train_loss": -7.238915920257568, "global_step": 188868, "epoch": 4496} {"train_loss": -7.101480960845947, "global_step": 188869, "epoch": 4496} {"train_loss": -7.146280288696289, "global_step": 188870, "epoch": 4496} {"train_loss": -7.306666374206543, "global_step": 188871, "epoch": 4496} {"train_loss": -7.1827497482299805, "global_step": 188872, "epoch": 4496} {"train_loss": -7.195293369747343, "global_step": 188873, "epoch": 4496, "val_loss": 69642.421875} {"train_loss": -7.239632606506348, "global_step": 188874, "epoch": 4497} {"train_loss": -7.274132251739502, "global_step": 188875, "epoch": 4497} {"train_loss": -7.170497417449951, "global_step": 188876, "epoch": 4497} {"train_loss": -7.161275863647461, "global_step": 188877, "epoch": 4497} {"train_loss": -7.1505842208862305, "global_step": 188878, "epoch": 4497} {"train_loss": -7.337310791015625, "global_step": 188879, "epoch": 4497} {"train_loss": -7.230249404907227, "global_step": 188880, "epoch": 4497} {"train_loss": -7.193131923675537, "global_step": 188881, "epoch": 4497} {"train_loss": -7.235876083374023, "global_step": 188882, "epoch": 4497} {"train_loss": -7.244322776794434, "global_step": 188883, "epoch": 4497} {"train_loss": -7.249224662780762, "global_step": 188884, "epoch": 4497} {"train_loss": -7.017403602600098, "global_step": 188885, "epoch": 4497} {"train_loss": -7.153639793395996, "global_step": 188886, "epoch": 4497} {"train_loss": -7.217120170593262, "global_step": 188887, "epoch": 4497} {"train_loss": -7.223609924316406, "global_step": 188888, "epoch": 4497} {"train_loss": -7.193824291229248, "global_step": 188889, "epoch": 4497} {"train_loss": -7.241161346435547, "global_step": 188890, "epoch": 4497} {"train_loss": -7.106083869934082, "global_step": 188891, "epoch": 4497} {"train_loss": -7.157935619354248, "global_step": 188892, "epoch": 4497} {"train_loss": -7.081494331359863, "global_step": 188893, "epoch": 4497} {"train_loss": -7.126687049865723, "global_step": 188894, "epoch": 4497} {"train_loss": -7.017106056213379, "global_step": 188895, "epoch": 4497} {"train_loss": -7.129842758178711, "global_step": 188896, "epoch": 4497} {"train_loss": -7.230645179748535, "global_step": 188897, "epoch": 4497} {"train_loss": -7.164676666259766, "global_step": 188898, "epoch": 4497} {"train_loss": -7.320308208465576, "global_step": 188899, "epoch": 4497} {"train_loss": -7.174399375915527, "global_step": 188900, "epoch": 4497} {"train_loss": -7.260125160217285, "global_step": 188901, "epoch": 4497} {"train_loss": -7.261584281921387, "global_step": 188902, "epoch": 4497} {"train_loss": -7.199816703796387, "global_step": 188903, "epoch": 4497} {"train_loss": -7.320396423339844, "global_step": 188904, "epoch": 4497} {"train_loss": -7.250614643096924, "global_step": 188905, "epoch": 4497} {"train_loss": -7.128020763397217, "global_step": 188906, "epoch": 4497} {"train_loss": -7.241422176361084, "global_step": 188907, "epoch": 4497} {"train_loss": -7.211912155151367, "global_step": 188908, "epoch": 4497} {"train_loss": -6.997215747833252, "global_step": 188909, "epoch": 4497} {"train_loss": -7.2387542724609375, "global_step": 188910, "epoch": 4497} {"train_loss": -7.186517715454102, "global_step": 188911, "epoch": 4497} {"train_loss": -7.301601886749268, "global_step": 188912, "epoch": 4497} {"train_loss": -7.224037170410156, "global_step": 188913, "epoch": 4497} {"train_loss": -7.083566665649414, "global_step": 188914, "epoch": 4497} {"train_loss": -7.194563593183245, "global_step": 188915, "epoch": 4497, "val_loss": 69618.2578125} {"train_loss": -7.263113498687744, "global_step": 188916, "epoch": 4498} {"train_loss": -7.067689895629883, "global_step": 188917, "epoch": 4498} {"train_loss": -7.221643447875977, "global_step": 188918, "epoch": 4498} {"train_loss": -7.214250087738037, "global_step": 188919, "epoch": 4498} {"train_loss": -7.1676926612854, "global_step": 188920, "epoch": 4498} {"train_loss": -7.202703952789307, "global_step": 188921, "epoch": 4498} {"train_loss": -7.192758560180664, "global_step": 188922, "epoch": 4498} {"train_loss": -7.14176607131958, "global_step": 188923, "epoch": 4498} {"train_loss": -7.064830303192139, "global_step": 188924, "epoch": 4498} {"train_loss": -7.083804130554199, "global_step": 188925, "epoch": 4498} {"train_loss": -7.1240234375, "global_step": 188926, "epoch": 4498} {"train_loss": -7.1778459548950195, "global_step": 188927, "epoch": 4498} {"train_loss": -7.153386116027832, "global_step": 188928, "epoch": 4498} {"train_loss": -7.20919942855835, "global_step": 188929, "epoch": 4498} {"train_loss": -7.242743492126465, "global_step": 188930, "epoch": 4498} {"train_loss": -7.340588569641113, "global_step": 188931, "epoch": 4498} {"train_loss": -7.275493621826172, "global_step": 188932, "epoch": 4498} {"train_loss": -7.139111518859863, "global_step": 188933, "epoch": 4498} {"train_loss": -7.212261199951172, "global_step": 188934, "epoch": 4498} {"train_loss": -7.122274398803711, "global_step": 188935, "epoch": 4498} {"train_loss": -7.258100509643555, "global_step": 188936, "epoch": 4498} {"train_loss": -7.28098201751709, "global_step": 188937, "epoch": 4498} {"train_loss": -7.208389759063721, "global_step": 188938, "epoch": 4498} {"train_loss": -7.161738872528076, "global_step": 188939, "epoch": 4498} {"train_loss": -7.112863540649414, "global_step": 188940, "epoch": 4498} {"train_loss": -7.127409934997559, "global_step": 188941, "epoch": 4498} {"train_loss": -7.1035661697387695, "global_step": 188942, "epoch": 4498} {"train_loss": -7.128549575805664, "global_step": 188943, "epoch": 4498} {"train_loss": -7.227455139160156, "global_step": 188944, "epoch": 4498} {"train_loss": -7.151782989501953, "global_step": 188945, "epoch": 4498} {"train_loss": -6.946689605712891, "global_step": 188946, "epoch": 4498} {"train_loss": -7.031659126281738, "global_step": 188947, "epoch": 4498} {"train_loss": -7.171143531799316, "global_step": 188948, "epoch": 4498} {"train_loss": -7.107635498046875, "global_step": 188949, "epoch": 4498} {"train_loss": -7.154098033905029, "global_step": 188950, "epoch": 4498} {"train_loss": -7.118907928466797, "global_step": 188951, "epoch": 4498} {"train_loss": -6.968798637390137, "global_step": 188952, "epoch": 4498} {"train_loss": -7.152895927429199, "global_step": 188953, "epoch": 4498} {"train_loss": -7.1363701820373535, "global_step": 188954, "epoch": 4498} {"train_loss": -6.9899492263793945, "global_step": 188955, "epoch": 4498} {"train_loss": -7.0832109451293945, "global_step": 188956, "epoch": 4498} {"train_loss": -7.151759045464652, "global_step": 188957, "epoch": 4498, "val_loss": 69649.6875} {"train_loss": -7.091556072235107, "global_step": 188958, "epoch": 4499} {"train_loss": -7.10797119140625, "global_step": 188959, "epoch": 4499} {"train_loss": -7.100101947784424, "global_step": 188960, "epoch": 4499} {"train_loss": -7.214589595794678, "global_step": 188961, "epoch": 4499} {"train_loss": -7.07252311706543, "global_step": 188962, "epoch": 4499} {"train_loss": -7.106544494628906, "global_step": 188963, "epoch": 4499} {"train_loss": -7.0551910400390625, "global_step": 188964, "epoch": 4499} {"train_loss": -7.218060493469238, "global_step": 188965, "epoch": 4499} {"train_loss": -7.090511322021484, "global_step": 188966, "epoch": 4499} {"train_loss": -7.1225175857543945, "global_step": 188967, "epoch": 4499} {"train_loss": -7.2033891677856445, "global_step": 188968, "epoch": 4499} {"train_loss": -7.101871013641357, "global_step": 188969, "epoch": 4499} {"train_loss": -7.024946212768555, "global_step": 188970, "epoch": 4499} {"train_loss": -7.067203521728516, "global_step": 188971, "epoch": 4499} {"train_loss": -7.074201583862305, "global_step": 188972, "epoch": 4499} {"train_loss": -7.16495418548584, "global_step": 188973, "epoch": 4499} {"train_loss": -7.150545597076416, "global_step": 188974, "epoch": 4499} {"train_loss": -7.063827037811279, "global_step": 188975, "epoch": 4499} {"train_loss": -7.1774001121521, "global_step": 188976, "epoch": 4499} {"train_loss": -7.057882785797119, "global_step": 188977, "epoch": 4499} {"train_loss": -7.192863464355469, "global_step": 188978, "epoch": 4499} {"train_loss": -7.131411552429199, "global_step": 188979, "epoch": 4499} {"train_loss": -7.141822814941406, "global_step": 188980, "epoch": 4499} {"train_loss": -7.1030988693237305, "global_step": 188981, "epoch": 4499} {"train_loss": -7.153538703918457, "global_step": 188982, "epoch": 4499} {"train_loss": -7.235281467437744, "global_step": 188983, "epoch": 4499} {"train_loss": -7.064894199371338, "global_step": 188984, "epoch": 4499} {"train_loss": -7.1186017990112305, "global_step": 188985, "epoch": 4499} {"train_loss": -7.182443618774414, "global_step": 188986, "epoch": 4499} {"train_loss": -7.04654598236084, "global_step": 188987, "epoch": 4499} {"train_loss": -7.119441032409668, "global_step": 188988, "epoch": 4499} {"train_loss": -7.0667548179626465, "global_step": 188989, "epoch": 4499} {"train_loss": -7.145010948181152, "global_step": 188990, "epoch": 4499} {"train_loss": -7.1800737380981445, "global_step": 188991, "epoch": 4499} {"train_loss": -7.201315879821777, "global_step": 188992, "epoch": 4499} {"train_loss": -7.16715145111084, "global_step": 188993, "epoch": 4499} {"train_loss": -7.235500335693359, "global_step": 188994, "epoch": 4499} {"train_loss": -7.125563144683838, "global_step": 188995, "epoch": 4499} {"train_loss": -7.077779769897461, "global_step": 188996, "epoch": 4499} {"train_loss": -7.227144241333008, "global_step": 188997, "epoch": 4499} {"train_loss": -7.105238437652588, "global_step": 188998, "epoch": 4499} {"train_loss": -7.129549389793759, "global_step": 188999, "epoch": 4499, "val_loss": 69510.828125} {"train_loss": -7.249016761779785, "global_step": 189000, "epoch": 4500} {"train_loss": -7.117964744567871, "global_step": 189001, "epoch": 4500} {"train_loss": -7.040562152862549, "global_step": 189002, "epoch": 4500} {"train_loss": -7.236169815063477, "global_step": 189003, "epoch": 4500} {"train_loss": -7.247647762298584, "global_step": 189004, "epoch": 4500} {"train_loss": -7.138459205627441, "global_step": 189005, "epoch": 4500} {"train_loss": -7.142397403717041, "global_step": 189006, "epoch": 4500} {"train_loss": -7.250048637390137, "global_step": 189007, "epoch": 4500} {"train_loss": -6.977543830871582, "global_step": 189008, "epoch": 4500} {"train_loss": -7.1709489822387695, "global_step": 189009, "epoch": 4500} {"train_loss": -7.234223365783691, "global_step": 189010, "epoch": 4500} {"train_loss": -7.238579750061035, "global_step": 189011, "epoch": 4500} {"train_loss": -7.295917510986328, "global_step": 189012, "epoch": 4500} {"train_loss": -7.143576622009277, "global_step": 189013, "epoch": 4500} {"train_loss": -7.233178615570068, "global_step": 189014, "epoch": 4500} {"train_loss": -7.181818008422852, "global_step": 189015, "epoch": 4500} {"train_loss": -7.121983051300049, "global_step": 189016, "epoch": 4500} {"train_loss": -7.1348114013671875, "global_step": 189017, "epoch": 4500} {"train_loss": -7.243503093719482, "global_step": 189018, "epoch": 4500} {"train_loss": -7.189518928527832, "global_step": 189019, "epoch": 4500} {"train_loss": -7.173547267913818, "global_step": 189020, "epoch": 4500} {"train_loss": -7.258522033691406, "global_step": 189021, "epoch": 4500} {"train_loss": -7.209961891174316, "global_step": 189022, "epoch": 4500} {"train_loss": -7.236445426940918, "global_step": 189023, "epoch": 4500} {"train_loss": -7.187460899353027, "global_step": 189024, "epoch": 4500} {"train_loss": -7.2092766761779785, "global_step": 189025, "epoch": 4500} {"train_loss": -7.1812744140625, "global_step": 189026, "epoch": 4500} {"train_loss": -7.186427116394043, "global_step": 189027, "epoch": 4500} {"train_loss": -7.198929309844971, "global_step": 189028, "epoch": 4500} {"train_loss": -7.18879508972168, "global_step": 189029, "epoch": 4500} {"train_loss": -7.155993461608887, "global_step": 189030, "epoch": 4500} {"train_loss": -7.167910099029541, "global_step": 189031, "epoch": 4500} {"train_loss": -7.171396732330322, "global_step": 189032, "epoch": 4500} {"train_loss": -7.267406463623047, "global_step": 189033, "epoch": 4500} {"train_loss": -7.13519287109375, "global_step": 189034, "epoch": 4500} {"train_loss": -7.183879375457764, "global_step": 189035, "epoch": 4500} {"train_loss": -7.19348669052124, "global_step": 189036, "epoch": 4500} {"train_loss": -7.19806432723999, "global_step": 189037, "epoch": 4500} {"train_loss": -7.192751884460449, "global_step": 189038, "epoch": 4500} {"train_loss": -7.096710205078125, "global_step": 189039, "epoch": 4500} {"train_loss": -7.128909111022949, "global_step": 189040, "epoch": 4500} {"train_loss": -7.187102022625151, "global_step": 189041, "epoch": 4500, "train/sim_max_reward_0": 0.9205088286635384, "train/sim_max_reward_1": 0.9578019082885018, "train/sim_max_reward_2": 0.5542562501623949, "train/sim_max_reward_3": 0.8511566533280174, "train/sim_max_reward_4": 0.9844053821762301, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.8800092065395743, "test/sim_max_reward_4300001": 0.6638558349883102, "test/sim_max_reward_4300002": 0.8646556253876925, "test/sim_max_reward_4300003": 0.9232166203208593, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.3157953249481369, "test/sim_max_reward_4300008": 0.9095094740094133, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.895278704142039, "test/sim_max_reward_4300011": 0.5356768834911767, "test/sim_max_reward_4300012": 0.9439314670829848, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 0.9156106007869816, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.4655505767906915, "test/sim_max_reward_4300017": 0.8250216371228531, "test/sim_max_reward_4300018": 0.4139027245914926, "test/sim_max_reward_4300019": 0.18596472851519932, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.8883875863316304, "test/sim_max_reward_4300022": 0.9890217974750105, "test/sim_max_reward_4300023": 0.4363791407685296, "test/sim_max_reward_4300024": 0.6820164362583565, "test/sim_max_reward_4300025": 0.8993987367377001, "test/sim_max_reward_4300026": 0.1787557868283087, "test/sim_max_reward_4300027": 0.8294918165795812, "test/sim_max_reward_4300028": 0.959619558609811, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.2588999325411608, "test/sim_max_reward_4300031": 0.5879022034658874, "test/sim_max_reward_4300032": 0.9890827371177494, "test/sim_max_reward_4300033": 0.6250287095245222, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.23427011213972576, "test/sim_max_reward_4300036": 0.2087900369514994, "test/sim_max_reward_4300037": 0.9327602867973479, "test/sim_max_reward_4300038": 0.9718091256230836, "test/sim_max_reward_4300039": 0.7846954155485526, "test/sim_max_reward_4300040": 0.8640427794828547, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7149257034351421, "test/sim_max_reward_4300043": 0.13388313216860084, "test/sim_max_reward_4300044": 0.04369426015635423, "test/sim_max_reward_4300045": 0.9573122600917061, "test/sim_max_reward_4300046": 0.8494519201878367, "test/sim_max_reward_4300047": 0.15030373715067089, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.1961294376782645, "train/mean_score": 0.7435189636634784, "test/mean_score": 0.5823973232635317, "val_loss": 69608.8515625} {"train_loss": -7.1505327224731445, "global_step": 189042, "epoch": 4501} {"train_loss": -7.135024547576904, "global_step": 189043, "epoch": 4501} {"train_loss": -7.150124549865723, "global_step": 189044, "epoch": 4501} {"train_loss": -7.148564338684082, "global_step": 189045, "epoch": 4501} {"train_loss": -7.167000770568848, "global_step": 189046, "epoch": 4501} {"train_loss": -6.977351188659668, "global_step": 189047, "epoch": 4501} {"train_loss": -7.174598693847656, "global_step": 189048, "epoch": 4501} {"train_loss": -7.304747581481934, "global_step": 189049, "epoch": 4501} {"train_loss": -6.947419166564941, "global_step": 189050, "epoch": 4501} {"train_loss": -6.9803361892700195, "global_step": 189051, "epoch": 4501} {"train_loss": -7.194136619567871, "global_step": 189052, "epoch": 4501} {"train_loss": -6.985811233520508, "global_step": 189053, "epoch": 4501} {"train_loss": -7.142244338989258, "global_step": 189054, "epoch": 4501} {"train_loss": -7.158939361572266, "global_step": 189055, "epoch": 4501} {"train_loss": -7.024941444396973, "global_step": 189056, "epoch": 4501} {"train_loss": -7.254306316375732, "global_step": 189057, "epoch": 4501} {"train_loss": -7.162452220916748, "global_step": 189058, "epoch": 4501} {"train_loss": -7.137420654296875, "global_step": 189059, "epoch": 4501} {"train_loss": -7.2144999504089355, "global_step": 189060, "epoch": 4501} {"train_loss": -7.189801216125488, "global_step": 189061, "epoch": 4501} {"train_loss": -7.232297897338867, "global_step": 189062, "epoch": 4501} {"train_loss": -7.218633651733398, "global_step": 189063, "epoch": 4501} {"train_loss": -7.1711225509643555, "global_step": 189064, "epoch": 4501} {"train_loss": -7.232743263244629, "global_step": 189065, "epoch": 4501} {"train_loss": -7.291481971740723, "global_step": 189066, "epoch": 4501} {"train_loss": -7.233066558837891, "global_step": 189067, "epoch": 4501} {"train_loss": -7.243526458740234, "global_step": 189068, "epoch": 4501} {"train_loss": -7.214176177978516, "global_step": 189069, "epoch": 4501} {"train_loss": -7.209157466888428, "global_step": 189070, "epoch": 4501} {"train_loss": -7.2588210105896, "global_step": 189071, "epoch": 4501} {"train_loss": -7.27241325378418, "global_step": 189072, "epoch": 4501} {"train_loss": -7.222047328948975, "global_step": 189073, "epoch": 4501} {"train_loss": -7.206552505493164, "global_step": 189074, "epoch": 4501} {"train_loss": -7.1925368309021, "global_step": 189075, "epoch": 4501} {"train_loss": -7.2505269050598145, "global_step": 189076, "epoch": 4501} {"train_loss": -7.120865345001221, "global_step": 189077, "epoch": 4501} {"train_loss": -7.1666154861450195, "global_step": 189078, "epoch": 4501} {"train_loss": -7.26613712310791, "global_step": 189079, "epoch": 4501} {"train_loss": -7.141289710998535, "global_step": 189080, "epoch": 4501} {"train_loss": -7.1341166496276855, "global_step": 189081, "epoch": 4501} {"train_loss": -7.0953240394592285, "global_step": 189082, "epoch": 4501} {"train_loss": -7.169929890405564, "global_step": 189083, "epoch": 4501, "val_loss": 69451.5546875} {"train_loss": -7.210562705993652, "global_step": 189084, "epoch": 4502} {"train_loss": -7.264060974121094, "global_step": 189085, "epoch": 4502} {"train_loss": -7.301637172698975, "global_step": 189086, "epoch": 4502} {"train_loss": -7.1386213302612305, "global_step": 189087, "epoch": 4502} {"train_loss": -7.2880754470825195, "global_step": 189088, "epoch": 4502} {"train_loss": -7.297119140625, "global_step": 189089, "epoch": 4502} {"train_loss": -7.2008843421936035, "global_step": 189090, "epoch": 4502} {"train_loss": -7.110170364379883, "global_step": 189091, "epoch": 4502} {"train_loss": -7.117341041564941, "global_step": 189092, "epoch": 4502} {"train_loss": -7.238197326660156, "global_step": 189093, "epoch": 4502} {"train_loss": -7.272493839263916, "global_step": 189094, "epoch": 4502} {"train_loss": -7.219514846801758, "global_step": 189095, "epoch": 4502} {"train_loss": -7.220155239105225, "global_step": 189096, "epoch": 4502} {"train_loss": -7.294201850891113, "global_step": 189097, "epoch": 4502} {"train_loss": -7.146111965179443, "global_step": 189098, "epoch": 4502} {"train_loss": -7.2058258056640625, "global_step": 189099, "epoch": 4502} {"train_loss": -7.187167167663574, "global_step": 189100, "epoch": 4502} {"train_loss": -7.281218528747559, "global_step": 189101, "epoch": 4502} {"train_loss": -7.14901876449585, "global_step": 189102, "epoch": 4502} {"train_loss": -7.2278523445129395, "global_step": 189103, "epoch": 4502} {"train_loss": -7.192166805267334, "global_step": 189104, "epoch": 4502} {"train_loss": -7.0889997482299805, "global_step": 189105, "epoch": 4502} {"train_loss": -7.167004108428955, "global_step": 189106, "epoch": 4502} {"train_loss": -7.216917037963867, "global_step": 189107, "epoch": 4502} {"train_loss": -7.181329727172852, "global_step": 189108, "epoch": 4502} {"train_loss": -7.191399574279785, "global_step": 189109, "epoch": 4502} {"train_loss": -7.169058799743652, "global_step": 189110, "epoch": 4502} {"train_loss": -7.174969673156738, "global_step": 189111, "epoch": 4502} {"train_loss": -7.055779457092285, "global_step": 189112, "epoch": 4502} {"train_loss": -7.029026031494141, "global_step": 189113, "epoch": 4502} {"train_loss": -7.10223913192749, "global_step": 189114, "epoch": 4502} {"train_loss": -7.154840469360352, "global_step": 189115, "epoch": 4502} {"train_loss": -7.282922267913818, "global_step": 189116, "epoch": 4502} {"train_loss": -7.100144863128662, "global_step": 189117, "epoch": 4502} {"train_loss": -7.221759796142578, "global_step": 189118, "epoch": 4502} {"train_loss": -7.271800994873047, "global_step": 189119, "epoch": 4502} {"train_loss": -7.1429548263549805, "global_step": 189120, "epoch": 4502} {"train_loss": -7.13314151763916, "global_step": 189121, "epoch": 4502} {"train_loss": -7.081178665161133, "global_step": 189122, "epoch": 4502} {"train_loss": -7.137015342712402, "global_step": 189123, "epoch": 4502} {"train_loss": -7.101536750793457, "global_step": 189124, "epoch": 4502} {"train_loss": -7.184556643168132, "global_step": 189125, "epoch": 4502, "val_loss": 69677.8046875} {"train_loss": -7.131043434143066, "global_step": 189126, "epoch": 4503} {"train_loss": -7.229114532470703, "global_step": 189127, "epoch": 4503} {"train_loss": -7.183608055114746, "global_step": 189128, "epoch": 4503} {"train_loss": -7.185328483581543, "global_step": 189129, "epoch": 4503} {"train_loss": -7.1078290939331055, "global_step": 189130, "epoch": 4503} {"train_loss": -7.156314849853516, "global_step": 189131, "epoch": 4503} {"train_loss": -7.170480728149414, "global_step": 189132, "epoch": 4503} {"train_loss": -7.132430076599121, "global_step": 189133, "epoch": 4503} {"train_loss": -7.21168327331543, "global_step": 189134, "epoch": 4503} {"train_loss": -7.206822395324707, "global_step": 189135, "epoch": 4503} {"train_loss": -7.164932727813721, "global_step": 189136, "epoch": 4503} {"train_loss": -7.1895036697387695, "global_step": 189137, "epoch": 4503} {"train_loss": -7.217312812805176, "global_step": 189138, "epoch": 4503} {"train_loss": -7.24935245513916, "global_step": 189139, "epoch": 4503} {"train_loss": -7.193798065185547, "global_step": 189140, "epoch": 4503} {"train_loss": -7.2311906814575195, "global_step": 189141, "epoch": 4503} {"train_loss": -7.152030944824219, "global_step": 189142, "epoch": 4503} {"train_loss": -7.251589775085449, "global_step": 189143, "epoch": 4503} {"train_loss": -7.165999412536621, "global_step": 189144, "epoch": 4503} {"train_loss": -7.146112442016602, "global_step": 189145, "epoch": 4503} {"train_loss": -7.173395156860352, "global_step": 189146, "epoch": 4503} {"train_loss": -7.133498191833496, "global_step": 189147, "epoch": 4503} {"train_loss": -7.097012996673584, "global_step": 189148, "epoch": 4503} {"train_loss": -7.230185031890869, "global_step": 189149, "epoch": 4503} {"train_loss": -6.898958206176758, "global_step": 189150, "epoch": 4503} {"train_loss": -7.110534191131592, "global_step": 189151, "epoch": 4503} {"train_loss": -7.121445655822754, "global_step": 189152, "epoch": 4503} {"train_loss": -7.193140029907227, "global_step": 189153, "epoch": 4503} {"train_loss": -7.183929443359375, "global_step": 189154, "epoch": 4503} {"train_loss": -7.141758918762207, "global_step": 189155, "epoch": 4503} {"train_loss": -7.214685916900635, "global_step": 189156, "epoch": 4503} {"train_loss": -7.149301528930664, "global_step": 189157, "epoch": 4503} {"train_loss": -7.2878098487854, "global_step": 189158, "epoch": 4503} {"train_loss": -7.240610599517822, "global_step": 189159, "epoch": 4503} {"train_loss": -7.2245988845825195, "global_step": 189160, "epoch": 4503} {"train_loss": -7.206974029541016, "global_step": 189161, "epoch": 4503} {"train_loss": -7.1850175857543945, "global_step": 189162, "epoch": 4503} {"train_loss": -7.304022789001465, "global_step": 189163, "epoch": 4503} {"train_loss": -7.1361494064331055, "global_step": 189164, "epoch": 4503} {"train_loss": -7.210403919219971, "global_step": 189165, "epoch": 4503} {"train_loss": -7.210567474365234, "global_step": 189166, "epoch": 4503} {"train_loss": -7.18083533786592, "global_step": 189167, "epoch": 4503, "val_loss": 69559.984375} {"train_loss": -7.202731609344482, "global_step": 189168, "epoch": 4504} {"train_loss": -7.192766189575195, "global_step": 189169, "epoch": 4504} {"train_loss": -7.171875953674316, "global_step": 189170, "epoch": 4504} {"train_loss": -7.1715240478515625, "global_step": 189171, "epoch": 4504} {"train_loss": -7.218267440795898, "global_step": 189172, "epoch": 4504} {"train_loss": -7.161625862121582, "global_step": 189173, "epoch": 4504} {"train_loss": -7.195193767547607, "global_step": 189174, "epoch": 4504} {"train_loss": -7.3141679763793945, "global_step": 189175, "epoch": 4504} {"train_loss": -7.0945353507995605, "global_step": 189176, "epoch": 4504} {"train_loss": -7.195313930511475, "global_step": 189177, "epoch": 4504} {"train_loss": -7.0842132568359375, "global_step": 189178, "epoch": 4504} {"train_loss": -7.060307502746582, "global_step": 189179, "epoch": 4504} {"train_loss": -7.236549377441406, "global_step": 189180, "epoch": 4504} {"train_loss": -6.997547626495361, "global_step": 189181, "epoch": 4504} {"train_loss": -7.226537227630615, "global_step": 189182, "epoch": 4504} {"train_loss": -7.095149040222168, "global_step": 189183, "epoch": 4504} {"train_loss": -7.109818935394287, "global_step": 189184, "epoch": 4504} {"train_loss": -7.1934123039245605, "global_step": 189185, "epoch": 4504} {"train_loss": -7.039088249206543, "global_step": 189186, "epoch": 4504} {"train_loss": -7.229674339294434, "global_step": 189187, "epoch": 4504} {"train_loss": -7.180632591247559, "global_step": 189188, "epoch": 4504} {"train_loss": -7.2068071365356445, "global_step": 189189, "epoch": 4504} {"train_loss": -7.191854000091553, "global_step": 189190, "epoch": 4504} {"train_loss": -7.109806060791016, "global_step": 189191, "epoch": 4504} {"train_loss": -7.212088108062744, "global_step": 189192, "epoch": 4504} {"train_loss": -7.193275451660156, "global_step": 189193, "epoch": 4504} {"train_loss": -7.133194923400879, "global_step": 189194, "epoch": 4504} {"train_loss": -7.086874008178711, "global_step": 189195, "epoch": 4504} {"train_loss": -7.198324203491211, "global_step": 189196, "epoch": 4504} {"train_loss": -7.143002510070801, "global_step": 189197, "epoch": 4504} {"train_loss": -7.012814044952393, "global_step": 189198, "epoch": 4504} {"train_loss": -7.150031566619873, "global_step": 189199, "epoch": 4504} {"train_loss": -7.140285968780518, "global_step": 189200, "epoch": 4504} {"train_loss": -7.182478427886963, "global_step": 189201, "epoch": 4504} {"train_loss": -7.137906074523926, "global_step": 189202, "epoch": 4504} {"train_loss": -7.231996536254883, "global_step": 189203, "epoch": 4504} {"train_loss": -7.105467796325684, "global_step": 189204, "epoch": 4504} {"train_loss": -7.117245197296143, "global_step": 189205, "epoch": 4504} {"train_loss": -7.160042762756348, "global_step": 189206, "epoch": 4504} {"train_loss": -7.060125350952148, "global_step": 189207, "epoch": 4504} {"train_loss": -7.076545715332031, "global_step": 189208, "epoch": 4504} {"train_loss": -7.154384476797921, "global_step": 189209, "epoch": 4504, "val_loss": 69729.5234375} {"train_loss": -7.168148994445801, "global_step": 189210, "epoch": 4505} {"train_loss": -7.100407600402832, "global_step": 189211, "epoch": 4505} {"train_loss": -7.180941581726074, "global_step": 189212, "epoch": 4505} {"train_loss": -7.223097801208496, "global_step": 189213, "epoch": 4505} {"train_loss": -7.196590423583984, "global_step": 189214, "epoch": 4505} {"train_loss": -7.180732727050781, "global_step": 189215, "epoch": 4505} {"train_loss": -7.151012420654297, "global_step": 189216, "epoch": 4505} {"train_loss": -7.147012710571289, "global_step": 189217, "epoch": 4505} {"train_loss": -7.1697797775268555, "global_step": 189218, "epoch": 4505} {"train_loss": -7.125217437744141, "global_step": 189219, "epoch": 4505} {"train_loss": -7.233731269836426, "global_step": 189220, "epoch": 4505} {"train_loss": -7.220642566680908, "global_step": 189221, "epoch": 4505} {"train_loss": -7.019996643066406, "global_step": 189222, "epoch": 4505} {"train_loss": -7.0947723388671875, "global_step": 189223, "epoch": 4505} {"train_loss": -7.116982460021973, "global_step": 189224, "epoch": 4505} {"train_loss": -7.087106227874756, "global_step": 189225, "epoch": 4505} {"train_loss": -7.188631057739258, "global_step": 189226, "epoch": 4505} {"train_loss": -7.059894561767578, "global_step": 189227, "epoch": 4505} {"train_loss": -7.177839279174805, "global_step": 189228, "epoch": 4505} {"train_loss": -7.106578826904297, "global_step": 189229, "epoch": 4505} {"train_loss": -7.084110260009766, "global_step": 189230, "epoch": 4505} {"train_loss": -7.162701606750488, "global_step": 189231, "epoch": 4505} {"train_loss": -7.190186500549316, "global_step": 189232, "epoch": 4505} {"train_loss": -7.173112869262695, "global_step": 189233, "epoch": 4505} {"train_loss": -7.126855850219727, "global_step": 189234, "epoch": 4505} {"train_loss": -7.128506660461426, "global_step": 189235, "epoch": 4505} {"train_loss": -7.147724151611328, "global_step": 189236, "epoch": 4505} {"train_loss": -7.076486587524414, "global_step": 189237, "epoch": 4505} {"train_loss": -7.029401779174805, "global_step": 189238, "epoch": 4505} {"train_loss": -7.179786682128906, "global_step": 189239, "epoch": 4505} {"train_loss": -7.1513471603393555, "global_step": 189240, "epoch": 4505} {"train_loss": -7.176348686218262, "global_step": 189241, "epoch": 4505} {"train_loss": -7.205717086791992, "global_step": 189242, "epoch": 4505} {"train_loss": -7.149639129638672, "global_step": 189243, "epoch": 4505} {"train_loss": -7.23686408996582, "global_step": 189244, "epoch": 4505} {"train_loss": -7.143185138702393, "global_step": 189245, "epoch": 4505} {"train_loss": -7.346083641052246, "global_step": 189246, "epoch": 4505} {"train_loss": -7.162900447845459, "global_step": 189247, "epoch": 4505} {"train_loss": -7.211366653442383, "global_step": 189248, "epoch": 4505} {"train_loss": -7.269382953643799, "global_step": 189249, "epoch": 4505} {"train_loss": -7.202931880950928, "global_step": 189250, "epoch": 4505} {"train_loss": -7.161074922198341, "global_step": 189251, "epoch": 4505, "val_loss": 69728.0} {"train_loss": -7.197854995727539, "global_step": 189252, "epoch": 4506} {"train_loss": -7.196448802947998, "global_step": 189253, "epoch": 4506} {"train_loss": -7.239152431488037, "global_step": 189254, "epoch": 4506} {"train_loss": -7.264649391174316, "global_step": 189255, "epoch": 4506} {"train_loss": -7.276477336883545, "global_step": 189256, "epoch": 4506} {"train_loss": -7.254156589508057, "global_step": 189257, "epoch": 4506} {"train_loss": -7.334773063659668, "global_step": 189258, "epoch": 4506} {"train_loss": -7.27677059173584, "global_step": 189259, "epoch": 4506} {"train_loss": -7.254012584686279, "global_step": 189260, "epoch": 4506} {"train_loss": -7.333493232727051, "global_step": 189261, "epoch": 4506} {"train_loss": -7.191908836364746, "global_step": 189262, "epoch": 4506} {"train_loss": -7.228361129760742, "global_step": 189263, "epoch": 4506} {"train_loss": -7.2701416015625, "global_step": 189264, "epoch": 4506} {"train_loss": -7.145813465118408, "global_step": 189265, "epoch": 4506} {"train_loss": -7.249251842498779, "global_step": 189266, "epoch": 4506} {"train_loss": -7.29701042175293, "global_step": 189267, "epoch": 4506} {"train_loss": -7.291911602020264, "global_step": 189268, "epoch": 4506} {"train_loss": -7.327681064605713, "global_step": 189269, "epoch": 4506} {"train_loss": -7.166584491729736, "global_step": 189270, "epoch": 4506} {"train_loss": -7.2041730880737305, "global_step": 189271, "epoch": 4506} {"train_loss": -7.062102317810059, "global_step": 189272, "epoch": 4506} {"train_loss": -7.153273105621338, "global_step": 189273, "epoch": 4506} {"train_loss": -7.254646301269531, "global_step": 189274, "epoch": 4506} {"train_loss": -7.176711082458496, "global_step": 189275, "epoch": 4506} {"train_loss": -7.130076885223389, "global_step": 189276, "epoch": 4506} {"train_loss": -7.25258731842041, "global_step": 189277, "epoch": 4506} {"train_loss": -7.1019182205200195, "global_step": 189278, "epoch": 4506} {"train_loss": -7.2510271072387695, "global_step": 189279, "epoch": 4506} {"train_loss": -7.322928428649902, "global_step": 189280, "epoch": 4506} {"train_loss": -7.14327335357666, "global_step": 189281, "epoch": 4506} {"train_loss": -7.145824432373047, "global_step": 189282, "epoch": 4506} {"train_loss": -7.150354385375977, "global_step": 189283, "epoch": 4506} {"train_loss": -7.240979194641113, "global_step": 189284, "epoch": 4506} {"train_loss": -7.254045486450195, "global_step": 189285, "epoch": 4506} {"train_loss": -7.284882545471191, "global_step": 189286, "epoch": 4506} {"train_loss": -7.190215110778809, "global_step": 189287, "epoch": 4506} {"train_loss": -7.100502967834473, "global_step": 189288, "epoch": 4506} {"train_loss": -7.218664169311523, "global_step": 189289, "epoch": 4506} {"train_loss": -7.152759552001953, "global_step": 189290, "epoch": 4506} {"train_loss": -7.171045780181885, "global_step": 189291, "epoch": 4506} {"train_loss": -7.249862194061279, "global_step": 189292, "epoch": 4506} {"train_loss": -7.220516352426438, "global_step": 189293, "epoch": 4506, "val_loss": 69751.6640625} {"train_loss": -7.261902809143066, "global_step": 189294, "epoch": 4507} {"train_loss": -7.175008773803711, "global_step": 189295, "epoch": 4507} {"train_loss": -7.210824489593506, "global_step": 189296, "epoch": 4507} {"train_loss": -7.238457202911377, "global_step": 189297, "epoch": 4507} {"train_loss": -7.253983497619629, "global_step": 189298, "epoch": 4507} {"train_loss": -7.1398515701293945, "global_step": 189299, "epoch": 4507} {"train_loss": -7.198577880859375, "global_step": 189300, "epoch": 4507} {"train_loss": -7.217182159423828, "global_step": 189301, "epoch": 4507} {"train_loss": -7.156768321990967, "global_step": 189302, "epoch": 4507} {"train_loss": -7.249247074127197, "global_step": 189303, "epoch": 4507} {"train_loss": -7.250389099121094, "global_step": 189304, "epoch": 4507} {"train_loss": -7.118807792663574, "global_step": 189305, "epoch": 4507} {"train_loss": -7.24818229675293, "global_step": 189306, "epoch": 4507} {"train_loss": -7.147758483886719, "global_step": 189307, "epoch": 4507} {"train_loss": -7.087480545043945, "global_step": 189308, "epoch": 4507} {"train_loss": -7.1596574783325195, "global_step": 189309, "epoch": 4507} {"train_loss": -7.202868938446045, "global_step": 189310, "epoch": 4507} {"train_loss": -7.066631317138672, "global_step": 189311, "epoch": 4507} {"train_loss": -7.017778396606445, "global_step": 189312, "epoch": 4507} {"train_loss": -7.131402015686035, "global_step": 189313, "epoch": 4507} {"train_loss": -7.188838481903076, "global_step": 189314, "epoch": 4507} {"train_loss": -7.1487226486206055, "global_step": 189315, "epoch": 4507} {"train_loss": -6.947197437286377, "global_step": 189316, "epoch": 4507} {"train_loss": -7.138801097869873, "global_step": 189317, "epoch": 4507} {"train_loss": -7.113503456115723, "global_step": 189318, "epoch": 4507} {"train_loss": -7.148799896240234, "global_step": 189319, "epoch": 4507} {"train_loss": -7.182720184326172, "global_step": 189320, "epoch": 4507} {"train_loss": -7.055825233459473, "global_step": 189321, "epoch": 4507} {"train_loss": -7.089145183563232, "global_step": 189322, "epoch": 4507} {"train_loss": -7.073078155517578, "global_step": 189323, "epoch": 4507} {"train_loss": -7.215986728668213, "global_step": 189324, "epoch": 4507} {"train_loss": -7.092637062072754, "global_step": 189325, "epoch": 4507} {"train_loss": -7.101733207702637, "global_step": 189326, "epoch": 4507} {"train_loss": -7.04904842376709, "global_step": 189327, "epoch": 4507} {"train_loss": -7.173251152038574, "global_step": 189328, "epoch": 4507} {"train_loss": -7.2514729499816895, "global_step": 189329, "epoch": 4507} {"train_loss": -7.242449760437012, "global_step": 189330, "epoch": 4507} {"train_loss": -7.096945762634277, "global_step": 189331, "epoch": 4507} {"train_loss": -7.116737365722656, "global_step": 189332, "epoch": 4507} {"train_loss": -7.166639804840088, "global_step": 189333, "epoch": 4507} {"train_loss": -7.147100448608398, "global_step": 189334, "epoch": 4507} {"train_loss": -7.153490021115258, "global_step": 189335, "epoch": 4507, "val_loss": 69437.359375} {"train_loss": -6.922544956207275, "global_step": 189336, "epoch": 4508} {"train_loss": -7.091855525970459, "global_step": 189337, "epoch": 4508} {"train_loss": -7.189617156982422, "global_step": 189338, "epoch": 4508} {"train_loss": -6.920084476470947, "global_step": 189339, "epoch": 4508} {"train_loss": -7.14871883392334, "global_step": 189340, "epoch": 4508} {"train_loss": -7.092573642730713, "global_step": 189341, "epoch": 4508} {"train_loss": -7.074023246765137, "global_step": 189342, "epoch": 4508} {"train_loss": -7.032967567443848, "global_step": 189343, "epoch": 4508} {"train_loss": -7.177252769470215, "global_step": 189344, "epoch": 4508} {"train_loss": -7.020529747009277, "global_step": 189345, "epoch": 4508} {"train_loss": -7.005928039550781, "global_step": 189346, "epoch": 4508} {"train_loss": -7.298296928405762, "global_step": 189347, "epoch": 4508} {"train_loss": -7.157675743103027, "global_step": 189348, "epoch": 4508} {"train_loss": -7.195533275604248, "global_step": 189349, "epoch": 4508} {"train_loss": -7.170835494995117, "global_step": 189350, "epoch": 4508} {"train_loss": -7.240133285522461, "global_step": 189351, "epoch": 4508} {"train_loss": -7.086642265319824, "global_step": 189352, "epoch": 4508} {"train_loss": -7.1937255859375, "global_step": 189353, "epoch": 4508} {"train_loss": -7.187333583831787, "global_step": 189354, "epoch": 4508} {"train_loss": -7.11607027053833, "global_step": 189355, "epoch": 4508} {"train_loss": -7.123973369598389, "global_step": 189356, "epoch": 4508} {"train_loss": -7.134505271911621, "global_step": 189357, "epoch": 4508} {"train_loss": -7.187489032745361, "global_step": 189358, "epoch": 4508} {"train_loss": -7.263555526733398, "global_step": 189359, "epoch": 4508} {"train_loss": -7.049093246459961, "global_step": 189360, "epoch": 4508} {"train_loss": -7.2181172370910645, "global_step": 189361, "epoch": 4508} {"train_loss": -7.165440559387207, "global_step": 189362, "epoch": 4508} {"train_loss": -7.147869110107422, "global_step": 189363, "epoch": 4508} {"train_loss": -7.245248794555664, "global_step": 189364, "epoch": 4508} {"train_loss": -7.131698131561279, "global_step": 189365, "epoch": 4508} {"train_loss": -7.240414142608643, "global_step": 189366, "epoch": 4508} {"train_loss": -7.155390739440918, "global_step": 189367, "epoch": 4508} {"train_loss": -7.109534740447998, "global_step": 189368, "epoch": 4508} {"train_loss": -7.128499984741211, "global_step": 189369, "epoch": 4508} {"train_loss": -7.112110137939453, "global_step": 189370, "epoch": 4508} {"train_loss": -7.137163162231445, "global_step": 189371, "epoch": 4508} {"train_loss": -7.271336078643799, "global_step": 189372, "epoch": 4508} {"train_loss": -7.013922214508057, "global_step": 189373, "epoch": 4508} {"train_loss": -6.995664596557617, "global_step": 189374, "epoch": 4508} {"train_loss": -7.196951866149902, "global_step": 189375, "epoch": 4508} {"train_loss": -6.907080173492432, "global_step": 189376, "epoch": 4508} {"train_loss": -7.126295225960868, "global_step": 189377, "epoch": 4508, "val_loss": 69497.8828125} {"train_loss": -6.985589027404785, "global_step": 189378, "epoch": 4509} {"train_loss": -6.904060363769531, "global_step": 189379, "epoch": 4509} {"train_loss": -7.152175426483154, "global_step": 189380, "epoch": 4509} {"train_loss": -7.028141975402832, "global_step": 189381, "epoch": 4509} {"train_loss": -7.249440670013428, "global_step": 189382, "epoch": 4509} {"train_loss": -7.11344051361084, "global_step": 189383, "epoch": 4509} {"train_loss": -7.155726432800293, "global_step": 189384, "epoch": 4509} {"train_loss": -7.185278415679932, "global_step": 189385, "epoch": 4509} {"train_loss": -7.079320907592773, "global_step": 189386, "epoch": 4509} {"train_loss": -7.115976333618164, "global_step": 189387, "epoch": 4509} {"train_loss": -7.148209571838379, "global_step": 189388, "epoch": 4509} {"train_loss": -7.107531547546387, "global_step": 189389, "epoch": 4509} {"train_loss": -7.159811019897461, "global_step": 189390, "epoch": 4509} {"train_loss": -7.188575267791748, "global_step": 189391, "epoch": 4509} {"train_loss": -7.173990726470947, "global_step": 189392, "epoch": 4509} {"train_loss": -7.179811954498291, "global_step": 189393, "epoch": 4509} {"train_loss": -7.214270114898682, "global_step": 189394, "epoch": 4509} {"train_loss": -7.11635684967041, "global_step": 189395, "epoch": 4509} {"train_loss": -7.116461753845215, "global_step": 189396, "epoch": 4509} {"train_loss": -7.059627532958984, "global_step": 189397, "epoch": 4509} {"train_loss": -7.135707855224609, "global_step": 189398, "epoch": 4509} {"train_loss": -7.122894287109375, "global_step": 189399, "epoch": 4509} {"train_loss": -7.107300281524658, "global_step": 189400, "epoch": 4509} {"train_loss": -7.157317638397217, "global_step": 189401, "epoch": 4509} {"train_loss": -7.0495195388793945, "global_step": 189402, "epoch": 4509} {"train_loss": -7.045676231384277, "global_step": 189403, "epoch": 4509} {"train_loss": -7.123045444488525, "global_step": 189404, "epoch": 4509} {"train_loss": -7.151368141174316, "global_step": 189405, "epoch": 4509} {"train_loss": -7.126161575317383, "global_step": 189406, "epoch": 4509} {"train_loss": -7.050907611846924, "global_step": 189407, "epoch": 4509} {"train_loss": -7.062733173370361, "global_step": 189408, "epoch": 4509} {"train_loss": -7.014298439025879, "global_step": 189409, "epoch": 4509} {"train_loss": -7.137035369873047, "global_step": 189410, "epoch": 4509} {"train_loss": -7.124167442321777, "global_step": 189411, "epoch": 4509} {"train_loss": -7.14411735534668, "global_step": 189412, "epoch": 4509} {"train_loss": -7.16497802734375, "global_step": 189413, "epoch": 4509} {"train_loss": -7.19774055480957, "global_step": 189414, "epoch": 4509} {"train_loss": -7.275704860687256, "global_step": 189415, "epoch": 4509} {"train_loss": -7.306573867797852, "global_step": 189416, "epoch": 4509} {"train_loss": -7.209256649017334, "global_step": 189417, "epoch": 4509} {"train_loss": -7.297139644622803, "global_step": 189418, "epoch": 4509} {"train_loss": -7.133941116787138, "global_step": 189419, "epoch": 4509, "val_loss": 69464.1875} {"train_loss": -7.257448196411133, "global_step": 189420, "epoch": 4510} {"train_loss": -7.241982460021973, "global_step": 189421, "epoch": 4510} {"train_loss": -7.293729782104492, "global_step": 189422, "epoch": 4510} {"train_loss": -7.232610702514648, "global_step": 189423, "epoch": 4510} {"train_loss": -7.195532321929932, "global_step": 189424, "epoch": 4510} {"train_loss": -7.300898551940918, "global_step": 189425, "epoch": 4510} {"train_loss": -7.138951301574707, "global_step": 189426, "epoch": 4510} {"train_loss": -7.166479110717773, "global_step": 189427, "epoch": 4510} {"train_loss": -7.216250419616699, "global_step": 189428, "epoch": 4510} {"train_loss": -7.292052268981934, "global_step": 189429, "epoch": 4510} {"train_loss": -7.247279644012451, "global_step": 189430, "epoch": 4510} {"train_loss": -7.205887794494629, "global_step": 189431, "epoch": 4510} {"train_loss": -7.2458906173706055, "global_step": 189432, "epoch": 4510} {"train_loss": -7.201231002807617, "global_step": 189433, "epoch": 4510} {"train_loss": -7.149416923522949, "global_step": 189434, "epoch": 4510} {"train_loss": -7.216191291809082, "global_step": 189435, "epoch": 4510} {"train_loss": -7.292232036590576, "global_step": 189436, "epoch": 4510} {"train_loss": -7.079343795776367, "global_step": 189437, "epoch": 4510} {"train_loss": -7.11201286315918, "global_step": 189438, "epoch": 4510} {"train_loss": -7.269809722900391, "global_step": 189439, "epoch": 4510} {"train_loss": -7.186110496520996, "global_step": 189440, "epoch": 4510} {"train_loss": -7.149165630340576, "global_step": 189441, "epoch": 4510} {"train_loss": -7.109952926635742, "global_step": 189442, "epoch": 4510} {"train_loss": -7.172921180725098, "global_step": 189443, "epoch": 4510} {"train_loss": -7.08039665222168, "global_step": 189444, "epoch": 4510} {"train_loss": -7.055577278137207, "global_step": 189445, "epoch": 4510} {"train_loss": -7.0903472900390625, "global_step": 189446, "epoch": 4510} {"train_loss": -7.207846164703369, "global_step": 189447, "epoch": 4510} {"train_loss": -6.986579895019531, "global_step": 189448, "epoch": 4510} {"train_loss": -7.225647449493408, "global_step": 189449, "epoch": 4510} {"train_loss": -7.181149959564209, "global_step": 189450, "epoch": 4510} {"train_loss": -7.118634223937988, "global_step": 189451, "epoch": 4510} {"train_loss": -7.2557291984558105, "global_step": 189452, "epoch": 4510} {"train_loss": -7.167383193969727, "global_step": 189453, "epoch": 4510} {"train_loss": -7.120317459106445, "global_step": 189454, "epoch": 4510} {"train_loss": -7.137857437133789, "global_step": 189455, "epoch": 4510} {"train_loss": -7.071020126342773, "global_step": 189456, "epoch": 4510} {"train_loss": -7.0883684158325195, "global_step": 189457, "epoch": 4510} {"train_loss": -7.106733322143555, "global_step": 189458, "epoch": 4510} {"train_loss": -7.075903415679932, "global_step": 189459, "epoch": 4510} {"train_loss": -7.052804946899414, "global_step": 189460, "epoch": 4510} {"train_loss": -7.167067891075497, "global_step": 189461, "epoch": 4510, "val_loss": 69685.1484375} {"train_loss": -7.037406921386719, "global_step": 189462, "epoch": 4511} {"train_loss": -7.103861331939697, "global_step": 189463, "epoch": 4511} {"train_loss": -6.979146957397461, "global_step": 189464, "epoch": 4511} {"train_loss": -7.125517845153809, "global_step": 189465, "epoch": 4511} {"train_loss": -7.231902122497559, "global_step": 189466, "epoch": 4511} {"train_loss": -7.125014781951904, "global_step": 189467, "epoch": 4511} {"train_loss": -7.243630409240723, "global_step": 189468, "epoch": 4511} {"train_loss": -7.115025043487549, "global_step": 189469, "epoch": 4511} {"train_loss": -7.056343078613281, "global_step": 189470, "epoch": 4511} {"train_loss": -7.239029884338379, "global_step": 189471, "epoch": 4511} {"train_loss": -7.062614917755127, "global_step": 189472, "epoch": 4511} {"train_loss": -7.180447578430176, "global_step": 189473, "epoch": 4511} {"train_loss": -7.164473056793213, "global_step": 189474, "epoch": 4511} {"train_loss": -7.148441314697266, "global_step": 189475, "epoch": 4511} {"train_loss": -7.193582534790039, "global_step": 189476, "epoch": 4511} {"train_loss": -7.178420543670654, "global_step": 189477, "epoch": 4511} {"train_loss": -7.169172286987305, "global_step": 189478, "epoch": 4511} {"train_loss": -7.186086654663086, "global_step": 189479, "epoch": 4511} {"train_loss": -7.208993434906006, "global_step": 189480, "epoch": 4511} {"train_loss": -7.127348899841309, "global_step": 189481, "epoch": 4511} {"train_loss": -7.19183349609375, "global_step": 189482, "epoch": 4511} {"train_loss": -7.184322357177734, "global_step": 189483, "epoch": 4511} {"train_loss": -7.223496913909912, "global_step": 189484, "epoch": 4511} {"train_loss": -7.259334564208984, "global_step": 189485, "epoch": 4511} {"train_loss": -7.221168518066406, "global_step": 189486, "epoch": 4511} {"train_loss": -7.271570682525635, "global_step": 189487, "epoch": 4511} {"train_loss": -7.245999336242676, "global_step": 189488, "epoch": 4511} {"train_loss": -7.254853248596191, "global_step": 189489, "epoch": 4511} {"train_loss": -7.1742353439331055, "global_step": 189490, "epoch": 4511} {"train_loss": -7.256834030151367, "global_step": 189491, "epoch": 4511} {"train_loss": -7.216402053833008, "global_step": 189492, "epoch": 4511} {"train_loss": -7.261330604553223, "global_step": 189493, "epoch": 4511} {"train_loss": -7.203189849853516, "global_step": 189494, "epoch": 4511} {"train_loss": -7.251394271850586, "global_step": 189495, "epoch": 4511} {"train_loss": -7.267936706542969, "global_step": 189496, "epoch": 4511} {"train_loss": -7.151301860809326, "global_step": 189497, "epoch": 4511} {"train_loss": -7.200747489929199, "global_step": 189498, "epoch": 4511} {"train_loss": -7.224517822265625, "global_step": 189499, "epoch": 4511} {"train_loss": -7.377328872680664, "global_step": 189500, "epoch": 4511} {"train_loss": -7.229987621307373, "global_step": 189501, "epoch": 4511} {"train_loss": -7.138933181762695, "global_step": 189502, "epoch": 4511} {"train_loss": -7.186267058054606, "global_step": 189503, "epoch": 4511, "val_loss": 69478.1796875} {"train_loss": -7.24800968170166, "global_step": 189504, "epoch": 4512} {"train_loss": -7.31806755065918, "global_step": 189505, "epoch": 4512} {"train_loss": -7.3294782638549805, "global_step": 189506, "epoch": 4512} {"train_loss": -7.314144134521484, "global_step": 189507, "epoch": 4512} {"train_loss": -7.285755157470703, "global_step": 189508, "epoch": 4512} {"train_loss": -7.299163341522217, "global_step": 189509, "epoch": 4512} {"train_loss": -7.253025531768799, "global_step": 189510, "epoch": 4512} {"train_loss": -7.304644584655762, "global_step": 189511, "epoch": 4512} {"train_loss": -7.236593246459961, "global_step": 189512, "epoch": 4512} {"train_loss": -7.286920070648193, "global_step": 189513, "epoch": 4512} {"train_loss": -7.166478157043457, "global_step": 189514, "epoch": 4512} {"train_loss": -7.236005783081055, "global_step": 189515, "epoch": 4512} {"train_loss": -7.120333671569824, "global_step": 189516, "epoch": 4512} {"train_loss": -7.101535797119141, "global_step": 189517, "epoch": 4512} {"train_loss": -7.109879493713379, "global_step": 189518, "epoch": 4512} {"train_loss": -7.105892181396484, "global_step": 189519, "epoch": 4512} {"train_loss": -6.9967041015625, "global_step": 189520, "epoch": 4512} {"train_loss": -7.028637886047363, "global_step": 189521, "epoch": 4512} {"train_loss": -7.147601127624512, "global_step": 189522, "epoch": 4512} {"train_loss": -7.190951347351074, "global_step": 189523, "epoch": 4512} {"train_loss": -7.120443344116211, "global_step": 189524, "epoch": 4512} {"train_loss": -7.094727993011475, "global_step": 189525, "epoch": 4512} {"train_loss": -7.182328224182129, "global_step": 189526, "epoch": 4512} {"train_loss": -7.14154052734375, "global_step": 189527, "epoch": 4512} {"train_loss": -7.090631008148193, "global_step": 189528, "epoch": 4512} {"train_loss": -7.1542558670043945, "global_step": 189529, "epoch": 4512} {"train_loss": -7.173760414123535, "global_step": 189530, "epoch": 4512} {"train_loss": -7.159549713134766, "global_step": 189531, "epoch": 4512} {"train_loss": -7.124084949493408, "global_step": 189532, "epoch": 4512} {"train_loss": -7.179683208465576, "global_step": 189533, "epoch": 4512} {"train_loss": -7.18493127822876, "global_step": 189534, "epoch": 4512} {"train_loss": -6.961015701293945, "global_step": 189535, "epoch": 4512} {"train_loss": -7.193085670471191, "global_step": 189536, "epoch": 4512} {"train_loss": -7.158635139465332, "global_step": 189537, "epoch": 4512} {"train_loss": -7.250788688659668, "global_step": 189538, "epoch": 4512} {"train_loss": -7.251848220825195, "global_step": 189539, "epoch": 4512} {"train_loss": -7.141773223876953, "global_step": 189540, "epoch": 4512} {"train_loss": -7.214568614959717, "global_step": 189541, "epoch": 4512} {"train_loss": -7.080530166625977, "global_step": 189542, "epoch": 4512} {"train_loss": -7.134888648986816, "global_step": 189543, "epoch": 4512} {"train_loss": -7.151745796203613, "global_step": 189544, "epoch": 4512} {"train_loss": -7.176260335104806, "global_step": 189545, "epoch": 4512, "val_loss": 69349.609375} {"train_loss": -7.299189567565918, "global_step": 189546, "epoch": 4513} {"train_loss": -7.1045684814453125, "global_step": 189547, "epoch": 4513} {"train_loss": -7.124410629272461, "global_step": 189548, "epoch": 4513} {"train_loss": -7.178937911987305, "global_step": 189549, "epoch": 4513} {"train_loss": -7.192403793334961, "global_step": 189550, "epoch": 4513} {"train_loss": -7.239439964294434, "global_step": 189551, "epoch": 4513} {"train_loss": -7.195415019989014, "global_step": 189552, "epoch": 4513} {"train_loss": -7.210749626159668, "global_step": 189553, "epoch": 4513} {"train_loss": -7.129270076751709, "global_step": 189554, "epoch": 4513} {"train_loss": -7.195825576782227, "global_step": 189555, "epoch": 4513} {"train_loss": -7.194210052490234, "global_step": 189556, "epoch": 4513} {"train_loss": -7.200648784637451, "global_step": 189557, "epoch": 4513} {"train_loss": -7.186183929443359, "global_step": 189558, "epoch": 4513} {"train_loss": -7.161772727966309, "global_step": 189559, "epoch": 4513} {"train_loss": -7.125288963317871, "global_step": 189560, "epoch": 4513} {"train_loss": -7.23689079284668, "global_step": 189561, "epoch": 4513} {"train_loss": -7.085053443908691, "global_step": 189562, "epoch": 4513} {"train_loss": -7.233819961547852, "global_step": 189563, "epoch": 4513} {"train_loss": -7.276121139526367, "global_step": 189564, "epoch": 4513} {"train_loss": -7.181947231292725, "global_step": 189565, "epoch": 4513} {"train_loss": -7.123589515686035, "global_step": 189566, "epoch": 4513} {"train_loss": -7.052165985107422, "global_step": 189567, "epoch": 4513} {"train_loss": -7.251721382141113, "global_step": 189568, "epoch": 4513} {"train_loss": -7.055828094482422, "global_step": 189569, "epoch": 4513} {"train_loss": -7.0687994956970215, "global_step": 189570, "epoch": 4513} {"train_loss": -7.102943420410156, "global_step": 189571, "epoch": 4513} {"train_loss": -7.146376132965088, "global_step": 189572, "epoch": 4513} {"train_loss": -7.127737998962402, "global_step": 189573, "epoch": 4513} {"train_loss": -7.160029888153076, "global_step": 189574, "epoch": 4513} {"train_loss": -7.141104698181152, "global_step": 189575, "epoch": 4513} {"train_loss": -7.107104778289795, "global_step": 189576, "epoch": 4513} {"train_loss": -7.040205955505371, "global_step": 189577, "epoch": 4513} {"train_loss": -7.019619941711426, "global_step": 189578, "epoch": 4513} {"train_loss": -6.995810508728027, "global_step": 189579, "epoch": 4513} {"train_loss": -6.98585319519043, "global_step": 189580, "epoch": 4513} {"train_loss": -7.154623985290527, "global_step": 189581, "epoch": 4513} {"train_loss": -6.920190811157227, "global_step": 189582, "epoch": 4513} {"train_loss": -7.11478853225708, "global_step": 189583, "epoch": 4513} {"train_loss": -6.982782363891602, "global_step": 189584, "epoch": 4513} {"train_loss": -6.951565742492676, "global_step": 189585, "epoch": 4513} {"train_loss": -7.101856231689453, "global_step": 189586, "epoch": 4513} {"train_loss": -7.1245612644013905, "global_step": 189587, "epoch": 4513, "val_loss": 69645.3359375} {"train_loss": -7.224353790283203, "global_step": 189588, "epoch": 4514} {"train_loss": -7.050884246826172, "global_step": 189589, "epoch": 4514} {"train_loss": -7.120527267456055, "global_step": 189590, "epoch": 4514} {"train_loss": -7.107419967651367, "global_step": 189591, "epoch": 4514} {"train_loss": -7.160401344299316, "global_step": 189592, "epoch": 4514} {"train_loss": -7.104076385498047, "global_step": 189593, "epoch": 4514} {"train_loss": -7.179855823516846, "global_step": 189594, "epoch": 4514} {"train_loss": -7.155982971191406, "global_step": 189595, "epoch": 4514} {"train_loss": -7.1767730712890625, "global_step": 189596, "epoch": 4514} {"train_loss": -7.049581050872803, "global_step": 189597, "epoch": 4514} {"train_loss": -7.236195087432861, "global_step": 189598, "epoch": 4514} {"train_loss": -7.126923561096191, "global_step": 189599, "epoch": 4514} {"train_loss": -7.184199333190918, "global_step": 189600, "epoch": 4514} {"train_loss": -7.189340591430664, "global_step": 189601, "epoch": 4514} {"train_loss": -7.204808712005615, "global_step": 189602, "epoch": 4514} {"train_loss": -7.227452278137207, "global_step": 189603, "epoch": 4514} {"train_loss": -7.24316930770874, "global_step": 189604, "epoch": 4514} {"train_loss": -7.1556243896484375, "global_step": 189605, "epoch": 4514} {"train_loss": -7.149216651916504, "global_step": 189606, "epoch": 4514} {"train_loss": -7.216279029846191, "global_step": 189607, "epoch": 4514} {"train_loss": -7.163787841796875, "global_step": 189608, "epoch": 4514} {"train_loss": -7.271489143371582, "global_step": 189609, "epoch": 4514} {"train_loss": -7.142350673675537, "global_step": 189610, "epoch": 4514} {"train_loss": -7.1446051597595215, "global_step": 189611, "epoch": 4514} {"train_loss": -7.110801696777344, "global_step": 189612, "epoch": 4514} {"train_loss": -7.2029595375061035, "global_step": 189613, "epoch": 4514} {"train_loss": -7.152956008911133, "global_step": 189614, "epoch": 4514} {"train_loss": -7.2109456062316895, "global_step": 189615, "epoch": 4514} {"train_loss": -7.089463233947754, "global_step": 189616, "epoch": 4514} {"train_loss": -7.224663734436035, "global_step": 189617, "epoch": 4514} {"train_loss": -7.235231399536133, "global_step": 189618, "epoch": 4514} {"train_loss": -7.191324710845947, "global_step": 189619, "epoch": 4514} {"train_loss": -7.235273838043213, "global_step": 189620, "epoch": 4514} {"train_loss": -7.114758014678955, "global_step": 189621, "epoch": 4514} {"train_loss": -7.267655849456787, "global_step": 189622, "epoch": 4514} {"train_loss": -7.098502159118652, "global_step": 189623, "epoch": 4514} {"train_loss": -7.079358100891113, "global_step": 189624, "epoch": 4514} {"train_loss": -7.203256607055664, "global_step": 189625, "epoch": 4514} {"train_loss": -7.134274482727051, "global_step": 189626, "epoch": 4514} {"train_loss": -7.162703990936279, "global_step": 189627, "epoch": 4514} {"train_loss": -7.100604057312012, "global_step": 189628, "epoch": 4514} {"train_loss": -7.165798107783, "global_step": 189629, "epoch": 4514, "val_loss": 69559.21875} {"train_loss": -7.223627090454102, "global_step": 189630, "epoch": 4515} {"train_loss": -7.221306800842285, "global_step": 189631, "epoch": 4515} {"train_loss": -7.148823261260986, "global_step": 189632, "epoch": 4515} {"train_loss": -7.2272725105285645, "global_step": 189633, "epoch": 4515} {"train_loss": -6.984689235687256, "global_step": 189634, "epoch": 4515} {"train_loss": -7.127682209014893, "global_step": 189635, "epoch": 4515} {"train_loss": -7.229269504547119, "global_step": 189636, "epoch": 4515} {"train_loss": -7.161840915679932, "global_step": 189637, "epoch": 4515} {"train_loss": -6.977619171142578, "global_step": 189638, "epoch": 4515} {"train_loss": -7.244283676147461, "global_step": 189639, "epoch": 4515} {"train_loss": -7.0673651695251465, "global_step": 189640, "epoch": 4515} {"train_loss": -7.248985290527344, "global_step": 189641, "epoch": 4515} {"train_loss": -7.079809188842773, "global_step": 189642, "epoch": 4515} {"train_loss": -7.162981033325195, "global_step": 189643, "epoch": 4515} {"train_loss": -7.248507499694824, "global_step": 189644, "epoch": 4515} {"train_loss": -7.180807590484619, "global_step": 189645, "epoch": 4515} {"train_loss": -7.2411580085754395, "global_step": 189646, "epoch": 4515} {"train_loss": -7.136031150817871, "global_step": 189647, "epoch": 4515} {"train_loss": -7.161470413208008, "global_step": 189648, "epoch": 4515} {"train_loss": -7.232947826385498, "global_step": 189649, "epoch": 4515} {"train_loss": -7.187869071960449, "global_step": 189650, "epoch": 4515} {"train_loss": -7.154967784881592, "global_step": 189651, "epoch": 4515} {"train_loss": -7.226656913757324, "global_step": 189652, "epoch": 4515} {"train_loss": -7.184412002563477, "global_step": 189653, "epoch": 4515} {"train_loss": -7.354398727416992, "global_step": 189654, "epoch": 4515} {"train_loss": -7.227112770080566, "global_step": 189655, "epoch": 4515} {"train_loss": -7.16953706741333, "global_step": 189656, "epoch": 4515} {"train_loss": -7.216565132141113, "global_step": 189657, "epoch": 4515} {"train_loss": -7.170137405395508, "global_step": 189658, "epoch": 4515} {"train_loss": -7.330385208129883, "global_step": 189659, "epoch": 4515} {"train_loss": -7.203110694885254, "global_step": 189660, "epoch": 4515} {"train_loss": -7.283749580383301, "global_step": 189661, "epoch": 4515} {"train_loss": -7.168513298034668, "global_step": 189662, "epoch": 4515} {"train_loss": -7.308542251586914, "global_step": 189663, "epoch": 4515} {"train_loss": -7.215341091156006, "global_step": 189664, "epoch": 4515} {"train_loss": -7.239150047302246, "global_step": 189665, "epoch": 4515} {"train_loss": -7.100651264190674, "global_step": 189666, "epoch": 4515} {"train_loss": -7.228542327880859, "global_step": 189667, "epoch": 4515} {"train_loss": -7.186274528503418, "global_step": 189668, "epoch": 4515} {"train_loss": -7.148678779602051, "global_step": 189669, "epoch": 4515} {"train_loss": -7.242739677429199, "global_step": 189670, "epoch": 4515} {"train_loss": -7.192060777119228, "global_step": 189671, "epoch": 4515, "val_loss": 69503.125} {"train_loss": -7.211474418640137, "global_step": 189672, "epoch": 4516} {"train_loss": -7.382941246032715, "global_step": 189673, "epoch": 4516} {"train_loss": -7.252530574798584, "global_step": 189674, "epoch": 4516} {"train_loss": -7.188490867614746, "global_step": 189675, "epoch": 4516} {"train_loss": -7.147014617919922, "global_step": 189676, "epoch": 4516} {"train_loss": -7.235426902770996, "global_step": 189677, "epoch": 4516} {"train_loss": -7.19262170791626, "global_step": 189678, "epoch": 4516} {"train_loss": -7.269009590148926, "global_step": 189679, "epoch": 4516} {"train_loss": -7.124096393585205, "global_step": 189680, "epoch": 4516} {"train_loss": -7.20026969909668, "global_step": 189681, "epoch": 4516} {"train_loss": -7.239616394042969, "global_step": 189682, "epoch": 4516} {"train_loss": -7.251490116119385, "global_step": 189683, "epoch": 4516} {"train_loss": -7.231385231018066, "global_step": 189684, "epoch": 4516} {"train_loss": -7.19265079498291, "global_step": 189685, "epoch": 4516} {"train_loss": -7.218178749084473, "global_step": 189686, "epoch": 4516} {"train_loss": -7.377900123596191, "global_step": 189687, "epoch": 4516} {"train_loss": -7.262051105499268, "global_step": 189688, "epoch": 4516} {"train_loss": -7.199067115783691, "global_step": 189689, "epoch": 4516} {"train_loss": -7.246123790740967, "global_step": 189690, "epoch": 4516} {"train_loss": -7.206856727600098, "global_step": 189691, "epoch": 4516} {"train_loss": -7.354608535766602, "global_step": 189692, "epoch": 4516} {"train_loss": -7.184021949768066, "global_step": 189693, "epoch": 4516} {"train_loss": -7.268852710723877, "global_step": 189694, "epoch": 4516} {"train_loss": -7.2433366775512695, "global_step": 189695, "epoch": 4516} {"train_loss": -7.217636585235596, "global_step": 189696, "epoch": 4516} {"train_loss": -7.211688995361328, "global_step": 189697, "epoch": 4516} {"train_loss": -7.315615653991699, "global_step": 189698, "epoch": 4516} {"train_loss": -7.2739152908325195, "global_step": 189699, "epoch": 4516} {"train_loss": -7.222570419311523, "global_step": 189700, "epoch": 4516} {"train_loss": -7.270495891571045, "global_step": 189701, "epoch": 4516} {"train_loss": -7.125833511352539, "global_step": 189702, "epoch": 4516} {"train_loss": -7.0946760177612305, "global_step": 189703, "epoch": 4516} {"train_loss": -7.003701210021973, "global_step": 189704, "epoch": 4516} {"train_loss": -7.2707109451293945, "global_step": 189705, "epoch": 4516} {"train_loss": -7.300413131713867, "global_step": 189706, "epoch": 4516} {"train_loss": -7.220706939697266, "global_step": 189707, "epoch": 4516} {"train_loss": -7.1712470054626465, "global_step": 189708, "epoch": 4516} {"train_loss": -7.2151079177856445, "global_step": 189709, "epoch": 4516} {"train_loss": -6.854295253753662, "global_step": 189710, "epoch": 4516} {"train_loss": -7.131767272949219, "global_step": 189711, "epoch": 4516} {"train_loss": -7.129518985748291, "global_step": 189712, "epoch": 4516} {"train_loss": -7.2134433927990145, "global_step": 189713, "epoch": 4516, "val_loss": 69358.609375} {"train_loss": -7.03279447555542, "global_step": 189714, "epoch": 4517} {"train_loss": -7.200795650482178, "global_step": 189715, "epoch": 4517} {"train_loss": -7.225442886352539, "global_step": 189716, "epoch": 4517} {"train_loss": -7.0547895431518555, "global_step": 189717, "epoch": 4517} {"train_loss": -7.174488067626953, "global_step": 189718, "epoch": 4517} {"train_loss": -7.209158897399902, "global_step": 189719, "epoch": 4517} {"train_loss": -7.035077095031738, "global_step": 189720, "epoch": 4517} {"train_loss": -7.114461898803711, "global_step": 189721, "epoch": 4517} {"train_loss": -7.131348133087158, "global_step": 189722, "epoch": 4517} {"train_loss": -6.925806522369385, "global_step": 189723, "epoch": 4517} {"train_loss": -7.132160186767578, "global_step": 189724, "epoch": 4517} {"train_loss": -6.977756500244141, "global_step": 189725, "epoch": 4517} {"train_loss": -7.219634056091309, "global_step": 189726, "epoch": 4517} {"train_loss": -7.053051471710205, "global_step": 189727, "epoch": 4517} {"train_loss": -7.163638591766357, "global_step": 189728, "epoch": 4517} {"train_loss": -7.122855186462402, "global_step": 189729, "epoch": 4517} {"train_loss": -7.066366195678711, "global_step": 189730, "epoch": 4517} {"train_loss": -7.112203598022461, "global_step": 189731, "epoch": 4517} {"train_loss": -7.131718635559082, "global_step": 189732, "epoch": 4517} {"train_loss": -7.080744743347168, "global_step": 189733, "epoch": 4517} {"train_loss": -7.146446704864502, "global_step": 189734, "epoch": 4517} {"train_loss": -7.289051055908203, "global_step": 189735, "epoch": 4517} {"train_loss": -7.099308013916016, "global_step": 189736, "epoch": 4517} {"train_loss": -6.974575042724609, "global_step": 189737, "epoch": 4517} {"train_loss": -7.197169303894043, "global_step": 189738, "epoch": 4517} {"train_loss": -7.024062156677246, "global_step": 189739, "epoch": 4517} {"train_loss": -7.146982192993164, "global_step": 189740, "epoch": 4517} {"train_loss": -7.198312282562256, "global_step": 189741, "epoch": 4517} {"train_loss": -7.096011161804199, "global_step": 189742, "epoch": 4517} {"train_loss": -7.144597053527832, "global_step": 189743, "epoch": 4517} {"train_loss": -7.210602760314941, "global_step": 189744, "epoch": 4517} {"train_loss": -7.1441144943237305, "global_step": 189745, "epoch": 4517} {"train_loss": -7.1751484870910645, "global_step": 189746, "epoch": 4517} {"train_loss": -7.020018577575684, "global_step": 189747, "epoch": 4517} {"train_loss": -7.114246368408203, "global_step": 189748, "epoch": 4517} {"train_loss": -7.151275157928467, "global_step": 189749, "epoch": 4517} {"train_loss": -7.009308338165283, "global_step": 189750, "epoch": 4517} {"train_loss": -7.157646179199219, "global_step": 189751, "epoch": 4517} {"train_loss": -7.253146171569824, "global_step": 189752, "epoch": 4517} {"train_loss": -7.158631801605225, "global_step": 189753, "epoch": 4517} {"train_loss": -7.245205402374268, "global_step": 189754, "epoch": 4517} {"train_loss": -7.126820223672049, "global_step": 189755, "epoch": 4517, "val_loss": 69807.046875} {"train_loss": -7.1284403800964355, "global_step": 189756, "epoch": 4518} {"train_loss": -7.15194034576416, "global_step": 189757, "epoch": 4518} {"train_loss": -7.102906227111816, "global_step": 189758, "epoch": 4518} {"train_loss": -6.965274810791016, "global_step": 189759, "epoch": 4518} {"train_loss": -7.262730598449707, "global_step": 189760, "epoch": 4518} {"train_loss": -7.2094035148620605, "global_step": 189761, "epoch": 4518} {"train_loss": -7.102756500244141, "global_step": 189762, "epoch": 4518} {"train_loss": -7.246685028076172, "global_step": 189763, "epoch": 4518} {"train_loss": -7.200606346130371, "global_step": 189764, "epoch": 4518} {"train_loss": -7.174274444580078, "global_step": 189765, "epoch": 4518} {"train_loss": -7.223546028137207, "global_step": 189766, "epoch": 4518} {"train_loss": -7.232813835144043, "global_step": 189767, "epoch": 4518} {"train_loss": -7.211542129516602, "global_step": 189768, "epoch": 4518} {"train_loss": -7.202925682067871, "global_step": 189769, "epoch": 4518} {"train_loss": -7.107435703277588, "global_step": 189770, "epoch": 4518} {"train_loss": -7.080165863037109, "global_step": 189771, "epoch": 4518} {"train_loss": -7.097999572753906, "global_step": 189772, "epoch": 4518} {"train_loss": -7.32187032699585, "global_step": 189773, "epoch": 4518} {"train_loss": -7.159735679626465, "global_step": 189774, "epoch": 4518} {"train_loss": -7.241408348083496, "global_step": 189775, "epoch": 4518} {"train_loss": -7.189734935760498, "global_step": 189776, "epoch": 4518} {"train_loss": -7.060172080993652, "global_step": 189777, "epoch": 4518} {"train_loss": -7.088284015655518, "global_step": 189778, "epoch": 4518} {"train_loss": -7.118020057678223, "global_step": 189779, "epoch": 4518} {"train_loss": -7.117669582366943, "global_step": 189780, "epoch": 4518} {"train_loss": -7.157071113586426, "global_step": 189781, "epoch": 4518} {"train_loss": -7.260266304016113, "global_step": 189782, "epoch": 4518} {"train_loss": -7.242290496826172, "global_step": 189783, "epoch": 4518} {"train_loss": -7.271658897399902, "global_step": 189784, "epoch": 4518} {"train_loss": -7.180506706237793, "global_step": 189785, "epoch": 4518} {"train_loss": -7.177302360534668, "global_step": 189786, "epoch": 4518} {"train_loss": -7.234864234924316, "global_step": 189787, "epoch": 4518} {"train_loss": -7.253506660461426, "global_step": 189788, "epoch": 4518} {"train_loss": -7.1079511642456055, "global_step": 189789, "epoch": 4518} {"train_loss": -7.181464195251465, "global_step": 189790, "epoch": 4518} {"train_loss": -7.2611494064331055, "global_step": 189791, "epoch": 4518} {"train_loss": -7.193241119384766, "global_step": 189792, "epoch": 4518} {"train_loss": -7.194662094116211, "global_step": 189793, "epoch": 4518} {"train_loss": -7.233890533447266, "global_step": 189794, "epoch": 4518} {"train_loss": -7.157425403594971, "global_step": 189795, "epoch": 4518} {"train_loss": -7.198371887207031, "global_step": 189796, "epoch": 4518} {"train_loss": -7.179669380187988, "global_step": 189797, "epoch": 4518, "val_loss": 69707.8203125} {"train_loss": -7.119533061981201, "global_step": 189798, "epoch": 4519} {"train_loss": -7.129782676696777, "global_step": 189799, "epoch": 4519} {"train_loss": -7.28024959564209, "global_step": 189800, "epoch": 4519} {"train_loss": -7.188374996185303, "global_step": 189801, "epoch": 4519} {"train_loss": -7.235470294952393, "global_step": 189802, "epoch": 4519} {"train_loss": -7.3472700119018555, "global_step": 189803, "epoch": 4519} {"train_loss": -7.170422554016113, "global_step": 189804, "epoch": 4519} {"train_loss": -7.236305236816406, "global_step": 189805, "epoch": 4519} {"train_loss": -7.244021892547607, "global_step": 189806, "epoch": 4519} {"train_loss": -7.223947525024414, "global_step": 189807, "epoch": 4519} {"train_loss": -7.228168487548828, "global_step": 189808, "epoch": 4519} {"train_loss": -7.297516822814941, "global_step": 189809, "epoch": 4519} {"train_loss": -7.4166646003723145, "global_step": 189810, "epoch": 4519} {"train_loss": -7.308568000793457, "global_step": 189811, "epoch": 4519} {"train_loss": -7.229615211486816, "global_step": 189812, "epoch": 4519} {"train_loss": -7.312196254730225, "global_step": 189813, "epoch": 4519} {"train_loss": -7.235356330871582, "global_step": 189814, "epoch": 4519} {"train_loss": -7.212462425231934, "global_step": 189815, "epoch": 4519} {"train_loss": -7.300899505615234, "global_step": 189816, "epoch": 4519} {"train_loss": -7.314554691314697, "global_step": 189817, "epoch": 4519} {"train_loss": -7.268434047698975, "global_step": 189818, "epoch": 4519} {"train_loss": -7.213527679443359, "global_step": 189819, "epoch": 4519} {"train_loss": -7.290262222290039, "global_step": 189820, "epoch": 4519} {"train_loss": -7.28389835357666, "global_step": 189821, "epoch": 4519} {"train_loss": -7.147682189941406, "global_step": 189822, "epoch": 4519} {"train_loss": -7.155489921569824, "global_step": 189823, "epoch": 4519} {"train_loss": -7.273623943328857, "global_step": 189824, "epoch": 4519} {"train_loss": -7.280857086181641, "global_step": 189825, "epoch": 4519} {"train_loss": -7.336403846740723, "global_step": 189826, "epoch": 4519} {"train_loss": -7.19753360748291, "global_step": 189827, "epoch": 4519} {"train_loss": -7.290642738342285, "global_step": 189828, "epoch": 4519} {"train_loss": -7.314499855041504, "global_step": 189829, "epoch": 4519} {"train_loss": -7.2152628898620605, "global_step": 189830, "epoch": 4519} {"train_loss": -7.224477767944336, "global_step": 189831, "epoch": 4519} {"train_loss": -7.254983901977539, "global_step": 189832, "epoch": 4519} {"train_loss": -7.2759904861450195, "global_step": 189833, "epoch": 4519} {"train_loss": -7.240546226501465, "global_step": 189834, "epoch": 4519} {"train_loss": -7.168147087097168, "global_step": 189835, "epoch": 4519} {"train_loss": -7.335899353027344, "global_step": 189836, "epoch": 4519} {"train_loss": -7.242359161376953, "global_step": 189837, "epoch": 4519} {"train_loss": -7.176499366760254, "global_step": 189838, "epoch": 4519} {"train_loss": -7.246026061830067, "global_step": 189839, "epoch": 4519, "val_loss": 69615.90625} {"train_loss": -7.246464252471924, "global_step": 189840, "epoch": 4520} {"train_loss": -7.246665954589844, "global_step": 189841, "epoch": 4520} {"train_loss": -7.240844249725342, "global_step": 189842, "epoch": 4520} {"train_loss": -7.308605670928955, "global_step": 189843, "epoch": 4520} {"train_loss": -7.196605682373047, "global_step": 189844, "epoch": 4520} {"train_loss": -7.2608160972595215, "global_step": 189845, "epoch": 4520} {"train_loss": -7.192734718322754, "global_step": 189846, "epoch": 4520} {"train_loss": -7.286641597747803, "global_step": 189847, "epoch": 4520} {"train_loss": -7.184800624847412, "global_step": 189848, "epoch": 4520} {"train_loss": -7.0771074295043945, "global_step": 189849, "epoch": 4520} {"train_loss": -7.255190372467041, "global_step": 189850, "epoch": 4520} {"train_loss": -7.214120864868164, "global_step": 189851, "epoch": 4520} {"train_loss": -7.178741455078125, "global_step": 189852, "epoch": 4520} {"train_loss": -7.219524383544922, "global_step": 189853, "epoch": 4520} {"train_loss": -7.1966753005981445, "global_step": 189854, "epoch": 4520} {"train_loss": -7.159709930419922, "global_step": 189855, "epoch": 4520} {"train_loss": -7.217117786407471, "global_step": 189856, "epoch": 4520} {"train_loss": -7.256465911865234, "global_step": 189857, "epoch": 4520} {"train_loss": -7.072469711303711, "global_step": 189858, "epoch": 4520} {"train_loss": -7.255833625793457, "global_step": 189859, "epoch": 4520} {"train_loss": -7.183231830596924, "global_step": 189860, "epoch": 4520} {"train_loss": -7.198110103607178, "global_step": 189861, "epoch": 4520} {"train_loss": -7.1889777183532715, "global_step": 189862, "epoch": 4520} {"train_loss": -7.141740798950195, "global_step": 189863, "epoch": 4520} {"train_loss": -7.171055793762207, "global_step": 189864, "epoch": 4520} {"train_loss": -7.173565864562988, "global_step": 189865, "epoch": 4520} {"train_loss": -7.144789695739746, "global_step": 189866, "epoch": 4520} {"train_loss": -7.228419303894043, "global_step": 189867, "epoch": 4520} {"train_loss": -7.177196502685547, "global_step": 189868, "epoch": 4520} {"train_loss": -7.111306190490723, "global_step": 189869, "epoch": 4520} {"train_loss": -7.213194370269775, "global_step": 189870, "epoch": 4520} {"train_loss": -7.179058074951172, "global_step": 189871, "epoch": 4520} {"train_loss": -7.217706203460693, "global_step": 189872, "epoch": 4520} {"train_loss": -7.239543914794922, "global_step": 189873, "epoch": 4520} {"train_loss": -7.1017608642578125, "global_step": 189874, "epoch": 4520} {"train_loss": -7.216066360473633, "global_step": 189875, "epoch": 4520} {"train_loss": -7.127742767333984, "global_step": 189876, "epoch": 4520} {"train_loss": -7.135436058044434, "global_step": 189877, "epoch": 4520} {"train_loss": -7.3274970054626465, "global_step": 189878, "epoch": 4520} {"train_loss": -7.173088073730469, "global_step": 189879, "epoch": 4520} {"train_loss": -7.160329818725586, "global_step": 189880, "epoch": 4520} {"train_loss": -7.196566275187901, "global_step": 189881, "epoch": 4520, "val_loss": 69685.9296875} {"train_loss": -7.176715850830078, "global_step": 189882, "epoch": 4521} {"train_loss": -7.344227313995361, "global_step": 189883, "epoch": 4521} {"train_loss": -7.158823013305664, "global_step": 189884, "epoch": 4521} {"train_loss": -7.175455093383789, "global_step": 189885, "epoch": 4521} {"train_loss": -7.25991153717041, "global_step": 189886, "epoch": 4521} {"train_loss": -7.176401615142822, "global_step": 189887, "epoch": 4521} {"train_loss": -7.196290016174316, "global_step": 189888, "epoch": 4521} {"train_loss": -7.271607875823975, "global_step": 189889, "epoch": 4521} {"train_loss": -7.186959743499756, "global_step": 189890, "epoch": 4521} {"train_loss": -7.296749114990234, "global_step": 189891, "epoch": 4521} {"train_loss": -7.129579544067383, "global_step": 189892, "epoch": 4521} {"train_loss": -7.151161193847656, "global_step": 189893, "epoch": 4521} {"train_loss": -7.101987838745117, "global_step": 189894, "epoch": 4521} {"train_loss": -7.219874382019043, "global_step": 189895, "epoch": 4521} {"train_loss": -7.022331237792969, "global_step": 189896, "epoch": 4521} {"train_loss": -7.128634929656982, "global_step": 189897, "epoch": 4521} {"train_loss": -7.243457794189453, "global_step": 189898, "epoch": 4521} {"train_loss": -7.209002494812012, "global_step": 189899, "epoch": 4521} {"train_loss": -7.146432876586914, "global_step": 189900, "epoch": 4521} {"train_loss": -7.302923679351807, "global_step": 189901, "epoch": 4521} {"train_loss": -7.16361665725708, "global_step": 189902, "epoch": 4521} {"train_loss": -7.208039283752441, "global_step": 189903, "epoch": 4521} {"train_loss": -7.227852821350098, "global_step": 189904, "epoch": 4521} {"train_loss": -7.289947986602783, "global_step": 189905, "epoch": 4521} {"train_loss": -7.21474552154541, "global_step": 189906, "epoch": 4521} {"train_loss": -7.0418500900268555, "global_step": 189907, "epoch": 4521} {"train_loss": -7.276849746704102, "global_step": 189908, "epoch": 4521} {"train_loss": -7.294894695281982, "global_step": 189909, "epoch": 4521} {"train_loss": -7.248745918273926, "global_step": 189910, "epoch": 4521} {"train_loss": -7.209789276123047, "global_step": 189911, "epoch": 4521} {"train_loss": -7.222369194030762, "global_step": 189912, "epoch": 4521} {"train_loss": -7.229010581970215, "global_step": 189913, "epoch": 4521} {"train_loss": -7.234571933746338, "global_step": 189914, "epoch": 4521} {"train_loss": -7.3074727058410645, "global_step": 189915, "epoch": 4521} {"train_loss": -7.253726005554199, "global_step": 189916, "epoch": 4521} {"train_loss": -7.269838333129883, "global_step": 189917, "epoch": 4521} {"train_loss": -7.215603351593018, "global_step": 189918, "epoch": 4521} {"train_loss": -7.211864471435547, "global_step": 189919, "epoch": 4521} {"train_loss": -7.143660545349121, "global_step": 189920, "epoch": 4521} {"train_loss": -7.13372278213501, "global_step": 189921, "epoch": 4521} {"train_loss": -7.196498870849609, "global_step": 189922, "epoch": 4521} {"train_loss": -7.210060982477097, "global_step": 189923, "epoch": 4521, "val_loss": 69677.765625} {"train_loss": -7.22071647644043, "global_step": 189924, "epoch": 4522} {"train_loss": -7.211350440979004, "global_step": 189925, "epoch": 4522} {"train_loss": -7.115891456604004, "global_step": 189926, "epoch": 4522} {"train_loss": -7.299158573150635, "global_step": 189927, "epoch": 4522} {"train_loss": -7.1601667404174805, "global_step": 189928, "epoch": 4522} {"train_loss": -7.198464870452881, "global_step": 189929, "epoch": 4522} {"train_loss": -7.204899787902832, "global_step": 189930, "epoch": 4522} {"train_loss": -7.190356731414795, "global_step": 189931, "epoch": 4522} {"train_loss": -7.316168785095215, "global_step": 189932, "epoch": 4522} {"train_loss": -7.2507500648498535, "global_step": 189933, "epoch": 4522} {"train_loss": -7.288386821746826, "global_step": 189934, "epoch": 4522} {"train_loss": -7.261831283569336, "global_step": 189935, "epoch": 4522} {"train_loss": -7.284475326538086, "global_step": 189936, "epoch": 4522} {"train_loss": -7.286681175231934, "global_step": 189937, "epoch": 4522} {"train_loss": -7.299856662750244, "global_step": 189938, "epoch": 4522} {"train_loss": -7.168941497802734, "global_step": 189939, "epoch": 4522} {"train_loss": -7.130833625793457, "global_step": 189940, "epoch": 4522} {"train_loss": -7.32012939453125, "global_step": 189941, "epoch": 4522} {"train_loss": -7.110857963562012, "global_step": 189942, "epoch": 4522} {"train_loss": -7.179984092712402, "global_step": 189943, "epoch": 4522} {"train_loss": -7.146933555603027, "global_step": 189944, "epoch": 4522} {"train_loss": -7.207425117492676, "global_step": 189945, "epoch": 4522} {"train_loss": -7.211733341217041, "global_step": 189946, "epoch": 4522} {"train_loss": -7.1454267501831055, "global_step": 189947, "epoch": 4522} {"train_loss": -7.161213397979736, "global_step": 189948, "epoch": 4522} {"train_loss": -7.21195125579834, "global_step": 189949, "epoch": 4522} {"train_loss": -7.092555046081543, "global_step": 189950, "epoch": 4522} {"train_loss": -7.161016941070557, "global_step": 189951, "epoch": 4522} {"train_loss": -7.035579681396484, "global_step": 189952, "epoch": 4522} {"train_loss": -7.075624465942383, "global_step": 189953, "epoch": 4522} {"train_loss": -7.138363838195801, "global_step": 189954, "epoch": 4522} {"train_loss": -7.115422248840332, "global_step": 189955, "epoch": 4522} {"train_loss": -7.1284003257751465, "global_step": 189956, "epoch": 4522} {"train_loss": -7.018172264099121, "global_step": 189957, "epoch": 4522} {"train_loss": -7.074402809143066, "global_step": 189958, "epoch": 4522} {"train_loss": -7.064403057098389, "global_step": 189959, "epoch": 4522} {"train_loss": -7.078857421875, "global_step": 189960, "epoch": 4522} {"train_loss": -7.12253475189209, "global_step": 189961, "epoch": 4522} {"train_loss": -7.133344650268555, "global_step": 189962, "epoch": 4522} {"train_loss": -7.141193866729736, "global_step": 189963, "epoch": 4522} {"train_loss": -7.0448455810546875, "global_step": 189964, "epoch": 4522} {"train_loss": -7.172005812327067, "global_step": 189965, "epoch": 4522, "val_loss": 69621.9609375} {"train_loss": -7.14668083190918, "global_step": 189966, "epoch": 4523} {"train_loss": -7.150594234466553, "global_step": 189967, "epoch": 4523} {"train_loss": -7.296323776245117, "global_step": 189968, "epoch": 4523} {"train_loss": -7.114163875579834, "global_step": 189969, "epoch": 4523} {"train_loss": -7.250333786010742, "global_step": 189970, "epoch": 4523} {"train_loss": -7.246798992156982, "global_step": 189971, "epoch": 4523} {"train_loss": -7.006932258605957, "global_step": 189972, "epoch": 4523} {"train_loss": -7.1575517654418945, "global_step": 189973, "epoch": 4523} {"train_loss": -7.112183094024658, "global_step": 189974, "epoch": 4523} {"train_loss": -7.090597152709961, "global_step": 189975, "epoch": 4523} {"train_loss": -7.174011707305908, "global_step": 189976, "epoch": 4523} {"train_loss": -7.214622974395752, "global_step": 189977, "epoch": 4523} {"train_loss": -7.161831855773926, "global_step": 189978, "epoch": 4523} {"train_loss": -7.225342273712158, "global_step": 189979, "epoch": 4523} {"train_loss": -7.251219749450684, "global_step": 189980, "epoch": 4523} {"train_loss": -7.233952045440674, "global_step": 189981, "epoch": 4523} {"train_loss": -7.290602207183838, "global_step": 189982, "epoch": 4523} {"train_loss": -7.190481662750244, "global_step": 189983, "epoch": 4523} {"train_loss": -7.219202041625977, "global_step": 189984, "epoch": 4523} {"train_loss": -7.204189300537109, "global_step": 189985, "epoch": 4523} {"train_loss": -7.253953456878662, "global_step": 189986, "epoch": 4523} {"train_loss": -7.290576457977295, "global_step": 189987, "epoch": 4523} {"train_loss": -7.238218307495117, "global_step": 189988, "epoch": 4523} {"train_loss": -7.214724540710449, "global_step": 189989, "epoch": 4523} {"train_loss": -7.1802978515625, "global_step": 189990, "epoch": 4523} {"train_loss": -7.192257881164551, "global_step": 189991, "epoch": 4523} {"train_loss": -7.152218341827393, "global_step": 189992, "epoch": 4523} {"train_loss": -7.285367488861084, "global_step": 189993, "epoch": 4523} {"train_loss": -7.271263122558594, "global_step": 189994, "epoch": 4523} {"train_loss": -7.250148296356201, "global_step": 189995, "epoch": 4523} {"train_loss": -7.247091293334961, "global_step": 189996, "epoch": 4523} {"train_loss": -7.104103088378906, "global_step": 189997, "epoch": 4523} {"train_loss": -7.170877933502197, "global_step": 189998, "epoch": 4523} {"train_loss": -7.247498989105225, "global_step": 189999, "epoch": 4523} {"train_loss": -7.225556373596191, "global_step": 190000, "epoch": 4523} {"train_loss": -7.301722526550293, "global_step": 190001, "epoch": 4523} {"train_loss": -7.233768463134766, "global_step": 190002, "epoch": 4523} {"train_loss": -7.249594688415527, "global_step": 190003, "epoch": 4523} {"train_loss": -7.137389183044434, "global_step": 190004, "epoch": 4523} {"train_loss": -7.178378105163574, "global_step": 190005, "epoch": 4523} {"train_loss": -7.191450119018555, "global_step": 190006, "epoch": 4523} {"train_loss": -7.204940988903954, "global_step": 190007, "epoch": 4523, "val_loss": 69563.7890625} {"train_loss": -7.309267520904541, "global_step": 190008, "epoch": 4524} {"train_loss": -7.159388065338135, "global_step": 190009, "epoch": 4524} {"train_loss": -7.235790729522705, "global_step": 190010, "epoch": 4524} {"train_loss": -7.317772388458252, "global_step": 190011, "epoch": 4524} {"train_loss": -7.257152557373047, "global_step": 190012, "epoch": 4524} {"train_loss": -7.306304931640625, "global_step": 190013, "epoch": 4524} {"train_loss": -7.182321548461914, "global_step": 190014, "epoch": 4524} {"train_loss": -7.2151079177856445, "global_step": 190015, "epoch": 4524} {"train_loss": -7.254486083984375, "global_step": 190016, "epoch": 4524} {"train_loss": -7.199069976806641, "global_step": 190017, "epoch": 4524} {"train_loss": -7.1215362548828125, "global_step": 190018, "epoch": 4524} {"train_loss": -7.203428745269775, "global_step": 190019, "epoch": 4524} {"train_loss": -7.1264729499816895, "global_step": 190020, "epoch": 4524} {"train_loss": -7.179912567138672, "global_step": 190021, "epoch": 4524} {"train_loss": -7.261753082275391, "global_step": 190022, "epoch": 4524} {"train_loss": -7.1594929695129395, "global_step": 190023, "epoch": 4524} {"train_loss": -7.235846042633057, "global_step": 190024, "epoch": 4524} {"train_loss": -7.218991279602051, "global_step": 190025, "epoch": 4524} {"train_loss": -7.168990135192871, "global_step": 190026, "epoch": 4524} {"train_loss": -7.091769218444824, "global_step": 190027, "epoch": 4524} {"train_loss": -7.258573532104492, "global_step": 190028, "epoch": 4524} {"train_loss": -7.205855846405029, "global_step": 190029, "epoch": 4524} {"train_loss": -7.190727233886719, "global_step": 190030, "epoch": 4524} {"train_loss": -7.22353982925415, "global_step": 190031, "epoch": 4524} {"train_loss": -7.256384372711182, "global_step": 190032, "epoch": 4524} {"train_loss": -7.222642421722412, "global_step": 190033, "epoch": 4524} {"train_loss": -7.196937561035156, "global_step": 190034, "epoch": 4524} {"train_loss": -7.184577941894531, "global_step": 190035, "epoch": 4524} {"train_loss": -7.158805847167969, "global_step": 190036, "epoch": 4524} {"train_loss": -7.0801615715026855, "global_step": 190037, "epoch": 4524} {"train_loss": -7.240802764892578, "global_step": 190038, "epoch": 4524} {"train_loss": -7.272634506225586, "global_step": 190039, "epoch": 4524} {"train_loss": -7.260782241821289, "global_step": 190040, "epoch": 4524} {"train_loss": -7.1996917724609375, "global_step": 190041, "epoch": 4524} {"train_loss": -7.225035190582275, "global_step": 190042, "epoch": 4524} {"train_loss": -7.158439636230469, "global_step": 190043, "epoch": 4524} {"train_loss": -7.155462265014648, "global_step": 190044, "epoch": 4524} {"train_loss": -7.265018463134766, "global_step": 190045, "epoch": 4524} {"train_loss": -7.207472324371338, "global_step": 190046, "epoch": 4524} {"train_loss": -7.194474220275879, "global_step": 190047, "epoch": 4524} {"train_loss": -7.08620548248291, "global_step": 190048, "epoch": 4524} {"train_loss": -7.204373246147519, "global_step": 190049, "epoch": 4524, "val_loss": 69517.6484375} {"train_loss": -7.1472930908203125, "global_step": 190050, "epoch": 4525} {"train_loss": -7.009908676147461, "global_step": 190051, "epoch": 4525} {"train_loss": -7.213029861450195, "global_step": 190052, "epoch": 4525} {"train_loss": -7.169880390167236, "global_step": 190053, "epoch": 4525} {"train_loss": -6.975268840789795, "global_step": 190054, "epoch": 4525} {"train_loss": -7.2531867027282715, "global_step": 190055, "epoch": 4525} {"train_loss": -7.102202415466309, "global_step": 190056, "epoch": 4525} {"train_loss": -7.126803874969482, "global_step": 190057, "epoch": 4525} {"train_loss": -7.165402412414551, "global_step": 190058, "epoch": 4525} {"train_loss": -7.229808807373047, "global_step": 190059, "epoch": 4525} {"train_loss": -7.161175727844238, "global_step": 190060, "epoch": 4525} {"train_loss": -7.105166435241699, "global_step": 190061, "epoch": 4525} {"train_loss": -7.265061378479004, "global_step": 190062, "epoch": 4525} {"train_loss": -7.198575496673584, "global_step": 190063, "epoch": 4525} {"train_loss": -7.168185234069824, "global_step": 190064, "epoch": 4525} {"train_loss": -7.122655868530273, "global_step": 190065, "epoch": 4525} {"train_loss": -7.201449394226074, "global_step": 190066, "epoch": 4525} {"train_loss": -7.2370452880859375, "global_step": 190067, "epoch": 4525} {"train_loss": -7.19434928894043, "global_step": 190068, "epoch": 4525} {"train_loss": -7.083579063415527, "global_step": 190069, "epoch": 4525} {"train_loss": -7.146763801574707, "global_step": 190070, "epoch": 4525} {"train_loss": -7.097660064697266, "global_step": 190071, "epoch": 4525} {"train_loss": -7.218179225921631, "global_step": 190072, "epoch": 4525} {"train_loss": -7.202208518981934, "global_step": 190073, "epoch": 4525} {"train_loss": -7.305450439453125, "global_step": 190074, "epoch": 4525} {"train_loss": -7.11921501159668, "global_step": 190075, "epoch": 4525} {"train_loss": -7.085836887359619, "global_step": 190076, "epoch": 4525} {"train_loss": -7.097628593444824, "global_step": 190077, "epoch": 4525} {"train_loss": -6.954848289489746, "global_step": 190078, "epoch": 4525} {"train_loss": -7.05048942565918, "global_step": 190079, "epoch": 4525} {"train_loss": -7.180233001708984, "global_step": 190080, "epoch": 4525} {"train_loss": -7.0419464111328125, "global_step": 190081, "epoch": 4525} {"train_loss": -7.117310047149658, "global_step": 190082, "epoch": 4525} {"train_loss": -7.045706748962402, "global_step": 190083, "epoch": 4525} {"train_loss": -7.170421123504639, "global_step": 190084, "epoch": 4525} {"train_loss": -7.1406965255737305, "global_step": 190085, "epoch": 4525} {"train_loss": -7.090264797210693, "global_step": 190086, "epoch": 4525} {"train_loss": -7.151007175445557, "global_step": 190087, "epoch": 4525} {"train_loss": -7.003956317901611, "global_step": 190088, "epoch": 4525} {"train_loss": -7.106078147888184, "global_step": 190089, "epoch": 4525} {"train_loss": -7.058041572570801, "global_step": 190090, "epoch": 4525} {"train_loss": -7.134765579586937, "global_step": 190091, "epoch": 4525, "val_loss": 69556.4375} {"train_loss": -7.084222793579102, "global_step": 190092, "epoch": 4526} {"train_loss": -7.141757011413574, "global_step": 190093, "epoch": 4526} {"train_loss": -7.238009452819824, "global_step": 190094, "epoch": 4526} {"train_loss": -7.116849899291992, "global_step": 190095, "epoch": 4526} {"train_loss": -7.09716272354126, "global_step": 190096, "epoch": 4526} {"train_loss": -7.147552490234375, "global_step": 190097, "epoch": 4526} {"train_loss": -7.266789436340332, "global_step": 190098, "epoch": 4526} {"train_loss": -7.204314231872559, "global_step": 190099, "epoch": 4526} {"train_loss": -7.098051071166992, "global_step": 190100, "epoch": 4526} {"train_loss": -7.181607246398926, "global_step": 190101, "epoch": 4526} {"train_loss": -7.313365936279297, "global_step": 190102, "epoch": 4526} {"train_loss": -7.122359752655029, "global_step": 190103, "epoch": 4526} {"train_loss": -7.190340995788574, "global_step": 190104, "epoch": 4526} {"train_loss": -7.205559730529785, "global_step": 190105, "epoch": 4526} {"train_loss": -7.211002826690674, "global_step": 190106, "epoch": 4526} {"train_loss": -6.990569114685059, "global_step": 190107, "epoch": 4526} {"train_loss": -7.259662628173828, "global_step": 190108, "epoch": 4526} {"train_loss": -7.230375289916992, "global_step": 190109, "epoch": 4526} {"train_loss": -7.11688756942749, "global_step": 190110, "epoch": 4526} {"train_loss": -7.147875785827637, "global_step": 190111, "epoch": 4526} {"train_loss": -7.017293930053711, "global_step": 190112, "epoch": 4526} {"train_loss": -7.187143325805664, "global_step": 190113, "epoch": 4526} {"train_loss": -7.2144012451171875, "global_step": 190114, "epoch": 4526} {"train_loss": -7.2266716957092285, "global_step": 190115, "epoch": 4526} {"train_loss": -7.106807708740234, "global_step": 190116, "epoch": 4526} {"train_loss": -7.247530460357666, "global_step": 190117, "epoch": 4526} {"train_loss": -7.046195983886719, "global_step": 190118, "epoch": 4526} {"train_loss": -7.26052188873291, "global_step": 190119, "epoch": 4526} {"train_loss": -7.14737606048584, "global_step": 190120, "epoch": 4526} {"train_loss": -7.131606101989746, "global_step": 190121, "epoch": 4526} {"train_loss": -7.076237201690674, "global_step": 190122, "epoch": 4526} {"train_loss": -7.195521831512451, "global_step": 190123, "epoch": 4526} {"train_loss": -7.092443466186523, "global_step": 190124, "epoch": 4526} {"train_loss": -7.1898417472839355, "global_step": 190125, "epoch": 4526} {"train_loss": -7.158078193664551, "global_step": 190126, "epoch": 4526} {"train_loss": -7.086812496185303, "global_step": 190127, "epoch": 4526} {"train_loss": -7.254968166351318, "global_step": 190128, "epoch": 4526} {"train_loss": -7.178050994873047, "global_step": 190129, "epoch": 4526} {"train_loss": -7.172780990600586, "global_step": 190130, "epoch": 4526} {"train_loss": -7.273126125335693, "global_step": 190131, "epoch": 4526} {"train_loss": -7.139068603515625, "global_step": 190132, "epoch": 4526} {"train_loss": -7.167396738415673, "global_step": 190133, "epoch": 4526, "val_loss": 69499.9296875} {"train_loss": -7.169083595275879, "global_step": 190134, "epoch": 4527} {"train_loss": -7.150147438049316, "global_step": 190135, "epoch": 4527} {"train_loss": -7.209835052490234, "global_step": 190136, "epoch": 4527} {"train_loss": -7.250029563903809, "global_step": 190137, "epoch": 4527} {"train_loss": -7.1082682609558105, "global_step": 190138, "epoch": 4527} {"train_loss": -7.246672630310059, "global_step": 190139, "epoch": 4527} {"train_loss": -7.227263450622559, "global_step": 190140, "epoch": 4527} {"train_loss": -7.065812587738037, "global_step": 190141, "epoch": 4527} {"train_loss": -7.095410346984863, "global_step": 190142, "epoch": 4527} {"train_loss": -7.20852518081665, "global_step": 190143, "epoch": 4527} {"train_loss": -7.06697940826416, "global_step": 190144, "epoch": 4527} {"train_loss": -7.19533634185791, "global_step": 190145, "epoch": 4527} {"train_loss": -7.205931663513184, "global_step": 190146, "epoch": 4527} {"train_loss": -7.179699420928955, "global_step": 190147, "epoch": 4527} {"train_loss": -7.141839981079102, "global_step": 190148, "epoch": 4527} {"train_loss": -7.197815895080566, "global_step": 190149, "epoch": 4527} {"train_loss": -7.162662982940674, "global_step": 190150, "epoch": 4527} {"train_loss": -7.176916122436523, "global_step": 190151, "epoch": 4527} {"train_loss": -7.076359272003174, "global_step": 190152, "epoch": 4527} {"train_loss": -7.154348373413086, "global_step": 190153, "epoch": 4527} {"train_loss": -7.046822547912598, "global_step": 190154, "epoch": 4527} {"train_loss": -7.151336193084717, "global_step": 190155, "epoch": 4527} {"train_loss": -7.024703025817871, "global_step": 190156, "epoch": 4527} {"train_loss": -7.129150867462158, "global_step": 190157, "epoch": 4527} {"train_loss": -7.035490989685059, "global_step": 190158, "epoch": 4527} {"train_loss": -7.183190822601318, "global_step": 190159, "epoch": 4527} {"train_loss": -7.235435485839844, "global_step": 190160, "epoch": 4527} {"train_loss": -7.1854047775268555, "global_step": 190161, "epoch": 4527} {"train_loss": -7.1015448570251465, "global_step": 190162, "epoch": 4527} {"train_loss": -7.118991374969482, "global_step": 190163, "epoch": 4527} {"train_loss": -7.249869346618652, "global_step": 190164, "epoch": 4527} {"train_loss": -7.245998382568359, "global_step": 190165, "epoch": 4527} {"train_loss": -7.166045188903809, "global_step": 190166, "epoch": 4527} {"train_loss": -7.130429267883301, "global_step": 190167, "epoch": 4527} {"train_loss": -7.179340839385986, "global_step": 190168, "epoch": 4527} {"train_loss": -7.198733806610107, "global_step": 190169, "epoch": 4527} {"train_loss": -7.295891761779785, "global_step": 190170, "epoch": 4527} {"train_loss": -7.202497482299805, "global_step": 190171, "epoch": 4527} {"train_loss": -7.311204433441162, "global_step": 190172, "epoch": 4527} {"train_loss": -7.255229473114014, "global_step": 190173, "epoch": 4527} {"train_loss": -7.144316673278809, "global_step": 190174, "epoch": 4527} {"train_loss": -7.170987129211426, "global_step": 190175, "epoch": 4527, "val_loss": 69519.859375} {"train_loss": -7.172603130340576, "global_step": 190176, "epoch": 4528} {"train_loss": -7.204004764556885, "global_step": 190177, "epoch": 4528} {"train_loss": -7.227024078369141, "global_step": 190178, "epoch": 4528} {"train_loss": -7.138922691345215, "global_step": 190179, "epoch": 4528} {"train_loss": -7.0937933921813965, "global_step": 190180, "epoch": 4528} {"train_loss": -7.168261528015137, "global_step": 190181, "epoch": 4528} {"train_loss": -7.095725059509277, "global_step": 190182, "epoch": 4528} {"train_loss": -7.198698043823242, "global_step": 190183, "epoch": 4528} {"train_loss": -7.133154392242432, "global_step": 190184, "epoch": 4528} {"train_loss": -7.230074882507324, "global_step": 190185, "epoch": 4528} {"train_loss": -7.099827766418457, "global_step": 190186, "epoch": 4528} {"train_loss": -7.102575302124023, "global_step": 190187, "epoch": 4528} {"train_loss": -7.120494365692139, "global_step": 190188, "epoch": 4528} {"train_loss": -7.165281295776367, "global_step": 190189, "epoch": 4528} {"train_loss": -7.157727241516113, "global_step": 190190, "epoch": 4528} {"train_loss": -7.178794860839844, "global_step": 190191, "epoch": 4528} {"train_loss": -7.19967794418335, "global_step": 190192, "epoch": 4528} {"train_loss": -7.1239190101623535, "global_step": 190193, "epoch": 4528} {"train_loss": -7.263955593109131, "global_step": 190194, "epoch": 4528} {"train_loss": -7.231141090393066, "global_step": 190195, "epoch": 4528} {"train_loss": -7.185318946838379, "global_step": 190196, "epoch": 4528} {"train_loss": -7.12864875793457, "global_step": 190197, "epoch": 4528} {"train_loss": -7.18662691116333, "global_step": 190198, "epoch": 4528} {"train_loss": -7.184954643249512, "global_step": 190199, "epoch": 4528} {"train_loss": -7.238467693328857, "global_step": 190200, "epoch": 4528} {"train_loss": -7.195405006408691, "global_step": 190201, "epoch": 4528} {"train_loss": -7.23779821395874, "global_step": 190202, "epoch": 4528} {"train_loss": -7.3204803466796875, "global_step": 190203, "epoch": 4528} {"train_loss": -7.187943935394287, "global_step": 190204, "epoch": 4528} {"train_loss": -7.1428141593933105, "global_step": 190205, "epoch": 4528} {"train_loss": -7.203207015991211, "global_step": 190206, "epoch": 4528} {"train_loss": -7.2974958419799805, "global_step": 190207, "epoch": 4528} {"train_loss": -7.226820468902588, "global_step": 190208, "epoch": 4528} {"train_loss": -7.201972484588623, "global_step": 190209, "epoch": 4528} {"train_loss": -7.361082077026367, "global_step": 190210, "epoch": 4528} {"train_loss": -7.19926118850708, "global_step": 190211, "epoch": 4528} {"train_loss": -7.342666149139404, "global_step": 190212, "epoch": 4528} {"train_loss": -7.163913726806641, "global_step": 190213, "epoch": 4528} {"train_loss": -7.301539897918701, "global_step": 190214, "epoch": 4528} {"train_loss": -7.133768081665039, "global_step": 190215, "epoch": 4528} {"train_loss": -7.259142875671387, "global_step": 190216, "epoch": 4528} {"train_loss": -7.195986361730666, "global_step": 190217, "epoch": 4528, "val_loss": 69513.4453125} {"train_loss": -7.096713066101074, "global_step": 190218, "epoch": 4529} {"train_loss": -7.1554365158081055, "global_step": 190219, "epoch": 4529} {"train_loss": -6.999020576477051, "global_step": 190220, "epoch": 4529} {"train_loss": -7.295666217803955, "global_step": 190221, "epoch": 4529} {"train_loss": -7.152218818664551, "global_step": 190222, "epoch": 4529} {"train_loss": -7.304603099822998, "global_step": 190223, "epoch": 4529} {"train_loss": -7.225931167602539, "global_step": 190224, "epoch": 4529} {"train_loss": -7.098720550537109, "global_step": 190225, "epoch": 4529} {"train_loss": -7.220417022705078, "global_step": 190226, "epoch": 4529} {"train_loss": -7.092167377471924, "global_step": 190227, "epoch": 4529} {"train_loss": -7.294352054595947, "global_step": 190228, "epoch": 4529} {"train_loss": -7.0999755859375, "global_step": 190229, "epoch": 4529} {"train_loss": -7.091924667358398, "global_step": 190230, "epoch": 4529} {"train_loss": -7.114731788635254, "global_step": 190231, "epoch": 4529} {"train_loss": -7.105923175811768, "global_step": 190232, "epoch": 4529} {"train_loss": -7.16689395904541, "global_step": 190233, "epoch": 4529} {"train_loss": -7.083433628082275, "global_step": 190234, "epoch": 4529} {"train_loss": -6.97976016998291, "global_step": 190235, "epoch": 4529} {"train_loss": -6.94186544418335, "global_step": 190236, "epoch": 4529} {"train_loss": -7.016966342926025, "global_step": 190237, "epoch": 4529} {"train_loss": -6.951249122619629, "global_step": 190238, "epoch": 4529} {"train_loss": -6.981575012207031, "global_step": 190239, "epoch": 4529} {"train_loss": -6.951704502105713, "global_step": 190240, "epoch": 4529} {"train_loss": -7.021510124206543, "global_step": 190241, "epoch": 4529} {"train_loss": -6.953027725219727, "global_step": 190242, "epoch": 4529} {"train_loss": -7.008181571960449, "global_step": 190243, "epoch": 4529} {"train_loss": -7.106757164001465, "global_step": 190244, "epoch": 4529} {"train_loss": -6.955714702606201, "global_step": 190245, "epoch": 4529} {"train_loss": -7.182709217071533, "global_step": 190246, "epoch": 4529} {"train_loss": -7.069949150085449, "global_step": 190247, "epoch": 4529} {"train_loss": -7.086726188659668, "global_step": 190248, "epoch": 4529} {"train_loss": -7.097128868103027, "global_step": 190249, "epoch": 4529} {"train_loss": -7.053839683532715, "global_step": 190250, "epoch": 4529} {"train_loss": -7.139544486999512, "global_step": 190251, "epoch": 4529} {"train_loss": -7.102900505065918, "global_step": 190252, "epoch": 4529} {"train_loss": -7.262444496154785, "global_step": 190253, "epoch": 4529} {"train_loss": -7.072445869445801, "global_step": 190254, "epoch": 4529} {"train_loss": -7.176862716674805, "global_step": 190255, "epoch": 4529} {"train_loss": -7.1623005867004395, "global_step": 190256, "epoch": 4529} {"train_loss": -7.14996862411499, "global_step": 190257, "epoch": 4529} {"train_loss": -7.221408843994141, "global_step": 190258, "epoch": 4529} {"train_loss": -7.105319261550903, "global_step": 190259, "epoch": 4529, "val_loss": 69557.140625} {"train_loss": -7.15293025970459, "global_step": 190260, "epoch": 4530} {"train_loss": -7.177844047546387, "global_step": 190261, "epoch": 4530} {"train_loss": -7.1118483543396, "global_step": 190262, "epoch": 4530} {"train_loss": -7.2614545822143555, "global_step": 190263, "epoch": 4530} {"train_loss": -7.26334810256958, "global_step": 190264, "epoch": 4530} {"train_loss": -7.184494495391846, "global_step": 190265, "epoch": 4530} {"train_loss": -7.150038719177246, "global_step": 190266, "epoch": 4530} {"train_loss": -7.310920238494873, "global_step": 190267, "epoch": 4530} {"train_loss": -7.255239486694336, "global_step": 190268, "epoch": 4530} {"train_loss": -7.147207260131836, "global_step": 190269, "epoch": 4530} {"train_loss": -7.195344924926758, "global_step": 190270, "epoch": 4530} {"train_loss": -7.222413539886475, "global_step": 190271, "epoch": 4530} {"train_loss": -7.175530433654785, "global_step": 190272, "epoch": 4530} {"train_loss": -7.164071083068848, "global_step": 190273, "epoch": 4530} {"train_loss": -7.284663200378418, "global_step": 190274, "epoch": 4530} {"train_loss": -7.1986541748046875, "global_step": 190275, "epoch": 4530} {"train_loss": -7.339731216430664, "global_step": 190276, "epoch": 4530} {"train_loss": -7.13316011428833, "global_step": 190277, "epoch": 4530} {"train_loss": -7.187748908996582, "global_step": 190278, "epoch": 4530} {"train_loss": -7.106907844543457, "global_step": 190279, "epoch": 4530} {"train_loss": -7.259276866912842, "global_step": 190280, "epoch": 4530} {"train_loss": -7.068443298339844, "global_step": 190281, "epoch": 4530} {"train_loss": -7.228609085083008, "global_step": 190282, "epoch": 4530} {"train_loss": -7.0968732833862305, "global_step": 190283, "epoch": 4530} {"train_loss": -7.0973052978515625, "global_step": 190284, "epoch": 4530} {"train_loss": -7.2183732986450195, "global_step": 190285, "epoch": 4530} {"train_loss": -7.148122787475586, "global_step": 190286, "epoch": 4530} {"train_loss": -7.103044033050537, "global_step": 190287, "epoch": 4530} {"train_loss": -7.240735054016113, "global_step": 190288, "epoch": 4530} {"train_loss": -7.174765586853027, "global_step": 190289, "epoch": 4530} {"train_loss": -7.11693811416626, "global_step": 190290, "epoch": 4530} {"train_loss": -7.1920084953308105, "global_step": 190291, "epoch": 4530} {"train_loss": -7.134774684906006, "global_step": 190292, "epoch": 4530} {"train_loss": -7.225466728210449, "global_step": 190293, "epoch": 4530} {"train_loss": -7.106173515319824, "global_step": 190294, "epoch": 4530} {"train_loss": -7.225192070007324, "global_step": 190295, "epoch": 4530} {"train_loss": -7.186355113983154, "global_step": 190296, "epoch": 4530} {"train_loss": -7.267116069793701, "global_step": 190297, "epoch": 4530} {"train_loss": -7.1970930099487305, "global_step": 190298, "epoch": 4530} {"train_loss": -7.237119197845459, "global_step": 190299, "epoch": 4530} {"train_loss": -7.3002519607543945, "global_step": 190300, "epoch": 4530} {"train_loss": -7.192180247533889, "global_step": 190301, "epoch": 4530, "val_loss": 69756.640625} {"train_loss": -7.077919960021973, "global_step": 190302, "epoch": 4531} {"train_loss": -7.175628662109375, "global_step": 190303, "epoch": 4531} {"train_loss": -7.208811283111572, "global_step": 190304, "epoch": 4531} {"train_loss": -7.188205718994141, "global_step": 190305, "epoch": 4531} {"train_loss": -7.241596221923828, "global_step": 190306, "epoch": 4531} {"train_loss": -7.219160079956055, "global_step": 190307, "epoch": 4531} {"train_loss": -7.226627349853516, "global_step": 190308, "epoch": 4531} {"train_loss": -7.259147644042969, "global_step": 190309, "epoch": 4531} {"train_loss": -7.141237258911133, "global_step": 190310, "epoch": 4531} {"train_loss": -7.2051591873168945, "global_step": 190311, "epoch": 4531} {"train_loss": -7.1326823234558105, "global_step": 190312, "epoch": 4531} {"train_loss": -7.240182876586914, "global_step": 190313, "epoch": 4531} {"train_loss": -7.205653190612793, "global_step": 190314, "epoch": 4531} {"train_loss": -7.086902141571045, "global_step": 190315, "epoch": 4531} {"train_loss": -7.311526298522949, "global_step": 190316, "epoch": 4531} {"train_loss": -7.12003755569458, "global_step": 190317, "epoch": 4531} {"train_loss": -7.048731803894043, "global_step": 190318, "epoch": 4531} {"train_loss": -7.205581188201904, "global_step": 190319, "epoch": 4531} {"train_loss": -7.115210056304932, "global_step": 190320, "epoch": 4531} {"train_loss": -7.14134407043457, "global_step": 190321, "epoch": 4531} {"train_loss": -7.171560764312744, "global_step": 190322, "epoch": 4531} {"train_loss": -7.178363800048828, "global_step": 190323, "epoch": 4531} {"train_loss": -7.249357223510742, "global_step": 190324, "epoch": 4531} {"train_loss": -7.155516147613525, "global_step": 190325, "epoch": 4531} {"train_loss": -7.266669273376465, "global_step": 190326, "epoch": 4531} {"train_loss": -7.208645343780518, "global_step": 190327, "epoch": 4531} {"train_loss": -7.203224182128906, "global_step": 190328, "epoch": 4531} {"train_loss": -7.304600715637207, "global_step": 190329, "epoch": 4531} {"train_loss": -7.265817165374756, "global_step": 190330, "epoch": 4531} {"train_loss": -7.211254119873047, "global_step": 190331, "epoch": 4531} {"train_loss": -7.138794422149658, "global_step": 190332, "epoch": 4531} {"train_loss": -7.212859153747559, "global_step": 190333, "epoch": 4531} {"train_loss": -7.143944263458252, "global_step": 190334, "epoch": 4531} {"train_loss": -7.141599655151367, "global_step": 190335, "epoch": 4531} {"train_loss": -7.129022598266602, "global_step": 190336, "epoch": 4531} {"train_loss": -7.1550445556640625, "global_step": 190337, "epoch": 4531} {"train_loss": -7.0150465965271, "global_step": 190338, "epoch": 4531} {"train_loss": -7.078043460845947, "global_step": 190339, "epoch": 4531} {"train_loss": -7.164987564086914, "global_step": 190340, "epoch": 4531} {"train_loss": -6.956672668457031, "global_step": 190341, "epoch": 4531} {"train_loss": -7.277268409729004, "global_step": 190342, "epoch": 4531} {"train_loss": -7.169102384930565, "global_step": 190343, "epoch": 4531, "val_loss": 69828.7578125} {"train_loss": -7.087957859039307, "global_step": 190344, "epoch": 4532} {"train_loss": -7.121279716491699, "global_step": 190345, "epoch": 4532} {"train_loss": -7.157261848449707, "global_step": 190346, "epoch": 4532} {"train_loss": -7.187231063842773, "global_step": 190347, "epoch": 4532} {"train_loss": -6.999610900878906, "global_step": 190348, "epoch": 4532} {"train_loss": -7.301987648010254, "global_step": 190349, "epoch": 4532} {"train_loss": -7.101931571960449, "global_step": 190350, "epoch": 4532} {"train_loss": -7.1860785484313965, "global_step": 190351, "epoch": 4532} {"train_loss": -7.115383148193359, "global_step": 190352, "epoch": 4532} {"train_loss": -7.133811950683594, "global_step": 190353, "epoch": 4532} {"train_loss": -7.221661567687988, "global_step": 190354, "epoch": 4532} {"train_loss": -7.181123733520508, "global_step": 190355, "epoch": 4532} {"train_loss": -7.236140251159668, "global_step": 190356, "epoch": 4532} {"train_loss": -7.1284332275390625, "global_step": 190357, "epoch": 4532} {"train_loss": -7.16734504699707, "global_step": 190358, "epoch": 4532} {"train_loss": -7.198343276977539, "global_step": 190359, "epoch": 4532} {"train_loss": -7.103550910949707, "global_step": 190360, "epoch": 4532} {"train_loss": -7.259788990020752, "global_step": 190361, "epoch": 4532} {"train_loss": -7.132104873657227, "global_step": 190362, "epoch": 4532} {"train_loss": -7.197454452514648, "global_step": 190363, "epoch": 4532} {"train_loss": -7.1511993408203125, "global_step": 190364, "epoch": 4532} {"train_loss": -7.340134620666504, "global_step": 190365, "epoch": 4532} {"train_loss": -7.193440914154053, "global_step": 190366, "epoch": 4532} {"train_loss": -7.168406009674072, "global_step": 190367, "epoch": 4532} {"train_loss": -7.292219161987305, "global_step": 190368, "epoch": 4532} {"train_loss": -7.208992958068848, "global_step": 190369, "epoch": 4532} {"train_loss": -7.065505027770996, "global_step": 190370, "epoch": 4532} {"train_loss": -7.264810562133789, "global_step": 190371, "epoch": 4532} {"train_loss": -7.2120513916015625, "global_step": 190372, "epoch": 4532} {"train_loss": -7.220178604125977, "global_step": 190373, "epoch": 4532} {"train_loss": -7.237281799316406, "global_step": 190374, "epoch": 4532} {"train_loss": -7.189205169677734, "global_step": 190375, "epoch": 4532} {"train_loss": -7.046632766723633, "global_step": 190376, "epoch": 4532} {"train_loss": -7.221163749694824, "global_step": 190377, "epoch": 4532} {"train_loss": -7.310116291046143, "global_step": 190378, "epoch": 4532} {"train_loss": -7.228486061096191, "global_step": 190379, "epoch": 4532} {"train_loss": -7.269733428955078, "global_step": 190380, "epoch": 4532} {"train_loss": -7.099503993988037, "global_step": 190381, "epoch": 4532} {"train_loss": -7.294093132019043, "global_step": 190382, "epoch": 4532} {"train_loss": -7.277834892272949, "global_step": 190383, "epoch": 4532} {"train_loss": -7.21086311340332, "global_step": 190384, "epoch": 4532} {"train_loss": -7.188869362785702, "global_step": 190385, "epoch": 4532, "val_loss": 69573.21875} {"train_loss": -7.360255718231201, "global_step": 190386, "epoch": 4533} {"train_loss": -7.274640083312988, "global_step": 190387, "epoch": 4533} {"train_loss": -7.3552775382995605, "global_step": 190388, "epoch": 4533} {"train_loss": -7.349045276641846, "global_step": 190389, "epoch": 4533} {"train_loss": -7.316713333129883, "global_step": 190390, "epoch": 4533} {"train_loss": -7.348519325256348, "global_step": 190391, "epoch": 4533} {"train_loss": -7.312539100646973, "global_step": 190392, "epoch": 4533} {"train_loss": -7.2514190673828125, "global_step": 190393, "epoch": 4533} {"train_loss": -7.2735595703125, "global_step": 190394, "epoch": 4533} {"train_loss": -7.232706069946289, "global_step": 190395, "epoch": 4533} {"train_loss": -7.27225399017334, "global_step": 190396, "epoch": 4533} {"train_loss": -7.220393180847168, "global_step": 190397, "epoch": 4533} {"train_loss": -7.210098743438721, "global_step": 190398, "epoch": 4533} {"train_loss": -7.240870475769043, "global_step": 190399, "epoch": 4533} {"train_loss": -7.229711532592773, "global_step": 190400, "epoch": 4533} {"train_loss": -7.223735809326172, "global_step": 190401, "epoch": 4533} {"train_loss": -7.141043663024902, "global_step": 190402, "epoch": 4533} {"train_loss": -7.120928764343262, "global_step": 190403, "epoch": 4533} {"train_loss": -7.1087188720703125, "global_step": 190404, "epoch": 4533} {"train_loss": -7.154684543609619, "global_step": 190405, "epoch": 4533} {"train_loss": -7.223233222961426, "global_step": 190406, "epoch": 4533} {"train_loss": -7.141636848449707, "global_step": 190407, "epoch": 4533} {"train_loss": -7.154897689819336, "global_step": 190408, "epoch": 4533} {"train_loss": -7.1134819984436035, "global_step": 190409, "epoch": 4533} {"train_loss": -7.155259132385254, "global_step": 190410, "epoch": 4533} {"train_loss": -7.025732040405273, "global_step": 190411, "epoch": 4533} {"train_loss": -7.1395769119262695, "global_step": 190412, "epoch": 4533} {"train_loss": -7.091708183288574, "global_step": 190413, "epoch": 4533} {"train_loss": -7.218350410461426, "global_step": 190414, "epoch": 4533} {"train_loss": -7.197436332702637, "global_step": 190415, "epoch": 4533} {"train_loss": -7.178177356719971, "global_step": 190416, "epoch": 4533} {"train_loss": -7.080047130584717, "global_step": 190417, "epoch": 4533} {"train_loss": -7.190658092498779, "global_step": 190418, "epoch": 4533} {"train_loss": -7.150328636169434, "global_step": 190419, "epoch": 4533} {"train_loss": -7.217046737670898, "global_step": 190420, "epoch": 4533} {"train_loss": -7.204163551330566, "global_step": 190421, "epoch": 4533} {"train_loss": -7.116135597229004, "global_step": 190422, "epoch": 4533} {"train_loss": -7.12592887878418, "global_step": 190423, "epoch": 4533} {"train_loss": -7.309022426605225, "global_step": 190424, "epoch": 4533} {"train_loss": -7.202859878540039, "global_step": 190425, "epoch": 4533} {"train_loss": -7.255338191986084, "global_step": 190426, "epoch": 4533} {"train_loss": -7.2081651119958785, "global_step": 190427, "epoch": 4533, "val_loss": 69482.625} {"train_loss": -7.24399471282959, "global_step": 190428, "epoch": 4534} {"train_loss": -7.123919486999512, "global_step": 190429, "epoch": 4534} {"train_loss": -7.1180315017700195, "global_step": 190430, "epoch": 4534} {"train_loss": -7.272479057312012, "global_step": 190431, "epoch": 4534} {"train_loss": -7.1489105224609375, "global_step": 190432, "epoch": 4534} {"train_loss": -7.2205281257629395, "global_step": 190433, "epoch": 4534} {"train_loss": -7.2840728759765625, "global_step": 190434, "epoch": 4534} {"train_loss": -7.1588134765625, "global_step": 190435, "epoch": 4534} {"train_loss": -7.204351425170898, "global_step": 190436, "epoch": 4534} {"train_loss": -7.294279098510742, "global_step": 190437, "epoch": 4534} {"train_loss": -7.0893073081970215, "global_step": 190438, "epoch": 4534} {"train_loss": -7.264148712158203, "global_step": 190439, "epoch": 4534} {"train_loss": -7.187497138977051, "global_step": 190440, "epoch": 4534} {"train_loss": -7.157540321350098, "global_step": 190441, "epoch": 4534} {"train_loss": -7.115560531616211, "global_step": 190442, "epoch": 4534} {"train_loss": -7.14605712890625, "global_step": 190443, "epoch": 4534} {"train_loss": -7.099915504455566, "global_step": 190444, "epoch": 4534} {"train_loss": -7.193358421325684, "global_step": 190445, "epoch": 4534} {"train_loss": -7.186703681945801, "global_step": 190446, "epoch": 4534} {"train_loss": -7.155891418457031, "global_step": 190447, "epoch": 4534} {"train_loss": -7.237863063812256, "global_step": 190448, "epoch": 4534} {"train_loss": -7.225685119628906, "global_step": 190449, "epoch": 4534} {"train_loss": -7.152050495147705, "global_step": 190450, "epoch": 4534} {"train_loss": -7.078542709350586, "global_step": 190451, "epoch": 4534} {"train_loss": -7.140429496765137, "global_step": 190452, "epoch": 4534} {"train_loss": -7.241421222686768, "global_step": 190453, "epoch": 4534} {"train_loss": -7.114396572113037, "global_step": 190454, "epoch": 4534} {"train_loss": -7.153354644775391, "global_step": 190455, "epoch": 4534} {"train_loss": -7.250356674194336, "global_step": 190456, "epoch": 4534} {"train_loss": -7.176135063171387, "global_step": 190457, "epoch": 4534} {"train_loss": -7.21865177154541, "global_step": 190458, "epoch": 4534} {"train_loss": -7.1910905838012695, "global_step": 190459, "epoch": 4534} {"train_loss": -7.1183576583862305, "global_step": 190460, "epoch": 4534} {"train_loss": -7.267653465270996, "global_step": 190461, "epoch": 4534} {"train_loss": -7.211019992828369, "global_step": 190462, "epoch": 4534} {"train_loss": -7.084390640258789, "global_step": 190463, "epoch": 4534} {"train_loss": -7.1497907638549805, "global_step": 190464, "epoch": 4534} {"train_loss": -7.174394607543945, "global_step": 190465, "epoch": 4534} {"train_loss": -7.120997428894043, "global_step": 190466, "epoch": 4534} {"train_loss": -7.154552459716797, "global_step": 190467, "epoch": 4534} {"train_loss": -7.220741271972656, "global_step": 190468, "epoch": 4534} {"train_loss": -7.182035219101679, "global_step": 190469, "epoch": 4534, "val_loss": 69602.390625} {"train_loss": -7.225439071655273, "global_step": 190470, "epoch": 4535} {"train_loss": -7.090756416320801, "global_step": 190471, "epoch": 4535} {"train_loss": -7.215970993041992, "global_step": 190472, "epoch": 4535} {"train_loss": -7.138578414916992, "global_step": 190473, "epoch": 4535} {"train_loss": -7.307469367980957, "global_step": 190474, "epoch": 4535} {"train_loss": -7.131503582000732, "global_step": 190475, "epoch": 4535} {"train_loss": -7.307631969451904, "global_step": 190476, "epoch": 4535} {"train_loss": -7.144460201263428, "global_step": 190477, "epoch": 4535} {"train_loss": -7.219805717468262, "global_step": 190478, "epoch": 4535} {"train_loss": -7.132656097412109, "global_step": 190479, "epoch": 4535} {"train_loss": -7.198526382446289, "global_step": 190480, "epoch": 4535} {"train_loss": -7.289181709289551, "global_step": 190481, "epoch": 4535} {"train_loss": -7.15385627746582, "global_step": 190482, "epoch": 4535} {"train_loss": -7.20701789855957, "global_step": 190483, "epoch": 4535} {"train_loss": -7.142779350280762, "global_step": 190484, "epoch": 4535} {"train_loss": -7.066519737243652, "global_step": 190485, "epoch": 4535} {"train_loss": -7.253129005432129, "global_step": 190486, "epoch": 4535} {"train_loss": -7.087139129638672, "global_step": 190487, "epoch": 4535} {"train_loss": -6.916841506958008, "global_step": 190488, "epoch": 4535} {"train_loss": -7.077869415283203, "global_step": 190489, "epoch": 4535} {"train_loss": -7.183314323425293, "global_step": 190490, "epoch": 4535} {"train_loss": -7.200806617736816, "global_step": 190491, "epoch": 4535} {"train_loss": -7.293932914733887, "global_step": 190492, "epoch": 4535} {"train_loss": -7.2626752853393555, "global_step": 190493, "epoch": 4535} {"train_loss": -7.138225078582764, "global_step": 190494, "epoch": 4535} {"train_loss": -7.206998825073242, "global_step": 190495, "epoch": 4535} {"train_loss": -7.105710983276367, "global_step": 190496, "epoch": 4535} {"train_loss": -7.177449703216553, "global_step": 190497, "epoch": 4535} {"train_loss": -7.142242908477783, "global_step": 190498, "epoch": 4535} {"train_loss": -7.164473056793213, "global_step": 190499, "epoch": 4535} {"train_loss": -7.148268699645996, "global_step": 190500, "epoch": 4535} {"train_loss": -7.177149772644043, "global_step": 190501, "epoch": 4535} {"train_loss": -7.137690544128418, "global_step": 190502, "epoch": 4535} {"train_loss": -7.07598352432251, "global_step": 190503, "epoch": 4535} {"train_loss": -7.163814544677734, "global_step": 190504, "epoch": 4535} {"train_loss": -7.216188907623291, "global_step": 190505, "epoch": 4535} {"train_loss": -7.169896125793457, "global_step": 190506, "epoch": 4535} {"train_loss": -7.0619916915893555, "global_step": 190507, "epoch": 4535} {"train_loss": -7.167181015014648, "global_step": 190508, "epoch": 4535} {"train_loss": -7.031907081604004, "global_step": 190509, "epoch": 4535} {"train_loss": -7.154664993286133, "global_step": 190510, "epoch": 4535} {"train_loss": -7.160288016001384, "global_step": 190511, "epoch": 4535, "val_loss": 69534.328125} {"train_loss": -7.056257724761963, "global_step": 190512, "epoch": 4536} {"train_loss": -7.141849517822266, "global_step": 190513, "epoch": 4536} {"train_loss": -7.103703498840332, "global_step": 190514, "epoch": 4536} {"train_loss": -7.0582685470581055, "global_step": 190515, "epoch": 4536} {"train_loss": -7.076235771179199, "global_step": 190516, "epoch": 4536} {"train_loss": -7.1245036125183105, "global_step": 190517, "epoch": 4536} {"train_loss": -7.141086578369141, "global_step": 190518, "epoch": 4536} {"train_loss": -7.06765604019165, "global_step": 190519, "epoch": 4536} {"train_loss": -7.204587936401367, "global_step": 190520, "epoch": 4536} {"train_loss": -7.173986434936523, "global_step": 190521, "epoch": 4536} {"train_loss": -7.182734489440918, "global_step": 190522, "epoch": 4536} {"train_loss": -7.181933879852295, "global_step": 190523, "epoch": 4536} {"train_loss": -7.125845909118652, "global_step": 190524, "epoch": 4536} {"train_loss": -7.162489891052246, "global_step": 190525, "epoch": 4536} {"train_loss": -7.211597442626953, "global_step": 190526, "epoch": 4536} {"train_loss": -7.188559532165527, "global_step": 190527, "epoch": 4536} {"train_loss": -7.199941635131836, "global_step": 190528, "epoch": 4536} {"train_loss": -7.230134010314941, "global_step": 190529, "epoch": 4536} {"train_loss": -7.270413398742676, "global_step": 190530, "epoch": 4536} {"train_loss": -7.287349700927734, "global_step": 190531, "epoch": 4536} {"train_loss": -7.185390472412109, "global_step": 190532, "epoch": 4536} {"train_loss": -7.199872970581055, "global_step": 190533, "epoch": 4536} {"train_loss": -7.26431941986084, "global_step": 190534, "epoch": 4536} {"train_loss": -7.254553318023682, "global_step": 190535, "epoch": 4536} {"train_loss": -7.301762580871582, "global_step": 190536, "epoch": 4536} {"train_loss": -7.223824977874756, "global_step": 190537, "epoch": 4536} {"train_loss": -7.351118087768555, "global_step": 190538, "epoch": 4536} {"train_loss": -7.311400890350342, "global_step": 190539, "epoch": 4536} {"train_loss": -7.24184513092041, "global_step": 190540, "epoch": 4536} {"train_loss": -7.292201519012451, "global_step": 190541, "epoch": 4536} {"train_loss": -7.222711563110352, "global_step": 190542, "epoch": 4536} {"train_loss": -7.251396179199219, "global_step": 190543, "epoch": 4536} {"train_loss": -7.200677871704102, "global_step": 190544, "epoch": 4536} {"train_loss": -7.238842010498047, "global_step": 190545, "epoch": 4536} {"train_loss": -7.25801944732666, "global_step": 190546, "epoch": 4536} {"train_loss": -7.218255043029785, "global_step": 190547, "epoch": 4536} {"train_loss": -7.283053874969482, "global_step": 190548, "epoch": 4536} {"train_loss": -7.204388618469238, "global_step": 190549, "epoch": 4536} {"train_loss": -7.285107135772705, "global_step": 190550, "epoch": 4536} {"train_loss": -7.223440647125244, "global_step": 190551, "epoch": 4536} {"train_loss": -7.223626613616943, "global_step": 190552, "epoch": 4536} {"train_loss": -7.203828357514881, "global_step": 190553, "epoch": 4536, "val_loss": 69537.28125} {"train_loss": -7.190608024597168, "global_step": 190554, "epoch": 4537} {"train_loss": -7.295836448669434, "global_step": 190555, "epoch": 4537} {"train_loss": -7.094074249267578, "global_step": 190556, "epoch": 4537} {"train_loss": -7.205599784851074, "global_step": 190557, "epoch": 4537} {"train_loss": -7.033224105834961, "global_step": 190558, "epoch": 4537} {"train_loss": -7.080787658691406, "global_step": 190559, "epoch": 4537} {"train_loss": -7.1924638748168945, "global_step": 190560, "epoch": 4537} {"train_loss": -7.120931625366211, "global_step": 190561, "epoch": 4537} {"train_loss": -6.9118146896362305, "global_step": 190562, "epoch": 4537} {"train_loss": -7.204045295715332, "global_step": 190563, "epoch": 4537} {"train_loss": -7.140573501586914, "global_step": 190564, "epoch": 4537} {"train_loss": -7.148911952972412, "global_step": 190565, "epoch": 4537} {"train_loss": -7.130268096923828, "global_step": 190566, "epoch": 4537} {"train_loss": -7.269338607788086, "global_step": 190567, "epoch": 4537} {"train_loss": -7.227389335632324, "global_step": 190568, "epoch": 4537} {"train_loss": -7.1026716232299805, "global_step": 190569, "epoch": 4537} {"train_loss": -7.107150077819824, "global_step": 190570, "epoch": 4537} {"train_loss": -7.135787010192871, "global_step": 190571, "epoch": 4537} {"train_loss": -7.204464912414551, "global_step": 190572, "epoch": 4537} {"train_loss": -7.055787563323975, "global_step": 190573, "epoch": 4537} {"train_loss": -7.1813459396362305, "global_step": 190574, "epoch": 4537} {"train_loss": -7.185539722442627, "global_step": 190575, "epoch": 4537} {"train_loss": -7.197794437408447, "global_step": 190576, "epoch": 4537} {"train_loss": -7.210149765014648, "global_step": 190577, "epoch": 4537} {"train_loss": -7.288786888122559, "global_step": 190578, "epoch": 4537} {"train_loss": -7.180637359619141, "global_step": 190579, "epoch": 4537} {"train_loss": -7.257529258728027, "global_step": 190580, "epoch": 4537} {"train_loss": -7.196234226226807, "global_step": 190581, "epoch": 4537} {"train_loss": -7.222807884216309, "global_step": 190582, "epoch": 4537} {"train_loss": -7.268330097198486, "global_step": 190583, "epoch": 4537} {"train_loss": -7.282050132751465, "global_step": 190584, "epoch": 4537} {"train_loss": -7.19563102722168, "global_step": 190585, "epoch": 4537} {"train_loss": -7.210680961608887, "global_step": 190586, "epoch": 4537} {"train_loss": -7.252377510070801, "global_step": 190587, "epoch": 4537} {"train_loss": -7.285416603088379, "global_step": 190588, "epoch": 4537} {"train_loss": -7.233840465545654, "global_step": 190589, "epoch": 4537} {"train_loss": -7.2010650634765625, "global_step": 190590, "epoch": 4537} {"train_loss": -7.236863136291504, "global_step": 190591, "epoch": 4537} {"train_loss": -7.184626579284668, "global_step": 190592, "epoch": 4537} {"train_loss": -7.1583476066589355, "global_step": 190593, "epoch": 4537} {"train_loss": -7.226163864135742, "global_step": 190594, "epoch": 4537} {"train_loss": -7.181483155205136, "global_step": 190595, "epoch": 4537, "val_loss": 69599.359375} {"train_loss": -7.0999932289123535, "global_step": 190596, "epoch": 4538} {"train_loss": -6.984488487243652, "global_step": 190597, "epoch": 4538} {"train_loss": -7.045819282531738, "global_step": 190598, "epoch": 4538} {"train_loss": -7.228372573852539, "global_step": 190599, "epoch": 4538} {"train_loss": -7.15116024017334, "global_step": 190600, "epoch": 4538} {"train_loss": -7.1490983963012695, "global_step": 190601, "epoch": 4538} {"train_loss": -7.114035606384277, "global_step": 190602, "epoch": 4538} {"train_loss": -7.094069480895996, "global_step": 190603, "epoch": 4538} {"train_loss": -7.077495098114014, "global_step": 190604, "epoch": 4538} {"train_loss": -7.057186126708984, "global_step": 190605, "epoch": 4538} {"train_loss": -7.060340404510498, "global_step": 190606, "epoch": 4538} {"train_loss": -7.126601219177246, "global_step": 190607, "epoch": 4538} {"train_loss": -7.107254505157471, "global_step": 190608, "epoch": 4538} {"train_loss": -7.104181289672852, "global_step": 190609, "epoch": 4538} {"train_loss": -7.150258541107178, "global_step": 190610, "epoch": 4538} {"train_loss": -7.1439666748046875, "global_step": 190611, "epoch": 4538} {"train_loss": -7.191329002380371, "global_step": 190612, "epoch": 4538} {"train_loss": -7.119600296020508, "global_step": 190613, "epoch": 4538} {"train_loss": -7.207721710205078, "global_step": 190614, "epoch": 4538} {"train_loss": -7.145873069763184, "global_step": 190615, "epoch": 4538} {"train_loss": -7.171103477478027, "global_step": 190616, "epoch": 4538} {"train_loss": -7.125387191772461, "global_step": 190617, "epoch": 4538} {"train_loss": -7.159859657287598, "global_step": 190618, "epoch": 4538} {"train_loss": -7.246673583984375, "global_step": 190619, "epoch": 4538} {"train_loss": -7.108595848083496, "global_step": 190620, "epoch": 4538} {"train_loss": -7.307472229003906, "global_step": 190621, "epoch": 4538} {"train_loss": -7.093939781188965, "global_step": 190622, "epoch": 4538} {"train_loss": -7.262106895446777, "global_step": 190623, "epoch": 4538} {"train_loss": -7.219010353088379, "global_step": 190624, "epoch": 4538} {"train_loss": -7.116133689880371, "global_step": 190625, "epoch": 4538} {"train_loss": -7.076726913452148, "global_step": 190626, "epoch": 4538} {"train_loss": -7.260987758636475, "global_step": 190627, "epoch": 4538} {"train_loss": -7.214487075805664, "global_step": 190628, "epoch": 4538} {"train_loss": -7.230544090270996, "global_step": 190629, "epoch": 4538} {"train_loss": -7.28624153137207, "global_step": 190630, "epoch": 4538} {"train_loss": -7.165772438049316, "global_step": 190631, "epoch": 4538} {"train_loss": -7.326066970825195, "global_step": 190632, "epoch": 4538} {"train_loss": -7.2626190185546875, "global_step": 190633, "epoch": 4538} {"train_loss": -7.253110408782959, "global_step": 190634, "epoch": 4538} {"train_loss": -7.255819320678711, "global_step": 190635, "epoch": 4538} {"train_loss": -7.216516971588135, "global_step": 190636, "epoch": 4538} {"train_loss": -7.163101162229266, "global_step": 190637, "epoch": 4538, "val_loss": 69641.7265625} {"train_loss": -7.177391052246094, "global_step": 190638, "epoch": 4539} {"train_loss": -7.152307987213135, "global_step": 190639, "epoch": 4539} {"train_loss": -7.198848247528076, "global_step": 190640, "epoch": 4539} {"train_loss": -7.204811096191406, "global_step": 190641, "epoch": 4539} {"train_loss": -7.261787414550781, "global_step": 190642, "epoch": 4539} {"train_loss": -7.201074600219727, "global_step": 190643, "epoch": 4539} {"train_loss": -7.25510835647583, "global_step": 190644, "epoch": 4539} {"train_loss": -7.149685859680176, "global_step": 190645, "epoch": 4539} {"train_loss": -7.321746826171875, "global_step": 190646, "epoch": 4539} {"train_loss": -7.220590591430664, "global_step": 190647, "epoch": 4539} {"train_loss": -7.258193492889404, "global_step": 190648, "epoch": 4539} {"train_loss": -7.310251235961914, "global_step": 190649, "epoch": 4539} {"train_loss": -7.265227317810059, "global_step": 190650, "epoch": 4539} {"train_loss": -7.254836082458496, "global_step": 190651, "epoch": 4539} {"train_loss": -7.2780327796936035, "global_step": 190652, "epoch": 4539} {"train_loss": -7.309944152832031, "global_step": 190653, "epoch": 4539} {"train_loss": -7.29413366317749, "global_step": 190654, "epoch": 4539} {"train_loss": -7.154656887054443, "global_step": 190655, "epoch": 4539} {"train_loss": -7.232710838317871, "global_step": 190656, "epoch": 4539} {"train_loss": -7.267988681793213, "global_step": 190657, "epoch": 4539} {"train_loss": -7.427496433258057, "global_step": 190658, "epoch": 4539} {"train_loss": -7.269946098327637, "global_step": 190659, "epoch": 4539} {"train_loss": -7.104561805725098, "global_step": 190660, "epoch": 4539} {"train_loss": -7.314275741577148, "global_step": 190661, "epoch": 4539} {"train_loss": -7.3034467697143555, "global_step": 190662, "epoch": 4539} {"train_loss": -7.183696746826172, "global_step": 190663, "epoch": 4539} {"train_loss": -7.095907211303711, "global_step": 190664, "epoch": 4539} {"train_loss": -7.13733434677124, "global_step": 190665, "epoch": 4539} {"train_loss": -7.114990711212158, "global_step": 190666, "epoch": 4539} {"train_loss": -7.112528324127197, "global_step": 190667, "epoch": 4539} {"train_loss": -7.254977703094482, "global_step": 190668, "epoch": 4539} {"train_loss": -7.099100589752197, "global_step": 190669, "epoch": 4539} {"train_loss": -7.160367012023926, "global_step": 190670, "epoch": 4539} {"train_loss": -7.129179954528809, "global_step": 190671, "epoch": 4539} {"train_loss": -7.14777135848999, "global_step": 190672, "epoch": 4539} {"train_loss": -7.232036590576172, "global_step": 190673, "epoch": 4539} {"train_loss": -7.1370086669921875, "global_step": 190674, "epoch": 4539} {"train_loss": -7.227545261383057, "global_step": 190675, "epoch": 4539} {"train_loss": -7.119579315185547, "global_step": 190676, "epoch": 4539} {"train_loss": -7.254339694976807, "global_step": 190677, "epoch": 4539} {"train_loss": -7.152527809143066, "global_step": 190678, "epoch": 4539} {"train_loss": -7.2119198980785555, "global_step": 190679, "epoch": 4539, "val_loss": 69713.0625} {"train_loss": -7.1584882736206055, "global_step": 190680, "epoch": 4540} {"train_loss": -7.121053695678711, "global_step": 190681, "epoch": 4540} {"train_loss": -7.282805442810059, "global_step": 190682, "epoch": 4540} {"train_loss": -7.1344804763793945, "global_step": 190683, "epoch": 4540} {"train_loss": -7.168320655822754, "global_step": 190684, "epoch": 4540} {"train_loss": -7.237376689910889, "global_step": 190685, "epoch": 4540} {"train_loss": -7.253026008605957, "global_step": 190686, "epoch": 4540} {"train_loss": -7.225017547607422, "global_step": 190687, "epoch": 4540} {"train_loss": -7.278243064880371, "global_step": 190688, "epoch": 4540} {"train_loss": -7.189467906951904, "global_step": 190689, "epoch": 4540} {"train_loss": -7.145462989807129, "global_step": 190690, "epoch": 4540} {"train_loss": -7.1255269050598145, "global_step": 190691, "epoch": 4540} {"train_loss": -7.128663539886475, "global_step": 190692, "epoch": 4540} {"train_loss": -7.118049621582031, "global_step": 190693, "epoch": 4540} {"train_loss": -7.183455467224121, "global_step": 190694, "epoch": 4540} {"train_loss": -7.192039966583252, "global_step": 190695, "epoch": 4540} {"train_loss": -7.0942583084106445, "global_step": 190696, "epoch": 4540} {"train_loss": -7.127194404602051, "global_step": 190697, "epoch": 4540} {"train_loss": -7.201035976409912, "global_step": 190698, "epoch": 4540} {"train_loss": -7.163819313049316, "global_step": 190699, "epoch": 4540} {"train_loss": -7.193369388580322, "global_step": 190700, "epoch": 4540} {"train_loss": -7.182145595550537, "global_step": 190701, "epoch": 4540} {"train_loss": -7.164472579956055, "global_step": 190702, "epoch": 4540} {"train_loss": -7.237593650817871, "global_step": 190703, "epoch": 4540} {"train_loss": -7.229970932006836, "global_step": 190704, "epoch": 4540} {"train_loss": -7.205321788787842, "global_step": 190705, "epoch": 4540} {"train_loss": -6.96341609954834, "global_step": 190706, "epoch": 4540} {"train_loss": -7.18271541595459, "global_step": 190707, "epoch": 4540} {"train_loss": -7.000439643859863, "global_step": 190708, "epoch": 4540} {"train_loss": -7.089705944061279, "global_step": 190709, "epoch": 4540} {"train_loss": -7.117647171020508, "global_step": 190710, "epoch": 4540} {"train_loss": -7.049508094787598, "global_step": 190711, "epoch": 4540} {"train_loss": -7.207953453063965, "global_step": 190712, "epoch": 4540} {"train_loss": -7.044041633605957, "global_step": 190713, "epoch": 4540} {"train_loss": -7.053640365600586, "global_step": 190714, "epoch": 4540} {"train_loss": -7.182853698730469, "global_step": 190715, "epoch": 4540} {"train_loss": -7.086813449859619, "global_step": 190716, "epoch": 4540} {"train_loss": -7.141132354736328, "global_step": 190717, "epoch": 4540} {"train_loss": -7.190199375152588, "global_step": 190718, "epoch": 4540} {"train_loss": -7.151625633239746, "global_step": 190719, "epoch": 4540} {"train_loss": -7.207624435424805, "global_step": 190720, "epoch": 4540} {"train_loss": -7.1570594764891124, "global_step": 190721, "epoch": 4540, "val_loss": 69485.96875} {"train_loss": -7.166630744934082, "global_step": 190722, "epoch": 4541} {"train_loss": -7.214953422546387, "global_step": 190723, "epoch": 4541} {"train_loss": -7.247771263122559, "global_step": 190724, "epoch": 4541} {"train_loss": -7.132638931274414, "global_step": 190725, "epoch": 4541} {"train_loss": -7.185839653015137, "global_step": 190726, "epoch": 4541} {"train_loss": -7.271083354949951, "global_step": 190727, "epoch": 4541} {"train_loss": -7.228503704071045, "global_step": 190728, "epoch": 4541} {"train_loss": -7.2800092697143555, "global_step": 190729, "epoch": 4541} {"train_loss": -7.160080909729004, "global_step": 190730, "epoch": 4541} {"train_loss": -7.32326602935791, "global_step": 190731, "epoch": 4541} {"train_loss": -7.3013176918029785, "global_step": 190732, "epoch": 4541} {"train_loss": -7.189662456512451, "global_step": 190733, "epoch": 4541} {"train_loss": -7.251850605010986, "global_step": 190734, "epoch": 4541} {"train_loss": -7.266561508178711, "global_step": 190735, "epoch": 4541} {"train_loss": -7.251060485839844, "global_step": 190736, "epoch": 4541} {"train_loss": -7.318493843078613, "global_step": 190737, "epoch": 4541} {"train_loss": -7.1833953857421875, "global_step": 190738, "epoch": 4541} {"train_loss": -7.259488105773926, "global_step": 190739, "epoch": 4541} {"train_loss": -7.309737205505371, "global_step": 190740, "epoch": 4541} {"train_loss": -7.2965826988220215, "global_step": 190741, "epoch": 4541} {"train_loss": -7.182849884033203, "global_step": 190742, "epoch": 4541} {"train_loss": -7.222493648529053, "global_step": 190743, "epoch": 4541} {"train_loss": -7.1026225090026855, "global_step": 190744, "epoch": 4541} {"train_loss": -7.185227394104004, "global_step": 190745, "epoch": 4541} {"train_loss": -7.182328224182129, "global_step": 190746, "epoch": 4541} {"train_loss": -7.087268352508545, "global_step": 190747, "epoch": 4541} {"train_loss": -7.2295308113098145, "global_step": 190748, "epoch": 4541} {"train_loss": -7.183940887451172, "global_step": 190749, "epoch": 4541} {"train_loss": -7.147040843963623, "global_step": 190750, "epoch": 4541} {"train_loss": -7.159925937652588, "global_step": 190751, "epoch": 4541} {"train_loss": -7.115862846374512, "global_step": 190752, "epoch": 4541} {"train_loss": -6.867746829986572, "global_step": 190753, "epoch": 4541} {"train_loss": -7.28661584854126, "global_step": 190754, "epoch": 4541} {"train_loss": -7.120123863220215, "global_step": 190755, "epoch": 4541} {"train_loss": -6.921451568603516, "global_step": 190756, "epoch": 4541} {"train_loss": -7.064417362213135, "global_step": 190757, "epoch": 4541} {"train_loss": -7.129087448120117, "global_step": 190758, "epoch": 4541} {"train_loss": -7.022805213928223, "global_step": 190759, "epoch": 4541} {"train_loss": -7.093111991882324, "global_step": 190760, "epoch": 4541} {"train_loss": -7.056279182434082, "global_step": 190761, "epoch": 4541} {"train_loss": -7.0653791427612305, "global_step": 190762, "epoch": 4541} {"train_loss": -7.171175343649728, "global_step": 190763, "epoch": 4541, "val_loss": 69638.7890625} {"train_loss": -7.0867462158203125, "global_step": 190764, "epoch": 4542} {"train_loss": -7.165331840515137, "global_step": 190765, "epoch": 4542} {"train_loss": -7.163079738616943, "global_step": 190766, "epoch": 4542} {"train_loss": -7.128837585449219, "global_step": 190767, "epoch": 4542} {"train_loss": -7.047111511230469, "global_step": 190768, "epoch": 4542} {"train_loss": -7.066518783569336, "global_step": 190769, "epoch": 4542} {"train_loss": -7.049571990966797, "global_step": 190770, "epoch": 4542} {"train_loss": -7.250094890594482, "global_step": 190771, "epoch": 4542} {"train_loss": -7.098334789276123, "global_step": 190772, "epoch": 4542} {"train_loss": -7.040694713592529, "global_step": 190773, "epoch": 4542} {"train_loss": -7.195074558258057, "global_step": 190774, "epoch": 4542} {"train_loss": -7.138688564300537, "global_step": 190775, "epoch": 4542} {"train_loss": -7.171400547027588, "global_step": 190776, "epoch": 4542} {"train_loss": -7.180302619934082, "global_step": 190777, "epoch": 4542} {"train_loss": -7.169424057006836, "global_step": 190778, "epoch": 4542} {"train_loss": -7.093524932861328, "global_step": 190779, "epoch": 4542} {"train_loss": -7.147127151489258, "global_step": 190780, "epoch": 4542} {"train_loss": -7.210325241088867, "global_step": 190781, "epoch": 4542} {"train_loss": -7.273408889770508, "global_step": 190782, "epoch": 4542} {"train_loss": -7.216962814331055, "global_step": 190783, "epoch": 4542} {"train_loss": -7.160454750061035, "global_step": 190784, "epoch": 4542} {"train_loss": -7.226515769958496, "global_step": 190785, "epoch": 4542} {"train_loss": -7.282229900360107, "global_step": 190786, "epoch": 4542} {"train_loss": -7.204032897949219, "global_step": 190787, "epoch": 4542} {"train_loss": -7.118436813354492, "global_step": 190788, "epoch": 4542} {"train_loss": -7.166888236999512, "global_step": 190789, "epoch": 4542} {"train_loss": -7.220536231994629, "global_step": 190790, "epoch": 4542} {"train_loss": -7.198390007019043, "global_step": 190791, "epoch": 4542} {"train_loss": -7.278415679931641, "global_step": 190792, "epoch": 4542} {"train_loss": -7.216505527496338, "global_step": 190793, "epoch": 4542} {"train_loss": -7.258047580718994, "global_step": 190794, "epoch": 4542} {"train_loss": -7.289997577667236, "global_step": 190795, "epoch": 4542} {"train_loss": -7.324792861938477, "global_step": 190796, "epoch": 4542} {"train_loss": -7.302209854125977, "global_step": 190797, "epoch": 4542} {"train_loss": -7.288108825683594, "global_step": 190798, "epoch": 4542} {"train_loss": -7.183650016784668, "global_step": 190799, "epoch": 4542} {"train_loss": -7.373990058898926, "global_step": 190800, "epoch": 4542} {"train_loss": -7.271651268005371, "global_step": 190801, "epoch": 4542} {"train_loss": -7.297762393951416, "global_step": 190802, "epoch": 4542} {"train_loss": -7.170127868652344, "global_step": 190803, "epoch": 4542} {"train_loss": -7.3230414390563965, "global_step": 190804, "epoch": 4542} {"train_loss": -7.199796040852864, "global_step": 190805, "epoch": 4542, "val_loss": 69553.390625} {"train_loss": -7.2612175941467285, "global_step": 190806, "epoch": 4543} {"train_loss": -7.320927619934082, "global_step": 190807, "epoch": 4543} {"train_loss": -7.2938618659973145, "global_step": 190808, "epoch": 4543} {"train_loss": -7.179210186004639, "global_step": 190809, "epoch": 4543} {"train_loss": -7.206401824951172, "global_step": 190810, "epoch": 4543} {"train_loss": -7.22926139831543, "global_step": 190811, "epoch": 4543} {"train_loss": -7.221278190612793, "global_step": 190812, "epoch": 4543} {"train_loss": -7.203990459442139, "global_step": 190813, "epoch": 4543} {"train_loss": -7.368887901306152, "global_step": 190814, "epoch": 4543} {"train_loss": -7.206920623779297, "global_step": 190815, "epoch": 4543} {"train_loss": -7.257986068725586, "global_step": 190816, "epoch": 4543} {"train_loss": -7.205291271209717, "global_step": 190817, "epoch": 4543} {"train_loss": -7.196347713470459, "global_step": 190818, "epoch": 4543} {"train_loss": -7.084532737731934, "global_step": 190819, "epoch": 4543} {"train_loss": -7.230875015258789, "global_step": 190820, "epoch": 4543} {"train_loss": -7.105545520782471, "global_step": 190821, "epoch": 4543} {"train_loss": -7.229852676391602, "global_step": 190822, "epoch": 4543} {"train_loss": -7.156516075134277, "global_step": 190823, "epoch": 4543} {"train_loss": -7.147277355194092, "global_step": 190824, "epoch": 4543} {"train_loss": -7.070368766784668, "global_step": 190825, "epoch": 4543} {"train_loss": -7.230377197265625, "global_step": 190826, "epoch": 4543} {"train_loss": -7.246009349822998, "global_step": 190827, "epoch": 4543} {"train_loss": -7.147742748260498, "global_step": 190828, "epoch": 4543} {"train_loss": -7.0380144119262695, "global_step": 190829, "epoch": 4543} {"train_loss": -7.188467979431152, "global_step": 190830, "epoch": 4543} {"train_loss": -7.144989490509033, "global_step": 190831, "epoch": 4543} {"train_loss": -7.144430637359619, "global_step": 190832, "epoch": 4543} {"train_loss": -7.203155517578125, "global_step": 190833, "epoch": 4543} {"train_loss": -7.0836181640625, "global_step": 190834, "epoch": 4543} {"train_loss": -7.172809600830078, "global_step": 190835, "epoch": 4543} {"train_loss": -7.177522659301758, "global_step": 190836, "epoch": 4543} {"train_loss": -7.222285270690918, "global_step": 190837, "epoch": 4543} {"train_loss": -7.143336772918701, "global_step": 190838, "epoch": 4543} {"train_loss": -7.07405948638916, "global_step": 190839, "epoch": 4543} {"train_loss": -7.220006465911865, "global_step": 190840, "epoch": 4543} {"train_loss": -6.9880452156066895, "global_step": 190841, "epoch": 4543} {"train_loss": -7.2012810707092285, "global_step": 190842, "epoch": 4543} {"train_loss": -7.205809116363525, "global_step": 190843, "epoch": 4543} {"train_loss": -7.132543563842773, "global_step": 190844, "epoch": 4543} {"train_loss": -7.170391082763672, "global_step": 190845, "epoch": 4543} {"train_loss": -7.232354164123535, "global_step": 190846, "epoch": 4543} {"train_loss": -7.181485811869304, "global_step": 190847, "epoch": 4543, "val_loss": 69739.4375} {"train_loss": -7.18459415435791, "global_step": 190848, "epoch": 4544} {"train_loss": -7.011416912078857, "global_step": 190849, "epoch": 4544} {"train_loss": -7.096923351287842, "global_step": 190850, "epoch": 4544} {"train_loss": -7.161883354187012, "global_step": 190851, "epoch": 4544} {"train_loss": -7.103906631469727, "global_step": 190852, "epoch": 4544} {"train_loss": -7.111545085906982, "global_step": 190853, "epoch": 4544} {"train_loss": -7.204216480255127, "global_step": 190854, "epoch": 4544} {"train_loss": -7.132131099700928, "global_step": 190855, "epoch": 4544} {"train_loss": -7.126593589782715, "global_step": 190856, "epoch": 4544} {"train_loss": -7.108808994293213, "global_step": 190857, "epoch": 4544} {"train_loss": -6.890985488891602, "global_step": 190858, "epoch": 4544} {"train_loss": -7.069976806640625, "global_step": 190859, "epoch": 4544} {"train_loss": -7.103126049041748, "global_step": 190860, "epoch": 4544} {"train_loss": -6.941327095031738, "global_step": 190861, "epoch": 4544} {"train_loss": -7.148612022399902, "global_step": 190862, "epoch": 4544} {"train_loss": -7.0278167724609375, "global_step": 190863, "epoch": 4544} {"train_loss": -7.055092811584473, "global_step": 190864, "epoch": 4544} {"train_loss": -7.083532810211182, "global_step": 190865, "epoch": 4544} {"train_loss": -7.176753997802734, "global_step": 190866, "epoch": 4544} {"train_loss": -7.094720840454102, "global_step": 190867, "epoch": 4544} {"train_loss": -7.151932716369629, "global_step": 190868, "epoch": 4544} {"train_loss": -7.210331916809082, "global_step": 190869, "epoch": 4544} {"train_loss": -7.1393537521362305, "global_step": 190870, "epoch": 4544} {"train_loss": -7.158042907714844, "global_step": 190871, "epoch": 4544} {"train_loss": -7.170502662658691, "global_step": 190872, "epoch": 4544} {"train_loss": -7.219442367553711, "global_step": 190873, "epoch": 4544} {"train_loss": -7.1615190505981445, "global_step": 190874, "epoch": 4544} {"train_loss": -7.13688850402832, "global_step": 190875, "epoch": 4544} {"train_loss": -7.074130058288574, "global_step": 190876, "epoch": 4544} {"train_loss": -7.12994384765625, "global_step": 190877, "epoch": 4544} {"train_loss": -7.033002853393555, "global_step": 190878, "epoch": 4544} {"train_loss": -7.226238250732422, "global_step": 190879, "epoch": 4544} {"train_loss": -7.141103267669678, "global_step": 190880, "epoch": 4544} {"train_loss": -7.064240455627441, "global_step": 190881, "epoch": 4544} {"train_loss": -7.204913139343262, "global_step": 190882, "epoch": 4544} {"train_loss": -7.148935317993164, "global_step": 190883, "epoch": 4544} {"train_loss": -7.0697102546691895, "global_step": 190884, "epoch": 4544} {"train_loss": -7.10490083694458, "global_step": 190885, "epoch": 4544} {"train_loss": -7.174798965454102, "global_step": 190886, "epoch": 4544} {"train_loss": -7.107784271240234, "global_step": 190887, "epoch": 4544} {"train_loss": -7.218452453613281, "global_step": 190888, "epoch": 4544} {"train_loss": -7.120277336665562, "global_step": 190889, "epoch": 4544, "val_loss": 69553.9140625} {"train_loss": -7.231297492980957, "global_step": 190890, "epoch": 4545} {"train_loss": -7.2343244552612305, "global_step": 190891, "epoch": 4545} {"train_loss": -7.205222129821777, "global_step": 190892, "epoch": 4545} {"train_loss": -7.272822856903076, "global_step": 190893, "epoch": 4545} {"train_loss": -7.296346187591553, "global_step": 190894, "epoch": 4545} {"train_loss": -7.233963489532471, "global_step": 190895, "epoch": 4545} {"train_loss": -7.232943534851074, "global_step": 190896, "epoch": 4545} {"train_loss": -7.193472862243652, "global_step": 190897, "epoch": 4545} {"train_loss": -7.3220953941345215, "global_step": 190898, "epoch": 4545} {"train_loss": -7.239357948303223, "global_step": 190899, "epoch": 4545} {"train_loss": -7.2731122970581055, "global_step": 190900, "epoch": 4545} {"train_loss": -7.175013542175293, "global_step": 190901, "epoch": 4545} {"train_loss": -7.2205491065979, "global_step": 190902, "epoch": 4545} {"train_loss": -7.221175670623779, "global_step": 190903, "epoch": 4545} {"train_loss": -7.307657241821289, "global_step": 190904, "epoch": 4545} {"train_loss": -7.216547012329102, "global_step": 190905, "epoch": 4545} {"train_loss": -7.315805435180664, "global_step": 190906, "epoch": 4545} {"train_loss": -7.292820453643799, "global_step": 190907, "epoch": 4545} {"train_loss": -7.2531657218933105, "global_step": 190908, "epoch": 4545} {"train_loss": -7.224887847900391, "global_step": 190909, "epoch": 4545} {"train_loss": -7.2587480545043945, "global_step": 190910, "epoch": 4545} {"train_loss": -7.2038421630859375, "global_step": 190911, "epoch": 4545} {"train_loss": -7.269059658050537, "global_step": 190912, "epoch": 4545} {"train_loss": -7.198217391967773, "global_step": 190913, "epoch": 4545} {"train_loss": -7.267236709594727, "global_step": 190914, "epoch": 4545} {"train_loss": -7.254533767700195, "global_step": 190915, "epoch": 4545} {"train_loss": -7.359325885772705, "global_step": 190916, "epoch": 4545} {"train_loss": -7.2851409912109375, "global_step": 190917, "epoch": 4545} {"train_loss": -7.2276740074157715, "global_step": 190918, "epoch": 4545} {"train_loss": -7.2276082038879395, "global_step": 190919, "epoch": 4545} {"train_loss": -7.248508453369141, "global_step": 190920, "epoch": 4545} {"train_loss": -7.22540283203125, "global_step": 190921, "epoch": 4545} {"train_loss": -7.17143440246582, "global_step": 190922, "epoch": 4545} {"train_loss": -7.294253826141357, "global_step": 190923, "epoch": 4545} {"train_loss": -7.157758712768555, "global_step": 190924, "epoch": 4545} {"train_loss": -7.260320663452148, "global_step": 190925, "epoch": 4545} {"train_loss": -7.153300762176514, "global_step": 190926, "epoch": 4545} {"train_loss": -7.213967323303223, "global_step": 190927, "epoch": 4545} {"train_loss": -7.204696178436279, "global_step": 190928, "epoch": 4545} {"train_loss": -7.161684989929199, "global_step": 190929, "epoch": 4545} {"train_loss": -7.100861072540283, "global_step": 190930, "epoch": 4545} {"train_loss": -7.236564284279233, "global_step": 190931, "epoch": 4545, "val_loss": 69591.859375} {"train_loss": -7.0875043869018555, "global_step": 190932, "epoch": 4546} {"train_loss": -7.192044258117676, "global_step": 190933, "epoch": 4546} {"train_loss": -7.2439680099487305, "global_step": 190934, "epoch": 4546} {"train_loss": -7.104481220245361, "global_step": 190935, "epoch": 4546} {"train_loss": -7.062322616577148, "global_step": 190936, "epoch": 4546} {"train_loss": -7.233212947845459, "global_step": 190937, "epoch": 4546} {"train_loss": -7.179337978363037, "global_step": 190938, "epoch": 4546} {"train_loss": -7.096981048583984, "global_step": 190939, "epoch": 4546} {"train_loss": -7.011081695556641, "global_step": 190940, "epoch": 4546} {"train_loss": -7.221425533294678, "global_step": 190941, "epoch": 4546} {"train_loss": -7.00938606262207, "global_step": 190942, "epoch": 4546} {"train_loss": -7.132415294647217, "global_step": 190943, "epoch": 4546} {"train_loss": -7.195484161376953, "global_step": 190944, "epoch": 4546} {"train_loss": -7.18776798248291, "global_step": 190945, "epoch": 4546} {"train_loss": -7.2079925537109375, "global_step": 190946, "epoch": 4546} {"train_loss": -7.277358055114746, "global_step": 190947, "epoch": 4546} {"train_loss": -7.244619846343994, "global_step": 190948, "epoch": 4546} {"train_loss": -7.281190872192383, "global_step": 190949, "epoch": 4546} {"train_loss": -7.2384934425354, "global_step": 190950, "epoch": 4546} {"train_loss": -7.317058563232422, "global_step": 190951, "epoch": 4546} {"train_loss": -7.235024452209473, "global_step": 190952, "epoch": 4546} {"train_loss": -7.238298416137695, "global_step": 190953, "epoch": 4546} {"train_loss": -7.272771835327148, "global_step": 190954, "epoch": 4546} {"train_loss": -7.196529388427734, "global_step": 190955, "epoch": 4546} {"train_loss": -7.095111846923828, "global_step": 190956, "epoch": 4546} {"train_loss": -7.224989414215088, "global_step": 190957, "epoch": 4546} {"train_loss": -7.114134788513184, "global_step": 190958, "epoch": 4546} {"train_loss": -7.155229568481445, "global_step": 190959, "epoch": 4546} {"train_loss": -7.248377799987793, "global_step": 190960, "epoch": 4546} {"train_loss": -7.195917129516602, "global_step": 190961, "epoch": 4546} {"train_loss": -7.1522393226623535, "global_step": 190962, "epoch": 4546} {"train_loss": -7.208156585693359, "global_step": 190963, "epoch": 4546} {"train_loss": -7.208066463470459, "global_step": 190964, "epoch": 4546} {"train_loss": -7.2366132736206055, "global_step": 190965, "epoch": 4546} {"train_loss": -7.171591758728027, "global_step": 190966, "epoch": 4546} {"train_loss": -7.353681564331055, "global_step": 190967, "epoch": 4546} {"train_loss": -7.289175033569336, "global_step": 190968, "epoch": 4546} {"train_loss": -7.334151268005371, "global_step": 190969, "epoch": 4546} {"train_loss": -7.214308738708496, "global_step": 190970, "epoch": 4546} {"train_loss": -7.191488742828369, "global_step": 190971, "epoch": 4546} {"train_loss": -7.283692359924316, "global_step": 190972, "epoch": 4546} {"train_loss": -7.201762755711873, "global_step": 190973, "epoch": 4546, "val_loss": 69575.5625} {"train_loss": -7.367241382598877, "global_step": 190974, "epoch": 4547} {"train_loss": -7.184117317199707, "global_step": 190975, "epoch": 4547} {"train_loss": -7.383151531219482, "global_step": 190976, "epoch": 4547} {"train_loss": -7.1985979080200195, "global_step": 190977, "epoch": 4547} {"train_loss": -7.13353157043457, "global_step": 190978, "epoch": 4547} {"train_loss": -7.301383972167969, "global_step": 190979, "epoch": 4547} {"train_loss": -7.228283882141113, "global_step": 190980, "epoch": 4547} {"train_loss": -7.25906229019165, "global_step": 190981, "epoch": 4547} {"train_loss": -7.17864990234375, "global_step": 190982, "epoch": 4547} {"train_loss": -7.255201816558838, "global_step": 190983, "epoch": 4547} {"train_loss": -7.3592119216918945, "global_step": 190984, "epoch": 4547} {"train_loss": -7.326951026916504, "global_step": 190985, "epoch": 4547} {"train_loss": -7.288207530975342, "global_step": 190986, "epoch": 4547} {"train_loss": -7.409052848815918, "global_step": 190987, "epoch": 4547} {"train_loss": -7.207474708557129, "global_step": 190988, "epoch": 4547} {"train_loss": -7.262763977050781, "global_step": 190989, "epoch": 4547} {"train_loss": -7.174343585968018, "global_step": 190990, "epoch": 4547} {"train_loss": -7.103790283203125, "global_step": 190991, "epoch": 4547} {"train_loss": -6.897710800170898, "global_step": 190992, "epoch": 4547} {"train_loss": -7.197646141052246, "global_step": 190993, "epoch": 4547} {"train_loss": -6.987677574157715, "global_step": 190994, "epoch": 4547} {"train_loss": -7.125626087188721, "global_step": 190995, "epoch": 4547} {"train_loss": -7.285713195800781, "global_step": 190996, "epoch": 4547} {"train_loss": -7.212318420410156, "global_step": 190997, "epoch": 4547} {"train_loss": -7.187774181365967, "global_step": 190998, "epoch": 4547} {"train_loss": -7.199438571929932, "global_step": 190999, "epoch": 4547} {"train_loss": -7.132059574127197, "global_step": 191000, "epoch": 4547} {"train_loss": -7.139639854431152, "global_step": 191001, "epoch": 4547} {"train_loss": -7.177639007568359, "global_step": 191002, "epoch": 4547} {"train_loss": -7.188436508178711, "global_step": 191003, "epoch": 4547} {"train_loss": -7.155120849609375, "global_step": 191004, "epoch": 4547} {"train_loss": -7.172289848327637, "global_step": 191005, "epoch": 4547} {"train_loss": -7.249789714813232, "global_step": 191006, "epoch": 4547} {"train_loss": -7.2210307121276855, "global_step": 191007, "epoch": 4547} {"train_loss": -7.1773576736450195, "global_step": 191008, "epoch": 4547} {"train_loss": -7.156702041625977, "global_step": 191009, "epoch": 4547} {"train_loss": -7.34218692779541, "global_step": 191010, "epoch": 4547} {"train_loss": -7.112253189086914, "global_step": 191011, "epoch": 4547} {"train_loss": -7.315258979797363, "global_step": 191012, "epoch": 4547} {"train_loss": -7.257858753204346, "global_step": 191013, "epoch": 4547} {"train_loss": -7.203364849090576, "global_step": 191014, "epoch": 4547} {"train_loss": -7.212361789885021, "global_step": 191015, "epoch": 4547, "val_loss": 69621.8359375} {"train_loss": -7.364729404449463, "global_step": 191016, "epoch": 4548} {"train_loss": -7.234347343444824, "global_step": 191017, "epoch": 4548} {"train_loss": -7.237335205078125, "global_step": 191018, "epoch": 4548} {"train_loss": -7.2295074462890625, "global_step": 191019, "epoch": 4548} {"train_loss": -7.233004570007324, "global_step": 191020, "epoch": 4548} {"train_loss": -7.161215782165527, "global_step": 191021, "epoch": 4548} {"train_loss": -7.230623245239258, "global_step": 191022, "epoch": 4548} {"train_loss": -7.19029426574707, "global_step": 191023, "epoch": 4548} {"train_loss": -7.1699419021606445, "global_step": 191024, "epoch": 4548} {"train_loss": -7.194570064544678, "global_step": 191025, "epoch": 4548} {"train_loss": -7.291414260864258, "global_step": 191026, "epoch": 4548} {"train_loss": -7.260475158691406, "global_step": 191027, "epoch": 4548} {"train_loss": -7.317509651184082, "global_step": 191028, "epoch": 4548} {"train_loss": -7.252897262573242, "global_step": 191029, "epoch": 4548} {"train_loss": -7.268190860748291, "global_step": 191030, "epoch": 4548} {"train_loss": -7.1343793869018555, "global_step": 191031, "epoch": 4548} {"train_loss": -7.201376914978027, "global_step": 191032, "epoch": 4548} {"train_loss": -7.236668586730957, "global_step": 191033, "epoch": 4548} {"train_loss": -7.258393287658691, "global_step": 191034, "epoch": 4548} {"train_loss": -7.193352699279785, "global_step": 191035, "epoch": 4548} {"train_loss": -7.1172637939453125, "global_step": 191036, "epoch": 4548} {"train_loss": -7.431437015533447, "global_step": 191037, "epoch": 4548} {"train_loss": -7.191592693328857, "global_step": 191038, "epoch": 4548} {"train_loss": -7.251289367675781, "global_step": 191039, "epoch": 4548} {"train_loss": -7.194242477416992, "global_step": 191040, "epoch": 4548} {"train_loss": -7.248898506164551, "global_step": 191041, "epoch": 4548} {"train_loss": -7.272371768951416, "global_step": 191042, "epoch": 4548} {"train_loss": -7.237008571624756, "global_step": 191043, "epoch": 4548} {"train_loss": -7.222438335418701, "global_step": 191044, "epoch": 4548} {"train_loss": -7.113498687744141, "global_step": 191045, "epoch": 4548} {"train_loss": -7.203974723815918, "global_step": 191046, "epoch": 4548} {"train_loss": -7.316549301147461, "global_step": 191047, "epoch": 4548} {"train_loss": -7.135401725769043, "global_step": 191048, "epoch": 4548} {"train_loss": -7.1556878089904785, "global_step": 191049, "epoch": 4548} {"train_loss": -7.134338855743408, "global_step": 191050, "epoch": 4548} {"train_loss": -7.258722305297852, "global_step": 191051, "epoch": 4548} {"train_loss": -7.182781219482422, "global_step": 191052, "epoch": 4548} {"train_loss": -7.257419586181641, "global_step": 191053, "epoch": 4548} {"train_loss": -7.1519775390625, "global_step": 191054, "epoch": 4548} {"train_loss": -7.031346797943115, "global_step": 191055, "epoch": 4548} {"train_loss": -7.111057281494141, "global_step": 191056, "epoch": 4548} {"train_loss": -7.216948168618338, "global_step": 191057, "epoch": 4548, "val_loss": 69614.375} {"train_loss": -7.168802261352539, "global_step": 191058, "epoch": 4549} {"train_loss": -7.2987518310546875, "global_step": 191059, "epoch": 4549} {"train_loss": -7.066206932067871, "global_step": 191060, "epoch": 4549} {"train_loss": -7.1442155838012695, "global_step": 191061, "epoch": 4549} {"train_loss": -7.2015485763549805, "global_step": 191062, "epoch": 4549} {"train_loss": -7.215911865234375, "global_step": 191063, "epoch": 4549} {"train_loss": -7.179557800292969, "global_step": 191064, "epoch": 4549} {"train_loss": -7.27130651473999, "global_step": 191065, "epoch": 4549} {"train_loss": -7.162845611572266, "global_step": 191066, "epoch": 4549} {"train_loss": -7.127280235290527, "global_step": 191067, "epoch": 4549} {"train_loss": -7.174962043762207, "global_step": 191068, "epoch": 4549} {"train_loss": -7.188920497894287, "global_step": 191069, "epoch": 4549} {"train_loss": -7.174273490905762, "global_step": 191070, "epoch": 4549} {"train_loss": -7.113051414489746, "global_step": 191071, "epoch": 4549} {"train_loss": -7.226480484008789, "global_step": 191072, "epoch": 4549} {"train_loss": -7.082927703857422, "global_step": 191073, "epoch": 4549} {"train_loss": -7.191982269287109, "global_step": 191074, "epoch": 4549} {"train_loss": -7.148908615112305, "global_step": 191075, "epoch": 4549} {"train_loss": -7.113321781158447, "global_step": 191076, "epoch": 4549} {"train_loss": -6.949001789093018, "global_step": 191077, "epoch": 4549} {"train_loss": -7.114201545715332, "global_step": 191078, "epoch": 4549} {"train_loss": -7.01151704788208, "global_step": 191079, "epoch": 4549} {"train_loss": -6.998600959777832, "global_step": 191080, "epoch": 4549} {"train_loss": -7.0565667152404785, "global_step": 191081, "epoch": 4549} {"train_loss": -7.033259391784668, "global_step": 191082, "epoch": 4549} {"train_loss": -6.9230194091796875, "global_step": 191083, "epoch": 4549} {"train_loss": -7.089120864868164, "global_step": 191084, "epoch": 4549} {"train_loss": -6.982979774475098, "global_step": 191085, "epoch": 4549} {"train_loss": -6.955625534057617, "global_step": 191086, "epoch": 4549} {"train_loss": -7.109107971191406, "global_step": 191087, "epoch": 4549} {"train_loss": -7.070904731750488, "global_step": 191088, "epoch": 4549} {"train_loss": -7.099617958068848, "global_step": 191089, "epoch": 4549} {"train_loss": -7.047083854675293, "global_step": 191090, "epoch": 4549} {"train_loss": -7.073760509490967, "global_step": 191091, "epoch": 4549} {"train_loss": -7.05885124206543, "global_step": 191092, "epoch": 4549} {"train_loss": -7.112356185913086, "global_step": 191093, "epoch": 4549} {"train_loss": -6.959766864776611, "global_step": 191094, "epoch": 4549} {"train_loss": -7.2373247146606445, "global_step": 191095, "epoch": 4549} {"train_loss": -7.000421524047852, "global_step": 191096, "epoch": 4549} {"train_loss": -7.195789813995361, "global_step": 191097, "epoch": 4549} {"train_loss": -7.130610466003418, "global_step": 191098, "epoch": 4549} {"train_loss": -7.110204991840181, "global_step": 191099, "epoch": 4549, "val_loss": 69674.609375} {"train_loss": -7.1138763427734375, "global_step": 191100, "epoch": 4550} {"train_loss": -7.149830341339111, "global_step": 191101, "epoch": 4550} {"train_loss": -7.15596866607666, "global_step": 191102, "epoch": 4550} {"train_loss": -7.091843605041504, "global_step": 191103, "epoch": 4550} {"train_loss": -7.192580223083496, "global_step": 191104, "epoch": 4550} {"train_loss": -7.149301528930664, "global_step": 191105, "epoch": 4550} {"train_loss": -7.1572723388671875, "global_step": 191106, "epoch": 4550} {"train_loss": -7.160280227661133, "global_step": 191107, "epoch": 4550} {"train_loss": -7.1781463623046875, "global_step": 191108, "epoch": 4550} {"train_loss": -7.176262855529785, "global_step": 191109, "epoch": 4550} {"train_loss": -7.1335649490356445, "global_step": 191110, "epoch": 4550} {"train_loss": -7.219420433044434, "global_step": 191111, "epoch": 4550} {"train_loss": -7.167437553405762, "global_step": 191112, "epoch": 4550} {"train_loss": -7.202929973602295, "global_step": 191113, "epoch": 4550} {"train_loss": -7.157838821411133, "global_step": 191114, "epoch": 4550} {"train_loss": -7.142045974731445, "global_step": 191115, "epoch": 4550} {"train_loss": -7.176703453063965, "global_step": 191116, "epoch": 4550} {"train_loss": -7.149205684661865, "global_step": 191117, "epoch": 4550} {"train_loss": -7.148138999938965, "global_step": 191118, "epoch": 4550} {"train_loss": -7.195705413818359, "global_step": 191119, "epoch": 4550} {"train_loss": -7.234340667724609, "global_step": 191120, "epoch": 4550} {"train_loss": -7.12888240814209, "global_step": 191121, "epoch": 4550} {"train_loss": -7.163484573364258, "global_step": 191122, "epoch": 4550} {"train_loss": -7.217236042022705, "global_step": 191123, "epoch": 4550} {"train_loss": -7.061341285705566, "global_step": 191124, "epoch": 4550} {"train_loss": -7.261826515197754, "global_step": 191125, "epoch": 4550} {"train_loss": -7.1814374923706055, "global_step": 191126, "epoch": 4550} {"train_loss": -7.226940631866455, "global_step": 191127, "epoch": 4550} {"train_loss": -7.257195949554443, "global_step": 191128, "epoch": 4550} {"train_loss": -7.242475509643555, "global_step": 191129, "epoch": 4550} {"train_loss": -7.103338241577148, "global_step": 191130, "epoch": 4550} {"train_loss": -7.122518062591553, "global_step": 191131, "epoch": 4550} {"train_loss": -7.191697120666504, "global_step": 191132, "epoch": 4550} {"train_loss": -7.188864707946777, "global_step": 191133, "epoch": 4550} {"train_loss": -7.2889556884765625, "global_step": 191134, "epoch": 4550} {"train_loss": -7.167336463928223, "global_step": 191135, "epoch": 4550} {"train_loss": -7.315475940704346, "global_step": 191136, "epoch": 4550} {"train_loss": -7.199407577514648, "global_step": 191137, "epoch": 4550} {"train_loss": -7.119819641113281, "global_step": 191138, "epoch": 4550} {"train_loss": -7.298406600952148, "global_step": 191139, "epoch": 4550} {"train_loss": -7.248734951019287, "global_step": 191140, "epoch": 4550} {"train_loss": -7.180818194434757, "global_step": 191141, "epoch": 4550, "train/sim_max_reward_0": 0.19733515068810586, "train/sim_max_reward_1": 0.8459154809237075, "train/sim_max_reward_2": 0.5537968721346596, "train/sim_max_reward_3": 0.42335775209727206, "train/sim_max_reward_4": 0.7936357964186983, "train/sim_max_reward_5": 0.8419903194707458, "test/sim_max_reward_4300000": 1.0, "test/sim_max_reward_4300001": 0.35913810688038966, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.978433888791207, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.8965164317203299, "test/sim_max_reward_4300008": 0.9944062422674232, "test/sim_max_reward_4300009": 0.9907298662383791, "test/sim_max_reward_4300010": 0.9353548042454293, "test/sim_max_reward_4300011": 0.9927767896010743, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9719524255521036, "test/sim_max_reward_4300016": 0.8014513380006022, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.3880489808242419, "test/sim_max_reward_4300019": 0.18612112266822411, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9715396598629841, "test/sim_max_reward_4300022": 0.6298346471470405, "test/sim_max_reward_4300023": 0.377587659084922, "test/sim_max_reward_4300024": 1.0, "test/sim_max_reward_4300025": 0.9522277198115632, "test/sim_max_reward_4300026": 0.12381392358313631, "test/sim_max_reward_4300027": 1.0, "test/sim_max_reward_4300028": 0.009942315372563716, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.23065925064952864, "test/sim_max_reward_4300031": 0.20948389006886045, "test/sim_max_reward_4300032": 0.9690505387906291, "test/sim_max_reward_4300033": 0.907918129141056, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.31389537771472087, "test/sim_max_reward_4300036": 0.20932005721914873, "test/sim_max_reward_4300037": 0.7013692612088016, "test/sim_max_reward_4300038": 0.8051365884529703, "test/sim_max_reward_4300039": 0.9414809016985514, "test/sim_max_reward_4300040": 0.6442094118559024, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.714118096513063, "test/sim_max_reward_4300043": 0.04682848432243473, "test/sim_max_reward_4300044": 0.8817089030396247, "test/sim_max_reward_4300045": 1.0, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.1841550231489816, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.12473324822185167, "train/mean_score": 0.6093385619555315, "test/mean_score": 0.6091955437701405, "val_loss": 69562.765625} {"train_loss": -7.2947821617126465, "global_step": 191142, "epoch": 4551} {"train_loss": -7.278469085693359, "global_step": 191143, "epoch": 4551} {"train_loss": -7.199899673461914, "global_step": 191144, "epoch": 4551} {"train_loss": -7.19606876373291, "global_step": 191145, "epoch": 4551} {"train_loss": -7.2679595947265625, "global_step": 191146, "epoch": 4551} {"train_loss": -7.136641979217529, "global_step": 191147, "epoch": 4551} {"train_loss": -7.280540943145752, "global_step": 191148, "epoch": 4551} {"train_loss": -7.329479217529297, "global_step": 191149, "epoch": 4551} {"train_loss": -7.189329147338867, "global_step": 191150, "epoch": 4551} {"train_loss": -7.262711048126221, "global_step": 191151, "epoch": 4551} {"train_loss": -7.107723712921143, "global_step": 191152, "epoch": 4551} {"train_loss": -7.200062274932861, "global_step": 191153, "epoch": 4551} {"train_loss": -7.05411434173584, "global_step": 191154, "epoch": 4551} {"train_loss": -7.187020778656006, "global_step": 191155, "epoch": 4551} {"train_loss": -7.28052282333374, "global_step": 191156, "epoch": 4551} {"train_loss": -7.165444374084473, "global_step": 191157, "epoch": 4551} {"train_loss": -7.252884387969971, "global_step": 191158, "epoch": 4551} {"train_loss": -7.112349987030029, "global_step": 191159, "epoch": 4551} {"train_loss": -7.230832099914551, "global_step": 191160, "epoch": 4551} {"train_loss": -7.044463157653809, "global_step": 191161, "epoch": 4551} {"train_loss": -7.138208389282227, "global_step": 191162, "epoch": 4551} {"train_loss": -7.183515548706055, "global_step": 191163, "epoch": 4551} {"train_loss": -7.181121826171875, "global_step": 191164, "epoch": 4551} {"train_loss": -7.19459867477417, "global_step": 191165, "epoch": 4551} {"train_loss": -7.2620391845703125, "global_step": 191166, "epoch": 4551} {"train_loss": -7.000309467315674, "global_step": 191167, "epoch": 4551} {"train_loss": -7.240678787231445, "global_step": 191168, "epoch": 4551} {"train_loss": -7.142865180969238, "global_step": 191169, "epoch": 4551} {"train_loss": -7.18621826171875, "global_step": 191170, "epoch": 4551} {"train_loss": -7.177659034729004, "global_step": 191171, "epoch": 4551} {"train_loss": -7.229580879211426, "global_step": 191172, "epoch": 4551} {"train_loss": -7.126226902008057, "global_step": 191173, "epoch": 4551} {"train_loss": -7.247274398803711, "global_step": 191174, "epoch": 4551} {"train_loss": -7.181312084197998, "global_step": 191175, "epoch": 4551} {"train_loss": -7.098658561706543, "global_step": 191176, "epoch": 4551} {"train_loss": -7.215851783752441, "global_step": 191177, "epoch": 4551} {"train_loss": -7.241418838500977, "global_step": 191178, "epoch": 4551} {"train_loss": -7.284404754638672, "global_step": 191179, "epoch": 4551} {"train_loss": -7.130138397216797, "global_step": 191180, "epoch": 4551} {"train_loss": -7.251123428344727, "global_step": 191181, "epoch": 4551} {"train_loss": -7.076396465301514, "global_step": 191182, "epoch": 4551} {"train_loss": -7.1908291180928545, "global_step": 191183, "epoch": 4551, "val_loss": 69653.609375} {"train_loss": -7.2178425788879395, "global_step": 191184, "epoch": 4552} {"train_loss": -7.163337707519531, "global_step": 191185, "epoch": 4552} {"train_loss": -7.224857330322266, "global_step": 191186, "epoch": 4552} {"train_loss": -7.223431587219238, "global_step": 191187, "epoch": 4552} {"train_loss": -7.2006096839904785, "global_step": 191188, "epoch": 4552} {"train_loss": -7.334013938903809, "global_step": 191189, "epoch": 4552} {"train_loss": -7.168861389160156, "global_step": 191190, "epoch": 4552} {"train_loss": -7.221966743469238, "global_step": 191191, "epoch": 4552} {"train_loss": -7.272088050842285, "global_step": 191192, "epoch": 4552} {"train_loss": -7.114349842071533, "global_step": 191193, "epoch": 4552} {"train_loss": -7.226107120513916, "global_step": 191194, "epoch": 4552} {"train_loss": -7.337693214416504, "global_step": 191195, "epoch": 4552} {"train_loss": -7.108308792114258, "global_step": 191196, "epoch": 4552} {"train_loss": -7.21095085144043, "global_step": 191197, "epoch": 4552} {"train_loss": -7.193980693817139, "global_step": 191198, "epoch": 4552} {"train_loss": -7.15986442565918, "global_step": 191199, "epoch": 4552} {"train_loss": -7.244327545166016, "global_step": 191200, "epoch": 4552} {"train_loss": -7.028379440307617, "global_step": 191201, "epoch": 4552} {"train_loss": -7.182018756866455, "global_step": 191202, "epoch": 4552} {"train_loss": -7.224338531494141, "global_step": 191203, "epoch": 4552} {"train_loss": -7.289335250854492, "global_step": 191204, "epoch": 4552} {"train_loss": -7.295090675354004, "global_step": 191205, "epoch": 4552} {"train_loss": -7.267995357513428, "global_step": 191206, "epoch": 4552} {"train_loss": -7.232101917266846, "global_step": 191207, "epoch": 4552} {"train_loss": -7.244284152984619, "global_step": 191208, "epoch": 4552} {"train_loss": -7.26080322265625, "global_step": 191209, "epoch": 4552} {"train_loss": -7.250387191772461, "global_step": 191210, "epoch": 4552} {"train_loss": -7.263857841491699, "global_step": 191211, "epoch": 4552} {"train_loss": -7.1773481369018555, "global_step": 191212, "epoch": 4552} {"train_loss": -7.281319618225098, "global_step": 191213, "epoch": 4552} {"train_loss": -7.234899997711182, "global_step": 191214, "epoch": 4552} {"train_loss": -7.205589771270752, "global_step": 191215, "epoch": 4552} {"train_loss": -7.355195999145508, "global_step": 191216, "epoch": 4552} {"train_loss": -7.286135673522949, "global_step": 191217, "epoch": 4552} {"train_loss": -7.233765602111816, "global_step": 191218, "epoch": 4552} {"train_loss": -7.273448944091797, "global_step": 191219, "epoch": 4552} {"train_loss": -7.274082183837891, "global_step": 191220, "epoch": 4552} {"train_loss": -7.247769355773926, "global_step": 191221, "epoch": 4552} {"train_loss": -7.0245041847229, "global_step": 191222, "epoch": 4552} {"train_loss": -7.167889595031738, "global_step": 191223, "epoch": 4552} {"train_loss": -7.269899845123291, "global_step": 191224, "epoch": 4552} {"train_loss": -7.218843766621181, "global_step": 191225, "epoch": 4552, "val_loss": 69635.078125} {"train_loss": -7.361701011657715, "global_step": 191226, "epoch": 4553} {"train_loss": -7.207544803619385, "global_step": 191227, "epoch": 4553} {"train_loss": -7.159276008605957, "global_step": 191228, "epoch": 4553} {"train_loss": -7.138426303863525, "global_step": 191229, "epoch": 4553} {"train_loss": -7.197373390197754, "global_step": 191230, "epoch": 4553} {"train_loss": -7.151566505432129, "global_step": 191231, "epoch": 4553} {"train_loss": -7.123390197753906, "global_step": 191232, "epoch": 4553} {"train_loss": -7.142974853515625, "global_step": 191233, "epoch": 4553} {"train_loss": -7.236867904663086, "global_step": 191234, "epoch": 4553} {"train_loss": -7.056328773498535, "global_step": 191235, "epoch": 4553} {"train_loss": -7.094615936279297, "global_step": 191236, "epoch": 4553} {"train_loss": -7.143620491027832, "global_step": 191237, "epoch": 4553} {"train_loss": -7.107116222381592, "global_step": 191238, "epoch": 4553} {"train_loss": -7.1694793701171875, "global_step": 191239, "epoch": 4553} {"train_loss": -6.971273899078369, "global_step": 191240, "epoch": 4553} {"train_loss": -7.175447463989258, "global_step": 191241, "epoch": 4553} {"train_loss": -7.106451988220215, "global_step": 191242, "epoch": 4553} {"train_loss": -7.095039367675781, "global_step": 191243, "epoch": 4553} {"train_loss": -7.063589096069336, "global_step": 191244, "epoch": 4553} {"train_loss": -7.074466705322266, "global_step": 191245, "epoch": 4553} {"train_loss": -7.115965366363525, "global_step": 191246, "epoch": 4553} {"train_loss": -6.994584083557129, "global_step": 191247, "epoch": 4553} {"train_loss": -7.22999382019043, "global_step": 191248, "epoch": 4553} {"train_loss": -6.915194511413574, "global_step": 191249, "epoch": 4553} {"train_loss": -7.0668721199035645, "global_step": 191250, "epoch": 4553} {"train_loss": -7.082522392272949, "global_step": 191251, "epoch": 4553} {"train_loss": -7.081310272216797, "global_step": 191252, "epoch": 4553} {"train_loss": -7.062772750854492, "global_step": 191253, "epoch": 4553} {"train_loss": -7.026751518249512, "global_step": 191254, "epoch": 4553} {"train_loss": -7.026697635650635, "global_step": 191255, "epoch": 4553} {"train_loss": -6.963695526123047, "global_step": 191256, "epoch": 4553} {"train_loss": -7.153510093688965, "global_step": 191257, "epoch": 4553} {"train_loss": -7.077308654785156, "global_step": 191258, "epoch": 4553} {"train_loss": -7.226827621459961, "global_step": 191259, "epoch": 4553} {"train_loss": -7.000391006469727, "global_step": 191260, "epoch": 4553} {"train_loss": -7.041863441467285, "global_step": 191261, "epoch": 4553} {"train_loss": -7.054096698760986, "global_step": 191262, "epoch": 4553} {"train_loss": -7.17458963394165, "global_step": 191263, "epoch": 4553} {"train_loss": -7.065468788146973, "global_step": 191264, "epoch": 4553} {"train_loss": -7.119788646697998, "global_step": 191265, "epoch": 4553} {"train_loss": -7.154253005981445, "global_step": 191266, "epoch": 4553} {"train_loss": -7.1091270333244685, "global_step": 191267, "epoch": 4553, "val_loss": 69805.9453125} {"train_loss": -7.217235565185547, "global_step": 191268, "epoch": 4554} {"train_loss": -7.148710250854492, "global_step": 191269, "epoch": 4554} {"train_loss": -7.25662088394165, "global_step": 191270, "epoch": 4554} {"train_loss": -7.247983932495117, "global_step": 191271, "epoch": 4554} {"train_loss": -7.171940803527832, "global_step": 191272, "epoch": 4554} {"train_loss": -7.158479690551758, "global_step": 191273, "epoch": 4554} {"train_loss": -7.216740608215332, "global_step": 191274, "epoch": 4554} {"train_loss": -7.186758518218994, "global_step": 191275, "epoch": 4554} {"train_loss": -7.289050102233887, "global_step": 191276, "epoch": 4554} {"train_loss": -7.191079139709473, "global_step": 191277, "epoch": 4554} {"train_loss": -7.232998847961426, "global_step": 191278, "epoch": 4554} {"train_loss": -7.213129043579102, "global_step": 191279, "epoch": 4554} {"train_loss": -7.167546272277832, "global_step": 191280, "epoch": 4554} {"train_loss": -7.253567218780518, "global_step": 191281, "epoch": 4554} {"train_loss": -7.157024383544922, "global_step": 191282, "epoch": 4554} {"train_loss": -7.273118495941162, "global_step": 191283, "epoch": 4554} {"train_loss": -7.216628074645996, "global_step": 191284, "epoch": 4554} {"train_loss": -7.2418317794799805, "global_step": 191285, "epoch": 4554} {"train_loss": -7.195959091186523, "global_step": 191286, "epoch": 4554} {"train_loss": -7.224340438842773, "global_step": 191287, "epoch": 4554} {"train_loss": -7.1886515617370605, "global_step": 191288, "epoch": 4554} {"train_loss": -7.213613510131836, "global_step": 191289, "epoch": 4554} {"train_loss": -7.195138454437256, "global_step": 191290, "epoch": 4554} {"train_loss": -7.135890007019043, "global_step": 191291, "epoch": 4554} {"train_loss": -7.271548748016357, "global_step": 191292, "epoch": 4554} {"train_loss": -7.227438926696777, "global_step": 191293, "epoch": 4554} {"train_loss": -7.144191741943359, "global_step": 191294, "epoch": 4554} {"train_loss": -7.258731842041016, "global_step": 191295, "epoch": 4554} {"train_loss": -7.195338249206543, "global_step": 191296, "epoch": 4554} {"train_loss": -7.147916316986084, "global_step": 191297, "epoch": 4554} {"train_loss": -7.270054340362549, "global_step": 191298, "epoch": 4554} {"train_loss": -7.172567367553711, "global_step": 191299, "epoch": 4554} {"train_loss": -7.087947845458984, "global_step": 191300, "epoch": 4554} {"train_loss": -7.2164154052734375, "global_step": 191301, "epoch": 4554} {"train_loss": -7.27207612991333, "global_step": 191302, "epoch": 4554} {"train_loss": -7.09599494934082, "global_step": 191303, "epoch": 4554} {"train_loss": -7.200446128845215, "global_step": 191304, "epoch": 4554} {"train_loss": -7.22217321395874, "global_step": 191305, "epoch": 4554} {"train_loss": -7.360437393188477, "global_step": 191306, "epoch": 4554} {"train_loss": -7.181956768035889, "global_step": 191307, "epoch": 4554} {"train_loss": -7.282951354980469, "global_step": 191308, "epoch": 4554} {"train_loss": -7.209183647519066, "global_step": 191309, "epoch": 4554, "val_loss": 69562.2890625} {"train_loss": -7.2414445877075195, "global_step": 191310, "epoch": 4555} {"train_loss": -7.284884452819824, "global_step": 191311, "epoch": 4555} {"train_loss": -7.260167121887207, "global_step": 191312, "epoch": 4555} {"train_loss": -7.267880439758301, "global_step": 191313, "epoch": 4555} {"train_loss": -7.216896057128906, "global_step": 191314, "epoch": 4555} {"train_loss": -6.967078685760498, "global_step": 191315, "epoch": 4555} {"train_loss": -7.20213508605957, "global_step": 191316, "epoch": 4555} {"train_loss": -7.078579902648926, "global_step": 191317, "epoch": 4555} {"train_loss": -7.235224723815918, "global_step": 191318, "epoch": 4555} {"train_loss": -7.241055965423584, "global_step": 191319, "epoch": 4555} {"train_loss": -7.219980239868164, "global_step": 191320, "epoch": 4555} {"train_loss": -7.263956069946289, "global_step": 191321, "epoch": 4555} {"train_loss": -7.1996002197265625, "global_step": 191322, "epoch": 4555} {"train_loss": -7.164186954498291, "global_step": 191323, "epoch": 4555} {"train_loss": -7.091316223144531, "global_step": 191324, "epoch": 4555} {"train_loss": -7.142496109008789, "global_step": 191325, "epoch": 4555} {"train_loss": -7.199306488037109, "global_step": 191326, "epoch": 4555} {"train_loss": -7.102264404296875, "global_step": 191327, "epoch": 4555} {"train_loss": -7.184538841247559, "global_step": 191328, "epoch": 4555} {"train_loss": -7.199225425720215, "global_step": 191329, "epoch": 4555} {"train_loss": -7.202005863189697, "global_step": 191330, "epoch": 4555} {"train_loss": -7.211806297302246, "global_step": 191331, "epoch": 4555} {"train_loss": -7.188389301300049, "global_step": 191332, "epoch": 4555} {"train_loss": -7.334018230438232, "global_step": 191333, "epoch": 4555} {"train_loss": -7.11043643951416, "global_step": 191334, "epoch": 4555} {"train_loss": -7.097984313964844, "global_step": 191335, "epoch": 4555} {"train_loss": -7.274752616882324, "global_step": 191336, "epoch": 4555} {"train_loss": -7.130171775817871, "global_step": 191337, "epoch": 4555} {"train_loss": -7.1651763916015625, "global_step": 191338, "epoch": 4555} {"train_loss": -7.2858734130859375, "global_step": 191339, "epoch": 4555} {"train_loss": -7.123831748962402, "global_step": 191340, "epoch": 4555} {"train_loss": -7.096330165863037, "global_step": 191341, "epoch": 4555} {"train_loss": -7.343412399291992, "global_step": 191342, "epoch": 4555} {"train_loss": -7.1478705406188965, "global_step": 191343, "epoch": 4555} {"train_loss": -7.120594024658203, "global_step": 191344, "epoch": 4555} {"train_loss": -7.278530120849609, "global_step": 191345, "epoch": 4555} {"train_loss": -7.192952632904053, "global_step": 191346, "epoch": 4555} {"train_loss": -7.140809535980225, "global_step": 191347, "epoch": 4555} {"train_loss": -7.083254814147949, "global_step": 191348, "epoch": 4555} {"train_loss": -7.249709129333496, "global_step": 191349, "epoch": 4555} {"train_loss": -7.073145866394043, "global_step": 191350, "epoch": 4555} {"train_loss": -7.188836960565476, "global_step": 191351, "epoch": 4555, "val_loss": 69750.5546875} {"train_loss": -7.112104892730713, "global_step": 191352, "epoch": 4556} {"train_loss": -7.152515411376953, "global_step": 191353, "epoch": 4556} {"train_loss": -7.124485015869141, "global_step": 191354, "epoch": 4556} {"train_loss": -7.238580703735352, "global_step": 191355, "epoch": 4556} {"train_loss": -7.321905612945557, "global_step": 191356, "epoch": 4556} {"train_loss": -7.165141582489014, "global_step": 191357, "epoch": 4556} {"train_loss": -7.225076198577881, "global_step": 191358, "epoch": 4556} {"train_loss": -7.181475639343262, "global_step": 191359, "epoch": 4556} {"train_loss": -7.102001190185547, "global_step": 191360, "epoch": 4556} {"train_loss": -7.27176570892334, "global_step": 191361, "epoch": 4556} {"train_loss": -7.167258262634277, "global_step": 191362, "epoch": 4556} {"train_loss": -7.2974467277526855, "global_step": 191363, "epoch": 4556} {"train_loss": -7.165834426879883, "global_step": 191364, "epoch": 4556} {"train_loss": -7.1357316970825195, "global_step": 191365, "epoch": 4556} {"train_loss": -7.111499786376953, "global_step": 191366, "epoch": 4556} {"train_loss": -7.094075679779053, "global_step": 191367, "epoch": 4556} {"train_loss": -7.01533317565918, "global_step": 191368, "epoch": 4556} {"train_loss": -7.039186477661133, "global_step": 191369, "epoch": 4556} {"train_loss": -7.193774700164795, "global_step": 191370, "epoch": 4556} {"train_loss": -7.075798988342285, "global_step": 191371, "epoch": 4556} {"train_loss": -7.059629917144775, "global_step": 191372, "epoch": 4556} {"train_loss": -7.2180280685424805, "global_step": 191373, "epoch": 4556} {"train_loss": -7.131552219390869, "global_step": 191374, "epoch": 4556} {"train_loss": -6.9786376953125, "global_step": 191375, "epoch": 4556} {"train_loss": -7.220892906188965, "global_step": 191376, "epoch": 4556} {"train_loss": -7.102167129516602, "global_step": 191377, "epoch": 4556} {"train_loss": -7.101539134979248, "global_step": 191378, "epoch": 4556} {"train_loss": -7.148805618286133, "global_step": 191379, "epoch": 4556} {"train_loss": -7.012382507324219, "global_step": 191380, "epoch": 4556} {"train_loss": -7.161914348602295, "global_step": 191381, "epoch": 4556} {"train_loss": -7.054959774017334, "global_step": 191382, "epoch": 4556} {"train_loss": -7.056977272033691, "global_step": 191383, "epoch": 4556} {"train_loss": -7.10072135925293, "global_step": 191384, "epoch": 4556} {"train_loss": -7.135090351104736, "global_step": 191385, "epoch": 4556} {"train_loss": -7.158031463623047, "global_step": 191386, "epoch": 4556} {"train_loss": -7.19993782043457, "global_step": 191387, "epoch": 4556} {"train_loss": -7.119388580322266, "global_step": 191388, "epoch": 4556} {"train_loss": -7.193848609924316, "global_step": 191389, "epoch": 4556} {"train_loss": -7.226430416107178, "global_step": 191390, "epoch": 4556} {"train_loss": -7.2044677734375, "global_step": 191391, "epoch": 4556} {"train_loss": -7.266936302185059, "global_step": 191392, "epoch": 4556} {"train_loss": -7.149229356220791, "global_step": 191393, "epoch": 4556, "val_loss": 69659.5078125} {"train_loss": -7.313098907470703, "global_step": 191394, "epoch": 4557} {"train_loss": -7.224792003631592, "global_step": 191395, "epoch": 4557} {"train_loss": -7.179577827453613, "global_step": 191396, "epoch": 4557} {"train_loss": -7.187744140625, "global_step": 191397, "epoch": 4557} {"train_loss": -7.32747220993042, "global_step": 191398, "epoch": 4557} {"train_loss": -7.312615871429443, "global_step": 191399, "epoch": 4557} {"train_loss": -7.31494665145874, "global_step": 191400, "epoch": 4557} {"train_loss": -7.197408676147461, "global_step": 191401, "epoch": 4557} {"train_loss": -7.32166862487793, "global_step": 191402, "epoch": 4557} {"train_loss": -7.15285062789917, "global_step": 191403, "epoch": 4557} {"train_loss": -7.19973087310791, "global_step": 191404, "epoch": 4557} {"train_loss": -7.260769844055176, "global_step": 191405, "epoch": 4557} {"train_loss": -7.375443935394287, "global_step": 191406, "epoch": 4557} {"train_loss": -7.264359474182129, "global_step": 191407, "epoch": 4557} {"train_loss": -7.2008209228515625, "global_step": 191408, "epoch": 4557} {"train_loss": -7.209718704223633, "global_step": 191409, "epoch": 4557} {"train_loss": -7.150439262390137, "global_step": 191410, "epoch": 4557} {"train_loss": -7.096467971801758, "global_step": 191411, "epoch": 4557} {"train_loss": -7.299835205078125, "global_step": 191412, "epoch": 4557} {"train_loss": -7.228174209594727, "global_step": 191413, "epoch": 4557} {"train_loss": -7.134832382202148, "global_step": 191414, "epoch": 4557} {"train_loss": -7.131875038146973, "global_step": 191415, "epoch": 4557} {"train_loss": -7.131589412689209, "global_step": 191416, "epoch": 4557} {"train_loss": -7.2367143630981445, "global_step": 191417, "epoch": 4557} {"train_loss": -7.205726623535156, "global_step": 191418, "epoch": 4557} {"train_loss": -7.191646575927734, "global_step": 191419, "epoch": 4557} {"train_loss": -7.1393537521362305, "global_step": 191420, "epoch": 4557} {"train_loss": -7.1824727058410645, "global_step": 191421, "epoch": 4557} {"train_loss": -7.180235385894775, "global_step": 191422, "epoch": 4557} {"train_loss": -7.154688358306885, "global_step": 191423, "epoch": 4557} {"train_loss": -7.207047462463379, "global_step": 191424, "epoch": 4557} {"train_loss": -7.0542168617248535, "global_step": 191425, "epoch": 4557} {"train_loss": -7.1832098960876465, "global_step": 191426, "epoch": 4557} {"train_loss": -7.1979169845581055, "global_step": 191427, "epoch": 4557} {"train_loss": -7.089559555053711, "global_step": 191428, "epoch": 4557} {"train_loss": -7.143338203430176, "global_step": 191429, "epoch": 4557} {"train_loss": -7.145941257476807, "global_step": 191430, "epoch": 4557} {"train_loss": -7.074365139007568, "global_step": 191431, "epoch": 4557} {"train_loss": -7.263791561126709, "global_step": 191432, "epoch": 4557} {"train_loss": -7.273202419281006, "global_step": 191433, "epoch": 4557} {"train_loss": -7.237493515014648, "global_step": 191434, "epoch": 4557} {"train_loss": -7.205581074669247, "global_step": 191435, "epoch": 4557, "val_loss": 69844.5859375} {"train_loss": -7.198236465454102, "global_step": 191436, "epoch": 4558} {"train_loss": -7.31038761138916, "global_step": 191437, "epoch": 4558} {"train_loss": -6.996433734893799, "global_step": 191438, "epoch": 4558} {"train_loss": -7.186385631561279, "global_step": 191439, "epoch": 4558} {"train_loss": -7.185863494873047, "global_step": 191440, "epoch": 4558} {"train_loss": -7.180029392242432, "global_step": 191441, "epoch": 4558} {"train_loss": -7.184124946594238, "global_step": 191442, "epoch": 4558} {"train_loss": -7.2039570808410645, "global_step": 191443, "epoch": 4558} {"train_loss": -7.266443252563477, "global_step": 191444, "epoch": 4558} {"train_loss": -7.112549781799316, "global_step": 191445, "epoch": 4558} {"train_loss": -7.070112228393555, "global_step": 191446, "epoch": 4558} {"train_loss": -7.258666515350342, "global_step": 191447, "epoch": 4558} {"train_loss": -7.080907344818115, "global_step": 191448, "epoch": 4558} {"train_loss": -7.238741874694824, "global_step": 191449, "epoch": 4558} {"train_loss": -7.093698978424072, "global_step": 191450, "epoch": 4558} {"train_loss": -7.154097557067871, "global_step": 191451, "epoch": 4558} {"train_loss": -7.100868225097656, "global_step": 191452, "epoch": 4558} {"train_loss": -7.126131534576416, "global_step": 191453, "epoch": 4558} {"train_loss": -7.17407751083374, "global_step": 191454, "epoch": 4558} {"train_loss": -7.232996940612793, "global_step": 191455, "epoch": 4558} {"train_loss": -7.174630165100098, "global_step": 191456, "epoch": 4558} {"train_loss": -7.168318748474121, "global_step": 191457, "epoch": 4558} {"train_loss": -7.152985572814941, "global_step": 191458, "epoch": 4558} {"train_loss": -7.016556739807129, "global_step": 191459, "epoch": 4558} {"train_loss": -7.014133453369141, "global_step": 191460, "epoch": 4558} {"train_loss": -7.147711277008057, "global_step": 191461, "epoch": 4558} {"train_loss": -7.028046607971191, "global_step": 191462, "epoch": 4558} {"train_loss": -7.101937770843506, "global_step": 191463, "epoch": 4558} {"train_loss": -7.109563827514648, "global_step": 191464, "epoch": 4558} {"train_loss": -7.127851486206055, "global_step": 191465, "epoch": 4558} {"train_loss": -7.231140613555908, "global_step": 191466, "epoch": 4558} {"train_loss": -7.179145336151123, "global_step": 191467, "epoch": 4558} {"train_loss": -7.062514305114746, "global_step": 191468, "epoch": 4558} {"train_loss": -7.187578201293945, "global_step": 191469, "epoch": 4558} {"train_loss": -7.182480812072754, "global_step": 191470, "epoch": 4558} {"train_loss": -7.143121719360352, "global_step": 191471, "epoch": 4558} {"train_loss": -7.1870927810668945, "global_step": 191472, "epoch": 4558} {"train_loss": -7.226104259490967, "global_step": 191473, "epoch": 4558} {"train_loss": -7.184474945068359, "global_step": 191474, "epoch": 4558} {"train_loss": -7.216851234436035, "global_step": 191475, "epoch": 4558} {"train_loss": -7.295222282409668, "global_step": 191476, "epoch": 4558} {"train_loss": -7.1570549465361095, "global_step": 191477, "epoch": 4558, "val_loss": 69862.28125} {"train_loss": -7.179693222045898, "global_step": 191478, "epoch": 4559} {"train_loss": -7.156643390655518, "global_step": 191479, "epoch": 4559} {"train_loss": -7.206860065460205, "global_step": 191480, "epoch": 4559} {"train_loss": -7.202343940734863, "global_step": 191481, "epoch": 4559} {"train_loss": -7.076573371887207, "global_step": 191482, "epoch": 4559} {"train_loss": -7.081137657165527, "global_step": 191483, "epoch": 4559} {"train_loss": -7.114021301269531, "global_step": 191484, "epoch": 4559} {"train_loss": -7.202083110809326, "global_step": 191485, "epoch": 4559} {"train_loss": -7.17672061920166, "global_step": 191486, "epoch": 4559} {"train_loss": -7.0920023918151855, "global_step": 191487, "epoch": 4559} {"train_loss": -7.151454925537109, "global_step": 191488, "epoch": 4559} {"train_loss": -7.225078582763672, "global_step": 191489, "epoch": 4559} {"train_loss": -7.169154167175293, "global_step": 191490, "epoch": 4559} {"train_loss": -7.14136266708374, "global_step": 191491, "epoch": 4559} {"train_loss": -7.0671234130859375, "global_step": 191492, "epoch": 4559} {"train_loss": -7.122557163238525, "global_step": 191493, "epoch": 4559} {"train_loss": -7.21563720703125, "global_step": 191494, "epoch": 4559} {"train_loss": -7.125476837158203, "global_step": 191495, "epoch": 4559} {"train_loss": -7.142001152038574, "global_step": 191496, "epoch": 4559} {"train_loss": -7.203543663024902, "global_step": 191497, "epoch": 4559} {"train_loss": -7.150127410888672, "global_step": 191498, "epoch": 4559} {"train_loss": -7.131746768951416, "global_step": 191499, "epoch": 4559} {"train_loss": -7.255408763885498, "global_step": 191500, "epoch": 4559} {"train_loss": -7.253297805786133, "global_step": 191501, "epoch": 4559} {"train_loss": -7.1819353103637695, "global_step": 191502, "epoch": 4559} {"train_loss": -7.206310272216797, "global_step": 191503, "epoch": 4559} {"train_loss": -7.202523231506348, "global_step": 191504, "epoch": 4559} {"train_loss": -7.2686052322387695, "global_step": 191505, "epoch": 4559} {"train_loss": -7.174635887145996, "global_step": 191506, "epoch": 4559} {"train_loss": -7.248619079589844, "global_step": 191507, "epoch": 4559} {"train_loss": -7.262754440307617, "global_step": 191508, "epoch": 4559} {"train_loss": -7.185474395751953, "global_step": 191509, "epoch": 4559} {"train_loss": -7.194025993347168, "global_step": 191510, "epoch": 4559} {"train_loss": -7.129411697387695, "global_step": 191511, "epoch": 4559} {"train_loss": -7.214425086975098, "global_step": 191512, "epoch": 4559} {"train_loss": -7.127753734588623, "global_step": 191513, "epoch": 4559} {"train_loss": -7.16635799407959, "global_step": 191514, "epoch": 4559} {"train_loss": -7.201437950134277, "global_step": 191515, "epoch": 4559} {"train_loss": -7.177297592163086, "global_step": 191516, "epoch": 4559} {"train_loss": -7.325157165527344, "global_step": 191517, "epoch": 4559} {"train_loss": -7.260917663574219, "global_step": 191518, "epoch": 4559} {"train_loss": -7.1797558807191395, "global_step": 191519, "epoch": 4559, "val_loss": 69485.7890625} {"train_loss": -7.182880401611328, "global_step": 191520, "epoch": 4560} {"train_loss": -7.31895637512207, "global_step": 191521, "epoch": 4560} {"train_loss": -7.174186706542969, "global_step": 191522, "epoch": 4560} {"train_loss": -7.407444953918457, "global_step": 191523, "epoch": 4560} {"train_loss": -7.141570568084717, "global_step": 191524, "epoch": 4560} {"train_loss": -7.3013200759887695, "global_step": 191525, "epoch": 4560} {"train_loss": -7.280605316162109, "global_step": 191526, "epoch": 4560} {"train_loss": -7.068340301513672, "global_step": 191527, "epoch": 4560} {"train_loss": -7.288299560546875, "global_step": 191528, "epoch": 4560} {"train_loss": -7.094284534454346, "global_step": 191529, "epoch": 4560} {"train_loss": -7.210867881774902, "global_step": 191530, "epoch": 4560} {"train_loss": -7.186033725738525, "global_step": 191531, "epoch": 4560} {"train_loss": -7.176616191864014, "global_step": 191532, "epoch": 4560} {"train_loss": -7.276293754577637, "global_step": 191533, "epoch": 4560} {"train_loss": -7.153179168701172, "global_step": 191534, "epoch": 4560} {"train_loss": -7.116728782653809, "global_step": 191535, "epoch": 4560} {"train_loss": -7.2483930587768555, "global_step": 191536, "epoch": 4560} {"train_loss": -7.326517105102539, "global_step": 191537, "epoch": 4560} {"train_loss": -7.145689010620117, "global_step": 191538, "epoch": 4560} {"train_loss": -7.271221160888672, "global_step": 191539, "epoch": 4560} {"train_loss": -7.285155296325684, "global_step": 191540, "epoch": 4560} {"train_loss": -7.238984107971191, "global_step": 191541, "epoch": 4560} {"train_loss": -7.2858123779296875, "global_step": 191542, "epoch": 4560} {"train_loss": -7.106746673583984, "global_step": 191543, "epoch": 4560} {"train_loss": -7.26843786239624, "global_step": 191544, "epoch": 4560} {"train_loss": -7.305202484130859, "global_step": 191545, "epoch": 4560} {"train_loss": -7.340919494628906, "global_step": 191546, "epoch": 4560} {"train_loss": -7.223294734954834, "global_step": 191547, "epoch": 4560} {"train_loss": -7.213263511657715, "global_step": 191548, "epoch": 4560} {"train_loss": -7.245527267456055, "global_step": 191549, "epoch": 4560} {"train_loss": -7.314560890197754, "global_step": 191550, "epoch": 4560} {"train_loss": -7.211133003234863, "global_step": 191551, "epoch": 4560} {"train_loss": -7.169192790985107, "global_step": 191552, "epoch": 4560} {"train_loss": -7.32273006439209, "global_step": 191553, "epoch": 4560} {"train_loss": -7.181083679199219, "global_step": 191554, "epoch": 4560} {"train_loss": -7.316532611846924, "global_step": 191555, "epoch": 4560} {"train_loss": -7.256834983825684, "global_step": 191556, "epoch": 4560} {"train_loss": -7.250655174255371, "global_step": 191557, "epoch": 4560} {"train_loss": -7.275990009307861, "global_step": 191558, "epoch": 4560} {"train_loss": -7.305408477783203, "global_step": 191559, "epoch": 4560} {"train_loss": -7.240916728973389, "global_step": 191560, "epoch": 4560} {"train_loss": -7.239391803741455, "global_step": 191561, "epoch": 4560, "val_loss": 69577.8359375} {"train_loss": -7.323579788208008, "global_step": 191562, "epoch": 4561} {"train_loss": -7.30638313293457, "global_step": 191563, "epoch": 4561} {"train_loss": -7.343549728393555, "global_step": 191564, "epoch": 4561} {"train_loss": -7.2245073318481445, "global_step": 191565, "epoch": 4561} {"train_loss": -7.231558799743652, "global_step": 191566, "epoch": 4561} {"train_loss": -7.2033796310424805, "global_step": 191567, "epoch": 4561} {"train_loss": -7.324883460998535, "global_step": 191568, "epoch": 4561} {"train_loss": -7.279157638549805, "global_step": 191569, "epoch": 4561} {"train_loss": -7.146450042724609, "global_step": 191570, "epoch": 4561} {"train_loss": -7.264721870422363, "global_step": 191571, "epoch": 4561} {"train_loss": -7.316429138183594, "global_step": 191572, "epoch": 4561} {"train_loss": -7.138950347900391, "global_step": 191573, "epoch": 4561} {"train_loss": -7.279463768005371, "global_step": 191574, "epoch": 4561} {"train_loss": -7.166094779968262, "global_step": 191575, "epoch": 4561} {"train_loss": -7.202249526977539, "global_step": 191576, "epoch": 4561} {"train_loss": -7.304073333740234, "global_step": 191577, "epoch": 4561} {"train_loss": -7.088194847106934, "global_step": 191578, "epoch": 4561} {"train_loss": -7.134803771972656, "global_step": 191579, "epoch": 4561} {"train_loss": -7.37991189956665, "global_step": 191580, "epoch": 4561} {"train_loss": -7.126717567443848, "global_step": 191581, "epoch": 4561} {"train_loss": -7.295011520385742, "global_step": 191582, "epoch": 4561} {"train_loss": -7.291122913360596, "global_step": 191583, "epoch": 4561} {"train_loss": -7.124955177307129, "global_step": 191584, "epoch": 4561} {"train_loss": -7.107357978820801, "global_step": 191585, "epoch": 4561} {"train_loss": -7.233590602874756, "global_step": 191586, "epoch": 4561} {"train_loss": -7.254546165466309, "global_step": 191587, "epoch": 4561} {"train_loss": -7.169275760650635, "global_step": 191588, "epoch": 4561} {"train_loss": -7.304124355316162, "global_step": 191589, "epoch": 4561} {"train_loss": -7.1722893714904785, "global_step": 191590, "epoch": 4561} {"train_loss": -7.277611255645752, "global_step": 191591, "epoch": 4561} {"train_loss": -7.3037333488464355, "global_step": 191592, "epoch": 4561} {"train_loss": -7.279202938079834, "global_step": 191593, "epoch": 4561} {"train_loss": -7.080719470977783, "global_step": 191594, "epoch": 4561} {"train_loss": -7.271161079406738, "global_step": 191595, "epoch": 4561} {"train_loss": -7.098203659057617, "global_step": 191596, "epoch": 4561} {"train_loss": -7.090441703796387, "global_step": 191597, "epoch": 4561} {"train_loss": -7.154642105102539, "global_step": 191598, "epoch": 4561} {"train_loss": -7.238364219665527, "global_step": 191599, "epoch": 4561} {"train_loss": -7.128060340881348, "global_step": 191600, "epoch": 4561} {"train_loss": -7.29630708694458, "global_step": 191601, "epoch": 4561} {"train_loss": -7.193561553955078, "global_step": 191602, "epoch": 4561} {"train_loss": -7.220421961375645, "global_step": 191603, "epoch": 4561, "val_loss": 69557.8984375} {"train_loss": -7.179108619689941, "global_step": 191604, "epoch": 4562} {"train_loss": -7.080186367034912, "global_step": 191605, "epoch": 4562} {"train_loss": -7.077741622924805, "global_step": 191606, "epoch": 4562} {"train_loss": -7.140101432800293, "global_step": 191607, "epoch": 4562} {"train_loss": -7.0999250411987305, "global_step": 191608, "epoch": 4562} {"train_loss": -7.203129768371582, "global_step": 191609, "epoch": 4562} {"train_loss": -7.086312770843506, "global_step": 191610, "epoch": 4562} {"train_loss": -7.1011152267456055, "global_step": 191611, "epoch": 4562} {"train_loss": -7.180628776550293, "global_step": 191612, "epoch": 4562} {"train_loss": -7.163906574249268, "global_step": 191613, "epoch": 4562} {"train_loss": -7.073353290557861, "global_step": 191614, "epoch": 4562} {"train_loss": -7.127233505249023, "global_step": 191615, "epoch": 4562} {"train_loss": -7.060758590698242, "global_step": 191616, "epoch": 4562} {"train_loss": -7.1653242111206055, "global_step": 191617, "epoch": 4562} {"train_loss": -7.289600849151611, "global_step": 191618, "epoch": 4562} {"train_loss": -7.189829349517822, "global_step": 191619, "epoch": 4562} {"train_loss": -7.2381463050842285, "global_step": 191620, "epoch": 4562} {"train_loss": -7.241881370544434, "global_step": 191621, "epoch": 4562} {"train_loss": -7.193029403686523, "global_step": 191622, "epoch": 4562} {"train_loss": -7.249651908874512, "global_step": 191623, "epoch": 4562} {"train_loss": -7.118243217468262, "global_step": 191624, "epoch": 4562} {"train_loss": -7.123257160186768, "global_step": 191625, "epoch": 4562} {"train_loss": -7.153693199157715, "global_step": 191626, "epoch": 4562} {"train_loss": -7.126636028289795, "global_step": 191627, "epoch": 4562} {"train_loss": -7.079418182373047, "global_step": 191628, "epoch": 4562} {"train_loss": -7.25058126449585, "global_step": 191629, "epoch": 4562} {"train_loss": -7.15625, "global_step": 191630, "epoch": 4562} {"train_loss": -7.1330437660217285, "global_step": 191631, "epoch": 4562} {"train_loss": -7.117338180541992, "global_step": 191632, "epoch": 4562} {"train_loss": -7.149176597595215, "global_step": 191633, "epoch": 4562} {"train_loss": -7.180131912231445, "global_step": 191634, "epoch": 4562} {"train_loss": -7.125042915344238, "global_step": 191635, "epoch": 4562} {"train_loss": -7.1320929527282715, "global_step": 191636, "epoch": 4562} {"train_loss": -7.123097896575928, "global_step": 191637, "epoch": 4562} {"train_loss": -7.151708126068115, "global_step": 191638, "epoch": 4562} {"train_loss": -7.283733367919922, "global_step": 191639, "epoch": 4562} {"train_loss": -7.178359508514404, "global_step": 191640, "epoch": 4562} {"train_loss": -7.116983413696289, "global_step": 191641, "epoch": 4562} {"train_loss": -7.263333797454834, "global_step": 191642, "epoch": 4562} {"train_loss": -7.233994007110596, "global_step": 191643, "epoch": 4562} {"train_loss": -7.2580084800720215, "global_step": 191644, "epoch": 4562} {"train_loss": -7.161973760241554, "global_step": 191645, "epoch": 4562, "val_loss": 69616.546875} {"train_loss": -7.191710472106934, "global_step": 191646, "epoch": 4563} {"train_loss": -7.308719158172607, "global_step": 191647, "epoch": 4563} {"train_loss": -7.11865234375, "global_step": 191648, "epoch": 4563} {"train_loss": -7.22084379196167, "global_step": 191649, "epoch": 4563} {"train_loss": -7.131020545959473, "global_step": 191650, "epoch": 4563} {"train_loss": -7.076258182525635, "global_step": 191651, "epoch": 4563} {"train_loss": -7.129295825958252, "global_step": 191652, "epoch": 4563} {"train_loss": -7.248091697692871, "global_step": 191653, "epoch": 4563} {"train_loss": -7.192417144775391, "global_step": 191654, "epoch": 4563} {"train_loss": -7.2234344482421875, "global_step": 191655, "epoch": 4563} {"train_loss": -7.2013092041015625, "global_step": 191656, "epoch": 4563} {"train_loss": -7.0950608253479, "global_step": 191657, "epoch": 4563} {"train_loss": -7.105979919433594, "global_step": 191658, "epoch": 4563} {"train_loss": -7.101045608520508, "global_step": 191659, "epoch": 4563} {"train_loss": -7.084481239318848, "global_step": 191660, "epoch": 4563} {"train_loss": -7.128193378448486, "global_step": 191661, "epoch": 4563} {"train_loss": -7.052623748779297, "global_step": 191662, "epoch": 4563} {"train_loss": -7.201596260070801, "global_step": 191663, "epoch": 4563} {"train_loss": -7.0956339836120605, "global_step": 191664, "epoch": 4563} {"train_loss": -7.1307244300842285, "global_step": 191665, "epoch": 4563} {"train_loss": -7.08858585357666, "global_step": 191666, "epoch": 4563} {"train_loss": -7.12320613861084, "global_step": 191667, "epoch": 4563} {"train_loss": -7.188191890716553, "global_step": 191668, "epoch": 4563} {"train_loss": -6.894444942474365, "global_step": 191669, "epoch": 4563} {"train_loss": -7.207449913024902, "global_step": 191670, "epoch": 4563} {"train_loss": -7.059878349304199, "global_step": 191671, "epoch": 4563} {"train_loss": -7.214284896850586, "global_step": 191672, "epoch": 4563} {"train_loss": -7.209649085998535, "global_step": 191673, "epoch": 4563} {"train_loss": -7.120003700256348, "global_step": 191674, "epoch": 4563} {"train_loss": -7.151580810546875, "global_step": 191675, "epoch": 4563} {"train_loss": -7.212034225463867, "global_step": 191676, "epoch": 4563} {"train_loss": -7.1614580154418945, "global_step": 191677, "epoch": 4563} {"train_loss": -7.21150016784668, "global_step": 191678, "epoch": 4563} {"train_loss": -7.175275802612305, "global_step": 191679, "epoch": 4563} {"train_loss": -7.175688743591309, "global_step": 191680, "epoch": 4563} {"train_loss": -7.225757598876953, "global_step": 191681, "epoch": 4563} {"train_loss": -7.278414249420166, "global_step": 191682, "epoch": 4563} {"train_loss": -7.213810920715332, "global_step": 191683, "epoch": 4563} {"train_loss": -7.254988670349121, "global_step": 191684, "epoch": 4563} {"train_loss": -7.24013614654541, "global_step": 191685, "epoch": 4563} {"train_loss": -7.237695693969727, "global_step": 191686, "epoch": 4563} {"train_loss": -7.164843139194307, "global_step": 191687, "epoch": 4563, "val_loss": 69561.4375} {"train_loss": -7.28791618347168, "global_step": 191688, "epoch": 4564} {"train_loss": -7.299553394317627, "global_step": 191689, "epoch": 4564} {"train_loss": -7.299831390380859, "global_step": 191690, "epoch": 4564} {"train_loss": -7.317404747009277, "global_step": 191691, "epoch": 4564} {"train_loss": -7.277671813964844, "global_step": 191692, "epoch": 4564} {"train_loss": -7.354641914367676, "global_step": 191693, "epoch": 4564} {"train_loss": -7.17759895324707, "global_step": 191694, "epoch": 4564} {"train_loss": -7.294919013977051, "global_step": 191695, "epoch": 4564} {"train_loss": -7.327779293060303, "global_step": 191696, "epoch": 4564} {"train_loss": -7.303141117095947, "global_step": 191697, "epoch": 4564} {"train_loss": -7.287130355834961, "global_step": 191698, "epoch": 4564} {"train_loss": -7.183700084686279, "global_step": 191699, "epoch": 4564} {"train_loss": -7.158415794372559, "global_step": 191700, "epoch": 4564} {"train_loss": -7.231966018676758, "global_step": 191701, "epoch": 4564} {"train_loss": -7.129965782165527, "global_step": 191702, "epoch": 4564} {"train_loss": -7.118600845336914, "global_step": 191703, "epoch": 4564} {"train_loss": -7.276636123657227, "global_step": 191704, "epoch": 4564} {"train_loss": -7.326415061950684, "global_step": 191705, "epoch": 4564} {"train_loss": -7.014093399047852, "global_step": 191706, "epoch": 4564} {"train_loss": -7.152892589569092, "global_step": 191707, "epoch": 4564} {"train_loss": -7.195716857910156, "global_step": 191708, "epoch": 4564} {"train_loss": -7.2502312660217285, "global_step": 191709, "epoch": 4564} {"train_loss": -7.14813756942749, "global_step": 191710, "epoch": 4564} {"train_loss": -7.140604019165039, "global_step": 191711, "epoch": 4564} {"train_loss": -7.267823219299316, "global_step": 191712, "epoch": 4564} {"train_loss": -7.2725043296813965, "global_step": 191713, "epoch": 4564} {"train_loss": -7.150228977203369, "global_step": 191714, "epoch": 4564} {"train_loss": -7.289810657501221, "global_step": 191715, "epoch": 4564} {"train_loss": -7.234172344207764, "global_step": 191716, "epoch": 4564} {"train_loss": -7.173068046569824, "global_step": 191717, "epoch": 4564} {"train_loss": -7.3501739501953125, "global_step": 191718, "epoch": 4564} {"train_loss": -7.168548583984375, "global_step": 191719, "epoch": 4564} {"train_loss": -7.173656463623047, "global_step": 191720, "epoch": 4564} {"train_loss": -7.183429718017578, "global_step": 191721, "epoch": 4564} {"train_loss": -7.2631988525390625, "global_step": 191722, "epoch": 4564} {"train_loss": -7.272465229034424, "global_step": 191723, "epoch": 4564} {"train_loss": -7.2545576095581055, "global_step": 191724, "epoch": 4564} {"train_loss": -7.1061530113220215, "global_step": 191725, "epoch": 4564} {"train_loss": -7.187765121459961, "global_step": 191726, "epoch": 4564} {"train_loss": -7.111766338348389, "global_step": 191727, "epoch": 4564} {"train_loss": -7.176152229309082, "global_step": 191728, "epoch": 4564} {"train_loss": -7.2236563591730025, "global_step": 191729, "epoch": 4564, "val_loss": 69719.2578125} {"train_loss": -7.2873921394348145, "global_step": 191730, "epoch": 4565} {"train_loss": -7.188660621643066, "global_step": 191731, "epoch": 4565} {"train_loss": -7.150775909423828, "global_step": 191732, "epoch": 4565} {"train_loss": -7.267136573791504, "global_step": 191733, "epoch": 4565} {"train_loss": -7.187412261962891, "global_step": 191734, "epoch": 4565} {"train_loss": -7.254419326782227, "global_step": 191735, "epoch": 4565} {"train_loss": -7.194113731384277, "global_step": 191736, "epoch": 4565} {"train_loss": -7.091798305511475, "global_step": 191737, "epoch": 4565} {"train_loss": -7.190975666046143, "global_step": 191738, "epoch": 4565} {"train_loss": -7.097099304199219, "global_step": 191739, "epoch": 4565} {"train_loss": -7.323553085327148, "global_step": 191740, "epoch": 4565} {"train_loss": -7.105337142944336, "global_step": 191741, "epoch": 4565} {"train_loss": -7.125324249267578, "global_step": 191742, "epoch": 4565} {"train_loss": -7.193023681640625, "global_step": 191743, "epoch": 4565} {"train_loss": -7.154910564422607, "global_step": 191744, "epoch": 4565} {"train_loss": -7.20120906829834, "global_step": 191745, "epoch": 4565} {"train_loss": -7.212244987487793, "global_step": 191746, "epoch": 4565} {"train_loss": -7.226592063903809, "global_step": 191747, "epoch": 4565} {"train_loss": -7.240882396697998, "global_step": 191748, "epoch": 4565} {"train_loss": -7.155218124389648, "global_step": 191749, "epoch": 4565} {"train_loss": -7.2584452629089355, "global_step": 191750, "epoch": 4565} {"train_loss": -7.1158061027526855, "global_step": 191751, "epoch": 4565} {"train_loss": -7.354738712310791, "global_step": 191752, "epoch": 4565} {"train_loss": -7.2108964920043945, "global_step": 191753, "epoch": 4565} {"train_loss": -7.1854166984558105, "global_step": 191754, "epoch": 4565} {"train_loss": -7.319820404052734, "global_step": 191755, "epoch": 4565} {"train_loss": -7.1333699226379395, "global_step": 191756, "epoch": 4565} {"train_loss": -7.088541030883789, "global_step": 191757, "epoch": 4565} {"train_loss": -7.144417762756348, "global_step": 191758, "epoch": 4565} {"train_loss": -7.105831146240234, "global_step": 191759, "epoch": 4565} {"train_loss": -7.142081260681152, "global_step": 191760, "epoch": 4565} {"train_loss": -7.227844715118408, "global_step": 191761, "epoch": 4565} {"train_loss": -7.201037406921387, "global_step": 191762, "epoch": 4565} {"train_loss": -7.320129871368408, "global_step": 191763, "epoch": 4565} {"train_loss": -7.252151966094971, "global_step": 191764, "epoch": 4565} {"train_loss": -7.2802629470825195, "global_step": 191765, "epoch": 4565} {"train_loss": -7.221861839294434, "global_step": 191766, "epoch": 4565} {"train_loss": -7.145509719848633, "global_step": 191767, "epoch": 4565} {"train_loss": -7.19689416885376, "global_step": 191768, "epoch": 4565} {"train_loss": -7.136509895324707, "global_step": 191769, "epoch": 4565} {"train_loss": -7.214132785797119, "global_step": 191770, "epoch": 4565} {"train_loss": -7.196095750445411, "global_step": 191771, "epoch": 4565, "val_loss": 69680.484375} {"train_loss": -7.1623382568359375, "global_step": 191772, "epoch": 4566} {"train_loss": -7.225823879241943, "global_step": 191773, "epoch": 4566} {"train_loss": -7.39837646484375, "global_step": 191774, "epoch": 4566} {"train_loss": -7.288999557495117, "global_step": 191775, "epoch": 4566} {"train_loss": -7.22210693359375, "global_step": 191776, "epoch": 4566} {"train_loss": -7.049530029296875, "global_step": 191777, "epoch": 4566} {"train_loss": -7.05009651184082, "global_step": 191778, "epoch": 4566} {"train_loss": -7.220427989959717, "global_step": 191779, "epoch": 4566} {"train_loss": -7.1724348068237305, "global_step": 191780, "epoch": 4566} {"train_loss": -7.292407035827637, "global_step": 191781, "epoch": 4566} {"train_loss": -7.157998085021973, "global_step": 191782, "epoch": 4566} {"train_loss": -7.12534236907959, "global_step": 191783, "epoch": 4566} {"train_loss": -7.1566243171691895, "global_step": 191784, "epoch": 4566} {"train_loss": -7.127316474914551, "global_step": 191785, "epoch": 4566} {"train_loss": -7.1787109375, "global_step": 191786, "epoch": 4566} {"train_loss": -7.177635192871094, "global_step": 191787, "epoch": 4566} {"train_loss": -7.341775894165039, "global_step": 191788, "epoch": 4566} {"train_loss": -7.252399444580078, "global_step": 191789, "epoch": 4566} {"train_loss": -7.215987205505371, "global_step": 191790, "epoch": 4566} {"train_loss": -7.2266130447387695, "global_step": 191791, "epoch": 4566} {"train_loss": -7.211395263671875, "global_step": 191792, "epoch": 4566} {"train_loss": -7.211262226104736, "global_step": 191793, "epoch": 4566} {"train_loss": -7.190061092376709, "global_step": 191794, "epoch": 4566} {"train_loss": -7.249526023864746, "global_step": 191795, "epoch": 4566} {"train_loss": -7.09427547454834, "global_step": 191796, "epoch": 4566} {"train_loss": -7.201986312866211, "global_step": 191797, "epoch": 4566} {"train_loss": -7.214898586273193, "global_step": 191798, "epoch": 4566} {"train_loss": -7.293667793273926, "global_step": 191799, "epoch": 4566} {"train_loss": -7.268847465515137, "global_step": 191800, "epoch": 4566} {"train_loss": -7.29497766494751, "global_step": 191801, "epoch": 4566} {"train_loss": -7.236639022827148, "global_step": 191802, "epoch": 4566} {"train_loss": -7.0998430252075195, "global_step": 191803, "epoch": 4566} {"train_loss": -7.248679161071777, "global_step": 191804, "epoch": 4566} {"train_loss": -7.165011405944824, "global_step": 191805, "epoch": 4566} {"train_loss": -7.233899116516113, "global_step": 191806, "epoch": 4566} {"train_loss": -7.198686599731445, "global_step": 191807, "epoch": 4566} {"train_loss": -7.015351295471191, "global_step": 191808, "epoch": 4566} {"train_loss": -7.157363414764404, "global_step": 191809, "epoch": 4566} {"train_loss": -7.120482921600342, "global_step": 191810, "epoch": 4566} {"train_loss": -7.19436502456665, "global_step": 191811, "epoch": 4566} {"train_loss": -7.196793556213379, "global_step": 191812, "epoch": 4566} {"train_loss": -7.19590729758853, "global_step": 191813, "epoch": 4566, "val_loss": 69616.8125} {"train_loss": -7.220437526702881, "global_step": 191814, "epoch": 4567} {"train_loss": -7.194657802581787, "global_step": 191815, "epoch": 4567} {"train_loss": -7.138014793395996, "global_step": 191816, "epoch": 4567} {"train_loss": -7.219921588897705, "global_step": 191817, "epoch": 4567} {"train_loss": -7.319014549255371, "global_step": 191818, "epoch": 4567} {"train_loss": -7.092206001281738, "global_step": 191819, "epoch": 4567} {"train_loss": -7.189480304718018, "global_step": 191820, "epoch": 4567} {"train_loss": -7.206314563751221, "global_step": 191821, "epoch": 4567} {"train_loss": -7.271514415740967, "global_step": 191822, "epoch": 4567} {"train_loss": -7.13998556137085, "global_step": 191823, "epoch": 4567} {"train_loss": -7.1436920166015625, "global_step": 191824, "epoch": 4567} {"train_loss": -7.157224655151367, "global_step": 191825, "epoch": 4567} {"train_loss": -7.076037883758545, "global_step": 191826, "epoch": 4567} {"train_loss": -7.055046081542969, "global_step": 191827, "epoch": 4567} {"train_loss": -7.179599761962891, "global_step": 191828, "epoch": 4567} {"train_loss": -7.109991073608398, "global_step": 191829, "epoch": 4567} {"train_loss": -7.033857345581055, "global_step": 191830, "epoch": 4567} {"train_loss": -7.166271686553955, "global_step": 191831, "epoch": 4567} {"train_loss": -7.023712158203125, "global_step": 191832, "epoch": 4567} {"train_loss": -6.960126876831055, "global_step": 191833, "epoch": 4567} {"train_loss": -7.196788787841797, "global_step": 191834, "epoch": 4567} {"train_loss": -6.987471580505371, "global_step": 191835, "epoch": 4567} {"train_loss": -7.089858055114746, "global_step": 191836, "epoch": 4567} {"train_loss": -7.03441047668457, "global_step": 191837, "epoch": 4567} {"train_loss": -7.182497024536133, "global_step": 191838, "epoch": 4567} {"train_loss": -7.12491512298584, "global_step": 191839, "epoch": 4567} {"train_loss": -7.129809379577637, "global_step": 191840, "epoch": 4567} {"train_loss": -7.303115367889404, "global_step": 191841, "epoch": 4567} {"train_loss": -7.071874618530273, "global_step": 191842, "epoch": 4567} {"train_loss": -7.127203941345215, "global_step": 191843, "epoch": 4567} {"train_loss": -7.210488319396973, "global_step": 191844, "epoch": 4567} {"train_loss": -7.18021821975708, "global_step": 191845, "epoch": 4567} {"train_loss": -7.174481391906738, "global_step": 191846, "epoch": 4567} {"train_loss": -7.127537727355957, "global_step": 191847, "epoch": 4567} {"train_loss": -7.117816925048828, "global_step": 191848, "epoch": 4567} {"train_loss": -7.244650840759277, "global_step": 191849, "epoch": 4567} {"train_loss": -7.065041542053223, "global_step": 191850, "epoch": 4567} {"train_loss": -7.215937614440918, "global_step": 191851, "epoch": 4567} {"train_loss": -7.214400768280029, "global_step": 191852, "epoch": 4567} {"train_loss": -7.2382659912109375, "global_step": 191853, "epoch": 4567} {"train_loss": -7.184810638427734, "global_step": 191854, "epoch": 4567} {"train_loss": -7.150471074240548, "global_step": 191855, "epoch": 4567, "val_loss": 69653.6640625} {"train_loss": -7.222962379455566, "global_step": 191856, "epoch": 4568} {"train_loss": -7.257197380065918, "global_step": 191857, "epoch": 4568} {"train_loss": -7.1644287109375, "global_step": 191858, "epoch": 4568} {"train_loss": -7.163285255432129, "global_step": 191859, "epoch": 4568} {"train_loss": -7.097667217254639, "global_step": 191860, "epoch": 4568} {"train_loss": -7.1259965896606445, "global_step": 191861, "epoch": 4568} {"train_loss": -7.214341163635254, "global_step": 191862, "epoch": 4568} {"train_loss": -7.206997871398926, "global_step": 191863, "epoch": 4568} {"train_loss": -7.209685325622559, "global_step": 191864, "epoch": 4568} {"train_loss": -7.174413681030273, "global_step": 191865, "epoch": 4568} {"train_loss": -7.173257827758789, "global_step": 191866, "epoch": 4568} {"train_loss": -7.2131452560424805, "global_step": 191867, "epoch": 4568} {"train_loss": -7.247281551361084, "global_step": 191868, "epoch": 4568} {"train_loss": -7.182465076446533, "global_step": 191869, "epoch": 4568} {"train_loss": -7.310614109039307, "global_step": 191870, "epoch": 4568} {"train_loss": -7.200182914733887, "global_step": 191871, "epoch": 4568} {"train_loss": -7.152066230773926, "global_step": 191872, "epoch": 4568} {"train_loss": -7.2192840576171875, "global_step": 191873, "epoch": 4568} {"train_loss": -7.085331916809082, "global_step": 191874, "epoch": 4568} {"train_loss": -7.158341407775879, "global_step": 191875, "epoch": 4568} {"train_loss": -7.130348205566406, "global_step": 191876, "epoch": 4568} {"train_loss": -7.149176597595215, "global_step": 191877, "epoch": 4568} {"train_loss": -7.153369903564453, "global_step": 191878, "epoch": 4568} {"train_loss": -7.16148567199707, "global_step": 191879, "epoch": 4568} {"train_loss": -7.019918441772461, "global_step": 191880, "epoch": 4568} {"train_loss": -7.288257598876953, "global_step": 191881, "epoch": 4568} {"train_loss": -7.165523529052734, "global_step": 191882, "epoch": 4568} {"train_loss": -7.144418716430664, "global_step": 191883, "epoch": 4568} {"train_loss": -7.382993221282959, "global_step": 191884, "epoch": 4568} {"train_loss": -7.233870506286621, "global_step": 191885, "epoch": 4568} {"train_loss": -7.217087745666504, "global_step": 191886, "epoch": 4568} {"train_loss": -7.2327399253845215, "global_step": 191887, "epoch": 4568} {"train_loss": -7.226339340209961, "global_step": 191888, "epoch": 4568} {"train_loss": -7.320305347442627, "global_step": 191889, "epoch": 4568} {"train_loss": -7.234176158905029, "global_step": 191890, "epoch": 4568} {"train_loss": -7.192024230957031, "global_step": 191891, "epoch": 4568} {"train_loss": -7.224969863891602, "global_step": 191892, "epoch": 4568} {"train_loss": -7.2609052658081055, "global_step": 191893, "epoch": 4568} {"train_loss": -7.198370933532715, "global_step": 191894, "epoch": 4568} {"train_loss": -7.1164326667785645, "global_step": 191895, "epoch": 4568} {"train_loss": -7.204172611236572, "global_step": 191896, "epoch": 4568} {"train_loss": -7.196763004575457, "global_step": 191897, "epoch": 4568, "val_loss": 69702.609375} {"train_loss": -7.250765800476074, "global_step": 191898, "epoch": 4569} {"train_loss": -7.084216117858887, "global_step": 191899, "epoch": 4569} {"train_loss": -7.166845798492432, "global_step": 191900, "epoch": 4569} {"train_loss": -7.0945940017700195, "global_step": 191901, "epoch": 4569} {"train_loss": -7.0405473709106445, "global_step": 191902, "epoch": 4569} {"train_loss": -7.244140148162842, "global_step": 191903, "epoch": 4569} {"train_loss": -7.031673431396484, "global_step": 191904, "epoch": 4569} {"train_loss": -7.087545394897461, "global_step": 191905, "epoch": 4569} {"train_loss": -7.2415924072265625, "global_step": 191906, "epoch": 4569} {"train_loss": -7.286860942840576, "global_step": 191907, "epoch": 4569} {"train_loss": -7.217477798461914, "global_step": 191908, "epoch": 4569} {"train_loss": -7.131518840789795, "global_step": 191909, "epoch": 4569} {"train_loss": -7.286896228790283, "global_step": 191910, "epoch": 4569} {"train_loss": -7.210799217224121, "global_step": 191911, "epoch": 4569} {"train_loss": -7.239640235900879, "global_step": 191912, "epoch": 4569} {"train_loss": -7.0596818923950195, "global_step": 191913, "epoch": 4569} {"train_loss": -7.154690742492676, "global_step": 191914, "epoch": 4569} {"train_loss": -7.215378761291504, "global_step": 191915, "epoch": 4569} {"train_loss": -7.085762023925781, "global_step": 191916, "epoch": 4569} {"train_loss": -7.097978591918945, "global_step": 191917, "epoch": 4569} {"train_loss": -7.29279899597168, "global_step": 191918, "epoch": 4569} {"train_loss": -7.174128532409668, "global_step": 191919, "epoch": 4569} {"train_loss": -7.212282657623291, "global_step": 191920, "epoch": 4569} {"train_loss": -7.2270612716674805, "global_step": 191921, "epoch": 4569} {"train_loss": -7.251877307891846, "global_step": 191922, "epoch": 4569} {"train_loss": -7.309762001037598, "global_step": 191923, "epoch": 4569} {"train_loss": -7.233023643493652, "global_step": 191924, "epoch": 4569} {"train_loss": -7.273262023925781, "global_step": 191925, "epoch": 4569} {"train_loss": -7.236170768737793, "global_step": 191926, "epoch": 4569} {"train_loss": -7.3195013999938965, "global_step": 191927, "epoch": 4569} {"train_loss": -7.251155376434326, "global_step": 191928, "epoch": 4569} {"train_loss": -7.239535331726074, "global_step": 191929, "epoch": 4569} {"train_loss": -7.282648086547852, "global_step": 191930, "epoch": 4569} {"train_loss": -7.171601295471191, "global_step": 191931, "epoch": 4569} {"train_loss": -7.238492012023926, "global_step": 191932, "epoch": 4569} {"train_loss": -7.244375705718994, "global_step": 191933, "epoch": 4569} {"train_loss": -7.334770202636719, "global_step": 191934, "epoch": 4569} {"train_loss": -7.248533248901367, "global_step": 191935, "epoch": 4569} {"train_loss": -7.317785263061523, "global_step": 191936, "epoch": 4569} {"train_loss": -7.131930351257324, "global_step": 191937, "epoch": 4569} {"train_loss": -7.299081802368164, "global_step": 191938, "epoch": 4569} {"train_loss": -7.213430790674119, "global_step": 191939, "epoch": 4569, "val_loss": 69652.96875} {"train_loss": -7.317636489868164, "global_step": 191940, "epoch": 4570} {"train_loss": -7.303388595581055, "global_step": 191941, "epoch": 4570} {"train_loss": -7.29611873626709, "global_step": 191942, "epoch": 4570} {"train_loss": -7.250349998474121, "global_step": 191943, "epoch": 4570} {"train_loss": -7.245745658874512, "global_step": 191944, "epoch": 4570} {"train_loss": -7.368281364440918, "global_step": 191945, "epoch": 4570} {"train_loss": -7.3574323654174805, "global_step": 191946, "epoch": 4570} {"train_loss": -7.293749809265137, "global_step": 191947, "epoch": 4570} {"train_loss": -7.352699279785156, "global_step": 191948, "epoch": 4570} {"train_loss": -7.226222038269043, "global_step": 191949, "epoch": 4570} {"train_loss": -7.1114115715026855, "global_step": 191950, "epoch": 4570} {"train_loss": -7.223846912384033, "global_step": 191951, "epoch": 4570} {"train_loss": -7.22018575668335, "global_step": 191952, "epoch": 4570} {"train_loss": -7.342926979064941, "global_step": 191953, "epoch": 4570} {"train_loss": -7.257320404052734, "global_step": 191954, "epoch": 4570} {"train_loss": -7.245118141174316, "global_step": 191955, "epoch": 4570} {"train_loss": -7.267522811889648, "global_step": 191956, "epoch": 4570} {"train_loss": -7.365777969360352, "global_step": 191957, "epoch": 4570} {"train_loss": -7.366369724273682, "global_step": 191958, "epoch": 4570} {"train_loss": -7.2846903800964355, "global_step": 191959, "epoch": 4570} {"train_loss": -7.234398365020752, "global_step": 191960, "epoch": 4570} {"train_loss": -7.242222785949707, "global_step": 191961, "epoch": 4570} {"train_loss": -7.34027624130249, "global_step": 191962, "epoch": 4570} {"train_loss": -7.182655334472656, "global_step": 191963, "epoch": 4570} {"train_loss": -7.3920207023620605, "global_step": 191964, "epoch": 4570} {"train_loss": -7.295446395874023, "global_step": 191965, "epoch": 4570} {"train_loss": -7.318686485290527, "global_step": 191966, "epoch": 4570} {"train_loss": -7.190042972564697, "global_step": 191967, "epoch": 4570} {"train_loss": -7.21549654006958, "global_step": 191968, "epoch": 4570} {"train_loss": -7.322416305541992, "global_step": 191969, "epoch": 4570} {"train_loss": -7.207314491271973, "global_step": 191970, "epoch": 4570} {"train_loss": -6.944965839385986, "global_step": 191971, "epoch": 4570} {"train_loss": -7.143686294555664, "global_step": 191972, "epoch": 4570} {"train_loss": -7.071489334106445, "global_step": 191973, "epoch": 4570} {"train_loss": -7.2170915603637695, "global_step": 191974, "epoch": 4570} {"train_loss": -7.252426624298096, "global_step": 191975, "epoch": 4570} {"train_loss": -7.211241722106934, "global_step": 191976, "epoch": 4570} {"train_loss": -7.137815952301025, "global_step": 191977, "epoch": 4570} {"train_loss": -7.226336479187012, "global_step": 191978, "epoch": 4570} {"train_loss": -7.2145280838012695, "global_step": 191979, "epoch": 4570} {"train_loss": -7.2475128173828125, "global_step": 191980, "epoch": 4570} {"train_loss": -7.248964457284837, "global_step": 191981, "epoch": 4570, "val_loss": 69772.828125} {"train_loss": -7.246151924133301, "global_step": 191982, "epoch": 4571} {"train_loss": -7.282861709594727, "global_step": 191983, "epoch": 4571} {"train_loss": -7.258638381958008, "global_step": 191984, "epoch": 4571} {"train_loss": -7.2731170654296875, "global_step": 191985, "epoch": 4571} {"train_loss": -7.285114288330078, "global_step": 191986, "epoch": 4571} {"train_loss": -7.220821380615234, "global_step": 191987, "epoch": 4571} {"train_loss": -7.173094749450684, "global_step": 191988, "epoch": 4571} {"train_loss": -7.190173625946045, "global_step": 191989, "epoch": 4571} {"train_loss": -7.214308738708496, "global_step": 191990, "epoch": 4571} {"train_loss": -7.171785354614258, "global_step": 191991, "epoch": 4571} {"train_loss": -7.200175762176514, "global_step": 191992, "epoch": 4571} {"train_loss": -6.980534076690674, "global_step": 191993, "epoch": 4571} {"train_loss": -7.124692916870117, "global_step": 191994, "epoch": 4571} {"train_loss": -7.125546932220459, "global_step": 191995, "epoch": 4571} {"train_loss": -6.972160339355469, "global_step": 191996, "epoch": 4571} {"train_loss": -6.662292003631592, "global_step": 191997, "epoch": 4571} {"train_loss": -7.076076030731201, "global_step": 191998, "epoch": 4571} {"train_loss": -7.10975456237793, "global_step": 191999, "epoch": 4571} {"train_loss": -6.87157678604126, "global_step": 192000, "epoch": 4571} {"train_loss": -7.136280536651611, "global_step": 192001, "epoch": 4571} {"train_loss": -6.959181785583496, "global_step": 192002, "epoch": 4571} {"train_loss": -7.157060623168945, "global_step": 192003, "epoch": 4571} {"train_loss": -7.099906921386719, "global_step": 192004, "epoch": 4571} {"train_loss": -6.890334129333496, "global_step": 192005, "epoch": 4571} {"train_loss": -7.054624557495117, "global_step": 192006, "epoch": 4571} {"train_loss": -6.987932205200195, "global_step": 192007, "epoch": 4571} {"train_loss": -7.043330192565918, "global_step": 192008, "epoch": 4571} {"train_loss": -7.088406562805176, "global_step": 192009, "epoch": 4571} {"train_loss": -7.085042953491211, "global_step": 192010, "epoch": 4571} {"train_loss": -6.952103614807129, "global_step": 192011, "epoch": 4571} {"train_loss": -6.9718451499938965, "global_step": 192012, "epoch": 4571} {"train_loss": -7.068120002746582, "global_step": 192013, "epoch": 4571} {"train_loss": -6.925915718078613, "global_step": 192014, "epoch": 4571} {"train_loss": -7.025928974151611, "global_step": 192015, "epoch": 4571} {"train_loss": -6.86722469329834, "global_step": 192016, "epoch": 4571} {"train_loss": -6.962606430053711, "global_step": 192017, "epoch": 4571} {"train_loss": -7.060283184051514, "global_step": 192018, "epoch": 4571} {"train_loss": -6.94818115234375, "global_step": 192019, "epoch": 4571} {"train_loss": -7.09991979598999, "global_step": 192020, "epoch": 4571} {"train_loss": -6.916812896728516, "global_step": 192021, "epoch": 4571} {"train_loss": -6.959619522094727, "global_step": 192022, "epoch": 4571} {"train_loss": -7.062851304099674, "global_step": 192023, "epoch": 4571, "val_loss": 69722.3984375} {"train_loss": -7.143830299377441, "global_step": 192024, "epoch": 4572} {"train_loss": -6.890704154968262, "global_step": 192025, "epoch": 4572} {"train_loss": -7.126490116119385, "global_step": 192026, "epoch": 4572} {"train_loss": -6.975286483764648, "global_step": 192027, "epoch": 4572} {"train_loss": -7.144757270812988, "global_step": 192028, "epoch": 4572} {"train_loss": -7.158778667449951, "global_step": 192029, "epoch": 4572} {"train_loss": -7.136916160583496, "global_step": 192030, "epoch": 4572} {"train_loss": -7.178716659545898, "global_step": 192031, "epoch": 4572} {"train_loss": -7.2115797996521, "global_step": 192032, "epoch": 4572} {"train_loss": -7.15887975692749, "global_step": 192033, "epoch": 4572} {"train_loss": -7.116148948669434, "global_step": 192034, "epoch": 4572} {"train_loss": -7.228726863861084, "global_step": 192035, "epoch": 4572} {"train_loss": -7.122353553771973, "global_step": 192036, "epoch": 4572} {"train_loss": -7.207375526428223, "global_step": 192037, "epoch": 4572} {"train_loss": -7.193043231964111, "global_step": 192038, "epoch": 4572} {"train_loss": -7.21939754486084, "global_step": 192039, "epoch": 4572} {"train_loss": -7.2691650390625, "global_step": 192040, "epoch": 4572} {"train_loss": -7.063865661621094, "global_step": 192041, "epoch": 4572} {"train_loss": -7.289155960083008, "global_step": 192042, "epoch": 4572} {"train_loss": -7.193570613861084, "global_step": 192043, "epoch": 4572} {"train_loss": -7.257413864135742, "global_step": 192044, "epoch": 4572} {"train_loss": -7.128636837005615, "global_step": 192045, "epoch": 4572} {"train_loss": -7.236227512359619, "global_step": 192046, "epoch": 4572} {"train_loss": -7.234382152557373, "global_step": 192047, "epoch": 4572} {"train_loss": -7.31706428527832, "global_step": 192048, "epoch": 4572} {"train_loss": -7.21323823928833, "global_step": 192049, "epoch": 4572} {"train_loss": -7.181528568267822, "global_step": 192050, "epoch": 4572} {"train_loss": -7.211415767669678, "global_step": 192051, "epoch": 4572} {"train_loss": -7.262689113616943, "global_step": 192052, "epoch": 4572} {"train_loss": -7.107648849487305, "global_step": 192053, "epoch": 4572} {"train_loss": -7.189136505126953, "global_step": 192054, "epoch": 4572} {"train_loss": -7.220940589904785, "global_step": 192055, "epoch": 4572} {"train_loss": -7.029939651489258, "global_step": 192056, "epoch": 4572} {"train_loss": -7.277531623840332, "global_step": 192057, "epoch": 4572} {"train_loss": -7.124074935913086, "global_step": 192058, "epoch": 4572} {"train_loss": -7.188152313232422, "global_step": 192059, "epoch": 4572} {"train_loss": -7.1406354904174805, "global_step": 192060, "epoch": 4572} {"train_loss": -7.143712043762207, "global_step": 192061, "epoch": 4572} {"train_loss": -7.164397239685059, "global_step": 192062, "epoch": 4572} {"train_loss": -7.314212799072266, "global_step": 192063, "epoch": 4572} {"train_loss": -7.256591796875, "global_step": 192064, "epoch": 4572} {"train_loss": -7.176145678474789, "global_step": 192065, "epoch": 4572, "val_loss": 69542.921875} {"train_loss": -7.338204383850098, "global_step": 192066, "epoch": 4573} {"train_loss": -7.2179646492004395, "global_step": 192067, "epoch": 4573} {"train_loss": -7.141038417816162, "global_step": 192068, "epoch": 4573} {"train_loss": -7.207906246185303, "global_step": 192069, "epoch": 4573} {"train_loss": -7.358502388000488, "global_step": 192070, "epoch": 4573} {"train_loss": -7.265518665313721, "global_step": 192071, "epoch": 4573} {"train_loss": -7.251137733459473, "global_step": 192072, "epoch": 4573} {"train_loss": -7.247519493103027, "global_step": 192073, "epoch": 4573} {"train_loss": -7.289096832275391, "global_step": 192074, "epoch": 4573} {"train_loss": -7.231352806091309, "global_step": 192075, "epoch": 4573} {"train_loss": -7.24570894241333, "global_step": 192076, "epoch": 4573} {"train_loss": -7.272205352783203, "global_step": 192077, "epoch": 4573} {"train_loss": -7.194753646850586, "global_step": 192078, "epoch": 4573} {"train_loss": -7.393274307250977, "global_step": 192079, "epoch": 4573} {"train_loss": -7.299531936645508, "global_step": 192080, "epoch": 4573} {"train_loss": -7.126274108886719, "global_step": 192081, "epoch": 4573} {"train_loss": -7.314084053039551, "global_step": 192082, "epoch": 4573} {"train_loss": -7.292698860168457, "global_step": 192083, "epoch": 4573} {"train_loss": -7.282093048095703, "global_step": 192084, "epoch": 4573} {"train_loss": -7.271444797515869, "global_step": 192085, "epoch": 4573} {"train_loss": -7.242578029632568, "global_step": 192086, "epoch": 4573} {"train_loss": -7.172923564910889, "global_step": 192087, "epoch": 4573} {"train_loss": -7.308469772338867, "global_step": 192088, "epoch": 4573} {"train_loss": -7.2127509117126465, "global_step": 192089, "epoch": 4573} {"train_loss": -7.221199989318848, "global_step": 192090, "epoch": 4573} {"train_loss": -7.297904014587402, "global_step": 192091, "epoch": 4573} {"train_loss": -7.24006462097168, "global_step": 192092, "epoch": 4573} {"train_loss": -7.285508155822754, "global_step": 192093, "epoch": 4573} {"train_loss": -7.313462257385254, "global_step": 192094, "epoch": 4573} {"train_loss": -7.222114562988281, "global_step": 192095, "epoch": 4573} {"train_loss": -7.195751190185547, "global_step": 192096, "epoch": 4573} {"train_loss": -7.191483497619629, "global_step": 192097, "epoch": 4573} {"train_loss": -7.083669185638428, "global_step": 192098, "epoch": 4573} {"train_loss": -7.098668098449707, "global_step": 192099, "epoch": 4573} {"train_loss": -7.105755805969238, "global_step": 192100, "epoch": 4573} {"train_loss": -7.069372653961182, "global_step": 192101, "epoch": 4573} {"train_loss": -7.134344100952148, "global_step": 192102, "epoch": 4573} {"train_loss": -7.211958885192871, "global_step": 192103, "epoch": 4573} {"train_loss": -7.091876029968262, "global_step": 192104, "epoch": 4573} {"train_loss": -7.0648908615112305, "global_step": 192105, "epoch": 4573} {"train_loss": -7.085524082183838, "global_step": 192106, "epoch": 4573} {"train_loss": -7.218308244432722, "global_step": 192107, "epoch": 4573, "val_loss": 69683.8671875} {"train_loss": -7.148910045623779, "global_step": 192108, "epoch": 4574} {"train_loss": -7.123180389404297, "global_step": 192109, "epoch": 4574} {"train_loss": -7.1329874992370605, "global_step": 192110, "epoch": 4574} {"train_loss": -7.202000617980957, "global_step": 192111, "epoch": 4574} {"train_loss": -7.180034160614014, "global_step": 192112, "epoch": 4574} {"train_loss": -7.181070804595947, "global_step": 192113, "epoch": 4574} {"train_loss": -7.22103214263916, "global_step": 192114, "epoch": 4574} {"train_loss": -7.208975315093994, "global_step": 192115, "epoch": 4574} {"train_loss": -7.281909942626953, "global_step": 192116, "epoch": 4574} {"train_loss": -7.275940895080566, "global_step": 192117, "epoch": 4574} {"train_loss": -7.250329971313477, "global_step": 192118, "epoch": 4574} {"train_loss": -7.278111457824707, "global_step": 192119, "epoch": 4574} {"train_loss": -7.280091285705566, "global_step": 192120, "epoch": 4574} {"train_loss": -7.243020057678223, "global_step": 192121, "epoch": 4574} {"train_loss": -7.318253993988037, "global_step": 192122, "epoch": 4574} {"train_loss": -7.257443428039551, "global_step": 192123, "epoch": 4574} {"train_loss": -7.2750654220581055, "global_step": 192124, "epoch": 4574} {"train_loss": -7.287352561950684, "global_step": 192125, "epoch": 4574} {"train_loss": -7.10743522644043, "global_step": 192126, "epoch": 4574} {"train_loss": -7.273483753204346, "global_step": 192127, "epoch": 4574} {"train_loss": -7.189499855041504, "global_step": 192128, "epoch": 4574} {"train_loss": -7.266849517822266, "global_step": 192129, "epoch": 4574} {"train_loss": -7.193693161010742, "global_step": 192130, "epoch": 4574} {"train_loss": -7.242931842803955, "global_step": 192131, "epoch": 4574} {"train_loss": -7.319184303283691, "global_step": 192132, "epoch": 4574} {"train_loss": -7.158070087432861, "global_step": 192133, "epoch": 4574} {"train_loss": -6.9782915115356445, "global_step": 192134, "epoch": 4574} {"train_loss": -7.144952297210693, "global_step": 192135, "epoch": 4574} {"train_loss": -7.32203483581543, "global_step": 192136, "epoch": 4574} {"train_loss": -7.18284273147583, "global_step": 192137, "epoch": 4574} {"train_loss": -7.12532377243042, "global_step": 192138, "epoch": 4574} {"train_loss": -7.186025142669678, "global_step": 192139, "epoch": 4574} {"train_loss": -7.231647491455078, "global_step": 192140, "epoch": 4574} {"train_loss": -7.2032365798950195, "global_step": 192141, "epoch": 4574} {"train_loss": -7.247072219848633, "global_step": 192142, "epoch": 4574} {"train_loss": -7.181297302246094, "global_step": 192143, "epoch": 4574} {"train_loss": -7.298654556274414, "global_step": 192144, "epoch": 4574} {"train_loss": -7.197128772735596, "global_step": 192145, "epoch": 4574} {"train_loss": -7.25584077835083, "global_step": 192146, "epoch": 4574} {"train_loss": -7.286375999450684, "global_step": 192147, "epoch": 4574} {"train_loss": -7.159939765930176, "global_step": 192148, "epoch": 4574} {"train_loss": -7.216374158859253, "global_step": 192149, "epoch": 4574, "val_loss": 69656.8515625} {"train_loss": -7.283738136291504, "global_step": 192150, "epoch": 4575} {"train_loss": -7.3159894943237305, "global_step": 192151, "epoch": 4575} {"train_loss": -7.25714111328125, "global_step": 192152, "epoch": 4575} {"train_loss": -7.131599426269531, "global_step": 192153, "epoch": 4575} {"train_loss": -7.1846466064453125, "global_step": 192154, "epoch": 4575} {"train_loss": -7.226496696472168, "global_step": 192155, "epoch": 4575} {"train_loss": -7.303563117980957, "global_step": 192156, "epoch": 4575} {"train_loss": -7.292641639709473, "global_step": 192157, "epoch": 4575} {"train_loss": -7.084360122680664, "global_step": 192158, "epoch": 4575} {"train_loss": -7.227631092071533, "global_step": 192159, "epoch": 4575} {"train_loss": -7.207223892211914, "global_step": 192160, "epoch": 4575} {"train_loss": -7.250818252563477, "global_step": 192161, "epoch": 4575} {"train_loss": -7.2866716384887695, "global_step": 192162, "epoch": 4575} {"train_loss": -7.229570388793945, "global_step": 192163, "epoch": 4575} {"train_loss": -7.252157688140869, "global_step": 192164, "epoch": 4575} {"train_loss": -7.326028347015381, "global_step": 192165, "epoch": 4575} {"train_loss": -7.279092788696289, "global_step": 192166, "epoch": 4575} {"train_loss": -7.195879936218262, "global_step": 192167, "epoch": 4575} {"train_loss": -7.309321403503418, "global_step": 192168, "epoch": 4575} {"train_loss": -7.324477195739746, "global_step": 192169, "epoch": 4575} {"train_loss": -7.185456275939941, "global_step": 192170, "epoch": 4575} {"train_loss": -7.267991065979004, "global_step": 192171, "epoch": 4575} {"train_loss": -7.132040977478027, "global_step": 192172, "epoch": 4575} {"train_loss": -7.268603324890137, "global_step": 192173, "epoch": 4575} {"train_loss": -7.317032337188721, "global_step": 192174, "epoch": 4575} {"train_loss": -7.2767510414123535, "global_step": 192175, "epoch": 4575} {"train_loss": -7.122088432312012, "global_step": 192176, "epoch": 4575} {"train_loss": -7.323657989501953, "global_step": 192177, "epoch": 4575} {"train_loss": -7.182985305786133, "global_step": 192178, "epoch": 4575} {"train_loss": -7.10004186630249, "global_step": 192179, "epoch": 4575} {"train_loss": -7.256723880767822, "global_step": 192180, "epoch": 4575} {"train_loss": -7.283554553985596, "global_step": 192181, "epoch": 4575} {"train_loss": -7.204413414001465, "global_step": 192182, "epoch": 4575} {"train_loss": -7.294768333435059, "global_step": 192183, "epoch": 4575} {"train_loss": -7.295228958129883, "global_step": 192184, "epoch": 4575} {"train_loss": -7.166232109069824, "global_step": 192185, "epoch": 4575} {"train_loss": -7.282999038696289, "global_step": 192186, "epoch": 4575} {"train_loss": -7.238000392913818, "global_step": 192187, "epoch": 4575} {"train_loss": -7.252299785614014, "global_step": 192188, "epoch": 4575} {"train_loss": -7.292908191680908, "global_step": 192189, "epoch": 4575} {"train_loss": -7.133101940155029, "global_step": 192190, "epoch": 4575} {"train_loss": -7.239511137916928, "global_step": 192191, "epoch": 4575, "val_loss": 69610.7109375} {"train_loss": -7.233645915985107, "global_step": 192192, "epoch": 4576} {"train_loss": -7.24713134765625, "global_step": 192193, "epoch": 4576} {"train_loss": -7.230440139770508, "global_step": 192194, "epoch": 4576} {"train_loss": -7.171926021575928, "global_step": 192195, "epoch": 4576} {"train_loss": -7.173863410949707, "global_step": 192196, "epoch": 4576} {"train_loss": -7.100083351135254, "global_step": 192197, "epoch": 4576} {"train_loss": -7.08101749420166, "global_step": 192198, "epoch": 4576} {"train_loss": -7.245635509490967, "global_step": 192199, "epoch": 4576} {"train_loss": -7.183990478515625, "global_step": 192200, "epoch": 4576} {"train_loss": -7.237320423126221, "global_step": 192201, "epoch": 4576} {"train_loss": -7.154311180114746, "global_step": 192202, "epoch": 4576} {"train_loss": -7.235618591308594, "global_step": 192203, "epoch": 4576} {"train_loss": -7.286460876464844, "global_step": 192204, "epoch": 4576} {"train_loss": -7.128273010253906, "global_step": 192205, "epoch": 4576} {"train_loss": -7.216335773468018, "global_step": 192206, "epoch": 4576} {"train_loss": -7.161273002624512, "global_step": 192207, "epoch": 4576} {"train_loss": -7.139368057250977, "global_step": 192208, "epoch": 4576} {"train_loss": -7.300405025482178, "global_step": 192209, "epoch": 4576} {"train_loss": -7.175295352935791, "global_step": 192210, "epoch": 4576} {"train_loss": -7.1546630859375, "global_step": 192211, "epoch": 4576} {"train_loss": -7.2192792892456055, "global_step": 192212, "epoch": 4576} {"train_loss": -7.212360382080078, "global_step": 192213, "epoch": 4576} {"train_loss": -7.148227214813232, "global_step": 192214, "epoch": 4576} {"train_loss": -7.267449855804443, "global_step": 192215, "epoch": 4576} {"train_loss": -7.21578311920166, "global_step": 192216, "epoch": 4576} {"train_loss": -7.137757301330566, "global_step": 192217, "epoch": 4576} {"train_loss": -7.322087287902832, "global_step": 192218, "epoch": 4576} {"train_loss": -7.239642143249512, "global_step": 192219, "epoch": 4576} {"train_loss": -7.22530460357666, "global_step": 192220, "epoch": 4576} {"train_loss": -7.213050842285156, "global_step": 192221, "epoch": 4576} {"train_loss": -7.166657447814941, "global_step": 192222, "epoch": 4576} {"train_loss": -7.2848310470581055, "global_step": 192223, "epoch": 4576} {"train_loss": -7.208547592163086, "global_step": 192224, "epoch": 4576} {"train_loss": -7.310101509094238, "global_step": 192225, "epoch": 4576} {"train_loss": -7.207025527954102, "global_step": 192226, "epoch": 4576} {"train_loss": -7.172032833099365, "global_step": 192227, "epoch": 4576} {"train_loss": -7.227202415466309, "global_step": 192228, "epoch": 4576} {"train_loss": -7.14704704284668, "global_step": 192229, "epoch": 4576} {"train_loss": -7.2552642822265625, "global_step": 192230, "epoch": 4576} {"train_loss": -7.227453231811523, "global_step": 192231, "epoch": 4576} {"train_loss": -7.245809555053711, "global_step": 192232, "epoch": 4576} {"train_loss": -7.206722145988827, "global_step": 192233, "epoch": 4576, "val_loss": 69735.375} {"train_loss": -7.124032020568848, "global_step": 192234, "epoch": 4577} {"train_loss": -7.133241176605225, "global_step": 192235, "epoch": 4577} {"train_loss": -7.192694664001465, "global_step": 192236, "epoch": 4577} {"train_loss": -7.227579116821289, "global_step": 192237, "epoch": 4577} {"train_loss": -7.170633316040039, "global_step": 192238, "epoch": 4577} {"train_loss": -7.078124046325684, "global_step": 192239, "epoch": 4577} {"train_loss": -7.243654251098633, "global_step": 192240, "epoch": 4577} {"train_loss": -7.1284990310668945, "global_step": 192241, "epoch": 4577} {"train_loss": -7.273775577545166, "global_step": 192242, "epoch": 4577} {"train_loss": -7.188183784484863, "global_step": 192243, "epoch": 4577} {"train_loss": -7.195701599121094, "global_step": 192244, "epoch": 4577} {"train_loss": -7.343306541442871, "global_step": 192245, "epoch": 4577} {"train_loss": -7.256564617156982, "global_step": 192246, "epoch": 4577} {"train_loss": -7.201752662658691, "global_step": 192247, "epoch": 4577} {"train_loss": -7.121819019317627, "global_step": 192248, "epoch": 4577} {"train_loss": -6.989485740661621, "global_step": 192249, "epoch": 4577} {"train_loss": -7.3659210205078125, "global_step": 192250, "epoch": 4577} {"train_loss": -7.197010040283203, "global_step": 192251, "epoch": 4577} {"train_loss": -7.097433567047119, "global_step": 192252, "epoch": 4577} {"train_loss": -7.1672043800354, "global_step": 192253, "epoch": 4577} {"train_loss": -7.171865940093994, "global_step": 192254, "epoch": 4577} {"train_loss": -7.264591217041016, "global_step": 192255, "epoch": 4577} {"train_loss": -7.167842864990234, "global_step": 192256, "epoch": 4577} {"train_loss": -7.121830463409424, "global_step": 192257, "epoch": 4577} {"train_loss": -7.289459705352783, "global_step": 192258, "epoch": 4577} {"train_loss": -7.149279594421387, "global_step": 192259, "epoch": 4577} {"train_loss": -7.196836948394775, "global_step": 192260, "epoch": 4577} {"train_loss": -7.289936542510986, "global_step": 192261, "epoch": 4577} {"train_loss": -7.16970157623291, "global_step": 192262, "epoch": 4577} {"train_loss": -7.156407833099365, "global_step": 192263, "epoch": 4577} {"train_loss": -7.1029887199401855, "global_step": 192264, "epoch": 4577} {"train_loss": -7.312647819519043, "global_step": 192265, "epoch": 4577} {"train_loss": -7.203978061676025, "global_step": 192266, "epoch": 4577} {"train_loss": -7.1692705154418945, "global_step": 192267, "epoch": 4577} {"train_loss": -7.101116180419922, "global_step": 192268, "epoch": 4577} {"train_loss": -7.314439296722412, "global_step": 192269, "epoch": 4577} {"train_loss": -7.245352745056152, "global_step": 192270, "epoch": 4577} {"train_loss": -7.3070173263549805, "global_step": 192271, "epoch": 4577} {"train_loss": -7.226846694946289, "global_step": 192272, "epoch": 4577} {"train_loss": -7.305544853210449, "global_step": 192273, "epoch": 4577} {"train_loss": -7.18386173248291, "global_step": 192274, "epoch": 4577} {"train_loss": -7.197264035542806, "global_step": 192275, "epoch": 4577, "val_loss": 69727.8515625} {"train_loss": -7.226049423217773, "global_step": 192276, "epoch": 4578} {"train_loss": -7.336268901824951, "global_step": 192277, "epoch": 4578} {"train_loss": -7.3054046630859375, "global_step": 192278, "epoch": 4578} {"train_loss": -7.351815223693848, "global_step": 192279, "epoch": 4578} {"train_loss": -7.239031791687012, "global_step": 192280, "epoch": 4578} {"train_loss": -7.202893257141113, "global_step": 192281, "epoch": 4578} {"train_loss": -7.311635494232178, "global_step": 192282, "epoch": 4578} {"train_loss": -7.276823997497559, "global_step": 192283, "epoch": 4578} {"train_loss": -7.1947922706604, "global_step": 192284, "epoch": 4578} {"train_loss": -7.301084518432617, "global_step": 192285, "epoch": 4578} {"train_loss": -7.32276725769043, "global_step": 192286, "epoch": 4578} {"train_loss": -7.193112850189209, "global_step": 192287, "epoch": 4578} {"train_loss": -7.3319411277771, "global_step": 192288, "epoch": 4578} {"train_loss": -7.398693084716797, "global_step": 192289, "epoch": 4578} {"train_loss": -7.19648551940918, "global_step": 192290, "epoch": 4578} {"train_loss": -7.294809341430664, "global_step": 192291, "epoch": 4578} {"train_loss": -7.235103607177734, "global_step": 192292, "epoch": 4578} {"train_loss": -7.3898162841796875, "global_step": 192293, "epoch": 4578} {"train_loss": -7.172518730163574, "global_step": 192294, "epoch": 4578} {"train_loss": -7.211690425872803, "global_step": 192295, "epoch": 4578} {"train_loss": -7.248495101928711, "global_step": 192296, "epoch": 4578} {"train_loss": -7.331839561462402, "global_step": 192297, "epoch": 4578} {"train_loss": -7.136599540710449, "global_step": 192298, "epoch": 4578} {"train_loss": -7.254657745361328, "global_step": 192299, "epoch": 4578} {"train_loss": -7.351182460784912, "global_step": 192300, "epoch": 4578} {"train_loss": -7.36386775970459, "global_step": 192301, "epoch": 4578} {"train_loss": -7.291725158691406, "global_step": 192302, "epoch": 4578} {"train_loss": -7.2333574295043945, "global_step": 192303, "epoch": 4578} {"train_loss": -7.200345993041992, "global_step": 192304, "epoch": 4578} {"train_loss": -7.097743988037109, "global_step": 192305, "epoch": 4578} {"train_loss": -7.426573753356934, "global_step": 192306, "epoch": 4578} {"train_loss": -7.3031415939331055, "global_step": 192307, "epoch": 4578} {"train_loss": -7.213813781738281, "global_step": 192308, "epoch": 4578} {"train_loss": -7.1767072677612305, "global_step": 192309, "epoch": 4578} {"train_loss": -7.2663774490356445, "global_step": 192310, "epoch": 4578} {"train_loss": -7.212527751922607, "global_step": 192311, "epoch": 4578} {"train_loss": -7.212916374206543, "global_step": 192312, "epoch": 4578} {"train_loss": -7.221689701080322, "global_step": 192313, "epoch": 4578} {"train_loss": -7.147773742675781, "global_step": 192314, "epoch": 4578} {"train_loss": -7.05033016204834, "global_step": 192315, "epoch": 4578} {"train_loss": -7.273366451263428, "global_step": 192316, "epoch": 4578} {"train_loss": -7.251738536925543, "global_step": 192317, "epoch": 4578, "val_loss": 69621.546875} {"train_loss": -7.199920177459717, "global_step": 192318, "epoch": 4579} {"train_loss": -7.236449241638184, "global_step": 192319, "epoch": 4579} {"train_loss": -7.171608924865723, "global_step": 192320, "epoch": 4579} {"train_loss": -7.226317882537842, "global_step": 192321, "epoch": 4579} {"train_loss": -7.136778831481934, "global_step": 192322, "epoch": 4579} {"train_loss": -7.243836879730225, "global_step": 192323, "epoch": 4579} {"train_loss": -7.184306621551514, "global_step": 192324, "epoch": 4579} {"train_loss": -7.130965232849121, "global_step": 192325, "epoch": 4579} {"train_loss": -7.165404319763184, "global_step": 192326, "epoch": 4579} {"train_loss": -7.270001411437988, "global_step": 192327, "epoch": 4579} {"train_loss": -7.058571815490723, "global_step": 192328, "epoch": 4579} {"train_loss": -7.123836517333984, "global_step": 192329, "epoch": 4579} {"train_loss": -7.153337478637695, "global_step": 192330, "epoch": 4579} {"train_loss": -6.996780872344971, "global_step": 192331, "epoch": 4579} {"train_loss": -7.164597034454346, "global_step": 192332, "epoch": 4579} {"train_loss": -7.137511253356934, "global_step": 192333, "epoch": 4579} {"train_loss": -7.198059558868408, "global_step": 192334, "epoch": 4579} {"train_loss": -6.960238933563232, "global_step": 192335, "epoch": 4579} {"train_loss": -7.097616195678711, "global_step": 192336, "epoch": 4579} {"train_loss": -7.1089043617248535, "global_step": 192337, "epoch": 4579} {"train_loss": -6.949038505554199, "global_step": 192338, "epoch": 4579} {"train_loss": -7.152829647064209, "global_step": 192339, "epoch": 4579} {"train_loss": -6.9778242111206055, "global_step": 192340, "epoch": 4579} {"train_loss": -7.029772758483887, "global_step": 192341, "epoch": 4579} {"train_loss": -6.9756574630737305, "global_step": 192342, "epoch": 4579} {"train_loss": -7.125082969665527, "global_step": 192343, "epoch": 4579} {"train_loss": -6.93949031829834, "global_step": 192344, "epoch": 4579} {"train_loss": -7.026176452636719, "global_step": 192345, "epoch": 4579} {"train_loss": -7.0380988121032715, "global_step": 192346, "epoch": 4579} {"train_loss": -7.030462741851807, "global_step": 192347, "epoch": 4579} {"train_loss": -7.016725540161133, "global_step": 192348, "epoch": 4579} {"train_loss": -7.010005950927734, "global_step": 192349, "epoch": 4579} {"train_loss": -7.161304473876953, "global_step": 192350, "epoch": 4579} {"train_loss": -7.158017158508301, "global_step": 192351, "epoch": 4579} {"train_loss": -7.11345100402832, "global_step": 192352, "epoch": 4579} {"train_loss": -7.054064750671387, "global_step": 192353, "epoch": 4579} {"train_loss": -7.152073860168457, "global_step": 192354, "epoch": 4579} {"train_loss": -7.176688194274902, "global_step": 192355, "epoch": 4579} {"train_loss": -6.960117340087891, "global_step": 192356, "epoch": 4579} {"train_loss": -7.136207103729248, "global_step": 192357, "epoch": 4579} {"train_loss": -7.198603630065918, "global_step": 192358, "epoch": 4579} {"train_loss": -7.107621862774804, "global_step": 192359, "epoch": 4579, "val_loss": 69545.75} {"train_loss": -7.145784378051758, "global_step": 192360, "epoch": 4580} {"train_loss": -7.133923530578613, "global_step": 192361, "epoch": 4580} {"train_loss": -7.1238203048706055, "global_step": 192362, "epoch": 4580} {"train_loss": -7.215691089630127, "global_step": 192363, "epoch": 4580} {"train_loss": -7.235840797424316, "global_step": 192364, "epoch": 4580} {"train_loss": -7.204216480255127, "global_step": 192365, "epoch": 4580} {"train_loss": -7.076223373413086, "global_step": 192366, "epoch": 4580} {"train_loss": -7.084997177124023, "global_step": 192367, "epoch": 4580} {"train_loss": -7.180895805358887, "global_step": 192368, "epoch": 4580} {"train_loss": -7.088384628295898, "global_step": 192369, "epoch": 4580} {"train_loss": -7.195487976074219, "global_step": 192370, "epoch": 4580} {"train_loss": -7.098834037780762, "global_step": 192371, "epoch": 4580} {"train_loss": -7.116697788238525, "global_step": 192372, "epoch": 4580} {"train_loss": -7.108259677886963, "global_step": 192373, "epoch": 4580} {"train_loss": -7.217630386352539, "global_step": 192374, "epoch": 4580} {"train_loss": -7.153219223022461, "global_step": 192375, "epoch": 4580} {"train_loss": -7.169365882873535, "global_step": 192376, "epoch": 4580} {"train_loss": -7.3198041915893555, "global_step": 192377, "epoch": 4580} {"train_loss": -7.144309997558594, "global_step": 192378, "epoch": 4580} {"train_loss": -7.184136867523193, "global_step": 192379, "epoch": 4580} {"train_loss": -7.124818325042725, "global_step": 192380, "epoch": 4580} {"train_loss": -7.1284685134887695, "global_step": 192381, "epoch": 4580} {"train_loss": -7.246957778930664, "global_step": 192382, "epoch": 4580} {"train_loss": -7.101888656616211, "global_step": 192383, "epoch": 4580} {"train_loss": -7.135979652404785, "global_step": 192384, "epoch": 4580} {"train_loss": -7.098913669586182, "global_step": 192385, "epoch": 4580} {"train_loss": -6.985516548156738, "global_step": 192386, "epoch": 4580} {"train_loss": -7.114315032958984, "global_step": 192387, "epoch": 4580} {"train_loss": -7.1353044509887695, "global_step": 192388, "epoch": 4580} {"train_loss": -7.057003021240234, "global_step": 192389, "epoch": 4580} {"train_loss": -7.050815105438232, "global_step": 192390, "epoch": 4580} {"train_loss": -7.032922744750977, "global_step": 192391, "epoch": 4580} {"train_loss": -6.969048976898193, "global_step": 192392, "epoch": 4580} {"train_loss": -7.167004585266113, "global_step": 192393, "epoch": 4580} {"train_loss": -6.945584297180176, "global_step": 192394, "epoch": 4580} {"train_loss": -7.231473445892334, "global_step": 192395, "epoch": 4580} {"train_loss": -6.996318817138672, "global_step": 192396, "epoch": 4580} {"train_loss": -7.107358455657959, "global_step": 192397, "epoch": 4580} {"train_loss": -7.149884223937988, "global_step": 192398, "epoch": 4580} {"train_loss": -7.025125980377197, "global_step": 192399, "epoch": 4580} {"train_loss": -7.1950812339782715, "global_step": 192400, "epoch": 4580} {"train_loss": -7.1264625163305375, "global_step": 192401, "epoch": 4580, "val_loss": 69839.6171875} {"train_loss": -7.229998588562012, "global_step": 192402, "epoch": 4581} {"train_loss": -7.024388313293457, "global_step": 192403, "epoch": 4581} {"train_loss": -7.181736469268799, "global_step": 192404, "epoch": 4581} {"train_loss": -7.068157196044922, "global_step": 192405, "epoch": 4581} {"train_loss": -7.164612770080566, "global_step": 192406, "epoch": 4581} {"train_loss": -7.110000133514404, "global_step": 192407, "epoch": 4581} {"train_loss": -7.156199932098389, "global_step": 192408, "epoch": 4581} {"train_loss": -7.299947738647461, "global_step": 192409, "epoch": 4581} {"train_loss": -7.158848285675049, "global_step": 192410, "epoch": 4581} {"train_loss": -7.212545394897461, "global_step": 192411, "epoch": 4581} {"train_loss": -7.087876319885254, "global_step": 192412, "epoch": 4581} {"train_loss": -7.107465744018555, "global_step": 192413, "epoch": 4581} {"train_loss": -7.032852649688721, "global_step": 192414, "epoch": 4581} {"train_loss": -7.100812911987305, "global_step": 192415, "epoch": 4581} {"train_loss": -7.262856483459473, "global_step": 192416, "epoch": 4581} {"train_loss": -7.271598815917969, "global_step": 192417, "epoch": 4581} {"train_loss": -7.123424530029297, "global_step": 192418, "epoch": 4581} {"train_loss": -7.118913173675537, "global_step": 192419, "epoch": 4581} {"train_loss": -7.141204357147217, "global_step": 192420, "epoch": 4581} {"train_loss": -7.129982948303223, "global_step": 192421, "epoch": 4581} {"train_loss": -7.173774719238281, "global_step": 192422, "epoch": 4581} {"train_loss": -7.22028923034668, "global_step": 192423, "epoch": 4581} {"train_loss": -7.2971625328063965, "global_step": 192424, "epoch": 4581} {"train_loss": -7.279593467712402, "global_step": 192425, "epoch": 4581} {"train_loss": -7.227143287658691, "global_step": 192426, "epoch": 4581} {"train_loss": -7.097596168518066, "global_step": 192427, "epoch": 4581} {"train_loss": -7.254589080810547, "global_step": 192428, "epoch": 4581} {"train_loss": -7.080904960632324, "global_step": 192429, "epoch": 4581} {"train_loss": -7.113696575164795, "global_step": 192430, "epoch": 4581} {"train_loss": -7.224858283996582, "global_step": 192431, "epoch": 4581} {"train_loss": -7.268750190734863, "global_step": 192432, "epoch": 4581} {"train_loss": -7.184209823608398, "global_step": 192433, "epoch": 4581} {"train_loss": -7.197721481323242, "global_step": 192434, "epoch": 4581} {"train_loss": -7.224424362182617, "global_step": 192435, "epoch": 4581} {"train_loss": -7.146885871887207, "global_step": 192436, "epoch": 4581} {"train_loss": -7.1349968910217285, "global_step": 192437, "epoch": 4581} {"train_loss": -7.166958332061768, "global_step": 192438, "epoch": 4581} {"train_loss": -7.2057695388793945, "global_step": 192439, "epoch": 4581} {"train_loss": -7.097734451293945, "global_step": 192440, "epoch": 4581} {"train_loss": -7.309072971343994, "global_step": 192441, "epoch": 4581} {"train_loss": -7.209234237670898, "global_step": 192442, "epoch": 4581} {"train_loss": -7.177117506663005, "global_step": 192443, "epoch": 4581, "val_loss": 69519.109375} {"train_loss": -7.277148246765137, "global_step": 192444, "epoch": 4582} {"train_loss": -7.409331321716309, "global_step": 192445, "epoch": 4582} {"train_loss": -7.275379180908203, "global_step": 192446, "epoch": 4582} {"train_loss": -7.226168632507324, "global_step": 192447, "epoch": 4582} {"train_loss": -7.178752899169922, "global_step": 192448, "epoch": 4582} {"train_loss": -7.268002510070801, "global_step": 192449, "epoch": 4582} {"train_loss": -7.284668922424316, "global_step": 192450, "epoch": 4582} {"train_loss": -7.270228385925293, "global_step": 192451, "epoch": 4582} {"train_loss": -7.19038200378418, "global_step": 192452, "epoch": 4582} {"train_loss": -7.090488910675049, "global_step": 192453, "epoch": 4582} {"train_loss": -7.083866119384766, "global_step": 192454, "epoch": 4582} {"train_loss": -7.092572212219238, "global_step": 192455, "epoch": 4582} {"train_loss": -7.247994899749756, "global_step": 192456, "epoch": 4582} {"train_loss": -7.199972152709961, "global_step": 192457, "epoch": 4582} {"train_loss": -7.192156791687012, "global_step": 192458, "epoch": 4582} {"train_loss": -7.182888507843018, "global_step": 192459, "epoch": 4582} {"train_loss": -7.277134418487549, "global_step": 192460, "epoch": 4582} {"train_loss": -7.132299423217773, "global_step": 192461, "epoch": 4582} {"train_loss": -7.211811065673828, "global_step": 192462, "epoch": 4582} {"train_loss": -7.196857452392578, "global_step": 192463, "epoch": 4582} {"train_loss": -7.200439453125, "global_step": 192464, "epoch": 4582} {"train_loss": -7.241271018981934, "global_step": 192465, "epoch": 4582} {"train_loss": -7.200575828552246, "global_step": 192466, "epoch": 4582} {"train_loss": -7.25880765914917, "global_step": 192467, "epoch": 4582} {"train_loss": -7.2144060134887695, "global_step": 192468, "epoch": 4582} {"train_loss": -7.218228340148926, "global_step": 192469, "epoch": 4582} {"train_loss": -7.166596412658691, "global_step": 192470, "epoch": 4582} {"train_loss": -7.255955696105957, "global_step": 192471, "epoch": 4582} {"train_loss": -7.207109451293945, "global_step": 192472, "epoch": 4582} {"train_loss": -7.272441864013672, "global_step": 192473, "epoch": 4582} {"train_loss": -7.308554649353027, "global_step": 192474, "epoch": 4582} {"train_loss": -7.287416934967041, "global_step": 192475, "epoch": 4582} {"train_loss": -7.2229838371276855, "global_step": 192476, "epoch": 4582} {"train_loss": -7.191743850708008, "global_step": 192477, "epoch": 4582} {"train_loss": -7.243558883666992, "global_step": 192478, "epoch": 4582} {"train_loss": -7.184723377227783, "global_step": 192479, "epoch": 4582} {"train_loss": -7.298255920410156, "global_step": 192480, "epoch": 4582} {"train_loss": -7.240107536315918, "global_step": 192481, "epoch": 4582} {"train_loss": -7.183188438415527, "global_step": 192482, "epoch": 4582} {"train_loss": -7.25054931640625, "global_step": 192483, "epoch": 4582} {"train_loss": -7.169795036315918, "global_step": 192484, "epoch": 4582} {"train_loss": -7.2205673626491, "global_step": 192485, "epoch": 4582, "val_loss": 69601.7578125} {"train_loss": -7.260548114776611, "global_step": 192486, "epoch": 4583} {"train_loss": -7.2114033699035645, "global_step": 192487, "epoch": 4583} {"train_loss": -7.317590236663818, "global_step": 192488, "epoch": 4583} {"train_loss": -7.215933799743652, "global_step": 192489, "epoch": 4583} {"train_loss": -7.257137298583984, "global_step": 192490, "epoch": 4583} {"train_loss": -7.249917984008789, "global_step": 192491, "epoch": 4583} {"train_loss": -7.14321756362915, "global_step": 192492, "epoch": 4583} {"train_loss": -7.218232154846191, "global_step": 192493, "epoch": 4583} {"train_loss": -7.176048278808594, "global_step": 192494, "epoch": 4583} {"train_loss": -7.269423961639404, "global_step": 192495, "epoch": 4583} {"train_loss": -7.305652618408203, "global_step": 192496, "epoch": 4583} {"train_loss": -7.124975681304932, "global_step": 192497, "epoch": 4583} {"train_loss": -7.174027442932129, "global_step": 192498, "epoch": 4583} {"train_loss": -7.321535110473633, "global_step": 192499, "epoch": 4583} {"train_loss": -7.323702335357666, "global_step": 192500, "epoch": 4583} {"train_loss": -7.164918899536133, "global_step": 192501, "epoch": 4583} {"train_loss": -7.181466102600098, "global_step": 192502, "epoch": 4583} {"train_loss": -7.22316837310791, "global_step": 192503, "epoch": 4583} {"train_loss": -7.181217670440674, "global_step": 192504, "epoch": 4583} {"train_loss": -7.197542190551758, "global_step": 192505, "epoch": 4583} {"train_loss": -6.933149814605713, "global_step": 192506, "epoch": 4583} {"train_loss": -7.104647636413574, "global_step": 192507, "epoch": 4583} {"train_loss": -7.189451217651367, "global_step": 192508, "epoch": 4583} {"train_loss": -6.987371444702148, "global_step": 192509, "epoch": 4583} {"train_loss": -7.112785339355469, "global_step": 192510, "epoch": 4583} {"train_loss": -7.148101806640625, "global_step": 192511, "epoch": 4583} {"train_loss": -7.200533866882324, "global_step": 192512, "epoch": 4583} {"train_loss": -7.094939708709717, "global_step": 192513, "epoch": 4583} {"train_loss": -7.208959579467773, "global_step": 192514, "epoch": 4583} {"train_loss": -7.1330885887146, "global_step": 192515, "epoch": 4583} {"train_loss": -7.1796674728393555, "global_step": 192516, "epoch": 4583} {"train_loss": -7.2858734130859375, "global_step": 192517, "epoch": 4583} {"train_loss": -7.186184406280518, "global_step": 192518, "epoch": 4583} {"train_loss": -7.229548454284668, "global_step": 192519, "epoch": 4583} {"train_loss": -7.186473846435547, "global_step": 192520, "epoch": 4583} {"train_loss": -7.133869171142578, "global_step": 192521, "epoch": 4583} {"train_loss": -7.209512233734131, "global_step": 192522, "epoch": 4583} {"train_loss": -7.155898094177246, "global_step": 192523, "epoch": 4583} {"train_loss": -7.254452705383301, "global_step": 192524, "epoch": 4583} {"train_loss": -7.260748863220215, "global_step": 192525, "epoch": 4583} {"train_loss": -7.2394890785217285, "global_step": 192526, "epoch": 4583} {"train_loss": -7.193318594069708, "global_step": 192527, "epoch": 4583, "val_loss": 69491.2890625} {"train_loss": -7.121484279632568, "global_step": 192528, "epoch": 4584} {"train_loss": -7.154333114624023, "global_step": 192529, "epoch": 4584} {"train_loss": -7.227950096130371, "global_step": 192530, "epoch": 4584} {"train_loss": -7.130258560180664, "global_step": 192531, "epoch": 4584} {"train_loss": -7.230496883392334, "global_step": 192532, "epoch": 4584} {"train_loss": -7.062259674072266, "global_step": 192533, "epoch": 4584} {"train_loss": -7.180547714233398, "global_step": 192534, "epoch": 4584} {"train_loss": -7.180375099182129, "global_step": 192535, "epoch": 4584} {"train_loss": -7.176582336425781, "global_step": 192536, "epoch": 4584} {"train_loss": -7.040076732635498, "global_step": 192537, "epoch": 4584} {"train_loss": -7.156680107116699, "global_step": 192538, "epoch": 4584} {"train_loss": -7.173886775970459, "global_step": 192539, "epoch": 4584} {"train_loss": -7.130503177642822, "global_step": 192540, "epoch": 4584} {"train_loss": -7.112191200256348, "global_step": 192541, "epoch": 4584} {"train_loss": -6.944393634796143, "global_step": 192542, "epoch": 4584} {"train_loss": -7.188636779785156, "global_step": 192543, "epoch": 4584} {"train_loss": -6.856330871582031, "global_step": 192544, "epoch": 4584} {"train_loss": -6.803013324737549, "global_step": 192545, "epoch": 4584} {"train_loss": -7.214666366577148, "global_step": 192546, "epoch": 4584} {"train_loss": -7.136310577392578, "global_step": 192547, "epoch": 4584} {"train_loss": -7.019649505615234, "global_step": 192548, "epoch": 4584} {"train_loss": -7.112349033355713, "global_step": 192549, "epoch": 4584} {"train_loss": -6.917351722717285, "global_step": 192550, "epoch": 4584} {"train_loss": -7.1829352378845215, "global_step": 192551, "epoch": 4584} {"train_loss": -7.079551696777344, "global_step": 192552, "epoch": 4584} {"train_loss": -7.078755855560303, "global_step": 192553, "epoch": 4584} {"train_loss": -7.081744194030762, "global_step": 192554, "epoch": 4584} {"train_loss": -6.9477858543396, "global_step": 192555, "epoch": 4584} {"train_loss": -7.168046951293945, "global_step": 192556, "epoch": 4584} {"train_loss": -6.964402675628662, "global_step": 192557, "epoch": 4584} {"train_loss": -7.190797328948975, "global_step": 192558, "epoch": 4584} {"train_loss": -6.9945969581604, "global_step": 192559, "epoch": 4584} {"train_loss": -7.0476484298706055, "global_step": 192560, "epoch": 4584} {"train_loss": -7.23002815246582, "global_step": 192561, "epoch": 4584} {"train_loss": -6.996753692626953, "global_step": 192562, "epoch": 4584} {"train_loss": -7.178493499755859, "global_step": 192563, "epoch": 4584} {"train_loss": -7.064664840698242, "global_step": 192564, "epoch": 4584} {"train_loss": -7.232363224029541, "global_step": 192565, "epoch": 4584} {"train_loss": -7.134688377380371, "global_step": 192566, "epoch": 4584} {"train_loss": -7.081910610198975, "global_step": 192567, "epoch": 4584} {"train_loss": -7.14787483215332, "global_step": 192568, "epoch": 4584} {"train_loss": -7.098183291299002, "global_step": 192569, "epoch": 4584, "val_loss": 69685.4765625} {"train_loss": -7.269864082336426, "global_step": 192570, "epoch": 4585} {"train_loss": -7.117243766784668, "global_step": 192571, "epoch": 4585} {"train_loss": -7.2198286056518555, "global_step": 192572, "epoch": 4585} {"train_loss": -7.167594909667969, "global_step": 192573, "epoch": 4585} {"train_loss": -7.209048748016357, "global_step": 192574, "epoch": 4585} {"train_loss": -7.158881664276123, "global_step": 192575, "epoch": 4585} {"train_loss": -7.130810260772705, "global_step": 192576, "epoch": 4585} {"train_loss": -7.124546527862549, "global_step": 192577, "epoch": 4585} {"train_loss": -7.222416877746582, "global_step": 192578, "epoch": 4585} {"train_loss": -7.322747230529785, "global_step": 192579, "epoch": 4585} {"train_loss": -7.202940464019775, "global_step": 192580, "epoch": 4585} {"train_loss": -7.298849105834961, "global_step": 192581, "epoch": 4585} {"train_loss": -7.274576187133789, "global_step": 192582, "epoch": 4585} {"train_loss": -7.287903785705566, "global_step": 192583, "epoch": 4585} {"train_loss": -7.222076892852783, "global_step": 192584, "epoch": 4585} {"train_loss": -7.177542686462402, "global_step": 192585, "epoch": 4585} {"train_loss": -7.127322196960449, "global_step": 192586, "epoch": 4585} {"train_loss": -7.270634174346924, "global_step": 192587, "epoch": 4585} {"train_loss": -7.239672660827637, "global_step": 192588, "epoch": 4585} {"train_loss": -7.21798038482666, "global_step": 192589, "epoch": 4585} {"train_loss": -7.250290870666504, "global_step": 192590, "epoch": 4585} {"train_loss": -7.230137348175049, "global_step": 192591, "epoch": 4585} {"train_loss": -7.327267169952393, "global_step": 192592, "epoch": 4585} {"train_loss": -7.2577619552612305, "global_step": 192593, "epoch": 4585} {"train_loss": -7.279755592346191, "global_step": 192594, "epoch": 4585} {"train_loss": -7.29777717590332, "global_step": 192595, "epoch": 4585} {"train_loss": -7.311999320983887, "global_step": 192596, "epoch": 4585} {"train_loss": -7.336286544799805, "global_step": 192597, "epoch": 4585} {"train_loss": -7.331543922424316, "global_step": 192598, "epoch": 4585} {"train_loss": -7.346451759338379, "global_step": 192599, "epoch": 4585} {"train_loss": -7.176122665405273, "global_step": 192600, "epoch": 4585} {"train_loss": -7.25111198425293, "global_step": 192601, "epoch": 4585} {"train_loss": -7.323888778686523, "global_step": 192602, "epoch": 4585} {"train_loss": -7.356784820556641, "global_step": 192603, "epoch": 4585} {"train_loss": -7.246266841888428, "global_step": 192604, "epoch": 4585} {"train_loss": -7.161195755004883, "global_step": 192605, "epoch": 4585} {"train_loss": -7.191496849060059, "global_step": 192606, "epoch": 4585} {"train_loss": -7.325841903686523, "global_step": 192607, "epoch": 4585} {"train_loss": -7.229883193969727, "global_step": 192608, "epoch": 4585} {"train_loss": -7.248739242553711, "global_step": 192609, "epoch": 4585} {"train_loss": -7.2582855224609375, "global_step": 192610, "epoch": 4585} {"train_loss": -7.24580504780724, "global_step": 192611, "epoch": 4585, "val_loss": 69522.984375} {"train_loss": -7.268711090087891, "global_step": 192612, "epoch": 4586} {"train_loss": -7.224655628204346, "global_step": 192613, "epoch": 4586} {"train_loss": -7.416661739349365, "global_step": 192614, "epoch": 4586} {"train_loss": -7.287774085998535, "global_step": 192615, "epoch": 4586} {"train_loss": -7.192747116088867, "global_step": 192616, "epoch": 4586} {"train_loss": -7.361225605010986, "global_step": 192617, "epoch": 4586} {"train_loss": -7.24404239654541, "global_step": 192618, "epoch": 4586} {"train_loss": -7.348323345184326, "global_step": 192619, "epoch": 4586} {"train_loss": -7.259750843048096, "global_step": 192620, "epoch": 4586} {"train_loss": -7.313320159912109, "global_step": 192621, "epoch": 4586} {"train_loss": -7.249074459075928, "global_step": 192622, "epoch": 4586} {"train_loss": -7.324681282043457, "global_step": 192623, "epoch": 4586} {"train_loss": -7.3108930587768555, "global_step": 192624, "epoch": 4586} {"train_loss": -7.289541721343994, "global_step": 192625, "epoch": 4586} {"train_loss": -7.264333724975586, "global_step": 192626, "epoch": 4586} {"train_loss": -7.190861225128174, "global_step": 192627, "epoch": 4586} {"train_loss": -7.142127513885498, "global_step": 192628, "epoch": 4586} {"train_loss": -7.296058177947998, "global_step": 192629, "epoch": 4586} {"train_loss": -7.271256923675537, "global_step": 192630, "epoch": 4586} {"train_loss": -7.2758331298828125, "global_step": 192631, "epoch": 4586} {"train_loss": -7.2588605880737305, "global_step": 192632, "epoch": 4586} {"train_loss": -7.138303756713867, "global_step": 192633, "epoch": 4586} {"train_loss": -7.268969535827637, "global_step": 192634, "epoch": 4586} {"train_loss": -7.2956037521362305, "global_step": 192635, "epoch": 4586} {"train_loss": -7.276538372039795, "global_step": 192636, "epoch": 4586} {"train_loss": -7.169081687927246, "global_step": 192637, "epoch": 4586} {"train_loss": -7.3525919914245605, "global_step": 192638, "epoch": 4586} {"train_loss": -7.23658561706543, "global_step": 192639, "epoch": 4586} {"train_loss": -7.176802635192871, "global_step": 192640, "epoch": 4586} {"train_loss": -7.2076544761657715, "global_step": 192641, "epoch": 4586} {"train_loss": -7.13070821762085, "global_step": 192642, "epoch": 4586} {"train_loss": -7.279153823852539, "global_step": 192643, "epoch": 4586} {"train_loss": -7.320279121398926, "global_step": 192644, "epoch": 4586} {"train_loss": -7.2544050216674805, "global_step": 192645, "epoch": 4586} {"train_loss": -7.281757354736328, "global_step": 192646, "epoch": 4586} {"train_loss": -7.18150520324707, "global_step": 192647, "epoch": 4586} {"train_loss": -7.197904586791992, "global_step": 192648, "epoch": 4586} {"train_loss": -7.173322677612305, "global_step": 192649, "epoch": 4586} {"train_loss": -7.310837745666504, "global_step": 192650, "epoch": 4586} {"train_loss": -7.2240800857543945, "global_step": 192651, "epoch": 4586} {"train_loss": -7.1654205322265625, "global_step": 192652, "epoch": 4586} {"train_loss": -7.254771925154186, "global_step": 192653, "epoch": 4586, "val_loss": 69673.6953125} {"train_loss": -7.277955055236816, "global_step": 192654, "epoch": 4587} {"train_loss": -7.183578968048096, "global_step": 192655, "epoch": 4587} {"train_loss": -7.196686744689941, "global_step": 192656, "epoch": 4587} {"train_loss": -7.2219648361206055, "global_step": 192657, "epoch": 4587} {"train_loss": -7.3101887702941895, "global_step": 192658, "epoch": 4587} {"train_loss": -7.19596004486084, "global_step": 192659, "epoch": 4587} {"train_loss": -7.304912567138672, "global_step": 192660, "epoch": 4587} {"train_loss": -7.286046981811523, "global_step": 192661, "epoch": 4587} {"train_loss": -7.266120910644531, "global_step": 192662, "epoch": 4587} {"train_loss": -7.190981388092041, "global_step": 192663, "epoch": 4587} {"train_loss": -7.219239711761475, "global_step": 192664, "epoch": 4587} {"train_loss": -6.9947428703308105, "global_step": 192665, "epoch": 4587} {"train_loss": -7.13237190246582, "global_step": 192666, "epoch": 4587} {"train_loss": -7.139035224914551, "global_step": 192667, "epoch": 4587} {"train_loss": -7.051178455352783, "global_step": 192668, "epoch": 4587} {"train_loss": -7.127046585083008, "global_step": 192669, "epoch": 4587} {"train_loss": -7.193136215209961, "global_step": 192670, "epoch": 4587} {"train_loss": -7.016604423522949, "global_step": 192671, "epoch": 4587} {"train_loss": -7.187198638916016, "global_step": 192672, "epoch": 4587} {"train_loss": -7.009652614593506, "global_step": 192673, "epoch": 4587} {"train_loss": -7.0330095291137695, "global_step": 192674, "epoch": 4587} {"train_loss": -7.2163496017456055, "global_step": 192675, "epoch": 4587} {"train_loss": -7.0358734130859375, "global_step": 192676, "epoch": 4587} {"train_loss": -7.084680557250977, "global_step": 192677, "epoch": 4587} {"train_loss": -7.092039585113525, "global_step": 192678, "epoch": 4587} {"train_loss": -7.02760124206543, "global_step": 192679, "epoch": 4587} {"train_loss": -7.161615371704102, "global_step": 192680, "epoch": 4587} {"train_loss": -7.066065788269043, "global_step": 192681, "epoch": 4587} {"train_loss": -7.003543853759766, "global_step": 192682, "epoch": 4587} {"train_loss": -7.169948577880859, "global_step": 192683, "epoch": 4587} {"train_loss": -7.17360782623291, "global_step": 192684, "epoch": 4587} {"train_loss": -7.077840328216553, "global_step": 192685, "epoch": 4587} {"train_loss": -7.1284332275390625, "global_step": 192686, "epoch": 4587} {"train_loss": -7.010466575622559, "global_step": 192687, "epoch": 4587} {"train_loss": -7.175292491912842, "global_step": 192688, "epoch": 4587} {"train_loss": -7.174707889556885, "global_step": 192689, "epoch": 4587} {"train_loss": -7.197014331817627, "global_step": 192690, "epoch": 4587} {"train_loss": -7.232791900634766, "global_step": 192691, "epoch": 4587} {"train_loss": -7.432974815368652, "global_step": 192692, "epoch": 4587} {"train_loss": -7.1899213790893555, "global_step": 192693, "epoch": 4587} {"train_loss": -7.150107383728027, "global_step": 192694, "epoch": 4587} {"train_loss": -7.157656976154873, "global_step": 192695, "epoch": 4587, "val_loss": 69616.7890625} {"train_loss": -7.150790214538574, "global_step": 192696, "epoch": 4588} {"train_loss": -7.270317077636719, "global_step": 192697, "epoch": 4588} {"train_loss": -7.193376541137695, "global_step": 192698, "epoch": 4588} {"train_loss": -7.22115421295166, "global_step": 192699, "epoch": 4588} {"train_loss": -7.264558792114258, "global_step": 192700, "epoch": 4588} {"train_loss": -7.24622106552124, "global_step": 192701, "epoch": 4588} {"train_loss": -7.293398857116699, "global_step": 192702, "epoch": 4588} {"train_loss": -7.18868350982666, "global_step": 192703, "epoch": 4588} {"train_loss": -7.179303169250488, "global_step": 192704, "epoch": 4588} {"train_loss": -7.266107559204102, "global_step": 192705, "epoch": 4588} {"train_loss": -7.263705253601074, "global_step": 192706, "epoch": 4588} {"train_loss": -7.2067365646362305, "global_step": 192707, "epoch": 4588} {"train_loss": -7.069437026977539, "global_step": 192708, "epoch": 4588} {"train_loss": -7.319145202636719, "global_step": 192709, "epoch": 4588} {"train_loss": -7.1901535987854, "global_step": 192710, "epoch": 4588} {"train_loss": -7.069313049316406, "global_step": 192711, "epoch": 4588} {"train_loss": -7.230171203613281, "global_step": 192712, "epoch": 4588} {"train_loss": -7.2007551193237305, "global_step": 192713, "epoch": 4588} {"train_loss": -7.166876792907715, "global_step": 192714, "epoch": 4588} {"train_loss": -7.307681083679199, "global_step": 192715, "epoch": 4588} {"train_loss": -7.140137672424316, "global_step": 192716, "epoch": 4588} {"train_loss": -7.32932186126709, "global_step": 192717, "epoch": 4588} {"train_loss": -7.228519439697266, "global_step": 192718, "epoch": 4588} {"train_loss": -7.169344425201416, "global_step": 192719, "epoch": 4588} {"train_loss": -7.184633255004883, "global_step": 192720, "epoch": 4588} {"train_loss": -7.2178955078125, "global_step": 192721, "epoch": 4588} {"train_loss": -7.296608924865723, "global_step": 192722, "epoch": 4588} {"train_loss": -7.213245391845703, "global_step": 192723, "epoch": 4588} {"train_loss": -7.210393905639648, "global_step": 192724, "epoch": 4588} {"train_loss": -7.262589454650879, "global_step": 192725, "epoch": 4588} {"train_loss": -7.039581298828125, "global_step": 192726, "epoch": 4588} {"train_loss": -7.279036521911621, "global_step": 192727, "epoch": 4588} {"train_loss": -7.234777927398682, "global_step": 192728, "epoch": 4588} {"train_loss": -7.2695536613464355, "global_step": 192729, "epoch": 4588} {"train_loss": -7.25144100189209, "global_step": 192730, "epoch": 4588} {"train_loss": -7.302892684936523, "global_step": 192731, "epoch": 4588} {"train_loss": -7.358524799346924, "global_step": 192732, "epoch": 4588} {"train_loss": -7.233233451843262, "global_step": 192733, "epoch": 4588} {"train_loss": -7.2517499923706055, "global_step": 192734, "epoch": 4588} {"train_loss": -7.353124618530273, "global_step": 192735, "epoch": 4588} {"train_loss": -7.336978435516357, "global_step": 192736, "epoch": 4588} {"train_loss": -7.2321903592064265, "global_step": 192737, "epoch": 4588, "val_loss": 69668.6015625} {"train_loss": -7.282704830169678, "global_step": 192738, "epoch": 4589} {"train_loss": -7.245536804199219, "global_step": 192739, "epoch": 4589} {"train_loss": -7.212637901306152, "global_step": 192740, "epoch": 4589} {"train_loss": -7.091050148010254, "global_step": 192741, "epoch": 4589} {"train_loss": -7.359540939331055, "global_step": 192742, "epoch": 4589} {"train_loss": -7.255568504333496, "global_step": 192743, "epoch": 4589} {"train_loss": -6.844989776611328, "global_step": 192744, "epoch": 4589} {"train_loss": -6.939727306365967, "global_step": 192745, "epoch": 4589} {"train_loss": -7.294734954833984, "global_step": 192746, "epoch": 4589} {"train_loss": -7.033884525299072, "global_step": 192747, "epoch": 4589} {"train_loss": -7.139437675476074, "global_step": 192748, "epoch": 4589} {"train_loss": -7.104195594787598, "global_step": 192749, "epoch": 4589} {"train_loss": -7.125007629394531, "global_step": 192750, "epoch": 4589} {"train_loss": -7.0970139503479, "global_step": 192751, "epoch": 4589} {"train_loss": -7.162934303283691, "global_step": 192752, "epoch": 4589} {"train_loss": -7.2249627113342285, "global_step": 192753, "epoch": 4589} {"train_loss": -7.106564521789551, "global_step": 192754, "epoch": 4589} {"train_loss": -7.024107456207275, "global_step": 192755, "epoch": 4589} {"train_loss": -7.205689430236816, "global_step": 192756, "epoch": 4589} {"train_loss": -7.09938907623291, "global_step": 192757, "epoch": 4589} {"train_loss": -7.283519744873047, "global_step": 192758, "epoch": 4589} {"train_loss": -6.9781646728515625, "global_step": 192759, "epoch": 4589} {"train_loss": -7.247988224029541, "global_step": 192760, "epoch": 4589} {"train_loss": -7.146549224853516, "global_step": 192761, "epoch": 4589} {"train_loss": -7.133574962615967, "global_step": 192762, "epoch": 4589} {"train_loss": -7.186436653137207, "global_step": 192763, "epoch": 4589} {"train_loss": -7.104585647583008, "global_step": 192764, "epoch": 4589} {"train_loss": -7.137042999267578, "global_step": 192765, "epoch": 4589} {"train_loss": -7.19212532043457, "global_step": 192766, "epoch": 4589} {"train_loss": -7.111952304840088, "global_step": 192767, "epoch": 4589} {"train_loss": -6.991117477416992, "global_step": 192768, "epoch": 4589} {"train_loss": -7.050302505493164, "global_step": 192769, "epoch": 4589} {"train_loss": -7.1408185958862305, "global_step": 192770, "epoch": 4589} {"train_loss": -6.970539569854736, "global_step": 192771, "epoch": 4589} {"train_loss": -7.23970890045166, "global_step": 192772, "epoch": 4589} {"train_loss": -7.102339267730713, "global_step": 192773, "epoch": 4589} {"train_loss": -7.122633934020996, "global_step": 192774, "epoch": 4589} {"train_loss": -7.174778461456299, "global_step": 192775, "epoch": 4589} {"train_loss": -7.156216621398926, "global_step": 192776, "epoch": 4589} {"train_loss": -7.177318096160889, "global_step": 192777, "epoch": 4589} {"train_loss": -7.303969860076904, "global_step": 192778, "epoch": 4589} {"train_loss": -7.141549496423631, "global_step": 192779, "epoch": 4589, "val_loss": 69694.4140625} {"train_loss": -7.196292877197266, "global_step": 192780, "epoch": 4590} {"train_loss": -7.131455898284912, "global_step": 192781, "epoch": 4590} {"train_loss": -7.215724945068359, "global_step": 192782, "epoch": 4590} {"train_loss": -7.203152656555176, "global_step": 192783, "epoch": 4590} {"train_loss": -7.20012903213501, "global_step": 192784, "epoch": 4590} {"train_loss": -7.319248199462891, "global_step": 192785, "epoch": 4590} {"train_loss": -7.232471942901611, "global_step": 192786, "epoch": 4590} {"train_loss": -7.283886909484863, "global_step": 192787, "epoch": 4590} {"train_loss": -7.296138763427734, "global_step": 192788, "epoch": 4590} {"train_loss": -7.266520023345947, "global_step": 192789, "epoch": 4590} {"train_loss": -7.223048210144043, "global_step": 192790, "epoch": 4590} {"train_loss": -7.29361629486084, "global_step": 192791, "epoch": 4590} {"train_loss": -7.0897321701049805, "global_step": 192792, "epoch": 4590} {"train_loss": -7.2894721031188965, "global_step": 192793, "epoch": 4590} {"train_loss": -7.319361209869385, "global_step": 192794, "epoch": 4590} {"train_loss": -7.171720504760742, "global_step": 192795, "epoch": 4590} {"train_loss": -7.2600908279418945, "global_step": 192796, "epoch": 4590} {"train_loss": -7.12755012512207, "global_step": 192797, "epoch": 4590} {"train_loss": -7.167086601257324, "global_step": 192798, "epoch": 4590} {"train_loss": -7.263160705566406, "global_step": 192799, "epoch": 4590} {"train_loss": -7.18070125579834, "global_step": 192800, "epoch": 4590} {"train_loss": -7.133668899536133, "global_step": 192801, "epoch": 4590} {"train_loss": -7.237489700317383, "global_step": 192802, "epoch": 4590} {"train_loss": -7.098154067993164, "global_step": 192803, "epoch": 4590} {"train_loss": -7.1380839347839355, "global_step": 192804, "epoch": 4590} {"train_loss": -7.159986972808838, "global_step": 192805, "epoch": 4590} {"train_loss": -7.24188232421875, "global_step": 192806, "epoch": 4590} {"train_loss": -7.16874885559082, "global_step": 192807, "epoch": 4590} {"train_loss": -7.194997787475586, "global_step": 192808, "epoch": 4590} {"train_loss": -7.113264083862305, "global_step": 192809, "epoch": 4590} {"train_loss": -7.220456123352051, "global_step": 192810, "epoch": 4590} {"train_loss": -7.129569053649902, "global_step": 192811, "epoch": 4590} {"train_loss": -7.331408500671387, "global_step": 192812, "epoch": 4590} {"train_loss": -7.174625396728516, "global_step": 192813, "epoch": 4590} {"train_loss": -7.148709774017334, "global_step": 192814, "epoch": 4590} {"train_loss": -7.22935152053833, "global_step": 192815, "epoch": 4590} {"train_loss": -7.109350204467773, "global_step": 192816, "epoch": 4590} {"train_loss": -7.0168328285217285, "global_step": 192817, "epoch": 4590} {"train_loss": -7.140801429748535, "global_step": 192818, "epoch": 4590} {"train_loss": -7.1174445152282715, "global_step": 192819, "epoch": 4590} {"train_loss": -7.187675476074219, "global_step": 192820, "epoch": 4590} {"train_loss": -7.198866106214977, "global_step": 192821, "epoch": 4590, "val_loss": 69825.859375} {"train_loss": -7.150180816650391, "global_step": 192822, "epoch": 4591} {"train_loss": -7.106675148010254, "global_step": 192823, "epoch": 4591} {"train_loss": -7.314295291900635, "global_step": 192824, "epoch": 4591} {"train_loss": -7.160107135772705, "global_step": 192825, "epoch": 4591} {"train_loss": -7.276751518249512, "global_step": 192826, "epoch": 4591} {"train_loss": -7.323012828826904, "global_step": 192827, "epoch": 4591} {"train_loss": -7.238248825073242, "global_step": 192828, "epoch": 4591} {"train_loss": -7.27631950378418, "global_step": 192829, "epoch": 4591} {"train_loss": -7.1946797370910645, "global_step": 192830, "epoch": 4591} {"train_loss": -7.122787952423096, "global_step": 192831, "epoch": 4591} {"train_loss": -7.1529860496521, "global_step": 192832, "epoch": 4591} {"train_loss": -7.0499091148376465, "global_step": 192833, "epoch": 4591} {"train_loss": -7.0868072509765625, "global_step": 192834, "epoch": 4591} {"train_loss": -7.136728286743164, "global_step": 192835, "epoch": 4591} {"train_loss": -7.12080717086792, "global_step": 192836, "epoch": 4591} {"train_loss": -7.015047550201416, "global_step": 192837, "epoch": 4591} {"train_loss": -7.112259864807129, "global_step": 192838, "epoch": 4591} {"train_loss": -7.302591800689697, "global_step": 192839, "epoch": 4591} {"train_loss": -7.11528205871582, "global_step": 192840, "epoch": 4591} {"train_loss": -7.216721057891846, "global_step": 192841, "epoch": 4591} {"train_loss": -7.209436893463135, "global_step": 192842, "epoch": 4591} {"train_loss": -7.212993621826172, "global_step": 192843, "epoch": 4591} {"train_loss": -7.250473976135254, "global_step": 192844, "epoch": 4591} {"train_loss": -7.192553520202637, "global_step": 192845, "epoch": 4591} {"train_loss": -7.197901725769043, "global_step": 192846, "epoch": 4591} {"train_loss": -7.251142501831055, "global_step": 192847, "epoch": 4591} {"train_loss": -7.127824783325195, "global_step": 192848, "epoch": 4591} {"train_loss": -7.284802436828613, "global_step": 192849, "epoch": 4591} {"train_loss": -7.247191429138184, "global_step": 192850, "epoch": 4591} {"train_loss": -7.112079620361328, "global_step": 192851, "epoch": 4591} {"train_loss": -7.235311508178711, "global_step": 192852, "epoch": 4591} {"train_loss": -7.260461807250977, "global_step": 192853, "epoch": 4591} {"train_loss": -7.126653671264648, "global_step": 192854, "epoch": 4591} {"train_loss": -7.186659812927246, "global_step": 192855, "epoch": 4591} {"train_loss": -7.344738006591797, "global_step": 192856, "epoch": 4591} {"train_loss": -7.171030521392822, "global_step": 192857, "epoch": 4591} {"train_loss": -7.253870010375977, "global_step": 192858, "epoch": 4591} {"train_loss": -7.264830589294434, "global_step": 192859, "epoch": 4591} {"train_loss": -7.276043891906738, "global_step": 192860, "epoch": 4591} {"train_loss": -7.292746543884277, "global_step": 192861, "epoch": 4591} {"train_loss": -7.213779926300049, "global_step": 192862, "epoch": 4591} {"train_loss": -7.199418442589896, "global_step": 192863, "epoch": 4591, "val_loss": 69676.484375} {"train_loss": -7.208375930786133, "global_step": 192864, "epoch": 4592} {"train_loss": -7.314020156860352, "global_step": 192865, "epoch": 4592} {"train_loss": -7.303871154785156, "global_step": 192866, "epoch": 4592} {"train_loss": -7.295177936553955, "global_step": 192867, "epoch": 4592} {"train_loss": -7.192541122436523, "global_step": 192868, "epoch": 4592} {"train_loss": -7.288914203643799, "global_step": 192869, "epoch": 4592} {"train_loss": -7.286733627319336, "global_step": 192870, "epoch": 4592} {"train_loss": -7.334150791168213, "global_step": 192871, "epoch": 4592} {"train_loss": -7.261934280395508, "global_step": 192872, "epoch": 4592} {"train_loss": -7.249267578125, "global_step": 192873, "epoch": 4592} {"train_loss": -7.2446489334106445, "global_step": 192874, "epoch": 4592} {"train_loss": -7.256706714630127, "global_step": 192875, "epoch": 4592} {"train_loss": -7.159017086029053, "global_step": 192876, "epoch": 4592} {"train_loss": -7.3003249168396, "global_step": 192877, "epoch": 4592} {"train_loss": -7.349577903747559, "global_step": 192878, "epoch": 4592} {"train_loss": -7.187650680541992, "global_step": 192879, "epoch": 4592} {"train_loss": -7.182380199432373, "global_step": 192880, "epoch": 4592} {"train_loss": -7.171092987060547, "global_step": 192881, "epoch": 4592} {"train_loss": -7.249842166900635, "global_step": 192882, "epoch": 4592} {"train_loss": -7.228509902954102, "global_step": 192883, "epoch": 4592} {"train_loss": -7.219122886657715, "global_step": 192884, "epoch": 4592} {"train_loss": -7.2023444175720215, "global_step": 192885, "epoch": 4592} {"train_loss": -7.210920333862305, "global_step": 192886, "epoch": 4592} {"train_loss": -7.271729946136475, "global_step": 192887, "epoch": 4592} {"train_loss": -7.301626205444336, "global_step": 192888, "epoch": 4592} {"train_loss": -7.24578857421875, "global_step": 192889, "epoch": 4592} {"train_loss": -7.256189823150635, "global_step": 192890, "epoch": 4592} {"train_loss": -7.241820335388184, "global_step": 192891, "epoch": 4592} {"train_loss": -7.248859405517578, "global_step": 192892, "epoch": 4592} {"train_loss": -7.209425926208496, "global_step": 192893, "epoch": 4592} {"train_loss": -7.23411750793457, "global_step": 192894, "epoch": 4592} {"train_loss": -7.174291133880615, "global_step": 192895, "epoch": 4592} {"train_loss": -7.152586936950684, "global_step": 192896, "epoch": 4592} {"train_loss": -7.2117719650268555, "global_step": 192897, "epoch": 4592} {"train_loss": -7.073539733886719, "global_step": 192898, "epoch": 4592} {"train_loss": -7.264918327331543, "global_step": 192899, "epoch": 4592} {"train_loss": -7.273305892944336, "global_step": 192900, "epoch": 4592} {"train_loss": -7.235742568969727, "global_step": 192901, "epoch": 4592} {"train_loss": -7.391488075256348, "global_step": 192902, "epoch": 4592} {"train_loss": -7.286998748779297, "global_step": 192903, "epoch": 4592} {"train_loss": -7.242118835449219, "global_step": 192904, "epoch": 4592} {"train_loss": -7.2452506337847025, "global_step": 192905, "epoch": 4592, "val_loss": 69797.25} {"train_loss": -7.27852725982666, "global_step": 192906, "epoch": 4593} {"train_loss": -7.229159832000732, "global_step": 192907, "epoch": 4593} {"train_loss": -7.287732124328613, "global_step": 192908, "epoch": 4593} {"train_loss": -7.340532302856445, "global_step": 192909, "epoch": 4593} {"train_loss": -7.169513702392578, "global_step": 192910, "epoch": 4593} {"train_loss": -7.2298688888549805, "global_step": 192911, "epoch": 4593} {"train_loss": -7.3351898193359375, "global_step": 192912, "epoch": 4593} {"train_loss": -7.303218841552734, "global_step": 192913, "epoch": 4593} {"train_loss": -7.231170654296875, "global_step": 192914, "epoch": 4593} {"train_loss": -7.149445056915283, "global_step": 192915, "epoch": 4593} {"train_loss": -7.273984432220459, "global_step": 192916, "epoch": 4593} {"train_loss": -7.196841716766357, "global_step": 192917, "epoch": 4593} {"train_loss": -7.122670650482178, "global_step": 192918, "epoch": 4593} {"train_loss": -7.154902935028076, "global_step": 192919, "epoch": 4593} {"train_loss": -7.2527031898498535, "global_step": 192920, "epoch": 4593} {"train_loss": -7.063838958740234, "global_step": 192921, "epoch": 4593} {"train_loss": -7.188557147979736, "global_step": 192922, "epoch": 4593} {"train_loss": -7.229719638824463, "global_step": 192923, "epoch": 4593} {"train_loss": -7.1318864822387695, "global_step": 192924, "epoch": 4593} {"train_loss": -7.236755847930908, "global_step": 192925, "epoch": 4593} {"train_loss": -7.175327301025391, "global_step": 192926, "epoch": 4593} {"train_loss": -7.1394877433776855, "global_step": 192927, "epoch": 4593} {"train_loss": -7.21876335144043, "global_step": 192928, "epoch": 4593} {"train_loss": -7.1385393142700195, "global_step": 192929, "epoch": 4593} {"train_loss": -7.278912544250488, "global_step": 192930, "epoch": 4593} {"train_loss": -7.254326820373535, "global_step": 192931, "epoch": 4593} {"train_loss": -7.058954238891602, "global_step": 192932, "epoch": 4593} {"train_loss": -7.300050735473633, "global_step": 192933, "epoch": 4593} {"train_loss": -7.244546890258789, "global_step": 192934, "epoch": 4593} {"train_loss": -7.080621719360352, "global_step": 192935, "epoch": 4593} {"train_loss": -7.352682113647461, "global_step": 192936, "epoch": 4593} {"train_loss": -7.108816146850586, "global_step": 192937, "epoch": 4593} {"train_loss": -7.1199493408203125, "global_step": 192938, "epoch": 4593} {"train_loss": -7.143863201141357, "global_step": 192939, "epoch": 4593} {"train_loss": -7.080368995666504, "global_step": 192940, "epoch": 4593} {"train_loss": -7.216657638549805, "global_step": 192941, "epoch": 4593} {"train_loss": -7.181124210357666, "global_step": 192942, "epoch": 4593} {"train_loss": -7.0895094871521, "global_step": 192943, "epoch": 4593} {"train_loss": -7.236907005310059, "global_step": 192944, "epoch": 4593} {"train_loss": -7.193502426147461, "global_step": 192945, "epoch": 4593} {"train_loss": -7.187936782836914, "global_step": 192946, "epoch": 4593} {"train_loss": -7.200192928314209, "global_step": 192947, "epoch": 4593, "val_loss": 69798.8125} {"train_loss": -7.169512748718262, "global_step": 192948, "epoch": 4594} {"train_loss": -7.201227188110352, "global_step": 192949, "epoch": 4594} {"train_loss": -7.2321882247924805, "global_step": 192950, "epoch": 4594} {"train_loss": -7.305591583251953, "global_step": 192951, "epoch": 4594} {"train_loss": -7.259750843048096, "global_step": 192952, "epoch": 4594} {"train_loss": -7.300595283508301, "global_step": 192953, "epoch": 4594} {"train_loss": -7.279342174530029, "global_step": 192954, "epoch": 4594} {"train_loss": -7.322747707366943, "global_step": 192955, "epoch": 4594} {"train_loss": -7.325136184692383, "global_step": 192956, "epoch": 4594} {"train_loss": -7.296582221984863, "global_step": 192957, "epoch": 4594} {"train_loss": -7.253260612487793, "global_step": 192958, "epoch": 4594} {"train_loss": -7.227427959442139, "global_step": 192959, "epoch": 4594} {"train_loss": -7.3495259284973145, "global_step": 192960, "epoch": 4594} {"train_loss": -7.216999053955078, "global_step": 192961, "epoch": 4594} {"train_loss": -7.199685573577881, "global_step": 192962, "epoch": 4594} {"train_loss": -7.298452377319336, "global_step": 192963, "epoch": 4594} {"train_loss": -7.197577476501465, "global_step": 192964, "epoch": 4594} {"train_loss": -7.237837314605713, "global_step": 192965, "epoch": 4594} {"train_loss": -7.234691143035889, "global_step": 192966, "epoch": 4594} {"train_loss": -7.211050033569336, "global_step": 192967, "epoch": 4594} {"train_loss": -7.100775718688965, "global_step": 192968, "epoch": 4594} {"train_loss": -7.303600788116455, "global_step": 192969, "epoch": 4594} {"train_loss": -7.159276962280273, "global_step": 192970, "epoch": 4594} {"train_loss": -7.145770072937012, "global_step": 192971, "epoch": 4594} {"train_loss": -7.162309169769287, "global_step": 192972, "epoch": 4594} {"train_loss": -7.210539817810059, "global_step": 192973, "epoch": 4594} {"train_loss": -7.1876630783081055, "global_step": 192974, "epoch": 4594} {"train_loss": -7.127820014953613, "global_step": 192975, "epoch": 4594} {"train_loss": -7.230440139770508, "global_step": 192976, "epoch": 4594} {"train_loss": -7.061502456665039, "global_step": 192977, "epoch": 4594} {"train_loss": -7.205458164215088, "global_step": 192978, "epoch": 4594} {"train_loss": -7.024595260620117, "global_step": 192979, "epoch": 4594} {"train_loss": -7.104389190673828, "global_step": 192980, "epoch": 4594} {"train_loss": -7.242663383483887, "global_step": 192981, "epoch": 4594} {"train_loss": -7.14838981628418, "global_step": 192982, "epoch": 4594} {"train_loss": -7.225383281707764, "global_step": 192983, "epoch": 4594} {"train_loss": -7.214715957641602, "global_step": 192984, "epoch": 4594} {"train_loss": -7.108171463012695, "global_step": 192985, "epoch": 4594} {"train_loss": -7.335710048675537, "global_step": 192986, "epoch": 4594} {"train_loss": -7.186626434326172, "global_step": 192987, "epoch": 4594} {"train_loss": -7.181715488433838, "global_step": 192988, "epoch": 4594} {"train_loss": -7.213070381255377, "global_step": 192989, "epoch": 4594, "val_loss": 69622.1640625} {"train_loss": -7.230954170227051, "global_step": 192990, "epoch": 4595} {"train_loss": -7.224200248718262, "global_step": 192991, "epoch": 4595} {"train_loss": -7.238824844360352, "global_step": 192992, "epoch": 4595} {"train_loss": -7.201250076293945, "global_step": 192993, "epoch": 4595} {"train_loss": -7.359823226928711, "global_step": 192994, "epoch": 4595} {"train_loss": -7.054511547088623, "global_step": 192995, "epoch": 4595} {"train_loss": -7.259110450744629, "global_step": 192996, "epoch": 4595} {"train_loss": -7.197296142578125, "global_step": 192997, "epoch": 4595} {"train_loss": -7.079713344573975, "global_step": 192998, "epoch": 4595} {"train_loss": -7.321751117706299, "global_step": 192999, "epoch": 4595} {"train_loss": -7.362401962280273, "global_step": 193000, "epoch": 4595} {"train_loss": -7.27518367767334, "global_step": 193001, "epoch": 4595} {"train_loss": -7.19174861907959, "global_step": 193002, "epoch": 4595} {"train_loss": -7.1328840255737305, "global_step": 193003, "epoch": 4595} {"train_loss": -7.258549690246582, "global_step": 193004, "epoch": 4595} {"train_loss": -7.273901462554932, "global_step": 193005, "epoch": 4595} {"train_loss": -7.262305736541748, "global_step": 193006, "epoch": 4595} {"train_loss": -7.207455635070801, "global_step": 193007, "epoch": 4595} {"train_loss": -7.07275390625, "global_step": 193008, "epoch": 4595} {"train_loss": -7.021664619445801, "global_step": 193009, "epoch": 4595} {"train_loss": -7.162054061889648, "global_step": 193010, "epoch": 4595} {"train_loss": -7.2410888671875, "global_step": 193011, "epoch": 4595} {"train_loss": -7.165321350097656, "global_step": 193012, "epoch": 4595} {"train_loss": -7.052767753601074, "global_step": 193013, "epoch": 4595} {"train_loss": -7.243462562561035, "global_step": 193014, "epoch": 4595} {"train_loss": -7.131283760070801, "global_step": 193015, "epoch": 4595} {"train_loss": -7.271386623382568, "global_step": 193016, "epoch": 4595} {"train_loss": -7.26032018661499, "global_step": 193017, "epoch": 4595} {"train_loss": -7.246979713439941, "global_step": 193018, "epoch": 4595} {"train_loss": -7.1881513595581055, "global_step": 193019, "epoch": 4595} {"train_loss": -7.246988296508789, "global_step": 193020, "epoch": 4595} {"train_loss": -7.374603271484375, "global_step": 193021, "epoch": 4595} {"train_loss": -7.168822288513184, "global_step": 193022, "epoch": 4595} {"train_loss": -7.251214981079102, "global_step": 193023, "epoch": 4595} {"train_loss": -7.239282608032227, "global_step": 193024, "epoch": 4595} {"train_loss": -7.250897407531738, "global_step": 193025, "epoch": 4595} {"train_loss": -7.207735538482666, "global_step": 193026, "epoch": 4595} {"train_loss": -7.210561752319336, "global_step": 193027, "epoch": 4595} {"train_loss": -7.210320472717285, "global_step": 193028, "epoch": 4595} {"train_loss": -7.193375587463379, "global_step": 193029, "epoch": 4595} {"train_loss": -7.309920310974121, "global_step": 193030, "epoch": 4595} {"train_loss": -7.217397553580148, "global_step": 193031, "epoch": 4595, "val_loss": 69561.1875} {"train_loss": -7.266292572021484, "global_step": 193032, "epoch": 4596} {"train_loss": -7.18031120300293, "global_step": 193033, "epoch": 4596} {"train_loss": -7.228641986846924, "global_step": 193034, "epoch": 4596} {"train_loss": -7.22589111328125, "global_step": 193035, "epoch": 4596} {"train_loss": -7.183023452758789, "global_step": 193036, "epoch": 4596} {"train_loss": -7.153238296508789, "global_step": 193037, "epoch": 4596} {"train_loss": -7.293537139892578, "global_step": 193038, "epoch": 4596} {"train_loss": -7.176551818847656, "global_step": 193039, "epoch": 4596} {"train_loss": -7.292530059814453, "global_step": 193040, "epoch": 4596} {"train_loss": -7.400010108947754, "global_step": 193041, "epoch": 4596} {"train_loss": -7.171021938323975, "global_step": 193042, "epoch": 4596} {"train_loss": -7.243841171264648, "global_step": 193043, "epoch": 4596} {"train_loss": -7.207987308502197, "global_step": 193044, "epoch": 4596} {"train_loss": -7.347441673278809, "global_step": 193045, "epoch": 4596} {"train_loss": -7.180943012237549, "global_step": 193046, "epoch": 4596} {"train_loss": -7.229153633117676, "global_step": 193047, "epoch": 4596} {"train_loss": -7.210262298583984, "global_step": 193048, "epoch": 4596} {"train_loss": -7.26319694519043, "global_step": 193049, "epoch": 4596} {"train_loss": -7.141849517822266, "global_step": 193050, "epoch": 4596} {"train_loss": -7.075806140899658, "global_step": 193051, "epoch": 4596} {"train_loss": -7.123059272766113, "global_step": 193052, "epoch": 4596} {"train_loss": -7.133206367492676, "global_step": 193053, "epoch": 4596} {"train_loss": -7.152320384979248, "global_step": 193054, "epoch": 4596} {"train_loss": -7.211402416229248, "global_step": 193055, "epoch": 4596} {"train_loss": -7.1197428703308105, "global_step": 193056, "epoch": 4596} {"train_loss": -7.203193664550781, "global_step": 193057, "epoch": 4596} {"train_loss": -7.296377182006836, "global_step": 193058, "epoch": 4596} {"train_loss": -7.282846927642822, "global_step": 193059, "epoch": 4596} {"train_loss": -7.170475959777832, "global_step": 193060, "epoch": 4596} {"train_loss": -7.140447616577148, "global_step": 193061, "epoch": 4596} {"train_loss": -7.235652923583984, "global_step": 193062, "epoch": 4596} {"train_loss": -7.155044078826904, "global_step": 193063, "epoch": 4596} {"train_loss": -7.17736291885376, "global_step": 193064, "epoch": 4596} {"train_loss": -7.2147932052612305, "global_step": 193065, "epoch": 4596} {"train_loss": -7.086806774139404, "global_step": 193066, "epoch": 4596} {"train_loss": -7.212475776672363, "global_step": 193067, "epoch": 4596} {"train_loss": -7.133548736572266, "global_step": 193068, "epoch": 4596} {"train_loss": -7.0723066329956055, "global_step": 193069, "epoch": 4596} {"train_loss": -7.251926422119141, "global_step": 193070, "epoch": 4596} {"train_loss": -7.028580665588379, "global_step": 193071, "epoch": 4596} {"train_loss": -7.080678939819336, "global_step": 193072, "epoch": 4596} {"train_loss": -7.1956680956340975, "global_step": 193073, "epoch": 4596, "val_loss": 69694.875} {"train_loss": -7.170779705047607, "global_step": 193074, "epoch": 4597} {"train_loss": -7.210561752319336, "global_step": 193075, "epoch": 4597} {"train_loss": -7.194218635559082, "global_step": 193076, "epoch": 4597} {"train_loss": -7.104396820068359, "global_step": 193077, "epoch": 4597} {"train_loss": -7.203249454498291, "global_step": 193078, "epoch": 4597} {"train_loss": -7.222597122192383, "global_step": 193079, "epoch": 4597} {"train_loss": -7.096555709838867, "global_step": 193080, "epoch": 4597} {"train_loss": -7.294403076171875, "global_step": 193081, "epoch": 4597} {"train_loss": -7.154455184936523, "global_step": 193082, "epoch": 4597} {"train_loss": -7.299696445465088, "global_step": 193083, "epoch": 4597} {"train_loss": -7.168303489685059, "global_step": 193084, "epoch": 4597} {"train_loss": -7.166293144226074, "global_step": 193085, "epoch": 4597} {"train_loss": -7.175682067871094, "global_step": 193086, "epoch": 4597} {"train_loss": -7.212386131286621, "global_step": 193087, "epoch": 4597} {"train_loss": -7.193444728851318, "global_step": 193088, "epoch": 4597} {"train_loss": -7.143102645874023, "global_step": 193089, "epoch": 4597} {"train_loss": -7.240655899047852, "global_step": 193090, "epoch": 4597} {"train_loss": -7.258970737457275, "global_step": 193091, "epoch": 4597} {"train_loss": -7.086878776550293, "global_step": 193092, "epoch": 4597} {"train_loss": -7.1888508796691895, "global_step": 193093, "epoch": 4597} {"train_loss": -7.146762847900391, "global_step": 193094, "epoch": 4597} {"train_loss": -7.106575012207031, "global_step": 193095, "epoch": 4597} {"train_loss": -7.210599899291992, "global_step": 193096, "epoch": 4597} {"train_loss": -7.016057014465332, "global_step": 193097, "epoch": 4597} {"train_loss": -7.191340446472168, "global_step": 193098, "epoch": 4597} {"train_loss": -7.071206092834473, "global_step": 193099, "epoch": 4597} {"train_loss": -7.077854156494141, "global_step": 193100, "epoch": 4597} {"train_loss": -7.11042594909668, "global_step": 193101, "epoch": 4597} {"train_loss": -7.022088050842285, "global_step": 193102, "epoch": 4597} {"train_loss": -7.203793525695801, "global_step": 193103, "epoch": 4597} {"train_loss": -6.951565742492676, "global_step": 193104, "epoch": 4597} {"train_loss": -7.052315711975098, "global_step": 193105, "epoch": 4597} {"train_loss": -7.090458869934082, "global_step": 193106, "epoch": 4597} {"train_loss": -7.000134468078613, "global_step": 193107, "epoch": 4597} {"train_loss": -7.208931922912598, "global_step": 193108, "epoch": 4597} {"train_loss": -6.981503009796143, "global_step": 193109, "epoch": 4597} {"train_loss": -7.058849334716797, "global_step": 193110, "epoch": 4597} {"train_loss": -7.237551689147949, "global_step": 193111, "epoch": 4597} {"train_loss": -7.047980785369873, "global_step": 193112, "epoch": 4597} {"train_loss": -7.129049301147461, "global_step": 193113, "epoch": 4597} {"train_loss": -7.090982437133789, "global_step": 193114, "epoch": 4597} {"train_loss": -7.141837528773716, "global_step": 193115, "epoch": 4597, "val_loss": 69846.9609375} {"train_loss": -7.028778553009033, "global_step": 193116, "epoch": 4598} {"train_loss": -7.2066874504089355, "global_step": 193117, "epoch": 4598} {"train_loss": -6.999209880828857, "global_step": 193118, "epoch": 4598} {"train_loss": -7.155069351196289, "global_step": 193119, "epoch": 4598} {"train_loss": -7.116921901702881, "global_step": 193120, "epoch": 4598} {"train_loss": -7.0593109130859375, "global_step": 193121, "epoch": 4598} {"train_loss": -7.144634246826172, "global_step": 193122, "epoch": 4598} {"train_loss": -7.0674214363098145, "global_step": 193123, "epoch": 4598} {"train_loss": -7.180591583251953, "global_step": 193124, "epoch": 4598} {"train_loss": -7.045953273773193, "global_step": 193125, "epoch": 4598} {"train_loss": -7.148684978485107, "global_step": 193126, "epoch": 4598} {"train_loss": -7.151440620422363, "global_step": 193127, "epoch": 4598} {"train_loss": -7.135138511657715, "global_step": 193128, "epoch": 4598} {"train_loss": -7.215364933013916, "global_step": 193129, "epoch": 4598} {"train_loss": -7.212277412414551, "global_step": 193130, "epoch": 4598} {"train_loss": -7.096017837524414, "global_step": 193131, "epoch": 4598} {"train_loss": -7.132922172546387, "global_step": 193132, "epoch": 4598} {"train_loss": -7.175893783569336, "global_step": 193133, "epoch": 4598} {"train_loss": -7.228419303894043, "global_step": 193134, "epoch": 4598} {"train_loss": -7.276933670043945, "global_step": 193135, "epoch": 4598} {"train_loss": -7.179912090301514, "global_step": 193136, "epoch": 4598} {"train_loss": -7.250861644744873, "global_step": 193137, "epoch": 4598} {"train_loss": -7.252608299255371, "global_step": 193138, "epoch": 4598} {"train_loss": -7.2036638259887695, "global_step": 193139, "epoch": 4598} {"train_loss": -7.257683753967285, "global_step": 193140, "epoch": 4598} {"train_loss": -7.2475786209106445, "global_step": 193141, "epoch": 4598} {"train_loss": -7.233944892883301, "global_step": 193142, "epoch": 4598} {"train_loss": -7.281135559082031, "global_step": 193143, "epoch": 4598} {"train_loss": -7.253053665161133, "global_step": 193144, "epoch": 4598} {"train_loss": -7.215039253234863, "global_step": 193145, "epoch": 4598} {"train_loss": -7.293838977813721, "global_step": 193146, "epoch": 4598} {"train_loss": -7.242643356323242, "global_step": 193147, "epoch": 4598} {"train_loss": -7.361830711364746, "global_step": 193148, "epoch": 4598} {"train_loss": -7.340485572814941, "global_step": 193149, "epoch": 4598} {"train_loss": -7.344650745391846, "global_step": 193150, "epoch": 4598} {"train_loss": -7.295053958892822, "global_step": 193151, "epoch": 4598} {"train_loss": -7.2997918128967285, "global_step": 193152, "epoch": 4598} {"train_loss": -7.188654899597168, "global_step": 193153, "epoch": 4598} {"train_loss": -7.256584167480469, "global_step": 193154, "epoch": 4598} {"train_loss": -7.265964508056641, "global_step": 193155, "epoch": 4598} {"train_loss": -7.305267333984375, "global_step": 193156, "epoch": 4598} {"train_loss": -7.205871298199608, "global_step": 193157, "epoch": 4598, "val_loss": 69536.53125} {"train_loss": -7.23960542678833, "global_step": 193158, "epoch": 4599} {"train_loss": -7.2336225509643555, "global_step": 193159, "epoch": 4599} {"train_loss": -7.281854629516602, "global_step": 193160, "epoch": 4599} {"train_loss": -7.248322486877441, "global_step": 193161, "epoch": 4599} {"train_loss": -7.25297212600708, "global_step": 193162, "epoch": 4599} {"train_loss": -7.2467474937438965, "global_step": 193163, "epoch": 4599} {"train_loss": -7.3382792472839355, "global_step": 193164, "epoch": 4599} {"train_loss": -7.300222396850586, "global_step": 193165, "epoch": 4599} {"train_loss": -7.343227386474609, "global_step": 193166, "epoch": 4599} {"train_loss": -7.270839691162109, "global_step": 193167, "epoch": 4599} {"train_loss": -7.289322853088379, "global_step": 193168, "epoch": 4599} {"train_loss": -7.352877616882324, "global_step": 193169, "epoch": 4599} {"train_loss": -7.324797630310059, "global_step": 193170, "epoch": 4599} {"train_loss": -7.334151268005371, "global_step": 193171, "epoch": 4599} {"train_loss": -7.284875392913818, "global_step": 193172, "epoch": 4599} {"train_loss": -7.340024948120117, "global_step": 193173, "epoch": 4599} {"train_loss": -7.354689121246338, "global_step": 193174, "epoch": 4599} {"train_loss": -7.097829818725586, "global_step": 193175, "epoch": 4599} {"train_loss": -7.126441955566406, "global_step": 193176, "epoch": 4599} {"train_loss": -7.221438884735107, "global_step": 193177, "epoch": 4599} {"train_loss": -7.192562103271484, "global_step": 193178, "epoch": 4599} {"train_loss": -7.229329586029053, "global_step": 193179, "epoch": 4599} {"train_loss": -7.201888561248779, "global_step": 193180, "epoch": 4599} {"train_loss": -7.236848831176758, "global_step": 193181, "epoch": 4599} {"train_loss": -7.164654731750488, "global_step": 193182, "epoch": 4599} {"train_loss": -7.302540302276611, "global_step": 193183, "epoch": 4599} {"train_loss": -7.235507965087891, "global_step": 193184, "epoch": 4599} {"train_loss": -7.267163276672363, "global_step": 193185, "epoch": 4599} {"train_loss": -7.217535972595215, "global_step": 193186, "epoch": 4599} {"train_loss": -7.139199256896973, "global_step": 193187, "epoch": 4599} {"train_loss": -7.26756477355957, "global_step": 193188, "epoch": 4599} {"train_loss": -7.293240547180176, "global_step": 193189, "epoch": 4599} {"train_loss": -7.290403842926025, "global_step": 193190, "epoch": 4599} {"train_loss": -7.266255855560303, "global_step": 193191, "epoch": 4599} {"train_loss": -7.343171119689941, "global_step": 193192, "epoch": 4599} {"train_loss": -7.191561698913574, "global_step": 193193, "epoch": 4599} {"train_loss": -7.248702049255371, "global_step": 193194, "epoch": 4599} {"train_loss": -7.336874008178711, "global_step": 193195, "epoch": 4599} {"train_loss": -7.242814064025879, "global_step": 193196, "epoch": 4599} {"train_loss": -7.291287899017334, "global_step": 193197, "epoch": 4599} {"train_loss": -6.9705095291137695, "global_step": 193198, "epoch": 4599} {"train_loss": -7.248468841825213, "global_step": 193199, "epoch": 4599, "val_loss": 69632.921875} {"train_loss": -7.2090044021606445, "global_step": 193200, "epoch": 4600} {"train_loss": -7.344668865203857, "global_step": 193201, "epoch": 4600} {"train_loss": -7.219771862030029, "global_step": 193202, "epoch": 4600} {"train_loss": -7.3124566078186035, "global_step": 193203, "epoch": 4600} {"train_loss": -7.17867374420166, "global_step": 193204, "epoch": 4600} {"train_loss": -7.265174865722656, "global_step": 193205, "epoch": 4600} {"train_loss": -7.18501091003418, "global_step": 193206, "epoch": 4600} {"train_loss": -7.141484260559082, "global_step": 193207, "epoch": 4600} {"train_loss": -7.202612400054932, "global_step": 193208, "epoch": 4600} {"train_loss": -7.225383758544922, "global_step": 193209, "epoch": 4600} {"train_loss": -7.331334114074707, "global_step": 193210, "epoch": 4600} {"train_loss": -7.138175010681152, "global_step": 193211, "epoch": 4600} {"train_loss": -7.1989827156066895, "global_step": 193212, "epoch": 4600} {"train_loss": -7.261173248291016, "global_step": 193213, "epoch": 4600} {"train_loss": -7.233150482177734, "global_step": 193214, "epoch": 4600} {"train_loss": -7.257850646972656, "global_step": 193215, "epoch": 4600} {"train_loss": -7.27176570892334, "global_step": 193216, "epoch": 4600} {"train_loss": -7.074019432067871, "global_step": 193217, "epoch": 4600} {"train_loss": -7.235403537750244, "global_step": 193218, "epoch": 4600} {"train_loss": -7.143481731414795, "global_step": 193219, "epoch": 4600} {"train_loss": -7.052657127380371, "global_step": 193220, "epoch": 4600} {"train_loss": -7.177583694458008, "global_step": 193221, "epoch": 4600} {"train_loss": -7.305154800415039, "global_step": 193222, "epoch": 4600} {"train_loss": -7.182950019836426, "global_step": 193223, "epoch": 4600} {"train_loss": -7.2002973556518555, "global_step": 193224, "epoch": 4600} {"train_loss": -7.199711799621582, "global_step": 193225, "epoch": 4600} {"train_loss": -7.298521041870117, "global_step": 193226, "epoch": 4600} {"train_loss": -7.191298961639404, "global_step": 193227, "epoch": 4600} {"train_loss": -7.2408576011657715, "global_step": 193228, "epoch": 4600} {"train_loss": -7.123378276824951, "global_step": 193229, "epoch": 4600} {"train_loss": -7.204249382019043, "global_step": 193230, "epoch": 4600} {"train_loss": -7.256274223327637, "global_step": 193231, "epoch": 4600} {"train_loss": -7.167031288146973, "global_step": 193232, "epoch": 4600} {"train_loss": -7.20505428314209, "global_step": 193233, "epoch": 4600} {"train_loss": -7.291996955871582, "global_step": 193234, "epoch": 4600} {"train_loss": -7.343982696533203, "global_step": 193235, "epoch": 4600} {"train_loss": -7.16047477722168, "global_step": 193236, "epoch": 4600} {"train_loss": -7.25260066986084, "global_step": 193237, "epoch": 4600} {"train_loss": -7.277955055236816, "global_step": 193238, "epoch": 4600} {"train_loss": -7.259012222290039, "global_step": 193239, "epoch": 4600} {"train_loss": -7.23674201965332, "global_step": 193240, "epoch": 4600} {"train_loss": -7.2222213972182505, "global_step": 193241, "epoch": 4600, "train/sim_max_reward_0": 0.1940307411747846, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.8239016442245004, "train/sim_max_reward_3": 0.14155355975978756, "train/sim_max_reward_4": 0.882437012492949, "train/sim_max_reward_5": 0.20271746005057953, "test/sim_max_reward_4300000": 1.0, "test/sim_max_reward_4300001": 0.15856306911424822, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 0.9620767192508227, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.2925525969529994, "test/sim_max_reward_4300008": 0.4179724538464782, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.8886403077897049, "test/sim_max_reward_4300011": 0.9921370555756205, "test/sim_max_reward_4300012": 0.9743344737717975, "test/sim_max_reward_4300013": 0.40135253704099605, "test/sim_max_reward_4300014": 0.9706335215873406, "test/sim_max_reward_4300015": 0.9902446307308165, "test/sim_max_reward_4300016": 0.9697884786587118, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.3699309528834029, "test/sim_max_reward_4300019": 0.18596055313358995, "test/sim_max_reward_4300020": 0.00997988488374456, "test/sim_max_reward_4300021": 0.8427281269655117, "test/sim_max_reward_4300022": 0.9261154498438464, "test/sim_max_reward_4300023": 0.4816021003351824, "test/sim_max_reward_4300024": 0.5357701995458446, "test/sim_max_reward_4300025": 0.9376378668424945, "test/sim_max_reward_4300026": 0.18561625347132682, "test/sim_max_reward_4300027": 0.9197540667606814, "test/sim_max_reward_4300028": 0.9490450180474205, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.28576044822862506, "test/sim_max_reward_4300031": 0.8973273149546684, "test/sim_max_reward_4300032": 0.9733286674562343, "test/sim_max_reward_4300033": 0.7035079419610724, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.0, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.5998030493906058, "test/sim_max_reward_4300038": 0.9384775634018152, "test/sim_max_reward_4300039": 0.8031068426042138, "test/sim_max_reward_4300040": 0.9954270533795078, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7042529559830778, "test/sim_max_reward_4300043": 0.10547533554938293, "test/sim_max_reward_4300044": 1.0, "test/sim_max_reward_4300045": 0.19640464140878075, "test/sim_max_reward_4300046": 0.8992149422636226, "test/sim_max_reward_4300047": 0.14015328361827797, "test/sim_max_reward_4300048": 0.0006845197585733277, "test/sim_max_reward_4300049": 0.0787847125078575, "train/mean_score": 0.5407734029504335, "test/mean_score": 0.5779834761974333, "val_loss": 69623.1015625} {"train_loss": -7.228011608123779, "global_step": 193242, "epoch": 4601} {"train_loss": -7.253262042999268, "global_step": 193243, "epoch": 4601} {"train_loss": -7.192024230957031, "global_step": 193244, "epoch": 4601} {"train_loss": -7.235041618347168, "global_step": 193245, "epoch": 4601} {"train_loss": -7.264243125915527, "global_step": 193246, "epoch": 4601} {"train_loss": -7.3158979415893555, "global_step": 193247, "epoch": 4601} {"train_loss": -7.197576522827148, "global_step": 193248, "epoch": 4601} {"train_loss": -7.129075050354004, "global_step": 193249, "epoch": 4601} {"train_loss": -7.239461898803711, "global_step": 193250, "epoch": 4601} {"train_loss": -7.215601921081543, "global_step": 193251, "epoch": 4601} {"train_loss": -7.2827229499816895, "global_step": 193252, "epoch": 4601} {"train_loss": -7.208796501159668, "global_step": 193253, "epoch": 4601} {"train_loss": -7.18508768081665, "global_step": 193254, "epoch": 4601} {"train_loss": -7.22944450378418, "global_step": 193255, "epoch": 4601} {"train_loss": -7.126044273376465, "global_step": 193256, "epoch": 4601} {"train_loss": -7.314483642578125, "global_step": 193257, "epoch": 4601} {"train_loss": -7.182168483734131, "global_step": 193258, "epoch": 4601} {"train_loss": -7.159930229187012, "global_step": 193259, "epoch": 4601} {"train_loss": -7.096571922302246, "global_step": 193260, "epoch": 4601} {"train_loss": -7.094579219818115, "global_step": 193261, "epoch": 4601} {"train_loss": -7.071727752685547, "global_step": 193262, "epoch": 4601} {"train_loss": -7.108556747436523, "global_step": 193263, "epoch": 4601} {"train_loss": -7.18499231338501, "global_step": 193264, "epoch": 4601} {"train_loss": -7.133851051330566, "global_step": 193265, "epoch": 4601} {"train_loss": -7.053380012512207, "global_step": 193266, "epoch": 4601} {"train_loss": -7.096044540405273, "global_step": 193267, "epoch": 4601} {"train_loss": -7.172292709350586, "global_step": 193268, "epoch": 4601} {"train_loss": -7.103005409240723, "global_step": 193269, "epoch": 4601} {"train_loss": -7.106879711151123, "global_step": 193270, "epoch": 4601} {"train_loss": -7.1263041496276855, "global_step": 193271, "epoch": 4601} {"train_loss": -7.0586748123168945, "global_step": 193272, "epoch": 4601} {"train_loss": -7.1348161697387695, "global_step": 193273, "epoch": 4601} {"train_loss": -7.164092063903809, "global_step": 193274, "epoch": 4601} {"train_loss": -7.272927284240723, "global_step": 193275, "epoch": 4601} {"train_loss": -7.18271541595459, "global_step": 193276, "epoch": 4601} {"train_loss": -7.272994041442871, "global_step": 193277, "epoch": 4601} {"train_loss": -7.165467262268066, "global_step": 193278, "epoch": 4601} {"train_loss": -7.192191123962402, "global_step": 193279, "epoch": 4601} {"train_loss": -7.255727767944336, "global_step": 193280, "epoch": 4601} {"train_loss": -7.161943435668945, "global_step": 193281, "epoch": 4601} {"train_loss": -7.270837306976318, "global_step": 193282, "epoch": 4601} {"train_loss": -7.180256548381987, "global_step": 193283, "epoch": 4601, "val_loss": 69759.3671875} {"train_loss": -7.220304012298584, "global_step": 193284, "epoch": 4602} {"train_loss": -7.2066545486450195, "global_step": 193285, "epoch": 4602} {"train_loss": -7.239113807678223, "global_step": 193286, "epoch": 4602} {"train_loss": -7.295610427856445, "global_step": 193287, "epoch": 4602} {"train_loss": -7.178133010864258, "global_step": 193288, "epoch": 4602} {"train_loss": -7.039815902709961, "global_step": 193289, "epoch": 4602} {"train_loss": -7.307405471801758, "global_step": 193290, "epoch": 4602} {"train_loss": -7.1304521560668945, "global_step": 193291, "epoch": 4602} {"train_loss": -7.152000427246094, "global_step": 193292, "epoch": 4602} {"train_loss": -7.165583610534668, "global_step": 193293, "epoch": 4602} {"train_loss": -7.09896183013916, "global_step": 193294, "epoch": 4602} {"train_loss": -7.135659694671631, "global_step": 193295, "epoch": 4602} {"train_loss": -7.143150329589844, "global_step": 193296, "epoch": 4602} {"train_loss": -7.222947120666504, "global_step": 193297, "epoch": 4602} {"train_loss": -7.303877830505371, "global_step": 193298, "epoch": 4602} {"train_loss": -7.241601943969727, "global_step": 193299, "epoch": 4602} {"train_loss": -7.29958963394165, "global_step": 193300, "epoch": 4602} {"train_loss": -7.228184223175049, "global_step": 193301, "epoch": 4602} {"train_loss": -7.341067790985107, "global_step": 193302, "epoch": 4602} {"train_loss": -7.238807201385498, "global_step": 193303, "epoch": 4602} {"train_loss": -7.195234775543213, "global_step": 193304, "epoch": 4602} {"train_loss": -7.313595771789551, "global_step": 193305, "epoch": 4602} {"train_loss": -7.177563667297363, "global_step": 193306, "epoch": 4602} {"train_loss": -7.233852386474609, "global_step": 193307, "epoch": 4602} {"train_loss": -7.200225353240967, "global_step": 193308, "epoch": 4602} {"train_loss": -7.18838357925415, "global_step": 193309, "epoch": 4602} {"train_loss": -7.1482014656066895, "global_step": 193310, "epoch": 4602} {"train_loss": -7.152120113372803, "global_step": 193311, "epoch": 4602} {"train_loss": -7.03972053527832, "global_step": 193312, "epoch": 4602} {"train_loss": -7.124024391174316, "global_step": 193313, "epoch": 4602} {"train_loss": -7.0714640617370605, "global_step": 193314, "epoch": 4602} {"train_loss": -7.052600383758545, "global_step": 193315, "epoch": 4602} {"train_loss": -7.152369022369385, "global_step": 193316, "epoch": 4602} {"train_loss": -7.160723686218262, "global_step": 193317, "epoch": 4602} {"train_loss": -6.950140953063965, "global_step": 193318, "epoch": 4602} {"train_loss": -7.136845588684082, "global_step": 193319, "epoch": 4602} {"train_loss": -7.070016860961914, "global_step": 193320, "epoch": 4602} {"train_loss": -7.177213668823242, "global_step": 193321, "epoch": 4602} {"train_loss": -7.029514312744141, "global_step": 193322, "epoch": 4602} {"train_loss": -7.2433061599731445, "global_step": 193323, "epoch": 4602} {"train_loss": -7.241480827331543, "global_step": 193324, "epoch": 4602} {"train_loss": -7.176515465690976, "global_step": 193325, "epoch": 4602, "val_loss": 69893.8984375} {"train_loss": -7.163042068481445, "global_step": 193326, "epoch": 4603} {"train_loss": -7.093842029571533, "global_step": 193327, "epoch": 4603} {"train_loss": -7.174156188964844, "global_step": 193328, "epoch": 4603} {"train_loss": -7.239483833312988, "global_step": 193329, "epoch": 4603} {"train_loss": -7.3072123527526855, "global_step": 193330, "epoch": 4603} {"train_loss": -7.288735389709473, "global_step": 193331, "epoch": 4603} {"train_loss": -7.153728485107422, "global_step": 193332, "epoch": 4603} {"train_loss": -7.158113479614258, "global_step": 193333, "epoch": 4603} {"train_loss": -7.08197021484375, "global_step": 193334, "epoch": 4603} {"train_loss": -7.158062934875488, "global_step": 193335, "epoch": 4603} {"train_loss": -7.112179756164551, "global_step": 193336, "epoch": 4603} {"train_loss": -7.075037002563477, "global_step": 193337, "epoch": 4603} {"train_loss": -7.214685440063477, "global_step": 193338, "epoch": 4603} {"train_loss": -7.145698070526123, "global_step": 193339, "epoch": 4603} {"train_loss": -7.028456687927246, "global_step": 193340, "epoch": 4603} {"train_loss": -7.126700401306152, "global_step": 193341, "epoch": 4603} {"train_loss": -7.063724517822266, "global_step": 193342, "epoch": 4603} {"train_loss": -7.184134483337402, "global_step": 193343, "epoch": 4603} {"train_loss": -7.115828514099121, "global_step": 193344, "epoch": 4603} {"train_loss": -7.110913276672363, "global_step": 193345, "epoch": 4603} {"train_loss": -7.1812238693237305, "global_step": 193346, "epoch": 4603} {"train_loss": -7.034538269042969, "global_step": 193347, "epoch": 4603} {"train_loss": -7.1917243003845215, "global_step": 193348, "epoch": 4603} {"train_loss": -7.093009948730469, "global_step": 193349, "epoch": 4603} {"train_loss": -7.2234344482421875, "global_step": 193350, "epoch": 4603} {"train_loss": -7.177383899688721, "global_step": 193351, "epoch": 4603} {"train_loss": -7.271034240722656, "global_step": 193352, "epoch": 4603} {"train_loss": -7.149483680725098, "global_step": 193353, "epoch": 4603} {"train_loss": -7.057466506958008, "global_step": 193354, "epoch": 4603} {"train_loss": -7.146555423736572, "global_step": 193355, "epoch": 4603} {"train_loss": -7.059841632843018, "global_step": 193356, "epoch": 4603} {"train_loss": -7.260091781616211, "global_step": 193357, "epoch": 4603} {"train_loss": -7.119930267333984, "global_step": 193358, "epoch": 4603} {"train_loss": -7.238217353820801, "global_step": 193359, "epoch": 4603} {"train_loss": -7.162184715270996, "global_step": 193360, "epoch": 4603} {"train_loss": -7.265072345733643, "global_step": 193361, "epoch": 4603} {"train_loss": -7.211531639099121, "global_step": 193362, "epoch": 4603} {"train_loss": -7.1654372215271, "global_step": 193363, "epoch": 4603} {"train_loss": -7.147621154785156, "global_step": 193364, "epoch": 4603} {"train_loss": -7.279114246368408, "global_step": 193365, "epoch": 4603} {"train_loss": -7.201099395751953, "global_step": 193366, "epoch": 4603} {"train_loss": -7.161668311981928, "global_step": 193367, "epoch": 4603, "val_loss": 69769.6796875} {"train_loss": -7.189807891845703, "global_step": 193368, "epoch": 4604} {"train_loss": -7.19736909866333, "global_step": 193369, "epoch": 4604} {"train_loss": -7.337894916534424, "global_step": 193370, "epoch": 4604} {"train_loss": -7.084473133087158, "global_step": 193371, "epoch": 4604} {"train_loss": -7.1765313148498535, "global_step": 193372, "epoch": 4604} {"train_loss": -7.318131446838379, "global_step": 193373, "epoch": 4604} {"train_loss": -7.319851875305176, "global_step": 193374, "epoch": 4604} {"train_loss": -7.227166175842285, "global_step": 193375, "epoch": 4604} {"train_loss": -7.343079566955566, "global_step": 193376, "epoch": 4604} {"train_loss": -7.293982982635498, "global_step": 193377, "epoch": 4604} {"train_loss": -7.250370979309082, "global_step": 193378, "epoch": 4604} {"train_loss": -7.341487407684326, "global_step": 193379, "epoch": 4604} {"train_loss": -7.282299041748047, "global_step": 193380, "epoch": 4604} {"train_loss": -7.278177738189697, "global_step": 193381, "epoch": 4604} {"train_loss": -7.10198974609375, "global_step": 193382, "epoch": 4604} {"train_loss": -7.133413314819336, "global_step": 193383, "epoch": 4604} {"train_loss": -7.269153118133545, "global_step": 193384, "epoch": 4604} {"train_loss": -7.046360015869141, "global_step": 193385, "epoch": 4604} {"train_loss": -7.164502143859863, "global_step": 193386, "epoch": 4604} {"train_loss": -7.208584785461426, "global_step": 193387, "epoch": 4604} {"train_loss": -7.089243412017822, "global_step": 193388, "epoch": 4604} {"train_loss": -7.104267597198486, "global_step": 193389, "epoch": 4604} {"train_loss": -7.1484174728393555, "global_step": 193390, "epoch": 4604} {"train_loss": -7.0647430419921875, "global_step": 193391, "epoch": 4604} {"train_loss": -7.214973449707031, "global_step": 193392, "epoch": 4604} {"train_loss": -7.256998538970947, "global_step": 193393, "epoch": 4604} {"train_loss": -7.059666156768799, "global_step": 193394, "epoch": 4604} {"train_loss": -7.164341449737549, "global_step": 193395, "epoch": 4604} {"train_loss": -7.215768814086914, "global_step": 193396, "epoch": 4604} {"train_loss": -7.263711929321289, "global_step": 193397, "epoch": 4604} {"train_loss": -7.091048240661621, "global_step": 193398, "epoch": 4604} {"train_loss": -7.10835599899292, "global_step": 193399, "epoch": 4604} {"train_loss": -7.083160400390625, "global_step": 193400, "epoch": 4604} {"train_loss": -7.111706733703613, "global_step": 193401, "epoch": 4604} {"train_loss": -7.034658908843994, "global_step": 193402, "epoch": 4604} {"train_loss": -7.144774436950684, "global_step": 193403, "epoch": 4604} {"train_loss": -7.212723731994629, "global_step": 193404, "epoch": 4604} {"train_loss": -7.0846052169799805, "global_step": 193405, "epoch": 4604} {"train_loss": -7.127499103546143, "global_step": 193406, "epoch": 4604} {"train_loss": -7.186333656311035, "global_step": 193407, "epoch": 4604} {"train_loss": -7.176351547241211, "global_step": 193408, "epoch": 4604} {"train_loss": -7.180938380105155, "global_step": 193409, "epoch": 4604, "val_loss": 69816.96875} {"train_loss": -7.175717353820801, "global_step": 193410, "epoch": 4605} {"train_loss": -7.162822723388672, "global_step": 193411, "epoch": 4605} {"train_loss": -7.025778770446777, "global_step": 193412, "epoch": 4605} {"train_loss": -7.187058448791504, "global_step": 193413, "epoch": 4605} {"train_loss": -7.250298023223877, "global_step": 193414, "epoch": 4605} {"train_loss": -7.062397003173828, "global_step": 193415, "epoch": 4605} {"train_loss": -7.087810516357422, "global_step": 193416, "epoch": 4605} {"train_loss": -7.116626739501953, "global_step": 193417, "epoch": 4605} {"train_loss": -7.16349458694458, "global_step": 193418, "epoch": 4605} {"train_loss": -7.143502235412598, "global_step": 193419, "epoch": 4605} {"train_loss": -7.192317008972168, "global_step": 193420, "epoch": 4605} {"train_loss": -7.174290180206299, "global_step": 193421, "epoch": 4605} {"train_loss": -7.123424530029297, "global_step": 193422, "epoch": 4605} {"train_loss": -7.220791339874268, "global_step": 193423, "epoch": 4605} {"train_loss": -7.225312232971191, "global_step": 193424, "epoch": 4605} {"train_loss": -7.1483635902404785, "global_step": 193425, "epoch": 4605} {"train_loss": -7.245622634887695, "global_step": 193426, "epoch": 4605} {"train_loss": -7.148647308349609, "global_step": 193427, "epoch": 4605} {"train_loss": -7.136747360229492, "global_step": 193428, "epoch": 4605} {"train_loss": -7.229120254516602, "global_step": 193429, "epoch": 4605} {"train_loss": -7.1405839920043945, "global_step": 193430, "epoch": 4605} {"train_loss": -7.206117630004883, "global_step": 193431, "epoch": 4605} {"train_loss": -7.200787544250488, "global_step": 193432, "epoch": 4605} {"train_loss": -7.127646446228027, "global_step": 193433, "epoch": 4605} {"train_loss": -7.152467727661133, "global_step": 193434, "epoch": 4605} {"train_loss": -7.1510210037231445, "global_step": 193435, "epoch": 4605} {"train_loss": -7.134706020355225, "global_step": 193436, "epoch": 4605} {"train_loss": -7.160459995269775, "global_step": 193437, "epoch": 4605} {"train_loss": -7.031548976898193, "global_step": 193438, "epoch": 4605} {"train_loss": -7.23983097076416, "global_step": 193439, "epoch": 4605} {"train_loss": -7.0716471672058105, "global_step": 193440, "epoch": 4605} {"train_loss": -7.120118141174316, "global_step": 193441, "epoch": 4605} {"train_loss": -7.1546831130981445, "global_step": 193442, "epoch": 4605} {"train_loss": -7.176668167114258, "global_step": 193443, "epoch": 4605} {"train_loss": -7.150928974151611, "global_step": 193444, "epoch": 4605} {"train_loss": -7.163459777832031, "global_step": 193445, "epoch": 4605} {"train_loss": -7.169723987579346, "global_step": 193446, "epoch": 4605} {"train_loss": -7.200933456420898, "global_step": 193447, "epoch": 4605} {"train_loss": -7.195544719696045, "global_step": 193448, "epoch": 4605} {"train_loss": -7.1468305587768555, "global_step": 193449, "epoch": 4605} {"train_loss": -7.061295509338379, "global_step": 193450, "epoch": 4605} {"train_loss": -7.155066456113543, "global_step": 193451, "epoch": 4605, "val_loss": 69950.1484375} {"train_loss": -6.955315589904785, "global_step": 193452, "epoch": 4606} {"train_loss": -7.130596160888672, "global_step": 193453, "epoch": 4606} {"train_loss": -7.109803199768066, "global_step": 193454, "epoch": 4606} {"train_loss": -6.9544677734375, "global_step": 193455, "epoch": 4606} {"train_loss": -7.133209705352783, "global_step": 193456, "epoch": 4606} {"train_loss": -7.222831726074219, "global_step": 193457, "epoch": 4606} {"train_loss": -7.129302978515625, "global_step": 193458, "epoch": 4606} {"train_loss": -7.1216230392456055, "global_step": 193459, "epoch": 4606} {"train_loss": -7.115229606628418, "global_step": 193460, "epoch": 4606} {"train_loss": -7.164722442626953, "global_step": 193461, "epoch": 4606} {"train_loss": -7.224804878234863, "global_step": 193462, "epoch": 4606} {"train_loss": -7.108885765075684, "global_step": 193463, "epoch": 4606} {"train_loss": -7.1171650886535645, "global_step": 193464, "epoch": 4606} {"train_loss": -7.163782119750977, "global_step": 193465, "epoch": 4606} {"train_loss": -7.146085739135742, "global_step": 193466, "epoch": 4606} {"train_loss": -7.1577911376953125, "global_step": 193467, "epoch": 4606} {"train_loss": -7.142971992492676, "global_step": 193468, "epoch": 4606} {"train_loss": -7.282470226287842, "global_step": 193469, "epoch": 4606} {"train_loss": -7.259765148162842, "global_step": 193470, "epoch": 4606} {"train_loss": -7.179186820983887, "global_step": 193471, "epoch": 4606} {"train_loss": -7.334444046020508, "global_step": 193472, "epoch": 4606} {"train_loss": -7.184309005737305, "global_step": 193473, "epoch": 4606} {"train_loss": -7.167280197143555, "global_step": 193474, "epoch": 4606} {"train_loss": -7.2365522384643555, "global_step": 193475, "epoch": 4606} {"train_loss": -7.2500410079956055, "global_step": 193476, "epoch": 4606} {"train_loss": -7.173088073730469, "global_step": 193477, "epoch": 4606} {"train_loss": -7.164921760559082, "global_step": 193478, "epoch": 4606} {"train_loss": -7.2502641677856445, "global_step": 193479, "epoch": 4606} {"train_loss": -7.107995986938477, "global_step": 193480, "epoch": 4606} {"train_loss": -7.113643646240234, "global_step": 193481, "epoch": 4606} {"train_loss": -7.207082748413086, "global_step": 193482, "epoch": 4606} {"train_loss": -7.280378341674805, "global_step": 193483, "epoch": 4606} {"train_loss": -7.182892322540283, "global_step": 193484, "epoch": 4606} {"train_loss": -7.274804592132568, "global_step": 193485, "epoch": 4606} {"train_loss": -7.224625587463379, "global_step": 193486, "epoch": 4606} {"train_loss": -7.2097673416137695, "global_step": 193487, "epoch": 4606} {"train_loss": -7.182714939117432, "global_step": 193488, "epoch": 4606} {"train_loss": -7.3258466720581055, "global_step": 193489, "epoch": 4606} {"train_loss": -7.273242950439453, "global_step": 193490, "epoch": 4606} {"train_loss": -7.197709083557129, "global_step": 193491, "epoch": 4606} {"train_loss": -7.3417253494262695, "global_step": 193492, "epoch": 4606} {"train_loss": -7.186223313921974, "global_step": 193493, "epoch": 4606, "val_loss": 69689.03125} {"train_loss": -7.299776077270508, "global_step": 193494, "epoch": 4607} {"train_loss": -7.2526397705078125, "global_step": 193495, "epoch": 4607} {"train_loss": -7.3560662269592285, "global_step": 193496, "epoch": 4607} {"train_loss": -7.333930492401123, "global_step": 193497, "epoch": 4607} {"train_loss": -7.21860408782959, "global_step": 193498, "epoch": 4607} {"train_loss": -7.258017539978027, "global_step": 193499, "epoch": 4607} {"train_loss": -7.207743167877197, "global_step": 193500, "epoch": 4607} {"train_loss": -7.243658065795898, "global_step": 193501, "epoch": 4607} {"train_loss": -7.356904029846191, "global_step": 193502, "epoch": 4607} {"train_loss": -7.235975742340088, "global_step": 193503, "epoch": 4607} {"train_loss": -7.245506286621094, "global_step": 193504, "epoch": 4607} {"train_loss": -7.414292335510254, "global_step": 193505, "epoch": 4607} {"train_loss": -7.313178539276123, "global_step": 193506, "epoch": 4607} {"train_loss": -7.258273124694824, "global_step": 193507, "epoch": 4607} {"train_loss": -7.186892509460449, "global_step": 193508, "epoch": 4607} {"train_loss": -7.354930877685547, "global_step": 193509, "epoch": 4607} {"train_loss": -7.2336835861206055, "global_step": 193510, "epoch": 4607} {"train_loss": -7.207077980041504, "global_step": 193511, "epoch": 4607} {"train_loss": -7.3547492027282715, "global_step": 193512, "epoch": 4607} {"train_loss": -7.317725658416748, "global_step": 193513, "epoch": 4607} {"train_loss": -7.259282112121582, "global_step": 193514, "epoch": 4607} {"train_loss": -7.2852067947387695, "global_step": 193515, "epoch": 4607} {"train_loss": -7.361517906188965, "global_step": 193516, "epoch": 4607} {"train_loss": -7.238611698150635, "global_step": 193517, "epoch": 4607} {"train_loss": -7.170714378356934, "global_step": 193518, "epoch": 4607} {"train_loss": -7.298532485961914, "global_step": 193519, "epoch": 4607} {"train_loss": -7.333410263061523, "global_step": 193520, "epoch": 4607} {"train_loss": -7.3098039627075195, "global_step": 193521, "epoch": 4607} {"train_loss": -7.313764572143555, "global_step": 193522, "epoch": 4607} {"train_loss": -7.352313041687012, "global_step": 193523, "epoch": 4607} {"train_loss": -7.210169792175293, "global_step": 193524, "epoch": 4607} {"train_loss": -7.191437244415283, "global_step": 193525, "epoch": 4607} {"train_loss": -7.140935897827148, "global_step": 193526, "epoch": 4607} {"train_loss": -7.3554511070251465, "global_step": 193527, "epoch": 4607} {"train_loss": -7.269374370574951, "global_step": 193528, "epoch": 4607} {"train_loss": -7.06813383102417, "global_step": 193529, "epoch": 4607} {"train_loss": -7.16226863861084, "global_step": 193530, "epoch": 4607} {"train_loss": -7.200406074523926, "global_step": 193531, "epoch": 4607} {"train_loss": -7.144403457641602, "global_step": 193532, "epoch": 4607} {"train_loss": -7.125866889953613, "global_step": 193533, "epoch": 4607} {"train_loss": -7.114644527435303, "global_step": 193534, "epoch": 4607} {"train_loss": -7.254173346928188, "global_step": 193535, "epoch": 4607, "val_loss": 69721.1953125} {"train_loss": -7.084203720092773, "global_step": 193536, "epoch": 4608} {"train_loss": -7.0865044593811035, "global_step": 193537, "epoch": 4608} {"train_loss": -7.239818096160889, "global_step": 193538, "epoch": 4608} {"train_loss": -7.148275375366211, "global_step": 193539, "epoch": 4608} {"train_loss": -7.130504131317139, "global_step": 193540, "epoch": 4608} {"train_loss": -7.017777442932129, "global_step": 193541, "epoch": 4608} {"train_loss": -7.186155319213867, "global_step": 193542, "epoch": 4608} {"train_loss": -7.184046745300293, "global_step": 193543, "epoch": 4608} {"train_loss": -7.203552722930908, "global_step": 193544, "epoch": 4608} {"train_loss": -7.29503059387207, "global_step": 193545, "epoch": 4608} {"train_loss": -7.143228054046631, "global_step": 193546, "epoch": 4608} {"train_loss": -7.2072248458862305, "global_step": 193547, "epoch": 4608} {"train_loss": -7.075995445251465, "global_step": 193548, "epoch": 4608} {"train_loss": -7.125455379486084, "global_step": 193549, "epoch": 4608} {"train_loss": -7.301262378692627, "global_step": 193550, "epoch": 4608} {"train_loss": -7.100596904754639, "global_step": 193551, "epoch": 4608} {"train_loss": -7.122520923614502, "global_step": 193552, "epoch": 4608} {"train_loss": -7.200613975524902, "global_step": 193553, "epoch": 4608} {"train_loss": -7.1762590408325195, "global_step": 193554, "epoch": 4608} {"train_loss": -7.241668701171875, "global_step": 193555, "epoch": 4608} {"train_loss": -7.11109733581543, "global_step": 193556, "epoch": 4608} {"train_loss": -7.110773086547852, "global_step": 193557, "epoch": 4608} {"train_loss": -7.217752456665039, "global_step": 193558, "epoch": 4608} {"train_loss": -7.06450080871582, "global_step": 193559, "epoch": 4608} {"train_loss": -7.2988080978393555, "global_step": 193560, "epoch": 4608} {"train_loss": -7.051463603973389, "global_step": 193561, "epoch": 4608} {"train_loss": -7.230710983276367, "global_step": 193562, "epoch": 4608} {"train_loss": -7.184269905090332, "global_step": 193563, "epoch": 4608} {"train_loss": -7.153453350067139, "global_step": 193564, "epoch": 4608} {"train_loss": -7.220446586608887, "global_step": 193565, "epoch": 4608} {"train_loss": -7.192464828491211, "global_step": 193566, "epoch": 4608} {"train_loss": -7.207289695739746, "global_step": 193567, "epoch": 4608} {"train_loss": -7.134544372558594, "global_step": 193568, "epoch": 4608} {"train_loss": -7.3107500076293945, "global_step": 193569, "epoch": 4608} {"train_loss": -7.197017669677734, "global_step": 193570, "epoch": 4608} {"train_loss": -7.297159194946289, "global_step": 193571, "epoch": 4608} {"train_loss": -7.244627475738525, "global_step": 193572, "epoch": 4608} {"train_loss": -7.225086688995361, "global_step": 193573, "epoch": 4608} {"train_loss": -7.250164031982422, "global_step": 193574, "epoch": 4608} {"train_loss": -7.226804256439209, "global_step": 193575, "epoch": 4608} {"train_loss": -7.3047075271606445, "global_step": 193576, "epoch": 4608} {"train_loss": -7.184788158961704, "global_step": 193577, "epoch": 4608, "val_loss": 69784.46875} {"train_loss": -7.279035568237305, "global_step": 193578, "epoch": 4609} {"train_loss": -7.201396942138672, "global_step": 193579, "epoch": 4609} {"train_loss": -7.275943279266357, "global_step": 193580, "epoch": 4609} {"train_loss": -7.232386589050293, "global_step": 193581, "epoch": 4609} {"train_loss": -7.357539653778076, "global_step": 193582, "epoch": 4609} {"train_loss": -7.2139363288879395, "global_step": 193583, "epoch": 4609} {"train_loss": -7.353801727294922, "global_step": 193584, "epoch": 4609} {"train_loss": -7.223419666290283, "global_step": 193585, "epoch": 4609} {"train_loss": -7.325166702270508, "global_step": 193586, "epoch": 4609} {"train_loss": -7.17733097076416, "global_step": 193587, "epoch": 4609} {"train_loss": -7.306468963623047, "global_step": 193588, "epoch": 4609} {"train_loss": -7.371488571166992, "global_step": 193589, "epoch": 4609} {"train_loss": -7.171633720397949, "global_step": 193590, "epoch": 4609} {"train_loss": -7.259420394897461, "global_step": 193591, "epoch": 4609} {"train_loss": -7.2474164962768555, "global_step": 193592, "epoch": 4609} {"train_loss": -7.335680961608887, "global_step": 193593, "epoch": 4609} {"train_loss": -7.221418857574463, "global_step": 193594, "epoch": 4609} {"train_loss": -7.250252723693848, "global_step": 193595, "epoch": 4609} {"train_loss": -7.250739097595215, "global_step": 193596, "epoch": 4609} {"train_loss": -7.210944652557373, "global_step": 193597, "epoch": 4609} {"train_loss": -7.107870101928711, "global_step": 193598, "epoch": 4609} {"train_loss": -7.210773468017578, "global_step": 193599, "epoch": 4609} {"train_loss": -7.209036350250244, "global_step": 193600, "epoch": 4609} {"train_loss": -7.11391544342041, "global_step": 193601, "epoch": 4609} {"train_loss": -7.220612049102783, "global_step": 193602, "epoch": 4609} {"train_loss": -7.080075263977051, "global_step": 193603, "epoch": 4609} {"train_loss": -7.274395942687988, "global_step": 193604, "epoch": 4609} {"train_loss": -7.209331512451172, "global_step": 193605, "epoch": 4609} {"train_loss": -7.290395259857178, "global_step": 193606, "epoch": 4609} {"train_loss": -7.131290435791016, "global_step": 193607, "epoch": 4609} {"train_loss": -7.197858810424805, "global_step": 193608, "epoch": 4609} {"train_loss": -7.23793888092041, "global_step": 193609, "epoch": 4609} {"train_loss": -7.113556385040283, "global_step": 193610, "epoch": 4609} {"train_loss": -7.1355061531066895, "global_step": 193611, "epoch": 4609} {"train_loss": -7.175920486450195, "global_step": 193612, "epoch": 4609} {"train_loss": -7.312231063842773, "global_step": 193613, "epoch": 4609} {"train_loss": -7.112023830413818, "global_step": 193614, "epoch": 4609} {"train_loss": -7.17488956451416, "global_step": 193615, "epoch": 4609} {"train_loss": -7.138547420501709, "global_step": 193616, "epoch": 4609} {"train_loss": -7.320011138916016, "global_step": 193617, "epoch": 4609} {"train_loss": -7.264354228973389, "global_step": 193618, "epoch": 4609} {"train_loss": -7.228177116030738, "global_step": 193619, "epoch": 4609, "val_loss": 69685.0234375} {"train_loss": -7.307109355926514, "global_step": 193620, "epoch": 4610} {"train_loss": -7.325370788574219, "global_step": 193621, "epoch": 4610} {"train_loss": -7.2425761222839355, "global_step": 193622, "epoch": 4610} {"train_loss": -7.306756973266602, "global_step": 193623, "epoch": 4610} {"train_loss": -7.188669681549072, "global_step": 193624, "epoch": 4610} {"train_loss": -7.170818328857422, "global_step": 193625, "epoch": 4610} {"train_loss": -7.372355937957764, "global_step": 193626, "epoch": 4610} {"train_loss": -7.200009822845459, "global_step": 193627, "epoch": 4610} {"train_loss": -7.282496452331543, "global_step": 193628, "epoch": 4610} {"train_loss": -7.228065490722656, "global_step": 193629, "epoch": 4610} {"train_loss": -7.131117820739746, "global_step": 193630, "epoch": 4610} {"train_loss": -7.259297847747803, "global_step": 193631, "epoch": 4610} {"train_loss": -7.258813858032227, "global_step": 193632, "epoch": 4610} {"train_loss": -7.262306213378906, "global_step": 193633, "epoch": 4610} {"train_loss": -7.35791015625, "global_step": 193634, "epoch": 4610} {"train_loss": -7.243879795074463, "global_step": 193635, "epoch": 4610} {"train_loss": -7.3479509353637695, "global_step": 193636, "epoch": 4610} {"train_loss": -7.344271659851074, "global_step": 193637, "epoch": 4610} {"train_loss": -7.268682479858398, "global_step": 193638, "epoch": 4610} {"train_loss": -7.171224117279053, "global_step": 193639, "epoch": 4610} {"train_loss": -7.275830268859863, "global_step": 193640, "epoch": 4610} {"train_loss": -7.237485408782959, "global_step": 193641, "epoch": 4610} {"train_loss": -7.233884811401367, "global_step": 193642, "epoch": 4610} {"train_loss": -7.173027038574219, "global_step": 193643, "epoch": 4610} {"train_loss": -7.226581573486328, "global_step": 193644, "epoch": 4610} {"train_loss": -7.290251731872559, "global_step": 193645, "epoch": 4610} {"train_loss": -7.281145095825195, "global_step": 193646, "epoch": 4610} {"train_loss": -7.179174900054932, "global_step": 193647, "epoch": 4610} {"train_loss": -7.295456886291504, "global_step": 193648, "epoch": 4610} {"train_loss": -7.180178642272949, "global_step": 193649, "epoch": 4610} {"train_loss": -7.170821189880371, "global_step": 193650, "epoch": 4610} {"train_loss": -7.255468368530273, "global_step": 193651, "epoch": 4610} {"train_loss": -7.327084064483643, "global_step": 193652, "epoch": 4610} {"train_loss": -7.142502307891846, "global_step": 193653, "epoch": 4610} {"train_loss": -7.213263034820557, "global_step": 193654, "epoch": 4610} {"train_loss": -7.230998992919922, "global_step": 193655, "epoch": 4610} {"train_loss": -7.202660083770752, "global_step": 193656, "epoch": 4610} {"train_loss": -7.322701454162598, "global_step": 193657, "epoch": 4610} {"train_loss": -7.230762481689453, "global_step": 193658, "epoch": 4610} {"train_loss": -7.245908737182617, "global_step": 193659, "epoch": 4610} {"train_loss": -7.1975932121276855, "global_step": 193660, "epoch": 4610} {"train_loss": -7.245590221314203, "global_step": 193661, "epoch": 4610, "val_loss": 69791.5859375} {"train_loss": -7.1719794273376465, "global_step": 193662, "epoch": 4611} {"train_loss": -7.138316631317139, "global_step": 193663, "epoch": 4611} {"train_loss": -7.204927444458008, "global_step": 193664, "epoch": 4611} {"train_loss": -7.0914506912231445, "global_step": 193665, "epoch": 4611} {"train_loss": -7.163249969482422, "global_step": 193666, "epoch": 4611} {"train_loss": -7.161584854125977, "global_step": 193667, "epoch": 4611} {"train_loss": -7.181604862213135, "global_step": 193668, "epoch": 4611} {"train_loss": -7.308287620544434, "global_step": 193669, "epoch": 4611} {"train_loss": -7.207276344299316, "global_step": 193670, "epoch": 4611} {"train_loss": -7.132410526275635, "global_step": 193671, "epoch": 4611} {"train_loss": -7.198858261108398, "global_step": 193672, "epoch": 4611} {"train_loss": -7.026650428771973, "global_step": 193673, "epoch": 4611} {"train_loss": -7.052572727203369, "global_step": 193674, "epoch": 4611} {"train_loss": -7.1798834800720215, "global_step": 193675, "epoch": 4611} {"train_loss": -7.081646919250488, "global_step": 193676, "epoch": 4611} {"train_loss": -7.1885271072387695, "global_step": 193677, "epoch": 4611} {"train_loss": -7.0142693519592285, "global_step": 193678, "epoch": 4611} {"train_loss": -7.255941390991211, "global_step": 193679, "epoch": 4611} {"train_loss": -7.175601005554199, "global_step": 193680, "epoch": 4611} {"train_loss": -7.04871129989624, "global_step": 193681, "epoch": 4611} {"train_loss": -7.193686485290527, "global_step": 193682, "epoch": 4611} {"train_loss": -7.052509307861328, "global_step": 193683, "epoch": 4611} {"train_loss": -7.107258319854736, "global_step": 193684, "epoch": 4611} {"train_loss": -7.1574320793151855, "global_step": 193685, "epoch": 4611} {"train_loss": -7.07595157623291, "global_step": 193686, "epoch": 4611} {"train_loss": -7.108391761779785, "global_step": 193687, "epoch": 4611} {"train_loss": -7.134516716003418, "global_step": 193688, "epoch": 4611} {"train_loss": -7.0966691970825195, "global_step": 193689, "epoch": 4611} {"train_loss": -7.136265277862549, "global_step": 193690, "epoch": 4611} {"train_loss": -6.989749908447266, "global_step": 193691, "epoch": 4611} {"train_loss": -6.978026390075684, "global_step": 193692, "epoch": 4611} {"train_loss": -7.286120414733887, "global_step": 193693, "epoch": 4611} {"train_loss": -7.02653694152832, "global_step": 193694, "epoch": 4611} {"train_loss": -7.154688835144043, "global_step": 193695, "epoch": 4611} {"train_loss": -7.044676780700684, "global_step": 193696, "epoch": 4611} {"train_loss": -7.151693344116211, "global_step": 193697, "epoch": 4611} {"train_loss": -7.157483100891113, "global_step": 193698, "epoch": 4611} {"train_loss": -7.113607406616211, "global_step": 193699, "epoch": 4611} {"train_loss": -7.093199729919434, "global_step": 193700, "epoch": 4611} {"train_loss": -7.119619369506836, "global_step": 193701, "epoch": 4611} {"train_loss": -7.149613380432129, "global_step": 193702, "epoch": 4611} {"train_loss": -7.1293526490529375, "global_step": 193703, "epoch": 4611, "val_loss": 69817.8046875} {"train_loss": -6.9946393966674805, "global_step": 193704, "epoch": 4612} {"train_loss": -7.227024078369141, "global_step": 193705, "epoch": 4612} {"train_loss": -7.0842790603637695, "global_step": 193706, "epoch": 4612} {"train_loss": -7.081488132476807, "global_step": 193707, "epoch": 4612} {"train_loss": -7.157611846923828, "global_step": 193708, "epoch": 4612} {"train_loss": -7.141884803771973, "global_step": 193709, "epoch": 4612} {"train_loss": -7.1190996170043945, "global_step": 193710, "epoch": 4612} {"train_loss": -7.069230556488037, "global_step": 193711, "epoch": 4612} {"train_loss": -7.234843730926514, "global_step": 193712, "epoch": 4612} {"train_loss": -7.15650749206543, "global_step": 193713, "epoch": 4612} {"train_loss": -7.218273162841797, "global_step": 193714, "epoch": 4612} {"train_loss": -7.236874580383301, "global_step": 193715, "epoch": 4612} {"train_loss": -7.222806930541992, "global_step": 193716, "epoch": 4612} {"train_loss": -7.2343597412109375, "global_step": 193717, "epoch": 4612} {"train_loss": -7.234148025512695, "global_step": 193718, "epoch": 4612} {"train_loss": -7.20201301574707, "global_step": 193719, "epoch": 4612} {"train_loss": -7.218128204345703, "global_step": 193720, "epoch": 4612} {"train_loss": -7.213406085968018, "global_step": 193721, "epoch": 4612} {"train_loss": -7.271455764770508, "global_step": 193722, "epoch": 4612} {"train_loss": -7.167682647705078, "global_step": 193723, "epoch": 4612} {"train_loss": -7.167530059814453, "global_step": 193724, "epoch": 4612} {"train_loss": -7.31221342086792, "global_step": 193725, "epoch": 4612} {"train_loss": -7.266846656799316, "global_step": 193726, "epoch": 4612} {"train_loss": -7.125101089477539, "global_step": 193727, "epoch": 4612} {"train_loss": -7.281465530395508, "global_step": 193728, "epoch": 4612} {"train_loss": -7.173293113708496, "global_step": 193729, "epoch": 4612} {"train_loss": -7.237096786499023, "global_step": 193730, "epoch": 4612} {"train_loss": -7.309002876281738, "global_step": 193731, "epoch": 4612} {"train_loss": -7.348172187805176, "global_step": 193732, "epoch": 4612} {"train_loss": -7.280963897705078, "global_step": 193733, "epoch": 4612} {"train_loss": -7.190472602844238, "global_step": 193734, "epoch": 4612} {"train_loss": -7.242143630981445, "global_step": 193735, "epoch": 4612} {"train_loss": -7.242679595947266, "global_step": 193736, "epoch": 4612} {"train_loss": -7.2312421798706055, "global_step": 193737, "epoch": 4612} {"train_loss": -7.199329376220703, "global_step": 193738, "epoch": 4612} {"train_loss": -7.162403106689453, "global_step": 193739, "epoch": 4612} {"train_loss": -7.304924964904785, "global_step": 193740, "epoch": 4612} {"train_loss": -7.216184616088867, "global_step": 193741, "epoch": 4612} {"train_loss": -7.268677711486816, "global_step": 193742, "epoch": 4612} {"train_loss": -7.180937767028809, "global_step": 193743, "epoch": 4612} {"train_loss": -7.314286231994629, "global_step": 193744, "epoch": 4612} {"train_loss": -7.209260123116629, "global_step": 193745, "epoch": 4612, "val_loss": 69711.390625} {"train_loss": -7.270699501037598, "global_step": 193746, "epoch": 4613} {"train_loss": -7.208076477050781, "global_step": 193747, "epoch": 4613} {"train_loss": -7.262030601501465, "global_step": 193748, "epoch": 4613} {"train_loss": -7.2819108963012695, "global_step": 193749, "epoch": 4613} {"train_loss": -7.24131965637207, "global_step": 193750, "epoch": 4613} {"train_loss": -7.239633560180664, "global_step": 193751, "epoch": 4613} {"train_loss": -7.2055206298828125, "global_step": 193752, "epoch": 4613} {"train_loss": -7.165463924407959, "global_step": 193753, "epoch": 4613} {"train_loss": -7.291550636291504, "global_step": 193754, "epoch": 4613} {"train_loss": -7.130134105682373, "global_step": 193755, "epoch": 4613} {"train_loss": -7.042896747589111, "global_step": 193756, "epoch": 4613} {"train_loss": -7.196385860443115, "global_step": 193757, "epoch": 4613} {"train_loss": -7.252290725708008, "global_step": 193758, "epoch": 4613} {"train_loss": -7.1648759841918945, "global_step": 193759, "epoch": 4613} {"train_loss": -7.229562759399414, "global_step": 193760, "epoch": 4613} {"train_loss": -7.28266716003418, "global_step": 193761, "epoch": 4613} {"train_loss": -7.304960250854492, "global_step": 193762, "epoch": 4613} {"train_loss": -7.226246356964111, "global_step": 193763, "epoch": 4613} {"train_loss": -7.073258399963379, "global_step": 193764, "epoch": 4613} {"train_loss": -7.133357048034668, "global_step": 193765, "epoch": 4613} {"train_loss": -7.214550971984863, "global_step": 193766, "epoch": 4613} {"train_loss": -7.373434066772461, "global_step": 193767, "epoch": 4613} {"train_loss": -7.223584175109863, "global_step": 193768, "epoch": 4613} {"train_loss": -7.347968101501465, "global_step": 193769, "epoch": 4613} {"train_loss": -7.262290000915527, "global_step": 193770, "epoch": 4613} {"train_loss": -7.251569747924805, "global_step": 193771, "epoch": 4613} {"train_loss": -7.2464823722839355, "global_step": 193772, "epoch": 4613} {"train_loss": -7.236629486083984, "global_step": 193773, "epoch": 4613} {"train_loss": -7.288485527038574, "global_step": 193774, "epoch": 4613} {"train_loss": -7.244233131408691, "global_step": 193775, "epoch": 4613} {"train_loss": -7.221157073974609, "global_step": 193776, "epoch": 4613} {"train_loss": -7.258397102355957, "global_step": 193777, "epoch": 4613} {"train_loss": -7.273182392120361, "global_step": 193778, "epoch": 4613} {"train_loss": -7.240531921386719, "global_step": 193779, "epoch": 4613} {"train_loss": -7.285431861877441, "global_step": 193780, "epoch": 4613} {"train_loss": -7.112984657287598, "global_step": 193781, "epoch": 4613} {"train_loss": -7.269158840179443, "global_step": 193782, "epoch": 4613} {"train_loss": -7.280492782592773, "global_step": 193783, "epoch": 4613} {"train_loss": -7.249231815338135, "global_step": 193784, "epoch": 4613} {"train_loss": -7.35001277923584, "global_step": 193785, "epoch": 4613} {"train_loss": -7.138991832733154, "global_step": 193786, "epoch": 4613} {"train_loss": -7.231777588526408, "global_step": 193787, "epoch": 4613, "val_loss": 69893.6875} {"train_loss": -7.268311500549316, "global_step": 193788, "epoch": 4614} {"train_loss": -7.132888317108154, "global_step": 193789, "epoch": 4614} {"train_loss": -7.17965841293335, "global_step": 193790, "epoch": 4614} {"train_loss": -7.185075759887695, "global_step": 193791, "epoch": 4614} {"train_loss": -7.209359169006348, "global_step": 193792, "epoch": 4614} {"train_loss": -7.112235069274902, "global_step": 193793, "epoch": 4614} {"train_loss": -7.20482063293457, "global_step": 193794, "epoch": 4614} {"train_loss": -7.113951683044434, "global_step": 193795, "epoch": 4614} {"train_loss": -7.322067737579346, "global_step": 193796, "epoch": 4614} {"train_loss": -7.1999101638793945, "global_step": 193797, "epoch": 4614} {"train_loss": -7.33721923828125, "global_step": 193798, "epoch": 4614} {"train_loss": -7.175101280212402, "global_step": 193799, "epoch": 4614} {"train_loss": -7.122776508331299, "global_step": 193800, "epoch": 4614} {"train_loss": -7.246593475341797, "global_step": 193801, "epoch": 4614} {"train_loss": -7.152576446533203, "global_step": 193802, "epoch": 4614} {"train_loss": -7.206189155578613, "global_step": 193803, "epoch": 4614} {"train_loss": -7.1840667724609375, "global_step": 193804, "epoch": 4614} {"train_loss": -7.248546600341797, "global_step": 193805, "epoch": 4614} {"train_loss": -7.204148769378662, "global_step": 193806, "epoch": 4614} {"train_loss": -7.223162651062012, "global_step": 193807, "epoch": 4614} {"train_loss": -7.301860809326172, "global_step": 193808, "epoch": 4614} {"train_loss": -7.260148525238037, "global_step": 193809, "epoch": 4614} {"train_loss": -7.19495964050293, "global_step": 193810, "epoch": 4614} {"train_loss": -7.241067886352539, "global_step": 193811, "epoch": 4614} {"train_loss": -7.245948791503906, "global_step": 193812, "epoch": 4614} {"train_loss": -7.251955986022949, "global_step": 193813, "epoch": 4614} {"train_loss": -7.170283317565918, "global_step": 193814, "epoch": 4614} {"train_loss": -7.223600387573242, "global_step": 193815, "epoch": 4614} {"train_loss": -7.20328950881958, "global_step": 193816, "epoch": 4614} {"train_loss": -7.153553009033203, "global_step": 193817, "epoch": 4614} {"train_loss": -7.301369667053223, "global_step": 193818, "epoch": 4614} {"train_loss": -7.242732524871826, "global_step": 193819, "epoch": 4614} {"train_loss": -7.249979019165039, "global_step": 193820, "epoch": 4614} {"train_loss": -7.306116104125977, "global_step": 193821, "epoch": 4614} {"train_loss": -7.066862106323242, "global_step": 193822, "epoch": 4614} {"train_loss": -7.2592573165893555, "global_step": 193823, "epoch": 4614} {"train_loss": -7.236356735229492, "global_step": 193824, "epoch": 4614} {"train_loss": -7.23097562789917, "global_step": 193825, "epoch": 4614} {"train_loss": -7.215996742248535, "global_step": 193826, "epoch": 4614} {"train_loss": -7.33051872253418, "global_step": 193827, "epoch": 4614} {"train_loss": -7.303789138793945, "global_step": 193828, "epoch": 4614} {"train_loss": -7.2211610816773915, "global_step": 193829, "epoch": 4614, "val_loss": 69740.8203125} {"train_loss": -7.341251373291016, "global_step": 193830, "epoch": 4615} {"train_loss": -7.1928815841674805, "global_step": 193831, "epoch": 4615} {"train_loss": -7.221497535705566, "global_step": 193832, "epoch": 4615} {"train_loss": -7.273526668548584, "global_step": 193833, "epoch": 4615} {"train_loss": -7.263751983642578, "global_step": 193834, "epoch": 4615} {"train_loss": -7.274896144866943, "global_step": 193835, "epoch": 4615} {"train_loss": -7.327133655548096, "global_step": 193836, "epoch": 4615} {"train_loss": -7.3433732986450195, "global_step": 193837, "epoch": 4615} {"train_loss": -7.310145378112793, "global_step": 193838, "epoch": 4615} {"train_loss": -7.1090087890625, "global_step": 193839, "epoch": 4615} {"train_loss": -7.29356575012207, "global_step": 193840, "epoch": 4615} {"train_loss": -7.316330909729004, "global_step": 193841, "epoch": 4615} {"train_loss": -7.244393348693848, "global_step": 193842, "epoch": 4615} {"train_loss": -7.223478317260742, "global_step": 193843, "epoch": 4615} {"train_loss": -7.143174648284912, "global_step": 193844, "epoch": 4615} {"train_loss": -7.245354652404785, "global_step": 193845, "epoch": 4615} {"train_loss": -7.051304817199707, "global_step": 193846, "epoch": 4615} {"train_loss": -7.099732398986816, "global_step": 193847, "epoch": 4615} {"train_loss": -7.1065521240234375, "global_step": 193848, "epoch": 4615} {"train_loss": -6.975257873535156, "global_step": 193849, "epoch": 4615} {"train_loss": -7.237710952758789, "global_step": 193850, "epoch": 4615} {"train_loss": -7.082653522491455, "global_step": 193851, "epoch": 4615} {"train_loss": -7.1007280349731445, "global_step": 193852, "epoch": 4615} {"train_loss": -7.241617202758789, "global_step": 193853, "epoch": 4615} {"train_loss": -7.068632125854492, "global_step": 193854, "epoch": 4615} {"train_loss": -7.211823463439941, "global_step": 193855, "epoch": 4615} {"train_loss": -7.128307342529297, "global_step": 193856, "epoch": 4615} {"train_loss": -7.253315448760986, "global_step": 193857, "epoch": 4615} {"train_loss": -7.177417755126953, "global_step": 193858, "epoch": 4615} {"train_loss": -7.190452575683594, "global_step": 193859, "epoch": 4615} {"train_loss": -7.074942588806152, "global_step": 193860, "epoch": 4615} {"train_loss": -7.190840244293213, "global_step": 193861, "epoch": 4615} {"train_loss": -7.243778228759766, "global_step": 193862, "epoch": 4615} {"train_loss": -7.155994892120361, "global_step": 193863, "epoch": 4615} {"train_loss": -7.237656593322754, "global_step": 193864, "epoch": 4615} {"train_loss": -7.168544769287109, "global_step": 193865, "epoch": 4615} {"train_loss": -7.1691741943359375, "global_step": 193866, "epoch": 4615} {"train_loss": -7.181780815124512, "global_step": 193867, "epoch": 4615} {"train_loss": -7.154144763946533, "global_step": 193868, "epoch": 4615} {"train_loss": -7.114274978637695, "global_step": 193869, "epoch": 4615} {"train_loss": -7.25793981552124, "global_step": 193870, "epoch": 4615} {"train_loss": -7.1940345877692815, "global_step": 193871, "epoch": 4615, "val_loss": 69736.2890625} {"train_loss": -7.225854873657227, "global_step": 193872, "epoch": 4616} {"train_loss": -7.283185005187988, "global_step": 193873, "epoch": 4616} {"train_loss": -7.264946937561035, "global_step": 193874, "epoch": 4616} {"train_loss": -7.2310991287231445, "global_step": 193875, "epoch": 4616} {"train_loss": -7.333924293518066, "global_step": 193876, "epoch": 4616} {"train_loss": -7.310178756713867, "global_step": 193877, "epoch": 4616} {"train_loss": -7.22650146484375, "global_step": 193878, "epoch": 4616} {"train_loss": -7.262421607971191, "global_step": 193879, "epoch": 4616} {"train_loss": -7.153926372528076, "global_step": 193880, "epoch": 4616} {"train_loss": -7.189016342163086, "global_step": 193881, "epoch": 4616} {"train_loss": -7.113734245300293, "global_step": 193882, "epoch": 4616} {"train_loss": -7.2462968826293945, "global_step": 193883, "epoch": 4616} {"train_loss": -7.153937816619873, "global_step": 193884, "epoch": 4616} {"train_loss": -7.22554349899292, "global_step": 193885, "epoch": 4616} {"train_loss": -7.30366325378418, "global_step": 193886, "epoch": 4616} {"train_loss": -7.17581844329834, "global_step": 193887, "epoch": 4616} {"train_loss": -7.353672027587891, "global_step": 193888, "epoch": 4616} {"train_loss": -7.072933197021484, "global_step": 193889, "epoch": 4616} {"train_loss": -7.1951775550842285, "global_step": 193890, "epoch": 4616} {"train_loss": -7.264204025268555, "global_step": 193891, "epoch": 4616} {"train_loss": -7.152587890625, "global_step": 193892, "epoch": 4616} {"train_loss": -7.3534040451049805, "global_step": 193893, "epoch": 4616} {"train_loss": -7.247115135192871, "global_step": 193894, "epoch": 4616} {"train_loss": -7.219537734985352, "global_step": 193895, "epoch": 4616} {"train_loss": -7.211941719055176, "global_step": 193896, "epoch": 4616} {"train_loss": -7.185427665710449, "global_step": 193897, "epoch": 4616} {"train_loss": -7.178889751434326, "global_step": 193898, "epoch": 4616} {"train_loss": -7.172918319702148, "global_step": 193899, "epoch": 4616} {"train_loss": -7.228781700134277, "global_step": 193900, "epoch": 4616} {"train_loss": -7.189728260040283, "global_step": 193901, "epoch": 4616} {"train_loss": -7.163180351257324, "global_step": 193902, "epoch": 4616} {"train_loss": -7.2327165603637695, "global_step": 193903, "epoch": 4616} {"train_loss": -7.110411643981934, "global_step": 193904, "epoch": 4616} {"train_loss": -7.05866813659668, "global_step": 193905, "epoch": 4616} {"train_loss": -7.105725288391113, "global_step": 193906, "epoch": 4616} {"train_loss": -7.218562602996826, "global_step": 193907, "epoch": 4616} {"train_loss": -7.068752288818359, "global_step": 193908, "epoch": 4616} {"train_loss": -7.138576030731201, "global_step": 193909, "epoch": 4616} {"train_loss": -7.318726539611816, "global_step": 193910, "epoch": 4616} {"train_loss": -7.140353202819824, "global_step": 193911, "epoch": 4616} {"train_loss": -7.096626281738281, "global_step": 193912, "epoch": 4616} {"train_loss": -7.204264981406076, "global_step": 193913, "epoch": 4616, "val_loss": 69884.859375} {"train_loss": -7.2010579109191895, "global_step": 193914, "epoch": 4617} {"train_loss": -7.168298721313477, "global_step": 193915, "epoch": 4617} {"train_loss": -7.168694496154785, "global_step": 193916, "epoch": 4617} {"train_loss": -7.1939802169799805, "global_step": 193917, "epoch": 4617} {"train_loss": -7.116265296936035, "global_step": 193918, "epoch": 4617} {"train_loss": -7.163025856018066, "global_step": 193919, "epoch": 4617} {"train_loss": -7.151943206787109, "global_step": 193920, "epoch": 4617} {"train_loss": -7.048503875732422, "global_step": 193921, "epoch": 4617} {"train_loss": -7.1273908615112305, "global_step": 193922, "epoch": 4617} {"train_loss": -7.134781837463379, "global_step": 193923, "epoch": 4617} {"train_loss": -7.233622074127197, "global_step": 193924, "epoch": 4617} {"train_loss": -7.123273849487305, "global_step": 193925, "epoch": 4617} {"train_loss": -7.206669807434082, "global_step": 193926, "epoch": 4617} {"train_loss": -7.076831817626953, "global_step": 193927, "epoch": 4617} {"train_loss": -7.2142181396484375, "global_step": 193928, "epoch": 4617} {"train_loss": -7.096449375152588, "global_step": 193929, "epoch": 4617} {"train_loss": -7.128081798553467, "global_step": 193930, "epoch": 4617} {"train_loss": -7.173675060272217, "global_step": 193931, "epoch": 4617} {"train_loss": -7.223194122314453, "global_step": 193932, "epoch": 4617} {"train_loss": -7.28555154800415, "global_step": 193933, "epoch": 4617} {"train_loss": -7.22304630279541, "global_step": 193934, "epoch": 4617} {"train_loss": -7.233236789703369, "global_step": 193935, "epoch": 4617} {"train_loss": -7.133554935455322, "global_step": 193936, "epoch": 4617} {"train_loss": -7.1248087882995605, "global_step": 193937, "epoch": 4617} {"train_loss": -7.2148637771606445, "global_step": 193938, "epoch": 4617} {"train_loss": -7.220769882202148, "global_step": 193939, "epoch": 4617} {"train_loss": -7.236766815185547, "global_step": 193940, "epoch": 4617} {"train_loss": -7.182516574859619, "global_step": 193941, "epoch": 4617} {"train_loss": -7.105135917663574, "global_step": 193942, "epoch": 4617} {"train_loss": -7.277713775634766, "global_step": 193943, "epoch": 4617} {"train_loss": -7.27827787399292, "global_step": 193944, "epoch": 4617} {"train_loss": -7.125937461853027, "global_step": 193945, "epoch": 4617} {"train_loss": -7.12319278717041, "global_step": 193946, "epoch": 4617} {"train_loss": -7.193615913391113, "global_step": 193947, "epoch": 4617} {"train_loss": -7.264978408813477, "global_step": 193948, "epoch": 4617} {"train_loss": -7.185733795166016, "global_step": 193949, "epoch": 4617} {"train_loss": -7.183743000030518, "global_step": 193950, "epoch": 4617} {"train_loss": -7.279310703277588, "global_step": 193951, "epoch": 4617} {"train_loss": -7.16873836517334, "global_step": 193952, "epoch": 4617} {"train_loss": -7.255777359008789, "global_step": 193953, "epoch": 4617} {"train_loss": -7.231886863708496, "global_step": 193954, "epoch": 4617} {"train_loss": -7.185299146743048, "global_step": 193955, "epoch": 4617, "val_loss": 69659.0625} {"train_loss": -7.2576704025268555, "global_step": 193956, "epoch": 4618} {"train_loss": -7.1172895431518555, "global_step": 193957, "epoch": 4618} {"train_loss": -7.235163688659668, "global_step": 193958, "epoch": 4618} {"train_loss": -7.285030364990234, "global_step": 193959, "epoch": 4618} {"train_loss": -7.30484676361084, "global_step": 193960, "epoch": 4618} {"train_loss": -7.309659481048584, "global_step": 193961, "epoch": 4618} {"train_loss": -7.162990570068359, "global_step": 193962, "epoch": 4618} {"train_loss": -7.202627658843994, "global_step": 193963, "epoch": 4618} {"train_loss": -7.198534965515137, "global_step": 193964, "epoch": 4618} {"train_loss": -7.099909782409668, "global_step": 193965, "epoch": 4618} {"train_loss": -7.047975540161133, "global_step": 193966, "epoch": 4618} {"train_loss": -7.264220237731934, "global_step": 193967, "epoch": 4618} {"train_loss": -7.147287845611572, "global_step": 193968, "epoch": 4618} {"train_loss": -7.1654276847839355, "global_step": 193969, "epoch": 4618} {"train_loss": -7.181604385375977, "global_step": 193970, "epoch": 4618} {"train_loss": -7.157096862792969, "global_step": 193971, "epoch": 4618} {"train_loss": -7.1118059158325195, "global_step": 193972, "epoch": 4618} {"train_loss": -7.134878158569336, "global_step": 193973, "epoch": 4618} {"train_loss": -7.198375701904297, "global_step": 193974, "epoch": 4618} {"train_loss": -7.013052940368652, "global_step": 193975, "epoch": 4618} {"train_loss": -7.229471206665039, "global_step": 193976, "epoch": 4618} {"train_loss": -7.228816986083984, "global_step": 193977, "epoch": 4618} {"train_loss": -7.173332214355469, "global_step": 193978, "epoch": 4618} {"train_loss": -7.134746074676514, "global_step": 193979, "epoch": 4618} {"train_loss": -7.196206092834473, "global_step": 193980, "epoch": 4618} {"train_loss": -7.25203800201416, "global_step": 193981, "epoch": 4618} {"train_loss": -7.084055423736572, "global_step": 193982, "epoch": 4618} {"train_loss": -7.200283527374268, "global_step": 193983, "epoch": 4618} {"train_loss": -7.18704891204834, "global_step": 193984, "epoch": 4618} {"train_loss": -7.124752998352051, "global_step": 193985, "epoch": 4618} {"train_loss": -7.308032035827637, "global_step": 193986, "epoch": 4618} {"train_loss": -7.288585186004639, "global_step": 193987, "epoch": 4618} {"train_loss": -7.294767379760742, "global_step": 193988, "epoch": 4618} {"train_loss": -7.308239936828613, "global_step": 193989, "epoch": 4618} {"train_loss": -7.254701137542725, "global_step": 193990, "epoch": 4618} {"train_loss": -7.279314041137695, "global_step": 193991, "epoch": 4618} {"train_loss": -7.17594575881958, "global_step": 193992, "epoch": 4618} {"train_loss": -7.2286224365234375, "global_step": 193993, "epoch": 4618} {"train_loss": -7.22834587097168, "global_step": 193994, "epoch": 4618} {"train_loss": -7.222095489501953, "global_step": 193995, "epoch": 4618} {"train_loss": -7.283921241760254, "global_step": 193996, "epoch": 4618} {"train_loss": -7.203640006837391, "global_step": 193997, "epoch": 4618, "val_loss": 69534.296875} {"train_loss": -7.3357696533203125, "global_step": 193998, "epoch": 4619} {"train_loss": -7.203492641448975, "global_step": 193999, "epoch": 4619} {"train_loss": -7.176173210144043, "global_step": 194000, "epoch": 4619} {"train_loss": -7.1671648025512695, "global_step": 194001, "epoch": 4619} {"train_loss": -7.067162990570068, "global_step": 194002, "epoch": 4619} {"train_loss": -7.132510185241699, "global_step": 194003, "epoch": 4619} {"train_loss": -7.1718034744262695, "global_step": 194004, "epoch": 4619} {"train_loss": -7.15676736831665, "global_step": 194005, "epoch": 4619} {"train_loss": -7.226061820983887, "global_step": 194006, "epoch": 4619} {"train_loss": -7.193571090698242, "global_step": 194007, "epoch": 4619} {"train_loss": -7.133389949798584, "global_step": 194008, "epoch": 4619} {"train_loss": -7.217039585113525, "global_step": 194009, "epoch": 4619} {"train_loss": -7.171528339385986, "global_step": 194010, "epoch": 4619} {"train_loss": -7.104242324829102, "global_step": 194011, "epoch": 4619} {"train_loss": -7.247892379760742, "global_step": 194012, "epoch": 4619} {"train_loss": -7.133733749389648, "global_step": 194013, "epoch": 4619} {"train_loss": -7.223794460296631, "global_step": 194014, "epoch": 4619} {"train_loss": -7.04134464263916, "global_step": 194015, "epoch": 4619} {"train_loss": -7.1336469650268555, "global_step": 194016, "epoch": 4619} {"train_loss": -7.161871433258057, "global_step": 194017, "epoch": 4619} {"train_loss": -7.181491851806641, "global_step": 194018, "epoch": 4619} {"train_loss": -7.338438034057617, "global_step": 194019, "epoch": 4619} {"train_loss": -7.254502296447754, "global_step": 194020, "epoch": 4619} {"train_loss": -7.218991279602051, "global_step": 194021, "epoch": 4619} {"train_loss": -7.243114471435547, "global_step": 194022, "epoch": 4619} {"train_loss": -7.239205360412598, "global_step": 194023, "epoch": 4619} {"train_loss": -7.2883758544921875, "global_step": 194024, "epoch": 4619} {"train_loss": -7.1192474365234375, "global_step": 194025, "epoch": 4619} {"train_loss": -7.139805793762207, "global_step": 194026, "epoch": 4619} {"train_loss": -7.23929500579834, "global_step": 194027, "epoch": 4619} {"train_loss": -7.280680179595947, "global_step": 194028, "epoch": 4619} {"train_loss": -7.243206024169922, "global_step": 194029, "epoch": 4619} {"train_loss": -7.155276775360107, "global_step": 194030, "epoch": 4619} {"train_loss": -7.359785079956055, "global_step": 194031, "epoch": 4619} {"train_loss": -7.243229866027832, "global_step": 194032, "epoch": 4619} {"train_loss": -7.16172981262207, "global_step": 194033, "epoch": 4619} {"train_loss": -7.327251434326172, "global_step": 194034, "epoch": 4619} {"train_loss": -7.188337802886963, "global_step": 194035, "epoch": 4619} {"train_loss": -7.199002742767334, "global_step": 194036, "epoch": 4619} {"train_loss": -7.12143611907959, "global_step": 194037, "epoch": 4619} {"train_loss": -7.234358787536621, "global_step": 194038, "epoch": 4619} {"train_loss": -7.197901248931885, "global_step": 194039, "epoch": 4619, "val_loss": 69776.21875} {"train_loss": -7.162972927093506, "global_step": 194040, "epoch": 4620} {"train_loss": -7.323237419128418, "global_step": 194041, "epoch": 4620} {"train_loss": -7.202025413513184, "global_step": 194042, "epoch": 4620} {"train_loss": -7.198055267333984, "global_step": 194043, "epoch": 4620} {"train_loss": -7.326373100280762, "global_step": 194044, "epoch": 4620} {"train_loss": -7.3342390060424805, "global_step": 194045, "epoch": 4620} {"train_loss": -7.171154975891113, "global_step": 194046, "epoch": 4620} {"train_loss": -7.264002323150635, "global_step": 194047, "epoch": 4620} {"train_loss": -7.325089454650879, "global_step": 194048, "epoch": 4620} {"train_loss": -7.180964469909668, "global_step": 194049, "epoch": 4620} {"train_loss": -7.233038425445557, "global_step": 194050, "epoch": 4620} {"train_loss": -7.2618584632873535, "global_step": 194051, "epoch": 4620} {"train_loss": -7.103355884552002, "global_step": 194052, "epoch": 4620} {"train_loss": -7.245862007141113, "global_step": 194053, "epoch": 4620} {"train_loss": -7.2298688888549805, "global_step": 194054, "epoch": 4620} {"train_loss": -7.1504621505737305, "global_step": 194055, "epoch": 4620} {"train_loss": -7.208690166473389, "global_step": 194056, "epoch": 4620} {"train_loss": -7.263406753540039, "global_step": 194057, "epoch": 4620} {"train_loss": -7.138655185699463, "global_step": 194058, "epoch": 4620} {"train_loss": -7.1649065017700195, "global_step": 194059, "epoch": 4620} {"train_loss": -7.241909027099609, "global_step": 194060, "epoch": 4620} {"train_loss": -7.268459320068359, "global_step": 194061, "epoch": 4620} {"train_loss": -7.231153964996338, "global_step": 194062, "epoch": 4620} {"train_loss": -7.254733085632324, "global_step": 194063, "epoch": 4620} {"train_loss": -7.18560791015625, "global_step": 194064, "epoch": 4620} {"train_loss": -7.390969276428223, "global_step": 194065, "epoch": 4620} {"train_loss": -7.276112079620361, "global_step": 194066, "epoch": 4620} {"train_loss": -7.335616111755371, "global_step": 194067, "epoch": 4620} {"train_loss": -7.199090003967285, "global_step": 194068, "epoch": 4620} {"train_loss": -7.358982086181641, "global_step": 194069, "epoch": 4620} {"train_loss": -7.340888977050781, "global_step": 194070, "epoch": 4620} {"train_loss": -7.272178649902344, "global_step": 194071, "epoch": 4620} {"train_loss": -7.328168869018555, "global_step": 194072, "epoch": 4620} {"train_loss": -7.239952564239502, "global_step": 194073, "epoch": 4620} {"train_loss": -7.1750712394714355, "global_step": 194074, "epoch": 4620} {"train_loss": -7.233864784240723, "global_step": 194075, "epoch": 4620} {"train_loss": -7.292923927307129, "global_step": 194076, "epoch": 4620} {"train_loss": -7.294602394104004, "global_step": 194077, "epoch": 4620} {"train_loss": -7.254096984863281, "global_step": 194078, "epoch": 4620} {"train_loss": -7.240882873535156, "global_step": 194079, "epoch": 4620} {"train_loss": -7.306361675262451, "global_step": 194080, "epoch": 4620} {"train_loss": -7.246364911397298, "global_step": 194081, "epoch": 4620, "val_loss": 69614.046875} {"train_loss": -7.252496719360352, "global_step": 194082, "epoch": 4621} {"train_loss": -7.271709442138672, "global_step": 194083, "epoch": 4621} {"train_loss": -7.152596473693848, "global_step": 194084, "epoch": 4621} {"train_loss": -7.198225498199463, "global_step": 194085, "epoch": 4621} {"train_loss": -7.290153503417969, "global_step": 194086, "epoch": 4621} {"train_loss": -7.2155985832214355, "global_step": 194087, "epoch": 4621} {"train_loss": -7.202587127685547, "global_step": 194088, "epoch": 4621} {"train_loss": -7.224813461303711, "global_step": 194089, "epoch": 4621} {"train_loss": -7.19643497467041, "global_step": 194090, "epoch": 4621} {"train_loss": -7.260148525238037, "global_step": 194091, "epoch": 4621} {"train_loss": -7.254561901092529, "global_step": 194092, "epoch": 4621} {"train_loss": -7.119466781616211, "global_step": 194093, "epoch": 4621} {"train_loss": -7.322466850280762, "global_step": 194094, "epoch": 4621} {"train_loss": -7.2298455238342285, "global_step": 194095, "epoch": 4621} {"train_loss": -7.183045864105225, "global_step": 194096, "epoch": 4621} {"train_loss": -7.355707168579102, "global_step": 194097, "epoch": 4621} {"train_loss": -7.244339942932129, "global_step": 194098, "epoch": 4621} {"train_loss": -7.325413703918457, "global_step": 194099, "epoch": 4621} {"train_loss": -7.21978759765625, "global_step": 194100, "epoch": 4621} {"train_loss": -7.326429843902588, "global_step": 194101, "epoch": 4621} {"train_loss": -7.277493476867676, "global_step": 194102, "epoch": 4621} {"train_loss": -7.225513458251953, "global_step": 194103, "epoch": 4621} {"train_loss": -7.193968772888184, "global_step": 194104, "epoch": 4621} {"train_loss": -7.1958513259887695, "global_step": 194105, "epoch": 4621} {"train_loss": -7.300942420959473, "global_step": 194106, "epoch": 4621} {"train_loss": -7.170113563537598, "global_step": 194107, "epoch": 4621} {"train_loss": -7.1586689949035645, "global_step": 194108, "epoch": 4621} {"train_loss": -7.234325408935547, "global_step": 194109, "epoch": 4621} {"train_loss": -7.252579689025879, "global_step": 194110, "epoch": 4621} {"train_loss": -7.222169399261475, "global_step": 194111, "epoch": 4621} {"train_loss": -7.273463249206543, "global_step": 194112, "epoch": 4621} {"train_loss": -7.093510627746582, "global_step": 194113, "epoch": 4621} {"train_loss": -7.175230026245117, "global_step": 194114, "epoch": 4621} {"train_loss": -7.212612152099609, "global_step": 194115, "epoch": 4621} {"train_loss": -7.21940803527832, "global_step": 194116, "epoch": 4621} {"train_loss": -7.2440290451049805, "global_step": 194117, "epoch": 4621} {"train_loss": -7.332786560058594, "global_step": 194118, "epoch": 4621} {"train_loss": -7.203225135803223, "global_step": 194119, "epoch": 4621} {"train_loss": -7.276638031005859, "global_step": 194120, "epoch": 4621} {"train_loss": -7.322333812713623, "global_step": 194121, "epoch": 4621} {"train_loss": -7.1604695320129395, "global_step": 194122, "epoch": 4621} {"train_loss": -7.230387619563511, "global_step": 194123, "epoch": 4621, "val_loss": 69726.4453125} {"train_loss": -7.27127742767334, "global_step": 194124, "epoch": 4622} {"train_loss": -7.151333808898926, "global_step": 194125, "epoch": 4622} {"train_loss": -7.213722229003906, "global_step": 194126, "epoch": 4622} {"train_loss": -7.387331008911133, "global_step": 194127, "epoch": 4622} {"train_loss": -7.294973373413086, "global_step": 194128, "epoch": 4622} {"train_loss": -7.321107864379883, "global_step": 194129, "epoch": 4622} {"train_loss": -7.3486433029174805, "global_step": 194130, "epoch": 4622} {"train_loss": -7.426487445831299, "global_step": 194131, "epoch": 4622} {"train_loss": -7.186833381652832, "global_step": 194132, "epoch": 4622} {"train_loss": -7.399989604949951, "global_step": 194133, "epoch": 4622} {"train_loss": -7.2131805419921875, "global_step": 194134, "epoch": 4622} {"train_loss": -7.265178680419922, "global_step": 194135, "epoch": 4622} {"train_loss": -7.331322193145752, "global_step": 194136, "epoch": 4622} {"train_loss": -7.317567825317383, "global_step": 194137, "epoch": 4622} {"train_loss": -7.337276458740234, "global_step": 194138, "epoch": 4622} {"train_loss": -7.3081488609313965, "global_step": 194139, "epoch": 4622} {"train_loss": -7.347334384918213, "global_step": 194140, "epoch": 4622} {"train_loss": -7.2334160804748535, "global_step": 194141, "epoch": 4622} {"train_loss": -7.2464165687561035, "global_step": 194142, "epoch": 4622} {"train_loss": -7.220961093902588, "global_step": 194143, "epoch": 4622} {"train_loss": -7.305166721343994, "global_step": 194144, "epoch": 4622} {"train_loss": -7.156383514404297, "global_step": 194145, "epoch": 4622} {"train_loss": -7.176689624786377, "global_step": 194146, "epoch": 4622} {"train_loss": -7.1735734939575195, "global_step": 194147, "epoch": 4622} {"train_loss": -7.247878074645996, "global_step": 194148, "epoch": 4622} {"train_loss": -7.199863433837891, "global_step": 194149, "epoch": 4622} {"train_loss": -7.204191207885742, "global_step": 194150, "epoch": 4622} {"train_loss": -7.283919334411621, "global_step": 194151, "epoch": 4622} {"train_loss": -7.1358795166015625, "global_step": 194152, "epoch": 4622} {"train_loss": -7.277296543121338, "global_step": 194153, "epoch": 4622} {"train_loss": -7.255443572998047, "global_step": 194154, "epoch": 4622} {"train_loss": -7.117334365844727, "global_step": 194155, "epoch": 4622} {"train_loss": -7.162966728210449, "global_step": 194156, "epoch": 4622} {"train_loss": -7.227426528930664, "global_step": 194157, "epoch": 4622} {"train_loss": -7.190746307373047, "global_step": 194158, "epoch": 4622} {"train_loss": -7.180741310119629, "global_step": 194159, "epoch": 4622} {"train_loss": -7.173482418060303, "global_step": 194160, "epoch": 4622} {"train_loss": -7.164943695068359, "global_step": 194161, "epoch": 4622} {"train_loss": -7.120048999786377, "global_step": 194162, "epoch": 4622} {"train_loss": -7.058045387268066, "global_step": 194163, "epoch": 4622} {"train_loss": -7.220376014709473, "global_step": 194164, "epoch": 4622} {"train_loss": -7.23421049118042, "global_step": 194165, "epoch": 4622, "val_loss": 69668.546875} {"train_loss": -7.071397304534912, "global_step": 194166, "epoch": 4623} {"train_loss": -7.180337905883789, "global_step": 194167, "epoch": 4623} {"train_loss": -6.984931945800781, "global_step": 194168, "epoch": 4623} {"train_loss": -7.1692986488342285, "global_step": 194169, "epoch": 4623} {"train_loss": -7.008852005004883, "global_step": 194170, "epoch": 4623} {"train_loss": -7.211569786071777, "global_step": 194171, "epoch": 4623} {"train_loss": -7.028543949127197, "global_step": 194172, "epoch": 4623} {"train_loss": -7.227202415466309, "global_step": 194173, "epoch": 4623} {"train_loss": -7.155191898345947, "global_step": 194174, "epoch": 4623} {"train_loss": -7.123537540435791, "global_step": 194175, "epoch": 4623} {"train_loss": -7.108039855957031, "global_step": 194176, "epoch": 4623} {"train_loss": -7.159905910491943, "global_step": 194177, "epoch": 4623} {"train_loss": -7.2309184074401855, "global_step": 194178, "epoch": 4623} {"train_loss": -7.16261100769043, "global_step": 194179, "epoch": 4623} {"train_loss": -7.186387538909912, "global_step": 194180, "epoch": 4623} {"train_loss": -7.295772552490234, "global_step": 194181, "epoch": 4623} {"train_loss": -7.150330543518066, "global_step": 194182, "epoch": 4623} {"train_loss": -7.205032825469971, "global_step": 194183, "epoch": 4623} {"train_loss": -7.175210952758789, "global_step": 194184, "epoch": 4623} {"train_loss": -7.250670433044434, "global_step": 194185, "epoch": 4623} {"train_loss": -7.150519371032715, "global_step": 194186, "epoch": 4623} {"train_loss": -7.1822404861450195, "global_step": 194187, "epoch": 4623} {"train_loss": -7.106416702270508, "global_step": 194188, "epoch": 4623} {"train_loss": -7.090665817260742, "global_step": 194189, "epoch": 4623} {"train_loss": -7.083652019500732, "global_step": 194190, "epoch": 4623} {"train_loss": -7.171712398529053, "global_step": 194191, "epoch": 4623} {"train_loss": -7.019808292388916, "global_step": 194192, "epoch": 4623} {"train_loss": -7.20190954208374, "global_step": 194193, "epoch": 4623} {"train_loss": -7.2182512283325195, "global_step": 194194, "epoch": 4623} {"train_loss": -7.043238639831543, "global_step": 194195, "epoch": 4623} {"train_loss": -7.260331153869629, "global_step": 194196, "epoch": 4623} {"train_loss": -7.061702251434326, "global_step": 194197, "epoch": 4623} {"train_loss": -7.205418109893799, "global_step": 194198, "epoch": 4623} {"train_loss": -6.986550807952881, "global_step": 194199, "epoch": 4623} {"train_loss": -7.136623382568359, "global_step": 194200, "epoch": 4623} {"train_loss": -7.231652736663818, "global_step": 194201, "epoch": 4623} {"train_loss": -7.2094197273254395, "global_step": 194202, "epoch": 4623} {"train_loss": -7.1999006271362305, "global_step": 194203, "epoch": 4623} {"train_loss": -7.240532875061035, "global_step": 194204, "epoch": 4623} {"train_loss": -7.246557235717773, "global_step": 194205, "epoch": 4623} {"train_loss": -7.204920291900635, "global_step": 194206, "epoch": 4623} {"train_loss": -7.15576864424206, "global_step": 194207, "epoch": 4623, "val_loss": 69615.7578125} {"train_loss": -7.197727203369141, "global_step": 194208, "epoch": 4624} {"train_loss": -7.369626045227051, "global_step": 194209, "epoch": 4624} {"train_loss": -7.154119491577148, "global_step": 194210, "epoch": 4624} {"train_loss": -7.2442779541015625, "global_step": 194211, "epoch": 4624} {"train_loss": -7.265895843505859, "global_step": 194212, "epoch": 4624} {"train_loss": -7.250990867614746, "global_step": 194213, "epoch": 4624} {"train_loss": -7.262096405029297, "global_step": 194214, "epoch": 4624} {"train_loss": -7.162278175354004, "global_step": 194215, "epoch": 4624} {"train_loss": -7.369385242462158, "global_step": 194216, "epoch": 4624} {"train_loss": -7.310511589050293, "global_step": 194217, "epoch": 4624} {"train_loss": -7.259708881378174, "global_step": 194218, "epoch": 4624} {"train_loss": -7.231029510498047, "global_step": 194219, "epoch": 4624} {"train_loss": -7.286848068237305, "global_step": 194220, "epoch": 4624} {"train_loss": -7.257144451141357, "global_step": 194221, "epoch": 4624} {"train_loss": -7.193516731262207, "global_step": 194222, "epoch": 4624} {"train_loss": -7.319387435913086, "global_step": 194223, "epoch": 4624} {"train_loss": -7.242554187774658, "global_step": 194224, "epoch": 4624} {"train_loss": -7.143998622894287, "global_step": 194225, "epoch": 4624} {"train_loss": -7.298956871032715, "global_step": 194226, "epoch": 4624} {"train_loss": -7.028250694274902, "global_step": 194227, "epoch": 4624} {"train_loss": -7.091504096984863, "global_step": 194228, "epoch": 4624} {"train_loss": -7.260026931762695, "global_step": 194229, "epoch": 4624} {"train_loss": -7.179976463317871, "global_step": 194230, "epoch": 4624} {"train_loss": -7.002286911010742, "global_step": 194231, "epoch": 4624} {"train_loss": -7.2708868980407715, "global_step": 194232, "epoch": 4624} {"train_loss": -6.9656476974487305, "global_step": 194233, "epoch": 4624} {"train_loss": -7.205987930297852, "global_step": 194234, "epoch": 4624} {"train_loss": -7.22667121887207, "global_step": 194235, "epoch": 4624} {"train_loss": -7.018425941467285, "global_step": 194236, "epoch": 4624} {"train_loss": -7.280660629272461, "global_step": 194237, "epoch": 4624} {"train_loss": -7.070940017700195, "global_step": 194238, "epoch": 4624} {"train_loss": -7.1858625411987305, "global_step": 194239, "epoch": 4624} {"train_loss": -7.190600395202637, "global_step": 194240, "epoch": 4624} {"train_loss": -7.153425216674805, "global_step": 194241, "epoch": 4624} {"train_loss": -7.136112213134766, "global_step": 194242, "epoch": 4624} {"train_loss": -7.13449764251709, "global_step": 194243, "epoch": 4624} {"train_loss": -7.2054829597473145, "global_step": 194244, "epoch": 4624} {"train_loss": -7.119350433349609, "global_step": 194245, "epoch": 4624} {"train_loss": -7.350956439971924, "global_step": 194246, "epoch": 4624} {"train_loss": -7.14284086227417, "global_step": 194247, "epoch": 4624} {"train_loss": -7.112190246582031, "global_step": 194248, "epoch": 4624} {"train_loss": -7.19833771387736, "global_step": 194249, "epoch": 4624, "val_loss": 69586.1484375} {"train_loss": -7.1710052490234375, "global_step": 194250, "epoch": 4625} {"train_loss": -7.1119303703308105, "global_step": 194251, "epoch": 4625} {"train_loss": -7.2049455642700195, "global_step": 194252, "epoch": 4625} {"train_loss": -7.260241508483887, "global_step": 194253, "epoch": 4625} {"train_loss": -7.204501152038574, "global_step": 194254, "epoch": 4625} {"train_loss": -7.183497905731201, "global_step": 194255, "epoch": 4625} {"train_loss": -7.145810604095459, "global_step": 194256, "epoch": 4625} {"train_loss": -7.131486892700195, "global_step": 194257, "epoch": 4625} {"train_loss": -7.2059526443481445, "global_step": 194258, "epoch": 4625} {"train_loss": -7.160339832305908, "global_step": 194259, "epoch": 4625} {"train_loss": -7.093031883239746, "global_step": 194260, "epoch": 4625} {"train_loss": -7.128821849822998, "global_step": 194261, "epoch": 4625} {"train_loss": -7.116915702819824, "global_step": 194262, "epoch": 4625} {"train_loss": -7.039525032043457, "global_step": 194263, "epoch": 4625} {"train_loss": -6.928097724914551, "global_step": 194264, "epoch": 4625} {"train_loss": -7.086669921875, "global_step": 194265, "epoch": 4625} {"train_loss": -7.13538932800293, "global_step": 194266, "epoch": 4625} {"train_loss": -6.992396354675293, "global_step": 194267, "epoch": 4625} {"train_loss": -7.179330348968506, "global_step": 194268, "epoch": 4625} {"train_loss": -6.969091415405273, "global_step": 194269, "epoch": 4625} {"train_loss": -7.172358512878418, "global_step": 194270, "epoch": 4625} {"train_loss": -7.0305399894714355, "global_step": 194271, "epoch": 4625} {"train_loss": -7.170804023742676, "global_step": 194272, "epoch": 4625} {"train_loss": -7.03782844543457, "global_step": 194273, "epoch": 4625} {"train_loss": -7.232452392578125, "global_step": 194274, "epoch": 4625} {"train_loss": -7.018741130828857, "global_step": 194275, "epoch": 4625} {"train_loss": -7.2112884521484375, "global_step": 194276, "epoch": 4625} {"train_loss": -7.117098808288574, "global_step": 194277, "epoch": 4625} {"train_loss": -7.160300254821777, "global_step": 194278, "epoch": 4625} {"train_loss": -7.080592155456543, "global_step": 194279, "epoch": 4625} {"train_loss": -7.10138463973999, "global_step": 194280, "epoch": 4625} {"train_loss": -7.101437568664551, "global_step": 194281, "epoch": 4625} {"train_loss": -7.107455253601074, "global_step": 194282, "epoch": 4625} {"train_loss": -7.061901092529297, "global_step": 194283, "epoch": 4625} {"train_loss": -7.207919120788574, "global_step": 194284, "epoch": 4625} {"train_loss": -7.197434902191162, "global_step": 194285, "epoch": 4625} {"train_loss": -7.206027984619141, "global_step": 194286, "epoch": 4625} {"train_loss": -7.187262058258057, "global_step": 194287, "epoch": 4625} {"train_loss": -7.311398506164551, "global_step": 194288, "epoch": 4625} {"train_loss": -7.140289306640625, "global_step": 194289, "epoch": 4625} {"train_loss": -7.288939952850342, "global_step": 194290, "epoch": 4625} {"train_loss": -7.140620015916371, "global_step": 194291, "epoch": 4625, "val_loss": 69719.890625} {"train_loss": -7.282289505004883, "global_step": 194292, "epoch": 4626} {"train_loss": -7.214731216430664, "global_step": 194293, "epoch": 4626} {"train_loss": -7.2203826904296875, "global_step": 194294, "epoch": 4626} {"train_loss": -7.213822841644287, "global_step": 194295, "epoch": 4626} {"train_loss": -7.287779808044434, "global_step": 194296, "epoch": 4626} {"train_loss": -7.230358600616455, "global_step": 194297, "epoch": 4626} {"train_loss": -7.362308502197266, "global_step": 194298, "epoch": 4626} {"train_loss": -7.247964382171631, "global_step": 194299, "epoch": 4626} {"train_loss": -7.312788009643555, "global_step": 194300, "epoch": 4626} {"train_loss": -7.171588897705078, "global_step": 194301, "epoch": 4626} {"train_loss": -7.223012924194336, "global_step": 194302, "epoch": 4626} {"train_loss": -7.3022990226745605, "global_step": 194303, "epoch": 4626} {"train_loss": -7.2478790283203125, "global_step": 194304, "epoch": 4626} {"train_loss": -7.202686309814453, "global_step": 194305, "epoch": 4626} {"train_loss": -7.296357154846191, "global_step": 194306, "epoch": 4626} {"train_loss": -7.212450981140137, "global_step": 194307, "epoch": 4626} {"train_loss": -7.252826690673828, "global_step": 194308, "epoch": 4626} {"train_loss": -7.1644606590271, "global_step": 194309, "epoch": 4626} {"train_loss": -7.208263397216797, "global_step": 194310, "epoch": 4626} {"train_loss": -7.258316993713379, "global_step": 194311, "epoch": 4626} {"train_loss": -7.234804630279541, "global_step": 194312, "epoch": 4626} {"train_loss": -7.256608009338379, "global_step": 194313, "epoch": 4626} {"train_loss": -7.286369323730469, "global_step": 194314, "epoch": 4626} {"train_loss": -7.280661106109619, "global_step": 194315, "epoch": 4626} {"train_loss": -7.2688703536987305, "global_step": 194316, "epoch": 4626} {"train_loss": -7.207956314086914, "global_step": 194317, "epoch": 4626} {"train_loss": -7.309139728546143, "global_step": 194318, "epoch": 4626} {"train_loss": -7.211423397064209, "global_step": 194319, "epoch": 4626} {"train_loss": -7.239881992340088, "global_step": 194320, "epoch": 4626} {"train_loss": -7.212626934051514, "global_step": 194321, "epoch": 4626} {"train_loss": -7.282121658325195, "global_step": 194322, "epoch": 4626} {"train_loss": -7.237177848815918, "global_step": 194323, "epoch": 4626} {"train_loss": -7.301187515258789, "global_step": 194324, "epoch": 4626} {"train_loss": -7.1783061027526855, "global_step": 194325, "epoch": 4626} {"train_loss": -7.314938068389893, "global_step": 194326, "epoch": 4626} {"train_loss": -7.322467803955078, "global_step": 194327, "epoch": 4626} {"train_loss": -7.15378475189209, "global_step": 194328, "epoch": 4626} {"train_loss": -7.260262489318848, "global_step": 194329, "epoch": 4626} {"train_loss": -7.290294647216797, "global_step": 194330, "epoch": 4626} {"train_loss": -7.309726238250732, "global_step": 194331, "epoch": 4626} {"train_loss": -7.218382835388184, "global_step": 194332, "epoch": 4626} {"train_loss": -7.248337995438349, "global_step": 194333, "epoch": 4626, "val_loss": 69795.296875} {"train_loss": -7.19490909576416, "global_step": 194334, "epoch": 4627} {"train_loss": -7.195407867431641, "global_step": 194335, "epoch": 4627} {"train_loss": -7.268304824829102, "global_step": 194336, "epoch": 4627} {"train_loss": -7.059235572814941, "global_step": 194337, "epoch": 4627} {"train_loss": -7.184848785400391, "global_step": 194338, "epoch": 4627} {"train_loss": -7.1907453536987305, "global_step": 194339, "epoch": 4627} {"train_loss": -7.231093406677246, "global_step": 194340, "epoch": 4627} {"train_loss": -7.272305965423584, "global_step": 194341, "epoch": 4627} {"train_loss": -7.2524614334106445, "global_step": 194342, "epoch": 4627} {"train_loss": -7.180111408233643, "global_step": 194343, "epoch": 4627} {"train_loss": -7.260189533233643, "global_step": 194344, "epoch": 4627} {"train_loss": -7.112646102905273, "global_step": 194345, "epoch": 4627} {"train_loss": -7.105842590332031, "global_step": 194346, "epoch": 4627} {"train_loss": -7.283090591430664, "global_step": 194347, "epoch": 4627} {"train_loss": -7.115013122558594, "global_step": 194348, "epoch": 4627} {"train_loss": -7.166895866394043, "global_step": 194349, "epoch": 4627} {"train_loss": -7.298584938049316, "global_step": 194350, "epoch": 4627} {"train_loss": -7.23743200302124, "global_step": 194351, "epoch": 4627} {"train_loss": -7.240015029907227, "global_step": 194352, "epoch": 4627} {"train_loss": -7.212655544281006, "global_step": 194353, "epoch": 4627} {"train_loss": -7.223725318908691, "global_step": 194354, "epoch": 4627} {"train_loss": -7.2253618240356445, "global_step": 194355, "epoch": 4627} {"train_loss": -7.218692302703857, "global_step": 194356, "epoch": 4627} {"train_loss": -7.191416263580322, "global_step": 194357, "epoch": 4627} {"train_loss": -7.198605060577393, "global_step": 194358, "epoch": 4627} {"train_loss": -7.143341064453125, "global_step": 194359, "epoch": 4627} {"train_loss": -7.2641072273254395, "global_step": 194360, "epoch": 4627} {"train_loss": -7.1304931640625, "global_step": 194361, "epoch": 4627} {"train_loss": -7.20766019821167, "global_step": 194362, "epoch": 4627} {"train_loss": -7.140108108520508, "global_step": 194363, "epoch": 4627} {"train_loss": -7.208712577819824, "global_step": 194364, "epoch": 4627} {"train_loss": -7.2349724769592285, "global_step": 194365, "epoch": 4627} {"train_loss": -7.013057708740234, "global_step": 194366, "epoch": 4627} {"train_loss": -7.334238052368164, "global_step": 194367, "epoch": 4627} {"train_loss": -7.317340850830078, "global_step": 194368, "epoch": 4627} {"train_loss": -7.184116363525391, "global_step": 194369, "epoch": 4627} {"train_loss": -7.28385591506958, "global_step": 194370, "epoch": 4627} {"train_loss": -7.192491054534912, "global_step": 194371, "epoch": 4627} {"train_loss": -7.148845672607422, "global_step": 194372, "epoch": 4627} {"train_loss": -7.26409912109375, "global_step": 194373, "epoch": 4627} {"train_loss": -7.27138614654541, "global_step": 194374, "epoch": 4627} {"train_loss": -7.2052725950876875, "global_step": 194375, "epoch": 4627, "val_loss": 69659.84375} {"train_loss": -7.330667495727539, "global_step": 194376, "epoch": 4628} {"train_loss": -7.249510288238525, "global_step": 194377, "epoch": 4628} {"train_loss": -7.2456560134887695, "global_step": 194378, "epoch": 4628} {"train_loss": -7.182312965393066, "global_step": 194379, "epoch": 4628} {"train_loss": -7.109025001525879, "global_step": 194380, "epoch": 4628} {"train_loss": -6.91563081741333, "global_step": 194381, "epoch": 4628} {"train_loss": -7.312603950500488, "global_step": 194382, "epoch": 4628} {"train_loss": -7.069666862487793, "global_step": 194383, "epoch": 4628} {"train_loss": -7.2701005935668945, "global_step": 194384, "epoch": 4628} {"train_loss": -7.122480392456055, "global_step": 194385, "epoch": 4628} {"train_loss": -7.110676288604736, "global_step": 194386, "epoch": 4628} {"train_loss": -7.154256820678711, "global_step": 194387, "epoch": 4628} {"train_loss": -7.250161170959473, "global_step": 194388, "epoch": 4628} {"train_loss": -7.129990577697754, "global_step": 194389, "epoch": 4628} {"train_loss": -7.193657875061035, "global_step": 194390, "epoch": 4628} {"train_loss": -7.222612380981445, "global_step": 194391, "epoch": 4628} {"train_loss": -7.307734489440918, "global_step": 194392, "epoch": 4628} {"train_loss": -7.111509323120117, "global_step": 194393, "epoch": 4628} {"train_loss": -7.213025093078613, "global_step": 194394, "epoch": 4628} {"train_loss": -7.1897406578063965, "global_step": 194395, "epoch": 4628} {"train_loss": -7.153247833251953, "global_step": 194396, "epoch": 4628} {"train_loss": -7.107796669006348, "global_step": 194397, "epoch": 4628} {"train_loss": -7.1176347732543945, "global_step": 194398, "epoch": 4628} {"train_loss": -7.173184394836426, "global_step": 194399, "epoch": 4628} {"train_loss": -7.137476921081543, "global_step": 194400, "epoch": 4628} {"train_loss": -7.194796085357666, "global_step": 194401, "epoch": 4628} {"train_loss": -7.208307266235352, "global_step": 194402, "epoch": 4628} {"train_loss": -7.206924915313721, "global_step": 194403, "epoch": 4628} {"train_loss": -7.226233005523682, "global_step": 194404, "epoch": 4628} {"train_loss": -7.202467441558838, "global_step": 194405, "epoch": 4628} {"train_loss": -7.1514177322387695, "global_step": 194406, "epoch": 4628} {"train_loss": -7.222500801086426, "global_step": 194407, "epoch": 4628} {"train_loss": -7.075615406036377, "global_step": 194408, "epoch": 4628} {"train_loss": -7.370417594909668, "global_step": 194409, "epoch": 4628} {"train_loss": -7.292367935180664, "global_step": 194410, "epoch": 4628} {"train_loss": -7.319262504577637, "global_step": 194411, "epoch": 4628} {"train_loss": -7.343484401702881, "global_step": 194412, "epoch": 4628} {"train_loss": -7.270110130310059, "global_step": 194413, "epoch": 4628} {"train_loss": -7.2608795166015625, "global_step": 194414, "epoch": 4628} {"train_loss": -7.136189937591553, "global_step": 194415, "epoch": 4628} {"train_loss": -7.249753952026367, "global_step": 194416, "epoch": 4628} {"train_loss": -7.198954105377197, "global_step": 194417, "epoch": 4628, "val_loss": 69756.546875} {"train_loss": -7.286794662475586, "global_step": 194418, "epoch": 4629} {"train_loss": -7.29395055770874, "global_step": 194419, "epoch": 4629} {"train_loss": -7.311053276062012, "global_step": 194420, "epoch": 4629} {"train_loss": -7.243144989013672, "global_step": 194421, "epoch": 4629} {"train_loss": -7.308319568634033, "global_step": 194422, "epoch": 4629} {"train_loss": -7.254306793212891, "global_step": 194423, "epoch": 4629} {"train_loss": -7.342526435852051, "global_step": 194424, "epoch": 4629} {"train_loss": -7.250510215759277, "global_step": 194425, "epoch": 4629} {"train_loss": -7.247433185577393, "global_step": 194426, "epoch": 4629} {"train_loss": -7.1520490646362305, "global_step": 194427, "epoch": 4629} {"train_loss": -7.293437957763672, "global_step": 194428, "epoch": 4629} {"train_loss": -7.359521865844727, "global_step": 194429, "epoch": 4629} {"train_loss": -7.253655433654785, "global_step": 194430, "epoch": 4629} {"train_loss": -7.370861530303955, "global_step": 194431, "epoch": 4629} {"train_loss": -7.196018218994141, "global_step": 194432, "epoch": 4629} {"train_loss": -7.171934127807617, "global_step": 194433, "epoch": 4629} {"train_loss": -7.30500602722168, "global_step": 194434, "epoch": 4629} {"train_loss": -7.174073696136475, "global_step": 194435, "epoch": 4629} {"train_loss": -7.21027946472168, "global_step": 194436, "epoch": 4629} {"train_loss": -7.205362319946289, "global_step": 194437, "epoch": 4629} {"train_loss": -7.232847690582275, "global_step": 194438, "epoch": 4629} {"train_loss": -7.080128192901611, "global_step": 194439, "epoch": 4629} {"train_loss": -7.163193702697754, "global_step": 194440, "epoch": 4629} {"train_loss": -7.278704643249512, "global_step": 194441, "epoch": 4629} {"train_loss": -7.190679550170898, "global_step": 194442, "epoch": 4629} {"train_loss": -7.249884128570557, "global_step": 194443, "epoch": 4629} {"train_loss": -7.258722305297852, "global_step": 194444, "epoch": 4629} {"train_loss": -7.257693290710449, "global_step": 194445, "epoch": 4629} {"train_loss": -7.268926620483398, "global_step": 194446, "epoch": 4629} {"train_loss": -7.319795608520508, "global_step": 194447, "epoch": 4629} {"train_loss": -7.236789703369141, "global_step": 194448, "epoch": 4629} {"train_loss": -7.102612495422363, "global_step": 194449, "epoch": 4629} {"train_loss": -7.325725078582764, "global_step": 194450, "epoch": 4629} {"train_loss": -7.1730499267578125, "global_step": 194451, "epoch": 4629} {"train_loss": -7.263356685638428, "global_step": 194452, "epoch": 4629} {"train_loss": -7.097405433654785, "global_step": 194453, "epoch": 4629} {"train_loss": -7.208152770996094, "global_step": 194454, "epoch": 4629} {"train_loss": -7.167474746704102, "global_step": 194455, "epoch": 4629} {"train_loss": -7.077915668487549, "global_step": 194456, "epoch": 4629} {"train_loss": -7.2947845458984375, "global_step": 194457, "epoch": 4629} {"train_loss": -7.241025924682617, "global_step": 194458, "epoch": 4629} {"train_loss": -7.236295688719976, "global_step": 194459, "epoch": 4629, "val_loss": 69765.8125} {"train_loss": -7.206567764282227, "global_step": 194460, "epoch": 4630} {"train_loss": -7.147246360778809, "global_step": 194461, "epoch": 4630} {"train_loss": -7.16828727722168, "global_step": 194462, "epoch": 4630} {"train_loss": -7.151300430297852, "global_step": 194463, "epoch": 4630} {"train_loss": -7.014502048492432, "global_step": 194464, "epoch": 4630} {"train_loss": -7.256902694702148, "global_step": 194465, "epoch": 4630} {"train_loss": -7.006356239318848, "global_step": 194466, "epoch": 4630} {"train_loss": -7.206228256225586, "global_step": 194467, "epoch": 4630} {"train_loss": -7.2373366355896, "global_step": 194468, "epoch": 4630} {"train_loss": -7.188592910766602, "global_step": 194469, "epoch": 4630} {"train_loss": -7.1926703453063965, "global_step": 194470, "epoch": 4630} {"train_loss": -7.121358394622803, "global_step": 194471, "epoch": 4630} {"train_loss": -7.0937604904174805, "global_step": 194472, "epoch": 4630} {"train_loss": -7.204246997833252, "global_step": 194473, "epoch": 4630} {"train_loss": -7.034714698791504, "global_step": 194474, "epoch": 4630} {"train_loss": -7.193665027618408, "global_step": 194475, "epoch": 4630} {"train_loss": -7.193881988525391, "global_step": 194476, "epoch": 4630} {"train_loss": -7.054505348205566, "global_step": 194477, "epoch": 4630} {"train_loss": -7.184510231018066, "global_step": 194478, "epoch": 4630} {"train_loss": -7.137704849243164, "global_step": 194479, "epoch": 4630} {"train_loss": -7.163328647613525, "global_step": 194480, "epoch": 4630} {"train_loss": -7.166799068450928, "global_step": 194481, "epoch": 4630} {"train_loss": -7.163549423217773, "global_step": 194482, "epoch": 4630} {"train_loss": -7.119402885437012, "global_step": 194483, "epoch": 4630} {"train_loss": -7.246478080749512, "global_step": 194484, "epoch": 4630} {"train_loss": -7.142653465270996, "global_step": 194485, "epoch": 4630} {"train_loss": -7.246818542480469, "global_step": 194486, "epoch": 4630} {"train_loss": -7.1660261154174805, "global_step": 194487, "epoch": 4630} {"train_loss": -7.188597679138184, "global_step": 194488, "epoch": 4630} {"train_loss": -7.301580429077148, "global_step": 194489, "epoch": 4630} {"train_loss": -7.305194854736328, "global_step": 194490, "epoch": 4630} {"train_loss": -7.275535583496094, "global_step": 194491, "epoch": 4630} {"train_loss": -7.2865800857543945, "global_step": 194492, "epoch": 4630} {"train_loss": -7.231685638427734, "global_step": 194493, "epoch": 4630} {"train_loss": -7.206803321838379, "global_step": 194494, "epoch": 4630} {"train_loss": -7.2283477783203125, "global_step": 194495, "epoch": 4630} {"train_loss": -7.087363243103027, "global_step": 194496, "epoch": 4630} {"train_loss": -7.275694370269775, "global_step": 194497, "epoch": 4630} {"train_loss": -7.196414947509766, "global_step": 194498, "epoch": 4630} {"train_loss": -7.323851585388184, "global_step": 194499, "epoch": 4630} {"train_loss": -7.255979061126709, "global_step": 194500, "epoch": 4630} {"train_loss": -7.187412557147798, "global_step": 194501, "epoch": 4630, "val_loss": 69871.8359375} {"train_loss": -7.323699951171875, "global_step": 194502, "epoch": 4631} {"train_loss": -7.278832912445068, "global_step": 194503, "epoch": 4631} {"train_loss": -7.192161560058594, "global_step": 194504, "epoch": 4631} {"train_loss": -7.243005275726318, "global_step": 194505, "epoch": 4631} {"train_loss": -7.252767562866211, "global_step": 194506, "epoch": 4631} {"train_loss": -7.225285053253174, "global_step": 194507, "epoch": 4631} {"train_loss": -7.2552571296691895, "global_step": 194508, "epoch": 4631} {"train_loss": -7.26649284362793, "global_step": 194509, "epoch": 4631} {"train_loss": -7.2235260009765625, "global_step": 194510, "epoch": 4631} {"train_loss": -7.268696308135986, "global_step": 194511, "epoch": 4631} {"train_loss": -7.255976676940918, "global_step": 194512, "epoch": 4631} {"train_loss": -7.195148944854736, "global_step": 194513, "epoch": 4631} {"train_loss": -7.37241792678833, "global_step": 194514, "epoch": 4631} {"train_loss": -7.179603099822998, "global_step": 194515, "epoch": 4631} {"train_loss": -7.286686897277832, "global_step": 194516, "epoch": 4631} {"train_loss": -7.248011589050293, "global_step": 194517, "epoch": 4631} {"train_loss": -7.296351432800293, "global_step": 194518, "epoch": 4631} {"train_loss": -7.3355865478515625, "global_step": 194519, "epoch": 4631} {"train_loss": -7.278069019317627, "global_step": 194520, "epoch": 4631} {"train_loss": -7.392043113708496, "global_step": 194521, "epoch": 4631} {"train_loss": -7.248980522155762, "global_step": 194522, "epoch": 4631} {"train_loss": -7.272919654846191, "global_step": 194523, "epoch": 4631} {"train_loss": -7.246646881103516, "global_step": 194524, "epoch": 4631} {"train_loss": -7.304784774780273, "global_step": 194525, "epoch": 4631} {"train_loss": -7.220129489898682, "global_step": 194526, "epoch": 4631} {"train_loss": -7.149585723876953, "global_step": 194527, "epoch": 4631} {"train_loss": -7.2759599685668945, "global_step": 194528, "epoch": 4631} {"train_loss": -7.245328426361084, "global_step": 194529, "epoch": 4631} {"train_loss": -7.158196926116943, "global_step": 194530, "epoch": 4631} {"train_loss": -7.20048713684082, "global_step": 194531, "epoch": 4631} {"train_loss": -7.23631477355957, "global_step": 194532, "epoch": 4631} {"train_loss": -7.304203987121582, "global_step": 194533, "epoch": 4631} {"train_loss": -7.1863017082214355, "global_step": 194534, "epoch": 4631} {"train_loss": -7.192766189575195, "global_step": 194535, "epoch": 4631} {"train_loss": -7.145135402679443, "global_step": 194536, "epoch": 4631} {"train_loss": -7.2173590660095215, "global_step": 194537, "epoch": 4631} {"train_loss": -7.181899070739746, "global_step": 194538, "epoch": 4631} {"train_loss": -7.105410575866699, "global_step": 194539, "epoch": 4631} {"train_loss": -7.1589155197143555, "global_step": 194540, "epoch": 4631} {"train_loss": -7.1889190673828125, "global_step": 194541, "epoch": 4631} {"train_loss": -7.226602554321289, "global_step": 194542, "epoch": 4631} {"train_loss": -7.239318927129109, "global_step": 194543, "epoch": 4631, "val_loss": 69777.8359375} {"train_loss": -7.250505447387695, "global_step": 194544, "epoch": 4632} {"train_loss": -7.131801605224609, "global_step": 194545, "epoch": 4632} {"train_loss": -7.251654624938965, "global_step": 194546, "epoch": 4632} {"train_loss": -7.174254894256592, "global_step": 194547, "epoch": 4632} {"train_loss": -7.2484130859375, "global_step": 194548, "epoch": 4632} {"train_loss": -7.23506498336792, "global_step": 194549, "epoch": 4632} {"train_loss": -7.178554534912109, "global_step": 194550, "epoch": 4632} {"train_loss": -7.173553466796875, "global_step": 194551, "epoch": 4632} {"train_loss": -7.152866840362549, "global_step": 194552, "epoch": 4632} {"train_loss": -7.1144256591796875, "global_step": 194553, "epoch": 4632} {"train_loss": -7.222197532653809, "global_step": 194554, "epoch": 4632} {"train_loss": -7.20512580871582, "global_step": 194555, "epoch": 4632} {"train_loss": -7.202737808227539, "global_step": 194556, "epoch": 4632} {"train_loss": -7.2523064613342285, "global_step": 194557, "epoch": 4632} {"train_loss": -6.7612762451171875, "global_step": 194558, "epoch": 4632} {"train_loss": -7.121718406677246, "global_step": 194559, "epoch": 4632} {"train_loss": -7.0012736320495605, "global_step": 194560, "epoch": 4632} {"train_loss": -7.254146099090576, "global_step": 194561, "epoch": 4632} {"train_loss": -7.064960479736328, "global_step": 194562, "epoch": 4632} {"train_loss": -7.10463809967041, "global_step": 194563, "epoch": 4632} {"train_loss": -7.036660194396973, "global_step": 194564, "epoch": 4632} {"train_loss": -7.118978023529053, "global_step": 194565, "epoch": 4632} {"train_loss": -7.127492904663086, "global_step": 194566, "epoch": 4632} {"train_loss": -6.937526702880859, "global_step": 194567, "epoch": 4632} {"train_loss": -7.1293816566467285, "global_step": 194568, "epoch": 4632} {"train_loss": -6.941566467285156, "global_step": 194569, "epoch": 4632} {"train_loss": -7.115023136138916, "global_step": 194570, "epoch": 4632} {"train_loss": -7.20046854019165, "global_step": 194571, "epoch": 4632} {"train_loss": -7.025403022766113, "global_step": 194572, "epoch": 4632} {"train_loss": -6.923842430114746, "global_step": 194573, "epoch": 4632} {"train_loss": -7.075510501861572, "global_step": 194574, "epoch": 4632} {"train_loss": -7.093880653381348, "global_step": 194575, "epoch": 4632} {"train_loss": -7.118094444274902, "global_step": 194576, "epoch": 4632} {"train_loss": -7.164224147796631, "global_step": 194577, "epoch": 4632} {"train_loss": -7.122808456420898, "global_step": 194578, "epoch": 4632} {"train_loss": -7.214159965515137, "global_step": 194579, "epoch": 4632} {"train_loss": -7.137749671936035, "global_step": 194580, "epoch": 4632} {"train_loss": -7.080103397369385, "global_step": 194581, "epoch": 4632} {"train_loss": -7.208743095397949, "global_step": 194582, "epoch": 4632} {"train_loss": -7.191058158874512, "global_step": 194583, "epoch": 4632} {"train_loss": -7.201047420501709, "global_step": 194584, "epoch": 4632} {"train_loss": -7.131748926071894, "global_step": 194585, "epoch": 4632, "val_loss": 69626.7578125} {"train_loss": -7.136509895324707, "global_step": 194586, "epoch": 4633} {"train_loss": -7.247036933898926, "global_step": 194587, "epoch": 4633} {"train_loss": -7.310007095336914, "global_step": 194588, "epoch": 4633} {"train_loss": -7.211519241333008, "global_step": 194589, "epoch": 4633} {"train_loss": -7.255374908447266, "global_step": 194590, "epoch": 4633} {"train_loss": -7.204778671264648, "global_step": 194591, "epoch": 4633} {"train_loss": -7.212501525878906, "global_step": 194592, "epoch": 4633} {"train_loss": -7.246352195739746, "global_step": 194593, "epoch": 4633} {"train_loss": -7.203900337219238, "global_step": 194594, "epoch": 4633} {"train_loss": -7.299903869628906, "global_step": 194595, "epoch": 4633} {"train_loss": -7.070043563842773, "global_step": 194596, "epoch": 4633} {"train_loss": -7.139723777770996, "global_step": 194597, "epoch": 4633} {"train_loss": -7.148185729980469, "global_step": 194598, "epoch": 4633} {"train_loss": -7.057814598083496, "global_step": 194599, "epoch": 4633} {"train_loss": -7.102048397064209, "global_step": 194600, "epoch": 4633} {"train_loss": -7.095550060272217, "global_step": 194601, "epoch": 4633} {"train_loss": -7.10967493057251, "global_step": 194602, "epoch": 4633} {"train_loss": -7.208885192871094, "global_step": 194603, "epoch": 4633} {"train_loss": -7.12747049331665, "global_step": 194604, "epoch": 4633} {"train_loss": -7.081485271453857, "global_step": 194605, "epoch": 4633} {"train_loss": -7.09295129776001, "global_step": 194606, "epoch": 4633} {"train_loss": -7.109626770019531, "global_step": 194607, "epoch": 4633} {"train_loss": -7.2250752449035645, "global_step": 194608, "epoch": 4633} {"train_loss": -7.113219261169434, "global_step": 194609, "epoch": 4633} {"train_loss": -7.16539192199707, "global_step": 194610, "epoch": 4633} {"train_loss": -7.320045471191406, "global_step": 194611, "epoch": 4633} {"train_loss": -7.131033897399902, "global_step": 194612, "epoch": 4633} {"train_loss": -7.200935363769531, "global_step": 194613, "epoch": 4633} {"train_loss": -7.217591762542725, "global_step": 194614, "epoch": 4633} {"train_loss": -7.136503219604492, "global_step": 194615, "epoch": 4633} {"train_loss": -7.250221252441406, "global_step": 194616, "epoch": 4633} {"train_loss": -7.181151390075684, "global_step": 194617, "epoch": 4633} {"train_loss": -7.247097969055176, "global_step": 194618, "epoch": 4633} {"train_loss": -7.232605934143066, "global_step": 194619, "epoch": 4633} {"train_loss": -7.228699684143066, "global_step": 194620, "epoch": 4633} {"train_loss": -7.347424507141113, "global_step": 194621, "epoch": 4633} {"train_loss": -7.2392683029174805, "global_step": 194622, "epoch": 4633} {"train_loss": -7.375215530395508, "global_step": 194623, "epoch": 4633} {"train_loss": -7.160373687744141, "global_step": 194624, "epoch": 4633} {"train_loss": -7.25355863571167, "global_step": 194625, "epoch": 4633} {"train_loss": -7.3521599769592285, "global_step": 194626, "epoch": 4633} {"train_loss": -7.1950220834641225, "global_step": 194627, "epoch": 4633, "val_loss": 69531.640625} {"train_loss": -7.140910625457764, "global_step": 194628, "epoch": 4634} {"train_loss": -7.3633880615234375, "global_step": 194629, "epoch": 4634} {"train_loss": -7.239603519439697, "global_step": 194630, "epoch": 4634} {"train_loss": -7.199445724487305, "global_step": 194631, "epoch": 4634} {"train_loss": -7.384466171264648, "global_step": 194632, "epoch": 4634} {"train_loss": -7.181456089019775, "global_step": 194633, "epoch": 4634} {"train_loss": -7.228433132171631, "global_step": 194634, "epoch": 4634} {"train_loss": -7.2370076179504395, "global_step": 194635, "epoch": 4634} {"train_loss": -7.205132961273193, "global_step": 194636, "epoch": 4634} {"train_loss": -7.3224568367004395, "global_step": 194637, "epoch": 4634} {"train_loss": -7.19638729095459, "global_step": 194638, "epoch": 4634} {"train_loss": -7.159365653991699, "global_step": 194639, "epoch": 4634} {"train_loss": -7.393866539001465, "global_step": 194640, "epoch": 4634} {"train_loss": -7.287224769592285, "global_step": 194641, "epoch": 4634} {"train_loss": -7.097444534301758, "global_step": 194642, "epoch": 4634} {"train_loss": -7.228573799133301, "global_step": 194643, "epoch": 4634} {"train_loss": -7.196664810180664, "global_step": 194644, "epoch": 4634} {"train_loss": -7.210925102233887, "global_step": 194645, "epoch": 4634} {"train_loss": -7.196784973144531, "global_step": 194646, "epoch": 4634} {"train_loss": -7.408990859985352, "global_step": 194647, "epoch": 4634} {"train_loss": -7.089020729064941, "global_step": 194648, "epoch": 4634} {"train_loss": -7.146681785583496, "global_step": 194649, "epoch": 4634} {"train_loss": -7.356994152069092, "global_step": 194650, "epoch": 4634} {"train_loss": -7.051497459411621, "global_step": 194651, "epoch": 4634} {"train_loss": -7.1567063331604, "global_step": 194652, "epoch": 4634} {"train_loss": -7.1239013671875, "global_step": 194653, "epoch": 4634} {"train_loss": -7.259239196777344, "global_step": 194654, "epoch": 4634} {"train_loss": -7.155254364013672, "global_step": 194655, "epoch": 4634} {"train_loss": -7.208925247192383, "global_step": 194656, "epoch": 4634} {"train_loss": -7.160966873168945, "global_step": 194657, "epoch": 4634} {"train_loss": -7.050980567932129, "global_step": 194658, "epoch": 4634} {"train_loss": -7.093013286590576, "global_step": 194659, "epoch": 4634} {"train_loss": -7.204949378967285, "global_step": 194660, "epoch": 4634} {"train_loss": -7.11042594909668, "global_step": 194661, "epoch": 4634} {"train_loss": -7.146764278411865, "global_step": 194662, "epoch": 4634} {"train_loss": -7.086036682128906, "global_step": 194663, "epoch": 4634} {"train_loss": -7.209583282470703, "global_step": 194664, "epoch": 4634} {"train_loss": -7.199016094207764, "global_step": 194665, "epoch": 4634} {"train_loss": -7.118935585021973, "global_step": 194666, "epoch": 4634} {"train_loss": -7.2133378982543945, "global_step": 194667, "epoch": 4634} {"train_loss": -7.155664443969727, "global_step": 194668, "epoch": 4634} {"train_loss": -7.199451855250767, "global_step": 194669, "epoch": 4634, "val_loss": 69728.71875} {"train_loss": -7.1837544441223145, "global_step": 194670, "epoch": 4635} {"train_loss": -7.281824111938477, "global_step": 194671, "epoch": 4635} {"train_loss": -7.18174409866333, "global_step": 194672, "epoch": 4635} {"train_loss": -7.372347831726074, "global_step": 194673, "epoch": 4635} {"train_loss": -7.24000358581543, "global_step": 194674, "epoch": 4635} {"train_loss": -7.220081329345703, "global_step": 194675, "epoch": 4635} {"train_loss": -7.24984073638916, "global_step": 194676, "epoch": 4635} {"train_loss": -7.270753860473633, "global_step": 194677, "epoch": 4635} {"train_loss": -7.154862403869629, "global_step": 194678, "epoch": 4635} {"train_loss": -7.167521953582764, "global_step": 194679, "epoch": 4635} {"train_loss": -7.234546184539795, "global_step": 194680, "epoch": 4635} {"train_loss": -7.172879695892334, "global_step": 194681, "epoch": 4635} {"train_loss": -7.208218574523926, "global_step": 194682, "epoch": 4635} {"train_loss": -7.181060791015625, "global_step": 194683, "epoch": 4635} {"train_loss": -7.138457775115967, "global_step": 194684, "epoch": 4635} {"train_loss": -7.039707183837891, "global_step": 194685, "epoch": 4635} {"train_loss": -7.2576141357421875, "global_step": 194686, "epoch": 4635} {"train_loss": -7.203918933868408, "global_step": 194687, "epoch": 4635} {"train_loss": -7.149133682250977, "global_step": 194688, "epoch": 4635} {"train_loss": -7.2865214347839355, "global_step": 194689, "epoch": 4635} {"train_loss": -7.300040245056152, "global_step": 194690, "epoch": 4635} {"train_loss": -7.226179599761963, "global_step": 194691, "epoch": 4635} {"train_loss": -7.2856340408325195, "global_step": 194692, "epoch": 4635} {"train_loss": -7.241322994232178, "global_step": 194693, "epoch": 4635} {"train_loss": -7.3247480392456055, "global_step": 194694, "epoch": 4635} {"train_loss": -7.274621963500977, "global_step": 194695, "epoch": 4635} {"train_loss": -7.151654243469238, "global_step": 194696, "epoch": 4635} {"train_loss": -7.096466064453125, "global_step": 194697, "epoch": 4635} {"train_loss": -7.174708366394043, "global_step": 194698, "epoch": 4635} {"train_loss": -7.20858097076416, "global_step": 194699, "epoch": 4635} {"train_loss": -7.263340473175049, "global_step": 194700, "epoch": 4635} {"train_loss": -7.1690778732299805, "global_step": 194701, "epoch": 4635} {"train_loss": -7.127928256988525, "global_step": 194702, "epoch": 4635} {"train_loss": -7.19148063659668, "global_step": 194703, "epoch": 4635} {"train_loss": -7.164390563964844, "global_step": 194704, "epoch": 4635} {"train_loss": -7.315019607543945, "global_step": 194705, "epoch": 4635} {"train_loss": -7.226128578186035, "global_step": 194706, "epoch": 4635} {"train_loss": -7.0640411376953125, "global_step": 194707, "epoch": 4635} {"train_loss": -7.165459632873535, "global_step": 194708, "epoch": 4635} {"train_loss": -7.247017860412598, "global_step": 194709, "epoch": 4635} {"train_loss": -7.18391752243042, "global_step": 194710, "epoch": 4635} {"train_loss": -7.210780847640264, "global_step": 194711, "epoch": 4635, "val_loss": 69702.03125} {"train_loss": -7.196288585662842, "global_step": 194712, "epoch": 4636} {"train_loss": -7.301626682281494, "global_step": 194713, "epoch": 4636} {"train_loss": -7.208051681518555, "global_step": 194714, "epoch": 4636} {"train_loss": -7.270416259765625, "global_step": 194715, "epoch": 4636} {"train_loss": -7.174812316894531, "global_step": 194716, "epoch": 4636} {"train_loss": -7.320724964141846, "global_step": 194717, "epoch": 4636} {"train_loss": -7.263214111328125, "global_step": 194718, "epoch": 4636} {"train_loss": -7.232946872711182, "global_step": 194719, "epoch": 4636} {"train_loss": -7.202965259552002, "global_step": 194720, "epoch": 4636} {"train_loss": -7.155218124389648, "global_step": 194721, "epoch": 4636} {"train_loss": -7.168280601501465, "global_step": 194722, "epoch": 4636} {"train_loss": -7.228069305419922, "global_step": 194723, "epoch": 4636} {"train_loss": -7.203290939331055, "global_step": 194724, "epoch": 4636} {"train_loss": -7.164096832275391, "global_step": 194725, "epoch": 4636} {"train_loss": -7.077356338500977, "global_step": 194726, "epoch": 4636} {"train_loss": -7.240205764770508, "global_step": 194727, "epoch": 4636} {"train_loss": -7.130183696746826, "global_step": 194728, "epoch": 4636} {"train_loss": -7.129417896270752, "global_step": 194729, "epoch": 4636} {"train_loss": -7.2588090896606445, "global_step": 194730, "epoch": 4636} {"train_loss": -7.295355796813965, "global_step": 194731, "epoch": 4636} {"train_loss": -7.121799945831299, "global_step": 194732, "epoch": 4636} {"train_loss": -7.256182670593262, "global_step": 194733, "epoch": 4636} {"train_loss": -7.33663272857666, "global_step": 194734, "epoch": 4636} {"train_loss": -7.214859962463379, "global_step": 194735, "epoch": 4636} {"train_loss": -7.244710922241211, "global_step": 194736, "epoch": 4636} {"train_loss": -7.264928340911865, "global_step": 194737, "epoch": 4636} {"train_loss": -7.289573669433594, "global_step": 194738, "epoch": 4636} {"train_loss": -7.272970199584961, "global_step": 194739, "epoch": 4636} {"train_loss": -7.273555278778076, "global_step": 194740, "epoch": 4636} {"train_loss": -7.345742702484131, "global_step": 194741, "epoch": 4636} {"train_loss": -7.235902786254883, "global_step": 194742, "epoch": 4636} {"train_loss": -7.31419563293457, "global_step": 194743, "epoch": 4636} {"train_loss": -7.251188278198242, "global_step": 194744, "epoch": 4636} {"train_loss": -7.321389198303223, "global_step": 194745, "epoch": 4636} {"train_loss": -7.394527435302734, "global_step": 194746, "epoch": 4636} {"train_loss": -7.262258529663086, "global_step": 194747, "epoch": 4636} {"train_loss": -7.2746734619140625, "global_step": 194748, "epoch": 4636} {"train_loss": -7.234554290771484, "global_step": 194749, "epoch": 4636} {"train_loss": -7.305331707000732, "global_step": 194750, "epoch": 4636} {"train_loss": -7.186440467834473, "global_step": 194751, "epoch": 4636} {"train_loss": -7.320611000061035, "global_step": 194752, "epoch": 4636} {"train_loss": -7.244370528629848, "global_step": 194753, "epoch": 4636, "val_loss": 69691.8671875} {"train_loss": -7.417242050170898, "global_step": 194754, "epoch": 4637} {"train_loss": -7.2425079345703125, "global_step": 194755, "epoch": 4637} {"train_loss": -7.293147087097168, "global_step": 194756, "epoch": 4637} {"train_loss": -7.321357250213623, "global_step": 194757, "epoch": 4637} {"train_loss": -7.292583465576172, "global_step": 194758, "epoch": 4637} {"train_loss": -7.222531318664551, "global_step": 194759, "epoch": 4637} {"train_loss": -7.245672225952148, "global_step": 194760, "epoch": 4637} {"train_loss": -7.234251976013184, "global_step": 194761, "epoch": 4637} {"train_loss": -7.285256862640381, "global_step": 194762, "epoch": 4637} {"train_loss": -7.3398756980896, "global_step": 194763, "epoch": 4637} {"train_loss": -7.346061706542969, "global_step": 194764, "epoch": 4637} {"train_loss": -7.307971954345703, "global_step": 194765, "epoch": 4637} {"train_loss": -7.375791549682617, "global_step": 194766, "epoch": 4637} {"train_loss": -7.272868633270264, "global_step": 194767, "epoch": 4637} {"train_loss": -7.322671890258789, "global_step": 194768, "epoch": 4637} {"train_loss": -7.3940887451171875, "global_step": 194769, "epoch": 4637} {"train_loss": -7.182692527770996, "global_step": 194770, "epoch": 4637} {"train_loss": -7.110509872436523, "global_step": 194771, "epoch": 4637} {"train_loss": -7.205484867095947, "global_step": 194772, "epoch": 4637} {"train_loss": -7.206404685974121, "global_step": 194773, "epoch": 4637} {"train_loss": -7.17708683013916, "global_step": 194774, "epoch": 4637} {"train_loss": -7.206488609313965, "global_step": 194775, "epoch": 4637} {"train_loss": -7.212928771972656, "global_step": 194776, "epoch": 4637} {"train_loss": -7.053803443908691, "global_step": 194777, "epoch": 4637} {"train_loss": -7.1233930587768555, "global_step": 194778, "epoch": 4637} {"train_loss": -7.292398929595947, "global_step": 194779, "epoch": 4637} {"train_loss": -7.333587646484375, "global_step": 194780, "epoch": 4637} {"train_loss": -7.235398292541504, "global_step": 194781, "epoch": 4637} {"train_loss": -7.18966007232666, "global_step": 194782, "epoch": 4637} {"train_loss": -7.087892532348633, "global_step": 194783, "epoch": 4637} {"train_loss": -7.240922927856445, "global_step": 194784, "epoch": 4637} {"train_loss": -7.179211616516113, "global_step": 194785, "epoch": 4637} {"train_loss": -7.187777519226074, "global_step": 194786, "epoch": 4637} {"train_loss": -7.248218536376953, "global_step": 194787, "epoch": 4637} {"train_loss": -7.162050247192383, "global_step": 194788, "epoch": 4637} {"train_loss": -7.217283248901367, "global_step": 194789, "epoch": 4637} {"train_loss": -7.129931449890137, "global_step": 194790, "epoch": 4637} {"train_loss": -7.206827640533447, "global_step": 194791, "epoch": 4637} {"train_loss": -7.167726516723633, "global_step": 194792, "epoch": 4637} {"train_loss": -7.329928398132324, "global_step": 194793, "epoch": 4637} {"train_loss": -7.206939697265625, "global_step": 194794, "epoch": 4637} {"train_loss": -7.240410225731986, "global_step": 194795, "epoch": 4637, "val_loss": 69587.2421875} {"train_loss": -7.260463237762451, "global_step": 194796, "epoch": 4638} {"train_loss": -7.262091636657715, "global_step": 194797, "epoch": 4638} {"train_loss": -7.2135725021362305, "global_step": 194798, "epoch": 4638} {"train_loss": -7.227688789367676, "global_step": 194799, "epoch": 4638} {"train_loss": -7.221357345581055, "global_step": 194800, "epoch": 4638} {"train_loss": -7.099987983703613, "global_step": 194801, "epoch": 4638} {"train_loss": -7.2422637939453125, "global_step": 194802, "epoch": 4638} {"train_loss": -7.1223978996276855, "global_step": 194803, "epoch": 4638} {"train_loss": -7.239963531494141, "global_step": 194804, "epoch": 4638} {"train_loss": -7.270337104797363, "global_step": 194805, "epoch": 4638} {"train_loss": -7.158537864685059, "global_step": 194806, "epoch": 4638} {"train_loss": -7.05247163772583, "global_step": 194807, "epoch": 4638} {"train_loss": -7.26592493057251, "global_step": 194808, "epoch": 4638} {"train_loss": -7.107329368591309, "global_step": 194809, "epoch": 4638} {"train_loss": -7.226042747497559, "global_step": 194810, "epoch": 4638} {"train_loss": -7.228693008422852, "global_step": 194811, "epoch": 4638} {"train_loss": -7.221052646636963, "global_step": 194812, "epoch": 4638} {"train_loss": -7.162925720214844, "global_step": 194813, "epoch": 4638} {"train_loss": -7.154388904571533, "global_step": 194814, "epoch": 4638} {"train_loss": -7.1511688232421875, "global_step": 194815, "epoch": 4638} {"train_loss": -7.213342666625977, "global_step": 194816, "epoch": 4638} {"train_loss": -7.226072311401367, "global_step": 194817, "epoch": 4638} {"train_loss": -7.000210762023926, "global_step": 194818, "epoch": 4638} {"train_loss": -7.018281936645508, "global_step": 194819, "epoch": 4638} {"train_loss": -7.281888484954834, "global_step": 194820, "epoch": 4638} {"train_loss": -7.279808044433594, "global_step": 194821, "epoch": 4638} {"train_loss": -7.102302551269531, "global_step": 194822, "epoch": 4638} {"train_loss": -7.161600589752197, "global_step": 194823, "epoch": 4638} {"train_loss": -7.134430885314941, "global_step": 194824, "epoch": 4638} {"train_loss": -7.184095859527588, "global_step": 194825, "epoch": 4638} {"train_loss": -7.051119804382324, "global_step": 194826, "epoch": 4638} {"train_loss": -7.129369735717773, "global_step": 194827, "epoch": 4638} {"train_loss": -7.183798789978027, "global_step": 194828, "epoch": 4638} {"train_loss": -7.211000919342041, "global_step": 194829, "epoch": 4638} {"train_loss": -7.284031867980957, "global_step": 194830, "epoch": 4638} {"train_loss": -7.256473064422607, "global_step": 194831, "epoch": 4638} {"train_loss": -7.260187149047852, "global_step": 194832, "epoch": 4638} {"train_loss": -7.248197555541992, "global_step": 194833, "epoch": 4638} {"train_loss": -7.335783958435059, "global_step": 194834, "epoch": 4638} {"train_loss": -7.228086471557617, "global_step": 194835, "epoch": 4638} {"train_loss": -7.309211730957031, "global_step": 194836, "epoch": 4638} {"train_loss": -7.19647410937718, "global_step": 194837, "epoch": 4638, "val_loss": 69639.859375} {"train_loss": -7.347618103027344, "global_step": 194838, "epoch": 4639} {"train_loss": -7.331399917602539, "global_step": 194839, "epoch": 4639} {"train_loss": -7.34332275390625, "global_step": 194840, "epoch": 4639} {"train_loss": -7.326920509338379, "global_step": 194841, "epoch": 4639} {"train_loss": -7.361719608306885, "global_step": 194842, "epoch": 4639} {"train_loss": -7.239109992980957, "global_step": 194843, "epoch": 4639} {"train_loss": -7.31882381439209, "global_step": 194844, "epoch": 4639} {"train_loss": -7.3333892822265625, "global_step": 194845, "epoch": 4639} {"train_loss": -7.3622727394104, "global_step": 194846, "epoch": 4639} {"train_loss": -7.325052261352539, "global_step": 194847, "epoch": 4639} {"train_loss": -7.30186128616333, "global_step": 194848, "epoch": 4639} {"train_loss": -7.314317226409912, "global_step": 194849, "epoch": 4639} {"train_loss": -7.289307594299316, "global_step": 194850, "epoch": 4639} {"train_loss": -7.410122394561768, "global_step": 194851, "epoch": 4639} {"train_loss": -7.21549129486084, "global_step": 194852, "epoch": 4639} {"train_loss": -7.134153842926025, "global_step": 194853, "epoch": 4639} {"train_loss": -7.130927562713623, "global_step": 194854, "epoch": 4639} {"train_loss": -7.294859886169434, "global_step": 194855, "epoch": 4639} {"train_loss": -7.122698783874512, "global_step": 194856, "epoch": 4639} {"train_loss": -7.137237548828125, "global_step": 194857, "epoch": 4639} {"train_loss": -7.197127342224121, "global_step": 194858, "epoch": 4639} {"train_loss": -7.139902114868164, "global_step": 194859, "epoch": 4639} {"train_loss": -7.02811336517334, "global_step": 194860, "epoch": 4639} {"train_loss": -7.1649274826049805, "global_step": 194861, "epoch": 4639} {"train_loss": -7.28781795501709, "global_step": 194862, "epoch": 4639} {"train_loss": -7.031764984130859, "global_step": 194863, "epoch": 4639} {"train_loss": -7.240849494934082, "global_step": 194864, "epoch": 4639} {"train_loss": -7.247241973876953, "global_step": 194865, "epoch": 4639} {"train_loss": -7.152017116546631, "global_step": 194866, "epoch": 4639} {"train_loss": -7.1072587966918945, "global_step": 194867, "epoch": 4639} {"train_loss": -6.957042694091797, "global_step": 194868, "epoch": 4639} {"train_loss": -7.152917385101318, "global_step": 194869, "epoch": 4639} {"train_loss": -7.023379325866699, "global_step": 194870, "epoch": 4639} {"train_loss": -7.033139228820801, "global_step": 194871, "epoch": 4639} {"train_loss": -7.166184425354004, "global_step": 194872, "epoch": 4639} {"train_loss": -7.159341812133789, "global_step": 194873, "epoch": 4639} {"train_loss": -7.188473224639893, "global_step": 194874, "epoch": 4639} {"train_loss": -7.195085048675537, "global_step": 194875, "epoch": 4639} {"train_loss": -7.197240352630615, "global_step": 194876, "epoch": 4639} {"train_loss": -7.104767799377441, "global_step": 194877, "epoch": 4639} {"train_loss": -7.170503616333008, "global_step": 194878, "epoch": 4639} {"train_loss": -7.210033825465611, "global_step": 194879, "epoch": 4639, "val_loss": 69875.46875} {"train_loss": -7.181857109069824, "global_step": 194880, "epoch": 4640} {"train_loss": -7.256497859954834, "global_step": 194881, "epoch": 4640} {"train_loss": -7.236778259277344, "global_step": 194882, "epoch": 4640} {"train_loss": -7.261621475219727, "global_step": 194883, "epoch": 4640} {"train_loss": -7.3473944664001465, "global_step": 194884, "epoch": 4640} {"train_loss": -7.183863162994385, "global_step": 194885, "epoch": 4640} {"train_loss": -7.244548797607422, "global_step": 194886, "epoch": 4640} {"train_loss": -7.201332092285156, "global_step": 194887, "epoch": 4640} {"train_loss": -7.185606002807617, "global_step": 194888, "epoch": 4640} {"train_loss": -7.354184150695801, "global_step": 194889, "epoch": 4640} {"train_loss": -7.139646530151367, "global_step": 194890, "epoch": 4640} {"train_loss": -7.152319431304932, "global_step": 194891, "epoch": 4640} {"train_loss": -6.890790939331055, "global_step": 194892, "epoch": 4640} {"train_loss": -7.1227240562438965, "global_step": 194893, "epoch": 4640} {"train_loss": -7.121546745300293, "global_step": 194894, "epoch": 4640} {"train_loss": -7.169732093811035, "global_step": 194895, "epoch": 4640} {"train_loss": -7.202008247375488, "global_step": 194896, "epoch": 4640} {"train_loss": -7.223621368408203, "global_step": 194897, "epoch": 4640} {"train_loss": -7.225294589996338, "global_step": 194898, "epoch": 4640} {"train_loss": -7.246769428253174, "global_step": 194899, "epoch": 4640} {"train_loss": -7.363673210144043, "global_step": 194900, "epoch": 4640} {"train_loss": -7.19738245010376, "global_step": 194901, "epoch": 4640} {"train_loss": -7.106771469116211, "global_step": 194902, "epoch": 4640} {"train_loss": -7.285533905029297, "global_step": 194903, "epoch": 4640} {"train_loss": -7.1009063720703125, "global_step": 194904, "epoch": 4640} {"train_loss": -7.299088001251221, "global_step": 194905, "epoch": 4640} {"train_loss": -7.249698638916016, "global_step": 194906, "epoch": 4640} {"train_loss": -7.192330360412598, "global_step": 194907, "epoch": 4640} {"train_loss": -7.209471702575684, "global_step": 194908, "epoch": 4640} {"train_loss": -7.20186185836792, "global_step": 194909, "epoch": 4640} {"train_loss": -7.186678886413574, "global_step": 194910, "epoch": 4640} {"train_loss": -7.198768615722656, "global_step": 194911, "epoch": 4640} {"train_loss": -7.256929397583008, "global_step": 194912, "epoch": 4640} {"train_loss": -7.216992378234863, "global_step": 194913, "epoch": 4640} {"train_loss": -7.081589698791504, "global_step": 194914, "epoch": 4640} {"train_loss": -7.14089298248291, "global_step": 194915, "epoch": 4640} {"train_loss": -7.281887054443359, "global_step": 194916, "epoch": 4640} {"train_loss": -7.275354862213135, "global_step": 194917, "epoch": 4640} {"train_loss": -7.187527656555176, "global_step": 194918, "epoch": 4640} {"train_loss": -7.27584981918335, "global_step": 194919, "epoch": 4640} {"train_loss": -7.044991493225098, "global_step": 194920, "epoch": 4640} {"train_loss": -7.203038590294974, "global_step": 194921, "epoch": 4640, "val_loss": 69872.3125} {"train_loss": -7.1643571853637695, "global_step": 194922, "epoch": 4641} {"train_loss": -7.005852699279785, "global_step": 194923, "epoch": 4641} {"train_loss": -7.191560745239258, "global_step": 194924, "epoch": 4641} {"train_loss": -7.134433746337891, "global_step": 194925, "epoch": 4641} {"train_loss": -7.0401129722595215, "global_step": 194926, "epoch": 4641} {"train_loss": -7.165422439575195, "global_step": 194927, "epoch": 4641} {"train_loss": -7.164156913757324, "global_step": 194928, "epoch": 4641} {"train_loss": -7.2012786865234375, "global_step": 194929, "epoch": 4641} {"train_loss": -7.041036128997803, "global_step": 194930, "epoch": 4641} {"train_loss": -7.145650863647461, "global_step": 194931, "epoch": 4641} {"train_loss": -7.197000026702881, "global_step": 194932, "epoch": 4641} {"train_loss": -7.081661224365234, "global_step": 194933, "epoch": 4641} {"train_loss": -7.2779622077941895, "global_step": 194934, "epoch": 4641} {"train_loss": -7.279470920562744, "global_step": 194935, "epoch": 4641} {"train_loss": -7.216738700866699, "global_step": 194936, "epoch": 4641} {"train_loss": -7.243957996368408, "global_step": 194937, "epoch": 4641} {"train_loss": -7.235284328460693, "global_step": 194938, "epoch": 4641} {"train_loss": -7.198520660400391, "global_step": 194939, "epoch": 4641} {"train_loss": -7.2661027908325195, "global_step": 194940, "epoch": 4641} {"train_loss": -7.198329448699951, "global_step": 194941, "epoch": 4641} {"train_loss": -7.280019760131836, "global_step": 194942, "epoch": 4641} {"train_loss": -7.26331901550293, "global_step": 194943, "epoch": 4641} {"train_loss": -7.237354755401611, "global_step": 194944, "epoch": 4641} {"train_loss": -7.254002571105957, "global_step": 194945, "epoch": 4641} {"train_loss": -7.299602508544922, "global_step": 194946, "epoch": 4641} {"train_loss": -7.277591228485107, "global_step": 194947, "epoch": 4641} {"train_loss": -7.229923248291016, "global_step": 194948, "epoch": 4641} {"train_loss": -7.215384006500244, "global_step": 194949, "epoch": 4641} {"train_loss": -7.2965593338012695, "global_step": 194950, "epoch": 4641} {"train_loss": -7.172511577606201, "global_step": 194951, "epoch": 4641} {"train_loss": -7.2087554931640625, "global_step": 194952, "epoch": 4641} {"train_loss": -7.292543888092041, "global_step": 194953, "epoch": 4641} {"train_loss": -7.2520365715026855, "global_step": 194954, "epoch": 4641} {"train_loss": -7.092891693115234, "global_step": 194955, "epoch": 4641} {"train_loss": -7.263430595397949, "global_step": 194956, "epoch": 4641} {"train_loss": -7.239797592163086, "global_step": 194957, "epoch": 4641} {"train_loss": -7.222536087036133, "global_step": 194958, "epoch": 4641} {"train_loss": -7.191018581390381, "global_step": 194959, "epoch": 4641} {"train_loss": -7.190365791320801, "global_step": 194960, "epoch": 4641} {"train_loss": -7.185577392578125, "global_step": 194961, "epoch": 4641} {"train_loss": -7.190710067749023, "global_step": 194962, "epoch": 4641} {"train_loss": -7.20243627684457, "global_step": 194963, "epoch": 4641, "val_loss": 70111.734375} {"train_loss": -6.995845794677734, "global_step": 194964, "epoch": 4642} {"train_loss": -7.0962934494018555, "global_step": 194965, "epoch": 4642} {"train_loss": -7.238703727722168, "global_step": 194966, "epoch": 4642} {"train_loss": -7.08865213394165, "global_step": 194967, "epoch": 4642} {"train_loss": -7.369235038757324, "global_step": 194968, "epoch": 4642} {"train_loss": -7.173576831817627, "global_step": 194969, "epoch": 4642} {"train_loss": -7.1145782470703125, "global_step": 194970, "epoch": 4642} {"train_loss": -7.153450012207031, "global_step": 194971, "epoch": 4642} {"train_loss": -7.057700157165527, "global_step": 194972, "epoch": 4642} {"train_loss": -7.163073539733887, "global_step": 194973, "epoch": 4642} {"train_loss": -7.065512657165527, "global_step": 194974, "epoch": 4642} {"train_loss": -7.1528167724609375, "global_step": 194975, "epoch": 4642} {"train_loss": -7.188370227813721, "global_step": 194976, "epoch": 4642} {"train_loss": -7.207129001617432, "global_step": 194977, "epoch": 4642} {"train_loss": -7.07989501953125, "global_step": 194978, "epoch": 4642} {"train_loss": -7.107320785522461, "global_step": 194979, "epoch": 4642} {"train_loss": -7.318172931671143, "global_step": 194980, "epoch": 4642} {"train_loss": -7.258479118347168, "global_step": 194981, "epoch": 4642} {"train_loss": -7.308380603790283, "global_step": 194982, "epoch": 4642} {"train_loss": -7.1600446701049805, "global_step": 194983, "epoch": 4642} {"train_loss": -7.3289594650268555, "global_step": 194984, "epoch": 4642} {"train_loss": -7.156156539916992, "global_step": 194985, "epoch": 4642} {"train_loss": -7.245138168334961, "global_step": 194986, "epoch": 4642} {"train_loss": -7.218900203704834, "global_step": 194987, "epoch": 4642} {"train_loss": -7.215282917022705, "global_step": 194988, "epoch": 4642} {"train_loss": -7.275732040405273, "global_step": 194989, "epoch": 4642} {"train_loss": -7.2628679275512695, "global_step": 194990, "epoch": 4642} {"train_loss": -7.180597305297852, "global_step": 194991, "epoch": 4642} {"train_loss": -7.322776794433594, "global_step": 194992, "epoch": 4642} {"train_loss": -7.198399543762207, "global_step": 194993, "epoch": 4642} {"train_loss": -7.239335060119629, "global_step": 194994, "epoch": 4642} {"train_loss": -7.116469383239746, "global_step": 194995, "epoch": 4642} {"train_loss": -7.202476501464844, "global_step": 194996, "epoch": 4642} {"train_loss": -7.178271293640137, "global_step": 194997, "epoch": 4642} {"train_loss": -7.195008277893066, "global_step": 194998, "epoch": 4642} {"train_loss": -7.291654586791992, "global_step": 194999, "epoch": 4642} {"train_loss": -7.292580604553223, "global_step": 195000, "epoch": 4642} {"train_loss": -7.257272720336914, "global_step": 195001, "epoch": 4642} {"train_loss": -7.34573221206665, "global_step": 195002, "epoch": 4642} {"train_loss": -7.246061325073242, "global_step": 195003, "epoch": 4642} {"train_loss": -7.226252555847168, "global_step": 195004, "epoch": 4642} {"train_loss": -7.204223553339641, "global_step": 195005, "epoch": 4642, "val_loss": 69822.3671875} {"train_loss": -7.196681976318359, "global_step": 195006, "epoch": 4643} {"train_loss": -7.251256465911865, "global_step": 195007, "epoch": 4643} {"train_loss": -7.208650588989258, "global_step": 195008, "epoch": 4643} {"train_loss": -7.266563415527344, "global_step": 195009, "epoch": 4643} {"train_loss": -7.297203540802002, "global_step": 195010, "epoch": 4643} {"train_loss": -7.18085241317749, "global_step": 195011, "epoch": 4643} {"train_loss": -7.311123371124268, "global_step": 195012, "epoch": 4643} {"train_loss": -7.256204605102539, "global_step": 195013, "epoch": 4643} {"train_loss": -7.338770389556885, "global_step": 195014, "epoch": 4643} {"train_loss": -7.253623008728027, "global_step": 195015, "epoch": 4643} {"train_loss": -7.181943893432617, "global_step": 195016, "epoch": 4643} {"train_loss": -7.1974897384643555, "global_step": 195017, "epoch": 4643} {"train_loss": -7.080512046813965, "global_step": 195018, "epoch": 4643} {"train_loss": -7.259462356567383, "global_step": 195019, "epoch": 4643} {"train_loss": -7.316320419311523, "global_step": 195020, "epoch": 4643} {"train_loss": -7.0432939529418945, "global_step": 195021, "epoch": 4643} {"train_loss": -7.285149097442627, "global_step": 195022, "epoch": 4643} {"train_loss": -7.020633220672607, "global_step": 195023, "epoch": 4643} {"train_loss": -7.054401397705078, "global_step": 195024, "epoch": 4643} {"train_loss": -7.154634475708008, "global_step": 195025, "epoch": 4643} {"train_loss": -7.040205955505371, "global_step": 195026, "epoch": 4643} {"train_loss": -7.127688884735107, "global_step": 195027, "epoch": 4643} {"train_loss": -7.228323936462402, "global_step": 195028, "epoch": 4643} {"train_loss": -7.050135612487793, "global_step": 195029, "epoch": 4643} {"train_loss": -7.1359333992004395, "global_step": 195030, "epoch": 4643} {"train_loss": -7.1945037841796875, "global_step": 195031, "epoch": 4643} {"train_loss": -7.200992584228516, "global_step": 195032, "epoch": 4643} {"train_loss": -7.226985931396484, "global_step": 195033, "epoch": 4643} {"train_loss": -7.1627678871154785, "global_step": 195034, "epoch": 4643} {"train_loss": -7.176319122314453, "global_step": 195035, "epoch": 4643} {"train_loss": -7.206026554107666, "global_step": 195036, "epoch": 4643} {"train_loss": -7.234312057495117, "global_step": 195037, "epoch": 4643} {"train_loss": -7.15622615814209, "global_step": 195038, "epoch": 4643} {"train_loss": -7.287349700927734, "global_step": 195039, "epoch": 4643} {"train_loss": -7.27118444442749, "global_step": 195040, "epoch": 4643} {"train_loss": -7.213367462158203, "global_step": 195041, "epoch": 4643} {"train_loss": -7.207026481628418, "global_step": 195042, "epoch": 4643} {"train_loss": -7.32245397567749, "global_step": 195043, "epoch": 4643} {"train_loss": -7.218360424041748, "global_step": 195044, "epoch": 4643} {"train_loss": -7.13293981552124, "global_step": 195045, "epoch": 4643} {"train_loss": -7.307226657867432, "global_step": 195046, "epoch": 4643} {"train_loss": -7.203044891357422, "global_step": 195047, "epoch": 4643, "val_loss": 69774.5859375} {"train_loss": -7.125128269195557, "global_step": 195048, "epoch": 4644} {"train_loss": -7.205655574798584, "global_step": 195049, "epoch": 4644} {"train_loss": -7.22096061706543, "global_step": 195050, "epoch": 4644} {"train_loss": -7.358349800109863, "global_step": 195051, "epoch": 4644} {"train_loss": -7.246519565582275, "global_step": 195052, "epoch": 4644} {"train_loss": -7.311592102050781, "global_step": 195053, "epoch": 4644} {"train_loss": -7.347139358520508, "global_step": 195054, "epoch": 4644} {"train_loss": -7.148768424987793, "global_step": 195055, "epoch": 4644} {"train_loss": -7.2463555335998535, "global_step": 195056, "epoch": 4644} {"train_loss": -7.327996253967285, "global_step": 195057, "epoch": 4644} {"train_loss": -7.304208278656006, "global_step": 195058, "epoch": 4644} {"train_loss": -7.208484649658203, "global_step": 195059, "epoch": 4644} {"train_loss": -7.3529276847839355, "global_step": 195060, "epoch": 4644} {"train_loss": -7.265851974487305, "global_step": 195061, "epoch": 4644} {"train_loss": -7.195240020751953, "global_step": 195062, "epoch": 4644} {"train_loss": -7.161044597625732, "global_step": 195063, "epoch": 4644} {"train_loss": -7.098140716552734, "global_step": 195064, "epoch": 4644} {"train_loss": -7.246925354003906, "global_step": 195065, "epoch": 4644} {"train_loss": -7.167844772338867, "global_step": 195066, "epoch": 4644} {"train_loss": -7.348236083984375, "global_step": 195067, "epoch": 4644} {"train_loss": -7.197835922241211, "global_step": 195068, "epoch": 4644} {"train_loss": -7.273004055023193, "global_step": 195069, "epoch": 4644} {"train_loss": -7.272377967834473, "global_step": 195070, "epoch": 4644} {"train_loss": -7.1580281257629395, "global_step": 195071, "epoch": 4644} {"train_loss": -7.269674301147461, "global_step": 195072, "epoch": 4644} {"train_loss": -7.31402587890625, "global_step": 195073, "epoch": 4644} {"train_loss": -7.273134231567383, "global_step": 195074, "epoch": 4644} {"train_loss": -7.285647392272949, "global_step": 195075, "epoch": 4644} {"train_loss": -7.122530937194824, "global_step": 195076, "epoch": 4644} {"train_loss": -7.224697113037109, "global_step": 195077, "epoch": 4644} {"train_loss": -7.220004081726074, "global_step": 195078, "epoch": 4644} {"train_loss": -7.330930709838867, "global_step": 195079, "epoch": 4644} {"train_loss": -7.239877700805664, "global_step": 195080, "epoch": 4644} {"train_loss": -7.2305755615234375, "global_step": 195081, "epoch": 4644} {"train_loss": -7.118653297424316, "global_step": 195082, "epoch": 4644} {"train_loss": -7.244210243225098, "global_step": 195083, "epoch": 4644} {"train_loss": -7.2177863121032715, "global_step": 195084, "epoch": 4644} {"train_loss": -7.197961330413818, "global_step": 195085, "epoch": 4644} {"train_loss": -7.241357803344727, "global_step": 195086, "epoch": 4644} {"train_loss": -7.260713577270508, "global_step": 195087, "epoch": 4644} {"train_loss": -7.241364002227783, "global_step": 195088, "epoch": 4644} {"train_loss": -7.241444599060785, "global_step": 195089, "epoch": 4644, "val_loss": 69871.4609375} {"train_loss": -7.248964786529541, "global_step": 195090, "epoch": 4645} {"train_loss": -7.277441024780273, "global_step": 195091, "epoch": 4645} {"train_loss": -7.083745956420898, "global_step": 195092, "epoch": 4645} {"train_loss": -7.268163681030273, "global_step": 195093, "epoch": 4645} {"train_loss": -7.176054000854492, "global_step": 195094, "epoch": 4645} {"train_loss": -7.202342987060547, "global_step": 195095, "epoch": 4645} {"train_loss": -7.277475833892822, "global_step": 195096, "epoch": 4645} {"train_loss": -7.086010456085205, "global_step": 195097, "epoch": 4645} {"train_loss": -7.20587158203125, "global_step": 195098, "epoch": 4645} {"train_loss": -7.259325981140137, "global_step": 195099, "epoch": 4645} {"train_loss": -7.31540584564209, "global_step": 195100, "epoch": 4645} {"train_loss": -7.232757568359375, "global_step": 195101, "epoch": 4645} {"train_loss": -7.272871971130371, "global_step": 195102, "epoch": 4645} {"train_loss": -7.250868797302246, "global_step": 195103, "epoch": 4645} {"train_loss": -7.168047904968262, "global_step": 195104, "epoch": 4645} {"train_loss": -7.163632392883301, "global_step": 195105, "epoch": 4645} {"train_loss": -7.214017868041992, "global_step": 195106, "epoch": 4645} {"train_loss": -7.167158126831055, "global_step": 195107, "epoch": 4645} {"train_loss": -7.1605939865112305, "global_step": 195108, "epoch": 4645} {"train_loss": -7.17824649810791, "global_step": 195109, "epoch": 4645} {"train_loss": -7.205568790435791, "global_step": 195110, "epoch": 4645} {"train_loss": -7.217573642730713, "global_step": 195111, "epoch": 4645} {"train_loss": -7.195626735687256, "global_step": 195112, "epoch": 4645} {"train_loss": -7.202959060668945, "global_step": 195113, "epoch": 4645} {"train_loss": -7.322138786315918, "global_step": 195114, "epoch": 4645} {"train_loss": -7.292211532592773, "global_step": 195115, "epoch": 4645} {"train_loss": -7.215239524841309, "global_step": 195116, "epoch": 4645} {"train_loss": -7.293210029602051, "global_step": 195117, "epoch": 4645} {"train_loss": -7.304896354675293, "global_step": 195118, "epoch": 4645} {"train_loss": -7.279499053955078, "global_step": 195119, "epoch": 4645} {"train_loss": -7.247220516204834, "global_step": 195120, "epoch": 4645} {"train_loss": -7.2128143310546875, "global_step": 195121, "epoch": 4645} {"train_loss": -7.306254863739014, "global_step": 195122, "epoch": 4645} {"train_loss": -7.173586368560791, "global_step": 195123, "epoch": 4645} {"train_loss": -7.261305332183838, "global_step": 195124, "epoch": 4645} {"train_loss": -7.1762285232543945, "global_step": 195125, "epoch": 4645} {"train_loss": -7.283625602722168, "global_step": 195126, "epoch": 4645} {"train_loss": -7.2570648193359375, "global_step": 195127, "epoch": 4645} {"train_loss": -7.153073310852051, "global_step": 195128, "epoch": 4645} {"train_loss": -7.26176643371582, "global_step": 195129, "epoch": 4645} {"train_loss": -7.1939544677734375, "global_step": 195130, "epoch": 4645} {"train_loss": -7.226467064448765, "global_step": 195131, "epoch": 4645, "val_loss": 69661.328125} {"train_loss": -7.191486835479736, "global_step": 195132, "epoch": 4646} {"train_loss": -7.171501159667969, "global_step": 195133, "epoch": 4646} {"train_loss": -7.0667195320129395, "global_step": 195134, "epoch": 4646} {"train_loss": -7.330113410949707, "global_step": 195135, "epoch": 4646} {"train_loss": -7.085844039916992, "global_step": 195136, "epoch": 4646} {"train_loss": -7.161439418792725, "global_step": 195137, "epoch": 4646} {"train_loss": -7.2801289558410645, "global_step": 195138, "epoch": 4646} {"train_loss": -7.119503974914551, "global_step": 195139, "epoch": 4646} {"train_loss": -7.250795364379883, "global_step": 195140, "epoch": 4646} {"train_loss": -7.140076160430908, "global_step": 195141, "epoch": 4646} {"train_loss": -7.108667373657227, "global_step": 195142, "epoch": 4646} {"train_loss": -7.1599273681640625, "global_step": 195143, "epoch": 4646} {"train_loss": -7.173472881317139, "global_step": 195144, "epoch": 4646} {"train_loss": -7.065042018890381, "global_step": 195145, "epoch": 4646} {"train_loss": -7.206070899963379, "global_step": 195146, "epoch": 4646} {"train_loss": -7.174065589904785, "global_step": 195147, "epoch": 4646} {"train_loss": -7.180950164794922, "global_step": 195148, "epoch": 4646} {"train_loss": -7.211396217346191, "global_step": 195149, "epoch": 4646} {"train_loss": -7.218744277954102, "global_step": 195150, "epoch": 4646} {"train_loss": -7.234752655029297, "global_step": 195151, "epoch": 4646} {"train_loss": -7.365083694458008, "global_step": 195152, "epoch": 4646} {"train_loss": -7.250026702880859, "global_step": 195153, "epoch": 4646} {"train_loss": -7.132029056549072, "global_step": 195154, "epoch": 4646} {"train_loss": -7.239352226257324, "global_step": 195155, "epoch": 4646} {"train_loss": -7.290836811065674, "global_step": 195156, "epoch": 4646} {"train_loss": -7.153933525085449, "global_step": 195157, "epoch": 4646} {"train_loss": -7.138533115386963, "global_step": 195158, "epoch": 4646} {"train_loss": -7.305951118469238, "global_step": 195159, "epoch": 4646} {"train_loss": -7.193161964416504, "global_step": 195160, "epoch": 4646} {"train_loss": -7.346496105194092, "global_step": 195161, "epoch": 4646} {"train_loss": -7.344586372375488, "global_step": 195162, "epoch": 4646} {"train_loss": -7.301704406738281, "global_step": 195163, "epoch": 4646} {"train_loss": -7.2785234451293945, "global_step": 195164, "epoch": 4646} {"train_loss": -7.339966773986816, "global_step": 195165, "epoch": 4646} {"train_loss": -7.199162483215332, "global_step": 195166, "epoch": 4646} {"train_loss": -7.248061656951904, "global_step": 195167, "epoch": 4646} {"train_loss": -7.272278308868408, "global_step": 195168, "epoch": 4646} {"train_loss": -7.240082740783691, "global_step": 195169, "epoch": 4646} {"train_loss": -7.183740615844727, "global_step": 195170, "epoch": 4646} {"train_loss": -7.174820899963379, "global_step": 195171, "epoch": 4646} {"train_loss": -7.382701873779297, "global_step": 195172, "epoch": 4646} {"train_loss": -7.215769801821027, "global_step": 195173, "epoch": 4646, "val_loss": 69789.34375} {"train_loss": -7.216329574584961, "global_step": 195174, "epoch": 4647} {"train_loss": -7.356756687164307, "global_step": 195175, "epoch": 4647} {"train_loss": -7.233785629272461, "global_step": 195176, "epoch": 4647} {"train_loss": -7.156441688537598, "global_step": 195177, "epoch": 4647} {"train_loss": -7.207969665527344, "global_step": 195178, "epoch": 4647} {"train_loss": -7.249759674072266, "global_step": 195179, "epoch": 4647} {"train_loss": -7.131004810333252, "global_step": 195180, "epoch": 4647} {"train_loss": -7.277577877044678, "global_step": 195181, "epoch": 4647} {"train_loss": -7.070992946624756, "global_step": 195182, "epoch": 4647} {"train_loss": -7.178188323974609, "global_step": 195183, "epoch": 4647} {"train_loss": -7.214486598968506, "global_step": 195184, "epoch": 4647} {"train_loss": -7.166111946105957, "global_step": 195185, "epoch": 4647} {"train_loss": -7.195448875427246, "global_step": 195186, "epoch": 4647} {"train_loss": -7.266814231872559, "global_step": 195187, "epoch": 4647} {"train_loss": -7.214216232299805, "global_step": 195188, "epoch": 4647} {"train_loss": -7.295276641845703, "global_step": 195189, "epoch": 4647} {"train_loss": -7.167968273162842, "global_step": 195190, "epoch": 4647} {"train_loss": -7.16105842590332, "global_step": 195191, "epoch": 4647} {"train_loss": -7.28204345703125, "global_step": 195192, "epoch": 4647} {"train_loss": -7.346288204193115, "global_step": 195193, "epoch": 4647} {"train_loss": -7.18997859954834, "global_step": 195194, "epoch": 4647} {"train_loss": -7.148481369018555, "global_step": 195195, "epoch": 4647} {"train_loss": -7.239359378814697, "global_step": 195196, "epoch": 4647} {"train_loss": -7.311183452606201, "global_step": 195197, "epoch": 4647} {"train_loss": -7.254172325134277, "global_step": 195198, "epoch": 4647} {"train_loss": -7.245767593383789, "global_step": 195199, "epoch": 4647} {"train_loss": -7.364415168762207, "global_step": 195200, "epoch": 4647} {"train_loss": -7.223165512084961, "global_step": 195201, "epoch": 4647} {"train_loss": -7.269294738769531, "global_step": 195202, "epoch": 4647} {"train_loss": -7.3386688232421875, "global_step": 195203, "epoch": 4647} {"train_loss": -7.234127998352051, "global_step": 195204, "epoch": 4647} {"train_loss": -7.278992652893066, "global_step": 195205, "epoch": 4647} {"train_loss": -7.156403064727783, "global_step": 195206, "epoch": 4647} {"train_loss": -7.198855400085449, "global_step": 195207, "epoch": 4647} {"train_loss": -7.338631629943848, "global_step": 195208, "epoch": 4647} {"train_loss": -7.185258388519287, "global_step": 195209, "epoch": 4647} {"train_loss": -7.201533317565918, "global_step": 195210, "epoch": 4647} {"train_loss": -7.092198371887207, "global_step": 195211, "epoch": 4647} {"train_loss": -7.175630569458008, "global_step": 195212, "epoch": 4647} {"train_loss": -7.008113861083984, "global_step": 195213, "epoch": 4647} {"train_loss": -7.122817516326904, "global_step": 195214, "epoch": 4647} {"train_loss": -7.221219153631301, "global_step": 195215, "epoch": 4647, "val_loss": 69798.671875} {"train_loss": -7.137465476989746, "global_step": 195216, "epoch": 4648} {"train_loss": -7.168546676635742, "global_step": 195217, "epoch": 4648} {"train_loss": -7.158619403839111, "global_step": 195218, "epoch": 4648} {"train_loss": -6.848917007446289, "global_step": 195219, "epoch": 4648} {"train_loss": -7.110978603363037, "global_step": 195220, "epoch": 4648} {"train_loss": -7.0663042068481445, "global_step": 195221, "epoch": 4648} {"train_loss": -7.325994491577148, "global_step": 195222, "epoch": 4648} {"train_loss": -7.163389205932617, "global_step": 195223, "epoch": 4648} {"train_loss": -7.078827857971191, "global_step": 195224, "epoch": 4648} {"train_loss": -7.193078517913818, "global_step": 195225, "epoch": 4648} {"train_loss": -7.118098258972168, "global_step": 195226, "epoch": 4648} {"train_loss": -7.270105838775635, "global_step": 195227, "epoch": 4648} {"train_loss": -7.12767219543457, "global_step": 195228, "epoch": 4648} {"train_loss": -7.225679397583008, "global_step": 195229, "epoch": 4648} {"train_loss": -7.1888580322265625, "global_step": 195230, "epoch": 4648} {"train_loss": -7.275649070739746, "global_step": 195231, "epoch": 4648} {"train_loss": -7.274876594543457, "global_step": 195232, "epoch": 4648} {"train_loss": -7.199652671813965, "global_step": 195233, "epoch": 4648} {"train_loss": -7.2279438972473145, "global_step": 195234, "epoch": 4648} {"train_loss": -7.152823448181152, "global_step": 195235, "epoch": 4648} {"train_loss": -7.13628625869751, "global_step": 195236, "epoch": 4648} {"train_loss": -7.283377170562744, "global_step": 195237, "epoch": 4648} {"train_loss": -7.202340126037598, "global_step": 195238, "epoch": 4648} {"train_loss": -7.240412712097168, "global_step": 195239, "epoch": 4648} {"train_loss": -7.202003002166748, "global_step": 195240, "epoch": 4648} {"train_loss": -7.288467884063721, "global_step": 195241, "epoch": 4648} {"train_loss": -7.277778148651123, "global_step": 195242, "epoch": 4648} {"train_loss": -7.344943046569824, "global_step": 195243, "epoch": 4648} {"train_loss": -7.34354829788208, "global_step": 195244, "epoch": 4648} {"train_loss": -7.319108009338379, "global_step": 195245, "epoch": 4648} {"train_loss": -7.236870288848877, "global_step": 195246, "epoch": 4648} {"train_loss": -7.271136283874512, "global_step": 195247, "epoch": 4648} {"train_loss": -7.179168701171875, "global_step": 195248, "epoch": 4648} {"train_loss": -7.327078819274902, "global_step": 195249, "epoch": 4648} {"train_loss": -7.239719390869141, "global_step": 195250, "epoch": 4648} {"train_loss": -7.293394565582275, "global_step": 195251, "epoch": 4648} {"train_loss": -7.2062177658081055, "global_step": 195252, "epoch": 4648} {"train_loss": -7.191961288452148, "global_step": 195253, "epoch": 4648} {"train_loss": -7.266776084899902, "global_step": 195254, "epoch": 4648} {"train_loss": -7.099966526031494, "global_step": 195255, "epoch": 4648} {"train_loss": -7.2914323806762695, "global_step": 195256, "epoch": 4648} {"train_loss": -7.2106199605124335, "global_step": 195257, "epoch": 4648, "val_loss": 69845.2421875} {"train_loss": -7.103398323059082, "global_step": 195258, "epoch": 4649} {"train_loss": -7.103182315826416, "global_step": 195259, "epoch": 4649} {"train_loss": -7.105330467224121, "global_step": 195260, "epoch": 4649} {"train_loss": -7.281944751739502, "global_step": 195261, "epoch": 4649} {"train_loss": -7.291736125946045, "global_step": 195262, "epoch": 4649} {"train_loss": -7.189953804016113, "global_step": 195263, "epoch": 4649} {"train_loss": -7.204782962799072, "global_step": 195264, "epoch": 4649} {"train_loss": -7.294817924499512, "global_step": 195265, "epoch": 4649} {"train_loss": -7.171420097351074, "global_step": 195266, "epoch": 4649} {"train_loss": -7.245635032653809, "global_step": 195267, "epoch": 4649} {"train_loss": -7.130048751831055, "global_step": 195268, "epoch": 4649} {"train_loss": -7.355854511260986, "global_step": 195269, "epoch": 4649} {"train_loss": -7.260662078857422, "global_step": 195270, "epoch": 4649} {"train_loss": -7.280101776123047, "global_step": 195271, "epoch": 4649} {"train_loss": -7.245761871337891, "global_step": 195272, "epoch": 4649} {"train_loss": -7.344631195068359, "global_step": 195273, "epoch": 4649} {"train_loss": -7.258608341217041, "global_step": 195274, "epoch": 4649} {"train_loss": -7.247533798217773, "global_step": 195275, "epoch": 4649} {"train_loss": -7.2823615074157715, "global_step": 195276, "epoch": 4649} {"train_loss": -7.182744979858398, "global_step": 195277, "epoch": 4649} {"train_loss": -7.15774393081665, "global_step": 195278, "epoch": 4649} {"train_loss": -7.324716567993164, "global_step": 195279, "epoch": 4649} {"train_loss": -7.321725368499756, "global_step": 195280, "epoch": 4649} {"train_loss": -7.3405961990356445, "global_step": 195281, "epoch": 4649} {"train_loss": -7.1974687576293945, "global_step": 195282, "epoch": 4649} {"train_loss": -7.2766828536987305, "global_step": 195283, "epoch": 4649} {"train_loss": -7.312952518463135, "global_step": 195284, "epoch": 4649} {"train_loss": -7.330511093139648, "global_step": 195285, "epoch": 4649} {"train_loss": -7.268725395202637, "global_step": 195286, "epoch": 4649} {"train_loss": -7.2397565841674805, "global_step": 195287, "epoch": 4649} {"train_loss": -7.281257152557373, "global_step": 195288, "epoch": 4649} {"train_loss": -7.319725036621094, "global_step": 195289, "epoch": 4649} {"train_loss": -7.246252059936523, "global_step": 195290, "epoch": 4649} {"train_loss": -7.2143731117248535, "global_step": 195291, "epoch": 4649} {"train_loss": -7.422821521759033, "global_step": 195292, "epoch": 4649} {"train_loss": -7.335862159729004, "global_step": 195293, "epoch": 4649} {"train_loss": -7.336756706237793, "global_step": 195294, "epoch": 4649} {"train_loss": -7.2692551612854, "global_step": 195295, "epoch": 4649} {"train_loss": -7.290034294128418, "global_step": 195296, "epoch": 4649} {"train_loss": -7.228203773498535, "global_step": 195297, "epoch": 4649} {"train_loss": -7.289635181427002, "global_step": 195298, "epoch": 4649} {"train_loss": -7.2594063849676225, "global_step": 195299, "epoch": 4649, "val_loss": 69723.3984375} {"train_loss": -7.290155410766602, "global_step": 195300, "epoch": 4650} {"train_loss": -7.372015953063965, "global_step": 195301, "epoch": 4650} {"train_loss": -7.283697605133057, "global_step": 195302, "epoch": 4650} {"train_loss": -7.240771293640137, "global_step": 195303, "epoch": 4650} {"train_loss": -7.368927955627441, "global_step": 195304, "epoch": 4650} {"train_loss": -7.169051170349121, "global_step": 195305, "epoch": 4650} {"train_loss": -7.208890438079834, "global_step": 195306, "epoch": 4650} {"train_loss": -7.301860809326172, "global_step": 195307, "epoch": 4650} {"train_loss": -7.324472904205322, "global_step": 195308, "epoch": 4650} {"train_loss": -7.313044548034668, "global_step": 195309, "epoch": 4650} {"train_loss": -7.224709987640381, "global_step": 195310, "epoch": 4650} {"train_loss": -7.2971954345703125, "global_step": 195311, "epoch": 4650} {"train_loss": -7.110570907592773, "global_step": 195312, "epoch": 4650} {"train_loss": -7.166582107543945, "global_step": 195313, "epoch": 4650} {"train_loss": -7.24883508682251, "global_step": 195314, "epoch": 4650} {"train_loss": -7.171985149383545, "global_step": 195315, "epoch": 4650} {"train_loss": -6.9917755126953125, "global_step": 195316, "epoch": 4650} {"train_loss": -7.1578779220581055, "global_step": 195317, "epoch": 4650} {"train_loss": -7.104208946228027, "global_step": 195318, "epoch": 4650} {"train_loss": -7.055070877075195, "global_step": 195319, "epoch": 4650} {"train_loss": -7.22025203704834, "global_step": 195320, "epoch": 4650} {"train_loss": -7.078041076660156, "global_step": 195321, "epoch": 4650} {"train_loss": -7.204534530639648, "global_step": 195322, "epoch": 4650} {"train_loss": -7.329948425292969, "global_step": 195323, "epoch": 4650} {"train_loss": -7.213107585906982, "global_step": 195324, "epoch": 4650} {"train_loss": -7.129483222961426, "global_step": 195325, "epoch": 4650} {"train_loss": -7.1653313636779785, "global_step": 195326, "epoch": 4650} {"train_loss": -7.1988420486450195, "global_step": 195327, "epoch": 4650} {"train_loss": -7.0503997802734375, "global_step": 195328, "epoch": 4650} {"train_loss": -7.321018218994141, "global_step": 195329, "epoch": 4650} {"train_loss": -7.147622108459473, "global_step": 195330, "epoch": 4650} {"train_loss": -7.092676162719727, "global_step": 195331, "epoch": 4650} {"train_loss": -7.262869358062744, "global_step": 195332, "epoch": 4650} {"train_loss": -7.02805233001709, "global_step": 195333, "epoch": 4650} {"train_loss": -7.032793998718262, "global_step": 195334, "epoch": 4650} {"train_loss": -7.119419097900391, "global_step": 195335, "epoch": 4650} {"train_loss": -7.065274238586426, "global_step": 195336, "epoch": 4650} {"train_loss": -7.256307125091553, "global_step": 195337, "epoch": 4650} {"train_loss": -7.071371078491211, "global_step": 195338, "epoch": 4650} {"train_loss": -7.250876426696777, "global_step": 195339, "epoch": 4650} {"train_loss": -7.164633274078369, "global_step": 195340, "epoch": 4650} {"train_loss": -7.182165202640352, "global_step": 195341, "epoch": 4650, "train/sim_max_reward_0": 0.3716206996901576, "train/sim_max_reward_1": 0.7366238698950381, "train/sim_max_reward_2": 0.5227394925904445, "train/sim_max_reward_3": 0.7861899615990409, "train/sim_max_reward_4": 0.9701494780930346, "train/sim_max_reward_5": 0.9109119784728699, "test/sim_max_reward_4300000": 0.8896410102294177, "test/sim_max_reward_4300001": 0.5291993982518378, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8798048303768721, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9724063739882871, "test/sim_max_reward_4300008": 0.8699872746352849, "test/sim_max_reward_4300009": 0.991875969832671, "test/sim_max_reward_4300010": 1.0, "test/sim_max_reward_4300011": 0.9101775916721948, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.4018254098502948, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9737071224775113, "test/sim_max_reward_4300016": 0.89099069521473, "test/sim_max_reward_4300017": 0.7042463943972839, "test/sim_max_reward_4300018": 0.9885091469885963, "test/sim_max_reward_4300019": 0.18608112305942334, "test/sim_max_reward_4300020": 0.9738320220835636, "test/sim_max_reward_4300021": 0.9606601511991544, "test/sim_max_reward_4300022": 1.0, "test/sim_max_reward_4300023": 0.9653099943008504, "test/sim_max_reward_4300024": 0.9782372622242721, "test/sim_max_reward_4300025": 1.0, "test/sim_max_reward_4300026": 0.17904422774226075, "test/sim_max_reward_4300027": 0.960062463909248, "test/sim_max_reward_4300028": 0.6801970550173786, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.2231428252183367, "test/sim_max_reward_4300031": 0.5351005110804636, "test/sim_max_reward_4300032": 0.9953779207672169, "test/sim_max_reward_4300033": 0.7065566151959713, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.10469514034259704, "test/sim_max_reward_4300036": 0.21437962415662817, "test/sim_max_reward_4300037": 1.0, "test/sim_max_reward_4300038": 0.9174180277404929, "test/sim_max_reward_4300039": 0.7561584119466831, "test/sim_max_reward_4300040": 0.7723634388650266, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.8995807820569274, "test/sim_max_reward_4300043": 0.16351205577482641, "test/sim_max_reward_4300044": 0.12003727957611782, "test/sim_max_reward_4300045": 1.0, "test/sim_max_reward_4300046": 0.9169314026925517, "test/sim_max_reward_4300047": 0.15478581705649502, "test/sim_max_reward_4300048": 0.0001821436005404843, "test/sim_max_reward_4300049": 0.21216651539276948, "train/mean_score": 0.7163725800567642, "test/mean_score": 0.6518803626744811, "val_loss": 69761.5234375} {"train_loss": -7.145790100097656, "global_step": 195342, "epoch": 4651} {"train_loss": -7.113431453704834, "global_step": 195343, "epoch": 4651} {"train_loss": -7.002233028411865, "global_step": 195344, "epoch": 4651} {"train_loss": -7.131548881530762, "global_step": 195345, "epoch": 4651} {"train_loss": -7.151702880859375, "global_step": 195346, "epoch": 4651} {"train_loss": -7.1131367683410645, "global_step": 195347, "epoch": 4651} {"train_loss": -7.164150238037109, "global_step": 195348, "epoch": 4651} {"train_loss": -7.152187347412109, "global_step": 195349, "epoch": 4651} {"train_loss": -7.0925679206848145, "global_step": 195350, "epoch": 4651} {"train_loss": -7.058938503265381, "global_step": 195351, "epoch": 4651} {"train_loss": -7.173272609710693, "global_step": 195352, "epoch": 4651} {"train_loss": -7.113550186157227, "global_step": 195353, "epoch": 4651} {"train_loss": -7.120997428894043, "global_step": 195354, "epoch": 4651} {"train_loss": -6.981776237487793, "global_step": 195355, "epoch": 4651} {"train_loss": -7.260095596313477, "global_step": 195356, "epoch": 4651} {"train_loss": -7.183812618255615, "global_step": 195357, "epoch": 4651} {"train_loss": -7.306832313537598, "global_step": 195358, "epoch": 4651} {"train_loss": -7.127008438110352, "global_step": 195359, "epoch": 4651} {"train_loss": -7.118391513824463, "global_step": 195360, "epoch": 4651} {"train_loss": -7.218020439147949, "global_step": 195361, "epoch": 4651} {"train_loss": -7.241544723510742, "global_step": 195362, "epoch": 4651} {"train_loss": -7.217415809631348, "global_step": 195363, "epoch": 4651} {"train_loss": -7.171141624450684, "global_step": 195364, "epoch": 4651} {"train_loss": -7.174996852874756, "global_step": 195365, "epoch": 4651} {"train_loss": -7.234108924865723, "global_step": 195366, "epoch": 4651} {"train_loss": -7.272792339324951, "global_step": 195367, "epoch": 4651} {"train_loss": -7.162208557128906, "global_step": 195368, "epoch": 4651} {"train_loss": -7.326413631439209, "global_step": 195369, "epoch": 4651} {"train_loss": -7.243164539337158, "global_step": 195370, "epoch": 4651} {"train_loss": -7.316353797912598, "global_step": 195371, "epoch": 4651} {"train_loss": -7.332360744476318, "global_step": 195372, "epoch": 4651} {"train_loss": -7.111020088195801, "global_step": 195373, "epoch": 4651} {"train_loss": -7.253643989562988, "global_step": 195374, "epoch": 4651} {"train_loss": -7.202598571777344, "global_step": 195375, "epoch": 4651} {"train_loss": -7.289861679077148, "global_step": 195376, "epoch": 4651} {"train_loss": -7.1309919357299805, "global_step": 195377, "epoch": 4651} {"train_loss": -7.17634391784668, "global_step": 195378, "epoch": 4651} {"train_loss": -7.201137542724609, "global_step": 195379, "epoch": 4651} {"train_loss": -7.132473945617676, "global_step": 195380, "epoch": 4651} {"train_loss": -7.178540229797363, "global_step": 195381, "epoch": 4651} {"train_loss": -7.279702663421631, "global_step": 195382, "epoch": 4651} {"train_loss": -7.182903993697393, "global_step": 195383, "epoch": 4651, "val_loss": 69790.7734375} {"train_loss": -7.26984977722168, "global_step": 195384, "epoch": 4652} {"train_loss": -7.283379554748535, "global_step": 195385, "epoch": 4652} {"train_loss": -7.274506568908691, "global_step": 195386, "epoch": 4652} {"train_loss": -7.19791316986084, "global_step": 195387, "epoch": 4652} {"train_loss": -7.211306095123291, "global_step": 195388, "epoch": 4652} {"train_loss": -7.266193389892578, "global_step": 195389, "epoch": 4652} {"train_loss": -7.129341125488281, "global_step": 195390, "epoch": 4652} {"train_loss": -7.225445747375488, "global_step": 195391, "epoch": 4652} {"train_loss": -7.280628204345703, "global_step": 195392, "epoch": 4652} {"train_loss": -7.207159996032715, "global_step": 195393, "epoch": 4652} {"train_loss": -7.331226348876953, "global_step": 195394, "epoch": 4652} {"train_loss": -7.249110221862793, "global_step": 195395, "epoch": 4652} {"train_loss": -7.314297676086426, "global_step": 195396, "epoch": 4652} {"train_loss": -7.17710018157959, "global_step": 195397, "epoch": 4652} {"train_loss": -7.214948654174805, "global_step": 195398, "epoch": 4652} {"train_loss": -7.249330997467041, "global_step": 195399, "epoch": 4652} {"train_loss": -7.248524188995361, "global_step": 195400, "epoch": 4652} {"train_loss": -7.206975936889648, "global_step": 195401, "epoch": 4652} {"train_loss": -7.295840263366699, "global_step": 195402, "epoch": 4652} {"train_loss": -7.255037307739258, "global_step": 195403, "epoch": 4652} {"train_loss": -7.082683563232422, "global_step": 195404, "epoch": 4652} {"train_loss": -7.169608116149902, "global_step": 195405, "epoch": 4652} {"train_loss": -7.162861347198486, "global_step": 195406, "epoch": 4652} {"train_loss": -7.287524223327637, "global_step": 195407, "epoch": 4652} {"train_loss": -7.177117347717285, "global_step": 195408, "epoch": 4652} {"train_loss": -7.306609153747559, "global_step": 195409, "epoch": 4652} {"train_loss": -7.209301471710205, "global_step": 195410, "epoch": 4652} {"train_loss": -7.315171241760254, "global_step": 195411, "epoch": 4652} {"train_loss": -7.130767345428467, "global_step": 195412, "epoch": 4652} {"train_loss": -7.349917411804199, "global_step": 195413, "epoch": 4652} {"train_loss": -7.101524353027344, "global_step": 195414, "epoch": 4652} {"train_loss": -7.044873237609863, "global_step": 195415, "epoch": 4652} {"train_loss": -7.208151817321777, "global_step": 195416, "epoch": 4652} {"train_loss": -7.192669868469238, "global_step": 195417, "epoch": 4652} {"train_loss": -7.00345516204834, "global_step": 195418, "epoch": 4652} {"train_loss": -7.129053592681885, "global_step": 195419, "epoch": 4652} {"train_loss": -7.025404453277588, "global_step": 195420, "epoch": 4652} {"train_loss": -7.1650710105896, "global_step": 195421, "epoch": 4652} {"train_loss": -7.088918685913086, "global_step": 195422, "epoch": 4652} {"train_loss": -7.068629741668701, "global_step": 195423, "epoch": 4652} {"train_loss": -7.111632823944092, "global_step": 195424, "epoch": 4652} {"train_loss": -7.195442483538673, "global_step": 195425, "epoch": 4652, "val_loss": 69730.296875} {"train_loss": -7.076711654663086, "global_step": 195426, "epoch": 4653} {"train_loss": -7.070851802825928, "global_step": 195427, "epoch": 4653} {"train_loss": -7.036990165710449, "global_step": 195428, "epoch": 4653} {"train_loss": -7.087072372436523, "global_step": 195429, "epoch": 4653} {"train_loss": -7.092035293579102, "global_step": 195430, "epoch": 4653} {"train_loss": -7.246532917022705, "global_step": 195431, "epoch": 4653} {"train_loss": -7.096523284912109, "global_step": 195432, "epoch": 4653} {"train_loss": -7.03858757019043, "global_step": 195433, "epoch": 4653} {"train_loss": -7.064894676208496, "global_step": 195434, "epoch": 4653} {"train_loss": -7.173434257507324, "global_step": 195435, "epoch": 4653} {"train_loss": -7.108065605163574, "global_step": 195436, "epoch": 4653} {"train_loss": -7.052247047424316, "global_step": 195437, "epoch": 4653} {"train_loss": -7.114995002746582, "global_step": 195438, "epoch": 4653} {"train_loss": -7.10562801361084, "global_step": 195439, "epoch": 4653} {"train_loss": -7.3361968994140625, "global_step": 195440, "epoch": 4653} {"train_loss": -7.316606521606445, "global_step": 195441, "epoch": 4653} {"train_loss": -7.192898273468018, "global_step": 195442, "epoch": 4653} {"train_loss": -7.12180757522583, "global_step": 195443, "epoch": 4653} {"train_loss": -7.124011516571045, "global_step": 195444, "epoch": 4653} {"train_loss": -7.152949810028076, "global_step": 195445, "epoch": 4653} {"train_loss": -7.111279010772705, "global_step": 195446, "epoch": 4653} {"train_loss": -7.083427429199219, "global_step": 195447, "epoch": 4653} {"train_loss": -7.206672191619873, "global_step": 195448, "epoch": 4653} {"train_loss": -7.198108673095703, "global_step": 195449, "epoch": 4653} {"train_loss": -7.071224689483643, "global_step": 195450, "epoch": 4653} {"train_loss": -7.151240348815918, "global_step": 195451, "epoch": 4653} {"train_loss": -7.228242874145508, "global_step": 195452, "epoch": 4653} {"train_loss": -7.1365647315979, "global_step": 195453, "epoch": 4653} {"train_loss": -7.237045764923096, "global_step": 195454, "epoch": 4653} {"train_loss": -7.086179733276367, "global_step": 195455, "epoch": 4653} {"train_loss": -7.160265922546387, "global_step": 195456, "epoch": 4653} {"train_loss": -7.2876739501953125, "global_step": 195457, "epoch": 4653} {"train_loss": -7.225935935974121, "global_step": 195458, "epoch": 4653} {"train_loss": -7.188836097717285, "global_step": 195459, "epoch": 4653} {"train_loss": -7.323661804199219, "global_step": 195460, "epoch": 4653} {"train_loss": -7.175839424133301, "global_step": 195461, "epoch": 4653} {"train_loss": -7.195606231689453, "global_step": 195462, "epoch": 4653} {"train_loss": -7.271413803100586, "global_step": 195463, "epoch": 4653} {"train_loss": -7.2473368644714355, "global_step": 195464, "epoch": 4653} {"train_loss": -7.263970851898193, "global_step": 195465, "epoch": 4653} {"train_loss": -7.181653022766113, "global_step": 195466, "epoch": 4653} {"train_loss": -7.1630400362468905, "global_step": 195467, "epoch": 4653, "val_loss": 69840.2890625} {"train_loss": -7.311558723449707, "global_step": 195468, "epoch": 4654} {"train_loss": -7.2100114822387695, "global_step": 195469, "epoch": 4654} {"train_loss": -7.157666206359863, "global_step": 195470, "epoch": 4654} {"train_loss": -7.232966423034668, "global_step": 195471, "epoch": 4654} {"train_loss": -7.143613815307617, "global_step": 195472, "epoch": 4654} {"train_loss": -7.122493743896484, "global_step": 195473, "epoch": 4654} {"train_loss": -7.18806791305542, "global_step": 195474, "epoch": 4654} {"train_loss": -7.190824031829834, "global_step": 195475, "epoch": 4654} {"train_loss": -7.080915451049805, "global_step": 195476, "epoch": 4654} {"train_loss": -7.20521879196167, "global_step": 195477, "epoch": 4654} {"train_loss": -7.208063125610352, "global_step": 195478, "epoch": 4654} {"train_loss": -7.105140686035156, "global_step": 195479, "epoch": 4654} {"train_loss": -7.094235897064209, "global_step": 195480, "epoch": 4654} {"train_loss": -7.219579696655273, "global_step": 195481, "epoch": 4654} {"train_loss": -7.130807876586914, "global_step": 195482, "epoch": 4654} {"train_loss": -7.128274917602539, "global_step": 195483, "epoch": 4654} {"train_loss": -7.148533821105957, "global_step": 195484, "epoch": 4654} {"train_loss": -7.213138580322266, "global_step": 195485, "epoch": 4654} {"train_loss": -7.273608207702637, "global_step": 195486, "epoch": 4654} {"train_loss": -7.200590133666992, "global_step": 195487, "epoch": 4654} {"train_loss": -7.172198295593262, "global_step": 195488, "epoch": 4654} {"train_loss": -7.2513909339904785, "global_step": 195489, "epoch": 4654} {"train_loss": -7.184556007385254, "global_step": 195490, "epoch": 4654} {"train_loss": -7.092421054840088, "global_step": 195491, "epoch": 4654} {"train_loss": -7.311744689941406, "global_step": 195492, "epoch": 4654} {"train_loss": -7.132719039916992, "global_step": 195493, "epoch": 4654} {"train_loss": -7.235899925231934, "global_step": 195494, "epoch": 4654} {"train_loss": -6.987823486328125, "global_step": 195495, "epoch": 4654} {"train_loss": -7.271021842956543, "global_step": 195496, "epoch": 4654} {"train_loss": -7.033425331115723, "global_step": 195497, "epoch": 4654} {"train_loss": -7.133763313293457, "global_step": 195498, "epoch": 4654} {"train_loss": -7.0335469245910645, "global_step": 195499, "epoch": 4654} {"train_loss": -7.1796875, "global_step": 195500, "epoch": 4654} {"train_loss": -7.133967876434326, "global_step": 195501, "epoch": 4654} {"train_loss": -7.193000793457031, "global_step": 195502, "epoch": 4654} {"train_loss": -7.131714820861816, "global_step": 195503, "epoch": 4654} {"train_loss": -7.114223480224609, "global_step": 195504, "epoch": 4654} {"train_loss": -7.179358005523682, "global_step": 195505, "epoch": 4654} {"train_loss": -7.14272403717041, "global_step": 195506, "epoch": 4654} {"train_loss": -7.238135814666748, "global_step": 195507, "epoch": 4654} {"train_loss": -7.177036285400391, "global_step": 195508, "epoch": 4654} {"train_loss": -7.1690690858023505, "global_step": 195509, "epoch": 4654, "val_loss": 69565.359375} {"train_loss": -7.145931243896484, "global_step": 195510, "epoch": 4655} {"train_loss": -7.266895294189453, "global_step": 195511, "epoch": 4655} {"train_loss": -7.209199905395508, "global_step": 195512, "epoch": 4655} {"train_loss": -7.2465128898620605, "global_step": 195513, "epoch": 4655} {"train_loss": -7.223829746246338, "global_step": 195514, "epoch": 4655} {"train_loss": -7.212718963623047, "global_step": 195515, "epoch": 4655} {"train_loss": -7.195520401000977, "global_step": 195516, "epoch": 4655} {"train_loss": -7.231741905212402, "global_step": 195517, "epoch": 4655} {"train_loss": -7.271955490112305, "global_step": 195518, "epoch": 4655} {"train_loss": -7.188587188720703, "global_step": 195519, "epoch": 4655} {"train_loss": -7.305781364440918, "global_step": 195520, "epoch": 4655} {"train_loss": -7.21289587020874, "global_step": 195521, "epoch": 4655} {"train_loss": -7.333833694458008, "global_step": 195522, "epoch": 4655} {"train_loss": -7.412144660949707, "global_step": 195523, "epoch": 4655} {"train_loss": -7.250185489654541, "global_step": 195524, "epoch": 4655} {"train_loss": -7.248554706573486, "global_step": 195525, "epoch": 4655} {"train_loss": -7.3243184089660645, "global_step": 195526, "epoch": 4655} {"train_loss": -7.270916938781738, "global_step": 195527, "epoch": 4655} {"train_loss": -7.2244062423706055, "global_step": 195528, "epoch": 4655} {"train_loss": -7.242434501647949, "global_step": 195529, "epoch": 4655} {"train_loss": -7.301758766174316, "global_step": 195530, "epoch": 4655} {"train_loss": -7.299365997314453, "global_step": 195531, "epoch": 4655} {"train_loss": -7.100445747375488, "global_step": 195532, "epoch": 4655} {"train_loss": -7.325628757476807, "global_step": 195533, "epoch": 4655} {"train_loss": -7.161931991577148, "global_step": 195534, "epoch": 4655} {"train_loss": -7.404223442077637, "global_step": 195535, "epoch": 4655} {"train_loss": -7.278287887573242, "global_step": 195536, "epoch": 4655} {"train_loss": -7.173125267028809, "global_step": 195537, "epoch": 4655} {"train_loss": -7.3219451904296875, "global_step": 195538, "epoch": 4655} {"train_loss": -7.180580139160156, "global_step": 195539, "epoch": 4655} {"train_loss": -7.14572811126709, "global_step": 195540, "epoch": 4655} {"train_loss": -7.281697750091553, "global_step": 195541, "epoch": 4655} {"train_loss": -7.305412769317627, "global_step": 195542, "epoch": 4655} {"train_loss": -7.1593146324157715, "global_step": 195543, "epoch": 4655} {"train_loss": -7.287908554077148, "global_step": 195544, "epoch": 4655} {"train_loss": -7.268991947174072, "global_step": 195545, "epoch": 4655} {"train_loss": -7.2510986328125, "global_step": 195546, "epoch": 4655} {"train_loss": -7.20629358291626, "global_step": 195547, "epoch": 4655} {"train_loss": -7.124448776245117, "global_step": 195548, "epoch": 4655} {"train_loss": -7.207969665527344, "global_step": 195549, "epoch": 4655} {"train_loss": -7.308126926422119, "global_step": 195550, "epoch": 4655} {"train_loss": -7.244467110860915, "global_step": 195551, "epoch": 4655, "val_loss": 69754.40625} {"train_loss": -7.206870079040527, "global_step": 195552, "epoch": 4656} {"train_loss": -7.191715240478516, "global_step": 195553, "epoch": 4656} {"train_loss": -7.252919673919678, "global_step": 195554, "epoch": 4656} {"train_loss": -7.218400001525879, "global_step": 195555, "epoch": 4656} {"train_loss": -7.213656902313232, "global_step": 195556, "epoch": 4656} {"train_loss": -7.382209777832031, "global_step": 195557, "epoch": 4656} {"train_loss": -7.2813262939453125, "global_step": 195558, "epoch": 4656} {"train_loss": -7.212337493896484, "global_step": 195559, "epoch": 4656} {"train_loss": -7.262945175170898, "global_step": 195560, "epoch": 4656} {"train_loss": -7.241713523864746, "global_step": 195561, "epoch": 4656} {"train_loss": -7.10781192779541, "global_step": 195562, "epoch": 4656} {"train_loss": -7.264133453369141, "global_step": 195563, "epoch": 4656} {"train_loss": -7.276367664337158, "global_step": 195564, "epoch": 4656} {"train_loss": -7.264481544494629, "global_step": 195565, "epoch": 4656} {"train_loss": -7.310851097106934, "global_step": 195566, "epoch": 4656} {"train_loss": -7.261440277099609, "global_step": 195567, "epoch": 4656} {"train_loss": -7.079410552978516, "global_step": 195568, "epoch": 4656} {"train_loss": -7.284386157989502, "global_step": 195569, "epoch": 4656} {"train_loss": -7.225767612457275, "global_step": 195570, "epoch": 4656} {"train_loss": -7.133824348449707, "global_step": 195571, "epoch": 4656} {"train_loss": -7.190594673156738, "global_step": 195572, "epoch": 4656} {"train_loss": -7.2330403327941895, "global_step": 195573, "epoch": 4656} {"train_loss": -7.298943519592285, "global_step": 195574, "epoch": 4656} {"train_loss": -7.3216352462768555, "global_step": 195575, "epoch": 4656} {"train_loss": -7.140340805053711, "global_step": 195576, "epoch": 4656} {"train_loss": -7.316344738006592, "global_step": 195577, "epoch": 4656} {"train_loss": -7.197301387786865, "global_step": 195578, "epoch": 4656} {"train_loss": -7.1313066482543945, "global_step": 195579, "epoch": 4656} {"train_loss": -7.218958854675293, "global_step": 195580, "epoch": 4656} {"train_loss": -7.149724006652832, "global_step": 195581, "epoch": 4656} {"train_loss": -7.300827980041504, "global_step": 195582, "epoch": 4656} {"train_loss": -7.170926094055176, "global_step": 195583, "epoch": 4656} {"train_loss": -7.226502418518066, "global_step": 195584, "epoch": 4656} {"train_loss": -7.27458381652832, "global_step": 195585, "epoch": 4656} {"train_loss": -7.286835670471191, "global_step": 195586, "epoch": 4656} {"train_loss": -7.230224132537842, "global_step": 195587, "epoch": 4656} {"train_loss": -7.252917289733887, "global_step": 195588, "epoch": 4656} {"train_loss": -7.217958450317383, "global_step": 195589, "epoch": 4656} {"train_loss": -7.1969828605651855, "global_step": 195590, "epoch": 4656} {"train_loss": -7.230482578277588, "global_step": 195591, "epoch": 4656} {"train_loss": -7.243300914764404, "global_step": 195592, "epoch": 4656} {"train_loss": -7.232951641082764, "global_step": 195593, "epoch": 4656, "val_loss": 69685.8046875} {"train_loss": -7.254493713378906, "global_step": 195594, "epoch": 4657} {"train_loss": -7.339773654937744, "global_step": 195595, "epoch": 4657} {"train_loss": -7.272918701171875, "global_step": 195596, "epoch": 4657} {"train_loss": -7.308567047119141, "global_step": 195597, "epoch": 4657} {"train_loss": -7.269902229309082, "global_step": 195598, "epoch": 4657} {"train_loss": -7.249680995941162, "global_step": 195599, "epoch": 4657} {"train_loss": -7.327925682067871, "global_step": 195600, "epoch": 4657} {"train_loss": -7.2537031173706055, "global_step": 195601, "epoch": 4657} {"train_loss": -7.389369010925293, "global_step": 195602, "epoch": 4657} {"train_loss": -7.339576721191406, "global_step": 195603, "epoch": 4657} {"train_loss": -7.36583948135376, "global_step": 195604, "epoch": 4657} {"train_loss": -7.372935771942139, "global_step": 195605, "epoch": 4657} {"train_loss": -7.277408599853516, "global_step": 195606, "epoch": 4657} {"train_loss": -7.294284343719482, "global_step": 195607, "epoch": 4657} {"train_loss": -7.240800857543945, "global_step": 195608, "epoch": 4657} {"train_loss": -7.212855815887451, "global_step": 195609, "epoch": 4657} {"train_loss": -7.307616710662842, "global_step": 195610, "epoch": 4657} {"train_loss": -7.255774974822998, "global_step": 195611, "epoch": 4657} {"train_loss": -7.317537784576416, "global_step": 195612, "epoch": 4657} {"train_loss": -7.117679119110107, "global_step": 195613, "epoch": 4657} {"train_loss": -7.20972204208374, "global_step": 195614, "epoch": 4657} {"train_loss": -7.225549697875977, "global_step": 195615, "epoch": 4657} {"train_loss": -7.237358570098877, "global_step": 195616, "epoch": 4657} {"train_loss": -7.278770446777344, "global_step": 195617, "epoch": 4657} {"train_loss": -7.256035804748535, "global_step": 195618, "epoch": 4657} {"train_loss": -7.251397132873535, "global_step": 195619, "epoch": 4657} {"train_loss": -7.307480812072754, "global_step": 195620, "epoch": 4657} {"train_loss": -7.119811058044434, "global_step": 195621, "epoch": 4657} {"train_loss": -7.249207973480225, "global_step": 195622, "epoch": 4657} {"train_loss": -7.082193851470947, "global_step": 195623, "epoch": 4657} {"train_loss": -7.313039779663086, "global_step": 195624, "epoch": 4657} {"train_loss": -7.1420512199401855, "global_step": 195625, "epoch": 4657} {"train_loss": -7.2591094970703125, "global_step": 195626, "epoch": 4657} {"train_loss": -7.281261444091797, "global_step": 195627, "epoch": 4657} {"train_loss": -7.188497543334961, "global_step": 195628, "epoch": 4657} {"train_loss": -7.175418376922607, "global_step": 195629, "epoch": 4657} {"train_loss": -7.049830436706543, "global_step": 195630, "epoch": 4657} {"train_loss": -7.219147205352783, "global_step": 195631, "epoch": 4657} {"train_loss": -7.254644870758057, "global_step": 195632, "epoch": 4657} {"train_loss": -7.191438674926758, "global_step": 195633, "epoch": 4657} {"train_loss": -7.28464412689209, "global_step": 195634, "epoch": 4657} {"train_loss": -7.252563987459455, "global_step": 195635, "epoch": 4657, "val_loss": 69684.8984375} {"train_loss": -7.1801910400390625, "global_step": 195636, "epoch": 4658} {"train_loss": -7.275943756103516, "global_step": 195637, "epoch": 4658} {"train_loss": -7.4014573097229, "global_step": 195638, "epoch": 4658} {"train_loss": -7.224588394165039, "global_step": 195639, "epoch": 4658} {"train_loss": -7.296189308166504, "global_step": 195640, "epoch": 4658} {"train_loss": -7.192927360534668, "global_step": 195641, "epoch": 4658} {"train_loss": -7.226658344268799, "global_step": 195642, "epoch": 4658} {"train_loss": -7.1993842124938965, "global_step": 195643, "epoch": 4658} {"train_loss": -7.196098327636719, "global_step": 195644, "epoch": 4658} {"train_loss": -7.2738752365112305, "global_step": 195645, "epoch": 4658} {"train_loss": -7.223637580871582, "global_step": 195646, "epoch": 4658} {"train_loss": -7.233705520629883, "global_step": 195647, "epoch": 4658} {"train_loss": -7.148876190185547, "global_step": 195648, "epoch": 4658} {"train_loss": -7.154045104980469, "global_step": 195649, "epoch": 4658} {"train_loss": -7.211846828460693, "global_step": 195650, "epoch": 4658} {"train_loss": -7.134897232055664, "global_step": 195651, "epoch": 4658} {"train_loss": -7.237653732299805, "global_step": 195652, "epoch": 4658} {"train_loss": -7.146440029144287, "global_step": 195653, "epoch": 4658} {"train_loss": -7.096759796142578, "global_step": 195654, "epoch": 4658} {"train_loss": -7.2231340408325195, "global_step": 195655, "epoch": 4658} {"train_loss": -7.224544048309326, "global_step": 195656, "epoch": 4658} {"train_loss": -7.231374740600586, "global_step": 195657, "epoch": 4658} {"train_loss": -7.249479293823242, "global_step": 195658, "epoch": 4658} {"train_loss": -7.1093831062316895, "global_step": 195659, "epoch": 4658} {"train_loss": -7.200023651123047, "global_step": 195660, "epoch": 4658} {"train_loss": -7.196474075317383, "global_step": 195661, "epoch": 4658} {"train_loss": -7.261181831359863, "global_step": 195662, "epoch": 4658} {"train_loss": -7.284170150756836, "global_step": 195663, "epoch": 4658} {"train_loss": -7.279565334320068, "global_step": 195664, "epoch": 4658} {"train_loss": -7.225702285766602, "global_step": 195665, "epoch": 4658} {"train_loss": -7.245168685913086, "global_step": 195666, "epoch": 4658} {"train_loss": -7.161136627197266, "global_step": 195667, "epoch": 4658} {"train_loss": -7.246035575866699, "global_step": 195668, "epoch": 4658} {"train_loss": -7.207368850708008, "global_step": 195669, "epoch": 4658} {"train_loss": -7.173346519470215, "global_step": 195670, "epoch": 4658} {"train_loss": -7.278167724609375, "global_step": 195671, "epoch": 4658} {"train_loss": -7.192800045013428, "global_step": 195672, "epoch": 4658} {"train_loss": -7.345437526702881, "global_step": 195673, "epoch": 4658} {"train_loss": -7.143235206604004, "global_step": 195674, "epoch": 4658} {"train_loss": -7.296990394592285, "global_step": 195675, "epoch": 4658} {"train_loss": -7.306889057159424, "global_step": 195676, "epoch": 4658} {"train_loss": -7.224799496786935, "global_step": 195677, "epoch": 4658, "val_loss": 69736.2890625} {"train_loss": -7.336753845214844, "global_step": 195678, "epoch": 4659} {"train_loss": -7.240408897399902, "global_step": 195679, "epoch": 4659} {"train_loss": -7.284220218658447, "global_step": 195680, "epoch": 4659} {"train_loss": -7.335477828979492, "global_step": 195681, "epoch": 4659} {"train_loss": -7.3662824630737305, "global_step": 195682, "epoch": 4659} {"train_loss": -7.31431245803833, "global_step": 195683, "epoch": 4659} {"train_loss": -7.386782646179199, "global_step": 195684, "epoch": 4659} {"train_loss": -7.336709022521973, "global_step": 195685, "epoch": 4659} {"train_loss": -7.2282514572143555, "global_step": 195686, "epoch": 4659} {"train_loss": -7.337761878967285, "global_step": 195687, "epoch": 4659} {"train_loss": -7.321722507476807, "global_step": 195688, "epoch": 4659} {"train_loss": -7.244184494018555, "global_step": 195689, "epoch": 4659} {"train_loss": -7.3028974533081055, "global_step": 195690, "epoch": 4659} {"train_loss": -7.302742958068848, "global_step": 195691, "epoch": 4659} {"train_loss": -7.247261047363281, "global_step": 195692, "epoch": 4659} {"train_loss": -7.283705234527588, "global_step": 195693, "epoch": 4659} {"train_loss": -7.410886764526367, "global_step": 195694, "epoch": 4659} {"train_loss": -7.194910526275635, "global_step": 195695, "epoch": 4659} {"train_loss": -7.306893348693848, "global_step": 195696, "epoch": 4659} {"train_loss": -7.344388008117676, "global_step": 195697, "epoch": 4659} {"train_loss": -7.257533073425293, "global_step": 195698, "epoch": 4659} {"train_loss": -7.213813781738281, "global_step": 195699, "epoch": 4659} {"train_loss": -7.312339782714844, "global_step": 195700, "epoch": 4659} {"train_loss": -7.230252742767334, "global_step": 195701, "epoch": 4659} {"train_loss": -7.186931133270264, "global_step": 195702, "epoch": 4659} {"train_loss": -7.323024749755859, "global_step": 195703, "epoch": 4659} {"train_loss": -7.163790702819824, "global_step": 195704, "epoch": 4659} {"train_loss": -7.310488224029541, "global_step": 195705, "epoch": 4659} {"train_loss": -7.173552513122559, "global_step": 195706, "epoch": 4659} {"train_loss": -7.080259323120117, "global_step": 195707, "epoch": 4659} {"train_loss": -7.177359580993652, "global_step": 195708, "epoch": 4659} {"train_loss": -7.155705451965332, "global_step": 195709, "epoch": 4659} {"train_loss": -7.074860572814941, "global_step": 195710, "epoch": 4659} {"train_loss": -7.242330551147461, "global_step": 195711, "epoch": 4659} {"train_loss": -7.178458213806152, "global_step": 195712, "epoch": 4659} {"train_loss": -7.174614429473877, "global_step": 195713, "epoch": 4659} {"train_loss": -7.290999412536621, "global_step": 195714, "epoch": 4659} {"train_loss": -7.134106636047363, "global_step": 195715, "epoch": 4659} {"train_loss": -7.24268913269043, "global_step": 195716, "epoch": 4659} {"train_loss": -7.205615043640137, "global_step": 195717, "epoch": 4659} {"train_loss": -7.271398067474365, "global_step": 195718, "epoch": 4659} {"train_loss": -7.254956710906256, "global_step": 195719, "epoch": 4659, "val_loss": 69997.734375} {"train_loss": -7.1381049156188965, "global_step": 195720, "epoch": 4660} {"train_loss": -7.322545528411865, "global_step": 195721, "epoch": 4660} {"train_loss": -7.15480375289917, "global_step": 195722, "epoch": 4660} {"train_loss": -7.075592041015625, "global_step": 195723, "epoch": 4660} {"train_loss": -7.254510879516602, "global_step": 195724, "epoch": 4660} {"train_loss": -7.333052635192871, "global_step": 195725, "epoch": 4660} {"train_loss": -7.306797027587891, "global_step": 195726, "epoch": 4660} {"train_loss": -7.278421401977539, "global_step": 195727, "epoch": 4660} {"train_loss": -7.2899932861328125, "global_step": 195728, "epoch": 4660} {"train_loss": -7.27646017074585, "global_step": 195729, "epoch": 4660} {"train_loss": -7.295391082763672, "global_step": 195730, "epoch": 4660} {"train_loss": -7.223527908325195, "global_step": 195731, "epoch": 4660} {"train_loss": -7.127274513244629, "global_step": 195732, "epoch": 4660} {"train_loss": -7.226591110229492, "global_step": 195733, "epoch": 4660} {"train_loss": -7.206772804260254, "global_step": 195734, "epoch": 4660} {"train_loss": -7.197030067443848, "global_step": 195735, "epoch": 4660} {"train_loss": -7.189426898956299, "global_step": 195736, "epoch": 4660} {"train_loss": -7.30903959274292, "global_step": 195737, "epoch": 4660} {"train_loss": -7.148148536682129, "global_step": 195738, "epoch": 4660} {"train_loss": -7.2959113121032715, "global_step": 195739, "epoch": 4660} {"train_loss": -7.289939880371094, "global_step": 195740, "epoch": 4660} {"train_loss": -7.3110857009887695, "global_step": 195741, "epoch": 4660} {"train_loss": -7.232408046722412, "global_step": 195742, "epoch": 4660} {"train_loss": -7.24397087097168, "global_step": 195743, "epoch": 4660} {"train_loss": -7.054232597351074, "global_step": 195744, "epoch": 4660} {"train_loss": -7.097264289855957, "global_step": 195745, "epoch": 4660} {"train_loss": -7.069584846496582, "global_step": 195746, "epoch": 4660} {"train_loss": -7.2411322593688965, "global_step": 195747, "epoch": 4660} {"train_loss": -7.198025703430176, "global_step": 195748, "epoch": 4660} {"train_loss": -7.147736072540283, "global_step": 195749, "epoch": 4660} {"train_loss": -7.196829795837402, "global_step": 195750, "epoch": 4660} {"train_loss": -7.320755958557129, "global_step": 195751, "epoch": 4660} {"train_loss": -7.213321685791016, "global_step": 195752, "epoch": 4660} {"train_loss": -7.211291313171387, "global_step": 195753, "epoch": 4660} {"train_loss": -7.25412654876709, "global_step": 195754, "epoch": 4660} {"train_loss": -7.189602851867676, "global_step": 195755, "epoch": 4660} {"train_loss": -7.231400489807129, "global_step": 195756, "epoch": 4660} {"train_loss": -7.213187217712402, "global_step": 195757, "epoch": 4660} {"train_loss": -7.252129554748535, "global_step": 195758, "epoch": 4660} {"train_loss": -7.299554824829102, "global_step": 195759, "epoch": 4660} {"train_loss": -7.240224838256836, "global_step": 195760, "epoch": 4660} {"train_loss": -7.224618332726615, "global_step": 195761, "epoch": 4660, "val_loss": 69637.8984375} {"train_loss": -7.234099864959717, "global_step": 195762, "epoch": 4661} {"train_loss": -7.3055572509765625, "global_step": 195763, "epoch": 4661} {"train_loss": -7.218214988708496, "global_step": 195764, "epoch": 4661} {"train_loss": -7.329681396484375, "global_step": 195765, "epoch": 4661} {"train_loss": -7.242377281188965, "global_step": 195766, "epoch": 4661} {"train_loss": -7.254094123840332, "global_step": 195767, "epoch": 4661} {"train_loss": -7.187752723693848, "global_step": 195768, "epoch": 4661} {"train_loss": -7.326714515686035, "global_step": 195769, "epoch": 4661} {"train_loss": -7.289999961853027, "global_step": 195770, "epoch": 4661} {"train_loss": -7.225067138671875, "global_step": 195771, "epoch": 4661} {"train_loss": -7.306169509887695, "global_step": 195772, "epoch": 4661} {"train_loss": -7.375798225402832, "global_step": 195773, "epoch": 4661} {"train_loss": -7.251703262329102, "global_step": 195774, "epoch": 4661} {"train_loss": -7.258059501647949, "global_step": 195775, "epoch": 4661} {"train_loss": -7.287583827972412, "global_step": 195776, "epoch": 4661} {"train_loss": -7.199756622314453, "global_step": 195777, "epoch": 4661} {"train_loss": -7.305368423461914, "global_step": 195778, "epoch": 4661} {"train_loss": -7.229160308837891, "global_step": 195779, "epoch": 4661} {"train_loss": -7.224095344543457, "global_step": 195780, "epoch": 4661} {"train_loss": -7.257974624633789, "global_step": 195781, "epoch": 4661} {"train_loss": -7.149981498718262, "global_step": 195782, "epoch": 4661} {"train_loss": -7.262120723724365, "global_step": 195783, "epoch": 4661} {"train_loss": -7.246368408203125, "global_step": 195784, "epoch": 4661} {"train_loss": -7.350049018859863, "global_step": 195785, "epoch": 4661} {"train_loss": -7.3438262939453125, "global_step": 195786, "epoch": 4661} {"train_loss": -7.166018486022949, "global_step": 195787, "epoch": 4661} {"train_loss": -7.203890323638916, "global_step": 195788, "epoch": 4661} {"train_loss": -7.0790910720825195, "global_step": 195789, "epoch": 4661} {"train_loss": -7.134232044219971, "global_step": 195790, "epoch": 4661} {"train_loss": -7.278485298156738, "global_step": 195791, "epoch": 4661} {"train_loss": -7.129233360290527, "global_step": 195792, "epoch": 4661} {"train_loss": -7.255364894866943, "global_step": 195793, "epoch": 4661} {"train_loss": -7.171382904052734, "global_step": 195794, "epoch": 4661} {"train_loss": -7.2725419998168945, "global_step": 195795, "epoch": 4661} {"train_loss": -7.244016647338867, "global_step": 195796, "epoch": 4661} {"train_loss": -7.222846031188965, "global_step": 195797, "epoch": 4661} {"train_loss": -7.1529860496521, "global_step": 195798, "epoch": 4661} {"train_loss": -7.304819107055664, "global_step": 195799, "epoch": 4661} {"train_loss": -7.328463554382324, "global_step": 195800, "epoch": 4661} {"train_loss": -7.085103511810303, "global_step": 195801, "epoch": 4661} {"train_loss": -7.2241950035095215, "global_step": 195802, "epoch": 4661} {"train_loss": -7.2410024007161455, "global_step": 195803, "epoch": 4661, "val_loss": 69661.71875} {"train_loss": -7.1958160400390625, "global_step": 195804, "epoch": 4662} {"train_loss": -7.248861789703369, "global_step": 195805, "epoch": 4662} {"train_loss": -7.163773536682129, "global_step": 195806, "epoch": 4662} {"train_loss": -7.19190788269043, "global_step": 195807, "epoch": 4662} {"train_loss": -7.1931376457214355, "global_step": 195808, "epoch": 4662} {"train_loss": -7.263004302978516, "global_step": 195809, "epoch": 4662} {"train_loss": -7.202826499938965, "global_step": 195810, "epoch": 4662} {"train_loss": -7.210253715515137, "global_step": 195811, "epoch": 4662} {"train_loss": -7.131509780883789, "global_step": 195812, "epoch": 4662} {"train_loss": -7.205725193023682, "global_step": 195813, "epoch": 4662} {"train_loss": -7.170456886291504, "global_step": 195814, "epoch": 4662} {"train_loss": -7.229639053344727, "global_step": 195815, "epoch": 4662} {"train_loss": -7.168962478637695, "global_step": 195816, "epoch": 4662} {"train_loss": -7.143712997436523, "global_step": 195817, "epoch": 4662} {"train_loss": -7.218854904174805, "global_step": 195818, "epoch": 4662} {"train_loss": -7.199164390563965, "global_step": 195819, "epoch": 4662} {"train_loss": -7.264664649963379, "global_step": 195820, "epoch": 4662} {"train_loss": -7.242958068847656, "global_step": 195821, "epoch": 4662} {"train_loss": -7.202608108520508, "global_step": 195822, "epoch": 4662} {"train_loss": -7.257559299468994, "global_step": 195823, "epoch": 4662} {"train_loss": -7.154004096984863, "global_step": 195824, "epoch": 4662} {"train_loss": -7.283198356628418, "global_step": 195825, "epoch": 4662} {"train_loss": -7.307310581207275, "global_step": 195826, "epoch": 4662} {"train_loss": -7.125102519989014, "global_step": 195827, "epoch": 4662} {"train_loss": -7.247200965881348, "global_step": 195828, "epoch": 4662} {"train_loss": -7.173210620880127, "global_step": 195829, "epoch": 4662} {"train_loss": -7.264987468719482, "global_step": 195830, "epoch": 4662} {"train_loss": -7.208808898925781, "global_step": 195831, "epoch": 4662} {"train_loss": -7.168947696685791, "global_step": 195832, "epoch": 4662} {"train_loss": -7.2937517166137695, "global_step": 195833, "epoch": 4662} {"train_loss": -7.373964309692383, "global_step": 195834, "epoch": 4662} {"train_loss": -7.416701316833496, "global_step": 195835, "epoch": 4662} {"train_loss": -7.253480434417725, "global_step": 195836, "epoch": 4662} {"train_loss": -7.321042537689209, "global_step": 195837, "epoch": 4662} {"train_loss": -7.253368377685547, "global_step": 195838, "epoch": 4662} {"train_loss": -7.304426193237305, "global_step": 195839, "epoch": 4662} {"train_loss": -7.270443916320801, "global_step": 195840, "epoch": 4662} {"train_loss": -7.300678253173828, "global_step": 195841, "epoch": 4662} {"train_loss": -7.15727424621582, "global_step": 195842, "epoch": 4662} {"train_loss": -7.310543060302734, "global_step": 195843, "epoch": 4662} {"train_loss": -7.264854907989502, "global_step": 195844, "epoch": 4662} {"train_loss": -7.233353728339786, "global_step": 195845, "epoch": 4662, "val_loss": 69829.171875} {"train_loss": -7.335993766784668, "global_step": 195846, "epoch": 4663} {"train_loss": -7.296181678771973, "global_step": 195847, "epoch": 4663} {"train_loss": -7.275607109069824, "global_step": 195848, "epoch": 4663} {"train_loss": -7.2851243019104, "global_step": 195849, "epoch": 4663} {"train_loss": -7.247833251953125, "global_step": 195850, "epoch": 4663} {"train_loss": -7.183745384216309, "global_step": 195851, "epoch": 4663} {"train_loss": -7.1731109619140625, "global_step": 195852, "epoch": 4663} {"train_loss": -7.229284286499023, "global_step": 195853, "epoch": 4663} {"train_loss": -7.197293281555176, "global_step": 195854, "epoch": 4663} {"train_loss": -7.133673667907715, "global_step": 195855, "epoch": 4663} {"train_loss": -7.177628517150879, "global_step": 195856, "epoch": 4663} {"train_loss": -7.218165397644043, "global_step": 195857, "epoch": 4663} {"train_loss": -7.112934112548828, "global_step": 195858, "epoch": 4663} {"train_loss": -7.128243446350098, "global_step": 195859, "epoch": 4663} {"train_loss": -7.250722885131836, "global_step": 195860, "epoch": 4663} {"train_loss": -7.103847980499268, "global_step": 195861, "epoch": 4663} {"train_loss": -7.109314918518066, "global_step": 195862, "epoch": 4663} {"train_loss": -7.193126678466797, "global_step": 195863, "epoch": 4663} {"train_loss": -7.165294170379639, "global_step": 195864, "epoch": 4663} {"train_loss": -7.093584060668945, "global_step": 195865, "epoch": 4663} {"train_loss": -7.151617527008057, "global_step": 195866, "epoch": 4663} {"train_loss": -7.278177261352539, "global_step": 195867, "epoch": 4663} {"train_loss": -7.108129978179932, "global_step": 195868, "epoch": 4663} {"train_loss": -7.206604957580566, "global_step": 195869, "epoch": 4663} {"train_loss": -7.1746063232421875, "global_step": 195870, "epoch": 4663} {"train_loss": -7.105172157287598, "global_step": 195871, "epoch": 4663} {"train_loss": -7.267474174499512, "global_step": 195872, "epoch": 4663} {"train_loss": -7.1357855796813965, "global_step": 195873, "epoch": 4663} {"train_loss": -7.282000541687012, "global_step": 195874, "epoch": 4663} {"train_loss": -7.104686737060547, "global_step": 195875, "epoch": 4663} {"train_loss": -7.212607383728027, "global_step": 195876, "epoch": 4663} {"train_loss": -7.117392539978027, "global_step": 195877, "epoch": 4663} {"train_loss": -7.217193603515625, "global_step": 195878, "epoch": 4663} {"train_loss": -7.209230422973633, "global_step": 195879, "epoch": 4663} {"train_loss": -7.184270858764648, "global_step": 195880, "epoch": 4663} {"train_loss": -7.229400157928467, "global_step": 195881, "epoch": 4663} {"train_loss": -7.175942420959473, "global_step": 195882, "epoch": 4663} {"train_loss": -7.084723472595215, "global_step": 195883, "epoch": 4663} {"train_loss": -7.265353202819824, "global_step": 195884, "epoch": 4663} {"train_loss": -7.115495681762695, "global_step": 195885, "epoch": 4663} {"train_loss": -7.269825458526611, "global_step": 195886, "epoch": 4663} {"train_loss": -7.190187806174869, "global_step": 195887, "epoch": 4663, "val_loss": 69560.765625} {"train_loss": -7.202078342437744, "global_step": 195888, "epoch": 4664} {"train_loss": -7.287148475646973, "global_step": 195889, "epoch": 4664} {"train_loss": -7.362893581390381, "global_step": 195890, "epoch": 4664} {"train_loss": -7.280026912689209, "global_step": 195891, "epoch": 4664} {"train_loss": -7.286918640136719, "global_step": 195892, "epoch": 4664} {"train_loss": -7.225494861602783, "global_step": 195893, "epoch": 4664} {"train_loss": -7.259704113006592, "global_step": 195894, "epoch": 4664} {"train_loss": -7.197484493255615, "global_step": 195895, "epoch": 4664} {"train_loss": -7.224608421325684, "global_step": 195896, "epoch": 4664} {"train_loss": -7.158190727233887, "global_step": 195897, "epoch": 4664} {"train_loss": -7.262218952178955, "global_step": 195898, "epoch": 4664} {"train_loss": -7.307684898376465, "global_step": 195899, "epoch": 4664} {"train_loss": -7.197027206420898, "global_step": 195900, "epoch": 4664} {"train_loss": -7.191653251647949, "global_step": 195901, "epoch": 4664} {"train_loss": -7.313163757324219, "global_step": 195902, "epoch": 4664} {"train_loss": -7.236319541931152, "global_step": 195903, "epoch": 4664} {"train_loss": -7.219000816345215, "global_step": 195904, "epoch": 4664} {"train_loss": -7.257109642028809, "global_step": 195905, "epoch": 4664} {"train_loss": -7.267935276031494, "global_step": 195906, "epoch": 4664} {"train_loss": -7.092245578765869, "global_step": 195907, "epoch": 4664} {"train_loss": -7.199560165405273, "global_step": 195908, "epoch": 4664} {"train_loss": -7.236721992492676, "global_step": 195909, "epoch": 4664} {"train_loss": -7.179004669189453, "global_step": 195910, "epoch": 4664} {"train_loss": -7.298510551452637, "global_step": 195911, "epoch": 4664} {"train_loss": -7.189126014709473, "global_step": 195912, "epoch": 4664} {"train_loss": -7.1732635498046875, "global_step": 195913, "epoch": 4664} {"train_loss": -7.157251358032227, "global_step": 195914, "epoch": 4664} {"train_loss": -7.222951889038086, "global_step": 195915, "epoch": 4664} {"train_loss": -7.266628265380859, "global_step": 195916, "epoch": 4664} {"train_loss": -7.16335391998291, "global_step": 195917, "epoch": 4664} {"train_loss": -7.2759809494018555, "global_step": 195918, "epoch": 4664} {"train_loss": -7.151973724365234, "global_step": 195919, "epoch": 4664} {"train_loss": -7.21949577331543, "global_step": 195920, "epoch": 4664} {"train_loss": -7.299684524536133, "global_step": 195921, "epoch": 4664} {"train_loss": -7.245609760284424, "global_step": 195922, "epoch": 4664} {"train_loss": -7.26947546005249, "global_step": 195923, "epoch": 4664} {"train_loss": -7.2342658042907715, "global_step": 195924, "epoch": 4664} {"train_loss": -7.229645252227783, "global_step": 195925, "epoch": 4664} {"train_loss": -7.30784797668457, "global_step": 195926, "epoch": 4664} {"train_loss": -7.234126567840576, "global_step": 195927, "epoch": 4664} {"train_loss": -7.202537536621094, "global_step": 195928, "epoch": 4664} {"train_loss": -7.235094161260696, "global_step": 195929, "epoch": 4664, "val_loss": 69882.6953125} {"train_loss": -7.192712783813477, "global_step": 195930, "epoch": 4665} {"train_loss": -7.282226085662842, "global_step": 195931, "epoch": 4665} {"train_loss": -7.220085620880127, "global_step": 195932, "epoch": 4665} {"train_loss": -7.22028923034668, "global_step": 195933, "epoch": 4665} {"train_loss": -7.209748268127441, "global_step": 195934, "epoch": 4665} {"train_loss": -7.145827770233154, "global_step": 195935, "epoch": 4665} {"train_loss": -7.233786582946777, "global_step": 195936, "epoch": 4665} {"train_loss": -7.182711601257324, "global_step": 195937, "epoch": 4665} {"train_loss": -7.190947532653809, "global_step": 195938, "epoch": 4665} {"train_loss": -7.1805009841918945, "global_step": 195939, "epoch": 4665} {"train_loss": -7.2365498542785645, "global_step": 195940, "epoch": 4665} {"train_loss": -7.230344295501709, "global_step": 195941, "epoch": 4665} {"train_loss": -7.125945568084717, "global_step": 195942, "epoch": 4665} {"train_loss": -7.186138153076172, "global_step": 195943, "epoch": 4665} {"train_loss": -7.137287616729736, "global_step": 195944, "epoch": 4665} {"train_loss": -7.170589447021484, "global_step": 195945, "epoch": 4665} {"train_loss": -7.261138916015625, "global_step": 195946, "epoch": 4665} {"train_loss": -6.929658889770508, "global_step": 195947, "epoch": 4665} {"train_loss": -7.096519470214844, "global_step": 195948, "epoch": 4665} {"train_loss": -7.11765193939209, "global_step": 195949, "epoch": 4665} {"train_loss": -7.11500358581543, "global_step": 195950, "epoch": 4665} {"train_loss": -7.129465103149414, "global_step": 195951, "epoch": 4665} {"train_loss": -7.151942253112793, "global_step": 195952, "epoch": 4665} {"train_loss": -6.927212715148926, "global_step": 195953, "epoch": 4665} {"train_loss": -7.164037704467773, "global_step": 195954, "epoch": 4665} {"train_loss": -7.098724842071533, "global_step": 195955, "epoch": 4665} {"train_loss": -7.139744758605957, "global_step": 195956, "epoch": 4665} {"train_loss": -7.207632541656494, "global_step": 195957, "epoch": 4665} {"train_loss": -7.122200965881348, "global_step": 195958, "epoch": 4665} {"train_loss": -7.155086040496826, "global_step": 195959, "epoch": 4665} {"train_loss": -7.117898464202881, "global_step": 195960, "epoch": 4665} {"train_loss": -7.205615997314453, "global_step": 195961, "epoch": 4665} {"train_loss": -7.224094867706299, "global_step": 195962, "epoch": 4665} {"train_loss": -7.305023670196533, "global_step": 195963, "epoch": 4665} {"train_loss": -7.2191972732543945, "global_step": 195964, "epoch": 4665} {"train_loss": -7.228183269500732, "global_step": 195965, "epoch": 4665} {"train_loss": -7.218486309051514, "global_step": 195966, "epoch": 4665} {"train_loss": -7.031207084655762, "global_step": 195967, "epoch": 4665} {"train_loss": -7.237719535827637, "global_step": 195968, "epoch": 4665} {"train_loss": -7.141028881072998, "global_step": 195969, "epoch": 4665} {"train_loss": -7.279314041137695, "global_step": 195970, "epoch": 4665} {"train_loss": -7.170166560581753, "global_step": 195971, "epoch": 4665, "val_loss": 69562.6875} {"train_loss": -7.221431732177734, "global_step": 195972, "epoch": 4666} {"train_loss": -7.161282539367676, "global_step": 195973, "epoch": 4666} {"train_loss": -7.196191310882568, "global_step": 195974, "epoch": 4666} {"train_loss": -7.278059959411621, "global_step": 195975, "epoch": 4666} {"train_loss": -7.168028831481934, "global_step": 195976, "epoch": 4666} {"train_loss": -7.193004608154297, "global_step": 195977, "epoch": 4666} {"train_loss": -7.197624206542969, "global_step": 195978, "epoch": 4666} {"train_loss": -7.245798110961914, "global_step": 195979, "epoch": 4666} {"train_loss": -7.239257335662842, "global_step": 195980, "epoch": 4666} {"train_loss": -7.146973133087158, "global_step": 195981, "epoch": 4666} {"train_loss": -7.163616180419922, "global_step": 195982, "epoch": 4666} {"train_loss": -7.218010902404785, "global_step": 195983, "epoch": 4666} {"train_loss": -7.108901500701904, "global_step": 195984, "epoch": 4666} {"train_loss": -7.148759841918945, "global_step": 195985, "epoch": 4666} {"train_loss": -7.173581123352051, "global_step": 195986, "epoch": 4666} {"train_loss": -7.217838764190674, "global_step": 195987, "epoch": 4666} {"train_loss": -7.231791019439697, "global_step": 195988, "epoch": 4666} {"train_loss": -7.280342102050781, "global_step": 195989, "epoch": 4666} {"train_loss": -7.215785026550293, "global_step": 195990, "epoch": 4666} {"train_loss": -7.249646186828613, "global_step": 195991, "epoch": 4666} {"train_loss": -7.358040809631348, "global_step": 195992, "epoch": 4666} {"train_loss": -7.251755714416504, "global_step": 195993, "epoch": 4666} {"train_loss": -7.230172634124756, "global_step": 195994, "epoch": 4666} {"train_loss": -7.113616943359375, "global_step": 195995, "epoch": 4666} {"train_loss": -7.213489532470703, "global_step": 195996, "epoch": 4666} {"train_loss": -7.225139141082764, "global_step": 195997, "epoch": 4666} {"train_loss": -7.155354976654053, "global_step": 195998, "epoch": 4666} {"train_loss": -7.264092445373535, "global_step": 195999, "epoch": 4666} {"train_loss": -7.341538429260254, "global_step": 196000, "epoch": 4666} {"train_loss": -7.2437744140625, "global_step": 196001, "epoch": 4666} {"train_loss": -7.317876815795898, "global_step": 196002, "epoch": 4666} {"train_loss": -7.232416152954102, "global_step": 196003, "epoch": 4666} {"train_loss": -7.193224906921387, "global_step": 196004, "epoch": 4666} {"train_loss": -7.251713752746582, "global_step": 196005, "epoch": 4666} {"train_loss": -7.304927825927734, "global_step": 196006, "epoch": 4666} {"train_loss": -7.224360942840576, "global_step": 196007, "epoch": 4666} {"train_loss": -7.21414852142334, "global_step": 196008, "epoch": 4666} {"train_loss": -7.310909748077393, "global_step": 196009, "epoch": 4666} {"train_loss": -7.2756266593933105, "global_step": 196010, "epoch": 4666} {"train_loss": -7.227421760559082, "global_step": 196011, "epoch": 4666} {"train_loss": -7.241095542907715, "global_step": 196012, "epoch": 4666} {"train_loss": -7.227226972579956, "global_step": 196013, "epoch": 4666, "val_loss": 69677.2890625} {"train_loss": -7.179357051849365, "global_step": 196014, "epoch": 4667} {"train_loss": -7.288854598999023, "global_step": 196015, "epoch": 4667} {"train_loss": -7.227231025695801, "global_step": 196016, "epoch": 4667} {"train_loss": -7.239776134490967, "global_step": 196017, "epoch": 4667} {"train_loss": -7.249645233154297, "global_step": 196018, "epoch": 4667} {"train_loss": -7.295855522155762, "global_step": 196019, "epoch": 4667} {"train_loss": -7.313080310821533, "global_step": 196020, "epoch": 4667} {"train_loss": -7.319631576538086, "global_step": 196021, "epoch": 4667} {"train_loss": -7.228172779083252, "global_step": 196022, "epoch": 4667} {"train_loss": -7.295743942260742, "global_step": 196023, "epoch": 4667} {"train_loss": -7.193353652954102, "global_step": 196024, "epoch": 4667} {"train_loss": -7.236921787261963, "global_step": 196025, "epoch": 4667} {"train_loss": -7.121591567993164, "global_step": 196026, "epoch": 4667} {"train_loss": -7.060076713562012, "global_step": 196027, "epoch": 4667} {"train_loss": -7.227019309997559, "global_step": 196028, "epoch": 4667} {"train_loss": -7.243326663970947, "global_step": 196029, "epoch": 4667} {"train_loss": -7.255840301513672, "global_step": 196030, "epoch": 4667} {"train_loss": -7.318965435028076, "global_step": 196031, "epoch": 4667} {"train_loss": -7.224582672119141, "global_step": 196032, "epoch": 4667} {"train_loss": -7.308907508850098, "global_step": 196033, "epoch": 4667} {"train_loss": -7.265222072601318, "global_step": 196034, "epoch": 4667} {"train_loss": -7.320603370666504, "global_step": 196035, "epoch": 4667} {"train_loss": -7.298175811767578, "global_step": 196036, "epoch": 4667} {"train_loss": -7.20474910736084, "global_step": 196037, "epoch": 4667} {"train_loss": -7.295722484588623, "global_step": 196038, "epoch": 4667} {"train_loss": -7.280187606811523, "global_step": 196039, "epoch": 4667} {"train_loss": -7.274886131286621, "global_step": 196040, "epoch": 4667} {"train_loss": -7.3059773445129395, "global_step": 196041, "epoch": 4667} {"train_loss": -7.25657320022583, "global_step": 196042, "epoch": 4667} {"train_loss": -7.1420769691467285, "global_step": 196043, "epoch": 4667} {"train_loss": -7.344655990600586, "global_step": 196044, "epoch": 4667} {"train_loss": -7.289952278137207, "global_step": 196045, "epoch": 4667} {"train_loss": -7.269150733947754, "global_step": 196046, "epoch": 4667} {"train_loss": -7.322569847106934, "global_step": 196047, "epoch": 4667} {"train_loss": -7.2583160400390625, "global_step": 196048, "epoch": 4667} {"train_loss": -7.341729164123535, "global_step": 196049, "epoch": 4667} {"train_loss": -7.22603702545166, "global_step": 196050, "epoch": 4667} {"train_loss": -7.077179908752441, "global_step": 196051, "epoch": 4667} {"train_loss": -7.0750041007995605, "global_step": 196052, "epoch": 4667} {"train_loss": -7.227235794067383, "global_step": 196053, "epoch": 4667} {"train_loss": -7.147040367126465, "global_step": 196054, "epoch": 4667} {"train_loss": -7.247471071424938, "global_step": 196055, "epoch": 4667, "val_loss": 69823.5859375} {"train_loss": -7.159882545471191, "global_step": 196056, "epoch": 4668} {"train_loss": -7.132758617401123, "global_step": 196057, "epoch": 4668} {"train_loss": -7.204498291015625, "global_step": 196058, "epoch": 4668} {"train_loss": -7.239580154418945, "global_step": 196059, "epoch": 4668} {"train_loss": -7.2345662117004395, "global_step": 196060, "epoch": 4668} {"train_loss": -7.284135818481445, "global_step": 196061, "epoch": 4668} {"train_loss": -7.356860637664795, "global_step": 196062, "epoch": 4668} {"train_loss": -7.230963706970215, "global_step": 196063, "epoch": 4668} {"train_loss": -7.338722229003906, "global_step": 196064, "epoch": 4668} {"train_loss": -7.304250717163086, "global_step": 196065, "epoch": 4668} {"train_loss": -7.335369110107422, "global_step": 196066, "epoch": 4668} {"train_loss": -7.344727039337158, "global_step": 196067, "epoch": 4668} {"train_loss": -7.307928562164307, "global_step": 196068, "epoch": 4668} {"train_loss": -7.365533828735352, "global_step": 196069, "epoch": 4668} {"train_loss": -7.316890239715576, "global_step": 196070, "epoch": 4668} {"train_loss": -7.293581485748291, "global_step": 196071, "epoch": 4668} {"train_loss": -7.207958698272705, "global_step": 196072, "epoch": 4668} {"train_loss": -7.287467956542969, "global_step": 196073, "epoch": 4668} {"train_loss": -7.237113952636719, "global_step": 196074, "epoch": 4668} {"train_loss": -7.254427909851074, "global_step": 196075, "epoch": 4668} {"train_loss": -7.273842811584473, "global_step": 196076, "epoch": 4668} {"train_loss": -7.253371238708496, "global_step": 196077, "epoch": 4668} {"train_loss": -7.266265392303467, "global_step": 196078, "epoch": 4668} {"train_loss": -7.328073501586914, "global_step": 196079, "epoch": 4668} {"train_loss": -7.3154497146606445, "global_step": 196080, "epoch": 4668} {"train_loss": -7.216988563537598, "global_step": 196081, "epoch": 4668} {"train_loss": -7.292652606964111, "global_step": 196082, "epoch": 4668} {"train_loss": -7.190932273864746, "global_step": 196083, "epoch": 4668} {"train_loss": -7.269007205963135, "global_step": 196084, "epoch": 4668} {"train_loss": -7.328401565551758, "global_step": 196085, "epoch": 4668} {"train_loss": -7.3805389404296875, "global_step": 196086, "epoch": 4668} {"train_loss": -7.29463005065918, "global_step": 196087, "epoch": 4668} {"train_loss": -7.310795307159424, "global_step": 196088, "epoch": 4668} {"train_loss": -7.276217460632324, "global_step": 196089, "epoch": 4668} {"train_loss": -7.249391555786133, "global_step": 196090, "epoch": 4668} {"train_loss": -7.283869743347168, "global_step": 196091, "epoch": 4668} {"train_loss": -7.219900608062744, "global_step": 196092, "epoch": 4668} {"train_loss": -7.30915641784668, "global_step": 196093, "epoch": 4668} {"train_loss": -7.176183223724365, "global_step": 196094, "epoch": 4668} {"train_loss": -7.254917621612549, "global_step": 196095, "epoch": 4668} {"train_loss": -7.284797668457031, "global_step": 196096, "epoch": 4668} {"train_loss": -7.269963298525129, "global_step": 196097, "epoch": 4668, "val_loss": 69634.1015625} {"train_loss": -7.2978196144104, "global_step": 196098, "epoch": 4669} {"train_loss": -7.178593158721924, "global_step": 196099, "epoch": 4669} {"train_loss": -7.325565338134766, "global_step": 196100, "epoch": 4669} {"train_loss": -7.104983329772949, "global_step": 196101, "epoch": 4669} {"train_loss": -7.313388824462891, "global_step": 196102, "epoch": 4669} {"train_loss": -7.3449249267578125, "global_step": 196103, "epoch": 4669} {"train_loss": -7.266768455505371, "global_step": 196104, "epoch": 4669} {"train_loss": -7.235196590423584, "global_step": 196105, "epoch": 4669} {"train_loss": -7.3034467697143555, "global_step": 196106, "epoch": 4669} {"train_loss": -7.19342565536499, "global_step": 196107, "epoch": 4669} {"train_loss": -7.238837242126465, "global_step": 196108, "epoch": 4669} {"train_loss": -7.345467567443848, "global_step": 196109, "epoch": 4669} {"train_loss": -7.278423309326172, "global_step": 196110, "epoch": 4669} {"train_loss": -7.212395668029785, "global_step": 196111, "epoch": 4669} {"train_loss": -7.318672180175781, "global_step": 196112, "epoch": 4669} {"train_loss": -7.2400312423706055, "global_step": 196113, "epoch": 4669} {"train_loss": -7.270162582397461, "global_step": 196114, "epoch": 4669} {"train_loss": -7.130727767944336, "global_step": 196115, "epoch": 4669} {"train_loss": -7.234335899353027, "global_step": 196116, "epoch": 4669} {"train_loss": -7.283498287200928, "global_step": 196117, "epoch": 4669} {"train_loss": -7.273063659667969, "global_step": 196118, "epoch": 4669} {"train_loss": -7.196839809417725, "global_step": 196119, "epoch": 4669} {"train_loss": -7.267461776733398, "global_step": 196120, "epoch": 4669} {"train_loss": -7.105472564697266, "global_step": 196121, "epoch": 4669} {"train_loss": -7.17919921875, "global_step": 196122, "epoch": 4669} {"train_loss": -7.259130001068115, "global_step": 196123, "epoch": 4669} {"train_loss": -7.3027238845825195, "global_step": 196124, "epoch": 4669} {"train_loss": -7.309821605682373, "global_step": 196125, "epoch": 4669} {"train_loss": -7.191679000854492, "global_step": 196126, "epoch": 4669} {"train_loss": -7.29607629776001, "global_step": 196127, "epoch": 4669} {"train_loss": -7.1774773597717285, "global_step": 196128, "epoch": 4669} {"train_loss": -7.302282810211182, "global_step": 196129, "epoch": 4669} {"train_loss": -7.067196846008301, "global_step": 196130, "epoch": 4669} {"train_loss": -7.205750465393066, "global_step": 196131, "epoch": 4669} {"train_loss": -7.2534260749816895, "global_step": 196132, "epoch": 4669} {"train_loss": -7.141508102416992, "global_step": 196133, "epoch": 4669} {"train_loss": -7.172675132751465, "global_step": 196134, "epoch": 4669} {"train_loss": -7.104381084442139, "global_step": 196135, "epoch": 4669} {"train_loss": -7.235715866088867, "global_step": 196136, "epoch": 4669} {"train_loss": -7.160040855407715, "global_step": 196137, "epoch": 4669} {"train_loss": -7.1148905754089355, "global_step": 196138, "epoch": 4669} {"train_loss": -7.227855285008748, "global_step": 196139, "epoch": 4669, "val_loss": 69836.3046875} {"train_loss": -7.258204460144043, "global_step": 196140, "epoch": 4670} {"train_loss": -7.238155364990234, "global_step": 196141, "epoch": 4670} {"train_loss": -7.251649856567383, "global_step": 196142, "epoch": 4670} {"train_loss": -7.191044807434082, "global_step": 196143, "epoch": 4670} {"train_loss": -7.101408958435059, "global_step": 196144, "epoch": 4670} {"train_loss": -7.2621660232543945, "global_step": 196145, "epoch": 4670} {"train_loss": -7.247793674468994, "global_step": 196146, "epoch": 4670} {"train_loss": -7.361748695373535, "global_step": 196147, "epoch": 4670} {"train_loss": -7.263357639312744, "global_step": 196148, "epoch": 4670} {"train_loss": -7.155844211578369, "global_step": 196149, "epoch": 4670} {"train_loss": -7.273333549499512, "global_step": 196150, "epoch": 4670} {"train_loss": -7.240624904632568, "global_step": 196151, "epoch": 4670} {"train_loss": -7.273347854614258, "global_step": 196152, "epoch": 4670} {"train_loss": -7.155426979064941, "global_step": 196153, "epoch": 4670} {"train_loss": -7.2475457191467285, "global_step": 196154, "epoch": 4670} {"train_loss": -7.201532363891602, "global_step": 196155, "epoch": 4670} {"train_loss": -7.244671821594238, "global_step": 196156, "epoch": 4670} {"train_loss": -7.2783002853393555, "global_step": 196157, "epoch": 4670} {"train_loss": -7.3199262619018555, "global_step": 196158, "epoch": 4670} {"train_loss": -7.136898994445801, "global_step": 196159, "epoch": 4670} {"train_loss": -7.265994548797607, "global_step": 196160, "epoch": 4670} {"train_loss": -7.215969085693359, "global_step": 196161, "epoch": 4670} {"train_loss": -7.180638790130615, "global_step": 196162, "epoch": 4670} {"train_loss": -7.2887864112854, "global_step": 196163, "epoch": 4670} {"train_loss": -7.269257545471191, "global_step": 196164, "epoch": 4670} {"train_loss": -7.180545806884766, "global_step": 196165, "epoch": 4670} {"train_loss": -7.350044250488281, "global_step": 196166, "epoch": 4670} {"train_loss": -7.2020721435546875, "global_step": 196167, "epoch": 4670} {"train_loss": -7.26724910736084, "global_step": 196168, "epoch": 4670} {"train_loss": -7.266231536865234, "global_step": 196169, "epoch": 4670} {"train_loss": -7.270632266998291, "global_step": 196170, "epoch": 4670} {"train_loss": -7.2551589012146, "global_step": 196171, "epoch": 4670} {"train_loss": -7.3536481857299805, "global_step": 196172, "epoch": 4670} {"train_loss": -7.175570964813232, "global_step": 196173, "epoch": 4670} {"train_loss": -7.270791053771973, "global_step": 196174, "epoch": 4670} {"train_loss": -7.306140899658203, "global_step": 196175, "epoch": 4670} {"train_loss": -7.137640953063965, "global_step": 196176, "epoch": 4670} {"train_loss": -7.228628158569336, "global_step": 196177, "epoch": 4670} {"train_loss": -7.306188583374023, "global_step": 196178, "epoch": 4670} {"train_loss": -7.252691268920898, "global_step": 196179, "epoch": 4670} {"train_loss": -7.204689025878906, "global_step": 196180, "epoch": 4670} {"train_loss": -7.246588548024495, "global_step": 196181, "epoch": 4670, "val_loss": 69653.1640625} {"train_loss": -7.2288923263549805, "global_step": 196182, "epoch": 4671} {"train_loss": -7.209080696105957, "global_step": 196183, "epoch": 4671} {"train_loss": -7.259589195251465, "global_step": 196184, "epoch": 4671} {"train_loss": -7.247628211975098, "global_step": 196185, "epoch": 4671} {"train_loss": -7.247361660003662, "global_step": 196186, "epoch": 4671} {"train_loss": -7.247838020324707, "global_step": 196187, "epoch": 4671} {"train_loss": -7.352531433105469, "global_step": 196188, "epoch": 4671} {"train_loss": -7.2781877517700195, "global_step": 196189, "epoch": 4671} {"train_loss": -7.311274528503418, "global_step": 196190, "epoch": 4671} {"train_loss": -7.197833061218262, "global_step": 196191, "epoch": 4671} {"train_loss": -7.420221328735352, "global_step": 196192, "epoch": 4671} {"train_loss": -7.204273700714111, "global_step": 196193, "epoch": 4671} {"train_loss": -7.260501861572266, "global_step": 196194, "epoch": 4671} {"train_loss": -7.320013046264648, "global_step": 196195, "epoch": 4671} {"train_loss": -7.334737777709961, "global_step": 196196, "epoch": 4671} {"train_loss": -7.174627780914307, "global_step": 196197, "epoch": 4671} {"train_loss": -7.277403831481934, "global_step": 196198, "epoch": 4671} {"train_loss": -7.289543628692627, "global_step": 196199, "epoch": 4671} {"train_loss": -7.190761089324951, "global_step": 196200, "epoch": 4671} {"train_loss": -7.225141525268555, "global_step": 196201, "epoch": 4671} {"train_loss": -7.231678009033203, "global_step": 196202, "epoch": 4671} {"train_loss": -7.21638822555542, "global_step": 196203, "epoch": 4671} {"train_loss": -7.316601753234863, "global_step": 196204, "epoch": 4671} {"train_loss": -7.280492782592773, "global_step": 196205, "epoch": 4671} {"train_loss": -7.224438667297363, "global_step": 196206, "epoch": 4671} {"train_loss": -7.306436538696289, "global_step": 196207, "epoch": 4671} {"train_loss": -7.328727722167969, "global_step": 196208, "epoch": 4671} {"train_loss": -7.106822967529297, "global_step": 196209, "epoch": 4671} {"train_loss": -7.1924824714660645, "global_step": 196210, "epoch": 4671} {"train_loss": -7.276116847991943, "global_step": 196211, "epoch": 4671} {"train_loss": -7.220200061798096, "global_step": 196212, "epoch": 4671} {"train_loss": -7.282461166381836, "global_step": 196213, "epoch": 4671} {"train_loss": -7.257669448852539, "global_step": 196214, "epoch": 4671} {"train_loss": -7.319790363311768, "global_step": 196215, "epoch": 4671} {"train_loss": -7.093337059020996, "global_step": 196216, "epoch": 4671} {"train_loss": -7.3176655769348145, "global_step": 196217, "epoch": 4671} {"train_loss": -7.231806755065918, "global_step": 196218, "epoch": 4671} {"train_loss": -7.158490180969238, "global_step": 196219, "epoch": 4671} {"train_loss": -7.227437973022461, "global_step": 196220, "epoch": 4671} {"train_loss": -7.117301940917969, "global_step": 196221, "epoch": 4671} {"train_loss": -7.210956573486328, "global_step": 196222, "epoch": 4671} {"train_loss": -7.24694732257298, "global_step": 196223, "epoch": 4671, "val_loss": 69718.0859375} {"train_loss": -7.1749162673950195, "global_step": 196224, "epoch": 4672} {"train_loss": -7.240671157836914, "global_step": 196225, "epoch": 4672} {"train_loss": -7.255019187927246, "global_step": 196226, "epoch": 4672} {"train_loss": -7.311795234680176, "global_step": 196227, "epoch": 4672} {"train_loss": -7.340381622314453, "global_step": 196228, "epoch": 4672} {"train_loss": -7.237282752990723, "global_step": 196229, "epoch": 4672} {"train_loss": -7.120608806610107, "global_step": 196230, "epoch": 4672} {"train_loss": -7.241102695465088, "global_step": 196231, "epoch": 4672} {"train_loss": -7.326031684875488, "global_step": 196232, "epoch": 4672} {"train_loss": -7.224606513977051, "global_step": 196233, "epoch": 4672} {"train_loss": -7.173372745513916, "global_step": 196234, "epoch": 4672} {"train_loss": -7.345760822296143, "global_step": 196235, "epoch": 4672} {"train_loss": -7.262315273284912, "global_step": 196236, "epoch": 4672} {"train_loss": -7.261542320251465, "global_step": 196237, "epoch": 4672} {"train_loss": -7.296552658081055, "global_step": 196238, "epoch": 4672} {"train_loss": -7.128900051116943, "global_step": 196239, "epoch": 4672} {"train_loss": -7.225884914398193, "global_step": 196240, "epoch": 4672} {"train_loss": -7.250347137451172, "global_step": 196241, "epoch": 4672} {"train_loss": -7.253571510314941, "global_step": 196242, "epoch": 4672} {"train_loss": -7.22078800201416, "global_step": 196243, "epoch": 4672} {"train_loss": -7.0399556159973145, "global_step": 196244, "epoch": 4672} {"train_loss": -7.040008068084717, "global_step": 196245, "epoch": 4672} {"train_loss": -7.216720104217529, "global_step": 196246, "epoch": 4672} {"train_loss": -6.984676361083984, "global_step": 196247, "epoch": 4672} {"train_loss": -7.285529136657715, "global_step": 196248, "epoch": 4672} {"train_loss": -7.122096538543701, "global_step": 196249, "epoch": 4672} {"train_loss": -7.215146064758301, "global_step": 196250, "epoch": 4672} {"train_loss": -7.304730415344238, "global_step": 196251, "epoch": 4672} {"train_loss": -7.140953063964844, "global_step": 196252, "epoch": 4672} {"train_loss": -7.1720147132873535, "global_step": 196253, "epoch": 4672} {"train_loss": -7.199930667877197, "global_step": 196254, "epoch": 4672} {"train_loss": -7.160597801208496, "global_step": 196255, "epoch": 4672} {"train_loss": -7.151073455810547, "global_step": 196256, "epoch": 4672} {"train_loss": -7.338692665100098, "global_step": 196257, "epoch": 4672} {"train_loss": -7.094374179840088, "global_step": 196258, "epoch": 4672} {"train_loss": -7.1777849197387695, "global_step": 196259, "epoch": 4672} {"train_loss": -7.233850479125977, "global_step": 196260, "epoch": 4672} {"train_loss": -7.098817825317383, "global_step": 196261, "epoch": 4672} {"train_loss": -7.281253814697266, "global_step": 196262, "epoch": 4672} {"train_loss": -7.288935661315918, "global_step": 196263, "epoch": 4672} {"train_loss": -7.039637565612793, "global_step": 196264, "epoch": 4672} {"train_loss": -7.207441443488712, "global_step": 196265, "epoch": 4672, "val_loss": 69732.0859375} {"train_loss": -7.211774826049805, "global_step": 196266, "epoch": 4673} {"train_loss": -7.127721786499023, "global_step": 196267, "epoch": 4673} {"train_loss": -7.222054481506348, "global_step": 196268, "epoch": 4673} {"train_loss": -7.193000316619873, "global_step": 196269, "epoch": 4673} {"train_loss": -7.094786643981934, "global_step": 196270, "epoch": 4673} {"train_loss": -7.228401184082031, "global_step": 196271, "epoch": 4673} {"train_loss": -7.003282070159912, "global_step": 196272, "epoch": 4673} {"train_loss": -7.297290802001953, "global_step": 196273, "epoch": 4673} {"train_loss": -7.147305488586426, "global_step": 196274, "epoch": 4673} {"train_loss": -6.9670562744140625, "global_step": 196275, "epoch": 4673} {"train_loss": -7.179730415344238, "global_step": 196276, "epoch": 4673} {"train_loss": -7.083721160888672, "global_step": 196277, "epoch": 4673} {"train_loss": -7.074530601501465, "global_step": 196278, "epoch": 4673} {"train_loss": -7.1779279708862305, "global_step": 196279, "epoch": 4673} {"train_loss": -7.042750358581543, "global_step": 196280, "epoch": 4673} {"train_loss": -7.122218608856201, "global_step": 196281, "epoch": 4673} {"train_loss": -6.971765518188477, "global_step": 196282, "epoch": 4673} {"train_loss": -7.232285022735596, "global_step": 196283, "epoch": 4673} {"train_loss": -7.07503604888916, "global_step": 196284, "epoch": 4673} {"train_loss": -7.15904426574707, "global_step": 196285, "epoch": 4673} {"train_loss": -7.128281593322754, "global_step": 196286, "epoch": 4673} {"train_loss": -7.165172576904297, "global_step": 196287, "epoch": 4673} {"train_loss": -7.092410087585449, "global_step": 196288, "epoch": 4673} {"train_loss": -7.171559810638428, "global_step": 196289, "epoch": 4673} {"train_loss": -7.140864372253418, "global_step": 196290, "epoch": 4673} {"train_loss": -7.12217378616333, "global_step": 196291, "epoch": 4673} {"train_loss": -7.192485332489014, "global_step": 196292, "epoch": 4673} {"train_loss": -7.1194987297058105, "global_step": 196293, "epoch": 4673} {"train_loss": -7.035528182983398, "global_step": 196294, "epoch": 4673} {"train_loss": -7.225345611572266, "global_step": 196295, "epoch": 4673} {"train_loss": -7.195782661437988, "global_step": 196296, "epoch": 4673} {"train_loss": -7.269708633422852, "global_step": 196297, "epoch": 4673} {"train_loss": -7.217197418212891, "global_step": 196298, "epoch": 4673} {"train_loss": -7.231980800628662, "global_step": 196299, "epoch": 4673} {"train_loss": -7.313251495361328, "global_step": 196300, "epoch": 4673} {"train_loss": -7.231572151184082, "global_step": 196301, "epoch": 4673} {"train_loss": -7.244341850280762, "global_step": 196302, "epoch": 4673} {"train_loss": -7.125356674194336, "global_step": 196303, "epoch": 4673} {"train_loss": -7.205291271209717, "global_step": 196304, "epoch": 4673} {"train_loss": -7.236051082611084, "global_step": 196305, "epoch": 4673} {"train_loss": -7.242770195007324, "global_step": 196306, "epoch": 4673} {"train_loss": -7.162169501894996, "global_step": 196307, "epoch": 4673, "val_loss": 69745.90625} {"train_loss": -7.340122699737549, "global_step": 196308, "epoch": 4674} {"train_loss": -7.293652534484863, "global_step": 196309, "epoch": 4674} {"train_loss": -7.293155670166016, "global_step": 196310, "epoch": 4674} {"train_loss": -7.296152114868164, "global_step": 196311, "epoch": 4674} {"train_loss": -7.2859344482421875, "global_step": 196312, "epoch": 4674} {"train_loss": -7.336559295654297, "global_step": 196313, "epoch": 4674} {"train_loss": -7.232281684875488, "global_step": 196314, "epoch": 4674} {"train_loss": -7.347975730895996, "global_step": 196315, "epoch": 4674} {"train_loss": -7.300477027893066, "global_step": 196316, "epoch": 4674} {"train_loss": -7.315852642059326, "global_step": 196317, "epoch": 4674} {"train_loss": -7.381036758422852, "global_step": 196318, "epoch": 4674} {"train_loss": -7.347800254821777, "global_step": 196319, "epoch": 4674} {"train_loss": -7.290239334106445, "global_step": 196320, "epoch": 4674} {"train_loss": -7.282679557800293, "global_step": 196321, "epoch": 4674} {"train_loss": -7.296462059020996, "global_step": 196322, "epoch": 4674} {"train_loss": -7.373514175415039, "global_step": 196323, "epoch": 4674} {"train_loss": -7.205109119415283, "global_step": 196324, "epoch": 4674} {"train_loss": -7.191187858581543, "global_step": 196325, "epoch": 4674} {"train_loss": -7.245800018310547, "global_step": 196326, "epoch": 4674} {"train_loss": -7.265456199645996, "global_step": 196327, "epoch": 4674} {"train_loss": -7.240190505981445, "global_step": 196328, "epoch": 4674} {"train_loss": -7.2266740798950195, "global_step": 196329, "epoch": 4674} {"train_loss": -7.267949104309082, "global_step": 196330, "epoch": 4674} {"train_loss": -7.226527690887451, "global_step": 196331, "epoch": 4674} {"train_loss": -7.395491600036621, "global_step": 196332, "epoch": 4674} {"train_loss": -7.277958869934082, "global_step": 196333, "epoch": 4674} {"train_loss": -7.222264766693115, "global_step": 196334, "epoch": 4674} {"train_loss": -7.327842712402344, "global_step": 196335, "epoch": 4674} {"train_loss": -7.277779579162598, "global_step": 196336, "epoch": 4674} {"train_loss": -7.264196395874023, "global_step": 196337, "epoch": 4674} {"train_loss": -7.296930313110352, "global_step": 196338, "epoch": 4674} {"train_loss": -7.2918195724487305, "global_step": 196339, "epoch": 4674} {"train_loss": -7.237964630126953, "global_step": 196340, "epoch": 4674} {"train_loss": -7.2787981033325195, "global_step": 196341, "epoch": 4674} {"train_loss": -7.293051719665527, "global_step": 196342, "epoch": 4674} {"train_loss": -7.236782550811768, "global_step": 196343, "epoch": 4674} {"train_loss": -7.237603187561035, "global_step": 196344, "epoch": 4674} {"train_loss": -7.301584243774414, "global_step": 196345, "epoch": 4674} {"train_loss": -7.2006988525390625, "global_step": 196346, "epoch": 4674} {"train_loss": -7.318629264831543, "global_step": 196347, "epoch": 4674} {"train_loss": -7.313487529754639, "global_step": 196348, "epoch": 4674} {"train_loss": -7.281801575706119, "global_step": 196349, "epoch": 4674, "val_loss": 69721.125} {"train_loss": -7.3530731201171875, "global_step": 196350, "epoch": 4675} {"train_loss": -7.301437854766846, "global_step": 196351, "epoch": 4675} {"train_loss": -7.379400253295898, "global_step": 196352, "epoch": 4675} {"train_loss": -7.260400772094727, "global_step": 196353, "epoch": 4675} {"train_loss": -7.250470161437988, "global_step": 196354, "epoch": 4675} {"train_loss": -7.309370994567871, "global_step": 196355, "epoch": 4675} {"train_loss": -7.283054351806641, "global_step": 196356, "epoch": 4675} {"train_loss": -7.267913341522217, "global_step": 196357, "epoch": 4675} {"train_loss": -7.361799716949463, "global_step": 196358, "epoch": 4675} {"train_loss": -7.367992877960205, "global_step": 196359, "epoch": 4675} {"train_loss": -7.296238422393799, "global_step": 196360, "epoch": 4675} {"train_loss": -7.246059417724609, "global_step": 196361, "epoch": 4675} {"train_loss": -7.241438865661621, "global_step": 196362, "epoch": 4675} {"train_loss": -7.403260231018066, "global_step": 196363, "epoch": 4675} {"train_loss": -7.21164608001709, "global_step": 196364, "epoch": 4675} {"train_loss": -7.3552775382995605, "global_step": 196365, "epoch": 4675} {"train_loss": -7.233400344848633, "global_step": 196366, "epoch": 4675} {"train_loss": -7.327478408813477, "global_step": 196367, "epoch": 4675} {"train_loss": -7.185379505157471, "global_step": 196368, "epoch": 4675} {"train_loss": -7.220970153808594, "global_step": 196369, "epoch": 4675} {"train_loss": -7.230574607849121, "global_step": 196370, "epoch": 4675} {"train_loss": -7.250300884246826, "global_step": 196371, "epoch": 4675} {"train_loss": -7.402743816375732, "global_step": 196372, "epoch": 4675} {"train_loss": -7.24420166015625, "global_step": 196373, "epoch": 4675} {"train_loss": -7.1987504959106445, "global_step": 196374, "epoch": 4675} {"train_loss": -7.323306083679199, "global_step": 196375, "epoch": 4675} {"train_loss": -7.321509838104248, "global_step": 196376, "epoch": 4675} {"train_loss": -7.10782527923584, "global_step": 196377, "epoch": 4675} {"train_loss": -7.294341087341309, "global_step": 196378, "epoch": 4675} {"train_loss": -7.42348051071167, "global_step": 196379, "epoch": 4675} {"train_loss": -7.288286209106445, "global_step": 196380, "epoch": 4675} {"train_loss": -7.195616722106934, "global_step": 196381, "epoch": 4675} {"train_loss": -7.254708290100098, "global_step": 196382, "epoch": 4675} {"train_loss": -7.267796993255615, "global_step": 196383, "epoch": 4675} {"train_loss": -7.356717109680176, "global_step": 196384, "epoch": 4675} {"train_loss": -7.323472023010254, "global_step": 196385, "epoch": 4675} {"train_loss": -7.2216620445251465, "global_step": 196386, "epoch": 4675} {"train_loss": -7.339626312255859, "global_step": 196387, "epoch": 4675} {"train_loss": -7.194522380828857, "global_step": 196388, "epoch": 4675} {"train_loss": -7.143487453460693, "global_step": 196389, "epoch": 4675} {"train_loss": -7.248518943786621, "global_step": 196390, "epoch": 4675} {"train_loss": -7.279867024648757, "global_step": 196391, "epoch": 4675, "val_loss": 69699.9140625} {"train_loss": -7.126448631286621, "global_step": 196392, "epoch": 4676} {"train_loss": -7.182269096374512, "global_step": 196393, "epoch": 4676} {"train_loss": -7.216165065765381, "global_step": 196394, "epoch": 4676} {"train_loss": -7.184414863586426, "global_step": 196395, "epoch": 4676} {"train_loss": -7.213804721832275, "global_step": 196396, "epoch": 4676} {"train_loss": -7.231631278991699, "global_step": 196397, "epoch": 4676} {"train_loss": -7.151197910308838, "global_step": 196398, "epoch": 4676} {"train_loss": -7.130614757537842, "global_step": 196399, "epoch": 4676} {"train_loss": -7.207350254058838, "global_step": 196400, "epoch": 4676} {"train_loss": -7.119261264801025, "global_step": 196401, "epoch": 4676} {"train_loss": -7.111941337585449, "global_step": 196402, "epoch": 4676} {"train_loss": -7.161118507385254, "global_step": 196403, "epoch": 4676} {"train_loss": -7.037510871887207, "global_step": 196404, "epoch": 4676} {"train_loss": -7.198504447937012, "global_step": 196405, "epoch": 4676} {"train_loss": -7.189820766448975, "global_step": 196406, "epoch": 4676} {"train_loss": -6.984463691711426, "global_step": 196407, "epoch": 4676} {"train_loss": -7.05716609954834, "global_step": 196408, "epoch": 4676} {"train_loss": -7.084802627563477, "global_step": 196409, "epoch": 4676} {"train_loss": -7.035236358642578, "global_step": 196410, "epoch": 4676} {"train_loss": -7.106627464294434, "global_step": 196411, "epoch": 4676} {"train_loss": -7.115904808044434, "global_step": 196412, "epoch": 4676} {"train_loss": -7.132452011108398, "global_step": 196413, "epoch": 4676} {"train_loss": -7.178630352020264, "global_step": 196414, "epoch": 4676} {"train_loss": -7.202200889587402, "global_step": 196415, "epoch": 4676} {"train_loss": -7.137007713317871, "global_step": 196416, "epoch": 4676} {"train_loss": -7.175511837005615, "global_step": 196417, "epoch": 4676} {"train_loss": -7.126818656921387, "global_step": 196418, "epoch": 4676} {"train_loss": -7.113747596740723, "global_step": 196419, "epoch": 4676} {"train_loss": -7.197876453399658, "global_step": 196420, "epoch": 4676} {"train_loss": -7.111435890197754, "global_step": 196421, "epoch": 4676} {"train_loss": -7.196785926818848, "global_step": 196422, "epoch": 4676} {"train_loss": -7.1743316650390625, "global_step": 196423, "epoch": 4676} {"train_loss": -7.327773094177246, "global_step": 196424, "epoch": 4676} {"train_loss": -7.213677406311035, "global_step": 196425, "epoch": 4676} {"train_loss": -7.314465045928955, "global_step": 196426, "epoch": 4676} {"train_loss": -7.188292503356934, "global_step": 196427, "epoch": 4676} {"train_loss": -7.300196647644043, "global_step": 196428, "epoch": 4676} {"train_loss": -7.312921047210693, "global_step": 196429, "epoch": 4676} {"train_loss": -7.19837760925293, "global_step": 196430, "epoch": 4676} {"train_loss": -7.1406450271606445, "global_step": 196431, "epoch": 4676} {"train_loss": -7.099634170532227, "global_step": 196432, "epoch": 4676} {"train_loss": -7.1655988693237305, "global_step": 196433, "epoch": 4676, "val_loss": 69627.015625} {"train_loss": -7.263971328735352, "global_step": 196434, "epoch": 4677} {"train_loss": -7.139827251434326, "global_step": 196435, "epoch": 4677} {"train_loss": -7.337590217590332, "global_step": 196436, "epoch": 4677} {"train_loss": -7.255407810211182, "global_step": 196437, "epoch": 4677} {"train_loss": -7.307312965393066, "global_step": 196438, "epoch": 4677} {"train_loss": -7.257957458496094, "global_step": 196439, "epoch": 4677} {"train_loss": -7.29287576675415, "global_step": 196440, "epoch": 4677} {"train_loss": -7.242578506469727, "global_step": 196441, "epoch": 4677} {"train_loss": -7.238402366638184, "global_step": 196442, "epoch": 4677} {"train_loss": -7.355569839477539, "global_step": 196443, "epoch": 4677} {"train_loss": -7.260126113891602, "global_step": 196444, "epoch": 4677} {"train_loss": -7.267160415649414, "global_step": 196445, "epoch": 4677} {"train_loss": -7.220757484436035, "global_step": 196446, "epoch": 4677} {"train_loss": -7.257060527801514, "global_step": 196447, "epoch": 4677} {"train_loss": -7.240005970001221, "global_step": 196448, "epoch": 4677} {"train_loss": -7.252374172210693, "global_step": 196449, "epoch": 4677} {"train_loss": -7.199092864990234, "global_step": 196450, "epoch": 4677} {"train_loss": -7.303175926208496, "global_step": 196451, "epoch": 4677} {"train_loss": -7.228281021118164, "global_step": 196452, "epoch": 4677} {"train_loss": -7.275798320770264, "global_step": 196453, "epoch": 4677} {"train_loss": -7.246238708496094, "global_step": 196454, "epoch": 4677} {"train_loss": -7.3553080558776855, "global_step": 196455, "epoch": 4677} {"train_loss": -7.287041664123535, "global_step": 196456, "epoch": 4677} {"train_loss": -7.261801719665527, "global_step": 196457, "epoch": 4677} {"train_loss": -7.280346870422363, "global_step": 196458, "epoch": 4677} {"train_loss": -7.278383255004883, "global_step": 196459, "epoch": 4677} {"train_loss": -7.2215352058410645, "global_step": 196460, "epoch": 4677} {"train_loss": -7.105503082275391, "global_step": 196461, "epoch": 4677} {"train_loss": -7.127889633178711, "global_step": 196462, "epoch": 4677} {"train_loss": -7.2686333656311035, "global_step": 196463, "epoch": 4677} {"train_loss": -7.251134872436523, "global_step": 196464, "epoch": 4677} {"train_loss": -7.212133407592773, "global_step": 196465, "epoch": 4677} {"train_loss": -7.218555450439453, "global_step": 196466, "epoch": 4677} {"train_loss": -7.085422992706299, "global_step": 196467, "epoch": 4677} {"train_loss": -7.080989837646484, "global_step": 196468, "epoch": 4677} {"train_loss": -7.124846935272217, "global_step": 196469, "epoch": 4677} {"train_loss": -7.157593727111816, "global_step": 196470, "epoch": 4677} {"train_loss": -7.284992218017578, "global_step": 196471, "epoch": 4677} {"train_loss": -7.154603958129883, "global_step": 196472, "epoch": 4677} {"train_loss": -7.192378044128418, "global_step": 196473, "epoch": 4677} {"train_loss": -7.214136123657227, "global_step": 196474, "epoch": 4677} {"train_loss": -7.231725408917382, "global_step": 196475, "epoch": 4677, "val_loss": 69887.671875} {"train_loss": -7.262382507324219, "global_step": 196476, "epoch": 4678} {"train_loss": -7.24803352355957, "global_step": 196477, "epoch": 4678} {"train_loss": -7.214387893676758, "global_step": 196478, "epoch": 4678} {"train_loss": -7.288050651550293, "global_step": 196479, "epoch": 4678} {"train_loss": -7.182411193847656, "global_step": 196480, "epoch": 4678} {"train_loss": -7.257984638214111, "global_step": 196481, "epoch": 4678} {"train_loss": -7.19422721862793, "global_step": 196482, "epoch": 4678} {"train_loss": -7.13358211517334, "global_step": 196483, "epoch": 4678} {"train_loss": -7.187717437744141, "global_step": 196484, "epoch": 4678} {"train_loss": -7.055962562561035, "global_step": 196485, "epoch": 4678} {"train_loss": -7.35532808303833, "global_step": 196486, "epoch": 4678} {"train_loss": -7.154483795166016, "global_step": 196487, "epoch": 4678} {"train_loss": -7.043680667877197, "global_step": 196488, "epoch": 4678} {"train_loss": -7.209941864013672, "global_step": 196489, "epoch": 4678} {"train_loss": -6.838327407836914, "global_step": 196490, "epoch": 4678} {"train_loss": -7.036888599395752, "global_step": 196491, "epoch": 4678} {"train_loss": -7.175948143005371, "global_step": 196492, "epoch": 4678} {"train_loss": -7.096375465393066, "global_step": 196493, "epoch": 4678} {"train_loss": -7.154940605163574, "global_step": 196494, "epoch": 4678} {"train_loss": -7.096775054931641, "global_step": 196495, "epoch": 4678} {"train_loss": -7.159134387969971, "global_step": 196496, "epoch": 4678} {"train_loss": -7.246063709259033, "global_step": 196497, "epoch": 4678} {"train_loss": -7.136823654174805, "global_step": 196498, "epoch": 4678} {"train_loss": -7.219459056854248, "global_step": 196499, "epoch": 4678} {"train_loss": -7.094614028930664, "global_step": 196500, "epoch": 4678} {"train_loss": -7.189834117889404, "global_step": 196501, "epoch": 4678} {"train_loss": -7.147353172302246, "global_step": 196502, "epoch": 4678} {"train_loss": -7.338435173034668, "global_step": 196503, "epoch": 4678} {"train_loss": -7.115942478179932, "global_step": 196504, "epoch": 4678} {"train_loss": -7.229065418243408, "global_step": 196505, "epoch": 4678} {"train_loss": -7.1493120193481445, "global_step": 196506, "epoch": 4678} {"train_loss": -7.157354354858398, "global_step": 196507, "epoch": 4678} {"train_loss": -7.147519111633301, "global_step": 196508, "epoch": 4678} {"train_loss": -7.179262161254883, "global_step": 196509, "epoch": 4678} {"train_loss": -7.0758376121521, "global_step": 196510, "epoch": 4678} {"train_loss": -7.188099384307861, "global_step": 196511, "epoch": 4678} {"train_loss": -7.213548183441162, "global_step": 196512, "epoch": 4678} {"train_loss": -7.344587326049805, "global_step": 196513, "epoch": 4678} {"train_loss": -7.242466449737549, "global_step": 196514, "epoch": 4678} {"train_loss": -7.098863124847412, "global_step": 196515, "epoch": 4678} {"train_loss": -7.300339221954346, "global_step": 196516, "epoch": 4678} {"train_loss": -7.174871410642352, "global_step": 196517, "epoch": 4678, "val_loss": 69672.6015625} {"train_loss": -7.361401557922363, "global_step": 196518, "epoch": 4679} {"train_loss": -7.27260684967041, "global_step": 196519, "epoch": 4679} {"train_loss": -7.193707466125488, "global_step": 196520, "epoch": 4679} {"train_loss": -7.211897850036621, "global_step": 196521, "epoch": 4679} {"train_loss": -7.363051414489746, "global_step": 196522, "epoch": 4679} {"train_loss": -7.2706074714660645, "global_step": 196523, "epoch": 4679} {"train_loss": -7.286198139190674, "global_step": 196524, "epoch": 4679} {"train_loss": -7.349776268005371, "global_step": 196525, "epoch": 4679} {"train_loss": -7.277579307556152, "global_step": 196526, "epoch": 4679} {"train_loss": -7.221978187561035, "global_step": 196527, "epoch": 4679} {"train_loss": -7.275720119476318, "global_step": 196528, "epoch": 4679} {"train_loss": -7.277314186096191, "global_step": 196529, "epoch": 4679} {"train_loss": -7.288115501403809, "global_step": 196530, "epoch": 4679} {"train_loss": -7.240017890930176, "global_step": 196531, "epoch": 4679} {"train_loss": -7.233137130737305, "global_step": 196532, "epoch": 4679} {"train_loss": -7.250846862792969, "global_step": 196533, "epoch": 4679} {"train_loss": -7.232820987701416, "global_step": 196534, "epoch": 4679} {"train_loss": -7.304847717285156, "global_step": 196535, "epoch": 4679} {"train_loss": -7.35814905166626, "global_step": 196536, "epoch": 4679} {"train_loss": -7.306486129760742, "global_step": 196537, "epoch": 4679} {"train_loss": -7.2370829582214355, "global_step": 196538, "epoch": 4679} {"train_loss": -7.296347618103027, "global_step": 196539, "epoch": 4679} {"train_loss": -7.296103000640869, "global_step": 196540, "epoch": 4679} {"train_loss": -7.203265190124512, "global_step": 196541, "epoch": 4679} {"train_loss": -7.265847682952881, "global_step": 196542, "epoch": 4679} {"train_loss": -7.354388236999512, "global_step": 196543, "epoch": 4679} {"train_loss": -7.244487285614014, "global_step": 196544, "epoch": 4679} {"train_loss": -7.215808868408203, "global_step": 196545, "epoch": 4679} {"train_loss": -7.3335394859313965, "global_step": 196546, "epoch": 4679} {"train_loss": -7.28339147567749, "global_step": 196547, "epoch": 4679} {"train_loss": -7.165216445922852, "global_step": 196548, "epoch": 4679} {"train_loss": -7.149123191833496, "global_step": 196549, "epoch": 4679} {"train_loss": -7.131660461425781, "global_step": 196550, "epoch": 4679} {"train_loss": -7.037069320678711, "global_step": 196551, "epoch": 4679} {"train_loss": -7.305821418762207, "global_step": 196552, "epoch": 4679} {"train_loss": -7.134862899780273, "global_step": 196553, "epoch": 4679} {"train_loss": -7.230674743652344, "global_step": 196554, "epoch": 4679} {"train_loss": -7.159573554992676, "global_step": 196555, "epoch": 4679} {"train_loss": -7.115509033203125, "global_step": 196556, "epoch": 4679} {"train_loss": -7.188932418823242, "global_step": 196557, "epoch": 4679} {"train_loss": -7.132524013519287, "global_step": 196558, "epoch": 4679} {"train_loss": -7.24718393598284, "global_step": 196559, "epoch": 4679, "val_loss": 69759.109375} {"train_loss": -7.094428062438965, "global_step": 196560, "epoch": 4680} {"train_loss": -7.134459018707275, "global_step": 196561, "epoch": 4680} {"train_loss": -7.316157341003418, "global_step": 196562, "epoch": 4680} {"train_loss": -7.193324089050293, "global_step": 196563, "epoch": 4680} {"train_loss": -7.0759148597717285, "global_step": 196564, "epoch": 4680} {"train_loss": -7.231109142303467, "global_step": 196565, "epoch": 4680} {"train_loss": -7.2121357917785645, "global_step": 196566, "epoch": 4680} {"train_loss": -7.027883052825928, "global_step": 196567, "epoch": 4680} {"train_loss": -7.196427345275879, "global_step": 196568, "epoch": 4680} {"train_loss": -7.235953330993652, "global_step": 196569, "epoch": 4680} {"train_loss": -7.184375762939453, "global_step": 196570, "epoch": 4680} {"train_loss": -7.252291679382324, "global_step": 196571, "epoch": 4680} {"train_loss": -7.121372222900391, "global_step": 196572, "epoch": 4680} {"train_loss": -7.236480712890625, "global_step": 196573, "epoch": 4680} {"train_loss": -7.182196617126465, "global_step": 196574, "epoch": 4680} {"train_loss": -7.303976058959961, "global_step": 196575, "epoch": 4680} {"train_loss": -7.335415363311768, "global_step": 196576, "epoch": 4680} {"train_loss": -7.256940841674805, "global_step": 196577, "epoch": 4680} {"train_loss": -7.257256507873535, "global_step": 196578, "epoch": 4680} {"train_loss": -7.139270782470703, "global_step": 196579, "epoch": 4680} {"train_loss": -7.305659294128418, "global_step": 196580, "epoch": 4680} {"train_loss": -7.301589012145996, "global_step": 196581, "epoch": 4680} {"train_loss": -7.364772796630859, "global_step": 196582, "epoch": 4680} {"train_loss": -7.334639549255371, "global_step": 196583, "epoch": 4680} {"train_loss": -7.312804222106934, "global_step": 196584, "epoch": 4680} {"train_loss": -7.24672794342041, "global_step": 196585, "epoch": 4680} {"train_loss": -7.24983549118042, "global_step": 196586, "epoch": 4680} {"train_loss": -7.190943717956543, "global_step": 196587, "epoch": 4680} {"train_loss": -7.271042823791504, "global_step": 196588, "epoch": 4680} {"train_loss": -7.354036808013916, "global_step": 196589, "epoch": 4680} {"train_loss": -7.2174906730651855, "global_step": 196590, "epoch": 4680} {"train_loss": -7.240495681762695, "global_step": 196591, "epoch": 4680} {"train_loss": -7.094479560852051, "global_step": 196592, "epoch": 4680} {"train_loss": -7.210719585418701, "global_step": 196593, "epoch": 4680} {"train_loss": -7.284032344818115, "global_step": 196594, "epoch": 4680} {"train_loss": -7.142513275146484, "global_step": 196595, "epoch": 4680} {"train_loss": -7.0813422203063965, "global_step": 196596, "epoch": 4680} {"train_loss": -7.253413200378418, "global_step": 196597, "epoch": 4680} {"train_loss": -7.139867305755615, "global_step": 196598, "epoch": 4680} {"train_loss": -7.077584266662598, "global_step": 196599, "epoch": 4680} {"train_loss": -7.189488410949707, "global_step": 196600, "epoch": 4680} {"train_loss": -7.215847492218018, "global_step": 196601, "epoch": 4680, "val_loss": 69676.1796875} {"train_loss": -7.085174083709717, "global_step": 196602, "epoch": 4681} {"train_loss": -7.169476509094238, "global_step": 196603, "epoch": 4681} {"train_loss": -7.2359490394592285, "global_step": 196604, "epoch": 4681} {"train_loss": -7.051889896392822, "global_step": 196605, "epoch": 4681} {"train_loss": -7.2117533683776855, "global_step": 196606, "epoch": 4681} {"train_loss": -7.284908294677734, "global_step": 196607, "epoch": 4681} {"train_loss": -7.211487770080566, "global_step": 196608, "epoch": 4681} {"train_loss": -7.301743507385254, "global_step": 196609, "epoch": 4681} {"train_loss": -7.179975509643555, "global_step": 196610, "epoch": 4681} {"train_loss": -7.239110469818115, "global_step": 196611, "epoch": 4681} {"train_loss": -7.1924333572387695, "global_step": 196612, "epoch": 4681} {"train_loss": -7.249958038330078, "global_step": 196613, "epoch": 4681} {"train_loss": -7.220948219299316, "global_step": 196614, "epoch": 4681} {"train_loss": -7.254304885864258, "global_step": 196615, "epoch": 4681} {"train_loss": -7.251416206359863, "global_step": 196616, "epoch": 4681} {"train_loss": -7.242441177368164, "global_step": 196617, "epoch": 4681} {"train_loss": -7.297018051147461, "global_step": 196618, "epoch": 4681} {"train_loss": -7.311291694641113, "global_step": 196619, "epoch": 4681} {"train_loss": -7.299882888793945, "global_step": 196620, "epoch": 4681} {"train_loss": -7.349844932556152, "global_step": 196621, "epoch": 4681} {"train_loss": -7.134172439575195, "global_step": 196622, "epoch": 4681} {"train_loss": -7.3366923332214355, "global_step": 196623, "epoch": 4681} {"train_loss": -7.2776947021484375, "global_step": 196624, "epoch": 4681} {"train_loss": -7.183509349822998, "global_step": 196625, "epoch": 4681} {"train_loss": -7.266702175140381, "global_step": 196626, "epoch": 4681} {"train_loss": -7.247707843780518, "global_step": 196627, "epoch": 4681} {"train_loss": -7.234903335571289, "global_step": 196628, "epoch": 4681} {"train_loss": -7.3071794509887695, "global_step": 196629, "epoch": 4681} {"train_loss": -7.212352275848389, "global_step": 196630, "epoch": 4681} {"train_loss": -7.243900299072266, "global_step": 196631, "epoch": 4681} {"train_loss": -7.228603839874268, "global_step": 196632, "epoch": 4681} {"train_loss": -7.2487969398498535, "global_step": 196633, "epoch": 4681} {"train_loss": -7.1955742835998535, "global_step": 196634, "epoch": 4681} {"train_loss": -7.236906051635742, "global_step": 196635, "epoch": 4681} {"train_loss": -7.198812484741211, "global_step": 196636, "epoch": 4681} {"train_loss": -7.284786224365234, "global_step": 196637, "epoch": 4681} {"train_loss": -7.1171464920043945, "global_step": 196638, "epoch": 4681} {"train_loss": -7.131561756134033, "global_step": 196639, "epoch": 4681} {"train_loss": -7.129430770874023, "global_step": 196640, "epoch": 4681} {"train_loss": -7.235401630401611, "global_step": 196641, "epoch": 4681} {"train_loss": -7.078936576843262, "global_step": 196642, "epoch": 4681} {"train_loss": -7.2233344827379495, "global_step": 196643, "epoch": 4681, "val_loss": 69749.421875} {"train_loss": -7.147191047668457, "global_step": 196644, "epoch": 4682} {"train_loss": -7.073052406311035, "global_step": 196645, "epoch": 4682} {"train_loss": -7.131779670715332, "global_step": 196646, "epoch": 4682} {"train_loss": -7.079585075378418, "global_step": 196647, "epoch": 4682} {"train_loss": -7.201580047607422, "global_step": 196648, "epoch": 4682} {"train_loss": -7.13906192779541, "global_step": 196649, "epoch": 4682} {"train_loss": -7.170306205749512, "global_step": 196650, "epoch": 4682} {"train_loss": -7.294809818267822, "global_step": 196651, "epoch": 4682} {"train_loss": -7.167503356933594, "global_step": 196652, "epoch": 4682} {"train_loss": -7.230016708374023, "global_step": 196653, "epoch": 4682} {"train_loss": -7.110232830047607, "global_step": 196654, "epoch": 4682} {"train_loss": -7.241901397705078, "global_step": 196655, "epoch": 4682} {"train_loss": -7.200972557067871, "global_step": 196656, "epoch": 4682} {"train_loss": -7.158891201019287, "global_step": 196657, "epoch": 4682} {"train_loss": -7.315549850463867, "global_step": 196658, "epoch": 4682} {"train_loss": -7.201626777648926, "global_step": 196659, "epoch": 4682} {"train_loss": -7.187164306640625, "global_step": 196660, "epoch": 4682} {"train_loss": -7.159736633300781, "global_step": 196661, "epoch": 4682} {"train_loss": -7.195856094360352, "global_step": 196662, "epoch": 4682} {"train_loss": -7.20528507232666, "global_step": 196663, "epoch": 4682} {"train_loss": -7.083544731140137, "global_step": 196664, "epoch": 4682} {"train_loss": -7.2418928146362305, "global_step": 196665, "epoch": 4682} {"train_loss": -7.121616840362549, "global_step": 196666, "epoch": 4682} {"train_loss": -7.145867824554443, "global_step": 196667, "epoch": 4682} {"train_loss": -7.115260124206543, "global_step": 196668, "epoch": 4682} {"train_loss": -7.161578178405762, "global_step": 196669, "epoch": 4682} {"train_loss": -6.955384254455566, "global_step": 196670, "epoch": 4682} {"train_loss": -7.255692005157471, "global_step": 196671, "epoch": 4682} {"train_loss": -7.284101486206055, "global_step": 196672, "epoch": 4682} {"train_loss": -7.155797958374023, "global_step": 196673, "epoch": 4682} {"train_loss": -7.208721160888672, "global_step": 196674, "epoch": 4682} {"train_loss": -7.342055797576904, "global_step": 196675, "epoch": 4682} {"train_loss": -7.189900875091553, "global_step": 196676, "epoch": 4682} {"train_loss": -7.211480140686035, "global_step": 196677, "epoch": 4682} {"train_loss": -7.100568771362305, "global_step": 196678, "epoch": 4682} {"train_loss": -7.052796363830566, "global_step": 196679, "epoch": 4682} {"train_loss": -7.192966461181641, "global_step": 196680, "epoch": 4682} {"train_loss": -7.286734580993652, "global_step": 196681, "epoch": 4682} {"train_loss": -7.233029365539551, "global_step": 196682, "epoch": 4682} {"train_loss": -7.042691230773926, "global_step": 196683, "epoch": 4682} {"train_loss": -7.2338151931762695, "global_step": 196684, "epoch": 4682} {"train_loss": -7.175101041793823, "global_step": 196685, "epoch": 4682, "val_loss": 69847.734375} {"train_loss": -7.106302738189697, "global_step": 196686, "epoch": 4683} {"train_loss": -7.215172290802002, "global_step": 196687, "epoch": 4683} {"train_loss": -7.206850528717041, "global_step": 196688, "epoch": 4683} {"train_loss": -7.223779201507568, "global_step": 196689, "epoch": 4683} {"train_loss": -7.270395278930664, "global_step": 196690, "epoch": 4683} {"train_loss": -7.249671936035156, "global_step": 196691, "epoch": 4683} {"train_loss": -7.296228408813477, "global_step": 196692, "epoch": 4683} {"train_loss": -7.279616832733154, "global_step": 196693, "epoch": 4683} {"train_loss": -7.123096466064453, "global_step": 196694, "epoch": 4683} {"train_loss": -7.227640151977539, "global_step": 196695, "epoch": 4683} {"train_loss": -7.2590532302856445, "global_step": 196696, "epoch": 4683} {"train_loss": -7.233482360839844, "global_step": 196697, "epoch": 4683} {"train_loss": -7.33285665512085, "global_step": 196698, "epoch": 4683} {"train_loss": -7.270003318786621, "global_step": 196699, "epoch": 4683} {"train_loss": -7.183014869689941, "global_step": 196700, "epoch": 4683} {"train_loss": -7.202872276306152, "global_step": 196701, "epoch": 4683} {"train_loss": -7.256470680236816, "global_step": 196702, "epoch": 4683} {"train_loss": -7.3270463943481445, "global_step": 196703, "epoch": 4683} {"train_loss": -7.198034286499023, "global_step": 196704, "epoch": 4683} {"train_loss": -7.245667457580566, "global_step": 196705, "epoch": 4683} {"train_loss": -7.227383136749268, "global_step": 196706, "epoch": 4683} {"train_loss": -7.226398468017578, "global_step": 196707, "epoch": 4683} {"train_loss": -7.260663986206055, "global_step": 196708, "epoch": 4683} {"train_loss": -7.208674430847168, "global_step": 196709, "epoch": 4683} {"train_loss": -7.319128036499023, "global_step": 196710, "epoch": 4683} {"train_loss": -7.213548183441162, "global_step": 196711, "epoch": 4683} {"train_loss": -7.212231159210205, "global_step": 196712, "epoch": 4683} {"train_loss": -7.178399085998535, "global_step": 196713, "epoch": 4683} {"train_loss": -7.189835071563721, "global_step": 196714, "epoch": 4683} {"train_loss": -7.285478115081787, "global_step": 196715, "epoch": 4683} {"train_loss": -7.298836708068848, "global_step": 196716, "epoch": 4683} {"train_loss": -7.210100173950195, "global_step": 196717, "epoch": 4683} {"train_loss": -7.324553489685059, "global_step": 196718, "epoch": 4683} {"train_loss": -7.253610134124756, "global_step": 196719, "epoch": 4683} {"train_loss": -7.282198905944824, "global_step": 196720, "epoch": 4683} {"train_loss": -7.296989917755127, "global_step": 196721, "epoch": 4683} {"train_loss": -7.143375396728516, "global_step": 196722, "epoch": 4683} {"train_loss": -7.183047771453857, "global_step": 196723, "epoch": 4683} {"train_loss": -7.259495735168457, "global_step": 196724, "epoch": 4683} {"train_loss": -7.224210739135742, "global_step": 196725, "epoch": 4683} {"train_loss": -7.267941474914551, "global_step": 196726, "epoch": 4683} {"train_loss": -7.23798410097758, "global_step": 196727, "epoch": 4683, "val_loss": 69888.9453125} {"train_loss": -7.242925643920898, "global_step": 196728, "epoch": 4684} {"train_loss": -7.324949264526367, "global_step": 196729, "epoch": 4684} {"train_loss": -7.420497417449951, "global_step": 196730, "epoch": 4684} {"train_loss": -7.381389141082764, "global_step": 196731, "epoch": 4684} {"train_loss": -7.410198211669922, "global_step": 196732, "epoch": 4684} {"train_loss": -7.279168605804443, "global_step": 196733, "epoch": 4684} {"train_loss": -7.345510005950928, "global_step": 196734, "epoch": 4684} {"train_loss": -7.380876064300537, "global_step": 196735, "epoch": 4684} {"train_loss": -7.274667739868164, "global_step": 196736, "epoch": 4684} {"train_loss": -7.237270355224609, "global_step": 196737, "epoch": 4684} {"train_loss": -7.295638561248779, "global_step": 196738, "epoch": 4684} {"train_loss": -7.233720779418945, "global_step": 196739, "epoch": 4684} {"train_loss": -7.331210136413574, "global_step": 196740, "epoch": 4684} {"train_loss": -7.299887657165527, "global_step": 196741, "epoch": 4684} {"train_loss": -7.234277725219727, "global_step": 196742, "epoch": 4684} {"train_loss": -7.300145626068115, "global_step": 196743, "epoch": 4684} {"train_loss": -7.33052921295166, "global_step": 196744, "epoch": 4684} {"train_loss": -7.307312965393066, "global_step": 196745, "epoch": 4684} {"train_loss": -7.230062007904053, "global_step": 196746, "epoch": 4684} {"train_loss": -7.216768264770508, "global_step": 196747, "epoch": 4684} {"train_loss": -7.185975074768066, "global_step": 196748, "epoch": 4684} {"train_loss": -7.320632457733154, "global_step": 196749, "epoch": 4684} {"train_loss": -7.406201362609863, "global_step": 196750, "epoch": 4684} {"train_loss": -7.3642497062683105, "global_step": 196751, "epoch": 4684} {"train_loss": -7.224358558654785, "global_step": 196752, "epoch": 4684} {"train_loss": -7.241887092590332, "global_step": 196753, "epoch": 4684} {"train_loss": -7.348106384277344, "global_step": 196754, "epoch": 4684} {"train_loss": -7.235146522521973, "global_step": 196755, "epoch": 4684} {"train_loss": -7.350009441375732, "global_step": 196756, "epoch": 4684} {"train_loss": -7.138671398162842, "global_step": 196757, "epoch": 4684} {"train_loss": -7.208258628845215, "global_step": 196758, "epoch": 4684} {"train_loss": -7.25709342956543, "global_step": 196759, "epoch": 4684} {"train_loss": -7.256532669067383, "global_step": 196760, "epoch": 4684} {"train_loss": -7.286725997924805, "global_step": 196761, "epoch": 4684} {"train_loss": -7.288270950317383, "global_step": 196762, "epoch": 4684} {"train_loss": -7.304727554321289, "global_step": 196763, "epoch": 4684} {"train_loss": -7.280599594116211, "global_step": 196764, "epoch": 4684} {"train_loss": -7.042829513549805, "global_step": 196765, "epoch": 4684} {"train_loss": -7.2345685958862305, "global_step": 196766, "epoch": 4684} {"train_loss": -7.246370792388916, "global_step": 196767, "epoch": 4684} {"train_loss": -7.252272605895996, "global_step": 196768, "epoch": 4684} {"train_loss": -7.279438018798828, "global_step": 196769, "epoch": 4684, "val_loss": 69810.890625} {"train_loss": -7.237469673156738, "global_step": 196770, "epoch": 4685} {"train_loss": -7.210638523101807, "global_step": 196771, "epoch": 4685} {"train_loss": -7.234763145446777, "global_step": 196772, "epoch": 4685} {"train_loss": -7.326685905456543, "global_step": 196773, "epoch": 4685} {"train_loss": -7.176794052124023, "global_step": 196774, "epoch": 4685} {"train_loss": -7.2086639404296875, "global_step": 196775, "epoch": 4685} {"train_loss": -7.168163776397705, "global_step": 196776, "epoch": 4685} {"train_loss": -7.2152099609375, "global_step": 196777, "epoch": 4685} {"train_loss": -7.226024627685547, "global_step": 196778, "epoch": 4685} {"train_loss": -7.3784966468811035, "global_step": 196779, "epoch": 4685} {"train_loss": -7.180941581726074, "global_step": 196780, "epoch": 4685} {"train_loss": -7.347583770751953, "global_step": 196781, "epoch": 4685} {"train_loss": -7.315320014953613, "global_step": 196782, "epoch": 4685} {"train_loss": -7.331090927124023, "global_step": 196783, "epoch": 4685} {"train_loss": -7.132402420043945, "global_step": 196784, "epoch": 4685} {"train_loss": -7.331498146057129, "global_step": 196785, "epoch": 4685} {"train_loss": -7.231307506561279, "global_step": 196786, "epoch": 4685} {"train_loss": -7.247537612915039, "global_step": 196787, "epoch": 4685} {"train_loss": -7.340333938598633, "global_step": 196788, "epoch": 4685} {"train_loss": -7.1519927978515625, "global_step": 196789, "epoch": 4685} {"train_loss": -7.3501386642456055, "global_step": 196790, "epoch": 4685} {"train_loss": -7.2857537269592285, "global_step": 196791, "epoch": 4685} {"train_loss": -7.389472007751465, "global_step": 196792, "epoch": 4685} {"train_loss": -7.344145774841309, "global_step": 196793, "epoch": 4685} {"train_loss": -7.275158882141113, "global_step": 196794, "epoch": 4685} {"train_loss": -7.2791595458984375, "global_step": 196795, "epoch": 4685} {"train_loss": -7.319901466369629, "global_step": 196796, "epoch": 4685} {"train_loss": -7.28508186340332, "global_step": 196797, "epoch": 4685} {"train_loss": -7.252477645874023, "global_step": 196798, "epoch": 4685} {"train_loss": -7.290926933288574, "global_step": 196799, "epoch": 4685} {"train_loss": -7.186609268188477, "global_step": 196800, "epoch": 4685} {"train_loss": -7.362689018249512, "global_step": 196801, "epoch": 4685} {"train_loss": -7.184604167938232, "global_step": 196802, "epoch": 4685} {"train_loss": -7.2259521484375, "global_step": 196803, "epoch": 4685} {"train_loss": -7.311883926391602, "global_step": 196804, "epoch": 4685} {"train_loss": -7.320737838745117, "global_step": 196805, "epoch": 4685} {"train_loss": -7.269302845001221, "global_step": 196806, "epoch": 4685} {"train_loss": -7.22217321395874, "global_step": 196807, "epoch": 4685} {"train_loss": -7.292491912841797, "global_step": 196808, "epoch": 4685} {"train_loss": -7.087657928466797, "global_step": 196809, "epoch": 4685} {"train_loss": -7.174177646636963, "global_step": 196810, "epoch": 4685} {"train_loss": -7.258500916617257, "global_step": 196811, "epoch": 4685, "val_loss": 69787.5078125} {"train_loss": -7.11589241027832, "global_step": 196812, "epoch": 4686} {"train_loss": -7.155029296875, "global_step": 196813, "epoch": 4686} {"train_loss": -7.276368141174316, "global_step": 196814, "epoch": 4686} {"train_loss": -7.077389717102051, "global_step": 196815, "epoch": 4686} {"train_loss": -7.341638565063477, "global_step": 196816, "epoch": 4686} {"train_loss": -7.080008506774902, "global_step": 196817, "epoch": 4686} {"train_loss": -7.142414569854736, "global_step": 196818, "epoch": 4686} {"train_loss": -7.2211594581604, "global_step": 196819, "epoch": 4686} {"train_loss": -7.153106689453125, "global_step": 196820, "epoch": 4686} {"train_loss": -7.218782424926758, "global_step": 196821, "epoch": 4686} {"train_loss": -7.146546363830566, "global_step": 196822, "epoch": 4686} {"train_loss": -7.2166900634765625, "global_step": 196823, "epoch": 4686} {"train_loss": -7.127554416656494, "global_step": 196824, "epoch": 4686} {"train_loss": -7.236510276794434, "global_step": 196825, "epoch": 4686} {"train_loss": -7.3127617835998535, "global_step": 196826, "epoch": 4686} {"train_loss": -7.013999938964844, "global_step": 196827, "epoch": 4686} {"train_loss": -7.181582927703857, "global_step": 196828, "epoch": 4686} {"train_loss": -7.126653671264648, "global_step": 196829, "epoch": 4686} {"train_loss": -7.1640095710754395, "global_step": 196830, "epoch": 4686} {"train_loss": -7.228379726409912, "global_step": 196831, "epoch": 4686} {"train_loss": -7.184413909912109, "global_step": 196832, "epoch": 4686} {"train_loss": -7.319896697998047, "global_step": 196833, "epoch": 4686} {"train_loss": -7.1803131103515625, "global_step": 196834, "epoch": 4686} {"train_loss": -7.318003177642822, "global_step": 196835, "epoch": 4686} {"train_loss": -7.287400245666504, "global_step": 196836, "epoch": 4686} {"train_loss": -7.200222492218018, "global_step": 196837, "epoch": 4686} {"train_loss": -7.215384483337402, "global_step": 196838, "epoch": 4686} {"train_loss": -7.201371669769287, "global_step": 196839, "epoch": 4686} {"train_loss": -7.284760475158691, "global_step": 196840, "epoch": 4686} {"train_loss": -7.379725456237793, "global_step": 196841, "epoch": 4686} {"train_loss": -7.237848281860352, "global_step": 196842, "epoch": 4686} {"train_loss": -7.268721580505371, "global_step": 196843, "epoch": 4686} {"train_loss": -7.23499059677124, "global_step": 196844, "epoch": 4686} {"train_loss": -7.208288192749023, "global_step": 196845, "epoch": 4686} {"train_loss": -7.336237907409668, "global_step": 196846, "epoch": 4686} {"train_loss": -7.3271074295043945, "global_step": 196847, "epoch": 4686} {"train_loss": -7.2673492431640625, "global_step": 196848, "epoch": 4686} {"train_loss": -7.231480598449707, "global_step": 196849, "epoch": 4686} {"train_loss": -7.283936500549316, "global_step": 196850, "epoch": 4686} {"train_loss": -7.18488073348999, "global_step": 196851, "epoch": 4686} {"train_loss": -7.311797142028809, "global_step": 196852, "epoch": 4686} {"train_loss": -7.219879763466971, "global_step": 196853, "epoch": 4686, "val_loss": 69765.984375} {"train_loss": -7.253287315368652, "global_step": 196854, "epoch": 4687} {"train_loss": -7.342756271362305, "global_step": 196855, "epoch": 4687} {"train_loss": -7.207712173461914, "global_step": 196856, "epoch": 4687} {"train_loss": -7.253111839294434, "global_step": 196857, "epoch": 4687} {"train_loss": -7.21688175201416, "global_step": 196858, "epoch": 4687} {"train_loss": -7.319901943206787, "global_step": 196859, "epoch": 4687} {"train_loss": -7.308904647827148, "global_step": 196860, "epoch": 4687} {"train_loss": -7.143226146697998, "global_step": 196861, "epoch": 4687} {"train_loss": -7.089875221252441, "global_step": 196862, "epoch": 4687} {"train_loss": -7.157678127288818, "global_step": 196863, "epoch": 4687} {"train_loss": -7.167211532592773, "global_step": 196864, "epoch": 4687} {"train_loss": -7.114314079284668, "global_step": 196865, "epoch": 4687} {"train_loss": -7.05348539352417, "global_step": 196866, "epoch": 4687} {"train_loss": -7.192038536071777, "global_step": 196867, "epoch": 4687} {"train_loss": -7.350718975067139, "global_step": 196868, "epoch": 4687} {"train_loss": -7.058948516845703, "global_step": 196869, "epoch": 4687} {"train_loss": -7.0599775314331055, "global_step": 196870, "epoch": 4687} {"train_loss": -7.034595489501953, "global_step": 196871, "epoch": 4687} {"train_loss": -7.158294677734375, "global_step": 196872, "epoch": 4687} {"train_loss": -6.973418235778809, "global_step": 196873, "epoch": 4687} {"train_loss": -7.303816318511963, "global_step": 196874, "epoch": 4687} {"train_loss": -7.272077560424805, "global_step": 196875, "epoch": 4687} {"train_loss": -7.228503704071045, "global_step": 196876, "epoch": 4687} {"train_loss": -7.203560829162598, "global_step": 196877, "epoch": 4687} {"train_loss": -7.333672523498535, "global_step": 196878, "epoch": 4687} {"train_loss": -7.34842586517334, "global_step": 196879, "epoch": 4687} {"train_loss": -7.273121356964111, "global_step": 196880, "epoch": 4687} {"train_loss": -7.156864166259766, "global_step": 196881, "epoch": 4687} {"train_loss": -7.176843643188477, "global_step": 196882, "epoch": 4687} {"train_loss": -7.178093433380127, "global_step": 196883, "epoch": 4687} {"train_loss": -7.213353157043457, "global_step": 196884, "epoch": 4687} {"train_loss": -7.251123428344727, "global_step": 196885, "epoch": 4687} {"train_loss": -7.183084487915039, "global_step": 196886, "epoch": 4687} {"train_loss": -7.147860527038574, "global_step": 196887, "epoch": 4687} {"train_loss": -7.319396018981934, "global_step": 196888, "epoch": 4687} {"train_loss": -7.330655097961426, "global_step": 196889, "epoch": 4687} {"train_loss": -7.282392501831055, "global_step": 196890, "epoch": 4687} {"train_loss": -7.24357271194458, "global_step": 196891, "epoch": 4687} {"train_loss": -7.112949371337891, "global_step": 196892, "epoch": 4687} {"train_loss": -7.285452365875244, "global_step": 196893, "epoch": 4687} {"train_loss": -7.189587116241455, "global_step": 196894, "epoch": 4687} {"train_loss": -7.206704718726022, "global_step": 196895, "epoch": 4687, "val_loss": 69903.3203125} {"train_loss": -7.35697603225708, "global_step": 196896, "epoch": 4688} {"train_loss": -7.257562637329102, "global_step": 196897, "epoch": 4688} {"train_loss": -7.235335350036621, "global_step": 196898, "epoch": 4688} {"train_loss": -7.106664657592773, "global_step": 196899, "epoch": 4688} {"train_loss": -7.160825252532959, "global_step": 196900, "epoch": 4688} {"train_loss": -7.287284851074219, "global_step": 196901, "epoch": 4688} {"train_loss": -7.257166862487793, "global_step": 196902, "epoch": 4688} {"train_loss": -7.278298377990723, "global_step": 196903, "epoch": 4688} {"train_loss": -7.210803985595703, "global_step": 196904, "epoch": 4688} {"train_loss": -7.212194442749023, "global_step": 196905, "epoch": 4688} {"train_loss": -7.353151798248291, "global_step": 196906, "epoch": 4688} {"train_loss": -7.32777738571167, "global_step": 196907, "epoch": 4688} {"train_loss": -7.178382873535156, "global_step": 196908, "epoch": 4688} {"train_loss": -7.169334888458252, "global_step": 196909, "epoch": 4688} {"train_loss": -7.15380859375, "global_step": 196910, "epoch": 4688} {"train_loss": -7.1104888916015625, "global_step": 196911, "epoch": 4688} {"train_loss": -7.214555740356445, "global_step": 196912, "epoch": 4688} {"train_loss": -7.195768356323242, "global_step": 196913, "epoch": 4688} {"train_loss": -7.2451653480529785, "global_step": 196914, "epoch": 4688} {"train_loss": -7.290769577026367, "global_step": 196915, "epoch": 4688} {"train_loss": -7.244977951049805, "global_step": 196916, "epoch": 4688} {"train_loss": -7.207924842834473, "global_step": 196917, "epoch": 4688} {"train_loss": -7.168979644775391, "global_step": 196918, "epoch": 4688} {"train_loss": -7.31711483001709, "global_step": 196919, "epoch": 4688} {"train_loss": -7.166694641113281, "global_step": 196920, "epoch": 4688} {"train_loss": -7.068905353546143, "global_step": 196921, "epoch": 4688} {"train_loss": -7.185178756713867, "global_step": 196922, "epoch": 4688} {"train_loss": -7.024231910705566, "global_step": 196923, "epoch": 4688} {"train_loss": -7.131585121154785, "global_step": 196924, "epoch": 4688} {"train_loss": -7.2760419845581055, "global_step": 196925, "epoch": 4688} {"train_loss": -7.084867000579834, "global_step": 196926, "epoch": 4688} {"train_loss": -7.234748363494873, "global_step": 196927, "epoch": 4688} {"train_loss": -7.015569686889648, "global_step": 196928, "epoch": 4688} {"train_loss": -7.103150367736816, "global_step": 196929, "epoch": 4688} {"train_loss": -7.171335220336914, "global_step": 196930, "epoch": 4688} {"train_loss": -7.152763366699219, "global_step": 196931, "epoch": 4688} {"train_loss": -7.19173526763916, "global_step": 196932, "epoch": 4688} {"train_loss": -7.165562629699707, "global_step": 196933, "epoch": 4688} {"train_loss": -7.308747291564941, "global_step": 196934, "epoch": 4688} {"train_loss": -7.134377956390381, "global_step": 196935, "epoch": 4688} {"train_loss": -7.255162239074707, "global_step": 196936, "epoch": 4688} {"train_loss": -7.202876249949138, "global_step": 196937, "epoch": 4688, "val_loss": 69716.0} {"train_loss": -7.248578071594238, "global_step": 196938, "epoch": 4689} {"train_loss": -7.229209899902344, "global_step": 196939, "epoch": 4689} {"train_loss": -7.218294620513916, "global_step": 196940, "epoch": 4689} {"train_loss": -7.246710777282715, "global_step": 196941, "epoch": 4689} {"train_loss": -7.179274559020996, "global_step": 196942, "epoch": 4689} {"train_loss": -7.202617645263672, "global_step": 196943, "epoch": 4689} {"train_loss": -7.254863739013672, "global_step": 196944, "epoch": 4689} {"train_loss": -7.207208633422852, "global_step": 196945, "epoch": 4689} {"train_loss": -7.200934410095215, "global_step": 196946, "epoch": 4689} {"train_loss": -7.125880241394043, "global_step": 196947, "epoch": 4689} {"train_loss": -7.0875396728515625, "global_step": 196948, "epoch": 4689} {"train_loss": -7.083474159240723, "global_step": 196949, "epoch": 4689} {"train_loss": -7.165541172027588, "global_step": 196950, "epoch": 4689} {"train_loss": -7.243234157562256, "global_step": 196951, "epoch": 4689} {"train_loss": -7.2478227615356445, "global_step": 196952, "epoch": 4689} {"train_loss": -7.250790596008301, "global_step": 196953, "epoch": 4689} {"train_loss": -7.195760726928711, "global_step": 196954, "epoch": 4689} {"train_loss": -7.187446594238281, "global_step": 196955, "epoch": 4689} {"train_loss": -7.198617935180664, "global_step": 196956, "epoch": 4689} {"train_loss": -7.097291946411133, "global_step": 196957, "epoch": 4689} {"train_loss": -7.112827777862549, "global_step": 196958, "epoch": 4689} {"train_loss": -7.155876636505127, "global_step": 196959, "epoch": 4689} {"train_loss": -7.032432556152344, "global_step": 196960, "epoch": 4689} {"train_loss": -7.194145679473877, "global_step": 196961, "epoch": 4689} {"train_loss": -7.212714672088623, "global_step": 196962, "epoch": 4689} {"train_loss": -7.202322959899902, "global_step": 196963, "epoch": 4689} {"train_loss": -7.200733661651611, "global_step": 196964, "epoch": 4689} {"train_loss": -7.189310073852539, "global_step": 196965, "epoch": 4689} {"train_loss": -7.103888511657715, "global_step": 196966, "epoch": 4689} {"train_loss": -7.391387939453125, "global_step": 196967, "epoch": 4689} {"train_loss": -7.259091377258301, "global_step": 196968, "epoch": 4689} {"train_loss": -7.195841312408447, "global_step": 196969, "epoch": 4689} {"train_loss": -7.364567279815674, "global_step": 196970, "epoch": 4689} {"train_loss": -7.204094409942627, "global_step": 196971, "epoch": 4689} {"train_loss": -7.230532646179199, "global_step": 196972, "epoch": 4689} {"train_loss": -7.203164100646973, "global_step": 196973, "epoch": 4689} {"train_loss": -7.224716663360596, "global_step": 196974, "epoch": 4689} {"train_loss": -7.2980055809021, "global_step": 196975, "epoch": 4689} {"train_loss": -7.221449851989746, "global_step": 196976, "epoch": 4689} {"train_loss": -7.178541660308838, "global_step": 196977, "epoch": 4689} {"train_loss": -7.210141658782959, "global_step": 196978, "epoch": 4689} {"train_loss": -7.201521078745524, "global_step": 196979, "epoch": 4689, "val_loss": 69870.6953125} {"train_loss": -7.202530860900879, "global_step": 196980, "epoch": 4690} {"train_loss": -7.261420726776123, "global_step": 196981, "epoch": 4690} {"train_loss": -7.253161430358887, "global_step": 196982, "epoch": 4690} {"train_loss": -7.230152130126953, "global_step": 196983, "epoch": 4690} {"train_loss": -7.346576690673828, "global_step": 196984, "epoch": 4690} {"train_loss": -7.251898765563965, "global_step": 196985, "epoch": 4690} {"train_loss": -7.242992401123047, "global_step": 196986, "epoch": 4690} {"train_loss": -7.266071319580078, "global_step": 196987, "epoch": 4690} {"train_loss": -7.216911315917969, "global_step": 196988, "epoch": 4690} {"train_loss": -7.23388147354126, "global_step": 196989, "epoch": 4690} {"train_loss": -7.279741287231445, "global_step": 196990, "epoch": 4690} {"train_loss": -7.17194938659668, "global_step": 196991, "epoch": 4690} {"train_loss": -7.208159923553467, "global_step": 196992, "epoch": 4690} {"train_loss": -7.254477500915527, "global_step": 196993, "epoch": 4690} {"train_loss": -7.363180160522461, "global_step": 196994, "epoch": 4690} {"train_loss": -7.182253360748291, "global_step": 196995, "epoch": 4690} {"train_loss": -7.233800411224365, "global_step": 196996, "epoch": 4690} {"train_loss": -7.250916481018066, "global_step": 196997, "epoch": 4690} {"train_loss": -7.1760573387146, "global_step": 196998, "epoch": 4690} {"train_loss": -7.271572589874268, "global_step": 196999, "epoch": 4690} {"train_loss": -7.271646976470947, "global_step": 197000, "epoch": 4690} {"train_loss": -7.243671894073486, "global_step": 197001, "epoch": 4690} {"train_loss": -7.197417259216309, "global_step": 197002, "epoch": 4690} {"train_loss": -7.280527114868164, "global_step": 197003, "epoch": 4690} {"train_loss": -7.372699737548828, "global_step": 197004, "epoch": 4690} {"train_loss": -7.423060417175293, "global_step": 197005, "epoch": 4690} {"train_loss": -7.318313121795654, "global_step": 197006, "epoch": 4690} {"train_loss": -7.39310359954834, "global_step": 197007, "epoch": 4690} {"train_loss": -7.30747652053833, "global_step": 197008, "epoch": 4690} {"train_loss": -7.352577209472656, "global_step": 197009, "epoch": 4690} {"train_loss": -7.234295845031738, "global_step": 197010, "epoch": 4690} {"train_loss": -7.336989402770996, "global_step": 197011, "epoch": 4690} {"train_loss": -7.1833109855651855, "global_step": 197012, "epoch": 4690} {"train_loss": -7.296905040740967, "global_step": 197013, "epoch": 4690} {"train_loss": -7.310141563415527, "global_step": 197014, "epoch": 4690} {"train_loss": -7.306683540344238, "global_step": 197015, "epoch": 4690} {"train_loss": -7.202358245849609, "global_step": 197016, "epoch": 4690} {"train_loss": -7.2610554695129395, "global_step": 197017, "epoch": 4690} {"train_loss": -7.250650405883789, "global_step": 197018, "epoch": 4690} {"train_loss": -7.150254726409912, "global_step": 197019, "epoch": 4690} {"train_loss": -7.215564727783203, "global_step": 197020, "epoch": 4690} {"train_loss": -7.261060283297584, "global_step": 197021, "epoch": 4690, "val_loss": 69810.3125} {"train_loss": -7.186556816101074, "global_step": 197022, "epoch": 4691} {"train_loss": -7.238398551940918, "global_step": 197023, "epoch": 4691} {"train_loss": -7.210633754730225, "global_step": 197024, "epoch": 4691} {"train_loss": -7.20819091796875, "global_step": 197025, "epoch": 4691} {"train_loss": -7.1788554191589355, "global_step": 197026, "epoch": 4691} {"train_loss": -7.109736442565918, "global_step": 197027, "epoch": 4691} {"train_loss": -7.260430335998535, "global_step": 197028, "epoch": 4691} {"train_loss": -7.335301399230957, "global_step": 197029, "epoch": 4691} {"train_loss": -7.1438703536987305, "global_step": 197030, "epoch": 4691} {"train_loss": -7.28645133972168, "global_step": 197031, "epoch": 4691} {"train_loss": -7.281211853027344, "global_step": 197032, "epoch": 4691} {"train_loss": -7.221247673034668, "global_step": 197033, "epoch": 4691} {"train_loss": -7.237791061401367, "global_step": 197034, "epoch": 4691} {"train_loss": -7.211804389953613, "global_step": 197035, "epoch": 4691} {"train_loss": -7.185420989990234, "global_step": 197036, "epoch": 4691} {"train_loss": -7.132918357849121, "global_step": 197037, "epoch": 4691} {"train_loss": -7.175324440002441, "global_step": 197038, "epoch": 4691} {"train_loss": -7.1924896240234375, "global_step": 197039, "epoch": 4691} {"train_loss": -7.139517784118652, "global_step": 197040, "epoch": 4691} {"train_loss": -7.251067638397217, "global_step": 197041, "epoch": 4691} {"train_loss": -7.158008575439453, "global_step": 197042, "epoch": 4691} {"train_loss": -7.211230278015137, "global_step": 197043, "epoch": 4691} {"train_loss": -7.222900867462158, "global_step": 197044, "epoch": 4691} {"train_loss": -7.165005683898926, "global_step": 197045, "epoch": 4691} {"train_loss": -7.2959771156311035, "global_step": 197046, "epoch": 4691} {"train_loss": -7.317795276641846, "global_step": 197047, "epoch": 4691} {"train_loss": -7.144232749938965, "global_step": 197048, "epoch": 4691} {"train_loss": -7.2413330078125, "global_step": 197049, "epoch": 4691} {"train_loss": -7.162115097045898, "global_step": 197050, "epoch": 4691} {"train_loss": -7.231540679931641, "global_step": 197051, "epoch": 4691} {"train_loss": -7.141284942626953, "global_step": 197052, "epoch": 4691} {"train_loss": -7.2861456871032715, "global_step": 197053, "epoch": 4691} {"train_loss": -7.212811470031738, "global_step": 197054, "epoch": 4691} {"train_loss": -7.134939193725586, "global_step": 197055, "epoch": 4691} {"train_loss": -7.078183650970459, "global_step": 197056, "epoch": 4691} {"train_loss": -7.100864410400391, "global_step": 197057, "epoch": 4691} {"train_loss": -7.173426628112793, "global_step": 197058, "epoch": 4691} {"train_loss": -7.164431095123291, "global_step": 197059, "epoch": 4691} {"train_loss": -7.153436183929443, "global_step": 197060, "epoch": 4691} {"train_loss": -7.220839023590088, "global_step": 197061, "epoch": 4691} {"train_loss": -7.244429588317871, "global_step": 197062, "epoch": 4691} {"train_loss": -7.200643005825224, "global_step": 197063, "epoch": 4691, "val_loss": 69952.1015625} {"train_loss": -7.237220764160156, "global_step": 197064, "epoch": 4692} {"train_loss": -7.209725856781006, "global_step": 197065, "epoch": 4692} {"train_loss": -7.1560468673706055, "global_step": 197066, "epoch": 4692} {"train_loss": -7.156479835510254, "global_step": 197067, "epoch": 4692} {"train_loss": -7.203665733337402, "global_step": 197068, "epoch": 4692} {"train_loss": -7.305420875549316, "global_step": 197069, "epoch": 4692} {"train_loss": -7.204549312591553, "global_step": 197070, "epoch": 4692} {"train_loss": -7.212871551513672, "global_step": 197071, "epoch": 4692} {"train_loss": -7.26542329788208, "global_step": 197072, "epoch": 4692} {"train_loss": -7.1366376876831055, "global_step": 197073, "epoch": 4692} {"train_loss": -7.329164505004883, "global_step": 197074, "epoch": 4692} {"train_loss": -7.219818115234375, "global_step": 197075, "epoch": 4692} {"train_loss": -7.210336208343506, "global_step": 197076, "epoch": 4692} {"train_loss": -7.211154937744141, "global_step": 197077, "epoch": 4692} {"train_loss": -7.181640148162842, "global_step": 197078, "epoch": 4692} {"train_loss": -7.225318908691406, "global_step": 197079, "epoch": 4692} {"train_loss": -7.138782978057861, "global_step": 197080, "epoch": 4692} {"train_loss": -7.13471794128418, "global_step": 197081, "epoch": 4692} {"train_loss": -7.254981994628906, "global_step": 197082, "epoch": 4692} {"train_loss": -7.193047523498535, "global_step": 197083, "epoch": 4692} {"train_loss": -7.24038028717041, "global_step": 197084, "epoch": 4692} {"train_loss": -7.1542253494262695, "global_step": 197085, "epoch": 4692} {"train_loss": -7.190103530883789, "global_step": 197086, "epoch": 4692} {"train_loss": -7.215603828430176, "global_step": 197087, "epoch": 4692} {"train_loss": -7.192987442016602, "global_step": 197088, "epoch": 4692} {"train_loss": -7.265223503112793, "global_step": 197089, "epoch": 4692} {"train_loss": -7.156532287597656, "global_step": 197090, "epoch": 4692} {"train_loss": -7.128969192504883, "global_step": 197091, "epoch": 4692} {"train_loss": -7.271766185760498, "global_step": 197092, "epoch": 4692} {"train_loss": -7.299582481384277, "global_step": 197093, "epoch": 4692} {"train_loss": -7.14332914352417, "global_step": 197094, "epoch": 4692} {"train_loss": -7.292279243469238, "global_step": 197095, "epoch": 4692} {"train_loss": -7.208428382873535, "global_step": 197096, "epoch": 4692} {"train_loss": -7.2097859382629395, "global_step": 197097, "epoch": 4692} {"train_loss": -7.2968339920043945, "global_step": 197098, "epoch": 4692} {"train_loss": -7.307106018066406, "global_step": 197099, "epoch": 4692} {"train_loss": -7.200719833374023, "global_step": 197100, "epoch": 4692} {"train_loss": -7.256150722503662, "global_step": 197101, "epoch": 4692} {"train_loss": -7.185067653656006, "global_step": 197102, "epoch": 4692} {"train_loss": -7.327974319458008, "global_step": 197103, "epoch": 4692} {"train_loss": -7.317577362060547, "global_step": 197104, "epoch": 4692} {"train_loss": -7.22279387428647, "global_step": 197105, "epoch": 4692, "val_loss": 69794.3203125} {"train_loss": -7.305241584777832, "global_step": 197106, "epoch": 4693} {"train_loss": -7.229365825653076, "global_step": 197107, "epoch": 4693} {"train_loss": -7.343603134155273, "global_step": 197108, "epoch": 4693} {"train_loss": -7.309364318847656, "global_step": 197109, "epoch": 4693} {"train_loss": -7.2125654220581055, "global_step": 197110, "epoch": 4693} {"train_loss": -7.289549827575684, "global_step": 197111, "epoch": 4693} {"train_loss": -7.261746406555176, "global_step": 197112, "epoch": 4693} {"train_loss": -7.395447731018066, "global_step": 197113, "epoch": 4693} {"train_loss": -7.328497409820557, "global_step": 197114, "epoch": 4693} {"train_loss": -7.340662479400635, "global_step": 197115, "epoch": 4693} {"train_loss": -7.215062141418457, "global_step": 197116, "epoch": 4693} {"train_loss": -7.316227912902832, "global_step": 197117, "epoch": 4693} {"train_loss": -7.370489120483398, "global_step": 197118, "epoch": 4693} {"train_loss": -7.353658676147461, "global_step": 197119, "epoch": 4693} {"train_loss": -7.324724197387695, "global_step": 197120, "epoch": 4693} {"train_loss": -7.333848476409912, "global_step": 197121, "epoch": 4693} {"train_loss": -7.233509063720703, "global_step": 197122, "epoch": 4693} {"train_loss": -7.3444695472717285, "global_step": 197123, "epoch": 4693} {"train_loss": -7.384838104248047, "global_step": 197124, "epoch": 4693} {"train_loss": -7.20991849899292, "global_step": 197125, "epoch": 4693} {"train_loss": -7.356740474700928, "global_step": 197126, "epoch": 4693} {"train_loss": -7.245521068572998, "global_step": 197127, "epoch": 4693} {"train_loss": -7.209622859954834, "global_step": 197128, "epoch": 4693} {"train_loss": -7.350205421447754, "global_step": 197129, "epoch": 4693} {"train_loss": -7.290934085845947, "global_step": 197130, "epoch": 4693} {"train_loss": -7.405252933502197, "global_step": 197131, "epoch": 4693} {"train_loss": -7.259520530700684, "global_step": 197132, "epoch": 4693} {"train_loss": -7.285731315612793, "global_step": 197133, "epoch": 4693} {"train_loss": -7.310990333557129, "global_step": 197134, "epoch": 4693} {"train_loss": -7.29766845703125, "global_step": 197135, "epoch": 4693} {"train_loss": -7.366748809814453, "global_step": 197136, "epoch": 4693} {"train_loss": -7.3586506843566895, "global_step": 197137, "epoch": 4693} {"train_loss": -7.221022605895996, "global_step": 197138, "epoch": 4693} {"train_loss": -7.212494850158691, "global_step": 197139, "epoch": 4693} {"train_loss": -7.263045787811279, "global_step": 197140, "epoch": 4693} {"train_loss": -7.3087005615234375, "global_step": 197141, "epoch": 4693} {"train_loss": -7.254255771636963, "global_step": 197142, "epoch": 4693} {"train_loss": -7.294646263122559, "global_step": 197143, "epoch": 4693} {"train_loss": -7.283529281616211, "global_step": 197144, "epoch": 4693} {"train_loss": -7.34426212310791, "global_step": 197145, "epoch": 4693} {"train_loss": -7.325644493103027, "global_step": 197146, "epoch": 4693} {"train_loss": -7.302378302528744, "global_step": 197147, "epoch": 4693, "val_loss": 69883.0390625} {"train_loss": -7.288420677185059, "global_step": 197148, "epoch": 4694} {"train_loss": -7.413269996643066, "global_step": 197149, "epoch": 4694} {"train_loss": -7.215029716491699, "global_step": 197150, "epoch": 4694} {"train_loss": -7.299524307250977, "global_step": 197151, "epoch": 4694} {"train_loss": -7.328632354736328, "global_step": 197152, "epoch": 4694} {"train_loss": -7.394513130187988, "global_step": 197153, "epoch": 4694} {"train_loss": -7.347338676452637, "global_step": 197154, "epoch": 4694} {"train_loss": -7.216280460357666, "global_step": 197155, "epoch": 4694} {"train_loss": -7.256261825561523, "global_step": 197156, "epoch": 4694} {"train_loss": -7.2109174728393555, "global_step": 197157, "epoch": 4694} {"train_loss": -7.168344974517822, "global_step": 197158, "epoch": 4694} {"train_loss": -7.097308158874512, "global_step": 197159, "epoch": 4694} {"train_loss": -7.320161819458008, "global_step": 197160, "epoch": 4694} {"train_loss": -7.17738676071167, "global_step": 197161, "epoch": 4694} {"train_loss": -7.338855266571045, "global_step": 197162, "epoch": 4694} {"train_loss": -7.241353511810303, "global_step": 197163, "epoch": 4694} {"train_loss": -7.289237976074219, "global_step": 197164, "epoch": 4694} {"train_loss": -7.200852394104004, "global_step": 197165, "epoch": 4694} {"train_loss": -7.271894931793213, "global_step": 197166, "epoch": 4694} {"train_loss": -7.3919677734375, "global_step": 197167, "epoch": 4694} {"train_loss": -7.211911678314209, "global_step": 197168, "epoch": 4694} {"train_loss": -7.355602264404297, "global_step": 197169, "epoch": 4694} {"train_loss": -7.268715858459473, "global_step": 197170, "epoch": 4694} {"train_loss": -7.261651039123535, "global_step": 197171, "epoch": 4694} {"train_loss": -7.203153610229492, "global_step": 197172, "epoch": 4694} {"train_loss": -7.264637470245361, "global_step": 197173, "epoch": 4694} {"train_loss": -7.275042533874512, "global_step": 197174, "epoch": 4694} {"train_loss": -7.293625831604004, "global_step": 197175, "epoch": 4694} {"train_loss": -7.325263023376465, "global_step": 197176, "epoch": 4694} {"train_loss": -7.297606468200684, "global_step": 197177, "epoch": 4694} {"train_loss": -7.165078163146973, "global_step": 197178, "epoch": 4694} {"train_loss": -7.290661334991455, "global_step": 197179, "epoch": 4694} {"train_loss": -7.297664642333984, "global_step": 197180, "epoch": 4694} {"train_loss": -7.2545976638793945, "global_step": 197181, "epoch": 4694} {"train_loss": -7.335235118865967, "global_step": 197182, "epoch": 4694} {"train_loss": -7.317098617553711, "global_step": 197183, "epoch": 4694} {"train_loss": -7.209750652313232, "global_step": 197184, "epoch": 4694} {"train_loss": -7.2880377769470215, "global_step": 197185, "epoch": 4694} {"train_loss": -7.376702308654785, "global_step": 197186, "epoch": 4694} {"train_loss": -7.351979732513428, "global_step": 197187, "epoch": 4694} {"train_loss": -7.291099548339844, "global_step": 197188, "epoch": 4694} {"train_loss": -7.27936323483785, "global_step": 197189, "epoch": 4694, "val_loss": 69752.0390625} {"train_loss": -7.296722412109375, "global_step": 197190, "epoch": 4695} {"train_loss": -7.383340835571289, "global_step": 197191, "epoch": 4695} {"train_loss": -7.1609063148498535, "global_step": 197192, "epoch": 4695} {"train_loss": -7.360642433166504, "global_step": 197193, "epoch": 4695} {"train_loss": -7.269343376159668, "global_step": 197194, "epoch": 4695} {"train_loss": -7.229676246643066, "global_step": 197195, "epoch": 4695} {"train_loss": -7.3723955154418945, "global_step": 197196, "epoch": 4695} {"train_loss": -7.324764251708984, "global_step": 197197, "epoch": 4695} {"train_loss": -7.30087947845459, "global_step": 197198, "epoch": 4695} {"train_loss": -7.253425598144531, "global_step": 197199, "epoch": 4695} {"train_loss": -7.3112287521362305, "global_step": 197200, "epoch": 4695} {"train_loss": -7.194819450378418, "global_step": 197201, "epoch": 4695} {"train_loss": -7.143217086791992, "global_step": 197202, "epoch": 4695} {"train_loss": -7.250102519989014, "global_step": 197203, "epoch": 4695} {"train_loss": -7.112006187438965, "global_step": 197204, "epoch": 4695} {"train_loss": -7.179330825805664, "global_step": 197205, "epoch": 4695} {"train_loss": -7.195640563964844, "global_step": 197206, "epoch": 4695} {"train_loss": -7.06445837020874, "global_step": 197207, "epoch": 4695} {"train_loss": -7.169452667236328, "global_step": 197208, "epoch": 4695} {"train_loss": -7.184412956237793, "global_step": 197209, "epoch": 4695} {"train_loss": -7.170149326324463, "global_step": 197210, "epoch": 4695} {"train_loss": -7.170000076293945, "global_step": 197211, "epoch": 4695} {"train_loss": -7.20327091217041, "global_step": 197212, "epoch": 4695} {"train_loss": -7.280890941619873, "global_step": 197213, "epoch": 4695} {"train_loss": -7.217241287231445, "global_step": 197214, "epoch": 4695} {"train_loss": -7.268813133239746, "global_step": 197215, "epoch": 4695} {"train_loss": -7.168927192687988, "global_step": 197216, "epoch": 4695} {"train_loss": -7.261358261108398, "global_step": 197217, "epoch": 4695} {"train_loss": -7.126835823059082, "global_step": 197218, "epoch": 4695} {"train_loss": -7.198296070098877, "global_step": 197219, "epoch": 4695} {"train_loss": -7.247801780700684, "global_step": 197220, "epoch": 4695} {"train_loss": -7.058406352996826, "global_step": 197221, "epoch": 4695} {"train_loss": -7.085536956787109, "global_step": 197222, "epoch": 4695} {"train_loss": -7.165606498718262, "global_step": 197223, "epoch": 4695} {"train_loss": -7.132908344268799, "global_step": 197224, "epoch": 4695} {"train_loss": -7.15009069442749, "global_step": 197225, "epoch": 4695} {"train_loss": -7.236183166503906, "global_step": 197226, "epoch": 4695} {"train_loss": -7.013294219970703, "global_step": 197227, "epoch": 4695} {"train_loss": -7.308070659637451, "global_step": 197228, "epoch": 4695} {"train_loss": -7.037761688232422, "global_step": 197229, "epoch": 4695} {"train_loss": -7.155298233032227, "global_step": 197230, "epoch": 4695} {"train_loss": -7.206169173831031, "global_step": 197231, "epoch": 4695, "val_loss": 69930.9609375} {"train_loss": -7.0598978996276855, "global_step": 197232, "epoch": 4696} {"train_loss": -7.297049045562744, "global_step": 197233, "epoch": 4696} {"train_loss": -7.142578125, "global_step": 197234, "epoch": 4696} {"train_loss": -7.047128677368164, "global_step": 197235, "epoch": 4696} {"train_loss": -7.276915550231934, "global_step": 197236, "epoch": 4696} {"train_loss": -7.1427412033081055, "global_step": 197237, "epoch": 4696} {"train_loss": -7.124818801879883, "global_step": 197238, "epoch": 4696} {"train_loss": -7.201471328735352, "global_step": 197239, "epoch": 4696} {"train_loss": -7.075040340423584, "global_step": 197240, "epoch": 4696} {"train_loss": -7.27311897277832, "global_step": 197241, "epoch": 4696} {"train_loss": -7.162684440612793, "global_step": 197242, "epoch": 4696} {"train_loss": -7.214800834655762, "global_step": 197243, "epoch": 4696} {"train_loss": -7.133110046386719, "global_step": 197244, "epoch": 4696} {"train_loss": -7.122276306152344, "global_step": 197245, "epoch": 4696} {"train_loss": -7.207697868347168, "global_step": 197246, "epoch": 4696} {"train_loss": -7.161820411682129, "global_step": 197247, "epoch": 4696} {"train_loss": -6.945109844207764, "global_step": 197248, "epoch": 4696} {"train_loss": -7.076559543609619, "global_step": 197249, "epoch": 4696} {"train_loss": -7.189239025115967, "global_step": 197250, "epoch": 4696} {"train_loss": -7.096029281616211, "global_step": 197251, "epoch": 4696} {"train_loss": -7.162677764892578, "global_step": 197252, "epoch": 4696} {"train_loss": -7.190173149108887, "global_step": 197253, "epoch": 4696} {"train_loss": -7.194013595581055, "global_step": 197254, "epoch": 4696} {"train_loss": -7.240866661071777, "global_step": 197255, "epoch": 4696} {"train_loss": -7.100575923919678, "global_step": 197256, "epoch": 4696} {"train_loss": -7.277998924255371, "global_step": 197257, "epoch": 4696} {"train_loss": -7.225372314453125, "global_step": 197258, "epoch": 4696} {"train_loss": -7.205515384674072, "global_step": 197259, "epoch": 4696} {"train_loss": -7.195523262023926, "global_step": 197260, "epoch": 4696} {"train_loss": -7.203029632568359, "global_step": 197261, "epoch": 4696} {"train_loss": -7.2017364501953125, "global_step": 197262, "epoch": 4696} {"train_loss": -7.236168384552002, "global_step": 197263, "epoch": 4696} {"train_loss": -7.206319808959961, "global_step": 197264, "epoch": 4696} {"train_loss": -7.214239120483398, "global_step": 197265, "epoch": 4696} {"train_loss": -7.330075263977051, "global_step": 197266, "epoch": 4696} {"train_loss": -7.180683135986328, "global_step": 197267, "epoch": 4696} {"train_loss": -7.2095136642456055, "global_step": 197268, "epoch": 4696} {"train_loss": -7.160262584686279, "global_step": 197269, "epoch": 4696} {"train_loss": -7.2138519287109375, "global_step": 197270, "epoch": 4696} {"train_loss": -7.197690010070801, "global_step": 197271, "epoch": 4696} {"train_loss": -7.200989723205566, "global_step": 197272, "epoch": 4696} {"train_loss": -7.179061038153512, "global_step": 197273, "epoch": 4696, "val_loss": 69493.6640625} {"train_loss": -7.176422119140625, "global_step": 197274, "epoch": 4697} {"train_loss": -7.225438594818115, "global_step": 197275, "epoch": 4697} {"train_loss": -7.086535930633545, "global_step": 197276, "epoch": 4697} {"train_loss": -7.169875621795654, "global_step": 197277, "epoch": 4697} {"train_loss": -7.272389888763428, "global_step": 197278, "epoch": 4697} {"train_loss": -7.206626892089844, "global_step": 197279, "epoch": 4697} {"train_loss": -7.280914306640625, "global_step": 197280, "epoch": 4697} {"train_loss": -7.303776741027832, "global_step": 197281, "epoch": 4697} {"train_loss": -7.257733345031738, "global_step": 197282, "epoch": 4697} {"train_loss": -7.355710029602051, "global_step": 197283, "epoch": 4697} {"train_loss": -7.309047698974609, "global_step": 197284, "epoch": 4697} {"train_loss": -7.254424095153809, "global_step": 197285, "epoch": 4697} {"train_loss": -7.218350410461426, "global_step": 197286, "epoch": 4697} {"train_loss": -7.176479339599609, "global_step": 197287, "epoch": 4697} {"train_loss": -7.234162330627441, "global_step": 197288, "epoch": 4697} {"train_loss": -7.224526882171631, "global_step": 197289, "epoch": 4697} {"train_loss": -7.219323635101318, "global_step": 197290, "epoch": 4697} {"train_loss": -7.292593955993652, "global_step": 197291, "epoch": 4697} {"train_loss": -7.307226181030273, "global_step": 197292, "epoch": 4697} {"train_loss": -7.199816703796387, "global_step": 197293, "epoch": 4697} {"train_loss": -7.155315399169922, "global_step": 197294, "epoch": 4697} {"train_loss": -7.263115406036377, "global_step": 197295, "epoch": 4697} {"train_loss": -7.167917251586914, "global_step": 197296, "epoch": 4697} {"train_loss": -7.253030300140381, "global_step": 197297, "epoch": 4697} {"train_loss": -7.258660316467285, "global_step": 197298, "epoch": 4697} {"train_loss": -7.278526306152344, "global_step": 197299, "epoch": 4697} {"train_loss": -7.254515647888184, "global_step": 197300, "epoch": 4697} {"train_loss": -7.3518829345703125, "global_step": 197301, "epoch": 4697} {"train_loss": -7.299613952636719, "global_step": 197302, "epoch": 4697} {"train_loss": -7.255362033843994, "global_step": 197303, "epoch": 4697} {"train_loss": -7.226977348327637, "global_step": 197304, "epoch": 4697} {"train_loss": -7.292930603027344, "global_step": 197305, "epoch": 4697} {"train_loss": -7.161876678466797, "global_step": 197306, "epoch": 4697} {"train_loss": -7.257984638214111, "global_step": 197307, "epoch": 4697} {"train_loss": -7.248108863830566, "global_step": 197308, "epoch": 4697} {"train_loss": -7.283110618591309, "global_step": 197309, "epoch": 4697} {"train_loss": -7.269636154174805, "global_step": 197310, "epoch": 4697} {"train_loss": -7.241911888122559, "global_step": 197311, "epoch": 4697} {"train_loss": -7.323286056518555, "global_step": 197312, "epoch": 4697} {"train_loss": -7.119285583496094, "global_step": 197313, "epoch": 4697} {"train_loss": -7.286767959594727, "global_step": 197314, "epoch": 4697} {"train_loss": -7.2465391499655585, "global_step": 197315, "epoch": 4697, "val_loss": 69627.984375} {"train_loss": -7.275724411010742, "global_step": 197316, "epoch": 4698} {"train_loss": -7.329222679138184, "global_step": 197317, "epoch": 4698} {"train_loss": -7.290310859680176, "global_step": 197318, "epoch": 4698} {"train_loss": -7.209173202514648, "global_step": 197319, "epoch": 4698} {"train_loss": -7.224604606628418, "global_step": 197320, "epoch": 4698} {"train_loss": -7.2970123291015625, "global_step": 197321, "epoch": 4698} {"train_loss": -7.268095016479492, "global_step": 197322, "epoch": 4698} {"train_loss": -7.217386245727539, "global_step": 197323, "epoch": 4698} {"train_loss": -7.188394546508789, "global_step": 197324, "epoch": 4698} {"train_loss": -7.260140419006348, "global_step": 197325, "epoch": 4698} {"train_loss": -7.211212635040283, "global_step": 197326, "epoch": 4698} {"train_loss": -7.236423492431641, "global_step": 197327, "epoch": 4698} {"train_loss": -7.270558834075928, "global_step": 197328, "epoch": 4698} {"train_loss": -7.228333473205566, "global_step": 197329, "epoch": 4698} {"train_loss": -7.1262898445129395, "global_step": 197330, "epoch": 4698} {"train_loss": -7.242142200469971, "global_step": 197331, "epoch": 4698} {"train_loss": -7.157795429229736, "global_step": 197332, "epoch": 4698} {"train_loss": -7.102838039398193, "global_step": 197333, "epoch": 4698} {"train_loss": -7.317352294921875, "global_step": 197334, "epoch": 4698} {"train_loss": -7.235965728759766, "global_step": 197335, "epoch": 4698} {"train_loss": -7.269351005554199, "global_step": 197336, "epoch": 4698} {"train_loss": -7.208664894104004, "global_step": 197337, "epoch": 4698} {"train_loss": -7.22342586517334, "global_step": 197338, "epoch": 4698} {"train_loss": -7.200026512145996, "global_step": 197339, "epoch": 4698} {"train_loss": -7.169204235076904, "global_step": 197340, "epoch": 4698} {"train_loss": -7.177722930908203, "global_step": 197341, "epoch": 4698} {"train_loss": -7.2962446212768555, "global_step": 197342, "epoch": 4698} {"train_loss": -7.073139190673828, "global_step": 197343, "epoch": 4698} {"train_loss": -7.175404071807861, "global_step": 197344, "epoch": 4698} {"train_loss": -7.131957054138184, "global_step": 197345, "epoch": 4698} {"train_loss": -7.1173319816589355, "global_step": 197346, "epoch": 4698} {"train_loss": -7.1151018142700195, "global_step": 197347, "epoch": 4698} {"train_loss": -7.071366786956787, "global_step": 197348, "epoch": 4698} {"train_loss": -7.267203330993652, "global_step": 197349, "epoch": 4698} {"train_loss": -7.143599033355713, "global_step": 197350, "epoch": 4698} {"train_loss": -7.16835355758667, "global_step": 197351, "epoch": 4698} {"train_loss": -7.182459831237793, "global_step": 197352, "epoch": 4698} {"train_loss": -6.91718053817749, "global_step": 197353, "epoch": 4698} {"train_loss": -7.23915958404541, "global_step": 197354, "epoch": 4698} {"train_loss": -7.024796485900879, "global_step": 197355, "epoch": 4698} {"train_loss": -7.219785690307617, "global_step": 197356, "epoch": 4698} {"train_loss": -7.19551294190543, "global_step": 197357, "epoch": 4698, "val_loss": 69778.125} {"train_loss": -7.119297027587891, "global_step": 197358, "epoch": 4699} {"train_loss": -7.209353923797607, "global_step": 197359, "epoch": 4699} {"train_loss": -7.212173938751221, "global_step": 197360, "epoch": 4699} {"train_loss": -7.252765655517578, "global_step": 197361, "epoch": 4699} {"train_loss": -7.2393927574157715, "global_step": 197362, "epoch": 4699} {"train_loss": -7.193791389465332, "global_step": 197363, "epoch": 4699} {"train_loss": -7.182356834411621, "global_step": 197364, "epoch": 4699} {"train_loss": -7.257172584533691, "global_step": 197365, "epoch": 4699} {"train_loss": -7.109035491943359, "global_step": 197366, "epoch": 4699} {"train_loss": -7.214444637298584, "global_step": 197367, "epoch": 4699} {"train_loss": -7.310871124267578, "global_step": 197368, "epoch": 4699} {"train_loss": -7.154855728149414, "global_step": 197369, "epoch": 4699} {"train_loss": -7.349671363830566, "global_step": 197370, "epoch": 4699} {"train_loss": -7.100669860839844, "global_step": 197371, "epoch": 4699} {"train_loss": -7.353121757507324, "global_step": 197372, "epoch": 4699} {"train_loss": -7.30064058303833, "global_step": 197373, "epoch": 4699} {"train_loss": -7.295244216918945, "global_step": 197374, "epoch": 4699} {"train_loss": -7.239022254943848, "global_step": 197375, "epoch": 4699} {"train_loss": -7.245369911193848, "global_step": 197376, "epoch": 4699} {"train_loss": -7.3538665771484375, "global_step": 197377, "epoch": 4699} {"train_loss": -7.180968761444092, "global_step": 197378, "epoch": 4699} {"train_loss": -7.241004467010498, "global_step": 197379, "epoch": 4699} {"train_loss": -7.27078914642334, "global_step": 197380, "epoch": 4699} {"train_loss": -7.424583435058594, "global_step": 197381, "epoch": 4699} {"train_loss": -7.240026473999023, "global_step": 197382, "epoch": 4699} {"train_loss": -7.214203357696533, "global_step": 197383, "epoch": 4699} {"train_loss": -7.24821662902832, "global_step": 197384, "epoch": 4699} {"train_loss": -7.3760576248168945, "global_step": 197385, "epoch": 4699} {"train_loss": -7.320463180541992, "global_step": 197386, "epoch": 4699} {"train_loss": -7.2277631759643555, "global_step": 197387, "epoch": 4699} {"train_loss": -7.22012996673584, "global_step": 197388, "epoch": 4699} {"train_loss": -7.182900905609131, "global_step": 197389, "epoch": 4699} {"train_loss": -7.234694480895996, "global_step": 197390, "epoch": 4699} {"train_loss": -7.2327494621276855, "global_step": 197391, "epoch": 4699} {"train_loss": -7.110992431640625, "global_step": 197392, "epoch": 4699} {"train_loss": -7.15013313293457, "global_step": 197393, "epoch": 4699} {"train_loss": -7.163309097290039, "global_step": 197394, "epoch": 4699} {"train_loss": -6.978335380554199, "global_step": 197395, "epoch": 4699} {"train_loss": -7.156128883361816, "global_step": 197396, "epoch": 4699} {"train_loss": -7.020453453063965, "global_step": 197397, "epoch": 4699} {"train_loss": -7.114797592163086, "global_step": 197398, "epoch": 4699} {"train_loss": -7.216816357203892, "global_step": 197399, "epoch": 4699, "val_loss": 69690.4375} {"train_loss": -7.141469955444336, "global_step": 197400, "epoch": 4700} {"train_loss": -7.13021993637085, "global_step": 197401, "epoch": 4700} {"train_loss": -7.192045211791992, "global_step": 197402, "epoch": 4700} {"train_loss": -7.284811019897461, "global_step": 197403, "epoch": 4700} {"train_loss": -7.137323379516602, "global_step": 197404, "epoch": 4700} {"train_loss": -7.1592206954956055, "global_step": 197405, "epoch": 4700} {"train_loss": -7.170412063598633, "global_step": 197406, "epoch": 4700} {"train_loss": -7.191890716552734, "global_step": 197407, "epoch": 4700} {"train_loss": -7.179502487182617, "global_step": 197408, "epoch": 4700} {"train_loss": -7.134106636047363, "global_step": 197409, "epoch": 4700} {"train_loss": -7.211301803588867, "global_step": 197410, "epoch": 4700} {"train_loss": -7.2952351570129395, "global_step": 197411, "epoch": 4700} {"train_loss": -7.281760215759277, "global_step": 197412, "epoch": 4700} {"train_loss": -7.311708927154541, "global_step": 197413, "epoch": 4700} {"train_loss": -7.287607669830322, "global_step": 197414, "epoch": 4700} {"train_loss": -7.382065773010254, "global_step": 197415, "epoch": 4700} {"train_loss": -7.267385005950928, "global_step": 197416, "epoch": 4700} {"train_loss": -7.2401556968688965, "global_step": 197417, "epoch": 4700} {"train_loss": -7.262988090515137, "global_step": 197418, "epoch": 4700} {"train_loss": -7.312747955322266, "global_step": 197419, "epoch": 4700} {"train_loss": -7.313013076782227, "global_step": 197420, "epoch": 4700} {"train_loss": -7.308122634887695, "global_step": 197421, "epoch": 4700} {"train_loss": -7.378022193908691, "global_step": 197422, "epoch": 4700} {"train_loss": -7.350584030151367, "global_step": 197423, "epoch": 4700} {"train_loss": -7.362799644470215, "global_step": 197424, "epoch": 4700} {"train_loss": -7.257761001586914, "global_step": 197425, "epoch": 4700} {"train_loss": -7.307214736938477, "global_step": 197426, "epoch": 4700} {"train_loss": -7.365453720092773, "global_step": 197427, "epoch": 4700} {"train_loss": -7.191038608551025, "global_step": 197428, "epoch": 4700} {"train_loss": -7.30285120010376, "global_step": 197429, "epoch": 4700} {"train_loss": -7.264554977416992, "global_step": 197430, "epoch": 4700} {"train_loss": -7.1269001960754395, "global_step": 197431, "epoch": 4700} {"train_loss": -7.203372001647949, "global_step": 197432, "epoch": 4700} {"train_loss": -7.273648262023926, "global_step": 197433, "epoch": 4700} {"train_loss": -7.239215850830078, "global_step": 197434, "epoch": 4700} {"train_loss": -7.1947550773620605, "global_step": 197435, "epoch": 4700} {"train_loss": -7.1662163734436035, "global_step": 197436, "epoch": 4700} {"train_loss": -7.129459381103516, "global_step": 197437, "epoch": 4700} {"train_loss": -7.10291051864624, "global_step": 197438, "epoch": 4700} {"train_loss": -7.216618537902832, "global_step": 197439, "epoch": 4700} {"train_loss": -7.238522529602051, "global_step": 197440, "epoch": 4700} {"train_loss": -7.239822932652065, "global_step": 197441, "epoch": 4700, "train/sim_max_reward_0": 0.9055934776268905, "train/sim_max_reward_1": 0.5410518694423172, "train/sim_max_reward_2": 0.5687233432336044, "train/sim_max_reward_3": 0.13409220303549282, "train/sim_max_reward_4": 0.9279887456774721, "train/sim_max_reward_5": 0.21151192869747648, "test/sim_max_reward_4300000": 1.0, "test/sim_max_reward_4300001": 0.5464382265249614, "test/sim_max_reward_4300002": 0.7713643231005742, "test/sim_max_reward_4300003": 0.8832084666002806, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.8128751150290936, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.922474883034468, "test/sim_max_reward_4300008": 0.9103856345158822, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 0.9503756011298604, "test/sim_max_reward_4300011": 0.7073028933359639, "test/sim_max_reward_4300012": 0.9806250898788308, "test/sim_max_reward_4300013": 0.9772350624608293, "test/sim_max_reward_4300014": 0.9500852742635872, "test/sim_max_reward_4300015": 0.933573842723893, "test/sim_max_reward_4300016": 0.4418342021219218, "test/sim_max_reward_4300017": 0.9621566705379361, "test/sim_max_reward_4300018": 0.3917649133021851, "test/sim_max_reward_4300019": 0.18609940214348897, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9338313420261515, "test/sim_max_reward_4300022": 0.7317500826088669, "test/sim_max_reward_4300023": 0.3287222280058085, "test/sim_max_reward_4300024": 0.8789733017946548, "test/sim_max_reward_4300025": 0.9897655901781514, "test/sim_max_reward_4300026": 0.17896733517274985, "test/sim_max_reward_4300027": 1.0, "test/sim_max_reward_4300028": 0.949760122519516, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.1165837400000965, "test/sim_max_reward_4300031": 0.400814560613229, "test/sim_max_reward_4300032": 0.941917760300049, "test/sim_max_reward_4300033": 0.7030420672976193, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.3686411071479708, "test/sim_max_reward_4300036": 0.20314283660386026, "test/sim_max_reward_4300037": 0.9927832597173176, "test/sim_max_reward_4300038": 0.3710882404346527, "test/sim_max_reward_4300039": 0.9423107611062339, "test/sim_max_reward_4300040": 0.6814805920409961, "test/sim_max_reward_4300041": 0.10269717104459147, "test/sim_max_reward_4300042": 0.9883781345982289, "test/sim_max_reward_4300043": 0.15178255315504083, "test/sim_max_reward_4300044": 0.04345707006804553, "test/sim_max_reward_4300045": 0.1864367235372199, "test/sim_max_reward_4300046": 1.0, "test/sim_max_reward_4300047": 0.08948637990958103, "test/sim_max_reward_4300048": 0.0, "test/sim_max_reward_4300049": 0.19898162013657375, "train/mean_score": 0.5481602612855423, "test/mean_score": 0.576368565710605, "val_loss": 70126.625} {"train_loss": -7.1906232833862305, "global_step": 197442, "epoch": 4701} {"train_loss": -7.233913421630859, "global_step": 197443, "epoch": 4701} {"train_loss": -7.291777610778809, "global_step": 197444, "epoch": 4701} {"train_loss": -7.1092424392700195, "global_step": 197445, "epoch": 4701} {"train_loss": -7.192275047302246, "global_step": 197446, "epoch": 4701} {"train_loss": -7.260474681854248, "global_step": 197447, "epoch": 4701} {"train_loss": -7.239433288574219, "global_step": 197448, "epoch": 4701} {"train_loss": -7.236209869384766, "global_step": 197449, "epoch": 4701} {"train_loss": -7.224037170410156, "global_step": 197450, "epoch": 4701} {"train_loss": -7.2117180824279785, "global_step": 197451, "epoch": 4701} {"train_loss": -7.214105129241943, "global_step": 197452, "epoch": 4701} {"train_loss": -7.289675235748291, "global_step": 197453, "epoch": 4701} {"train_loss": -7.216141700744629, "global_step": 197454, "epoch": 4701} {"train_loss": -7.102476596832275, "global_step": 197455, "epoch": 4701} {"train_loss": -7.267394065856934, "global_step": 197456, "epoch": 4701} {"train_loss": -7.065822601318359, "global_step": 197457, "epoch": 4701} {"train_loss": -7.207450866699219, "global_step": 197458, "epoch": 4701} {"train_loss": -7.30579137802124, "global_step": 197459, "epoch": 4701} {"train_loss": -7.063666343688965, "global_step": 197460, "epoch": 4701} {"train_loss": -7.2339067459106445, "global_step": 197461, "epoch": 4701} {"train_loss": -7.084470748901367, "global_step": 197462, "epoch": 4701} {"train_loss": -7.080265998840332, "global_step": 197463, "epoch": 4701} {"train_loss": -7.222361087799072, "global_step": 197464, "epoch": 4701} {"train_loss": -7.151937961578369, "global_step": 197465, "epoch": 4701} {"train_loss": -7.190350532531738, "global_step": 197466, "epoch": 4701} {"train_loss": -7.2539215087890625, "global_step": 197467, "epoch": 4701} {"train_loss": -7.091765403747559, "global_step": 197468, "epoch": 4701} {"train_loss": -7.218540191650391, "global_step": 197469, "epoch": 4701} {"train_loss": -7.226532459259033, "global_step": 197470, "epoch": 4701} {"train_loss": -7.38455057144165, "global_step": 197471, "epoch": 4701} {"train_loss": -7.249587535858154, "global_step": 197472, "epoch": 4701} {"train_loss": -7.259620189666748, "global_step": 197473, "epoch": 4701} {"train_loss": -7.302964687347412, "global_step": 197474, "epoch": 4701} {"train_loss": -7.289857864379883, "global_step": 197475, "epoch": 4701} {"train_loss": -7.210933208465576, "global_step": 197476, "epoch": 4701} {"train_loss": -7.215204238891602, "global_step": 197477, "epoch": 4701} {"train_loss": -7.380408763885498, "global_step": 197478, "epoch": 4701} {"train_loss": -7.183222770690918, "global_step": 197479, "epoch": 4701} {"train_loss": -7.354228973388672, "global_step": 197480, "epoch": 4701} {"train_loss": -7.27220344543457, "global_step": 197481, "epoch": 4701} {"train_loss": -7.268953323364258, "global_step": 197482, "epoch": 4701} {"train_loss": -7.219941990716117, "global_step": 197483, "epoch": 4701, "val_loss": 69850.6953125} {"train_loss": -7.405827522277832, "global_step": 197484, "epoch": 4702} {"train_loss": -7.154333591461182, "global_step": 197485, "epoch": 4702} {"train_loss": -7.25253438949585, "global_step": 197486, "epoch": 4702} {"train_loss": -7.350019931793213, "global_step": 197487, "epoch": 4702} {"train_loss": -7.171655654907227, "global_step": 197488, "epoch": 4702} {"train_loss": -7.19780969619751, "global_step": 197489, "epoch": 4702} {"train_loss": -7.302773475646973, "global_step": 197490, "epoch": 4702} {"train_loss": -7.3939208984375, "global_step": 197491, "epoch": 4702} {"train_loss": -7.289580345153809, "global_step": 197492, "epoch": 4702} {"train_loss": -7.167117118835449, "global_step": 197493, "epoch": 4702} {"train_loss": -7.21485710144043, "global_step": 197494, "epoch": 4702} {"train_loss": -7.27177095413208, "global_step": 197495, "epoch": 4702} {"train_loss": -7.235446929931641, "global_step": 197496, "epoch": 4702} {"train_loss": -7.315280914306641, "global_step": 197497, "epoch": 4702} {"train_loss": -7.371324062347412, "global_step": 197498, "epoch": 4702} {"train_loss": -7.217070579528809, "global_step": 197499, "epoch": 4702} {"train_loss": -7.301538944244385, "global_step": 197500, "epoch": 4702} {"train_loss": -7.293613433837891, "global_step": 197501, "epoch": 4702} {"train_loss": -7.250179767608643, "global_step": 197502, "epoch": 4702} {"train_loss": -7.241514205932617, "global_step": 197503, "epoch": 4702} {"train_loss": -7.241612434387207, "global_step": 197504, "epoch": 4702} {"train_loss": -7.174821853637695, "global_step": 197505, "epoch": 4702} {"train_loss": -7.138606548309326, "global_step": 197506, "epoch": 4702} {"train_loss": -7.2501983642578125, "global_step": 197507, "epoch": 4702} {"train_loss": -7.247099876403809, "global_step": 197508, "epoch": 4702} {"train_loss": -7.223871231079102, "global_step": 197509, "epoch": 4702} {"train_loss": -7.226118087768555, "global_step": 197510, "epoch": 4702} {"train_loss": -7.189474105834961, "global_step": 197511, "epoch": 4702} {"train_loss": -7.169875621795654, "global_step": 197512, "epoch": 4702} {"train_loss": -7.098817825317383, "global_step": 197513, "epoch": 4702} {"train_loss": -7.167051315307617, "global_step": 197514, "epoch": 4702} {"train_loss": -7.2623372077941895, "global_step": 197515, "epoch": 4702} {"train_loss": -7.3066511154174805, "global_step": 197516, "epoch": 4702} {"train_loss": -7.208658218383789, "global_step": 197517, "epoch": 4702} {"train_loss": -7.132200717926025, "global_step": 197518, "epoch": 4702} {"train_loss": -7.268835067749023, "global_step": 197519, "epoch": 4702} {"train_loss": -7.139472007751465, "global_step": 197520, "epoch": 4702} {"train_loss": -7.132315635681152, "global_step": 197521, "epoch": 4702} {"train_loss": -7.096675872802734, "global_step": 197522, "epoch": 4702} {"train_loss": -7.144015312194824, "global_step": 197523, "epoch": 4702} {"train_loss": -7.230372428894043, "global_step": 197524, "epoch": 4702} {"train_loss": -7.231479338237217, "global_step": 197525, "epoch": 4702, "val_loss": 69644.2578125} {"train_loss": -7.0785980224609375, "global_step": 197526, "epoch": 4703} {"train_loss": -7.111483097076416, "global_step": 197527, "epoch": 4703} {"train_loss": -7.185909271240234, "global_step": 197528, "epoch": 4703} {"train_loss": -7.215511798858643, "global_step": 197529, "epoch": 4703} {"train_loss": -7.075222492218018, "global_step": 197530, "epoch": 4703} {"train_loss": -7.258158206939697, "global_step": 197531, "epoch": 4703} {"train_loss": -7.0943450927734375, "global_step": 197532, "epoch": 4703} {"train_loss": -7.269045352935791, "global_step": 197533, "epoch": 4703} {"train_loss": -7.24967098236084, "global_step": 197534, "epoch": 4703} {"train_loss": -7.193772315979004, "global_step": 197535, "epoch": 4703} {"train_loss": -7.240386962890625, "global_step": 197536, "epoch": 4703} {"train_loss": -7.1075615882873535, "global_step": 197537, "epoch": 4703} {"train_loss": -7.215117454528809, "global_step": 197538, "epoch": 4703} {"train_loss": -7.146211624145508, "global_step": 197539, "epoch": 4703} {"train_loss": -7.073626518249512, "global_step": 197540, "epoch": 4703} {"train_loss": -7.171916961669922, "global_step": 197541, "epoch": 4703} {"train_loss": -7.220398426055908, "global_step": 197542, "epoch": 4703} {"train_loss": -7.222550392150879, "global_step": 197543, "epoch": 4703} {"train_loss": -7.216310501098633, "global_step": 197544, "epoch": 4703} {"train_loss": -7.278120994567871, "global_step": 197545, "epoch": 4703} {"train_loss": -7.277876853942871, "global_step": 197546, "epoch": 4703} {"train_loss": -7.185953140258789, "global_step": 197547, "epoch": 4703} {"train_loss": -7.220118045806885, "global_step": 197548, "epoch": 4703} {"train_loss": -7.14108943939209, "global_step": 197549, "epoch": 4703} {"train_loss": -7.134302139282227, "global_step": 197550, "epoch": 4703} {"train_loss": -7.1374735832214355, "global_step": 197551, "epoch": 4703} {"train_loss": -7.2666015625, "global_step": 197552, "epoch": 4703} {"train_loss": -7.204309940338135, "global_step": 197553, "epoch": 4703} {"train_loss": -7.2788496017456055, "global_step": 197554, "epoch": 4703} {"train_loss": -7.304178714752197, "global_step": 197555, "epoch": 4703} {"train_loss": -7.217957973480225, "global_step": 197556, "epoch": 4703} {"train_loss": -7.223896503448486, "global_step": 197557, "epoch": 4703} {"train_loss": -7.214471340179443, "global_step": 197558, "epoch": 4703} {"train_loss": -7.061831474304199, "global_step": 197559, "epoch": 4703} {"train_loss": -7.245611190795898, "global_step": 197560, "epoch": 4703} {"train_loss": -7.3025665283203125, "global_step": 197561, "epoch": 4703} {"train_loss": -7.179065227508545, "global_step": 197562, "epoch": 4703} {"train_loss": -7.245718955993652, "global_step": 197563, "epoch": 4703} {"train_loss": -7.111011505126953, "global_step": 197564, "epoch": 4703} {"train_loss": -7.318554878234863, "global_step": 197565, "epoch": 4703} {"train_loss": -7.032817840576172, "global_step": 197566, "epoch": 4703} {"train_loss": -7.194359143575032, "global_step": 197567, "epoch": 4703, "val_loss": 69741.3984375} {"train_loss": -7.2638840675354, "global_step": 197568, "epoch": 4704} {"train_loss": -7.2300310134887695, "global_step": 197569, "epoch": 4704} {"train_loss": -7.377574443817139, "global_step": 197570, "epoch": 4704} {"train_loss": -7.271059989929199, "global_step": 197571, "epoch": 4704} {"train_loss": -7.205758094787598, "global_step": 197572, "epoch": 4704} {"train_loss": -7.34892463684082, "global_step": 197573, "epoch": 4704} {"train_loss": -7.27477502822876, "global_step": 197574, "epoch": 4704} {"train_loss": -7.279905796051025, "global_step": 197575, "epoch": 4704} {"train_loss": -7.23802375793457, "global_step": 197576, "epoch": 4704} {"train_loss": -7.234274864196777, "global_step": 197577, "epoch": 4704} {"train_loss": -7.335063934326172, "global_step": 197578, "epoch": 4704} {"train_loss": -7.163880348205566, "global_step": 197579, "epoch": 4704} {"train_loss": -7.381953239440918, "global_step": 197580, "epoch": 4704} {"train_loss": -7.18634557723999, "global_step": 197581, "epoch": 4704} {"train_loss": -7.197478771209717, "global_step": 197582, "epoch": 4704} {"train_loss": -7.348029136657715, "global_step": 197583, "epoch": 4704} {"train_loss": -7.187426567077637, "global_step": 197584, "epoch": 4704} {"train_loss": -7.356029987335205, "global_step": 197585, "epoch": 4704} {"train_loss": -7.165620803833008, "global_step": 197586, "epoch": 4704} {"train_loss": -7.275460243225098, "global_step": 197587, "epoch": 4704} {"train_loss": -7.269871234893799, "global_step": 197588, "epoch": 4704} {"train_loss": -7.211864471435547, "global_step": 197589, "epoch": 4704} {"train_loss": -7.267712593078613, "global_step": 197590, "epoch": 4704} {"train_loss": -7.290408134460449, "global_step": 197591, "epoch": 4704} {"train_loss": -7.308149337768555, "global_step": 197592, "epoch": 4704} {"train_loss": -7.170647621154785, "global_step": 197593, "epoch": 4704} {"train_loss": -7.271240711212158, "global_step": 197594, "epoch": 4704} {"train_loss": -7.231846332550049, "global_step": 197595, "epoch": 4704} {"train_loss": -7.221835136413574, "global_step": 197596, "epoch": 4704} {"train_loss": -7.2854509353637695, "global_step": 197597, "epoch": 4704} {"train_loss": -7.151988506317139, "global_step": 197598, "epoch": 4704} {"train_loss": -7.219073295593262, "global_step": 197599, "epoch": 4704} {"train_loss": -7.226903915405273, "global_step": 197600, "epoch": 4704} {"train_loss": -7.272819519042969, "global_step": 197601, "epoch": 4704} {"train_loss": -7.238345146179199, "global_step": 197602, "epoch": 4704} {"train_loss": -7.3187761306762695, "global_step": 197603, "epoch": 4704} {"train_loss": -7.150617599487305, "global_step": 197604, "epoch": 4704} {"train_loss": -7.337437152862549, "global_step": 197605, "epoch": 4704} {"train_loss": -7.155386447906494, "global_step": 197606, "epoch": 4704} {"train_loss": -7.274474620819092, "global_step": 197607, "epoch": 4704} {"train_loss": -7.255057334899902, "global_step": 197608, "epoch": 4704} {"train_loss": -7.255464735485258, "global_step": 197609, "epoch": 4704, "val_loss": 69950.515625} {"train_loss": -7.30643367767334, "global_step": 197610, "epoch": 4705} {"train_loss": -7.363616943359375, "global_step": 197611, "epoch": 4705} {"train_loss": -7.212125778198242, "global_step": 197612, "epoch": 4705} {"train_loss": -7.3949785232543945, "global_step": 197613, "epoch": 4705} {"train_loss": -7.285542011260986, "global_step": 197614, "epoch": 4705} {"train_loss": -7.307511329650879, "global_step": 197615, "epoch": 4705} {"train_loss": -7.40187931060791, "global_step": 197616, "epoch": 4705} {"train_loss": -7.235361099243164, "global_step": 197617, "epoch": 4705} {"train_loss": -7.315771102905273, "global_step": 197618, "epoch": 4705} {"train_loss": -7.329135417938232, "global_step": 197619, "epoch": 4705} {"train_loss": -7.330144882202148, "global_step": 197620, "epoch": 4705} {"train_loss": -7.1425371170043945, "global_step": 197621, "epoch": 4705} {"train_loss": -7.173297882080078, "global_step": 197622, "epoch": 4705} {"train_loss": -7.018773555755615, "global_step": 197623, "epoch": 4705} {"train_loss": -7.0909504890441895, "global_step": 197624, "epoch": 4705} {"train_loss": -7.233822822570801, "global_step": 197625, "epoch": 4705} {"train_loss": -7.076963424682617, "global_step": 197626, "epoch": 4705} {"train_loss": -7.187902450561523, "global_step": 197627, "epoch": 4705} {"train_loss": -7.1530256271362305, "global_step": 197628, "epoch": 4705} {"train_loss": -7.127945899963379, "global_step": 197629, "epoch": 4705} {"train_loss": -7.11998987197876, "global_step": 197630, "epoch": 4705} {"train_loss": -7.159144401550293, "global_step": 197631, "epoch": 4705} {"train_loss": -7.331517219543457, "global_step": 197632, "epoch": 4705} {"train_loss": -7.18215274810791, "global_step": 197633, "epoch": 4705} {"train_loss": -7.189467430114746, "global_step": 197634, "epoch": 4705} {"train_loss": -7.236784934997559, "global_step": 197635, "epoch": 4705} {"train_loss": -7.228579044342041, "global_step": 197636, "epoch": 4705} {"train_loss": -7.191726207733154, "global_step": 197637, "epoch": 4705} {"train_loss": -7.351632595062256, "global_step": 197638, "epoch": 4705} {"train_loss": -7.209783554077148, "global_step": 197639, "epoch": 4705} {"train_loss": -7.161054611206055, "global_step": 197640, "epoch": 4705} {"train_loss": -7.267401695251465, "global_step": 197641, "epoch": 4705} {"train_loss": -7.376006126403809, "global_step": 197642, "epoch": 4705} {"train_loss": -7.269457817077637, "global_step": 197643, "epoch": 4705} {"train_loss": -7.135611057281494, "global_step": 197644, "epoch": 4705} {"train_loss": -7.3094916343688965, "global_step": 197645, "epoch": 4705} {"train_loss": -7.213286399841309, "global_step": 197646, "epoch": 4705} {"train_loss": -7.396090507507324, "global_step": 197647, "epoch": 4705} {"train_loss": -7.217691421508789, "global_step": 197648, "epoch": 4705} {"train_loss": -7.220724105834961, "global_step": 197649, "epoch": 4705} {"train_loss": -7.241795539855957, "global_step": 197650, "epoch": 4705} {"train_loss": -7.238217308407738, "global_step": 197651, "epoch": 4705, "val_loss": 69874.734375} {"train_loss": -7.278637409210205, "global_step": 197652, "epoch": 4706} {"train_loss": -7.2874884605407715, "global_step": 197653, "epoch": 4706} {"train_loss": -7.343554973602295, "global_step": 197654, "epoch": 4706} {"train_loss": -7.350247383117676, "global_step": 197655, "epoch": 4706} {"train_loss": -7.464121341705322, "global_step": 197656, "epoch": 4706} {"train_loss": -7.2885236740112305, "global_step": 197657, "epoch": 4706} {"train_loss": -7.2719011306762695, "global_step": 197658, "epoch": 4706} {"train_loss": -7.339114665985107, "global_step": 197659, "epoch": 4706} {"train_loss": -7.382514953613281, "global_step": 197660, "epoch": 4706} {"train_loss": -7.273518085479736, "global_step": 197661, "epoch": 4706} {"train_loss": -7.207738876342773, "global_step": 197662, "epoch": 4706} {"train_loss": -7.095577716827393, "global_step": 197663, "epoch": 4706} {"train_loss": -7.242539405822754, "global_step": 197664, "epoch": 4706} {"train_loss": -7.282304286956787, "global_step": 197665, "epoch": 4706} {"train_loss": -7.030205726623535, "global_step": 197666, "epoch": 4706} {"train_loss": -7.130733489990234, "global_step": 197667, "epoch": 4706} {"train_loss": -7.194225788116455, "global_step": 197668, "epoch": 4706} {"train_loss": -7.087970733642578, "global_step": 197669, "epoch": 4706} {"train_loss": -6.9478759765625, "global_step": 197670, "epoch": 4706} {"train_loss": -7.21769380569458, "global_step": 197671, "epoch": 4706} {"train_loss": -7.059305667877197, "global_step": 197672, "epoch": 4706} {"train_loss": -7.202334880828857, "global_step": 197673, "epoch": 4706} {"train_loss": -7.225076675415039, "global_step": 197674, "epoch": 4706} {"train_loss": -7.295167922973633, "global_step": 197675, "epoch": 4706} {"train_loss": -7.2071533203125, "global_step": 197676, "epoch": 4706} {"train_loss": -7.195871353149414, "global_step": 197677, "epoch": 4706} {"train_loss": -7.198442459106445, "global_step": 197678, "epoch": 4706} {"train_loss": -7.050632476806641, "global_step": 197679, "epoch": 4706} {"train_loss": -7.262676239013672, "global_step": 197680, "epoch": 4706} {"train_loss": -7.129388809204102, "global_step": 197681, "epoch": 4706} {"train_loss": -7.217473983764648, "global_step": 197682, "epoch": 4706} {"train_loss": -7.131709098815918, "global_step": 197683, "epoch": 4706} {"train_loss": -7.267703056335449, "global_step": 197684, "epoch": 4706} {"train_loss": -7.225815773010254, "global_step": 197685, "epoch": 4706} {"train_loss": -7.150884628295898, "global_step": 197686, "epoch": 4706} {"train_loss": -7.298982620239258, "global_step": 197687, "epoch": 4706} {"train_loss": -7.268991470336914, "global_step": 197688, "epoch": 4706} {"train_loss": -7.298987865447998, "global_step": 197689, "epoch": 4706} {"train_loss": -7.137853622436523, "global_step": 197690, "epoch": 4706} {"train_loss": -7.209423065185547, "global_step": 197691, "epoch": 4706} {"train_loss": -7.11406135559082, "global_step": 197692, "epoch": 4706} {"train_loss": -7.2167602607182095, "global_step": 197693, "epoch": 4706, "val_loss": 69913.4921875} {"train_loss": -7.211328983306885, "global_step": 197694, "epoch": 4707} {"train_loss": -7.058707237243652, "global_step": 197695, "epoch": 4707} {"train_loss": -7.246500015258789, "global_step": 197696, "epoch": 4707} {"train_loss": -7.297977924346924, "global_step": 197697, "epoch": 4707} {"train_loss": -7.180070877075195, "global_step": 197698, "epoch": 4707} {"train_loss": -7.278290748596191, "global_step": 197699, "epoch": 4707} {"train_loss": -7.225194931030273, "global_step": 197700, "epoch": 4707} {"train_loss": -7.278001308441162, "global_step": 197701, "epoch": 4707} {"train_loss": -7.26186466217041, "global_step": 197702, "epoch": 4707} {"train_loss": -7.097543716430664, "global_step": 197703, "epoch": 4707} {"train_loss": -7.312679290771484, "global_step": 197704, "epoch": 4707} {"train_loss": -7.344670295715332, "global_step": 197705, "epoch": 4707} {"train_loss": -7.105685710906982, "global_step": 197706, "epoch": 4707} {"train_loss": -7.366331100463867, "global_step": 197707, "epoch": 4707} {"train_loss": -7.165261268615723, "global_step": 197708, "epoch": 4707} {"train_loss": -7.093660354614258, "global_step": 197709, "epoch": 4707} {"train_loss": -7.098801612854004, "global_step": 197710, "epoch": 4707} {"train_loss": -7.222143173217773, "global_step": 197711, "epoch": 4707} {"train_loss": -7.25105094909668, "global_step": 197712, "epoch": 4707} {"train_loss": -7.0872392654418945, "global_step": 197713, "epoch": 4707} {"train_loss": -7.2517852783203125, "global_step": 197714, "epoch": 4707} {"train_loss": -7.213646411895752, "global_step": 197715, "epoch": 4707} {"train_loss": -7.228178024291992, "global_step": 197716, "epoch": 4707} {"train_loss": -7.233504772186279, "global_step": 197717, "epoch": 4707} {"train_loss": -7.443382740020752, "global_step": 197718, "epoch": 4707} {"train_loss": -7.23724365234375, "global_step": 197719, "epoch": 4707} {"train_loss": -7.106626987457275, "global_step": 197720, "epoch": 4707} {"train_loss": -7.347799301147461, "global_step": 197721, "epoch": 4707} {"train_loss": -7.19208288192749, "global_step": 197722, "epoch": 4707} {"train_loss": -7.128396987915039, "global_step": 197723, "epoch": 4707} {"train_loss": -7.255333423614502, "global_step": 197724, "epoch": 4707} {"train_loss": -7.236738204956055, "global_step": 197725, "epoch": 4707} {"train_loss": -7.076176643371582, "global_step": 197726, "epoch": 4707} {"train_loss": -7.261262893676758, "global_step": 197727, "epoch": 4707} {"train_loss": -7.366781711578369, "global_step": 197728, "epoch": 4707} {"train_loss": -7.167720794677734, "global_step": 197729, "epoch": 4707} {"train_loss": -7.2413649559021, "global_step": 197730, "epoch": 4707} {"train_loss": -7.381641387939453, "global_step": 197731, "epoch": 4707} {"train_loss": -7.205373764038086, "global_step": 197732, "epoch": 4707} {"train_loss": -7.313209533691406, "global_step": 197733, "epoch": 4707} {"train_loss": -7.208023548126221, "global_step": 197734, "epoch": 4707} {"train_loss": -7.226986748831613, "global_step": 197735, "epoch": 4707, "val_loss": 69712.6015625} {"train_loss": -7.316840171813965, "global_step": 197736, "epoch": 4708} {"train_loss": -7.214230537414551, "global_step": 197737, "epoch": 4708} {"train_loss": -7.438265800476074, "global_step": 197738, "epoch": 4708} {"train_loss": -7.178743362426758, "global_step": 197739, "epoch": 4708} {"train_loss": -7.2429728507995605, "global_step": 197740, "epoch": 4708} {"train_loss": -7.248884201049805, "global_step": 197741, "epoch": 4708} {"train_loss": -7.169593811035156, "global_step": 197742, "epoch": 4708} {"train_loss": -7.2134785652160645, "global_step": 197743, "epoch": 4708} {"train_loss": -7.157646179199219, "global_step": 197744, "epoch": 4708} {"train_loss": -7.273990631103516, "global_step": 197745, "epoch": 4708} {"train_loss": -7.174156188964844, "global_step": 197746, "epoch": 4708} {"train_loss": -7.141685485839844, "global_step": 197747, "epoch": 4708} {"train_loss": -7.270981788635254, "global_step": 197748, "epoch": 4708} {"train_loss": -7.155658721923828, "global_step": 197749, "epoch": 4708} {"train_loss": -7.203579425811768, "global_step": 197750, "epoch": 4708} {"train_loss": -7.156003952026367, "global_step": 197751, "epoch": 4708} {"train_loss": -7.225926399230957, "global_step": 197752, "epoch": 4708} {"train_loss": -7.2355756759643555, "global_step": 197753, "epoch": 4708} {"train_loss": -7.229732990264893, "global_step": 197754, "epoch": 4708} {"train_loss": -7.299168109893799, "global_step": 197755, "epoch": 4708} {"train_loss": -7.248051643371582, "global_step": 197756, "epoch": 4708} {"train_loss": -7.083555221557617, "global_step": 197757, "epoch": 4708} {"train_loss": -7.287146091461182, "global_step": 197758, "epoch": 4708} {"train_loss": -7.221837043762207, "global_step": 197759, "epoch": 4708} {"train_loss": -7.18612003326416, "global_step": 197760, "epoch": 4708} {"train_loss": -7.30588436126709, "global_step": 197761, "epoch": 4708} {"train_loss": -7.117429256439209, "global_step": 197762, "epoch": 4708} {"train_loss": -7.255537986755371, "global_step": 197763, "epoch": 4708} {"train_loss": -7.274466514587402, "global_step": 197764, "epoch": 4708} {"train_loss": -7.271705627441406, "global_step": 197765, "epoch": 4708} {"train_loss": -7.227892875671387, "global_step": 197766, "epoch": 4708} {"train_loss": -7.316866874694824, "global_step": 197767, "epoch": 4708} {"train_loss": -7.318774223327637, "global_step": 197768, "epoch": 4708} {"train_loss": -7.317079544067383, "global_step": 197769, "epoch": 4708} {"train_loss": -7.390239715576172, "global_step": 197770, "epoch": 4708} {"train_loss": -7.352881908416748, "global_step": 197771, "epoch": 4708} {"train_loss": -7.259082794189453, "global_step": 197772, "epoch": 4708} {"train_loss": -7.27851676940918, "global_step": 197773, "epoch": 4708} {"train_loss": -7.3656110763549805, "global_step": 197774, "epoch": 4708} {"train_loss": -7.418724536895752, "global_step": 197775, "epoch": 4708} {"train_loss": -7.249268054962158, "global_step": 197776, "epoch": 4708} {"train_loss": -7.252849079313732, "global_step": 197777, "epoch": 4708, "val_loss": 69731.8125} {"train_loss": -7.258669853210449, "global_step": 197778, "epoch": 4709} {"train_loss": -7.192437171936035, "global_step": 197779, "epoch": 4709} {"train_loss": -7.353216171264648, "global_step": 197780, "epoch": 4709} {"train_loss": -7.299827575683594, "global_step": 197781, "epoch": 4709} {"train_loss": -7.269010066986084, "global_step": 197782, "epoch": 4709} {"train_loss": -7.146353721618652, "global_step": 197783, "epoch": 4709} {"train_loss": -7.103801727294922, "global_step": 197784, "epoch": 4709} {"train_loss": -7.180408000946045, "global_step": 197785, "epoch": 4709} {"train_loss": -7.331799507141113, "global_step": 197786, "epoch": 4709} {"train_loss": -7.262345314025879, "global_step": 197787, "epoch": 4709} {"train_loss": -7.253022193908691, "global_step": 197788, "epoch": 4709} {"train_loss": -7.329615592956543, "global_step": 197789, "epoch": 4709} {"train_loss": -7.398018836975098, "global_step": 197790, "epoch": 4709} {"train_loss": -7.161149978637695, "global_step": 197791, "epoch": 4709} {"train_loss": -7.253220081329346, "global_step": 197792, "epoch": 4709} {"train_loss": -7.283283710479736, "global_step": 197793, "epoch": 4709} {"train_loss": -7.260941505432129, "global_step": 197794, "epoch": 4709} {"train_loss": -7.267839431762695, "global_step": 197795, "epoch": 4709} {"train_loss": -7.290923118591309, "global_step": 197796, "epoch": 4709} {"train_loss": -7.216008186340332, "global_step": 197797, "epoch": 4709} {"train_loss": -7.257798671722412, "global_step": 197798, "epoch": 4709} {"train_loss": -7.168985366821289, "global_step": 197799, "epoch": 4709} {"train_loss": -7.170914649963379, "global_step": 197800, "epoch": 4709} {"train_loss": -7.268604278564453, "global_step": 197801, "epoch": 4709} {"train_loss": -7.1888837814331055, "global_step": 197802, "epoch": 4709} {"train_loss": -7.301114082336426, "global_step": 197803, "epoch": 4709} {"train_loss": -7.3472394943237305, "global_step": 197804, "epoch": 4709} {"train_loss": -7.190317153930664, "global_step": 197805, "epoch": 4709} {"train_loss": -7.2107977867126465, "global_step": 197806, "epoch": 4709} {"train_loss": -7.172435283660889, "global_step": 197807, "epoch": 4709} {"train_loss": -7.059692859649658, "global_step": 197808, "epoch": 4709} {"train_loss": -7.183320045471191, "global_step": 197809, "epoch": 4709} {"train_loss": -7.333481788635254, "global_step": 197810, "epoch": 4709} {"train_loss": -7.1093854904174805, "global_step": 197811, "epoch": 4709} {"train_loss": -7.329648017883301, "global_step": 197812, "epoch": 4709} {"train_loss": -7.142751693725586, "global_step": 197813, "epoch": 4709} {"train_loss": -7.04305362701416, "global_step": 197814, "epoch": 4709} {"train_loss": -7.210052490234375, "global_step": 197815, "epoch": 4709} {"train_loss": -7.149021148681641, "global_step": 197816, "epoch": 4709} {"train_loss": -7.105935096740723, "global_step": 197817, "epoch": 4709} {"train_loss": -7.2516865730285645, "global_step": 197818, "epoch": 4709} {"train_loss": -7.224315620604015, "global_step": 197819, "epoch": 4709, "val_loss": 69885.78125} {"train_loss": -7.143953800201416, "global_step": 197820, "epoch": 4710} {"train_loss": -7.322009086608887, "global_step": 197821, "epoch": 4710} {"train_loss": -7.11153507232666, "global_step": 197822, "epoch": 4710} {"train_loss": -7.2673540115356445, "global_step": 197823, "epoch": 4710} {"train_loss": -7.23095703125, "global_step": 197824, "epoch": 4710} {"train_loss": -7.163548469543457, "global_step": 197825, "epoch": 4710} {"train_loss": -7.009207725524902, "global_step": 197826, "epoch": 4710} {"train_loss": -7.249266624450684, "global_step": 197827, "epoch": 4710} {"train_loss": -7.204965591430664, "global_step": 197828, "epoch": 4710} {"train_loss": -7.350454330444336, "global_step": 197829, "epoch": 4710} {"train_loss": -7.2719316482543945, "global_step": 197830, "epoch": 4710} {"train_loss": -7.277802467346191, "global_step": 197831, "epoch": 4710} {"train_loss": -7.267278671264648, "global_step": 197832, "epoch": 4710} {"train_loss": -7.295267105102539, "global_step": 197833, "epoch": 4710} {"train_loss": -7.199713706970215, "global_step": 197834, "epoch": 4710} {"train_loss": -7.140649318695068, "global_step": 197835, "epoch": 4710} {"train_loss": -7.2973809242248535, "global_step": 197836, "epoch": 4710} {"train_loss": -7.386295318603516, "global_step": 197837, "epoch": 4710} {"train_loss": -7.319971561431885, "global_step": 197838, "epoch": 4710} {"train_loss": -7.342679023742676, "global_step": 197839, "epoch": 4710} {"train_loss": -7.271350383758545, "global_step": 197840, "epoch": 4710} {"train_loss": -7.353822231292725, "global_step": 197841, "epoch": 4710} {"train_loss": -7.293322563171387, "global_step": 197842, "epoch": 4710} {"train_loss": -7.268606185913086, "global_step": 197843, "epoch": 4710} {"train_loss": -7.194443225860596, "global_step": 197844, "epoch": 4710} {"train_loss": -7.2646284103393555, "global_step": 197845, "epoch": 4710} {"train_loss": -7.224900245666504, "global_step": 197846, "epoch": 4710} {"train_loss": -7.215347766876221, "global_step": 197847, "epoch": 4710} {"train_loss": -7.2758636474609375, "global_step": 197848, "epoch": 4710} {"train_loss": -7.2295823097229, "global_step": 197849, "epoch": 4710} {"train_loss": -7.257786750793457, "global_step": 197850, "epoch": 4710} {"train_loss": -7.3485212326049805, "global_step": 197851, "epoch": 4710} {"train_loss": -7.237736701965332, "global_step": 197852, "epoch": 4710} {"train_loss": -7.2748212814331055, "global_step": 197853, "epoch": 4710} {"train_loss": -7.250118732452393, "global_step": 197854, "epoch": 4710} {"train_loss": -7.24835205078125, "global_step": 197855, "epoch": 4710} {"train_loss": -7.311007976531982, "global_step": 197856, "epoch": 4710} {"train_loss": -7.390589714050293, "global_step": 197857, "epoch": 4710} {"train_loss": -7.3253583908081055, "global_step": 197858, "epoch": 4710} {"train_loss": -7.330209255218506, "global_step": 197859, "epoch": 4710} {"train_loss": -7.351336479187012, "global_step": 197860, "epoch": 4710} {"train_loss": -7.263547715686617, "global_step": 197861, "epoch": 4710, "val_loss": 69697.8671875} {"train_loss": -7.282947540283203, "global_step": 197862, "epoch": 4711} {"train_loss": -7.309128761291504, "global_step": 197863, "epoch": 4711} {"train_loss": -7.3463640213012695, "global_step": 197864, "epoch": 4711} {"train_loss": -7.43548059463501, "global_step": 197865, "epoch": 4711} {"train_loss": -7.365490913391113, "global_step": 197866, "epoch": 4711} {"train_loss": -7.301095008850098, "global_step": 197867, "epoch": 4711} {"train_loss": -7.373804092407227, "global_step": 197868, "epoch": 4711} {"train_loss": -7.252435684204102, "global_step": 197869, "epoch": 4711} {"train_loss": -7.218626022338867, "global_step": 197870, "epoch": 4711} {"train_loss": -7.294857025146484, "global_step": 197871, "epoch": 4711} {"train_loss": -7.301276206970215, "global_step": 197872, "epoch": 4711} {"train_loss": -7.250644683837891, "global_step": 197873, "epoch": 4711} {"train_loss": -7.329363822937012, "global_step": 197874, "epoch": 4711} {"train_loss": -7.262166976928711, "global_step": 197875, "epoch": 4711} {"train_loss": -7.337123394012451, "global_step": 197876, "epoch": 4711} {"train_loss": -7.228975296020508, "global_step": 197877, "epoch": 4711} {"train_loss": -7.178118705749512, "global_step": 197878, "epoch": 4711} {"train_loss": -7.281688213348389, "global_step": 197879, "epoch": 4711} {"train_loss": -7.334130764007568, "global_step": 197880, "epoch": 4711} {"train_loss": -7.273548126220703, "global_step": 197881, "epoch": 4711} {"train_loss": -7.196215629577637, "global_step": 197882, "epoch": 4711} {"train_loss": -7.303032875061035, "global_step": 197883, "epoch": 4711} {"train_loss": -7.303293228149414, "global_step": 197884, "epoch": 4711} {"train_loss": -7.31003475189209, "global_step": 197885, "epoch": 4711} {"train_loss": -7.128698348999023, "global_step": 197886, "epoch": 4711} {"train_loss": -7.331470489501953, "global_step": 197887, "epoch": 4711} {"train_loss": -7.271129608154297, "global_step": 197888, "epoch": 4711} {"train_loss": -7.277423858642578, "global_step": 197889, "epoch": 4711} {"train_loss": -7.256680011749268, "global_step": 197890, "epoch": 4711} {"train_loss": -7.215304374694824, "global_step": 197891, "epoch": 4711} {"train_loss": -7.245122909545898, "global_step": 197892, "epoch": 4711} {"train_loss": -7.321839332580566, "global_step": 197893, "epoch": 4711} {"train_loss": -7.2491135597229, "global_step": 197894, "epoch": 4711} {"train_loss": -7.298612117767334, "global_step": 197895, "epoch": 4711} {"train_loss": -7.153413772583008, "global_step": 197896, "epoch": 4711} {"train_loss": -7.224601745605469, "global_step": 197897, "epoch": 4711} {"train_loss": -7.2829694747924805, "global_step": 197898, "epoch": 4711} {"train_loss": -7.206198692321777, "global_step": 197899, "epoch": 4711} {"train_loss": -7.184003829956055, "global_step": 197900, "epoch": 4711} {"train_loss": -7.289097785949707, "global_step": 197901, "epoch": 4711} {"train_loss": -7.156966209411621, "global_step": 197902, "epoch": 4711} {"train_loss": -7.271217357544672, "global_step": 197903, "epoch": 4711, "val_loss": 69799.078125} {"train_loss": -7.321187496185303, "global_step": 197904, "epoch": 4712} {"train_loss": -7.160296440124512, "global_step": 197905, "epoch": 4712} {"train_loss": -7.223401069641113, "global_step": 197906, "epoch": 4712} {"train_loss": -7.283599853515625, "global_step": 197907, "epoch": 4712} {"train_loss": -7.181140899658203, "global_step": 197908, "epoch": 4712} {"train_loss": -7.269906044006348, "global_step": 197909, "epoch": 4712} {"train_loss": -7.338257789611816, "global_step": 197910, "epoch": 4712} {"train_loss": -7.23952579498291, "global_step": 197911, "epoch": 4712} {"train_loss": -7.338321208953857, "global_step": 197912, "epoch": 4712} {"train_loss": -7.145663261413574, "global_step": 197913, "epoch": 4712} {"train_loss": -7.314708232879639, "global_step": 197914, "epoch": 4712} {"train_loss": -7.1395463943481445, "global_step": 197915, "epoch": 4712} {"train_loss": -7.184008598327637, "global_step": 197916, "epoch": 4712} {"train_loss": -7.124750137329102, "global_step": 197917, "epoch": 4712} {"train_loss": -7.182046890258789, "global_step": 197918, "epoch": 4712} {"train_loss": -7.218711853027344, "global_step": 197919, "epoch": 4712} {"train_loss": -7.059264183044434, "global_step": 197920, "epoch": 4712} {"train_loss": -7.071964263916016, "global_step": 197921, "epoch": 4712} {"train_loss": -7.009779453277588, "global_step": 197922, "epoch": 4712} {"train_loss": -7.121365547180176, "global_step": 197923, "epoch": 4712} {"train_loss": -6.889564514160156, "global_step": 197924, "epoch": 4712} {"train_loss": -7.193391799926758, "global_step": 197925, "epoch": 4712} {"train_loss": -7.074695587158203, "global_step": 197926, "epoch": 4712} {"train_loss": -7.121407985687256, "global_step": 197927, "epoch": 4712} {"train_loss": -7.262511253356934, "global_step": 197928, "epoch": 4712} {"train_loss": -7.129960060119629, "global_step": 197929, "epoch": 4712} {"train_loss": -7.131627082824707, "global_step": 197930, "epoch": 4712} {"train_loss": -7.117646217346191, "global_step": 197931, "epoch": 4712} {"train_loss": -7.150075912475586, "global_step": 197932, "epoch": 4712} {"train_loss": -7.126898765563965, "global_step": 197933, "epoch": 4712} {"train_loss": -7.164952278137207, "global_step": 197934, "epoch": 4712} {"train_loss": -7.051188945770264, "global_step": 197935, "epoch": 4712} {"train_loss": -7.170835971832275, "global_step": 197936, "epoch": 4712} {"train_loss": -7.162517070770264, "global_step": 197937, "epoch": 4712} {"train_loss": -7.246960639953613, "global_step": 197938, "epoch": 4712} {"train_loss": -7.241323471069336, "global_step": 197939, "epoch": 4712} {"train_loss": -7.239296913146973, "global_step": 197940, "epoch": 4712} {"train_loss": -7.231263637542725, "global_step": 197941, "epoch": 4712} {"train_loss": -7.247944355010986, "global_step": 197942, "epoch": 4712} {"train_loss": -7.232020378112793, "global_step": 197943, "epoch": 4712} {"train_loss": -7.265035629272461, "global_step": 197944, "epoch": 4712} {"train_loss": -7.181152411869594, "global_step": 197945, "epoch": 4712, "val_loss": 69644.7109375} {"train_loss": -7.240286827087402, "global_step": 197946, "epoch": 4713} {"train_loss": -7.3142218589782715, "global_step": 197947, "epoch": 4713} {"train_loss": -7.303621292114258, "global_step": 197948, "epoch": 4713} {"train_loss": -7.197011470794678, "global_step": 197949, "epoch": 4713} {"train_loss": -7.282443523406982, "global_step": 197950, "epoch": 4713} {"train_loss": -7.274379730224609, "global_step": 197951, "epoch": 4713} {"train_loss": -7.25993537902832, "global_step": 197952, "epoch": 4713} {"train_loss": -7.388731479644775, "global_step": 197953, "epoch": 4713} {"train_loss": -7.337482929229736, "global_step": 197954, "epoch": 4713} {"train_loss": -7.2859039306640625, "global_step": 197955, "epoch": 4713} {"train_loss": -7.348934173583984, "global_step": 197956, "epoch": 4713} {"train_loss": -7.3010454177856445, "global_step": 197957, "epoch": 4713} {"train_loss": -7.2562575340271, "global_step": 197958, "epoch": 4713} {"train_loss": -7.250931739807129, "global_step": 197959, "epoch": 4713} {"train_loss": -7.221578121185303, "global_step": 197960, "epoch": 4713} {"train_loss": -7.259010314941406, "global_step": 197961, "epoch": 4713} {"train_loss": -7.385265350341797, "global_step": 197962, "epoch": 4713} {"train_loss": -7.359927177429199, "global_step": 197963, "epoch": 4713} {"train_loss": -7.246899127960205, "global_step": 197964, "epoch": 4713} {"train_loss": -7.260261535644531, "global_step": 197965, "epoch": 4713} {"train_loss": -7.3115105628967285, "global_step": 197966, "epoch": 4713} {"train_loss": -7.211871147155762, "global_step": 197967, "epoch": 4713} {"train_loss": -7.396088123321533, "global_step": 197968, "epoch": 4713} {"train_loss": -7.389555931091309, "global_step": 197969, "epoch": 4713} {"train_loss": -7.348072528839111, "global_step": 197970, "epoch": 4713} {"train_loss": -7.373378753662109, "global_step": 197971, "epoch": 4713} {"train_loss": -7.38808536529541, "global_step": 197972, "epoch": 4713} {"train_loss": -7.219371318817139, "global_step": 197973, "epoch": 4713} {"train_loss": -7.305783271789551, "global_step": 197974, "epoch": 4713} {"train_loss": -7.321261405944824, "global_step": 197975, "epoch": 4713} {"train_loss": -7.314970970153809, "global_step": 197976, "epoch": 4713} {"train_loss": -7.347349166870117, "global_step": 197977, "epoch": 4713} {"train_loss": -7.336780548095703, "global_step": 197978, "epoch": 4713} {"train_loss": -7.300454139709473, "global_step": 197979, "epoch": 4713} {"train_loss": -7.140603065490723, "global_step": 197980, "epoch": 4713} {"train_loss": -7.2945404052734375, "global_step": 197981, "epoch": 4713} {"train_loss": -7.254300594329834, "global_step": 197982, "epoch": 4713} {"train_loss": -7.328764915466309, "global_step": 197983, "epoch": 4713} {"train_loss": -7.30202054977417, "global_step": 197984, "epoch": 4713} {"train_loss": -7.353282928466797, "global_step": 197985, "epoch": 4713} {"train_loss": -7.298315048217773, "global_step": 197986, "epoch": 4713} {"train_loss": -7.298151379539853, "global_step": 197987, "epoch": 4713, "val_loss": 69905.984375} {"train_loss": -7.144932746887207, "global_step": 197988, "epoch": 4714} {"train_loss": -7.277276992797852, "global_step": 197989, "epoch": 4714} {"train_loss": -7.285507678985596, "global_step": 197990, "epoch": 4714} {"train_loss": -7.252195835113525, "global_step": 197991, "epoch": 4714} {"train_loss": -7.305014610290527, "global_step": 197992, "epoch": 4714} {"train_loss": -7.438384056091309, "global_step": 197993, "epoch": 4714} {"train_loss": -7.30726432800293, "global_step": 197994, "epoch": 4714} {"train_loss": -7.42056941986084, "global_step": 197995, "epoch": 4714} {"train_loss": -7.3125081062316895, "global_step": 197996, "epoch": 4714} {"train_loss": -7.388570785522461, "global_step": 197997, "epoch": 4714} {"train_loss": -7.302091121673584, "global_step": 197998, "epoch": 4714} {"train_loss": -7.3474955558776855, "global_step": 197999, "epoch": 4714} {"train_loss": -7.382944107055664, "global_step": 198000, "epoch": 4714} {"train_loss": -7.341597557067871, "global_step": 198001, "epoch": 4714} {"train_loss": -7.334713935852051, "global_step": 198002, "epoch": 4714} {"train_loss": -7.298121452331543, "global_step": 198003, "epoch": 4714} {"train_loss": -7.282938480377197, "global_step": 198004, "epoch": 4714} {"train_loss": -7.353468894958496, "global_step": 198005, "epoch": 4714} {"train_loss": -7.3709282875061035, "global_step": 198006, "epoch": 4714} {"train_loss": -7.310240268707275, "global_step": 198007, "epoch": 4714} {"train_loss": -7.290201187133789, "global_step": 198008, "epoch": 4714} {"train_loss": -7.194024085998535, "global_step": 198009, "epoch": 4714} {"train_loss": -7.27664852142334, "global_step": 198010, "epoch": 4714} {"train_loss": -7.306483745574951, "global_step": 198011, "epoch": 4714} {"train_loss": -7.245038986206055, "global_step": 198012, "epoch": 4714} {"train_loss": -7.294507026672363, "global_step": 198013, "epoch": 4714} {"train_loss": -7.220285892486572, "global_step": 198014, "epoch": 4714} {"train_loss": -7.34121036529541, "global_step": 198015, "epoch": 4714} {"train_loss": -7.3147687911987305, "global_step": 198016, "epoch": 4714} {"train_loss": -7.361924171447754, "global_step": 198017, "epoch": 4714} {"train_loss": -7.120609283447266, "global_step": 198018, "epoch": 4714} {"train_loss": -7.249780654907227, "global_step": 198019, "epoch": 4714} {"train_loss": -7.344481468200684, "global_step": 198020, "epoch": 4714} {"train_loss": -7.195263862609863, "global_step": 198021, "epoch": 4714} {"train_loss": -7.319591522216797, "global_step": 198022, "epoch": 4714} {"train_loss": -7.264801502227783, "global_step": 198023, "epoch": 4714} {"train_loss": -7.231206893920898, "global_step": 198024, "epoch": 4714} {"train_loss": -7.2621564865112305, "global_step": 198025, "epoch": 4714} {"train_loss": -7.2043609619140625, "global_step": 198026, "epoch": 4714} {"train_loss": -7.299412727355957, "global_step": 198027, "epoch": 4714} {"train_loss": -7.24751615524292, "global_step": 198028, "epoch": 4714} {"train_loss": -7.292195921852475, "global_step": 198029, "epoch": 4714, "val_loss": 69682.9921875} {"train_loss": -7.294196128845215, "global_step": 198030, "epoch": 4715} {"train_loss": -7.298621654510498, "global_step": 198031, "epoch": 4715} {"train_loss": -7.322086334228516, "global_step": 198032, "epoch": 4715} {"train_loss": -7.1942644119262695, "global_step": 198033, "epoch": 4715} {"train_loss": -7.153467178344727, "global_step": 198034, "epoch": 4715} {"train_loss": -7.267024993896484, "global_step": 198035, "epoch": 4715} {"train_loss": -7.159615516662598, "global_step": 198036, "epoch": 4715} {"train_loss": -7.231596946716309, "global_step": 198037, "epoch": 4715} {"train_loss": -7.435569763183594, "global_step": 198038, "epoch": 4715} {"train_loss": -7.295389175415039, "global_step": 198039, "epoch": 4715} {"train_loss": -7.266058921813965, "global_step": 198040, "epoch": 4715} {"train_loss": -7.240833282470703, "global_step": 198041, "epoch": 4715} {"train_loss": -7.216716289520264, "global_step": 198042, "epoch": 4715} {"train_loss": -7.317620754241943, "global_step": 198043, "epoch": 4715} {"train_loss": -7.282956123352051, "global_step": 198044, "epoch": 4715} {"train_loss": -7.40608024597168, "global_step": 198045, "epoch": 4715} {"train_loss": -7.291665077209473, "global_step": 198046, "epoch": 4715} {"train_loss": -7.277370929718018, "global_step": 198047, "epoch": 4715} {"train_loss": -7.193391799926758, "global_step": 198048, "epoch": 4715} {"train_loss": -7.348850250244141, "global_step": 198049, "epoch": 4715} {"train_loss": -7.286660194396973, "global_step": 198050, "epoch": 4715} {"train_loss": -7.401974678039551, "global_step": 198051, "epoch": 4715} {"train_loss": -7.318398475646973, "global_step": 198052, "epoch": 4715} {"train_loss": -7.333558559417725, "global_step": 198053, "epoch": 4715} {"train_loss": -7.2730841636657715, "global_step": 198054, "epoch": 4715} {"train_loss": -7.265498638153076, "global_step": 198055, "epoch": 4715} {"train_loss": -7.250481605529785, "global_step": 198056, "epoch": 4715} {"train_loss": -7.206155776977539, "global_step": 198057, "epoch": 4715} {"train_loss": -7.301246643066406, "global_step": 198058, "epoch": 4715} {"train_loss": -7.212313652038574, "global_step": 198059, "epoch": 4715} {"train_loss": -7.207552909851074, "global_step": 198060, "epoch": 4715} {"train_loss": -7.120218753814697, "global_step": 198061, "epoch": 4715} {"train_loss": -7.18814754486084, "global_step": 198062, "epoch": 4715} {"train_loss": -7.113374710083008, "global_step": 198063, "epoch": 4715} {"train_loss": -7.125373840332031, "global_step": 198064, "epoch": 4715} {"train_loss": -7.076496124267578, "global_step": 198065, "epoch": 4715} {"train_loss": -7.210702896118164, "global_step": 198066, "epoch": 4715} {"train_loss": -7.170607566833496, "global_step": 198067, "epoch": 4715} {"train_loss": -7.091523170471191, "global_step": 198068, "epoch": 4715} {"train_loss": -7.19713830947876, "global_step": 198069, "epoch": 4715} {"train_loss": -7.1432929039001465, "global_step": 198070, "epoch": 4715} {"train_loss": -7.245511792954945, "global_step": 198071, "epoch": 4715, "val_loss": 69973.8984375} {"train_loss": -6.995680809020996, "global_step": 198072, "epoch": 4716} {"train_loss": -7.1969499588012695, "global_step": 198073, "epoch": 4716} {"train_loss": -7.08038330078125, "global_step": 198074, "epoch": 4716} {"train_loss": -7.185656547546387, "global_step": 198075, "epoch": 4716} {"train_loss": -7.177603721618652, "global_step": 198076, "epoch": 4716} {"train_loss": -7.101536750793457, "global_step": 198077, "epoch": 4716} {"train_loss": -7.139218330383301, "global_step": 198078, "epoch": 4716} {"train_loss": -7.271490573883057, "global_step": 198079, "epoch": 4716} {"train_loss": -7.211552619934082, "global_step": 198080, "epoch": 4716} {"train_loss": -7.304835319519043, "global_step": 198081, "epoch": 4716} {"train_loss": -7.121956825256348, "global_step": 198082, "epoch": 4716} {"train_loss": -7.2692952156066895, "global_step": 198083, "epoch": 4716} {"train_loss": -7.172580718994141, "global_step": 198084, "epoch": 4716} {"train_loss": -7.278580665588379, "global_step": 198085, "epoch": 4716} {"train_loss": -7.271407127380371, "global_step": 198086, "epoch": 4716} {"train_loss": -7.194995880126953, "global_step": 198087, "epoch": 4716} {"train_loss": -7.194183349609375, "global_step": 198088, "epoch": 4716} {"train_loss": -6.912425518035889, "global_step": 198089, "epoch": 4716} {"train_loss": -7.136525630950928, "global_step": 198090, "epoch": 4716} {"train_loss": -7.1048736572265625, "global_step": 198091, "epoch": 4716} {"train_loss": -7.132340908050537, "global_step": 198092, "epoch": 4716} {"train_loss": -7.258953094482422, "global_step": 198093, "epoch": 4716} {"train_loss": -7.126507759094238, "global_step": 198094, "epoch": 4716} {"train_loss": -7.092604160308838, "global_step": 198095, "epoch": 4716} {"train_loss": -7.421943664550781, "global_step": 198096, "epoch": 4716} {"train_loss": -7.064942836761475, "global_step": 198097, "epoch": 4716} {"train_loss": -7.073580741882324, "global_step": 198098, "epoch": 4716} {"train_loss": -7.213129043579102, "global_step": 198099, "epoch": 4716} {"train_loss": -7.104619026184082, "global_step": 198100, "epoch": 4716} {"train_loss": -7.198221206665039, "global_step": 198101, "epoch": 4716} {"train_loss": -7.154448509216309, "global_step": 198102, "epoch": 4716} {"train_loss": -7.099974632263184, "global_step": 198103, "epoch": 4716} {"train_loss": -7.1487932205200195, "global_step": 198104, "epoch": 4716} {"train_loss": -7.295098781585693, "global_step": 198105, "epoch": 4716} {"train_loss": -7.170382976531982, "global_step": 198106, "epoch": 4716} {"train_loss": -7.13541316986084, "global_step": 198107, "epoch": 4716} {"train_loss": -7.119747161865234, "global_step": 198108, "epoch": 4716} {"train_loss": -7.222071170806885, "global_step": 198109, "epoch": 4716} {"train_loss": -7.205535411834717, "global_step": 198110, "epoch": 4716} {"train_loss": -7.177674770355225, "global_step": 198111, "epoch": 4716} {"train_loss": -7.126502513885498, "global_step": 198112, "epoch": 4716} {"train_loss": -7.168505884352184, "global_step": 198113, "epoch": 4716, "val_loss": 69494.0703125} {"train_loss": -7.257107734680176, "global_step": 198114, "epoch": 4717} {"train_loss": -7.210788726806641, "global_step": 198115, "epoch": 4717} {"train_loss": -7.247224807739258, "global_step": 198116, "epoch": 4717} {"train_loss": -7.303054332733154, "global_step": 198117, "epoch": 4717} {"train_loss": -7.3133134841918945, "global_step": 198118, "epoch": 4717} {"train_loss": -7.303434371948242, "global_step": 198119, "epoch": 4717} {"train_loss": -7.231380462646484, "global_step": 198120, "epoch": 4717} {"train_loss": -7.2224931716918945, "global_step": 198121, "epoch": 4717} {"train_loss": -7.260745525360107, "global_step": 198122, "epoch": 4717} {"train_loss": -7.2608561515808105, "global_step": 198123, "epoch": 4717} {"train_loss": -7.242435455322266, "global_step": 198124, "epoch": 4717} {"train_loss": -7.24282169342041, "global_step": 198125, "epoch": 4717} {"train_loss": -7.274343013763428, "global_step": 198126, "epoch": 4717} {"train_loss": -7.162594795227051, "global_step": 198127, "epoch": 4717} {"train_loss": -7.329888343811035, "global_step": 198128, "epoch": 4717} {"train_loss": -7.324586391448975, "global_step": 198129, "epoch": 4717} {"train_loss": -7.294744491577148, "global_step": 198130, "epoch": 4717} {"train_loss": -7.266132354736328, "global_step": 198131, "epoch": 4717} {"train_loss": -7.209927558898926, "global_step": 198132, "epoch": 4717} {"train_loss": -7.155932426452637, "global_step": 198133, "epoch": 4717} {"train_loss": -7.275625228881836, "global_step": 198134, "epoch": 4717} {"train_loss": -7.3255085945129395, "global_step": 198135, "epoch": 4717} {"train_loss": -7.355319976806641, "global_step": 198136, "epoch": 4717} {"train_loss": -7.305546760559082, "global_step": 198137, "epoch": 4717} {"train_loss": -7.337946891784668, "global_step": 198138, "epoch": 4717} {"train_loss": -7.351655960083008, "global_step": 198139, "epoch": 4717} {"train_loss": -7.34340763092041, "global_step": 198140, "epoch": 4717} {"train_loss": -7.271500587463379, "global_step": 198141, "epoch": 4717} {"train_loss": -7.362644195556641, "global_step": 198142, "epoch": 4717} {"train_loss": -7.273927688598633, "global_step": 198143, "epoch": 4717} {"train_loss": -7.312592506408691, "global_step": 198144, "epoch": 4717} {"train_loss": -7.297721862792969, "global_step": 198145, "epoch": 4717} {"train_loss": -7.253593921661377, "global_step": 198146, "epoch": 4717} {"train_loss": -7.262723922729492, "global_step": 198147, "epoch": 4717} {"train_loss": -7.327855110168457, "global_step": 198148, "epoch": 4717} {"train_loss": -7.266211986541748, "global_step": 198149, "epoch": 4717} {"train_loss": -7.34839391708374, "global_step": 198150, "epoch": 4717} {"train_loss": -7.25251579284668, "global_step": 198151, "epoch": 4717} {"train_loss": -7.341111660003662, "global_step": 198152, "epoch": 4717} {"train_loss": -7.380123615264893, "global_step": 198153, "epoch": 4717} {"train_loss": -7.360440254211426, "global_step": 198154, "epoch": 4717} {"train_loss": -7.286330756686983, "global_step": 198155, "epoch": 4717, "val_loss": 69879.421875} {"train_loss": -7.278635501861572, "global_step": 198156, "epoch": 4718} {"train_loss": -7.410141468048096, "global_step": 198157, "epoch": 4718} {"train_loss": -7.314178466796875, "global_step": 198158, "epoch": 4718} {"train_loss": -7.259771347045898, "global_step": 198159, "epoch": 4718} {"train_loss": -7.394813060760498, "global_step": 198160, "epoch": 4718} {"train_loss": -7.140933036804199, "global_step": 198161, "epoch": 4718} {"train_loss": -7.312440872192383, "global_step": 198162, "epoch": 4718} {"train_loss": -7.326634883880615, "global_step": 198163, "epoch": 4718} {"train_loss": -7.414422512054443, "global_step": 198164, "epoch": 4718} {"train_loss": -7.355159759521484, "global_step": 198165, "epoch": 4718} {"train_loss": -7.375383377075195, "global_step": 198166, "epoch": 4718} {"train_loss": -7.289240837097168, "global_step": 198167, "epoch": 4718} {"train_loss": -7.261735916137695, "global_step": 198168, "epoch": 4718} {"train_loss": -7.293941497802734, "global_step": 198169, "epoch": 4718} {"train_loss": -7.149002552032471, "global_step": 198170, "epoch": 4718} {"train_loss": -7.2009968757629395, "global_step": 198171, "epoch": 4718} {"train_loss": -7.281642913818359, "global_step": 198172, "epoch": 4718} {"train_loss": -7.194616317749023, "global_step": 198173, "epoch": 4718} {"train_loss": -7.005837440490723, "global_step": 198174, "epoch": 4718} {"train_loss": -7.372627258300781, "global_step": 198175, "epoch": 4718} {"train_loss": -7.267735481262207, "global_step": 198176, "epoch": 4718} {"train_loss": -7.142407417297363, "global_step": 198177, "epoch": 4718} {"train_loss": -7.206443786621094, "global_step": 198178, "epoch": 4718} {"train_loss": -7.23777437210083, "global_step": 198179, "epoch": 4718} {"train_loss": -7.252036094665527, "global_step": 198180, "epoch": 4718} {"train_loss": -7.2203264236450195, "global_step": 198181, "epoch": 4718} {"train_loss": -7.126365661621094, "global_step": 198182, "epoch": 4718} {"train_loss": -7.32253360748291, "global_step": 198183, "epoch": 4718} {"train_loss": -7.126106262207031, "global_step": 198184, "epoch": 4718} {"train_loss": -7.08540153503418, "global_step": 198185, "epoch": 4718} {"train_loss": -7.227262496948242, "global_step": 198186, "epoch": 4718} {"train_loss": -7.254459857940674, "global_step": 198187, "epoch": 4718} {"train_loss": -7.207315444946289, "global_step": 198188, "epoch": 4718} {"train_loss": -7.205121040344238, "global_step": 198189, "epoch": 4718} {"train_loss": -7.317157745361328, "global_step": 198190, "epoch": 4718} {"train_loss": -7.22126579284668, "global_step": 198191, "epoch": 4718} {"train_loss": -7.155929088592529, "global_step": 198192, "epoch": 4718} {"train_loss": -7.1352033615112305, "global_step": 198193, "epoch": 4718} {"train_loss": -7.319371223449707, "global_step": 198194, "epoch": 4718} {"train_loss": -7.157781600952148, "global_step": 198195, "epoch": 4718} {"train_loss": -7.140477180480957, "global_step": 198196, "epoch": 4718} {"train_loss": -7.240821361541748, "global_step": 198197, "epoch": 4718, "val_loss": 69877.4765625} {"train_loss": -7.108677864074707, "global_step": 198198, "epoch": 4719} {"train_loss": -7.225345611572266, "global_step": 198199, "epoch": 4719} {"train_loss": -7.29583215713501, "global_step": 198200, "epoch": 4719} {"train_loss": -7.287627220153809, "global_step": 198201, "epoch": 4719} {"train_loss": -7.273638725280762, "global_step": 198202, "epoch": 4719} {"train_loss": -7.251636505126953, "global_step": 198203, "epoch": 4719} {"train_loss": -7.20510196685791, "global_step": 198204, "epoch": 4719} {"train_loss": -7.2705535888671875, "global_step": 198205, "epoch": 4719} {"train_loss": -7.236084461212158, "global_step": 198206, "epoch": 4719} {"train_loss": -7.352640151977539, "global_step": 198207, "epoch": 4719} {"train_loss": -7.2839884757995605, "global_step": 198208, "epoch": 4719} {"train_loss": -7.206799507141113, "global_step": 198209, "epoch": 4719} {"train_loss": -7.195474624633789, "global_step": 198210, "epoch": 4719} {"train_loss": -7.207409858703613, "global_step": 198211, "epoch": 4719} {"train_loss": -7.319764614105225, "global_step": 198212, "epoch": 4719} {"train_loss": -7.220861434936523, "global_step": 198213, "epoch": 4719} {"train_loss": -7.352189064025879, "global_step": 198214, "epoch": 4719} {"train_loss": -7.187201976776123, "global_step": 198215, "epoch": 4719} {"train_loss": -7.267487525939941, "global_step": 198216, "epoch": 4719} {"train_loss": -7.054588794708252, "global_step": 198217, "epoch": 4719} {"train_loss": -7.052001476287842, "global_step": 198218, "epoch": 4719} {"train_loss": -7.380974769592285, "global_step": 198219, "epoch": 4719} {"train_loss": -7.207870960235596, "global_step": 198220, "epoch": 4719} {"train_loss": -7.117349624633789, "global_step": 198221, "epoch": 4719} {"train_loss": -7.319650173187256, "global_step": 198222, "epoch": 4719} {"train_loss": -7.257443904876709, "global_step": 198223, "epoch": 4719} {"train_loss": -7.292288780212402, "global_step": 198224, "epoch": 4719} {"train_loss": -7.241042613983154, "global_step": 198225, "epoch": 4719} {"train_loss": -7.21331262588501, "global_step": 198226, "epoch": 4719} {"train_loss": -7.20719051361084, "global_step": 198227, "epoch": 4719} {"train_loss": -7.203369140625, "global_step": 198228, "epoch": 4719} {"train_loss": -7.341433048248291, "global_step": 198229, "epoch": 4719} {"train_loss": -7.24334716796875, "global_step": 198230, "epoch": 4719} {"train_loss": -7.238062858581543, "global_step": 198231, "epoch": 4719} {"train_loss": -7.271517753601074, "global_step": 198232, "epoch": 4719} {"train_loss": -7.344155311584473, "global_step": 198233, "epoch": 4719} {"train_loss": -7.280407905578613, "global_step": 198234, "epoch": 4719} {"train_loss": -7.294150352478027, "global_step": 198235, "epoch": 4719} {"train_loss": -7.37537956237793, "global_step": 198236, "epoch": 4719} {"train_loss": -7.289780616760254, "global_step": 198237, "epoch": 4719} {"train_loss": -7.302130699157715, "global_step": 198238, "epoch": 4719} {"train_loss": -7.252234663282122, "global_step": 198239, "epoch": 4719, "val_loss": 69706.5390625} {"train_loss": -7.304508209228516, "global_step": 198240, "epoch": 4720} {"train_loss": -7.221356391906738, "global_step": 198241, "epoch": 4720} {"train_loss": -7.337396621704102, "global_step": 198242, "epoch": 4720} {"train_loss": -7.216178894042969, "global_step": 198243, "epoch": 4720} {"train_loss": -7.445042133331299, "global_step": 198244, "epoch": 4720} {"train_loss": -7.177365303039551, "global_step": 198245, "epoch": 4720} {"train_loss": -7.277261734008789, "global_step": 198246, "epoch": 4720} {"train_loss": -7.232333183288574, "global_step": 198247, "epoch": 4720} {"train_loss": -7.158290863037109, "global_step": 198248, "epoch": 4720} {"train_loss": -7.145975112915039, "global_step": 198249, "epoch": 4720} {"train_loss": -7.125611305236816, "global_step": 198250, "epoch": 4720} {"train_loss": -7.38114070892334, "global_step": 198251, "epoch": 4720} {"train_loss": -7.226037979125977, "global_step": 198252, "epoch": 4720} {"train_loss": -7.1317033767700195, "global_step": 198253, "epoch": 4720} {"train_loss": -7.307809352874756, "global_step": 198254, "epoch": 4720} {"train_loss": -7.299927234649658, "global_step": 198255, "epoch": 4720} {"train_loss": -7.095761299133301, "global_step": 198256, "epoch": 4720} {"train_loss": -7.2597784996032715, "global_step": 198257, "epoch": 4720} {"train_loss": -7.22026252746582, "global_step": 198258, "epoch": 4720} {"train_loss": -7.152320861816406, "global_step": 198259, "epoch": 4720} {"train_loss": -7.116478443145752, "global_step": 198260, "epoch": 4720} {"train_loss": -7.3902482986450195, "global_step": 198261, "epoch": 4720} {"train_loss": -7.009491920471191, "global_step": 198262, "epoch": 4720} {"train_loss": -6.9049577713012695, "global_step": 198263, "epoch": 4720} {"train_loss": -7.2402143478393555, "global_step": 198264, "epoch": 4720} {"train_loss": -7.2194414138793945, "global_step": 198265, "epoch": 4720} {"train_loss": -7.183826923370361, "global_step": 198266, "epoch": 4720} {"train_loss": -7.261909484863281, "global_step": 198267, "epoch": 4720} {"train_loss": -7.181312561035156, "global_step": 198268, "epoch": 4720} {"train_loss": -7.105685234069824, "global_step": 198269, "epoch": 4720} {"train_loss": -7.277148723602295, "global_step": 198270, "epoch": 4720} {"train_loss": -7.334245681762695, "global_step": 198271, "epoch": 4720} {"train_loss": -7.255162239074707, "global_step": 198272, "epoch": 4720} {"train_loss": -7.319181442260742, "global_step": 198273, "epoch": 4720} {"train_loss": -7.219245433807373, "global_step": 198274, "epoch": 4720} {"train_loss": -7.227354049682617, "global_step": 198275, "epoch": 4720} {"train_loss": -7.231409072875977, "global_step": 198276, "epoch": 4720} {"train_loss": -7.312520980834961, "global_step": 198277, "epoch": 4720} {"train_loss": -7.392082691192627, "global_step": 198278, "epoch": 4720} {"train_loss": -7.258268356323242, "global_step": 198279, "epoch": 4720} {"train_loss": -7.314291954040527, "global_step": 198280, "epoch": 4720} {"train_loss": -7.231231451034546, "global_step": 198281, "epoch": 4720, "val_loss": 69849.0859375} {"train_loss": -7.253115653991699, "global_step": 198282, "epoch": 4721} {"train_loss": -7.18840217590332, "global_step": 198283, "epoch": 4721} {"train_loss": -7.264593124389648, "global_step": 198284, "epoch": 4721} {"train_loss": -7.201909065246582, "global_step": 198285, "epoch": 4721} {"train_loss": -7.351046562194824, "global_step": 198286, "epoch": 4721} {"train_loss": -7.348719596862793, "global_step": 198287, "epoch": 4721} {"train_loss": -7.341941833496094, "global_step": 198288, "epoch": 4721} {"train_loss": -7.2461957931518555, "global_step": 198289, "epoch": 4721} {"train_loss": -7.26412296295166, "global_step": 198290, "epoch": 4721} {"train_loss": -7.301888465881348, "global_step": 198291, "epoch": 4721} {"train_loss": -7.186278343200684, "global_step": 198292, "epoch": 4721} {"train_loss": -7.248764991760254, "global_step": 198293, "epoch": 4721} {"train_loss": -7.444817543029785, "global_step": 198294, "epoch": 4721} {"train_loss": -7.271818161010742, "global_step": 198295, "epoch": 4721} {"train_loss": -7.338825225830078, "global_step": 198296, "epoch": 4721} {"train_loss": -7.261297225952148, "global_step": 198297, "epoch": 4721} {"train_loss": -7.2694292068481445, "global_step": 198298, "epoch": 4721} {"train_loss": -7.268058776855469, "global_step": 198299, "epoch": 4721} {"train_loss": -7.3004889488220215, "global_step": 198300, "epoch": 4721} {"train_loss": -7.249680519104004, "global_step": 198301, "epoch": 4721} {"train_loss": -7.225835800170898, "global_step": 198302, "epoch": 4721} {"train_loss": -7.2919816970825195, "global_step": 198303, "epoch": 4721} {"train_loss": -7.267156600952148, "global_step": 198304, "epoch": 4721} {"train_loss": -7.269827842712402, "global_step": 198305, "epoch": 4721} {"train_loss": -7.3648529052734375, "global_step": 198306, "epoch": 4721} {"train_loss": -7.325679779052734, "global_step": 198307, "epoch": 4721} {"train_loss": -7.144681930541992, "global_step": 198308, "epoch": 4721} {"train_loss": -7.298740386962891, "global_step": 198309, "epoch": 4721} {"train_loss": -7.2458391189575195, "global_step": 198310, "epoch": 4721} {"train_loss": -7.185179710388184, "global_step": 198311, "epoch": 4721} {"train_loss": -7.132524490356445, "global_step": 198312, "epoch": 4721} {"train_loss": -7.240241050720215, "global_step": 198313, "epoch": 4721} {"train_loss": -7.189781188964844, "global_step": 198314, "epoch": 4721} {"train_loss": -7.1480207443237305, "global_step": 198315, "epoch": 4721} {"train_loss": -7.2017502784729, "global_step": 198316, "epoch": 4721} {"train_loss": -7.31467866897583, "global_step": 198317, "epoch": 4721} {"train_loss": -7.14962911605835, "global_step": 198318, "epoch": 4721} {"train_loss": -7.258120536804199, "global_step": 198319, "epoch": 4721} {"train_loss": -7.106086730957031, "global_step": 198320, "epoch": 4721} {"train_loss": -7.239330291748047, "global_step": 198321, "epoch": 4721} {"train_loss": -7.274827003479004, "global_step": 198322, "epoch": 4721} {"train_loss": -7.254515205110822, "global_step": 198323, "epoch": 4721, "val_loss": 70003.46875} {"train_loss": -7.212247848510742, "global_step": 198324, "epoch": 4722} {"train_loss": -7.2705206871032715, "global_step": 198325, "epoch": 4722} {"train_loss": -7.138162136077881, "global_step": 198326, "epoch": 4722} {"train_loss": -7.185325622558594, "global_step": 198327, "epoch": 4722} {"train_loss": -7.139285087585449, "global_step": 198328, "epoch": 4722} {"train_loss": -7.152944087982178, "global_step": 198329, "epoch": 4722} {"train_loss": -7.137151718139648, "global_step": 198330, "epoch": 4722} {"train_loss": -7.252302169799805, "global_step": 198331, "epoch": 4722} {"train_loss": -7.238455772399902, "global_step": 198332, "epoch": 4722} {"train_loss": -7.223141670227051, "global_step": 198333, "epoch": 4722} {"train_loss": -7.249984264373779, "global_step": 198334, "epoch": 4722} {"train_loss": -7.262726783752441, "global_step": 198335, "epoch": 4722} {"train_loss": -7.2963714599609375, "global_step": 198336, "epoch": 4722} {"train_loss": -7.26801061630249, "global_step": 198337, "epoch": 4722} {"train_loss": -7.205557346343994, "global_step": 198338, "epoch": 4722} {"train_loss": -7.152287483215332, "global_step": 198339, "epoch": 4722} {"train_loss": -7.274101734161377, "global_step": 198340, "epoch": 4722} {"train_loss": -7.270374298095703, "global_step": 198341, "epoch": 4722} {"train_loss": -7.249131202697754, "global_step": 198342, "epoch": 4722} {"train_loss": -7.162108421325684, "global_step": 198343, "epoch": 4722} {"train_loss": -7.263697624206543, "global_step": 198344, "epoch": 4722} {"train_loss": -7.22741174697876, "global_step": 198345, "epoch": 4722} {"train_loss": -7.106654167175293, "global_step": 198346, "epoch": 4722} {"train_loss": -7.170585632324219, "global_step": 198347, "epoch": 4722} {"train_loss": -7.312359809875488, "global_step": 198348, "epoch": 4722} {"train_loss": -7.3046770095825195, "global_step": 198349, "epoch": 4722} {"train_loss": -7.130086898803711, "global_step": 198350, "epoch": 4722} {"train_loss": -7.135993957519531, "global_step": 198351, "epoch": 4722} {"train_loss": -7.244658470153809, "global_step": 198352, "epoch": 4722} {"train_loss": -7.249297618865967, "global_step": 198353, "epoch": 4722} {"train_loss": -7.283139228820801, "global_step": 198354, "epoch": 4722} {"train_loss": -7.2791242599487305, "global_step": 198355, "epoch": 4722} {"train_loss": -7.282464504241943, "global_step": 198356, "epoch": 4722} {"train_loss": -7.206230163574219, "global_step": 198357, "epoch": 4722} {"train_loss": -7.25515079498291, "global_step": 198358, "epoch": 4722} {"train_loss": -7.299681663513184, "global_step": 198359, "epoch": 4722} {"train_loss": -7.288735389709473, "global_step": 198360, "epoch": 4722} {"train_loss": -7.271839618682861, "global_step": 198361, "epoch": 4722} {"train_loss": -7.244204521179199, "global_step": 198362, "epoch": 4722} {"train_loss": -7.0472564697265625, "global_step": 198363, "epoch": 4722} {"train_loss": -7.254281044006348, "global_step": 198364, "epoch": 4722} {"train_loss": -7.225355273201352, "global_step": 198365, "epoch": 4722, "val_loss": 69916.578125} {"train_loss": -7.222774505615234, "global_step": 198366, "epoch": 4723} {"train_loss": -7.17631721496582, "global_step": 198367, "epoch": 4723} {"train_loss": -7.283536911010742, "global_step": 198368, "epoch": 4723} {"train_loss": -7.177642822265625, "global_step": 198369, "epoch": 4723} {"train_loss": -7.237604141235352, "global_step": 198370, "epoch": 4723} {"train_loss": -7.246328353881836, "global_step": 198371, "epoch": 4723} {"train_loss": -7.242384910583496, "global_step": 198372, "epoch": 4723} {"train_loss": -7.267746925354004, "global_step": 198373, "epoch": 4723} {"train_loss": -7.226123809814453, "global_step": 198374, "epoch": 4723} {"train_loss": -7.176069259643555, "global_step": 198375, "epoch": 4723} {"train_loss": -7.091939449310303, "global_step": 198376, "epoch": 4723} {"train_loss": -7.1400651931762695, "global_step": 198377, "epoch": 4723} {"train_loss": -7.232709884643555, "global_step": 198378, "epoch": 4723} {"train_loss": -7.304411888122559, "global_step": 198379, "epoch": 4723} {"train_loss": -7.283758640289307, "global_step": 198380, "epoch": 4723} {"train_loss": -7.172931671142578, "global_step": 198381, "epoch": 4723} {"train_loss": -7.329793930053711, "global_step": 198382, "epoch": 4723} {"train_loss": -7.3000688552856445, "global_step": 198383, "epoch": 4723} {"train_loss": -7.315611839294434, "global_step": 198384, "epoch": 4723} {"train_loss": -7.298896789550781, "global_step": 198385, "epoch": 4723} {"train_loss": -7.249345302581787, "global_step": 198386, "epoch": 4723} {"train_loss": -7.322741985321045, "global_step": 198387, "epoch": 4723} {"train_loss": -7.191373825073242, "global_step": 198388, "epoch": 4723} {"train_loss": -7.091162204742432, "global_step": 198389, "epoch": 4723} {"train_loss": -7.161452293395996, "global_step": 198390, "epoch": 4723} {"train_loss": -7.250239849090576, "global_step": 198391, "epoch": 4723} {"train_loss": -7.207052230834961, "global_step": 198392, "epoch": 4723} {"train_loss": -7.103701114654541, "global_step": 198393, "epoch": 4723} {"train_loss": -7.130317687988281, "global_step": 198394, "epoch": 4723} {"train_loss": -7.247027397155762, "global_step": 198395, "epoch": 4723} {"train_loss": -7.205466270446777, "global_step": 198396, "epoch": 4723} {"train_loss": -7.3017354011535645, "global_step": 198397, "epoch": 4723} {"train_loss": -7.28225040435791, "global_step": 198398, "epoch": 4723} {"train_loss": -7.2529144287109375, "global_step": 198399, "epoch": 4723} {"train_loss": -7.374310493469238, "global_step": 198400, "epoch": 4723} {"train_loss": -7.133989334106445, "global_step": 198401, "epoch": 4723} {"train_loss": -7.223812103271484, "global_step": 198402, "epoch": 4723} {"train_loss": -7.217422962188721, "global_step": 198403, "epoch": 4723} {"train_loss": -7.265106678009033, "global_step": 198404, "epoch": 4723} {"train_loss": -7.33048152923584, "global_step": 198405, "epoch": 4723} {"train_loss": -7.097965717315674, "global_step": 198406, "epoch": 4723} {"train_loss": -7.228926681336903, "global_step": 198407, "epoch": 4723, "val_loss": 69946.625} {"train_loss": -7.243026256561279, "global_step": 198408, "epoch": 4724} {"train_loss": -7.174336910247803, "global_step": 198409, "epoch": 4724} {"train_loss": -7.27849006652832, "global_step": 198410, "epoch": 4724} {"train_loss": -7.140954971313477, "global_step": 198411, "epoch": 4724} {"train_loss": -7.232901573181152, "global_step": 198412, "epoch": 4724} {"train_loss": -7.086092948913574, "global_step": 198413, "epoch": 4724} {"train_loss": -7.11646842956543, "global_step": 198414, "epoch": 4724} {"train_loss": -7.02146053314209, "global_step": 198415, "epoch": 4724} {"train_loss": -7.081945419311523, "global_step": 198416, "epoch": 4724} {"train_loss": -7.057992935180664, "global_step": 198417, "epoch": 4724} {"train_loss": -6.979330062866211, "global_step": 198418, "epoch": 4724} {"train_loss": -7.089800834655762, "global_step": 198419, "epoch": 4724} {"train_loss": -7.12025260925293, "global_step": 198420, "epoch": 4724} {"train_loss": -7.085114479064941, "global_step": 198421, "epoch": 4724} {"train_loss": -7.117961883544922, "global_step": 198422, "epoch": 4724} {"train_loss": -6.950943946838379, "global_step": 198423, "epoch": 4724} {"train_loss": -7.146467208862305, "global_step": 198424, "epoch": 4724} {"train_loss": -7.038449764251709, "global_step": 198425, "epoch": 4724} {"train_loss": -7.184101104736328, "global_step": 198426, "epoch": 4724} {"train_loss": -7.182065010070801, "global_step": 198427, "epoch": 4724} {"train_loss": -7.227998733520508, "global_step": 198428, "epoch": 4724} {"train_loss": -7.110767364501953, "global_step": 198429, "epoch": 4724} {"train_loss": -7.1036152839660645, "global_step": 198430, "epoch": 4724} {"train_loss": -7.099174499511719, "global_step": 198431, "epoch": 4724} {"train_loss": -7.151644229888916, "global_step": 198432, "epoch": 4724} {"train_loss": -7.07478666305542, "global_step": 198433, "epoch": 4724} {"train_loss": -7.171464920043945, "global_step": 198434, "epoch": 4724} {"train_loss": -7.151823997497559, "global_step": 198435, "epoch": 4724} {"train_loss": -7.159099578857422, "global_step": 198436, "epoch": 4724} {"train_loss": -7.27951717376709, "global_step": 198437, "epoch": 4724} {"train_loss": -7.237947940826416, "global_step": 198438, "epoch": 4724} {"train_loss": -7.223957061767578, "global_step": 198439, "epoch": 4724} {"train_loss": -7.226264476776123, "global_step": 198440, "epoch": 4724} {"train_loss": -7.143080711364746, "global_step": 198441, "epoch": 4724} {"train_loss": -7.316592216491699, "global_step": 198442, "epoch": 4724} {"train_loss": -7.107296466827393, "global_step": 198443, "epoch": 4724} {"train_loss": -7.219287872314453, "global_step": 198444, "epoch": 4724} {"train_loss": -7.268402099609375, "global_step": 198445, "epoch": 4724} {"train_loss": -7.100411415100098, "global_step": 198446, "epoch": 4724} {"train_loss": -7.120150566101074, "global_step": 198447, "epoch": 4724} {"train_loss": -7.0526323318481445, "global_step": 198448, "epoch": 4724} {"train_loss": -7.148790881747291, "global_step": 198449, "epoch": 4724, "val_loss": 69854.390625} {"train_loss": -7.178074836730957, "global_step": 198450, "epoch": 4725} {"train_loss": -7.313882350921631, "global_step": 198451, "epoch": 4725} {"train_loss": -7.296046733856201, "global_step": 198452, "epoch": 4725} {"train_loss": -7.334871292114258, "global_step": 198453, "epoch": 4725} {"train_loss": -7.3293256759643555, "global_step": 198454, "epoch": 4725} {"train_loss": -7.163937568664551, "global_step": 198455, "epoch": 4725} {"train_loss": -7.312501430511475, "global_step": 198456, "epoch": 4725} {"train_loss": -7.316708564758301, "global_step": 198457, "epoch": 4725} {"train_loss": -7.265530109405518, "global_step": 198458, "epoch": 4725} {"train_loss": -7.327031135559082, "global_step": 198459, "epoch": 4725} {"train_loss": -7.200328826904297, "global_step": 198460, "epoch": 4725} {"train_loss": -7.190860748291016, "global_step": 198461, "epoch": 4725} {"train_loss": -7.176755905151367, "global_step": 198462, "epoch": 4725} {"train_loss": -7.211292743682861, "global_step": 198463, "epoch": 4725} {"train_loss": -7.359013080596924, "global_step": 198464, "epoch": 4725} {"train_loss": -7.274937629699707, "global_step": 198465, "epoch": 4725} {"train_loss": -7.325124740600586, "global_step": 198466, "epoch": 4725} {"train_loss": -7.306316375732422, "global_step": 198467, "epoch": 4725} {"train_loss": -7.227843284606934, "global_step": 198468, "epoch": 4725} {"train_loss": -7.3756608963012695, "global_step": 198469, "epoch": 4725} {"train_loss": -7.267828941345215, "global_step": 198470, "epoch": 4725} {"train_loss": -7.413585662841797, "global_step": 198471, "epoch": 4725} {"train_loss": -7.423710823059082, "global_step": 198472, "epoch": 4725} {"train_loss": -7.295682907104492, "global_step": 198473, "epoch": 4725} {"train_loss": -7.323040962219238, "global_step": 198474, "epoch": 4725} {"train_loss": -7.308145523071289, "global_step": 198475, "epoch": 4725} {"train_loss": -7.3566484451293945, "global_step": 198476, "epoch": 4725} {"train_loss": -7.293107032775879, "global_step": 198477, "epoch": 4725} {"train_loss": -7.442424297332764, "global_step": 198478, "epoch": 4725} {"train_loss": -7.386356353759766, "global_step": 198479, "epoch": 4725} {"train_loss": -7.338187217712402, "global_step": 198480, "epoch": 4725} {"train_loss": -7.339637756347656, "global_step": 198481, "epoch": 4725} {"train_loss": -7.2468671798706055, "global_step": 198482, "epoch": 4725} {"train_loss": -7.205747604370117, "global_step": 198483, "epoch": 4725} {"train_loss": -7.245034694671631, "global_step": 198484, "epoch": 4725} {"train_loss": -7.2655744552612305, "global_step": 198485, "epoch": 4725} {"train_loss": -7.306464195251465, "global_step": 198486, "epoch": 4725} {"train_loss": -7.22592306137085, "global_step": 198487, "epoch": 4725} {"train_loss": -7.299683570861816, "global_step": 198488, "epoch": 4725} {"train_loss": -7.2551374435424805, "global_step": 198489, "epoch": 4725} {"train_loss": -7.182278633117676, "global_step": 198490, "epoch": 4725} {"train_loss": -7.288177615120297, "global_step": 198491, "epoch": 4725, "val_loss": 69949.234375} {"train_loss": -7.219790458679199, "global_step": 198492, "epoch": 4726} {"train_loss": -7.024144172668457, "global_step": 198493, "epoch": 4726} {"train_loss": -7.105907440185547, "global_step": 198494, "epoch": 4726} {"train_loss": -7.235538482666016, "global_step": 198495, "epoch": 4726} {"train_loss": -7.046979904174805, "global_step": 198496, "epoch": 4726} {"train_loss": -7.204502105712891, "global_step": 198497, "epoch": 4726} {"train_loss": -7.299429893493652, "global_step": 198498, "epoch": 4726} {"train_loss": -7.1395368576049805, "global_step": 198499, "epoch": 4726} {"train_loss": -7.26776123046875, "global_step": 198500, "epoch": 4726} {"train_loss": -7.223973274230957, "global_step": 198501, "epoch": 4726} {"train_loss": -7.135147571563721, "global_step": 198502, "epoch": 4726} {"train_loss": -7.157739639282227, "global_step": 198503, "epoch": 4726} {"train_loss": -7.195688247680664, "global_step": 198504, "epoch": 4726} {"train_loss": -7.229150772094727, "global_step": 198505, "epoch": 4726} {"train_loss": -7.197116374969482, "global_step": 198506, "epoch": 4726} {"train_loss": -7.293617248535156, "global_step": 198507, "epoch": 4726} {"train_loss": -7.299895286560059, "global_step": 198508, "epoch": 4726} {"train_loss": -7.249582767486572, "global_step": 198509, "epoch": 4726} {"train_loss": -7.2187347412109375, "global_step": 198510, "epoch": 4726} {"train_loss": -7.275126934051514, "global_step": 198511, "epoch": 4726} {"train_loss": -7.282021999359131, "global_step": 198512, "epoch": 4726} {"train_loss": -7.172021389007568, "global_step": 198513, "epoch": 4726} {"train_loss": -7.185056686401367, "global_step": 198514, "epoch": 4726} {"train_loss": -7.352597236633301, "global_step": 198515, "epoch": 4726} {"train_loss": -7.24239444732666, "global_step": 198516, "epoch": 4726} {"train_loss": -7.249697685241699, "global_step": 198517, "epoch": 4726} {"train_loss": -7.327449798583984, "global_step": 198518, "epoch": 4726} {"train_loss": -7.363969802856445, "global_step": 198519, "epoch": 4726} {"train_loss": -7.1839280128479, "global_step": 198520, "epoch": 4726} {"train_loss": -7.274314880371094, "global_step": 198521, "epoch": 4726} {"train_loss": -7.270420074462891, "global_step": 198522, "epoch": 4726} {"train_loss": -7.281472682952881, "global_step": 198523, "epoch": 4726} {"train_loss": -7.248833656311035, "global_step": 198524, "epoch": 4726} {"train_loss": -7.26060676574707, "global_step": 198525, "epoch": 4726} {"train_loss": -7.281228065490723, "global_step": 198526, "epoch": 4726} {"train_loss": -7.248557090759277, "global_step": 198527, "epoch": 4726} {"train_loss": -7.280539512634277, "global_step": 198528, "epoch": 4726} {"train_loss": -7.264702320098877, "global_step": 198529, "epoch": 4726} {"train_loss": -7.108989715576172, "global_step": 198530, "epoch": 4726} {"train_loss": -7.262564182281494, "global_step": 198531, "epoch": 4726} {"train_loss": -7.227696418762207, "global_step": 198532, "epoch": 4726} {"train_loss": -7.2304257324763705, "global_step": 198533, "epoch": 4726, "val_loss": 69809.171875} {"train_loss": -7.274432182312012, "global_step": 198534, "epoch": 4727} {"train_loss": -7.246164321899414, "global_step": 198535, "epoch": 4727} {"train_loss": -7.2556562423706055, "global_step": 198536, "epoch": 4727} {"train_loss": -7.243145942687988, "global_step": 198537, "epoch": 4727} {"train_loss": -7.27293062210083, "global_step": 198538, "epoch": 4727} {"train_loss": -7.262041091918945, "global_step": 198539, "epoch": 4727} {"train_loss": -7.258932113647461, "global_step": 198540, "epoch": 4727} {"train_loss": -7.294867992401123, "global_step": 198541, "epoch": 4727} {"train_loss": -7.239702224731445, "global_step": 198542, "epoch": 4727} {"train_loss": -7.307197570800781, "global_step": 198543, "epoch": 4727} {"train_loss": -7.250802993774414, "global_step": 198544, "epoch": 4727} {"train_loss": -7.244174957275391, "global_step": 198545, "epoch": 4727} {"train_loss": -7.27830696105957, "global_step": 198546, "epoch": 4727} {"train_loss": -7.184046745300293, "global_step": 198547, "epoch": 4727} {"train_loss": -7.260685920715332, "global_step": 198548, "epoch": 4727} {"train_loss": -7.246478080749512, "global_step": 198549, "epoch": 4727} {"train_loss": -7.27137565612793, "global_step": 198550, "epoch": 4727} {"train_loss": -7.339591026306152, "global_step": 198551, "epoch": 4727} {"train_loss": -7.202181339263916, "global_step": 198552, "epoch": 4727} {"train_loss": -7.194178581237793, "global_step": 198553, "epoch": 4727} {"train_loss": -7.214582443237305, "global_step": 198554, "epoch": 4727} {"train_loss": -7.3028244972229, "global_step": 198555, "epoch": 4727} {"train_loss": -7.270381927490234, "global_step": 198556, "epoch": 4727} {"train_loss": -7.205509662628174, "global_step": 198557, "epoch": 4727} {"train_loss": -7.292281150817871, "global_step": 198558, "epoch": 4727} {"train_loss": -7.223875999450684, "global_step": 198559, "epoch": 4727} {"train_loss": -7.372598648071289, "global_step": 198560, "epoch": 4727} {"train_loss": -7.258098602294922, "global_step": 198561, "epoch": 4727} {"train_loss": -7.240121841430664, "global_step": 198562, "epoch": 4727} {"train_loss": -7.301397323608398, "global_step": 198563, "epoch": 4727} {"train_loss": -7.294901371002197, "global_step": 198564, "epoch": 4727} {"train_loss": -7.228371620178223, "global_step": 198565, "epoch": 4727} {"train_loss": -7.396027088165283, "global_step": 198566, "epoch": 4727} {"train_loss": -7.141105651855469, "global_step": 198567, "epoch": 4727} {"train_loss": -7.29701042175293, "global_step": 198568, "epoch": 4727} {"train_loss": -7.2689619064331055, "global_step": 198569, "epoch": 4727} {"train_loss": -7.350024700164795, "global_step": 198570, "epoch": 4727} {"train_loss": -7.345917701721191, "global_step": 198571, "epoch": 4727} {"train_loss": -7.2518792152404785, "global_step": 198572, "epoch": 4727} {"train_loss": -7.37410306930542, "global_step": 198573, "epoch": 4727} {"train_loss": -7.213724613189697, "global_step": 198574, "epoch": 4727} {"train_loss": -7.268881116594587, "global_step": 198575, "epoch": 4727, "val_loss": 69910.8203125} {"train_loss": -7.301481246948242, "global_step": 198576, "epoch": 4728} {"train_loss": -7.260991096496582, "global_step": 198577, "epoch": 4728} {"train_loss": -7.2118330001831055, "global_step": 198578, "epoch": 4728} {"train_loss": -7.10590934753418, "global_step": 198579, "epoch": 4728} {"train_loss": -7.169008255004883, "global_step": 198580, "epoch": 4728} {"train_loss": -7.161924839019775, "global_step": 198581, "epoch": 4728} {"train_loss": -7.274235248565674, "global_step": 198582, "epoch": 4728} {"train_loss": -7.240896224975586, "global_step": 198583, "epoch": 4728} {"train_loss": -7.2548136711120605, "global_step": 198584, "epoch": 4728} {"train_loss": -7.138247489929199, "global_step": 198585, "epoch": 4728} {"train_loss": -7.236542701721191, "global_step": 198586, "epoch": 4728} {"train_loss": -7.244322776794434, "global_step": 198587, "epoch": 4728} {"train_loss": -7.106899261474609, "global_step": 198588, "epoch": 4728} {"train_loss": -7.088936805725098, "global_step": 198589, "epoch": 4728} {"train_loss": -7.168464660644531, "global_step": 198590, "epoch": 4728} {"train_loss": -7.2221479415893555, "global_step": 198591, "epoch": 4728} {"train_loss": -7.23638391494751, "global_step": 198592, "epoch": 4728} {"train_loss": -7.127615928649902, "global_step": 198593, "epoch": 4728} {"train_loss": -7.201397895812988, "global_step": 198594, "epoch": 4728} {"train_loss": -7.2241058349609375, "global_step": 198595, "epoch": 4728} {"train_loss": -7.2422027587890625, "global_step": 198596, "epoch": 4728} {"train_loss": -7.2244977951049805, "global_step": 198597, "epoch": 4728} {"train_loss": -7.304283142089844, "global_step": 198598, "epoch": 4728} {"train_loss": -7.24492883682251, "global_step": 198599, "epoch": 4728} {"train_loss": -7.1897430419921875, "global_step": 198600, "epoch": 4728} {"train_loss": -7.230482578277588, "global_step": 198601, "epoch": 4728} {"train_loss": -7.329680442810059, "global_step": 198602, "epoch": 4728} {"train_loss": -7.277463436126709, "global_step": 198603, "epoch": 4728} {"train_loss": -7.315110683441162, "global_step": 198604, "epoch": 4728} {"train_loss": -7.313909530639648, "global_step": 198605, "epoch": 4728} {"train_loss": -7.2554755210876465, "global_step": 198606, "epoch": 4728} {"train_loss": -7.3110246658325195, "global_step": 198607, "epoch": 4728} {"train_loss": -7.2204461097717285, "global_step": 198608, "epoch": 4728} {"train_loss": -7.2534499168396, "global_step": 198609, "epoch": 4728} {"train_loss": -7.2621259689331055, "global_step": 198610, "epoch": 4728} {"train_loss": -7.196493148803711, "global_step": 198611, "epoch": 4728} {"train_loss": -7.262274265289307, "global_step": 198612, "epoch": 4728} {"train_loss": -7.189507484436035, "global_step": 198613, "epoch": 4728} {"train_loss": -7.201566696166992, "global_step": 198614, "epoch": 4728} {"train_loss": -7.151649475097656, "global_step": 198615, "epoch": 4728} {"train_loss": -7.3292436599731445, "global_step": 198616, "epoch": 4728} {"train_loss": -7.22681873185294, "global_step": 198617, "epoch": 4728, "val_loss": 69923.421875} {"train_loss": -7.241302013397217, "global_step": 198618, "epoch": 4729} {"train_loss": -7.2004475593566895, "global_step": 198619, "epoch": 4729} {"train_loss": -7.224448204040527, "global_step": 198620, "epoch": 4729} {"train_loss": -7.2220916748046875, "global_step": 198621, "epoch": 4729} {"train_loss": -7.34848165512085, "global_step": 198622, "epoch": 4729} {"train_loss": -7.277944087982178, "global_step": 198623, "epoch": 4729} {"train_loss": -7.186151504516602, "global_step": 198624, "epoch": 4729} {"train_loss": -7.217358112335205, "global_step": 198625, "epoch": 4729} {"train_loss": -7.255422592163086, "global_step": 198626, "epoch": 4729} {"train_loss": -7.329489707946777, "global_step": 198627, "epoch": 4729} {"train_loss": -7.2209625244140625, "global_step": 198628, "epoch": 4729} {"train_loss": -7.235124588012695, "global_step": 198629, "epoch": 4729} {"train_loss": -7.281038284301758, "global_step": 198630, "epoch": 4729} {"train_loss": -7.229984760284424, "global_step": 198631, "epoch": 4729} {"train_loss": -7.315363883972168, "global_step": 198632, "epoch": 4729} {"train_loss": -7.2259440422058105, "global_step": 198633, "epoch": 4729} {"train_loss": -7.292253494262695, "global_step": 198634, "epoch": 4729} {"train_loss": -7.283989906311035, "global_step": 198635, "epoch": 4729} {"train_loss": -7.234528541564941, "global_step": 198636, "epoch": 4729} {"train_loss": -7.21282958984375, "global_step": 198637, "epoch": 4729} {"train_loss": -7.231361389160156, "global_step": 198638, "epoch": 4729} {"train_loss": -7.311172962188721, "global_step": 198639, "epoch": 4729} {"train_loss": -7.266539573669434, "global_step": 198640, "epoch": 4729} {"train_loss": -7.070394515991211, "global_step": 198641, "epoch": 4729} {"train_loss": -7.305200576782227, "global_step": 198642, "epoch": 4729} {"train_loss": -7.167287826538086, "global_step": 198643, "epoch": 4729} {"train_loss": -7.146716117858887, "global_step": 198644, "epoch": 4729} {"train_loss": -7.179457187652588, "global_step": 198645, "epoch": 4729} {"train_loss": -7.101479530334473, "global_step": 198646, "epoch": 4729} {"train_loss": -7.253940105438232, "global_step": 198647, "epoch": 4729} {"train_loss": -7.172076225280762, "global_step": 198648, "epoch": 4729} {"train_loss": -7.163987636566162, "global_step": 198649, "epoch": 4729} {"train_loss": -7.141793251037598, "global_step": 198650, "epoch": 4729} {"train_loss": -7.133871078491211, "global_step": 198651, "epoch": 4729} {"train_loss": -7.135367393493652, "global_step": 198652, "epoch": 4729} {"train_loss": -7.261678695678711, "global_step": 198653, "epoch": 4729} {"train_loss": -7.180319786071777, "global_step": 198654, "epoch": 4729} {"train_loss": -7.134876251220703, "global_step": 198655, "epoch": 4729} {"train_loss": -7.246590614318848, "global_step": 198656, "epoch": 4729} {"train_loss": -7.226497173309326, "global_step": 198657, "epoch": 4729} {"train_loss": -7.156826496124268, "global_step": 198658, "epoch": 4729} {"train_loss": -7.221931900296893, "global_step": 198659, "epoch": 4729, "val_loss": 70082.1484375} {"train_loss": -7.140518665313721, "global_step": 198660, "epoch": 4730} {"train_loss": -7.0727128982543945, "global_step": 198661, "epoch": 4730} {"train_loss": -7.3498101234436035, "global_step": 198662, "epoch": 4730} {"train_loss": -7.214953899383545, "global_step": 198663, "epoch": 4730} {"train_loss": -7.266273498535156, "global_step": 198664, "epoch": 4730} {"train_loss": -7.14781379699707, "global_step": 198665, "epoch": 4730} {"train_loss": -7.2253265380859375, "global_step": 198666, "epoch": 4730} {"train_loss": -7.230128288269043, "global_step": 198667, "epoch": 4730} {"train_loss": -7.179553031921387, "global_step": 198668, "epoch": 4730} {"train_loss": -7.189448833465576, "global_step": 198669, "epoch": 4730} {"train_loss": -7.272489070892334, "global_step": 198670, "epoch": 4730} {"train_loss": -7.176853179931641, "global_step": 198671, "epoch": 4730} {"train_loss": -7.234982013702393, "global_step": 198672, "epoch": 4730} {"train_loss": -7.23664665222168, "global_step": 198673, "epoch": 4730} {"train_loss": -7.325562000274658, "global_step": 198674, "epoch": 4730} {"train_loss": -7.290030479431152, "global_step": 198675, "epoch": 4730} {"train_loss": -7.260782241821289, "global_step": 198676, "epoch": 4730} {"train_loss": -7.136709690093994, "global_step": 198677, "epoch": 4730} {"train_loss": -7.372829437255859, "global_step": 198678, "epoch": 4730} {"train_loss": -7.317592620849609, "global_step": 198679, "epoch": 4730} {"train_loss": -7.316465377807617, "global_step": 198680, "epoch": 4730} {"train_loss": -7.4523115158081055, "global_step": 198681, "epoch": 4730} {"train_loss": -7.3087544441223145, "global_step": 198682, "epoch": 4730} {"train_loss": -7.2978620529174805, "global_step": 198683, "epoch": 4730} {"train_loss": -7.251673221588135, "global_step": 198684, "epoch": 4730} {"train_loss": -7.355127334594727, "global_step": 198685, "epoch": 4730} {"train_loss": -7.4123358726501465, "global_step": 198686, "epoch": 4730} {"train_loss": -7.3336615562438965, "global_step": 198687, "epoch": 4730} {"train_loss": -7.22429084777832, "global_step": 198688, "epoch": 4730} {"train_loss": -7.405147552490234, "global_step": 198689, "epoch": 4730} {"train_loss": -7.372218132019043, "global_step": 198690, "epoch": 4730} {"train_loss": -7.385954856872559, "global_step": 198691, "epoch": 4730} {"train_loss": -7.288929462432861, "global_step": 198692, "epoch": 4730} {"train_loss": -7.225595951080322, "global_step": 198693, "epoch": 4730} {"train_loss": -7.276140213012695, "global_step": 198694, "epoch": 4730} {"train_loss": -7.385781288146973, "global_step": 198695, "epoch": 4730} {"train_loss": -7.32277250289917, "global_step": 198696, "epoch": 4730} {"train_loss": -7.388577938079834, "global_step": 198697, "epoch": 4730} {"train_loss": -7.368827819824219, "global_step": 198698, "epoch": 4730} {"train_loss": -7.2410054206848145, "global_step": 198699, "epoch": 4730} {"train_loss": -7.3979573249816895, "global_step": 198700, "epoch": 4730} {"train_loss": -7.286048139844622, "global_step": 198701, "epoch": 4730, "val_loss": 69994.140625} {"train_loss": -7.260367393493652, "global_step": 198702, "epoch": 4731} {"train_loss": -7.329529762268066, "global_step": 198703, "epoch": 4731} {"train_loss": -7.288636207580566, "global_step": 198704, "epoch": 4731} {"train_loss": -7.291256904602051, "global_step": 198705, "epoch": 4731} {"train_loss": -7.35733699798584, "global_step": 198706, "epoch": 4731} {"train_loss": -7.469995498657227, "global_step": 198707, "epoch": 4731} {"train_loss": -7.130934715270996, "global_step": 198708, "epoch": 4731} {"train_loss": -6.963392734527588, "global_step": 198709, "epoch": 4731} {"train_loss": -7.184294700622559, "global_step": 198710, "epoch": 4731} {"train_loss": -7.379461288452148, "global_step": 198711, "epoch": 4731} {"train_loss": -7.234154224395752, "global_step": 198712, "epoch": 4731} {"train_loss": -7.212441444396973, "global_step": 198713, "epoch": 4731} {"train_loss": -7.181865692138672, "global_step": 198714, "epoch": 4731} {"train_loss": -7.225709438323975, "global_step": 198715, "epoch": 4731} {"train_loss": -7.379532814025879, "global_step": 198716, "epoch": 4731} {"train_loss": -7.368568420410156, "global_step": 198717, "epoch": 4731} {"train_loss": -7.347369194030762, "global_step": 198718, "epoch": 4731} {"train_loss": -7.353108882904053, "global_step": 198719, "epoch": 4731} {"train_loss": -7.259438991546631, "global_step": 198720, "epoch": 4731} {"train_loss": -7.339331150054932, "global_step": 198721, "epoch": 4731} {"train_loss": -7.252396583557129, "global_step": 198722, "epoch": 4731} {"train_loss": -7.320894241333008, "global_step": 198723, "epoch": 4731} {"train_loss": -7.330583572387695, "global_step": 198724, "epoch": 4731} {"train_loss": -7.1408843994140625, "global_step": 198725, "epoch": 4731} {"train_loss": -7.304703235626221, "global_step": 198726, "epoch": 4731} {"train_loss": -7.361847877502441, "global_step": 198727, "epoch": 4731} {"train_loss": -7.227704048156738, "global_step": 198728, "epoch": 4731} {"train_loss": -7.253171920776367, "global_step": 198729, "epoch": 4731} {"train_loss": -7.153836250305176, "global_step": 198730, "epoch": 4731} {"train_loss": -7.198616027832031, "global_step": 198731, "epoch": 4731} {"train_loss": -7.253550052642822, "global_step": 198732, "epoch": 4731} {"train_loss": -7.129488945007324, "global_step": 198733, "epoch": 4731} {"train_loss": -7.397932052612305, "global_step": 198734, "epoch": 4731} {"train_loss": -7.162374019622803, "global_step": 198735, "epoch": 4731} {"train_loss": -7.259852409362793, "global_step": 198736, "epoch": 4731} {"train_loss": -7.086447715759277, "global_step": 198737, "epoch": 4731} {"train_loss": -7.2274651527404785, "global_step": 198738, "epoch": 4731} {"train_loss": -7.253997325897217, "global_step": 198739, "epoch": 4731} {"train_loss": -7.183838844299316, "global_step": 198740, "epoch": 4731} {"train_loss": -7.212088584899902, "global_step": 198741, "epoch": 4731} {"train_loss": -7.246134281158447, "global_step": 198742, "epoch": 4731} {"train_loss": -7.253183853058588, "global_step": 198743, "epoch": 4731, "val_loss": 69827.1484375} {"train_loss": -7.156158447265625, "global_step": 198744, "epoch": 4732} {"train_loss": -7.201754570007324, "global_step": 198745, "epoch": 4732} {"train_loss": -7.115233898162842, "global_step": 198746, "epoch": 4732} {"train_loss": -7.229540824890137, "global_step": 198747, "epoch": 4732} {"train_loss": -7.087730407714844, "global_step": 198748, "epoch": 4732} {"train_loss": -7.174163818359375, "global_step": 198749, "epoch": 4732} {"train_loss": -7.185591697692871, "global_step": 198750, "epoch": 4732} {"train_loss": -7.0998735427856445, "global_step": 198751, "epoch": 4732} {"train_loss": -7.204244613647461, "global_step": 198752, "epoch": 4732} {"train_loss": -7.25437068939209, "global_step": 198753, "epoch": 4732} {"train_loss": -7.192908763885498, "global_step": 198754, "epoch": 4732} {"train_loss": -7.304190158843994, "global_step": 198755, "epoch": 4732} {"train_loss": -7.182101249694824, "global_step": 198756, "epoch": 4732} {"train_loss": -7.188941955566406, "global_step": 198757, "epoch": 4732} {"train_loss": -7.165738105773926, "global_step": 198758, "epoch": 4732} {"train_loss": -7.28000545501709, "global_step": 198759, "epoch": 4732} {"train_loss": -7.171838760375977, "global_step": 198760, "epoch": 4732} {"train_loss": -7.145583152770996, "global_step": 198761, "epoch": 4732} {"train_loss": -7.292716979980469, "global_step": 198762, "epoch": 4732} {"train_loss": -7.178136825561523, "global_step": 198763, "epoch": 4732} {"train_loss": -7.195148468017578, "global_step": 198764, "epoch": 4732} {"train_loss": -7.1721086502075195, "global_step": 198765, "epoch": 4732} {"train_loss": -7.202941417694092, "global_step": 198766, "epoch": 4732} {"train_loss": -7.232411861419678, "global_step": 198767, "epoch": 4732} {"train_loss": -7.1886491775512695, "global_step": 198768, "epoch": 4732} {"train_loss": -7.257704257965088, "global_step": 198769, "epoch": 4732} {"train_loss": -7.109216690063477, "global_step": 198770, "epoch": 4732} {"train_loss": -7.1886796951293945, "global_step": 198771, "epoch": 4732} {"train_loss": -7.10230827331543, "global_step": 198772, "epoch": 4732} {"train_loss": -7.21413516998291, "global_step": 198773, "epoch": 4732} {"train_loss": -7.19944429397583, "global_step": 198774, "epoch": 4732} {"train_loss": -7.156589031219482, "global_step": 198775, "epoch": 4732} {"train_loss": -7.172859191894531, "global_step": 198776, "epoch": 4732} {"train_loss": -7.255112648010254, "global_step": 198777, "epoch": 4732} {"train_loss": -7.277955055236816, "global_step": 198778, "epoch": 4732} {"train_loss": -7.311622142791748, "global_step": 198779, "epoch": 4732} {"train_loss": -7.39235782623291, "global_step": 198780, "epoch": 4732} {"train_loss": -7.348280906677246, "global_step": 198781, "epoch": 4732} {"train_loss": -7.269103050231934, "global_step": 198782, "epoch": 4732} {"train_loss": -7.279577732086182, "global_step": 198783, "epoch": 4732} {"train_loss": -7.246949195861816, "global_step": 198784, "epoch": 4732} {"train_loss": -7.2091425486973355, "global_step": 198785, "epoch": 4732, "val_loss": 69837.6875} {"train_loss": -7.25192928314209, "global_step": 198786, "epoch": 4733} {"train_loss": -7.279830455780029, "global_step": 198787, "epoch": 4733} {"train_loss": -7.203001976013184, "global_step": 198788, "epoch": 4733} {"train_loss": -7.278813362121582, "global_step": 198789, "epoch": 4733} {"train_loss": -7.191691875457764, "global_step": 198790, "epoch": 4733} {"train_loss": -7.298562049865723, "global_step": 198791, "epoch": 4733} {"train_loss": -7.088164329528809, "global_step": 198792, "epoch": 4733} {"train_loss": -7.127838611602783, "global_step": 198793, "epoch": 4733} {"train_loss": -7.177766799926758, "global_step": 198794, "epoch": 4733} {"train_loss": -7.120181083679199, "global_step": 198795, "epoch": 4733} {"train_loss": -7.266475200653076, "global_step": 198796, "epoch": 4733} {"train_loss": -7.202164649963379, "global_step": 198797, "epoch": 4733} {"train_loss": -7.203899383544922, "global_step": 198798, "epoch": 4733} {"train_loss": -7.292436599731445, "global_step": 198799, "epoch": 4733} {"train_loss": -7.342843055725098, "global_step": 198800, "epoch": 4733} {"train_loss": -7.2167863845825195, "global_step": 198801, "epoch": 4733} {"train_loss": -7.1836934089660645, "global_step": 198802, "epoch": 4733} {"train_loss": -7.272532939910889, "global_step": 198803, "epoch": 4733} {"train_loss": -7.204092979431152, "global_step": 198804, "epoch": 4733} {"train_loss": -7.334935188293457, "global_step": 198805, "epoch": 4733} {"train_loss": -7.261841773986816, "global_step": 198806, "epoch": 4733} {"train_loss": -7.15241813659668, "global_step": 198807, "epoch": 4733} {"train_loss": -7.36617374420166, "global_step": 198808, "epoch": 4733} {"train_loss": -7.125423431396484, "global_step": 198809, "epoch": 4733} {"train_loss": -7.296722412109375, "global_step": 198810, "epoch": 4733} {"train_loss": -7.316011905670166, "global_step": 198811, "epoch": 4733} {"train_loss": -7.1181745529174805, "global_step": 198812, "epoch": 4733} {"train_loss": -7.236930847167969, "global_step": 198813, "epoch": 4733} {"train_loss": -7.286594867706299, "global_step": 198814, "epoch": 4733} {"train_loss": -7.116064071655273, "global_step": 198815, "epoch": 4733} {"train_loss": -7.125241279602051, "global_step": 198816, "epoch": 4733} {"train_loss": -7.105569839477539, "global_step": 198817, "epoch": 4733} {"train_loss": -7.279105186462402, "global_step": 198818, "epoch": 4733} {"train_loss": -7.0086493492126465, "global_step": 198819, "epoch": 4733} {"train_loss": -7.063731670379639, "global_step": 198820, "epoch": 4733} {"train_loss": -7.338403701782227, "global_step": 198821, "epoch": 4733} {"train_loss": -7.189755916595459, "global_step": 198822, "epoch": 4733} {"train_loss": -7.192163944244385, "global_step": 198823, "epoch": 4733} {"train_loss": -7.229376792907715, "global_step": 198824, "epoch": 4733} {"train_loss": -7.2892255783081055, "global_step": 198825, "epoch": 4733} {"train_loss": -7.355861663818359, "global_step": 198826, "epoch": 4733} {"train_loss": -7.217947710128057, "global_step": 198827, "epoch": 4733, "val_loss": 69865.734375} {"train_loss": -7.269519805908203, "global_step": 198828, "epoch": 4734} {"train_loss": -7.304622650146484, "global_step": 198829, "epoch": 4734} {"train_loss": -7.307375907897949, "global_step": 198830, "epoch": 4734} {"train_loss": -7.229189395904541, "global_step": 198831, "epoch": 4734} {"train_loss": -7.067389011383057, "global_step": 198832, "epoch": 4734} {"train_loss": -7.316857814788818, "global_step": 198833, "epoch": 4734} {"train_loss": -7.17680549621582, "global_step": 198834, "epoch": 4734} {"train_loss": -7.278334617614746, "global_step": 198835, "epoch": 4734} {"train_loss": -7.267778396606445, "global_step": 198836, "epoch": 4734} {"train_loss": -7.15449333190918, "global_step": 198837, "epoch": 4734} {"train_loss": -7.148874282836914, "global_step": 198838, "epoch": 4734} {"train_loss": -7.064884185791016, "global_step": 198839, "epoch": 4734} {"train_loss": -7.066271781921387, "global_step": 198840, "epoch": 4734} {"train_loss": -7.178541660308838, "global_step": 198841, "epoch": 4734} {"train_loss": -7.070862293243408, "global_step": 198842, "epoch": 4734} {"train_loss": -7.26579475402832, "global_step": 198843, "epoch": 4734} {"train_loss": -7.199538230895996, "global_step": 198844, "epoch": 4734} {"train_loss": -7.101760387420654, "global_step": 198845, "epoch": 4734} {"train_loss": -7.168534278869629, "global_step": 198846, "epoch": 4734} {"train_loss": -7.209253787994385, "global_step": 198847, "epoch": 4734} {"train_loss": -7.175363540649414, "global_step": 198848, "epoch": 4734} {"train_loss": -6.982535362243652, "global_step": 198849, "epoch": 4734} {"train_loss": -7.278182029724121, "global_step": 198850, "epoch": 4734} {"train_loss": -7.202718734741211, "global_step": 198851, "epoch": 4734} {"train_loss": -7.2106451988220215, "global_step": 198852, "epoch": 4734} {"train_loss": -7.193907737731934, "global_step": 198853, "epoch": 4734} {"train_loss": -7.160689353942871, "global_step": 198854, "epoch": 4734} {"train_loss": -7.216899394989014, "global_step": 198855, "epoch": 4734} {"train_loss": -7.077773094177246, "global_step": 198856, "epoch": 4734} {"train_loss": -7.107804298400879, "global_step": 198857, "epoch": 4734} {"train_loss": -7.143056869506836, "global_step": 198858, "epoch": 4734} {"train_loss": -7.219654083251953, "global_step": 198859, "epoch": 4734} {"train_loss": -7.213961601257324, "global_step": 198860, "epoch": 4734} {"train_loss": -7.281928062438965, "global_step": 198861, "epoch": 4734} {"train_loss": -7.230201244354248, "global_step": 198862, "epoch": 4734} {"train_loss": -7.268507957458496, "global_step": 198863, "epoch": 4734} {"train_loss": -7.229644298553467, "global_step": 198864, "epoch": 4734} {"train_loss": -7.268068790435791, "global_step": 198865, "epoch": 4734} {"train_loss": -7.310021877288818, "global_step": 198866, "epoch": 4734} {"train_loss": -7.185548782348633, "global_step": 198867, "epoch": 4734} {"train_loss": -7.198568820953369, "global_step": 198868, "epoch": 4734} {"train_loss": -7.194364207131522, "global_step": 198869, "epoch": 4734, "val_loss": 69830.328125} {"train_loss": -7.228719711303711, "global_step": 198870, "epoch": 4735} {"train_loss": -7.376881122589111, "global_step": 198871, "epoch": 4735} {"train_loss": -7.383936405181885, "global_step": 198872, "epoch": 4735} {"train_loss": -7.33830451965332, "global_step": 198873, "epoch": 4735} {"train_loss": -7.340257167816162, "global_step": 198874, "epoch": 4735} {"train_loss": -7.369462966918945, "global_step": 198875, "epoch": 4735} {"train_loss": -7.373213291168213, "global_step": 198876, "epoch": 4735} {"train_loss": -7.368707656860352, "global_step": 198877, "epoch": 4735} {"train_loss": -7.316033363342285, "global_step": 198878, "epoch": 4735} {"train_loss": -7.287737846374512, "global_step": 198879, "epoch": 4735} {"train_loss": -7.340411186218262, "global_step": 198880, "epoch": 4735} {"train_loss": -7.415604114532471, "global_step": 198881, "epoch": 4735} {"train_loss": -7.399472236633301, "global_step": 198882, "epoch": 4735} {"train_loss": -7.298752784729004, "global_step": 198883, "epoch": 4735} {"train_loss": -7.227541923522949, "global_step": 198884, "epoch": 4735} {"train_loss": -7.444758892059326, "global_step": 198885, "epoch": 4735} {"train_loss": -7.261952877044678, "global_step": 198886, "epoch": 4735} {"train_loss": -7.340312480926514, "global_step": 198887, "epoch": 4735} {"train_loss": -7.338648319244385, "global_step": 198888, "epoch": 4735} {"train_loss": -7.234564781188965, "global_step": 198889, "epoch": 4735} {"train_loss": -7.285188674926758, "global_step": 198890, "epoch": 4735} {"train_loss": -7.3808722496032715, "global_step": 198891, "epoch": 4735} {"train_loss": -7.198894500732422, "global_step": 198892, "epoch": 4735} {"train_loss": -7.310372352600098, "global_step": 198893, "epoch": 4735} {"train_loss": -7.392447471618652, "global_step": 198894, "epoch": 4735} {"train_loss": -7.331422328948975, "global_step": 198895, "epoch": 4735} {"train_loss": -7.232820510864258, "global_step": 198896, "epoch": 4735} {"train_loss": -7.332564353942871, "global_step": 198897, "epoch": 4735} {"train_loss": -7.165914535522461, "global_step": 198898, "epoch": 4735} {"train_loss": -7.321276664733887, "global_step": 198899, "epoch": 4735} {"train_loss": -7.293310165405273, "global_step": 198900, "epoch": 4735} {"train_loss": -7.248199462890625, "global_step": 198901, "epoch": 4735} {"train_loss": -7.275482177734375, "global_step": 198902, "epoch": 4735} {"train_loss": -7.206295013427734, "global_step": 198903, "epoch": 4735} {"train_loss": -7.146584987640381, "global_step": 198904, "epoch": 4735} {"train_loss": -7.278405666351318, "global_step": 198905, "epoch": 4735} {"train_loss": -7.316603183746338, "global_step": 198906, "epoch": 4735} {"train_loss": -7.253657817840576, "global_step": 198907, "epoch": 4735} {"train_loss": -7.190760135650635, "global_step": 198908, "epoch": 4735} {"train_loss": -7.08820104598999, "global_step": 198909, "epoch": 4735} {"train_loss": -7.266948699951172, "global_step": 198910, "epoch": 4735} {"train_loss": -7.29258192153204, "global_step": 198911, "epoch": 4735, "val_loss": 69854.125} {"train_loss": -7.267516136169434, "global_step": 198912, "epoch": 4736} {"train_loss": -7.2936201095581055, "global_step": 198913, "epoch": 4736} {"train_loss": -7.241097450256348, "global_step": 198914, "epoch": 4736} {"train_loss": -7.2764410972595215, "global_step": 198915, "epoch": 4736} {"train_loss": -7.2345733642578125, "global_step": 198916, "epoch": 4736} {"train_loss": -7.2669243812561035, "global_step": 198917, "epoch": 4736} {"train_loss": -7.2190704345703125, "global_step": 198918, "epoch": 4736} {"train_loss": -7.213706016540527, "global_step": 198919, "epoch": 4736} {"train_loss": -7.252882957458496, "global_step": 198920, "epoch": 4736} {"train_loss": -7.258160591125488, "global_step": 198921, "epoch": 4736} {"train_loss": -7.202587604522705, "global_step": 198922, "epoch": 4736} {"train_loss": -7.219115734100342, "global_step": 198923, "epoch": 4736} {"train_loss": -7.181926250457764, "global_step": 198924, "epoch": 4736} {"train_loss": -7.207915306091309, "global_step": 198925, "epoch": 4736} {"train_loss": -7.20311164855957, "global_step": 198926, "epoch": 4736} {"train_loss": -7.129541397094727, "global_step": 198927, "epoch": 4736} {"train_loss": -7.103623390197754, "global_step": 198928, "epoch": 4736} {"train_loss": -7.172111511230469, "global_step": 198929, "epoch": 4736} {"train_loss": -7.1334228515625, "global_step": 198930, "epoch": 4736} {"train_loss": -7.205359935760498, "global_step": 198931, "epoch": 4736} {"train_loss": -7.062570571899414, "global_step": 198932, "epoch": 4736} {"train_loss": -7.236795425415039, "global_step": 198933, "epoch": 4736} {"train_loss": -7.143520355224609, "global_step": 198934, "epoch": 4736} {"train_loss": -7.091684341430664, "global_step": 198935, "epoch": 4736} {"train_loss": -7.244206428527832, "global_step": 198936, "epoch": 4736} {"train_loss": -7.242863178253174, "global_step": 198937, "epoch": 4736} {"train_loss": -7.173859596252441, "global_step": 198938, "epoch": 4736} {"train_loss": -7.178140640258789, "global_step": 198939, "epoch": 4736} {"train_loss": -7.290321350097656, "global_step": 198940, "epoch": 4736} {"train_loss": -7.236569881439209, "global_step": 198941, "epoch": 4736} {"train_loss": -7.047800064086914, "global_step": 198942, "epoch": 4736} {"train_loss": -7.300456523895264, "global_step": 198943, "epoch": 4736} {"train_loss": -7.178073883056641, "global_step": 198944, "epoch": 4736} {"train_loss": -7.230029106140137, "global_step": 198945, "epoch": 4736} {"train_loss": -7.162473678588867, "global_step": 198946, "epoch": 4736} {"train_loss": -7.288777828216553, "global_step": 198947, "epoch": 4736} {"train_loss": -7.274211406707764, "global_step": 198948, "epoch": 4736} {"train_loss": -7.176297664642334, "global_step": 198949, "epoch": 4736} {"train_loss": -7.0893378257751465, "global_step": 198950, "epoch": 4736} {"train_loss": -7.235861778259277, "global_step": 198951, "epoch": 4736} {"train_loss": -7.23563289642334, "global_step": 198952, "epoch": 4736} {"train_loss": -7.204615184238979, "global_step": 198953, "epoch": 4736, "val_loss": 69869.96875} {"train_loss": -7.151873588562012, "global_step": 198954, "epoch": 4737} {"train_loss": -7.250574111938477, "global_step": 198955, "epoch": 4737} {"train_loss": -7.180851459503174, "global_step": 198956, "epoch": 4737} {"train_loss": -7.26882266998291, "global_step": 198957, "epoch": 4737} {"train_loss": -7.231832504272461, "global_step": 198958, "epoch": 4737} {"train_loss": -7.261629104614258, "global_step": 198959, "epoch": 4737} {"train_loss": -7.2293572425842285, "global_step": 198960, "epoch": 4737} {"train_loss": -7.152486801147461, "global_step": 198961, "epoch": 4737} {"train_loss": -7.266946792602539, "global_step": 198962, "epoch": 4737} {"train_loss": -7.248188018798828, "global_step": 198963, "epoch": 4737} {"train_loss": -7.181129455566406, "global_step": 198964, "epoch": 4737} {"train_loss": -7.216466903686523, "global_step": 198965, "epoch": 4737} {"train_loss": -7.253207683563232, "global_step": 198966, "epoch": 4737} {"train_loss": -7.296131134033203, "global_step": 198967, "epoch": 4737} {"train_loss": -7.22845983505249, "global_step": 198968, "epoch": 4737} {"train_loss": -7.289768218994141, "global_step": 198969, "epoch": 4737} {"train_loss": -7.1924357414245605, "global_step": 198970, "epoch": 4737} {"train_loss": -7.287623405456543, "global_step": 198971, "epoch": 4737} {"train_loss": -7.2987236976623535, "global_step": 198972, "epoch": 4737} {"train_loss": -7.126727104187012, "global_step": 198973, "epoch": 4737} {"train_loss": -7.314043045043945, "global_step": 198974, "epoch": 4737} {"train_loss": -7.167848587036133, "global_step": 198975, "epoch": 4737} {"train_loss": -7.408825874328613, "global_step": 198976, "epoch": 4737} {"train_loss": -7.205012321472168, "global_step": 198977, "epoch": 4737} {"train_loss": -7.132345676422119, "global_step": 198978, "epoch": 4737} {"train_loss": -7.316227912902832, "global_step": 198979, "epoch": 4737} {"train_loss": -7.338312149047852, "global_step": 198980, "epoch": 4737} {"train_loss": -7.0626983642578125, "global_step": 198981, "epoch": 4737} {"train_loss": -7.134889602661133, "global_step": 198982, "epoch": 4737} {"train_loss": -7.191842079162598, "global_step": 198983, "epoch": 4737} {"train_loss": -7.097354888916016, "global_step": 198984, "epoch": 4737} {"train_loss": -7.325082778930664, "global_step": 198985, "epoch": 4737} {"train_loss": -7.18996000289917, "global_step": 198986, "epoch": 4737} {"train_loss": -6.944766044616699, "global_step": 198987, "epoch": 4737} {"train_loss": -7.163491249084473, "global_step": 198988, "epoch": 4737} {"train_loss": -7.190074920654297, "global_step": 198989, "epoch": 4737} {"train_loss": -7.171137809753418, "global_step": 198990, "epoch": 4737} {"train_loss": -7.311541557312012, "global_step": 198991, "epoch": 4737} {"train_loss": -7.075516700744629, "global_step": 198992, "epoch": 4737} {"train_loss": -7.161822319030762, "global_step": 198993, "epoch": 4737} {"train_loss": -7.262237548828125, "global_step": 198994, "epoch": 4737} {"train_loss": -7.212359893889654, "global_step": 198995, "epoch": 4737, "val_loss": 69806.859375} {"train_loss": -7.164053916931152, "global_step": 198996, "epoch": 4738} {"train_loss": -7.253798484802246, "global_step": 198997, "epoch": 4738} {"train_loss": -7.05419921875, "global_step": 198998, "epoch": 4738} {"train_loss": -7.2000932693481445, "global_step": 198999, "epoch": 4738} {"train_loss": -7.257321357727051, "global_step": 199000, "epoch": 4738} {"train_loss": -7.206567764282227, "global_step": 199001, "epoch": 4738} {"train_loss": -7.246946811676025, "global_step": 199002, "epoch": 4738} {"train_loss": -7.3662109375, "global_step": 199003, "epoch": 4738} {"train_loss": -7.182571887969971, "global_step": 199004, "epoch": 4738} {"train_loss": -7.27706241607666, "global_step": 199005, "epoch": 4738} {"train_loss": -7.333225250244141, "global_step": 199006, "epoch": 4738} {"train_loss": -7.2853288650512695, "global_step": 199007, "epoch": 4738} {"train_loss": -7.245171546936035, "global_step": 199008, "epoch": 4738} {"train_loss": -7.305603981018066, "global_step": 199009, "epoch": 4738} {"train_loss": -7.272004127502441, "global_step": 199010, "epoch": 4738} {"train_loss": -7.261135101318359, "global_step": 199011, "epoch": 4738} {"train_loss": -7.265561103820801, "global_step": 199012, "epoch": 4738} {"train_loss": -7.361318588256836, "global_step": 199013, "epoch": 4738} {"train_loss": -7.257852554321289, "global_step": 199014, "epoch": 4738} {"train_loss": -7.261542320251465, "global_step": 199015, "epoch": 4738} {"train_loss": -7.218122959136963, "global_step": 199016, "epoch": 4738} {"train_loss": -7.195523262023926, "global_step": 199017, "epoch": 4738} {"train_loss": -7.252994537353516, "global_step": 199018, "epoch": 4738} {"train_loss": -7.337059020996094, "global_step": 199019, "epoch": 4738} {"train_loss": -7.2756667137146, "global_step": 199020, "epoch": 4738} {"train_loss": -7.166337966918945, "global_step": 199021, "epoch": 4738} {"train_loss": -7.075498580932617, "global_step": 199022, "epoch": 4738} {"train_loss": -7.092787265777588, "global_step": 199023, "epoch": 4738} {"train_loss": -6.94270133972168, "global_step": 199024, "epoch": 4738} {"train_loss": -6.944509506225586, "global_step": 199025, "epoch": 4738} {"train_loss": -7.1944074630737305, "global_step": 199026, "epoch": 4738} {"train_loss": -6.857907295227051, "global_step": 199027, "epoch": 4738} {"train_loss": -7.150115966796875, "global_step": 199028, "epoch": 4738} {"train_loss": -6.794197082519531, "global_step": 199029, "epoch": 4738} {"train_loss": -7.09859037399292, "global_step": 199030, "epoch": 4738} {"train_loss": -6.916887283325195, "global_step": 199031, "epoch": 4738} {"train_loss": -7.166316032409668, "global_step": 199032, "epoch": 4738} {"train_loss": -6.867180824279785, "global_step": 199033, "epoch": 4738} {"train_loss": -7.094582557678223, "global_step": 199034, "epoch": 4738} {"train_loss": -7.076249122619629, "global_step": 199035, "epoch": 4738} {"train_loss": -7.022157192230225, "global_step": 199036, "epoch": 4738} {"train_loss": -7.164330732254755, "global_step": 199037, "epoch": 4738, "val_loss": 69885.2578125} {"train_loss": -7.212003707885742, "global_step": 199038, "epoch": 4739} {"train_loss": -7.077645301818848, "global_step": 199039, "epoch": 4739} {"train_loss": -7.227446556091309, "global_step": 199040, "epoch": 4739} {"train_loss": -7.192933082580566, "global_step": 199041, "epoch": 4739} {"train_loss": -7.217676162719727, "global_step": 199042, "epoch": 4739} {"train_loss": -7.117271423339844, "global_step": 199043, "epoch": 4739} {"train_loss": -7.102567672729492, "global_step": 199044, "epoch": 4739} {"train_loss": -7.137271404266357, "global_step": 199045, "epoch": 4739} {"train_loss": -7.212638854980469, "global_step": 199046, "epoch": 4739} {"train_loss": -7.181770324707031, "global_step": 199047, "epoch": 4739} {"train_loss": -7.314409255981445, "global_step": 199048, "epoch": 4739} {"train_loss": -7.212601661682129, "global_step": 199049, "epoch": 4739} {"train_loss": -7.258020877838135, "global_step": 199050, "epoch": 4739} {"train_loss": -7.168952941894531, "global_step": 199051, "epoch": 4739} {"train_loss": -7.237961769104004, "global_step": 199052, "epoch": 4739} {"train_loss": -7.287790298461914, "global_step": 199053, "epoch": 4739} {"train_loss": -7.163495063781738, "global_step": 199054, "epoch": 4739} {"train_loss": -7.344264984130859, "global_step": 199055, "epoch": 4739} {"train_loss": -7.11562442779541, "global_step": 199056, "epoch": 4739} {"train_loss": -7.3478312492370605, "global_step": 199057, "epoch": 4739} {"train_loss": -7.324581623077393, "global_step": 199058, "epoch": 4739} {"train_loss": -7.325869560241699, "global_step": 199059, "epoch": 4739} {"train_loss": -7.380153656005859, "global_step": 199060, "epoch": 4739} {"train_loss": -7.341259956359863, "global_step": 199061, "epoch": 4739} {"train_loss": -7.324787139892578, "global_step": 199062, "epoch": 4739} {"train_loss": -7.389026165008545, "global_step": 199063, "epoch": 4739} {"train_loss": -7.481939315795898, "global_step": 199064, "epoch": 4739} {"train_loss": -7.367598533630371, "global_step": 199065, "epoch": 4739} {"train_loss": -7.400280475616455, "global_step": 199066, "epoch": 4739} {"train_loss": -7.444765090942383, "global_step": 199067, "epoch": 4739} {"train_loss": -7.313674449920654, "global_step": 199068, "epoch": 4739} {"train_loss": -7.227846622467041, "global_step": 199069, "epoch": 4739} {"train_loss": -7.379627704620361, "global_step": 199070, "epoch": 4739} {"train_loss": -7.282721519470215, "global_step": 199071, "epoch": 4739} {"train_loss": -7.353854656219482, "global_step": 199072, "epoch": 4739} {"train_loss": -7.2921462059021, "global_step": 199073, "epoch": 4739} {"train_loss": -7.300692081451416, "global_step": 199074, "epoch": 4739} {"train_loss": -7.316025733947754, "global_step": 199075, "epoch": 4739} {"train_loss": -7.325456142425537, "global_step": 199076, "epoch": 4739} {"train_loss": -7.322624206542969, "global_step": 199077, "epoch": 4739} {"train_loss": -7.32914924621582, "global_step": 199078, "epoch": 4739} {"train_loss": -7.276916129248483, "global_step": 199079, "epoch": 4739, "val_loss": 69822.3046875} {"train_loss": -7.2923407554626465, "global_step": 199080, "epoch": 4740} {"train_loss": -7.28359317779541, "global_step": 199081, "epoch": 4740} {"train_loss": -7.236290454864502, "global_step": 199082, "epoch": 4740} {"train_loss": -7.3191986083984375, "global_step": 199083, "epoch": 4740} {"train_loss": -7.269832611083984, "global_step": 199084, "epoch": 4740} {"train_loss": -7.3011884689331055, "global_step": 199085, "epoch": 4740} {"train_loss": -7.305850982666016, "global_step": 199086, "epoch": 4740} {"train_loss": -7.19902229309082, "global_step": 199087, "epoch": 4740} {"train_loss": -7.201229572296143, "global_step": 199088, "epoch": 4740} {"train_loss": -7.196938514709473, "global_step": 199089, "epoch": 4740} {"train_loss": -7.230016231536865, "global_step": 199090, "epoch": 4740} {"train_loss": -7.384459018707275, "global_step": 199091, "epoch": 4740} {"train_loss": -7.238888740539551, "global_step": 199092, "epoch": 4740} {"train_loss": -7.241503715515137, "global_step": 199093, "epoch": 4740} {"train_loss": -7.176013946533203, "global_step": 199094, "epoch": 4740} {"train_loss": -7.14723539352417, "global_step": 199095, "epoch": 4740} {"train_loss": -7.253410339355469, "global_step": 199096, "epoch": 4740} {"train_loss": -7.2727131843566895, "global_step": 199097, "epoch": 4740} {"train_loss": -7.203119277954102, "global_step": 199098, "epoch": 4740} {"train_loss": -7.349813461303711, "global_step": 199099, "epoch": 4740} {"train_loss": -7.237310409545898, "global_step": 199100, "epoch": 4740} {"train_loss": -7.322805404663086, "global_step": 199101, "epoch": 4740} {"train_loss": -7.161523342132568, "global_step": 199102, "epoch": 4740} {"train_loss": -7.210745334625244, "global_step": 199103, "epoch": 4740} {"train_loss": -7.281957626342773, "global_step": 199104, "epoch": 4740} {"train_loss": -7.227727890014648, "global_step": 199105, "epoch": 4740} {"train_loss": -7.30244779586792, "global_step": 199106, "epoch": 4740} {"train_loss": -7.230158805847168, "global_step": 199107, "epoch": 4740} {"train_loss": -7.176548004150391, "global_step": 199108, "epoch": 4740} {"train_loss": -7.318559169769287, "global_step": 199109, "epoch": 4740} {"train_loss": -7.307849884033203, "global_step": 199110, "epoch": 4740} {"train_loss": -7.21632194519043, "global_step": 199111, "epoch": 4740} {"train_loss": -7.443159103393555, "global_step": 199112, "epoch": 4740} {"train_loss": -7.226093292236328, "global_step": 199113, "epoch": 4740} {"train_loss": -7.285123348236084, "global_step": 199114, "epoch": 4740} {"train_loss": -7.235470771789551, "global_step": 199115, "epoch": 4740} {"train_loss": -7.202553749084473, "global_step": 199116, "epoch": 4740} {"train_loss": -7.2367262840271, "global_step": 199117, "epoch": 4740} {"train_loss": -7.153193473815918, "global_step": 199118, "epoch": 4740} {"train_loss": -7.192397117614746, "global_step": 199119, "epoch": 4740} {"train_loss": -7.235280990600586, "global_step": 199120, "epoch": 4740} {"train_loss": -7.254187095732916, "global_step": 199121, "epoch": 4740, "val_loss": 69815.21875} {"train_loss": -7.3256940841674805, "global_step": 199122, "epoch": 4741} {"train_loss": -7.268956184387207, "global_step": 199123, "epoch": 4741} {"train_loss": -7.224886417388916, "global_step": 199124, "epoch": 4741} {"train_loss": -7.1567535400390625, "global_step": 199125, "epoch": 4741} {"train_loss": -7.216970920562744, "global_step": 199126, "epoch": 4741} {"train_loss": -7.050966262817383, "global_step": 199127, "epoch": 4741} {"train_loss": -7.130341053009033, "global_step": 199128, "epoch": 4741} {"train_loss": -7.260158061981201, "global_step": 199129, "epoch": 4741} {"train_loss": -7.077725887298584, "global_step": 199130, "epoch": 4741} {"train_loss": -7.1775054931640625, "global_step": 199131, "epoch": 4741} {"train_loss": -7.067594528198242, "global_step": 199132, "epoch": 4741} {"train_loss": -7.0092668533325195, "global_step": 199133, "epoch": 4741} {"train_loss": -7.18106746673584, "global_step": 199134, "epoch": 4741} {"train_loss": -6.990708351135254, "global_step": 199135, "epoch": 4741} {"train_loss": -7.223020076751709, "global_step": 199136, "epoch": 4741} {"train_loss": -6.969244956970215, "global_step": 199137, "epoch": 4741} {"train_loss": -7.051131725311279, "global_step": 199138, "epoch": 4741} {"train_loss": -7.176673889160156, "global_step": 199139, "epoch": 4741} {"train_loss": -7.057278633117676, "global_step": 199140, "epoch": 4741} {"train_loss": -7.050795555114746, "global_step": 199141, "epoch": 4741} {"train_loss": -7.2022905349731445, "global_step": 199142, "epoch": 4741} {"train_loss": -7.129359245300293, "global_step": 199143, "epoch": 4741} {"train_loss": -7.169325828552246, "global_step": 199144, "epoch": 4741} {"train_loss": -7.183478832244873, "global_step": 199145, "epoch": 4741} {"train_loss": -7.18891716003418, "global_step": 199146, "epoch": 4741} {"train_loss": -7.198281288146973, "global_step": 199147, "epoch": 4741} {"train_loss": -7.202029228210449, "global_step": 199148, "epoch": 4741} {"train_loss": -7.216304779052734, "global_step": 199149, "epoch": 4741} {"train_loss": -7.218815803527832, "global_step": 199150, "epoch": 4741} {"train_loss": -7.203828811645508, "global_step": 199151, "epoch": 4741} {"train_loss": -7.21488618850708, "global_step": 199152, "epoch": 4741} {"train_loss": -7.226595878601074, "global_step": 199153, "epoch": 4741} {"train_loss": -7.194388389587402, "global_step": 199154, "epoch": 4741} {"train_loss": -7.316097736358643, "global_step": 199155, "epoch": 4741} {"train_loss": -7.257893085479736, "global_step": 199156, "epoch": 4741} {"train_loss": -7.218020915985107, "global_step": 199157, "epoch": 4741} {"train_loss": -7.197522163391113, "global_step": 199158, "epoch": 4741} {"train_loss": -7.378741264343262, "global_step": 199159, "epoch": 4741} {"train_loss": -7.141427516937256, "global_step": 199160, "epoch": 4741} {"train_loss": -7.261415004730225, "global_step": 199161, "epoch": 4741} {"train_loss": -7.226244926452637, "global_step": 199162, "epoch": 4741} {"train_loss": -7.1762310436793735, "global_step": 199163, "epoch": 4741, "val_loss": 69855.546875} {"train_loss": -7.316627502441406, "global_step": 199164, "epoch": 4742} {"train_loss": -7.272856712341309, "global_step": 199165, "epoch": 4742} {"train_loss": -7.258162975311279, "global_step": 199166, "epoch": 4742} {"train_loss": -7.247367858886719, "global_step": 199167, "epoch": 4742} {"train_loss": -7.303225994110107, "global_step": 199168, "epoch": 4742} {"train_loss": -7.3354315757751465, "global_step": 199169, "epoch": 4742} {"train_loss": -7.198366165161133, "global_step": 199170, "epoch": 4742} {"train_loss": -7.275026321411133, "global_step": 199171, "epoch": 4742} {"train_loss": -7.174468040466309, "global_step": 199172, "epoch": 4742} {"train_loss": -7.3199052810668945, "global_step": 199173, "epoch": 4742} {"train_loss": -7.337866306304932, "global_step": 199174, "epoch": 4742} {"train_loss": -7.240671634674072, "global_step": 199175, "epoch": 4742} {"train_loss": -7.296184062957764, "global_step": 199176, "epoch": 4742} {"train_loss": -7.324837684631348, "global_step": 199177, "epoch": 4742} {"train_loss": -7.312378883361816, "global_step": 199178, "epoch": 4742} {"train_loss": -7.237603664398193, "global_step": 199179, "epoch": 4742} {"train_loss": -7.322292327880859, "global_step": 199180, "epoch": 4742} {"train_loss": -7.262493133544922, "global_step": 199181, "epoch": 4742} {"train_loss": -7.266098976135254, "global_step": 199182, "epoch": 4742} {"train_loss": -7.246143341064453, "global_step": 199183, "epoch": 4742} {"train_loss": -7.329121112823486, "global_step": 199184, "epoch": 4742} {"train_loss": -7.424670219421387, "global_step": 199185, "epoch": 4742} {"train_loss": -7.26132869720459, "global_step": 199186, "epoch": 4742} {"train_loss": -7.276772499084473, "global_step": 199187, "epoch": 4742} {"train_loss": -7.40627384185791, "global_step": 199188, "epoch": 4742} {"train_loss": -7.4373369216918945, "global_step": 199189, "epoch": 4742} {"train_loss": -7.428307056427002, "global_step": 199190, "epoch": 4742} {"train_loss": -7.324591636657715, "global_step": 199191, "epoch": 4742} {"train_loss": -7.309565544128418, "global_step": 199192, "epoch": 4742} {"train_loss": -7.361275672912598, "global_step": 199193, "epoch": 4742} {"train_loss": -7.313763618469238, "global_step": 199194, "epoch": 4742} {"train_loss": -7.223931312561035, "global_step": 199195, "epoch": 4742} {"train_loss": -7.312896728515625, "global_step": 199196, "epoch": 4742} {"train_loss": -7.363544464111328, "global_step": 199197, "epoch": 4742} {"train_loss": -7.319002151489258, "global_step": 199198, "epoch": 4742} {"train_loss": -7.255996227264404, "global_step": 199199, "epoch": 4742} {"train_loss": -7.3353729248046875, "global_step": 199200, "epoch": 4742} {"train_loss": -7.329974174499512, "global_step": 199201, "epoch": 4742} {"train_loss": -7.340655326843262, "global_step": 199202, "epoch": 4742} {"train_loss": -7.352712154388428, "global_step": 199203, "epoch": 4742} {"train_loss": -7.320577144622803, "global_step": 199204, "epoch": 4742} {"train_loss": -7.3099702426365445, "global_step": 199205, "epoch": 4742, "val_loss": 69866.109375} {"train_loss": -7.2837233543396, "global_step": 199206, "epoch": 4743} {"train_loss": -7.273536682128906, "global_step": 199207, "epoch": 4743} {"train_loss": -7.310629367828369, "global_step": 199208, "epoch": 4743} {"train_loss": -7.311650276184082, "global_step": 199209, "epoch": 4743} {"train_loss": -7.268030643463135, "global_step": 199210, "epoch": 4743} {"train_loss": -7.307358264923096, "global_step": 199211, "epoch": 4743} {"train_loss": -7.445232391357422, "global_step": 199212, "epoch": 4743} {"train_loss": -7.279083728790283, "global_step": 199213, "epoch": 4743} {"train_loss": -7.382004737854004, "global_step": 199214, "epoch": 4743} {"train_loss": -7.282541275024414, "global_step": 199215, "epoch": 4743} {"train_loss": -7.25732421875, "global_step": 199216, "epoch": 4743} {"train_loss": -7.252852439880371, "global_step": 199217, "epoch": 4743} {"train_loss": -7.317262649536133, "global_step": 199218, "epoch": 4743} {"train_loss": -7.178656578063965, "global_step": 199219, "epoch": 4743} {"train_loss": -7.298785209655762, "global_step": 199220, "epoch": 4743} {"train_loss": -7.344765663146973, "global_step": 199221, "epoch": 4743} {"train_loss": -7.287294387817383, "global_step": 199222, "epoch": 4743} {"train_loss": -7.290928840637207, "global_step": 199223, "epoch": 4743} {"train_loss": -7.276909351348877, "global_step": 199224, "epoch": 4743} {"train_loss": -7.270542144775391, "global_step": 199225, "epoch": 4743} {"train_loss": -7.241489410400391, "global_step": 199226, "epoch": 4743} {"train_loss": -7.387034893035889, "global_step": 199227, "epoch": 4743} {"train_loss": -7.330326080322266, "global_step": 199228, "epoch": 4743} {"train_loss": -7.289149284362793, "global_step": 199229, "epoch": 4743} {"train_loss": -7.339162349700928, "global_step": 199230, "epoch": 4743} {"train_loss": -7.2236785888671875, "global_step": 199231, "epoch": 4743} {"train_loss": -7.274908542633057, "global_step": 199232, "epoch": 4743} {"train_loss": -7.196401119232178, "global_step": 199233, "epoch": 4743} {"train_loss": -7.367504119873047, "global_step": 199234, "epoch": 4743} {"train_loss": -7.323469161987305, "global_step": 199235, "epoch": 4743} {"train_loss": -7.252236366271973, "global_step": 199236, "epoch": 4743} {"train_loss": -7.325325965881348, "global_step": 199237, "epoch": 4743} {"train_loss": -7.252687454223633, "global_step": 199238, "epoch": 4743} {"train_loss": -7.349276542663574, "global_step": 199239, "epoch": 4743} {"train_loss": -7.126758098602295, "global_step": 199240, "epoch": 4743} {"train_loss": -7.215432167053223, "global_step": 199241, "epoch": 4743} {"train_loss": -7.334935188293457, "global_step": 199242, "epoch": 4743} {"train_loss": -7.255707740783691, "global_step": 199243, "epoch": 4743} {"train_loss": -7.150865077972412, "global_step": 199244, "epoch": 4743} {"train_loss": -7.255119323730469, "global_step": 199245, "epoch": 4743} {"train_loss": -7.165224075317383, "global_step": 199246, "epoch": 4743} {"train_loss": -7.279879751659575, "global_step": 199247, "epoch": 4743, "val_loss": 69817.7890625} {"train_loss": -7.220746040344238, "global_step": 199248, "epoch": 4744} {"train_loss": -7.298834800720215, "global_step": 199249, "epoch": 4744} {"train_loss": -7.332904815673828, "global_step": 199250, "epoch": 4744} {"train_loss": -7.281697750091553, "global_step": 199251, "epoch": 4744} {"train_loss": -7.224187850952148, "global_step": 199252, "epoch": 4744} {"train_loss": -7.4081549644470215, "global_step": 199253, "epoch": 4744} {"train_loss": -7.161025047302246, "global_step": 199254, "epoch": 4744} {"train_loss": -7.165213108062744, "global_step": 199255, "epoch": 4744} {"train_loss": -7.2563934326171875, "global_step": 199256, "epoch": 4744} {"train_loss": -7.2528181076049805, "global_step": 199257, "epoch": 4744} {"train_loss": -7.137091636657715, "global_step": 199258, "epoch": 4744} {"train_loss": -7.206176280975342, "global_step": 199259, "epoch": 4744} {"train_loss": -7.1810407638549805, "global_step": 199260, "epoch": 4744} {"train_loss": -7.268820285797119, "global_step": 199261, "epoch": 4744} {"train_loss": -7.378411769866943, "global_step": 199262, "epoch": 4744} {"train_loss": -7.248654365539551, "global_step": 199263, "epoch": 4744} {"train_loss": -7.177164077758789, "global_step": 199264, "epoch": 4744} {"train_loss": -7.163266181945801, "global_step": 199265, "epoch": 4744} {"train_loss": -7.2536163330078125, "global_step": 199266, "epoch": 4744} {"train_loss": -7.163499355316162, "global_step": 199267, "epoch": 4744} {"train_loss": -7.184140205383301, "global_step": 199268, "epoch": 4744} {"train_loss": -7.184819221496582, "global_step": 199269, "epoch": 4744} {"train_loss": -7.283344268798828, "global_step": 199270, "epoch": 4744} {"train_loss": -7.312191963195801, "global_step": 199271, "epoch": 4744} {"train_loss": -7.246977806091309, "global_step": 199272, "epoch": 4744} {"train_loss": -7.397876739501953, "global_step": 199273, "epoch": 4744} {"train_loss": -7.169001579284668, "global_step": 199274, "epoch": 4744} {"train_loss": -7.1770501136779785, "global_step": 199275, "epoch": 4744} {"train_loss": -7.2220659255981445, "global_step": 199276, "epoch": 4744} {"train_loss": -7.240386962890625, "global_step": 199277, "epoch": 4744} {"train_loss": -7.308547019958496, "global_step": 199278, "epoch": 4744} {"train_loss": -7.22562313079834, "global_step": 199279, "epoch": 4744} {"train_loss": -7.255407333374023, "global_step": 199280, "epoch": 4744} {"train_loss": -7.196145057678223, "global_step": 199281, "epoch": 4744} {"train_loss": -7.201329708099365, "global_step": 199282, "epoch": 4744} {"train_loss": -7.207541465759277, "global_step": 199283, "epoch": 4744} {"train_loss": -7.232199192047119, "global_step": 199284, "epoch": 4744} {"train_loss": -7.235896110534668, "global_step": 199285, "epoch": 4744} {"train_loss": -7.1883721351623535, "global_step": 199286, "epoch": 4744} {"train_loss": -7.264191627502441, "global_step": 199287, "epoch": 4744} {"train_loss": -7.143182277679443, "global_step": 199288, "epoch": 4744} {"train_loss": -7.236818211419242, "global_step": 199289, "epoch": 4744, "val_loss": 69723.7578125} {"train_loss": -7.196025371551514, "global_step": 199290, "epoch": 4745} {"train_loss": -7.1791887283325195, "global_step": 199291, "epoch": 4745} {"train_loss": -7.334830284118652, "global_step": 199292, "epoch": 4745} {"train_loss": -7.357240676879883, "global_step": 199293, "epoch": 4745} {"train_loss": -7.227740287780762, "global_step": 199294, "epoch": 4745} {"train_loss": -7.282411098480225, "global_step": 199295, "epoch": 4745} {"train_loss": -7.29210901260376, "global_step": 199296, "epoch": 4745} {"train_loss": -7.356585502624512, "global_step": 199297, "epoch": 4745} {"train_loss": -7.257500648498535, "global_step": 199298, "epoch": 4745} {"train_loss": -7.354989051818848, "global_step": 199299, "epoch": 4745} {"train_loss": -7.255116939544678, "global_step": 199300, "epoch": 4745} {"train_loss": -7.291618347167969, "global_step": 199301, "epoch": 4745} {"train_loss": -7.321743011474609, "global_step": 199302, "epoch": 4745} {"train_loss": -7.2479376792907715, "global_step": 199303, "epoch": 4745} {"train_loss": -7.374577522277832, "global_step": 199304, "epoch": 4745} {"train_loss": -7.309562683105469, "global_step": 199305, "epoch": 4745} {"train_loss": -7.222601413726807, "global_step": 199306, "epoch": 4745} {"train_loss": -7.275206565856934, "global_step": 199307, "epoch": 4745} {"train_loss": -7.243459701538086, "global_step": 199308, "epoch": 4745} {"train_loss": -7.311067581176758, "global_step": 199309, "epoch": 4745} {"train_loss": -7.299060821533203, "global_step": 199310, "epoch": 4745} {"train_loss": -7.405641078948975, "global_step": 199311, "epoch": 4745} {"train_loss": -7.343662261962891, "global_step": 199312, "epoch": 4745} {"train_loss": -7.29329776763916, "global_step": 199313, "epoch": 4745} {"train_loss": -7.340260028839111, "global_step": 199314, "epoch": 4745} {"train_loss": -7.379489421844482, "global_step": 199315, "epoch": 4745} {"train_loss": -7.3251261711120605, "global_step": 199316, "epoch": 4745} {"train_loss": -7.373198509216309, "global_step": 199317, "epoch": 4745} {"train_loss": -7.280097007751465, "global_step": 199318, "epoch": 4745} {"train_loss": -7.406981468200684, "global_step": 199319, "epoch": 4745} {"train_loss": -7.359687805175781, "global_step": 199320, "epoch": 4745} {"train_loss": -7.340826988220215, "global_step": 199321, "epoch": 4745} {"train_loss": -7.330619812011719, "global_step": 199322, "epoch": 4745} {"train_loss": -7.221364974975586, "global_step": 199323, "epoch": 4745} {"train_loss": -7.164859294891357, "global_step": 199324, "epoch": 4745} {"train_loss": -7.305190086364746, "global_step": 199325, "epoch": 4745} {"train_loss": -7.404081344604492, "global_step": 199326, "epoch": 4745} {"train_loss": -7.338033676147461, "global_step": 199327, "epoch": 4745} {"train_loss": -7.2980451583862305, "global_step": 199328, "epoch": 4745} {"train_loss": -7.301951885223389, "global_step": 199329, "epoch": 4745} {"train_loss": -7.325724124908447, "global_step": 199330, "epoch": 4745} {"train_loss": -7.305891786302839, "global_step": 199331, "epoch": 4745, "val_loss": 69798.0234375} {"train_loss": -7.146264553070068, "global_step": 199332, "epoch": 4746} {"train_loss": -7.258749961853027, "global_step": 199333, "epoch": 4746} {"train_loss": -7.281203269958496, "global_step": 199334, "epoch": 4746} {"train_loss": -7.287895202636719, "global_step": 199335, "epoch": 4746} {"train_loss": -7.330954551696777, "global_step": 199336, "epoch": 4746} {"train_loss": -7.403972625732422, "global_step": 199337, "epoch": 4746} {"train_loss": -7.266147613525391, "global_step": 199338, "epoch": 4746} {"train_loss": -7.303526878356934, "global_step": 199339, "epoch": 4746} {"train_loss": -7.4052629470825195, "global_step": 199340, "epoch": 4746} {"train_loss": -7.307366371154785, "global_step": 199341, "epoch": 4746} {"train_loss": -7.274550437927246, "global_step": 199342, "epoch": 4746} {"train_loss": -7.396368980407715, "global_step": 199343, "epoch": 4746} {"train_loss": -7.34632682800293, "global_step": 199344, "epoch": 4746} {"train_loss": -7.263719081878662, "global_step": 199345, "epoch": 4746} {"train_loss": -7.263875484466553, "global_step": 199346, "epoch": 4746} {"train_loss": -7.317700386047363, "global_step": 199347, "epoch": 4746} {"train_loss": -7.332523345947266, "global_step": 199348, "epoch": 4746} {"train_loss": -7.216527938842773, "global_step": 199349, "epoch": 4746} {"train_loss": -7.242580890655518, "global_step": 199350, "epoch": 4746} {"train_loss": -7.197659492492676, "global_step": 199351, "epoch": 4746} {"train_loss": -7.275193214416504, "global_step": 199352, "epoch": 4746} {"train_loss": -7.439565181732178, "global_step": 199353, "epoch": 4746} {"train_loss": -7.25147008895874, "global_step": 199354, "epoch": 4746} {"train_loss": -7.145507335662842, "global_step": 199355, "epoch": 4746} {"train_loss": -7.231137275695801, "global_step": 199356, "epoch": 4746} {"train_loss": -7.364727973937988, "global_step": 199357, "epoch": 4746} {"train_loss": -7.038141250610352, "global_step": 199358, "epoch": 4746} {"train_loss": -7.163442611694336, "global_step": 199359, "epoch": 4746} {"train_loss": -7.222496509552002, "global_step": 199360, "epoch": 4746} {"train_loss": -7.224344253540039, "global_step": 199361, "epoch": 4746} {"train_loss": -7.29970645904541, "global_step": 199362, "epoch": 4746} {"train_loss": -7.221743583679199, "global_step": 199363, "epoch": 4746} {"train_loss": -7.281402587890625, "global_step": 199364, "epoch": 4746} {"train_loss": -7.1909589767456055, "global_step": 199365, "epoch": 4746} {"train_loss": -7.303171634674072, "global_step": 199366, "epoch": 4746} {"train_loss": -7.2574920654296875, "global_step": 199367, "epoch": 4746} {"train_loss": -7.327993392944336, "global_step": 199368, "epoch": 4746} {"train_loss": -7.141582012176514, "global_step": 199369, "epoch": 4746} {"train_loss": -7.189347743988037, "global_step": 199370, "epoch": 4746} {"train_loss": -7.156360626220703, "global_step": 199371, "epoch": 4746} {"train_loss": -7.254458427429199, "global_step": 199372, "epoch": 4746} {"train_loss": -7.262767428443546, "global_step": 199373, "epoch": 4746, "val_loss": 69810.359375} {"train_loss": -7.285285472869873, "global_step": 199374, "epoch": 4747} {"train_loss": -7.2587103843688965, "global_step": 199375, "epoch": 4747} {"train_loss": -7.262887954711914, "global_step": 199376, "epoch": 4747} {"train_loss": -7.205658912658691, "global_step": 199377, "epoch": 4747} {"train_loss": -7.338447570800781, "global_step": 199378, "epoch": 4747} {"train_loss": -7.306543350219727, "global_step": 199379, "epoch": 4747} {"train_loss": -7.301594257354736, "global_step": 199380, "epoch": 4747} {"train_loss": -7.22329044342041, "global_step": 199381, "epoch": 4747} {"train_loss": -7.322471618652344, "global_step": 199382, "epoch": 4747} {"train_loss": -7.325550079345703, "global_step": 199383, "epoch": 4747} {"train_loss": -7.296303749084473, "global_step": 199384, "epoch": 4747} {"train_loss": -7.2955756187438965, "global_step": 199385, "epoch": 4747} {"train_loss": -7.25956392288208, "global_step": 199386, "epoch": 4747} {"train_loss": -7.299125671386719, "global_step": 199387, "epoch": 4747} {"train_loss": -7.428246974945068, "global_step": 199388, "epoch": 4747} {"train_loss": -7.226675987243652, "global_step": 199389, "epoch": 4747} {"train_loss": -7.265188217163086, "global_step": 199390, "epoch": 4747} {"train_loss": -7.284748077392578, "global_step": 199391, "epoch": 4747} {"train_loss": -7.2145256996154785, "global_step": 199392, "epoch": 4747} {"train_loss": -7.337972640991211, "global_step": 199393, "epoch": 4747} {"train_loss": -7.267172336578369, "global_step": 199394, "epoch": 4747} {"train_loss": -7.216956615447998, "global_step": 199395, "epoch": 4747} {"train_loss": -7.268406391143799, "global_step": 199396, "epoch": 4747} {"train_loss": -7.356618404388428, "global_step": 199397, "epoch": 4747} {"train_loss": -7.301387786865234, "global_step": 199398, "epoch": 4747} {"train_loss": -7.343048095703125, "global_step": 199399, "epoch": 4747} {"train_loss": -7.189950942993164, "global_step": 199400, "epoch": 4747} {"train_loss": -7.306788444519043, "global_step": 199401, "epoch": 4747} {"train_loss": -7.305395126342773, "global_step": 199402, "epoch": 4747} {"train_loss": -7.049141883850098, "global_step": 199403, "epoch": 4747} {"train_loss": -7.202966690063477, "global_step": 199404, "epoch": 4747} {"train_loss": -7.366189002990723, "global_step": 199405, "epoch": 4747} {"train_loss": -7.237178802490234, "global_step": 199406, "epoch": 4747} {"train_loss": -7.241554260253906, "global_step": 199407, "epoch": 4747} {"train_loss": -7.290660858154297, "global_step": 199408, "epoch": 4747} {"train_loss": -7.187970161437988, "global_step": 199409, "epoch": 4747} {"train_loss": -7.164772033691406, "global_step": 199410, "epoch": 4747} {"train_loss": -7.272721290588379, "global_step": 199411, "epoch": 4747} {"train_loss": -7.164638519287109, "global_step": 199412, "epoch": 4747} {"train_loss": -7.232173442840576, "global_step": 199413, "epoch": 4747} {"train_loss": -7.284209251403809, "global_step": 199414, "epoch": 4747} {"train_loss": -7.265945695695423, "global_step": 199415, "epoch": 4747, "val_loss": 69857.1640625} {"train_loss": -7.156871318817139, "global_step": 199416, "epoch": 4748} {"train_loss": -7.238030433654785, "global_step": 199417, "epoch": 4748} {"train_loss": -7.273642539978027, "global_step": 199418, "epoch": 4748} {"train_loss": -7.321540355682373, "global_step": 199419, "epoch": 4748} {"train_loss": -7.298645973205566, "global_step": 199420, "epoch": 4748} {"train_loss": -7.359552383422852, "global_step": 199421, "epoch": 4748} {"train_loss": -7.2819108963012695, "global_step": 199422, "epoch": 4748} {"train_loss": -7.115594863891602, "global_step": 199423, "epoch": 4748} {"train_loss": -7.2126336097717285, "global_step": 199424, "epoch": 4748} {"train_loss": -7.297679901123047, "global_step": 199425, "epoch": 4748} {"train_loss": -7.357091903686523, "global_step": 199426, "epoch": 4748} {"train_loss": -7.322181224822998, "global_step": 199427, "epoch": 4748} {"train_loss": -7.3256449699401855, "global_step": 199428, "epoch": 4748} {"train_loss": -7.326794147491455, "global_step": 199429, "epoch": 4748} {"train_loss": -7.2786478996276855, "global_step": 199430, "epoch": 4748} {"train_loss": -7.312139987945557, "global_step": 199431, "epoch": 4748} {"train_loss": -7.354499816894531, "global_step": 199432, "epoch": 4748} {"train_loss": -7.269658088684082, "global_step": 199433, "epoch": 4748} {"train_loss": -7.347795486450195, "global_step": 199434, "epoch": 4748} {"train_loss": -7.339751243591309, "global_step": 199435, "epoch": 4748} {"train_loss": -7.287590503692627, "global_step": 199436, "epoch": 4748} {"train_loss": -7.314327239990234, "global_step": 199437, "epoch": 4748} {"train_loss": -7.258796691894531, "global_step": 199438, "epoch": 4748} {"train_loss": -7.314828872680664, "global_step": 199439, "epoch": 4748} {"train_loss": -7.186942100524902, "global_step": 199440, "epoch": 4748} {"train_loss": -7.218729019165039, "global_step": 199441, "epoch": 4748} {"train_loss": -7.410162925720215, "global_step": 199442, "epoch": 4748} {"train_loss": -7.272719860076904, "global_step": 199443, "epoch": 4748} {"train_loss": -7.292450904846191, "global_step": 199444, "epoch": 4748} {"train_loss": -7.264258861541748, "global_step": 199445, "epoch": 4748} {"train_loss": -7.150250434875488, "global_step": 199446, "epoch": 4748} {"train_loss": -7.413477420806885, "global_step": 199447, "epoch": 4748} {"train_loss": -7.335331916809082, "global_step": 199448, "epoch": 4748} {"train_loss": -7.316467761993408, "global_step": 199449, "epoch": 4748} {"train_loss": -7.269249439239502, "global_step": 199450, "epoch": 4748} {"train_loss": -7.205812454223633, "global_step": 199451, "epoch": 4748} {"train_loss": -7.20741605758667, "global_step": 199452, "epoch": 4748} {"train_loss": -7.299404621124268, "global_step": 199453, "epoch": 4748} {"train_loss": -7.27235221862793, "global_step": 199454, "epoch": 4748} {"train_loss": -7.265399932861328, "global_step": 199455, "epoch": 4748} {"train_loss": -7.170478820800781, "global_step": 199456, "epoch": 4748} {"train_loss": -7.278662068503244, "global_step": 199457, "epoch": 4748, "val_loss": 69956.3515625} {"train_loss": -7.337853908538818, "global_step": 199458, "epoch": 4749} {"train_loss": -7.19932746887207, "global_step": 199459, "epoch": 4749} {"train_loss": -7.390871524810791, "global_step": 199460, "epoch": 4749} {"train_loss": -7.207480430603027, "global_step": 199461, "epoch": 4749} {"train_loss": -7.107856750488281, "global_step": 199462, "epoch": 4749} {"train_loss": -7.164346694946289, "global_step": 199463, "epoch": 4749} {"train_loss": -7.176159858703613, "global_step": 199464, "epoch": 4749} {"train_loss": -7.280309677124023, "global_step": 199465, "epoch": 4749} {"train_loss": -7.170042037963867, "global_step": 199466, "epoch": 4749} {"train_loss": -7.196273326873779, "global_step": 199467, "epoch": 4749} {"train_loss": -7.2371826171875, "global_step": 199468, "epoch": 4749} {"train_loss": -7.141373634338379, "global_step": 199469, "epoch": 4749} {"train_loss": -7.337576866149902, "global_step": 199470, "epoch": 4749} {"train_loss": -7.2195892333984375, "global_step": 199471, "epoch": 4749} {"train_loss": -7.184467792510986, "global_step": 199472, "epoch": 4749} {"train_loss": -7.270633697509766, "global_step": 199473, "epoch": 4749} {"train_loss": -7.219944953918457, "global_step": 199474, "epoch": 4749} {"train_loss": -7.291792869567871, "global_step": 199475, "epoch": 4749} {"train_loss": -7.337368011474609, "global_step": 199476, "epoch": 4749} {"train_loss": -7.342864036560059, "global_step": 199477, "epoch": 4749} {"train_loss": -7.283993244171143, "global_step": 199478, "epoch": 4749} {"train_loss": -7.3119354248046875, "global_step": 199479, "epoch": 4749} {"train_loss": -7.3774919509887695, "global_step": 199480, "epoch": 4749} {"train_loss": -7.391143798828125, "global_step": 199481, "epoch": 4749} {"train_loss": -7.2836103439331055, "global_step": 199482, "epoch": 4749} {"train_loss": -7.270925521850586, "global_step": 199483, "epoch": 4749} {"train_loss": -7.355407238006592, "global_step": 199484, "epoch": 4749} {"train_loss": -7.309615612030029, "global_step": 199485, "epoch": 4749} {"train_loss": -7.236874580383301, "global_step": 199486, "epoch": 4749} {"train_loss": -7.302204132080078, "global_step": 199487, "epoch": 4749} {"train_loss": -7.339196681976318, "global_step": 199488, "epoch": 4749} {"train_loss": -7.18914794921875, "global_step": 199489, "epoch": 4749} {"train_loss": -7.300400733947754, "global_step": 199490, "epoch": 4749} {"train_loss": -7.382122993469238, "global_step": 199491, "epoch": 4749} {"train_loss": -7.174959182739258, "global_step": 199492, "epoch": 4749} {"train_loss": -7.156660556793213, "global_step": 199493, "epoch": 4749} {"train_loss": -7.25225830078125, "global_step": 199494, "epoch": 4749} {"train_loss": -7.300982475280762, "global_step": 199495, "epoch": 4749} {"train_loss": -7.22592306137085, "global_step": 199496, "epoch": 4749} {"train_loss": -7.286884307861328, "global_step": 199497, "epoch": 4749} {"train_loss": -7.287742614746094, "global_step": 199498, "epoch": 4749} {"train_loss": -7.262243202754429, "global_step": 199499, "epoch": 4749, "val_loss": 69846.8359375} {"train_loss": -7.325913429260254, "global_step": 199500, "epoch": 4750} {"train_loss": -7.275694370269775, "global_step": 199501, "epoch": 4750} {"train_loss": -7.24481201171875, "global_step": 199502, "epoch": 4750} {"train_loss": -7.316434860229492, "global_step": 199503, "epoch": 4750} {"train_loss": -7.331431865692139, "global_step": 199504, "epoch": 4750} {"train_loss": -7.301068305969238, "global_step": 199505, "epoch": 4750} {"train_loss": -7.250606060028076, "global_step": 199506, "epoch": 4750} {"train_loss": -7.236575126647949, "global_step": 199507, "epoch": 4750} {"train_loss": -7.3459062576293945, "global_step": 199508, "epoch": 4750} {"train_loss": -7.252107620239258, "global_step": 199509, "epoch": 4750} {"train_loss": -7.229747772216797, "global_step": 199510, "epoch": 4750} {"train_loss": -7.233421325683594, "global_step": 199511, "epoch": 4750} {"train_loss": -7.274524688720703, "global_step": 199512, "epoch": 4750} {"train_loss": -7.251689910888672, "global_step": 199513, "epoch": 4750} {"train_loss": -7.267660617828369, "global_step": 199514, "epoch": 4750} {"train_loss": -7.3198466300964355, "global_step": 199515, "epoch": 4750} {"train_loss": -7.348525047302246, "global_step": 199516, "epoch": 4750} {"train_loss": -7.3008809089660645, "global_step": 199517, "epoch": 4750} {"train_loss": -7.262124061584473, "global_step": 199518, "epoch": 4750} {"train_loss": -7.2862372398376465, "global_step": 199519, "epoch": 4750} {"train_loss": -7.203487873077393, "global_step": 199520, "epoch": 4750} {"train_loss": -7.151391506195068, "global_step": 199521, "epoch": 4750} {"train_loss": -7.351491451263428, "global_step": 199522, "epoch": 4750} {"train_loss": -7.18260383605957, "global_step": 199523, "epoch": 4750} {"train_loss": -7.230014801025391, "global_step": 199524, "epoch": 4750} {"train_loss": -7.211518287658691, "global_step": 199525, "epoch": 4750} {"train_loss": -7.222663879394531, "global_step": 199526, "epoch": 4750} {"train_loss": -7.27861213684082, "global_step": 199527, "epoch": 4750} {"train_loss": -7.389493942260742, "global_step": 199528, "epoch": 4750} {"train_loss": -7.321119785308838, "global_step": 199529, "epoch": 4750} {"train_loss": -7.1570963859558105, "global_step": 199530, "epoch": 4750} {"train_loss": -7.214512825012207, "global_step": 199531, "epoch": 4750} {"train_loss": -7.190219879150391, "global_step": 199532, "epoch": 4750} {"train_loss": -7.2217864990234375, "global_step": 199533, "epoch": 4750} {"train_loss": -7.051303863525391, "global_step": 199534, "epoch": 4750} {"train_loss": -7.183672904968262, "global_step": 199535, "epoch": 4750} {"train_loss": -7.278909683227539, "global_step": 199536, "epoch": 4750} {"train_loss": -7.004007816314697, "global_step": 199537, "epoch": 4750} {"train_loss": -7.145479202270508, "global_step": 199538, "epoch": 4750} {"train_loss": -7.165520668029785, "global_step": 199539, "epoch": 4750} {"train_loss": -7.138592720031738, "global_step": 199540, "epoch": 4750} {"train_loss": -7.240512019111996, "global_step": 199541, "epoch": 4750, "train/sim_max_reward_0": 0.43501054038919834, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.6421008345601054, "train/sim_max_reward_3": 0.3963110717238165, "train/sim_max_reward_4": 0.9898853300469069, "train/sim_max_reward_5": 0.5597487031277444, "test/sim_max_reward_4300000": 0.9512393533653627, "test/sim_max_reward_4300001": 0.6726274292807874, "test/sim_max_reward_4300002": 0.9243874510689294, "test/sim_max_reward_4300003": 0.9603292543589671, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.4156681143758841, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.045127646075307386, "test/sim_max_reward_4300008": 0.899866041502576, "test/sim_max_reward_4300009": 0.9402464557061178, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 0.8203651749118313, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.8427548244561287, "test/sim_max_reward_4300016": 0.7703975405403817, "test/sim_max_reward_4300017": 0.9110959442298109, "test/sim_max_reward_4300018": 0.40039288987274785, "test/sim_max_reward_4300019": 0.22881950562910694, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9039893410581146, "test/sim_max_reward_4300022": 0.9389722592491271, "test/sim_max_reward_4300023": 0.3280568493953967, "test/sim_max_reward_4300024": 0.9554077315386319, "test/sim_max_reward_4300025": 0.9808427083035046, "test/sim_max_reward_4300026": 0.28180207017351955, "test/sim_max_reward_4300027": 0.5791340897114562, "test/sim_max_reward_4300028": 0.9572245444206962, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.10296267998617531, "test/sim_max_reward_4300031": 0.9216880032912623, "test/sim_max_reward_4300032": 0.9803616674531253, "test/sim_max_reward_4300033": 1.0, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.18851856090826466, "test/sim_max_reward_4300036": 0.19934220170285197, "test/sim_max_reward_4300037": 0.9651687591274016, "test/sim_max_reward_4300038": 0.5092971753954404, "test/sim_max_reward_4300039": 0.4612289309177075, "test/sim_max_reward_4300040": 0.36681961203258123, "test/sim_max_reward_4300041": 0.8572269561534804, "test/sim_max_reward_4300042": 0.7141384026436532, "test/sim_max_reward_4300043": 0.05924948261902138, "test/sim_max_reward_4300044": 0.9712236510787702, "test/sim_max_reward_4300045": 0.20062212349028155, "test/sim_max_reward_4300046": 0.8644280229924532, "test/sim_max_reward_4300047": 0.12562678941453026, "test/sim_max_reward_4300048": 0.02503654717099139, "test/sim_max_reward_4300049": 0.29277550164379185, "train/mean_score": 0.670509413307962, "test/mean_score": 0.5706059278411092, "val_loss": 70055.328125} {"train_loss": -7.110964298248291, "global_step": 199542, "epoch": 4751} {"train_loss": -7.221056938171387, "global_step": 199543, "epoch": 4751} {"train_loss": -7.180455207824707, "global_step": 199544, "epoch": 4751} {"train_loss": -7.248468399047852, "global_step": 199545, "epoch": 4751} {"train_loss": -7.1568989753723145, "global_step": 199546, "epoch": 4751} {"train_loss": -7.208956241607666, "global_step": 199547, "epoch": 4751} {"train_loss": -7.220759868621826, "global_step": 199548, "epoch": 4751} {"train_loss": -7.120926856994629, "global_step": 199549, "epoch": 4751} {"train_loss": -7.213263511657715, "global_step": 199550, "epoch": 4751} {"train_loss": -7.090778350830078, "global_step": 199551, "epoch": 4751} {"train_loss": -7.089488506317139, "global_step": 199552, "epoch": 4751} {"train_loss": -7.202141761779785, "global_step": 199553, "epoch": 4751} {"train_loss": -7.228011608123779, "global_step": 199554, "epoch": 4751} {"train_loss": -7.331869125366211, "global_step": 199555, "epoch": 4751} {"train_loss": -7.152650833129883, "global_step": 199556, "epoch": 4751} {"train_loss": -7.164109230041504, "global_step": 199557, "epoch": 4751} {"train_loss": -7.249595642089844, "global_step": 199558, "epoch": 4751} {"train_loss": -7.1357221603393555, "global_step": 199559, "epoch": 4751} {"train_loss": -7.277647972106934, "global_step": 199560, "epoch": 4751} {"train_loss": -7.07867431640625, "global_step": 199561, "epoch": 4751} {"train_loss": -7.28687858581543, "global_step": 199562, "epoch": 4751} {"train_loss": -7.179723739624023, "global_step": 199563, "epoch": 4751} {"train_loss": -7.25620174407959, "global_step": 199564, "epoch": 4751} {"train_loss": -7.270956993103027, "global_step": 199565, "epoch": 4751} {"train_loss": -7.228132247924805, "global_step": 199566, "epoch": 4751} {"train_loss": -7.264368057250977, "global_step": 199567, "epoch": 4751} {"train_loss": -7.2338714599609375, "global_step": 199568, "epoch": 4751} {"train_loss": -7.211330413818359, "global_step": 199569, "epoch": 4751} {"train_loss": -7.205326557159424, "global_step": 199570, "epoch": 4751} {"train_loss": -7.238314628601074, "global_step": 199571, "epoch": 4751} {"train_loss": -7.21503210067749, "global_step": 199572, "epoch": 4751} {"train_loss": -7.224550724029541, "global_step": 199573, "epoch": 4751} {"train_loss": -7.242847442626953, "global_step": 199574, "epoch": 4751} {"train_loss": -7.096321105957031, "global_step": 199575, "epoch": 4751} {"train_loss": -7.231512069702148, "global_step": 199576, "epoch": 4751} {"train_loss": -7.230990886688232, "global_step": 199577, "epoch": 4751} {"train_loss": -7.224538803100586, "global_step": 199578, "epoch": 4751} {"train_loss": -7.207268714904785, "global_step": 199579, "epoch": 4751} {"train_loss": -7.19442081451416, "global_step": 199580, "epoch": 4751} {"train_loss": -7.138518333435059, "global_step": 199581, "epoch": 4751} {"train_loss": -7.049007415771484, "global_step": 199582, "epoch": 4751} {"train_loss": -7.198841503688267, "global_step": 199583, "epoch": 4751, "val_loss": 69978.3046875} {"train_loss": -6.950159072875977, "global_step": 199584, "epoch": 4752} {"train_loss": -7.245443344116211, "global_step": 199585, "epoch": 4752} {"train_loss": -6.997411727905273, "global_step": 199586, "epoch": 4752} {"train_loss": -7.26146125793457, "global_step": 199587, "epoch": 4752} {"train_loss": -7.18064546585083, "global_step": 199588, "epoch": 4752} {"train_loss": -7.261388778686523, "global_step": 199589, "epoch": 4752} {"train_loss": -7.219438552856445, "global_step": 199590, "epoch": 4752} {"train_loss": -7.167198181152344, "global_step": 199591, "epoch": 4752} {"train_loss": -7.210228443145752, "global_step": 199592, "epoch": 4752} {"train_loss": -7.299506187438965, "global_step": 199593, "epoch": 4752} {"train_loss": -7.153167247772217, "global_step": 199594, "epoch": 4752} {"train_loss": -7.231344223022461, "global_step": 199595, "epoch": 4752} {"train_loss": -7.27369499206543, "global_step": 199596, "epoch": 4752} {"train_loss": -7.157712936401367, "global_step": 199597, "epoch": 4752} {"train_loss": -7.176830291748047, "global_step": 199598, "epoch": 4752} {"train_loss": -7.179844856262207, "global_step": 199599, "epoch": 4752} {"train_loss": -7.265773773193359, "global_step": 199600, "epoch": 4752} {"train_loss": -7.258635520935059, "global_step": 199601, "epoch": 4752} {"train_loss": -7.291038513183594, "global_step": 199602, "epoch": 4752} {"train_loss": -7.246414661407471, "global_step": 199603, "epoch": 4752} {"train_loss": -7.188078880310059, "global_step": 199604, "epoch": 4752} {"train_loss": -7.245995044708252, "global_step": 199605, "epoch": 4752} {"train_loss": -7.313526153564453, "global_step": 199606, "epoch": 4752} {"train_loss": -7.322000026702881, "global_step": 199607, "epoch": 4752} {"train_loss": -7.2506890296936035, "global_step": 199608, "epoch": 4752} {"train_loss": -7.263395309448242, "global_step": 199609, "epoch": 4752} {"train_loss": -7.2958903312683105, "global_step": 199610, "epoch": 4752} {"train_loss": -7.231890678405762, "global_step": 199611, "epoch": 4752} {"train_loss": -7.261851787567139, "global_step": 199612, "epoch": 4752} {"train_loss": -7.244959831237793, "global_step": 199613, "epoch": 4752} {"train_loss": -7.274534702301025, "global_step": 199614, "epoch": 4752} {"train_loss": -7.25416898727417, "global_step": 199615, "epoch": 4752} {"train_loss": -7.23659610748291, "global_step": 199616, "epoch": 4752} {"train_loss": -7.199125289916992, "global_step": 199617, "epoch": 4752} {"train_loss": -7.328979015350342, "global_step": 199618, "epoch": 4752} {"train_loss": -7.354211807250977, "global_step": 199619, "epoch": 4752} {"train_loss": -7.198751449584961, "global_step": 199620, "epoch": 4752} {"train_loss": -7.316312789916992, "global_step": 199621, "epoch": 4752} {"train_loss": -7.122584342956543, "global_step": 199622, "epoch": 4752} {"train_loss": -7.323029518127441, "global_step": 199623, "epoch": 4752} {"train_loss": -7.240317344665527, "global_step": 199624, "epoch": 4752} {"train_loss": -7.2334957009270076, "global_step": 199625, "epoch": 4752, "val_loss": 69538.953125} {"train_loss": -7.348822593688965, "global_step": 199626, "epoch": 4753} {"train_loss": -7.274600028991699, "global_step": 199627, "epoch": 4753} {"train_loss": -7.244050979614258, "global_step": 199628, "epoch": 4753} {"train_loss": -7.347623825073242, "global_step": 199629, "epoch": 4753} {"train_loss": -7.424705505371094, "global_step": 199630, "epoch": 4753} {"train_loss": -7.28857421875, "global_step": 199631, "epoch": 4753} {"train_loss": -7.26072883605957, "global_step": 199632, "epoch": 4753} {"train_loss": -7.3004631996154785, "global_step": 199633, "epoch": 4753} {"train_loss": -7.294801712036133, "global_step": 199634, "epoch": 4753} {"train_loss": -7.267935752868652, "global_step": 199635, "epoch": 4753} {"train_loss": -7.301016807556152, "global_step": 199636, "epoch": 4753} {"train_loss": -7.265390396118164, "global_step": 199637, "epoch": 4753} {"train_loss": -7.296153545379639, "global_step": 199638, "epoch": 4753} {"train_loss": -7.408628463745117, "global_step": 199639, "epoch": 4753} {"train_loss": -7.367799282073975, "global_step": 199640, "epoch": 4753} {"train_loss": -7.134859561920166, "global_step": 199641, "epoch": 4753} {"train_loss": -7.323267936706543, "global_step": 199642, "epoch": 4753} {"train_loss": -7.275857925415039, "global_step": 199643, "epoch": 4753} {"train_loss": -7.211179733276367, "global_step": 199644, "epoch": 4753} {"train_loss": -7.271491527557373, "global_step": 199645, "epoch": 4753} {"train_loss": -7.353488922119141, "global_step": 199646, "epoch": 4753} {"train_loss": -7.253943920135498, "global_step": 199647, "epoch": 4753} {"train_loss": -7.2845611572265625, "global_step": 199648, "epoch": 4753} {"train_loss": -7.273807525634766, "global_step": 199649, "epoch": 4753} {"train_loss": -7.412345886230469, "global_step": 199650, "epoch": 4753} {"train_loss": -7.290010929107666, "global_step": 199651, "epoch": 4753} {"train_loss": -7.236701965332031, "global_step": 199652, "epoch": 4753} {"train_loss": -7.1676530838012695, "global_step": 199653, "epoch": 4753} {"train_loss": -7.229987144470215, "global_step": 199654, "epoch": 4753} {"train_loss": -7.243328094482422, "global_step": 199655, "epoch": 4753} {"train_loss": -7.316536903381348, "global_step": 199656, "epoch": 4753} {"train_loss": -7.191498756408691, "global_step": 199657, "epoch": 4753} {"train_loss": -7.13746976852417, "global_step": 199658, "epoch": 4753} {"train_loss": -7.286194324493408, "global_step": 199659, "epoch": 4753} {"train_loss": -7.215713024139404, "global_step": 199660, "epoch": 4753} {"train_loss": -7.215004920959473, "global_step": 199661, "epoch": 4753} {"train_loss": -7.194661617279053, "global_step": 199662, "epoch": 4753} {"train_loss": -7.271117210388184, "global_step": 199663, "epoch": 4753} {"train_loss": -7.319563865661621, "global_step": 199664, "epoch": 4753} {"train_loss": -7.250831127166748, "global_step": 199665, "epoch": 4753} {"train_loss": -7.181546688079834, "global_step": 199666, "epoch": 4753} {"train_loss": -7.272222076143537, "global_step": 199667, "epoch": 4753, "val_loss": 69840.8359375} {"train_loss": -7.280575275421143, "global_step": 199668, "epoch": 4754} {"train_loss": -7.1650896072387695, "global_step": 199669, "epoch": 4754} {"train_loss": -7.188112735748291, "global_step": 199670, "epoch": 4754} {"train_loss": -7.2856035232543945, "global_step": 199671, "epoch": 4754} {"train_loss": -7.181519508361816, "global_step": 199672, "epoch": 4754} {"train_loss": -7.304788589477539, "global_step": 199673, "epoch": 4754} {"train_loss": -7.150809288024902, "global_step": 199674, "epoch": 4754} {"train_loss": -7.329166889190674, "global_step": 199675, "epoch": 4754} {"train_loss": -7.201582908630371, "global_step": 199676, "epoch": 4754} {"train_loss": -7.218846321105957, "global_step": 199677, "epoch": 4754} {"train_loss": -7.094364166259766, "global_step": 199678, "epoch": 4754} {"train_loss": -7.204713344573975, "global_step": 199679, "epoch": 4754} {"train_loss": -7.28431510925293, "global_step": 199680, "epoch": 4754} {"train_loss": -7.217401027679443, "global_step": 199681, "epoch": 4754} {"train_loss": -7.310503959655762, "global_step": 199682, "epoch": 4754} {"train_loss": -7.311603546142578, "global_step": 199683, "epoch": 4754} {"train_loss": -7.275368690490723, "global_step": 199684, "epoch": 4754} {"train_loss": -7.271458625793457, "global_step": 199685, "epoch": 4754} {"train_loss": -7.24131965637207, "global_step": 199686, "epoch": 4754} {"train_loss": -7.183391571044922, "global_step": 199687, "epoch": 4754} {"train_loss": -7.21814489364624, "global_step": 199688, "epoch": 4754} {"train_loss": -7.2330121994018555, "global_step": 199689, "epoch": 4754} {"train_loss": -7.229405403137207, "global_step": 199690, "epoch": 4754} {"train_loss": -7.296483993530273, "global_step": 199691, "epoch": 4754} {"train_loss": -7.214487075805664, "global_step": 199692, "epoch": 4754} {"train_loss": -7.260220050811768, "global_step": 199693, "epoch": 4754} {"train_loss": -7.2794036865234375, "global_step": 199694, "epoch": 4754} {"train_loss": -7.21415376663208, "global_step": 199695, "epoch": 4754} {"train_loss": -7.237707138061523, "global_step": 199696, "epoch": 4754} {"train_loss": -7.3336873054504395, "global_step": 199697, "epoch": 4754} {"train_loss": -7.319518089294434, "global_step": 199698, "epoch": 4754} {"train_loss": -7.260952949523926, "global_step": 199699, "epoch": 4754} {"train_loss": -7.222768783569336, "global_step": 199700, "epoch": 4754} {"train_loss": -7.134559631347656, "global_step": 199701, "epoch": 4754} {"train_loss": -7.366749286651611, "global_step": 199702, "epoch": 4754} {"train_loss": -7.229537010192871, "global_step": 199703, "epoch": 4754} {"train_loss": -7.190474510192871, "global_step": 199704, "epoch": 4754} {"train_loss": -7.411948204040527, "global_step": 199705, "epoch": 4754} {"train_loss": -7.1916351318359375, "global_step": 199706, "epoch": 4754} {"train_loss": -7.283806800842285, "global_step": 199707, "epoch": 4754} {"train_loss": -7.250771522521973, "global_step": 199708, "epoch": 4754} {"train_loss": -7.245433364595685, "global_step": 199709, "epoch": 4754, "val_loss": 70102.6796875} {"train_loss": -7.197068214416504, "global_step": 199710, "epoch": 4755} {"train_loss": -7.122253894805908, "global_step": 199711, "epoch": 4755} {"train_loss": -7.139809608459473, "global_step": 199712, "epoch": 4755} {"train_loss": -7.301365852355957, "global_step": 199713, "epoch": 4755} {"train_loss": -7.1574883460998535, "global_step": 199714, "epoch": 4755} {"train_loss": -7.174295425415039, "global_step": 199715, "epoch": 4755} {"train_loss": -7.346332550048828, "global_step": 199716, "epoch": 4755} {"train_loss": -7.118398666381836, "global_step": 199717, "epoch": 4755} {"train_loss": -7.3692731857299805, "global_step": 199718, "epoch": 4755} {"train_loss": -7.284261226654053, "global_step": 199719, "epoch": 4755} {"train_loss": -7.210484504699707, "global_step": 199720, "epoch": 4755} {"train_loss": -7.266554832458496, "global_step": 199721, "epoch": 4755} {"train_loss": -7.215419769287109, "global_step": 199722, "epoch": 4755} {"train_loss": -7.10993766784668, "global_step": 199723, "epoch": 4755} {"train_loss": -7.206302642822266, "global_step": 199724, "epoch": 4755} {"train_loss": -7.131769180297852, "global_step": 199725, "epoch": 4755} {"train_loss": -7.1911492347717285, "global_step": 199726, "epoch": 4755} {"train_loss": -7.202508926391602, "global_step": 199727, "epoch": 4755} {"train_loss": -7.178415775299072, "global_step": 199728, "epoch": 4755} {"train_loss": -7.190114498138428, "global_step": 199729, "epoch": 4755} {"train_loss": -7.151610851287842, "global_step": 199730, "epoch": 4755} {"train_loss": -7.222873210906982, "global_step": 199731, "epoch": 4755} {"train_loss": -7.182642459869385, "global_step": 199732, "epoch": 4755} {"train_loss": -7.204290390014648, "global_step": 199733, "epoch": 4755} {"train_loss": -7.102296352386475, "global_step": 199734, "epoch": 4755} {"train_loss": -7.204301834106445, "global_step": 199735, "epoch": 4755} {"train_loss": -7.109130859375, "global_step": 199736, "epoch": 4755} {"train_loss": -7.234745979309082, "global_step": 199737, "epoch": 4755} {"train_loss": -7.12739372253418, "global_step": 199738, "epoch": 4755} {"train_loss": -7.1776442527771, "global_step": 199739, "epoch": 4755} {"train_loss": -7.216860294342041, "global_step": 199740, "epoch": 4755} {"train_loss": -7.107956886291504, "global_step": 199741, "epoch": 4755} {"train_loss": -7.184041976928711, "global_step": 199742, "epoch": 4755} {"train_loss": -7.164955139160156, "global_step": 199743, "epoch": 4755} {"train_loss": -7.218781471252441, "global_step": 199744, "epoch": 4755} {"train_loss": -7.191840648651123, "global_step": 199745, "epoch": 4755} {"train_loss": -7.209778308868408, "global_step": 199746, "epoch": 4755} {"train_loss": -7.312390327453613, "global_step": 199747, "epoch": 4755} {"train_loss": -7.2890729904174805, "global_step": 199748, "epoch": 4755} {"train_loss": -7.233685493469238, "global_step": 199749, "epoch": 4755} {"train_loss": -7.325990676879883, "global_step": 199750, "epoch": 4755} {"train_loss": -7.204604080745152, "global_step": 199751, "epoch": 4755, "val_loss": 69713.3359375} {"train_loss": -7.267600059509277, "global_step": 199752, "epoch": 4756} {"train_loss": -7.248062610626221, "global_step": 199753, "epoch": 4756} {"train_loss": -7.2344818115234375, "global_step": 199754, "epoch": 4756} {"train_loss": -7.290193557739258, "global_step": 199755, "epoch": 4756} {"train_loss": -7.245184421539307, "global_step": 199756, "epoch": 4756} {"train_loss": -7.287574291229248, "global_step": 199757, "epoch": 4756} {"train_loss": -7.244325637817383, "global_step": 199758, "epoch": 4756} {"train_loss": -7.215649127960205, "global_step": 199759, "epoch": 4756} {"train_loss": -7.17824649810791, "global_step": 199760, "epoch": 4756} {"train_loss": -7.269510269165039, "global_step": 199761, "epoch": 4756} {"train_loss": -7.248249053955078, "global_step": 199762, "epoch": 4756} {"train_loss": -7.3815155029296875, "global_step": 199763, "epoch": 4756} {"train_loss": -7.197437286376953, "global_step": 199764, "epoch": 4756} {"train_loss": -7.308836936950684, "global_step": 199765, "epoch": 4756} {"train_loss": -7.229362964630127, "global_step": 199766, "epoch": 4756} {"train_loss": -7.25528621673584, "global_step": 199767, "epoch": 4756} {"train_loss": -7.330556392669678, "global_step": 199768, "epoch": 4756} {"train_loss": -7.1758575439453125, "global_step": 199769, "epoch": 4756} {"train_loss": -7.352840423583984, "global_step": 199770, "epoch": 4756} {"train_loss": -7.367173194885254, "global_step": 199771, "epoch": 4756} {"train_loss": -7.230040550231934, "global_step": 199772, "epoch": 4756} {"train_loss": -7.287644386291504, "global_step": 199773, "epoch": 4756} {"train_loss": -7.372865676879883, "global_step": 199774, "epoch": 4756} {"train_loss": -7.25580358505249, "global_step": 199775, "epoch": 4756} {"train_loss": -7.35114049911499, "global_step": 199776, "epoch": 4756} {"train_loss": -7.211489677429199, "global_step": 199777, "epoch": 4756} {"train_loss": -7.243203163146973, "global_step": 199778, "epoch": 4756} {"train_loss": -7.237687110900879, "global_step": 199779, "epoch": 4756} {"train_loss": -7.323075294494629, "global_step": 199780, "epoch": 4756} {"train_loss": -7.254426956176758, "global_step": 199781, "epoch": 4756} {"train_loss": -7.259927749633789, "global_step": 199782, "epoch": 4756} {"train_loss": -7.235024929046631, "global_step": 199783, "epoch": 4756} {"train_loss": -7.158495903015137, "global_step": 199784, "epoch": 4756} {"train_loss": -7.2302398681640625, "global_step": 199785, "epoch": 4756} {"train_loss": -7.389739036560059, "global_step": 199786, "epoch": 4756} {"train_loss": -7.232051849365234, "global_step": 199787, "epoch": 4756} {"train_loss": -7.217874050140381, "global_step": 199788, "epoch": 4756} {"train_loss": -7.2583794593811035, "global_step": 199789, "epoch": 4756} {"train_loss": -7.245720863342285, "global_step": 199790, "epoch": 4756} {"train_loss": -7.330499649047852, "global_step": 199791, "epoch": 4756} {"train_loss": -7.23493766784668, "global_step": 199792, "epoch": 4756} {"train_loss": -7.267282962799072, "global_step": 199793, "epoch": 4756, "val_loss": 69898.109375} {"train_loss": -7.285240173339844, "global_step": 199794, "epoch": 4757} {"train_loss": -7.408662796020508, "global_step": 199795, "epoch": 4757} {"train_loss": -7.2453460693359375, "global_step": 199796, "epoch": 4757} {"train_loss": -7.2942633628845215, "global_step": 199797, "epoch": 4757} {"train_loss": -7.182720184326172, "global_step": 199798, "epoch": 4757} {"train_loss": -7.2595133781433105, "global_step": 199799, "epoch": 4757} {"train_loss": -7.145792484283447, "global_step": 199800, "epoch": 4757} {"train_loss": -7.220084190368652, "global_step": 199801, "epoch": 4757} {"train_loss": -7.396509170532227, "global_step": 199802, "epoch": 4757} {"train_loss": -7.256648063659668, "global_step": 199803, "epoch": 4757} {"train_loss": -7.293368339538574, "global_step": 199804, "epoch": 4757} {"train_loss": -7.216865539550781, "global_step": 199805, "epoch": 4757} {"train_loss": -7.272095680236816, "global_step": 199806, "epoch": 4757} {"train_loss": -7.258584022521973, "global_step": 199807, "epoch": 4757} {"train_loss": -7.318615913391113, "global_step": 199808, "epoch": 4757} {"train_loss": -7.341106414794922, "global_step": 199809, "epoch": 4757} {"train_loss": -7.3116254806518555, "global_step": 199810, "epoch": 4757} {"train_loss": -7.188600540161133, "global_step": 199811, "epoch": 4757} {"train_loss": -7.294239521026611, "global_step": 199812, "epoch": 4757} {"train_loss": -7.290400505065918, "global_step": 199813, "epoch": 4757} {"train_loss": -7.283536911010742, "global_step": 199814, "epoch": 4757} {"train_loss": -7.32879638671875, "global_step": 199815, "epoch": 4757} {"train_loss": -7.276273250579834, "global_step": 199816, "epoch": 4757} {"train_loss": -7.264632225036621, "global_step": 199817, "epoch": 4757} {"train_loss": -7.026270866394043, "global_step": 199818, "epoch": 4757} {"train_loss": -7.178729057312012, "global_step": 199819, "epoch": 4757} {"train_loss": -7.228401184082031, "global_step": 199820, "epoch": 4757} {"train_loss": -7.154420852661133, "global_step": 199821, "epoch": 4757} {"train_loss": -7.198857307434082, "global_step": 199822, "epoch": 4757} {"train_loss": -7.160554885864258, "global_step": 199823, "epoch": 4757} {"train_loss": -7.137588024139404, "global_step": 199824, "epoch": 4757} {"train_loss": -7.2828779220581055, "global_step": 199825, "epoch": 4757} {"train_loss": -7.189897060394287, "global_step": 199826, "epoch": 4757} {"train_loss": -7.272172927856445, "global_step": 199827, "epoch": 4757} {"train_loss": -7.182705879211426, "global_step": 199828, "epoch": 4757} {"train_loss": -7.266565322875977, "global_step": 199829, "epoch": 4757} {"train_loss": -7.311848163604736, "global_step": 199830, "epoch": 4757} {"train_loss": -7.269478797912598, "global_step": 199831, "epoch": 4757} {"train_loss": -7.321105480194092, "global_step": 199832, "epoch": 4757} {"train_loss": -7.275189399719238, "global_step": 199833, "epoch": 4757} {"train_loss": -7.225527763366699, "global_step": 199834, "epoch": 4757} {"train_loss": -7.252151909328642, "global_step": 199835, "epoch": 4757, "val_loss": 69715.6953125} {"train_loss": -7.271266460418701, "global_step": 199836, "epoch": 4758} {"train_loss": -7.344662666320801, "global_step": 199837, "epoch": 4758} {"train_loss": -7.203099727630615, "global_step": 199838, "epoch": 4758} {"train_loss": -7.20681095123291, "global_step": 199839, "epoch": 4758} {"train_loss": -7.246479511260986, "global_step": 199840, "epoch": 4758} {"train_loss": -7.2391557693481445, "global_step": 199841, "epoch": 4758} {"train_loss": -7.228252410888672, "global_step": 199842, "epoch": 4758} {"train_loss": -7.18410587310791, "global_step": 199843, "epoch": 4758} {"train_loss": -7.241645812988281, "global_step": 199844, "epoch": 4758} {"train_loss": -7.359663009643555, "global_step": 199845, "epoch": 4758} {"train_loss": -7.186395645141602, "global_step": 199846, "epoch": 4758} {"train_loss": -7.288941383361816, "global_step": 199847, "epoch": 4758} {"train_loss": -7.333977222442627, "global_step": 199848, "epoch": 4758} {"train_loss": -7.241718769073486, "global_step": 199849, "epoch": 4758} {"train_loss": -7.359724044799805, "global_step": 199850, "epoch": 4758} {"train_loss": -7.218419075012207, "global_step": 199851, "epoch": 4758} {"train_loss": -7.170600891113281, "global_step": 199852, "epoch": 4758} {"train_loss": -7.20351505279541, "global_step": 199853, "epoch": 4758} {"train_loss": -7.214759349822998, "global_step": 199854, "epoch": 4758} {"train_loss": -7.2048163414001465, "global_step": 199855, "epoch": 4758} {"train_loss": -7.274344444274902, "global_step": 199856, "epoch": 4758} {"train_loss": -7.23887825012207, "global_step": 199857, "epoch": 4758} {"train_loss": -7.199796676635742, "global_step": 199858, "epoch": 4758} {"train_loss": -7.241152286529541, "global_step": 199859, "epoch": 4758} {"train_loss": -7.349071979522705, "global_step": 199860, "epoch": 4758} {"train_loss": -7.310418605804443, "global_step": 199861, "epoch": 4758} {"train_loss": -7.226064682006836, "global_step": 199862, "epoch": 4758} {"train_loss": -7.258279323577881, "global_step": 199863, "epoch": 4758} {"train_loss": -7.29209041595459, "global_step": 199864, "epoch": 4758} {"train_loss": -7.312857151031494, "global_step": 199865, "epoch": 4758} {"train_loss": -7.15452241897583, "global_step": 199866, "epoch": 4758} {"train_loss": -7.270707130432129, "global_step": 199867, "epoch": 4758} {"train_loss": -7.332379341125488, "global_step": 199868, "epoch": 4758} {"train_loss": -7.232776165008545, "global_step": 199869, "epoch": 4758} {"train_loss": -7.393157005310059, "global_step": 199870, "epoch": 4758} {"train_loss": -7.280346870422363, "global_step": 199871, "epoch": 4758} {"train_loss": -7.2580060958862305, "global_step": 199872, "epoch": 4758} {"train_loss": -7.239591121673584, "global_step": 199873, "epoch": 4758} {"train_loss": -7.340542793273926, "global_step": 199874, "epoch": 4758} {"train_loss": -7.281350612640381, "global_step": 199875, "epoch": 4758} {"train_loss": -7.381776809692383, "global_step": 199876, "epoch": 4758} {"train_loss": -7.2649335861206055, "global_step": 199877, "epoch": 4758, "val_loss": 69765.875} {"train_loss": -7.41432523727417, "global_step": 199878, "epoch": 4759} {"train_loss": -7.280636787414551, "global_step": 199879, "epoch": 4759} {"train_loss": -7.333770275115967, "global_step": 199880, "epoch": 4759} {"train_loss": -7.276226043701172, "global_step": 199881, "epoch": 4759} {"train_loss": -7.242353439331055, "global_step": 199882, "epoch": 4759} {"train_loss": -7.222947597503662, "global_step": 199883, "epoch": 4759} {"train_loss": -7.294356346130371, "global_step": 199884, "epoch": 4759} {"train_loss": -7.208839416503906, "global_step": 199885, "epoch": 4759} {"train_loss": -7.292006492614746, "global_step": 199886, "epoch": 4759} {"train_loss": -7.179255962371826, "global_step": 199887, "epoch": 4759} {"train_loss": -7.308879852294922, "global_step": 199888, "epoch": 4759} {"train_loss": -7.393418312072754, "global_step": 199889, "epoch": 4759} {"train_loss": -7.270807266235352, "global_step": 199890, "epoch": 4759} {"train_loss": -7.280642986297607, "global_step": 199891, "epoch": 4759} {"train_loss": -7.224112033843994, "global_step": 199892, "epoch": 4759} {"train_loss": -7.340443134307861, "global_step": 199893, "epoch": 4759} {"train_loss": -7.221566200256348, "global_step": 199894, "epoch": 4759} {"train_loss": -7.233620643615723, "global_step": 199895, "epoch": 4759} {"train_loss": -7.266397476196289, "global_step": 199896, "epoch": 4759} {"train_loss": -7.204488754272461, "global_step": 199897, "epoch": 4759} {"train_loss": -7.177852630615234, "global_step": 199898, "epoch": 4759} {"train_loss": -7.255281448364258, "global_step": 199899, "epoch": 4759} {"train_loss": -7.056597709655762, "global_step": 199900, "epoch": 4759} {"train_loss": -7.158534049987793, "global_step": 199901, "epoch": 4759} {"train_loss": -7.3875732421875, "global_step": 199902, "epoch": 4759} {"train_loss": -7.066644668579102, "global_step": 199903, "epoch": 4759} {"train_loss": -7.2276291847229, "global_step": 199904, "epoch": 4759} {"train_loss": -7.161040306091309, "global_step": 199905, "epoch": 4759} {"train_loss": -7.209220886230469, "global_step": 199906, "epoch": 4759} {"train_loss": -7.264734268188477, "global_step": 199907, "epoch": 4759} {"train_loss": -7.329588890075684, "global_step": 199908, "epoch": 4759} {"train_loss": -7.251955032348633, "global_step": 199909, "epoch": 4759} {"train_loss": -7.188808441162109, "global_step": 199910, "epoch": 4759} {"train_loss": -7.292684555053711, "global_step": 199911, "epoch": 4759} {"train_loss": -7.253922462463379, "global_step": 199912, "epoch": 4759} {"train_loss": -7.331333637237549, "global_step": 199913, "epoch": 4759} {"train_loss": -7.148232936859131, "global_step": 199914, "epoch": 4759} {"train_loss": -7.222718238830566, "global_step": 199915, "epoch": 4759} {"train_loss": -7.257484436035156, "global_step": 199916, "epoch": 4759} {"train_loss": -7.131312847137451, "global_step": 199917, "epoch": 4759} {"train_loss": -7.140181064605713, "global_step": 199918, "epoch": 4759} {"train_loss": -7.24513198080517, "global_step": 199919, "epoch": 4759, "val_loss": 69821.6875} {"train_loss": -7.2554521560668945, "global_step": 199920, "epoch": 4760} {"train_loss": -7.206036567687988, "global_step": 199921, "epoch": 4760} {"train_loss": -7.31695556640625, "global_step": 199922, "epoch": 4760} {"train_loss": -7.297039031982422, "global_step": 199923, "epoch": 4760} {"train_loss": -7.198464393615723, "global_step": 199924, "epoch": 4760} {"train_loss": -7.2042236328125, "global_step": 199925, "epoch": 4760} {"train_loss": -7.369659423828125, "global_step": 199926, "epoch": 4760} {"train_loss": -7.2361602783203125, "global_step": 199927, "epoch": 4760} {"train_loss": -7.22650146484375, "global_step": 199928, "epoch": 4760} {"train_loss": -7.2352094650268555, "global_step": 199929, "epoch": 4760} {"train_loss": -7.190464019775391, "global_step": 199930, "epoch": 4760} {"train_loss": -7.323447227478027, "global_step": 199931, "epoch": 4760} {"train_loss": -7.2417826652526855, "global_step": 199932, "epoch": 4760} {"train_loss": -7.358334541320801, "global_step": 199933, "epoch": 4760} {"train_loss": -7.275673866271973, "global_step": 199934, "epoch": 4760} {"train_loss": -7.395333290100098, "global_step": 199935, "epoch": 4760} {"train_loss": -7.354340553283691, "global_step": 199936, "epoch": 4760} {"train_loss": -7.239312648773193, "global_step": 199937, "epoch": 4760} {"train_loss": -7.308313369750977, "global_step": 199938, "epoch": 4760} {"train_loss": -7.351865768432617, "global_step": 199939, "epoch": 4760} {"train_loss": -7.420172691345215, "global_step": 199940, "epoch": 4760} {"train_loss": -7.373307228088379, "global_step": 199941, "epoch": 4760} {"train_loss": -7.329869270324707, "global_step": 199942, "epoch": 4760} {"train_loss": -7.378506660461426, "global_step": 199943, "epoch": 4760} {"train_loss": -7.302294731140137, "global_step": 199944, "epoch": 4760} {"train_loss": -7.36333703994751, "global_step": 199945, "epoch": 4760} {"train_loss": -7.291816234588623, "global_step": 199946, "epoch": 4760} {"train_loss": -7.301540851593018, "global_step": 199947, "epoch": 4760} {"train_loss": -7.324045181274414, "global_step": 199948, "epoch": 4760} {"train_loss": -7.28870964050293, "global_step": 199949, "epoch": 4760} {"train_loss": -7.350970268249512, "global_step": 199950, "epoch": 4760} {"train_loss": -7.393385887145996, "global_step": 199951, "epoch": 4760} {"train_loss": -7.321030616760254, "global_step": 199952, "epoch": 4760} {"train_loss": -7.167933464050293, "global_step": 199953, "epoch": 4760} {"train_loss": -7.328383445739746, "global_step": 199954, "epoch": 4760} {"train_loss": -7.399045467376709, "global_step": 199955, "epoch": 4760} {"train_loss": -7.197347640991211, "global_step": 199956, "epoch": 4760} {"train_loss": -7.24403190612793, "global_step": 199957, "epoch": 4760} {"train_loss": -7.306770324707031, "global_step": 199958, "epoch": 4760} {"train_loss": -7.360970497131348, "global_step": 199959, "epoch": 4760} {"train_loss": -7.345563888549805, "global_step": 199960, "epoch": 4760} {"train_loss": -7.302237839925857, "global_step": 199961, "epoch": 4760, "val_loss": 69991.046875} {"train_loss": -7.239986419677734, "global_step": 199962, "epoch": 4761} {"train_loss": -7.378167152404785, "global_step": 199963, "epoch": 4761} {"train_loss": -7.360419750213623, "global_step": 199964, "epoch": 4761} {"train_loss": -7.204815864562988, "global_step": 199965, "epoch": 4761} {"train_loss": -7.375335693359375, "global_step": 199966, "epoch": 4761} {"train_loss": -7.3898844718933105, "global_step": 199967, "epoch": 4761} {"train_loss": -7.288606643676758, "global_step": 199968, "epoch": 4761} {"train_loss": -7.313187599182129, "global_step": 199969, "epoch": 4761} {"train_loss": -7.373129844665527, "global_step": 199970, "epoch": 4761} {"train_loss": -7.267417907714844, "global_step": 199971, "epoch": 4761} {"train_loss": -7.3082275390625, "global_step": 199972, "epoch": 4761} {"train_loss": -7.078176975250244, "global_step": 199973, "epoch": 4761} {"train_loss": -7.206085205078125, "global_step": 199974, "epoch": 4761} {"train_loss": -7.250822067260742, "global_step": 199975, "epoch": 4761} {"train_loss": -7.18343448638916, "global_step": 199976, "epoch": 4761} {"train_loss": -7.277164936065674, "global_step": 199977, "epoch": 4761} {"train_loss": -7.15467643737793, "global_step": 199978, "epoch": 4761} {"train_loss": -7.275769233703613, "global_step": 199979, "epoch": 4761} {"train_loss": -7.235542297363281, "global_step": 199980, "epoch": 4761} {"train_loss": -7.141902923583984, "global_step": 199981, "epoch": 4761} {"train_loss": -7.274578094482422, "global_step": 199982, "epoch": 4761} {"train_loss": -7.162458419799805, "global_step": 199983, "epoch": 4761} {"train_loss": -7.234903335571289, "global_step": 199984, "epoch": 4761} {"train_loss": -7.213350296020508, "global_step": 199985, "epoch": 4761} {"train_loss": -7.164335250854492, "global_step": 199986, "epoch": 4761} {"train_loss": -7.178067207336426, "global_step": 199987, "epoch": 4761} {"train_loss": -7.195237159729004, "global_step": 199988, "epoch": 4761} {"train_loss": -7.137992858886719, "global_step": 199989, "epoch": 4761} {"train_loss": -7.251157760620117, "global_step": 199990, "epoch": 4761} {"train_loss": -7.273578643798828, "global_step": 199991, "epoch": 4761} {"train_loss": -7.228285789489746, "global_step": 199992, "epoch": 4761} {"train_loss": -7.34470272064209, "global_step": 199993, "epoch": 4761} {"train_loss": -7.202357292175293, "global_step": 199994, "epoch": 4761} {"train_loss": -7.238066673278809, "global_step": 199995, "epoch": 4761} {"train_loss": -7.226473808288574, "global_step": 199996, "epoch": 4761} {"train_loss": -7.2822747230529785, "global_step": 199997, "epoch": 4761} {"train_loss": -7.308999061584473, "global_step": 199998, "epoch": 4761} {"train_loss": -7.314138889312744, "global_step": 199999, "epoch": 4761} {"train_loss": -7.223149299621582, "global_step": 200000, "epoch": 4761} {"train_loss": -7.325473308563232, "global_step": 200001, "epoch": 4761} {"train_loss": -7.230040550231934, "global_step": 200002, "epoch": 4761} {"train_loss": -7.251346429189046, "global_step": 200003, "epoch": 4761, "val_loss": 69897.140625} {"train_loss": -7.220922470092773, "global_step": 200004, "epoch": 4762} {"train_loss": -7.297413349151611, "global_step": 200005, "epoch": 4762} {"train_loss": -7.320389747619629, "global_step": 200006, "epoch": 4762} {"train_loss": -7.253812789916992, "global_step": 200007, "epoch": 4762} {"train_loss": -7.3031415939331055, "global_step": 200008, "epoch": 4762} {"train_loss": -7.212869167327881, "global_step": 200009, "epoch": 4762} {"train_loss": -7.175931930541992, "global_step": 200010, "epoch": 4762} {"train_loss": -7.17759895324707, "global_step": 200011, "epoch": 4762} {"train_loss": -7.134561061859131, "global_step": 200012, "epoch": 4762} {"train_loss": -7.299680709838867, "global_step": 200013, "epoch": 4762} {"train_loss": -7.126086235046387, "global_step": 200014, "epoch": 4762} {"train_loss": -7.187477111816406, "global_step": 200015, "epoch": 4762} {"train_loss": -7.184554576873779, "global_step": 200016, "epoch": 4762} {"train_loss": -7.08443546295166, "global_step": 200017, "epoch": 4762} {"train_loss": -7.2806806564331055, "global_step": 200018, "epoch": 4762} {"train_loss": -7.1186981201171875, "global_step": 200019, "epoch": 4762} {"train_loss": -7.2151265144348145, "global_step": 200020, "epoch": 4762} {"train_loss": -7.195357799530029, "global_step": 200021, "epoch": 4762} {"train_loss": -7.125755786895752, "global_step": 200022, "epoch": 4762} {"train_loss": -7.159976005554199, "global_step": 200023, "epoch": 4762} {"train_loss": -7.0050482749938965, "global_step": 200024, "epoch": 4762} {"train_loss": -7.2125115394592285, "global_step": 200025, "epoch": 4762} {"train_loss": -7.115176677703857, "global_step": 200026, "epoch": 4762} {"train_loss": -7.227892875671387, "global_step": 200027, "epoch": 4762} {"train_loss": -7.1560211181640625, "global_step": 200028, "epoch": 4762} {"train_loss": -7.13664436340332, "global_step": 200029, "epoch": 4762} {"train_loss": -7.161276817321777, "global_step": 200030, "epoch": 4762} {"train_loss": -7.174983024597168, "global_step": 200031, "epoch": 4762} {"train_loss": -7.153984069824219, "global_step": 200032, "epoch": 4762} {"train_loss": -7.145245552062988, "global_step": 200033, "epoch": 4762} {"train_loss": -7.177125453948975, "global_step": 200034, "epoch": 4762} {"train_loss": -7.140048980712891, "global_step": 200035, "epoch": 4762} {"train_loss": -7.151214122772217, "global_step": 200036, "epoch": 4762} {"train_loss": -7.018796443939209, "global_step": 200037, "epoch": 4762} {"train_loss": -7.35188102722168, "global_step": 200038, "epoch": 4762} {"train_loss": -7.1254472732543945, "global_step": 200039, "epoch": 4762} {"train_loss": -7.104143142700195, "global_step": 200040, "epoch": 4762} {"train_loss": -7.164640426635742, "global_step": 200041, "epoch": 4762} {"train_loss": -7.116158485412598, "global_step": 200042, "epoch": 4762} {"train_loss": -7.17778205871582, "global_step": 200043, "epoch": 4762} {"train_loss": -7.164918899536133, "global_step": 200044, "epoch": 4762} {"train_loss": -7.176093805403936, "global_step": 200045, "epoch": 4762, "val_loss": 69733.28125} {"train_loss": -7.126691818237305, "global_step": 200046, "epoch": 4763} {"train_loss": -7.157649517059326, "global_step": 200047, "epoch": 4763} {"train_loss": -7.320598602294922, "global_step": 200048, "epoch": 4763} {"train_loss": -7.253950119018555, "global_step": 200049, "epoch": 4763} {"train_loss": -7.2850775718688965, "global_step": 200050, "epoch": 4763} {"train_loss": -7.335856914520264, "global_step": 200051, "epoch": 4763} {"train_loss": -7.287377834320068, "global_step": 200052, "epoch": 4763} {"train_loss": -7.163358688354492, "global_step": 200053, "epoch": 4763} {"train_loss": -7.17521858215332, "global_step": 200054, "epoch": 4763} {"train_loss": -7.269583702087402, "global_step": 200055, "epoch": 4763} {"train_loss": -7.368043899536133, "global_step": 200056, "epoch": 4763} {"train_loss": -7.125339031219482, "global_step": 200057, "epoch": 4763} {"train_loss": -7.306883811950684, "global_step": 200058, "epoch": 4763} {"train_loss": -7.261651515960693, "global_step": 200059, "epoch": 4763} {"train_loss": -7.261770248413086, "global_step": 200060, "epoch": 4763} {"train_loss": -7.249255180358887, "global_step": 200061, "epoch": 4763} {"train_loss": -7.2508392333984375, "global_step": 200062, "epoch": 4763} {"train_loss": -7.286696434020996, "global_step": 200063, "epoch": 4763} {"train_loss": -7.2829999923706055, "global_step": 200064, "epoch": 4763} {"train_loss": -7.326540470123291, "global_step": 200065, "epoch": 4763} {"train_loss": -7.182028770446777, "global_step": 200066, "epoch": 4763} {"train_loss": -7.288759231567383, "global_step": 200067, "epoch": 4763} {"train_loss": -7.109248161315918, "global_step": 200068, "epoch": 4763} {"train_loss": -7.2033371925354, "global_step": 200069, "epoch": 4763} {"train_loss": -7.223677158355713, "global_step": 200070, "epoch": 4763} {"train_loss": -7.040397644042969, "global_step": 200071, "epoch": 4763} {"train_loss": -7.14019775390625, "global_step": 200072, "epoch": 4763} {"train_loss": -7.285948753356934, "global_step": 200073, "epoch": 4763} {"train_loss": -6.895339488983154, "global_step": 200074, "epoch": 4763} {"train_loss": -7.184289932250977, "global_step": 200075, "epoch": 4763} {"train_loss": -7.101691246032715, "global_step": 200076, "epoch": 4763} {"train_loss": -7.156912803649902, "global_step": 200077, "epoch": 4763} {"train_loss": -7.200909614562988, "global_step": 200078, "epoch": 4763} {"train_loss": -7.092188835144043, "global_step": 200079, "epoch": 4763} {"train_loss": -7.128145217895508, "global_step": 200080, "epoch": 4763} {"train_loss": -7.229230880737305, "global_step": 200081, "epoch": 4763} {"train_loss": -7.106268882751465, "global_step": 200082, "epoch": 4763} {"train_loss": -7.217751979827881, "global_step": 200083, "epoch": 4763} {"train_loss": -7.020998001098633, "global_step": 200084, "epoch": 4763} {"train_loss": -7.100876808166504, "global_step": 200085, "epoch": 4763} {"train_loss": -7.203824520111084, "global_step": 200086, "epoch": 4763} {"train_loss": -7.199090049380348, "global_step": 200087, "epoch": 4763, "val_loss": 70094.125} {"train_loss": -7.067955017089844, "global_step": 200088, "epoch": 4764} {"train_loss": -7.257867336273193, "global_step": 200089, "epoch": 4764} {"train_loss": -7.20447301864624, "global_step": 200090, "epoch": 4764} {"train_loss": -7.166632652282715, "global_step": 200091, "epoch": 4764} {"train_loss": -7.206104755401611, "global_step": 200092, "epoch": 4764} {"train_loss": -7.301943778991699, "global_step": 200093, "epoch": 4764} {"train_loss": -7.135821342468262, "global_step": 200094, "epoch": 4764} {"train_loss": -7.208070755004883, "global_step": 200095, "epoch": 4764} {"train_loss": -7.250012397766113, "global_step": 200096, "epoch": 4764} {"train_loss": -7.279313087463379, "global_step": 200097, "epoch": 4764} {"train_loss": -7.311056137084961, "global_step": 200098, "epoch": 4764} {"train_loss": -7.1337080001831055, "global_step": 200099, "epoch": 4764} {"train_loss": -7.245705604553223, "global_step": 200100, "epoch": 4764} {"train_loss": -7.254060745239258, "global_step": 200101, "epoch": 4764} {"train_loss": -7.191221237182617, "global_step": 200102, "epoch": 4764} {"train_loss": -7.265541076660156, "global_step": 200103, "epoch": 4764} {"train_loss": -7.133579254150391, "global_step": 200104, "epoch": 4764} {"train_loss": -7.312800407409668, "global_step": 200105, "epoch": 4764} {"train_loss": -7.215190887451172, "global_step": 200106, "epoch": 4764} {"train_loss": -7.4330058097839355, "global_step": 200107, "epoch": 4764} {"train_loss": -7.268171787261963, "global_step": 200108, "epoch": 4764} {"train_loss": -7.288321495056152, "global_step": 200109, "epoch": 4764} {"train_loss": -7.325545310974121, "global_step": 200110, "epoch": 4764} {"train_loss": -7.235289096832275, "global_step": 200111, "epoch": 4764} {"train_loss": -7.258848190307617, "global_step": 200112, "epoch": 4764} {"train_loss": -7.278307914733887, "global_step": 200113, "epoch": 4764} {"train_loss": -7.2016825675964355, "global_step": 200114, "epoch": 4764} {"train_loss": -7.351173400878906, "global_step": 200115, "epoch": 4764} {"train_loss": -7.350768089294434, "global_step": 200116, "epoch": 4764} {"train_loss": -7.373625755310059, "global_step": 200117, "epoch": 4764} {"train_loss": -7.357964515686035, "global_step": 200118, "epoch": 4764} {"train_loss": -7.378412246704102, "global_step": 200119, "epoch": 4764} {"train_loss": -7.337594509124756, "global_step": 200120, "epoch": 4764} {"train_loss": -7.314678192138672, "global_step": 200121, "epoch": 4764} {"train_loss": -7.390932083129883, "global_step": 200122, "epoch": 4764} {"train_loss": -7.334850311279297, "global_step": 200123, "epoch": 4764} {"train_loss": -7.27103853225708, "global_step": 200124, "epoch": 4764} {"train_loss": -7.287317276000977, "global_step": 200125, "epoch": 4764} {"train_loss": -7.287639141082764, "global_step": 200126, "epoch": 4764} {"train_loss": -7.295165538787842, "global_step": 200127, "epoch": 4764} {"train_loss": -7.291081428527832, "global_step": 200128, "epoch": 4764} {"train_loss": -7.269095137005761, "global_step": 200129, "epoch": 4764, "val_loss": 69895.4375} {"train_loss": -7.382405757904053, "global_step": 200130, "epoch": 4765} {"train_loss": -7.358547210693359, "global_step": 200131, "epoch": 4765} {"train_loss": -7.287799835205078, "global_step": 200132, "epoch": 4765} {"train_loss": -7.2380218505859375, "global_step": 200133, "epoch": 4765} {"train_loss": -7.459318161010742, "global_step": 200134, "epoch": 4765} {"train_loss": -7.26320743560791, "global_step": 200135, "epoch": 4765} {"train_loss": -7.32066535949707, "global_step": 200136, "epoch": 4765} {"train_loss": -7.349252223968506, "global_step": 200137, "epoch": 4765} {"train_loss": -7.208554267883301, "global_step": 200138, "epoch": 4765} {"train_loss": -7.268528938293457, "global_step": 200139, "epoch": 4765} {"train_loss": -7.340648651123047, "global_step": 200140, "epoch": 4765} {"train_loss": -7.19897985458374, "global_step": 200141, "epoch": 4765} {"train_loss": -7.326188564300537, "global_step": 200142, "epoch": 4765} {"train_loss": -7.16661262512207, "global_step": 200143, "epoch": 4765} {"train_loss": -7.228395938873291, "global_step": 200144, "epoch": 4765} {"train_loss": -7.268799781799316, "global_step": 200145, "epoch": 4765} {"train_loss": -7.181660175323486, "global_step": 200146, "epoch": 4765} {"train_loss": -7.371556282043457, "global_step": 200147, "epoch": 4765} {"train_loss": -7.410504341125488, "global_step": 200148, "epoch": 4765} {"train_loss": -7.232674598693848, "global_step": 200149, "epoch": 4765} {"train_loss": -7.318672180175781, "global_step": 200150, "epoch": 4765} {"train_loss": -7.248350620269775, "global_step": 200151, "epoch": 4765} {"train_loss": -7.276979446411133, "global_step": 200152, "epoch": 4765} {"train_loss": -7.3496317863464355, "global_step": 200153, "epoch": 4765} {"train_loss": -7.423402309417725, "global_step": 200154, "epoch": 4765} {"train_loss": -7.232561111450195, "global_step": 200155, "epoch": 4765} {"train_loss": -7.305545806884766, "global_step": 200156, "epoch": 4765} {"train_loss": -7.282719612121582, "global_step": 200157, "epoch": 4765} {"train_loss": -7.26505184173584, "global_step": 200158, "epoch": 4765} {"train_loss": -7.209836959838867, "global_step": 200159, "epoch": 4765} {"train_loss": -7.143878936767578, "global_step": 200160, "epoch": 4765} {"train_loss": -7.3465142250061035, "global_step": 200161, "epoch": 4765} {"train_loss": -7.239606857299805, "global_step": 200162, "epoch": 4765} {"train_loss": -7.270388603210449, "global_step": 200163, "epoch": 4765} {"train_loss": -7.2794270515441895, "global_step": 200164, "epoch": 4765} {"train_loss": -7.2480854988098145, "global_step": 200165, "epoch": 4765} {"train_loss": -7.338295936584473, "global_step": 200166, "epoch": 4765} {"train_loss": -7.147150039672852, "global_step": 200167, "epoch": 4765} {"train_loss": -7.296853542327881, "global_step": 200168, "epoch": 4765} {"train_loss": -7.34090518951416, "global_step": 200169, "epoch": 4765} {"train_loss": -7.236730575561523, "global_step": 200170, "epoch": 4765} {"train_loss": -7.287235839026315, "global_step": 200171, "epoch": 4765, "val_loss": 69905.6953125} {"train_loss": -7.138001441955566, "global_step": 200172, "epoch": 4766} {"train_loss": -7.176519393920898, "global_step": 200173, "epoch": 4766} {"train_loss": -7.413437843322754, "global_step": 200174, "epoch": 4766} {"train_loss": -7.219754219055176, "global_step": 200175, "epoch": 4766} {"train_loss": -7.342186450958252, "global_step": 200176, "epoch": 4766} {"train_loss": -7.263152599334717, "global_step": 200177, "epoch": 4766} {"train_loss": -7.24981164932251, "global_step": 200178, "epoch": 4766} {"train_loss": -7.271224021911621, "global_step": 200179, "epoch": 4766} {"train_loss": -7.27747917175293, "global_step": 200180, "epoch": 4766} {"train_loss": -7.172891616821289, "global_step": 200181, "epoch": 4766} {"train_loss": -7.319815635681152, "global_step": 200182, "epoch": 4766} {"train_loss": -7.319510459899902, "global_step": 200183, "epoch": 4766} {"train_loss": -7.251894474029541, "global_step": 200184, "epoch": 4766} {"train_loss": -7.207756519317627, "global_step": 200185, "epoch": 4766} {"train_loss": -7.412554740905762, "global_step": 200186, "epoch": 4766} {"train_loss": -7.455779075622559, "global_step": 200187, "epoch": 4766} {"train_loss": -7.405605792999268, "global_step": 200188, "epoch": 4766} {"train_loss": -7.34006404876709, "global_step": 200189, "epoch": 4766} {"train_loss": -7.319456100463867, "global_step": 200190, "epoch": 4766} {"train_loss": -7.252402305603027, "global_step": 200191, "epoch": 4766} {"train_loss": -7.290694236755371, "global_step": 200192, "epoch": 4766} {"train_loss": -7.435372352600098, "global_step": 200193, "epoch": 4766} {"train_loss": -7.44064998626709, "global_step": 200194, "epoch": 4766} {"train_loss": -7.326131820678711, "global_step": 200195, "epoch": 4766} {"train_loss": -7.361177921295166, "global_step": 200196, "epoch": 4766} {"train_loss": -7.278746604919434, "global_step": 200197, "epoch": 4766} {"train_loss": -7.481621742248535, "global_step": 200198, "epoch": 4766} {"train_loss": -7.363475799560547, "global_step": 200199, "epoch": 4766} {"train_loss": -7.055394172668457, "global_step": 200200, "epoch": 4766} {"train_loss": -7.285223960876465, "global_step": 200201, "epoch": 4766} {"train_loss": -7.321210861206055, "global_step": 200202, "epoch": 4766} {"train_loss": -7.2985382080078125, "global_step": 200203, "epoch": 4766} {"train_loss": -7.256531715393066, "global_step": 200204, "epoch": 4766} {"train_loss": -7.42162561416626, "global_step": 200205, "epoch": 4766} {"train_loss": -7.247293949127197, "global_step": 200206, "epoch": 4766} {"train_loss": -7.07728910446167, "global_step": 200207, "epoch": 4766} {"train_loss": -7.247466564178467, "global_step": 200208, "epoch": 4766} {"train_loss": -7.283310890197754, "global_step": 200209, "epoch": 4766} {"train_loss": -7.278864860534668, "global_step": 200210, "epoch": 4766} {"train_loss": -7.317230224609375, "global_step": 200211, "epoch": 4766} {"train_loss": -7.255484104156494, "global_step": 200212, "epoch": 4766} {"train_loss": -7.292994941983904, "global_step": 200213, "epoch": 4766, "val_loss": 69803.6484375} {"train_loss": -7.324119567871094, "global_step": 200214, "epoch": 4767} {"train_loss": -7.196325302124023, "global_step": 200215, "epoch": 4767} {"train_loss": -7.244885444641113, "global_step": 200216, "epoch": 4767} {"train_loss": -7.333058834075928, "global_step": 200217, "epoch": 4767} {"train_loss": -7.341272830963135, "global_step": 200218, "epoch": 4767} {"train_loss": -7.2919158935546875, "global_step": 200219, "epoch": 4767} {"train_loss": -7.197754859924316, "global_step": 200220, "epoch": 4767} {"train_loss": -7.275423049926758, "global_step": 200221, "epoch": 4767} {"train_loss": -7.376282691955566, "global_step": 200222, "epoch": 4767} {"train_loss": -7.186575889587402, "global_step": 200223, "epoch": 4767} {"train_loss": -7.1986188888549805, "global_step": 200224, "epoch": 4767} {"train_loss": -7.28835916519165, "global_step": 200225, "epoch": 4767} {"train_loss": -7.182559967041016, "global_step": 200226, "epoch": 4767} {"train_loss": -7.244363784790039, "global_step": 200227, "epoch": 4767} {"train_loss": -7.409243106842041, "global_step": 200228, "epoch": 4767} {"train_loss": -7.279420852661133, "global_step": 200229, "epoch": 4767} {"train_loss": -7.280570983886719, "global_step": 200230, "epoch": 4767} {"train_loss": -7.263177871704102, "global_step": 200231, "epoch": 4767} {"train_loss": -7.244699478149414, "global_step": 200232, "epoch": 4767} {"train_loss": -7.210314750671387, "global_step": 200233, "epoch": 4767} {"train_loss": -7.314183235168457, "global_step": 200234, "epoch": 4767} {"train_loss": -7.213247299194336, "global_step": 200235, "epoch": 4767} {"train_loss": -7.19404411315918, "global_step": 200236, "epoch": 4767} {"train_loss": -7.344797134399414, "global_step": 200237, "epoch": 4767} {"train_loss": -7.222877025604248, "global_step": 200238, "epoch": 4767} {"train_loss": -7.209565162658691, "global_step": 200239, "epoch": 4767} {"train_loss": -7.312206268310547, "global_step": 200240, "epoch": 4767} {"train_loss": -7.163124084472656, "global_step": 200241, "epoch": 4767} {"train_loss": -7.200642108917236, "global_step": 200242, "epoch": 4767} {"train_loss": -7.145516395568848, "global_step": 200243, "epoch": 4767} {"train_loss": -6.966292381286621, "global_step": 200244, "epoch": 4767} {"train_loss": -7.255528926849365, "global_step": 200245, "epoch": 4767} {"train_loss": -7.212606430053711, "global_step": 200246, "epoch": 4767} {"train_loss": -7.246557235717773, "global_step": 200247, "epoch": 4767} {"train_loss": -7.063691139221191, "global_step": 200248, "epoch": 4767} {"train_loss": -7.220128536224365, "global_step": 200249, "epoch": 4767} {"train_loss": -7.2779130935668945, "global_step": 200250, "epoch": 4767} {"train_loss": -7.214934349060059, "global_step": 200251, "epoch": 4767} {"train_loss": -7.111255168914795, "global_step": 200252, "epoch": 4767} {"train_loss": -7.225009918212891, "global_step": 200253, "epoch": 4767} {"train_loss": -7.160689830780029, "global_step": 200254, "epoch": 4767} {"train_loss": -7.234270686195011, "global_step": 200255, "epoch": 4767, "val_loss": 69984.734375} {"train_loss": -7.102907657623291, "global_step": 200256, "epoch": 4768} {"train_loss": -7.109539031982422, "global_step": 200257, "epoch": 4768} {"train_loss": -7.168208599090576, "global_step": 200258, "epoch": 4768} {"train_loss": -7.062304973602295, "global_step": 200259, "epoch": 4768} {"train_loss": -7.266864776611328, "global_step": 200260, "epoch": 4768} {"train_loss": -7.274724006652832, "global_step": 200261, "epoch": 4768} {"train_loss": -7.0964884757995605, "global_step": 200262, "epoch": 4768} {"train_loss": -7.248854160308838, "global_step": 200263, "epoch": 4768} {"train_loss": -7.207297325134277, "global_step": 200264, "epoch": 4768} {"train_loss": -7.166337966918945, "global_step": 200265, "epoch": 4768} {"train_loss": -7.152347564697266, "global_step": 200266, "epoch": 4768} {"train_loss": -7.208325386047363, "global_step": 200267, "epoch": 4768} {"train_loss": -7.232752799987793, "global_step": 200268, "epoch": 4768} {"train_loss": -7.244141578674316, "global_step": 200269, "epoch": 4768} {"train_loss": -7.14628791809082, "global_step": 200270, "epoch": 4768} {"train_loss": -7.265763282775879, "global_step": 200271, "epoch": 4768} {"train_loss": -7.246000289916992, "global_step": 200272, "epoch": 4768} {"train_loss": -7.363846302032471, "global_step": 200273, "epoch": 4768} {"train_loss": -7.296794891357422, "global_step": 200274, "epoch": 4768} {"train_loss": -7.277561664581299, "global_step": 200275, "epoch": 4768} {"train_loss": -7.201436996459961, "global_step": 200276, "epoch": 4768} {"train_loss": -7.217930316925049, "global_step": 200277, "epoch": 4768} {"train_loss": -7.207106113433838, "global_step": 200278, "epoch": 4768} {"train_loss": -7.118334770202637, "global_step": 200279, "epoch": 4768} {"train_loss": -7.129496097564697, "global_step": 200280, "epoch": 4768} {"train_loss": -7.270174980163574, "global_step": 200281, "epoch": 4768} {"train_loss": -7.1480207443237305, "global_step": 200282, "epoch": 4768} {"train_loss": -7.269824981689453, "global_step": 200283, "epoch": 4768} {"train_loss": -7.327801704406738, "global_step": 200284, "epoch": 4768} {"train_loss": -7.243476867675781, "global_step": 200285, "epoch": 4768} {"train_loss": -7.350704193115234, "global_step": 200286, "epoch": 4768} {"train_loss": -7.130498886108398, "global_step": 200287, "epoch": 4768} {"train_loss": -7.286190986633301, "global_step": 200288, "epoch": 4768} {"train_loss": -7.243144989013672, "global_step": 200289, "epoch": 4768} {"train_loss": -7.177213191986084, "global_step": 200290, "epoch": 4768} {"train_loss": -7.279974460601807, "global_step": 200291, "epoch": 4768} {"train_loss": -7.260842323303223, "global_step": 200292, "epoch": 4768} {"train_loss": -7.253866195678711, "global_step": 200293, "epoch": 4768} {"train_loss": -7.362944602966309, "global_step": 200294, "epoch": 4768} {"train_loss": -7.326289176940918, "global_step": 200295, "epoch": 4768} {"train_loss": -7.357851982116699, "global_step": 200296, "epoch": 4768} {"train_loss": -7.22974427541097, "global_step": 200297, "epoch": 4768, "val_loss": 69805.4921875} {"train_loss": -7.3711957931518555, "global_step": 200298, "epoch": 4769} {"train_loss": -7.272193908691406, "global_step": 200299, "epoch": 4769} {"train_loss": -7.258820056915283, "global_step": 200300, "epoch": 4769} {"train_loss": -7.280301094055176, "global_step": 200301, "epoch": 4769} {"train_loss": -7.438231468200684, "global_step": 200302, "epoch": 4769} {"train_loss": -7.340848922729492, "global_step": 200303, "epoch": 4769} {"train_loss": -7.272640228271484, "global_step": 200304, "epoch": 4769} {"train_loss": -7.334577560424805, "global_step": 200305, "epoch": 4769} {"train_loss": -7.391819000244141, "global_step": 200306, "epoch": 4769} {"train_loss": -7.251034736633301, "global_step": 200307, "epoch": 4769} {"train_loss": -7.423786640167236, "global_step": 200308, "epoch": 4769} {"train_loss": -7.264911651611328, "global_step": 200309, "epoch": 4769} {"train_loss": -7.404776573181152, "global_step": 200310, "epoch": 4769} {"train_loss": -7.272068977355957, "global_step": 200311, "epoch": 4769} {"train_loss": -7.286238670349121, "global_step": 200312, "epoch": 4769} {"train_loss": -7.350762367248535, "global_step": 200313, "epoch": 4769} {"train_loss": -7.36883544921875, "global_step": 200314, "epoch": 4769} {"train_loss": -7.292771816253662, "global_step": 200315, "epoch": 4769} {"train_loss": -7.269116401672363, "global_step": 200316, "epoch": 4769} {"train_loss": -7.278931617736816, "global_step": 200317, "epoch": 4769} {"train_loss": -7.381638526916504, "global_step": 200318, "epoch": 4769} {"train_loss": -7.29430627822876, "global_step": 200319, "epoch": 4769} {"train_loss": -7.278216361999512, "global_step": 200320, "epoch": 4769} {"train_loss": -7.41564416885376, "global_step": 200321, "epoch": 4769} {"train_loss": -7.384194374084473, "global_step": 200322, "epoch": 4769} {"train_loss": -7.2681965827941895, "global_step": 200323, "epoch": 4769} {"train_loss": -7.362475395202637, "global_step": 200324, "epoch": 4769} {"train_loss": -7.282012462615967, "global_step": 200325, "epoch": 4769} {"train_loss": -7.327571392059326, "global_step": 200326, "epoch": 4769} {"train_loss": -7.3692755699157715, "global_step": 200327, "epoch": 4769} {"train_loss": -7.344184875488281, "global_step": 200328, "epoch": 4769} {"train_loss": -7.246035099029541, "global_step": 200329, "epoch": 4769} {"train_loss": -7.068944931030273, "global_step": 200330, "epoch": 4769} {"train_loss": -7.195065498352051, "global_step": 200331, "epoch": 4769} {"train_loss": -7.34805965423584, "global_step": 200332, "epoch": 4769} {"train_loss": -7.213850975036621, "global_step": 200333, "epoch": 4769} {"train_loss": -7.207476615905762, "global_step": 200334, "epoch": 4769} {"train_loss": -7.367746353149414, "global_step": 200335, "epoch": 4769} {"train_loss": -7.157026290893555, "global_step": 200336, "epoch": 4769} {"train_loss": -6.959396839141846, "global_step": 200337, "epoch": 4769} {"train_loss": -7.35075569152832, "global_step": 200338, "epoch": 4769} {"train_loss": -7.293968132563999, "global_step": 200339, "epoch": 4769, "val_loss": 69973.828125} {"train_loss": -7.037930488586426, "global_step": 200340, "epoch": 4770} {"train_loss": -7.291322708129883, "global_step": 200341, "epoch": 4770} {"train_loss": -6.913987159729004, "global_step": 200342, "epoch": 4770} {"train_loss": -7.29442024230957, "global_step": 200343, "epoch": 4770} {"train_loss": -7.174689292907715, "global_step": 200344, "epoch": 4770} {"train_loss": -7.119387626647949, "global_step": 200345, "epoch": 4770} {"train_loss": -7.218372344970703, "global_step": 200346, "epoch": 4770} {"train_loss": -7.0328569412231445, "global_step": 200347, "epoch": 4770} {"train_loss": -7.2791547775268555, "global_step": 200348, "epoch": 4770} {"train_loss": -7.148555278778076, "global_step": 200349, "epoch": 4770} {"train_loss": -7.206476211547852, "global_step": 200350, "epoch": 4770} {"train_loss": -7.156620025634766, "global_step": 200351, "epoch": 4770} {"train_loss": -7.1318745613098145, "global_step": 200352, "epoch": 4770} {"train_loss": -7.176592826843262, "global_step": 200353, "epoch": 4770} {"train_loss": -7.142907619476318, "global_step": 200354, "epoch": 4770} {"train_loss": -7.08858585357666, "global_step": 200355, "epoch": 4770} {"train_loss": -7.16550874710083, "global_step": 200356, "epoch": 4770} {"train_loss": -7.171040058135986, "global_step": 200357, "epoch": 4770} {"train_loss": -7.317396640777588, "global_step": 200358, "epoch": 4770} {"train_loss": -7.250850200653076, "global_step": 200359, "epoch": 4770} {"train_loss": -7.199106216430664, "global_step": 200360, "epoch": 4770} {"train_loss": -7.273774147033691, "global_step": 200361, "epoch": 4770} {"train_loss": -7.274439334869385, "global_step": 200362, "epoch": 4770} {"train_loss": -7.211348533630371, "global_step": 200363, "epoch": 4770} {"train_loss": -7.241846084594727, "global_step": 200364, "epoch": 4770} {"train_loss": -7.158917427062988, "global_step": 200365, "epoch": 4770} {"train_loss": -7.220546722412109, "global_step": 200366, "epoch": 4770} {"train_loss": -7.302360534667969, "global_step": 200367, "epoch": 4770} {"train_loss": -7.242114543914795, "global_step": 200368, "epoch": 4770} {"train_loss": -7.142093658447266, "global_step": 200369, "epoch": 4770} {"train_loss": -7.2554802894592285, "global_step": 200370, "epoch": 4770} {"train_loss": -7.276217460632324, "global_step": 200371, "epoch": 4770} {"train_loss": -7.308473587036133, "global_step": 200372, "epoch": 4770} {"train_loss": -7.261772155761719, "global_step": 200373, "epoch": 4770} {"train_loss": -7.351945877075195, "global_step": 200374, "epoch": 4770} {"train_loss": -7.221250534057617, "global_step": 200375, "epoch": 4770} {"train_loss": -7.2291364669799805, "global_step": 200376, "epoch": 4770} {"train_loss": -7.246001243591309, "global_step": 200377, "epoch": 4770} {"train_loss": -7.226340293884277, "global_step": 200378, "epoch": 4770} {"train_loss": -7.219592094421387, "global_step": 200379, "epoch": 4770} {"train_loss": -7.318138599395752, "global_step": 200380, "epoch": 4770} {"train_loss": -7.208648454575312, "global_step": 200381, "epoch": 4770, "val_loss": 69704.875} {"train_loss": -7.361935615539551, "global_step": 200382, "epoch": 4771} {"train_loss": -7.271675109863281, "global_step": 200383, "epoch": 4771} {"train_loss": -7.214534759521484, "global_step": 200384, "epoch": 4771} {"train_loss": -7.223076343536377, "global_step": 200385, "epoch": 4771} {"train_loss": -7.295083522796631, "global_step": 200386, "epoch": 4771} {"train_loss": -7.287174224853516, "global_step": 200387, "epoch": 4771} {"train_loss": -7.126914024353027, "global_step": 200388, "epoch": 4771} {"train_loss": -7.254873275756836, "global_step": 200389, "epoch": 4771} {"train_loss": -7.195167541503906, "global_step": 200390, "epoch": 4771} {"train_loss": -6.977795600891113, "global_step": 200391, "epoch": 4771} {"train_loss": -7.2028608322143555, "global_step": 200392, "epoch": 4771} {"train_loss": -7.067057132720947, "global_step": 200393, "epoch": 4771} {"train_loss": -7.106327056884766, "global_step": 200394, "epoch": 4771} {"train_loss": -7.194110870361328, "global_step": 200395, "epoch": 4771} {"train_loss": -7.163517475128174, "global_step": 200396, "epoch": 4771} {"train_loss": -7.118618965148926, "global_step": 200397, "epoch": 4771} {"train_loss": -7.198376655578613, "global_step": 200398, "epoch": 4771} {"train_loss": -7.256502628326416, "global_step": 200399, "epoch": 4771} {"train_loss": -7.067864418029785, "global_step": 200400, "epoch": 4771} {"train_loss": -7.158635139465332, "global_step": 200401, "epoch": 4771} {"train_loss": -7.0521392822265625, "global_step": 200402, "epoch": 4771} {"train_loss": -7.1682586669921875, "global_step": 200403, "epoch": 4771} {"train_loss": -7.170754432678223, "global_step": 200404, "epoch": 4771} {"train_loss": -7.085400581359863, "global_step": 200405, "epoch": 4771} {"train_loss": -7.149972915649414, "global_step": 200406, "epoch": 4771} {"train_loss": -7.2014312744140625, "global_step": 200407, "epoch": 4771} {"train_loss": -7.1347737312316895, "global_step": 200408, "epoch": 4771} {"train_loss": -7.208727836608887, "global_step": 200409, "epoch": 4771} {"train_loss": -7.298792362213135, "global_step": 200410, "epoch": 4771} {"train_loss": -7.1828227043151855, "global_step": 200411, "epoch": 4771} {"train_loss": -7.240912437438965, "global_step": 200412, "epoch": 4771} {"train_loss": -7.15786600112915, "global_step": 200413, "epoch": 4771} {"train_loss": -7.1868438720703125, "global_step": 200414, "epoch": 4771} {"train_loss": -7.150439262390137, "global_step": 200415, "epoch": 4771} {"train_loss": -7.171756267547607, "global_step": 200416, "epoch": 4771} {"train_loss": -7.223757743835449, "global_step": 200417, "epoch": 4771} {"train_loss": -7.311932563781738, "global_step": 200418, "epoch": 4771} {"train_loss": -7.354374408721924, "global_step": 200419, "epoch": 4771} {"train_loss": -7.27131986618042, "global_step": 200420, "epoch": 4771} {"train_loss": -7.248430252075195, "global_step": 200421, "epoch": 4771} {"train_loss": -7.341561317443848, "global_step": 200422, "epoch": 4771} {"train_loss": -7.195244051161266, "global_step": 200423, "epoch": 4771, "val_loss": 69929.7890625} {"train_loss": -7.197464466094971, "global_step": 200424, "epoch": 4772} {"train_loss": -7.356818199157715, "global_step": 200425, "epoch": 4772} {"train_loss": -7.274787902832031, "global_step": 200426, "epoch": 4772} {"train_loss": -7.272268295288086, "global_step": 200427, "epoch": 4772} {"train_loss": -7.2944746017456055, "global_step": 200428, "epoch": 4772} {"train_loss": -7.204700946807861, "global_step": 200429, "epoch": 4772} {"train_loss": -7.286076545715332, "global_step": 200430, "epoch": 4772} {"train_loss": -7.292415618896484, "global_step": 200431, "epoch": 4772} {"train_loss": -7.405157089233398, "global_step": 200432, "epoch": 4772} {"train_loss": -7.294071197509766, "global_step": 200433, "epoch": 4772} {"train_loss": -7.269313812255859, "global_step": 200434, "epoch": 4772} {"train_loss": -7.345358848571777, "global_step": 200435, "epoch": 4772} {"train_loss": -7.27581787109375, "global_step": 200436, "epoch": 4772} {"train_loss": -7.186692237854004, "global_step": 200437, "epoch": 4772} {"train_loss": -7.192661762237549, "global_step": 200438, "epoch": 4772} {"train_loss": -7.362370491027832, "global_step": 200439, "epoch": 4772} {"train_loss": -7.329127311706543, "global_step": 200440, "epoch": 4772} {"train_loss": -7.306154251098633, "global_step": 200441, "epoch": 4772} {"train_loss": -7.305280685424805, "global_step": 200442, "epoch": 4772} {"train_loss": -7.229310989379883, "global_step": 200443, "epoch": 4772} {"train_loss": -7.22083854675293, "global_step": 200444, "epoch": 4772} {"train_loss": -7.3561553955078125, "global_step": 200445, "epoch": 4772} {"train_loss": -7.285695552825928, "global_step": 200446, "epoch": 4772} {"train_loss": -7.299380779266357, "global_step": 200447, "epoch": 4772} {"train_loss": -7.376608848571777, "global_step": 200448, "epoch": 4772} {"train_loss": -7.116766452789307, "global_step": 200449, "epoch": 4772} {"train_loss": -7.261721134185791, "global_step": 200450, "epoch": 4772} {"train_loss": -7.194842338562012, "global_step": 200451, "epoch": 4772} {"train_loss": -7.3896989822387695, "global_step": 200452, "epoch": 4772} {"train_loss": -7.203510761260986, "global_step": 200453, "epoch": 4772} {"train_loss": -7.334896087646484, "global_step": 200454, "epoch": 4772} {"train_loss": -7.34010648727417, "global_step": 200455, "epoch": 4772} {"train_loss": -7.206179618835449, "global_step": 200456, "epoch": 4772} {"train_loss": -7.245251655578613, "global_step": 200457, "epoch": 4772} {"train_loss": -7.281063079833984, "global_step": 200458, "epoch": 4772} {"train_loss": -7.285139560699463, "global_step": 200459, "epoch": 4772} {"train_loss": -7.4211530685424805, "global_step": 200460, "epoch": 4772} {"train_loss": -7.369815826416016, "global_step": 200461, "epoch": 4772} {"train_loss": -7.332521438598633, "global_step": 200462, "epoch": 4772} {"train_loss": -7.302215099334717, "global_step": 200463, "epoch": 4772} {"train_loss": -7.259249687194824, "global_step": 200464, "epoch": 4772} {"train_loss": -7.285350311370123, "global_step": 200465, "epoch": 4772, "val_loss": 69852.5} {"train_loss": -7.3172526359558105, "global_step": 200466, "epoch": 4773} {"train_loss": -7.307403087615967, "global_step": 200467, "epoch": 4773} {"train_loss": -7.304074287414551, "global_step": 200468, "epoch": 4773} {"train_loss": -7.3526082038879395, "global_step": 200469, "epoch": 4773} {"train_loss": -7.4102067947387695, "global_step": 200470, "epoch": 4773} {"train_loss": -7.388174533843994, "global_step": 200471, "epoch": 4773} {"train_loss": -7.255090713500977, "global_step": 200472, "epoch": 4773} {"train_loss": -7.203651428222656, "global_step": 200473, "epoch": 4773} {"train_loss": -7.286181449890137, "global_step": 200474, "epoch": 4773} {"train_loss": -7.2874555587768555, "global_step": 200475, "epoch": 4773} {"train_loss": -7.361507415771484, "global_step": 200476, "epoch": 4773} {"train_loss": -7.152068614959717, "global_step": 200477, "epoch": 4773} {"train_loss": -7.225032806396484, "global_step": 200478, "epoch": 4773} {"train_loss": -7.22622013092041, "global_step": 200479, "epoch": 4773} {"train_loss": -7.432322025299072, "global_step": 200480, "epoch": 4773} {"train_loss": -7.359910011291504, "global_step": 200481, "epoch": 4773} {"train_loss": -7.331648349761963, "global_step": 200482, "epoch": 4773} {"train_loss": -7.355872631072998, "global_step": 200483, "epoch": 4773} {"train_loss": -7.428773880004883, "global_step": 200484, "epoch": 4773} {"train_loss": -7.3220696449279785, "global_step": 200485, "epoch": 4773} {"train_loss": -7.294095993041992, "global_step": 200486, "epoch": 4773} {"train_loss": -7.224170207977295, "global_step": 200487, "epoch": 4773} {"train_loss": -7.335904121398926, "global_step": 200488, "epoch": 4773} {"train_loss": -7.2687201499938965, "global_step": 200489, "epoch": 4773} {"train_loss": -7.34745979309082, "global_step": 200490, "epoch": 4773} {"train_loss": -7.33808708190918, "global_step": 200491, "epoch": 4773} {"train_loss": -7.326582908630371, "global_step": 200492, "epoch": 4773} {"train_loss": -7.3534746170043945, "global_step": 200493, "epoch": 4773} {"train_loss": -7.385596752166748, "global_step": 200494, "epoch": 4773} {"train_loss": -7.419882774353027, "global_step": 200495, "epoch": 4773} {"train_loss": -7.326512813568115, "global_step": 200496, "epoch": 4773} {"train_loss": -7.2027130126953125, "global_step": 200497, "epoch": 4773} {"train_loss": -7.343663215637207, "global_step": 200498, "epoch": 4773} {"train_loss": -7.200298309326172, "global_step": 200499, "epoch": 4773} {"train_loss": -7.185305595397949, "global_step": 200500, "epoch": 4773} {"train_loss": -7.286531448364258, "global_step": 200501, "epoch": 4773} {"train_loss": -7.336829662322998, "global_step": 200502, "epoch": 4773} {"train_loss": -7.194536209106445, "global_step": 200503, "epoch": 4773} {"train_loss": -7.360611915588379, "global_step": 200504, "epoch": 4773} {"train_loss": -7.330272197723389, "global_step": 200505, "epoch": 4773} {"train_loss": -7.305818557739258, "global_step": 200506, "epoch": 4773} {"train_loss": -7.304791586739676, "global_step": 200507, "epoch": 4773, "val_loss": 69782.9453125} {"train_loss": -7.321429252624512, "global_step": 200508, "epoch": 4774} {"train_loss": -7.222132682800293, "global_step": 200509, "epoch": 4774} {"train_loss": -7.214816093444824, "global_step": 200510, "epoch": 4774} {"train_loss": -7.299992561340332, "global_step": 200511, "epoch": 4774} {"train_loss": -7.290163993835449, "global_step": 200512, "epoch": 4774} {"train_loss": -7.115944862365723, "global_step": 200513, "epoch": 4774} {"train_loss": -7.2443952560424805, "global_step": 200514, "epoch": 4774} {"train_loss": -7.233375549316406, "global_step": 200515, "epoch": 4774} {"train_loss": -7.253460884094238, "global_step": 200516, "epoch": 4774} {"train_loss": -7.19896125793457, "global_step": 200517, "epoch": 4774} {"train_loss": -7.102324485778809, "global_step": 200518, "epoch": 4774} {"train_loss": -7.228869915008545, "global_step": 200519, "epoch": 4774} {"train_loss": -7.137935638427734, "global_step": 200520, "epoch": 4774} {"train_loss": -7.075260162353516, "global_step": 200521, "epoch": 4774} {"train_loss": -7.322640895843506, "global_step": 200522, "epoch": 4774} {"train_loss": -7.118884086608887, "global_step": 200523, "epoch": 4774} {"train_loss": -7.187300205230713, "global_step": 200524, "epoch": 4774} {"train_loss": -7.1822509765625, "global_step": 200525, "epoch": 4774} {"train_loss": -7.085956573486328, "global_step": 200526, "epoch": 4774} {"train_loss": -7.094128608703613, "global_step": 200527, "epoch": 4774} {"train_loss": -7.143520355224609, "global_step": 200528, "epoch": 4774} {"train_loss": -7.25466251373291, "global_step": 200529, "epoch": 4774} {"train_loss": -7.0288848876953125, "global_step": 200530, "epoch": 4774} {"train_loss": -7.112560272216797, "global_step": 200531, "epoch": 4774} {"train_loss": -7.181536674499512, "global_step": 200532, "epoch": 4774} {"train_loss": -7.002546310424805, "global_step": 200533, "epoch": 4774} {"train_loss": -7.100360870361328, "global_step": 200534, "epoch": 4774} {"train_loss": -6.9652910232543945, "global_step": 200535, "epoch": 4774} {"train_loss": -7.092208385467529, "global_step": 200536, "epoch": 4774} {"train_loss": -7.058807849884033, "global_step": 200537, "epoch": 4774} {"train_loss": -6.997207164764404, "global_step": 200538, "epoch": 4774} {"train_loss": -7.223787307739258, "global_step": 200539, "epoch": 4774} {"train_loss": -6.957600116729736, "global_step": 200540, "epoch": 4774} {"train_loss": -7.268383502960205, "global_step": 200541, "epoch": 4774} {"train_loss": -7.078335762023926, "global_step": 200542, "epoch": 4774} {"train_loss": -7.218780040740967, "global_step": 200543, "epoch": 4774} {"train_loss": -7.116333961486816, "global_step": 200544, "epoch": 4774} {"train_loss": -7.021565914154053, "global_step": 200545, "epoch": 4774} {"train_loss": -7.14535665512085, "global_step": 200546, "epoch": 4774} {"train_loss": -7.001691818237305, "global_step": 200547, "epoch": 4774} {"train_loss": -7.153430938720703, "global_step": 200548, "epoch": 4774} {"train_loss": -7.145414431889852, "global_step": 200549, "epoch": 4774, "val_loss": 70003.5546875} {"train_loss": -7.211053371429443, "global_step": 200550, "epoch": 4775} {"train_loss": -7.2372002601623535, "global_step": 200551, "epoch": 4775} {"train_loss": -7.143056392669678, "global_step": 200552, "epoch": 4775} {"train_loss": -7.139276504516602, "global_step": 200553, "epoch": 4775} {"train_loss": -7.212408542633057, "global_step": 200554, "epoch": 4775} {"train_loss": -7.1438093185424805, "global_step": 200555, "epoch": 4775} {"train_loss": -7.169782638549805, "global_step": 200556, "epoch": 4775} {"train_loss": -7.220138072967529, "global_step": 200557, "epoch": 4775} {"train_loss": -7.1172966957092285, "global_step": 200558, "epoch": 4775} {"train_loss": -7.205435752868652, "global_step": 200559, "epoch": 4775} {"train_loss": -7.192178726196289, "global_step": 200560, "epoch": 4775} {"train_loss": -7.133047103881836, "global_step": 200561, "epoch": 4775} {"train_loss": -7.250083923339844, "global_step": 200562, "epoch": 4775} {"train_loss": -7.1319580078125, "global_step": 200563, "epoch": 4775} {"train_loss": -7.190523147583008, "global_step": 200564, "epoch": 4775} {"train_loss": -7.336848258972168, "global_step": 200565, "epoch": 4775} {"train_loss": -7.156126976013184, "global_step": 200566, "epoch": 4775} {"train_loss": -7.2678070068359375, "global_step": 200567, "epoch": 4775} {"train_loss": -7.210780620574951, "global_step": 200568, "epoch": 4775} {"train_loss": -7.12967586517334, "global_step": 200569, "epoch": 4775} {"train_loss": -7.284947395324707, "global_step": 200570, "epoch": 4775} {"train_loss": -7.292624473571777, "global_step": 200571, "epoch": 4775} {"train_loss": -7.150432109832764, "global_step": 200572, "epoch": 4775} {"train_loss": -7.225770950317383, "global_step": 200573, "epoch": 4775} {"train_loss": -7.282304763793945, "global_step": 200574, "epoch": 4775} {"train_loss": -7.192436218261719, "global_step": 200575, "epoch": 4775} {"train_loss": -7.105627536773682, "global_step": 200576, "epoch": 4775} {"train_loss": -7.200231075286865, "global_step": 200577, "epoch": 4775} {"train_loss": -7.324156761169434, "global_step": 200578, "epoch": 4775} {"train_loss": -7.219630241394043, "global_step": 200579, "epoch": 4775} {"train_loss": -7.3591227531433105, "global_step": 200580, "epoch": 4775} {"train_loss": -7.329996109008789, "global_step": 200581, "epoch": 4775} {"train_loss": -7.20811653137207, "global_step": 200582, "epoch": 4775} {"train_loss": -7.259646415710449, "global_step": 200583, "epoch": 4775} {"train_loss": -7.264311790466309, "global_step": 200584, "epoch": 4775} {"train_loss": -7.325223922729492, "global_step": 200585, "epoch": 4775} {"train_loss": -7.326099395751953, "global_step": 200586, "epoch": 4775} {"train_loss": -7.111201286315918, "global_step": 200587, "epoch": 4775} {"train_loss": -7.265439510345459, "global_step": 200588, "epoch": 4775} {"train_loss": -7.304862022399902, "global_step": 200589, "epoch": 4775} {"train_loss": -7.1107401847839355, "global_step": 200590, "epoch": 4775} {"train_loss": -7.219250815255301, "global_step": 200591, "epoch": 4775, "val_loss": 69829.4921875} {"train_loss": -7.244993209838867, "global_step": 200592, "epoch": 4776} {"train_loss": -7.193215370178223, "global_step": 200593, "epoch": 4776} {"train_loss": -7.292222023010254, "global_step": 200594, "epoch": 4776} {"train_loss": -7.249209403991699, "global_step": 200595, "epoch": 4776} {"train_loss": -7.308470249176025, "global_step": 200596, "epoch": 4776} {"train_loss": -7.319952964782715, "global_step": 200597, "epoch": 4776} {"train_loss": -7.322352886199951, "global_step": 200598, "epoch": 4776} {"train_loss": -7.3442769050598145, "global_step": 200599, "epoch": 4776} {"train_loss": -7.125950336456299, "global_step": 200600, "epoch": 4776} {"train_loss": -7.249853610992432, "global_step": 200601, "epoch": 4776} {"train_loss": -7.262436866760254, "global_step": 200602, "epoch": 4776} {"train_loss": -7.342584609985352, "global_step": 200603, "epoch": 4776} {"train_loss": -7.2983808517456055, "global_step": 200604, "epoch": 4776} {"train_loss": -7.246826171875, "global_step": 200605, "epoch": 4776} {"train_loss": -7.193265438079834, "global_step": 200606, "epoch": 4776} {"train_loss": -7.212352275848389, "global_step": 200607, "epoch": 4776} {"train_loss": -7.181158065795898, "global_step": 200608, "epoch": 4776} {"train_loss": -7.196922779083252, "global_step": 200609, "epoch": 4776} {"train_loss": -7.206097602844238, "global_step": 200610, "epoch": 4776} {"train_loss": -7.300280570983887, "global_step": 200611, "epoch": 4776} {"train_loss": -7.297103404998779, "global_step": 200612, "epoch": 4776} {"train_loss": -7.268880844116211, "global_step": 200613, "epoch": 4776} {"train_loss": -7.343138694763184, "global_step": 200614, "epoch": 4776} {"train_loss": -7.320683479309082, "global_step": 200615, "epoch": 4776} {"train_loss": -7.24749755859375, "global_step": 200616, "epoch": 4776} {"train_loss": -7.314571380615234, "global_step": 200617, "epoch": 4776} {"train_loss": -7.3254170417785645, "global_step": 200618, "epoch": 4776} {"train_loss": -7.383289813995361, "global_step": 200619, "epoch": 4776} {"train_loss": -7.37565803527832, "global_step": 200620, "epoch": 4776} {"train_loss": -7.432912826538086, "global_step": 200621, "epoch": 4776} {"train_loss": -7.27254056930542, "global_step": 200622, "epoch": 4776} {"train_loss": -7.311160564422607, "global_step": 200623, "epoch": 4776} {"train_loss": -7.3957438468933105, "global_step": 200624, "epoch": 4776} {"train_loss": -7.287284851074219, "global_step": 200625, "epoch": 4776} {"train_loss": -7.3784685134887695, "global_step": 200626, "epoch": 4776} {"train_loss": -7.341355323791504, "global_step": 200627, "epoch": 4776} {"train_loss": -7.3234357833862305, "global_step": 200628, "epoch": 4776} {"train_loss": -7.313920021057129, "global_step": 200629, "epoch": 4776} {"train_loss": -7.198966026306152, "global_step": 200630, "epoch": 4776} {"train_loss": -7.282829284667969, "global_step": 200631, "epoch": 4776} {"train_loss": -7.136623382568359, "global_step": 200632, "epoch": 4776} {"train_loss": -7.284121286301386, "global_step": 200633, "epoch": 4776, "val_loss": 70024.8515625} {"train_loss": -7.150930404663086, "global_step": 200634, "epoch": 4777} {"train_loss": -7.3441481590271, "global_step": 200635, "epoch": 4777} {"train_loss": -7.308578968048096, "global_step": 200636, "epoch": 4777} {"train_loss": -7.094452857971191, "global_step": 200637, "epoch": 4777} {"train_loss": -7.25856351852417, "global_step": 200638, "epoch": 4777} {"train_loss": -7.337526321411133, "global_step": 200639, "epoch": 4777} {"train_loss": -7.239933490753174, "global_step": 200640, "epoch": 4777} {"train_loss": -7.309896469116211, "global_step": 200641, "epoch": 4777} {"train_loss": -7.188091278076172, "global_step": 200642, "epoch": 4777} {"train_loss": -7.2438459396362305, "global_step": 200643, "epoch": 4777} {"train_loss": -7.356715202331543, "global_step": 200644, "epoch": 4777} {"train_loss": -7.251394271850586, "global_step": 200645, "epoch": 4777} {"train_loss": -7.27447509765625, "global_step": 200646, "epoch": 4777} {"train_loss": -7.277185440063477, "global_step": 200647, "epoch": 4777} {"train_loss": -7.285943984985352, "global_step": 200648, "epoch": 4777} {"train_loss": -7.409026145935059, "global_step": 200649, "epoch": 4777} {"train_loss": -7.338729381561279, "global_step": 200650, "epoch": 4777} {"train_loss": -7.314916610717773, "global_step": 200651, "epoch": 4777} {"train_loss": -7.349088668823242, "global_step": 200652, "epoch": 4777} {"train_loss": -7.3316144943237305, "global_step": 200653, "epoch": 4777} {"train_loss": -7.353996276855469, "global_step": 200654, "epoch": 4777} {"train_loss": -7.329677581787109, "global_step": 200655, "epoch": 4777} {"train_loss": -7.371799468994141, "global_step": 200656, "epoch": 4777} {"train_loss": -7.242105484008789, "global_step": 200657, "epoch": 4777} {"train_loss": -7.205537796020508, "global_step": 200658, "epoch": 4777} {"train_loss": -7.337005615234375, "global_step": 200659, "epoch": 4777} {"train_loss": -7.187596321105957, "global_step": 200660, "epoch": 4777} {"train_loss": -7.224551677703857, "global_step": 200661, "epoch": 4777} {"train_loss": -7.262465000152588, "global_step": 200662, "epoch": 4777} {"train_loss": -7.271685600280762, "global_step": 200663, "epoch": 4777} {"train_loss": -7.35301399230957, "global_step": 200664, "epoch": 4777} {"train_loss": -7.236091613769531, "global_step": 200665, "epoch": 4777} {"train_loss": -7.2643890380859375, "global_step": 200666, "epoch": 4777} {"train_loss": -7.22320032119751, "global_step": 200667, "epoch": 4777} {"train_loss": -7.201662063598633, "global_step": 200668, "epoch": 4777} {"train_loss": -7.255699157714844, "global_step": 200669, "epoch": 4777} {"train_loss": -7.069957733154297, "global_step": 200670, "epoch": 4777} {"train_loss": -7.159772872924805, "global_step": 200671, "epoch": 4777} {"train_loss": -7.249882698059082, "global_step": 200672, "epoch": 4777} {"train_loss": -7.249802112579346, "global_step": 200673, "epoch": 4777} {"train_loss": -7.230644226074219, "global_step": 200674, "epoch": 4777} {"train_loss": -7.263221774782453, "global_step": 200675, "epoch": 4777, "val_loss": 69918.8828125} {"train_loss": -7.213515758514404, "global_step": 200676, "epoch": 4778} {"train_loss": -7.171625137329102, "global_step": 200677, "epoch": 4778} {"train_loss": -7.210482597351074, "global_step": 200678, "epoch": 4778} {"train_loss": -7.061550617218018, "global_step": 200679, "epoch": 4778} {"train_loss": -7.13492488861084, "global_step": 200680, "epoch": 4778} {"train_loss": -7.144438743591309, "global_step": 200681, "epoch": 4778} {"train_loss": -7.147207260131836, "global_step": 200682, "epoch": 4778} {"train_loss": -7.071893692016602, "global_step": 200683, "epoch": 4778} {"train_loss": -7.113940715789795, "global_step": 200684, "epoch": 4778} {"train_loss": -7.064732074737549, "global_step": 200685, "epoch": 4778} {"train_loss": -7.1318559646606445, "global_step": 200686, "epoch": 4778} {"train_loss": -7.140677452087402, "global_step": 200687, "epoch": 4778} {"train_loss": -7.053188323974609, "global_step": 200688, "epoch": 4778} {"train_loss": -7.056745529174805, "global_step": 200689, "epoch": 4778} {"train_loss": -7.129082202911377, "global_step": 200690, "epoch": 4778} {"train_loss": -7.198619842529297, "global_step": 200691, "epoch": 4778} {"train_loss": -7.1228346824646, "global_step": 200692, "epoch": 4778} {"train_loss": -7.251502990722656, "global_step": 200693, "epoch": 4778} {"train_loss": -7.223116397857666, "global_step": 200694, "epoch": 4778} {"train_loss": -7.185059070587158, "global_step": 200695, "epoch": 4778} {"train_loss": -7.228333473205566, "global_step": 200696, "epoch": 4778} {"train_loss": -7.229636192321777, "global_step": 200697, "epoch": 4778} {"train_loss": -7.3238348960876465, "global_step": 200698, "epoch": 4778} {"train_loss": -7.146385192871094, "global_step": 200699, "epoch": 4778} {"train_loss": -7.242537021636963, "global_step": 200700, "epoch": 4778} {"train_loss": -7.192718505859375, "global_step": 200701, "epoch": 4778} {"train_loss": -7.255731582641602, "global_step": 200702, "epoch": 4778} {"train_loss": -7.157676696777344, "global_step": 200703, "epoch": 4778} {"train_loss": -7.307033061981201, "global_step": 200704, "epoch": 4778} {"train_loss": -7.187319755554199, "global_step": 200705, "epoch": 4778} {"train_loss": -7.263247966766357, "global_step": 200706, "epoch": 4778} {"train_loss": -7.223276138305664, "global_step": 200707, "epoch": 4778} {"train_loss": -7.289259433746338, "global_step": 200708, "epoch": 4778} {"train_loss": -7.299947738647461, "global_step": 200709, "epoch": 4778} {"train_loss": -7.237820625305176, "global_step": 200710, "epoch": 4778} {"train_loss": -7.3083953857421875, "global_step": 200711, "epoch": 4778} {"train_loss": -7.24415397644043, "global_step": 200712, "epoch": 4778} {"train_loss": -7.272834777832031, "global_step": 200713, "epoch": 4778} {"train_loss": -7.237996578216553, "global_step": 200714, "epoch": 4778} {"train_loss": -7.309621810913086, "global_step": 200715, "epoch": 4778} {"train_loss": -7.288954734802246, "global_step": 200716, "epoch": 4778} {"train_loss": -7.197941530318487, "global_step": 200717, "epoch": 4778, "val_loss": 69874.90625} {"train_loss": -7.325575828552246, "global_step": 200718, "epoch": 4779} {"train_loss": -7.3290815353393555, "global_step": 200719, "epoch": 4779} {"train_loss": -7.298184871673584, "global_step": 200720, "epoch": 4779} {"train_loss": -7.290391445159912, "global_step": 200721, "epoch": 4779} {"train_loss": -7.232417106628418, "global_step": 200722, "epoch": 4779} {"train_loss": -7.192707061767578, "global_step": 200723, "epoch": 4779} {"train_loss": -7.203618049621582, "global_step": 200724, "epoch": 4779} {"train_loss": -7.290246963500977, "global_step": 200725, "epoch": 4779} {"train_loss": -7.222831726074219, "global_step": 200726, "epoch": 4779} {"train_loss": -7.276864051818848, "global_step": 200727, "epoch": 4779} {"train_loss": -7.248193740844727, "global_step": 200728, "epoch": 4779} {"train_loss": -7.2893171310424805, "global_step": 200729, "epoch": 4779} {"train_loss": -7.3334269523620605, "global_step": 200730, "epoch": 4779} {"train_loss": -7.371424674987793, "global_step": 200731, "epoch": 4779} {"train_loss": -7.211664199829102, "global_step": 200732, "epoch": 4779} {"train_loss": -7.35171365737915, "global_step": 200733, "epoch": 4779} {"train_loss": -7.322849750518799, "global_step": 200734, "epoch": 4779} {"train_loss": -7.275387763977051, "global_step": 200735, "epoch": 4779} {"train_loss": -7.375082969665527, "global_step": 200736, "epoch": 4779} {"train_loss": -7.321835041046143, "global_step": 200737, "epoch": 4779} {"train_loss": -7.297421455383301, "global_step": 200738, "epoch": 4779} {"train_loss": -7.280487060546875, "global_step": 200739, "epoch": 4779} {"train_loss": -7.189017295837402, "global_step": 200740, "epoch": 4779} {"train_loss": -7.3033623695373535, "global_step": 200741, "epoch": 4779} {"train_loss": -7.242090225219727, "global_step": 200742, "epoch": 4779} {"train_loss": -7.22435188293457, "global_step": 200743, "epoch": 4779} {"train_loss": -7.343286514282227, "global_step": 200744, "epoch": 4779} {"train_loss": -7.1043901443481445, "global_step": 200745, "epoch": 4779} {"train_loss": -7.421267509460449, "global_step": 200746, "epoch": 4779} {"train_loss": -7.262365341186523, "global_step": 200747, "epoch": 4779} {"train_loss": -7.241584777832031, "global_step": 200748, "epoch": 4779} {"train_loss": -7.351175785064697, "global_step": 200749, "epoch": 4779} {"train_loss": -7.235633850097656, "global_step": 200750, "epoch": 4779} {"train_loss": -7.138583183288574, "global_step": 200751, "epoch": 4779} {"train_loss": -7.2406721115112305, "global_step": 200752, "epoch": 4779} {"train_loss": -7.247218132019043, "global_step": 200753, "epoch": 4779} {"train_loss": -7.317041397094727, "global_step": 200754, "epoch": 4779} {"train_loss": -7.257884502410889, "global_step": 200755, "epoch": 4779} {"train_loss": -7.381154537200928, "global_step": 200756, "epoch": 4779} {"train_loss": -7.259438514709473, "global_step": 200757, "epoch": 4779} {"train_loss": -7.134182453155518, "global_step": 200758, "epoch": 4779} {"train_loss": -7.274718874976749, "global_step": 200759, "epoch": 4779, "val_loss": 69830.5078125} {"train_loss": -7.165082931518555, "global_step": 200760, "epoch": 4780} {"train_loss": -7.3352556228637695, "global_step": 200761, "epoch": 4780} {"train_loss": -7.302577495574951, "global_step": 200762, "epoch": 4780} {"train_loss": -7.2256927490234375, "global_step": 200763, "epoch": 4780} {"train_loss": -7.215229034423828, "global_step": 200764, "epoch": 4780} {"train_loss": -7.337429046630859, "global_step": 200765, "epoch": 4780} {"train_loss": -7.304741382598877, "global_step": 200766, "epoch": 4780} {"train_loss": -7.288458824157715, "global_step": 200767, "epoch": 4780} {"train_loss": -7.249026298522949, "global_step": 200768, "epoch": 4780} {"train_loss": -7.263590335845947, "global_step": 200769, "epoch": 4780} {"train_loss": -7.343495845794678, "global_step": 200770, "epoch": 4780} {"train_loss": -7.386433124542236, "global_step": 200771, "epoch": 4780} {"train_loss": -7.303068161010742, "global_step": 200772, "epoch": 4780} {"train_loss": -7.312049865722656, "global_step": 200773, "epoch": 4780} {"train_loss": -7.365029335021973, "global_step": 200774, "epoch": 4780} {"train_loss": -7.33615779876709, "global_step": 200775, "epoch": 4780} {"train_loss": -7.265379905700684, "global_step": 200776, "epoch": 4780} {"train_loss": -7.254491806030273, "global_step": 200777, "epoch": 4780} {"train_loss": -7.2612104415893555, "global_step": 200778, "epoch": 4780} {"train_loss": -7.248961448669434, "global_step": 200779, "epoch": 4780} {"train_loss": -7.282793998718262, "global_step": 200780, "epoch": 4780} {"train_loss": -7.1751017570495605, "global_step": 200781, "epoch": 4780} {"train_loss": -7.358151435852051, "global_step": 200782, "epoch": 4780} {"train_loss": -7.090008735656738, "global_step": 200783, "epoch": 4780} {"train_loss": -7.225548267364502, "global_step": 200784, "epoch": 4780} {"train_loss": -7.192709922790527, "global_step": 200785, "epoch": 4780} {"train_loss": -7.213712215423584, "global_step": 200786, "epoch": 4780} {"train_loss": -7.271255970001221, "global_step": 200787, "epoch": 4780} {"train_loss": -7.322566986083984, "global_step": 200788, "epoch": 4780} {"train_loss": -7.21270751953125, "global_step": 200789, "epoch": 4780} {"train_loss": -7.230188369750977, "global_step": 200790, "epoch": 4780} {"train_loss": -6.973770618438721, "global_step": 200791, "epoch": 4780} {"train_loss": -7.179013252258301, "global_step": 200792, "epoch": 4780} {"train_loss": -7.12626838684082, "global_step": 200793, "epoch": 4780} {"train_loss": -7.27665376663208, "global_step": 200794, "epoch": 4780} {"train_loss": -7.2135090827941895, "global_step": 200795, "epoch": 4780} {"train_loss": -7.220013618469238, "global_step": 200796, "epoch": 4780} {"train_loss": -7.171527862548828, "global_step": 200797, "epoch": 4780} {"train_loss": -7.295186996459961, "global_step": 200798, "epoch": 4780} {"train_loss": -7.2525811195373535, "global_step": 200799, "epoch": 4780} {"train_loss": -7.12106990814209, "global_step": 200800, "epoch": 4780} {"train_loss": -7.250111273356846, "global_step": 200801, "epoch": 4780, "val_loss": 69841.4609375} {"train_loss": -7.33461856842041, "global_step": 200802, "epoch": 4781} {"train_loss": -7.226100444793701, "global_step": 200803, "epoch": 4781} {"train_loss": -7.260371685028076, "global_step": 200804, "epoch": 4781} {"train_loss": -7.1979875564575195, "global_step": 200805, "epoch": 4781} {"train_loss": -7.371609687805176, "global_step": 200806, "epoch": 4781} {"train_loss": -7.331366062164307, "global_step": 200807, "epoch": 4781} {"train_loss": -7.363450527191162, "global_step": 200808, "epoch": 4781} {"train_loss": -7.3625593185424805, "global_step": 200809, "epoch": 4781} {"train_loss": -7.2439470291137695, "global_step": 200810, "epoch": 4781} {"train_loss": -7.39810848236084, "global_step": 200811, "epoch": 4781} {"train_loss": -7.37489652633667, "global_step": 200812, "epoch": 4781} {"train_loss": -7.259483337402344, "global_step": 200813, "epoch": 4781} {"train_loss": -7.275041580200195, "global_step": 200814, "epoch": 4781} {"train_loss": -7.323388576507568, "global_step": 200815, "epoch": 4781} {"train_loss": -7.312034606933594, "global_step": 200816, "epoch": 4781} {"train_loss": -7.355169773101807, "global_step": 200817, "epoch": 4781} {"train_loss": -7.338159561157227, "global_step": 200818, "epoch": 4781} {"train_loss": -7.288246154785156, "global_step": 200819, "epoch": 4781} {"train_loss": -7.232922554016113, "global_step": 200820, "epoch": 4781} {"train_loss": -7.305865287780762, "global_step": 200821, "epoch": 4781} {"train_loss": -7.371700286865234, "global_step": 200822, "epoch": 4781} {"train_loss": -7.254509449005127, "global_step": 200823, "epoch": 4781} {"train_loss": -7.261886119842529, "global_step": 200824, "epoch": 4781} {"train_loss": -7.250635623931885, "global_step": 200825, "epoch": 4781} {"train_loss": -7.318970203399658, "global_step": 200826, "epoch": 4781} {"train_loss": -7.3733110427856445, "global_step": 200827, "epoch": 4781} {"train_loss": -7.302655220031738, "global_step": 200828, "epoch": 4781} {"train_loss": -7.3645524978637695, "global_step": 200829, "epoch": 4781} {"train_loss": -7.2964582443237305, "global_step": 200830, "epoch": 4781} {"train_loss": -7.3488993644714355, "global_step": 200831, "epoch": 4781} {"train_loss": -7.311734199523926, "global_step": 200832, "epoch": 4781} {"train_loss": -7.223081111907959, "global_step": 200833, "epoch": 4781} {"train_loss": -7.312980651855469, "global_step": 200834, "epoch": 4781} {"train_loss": -7.280220031738281, "global_step": 200835, "epoch": 4781} {"train_loss": -7.269762992858887, "global_step": 200836, "epoch": 4781} {"train_loss": -7.274665832519531, "global_step": 200837, "epoch": 4781} {"train_loss": -7.330782890319824, "global_step": 200838, "epoch": 4781} {"train_loss": -7.36001443862915, "global_step": 200839, "epoch": 4781} {"train_loss": -7.410458564758301, "global_step": 200840, "epoch": 4781} {"train_loss": -7.135440349578857, "global_step": 200841, "epoch": 4781} {"train_loss": -7.4237141609191895, "global_step": 200842, "epoch": 4781} {"train_loss": -7.310574656441098, "global_step": 200843, "epoch": 4781, "val_loss": 69905.0625} {"train_loss": -7.334902763366699, "global_step": 200844, "epoch": 4782} {"train_loss": -7.341639518737793, "global_step": 200845, "epoch": 4782} {"train_loss": -7.216362476348877, "global_step": 200846, "epoch": 4782} {"train_loss": -7.313593864440918, "global_step": 200847, "epoch": 4782} {"train_loss": -7.240056037902832, "global_step": 200848, "epoch": 4782} {"train_loss": -7.251214027404785, "global_step": 200849, "epoch": 4782} {"train_loss": -7.301379203796387, "global_step": 200850, "epoch": 4782} {"train_loss": -7.26982307434082, "global_step": 200851, "epoch": 4782} {"train_loss": -7.293383598327637, "global_step": 200852, "epoch": 4782} {"train_loss": -7.125447750091553, "global_step": 200853, "epoch": 4782} {"train_loss": -7.187872409820557, "global_step": 200854, "epoch": 4782} {"train_loss": -7.263111114501953, "global_step": 200855, "epoch": 4782} {"train_loss": -7.086453437805176, "global_step": 200856, "epoch": 4782} {"train_loss": -7.184640884399414, "global_step": 200857, "epoch": 4782} {"train_loss": -7.1554670333862305, "global_step": 200858, "epoch": 4782} {"train_loss": -7.13006067276001, "global_step": 200859, "epoch": 4782} {"train_loss": -7.191154956817627, "global_step": 200860, "epoch": 4782} {"train_loss": -7.173686504364014, "global_step": 200861, "epoch": 4782} {"train_loss": -7.139204978942871, "global_step": 200862, "epoch": 4782} {"train_loss": -7.176387786865234, "global_step": 200863, "epoch": 4782} {"train_loss": -7.228951454162598, "global_step": 200864, "epoch": 4782} {"train_loss": -7.076842784881592, "global_step": 200865, "epoch": 4782} {"train_loss": -7.128015518188477, "global_step": 200866, "epoch": 4782} {"train_loss": -7.041015148162842, "global_step": 200867, "epoch": 4782} {"train_loss": -7.045208930969238, "global_step": 200868, "epoch": 4782} {"train_loss": -7.205513954162598, "global_step": 200869, "epoch": 4782} {"train_loss": -6.920840740203857, "global_step": 200870, "epoch": 4782} {"train_loss": -7.245037078857422, "global_step": 200871, "epoch": 4782} {"train_loss": -7.006923675537109, "global_step": 200872, "epoch": 4782} {"train_loss": -7.209698677062988, "global_step": 200873, "epoch": 4782} {"train_loss": -7.144454002380371, "global_step": 200874, "epoch": 4782} {"train_loss": -7.1231584548950195, "global_step": 200875, "epoch": 4782} {"train_loss": -7.249372482299805, "global_step": 200876, "epoch": 4782} {"train_loss": -7.031843185424805, "global_step": 200877, "epoch": 4782} {"train_loss": -7.292613506317139, "global_step": 200878, "epoch": 4782} {"train_loss": -7.101665496826172, "global_step": 200879, "epoch": 4782} {"train_loss": -7.303079605102539, "global_step": 200880, "epoch": 4782} {"train_loss": -7.315369606018066, "global_step": 200881, "epoch": 4782} {"train_loss": -7.26774787902832, "global_step": 200882, "epoch": 4782} {"train_loss": -7.153158187866211, "global_step": 200883, "epoch": 4782} {"train_loss": -7.1992292404174805, "global_step": 200884, "epoch": 4782} {"train_loss": -7.188479854947045, "global_step": 200885, "epoch": 4782, "val_loss": 69715.265625} {"train_loss": -7.167778968811035, "global_step": 200886, "epoch": 4783} {"train_loss": -7.1990461349487305, "global_step": 200887, "epoch": 4783} {"train_loss": -7.160612106323242, "global_step": 200888, "epoch": 4783} {"train_loss": -7.278812408447266, "global_step": 200889, "epoch": 4783} {"train_loss": -7.080857276916504, "global_step": 200890, "epoch": 4783} {"train_loss": -7.313418388366699, "global_step": 200891, "epoch": 4783} {"train_loss": -7.313191890716553, "global_step": 200892, "epoch": 4783} {"train_loss": -7.160305023193359, "global_step": 200893, "epoch": 4783} {"train_loss": -7.2252326011657715, "global_step": 200894, "epoch": 4783} {"train_loss": -7.312287330627441, "global_step": 200895, "epoch": 4783} {"train_loss": -7.342974662780762, "global_step": 200896, "epoch": 4783} {"train_loss": -7.24262809753418, "global_step": 200897, "epoch": 4783} {"train_loss": -7.279910087585449, "global_step": 200898, "epoch": 4783} {"train_loss": -7.398186206817627, "global_step": 200899, "epoch": 4783} {"train_loss": -7.218353271484375, "global_step": 200900, "epoch": 4783} {"train_loss": -7.289093971252441, "global_step": 200901, "epoch": 4783} {"train_loss": -7.226885795593262, "global_step": 200902, "epoch": 4783} {"train_loss": -7.285328388214111, "global_step": 200903, "epoch": 4783} {"train_loss": -7.3296942710876465, "global_step": 200904, "epoch": 4783} {"train_loss": -7.324831962585449, "global_step": 200905, "epoch": 4783} {"train_loss": -7.2995781898498535, "global_step": 200906, "epoch": 4783} {"train_loss": -7.351388454437256, "global_step": 200907, "epoch": 4783} {"train_loss": -7.35957145690918, "global_step": 200908, "epoch": 4783} {"train_loss": -7.172101020812988, "global_step": 200909, "epoch": 4783} {"train_loss": -7.221112251281738, "global_step": 200910, "epoch": 4783} {"train_loss": -7.233740329742432, "global_step": 200911, "epoch": 4783} {"train_loss": -7.308602333068848, "global_step": 200912, "epoch": 4783} {"train_loss": -7.18733024597168, "global_step": 200913, "epoch": 4783} {"train_loss": -7.268138885498047, "global_step": 200914, "epoch": 4783} {"train_loss": -7.115449905395508, "global_step": 200915, "epoch": 4783} {"train_loss": -7.256715774536133, "global_step": 200916, "epoch": 4783} {"train_loss": -7.407111167907715, "global_step": 200917, "epoch": 4783} {"train_loss": -7.1583099365234375, "global_step": 200918, "epoch": 4783} {"train_loss": -7.259006500244141, "global_step": 200919, "epoch": 4783} {"train_loss": -7.17395544052124, "global_step": 200920, "epoch": 4783} {"train_loss": -7.238744735717773, "global_step": 200921, "epoch": 4783} {"train_loss": -7.128749370574951, "global_step": 200922, "epoch": 4783} {"train_loss": -7.216308116912842, "global_step": 200923, "epoch": 4783} {"train_loss": -7.171875953674316, "global_step": 200924, "epoch": 4783} {"train_loss": -7.2389020919799805, "global_step": 200925, "epoch": 4783} {"train_loss": -7.235067844390869, "global_step": 200926, "epoch": 4783} {"train_loss": -7.247650918506441, "global_step": 200927, "epoch": 4783, "val_loss": 69848.796875} {"train_loss": -7.215512275695801, "global_step": 200928, "epoch": 4784} {"train_loss": -7.115077972412109, "global_step": 200929, "epoch": 4784} {"train_loss": -7.235518455505371, "global_step": 200930, "epoch": 4784} {"train_loss": -7.2503180503845215, "global_step": 200931, "epoch": 4784} {"train_loss": -7.153275489807129, "global_step": 200932, "epoch": 4784} {"train_loss": -7.217163562774658, "global_step": 200933, "epoch": 4784} {"train_loss": -7.256657123565674, "global_step": 200934, "epoch": 4784} {"train_loss": -7.2187042236328125, "global_step": 200935, "epoch": 4784} {"train_loss": -7.208895683288574, "global_step": 200936, "epoch": 4784} {"train_loss": -7.2711262702941895, "global_step": 200937, "epoch": 4784} {"train_loss": -7.20280647277832, "global_step": 200938, "epoch": 4784} {"train_loss": -7.410788536071777, "global_step": 200939, "epoch": 4784} {"train_loss": -7.11781644821167, "global_step": 200940, "epoch": 4784} {"train_loss": -7.226306438446045, "global_step": 200941, "epoch": 4784} {"train_loss": -7.300518989562988, "global_step": 200942, "epoch": 4784} {"train_loss": -7.1089019775390625, "global_step": 200943, "epoch": 4784} {"train_loss": -7.130370140075684, "global_step": 200944, "epoch": 4784} {"train_loss": -7.205389976501465, "global_step": 200945, "epoch": 4784} {"train_loss": -7.312527656555176, "global_step": 200946, "epoch": 4784} {"train_loss": -7.257393836975098, "global_step": 200947, "epoch": 4784} {"train_loss": -7.131372451782227, "global_step": 200948, "epoch": 4784} {"train_loss": -7.155519485473633, "global_step": 200949, "epoch": 4784} {"train_loss": -7.322412490844727, "global_step": 200950, "epoch": 4784} {"train_loss": -7.29864501953125, "global_step": 200951, "epoch": 4784} {"train_loss": -7.202213764190674, "global_step": 200952, "epoch": 4784} {"train_loss": -7.275692462921143, "global_step": 200953, "epoch": 4784} {"train_loss": -7.301206588745117, "global_step": 200954, "epoch": 4784} {"train_loss": -7.154226779937744, "global_step": 200955, "epoch": 4784} {"train_loss": -7.301848888397217, "global_step": 200956, "epoch": 4784} {"train_loss": -7.192374229431152, "global_step": 200957, "epoch": 4784} {"train_loss": -7.277909755706787, "global_step": 200958, "epoch": 4784} {"train_loss": -7.38697624206543, "global_step": 200959, "epoch": 4784} {"train_loss": -7.186275482177734, "global_step": 200960, "epoch": 4784} {"train_loss": -7.356402397155762, "global_step": 200961, "epoch": 4784} {"train_loss": -7.222597122192383, "global_step": 200962, "epoch": 4784} {"train_loss": -7.311901092529297, "global_step": 200963, "epoch": 4784} {"train_loss": -7.185725212097168, "global_step": 200964, "epoch": 4784} {"train_loss": -7.349078178405762, "global_step": 200965, "epoch": 4784} {"train_loss": -7.24080753326416, "global_step": 200966, "epoch": 4784} {"train_loss": -7.245222091674805, "global_step": 200967, "epoch": 4784} {"train_loss": -7.332448959350586, "global_step": 200968, "epoch": 4784} {"train_loss": -7.241306497937157, "global_step": 200969, "epoch": 4784, "val_loss": 70026.2578125} {"train_loss": -7.470953941345215, "global_step": 200970, "epoch": 4785} {"train_loss": -7.217210292816162, "global_step": 200971, "epoch": 4785} {"train_loss": -7.377536773681641, "global_step": 200972, "epoch": 4785} {"train_loss": -7.410558700561523, "global_step": 200973, "epoch": 4785} {"train_loss": -7.286205291748047, "global_step": 200974, "epoch": 4785} {"train_loss": -7.24851655960083, "global_step": 200975, "epoch": 4785} {"train_loss": -7.349249362945557, "global_step": 200976, "epoch": 4785} {"train_loss": -7.271268844604492, "global_step": 200977, "epoch": 4785} {"train_loss": -7.320147514343262, "global_step": 200978, "epoch": 4785} {"train_loss": -7.378435134887695, "global_step": 200979, "epoch": 4785} {"train_loss": -7.346883773803711, "global_step": 200980, "epoch": 4785} {"train_loss": -7.352889060974121, "global_step": 200981, "epoch": 4785} {"train_loss": -7.398724555969238, "global_step": 200982, "epoch": 4785} {"train_loss": -7.286998748779297, "global_step": 200983, "epoch": 4785} {"train_loss": -7.31156063079834, "global_step": 200984, "epoch": 4785} {"train_loss": -7.317827224731445, "global_step": 200985, "epoch": 4785} {"train_loss": -7.093090057373047, "global_step": 200986, "epoch": 4785} {"train_loss": -7.213436603546143, "global_step": 200987, "epoch": 4785} {"train_loss": -7.181846618652344, "global_step": 200988, "epoch": 4785} {"train_loss": -7.139746189117432, "global_step": 200989, "epoch": 4785} {"train_loss": -7.325922966003418, "global_step": 200990, "epoch": 4785} {"train_loss": -7.1048173904418945, "global_step": 200991, "epoch": 4785} {"train_loss": -7.218973636627197, "global_step": 200992, "epoch": 4785} {"train_loss": -7.254851341247559, "global_step": 200993, "epoch": 4785} {"train_loss": -7.177389144897461, "global_step": 200994, "epoch": 4785} {"train_loss": -7.356821537017822, "global_step": 200995, "epoch": 4785} {"train_loss": -7.222972869873047, "global_step": 200996, "epoch": 4785} {"train_loss": -7.192643165588379, "global_step": 200997, "epoch": 4785} {"train_loss": -7.237762928009033, "global_step": 200998, "epoch": 4785} {"train_loss": -7.126030921936035, "global_step": 200999, "epoch": 4785} {"train_loss": -7.244904518127441, "global_step": 201000, "epoch": 4785} {"train_loss": -6.995615005493164, "global_step": 201001, "epoch": 4785} {"train_loss": -7.301815032958984, "global_step": 201002, "epoch": 4785} {"train_loss": -7.165243148803711, "global_step": 201003, "epoch": 4785} {"train_loss": -7.299148082733154, "global_step": 201004, "epoch": 4785} {"train_loss": -7.225237846374512, "global_step": 201005, "epoch": 4785} {"train_loss": -7.170614242553711, "global_step": 201006, "epoch": 4785} {"train_loss": -7.132826328277588, "global_step": 201007, "epoch": 4785} {"train_loss": -7.154120445251465, "global_step": 201008, "epoch": 4785} {"train_loss": -7.143194675445557, "global_step": 201009, "epoch": 4785} {"train_loss": -7.252264022827148, "global_step": 201010, "epoch": 4785} {"train_loss": -7.2497574261256625, "global_step": 201011, "epoch": 4785, "val_loss": 69866.1953125} {"train_loss": -7.2541680335998535, "global_step": 201012, "epoch": 4786} {"train_loss": -7.248141288757324, "global_step": 201013, "epoch": 4786} {"train_loss": -7.232351779937744, "global_step": 201014, "epoch": 4786} {"train_loss": -7.269627094268799, "global_step": 201015, "epoch": 4786} {"train_loss": -7.215418815612793, "global_step": 201016, "epoch": 4786} {"train_loss": -7.223596096038818, "global_step": 201017, "epoch": 4786} {"train_loss": -7.258762359619141, "global_step": 201018, "epoch": 4786} {"train_loss": -7.323504447937012, "global_step": 201019, "epoch": 4786} {"train_loss": -7.263786315917969, "global_step": 201020, "epoch": 4786} {"train_loss": -7.314062118530273, "global_step": 201021, "epoch": 4786} {"train_loss": -7.258035659790039, "global_step": 201022, "epoch": 4786} {"train_loss": -7.322224140167236, "global_step": 201023, "epoch": 4786} {"train_loss": -7.323495864868164, "global_step": 201024, "epoch": 4786} {"train_loss": -7.345647811889648, "global_step": 201025, "epoch": 4786} {"train_loss": -7.285796642303467, "global_step": 201026, "epoch": 4786} {"train_loss": -7.368270397186279, "global_step": 201027, "epoch": 4786} {"train_loss": -7.40806770324707, "global_step": 201028, "epoch": 4786} {"train_loss": -7.192084789276123, "global_step": 201029, "epoch": 4786} {"train_loss": -7.240995407104492, "global_step": 201030, "epoch": 4786} {"train_loss": -7.382781028747559, "global_step": 201031, "epoch": 4786} {"train_loss": -7.176286697387695, "global_step": 201032, "epoch": 4786} {"train_loss": -7.2354326248168945, "global_step": 201033, "epoch": 4786} {"train_loss": -7.24683952331543, "global_step": 201034, "epoch": 4786} {"train_loss": -7.318026542663574, "global_step": 201035, "epoch": 4786} {"train_loss": -7.3793182373046875, "global_step": 201036, "epoch": 4786} {"train_loss": -7.313247203826904, "global_step": 201037, "epoch": 4786} {"train_loss": -7.272348403930664, "global_step": 201038, "epoch": 4786} {"train_loss": -7.195743560791016, "global_step": 201039, "epoch": 4786} {"train_loss": -7.4504828453063965, "global_step": 201040, "epoch": 4786} {"train_loss": -7.252104759216309, "global_step": 201041, "epoch": 4786} {"train_loss": -7.371824264526367, "global_step": 201042, "epoch": 4786} {"train_loss": -7.342289447784424, "global_step": 201043, "epoch": 4786} {"train_loss": -7.311748504638672, "global_step": 201044, "epoch": 4786} {"train_loss": -7.340728282928467, "global_step": 201045, "epoch": 4786} {"train_loss": -7.406112194061279, "global_step": 201046, "epoch": 4786} {"train_loss": -7.320167541503906, "global_step": 201047, "epoch": 4786} {"train_loss": -7.365666389465332, "global_step": 201048, "epoch": 4786} {"train_loss": -7.441413402557373, "global_step": 201049, "epoch": 4786} {"train_loss": -7.290097713470459, "global_step": 201050, "epoch": 4786} {"train_loss": -7.226132869720459, "global_step": 201051, "epoch": 4786} {"train_loss": -7.264073848724365, "global_step": 201052, "epoch": 4786} {"train_loss": -7.301778884161086, "global_step": 201053, "epoch": 4786, "val_loss": 69809.515625} {"train_loss": -7.359194755554199, "global_step": 201054, "epoch": 4787} {"train_loss": -7.341872215270996, "global_step": 201055, "epoch": 4787} {"train_loss": -7.239980697631836, "global_step": 201056, "epoch": 4787} {"train_loss": -7.2820940017700195, "global_step": 201057, "epoch": 4787} {"train_loss": -7.231276512145996, "global_step": 201058, "epoch": 4787} {"train_loss": -7.307004451751709, "global_step": 201059, "epoch": 4787} {"train_loss": -7.3042988777160645, "global_step": 201060, "epoch": 4787} {"train_loss": -7.2963056564331055, "global_step": 201061, "epoch": 4787} {"train_loss": -7.418206214904785, "global_step": 201062, "epoch": 4787} {"train_loss": -7.159431457519531, "global_step": 201063, "epoch": 4787} {"train_loss": -7.243824005126953, "global_step": 201064, "epoch": 4787} {"train_loss": -7.2120280265808105, "global_step": 201065, "epoch": 4787} {"train_loss": -7.2065348625183105, "global_step": 201066, "epoch": 4787} {"train_loss": -7.325558662414551, "global_step": 201067, "epoch": 4787} {"train_loss": -7.279050827026367, "global_step": 201068, "epoch": 4787} {"train_loss": -7.1356658935546875, "global_step": 201069, "epoch": 4787} {"train_loss": -7.317746162414551, "global_step": 201070, "epoch": 4787} {"train_loss": -7.201913833618164, "global_step": 201071, "epoch": 4787} {"train_loss": -7.119289398193359, "global_step": 201072, "epoch": 4787} {"train_loss": -7.269488334655762, "global_step": 201073, "epoch": 4787} {"train_loss": -7.111670970916748, "global_step": 201074, "epoch": 4787} {"train_loss": -7.244784355163574, "global_step": 201075, "epoch": 4787} {"train_loss": -7.316926956176758, "global_step": 201076, "epoch": 4787} {"train_loss": -7.300497531890869, "global_step": 201077, "epoch": 4787} {"train_loss": -7.3695878982543945, "global_step": 201078, "epoch": 4787} {"train_loss": -7.148430824279785, "global_step": 201079, "epoch": 4787} {"train_loss": -7.345996856689453, "global_step": 201080, "epoch": 4787} {"train_loss": -7.18363618850708, "global_step": 201081, "epoch": 4787} {"train_loss": -7.304255485534668, "global_step": 201082, "epoch": 4787} {"train_loss": -7.192543029785156, "global_step": 201083, "epoch": 4787} {"train_loss": -7.294848442077637, "global_step": 201084, "epoch": 4787} {"train_loss": -7.276324272155762, "global_step": 201085, "epoch": 4787} {"train_loss": -7.232167720794678, "global_step": 201086, "epoch": 4787} {"train_loss": -7.289416790008545, "global_step": 201087, "epoch": 4787} {"train_loss": -7.323780059814453, "global_step": 201088, "epoch": 4787} {"train_loss": -7.337166786193848, "global_step": 201089, "epoch": 4787} {"train_loss": -7.330346584320068, "global_step": 201090, "epoch": 4787} {"train_loss": -7.217411994934082, "global_step": 201091, "epoch": 4787} {"train_loss": -7.339687824249268, "global_step": 201092, "epoch": 4787} {"train_loss": -7.394007682800293, "global_step": 201093, "epoch": 4787} {"train_loss": -7.279743671417236, "global_step": 201094, "epoch": 4787} {"train_loss": -7.272485426494053, "global_step": 201095, "epoch": 4787, "val_loss": 69707.3359375} {"train_loss": -7.333545684814453, "global_step": 201096, "epoch": 4788} {"train_loss": -7.342321395874023, "global_step": 201097, "epoch": 4788} {"train_loss": -7.349041938781738, "global_step": 201098, "epoch": 4788} {"train_loss": -7.338593482971191, "global_step": 201099, "epoch": 4788} {"train_loss": -7.303227424621582, "global_step": 201100, "epoch": 4788} {"train_loss": -7.335476398468018, "global_step": 201101, "epoch": 4788} {"train_loss": -7.229372024536133, "global_step": 201102, "epoch": 4788} {"train_loss": -7.32138204574585, "global_step": 201103, "epoch": 4788} {"train_loss": -7.321023941040039, "global_step": 201104, "epoch": 4788} {"train_loss": -7.316867828369141, "global_step": 201105, "epoch": 4788} {"train_loss": -7.296036243438721, "global_step": 201106, "epoch": 4788} {"train_loss": -7.397856712341309, "global_step": 201107, "epoch": 4788} {"train_loss": -7.293076515197754, "global_step": 201108, "epoch": 4788} {"train_loss": -7.290369987487793, "global_step": 201109, "epoch": 4788} {"train_loss": -7.276547431945801, "global_step": 201110, "epoch": 4788} {"train_loss": -7.358285903930664, "global_step": 201111, "epoch": 4788} {"train_loss": -7.289344787597656, "global_step": 201112, "epoch": 4788} {"train_loss": -7.323861122131348, "global_step": 201113, "epoch": 4788} {"train_loss": -7.348026275634766, "global_step": 201114, "epoch": 4788} {"train_loss": -7.196866035461426, "global_step": 201115, "epoch": 4788} {"train_loss": -7.220900535583496, "global_step": 201116, "epoch": 4788} {"train_loss": -7.2003278732299805, "global_step": 201117, "epoch": 4788} {"train_loss": -7.175969123840332, "global_step": 201118, "epoch": 4788} {"train_loss": -7.057267189025879, "global_step": 201119, "epoch": 4788} {"train_loss": -7.21110200881958, "global_step": 201120, "epoch": 4788} {"train_loss": -7.1785478591918945, "global_step": 201121, "epoch": 4788} {"train_loss": -7.2018208503723145, "global_step": 201122, "epoch": 4788} {"train_loss": -7.293748378753662, "global_step": 201123, "epoch": 4788} {"train_loss": -7.342722415924072, "global_step": 201124, "epoch": 4788} {"train_loss": -7.181405544281006, "global_step": 201125, "epoch": 4788} {"train_loss": -7.3208770751953125, "global_step": 201126, "epoch": 4788} {"train_loss": -7.276669979095459, "global_step": 201127, "epoch": 4788} {"train_loss": -7.220489501953125, "global_step": 201128, "epoch": 4788} {"train_loss": -7.2517242431640625, "global_step": 201129, "epoch": 4788} {"train_loss": -7.324370384216309, "global_step": 201130, "epoch": 4788} {"train_loss": -7.239398956298828, "global_step": 201131, "epoch": 4788} {"train_loss": -7.241324424743652, "global_step": 201132, "epoch": 4788} {"train_loss": -7.422844409942627, "global_step": 201133, "epoch": 4788} {"train_loss": -7.112955093383789, "global_step": 201134, "epoch": 4788} {"train_loss": -7.318194389343262, "global_step": 201135, "epoch": 4788} {"train_loss": -7.448733806610107, "global_step": 201136, "epoch": 4788} {"train_loss": -7.279293991270519, "global_step": 201137, "epoch": 4788, "val_loss": 69918.125} {"train_loss": -7.314377307891846, "global_step": 201138, "epoch": 4789} {"train_loss": -7.2868571281433105, "global_step": 201139, "epoch": 4789} {"train_loss": -7.245542526245117, "global_step": 201140, "epoch": 4789} {"train_loss": -7.271634101867676, "global_step": 201141, "epoch": 4789} {"train_loss": -7.329927444458008, "global_step": 201142, "epoch": 4789} {"train_loss": -7.317380905151367, "global_step": 201143, "epoch": 4789} {"train_loss": -7.2975921630859375, "global_step": 201144, "epoch": 4789} {"train_loss": -7.2625250816345215, "global_step": 201145, "epoch": 4789} {"train_loss": -7.263337135314941, "global_step": 201146, "epoch": 4789} {"train_loss": -7.2776336669921875, "global_step": 201147, "epoch": 4789} {"train_loss": -7.284964084625244, "global_step": 201148, "epoch": 4789} {"train_loss": -7.23374080657959, "global_step": 201149, "epoch": 4789} {"train_loss": -7.154550552368164, "global_step": 201150, "epoch": 4789} {"train_loss": -7.320648193359375, "global_step": 201151, "epoch": 4789} {"train_loss": -7.187767028808594, "global_step": 201152, "epoch": 4789} {"train_loss": -7.036606311798096, "global_step": 201153, "epoch": 4789} {"train_loss": -7.304126739501953, "global_step": 201154, "epoch": 4789} {"train_loss": -7.1944169998168945, "global_step": 201155, "epoch": 4789} {"train_loss": -7.203296661376953, "global_step": 201156, "epoch": 4789} {"train_loss": -7.2347412109375, "global_step": 201157, "epoch": 4789} {"train_loss": -7.338271617889404, "global_step": 201158, "epoch": 4789} {"train_loss": -7.264886856079102, "global_step": 201159, "epoch": 4789} {"train_loss": -7.307589054107666, "global_step": 201160, "epoch": 4789} {"train_loss": -7.2461676597595215, "global_step": 201161, "epoch": 4789} {"train_loss": -7.289584636688232, "global_step": 201162, "epoch": 4789} {"train_loss": -7.400042533874512, "global_step": 201163, "epoch": 4789} {"train_loss": -7.308443546295166, "global_step": 201164, "epoch": 4789} {"train_loss": -7.215673446655273, "global_step": 201165, "epoch": 4789} {"train_loss": -7.259050369262695, "global_step": 201166, "epoch": 4789} {"train_loss": -7.235701560974121, "global_step": 201167, "epoch": 4789} {"train_loss": -7.3621721267700195, "global_step": 201168, "epoch": 4789} {"train_loss": -7.278346061706543, "global_step": 201169, "epoch": 4789} {"train_loss": -7.332708358764648, "global_step": 201170, "epoch": 4789} {"train_loss": -7.394896984100342, "global_step": 201171, "epoch": 4789} {"train_loss": -7.191619396209717, "global_step": 201172, "epoch": 4789} {"train_loss": -7.240135192871094, "global_step": 201173, "epoch": 4789} {"train_loss": -7.254887104034424, "global_step": 201174, "epoch": 4789} {"train_loss": -7.171755790710449, "global_step": 201175, "epoch": 4789} {"train_loss": -7.247426986694336, "global_step": 201176, "epoch": 4789} {"train_loss": -6.9878387451171875, "global_step": 201177, "epoch": 4789} {"train_loss": -7.198016166687012, "global_step": 201178, "epoch": 4789} {"train_loss": -7.254737558818999, "global_step": 201179, "epoch": 4789, "val_loss": 69889.3515625} {"train_loss": -7.191074371337891, "global_step": 201180, "epoch": 4790} {"train_loss": -7.2325592041015625, "global_step": 201181, "epoch": 4790} {"train_loss": -7.150291442871094, "global_step": 201182, "epoch": 4790} {"train_loss": -7.273247718811035, "global_step": 201183, "epoch": 4790} {"train_loss": -7.3418869972229, "global_step": 201184, "epoch": 4790} {"train_loss": -7.13095235824585, "global_step": 201185, "epoch": 4790} {"train_loss": -7.149529457092285, "global_step": 201186, "epoch": 4790} {"train_loss": -7.325441360473633, "global_step": 201187, "epoch": 4790} {"train_loss": -7.168830871582031, "global_step": 201188, "epoch": 4790} {"train_loss": -7.2233476638793945, "global_step": 201189, "epoch": 4790} {"train_loss": -7.234894275665283, "global_step": 201190, "epoch": 4790} {"train_loss": -7.323531150817871, "global_step": 201191, "epoch": 4790} {"train_loss": -7.169288635253906, "global_step": 201192, "epoch": 4790} {"train_loss": -7.174001216888428, "global_step": 201193, "epoch": 4790} {"train_loss": -7.318388938903809, "global_step": 201194, "epoch": 4790} {"train_loss": -7.188803672790527, "global_step": 201195, "epoch": 4790} {"train_loss": -7.217069149017334, "global_step": 201196, "epoch": 4790} {"train_loss": -7.112562656402588, "global_step": 201197, "epoch": 4790} {"train_loss": -7.168892860412598, "global_step": 201198, "epoch": 4790} {"train_loss": -7.160964488983154, "global_step": 201199, "epoch": 4790} {"train_loss": -7.252121925354004, "global_step": 201200, "epoch": 4790} {"train_loss": -7.324322700500488, "global_step": 201201, "epoch": 4790} {"train_loss": -7.163928031921387, "global_step": 201202, "epoch": 4790} {"train_loss": -7.219982624053955, "global_step": 201203, "epoch": 4790} {"train_loss": -7.081657886505127, "global_step": 201204, "epoch": 4790} {"train_loss": -7.200511932373047, "global_step": 201205, "epoch": 4790} {"train_loss": -7.14702033996582, "global_step": 201206, "epoch": 4790} {"train_loss": -7.17183256149292, "global_step": 201207, "epoch": 4790} {"train_loss": -7.184097766876221, "global_step": 201208, "epoch": 4790} {"train_loss": -7.197679042816162, "global_step": 201209, "epoch": 4790} {"train_loss": -7.289019584655762, "global_step": 201210, "epoch": 4790} {"train_loss": -7.248135566711426, "global_step": 201211, "epoch": 4790} {"train_loss": -7.341731071472168, "global_step": 201212, "epoch": 4790} {"train_loss": -7.278902053833008, "global_step": 201213, "epoch": 4790} {"train_loss": -7.402376651763916, "global_step": 201214, "epoch": 4790} {"train_loss": -7.339143753051758, "global_step": 201215, "epoch": 4790} {"train_loss": -7.287567615509033, "global_step": 201216, "epoch": 4790} {"train_loss": -7.283102512359619, "global_step": 201217, "epoch": 4790} {"train_loss": -7.219707489013672, "global_step": 201218, "epoch": 4790} {"train_loss": -7.223662853240967, "global_step": 201219, "epoch": 4790} {"train_loss": -7.3523125648498535, "global_step": 201220, "epoch": 4790} {"train_loss": -7.229825269608271, "global_step": 201221, "epoch": 4790, "val_loss": 69841.578125} {"train_loss": -7.383857727050781, "global_step": 201222, "epoch": 4791} {"train_loss": -7.203570365905762, "global_step": 201223, "epoch": 4791} {"train_loss": -7.400464057922363, "global_step": 201224, "epoch": 4791} {"train_loss": -7.413037300109863, "global_step": 201225, "epoch": 4791} {"train_loss": -7.231204509735107, "global_step": 201226, "epoch": 4791} {"train_loss": -7.303221702575684, "global_step": 201227, "epoch": 4791} {"train_loss": -7.328775405883789, "global_step": 201228, "epoch": 4791} {"train_loss": -7.332015037536621, "global_step": 201229, "epoch": 4791} {"train_loss": -7.360523223876953, "global_step": 201230, "epoch": 4791} {"train_loss": -7.329368591308594, "global_step": 201231, "epoch": 4791} {"train_loss": -7.293993949890137, "global_step": 201232, "epoch": 4791} {"train_loss": -7.2325439453125, "global_step": 201233, "epoch": 4791} {"train_loss": -7.437084674835205, "global_step": 201234, "epoch": 4791} {"train_loss": -7.240394592285156, "global_step": 201235, "epoch": 4791} {"train_loss": -7.11036491394043, "global_step": 201236, "epoch": 4791} {"train_loss": -7.264001846313477, "global_step": 201237, "epoch": 4791} {"train_loss": -7.209466934204102, "global_step": 201238, "epoch": 4791} {"train_loss": -7.3001251220703125, "global_step": 201239, "epoch": 4791} {"train_loss": -7.350464820861816, "global_step": 201240, "epoch": 4791} {"train_loss": -7.030974388122559, "global_step": 201241, "epoch": 4791} {"train_loss": -7.276465892791748, "global_step": 201242, "epoch": 4791} {"train_loss": -7.278022766113281, "global_step": 201243, "epoch": 4791} {"train_loss": -7.203982830047607, "global_step": 201244, "epoch": 4791} {"train_loss": -7.3487396240234375, "global_step": 201245, "epoch": 4791} {"train_loss": -7.403928756713867, "global_step": 201246, "epoch": 4791} {"train_loss": -7.212494850158691, "global_step": 201247, "epoch": 4791} {"train_loss": -7.281567096710205, "global_step": 201248, "epoch": 4791} {"train_loss": -7.262653350830078, "global_step": 201249, "epoch": 4791} {"train_loss": -7.202649116516113, "global_step": 201250, "epoch": 4791} {"train_loss": -7.282365798950195, "global_step": 201251, "epoch": 4791} {"train_loss": -7.291993141174316, "global_step": 201252, "epoch": 4791} {"train_loss": -7.365809440612793, "global_step": 201253, "epoch": 4791} {"train_loss": -7.329153060913086, "global_step": 201254, "epoch": 4791} {"train_loss": -7.334421634674072, "global_step": 201255, "epoch": 4791} {"train_loss": -7.305067539215088, "global_step": 201256, "epoch": 4791} {"train_loss": -7.336899280548096, "global_step": 201257, "epoch": 4791} {"train_loss": -7.318717002868652, "global_step": 201258, "epoch": 4791} {"train_loss": -7.366781711578369, "global_step": 201259, "epoch": 4791} {"train_loss": -7.315993309020996, "global_step": 201260, "epoch": 4791} {"train_loss": -7.393773078918457, "global_step": 201261, "epoch": 4791} {"train_loss": -7.335476875305176, "global_step": 201262, "epoch": 4791} {"train_loss": -7.298926489693778, "global_step": 201263, "epoch": 4791, "val_loss": 69660.890625} {"train_loss": -7.410511016845703, "global_step": 201264, "epoch": 4792} {"train_loss": -7.369494915008545, "global_step": 201265, "epoch": 4792} {"train_loss": -7.296132564544678, "global_step": 201266, "epoch": 4792} {"train_loss": -7.274764060974121, "global_step": 201267, "epoch": 4792} {"train_loss": -7.511756896972656, "global_step": 201268, "epoch": 4792} {"train_loss": -7.41170597076416, "global_step": 201269, "epoch": 4792} {"train_loss": -7.174915313720703, "global_step": 201270, "epoch": 4792} {"train_loss": -7.336947917938232, "global_step": 201271, "epoch": 4792} {"train_loss": -7.2732720375061035, "global_step": 201272, "epoch": 4792} {"train_loss": -7.214451789855957, "global_step": 201273, "epoch": 4792} {"train_loss": -7.2395830154418945, "global_step": 201274, "epoch": 4792} {"train_loss": -7.378649711608887, "global_step": 201275, "epoch": 4792} {"train_loss": -7.3386735916137695, "global_step": 201276, "epoch": 4792} {"train_loss": -7.240964889526367, "global_step": 201277, "epoch": 4792} {"train_loss": -7.3687639236450195, "global_step": 201278, "epoch": 4792} {"train_loss": -7.287468910217285, "global_step": 201279, "epoch": 4792} {"train_loss": -7.31321907043457, "global_step": 201280, "epoch": 4792} {"train_loss": -7.323392391204834, "global_step": 201281, "epoch": 4792} {"train_loss": -7.1776628494262695, "global_step": 201282, "epoch": 4792} {"train_loss": -7.183920383453369, "global_step": 201283, "epoch": 4792} {"train_loss": -7.224663257598877, "global_step": 201284, "epoch": 4792} {"train_loss": -7.26340389251709, "global_step": 201285, "epoch": 4792} {"train_loss": -7.10312032699585, "global_step": 201286, "epoch": 4792} {"train_loss": -7.297840118408203, "global_step": 201287, "epoch": 4792} {"train_loss": -7.368721008300781, "global_step": 201288, "epoch": 4792} {"train_loss": -7.1957855224609375, "global_step": 201289, "epoch": 4792} {"train_loss": -7.249263763427734, "global_step": 201290, "epoch": 4792} {"train_loss": -7.237313747406006, "global_step": 201291, "epoch": 4792} {"train_loss": -7.258150100708008, "global_step": 201292, "epoch": 4792} {"train_loss": -7.284756183624268, "global_step": 201293, "epoch": 4792} {"train_loss": -7.280394077301025, "global_step": 201294, "epoch": 4792} {"train_loss": -7.2399444580078125, "global_step": 201295, "epoch": 4792} {"train_loss": -7.205872058868408, "global_step": 201296, "epoch": 4792} {"train_loss": -7.1822829246521, "global_step": 201297, "epoch": 4792} {"train_loss": -7.291573524475098, "global_step": 201298, "epoch": 4792} {"train_loss": -7.268415927886963, "global_step": 201299, "epoch": 4792} {"train_loss": -7.288122177124023, "global_step": 201300, "epoch": 4792} {"train_loss": -7.240687370300293, "global_step": 201301, "epoch": 4792} {"train_loss": -7.36374044418335, "global_step": 201302, "epoch": 4792} {"train_loss": -7.223330974578857, "global_step": 201303, "epoch": 4792} {"train_loss": -7.1495680809021, "global_step": 201304, "epoch": 4792} {"train_loss": -7.277149484271095, "global_step": 201305, "epoch": 4792, "val_loss": 69830.359375} {"train_loss": -7.223354339599609, "global_step": 201306, "epoch": 4793} {"train_loss": -7.335246562957764, "global_step": 201307, "epoch": 4793} {"train_loss": -7.3832292556762695, "global_step": 201308, "epoch": 4793} {"train_loss": -7.396822929382324, "global_step": 201309, "epoch": 4793} {"train_loss": -7.314238548278809, "global_step": 201310, "epoch": 4793} {"train_loss": -7.314003944396973, "global_step": 201311, "epoch": 4793} {"train_loss": -7.181463241577148, "global_step": 201312, "epoch": 4793} {"train_loss": -7.155993461608887, "global_step": 201313, "epoch": 4793} {"train_loss": -7.269570350646973, "global_step": 201314, "epoch": 4793} {"train_loss": -7.16050910949707, "global_step": 201315, "epoch": 4793} {"train_loss": -7.070996284484863, "global_step": 201316, "epoch": 4793} {"train_loss": -7.238857269287109, "global_step": 201317, "epoch": 4793} {"train_loss": -7.290628433227539, "global_step": 201318, "epoch": 4793} {"train_loss": -7.151157379150391, "global_step": 201319, "epoch": 4793} {"train_loss": -7.347216606140137, "global_step": 201320, "epoch": 4793} {"train_loss": -7.191003322601318, "global_step": 201321, "epoch": 4793} {"train_loss": -7.257800102233887, "global_step": 201322, "epoch": 4793} {"train_loss": -7.303407669067383, "global_step": 201323, "epoch": 4793} {"train_loss": -7.203701019287109, "global_step": 201324, "epoch": 4793} {"train_loss": -7.2228899002075195, "global_step": 201325, "epoch": 4793} {"train_loss": -7.19549560546875, "global_step": 201326, "epoch": 4793} {"train_loss": -7.25186824798584, "global_step": 201327, "epoch": 4793} {"train_loss": -7.181604385375977, "global_step": 201328, "epoch": 4793} {"train_loss": -7.179133415222168, "global_step": 201329, "epoch": 4793} {"train_loss": -7.342589378356934, "global_step": 201330, "epoch": 4793} {"train_loss": -7.19242000579834, "global_step": 201331, "epoch": 4793} {"train_loss": -7.281576156616211, "global_step": 201332, "epoch": 4793} {"train_loss": -7.171728610992432, "global_step": 201333, "epoch": 4793} {"train_loss": -7.108556747436523, "global_step": 201334, "epoch": 4793} {"train_loss": -7.30478572845459, "global_step": 201335, "epoch": 4793} {"train_loss": -7.258818626403809, "global_step": 201336, "epoch": 4793} {"train_loss": -7.213490009307861, "global_step": 201337, "epoch": 4793} {"train_loss": -7.164429664611816, "global_step": 201338, "epoch": 4793} {"train_loss": -7.25144624710083, "global_step": 201339, "epoch": 4793} {"train_loss": -7.1935319900512695, "global_step": 201340, "epoch": 4793} {"train_loss": -7.150080680847168, "global_step": 201341, "epoch": 4793} {"train_loss": -7.27639102935791, "global_step": 201342, "epoch": 4793} {"train_loss": -7.324942588806152, "global_step": 201343, "epoch": 4793} {"train_loss": -7.318996429443359, "global_step": 201344, "epoch": 4793} {"train_loss": -7.341897964477539, "global_step": 201345, "epoch": 4793} {"train_loss": -7.387545585632324, "global_step": 201346, "epoch": 4793} {"train_loss": -7.2471245129903155, "global_step": 201347, "epoch": 4793, "val_loss": 69790.1015625} {"train_loss": -7.395040512084961, "global_step": 201348, "epoch": 4794} {"train_loss": -7.378086090087891, "global_step": 201349, "epoch": 4794} {"train_loss": -7.244020462036133, "global_step": 201350, "epoch": 4794} {"train_loss": -7.333012580871582, "global_step": 201351, "epoch": 4794} {"train_loss": -7.352912902832031, "global_step": 201352, "epoch": 4794} {"train_loss": -7.244599342346191, "global_step": 201353, "epoch": 4794} {"train_loss": -7.331294059753418, "global_step": 201354, "epoch": 4794} {"train_loss": -7.391419410705566, "global_step": 201355, "epoch": 4794} {"train_loss": -7.391740798950195, "global_step": 201356, "epoch": 4794} {"train_loss": -7.252737998962402, "global_step": 201357, "epoch": 4794} {"train_loss": -7.30828857421875, "global_step": 201358, "epoch": 4794} {"train_loss": -7.282337665557861, "global_step": 201359, "epoch": 4794} {"train_loss": -7.306732654571533, "global_step": 201360, "epoch": 4794} {"train_loss": -7.287552833557129, "global_step": 201361, "epoch": 4794} {"train_loss": -7.349112510681152, "global_step": 201362, "epoch": 4794} {"train_loss": -7.309759140014648, "global_step": 201363, "epoch": 4794} {"train_loss": -7.155993461608887, "global_step": 201364, "epoch": 4794} {"train_loss": -7.220696449279785, "global_step": 201365, "epoch": 4794} {"train_loss": -7.30880069732666, "global_step": 201366, "epoch": 4794} {"train_loss": -7.158519268035889, "global_step": 201367, "epoch": 4794} {"train_loss": -7.2336812019348145, "global_step": 201368, "epoch": 4794} {"train_loss": -7.228448390960693, "global_step": 201369, "epoch": 4794} {"train_loss": -7.090032577514648, "global_step": 201370, "epoch": 4794} {"train_loss": -7.353394985198975, "global_step": 201371, "epoch": 4794} {"train_loss": -7.245611190795898, "global_step": 201372, "epoch": 4794} {"train_loss": -7.26828145980835, "global_step": 201373, "epoch": 4794} {"train_loss": -7.353328227996826, "global_step": 201374, "epoch": 4794} {"train_loss": -7.289494037628174, "global_step": 201375, "epoch": 4794} {"train_loss": -7.420546531677246, "global_step": 201376, "epoch": 4794} {"train_loss": -7.29922342300415, "global_step": 201377, "epoch": 4794} {"train_loss": -7.24287223815918, "global_step": 201378, "epoch": 4794} {"train_loss": -7.36571741104126, "global_step": 201379, "epoch": 4794} {"train_loss": -7.29258918762207, "global_step": 201380, "epoch": 4794} {"train_loss": -7.319239616394043, "global_step": 201381, "epoch": 4794} {"train_loss": -7.3400797843933105, "global_step": 201382, "epoch": 4794} {"train_loss": -7.295179843902588, "global_step": 201383, "epoch": 4794} {"train_loss": -7.342865943908691, "global_step": 201384, "epoch": 4794} {"train_loss": -7.158673286437988, "global_step": 201385, "epoch": 4794} {"train_loss": -7.2517924308776855, "global_step": 201386, "epoch": 4794} {"train_loss": -7.160592555999756, "global_step": 201387, "epoch": 4794} {"train_loss": -7.272837162017822, "global_step": 201388, "epoch": 4794} {"train_loss": -7.28808119183495, "global_step": 201389, "epoch": 4794, "val_loss": 69899.4375} {"train_loss": -7.1934404373168945, "global_step": 201390, "epoch": 4795} {"train_loss": -7.043027400970459, "global_step": 201391, "epoch": 4795} {"train_loss": -7.175450801849365, "global_step": 201392, "epoch": 4795} {"train_loss": -7.350989818572998, "global_step": 201393, "epoch": 4795} {"train_loss": -7.199366092681885, "global_step": 201394, "epoch": 4795} {"train_loss": -7.278298377990723, "global_step": 201395, "epoch": 4795} {"train_loss": -7.297080993652344, "global_step": 201396, "epoch": 4795} {"train_loss": -7.226584434509277, "global_step": 201397, "epoch": 4795} {"train_loss": -7.322238922119141, "global_step": 201398, "epoch": 4795} {"train_loss": -7.2818145751953125, "global_step": 201399, "epoch": 4795} {"train_loss": -7.26548957824707, "global_step": 201400, "epoch": 4795} {"train_loss": -7.348790645599365, "global_step": 201401, "epoch": 4795} {"train_loss": -7.265618324279785, "global_step": 201402, "epoch": 4795} {"train_loss": -7.343113422393799, "global_step": 201403, "epoch": 4795} {"train_loss": -7.353398323059082, "global_step": 201404, "epoch": 4795} {"train_loss": -7.271850109100342, "global_step": 201405, "epoch": 4795} {"train_loss": -7.2747297286987305, "global_step": 201406, "epoch": 4795} {"train_loss": -7.296041488647461, "global_step": 201407, "epoch": 4795} {"train_loss": -7.384903907775879, "global_step": 201408, "epoch": 4795} {"train_loss": -7.282625675201416, "global_step": 201409, "epoch": 4795} {"train_loss": -7.378485679626465, "global_step": 201410, "epoch": 4795} {"train_loss": -7.400716781616211, "global_step": 201411, "epoch": 4795} {"train_loss": -7.289388656616211, "global_step": 201412, "epoch": 4795} {"train_loss": -7.361495018005371, "global_step": 201413, "epoch": 4795} {"train_loss": -7.317296028137207, "global_step": 201414, "epoch": 4795} {"train_loss": -7.259703636169434, "global_step": 201415, "epoch": 4795} {"train_loss": -7.272111892700195, "global_step": 201416, "epoch": 4795} {"train_loss": -7.288405418395996, "global_step": 201417, "epoch": 4795} {"train_loss": -7.353226661682129, "global_step": 201418, "epoch": 4795} {"train_loss": -7.1907639503479, "global_step": 201419, "epoch": 4795} {"train_loss": -7.225217342376709, "global_step": 201420, "epoch": 4795} {"train_loss": -7.26089334487915, "global_step": 201421, "epoch": 4795} {"train_loss": -7.122707366943359, "global_step": 201422, "epoch": 4795} {"train_loss": -7.354586124420166, "global_step": 201423, "epoch": 4795} {"train_loss": -7.272136211395264, "global_step": 201424, "epoch": 4795} {"train_loss": -7.318292617797852, "global_step": 201425, "epoch": 4795} {"train_loss": -7.310786247253418, "global_step": 201426, "epoch": 4795} {"train_loss": -7.239896774291992, "global_step": 201427, "epoch": 4795} {"train_loss": -7.130377769470215, "global_step": 201428, "epoch": 4795} {"train_loss": -7.209298610687256, "global_step": 201429, "epoch": 4795} {"train_loss": -7.162476539611816, "global_step": 201430, "epoch": 4795} {"train_loss": -7.273313715344384, "global_step": 201431, "epoch": 4795, "val_loss": 69789.3359375} {"train_loss": -7.206611633300781, "global_step": 201432, "epoch": 4796} {"train_loss": -7.281103610992432, "global_step": 201433, "epoch": 4796} {"train_loss": -7.254965782165527, "global_step": 201434, "epoch": 4796} {"train_loss": -7.155303001403809, "global_step": 201435, "epoch": 4796} {"train_loss": -7.256629943847656, "global_step": 201436, "epoch": 4796} {"train_loss": -7.138930320739746, "global_step": 201437, "epoch": 4796} {"train_loss": -7.1477508544921875, "global_step": 201438, "epoch": 4796} {"train_loss": -7.136593818664551, "global_step": 201439, "epoch": 4796} {"train_loss": -7.148557662963867, "global_step": 201440, "epoch": 4796} {"train_loss": -7.289238929748535, "global_step": 201441, "epoch": 4796} {"train_loss": -7.3063435554504395, "global_step": 201442, "epoch": 4796} {"train_loss": -7.191629409790039, "global_step": 201443, "epoch": 4796} {"train_loss": -7.319737434387207, "global_step": 201444, "epoch": 4796} {"train_loss": -7.16190242767334, "global_step": 201445, "epoch": 4796} {"train_loss": -7.290193557739258, "global_step": 201446, "epoch": 4796} {"train_loss": -7.10284423828125, "global_step": 201447, "epoch": 4796} {"train_loss": -7.028521537780762, "global_step": 201448, "epoch": 4796} {"train_loss": -7.207511901855469, "global_step": 201449, "epoch": 4796} {"train_loss": -7.192013740539551, "global_step": 201450, "epoch": 4796} {"train_loss": -7.171436309814453, "global_step": 201451, "epoch": 4796} {"train_loss": -7.338876247406006, "global_step": 201452, "epoch": 4796} {"train_loss": -7.168639183044434, "global_step": 201453, "epoch": 4796} {"train_loss": -7.036252975463867, "global_step": 201454, "epoch": 4796} {"train_loss": -7.2120537757873535, "global_step": 201455, "epoch": 4796} {"train_loss": -7.155677795410156, "global_step": 201456, "epoch": 4796} {"train_loss": -7.1754021644592285, "global_step": 201457, "epoch": 4796} {"train_loss": -7.172895431518555, "global_step": 201458, "epoch": 4796} {"train_loss": -7.243183612823486, "global_step": 201459, "epoch": 4796} {"train_loss": -7.315206050872803, "global_step": 201460, "epoch": 4796} {"train_loss": -7.172241687774658, "global_step": 201461, "epoch": 4796} {"train_loss": -7.245372772216797, "global_step": 201462, "epoch": 4796} {"train_loss": -7.086705207824707, "global_step": 201463, "epoch": 4796} {"train_loss": -7.290250778198242, "global_step": 201464, "epoch": 4796} {"train_loss": -7.0818071365356445, "global_step": 201465, "epoch": 4796} {"train_loss": -7.205262660980225, "global_step": 201466, "epoch": 4796} {"train_loss": -7.291431427001953, "global_step": 201467, "epoch": 4796} {"train_loss": -7.321493148803711, "global_step": 201468, "epoch": 4796} {"train_loss": -7.25063943862915, "global_step": 201469, "epoch": 4796} {"train_loss": -7.274150848388672, "global_step": 201470, "epoch": 4796} {"train_loss": -7.291101455688477, "global_step": 201471, "epoch": 4796} {"train_loss": -7.2338361740112305, "global_step": 201472, "epoch": 4796} {"train_loss": -7.208446865990048, "global_step": 201473, "epoch": 4796, "val_loss": 69847.890625} {"train_loss": -7.262408256530762, "global_step": 201474, "epoch": 4797} {"train_loss": -7.2195563316345215, "global_step": 201475, "epoch": 4797} {"train_loss": -7.402066707611084, "global_step": 201476, "epoch": 4797} {"train_loss": -7.283843994140625, "global_step": 201477, "epoch": 4797} {"train_loss": -7.295254230499268, "global_step": 201478, "epoch": 4797} {"train_loss": -7.308230876922607, "global_step": 201479, "epoch": 4797} {"train_loss": -7.305179595947266, "global_step": 201480, "epoch": 4797} {"train_loss": -7.3479461669921875, "global_step": 201481, "epoch": 4797} {"train_loss": -7.436960697174072, "global_step": 201482, "epoch": 4797} {"train_loss": -7.309708595275879, "global_step": 201483, "epoch": 4797} {"train_loss": -7.340855598449707, "global_step": 201484, "epoch": 4797} {"train_loss": -7.253945350646973, "global_step": 201485, "epoch": 4797} {"train_loss": -7.294106960296631, "global_step": 201486, "epoch": 4797} {"train_loss": -7.369816303253174, "global_step": 201487, "epoch": 4797} {"train_loss": -7.297311782836914, "global_step": 201488, "epoch": 4797} {"train_loss": -7.29718542098999, "global_step": 201489, "epoch": 4797} {"train_loss": -7.343045234680176, "global_step": 201490, "epoch": 4797} {"train_loss": -7.313209533691406, "global_step": 201491, "epoch": 4797} {"train_loss": -7.315077781677246, "global_step": 201492, "epoch": 4797} {"train_loss": -7.3653364181518555, "global_step": 201493, "epoch": 4797} {"train_loss": -7.2750043869018555, "global_step": 201494, "epoch": 4797} {"train_loss": -7.23133659362793, "global_step": 201495, "epoch": 4797} {"train_loss": -7.34108829498291, "global_step": 201496, "epoch": 4797} {"train_loss": -7.20994758605957, "global_step": 201497, "epoch": 4797} {"train_loss": -7.400736331939697, "global_step": 201498, "epoch": 4797} {"train_loss": -7.311640739440918, "global_step": 201499, "epoch": 4797} {"train_loss": -7.226110458374023, "global_step": 201500, "epoch": 4797} {"train_loss": -7.32916259765625, "global_step": 201501, "epoch": 4797} {"train_loss": -7.336639881134033, "global_step": 201502, "epoch": 4797} {"train_loss": -7.221639633178711, "global_step": 201503, "epoch": 4797} {"train_loss": -7.252829551696777, "global_step": 201504, "epoch": 4797} {"train_loss": -7.264979362487793, "global_step": 201505, "epoch": 4797} {"train_loss": -7.366034030914307, "global_step": 201506, "epoch": 4797} {"train_loss": -7.311136245727539, "global_step": 201507, "epoch": 4797} {"train_loss": -7.289153099060059, "global_step": 201508, "epoch": 4797} {"train_loss": -7.158407211303711, "global_step": 201509, "epoch": 4797} {"train_loss": -7.218672275543213, "global_step": 201510, "epoch": 4797} {"train_loss": -7.344247341156006, "global_step": 201511, "epoch": 4797} {"train_loss": -7.208483695983887, "global_step": 201512, "epoch": 4797} {"train_loss": -7.390276908874512, "global_step": 201513, "epoch": 4797} {"train_loss": -7.356166839599609, "global_step": 201514, "epoch": 4797} {"train_loss": -7.295748018083119, "global_step": 201515, "epoch": 4797, "val_loss": 70007.25} {"train_loss": -7.27976655960083, "global_step": 201516, "epoch": 4798} {"train_loss": -7.131683826446533, "global_step": 201517, "epoch": 4798} {"train_loss": -7.195187568664551, "global_step": 201518, "epoch": 4798} {"train_loss": -7.3166375160217285, "global_step": 201519, "epoch": 4798} {"train_loss": -7.2040228843688965, "global_step": 201520, "epoch": 4798} {"train_loss": -7.2375664710998535, "global_step": 201521, "epoch": 4798} {"train_loss": -7.172603607177734, "global_step": 201522, "epoch": 4798} {"train_loss": -7.15645170211792, "global_step": 201523, "epoch": 4798} {"train_loss": -7.259458065032959, "global_step": 201524, "epoch": 4798} {"train_loss": -7.098506927490234, "global_step": 201525, "epoch": 4798} {"train_loss": -7.263364791870117, "global_step": 201526, "epoch": 4798} {"train_loss": -7.279292106628418, "global_step": 201527, "epoch": 4798} {"train_loss": -7.140728950500488, "global_step": 201528, "epoch": 4798} {"train_loss": -7.257073879241943, "global_step": 201529, "epoch": 4798} {"train_loss": -7.249212265014648, "global_step": 201530, "epoch": 4798} {"train_loss": -7.355616092681885, "global_step": 201531, "epoch": 4798} {"train_loss": -7.151999473571777, "global_step": 201532, "epoch": 4798} {"train_loss": -7.322934150695801, "global_step": 201533, "epoch": 4798} {"train_loss": -7.278617858886719, "global_step": 201534, "epoch": 4798} {"train_loss": -7.27541446685791, "global_step": 201535, "epoch": 4798} {"train_loss": -7.325601100921631, "global_step": 201536, "epoch": 4798} {"train_loss": -7.327108860015869, "global_step": 201537, "epoch": 4798} {"train_loss": -7.3006768226623535, "global_step": 201538, "epoch": 4798} {"train_loss": -7.246297359466553, "global_step": 201539, "epoch": 4798} {"train_loss": -7.35774040222168, "global_step": 201540, "epoch": 4798} {"train_loss": -7.268712997436523, "global_step": 201541, "epoch": 4798} {"train_loss": -7.168335437774658, "global_step": 201542, "epoch": 4798} {"train_loss": -7.31075382232666, "global_step": 201543, "epoch": 4798} {"train_loss": -7.32651424407959, "global_step": 201544, "epoch": 4798} {"train_loss": -7.142818450927734, "global_step": 201545, "epoch": 4798} {"train_loss": -7.209664821624756, "global_step": 201546, "epoch": 4798} {"train_loss": -7.243313312530518, "global_step": 201547, "epoch": 4798} {"train_loss": -7.277438640594482, "global_step": 201548, "epoch": 4798} {"train_loss": -7.197598457336426, "global_step": 201549, "epoch": 4798} {"train_loss": -7.215725421905518, "global_step": 201550, "epoch": 4798} {"train_loss": -7.235874176025391, "global_step": 201551, "epoch": 4798} {"train_loss": -7.3105998039245605, "global_step": 201552, "epoch": 4798} {"train_loss": -7.248618125915527, "global_step": 201553, "epoch": 4798} {"train_loss": -7.101237773895264, "global_step": 201554, "epoch": 4798} {"train_loss": -7.2225165367126465, "global_step": 201555, "epoch": 4798} {"train_loss": -7.237475872039795, "global_step": 201556, "epoch": 4798} {"train_loss": -7.244627191906884, "global_step": 201557, "epoch": 4798, "val_loss": 69772.703125} {"train_loss": -7.338071823120117, "global_step": 201558, "epoch": 4799} {"train_loss": -7.241636276245117, "global_step": 201559, "epoch": 4799} {"train_loss": -7.3564229011535645, "global_step": 201560, "epoch": 4799} {"train_loss": -7.166041374206543, "global_step": 201561, "epoch": 4799} {"train_loss": -7.177095413208008, "global_step": 201562, "epoch": 4799} {"train_loss": -7.1400146484375, "global_step": 201563, "epoch": 4799} {"train_loss": -7.2057013511657715, "global_step": 201564, "epoch": 4799} {"train_loss": -7.173984527587891, "global_step": 201565, "epoch": 4799} {"train_loss": -7.04765510559082, "global_step": 201566, "epoch": 4799} {"train_loss": -7.146239280700684, "global_step": 201567, "epoch": 4799} {"train_loss": -7.16468620300293, "global_step": 201568, "epoch": 4799} {"train_loss": -6.887773036956787, "global_step": 201569, "epoch": 4799} {"train_loss": -7.200613498687744, "global_step": 201570, "epoch": 4799} {"train_loss": -7.1675801277160645, "global_step": 201571, "epoch": 4799} {"train_loss": -7.207561492919922, "global_step": 201572, "epoch": 4799} {"train_loss": -7.195966720581055, "global_step": 201573, "epoch": 4799} {"train_loss": -7.123957633972168, "global_step": 201574, "epoch": 4799} {"train_loss": -7.261319637298584, "global_step": 201575, "epoch": 4799} {"train_loss": -7.142055034637451, "global_step": 201576, "epoch": 4799} {"train_loss": -7.102749824523926, "global_step": 201577, "epoch": 4799} {"train_loss": -7.133589744567871, "global_step": 201578, "epoch": 4799} {"train_loss": -7.123615264892578, "global_step": 201579, "epoch": 4799} {"train_loss": -7.145278453826904, "global_step": 201580, "epoch": 4799} {"train_loss": -7.086882591247559, "global_step": 201581, "epoch": 4799} {"train_loss": -7.295599937438965, "global_step": 201582, "epoch": 4799} {"train_loss": -7.173027992248535, "global_step": 201583, "epoch": 4799} {"train_loss": -7.120624542236328, "global_step": 201584, "epoch": 4799} {"train_loss": -7.301564693450928, "global_step": 201585, "epoch": 4799} {"train_loss": -7.301550388336182, "global_step": 201586, "epoch": 4799} {"train_loss": -7.25570011138916, "global_step": 201587, "epoch": 4799} {"train_loss": -7.205982208251953, "global_step": 201588, "epoch": 4799} {"train_loss": -7.296962738037109, "global_step": 201589, "epoch": 4799} {"train_loss": -7.3299407958984375, "global_step": 201590, "epoch": 4799} {"train_loss": -7.33380126953125, "global_step": 201591, "epoch": 4799} {"train_loss": -7.294873237609863, "global_step": 201592, "epoch": 4799} {"train_loss": -7.304146766662598, "global_step": 201593, "epoch": 4799} {"train_loss": -7.412631988525391, "global_step": 201594, "epoch": 4799} {"train_loss": -7.384897708892822, "global_step": 201595, "epoch": 4799} {"train_loss": -7.323173522949219, "global_step": 201596, "epoch": 4799} {"train_loss": -7.364016056060791, "global_step": 201597, "epoch": 4799} {"train_loss": -7.250857353210449, "global_step": 201598, "epoch": 4799} {"train_loss": -7.220874582018171, "global_step": 201599, "epoch": 4799, "val_loss": 69768.9453125} {"train_loss": -7.390271186828613, "global_step": 201600, "epoch": 4800} {"train_loss": -7.371763229370117, "global_step": 201601, "epoch": 4800} {"train_loss": -7.342597007751465, "global_step": 201602, "epoch": 4800} {"train_loss": -7.308399200439453, "global_step": 201603, "epoch": 4800} {"train_loss": -7.337852478027344, "global_step": 201604, "epoch": 4800} {"train_loss": -7.334985733032227, "global_step": 201605, "epoch": 4800} {"train_loss": -7.397944927215576, "global_step": 201606, "epoch": 4800} {"train_loss": -7.371166229248047, "global_step": 201607, "epoch": 4800} {"train_loss": -7.223728179931641, "global_step": 201608, "epoch": 4800} {"train_loss": -7.389715194702148, "global_step": 201609, "epoch": 4800} {"train_loss": -7.318597793579102, "global_step": 201610, "epoch": 4800} {"train_loss": -7.332361698150635, "global_step": 201611, "epoch": 4800} {"train_loss": -7.2640380859375, "global_step": 201612, "epoch": 4800} {"train_loss": -7.4503936767578125, "global_step": 201613, "epoch": 4800} {"train_loss": -7.333538055419922, "global_step": 201614, "epoch": 4800} {"train_loss": -7.256623268127441, "global_step": 201615, "epoch": 4800} {"train_loss": -7.3457794189453125, "global_step": 201616, "epoch": 4800} {"train_loss": -7.362792015075684, "global_step": 201617, "epoch": 4800} {"train_loss": -7.25705623626709, "global_step": 201618, "epoch": 4800} {"train_loss": -7.427397727966309, "global_step": 201619, "epoch": 4800} {"train_loss": -7.270709991455078, "global_step": 201620, "epoch": 4800} {"train_loss": -7.265071868896484, "global_step": 201621, "epoch": 4800} {"train_loss": -7.37984561920166, "global_step": 201622, "epoch": 4800} {"train_loss": -7.261003494262695, "global_step": 201623, "epoch": 4800} {"train_loss": -7.153587341308594, "global_step": 201624, "epoch": 4800} {"train_loss": -7.199151039123535, "global_step": 201625, "epoch": 4800} {"train_loss": -7.106784343719482, "global_step": 201626, "epoch": 4800} {"train_loss": -6.9467315673828125, "global_step": 201627, "epoch": 4800} {"train_loss": -7.0955424308776855, "global_step": 201628, "epoch": 4800} {"train_loss": -7.0323357582092285, "global_step": 201629, "epoch": 4800} {"train_loss": -6.8848161697387695, "global_step": 201630, "epoch": 4800} {"train_loss": -7.2714948654174805, "global_step": 201631, "epoch": 4800} {"train_loss": -6.880866050720215, "global_step": 201632, "epoch": 4800} {"train_loss": -7.083551406860352, "global_step": 201633, "epoch": 4800} {"train_loss": -7.067283630371094, "global_step": 201634, "epoch": 4800} {"train_loss": -7.160057067871094, "global_step": 201635, "epoch": 4800} {"train_loss": -7.037210464477539, "global_step": 201636, "epoch": 4800} {"train_loss": -7.177817344665527, "global_step": 201637, "epoch": 4800} {"train_loss": -7.08098030090332, "global_step": 201638, "epoch": 4800} {"train_loss": -7.206046104431152, "global_step": 201639, "epoch": 4800} {"train_loss": -7.082793235778809, "global_step": 201640, "epoch": 4800} {"train_loss": -7.229566505977085, "global_step": 201641, "epoch": 4800, "train/sim_max_reward_0": 0.19033475454157764, "train/sim_max_reward_1": 0.9525749892701284, "train/sim_max_reward_2": 0.5554690590762988, "train/sim_max_reward_3": 0.1304207752411336, "train/sim_max_reward_4": 0.9880635953063727, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4300000": 0.9143073528575832, "test/sim_max_reward_4300001": 0.6917529769297202, "test/sim_max_reward_4300002": 0.9670183584927028, "test/sim_max_reward_4300003": 0.8503643675683046, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9320599104905263, "test/sim_max_reward_4300006": 0.9999248264514545, "test/sim_max_reward_4300007": 0.30804487546976617, "test/sim_max_reward_4300008": 0.983303489791277, "test/sim_max_reward_4300009": 0.9909248575182089, "test/sim_max_reward_4300010": 0.9936936479955935, "test/sim_max_reward_4300011": 0.9593753005027501, "test/sim_max_reward_4300012": 0.9871297873311835, "test/sim_max_reward_4300013": 0.5581487039433971, "test/sim_max_reward_4300014": 1.0, "test/sim_max_reward_4300015": 0.9297045574343745, "test/sim_max_reward_4300016": 0.8195310024472187, "test/sim_max_reward_4300017": 0.47595554877754376, "test/sim_max_reward_4300018": 0.9220430208334236, "test/sim_max_reward_4300019": 0.18624024545217657, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.805413608046762, "test/sim_max_reward_4300022": 0.938947626439812, "test/sim_max_reward_4300023": 0.9491575944745329, "test/sim_max_reward_4300024": 0.8753532804479898, "test/sim_max_reward_4300025": 0.9820306385493299, "test/sim_max_reward_4300026": 0.11394588039791634, "test/sim_max_reward_4300027": 0.9161131036577717, "test/sim_max_reward_4300028": 0.7509630149338548, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.14527395425865347, "test/sim_max_reward_4300031": 0.20862047667674563, "test/sim_max_reward_4300032": 0.9368397735091076, "test/sim_max_reward_4300033": 0.9474779812520598, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.657264807092621, "test/sim_max_reward_4300036": 0.20289289500464042, "test/sim_max_reward_4300037": 0.8616975551296212, "test/sim_max_reward_4300038": 0.9320831275077965, "test/sim_max_reward_4300039": 1.0, "test/sim_max_reward_4300040": 0.9965056452896985, "test/sim_max_reward_4300041": 0.8762026584279379, "test/sim_max_reward_4300042": 0.7125680008591709, "test/sim_max_reward_4300043": 0.11475057586894194, "test/sim_max_reward_4300044": 0.04345707006804553, "test/sim_max_reward_4300045": 0.8949809270545527, "test/sim_max_reward_4300046": 0.8339388691802873, "test/sim_max_reward_4300047": 0.11754137787262176, "test/sim_max_reward_4300048": 0.007206984073541225, "test/sim_max_reward_4300049": 0.18720838033151807, "train/mean_score": 0.5016413221329498, "test/mean_score": 0.6498758548300405, "val_loss": 70078.3984375} {"train_loss": -7.150296211242676, "global_step": 201642, "epoch": 4801} {"train_loss": -7.098013401031494, "global_step": 201643, "epoch": 4801} {"train_loss": -7.136677265167236, "global_step": 201644, "epoch": 4801} {"train_loss": -7.185054779052734, "global_step": 201645, "epoch": 4801} {"train_loss": -7.204418182373047, "global_step": 201646, "epoch": 4801} {"train_loss": -7.162041664123535, "global_step": 201647, "epoch": 4801} {"train_loss": -7.293709754943848, "global_step": 201648, "epoch": 4801} {"train_loss": -7.2315874099731445, "global_step": 201649, "epoch": 4801} {"train_loss": -7.193211555480957, "global_step": 201650, "epoch": 4801} {"train_loss": -7.273122787475586, "global_step": 201651, "epoch": 4801} {"train_loss": -7.206543922424316, "global_step": 201652, "epoch": 4801} {"train_loss": -7.214875221252441, "global_step": 201653, "epoch": 4801} {"train_loss": -7.27622652053833, "global_step": 201654, "epoch": 4801} {"train_loss": -7.143899917602539, "global_step": 201655, "epoch": 4801} {"train_loss": -7.328647613525391, "global_step": 201656, "epoch": 4801} {"train_loss": -7.265591621398926, "global_step": 201657, "epoch": 4801} {"train_loss": -7.185568809509277, "global_step": 201658, "epoch": 4801} {"train_loss": -7.3133769035339355, "global_step": 201659, "epoch": 4801} {"train_loss": -7.251757621765137, "global_step": 201660, "epoch": 4801} {"train_loss": -7.20656156539917, "global_step": 201661, "epoch": 4801} {"train_loss": -7.237095832824707, "global_step": 201662, "epoch": 4801} {"train_loss": -7.153911590576172, "global_step": 201663, "epoch": 4801} {"train_loss": -7.270393371582031, "global_step": 201664, "epoch": 4801} {"train_loss": -7.378015041351318, "global_step": 201665, "epoch": 4801} {"train_loss": -7.262355804443359, "global_step": 201666, "epoch": 4801} {"train_loss": -7.226276397705078, "global_step": 201667, "epoch": 4801} {"train_loss": -7.268636703491211, "global_step": 201668, "epoch": 4801} {"train_loss": -7.273811340332031, "global_step": 201669, "epoch": 4801} {"train_loss": -7.177147388458252, "global_step": 201670, "epoch": 4801} {"train_loss": -7.262564659118652, "global_step": 201671, "epoch": 4801} {"train_loss": -7.158573150634766, "global_step": 201672, "epoch": 4801} {"train_loss": -7.322538375854492, "global_step": 201673, "epoch": 4801} {"train_loss": -7.133437156677246, "global_step": 201674, "epoch": 4801} {"train_loss": -7.240056991577148, "global_step": 201675, "epoch": 4801} {"train_loss": -7.275495529174805, "global_step": 201676, "epoch": 4801} {"train_loss": -7.300334930419922, "global_step": 201677, "epoch": 4801} {"train_loss": -7.299023628234863, "global_step": 201678, "epoch": 4801} {"train_loss": -7.154115676879883, "global_step": 201679, "epoch": 4801} {"train_loss": -7.2150678634643555, "global_step": 201680, "epoch": 4801} {"train_loss": -7.301779747009277, "global_step": 201681, "epoch": 4801} {"train_loss": -7.2501678466796875, "global_step": 201682, "epoch": 4801} {"train_loss": -7.233927488327026, "global_step": 201683, "epoch": 4801, "val_loss": 69838.3359375} {"train_loss": -7.161864280700684, "global_step": 201684, "epoch": 4802} {"train_loss": -7.195745944976807, "global_step": 201685, "epoch": 4802} {"train_loss": -7.300690650939941, "global_step": 201686, "epoch": 4802} {"train_loss": -7.36424446105957, "global_step": 201687, "epoch": 4802} {"train_loss": -7.159333229064941, "global_step": 201688, "epoch": 4802} {"train_loss": -7.113827705383301, "global_step": 201689, "epoch": 4802} {"train_loss": -7.138001918792725, "global_step": 201690, "epoch": 4802} {"train_loss": -7.199936866760254, "global_step": 201691, "epoch": 4802} {"train_loss": -6.9692487716674805, "global_step": 201692, "epoch": 4802} {"train_loss": -7.267589569091797, "global_step": 201693, "epoch": 4802} {"train_loss": -7.18214225769043, "global_step": 201694, "epoch": 4802} {"train_loss": -7.091565132141113, "global_step": 201695, "epoch": 4802} {"train_loss": -7.128818988800049, "global_step": 201696, "epoch": 4802} {"train_loss": -7.161665916442871, "global_step": 201697, "epoch": 4802} {"train_loss": -7.188154220581055, "global_step": 201698, "epoch": 4802} {"train_loss": -7.032308578491211, "global_step": 201699, "epoch": 4802} {"train_loss": -7.159734725952148, "global_step": 201700, "epoch": 4802} {"train_loss": -7.149003982543945, "global_step": 201701, "epoch": 4802} {"train_loss": -7.273250579833984, "global_step": 201702, "epoch": 4802} {"train_loss": -7.213271141052246, "global_step": 201703, "epoch": 4802} {"train_loss": -7.221562385559082, "global_step": 201704, "epoch": 4802} {"train_loss": -7.242863178253174, "global_step": 201705, "epoch": 4802} {"train_loss": -7.148053169250488, "global_step": 201706, "epoch": 4802} {"train_loss": -7.283180236816406, "global_step": 201707, "epoch": 4802} {"train_loss": -7.1937150955200195, "global_step": 201708, "epoch": 4802} {"train_loss": -7.366807460784912, "global_step": 201709, "epoch": 4802} {"train_loss": -7.2493791580200195, "global_step": 201710, "epoch": 4802} {"train_loss": -7.312967300415039, "global_step": 201711, "epoch": 4802} {"train_loss": -7.1768951416015625, "global_step": 201712, "epoch": 4802} {"train_loss": -7.239311218261719, "global_step": 201713, "epoch": 4802} {"train_loss": -7.316912651062012, "global_step": 201714, "epoch": 4802} {"train_loss": -7.200601100921631, "global_step": 201715, "epoch": 4802} {"train_loss": -7.245689392089844, "global_step": 201716, "epoch": 4802} {"train_loss": -7.324866771697998, "global_step": 201717, "epoch": 4802} {"train_loss": -7.271642684936523, "global_step": 201718, "epoch": 4802} {"train_loss": -7.324347019195557, "global_step": 201719, "epoch": 4802} {"train_loss": -7.354223251342773, "global_step": 201720, "epoch": 4802} {"train_loss": -7.354458808898926, "global_step": 201721, "epoch": 4802} {"train_loss": -7.285050868988037, "global_step": 201722, "epoch": 4802} {"train_loss": -7.287139892578125, "global_step": 201723, "epoch": 4802} {"train_loss": -7.169116020202637, "global_step": 201724, "epoch": 4802} {"train_loss": -7.2202823389144175, "global_step": 201725, "epoch": 4802, "val_loss": 69661.2421875} {"train_loss": -7.3566813468933105, "global_step": 201726, "epoch": 4803} {"train_loss": -7.150964736938477, "global_step": 201727, "epoch": 4803} {"train_loss": -7.2210307121276855, "global_step": 201728, "epoch": 4803} {"train_loss": -7.188776016235352, "global_step": 201729, "epoch": 4803} {"train_loss": -7.244752883911133, "global_step": 201730, "epoch": 4803} {"train_loss": -7.213855743408203, "global_step": 201731, "epoch": 4803} {"train_loss": -7.224732398986816, "global_step": 201732, "epoch": 4803} {"train_loss": -7.2852559089660645, "global_step": 201733, "epoch": 4803} {"train_loss": -7.065877914428711, "global_step": 201734, "epoch": 4803} {"train_loss": -7.198238372802734, "global_step": 201735, "epoch": 4803} {"train_loss": -7.202670574188232, "global_step": 201736, "epoch": 4803} {"train_loss": -7.232155799865723, "global_step": 201737, "epoch": 4803} {"train_loss": -7.134973526000977, "global_step": 201738, "epoch": 4803} {"train_loss": -7.210687637329102, "global_step": 201739, "epoch": 4803} {"train_loss": -7.366579532623291, "global_step": 201740, "epoch": 4803} {"train_loss": -7.215761661529541, "global_step": 201741, "epoch": 4803} {"train_loss": -7.275764465332031, "global_step": 201742, "epoch": 4803} {"train_loss": -7.143263816833496, "global_step": 201743, "epoch": 4803} {"train_loss": -7.206001281738281, "global_step": 201744, "epoch": 4803} {"train_loss": -7.228941917419434, "global_step": 201745, "epoch": 4803} {"train_loss": -7.424278736114502, "global_step": 201746, "epoch": 4803} {"train_loss": -7.277487754821777, "global_step": 201747, "epoch": 4803} {"train_loss": -7.277673244476318, "global_step": 201748, "epoch": 4803} {"train_loss": -7.265553951263428, "global_step": 201749, "epoch": 4803} {"train_loss": -7.325935363769531, "global_step": 201750, "epoch": 4803} {"train_loss": -7.344460964202881, "global_step": 201751, "epoch": 4803} {"train_loss": -7.298315048217773, "global_step": 201752, "epoch": 4803} {"train_loss": -7.3018293380737305, "global_step": 201753, "epoch": 4803} {"train_loss": -7.340898513793945, "global_step": 201754, "epoch": 4803} {"train_loss": -7.439706802368164, "global_step": 201755, "epoch": 4803} {"train_loss": -7.335515975952148, "global_step": 201756, "epoch": 4803} {"train_loss": -7.210726737976074, "global_step": 201757, "epoch": 4803} {"train_loss": -7.248884201049805, "global_step": 201758, "epoch": 4803} {"train_loss": -7.079802513122559, "global_step": 201759, "epoch": 4803} {"train_loss": -7.281519889831543, "global_step": 201760, "epoch": 4803} {"train_loss": -7.266887664794922, "global_step": 201761, "epoch": 4803} {"train_loss": -7.379934310913086, "global_step": 201762, "epoch": 4803} {"train_loss": -7.35753059387207, "global_step": 201763, "epoch": 4803} {"train_loss": -7.361466884613037, "global_step": 201764, "epoch": 4803} {"train_loss": -7.4227986335754395, "global_step": 201765, "epoch": 4803} {"train_loss": -7.4177937507629395, "global_step": 201766, "epoch": 4803} {"train_loss": -7.2718846797943115, "global_step": 201767, "epoch": 4803, "val_loss": 69768.7421875} {"train_loss": -7.32343864440918, "global_step": 201768, "epoch": 4804} {"train_loss": -7.193610191345215, "global_step": 201769, "epoch": 4804} {"train_loss": -7.3302106857299805, "global_step": 201770, "epoch": 4804} {"train_loss": -7.39912223815918, "global_step": 201771, "epoch": 4804} {"train_loss": -7.146513938903809, "global_step": 201772, "epoch": 4804} {"train_loss": -7.373516082763672, "global_step": 201773, "epoch": 4804} {"train_loss": -7.3579230308532715, "global_step": 201774, "epoch": 4804} {"train_loss": -7.273188591003418, "global_step": 201775, "epoch": 4804} {"train_loss": -7.329769134521484, "global_step": 201776, "epoch": 4804} {"train_loss": -7.22857666015625, "global_step": 201777, "epoch": 4804} {"train_loss": -7.284287452697754, "global_step": 201778, "epoch": 4804} {"train_loss": -7.26820182800293, "global_step": 201779, "epoch": 4804} {"train_loss": -7.289077281951904, "global_step": 201780, "epoch": 4804} {"train_loss": -7.375232219696045, "global_step": 201781, "epoch": 4804} {"train_loss": -7.353289604187012, "global_step": 201782, "epoch": 4804} {"train_loss": -7.262238502502441, "global_step": 201783, "epoch": 4804} {"train_loss": -7.226580619812012, "global_step": 201784, "epoch": 4804} {"train_loss": -7.4145917892456055, "global_step": 201785, "epoch": 4804} {"train_loss": -7.335301876068115, "global_step": 201786, "epoch": 4804} {"train_loss": -7.35505485534668, "global_step": 201787, "epoch": 4804} {"train_loss": -7.367008686065674, "global_step": 201788, "epoch": 4804} {"train_loss": -7.311394691467285, "global_step": 201789, "epoch": 4804} {"train_loss": -7.320618152618408, "global_step": 201790, "epoch": 4804} {"train_loss": -7.169299602508545, "global_step": 201791, "epoch": 4804} {"train_loss": -7.1692399978637695, "global_step": 201792, "epoch": 4804} {"train_loss": -7.252835273742676, "global_step": 201793, "epoch": 4804} {"train_loss": -7.3888258934021, "global_step": 201794, "epoch": 4804} {"train_loss": -7.165350914001465, "global_step": 201795, "epoch": 4804} {"train_loss": -7.125921249389648, "global_step": 201796, "epoch": 4804} {"train_loss": -7.287935733795166, "global_step": 201797, "epoch": 4804} {"train_loss": -7.1905317306518555, "global_step": 201798, "epoch": 4804} {"train_loss": -7.230807304382324, "global_step": 201799, "epoch": 4804} {"train_loss": -7.111356735229492, "global_step": 201800, "epoch": 4804} {"train_loss": -7.365752696990967, "global_step": 201801, "epoch": 4804} {"train_loss": -7.239738941192627, "global_step": 201802, "epoch": 4804} {"train_loss": -7.1810407638549805, "global_step": 201803, "epoch": 4804} {"train_loss": -7.296764373779297, "global_step": 201804, "epoch": 4804} {"train_loss": -7.2670722007751465, "global_step": 201805, "epoch": 4804} {"train_loss": -7.220221042633057, "global_step": 201806, "epoch": 4804} {"train_loss": -7.32231330871582, "global_step": 201807, "epoch": 4804} {"train_loss": -7.191317081451416, "global_step": 201808, "epoch": 4804} {"train_loss": -7.2759166445050925, "global_step": 201809, "epoch": 4804, "val_loss": 70108.0234375} {"train_loss": -7.311158180236816, "global_step": 201810, "epoch": 4805} {"train_loss": -7.172799110412598, "global_step": 201811, "epoch": 4805} {"train_loss": -7.258770942687988, "global_step": 201812, "epoch": 4805} {"train_loss": -7.2976298332214355, "global_step": 201813, "epoch": 4805} {"train_loss": -7.161134719848633, "global_step": 201814, "epoch": 4805} {"train_loss": -7.194551944732666, "global_step": 201815, "epoch": 4805} {"train_loss": -7.220310688018799, "global_step": 201816, "epoch": 4805} {"train_loss": -7.195940971374512, "global_step": 201817, "epoch": 4805} {"train_loss": -7.327174663543701, "global_step": 201818, "epoch": 4805} {"train_loss": -7.247531890869141, "global_step": 201819, "epoch": 4805} {"train_loss": -7.185691833496094, "global_step": 201820, "epoch": 4805} {"train_loss": -7.235492706298828, "global_step": 201821, "epoch": 4805} {"train_loss": -7.318862438201904, "global_step": 201822, "epoch": 4805} {"train_loss": -7.188368797302246, "global_step": 201823, "epoch": 4805} {"train_loss": -7.3569464683532715, "global_step": 201824, "epoch": 4805} {"train_loss": -7.202631950378418, "global_step": 201825, "epoch": 4805} {"train_loss": -7.286428451538086, "global_step": 201826, "epoch": 4805} {"train_loss": -7.23367977142334, "global_step": 201827, "epoch": 4805} {"train_loss": -7.078091621398926, "global_step": 201828, "epoch": 4805} {"train_loss": -7.322076797485352, "global_step": 201829, "epoch": 4805} {"train_loss": -7.243587017059326, "global_step": 201830, "epoch": 4805} {"train_loss": -7.263030052185059, "global_step": 201831, "epoch": 4805} {"train_loss": -7.158808708190918, "global_step": 201832, "epoch": 4805} {"train_loss": -7.233075141906738, "global_step": 201833, "epoch": 4805} {"train_loss": -7.352838039398193, "global_step": 201834, "epoch": 4805} {"train_loss": -7.238675117492676, "global_step": 201835, "epoch": 4805} {"train_loss": -7.152347087860107, "global_step": 201836, "epoch": 4805} {"train_loss": -7.302543640136719, "global_step": 201837, "epoch": 4805} {"train_loss": -7.310555934906006, "global_step": 201838, "epoch": 4805} {"train_loss": -7.293505668640137, "global_step": 201839, "epoch": 4805} {"train_loss": -7.300151824951172, "global_step": 201840, "epoch": 4805} {"train_loss": -7.2206244468688965, "global_step": 201841, "epoch": 4805} {"train_loss": -7.277702808380127, "global_step": 201842, "epoch": 4805} {"train_loss": -7.230432510375977, "global_step": 201843, "epoch": 4805} {"train_loss": -7.312283039093018, "global_step": 201844, "epoch": 4805} {"train_loss": -7.3235368728637695, "global_step": 201845, "epoch": 4805} {"train_loss": -7.300681114196777, "global_step": 201846, "epoch": 4805} {"train_loss": -7.324840545654297, "global_step": 201847, "epoch": 4805} {"train_loss": -7.24755334854126, "global_step": 201848, "epoch": 4805} {"train_loss": -7.301670074462891, "global_step": 201849, "epoch": 4805} {"train_loss": -7.490509033203125, "global_step": 201850, "epoch": 4805} {"train_loss": -7.2628645442780995, "global_step": 201851, "epoch": 4805, "val_loss": 69944.2890625} {"train_loss": -7.321929454803467, "global_step": 201852, "epoch": 4806} {"train_loss": -7.300920486450195, "global_step": 201853, "epoch": 4806} {"train_loss": -7.328147888183594, "global_step": 201854, "epoch": 4806} {"train_loss": -7.41267204284668, "global_step": 201855, "epoch": 4806} {"train_loss": -7.243108749389648, "global_step": 201856, "epoch": 4806} {"train_loss": -7.2874040603637695, "global_step": 201857, "epoch": 4806} {"train_loss": -7.197316646575928, "global_step": 201858, "epoch": 4806} {"train_loss": -7.275240898132324, "global_step": 201859, "epoch": 4806} {"train_loss": -7.3436713218688965, "global_step": 201860, "epoch": 4806} {"train_loss": -7.359880447387695, "global_step": 201861, "epoch": 4806} {"train_loss": -7.3792338371276855, "global_step": 201862, "epoch": 4806} {"train_loss": -7.342331886291504, "global_step": 201863, "epoch": 4806} {"train_loss": -7.240228176116943, "global_step": 201864, "epoch": 4806} {"train_loss": -7.202338218688965, "global_step": 201865, "epoch": 4806} {"train_loss": -7.347870826721191, "global_step": 201866, "epoch": 4806} {"train_loss": -7.38577938079834, "global_step": 201867, "epoch": 4806} {"train_loss": -7.158938407897949, "global_step": 201868, "epoch": 4806} {"train_loss": -7.3446502685546875, "global_step": 201869, "epoch": 4806} {"train_loss": -7.238428115844727, "global_step": 201870, "epoch": 4806} {"train_loss": -7.189584732055664, "global_step": 201871, "epoch": 4806} {"train_loss": -7.292072296142578, "global_step": 201872, "epoch": 4806} {"train_loss": -7.237075328826904, "global_step": 201873, "epoch": 4806} {"train_loss": -7.27790641784668, "global_step": 201874, "epoch": 4806} {"train_loss": -7.3369340896606445, "global_step": 201875, "epoch": 4806} {"train_loss": -7.324771404266357, "global_step": 201876, "epoch": 4806} {"train_loss": -7.233172416687012, "global_step": 201877, "epoch": 4806} {"train_loss": -7.259486198425293, "global_step": 201878, "epoch": 4806} {"train_loss": -7.319060325622559, "global_step": 201879, "epoch": 4806} {"train_loss": -7.189778804779053, "global_step": 201880, "epoch": 4806} {"train_loss": -7.239164352416992, "global_step": 201881, "epoch": 4806} {"train_loss": -7.317388534545898, "global_step": 201882, "epoch": 4806} {"train_loss": -7.32796573638916, "global_step": 201883, "epoch": 4806} {"train_loss": -7.235628128051758, "global_step": 201884, "epoch": 4806} {"train_loss": -7.30908203125, "global_step": 201885, "epoch": 4806} {"train_loss": -7.288514614105225, "global_step": 201886, "epoch": 4806} {"train_loss": -7.233197212219238, "global_step": 201887, "epoch": 4806} {"train_loss": -7.288387775421143, "global_step": 201888, "epoch": 4806} {"train_loss": -7.309253692626953, "global_step": 201889, "epoch": 4806} {"train_loss": -7.365115165710449, "global_step": 201890, "epoch": 4806} {"train_loss": -7.305131435394287, "global_step": 201891, "epoch": 4806} {"train_loss": -7.298778057098389, "global_step": 201892, "epoch": 4806} {"train_loss": -7.289651757194882, "global_step": 201893, "epoch": 4806, "val_loss": 69863.1484375} {"train_loss": -7.201563835144043, "global_step": 201894, "epoch": 4807} {"train_loss": -7.374573230743408, "global_step": 201895, "epoch": 4807} {"train_loss": -7.275158882141113, "global_step": 201896, "epoch": 4807} {"train_loss": -7.318123817443848, "global_step": 201897, "epoch": 4807} {"train_loss": -7.3911638259887695, "global_step": 201898, "epoch": 4807} {"train_loss": -7.31489372253418, "global_step": 201899, "epoch": 4807} {"train_loss": -7.383980751037598, "global_step": 201900, "epoch": 4807} {"train_loss": -7.349985599517822, "global_step": 201901, "epoch": 4807} {"train_loss": -7.379449844360352, "global_step": 201902, "epoch": 4807} {"train_loss": -7.335940837860107, "global_step": 201903, "epoch": 4807} {"train_loss": -7.3364763259887695, "global_step": 201904, "epoch": 4807} {"train_loss": -7.428741931915283, "global_step": 201905, "epoch": 4807} {"train_loss": -7.377915859222412, "global_step": 201906, "epoch": 4807} {"train_loss": -7.399866104125977, "global_step": 201907, "epoch": 4807} {"train_loss": -7.280342102050781, "global_step": 201908, "epoch": 4807} {"train_loss": -7.31226921081543, "global_step": 201909, "epoch": 4807} {"train_loss": -7.45072603225708, "global_step": 201910, "epoch": 4807} {"train_loss": -7.324576377868652, "global_step": 201911, "epoch": 4807} {"train_loss": -7.353603363037109, "global_step": 201912, "epoch": 4807} {"train_loss": -7.284440994262695, "global_step": 201913, "epoch": 4807} {"train_loss": -7.296455383300781, "global_step": 201914, "epoch": 4807} {"train_loss": -7.281638145446777, "global_step": 201915, "epoch": 4807} {"train_loss": -7.220198631286621, "global_step": 201916, "epoch": 4807} {"train_loss": -7.165794849395752, "global_step": 201917, "epoch": 4807} {"train_loss": -7.182000160217285, "global_step": 201918, "epoch": 4807} {"train_loss": -7.330633163452148, "global_step": 201919, "epoch": 4807} {"train_loss": -7.07657527923584, "global_step": 201920, "epoch": 4807} {"train_loss": -7.3738694190979, "global_step": 201921, "epoch": 4807} {"train_loss": -7.284663200378418, "global_step": 201922, "epoch": 4807} {"train_loss": -7.149150371551514, "global_step": 201923, "epoch": 4807} {"train_loss": -7.315522193908691, "global_step": 201924, "epoch": 4807} {"train_loss": -7.292359352111816, "global_step": 201925, "epoch": 4807} {"train_loss": -7.314085006713867, "global_step": 201926, "epoch": 4807} {"train_loss": -7.351954460144043, "global_step": 201927, "epoch": 4807} {"train_loss": -7.22526216506958, "global_step": 201928, "epoch": 4807} {"train_loss": -7.333413600921631, "global_step": 201929, "epoch": 4807} {"train_loss": -7.2133965492248535, "global_step": 201930, "epoch": 4807} {"train_loss": -7.335447311401367, "global_step": 201931, "epoch": 4807} {"train_loss": -7.302246570587158, "global_step": 201932, "epoch": 4807} {"train_loss": -7.1472344398498535, "global_step": 201933, "epoch": 4807} {"train_loss": -7.224613666534424, "global_step": 201934, "epoch": 4807} {"train_loss": -7.296331961949666, "global_step": 201935, "epoch": 4807, "val_loss": 69928.2734375} {"train_loss": -7.2801408767700195, "global_step": 201936, "epoch": 4808} {"train_loss": -7.213040351867676, "global_step": 201937, "epoch": 4808} {"train_loss": -7.379785060882568, "global_step": 201938, "epoch": 4808} {"train_loss": -7.301880359649658, "global_step": 201939, "epoch": 4808} {"train_loss": -7.345489978790283, "global_step": 201940, "epoch": 4808} {"train_loss": -7.270721912384033, "global_step": 201941, "epoch": 4808} {"train_loss": -7.18723201751709, "global_step": 201942, "epoch": 4808} {"train_loss": -7.2597808837890625, "global_step": 201943, "epoch": 4808} {"train_loss": -7.337125778198242, "global_step": 201944, "epoch": 4808} {"train_loss": -7.31960391998291, "global_step": 201945, "epoch": 4808} {"train_loss": -7.174293518066406, "global_step": 201946, "epoch": 4808} {"train_loss": -7.208873748779297, "global_step": 201947, "epoch": 4808} {"train_loss": -7.201189041137695, "global_step": 201948, "epoch": 4808} {"train_loss": -7.12970495223999, "global_step": 201949, "epoch": 4808} {"train_loss": -7.115447044372559, "global_step": 201950, "epoch": 4808} {"train_loss": -7.191133975982666, "global_step": 201951, "epoch": 4808} {"train_loss": -7.160445690155029, "global_step": 201952, "epoch": 4808} {"train_loss": -7.175120830535889, "global_step": 201953, "epoch": 4808} {"train_loss": -7.158576011657715, "global_step": 201954, "epoch": 4808} {"train_loss": -7.17990255355835, "global_step": 201955, "epoch": 4808} {"train_loss": -7.161489009857178, "global_step": 201956, "epoch": 4808} {"train_loss": -7.060970306396484, "global_step": 201957, "epoch": 4808} {"train_loss": -7.228865146636963, "global_step": 201958, "epoch": 4808} {"train_loss": -7.0747809410095215, "global_step": 201959, "epoch": 4808} {"train_loss": -7.2904558181762695, "global_step": 201960, "epoch": 4808} {"train_loss": -7.028874397277832, "global_step": 201961, "epoch": 4808} {"train_loss": -7.054930686950684, "global_step": 201962, "epoch": 4808} {"train_loss": -7.142585754394531, "global_step": 201963, "epoch": 4808} {"train_loss": -7.018491744995117, "global_step": 201964, "epoch": 4808} {"train_loss": -7.212091445922852, "global_step": 201965, "epoch": 4808} {"train_loss": -7.206593990325928, "global_step": 201966, "epoch": 4808} {"train_loss": -7.298666954040527, "global_step": 201967, "epoch": 4808} {"train_loss": -7.317284107208252, "global_step": 201968, "epoch": 4808} {"train_loss": -7.199605941772461, "global_step": 201969, "epoch": 4808} {"train_loss": -7.243466854095459, "global_step": 201970, "epoch": 4808} {"train_loss": -7.294938087463379, "global_step": 201971, "epoch": 4808} {"train_loss": -7.158510208129883, "global_step": 201972, "epoch": 4808} {"train_loss": -7.294389247894287, "global_step": 201973, "epoch": 4808} {"train_loss": -7.108487606048584, "global_step": 201974, "epoch": 4808} {"train_loss": -7.385001182556152, "global_step": 201975, "epoch": 4808} {"train_loss": -7.352963447570801, "global_step": 201976, "epoch": 4808} {"train_loss": -7.213711409341721, "global_step": 201977, "epoch": 4808, "val_loss": 69928.1015625} {"train_loss": -7.298583507537842, "global_step": 201978, "epoch": 4809} {"train_loss": -7.192464351654053, "global_step": 201979, "epoch": 4809} {"train_loss": -7.163140773773193, "global_step": 201980, "epoch": 4809} {"train_loss": -7.385946273803711, "global_step": 201981, "epoch": 4809} {"train_loss": -7.153702259063721, "global_step": 201982, "epoch": 4809} {"train_loss": -7.1680450439453125, "global_step": 201983, "epoch": 4809} {"train_loss": -7.227871894836426, "global_step": 201984, "epoch": 4809} {"train_loss": -7.14869499206543, "global_step": 201985, "epoch": 4809} {"train_loss": -7.384621620178223, "global_step": 201986, "epoch": 4809} {"train_loss": -7.097878456115723, "global_step": 201987, "epoch": 4809} {"train_loss": -7.266179084777832, "global_step": 201988, "epoch": 4809} {"train_loss": -7.264575958251953, "global_step": 201989, "epoch": 4809} {"train_loss": -7.28488826751709, "global_step": 201990, "epoch": 4809} {"train_loss": -7.270166397094727, "global_step": 201991, "epoch": 4809} {"train_loss": -7.22565221786499, "global_step": 201992, "epoch": 4809} {"train_loss": -7.415975570678711, "global_step": 201993, "epoch": 4809} {"train_loss": -7.3394083976745605, "global_step": 201994, "epoch": 4809} {"train_loss": -7.373811721801758, "global_step": 201995, "epoch": 4809} {"train_loss": -7.155020713806152, "global_step": 201996, "epoch": 4809} {"train_loss": -7.155747890472412, "global_step": 201997, "epoch": 4809} {"train_loss": -7.330194473266602, "global_step": 201998, "epoch": 4809} {"train_loss": -7.233355522155762, "global_step": 201999, "epoch": 4809} {"train_loss": -7.179752349853516, "global_step": 202000, "epoch": 4809} {"train_loss": -7.287793159484863, "global_step": 202001, "epoch": 4809} {"train_loss": -7.193921089172363, "global_step": 202002, "epoch": 4809} {"train_loss": -7.314573287963867, "global_step": 202003, "epoch": 4809} {"train_loss": -7.146381378173828, "global_step": 202004, "epoch": 4809} {"train_loss": -7.2252607345581055, "global_step": 202005, "epoch": 4809} {"train_loss": -7.202154636383057, "global_step": 202006, "epoch": 4809} {"train_loss": -7.228172302246094, "global_step": 202007, "epoch": 4809} {"train_loss": -7.291919231414795, "global_step": 202008, "epoch": 4809} {"train_loss": -7.1477155685424805, "global_step": 202009, "epoch": 4809} {"train_loss": -7.304311752319336, "global_step": 202010, "epoch": 4809} {"train_loss": -7.2409491539001465, "global_step": 202011, "epoch": 4809} {"train_loss": -7.215670585632324, "global_step": 202012, "epoch": 4809} {"train_loss": -7.28433895111084, "global_step": 202013, "epoch": 4809} {"train_loss": -7.292462348937988, "global_step": 202014, "epoch": 4809} {"train_loss": -7.286254405975342, "global_step": 202015, "epoch": 4809} {"train_loss": -7.212944984436035, "global_step": 202016, "epoch": 4809} {"train_loss": -7.202856063842773, "global_step": 202017, "epoch": 4809} {"train_loss": -7.266750335693359, "global_step": 202018, "epoch": 4809} {"train_loss": -7.242954288210187, "global_step": 202019, "epoch": 4809, "val_loss": 69933.7109375} {"train_loss": -7.245701789855957, "global_step": 202020, "epoch": 4810} {"train_loss": -7.3547773361206055, "global_step": 202021, "epoch": 4810} {"train_loss": -7.348593711853027, "global_step": 202022, "epoch": 4810} {"train_loss": -7.309365749359131, "global_step": 202023, "epoch": 4810} {"train_loss": -7.227786540985107, "global_step": 202024, "epoch": 4810} {"train_loss": -7.296823501586914, "global_step": 202025, "epoch": 4810} {"train_loss": -7.2820658683776855, "global_step": 202026, "epoch": 4810} {"train_loss": -7.213501453399658, "global_step": 202027, "epoch": 4810} {"train_loss": -7.178985595703125, "global_step": 202028, "epoch": 4810} {"train_loss": -7.250126361846924, "global_step": 202029, "epoch": 4810} {"train_loss": -7.394362926483154, "global_step": 202030, "epoch": 4810} {"train_loss": -7.230442047119141, "global_step": 202031, "epoch": 4810} {"train_loss": -7.320661544799805, "global_step": 202032, "epoch": 4810} {"train_loss": -7.236285209655762, "global_step": 202033, "epoch": 4810} {"train_loss": -7.266313552856445, "global_step": 202034, "epoch": 4810} {"train_loss": -7.239804267883301, "global_step": 202035, "epoch": 4810} {"train_loss": -7.335163116455078, "global_step": 202036, "epoch": 4810} {"train_loss": -7.239770412445068, "global_step": 202037, "epoch": 4810} {"train_loss": -7.233578681945801, "global_step": 202038, "epoch": 4810} {"train_loss": -7.39387845993042, "global_step": 202039, "epoch": 4810} {"train_loss": -7.196002006530762, "global_step": 202040, "epoch": 4810} {"train_loss": -7.262555122375488, "global_step": 202041, "epoch": 4810} {"train_loss": -7.252649784088135, "global_step": 202042, "epoch": 4810} {"train_loss": -7.294894218444824, "global_step": 202043, "epoch": 4810} {"train_loss": -7.336766719818115, "global_step": 202044, "epoch": 4810} {"train_loss": -7.303496360778809, "global_step": 202045, "epoch": 4810} {"train_loss": -7.346762657165527, "global_step": 202046, "epoch": 4810} {"train_loss": -7.283867359161377, "global_step": 202047, "epoch": 4810} {"train_loss": -7.1879563331604, "global_step": 202048, "epoch": 4810} {"train_loss": -7.304059028625488, "global_step": 202049, "epoch": 4810} {"train_loss": -7.264639854431152, "global_step": 202050, "epoch": 4810} {"train_loss": -7.2269511222839355, "global_step": 202051, "epoch": 4810} {"train_loss": -7.278293609619141, "global_step": 202052, "epoch": 4810} {"train_loss": -7.23914098739624, "global_step": 202053, "epoch": 4810} {"train_loss": -7.3163228034973145, "global_step": 202054, "epoch": 4810} {"train_loss": -7.254547119140625, "global_step": 202055, "epoch": 4810} {"train_loss": -7.310577392578125, "global_step": 202056, "epoch": 4810} {"train_loss": -7.375341415405273, "global_step": 202057, "epoch": 4810} {"train_loss": -7.254179954528809, "global_step": 202058, "epoch": 4810} {"train_loss": -7.309497833251953, "global_step": 202059, "epoch": 4810} {"train_loss": -7.159638404846191, "global_step": 202060, "epoch": 4810} {"train_loss": -7.278091158185687, "global_step": 202061, "epoch": 4810, "val_loss": 69990.8359375} {"train_loss": -7.234061241149902, "global_step": 202062, "epoch": 4811} {"train_loss": -7.373679161071777, "global_step": 202063, "epoch": 4811} {"train_loss": -7.232100963592529, "global_step": 202064, "epoch": 4811} {"train_loss": -7.231097221374512, "global_step": 202065, "epoch": 4811} {"train_loss": -7.3676981925964355, "global_step": 202066, "epoch": 4811} {"train_loss": -7.272481441497803, "global_step": 202067, "epoch": 4811} {"train_loss": -7.2434492111206055, "global_step": 202068, "epoch": 4811} {"train_loss": -7.210052967071533, "global_step": 202069, "epoch": 4811} {"train_loss": -7.224002361297607, "global_step": 202070, "epoch": 4811} {"train_loss": -7.165927886962891, "global_step": 202071, "epoch": 4811} {"train_loss": -7.365347862243652, "global_step": 202072, "epoch": 4811} {"train_loss": -7.346804618835449, "global_step": 202073, "epoch": 4811} {"train_loss": -7.306499481201172, "global_step": 202074, "epoch": 4811} {"train_loss": -7.294665336608887, "global_step": 202075, "epoch": 4811} {"train_loss": -7.375208854675293, "global_step": 202076, "epoch": 4811} {"train_loss": -7.379286766052246, "global_step": 202077, "epoch": 4811} {"train_loss": -7.406686782836914, "global_step": 202078, "epoch": 4811} {"train_loss": -7.280508995056152, "global_step": 202079, "epoch": 4811} {"train_loss": -7.287270545959473, "global_step": 202080, "epoch": 4811} {"train_loss": -7.3653788566589355, "global_step": 202081, "epoch": 4811} {"train_loss": -7.272096633911133, "global_step": 202082, "epoch": 4811} {"train_loss": -7.313074111938477, "global_step": 202083, "epoch": 4811} {"train_loss": -7.379350185394287, "global_step": 202084, "epoch": 4811} {"train_loss": -7.290525913238525, "global_step": 202085, "epoch": 4811} {"train_loss": -7.410039901733398, "global_step": 202086, "epoch": 4811} {"train_loss": -7.379816055297852, "global_step": 202087, "epoch": 4811} {"train_loss": -7.323108673095703, "global_step": 202088, "epoch": 4811} {"train_loss": -7.365198135375977, "global_step": 202089, "epoch": 4811} {"train_loss": -7.285733222961426, "global_step": 202090, "epoch": 4811} {"train_loss": -7.400640487670898, "global_step": 202091, "epoch": 4811} {"train_loss": -7.256753921508789, "global_step": 202092, "epoch": 4811} {"train_loss": -7.30135440826416, "global_step": 202093, "epoch": 4811} {"train_loss": -7.303417205810547, "global_step": 202094, "epoch": 4811} {"train_loss": -7.3561296463012695, "global_step": 202095, "epoch": 4811} {"train_loss": -7.400564193725586, "global_step": 202096, "epoch": 4811} {"train_loss": -7.161940097808838, "global_step": 202097, "epoch": 4811} {"train_loss": -7.2705488204956055, "global_step": 202098, "epoch": 4811} {"train_loss": -7.23316764831543, "global_step": 202099, "epoch": 4811} {"train_loss": -7.279425621032715, "global_step": 202100, "epoch": 4811} {"train_loss": -7.369751930236816, "global_step": 202101, "epoch": 4811} {"train_loss": -7.206719398498535, "global_step": 202102, "epoch": 4811} {"train_loss": -7.306039287930443, "global_step": 202103, "epoch": 4811, "val_loss": 69888.4375} {"train_loss": -7.2665228843688965, "global_step": 202104, "epoch": 4812} {"train_loss": -7.361215591430664, "global_step": 202105, "epoch": 4812} {"train_loss": -7.2550272941589355, "global_step": 202106, "epoch": 4812} {"train_loss": -7.347418785095215, "global_step": 202107, "epoch": 4812} {"train_loss": -7.253222942352295, "global_step": 202108, "epoch": 4812} {"train_loss": -7.302572250366211, "global_step": 202109, "epoch": 4812} {"train_loss": -7.402490615844727, "global_step": 202110, "epoch": 4812} {"train_loss": -7.139617443084717, "global_step": 202111, "epoch": 4812} {"train_loss": -7.2610392570495605, "global_step": 202112, "epoch": 4812} {"train_loss": -7.347623348236084, "global_step": 202113, "epoch": 4812} {"train_loss": -7.25261926651001, "global_step": 202114, "epoch": 4812} {"train_loss": -7.246528625488281, "global_step": 202115, "epoch": 4812} {"train_loss": -7.276066780090332, "global_step": 202116, "epoch": 4812} {"train_loss": -7.212090492248535, "global_step": 202117, "epoch": 4812} {"train_loss": -7.31022834777832, "global_step": 202118, "epoch": 4812} {"train_loss": -7.238902568817139, "global_step": 202119, "epoch": 4812} {"train_loss": -7.299067974090576, "global_step": 202120, "epoch": 4812} {"train_loss": -7.265076637268066, "global_step": 202121, "epoch": 4812} {"train_loss": -7.294081687927246, "global_step": 202122, "epoch": 4812} {"train_loss": -7.200109004974365, "global_step": 202123, "epoch": 4812} {"train_loss": -7.23987340927124, "global_step": 202124, "epoch": 4812} {"train_loss": -7.231729507446289, "global_step": 202125, "epoch": 4812} {"train_loss": -7.3067426681518555, "global_step": 202126, "epoch": 4812} {"train_loss": -7.219861030578613, "global_step": 202127, "epoch": 4812} {"train_loss": -7.193413734436035, "global_step": 202128, "epoch": 4812} {"train_loss": -7.2796478271484375, "global_step": 202129, "epoch": 4812} {"train_loss": -7.05987548828125, "global_step": 202130, "epoch": 4812} {"train_loss": -7.1862897872924805, "global_step": 202131, "epoch": 4812} {"train_loss": -7.208494186401367, "global_step": 202132, "epoch": 4812} {"train_loss": -7.234296798706055, "global_step": 202133, "epoch": 4812} {"train_loss": -7.339692115783691, "global_step": 202134, "epoch": 4812} {"train_loss": -7.348509311676025, "global_step": 202135, "epoch": 4812} {"train_loss": -7.171938896179199, "global_step": 202136, "epoch": 4812} {"train_loss": -7.26621150970459, "global_step": 202137, "epoch": 4812} {"train_loss": -7.163793087005615, "global_step": 202138, "epoch": 4812} {"train_loss": -7.099315166473389, "global_step": 202139, "epoch": 4812} {"train_loss": -7.180063724517822, "global_step": 202140, "epoch": 4812} {"train_loss": -7.256920337677002, "global_step": 202141, "epoch": 4812} {"train_loss": -7.161953926086426, "global_step": 202142, "epoch": 4812} {"train_loss": -7.234308242797852, "global_step": 202143, "epoch": 4812} {"train_loss": -7.339963912963867, "global_step": 202144, "epoch": 4812} {"train_loss": -7.248686654227121, "global_step": 202145, "epoch": 4812, "val_loss": 70057.96875} {"train_loss": -7.25126838684082, "global_step": 202146, "epoch": 4813} {"train_loss": -7.296019077301025, "global_step": 202147, "epoch": 4813} {"train_loss": -7.218646049499512, "global_step": 202148, "epoch": 4813} {"train_loss": -7.2468647956848145, "global_step": 202149, "epoch": 4813} {"train_loss": -7.283780574798584, "global_step": 202150, "epoch": 4813} {"train_loss": -7.343449592590332, "global_step": 202151, "epoch": 4813} {"train_loss": -7.270587921142578, "global_step": 202152, "epoch": 4813} {"train_loss": -7.306355953216553, "global_step": 202153, "epoch": 4813} {"train_loss": -7.341535568237305, "global_step": 202154, "epoch": 4813} {"train_loss": -7.266716957092285, "global_step": 202155, "epoch": 4813} {"train_loss": -7.256405353546143, "global_step": 202156, "epoch": 4813} {"train_loss": -7.182136535644531, "global_step": 202157, "epoch": 4813} {"train_loss": -7.270369529724121, "global_step": 202158, "epoch": 4813} {"train_loss": -7.263673782348633, "global_step": 202159, "epoch": 4813} {"train_loss": -7.2955803871154785, "global_step": 202160, "epoch": 4813} {"train_loss": -7.259705543518066, "global_step": 202161, "epoch": 4813} {"train_loss": -7.267132759094238, "global_step": 202162, "epoch": 4813} {"train_loss": -7.22686767578125, "global_step": 202163, "epoch": 4813} {"train_loss": -7.2749176025390625, "global_step": 202164, "epoch": 4813} {"train_loss": -7.266534805297852, "global_step": 202165, "epoch": 4813} {"train_loss": -7.256096839904785, "global_step": 202166, "epoch": 4813} {"train_loss": -7.3037800788879395, "global_step": 202167, "epoch": 4813} {"train_loss": -7.199700832366943, "global_step": 202168, "epoch": 4813} {"train_loss": -7.331785202026367, "global_step": 202169, "epoch": 4813} {"train_loss": -7.3272247314453125, "global_step": 202170, "epoch": 4813} {"train_loss": -7.257202625274658, "global_step": 202171, "epoch": 4813} {"train_loss": -7.375124931335449, "global_step": 202172, "epoch": 4813} {"train_loss": -7.228499889373779, "global_step": 202173, "epoch": 4813} {"train_loss": -7.235313892364502, "global_step": 202174, "epoch": 4813} {"train_loss": -7.280605792999268, "global_step": 202175, "epoch": 4813} {"train_loss": -7.1678009033203125, "global_step": 202176, "epoch": 4813} {"train_loss": -7.271583557128906, "global_step": 202177, "epoch": 4813} {"train_loss": -7.296194076538086, "global_step": 202178, "epoch": 4813} {"train_loss": -7.217222213745117, "global_step": 202179, "epoch": 4813} {"train_loss": -7.275435447692871, "global_step": 202180, "epoch": 4813} {"train_loss": -7.3194169998168945, "global_step": 202181, "epoch": 4813} {"train_loss": -7.32305908203125, "global_step": 202182, "epoch": 4813} {"train_loss": -7.272784233093262, "global_step": 202183, "epoch": 4813} {"train_loss": -7.225454330444336, "global_step": 202184, "epoch": 4813} {"train_loss": -7.225334167480469, "global_step": 202185, "epoch": 4813} {"train_loss": -7.325327396392822, "global_step": 202186, "epoch": 4813} {"train_loss": -7.269381171181088, "global_step": 202187, "epoch": 4813, "val_loss": 69998.7265625} {"train_loss": -7.447356224060059, "global_step": 202188, "epoch": 4814} {"train_loss": -7.31634521484375, "global_step": 202189, "epoch": 4814} {"train_loss": -7.301848411560059, "global_step": 202190, "epoch": 4814} {"train_loss": -7.261916160583496, "global_step": 202191, "epoch": 4814} {"train_loss": -7.268830299377441, "global_step": 202192, "epoch": 4814} {"train_loss": -7.304329872131348, "global_step": 202193, "epoch": 4814} {"train_loss": -7.275599956512451, "global_step": 202194, "epoch": 4814} {"train_loss": -7.256308555603027, "global_step": 202195, "epoch": 4814} {"train_loss": -7.229048252105713, "global_step": 202196, "epoch": 4814} {"train_loss": -7.323135852813721, "global_step": 202197, "epoch": 4814} {"train_loss": -7.208590030670166, "global_step": 202198, "epoch": 4814} {"train_loss": -7.250904560089111, "global_step": 202199, "epoch": 4814} {"train_loss": -7.2503180503845215, "global_step": 202200, "epoch": 4814} {"train_loss": -7.179791450500488, "global_step": 202201, "epoch": 4814} {"train_loss": -7.247196197509766, "global_step": 202202, "epoch": 4814} {"train_loss": -7.38508939743042, "global_step": 202203, "epoch": 4814} {"train_loss": -7.30356502532959, "global_step": 202204, "epoch": 4814} {"train_loss": -7.272696018218994, "global_step": 202205, "epoch": 4814} {"train_loss": -7.325835227966309, "global_step": 202206, "epoch": 4814} {"train_loss": -7.110733509063721, "global_step": 202207, "epoch": 4814} {"train_loss": -7.228443622589111, "global_step": 202208, "epoch": 4814} {"train_loss": -7.302419185638428, "global_step": 202209, "epoch": 4814} {"train_loss": -7.154140472412109, "global_step": 202210, "epoch": 4814} {"train_loss": -7.276957035064697, "global_step": 202211, "epoch": 4814} {"train_loss": -7.171041488647461, "global_step": 202212, "epoch": 4814} {"train_loss": -7.284367561340332, "global_step": 202213, "epoch": 4814} {"train_loss": -7.111140727996826, "global_step": 202214, "epoch": 4814} {"train_loss": -7.277846336364746, "global_step": 202215, "epoch": 4814} {"train_loss": -7.260787010192871, "global_step": 202216, "epoch": 4814} {"train_loss": -7.364504814147949, "global_step": 202217, "epoch": 4814} {"train_loss": -7.15627384185791, "global_step": 202218, "epoch": 4814} {"train_loss": -7.358057022094727, "global_step": 202219, "epoch": 4814} {"train_loss": -7.319951057434082, "global_step": 202220, "epoch": 4814} {"train_loss": -7.354445457458496, "global_step": 202221, "epoch": 4814} {"train_loss": -7.326887130737305, "global_step": 202222, "epoch": 4814} {"train_loss": -7.166209697723389, "global_step": 202223, "epoch": 4814} {"train_loss": -7.2154645919799805, "global_step": 202224, "epoch": 4814} {"train_loss": -7.272823810577393, "global_step": 202225, "epoch": 4814} {"train_loss": -7.258980751037598, "global_step": 202226, "epoch": 4814} {"train_loss": -7.31297492980957, "global_step": 202227, "epoch": 4814} {"train_loss": -7.236746311187744, "global_step": 202228, "epoch": 4814} {"train_loss": -7.266173192432949, "global_step": 202229, "epoch": 4814, "val_loss": 69798.9921875} {"train_loss": -7.399094581604004, "global_step": 202230, "epoch": 4815} {"train_loss": -7.1105852127075195, "global_step": 202231, "epoch": 4815} {"train_loss": -7.27962589263916, "global_step": 202232, "epoch": 4815} {"train_loss": -7.32730770111084, "global_step": 202233, "epoch": 4815} {"train_loss": -7.22997522354126, "global_step": 202234, "epoch": 4815} {"train_loss": -7.354729652404785, "global_step": 202235, "epoch": 4815} {"train_loss": -7.337525844573975, "global_step": 202236, "epoch": 4815} {"train_loss": -7.199000358581543, "global_step": 202237, "epoch": 4815} {"train_loss": -7.298308372497559, "global_step": 202238, "epoch": 4815} {"train_loss": -7.35612154006958, "global_step": 202239, "epoch": 4815} {"train_loss": -7.286475658416748, "global_step": 202240, "epoch": 4815} {"train_loss": -7.191822528839111, "global_step": 202241, "epoch": 4815} {"train_loss": -7.25501823425293, "global_step": 202242, "epoch": 4815} {"train_loss": -7.246176719665527, "global_step": 202243, "epoch": 4815} {"train_loss": -7.294708251953125, "global_step": 202244, "epoch": 4815} {"train_loss": -7.313008785247803, "global_step": 202245, "epoch": 4815} {"train_loss": -7.30741548538208, "global_step": 202246, "epoch": 4815} {"train_loss": -7.332217693328857, "global_step": 202247, "epoch": 4815} {"train_loss": -7.333159446716309, "global_step": 202248, "epoch": 4815} {"train_loss": -7.319777965545654, "global_step": 202249, "epoch": 4815} {"train_loss": -7.291782855987549, "global_step": 202250, "epoch": 4815} {"train_loss": -7.265408515930176, "global_step": 202251, "epoch": 4815} {"train_loss": -7.349408149719238, "global_step": 202252, "epoch": 4815} {"train_loss": -7.349127769470215, "global_step": 202253, "epoch": 4815} {"train_loss": -7.323002338409424, "global_step": 202254, "epoch": 4815} {"train_loss": -7.260354042053223, "global_step": 202255, "epoch": 4815} {"train_loss": -7.360102653503418, "global_step": 202256, "epoch": 4815} {"train_loss": -7.356271743774414, "global_step": 202257, "epoch": 4815} {"train_loss": -7.359084606170654, "global_step": 202258, "epoch": 4815} {"train_loss": -7.353081226348877, "global_step": 202259, "epoch": 4815} {"train_loss": -7.241928577423096, "global_step": 202260, "epoch": 4815} {"train_loss": -7.064727306365967, "global_step": 202261, "epoch": 4815} {"train_loss": -7.366821765899658, "global_step": 202262, "epoch": 4815} {"train_loss": -7.263045310974121, "global_step": 202263, "epoch": 4815} {"train_loss": -7.200732231140137, "global_step": 202264, "epoch": 4815} {"train_loss": -7.338597297668457, "global_step": 202265, "epoch": 4815} {"train_loss": -7.171359539031982, "global_step": 202266, "epoch": 4815} {"train_loss": -7.184505462646484, "global_step": 202267, "epoch": 4815} {"train_loss": -7.362927436828613, "global_step": 202268, "epoch": 4815} {"train_loss": -7.129349231719971, "global_step": 202269, "epoch": 4815} {"train_loss": -7.213685512542725, "global_step": 202270, "epoch": 4815} {"train_loss": -7.282578593208676, "global_step": 202271, "epoch": 4815, "val_loss": 70162.1328125} {"train_loss": -7.155993461608887, "global_step": 202272, "epoch": 4816} {"train_loss": -7.243708610534668, "global_step": 202273, "epoch": 4816} {"train_loss": -7.319702625274658, "global_step": 202274, "epoch": 4816} {"train_loss": -7.238099575042725, "global_step": 202275, "epoch": 4816} {"train_loss": -7.315839767456055, "global_step": 202276, "epoch": 4816} {"train_loss": -7.200650215148926, "global_step": 202277, "epoch": 4816} {"train_loss": -7.262113571166992, "global_step": 202278, "epoch": 4816} {"train_loss": -7.176745414733887, "global_step": 202279, "epoch": 4816} {"train_loss": -7.294546127319336, "global_step": 202280, "epoch": 4816} {"train_loss": -7.183866500854492, "global_step": 202281, "epoch": 4816} {"train_loss": -7.3564839363098145, "global_step": 202282, "epoch": 4816} {"train_loss": -7.162940979003906, "global_step": 202283, "epoch": 4816} {"train_loss": -7.290757656097412, "global_step": 202284, "epoch": 4816} {"train_loss": -7.3456268310546875, "global_step": 202285, "epoch": 4816} {"train_loss": -7.160602569580078, "global_step": 202286, "epoch": 4816} {"train_loss": -7.356131076812744, "global_step": 202287, "epoch": 4816} {"train_loss": -7.209133148193359, "global_step": 202288, "epoch": 4816} {"train_loss": -7.285665512084961, "global_step": 202289, "epoch": 4816} {"train_loss": -7.148321151733398, "global_step": 202290, "epoch": 4816} {"train_loss": -7.2079057693481445, "global_step": 202291, "epoch": 4816} {"train_loss": -7.185374736785889, "global_step": 202292, "epoch": 4816} {"train_loss": -7.314105987548828, "global_step": 202293, "epoch": 4816} {"train_loss": -7.350454807281494, "global_step": 202294, "epoch": 4816} {"train_loss": -7.234192371368408, "global_step": 202295, "epoch": 4816} {"train_loss": -7.3930792808532715, "global_step": 202296, "epoch": 4816} {"train_loss": -7.292764186859131, "global_step": 202297, "epoch": 4816} {"train_loss": -7.330112457275391, "global_step": 202298, "epoch": 4816} {"train_loss": -7.218026161193848, "global_step": 202299, "epoch": 4816} {"train_loss": -7.277376174926758, "global_step": 202300, "epoch": 4816} {"train_loss": -7.306052207946777, "global_step": 202301, "epoch": 4816} {"train_loss": -7.247162818908691, "global_step": 202302, "epoch": 4816} {"train_loss": -7.29819393157959, "global_step": 202303, "epoch": 4816} {"train_loss": -7.354025840759277, "global_step": 202304, "epoch": 4816} {"train_loss": -7.3015336990356445, "global_step": 202305, "epoch": 4816} {"train_loss": -7.314545631408691, "global_step": 202306, "epoch": 4816} {"train_loss": -7.3434906005859375, "global_step": 202307, "epoch": 4816} {"train_loss": -7.404007911682129, "global_step": 202308, "epoch": 4816} {"train_loss": -7.322790622711182, "global_step": 202309, "epoch": 4816} {"train_loss": -7.239454746246338, "global_step": 202310, "epoch": 4816} {"train_loss": -7.318824291229248, "global_step": 202311, "epoch": 4816} {"train_loss": -7.3340559005737305, "global_step": 202312, "epoch": 4816} {"train_loss": -7.275222596668062, "global_step": 202313, "epoch": 4816, "val_loss": 69868.4453125} {"train_loss": -7.236915588378906, "global_step": 202314, "epoch": 4817} {"train_loss": -7.286979675292969, "global_step": 202315, "epoch": 4817} {"train_loss": -7.25007438659668, "global_step": 202316, "epoch": 4817} {"train_loss": -7.332032680511475, "global_step": 202317, "epoch": 4817} {"train_loss": -7.134378910064697, "global_step": 202318, "epoch": 4817} {"train_loss": -7.187835693359375, "global_step": 202319, "epoch": 4817} {"train_loss": -7.329008102416992, "global_step": 202320, "epoch": 4817} {"train_loss": -7.247499465942383, "global_step": 202321, "epoch": 4817} {"train_loss": -7.1814188957214355, "global_step": 202322, "epoch": 4817} {"train_loss": -7.263945579528809, "global_step": 202323, "epoch": 4817} {"train_loss": -7.164037704467773, "global_step": 202324, "epoch": 4817} {"train_loss": -7.156683921813965, "global_step": 202325, "epoch": 4817} {"train_loss": -7.285757541656494, "global_step": 202326, "epoch": 4817} {"train_loss": -7.012186527252197, "global_step": 202327, "epoch": 4817} {"train_loss": -7.102907657623291, "global_step": 202328, "epoch": 4817} {"train_loss": -7.000925064086914, "global_step": 202329, "epoch": 4817} {"train_loss": -7.1788177490234375, "global_step": 202330, "epoch": 4817} {"train_loss": -7.131259441375732, "global_step": 202331, "epoch": 4817} {"train_loss": -7.129459381103516, "global_step": 202332, "epoch": 4817} {"train_loss": -7.249645709991455, "global_step": 202333, "epoch": 4817} {"train_loss": -7.15311336517334, "global_step": 202334, "epoch": 4817} {"train_loss": -7.257820129394531, "global_step": 202335, "epoch": 4817} {"train_loss": -7.2559614181518555, "global_step": 202336, "epoch": 4817} {"train_loss": -7.333917617797852, "global_step": 202337, "epoch": 4817} {"train_loss": -7.167385101318359, "global_step": 202338, "epoch": 4817} {"train_loss": -7.276385307312012, "global_step": 202339, "epoch": 4817} {"train_loss": -7.282005310058594, "global_step": 202340, "epoch": 4817} {"train_loss": -7.130181312561035, "global_step": 202341, "epoch": 4817} {"train_loss": -7.3636298179626465, "global_step": 202342, "epoch": 4817} {"train_loss": -7.3249616622924805, "global_step": 202343, "epoch": 4817} {"train_loss": -7.3092522621154785, "global_step": 202344, "epoch": 4817} {"train_loss": -7.403007507324219, "global_step": 202345, "epoch": 4817} {"train_loss": -7.208742141723633, "global_step": 202346, "epoch": 4817} {"train_loss": -7.2967071533203125, "global_step": 202347, "epoch": 4817} {"train_loss": -7.163862705230713, "global_step": 202348, "epoch": 4817} {"train_loss": -7.266683101654053, "global_step": 202349, "epoch": 4817} {"train_loss": -7.289670944213867, "global_step": 202350, "epoch": 4817} {"train_loss": -7.162561893463135, "global_step": 202351, "epoch": 4817} {"train_loss": -7.317827224731445, "global_step": 202352, "epoch": 4817} {"train_loss": -7.139043807983398, "global_step": 202353, "epoch": 4817} {"train_loss": -7.162838935852051, "global_step": 202354, "epoch": 4817} {"train_loss": -7.226160151617868, "global_step": 202355, "epoch": 4817, "val_loss": 70138.078125} {"train_loss": -7.08271598815918, "global_step": 202356, "epoch": 4818} {"train_loss": -7.22296667098999, "global_step": 202357, "epoch": 4818} {"train_loss": -7.28510856628418, "global_step": 202358, "epoch": 4818} {"train_loss": -7.182355880737305, "global_step": 202359, "epoch": 4818} {"train_loss": -7.276009559631348, "global_step": 202360, "epoch": 4818} {"train_loss": -7.166023254394531, "global_step": 202361, "epoch": 4818} {"train_loss": -7.302068710327148, "global_step": 202362, "epoch": 4818} {"train_loss": -7.270880699157715, "global_step": 202363, "epoch": 4818} {"train_loss": -7.267438888549805, "global_step": 202364, "epoch": 4818} {"train_loss": -7.30318546295166, "global_step": 202365, "epoch": 4818} {"train_loss": -7.356279373168945, "global_step": 202366, "epoch": 4818} {"train_loss": -7.218953609466553, "global_step": 202367, "epoch": 4818} {"train_loss": -7.302164077758789, "global_step": 202368, "epoch": 4818} {"train_loss": -7.223182201385498, "global_step": 202369, "epoch": 4818} {"train_loss": -7.376690864562988, "global_step": 202370, "epoch": 4818} {"train_loss": -7.330901145935059, "global_step": 202371, "epoch": 4818} {"train_loss": -7.285508155822754, "global_step": 202372, "epoch": 4818} {"train_loss": -7.190586090087891, "global_step": 202373, "epoch": 4818} {"train_loss": -7.307696342468262, "global_step": 202374, "epoch": 4818} {"train_loss": -7.221378326416016, "global_step": 202375, "epoch": 4818} {"train_loss": -7.399744033813477, "global_step": 202376, "epoch": 4818} {"train_loss": -7.209162712097168, "global_step": 202377, "epoch": 4818} {"train_loss": -7.217953681945801, "global_step": 202378, "epoch": 4818} {"train_loss": -7.247498512268066, "global_step": 202379, "epoch": 4818} {"train_loss": -7.332786560058594, "global_step": 202380, "epoch": 4818} {"train_loss": -7.2341814041137695, "global_step": 202381, "epoch": 4818} {"train_loss": -7.282596588134766, "global_step": 202382, "epoch": 4818} {"train_loss": -7.180710792541504, "global_step": 202383, "epoch": 4818} {"train_loss": -7.280190467834473, "global_step": 202384, "epoch": 4818} {"train_loss": -7.304778099060059, "global_step": 202385, "epoch": 4818} {"train_loss": -7.286773681640625, "global_step": 202386, "epoch": 4818} {"train_loss": -7.324810981750488, "global_step": 202387, "epoch": 4818} {"train_loss": -7.39603328704834, "global_step": 202388, "epoch": 4818} {"train_loss": -7.291623115539551, "global_step": 202389, "epoch": 4818} {"train_loss": -7.254927158355713, "global_step": 202390, "epoch": 4818} {"train_loss": -7.24273681640625, "global_step": 202391, "epoch": 4818} {"train_loss": -7.29746150970459, "global_step": 202392, "epoch": 4818} {"train_loss": -7.248028755187988, "global_step": 202393, "epoch": 4818} {"train_loss": -7.2751054763793945, "global_step": 202394, "epoch": 4818} {"train_loss": -7.379753112792969, "global_step": 202395, "epoch": 4818} {"train_loss": -7.294312477111816, "global_step": 202396, "epoch": 4818} {"train_loss": -7.2722458725883845, "global_step": 202397, "epoch": 4818, "val_loss": 69809.546875} {"train_loss": -7.33271598815918, "global_step": 202398, "epoch": 4819} {"train_loss": -7.447424411773682, "global_step": 202399, "epoch": 4819} {"train_loss": -7.320976734161377, "global_step": 202400, "epoch": 4819} {"train_loss": -7.369994163513184, "global_step": 202401, "epoch": 4819} {"train_loss": -7.34782600402832, "global_step": 202402, "epoch": 4819} {"train_loss": -7.262129783630371, "global_step": 202403, "epoch": 4819} {"train_loss": -7.254404544830322, "global_step": 202404, "epoch": 4819} {"train_loss": -7.253850936889648, "global_step": 202405, "epoch": 4819} {"train_loss": -7.284088134765625, "global_step": 202406, "epoch": 4819} {"train_loss": -7.277792930603027, "global_step": 202407, "epoch": 4819} {"train_loss": -7.308197021484375, "global_step": 202408, "epoch": 4819} {"train_loss": -7.354639053344727, "global_step": 202409, "epoch": 4819} {"train_loss": -7.345645904541016, "global_step": 202410, "epoch": 4819} {"train_loss": -7.234029293060303, "global_step": 202411, "epoch": 4819} {"train_loss": -7.412027359008789, "global_step": 202412, "epoch": 4819} {"train_loss": -7.310867786407471, "global_step": 202413, "epoch": 4819} {"train_loss": -7.286454200744629, "global_step": 202414, "epoch": 4819} {"train_loss": -7.3108696937561035, "global_step": 202415, "epoch": 4819} {"train_loss": -7.431585311889648, "global_step": 202416, "epoch": 4819} {"train_loss": -7.405614376068115, "global_step": 202417, "epoch": 4819} {"train_loss": -7.550060272216797, "global_step": 202418, "epoch": 4819} {"train_loss": -7.309272289276123, "global_step": 202419, "epoch": 4819} {"train_loss": -7.443750381469727, "global_step": 202420, "epoch": 4819} {"train_loss": -7.432208061218262, "global_step": 202421, "epoch": 4819} {"train_loss": -7.293948173522949, "global_step": 202422, "epoch": 4819} {"train_loss": -7.432897567749023, "global_step": 202423, "epoch": 4819} {"train_loss": -7.321687698364258, "global_step": 202424, "epoch": 4819} {"train_loss": -7.3075666427612305, "global_step": 202425, "epoch": 4819} {"train_loss": -7.328938007354736, "global_step": 202426, "epoch": 4819} {"train_loss": -7.3380961418151855, "global_step": 202427, "epoch": 4819} {"train_loss": -7.27686882019043, "global_step": 202428, "epoch": 4819} {"train_loss": -7.2918596267700195, "global_step": 202429, "epoch": 4819} {"train_loss": -7.346051216125488, "global_step": 202430, "epoch": 4819} {"train_loss": -7.2768778800964355, "global_step": 202431, "epoch": 4819} {"train_loss": -7.319681644439697, "global_step": 202432, "epoch": 4819} {"train_loss": -7.332097053527832, "global_step": 202433, "epoch": 4819} {"train_loss": -7.308813095092773, "global_step": 202434, "epoch": 4819} {"train_loss": -7.287135124206543, "global_step": 202435, "epoch": 4819} {"train_loss": -7.378440856933594, "global_step": 202436, "epoch": 4819} {"train_loss": -7.361231803894043, "global_step": 202437, "epoch": 4819} {"train_loss": -7.374281406402588, "global_step": 202438, "epoch": 4819} {"train_loss": -7.3388194016047885, "global_step": 202439, "epoch": 4819, "val_loss": 69845.8359375} {"train_loss": -7.3483757972717285, "global_step": 202440, "epoch": 4820} {"train_loss": -7.271320819854736, "global_step": 202441, "epoch": 4820} {"train_loss": -7.248141288757324, "global_step": 202442, "epoch": 4820} {"train_loss": -7.285211563110352, "global_step": 202443, "epoch": 4820} {"train_loss": -7.214850902557373, "global_step": 202444, "epoch": 4820} {"train_loss": -7.311634063720703, "global_step": 202445, "epoch": 4820} {"train_loss": -7.465583801269531, "global_step": 202446, "epoch": 4820} {"train_loss": -7.201466083526611, "global_step": 202447, "epoch": 4820} {"train_loss": -7.104485988616943, "global_step": 202448, "epoch": 4820} {"train_loss": -7.367921829223633, "global_step": 202449, "epoch": 4820} {"train_loss": -7.147592544555664, "global_step": 202450, "epoch": 4820} {"train_loss": -7.100525856018066, "global_step": 202451, "epoch": 4820} {"train_loss": -7.241206169128418, "global_step": 202452, "epoch": 4820} {"train_loss": -7.044974327087402, "global_step": 202453, "epoch": 4820} {"train_loss": -7.3372344970703125, "global_step": 202454, "epoch": 4820} {"train_loss": -7.1483845710754395, "global_step": 202455, "epoch": 4820} {"train_loss": -7.141026496887207, "global_step": 202456, "epoch": 4820} {"train_loss": -7.249581336975098, "global_step": 202457, "epoch": 4820} {"train_loss": -7.161552429199219, "global_step": 202458, "epoch": 4820} {"train_loss": -7.317660331726074, "global_step": 202459, "epoch": 4820} {"train_loss": -7.023429870605469, "global_step": 202460, "epoch": 4820} {"train_loss": -7.092421531677246, "global_step": 202461, "epoch": 4820} {"train_loss": -7.157896518707275, "global_step": 202462, "epoch": 4820} {"train_loss": -7.086903095245361, "global_step": 202463, "epoch": 4820} {"train_loss": -7.175664901733398, "global_step": 202464, "epoch": 4820} {"train_loss": -7.327659606933594, "global_step": 202465, "epoch": 4820} {"train_loss": -7.209405899047852, "global_step": 202466, "epoch": 4820} {"train_loss": -7.248504638671875, "global_step": 202467, "epoch": 4820} {"train_loss": -7.232758522033691, "global_step": 202468, "epoch": 4820} {"train_loss": -7.245180606842041, "global_step": 202469, "epoch": 4820} {"train_loss": -7.299200057983398, "global_step": 202470, "epoch": 4820} {"train_loss": -7.215437889099121, "global_step": 202471, "epoch": 4820} {"train_loss": -7.301780700683594, "global_step": 202472, "epoch": 4820} {"train_loss": -7.199017524719238, "global_step": 202473, "epoch": 4820} {"train_loss": -7.333868980407715, "global_step": 202474, "epoch": 4820} {"train_loss": -7.230735778808594, "global_step": 202475, "epoch": 4820} {"train_loss": -7.185248374938965, "global_step": 202476, "epoch": 4820} {"train_loss": -7.326695919036865, "global_step": 202477, "epoch": 4820} {"train_loss": -7.222999572753906, "global_step": 202478, "epoch": 4820} {"train_loss": -7.331151008605957, "global_step": 202479, "epoch": 4820} {"train_loss": -7.429601192474365, "global_step": 202480, "epoch": 4820} {"train_loss": -7.232543911252703, "global_step": 202481, "epoch": 4820, "val_loss": 70030.625} {"train_loss": -7.285574913024902, "global_step": 202482, "epoch": 4821} {"train_loss": -7.199714660644531, "global_step": 202483, "epoch": 4821} {"train_loss": -7.283514022827148, "global_step": 202484, "epoch": 4821} {"train_loss": -7.277966022491455, "global_step": 202485, "epoch": 4821} {"train_loss": -7.308638095855713, "global_step": 202486, "epoch": 4821} {"train_loss": -7.370633125305176, "global_step": 202487, "epoch": 4821} {"train_loss": -7.26922607421875, "global_step": 202488, "epoch": 4821} {"train_loss": -7.283597469329834, "global_step": 202489, "epoch": 4821} {"train_loss": -7.259753227233887, "global_step": 202490, "epoch": 4821} {"train_loss": -7.362530708312988, "global_step": 202491, "epoch": 4821} {"train_loss": -7.4155426025390625, "global_step": 202492, "epoch": 4821} {"train_loss": -7.295004844665527, "global_step": 202493, "epoch": 4821} {"train_loss": -7.3009138107299805, "global_step": 202494, "epoch": 4821} {"train_loss": -7.259989261627197, "global_step": 202495, "epoch": 4821} {"train_loss": -7.346020221710205, "global_step": 202496, "epoch": 4821} {"train_loss": -7.200933933258057, "global_step": 202497, "epoch": 4821} {"train_loss": -7.203045845031738, "global_step": 202498, "epoch": 4821} {"train_loss": -7.167708396911621, "global_step": 202499, "epoch": 4821} {"train_loss": -7.349634647369385, "global_step": 202500, "epoch": 4821} {"train_loss": -7.219664573669434, "global_step": 202501, "epoch": 4821} {"train_loss": -7.241279602050781, "global_step": 202502, "epoch": 4821} {"train_loss": -7.235602378845215, "global_step": 202503, "epoch": 4821} {"train_loss": -7.2018842697143555, "global_step": 202504, "epoch": 4821} {"train_loss": -7.200210094451904, "global_step": 202505, "epoch": 4821} {"train_loss": -7.26798152923584, "global_step": 202506, "epoch": 4821} {"train_loss": -7.231263637542725, "global_step": 202507, "epoch": 4821} {"train_loss": -7.24887228012085, "global_step": 202508, "epoch": 4821} {"train_loss": -7.234601974487305, "global_step": 202509, "epoch": 4821} {"train_loss": -7.175371170043945, "global_step": 202510, "epoch": 4821} {"train_loss": -7.2845377922058105, "global_step": 202511, "epoch": 4821} {"train_loss": -7.245728969573975, "global_step": 202512, "epoch": 4821} {"train_loss": -7.1929426193237305, "global_step": 202513, "epoch": 4821} {"train_loss": -7.309778213500977, "global_step": 202514, "epoch": 4821} {"train_loss": -7.370250701904297, "global_step": 202515, "epoch": 4821} {"train_loss": -7.2786455154418945, "global_step": 202516, "epoch": 4821} {"train_loss": -7.278860569000244, "global_step": 202517, "epoch": 4821} {"train_loss": -7.408539295196533, "global_step": 202518, "epoch": 4821} {"train_loss": -7.322466850280762, "global_step": 202519, "epoch": 4821} {"train_loss": -7.258231163024902, "global_step": 202520, "epoch": 4821} {"train_loss": -7.385270595550537, "global_step": 202521, "epoch": 4821} {"train_loss": -7.351335525512695, "global_step": 202522, "epoch": 4821} {"train_loss": -7.27998914037432, "global_step": 202523, "epoch": 4821, "val_loss": 69864.5078125} {"train_loss": -7.354010581970215, "global_step": 202524, "epoch": 4822} {"train_loss": -7.394387245178223, "global_step": 202525, "epoch": 4822} {"train_loss": -7.325077056884766, "global_step": 202526, "epoch": 4822} {"train_loss": -7.293084144592285, "global_step": 202527, "epoch": 4822} {"train_loss": -7.322203636169434, "global_step": 202528, "epoch": 4822} {"train_loss": -7.278848171234131, "global_step": 202529, "epoch": 4822} {"train_loss": -7.329790115356445, "global_step": 202530, "epoch": 4822} {"train_loss": -7.214096546173096, "global_step": 202531, "epoch": 4822} {"train_loss": -7.379454612731934, "global_step": 202532, "epoch": 4822} {"train_loss": -7.299114227294922, "global_step": 202533, "epoch": 4822} {"train_loss": -7.212724685668945, "global_step": 202534, "epoch": 4822} {"train_loss": -7.290375709533691, "global_step": 202535, "epoch": 4822} {"train_loss": -7.417283058166504, "global_step": 202536, "epoch": 4822} {"train_loss": -7.418001651763916, "global_step": 202537, "epoch": 4822} {"train_loss": -7.254052639007568, "global_step": 202538, "epoch": 4822} {"train_loss": -7.41224479675293, "global_step": 202539, "epoch": 4822} {"train_loss": -7.3147172927856445, "global_step": 202540, "epoch": 4822} {"train_loss": -7.3842597007751465, "global_step": 202541, "epoch": 4822} {"train_loss": -7.253073215484619, "global_step": 202542, "epoch": 4822} {"train_loss": -7.342331886291504, "global_step": 202543, "epoch": 4822} {"train_loss": -7.282126426696777, "global_step": 202544, "epoch": 4822} {"train_loss": -7.220114231109619, "global_step": 202545, "epoch": 4822} {"train_loss": -7.369692802429199, "global_step": 202546, "epoch": 4822} {"train_loss": -7.262488842010498, "global_step": 202547, "epoch": 4822} {"train_loss": -7.109123229980469, "global_step": 202548, "epoch": 4822} {"train_loss": -7.081439971923828, "global_step": 202549, "epoch": 4822} {"train_loss": -7.127064228057861, "global_step": 202550, "epoch": 4822} {"train_loss": -7.067873954772949, "global_step": 202551, "epoch": 4822} {"train_loss": -7.204672336578369, "global_step": 202552, "epoch": 4822} {"train_loss": -7.314199924468994, "global_step": 202553, "epoch": 4822} {"train_loss": -7.238198280334473, "global_step": 202554, "epoch": 4822} {"train_loss": -7.201822757720947, "global_step": 202555, "epoch": 4822} {"train_loss": -7.231539726257324, "global_step": 202556, "epoch": 4822} {"train_loss": -7.212627410888672, "global_step": 202557, "epoch": 4822} {"train_loss": -7.053953170776367, "global_step": 202558, "epoch": 4822} {"train_loss": -7.284483909606934, "global_step": 202559, "epoch": 4822} {"train_loss": -7.210373878479004, "global_step": 202560, "epoch": 4822} {"train_loss": -7.1072773933410645, "global_step": 202561, "epoch": 4822} {"train_loss": -7.281164169311523, "global_step": 202562, "epoch": 4822} {"train_loss": -7.290469169616699, "global_step": 202563, "epoch": 4822} {"train_loss": -7.0965189933776855, "global_step": 202564, "epoch": 4822} {"train_loss": -7.263272626059396, "global_step": 202565, "epoch": 4822, "val_loss": 69887.4609375} {"train_loss": -7.225682258605957, "global_step": 202566, "epoch": 4823} {"train_loss": -7.164583206176758, "global_step": 202567, "epoch": 4823} {"train_loss": -7.225404262542725, "global_step": 202568, "epoch": 4823} {"train_loss": -7.054592132568359, "global_step": 202569, "epoch": 4823} {"train_loss": -7.154962062835693, "global_step": 202570, "epoch": 4823} {"train_loss": -7.223869323730469, "global_step": 202571, "epoch": 4823} {"train_loss": -7.111525535583496, "global_step": 202572, "epoch": 4823} {"train_loss": -7.163840293884277, "global_step": 202573, "epoch": 4823} {"train_loss": -7.20402717590332, "global_step": 202574, "epoch": 4823} {"train_loss": -7.2369465827941895, "global_step": 202575, "epoch": 4823} {"train_loss": -7.198118686676025, "global_step": 202576, "epoch": 4823} {"train_loss": -7.318803787231445, "global_step": 202577, "epoch": 4823} {"train_loss": -7.262577056884766, "global_step": 202578, "epoch": 4823} {"train_loss": -7.266615867614746, "global_step": 202579, "epoch": 4823} {"train_loss": -7.252276420593262, "global_step": 202580, "epoch": 4823} {"train_loss": -7.282378196716309, "global_step": 202581, "epoch": 4823} {"train_loss": -7.3744659423828125, "global_step": 202582, "epoch": 4823} {"train_loss": -7.148268699645996, "global_step": 202583, "epoch": 4823} {"train_loss": -7.183773994445801, "global_step": 202584, "epoch": 4823} {"train_loss": -7.232972145080566, "global_step": 202585, "epoch": 4823} {"train_loss": -7.209247589111328, "global_step": 202586, "epoch": 4823} {"train_loss": -7.240398406982422, "global_step": 202587, "epoch": 4823} {"train_loss": -7.2688703536987305, "global_step": 202588, "epoch": 4823} {"train_loss": -7.269997596740723, "global_step": 202589, "epoch": 4823} {"train_loss": -7.158648490905762, "global_step": 202590, "epoch": 4823} {"train_loss": -7.34218692779541, "global_step": 202591, "epoch": 4823} {"train_loss": -7.177149295806885, "global_step": 202592, "epoch": 4823} {"train_loss": -7.230619430541992, "global_step": 202593, "epoch": 4823} {"train_loss": -7.306769371032715, "global_step": 202594, "epoch": 4823} {"train_loss": -7.330246925354004, "global_step": 202595, "epoch": 4823} {"train_loss": -7.304840087890625, "global_step": 202596, "epoch": 4823} {"train_loss": -7.261646270751953, "global_step": 202597, "epoch": 4823} {"train_loss": -7.262211799621582, "global_step": 202598, "epoch": 4823} {"train_loss": -7.221607208251953, "global_step": 202599, "epoch": 4823} {"train_loss": -7.323732376098633, "global_step": 202600, "epoch": 4823} {"train_loss": -7.342959403991699, "global_step": 202601, "epoch": 4823} {"train_loss": -7.342800140380859, "global_step": 202602, "epoch": 4823} {"train_loss": -7.347648620605469, "global_step": 202603, "epoch": 4823} {"train_loss": -7.316439628601074, "global_step": 202604, "epoch": 4823} {"train_loss": -7.252913475036621, "global_step": 202605, "epoch": 4823} {"train_loss": -7.395174503326416, "global_step": 202606, "epoch": 4823} {"train_loss": -7.250619570414226, "global_step": 202607, "epoch": 4823, "val_loss": 69807.8828125} {"train_loss": -7.376738548278809, "global_step": 202608, "epoch": 4824} {"train_loss": -7.3509931564331055, "global_step": 202609, "epoch": 4824} {"train_loss": -7.4259772300720215, "global_step": 202610, "epoch": 4824} {"train_loss": -7.327400207519531, "global_step": 202611, "epoch": 4824} {"train_loss": -7.332493782043457, "global_step": 202612, "epoch": 4824} {"train_loss": -7.440957546234131, "global_step": 202613, "epoch": 4824} {"train_loss": -7.258724212646484, "global_step": 202614, "epoch": 4824} {"train_loss": -7.315319538116455, "global_step": 202615, "epoch": 4824} {"train_loss": -7.310254096984863, "global_step": 202616, "epoch": 4824} {"train_loss": -7.202033996582031, "global_step": 202617, "epoch": 4824} {"train_loss": -7.307940483093262, "global_step": 202618, "epoch": 4824} {"train_loss": -7.315624237060547, "global_step": 202619, "epoch": 4824} {"train_loss": -7.2311577796936035, "global_step": 202620, "epoch": 4824} {"train_loss": -7.259938716888428, "global_step": 202621, "epoch": 4824} {"train_loss": -7.32856559753418, "global_step": 202622, "epoch": 4824} {"train_loss": -7.207460880279541, "global_step": 202623, "epoch": 4824} {"train_loss": -7.2748870849609375, "global_step": 202624, "epoch": 4824} {"train_loss": -7.361493110656738, "global_step": 202625, "epoch": 4824} {"train_loss": -7.337405204772949, "global_step": 202626, "epoch": 4824} {"train_loss": -7.320415496826172, "global_step": 202627, "epoch": 4824} {"train_loss": -7.331148147583008, "global_step": 202628, "epoch": 4824} {"train_loss": -7.321871757507324, "global_step": 202629, "epoch": 4824} {"train_loss": -7.271695137023926, "global_step": 202630, "epoch": 4824} {"train_loss": -7.320968151092529, "global_step": 202631, "epoch": 4824} {"train_loss": -7.360418319702148, "global_step": 202632, "epoch": 4824} {"train_loss": -7.246984481811523, "global_step": 202633, "epoch": 4824} {"train_loss": -7.25581169128418, "global_step": 202634, "epoch": 4824} {"train_loss": -7.288210391998291, "global_step": 202635, "epoch": 4824} {"train_loss": -7.390973091125488, "global_step": 202636, "epoch": 4824} {"train_loss": -7.357966423034668, "global_step": 202637, "epoch": 4824} {"train_loss": -7.389756202697754, "global_step": 202638, "epoch": 4824} {"train_loss": -7.233911037445068, "global_step": 202639, "epoch": 4824} {"train_loss": -7.385724067687988, "global_step": 202640, "epoch": 4824} {"train_loss": -7.199031829833984, "global_step": 202641, "epoch": 4824} {"train_loss": -7.241811275482178, "global_step": 202642, "epoch": 4824} {"train_loss": -7.239429473876953, "global_step": 202643, "epoch": 4824} {"train_loss": -7.262594699859619, "global_step": 202644, "epoch": 4824} {"train_loss": -7.2501115798950195, "global_step": 202645, "epoch": 4824} {"train_loss": -7.247469902038574, "global_step": 202646, "epoch": 4824} {"train_loss": -7.252874851226807, "global_step": 202647, "epoch": 4824} {"train_loss": -7.288012504577637, "global_step": 202648, "epoch": 4824} {"train_loss": -7.297964720498948, "global_step": 202649, "epoch": 4824, "val_loss": 69907.8984375} {"train_loss": -7.283537864685059, "global_step": 202650, "epoch": 4825} {"train_loss": -7.258881568908691, "global_step": 202651, "epoch": 4825} {"train_loss": -7.221128463745117, "global_step": 202652, "epoch": 4825} {"train_loss": -7.265092849731445, "global_step": 202653, "epoch": 4825} {"train_loss": -7.186294078826904, "global_step": 202654, "epoch": 4825} {"train_loss": -7.195971488952637, "global_step": 202655, "epoch": 4825} {"train_loss": -7.1208906173706055, "global_step": 202656, "epoch": 4825} {"train_loss": -7.354576110839844, "global_step": 202657, "epoch": 4825} {"train_loss": -7.274855613708496, "global_step": 202658, "epoch": 4825} {"train_loss": -7.277461528778076, "global_step": 202659, "epoch": 4825} {"train_loss": -7.367711067199707, "global_step": 202660, "epoch": 4825} {"train_loss": -7.329100131988525, "global_step": 202661, "epoch": 4825} {"train_loss": -7.167875289916992, "global_step": 202662, "epoch": 4825} {"train_loss": -7.365114212036133, "global_step": 202663, "epoch": 4825} {"train_loss": -7.217808723449707, "global_step": 202664, "epoch": 4825} {"train_loss": -7.289358139038086, "global_step": 202665, "epoch": 4825} {"train_loss": -7.298333644866943, "global_step": 202666, "epoch": 4825} {"train_loss": -7.285994529724121, "global_step": 202667, "epoch": 4825} {"train_loss": -7.327848434448242, "global_step": 202668, "epoch": 4825} {"train_loss": -7.142984390258789, "global_step": 202669, "epoch": 4825} {"train_loss": -7.178646087646484, "global_step": 202670, "epoch": 4825} {"train_loss": -7.280468463897705, "global_step": 202671, "epoch": 4825} {"train_loss": -7.301077842712402, "global_step": 202672, "epoch": 4825} {"train_loss": -7.250174522399902, "global_step": 202673, "epoch": 4825} {"train_loss": -7.1465935707092285, "global_step": 202674, "epoch": 4825} {"train_loss": -7.213833332061768, "global_step": 202675, "epoch": 4825} {"train_loss": -7.242504596710205, "global_step": 202676, "epoch": 4825} {"train_loss": -7.351622581481934, "global_step": 202677, "epoch": 4825} {"train_loss": -7.245092391967773, "global_step": 202678, "epoch": 4825} {"train_loss": -7.219022274017334, "global_step": 202679, "epoch": 4825} {"train_loss": -7.365716934204102, "global_step": 202680, "epoch": 4825} {"train_loss": -7.162238121032715, "global_step": 202681, "epoch": 4825} {"train_loss": -7.306419372558594, "global_step": 202682, "epoch": 4825} {"train_loss": -7.2688469886779785, "global_step": 202683, "epoch": 4825} {"train_loss": -7.244757652282715, "global_step": 202684, "epoch": 4825} {"train_loss": -7.293634414672852, "global_step": 202685, "epoch": 4825} {"train_loss": -7.212728977203369, "global_step": 202686, "epoch": 4825} {"train_loss": -7.348001480102539, "global_step": 202687, "epoch": 4825} {"train_loss": -7.247345924377441, "global_step": 202688, "epoch": 4825} {"train_loss": -7.375851631164551, "global_step": 202689, "epoch": 4825} {"train_loss": -7.369780540466309, "global_step": 202690, "epoch": 4825} {"train_loss": -7.267392612638927, "global_step": 202691, "epoch": 4825, "val_loss": 69765.71875} {"train_loss": -7.387144088745117, "global_step": 202692, "epoch": 4826} {"train_loss": -7.3854265213012695, "global_step": 202693, "epoch": 4826} {"train_loss": -7.354402542114258, "global_step": 202694, "epoch": 4826} {"train_loss": -7.31874418258667, "global_step": 202695, "epoch": 4826} {"train_loss": -7.411865234375, "global_step": 202696, "epoch": 4826} {"train_loss": -7.353999614715576, "global_step": 202697, "epoch": 4826} {"train_loss": -7.208683013916016, "global_step": 202698, "epoch": 4826} {"train_loss": -7.280298233032227, "global_step": 202699, "epoch": 4826} {"train_loss": -7.435474395751953, "global_step": 202700, "epoch": 4826} {"train_loss": -7.297763824462891, "global_step": 202701, "epoch": 4826} {"train_loss": -7.213624954223633, "global_step": 202702, "epoch": 4826} {"train_loss": -7.291513442993164, "global_step": 202703, "epoch": 4826} {"train_loss": -7.3207502365112305, "global_step": 202704, "epoch": 4826} {"train_loss": -7.316308975219727, "global_step": 202705, "epoch": 4826} {"train_loss": -7.333461761474609, "global_step": 202706, "epoch": 4826} {"train_loss": -7.308834552764893, "global_step": 202707, "epoch": 4826} {"train_loss": -7.437782287597656, "global_step": 202708, "epoch": 4826} {"train_loss": -7.3405537605285645, "global_step": 202709, "epoch": 4826} {"train_loss": -7.346639633178711, "global_step": 202710, "epoch": 4826} {"train_loss": -7.3156843185424805, "global_step": 202711, "epoch": 4826} {"train_loss": -7.355347633361816, "global_step": 202712, "epoch": 4826} {"train_loss": -7.331404209136963, "global_step": 202713, "epoch": 4826} {"train_loss": -7.386898994445801, "global_step": 202714, "epoch": 4826} {"train_loss": -7.3583855628967285, "global_step": 202715, "epoch": 4826} {"train_loss": -7.350760459899902, "global_step": 202716, "epoch": 4826} {"train_loss": -7.230910301208496, "global_step": 202717, "epoch": 4826} {"train_loss": -7.3062286376953125, "global_step": 202718, "epoch": 4826} {"train_loss": -7.359466552734375, "global_step": 202719, "epoch": 4826} {"train_loss": -7.329452037811279, "global_step": 202720, "epoch": 4826} {"train_loss": -7.285661220550537, "global_step": 202721, "epoch": 4826} {"train_loss": -7.314483165740967, "global_step": 202722, "epoch": 4826} {"train_loss": -7.40786600112915, "global_step": 202723, "epoch": 4826} {"train_loss": -7.356551170349121, "global_step": 202724, "epoch": 4826} {"train_loss": -7.282248497009277, "global_step": 202725, "epoch": 4826} {"train_loss": -7.289798736572266, "global_step": 202726, "epoch": 4826} {"train_loss": -7.341073989868164, "global_step": 202727, "epoch": 4826} {"train_loss": -7.344263553619385, "global_step": 202728, "epoch": 4826} {"train_loss": -7.211027145385742, "global_step": 202729, "epoch": 4826} {"train_loss": -7.322626113891602, "global_step": 202730, "epoch": 4826} {"train_loss": -7.220026016235352, "global_step": 202731, "epoch": 4826} {"train_loss": -7.127678871154785, "global_step": 202732, "epoch": 4826} {"train_loss": -7.320340054375785, "global_step": 202733, "epoch": 4826, "val_loss": 69799.015625} {"train_loss": -7.231513977050781, "global_step": 202734, "epoch": 4827} {"train_loss": -7.21146297454834, "global_step": 202735, "epoch": 4827} {"train_loss": -7.113136291503906, "global_step": 202736, "epoch": 4827} {"train_loss": -7.255462646484375, "global_step": 202737, "epoch": 4827} {"train_loss": -7.167061805725098, "global_step": 202738, "epoch": 4827} {"train_loss": -7.141568183898926, "global_step": 202739, "epoch": 4827} {"train_loss": -7.108329772949219, "global_step": 202740, "epoch": 4827} {"train_loss": -7.300337791442871, "global_step": 202741, "epoch": 4827} {"train_loss": -7.297848701477051, "global_step": 202742, "epoch": 4827} {"train_loss": -7.214087009429932, "global_step": 202743, "epoch": 4827} {"train_loss": -7.343621730804443, "global_step": 202744, "epoch": 4827} {"train_loss": -7.270659446716309, "global_step": 202745, "epoch": 4827} {"train_loss": -7.292158126831055, "global_step": 202746, "epoch": 4827} {"train_loss": -7.276005744934082, "global_step": 202747, "epoch": 4827} {"train_loss": -7.210716247558594, "global_step": 202748, "epoch": 4827} {"train_loss": -7.216965675354004, "global_step": 202749, "epoch": 4827} {"train_loss": -7.212024211883545, "global_step": 202750, "epoch": 4827} {"train_loss": -7.285553932189941, "global_step": 202751, "epoch": 4827} {"train_loss": -7.213772773742676, "global_step": 202752, "epoch": 4827} {"train_loss": -7.206849575042725, "global_step": 202753, "epoch": 4827} {"train_loss": -7.33547306060791, "global_step": 202754, "epoch": 4827} {"train_loss": -7.242713451385498, "global_step": 202755, "epoch": 4827} {"train_loss": -7.125559329986572, "global_step": 202756, "epoch": 4827} {"train_loss": -7.32835054397583, "global_step": 202757, "epoch": 4827} {"train_loss": -7.116106033325195, "global_step": 202758, "epoch": 4827} {"train_loss": -7.334221839904785, "global_step": 202759, "epoch": 4827} {"train_loss": -7.292968273162842, "global_step": 202760, "epoch": 4827} {"train_loss": -7.07826042175293, "global_step": 202761, "epoch": 4827} {"train_loss": -7.282967567443848, "global_step": 202762, "epoch": 4827} {"train_loss": -7.216108322143555, "global_step": 202763, "epoch": 4827} {"train_loss": -7.266032695770264, "global_step": 202764, "epoch": 4827} {"train_loss": -7.290395736694336, "global_step": 202765, "epoch": 4827} {"train_loss": -7.288036346435547, "global_step": 202766, "epoch": 4827} {"train_loss": -7.265954971313477, "global_step": 202767, "epoch": 4827} {"train_loss": -7.342912673950195, "global_step": 202768, "epoch": 4827} {"train_loss": -7.215697288513184, "global_step": 202769, "epoch": 4827} {"train_loss": -7.169914245605469, "global_step": 202770, "epoch": 4827} {"train_loss": -7.287621974945068, "global_step": 202771, "epoch": 4827} {"train_loss": -7.2526164054870605, "global_step": 202772, "epoch": 4827} {"train_loss": -7.177044868469238, "global_step": 202773, "epoch": 4827} {"train_loss": -7.178632736206055, "global_step": 202774, "epoch": 4827} {"train_loss": -7.238404273986816, "global_step": 202775, "epoch": 4827, "val_loss": 69892.7109375} {"train_loss": -7.2493815422058105, "global_step": 202776, "epoch": 4828} {"train_loss": -7.236066818237305, "global_step": 202777, "epoch": 4828} {"train_loss": -7.356931209564209, "global_step": 202778, "epoch": 4828} {"train_loss": -7.382993221282959, "global_step": 202779, "epoch": 4828} {"train_loss": -7.346575736999512, "global_step": 202780, "epoch": 4828} {"train_loss": -7.339269638061523, "global_step": 202781, "epoch": 4828} {"train_loss": -7.316400051116943, "global_step": 202782, "epoch": 4828} {"train_loss": -7.31121301651001, "global_step": 202783, "epoch": 4828} {"train_loss": -7.310574531555176, "global_step": 202784, "epoch": 4828} {"train_loss": -7.278971195220947, "global_step": 202785, "epoch": 4828} {"train_loss": -7.229053497314453, "global_step": 202786, "epoch": 4828} {"train_loss": -7.2186689376831055, "global_step": 202787, "epoch": 4828} {"train_loss": -7.176668167114258, "global_step": 202788, "epoch": 4828} {"train_loss": -7.279415130615234, "global_step": 202789, "epoch": 4828} {"train_loss": -7.344144821166992, "global_step": 202790, "epoch": 4828} {"train_loss": -7.177149772644043, "global_step": 202791, "epoch": 4828} {"train_loss": -7.368561744689941, "global_step": 202792, "epoch": 4828} {"train_loss": -7.258258819580078, "global_step": 202793, "epoch": 4828} {"train_loss": -7.321901798248291, "global_step": 202794, "epoch": 4828} {"train_loss": -7.206958293914795, "global_step": 202795, "epoch": 4828} {"train_loss": -7.273120880126953, "global_step": 202796, "epoch": 4828} {"train_loss": -7.367008209228516, "global_step": 202797, "epoch": 4828} {"train_loss": -7.32419490814209, "global_step": 202798, "epoch": 4828} {"train_loss": -7.251102924346924, "global_step": 202799, "epoch": 4828} {"train_loss": -7.293124675750732, "global_step": 202800, "epoch": 4828} {"train_loss": -7.33920955657959, "global_step": 202801, "epoch": 4828} {"train_loss": -7.341785430908203, "global_step": 202802, "epoch": 4828} {"train_loss": -7.343832969665527, "global_step": 202803, "epoch": 4828} {"train_loss": -7.361763954162598, "global_step": 202804, "epoch": 4828} {"train_loss": -7.236985206604004, "global_step": 202805, "epoch": 4828} {"train_loss": -7.265439033508301, "global_step": 202806, "epoch": 4828} {"train_loss": -7.283389091491699, "global_step": 202807, "epoch": 4828} {"train_loss": -7.3356404304504395, "global_step": 202808, "epoch": 4828} {"train_loss": -7.336937427520752, "global_step": 202809, "epoch": 4828} {"train_loss": -7.216695785522461, "global_step": 202810, "epoch": 4828} {"train_loss": -7.344923973083496, "global_step": 202811, "epoch": 4828} {"train_loss": -7.258369445800781, "global_step": 202812, "epoch": 4828} {"train_loss": -7.338527679443359, "global_step": 202813, "epoch": 4828} {"train_loss": -7.341766357421875, "global_step": 202814, "epoch": 4828} {"train_loss": -7.30061674118042, "global_step": 202815, "epoch": 4828} {"train_loss": -7.210235595703125, "global_step": 202816, "epoch": 4828} {"train_loss": -7.2955729847862605, "global_step": 202817, "epoch": 4828, "val_loss": 69989.15625} {"train_loss": -7.250914573669434, "global_step": 202818, "epoch": 4829} {"train_loss": -7.290308952331543, "global_step": 202819, "epoch": 4829} {"train_loss": -7.228089809417725, "global_step": 202820, "epoch": 4829} {"train_loss": -7.451456069946289, "global_step": 202821, "epoch": 4829} {"train_loss": -7.294254302978516, "global_step": 202822, "epoch": 4829} {"train_loss": -7.320527076721191, "global_step": 202823, "epoch": 4829} {"train_loss": -7.446987152099609, "global_step": 202824, "epoch": 4829} {"train_loss": -7.298595428466797, "global_step": 202825, "epoch": 4829} {"train_loss": -7.338999271392822, "global_step": 202826, "epoch": 4829} {"train_loss": -7.417259216308594, "global_step": 202827, "epoch": 4829} {"train_loss": -7.339920997619629, "global_step": 202828, "epoch": 4829} {"train_loss": -7.295520782470703, "global_step": 202829, "epoch": 4829} {"train_loss": -7.262034893035889, "global_step": 202830, "epoch": 4829} {"train_loss": -7.297966957092285, "global_step": 202831, "epoch": 4829} {"train_loss": -7.38996696472168, "global_step": 202832, "epoch": 4829} {"train_loss": -7.276595592498779, "global_step": 202833, "epoch": 4829} {"train_loss": -7.351321220397949, "global_step": 202834, "epoch": 4829} {"train_loss": -7.24066686630249, "global_step": 202835, "epoch": 4829} {"train_loss": -7.3107194900512695, "global_step": 202836, "epoch": 4829} {"train_loss": -7.291014671325684, "global_step": 202837, "epoch": 4829} {"train_loss": -7.191427230834961, "global_step": 202838, "epoch": 4829} {"train_loss": -7.338852882385254, "global_step": 202839, "epoch": 4829} {"train_loss": -7.277559280395508, "global_step": 202840, "epoch": 4829} {"train_loss": -7.3432159423828125, "global_step": 202841, "epoch": 4829} {"train_loss": -7.320047378540039, "global_step": 202842, "epoch": 4829} {"train_loss": -7.220815658569336, "global_step": 202843, "epoch": 4829} {"train_loss": -7.2038445472717285, "global_step": 202844, "epoch": 4829} {"train_loss": -7.334145545959473, "global_step": 202845, "epoch": 4829} {"train_loss": -7.269505023956299, "global_step": 202846, "epoch": 4829} {"train_loss": -7.2027082443237305, "global_step": 202847, "epoch": 4829} {"train_loss": -7.126827239990234, "global_step": 202848, "epoch": 4829} {"train_loss": -7.211318016052246, "global_step": 202849, "epoch": 4829} {"train_loss": -7.339739799499512, "global_step": 202850, "epoch": 4829} {"train_loss": -7.139518737792969, "global_step": 202851, "epoch": 4829} {"train_loss": -7.161832332611084, "global_step": 202852, "epoch": 4829} {"train_loss": -7.393639087677002, "global_step": 202853, "epoch": 4829} {"train_loss": -7.100453853607178, "global_step": 202854, "epoch": 4829} {"train_loss": -7.170423984527588, "global_step": 202855, "epoch": 4829} {"train_loss": -7.182699203491211, "global_step": 202856, "epoch": 4829} {"train_loss": -7.26168155670166, "global_step": 202857, "epoch": 4829} {"train_loss": -7.169649124145508, "global_step": 202858, "epoch": 4829} {"train_loss": -7.275762989407494, "global_step": 202859, "epoch": 4829, "val_loss": 70081.0} {"train_loss": -7.278947830200195, "global_step": 202860, "epoch": 4830} {"train_loss": -7.222841262817383, "global_step": 202861, "epoch": 4830} {"train_loss": -7.206108093261719, "global_step": 202862, "epoch": 4830} {"train_loss": -7.264932155609131, "global_step": 202863, "epoch": 4830} {"train_loss": -7.2447590827941895, "global_step": 202864, "epoch": 4830} {"train_loss": -7.311720371246338, "global_step": 202865, "epoch": 4830} {"train_loss": -7.381498336791992, "global_step": 202866, "epoch": 4830} {"train_loss": -7.195362091064453, "global_step": 202867, "epoch": 4830} {"train_loss": -7.195162773132324, "global_step": 202868, "epoch": 4830} {"train_loss": -7.294431686401367, "global_step": 202869, "epoch": 4830} {"train_loss": -7.224295616149902, "global_step": 202870, "epoch": 4830} {"train_loss": -7.309003829956055, "global_step": 202871, "epoch": 4830} {"train_loss": -7.286398887634277, "global_step": 202872, "epoch": 4830} {"train_loss": -7.40577507019043, "global_step": 202873, "epoch": 4830} {"train_loss": -7.310667037963867, "global_step": 202874, "epoch": 4830} {"train_loss": -7.371467113494873, "global_step": 202875, "epoch": 4830} {"train_loss": -7.335108757019043, "global_step": 202876, "epoch": 4830} {"train_loss": -7.285808563232422, "global_step": 202877, "epoch": 4830} {"train_loss": -7.289759635925293, "global_step": 202878, "epoch": 4830} {"train_loss": -7.2869367599487305, "global_step": 202879, "epoch": 4830} {"train_loss": -7.29790735244751, "global_step": 202880, "epoch": 4830} {"train_loss": -7.278022289276123, "global_step": 202881, "epoch": 4830} {"train_loss": -7.362531661987305, "global_step": 202882, "epoch": 4830} {"train_loss": -7.394606590270996, "global_step": 202883, "epoch": 4830} {"train_loss": -7.257106781005859, "global_step": 202884, "epoch": 4830} {"train_loss": -7.364830017089844, "global_step": 202885, "epoch": 4830} {"train_loss": -7.253990650177002, "global_step": 202886, "epoch": 4830} {"train_loss": -7.3863372802734375, "global_step": 202887, "epoch": 4830} {"train_loss": -7.373076438903809, "global_step": 202888, "epoch": 4830} {"train_loss": -7.405223369598389, "global_step": 202889, "epoch": 4830} {"train_loss": -7.356921195983887, "global_step": 202890, "epoch": 4830} {"train_loss": -7.340574264526367, "global_step": 202891, "epoch": 4830} {"train_loss": -7.292231559753418, "global_step": 202892, "epoch": 4830} {"train_loss": -7.343989372253418, "global_step": 202893, "epoch": 4830} {"train_loss": -7.273071765899658, "global_step": 202894, "epoch": 4830} {"train_loss": -7.325235843658447, "global_step": 202895, "epoch": 4830} {"train_loss": -7.309587478637695, "global_step": 202896, "epoch": 4830} {"train_loss": -7.298233985900879, "global_step": 202897, "epoch": 4830} {"train_loss": -7.469906806945801, "global_step": 202898, "epoch": 4830} {"train_loss": -7.3818817138671875, "global_step": 202899, "epoch": 4830} {"train_loss": -7.37867546081543, "global_step": 202900, "epoch": 4830} {"train_loss": -7.311396928060622, "global_step": 202901, "epoch": 4830, "val_loss": 69912.5390625} {"train_loss": -7.448209762573242, "global_step": 202902, "epoch": 4831} {"train_loss": -7.3298187255859375, "global_step": 202903, "epoch": 4831} {"train_loss": -7.326169013977051, "global_step": 202904, "epoch": 4831} {"train_loss": -7.279790878295898, "global_step": 202905, "epoch": 4831} {"train_loss": -7.338947772979736, "global_step": 202906, "epoch": 4831} {"train_loss": -7.366467475891113, "global_step": 202907, "epoch": 4831} {"train_loss": -7.356009483337402, "global_step": 202908, "epoch": 4831} {"train_loss": -7.301244735717773, "global_step": 202909, "epoch": 4831} {"train_loss": -7.342462539672852, "global_step": 202910, "epoch": 4831} {"train_loss": -7.370314121246338, "global_step": 202911, "epoch": 4831} {"train_loss": -7.294768333435059, "global_step": 202912, "epoch": 4831} {"train_loss": -7.293851852416992, "global_step": 202913, "epoch": 4831} {"train_loss": -7.266502380371094, "global_step": 202914, "epoch": 4831} {"train_loss": -7.286669731140137, "global_step": 202915, "epoch": 4831} {"train_loss": -7.260293483734131, "global_step": 202916, "epoch": 4831} {"train_loss": -7.2486772537231445, "global_step": 202917, "epoch": 4831} {"train_loss": -7.1553754806518555, "global_step": 202918, "epoch": 4831} {"train_loss": -7.156294822692871, "global_step": 202919, "epoch": 4831} {"train_loss": -7.239345550537109, "global_step": 202920, "epoch": 4831} {"train_loss": -7.299033164978027, "global_step": 202921, "epoch": 4831} {"train_loss": -7.316962242126465, "global_step": 202922, "epoch": 4831} {"train_loss": -7.190680503845215, "global_step": 202923, "epoch": 4831} {"train_loss": -7.249993801116943, "global_step": 202924, "epoch": 4831} {"train_loss": -7.26755428314209, "global_step": 202925, "epoch": 4831} {"train_loss": -7.241524696350098, "global_step": 202926, "epoch": 4831} {"train_loss": -7.214310169219971, "global_step": 202927, "epoch": 4831} {"train_loss": -7.228215217590332, "global_step": 202928, "epoch": 4831} {"train_loss": -7.266696453094482, "global_step": 202929, "epoch": 4831} {"train_loss": -7.1013078689575195, "global_step": 202930, "epoch": 4831} {"train_loss": -7.337610244750977, "global_step": 202931, "epoch": 4831} {"train_loss": -7.271045207977295, "global_step": 202932, "epoch": 4831} {"train_loss": -7.100338935852051, "global_step": 202933, "epoch": 4831} {"train_loss": -7.2437214851379395, "global_step": 202934, "epoch": 4831} {"train_loss": -7.225022792816162, "global_step": 202935, "epoch": 4831} {"train_loss": -7.181571960449219, "global_step": 202936, "epoch": 4831} {"train_loss": -7.330754280090332, "global_step": 202937, "epoch": 4831} {"train_loss": -7.191943645477295, "global_step": 202938, "epoch": 4831} {"train_loss": -7.084306240081787, "global_step": 202939, "epoch": 4831} {"train_loss": -7.283702850341797, "global_step": 202940, "epoch": 4831} {"train_loss": -7.234227657318115, "global_step": 202941, "epoch": 4831} {"train_loss": -7.110183238983154, "global_step": 202942, "epoch": 4831} {"train_loss": -7.258069276809692, "global_step": 202943, "epoch": 4831, "val_loss": 70063.671875} {"train_loss": -7.270660400390625, "global_step": 202944, "epoch": 4832} {"train_loss": -7.0169548988342285, "global_step": 202945, "epoch": 4832} {"train_loss": -7.253154754638672, "global_step": 202946, "epoch": 4832} {"train_loss": -7.159058570861816, "global_step": 202947, "epoch": 4832} {"train_loss": -7.107240676879883, "global_step": 202948, "epoch": 4832} {"train_loss": -7.298185348510742, "global_step": 202949, "epoch": 4832} {"train_loss": -7.046931266784668, "global_step": 202950, "epoch": 4832} {"train_loss": -7.223422527313232, "global_step": 202951, "epoch": 4832} {"train_loss": -7.166692733764648, "global_step": 202952, "epoch": 4832} {"train_loss": -7.222811698913574, "global_step": 202953, "epoch": 4832} {"train_loss": -7.222052574157715, "global_step": 202954, "epoch": 4832} {"train_loss": -7.213796138763428, "global_step": 202955, "epoch": 4832} {"train_loss": -7.29622745513916, "global_step": 202956, "epoch": 4832} {"train_loss": -7.218581199645996, "global_step": 202957, "epoch": 4832} {"train_loss": -7.257521152496338, "global_step": 202958, "epoch": 4832} {"train_loss": -7.204033374786377, "global_step": 202959, "epoch": 4832} {"train_loss": -7.255241394042969, "global_step": 202960, "epoch": 4832} {"train_loss": -7.295363426208496, "global_step": 202961, "epoch": 4832} {"train_loss": -7.308009147644043, "global_step": 202962, "epoch": 4832} {"train_loss": -7.247153282165527, "global_step": 202963, "epoch": 4832} {"train_loss": -7.203632354736328, "global_step": 202964, "epoch": 4832} {"train_loss": -7.227101802825928, "global_step": 202965, "epoch": 4832} {"train_loss": -7.187864303588867, "global_step": 202966, "epoch": 4832} {"train_loss": -7.312682151794434, "global_step": 202967, "epoch": 4832} {"train_loss": -7.339828014373779, "global_step": 202968, "epoch": 4832} {"train_loss": -7.3343095779418945, "global_step": 202969, "epoch": 4832} {"train_loss": -7.365645408630371, "global_step": 202970, "epoch": 4832} {"train_loss": -7.303049087524414, "global_step": 202971, "epoch": 4832} {"train_loss": -7.317941665649414, "global_step": 202972, "epoch": 4832} {"train_loss": -7.372702121734619, "global_step": 202973, "epoch": 4832} {"train_loss": -7.360210418701172, "global_step": 202974, "epoch": 4832} {"train_loss": -7.281182765960693, "global_step": 202975, "epoch": 4832} {"train_loss": -7.244854927062988, "global_step": 202976, "epoch": 4832} {"train_loss": -7.291438579559326, "global_step": 202977, "epoch": 4832} {"train_loss": -7.220905303955078, "global_step": 202978, "epoch": 4832} {"train_loss": -7.304067611694336, "global_step": 202979, "epoch": 4832} {"train_loss": -7.219173431396484, "global_step": 202980, "epoch": 4832} {"train_loss": -7.275473117828369, "global_step": 202981, "epoch": 4832} {"train_loss": -7.303764343261719, "global_step": 202982, "epoch": 4832} {"train_loss": -7.274325370788574, "global_step": 202983, "epoch": 4832} {"train_loss": -7.328883171081543, "global_step": 202984, "epoch": 4832} {"train_loss": -7.252356143224807, "global_step": 202985, "epoch": 4832, "val_loss": 69818.1640625} {"train_loss": -7.349653244018555, "global_step": 202986, "epoch": 4833} {"train_loss": -7.2992658615112305, "global_step": 202987, "epoch": 4833} {"train_loss": -7.345570087432861, "global_step": 202988, "epoch": 4833} {"train_loss": -7.2796454429626465, "global_step": 202989, "epoch": 4833} {"train_loss": -7.360623836517334, "global_step": 202990, "epoch": 4833} {"train_loss": -7.315299987792969, "global_step": 202991, "epoch": 4833} {"train_loss": -7.331366539001465, "global_step": 202992, "epoch": 4833} {"train_loss": -7.172943592071533, "global_step": 202993, "epoch": 4833} {"train_loss": -7.446878910064697, "global_step": 202994, "epoch": 4833} {"train_loss": -7.308361053466797, "global_step": 202995, "epoch": 4833} {"train_loss": -7.174971580505371, "global_step": 202996, "epoch": 4833} {"train_loss": -7.195932388305664, "global_step": 202997, "epoch": 4833} {"train_loss": -7.258338928222656, "global_step": 202998, "epoch": 4833} {"train_loss": -7.081006050109863, "global_step": 202999, "epoch": 4833} {"train_loss": -7.428407669067383, "global_step": 203000, "epoch": 4833} {"train_loss": -7.099947929382324, "global_step": 203001, "epoch": 4833} {"train_loss": -7.361550331115723, "global_step": 203002, "epoch": 4833} {"train_loss": -7.303560256958008, "global_step": 203003, "epoch": 4833} {"train_loss": -7.213481903076172, "global_step": 203004, "epoch": 4833} {"train_loss": -7.400293350219727, "global_step": 203005, "epoch": 4833} {"train_loss": -7.125782489776611, "global_step": 203006, "epoch": 4833} {"train_loss": -7.162546157836914, "global_step": 203007, "epoch": 4833} {"train_loss": -7.219757556915283, "global_step": 203008, "epoch": 4833} {"train_loss": -7.180255889892578, "global_step": 203009, "epoch": 4833} {"train_loss": -7.200817584991455, "global_step": 203010, "epoch": 4833} {"train_loss": -7.245260238647461, "global_step": 203011, "epoch": 4833} {"train_loss": -7.19143009185791, "global_step": 203012, "epoch": 4833} {"train_loss": -7.198812484741211, "global_step": 203013, "epoch": 4833} {"train_loss": -7.151279449462891, "global_step": 203014, "epoch": 4833} {"train_loss": -7.248530387878418, "global_step": 203015, "epoch": 4833} {"train_loss": -7.2660722732543945, "global_step": 203016, "epoch": 4833} {"train_loss": -7.30110502243042, "global_step": 203017, "epoch": 4833} {"train_loss": -7.294209957122803, "global_step": 203018, "epoch": 4833} {"train_loss": -7.2260284423828125, "global_step": 203019, "epoch": 4833} {"train_loss": -7.166712760925293, "global_step": 203020, "epoch": 4833} {"train_loss": -7.242195129394531, "global_step": 203021, "epoch": 4833} {"train_loss": -7.189558029174805, "global_step": 203022, "epoch": 4833} {"train_loss": -7.218327522277832, "global_step": 203023, "epoch": 4833} {"train_loss": -7.265987873077393, "global_step": 203024, "epoch": 4833} {"train_loss": -7.2396931648254395, "global_step": 203025, "epoch": 4833} {"train_loss": -7.259235382080078, "global_step": 203026, "epoch": 4833} {"train_loss": -7.254648594629197, "global_step": 203027, "epoch": 4833, "val_loss": 69883.78125} {"train_loss": -7.3473358154296875, "global_step": 203028, "epoch": 4834} {"train_loss": -7.217584133148193, "global_step": 203029, "epoch": 4834} {"train_loss": -7.262539386749268, "global_step": 203030, "epoch": 4834} {"train_loss": -7.203754425048828, "global_step": 203031, "epoch": 4834} {"train_loss": -7.212738037109375, "global_step": 203032, "epoch": 4834} {"train_loss": -7.372480869293213, "global_step": 203033, "epoch": 4834} {"train_loss": -7.299277305603027, "global_step": 203034, "epoch": 4834} {"train_loss": -7.1961493492126465, "global_step": 203035, "epoch": 4834} {"train_loss": -7.24276876449585, "global_step": 203036, "epoch": 4834} {"train_loss": -7.313055515289307, "global_step": 203037, "epoch": 4834} {"train_loss": -7.241020679473877, "global_step": 203038, "epoch": 4834} {"train_loss": -7.24721622467041, "global_step": 203039, "epoch": 4834} {"train_loss": -7.282881736755371, "global_step": 203040, "epoch": 4834} {"train_loss": -7.358241081237793, "global_step": 203041, "epoch": 4834} {"train_loss": -7.372852325439453, "global_step": 203042, "epoch": 4834} {"train_loss": -7.239185333251953, "global_step": 203043, "epoch": 4834} {"train_loss": -7.401994705200195, "global_step": 203044, "epoch": 4834} {"train_loss": -7.190240859985352, "global_step": 203045, "epoch": 4834} {"train_loss": -7.171740531921387, "global_step": 203046, "epoch": 4834} {"train_loss": -7.414498805999756, "global_step": 203047, "epoch": 4834} {"train_loss": -7.332829475402832, "global_step": 203048, "epoch": 4834} {"train_loss": -7.186725616455078, "global_step": 203049, "epoch": 4834} {"train_loss": -7.3096513748168945, "global_step": 203050, "epoch": 4834} {"train_loss": -7.249635696411133, "global_step": 203051, "epoch": 4834} {"train_loss": -7.365653038024902, "global_step": 203052, "epoch": 4834} {"train_loss": -7.281124114990234, "global_step": 203053, "epoch": 4834} {"train_loss": -7.3223419189453125, "global_step": 203054, "epoch": 4834} {"train_loss": -7.352071285247803, "global_step": 203055, "epoch": 4834} {"train_loss": -7.355468273162842, "global_step": 203056, "epoch": 4834} {"train_loss": -7.319789886474609, "global_step": 203057, "epoch": 4834} {"train_loss": -7.461355209350586, "global_step": 203058, "epoch": 4834} {"train_loss": -7.3557233810424805, "global_step": 203059, "epoch": 4834} {"train_loss": -7.1907124519348145, "global_step": 203060, "epoch": 4834} {"train_loss": -7.397193908691406, "global_step": 203061, "epoch": 4834} {"train_loss": -7.21932315826416, "global_step": 203062, "epoch": 4834} {"train_loss": -7.3934831619262695, "global_step": 203063, "epoch": 4834} {"train_loss": -7.375082015991211, "global_step": 203064, "epoch": 4834} {"train_loss": -7.15836238861084, "global_step": 203065, "epoch": 4834} {"train_loss": -7.453841686248779, "global_step": 203066, "epoch": 4834} {"train_loss": -7.220637321472168, "global_step": 203067, "epoch": 4834} {"train_loss": -7.287869453430176, "global_step": 203068, "epoch": 4834} {"train_loss": -7.29443883895874, "global_step": 203069, "epoch": 4834, "val_loss": 69900.9453125} {"train_loss": -7.136323928833008, "global_step": 203070, "epoch": 4835} {"train_loss": -7.2947516441345215, "global_step": 203071, "epoch": 4835} {"train_loss": -7.197452545166016, "global_step": 203072, "epoch": 4835} {"train_loss": -7.1645097732543945, "global_step": 203073, "epoch": 4835} {"train_loss": -7.332516670227051, "global_step": 203074, "epoch": 4835} {"train_loss": -7.370906352996826, "global_step": 203075, "epoch": 4835} {"train_loss": -7.287489891052246, "global_step": 203076, "epoch": 4835} {"train_loss": -7.331182956695557, "global_step": 203077, "epoch": 4835} {"train_loss": -7.310278415679932, "global_step": 203078, "epoch": 4835} {"train_loss": -7.242272853851318, "global_step": 203079, "epoch": 4835} {"train_loss": -7.387537956237793, "global_step": 203080, "epoch": 4835} {"train_loss": -7.4154052734375, "global_step": 203081, "epoch": 4835} {"train_loss": -7.202841758728027, "global_step": 203082, "epoch": 4835} {"train_loss": -7.285110950469971, "global_step": 203083, "epoch": 4835} {"train_loss": -7.294040679931641, "global_step": 203084, "epoch": 4835} {"train_loss": -7.228050231933594, "global_step": 203085, "epoch": 4835} {"train_loss": -7.285610675811768, "global_step": 203086, "epoch": 4835} {"train_loss": -7.419483184814453, "global_step": 203087, "epoch": 4835} {"train_loss": -7.285792350769043, "global_step": 203088, "epoch": 4835} {"train_loss": -7.367918014526367, "global_step": 203089, "epoch": 4835} {"train_loss": -7.318169593811035, "global_step": 203090, "epoch": 4835} {"train_loss": -7.26207160949707, "global_step": 203091, "epoch": 4835} {"train_loss": -7.316365718841553, "global_step": 203092, "epoch": 4835} {"train_loss": -7.252880096435547, "global_step": 203093, "epoch": 4835} {"train_loss": -7.292426586151123, "global_step": 203094, "epoch": 4835} {"train_loss": -7.338580131530762, "global_step": 203095, "epoch": 4835} {"train_loss": -7.360229969024658, "global_step": 203096, "epoch": 4835} {"train_loss": -7.338960647583008, "global_step": 203097, "epoch": 4835} {"train_loss": -7.309680938720703, "global_step": 203098, "epoch": 4835} {"train_loss": -7.323423385620117, "global_step": 203099, "epoch": 4835} {"train_loss": -7.371167182922363, "global_step": 203100, "epoch": 4835} {"train_loss": -7.328578948974609, "global_step": 203101, "epoch": 4835} {"train_loss": -7.3484368324279785, "global_step": 203102, "epoch": 4835} {"train_loss": -7.432250499725342, "global_step": 203103, "epoch": 4835} {"train_loss": -7.27532958984375, "global_step": 203104, "epoch": 4835} {"train_loss": -7.305911540985107, "global_step": 203105, "epoch": 4835} {"train_loss": -7.381837368011475, "global_step": 203106, "epoch": 4835} {"train_loss": -7.272159576416016, "global_step": 203107, "epoch": 4835} {"train_loss": -7.379255771636963, "global_step": 203108, "epoch": 4835} {"train_loss": -7.245734214782715, "global_step": 203109, "epoch": 4835} {"train_loss": -7.244409084320068, "global_step": 203110, "epoch": 4835} {"train_loss": -7.304745969318208, "global_step": 203111, "epoch": 4835, "val_loss": 69902.4921875} {"train_loss": -7.356003761291504, "global_step": 203112, "epoch": 4836} {"train_loss": -7.183290481567383, "global_step": 203113, "epoch": 4836} {"train_loss": -7.316303253173828, "global_step": 203114, "epoch": 4836} {"train_loss": -7.236759662628174, "global_step": 203115, "epoch": 4836} {"train_loss": -7.317044258117676, "global_step": 203116, "epoch": 4836} {"train_loss": -7.286078929901123, "global_step": 203117, "epoch": 4836} {"train_loss": -7.124624252319336, "global_step": 203118, "epoch": 4836} {"train_loss": -7.193670272827148, "global_step": 203119, "epoch": 4836} {"train_loss": -7.188586235046387, "global_step": 203120, "epoch": 4836} {"train_loss": -7.1420183181762695, "global_step": 203121, "epoch": 4836} {"train_loss": -7.208970069885254, "global_step": 203122, "epoch": 4836} {"train_loss": -7.307157516479492, "global_step": 203123, "epoch": 4836} {"train_loss": -7.19118595123291, "global_step": 203124, "epoch": 4836} {"train_loss": -7.106388568878174, "global_step": 203125, "epoch": 4836} {"train_loss": -7.218763828277588, "global_step": 203126, "epoch": 4836} {"train_loss": -7.076305389404297, "global_step": 203127, "epoch": 4836} {"train_loss": -7.1740498542785645, "global_step": 203128, "epoch": 4836} {"train_loss": -7.134822368621826, "global_step": 203129, "epoch": 4836} {"train_loss": -7.170133590698242, "global_step": 203130, "epoch": 4836} {"train_loss": -7.2704315185546875, "global_step": 203131, "epoch": 4836} {"train_loss": -7.07688045501709, "global_step": 203132, "epoch": 4836} {"train_loss": -7.371100425720215, "global_step": 203133, "epoch": 4836} {"train_loss": -7.308017730712891, "global_step": 203134, "epoch": 4836} {"train_loss": -7.35179328918457, "global_step": 203135, "epoch": 4836} {"train_loss": -7.397855758666992, "global_step": 203136, "epoch": 4836} {"train_loss": -7.316682815551758, "global_step": 203137, "epoch": 4836} {"train_loss": -7.2449140548706055, "global_step": 203138, "epoch": 4836} {"train_loss": -7.354351043701172, "global_step": 203139, "epoch": 4836} {"train_loss": -7.239670753479004, "global_step": 203140, "epoch": 4836} {"train_loss": -7.390514373779297, "global_step": 203141, "epoch": 4836} {"train_loss": -7.355695724487305, "global_step": 203142, "epoch": 4836} {"train_loss": -7.231217384338379, "global_step": 203143, "epoch": 4836} {"train_loss": -7.365945816040039, "global_step": 203144, "epoch": 4836} {"train_loss": -7.306124687194824, "global_step": 203145, "epoch": 4836} {"train_loss": -7.331974029541016, "global_step": 203146, "epoch": 4836} {"train_loss": -7.18197774887085, "global_step": 203147, "epoch": 4836} {"train_loss": -7.212494373321533, "global_step": 203148, "epoch": 4836} {"train_loss": -7.2123703956604, "global_step": 203149, "epoch": 4836} {"train_loss": -7.248147487640381, "global_step": 203150, "epoch": 4836} {"train_loss": -7.308759689331055, "global_step": 203151, "epoch": 4836} {"train_loss": -7.194314002990723, "global_step": 203152, "epoch": 4836} {"train_loss": -7.247950190589542, "global_step": 203153, "epoch": 4836, "val_loss": 69786.46875} {"train_loss": -7.207244873046875, "global_step": 203154, "epoch": 4837} {"train_loss": -7.056821823120117, "global_step": 203155, "epoch": 4837} {"train_loss": -7.1868181228637695, "global_step": 203156, "epoch": 4837} {"train_loss": -7.247495651245117, "global_step": 203157, "epoch": 4837} {"train_loss": -7.2136688232421875, "global_step": 203158, "epoch": 4837} {"train_loss": -7.1742706298828125, "global_step": 203159, "epoch": 4837} {"train_loss": -7.291249752044678, "global_step": 203160, "epoch": 4837} {"train_loss": -7.169480323791504, "global_step": 203161, "epoch": 4837} {"train_loss": -7.191971778869629, "global_step": 203162, "epoch": 4837} {"train_loss": -7.321536064147949, "global_step": 203163, "epoch": 4837} {"train_loss": -7.273445129394531, "global_step": 203164, "epoch": 4837} {"train_loss": -7.244065284729004, "global_step": 203165, "epoch": 4837} {"train_loss": -7.285273551940918, "global_step": 203166, "epoch": 4837} {"train_loss": -7.206425666809082, "global_step": 203167, "epoch": 4837} {"train_loss": -7.319019794464111, "global_step": 203168, "epoch": 4837} {"train_loss": -7.240940093994141, "global_step": 203169, "epoch": 4837} {"train_loss": -7.29274845123291, "global_step": 203170, "epoch": 4837} {"train_loss": -7.22170352935791, "global_step": 203171, "epoch": 4837} {"train_loss": -7.27741813659668, "global_step": 203172, "epoch": 4837} {"train_loss": -7.226802349090576, "global_step": 203173, "epoch": 4837} {"train_loss": -7.208865165710449, "global_step": 203174, "epoch": 4837} {"train_loss": -7.282227516174316, "global_step": 203175, "epoch": 4837} {"train_loss": -7.224597930908203, "global_step": 203176, "epoch": 4837} {"train_loss": -7.296039581298828, "global_step": 203177, "epoch": 4837} {"train_loss": -7.354503631591797, "global_step": 203178, "epoch": 4837} {"train_loss": -7.3722076416015625, "global_step": 203179, "epoch": 4837} {"train_loss": -7.3657755851745605, "global_step": 203180, "epoch": 4837} {"train_loss": -7.262331962585449, "global_step": 203181, "epoch": 4837} {"train_loss": -7.262554168701172, "global_step": 203182, "epoch": 4837} {"train_loss": -7.284109592437744, "global_step": 203183, "epoch": 4837} {"train_loss": -7.287456035614014, "global_step": 203184, "epoch": 4837} {"train_loss": -7.243224143981934, "global_step": 203185, "epoch": 4837} {"train_loss": -7.247855186462402, "global_step": 203186, "epoch": 4837} {"train_loss": -7.2960205078125, "global_step": 203187, "epoch": 4837} {"train_loss": -7.260406494140625, "global_step": 203188, "epoch": 4837} {"train_loss": -7.173313140869141, "global_step": 203189, "epoch": 4837} {"train_loss": -7.38642692565918, "global_step": 203190, "epoch": 4837} {"train_loss": -7.214621543884277, "global_step": 203191, "epoch": 4837} {"train_loss": -7.291589736938477, "global_step": 203192, "epoch": 4837} {"train_loss": -7.331229209899902, "global_step": 203193, "epoch": 4837} {"train_loss": -7.31289529800415, "global_step": 203194, "epoch": 4837} {"train_loss": -7.2591361204783125, "global_step": 203195, "epoch": 4837, "val_loss": 69910.4609375} {"train_loss": -7.4076247215271, "global_step": 203196, "epoch": 4838} {"train_loss": -7.2499189376831055, "global_step": 203197, "epoch": 4838} {"train_loss": -7.315468788146973, "global_step": 203198, "epoch": 4838} {"train_loss": -7.345644950866699, "global_step": 203199, "epoch": 4838} {"train_loss": -7.213630676269531, "global_step": 203200, "epoch": 4838} {"train_loss": -7.321428298950195, "global_step": 203201, "epoch": 4838} {"train_loss": -7.440403461456299, "global_step": 203202, "epoch": 4838} {"train_loss": -7.294114112854004, "global_step": 203203, "epoch": 4838} {"train_loss": -7.1067681312561035, "global_step": 203204, "epoch": 4838} {"train_loss": -7.358921527862549, "global_step": 203205, "epoch": 4838} {"train_loss": -7.207460403442383, "global_step": 203206, "epoch": 4838} {"train_loss": -7.240367889404297, "global_step": 203207, "epoch": 4838} {"train_loss": -7.303328514099121, "global_step": 203208, "epoch": 4838} {"train_loss": -7.247269630432129, "global_step": 203209, "epoch": 4838} {"train_loss": -7.33618688583374, "global_step": 203210, "epoch": 4838} {"train_loss": -7.269946098327637, "global_step": 203211, "epoch": 4838} {"train_loss": -7.138572692871094, "global_step": 203212, "epoch": 4838} {"train_loss": -7.2943925857543945, "global_step": 203213, "epoch": 4838} {"train_loss": -7.259641647338867, "global_step": 203214, "epoch": 4838} {"train_loss": -7.259883880615234, "global_step": 203215, "epoch": 4838} {"train_loss": -7.294299125671387, "global_step": 203216, "epoch": 4838} {"train_loss": -7.317557334899902, "global_step": 203217, "epoch": 4838} {"train_loss": -7.225894927978516, "global_step": 203218, "epoch": 4838} {"train_loss": -7.381692886352539, "global_step": 203219, "epoch": 4838} {"train_loss": -7.439931869506836, "global_step": 203220, "epoch": 4838} {"train_loss": -7.269002914428711, "global_step": 203221, "epoch": 4838} {"train_loss": -7.312592029571533, "global_step": 203222, "epoch": 4838} {"train_loss": -7.30217170715332, "global_step": 203223, "epoch": 4838} {"train_loss": -7.35414981842041, "global_step": 203224, "epoch": 4838} {"train_loss": -7.184558868408203, "global_step": 203225, "epoch": 4838} {"train_loss": -7.256208419799805, "global_step": 203226, "epoch": 4838} {"train_loss": -7.306407928466797, "global_step": 203227, "epoch": 4838} {"train_loss": -7.21794319152832, "global_step": 203228, "epoch": 4838} {"train_loss": -7.0799102783203125, "global_step": 203229, "epoch": 4838} {"train_loss": -7.320120811462402, "global_step": 203230, "epoch": 4838} {"train_loss": -7.154017925262451, "global_step": 203231, "epoch": 4838} {"train_loss": -7.273951053619385, "global_step": 203232, "epoch": 4838} {"train_loss": -7.2919158935546875, "global_step": 203233, "epoch": 4838} {"train_loss": -7.216343879699707, "global_step": 203234, "epoch": 4838} {"train_loss": -7.2851433753967285, "global_step": 203235, "epoch": 4838} {"train_loss": -7.369255542755127, "global_step": 203236, "epoch": 4838} {"train_loss": -7.277696030480521, "global_step": 203237, "epoch": 4838, "val_loss": 69772.640625} {"train_loss": -7.288808822631836, "global_step": 203238, "epoch": 4839} {"train_loss": -7.383326530456543, "global_step": 203239, "epoch": 4839} {"train_loss": -7.330463886260986, "global_step": 203240, "epoch": 4839} {"train_loss": -7.339210510253906, "global_step": 203241, "epoch": 4839} {"train_loss": -7.264875411987305, "global_step": 203242, "epoch": 4839} {"train_loss": -7.438623905181885, "global_step": 203243, "epoch": 4839} {"train_loss": -7.189702033996582, "global_step": 203244, "epoch": 4839} {"train_loss": -7.342067241668701, "global_step": 203245, "epoch": 4839} {"train_loss": -7.2655439376831055, "global_step": 203246, "epoch": 4839} {"train_loss": -7.241938591003418, "global_step": 203247, "epoch": 4839} {"train_loss": -7.300250053405762, "global_step": 203248, "epoch": 4839} {"train_loss": -7.090030193328857, "global_step": 203249, "epoch": 4839} {"train_loss": -7.2386369705200195, "global_step": 203250, "epoch": 4839} {"train_loss": -7.265523910522461, "global_step": 203251, "epoch": 4839} {"train_loss": -7.206564903259277, "global_step": 203252, "epoch": 4839} {"train_loss": -7.253011226654053, "global_step": 203253, "epoch": 4839} {"train_loss": -7.244366645812988, "global_step": 203254, "epoch": 4839} {"train_loss": -7.261472702026367, "global_step": 203255, "epoch": 4839} {"train_loss": -7.298477649688721, "global_step": 203256, "epoch": 4839} {"train_loss": -7.148612022399902, "global_step": 203257, "epoch": 4839} {"train_loss": -7.212290287017822, "global_step": 203258, "epoch": 4839} {"train_loss": -7.215151786804199, "global_step": 203259, "epoch": 4839} {"train_loss": -7.266182899475098, "global_step": 203260, "epoch": 4839} {"train_loss": -7.196950912475586, "global_step": 203261, "epoch": 4839} {"train_loss": -7.236635208129883, "global_step": 203262, "epoch": 4839} {"train_loss": -7.284494400024414, "global_step": 203263, "epoch": 4839} {"train_loss": -7.310817718505859, "global_step": 203264, "epoch": 4839} {"train_loss": -7.347451210021973, "global_step": 203265, "epoch": 4839} {"train_loss": -7.220679759979248, "global_step": 203266, "epoch": 4839} {"train_loss": -7.277300834655762, "global_step": 203267, "epoch": 4839} {"train_loss": -7.287419319152832, "global_step": 203268, "epoch": 4839} {"train_loss": -7.257107257843018, "global_step": 203269, "epoch": 4839} {"train_loss": -7.295942306518555, "global_step": 203270, "epoch": 4839} {"train_loss": -7.28972864151001, "global_step": 203271, "epoch": 4839} {"train_loss": -7.249231338500977, "global_step": 203272, "epoch": 4839} {"train_loss": -7.153002738952637, "global_step": 203273, "epoch": 4839} {"train_loss": -7.2421770095825195, "global_step": 203274, "epoch": 4839} {"train_loss": -7.250556468963623, "global_step": 203275, "epoch": 4839} {"train_loss": -7.331032752990723, "global_step": 203276, "epoch": 4839} {"train_loss": -7.22315788269043, "global_step": 203277, "epoch": 4839} {"train_loss": -7.147618293762207, "global_step": 203278, "epoch": 4839} {"train_loss": -7.258353210630871, "global_step": 203279, "epoch": 4839, "val_loss": 69804.6484375} {"train_loss": -7.08651065826416, "global_step": 203280, "epoch": 4840} {"train_loss": -7.329853057861328, "global_step": 203281, "epoch": 4840} {"train_loss": -7.088757038116455, "global_step": 203282, "epoch": 4840} {"train_loss": -7.177897930145264, "global_step": 203283, "epoch": 4840} {"train_loss": -7.270839691162109, "global_step": 203284, "epoch": 4840} {"train_loss": -7.318838119506836, "global_step": 203285, "epoch": 4840} {"train_loss": -7.335387706756592, "global_step": 203286, "epoch": 4840} {"train_loss": -7.230172634124756, "global_step": 203287, "epoch": 4840} {"train_loss": -7.1900529861450195, "global_step": 203288, "epoch": 4840} {"train_loss": -7.281593322753906, "global_step": 203289, "epoch": 4840} {"train_loss": -7.200119972229004, "global_step": 203290, "epoch": 4840} {"train_loss": -7.234289169311523, "global_step": 203291, "epoch": 4840} {"train_loss": -7.253915786743164, "global_step": 203292, "epoch": 4840} {"train_loss": -7.177031517028809, "global_step": 203293, "epoch": 4840} {"train_loss": -7.307960033416748, "global_step": 203294, "epoch": 4840} {"train_loss": -7.160876274108887, "global_step": 203295, "epoch": 4840} {"train_loss": -7.207885265350342, "global_step": 203296, "epoch": 4840} {"train_loss": -7.285409927368164, "global_step": 203297, "epoch": 4840} {"train_loss": -7.289912223815918, "global_step": 203298, "epoch": 4840} {"train_loss": -7.298854827880859, "global_step": 203299, "epoch": 4840} {"train_loss": -7.304003715515137, "global_step": 203300, "epoch": 4840} {"train_loss": -7.26744270324707, "global_step": 203301, "epoch": 4840} {"train_loss": -7.280226707458496, "global_step": 203302, "epoch": 4840} {"train_loss": -7.367574691772461, "global_step": 203303, "epoch": 4840} {"train_loss": -7.152632236480713, "global_step": 203304, "epoch": 4840} {"train_loss": -7.326581954956055, "global_step": 203305, "epoch": 4840} {"train_loss": -7.309568405151367, "global_step": 203306, "epoch": 4840} {"train_loss": -7.368971347808838, "global_step": 203307, "epoch": 4840} {"train_loss": -7.371334075927734, "global_step": 203308, "epoch": 4840} {"train_loss": -7.281520366668701, "global_step": 203309, "epoch": 4840} {"train_loss": -7.390219688415527, "global_step": 203310, "epoch": 4840} {"train_loss": -7.21048641204834, "global_step": 203311, "epoch": 4840} {"train_loss": -7.276481628417969, "global_step": 203312, "epoch": 4840} {"train_loss": -7.313094139099121, "global_step": 203313, "epoch": 4840} {"train_loss": -7.282941818237305, "global_step": 203314, "epoch": 4840} {"train_loss": -7.342730522155762, "global_step": 203315, "epoch": 4840} {"train_loss": -7.249813556671143, "global_step": 203316, "epoch": 4840} {"train_loss": -7.453621864318848, "global_step": 203317, "epoch": 4840} {"train_loss": -7.253839015960693, "global_step": 203318, "epoch": 4840} {"train_loss": -7.385626792907715, "global_step": 203319, "epoch": 4840} {"train_loss": -7.354640007019043, "global_step": 203320, "epoch": 4840} {"train_loss": -7.277141775403704, "global_step": 203321, "epoch": 4840, "val_loss": 69889.375} {"train_loss": -7.195003032684326, "global_step": 203322, "epoch": 4841} {"train_loss": -7.341468811035156, "global_step": 203323, "epoch": 4841} {"train_loss": -7.38145637512207, "global_step": 203324, "epoch": 4841} {"train_loss": -7.214654445648193, "global_step": 203325, "epoch": 4841} {"train_loss": -7.2955803871154785, "global_step": 203326, "epoch": 4841} {"train_loss": -7.370909690856934, "global_step": 203327, "epoch": 4841} {"train_loss": -7.453555583953857, "global_step": 203328, "epoch": 4841} {"train_loss": -7.353302955627441, "global_step": 203329, "epoch": 4841} {"train_loss": -7.312126636505127, "global_step": 203330, "epoch": 4841} {"train_loss": -7.278197288513184, "global_step": 203331, "epoch": 4841} {"train_loss": -7.211075782775879, "global_step": 203332, "epoch": 4841} {"train_loss": -7.453433513641357, "global_step": 203333, "epoch": 4841} {"train_loss": -7.355226039886475, "global_step": 203334, "epoch": 4841} {"train_loss": -7.2743120193481445, "global_step": 203335, "epoch": 4841} {"train_loss": -7.506021499633789, "global_step": 203336, "epoch": 4841} {"train_loss": -7.278676986694336, "global_step": 203337, "epoch": 4841} {"train_loss": -7.318088531494141, "global_step": 203338, "epoch": 4841} {"train_loss": -7.386804580688477, "global_step": 203339, "epoch": 4841} {"train_loss": -7.264988899230957, "global_step": 203340, "epoch": 4841} {"train_loss": -7.2629475593566895, "global_step": 203341, "epoch": 4841} {"train_loss": -7.325014114379883, "global_step": 203342, "epoch": 4841} {"train_loss": -7.26458215713501, "global_step": 203343, "epoch": 4841} {"train_loss": -7.306211948394775, "global_step": 203344, "epoch": 4841} {"train_loss": -7.197264671325684, "global_step": 203345, "epoch": 4841} {"train_loss": -7.331765174865723, "global_step": 203346, "epoch": 4841} {"train_loss": -7.427908420562744, "global_step": 203347, "epoch": 4841} {"train_loss": -7.272549629211426, "global_step": 203348, "epoch": 4841} {"train_loss": -7.3097100257873535, "global_step": 203349, "epoch": 4841} {"train_loss": -7.216263771057129, "global_step": 203350, "epoch": 4841} {"train_loss": -7.296584606170654, "global_step": 203351, "epoch": 4841} {"train_loss": -7.379999160766602, "global_step": 203352, "epoch": 4841} {"train_loss": -7.257858753204346, "global_step": 203353, "epoch": 4841} {"train_loss": -7.37315559387207, "global_step": 203354, "epoch": 4841} {"train_loss": -7.333209037780762, "global_step": 203355, "epoch": 4841} {"train_loss": -7.302447319030762, "global_step": 203356, "epoch": 4841} {"train_loss": -7.511989116668701, "global_step": 203357, "epoch": 4841} {"train_loss": -7.265381813049316, "global_step": 203358, "epoch": 4841} {"train_loss": -7.301564693450928, "global_step": 203359, "epoch": 4841} {"train_loss": -7.337079048156738, "global_step": 203360, "epoch": 4841} {"train_loss": -7.20872688293457, "global_step": 203361, "epoch": 4841} {"train_loss": -7.161783218383789, "global_step": 203362, "epoch": 4841} {"train_loss": -7.313281695048015, "global_step": 203363, "epoch": 4841, "val_loss": 69857.703125} {"train_loss": -7.269627094268799, "global_step": 203364, "epoch": 4842} {"train_loss": -7.224251747131348, "global_step": 203365, "epoch": 4842} {"train_loss": -7.161619186401367, "global_step": 203366, "epoch": 4842} {"train_loss": -7.193320274353027, "global_step": 203367, "epoch": 4842} {"train_loss": -7.280125617980957, "global_step": 203368, "epoch": 4842} {"train_loss": -7.278494358062744, "global_step": 203369, "epoch": 4842} {"train_loss": -7.155341148376465, "global_step": 203370, "epoch": 4842} {"train_loss": -7.13730001449585, "global_step": 203371, "epoch": 4842} {"train_loss": -7.068941116333008, "global_step": 203372, "epoch": 4842} {"train_loss": -7.264634132385254, "global_step": 203373, "epoch": 4842} {"train_loss": -7.161619186401367, "global_step": 203374, "epoch": 4842} {"train_loss": -7.172707557678223, "global_step": 203375, "epoch": 4842} {"train_loss": -7.254474639892578, "global_step": 203376, "epoch": 4842} {"train_loss": -7.025760650634766, "global_step": 203377, "epoch": 4842} {"train_loss": -7.21809720993042, "global_step": 203378, "epoch": 4842} {"train_loss": -7.297441482543945, "global_step": 203379, "epoch": 4842} {"train_loss": -7.28356409072876, "global_step": 203380, "epoch": 4842} {"train_loss": -7.2090864181518555, "global_step": 203381, "epoch": 4842} {"train_loss": -7.335180282592773, "global_step": 203382, "epoch": 4842} {"train_loss": -7.338535308837891, "global_step": 203383, "epoch": 4842} {"train_loss": -7.309481143951416, "global_step": 203384, "epoch": 4842} {"train_loss": -7.290087699890137, "global_step": 203385, "epoch": 4842} {"train_loss": -7.301891326904297, "global_step": 203386, "epoch": 4842} {"train_loss": -7.240795135498047, "global_step": 203387, "epoch": 4842} {"train_loss": -7.235065937042236, "global_step": 203388, "epoch": 4842} {"train_loss": -7.335364818572998, "global_step": 203389, "epoch": 4842} {"train_loss": -7.309892654418945, "global_step": 203390, "epoch": 4842} {"train_loss": -7.318881511688232, "global_step": 203391, "epoch": 4842} {"train_loss": -7.403779029846191, "global_step": 203392, "epoch": 4842} {"train_loss": -7.316176891326904, "global_step": 203393, "epoch": 4842} {"train_loss": -7.30833625793457, "global_step": 203394, "epoch": 4842} {"train_loss": -7.338608741760254, "global_step": 203395, "epoch": 4842} {"train_loss": -7.362266540527344, "global_step": 203396, "epoch": 4842} {"train_loss": -7.285099029541016, "global_step": 203397, "epoch": 4842} {"train_loss": -7.320633888244629, "global_step": 203398, "epoch": 4842} {"train_loss": -7.327836990356445, "global_step": 203399, "epoch": 4842} {"train_loss": -7.375067234039307, "global_step": 203400, "epoch": 4842} {"train_loss": -7.373004913330078, "global_step": 203401, "epoch": 4842} {"train_loss": -7.358068466186523, "global_step": 203402, "epoch": 4842} {"train_loss": -7.270959854125977, "global_step": 203403, "epoch": 4842} {"train_loss": -7.247469902038574, "global_step": 203404, "epoch": 4842} {"train_loss": -7.268901677358718, "global_step": 203405, "epoch": 4842, "val_loss": 69764.921875} {"train_loss": -7.351775169372559, "global_step": 203406, "epoch": 4843} {"train_loss": -7.344488620758057, "global_step": 203407, "epoch": 4843} {"train_loss": -7.37713098526001, "global_step": 203408, "epoch": 4843} {"train_loss": -7.310538291931152, "global_step": 203409, "epoch": 4843} {"train_loss": -7.397353172302246, "global_step": 203410, "epoch": 4843} {"train_loss": -7.270874500274658, "global_step": 203411, "epoch": 4843} {"train_loss": -7.267167091369629, "global_step": 203412, "epoch": 4843} {"train_loss": -7.36226749420166, "global_step": 203413, "epoch": 4843} {"train_loss": -7.448639392852783, "global_step": 203414, "epoch": 4843} {"train_loss": -7.36231803894043, "global_step": 203415, "epoch": 4843} {"train_loss": -7.425232887268066, "global_step": 203416, "epoch": 4843} {"train_loss": -7.249356746673584, "global_step": 203417, "epoch": 4843} {"train_loss": -7.281672477722168, "global_step": 203418, "epoch": 4843} {"train_loss": -7.375759124755859, "global_step": 203419, "epoch": 4843} {"train_loss": -7.204273223876953, "global_step": 203420, "epoch": 4843} {"train_loss": -7.273838996887207, "global_step": 203421, "epoch": 4843} {"train_loss": -7.262538909912109, "global_step": 203422, "epoch": 4843} {"train_loss": -7.193526744842529, "global_step": 203423, "epoch": 4843} {"train_loss": -7.249638557434082, "global_step": 203424, "epoch": 4843} {"train_loss": -7.168846130371094, "global_step": 203425, "epoch": 4843} {"train_loss": -7.165153503417969, "global_step": 203426, "epoch": 4843} {"train_loss": -7.246925354003906, "global_step": 203427, "epoch": 4843} {"train_loss": -7.172611713409424, "global_step": 203428, "epoch": 4843} {"train_loss": -7.23977518081665, "global_step": 203429, "epoch": 4843} {"train_loss": -7.183762550354004, "global_step": 203430, "epoch": 4843} {"train_loss": -7.144893169403076, "global_step": 203431, "epoch": 4843} {"train_loss": -7.2662835121154785, "global_step": 203432, "epoch": 4843} {"train_loss": -7.239965438842773, "global_step": 203433, "epoch": 4843} {"train_loss": -7.31081485748291, "global_step": 203434, "epoch": 4843} {"train_loss": -7.240955352783203, "global_step": 203435, "epoch": 4843} {"train_loss": -7.189587593078613, "global_step": 203436, "epoch": 4843} {"train_loss": -7.202098369598389, "global_step": 203437, "epoch": 4843} {"train_loss": -7.300412178039551, "global_step": 203438, "epoch": 4843} {"train_loss": -7.192785739898682, "global_step": 203439, "epoch": 4843} {"train_loss": -7.137110233306885, "global_step": 203440, "epoch": 4843} {"train_loss": -7.216127872467041, "global_step": 203441, "epoch": 4843} {"train_loss": -7.143677234649658, "global_step": 203442, "epoch": 4843} {"train_loss": -7.283576965332031, "global_step": 203443, "epoch": 4843} {"train_loss": -7.146976470947266, "global_step": 203444, "epoch": 4843} {"train_loss": -7.242719650268555, "global_step": 203445, "epoch": 4843} {"train_loss": -7.181626319885254, "global_step": 203446, "epoch": 4843} {"train_loss": -7.257049935204642, "global_step": 203447, "epoch": 4843, "val_loss": 69966.6484375} {"train_loss": -7.329657077789307, "global_step": 203448, "epoch": 4844} {"train_loss": -7.12106990814209, "global_step": 203449, "epoch": 4844} {"train_loss": -7.270340919494629, "global_step": 203450, "epoch": 4844} {"train_loss": -7.288449287414551, "global_step": 203451, "epoch": 4844} {"train_loss": -7.250785827636719, "global_step": 203452, "epoch": 4844} {"train_loss": -7.383950233459473, "global_step": 203453, "epoch": 4844} {"train_loss": -7.238500595092773, "global_step": 203454, "epoch": 4844} {"train_loss": -7.219453811645508, "global_step": 203455, "epoch": 4844} {"train_loss": -7.251951217651367, "global_step": 203456, "epoch": 4844} {"train_loss": -7.362990379333496, "global_step": 203457, "epoch": 4844} {"train_loss": -7.237259864807129, "global_step": 203458, "epoch": 4844} {"train_loss": -7.36046028137207, "global_step": 203459, "epoch": 4844} {"train_loss": -7.286399841308594, "global_step": 203460, "epoch": 4844} {"train_loss": -7.273871421813965, "global_step": 203461, "epoch": 4844} {"train_loss": -7.3577728271484375, "global_step": 203462, "epoch": 4844} {"train_loss": -7.3483710289001465, "global_step": 203463, "epoch": 4844} {"train_loss": -7.256235122680664, "global_step": 203464, "epoch": 4844} {"train_loss": -7.327353477478027, "global_step": 203465, "epoch": 4844} {"train_loss": -7.428581237792969, "global_step": 203466, "epoch": 4844} {"train_loss": -7.328103065490723, "global_step": 203467, "epoch": 4844} {"train_loss": -7.372100353240967, "global_step": 203468, "epoch": 4844} {"train_loss": -7.35679817199707, "global_step": 203469, "epoch": 4844} {"train_loss": -7.3950910568237305, "global_step": 203470, "epoch": 4844} {"train_loss": -7.314607620239258, "global_step": 203471, "epoch": 4844} {"train_loss": -7.294619560241699, "global_step": 203472, "epoch": 4844} {"train_loss": -7.400112628936768, "global_step": 203473, "epoch": 4844} {"train_loss": -7.3713178634643555, "global_step": 203474, "epoch": 4844} {"train_loss": -7.343358993530273, "global_step": 203475, "epoch": 4844} {"train_loss": -7.283058166503906, "global_step": 203476, "epoch": 4844} {"train_loss": -7.331458568572998, "global_step": 203477, "epoch": 4844} {"train_loss": -7.268815994262695, "global_step": 203478, "epoch": 4844} {"train_loss": -7.183849334716797, "global_step": 203479, "epoch": 4844} {"train_loss": -7.342458248138428, "global_step": 203480, "epoch": 4844} {"train_loss": -7.26129150390625, "global_step": 203481, "epoch": 4844} {"train_loss": -7.287062644958496, "global_step": 203482, "epoch": 4844} {"train_loss": -7.282605171203613, "global_step": 203483, "epoch": 4844} {"train_loss": -7.260158538818359, "global_step": 203484, "epoch": 4844} {"train_loss": -7.322024345397949, "global_step": 203485, "epoch": 4844} {"train_loss": -7.400393009185791, "global_step": 203486, "epoch": 4844} {"train_loss": -7.322052001953125, "global_step": 203487, "epoch": 4844} {"train_loss": -7.427748203277588, "global_step": 203488, "epoch": 4844} {"train_loss": -7.310827266602289, "global_step": 203489, "epoch": 4844, "val_loss": 69948.71875} {"train_loss": -7.487959861755371, "global_step": 203490, "epoch": 4845} {"train_loss": -7.383869171142578, "global_step": 203491, "epoch": 4845} {"train_loss": -7.3858232498168945, "global_step": 203492, "epoch": 4845} {"train_loss": -7.39045524597168, "global_step": 203493, "epoch": 4845} {"train_loss": -7.339069366455078, "global_step": 203494, "epoch": 4845} {"train_loss": -7.347744941711426, "global_step": 203495, "epoch": 4845} {"train_loss": -7.343488693237305, "global_step": 203496, "epoch": 4845} {"train_loss": -7.28413724899292, "global_step": 203497, "epoch": 4845} {"train_loss": -7.376551628112793, "global_step": 203498, "epoch": 4845} {"train_loss": -7.430171966552734, "global_step": 203499, "epoch": 4845} {"train_loss": -7.393978595733643, "global_step": 203500, "epoch": 4845} {"train_loss": -7.414762496948242, "global_step": 203501, "epoch": 4845} {"train_loss": -7.300684452056885, "global_step": 203502, "epoch": 4845} {"train_loss": -7.2614216804504395, "global_step": 203503, "epoch": 4845} {"train_loss": -7.2455854415893555, "global_step": 203504, "epoch": 4845} {"train_loss": -7.365593433380127, "global_step": 203505, "epoch": 4845} {"train_loss": -7.311387062072754, "global_step": 203506, "epoch": 4845} {"train_loss": -7.318678379058838, "global_step": 203507, "epoch": 4845} {"train_loss": -7.295823097229004, "global_step": 203508, "epoch": 4845} {"train_loss": -7.285935401916504, "global_step": 203509, "epoch": 4845} {"train_loss": -7.274698257446289, "global_step": 203510, "epoch": 4845} {"train_loss": -7.271825790405273, "global_step": 203511, "epoch": 4845} {"train_loss": -7.259078025817871, "global_step": 203512, "epoch": 4845} {"train_loss": -7.407163619995117, "global_step": 203513, "epoch": 4845} {"train_loss": -7.454645156860352, "global_step": 203514, "epoch": 4845} {"train_loss": -7.256584644317627, "global_step": 203515, "epoch": 4845} {"train_loss": -7.345058441162109, "global_step": 203516, "epoch": 4845} {"train_loss": -7.320828914642334, "global_step": 203517, "epoch": 4845} {"train_loss": -7.326875686645508, "global_step": 203518, "epoch": 4845} {"train_loss": -7.331992149353027, "global_step": 203519, "epoch": 4845} {"train_loss": -7.321989059448242, "global_step": 203520, "epoch": 4845} {"train_loss": -7.382381439208984, "global_step": 203521, "epoch": 4845} {"train_loss": -7.331389904022217, "global_step": 203522, "epoch": 4845} {"train_loss": -7.227487564086914, "global_step": 203523, "epoch": 4845} {"train_loss": -7.164697170257568, "global_step": 203524, "epoch": 4845} {"train_loss": -7.235674858093262, "global_step": 203525, "epoch": 4845} {"train_loss": -7.318904876708984, "global_step": 203526, "epoch": 4845} {"train_loss": -7.07432746887207, "global_step": 203527, "epoch": 4845} {"train_loss": -7.217462539672852, "global_step": 203528, "epoch": 4845} {"train_loss": -7.317907333374023, "global_step": 203529, "epoch": 4845} {"train_loss": -7.156030654907227, "global_step": 203530, "epoch": 4845} {"train_loss": -7.315255278632755, "global_step": 203531, "epoch": 4845, "val_loss": 69923.375} {"train_loss": -7.237368583679199, "global_step": 203532, "epoch": 4846} {"train_loss": -7.416232109069824, "global_step": 203533, "epoch": 4846} {"train_loss": -7.219254493713379, "global_step": 203534, "epoch": 4846} {"train_loss": -7.235220432281494, "global_step": 203535, "epoch": 4846} {"train_loss": -7.291492462158203, "global_step": 203536, "epoch": 4846} {"train_loss": -7.273409366607666, "global_step": 203537, "epoch": 4846} {"train_loss": -7.281443119049072, "global_step": 203538, "epoch": 4846} {"train_loss": -7.322717666625977, "global_step": 203539, "epoch": 4846} {"train_loss": -7.324858665466309, "global_step": 203540, "epoch": 4846} {"train_loss": -7.306676864624023, "global_step": 203541, "epoch": 4846} {"train_loss": -7.203463554382324, "global_step": 203542, "epoch": 4846} {"train_loss": -7.248482704162598, "global_step": 203543, "epoch": 4846} {"train_loss": -7.324348449707031, "global_step": 203544, "epoch": 4846} {"train_loss": -7.285862445831299, "global_step": 203545, "epoch": 4846} {"train_loss": -7.27277946472168, "global_step": 203546, "epoch": 4846} {"train_loss": -7.278511047363281, "global_step": 203547, "epoch": 4846} {"train_loss": -7.325927734375, "global_step": 203548, "epoch": 4846} {"train_loss": -7.1794352531433105, "global_step": 203549, "epoch": 4846} {"train_loss": -7.334293842315674, "global_step": 203550, "epoch": 4846} {"train_loss": -7.219799041748047, "global_step": 203551, "epoch": 4846} {"train_loss": -7.292804718017578, "global_step": 203552, "epoch": 4846} {"train_loss": -7.344882011413574, "global_step": 203553, "epoch": 4846} {"train_loss": -7.213952541351318, "global_step": 203554, "epoch": 4846} {"train_loss": -7.184553146362305, "global_step": 203555, "epoch": 4846} {"train_loss": -7.182894706726074, "global_step": 203556, "epoch": 4846} {"train_loss": -7.204054832458496, "global_step": 203557, "epoch": 4846} {"train_loss": -7.23482608795166, "global_step": 203558, "epoch": 4846} {"train_loss": -7.174177169799805, "global_step": 203559, "epoch": 4846} {"train_loss": -7.235065460205078, "global_step": 203560, "epoch": 4846} {"train_loss": -7.1280903816223145, "global_step": 203561, "epoch": 4846} {"train_loss": -7.076763153076172, "global_step": 203562, "epoch": 4846} {"train_loss": -7.253882884979248, "global_step": 203563, "epoch": 4846} {"train_loss": -7.1250410079956055, "global_step": 203564, "epoch": 4846} {"train_loss": -7.127628326416016, "global_step": 203565, "epoch": 4846} {"train_loss": -7.238495826721191, "global_step": 203566, "epoch": 4846} {"train_loss": -7.196910858154297, "global_step": 203567, "epoch": 4846} {"train_loss": -7.31979513168335, "global_step": 203568, "epoch": 4846} {"train_loss": -7.1572651863098145, "global_step": 203569, "epoch": 4846} {"train_loss": -7.268271446228027, "global_step": 203570, "epoch": 4846} {"train_loss": -7.129136562347412, "global_step": 203571, "epoch": 4846} {"train_loss": -7.2707085609436035, "global_step": 203572, "epoch": 4846} {"train_loss": -7.243487312680199, "global_step": 203573, "epoch": 4846, "val_loss": 70028.0390625} {"train_loss": -7.361780166625977, "global_step": 203574, "epoch": 4847} {"train_loss": -7.147919654846191, "global_step": 203575, "epoch": 4847} {"train_loss": -7.252012252807617, "global_step": 203576, "epoch": 4847} {"train_loss": -7.360251426696777, "global_step": 203577, "epoch": 4847} {"train_loss": -7.216369152069092, "global_step": 203578, "epoch": 4847} {"train_loss": -7.325750827789307, "global_step": 203579, "epoch": 4847} {"train_loss": -7.270719528198242, "global_step": 203580, "epoch": 4847} {"train_loss": -7.303494453430176, "global_step": 203581, "epoch": 4847} {"train_loss": -7.376992225646973, "global_step": 203582, "epoch": 4847} {"train_loss": -7.313239097595215, "global_step": 203583, "epoch": 4847} {"train_loss": -7.3277130126953125, "global_step": 203584, "epoch": 4847} {"train_loss": -7.2531561851501465, "global_step": 203585, "epoch": 4847} {"train_loss": -7.283377170562744, "global_step": 203586, "epoch": 4847} {"train_loss": -7.349418640136719, "global_step": 203587, "epoch": 4847} {"train_loss": -7.1992082595825195, "global_step": 203588, "epoch": 4847} {"train_loss": -7.312138557434082, "global_step": 203589, "epoch": 4847} {"train_loss": -7.303606033325195, "global_step": 203590, "epoch": 4847} {"train_loss": -7.25956916809082, "global_step": 203591, "epoch": 4847} {"train_loss": -7.38032341003418, "global_step": 203592, "epoch": 4847} {"train_loss": -7.218791961669922, "global_step": 203593, "epoch": 4847} {"train_loss": -7.320503234863281, "global_step": 203594, "epoch": 4847} {"train_loss": -7.341869831085205, "global_step": 203595, "epoch": 4847} {"train_loss": -7.275125026702881, "global_step": 203596, "epoch": 4847} {"train_loss": -7.213015556335449, "global_step": 203597, "epoch": 4847} {"train_loss": -7.304521083831787, "global_step": 203598, "epoch": 4847} {"train_loss": -7.308692932128906, "global_step": 203599, "epoch": 4847} {"train_loss": -7.247718334197998, "global_step": 203600, "epoch": 4847} {"train_loss": -7.249159812927246, "global_step": 203601, "epoch": 4847} {"train_loss": -7.330474853515625, "global_step": 203602, "epoch": 4847} {"train_loss": -7.269820213317871, "global_step": 203603, "epoch": 4847} {"train_loss": -7.189572334289551, "global_step": 203604, "epoch": 4847} {"train_loss": -7.327479839324951, "global_step": 203605, "epoch": 4847} {"train_loss": -7.183363914489746, "global_step": 203606, "epoch": 4847} {"train_loss": -7.330634593963623, "global_step": 203607, "epoch": 4847} {"train_loss": -7.250048637390137, "global_step": 203608, "epoch": 4847} {"train_loss": -7.399833679199219, "global_step": 203609, "epoch": 4847} {"train_loss": -7.283394813537598, "global_step": 203610, "epoch": 4847} {"train_loss": -7.343103408813477, "global_step": 203611, "epoch": 4847} {"train_loss": -7.264962196350098, "global_step": 203612, "epoch": 4847} {"train_loss": -7.234960556030273, "global_step": 203613, "epoch": 4847} {"train_loss": -7.258620738983154, "global_step": 203614, "epoch": 4847} {"train_loss": -7.284948246819632, "global_step": 203615, "epoch": 4847, "val_loss": 69997.140625} {"train_loss": -7.363781929016113, "global_step": 203616, "epoch": 4848} {"train_loss": -7.272043228149414, "global_step": 203617, "epoch": 4848} {"train_loss": -7.150259971618652, "global_step": 203618, "epoch": 4848} {"train_loss": -7.169037818908691, "global_step": 203619, "epoch": 4848} {"train_loss": -7.156424522399902, "global_step": 203620, "epoch": 4848} {"train_loss": -7.196688652038574, "global_step": 203621, "epoch": 4848} {"train_loss": -7.1092047691345215, "global_step": 203622, "epoch": 4848} {"train_loss": -7.209985733032227, "global_step": 203623, "epoch": 4848} {"train_loss": -7.168152809143066, "global_step": 203624, "epoch": 4848} {"train_loss": -7.177319526672363, "global_step": 203625, "epoch": 4848} {"train_loss": -7.141510009765625, "global_step": 203626, "epoch": 4848} {"train_loss": -7.295636177062988, "global_step": 203627, "epoch": 4848} {"train_loss": -7.305147647857666, "global_step": 203628, "epoch": 4848} {"train_loss": -7.259212493896484, "global_step": 203629, "epoch": 4848} {"train_loss": -7.286423683166504, "global_step": 203630, "epoch": 4848} {"train_loss": -7.16745662689209, "global_step": 203631, "epoch": 4848} {"train_loss": -7.076845169067383, "global_step": 203632, "epoch": 4848} {"train_loss": -7.192997932434082, "global_step": 203633, "epoch": 4848} {"train_loss": -7.160816669464111, "global_step": 203634, "epoch": 4848} {"train_loss": -7.198354721069336, "global_step": 203635, "epoch": 4848} {"train_loss": -7.284087657928467, "global_step": 203636, "epoch": 4848} {"train_loss": -7.29841423034668, "global_step": 203637, "epoch": 4848} {"train_loss": -7.191428184509277, "global_step": 203638, "epoch": 4848} {"train_loss": -7.485480308532715, "global_step": 203639, "epoch": 4848} {"train_loss": -7.269397735595703, "global_step": 203640, "epoch": 4848} {"train_loss": -7.280372619628906, "global_step": 203641, "epoch": 4848} {"train_loss": -7.21196985244751, "global_step": 203642, "epoch": 4848} {"train_loss": -7.320254325866699, "global_step": 203643, "epoch": 4848} {"train_loss": -7.327079772949219, "global_step": 203644, "epoch": 4848} {"train_loss": -7.184845447540283, "global_step": 203645, "epoch": 4848} {"train_loss": -7.392360687255859, "global_step": 203646, "epoch": 4848} {"train_loss": -7.300247669219971, "global_step": 203647, "epoch": 4848} {"train_loss": -7.31724739074707, "global_step": 203648, "epoch": 4848} {"train_loss": -7.317226886749268, "global_step": 203649, "epoch": 4848} {"train_loss": -7.1852264404296875, "global_step": 203650, "epoch": 4848} {"train_loss": -7.2464823722839355, "global_step": 203651, "epoch": 4848} {"train_loss": -7.337699890136719, "global_step": 203652, "epoch": 4848} {"train_loss": -7.127657413482666, "global_step": 203653, "epoch": 4848} {"train_loss": -7.091371536254883, "global_step": 203654, "epoch": 4848} {"train_loss": -7.148589134216309, "global_step": 203655, "epoch": 4848} {"train_loss": -7.206269264221191, "global_step": 203656, "epoch": 4848} {"train_loss": -7.231717790876116, "global_step": 203657, "epoch": 4848, "val_loss": 69964.5625} {"train_loss": -7.267096519470215, "global_step": 203658, "epoch": 4849} {"train_loss": -7.044439315795898, "global_step": 203659, "epoch": 4849} {"train_loss": -7.177713394165039, "global_step": 203660, "epoch": 4849} {"train_loss": -7.1843156814575195, "global_step": 203661, "epoch": 4849} {"train_loss": -7.076005935668945, "global_step": 203662, "epoch": 4849} {"train_loss": -7.269064903259277, "global_step": 203663, "epoch": 4849} {"train_loss": -7.1224365234375, "global_step": 203664, "epoch": 4849} {"train_loss": -7.146143436431885, "global_step": 203665, "epoch": 4849} {"train_loss": -7.17959451675415, "global_step": 203666, "epoch": 4849} {"train_loss": -7.236208915710449, "global_step": 203667, "epoch": 4849} {"train_loss": -7.244716167449951, "global_step": 203668, "epoch": 4849} {"train_loss": -7.2166748046875, "global_step": 203669, "epoch": 4849} {"train_loss": -7.168452739715576, "global_step": 203670, "epoch": 4849} {"train_loss": -7.319504737854004, "global_step": 203671, "epoch": 4849} {"train_loss": -7.156060695648193, "global_step": 203672, "epoch": 4849} {"train_loss": -7.304310321807861, "global_step": 203673, "epoch": 4849} {"train_loss": -7.3228254318237305, "global_step": 203674, "epoch": 4849} {"train_loss": -7.318365573883057, "global_step": 203675, "epoch": 4849} {"train_loss": -7.19441032409668, "global_step": 203676, "epoch": 4849} {"train_loss": -7.266234397888184, "global_step": 203677, "epoch": 4849} {"train_loss": -7.204061985015869, "global_step": 203678, "epoch": 4849} {"train_loss": -7.378384590148926, "global_step": 203679, "epoch": 4849} {"train_loss": -7.290228843688965, "global_step": 203680, "epoch": 4849} {"train_loss": -7.162958145141602, "global_step": 203681, "epoch": 4849} {"train_loss": -7.138555526733398, "global_step": 203682, "epoch": 4849} {"train_loss": -7.192244529724121, "global_step": 203683, "epoch": 4849} {"train_loss": -7.244588375091553, "global_step": 203684, "epoch": 4849} {"train_loss": -7.319141387939453, "global_step": 203685, "epoch": 4849} {"train_loss": -7.29424524307251, "global_step": 203686, "epoch": 4849} {"train_loss": -7.322571754455566, "global_step": 203687, "epoch": 4849} {"train_loss": -7.323939800262451, "global_step": 203688, "epoch": 4849} {"train_loss": -7.285894393920898, "global_step": 203689, "epoch": 4849} {"train_loss": -7.368529319763184, "global_step": 203690, "epoch": 4849} {"train_loss": -7.304324150085449, "global_step": 203691, "epoch": 4849} {"train_loss": -7.351977348327637, "global_step": 203692, "epoch": 4849} {"train_loss": -7.381492614746094, "global_step": 203693, "epoch": 4849} {"train_loss": -7.415182113647461, "global_step": 203694, "epoch": 4849} {"train_loss": -7.387444496154785, "global_step": 203695, "epoch": 4849} {"train_loss": -7.31639289855957, "global_step": 203696, "epoch": 4849} {"train_loss": -7.362516403198242, "global_step": 203697, "epoch": 4849} {"train_loss": -7.350038528442383, "global_step": 203698, "epoch": 4849} {"train_loss": -7.260840495427449, "global_step": 203699, "epoch": 4849, "val_loss": 69978.1875} {"train_loss": -7.36418342590332, "global_step": 203700, "epoch": 4850} {"train_loss": -7.335002422332764, "global_step": 203701, "epoch": 4850} {"train_loss": -7.341996192932129, "global_step": 203702, "epoch": 4850} {"train_loss": -7.452911376953125, "global_step": 203703, "epoch": 4850} {"train_loss": -7.380892276763916, "global_step": 203704, "epoch": 4850} {"train_loss": -7.353694438934326, "global_step": 203705, "epoch": 4850} {"train_loss": -7.461437702178955, "global_step": 203706, "epoch": 4850} {"train_loss": -7.346880912780762, "global_step": 203707, "epoch": 4850} {"train_loss": -7.423023223876953, "global_step": 203708, "epoch": 4850} {"train_loss": -7.473433494567871, "global_step": 203709, "epoch": 4850} {"train_loss": -7.3629608154296875, "global_step": 203710, "epoch": 4850} {"train_loss": -7.284722328186035, "global_step": 203711, "epoch": 4850} {"train_loss": -7.457181453704834, "global_step": 203712, "epoch": 4850} {"train_loss": -7.412327766418457, "global_step": 203713, "epoch": 4850} {"train_loss": -7.454135894775391, "global_step": 203714, "epoch": 4850} {"train_loss": -7.424091815948486, "global_step": 203715, "epoch": 4850} {"train_loss": -7.383592128753662, "global_step": 203716, "epoch": 4850} {"train_loss": -7.400733947753906, "global_step": 203717, "epoch": 4850} {"train_loss": -7.4104838371276855, "global_step": 203718, "epoch": 4850} {"train_loss": -7.350604057312012, "global_step": 203719, "epoch": 4850} {"train_loss": -7.240841865539551, "global_step": 203720, "epoch": 4850} {"train_loss": -7.289926528930664, "global_step": 203721, "epoch": 4850} {"train_loss": -7.395094871520996, "global_step": 203722, "epoch": 4850} {"train_loss": -7.323876857757568, "global_step": 203723, "epoch": 4850} {"train_loss": -7.265288352966309, "global_step": 203724, "epoch": 4850} {"train_loss": -7.4504194259643555, "global_step": 203725, "epoch": 4850} {"train_loss": -7.264894962310791, "global_step": 203726, "epoch": 4850} {"train_loss": -7.349958419799805, "global_step": 203727, "epoch": 4850} {"train_loss": -7.200592517852783, "global_step": 203728, "epoch": 4850} {"train_loss": -7.129377365112305, "global_step": 203729, "epoch": 4850} {"train_loss": -7.200497150421143, "global_step": 203730, "epoch": 4850} {"train_loss": -7.157763481140137, "global_step": 203731, "epoch": 4850} {"train_loss": -7.3151984214782715, "global_step": 203732, "epoch": 4850} {"train_loss": -7.25412654876709, "global_step": 203733, "epoch": 4850} {"train_loss": -7.3184614181518555, "global_step": 203734, "epoch": 4850} {"train_loss": -7.328252792358398, "global_step": 203735, "epoch": 4850} {"train_loss": -7.195499420166016, "global_step": 203736, "epoch": 4850} {"train_loss": -7.27154541015625, "global_step": 203737, "epoch": 4850} {"train_loss": -7.21124792098999, "global_step": 203738, "epoch": 4850} {"train_loss": -7.227928161621094, "global_step": 203739, "epoch": 4850} {"train_loss": -7.214953422546387, "global_step": 203740, "epoch": 4850} {"train_loss": -7.326004505157471, "global_step": 203741, "epoch": 4850, "train/sim_max_reward_0": 0.19413687381641148, "train/sim_max_reward_1": 0.8927580610356085, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.4618092883147991, "train/sim_max_reward_4": 0.9900436926200363, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4300000": 0.9057611795310235, "test/sim_max_reward_4300001": 0.9880848840888349, "test/sim_max_reward_4300002": 0.9630484341581695, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 1.0, "test/sim_max_reward_4300006": 0.0, "test/sim_max_reward_4300007": 0.9674976788567746, "test/sim_max_reward_4300008": 0.9529478523473907, "test/sim_max_reward_4300009": 0.9114020334746681, "test/sim_max_reward_4300010": 0.0, "test/sim_max_reward_4300011": 0.9190380888341508, "test/sim_max_reward_4300012": 0.9222216051240504, "test/sim_max_reward_4300013": 0.9906007446524484, "test/sim_max_reward_4300014": 0.9658022900879959, "test/sim_max_reward_4300015": 0.871773135126283, "test/sim_max_reward_4300016": 0.9860635196723829, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.3951934324193288, "test/sim_max_reward_4300019": 0.18635989609620357, "test/sim_max_reward_4300020": 0.15369389206998368, "test/sim_max_reward_4300021": 0.7813044612807106, "test/sim_max_reward_4300022": 0.7930793850137684, "test/sim_max_reward_4300023": 0.32639742548257683, "test/sim_max_reward_4300024": 0.5313995907346104, "test/sim_max_reward_4300025": 0.9148087929553813, "test/sim_max_reward_4300026": 0.17243454348235934, "test/sim_max_reward_4300027": 0.7167658236360793, "test/sim_max_reward_4300028": 0.9103091172360612, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.27501152570907456, "test/sim_max_reward_4300031": 0.8787274050082979, "test/sim_max_reward_4300032": 0.9368757555957594, "test/sim_max_reward_4300033": 0.8246050771069279, "test/sim_max_reward_4300034": 0.0, "test/sim_max_reward_4300035": 0.03359141772906101, "test/sim_max_reward_4300036": 0.199194115563479, "test/sim_max_reward_4300037": 0.7098430943704152, "test/sim_max_reward_4300038": 0.9474319151848799, "test/sim_max_reward_4300039": 0.798061560594855, "test/sim_max_reward_4300040": 1.0, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7113286692639246, "test/sim_max_reward_4300043": 0.1143087685226021, "test/sim_max_reward_4300044": 0.05097439889868903, "test/sim_max_reward_4300045": 0.973245306461334, "test/sim_max_reward_4300046": 0.9718999835280423, "test/sim_max_reward_4300047": 0.14189387495808564, "test/sim_max_reward_4300048": 0.003958410926258479, "test/sim_max_reward_4300049": 0.09720487198943008, "train/mean_score": 0.7564579859644759, "test/mean_score": 0.5981995612516328, "val_loss": 70087.2265625} {"train_loss": -7.297545909881592, "global_step": 203742, "epoch": 4851} {"train_loss": -7.341947078704834, "global_step": 203743, "epoch": 4851} {"train_loss": -7.387100696563721, "global_step": 203744, "epoch": 4851} {"train_loss": -7.257364273071289, "global_step": 203745, "epoch": 4851} {"train_loss": -7.303698539733887, "global_step": 203746, "epoch": 4851} {"train_loss": -7.428661823272705, "global_step": 203747, "epoch": 4851} {"train_loss": -7.239645004272461, "global_step": 203748, "epoch": 4851} {"train_loss": -7.272054672241211, "global_step": 203749, "epoch": 4851} {"train_loss": -7.159250259399414, "global_step": 203750, "epoch": 4851} {"train_loss": -7.237730979919434, "global_step": 203751, "epoch": 4851} {"train_loss": -7.233757495880127, "global_step": 203752, "epoch": 4851} {"train_loss": -7.211540222167969, "global_step": 203753, "epoch": 4851} {"train_loss": -7.369324684143066, "global_step": 203754, "epoch": 4851} {"train_loss": -7.201281547546387, "global_step": 203755, "epoch": 4851} {"train_loss": -7.2554497718811035, "global_step": 203756, "epoch": 4851} {"train_loss": -7.192093849182129, "global_step": 203757, "epoch": 4851} {"train_loss": -7.302988529205322, "global_step": 203758, "epoch": 4851} {"train_loss": -7.334072589874268, "global_step": 203759, "epoch": 4851} {"train_loss": -7.281326770782471, "global_step": 203760, "epoch": 4851} {"train_loss": -7.274620056152344, "global_step": 203761, "epoch": 4851} {"train_loss": -7.14283561706543, "global_step": 203762, "epoch": 4851} {"train_loss": -7.2204694747924805, "global_step": 203763, "epoch": 4851} {"train_loss": -7.315784454345703, "global_step": 203764, "epoch": 4851} {"train_loss": -7.276442050933838, "global_step": 203765, "epoch": 4851} {"train_loss": -7.310077667236328, "global_step": 203766, "epoch": 4851} {"train_loss": -7.192905426025391, "global_step": 203767, "epoch": 4851} {"train_loss": -7.303532600402832, "global_step": 203768, "epoch": 4851} {"train_loss": -7.1898274421691895, "global_step": 203769, "epoch": 4851} {"train_loss": -7.104804992675781, "global_step": 203770, "epoch": 4851} {"train_loss": -7.262770652770996, "global_step": 203771, "epoch": 4851} {"train_loss": -7.222060203552246, "global_step": 203772, "epoch": 4851} {"train_loss": -7.1693034172058105, "global_step": 203773, "epoch": 4851} {"train_loss": -7.231822967529297, "global_step": 203774, "epoch": 4851} {"train_loss": -7.1739821434021, "global_step": 203775, "epoch": 4851} {"train_loss": -7.302219390869141, "global_step": 203776, "epoch": 4851} {"train_loss": -7.353475570678711, "global_step": 203777, "epoch": 4851} {"train_loss": -7.312790393829346, "global_step": 203778, "epoch": 4851} {"train_loss": -7.214635848999023, "global_step": 203779, "epoch": 4851} {"train_loss": -7.289386749267578, "global_step": 203780, "epoch": 4851} {"train_loss": -7.241124629974365, "global_step": 203781, "epoch": 4851} {"train_loss": -7.322662830352783, "global_step": 203782, "epoch": 4851} {"train_loss": -7.264196974890573, "global_step": 203783, "epoch": 4851, "val_loss": 69904.7578125} {"train_loss": -7.410662651062012, "global_step": 203784, "epoch": 4852} {"train_loss": -7.349885940551758, "global_step": 203785, "epoch": 4852} {"train_loss": -7.239217758178711, "global_step": 203786, "epoch": 4852} {"train_loss": -7.358709335327148, "global_step": 203787, "epoch": 4852} {"train_loss": -7.199012756347656, "global_step": 203788, "epoch": 4852} {"train_loss": -7.21738338470459, "global_step": 203789, "epoch": 4852} {"train_loss": -7.330972671508789, "global_step": 203790, "epoch": 4852} {"train_loss": -7.322368621826172, "global_step": 203791, "epoch": 4852} {"train_loss": -7.32318115234375, "global_step": 203792, "epoch": 4852} {"train_loss": -7.234601020812988, "global_step": 203793, "epoch": 4852} {"train_loss": -7.298859596252441, "global_step": 203794, "epoch": 4852} {"train_loss": -7.358029365539551, "global_step": 203795, "epoch": 4852} {"train_loss": -7.210384368896484, "global_step": 203796, "epoch": 4852} {"train_loss": -7.3634419441223145, "global_step": 203797, "epoch": 4852} {"train_loss": -7.28145694732666, "global_step": 203798, "epoch": 4852} {"train_loss": -7.31687593460083, "global_step": 203799, "epoch": 4852} {"train_loss": -7.239376068115234, "global_step": 203800, "epoch": 4852} {"train_loss": -7.400511741638184, "global_step": 203801, "epoch": 4852} {"train_loss": -7.266381740570068, "global_step": 203802, "epoch": 4852} {"train_loss": -7.43513298034668, "global_step": 203803, "epoch": 4852} {"train_loss": -7.33370304107666, "global_step": 203804, "epoch": 4852} {"train_loss": -7.2579240798950195, "global_step": 203805, "epoch": 4852} {"train_loss": -7.386586666107178, "global_step": 203806, "epoch": 4852} {"train_loss": -7.258452415466309, "global_step": 203807, "epoch": 4852} {"train_loss": -7.250168800354004, "global_step": 203808, "epoch": 4852} {"train_loss": -7.40095329284668, "global_step": 203809, "epoch": 4852} {"train_loss": -7.2785420417785645, "global_step": 203810, "epoch": 4852} {"train_loss": -7.2761335372924805, "global_step": 203811, "epoch": 4852} {"train_loss": -7.286031723022461, "global_step": 203812, "epoch": 4852} {"train_loss": -7.321314811706543, "global_step": 203813, "epoch": 4852} {"train_loss": -7.389429092407227, "global_step": 203814, "epoch": 4852} {"train_loss": -7.218935012817383, "global_step": 203815, "epoch": 4852} {"train_loss": -7.215390205383301, "global_step": 203816, "epoch": 4852} {"train_loss": -7.279147148132324, "global_step": 203817, "epoch": 4852} {"train_loss": -7.3058600425720215, "global_step": 203818, "epoch": 4852} {"train_loss": -7.268128395080566, "global_step": 203819, "epoch": 4852} {"train_loss": -7.217846870422363, "global_step": 203820, "epoch": 4852} {"train_loss": -7.230278015136719, "global_step": 203821, "epoch": 4852} {"train_loss": -7.3185811042785645, "global_step": 203822, "epoch": 4852} {"train_loss": -7.237399101257324, "global_step": 203823, "epoch": 4852} {"train_loss": -7.281435012817383, "global_step": 203824, "epoch": 4852} {"train_loss": -7.297786099570138, "global_step": 203825, "epoch": 4852, "val_loss": 69937.734375} {"train_loss": -7.403547286987305, "global_step": 203826, "epoch": 4853} {"train_loss": -7.316193580627441, "global_step": 203827, "epoch": 4853} {"train_loss": -7.294232368469238, "global_step": 203828, "epoch": 4853} {"train_loss": -7.306551933288574, "global_step": 203829, "epoch": 4853} {"train_loss": -7.375128746032715, "global_step": 203830, "epoch": 4853} {"train_loss": -7.43856143951416, "global_step": 203831, "epoch": 4853} {"train_loss": -7.380037307739258, "global_step": 203832, "epoch": 4853} {"train_loss": -7.291226863861084, "global_step": 203833, "epoch": 4853} {"train_loss": -7.287285327911377, "global_step": 203834, "epoch": 4853} {"train_loss": -7.354228973388672, "global_step": 203835, "epoch": 4853} {"train_loss": -7.271205902099609, "global_step": 203836, "epoch": 4853} {"train_loss": -7.244666576385498, "global_step": 203837, "epoch": 4853} {"train_loss": -7.354744911193848, "global_step": 203838, "epoch": 4853} {"train_loss": -7.311277866363525, "global_step": 203839, "epoch": 4853} {"train_loss": -7.264911651611328, "global_step": 203840, "epoch": 4853} {"train_loss": -7.357867240905762, "global_step": 203841, "epoch": 4853} {"train_loss": -7.4022216796875, "global_step": 203842, "epoch": 4853} {"train_loss": -7.335780620574951, "global_step": 203843, "epoch": 4853} {"train_loss": -7.31165885925293, "global_step": 203844, "epoch": 4853} {"train_loss": -7.37667989730835, "global_step": 203845, "epoch": 4853} {"train_loss": -7.238345146179199, "global_step": 203846, "epoch": 4853} {"train_loss": -7.2099199295043945, "global_step": 203847, "epoch": 4853} {"train_loss": -7.2794575691223145, "global_step": 203848, "epoch": 4853} {"train_loss": -7.268834114074707, "global_step": 203849, "epoch": 4853} {"train_loss": -7.3688225746154785, "global_step": 203850, "epoch": 4853} {"train_loss": -7.28566837310791, "global_step": 203851, "epoch": 4853} {"train_loss": -7.31634521484375, "global_step": 203852, "epoch": 4853} {"train_loss": -7.349737167358398, "global_step": 203853, "epoch": 4853} {"train_loss": -7.255648612976074, "global_step": 203854, "epoch": 4853} {"train_loss": -7.339568138122559, "global_step": 203855, "epoch": 4853} {"train_loss": -7.362824440002441, "global_step": 203856, "epoch": 4853} {"train_loss": -7.293076515197754, "global_step": 203857, "epoch": 4853} {"train_loss": -7.402123928070068, "global_step": 203858, "epoch": 4853} {"train_loss": -7.280033588409424, "global_step": 203859, "epoch": 4853} {"train_loss": -7.306467056274414, "global_step": 203860, "epoch": 4853} {"train_loss": -7.235738277435303, "global_step": 203861, "epoch": 4853} {"train_loss": -7.245033264160156, "global_step": 203862, "epoch": 4853} {"train_loss": -7.270314693450928, "global_step": 203863, "epoch": 4853} {"train_loss": -7.326406955718994, "global_step": 203864, "epoch": 4853} {"train_loss": -7.155057430267334, "global_step": 203865, "epoch": 4853} {"train_loss": -7.251059055328369, "global_step": 203866, "epoch": 4853} {"train_loss": -7.308446339198521, "global_step": 203867, "epoch": 4853, "val_loss": 70000.8984375} {"train_loss": -7.201963424682617, "global_step": 203868, "epoch": 4854} {"train_loss": -7.295745849609375, "global_step": 203869, "epoch": 4854} {"train_loss": -7.205324172973633, "global_step": 203870, "epoch": 4854} {"train_loss": -7.342445373535156, "global_step": 203871, "epoch": 4854} {"train_loss": -7.23753547668457, "global_step": 203872, "epoch": 4854} {"train_loss": -7.407078742980957, "global_step": 203873, "epoch": 4854} {"train_loss": -7.334693431854248, "global_step": 203874, "epoch": 4854} {"train_loss": -7.181981086730957, "global_step": 203875, "epoch": 4854} {"train_loss": -7.397150039672852, "global_step": 203876, "epoch": 4854} {"train_loss": -7.243806838989258, "global_step": 203877, "epoch": 4854} {"train_loss": -7.292692184448242, "global_step": 203878, "epoch": 4854} {"train_loss": -7.317156791687012, "global_step": 203879, "epoch": 4854} {"train_loss": -7.3740081787109375, "global_step": 203880, "epoch": 4854} {"train_loss": -7.250459671020508, "global_step": 203881, "epoch": 4854} {"train_loss": -7.388280391693115, "global_step": 203882, "epoch": 4854} {"train_loss": -7.268959045410156, "global_step": 203883, "epoch": 4854} {"train_loss": -7.199633598327637, "global_step": 203884, "epoch": 4854} {"train_loss": -7.314985275268555, "global_step": 203885, "epoch": 4854} {"train_loss": -7.30565071105957, "global_step": 203886, "epoch": 4854} {"train_loss": -7.390111923217773, "global_step": 203887, "epoch": 4854} {"train_loss": -7.187450408935547, "global_step": 203888, "epoch": 4854} {"train_loss": -7.288106441497803, "global_step": 203889, "epoch": 4854} {"train_loss": -7.253323554992676, "global_step": 203890, "epoch": 4854} {"train_loss": -7.232158184051514, "global_step": 203891, "epoch": 4854} {"train_loss": -7.342446804046631, "global_step": 203892, "epoch": 4854} {"train_loss": -7.155730724334717, "global_step": 203893, "epoch": 4854} {"train_loss": -7.196141719818115, "global_step": 203894, "epoch": 4854} {"train_loss": -7.161061763763428, "global_step": 203895, "epoch": 4854} {"train_loss": -7.2065277099609375, "global_step": 203896, "epoch": 4854} {"train_loss": -7.306625843048096, "global_step": 203897, "epoch": 4854} {"train_loss": -7.208260536193848, "global_step": 203898, "epoch": 4854} {"train_loss": -7.342370986938477, "global_step": 203899, "epoch": 4854} {"train_loss": -7.1533074378967285, "global_step": 203900, "epoch": 4854} {"train_loss": -7.1952433586120605, "global_step": 203901, "epoch": 4854} {"train_loss": -7.145597457885742, "global_step": 203902, "epoch": 4854} {"train_loss": -7.231122016906738, "global_step": 203903, "epoch": 4854} {"train_loss": -7.263105392456055, "global_step": 203904, "epoch": 4854} {"train_loss": -7.224269866943359, "global_step": 203905, "epoch": 4854} {"train_loss": -7.299175262451172, "global_step": 203906, "epoch": 4854} {"train_loss": -7.243063926696777, "global_step": 203907, "epoch": 4854} {"train_loss": -7.255362510681152, "global_step": 203908, "epoch": 4854} {"train_loss": -7.263888767787388, "global_step": 203909, "epoch": 4854, "val_loss": 69801.4921875} {"train_loss": -7.277528285980225, "global_step": 203910, "epoch": 4855} {"train_loss": -7.413763046264648, "global_step": 203911, "epoch": 4855} {"train_loss": -7.312307357788086, "global_step": 203912, "epoch": 4855} {"train_loss": -7.188516139984131, "global_step": 203913, "epoch": 4855} {"train_loss": -7.333152770996094, "global_step": 203914, "epoch": 4855} {"train_loss": -7.2205681800842285, "global_step": 203915, "epoch": 4855} {"train_loss": -7.239117622375488, "global_step": 203916, "epoch": 4855} {"train_loss": -7.252054214477539, "global_step": 203917, "epoch": 4855} {"train_loss": -7.213156700134277, "global_step": 203918, "epoch": 4855} {"train_loss": -7.273651123046875, "global_step": 203919, "epoch": 4855} {"train_loss": -7.274142265319824, "global_step": 203920, "epoch": 4855} {"train_loss": -7.297920227050781, "global_step": 203921, "epoch": 4855} {"train_loss": -7.179203987121582, "global_step": 203922, "epoch": 4855} {"train_loss": -7.268980503082275, "global_step": 203923, "epoch": 4855} {"train_loss": -7.237122535705566, "global_step": 203924, "epoch": 4855} {"train_loss": -7.06397819519043, "global_step": 203925, "epoch": 4855} {"train_loss": -7.104065418243408, "global_step": 203926, "epoch": 4855} {"train_loss": -7.256425380706787, "global_step": 203927, "epoch": 4855} {"train_loss": -7.099811553955078, "global_step": 203928, "epoch": 4855} {"train_loss": -7.203034400939941, "global_step": 203929, "epoch": 4855} {"train_loss": -7.183877944946289, "global_step": 203930, "epoch": 4855} {"train_loss": -6.996002197265625, "global_step": 203931, "epoch": 4855} {"train_loss": -7.075444221496582, "global_step": 203932, "epoch": 4855} {"train_loss": -7.106610298156738, "global_step": 203933, "epoch": 4855} {"train_loss": -7.216159343719482, "global_step": 203934, "epoch": 4855} {"train_loss": -7.136683464050293, "global_step": 203935, "epoch": 4855} {"train_loss": -7.297870635986328, "global_step": 203936, "epoch": 4855} {"train_loss": -7.081624984741211, "global_step": 203937, "epoch": 4855} {"train_loss": -7.187790870666504, "global_step": 203938, "epoch": 4855} {"train_loss": -7.277670860290527, "global_step": 203939, "epoch": 4855} {"train_loss": -7.086647033691406, "global_step": 203940, "epoch": 4855} {"train_loss": -7.207558631896973, "global_step": 203941, "epoch": 4855} {"train_loss": -7.211865425109863, "global_step": 203942, "epoch": 4855} {"train_loss": -7.273955345153809, "global_step": 203943, "epoch": 4855} {"train_loss": -7.12969970703125, "global_step": 203944, "epoch": 4855} {"train_loss": -7.245030403137207, "global_step": 203945, "epoch": 4855} {"train_loss": -7.324560165405273, "global_step": 203946, "epoch": 4855} {"train_loss": -7.269564151763916, "global_step": 203947, "epoch": 4855} {"train_loss": -7.220238208770752, "global_step": 203948, "epoch": 4855} {"train_loss": -7.271535873413086, "global_step": 203949, "epoch": 4855} {"train_loss": -7.255393028259277, "global_step": 203950, "epoch": 4855} {"train_loss": -7.214932668776739, "global_step": 203951, "epoch": 4855, "val_loss": 69875.734375} {"train_loss": -7.262312889099121, "global_step": 203952, "epoch": 4856} {"train_loss": -7.252252578735352, "global_step": 203953, "epoch": 4856} {"train_loss": -7.370068550109863, "global_step": 203954, "epoch": 4856} {"train_loss": -7.433283805847168, "global_step": 203955, "epoch": 4856} {"train_loss": -7.396590232849121, "global_step": 203956, "epoch": 4856} {"train_loss": -7.300912857055664, "global_step": 203957, "epoch": 4856} {"train_loss": -7.295831680297852, "global_step": 203958, "epoch": 4856} {"train_loss": -7.29033088684082, "global_step": 203959, "epoch": 4856} {"train_loss": -7.466339588165283, "global_step": 203960, "epoch": 4856} {"train_loss": -7.466578483581543, "global_step": 203961, "epoch": 4856} {"train_loss": -7.342958450317383, "global_step": 203962, "epoch": 4856} {"train_loss": -7.283656120300293, "global_step": 203963, "epoch": 4856} {"train_loss": -7.327712059020996, "global_step": 203964, "epoch": 4856} {"train_loss": -7.268342018127441, "global_step": 203965, "epoch": 4856} {"train_loss": -7.36070442199707, "global_step": 203966, "epoch": 4856} {"train_loss": -7.401185035705566, "global_step": 203967, "epoch": 4856} {"train_loss": -7.393674850463867, "global_step": 203968, "epoch": 4856} {"train_loss": -7.366572380065918, "global_step": 203969, "epoch": 4856} {"train_loss": -7.291386604309082, "global_step": 203970, "epoch": 4856} {"train_loss": -7.4030585289001465, "global_step": 203971, "epoch": 4856} {"train_loss": -7.393160820007324, "global_step": 203972, "epoch": 4856} {"train_loss": -7.382246017456055, "global_step": 203973, "epoch": 4856} {"train_loss": -7.438262939453125, "global_step": 203974, "epoch": 4856} {"train_loss": -7.416797161102295, "global_step": 203975, "epoch": 4856} {"train_loss": -7.411559581756592, "global_step": 203976, "epoch": 4856} {"train_loss": -7.391997814178467, "global_step": 203977, "epoch": 4856} {"train_loss": -7.480656623840332, "global_step": 203978, "epoch": 4856} {"train_loss": -7.347225666046143, "global_step": 203979, "epoch": 4856} {"train_loss": -7.3537092208862305, "global_step": 203980, "epoch": 4856} {"train_loss": -7.3066864013671875, "global_step": 203981, "epoch": 4856} {"train_loss": -7.303679466247559, "global_step": 203982, "epoch": 4856} {"train_loss": -7.403480529785156, "global_step": 203983, "epoch": 4856} {"train_loss": -7.293567180633545, "global_step": 203984, "epoch": 4856} {"train_loss": -7.438117027282715, "global_step": 203985, "epoch": 4856} {"train_loss": -7.35877799987793, "global_step": 203986, "epoch": 4856} {"train_loss": -7.359525680541992, "global_step": 203987, "epoch": 4856} {"train_loss": -7.329683780670166, "global_step": 203988, "epoch": 4856} {"train_loss": -7.4064555168151855, "global_step": 203989, "epoch": 4856} {"train_loss": -7.351343154907227, "global_step": 203990, "epoch": 4856} {"train_loss": -7.380050182342529, "global_step": 203991, "epoch": 4856} {"train_loss": -7.388585567474365, "global_step": 203992, "epoch": 4856} {"train_loss": -7.364383073080154, "global_step": 203993, "epoch": 4856, "val_loss": 69878.390625} {"train_loss": -7.4408745765686035, "global_step": 203994, "epoch": 4857} {"train_loss": -7.428747653961182, "global_step": 203995, "epoch": 4857} {"train_loss": -7.243157863616943, "global_step": 203996, "epoch": 4857} {"train_loss": -7.34269380569458, "global_step": 203997, "epoch": 4857} {"train_loss": -7.404244899749756, "global_step": 203998, "epoch": 4857} {"train_loss": -7.426348686218262, "global_step": 203999, "epoch": 4857} {"train_loss": -7.3694167137146, "global_step": 204000, "epoch": 4857} {"train_loss": -7.2485456466674805, "global_step": 204001, "epoch": 4857} {"train_loss": -7.299590587615967, "global_step": 204002, "epoch": 4857} {"train_loss": -7.254626274108887, "global_step": 204003, "epoch": 4857} {"train_loss": -7.162694931030273, "global_step": 204004, "epoch": 4857} {"train_loss": -7.367132186889648, "global_step": 204005, "epoch": 4857} {"train_loss": -7.277435302734375, "global_step": 204006, "epoch": 4857} {"train_loss": -7.253313064575195, "global_step": 204007, "epoch": 4857} {"train_loss": -7.356380939483643, "global_step": 204008, "epoch": 4857} {"train_loss": -7.4199419021606445, "global_step": 204009, "epoch": 4857} {"train_loss": -7.403944969177246, "global_step": 204010, "epoch": 4857} {"train_loss": -7.306431770324707, "global_step": 204011, "epoch": 4857} {"train_loss": -7.314736366271973, "global_step": 204012, "epoch": 4857} {"train_loss": -7.102963447570801, "global_step": 204013, "epoch": 4857} {"train_loss": -7.416794776916504, "global_step": 204014, "epoch": 4857} {"train_loss": -7.2825517654418945, "global_step": 204015, "epoch": 4857} {"train_loss": -7.147372245788574, "global_step": 204016, "epoch": 4857} {"train_loss": -7.346203804016113, "global_step": 204017, "epoch": 4857} {"train_loss": -7.1383957862854, "global_step": 204018, "epoch": 4857} {"train_loss": -7.276289463043213, "global_step": 204019, "epoch": 4857} {"train_loss": -7.176865577697754, "global_step": 204020, "epoch": 4857} {"train_loss": -7.094837665557861, "global_step": 204021, "epoch": 4857} {"train_loss": -7.2648138999938965, "global_step": 204022, "epoch": 4857} {"train_loss": -7.1749773025512695, "global_step": 204023, "epoch": 4857} {"train_loss": -7.228570938110352, "global_step": 204024, "epoch": 4857} {"train_loss": -7.193915367126465, "global_step": 204025, "epoch": 4857} {"train_loss": -7.345073699951172, "global_step": 204026, "epoch": 4857} {"train_loss": -7.3056535720825195, "global_step": 204027, "epoch": 4857} {"train_loss": -7.185962677001953, "global_step": 204028, "epoch": 4857} {"train_loss": -7.191363334655762, "global_step": 204029, "epoch": 4857} {"train_loss": -7.2565016746521, "global_step": 204030, "epoch": 4857} {"train_loss": -7.181812763214111, "global_step": 204031, "epoch": 4857} {"train_loss": -7.154707908630371, "global_step": 204032, "epoch": 4857} {"train_loss": -7.238162040710449, "global_step": 204033, "epoch": 4857} {"train_loss": -7.268886566162109, "global_step": 204034, "epoch": 4857} {"train_loss": -7.27186598096575, "global_step": 204035, "epoch": 4857, "val_loss": 69990.8671875} {"train_loss": -7.239934921264648, "global_step": 204036, "epoch": 4858} {"train_loss": -7.178142547607422, "global_step": 204037, "epoch": 4858} {"train_loss": -7.212301254272461, "global_step": 204038, "epoch": 4858} {"train_loss": -7.180620193481445, "global_step": 204039, "epoch": 4858} {"train_loss": -7.104419708251953, "global_step": 204040, "epoch": 4858} {"train_loss": -7.139829635620117, "global_step": 204041, "epoch": 4858} {"train_loss": -7.275257587432861, "global_step": 204042, "epoch": 4858} {"train_loss": -7.29685115814209, "global_step": 204043, "epoch": 4858} {"train_loss": -7.138185977935791, "global_step": 204044, "epoch": 4858} {"train_loss": -7.312550067901611, "global_step": 204045, "epoch": 4858} {"train_loss": -7.203061103820801, "global_step": 204046, "epoch": 4858} {"train_loss": -7.163844585418701, "global_step": 204047, "epoch": 4858} {"train_loss": -7.261112213134766, "global_step": 204048, "epoch": 4858} {"train_loss": -7.227275848388672, "global_step": 204049, "epoch": 4858} {"train_loss": -7.279300689697266, "global_step": 204050, "epoch": 4858} {"train_loss": -7.111079216003418, "global_step": 204051, "epoch": 4858} {"train_loss": -7.3499956130981445, "global_step": 204052, "epoch": 4858} {"train_loss": -7.195791244506836, "global_step": 204053, "epoch": 4858} {"train_loss": -7.129061698913574, "global_step": 204054, "epoch": 4858} {"train_loss": -7.237162113189697, "global_step": 204055, "epoch": 4858} {"train_loss": -7.029110908508301, "global_step": 204056, "epoch": 4858} {"train_loss": -7.226114749908447, "global_step": 204057, "epoch": 4858} {"train_loss": -7.104721546173096, "global_step": 204058, "epoch": 4858} {"train_loss": -7.1144256591796875, "global_step": 204059, "epoch": 4858} {"train_loss": -7.159327507019043, "global_step": 204060, "epoch": 4858} {"train_loss": -7.187834739685059, "global_step": 204061, "epoch": 4858} {"train_loss": -7.157980442047119, "global_step": 204062, "epoch": 4858} {"train_loss": -7.235300540924072, "global_step": 204063, "epoch": 4858} {"train_loss": -7.212457656860352, "global_step": 204064, "epoch": 4858} {"train_loss": -7.216635704040527, "global_step": 204065, "epoch": 4858} {"train_loss": -7.177093029022217, "global_step": 204066, "epoch": 4858} {"train_loss": -7.29913330078125, "global_step": 204067, "epoch": 4858} {"train_loss": -7.124591827392578, "global_step": 204068, "epoch": 4858} {"train_loss": -7.241135597229004, "global_step": 204069, "epoch": 4858} {"train_loss": -7.2822065353393555, "global_step": 204070, "epoch": 4858} {"train_loss": -7.196800708770752, "global_step": 204071, "epoch": 4858} {"train_loss": -7.2729291915893555, "global_step": 204072, "epoch": 4858} {"train_loss": -7.3449578285217285, "global_step": 204073, "epoch": 4858} {"train_loss": -7.293536186218262, "global_step": 204074, "epoch": 4858} {"train_loss": -7.296940326690674, "global_step": 204075, "epoch": 4858} {"train_loss": -7.350167751312256, "global_step": 204076, "epoch": 4858} {"train_loss": -7.212624833697364, "global_step": 204077, "epoch": 4858, "val_loss": 69891.078125} {"train_loss": -7.259006023406982, "global_step": 204078, "epoch": 4859} {"train_loss": -7.143891334533691, "global_step": 204079, "epoch": 4859} {"train_loss": -7.299118995666504, "global_step": 204080, "epoch": 4859} {"train_loss": -7.3093061447143555, "global_step": 204081, "epoch": 4859} {"train_loss": -7.334802627563477, "global_step": 204082, "epoch": 4859} {"train_loss": -7.315040588378906, "global_step": 204083, "epoch": 4859} {"train_loss": -7.307887077331543, "global_step": 204084, "epoch": 4859} {"train_loss": -7.371459484100342, "global_step": 204085, "epoch": 4859} {"train_loss": -7.297206878662109, "global_step": 204086, "epoch": 4859} {"train_loss": -7.29721736907959, "global_step": 204087, "epoch": 4859} {"train_loss": -7.26462459564209, "global_step": 204088, "epoch": 4859} {"train_loss": -7.313779830932617, "global_step": 204089, "epoch": 4859} {"train_loss": -7.333699703216553, "global_step": 204090, "epoch": 4859} {"train_loss": -7.3966875076293945, "global_step": 204091, "epoch": 4859} {"train_loss": -7.339786529541016, "global_step": 204092, "epoch": 4859} {"train_loss": -7.32508659362793, "global_step": 204093, "epoch": 4859} {"train_loss": -7.295177459716797, "global_step": 204094, "epoch": 4859} {"train_loss": -7.332777500152588, "global_step": 204095, "epoch": 4859} {"train_loss": -7.388819694519043, "global_step": 204096, "epoch": 4859} {"train_loss": -7.359743118286133, "global_step": 204097, "epoch": 4859} {"train_loss": -7.2467193603515625, "global_step": 204098, "epoch": 4859} {"train_loss": -7.301453113555908, "global_step": 204099, "epoch": 4859} {"train_loss": -7.377909183502197, "global_step": 204100, "epoch": 4859} {"train_loss": -7.353070259094238, "global_step": 204101, "epoch": 4859} {"train_loss": -7.372429847717285, "global_step": 204102, "epoch": 4859} {"train_loss": -7.354180812835693, "global_step": 204103, "epoch": 4859} {"train_loss": -7.348608016967773, "global_step": 204104, "epoch": 4859} {"train_loss": -7.224266052246094, "global_step": 204105, "epoch": 4859} {"train_loss": -7.344921588897705, "global_step": 204106, "epoch": 4859} {"train_loss": -7.254021644592285, "global_step": 204107, "epoch": 4859} {"train_loss": -7.348546028137207, "global_step": 204108, "epoch": 4859} {"train_loss": -7.356340408325195, "global_step": 204109, "epoch": 4859} {"train_loss": -7.2986040115356445, "global_step": 204110, "epoch": 4859} {"train_loss": -7.346508502960205, "global_step": 204111, "epoch": 4859} {"train_loss": -7.341821670532227, "global_step": 204112, "epoch": 4859} {"train_loss": -7.459715843200684, "global_step": 204113, "epoch": 4859} {"train_loss": -7.315354347229004, "global_step": 204114, "epoch": 4859} {"train_loss": -7.366676330566406, "global_step": 204115, "epoch": 4859} {"train_loss": -7.382437705993652, "global_step": 204116, "epoch": 4859} {"train_loss": -7.3556952476501465, "global_step": 204117, "epoch": 4859} {"train_loss": -7.242184162139893, "global_step": 204118, "epoch": 4859} {"train_loss": -7.323001214436123, "global_step": 204119, "epoch": 4859, "val_loss": 69827.421875} {"train_loss": -7.272867679595947, "global_step": 204120, "epoch": 4860} {"train_loss": -7.355162620544434, "global_step": 204121, "epoch": 4860} {"train_loss": -7.164485454559326, "global_step": 204122, "epoch": 4860} {"train_loss": -7.123692512512207, "global_step": 204123, "epoch": 4860} {"train_loss": -7.280396461486816, "global_step": 204124, "epoch": 4860} {"train_loss": -7.172911643981934, "global_step": 204125, "epoch": 4860} {"train_loss": -7.200976371765137, "global_step": 204126, "epoch": 4860} {"train_loss": -7.334898948669434, "global_step": 204127, "epoch": 4860} {"train_loss": -7.1363983154296875, "global_step": 204128, "epoch": 4860} {"train_loss": -7.21174430847168, "global_step": 204129, "epoch": 4860} {"train_loss": -7.3374762535095215, "global_step": 204130, "epoch": 4860} {"train_loss": -7.185332298278809, "global_step": 204131, "epoch": 4860} {"train_loss": -7.324065208435059, "global_step": 204132, "epoch": 4860} {"train_loss": -7.263089179992676, "global_step": 204133, "epoch": 4860} {"train_loss": -7.250970363616943, "global_step": 204134, "epoch": 4860} {"train_loss": -7.370586395263672, "global_step": 204135, "epoch": 4860} {"train_loss": -7.218165874481201, "global_step": 204136, "epoch": 4860} {"train_loss": -7.265606880187988, "global_step": 204137, "epoch": 4860} {"train_loss": -7.355173587799072, "global_step": 204138, "epoch": 4860} {"train_loss": -7.204448699951172, "global_step": 204139, "epoch": 4860} {"train_loss": -7.271861553192139, "global_step": 204140, "epoch": 4860} {"train_loss": -7.312638282775879, "global_step": 204141, "epoch": 4860} {"train_loss": -7.340033531188965, "global_step": 204142, "epoch": 4860} {"train_loss": -7.392941951751709, "global_step": 204143, "epoch": 4860} {"train_loss": -7.246119499206543, "global_step": 204144, "epoch": 4860} {"train_loss": -7.317685127258301, "global_step": 204145, "epoch": 4860} {"train_loss": -7.302094459533691, "global_step": 204146, "epoch": 4860} {"train_loss": -7.311910629272461, "global_step": 204147, "epoch": 4860} {"train_loss": -7.271859169006348, "global_step": 204148, "epoch": 4860} {"train_loss": -7.221211910247803, "global_step": 204149, "epoch": 4860} {"train_loss": -7.381834983825684, "global_step": 204150, "epoch": 4860} {"train_loss": -7.3156328201293945, "global_step": 204151, "epoch": 4860} {"train_loss": -7.225378036499023, "global_step": 204152, "epoch": 4860} {"train_loss": -7.235202312469482, "global_step": 204153, "epoch": 4860} {"train_loss": -7.348587512969971, "global_step": 204154, "epoch": 4860} {"train_loss": -7.273723602294922, "global_step": 204155, "epoch": 4860} {"train_loss": -7.3815693855285645, "global_step": 204156, "epoch": 4860} {"train_loss": -7.301969051361084, "global_step": 204157, "epoch": 4860} {"train_loss": -7.3284807205200195, "global_step": 204158, "epoch": 4860} {"train_loss": -7.30497407913208, "global_step": 204159, "epoch": 4860} {"train_loss": -7.343491554260254, "global_step": 204160, "epoch": 4860} {"train_loss": -7.279283228374663, "global_step": 204161, "epoch": 4860, "val_loss": 69898.5625} {"train_loss": -7.346784591674805, "global_step": 204162, "epoch": 4861} {"train_loss": -7.396798133850098, "global_step": 204163, "epoch": 4861} {"train_loss": -7.2199177742004395, "global_step": 204164, "epoch": 4861} {"train_loss": -7.217949390411377, "global_step": 204165, "epoch": 4861} {"train_loss": -7.307570457458496, "global_step": 204166, "epoch": 4861} {"train_loss": -7.286665439605713, "global_step": 204167, "epoch": 4861} {"train_loss": -7.279252052307129, "global_step": 204168, "epoch": 4861} {"train_loss": -7.3452606201171875, "global_step": 204169, "epoch": 4861} {"train_loss": -7.3518171310424805, "global_step": 204170, "epoch": 4861} {"train_loss": -7.1699724197387695, "global_step": 204171, "epoch": 4861} {"train_loss": -7.276007652282715, "global_step": 204172, "epoch": 4861} {"train_loss": -7.252726078033447, "global_step": 204173, "epoch": 4861} {"train_loss": -7.274304389953613, "global_step": 204174, "epoch": 4861} {"train_loss": -7.3983259201049805, "global_step": 204175, "epoch": 4861} {"train_loss": -7.121481895446777, "global_step": 204176, "epoch": 4861} {"train_loss": -7.347965240478516, "global_step": 204177, "epoch": 4861} {"train_loss": -7.3876848220825195, "global_step": 204178, "epoch": 4861} {"train_loss": -7.294280052185059, "global_step": 204179, "epoch": 4861} {"train_loss": -7.325039386749268, "global_step": 204180, "epoch": 4861} {"train_loss": -7.25600528717041, "global_step": 204181, "epoch": 4861} {"train_loss": -7.297252178192139, "global_step": 204182, "epoch": 4861} {"train_loss": -7.141823768615723, "global_step": 204183, "epoch": 4861} {"train_loss": -7.300865650177002, "global_step": 204184, "epoch": 4861} {"train_loss": -7.2905168533325195, "global_step": 204185, "epoch": 4861} {"train_loss": -7.221597671508789, "global_step": 204186, "epoch": 4861} {"train_loss": -7.282470226287842, "global_step": 204187, "epoch": 4861} {"train_loss": -7.266293525695801, "global_step": 204188, "epoch": 4861} {"train_loss": -7.2896013259887695, "global_step": 204189, "epoch": 4861} {"train_loss": -7.1343889236450195, "global_step": 204190, "epoch": 4861} {"train_loss": -7.240753650665283, "global_step": 204191, "epoch": 4861} {"train_loss": -7.235713005065918, "global_step": 204192, "epoch": 4861} {"train_loss": -7.2793498039245605, "global_step": 204193, "epoch": 4861} {"train_loss": -7.218625068664551, "global_step": 204194, "epoch": 4861} {"train_loss": -7.3292317390441895, "global_step": 204195, "epoch": 4861} {"train_loss": -7.332723140716553, "global_step": 204196, "epoch": 4861} {"train_loss": -7.358031272888184, "global_step": 204197, "epoch": 4861} {"train_loss": -7.282486915588379, "global_step": 204198, "epoch": 4861} {"train_loss": -7.361756324768066, "global_step": 204199, "epoch": 4861} {"train_loss": -7.225184440612793, "global_step": 204200, "epoch": 4861} {"train_loss": -7.307033538818359, "global_step": 204201, "epoch": 4861} {"train_loss": -7.340662479400635, "global_step": 204202, "epoch": 4861} {"train_loss": -7.286183436711629, "global_step": 204203, "epoch": 4861, "val_loss": 70061.2109375} {"train_loss": -7.361135005950928, "global_step": 204204, "epoch": 4862} {"train_loss": -7.359714508056641, "global_step": 204205, "epoch": 4862} {"train_loss": -7.3464508056640625, "global_step": 204206, "epoch": 4862} {"train_loss": -7.383857250213623, "global_step": 204207, "epoch": 4862} {"train_loss": -7.317792892456055, "global_step": 204208, "epoch": 4862} {"train_loss": -7.338521480560303, "global_step": 204209, "epoch": 4862} {"train_loss": -7.30518913269043, "global_step": 204210, "epoch": 4862} {"train_loss": -7.32358980178833, "global_step": 204211, "epoch": 4862} {"train_loss": -7.265694618225098, "global_step": 204212, "epoch": 4862} {"train_loss": -7.336621284484863, "global_step": 204213, "epoch": 4862} {"train_loss": -7.287172794342041, "global_step": 204214, "epoch": 4862} {"train_loss": -7.377895832061768, "global_step": 204215, "epoch": 4862} {"train_loss": -7.330666542053223, "global_step": 204216, "epoch": 4862} {"train_loss": -7.316749572753906, "global_step": 204217, "epoch": 4862} {"train_loss": -7.3447585105896, "global_step": 204218, "epoch": 4862} {"train_loss": -7.258221626281738, "global_step": 204219, "epoch": 4862} {"train_loss": -7.2922282218933105, "global_step": 204220, "epoch": 4862} {"train_loss": -7.340914726257324, "global_step": 204221, "epoch": 4862} {"train_loss": -7.2684712409973145, "global_step": 204222, "epoch": 4862} {"train_loss": -7.280738830566406, "global_step": 204223, "epoch": 4862} {"train_loss": -7.241072177886963, "global_step": 204224, "epoch": 4862} {"train_loss": -7.492205619812012, "global_step": 204225, "epoch": 4862} {"train_loss": -7.289501667022705, "global_step": 204226, "epoch": 4862} {"train_loss": -7.3342485427856445, "global_step": 204227, "epoch": 4862} {"train_loss": -7.227025985717773, "global_step": 204228, "epoch": 4862} {"train_loss": -7.354550361633301, "global_step": 204229, "epoch": 4862} {"train_loss": -7.29617977142334, "global_step": 204230, "epoch": 4862} {"train_loss": -7.263436317443848, "global_step": 204231, "epoch": 4862} {"train_loss": -7.258335113525391, "global_step": 204232, "epoch": 4862} {"train_loss": -7.352210998535156, "global_step": 204233, "epoch": 4862} {"train_loss": -7.35776424407959, "global_step": 204234, "epoch": 4862} {"train_loss": -7.283661842346191, "global_step": 204235, "epoch": 4862} {"train_loss": -7.251625061035156, "global_step": 204236, "epoch": 4862} {"train_loss": -7.270289897918701, "global_step": 204237, "epoch": 4862} {"train_loss": -7.272721290588379, "global_step": 204238, "epoch": 4862} {"train_loss": -7.218402862548828, "global_step": 204239, "epoch": 4862} {"train_loss": -7.323144912719727, "global_step": 204240, "epoch": 4862} {"train_loss": -7.24700927734375, "global_step": 204241, "epoch": 4862} {"train_loss": -7.45662784576416, "global_step": 204242, "epoch": 4862} {"train_loss": -7.261149883270264, "global_step": 204243, "epoch": 4862} {"train_loss": -7.273970127105713, "global_step": 204244, "epoch": 4862} {"train_loss": -7.311667533147903, "global_step": 204245, "epoch": 4862, "val_loss": 69935.6015625} {"train_loss": -7.465301036834717, "global_step": 204246, "epoch": 4863} {"train_loss": -7.336102485656738, "global_step": 204247, "epoch": 4863} {"train_loss": -7.332798480987549, "global_step": 204248, "epoch": 4863} {"train_loss": -7.297341346740723, "global_step": 204249, "epoch": 4863} {"train_loss": -7.286670207977295, "global_step": 204250, "epoch": 4863} {"train_loss": -7.16616153717041, "global_step": 204251, "epoch": 4863} {"train_loss": -7.003771781921387, "global_step": 204252, "epoch": 4863} {"train_loss": -7.207048416137695, "global_step": 204253, "epoch": 4863} {"train_loss": -7.201019763946533, "global_step": 204254, "epoch": 4863} {"train_loss": -7.135858535766602, "global_step": 204255, "epoch": 4863} {"train_loss": -7.149957656860352, "global_step": 204256, "epoch": 4863} {"train_loss": -7.1354827880859375, "global_step": 204257, "epoch": 4863} {"train_loss": -7.143070220947266, "global_step": 204258, "epoch": 4863} {"train_loss": -7.165895462036133, "global_step": 204259, "epoch": 4863} {"train_loss": -7.095908164978027, "global_step": 204260, "epoch": 4863} {"train_loss": -7.176102638244629, "global_step": 204261, "epoch": 4863} {"train_loss": -6.9713544845581055, "global_step": 204262, "epoch": 4863} {"train_loss": -7.165416717529297, "global_step": 204263, "epoch": 4863} {"train_loss": -7.153012275695801, "global_step": 204264, "epoch": 4863} {"train_loss": -7.170525074005127, "global_step": 204265, "epoch": 4863} {"train_loss": -7.228625297546387, "global_step": 204266, "epoch": 4863} {"train_loss": -7.091609477996826, "global_step": 204267, "epoch": 4863} {"train_loss": -7.194648742675781, "global_step": 204268, "epoch": 4863} {"train_loss": -7.197035312652588, "global_step": 204269, "epoch": 4863} {"train_loss": -7.266228199005127, "global_step": 204270, "epoch": 4863} {"train_loss": -7.233698844909668, "global_step": 204271, "epoch": 4863} {"train_loss": -7.214943885803223, "global_step": 204272, "epoch": 4863} {"train_loss": -7.185528755187988, "global_step": 204273, "epoch": 4863} {"train_loss": -7.214226722717285, "global_step": 204274, "epoch": 4863} {"train_loss": -7.255448341369629, "global_step": 204275, "epoch": 4863} {"train_loss": -7.267751216888428, "global_step": 204276, "epoch": 4863} {"train_loss": -7.2970170974731445, "global_step": 204277, "epoch": 4863} {"train_loss": -7.24050235748291, "global_step": 204278, "epoch": 4863} {"train_loss": -7.157352447509766, "global_step": 204279, "epoch": 4863} {"train_loss": -7.265189170837402, "global_step": 204280, "epoch": 4863} {"train_loss": -7.217862606048584, "global_step": 204281, "epoch": 4863} {"train_loss": -7.304140090942383, "global_step": 204282, "epoch": 4863} {"train_loss": -7.266024112701416, "global_step": 204283, "epoch": 4863} {"train_loss": -7.342644691467285, "global_step": 204284, "epoch": 4863} {"train_loss": -7.203094005584717, "global_step": 204285, "epoch": 4863} {"train_loss": -7.3085432052612305, "global_step": 204286, "epoch": 4863} {"train_loss": -7.214948824473789, "global_step": 204287, "epoch": 4863, "val_loss": 69894.8125} {"train_loss": -7.314866065979004, "global_step": 204288, "epoch": 4864} {"train_loss": -7.268767356872559, "global_step": 204289, "epoch": 4864} {"train_loss": -7.2445526123046875, "global_step": 204290, "epoch": 4864} {"train_loss": -7.379899978637695, "global_step": 204291, "epoch": 4864} {"train_loss": -7.320262908935547, "global_step": 204292, "epoch": 4864} {"train_loss": -7.372455596923828, "global_step": 204293, "epoch": 4864} {"train_loss": -7.3203582763671875, "global_step": 204294, "epoch": 4864} {"train_loss": -7.290195941925049, "global_step": 204295, "epoch": 4864} {"train_loss": -7.399599075317383, "global_step": 204296, "epoch": 4864} {"train_loss": -7.302071571350098, "global_step": 204297, "epoch": 4864} {"train_loss": -7.312928676605225, "global_step": 204298, "epoch": 4864} {"train_loss": -7.3368916511535645, "global_step": 204299, "epoch": 4864} {"train_loss": -7.339615821838379, "global_step": 204300, "epoch": 4864} {"train_loss": -7.394170761108398, "global_step": 204301, "epoch": 4864} {"train_loss": -7.406911849975586, "global_step": 204302, "epoch": 4864} {"train_loss": -7.306612968444824, "global_step": 204303, "epoch": 4864} {"train_loss": -7.424843788146973, "global_step": 204304, "epoch": 4864} {"train_loss": -7.235584735870361, "global_step": 204305, "epoch": 4864} {"train_loss": -7.303199768066406, "global_step": 204306, "epoch": 4864} {"train_loss": -7.362298965454102, "global_step": 204307, "epoch": 4864} {"train_loss": -7.243762969970703, "global_step": 204308, "epoch": 4864} {"train_loss": -7.3534040451049805, "global_step": 204309, "epoch": 4864} {"train_loss": -7.215453624725342, "global_step": 204310, "epoch": 4864} {"train_loss": -7.253798484802246, "global_step": 204311, "epoch": 4864} {"train_loss": -7.363964080810547, "global_step": 204312, "epoch": 4864} {"train_loss": -7.339590072631836, "global_step": 204313, "epoch": 4864} {"train_loss": -7.3657026290893555, "global_step": 204314, "epoch": 4864} {"train_loss": -7.278289318084717, "global_step": 204315, "epoch": 4864} {"train_loss": -7.444052696228027, "global_step": 204316, "epoch": 4864} {"train_loss": -7.3001909255981445, "global_step": 204317, "epoch": 4864} {"train_loss": -7.421909332275391, "global_step": 204318, "epoch": 4864} {"train_loss": -7.368025302886963, "global_step": 204319, "epoch": 4864} {"train_loss": -7.255309581756592, "global_step": 204320, "epoch": 4864} {"train_loss": -7.292388916015625, "global_step": 204321, "epoch": 4864} {"train_loss": -7.313337326049805, "global_step": 204322, "epoch": 4864} {"train_loss": -7.256217002868652, "global_step": 204323, "epoch": 4864} {"train_loss": -7.230312347412109, "global_step": 204324, "epoch": 4864} {"train_loss": -7.241571426391602, "global_step": 204325, "epoch": 4864} {"train_loss": -7.371100425720215, "global_step": 204326, "epoch": 4864} {"train_loss": -7.377250671386719, "global_step": 204327, "epoch": 4864} {"train_loss": -7.356337547302246, "global_step": 204328, "epoch": 4864} {"train_loss": -7.322780166353498, "global_step": 204329, "epoch": 4864, "val_loss": 69938.15625} {"train_loss": -7.312619209289551, "global_step": 204330, "epoch": 4865} {"train_loss": -7.486222267150879, "global_step": 204331, "epoch": 4865} {"train_loss": -7.350818157196045, "global_step": 204332, "epoch": 4865} {"train_loss": -7.293625831604004, "global_step": 204333, "epoch": 4865} {"train_loss": -7.3723344802856445, "global_step": 204334, "epoch": 4865} {"train_loss": -7.249526023864746, "global_step": 204335, "epoch": 4865} {"train_loss": -7.305806636810303, "global_step": 204336, "epoch": 4865} {"train_loss": -7.40989351272583, "global_step": 204337, "epoch": 4865} {"train_loss": -7.246579170227051, "global_step": 204338, "epoch": 4865} {"train_loss": -7.267395973205566, "global_step": 204339, "epoch": 4865} {"train_loss": -7.399139404296875, "global_step": 204340, "epoch": 4865} {"train_loss": -7.319160461425781, "global_step": 204341, "epoch": 4865} {"train_loss": -7.282948017120361, "global_step": 204342, "epoch": 4865} {"train_loss": -7.234273910522461, "global_step": 204343, "epoch": 4865} {"train_loss": -7.397021293640137, "global_step": 204344, "epoch": 4865} {"train_loss": -7.328426361083984, "global_step": 204345, "epoch": 4865} {"train_loss": -7.4008002281188965, "global_step": 204346, "epoch": 4865} {"train_loss": -7.395358085632324, "global_step": 204347, "epoch": 4865} {"train_loss": -7.326605319976807, "global_step": 204348, "epoch": 4865} {"train_loss": -7.283567905426025, "global_step": 204349, "epoch": 4865} {"train_loss": -7.349549770355225, "global_step": 204350, "epoch": 4865} {"train_loss": -7.247226715087891, "global_step": 204351, "epoch": 4865} {"train_loss": -7.266289710998535, "global_step": 204352, "epoch": 4865} {"train_loss": -7.327304840087891, "global_step": 204353, "epoch": 4865} {"train_loss": -7.311639308929443, "global_step": 204354, "epoch": 4865} {"train_loss": -7.170163154602051, "global_step": 204355, "epoch": 4865} {"train_loss": -7.303359031677246, "global_step": 204356, "epoch": 4865} {"train_loss": -7.11080265045166, "global_step": 204357, "epoch": 4865} {"train_loss": -7.171960830688477, "global_step": 204358, "epoch": 4865} {"train_loss": -7.3048415184021, "global_step": 204359, "epoch": 4865} {"train_loss": -7.298557281494141, "global_step": 204360, "epoch": 4865} {"train_loss": -7.243924140930176, "global_step": 204361, "epoch": 4865} {"train_loss": -7.369688987731934, "global_step": 204362, "epoch": 4865} {"train_loss": -7.292430400848389, "global_step": 204363, "epoch": 4865} {"train_loss": -7.253528594970703, "global_step": 204364, "epoch": 4865} {"train_loss": -7.304030418395996, "global_step": 204365, "epoch": 4865} {"train_loss": -7.3001203536987305, "global_step": 204366, "epoch": 4865} {"train_loss": -7.385212421417236, "global_step": 204367, "epoch": 4865} {"train_loss": -7.212163925170898, "global_step": 204368, "epoch": 4865} {"train_loss": -7.293083190917969, "global_step": 204369, "epoch": 4865} {"train_loss": -7.273649215698242, "global_step": 204370, "epoch": 4865} {"train_loss": -7.3041265578497026, "global_step": 204371, "epoch": 4865, "val_loss": 70065.7109375} {"train_loss": -7.332681655883789, "global_step": 204372, "epoch": 4866} {"train_loss": -7.376801013946533, "global_step": 204373, "epoch": 4866} {"train_loss": -7.3323493003845215, "global_step": 204374, "epoch": 4866} {"train_loss": -7.348700523376465, "global_step": 204375, "epoch": 4866} {"train_loss": -7.224315643310547, "global_step": 204376, "epoch": 4866} {"train_loss": -7.277658462524414, "global_step": 204377, "epoch": 4866} {"train_loss": -7.368400573730469, "global_step": 204378, "epoch": 4866} {"train_loss": -7.370171546936035, "global_step": 204379, "epoch": 4866} {"train_loss": -7.343487739562988, "global_step": 204380, "epoch": 4866} {"train_loss": -7.363471031188965, "global_step": 204381, "epoch": 4866} {"train_loss": -7.334190845489502, "global_step": 204382, "epoch": 4866} {"train_loss": -7.259408950805664, "global_step": 204383, "epoch": 4866} {"train_loss": -7.388901233673096, "global_step": 204384, "epoch": 4866} {"train_loss": -7.288536548614502, "global_step": 204385, "epoch": 4866} {"train_loss": -7.3431010246276855, "global_step": 204386, "epoch": 4866} {"train_loss": -7.349033832550049, "global_step": 204387, "epoch": 4866} {"train_loss": -7.335585594177246, "global_step": 204388, "epoch": 4866} {"train_loss": -7.262223243713379, "global_step": 204389, "epoch": 4866} {"train_loss": -7.172153949737549, "global_step": 204390, "epoch": 4866} {"train_loss": -7.329462051391602, "global_step": 204391, "epoch": 4866} {"train_loss": -7.251755714416504, "global_step": 204392, "epoch": 4866} {"train_loss": -7.111360549926758, "global_step": 204393, "epoch": 4866} {"train_loss": -7.27723503112793, "global_step": 204394, "epoch": 4866} {"train_loss": -7.273199081420898, "global_step": 204395, "epoch": 4866} {"train_loss": -7.28127384185791, "global_step": 204396, "epoch": 4866} {"train_loss": -7.364023685455322, "global_step": 204397, "epoch": 4866} {"train_loss": -7.345002174377441, "global_step": 204398, "epoch": 4866} {"train_loss": -7.292422771453857, "global_step": 204399, "epoch": 4866} {"train_loss": -7.316501617431641, "global_step": 204400, "epoch": 4866} {"train_loss": -7.176365852355957, "global_step": 204401, "epoch": 4866} {"train_loss": -7.282326698303223, "global_step": 204402, "epoch": 4866} {"train_loss": -7.2864274978637695, "global_step": 204403, "epoch": 4866} {"train_loss": -7.230010986328125, "global_step": 204404, "epoch": 4866} {"train_loss": -7.22517204284668, "global_step": 204405, "epoch": 4866} {"train_loss": -7.330422878265381, "global_step": 204406, "epoch": 4866} {"train_loss": -7.268960475921631, "global_step": 204407, "epoch": 4866} {"train_loss": -7.152753829956055, "global_step": 204408, "epoch": 4866} {"train_loss": -7.3828887939453125, "global_step": 204409, "epoch": 4866} {"train_loss": -7.225281715393066, "global_step": 204410, "epoch": 4866} {"train_loss": -7.344784736633301, "global_step": 204411, "epoch": 4866} {"train_loss": -7.244394779205322, "global_step": 204412, "epoch": 4866} {"train_loss": -7.292252392995925, "global_step": 204413, "epoch": 4866, "val_loss": 70123.796875} {"train_loss": -7.286723613739014, "global_step": 204414, "epoch": 4867} {"train_loss": -7.240451812744141, "global_step": 204415, "epoch": 4867} {"train_loss": -7.460994243621826, "global_step": 204416, "epoch": 4867} {"train_loss": -7.224908351898193, "global_step": 204417, "epoch": 4867} {"train_loss": -7.270748138427734, "global_step": 204418, "epoch": 4867} {"train_loss": -7.228146553039551, "global_step": 204419, "epoch": 4867} {"train_loss": -7.212862491607666, "global_step": 204420, "epoch": 4867} {"train_loss": -7.118650913238525, "global_step": 204421, "epoch": 4867} {"train_loss": -7.283026218414307, "global_step": 204422, "epoch": 4867} {"train_loss": -7.277719020843506, "global_step": 204423, "epoch": 4867} {"train_loss": -7.306665897369385, "global_step": 204424, "epoch": 4867} {"train_loss": -7.316067695617676, "global_step": 204425, "epoch": 4867} {"train_loss": -7.28948974609375, "global_step": 204426, "epoch": 4867} {"train_loss": -7.311067581176758, "global_step": 204427, "epoch": 4867} {"train_loss": -7.335556983947754, "global_step": 204428, "epoch": 4867} {"train_loss": -7.281435012817383, "global_step": 204429, "epoch": 4867} {"train_loss": -7.310670375823975, "global_step": 204430, "epoch": 4867} {"train_loss": -7.30438232421875, "global_step": 204431, "epoch": 4867} {"train_loss": -7.251312255859375, "global_step": 204432, "epoch": 4867} {"train_loss": -7.336169242858887, "global_step": 204433, "epoch": 4867} {"train_loss": -7.383085250854492, "global_step": 204434, "epoch": 4867} {"train_loss": -7.187702178955078, "global_step": 204435, "epoch": 4867} {"train_loss": -7.302935600280762, "global_step": 204436, "epoch": 4867} {"train_loss": -7.194548606872559, "global_step": 204437, "epoch": 4867} {"train_loss": -7.206563949584961, "global_step": 204438, "epoch": 4867} {"train_loss": -7.2485151290893555, "global_step": 204439, "epoch": 4867} {"train_loss": -7.31728982925415, "global_step": 204440, "epoch": 4867} {"train_loss": -7.305047035217285, "global_step": 204441, "epoch": 4867} {"train_loss": -7.3121442794799805, "global_step": 204442, "epoch": 4867} {"train_loss": -7.2290544509887695, "global_step": 204443, "epoch": 4867} {"train_loss": -7.342731952667236, "global_step": 204444, "epoch": 4867} {"train_loss": -7.263683319091797, "global_step": 204445, "epoch": 4867} {"train_loss": -7.2103495597839355, "global_step": 204446, "epoch": 4867} {"train_loss": -7.263426303863525, "global_step": 204447, "epoch": 4867} {"train_loss": -7.221362590789795, "global_step": 204448, "epoch": 4867} {"train_loss": -7.144949913024902, "global_step": 204449, "epoch": 4867} {"train_loss": -7.293906211853027, "global_step": 204450, "epoch": 4867} {"train_loss": -7.1481804847717285, "global_step": 204451, "epoch": 4867} {"train_loss": -7.307672500610352, "global_step": 204452, "epoch": 4867} {"train_loss": -7.287772178649902, "global_step": 204453, "epoch": 4867} {"train_loss": -7.204253196716309, "global_step": 204454, "epoch": 4867} {"train_loss": -7.2694221110571, "global_step": 204455, "epoch": 4867, "val_loss": 69979.921875} {"train_loss": -7.193998336791992, "global_step": 204456, "epoch": 4868} {"train_loss": -7.3120832443237305, "global_step": 204457, "epoch": 4868} {"train_loss": -7.293024063110352, "global_step": 204458, "epoch": 4868} {"train_loss": -7.154168605804443, "global_step": 204459, "epoch": 4868} {"train_loss": -7.289566993713379, "global_step": 204460, "epoch": 4868} {"train_loss": -7.24021577835083, "global_step": 204461, "epoch": 4868} {"train_loss": -7.273864269256592, "global_step": 204462, "epoch": 4868} {"train_loss": -7.2430925369262695, "global_step": 204463, "epoch": 4868} {"train_loss": -7.165022850036621, "global_step": 204464, "epoch": 4868} {"train_loss": -7.088569641113281, "global_step": 204465, "epoch": 4868} {"train_loss": -7.348331451416016, "global_step": 204466, "epoch": 4868} {"train_loss": -7.152576446533203, "global_step": 204467, "epoch": 4868} {"train_loss": -7.166229248046875, "global_step": 204468, "epoch": 4868} {"train_loss": -7.142462730407715, "global_step": 204469, "epoch": 4868} {"train_loss": -7.1865644454956055, "global_step": 204470, "epoch": 4868} {"train_loss": -7.179522514343262, "global_step": 204471, "epoch": 4868} {"train_loss": -7.166501522064209, "global_step": 204472, "epoch": 4868} {"train_loss": -7.135239601135254, "global_step": 204473, "epoch": 4868} {"train_loss": -7.059344291687012, "global_step": 204474, "epoch": 4868} {"train_loss": -7.183314800262451, "global_step": 204475, "epoch": 4868} {"train_loss": -7.063262939453125, "global_step": 204476, "epoch": 4868} {"train_loss": -7.242552757263184, "global_step": 204477, "epoch": 4868} {"train_loss": -7.290923595428467, "global_step": 204478, "epoch": 4868} {"train_loss": -7.117317199707031, "global_step": 204479, "epoch": 4868} {"train_loss": -7.249472141265869, "global_step": 204480, "epoch": 4868} {"train_loss": -7.085631370544434, "global_step": 204481, "epoch": 4868} {"train_loss": -7.1442365646362305, "global_step": 204482, "epoch": 4868} {"train_loss": -7.389098167419434, "global_step": 204483, "epoch": 4868} {"train_loss": -7.1079936027526855, "global_step": 204484, "epoch": 4868} {"train_loss": -7.226741790771484, "global_step": 204485, "epoch": 4868} {"train_loss": -7.131059646606445, "global_step": 204486, "epoch": 4868} {"train_loss": -7.152099609375, "global_step": 204487, "epoch": 4868} {"train_loss": -7.3628034591674805, "global_step": 204488, "epoch": 4868} {"train_loss": -7.150321960449219, "global_step": 204489, "epoch": 4868} {"train_loss": -7.229672431945801, "global_step": 204490, "epoch": 4868} {"train_loss": -7.258066654205322, "global_step": 204491, "epoch": 4868} {"train_loss": -7.2057695388793945, "global_step": 204492, "epoch": 4868} {"train_loss": -7.261541366577148, "global_step": 204493, "epoch": 4868} {"train_loss": -7.256293296813965, "global_step": 204494, "epoch": 4868} {"train_loss": -7.298708915710449, "global_step": 204495, "epoch": 4868} {"train_loss": -7.216006278991699, "global_step": 204496, "epoch": 4868} {"train_loss": -7.208136683418637, "global_step": 204497, "epoch": 4868, "val_loss": 69810.6015625} {"train_loss": -7.351955413818359, "global_step": 204498, "epoch": 4869} {"train_loss": -7.196985244750977, "global_step": 204499, "epoch": 4869} {"train_loss": -7.419286727905273, "global_step": 204500, "epoch": 4869} {"train_loss": -7.413480758666992, "global_step": 204501, "epoch": 4869} {"train_loss": -7.261529445648193, "global_step": 204502, "epoch": 4869} {"train_loss": -7.355581283569336, "global_step": 204503, "epoch": 4869} {"train_loss": -7.380277633666992, "global_step": 204504, "epoch": 4869} {"train_loss": -7.275084495544434, "global_step": 204505, "epoch": 4869} {"train_loss": -7.257755279541016, "global_step": 204506, "epoch": 4869} {"train_loss": -7.246477127075195, "global_step": 204507, "epoch": 4869} {"train_loss": -7.3704514503479, "global_step": 204508, "epoch": 4869} {"train_loss": -7.424446105957031, "global_step": 204509, "epoch": 4869} {"train_loss": -7.3060102462768555, "global_step": 204510, "epoch": 4869} {"train_loss": -7.249416351318359, "global_step": 204511, "epoch": 4869} {"train_loss": -7.38341760635376, "global_step": 204512, "epoch": 4869} {"train_loss": -7.079896450042725, "global_step": 204513, "epoch": 4869} {"train_loss": -7.204736709594727, "global_step": 204514, "epoch": 4869} {"train_loss": -7.263285160064697, "global_step": 204515, "epoch": 4869} {"train_loss": -7.218393802642822, "global_step": 204516, "epoch": 4869} {"train_loss": -7.308492660522461, "global_step": 204517, "epoch": 4869} {"train_loss": -7.1996073722839355, "global_step": 204518, "epoch": 4869} {"train_loss": -7.280804634094238, "global_step": 204519, "epoch": 4869} {"train_loss": -7.236146926879883, "global_step": 204520, "epoch": 4869} {"train_loss": -7.276977062225342, "global_step": 204521, "epoch": 4869} {"train_loss": -7.260934829711914, "global_step": 204522, "epoch": 4869} {"train_loss": -7.325733184814453, "global_step": 204523, "epoch": 4869} {"train_loss": -7.243119716644287, "global_step": 204524, "epoch": 4869} {"train_loss": -7.375144004821777, "global_step": 204525, "epoch": 4869} {"train_loss": -7.260321617126465, "global_step": 204526, "epoch": 4869} {"train_loss": -7.286781311035156, "global_step": 204527, "epoch": 4869} {"train_loss": -7.3062052726745605, "global_step": 204528, "epoch": 4869} {"train_loss": -7.218493461608887, "global_step": 204529, "epoch": 4869} {"train_loss": -7.274436950683594, "global_step": 204530, "epoch": 4869} {"train_loss": -7.328741550445557, "global_step": 204531, "epoch": 4869} {"train_loss": -7.349949836730957, "global_step": 204532, "epoch": 4869} {"train_loss": -7.330470085144043, "global_step": 204533, "epoch": 4869} {"train_loss": -7.302711486816406, "global_step": 204534, "epoch": 4869} {"train_loss": -7.1791887283325195, "global_step": 204535, "epoch": 4869} {"train_loss": -7.359072208404541, "global_step": 204536, "epoch": 4869} {"train_loss": -7.251143455505371, "global_step": 204537, "epoch": 4869} {"train_loss": -7.338698863983154, "global_step": 204538, "epoch": 4869} {"train_loss": -7.289943513416109, "global_step": 204539, "epoch": 4869, "val_loss": 69988.625} {"train_loss": -7.344555854797363, "global_step": 204540, "epoch": 4870} {"train_loss": -7.435050010681152, "global_step": 204541, "epoch": 4870} {"train_loss": -7.200521469116211, "global_step": 204542, "epoch": 4870} {"train_loss": -7.356230735778809, "global_step": 204543, "epoch": 4870} {"train_loss": -7.410416603088379, "global_step": 204544, "epoch": 4870} {"train_loss": -7.2878313064575195, "global_step": 204545, "epoch": 4870} {"train_loss": -7.189617156982422, "global_step": 204546, "epoch": 4870} {"train_loss": -7.184882164001465, "global_step": 204547, "epoch": 4870} {"train_loss": -7.403288841247559, "global_step": 204548, "epoch": 4870} {"train_loss": -7.437954902648926, "global_step": 204549, "epoch": 4870} {"train_loss": -7.345903396606445, "global_step": 204550, "epoch": 4870} {"train_loss": -7.214607238769531, "global_step": 204551, "epoch": 4870} {"train_loss": -7.242928981781006, "global_step": 204552, "epoch": 4870} {"train_loss": -7.319027900695801, "global_step": 204553, "epoch": 4870} {"train_loss": -7.363620281219482, "global_step": 204554, "epoch": 4870} {"train_loss": -7.354903221130371, "global_step": 204555, "epoch": 4870} {"train_loss": -7.215980529785156, "global_step": 204556, "epoch": 4870} {"train_loss": -7.376901149749756, "global_step": 204557, "epoch": 4870} {"train_loss": -7.341288089752197, "global_step": 204558, "epoch": 4870} {"train_loss": -7.220372200012207, "global_step": 204559, "epoch": 4870} {"train_loss": -7.390213489532471, "global_step": 204560, "epoch": 4870} {"train_loss": -7.390994548797607, "global_step": 204561, "epoch": 4870} {"train_loss": -7.28985595703125, "global_step": 204562, "epoch": 4870} {"train_loss": -7.227195739746094, "global_step": 204563, "epoch": 4870} {"train_loss": -7.050313472747803, "global_step": 204564, "epoch": 4870} {"train_loss": -7.333280086517334, "global_step": 204565, "epoch": 4870} {"train_loss": -7.316944599151611, "global_step": 204566, "epoch": 4870} {"train_loss": -7.233092308044434, "global_step": 204567, "epoch": 4870} {"train_loss": -7.430253982543945, "global_step": 204568, "epoch": 4870} {"train_loss": -7.242308616638184, "global_step": 204569, "epoch": 4870} {"train_loss": -7.232473373413086, "global_step": 204570, "epoch": 4870} {"train_loss": -7.307888031005859, "global_step": 204571, "epoch": 4870} {"train_loss": -7.126447677612305, "global_step": 204572, "epoch": 4870} {"train_loss": -7.204276084899902, "global_step": 204573, "epoch": 4870} {"train_loss": -7.223695755004883, "global_step": 204574, "epoch": 4870} {"train_loss": -7.139523029327393, "global_step": 204575, "epoch": 4870} {"train_loss": -7.273797035217285, "global_step": 204576, "epoch": 4870} {"train_loss": -7.199646949768066, "global_step": 204577, "epoch": 4870} {"train_loss": -7.332650184631348, "global_step": 204578, "epoch": 4870} {"train_loss": -7.149984359741211, "global_step": 204579, "epoch": 4870} {"train_loss": -7.196430206298828, "global_step": 204580, "epoch": 4870} {"train_loss": -7.282710007258824, "global_step": 204581, "epoch": 4870, "val_loss": 69884.1328125} {"train_loss": -7.260466575622559, "global_step": 204582, "epoch": 4871} {"train_loss": -7.162195205688477, "global_step": 204583, "epoch": 4871} {"train_loss": -7.344888687133789, "global_step": 204584, "epoch": 4871} {"train_loss": -7.250772953033447, "global_step": 204585, "epoch": 4871} {"train_loss": -7.2095136642456055, "global_step": 204586, "epoch": 4871} {"train_loss": -7.22771692276001, "global_step": 204587, "epoch": 4871} {"train_loss": -7.2160139083862305, "global_step": 204588, "epoch": 4871} {"train_loss": -7.303277492523193, "global_step": 204589, "epoch": 4871} {"train_loss": -7.321064472198486, "global_step": 204590, "epoch": 4871} {"train_loss": -7.346764087677002, "global_step": 204591, "epoch": 4871} {"train_loss": -7.374067306518555, "global_step": 204592, "epoch": 4871} {"train_loss": -7.276175498962402, "global_step": 204593, "epoch": 4871} {"train_loss": -7.357248306274414, "global_step": 204594, "epoch": 4871} {"train_loss": -7.21072244644165, "global_step": 204595, "epoch": 4871} {"train_loss": -7.307667255401611, "global_step": 204596, "epoch": 4871} {"train_loss": -7.2699103355407715, "global_step": 204597, "epoch": 4871} {"train_loss": -7.305920600891113, "global_step": 204598, "epoch": 4871} {"train_loss": -7.301921367645264, "global_step": 204599, "epoch": 4871} {"train_loss": -7.337279796600342, "global_step": 204600, "epoch": 4871} {"train_loss": -7.411716461181641, "global_step": 204601, "epoch": 4871} {"train_loss": -7.304714202880859, "global_step": 204602, "epoch": 4871} {"train_loss": -7.215274333953857, "global_step": 204603, "epoch": 4871} {"train_loss": -7.317625522613525, "global_step": 204604, "epoch": 4871} {"train_loss": -7.164557456970215, "global_step": 204605, "epoch": 4871} {"train_loss": -7.318994998931885, "global_step": 204606, "epoch": 4871} {"train_loss": -7.330864906311035, "global_step": 204607, "epoch": 4871} {"train_loss": -7.366324424743652, "global_step": 204608, "epoch": 4871} {"train_loss": -7.289040565490723, "global_step": 204609, "epoch": 4871} {"train_loss": -7.307351112365723, "global_step": 204610, "epoch": 4871} {"train_loss": -7.243167400360107, "global_step": 204611, "epoch": 4871} {"train_loss": -7.381214141845703, "global_step": 204612, "epoch": 4871} {"train_loss": -7.348212242126465, "global_step": 204613, "epoch": 4871} {"train_loss": -7.39334774017334, "global_step": 204614, "epoch": 4871} {"train_loss": -7.342518329620361, "global_step": 204615, "epoch": 4871} {"train_loss": -7.315415382385254, "global_step": 204616, "epoch": 4871} {"train_loss": -7.2794694900512695, "global_step": 204617, "epoch": 4871} {"train_loss": -7.2806525230407715, "global_step": 204618, "epoch": 4871} {"train_loss": -7.27956485748291, "global_step": 204619, "epoch": 4871} {"train_loss": -7.313589572906494, "global_step": 204620, "epoch": 4871} {"train_loss": -7.235317230224609, "global_step": 204621, "epoch": 4871} {"train_loss": -7.372337818145752, "global_step": 204622, "epoch": 4871} {"train_loss": -7.290980929420108, "global_step": 204623, "epoch": 4871, "val_loss": 69877.1953125} {"train_loss": -7.437795639038086, "global_step": 204624, "epoch": 4872} {"train_loss": -7.17283296585083, "global_step": 204625, "epoch": 4872} {"train_loss": -7.068997859954834, "global_step": 204626, "epoch": 4872} {"train_loss": -7.24812126159668, "global_step": 204627, "epoch": 4872} {"train_loss": -7.154590606689453, "global_step": 204628, "epoch": 4872} {"train_loss": -7.1490912437438965, "global_step": 204629, "epoch": 4872} {"train_loss": -7.225055694580078, "global_step": 204630, "epoch": 4872} {"train_loss": -7.092263221740723, "global_step": 204631, "epoch": 4872} {"train_loss": -7.356023788452148, "global_step": 204632, "epoch": 4872} {"train_loss": -7.163697719573975, "global_step": 204633, "epoch": 4872} {"train_loss": -7.302951812744141, "global_step": 204634, "epoch": 4872} {"train_loss": -7.231047630310059, "global_step": 204635, "epoch": 4872} {"train_loss": -7.138971328735352, "global_step": 204636, "epoch": 4872} {"train_loss": -7.284503936767578, "global_step": 204637, "epoch": 4872} {"train_loss": -7.206352233886719, "global_step": 204638, "epoch": 4872} {"train_loss": -7.421602249145508, "global_step": 204639, "epoch": 4872} {"train_loss": -7.21544075012207, "global_step": 204640, "epoch": 4872} {"train_loss": -7.2822160720825195, "global_step": 204641, "epoch": 4872} {"train_loss": -7.283146381378174, "global_step": 204642, "epoch": 4872} {"train_loss": -7.157073974609375, "global_step": 204643, "epoch": 4872} {"train_loss": -7.388559341430664, "global_step": 204644, "epoch": 4872} {"train_loss": -7.266481399536133, "global_step": 204645, "epoch": 4872} {"train_loss": -7.27565336227417, "global_step": 204646, "epoch": 4872} {"train_loss": -7.191830635070801, "global_step": 204647, "epoch": 4872} {"train_loss": -7.338911056518555, "global_step": 204648, "epoch": 4872} {"train_loss": -7.3335862159729, "global_step": 204649, "epoch": 4872} {"train_loss": -7.318528652191162, "global_step": 204650, "epoch": 4872} {"train_loss": -7.291704177856445, "global_step": 204651, "epoch": 4872} {"train_loss": -7.325691223144531, "global_step": 204652, "epoch": 4872} {"train_loss": -7.379952907562256, "global_step": 204653, "epoch": 4872} {"train_loss": -7.317707061767578, "global_step": 204654, "epoch": 4872} {"train_loss": -7.438899517059326, "global_step": 204655, "epoch": 4872} {"train_loss": -7.495796203613281, "global_step": 204656, "epoch": 4872} {"train_loss": -7.436280250549316, "global_step": 204657, "epoch": 4872} {"train_loss": -7.295538902282715, "global_step": 204658, "epoch": 4872} {"train_loss": -7.403660774230957, "global_step": 204659, "epoch": 4872} {"train_loss": -7.450220584869385, "global_step": 204660, "epoch": 4872} {"train_loss": -7.405527114868164, "global_step": 204661, "epoch": 4872} {"train_loss": -7.296116828918457, "global_step": 204662, "epoch": 4872} {"train_loss": -7.367193222045898, "global_step": 204663, "epoch": 4872} {"train_loss": -7.310248851776123, "global_step": 204664, "epoch": 4872} {"train_loss": -7.291642972401211, "global_step": 204665, "epoch": 4872, "val_loss": 69822.71875} {"train_loss": -7.455463409423828, "global_step": 204666, "epoch": 4873} {"train_loss": -7.382963180541992, "global_step": 204667, "epoch": 4873} {"train_loss": -7.364811897277832, "global_step": 204668, "epoch": 4873} {"train_loss": -7.325793266296387, "global_step": 204669, "epoch": 4873} {"train_loss": -7.377026081085205, "global_step": 204670, "epoch": 4873} {"train_loss": -7.274593353271484, "global_step": 204671, "epoch": 4873} {"train_loss": -7.4143781661987305, "global_step": 204672, "epoch": 4873} {"train_loss": -7.3608551025390625, "global_step": 204673, "epoch": 4873} {"train_loss": -7.328209400177002, "global_step": 204674, "epoch": 4873} {"train_loss": -7.368809700012207, "global_step": 204675, "epoch": 4873} {"train_loss": -7.364110946655273, "global_step": 204676, "epoch": 4873} {"train_loss": -7.376653671264648, "global_step": 204677, "epoch": 4873} {"train_loss": -7.175358295440674, "global_step": 204678, "epoch": 4873} {"train_loss": -7.379611968994141, "global_step": 204679, "epoch": 4873} {"train_loss": -7.246841907501221, "global_step": 204680, "epoch": 4873} {"train_loss": -7.353366851806641, "global_step": 204681, "epoch": 4873} {"train_loss": -7.301396369934082, "global_step": 204682, "epoch": 4873} {"train_loss": -7.246798515319824, "global_step": 204683, "epoch": 4873} {"train_loss": -7.317818641662598, "global_step": 204684, "epoch": 4873} {"train_loss": -7.391446590423584, "global_step": 204685, "epoch": 4873} {"train_loss": -7.410704135894775, "global_step": 204686, "epoch": 4873} {"train_loss": -7.413703918457031, "global_step": 204687, "epoch": 4873} {"train_loss": -7.298227787017822, "global_step": 204688, "epoch": 4873} {"train_loss": -7.4030656814575195, "global_step": 204689, "epoch": 4873} {"train_loss": -7.334733009338379, "global_step": 204690, "epoch": 4873} {"train_loss": -7.318728446960449, "global_step": 204691, "epoch": 4873} {"train_loss": -7.183248996734619, "global_step": 204692, "epoch": 4873} {"train_loss": -7.272111892700195, "global_step": 204693, "epoch": 4873} {"train_loss": -7.3556671142578125, "global_step": 204694, "epoch": 4873} {"train_loss": -7.2925615310668945, "global_step": 204695, "epoch": 4873} {"train_loss": -7.261068820953369, "global_step": 204696, "epoch": 4873} {"train_loss": -7.359771728515625, "global_step": 204697, "epoch": 4873} {"train_loss": -7.251197338104248, "global_step": 204698, "epoch": 4873} {"train_loss": -7.279892921447754, "global_step": 204699, "epoch": 4873} {"train_loss": -7.338654518127441, "global_step": 204700, "epoch": 4873} {"train_loss": -7.203625679016113, "global_step": 204701, "epoch": 4873} {"train_loss": -7.320573806762695, "global_step": 204702, "epoch": 4873} {"train_loss": -7.431238174438477, "global_step": 204703, "epoch": 4873} {"train_loss": -7.303864479064941, "global_step": 204704, "epoch": 4873} {"train_loss": -7.3141584396362305, "global_step": 204705, "epoch": 4873} {"train_loss": -7.353169918060303, "global_step": 204706, "epoch": 4873} {"train_loss": -7.331594342277164, "global_step": 204707, "epoch": 4873, "val_loss": 70064.71875} {"train_loss": -7.273345947265625, "global_step": 204708, "epoch": 4874} {"train_loss": -7.33155632019043, "global_step": 204709, "epoch": 4874} {"train_loss": -7.334815979003906, "global_step": 204710, "epoch": 4874} {"train_loss": -7.249460220336914, "global_step": 204711, "epoch": 4874} {"train_loss": -7.361905574798584, "global_step": 204712, "epoch": 4874} {"train_loss": -7.117221832275391, "global_step": 204713, "epoch": 4874} {"train_loss": -7.295742034912109, "global_step": 204714, "epoch": 4874} {"train_loss": -7.3187971115112305, "global_step": 204715, "epoch": 4874} {"train_loss": -7.273325443267822, "global_step": 204716, "epoch": 4874} {"train_loss": -7.310781002044678, "global_step": 204717, "epoch": 4874} {"train_loss": -7.322882652282715, "global_step": 204718, "epoch": 4874} {"train_loss": -7.249575138092041, "global_step": 204719, "epoch": 4874} {"train_loss": -7.307656288146973, "global_step": 204720, "epoch": 4874} {"train_loss": -7.390104293823242, "global_step": 204721, "epoch": 4874} {"train_loss": -7.245635032653809, "global_step": 204722, "epoch": 4874} {"train_loss": -7.3120880126953125, "global_step": 204723, "epoch": 4874} {"train_loss": -7.2008562088012695, "global_step": 204724, "epoch": 4874} {"train_loss": -7.2746262550354, "global_step": 204725, "epoch": 4874} {"train_loss": -7.2378764152526855, "global_step": 204726, "epoch": 4874} {"train_loss": -7.345431804656982, "global_step": 204727, "epoch": 4874} {"train_loss": -7.195189476013184, "global_step": 204728, "epoch": 4874} {"train_loss": -7.181588649749756, "global_step": 204729, "epoch": 4874} {"train_loss": -7.279272079467773, "global_step": 204730, "epoch": 4874} {"train_loss": -7.280664443969727, "global_step": 204731, "epoch": 4874} {"train_loss": -7.236847877502441, "global_step": 204732, "epoch": 4874} {"train_loss": -7.319614410400391, "global_step": 204733, "epoch": 4874} {"train_loss": -7.139042854309082, "global_step": 204734, "epoch": 4874} {"train_loss": -7.259850025177002, "global_step": 204735, "epoch": 4874} {"train_loss": -7.263258457183838, "global_step": 204736, "epoch": 4874} {"train_loss": -7.174129962921143, "global_step": 204737, "epoch": 4874} {"train_loss": -7.208551406860352, "global_step": 204738, "epoch": 4874} {"train_loss": -7.268777847290039, "global_step": 204739, "epoch": 4874} {"train_loss": -7.166260719299316, "global_step": 204740, "epoch": 4874} {"train_loss": -7.289052486419678, "global_step": 204741, "epoch": 4874} {"train_loss": -7.287134647369385, "global_step": 204742, "epoch": 4874} {"train_loss": -7.235825538635254, "global_step": 204743, "epoch": 4874} {"train_loss": -7.296152591705322, "global_step": 204744, "epoch": 4874} {"train_loss": -7.178782939910889, "global_step": 204745, "epoch": 4874} {"train_loss": -7.228723049163818, "global_step": 204746, "epoch": 4874} {"train_loss": -7.156590461730957, "global_step": 204747, "epoch": 4874} {"train_loss": -7.23930549621582, "global_step": 204748, "epoch": 4874} {"train_loss": -7.260216781071255, "global_step": 204749, "epoch": 4874, "val_loss": 69966.59375} {"train_loss": -7.277013301849365, "global_step": 204750, "epoch": 4875} {"train_loss": -7.253087520599365, "global_step": 204751, "epoch": 4875} {"train_loss": -7.153182029724121, "global_step": 204752, "epoch": 4875} {"train_loss": -7.273694038391113, "global_step": 204753, "epoch": 4875} {"train_loss": -7.273029327392578, "global_step": 204754, "epoch": 4875} {"train_loss": -7.209425449371338, "global_step": 204755, "epoch": 4875} {"train_loss": -7.40714168548584, "global_step": 204756, "epoch": 4875} {"train_loss": -7.2507829666137695, "global_step": 204757, "epoch": 4875} {"train_loss": -7.348649978637695, "global_step": 204758, "epoch": 4875} {"train_loss": -7.192807674407959, "global_step": 204759, "epoch": 4875} {"train_loss": -7.2725701332092285, "global_step": 204760, "epoch": 4875} {"train_loss": -7.1890153884887695, "global_step": 204761, "epoch": 4875} {"train_loss": -7.307886123657227, "global_step": 204762, "epoch": 4875} {"train_loss": -7.142541885375977, "global_step": 204763, "epoch": 4875} {"train_loss": -7.1129302978515625, "global_step": 204764, "epoch": 4875} {"train_loss": -7.279829978942871, "global_step": 204765, "epoch": 4875} {"train_loss": -7.32695198059082, "global_step": 204766, "epoch": 4875} {"train_loss": -7.359397888183594, "global_step": 204767, "epoch": 4875} {"train_loss": -7.419806480407715, "global_step": 204768, "epoch": 4875} {"train_loss": -7.217025279998779, "global_step": 204769, "epoch": 4875} {"train_loss": -7.292544841766357, "global_step": 204770, "epoch": 4875} {"train_loss": -7.295110702514648, "global_step": 204771, "epoch": 4875} {"train_loss": -7.304405689239502, "global_step": 204772, "epoch": 4875} {"train_loss": -7.328152656555176, "global_step": 204773, "epoch": 4875} {"train_loss": -7.240302562713623, "global_step": 204774, "epoch": 4875} {"train_loss": -7.381984710693359, "global_step": 204775, "epoch": 4875} {"train_loss": -7.354763507843018, "global_step": 204776, "epoch": 4875} {"train_loss": -7.328054904937744, "global_step": 204777, "epoch": 4875} {"train_loss": -7.464130401611328, "global_step": 204778, "epoch": 4875} {"train_loss": -7.3503499031066895, "global_step": 204779, "epoch": 4875} {"train_loss": -7.301071643829346, "global_step": 204780, "epoch": 4875} {"train_loss": -7.294916152954102, "global_step": 204781, "epoch": 4875} {"train_loss": -7.265678882598877, "global_step": 204782, "epoch": 4875} {"train_loss": -7.232812404632568, "global_step": 204783, "epoch": 4875} {"train_loss": -7.397429466247559, "global_step": 204784, "epoch": 4875} {"train_loss": -7.198779582977295, "global_step": 204785, "epoch": 4875} {"train_loss": -7.160858154296875, "global_step": 204786, "epoch": 4875} {"train_loss": -7.367387771606445, "global_step": 204787, "epoch": 4875} {"train_loss": -7.161208629608154, "global_step": 204788, "epoch": 4875} {"train_loss": -7.207010269165039, "global_step": 204789, "epoch": 4875} {"train_loss": -7.399468898773193, "global_step": 204790, "epoch": 4875} {"train_loss": -7.2800504593622115, "global_step": 204791, "epoch": 4875, "val_loss": 70073.640625} {"train_loss": -7.243524551391602, "global_step": 204792, "epoch": 4876} {"train_loss": -7.180429458618164, "global_step": 204793, "epoch": 4876} {"train_loss": -7.289739608764648, "global_step": 204794, "epoch": 4876} {"train_loss": -7.307976722717285, "global_step": 204795, "epoch": 4876} {"train_loss": -7.174228668212891, "global_step": 204796, "epoch": 4876} {"train_loss": -7.297821998596191, "global_step": 204797, "epoch": 4876} {"train_loss": -7.265824794769287, "global_step": 204798, "epoch": 4876} {"train_loss": -7.279632568359375, "global_step": 204799, "epoch": 4876} {"train_loss": -7.198588848114014, "global_step": 204800, "epoch": 4876} {"train_loss": -7.331695079803467, "global_step": 204801, "epoch": 4876} {"train_loss": -7.362261772155762, "global_step": 204802, "epoch": 4876} {"train_loss": -7.204763412475586, "global_step": 204803, "epoch": 4876} {"train_loss": -7.258030891418457, "global_step": 204804, "epoch": 4876} {"train_loss": -7.227777481079102, "global_step": 204805, "epoch": 4876} {"train_loss": -7.367680072784424, "global_step": 204806, "epoch": 4876} {"train_loss": -7.2440571784973145, "global_step": 204807, "epoch": 4876} {"train_loss": -7.3279523849487305, "global_step": 204808, "epoch": 4876} {"train_loss": -7.204073905944824, "global_step": 204809, "epoch": 4876} {"train_loss": -7.280194282531738, "global_step": 204810, "epoch": 4876} {"train_loss": -7.272491455078125, "global_step": 204811, "epoch": 4876} {"train_loss": -7.117722511291504, "global_step": 204812, "epoch": 4876} {"train_loss": -7.307507038116455, "global_step": 204813, "epoch": 4876} {"train_loss": -7.354386329650879, "global_step": 204814, "epoch": 4876} {"train_loss": -7.288823127746582, "global_step": 204815, "epoch": 4876} {"train_loss": -7.279291152954102, "global_step": 204816, "epoch": 4876} {"train_loss": -7.333185195922852, "global_step": 204817, "epoch": 4876} {"train_loss": -7.257070541381836, "global_step": 204818, "epoch": 4876} {"train_loss": -7.351092338562012, "global_step": 204819, "epoch": 4876} {"train_loss": -7.337308883666992, "global_step": 204820, "epoch": 4876} {"train_loss": -7.304854393005371, "global_step": 204821, "epoch": 4876} {"train_loss": -7.328842639923096, "global_step": 204822, "epoch": 4876} {"train_loss": -7.28453254699707, "global_step": 204823, "epoch": 4876} {"train_loss": -7.269155979156494, "global_step": 204824, "epoch": 4876} {"train_loss": -7.336648464202881, "global_step": 204825, "epoch": 4876} {"train_loss": -7.3782758712768555, "global_step": 204826, "epoch": 4876} {"train_loss": -7.1852216720581055, "global_step": 204827, "epoch": 4876} {"train_loss": -7.344546318054199, "global_step": 204828, "epoch": 4876} {"train_loss": -7.239080429077148, "global_step": 204829, "epoch": 4876} {"train_loss": -7.187377452850342, "global_step": 204830, "epoch": 4876} {"train_loss": -7.3649396896362305, "global_step": 204831, "epoch": 4876} {"train_loss": -7.167065143585205, "global_step": 204832, "epoch": 4876} {"train_loss": -7.275274708157494, "global_step": 204833, "epoch": 4876, "val_loss": 70247.0859375} {"train_loss": -7.314229965209961, "global_step": 204834, "epoch": 4877} {"train_loss": -7.306056976318359, "global_step": 204835, "epoch": 4877} {"train_loss": -7.3181562423706055, "global_step": 204836, "epoch": 4877} {"train_loss": -7.295657157897949, "global_step": 204837, "epoch": 4877} {"train_loss": -7.288303852081299, "global_step": 204838, "epoch": 4877} {"train_loss": -7.354809761047363, "global_step": 204839, "epoch": 4877} {"train_loss": -7.2696919441223145, "global_step": 204840, "epoch": 4877} {"train_loss": -7.315020561218262, "global_step": 204841, "epoch": 4877} {"train_loss": -7.303452014923096, "global_step": 204842, "epoch": 4877} {"train_loss": -7.262105941772461, "global_step": 204843, "epoch": 4877} {"train_loss": -7.44374942779541, "global_step": 204844, "epoch": 4877} {"train_loss": -7.390138626098633, "global_step": 204845, "epoch": 4877} {"train_loss": -7.469522953033447, "global_step": 204846, "epoch": 4877} {"train_loss": -7.339438438415527, "global_step": 204847, "epoch": 4877} {"train_loss": -7.3136186599731445, "global_step": 204848, "epoch": 4877} {"train_loss": -7.357956886291504, "global_step": 204849, "epoch": 4877} {"train_loss": -7.336863994598389, "global_step": 204850, "epoch": 4877} {"train_loss": -7.3699164390563965, "global_step": 204851, "epoch": 4877} {"train_loss": -7.330414295196533, "global_step": 204852, "epoch": 4877} {"train_loss": -7.26595401763916, "global_step": 204853, "epoch": 4877} {"train_loss": -7.331464767456055, "global_step": 204854, "epoch": 4877} {"train_loss": -7.290404319763184, "global_step": 204855, "epoch": 4877} {"train_loss": -7.273017883300781, "global_step": 204856, "epoch": 4877} {"train_loss": -7.397061347961426, "global_step": 204857, "epoch": 4877} {"train_loss": -7.384136199951172, "global_step": 204858, "epoch": 4877} {"train_loss": -7.316690444946289, "global_step": 204859, "epoch": 4877} {"train_loss": -7.2946085929870605, "global_step": 204860, "epoch": 4877} {"train_loss": -7.29448127746582, "global_step": 204861, "epoch": 4877} {"train_loss": -7.323980331420898, "global_step": 204862, "epoch": 4877} {"train_loss": -7.177770614624023, "global_step": 204863, "epoch": 4877} {"train_loss": -7.283818244934082, "global_step": 204864, "epoch": 4877} {"train_loss": -7.146402359008789, "global_step": 204865, "epoch": 4877} {"train_loss": -7.338131427764893, "global_step": 204866, "epoch": 4877} {"train_loss": -7.298537731170654, "global_step": 204867, "epoch": 4877} {"train_loss": -7.152608394622803, "global_step": 204868, "epoch": 4877} {"train_loss": -7.348339557647705, "global_step": 204869, "epoch": 4877} {"train_loss": -7.20382022857666, "global_step": 204870, "epoch": 4877} {"train_loss": -7.15273904800415, "global_step": 204871, "epoch": 4877} {"train_loss": -7.258495330810547, "global_step": 204872, "epoch": 4877} {"train_loss": -7.236250400543213, "global_step": 204873, "epoch": 4877} {"train_loss": -7.261323928833008, "global_step": 204874, "epoch": 4877} {"train_loss": -7.301104193642026, "global_step": 204875, "epoch": 4877, "val_loss": 70002.7421875} {"train_loss": -7.19575309753418, "global_step": 204876, "epoch": 4878} {"train_loss": -7.401668548583984, "global_step": 204877, "epoch": 4878} {"train_loss": -7.2807111740112305, "global_step": 204878, "epoch": 4878} {"train_loss": -7.204246520996094, "global_step": 204879, "epoch": 4878} {"train_loss": -7.24513053894043, "global_step": 204880, "epoch": 4878} {"train_loss": -7.368830680847168, "global_step": 204881, "epoch": 4878} {"train_loss": -7.345007419586182, "global_step": 204882, "epoch": 4878} {"train_loss": -7.309804916381836, "global_step": 204883, "epoch": 4878} {"train_loss": -7.418092727661133, "global_step": 204884, "epoch": 4878} {"train_loss": -7.324405670166016, "global_step": 204885, "epoch": 4878} {"train_loss": -7.309796333312988, "global_step": 204886, "epoch": 4878} {"train_loss": -7.41298770904541, "global_step": 204887, "epoch": 4878} {"train_loss": -7.4288554191589355, "global_step": 204888, "epoch": 4878} {"train_loss": -7.393658638000488, "global_step": 204889, "epoch": 4878} {"train_loss": -7.2746124267578125, "global_step": 204890, "epoch": 4878} {"train_loss": -7.403397560119629, "global_step": 204891, "epoch": 4878} {"train_loss": -7.30327033996582, "global_step": 204892, "epoch": 4878} {"train_loss": -7.1781768798828125, "global_step": 204893, "epoch": 4878} {"train_loss": -7.307174205780029, "global_step": 204894, "epoch": 4878} {"train_loss": -7.466462135314941, "global_step": 204895, "epoch": 4878} {"train_loss": -7.371197700500488, "global_step": 204896, "epoch": 4878} {"train_loss": -7.379899501800537, "global_step": 204897, "epoch": 4878} {"train_loss": -7.293825149536133, "global_step": 204898, "epoch": 4878} {"train_loss": -7.378870010375977, "global_step": 204899, "epoch": 4878} {"train_loss": -7.294976234436035, "global_step": 204900, "epoch": 4878} {"train_loss": -7.292015552520752, "global_step": 204901, "epoch": 4878} {"train_loss": -7.346209526062012, "global_step": 204902, "epoch": 4878} {"train_loss": -7.331693649291992, "global_step": 204903, "epoch": 4878} {"train_loss": -7.345062255859375, "global_step": 204904, "epoch": 4878} {"train_loss": -7.400505542755127, "global_step": 204905, "epoch": 4878} {"train_loss": -7.420448303222656, "global_step": 204906, "epoch": 4878} {"train_loss": -7.355608940124512, "global_step": 204907, "epoch": 4878} {"train_loss": -7.372554779052734, "global_step": 204908, "epoch": 4878} {"train_loss": -7.343753814697266, "global_step": 204909, "epoch": 4878} {"train_loss": -7.308539867401123, "global_step": 204910, "epoch": 4878} {"train_loss": -7.132363319396973, "global_step": 204911, "epoch": 4878} {"train_loss": -7.415002822875977, "global_step": 204912, "epoch": 4878} {"train_loss": -7.276180267333984, "global_step": 204913, "epoch": 4878} {"train_loss": -7.223102569580078, "global_step": 204914, "epoch": 4878} {"train_loss": -7.404869079589844, "global_step": 204915, "epoch": 4878} {"train_loss": -7.188028812408447, "global_step": 204916, "epoch": 4878} {"train_loss": -7.326821667807443, "global_step": 204917, "epoch": 4878, "val_loss": 70142.390625} {"train_loss": -7.2245965003967285, "global_step": 204918, "epoch": 4879} {"train_loss": -7.1322102546691895, "global_step": 204919, "epoch": 4879} {"train_loss": -7.35613489151001, "global_step": 204920, "epoch": 4879} {"train_loss": -7.328238487243652, "global_step": 204921, "epoch": 4879} {"train_loss": -7.362201690673828, "global_step": 204922, "epoch": 4879} {"train_loss": -7.344902992248535, "global_step": 204923, "epoch": 4879} {"train_loss": -7.2896270751953125, "global_step": 204924, "epoch": 4879} {"train_loss": -7.292634010314941, "global_step": 204925, "epoch": 4879} {"train_loss": -7.2903361320495605, "global_step": 204926, "epoch": 4879} {"train_loss": -7.258554458618164, "global_step": 204927, "epoch": 4879} {"train_loss": -7.385095596313477, "global_step": 204928, "epoch": 4879} {"train_loss": -7.35535192489624, "global_step": 204929, "epoch": 4879} {"train_loss": -7.1944355964660645, "global_step": 204930, "epoch": 4879} {"train_loss": -7.3993988037109375, "global_step": 204931, "epoch": 4879} {"train_loss": -7.405550956726074, "global_step": 204932, "epoch": 4879} {"train_loss": -7.261610984802246, "global_step": 204933, "epoch": 4879} {"train_loss": -7.290641784667969, "global_step": 204934, "epoch": 4879} {"train_loss": -7.2339067459106445, "global_step": 204935, "epoch": 4879} {"train_loss": -7.427284240722656, "global_step": 204936, "epoch": 4879} {"train_loss": -7.277668476104736, "global_step": 204937, "epoch": 4879} {"train_loss": -7.364943504333496, "global_step": 204938, "epoch": 4879} {"train_loss": -7.27977180480957, "global_step": 204939, "epoch": 4879} {"train_loss": -7.281534671783447, "global_step": 204940, "epoch": 4879} {"train_loss": -7.324830055236816, "global_step": 204941, "epoch": 4879} {"train_loss": -7.379877090454102, "global_step": 204942, "epoch": 4879} {"train_loss": -7.373177528381348, "global_step": 204943, "epoch": 4879} {"train_loss": -7.306590557098389, "global_step": 204944, "epoch": 4879} {"train_loss": -7.194199085235596, "global_step": 204945, "epoch": 4879} {"train_loss": -7.2686004638671875, "global_step": 204946, "epoch": 4879} {"train_loss": -7.208244323730469, "global_step": 204947, "epoch": 4879} {"train_loss": -7.29448127746582, "global_step": 204948, "epoch": 4879} {"train_loss": -7.150537490844727, "global_step": 204949, "epoch": 4879} {"train_loss": -7.366330146789551, "global_step": 204950, "epoch": 4879} {"train_loss": -7.2677435874938965, "global_step": 204951, "epoch": 4879} {"train_loss": -7.276841163635254, "global_step": 204952, "epoch": 4879} {"train_loss": -7.3260064125061035, "global_step": 204953, "epoch": 4879} {"train_loss": -7.351920127868652, "global_step": 204954, "epoch": 4879} {"train_loss": -7.1614885330200195, "global_step": 204955, "epoch": 4879} {"train_loss": -7.30717658996582, "global_step": 204956, "epoch": 4879} {"train_loss": -7.313968658447266, "global_step": 204957, "epoch": 4879} {"train_loss": -7.220821380615234, "global_step": 204958, "epoch": 4879} {"train_loss": -7.2939673491886685, "global_step": 204959, "epoch": 4879, "val_loss": 70159.1328125} {"train_loss": -7.263364791870117, "global_step": 204960, "epoch": 4880} {"train_loss": -7.35917329788208, "global_step": 204961, "epoch": 4880} {"train_loss": -7.242435932159424, "global_step": 204962, "epoch": 4880} {"train_loss": -7.226917266845703, "global_step": 204963, "epoch": 4880} {"train_loss": -7.216620445251465, "global_step": 204964, "epoch": 4880} {"train_loss": -7.166407585144043, "global_step": 204965, "epoch": 4880} {"train_loss": -7.22641134262085, "global_step": 204966, "epoch": 4880} {"train_loss": -7.194239616394043, "global_step": 204967, "epoch": 4880} {"train_loss": -7.248578071594238, "global_step": 204968, "epoch": 4880} {"train_loss": -7.2673659324646, "global_step": 204969, "epoch": 4880} {"train_loss": -7.188473701477051, "global_step": 204970, "epoch": 4880} {"train_loss": -7.234796524047852, "global_step": 204971, "epoch": 4880} {"train_loss": -7.096792221069336, "global_step": 204972, "epoch": 4880} {"train_loss": -7.22953987121582, "global_step": 204973, "epoch": 4880} {"train_loss": -7.2178144454956055, "global_step": 204974, "epoch": 4880} {"train_loss": -7.082466125488281, "global_step": 204975, "epoch": 4880} {"train_loss": -7.231320381164551, "global_step": 204976, "epoch": 4880} {"train_loss": -7.205203533172607, "global_step": 204977, "epoch": 4880} {"train_loss": -7.274794578552246, "global_step": 204978, "epoch": 4880} {"train_loss": -7.210371017456055, "global_step": 204979, "epoch": 4880} {"train_loss": -7.392939567565918, "global_step": 204980, "epoch": 4880} {"train_loss": -7.290987968444824, "global_step": 204981, "epoch": 4880} {"train_loss": -7.200656890869141, "global_step": 204982, "epoch": 4880} {"train_loss": -7.276024341583252, "global_step": 204983, "epoch": 4880} {"train_loss": -7.1900835037231445, "global_step": 204984, "epoch": 4880} {"train_loss": -7.377035617828369, "global_step": 204985, "epoch": 4880} {"train_loss": -7.155802249908447, "global_step": 204986, "epoch": 4880} {"train_loss": -7.248224258422852, "global_step": 204987, "epoch": 4880} {"train_loss": -7.224199295043945, "global_step": 204988, "epoch": 4880} {"train_loss": -7.339280128479004, "global_step": 204989, "epoch": 4880} {"train_loss": -7.323155403137207, "global_step": 204990, "epoch": 4880} {"train_loss": -7.2523369789123535, "global_step": 204991, "epoch": 4880} {"train_loss": -7.346792221069336, "global_step": 204992, "epoch": 4880} {"train_loss": -7.304723739624023, "global_step": 204993, "epoch": 4880} {"train_loss": -7.270207405090332, "global_step": 204994, "epoch": 4880} {"train_loss": -7.3613810539245605, "global_step": 204995, "epoch": 4880} {"train_loss": -7.282341003417969, "global_step": 204996, "epoch": 4880} {"train_loss": -7.243161201477051, "global_step": 204997, "epoch": 4880} {"train_loss": -7.273380279541016, "global_step": 204998, "epoch": 4880} {"train_loss": -7.348911285400391, "global_step": 204999, "epoch": 4880} {"train_loss": -7.273909568786621, "global_step": 205000, "epoch": 4880} {"train_loss": -7.254541079203288, "global_step": 205001, "epoch": 4880, "val_loss": 70000.46875} {"train_loss": -7.261792182922363, "global_step": 205002, "epoch": 4881} {"train_loss": -7.387090682983398, "global_step": 205003, "epoch": 4881} {"train_loss": -7.327597618103027, "global_step": 205004, "epoch": 4881} {"train_loss": -7.272636413574219, "global_step": 205005, "epoch": 4881} {"train_loss": -7.383769989013672, "global_step": 205006, "epoch": 4881} {"train_loss": -7.267855644226074, "global_step": 205007, "epoch": 4881} {"train_loss": -7.324561595916748, "global_step": 205008, "epoch": 4881} {"train_loss": -7.227492332458496, "global_step": 205009, "epoch": 4881} {"train_loss": -7.330609321594238, "global_step": 205010, "epoch": 4881} {"train_loss": -7.27519416809082, "global_step": 205011, "epoch": 4881} {"train_loss": -7.192190170288086, "global_step": 205012, "epoch": 4881} {"train_loss": -7.338921546936035, "global_step": 205013, "epoch": 4881} {"train_loss": -7.2311906814575195, "global_step": 205014, "epoch": 4881} {"train_loss": -7.163388252258301, "global_step": 205015, "epoch": 4881} {"train_loss": -7.273172378540039, "global_step": 205016, "epoch": 4881} {"train_loss": -7.212547302246094, "global_step": 205017, "epoch": 4881} {"train_loss": -7.279261589050293, "global_step": 205018, "epoch": 4881} {"train_loss": -7.3210129737854, "global_step": 205019, "epoch": 4881} {"train_loss": -7.374698638916016, "global_step": 205020, "epoch": 4881} {"train_loss": -7.293211936950684, "global_step": 205021, "epoch": 4881} {"train_loss": -7.223252296447754, "global_step": 205022, "epoch": 4881} {"train_loss": -7.362844467163086, "global_step": 205023, "epoch": 4881} {"train_loss": -7.332737445831299, "global_step": 205024, "epoch": 4881} {"train_loss": -7.334588527679443, "global_step": 205025, "epoch": 4881} {"train_loss": -7.249109268188477, "global_step": 205026, "epoch": 4881} {"train_loss": -7.307732105255127, "global_step": 205027, "epoch": 4881} {"train_loss": -7.283951282501221, "global_step": 205028, "epoch": 4881} {"train_loss": -7.31272029876709, "global_step": 205029, "epoch": 4881} {"train_loss": -7.207266807556152, "global_step": 205030, "epoch": 4881} {"train_loss": -7.23873233795166, "global_step": 205031, "epoch": 4881} {"train_loss": -7.270749092102051, "global_step": 205032, "epoch": 4881} {"train_loss": -7.3403401374816895, "global_step": 205033, "epoch": 4881} {"train_loss": -7.227256774902344, "global_step": 205034, "epoch": 4881} {"train_loss": -7.334216594696045, "global_step": 205035, "epoch": 4881} {"train_loss": -7.389028549194336, "global_step": 205036, "epoch": 4881} {"train_loss": -7.262934684753418, "global_step": 205037, "epoch": 4881} {"train_loss": -7.343118667602539, "global_step": 205038, "epoch": 4881} {"train_loss": -7.340125560760498, "global_step": 205039, "epoch": 4881} {"train_loss": -7.303366184234619, "global_step": 205040, "epoch": 4881} {"train_loss": -7.294014930725098, "global_step": 205041, "epoch": 4881} {"train_loss": -7.4260406494140625, "global_step": 205042, "epoch": 4881} {"train_loss": -7.293621744428362, "global_step": 205043, "epoch": 4881, "val_loss": 69952.28125} {"train_loss": -7.2816972732543945, "global_step": 205044, "epoch": 4882} {"train_loss": -7.36810827255249, "global_step": 205045, "epoch": 4882} {"train_loss": -7.163913726806641, "global_step": 205046, "epoch": 4882} {"train_loss": -7.2218732833862305, "global_step": 205047, "epoch": 4882} {"train_loss": -7.389681816101074, "global_step": 205048, "epoch": 4882} {"train_loss": -7.292701721191406, "global_step": 205049, "epoch": 4882} {"train_loss": -7.324270248413086, "global_step": 205050, "epoch": 4882} {"train_loss": -7.3026347160339355, "global_step": 205051, "epoch": 4882} {"train_loss": -7.2879109382629395, "global_step": 205052, "epoch": 4882} {"train_loss": -7.304810523986816, "global_step": 205053, "epoch": 4882} {"train_loss": -7.366921424865723, "global_step": 205054, "epoch": 4882} {"train_loss": -7.274875164031982, "global_step": 205055, "epoch": 4882} {"train_loss": -7.2779388427734375, "global_step": 205056, "epoch": 4882} {"train_loss": -7.251540184020996, "global_step": 205057, "epoch": 4882} {"train_loss": -7.407102108001709, "global_step": 205058, "epoch": 4882} {"train_loss": -7.23978328704834, "global_step": 205059, "epoch": 4882} {"train_loss": -7.335739612579346, "global_step": 205060, "epoch": 4882} {"train_loss": -7.289315223693848, "global_step": 205061, "epoch": 4882} {"train_loss": -7.367295742034912, "global_step": 205062, "epoch": 4882} {"train_loss": -7.283563613891602, "global_step": 205063, "epoch": 4882} {"train_loss": -7.253686904907227, "global_step": 205064, "epoch": 4882} {"train_loss": -7.3347015380859375, "global_step": 205065, "epoch": 4882} {"train_loss": -7.317609786987305, "global_step": 205066, "epoch": 4882} {"train_loss": -7.38724422454834, "global_step": 205067, "epoch": 4882} {"train_loss": -7.380282878875732, "global_step": 205068, "epoch": 4882} {"train_loss": -7.279809951782227, "global_step": 205069, "epoch": 4882} {"train_loss": -7.3435821533203125, "global_step": 205070, "epoch": 4882} {"train_loss": -7.326434135437012, "global_step": 205071, "epoch": 4882} {"train_loss": -7.419607162475586, "global_step": 205072, "epoch": 4882} {"train_loss": -7.3614912033081055, "global_step": 205073, "epoch": 4882} {"train_loss": -7.3320698738098145, "global_step": 205074, "epoch": 4882} {"train_loss": -7.350503921508789, "global_step": 205075, "epoch": 4882} {"train_loss": -7.29163122177124, "global_step": 205076, "epoch": 4882} {"train_loss": -7.267076015472412, "global_step": 205077, "epoch": 4882} {"train_loss": -7.266887664794922, "global_step": 205078, "epoch": 4882} {"train_loss": -7.321193695068359, "global_step": 205079, "epoch": 4882} {"train_loss": -7.256841659545898, "global_step": 205080, "epoch": 4882} {"train_loss": -7.333444595336914, "global_step": 205081, "epoch": 4882} {"train_loss": -7.294527530670166, "global_step": 205082, "epoch": 4882} {"train_loss": -7.363766670227051, "global_step": 205083, "epoch": 4882} {"train_loss": -7.272618770599365, "global_step": 205084, "epoch": 4882} {"train_loss": -7.312989530109224, "global_step": 205085, "epoch": 4882, "val_loss": 69905.46875} {"train_loss": -7.3282318115234375, "global_step": 205086, "epoch": 4883} {"train_loss": -7.396610260009766, "global_step": 205087, "epoch": 4883} {"train_loss": -7.355344295501709, "global_step": 205088, "epoch": 4883} {"train_loss": -7.2502288818359375, "global_step": 205089, "epoch": 4883} {"train_loss": -7.305502891540527, "global_step": 205090, "epoch": 4883} {"train_loss": -7.378352165222168, "global_step": 205091, "epoch": 4883} {"train_loss": -7.228445529937744, "global_step": 205092, "epoch": 4883} {"train_loss": -7.427570343017578, "global_step": 205093, "epoch": 4883} {"train_loss": -7.317316055297852, "global_step": 205094, "epoch": 4883} {"train_loss": -7.3307881355285645, "global_step": 205095, "epoch": 4883} {"train_loss": -7.345654487609863, "global_step": 205096, "epoch": 4883} {"train_loss": -7.338712215423584, "global_step": 205097, "epoch": 4883} {"train_loss": -7.22199821472168, "global_step": 205098, "epoch": 4883} {"train_loss": -7.3222737312316895, "global_step": 205099, "epoch": 4883} {"train_loss": -7.316919326782227, "global_step": 205100, "epoch": 4883} {"train_loss": -7.461985111236572, "global_step": 205101, "epoch": 4883} {"train_loss": -7.42749547958374, "global_step": 205102, "epoch": 4883} {"train_loss": -7.363002777099609, "global_step": 205103, "epoch": 4883} {"train_loss": -7.468400955200195, "global_step": 205104, "epoch": 4883} {"train_loss": -7.357142448425293, "global_step": 205105, "epoch": 4883} {"train_loss": -7.3351240158081055, "global_step": 205106, "epoch": 4883} {"train_loss": -7.338304042816162, "global_step": 205107, "epoch": 4883} {"train_loss": -7.338811874389648, "global_step": 205108, "epoch": 4883} {"train_loss": -7.344299793243408, "global_step": 205109, "epoch": 4883} {"train_loss": -7.391806602478027, "global_step": 205110, "epoch": 4883} {"train_loss": -7.334486961364746, "global_step": 205111, "epoch": 4883} {"train_loss": -7.3002824783325195, "global_step": 205112, "epoch": 4883} {"train_loss": -7.351983070373535, "global_step": 205113, "epoch": 4883} {"train_loss": -7.381989479064941, "global_step": 205114, "epoch": 4883} {"train_loss": -7.266397953033447, "global_step": 205115, "epoch": 4883} {"train_loss": -7.345075607299805, "global_step": 205116, "epoch": 4883} {"train_loss": -7.364943981170654, "global_step": 205117, "epoch": 4883} {"train_loss": -7.453245162963867, "global_step": 205118, "epoch": 4883} {"train_loss": -7.362401962280273, "global_step": 205119, "epoch": 4883} {"train_loss": -7.277799606323242, "global_step": 205120, "epoch": 4883} {"train_loss": -7.322343826293945, "global_step": 205121, "epoch": 4883} {"train_loss": -7.302755832672119, "global_step": 205122, "epoch": 4883} {"train_loss": -7.279606819152832, "global_step": 205123, "epoch": 4883} {"train_loss": -7.335028648376465, "global_step": 205124, "epoch": 4883} {"train_loss": -7.3181986808776855, "global_step": 205125, "epoch": 4883} {"train_loss": -7.422055244445801, "global_step": 205126, "epoch": 4883} {"train_loss": -7.3452297278812955, "global_step": 205127, "epoch": 4883, "val_loss": 69820.234375} {"train_loss": -7.341388702392578, "global_step": 205128, "epoch": 4884} {"train_loss": -7.374940395355225, "global_step": 205129, "epoch": 4884} {"train_loss": -7.346769332885742, "global_step": 205130, "epoch": 4884} {"train_loss": -7.447734832763672, "global_step": 205131, "epoch": 4884} {"train_loss": -7.403581619262695, "global_step": 205132, "epoch": 4884} {"train_loss": -7.341904640197754, "global_step": 205133, "epoch": 4884} {"train_loss": -7.39731502532959, "global_step": 205134, "epoch": 4884} {"train_loss": -7.422627925872803, "global_step": 205135, "epoch": 4884} {"train_loss": -7.401390075683594, "global_step": 205136, "epoch": 4884} {"train_loss": -7.485870838165283, "global_step": 205137, "epoch": 4884} {"train_loss": -7.4144744873046875, "global_step": 205138, "epoch": 4884} {"train_loss": -7.396754264831543, "global_step": 205139, "epoch": 4884} {"train_loss": -7.400440216064453, "global_step": 205140, "epoch": 4884} {"train_loss": -7.268898963928223, "global_step": 205141, "epoch": 4884} {"train_loss": -7.3356828689575195, "global_step": 205142, "epoch": 4884} {"train_loss": -7.3046464920043945, "global_step": 205143, "epoch": 4884} {"train_loss": -7.1850762367248535, "global_step": 205144, "epoch": 4884} {"train_loss": -7.2183427810668945, "global_step": 205145, "epoch": 4884} {"train_loss": -7.308685779571533, "global_step": 205146, "epoch": 4884} {"train_loss": -7.116630554199219, "global_step": 205147, "epoch": 4884} {"train_loss": -7.10391902923584, "global_step": 205148, "epoch": 4884} {"train_loss": -7.481733322143555, "global_step": 205149, "epoch": 4884} {"train_loss": -7.371064186096191, "global_step": 205150, "epoch": 4884} {"train_loss": -7.2204813957214355, "global_step": 205151, "epoch": 4884} {"train_loss": -7.396332740783691, "global_step": 205152, "epoch": 4884} {"train_loss": -7.169538497924805, "global_step": 205153, "epoch": 4884} {"train_loss": -7.223845958709717, "global_step": 205154, "epoch": 4884} {"train_loss": -7.183116912841797, "global_step": 205155, "epoch": 4884} {"train_loss": -7.170068740844727, "global_step": 205156, "epoch": 4884} {"train_loss": -7.286486625671387, "global_step": 205157, "epoch": 4884} {"train_loss": -7.025484561920166, "global_step": 205158, "epoch": 4884} {"train_loss": -7.1199541091918945, "global_step": 205159, "epoch": 4884} {"train_loss": -7.0783467292785645, "global_step": 205160, "epoch": 4884} {"train_loss": -7.095692157745361, "global_step": 205161, "epoch": 4884} {"train_loss": -7.270882606506348, "global_step": 205162, "epoch": 4884} {"train_loss": -7.048341274261475, "global_step": 205163, "epoch": 4884} {"train_loss": -7.4111175537109375, "global_step": 205164, "epoch": 4884} {"train_loss": -7.144613742828369, "global_step": 205165, "epoch": 4884} {"train_loss": -7.307179927825928, "global_step": 205166, "epoch": 4884} {"train_loss": -7.219504356384277, "global_step": 205167, "epoch": 4884} {"train_loss": -7.185714244842529, "global_step": 205168, "epoch": 4884} {"train_loss": -7.276326906113398, "global_step": 205169, "epoch": 4884, "val_loss": 70020.4609375} {"train_loss": -7.400908470153809, "global_step": 205170, "epoch": 4885} {"train_loss": -7.224163055419922, "global_step": 205171, "epoch": 4885} {"train_loss": -7.376290321350098, "global_step": 205172, "epoch": 4885} {"train_loss": -7.227339267730713, "global_step": 205173, "epoch": 4885} {"train_loss": -7.306872844696045, "global_step": 205174, "epoch": 4885} {"train_loss": -7.204380989074707, "global_step": 205175, "epoch": 4885} {"train_loss": -7.2181196212768555, "global_step": 205176, "epoch": 4885} {"train_loss": -7.2288713455200195, "global_step": 205177, "epoch": 4885} {"train_loss": -7.283945083618164, "global_step": 205178, "epoch": 4885} {"train_loss": -7.191947937011719, "global_step": 205179, "epoch": 4885} {"train_loss": -7.215597152709961, "global_step": 205180, "epoch": 4885} {"train_loss": -7.3687520027160645, "global_step": 205181, "epoch": 4885} {"train_loss": -7.172830104827881, "global_step": 205182, "epoch": 4885} {"train_loss": -7.206611633300781, "global_step": 205183, "epoch": 4885} {"train_loss": -7.278683662414551, "global_step": 205184, "epoch": 4885} {"train_loss": -7.150331974029541, "global_step": 205185, "epoch": 4885} {"train_loss": -7.306202411651611, "global_step": 205186, "epoch": 4885} {"train_loss": -7.26171875, "global_step": 205187, "epoch": 4885} {"train_loss": -7.135215759277344, "global_step": 205188, "epoch": 4885} {"train_loss": -7.096296310424805, "global_step": 205189, "epoch": 4885} {"train_loss": -7.242486953735352, "global_step": 205190, "epoch": 4885} {"train_loss": -7.136916160583496, "global_step": 205191, "epoch": 4885} {"train_loss": -7.153985500335693, "global_step": 205192, "epoch": 4885} {"train_loss": -7.096091270446777, "global_step": 205193, "epoch": 4885} {"train_loss": -7.19423770904541, "global_step": 205194, "epoch": 4885} {"train_loss": -7.108926296234131, "global_step": 205195, "epoch": 4885} {"train_loss": -7.177243232727051, "global_step": 205196, "epoch": 4885} {"train_loss": -7.18599796295166, "global_step": 205197, "epoch": 4885} {"train_loss": -7.024934768676758, "global_step": 205198, "epoch": 4885} {"train_loss": -7.138815879821777, "global_step": 205199, "epoch": 4885} {"train_loss": -7.267423152923584, "global_step": 205200, "epoch": 4885} {"train_loss": -7.219542026519775, "global_step": 205201, "epoch": 4885} {"train_loss": -7.2092719078063965, "global_step": 205202, "epoch": 4885} {"train_loss": -7.195953845977783, "global_step": 205203, "epoch": 4885} {"train_loss": -7.158571243286133, "global_step": 205204, "epoch": 4885} {"train_loss": -7.2398295402526855, "global_step": 205205, "epoch": 4885} {"train_loss": -7.209194183349609, "global_step": 205206, "epoch": 4885} {"train_loss": -7.229823589324951, "global_step": 205207, "epoch": 4885} {"train_loss": -7.403302192687988, "global_step": 205208, "epoch": 4885} {"train_loss": -7.246756553649902, "global_step": 205209, "epoch": 4885} {"train_loss": -7.339878559112549, "global_step": 205210, "epoch": 4885} {"train_loss": -7.222819033123198, "global_step": 205211, "epoch": 4885, "val_loss": 69892.8828125} {"train_loss": -7.326401710510254, "global_step": 205212, "epoch": 4886} {"train_loss": -7.331570625305176, "global_step": 205213, "epoch": 4886} {"train_loss": -7.328081130981445, "global_step": 205214, "epoch": 4886} {"train_loss": -7.321048736572266, "global_step": 205215, "epoch": 4886} {"train_loss": -7.248239040374756, "global_step": 205216, "epoch": 4886} {"train_loss": -7.469442367553711, "global_step": 205217, "epoch": 4886} {"train_loss": -7.246358871459961, "global_step": 205218, "epoch": 4886} {"train_loss": -7.302093982696533, "global_step": 205219, "epoch": 4886} {"train_loss": -7.253952980041504, "global_step": 205220, "epoch": 4886} {"train_loss": -7.370655059814453, "global_step": 205221, "epoch": 4886} {"train_loss": -7.4415602684021, "global_step": 205222, "epoch": 4886} {"train_loss": -7.398707389831543, "global_step": 205223, "epoch": 4886} {"train_loss": -7.3018670082092285, "global_step": 205224, "epoch": 4886} {"train_loss": -7.262801647186279, "global_step": 205225, "epoch": 4886} {"train_loss": -7.431393623352051, "global_step": 205226, "epoch": 4886} {"train_loss": -7.365062713623047, "global_step": 205227, "epoch": 4886} {"train_loss": -7.364068984985352, "global_step": 205228, "epoch": 4886} {"train_loss": -7.2063727378845215, "global_step": 205229, "epoch": 4886} {"train_loss": -7.364567279815674, "global_step": 205230, "epoch": 4886} {"train_loss": -7.3353681564331055, "global_step": 205231, "epoch": 4886} {"train_loss": -7.3930487632751465, "global_step": 205232, "epoch": 4886} {"train_loss": -7.464565277099609, "global_step": 205233, "epoch": 4886} {"train_loss": -7.4411091804504395, "global_step": 205234, "epoch": 4886} {"train_loss": -7.361361503601074, "global_step": 205235, "epoch": 4886} {"train_loss": -7.3447065353393555, "global_step": 205236, "epoch": 4886} {"train_loss": -7.206577301025391, "global_step": 205237, "epoch": 4886} {"train_loss": -7.318562030792236, "global_step": 205238, "epoch": 4886} {"train_loss": -7.292364120483398, "global_step": 205239, "epoch": 4886} {"train_loss": -7.295955657958984, "global_step": 205240, "epoch": 4886} {"train_loss": -7.3519673347473145, "global_step": 205241, "epoch": 4886} {"train_loss": -7.311617851257324, "global_step": 205242, "epoch": 4886} {"train_loss": -7.172698020935059, "global_step": 205243, "epoch": 4886} {"train_loss": -7.272918701171875, "global_step": 205244, "epoch": 4886} {"train_loss": -7.273625373840332, "global_step": 205245, "epoch": 4886} {"train_loss": -7.165532112121582, "global_step": 205246, "epoch": 4886} {"train_loss": -7.290507793426514, "global_step": 205247, "epoch": 4886} {"train_loss": -7.304847240447998, "global_step": 205248, "epoch": 4886} {"train_loss": -7.257919788360596, "global_step": 205249, "epoch": 4886} {"train_loss": -7.270990371704102, "global_step": 205250, "epoch": 4886} {"train_loss": -7.36405086517334, "global_step": 205251, "epoch": 4886} {"train_loss": -7.3928351402282715, "global_step": 205252, "epoch": 4886} {"train_loss": -7.3213525386083695, "global_step": 205253, "epoch": 4886, "val_loss": 70074.921875} {"train_loss": -7.294737815856934, "global_step": 205254, "epoch": 4887} {"train_loss": -7.301051139831543, "global_step": 205255, "epoch": 4887} {"train_loss": -7.35122013092041, "global_step": 205256, "epoch": 4887} {"train_loss": -7.328341960906982, "global_step": 205257, "epoch": 4887} {"train_loss": -7.213042259216309, "global_step": 205258, "epoch": 4887} {"train_loss": -7.282524108886719, "global_step": 205259, "epoch": 4887} {"train_loss": -7.239561557769775, "global_step": 205260, "epoch": 4887} {"train_loss": -7.334939479827881, "global_step": 205261, "epoch": 4887} {"train_loss": -7.175232887268066, "global_step": 205262, "epoch": 4887} {"train_loss": -7.230920791625977, "global_step": 205263, "epoch": 4887} {"train_loss": -7.264137268066406, "global_step": 205264, "epoch": 4887} {"train_loss": -7.199271202087402, "global_step": 205265, "epoch": 4887} {"train_loss": -7.255647659301758, "global_step": 205266, "epoch": 4887} {"train_loss": -7.170407772064209, "global_step": 205267, "epoch": 4887} {"train_loss": -7.178584098815918, "global_step": 205268, "epoch": 4887} {"train_loss": -7.263484954833984, "global_step": 205269, "epoch": 4887} {"train_loss": -7.244421005249023, "global_step": 205270, "epoch": 4887} {"train_loss": -7.252295970916748, "global_step": 205271, "epoch": 4887} {"train_loss": -7.310857772827148, "global_step": 205272, "epoch": 4887} {"train_loss": -7.331366062164307, "global_step": 205273, "epoch": 4887} {"train_loss": -7.425154685974121, "global_step": 205274, "epoch": 4887} {"train_loss": -7.40474796295166, "global_step": 205275, "epoch": 4887} {"train_loss": -7.35759973526001, "global_step": 205276, "epoch": 4887} {"train_loss": -7.372539520263672, "global_step": 205277, "epoch": 4887} {"train_loss": -7.231980323791504, "global_step": 205278, "epoch": 4887} {"train_loss": -7.3389153480529785, "global_step": 205279, "epoch": 4887} {"train_loss": -7.395469665527344, "global_step": 205280, "epoch": 4887} {"train_loss": -7.346079349517822, "global_step": 205281, "epoch": 4887} {"train_loss": -7.360221862792969, "global_step": 205282, "epoch": 4887} {"train_loss": -7.41003942489624, "global_step": 205283, "epoch": 4887} {"train_loss": -7.339227676391602, "global_step": 205284, "epoch": 4887} {"train_loss": -7.260825157165527, "global_step": 205285, "epoch": 4887} {"train_loss": -7.307074069976807, "global_step": 205286, "epoch": 4887} {"train_loss": -7.299809455871582, "global_step": 205287, "epoch": 4887} {"train_loss": -7.26971435546875, "global_step": 205288, "epoch": 4887} {"train_loss": -7.2754011154174805, "global_step": 205289, "epoch": 4887} {"train_loss": -7.37782096862793, "global_step": 205290, "epoch": 4887} {"train_loss": -7.3817458152771, "global_step": 205291, "epoch": 4887} {"train_loss": -7.365288734436035, "global_step": 205292, "epoch": 4887} {"train_loss": -7.473217010498047, "global_step": 205293, "epoch": 4887} {"train_loss": -7.221689224243164, "global_step": 205294, "epoch": 4887} {"train_loss": -7.303431987762451, "global_step": 205295, "epoch": 4887, "val_loss": 69934.15625} {"train_loss": -7.474123477935791, "global_step": 205296, "epoch": 4888} {"train_loss": -7.340061187744141, "global_step": 205297, "epoch": 4888} {"train_loss": -7.2565813064575195, "global_step": 205298, "epoch": 4888} {"train_loss": -7.361417293548584, "global_step": 205299, "epoch": 4888} {"train_loss": -7.311811447143555, "global_step": 205300, "epoch": 4888} {"train_loss": -7.340883255004883, "global_step": 205301, "epoch": 4888} {"train_loss": -7.473748683929443, "global_step": 205302, "epoch": 4888} {"train_loss": -7.293308258056641, "global_step": 205303, "epoch": 4888} {"train_loss": -7.138585567474365, "global_step": 205304, "epoch": 4888} {"train_loss": -7.265287399291992, "global_step": 205305, "epoch": 4888} {"train_loss": -7.215414524078369, "global_step": 205306, "epoch": 4888} {"train_loss": -7.330822944641113, "global_step": 205307, "epoch": 4888} {"train_loss": -7.326227188110352, "global_step": 205308, "epoch": 4888} {"train_loss": -7.28752326965332, "global_step": 205309, "epoch": 4888} {"train_loss": -7.351207733154297, "global_step": 205310, "epoch": 4888} {"train_loss": -7.190010070800781, "global_step": 205311, "epoch": 4888} {"train_loss": -7.173554420471191, "global_step": 205312, "epoch": 4888} {"train_loss": -7.218322277069092, "global_step": 205313, "epoch": 4888} {"train_loss": -7.264735221862793, "global_step": 205314, "epoch": 4888} {"train_loss": -7.378544330596924, "global_step": 205315, "epoch": 4888} {"train_loss": -7.339369773864746, "global_step": 205316, "epoch": 4888} {"train_loss": -7.29332971572876, "global_step": 205317, "epoch": 4888} {"train_loss": -7.284729480743408, "global_step": 205318, "epoch": 4888} {"train_loss": -7.276023864746094, "global_step": 205319, "epoch": 4888} {"train_loss": -7.24171781539917, "global_step": 205320, "epoch": 4888} {"train_loss": -7.30441427230835, "global_step": 205321, "epoch": 4888} {"train_loss": -7.213197708129883, "global_step": 205322, "epoch": 4888} {"train_loss": -7.284090042114258, "global_step": 205323, "epoch": 4888} {"train_loss": -7.351605415344238, "global_step": 205324, "epoch": 4888} {"train_loss": -7.358771324157715, "global_step": 205325, "epoch": 4888} {"train_loss": -7.292628765106201, "global_step": 205326, "epoch": 4888} {"train_loss": -7.33760929107666, "global_step": 205327, "epoch": 4888} {"train_loss": -7.287486553192139, "global_step": 205328, "epoch": 4888} {"train_loss": -7.433865547180176, "global_step": 205329, "epoch": 4888} {"train_loss": -7.334468364715576, "global_step": 205330, "epoch": 4888} {"train_loss": -7.306994438171387, "global_step": 205331, "epoch": 4888} {"train_loss": -7.414143085479736, "global_step": 205332, "epoch": 4888} {"train_loss": -7.355268478393555, "global_step": 205333, "epoch": 4888} {"train_loss": -7.33343505859375, "global_step": 205334, "epoch": 4888} {"train_loss": -7.400056838989258, "global_step": 205335, "epoch": 4888} {"train_loss": -7.280495643615723, "global_step": 205336, "epoch": 4888} {"train_loss": -7.313150076639085, "global_step": 205337, "epoch": 4888, "val_loss": 70000.1640625} {"train_loss": -7.430831432342529, "global_step": 205338, "epoch": 4889} {"train_loss": -7.462090015411377, "global_step": 205339, "epoch": 4889} {"train_loss": -7.371626853942871, "global_step": 205340, "epoch": 4889} {"train_loss": -7.357725620269775, "global_step": 205341, "epoch": 4889} {"train_loss": -7.378435134887695, "global_step": 205342, "epoch": 4889} {"train_loss": -7.255864143371582, "global_step": 205343, "epoch": 4889} {"train_loss": -7.221469879150391, "global_step": 205344, "epoch": 4889} {"train_loss": -7.36935567855835, "global_step": 205345, "epoch": 4889} {"train_loss": -7.299703598022461, "global_step": 205346, "epoch": 4889} {"train_loss": -7.356396675109863, "global_step": 205347, "epoch": 4889} {"train_loss": -7.277860164642334, "global_step": 205348, "epoch": 4889} {"train_loss": -7.389553070068359, "global_step": 205349, "epoch": 4889} {"train_loss": -7.2801289558410645, "global_step": 205350, "epoch": 4889} {"train_loss": -7.3585968017578125, "global_step": 205351, "epoch": 4889} {"train_loss": -7.344595432281494, "global_step": 205352, "epoch": 4889} {"train_loss": -7.332637786865234, "global_step": 205353, "epoch": 4889} {"train_loss": -7.412371635437012, "global_step": 205354, "epoch": 4889} {"train_loss": -7.360821723937988, "global_step": 205355, "epoch": 4889} {"train_loss": -7.315249443054199, "global_step": 205356, "epoch": 4889} {"train_loss": -7.333605766296387, "global_step": 205357, "epoch": 4889} {"train_loss": -7.345442771911621, "global_step": 205358, "epoch": 4889} {"train_loss": -7.499795436859131, "global_step": 205359, "epoch": 4889} {"train_loss": -7.464835166931152, "global_step": 205360, "epoch": 4889} {"train_loss": -7.355618953704834, "global_step": 205361, "epoch": 4889} {"train_loss": -7.275713920593262, "global_step": 205362, "epoch": 4889} {"train_loss": -7.295363903045654, "global_step": 205363, "epoch": 4889} {"train_loss": -7.254606246948242, "global_step": 205364, "epoch": 4889} {"train_loss": -7.346602439880371, "global_step": 205365, "epoch": 4889} {"train_loss": -7.288873672485352, "global_step": 205366, "epoch": 4889} {"train_loss": -7.2945990562438965, "global_step": 205367, "epoch": 4889} {"train_loss": -7.395787715911865, "global_step": 205368, "epoch": 4889} {"train_loss": -7.468122482299805, "global_step": 205369, "epoch": 4889} {"train_loss": -7.378172874450684, "global_step": 205370, "epoch": 4889} {"train_loss": -7.441710472106934, "global_step": 205371, "epoch": 4889} {"train_loss": -7.353346824645996, "global_step": 205372, "epoch": 4889} {"train_loss": -7.2625732421875, "global_step": 205373, "epoch": 4889} {"train_loss": -7.384424686431885, "global_step": 205374, "epoch": 4889} {"train_loss": -7.266696453094482, "global_step": 205375, "epoch": 4889} {"train_loss": -7.339469909667969, "global_step": 205376, "epoch": 4889} {"train_loss": -7.188482284545898, "global_step": 205377, "epoch": 4889} {"train_loss": -7.248283386230469, "global_step": 205378, "epoch": 4889} {"train_loss": -7.341651030949184, "global_step": 205379, "epoch": 4889, "val_loss": 70092.3515625} {"train_loss": -7.1952643394470215, "global_step": 205380, "epoch": 4890} {"train_loss": -7.358697891235352, "global_step": 205381, "epoch": 4890} {"train_loss": -7.268117427825928, "global_step": 205382, "epoch": 4890} {"train_loss": -7.24710750579834, "global_step": 205383, "epoch": 4890} {"train_loss": -7.3257527351379395, "global_step": 205384, "epoch": 4890} {"train_loss": -7.218961238861084, "global_step": 205385, "epoch": 4890} {"train_loss": -7.292089462280273, "global_step": 205386, "epoch": 4890} {"train_loss": -7.185637474060059, "global_step": 205387, "epoch": 4890} {"train_loss": -7.261092662811279, "global_step": 205388, "epoch": 4890} {"train_loss": -7.3072052001953125, "global_step": 205389, "epoch": 4890} {"train_loss": -7.303213596343994, "global_step": 205390, "epoch": 4890} {"train_loss": -7.260268688201904, "global_step": 205391, "epoch": 4890} {"train_loss": -7.259007453918457, "global_step": 205392, "epoch": 4890} {"train_loss": -7.193447113037109, "global_step": 205393, "epoch": 4890} {"train_loss": -7.105806350708008, "global_step": 205394, "epoch": 4890} {"train_loss": -7.321872234344482, "global_step": 205395, "epoch": 4890} {"train_loss": -7.253861427307129, "global_step": 205396, "epoch": 4890} {"train_loss": -7.263744354248047, "global_step": 205397, "epoch": 4890} {"train_loss": -7.281091690063477, "global_step": 205398, "epoch": 4890} {"train_loss": -7.281136512756348, "global_step": 205399, "epoch": 4890} {"train_loss": -7.2378740310668945, "global_step": 205400, "epoch": 4890} {"train_loss": -7.314205169677734, "global_step": 205401, "epoch": 4890} {"train_loss": -7.323789596557617, "global_step": 205402, "epoch": 4890} {"train_loss": -7.231044769287109, "global_step": 205403, "epoch": 4890} {"train_loss": -7.2334089279174805, "global_step": 205404, "epoch": 4890} {"train_loss": -7.293194770812988, "global_step": 205405, "epoch": 4890} {"train_loss": -7.210195541381836, "global_step": 205406, "epoch": 4890} {"train_loss": -7.347823619842529, "global_step": 205407, "epoch": 4890} {"train_loss": -7.283713340759277, "global_step": 205408, "epoch": 4890} {"train_loss": -7.310165882110596, "global_step": 205409, "epoch": 4890} {"train_loss": -7.356166839599609, "global_step": 205410, "epoch": 4890} {"train_loss": -7.279953956604004, "global_step": 205411, "epoch": 4890} {"train_loss": -7.302966117858887, "global_step": 205412, "epoch": 4890} {"train_loss": -7.238739967346191, "global_step": 205413, "epoch": 4890} {"train_loss": -7.40260124206543, "global_step": 205414, "epoch": 4890} {"train_loss": -7.209298133850098, "global_step": 205415, "epoch": 4890} {"train_loss": -7.318149089813232, "global_step": 205416, "epoch": 4890} {"train_loss": -7.282922744750977, "global_step": 205417, "epoch": 4890} {"train_loss": -7.361915588378906, "global_step": 205418, "epoch": 4890} {"train_loss": -7.25853157043457, "global_step": 205419, "epoch": 4890} {"train_loss": -7.214847564697266, "global_step": 205420, "epoch": 4890} {"train_loss": -7.275325729733422, "global_step": 205421, "epoch": 4890, "val_loss": 69857.3203125} {"train_loss": -7.358550071716309, "global_step": 205422, "epoch": 4891} {"train_loss": -7.278512001037598, "global_step": 205423, "epoch": 4891} {"train_loss": -7.261399745941162, "global_step": 205424, "epoch": 4891} {"train_loss": -7.2937421798706055, "global_step": 205425, "epoch": 4891} {"train_loss": -7.352240562438965, "global_step": 205426, "epoch": 4891} {"train_loss": -7.380622863769531, "global_step": 205427, "epoch": 4891} {"train_loss": -7.322380542755127, "global_step": 205428, "epoch": 4891} {"train_loss": -7.299516677856445, "global_step": 205429, "epoch": 4891} {"train_loss": -7.284143447875977, "global_step": 205430, "epoch": 4891} {"train_loss": -7.241182327270508, "global_step": 205431, "epoch": 4891} {"train_loss": -7.284379005432129, "global_step": 205432, "epoch": 4891} {"train_loss": -7.350006103515625, "global_step": 205433, "epoch": 4891} {"train_loss": -7.329800605773926, "global_step": 205434, "epoch": 4891} {"train_loss": -7.312740325927734, "global_step": 205435, "epoch": 4891} {"train_loss": -7.219764709472656, "global_step": 205436, "epoch": 4891} {"train_loss": -7.309800624847412, "global_step": 205437, "epoch": 4891} {"train_loss": -7.205417633056641, "global_step": 205438, "epoch": 4891} {"train_loss": -7.319362163543701, "global_step": 205439, "epoch": 4891} {"train_loss": -7.2613654136657715, "global_step": 205440, "epoch": 4891} {"train_loss": -7.311429977416992, "global_step": 205441, "epoch": 4891} {"train_loss": -7.264946937561035, "global_step": 205442, "epoch": 4891} {"train_loss": -7.344071388244629, "global_step": 205443, "epoch": 4891} {"train_loss": -7.304509162902832, "global_step": 205444, "epoch": 4891} {"train_loss": -7.326442241668701, "global_step": 205445, "epoch": 4891} {"train_loss": -7.257449150085449, "global_step": 205446, "epoch": 4891} {"train_loss": -7.338314056396484, "global_step": 205447, "epoch": 4891} {"train_loss": -7.309005260467529, "global_step": 205448, "epoch": 4891} {"train_loss": -7.368992805480957, "global_step": 205449, "epoch": 4891} {"train_loss": -7.21543550491333, "global_step": 205450, "epoch": 4891} {"train_loss": -7.362534523010254, "global_step": 205451, "epoch": 4891} {"train_loss": -7.254592418670654, "global_step": 205452, "epoch": 4891} {"train_loss": -7.263600826263428, "global_step": 205453, "epoch": 4891} {"train_loss": -7.251696586608887, "global_step": 205454, "epoch": 4891} {"train_loss": -7.2347822189331055, "global_step": 205455, "epoch": 4891} {"train_loss": -7.433620452880859, "global_step": 205456, "epoch": 4891} {"train_loss": -7.393408298492432, "global_step": 205457, "epoch": 4891} {"train_loss": -7.409719944000244, "global_step": 205458, "epoch": 4891} {"train_loss": -7.330739974975586, "global_step": 205459, "epoch": 4891} {"train_loss": -7.420924186706543, "global_step": 205460, "epoch": 4891} {"train_loss": -7.225513935089111, "global_step": 205461, "epoch": 4891} {"train_loss": -7.141267776489258, "global_step": 205462, "epoch": 4891} {"train_loss": -7.303244920003982, "global_step": 205463, "epoch": 4891, "val_loss": 69993.3828125} {"train_loss": -7.26645565032959, "global_step": 205464, "epoch": 4892} {"train_loss": -7.177960395812988, "global_step": 205465, "epoch": 4892} {"train_loss": -7.3309454917907715, "global_step": 205466, "epoch": 4892} {"train_loss": -7.298213958740234, "global_step": 205467, "epoch": 4892} {"train_loss": -7.410851955413818, "global_step": 205468, "epoch": 4892} {"train_loss": -7.375331401824951, "global_step": 205469, "epoch": 4892} {"train_loss": -7.296210289001465, "global_step": 205470, "epoch": 4892} {"train_loss": -7.313836097717285, "global_step": 205471, "epoch": 4892} {"train_loss": -7.287849426269531, "global_step": 205472, "epoch": 4892} {"train_loss": -7.345614433288574, "global_step": 205473, "epoch": 4892} {"train_loss": -7.370937347412109, "global_step": 205474, "epoch": 4892} {"train_loss": -7.333726406097412, "global_step": 205475, "epoch": 4892} {"train_loss": -7.261907577514648, "global_step": 205476, "epoch": 4892} {"train_loss": -7.223983287811279, "global_step": 205477, "epoch": 4892} {"train_loss": -7.268747329711914, "global_step": 205478, "epoch": 4892} {"train_loss": -7.199599266052246, "global_step": 205479, "epoch": 4892} {"train_loss": -7.23452091217041, "global_step": 205480, "epoch": 4892} {"train_loss": -7.224505424499512, "global_step": 205481, "epoch": 4892} {"train_loss": -7.2130126953125, "global_step": 205482, "epoch": 4892} {"train_loss": -7.201267719268799, "global_step": 205483, "epoch": 4892} {"train_loss": -7.322869777679443, "global_step": 205484, "epoch": 4892} {"train_loss": -7.146303653717041, "global_step": 205485, "epoch": 4892} {"train_loss": -7.156774044036865, "global_step": 205486, "epoch": 4892} {"train_loss": -7.299520015716553, "global_step": 205487, "epoch": 4892} {"train_loss": -7.189644813537598, "global_step": 205488, "epoch": 4892} {"train_loss": -7.219609260559082, "global_step": 205489, "epoch": 4892} {"train_loss": -7.297101020812988, "global_step": 205490, "epoch": 4892} {"train_loss": -7.161982536315918, "global_step": 205491, "epoch": 4892} {"train_loss": -7.297501087188721, "global_step": 205492, "epoch": 4892} {"train_loss": -7.209824562072754, "global_step": 205493, "epoch": 4892} {"train_loss": -7.224133014678955, "global_step": 205494, "epoch": 4892} {"train_loss": -7.233007431030273, "global_step": 205495, "epoch": 4892} {"train_loss": -7.152803897857666, "global_step": 205496, "epoch": 4892} {"train_loss": -7.293401718139648, "global_step": 205497, "epoch": 4892} {"train_loss": -7.204075813293457, "global_step": 205498, "epoch": 4892} {"train_loss": -7.2119221687316895, "global_step": 205499, "epoch": 4892} {"train_loss": -7.2171478271484375, "global_step": 205500, "epoch": 4892} {"train_loss": -7.274924278259277, "global_step": 205501, "epoch": 4892} {"train_loss": -7.298735618591309, "global_step": 205502, "epoch": 4892} {"train_loss": -7.294355392456055, "global_step": 205503, "epoch": 4892} {"train_loss": -7.290072441101074, "global_step": 205504, "epoch": 4892} {"train_loss": -7.259750093732562, "global_step": 205505, "epoch": 4892, "val_loss": 70090.671875} {"train_loss": -7.31318473815918, "global_step": 205506, "epoch": 4893} {"train_loss": -7.246262550354004, "global_step": 205507, "epoch": 4893} {"train_loss": -7.226754665374756, "global_step": 205508, "epoch": 4893} {"train_loss": -7.159083366394043, "global_step": 205509, "epoch": 4893} {"train_loss": -7.242719650268555, "global_step": 205510, "epoch": 4893} {"train_loss": -7.305009841918945, "global_step": 205511, "epoch": 4893} {"train_loss": -7.20345401763916, "global_step": 205512, "epoch": 4893} {"train_loss": -7.244565963745117, "global_step": 205513, "epoch": 4893} {"train_loss": -7.140687465667725, "global_step": 205514, "epoch": 4893} {"train_loss": -7.1447296142578125, "global_step": 205515, "epoch": 4893} {"train_loss": -7.142647743225098, "global_step": 205516, "epoch": 4893} {"train_loss": -7.051879405975342, "global_step": 205517, "epoch": 4893} {"train_loss": -7.301332473754883, "global_step": 205518, "epoch": 4893} {"train_loss": -7.258222579956055, "global_step": 205519, "epoch": 4893} {"train_loss": -7.20930814743042, "global_step": 205520, "epoch": 4893} {"train_loss": -7.3509111404418945, "global_step": 205521, "epoch": 4893} {"train_loss": -7.282107353210449, "global_step": 205522, "epoch": 4893} {"train_loss": -7.397449493408203, "global_step": 205523, "epoch": 4893} {"train_loss": -7.265212059020996, "global_step": 205524, "epoch": 4893} {"train_loss": -7.211366653442383, "global_step": 205525, "epoch": 4893} {"train_loss": -7.262474060058594, "global_step": 205526, "epoch": 4893} {"train_loss": -7.225814342498779, "global_step": 205527, "epoch": 4893} {"train_loss": -7.33775520324707, "global_step": 205528, "epoch": 4893} {"train_loss": -7.307195663452148, "global_step": 205529, "epoch": 4893} {"train_loss": -7.3390350341796875, "global_step": 205530, "epoch": 4893} {"train_loss": -7.307538986206055, "global_step": 205531, "epoch": 4893} {"train_loss": -7.299150466918945, "global_step": 205532, "epoch": 4893} {"train_loss": -7.20461368560791, "global_step": 205533, "epoch": 4893} {"train_loss": -7.32745885848999, "global_step": 205534, "epoch": 4893} {"train_loss": -7.410140514373779, "global_step": 205535, "epoch": 4893} {"train_loss": -7.338406562805176, "global_step": 205536, "epoch": 4893} {"train_loss": -7.275904655456543, "global_step": 205537, "epoch": 4893} {"train_loss": -7.275875091552734, "global_step": 205538, "epoch": 4893} {"train_loss": -7.315473556518555, "global_step": 205539, "epoch": 4893} {"train_loss": -7.424237251281738, "global_step": 205540, "epoch": 4893} {"train_loss": -7.163651466369629, "global_step": 205541, "epoch": 4893} {"train_loss": -7.307209014892578, "global_step": 205542, "epoch": 4893} {"train_loss": -7.146692276000977, "global_step": 205543, "epoch": 4893} {"train_loss": -7.232427597045898, "global_step": 205544, "epoch": 4893} {"train_loss": -7.338840484619141, "global_step": 205545, "epoch": 4893} {"train_loss": -7.305298328399658, "global_step": 205546, "epoch": 4893} {"train_loss": -7.2655517146700905, "global_step": 205547, "epoch": 4893, "val_loss": 69895.7421875} {"train_loss": -7.345688819885254, "global_step": 205548, "epoch": 4894} {"train_loss": -7.1758713722229, "global_step": 205549, "epoch": 4894} {"train_loss": -7.370880603790283, "global_step": 205550, "epoch": 4894} {"train_loss": -7.265273094177246, "global_step": 205551, "epoch": 4894} {"train_loss": -7.379812717437744, "global_step": 205552, "epoch": 4894} {"train_loss": -7.365313529968262, "global_step": 205553, "epoch": 4894} {"train_loss": -7.244729042053223, "global_step": 205554, "epoch": 4894} {"train_loss": -7.302340507507324, "global_step": 205555, "epoch": 4894} {"train_loss": -7.421723365783691, "global_step": 205556, "epoch": 4894} {"train_loss": -7.366274356842041, "global_step": 205557, "epoch": 4894} {"train_loss": -7.355504035949707, "global_step": 205558, "epoch": 4894} {"train_loss": -7.2770538330078125, "global_step": 205559, "epoch": 4894} {"train_loss": -7.450203895568848, "global_step": 205560, "epoch": 4894} {"train_loss": -7.342061996459961, "global_step": 205561, "epoch": 4894} {"train_loss": -7.319399833679199, "global_step": 205562, "epoch": 4894} {"train_loss": -7.410526275634766, "global_step": 205563, "epoch": 4894} {"train_loss": -7.338220119476318, "global_step": 205564, "epoch": 4894} {"train_loss": -7.374922752380371, "global_step": 205565, "epoch": 4894} {"train_loss": -7.231952667236328, "global_step": 205566, "epoch": 4894} {"train_loss": -7.2915802001953125, "global_step": 205567, "epoch": 4894} {"train_loss": -7.353564262390137, "global_step": 205568, "epoch": 4894} {"train_loss": -7.159762382507324, "global_step": 205569, "epoch": 4894} {"train_loss": -7.3482279777526855, "global_step": 205570, "epoch": 4894} {"train_loss": -7.299467086791992, "global_step": 205571, "epoch": 4894} {"train_loss": -7.207924842834473, "global_step": 205572, "epoch": 4894} {"train_loss": -7.359954357147217, "global_step": 205573, "epoch": 4894} {"train_loss": -7.207193374633789, "global_step": 205574, "epoch": 4894} {"train_loss": -7.3232741355896, "global_step": 205575, "epoch": 4894} {"train_loss": -7.275540351867676, "global_step": 205576, "epoch": 4894} {"train_loss": -7.272216796875, "global_step": 205577, "epoch": 4894} {"train_loss": -7.348697185516357, "global_step": 205578, "epoch": 4894} {"train_loss": -7.077522277832031, "global_step": 205579, "epoch": 4894} {"train_loss": -7.280973434448242, "global_step": 205580, "epoch": 4894} {"train_loss": -7.272984504699707, "global_step": 205581, "epoch": 4894} {"train_loss": -7.191664695739746, "global_step": 205582, "epoch": 4894} {"train_loss": -7.394289970397949, "global_step": 205583, "epoch": 4894} {"train_loss": -7.167611598968506, "global_step": 205584, "epoch": 4894} {"train_loss": -7.298009872436523, "global_step": 205585, "epoch": 4894} {"train_loss": -7.363054275512695, "global_step": 205586, "epoch": 4894} {"train_loss": -7.262457847595215, "global_step": 205587, "epoch": 4894} {"train_loss": -7.239870071411133, "global_step": 205588, "epoch": 4894} {"train_loss": -7.302776030131748, "global_step": 205589, "epoch": 4894, "val_loss": 69948.9140625} {"train_loss": -7.228189468383789, "global_step": 205590, "epoch": 4895} {"train_loss": -7.349153518676758, "global_step": 205591, "epoch": 4895} {"train_loss": -7.270608901977539, "global_step": 205592, "epoch": 4895} {"train_loss": -7.192720413208008, "global_step": 205593, "epoch": 4895} {"train_loss": -7.266463279724121, "global_step": 205594, "epoch": 4895} {"train_loss": -7.221320152282715, "global_step": 205595, "epoch": 4895} {"train_loss": -7.33690881729126, "global_step": 205596, "epoch": 4895} {"train_loss": -7.216031551361084, "global_step": 205597, "epoch": 4895} {"train_loss": -7.142264366149902, "global_step": 205598, "epoch": 4895} {"train_loss": -7.299617767333984, "global_step": 205599, "epoch": 4895} {"train_loss": -7.174283981323242, "global_step": 205600, "epoch": 4895} {"train_loss": -7.217487812042236, "global_step": 205601, "epoch": 4895} {"train_loss": -7.179865837097168, "global_step": 205602, "epoch": 4895} {"train_loss": -7.252167224884033, "global_step": 205603, "epoch": 4895} {"train_loss": -7.334120750427246, "global_step": 205604, "epoch": 4895} {"train_loss": -7.398177146911621, "global_step": 205605, "epoch": 4895} {"train_loss": -7.329571723937988, "global_step": 205606, "epoch": 4895} {"train_loss": -7.185885429382324, "global_step": 205607, "epoch": 4895} {"train_loss": -7.2878313064575195, "global_step": 205608, "epoch": 4895} {"train_loss": -7.362072467803955, "global_step": 205609, "epoch": 4895} {"train_loss": -7.262554168701172, "global_step": 205610, "epoch": 4895} {"train_loss": -7.3042802810668945, "global_step": 205611, "epoch": 4895} {"train_loss": -7.325005531311035, "global_step": 205612, "epoch": 4895} {"train_loss": -7.204337120056152, "global_step": 205613, "epoch": 4895} {"train_loss": -7.260617256164551, "global_step": 205614, "epoch": 4895} {"train_loss": -7.348296165466309, "global_step": 205615, "epoch": 4895} {"train_loss": -7.234887599945068, "global_step": 205616, "epoch": 4895} {"train_loss": -7.307175159454346, "global_step": 205617, "epoch": 4895} {"train_loss": -7.299097537994385, "global_step": 205618, "epoch": 4895} {"train_loss": -7.243793487548828, "global_step": 205619, "epoch": 4895} {"train_loss": -7.2749128341674805, "global_step": 205620, "epoch": 4895} {"train_loss": -7.307382106781006, "global_step": 205621, "epoch": 4895} {"train_loss": -7.202851295471191, "global_step": 205622, "epoch": 4895} {"train_loss": -7.251705646514893, "global_step": 205623, "epoch": 4895} {"train_loss": -7.415838718414307, "global_step": 205624, "epoch": 4895} {"train_loss": -7.372666835784912, "global_step": 205625, "epoch": 4895} {"train_loss": -7.128866672515869, "global_step": 205626, "epoch": 4895} {"train_loss": -7.226635932922363, "global_step": 205627, "epoch": 4895} {"train_loss": -7.302617073059082, "global_step": 205628, "epoch": 4895} {"train_loss": -7.234583854675293, "global_step": 205629, "epoch": 4895} {"train_loss": -7.262240886688232, "global_step": 205630, "epoch": 4895} {"train_loss": -7.266912596566336, "global_step": 205631, "epoch": 4895, "val_loss": 69844.2265625} {"train_loss": -7.375635147094727, "global_step": 205632, "epoch": 4896} {"train_loss": -7.1954874992370605, "global_step": 205633, "epoch": 4896} {"train_loss": -7.294678688049316, "global_step": 205634, "epoch": 4896} {"train_loss": -7.335021018981934, "global_step": 205635, "epoch": 4896} {"train_loss": -7.385752201080322, "global_step": 205636, "epoch": 4896} {"train_loss": -7.319637298583984, "global_step": 205637, "epoch": 4896} {"train_loss": -7.335148811340332, "global_step": 205638, "epoch": 4896} {"train_loss": -7.346787452697754, "global_step": 205639, "epoch": 4896} {"train_loss": -7.349722862243652, "global_step": 205640, "epoch": 4896} {"train_loss": -7.3166913986206055, "global_step": 205641, "epoch": 4896} {"train_loss": -7.354629993438721, "global_step": 205642, "epoch": 4896} {"train_loss": -7.3429975509643555, "global_step": 205643, "epoch": 4896} {"train_loss": -7.362314224243164, "global_step": 205644, "epoch": 4896} {"train_loss": -7.300841331481934, "global_step": 205645, "epoch": 4896} {"train_loss": -7.37132453918457, "global_step": 205646, "epoch": 4896} {"train_loss": -7.320169448852539, "global_step": 205647, "epoch": 4896} {"train_loss": -7.415973663330078, "global_step": 205648, "epoch": 4896} {"train_loss": -7.245815753936768, "global_step": 205649, "epoch": 4896} {"train_loss": -7.300591468811035, "global_step": 205650, "epoch": 4896} {"train_loss": -7.3299455642700195, "global_step": 205651, "epoch": 4896} {"train_loss": -7.242329120635986, "global_step": 205652, "epoch": 4896} {"train_loss": -7.306328773498535, "global_step": 205653, "epoch": 4896} {"train_loss": -7.32292366027832, "global_step": 205654, "epoch": 4896} {"train_loss": -7.3928070068359375, "global_step": 205655, "epoch": 4896} {"train_loss": -7.403075218200684, "global_step": 205656, "epoch": 4896} {"train_loss": -7.1411237716674805, "global_step": 205657, "epoch": 4896} {"train_loss": -7.253871440887451, "global_step": 205658, "epoch": 4896} {"train_loss": -7.210953712463379, "global_step": 205659, "epoch": 4896} {"train_loss": -7.229128360748291, "global_step": 205660, "epoch": 4896} {"train_loss": -7.298911094665527, "global_step": 205661, "epoch": 4896} {"train_loss": -7.363775730133057, "global_step": 205662, "epoch": 4896} {"train_loss": -7.357654571533203, "global_step": 205663, "epoch": 4896} {"train_loss": -7.323617935180664, "global_step": 205664, "epoch": 4896} {"train_loss": -7.329840660095215, "global_step": 205665, "epoch": 4896} {"train_loss": -7.216169357299805, "global_step": 205666, "epoch": 4896} {"train_loss": -7.351301193237305, "global_step": 205667, "epoch": 4896} {"train_loss": -7.396781921386719, "global_step": 205668, "epoch": 4896} {"train_loss": -7.360170841217041, "global_step": 205669, "epoch": 4896} {"train_loss": -7.33757209777832, "global_step": 205670, "epoch": 4896} {"train_loss": -7.277766227722168, "global_step": 205671, "epoch": 4896} {"train_loss": -7.35865592956543, "global_step": 205672, "epoch": 4896} {"train_loss": -7.318590482076009, "global_step": 205673, "epoch": 4896, "val_loss": 69910.9765625} {"train_loss": -7.361856937408447, "global_step": 205674, "epoch": 4897} {"train_loss": -7.279822826385498, "global_step": 205675, "epoch": 4897} {"train_loss": -7.439470291137695, "global_step": 205676, "epoch": 4897} {"train_loss": -7.3704633712768555, "global_step": 205677, "epoch": 4897} {"train_loss": -7.406403541564941, "global_step": 205678, "epoch": 4897} {"train_loss": -7.275394439697266, "global_step": 205679, "epoch": 4897} {"train_loss": -7.202922821044922, "global_step": 205680, "epoch": 4897} {"train_loss": -7.305893421173096, "global_step": 205681, "epoch": 4897} {"train_loss": -7.3077569007873535, "global_step": 205682, "epoch": 4897} {"train_loss": -7.20994234085083, "global_step": 205683, "epoch": 4897} {"train_loss": -7.336432456970215, "global_step": 205684, "epoch": 4897} {"train_loss": -7.392771244049072, "global_step": 205685, "epoch": 4897} {"train_loss": -7.293190956115723, "global_step": 205686, "epoch": 4897} {"train_loss": -7.270992279052734, "global_step": 205687, "epoch": 4897} {"train_loss": -7.276718616485596, "global_step": 205688, "epoch": 4897} {"train_loss": -7.2504072189331055, "global_step": 205689, "epoch": 4897} {"train_loss": -7.33219051361084, "global_step": 205690, "epoch": 4897} {"train_loss": -7.158376216888428, "global_step": 205691, "epoch": 4897} {"train_loss": -7.190402507781982, "global_step": 205692, "epoch": 4897} {"train_loss": -7.317636966705322, "global_step": 205693, "epoch": 4897} {"train_loss": -7.220590591430664, "global_step": 205694, "epoch": 4897} {"train_loss": -7.187880516052246, "global_step": 205695, "epoch": 4897} {"train_loss": -7.284631252288818, "global_step": 205696, "epoch": 4897} {"train_loss": -7.297369003295898, "global_step": 205697, "epoch": 4897} {"train_loss": -7.343794822692871, "global_step": 205698, "epoch": 4897} {"train_loss": -7.278332710266113, "global_step": 205699, "epoch": 4897} {"train_loss": -7.342046737670898, "global_step": 205700, "epoch": 4897} {"train_loss": -7.1489105224609375, "global_step": 205701, "epoch": 4897} {"train_loss": -7.323493957519531, "global_step": 205702, "epoch": 4897} {"train_loss": -7.317797660827637, "global_step": 205703, "epoch": 4897} {"train_loss": -7.373058319091797, "global_step": 205704, "epoch": 4897} {"train_loss": -7.3366899490356445, "global_step": 205705, "epoch": 4897} {"train_loss": -7.320631980895996, "global_step": 205706, "epoch": 4897} {"train_loss": -7.29814338684082, "global_step": 205707, "epoch": 4897} {"train_loss": -7.191197872161865, "global_step": 205708, "epoch": 4897} {"train_loss": -7.338854789733887, "global_step": 205709, "epoch": 4897} {"train_loss": -7.384072303771973, "global_step": 205710, "epoch": 4897} {"train_loss": -7.297384262084961, "global_step": 205711, "epoch": 4897} {"train_loss": -7.308352947235107, "global_step": 205712, "epoch": 4897} {"train_loss": -7.3578877449035645, "global_step": 205713, "epoch": 4897} {"train_loss": -7.213467121124268, "global_step": 205714, "epoch": 4897} {"train_loss": -7.296529338473365, "global_step": 205715, "epoch": 4897, "val_loss": 69950.453125} {"train_loss": -7.290347576141357, "global_step": 205716, "epoch": 4898} {"train_loss": -7.2143120765686035, "global_step": 205717, "epoch": 4898} {"train_loss": -7.319753170013428, "global_step": 205718, "epoch": 4898} {"train_loss": -7.286462306976318, "global_step": 205719, "epoch": 4898} {"train_loss": -7.226457595825195, "global_step": 205720, "epoch": 4898} {"train_loss": -7.367243766784668, "global_step": 205721, "epoch": 4898} {"train_loss": -7.3585052490234375, "global_step": 205722, "epoch": 4898} {"train_loss": -7.301799774169922, "global_step": 205723, "epoch": 4898} {"train_loss": -7.214037895202637, "global_step": 205724, "epoch": 4898} {"train_loss": -7.254794597625732, "global_step": 205725, "epoch": 4898} {"train_loss": -7.327816009521484, "global_step": 205726, "epoch": 4898} {"train_loss": -7.367742538452148, "global_step": 205727, "epoch": 4898} {"train_loss": -7.37545108795166, "global_step": 205728, "epoch": 4898} {"train_loss": -7.35986328125, "global_step": 205729, "epoch": 4898} {"train_loss": -7.314485549926758, "global_step": 205730, "epoch": 4898} {"train_loss": -7.372976303100586, "global_step": 205731, "epoch": 4898} {"train_loss": -7.318775177001953, "global_step": 205732, "epoch": 4898} {"train_loss": -7.156449794769287, "global_step": 205733, "epoch": 4898} {"train_loss": -7.318138122558594, "global_step": 205734, "epoch": 4898} {"train_loss": -7.371311187744141, "global_step": 205735, "epoch": 4898} {"train_loss": -7.378137588500977, "global_step": 205736, "epoch": 4898} {"train_loss": -7.327702045440674, "global_step": 205737, "epoch": 4898} {"train_loss": -7.3137030601501465, "global_step": 205738, "epoch": 4898} {"train_loss": -7.31540584564209, "global_step": 205739, "epoch": 4898} {"train_loss": -7.320535659790039, "global_step": 205740, "epoch": 4898} {"train_loss": -7.257308006286621, "global_step": 205741, "epoch": 4898} {"train_loss": -6.996973991394043, "global_step": 205742, "epoch": 4898} {"train_loss": -7.246520042419434, "global_step": 205743, "epoch": 4898} {"train_loss": -7.091853141784668, "global_step": 205744, "epoch": 4898} {"train_loss": -6.982775688171387, "global_step": 205745, "epoch": 4898} {"train_loss": -7.321606159210205, "global_step": 205746, "epoch": 4898} {"train_loss": -6.974067687988281, "global_step": 205747, "epoch": 4898} {"train_loss": -7.156857490539551, "global_step": 205748, "epoch": 4898} {"train_loss": -7.030153274536133, "global_step": 205749, "epoch": 4898} {"train_loss": -7.122812271118164, "global_step": 205750, "epoch": 4898} {"train_loss": -7.106366157531738, "global_step": 205751, "epoch": 4898} {"train_loss": -7.227967262268066, "global_step": 205752, "epoch": 4898} {"train_loss": -7.143343925476074, "global_step": 205753, "epoch": 4898} {"train_loss": -7.215603828430176, "global_step": 205754, "epoch": 4898} {"train_loss": -7.125877857208252, "global_step": 205755, "epoch": 4898} {"train_loss": -7.191066741943359, "global_step": 205756, "epoch": 4898} {"train_loss": -7.244625818161738, "global_step": 205757, "epoch": 4898, "val_loss": 69954.515625} {"train_loss": -7.198346138000488, "global_step": 205758, "epoch": 4899} {"train_loss": -7.172856330871582, "global_step": 205759, "epoch": 4899} {"train_loss": -7.21912956237793, "global_step": 205760, "epoch": 4899} {"train_loss": -7.261693954467773, "global_step": 205761, "epoch": 4899} {"train_loss": -7.242769718170166, "global_step": 205762, "epoch": 4899} {"train_loss": -7.279238700866699, "global_step": 205763, "epoch": 4899} {"train_loss": -7.366171836853027, "global_step": 205764, "epoch": 4899} {"train_loss": -7.272182464599609, "global_step": 205765, "epoch": 4899} {"train_loss": -7.260746002197266, "global_step": 205766, "epoch": 4899} {"train_loss": -7.336559295654297, "global_step": 205767, "epoch": 4899} {"train_loss": -7.390658378601074, "global_step": 205768, "epoch": 4899} {"train_loss": -7.3605804443359375, "global_step": 205769, "epoch": 4899} {"train_loss": -7.294541358947754, "global_step": 205770, "epoch": 4899} {"train_loss": -7.30898904800415, "global_step": 205771, "epoch": 4899} {"train_loss": -7.266533851623535, "global_step": 205772, "epoch": 4899} {"train_loss": -7.3273820877075195, "global_step": 205773, "epoch": 4899} {"train_loss": -7.2320051193237305, "global_step": 205774, "epoch": 4899} {"train_loss": -7.315577507019043, "global_step": 205775, "epoch": 4899} {"train_loss": -7.35915470123291, "global_step": 205776, "epoch": 4899} {"train_loss": -7.354844093322754, "global_step": 205777, "epoch": 4899} {"train_loss": -7.34609842300415, "global_step": 205778, "epoch": 4899} {"train_loss": -7.408205032348633, "global_step": 205779, "epoch": 4899} {"train_loss": -7.294282913208008, "global_step": 205780, "epoch": 4899} {"train_loss": -7.271100044250488, "global_step": 205781, "epoch": 4899} {"train_loss": -7.309451580047607, "global_step": 205782, "epoch": 4899} {"train_loss": -7.359576225280762, "global_step": 205783, "epoch": 4899} {"train_loss": -7.253337383270264, "global_step": 205784, "epoch": 4899} {"train_loss": -7.2617034912109375, "global_step": 205785, "epoch": 4899} {"train_loss": -7.175201416015625, "global_step": 205786, "epoch": 4899} {"train_loss": -7.306038856506348, "global_step": 205787, "epoch": 4899} {"train_loss": -7.307165145874023, "global_step": 205788, "epoch": 4899} {"train_loss": -7.315603256225586, "global_step": 205789, "epoch": 4899} {"train_loss": -7.299493312835693, "global_step": 205790, "epoch": 4899} {"train_loss": -7.355258941650391, "global_step": 205791, "epoch": 4899} {"train_loss": -7.279667854309082, "global_step": 205792, "epoch": 4899} {"train_loss": -7.126832008361816, "global_step": 205793, "epoch": 4899} {"train_loss": -7.336950302124023, "global_step": 205794, "epoch": 4899} {"train_loss": -7.3397603034973145, "global_step": 205795, "epoch": 4899} {"train_loss": -7.231581687927246, "global_step": 205796, "epoch": 4899} {"train_loss": -7.316351890563965, "global_step": 205797, "epoch": 4899} {"train_loss": -7.259831428527832, "global_step": 205798, "epoch": 4899} {"train_loss": -7.288300366628738, "global_step": 205799, "epoch": 4899, "val_loss": 70096.9921875} {"train_loss": -7.339856147766113, "global_step": 205800, "epoch": 4900} {"train_loss": -7.225165843963623, "global_step": 205801, "epoch": 4900} {"train_loss": -7.238569259643555, "global_step": 205802, "epoch": 4900} {"train_loss": -7.2398223876953125, "global_step": 205803, "epoch": 4900} {"train_loss": -7.2776899337768555, "global_step": 205804, "epoch": 4900} {"train_loss": -7.335779666900635, "global_step": 205805, "epoch": 4900} {"train_loss": -7.333344459533691, "global_step": 205806, "epoch": 4900} {"train_loss": -7.363847732543945, "global_step": 205807, "epoch": 4900} {"train_loss": -7.252608299255371, "global_step": 205808, "epoch": 4900} {"train_loss": -7.222442626953125, "global_step": 205809, "epoch": 4900} {"train_loss": -7.329595565795898, "global_step": 205810, "epoch": 4900} {"train_loss": -7.374868392944336, "global_step": 205811, "epoch": 4900} {"train_loss": -7.243278503417969, "global_step": 205812, "epoch": 4900} {"train_loss": -7.255434989929199, "global_step": 205813, "epoch": 4900} {"train_loss": -7.340620994567871, "global_step": 205814, "epoch": 4900} {"train_loss": -7.284667015075684, "global_step": 205815, "epoch": 4900} {"train_loss": -7.351202964782715, "global_step": 205816, "epoch": 4900} {"train_loss": -7.262872695922852, "global_step": 205817, "epoch": 4900} {"train_loss": -7.364790916442871, "global_step": 205818, "epoch": 4900} {"train_loss": -7.318246841430664, "global_step": 205819, "epoch": 4900} {"train_loss": -7.235785961151123, "global_step": 205820, "epoch": 4900} {"train_loss": -7.356847763061523, "global_step": 205821, "epoch": 4900} {"train_loss": -7.384533405303955, "global_step": 205822, "epoch": 4900} {"train_loss": -7.348455429077148, "global_step": 205823, "epoch": 4900} {"train_loss": -7.469934463500977, "global_step": 205824, "epoch": 4900} {"train_loss": -7.290979385375977, "global_step": 205825, "epoch": 4900} {"train_loss": -7.26420783996582, "global_step": 205826, "epoch": 4900} {"train_loss": -7.358287811279297, "global_step": 205827, "epoch": 4900} {"train_loss": -7.3586530685424805, "global_step": 205828, "epoch": 4900} {"train_loss": -7.225028038024902, "global_step": 205829, "epoch": 4900} {"train_loss": -7.240851402282715, "global_step": 205830, "epoch": 4900} {"train_loss": -7.362306594848633, "global_step": 205831, "epoch": 4900} {"train_loss": -7.239804267883301, "global_step": 205832, "epoch": 4900} {"train_loss": -7.314664840698242, "global_step": 205833, "epoch": 4900} {"train_loss": -7.366020679473877, "global_step": 205834, "epoch": 4900} {"train_loss": -7.255855083465576, "global_step": 205835, "epoch": 4900} {"train_loss": -7.361243724822998, "global_step": 205836, "epoch": 4900} {"train_loss": -7.274949073791504, "global_step": 205837, "epoch": 4900} {"train_loss": -7.2388434410095215, "global_step": 205838, "epoch": 4900} {"train_loss": -7.440102577209473, "global_step": 205839, "epoch": 4900} {"train_loss": -7.283979892730713, "global_step": 205840, "epoch": 4900} {"train_loss": -7.311079854056949, "global_step": 205841, "epoch": 4900, "train/sim_max_reward_0": 0.9826350120529973, "train/sim_max_reward_1": 0.9430284118271701, "train/sim_max_reward_2": 0.9574335596926891, "train/sim_max_reward_3": 0.13992846981698762, "train/sim_max_reward_4": 0.8806026144904064, "train/sim_max_reward_5": 0.9146678291605973, "test/sim_max_reward_4300000": 0.9217801268488974, "test/sim_max_reward_4300001": 0.7049386318119528, "test/sim_max_reward_4300002": 0.9377317292800188, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9885387513187304, "test/sim_max_reward_4300006": 0.14001644108382874, "test/sim_max_reward_4300007": 0.8780078313273666, "test/sim_max_reward_4300008": 1.0, "test/sim_max_reward_4300009": 0.9580700367114555, "test/sim_max_reward_4300010": 0.9711775914520433, "test/sim_max_reward_4300011": 0.9887137008073192, "test/sim_max_reward_4300012": 1.0, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 0.96246919407682, "test/sim_max_reward_4300015": 1.0, "test/sim_max_reward_4300016": 0.7726714800871758, "test/sim_max_reward_4300017": 1.0, "test/sim_max_reward_4300018": 0.9963853795450444, "test/sim_max_reward_4300019": 0.1861696249310688, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.9566890407791596, "test/sim_max_reward_4300022": 0.822226846662902, "test/sim_max_reward_4300023": 1.0, "test/sim_max_reward_4300024": 0.9890666067025676, "test/sim_max_reward_4300025": 0.908875532489087, "test/sim_max_reward_4300026": 0.14726918386436913, "test/sim_max_reward_4300027": 0.8487376757860432, "test/sim_max_reward_4300028": 1.0, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.26557185072271094, "test/sim_max_reward_4300031": 0.22270405507695537, "test/sim_max_reward_4300032": 1.0, "test/sim_max_reward_4300033": 0.6705152066458245, "test/sim_max_reward_4300034": 0.9843499925623764, "test/sim_max_reward_4300035": 0.6442822449466379, "test/sim_max_reward_4300036": 0.20401644580084857, "test/sim_max_reward_4300037": 1.0, "test/sim_max_reward_4300038": 0.3073916583745935, "test/sim_max_reward_4300039": 0.7836042587452794, "test/sim_max_reward_4300040": 0.9565442500674005, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.7191724174039749, "test/sim_max_reward_4300043": 0.050626492989405004, "test/sim_max_reward_4300044": 0.04715698000410037, "test/sim_max_reward_4300045": 0.9082206293100246, "test/sim_max_reward_4300046": 0.9597485322740389, "test/sim_max_reward_4300047": 0.10054635758390987, "test/sim_max_reward_4300048": 0.0047557387266443235, "test/sim_max_reward_4300049": 0.17451693575468671, "train/mean_score": 0.8030493161734747, "test/mean_score": 0.6619818711472909, "val_loss": 70006.8046875} {"train_loss": -7.359748363494873, "global_step": 205842, "epoch": 4901} {"train_loss": -7.247046947479248, "global_step": 205843, "epoch": 4901} {"train_loss": -7.315975666046143, "global_step": 205844, "epoch": 4901} {"train_loss": -7.356013298034668, "global_step": 205845, "epoch": 4901} {"train_loss": -7.354535102844238, "global_step": 205846, "epoch": 4901} {"train_loss": -7.401782989501953, "global_step": 205847, "epoch": 4901} {"train_loss": -7.2919158935546875, "global_step": 205848, "epoch": 4901} {"train_loss": -7.2561540603637695, "global_step": 205849, "epoch": 4901} {"train_loss": -7.412997245788574, "global_step": 205850, "epoch": 4901} {"train_loss": -7.394634246826172, "global_step": 205851, "epoch": 4901} {"train_loss": -7.36865234375, "global_step": 205852, "epoch": 4901} {"train_loss": -7.2499799728393555, "global_step": 205853, "epoch": 4901} {"train_loss": -7.313473701477051, "global_step": 205854, "epoch": 4901} {"train_loss": -7.215331077575684, "global_step": 205855, "epoch": 4901} {"train_loss": -7.335343360900879, "global_step": 205856, "epoch": 4901} {"train_loss": -7.28499698638916, "global_step": 205857, "epoch": 4901} {"train_loss": -7.291707992553711, "global_step": 205858, "epoch": 4901} {"train_loss": -7.430172443389893, "global_step": 205859, "epoch": 4901} {"train_loss": -7.365481376647949, "global_step": 205860, "epoch": 4901} {"train_loss": -7.3387885093688965, "global_step": 205861, "epoch": 4901} {"train_loss": -7.400482654571533, "global_step": 205862, "epoch": 4901} {"train_loss": -7.217709541320801, "global_step": 205863, "epoch": 4901} {"train_loss": -7.379227638244629, "global_step": 205864, "epoch": 4901} {"train_loss": -7.319228172302246, "global_step": 205865, "epoch": 4901} {"train_loss": -7.290524482727051, "global_step": 205866, "epoch": 4901} {"train_loss": -7.3615617752075195, "global_step": 205867, "epoch": 4901} {"train_loss": -7.28581428527832, "global_step": 205868, "epoch": 4901} {"train_loss": -7.267573356628418, "global_step": 205869, "epoch": 4901} {"train_loss": -7.269461631774902, "global_step": 205870, "epoch": 4901} {"train_loss": -7.4593706130981445, "global_step": 205871, "epoch": 4901} {"train_loss": -7.3289875984191895, "global_step": 205872, "epoch": 4901} {"train_loss": -7.268599033355713, "global_step": 205873, "epoch": 4901} {"train_loss": -7.27131986618042, "global_step": 205874, "epoch": 4901} {"train_loss": -7.124541282653809, "global_step": 205875, "epoch": 4901} {"train_loss": -7.1547160148620605, "global_step": 205876, "epoch": 4901} {"train_loss": -7.189813613891602, "global_step": 205877, "epoch": 4901} {"train_loss": -7.066967487335205, "global_step": 205878, "epoch": 4901} {"train_loss": -7.353901386260986, "global_step": 205879, "epoch": 4901} {"train_loss": -7.088618278503418, "global_step": 205880, "epoch": 4901} {"train_loss": -7.338165283203125, "global_step": 205881, "epoch": 4901} {"train_loss": -7.27518892288208, "global_step": 205882, "epoch": 4901} {"train_loss": -7.293672255107334, "global_step": 205883, "epoch": 4901, "val_loss": 70155.8515625} {"train_loss": -7.17862606048584, "global_step": 205884, "epoch": 4902} {"train_loss": -7.134609222412109, "global_step": 205885, "epoch": 4902} {"train_loss": -7.093236923217773, "global_step": 205886, "epoch": 4902} {"train_loss": -7.220042705535889, "global_step": 205887, "epoch": 4902} {"train_loss": -7.319218635559082, "global_step": 205888, "epoch": 4902} {"train_loss": -7.239948272705078, "global_step": 205889, "epoch": 4902} {"train_loss": -7.192644119262695, "global_step": 205890, "epoch": 4902} {"train_loss": -7.197574615478516, "global_step": 205891, "epoch": 4902} {"train_loss": -7.2818403244018555, "global_step": 205892, "epoch": 4902} {"train_loss": -7.181445598602295, "global_step": 205893, "epoch": 4902} {"train_loss": -7.224656105041504, "global_step": 205894, "epoch": 4902} {"train_loss": -7.340205669403076, "global_step": 205895, "epoch": 4902} {"train_loss": -7.203512191772461, "global_step": 205896, "epoch": 4902} {"train_loss": -7.257653713226318, "global_step": 205897, "epoch": 4902} {"train_loss": -7.319892883300781, "global_step": 205898, "epoch": 4902} {"train_loss": -7.34256649017334, "global_step": 205899, "epoch": 4902} {"train_loss": -7.330747604370117, "global_step": 205900, "epoch": 4902} {"train_loss": -7.188205718994141, "global_step": 205901, "epoch": 4902} {"train_loss": -7.260902404785156, "global_step": 205902, "epoch": 4902} {"train_loss": -7.405764579772949, "global_step": 205903, "epoch": 4902} {"train_loss": -7.2877373695373535, "global_step": 205904, "epoch": 4902} {"train_loss": -7.287008762359619, "global_step": 205905, "epoch": 4902} {"train_loss": -7.39360237121582, "global_step": 205906, "epoch": 4902} {"train_loss": -7.284569263458252, "global_step": 205907, "epoch": 4902} {"train_loss": -7.397188186645508, "global_step": 205908, "epoch": 4902} {"train_loss": -7.2862420082092285, "global_step": 205909, "epoch": 4902} {"train_loss": -7.416936874389648, "global_step": 205910, "epoch": 4902} {"train_loss": -7.361240386962891, "global_step": 205911, "epoch": 4902} {"train_loss": -7.226299285888672, "global_step": 205912, "epoch": 4902} {"train_loss": -7.3614654541015625, "global_step": 205913, "epoch": 4902} {"train_loss": -7.300921440124512, "global_step": 205914, "epoch": 4902} {"train_loss": -7.284034252166748, "global_step": 205915, "epoch": 4902} {"train_loss": -7.380882263183594, "global_step": 205916, "epoch": 4902} {"train_loss": -7.365471363067627, "global_step": 205917, "epoch": 4902} {"train_loss": -7.297330856323242, "global_step": 205918, "epoch": 4902} {"train_loss": -7.313046932220459, "global_step": 205919, "epoch": 4902} {"train_loss": -7.267786979675293, "global_step": 205920, "epoch": 4902} {"train_loss": -7.405236721038818, "global_step": 205921, "epoch": 4902} {"train_loss": -7.308709621429443, "global_step": 205922, "epoch": 4902} {"train_loss": -7.383548259735107, "global_step": 205923, "epoch": 4902} {"train_loss": -7.357739448547363, "global_step": 205924, "epoch": 4902} {"train_loss": -7.29194188117981, "global_step": 205925, "epoch": 4902, "val_loss": 70082.8671875} {"train_loss": -7.29897403717041, "global_step": 205926, "epoch": 4903} {"train_loss": -7.36716365814209, "global_step": 205927, "epoch": 4903} {"train_loss": -7.341672897338867, "global_step": 205928, "epoch": 4903} {"train_loss": -7.367799758911133, "global_step": 205929, "epoch": 4903} {"train_loss": -7.360872268676758, "global_step": 205930, "epoch": 4903} {"train_loss": -7.335897445678711, "global_step": 205931, "epoch": 4903} {"train_loss": -7.253656387329102, "global_step": 205932, "epoch": 4903} {"train_loss": -7.289119243621826, "global_step": 205933, "epoch": 4903} {"train_loss": -7.2961225509643555, "global_step": 205934, "epoch": 4903} {"train_loss": -7.339148998260498, "global_step": 205935, "epoch": 4903} {"train_loss": -7.294632434844971, "global_step": 205936, "epoch": 4903} {"train_loss": -7.304719924926758, "global_step": 205937, "epoch": 4903} {"train_loss": -7.217868804931641, "global_step": 205938, "epoch": 4903} {"train_loss": -7.349218845367432, "global_step": 205939, "epoch": 4903} {"train_loss": -7.278083801269531, "global_step": 205940, "epoch": 4903} {"train_loss": -7.270119667053223, "global_step": 205941, "epoch": 4903} {"train_loss": -7.308200836181641, "global_step": 205942, "epoch": 4903} {"train_loss": -7.289318084716797, "global_step": 205943, "epoch": 4903} {"train_loss": -7.287546157836914, "global_step": 205944, "epoch": 4903} {"train_loss": -7.229500770568848, "global_step": 205945, "epoch": 4903} {"train_loss": -7.224355697631836, "global_step": 205946, "epoch": 4903} {"train_loss": -7.250210285186768, "global_step": 205947, "epoch": 4903} {"train_loss": -7.328480243682861, "global_step": 205948, "epoch": 4903} {"train_loss": -7.326668739318848, "global_step": 205949, "epoch": 4903} {"train_loss": -7.278428554534912, "global_step": 205950, "epoch": 4903} {"train_loss": -7.185943603515625, "global_step": 205951, "epoch": 4903} {"train_loss": -7.385520935058594, "global_step": 205952, "epoch": 4903} {"train_loss": -7.308094501495361, "global_step": 205953, "epoch": 4903} {"train_loss": -7.226872444152832, "global_step": 205954, "epoch": 4903} {"train_loss": -7.231285572052002, "global_step": 205955, "epoch": 4903} {"train_loss": -7.108481407165527, "global_step": 205956, "epoch": 4903} {"train_loss": -7.308547019958496, "global_step": 205957, "epoch": 4903} {"train_loss": -7.260786533355713, "global_step": 205958, "epoch": 4903} {"train_loss": -7.170958518981934, "global_step": 205959, "epoch": 4903} {"train_loss": -7.227968692779541, "global_step": 205960, "epoch": 4903} {"train_loss": -7.239774227142334, "global_step": 205961, "epoch": 4903} {"train_loss": -7.254623889923096, "global_step": 205962, "epoch": 4903} {"train_loss": -7.277387619018555, "global_step": 205963, "epoch": 4903} {"train_loss": -7.265716552734375, "global_step": 205964, "epoch": 4903} {"train_loss": -7.360037326812744, "global_step": 205965, "epoch": 4903} {"train_loss": -7.3964152336120605, "global_step": 205966, "epoch": 4903} {"train_loss": -7.283070802688599, "global_step": 205967, "epoch": 4903, "val_loss": 70151.6015625} {"train_loss": -7.237347602844238, "global_step": 205968, "epoch": 4904} {"train_loss": -7.264200210571289, "global_step": 205969, "epoch": 4904} {"train_loss": -7.311124801635742, "global_step": 205970, "epoch": 4904} {"train_loss": -7.305238723754883, "global_step": 205971, "epoch": 4904} {"train_loss": -7.212652206420898, "global_step": 205972, "epoch": 4904} {"train_loss": -7.413382530212402, "global_step": 205973, "epoch": 4904} {"train_loss": -7.3173508644104, "global_step": 205974, "epoch": 4904} {"train_loss": -7.3472700119018555, "global_step": 205975, "epoch": 4904} {"train_loss": -7.279078006744385, "global_step": 205976, "epoch": 4904} {"train_loss": -7.282041072845459, "global_step": 205977, "epoch": 4904} {"train_loss": -7.300326347351074, "global_step": 205978, "epoch": 4904} {"train_loss": -7.334019660949707, "global_step": 205979, "epoch": 4904} {"train_loss": -7.2787628173828125, "global_step": 205980, "epoch": 4904} {"train_loss": -7.367082595825195, "global_step": 205981, "epoch": 4904} {"train_loss": -7.444607734680176, "global_step": 205982, "epoch": 4904} {"train_loss": -7.327336311340332, "global_step": 205983, "epoch": 4904} {"train_loss": -7.36802864074707, "global_step": 205984, "epoch": 4904} {"train_loss": -7.329413414001465, "global_step": 205985, "epoch": 4904} {"train_loss": -7.398369789123535, "global_step": 205986, "epoch": 4904} {"train_loss": -7.316757678985596, "global_step": 205987, "epoch": 4904} {"train_loss": -7.3974223136901855, "global_step": 205988, "epoch": 4904} {"train_loss": -7.309595108032227, "global_step": 205989, "epoch": 4904} {"train_loss": -7.351408004760742, "global_step": 205990, "epoch": 4904} {"train_loss": -7.25067138671875, "global_step": 205991, "epoch": 4904} {"train_loss": -7.412199974060059, "global_step": 205992, "epoch": 4904} {"train_loss": -7.242936134338379, "global_step": 205993, "epoch": 4904} {"train_loss": -7.340205192565918, "global_step": 205994, "epoch": 4904} {"train_loss": -7.446229934692383, "global_step": 205995, "epoch": 4904} {"train_loss": -7.255669593811035, "global_step": 205996, "epoch": 4904} {"train_loss": -7.3834381103515625, "global_step": 205997, "epoch": 4904} {"train_loss": -7.263859748840332, "global_step": 205998, "epoch": 4904} {"train_loss": -7.219815254211426, "global_step": 205999, "epoch": 4904} {"train_loss": -7.441684722900391, "global_step": 206000, "epoch": 4904} {"train_loss": -7.367466449737549, "global_step": 206001, "epoch": 4904} {"train_loss": -7.195215702056885, "global_step": 206002, "epoch": 4904} {"train_loss": -7.363504409790039, "global_step": 206003, "epoch": 4904} {"train_loss": -7.242627143859863, "global_step": 206004, "epoch": 4904} {"train_loss": -7.2295355796813965, "global_step": 206005, "epoch": 4904} {"train_loss": -7.3478922843933105, "global_step": 206006, "epoch": 4904} {"train_loss": -7.141444206237793, "global_step": 206007, "epoch": 4904} {"train_loss": -7.363206386566162, "global_step": 206008, "epoch": 4904} {"train_loss": -7.314193180629185, "global_step": 206009, "epoch": 4904, "val_loss": 70066.984375} {"train_loss": -7.34413480758667, "global_step": 206010, "epoch": 4905} {"train_loss": -7.334056854248047, "global_step": 206011, "epoch": 4905} {"train_loss": -7.299567699432373, "global_step": 206012, "epoch": 4905} {"train_loss": -7.424770355224609, "global_step": 206013, "epoch": 4905} {"train_loss": -7.317201614379883, "global_step": 206014, "epoch": 4905} {"train_loss": -7.371334552764893, "global_step": 206015, "epoch": 4905} {"train_loss": -7.284188270568848, "global_step": 206016, "epoch": 4905} {"train_loss": -7.280640602111816, "global_step": 206017, "epoch": 4905} {"train_loss": -7.420561790466309, "global_step": 206018, "epoch": 4905} {"train_loss": -7.258191108703613, "global_step": 206019, "epoch": 4905} {"train_loss": -7.305149078369141, "global_step": 206020, "epoch": 4905} {"train_loss": -7.304115295410156, "global_step": 206021, "epoch": 4905} {"train_loss": -7.321898460388184, "global_step": 206022, "epoch": 4905} {"train_loss": -7.278411865234375, "global_step": 206023, "epoch": 4905} {"train_loss": -7.419495582580566, "global_step": 206024, "epoch": 4905} {"train_loss": -7.306530952453613, "global_step": 206025, "epoch": 4905} {"train_loss": -7.282785892486572, "global_step": 206026, "epoch": 4905} {"train_loss": -7.351370811462402, "global_step": 206027, "epoch": 4905} {"train_loss": -7.267815589904785, "global_step": 206028, "epoch": 4905} {"train_loss": -7.369479179382324, "global_step": 206029, "epoch": 4905} {"train_loss": -7.291996002197266, "global_step": 206030, "epoch": 4905} {"train_loss": -7.254233360290527, "global_step": 206031, "epoch": 4905} {"train_loss": -7.347654342651367, "global_step": 206032, "epoch": 4905} {"train_loss": -7.364770412445068, "global_step": 206033, "epoch": 4905} {"train_loss": -7.252877235412598, "global_step": 206034, "epoch": 4905} {"train_loss": -7.419354438781738, "global_step": 206035, "epoch": 4905} {"train_loss": -7.231210708618164, "global_step": 206036, "epoch": 4905} {"train_loss": -7.247745513916016, "global_step": 206037, "epoch": 4905} {"train_loss": -7.30677604675293, "global_step": 206038, "epoch": 4905} {"train_loss": -7.249198913574219, "global_step": 206039, "epoch": 4905} {"train_loss": -7.372046947479248, "global_step": 206040, "epoch": 4905} {"train_loss": -7.252559661865234, "global_step": 206041, "epoch": 4905} {"train_loss": -7.369564056396484, "global_step": 206042, "epoch": 4905} {"train_loss": -7.325888633728027, "global_step": 206043, "epoch": 4905} {"train_loss": -7.284169673919678, "global_step": 206044, "epoch": 4905} {"train_loss": -7.385651588439941, "global_step": 206045, "epoch": 4905} {"train_loss": -7.2808380126953125, "global_step": 206046, "epoch": 4905} {"train_loss": -7.281642913818359, "global_step": 206047, "epoch": 4905} {"train_loss": -7.322606086730957, "global_step": 206048, "epoch": 4905} {"train_loss": -7.350024223327637, "global_step": 206049, "epoch": 4905} {"train_loss": -7.342310905456543, "global_step": 206050, "epoch": 4905} {"train_loss": -7.319173063550677, "global_step": 206051, "epoch": 4905, "val_loss": 69935.921875} {"train_loss": -7.417110919952393, "global_step": 206052, "epoch": 4906} {"train_loss": -7.367842674255371, "global_step": 206053, "epoch": 4906} {"train_loss": -7.2921247482299805, "global_step": 206054, "epoch": 4906} {"train_loss": -7.223123550415039, "global_step": 206055, "epoch": 4906} {"train_loss": -7.374759674072266, "global_step": 206056, "epoch": 4906} {"train_loss": -7.3088274002075195, "global_step": 206057, "epoch": 4906} {"train_loss": -7.254373550415039, "global_step": 206058, "epoch": 4906} {"train_loss": -7.339071273803711, "global_step": 206059, "epoch": 4906} {"train_loss": -7.274692535400391, "global_step": 206060, "epoch": 4906} {"train_loss": -7.410322666168213, "global_step": 206061, "epoch": 4906} {"train_loss": -7.3745269775390625, "global_step": 206062, "epoch": 4906} {"train_loss": -7.231115341186523, "global_step": 206063, "epoch": 4906} {"train_loss": -7.295749187469482, "global_step": 206064, "epoch": 4906} {"train_loss": -7.263641357421875, "global_step": 206065, "epoch": 4906} {"train_loss": -7.340035438537598, "global_step": 206066, "epoch": 4906} {"train_loss": -7.279870510101318, "global_step": 206067, "epoch": 4906} {"train_loss": -7.380595684051514, "global_step": 206068, "epoch": 4906} {"train_loss": -7.410152435302734, "global_step": 206069, "epoch": 4906} {"train_loss": -7.352935791015625, "global_step": 206070, "epoch": 4906} {"train_loss": -7.336811065673828, "global_step": 206071, "epoch": 4906} {"train_loss": -7.435326099395752, "global_step": 206072, "epoch": 4906} {"train_loss": -7.365879058837891, "global_step": 206073, "epoch": 4906} {"train_loss": -7.338038444519043, "global_step": 206074, "epoch": 4906} {"train_loss": -7.346014022827148, "global_step": 206075, "epoch": 4906} {"train_loss": -7.317634582519531, "global_step": 206076, "epoch": 4906} {"train_loss": -7.336194038391113, "global_step": 206077, "epoch": 4906} {"train_loss": -7.464049339294434, "global_step": 206078, "epoch": 4906} {"train_loss": -7.455841064453125, "global_step": 206079, "epoch": 4906} {"train_loss": -7.305939674377441, "global_step": 206080, "epoch": 4906} {"train_loss": -7.417994976043701, "global_step": 206081, "epoch": 4906} {"train_loss": -7.435564994812012, "global_step": 206082, "epoch": 4906} {"train_loss": -7.379899978637695, "global_step": 206083, "epoch": 4906} {"train_loss": -7.363067150115967, "global_step": 206084, "epoch": 4906} {"train_loss": -7.3370208740234375, "global_step": 206085, "epoch": 4906} {"train_loss": -7.335180282592773, "global_step": 206086, "epoch": 4906} {"train_loss": -7.416214942932129, "global_step": 206087, "epoch": 4906} {"train_loss": -7.366337776184082, "global_step": 206088, "epoch": 4906} {"train_loss": -7.288959980010986, "global_step": 206089, "epoch": 4906} {"train_loss": -7.3257246017456055, "global_step": 206090, "epoch": 4906} {"train_loss": -7.433719158172607, "global_step": 206091, "epoch": 4906} {"train_loss": -7.488351345062256, "global_step": 206092, "epoch": 4906} {"train_loss": -7.355328571228754, "global_step": 206093, "epoch": 4906, "val_loss": 69865.421875} {"train_loss": -7.277113437652588, "global_step": 206094, "epoch": 4907} {"train_loss": -7.385217666625977, "global_step": 206095, "epoch": 4907} {"train_loss": -7.37738037109375, "global_step": 206096, "epoch": 4907} {"train_loss": -7.177285194396973, "global_step": 206097, "epoch": 4907} {"train_loss": -7.316642761230469, "global_step": 206098, "epoch": 4907} {"train_loss": -7.372485160827637, "global_step": 206099, "epoch": 4907} {"train_loss": -7.220365524291992, "global_step": 206100, "epoch": 4907} {"train_loss": -6.917703628540039, "global_step": 206101, "epoch": 4907} {"train_loss": -7.254166603088379, "global_step": 206102, "epoch": 4907} {"train_loss": -7.004736423492432, "global_step": 206103, "epoch": 4907} {"train_loss": -6.881916046142578, "global_step": 206104, "epoch": 4907} {"train_loss": -7.245077610015869, "global_step": 206105, "epoch": 4907} {"train_loss": -6.853157997131348, "global_step": 206106, "epoch": 4907} {"train_loss": -7.192065238952637, "global_step": 206107, "epoch": 4907} {"train_loss": -6.9865546226501465, "global_step": 206108, "epoch": 4907} {"train_loss": -7.107865333557129, "global_step": 206109, "epoch": 4907} {"train_loss": -7.229852199554443, "global_step": 206110, "epoch": 4907} {"train_loss": -6.787981986999512, "global_step": 206111, "epoch": 4907} {"train_loss": -7.238513946533203, "global_step": 206112, "epoch": 4907} {"train_loss": -6.961271286010742, "global_step": 206113, "epoch": 4907} {"train_loss": -7.167422294616699, "global_step": 206114, "epoch": 4907} {"train_loss": -7.157334804534912, "global_step": 206115, "epoch": 4907} {"train_loss": -7.132704734802246, "global_step": 206116, "epoch": 4907} {"train_loss": -7.051016807556152, "global_step": 206117, "epoch": 4907} {"train_loss": -7.104454040527344, "global_step": 206118, "epoch": 4907} {"train_loss": -7.076356887817383, "global_step": 206119, "epoch": 4907} {"train_loss": -7.206604957580566, "global_step": 206120, "epoch": 4907} {"train_loss": -7.200153827667236, "global_step": 206121, "epoch": 4907} {"train_loss": -7.127390384674072, "global_step": 206122, "epoch": 4907} {"train_loss": -7.196826934814453, "global_step": 206123, "epoch": 4907} {"train_loss": -7.1043500900268555, "global_step": 206124, "epoch": 4907} {"train_loss": -7.156624794006348, "global_step": 206125, "epoch": 4907} {"train_loss": -7.228898048400879, "global_step": 206126, "epoch": 4907} {"train_loss": -7.200867652893066, "global_step": 206127, "epoch": 4907} {"train_loss": -7.167604446411133, "global_step": 206128, "epoch": 4907} {"train_loss": -7.227912902832031, "global_step": 206129, "epoch": 4907} {"train_loss": -6.997845649719238, "global_step": 206130, "epoch": 4907} {"train_loss": -7.186434745788574, "global_step": 206131, "epoch": 4907} {"train_loss": -7.123133659362793, "global_step": 206132, "epoch": 4907} {"train_loss": -7.1947736740112305, "global_step": 206133, "epoch": 4907} {"train_loss": -7.206712245941162, "global_step": 206134, "epoch": 4907} {"train_loss": -7.148815177735829, "global_step": 206135, "epoch": 4907, "val_loss": 69949.8984375} {"train_loss": -7.265426158905029, "global_step": 206136, "epoch": 4908} {"train_loss": -7.32346773147583, "global_step": 206137, "epoch": 4908} {"train_loss": -7.156589508056641, "global_step": 206138, "epoch": 4908} {"train_loss": -7.245626926422119, "global_step": 206139, "epoch": 4908} {"train_loss": -7.353781223297119, "global_step": 206140, "epoch": 4908} {"train_loss": -7.311917304992676, "global_step": 206141, "epoch": 4908} {"train_loss": -7.251540184020996, "global_step": 206142, "epoch": 4908} {"train_loss": -7.400111675262451, "global_step": 206143, "epoch": 4908} {"train_loss": -7.266847610473633, "global_step": 206144, "epoch": 4908} {"train_loss": -7.152194023132324, "global_step": 206145, "epoch": 4908} {"train_loss": -7.261172294616699, "global_step": 206146, "epoch": 4908} {"train_loss": -7.335921287536621, "global_step": 206147, "epoch": 4908} {"train_loss": -7.325501441955566, "global_step": 206148, "epoch": 4908} {"train_loss": -7.268182754516602, "global_step": 206149, "epoch": 4908} {"train_loss": -7.342697620391846, "global_step": 206150, "epoch": 4908} {"train_loss": -7.433836460113525, "global_step": 206151, "epoch": 4908} {"train_loss": -7.304538726806641, "global_step": 206152, "epoch": 4908} {"train_loss": -7.303054332733154, "global_step": 206153, "epoch": 4908} {"train_loss": -7.1974029541015625, "global_step": 206154, "epoch": 4908} {"train_loss": -7.328030586242676, "global_step": 206155, "epoch": 4908} {"train_loss": -7.377956390380859, "global_step": 206156, "epoch": 4908} {"train_loss": -7.192299842834473, "global_step": 206157, "epoch": 4908} {"train_loss": -7.383468151092529, "global_step": 206158, "epoch": 4908} {"train_loss": -7.311325550079346, "global_step": 206159, "epoch": 4908} {"train_loss": -7.356941223144531, "global_step": 206160, "epoch": 4908} {"train_loss": -7.412505149841309, "global_step": 206161, "epoch": 4908} {"train_loss": -7.172541618347168, "global_step": 206162, "epoch": 4908} {"train_loss": -7.300261497497559, "global_step": 206163, "epoch": 4908} {"train_loss": -7.236780643463135, "global_step": 206164, "epoch": 4908} {"train_loss": -7.41625452041626, "global_step": 206165, "epoch": 4908} {"train_loss": -7.311245918273926, "global_step": 206166, "epoch": 4908} {"train_loss": -7.3128814697265625, "global_step": 206167, "epoch": 4908} {"train_loss": -7.38737154006958, "global_step": 206168, "epoch": 4908} {"train_loss": -7.322603225708008, "global_step": 206169, "epoch": 4908} {"train_loss": -7.255179405212402, "global_step": 206170, "epoch": 4908} {"train_loss": -7.310258865356445, "global_step": 206171, "epoch": 4908} {"train_loss": -7.317499160766602, "global_step": 206172, "epoch": 4908} {"train_loss": -7.310654163360596, "global_step": 206173, "epoch": 4908} {"train_loss": -7.315549850463867, "global_step": 206174, "epoch": 4908} {"train_loss": -7.38308048248291, "global_step": 206175, "epoch": 4908} {"train_loss": -7.340246200561523, "global_step": 206176, "epoch": 4908} {"train_loss": -7.3079552536919, "global_step": 206177, "epoch": 4908, "val_loss": 69790.265625} {"train_loss": -7.395401477813721, "global_step": 206178, "epoch": 4909} {"train_loss": -7.214385032653809, "global_step": 206179, "epoch": 4909} {"train_loss": -7.1477556228637695, "global_step": 206180, "epoch": 4909} {"train_loss": -7.325958728790283, "global_step": 206181, "epoch": 4909} {"train_loss": -7.303676128387451, "global_step": 206182, "epoch": 4909} {"train_loss": -7.411088943481445, "global_step": 206183, "epoch": 4909} {"train_loss": -7.26516056060791, "global_step": 206184, "epoch": 4909} {"train_loss": -7.319626331329346, "global_step": 206185, "epoch": 4909} {"train_loss": -7.4677534103393555, "global_step": 206186, "epoch": 4909} {"train_loss": -7.405945777893066, "global_step": 206187, "epoch": 4909} {"train_loss": -7.331702709197998, "global_step": 206188, "epoch": 4909} {"train_loss": -7.36899471282959, "global_step": 206189, "epoch": 4909} {"train_loss": -7.303806304931641, "global_step": 206190, "epoch": 4909} {"train_loss": -7.298713207244873, "global_step": 206191, "epoch": 4909} {"train_loss": -7.3957953453063965, "global_step": 206192, "epoch": 4909} {"train_loss": -7.352968692779541, "global_step": 206193, "epoch": 4909} {"train_loss": -7.371639251708984, "global_step": 206194, "epoch": 4909} {"train_loss": -7.320770740509033, "global_step": 206195, "epoch": 4909} {"train_loss": -7.351949691772461, "global_step": 206196, "epoch": 4909} {"train_loss": -7.295827865600586, "global_step": 206197, "epoch": 4909} {"train_loss": -7.279168128967285, "global_step": 206198, "epoch": 4909} {"train_loss": -7.337128639221191, "global_step": 206199, "epoch": 4909} {"train_loss": -7.3319292068481445, "global_step": 206200, "epoch": 4909} {"train_loss": -7.415072441101074, "global_step": 206201, "epoch": 4909} {"train_loss": -7.264023780822754, "global_step": 206202, "epoch": 4909} {"train_loss": -7.27446985244751, "global_step": 206203, "epoch": 4909} {"train_loss": -7.358796119689941, "global_step": 206204, "epoch": 4909} {"train_loss": -7.255587577819824, "global_step": 206205, "epoch": 4909} {"train_loss": -7.329530715942383, "global_step": 206206, "epoch": 4909} {"train_loss": -7.335883140563965, "global_step": 206207, "epoch": 4909} {"train_loss": -7.2793474197387695, "global_step": 206208, "epoch": 4909} {"train_loss": -7.343532562255859, "global_step": 206209, "epoch": 4909} {"train_loss": -7.271938800811768, "global_step": 206210, "epoch": 4909} {"train_loss": -7.424197673797607, "global_step": 206211, "epoch": 4909} {"train_loss": -7.347060203552246, "global_step": 206212, "epoch": 4909} {"train_loss": -7.363304138183594, "global_step": 206213, "epoch": 4909} {"train_loss": -7.357691764831543, "global_step": 206214, "epoch": 4909} {"train_loss": -7.407331466674805, "global_step": 206215, "epoch": 4909} {"train_loss": -7.405032157897949, "global_step": 206216, "epoch": 4909} {"train_loss": -7.316988945007324, "global_step": 206217, "epoch": 4909} {"train_loss": -7.497615814208984, "global_step": 206218, "epoch": 4909} {"train_loss": -7.337596927370344, "global_step": 206219, "epoch": 4909, "val_loss": 70117.6953125} {"train_loss": -7.3411102294921875, "global_step": 206220, "epoch": 4910} {"train_loss": -7.294983386993408, "global_step": 206221, "epoch": 4910} {"train_loss": -7.342878818511963, "global_step": 206222, "epoch": 4910} {"train_loss": -7.407933235168457, "global_step": 206223, "epoch": 4910} {"train_loss": -7.256349563598633, "global_step": 206224, "epoch": 4910} {"train_loss": -7.280400276184082, "global_step": 206225, "epoch": 4910} {"train_loss": -7.181795120239258, "global_step": 206226, "epoch": 4910} {"train_loss": -7.139621257781982, "global_step": 206227, "epoch": 4910} {"train_loss": -7.235892295837402, "global_step": 206228, "epoch": 4910} {"train_loss": -7.172796249389648, "global_step": 206229, "epoch": 4910} {"train_loss": -7.20076847076416, "global_step": 206230, "epoch": 4910} {"train_loss": -7.192958354949951, "global_step": 206231, "epoch": 4910} {"train_loss": -7.020173072814941, "global_step": 206232, "epoch": 4910} {"train_loss": -7.172677993774414, "global_step": 206233, "epoch": 4910} {"train_loss": -7.050422191619873, "global_step": 206234, "epoch": 4910} {"train_loss": -7.156079292297363, "global_step": 206235, "epoch": 4910} {"train_loss": -7.184979438781738, "global_step": 206236, "epoch": 4910} {"train_loss": -6.9218549728393555, "global_step": 206237, "epoch": 4910} {"train_loss": -7.263251304626465, "global_step": 206238, "epoch": 4910} {"train_loss": -6.982776641845703, "global_step": 206239, "epoch": 4910} {"train_loss": -7.201371192932129, "global_step": 206240, "epoch": 4910} {"train_loss": -7.1592559814453125, "global_step": 206241, "epoch": 4910} {"train_loss": -7.183747291564941, "global_step": 206242, "epoch": 4910} {"train_loss": -7.221141338348389, "global_step": 206243, "epoch": 4910} {"train_loss": -7.215682029724121, "global_step": 206244, "epoch": 4910} {"train_loss": -7.196817398071289, "global_step": 206245, "epoch": 4910} {"train_loss": -7.221076011657715, "global_step": 206246, "epoch": 4910} {"train_loss": -7.285986423492432, "global_step": 206247, "epoch": 4910} {"train_loss": -7.269296646118164, "global_step": 206248, "epoch": 4910} {"train_loss": -7.278928756713867, "global_step": 206249, "epoch": 4910} {"train_loss": -7.303431510925293, "global_step": 206250, "epoch": 4910} {"train_loss": -7.315752029418945, "global_step": 206251, "epoch": 4910} {"train_loss": -7.371285438537598, "global_step": 206252, "epoch": 4910} {"train_loss": -7.342852592468262, "global_step": 206253, "epoch": 4910} {"train_loss": -7.306236267089844, "global_step": 206254, "epoch": 4910} {"train_loss": -7.410942077636719, "global_step": 206255, "epoch": 4910} {"train_loss": -7.386398792266846, "global_step": 206256, "epoch": 4910} {"train_loss": -7.314248561859131, "global_step": 206257, "epoch": 4910} {"train_loss": -7.333046913146973, "global_step": 206258, "epoch": 4910} {"train_loss": -7.301939964294434, "global_step": 206259, "epoch": 4910} {"train_loss": -7.3070783615112305, "global_step": 206260, "epoch": 4910} {"train_loss": -7.24054859933399, "global_step": 206261, "epoch": 4910, "val_loss": 70005.390625} {"train_loss": -7.266375541687012, "global_step": 206262, "epoch": 4911} {"train_loss": -7.367465972900391, "global_step": 206263, "epoch": 4911} {"train_loss": -7.362315654754639, "global_step": 206264, "epoch": 4911} {"train_loss": -7.333939552307129, "global_step": 206265, "epoch": 4911} {"train_loss": -7.325693130493164, "global_step": 206266, "epoch": 4911} {"train_loss": -7.418403625488281, "global_step": 206267, "epoch": 4911} {"train_loss": -7.435676097869873, "global_step": 206268, "epoch": 4911} {"train_loss": -7.379865646362305, "global_step": 206269, "epoch": 4911} {"train_loss": -7.350632667541504, "global_step": 206270, "epoch": 4911} {"train_loss": -7.374191761016846, "global_step": 206271, "epoch": 4911} {"train_loss": -7.380174160003662, "global_step": 206272, "epoch": 4911} {"train_loss": -7.322697639465332, "global_step": 206273, "epoch": 4911} {"train_loss": -7.406955718994141, "global_step": 206274, "epoch": 4911} {"train_loss": -7.219167232513428, "global_step": 206275, "epoch": 4911} {"train_loss": -7.304675102233887, "global_step": 206276, "epoch": 4911} {"train_loss": -7.284877300262451, "global_step": 206277, "epoch": 4911} {"train_loss": -7.324395656585693, "global_step": 206278, "epoch": 4911} {"train_loss": -7.348659515380859, "global_step": 206279, "epoch": 4911} {"train_loss": -7.308058261871338, "global_step": 206280, "epoch": 4911} {"train_loss": -7.378171920776367, "global_step": 206281, "epoch": 4911} {"train_loss": -7.459711074829102, "global_step": 206282, "epoch": 4911} {"train_loss": -7.219473838806152, "global_step": 206283, "epoch": 4911} {"train_loss": -7.2987189292907715, "global_step": 206284, "epoch": 4911} {"train_loss": -7.358829021453857, "global_step": 206285, "epoch": 4911} {"train_loss": -7.355876922607422, "global_step": 206286, "epoch": 4911} {"train_loss": -7.271292209625244, "global_step": 206287, "epoch": 4911} {"train_loss": -7.331728935241699, "global_step": 206288, "epoch": 4911} {"train_loss": -7.236126899719238, "global_step": 206289, "epoch": 4911} {"train_loss": -7.098249912261963, "global_step": 206290, "epoch": 4911} {"train_loss": -7.08561897277832, "global_step": 206291, "epoch": 4911} {"train_loss": -7.329862594604492, "global_step": 206292, "epoch": 4911} {"train_loss": -7.284847259521484, "global_step": 206293, "epoch": 4911} {"train_loss": -7.3747358322143555, "global_step": 206294, "epoch": 4911} {"train_loss": -7.281038284301758, "global_step": 206295, "epoch": 4911} {"train_loss": -7.172027587890625, "global_step": 206296, "epoch": 4911} {"train_loss": -7.267603397369385, "global_step": 206297, "epoch": 4911} {"train_loss": -7.056073188781738, "global_step": 206298, "epoch": 4911} {"train_loss": -7.280688285827637, "global_step": 206299, "epoch": 4911} {"train_loss": -7.213258266448975, "global_step": 206300, "epoch": 4911} {"train_loss": -7.1725873947143555, "global_step": 206301, "epoch": 4911} {"train_loss": -7.391452312469482, "global_step": 206302, "epoch": 4911} {"train_loss": -7.300868227368309, "global_step": 206303, "epoch": 4911, "val_loss": 70207.2265625} {"train_loss": -7.258105278015137, "global_step": 206304, "epoch": 4912} {"train_loss": -7.344551086425781, "global_step": 206305, "epoch": 4912} {"train_loss": -7.232170104980469, "global_step": 206306, "epoch": 4912} {"train_loss": -7.223613262176514, "global_step": 206307, "epoch": 4912} {"train_loss": -7.268531322479248, "global_step": 206308, "epoch": 4912} {"train_loss": -7.203894138336182, "global_step": 206309, "epoch": 4912} {"train_loss": -7.289639949798584, "global_step": 206310, "epoch": 4912} {"train_loss": -7.1664719581604, "global_step": 206311, "epoch": 4912} {"train_loss": -7.234818458557129, "global_step": 206312, "epoch": 4912} {"train_loss": -7.193006992340088, "global_step": 206313, "epoch": 4912} {"train_loss": -7.234181880950928, "global_step": 206314, "epoch": 4912} {"train_loss": -7.264398574829102, "global_step": 206315, "epoch": 4912} {"train_loss": -7.344122886657715, "global_step": 206316, "epoch": 4912} {"train_loss": -7.176078796386719, "global_step": 206317, "epoch": 4912} {"train_loss": -7.233621597290039, "global_step": 206318, "epoch": 4912} {"train_loss": -7.23344612121582, "global_step": 206319, "epoch": 4912} {"train_loss": -7.22035026550293, "global_step": 206320, "epoch": 4912} {"train_loss": -7.337756156921387, "global_step": 206321, "epoch": 4912} {"train_loss": -7.210273742675781, "global_step": 206322, "epoch": 4912} {"train_loss": -7.313229560852051, "global_step": 206323, "epoch": 4912} {"train_loss": -7.305758476257324, "global_step": 206324, "epoch": 4912} {"train_loss": -7.300693511962891, "global_step": 206325, "epoch": 4912} {"train_loss": -7.1579437255859375, "global_step": 206326, "epoch": 4912} {"train_loss": -7.296341896057129, "global_step": 206327, "epoch": 4912} {"train_loss": -7.178746223449707, "global_step": 206328, "epoch": 4912} {"train_loss": -7.230445861816406, "global_step": 206329, "epoch": 4912} {"train_loss": -7.23429536819458, "global_step": 206330, "epoch": 4912} {"train_loss": -7.235367774963379, "global_step": 206331, "epoch": 4912} {"train_loss": -7.29991340637207, "global_step": 206332, "epoch": 4912} {"train_loss": -7.292051792144775, "global_step": 206333, "epoch": 4912} {"train_loss": -7.353029251098633, "global_step": 206334, "epoch": 4912} {"train_loss": -7.34235954284668, "global_step": 206335, "epoch": 4912} {"train_loss": -7.296640872955322, "global_step": 206336, "epoch": 4912} {"train_loss": -7.377199172973633, "global_step": 206337, "epoch": 4912} {"train_loss": -7.339564323425293, "global_step": 206338, "epoch": 4912} {"train_loss": -7.38007926940918, "global_step": 206339, "epoch": 4912} {"train_loss": -7.390843868255615, "global_step": 206340, "epoch": 4912} {"train_loss": -7.3775105476379395, "global_step": 206341, "epoch": 4912} {"train_loss": -7.396947860717773, "global_step": 206342, "epoch": 4912} {"train_loss": -7.385431289672852, "global_step": 206343, "epoch": 4912} {"train_loss": -7.297222137451172, "global_step": 206344, "epoch": 4912} {"train_loss": -7.28357534181504, "global_step": 206345, "epoch": 4912, "val_loss": 69997.6484375} {"train_loss": -7.405729293823242, "global_step": 206346, "epoch": 4913} {"train_loss": -7.333127975463867, "global_step": 206347, "epoch": 4913} {"train_loss": -7.356800556182861, "global_step": 206348, "epoch": 4913} {"train_loss": -7.396614074707031, "global_step": 206349, "epoch": 4913} {"train_loss": -7.363922595977783, "global_step": 206350, "epoch": 4913} {"train_loss": -7.314963340759277, "global_step": 206351, "epoch": 4913} {"train_loss": -7.33259391784668, "global_step": 206352, "epoch": 4913} {"train_loss": -7.149677276611328, "global_step": 206353, "epoch": 4913} {"train_loss": -7.416290283203125, "global_step": 206354, "epoch": 4913} {"train_loss": -7.313410758972168, "global_step": 206355, "epoch": 4913} {"train_loss": -7.311629772186279, "global_step": 206356, "epoch": 4913} {"train_loss": -7.380964279174805, "global_step": 206357, "epoch": 4913} {"train_loss": -7.450726509094238, "global_step": 206358, "epoch": 4913} {"train_loss": -7.371258735656738, "global_step": 206359, "epoch": 4913} {"train_loss": -7.333799362182617, "global_step": 206360, "epoch": 4913} {"train_loss": -7.292788028717041, "global_step": 206361, "epoch": 4913} {"train_loss": -7.406002998352051, "global_step": 206362, "epoch": 4913} {"train_loss": -7.383008003234863, "global_step": 206363, "epoch": 4913} {"train_loss": -7.240667343139648, "global_step": 206364, "epoch": 4913} {"train_loss": -7.3141937255859375, "global_step": 206365, "epoch": 4913} {"train_loss": -7.2422332763671875, "global_step": 206366, "epoch": 4913} {"train_loss": -7.299089431762695, "global_step": 206367, "epoch": 4913} {"train_loss": -7.207756996154785, "global_step": 206368, "epoch": 4913} {"train_loss": -7.2294111251831055, "global_step": 206369, "epoch": 4913} {"train_loss": -7.304430961608887, "global_step": 206370, "epoch": 4913} {"train_loss": -7.31828498840332, "global_step": 206371, "epoch": 4913} {"train_loss": -7.225733757019043, "global_step": 206372, "epoch": 4913} {"train_loss": -7.0124921798706055, "global_step": 206373, "epoch": 4913} {"train_loss": -7.273832321166992, "global_step": 206374, "epoch": 4913} {"train_loss": -7.211898326873779, "global_step": 206375, "epoch": 4913} {"train_loss": -7.163051605224609, "global_step": 206376, "epoch": 4913} {"train_loss": -7.240952014923096, "global_step": 206377, "epoch": 4913} {"train_loss": -7.18902587890625, "global_step": 206378, "epoch": 4913} {"train_loss": -7.2070512771606445, "global_step": 206379, "epoch": 4913} {"train_loss": -7.257289409637451, "global_step": 206380, "epoch": 4913} {"train_loss": -7.220890045166016, "global_step": 206381, "epoch": 4913} {"train_loss": -7.304190635681152, "global_step": 206382, "epoch": 4913} {"train_loss": -7.293834686279297, "global_step": 206383, "epoch": 4913} {"train_loss": -7.2223992347717285, "global_step": 206384, "epoch": 4913} {"train_loss": -7.240228652954102, "global_step": 206385, "epoch": 4913} {"train_loss": -7.14625358581543, "global_step": 206386, "epoch": 4913} {"train_loss": -7.283393791743687, "global_step": 206387, "epoch": 4913, "val_loss": 69937.7578125} {"train_loss": -7.286092758178711, "global_step": 206388, "epoch": 4914} {"train_loss": -7.207948684692383, "global_step": 206389, "epoch": 4914} {"train_loss": -7.228221893310547, "global_step": 206390, "epoch": 4914} {"train_loss": -7.07466983795166, "global_step": 206391, "epoch": 4914} {"train_loss": -7.267759799957275, "global_step": 206392, "epoch": 4914} {"train_loss": -7.140137195587158, "global_step": 206393, "epoch": 4914} {"train_loss": -7.3958330154418945, "global_step": 206394, "epoch": 4914} {"train_loss": -7.2076568603515625, "global_step": 206395, "epoch": 4914} {"train_loss": -7.297121047973633, "global_step": 206396, "epoch": 4914} {"train_loss": -7.34788179397583, "global_step": 206397, "epoch": 4914} {"train_loss": -7.1833624839782715, "global_step": 206398, "epoch": 4914} {"train_loss": -7.373615264892578, "global_step": 206399, "epoch": 4914} {"train_loss": -7.2629218101501465, "global_step": 206400, "epoch": 4914} {"train_loss": -7.361963272094727, "global_step": 206401, "epoch": 4914} {"train_loss": -7.316202163696289, "global_step": 206402, "epoch": 4914} {"train_loss": -7.20926570892334, "global_step": 206403, "epoch": 4914} {"train_loss": -7.390764236450195, "global_step": 206404, "epoch": 4914} {"train_loss": -7.463768005371094, "global_step": 206405, "epoch": 4914} {"train_loss": -7.343132972717285, "global_step": 206406, "epoch": 4914} {"train_loss": -7.360779762268066, "global_step": 206407, "epoch": 4914} {"train_loss": -7.364840507507324, "global_step": 206408, "epoch": 4914} {"train_loss": -7.405483245849609, "global_step": 206409, "epoch": 4914} {"train_loss": -7.251821517944336, "global_step": 206410, "epoch": 4914} {"train_loss": -7.343815803527832, "global_step": 206411, "epoch": 4914} {"train_loss": -7.360649108886719, "global_step": 206412, "epoch": 4914} {"train_loss": -7.359245300292969, "global_step": 206413, "epoch": 4914} {"train_loss": -7.274561882019043, "global_step": 206414, "epoch": 4914} {"train_loss": -7.399125099182129, "global_step": 206415, "epoch": 4914} {"train_loss": -7.327237606048584, "global_step": 206416, "epoch": 4914} {"train_loss": -7.397009372711182, "global_step": 206417, "epoch": 4914} {"train_loss": -7.259586334228516, "global_step": 206418, "epoch": 4914} {"train_loss": -7.3322434425354, "global_step": 206419, "epoch": 4914} {"train_loss": -7.3453474044799805, "global_step": 206420, "epoch": 4914} {"train_loss": -7.298439025878906, "global_step": 206421, "epoch": 4914} {"train_loss": -7.240154266357422, "global_step": 206422, "epoch": 4914} {"train_loss": -7.283124923706055, "global_step": 206423, "epoch": 4914} {"train_loss": -7.353525161743164, "global_step": 206424, "epoch": 4914} {"train_loss": -7.256475925445557, "global_step": 206425, "epoch": 4914} {"train_loss": -7.225554466247559, "global_step": 206426, "epoch": 4914} {"train_loss": -7.208442211151123, "global_step": 206427, "epoch": 4914} {"train_loss": -7.207652568817139, "global_step": 206428, "epoch": 4914} {"train_loss": -7.297604186194284, "global_step": 206429, "epoch": 4914, "val_loss": 70174.625} {"train_loss": -7.311872959136963, "global_step": 206430, "epoch": 4915} {"train_loss": -7.289053916931152, "global_step": 206431, "epoch": 4915} {"train_loss": -7.270590782165527, "global_step": 206432, "epoch": 4915} {"train_loss": -7.260742664337158, "global_step": 206433, "epoch": 4915} {"train_loss": -7.2146992683410645, "global_step": 206434, "epoch": 4915} {"train_loss": -7.3379716873168945, "global_step": 206435, "epoch": 4915} {"train_loss": -7.246576309204102, "global_step": 206436, "epoch": 4915} {"train_loss": -7.427877426147461, "global_step": 206437, "epoch": 4915} {"train_loss": -7.336365699768066, "global_step": 206438, "epoch": 4915} {"train_loss": -7.287817001342773, "global_step": 206439, "epoch": 4915} {"train_loss": -7.344918251037598, "global_step": 206440, "epoch": 4915} {"train_loss": -7.229797840118408, "global_step": 206441, "epoch": 4915} {"train_loss": -7.297250747680664, "global_step": 206442, "epoch": 4915} {"train_loss": -7.350332260131836, "global_step": 206443, "epoch": 4915} {"train_loss": -7.254990577697754, "global_step": 206444, "epoch": 4915} {"train_loss": -7.23726749420166, "global_step": 206445, "epoch": 4915} {"train_loss": -7.338454246520996, "global_step": 206446, "epoch": 4915} {"train_loss": -7.318346977233887, "global_step": 206447, "epoch": 4915} {"train_loss": -7.247570991516113, "global_step": 206448, "epoch": 4915} {"train_loss": -7.329110145568848, "global_step": 206449, "epoch": 4915} {"train_loss": -7.334193706512451, "global_step": 206450, "epoch": 4915} {"train_loss": -7.291066646575928, "global_step": 206451, "epoch": 4915} {"train_loss": -7.427692413330078, "global_step": 206452, "epoch": 4915} {"train_loss": -7.210771083831787, "global_step": 206453, "epoch": 4915} {"train_loss": -7.236368179321289, "global_step": 206454, "epoch": 4915} {"train_loss": -7.333104610443115, "global_step": 206455, "epoch": 4915} {"train_loss": -7.314046859741211, "global_step": 206456, "epoch": 4915} {"train_loss": -7.261702060699463, "global_step": 206457, "epoch": 4915} {"train_loss": -7.404894828796387, "global_step": 206458, "epoch": 4915} {"train_loss": -7.346292495727539, "global_step": 206459, "epoch": 4915} {"train_loss": -7.396291732788086, "global_step": 206460, "epoch": 4915} {"train_loss": -7.439748764038086, "global_step": 206461, "epoch": 4915} {"train_loss": -7.461267948150635, "global_step": 206462, "epoch": 4915} {"train_loss": -7.313955307006836, "global_step": 206463, "epoch": 4915} {"train_loss": -7.320398330688477, "global_step": 206464, "epoch": 4915} {"train_loss": -7.320900917053223, "global_step": 206465, "epoch": 4915} {"train_loss": -7.288883209228516, "global_step": 206466, "epoch": 4915} {"train_loss": -7.382846832275391, "global_step": 206467, "epoch": 4915} {"train_loss": -7.321111679077148, "global_step": 206468, "epoch": 4915} {"train_loss": -7.206045150756836, "global_step": 206469, "epoch": 4915} {"train_loss": -7.385344982147217, "global_step": 206470, "epoch": 4915} {"train_loss": -7.312841642470587, "global_step": 206471, "epoch": 4915, "val_loss": 70105.5390625} {"train_loss": -7.2369704246521, "global_step": 206472, "epoch": 4916} {"train_loss": -7.347504138946533, "global_step": 206473, "epoch": 4916} {"train_loss": -7.210814476013184, "global_step": 206474, "epoch": 4916} {"train_loss": -7.327230930328369, "global_step": 206475, "epoch": 4916} {"train_loss": -7.286953926086426, "global_step": 206476, "epoch": 4916} {"train_loss": -7.330446243286133, "global_step": 206477, "epoch": 4916} {"train_loss": -7.404134750366211, "global_step": 206478, "epoch": 4916} {"train_loss": -7.350000858306885, "global_step": 206479, "epoch": 4916} {"train_loss": -7.29464054107666, "global_step": 206480, "epoch": 4916} {"train_loss": -7.2817888259887695, "global_step": 206481, "epoch": 4916} {"train_loss": -7.307117462158203, "global_step": 206482, "epoch": 4916} {"train_loss": -7.344124794006348, "global_step": 206483, "epoch": 4916} {"train_loss": -7.327610015869141, "global_step": 206484, "epoch": 4916} {"train_loss": -7.451545238494873, "global_step": 206485, "epoch": 4916} {"train_loss": -7.312652111053467, "global_step": 206486, "epoch": 4916} {"train_loss": -7.319921493530273, "global_step": 206487, "epoch": 4916} {"train_loss": -7.385014533996582, "global_step": 206488, "epoch": 4916} {"train_loss": -7.3385748863220215, "global_step": 206489, "epoch": 4916} {"train_loss": -7.181424140930176, "global_step": 206490, "epoch": 4916} {"train_loss": -7.304265022277832, "global_step": 206491, "epoch": 4916} {"train_loss": -7.277482986450195, "global_step": 206492, "epoch": 4916} {"train_loss": -7.234144687652588, "global_step": 206493, "epoch": 4916} {"train_loss": -7.301530838012695, "global_step": 206494, "epoch": 4916} {"train_loss": -7.218348503112793, "global_step": 206495, "epoch": 4916} {"train_loss": -7.253345966339111, "global_step": 206496, "epoch": 4916} {"train_loss": -7.275666236877441, "global_step": 206497, "epoch": 4916} {"train_loss": -7.427249908447266, "global_step": 206498, "epoch": 4916} {"train_loss": -7.214110374450684, "global_step": 206499, "epoch": 4916} {"train_loss": -7.306090831756592, "global_step": 206500, "epoch": 4916} {"train_loss": -7.341418743133545, "global_step": 206501, "epoch": 4916} {"train_loss": -7.259727478027344, "global_step": 206502, "epoch": 4916} {"train_loss": -7.3168840408325195, "global_step": 206503, "epoch": 4916} {"train_loss": -7.320832252502441, "global_step": 206504, "epoch": 4916} {"train_loss": -7.140571594238281, "global_step": 206505, "epoch": 4916} {"train_loss": -7.316015720367432, "global_step": 206506, "epoch": 4916} {"train_loss": -7.382372856140137, "global_step": 206507, "epoch": 4916} {"train_loss": -7.286844253540039, "global_step": 206508, "epoch": 4916} {"train_loss": -7.440957546234131, "global_step": 206509, "epoch": 4916} {"train_loss": -7.320198059082031, "global_step": 206510, "epoch": 4916} {"train_loss": -7.319691181182861, "global_step": 206511, "epoch": 4916} {"train_loss": -7.345969200134277, "global_step": 206512, "epoch": 4916} {"train_loss": -7.309163388751802, "global_step": 206513, "epoch": 4916, "val_loss": 69982.6875} {"train_loss": -7.226436138153076, "global_step": 206514, "epoch": 4917} {"train_loss": -7.362464904785156, "global_step": 206515, "epoch": 4917} {"train_loss": -7.422921657562256, "global_step": 206516, "epoch": 4917} {"train_loss": -7.29283332824707, "global_step": 206517, "epoch": 4917} {"train_loss": -7.439617156982422, "global_step": 206518, "epoch": 4917} {"train_loss": -7.363621711730957, "global_step": 206519, "epoch": 4917} {"train_loss": -7.427850723266602, "global_step": 206520, "epoch": 4917} {"train_loss": -7.3702592849731445, "global_step": 206521, "epoch": 4917} {"train_loss": -7.402196407318115, "global_step": 206522, "epoch": 4917} {"train_loss": -7.411198616027832, "global_step": 206523, "epoch": 4917} {"train_loss": -7.346920490264893, "global_step": 206524, "epoch": 4917} {"train_loss": -7.3786115646362305, "global_step": 206525, "epoch": 4917} {"train_loss": -7.309739112854004, "global_step": 206526, "epoch": 4917} {"train_loss": -7.502641677856445, "global_step": 206527, "epoch": 4917} {"train_loss": -7.374833106994629, "global_step": 206528, "epoch": 4917} {"train_loss": -7.298399925231934, "global_step": 206529, "epoch": 4917} {"train_loss": -7.455591201782227, "global_step": 206530, "epoch": 4917} {"train_loss": -7.158046722412109, "global_step": 206531, "epoch": 4917} {"train_loss": -7.190471172332764, "global_step": 206532, "epoch": 4917} {"train_loss": -7.2344818115234375, "global_step": 206533, "epoch": 4917} {"train_loss": -7.364262580871582, "global_step": 206534, "epoch": 4917} {"train_loss": -7.30485725402832, "global_step": 206535, "epoch": 4917} {"train_loss": -7.249749183654785, "global_step": 206536, "epoch": 4917} {"train_loss": -7.358077049255371, "global_step": 206537, "epoch": 4917} {"train_loss": -7.38877010345459, "global_step": 206538, "epoch": 4917} {"train_loss": -7.329578399658203, "global_step": 206539, "epoch": 4917} {"train_loss": -7.3708624839782715, "global_step": 206540, "epoch": 4917} {"train_loss": -7.351587295532227, "global_step": 206541, "epoch": 4917} {"train_loss": -7.33345890045166, "global_step": 206542, "epoch": 4917} {"train_loss": -7.336142539978027, "global_step": 206543, "epoch": 4917} {"train_loss": -7.47833251953125, "global_step": 206544, "epoch": 4917} {"train_loss": -7.325522422790527, "global_step": 206545, "epoch": 4917} {"train_loss": -7.295650482177734, "global_step": 206546, "epoch": 4917} {"train_loss": -7.452740669250488, "global_step": 206547, "epoch": 4917} {"train_loss": -7.341835975646973, "global_step": 206548, "epoch": 4917} {"train_loss": -7.196994781494141, "global_step": 206549, "epoch": 4917} {"train_loss": -7.324434280395508, "global_step": 206550, "epoch": 4917} {"train_loss": -7.390105247497559, "global_step": 206551, "epoch": 4917} {"train_loss": -7.309201240539551, "global_step": 206552, "epoch": 4917} {"train_loss": -7.35556697845459, "global_step": 206553, "epoch": 4917} {"train_loss": -7.2240447998046875, "global_step": 206554, "epoch": 4917} {"train_loss": -7.342698744365147, "global_step": 206555, "epoch": 4917, "val_loss": 69847.0390625} {"train_loss": -7.312225341796875, "global_step": 206556, "epoch": 4918} {"train_loss": -7.351542949676514, "global_step": 206557, "epoch": 4918} {"train_loss": -7.347017288208008, "global_step": 206558, "epoch": 4918} {"train_loss": -7.342406749725342, "global_step": 206559, "epoch": 4918} {"train_loss": -7.371386528015137, "global_step": 206560, "epoch": 4918} {"train_loss": -7.3371734619140625, "global_step": 206561, "epoch": 4918} {"train_loss": -7.457099914550781, "global_step": 206562, "epoch": 4918} {"train_loss": -7.341484546661377, "global_step": 206563, "epoch": 4918} {"train_loss": -7.341650009155273, "global_step": 206564, "epoch": 4918} {"train_loss": -7.277332305908203, "global_step": 206565, "epoch": 4918} {"train_loss": -7.333645820617676, "global_step": 206566, "epoch": 4918} {"train_loss": -7.288751602172852, "global_step": 206567, "epoch": 4918} {"train_loss": -7.419354438781738, "global_step": 206568, "epoch": 4918} {"train_loss": -7.326085090637207, "global_step": 206569, "epoch": 4918} {"train_loss": -7.280474662780762, "global_step": 206570, "epoch": 4918} {"train_loss": -7.387510299682617, "global_step": 206571, "epoch": 4918} {"train_loss": -7.296899795532227, "global_step": 206572, "epoch": 4918} {"train_loss": -7.378325939178467, "global_step": 206573, "epoch": 4918} {"train_loss": -7.321174144744873, "global_step": 206574, "epoch": 4918} {"train_loss": -7.25045919418335, "global_step": 206575, "epoch": 4918} {"train_loss": -7.33375358581543, "global_step": 206576, "epoch": 4918} {"train_loss": -7.278478622436523, "global_step": 206577, "epoch": 4918} {"train_loss": -7.38173770904541, "global_step": 206578, "epoch": 4918} {"train_loss": -7.300271034240723, "global_step": 206579, "epoch": 4918} {"train_loss": -7.340030193328857, "global_step": 206580, "epoch": 4918} {"train_loss": -7.279329299926758, "global_step": 206581, "epoch": 4918} {"train_loss": -7.163043022155762, "global_step": 206582, "epoch": 4918} {"train_loss": -7.371471405029297, "global_step": 206583, "epoch": 4918} {"train_loss": -7.238670349121094, "global_step": 206584, "epoch": 4918} {"train_loss": -7.168577194213867, "global_step": 206585, "epoch": 4918} {"train_loss": -7.323451995849609, "global_step": 206586, "epoch": 4918} {"train_loss": -7.268190383911133, "global_step": 206587, "epoch": 4918} {"train_loss": -7.204451560974121, "global_step": 206588, "epoch": 4918} {"train_loss": -7.27890157699585, "global_step": 206589, "epoch": 4918} {"train_loss": -7.236737251281738, "global_step": 206590, "epoch": 4918} {"train_loss": -7.236072063446045, "global_step": 206591, "epoch": 4918} {"train_loss": -7.203500270843506, "global_step": 206592, "epoch": 4918} {"train_loss": -7.087044715881348, "global_step": 206593, "epoch": 4918} {"train_loss": -7.299224853515625, "global_step": 206594, "epoch": 4918} {"train_loss": -7.085773468017578, "global_step": 206595, "epoch": 4918} {"train_loss": -7.319697380065918, "global_step": 206596, "epoch": 4918} {"train_loss": -7.297404550370716, "global_step": 206597, "epoch": 4918, "val_loss": 70077.328125} {"train_loss": -7.313839912414551, "global_step": 206598, "epoch": 4919} {"train_loss": -7.255438327789307, "global_step": 206599, "epoch": 4919} {"train_loss": -7.228907108306885, "global_step": 206600, "epoch": 4919} {"train_loss": -7.327293395996094, "global_step": 206601, "epoch": 4919} {"train_loss": -7.264673709869385, "global_step": 206602, "epoch": 4919} {"train_loss": -7.231930732727051, "global_step": 206603, "epoch": 4919} {"train_loss": -7.207617282867432, "global_step": 206604, "epoch": 4919} {"train_loss": -7.321288108825684, "global_step": 206605, "epoch": 4919} {"train_loss": -7.26536750793457, "global_step": 206606, "epoch": 4919} {"train_loss": -7.179985046386719, "global_step": 206607, "epoch": 4919} {"train_loss": -7.343716621398926, "global_step": 206608, "epoch": 4919} {"train_loss": -7.068885803222656, "global_step": 206609, "epoch": 4919} {"train_loss": -7.29014778137207, "global_step": 206610, "epoch": 4919} {"train_loss": -7.358084678649902, "global_step": 206611, "epoch": 4919} {"train_loss": -7.121797561645508, "global_step": 206612, "epoch": 4919} {"train_loss": -6.988097190856934, "global_step": 206613, "epoch": 4919} {"train_loss": -7.256021499633789, "global_step": 206614, "epoch": 4919} {"train_loss": -6.98673152923584, "global_step": 206615, "epoch": 4919} {"train_loss": -7.323037147521973, "global_step": 206616, "epoch": 4919} {"train_loss": -7.2293291091918945, "global_step": 206617, "epoch": 4919} {"train_loss": -7.223752021789551, "global_step": 206618, "epoch": 4919} {"train_loss": -7.158410549163818, "global_step": 206619, "epoch": 4919} {"train_loss": -7.267622947692871, "global_step": 206620, "epoch": 4919} {"train_loss": -7.257948875427246, "global_step": 206621, "epoch": 4919} {"train_loss": -7.2960920333862305, "global_step": 206622, "epoch": 4919} {"train_loss": -7.224906921386719, "global_step": 206623, "epoch": 4919} {"train_loss": -7.270784378051758, "global_step": 206624, "epoch": 4919} {"train_loss": -7.289529800415039, "global_step": 206625, "epoch": 4919} {"train_loss": -7.192193984985352, "global_step": 206626, "epoch": 4919} {"train_loss": -7.288917541503906, "global_step": 206627, "epoch": 4919} {"train_loss": -7.354959487915039, "global_step": 206628, "epoch": 4919} {"train_loss": -7.216053009033203, "global_step": 206629, "epoch": 4919} {"train_loss": -7.299282550811768, "global_step": 206630, "epoch": 4919} {"train_loss": -7.289804458618164, "global_step": 206631, "epoch": 4919} {"train_loss": -7.300925254821777, "global_step": 206632, "epoch": 4919} {"train_loss": -7.292019844055176, "global_step": 206633, "epoch": 4919} {"train_loss": -7.29782772064209, "global_step": 206634, "epoch": 4919} {"train_loss": -7.167496204376221, "global_step": 206635, "epoch": 4919} {"train_loss": -7.16989803314209, "global_step": 206636, "epoch": 4919} {"train_loss": -7.245553970336914, "global_step": 206637, "epoch": 4919} {"train_loss": -7.156517028808594, "global_step": 206638, "epoch": 4919} {"train_loss": -7.23559402284168, "global_step": 206639, "epoch": 4919, "val_loss": 70127.078125} {"train_loss": -7.392121315002441, "global_step": 206640, "epoch": 4920} {"train_loss": -7.2436065673828125, "global_step": 206641, "epoch": 4920} {"train_loss": -7.182797431945801, "global_step": 206642, "epoch": 4920} {"train_loss": -7.399157524108887, "global_step": 206643, "epoch": 4920} {"train_loss": -7.224889278411865, "global_step": 206644, "epoch": 4920} {"train_loss": -7.262999534606934, "global_step": 206645, "epoch": 4920} {"train_loss": -7.216183185577393, "global_step": 206646, "epoch": 4920} {"train_loss": -7.241513252258301, "global_step": 206647, "epoch": 4920} {"train_loss": -7.243915557861328, "global_step": 206648, "epoch": 4920} {"train_loss": -7.135886192321777, "global_step": 206649, "epoch": 4920} {"train_loss": -7.134947776794434, "global_step": 206650, "epoch": 4920} {"train_loss": -7.034010887145996, "global_step": 206651, "epoch": 4920} {"train_loss": -7.276687145233154, "global_step": 206652, "epoch": 4920} {"train_loss": -7.226295471191406, "global_step": 206653, "epoch": 4920} {"train_loss": -7.228115558624268, "global_step": 206654, "epoch": 4920} {"train_loss": -7.154569625854492, "global_step": 206655, "epoch": 4920} {"train_loss": -7.1375017166137695, "global_step": 206656, "epoch": 4920} {"train_loss": -7.225788116455078, "global_step": 206657, "epoch": 4920} {"train_loss": -6.930566787719727, "global_step": 206658, "epoch": 4920} {"train_loss": -7.259134769439697, "global_step": 206659, "epoch": 4920} {"train_loss": -7.1993513107299805, "global_step": 206660, "epoch": 4920} {"train_loss": -7.139832496643066, "global_step": 206661, "epoch": 4920} {"train_loss": -7.147447109222412, "global_step": 206662, "epoch": 4920} {"train_loss": -7.299161911010742, "global_step": 206663, "epoch": 4920} {"train_loss": -7.065745830535889, "global_step": 206664, "epoch": 4920} {"train_loss": -7.369078159332275, "global_step": 206665, "epoch": 4920} {"train_loss": -7.053432941436768, "global_step": 206666, "epoch": 4920} {"train_loss": -7.2775397300720215, "global_step": 206667, "epoch": 4920} {"train_loss": -7.193444728851318, "global_step": 206668, "epoch": 4920} {"train_loss": -7.258745193481445, "global_step": 206669, "epoch": 4920} {"train_loss": -7.220681190490723, "global_step": 206670, "epoch": 4920} {"train_loss": -7.2568793296813965, "global_step": 206671, "epoch": 4920} {"train_loss": -7.252204418182373, "global_step": 206672, "epoch": 4920} {"train_loss": -7.2793755531311035, "global_step": 206673, "epoch": 4920} {"train_loss": -7.285521984100342, "global_step": 206674, "epoch": 4920} {"train_loss": -7.28226375579834, "global_step": 206675, "epoch": 4920} {"train_loss": -7.3255414962768555, "global_step": 206676, "epoch": 4920} {"train_loss": -7.284444808959961, "global_step": 206677, "epoch": 4920} {"train_loss": -7.322168827056885, "global_step": 206678, "epoch": 4920} {"train_loss": -7.330121994018555, "global_step": 206679, "epoch": 4920} {"train_loss": -7.348627090454102, "global_step": 206680, "epoch": 4920} {"train_loss": -7.229364542734055, "global_step": 206681, "epoch": 4920, "val_loss": 70005.2421875} {"train_loss": -7.260656356811523, "global_step": 206682, "epoch": 4921} {"train_loss": -7.245543479919434, "global_step": 206683, "epoch": 4921} {"train_loss": -7.412193775177002, "global_step": 206684, "epoch": 4921} {"train_loss": -7.425141334533691, "global_step": 206685, "epoch": 4921} {"train_loss": -7.294067859649658, "global_step": 206686, "epoch": 4921} {"train_loss": -7.445349216461182, "global_step": 206687, "epoch": 4921} {"train_loss": -7.439079284667969, "global_step": 206688, "epoch": 4921} {"train_loss": -7.315019607543945, "global_step": 206689, "epoch": 4921} {"train_loss": -7.380200386047363, "global_step": 206690, "epoch": 4921} {"train_loss": -7.392936706542969, "global_step": 206691, "epoch": 4921} {"train_loss": -7.331459045410156, "global_step": 206692, "epoch": 4921} {"train_loss": -7.326102256774902, "global_step": 206693, "epoch": 4921} {"train_loss": -7.438200950622559, "global_step": 206694, "epoch": 4921} {"train_loss": -7.390408515930176, "global_step": 206695, "epoch": 4921} {"train_loss": -7.3793230056762695, "global_step": 206696, "epoch": 4921} {"train_loss": -7.217268466949463, "global_step": 206697, "epoch": 4921} {"train_loss": -7.333054542541504, "global_step": 206698, "epoch": 4921} {"train_loss": -7.364627361297607, "global_step": 206699, "epoch": 4921} {"train_loss": -7.404112815856934, "global_step": 206700, "epoch": 4921} {"train_loss": -7.326281547546387, "global_step": 206701, "epoch": 4921} {"train_loss": -7.432831764221191, "global_step": 206702, "epoch": 4921} {"train_loss": -7.441274642944336, "global_step": 206703, "epoch": 4921} {"train_loss": -7.388199329376221, "global_step": 206704, "epoch": 4921} {"train_loss": -7.357737064361572, "global_step": 206705, "epoch": 4921} {"train_loss": -7.337934494018555, "global_step": 206706, "epoch": 4921} {"train_loss": -7.245121002197266, "global_step": 206707, "epoch": 4921} {"train_loss": -7.361123085021973, "global_step": 206708, "epoch": 4921} {"train_loss": -7.19849157333374, "global_step": 206709, "epoch": 4921} {"train_loss": -7.33809757232666, "global_step": 206710, "epoch": 4921} {"train_loss": -7.411525726318359, "global_step": 206711, "epoch": 4921} {"train_loss": -7.391469478607178, "global_step": 206712, "epoch": 4921} {"train_loss": -7.384969711303711, "global_step": 206713, "epoch": 4921} {"train_loss": -7.344194412231445, "global_step": 206714, "epoch": 4921} {"train_loss": -7.306278228759766, "global_step": 206715, "epoch": 4921} {"train_loss": -7.311960220336914, "global_step": 206716, "epoch": 4921} {"train_loss": -7.33931827545166, "global_step": 206717, "epoch": 4921} {"train_loss": -7.299778461456299, "global_step": 206718, "epoch": 4921} {"train_loss": -7.30624532699585, "global_step": 206719, "epoch": 4921} {"train_loss": -7.416922569274902, "global_step": 206720, "epoch": 4921} {"train_loss": -7.390777111053467, "global_step": 206721, "epoch": 4921} {"train_loss": -7.250734329223633, "global_step": 206722, "epoch": 4921} {"train_loss": -7.351144529524303, "global_step": 206723, "epoch": 4921, "val_loss": 69920.03125} {"train_loss": -7.300364017486572, "global_step": 206724, "epoch": 4922} {"train_loss": -7.384405136108398, "global_step": 206725, "epoch": 4922} {"train_loss": -7.45111608505249, "global_step": 206726, "epoch": 4922} {"train_loss": -7.367105007171631, "global_step": 206727, "epoch": 4922} {"train_loss": -7.4592437744140625, "global_step": 206728, "epoch": 4922} {"train_loss": -7.489252090454102, "global_step": 206729, "epoch": 4922} {"train_loss": -7.39920711517334, "global_step": 206730, "epoch": 4922} {"train_loss": -7.418951988220215, "global_step": 206731, "epoch": 4922} {"train_loss": -7.339846611022949, "global_step": 206732, "epoch": 4922} {"train_loss": -7.441873073577881, "global_step": 206733, "epoch": 4922} {"train_loss": -7.373787879943848, "global_step": 206734, "epoch": 4922} {"train_loss": -7.4397406578063965, "global_step": 206735, "epoch": 4922} {"train_loss": -7.383403778076172, "global_step": 206736, "epoch": 4922} {"train_loss": -7.292637825012207, "global_step": 206737, "epoch": 4922} {"train_loss": -7.429609298706055, "global_step": 206738, "epoch": 4922} {"train_loss": -7.341076374053955, "global_step": 206739, "epoch": 4922} {"train_loss": -7.302778720855713, "global_step": 206740, "epoch": 4922} {"train_loss": -7.4475908279418945, "global_step": 206741, "epoch": 4922} {"train_loss": -7.488958358764648, "global_step": 206742, "epoch": 4922} {"train_loss": -7.43129825592041, "global_step": 206743, "epoch": 4922} {"train_loss": -7.380491256713867, "global_step": 206744, "epoch": 4922} {"train_loss": -7.357370376586914, "global_step": 206745, "epoch": 4922} {"train_loss": -7.418346881866455, "global_step": 206746, "epoch": 4922} {"train_loss": -7.304362773895264, "global_step": 206747, "epoch": 4922} {"train_loss": -7.387790679931641, "global_step": 206748, "epoch": 4922} {"train_loss": -7.396622657775879, "global_step": 206749, "epoch": 4922} {"train_loss": -7.426579475402832, "global_step": 206750, "epoch": 4922} {"train_loss": -7.261734962463379, "global_step": 206751, "epoch": 4922} {"train_loss": -7.2802934646606445, "global_step": 206752, "epoch": 4922} {"train_loss": -7.306449890136719, "global_step": 206753, "epoch": 4922} {"train_loss": -7.403672695159912, "global_step": 206754, "epoch": 4922} {"train_loss": -7.406543731689453, "global_step": 206755, "epoch": 4922} {"train_loss": -7.356846332550049, "global_step": 206756, "epoch": 4922} {"train_loss": -7.316154479980469, "global_step": 206757, "epoch": 4922} {"train_loss": -7.356115341186523, "global_step": 206758, "epoch": 4922} {"train_loss": -7.420061111450195, "global_step": 206759, "epoch": 4922} {"train_loss": -7.353999137878418, "global_step": 206760, "epoch": 4922} {"train_loss": -7.320277690887451, "global_step": 206761, "epoch": 4922} {"train_loss": -7.362664699554443, "global_step": 206762, "epoch": 4922} {"train_loss": -7.356723785400391, "global_step": 206763, "epoch": 4922} {"train_loss": -7.303973197937012, "global_step": 206764, "epoch": 4922} {"train_loss": -7.374148107710338, "global_step": 206765, "epoch": 4922, "val_loss": 69985.0078125} {"train_loss": -7.33244514465332, "global_step": 206766, "epoch": 4923} {"train_loss": -7.3254194259643555, "global_step": 206767, "epoch": 4923} {"train_loss": -7.281583309173584, "global_step": 206768, "epoch": 4923} {"train_loss": -7.392516136169434, "global_step": 206769, "epoch": 4923} {"train_loss": -7.291582107543945, "global_step": 206770, "epoch": 4923} {"train_loss": -7.268043518066406, "global_step": 206771, "epoch": 4923} {"train_loss": -7.2977190017700195, "global_step": 206772, "epoch": 4923} {"train_loss": -7.3778791427612305, "global_step": 206773, "epoch": 4923} {"train_loss": -7.370787143707275, "global_step": 206774, "epoch": 4923} {"train_loss": -7.461732387542725, "global_step": 206775, "epoch": 4923} {"train_loss": -7.39318323135376, "global_step": 206776, "epoch": 4923} {"train_loss": -7.345536231994629, "global_step": 206777, "epoch": 4923} {"train_loss": -7.310697555541992, "global_step": 206778, "epoch": 4923} {"train_loss": -7.456681251525879, "global_step": 206779, "epoch": 4923} {"train_loss": -7.463390350341797, "global_step": 206780, "epoch": 4923} {"train_loss": -7.239260673522949, "global_step": 206781, "epoch": 4923} {"train_loss": -7.35709285736084, "global_step": 206782, "epoch": 4923} {"train_loss": -7.388583183288574, "global_step": 206783, "epoch": 4923} {"train_loss": -7.3188090324401855, "global_step": 206784, "epoch": 4923} {"train_loss": -7.205275535583496, "global_step": 206785, "epoch": 4923} {"train_loss": -7.291542053222656, "global_step": 206786, "epoch": 4923} {"train_loss": -7.39722204208374, "global_step": 206787, "epoch": 4923} {"train_loss": -7.312830924987793, "global_step": 206788, "epoch": 4923} {"train_loss": -7.270236968994141, "global_step": 206789, "epoch": 4923} {"train_loss": -7.307865619659424, "global_step": 206790, "epoch": 4923} {"train_loss": -7.401039123535156, "global_step": 206791, "epoch": 4923} {"train_loss": -7.131472587585449, "global_step": 206792, "epoch": 4923} {"train_loss": -7.226810455322266, "global_step": 206793, "epoch": 4923} {"train_loss": -7.104979991912842, "global_step": 206794, "epoch": 4923} {"train_loss": -7.254111289978027, "global_step": 206795, "epoch": 4923} {"train_loss": -7.130953311920166, "global_step": 206796, "epoch": 4923} {"train_loss": -7.246475696563721, "global_step": 206797, "epoch": 4923} {"train_loss": -7.34808349609375, "global_step": 206798, "epoch": 4923} {"train_loss": -7.16086483001709, "global_step": 206799, "epoch": 4923} {"train_loss": -7.226686000823975, "global_step": 206800, "epoch": 4923} {"train_loss": -7.141458511352539, "global_step": 206801, "epoch": 4923} {"train_loss": -7.2473883628845215, "global_step": 206802, "epoch": 4923} {"train_loss": -7.302475929260254, "global_step": 206803, "epoch": 4923} {"train_loss": -7.101970672607422, "global_step": 206804, "epoch": 4923} {"train_loss": -7.247559547424316, "global_step": 206805, "epoch": 4923} {"train_loss": -7.310101509094238, "global_step": 206806, "epoch": 4923} {"train_loss": -7.2929104169209795, "global_step": 206807, "epoch": 4923, "val_loss": 69978.7421875} {"train_loss": -7.313747406005859, "global_step": 206808, "epoch": 4924} {"train_loss": -7.228222370147705, "global_step": 206809, "epoch": 4924} {"train_loss": -7.291611671447754, "global_step": 206810, "epoch": 4924} {"train_loss": -7.388973712921143, "global_step": 206811, "epoch": 4924} {"train_loss": -7.232510566711426, "global_step": 206812, "epoch": 4924} {"train_loss": -7.299134254455566, "global_step": 206813, "epoch": 4924} {"train_loss": -7.1219482421875, "global_step": 206814, "epoch": 4924} {"train_loss": -7.2532124519348145, "global_step": 206815, "epoch": 4924} {"train_loss": -7.267138481140137, "global_step": 206816, "epoch": 4924} {"train_loss": -7.1637139320373535, "global_step": 206817, "epoch": 4924} {"train_loss": -7.3576555252075195, "global_step": 206818, "epoch": 4924} {"train_loss": -7.454015731811523, "global_step": 206819, "epoch": 4924} {"train_loss": -7.300562858581543, "global_step": 206820, "epoch": 4924} {"train_loss": -7.31463623046875, "global_step": 206821, "epoch": 4924} {"train_loss": -7.391030311584473, "global_step": 206822, "epoch": 4924} {"train_loss": -7.232109069824219, "global_step": 206823, "epoch": 4924} {"train_loss": -7.40181303024292, "global_step": 206824, "epoch": 4924} {"train_loss": -7.330063819885254, "global_step": 206825, "epoch": 4924} {"train_loss": -7.442331314086914, "global_step": 206826, "epoch": 4924} {"train_loss": -7.417421817779541, "global_step": 206827, "epoch": 4924} {"train_loss": -7.381916522979736, "global_step": 206828, "epoch": 4924} {"train_loss": -7.372799396514893, "global_step": 206829, "epoch": 4924} {"train_loss": -7.2592315673828125, "global_step": 206830, "epoch": 4924} {"train_loss": -7.292510986328125, "global_step": 206831, "epoch": 4924} {"train_loss": -7.313543319702148, "global_step": 206832, "epoch": 4924} {"train_loss": -7.276797294616699, "global_step": 206833, "epoch": 4924} {"train_loss": -7.2888288497924805, "global_step": 206834, "epoch": 4924} {"train_loss": -7.316124439239502, "global_step": 206835, "epoch": 4924} {"train_loss": -7.304542541503906, "global_step": 206836, "epoch": 4924} {"train_loss": -7.276492118835449, "global_step": 206837, "epoch": 4924} {"train_loss": -7.463368892669678, "global_step": 206838, "epoch": 4924} {"train_loss": -7.396106719970703, "global_step": 206839, "epoch": 4924} {"train_loss": -7.225640296936035, "global_step": 206840, "epoch": 4924} {"train_loss": -7.326173305511475, "global_step": 206841, "epoch": 4924} {"train_loss": -7.211591720581055, "global_step": 206842, "epoch": 4924} {"train_loss": -7.268306255340576, "global_step": 206843, "epoch": 4924} {"train_loss": -7.390108108520508, "global_step": 206844, "epoch": 4924} {"train_loss": -7.342984199523926, "global_step": 206845, "epoch": 4924} {"train_loss": -7.465991973876953, "global_step": 206846, "epoch": 4924} {"train_loss": -7.370882987976074, "global_step": 206847, "epoch": 4924} {"train_loss": -7.312480926513672, "global_step": 206848, "epoch": 4924} {"train_loss": -7.316072066624959, "global_step": 206849, "epoch": 4924, "val_loss": 70052.140625} {"train_loss": -7.322509765625, "global_step": 206850, "epoch": 4925} {"train_loss": -7.4390716552734375, "global_step": 206851, "epoch": 4925} {"train_loss": -7.3123931884765625, "global_step": 206852, "epoch": 4925} {"train_loss": -7.401381969451904, "global_step": 206853, "epoch": 4925} {"train_loss": -7.274598121643066, "global_step": 206854, "epoch": 4925} {"train_loss": -7.231174945831299, "global_step": 206855, "epoch": 4925} {"train_loss": -7.210302352905273, "global_step": 206856, "epoch": 4925} {"train_loss": -7.244323253631592, "global_step": 206857, "epoch": 4925} {"train_loss": -7.122870922088623, "global_step": 206858, "epoch": 4925} {"train_loss": -7.229334831237793, "global_step": 206859, "epoch": 4925} {"train_loss": -7.1319427490234375, "global_step": 206860, "epoch": 4925} {"train_loss": -7.165482521057129, "global_step": 206861, "epoch": 4925} {"train_loss": -7.144144535064697, "global_step": 206862, "epoch": 4925} {"train_loss": -6.906327247619629, "global_step": 206863, "epoch": 4925} {"train_loss": -7.235103607177734, "global_step": 206864, "epoch": 4925} {"train_loss": -7.082307815551758, "global_step": 206865, "epoch": 4925} {"train_loss": -7.234447956085205, "global_step": 206866, "epoch": 4925} {"train_loss": -7.149314880371094, "global_step": 206867, "epoch": 4925} {"train_loss": -7.018491268157959, "global_step": 206868, "epoch": 4925} {"train_loss": -7.1729278564453125, "global_step": 206869, "epoch": 4925} {"train_loss": -7.216525077819824, "global_step": 206870, "epoch": 4925} {"train_loss": -7.1110920906066895, "global_step": 206871, "epoch": 4925} {"train_loss": -7.247463703155518, "global_step": 206872, "epoch": 4925} {"train_loss": -7.207919120788574, "global_step": 206873, "epoch": 4925} {"train_loss": -7.223963737487793, "global_step": 206874, "epoch": 4925} {"train_loss": -7.190950393676758, "global_step": 206875, "epoch": 4925} {"train_loss": -7.214972972869873, "global_step": 206876, "epoch": 4925} {"train_loss": -7.10977840423584, "global_step": 206877, "epoch": 4925} {"train_loss": -7.177132606506348, "global_step": 206878, "epoch": 4925} {"train_loss": -7.286242485046387, "global_step": 206879, "epoch": 4925} {"train_loss": -7.239770889282227, "global_step": 206880, "epoch": 4925} {"train_loss": -7.234376907348633, "global_step": 206881, "epoch": 4925} {"train_loss": -7.276058673858643, "global_step": 206882, "epoch": 4925} {"train_loss": -7.224703788757324, "global_step": 206883, "epoch": 4925} {"train_loss": -7.259552955627441, "global_step": 206884, "epoch": 4925} {"train_loss": -7.221888542175293, "global_step": 206885, "epoch": 4925} {"train_loss": -7.239606857299805, "global_step": 206886, "epoch": 4925} {"train_loss": -7.209214687347412, "global_step": 206887, "epoch": 4925} {"train_loss": -7.3075995445251465, "global_step": 206888, "epoch": 4925} {"train_loss": -7.337407112121582, "global_step": 206889, "epoch": 4925} {"train_loss": -7.297236442565918, "global_step": 206890, "epoch": 4925} {"train_loss": -7.218214364278884, "global_step": 206891, "epoch": 4925, "val_loss": 69901.5859375} {"train_loss": -7.393220901489258, "global_step": 206892, "epoch": 4926} {"train_loss": -7.356200695037842, "global_step": 206893, "epoch": 4926} {"train_loss": -7.26528787612915, "global_step": 206894, "epoch": 4926} {"train_loss": -7.337919235229492, "global_step": 206895, "epoch": 4926} {"train_loss": -7.365119934082031, "global_step": 206896, "epoch": 4926} {"train_loss": -7.377760887145996, "global_step": 206897, "epoch": 4926} {"train_loss": -7.423520088195801, "global_step": 206898, "epoch": 4926} {"train_loss": -7.425745010375977, "global_step": 206899, "epoch": 4926} {"train_loss": -7.352568626403809, "global_step": 206900, "epoch": 4926} {"train_loss": -7.417234420776367, "global_step": 206901, "epoch": 4926} {"train_loss": -7.310460090637207, "global_step": 206902, "epoch": 4926} {"train_loss": -7.398083209991455, "global_step": 206903, "epoch": 4926} {"train_loss": -7.51601505279541, "global_step": 206904, "epoch": 4926} {"train_loss": -7.406264305114746, "global_step": 206905, "epoch": 4926} {"train_loss": -7.354778289794922, "global_step": 206906, "epoch": 4926} {"train_loss": -7.338850498199463, "global_step": 206907, "epoch": 4926} {"train_loss": -7.265947341918945, "global_step": 206908, "epoch": 4926} {"train_loss": -7.383596420288086, "global_step": 206909, "epoch": 4926} {"train_loss": -7.38757848739624, "global_step": 206910, "epoch": 4926} {"train_loss": -7.308587551116943, "global_step": 206911, "epoch": 4926} {"train_loss": -7.254781246185303, "global_step": 206912, "epoch": 4926} {"train_loss": -7.348332405090332, "global_step": 206913, "epoch": 4926} {"train_loss": -7.319734573364258, "global_step": 206914, "epoch": 4926} {"train_loss": -7.463016033172607, "global_step": 206915, "epoch": 4926} {"train_loss": -7.2550048828125, "global_step": 206916, "epoch": 4926} {"train_loss": -7.354263782501221, "global_step": 206917, "epoch": 4926} {"train_loss": -7.2884063720703125, "global_step": 206918, "epoch": 4926} {"train_loss": -7.304481029510498, "global_step": 206919, "epoch": 4926} {"train_loss": -7.228837966918945, "global_step": 206920, "epoch": 4926} {"train_loss": -7.452142238616943, "global_step": 206921, "epoch": 4926} {"train_loss": -7.313503265380859, "global_step": 206922, "epoch": 4926} {"train_loss": -7.3871941566467285, "global_step": 206923, "epoch": 4926} {"train_loss": -7.284424781799316, "global_step": 206924, "epoch": 4926} {"train_loss": -7.405439376831055, "global_step": 206925, "epoch": 4926} {"train_loss": -7.27137565612793, "global_step": 206926, "epoch": 4926} {"train_loss": -7.234414100646973, "global_step": 206927, "epoch": 4926} {"train_loss": -7.384232997894287, "global_step": 206928, "epoch": 4926} {"train_loss": -7.284872531890869, "global_step": 206929, "epoch": 4926} {"train_loss": -7.2742486000061035, "global_step": 206930, "epoch": 4926} {"train_loss": -7.305177211761475, "global_step": 206931, "epoch": 4926} {"train_loss": -7.216651916503906, "global_step": 206932, "epoch": 4926} {"train_loss": -7.339196398144677, "global_step": 206933, "epoch": 4926, "val_loss": 70069.9296875} {"train_loss": -7.327570915222168, "global_step": 206934, "epoch": 4927} {"train_loss": -7.416088581085205, "global_step": 206935, "epoch": 4927} {"train_loss": -7.419675827026367, "global_step": 206936, "epoch": 4927} {"train_loss": -7.33585262298584, "global_step": 206937, "epoch": 4927} {"train_loss": -7.254691123962402, "global_step": 206938, "epoch": 4927} {"train_loss": -7.272993087768555, "global_step": 206939, "epoch": 4927} {"train_loss": -7.227994918823242, "global_step": 206940, "epoch": 4927} {"train_loss": -7.262255668640137, "global_step": 206941, "epoch": 4927} {"train_loss": -7.179426670074463, "global_step": 206942, "epoch": 4927} {"train_loss": -7.429714679718018, "global_step": 206943, "epoch": 4927} {"train_loss": -7.296639919281006, "global_step": 206944, "epoch": 4927} {"train_loss": -7.248010635375977, "global_step": 206945, "epoch": 4927} {"train_loss": -7.43227481842041, "global_step": 206946, "epoch": 4927} {"train_loss": -7.320794582366943, "global_step": 206947, "epoch": 4927} {"train_loss": -7.28536319732666, "global_step": 206948, "epoch": 4927} {"train_loss": -7.209981918334961, "global_step": 206949, "epoch": 4927} {"train_loss": -7.340665817260742, "global_step": 206950, "epoch": 4927} {"train_loss": -7.267300605773926, "global_step": 206951, "epoch": 4927} {"train_loss": -7.265171051025391, "global_step": 206952, "epoch": 4927} {"train_loss": -7.320873260498047, "global_step": 206953, "epoch": 4927} {"train_loss": -7.2415337562561035, "global_step": 206954, "epoch": 4927} {"train_loss": -7.063486099243164, "global_step": 206955, "epoch": 4927} {"train_loss": -7.364468574523926, "global_step": 206956, "epoch": 4927} {"train_loss": -7.221857070922852, "global_step": 206957, "epoch": 4927} {"train_loss": -7.36580228805542, "global_step": 206958, "epoch": 4927} {"train_loss": -7.430480003356934, "global_step": 206959, "epoch": 4927} {"train_loss": -7.3411359786987305, "global_step": 206960, "epoch": 4927} {"train_loss": -7.371124267578125, "global_step": 206961, "epoch": 4927} {"train_loss": -7.322249412536621, "global_step": 206962, "epoch": 4927} {"train_loss": -7.281830310821533, "global_step": 206963, "epoch": 4927} {"train_loss": -7.293593406677246, "global_step": 206964, "epoch": 4927} {"train_loss": -7.299455165863037, "global_step": 206965, "epoch": 4927} {"train_loss": -7.27235221862793, "global_step": 206966, "epoch": 4927} {"train_loss": -7.151330947875977, "global_step": 206967, "epoch": 4927} {"train_loss": -7.336699962615967, "global_step": 206968, "epoch": 4927} {"train_loss": -7.312813758850098, "global_step": 206969, "epoch": 4927} {"train_loss": -7.299746513366699, "global_step": 206970, "epoch": 4927} {"train_loss": -7.261337757110596, "global_step": 206971, "epoch": 4927} {"train_loss": -7.348974704742432, "global_step": 206972, "epoch": 4927} {"train_loss": -7.218444347381592, "global_step": 206973, "epoch": 4927} {"train_loss": -7.162774085998535, "global_step": 206974, "epoch": 4927} {"train_loss": -7.292917240233648, "global_step": 206975, "epoch": 4927, "val_loss": 69984.140625} {"train_loss": -7.3182830810546875, "global_step": 206976, "epoch": 4928} {"train_loss": -7.34779167175293, "global_step": 206977, "epoch": 4928} {"train_loss": -7.255809783935547, "global_step": 206978, "epoch": 4928} {"train_loss": -7.312558174133301, "global_step": 206979, "epoch": 4928} {"train_loss": -7.288196563720703, "global_step": 206980, "epoch": 4928} {"train_loss": -7.220922470092773, "global_step": 206981, "epoch": 4928} {"train_loss": -7.2527265548706055, "global_step": 206982, "epoch": 4928} {"train_loss": -7.353697299957275, "global_step": 206983, "epoch": 4928} {"train_loss": -7.296243190765381, "global_step": 206984, "epoch": 4928} {"train_loss": -7.336327075958252, "global_step": 206985, "epoch": 4928} {"train_loss": -7.218057632446289, "global_step": 206986, "epoch": 4928} {"train_loss": -7.297023773193359, "global_step": 206987, "epoch": 4928} {"train_loss": -7.314014911651611, "global_step": 206988, "epoch": 4928} {"train_loss": -7.224286079406738, "global_step": 206989, "epoch": 4928} {"train_loss": -7.16679048538208, "global_step": 206990, "epoch": 4928} {"train_loss": -7.412522792816162, "global_step": 206991, "epoch": 4928} {"train_loss": -7.363490581512451, "global_step": 206992, "epoch": 4928} {"train_loss": -7.200784683227539, "global_step": 206993, "epoch": 4928} {"train_loss": -7.223233222961426, "global_step": 206994, "epoch": 4928} {"train_loss": -7.167860507965088, "global_step": 206995, "epoch": 4928} {"train_loss": -7.236057758331299, "global_step": 206996, "epoch": 4928} {"train_loss": -7.288959503173828, "global_step": 206997, "epoch": 4928} {"train_loss": -7.398693561553955, "global_step": 206998, "epoch": 4928} {"train_loss": -7.362138271331787, "global_step": 206999, "epoch": 4928} {"train_loss": -7.429302215576172, "global_step": 207000, "epoch": 4928} {"train_loss": -7.375723361968994, "global_step": 207001, "epoch": 4928} {"train_loss": -7.302670478820801, "global_step": 207002, "epoch": 4928} {"train_loss": -7.392673492431641, "global_step": 207003, "epoch": 4928} {"train_loss": -7.320072174072266, "global_step": 207004, "epoch": 4928} {"train_loss": -7.288815021514893, "global_step": 207005, "epoch": 4928} {"train_loss": -7.35698127746582, "global_step": 207006, "epoch": 4928} {"train_loss": -7.326262474060059, "global_step": 207007, "epoch": 4928} {"train_loss": -7.324190139770508, "global_step": 207008, "epoch": 4928} {"train_loss": -7.306789398193359, "global_step": 207009, "epoch": 4928} {"train_loss": -7.38969087600708, "global_step": 207010, "epoch": 4928} {"train_loss": -7.273481369018555, "global_step": 207011, "epoch": 4928} {"train_loss": -7.349553108215332, "global_step": 207012, "epoch": 4928} {"train_loss": -7.352871894836426, "global_step": 207013, "epoch": 4928} {"train_loss": -7.323775768280029, "global_step": 207014, "epoch": 4928} {"train_loss": -7.37448263168335, "global_step": 207015, "epoch": 4928} {"train_loss": -7.335417747497559, "global_step": 207016, "epoch": 4928} {"train_loss": -7.308425074531918, "global_step": 207017, "epoch": 4928, "val_loss": 70021.8046875} {"train_loss": -7.255378723144531, "global_step": 207018, "epoch": 4929} {"train_loss": -7.255956649780273, "global_step": 207019, "epoch": 4929} {"train_loss": -7.394763946533203, "global_step": 207020, "epoch": 4929} {"train_loss": -7.418878555297852, "global_step": 207021, "epoch": 4929} {"train_loss": -7.4808244705200195, "global_step": 207022, "epoch": 4929} {"train_loss": -7.3346757888793945, "global_step": 207023, "epoch": 4929} {"train_loss": -7.410412788391113, "global_step": 207024, "epoch": 4929} {"train_loss": -7.315867900848389, "global_step": 207025, "epoch": 4929} {"train_loss": -7.3391337394714355, "global_step": 207026, "epoch": 4929} {"train_loss": -7.263062000274658, "global_step": 207027, "epoch": 4929} {"train_loss": -7.272526741027832, "global_step": 207028, "epoch": 4929} {"train_loss": -7.365015506744385, "global_step": 207029, "epoch": 4929} {"train_loss": -7.283215522766113, "global_step": 207030, "epoch": 4929} {"train_loss": -7.260315418243408, "global_step": 207031, "epoch": 4929} {"train_loss": -7.3467607498168945, "global_step": 207032, "epoch": 4929} {"train_loss": -7.409433364868164, "global_step": 207033, "epoch": 4929} {"train_loss": -7.422502517700195, "global_step": 207034, "epoch": 4929} {"train_loss": -7.358621120452881, "global_step": 207035, "epoch": 4929} {"train_loss": -7.217538833618164, "global_step": 207036, "epoch": 4929} {"train_loss": -7.369372367858887, "global_step": 207037, "epoch": 4929} {"train_loss": -7.255956649780273, "global_step": 207038, "epoch": 4929} {"train_loss": -7.334354400634766, "global_step": 207039, "epoch": 4929} {"train_loss": -7.287994384765625, "global_step": 207040, "epoch": 4929} {"train_loss": -7.291624546051025, "global_step": 207041, "epoch": 4929} {"train_loss": -7.411657333374023, "global_step": 207042, "epoch": 4929} {"train_loss": -7.42087984085083, "global_step": 207043, "epoch": 4929} {"train_loss": -7.329786777496338, "global_step": 207044, "epoch": 4929} {"train_loss": -7.342228889465332, "global_step": 207045, "epoch": 4929} {"train_loss": -7.320591449737549, "global_step": 207046, "epoch": 4929} {"train_loss": -7.237174034118652, "global_step": 207047, "epoch": 4929} {"train_loss": -7.284801483154297, "global_step": 207048, "epoch": 4929} {"train_loss": -7.3080596923828125, "global_step": 207049, "epoch": 4929} {"train_loss": -7.394329071044922, "global_step": 207050, "epoch": 4929} {"train_loss": -7.241949558258057, "global_step": 207051, "epoch": 4929} {"train_loss": -7.198540687561035, "global_step": 207052, "epoch": 4929} {"train_loss": -7.323856353759766, "global_step": 207053, "epoch": 4929} {"train_loss": -7.3744730949401855, "global_step": 207054, "epoch": 4929} {"train_loss": -7.297482490539551, "global_step": 207055, "epoch": 4929} {"train_loss": -7.4409685134887695, "global_step": 207056, "epoch": 4929} {"train_loss": -7.402389049530029, "global_step": 207057, "epoch": 4929} {"train_loss": -7.292709827423096, "global_step": 207058, "epoch": 4929} {"train_loss": -7.330101478667486, "global_step": 207059, "epoch": 4929, "val_loss": 69902.9921875} {"train_loss": -7.364331245422363, "global_step": 207060, "epoch": 4930} {"train_loss": -7.47305965423584, "global_step": 207061, "epoch": 4930} {"train_loss": -7.307552337646484, "global_step": 207062, "epoch": 4930} {"train_loss": -7.225495338439941, "global_step": 207063, "epoch": 4930} {"train_loss": -7.36256217956543, "global_step": 207064, "epoch": 4930} {"train_loss": -7.397878646850586, "global_step": 207065, "epoch": 4930} {"train_loss": -7.360143661499023, "global_step": 207066, "epoch": 4930} {"train_loss": -7.328535079956055, "global_step": 207067, "epoch": 4930} {"train_loss": -7.2952985763549805, "global_step": 207068, "epoch": 4930} {"train_loss": -7.345975399017334, "global_step": 207069, "epoch": 4930} {"train_loss": -7.443665504455566, "global_step": 207070, "epoch": 4930} {"train_loss": -7.385163307189941, "global_step": 207071, "epoch": 4930} {"train_loss": -7.3940911293029785, "global_step": 207072, "epoch": 4930} {"train_loss": -7.16434383392334, "global_step": 207073, "epoch": 4930} {"train_loss": -7.2587714195251465, "global_step": 207074, "epoch": 4930} {"train_loss": -7.332620143890381, "global_step": 207075, "epoch": 4930} {"train_loss": -7.358892440795898, "global_step": 207076, "epoch": 4930} {"train_loss": -7.183384418487549, "global_step": 207077, "epoch": 4930} {"train_loss": -7.267552375793457, "global_step": 207078, "epoch": 4930} {"train_loss": -7.315343856811523, "global_step": 207079, "epoch": 4930} {"train_loss": -7.267662048339844, "global_step": 207080, "epoch": 4930} {"train_loss": -7.358861923217773, "global_step": 207081, "epoch": 4930} {"train_loss": -7.277291297912598, "global_step": 207082, "epoch": 4930} {"train_loss": -7.4108476638793945, "global_step": 207083, "epoch": 4930} {"train_loss": -7.315971851348877, "global_step": 207084, "epoch": 4930} {"train_loss": -7.309338569641113, "global_step": 207085, "epoch": 4930} {"train_loss": -7.3393754959106445, "global_step": 207086, "epoch": 4930} {"train_loss": -7.248903274536133, "global_step": 207087, "epoch": 4930} {"train_loss": -7.388008117675781, "global_step": 207088, "epoch": 4930} {"train_loss": -7.426866054534912, "global_step": 207089, "epoch": 4930} {"train_loss": -7.253863334655762, "global_step": 207090, "epoch": 4930} {"train_loss": -7.386117935180664, "global_step": 207091, "epoch": 4930} {"train_loss": -7.285964488983154, "global_step": 207092, "epoch": 4930} {"train_loss": -7.317741394042969, "global_step": 207093, "epoch": 4930} {"train_loss": -7.3539910316467285, "global_step": 207094, "epoch": 4930} {"train_loss": -7.279890060424805, "global_step": 207095, "epoch": 4930} {"train_loss": -7.3250226974487305, "global_step": 207096, "epoch": 4930} {"train_loss": -7.345056533813477, "global_step": 207097, "epoch": 4930} {"train_loss": -7.4161248207092285, "global_step": 207098, "epoch": 4930} {"train_loss": -7.277198791503906, "global_step": 207099, "epoch": 4930} {"train_loss": -7.338748931884766, "global_step": 207100, "epoch": 4930} {"train_loss": -7.330707334336781, "global_step": 207101, "epoch": 4930, "val_loss": 70074.1328125} {"train_loss": -7.444903373718262, "global_step": 207102, "epoch": 4931} {"train_loss": -7.337116718292236, "global_step": 207103, "epoch": 4931} {"train_loss": -7.4210591316223145, "global_step": 207104, "epoch": 4931} {"train_loss": -7.322849273681641, "global_step": 207105, "epoch": 4931} {"train_loss": -7.329279899597168, "global_step": 207106, "epoch": 4931} {"train_loss": -7.386632442474365, "global_step": 207107, "epoch": 4931} {"train_loss": -7.293860912322998, "global_step": 207108, "epoch": 4931} {"train_loss": -7.318624496459961, "global_step": 207109, "epoch": 4931} {"train_loss": -7.413811206817627, "global_step": 207110, "epoch": 4931} {"train_loss": -7.344405174255371, "global_step": 207111, "epoch": 4931} {"train_loss": -7.4029693603515625, "global_step": 207112, "epoch": 4931} {"train_loss": -7.198303699493408, "global_step": 207113, "epoch": 4931} {"train_loss": -7.327038764953613, "global_step": 207114, "epoch": 4931} {"train_loss": -7.233002662658691, "global_step": 207115, "epoch": 4931} {"train_loss": -7.361689567565918, "global_step": 207116, "epoch": 4931} {"train_loss": -7.235145092010498, "global_step": 207117, "epoch": 4931} {"train_loss": -7.25061559677124, "global_step": 207118, "epoch": 4931} {"train_loss": -7.270503997802734, "global_step": 207119, "epoch": 4931} {"train_loss": -7.2901930809021, "global_step": 207120, "epoch": 4931} {"train_loss": -7.18911075592041, "global_step": 207121, "epoch": 4931} {"train_loss": -7.313658237457275, "global_step": 207122, "epoch": 4931} {"train_loss": -7.0205159187316895, "global_step": 207123, "epoch": 4931} {"train_loss": -7.120762348175049, "global_step": 207124, "epoch": 4931} {"train_loss": -7.1440653800964355, "global_step": 207125, "epoch": 4931} {"train_loss": -7.013637065887451, "global_step": 207126, "epoch": 4931} {"train_loss": -7.151933193206787, "global_step": 207127, "epoch": 4931} {"train_loss": -7.063345909118652, "global_step": 207128, "epoch": 4931} {"train_loss": -7.129554748535156, "global_step": 207129, "epoch": 4931} {"train_loss": -7.338925838470459, "global_step": 207130, "epoch": 4931} {"train_loss": -7.0051469802856445, "global_step": 207131, "epoch": 4931} {"train_loss": -7.254777431488037, "global_step": 207132, "epoch": 4931} {"train_loss": -7.119724273681641, "global_step": 207133, "epoch": 4931} {"train_loss": -7.2635321617126465, "global_step": 207134, "epoch": 4931} {"train_loss": -7.085511684417725, "global_step": 207135, "epoch": 4931} {"train_loss": -7.198765754699707, "global_step": 207136, "epoch": 4931} {"train_loss": -7.220880031585693, "global_step": 207137, "epoch": 4931} {"train_loss": -7.2590012550354, "global_step": 207138, "epoch": 4931} {"train_loss": -7.309624671936035, "global_step": 207139, "epoch": 4931} {"train_loss": -7.284798622131348, "global_step": 207140, "epoch": 4931} {"train_loss": -7.317529201507568, "global_step": 207141, "epoch": 4931} {"train_loss": -7.289310455322266, "global_step": 207142, "epoch": 4931} {"train_loss": -7.252587954203288, "global_step": 207143, "epoch": 4931, "val_loss": 70149.15625} {"train_loss": -7.236979961395264, "global_step": 207144, "epoch": 4932} {"train_loss": -7.316008567810059, "global_step": 207145, "epoch": 4932} {"train_loss": -7.345020771026611, "global_step": 207146, "epoch": 4932} {"train_loss": -7.2665696144104, "global_step": 207147, "epoch": 4932} {"train_loss": -7.312370300292969, "global_step": 207148, "epoch": 4932} {"train_loss": -7.3098464012146, "global_step": 207149, "epoch": 4932} {"train_loss": -7.343209266662598, "global_step": 207150, "epoch": 4932} {"train_loss": -7.397418022155762, "global_step": 207151, "epoch": 4932} {"train_loss": -7.508246421813965, "global_step": 207152, "epoch": 4932} {"train_loss": -7.351308345794678, "global_step": 207153, "epoch": 4932} {"train_loss": -7.341630458831787, "global_step": 207154, "epoch": 4932} {"train_loss": -7.409043788909912, "global_step": 207155, "epoch": 4932} {"train_loss": -7.3330159187316895, "global_step": 207156, "epoch": 4932} {"train_loss": -7.337797164916992, "global_step": 207157, "epoch": 4932} {"train_loss": -7.328738689422607, "global_step": 207158, "epoch": 4932} {"train_loss": -7.379453659057617, "global_step": 207159, "epoch": 4932} {"train_loss": -7.426031589508057, "global_step": 207160, "epoch": 4932} {"train_loss": -7.3282365798950195, "global_step": 207161, "epoch": 4932} {"train_loss": -7.326667785644531, "global_step": 207162, "epoch": 4932} {"train_loss": -7.28987979888916, "global_step": 207163, "epoch": 4932} {"train_loss": -7.386553764343262, "global_step": 207164, "epoch": 4932} {"train_loss": -7.394654273986816, "global_step": 207165, "epoch": 4932} {"train_loss": -7.467736721038818, "global_step": 207166, "epoch": 4932} {"train_loss": -7.422087669372559, "global_step": 207167, "epoch": 4932} {"train_loss": -7.4496870040893555, "global_step": 207168, "epoch": 4932} {"train_loss": -7.453586101531982, "global_step": 207169, "epoch": 4932} {"train_loss": -7.3740949630737305, "global_step": 207170, "epoch": 4932} {"train_loss": -7.270079612731934, "global_step": 207171, "epoch": 4932} {"train_loss": -7.356489181518555, "global_step": 207172, "epoch": 4932} {"train_loss": -7.283864974975586, "global_step": 207173, "epoch": 4932} {"train_loss": -7.372869491577148, "global_step": 207174, "epoch": 4932} {"train_loss": -7.389869689941406, "global_step": 207175, "epoch": 4932} {"train_loss": -7.375490188598633, "global_step": 207176, "epoch": 4932} {"train_loss": -7.306972503662109, "global_step": 207177, "epoch": 4932} {"train_loss": -7.293340682983398, "global_step": 207178, "epoch": 4932} {"train_loss": -7.41768741607666, "global_step": 207179, "epoch": 4932} {"train_loss": -7.3518266677856445, "global_step": 207180, "epoch": 4932} {"train_loss": -7.264897346496582, "global_step": 207181, "epoch": 4932} {"train_loss": -7.352102279663086, "global_step": 207182, "epoch": 4932} {"train_loss": -7.405828475952148, "global_step": 207183, "epoch": 4932} {"train_loss": -7.359920501708984, "global_step": 207184, "epoch": 4932} {"train_loss": -7.355875287737165, "global_step": 207185, "epoch": 4932, "val_loss": 70171.734375} {"train_loss": -7.3457441329956055, "global_step": 207186, "epoch": 4933} {"train_loss": -7.339983940124512, "global_step": 207187, "epoch": 4933} {"train_loss": -7.41839599609375, "global_step": 207188, "epoch": 4933} {"train_loss": -7.338146209716797, "global_step": 207189, "epoch": 4933} {"train_loss": -7.268115997314453, "global_step": 207190, "epoch": 4933} {"train_loss": -7.3133440017700195, "global_step": 207191, "epoch": 4933} {"train_loss": -7.3892011642456055, "global_step": 207192, "epoch": 4933} {"train_loss": -7.32349967956543, "global_step": 207193, "epoch": 4933} {"train_loss": -7.429996490478516, "global_step": 207194, "epoch": 4933} {"train_loss": -7.379245758056641, "global_step": 207195, "epoch": 4933} {"train_loss": -7.306659698486328, "global_step": 207196, "epoch": 4933} {"train_loss": -7.368501663208008, "global_step": 207197, "epoch": 4933} {"train_loss": -7.30853271484375, "global_step": 207198, "epoch": 4933} {"train_loss": -7.422171592712402, "global_step": 207199, "epoch": 4933} {"train_loss": -7.473106384277344, "global_step": 207200, "epoch": 4933} {"train_loss": -7.382140636444092, "global_step": 207201, "epoch": 4933} {"train_loss": -7.319974899291992, "global_step": 207202, "epoch": 4933} {"train_loss": -7.335776329040527, "global_step": 207203, "epoch": 4933} {"train_loss": -7.135066509246826, "global_step": 207204, "epoch": 4933} {"train_loss": -7.038910388946533, "global_step": 207205, "epoch": 4933} {"train_loss": -7.400816917419434, "global_step": 207206, "epoch": 4933} {"train_loss": -7.202708721160889, "global_step": 207207, "epoch": 4933} {"train_loss": -7.245057106018066, "global_step": 207208, "epoch": 4933} {"train_loss": -7.302293300628662, "global_step": 207209, "epoch": 4933} {"train_loss": -7.246862411499023, "global_step": 207210, "epoch": 4933} {"train_loss": -7.313507080078125, "global_step": 207211, "epoch": 4933} {"train_loss": -7.198424816131592, "global_step": 207212, "epoch": 4933} {"train_loss": -7.344691753387451, "global_step": 207213, "epoch": 4933} {"train_loss": -7.24289608001709, "global_step": 207214, "epoch": 4933} {"train_loss": -7.296886444091797, "global_step": 207215, "epoch": 4933} {"train_loss": -7.304245948791504, "global_step": 207216, "epoch": 4933} {"train_loss": -7.182857990264893, "global_step": 207217, "epoch": 4933} {"train_loss": -7.153565406799316, "global_step": 207218, "epoch": 4933} {"train_loss": -7.383388519287109, "global_step": 207219, "epoch": 4933} {"train_loss": -7.135565757751465, "global_step": 207220, "epoch": 4933} {"train_loss": -7.188024520874023, "global_step": 207221, "epoch": 4933} {"train_loss": -7.270622730255127, "global_step": 207222, "epoch": 4933} {"train_loss": -7.253056526184082, "global_step": 207223, "epoch": 4933} {"train_loss": -7.344111919403076, "global_step": 207224, "epoch": 4933} {"train_loss": -7.253750324249268, "global_step": 207225, "epoch": 4933} {"train_loss": -7.34725284576416, "global_step": 207226, "epoch": 4933} {"train_loss": -7.299832105636597, "global_step": 207227, "epoch": 4933, "val_loss": 69840.4375} {"train_loss": -7.334559440612793, "global_step": 207228, "epoch": 4934} {"train_loss": -7.313997268676758, "global_step": 207229, "epoch": 4934} {"train_loss": -7.251442909240723, "global_step": 207230, "epoch": 4934} {"train_loss": -7.254242897033691, "global_step": 207231, "epoch": 4934} {"train_loss": -7.419168472290039, "global_step": 207232, "epoch": 4934} {"train_loss": -7.321863174438477, "global_step": 207233, "epoch": 4934} {"train_loss": -7.35245418548584, "global_step": 207234, "epoch": 4934} {"train_loss": -7.29776668548584, "global_step": 207235, "epoch": 4934} {"train_loss": -7.144042015075684, "global_step": 207236, "epoch": 4934} {"train_loss": -7.3138933181762695, "global_step": 207237, "epoch": 4934} {"train_loss": -7.218145847320557, "global_step": 207238, "epoch": 4934} {"train_loss": -7.306286334991455, "global_step": 207239, "epoch": 4934} {"train_loss": -7.284301280975342, "global_step": 207240, "epoch": 4934} {"train_loss": -7.329916000366211, "global_step": 207241, "epoch": 4934} {"train_loss": -7.206633567810059, "global_step": 207242, "epoch": 4934} {"train_loss": -7.363182067871094, "global_step": 207243, "epoch": 4934} {"train_loss": -7.359785556793213, "global_step": 207244, "epoch": 4934} {"train_loss": -7.305953025817871, "global_step": 207245, "epoch": 4934} {"train_loss": -7.404455661773682, "global_step": 207246, "epoch": 4934} {"train_loss": -7.423311710357666, "global_step": 207247, "epoch": 4934} {"train_loss": -7.341113090515137, "global_step": 207248, "epoch": 4934} {"train_loss": -7.31502103805542, "global_step": 207249, "epoch": 4934} {"train_loss": -7.2331132888793945, "global_step": 207250, "epoch": 4934} {"train_loss": -7.355989456176758, "global_step": 207251, "epoch": 4934} {"train_loss": -7.385270595550537, "global_step": 207252, "epoch": 4934} {"train_loss": -7.37016487121582, "global_step": 207253, "epoch": 4934} {"train_loss": -7.406877517700195, "global_step": 207254, "epoch": 4934} {"train_loss": -7.303287506103516, "global_step": 207255, "epoch": 4934} {"train_loss": -7.2938737869262695, "global_step": 207256, "epoch": 4934} {"train_loss": -7.338559627532959, "global_step": 207257, "epoch": 4934} {"train_loss": -7.324216842651367, "global_step": 207258, "epoch": 4934} {"train_loss": -7.462425708770752, "global_step": 207259, "epoch": 4934} {"train_loss": -7.355735778808594, "global_step": 207260, "epoch": 4934} {"train_loss": -7.289290904998779, "global_step": 207261, "epoch": 4934} {"train_loss": -7.30672025680542, "global_step": 207262, "epoch": 4934} {"train_loss": -7.41744327545166, "global_step": 207263, "epoch": 4934} {"train_loss": -7.418911933898926, "global_step": 207264, "epoch": 4934} {"train_loss": -7.417961120605469, "global_step": 207265, "epoch": 4934} {"train_loss": -7.375053405761719, "global_step": 207266, "epoch": 4934} {"train_loss": -7.326171875, "global_step": 207267, "epoch": 4934} {"train_loss": -7.4343061447143555, "global_step": 207268, "epoch": 4934} {"train_loss": -7.334177301043556, "global_step": 207269, "epoch": 4934, "val_loss": 70040.5390625} {"train_loss": -7.339785575866699, "global_step": 207270, "epoch": 4935} {"train_loss": -7.448513984680176, "global_step": 207271, "epoch": 4935} {"train_loss": -7.441313743591309, "global_step": 207272, "epoch": 4935} {"train_loss": -7.275745868682861, "global_step": 207273, "epoch": 4935} {"train_loss": -7.259915351867676, "global_step": 207274, "epoch": 4935} {"train_loss": -7.279319763183594, "global_step": 207275, "epoch": 4935} {"train_loss": -7.218481063842773, "global_step": 207276, "epoch": 4935} {"train_loss": -7.313451290130615, "global_step": 207277, "epoch": 4935} {"train_loss": -7.330513000488281, "global_step": 207278, "epoch": 4935} {"train_loss": -7.331263542175293, "global_step": 207279, "epoch": 4935} {"train_loss": -7.215569019317627, "global_step": 207280, "epoch": 4935} {"train_loss": -7.27007532119751, "global_step": 207281, "epoch": 4935} {"train_loss": -7.3540449142456055, "global_step": 207282, "epoch": 4935} {"train_loss": -7.210697174072266, "global_step": 207283, "epoch": 4935} {"train_loss": -7.3595380783081055, "global_step": 207284, "epoch": 4935} {"train_loss": -7.229347229003906, "global_step": 207285, "epoch": 4935} {"train_loss": -7.422514915466309, "global_step": 207286, "epoch": 4935} {"train_loss": -7.2130866050720215, "global_step": 207287, "epoch": 4935} {"train_loss": -7.312744140625, "global_step": 207288, "epoch": 4935} {"train_loss": -7.375363349914551, "global_step": 207289, "epoch": 4935} {"train_loss": -7.233066558837891, "global_step": 207290, "epoch": 4935} {"train_loss": -7.333738327026367, "global_step": 207291, "epoch": 4935} {"train_loss": -7.254756927490234, "global_step": 207292, "epoch": 4935} {"train_loss": -7.222110748291016, "global_step": 207293, "epoch": 4935} {"train_loss": -7.198291778564453, "global_step": 207294, "epoch": 4935} {"train_loss": -7.088118553161621, "global_step": 207295, "epoch": 4935} {"train_loss": -7.3778581619262695, "global_step": 207296, "epoch": 4935} {"train_loss": -7.172546863555908, "global_step": 207297, "epoch": 4935} {"train_loss": -7.211434364318848, "global_step": 207298, "epoch": 4935} {"train_loss": -7.3051838874816895, "global_step": 207299, "epoch": 4935} {"train_loss": -7.138484477996826, "global_step": 207300, "epoch": 4935} {"train_loss": -7.249149322509766, "global_step": 207301, "epoch": 4935} {"train_loss": -7.285397529602051, "global_step": 207302, "epoch": 4935} {"train_loss": -7.378854751586914, "global_step": 207303, "epoch": 4935} {"train_loss": -7.238164901733398, "global_step": 207304, "epoch": 4935} {"train_loss": -7.286474227905273, "global_step": 207305, "epoch": 4935} {"train_loss": -7.166580677032471, "global_step": 207306, "epoch": 4935} {"train_loss": -7.246251106262207, "global_step": 207307, "epoch": 4935} {"train_loss": -7.134994029998779, "global_step": 207308, "epoch": 4935} {"train_loss": -7.262415885925293, "global_step": 207309, "epoch": 4935} {"train_loss": -7.221531867980957, "global_step": 207310, "epoch": 4935} {"train_loss": -7.270971275511242, "global_step": 207311, "epoch": 4935, "val_loss": 70256.859375} {"train_loss": -7.26507568359375, "global_step": 207312, "epoch": 4936} {"train_loss": -7.291693687438965, "global_step": 207313, "epoch": 4936} {"train_loss": -7.301666259765625, "global_step": 207314, "epoch": 4936} {"train_loss": -7.144567012786865, "global_step": 207315, "epoch": 4936} {"train_loss": -7.2155938148498535, "global_step": 207316, "epoch": 4936} {"train_loss": -7.265279769897461, "global_step": 207317, "epoch": 4936} {"train_loss": -7.251304626464844, "global_step": 207318, "epoch": 4936} {"train_loss": -7.308847427368164, "global_step": 207319, "epoch": 4936} {"train_loss": -7.2970476150512695, "global_step": 207320, "epoch": 4936} {"train_loss": -7.154429912567139, "global_step": 207321, "epoch": 4936} {"train_loss": -7.3379058837890625, "global_step": 207322, "epoch": 4936} {"train_loss": -7.2621989250183105, "global_step": 207323, "epoch": 4936} {"train_loss": -7.18364143371582, "global_step": 207324, "epoch": 4936} {"train_loss": -7.313793659210205, "global_step": 207325, "epoch": 4936} {"train_loss": -7.241662979125977, "global_step": 207326, "epoch": 4936} {"train_loss": -7.320331573486328, "global_step": 207327, "epoch": 4936} {"train_loss": -7.333324432373047, "global_step": 207328, "epoch": 4936} {"train_loss": -7.286989212036133, "global_step": 207329, "epoch": 4936} {"train_loss": -7.316535949707031, "global_step": 207330, "epoch": 4936} {"train_loss": -7.395904064178467, "global_step": 207331, "epoch": 4936} {"train_loss": -7.343415260314941, "global_step": 207332, "epoch": 4936} {"train_loss": -7.314943313598633, "global_step": 207333, "epoch": 4936} {"train_loss": -7.399554252624512, "global_step": 207334, "epoch": 4936} {"train_loss": -7.3094482421875, "global_step": 207335, "epoch": 4936} {"train_loss": -7.339512348175049, "global_step": 207336, "epoch": 4936} {"train_loss": -7.275759220123291, "global_step": 207337, "epoch": 4936} {"train_loss": -7.3493452072143555, "global_step": 207338, "epoch": 4936} {"train_loss": -7.459749221801758, "global_step": 207339, "epoch": 4936} {"train_loss": -7.272208213806152, "global_step": 207340, "epoch": 4936} {"train_loss": -7.396214485168457, "global_step": 207341, "epoch": 4936} {"train_loss": -7.323593616485596, "global_step": 207342, "epoch": 4936} {"train_loss": -7.347504615783691, "global_step": 207343, "epoch": 4936} {"train_loss": -7.377518653869629, "global_step": 207344, "epoch": 4936} {"train_loss": -7.259232997894287, "global_step": 207345, "epoch": 4936} {"train_loss": -7.408987045288086, "global_step": 207346, "epoch": 4936} {"train_loss": -7.376523971557617, "global_step": 207347, "epoch": 4936} {"train_loss": -7.345025062561035, "global_step": 207348, "epoch": 4936} {"train_loss": -7.44973087310791, "global_step": 207349, "epoch": 4936} {"train_loss": -7.319157600402832, "global_step": 207350, "epoch": 4936} {"train_loss": -7.417623996734619, "global_step": 207351, "epoch": 4936} {"train_loss": -7.451605796813965, "global_step": 207352, "epoch": 4936} {"train_loss": -7.318289949780419, "global_step": 207353, "epoch": 4936, "val_loss": 69940.6796875} {"train_loss": -7.346059799194336, "global_step": 207354, "epoch": 4937} {"train_loss": -7.491562366485596, "global_step": 207355, "epoch": 4937} {"train_loss": -7.278260231018066, "global_step": 207356, "epoch": 4937} {"train_loss": -7.212368011474609, "global_step": 207357, "epoch": 4937} {"train_loss": -7.290847301483154, "global_step": 207358, "epoch": 4937} {"train_loss": -7.185191631317139, "global_step": 207359, "epoch": 4937} {"train_loss": -7.405434608459473, "global_step": 207360, "epoch": 4937} {"train_loss": -7.219066619873047, "global_step": 207361, "epoch": 4937} {"train_loss": -7.200085639953613, "global_step": 207362, "epoch": 4937} {"train_loss": -7.3657450675964355, "global_step": 207363, "epoch": 4937} {"train_loss": -7.245429992675781, "global_step": 207364, "epoch": 4937} {"train_loss": -7.206672668457031, "global_step": 207365, "epoch": 4937} {"train_loss": -7.350323677062988, "global_step": 207366, "epoch": 4937} {"train_loss": -7.328201770782471, "global_step": 207367, "epoch": 4937} {"train_loss": -7.354670524597168, "global_step": 207368, "epoch": 4937} {"train_loss": -7.289949893951416, "global_step": 207369, "epoch": 4937} {"train_loss": -7.390006065368652, "global_step": 207370, "epoch": 4937} {"train_loss": -7.413825511932373, "global_step": 207371, "epoch": 4937} {"train_loss": -7.327295303344727, "global_step": 207372, "epoch": 4937} {"train_loss": -7.227076530456543, "global_step": 207373, "epoch": 4937} {"train_loss": -7.351191520690918, "global_step": 207374, "epoch": 4937} {"train_loss": -7.339871406555176, "global_step": 207375, "epoch": 4937} {"train_loss": -7.315122604370117, "global_step": 207376, "epoch": 4937} {"train_loss": -7.41826057434082, "global_step": 207377, "epoch": 4937} {"train_loss": -7.432194232940674, "global_step": 207378, "epoch": 4937} {"train_loss": -7.302672386169434, "global_step": 207379, "epoch": 4937} {"train_loss": -7.429626941680908, "global_step": 207380, "epoch": 4937} {"train_loss": -7.404501914978027, "global_step": 207381, "epoch": 4937} {"train_loss": -7.314040660858154, "global_step": 207382, "epoch": 4937} {"train_loss": -7.262995719909668, "global_step": 207383, "epoch": 4937} {"train_loss": -7.22407341003418, "global_step": 207384, "epoch": 4937} {"train_loss": -7.4024176597595215, "global_step": 207385, "epoch": 4937} {"train_loss": -7.279753684997559, "global_step": 207386, "epoch": 4937} {"train_loss": -7.164772033691406, "global_step": 207387, "epoch": 4937} {"train_loss": -7.3895769119262695, "global_step": 207388, "epoch": 4937} {"train_loss": -7.206665515899658, "global_step": 207389, "epoch": 4937} {"train_loss": -7.129909992218018, "global_step": 207390, "epoch": 4937} {"train_loss": -7.275207042694092, "global_step": 207391, "epoch": 4937} {"train_loss": -7.229358673095703, "global_step": 207392, "epoch": 4937} {"train_loss": -7.227021217346191, "global_step": 207393, "epoch": 4937} {"train_loss": -7.224925994873047, "global_step": 207394, "epoch": 4937} {"train_loss": -7.302338952109928, "global_step": 207395, "epoch": 4937, "val_loss": 70084.3125} {"train_loss": -7.232274532318115, "global_step": 207396, "epoch": 4938} {"train_loss": -7.3209381103515625, "global_step": 207397, "epoch": 4938} {"train_loss": -7.192008972167969, "global_step": 207398, "epoch": 4938} {"train_loss": -7.243799209594727, "global_step": 207399, "epoch": 4938} {"train_loss": -7.343474388122559, "global_step": 207400, "epoch": 4938} {"train_loss": -7.41166877746582, "global_step": 207401, "epoch": 4938} {"train_loss": -7.308459758758545, "global_step": 207402, "epoch": 4938} {"train_loss": -7.263824462890625, "global_step": 207403, "epoch": 4938} {"train_loss": -7.364158630371094, "global_step": 207404, "epoch": 4938} {"train_loss": -7.345511436462402, "global_step": 207405, "epoch": 4938} {"train_loss": -7.469910621643066, "global_step": 207406, "epoch": 4938} {"train_loss": -7.384908676147461, "global_step": 207407, "epoch": 4938} {"train_loss": -7.428686141967773, "global_step": 207408, "epoch": 4938} {"train_loss": -7.30403995513916, "global_step": 207409, "epoch": 4938} {"train_loss": -7.370657920837402, "global_step": 207410, "epoch": 4938} {"train_loss": -7.292013168334961, "global_step": 207411, "epoch": 4938} {"train_loss": -7.303489685058594, "global_step": 207412, "epoch": 4938} {"train_loss": -7.286625862121582, "global_step": 207413, "epoch": 4938} {"train_loss": -7.324086666107178, "global_step": 207414, "epoch": 4938} {"train_loss": -7.21645450592041, "global_step": 207415, "epoch": 4938} {"train_loss": -7.159503936767578, "global_step": 207416, "epoch": 4938} {"train_loss": -7.251884460449219, "global_step": 207417, "epoch": 4938} {"train_loss": -7.422262191772461, "global_step": 207418, "epoch": 4938} {"train_loss": -7.128871917724609, "global_step": 207419, "epoch": 4938} {"train_loss": -7.042163372039795, "global_step": 207420, "epoch": 4938} {"train_loss": -7.2733683586120605, "global_step": 207421, "epoch": 4938} {"train_loss": -7.212800979614258, "global_step": 207422, "epoch": 4938} {"train_loss": -7.12933874130249, "global_step": 207423, "epoch": 4938} {"train_loss": -7.385325908660889, "global_step": 207424, "epoch": 4938} {"train_loss": -7.219242095947266, "global_step": 207425, "epoch": 4938} {"train_loss": -7.365695953369141, "global_step": 207426, "epoch": 4938} {"train_loss": -7.238734245300293, "global_step": 207427, "epoch": 4938} {"train_loss": -7.350246429443359, "global_step": 207428, "epoch": 4938} {"train_loss": -7.284720420837402, "global_step": 207429, "epoch": 4938} {"train_loss": -7.1673688888549805, "global_step": 207430, "epoch": 4938} {"train_loss": -7.266048431396484, "global_step": 207431, "epoch": 4938} {"train_loss": -7.244637489318848, "global_step": 207432, "epoch": 4938} {"train_loss": -7.320862770080566, "global_step": 207433, "epoch": 4938} {"train_loss": -7.2449188232421875, "global_step": 207434, "epoch": 4938} {"train_loss": -7.357718467712402, "global_step": 207435, "epoch": 4938} {"train_loss": -7.425068378448486, "global_step": 207436, "epoch": 4938} {"train_loss": -7.289962371190389, "global_step": 207437, "epoch": 4938, "val_loss": 69915.4140625} {"train_loss": -7.3288373947143555, "global_step": 207438, "epoch": 4939} {"train_loss": -7.233327388763428, "global_step": 207439, "epoch": 4939} {"train_loss": -7.329779148101807, "global_step": 207440, "epoch": 4939} {"train_loss": -7.41145658493042, "global_step": 207441, "epoch": 4939} {"train_loss": -7.385735034942627, "global_step": 207442, "epoch": 4939} {"train_loss": -7.337499618530273, "global_step": 207443, "epoch": 4939} {"train_loss": -7.319066047668457, "global_step": 207444, "epoch": 4939} {"train_loss": -7.367026329040527, "global_step": 207445, "epoch": 4939} {"train_loss": -7.324968338012695, "global_step": 207446, "epoch": 4939} {"train_loss": -7.33831262588501, "global_step": 207447, "epoch": 4939} {"train_loss": -7.372629165649414, "global_step": 207448, "epoch": 4939} {"train_loss": -7.257904052734375, "global_step": 207449, "epoch": 4939} {"train_loss": -7.468451499938965, "global_step": 207450, "epoch": 4939} {"train_loss": -7.396939754486084, "global_step": 207451, "epoch": 4939} {"train_loss": -7.232542514801025, "global_step": 207452, "epoch": 4939} {"train_loss": -7.395540237426758, "global_step": 207453, "epoch": 4939} {"train_loss": -7.3286919593811035, "global_step": 207454, "epoch": 4939} {"train_loss": -7.354101181030273, "global_step": 207455, "epoch": 4939} {"train_loss": -7.450711250305176, "global_step": 207456, "epoch": 4939} {"train_loss": -7.44146728515625, "global_step": 207457, "epoch": 4939} {"train_loss": -7.296207904815674, "global_step": 207458, "epoch": 4939} {"train_loss": -7.375385284423828, "global_step": 207459, "epoch": 4939} {"train_loss": -7.399152755737305, "global_step": 207460, "epoch": 4939} {"train_loss": -7.302227973937988, "global_step": 207461, "epoch": 4939} {"train_loss": -7.306816577911377, "global_step": 207462, "epoch": 4939} {"train_loss": -7.459039688110352, "global_step": 207463, "epoch": 4939} {"train_loss": -7.388411045074463, "global_step": 207464, "epoch": 4939} {"train_loss": -7.380871772766113, "global_step": 207465, "epoch": 4939} {"train_loss": -7.230450630187988, "global_step": 207466, "epoch": 4939} {"train_loss": -7.330503463745117, "global_step": 207467, "epoch": 4939} {"train_loss": -7.468206405639648, "global_step": 207468, "epoch": 4939} {"train_loss": -7.133847713470459, "global_step": 207469, "epoch": 4939} {"train_loss": -7.316157817840576, "global_step": 207470, "epoch": 4939} {"train_loss": -7.386319160461426, "global_step": 207471, "epoch": 4939} {"train_loss": -7.333039283752441, "global_step": 207472, "epoch": 4939} {"train_loss": -7.374093055725098, "global_step": 207473, "epoch": 4939} {"train_loss": -7.312472343444824, "global_step": 207474, "epoch": 4939} {"train_loss": -7.3705291748046875, "global_step": 207475, "epoch": 4939} {"train_loss": -7.455986976623535, "global_step": 207476, "epoch": 4939} {"train_loss": -7.457670211791992, "global_step": 207477, "epoch": 4939} {"train_loss": -7.36379337310791, "global_step": 207478, "epoch": 4939} {"train_loss": -7.352829308736892, "global_step": 207479, "epoch": 4939, "val_loss": 70078.9375} {"train_loss": -7.293491363525391, "global_step": 207480, "epoch": 4940} {"train_loss": -7.341189861297607, "global_step": 207481, "epoch": 4940} {"train_loss": -7.331079959869385, "global_step": 207482, "epoch": 4940} {"train_loss": -7.328066825866699, "global_step": 207483, "epoch": 4940} {"train_loss": -7.3405022621154785, "global_step": 207484, "epoch": 4940} {"train_loss": -7.330864429473877, "global_step": 207485, "epoch": 4940} {"train_loss": -7.331018447875977, "global_step": 207486, "epoch": 4940} {"train_loss": -7.274741172790527, "global_step": 207487, "epoch": 4940} {"train_loss": -7.321053504943848, "global_step": 207488, "epoch": 4940} {"train_loss": -7.380054950714111, "global_step": 207489, "epoch": 4940} {"train_loss": -7.202184677124023, "global_step": 207490, "epoch": 4940} {"train_loss": -7.404694080352783, "global_step": 207491, "epoch": 4940} {"train_loss": -7.317619323730469, "global_step": 207492, "epoch": 4940} {"train_loss": -7.174572944641113, "global_step": 207493, "epoch": 4940} {"train_loss": -7.1803483963012695, "global_step": 207494, "epoch": 4940} {"train_loss": -7.267138957977295, "global_step": 207495, "epoch": 4940} {"train_loss": -7.153029441833496, "global_step": 207496, "epoch": 4940} {"train_loss": -7.212893486022949, "global_step": 207497, "epoch": 4940} {"train_loss": -7.302460670471191, "global_step": 207498, "epoch": 4940} {"train_loss": -7.239048957824707, "global_step": 207499, "epoch": 4940} {"train_loss": -7.186727523803711, "global_step": 207500, "epoch": 4940} {"train_loss": -7.17265510559082, "global_step": 207501, "epoch": 4940} {"train_loss": -7.238809585571289, "global_step": 207502, "epoch": 4940} {"train_loss": -7.164238929748535, "global_step": 207503, "epoch": 4940} {"train_loss": -7.206141948699951, "global_step": 207504, "epoch": 4940} {"train_loss": -7.212408542633057, "global_step": 207505, "epoch": 4940} {"train_loss": -7.235223770141602, "global_step": 207506, "epoch": 4940} {"train_loss": -7.190627098083496, "global_step": 207507, "epoch": 4940} {"train_loss": -7.348304748535156, "global_step": 207508, "epoch": 4940} {"train_loss": -7.3147149085998535, "global_step": 207509, "epoch": 4940} {"train_loss": -7.239575386047363, "global_step": 207510, "epoch": 4940} {"train_loss": -7.19953727722168, "global_step": 207511, "epoch": 4940} {"train_loss": -7.21778678894043, "global_step": 207512, "epoch": 4940} {"train_loss": -7.292084217071533, "global_step": 207513, "epoch": 4940} {"train_loss": -7.2059736251831055, "global_step": 207514, "epoch": 4940} {"train_loss": -7.361518859863281, "global_step": 207515, "epoch": 4940} {"train_loss": -7.275368690490723, "global_step": 207516, "epoch": 4940} {"train_loss": -7.323367595672607, "global_step": 207517, "epoch": 4940} {"train_loss": -7.22057580947876, "global_step": 207518, "epoch": 4940} {"train_loss": -7.227882385253906, "global_step": 207519, "epoch": 4940} {"train_loss": -7.38875150680542, "global_step": 207520, "epoch": 4940} {"train_loss": -7.262566600527082, "global_step": 207521, "epoch": 4940, "val_loss": 70031.9453125} {"train_loss": -7.35601806640625, "global_step": 207522, "epoch": 4941} {"train_loss": -7.3212738037109375, "global_step": 207523, "epoch": 4941} {"train_loss": -7.417870044708252, "global_step": 207524, "epoch": 4941} {"train_loss": -7.379534721374512, "global_step": 207525, "epoch": 4941} {"train_loss": -7.316791534423828, "global_step": 207526, "epoch": 4941} {"train_loss": -7.342146873474121, "global_step": 207527, "epoch": 4941} {"train_loss": -7.304022312164307, "global_step": 207528, "epoch": 4941} {"train_loss": -7.363203525543213, "global_step": 207529, "epoch": 4941} {"train_loss": -7.257936477661133, "global_step": 207530, "epoch": 4941} {"train_loss": -7.2623291015625, "global_step": 207531, "epoch": 4941} {"train_loss": -7.262841701507568, "global_step": 207532, "epoch": 4941} {"train_loss": -7.2826666831970215, "global_step": 207533, "epoch": 4941} {"train_loss": -7.317992210388184, "global_step": 207534, "epoch": 4941} {"train_loss": -7.1323089599609375, "global_step": 207535, "epoch": 4941} {"train_loss": -7.33751916885376, "global_step": 207536, "epoch": 4941} {"train_loss": -7.360480785369873, "global_step": 207537, "epoch": 4941} {"train_loss": -7.313855171203613, "global_step": 207538, "epoch": 4941} {"train_loss": -7.248536109924316, "global_step": 207539, "epoch": 4941} {"train_loss": -7.266304016113281, "global_step": 207540, "epoch": 4941} {"train_loss": -7.279223918914795, "global_step": 207541, "epoch": 4941} {"train_loss": -7.291647911071777, "global_step": 207542, "epoch": 4941} {"train_loss": -7.339015007019043, "global_step": 207543, "epoch": 4941} {"train_loss": -7.368793487548828, "global_step": 207544, "epoch": 4941} {"train_loss": -7.394077301025391, "global_step": 207545, "epoch": 4941} {"train_loss": -7.179800033569336, "global_step": 207546, "epoch": 4941} {"train_loss": -7.389455795288086, "global_step": 207547, "epoch": 4941} {"train_loss": -7.329110145568848, "global_step": 207548, "epoch": 4941} {"train_loss": -7.222172260284424, "global_step": 207549, "epoch": 4941} {"train_loss": -7.377630233764648, "global_step": 207550, "epoch": 4941} {"train_loss": -7.201910972595215, "global_step": 207551, "epoch": 4941} {"train_loss": -7.286138534545898, "global_step": 207552, "epoch": 4941} {"train_loss": -7.335958957672119, "global_step": 207553, "epoch": 4941} {"train_loss": -7.316939353942871, "global_step": 207554, "epoch": 4941} {"train_loss": -7.371177673339844, "global_step": 207555, "epoch": 4941} {"train_loss": -7.23834228515625, "global_step": 207556, "epoch": 4941} {"train_loss": -7.3767499923706055, "global_step": 207557, "epoch": 4941} {"train_loss": -7.306048393249512, "global_step": 207558, "epoch": 4941} {"train_loss": -7.271388053894043, "global_step": 207559, "epoch": 4941} {"train_loss": -7.306635856628418, "global_step": 207560, "epoch": 4941} {"train_loss": -7.319142818450928, "global_step": 207561, "epoch": 4941} {"train_loss": -7.230022430419922, "global_step": 207562, "epoch": 4941} {"train_loss": -7.307591188521612, "global_step": 207563, "epoch": 4941, "val_loss": 69803.953125} {"train_loss": -7.399324417114258, "global_step": 207564, "epoch": 4942} {"train_loss": -7.194147109985352, "global_step": 207565, "epoch": 4942} {"train_loss": -7.471756458282471, "global_step": 207566, "epoch": 4942} {"train_loss": -7.3730902671813965, "global_step": 207567, "epoch": 4942} {"train_loss": -7.348156929016113, "global_step": 207568, "epoch": 4942} {"train_loss": -7.310871124267578, "global_step": 207569, "epoch": 4942} {"train_loss": -7.472241401672363, "global_step": 207570, "epoch": 4942} {"train_loss": -7.270772933959961, "global_step": 207571, "epoch": 4942} {"train_loss": -7.445587635040283, "global_step": 207572, "epoch": 4942} {"train_loss": -7.318501949310303, "global_step": 207573, "epoch": 4942} {"train_loss": -7.23808479309082, "global_step": 207574, "epoch": 4942} {"train_loss": -7.328463554382324, "global_step": 207575, "epoch": 4942} {"train_loss": -7.387628078460693, "global_step": 207576, "epoch": 4942} {"train_loss": -7.203285217285156, "global_step": 207577, "epoch": 4942} {"train_loss": -7.292192459106445, "global_step": 207578, "epoch": 4942} {"train_loss": -7.297496318817139, "global_step": 207579, "epoch": 4942} {"train_loss": -7.210235595703125, "global_step": 207580, "epoch": 4942} {"train_loss": -7.250644683837891, "global_step": 207581, "epoch": 4942} {"train_loss": -7.210894584655762, "global_step": 207582, "epoch": 4942} {"train_loss": -7.0112624168396, "global_step": 207583, "epoch": 4942} {"train_loss": -7.3537917137146, "global_step": 207584, "epoch": 4942} {"train_loss": -7.1829376220703125, "global_step": 207585, "epoch": 4942} {"train_loss": -7.243474006652832, "global_step": 207586, "epoch": 4942} {"train_loss": -7.245266914367676, "global_step": 207587, "epoch": 4942} {"train_loss": -7.220256805419922, "global_step": 207588, "epoch": 4942} {"train_loss": -7.274688243865967, "global_step": 207589, "epoch": 4942} {"train_loss": -7.099714279174805, "global_step": 207590, "epoch": 4942} {"train_loss": -7.283463954925537, "global_step": 207591, "epoch": 4942} {"train_loss": -7.196849346160889, "global_step": 207592, "epoch": 4942} {"train_loss": -7.299373626708984, "global_step": 207593, "epoch": 4942} {"train_loss": -7.235446929931641, "global_step": 207594, "epoch": 4942} {"train_loss": -7.217804908752441, "global_step": 207595, "epoch": 4942} {"train_loss": -7.1526994705200195, "global_step": 207596, "epoch": 4942} {"train_loss": -7.199716567993164, "global_step": 207597, "epoch": 4942} {"train_loss": -7.167660236358643, "global_step": 207598, "epoch": 4942} {"train_loss": -7.136047840118408, "global_step": 207599, "epoch": 4942} {"train_loss": -7.166284561157227, "global_step": 207600, "epoch": 4942} {"train_loss": -7.196171760559082, "global_step": 207601, "epoch": 4942} {"train_loss": -7.222269058227539, "global_step": 207602, "epoch": 4942} {"train_loss": -7.238653659820557, "global_step": 207603, "epoch": 4942} {"train_loss": -7.263833522796631, "global_step": 207604, "epoch": 4942} {"train_loss": -7.260444266455514, "global_step": 207605, "epoch": 4942, "val_loss": 69950.7578125} {"train_loss": -7.297982692718506, "global_step": 207606, "epoch": 4943} {"train_loss": -7.297431945800781, "global_step": 207607, "epoch": 4943} {"train_loss": -7.331446647644043, "global_step": 207608, "epoch": 4943} {"train_loss": -7.269106864929199, "global_step": 207609, "epoch": 4943} {"train_loss": -7.3930816650390625, "global_step": 207610, "epoch": 4943} {"train_loss": -7.2549238204956055, "global_step": 207611, "epoch": 4943} {"train_loss": -7.389350891113281, "global_step": 207612, "epoch": 4943} {"train_loss": -7.357525825500488, "global_step": 207613, "epoch": 4943} {"train_loss": -7.351930618286133, "global_step": 207614, "epoch": 4943} {"train_loss": -7.281485557556152, "global_step": 207615, "epoch": 4943} {"train_loss": -7.241087913513184, "global_step": 207616, "epoch": 4943} {"train_loss": -7.363982200622559, "global_step": 207617, "epoch": 4943} {"train_loss": -7.356492042541504, "global_step": 207618, "epoch": 4943} {"train_loss": -7.366799831390381, "global_step": 207619, "epoch": 4943} {"train_loss": -7.33057165145874, "global_step": 207620, "epoch": 4943} {"train_loss": -7.4225873947143555, "global_step": 207621, "epoch": 4943} {"train_loss": -7.308320045471191, "global_step": 207622, "epoch": 4943} {"train_loss": -7.3991193771362305, "global_step": 207623, "epoch": 4943} {"train_loss": -7.306412696838379, "global_step": 207624, "epoch": 4943} {"train_loss": -7.255363941192627, "global_step": 207625, "epoch": 4943} {"train_loss": -7.324240207672119, "global_step": 207626, "epoch": 4943} {"train_loss": -7.388141632080078, "global_step": 207627, "epoch": 4943} {"train_loss": -7.43333101272583, "global_step": 207628, "epoch": 4943} {"train_loss": -7.399094581604004, "global_step": 207629, "epoch": 4943} {"train_loss": -7.373539447784424, "global_step": 207630, "epoch": 4943} {"train_loss": -7.443968772888184, "global_step": 207631, "epoch": 4943} {"train_loss": -7.324874401092529, "global_step": 207632, "epoch": 4943} {"train_loss": -7.386659622192383, "global_step": 207633, "epoch": 4943} {"train_loss": -7.339509010314941, "global_step": 207634, "epoch": 4943} {"train_loss": -7.304017066955566, "global_step": 207635, "epoch": 4943} {"train_loss": -7.340102195739746, "global_step": 207636, "epoch": 4943} {"train_loss": -7.451746940612793, "global_step": 207637, "epoch": 4943} {"train_loss": -7.290984630584717, "global_step": 207638, "epoch": 4943} {"train_loss": -7.355197906494141, "global_step": 207639, "epoch": 4943} {"train_loss": -7.318417549133301, "global_step": 207640, "epoch": 4943} {"train_loss": -7.2269287109375, "global_step": 207641, "epoch": 4943} {"train_loss": -7.317718505859375, "global_step": 207642, "epoch": 4943} {"train_loss": -7.25681209564209, "global_step": 207643, "epoch": 4943} {"train_loss": -7.221914291381836, "global_step": 207644, "epoch": 4943} {"train_loss": -7.2793450355529785, "global_step": 207645, "epoch": 4943} {"train_loss": -7.327338695526123, "global_step": 207646, "epoch": 4943} {"train_loss": -7.333233265649705, "global_step": 207647, "epoch": 4943, "val_loss": 69928.1875} {"train_loss": -7.3326263427734375, "global_step": 207648, "epoch": 4944} {"train_loss": -7.255531311035156, "global_step": 207649, "epoch": 4944} {"train_loss": -7.3185505867004395, "global_step": 207650, "epoch": 4944} {"train_loss": -7.353851795196533, "global_step": 207651, "epoch": 4944} {"train_loss": -7.313932418823242, "global_step": 207652, "epoch": 4944} {"train_loss": -7.328779220581055, "global_step": 207653, "epoch": 4944} {"train_loss": -7.340952396392822, "global_step": 207654, "epoch": 4944} {"train_loss": -7.251356601715088, "global_step": 207655, "epoch": 4944} {"train_loss": -7.395936489105225, "global_step": 207656, "epoch": 4944} {"train_loss": -7.358821868896484, "global_step": 207657, "epoch": 4944} {"train_loss": -7.253081321716309, "global_step": 207658, "epoch": 4944} {"train_loss": -7.230780601501465, "global_step": 207659, "epoch": 4944} {"train_loss": -7.33343505859375, "global_step": 207660, "epoch": 4944} {"train_loss": -7.2927045822143555, "global_step": 207661, "epoch": 4944} {"train_loss": -7.165152549743652, "global_step": 207662, "epoch": 4944} {"train_loss": -7.360677719116211, "global_step": 207663, "epoch": 4944} {"train_loss": -7.38523530960083, "global_step": 207664, "epoch": 4944} {"train_loss": -7.246071815490723, "global_step": 207665, "epoch": 4944} {"train_loss": -7.290462970733643, "global_step": 207666, "epoch": 4944} {"train_loss": -7.295351982116699, "global_step": 207667, "epoch": 4944} {"train_loss": -7.264777183532715, "global_step": 207668, "epoch": 4944} {"train_loss": -7.3047895431518555, "global_step": 207669, "epoch": 4944} {"train_loss": -7.31632137298584, "global_step": 207670, "epoch": 4944} {"train_loss": -7.348685264587402, "global_step": 207671, "epoch": 4944} {"train_loss": -7.2786030769348145, "global_step": 207672, "epoch": 4944} {"train_loss": -7.195246696472168, "global_step": 207673, "epoch": 4944} {"train_loss": -7.281573295593262, "global_step": 207674, "epoch": 4944} {"train_loss": -7.345280647277832, "global_step": 207675, "epoch": 4944} {"train_loss": -7.278388023376465, "global_step": 207676, "epoch": 4944} {"train_loss": -7.2095513343811035, "global_step": 207677, "epoch": 4944} {"train_loss": -7.294556140899658, "global_step": 207678, "epoch": 4944} {"train_loss": -7.190515518188477, "global_step": 207679, "epoch": 4944} {"train_loss": -7.2084574699401855, "global_step": 207680, "epoch": 4944} {"train_loss": -7.278015613555908, "global_step": 207681, "epoch": 4944} {"train_loss": -7.172573089599609, "global_step": 207682, "epoch": 4944} {"train_loss": -7.21665096282959, "global_step": 207683, "epoch": 4944} {"train_loss": -7.176665306091309, "global_step": 207684, "epoch": 4944} {"train_loss": -7.18632173538208, "global_step": 207685, "epoch": 4944} {"train_loss": -7.333286285400391, "global_step": 207686, "epoch": 4944} {"train_loss": -7.3407721519470215, "global_step": 207687, "epoch": 4944} {"train_loss": -7.285272598266602, "global_step": 207688, "epoch": 4944} {"train_loss": -7.283278737749372, "global_step": 207689, "epoch": 4944, "val_loss": 69954.890625} {"train_loss": -7.2872138023376465, "global_step": 207690, "epoch": 4945} {"train_loss": -7.341583251953125, "global_step": 207691, "epoch": 4945} {"train_loss": -7.339549541473389, "global_step": 207692, "epoch": 4945} {"train_loss": -7.263855934143066, "global_step": 207693, "epoch": 4945} {"train_loss": -7.345123291015625, "global_step": 207694, "epoch": 4945} {"train_loss": -7.2877349853515625, "global_step": 207695, "epoch": 4945} {"train_loss": -7.384905815124512, "global_step": 207696, "epoch": 4945} {"train_loss": -7.253584861755371, "global_step": 207697, "epoch": 4945} {"train_loss": -7.2482123374938965, "global_step": 207698, "epoch": 4945} {"train_loss": -7.18585729598999, "global_step": 207699, "epoch": 4945} {"train_loss": -7.207028388977051, "global_step": 207700, "epoch": 4945} {"train_loss": -7.281246662139893, "global_step": 207701, "epoch": 4945} {"train_loss": -7.238433837890625, "global_step": 207702, "epoch": 4945} {"train_loss": -7.4242401123046875, "global_step": 207703, "epoch": 4945} {"train_loss": -7.370975494384766, "global_step": 207704, "epoch": 4945} {"train_loss": -7.378177165985107, "global_step": 207705, "epoch": 4945} {"train_loss": -7.4022111892700195, "global_step": 207706, "epoch": 4945} {"train_loss": -7.274062156677246, "global_step": 207707, "epoch": 4945} {"train_loss": -7.464818000793457, "global_step": 207708, "epoch": 4945} {"train_loss": -7.256763935089111, "global_step": 207709, "epoch": 4945} {"train_loss": -7.2257585525512695, "global_step": 207710, "epoch": 4945} {"train_loss": -7.432933807373047, "global_step": 207711, "epoch": 4945} {"train_loss": -7.290660381317139, "global_step": 207712, "epoch": 4945} {"train_loss": -7.3404107093811035, "global_step": 207713, "epoch": 4945} {"train_loss": -7.334705352783203, "global_step": 207714, "epoch": 4945} {"train_loss": -7.227634906768799, "global_step": 207715, "epoch": 4945} {"train_loss": -7.354270935058594, "global_step": 207716, "epoch": 4945} {"train_loss": -7.392821311950684, "global_step": 207717, "epoch": 4945} {"train_loss": -7.375387668609619, "global_step": 207718, "epoch": 4945} {"train_loss": -7.342449188232422, "global_step": 207719, "epoch": 4945} {"train_loss": -7.381931781768799, "global_step": 207720, "epoch": 4945} {"train_loss": -7.297314643859863, "global_step": 207721, "epoch": 4945} {"train_loss": -7.197060585021973, "global_step": 207722, "epoch": 4945} {"train_loss": -7.2648749351501465, "global_step": 207723, "epoch": 4945} {"train_loss": -7.307670593261719, "global_step": 207724, "epoch": 4945} {"train_loss": -7.236641883850098, "global_step": 207725, "epoch": 4945} {"train_loss": -7.500244140625, "global_step": 207726, "epoch": 4945} {"train_loss": -7.282984256744385, "global_step": 207727, "epoch": 4945} {"train_loss": -7.246344566345215, "global_step": 207728, "epoch": 4945} {"train_loss": -7.3158063888549805, "global_step": 207729, "epoch": 4945} {"train_loss": -7.192560195922852, "global_step": 207730, "epoch": 4945} {"train_loss": -7.313597769964309, "global_step": 207731, "epoch": 4945, "val_loss": 70091.0078125} {"train_loss": -7.23490047454834, "global_step": 207732, "epoch": 4946} {"train_loss": -7.235248565673828, "global_step": 207733, "epoch": 4946} {"train_loss": -7.396455764770508, "global_step": 207734, "epoch": 4946} {"train_loss": -7.247159004211426, "global_step": 207735, "epoch": 4946} {"train_loss": -7.327141284942627, "global_step": 207736, "epoch": 4946} {"train_loss": -7.4032135009765625, "global_step": 207737, "epoch": 4946} {"train_loss": -7.334280967712402, "global_step": 207738, "epoch": 4946} {"train_loss": -7.426767349243164, "global_step": 207739, "epoch": 4946} {"train_loss": -7.358104705810547, "global_step": 207740, "epoch": 4946} {"train_loss": -7.378042221069336, "global_step": 207741, "epoch": 4946} {"train_loss": -7.36953592300415, "global_step": 207742, "epoch": 4946} {"train_loss": -7.345064640045166, "global_step": 207743, "epoch": 4946} {"train_loss": -7.301054000854492, "global_step": 207744, "epoch": 4946} {"train_loss": -7.405749320983887, "global_step": 207745, "epoch": 4946} {"train_loss": -7.460030555725098, "global_step": 207746, "epoch": 4946} {"train_loss": -7.246413230895996, "global_step": 207747, "epoch": 4946} {"train_loss": -7.234206199645996, "global_step": 207748, "epoch": 4946} {"train_loss": -7.343224048614502, "global_step": 207749, "epoch": 4946} {"train_loss": -7.1547698974609375, "global_step": 207750, "epoch": 4946} {"train_loss": -7.340670585632324, "global_step": 207751, "epoch": 4946} {"train_loss": -7.2673540115356445, "global_step": 207752, "epoch": 4946} {"train_loss": -7.20770263671875, "global_step": 207753, "epoch": 4946} {"train_loss": -7.269656181335449, "global_step": 207754, "epoch": 4946} {"train_loss": -7.384244918823242, "global_step": 207755, "epoch": 4946} {"train_loss": -7.32169771194458, "global_step": 207756, "epoch": 4946} {"train_loss": -7.192061901092529, "global_step": 207757, "epoch": 4946} {"train_loss": -7.239301681518555, "global_step": 207758, "epoch": 4946} {"train_loss": -7.301419734954834, "global_step": 207759, "epoch": 4946} {"train_loss": -7.191842555999756, "global_step": 207760, "epoch": 4946} {"train_loss": -7.277238845825195, "global_step": 207761, "epoch": 4946} {"train_loss": -7.195084571838379, "global_step": 207762, "epoch": 4946} {"train_loss": -7.194540023803711, "global_step": 207763, "epoch": 4946} {"train_loss": -7.2430806159973145, "global_step": 207764, "epoch": 4946} {"train_loss": -7.330212593078613, "global_step": 207765, "epoch": 4946} {"train_loss": -7.408024787902832, "global_step": 207766, "epoch": 4946} {"train_loss": -7.312984466552734, "global_step": 207767, "epoch": 4946} {"train_loss": -7.33359432220459, "global_step": 207768, "epoch": 4946} {"train_loss": -7.24318790435791, "global_step": 207769, "epoch": 4946} {"train_loss": -7.4151740074157715, "global_step": 207770, "epoch": 4946} {"train_loss": -7.454002857208252, "global_step": 207771, "epoch": 4946} {"train_loss": -7.305853366851807, "global_step": 207772, "epoch": 4946} {"train_loss": -7.311160882314046, "global_step": 207773, "epoch": 4946, "val_loss": 69953.671875} {"train_loss": -7.340418815612793, "global_step": 207774, "epoch": 4947} {"train_loss": -7.344470977783203, "global_step": 207775, "epoch": 4947} {"train_loss": -7.462431907653809, "global_step": 207776, "epoch": 4947} {"train_loss": -7.461007118225098, "global_step": 207777, "epoch": 4947} {"train_loss": -7.44948673248291, "global_step": 207778, "epoch": 4947} {"train_loss": -7.491756916046143, "global_step": 207779, "epoch": 4947} {"train_loss": -7.519283294677734, "global_step": 207780, "epoch": 4947} {"train_loss": -7.439349174499512, "global_step": 207781, "epoch": 4947} {"train_loss": -7.395449161529541, "global_step": 207782, "epoch": 4947} {"train_loss": -7.388975143432617, "global_step": 207783, "epoch": 4947} {"train_loss": -7.405388832092285, "global_step": 207784, "epoch": 4947} {"train_loss": -7.160036087036133, "global_step": 207785, "epoch": 4947} {"train_loss": -7.426172256469727, "global_step": 207786, "epoch": 4947} {"train_loss": -7.389652252197266, "global_step": 207787, "epoch": 4947} {"train_loss": -7.259577751159668, "global_step": 207788, "epoch": 4947} {"train_loss": -7.328857898712158, "global_step": 207789, "epoch": 4947} {"train_loss": -7.3894429206848145, "global_step": 207790, "epoch": 4947} {"train_loss": -7.452763557434082, "global_step": 207791, "epoch": 4947} {"train_loss": -7.341430187225342, "global_step": 207792, "epoch": 4947} {"train_loss": -7.447047710418701, "global_step": 207793, "epoch": 4947} {"train_loss": -7.368380546569824, "global_step": 207794, "epoch": 4947} {"train_loss": -7.289925575256348, "global_step": 207795, "epoch": 4947} {"train_loss": -7.328704833984375, "global_step": 207796, "epoch": 4947} {"train_loss": -7.392675399780273, "global_step": 207797, "epoch": 4947} {"train_loss": -7.354195594787598, "global_step": 207798, "epoch": 4947} {"train_loss": -7.42351770401001, "global_step": 207799, "epoch": 4947} {"train_loss": -7.342637062072754, "global_step": 207800, "epoch": 4947} {"train_loss": -7.3957366943359375, "global_step": 207801, "epoch": 4947} {"train_loss": -7.296026229858398, "global_step": 207802, "epoch": 4947} {"train_loss": -7.174258232116699, "global_step": 207803, "epoch": 4947} {"train_loss": -7.406299591064453, "global_step": 207804, "epoch": 4947} {"train_loss": -7.474313735961914, "global_step": 207805, "epoch": 4947} {"train_loss": -7.454193592071533, "global_step": 207806, "epoch": 4947} {"train_loss": -7.320724010467529, "global_step": 207807, "epoch": 4947} {"train_loss": -7.283824920654297, "global_step": 207808, "epoch": 4947} {"train_loss": -7.547624111175537, "global_step": 207809, "epoch": 4947} {"train_loss": -7.475671291351318, "global_step": 207810, "epoch": 4947} {"train_loss": -7.376662254333496, "global_step": 207811, "epoch": 4947} {"train_loss": -7.4031219482421875, "global_step": 207812, "epoch": 4947} {"train_loss": -7.432073593139648, "global_step": 207813, "epoch": 4947} {"train_loss": -7.3540873527526855, "global_step": 207814, "epoch": 4947} {"train_loss": -7.386167503538585, "global_step": 207815, "epoch": 4947, "val_loss": 69954.9453125} {"train_loss": -7.312625408172607, "global_step": 207816, "epoch": 4948} {"train_loss": -7.398260116577148, "global_step": 207817, "epoch": 4948} {"train_loss": -7.27042293548584, "global_step": 207818, "epoch": 4948} {"train_loss": -7.4862213134765625, "global_step": 207819, "epoch": 4948} {"train_loss": -7.444356918334961, "global_step": 207820, "epoch": 4948} {"train_loss": -7.442588806152344, "global_step": 207821, "epoch": 4948} {"train_loss": -7.309147357940674, "global_step": 207822, "epoch": 4948} {"train_loss": -7.294951438903809, "global_step": 207823, "epoch": 4948} {"train_loss": -7.463375568389893, "global_step": 207824, "epoch": 4948} {"train_loss": -7.278432846069336, "global_step": 207825, "epoch": 4948} {"train_loss": -7.285090446472168, "global_step": 207826, "epoch": 4948} {"train_loss": -7.249457836151123, "global_step": 207827, "epoch": 4948} {"train_loss": -7.3646135330200195, "global_step": 207828, "epoch": 4948} {"train_loss": -7.393665313720703, "global_step": 207829, "epoch": 4948} {"train_loss": -7.294130325317383, "global_step": 207830, "epoch": 4948} {"train_loss": -7.236640930175781, "global_step": 207831, "epoch": 4948} {"train_loss": -7.365910053253174, "global_step": 207832, "epoch": 4948} {"train_loss": -7.488804817199707, "global_step": 207833, "epoch": 4948} {"train_loss": -7.198227882385254, "global_step": 207834, "epoch": 4948} {"train_loss": -7.34115743637085, "global_step": 207835, "epoch": 4948} {"train_loss": -7.313037395477295, "global_step": 207836, "epoch": 4948} {"train_loss": -7.301189422607422, "global_step": 207837, "epoch": 4948} {"train_loss": -7.433280944824219, "global_step": 207838, "epoch": 4948} {"train_loss": -7.195730209350586, "global_step": 207839, "epoch": 4948} {"train_loss": -7.216266632080078, "global_step": 207840, "epoch": 4948} {"train_loss": -7.352790355682373, "global_step": 207841, "epoch": 4948} {"train_loss": -7.339280128479004, "global_step": 207842, "epoch": 4948} {"train_loss": -7.317492485046387, "global_step": 207843, "epoch": 4948} {"train_loss": -7.285922050476074, "global_step": 207844, "epoch": 4948} {"train_loss": -7.385564804077148, "global_step": 207845, "epoch": 4948} {"train_loss": -7.308475494384766, "global_step": 207846, "epoch": 4948} {"train_loss": -7.344662666320801, "global_step": 207847, "epoch": 4948} {"train_loss": -7.291422367095947, "global_step": 207848, "epoch": 4948} {"train_loss": -7.343567371368408, "global_step": 207849, "epoch": 4948} {"train_loss": -7.291323661804199, "global_step": 207850, "epoch": 4948} {"train_loss": -7.25352144241333, "global_step": 207851, "epoch": 4948} {"train_loss": -7.232749938964844, "global_step": 207852, "epoch": 4948} {"train_loss": -7.287951469421387, "global_step": 207853, "epoch": 4948} {"train_loss": -7.17665958404541, "global_step": 207854, "epoch": 4948} {"train_loss": -7.173549175262451, "global_step": 207855, "epoch": 4948} {"train_loss": -7.308865547180176, "global_step": 207856, "epoch": 4948} {"train_loss": -7.3153121812003, "global_step": 207857, "epoch": 4948, "val_loss": 70091.7734375} {"train_loss": -7.158985614776611, "global_step": 207858, "epoch": 4949} {"train_loss": -7.293339729309082, "global_step": 207859, "epoch": 4949} {"train_loss": -7.04299783706665, "global_step": 207860, "epoch": 4949} {"train_loss": -7.184010028839111, "global_step": 207861, "epoch": 4949} {"train_loss": -7.2135820388793945, "global_step": 207862, "epoch": 4949} {"train_loss": -7.094134330749512, "global_step": 207863, "epoch": 4949} {"train_loss": -7.281323432922363, "global_step": 207864, "epoch": 4949} {"train_loss": -7.024906158447266, "global_step": 207865, "epoch": 4949} {"train_loss": -7.058152198791504, "global_step": 207866, "epoch": 4949} {"train_loss": -7.1826605796813965, "global_step": 207867, "epoch": 4949} {"train_loss": -7.117725849151611, "global_step": 207868, "epoch": 4949} {"train_loss": -7.16703987121582, "global_step": 207869, "epoch": 4949} {"train_loss": -7.0845465660095215, "global_step": 207870, "epoch": 4949} {"train_loss": -7.178112983703613, "global_step": 207871, "epoch": 4949} {"train_loss": -7.186919212341309, "global_step": 207872, "epoch": 4949} {"train_loss": -7.236127853393555, "global_step": 207873, "epoch": 4949} {"train_loss": -7.171483993530273, "global_step": 207874, "epoch": 4949} {"train_loss": -7.245245456695557, "global_step": 207875, "epoch": 4949} {"train_loss": -7.163454055786133, "global_step": 207876, "epoch": 4949} {"train_loss": -7.314567565917969, "global_step": 207877, "epoch": 4949} {"train_loss": -7.183812618255615, "global_step": 207878, "epoch": 4949} {"train_loss": -7.300288200378418, "global_step": 207879, "epoch": 4949} {"train_loss": -7.2880425453186035, "global_step": 207880, "epoch": 4949} {"train_loss": -7.331674575805664, "global_step": 207881, "epoch": 4949} {"train_loss": -7.280226707458496, "global_step": 207882, "epoch": 4949} {"train_loss": -7.310291290283203, "global_step": 207883, "epoch": 4949} {"train_loss": -7.293914318084717, "global_step": 207884, "epoch": 4949} {"train_loss": -7.307514190673828, "global_step": 207885, "epoch": 4949} {"train_loss": -7.397857666015625, "global_step": 207886, "epoch": 4949} {"train_loss": -7.380007743835449, "global_step": 207887, "epoch": 4949} {"train_loss": -7.338639259338379, "global_step": 207888, "epoch": 4949} {"train_loss": -7.366819381713867, "global_step": 207889, "epoch": 4949} {"train_loss": -7.256130218505859, "global_step": 207890, "epoch": 4949} {"train_loss": -7.32114315032959, "global_step": 207891, "epoch": 4949} {"train_loss": -7.297998905181885, "global_step": 207892, "epoch": 4949} {"train_loss": -7.250283718109131, "global_step": 207893, "epoch": 4949} {"train_loss": -7.307187080383301, "global_step": 207894, "epoch": 4949} {"train_loss": -7.374885082244873, "global_step": 207895, "epoch": 4949} {"train_loss": -7.4350762367248535, "global_step": 207896, "epoch": 4949} {"train_loss": -7.349145889282227, "global_step": 207897, "epoch": 4949} {"train_loss": -7.306946277618408, "global_step": 207898, "epoch": 4949} {"train_loss": -7.248418887456258, "global_step": 207899, "epoch": 4949, "val_loss": 69987.6328125} {"train_loss": -7.425750732421875, "global_step": 207900, "epoch": 4950} {"train_loss": -7.209447383880615, "global_step": 207901, "epoch": 4950} {"train_loss": -7.283393859863281, "global_step": 207902, "epoch": 4950} {"train_loss": -7.259363174438477, "global_step": 207903, "epoch": 4950} {"train_loss": -7.3615617752075195, "global_step": 207904, "epoch": 4950} {"train_loss": -7.343465328216553, "global_step": 207905, "epoch": 4950} {"train_loss": -7.466284275054932, "global_step": 207906, "epoch": 4950} {"train_loss": -7.378695487976074, "global_step": 207907, "epoch": 4950} {"train_loss": -7.392650127410889, "global_step": 207908, "epoch": 4950} {"train_loss": -7.398359298706055, "global_step": 207909, "epoch": 4950} {"train_loss": -7.260851860046387, "global_step": 207910, "epoch": 4950} {"train_loss": -7.4011335372924805, "global_step": 207911, "epoch": 4950} {"train_loss": -7.323524475097656, "global_step": 207912, "epoch": 4950} {"train_loss": -7.439648151397705, "global_step": 207913, "epoch": 4950} {"train_loss": -7.364676475524902, "global_step": 207914, "epoch": 4950} {"train_loss": -7.412250995635986, "global_step": 207915, "epoch": 4950} {"train_loss": -7.306262969970703, "global_step": 207916, "epoch": 4950} {"train_loss": -7.364527702331543, "global_step": 207917, "epoch": 4950} {"train_loss": -7.370975017547607, "global_step": 207918, "epoch": 4950} {"train_loss": -7.3388776779174805, "global_step": 207919, "epoch": 4950} {"train_loss": -7.368277549743652, "global_step": 207920, "epoch": 4950} {"train_loss": -7.4668192863464355, "global_step": 207921, "epoch": 4950} {"train_loss": -7.453070163726807, "global_step": 207922, "epoch": 4950} {"train_loss": -7.4147210121154785, "global_step": 207923, "epoch": 4950} {"train_loss": -7.331327438354492, "global_step": 207924, "epoch": 4950} {"train_loss": -7.344372272491455, "global_step": 207925, "epoch": 4950} {"train_loss": -7.3679118156433105, "global_step": 207926, "epoch": 4950} {"train_loss": -7.455679893493652, "global_step": 207927, "epoch": 4950} {"train_loss": -7.427950859069824, "global_step": 207928, "epoch": 4950} {"train_loss": -7.367587566375732, "global_step": 207929, "epoch": 4950} {"train_loss": -7.364312648773193, "global_step": 207930, "epoch": 4950} {"train_loss": -7.358320236206055, "global_step": 207931, "epoch": 4950} {"train_loss": -7.326133728027344, "global_step": 207932, "epoch": 4950} {"train_loss": -7.364831924438477, "global_step": 207933, "epoch": 4950} {"train_loss": -7.346306800842285, "global_step": 207934, "epoch": 4950} {"train_loss": -7.250527381896973, "global_step": 207935, "epoch": 4950} {"train_loss": -7.331240653991699, "global_step": 207936, "epoch": 4950} {"train_loss": -7.299408435821533, "global_step": 207937, "epoch": 4950} {"train_loss": -7.349210739135742, "global_step": 207938, "epoch": 4950} {"train_loss": -7.323590278625488, "global_step": 207939, "epoch": 4950} {"train_loss": -7.37986946105957, "global_step": 207940, "epoch": 4950} {"train_loss": -7.360199133555095, "global_step": 207941, "epoch": 4950, "train/sim_max_reward_0": 0.19221671363608395, "train/sim_max_reward_1": 0.9847618687852417, "train/sim_max_reward_2": 0.5521983057582902, "train/sim_max_reward_3": 0.9039857585389625, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.866298793549961, "test/sim_max_reward_4300000": 0.9624956860779058, "test/sim_max_reward_4300001": 0.5613417818225477, "test/sim_max_reward_4300002": 1.0, "test/sim_max_reward_4300003": 1.0, "test/sim_max_reward_4300004": 0.015834104809286244, "test/sim_max_reward_4300005": 0.9616234196401635, "test/sim_max_reward_4300006": 0.15748915675514083, "test/sim_max_reward_4300007": 0.29168526520989013, "test/sim_max_reward_4300008": 0.943740449221737, "test/sim_max_reward_4300009": 1.0, "test/sim_max_reward_4300010": 1.0, "test/sim_max_reward_4300011": 1.0, "test/sim_max_reward_4300012": 0.9012291676041357, "test/sim_max_reward_4300013": 1.0, "test/sim_max_reward_4300014": 0.9860772179465602, "test/sim_max_reward_4300015": 0.9793396540080519, "test/sim_max_reward_4300016": 0.9654753399672859, "test/sim_max_reward_4300017": 0.9630847438412121, "test/sim_max_reward_4300018": 0.39737852880416913, "test/sim_max_reward_4300019": 0.18619874520187893, "test/sim_max_reward_4300020": 0.0, "test/sim_max_reward_4300021": 0.971402993093506, "test/sim_max_reward_4300022": 0.9493783356989384, "test/sim_max_reward_4300023": 0.734277198328677, "test/sim_max_reward_4300024": 0.9931426767353195, "test/sim_max_reward_4300025": 0.9908487846663685, "test/sim_max_reward_4300026": 0.181619718322149, "test/sim_max_reward_4300027": 0.8041120943658803, "test/sim_max_reward_4300028": 0.9563071853019137, "test/sim_max_reward_4300029": 0.0, "test/sim_max_reward_4300030": 0.2630862592849014, "test/sim_max_reward_4300031": 0.4343683036428075, "test/sim_max_reward_4300032": 0.9979157049144313, "test/sim_max_reward_4300033": 0.7245951331292722, "test/sim_max_reward_4300034": 0.2680312661138692, "test/sim_max_reward_4300035": 0.8821918202362663, "test/sim_max_reward_4300036": 0.22116569481390422, "test/sim_max_reward_4300037": 0.8653992684057675, "test/sim_max_reward_4300038": 1.0, "test/sim_max_reward_4300039": 0.8034919469994284, "test/sim_max_reward_4300040": 0.9559651283733546, "test/sim_max_reward_4300041": 0.0, "test/sim_max_reward_4300042": 0.5935289725062194, "test/sim_max_reward_4300043": 0.09596200835008387, "test/sim_max_reward_4300044": 0.9547923812962508, "test/sim_max_reward_4300045": 0.9987138157598552, "test/sim_max_reward_4300046": 0.8702698620852624, "test/sim_max_reward_4300047": 0.13396666543624805, "test/sim_max_reward_4300048": 0.02511439497804281, "test/sim_max_reward_4300049": 0.15769345873592971, "train/mean_score": 0.7499102400447565, "test/mean_score": 0.6620066866496921, "val_loss": 69952.6953125} {"train_loss": -7.357501983642578, "global_step": 207942, "epoch": 4951} {"train_loss": -7.224579334259033, "global_step": 207943, "epoch": 4951} {"train_loss": -7.361559867858887, "global_step": 207944, "epoch": 4951} {"train_loss": -7.4965081214904785, "global_step": 207945, "epoch": 4951} {"train_loss": -7.335963249206543, "global_step": 207946, "epoch": 4951} {"train_loss": -7.336393356323242, "global_step": 207947, "epoch": 4951} {"train_loss": -7.296408653259277, "global_step": 207948, "epoch": 4951} {"train_loss": -7.181139945983887, "global_step": 207949, "epoch": 4951} {"train_loss": -7.35825252532959, "global_step": 207950, "epoch": 4951} {"train_loss": -7.381283283233643, "global_step": 207951, "epoch": 4951} {"train_loss": -7.361176490783691, "global_step": 207952, "epoch": 4951} {"train_loss": -7.432010650634766, "global_step": 207953, "epoch": 4951} {"train_loss": -7.397528648376465, "global_step": 207954, "epoch": 4951} {"train_loss": -7.221038818359375, "global_step": 207955, "epoch": 4951} {"train_loss": -7.319721221923828, "global_step": 207956, "epoch": 4951} {"train_loss": -7.328890323638916, "global_step": 207957, "epoch": 4951} {"train_loss": -7.232904434204102, "global_step": 207958, "epoch": 4951} {"train_loss": -7.323134422302246, "global_step": 207959, "epoch": 4951} {"train_loss": -7.275821685791016, "global_step": 207960, "epoch": 4951} {"train_loss": -7.34397029876709, "global_step": 207961, "epoch": 4951} {"train_loss": -7.257805824279785, "global_step": 207962, "epoch": 4951} {"train_loss": -7.1616926193237305, "global_step": 207963, "epoch": 4951} {"train_loss": -7.303159713745117, "global_step": 207964, "epoch": 4951} {"train_loss": -7.251009941101074, "global_step": 207965, "epoch": 4951} {"train_loss": -7.294422149658203, "global_step": 207966, "epoch": 4951} {"train_loss": -7.31380033493042, "global_step": 207967, "epoch": 4951} {"train_loss": -7.247132778167725, "global_step": 207968, "epoch": 4951} {"train_loss": -7.24305534362793, "global_step": 207969, "epoch": 4951} {"train_loss": -7.352360725402832, "global_step": 207970, "epoch": 4951} {"train_loss": -7.316550254821777, "global_step": 207971, "epoch": 4951} {"train_loss": -7.233895778656006, "global_step": 207972, "epoch": 4951} {"train_loss": -7.227222919464111, "global_step": 207973, "epoch": 4951} {"train_loss": -7.226339817047119, "global_step": 207974, "epoch": 4951} {"train_loss": -7.332571029663086, "global_step": 207975, "epoch": 4951} {"train_loss": -7.267256736755371, "global_step": 207976, "epoch": 4951} {"train_loss": -7.232572078704834, "global_step": 207977, "epoch": 4951} {"train_loss": -7.296639442443848, "global_step": 207978, "epoch": 4951} {"train_loss": -7.281641483306885, "global_step": 207979, "epoch": 4951} {"train_loss": -7.322994232177734, "global_step": 207980, "epoch": 4951} {"train_loss": -7.242304801940918, "global_step": 207981, "epoch": 4951} {"train_loss": -7.297798156738281, "global_step": 207982, "epoch": 4951} {"train_loss": -7.298773459025791, "global_step": 207983, "epoch": 4951, "val_loss": 69899.3046875} {"train_loss": -7.286619186401367, "global_step": 207984, "epoch": 4952} {"train_loss": -7.359567642211914, "global_step": 207985, "epoch": 4952} {"train_loss": -7.322722911834717, "global_step": 207986, "epoch": 4952} {"train_loss": -7.363923072814941, "global_step": 207987, "epoch": 4952} {"train_loss": -7.257570266723633, "global_step": 207988, "epoch": 4952} {"train_loss": -7.235624313354492, "global_step": 207989, "epoch": 4952} {"train_loss": -7.307775497436523, "global_step": 207990, "epoch": 4952} {"train_loss": -7.423425674438477, "global_step": 207991, "epoch": 4952} {"train_loss": -7.302831649780273, "global_step": 207992, "epoch": 4952} {"train_loss": -7.250547885894775, "global_step": 207993, "epoch": 4952} {"train_loss": -7.376255512237549, "global_step": 207994, "epoch": 4952} {"train_loss": -7.3841447830200195, "global_step": 207995, "epoch": 4952} {"train_loss": -7.344916343688965, "global_step": 207996, "epoch": 4952} {"train_loss": -7.167713165283203, "global_step": 207997, "epoch": 4952} {"train_loss": -7.363306999206543, "global_step": 207998, "epoch": 4952} {"train_loss": -7.26563835144043, "global_step": 207999, "epoch": 4952} {"train_loss": -7.365785598754883, "global_step": 208000, "epoch": 4952} {"train_loss": -7.328932762145996, "global_step": 208001, "epoch": 4952} {"train_loss": -7.303211212158203, "global_step": 208002, "epoch": 4952} {"train_loss": -7.426705360412598, "global_step": 208003, "epoch": 4952} {"train_loss": -7.337151050567627, "global_step": 208004, "epoch": 4952} {"train_loss": -7.4362359046936035, "global_step": 208005, "epoch": 4952} {"train_loss": -7.36014986038208, "global_step": 208006, "epoch": 4952} {"train_loss": -7.444875717163086, "global_step": 208007, "epoch": 4952} {"train_loss": -7.456829071044922, "global_step": 208008, "epoch": 4952} {"train_loss": -7.3885698318481445, "global_step": 208009, "epoch": 4952} {"train_loss": -7.413331031799316, "global_step": 208010, "epoch": 4952} {"train_loss": -7.401771545410156, "global_step": 208011, "epoch": 4952} {"train_loss": -7.508496284484863, "global_step": 208012, "epoch": 4952} {"train_loss": -7.3445258140563965, "global_step": 208013, "epoch": 4952} {"train_loss": -7.2789626121521, "global_step": 208014, "epoch": 4952} {"train_loss": -7.370004177093506, "global_step": 208015, "epoch": 4952} {"train_loss": -7.345635890960693, "global_step": 208016, "epoch": 4952} {"train_loss": -7.437127590179443, "global_step": 208017, "epoch": 4952} {"train_loss": -7.383788585662842, "global_step": 208018, "epoch": 4952} {"train_loss": -7.284804821014404, "global_step": 208019, "epoch": 4952} {"train_loss": -7.28521203994751, "global_step": 208020, "epoch": 4952} {"train_loss": -7.363778114318848, "global_step": 208021, "epoch": 4952} {"train_loss": -7.3655853271484375, "global_step": 208022, "epoch": 4952} {"train_loss": -7.272404670715332, "global_step": 208023, "epoch": 4952} {"train_loss": -7.3652496337890625, "global_step": 208024, "epoch": 4952} {"train_loss": -7.344294593447731, "global_step": 208025, "epoch": 4952, "val_loss": 70081.140625} {"train_loss": -7.234860420227051, "global_step": 208026, "epoch": 4953} {"train_loss": -7.234748840332031, "global_step": 208027, "epoch": 4953} {"train_loss": -7.2442240715026855, "global_step": 208028, "epoch": 4953} {"train_loss": -7.503475189208984, "global_step": 208029, "epoch": 4953} {"train_loss": -7.157251358032227, "global_step": 208030, "epoch": 4953} {"train_loss": -7.199516296386719, "global_step": 208031, "epoch": 4953} {"train_loss": -7.271378517150879, "global_step": 208032, "epoch": 4953} {"train_loss": -7.19085693359375, "global_step": 208033, "epoch": 4953} {"train_loss": -7.180412769317627, "global_step": 208034, "epoch": 4953} {"train_loss": -7.222722053527832, "global_step": 208035, "epoch": 4953} {"train_loss": -7.3119096755981445, "global_step": 208036, "epoch": 4953} {"train_loss": -7.166820526123047, "global_step": 208037, "epoch": 4953} {"train_loss": -7.310130596160889, "global_step": 208038, "epoch": 4953} {"train_loss": -7.223506927490234, "global_step": 208039, "epoch": 4953} {"train_loss": -7.237309455871582, "global_step": 208040, "epoch": 4953} {"train_loss": -7.282327175140381, "global_step": 208041, "epoch": 4953} {"train_loss": -7.268994331359863, "global_step": 208042, "epoch": 4953} {"train_loss": -7.235867500305176, "global_step": 208043, "epoch": 4953} {"train_loss": -7.317933559417725, "global_step": 208044, "epoch": 4953} {"train_loss": -7.278517723083496, "global_step": 208045, "epoch": 4953} {"train_loss": -7.252040863037109, "global_step": 208046, "epoch": 4953} {"train_loss": -7.316775321960449, "global_step": 208047, "epoch": 4953} {"train_loss": -7.254133224487305, "global_step": 208048, "epoch": 4953} {"train_loss": -7.417916774749756, "global_step": 208049, "epoch": 4953} {"train_loss": -7.16644287109375, "global_step": 208050, "epoch": 4953} {"train_loss": -7.234853744506836, "global_step": 208051, "epoch": 4953} {"train_loss": -7.302837371826172, "global_step": 208052, "epoch": 4953} {"train_loss": -7.271973609924316, "global_step": 208053, "epoch": 4953} {"train_loss": -7.284487247467041, "global_step": 208054, "epoch": 4953} {"train_loss": -7.310847282409668, "global_step": 208055, "epoch": 4953} {"train_loss": -7.319502830505371, "global_step": 208056, "epoch": 4953} {"train_loss": -7.3381028175354, "global_step": 208057, "epoch": 4953} {"train_loss": -7.350573539733887, "global_step": 208058, "epoch": 4953} {"train_loss": -7.154060363769531, "global_step": 208059, "epoch": 4953} {"train_loss": -7.276878356933594, "global_step": 208060, "epoch": 4953} {"train_loss": -7.326773643493652, "global_step": 208061, "epoch": 4953} {"train_loss": -7.341835021972656, "global_step": 208062, "epoch": 4953} {"train_loss": -7.362379550933838, "global_step": 208063, "epoch": 4953} {"train_loss": -7.365268707275391, "global_step": 208064, "epoch": 4953} {"train_loss": -7.304915428161621, "global_step": 208065, "epoch": 4953} {"train_loss": -7.289207458496094, "global_step": 208066, "epoch": 4953} {"train_loss": -7.2781906354995005, "global_step": 208067, "epoch": 4953, "val_loss": 69882.1796875} {"train_loss": -7.377172946929932, "global_step": 208068, "epoch": 4954} {"train_loss": -7.293398857116699, "global_step": 208069, "epoch": 4954} {"train_loss": -7.338642120361328, "global_step": 208070, "epoch": 4954} {"train_loss": -7.410691261291504, "global_step": 208071, "epoch": 4954} {"train_loss": -7.233678817749023, "global_step": 208072, "epoch": 4954} {"train_loss": -7.4591064453125, "global_step": 208073, "epoch": 4954} {"train_loss": -7.386646747589111, "global_step": 208074, "epoch": 4954} {"train_loss": -7.315248489379883, "global_step": 208075, "epoch": 4954} {"train_loss": -7.320199012756348, "global_step": 208076, "epoch": 4954} {"train_loss": -7.485569000244141, "global_step": 208077, "epoch": 4954} {"train_loss": -7.341638565063477, "global_step": 208078, "epoch": 4954} {"train_loss": -7.361326694488525, "global_step": 208079, "epoch": 4954} {"train_loss": -7.396015644073486, "global_step": 208080, "epoch": 4954} {"train_loss": -7.354305267333984, "global_step": 208081, "epoch": 4954} {"train_loss": -7.365182876586914, "global_step": 208082, "epoch": 4954} {"train_loss": -7.39919376373291, "global_step": 208083, "epoch": 4954} {"train_loss": -7.417912483215332, "global_step": 208084, "epoch": 4954} {"train_loss": -7.386486530303955, "global_step": 208085, "epoch": 4954} {"train_loss": -7.427460193634033, "global_step": 208086, "epoch": 4954} {"train_loss": -7.289142608642578, "global_step": 208087, "epoch": 4954} {"train_loss": -7.332096099853516, "global_step": 208088, "epoch": 4954} {"train_loss": -7.4182233810424805, "global_step": 208089, "epoch": 4954} {"train_loss": -7.324383735656738, "global_step": 208090, "epoch": 4954} {"train_loss": -7.367806434631348, "global_step": 208091, "epoch": 4954} {"train_loss": -7.32451057434082, "global_step": 208092, "epoch": 4954} {"train_loss": -7.378303527832031, "global_step": 208093, "epoch": 4954} {"train_loss": -7.356667518615723, "global_step": 208094, "epoch": 4954} {"train_loss": -7.4878458976745605, "global_step": 208095, "epoch": 4954} {"train_loss": -7.389518737792969, "global_step": 208096, "epoch": 4954} {"train_loss": -7.448285102844238, "global_step": 208097, "epoch": 4954} {"train_loss": -7.3803629875183105, "global_step": 208098, "epoch": 4954} {"train_loss": -7.3609299659729, "global_step": 208099, "epoch": 4954} {"train_loss": -7.434310436248779, "global_step": 208100, "epoch": 4954} {"train_loss": -7.352146148681641, "global_step": 208101, "epoch": 4954} {"train_loss": -7.377097129821777, "global_step": 208102, "epoch": 4954} {"train_loss": -7.36480712890625, "global_step": 208103, "epoch": 4954} {"train_loss": -7.377805709838867, "global_step": 208104, "epoch": 4954} {"train_loss": -7.370582580566406, "global_step": 208105, "epoch": 4954} {"train_loss": -7.386789321899414, "global_step": 208106, "epoch": 4954} {"train_loss": -7.2867865562438965, "global_step": 208107, "epoch": 4954} {"train_loss": -7.354919910430908, "global_step": 208108, "epoch": 4954} {"train_loss": -7.370315108980451, "global_step": 208109, "epoch": 4954, "val_loss": 70186.28125} {"train_loss": -7.320860862731934, "global_step": 208110, "epoch": 4955} {"train_loss": -7.372859954833984, "global_step": 208111, "epoch": 4955} {"train_loss": -7.4601569175720215, "global_step": 208112, "epoch": 4955} {"train_loss": -7.2983856201171875, "global_step": 208113, "epoch": 4955} {"train_loss": -7.237587928771973, "global_step": 208114, "epoch": 4955} {"train_loss": -7.414624214172363, "global_step": 208115, "epoch": 4955} {"train_loss": -7.2483601570129395, "global_step": 208116, "epoch": 4955} {"train_loss": -7.205232620239258, "global_step": 208117, "epoch": 4955} {"train_loss": -7.292017936706543, "global_step": 208118, "epoch": 4955} {"train_loss": -7.122941017150879, "global_step": 208119, "epoch": 4955} {"train_loss": -7.211010932922363, "global_step": 208120, "epoch": 4955} {"train_loss": -7.352816581726074, "global_step": 208121, "epoch": 4955} {"train_loss": -7.187021732330322, "global_step": 208122, "epoch": 4955} {"train_loss": -7.254860877990723, "global_step": 208123, "epoch": 4955} {"train_loss": -7.352374076843262, "global_step": 208124, "epoch": 4955} {"train_loss": -7.298501014709473, "global_step": 208125, "epoch": 4955} {"train_loss": -7.371065139770508, "global_step": 208126, "epoch": 4955} {"train_loss": -7.3673810958862305, "global_step": 208127, "epoch": 4955} {"train_loss": -7.358248233795166, "global_step": 208128, "epoch": 4955} {"train_loss": -7.31386661529541, "global_step": 208129, "epoch": 4955} {"train_loss": -7.31813907623291, "global_step": 208130, "epoch": 4955} {"train_loss": -7.346063613891602, "global_step": 208131, "epoch": 4955} {"train_loss": -7.342682361602783, "global_step": 208132, "epoch": 4955} {"train_loss": -7.44073486328125, "global_step": 208133, "epoch": 4955} {"train_loss": -7.306734085083008, "global_step": 208134, "epoch": 4955} {"train_loss": -7.352307319641113, "global_step": 208135, "epoch": 4955} {"train_loss": -7.381977558135986, "global_step": 208136, "epoch": 4955} {"train_loss": -7.356978416442871, "global_step": 208137, "epoch": 4955} {"train_loss": -7.470846176147461, "global_step": 208138, "epoch": 4955} {"train_loss": -7.388579845428467, "global_step": 208139, "epoch": 4955} {"train_loss": -7.389748573303223, "global_step": 208140, "epoch": 4955} {"train_loss": -7.403119087219238, "global_step": 208141, "epoch": 4955} {"train_loss": -7.34411096572876, "global_step": 208142, "epoch": 4955} {"train_loss": -7.235232353210449, "global_step": 208143, "epoch": 4955} {"train_loss": -7.346628665924072, "global_step": 208144, "epoch": 4955} {"train_loss": -7.519947052001953, "global_step": 208145, "epoch": 4955} {"train_loss": -7.384986400604248, "global_step": 208146, "epoch": 4955} {"train_loss": -7.286710739135742, "global_step": 208147, "epoch": 4955} {"train_loss": -7.338242530822754, "global_step": 208148, "epoch": 4955} {"train_loss": -7.218144416809082, "global_step": 208149, "epoch": 4955} {"train_loss": -7.233325958251953, "global_step": 208150, "epoch": 4955} {"train_loss": -7.325426692054386, "global_step": 208151, "epoch": 4955, "val_loss": 69860.515625} {"train_loss": -7.404731750488281, "global_step": 208152, "epoch": 4956} {"train_loss": -7.132106781005859, "global_step": 208153, "epoch": 4956} {"train_loss": -7.292357921600342, "global_step": 208154, "epoch": 4956} {"train_loss": -7.3649091720581055, "global_step": 208155, "epoch": 4956} {"train_loss": -7.101956367492676, "global_step": 208156, "epoch": 4956} {"train_loss": -7.352312088012695, "global_step": 208157, "epoch": 4956} {"train_loss": -7.150203704833984, "global_step": 208158, "epoch": 4956} {"train_loss": -7.071188926696777, "global_step": 208159, "epoch": 4956} {"train_loss": -7.263952732086182, "global_step": 208160, "epoch": 4956} {"train_loss": -7.127664566040039, "global_step": 208161, "epoch": 4956} {"train_loss": -7.190926551818848, "global_step": 208162, "epoch": 4956} {"train_loss": -7.24018669128418, "global_step": 208163, "epoch": 4956} {"train_loss": -7.085269927978516, "global_step": 208164, "epoch": 4956} {"train_loss": -7.342189788818359, "global_step": 208165, "epoch": 4956} {"train_loss": -7.009331226348877, "global_step": 208166, "epoch": 4956} {"train_loss": -7.206873893737793, "global_step": 208167, "epoch": 4956} {"train_loss": -7.108969688415527, "global_step": 208168, "epoch": 4956} {"train_loss": -7.182772636413574, "global_step": 208169, "epoch": 4956} {"train_loss": -7.174458026885986, "global_step": 208170, "epoch": 4956} {"train_loss": -7.175442218780518, "global_step": 208171, "epoch": 4956} {"train_loss": -7.21349573135376, "global_step": 208172, "epoch": 4956} {"train_loss": -7.1929850578308105, "global_step": 208173, "epoch": 4956} {"train_loss": -7.192184925079346, "global_step": 208174, "epoch": 4956} {"train_loss": -7.169947624206543, "global_step": 208175, "epoch": 4956} {"train_loss": -7.229117393493652, "global_step": 208176, "epoch": 4956} {"train_loss": -7.176286697387695, "global_step": 208177, "epoch": 4956} {"train_loss": -7.258271217346191, "global_step": 208178, "epoch": 4956} {"train_loss": -7.154069900512695, "global_step": 208179, "epoch": 4956} {"train_loss": -7.142172813415527, "global_step": 208180, "epoch": 4956} {"train_loss": -7.2117767333984375, "global_step": 208181, "epoch": 4956} {"train_loss": -7.239110946655273, "global_step": 208182, "epoch": 4956} {"train_loss": -7.120876312255859, "global_step": 208183, "epoch": 4956} {"train_loss": -7.319031238555908, "global_step": 208184, "epoch": 4956} {"train_loss": -7.130955696105957, "global_step": 208185, "epoch": 4956} {"train_loss": -7.262971878051758, "global_step": 208186, "epoch": 4956} {"train_loss": -7.193612575531006, "global_step": 208187, "epoch": 4956} {"train_loss": -7.272159576416016, "global_step": 208188, "epoch": 4956} {"train_loss": -7.258108615875244, "global_step": 208189, "epoch": 4956} {"train_loss": -7.308794021606445, "global_step": 208190, "epoch": 4956} {"train_loss": -7.308923244476318, "global_step": 208191, "epoch": 4956} {"train_loss": -7.1568145751953125, "global_step": 208192, "epoch": 4956} {"train_loss": -7.205823307945614, "global_step": 208193, "epoch": 4956, "val_loss": 69841.0078125} {"train_loss": -7.407647609710693, "global_step": 208194, "epoch": 4957} {"train_loss": -7.348297119140625, "global_step": 208195, "epoch": 4957} {"train_loss": -7.268241882324219, "global_step": 208196, "epoch": 4957} {"train_loss": -7.388731002807617, "global_step": 208197, "epoch": 4957} {"train_loss": -7.27006196975708, "global_step": 208198, "epoch": 4957} {"train_loss": -7.2567267417907715, "global_step": 208199, "epoch": 4957} {"train_loss": -7.277153968811035, "global_step": 208200, "epoch": 4957} {"train_loss": -7.379114151000977, "global_step": 208201, "epoch": 4957} {"train_loss": -7.258702278137207, "global_step": 208202, "epoch": 4957} {"train_loss": -7.296599388122559, "global_step": 208203, "epoch": 4957} {"train_loss": -7.317478179931641, "global_step": 208204, "epoch": 4957} {"train_loss": -7.162399768829346, "global_step": 208205, "epoch": 4957} {"train_loss": -7.344184398651123, "global_step": 208206, "epoch": 4957} {"train_loss": -7.308097839355469, "global_step": 208207, "epoch": 4957} {"train_loss": -7.288971900939941, "global_step": 208208, "epoch": 4957} {"train_loss": -7.3010101318359375, "global_step": 208209, "epoch": 4957} {"train_loss": -7.313641548156738, "global_step": 208210, "epoch": 4957} {"train_loss": -7.1794281005859375, "global_step": 208211, "epoch": 4957} {"train_loss": -7.255903720855713, "global_step": 208212, "epoch": 4957} {"train_loss": -7.427577495574951, "global_step": 208213, "epoch": 4957} {"train_loss": -7.154132843017578, "global_step": 208214, "epoch": 4957} {"train_loss": -7.0156025886535645, "global_step": 208215, "epoch": 4957} {"train_loss": -7.2832841873168945, "global_step": 208216, "epoch": 4957} {"train_loss": -7.208930969238281, "global_step": 208217, "epoch": 4957} {"train_loss": -7.164292335510254, "global_step": 208218, "epoch": 4957} {"train_loss": -7.311068534851074, "global_step": 208219, "epoch": 4957} {"train_loss": -7.121051788330078, "global_step": 208220, "epoch": 4957} {"train_loss": -7.278318405151367, "global_step": 208221, "epoch": 4957} {"train_loss": -7.296130657196045, "global_step": 208222, "epoch": 4957} {"train_loss": -7.153096675872803, "global_step": 208223, "epoch": 4957} {"train_loss": -7.375130653381348, "global_step": 208224, "epoch": 4957} {"train_loss": -7.3611369132995605, "global_step": 208225, "epoch": 4957} {"train_loss": -7.144709587097168, "global_step": 208226, "epoch": 4957} {"train_loss": -7.266629219055176, "global_step": 208227, "epoch": 4957} {"train_loss": -7.1763482093811035, "global_step": 208228, "epoch": 4957} {"train_loss": -7.069701194763184, "global_step": 208229, "epoch": 4957} {"train_loss": -7.346571445465088, "global_step": 208230, "epoch": 4957} {"train_loss": -7.327669143676758, "global_step": 208231, "epoch": 4957} {"train_loss": -7.316990852355957, "global_step": 208232, "epoch": 4957} {"train_loss": -7.460096836090088, "global_step": 208233, "epoch": 4957} {"train_loss": -7.298251628875732, "global_step": 208234, "epoch": 4957} {"train_loss": -7.273586148307437, "global_step": 208235, "epoch": 4957, "val_loss": 69999.984375} {"train_loss": -7.4218363761901855, "global_step": 208236, "epoch": 4958} {"train_loss": -7.429108619689941, "global_step": 208237, "epoch": 4958} {"train_loss": -7.316103935241699, "global_step": 208238, "epoch": 4958} {"train_loss": -7.241309642791748, "global_step": 208239, "epoch": 4958} {"train_loss": -7.340581893920898, "global_step": 208240, "epoch": 4958} {"train_loss": -7.509118556976318, "global_step": 208241, "epoch": 4958} {"train_loss": -7.352843761444092, "global_step": 208242, "epoch": 4958} {"train_loss": -7.437479019165039, "global_step": 208243, "epoch": 4958} {"train_loss": -7.361237049102783, "global_step": 208244, "epoch": 4958} {"train_loss": -7.501870155334473, "global_step": 208245, "epoch": 4958} {"train_loss": -7.408853530883789, "global_step": 208246, "epoch": 4958} {"train_loss": -7.33398962020874, "global_step": 208247, "epoch": 4958} {"train_loss": -7.416252136230469, "global_step": 208248, "epoch": 4958} {"train_loss": -7.453912734985352, "global_step": 208249, "epoch": 4958} {"train_loss": -7.385821342468262, "global_step": 208250, "epoch": 4958} {"train_loss": -7.369091033935547, "global_step": 208251, "epoch": 4958} {"train_loss": -7.429681777954102, "global_step": 208252, "epoch": 4958} {"train_loss": -7.293407917022705, "global_step": 208253, "epoch": 4958} {"train_loss": -7.4662017822265625, "global_step": 208254, "epoch": 4958} {"train_loss": -7.276730537414551, "global_step": 208255, "epoch": 4958} {"train_loss": -7.371489524841309, "global_step": 208256, "epoch": 4958} {"train_loss": -7.369218826293945, "global_step": 208257, "epoch": 4958} {"train_loss": -7.351897239685059, "global_step": 208258, "epoch": 4958} {"train_loss": -7.347226142883301, "global_step": 208259, "epoch": 4958} {"train_loss": -7.361035346984863, "global_step": 208260, "epoch": 4958} {"train_loss": -7.389955043792725, "global_step": 208261, "epoch": 4958} {"train_loss": -7.406327724456787, "global_step": 208262, "epoch": 4958} {"train_loss": -7.407429218292236, "global_step": 208263, "epoch": 4958} {"train_loss": -7.437638282775879, "global_step": 208264, "epoch": 4958} {"train_loss": -7.312799453735352, "global_step": 208265, "epoch": 4958} {"train_loss": -7.418341636657715, "global_step": 208266, "epoch": 4958} {"train_loss": -7.508268356323242, "global_step": 208267, "epoch": 4958} {"train_loss": -7.302946090698242, "global_step": 208268, "epoch": 4958} {"train_loss": -7.21358585357666, "global_step": 208269, "epoch": 4958} {"train_loss": -7.304145812988281, "global_step": 208270, "epoch": 4958} {"train_loss": -7.365938186645508, "global_step": 208271, "epoch": 4958} {"train_loss": -7.19647216796875, "global_step": 208272, "epoch": 4958} {"train_loss": -7.203301906585693, "global_step": 208273, "epoch": 4958} {"train_loss": -7.331404685974121, "global_step": 208274, "epoch": 4958} {"train_loss": -7.226415157318115, "global_step": 208275, "epoch": 4958} {"train_loss": -7.193264961242676, "global_step": 208276, "epoch": 4958} {"train_loss": -7.360450506210327, "global_step": 208277, "epoch": 4958, "val_loss": 70127.734375} {"train_loss": -7.244795799255371, "global_step": 208278, "epoch": 4959} {"train_loss": -7.288956642150879, "global_step": 208279, "epoch": 4959} {"train_loss": -7.260723114013672, "global_step": 208280, "epoch": 4959} {"train_loss": -7.177611351013184, "global_step": 208281, "epoch": 4959} {"train_loss": -7.4113898277282715, "global_step": 208282, "epoch": 4959} {"train_loss": -7.286538124084473, "global_step": 208283, "epoch": 4959} {"train_loss": -7.387749195098877, "global_step": 208284, "epoch": 4959} {"train_loss": -7.168337821960449, "global_step": 208285, "epoch": 4959} {"train_loss": -7.235298156738281, "global_step": 208286, "epoch": 4959} {"train_loss": -7.187704086303711, "global_step": 208287, "epoch": 4959} {"train_loss": -7.257061004638672, "global_step": 208288, "epoch": 4959} {"train_loss": -7.311290740966797, "global_step": 208289, "epoch": 4959} {"train_loss": -7.060549259185791, "global_step": 208290, "epoch": 4959} {"train_loss": -7.246386528015137, "global_step": 208291, "epoch": 4959} {"train_loss": -7.180431842803955, "global_step": 208292, "epoch": 4959} {"train_loss": -7.335508346557617, "global_step": 208293, "epoch": 4959} {"train_loss": -7.385886192321777, "global_step": 208294, "epoch": 4959} {"train_loss": -7.281744956970215, "global_step": 208295, "epoch": 4959} {"train_loss": -7.314963340759277, "global_step": 208296, "epoch": 4959} {"train_loss": -7.21456241607666, "global_step": 208297, "epoch": 4959} {"train_loss": -7.225003719329834, "global_step": 208298, "epoch": 4959} {"train_loss": -7.131837844848633, "global_step": 208299, "epoch": 4959} {"train_loss": -7.321169853210449, "global_step": 208300, "epoch": 4959} {"train_loss": -7.4051384925842285, "global_step": 208301, "epoch": 4959} {"train_loss": -7.217649459838867, "global_step": 208302, "epoch": 4959} {"train_loss": -7.384897232055664, "global_step": 208303, "epoch": 4959} {"train_loss": -7.263310432434082, "global_step": 208304, "epoch": 4959} {"train_loss": -7.34695291519165, "global_step": 208305, "epoch": 4959} {"train_loss": -7.232634544372559, "global_step": 208306, "epoch": 4959} {"train_loss": -7.27085542678833, "global_step": 208307, "epoch": 4959} {"train_loss": -7.366490840911865, "global_step": 208308, "epoch": 4959} {"train_loss": -7.2708892822265625, "global_step": 208309, "epoch": 4959} {"train_loss": -7.362512111663818, "global_step": 208310, "epoch": 4959} {"train_loss": -7.323763847351074, "global_step": 208311, "epoch": 4959} {"train_loss": -7.301610469818115, "global_step": 208312, "epoch": 4959} {"train_loss": -7.210930824279785, "global_step": 208313, "epoch": 4959} {"train_loss": -7.3500847816467285, "global_step": 208314, "epoch": 4959} {"train_loss": -7.311437606811523, "global_step": 208315, "epoch": 4959} {"train_loss": -7.253561973571777, "global_step": 208316, "epoch": 4959} {"train_loss": -7.291685581207275, "global_step": 208317, "epoch": 4959} {"train_loss": -7.40031623840332, "global_step": 208318, "epoch": 4959} {"train_loss": -7.280137936274211, "global_step": 208319, "epoch": 4959, "val_loss": 70037.5859375} {"train_loss": -7.360566139221191, "global_step": 208320, "epoch": 4960} {"train_loss": -7.339814186096191, "global_step": 208321, "epoch": 4960} {"train_loss": -7.402883052825928, "global_step": 208322, "epoch": 4960} {"train_loss": -7.294916152954102, "global_step": 208323, "epoch": 4960} {"train_loss": -7.420871734619141, "global_step": 208324, "epoch": 4960} {"train_loss": -7.430697441101074, "global_step": 208325, "epoch": 4960} {"train_loss": -7.461345195770264, "global_step": 208326, "epoch": 4960} {"train_loss": -7.397375106811523, "global_step": 208327, "epoch": 4960} {"train_loss": -7.323678016662598, "global_step": 208328, "epoch": 4960} {"train_loss": -7.441084861755371, "global_step": 208329, "epoch": 4960} {"train_loss": -7.460456848144531, "global_step": 208330, "epoch": 4960} {"train_loss": -7.460735321044922, "global_step": 208331, "epoch": 4960} {"train_loss": -7.5101423263549805, "global_step": 208332, "epoch": 4960} {"train_loss": -7.372402667999268, "global_step": 208333, "epoch": 4960} {"train_loss": -7.402692794799805, "global_step": 208334, "epoch": 4960} {"train_loss": -7.476602554321289, "global_step": 208335, "epoch": 4960} {"train_loss": -7.453805923461914, "global_step": 208336, "epoch": 4960} {"train_loss": -7.334765434265137, "global_step": 208337, "epoch": 4960} {"train_loss": -7.291750907897949, "global_step": 208338, "epoch": 4960} {"train_loss": -7.322810649871826, "global_step": 208339, "epoch": 4960} {"train_loss": -7.38458251953125, "global_step": 208340, "epoch": 4960} {"train_loss": -7.2798357009887695, "global_step": 208341, "epoch": 4960} {"train_loss": -7.438567638397217, "global_step": 208342, "epoch": 4960} {"train_loss": -7.267430305480957, "global_step": 208343, "epoch": 4960} {"train_loss": -7.300627708435059, "global_step": 208344, "epoch": 4960} {"train_loss": -7.265919208526611, "global_step": 208345, "epoch": 4960} {"train_loss": -7.225737571716309, "global_step": 208346, "epoch": 4960} {"train_loss": -7.3490777015686035, "global_step": 208347, "epoch": 4960} {"train_loss": -7.4242095947265625, "global_step": 208348, "epoch": 4960} {"train_loss": -7.238980293273926, "global_step": 208349, "epoch": 4960} {"train_loss": -7.150275707244873, "global_step": 208350, "epoch": 4960} {"train_loss": -7.246837615966797, "global_step": 208351, "epoch": 4960} {"train_loss": -7.202268123626709, "global_step": 208352, "epoch": 4960} {"train_loss": -7.203760147094727, "global_step": 208353, "epoch": 4960} {"train_loss": -7.374965667724609, "global_step": 208354, "epoch": 4960} {"train_loss": -7.238171100616455, "global_step": 208355, "epoch": 4960} {"train_loss": -7.322544097900391, "global_step": 208356, "epoch": 4960} {"train_loss": -7.214648246765137, "global_step": 208357, "epoch": 4960} {"train_loss": -7.199732303619385, "global_step": 208358, "epoch": 4960} {"train_loss": -7.189301490783691, "global_step": 208359, "epoch": 4960} {"train_loss": -7.265149116516113, "global_step": 208360, "epoch": 4960} {"train_loss": -7.330080316180275, "global_step": 208361, "epoch": 4960, "val_loss": 70124.6484375} {"train_loss": -7.272151947021484, "global_step": 208362, "epoch": 4961} {"train_loss": -7.282012939453125, "global_step": 208363, "epoch": 4961} {"train_loss": -7.244640350341797, "global_step": 208364, "epoch": 4961} {"train_loss": -7.269354820251465, "global_step": 208365, "epoch": 4961} {"train_loss": -7.283176422119141, "global_step": 208366, "epoch": 4961} {"train_loss": -7.294100284576416, "global_step": 208367, "epoch": 4961} {"train_loss": -7.259072780609131, "global_step": 208368, "epoch": 4961} {"train_loss": -7.361152172088623, "global_step": 208369, "epoch": 4961} {"train_loss": -7.252383232116699, "global_step": 208370, "epoch": 4961} {"train_loss": -7.357239723205566, "global_step": 208371, "epoch": 4961} {"train_loss": -7.289840221405029, "global_step": 208372, "epoch": 4961} {"train_loss": -7.249272346496582, "global_step": 208373, "epoch": 4961} {"train_loss": -7.268631935119629, "global_step": 208374, "epoch": 4961} {"train_loss": -7.263720512390137, "global_step": 208375, "epoch": 4961} {"train_loss": -7.254805564880371, "global_step": 208376, "epoch": 4961} {"train_loss": -7.416234970092773, "global_step": 208377, "epoch": 4961} {"train_loss": -7.390820026397705, "global_step": 208378, "epoch": 4961} {"train_loss": -7.284412860870361, "global_step": 208379, "epoch": 4961} {"train_loss": -7.399727821350098, "global_step": 208380, "epoch": 4961} {"train_loss": -7.353778839111328, "global_step": 208381, "epoch": 4961} {"train_loss": -7.25840950012207, "global_step": 208382, "epoch": 4961} {"train_loss": -7.445036888122559, "global_step": 208383, "epoch": 4961} {"train_loss": -7.288669586181641, "global_step": 208384, "epoch": 4961} {"train_loss": -7.367444038391113, "global_step": 208385, "epoch": 4961} {"train_loss": -7.344073295593262, "global_step": 208386, "epoch": 4961} {"train_loss": -7.253409385681152, "global_step": 208387, "epoch": 4961} {"train_loss": -7.348196029663086, "global_step": 208388, "epoch": 4961} {"train_loss": -7.199392318725586, "global_step": 208389, "epoch": 4961} {"train_loss": -7.240855693817139, "global_step": 208390, "epoch": 4961} {"train_loss": -7.375009059906006, "global_step": 208391, "epoch": 4961} {"train_loss": -7.342711925506592, "global_step": 208392, "epoch": 4961} {"train_loss": -7.277421951293945, "global_step": 208393, "epoch": 4961} {"train_loss": -7.384188652038574, "global_step": 208394, "epoch": 4961} {"train_loss": -7.334216117858887, "global_step": 208395, "epoch": 4961} {"train_loss": -7.299134254455566, "global_step": 208396, "epoch": 4961} {"train_loss": -7.234832763671875, "global_step": 208397, "epoch": 4961} {"train_loss": -7.399607181549072, "global_step": 208398, "epoch": 4961} {"train_loss": -7.271407604217529, "global_step": 208399, "epoch": 4961} {"train_loss": -7.404884338378906, "global_step": 208400, "epoch": 4961} {"train_loss": -7.235436916351318, "global_step": 208401, "epoch": 4961} {"train_loss": -7.270242214202881, "global_step": 208402, "epoch": 4961} {"train_loss": -7.3095573811304, "global_step": 208403, "epoch": 4961, "val_loss": 70088.9296875} {"train_loss": -7.298637390136719, "global_step": 208404, "epoch": 4962} {"train_loss": -7.135699272155762, "global_step": 208405, "epoch": 4962} {"train_loss": -7.410205841064453, "global_step": 208406, "epoch": 4962} {"train_loss": -7.21878719329834, "global_step": 208407, "epoch": 4962} {"train_loss": -7.311471939086914, "global_step": 208408, "epoch": 4962} {"train_loss": -7.337740898132324, "global_step": 208409, "epoch": 4962} {"train_loss": -7.387470245361328, "global_step": 208410, "epoch": 4962} {"train_loss": -7.386026859283447, "global_step": 208411, "epoch": 4962} {"train_loss": -7.415131568908691, "global_step": 208412, "epoch": 4962} {"train_loss": -7.31016731262207, "global_step": 208413, "epoch": 4962} {"train_loss": -7.349769592285156, "global_step": 208414, "epoch": 4962} {"train_loss": -7.416584014892578, "global_step": 208415, "epoch": 4962} {"train_loss": -7.391712665557861, "global_step": 208416, "epoch": 4962} {"train_loss": -7.252090930938721, "global_step": 208417, "epoch": 4962} {"train_loss": -7.455956935882568, "global_step": 208418, "epoch": 4962} {"train_loss": -7.387939929962158, "global_step": 208419, "epoch": 4962} {"train_loss": -7.349092960357666, "global_step": 208420, "epoch": 4962} {"train_loss": -7.344737529754639, "global_step": 208421, "epoch": 4962} {"train_loss": -7.322895050048828, "global_step": 208422, "epoch": 4962} {"train_loss": -7.359746932983398, "global_step": 208423, "epoch": 4962} {"train_loss": -7.2810139656066895, "global_step": 208424, "epoch": 4962} {"train_loss": -7.341828346252441, "global_step": 208425, "epoch": 4962} {"train_loss": -7.358799934387207, "global_step": 208426, "epoch": 4962} {"train_loss": -7.374218940734863, "global_step": 208427, "epoch": 4962} {"train_loss": -7.476990699768066, "global_step": 208428, "epoch": 4962} {"train_loss": -7.418426036834717, "global_step": 208429, "epoch": 4962} {"train_loss": -7.484077453613281, "global_step": 208430, "epoch": 4962} {"train_loss": -7.35988712310791, "global_step": 208431, "epoch": 4962} {"train_loss": -7.371675491333008, "global_step": 208432, "epoch": 4962} {"train_loss": -7.331748008728027, "global_step": 208433, "epoch": 4962} {"train_loss": -7.361797332763672, "global_step": 208434, "epoch": 4962} {"train_loss": -7.397260665893555, "global_step": 208435, "epoch": 4962} {"train_loss": -7.360342979431152, "global_step": 208436, "epoch": 4962} {"train_loss": -7.483227729797363, "global_step": 208437, "epoch": 4962} {"train_loss": -7.191864967346191, "global_step": 208438, "epoch": 4962} {"train_loss": -7.156874656677246, "global_step": 208439, "epoch": 4962} {"train_loss": -7.3786301612854, "global_step": 208440, "epoch": 4962} {"train_loss": -7.330686569213867, "global_step": 208441, "epoch": 4962} {"train_loss": -7.325423717498779, "global_step": 208442, "epoch": 4962} {"train_loss": -7.29013729095459, "global_step": 208443, "epoch": 4962} {"train_loss": -7.275001525878906, "global_step": 208444, "epoch": 4962} {"train_loss": -7.343702645528884, "global_step": 208445, "epoch": 4962, "val_loss": 70085.9921875} {"train_loss": -7.22750186920166, "global_step": 208446, "epoch": 4963} {"train_loss": -7.257535457611084, "global_step": 208447, "epoch": 4963} {"train_loss": -7.306949615478516, "global_step": 208448, "epoch": 4963} {"train_loss": -7.222593307495117, "global_step": 208449, "epoch": 4963} {"train_loss": -7.324757099151611, "global_step": 208450, "epoch": 4963} {"train_loss": -7.3466033935546875, "global_step": 208451, "epoch": 4963} {"train_loss": -7.2490692138671875, "global_step": 208452, "epoch": 4963} {"train_loss": -7.350079536437988, "global_step": 208453, "epoch": 4963} {"train_loss": -7.264009475708008, "global_step": 208454, "epoch": 4963} {"train_loss": -7.388441562652588, "global_step": 208455, "epoch": 4963} {"train_loss": -7.352529525756836, "global_step": 208456, "epoch": 4963} {"train_loss": -7.168053150177002, "global_step": 208457, "epoch": 4963} {"train_loss": -7.1849517822265625, "global_step": 208458, "epoch": 4963} {"train_loss": -7.259461879730225, "global_step": 208459, "epoch": 4963} {"train_loss": -7.2589263916015625, "global_step": 208460, "epoch": 4963} {"train_loss": -7.2363691329956055, "global_step": 208461, "epoch": 4963} {"train_loss": -7.2852373123168945, "global_step": 208462, "epoch": 4963} {"train_loss": -7.060184478759766, "global_step": 208463, "epoch": 4963} {"train_loss": -7.286445617675781, "global_step": 208464, "epoch": 4963} {"train_loss": -7.234485626220703, "global_step": 208465, "epoch": 4963} {"train_loss": -7.343656539916992, "global_step": 208466, "epoch": 4963} {"train_loss": -7.338942050933838, "global_step": 208467, "epoch": 4963} {"train_loss": -7.3557305335998535, "global_step": 208468, "epoch": 4963} {"train_loss": -7.291550636291504, "global_step": 208469, "epoch": 4963} {"train_loss": -7.380740165710449, "global_step": 208470, "epoch": 4963} {"train_loss": -7.353235721588135, "global_step": 208471, "epoch": 4963} {"train_loss": -7.4494709968566895, "global_step": 208472, "epoch": 4963} {"train_loss": -7.369555473327637, "global_step": 208473, "epoch": 4963} {"train_loss": -7.276002407073975, "global_step": 208474, "epoch": 4963} {"train_loss": -7.384640693664551, "global_step": 208475, "epoch": 4963} {"train_loss": -7.360987663269043, "global_step": 208476, "epoch": 4963} {"train_loss": -7.294284820556641, "global_step": 208477, "epoch": 4963} {"train_loss": -7.359984397888184, "global_step": 208478, "epoch": 4963} {"train_loss": -7.276338577270508, "global_step": 208479, "epoch": 4963} {"train_loss": -7.429879665374756, "global_step": 208480, "epoch": 4963} {"train_loss": -7.327208518981934, "global_step": 208481, "epoch": 4963} {"train_loss": -7.325157165527344, "global_step": 208482, "epoch": 4963} {"train_loss": -7.4297895431518555, "global_step": 208483, "epoch": 4963} {"train_loss": -7.427484035491943, "global_step": 208484, "epoch": 4963} {"train_loss": -7.357668876647949, "global_step": 208485, "epoch": 4963} {"train_loss": -7.361066818237305, "global_step": 208486, "epoch": 4963} {"train_loss": -7.312722069876535, "global_step": 208487, "epoch": 4963, "val_loss": 69897.125} {"train_loss": -7.3240227699279785, "global_step": 208488, "epoch": 4964} {"train_loss": -7.361087322235107, "global_step": 208489, "epoch": 4964} {"train_loss": -7.413865089416504, "global_step": 208490, "epoch": 4964} {"train_loss": -7.26167106628418, "global_step": 208491, "epoch": 4964} {"train_loss": -7.371424674987793, "global_step": 208492, "epoch": 4964} {"train_loss": -7.309589385986328, "global_step": 208493, "epoch": 4964} {"train_loss": -7.36794376373291, "global_step": 208494, "epoch": 4964} {"train_loss": -7.350131034851074, "global_step": 208495, "epoch": 4964} {"train_loss": -7.220933437347412, "global_step": 208496, "epoch": 4964} {"train_loss": -7.3318986892700195, "global_step": 208497, "epoch": 4964} {"train_loss": -7.302490234375, "global_step": 208498, "epoch": 4964} {"train_loss": -7.266684532165527, "global_step": 208499, "epoch": 4964} {"train_loss": -7.42115592956543, "global_step": 208500, "epoch": 4964} {"train_loss": -7.324437141418457, "global_step": 208501, "epoch": 4964} {"train_loss": -7.363506317138672, "global_step": 208502, "epoch": 4964} {"train_loss": -7.344306945800781, "global_step": 208503, "epoch": 4964} {"train_loss": -7.482813835144043, "global_step": 208504, "epoch": 4964} {"train_loss": -7.380927085876465, "global_step": 208505, "epoch": 4964} {"train_loss": -7.3316850662231445, "global_step": 208506, "epoch": 4964} {"train_loss": -7.353546142578125, "global_step": 208507, "epoch": 4964} {"train_loss": -7.396518230438232, "global_step": 208508, "epoch": 4964} {"train_loss": -7.400757789611816, "global_step": 208509, "epoch": 4964} {"train_loss": -7.445541858673096, "global_step": 208510, "epoch": 4964} {"train_loss": -7.357547760009766, "global_step": 208511, "epoch": 4964} {"train_loss": -7.400445938110352, "global_step": 208512, "epoch": 4964} {"train_loss": -7.424200057983398, "global_step": 208513, "epoch": 4964} {"train_loss": -7.4127302169799805, "global_step": 208514, "epoch": 4964} {"train_loss": -7.399804592132568, "global_step": 208515, "epoch": 4964} {"train_loss": -7.346954345703125, "global_step": 208516, "epoch": 4964} {"train_loss": -7.385260105133057, "global_step": 208517, "epoch": 4964} {"train_loss": -7.343441009521484, "global_step": 208518, "epoch": 4964} {"train_loss": -7.297823905944824, "global_step": 208519, "epoch": 4964} {"train_loss": -7.475378036499023, "global_step": 208520, "epoch": 4964} {"train_loss": -7.442465305328369, "global_step": 208521, "epoch": 4964} {"train_loss": -7.40501594543457, "global_step": 208522, "epoch": 4964} {"train_loss": -7.344216346740723, "global_step": 208523, "epoch": 4964} {"train_loss": -7.338029861450195, "global_step": 208524, "epoch": 4964} {"train_loss": -7.302597522735596, "global_step": 208525, "epoch": 4964} {"train_loss": -7.439653396606445, "global_step": 208526, "epoch": 4964} {"train_loss": -7.329439640045166, "global_step": 208527, "epoch": 4964} {"train_loss": -7.306623935699463, "global_step": 208528, "epoch": 4964} {"train_loss": -7.36371694292341, "global_step": 208529, "epoch": 4964, "val_loss": 69933.96875} {"train_loss": -7.33202600479126, "global_step": 208530, "epoch": 4965} {"train_loss": -7.263586521148682, "global_step": 208531, "epoch": 4965} {"train_loss": -7.376183032989502, "global_step": 208532, "epoch": 4965} {"train_loss": -7.351492404937744, "global_step": 208533, "epoch": 4965} {"train_loss": -7.195647239685059, "global_step": 208534, "epoch": 4965} {"train_loss": -7.251121520996094, "global_step": 208535, "epoch": 4965} {"train_loss": -7.20998477935791, "global_step": 208536, "epoch": 4965} {"train_loss": -7.133617877960205, "global_step": 208537, "epoch": 4965} {"train_loss": -7.239173889160156, "global_step": 208538, "epoch": 4965} {"train_loss": -7.3374857902526855, "global_step": 208539, "epoch": 4965} {"train_loss": -7.135638236999512, "global_step": 208540, "epoch": 4965} {"train_loss": -7.278982162475586, "global_step": 208541, "epoch": 4965} {"train_loss": -7.242084980010986, "global_step": 208542, "epoch": 4965} {"train_loss": -7.24211311340332, "global_step": 208543, "epoch": 4965} {"train_loss": -7.412637710571289, "global_step": 208544, "epoch": 4965} {"train_loss": -7.237854480743408, "global_step": 208545, "epoch": 4965} {"train_loss": -7.263113021850586, "global_step": 208546, "epoch": 4965} {"train_loss": -7.329697608947754, "global_step": 208547, "epoch": 4965} {"train_loss": -7.235102653503418, "global_step": 208548, "epoch": 4965} {"train_loss": -7.161638259887695, "global_step": 208549, "epoch": 4965} {"train_loss": -7.337857723236084, "global_step": 208550, "epoch": 4965} {"train_loss": -7.242856979370117, "global_step": 208551, "epoch": 4965} {"train_loss": -7.238393783569336, "global_step": 208552, "epoch": 4965} {"train_loss": -7.219377517700195, "global_step": 208553, "epoch": 4965} {"train_loss": -7.266526699066162, "global_step": 208554, "epoch": 4965} {"train_loss": -7.2228803634643555, "global_step": 208555, "epoch": 4965} {"train_loss": -7.1934967041015625, "global_step": 208556, "epoch": 4965} {"train_loss": -7.241542816162109, "global_step": 208557, "epoch": 4965} {"train_loss": -7.246225357055664, "global_step": 208558, "epoch": 4965} {"train_loss": -7.389520168304443, "global_step": 208559, "epoch": 4965} {"train_loss": -6.935282230377197, "global_step": 208560, "epoch": 4965} {"train_loss": -7.318927764892578, "global_step": 208561, "epoch": 4965} {"train_loss": -7.128396987915039, "global_step": 208562, "epoch": 4965} {"train_loss": -7.244340896606445, "global_step": 208563, "epoch": 4965} {"train_loss": -7.349984169006348, "global_step": 208564, "epoch": 4965} {"train_loss": -7.185652732849121, "global_step": 208565, "epoch": 4965} {"train_loss": -7.254389762878418, "global_step": 208566, "epoch": 4965} {"train_loss": -7.183706283569336, "global_step": 208567, "epoch": 4965} {"train_loss": -7.233921051025391, "global_step": 208568, "epoch": 4965} {"train_loss": -7.164477348327637, "global_step": 208569, "epoch": 4965} {"train_loss": -7.3299665451049805, "global_step": 208570, "epoch": 4965} {"train_loss": -7.246303013392857, "global_step": 208571, "epoch": 4965, "val_loss": 70145.03125} {"train_loss": -7.185430526733398, "global_step": 208572, "epoch": 4966} {"train_loss": -7.37761926651001, "global_step": 208573, "epoch": 4966} {"train_loss": -7.240475654602051, "global_step": 208574, "epoch": 4966} {"train_loss": -7.21605920791626, "global_step": 208575, "epoch": 4966} {"train_loss": -7.310276031494141, "global_step": 208576, "epoch": 4966} {"train_loss": -7.2826337814331055, "global_step": 208577, "epoch": 4966} {"train_loss": -7.313354015350342, "global_step": 208578, "epoch": 4966} {"train_loss": -7.421031951904297, "global_step": 208579, "epoch": 4966} {"train_loss": -7.23777437210083, "global_step": 208580, "epoch": 4966} {"train_loss": -7.394381999969482, "global_step": 208581, "epoch": 4966} {"train_loss": -7.3487138748168945, "global_step": 208582, "epoch": 4966} {"train_loss": -7.333512306213379, "global_step": 208583, "epoch": 4966} {"train_loss": -7.304666042327881, "global_step": 208584, "epoch": 4966} {"train_loss": -7.341897487640381, "global_step": 208585, "epoch": 4966} {"train_loss": -7.242696762084961, "global_step": 208586, "epoch": 4966} {"train_loss": -7.383293151855469, "global_step": 208587, "epoch": 4966} {"train_loss": -7.332144737243652, "global_step": 208588, "epoch": 4966} {"train_loss": -7.310898780822754, "global_step": 208589, "epoch": 4966} {"train_loss": -7.272353172302246, "global_step": 208590, "epoch": 4966} {"train_loss": -7.370121955871582, "global_step": 208591, "epoch": 4966} {"train_loss": -7.277172088623047, "global_step": 208592, "epoch": 4966} {"train_loss": -7.197890281677246, "global_step": 208593, "epoch": 4966} {"train_loss": -7.348936080932617, "global_step": 208594, "epoch": 4966} {"train_loss": -7.3927412033081055, "global_step": 208595, "epoch": 4966} {"train_loss": -7.150230407714844, "global_step": 208596, "epoch": 4966} {"train_loss": -7.283904075622559, "global_step": 208597, "epoch": 4966} {"train_loss": -7.316919326782227, "global_step": 208598, "epoch": 4966} {"train_loss": -7.42818546295166, "global_step": 208599, "epoch": 4966} {"train_loss": -7.245991230010986, "global_step": 208600, "epoch": 4966} {"train_loss": -7.392465591430664, "global_step": 208601, "epoch": 4966} {"train_loss": -7.346975803375244, "global_step": 208602, "epoch": 4966} {"train_loss": -7.368436336517334, "global_step": 208603, "epoch": 4966} {"train_loss": -7.418323516845703, "global_step": 208604, "epoch": 4966} {"train_loss": -7.3498854637146, "global_step": 208605, "epoch": 4966} {"train_loss": -7.35844612121582, "global_step": 208606, "epoch": 4966} {"train_loss": -7.290566444396973, "global_step": 208607, "epoch": 4966} {"train_loss": -7.4756879806518555, "global_step": 208608, "epoch": 4966} {"train_loss": -7.304265975952148, "global_step": 208609, "epoch": 4966} {"train_loss": -7.3502583503723145, "global_step": 208610, "epoch": 4966} {"train_loss": -7.464742183685303, "global_step": 208611, "epoch": 4966} {"train_loss": -7.383737564086914, "global_step": 208612, "epoch": 4966} {"train_loss": -7.328349476768857, "global_step": 208613, "epoch": 4966, "val_loss": 70051.453125} {"train_loss": -7.40612268447876, "global_step": 208614, "epoch": 4967} {"train_loss": -7.478682518005371, "global_step": 208615, "epoch": 4967} {"train_loss": -7.37625789642334, "global_step": 208616, "epoch": 4967} {"train_loss": -7.498143672943115, "global_step": 208617, "epoch": 4967} {"train_loss": -7.393501281738281, "global_step": 208618, "epoch": 4967} {"train_loss": -7.403590202331543, "global_step": 208619, "epoch": 4967} {"train_loss": -7.36630916595459, "global_step": 208620, "epoch": 4967} {"train_loss": -7.340297698974609, "global_step": 208621, "epoch": 4967} {"train_loss": -7.375235557556152, "global_step": 208622, "epoch": 4967} {"train_loss": -7.307553291320801, "global_step": 208623, "epoch": 4967} {"train_loss": -7.296636581420898, "global_step": 208624, "epoch": 4967} {"train_loss": -7.317603588104248, "global_step": 208625, "epoch": 4967} {"train_loss": -7.416876316070557, "global_step": 208626, "epoch": 4967} {"train_loss": -7.322830677032471, "global_step": 208627, "epoch": 4967} {"train_loss": -7.379887580871582, "global_step": 208628, "epoch": 4967} {"train_loss": -7.340405464172363, "global_step": 208629, "epoch": 4967} {"train_loss": -7.431607246398926, "global_step": 208630, "epoch": 4967} {"train_loss": -7.450816631317139, "global_step": 208631, "epoch": 4967} {"train_loss": -7.308598518371582, "global_step": 208632, "epoch": 4967} {"train_loss": -7.472231864929199, "global_step": 208633, "epoch": 4967} {"train_loss": -7.430994987487793, "global_step": 208634, "epoch": 4967} {"train_loss": -7.325443267822266, "global_step": 208635, "epoch": 4967} {"train_loss": -7.318911552429199, "global_step": 208636, "epoch": 4967} {"train_loss": -7.363370895385742, "global_step": 208637, "epoch": 4967} {"train_loss": -7.290116786956787, "global_step": 208638, "epoch": 4967} {"train_loss": -7.247448921203613, "global_step": 208639, "epoch": 4967} {"train_loss": -7.276298999786377, "global_step": 208640, "epoch": 4967} {"train_loss": -7.2731614112854, "global_step": 208641, "epoch": 4967} {"train_loss": -7.314235687255859, "global_step": 208642, "epoch": 4967} {"train_loss": -7.280149459838867, "global_step": 208643, "epoch": 4967} {"train_loss": -7.344759464263916, "global_step": 208644, "epoch": 4967} {"train_loss": -7.285958766937256, "global_step": 208645, "epoch": 4967} {"train_loss": -7.384653091430664, "global_step": 208646, "epoch": 4967} {"train_loss": -7.296750068664551, "global_step": 208647, "epoch": 4967} {"train_loss": -7.372126579284668, "global_step": 208648, "epoch": 4967} {"train_loss": -7.29766321182251, "global_step": 208649, "epoch": 4967} {"train_loss": -7.33682918548584, "global_step": 208650, "epoch": 4967} {"train_loss": -7.268834114074707, "global_step": 208651, "epoch": 4967} {"train_loss": -7.37205696105957, "global_step": 208652, "epoch": 4967} {"train_loss": -7.2598137855529785, "global_step": 208653, "epoch": 4967} {"train_loss": -7.38559627532959, "global_step": 208654, "epoch": 4967} {"train_loss": -7.3493411768050425, "global_step": 208655, "epoch": 4967, "val_loss": 70145.3046875} {"train_loss": -7.351742267608643, "global_step": 208656, "epoch": 4968} {"train_loss": -7.385684967041016, "global_step": 208657, "epoch": 4968} {"train_loss": -7.289441108703613, "global_step": 208658, "epoch": 4968} {"train_loss": -7.376626491546631, "global_step": 208659, "epoch": 4968} {"train_loss": -7.412337303161621, "global_step": 208660, "epoch": 4968} {"train_loss": -7.2213592529296875, "global_step": 208661, "epoch": 4968} {"train_loss": -7.364766597747803, "global_step": 208662, "epoch": 4968} {"train_loss": -7.3206939697265625, "global_step": 208663, "epoch": 4968} {"train_loss": -7.370955467224121, "global_step": 208664, "epoch": 4968} {"train_loss": -7.436756610870361, "global_step": 208665, "epoch": 4968} {"train_loss": -7.365238189697266, "global_step": 208666, "epoch": 4968} {"train_loss": -7.445216655731201, "global_step": 208667, "epoch": 4968} {"train_loss": -7.445735931396484, "global_step": 208668, "epoch": 4968} {"train_loss": -7.362030029296875, "global_step": 208669, "epoch": 4968} {"train_loss": -7.322869300842285, "global_step": 208670, "epoch": 4968} {"train_loss": -7.380134105682373, "global_step": 208671, "epoch": 4968} {"train_loss": -7.442437171936035, "global_step": 208672, "epoch": 4968} {"train_loss": -7.319094657897949, "global_step": 208673, "epoch": 4968} {"train_loss": -7.234206676483154, "global_step": 208674, "epoch": 4968} {"train_loss": -7.3628129959106445, "global_step": 208675, "epoch": 4968} {"train_loss": -7.361839294433594, "global_step": 208676, "epoch": 4968} {"train_loss": -7.3078765869140625, "global_step": 208677, "epoch": 4968} {"train_loss": -7.436662673950195, "global_step": 208678, "epoch": 4968} {"train_loss": -7.402256011962891, "global_step": 208679, "epoch": 4968} {"train_loss": -7.246183395385742, "global_step": 208680, "epoch": 4968} {"train_loss": -7.3106160163879395, "global_step": 208681, "epoch": 4968} {"train_loss": -7.4172821044921875, "global_step": 208682, "epoch": 4968} {"train_loss": -7.27225399017334, "global_step": 208683, "epoch": 4968} {"train_loss": -7.2850542068481445, "global_step": 208684, "epoch": 4968} {"train_loss": -7.21922492980957, "global_step": 208685, "epoch": 4968} {"train_loss": -7.328641891479492, "global_step": 208686, "epoch": 4968} {"train_loss": -7.378170490264893, "global_step": 208687, "epoch": 4968} {"train_loss": -7.245237350463867, "global_step": 208688, "epoch": 4968} {"train_loss": -7.377770900726318, "global_step": 208689, "epoch": 4968} {"train_loss": -7.3274078369140625, "global_step": 208690, "epoch": 4968} {"train_loss": -7.220036506652832, "global_step": 208691, "epoch": 4968} {"train_loss": -7.318221092224121, "global_step": 208692, "epoch": 4968} {"train_loss": -7.296734809875488, "global_step": 208693, "epoch": 4968} {"train_loss": -7.199335098266602, "global_step": 208694, "epoch": 4968} {"train_loss": -7.321956634521484, "global_step": 208695, "epoch": 4968} {"train_loss": -7.272738456726074, "global_step": 208696, "epoch": 4968} {"train_loss": -7.334921087537493, "global_step": 208697, "epoch": 4968, "val_loss": 70008.2890625} {"train_loss": -7.205724239349365, "global_step": 208698, "epoch": 4969} {"train_loss": -7.19285774230957, "global_step": 208699, "epoch": 4969} {"train_loss": -7.279854774475098, "global_step": 208700, "epoch": 4969} {"train_loss": -7.355535507202148, "global_step": 208701, "epoch": 4969} {"train_loss": -7.237824440002441, "global_step": 208702, "epoch": 4969} {"train_loss": -7.342748641967773, "global_step": 208703, "epoch": 4969} {"train_loss": -7.199658393859863, "global_step": 208704, "epoch": 4969} {"train_loss": -7.311728477478027, "global_step": 208705, "epoch": 4969} {"train_loss": -7.287057876586914, "global_step": 208706, "epoch": 4969} {"train_loss": -7.428023338317871, "global_step": 208707, "epoch": 4969} {"train_loss": -7.318937301635742, "global_step": 208708, "epoch": 4969} {"train_loss": -7.361419677734375, "global_step": 208709, "epoch": 4969} {"train_loss": -7.322750568389893, "global_step": 208710, "epoch": 4969} {"train_loss": -7.456270694732666, "global_step": 208711, "epoch": 4969} {"train_loss": -7.443545341491699, "global_step": 208712, "epoch": 4969} {"train_loss": -7.364175796508789, "global_step": 208713, "epoch": 4969} {"train_loss": -7.389923572540283, "global_step": 208714, "epoch": 4969} {"train_loss": -7.442817687988281, "global_step": 208715, "epoch": 4969} {"train_loss": -7.464554786682129, "global_step": 208716, "epoch": 4969} {"train_loss": -7.284914970397949, "global_step": 208717, "epoch": 4969} {"train_loss": -7.453530788421631, "global_step": 208718, "epoch": 4969} {"train_loss": -7.4153265953063965, "global_step": 208719, "epoch": 4969} {"train_loss": -7.354794502258301, "global_step": 208720, "epoch": 4969} {"train_loss": -7.395758152008057, "global_step": 208721, "epoch": 4969} {"train_loss": -7.377675533294678, "global_step": 208722, "epoch": 4969} {"train_loss": -7.301167964935303, "global_step": 208723, "epoch": 4969} {"train_loss": -7.4383745193481445, "global_step": 208724, "epoch": 4969} {"train_loss": -7.408596992492676, "global_step": 208725, "epoch": 4969} {"train_loss": -7.338820457458496, "global_step": 208726, "epoch": 4969} {"train_loss": -7.416013240814209, "global_step": 208727, "epoch": 4969} {"train_loss": -7.419628620147705, "global_step": 208728, "epoch": 4969} {"train_loss": -7.251554489135742, "global_step": 208729, "epoch": 4969} {"train_loss": -7.327023506164551, "global_step": 208730, "epoch": 4969} {"train_loss": -7.328679084777832, "global_step": 208731, "epoch": 4969} {"train_loss": -7.3428521156311035, "global_step": 208732, "epoch": 4969} {"train_loss": -7.222097396850586, "global_step": 208733, "epoch": 4969} {"train_loss": -7.282169818878174, "global_step": 208734, "epoch": 4969} {"train_loss": -7.360194206237793, "global_step": 208735, "epoch": 4969} {"train_loss": -7.234305381774902, "global_step": 208736, "epoch": 4969} {"train_loss": -7.308724880218506, "global_step": 208737, "epoch": 4969} {"train_loss": -7.329513072967529, "global_step": 208738, "epoch": 4969} {"train_loss": -7.339214143298921, "global_step": 208739, "epoch": 4969, "val_loss": 69983.6171875} {"train_loss": -7.235313415527344, "global_step": 208740, "epoch": 4970} {"train_loss": -7.409503936767578, "global_step": 208741, "epoch": 4970} {"train_loss": -7.144131183624268, "global_step": 208742, "epoch": 4970} {"train_loss": -7.226783275604248, "global_step": 208743, "epoch": 4970} {"train_loss": -7.237792491912842, "global_step": 208744, "epoch": 4970} {"train_loss": -7.302242279052734, "global_step": 208745, "epoch": 4970} {"train_loss": -7.305110454559326, "global_step": 208746, "epoch": 4970} {"train_loss": -7.277157306671143, "global_step": 208747, "epoch": 4970} {"train_loss": -7.28841495513916, "global_step": 208748, "epoch": 4970} {"train_loss": -7.308679580688477, "global_step": 208749, "epoch": 4970} {"train_loss": -7.3767595291137695, "global_step": 208750, "epoch": 4970} {"train_loss": -7.354969024658203, "global_step": 208751, "epoch": 4970} {"train_loss": -7.355966567993164, "global_step": 208752, "epoch": 4970} {"train_loss": -7.401113033294678, "global_step": 208753, "epoch": 4970} {"train_loss": -7.414572715759277, "global_step": 208754, "epoch": 4970} {"train_loss": -7.363690376281738, "global_step": 208755, "epoch": 4970} {"train_loss": -7.313758850097656, "global_step": 208756, "epoch": 4970} {"train_loss": -7.287346839904785, "global_step": 208757, "epoch": 4970} {"train_loss": -7.387812614440918, "global_step": 208758, "epoch": 4970} {"train_loss": -7.277279853820801, "global_step": 208759, "epoch": 4970} {"train_loss": -7.34796142578125, "global_step": 208760, "epoch": 4970} {"train_loss": -7.477517604827881, "global_step": 208761, "epoch": 4970} {"train_loss": -7.3863525390625, "global_step": 208762, "epoch": 4970} {"train_loss": -7.512940406799316, "global_step": 208763, "epoch": 4970} {"train_loss": -7.450571060180664, "global_step": 208764, "epoch": 4970} {"train_loss": -7.375247001647949, "global_step": 208765, "epoch": 4970} {"train_loss": -7.454403877258301, "global_step": 208766, "epoch": 4970} {"train_loss": -7.453207969665527, "global_step": 208767, "epoch": 4970} {"train_loss": -7.304283142089844, "global_step": 208768, "epoch": 4970} {"train_loss": -7.283984184265137, "global_step": 208769, "epoch": 4970} {"train_loss": -7.427536487579346, "global_step": 208770, "epoch": 4970} {"train_loss": -7.34165096282959, "global_step": 208771, "epoch": 4970} {"train_loss": -7.191429138183594, "global_step": 208772, "epoch": 4970} {"train_loss": -7.26381778717041, "global_step": 208773, "epoch": 4970} {"train_loss": -7.358989715576172, "global_step": 208774, "epoch": 4970} {"train_loss": -7.207468032836914, "global_step": 208775, "epoch": 4970} {"train_loss": -7.226134777069092, "global_step": 208776, "epoch": 4970} {"train_loss": -7.3655619621276855, "global_step": 208777, "epoch": 4970} {"train_loss": -7.216622352600098, "global_step": 208778, "epoch": 4970} {"train_loss": -7.224880218505859, "global_step": 208779, "epoch": 4970} {"train_loss": -7.311168670654297, "global_step": 208780, "epoch": 4970} {"train_loss": -7.326957668576922, "global_step": 208781, "epoch": 4970, "val_loss": 70028.8203125} {"train_loss": -7.256772041320801, "global_step": 208782, "epoch": 4971} {"train_loss": -7.363169193267822, "global_step": 208783, "epoch": 4971} {"train_loss": -7.232316493988037, "global_step": 208784, "epoch": 4971} {"train_loss": -7.376379013061523, "global_step": 208785, "epoch": 4971} {"train_loss": -7.371042251586914, "global_step": 208786, "epoch": 4971} {"train_loss": -7.3922529220581055, "global_step": 208787, "epoch": 4971} {"train_loss": -7.447041034698486, "global_step": 208788, "epoch": 4971} {"train_loss": -7.344970703125, "global_step": 208789, "epoch": 4971} {"train_loss": -7.376289367675781, "global_step": 208790, "epoch": 4971} {"train_loss": -7.412140369415283, "global_step": 208791, "epoch": 4971} {"train_loss": -7.233769416809082, "global_step": 208792, "epoch": 4971} {"train_loss": -7.302398204803467, "global_step": 208793, "epoch": 4971} {"train_loss": -7.345456123352051, "global_step": 208794, "epoch": 4971} {"train_loss": -7.302272796630859, "global_step": 208795, "epoch": 4971} {"train_loss": -7.339394569396973, "global_step": 208796, "epoch": 4971} {"train_loss": -7.404575347900391, "global_step": 208797, "epoch": 4971} {"train_loss": -7.313865661621094, "global_step": 208798, "epoch": 4971} {"train_loss": -7.328730583190918, "global_step": 208799, "epoch": 4971} {"train_loss": -7.375278472900391, "global_step": 208800, "epoch": 4971} {"train_loss": -7.5162458419799805, "global_step": 208801, "epoch": 4971} {"train_loss": -7.446249485015869, "global_step": 208802, "epoch": 4971} {"train_loss": -7.318768501281738, "global_step": 208803, "epoch": 4971} {"train_loss": -7.35484504699707, "global_step": 208804, "epoch": 4971} {"train_loss": -7.195990562438965, "global_step": 208805, "epoch": 4971} {"train_loss": -7.40399169921875, "global_step": 208806, "epoch": 4971} {"train_loss": -7.241727352142334, "global_step": 208807, "epoch": 4971} {"train_loss": -7.345183372497559, "global_step": 208808, "epoch": 4971} {"train_loss": -7.178397178649902, "global_step": 208809, "epoch": 4971} {"train_loss": -7.216594696044922, "global_step": 208810, "epoch": 4971} {"train_loss": -7.339451789855957, "global_step": 208811, "epoch": 4971} {"train_loss": -7.31123161315918, "global_step": 208812, "epoch": 4971} {"train_loss": -7.220615386962891, "global_step": 208813, "epoch": 4971} {"train_loss": -7.220744609832764, "global_step": 208814, "epoch": 4971} {"train_loss": -7.298581123352051, "global_step": 208815, "epoch": 4971} {"train_loss": -7.229292869567871, "global_step": 208816, "epoch": 4971} {"train_loss": -7.161899566650391, "global_step": 208817, "epoch": 4971} {"train_loss": -7.1846418380737305, "global_step": 208818, "epoch": 4971} {"train_loss": -7.400177955627441, "global_step": 208819, "epoch": 4971} {"train_loss": -7.190582752227783, "global_step": 208820, "epoch": 4971} {"train_loss": -7.318578720092773, "global_step": 208821, "epoch": 4971} {"train_loss": -7.2336883544921875, "global_step": 208822, "epoch": 4971} {"train_loss": -7.314430634180705, "global_step": 208823, "epoch": 4971, "val_loss": 70108.71875} {"train_loss": -7.312564373016357, "global_step": 208824, "epoch": 4972} {"train_loss": -7.4079437255859375, "global_step": 208825, "epoch": 4972} {"train_loss": -7.280884742736816, "global_step": 208826, "epoch": 4972} {"train_loss": -7.353837013244629, "global_step": 208827, "epoch": 4972} {"train_loss": -7.415292739868164, "global_step": 208828, "epoch": 4972} {"train_loss": -7.292313575744629, "global_step": 208829, "epoch": 4972} {"train_loss": -7.267172813415527, "global_step": 208830, "epoch": 4972} {"train_loss": -7.32764196395874, "global_step": 208831, "epoch": 4972} {"train_loss": -7.460338592529297, "global_step": 208832, "epoch": 4972} {"train_loss": -7.31989860534668, "global_step": 208833, "epoch": 4972} {"train_loss": -7.3513593673706055, "global_step": 208834, "epoch": 4972} {"train_loss": -7.243819713592529, "global_step": 208835, "epoch": 4972} {"train_loss": -7.301609039306641, "global_step": 208836, "epoch": 4972} {"train_loss": -7.243044853210449, "global_step": 208837, "epoch": 4972} {"train_loss": -7.381741046905518, "global_step": 208838, "epoch": 4972} {"train_loss": -7.327248573303223, "global_step": 208839, "epoch": 4972} {"train_loss": -7.251330375671387, "global_step": 208840, "epoch": 4972} {"train_loss": -7.335178375244141, "global_step": 208841, "epoch": 4972} {"train_loss": -7.286166191101074, "global_step": 208842, "epoch": 4972} {"train_loss": -7.349663734436035, "global_step": 208843, "epoch": 4972} {"train_loss": -7.266168594360352, "global_step": 208844, "epoch": 4972} {"train_loss": -7.414638519287109, "global_step": 208845, "epoch": 4972} {"train_loss": -7.432126998901367, "global_step": 208846, "epoch": 4972} {"train_loss": -7.466296195983887, "global_step": 208847, "epoch": 4972} {"train_loss": -7.335536956787109, "global_step": 208848, "epoch": 4972} {"train_loss": -7.31712532043457, "global_step": 208849, "epoch": 4972} {"train_loss": -7.383322715759277, "global_step": 208850, "epoch": 4972} {"train_loss": -7.33489465713501, "global_step": 208851, "epoch": 4972} {"train_loss": -7.302502632141113, "global_step": 208852, "epoch": 4972} {"train_loss": -7.339694976806641, "global_step": 208853, "epoch": 4972} {"train_loss": -7.33708381652832, "global_step": 208854, "epoch": 4972} {"train_loss": -7.276009559631348, "global_step": 208855, "epoch": 4972} {"train_loss": -7.222863674163818, "global_step": 208856, "epoch": 4972} {"train_loss": -7.381296157836914, "global_step": 208857, "epoch": 4972} {"train_loss": -7.166571617126465, "global_step": 208858, "epoch": 4972} {"train_loss": -7.2025651931762695, "global_step": 208859, "epoch": 4972} {"train_loss": -7.24014949798584, "global_step": 208860, "epoch": 4972} {"train_loss": -7.066649913787842, "global_step": 208861, "epoch": 4972} {"train_loss": -7.260171890258789, "global_step": 208862, "epoch": 4972} {"train_loss": -7.038928985595703, "global_step": 208863, "epoch": 4972} {"train_loss": -7.307862281799316, "global_step": 208864, "epoch": 4972} {"train_loss": -7.303580193292527, "global_step": 208865, "epoch": 4972, "val_loss": 69988.546875} {"train_loss": -7.121657848358154, "global_step": 208866, "epoch": 4973} {"train_loss": -7.332566738128662, "global_step": 208867, "epoch": 4973} {"train_loss": -7.005688667297363, "global_step": 208868, "epoch": 4973} {"train_loss": -7.311729431152344, "global_step": 208869, "epoch": 4973} {"train_loss": -7.010190486907959, "global_step": 208870, "epoch": 4973} {"train_loss": -7.429169178009033, "global_step": 208871, "epoch": 4973} {"train_loss": -6.852145195007324, "global_step": 208872, "epoch": 4973} {"train_loss": -7.303571701049805, "global_step": 208873, "epoch": 4973} {"train_loss": -7.034836769104004, "global_step": 208874, "epoch": 4973} {"train_loss": -7.096273899078369, "global_step": 208875, "epoch": 4973} {"train_loss": -7.069103240966797, "global_step": 208876, "epoch": 4973} {"train_loss": -7.208437919616699, "global_step": 208877, "epoch": 4973} {"train_loss": -7.173011779785156, "global_step": 208878, "epoch": 4973} {"train_loss": -7.195483207702637, "global_step": 208879, "epoch": 4973} {"train_loss": -7.221920013427734, "global_step": 208880, "epoch": 4973} {"train_loss": -7.221249580383301, "global_step": 208881, "epoch": 4973} {"train_loss": -7.296270370483398, "global_step": 208882, "epoch": 4973} {"train_loss": -7.26278018951416, "global_step": 208883, "epoch": 4973} {"train_loss": -7.330258846282959, "global_step": 208884, "epoch": 4973} {"train_loss": -7.262360095977783, "global_step": 208885, "epoch": 4973} {"train_loss": -7.294198989868164, "global_step": 208886, "epoch": 4973} {"train_loss": -7.309133529663086, "global_step": 208887, "epoch": 4973} {"train_loss": -7.346920967102051, "global_step": 208888, "epoch": 4973} {"train_loss": -7.249217987060547, "global_step": 208889, "epoch": 4973} {"train_loss": -7.367712020874023, "global_step": 208890, "epoch": 4973} {"train_loss": -7.331597805023193, "global_step": 208891, "epoch": 4973} {"train_loss": -7.314435005187988, "global_step": 208892, "epoch": 4973} {"train_loss": -7.38129997253418, "global_step": 208893, "epoch": 4973} {"train_loss": -7.225022315979004, "global_step": 208894, "epoch": 4973} {"train_loss": -7.277400493621826, "global_step": 208895, "epoch": 4973} {"train_loss": -7.369862079620361, "global_step": 208896, "epoch": 4973} {"train_loss": -7.288247108459473, "global_step": 208897, "epoch": 4973} {"train_loss": -7.330060005187988, "global_step": 208898, "epoch": 4973} {"train_loss": -7.289938926696777, "global_step": 208899, "epoch": 4973} {"train_loss": -7.375312805175781, "global_step": 208900, "epoch": 4973} {"train_loss": -7.302884578704834, "global_step": 208901, "epoch": 4973} {"train_loss": -7.264404296875, "global_step": 208902, "epoch": 4973} {"train_loss": -7.306682109832764, "global_step": 208903, "epoch": 4973} {"train_loss": -7.279586315155029, "global_step": 208904, "epoch": 4973} {"train_loss": -7.294918060302734, "global_step": 208905, "epoch": 4973} {"train_loss": -7.346209526062012, "global_step": 208906, "epoch": 4973} {"train_loss": -7.253089303062076, "global_step": 208907, "epoch": 4973, "val_loss": 69874.078125} {"train_loss": -7.334352016448975, "global_step": 208908, "epoch": 4974} {"train_loss": -7.489282131195068, "global_step": 208909, "epoch": 4974} {"train_loss": -7.377128601074219, "global_step": 208910, "epoch": 4974} {"train_loss": -7.389659404754639, "global_step": 208911, "epoch": 4974} {"train_loss": -7.393225193023682, "global_step": 208912, "epoch": 4974} {"train_loss": -7.390311241149902, "global_step": 208913, "epoch": 4974} {"train_loss": -7.3809590339660645, "global_step": 208914, "epoch": 4974} {"train_loss": -7.320643424987793, "global_step": 208915, "epoch": 4974} {"train_loss": -7.363611221313477, "global_step": 208916, "epoch": 4974} {"train_loss": -7.451536178588867, "global_step": 208917, "epoch": 4974} {"train_loss": -7.354304313659668, "global_step": 208918, "epoch": 4974} {"train_loss": -7.502881050109863, "global_step": 208919, "epoch": 4974} {"train_loss": -7.385689735412598, "global_step": 208920, "epoch": 4974} {"train_loss": -7.28607177734375, "global_step": 208921, "epoch": 4974} {"train_loss": -7.31711483001709, "global_step": 208922, "epoch": 4974} {"train_loss": -7.375531196594238, "global_step": 208923, "epoch": 4974} {"train_loss": -7.4141459465026855, "global_step": 208924, "epoch": 4974} {"train_loss": -7.314727783203125, "global_step": 208925, "epoch": 4974} {"train_loss": -7.313859462738037, "global_step": 208926, "epoch": 4974} {"train_loss": -7.448927879333496, "global_step": 208927, "epoch": 4974} {"train_loss": -7.37394905090332, "global_step": 208928, "epoch": 4974} {"train_loss": -7.310042381286621, "global_step": 208929, "epoch": 4974} {"train_loss": -7.469557285308838, "global_step": 208930, "epoch": 4974} {"train_loss": -7.42428731918335, "global_step": 208931, "epoch": 4974} {"train_loss": -7.405645370483398, "global_step": 208932, "epoch": 4974} {"train_loss": -7.363463401794434, "global_step": 208933, "epoch": 4974} {"train_loss": -7.346119403839111, "global_step": 208934, "epoch": 4974} {"train_loss": -7.463345527648926, "global_step": 208935, "epoch": 4974} {"train_loss": -7.467157363891602, "global_step": 208936, "epoch": 4974} {"train_loss": -7.133169651031494, "global_step": 208937, "epoch": 4974} {"train_loss": -7.276213645935059, "global_step": 208938, "epoch": 4974} {"train_loss": -7.351755619049072, "global_step": 208939, "epoch": 4974} {"train_loss": -7.279218673706055, "global_step": 208940, "epoch": 4974} {"train_loss": -7.324641704559326, "global_step": 208941, "epoch": 4974} {"train_loss": -7.210258483886719, "global_step": 208942, "epoch": 4974} {"train_loss": -7.40565824508667, "global_step": 208943, "epoch": 4974} {"train_loss": -7.355739593505859, "global_step": 208944, "epoch": 4974} {"train_loss": -7.219244480133057, "global_step": 208945, "epoch": 4974} {"train_loss": -7.319492340087891, "global_step": 208946, "epoch": 4974} {"train_loss": -7.364387512207031, "global_step": 208947, "epoch": 4974} {"train_loss": -7.302431106567383, "global_step": 208948, "epoch": 4974} {"train_loss": -7.357976799919491, "global_step": 208949, "epoch": 4974, "val_loss": 70078.7109375} {"train_loss": -7.293793201446533, "global_step": 208950, "epoch": 4975} {"train_loss": -7.278908729553223, "global_step": 208951, "epoch": 4975} {"train_loss": -7.288273811340332, "global_step": 208952, "epoch": 4975} {"train_loss": -7.191317081451416, "global_step": 208953, "epoch": 4975} {"train_loss": -7.246290683746338, "global_step": 208954, "epoch": 4975} {"train_loss": -7.225611686706543, "global_step": 208955, "epoch": 4975} {"train_loss": -7.1174235343933105, "global_step": 208956, "epoch": 4975} {"train_loss": -7.151975154876709, "global_step": 208957, "epoch": 4975} {"train_loss": -7.183962345123291, "global_step": 208958, "epoch": 4975} {"train_loss": -6.996832847595215, "global_step": 208959, "epoch": 4975} {"train_loss": -7.237673759460449, "global_step": 208960, "epoch": 4975} {"train_loss": -7.083990097045898, "global_step": 208961, "epoch": 4975} {"train_loss": -7.117576599121094, "global_step": 208962, "epoch": 4975} {"train_loss": -7.052221298217773, "global_step": 208963, "epoch": 4975} {"train_loss": -7.187719345092773, "global_step": 208964, "epoch": 4975} {"train_loss": -7.040538787841797, "global_step": 208965, "epoch": 4975} {"train_loss": -7.144846439361572, "global_step": 208966, "epoch": 4975} {"train_loss": -7.166624546051025, "global_step": 208967, "epoch": 4975} {"train_loss": -7.097118377685547, "global_step": 208968, "epoch": 4975} {"train_loss": -7.219512462615967, "global_step": 208969, "epoch": 4975} {"train_loss": -7.201053619384766, "global_step": 208970, "epoch": 4975} {"train_loss": -7.214544773101807, "global_step": 208971, "epoch": 4975} {"train_loss": -7.177359104156494, "global_step": 208972, "epoch": 4975} {"train_loss": -7.213764190673828, "global_step": 208973, "epoch": 4975} {"train_loss": -7.318015098571777, "global_step": 208974, "epoch": 4975} {"train_loss": -7.30369758605957, "global_step": 208975, "epoch": 4975} {"train_loss": -7.162430286407471, "global_step": 208976, "epoch": 4975} {"train_loss": -7.395967483520508, "global_step": 208977, "epoch": 4975} {"train_loss": -7.25522518157959, "global_step": 208978, "epoch": 4975} {"train_loss": -7.166721343994141, "global_step": 208979, "epoch": 4975} {"train_loss": -7.320623397827148, "global_step": 208980, "epoch": 4975} {"train_loss": -7.194892883300781, "global_step": 208981, "epoch": 4975} {"train_loss": -7.330684185028076, "global_step": 208982, "epoch": 4975} {"train_loss": -7.274114608764648, "global_step": 208983, "epoch": 4975} {"train_loss": -7.244773864746094, "global_step": 208984, "epoch": 4975} {"train_loss": -7.254228591918945, "global_step": 208985, "epoch": 4975} {"train_loss": -7.346488952636719, "global_step": 208986, "epoch": 4975} {"train_loss": -7.350776195526123, "global_step": 208987, "epoch": 4975} {"train_loss": -7.3040056228637695, "global_step": 208988, "epoch": 4975} {"train_loss": -7.264589309692383, "global_step": 208989, "epoch": 4975} {"train_loss": -7.330028533935547, "global_step": 208990, "epoch": 4975} {"train_loss": -7.219509249641781, "global_step": 208991, "epoch": 4975, "val_loss": 69979.328125} {"train_loss": -7.251426696777344, "global_step": 208992, "epoch": 4976} {"train_loss": -7.358156204223633, "global_step": 208993, "epoch": 4976} {"train_loss": -7.257824897766113, "global_step": 208994, "epoch": 4976} {"train_loss": -7.367412090301514, "global_step": 208995, "epoch": 4976} {"train_loss": -7.360342979431152, "global_step": 208996, "epoch": 4976} {"train_loss": -7.385293960571289, "global_step": 208997, "epoch": 4976} {"train_loss": -7.367570400238037, "global_step": 208998, "epoch": 4976} {"train_loss": -7.3403472900390625, "global_step": 208999, "epoch": 4976} {"train_loss": -7.351612567901611, "global_step": 209000, "epoch": 4976} {"train_loss": -7.4040093421936035, "global_step": 209001, "epoch": 4976} {"train_loss": -7.415351867675781, "global_step": 209002, "epoch": 4976} {"train_loss": -7.446159362792969, "global_step": 209003, "epoch": 4976} {"train_loss": -7.301738739013672, "global_step": 209004, "epoch": 4976} {"train_loss": -7.326687812805176, "global_step": 209005, "epoch": 4976} {"train_loss": -7.401559829711914, "global_step": 209006, "epoch": 4976} {"train_loss": -7.311188697814941, "global_step": 209007, "epoch": 4976} {"train_loss": -7.369863033294678, "global_step": 209008, "epoch": 4976} {"train_loss": -7.330866813659668, "global_step": 209009, "epoch": 4976} {"train_loss": -7.414370059967041, "global_step": 209010, "epoch": 4976} {"train_loss": -7.498008728027344, "global_step": 209011, "epoch": 4976} {"train_loss": -7.358127117156982, "global_step": 209012, "epoch": 4976} {"train_loss": -7.312135696411133, "global_step": 209013, "epoch": 4976} {"train_loss": -7.324735641479492, "global_step": 209014, "epoch": 4976} {"train_loss": -7.379936218261719, "global_step": 209015, "epoch": 4976} {"train_loss": -7.1755781173706055, "global_step": 209016, "epoch": 4976} {"train_loss": -7.369309902191162, "global_step": 209017, "epoch": 4976} {"train_loss": -7.34483003616333, "global_step": 209018, "epoch": 4976} {"train_loss": -7.238162994384766, "global_step": 209019, "epoch": 4976} {"train_loss": -7.3432722091674805, "global_step": 209020, "epoch": 4976} {"train_loss": -7.285243511199951, "global_step": 209021, "epoch": 4976} {"train_loss": -7.363722801208496, "global_step": 209022, "epoch": 4976} {"train_loss": -7.341858863830566, "global_step": 209023, "epoch": 4976} {"train_loss": -7.1663007736206055, "global_step": 209024, "epoch": 4976} {"train_loss": -7.336404800415039, "global_step": 209025, "epoch": 4976} {"train_loss": -7.306425094604492, "global_step": 209026, "epoch": 4976} {"train_loss": -7.227933883666992, "global_step": 209027, "epoch": 4976} {"train_loss": -7.251731872558594, "global_step": 209028, "epoch": 4976} {"train_loss": -7.345531463623047, "global_step": 209029, "epoch": 4976} {"train_loss": -7.288969039916992, "global_step": 209030, "epoch": 4976} {"train_loss": -7.413474082946777, "global_step": 209031, "epoch": 4976} {"train_loss": -7.3009819984436035, "global_step": 209032, "epoch": 4976} {"train_loss": -7.335712126323155, "global_step": 209033, "epoch": 4976, "val_loss": 70071.0859375} {"train_loss": -7.363232612609863, "global_step": 209034, "epoch": 4977} {"train_loss": -7.462616443634033, "global_step": 209035, "epoch": 4977} {"train_loss": -7.336357593536377, "global_step": 209036, "epoch": 4977} {"train_loss": -7.333241939544678, "global_step": 209037, "epoch": 4977} {"train_loss": -7.28653621673584, "global_step": 209038, "epoch": 4977} {"train_loss": -7.322161674499512, "global_step": 209039, "epoch": 4977} {"train_loss": -7.347835540771484, "global_step": 209040, "epoch": 4977} {"train_loss": -7.290473937988281, "global_step": 209041, "epoch": 4977} {"train_loss": -7.4359588623046875, "global_step": 209042, "epoch": 4977} {"train_loss": -7.265332221984863, "global_step": 209043, "epoch": 4977} {"train_loss": -7.44573974609375, "global_step": 209044, "epoch": 4977} {"train_loss": -7.364176273345947, "global_step": 209045, "epoch": 4977} {"train_loss": -7.438966274261475, "global_step": 209046, "epoch": 4977} {"train_loss": -7.352524757385254, "global_step": 209047, "epoch": 4977} {"train_loss": -7.3874711990356445, "global_step": 209048, "epoch": 4977} {"train_loss": -7.359224796295166, "global_step": 209049, "epoch": 4977} {"train_loss": -7.4639506340026855, "global_step": 209050, "epoch": 4977} {"train_loss": -7.32271671295166, "global_step": 209051, "epoch": 4977} {"train_loss": -7.3851470947265625, "global_step": 209052, "epoch": 4977} {"train_loss": -7.468796730041504, "global_step": 209053, "epoch": 4977} {"train_loss": -7.458734512329102, "global_step": 209054, "epoch": 4977} {"train_loss": -7.461493015289307, "global_step": 209055, "epoch": 4977} {"train_loss": -7.424120903015137, "global_step": 209056, "epoch": 4977} {"train_loss": -7.367929935455322, "global_step": 209057, "epoch": 4977} {"train_loss": -7.448330402374268, "global_step": 209058, "epoch": 4977} {"train_loss": -7.321075439453125, "global_step": 209059, "epoch": 4977} {"train_loss": -7.389069557189941, "global_step": 209060, "epoch": 4977} {"train_loss": -7.384919166564941, "global_step": 209061, "epoch": 4977} {"train_loss": -7.295426368713379, "global_step": 209062, "epoch": 4977} {"train_loss": -7.390215873718262, "global_step": 209063, "epoch": 4977} {"train_loss": -7.389317035675049, "global_step": 209064, "epoch": 4977} {"train_loss": -7.395900726318359, "global_step": 209065, "epoch": 4977} {"train_loss": -7.391971588134766, "global_step": 209066, "epoch": 4977} {"train_loss": -7.36712121963501, "global_step": 209067, "epoch": 4977} {"train_loss": -7.422573089599609, "global_step": 209068, "epoch": 4977} {"train_loss": -7.425860404968262, "global_step": 209069, "epoch": 4977} {"train_loss": -7.378970146179199, "global_step": 209070, "epoch": 4977} {"train_loss": -7.349486351013184, "global_step": 209071, "epoch": 4977} {"train_loss": -7.487263202667236, "global_step": 209072, "epoch": 4977} {"train_loss": -7.303369522094727, "global_step": 209073, "epoch": 4977} {"train_loss": -7.36007833480835, "global_step": 209074, "epoch": 4977} {"train_loss": -7.38226150331043, "global_step": 209075, "epoch": 4977, "val_loss": 70050.015625} {"train_loss": -7.509834289550781, "global_step": 209076, "epoch": 4978} {"train_loss": -7.334369659423828, "global_step": 209077, "epoch": 4978} {"train_loss": -7.346955299377441, "global_step": 209078, "epoch": 4978} {"train_loss": -7.363665580749512, "global_step": 209079, "epoch": 4978} {"train_loss": -7.284804344177246, "global_step": 209080, "epoch": 4978} {"train_loss": -7.326165199279785, "global_step": 209081, "epoch": 4978} {"train_loss": -7.298761367797852, "global_step": 209082, "epoch": 4978} {"train_loss": -7.237427711486816, "global_step": 209083, "epoch": 4978} {"train_loss": -7.159064292907715, "global_step": 209084, "epoch": 4978} {"train_loss": -7.248929023742676, "global_step": 209085, "epoch": 4978} {"train_loss": -7.155804634094238, "global_step": 209086, "epoch": 4978} {"train_loss": -7.175526142120361, "global_step": 209087, "epoch": 4978} {"train_loss": -7.180417060852051, "global_step": 209088, "epoch": 4978} {"train_loss": -7.2269978523254395, "global_step": 209089, "epoch": 4978} {"train_loss": -7.278993606567383, "global_step": 209090, "epoch": 4978} {"train_loss": -7.262589931488037, "global_step": 209091, "epoch": 4978} {"train_loss": -7.263145923614502, "global_step": 209092, "epoch": 4978} {"train_loss": -7.132866382598877, "global_step": 209093, "epoch": 4978} {"train_loss": -7.326826572418213, "global_step": 209094, "epoch": 4978} {"train_loss": -7.150075912475586, "global_step": 209095, "epoch": 4978} {"train_loss": -7.254393100738525, "global_step": 209096, "epoch": 4978} {"train_loss": -7.255441665649414, "global_step": 209097, "epoch": 4978} {"train_loss": -7.303367614746094, "global_step": 209098, "epoch": 4978} {"train_loss": -7.298454284667969, "global_step": 209099, "epoch": 4978} {"train_loss": -7.242789268493652, "global_step": 209100, "epoch": 4978} {"train_loss": -7.2173027992248535, "global_step": 209101, "epoch": 4978} {"train_loss": -7.335563659667969, "global_step": 209102, "epoch": 4978} {"train_loss": -7.2891459465026855, "global_step": 209103, "epoch": 4978} {"train_loss": -7.32337760925293, "global_step": 209104, "epoch": 4978} {"train_loss": -7.441346645355225, "global_step": 209105, "epoch": 4978} {"train_loss": -7.299056529998779, "global_step": 209106, "epoch": 4978} {"train_loss": -7.251289367675781, "global_step": 209107, "epoch": 4978} {"train_loss": -7.397829055786133, "global_step": 209108, "epoch": 4978} {"train_loss": -7.36740779876709, "global_step": 209109, "epoch": 4978} {"train_loss": -7.375058174133301, "global_step": 209110, "epoch": 4978} {"train_loss": -7.393217086791992, "global_step": 209111, "epoch": 4978} {"train_loss": -7.35878849029541, "global_step": 209112, "epoch": 4978} {"train_loss": -7.291388511657715, "global_step": 209113, "epoch": 4978} {"train_loss": -7.361176490783691, "global_step": 209114, "epoch": 4978} {"train_loss": -7.431832313537598, "global_step": 209115, "epoch": 4978} {"train_loss": -7.298531532287598, "global_step": 209116, "epoch": 4978} {"train_loss": -7.295607226235526, "global_step": 209117, "epoch": 4978, "val_loss": 69942.9453125} {"train_loss": -7.445645809173584, "global_step": 209118, "epoch": 4979} {"train_loss": -7.278368949890137, "global_step": 209119, "epoch": 4979} {"train_loss": -7.359316825866699, "global_step": 209120, "epoch": 4979} {"train_loss": -7.338361740112305, "global_step": 209121, "epoch": 4979} {"train_loss": -7.336755752563477, "global_step": 209122, "epoch": 4979} {"train_loss": -7.435718059539795, "global_step": 209123, "epoch": 4979} {"train_loss": -7.344278335571289, "global_step": 209124, "epoch": 4979} {"train_loss": -7.362360954284668, "global_step": 209125, "epoch": 4979} {"train_loss": -7.310779094696045, "global_step": 209126, "epoch": 4979} {"train_loss": -7.370424747467041, "global_step": 209127, "epoch": 4979} {"train_loss": -7.426761150360107, "global_step": 209128, "epoch": 4979} {"train_loss": -7.373402118682861, "global_step": 209129, "epoch": 4979} {"train_loss": -7.301453590393066, "global_step": 209130, "epoch": 4979} {"train_loss": -7.353351593017578, "global_step": 209131, "epoch": 4979} {"train_loss": -7.361339569091797, "global_step": 209132, "epoch": 4979} {"train_loss": -7.269650459289551, "global_step": 209133, "epoch": 4979} {"train_loss": -7.306070804595947, "global_step": 209134, "epoch": 4979} {"train_loss": -7.333653926849365, "global_step": 209135, "epoch": 4979} {"train_loss": -7.398853302001953, "global_step": 209136, "epoch": 4979} {"train_loss": -7.279469966888428, "global_step": 209137, "epoch": 4979} {"train_loss": -7.303826332092285, "global_step": 209138, "epoch": 4979} {"train_loss": -7.365880966186523, "global_step": 209139, "epoch": 4979} {"train_loss": -7.280701160430908, "global_step": 209140, "epoch": 4979} {"train_loss": -7.30560827255249, "global_step": 209141, "epoch": 4979} {"train_loss": -7.284671306610107, "global_step": 209142, "epoch": 4979} {"train_loss": -7.28287410736084, "global_step": 209143, "epoch": 4979} {"train_loss": -7.3159074783325195, "global_step": 209144, "epoch": 4979} {"train_loss": -7.423363208770752, "global_step": 209145, "epoch": 4979} {"train_loss": -7.369109630584717, "global_step": 209146, "epoch": 4979} {"train_loss": -7.379661560058594, "global_step": 209147, "epoch": 4979} {"train_loss": -7.331496715545654, "global_step": 209148, "epoch": 4979} {"train_loss": -7.342264652252197, "global_step": 209149, "epoch": 4979} {"train_loss": -7.44366979598999, "global_step": 209150, "epoch": 4979} {"train_loss": -7.285984039306641, "global_step": 209151, "epoch": 4979} {"train_loss": -7.3131818771362305, "global_step": 209152, "epoch": 4979} {"train_loss": -7.41677188873291, "global_step": 209153, "epoch": 4979} {"train_loss": -7.411810874938965, "global_step": 209154, "epoch": 4979} {"train_loss": -7.43502140045166, "global_step": 209155, "epoch": 4979} {"train_loss": -7.392899036407471, "global_step": 209156, "epoch": 4979} {"train_loss": -7.405221939086914, "global_step": 209157, "epoch": 4979} {"train_loss": -7.3852996826171875, "global_step": 209158, "epoch": 4979} {"train_loss": -7.354892299288795, "global_step": 209159, "epoch": 4979, "val_loss": 69996.5625} {"train_loss": -7.590523719787598, "global_step": 209160, "epoch": 4980} {"train_loss": -7.307106018066406, "global_step": 209161, "epoch": 4980} {"train_loss": -7.361908912658691, "global_step": 209162, "epoch": 4980} {"train_loss": -7.497467041015625, "global_step": 209163, "epoch": 4980} {"train_loss": -7.433452606201172, "global_step": 209164, "epoch": 4980} {"train_loss": -7.209084510803223, "global_step": 209165, "epoch": 4980} {"train_loss": -7.38464879989624, "global_step": 209166, "epoch": 4980} {"train_loss": -7.278853416442871, "global_step": 209167, "epoch": 4980} {"train_loss": -7.300451278686523, "global_step": 209168, "epoch": 4980} {"train_loss": -7.487593173980713, "global_step": 209169, "epoch": 4980} {"train_loss": -7.316887855529785, "global_step": 209170, "epoch": 4980} {"train_loss": -7.3425421714782715, "global_step": 209171, "epoch": 4980} {"train_loss": -7.507543087005615, "global_step": 209172, "epoch": 4980} {"train_loss": -7.424280166625977, "global_step": 209173, "epoch": 4980} {"train_loss": -7.40549898147583, "global_step": 209174, "epoch": 4980} {"train_loss": -7.375565528869629, "global_step": 209175, "epoch": 4980} {"train_loss": -7.4397077560424805, "global_step": 209176, "epoch": 4980} {"train_loss": -7.403472900390625, "global_step": 209177, "epoch": 4980} {"train_loss": -7.40494441986084, "global_step": 209178, "epoch": 4980} {"train_loss": -7.312172889709473, "global_step": 209179, "epoch": 4980} {"train_loss": -7.339390754699707, "global_step": 209180, "epoch": 4980} {"train_loss": -7.433930397033691, "global_step": 209181, "epoch": 4980} {"train_loss": -7.4131622314453125, "global_step": 209182, "epoch": 4980} {"train_loss": -7.407678604125977, "global_step": 209183, "epoch": 4980} {"train_loss": -7.369697570800781, "global_step": 209184, "epoch": 4980} {"train_loss": -7.3401079177856445, "global_step": 209185, "epoch": 4980} {"train_loss": -7.412734031677246, "global_step": 209186, "epoch": 4980} {"train_loss": -7.423066139221191, "global_step": 209187, "epoch": 4980} {"train_loss": -7.35856819152832, "global_step": 209188, "epoch": 4980} {"train_loss": -7.469010353088379, "global_step": 209189, "epoch": 4980} {"train_loss": -7.402056694030762, "global_step": 209190, "epoch": 4980} {"train_loss": -7.364310264587402, "global_step": 209191, "epoch": 4980} {"train_loss": -7.442376613616943, "global_step": 209192, "epoch": 4980} {"train_loss": -7.376826286315918, "global_step": 209193, "epoch": 4980} {"train_loss": -7.4616570472717285, "global_step": 209194, "epoch": 4980} {"train_loss": -7.290327072143555, "global_step": 209195, "epoch": 4980} {"train_loss": -7.345161437988281, "global_step": 209196, "epoch": 4980} {"train_loss": -7.456136703491211, "global_step": 209197, "epoch": 4980} {"train_loss": -7.382999420166016, "global_step": 209198, "epoch": 4980} {"train_loss": -7.418705463409424, "global_step": 209199, "epoch": 4980} {"train_loss": -7.468983173370361, "global_step": 209200, "epoch": 4980} {"train_loss": -7.39583819253104, "global_step": 209201, "epoch": 4980, "val_loss": 70013.4375} {"train_loss": -7.35405969619751, "global_step": 209202, "epoch": 4981} {"train_loss": -7.44688606262207, "global_step": 209203, "epoch": 4981} {"train_loss": -7.383120059967041, "global_step": 209204, "epoch": 4981} {"train_loss": -7.429617404937744, "global_step": 209205, "epoch": 4981} {"train_loss": -7.297090530395508, "global_step": 209206, "epoch": 4981} {"train_loss": -7.316183090209961, "global_step": 209207, "epoch": 4981} {"train_loss": -7.226406097412109, "global_step": 209208, "epoch": 4981} {"train_loss": -7.389181613922119, "global_step": 209209, "epoch": 4981} {"train_loss": -7.388127326965332, "global_step": 209210, "epoch": 4981} {"train_loss": -7.216549873352051, "global_step": 209211, "epoch": 4981} {"train_loss": -7.332077980041504, "global_step": 209212, "epoch": 4981} {"train_loss": -7.320310592651367, "global_step": 209213, "epoch": 4981} {"train_loss": -7.252144813537598, "global_step": 209214, "epoch": 4981} {"train_loss": -7.284772872924805, "global_step": 209215, "epoch": 4981} {"train_loss": -7.384734153747559, "global_step": 209216, "epoch": 4981} {"train_loss": -7.22804069519043, "global_step": 209217, "epoch": 4981} {"train_loss": -7.257859706878662, "global_step": 209218, "epoch": 4981} {"train_loss": -7.299703598022461, "global_step": 209219, "epoch": 4981} {"train_loss": -7.2655348777771, "global_step": 209220, "epoch": 4981} {"train_loss": -7.401579856872559, "global_step": 209221, "epoch": 4981} {"train_loss": -7.163843154907227, "global_step": 209222, "epoch": 4981} {"train_loss": -7.428074836730957, "global_step": 209223, "epoch": 4981} {"train_loss": -7.340235710144043, "global_step": 209224, "epoch": 4981} {"train_loss": -7.352349281311035, "global_step": 209225, "epoch": 4981} {"train_loss": -7.210175514221191, "global_step": 209226, "epoch": 4981} {"train_loss": -7.253310680389404, "global_step": 209227, "epoch": 4981} {"train_loss": -7.2396087646484375, "global_step": 209228, "epoch": 4981} {"train_loss": -7.472839832305908, "global_step": 209229, "epoch": 4981} {"train_loss": -7.319846153259277, "global_step": 209230, "epoch": 4981} {"train_loss": -7.308802127838135, "global_step": 209231, "epoch": 4981} {"train_loss": -7.354645729064941, "global_step": 209232, "epoch": 4981} {"train_loss": -7.330909729003906, "global_step": 209233, "epoch": 4981} {"train_loss": -7.390181064605713, "global_step": 209234, "epoch": 4981} {"train_loss": -7.30195426940918, "global_step": 209235, "epoch": 4981} {"train_loss": -7.415793418884277, "global_step": 209236, "epoch": 4981} {"train_loss": -7.246294021606445, "global_step": 209237, "epoch": 4981} {"train_loss": -7.319607257843018, "global_step": 209238, "epoch": 4981} {"train_loss": -7.363156795501709, "global_step": 209239, "epoch": 4981} {"train_loss": -7.3031415939331055, "global_step": 209240, "epoch": 4981} {"train_loss": -7.311931610107422, "global_step": 209241, "epoch": 4981} {"train_loss": -7.204586029052734, "global_step": 209242, "epoch": 4981} {"train_loss": -7.319402024859474, "global_step": 209243, "epoch": 4981, "val_loss": 70250.8359375} {"train_loss": -7.239912033081055, "global_step": 209244, "epoch": 4982} {"train_loss": -7.253382682800293, "global_step": 209245, "epoch": 4982} {"train_loss": -7.237886905670166, "global_step": 209246, "epoch": 4982} {"train_loss": -7.257540702819824, "global_step": 209247, "epoch": 4982} {"train_loss": -7.420386791229248, "global_step": 209248, "epoch": 4982} {"train_loss": -7.1932902336120605, "global_step": 209249, "epoch": 4982} {"train_loss": -7.208552360534668, "global_step": 209250, "epoch": 4982} {"train_loss": -7.362415313720703, "global_step": 209251, "epoch": 4982} {"train_loss": -7.329531669616699, "global_step": 209252, "epoch": 4982} {"train_loss": -7.350037097930908, "global_step": 209253, "epoch": 4982} {"train_loss": -7.372035980224609, "global_step": 209254, "epoch": 4982} {"train_loss": -7.338092803955078, "global_step": 209255, "epoch": 4982} {"train_loss": -7.304500579833984, "global_step": 209256, "epoch": 4982} {"train_loss": -7.298719882965088, "global_step": 209257, "epoch": 4982} {"train_loss": -7.181528568267822, "global_step": 209258, "epoch": 4982} {"train_loss": -7.316862106323242, "global_step": 209259, "epoch": 4982} {"train_loss": -7.291536331176758, "global_step": 209260, "epoch": 4982} {"train_loss": -7.328661918640137, "global_step": 209261, "epoch": 4982} {"train_loss": -7.251229763031006, "global_step": 209262, "epoch": 4982} {"train_loss": -7.210631847381592, "global_step": 209263, "epoch": 4982} {"train_loss": -7.3466033935546875, "global_step": 209264, "epoch": 4982} {"train_loss": -7.3830952644348145, "global_step": 209265, "epoch": 4982} {"train_loss": -7.372337341308594, "global_step": 209266, "epoch": 4982} {"train_loss": -7.417507648468018, "global_step": 209267, "epoch": 4982} {"train_loss": -7.334465980529785, "global_step": 209268, "epoch": 4982} {"train_loss": -7.390378952026367, "global_step": 209269, "epoch": 4982} {"train_loss": -7.302883148193359, "global_step": 209270, "epoch": 4982} {"train_loss": -7.355895042419434, "global_step": 209271, "epoch": 4982} {"train_loss": -7.264157772064209, "global_step": 209272, "epoch": 4982} {"train_loss": -7.371302604675293, "global_step": 209273, "epoch": 4982} {"train_loss": -7.337601661682129, "global_step": 209274, "epoch": 4982} {"train_loss": -7.303086757659912, "global_step": 209275, "epoch": 4982} {"train_loss": -7.346805572509766, "global_step": 209276, "epoch": 4982} {"train_loss": -7.403541088104248, "global_step": 209277, "epoch": 4982} {"train_loss": -7.073614597320557, "global_step": 209278, "epoch": 4982} {"train_loss": -7.326476573944092, "global_step": 209279, "epoch": 4982} {"train_loss": -7.458377838134766, "global_step": 209280, "epoch": 4982} {"train_loss": -7.174195289611816, "global_step": 209281, "epoch": 4982} {"train_loss": -7.210379600524902, "global_step": 209282, "epoch": 4982} {"train_loss": -7.379636764526367, "global_step": 209283, "epoch": 4982} {"train_loss": -7.323857307434082, "global_step": 209284, "epoch": 4982} {"train_loss": -7.309216578801473, "global_step": 209285, "epoch": 4982, "val_loss": 70214.7109375} {"train_loss": -7.348668098449707, "global_step": 209286, "epoch": 4983} {"train_loss": -7.40886926651001, "global_step": 209287, "epoch": 4983} {"train_loss": -7.315622329711914, "global_step": 209288, "epoch": 4983} {"train_loss": -7.309170722961426, "global_step": 209289, "epoch": 4983} {"train_loss": -7.3487138748168945, "global_step": 209290, "epoch": 4983} {"train_loss": -7.433568000793457, "global_step": 209291, "epoch": 4983} {"train_loss": -7.323512554168701, "global_step": 209292, "epoch": 4983} {"train_loss": -7.34910774230957, "global_step": 209293, "epoch": 4983} {"train_loss": -7.398265361785889, "global_step": 209294, "epoch": 4983} {"train_loss": -7.368292808532715, "global_step": 209295, "epoch": 4983} {"train_loss": -7.340385437011719, "global_step": 209296, "epoch": 4983} {"train_loss": -7.365032196044922, "global_step": 209297, "epoch": 4983} {"train_loss": -7.391984939575195, "global_step": 209298, "epoch": 4983} {"train_loss": -7.316664218902588, "global_step": 209299, "epoch": 4983} {"train_loss": -7.429438591003418, "global_step": 209300, "epoch": 4983} {"train_loss": -7.417957305908203, "global_step": 209301, "epoch": 4983} {"train_loss": -7.2788896560668945, "global_step": 209302, "epoch": 4983} {"train_loss": -7.398061752319336, "global_step": 209303, "epoch": 4983} {"train_loss": -7.32392692565918, "global_step": 209304, "epoch": 4983} {"train_loss": -7.360029220581055, "global_step": 209305, "epoch": 4983} {"train_loss": -7.408411979675293, "global_step": 209306, "epoch": 4983} {"train_loss": -7.292871475219727, "global_step": 209307, "epoch": 4983} {"train_loss": -7.230640411376953, "global_step": 209308, "epoch": 4983} {"train_loss": -7.321257591247559, "global_step": 209309, "epoch": 4983} {"train_loss": -7.352602005004883, "global_step": 209310, "epoch": 4983} {"train_loss": -7.23609733581543, "global_step": 209311, "epoch": 4983} {"train_loss": -7.4007568359375, "global_step": 209312, "epoch": 4983} {"train_loss": -7.355152130126953, "global_step": 209313, "epoch": 4983} {"train_loss": -7.367012023925781, "global_step": 209314, "epoch": 4983} {"train_loss": -7.287698268890381, "global_step": 209315, "epoch": 4983} {"train_loss": -7.259392738342285, "global_step": 209316, "epoch": 4983} {"train_loss": -7.256156921386719, "global_step": 209317, "epoch": 4983} {"train_loss": -7.299264907836914, "global_step": 209318, "epoch": 4983} {"train_loss": -7.299149990081787, "global_step": 209319, "epoch": 4983} {"train_loss": -7.280731201171875, "global_step": 209320, "epoch": 4983} {"train_loss": -7.275118827819824, "global_step": 209321, "epoch": 4983} {"train_loss": -7.235454559326172, "global_step": 209322, "epoch": 4983} {"train_loss": -7.172205924987793, "global_step": 209323, "epoch": 4983} {"train_loss": -7.133106231689453, "global_step": 209324, "epoch": 4983} {"train_loss": -7.344517707824707, "global_step": 209325, "epoch": 4983} {"train_loss": -7.264007091522217, "global_step": 209326, "epoch": 4983} {"train_loss": -7.320536829176403, "global_step": 209327, "epoch": 4983, "val_loss": 70260.71875} {"train_loss": -7.248550891876221, "global_step": 209328, "epoch": 4984} {"train_loss": -7.2780561447143555, "global_step": 209329, "epoch": 4984} {"train_loss": -7.1208696365356445, "global_step": 209330, "epoch": 4984} {"train_loss": -7.378628730773926, "global_step": 209331, "epoch": 4984} {"train_loss": -7.200714111328125, "global_step": 209332, "epoch": 4984} {"train_loss": -7.169701099395752, "global_step": 209333, "epoch": 4984} {"train_loss": -7.277928352355957, "global_step": 209334, "epoch": 4984} {"train_loss": -7.162029266357422, "global_step": 209335, "epoch": 4984} {"train_loss": -7.275768280029297, "global_step": 209336, "epoch": 4984} {"train_loss": -7.132758617401123, "global_step": 209337, "epoch": 4984} {"train_loss": -7.142806053161621, "global_step": 209338, "epoch": 4984} {"train_loss": -7.3723063468933105, "global_step": 209339, "epoch": 4984} {"train_loss": -7.198412895202637, "global_step": 209340, "epoch": 4984} {"train_loss": -7.370156764984131, "global_step": 209341, "epoch": 4984} {"train_loss": -7.238961219787598, "global_step": 209342, "epoch": 4984} {"train_loss": -7.261483192443848, "global_step": 209343, "epoch": 4984} {"train_loss": -7.259108066558838, "global_step": 209344, "epoch": 4984} {"train_loss": -7.365790367126465, "global_step": 209345, "epoch": 4984} {"train_loss": -7.267662048339844, "global_step": 209346, "epoch": 4984} {"train_loss": -7.1428751945495605, "global_step": 209347, "epoch": 4984} {"train_loss": -7.439152717590332, "global_step": 209348, "epoch": 4984} {"train_loss": -7.17207145690918, "global_step": 209349, "epoch": 4984} {"train_loss": -7.417187690734863, "global_step": 209350, "epoch": 4984} {"train_loss": -7.2953901290893555, "global_step": 209351, "epoch": 4984} {"train_loss": -7.293861389160156, "global_step": 209352, "epoch": 4984} {"train_loss": -7.277654647827148, "global_step": 209353, "epoch": 4984} {"train_loss": -7.432343482971191, "global_step": 209354, "epoch": 4984} {"train_loss": -7.459888458251953, "global_step": 209355, "epoch": 4984} {"train_loss": -7.334955215454102, "global_step": 209356, "epoch": 4984} {"train_loss": -7.326489448547363, "global_step": 209357, "epoch": 4984} {"train_loss": -7.3326849937438965, "global_step": 209358, "epoch": 4984} {"train_loss": -7.314356803894043, "global_step": 209359, "epoch": 4984} {"train_loss": -7.403733253479004, "global_step": 209360, "epoch": 4984} {"train_loss": -7.47486686706543, "global_step": 209361, "epoch": 4984} {"train_loss": -7.305469512939453, "global_step": 209362, "epoch": 4984} {"train_loss": -7.413621425628662, "global_step": 209363, "epoch": 4984} {"train_loss": -7.271756649017334, "global_step": 209364, "epoch": 4984} {"train_loss": -7.354822158813477, "global_step": 209365, "epoch": 4984} {"train_loss": -7.339801788330078, "global_step": 209366, "epoch": 4984} {"train_loss": -7.422811508178711, "global_step": 209367, "epoch": 4984} {"train_loss": -7.519440174102783, "global_step": 209368, "epoch": 4984} {"train_loss": -7.305823780241466, "global_step": 209369, "epoch": 4984, "val_loss": 70077.9453125} {"train_loss": -7.397467613220215, "global_step": 209370, "epoch": 4985} {"train_loss": -7.484676361083984, "global_step": 209371, "epoch": 4985} {"train_loss": -7.370091438293457, "global_step": 209372, "epoch": 4985} {"train_loss": -7.459814071655273, "global_step": 209373, "epoch": 4985} {"train_loss": -7.375027656555176, "global_step": 209374, "epoch": 4985} {"train_loss": -7.382501125335693, "global_step": 209375, "epoch": 4985} {"train_loss": -7.256872177124023, "global_step": 209376, "epoch": 4985} {"train_loss": -7.278947353363037, "global_step": 209377, "epoch": 4985} {"train_loss": -7.139589786529541, "global_step": 209378, "epoch": 4985} {"train_loss": -7.345686435699463, "global_step": 209379, "epoch": 4985} {"train_loss": -7.321270942687988, "global_step": 209380, "epoch": 4985} {"train_loss": -7.301239013671875, "global_step": 209381, "epoch": 4985} {"train_loss": -7.358310699462891, "global_step": 209382, "epoch": 4985} {"train_loss": -7.360699653625488, "global_step": 209383, "epoch": 4985} {"train_loss": -7.450723648071289, "global_step": 209384, "epoch": 4985} {"train_loss": -7.422702789306641, "global_step": 209385, "epoch": 4985} {"train_loss": -7.346395492553711, "global_step": 209386, "epoch": 4985} {"train_loss": -7.454005241394043, "global_step": 209387, "epoch": 4985} {"train_loss": -7.257394313812256, "global_step": 209388, "epoch": 4985} {"train_loss": -7.34550666809082, "global_step": 209389, "epoch": 4985} {"train_loss": -7.33452033996582, "global_step": 209390, "epoch": 4985} {"train_loss": -7.3333940505981445, "global_step": 209391, "epoch": 4985} {"train_loss": -7.368367671966553, "global_step": 209392, "epoch": 4985} {"train_loss": -7.299765586853027, "global_step": 209393, "epoch": 4985} {"train_loss": -7.342601776123047, "global_step": 209394, "epoch": 4985} {"train_loss": -7.3634748458862305, "global_step": 209395, "epoch": 4985} {"train_loss": -7.359434127807617, "global_step": 209396, "epoch": 4985} {"train_loss": -7.332388877868652, "global_step": 209397, "epoch": 4985} {"train_loss": -7.291686534881592, "global_step": 209398, "epoch": 4985} {"train_loss": -7.342554092407227, "global_step": 209399, "epoch": 4985} {"train_loss": -7.350362777709961, "global_step": 209400, "epoch": 4985} {"train_loss": -7.325579643249512, "global_step": 209401, "epoch": 4985} {"train_loss": -7.17497444152832, "global_step": 209402, "epoch": 4985} {"train_loss": -7.209970474243164, "global_step": 209403, "epoch": 4985} {"train_loss": -7.151535987854004, "global_step": 209404, "epoch": 4985} {"train_loss": -7.356943130493164, "global_step": 209405, "epoch": 4985} {"train_loss": -7.221792221069336, "global_step": 209406, "epoch": 4985} {"train_loss": -7.245920181274414, "global_step": 209407, "epoch": 4985} {"train_loss": -7.281168460845947, "global_step": 209408, "epoch": 4985} {"train_loss": -7.256078720092773, "global_step": 209409, "epoch": 4985} {"train_loss": -7.281244277954102, "global_step": 209410, "epoch": 4985} {"train_loss": -7.3224235489254905, "global_step": 209411, "epoch": 4985, "val_loss": 70079.171875} {"train_loss": -7.163607597351074, "global_step": 209412, "epoch": 4986} {"train_loss": -7.325905799865723, "global_step": 209413, "epoch": 4986} {"train_loss": -7.029500961303711, "global_step": 209414, "epoch": 4986} {"train_loss": -7.30355978012085, "global_step": 209415, "epoch": 4986} {"train_loss": -7.072141647338867, "global_step": 209416, "epoch": 4986} {"train_loss": -7.289002895355225, "global_step": 209417, "epoch": 4986} {"train_loss": -7.186539649963379, "global_step": 209418, "epoch": 4986} {"train_loss": -7.324830055236816, "global_step": 209419, "epoch": 4986} {"train_loss": -7.432011604309082, "global_step": 209420, "epoch": 4986} {"train_loss": -7.26669979095459, "global_step": 209421, "epoch": 4986} {"train_loss": -7.333762168884277, "global_step": 209422, "epoch": 4986} {"train_loss": -7.263840675354004, "global_step": 209423, "epoch": 4986} {"train_loss": -7.230152606964111, "global_step": 209424, "epoch": 4986} {"train_loss": -7.338644504547119, "global_step": 209425, "epoch": 4986} {"train_loss": -7.394757270812988, "global_step": 209426, "epoch": 4986} {"train_loss": -7.348971366882324, "global_step": 209427, "epoch": 4986} {"train_loss": -7.338287353515625, "global_step": 209428, "epoch": 4986} {"train_loss": -7.25745153427124, "global_step": 209429, "epoch": 4986} {"train_loss": -7.272439002990723, "global_step": 209430, "epoch": 4986} {"train_loss": -7.334869384765625, "global_step": 209431, "epoch": 4986} {"train_loss": -7.262896537780762, "global_step": 209432, "epoch": 4986} {"train_loss": -7.367419242858887, "global_step": 209433, "epoch": 4986} {"train_loss": -7.307102203369141, "global_step": 209434, "epoch": 4986} {"train_loss": -7.358788013458252, "global_step": 209435, "epoch": 4986} {"train_loss": -7.3101606369018555, "global_step": 209436, "epoch": 4986} {"train_loss": -7.295759677886963, "global_step": 209437, "epoch": 4986} {"train_loss": -7.261516571044922, "global_step": 209438, "epoch": 4986} {"train_loss": -7.331666946411133, "global_step": 209439, "epoch": 4986} {"train_loss": -7.378373622894287, "global_step": 209440, "epoch": 4986} {"train_loss": -7.390716075897217, "global_step": 209441, "epoch": 4986} {"train_loss": -7.363649368286133, "global_step": 209442, "epoch": 4986} {"train_loss": -7.4064483642578125, "global_step": 209443, "epoch": 4986} {"train_loss": -7.28300142288208, "global_step": 209444, "epoch": 4986} {"train_loss": -7.350647926330566, "global_step": 209445, "epoch": 4986} {"train_loss": -7.394899368286133, "global_step": 209446, "epoch": 4986} {"train_loss": -7.360300064086914, "global_step": 209447, "epoch": 4986} {"train_loss": -7.330167770385742, "global_step": 209448, "epoch": 4986} {"train_loss": -7.391434669494629, "global_step": 209449, "epoch": 4986} {"train_loss": -7.365102767944336, "global_step": 209450, "epoch": 4986} {"train_loss": -7.344286918640137, "global_step": 209451, "epoch": 4986} {"train_loss": -7.420320510864258, "global_step": 209452, "epoch": 4986} {"train_loss": -7.313233420962379, "global_step": 209453, "epoch": 4986, "val_loss": 70195.4921875} {"train_loss": -7.288380146026611, "global_step": 209454, "epoch": 4987} {"train_loss": -7.3970537185668945, "global_step": 209455, "epoch": 4987} {"train_loss": -7.424068927764893, "global_step": 209456, "epoch": 4987} {"train_loss": -7.35563850402832, "global_step": 209457, "epoch": 4987} {"train_loss": -7.377645492553711, "global_step": 209458, "epoch": 4987} {"train_loss": -7.2301554679870605, "global_step": 209459, "epoch": 4987} {"train_loss": -7.297624588012695, "global_step": 209460, "epoch": 4987} {"train_loss": -7.240812301635742, "global_step": 209461, "epoch": 4987} {"train_loss": -7.245322227478027, "global_step": 209462, "epoch": 4987} {"train_loss": -7.282520294189453, "global_step": 209463, "epoch": 4987} {"train_loss": -7.3295111656188965, "global_step": 209464, "epoch": 4987} {"train_loss": -7.361215114593506, "global_step": 209465, "epoch": 4987} {"train_loss": -7.305147647857666, "global_step": 209466, "epoch": 4987} {"train_loss": -7.242356777191162, "global_step": 209467, "epoch": 4987} {"train_loss": -7.312399864196777, "global_step": 209468, "epoch": 4987} {"train_loss": -7.363823890686035, "global_step": 209469, "epoch": 4987} {"train_loss": -7.317739486694336, "global_step": 209470, "epoch": 4987} {"train_loss": -7.343340873718262, "global_step": 209471, "epoch": 4987} {"train_loss": -7.374159336090088, "global_step": 209472, "epoch": 4987} {"train_loss": -7.359235763549805, "global_step": 209473, "epoch": 4987} {"train_loss": -7.484251499176025, "global_step": 209474, "epoch": 4987} {"train_loss": -7.3979082107543945, "global_step": 209475, "epoch": 4987} {"train_loss": -7.414547920227051, "global_step": 209476, "epoch": 4987} {"train_loss": -7.48153018951416, "global_step": 209477, "epoch": 4987} {"train_loss": -7.439845561981201, "global_step": 209478, "epoch": 4987} {"train_loss": -7.312891960144043, "global_step": 209479, "epoch": 4987} {"train_loss": -7.414387226104736, "global_step": 209480, "epoch": 4987} {"train_loss": -7.418351173400879, "global_step": 209481, "epoch": 4987} {"train_loss": -7.490349769592285, "global_step": 209482, "epoch": 4987} {"train_loss": -7.30220890045166, "global_step": 209483, "epoch": 4987} {"train_loss": -7.338863372802734, "global_step": 209484, "epoch": 4987} {"train_loss": -7.218857765197754, "global_step": 209485, "epoch": 4987} {"train_loss": -7.3606390953063965, "global_step": 209486, "epoch": 4987} {"train_loss": -7.329644203186035, "global_step": 209487, "epoch": 4987} {"train_loss": -7.371428489685059, "global_step": 209488, "epoch": 4987} {"train_loss": -7.221380710601807, "global_step": 209489, "epoch": 4987} {"train_loss": -7.281349182128906, "global_step": 209490, "epoch": 4987} {"train_loss": -7.267209053039551, "global_step": 209491, "epoch": 4987} {"train_loss": -7.310765266418457, "global_step": 209492, "epoch": 4987} {"train_loss": -7.295510768890381, "global_step": 209493, "epoch": 4987} {"train_loss": -7.238076686859131, "global_step": 209494, "epoch": 4987} {"train_loss": -7.336442084539504, "global_step": 209495, "epoch": 4987, "val_loss": 70135.8125} {"train_loss": -7.240755081176758, "global_step": 209496, "epoch": 4988} {"train_loss": -7.324970722198486, "global_step": 209497, "epoch": 4988} {"train_loss": -7.4133100509643555, "global_step": 209498, "epoch": 4988} {"train_loss": -7.263042449951172, "global_step": 209499, "epoch": 4988} {"train_loss": -7.347585678100586, "global_step": 209500, "epoch": 4988} {"train_loss": -7.238907814025879, "global_step": 209501, "epoch": 4988} {"train_loss": -7.471114158630371, "global_step": 209502, "epoch": 4988} {"train_loss": -7.412125587463379, "global_step": 209503, "epoch": 4988} {"train_loss": -7.171270847320557, "global_step": 209504, "epoch": 4988} {"train_loss": -7.341198921203613, "global_step": 209505, "epoch": 4988} {"train_loss": -7.193647384643555, "global_step": 209506, "epoch": 4988} {"train_loss": -7.373941421508789, "global_step": 209507, "epoch": 4988} {"train_loss": -7.31973934173584, "global_step": 209508, "epoch": 4988} {"train_loss": -7.340484619140625, "global_step": 209509, "epoch": 4988} {"train_loss": -7.266191482543945, "global_step": 209510, "epoch": 4988} {"train_loss": -7.31394100189209, "global_step": 209511, "epoch": 4988} {"train_loss": -7.141684532165527, "global_step": 209512, "epoch": 4988} {"train_loss": -7.373236179351807, "global_step": 209513, "epoch": 4988} {"train_loss": -7.267147541046143, "global_step": 209514, "epoch": 4988} {"train_loss": -7.040952682495117, "global_step": 209515, "epoch": 4988} {"train_loss": -7.369420051574707, "global_step": 209516, "epoch": 4988} {"train_loss": -7.139636039733887, "global_step": 209517, "epoch": 4988} {"train_loss": -7.247347354888916, "global_step": 209518, "epoch": 4988} {"train_loss": -7.26143217086792, "global_step": 209519, "epoch": 4988} {"train_loss": -7.329845428466797, "global_step": 209520, "epoch": 4988} {"train_loss": -7.335665702819824, "global_step": 209521, "epoch": 4988} {"train_loss": -7.221292495727539, "global_step": 209522, "epoch": 4988} {"train_loss": -7.34480619430542, "global_step": 209523, "epoch": 4988} {"train_loss": -7.220363616943359, "global_step": 209524, "epoch": 4988} {"train_loss": -7.348172187805176, "global_step": 209525, "epoch": 4988} {"train_loss": -7.239322662353516, "global_step": 209526, "epoch": 4988} {"train_loss": -7.395538330078125, "global_step": 209527, "epoch": 4988} {"train_loss": -7.250225067138672, "global_step": 209528, "epoch": 4988} {"train_loss": -7.351696968078613, "global_step": 209529, "epoch": 4988} {"train_loss": -7.349562644958496, "global_step": 209530, "epoch": 4988} {"train_loss": -7.329078674316406, "global_step": 209531, "epoch": 4988} {"train_loss": -7.3116455078125, "global_step": 209532, "epoch": 4988} {"train_loss": -7.3703293800354, "global_step": 209533, "epoch": 4988} {"train_loss": -7.366595268249512, "global_step": 209534, "epoch": 4988} {"train_loss": -7.3923234939575195, "global_step": 209535, "epoch": 4988} {"train_loss": -7.315028190612793, "global_step": 209536, "epoch": 4988} {"train_loss": -7.301448617662702, "global_step": 209537, "epoch": 4988, "val_loss": 70116.75} {"train_loss": -7.3052978515625, "global_step": 209538, "epoch": 4989} {"train_loss": -7.433089733123779, "global_step": 209539, "epoch": 4989} {"train_loss": -7.327792644500732, "global_step": 209540, "epoch": 4989} {"train_loss": -7.274942398071289, "global_step": 209541, "epoch": 4989} {"train_loss": -7.339895248413086, "global_step": 209542, "epoch": 4989} {"train_loss": -7.362781524658203, "global_step": 209543, "epoch": 4989} {"train_loss": -7.332187652587891, "global_step": 209544, "epoch": 4989} {"train_loss": -7.41147518157959, "global_step": 209545, "epoch": 4989} {"train_loss": -7.2908935546875, "global_step": 209546, "epoch": 4989} {"train_loss": -7.360240936279297, "global_step": 209547, "epoch": 4989} {"train_loss": -7.311349868774414, "global_step": 209548, "epoch": 4989} {"train_loss": -7.340841293334961, "global_step": 209549, "epoch": 4989} {"train_loss": -7.394686222076416, "global_step": 209550, "epoch": 4989} {"train_loss": -7.30947208404541, "global_step": 209551, "epoch": 4989} {"train_loss": -7.423370838165283, "global_step": 209552, "epoch": 4989} {"train_loss": -7.346753120422363, "global_step": 209553, "epoch": 4989} {"train_loss": -7.452602386474609, "global_step": 209554, "epoch": 4989} {"train_loss": -7.379544258117676, "global_step": 209555, "epoch": 4989} {"train_loss": -7.334784507751465, "global_step": 209556, "epoch": 4989} {"train_loss": -7.411696434020996, "global_step": 209557, "epoch": 4989} {"train_loss": -7.387546539306641, "global_step": 209558, "epoch": 4989} {"train_loss": -7.425591945648193, "global_step": 209559, "epoch": 4989} {"train_loss": -7.4046783447265625, "global_step": 209560, "epoch": 4989} {"train_loss": -7.4291510581970215, "global_step": 209561, "epoch": 4989} {"train_loss": -7.345387935638428, "global_step": 209562, "epoch": 4989} {"train_loss": -7.376541614532471, "global_step": 209563, "epoch": 4989} {"train_loss": -7.226042747497559, "global_step": 209564, "epoch": 4989} {"train_loss": -7.332303047180176, "global_step": 209565, "epoch": 4989} {"train_loss": -7.405805587768555, "global_step": 209566, "epoch": 4989} {"train_loss": -7.297883033752441, "global_step": 209567, "epoch": 4989} {"train_loss": -7.381098747253418, "global_step": 209568, "epoch": 4989} {"train_loss": -7.295830726623535, "global_step": 209569, "epoch": 4989} {"train_loss": -7.492158889770508, "global_step": 209570, "epoch": 4989} {"train_loss": -7.233041286468506, "global_step": 209571, "epoch": 4989} {"train_loss": -7.328664779663086, "global_step": 209572, "epoch": 4989} {"train_loss": -7.438516616821289, "global_step": 209573, "epoch": 4989} {"train_loss": -7.330362796783447, "global_step": 209574, "epoch": 4989} {"train_loss": -7.26019287109375, "global_step": 209575, "epoch": 4989} {"train_loss": -7.415374755859375, "global_step": 209576, "epoch": 4989} {"train_loss": -7.416326522827148, "global_step": 209577, "epoch": 4989} {"train_loss": -7.2744903564453125, "global_step": 209578, "epoch": 4989} {"train_loss": -7.357044730867658, "global_step": 209579, "epoch": 4989, "val_loss": 70148.9921875} {"train_loss": -7.396115303039551, "global_step": 209580, "epoch": 4990} {"train_loss": -7.275299549102783, "global_step": 209581, "epoch": 4990} {"train_loss": -7.357692718505859, "global_step": 209582, "epoch": 4990} {"train_loss": -7.266608238220215, "global_step": 209583, "epoch": 4990} {"train_loss": -7.280435562133789, "global_step": 209584, "epoch": 4990} {"train_loss": -7.332840919494629, "global_step": 209585, "epoch": 4990} {"train_loss": -7.439842224121094, "global_step": 209586, "epoch": 4990} {"train_loss": -7.247286796569824, "global_step": 209587, "epoch": 4990} {"train_loss": -7.460879325866699, "global_step": 209588, "epoch": 4990} {"train_loss": -7.341874122619629, "global_step": 209589, "epoch": 4990} {"train_loss": -7.437618732452393, "global_step": 209590, "epoch": 4990} {"train_loss": -7.421306133270264, "global_step": 209591, "epoch": 4990} {"train_loss": -7.215855121612549, "global_step": 209592, "epoch": 4990} {"train_loss": -7.36209774017334, "global_step": 209593, "epoch": 4990} {"train_loss": -7.272815704345703, "global_step": 209594, "epoch": 4990} {"train_loss": -7.269296646118164, "global_step": 209595, "epoch": 4990} {"train_loss": -7.290421485900879, "global_step": 209596, "epoch": 4990} {"train_loss": -7.2810587882995605, "global_step": 209597, "epoch": 4990} {"train_loss": -7.341886520385742, "global_step": 209598, "epoch": 4990} {"train_loss": -7.364156723022461, "global_step": 209599, "epoch": 4990} {"train_loss": -7.348361968994141, "global_step": 209600, "epoch": 4990} {"train_loss": -7.3794450759887695, "global_step": 209601, "epoch": 4990} {"train_loss": -7.3251118659973145, "global_step": 209602, "epoch": 4990} {"train_loss": -7.308919429779053, "global_step": 209603, "epoch": 4990} {"train_loss": -7.25224494934082, "global_step": 209604, "epoch": 4990} {"train_loss": -7.286951065063477, "global_step": 209605, "epoch": 4990} {"train_loss": -7.328606128692627, "global_step": 209606, "epoch": 4990} {"train_loss": -7.29833984375, "global_step": 209607, "epoch": 4990} {"train_loss": -7.487987518310547, "global_step": 209608, "epoch": 4990} {"train_loss": -7.347909450531006, "global_step": 209609, "epoch": 4990} {"train_loss": -7.312655448913574, "global_step": 209610, "epoch": 4990} {"train_loss": -7.4123735427856445, "global_step": 209611, "epoch": 4990} {"train_loss": -7.324989318847656, "global_step": 209612, "epoch": 4990} {"train_loss": -7.271642208099365, "global_step": 209613, "epoch": 4990} {"train_loss": -7.206011772155762, "global_step": 209614, "epoch": 4990} {"train_loss": -7.397983074188232, "global_step": 209615, "epoch": 4990} {"train_loss": -7.470793724060059, "global_step": 209616, "epoch": 4990} {"train_loss": -7.298521041870117, "global_step": 209617, "epoch": 4990} {"train_loss": -7.457432746887207, "global_step": 209618, "epoch": 4990} {"train_loss": -7.412403583526611, "global_step": 209619, "epoch": 4990} {"train_loss": -7.387953281402588, "global_step": 209620, "epoch": 4990} {"train_loss": -7.342775163196382, "global_step": 209621, "epoch": 4990, "val_loss": 70100.5390625} {"train_loss": -7.328901767730713, "global_step": 209622, "epoch": 4991} {"train_loss": -7.379120349884033, "global_step": 209623, "epoch": 4991} {"train_loss": -7.364614009857178, "global_step": 209624, "epoch": 4991} {"train_loss": -7.346421718597412, "global_step": 209625, "epoch": 4991} {"train_loss": -7.414897918701172, "global_step": 209626, "epoch": 4991} {"train_loss": -7.337965965270996, "global_step": 209627, "epoch": 4991} {"train_loss": -7.3060832023620605, "global_step": 209628, "epoch": 4991} {"train_loss": -7.374788284301758, "global_step": 209629, "epoch": 4991} {"train_loss": -7.354001045227051, "global_step": 209630, "epoch": 4991} {"train_loss": -7.2830610275268555, "global_step": 209631, "epoch": 4991} {"train_loss": -7.284124374389648, "global_step": 209632, "epoch": 4991} {"train_loss": -7.238245010375977, "global_step": 209633, "epoch": 4991} {"train_loss": -7.291275978088379, "global_step": 209634, "epoch": 4991} {"train_loss": -7.407084941864014, "global_step": 209635, "epoch": 4991} {"train_loss": -7.225465297698975, "global_step": 209636, "epoch": 4991} {"train_loss": -7.2493577003479, "global_step": 209637, "epoch": 4991} {"train_loss": -7.481940269470215, "global_step": 209638, "epoch": 4991} {"train_loss": -7.232730865478516, "global_step": 209639, "epoch": 4991} {"train_loss": -7.370576858520508, "global_step": 209640, "epoch": 4991} {"train_loss": -7.321303844451904, "global_step": 209641, "epoch": 4991} {"train_loss": -7.164397239685059, "global_step": 209642, "epoch": 4991} {"train_loss": -7.209601879119873, "global_step": 209643, "epoch": 4991} {"train_loss": -7.164076805114746, "global_step": 209644, "epoch": 4991} {"train_loss": -7.108474254608154, "global_step": 209645, "epoch": 4991} {"train_loss": -7.268013000488281, "global_step": 209646, "epoch": 4991} {"train_loss": -7.192367076873779, "global_step": 209647, "epoch": 4991} {"train_loss": -7.208873271942139, "global_step": 209648, "epoch": 4991} {"train_loss": -7.200318336486816, "global_step": 209649, "epoch": 4991} {"train_loss": -7.213593006134033, "global_step": 209650, "epoch": 4991} {"train_loss": -7.205687046051025, "global_step": 209651, "epoch": 4991} {"train_loss": -7.058131694793701, "global_step": 209652, "epoch": 4991} {"train_loss": -7.167291641235352, "global_step": 209653, "epoch": 4991} {"train_loss": -6.975837707519531, "global_step": 209654, "epoch": 4991} {"train_loss": -7.458192825317383, "global_step": 209655, "epoch": 4991} {"train_loss": -7.158397674560547, "global_step": 209656, "epoch": 4991} {"train_loss": -7.188357353210449, "global_step": 209657, "epoch": 4991} {"train_loss": -7.2986836433410645, "global_step": 209658, "epoch": 4991} {"train_loss": -7.1424407958984375, "global_step": 209659, "epoch": 4991} {"train_loss": -7.237089157104492, "global_step": 209660, "epoch": 4991} {"train_loss": -7.182823657989502, "global_step": 209661, "epoch": 4991} {"train_loss": -7.180286407470703, "global_step": 209662, "epoch": 4991} {"train_loss": -7.2571249689374655, "global_step": 209663, "epoch": 4991, "val_loss": 69973.765625} {"train_loss": -7.367776393890381, "global_step": 209664, "epoch": 4992} {"train_loss": -7.246915340423584, "global_step": 209665, "epoch": 4992} {"train_loss": -7.416622161865234, "global_step": 209666, "epoch": 4992} {"train_loss": -7.356345176696777, "global_step": 209667, "epoch": 4992} {"train_loss": -7.319731712341309, "global_step": 209668, "epoch": 4992} {"train_loss": -7.24733304977417, "global_step": 209669, "epoch": 4992} {"train_loss": -7.430643558502197, "global_step": 209670, "epoch": 4992} {"train_loss": -7.356815338134766, "global_step": 209671, "epoch": 4992} {"train_loss": -7.360661506652832, "global_step": 209672, "epoch": 4992} {"train_loss": -7.363705158233643, "global_step": 209673, "epoch": 4992} {"train_loss": -7.373225688934326, "global_step": 209674, "epoch": 4992} {"train_loss": -7.3466267585754395, "global_step": 209675, "epoch": 4992} {"train_loss": -7.314774036407471, "global_step": 209676, "epoch": 4992} {"train_loss": -7.385190486907959, "global_step": 209677, "epoch": 4992} {"train_loss": -7.324241638183594, "global_step": 209678, "epoch": 4992} {"train_loss": -7.337616920471191, "global_step": 209679, "epoch": 4992} {"train_loss": -7.38855504989624, "global_step": 209680, "epoch": 4992} {"train_loss": -7.3101325035095215, "global_step": 209681, "epoch": 4992} {"train_loss": -7.400823593139648, "global_step": 209682, "epoch": 4992} {"train_loss": -7.335996627807617, "global_step": 209683, "epoch": 4992} {"train_loss": -7.334405899047852, "global_step": 209684, "epoch": 4992} {"train_loss": -7.31227445602417, "global_step": 209685, "epoch": 4992} {"train_loss": -7.356170654296875, "global_step": 209686, "epoch": 4992} {"train_loss": -7.345554351806641, "global_step": 209687, "epoch": 4992} {"train_loss": -7.3821306228637695, "global_step": 209688, "epoch": 4992} {"train_loss": -7.208227157592773, "global_step": 209689, "epoch": 4992} {"train_loss": -7.399039268493652, "global_step": 209690, "epoch": 4992} {"train_loss": -7.2609028816223145, "global_step": 209691, "epoch": 4992} {"train_loss": -7.288083076477051, "global_step": 209692, "epoch": 4992} {"train_loss": -7.351966381072998, "global_step": 209693, "epoch": 4992} {"train_loss": -7.293517589569092, "global_step": 209694, "epoch": 4992} {"train_loss": -7.291201591491699, "global_step": 209695, "epoch": 4992} {"train_loss": -7.2380900382995605, "global_step": 209696, "epoch": 4992} {"train_loss": -7.231695652008057, "global_step": 209697, "epoch": 4992} {"train_loss": -7.242481231689453, "global_step": 209698, "epoch": 4992} {"train_loss": -7.308136940002441, "global_step": 209699, "epoch": 4992} {"train_loss": -7.269630432128906, "global_step": 209700, "epoch": 4992} {"train_loss": -7.256584644317627, "global_step": 209701, "epoch": 4992} {"train_loss": -7.248173713684082, "global_step": 209702, "epoch": 4992} {"train_loss": -7.285900115966797, "global_step": 209703, "epoch": 4992} {"train_loss": -7.360562801361084, "global_step": 209704, "epoch": 4992} {"train_loss": -7.321897563480196, "global_step": 209705, "epoch": 4992, "val_loss": 70072.6328125} {"train_loss": -7.303528308868408, "global_step": 209706, "epoch": 4993} {"train_loss": -7.354885578155518, "global_step": 209707, "epoch": 4993} {"train_loss": -7.27493953704834, "global_step": 209708, "epoch": 4993} {"train_loss": -7.260432720184326, "global_step": 209709, "epoch": 4993} {"train_loss": -7.313282489776611, "global_step": 209710, "epoch": 4993} {"train_loss": -7.409560203552246, "global_step": 209711, "epoch": 4993} {"train_loss": -7.307474136352539, "global_step": 209712, "epoch": 4993} {"train_loss": -7.296298980712891, "global_step": 209713, "epoch": 4993} {"train_loss": -7.297233581542969, "global_step": 209714, "epoch": 4993} {"train_loss": -7.447869777679443, "global_step": 209715, "epoch": 4993} {"train_loss": -7.266574382781982, "global_step": 209716, "epoch": 4993} {"train_loss": -7.318100929260254, "global_step": 209717, "epoch": 4993} {"train_loss": -7.393280982971191, "global_step": 209718, "epoch": 4993} {"train_loss": -7.245569229125977, "global_step": 209719, "epoch": 4993} {"train_loss": -7.329695701599121, "global_step": 209720, "epoch": 4993} {"train_loss": -7.395568370819092, "global_step": 209721, "epoch": 4993} {"train_loss": -7.306074142456055, "global_step": 209722, "epoch": 4993} {"train_loss": -7.36175012588501, "global_step": 209723, "epoch": 4993} {"train_loss": -7.396146297454834, "global_step": 209724, "epoch": 4993} {"train_loss": -7.322163105010986, "global_step": 209725, "epoch": 4993} {"train_loss": -7.431800365447998, "global_step": 209726, "epoch": 4993} {"train_loss": -7.34271240234375, "global_step": 209727, "epoch": 4993} {"train_loss": -7.278494834899902, "global_step": 209728, "epoch": 4993} {"train_loss": -7.420099258422852, "global_step": 209729, "epoch": 4993} {"train_loss": -7.407939910888672, "global_step": 209730, "epoch": 4993} {"train_loss": -7.410743236541748, "global_step": 209731, "epoch": 4993} {"train_loss": -7.469234943389893, "global_step": 209732, "epoch": 4993} {"train_loss": -7.509051322937012, "global_step": 209733, "epoch": 4993} {"train_loss": -7.496399879455566, "global_step": 209734, "epoch": 4993} {"train_loss": -7.315435886383057, "global_step": 209735, "epoch": 4993} {"train_loss": -7.3868255615234375, "global_step": 209736, "epoch": 4993} {"train_loss": -7.336514472961426, "global_step": 209737, "epoch": 4993} {"train_loss": -7.401867866516113, "global_step": 209738, "epoch": 4993} {"train_loss": -7.310037136077881, "global_step": 209739, "epoch": 4993} {"train_loss": -7.444356918334961, "global_step": 209740, "epoch": 4993} {"train_loss": -7.406668663024902, "global_step": 209741, "epoch": 4993} {"train_loss": -7.425101280212402, "global_step": 209742, "epoch": 4993} {"train_loss": -7.381527900695801, "global_step": 209743, "epoch": 4993} {"train_loss": -7.302393913269043, "global_step": 209744, "epoch": 4993} {"train_loss": -7.402259826660156, "global_step": 209745, "epoch": 4993} {"train_loss": -7.24364709854126, "global_step": 209746, "epoch": 4993} {"train_loss": -7.357449054718018, "global_step": 209747, "epoch": 4993, "val_loss": 69983.0546875} {"train_loss": -7.492462635040283, "global_step": 209748, "epoch": 4994} {"train_loss": -7.4170026779174805, "global_step": 209749, "epoch": 4994} {"train_loss": -7.25804328918457, "global_step": 209750, "epoch": 4994} {"train_loss": -7.348258972167969, "global_step": 209751, "epoch": 4994} {"train_loss": -7.255308151245117, "global_step": 209752, "epoch": 4994} {"train_loss": -7.089251518249512, "global_step": 209753, "epoch": 4994} {"train_loss": -7.21742582321167, "global_step": 209754, "epoch": 4994} {"train_loss": -7.215115070343018, "global_step": 209755, "epoch": 4994} {"train_loss": -7.124807357788086, "global_step": 209756, "epoch": 4994} {"train_loss": -7.257388591766357, "global_step": 209757, "epoch": 4994} {"train_loss": -7.145203590393066, "global_step": 209758, "epoch": 4994} {"train_loss": -7.2020769119262695, "global_step": 209759, "epoch": 4994} {"train_loss": -7.208532333374023, "global_step": 209760, "epoch": 4994} {"train_loss": -6.950893402099609, "global_step": 209761, "epoch": 4994} {"train_loss": -7.189704895019531, "global_step": 209762, "epoch": 4994} {"train_loss": -7.242551803588867, "global_step": 209763, "epoch": 4994} {"train_loss": -6.965722560882568, "global_step": 209764, "epoch": 4994} {"train_loss": -7.271291255950928, "global_step": 209765, "epoch": 4994} {"train_loss": -7.16386079788208, "global_step": 209766, "epoch": 4994} {"train_loss": -7.138602256774902, "global_step": 209767, "epoch": 4994} {"train_loss": -7.172819137573242, "global_step": 209768, "epoch": 4994} {"train_loss": -7.127096176147461, "global_step": 209769, "epoch": 4994} {"train_loss": -7.223855972290039, "global_step": 209770, "epoch": 4994} {"train_loss": -7.021220684051514, "global_step": 209771, "epoch": 4994} {"train_loss": -7.228233814239502, "global_step": 209772, "epoch": 4994} {"train_loss": -7.167942047119141, "global_step": 209773, "epoch": 4994} {"train_loss": -7.212244033813477, "global_step": 209774, "epoch": 4994} {"train_loss": -7.114474296569824, "global_step": 209775, "epoch": 4994} {"train_loss": -7.338191032409668, "global_step": 209776, "epoch": 4994} {"train_loss": -7.209792613983154, "global_step": 209777, "epoch": 4994} {"train_loss": -7.187908172607422, "global_step": 209778, "epoch": 4994} {"train_loss": -7.147651672363281, "global_step": 209779, "epoch": 4994} {"train_loss": -7.324193000793457, "global_step": 209780, "epoch": 4994} {"train_loss": -7.150260925292969, "global_step": 209781, "epoch": 4994} {"train_loss": -7.2897539138793945, "global_step": 209782, "epoch": 4994} {"train_loss": -7.284596920013428, "global_step": 209783, "epoch": 4994} {"train_loss": -7.291961669921875, "global_step": 209784, "epoch": 4994} {"train_loss": -7.304361343383789, "global_step": 209785, "epoch": 4994} {"train_loss": -7.293444633483887, "global_step": 209786, "epoch": 4994} {"train_loss": -7.411308288574219, "global_step": 209787, "epoch": 4994} {"train_loss": -7.3003668785095215, "global_step": 209788, "epoch": 4994} {"train_loss": -7.2218038241068525, "global_step": 209789, "epoch": 4994, "val_loss": 70055.1015625} {"train_loss": -7.352863311767578, "global_step": 209790, "epoch": 4995} {"train_loss": -7.40215539932251, "global_step": 209791, "epoch": 4995} {"train_loss": -7.235597133636475, "global_step": 209792, "epoch": 4995} {"train_loss": -7.370066165924072, "global_step": 209793, "epoch": 4995} {"train_loss": -7.36348819732666, "global_step": 209794, "epoch": 4995} {"train_loss": -7.333783149719238, "global_step": 209795, "epoch": 4995} {"train_loss": -7.320282936096191, "global_step": 209796, "epoch": 4995} {"train_loss": -7.4003143310546875, "global_step": 209797, "epoch": 4995} {"train_loss": -7.419089317321777, "global_step": 209798, "epoch": 4995} {"train_loss": -7.497323989868164, "global_step": 209799, "epoch": 4995} {"train_loss": -7.437044143676758, "global_step": 209800, "epoch": 4995} {"train_loss": -7.368907451629639, "global_step": 209801, "epoch": 4995} {"train_loss": -7.412139892578125, "global_step": 209802, "epoch": 4995} {"train_loss": -7.355771064758301, "global_step": 209803, "epoch": 4995} {"train_loss": -7.367132186889648, "global_step": 209804, "epoch": 4995} {"train_loss": -7.328719139099121, "global_step": 209805, "epoch": 4995} {"train_loss": -7.319277286529541, "global_step": 209806, "epoch": 4995} {"train_loss": -7.440805435180664, "global_step": 209807, "epoch": 4995} {"train_loss": -7.367044448852539, "global_step": 209808, "epoch": 4995} {"train_loss": -7.237886428833008, "global_step": 209809, "epoch": 4995} {"train_loss": -7.289292335510254, "global_step": 209810, "epoch": 4995} {"train_loss": -7.3700103759765625, "global_step": 209811, "epoch": 4995} {"train_loss": -7.266061305999756, "global_step": 209812, "epoch": 4995} {"train_loss": -7.323911190032959, "global_step": 209813, "epoch": 4995} {"train_loss": -7.297453880310059, "global_step": 209814, "epoch": 4995} {"train_loss": -7.349307537078857, "global_step": 209815, "epoch": 4995} {"train_loss": -7.288232803344727, "global_step": 209816, "epoch": 4995} {"train_loss": -7.238250732421875, "global_step": 209817, "epoch": 4995} {"train_loss": -7.41456413269043, "global_step": 209818, "epoch": 4995} {"train_loss": -7.3339643478393555, "global_step": 209819, "epoch": 4995} {"train_loss": -7.302607536315918, "global_step": 209820, "epoch": 4995} {"train_loss": -7.403402328491211, "global_step": 209821, "epoch": 4995} {"train_loss": -7.275123596191406, "global_step": 209822, "epoch": 4995} {"train_loss": -7.402983665466309, "global_step": 209823, "epoch": 4995} {"train_loss": -7.258055210113525, "global_step": 209824, "epoch": 4995} {"train_loss": -7.35950231552124, "global_step": 209825, "epoch": 4995} {"train_loss": -7.3406081199646, "global_step": 209826, "epoch": 4995} {"train_loss": -7.2833452224731445, "global_step": 209827, "epoch": 4995} {"train_loss": -7.3198442459106445, "global_step": 209828, "epoch": 4995} {"train_loss": -7.291469573974609, "global_step": 209829, "epoch": 4995} {"train_loss": -7.277785301208496, "global_step": 209830, "epoch": 4995} {"train_loss": -7.340428772426787, "global_step": 209831, "epoch": 4995, "val_loss": 69905.875} {"train_loss": -7.355739593505859, "global_step": 209832, "epoch": 4996} {"train_loss": -7.3974223136901855, "global_step": 209833, "epoch": 4996} {"train_loss": -7.155404567718506, "global_step": 209834, "epoch": 4996} {"train_loss": -7.272887706756592, "global_step": 209835, "epoch": 4996} {"train_loss": -7.3149824142456055, "global_step": 209836, "epoch": 4996} {"train_loss": -7.158064842224121, "global_step": 209837, "epoch": 4996} {"train_loss": -7.388791084289551, "global_step": 209838, "epoch": 4996} {"train_loss": -7.331418037414551, "global_step": 209839, "epoch": 4996} {"train_loss": -7.2397236824035645, "global_step": 209840, "epoch": 4996} {"train_loss": -7.188266754150391, "global_step": 209841, "epoch": 4996} {"train_loss": -7.4252705574035645, "global_step": 209842, "epoch": 4996} {"train_loss": -7.296714782714844, "global_step": 209843, "epoch": 4996} {"train_loss": -7.409670829772949, "global_step": 209844, "epoch": 4996} {"train_loss": -7.366543769836426, "global_step": 209845, "epoch": 4996} {"train_loss": -7.325607776641846, "global_step": 209846, "epoch": 4996} {"train_loss": -7.427739143371582, "global_step": 209847, "epoch": 4996} {"train_loss": -7.473691940307617, "global_step": 209848, "epoch": 4996} {"train_loss": -7.3597331047058105, "global_step": 209849, "epoch": 4996} {"train_loss": -7.3618879318237305, "global_step": 209850, "epoch": 4996} {"train_loss": -7.229545593261719, "global_step": 209851, "epoch": 4996} {"train_loss": -7.208578586578369, "global_step": 209852, "epoch": 4996} {"train_loss": -7.339470863342285, "global_step": 209853, "epoch": 4996} {"train_loss": -7.3111090660095215, "global_step": 209854, "epoch": 4996} {"train_loss": -7.3169050216674805, "global_step": 209855, "epoch": 4996} {"train_loss": -7.366742134094238, "global_step": 209856, "epoch": 4996} {"train_loss": -7.320216178894043, "global_step": 209857, "epoch": 4996} {"train_loss": -7.259863376617432, "global_step": 209858, "epoch": 4996} {"train_loss": -7.267390251159668, "global_step": 209859, "epoch": 4996} {"train_loss": -7.33631706237793, "global_step": 209860, "epoch": 4996} {"train_loss": -7.293688774108887, "global_step": 209861, "epoch": 4996} {"train_loss": -7.192943096160889, "global_step": 209862, "epoch": 4996} {"train_loss": -7.299623489379883, "global_step": 209863, "epoch": 4996} {"train_loss": -7.343343734741211, "global_step": 209864, "epoch": 4996} {"train_loss": -7.316863059997559, "global_step": 209865, "epoch": 4996} {"train_loss": -7.336426734924316, "global_step": 209866, "epoch": 4996} {"train_loss": -7.206593036651611, "global_step": 209867, "epoch": 4996} {"train_loss": -7.272161483764648, "global_step": 209868, "epoch": 4996} {"train_loss": -7.336933135986328, "global_step": 209869, "epoch": 4996} {"train_loss": -7.3073649406433105, "global_step": 209870, "epoch": 4996} {"train_loss": -7.37388277053833, "global_step": 209871, "epoch": 4996} {"train_loss": -7.375429153442383, "global_step": 209872, "epoch": 4996} {"train_loss": -7.31307467960176, "global_step": 209873, "epoch": 4996, "val_loss": 70085.2890625} {"train_loss": -7.371240615844727, "global_step": 209874, "epoch": 4997} {"train_loss": -7.220782279968262, "global_step": 209875, "epoch": 4997} {"train_loss": -7.253418922424316, "global_step": 209876, "epoch": 4997} {"train_loss": -7.346785545349121, "global_step": 209877, "epoch": 4997} {"train_loss": -7.3153181076049805, "global_step": 209878, "epoch": 4997} {"train_loss": -7.304421424865723, "global_step": 209879, "epoch": 4997} {"train_loss": -7.341115474700928, "global_step": 209880, "epoch": 4997} {"train_loss": -7.278817176818848, "global_step": 209881, "epoch": 4997} {"train_loss": -7.283311367034912, "global_step": 209882, "epoch": 4997} {"train_loss": -7.33876895904541, "global_step": 209883, "epoch": 4997} {"train_loss": -7.412952423095703, "global_step": 209884, "epoch": 4997} {"train_loss": -7.39517068862915, "global_step": 209885, "epoch": 4997} {"train_loss": -7.268758296966553, "global_step": 209886, "epoch": 4997} {"train_loss": -7.352335453033447, "global_step": 209887, "epoch": 4997} {"train_loss": -7.300936698913574, "global_step": 209888, "epoch": 4997} {"train_loss": -7.320953845977783, "global_step": 209889, "epoch": 4997} {"train_loss": -7.396088600158691, "global_step": 209890, "epoch": 4997} {"train_loss": -7.216300010681152, "global_step": 209891, "epoch": 4997} {"train_loss": -7.34969425201416, "global_step": 209892, "epoch": 4997} {"train_loss": -7.235543251037598, "global_step": 209893, "epoch": 4997} {"train_loss": -7.289713382720947, "global_step": 209894, "epoch": 4997} {"train_loss": -7.348419189453125, "global_step": 209895, "epoch": 4997} {"train_loss": -7.452269077301025, "global_step": 209896, "epoch": 4997} {"train_loss": -7.401725769042969, "global_step": 209897, "epoch": 4997} {"train_loss": -7.287994384765625, "global_step": 209898, "epoch": 4997} {"train_loss": -7.379246711730957, "global_step": 209899, "epoch": 4997} {"train_loss": -7.346830368041992, "global_step": 209900, "epoch": 4997} {"train_loss": -7.411351203918457, "global_step": 209901, "epoch": 4997} {"train_loss": -7.423582077026367, "global_step": 209902, "epoch": 4997} {"train_loss": -7.308889389038086, "global_step": 209903, "epoch": 4997} {"train_loss": -7.274137020111084, "global_step": 209904, "epoch": 4997} {"train_loss": -7.3804030418396, "global_step": 209905, "epoch": 4997} {"train_loss": -7.482723712921143, "global_step": 209906, "epoch": 4997} {"train_loss": -7.275628566741943, "global_step": 209907, "epoch": 4997} {"train_loss": -7.35091495513916, "global_step": 209908, "epoch": 4997} {"train_loss": -7.308520317077637, "global_step": 209909, "epoch": 4997} {"train_loss": -7.434090614318848, "global_step": 209910, "epoch": 4997} {"train_loss": -7.4712018966674805, "global_step": 209911, "epoch": 4997} {"train_loss": -7.367568016052246, "global_step": 209912, "epoch": 4997} {"train_loss": -7.285393714904785, "global_step": 209913, "epoch": 4997} {"train_loss": -7.456933498382568, "global_step": 209914, "epoch": 4997} {"train_loss": -7.341403461637951, "global_step": 209915, "epoch": 4997, "val_loss": 69926.203125} {"train_loss": -7.4605231285095215, "global_step": 209916, "epoch": 4998} {"train_loss": -7.5119853019714355, "global_step": 209917, "epoch": 4998} {"train_loss": -7.2824506759643555, "global_step": 209918, "epoch": 4998} {"train_loss": -7.214024543762207, "global_step": 209919, "epoch": 4998} {"train_loss": -7.265263557434082, "global_step": 209920, "epoch": 4998} {"train_loss": -7.424156188964844, "global_step": 209921, "epoch": 4998} {"train_loss": -7.302082538604736, "global_step": 209922, "epoch": 4998} {"train_loss": -7.261961460113525, "global_step": 209923, "epoch": 4998} {"train_loss": -7.46683931350708, "global_step": 209924, "epoch": 4998} {"train_loss": -7.3299150466918945, "global_step": 209925, "epoch": 4998} {"train_loss": -7.2850141525268555, "global_step": 209926, "epoch": 4998} {"train_loss": -7.395382881164551, "global_step": 209927, "epoch": 4998} {"train_loss": -7.348761081695557, "global_step": 209928, "epoch": 4998} {"train_loss": -7.266338348388672, "global_step": 209929, "epoch": 4998} {"train_loss": -7.331465721130371, "global_step": 209930, "epoch": 4998} {"train_loss": -7.1855010986328125, "global_step": 209931, "epoch": 4998} {"train_loss": -7.319363117218018, "global_step": 209932, "epoch": 4998} {"train_loss": -7.441589832305908, "global_step": 209933, "epoch": 4998} {"train_loss": -7.176122665405273, "global_step": 209934, "epoch": 4998} {"train_loss": -7.19406795501709, "global_step": 209935, "epoch": 4998} {"train_loss": -7.433226585388184, "global_step": 209936, "epoch": 4998} {"train_loss": -7.209383010864258, "global_step": 209937, "epoch": 4998} {"train_loss": -7.234772682189941, "global_step": 209938, "epoch": 4998} {"train_loss": -7.280918121337891, "global_step": 209939, "epoch": 4998} {"train_loss": -7.253086090087891, "global_step": 209940, "epoch": 4998} {"train_loss": -7.403537750244141, "global_step": 209941, "epoch": 4998} {"train_loss": -7.281532287597656, "global_step": 209942, "epoch": 4998} {"train_loss": -7.312577247619629, "global_step": 209943, "epoch": 4998} {"train_loss": -7.422390937805176, "global_step": 209944, "epoch": 4998} {"train_loss": -7.2595930099487305, "global_step": 209945, "epoch": 4998} {"train_loss": -7.266236782073975, "global_step": 209946, "epoch": 4998} {"train_loss": -7.319394111633301, "global_step": 209947, "epoch": 4998} {"train_loss": -7.2674055099487305, "global_step": 209948, "epoch": 4998} {"train_loss": -7.319530963897705, "global_step": 209949, "epoch": 4998} {"train_loss": -7.235381126403809, "global_step": 209950, "epoch": 4998} {"train_loss": -7.342207908630371, "global_step": 209951, "epoch": 4998} {"train_loss": -7.279655456542969, "global_step": 209952, "epoch": 4998} {"train_loss": -7.3385844230651855, "global_step": 209953, "epoch": 4998} {"train_loss": -7.341611862182617, "global_step": 209954, "epoch": 4998} {"train_loss": -7.222902297973633, "global_step": 209955, "epoch": 4998} {"train_loss": -7.383305072784424, "global_step": 209956, "epoch": 4998} {"train_loss": -7.313189597356887, "global_step": 209957, "epoch": 4998, "val_loss": 70113.109375} {"train_loss": -7.388129711151123, "global_step": 209958, "epoch": 4999} {"train_loss": -7.364372730255127, "global_step": 209959, "epoch": 4999} {"train_loss": -7.303920269012451, "global_step": 209960, "epoch": 4999} {"train_loss": -7.158392906188965, "global_step": 209961, "epoch": 4999} {"train_loss": -7.426767826080322, "global_step": 209962, "epoch": 4999} {"train_loss": -7.3571271896362305, "global_step": 209963, "epoch": 4999} {"train_loss": -7.302888870239258, "global_step": 209964, "epoch": 4999} {"train_loss": -7.31212043762207, "global_step": 209965, "epoch": 4999} {"train_loss": -7.2717695236206055, "global_step": 209966, "epoch": 4999} {"train_loss": -7.355033874511719, "global_step": 209967, "epoch": 4999} {"train_loss": -7.436254024505615, "global_step": 209968, "epoch": 4999} {"train_loss": -7.293619155883789, "global_step": 209969, "epoch": 4999} {"train_loss": -7.2660393714904785, "global_step": 209970, "epoch": 4999} {"train_loss": -7.388894557952881, "global_step": 209971, "epoch": 4999} {"train_loss": -7.335658550262451, "global_step": 209972, "epoch": 4999} {"train_loss": -7.328241348266602, "global_step": 209973, "epoch": 4999} {"train_loss": -7.369227409362793, "global_step": 209974, "epoch": 4999} {"train_loss": -7.267139911651611, "global_step": 209975, "epoch": 4999} {"train_loss": -7.321893692016602, "global_step": 209976, "epoch": 4999} {"train_loss": -7.520174026489258, "global_step": 209977, "epoch": 4999} {"train_loss": -7.375086784362793, "global_step": 209978, "epoch": 4999} {"train_loss": -7.440165996551514, "global_step": 209979, "epoch": 4999} {"train_loss": -7.341659069061279, "global_step": 209980, "epoch": 4999} {"train_loss": -7.271304130554199, "global_step": 209981, "epoch": 4999} {"train_loss": -7.264764785766602, "global_step": 209982, "epoch": 4999} {"train_loss": -7.3480730056762695, "global_step": 209983, "epoch": 4999} {"train_loss": -7.27574348449707, "global_step": 209984, "epoch": 4999} {"train_loss": -7.359342098236084, "global_step": 209985, "epoch": 4999} {"train_loss": -7.340349197387695, "global_step": 209986, "epoch": 4999} {"train_loss": -7.38182258605957, "global_step": 209987, "epoch": 4999} {"train_loss": -7.287681579589844, "global_step": 209988, "epoch": 4999} {"train_loss": -7.432500839233398, "global_step": 209989, "epoch": 4999} {"train_loss": -7.221117973327637, "global_step": 209990, "epoch": 4999} {"train_loss": -7.258767127990723, "global_step": 209991, "epoch": 4999} {"train_loss": -7.310037612915039, "global_step": 209992, "epoch": 4999} {"train_loss": -7.291297912597656, "global_step": 209993, "epoch": 4999} {"train_loss": -7.368644714355469, "global_step": 209994, "epoch": 4999} {"train_loss": -7.182768821716309, "global_step": 209995, "epoch": 4999} {"train_loss": -7.308986186981201, "global_step": 209996, "epoch": 4999} {"train_loss": -7.235526084899902, "global_step": 209997, "epoch": 4999} {"train_loss": -7.202567100524902, "global_step": 209998, "epoch": 4999} {"train_loss": -7.322721118018741, "global_step": 209999, "epoch": 4999, "val_loss": 69938.8984375}